Warmup Train [1][0/3239]	Time 43.246 (43.246)	Data 14.447 (14.447)	Loss 6.9597 (6.9597)	Top-1 acc 0.000 (0.000)	Top-5 acc 0.000 (0.000)	lr 0.05000
Warmup Train [1][10/3239]	Time 0.443 (4.612)	Data 0.001 (1.315)	Loss 6.8436 (6.8894)	Top-1 acc 0.000 (0.036)	Top-5 acc 0.391 (0.568)	lr 0.05000
Warmup Train [1][20/3239]	Time 0.570 (2.663)	Data 0.001 (0.693)	Loss 6.7979 (6.8365)	Top-1 acc 0.000 (0.074)	Top-5 acc 0.391 (0.763)	lr 0.05000
Warmup Train [1][30/3239]	Time 0.520 (1.964)	Data 0.001 (0.470)	Loss 6.7589 (6.8118)	Top-1 acc 0.000 (0.076)	Top-5 acc 0.781 (0.706)	lr 0.05000
Warmup Train [1][40/3239]	Time 0.344 (1.609)	Data 0.001 (0.356)	Loss 6.7133 (6.7908)	Top-1 acc 0.000 (0.133)	Top-5 acc 0.391 (0.715)	lr 0.05000
Warmup Train [1][50/3239]	Time 0.606 (1.393)	Data 0.001 (0.289)	Loss 6.7023 (6.7748)	Top-1 acc 0.000 (0.138)	Top-5 acc 1.172 (0.682)	lr 0.05000
Warmup Train [1][60/3239]	Time 0.531 (1.246)	Data 0.001 (0.242)	Loss 6.7192 (6.7639)	Top-1 acc 0.391 (0.147)	Top-5 acc 0.781 (0.749)	lr 0.05000
Warmup Train [1][70/3239]	Time 0.530 (1.144)	Data 0.002 (0.208)	Loss 6.7250 (6.7569)	Top-1 acc 0.000 (0.149)	Top-5 acc 0.781 (0.759)	lr 0.05000
Warmup Train [1][80/3239]	Time 0.419 (1.061)	Data 0.001 (0.183)	Loss 6.6921 (6.7510)	Top-1 acc 0.391 (0.159)	Top-5 acc 1.172 (0.786)	lr 0.05000
Warmup Train [1][90/3239]	Time 0.507 (1.000)	Data 0.001 (0.164)	Loss 6.7262 (6.7458)	Top-1 acc 0.000 (0.146)	Top-5 acc 0.391 (0.790)	lr 0.05000
Warmup Train [1][100/3239]	Time 0.430 (0.948)	Data 0.001 (0.150)	Loss 6.7158 (6.7421)	Top-1 acc 1.172 (0.159)	Top-5 acc 1.172 (0.801)	lr 0.05000
Warmup Train [1][110/3239]	Time 0.353 (0.908)	Data 0.002 (0.137)	Loss 6.7165 (6.7379)	Top-1 acc 0.000 (0.165)	Top-5 acc 0.391 (0.823)	lr 0.05000
Warmup Train [1][120/3239]	Time 0.555 (0.874)	Data 0.001 (0.127)	Loss 6.6833 (6.7344)	Top-1 acc 0.000 (0.174)	Top-5 acc 0.781 (0.843)	lr 0.05000
Warmup Train [1][130/3239]	Time 0.545 (0.845)	Data 0.002 (0.117)	Loss 6.6889 (6.7307)	Top-1 acc 0.000 (0.179)	Top-5 acc 0.781 (0.841)	lr 0.05000
Warmup Train [1][140/3239]	Time 0.466 (0.818)	Data 0.001 (0.109)	Loss 6.7086 (6.7285)	Top-1 acc 0.000 (0.186)	Top-5 acc 0.391 (0.859)	lr 0.05000
Warmup Train [1][150/3239]	Time 0.518 (0.799)	Data 0.001 (0.103)	Loss 6.6699 (6.7249)	Top-1 acc 0.000 (0.189)	Top-5 acc 0.781 (0.867)	lr 0.05000
Warmup Train [1][160/3239]	Time 0.475 (0.781)	Data 0.001 (0.097)	Loss 6.7306 (6.7230)	Top-1 acc 0.781 (0.194)	Top-5 acc 1.172 (0.852)	lr 0.05000
Warmup Train [1][170/3239]	Time 0.423 (0.765)	Data 0.002 (0.091)	Loss 6.6876 (6.7206)	Top-1 acc 0.781 (0.201)	Top-5 acc 1.172 (0.861)	lr 0.05000
Warmup Train [1][180/3239]	Time 0.486 (0.751)	Data 0.001 (0.087)	Loss 6.6826 (6.7190)	Top-1 acc 0.000 (0.199)	Top-5 acc 0.781 (0.844)	lr 0.05000
Warmup Train [1][190/3239]	Time 0.648 (0.738)	Data 0.002 (0.082)	Loss 6.6750 (6.7169)	Top-1 acc 0.000 (0.192)	Top-5 acc 0.000 (0.843)	lr 0.05000
Warmup Train [1][200/3239]	Time 0.478 (0.727)	Data 0.001 (0.078)	Loss 6.6982 (6.7162)	Top-1 acc 0.781 (0.194)	Top-5 acc 0.781 (0.841)	lr 0.05000
Warmup Train [1][210/3239]	Time 0.682 (0.717)	Data 0.001 (0.075)	Loss 6.7178 (6.7143)	Top-1 acc 0.391 (0.194)	Top-5 acc 1.172 (0.848)	lr 0.05000
Warmup Train [1][220/3239]	Time 0.411 (0.708)	Data 0.001 (0.072)	Loss 6.6454 (6.7126)	Top-1 acc 0.000 (0.186)	Top-5 acc 1.172 (0.843)	lr 0.05000
Warmup Train [1][230/3239]	Time 0.646 (0.700)	Data 0.001 (0.069)	Loss 6.7206 (6.7113)	Top-1 acc 0.391 (0.181)	Top-5 acc 0.391 (0.835)	lr 0.05000
Warmup Train [1][240/3239]	Time 0.575 (0.691)	Data 0.002 (0.066)	Loss 6.7068 (6.7100)	Top-1 acc 0.391 (0.182)	Top-5 acc 0.781 (0.841)	lr 0.05000
Warmup Train [1][250/3239]	Time 0.517 (0.683)	Data 0.001 (0.064)	Loss 6.6808 (6.7087)	Top-1 acc 0.781 (0.185)	Top-5 acc 1.562 (0.856)	lr 0.05000
Warmup Train [1][260/3239]	Time 0.483 (0.677)	Data 0.001 (0.062)	Loss 6.6831 (6.7076)	Top-1 acc 0.000 (0.181)	Top-5 acc 0.391 (0.867)	lr 0.05000
Warmup Train [1][270/3239]	Time 0.394 (0.671)	Data 0.001 (0.060)	Loss 6.6997 (6.7067)	Top-1 acc 0.000 (0.179)	Top-5 acc 0.781 (0.875)	lr 0.05000
Warmup Train [1][280/3239]	Time 0.582 (0.665)	Data 0.001 (0.058)	Loss 6.6875 (6.7062)	Top-1 acc 0.000 (0.179)	Top-5 acc 0.781 (0.884)	lr 0.05000
Warmup Train [1][290/3239]	Time 0.529 (0.661)	Data 0.001 (0.056)	Loss 6.6356 (6.7045)	Top-1 acc 0.000 (0.177)	Top-5 acc 0.391 (0.882)	lr 0.05000
Warmup Train [1][300/3239]	Time 0.631 (0.656)	Data 0.001 (0.054)	Loss 6.6520 (6.7037)	Top-1 acc 0.000 (0.174)	Top-5 acc 1.172 (0.881)	lr 0.05000
Warmup Train [1][310/3239]	Time 0.506 (0.651)	Data 0.001 (0.053)	Loss 6.6561 (6.7027)	Top-1 acc 0.391 (0.176)	Top-5 acc 0.781 (0.880)	lr 0.05000
Warmup Train [1][320/3239]	Time 0.542 (0.647)	Data 0.001 (0.051)	Loss 6.6957 (6.7018)	Top-1 acc 0.000 (0.175)	Top-5 acc 1.172 (0.879)	lr 0.05000
Warmup Train [1][330/3239]	Time 0.538 (0.642)	Data 0.001 (0.050)	Loss 6.6811 (6.7008)	Top-1 acc 0.391 (0.172)	Top-5 acc 1.172 (0.876)	lr 0.05000
Warmup Train [1][340/3239]	Time 0.601 (0.638)	Data 0.001 (0.048)	Loss 6.6849 (6.7002)	Top-1 acc 0.391 (0.174)	Top-5 acc 0.391 (0.885)	lr 0.05000
Warmup Train [1][350/3239]	Time 0.574 (0.634)	Data 0.001 (0.047)	Loss 6.6507 (6.6996)	Top-1 acc 0.391 (0.176)	Top-5 acc 1.172 (0.890)	lr 0.05000
Warmup Train [1][360/3239]	Time 0.455 (0.630)	Data 0.002 (0.046)	Loss 6.6384 (6.6988)	Top-1 acc 0.391 (0.177)	Top-5 acc 2.344 (0.901)	lr 0.05000
Warmup Train [1][370/3239]	Time 0.525 (0.627)	Data 0.001 (0.045)	Loss 6.6718 (6.6979)	Top-1 acc 0.000 (0.177)	Top-5 acc 0.781 (0.905)	lr 0.05000
Warmup Train [1][380/3239]	Time 0.463 (0.624)	Data 0.001 (0.044)	Loss 6.6918 (6.6973)	Top-1 acc 0.391 (0.180)	Top-5 acc 1.562 (0.910)	lr 0.05000
Warmup Train [1][390/3239]	Time 0.290 (0.619)	Data 0.001 (0.043)	Loss 6.6560 (6.6969)	Top-1 acc 0.000 (0.184)	Top-5 acc 0.000 (0.913)	lr 0.05000
Warmup Train [1][400/3239]	Time 0.536 (0.616)	Data 0.001 (0.042)	Loss 6.6341 (6.6962)	Top-1 acc 0.391 (0.187)	Top-5 acc 0.781 (0.925)	lr 0.05000
Warmup Train [1][410/3239]	Time 0.583 (0.614)	Data 0.001 (0.041)	Loss 6.7031 (6.6956)	Top-1 acc 0.391 (0.187)	Top-5 acc 0.781 (0.927)	lr 0.05000
Warmup Train [1][420/3239]	Time 0.531 (0.612)	Data 0.002 (0.040)	Loss 6.6559 (6.6948)	Top-1 acc 0.000 (0.191)	Top-5 acc 0.781 (0.930)	lr 0.05000
Warmup Train [1][430/3239]	Time 0.550 (0.609)	Data 0.001 (0.039)	Loss 6.7213 (6.6944)	Top-1 acc 0.000 (0.191)	Top-5 acc 0.000 (0.936)	lr 0.05000
Warmup Train [1][440/3239]	Time 0.666 (0.607)	Data 0.002 (0.038)	Loss 6.7244 (6.6939)	Top-1 acc 0.000 (0.190)	Top-5 acc 0.391 (0.946)	lr 0.05000
Warmup Train [1][450/3239]	Time 0.343 (0.605)	Data 0.001 (0.038)	Loss 6.6519 (6.6932)	Top-1 acc 0.391 (0.192)	Top-5 acc 1.172 (0.949)	lr 0.05000
Warmup Train [1][460/3239]	Time 0.559 (0.603)	Data 0.001 (0.037)	Loss 6.6659 (6.6928)	Top-1 acc 0.391 (0.191)	Top-5 acc 1.562 (0.952)	lr 0.05000
Warmup Train [1][470/3239]	Time 0.393 (0.601)	Data 0.001 (0.037)	Loss 6.6770 (6.6922)	Top-1 acc 0.000 (0.193)	Top-5 acc 0.781 (0.955)	lr 0.05000
Warmup Train [1][480/3239]	Time 0.555 (0.600)	Data 0.001 (0.036)	Loss 6.6513 (6.6921)	Top-1 acc 0.000 (0.194)	Top-5 acc 0.781 (0.952)	lr 0.05000
Warmup Train [1][490/3239]	Time 0.418 (0.597)	Data 0.001 (0.035)	Loss 6.6749 (6.6915)	Top-1 acc 0.000 (0.195)	Top-5 acc 0.391 (0.959)	lr 0.05000
Warmup Train [1][500/3239]	Time 0.448 (0.596)	Data 0.002 (0.035)	Loss 6.6822 (6.6910)	Top-1 acc 0.000 (0.194)	Top-5 acc 0.000 (0.957)	lr 0.05000
Warmup Train [1][510/3239]	Time 0.584 (0.594)	Data 0.001 (0.034)	Loss 6.6942 (6.6903)	Top-1 acc 0.781 (0.198)	Top-5 acc 0.781 (0.961)	lr 0.05000
Warmup Train [1][520/3239]	Time 0.553 (0.593)	Data 0.001 (0.034)	Loss 6.6634 (6.6901)	Top-1 acc 0.391 (0.199)	Top-5 acc 0.781 (0.963)	lr 0.05000
Warmup Train [1][530/3239]	Time 0.629 (0.591)	Data 0.001 (0.033)	Loss 6.6884 (6.6895)	Top-1 acc 0.000 (0.200)	Top-5 acc 0.000 (0.970)	lr 0.05000
Warmup Train [1][540/3239]	Time 0.425 (0.589)	Data 0.001 (0.033)	Loss 6.6634 (6.6892)	Top-1 acc 0.391 (0.199)	Top-5 acc 1.172 (0.970)	lr 0.05000
Warmup Train [1][550/3239]	Time 0.358 (0.588)	Data 0.001 (0.033)	Loss 6.6783 (6.6888)	Top-1 acc 0.000 (0.199)	Top-5 acc 0.391 (0.969)	lr 0.05000
Warmup Train [1][560/3239]	Time 0.551 (0.587)	Data 0.001 (0.032)	Loss 6.6611 (6.6882)	Top-1 acc 0.391 (0.199)	Top-5 acc 1.172 (0.976)	lr 0.05000
Warmup Train [1][570/3239]	Time 0.367 (0.585)	Data 0.001 (0.032)	Loss 6.6494 (6.6877)	Top-1 acc 0.000 (0.198)	Top-5 acc 2.344 (0.978)	lr 0.05000
Warmup Train [1][580/3239]	Time 0.477 (0.584)	Data 0.001 (0.032)	Loss 6.6271 (6.6872)	Top-1 acc 0.781 (0.200)	Top-5 acc 1.562 (0.984)	lr 0.05000
Warmup Train [1][590/3239]	Time 0.472 (0.583)	Data 0.001 (0.031)	Loss 6.6883 (6.6868)	Top-1 acc 0.000 (0.198)	Top-5 acc 1.172 (0.989)	lr 0.05000
Warmup Train [1][600/3239]	Time 0.521 (0.581)	Data 0.001 (0.031)	Loss 6.6781 (6.6865)	Top-1 acc 0.391 (0.198)	Top-5 acc 1.172 (0.987)	lr 0.05000
Warmup Train [1][610/3239]	Time 0.389 (0.579)	Data 0.001 (0.030)	Loss 6.6144 (6.6861)	Top-1 acc 0.391 (0.196)	Top-5 acc 1.562 (0.989)	lr 0.05000
Warmup Train [1][620/3239]	Time 0.376 (0.578)	Data 0.001 (0.030)	Loss 6.6590 (6.6858)	Top-1 acc 0.391 (0.194)	Top-5 acc 1.953 (0.983)	lr 0.05000
Warmup Train [1][630/3239]	Time 0.544 (0.576)	Data 0.002 (0.030)	Loss 6.6425 (6.6853)	Top-1 acc 0.000 (0.193)	Top-5 acc 0.781 (0.985)	lr 0.05000
Warmup Train [1][640/3239]	Time 0.377 (0.575)	Data 0.001 (0.029)	Loss 6.6786 (6.6848)	Top-1 acc 0.391 (0.196)	Top-5 acc 0.391 (0.991)	lr 0.05000
Warmup Train [1][650/3239]	Time 0.690 (0.573)	Data 0.001 (0.029)	Loss 6.6257 (6.6841)	Top-1 acc 0.000 (0.194)	Top-5 acc 1.953 (0.992)	lr 0.05000
Warmup Train [1][660/3239]	Time 0.570 (0.572)	Data 0.002 (0.029)	Loss 6.6559 (6.6837)	Top-1 acc 0.000 (0.194)	Top-5 acc 0.391 (0.998)	lr 0.05000
Warmup Train [1][670/3239]	Time 0.481 (0.571)	Data 0.002 (0.028)	Loss 6.6341 (6.6835)	Top-1 acc 0.391 (0.196)	Top-5 acc 0.391 (0.996)	lr 0.05000
Warmup Train [1][680/3239]	Time 0.612 (0.571)	Data 0.001 (0.028)	Loss 6.6544 (6.6832)	Top-1 acc 0.000 (0.198)	Top-5 acc 1.172 (0.999)	lr 0.05000
Warmup Train [1][690/3239]	Time 0.537 (0.570)	Data 0.002 (0.028)	Loss 6.6015 (6.6827)	Top-1 acc 0.391 (0.201)	Top-5 acc 1.562 (1.004)	lr 0.05000
Warmup Train [1][700/3239]	Time 0.748 (0.570)	Data 0.001 (0.027)	Loss 6.6033 (6.6823)	Top-1 acc 0.391 (0.201)	Top-5 acc 1.172 (1.007)	lr 0.05000
Warmup Train [1][710/3239]	Time 0.328 (0.569)	Data 0.001 (0.027)	Loss 6.7269 (6.6820)	Top-1 acc 0.391 (0.203)	Top-5 acc 0.391 (1.011)	lr 0.05000
Warmup Train [1][720/3239]	Time 0.607 (0.568)	Data 0.001 (0.027)	Loss 6.6616 (6.6816)	Top-1 acc 0.000 (0.203)	Top-5 acc 1.953 (1.012)	lr 0.05000
Warmup Train [1][730/3239]	Time 0.524 (0.568)	Data 0.035 (0.027)	Loss 6.6184 (6.6812)	Top-1 acc 0.391 (0.200)	Top-5 acc 0.391 (1.007)	lr 0.05000
Warmup Train [1][740/3239]	Time 0.492 (0.567)	Data 0.001 (0.026)	Loss 6.6367 (6.6809)	Top-1 acc 0.000 (0.200)	Top-5 acc 1.172 (1.010)	lr 0.05000
Warmup Train [1][750/3239]	Time 0.426 (0.567)	Data 0.001 (0.026)	Loss 6.6817 (6.6806)	Top-1 acc 0.000 (0.201)	Top-5 acc 0.781 (1.008)	lr 0.05000
Warmup Train [1][760/3239]	Time 0.490 (0.566)	Data 0.001 (0.026)	Loss 6.6747 (6.6803)	Top-1 acc 0.000 (0.202)	Top-5 acc 0.781 (1.011)	lr 0.05000
Warmup Train [1][770/3239]	Time 0.599 (0.565)	Data 0.001 (0.026)	Loss 6.6618 (6.6799)	Top-1 acc 0.000 (0.204)	Top-5 acc 0.781 (1.014)	lr 0.05000
Warmup Train [1][780/3239]	Time 0.498 (0.565)	Data 0.002 (0.025)	Loss 6.6779 (6.6795)	Top-1 acc 0.000 (0.206)	Top-5 acc 1.172 (1.018)	lr 0.05000
Warmup Train [1][790/3239]	Time 0.524 (0.564)	Data 0.001 (0.025)	Loss 6.6643 (6.6792)	Top-1 acc 0.391 (0.206)	Top-5 acc 0.391 (1.018)	lr 0.05000
Warmup Train [1][800/3239]	Time 0.376 (0.563)	Data 0.001 (0.025)	Loss 6.6419 (6.6789)	Top-1 acc 0.000 (0.206)	Top-5 acc 1.562 (1.020)	lr 0.05000
Warmup Train [1][810/3239]	Time 0.547 (0.562)	Data 0.001 (0.025)	Loss 6.6394 (6.6786)	Top-1 acc 0.000 (0.206)	Top-5 acc 0.781 (1.022)	lr 0.05000
Warmup Train [1][820/3239]	Time 0.454 (0.562)	Data 0.001 (0.024)	Loss 6.6571 (6.6784)	Top-1 acc 0.000 (0.205)	Top-5 acc 0.391 (1.021)	lr 0.05000
Warmup Train [1][830/3239]	Time 0.516 (0.561)	Data 0.001 (0.024)	Loss 6.6855 (6.6783)	Top-1 acc 0.000 (0.207)	Top-5 acc 0.391 (1.021)	lr 0.04999
Warmup Train [1][840/3239]	Time 0.598 (0.561)	Data 0.001 (0.024)	Loss 6.6764 (6.6779)	Top-1 acc 0.000 (0.207)	Top-5 acc 1.172 (1.025)	lr 0.04999
Warmup Train [1][850/3239]	Time 0.630 (0.560)	Data 0.003 (0.024)	Loss 6.6721 (6.6774)	Top-1 acc 0.000 (0.208)	Top-5 acc 0.391 (1.025)	lr 0.04999
Warmup Train [1][860/3239]	Time 0.621 (0.559)	Data 0.001 (0.024)	Loss 6.6831 (6.6772)	Top-1 acc 0.000 (0.208)	Top-5 acc 0.391 (1.026)	lr 0.04999
Warmup Train [1][870/3239]	Time 0.509 (0.559)	Data 0.001 (0.023)	Loss 6.6471 (6.6771)	Top-1 acc 0.391 (0.208)	Top-5 acc 0.781 (1.023)	lr 0.04999
Warmup Train [1][880/3239]	Time 0.435 (0.558)	Data 0.001 (0.023)	Loss 6.6559 (6.6768)	Top-1 acc 0.391 (0.208)	Top-5 acc 0.781 (1.025)	lr 0.04999
Warmup Train [1][890/3239]	Time 0.589 (0.557)	Data 0.001 (0.023)	Loss 6.6559 (6.6766)	Top-1 acc 0.391 (0.210)	Top-5 acc 0.781 (1.025)	lr 0.04999
Warmup Train [1][900/3239]	Time 0.375 (0.556)	Data 0.001 (0.023)	Loss 6.6642 (6.6762)	Top-1 acc 0.391 (0.212)	Top-5 acc 1.172 (1.028)	lr 0.04999
Warmup Train [1][910/3239]	Time 0.368 (0.555)	Data 0.001 (0.023)	Loss 6.6288 (6.6760)	Top-1 acc 0.781 (0.214)	Top-5 acc 2.344 (1.032)	lr 0.04999
Warmup Train [1][920/3239]	Time 0.469 (0.555)	Data 0.001 (0.023)	Loss 6.6281 (6.6756)	Top-1 acc 0.000 (0.214)	Top-5 acc 2.344 (1.035)	lr 0.04999
Warmup Train [1][930/3239]	Time 0.501 (0.555)	Data 0.001 (0.022)	Loss 6.6241 (6.6754)	Top-1 acc 0.391 (0.214)	Top-5 acc 1.562 (1.036)	lr 0.04999
Warmup Train [1][940/3239]	Time 0.537 (0.554)	Data 0.001 (0.022)	Loss 6.6720 (6.6750)	Top-1 acc 0.000 (0.214)	Top-5 acc 0.391 (1.033)	lr 0.04999
Warmup Train [1][950/3239]	Time 0.540 (0.554)	Data 0.001 (0.022)	Loss 6.6552 (6.6747)	Top-1 acc 0.781 (0.216)	Top-5 acc 1.562 (1.035)	lr 0.04999
Warmup Train [1][960/3239]	Time 0.563 (0.553)	Data 0.001 (0.022)	Loss 6.6523 (6.6744)	Top-1 acc 0.391 (0.215)	Top-5 acc 0.781 (1.036)	lr 0.04999
Warmup Train [1][970/3239]	Time 0.507 (0.553)	Data 0.001 (0.022)	Loss 6.6134 (6.6740)	Top-1 acc 0.781 (0.217)	Top-5 acc 1.562 (1.044)	lr 0.04999
Warmup Train [1][980/3239]	Time 0.495 (0.552)	Data 0.001 (0.022)	Loss 6.6746 (6.6738)	Top-1 acc 0.000 (0.217)	Top-5 acc 0.781 (1.046)	lr 0.04999
Warmup Train [1][990/3239]	Time 0.551 (0.552)	Data 0.001 (0.021)	Loss 6.6127 (6.6735)	Top-1 acc 0.391 (0.217)	Top-5 acc 0.781 (1.044)	lr 0.04999
Warmup Train [1][1000/3239]	Time 0.424 (0.551)	Data 0.001 (0.021)	Loss 6.6424 (6.6731)	Top-1 acc 0.000 (0.217)	Top-5 acc 0.781 (1.047)	lr 0.04999
Warmup Train [1][1010/3239]	Time 0.628 (0.551)	Data 0.001 (0.021)	Loss 6.6249 (6.6727)	Top-1 acc 0.000 (0.218)	Top-5 acc 1.172 (1.050)	lr 0.04999
Warmup Train [1][1020/3239]	Time 0.523 (0.550)	Data 0.001 (0.021)	Loss 6.6188 (6.6724)	Top-1 acc 0.000 (0.217)	Top-5 acc 0.000 (1.050)	lr 0.04999
Warmup Train [1][1030/3239]	Time 0.587 (0.550)	Data 0.001 (0.021)	Loss 6.6401 (6.6722)	Top-1 acc 0.391 (0.216)	Top-5 acc 0.781 (1.049)	lr 0.04999
Warmup Train [1][1040/3239]	Time 0.670 (0.550)	Data 0.001 (0.021)	Loss 6.6595 (6.6719)	Top-1 acc 0.391 (0.215)	Top-5 acc 0.781 (1.048)	lr 0.04999
Warmup Train [1][1050/3239]	Time 0.484 (0.549)	Data 0.001 (0.021)	Loss 6.6597 (6.6716)	Top-1 acc 0.000 (0.215)	Top-5 acc 1.172 (1.049)	lr 0.04999
Warmup Train [1][1060/3239]	Time 0.430 (0.549)	Data 0.002 (0.020)	Loss 6.6316 (6.6712)	Top-1 acc 0.000 (0.217)	Top-5 acc 1.953 (1.057)	lr 0.04999
Warmup Train [1][1070/3239]	Time 0.478 (0.548)	Data 0.001 (0.020)	Loss 6.6454 (6.6709)	Top-1 acc 0.781 (0.217)	Top-5 acc 1.172 (1.057)	lr 0.04999
Warmup Train [1][1080/3239]	Time 0.520 (0.548)	Data 0.001 (0.020)	Loss 6.6299 (6.6706)	Top-1 acc 0.000 (0.216)	Top-5 acc 0.781 (1.059)	lr 0.04999
Warmup Train [1][1090/3239]	Time 0.437 (0.548)	Data 0.001 (0.020)	Loss 6.6468 (6.6703)	Top-1 acc 0.000 (0.217)	Top-5 acc 1.172 (1.061)	lr 0.04999
Warmup Train [1][1100/3239]	Time 0.593 (0.547)	Data 0.001 (0.020)	Loss 6.6285 (6.6702)	Top-1 acc 0.000 (0.216)	Top-5 acc 1.562 (1.060)	lr 0.04999
Warmup Train [1][1110/3239]	Time 0.597 (0.547)	Data 0.001 (0.020)	Loss 6.6663 (6.6700)	Top-1 acc 0.391 (0.217)	Top-5 acc 1.172 (1.060)	lr 0.04999
Warmup Train [1][1120/3239]	Time 0.472 (0.547)	Data 0.001 (0.020)	Loss 6.6925 (6.6696)	Top-1 acc 0.000 (0.218)	Top-5 acc 1.172 (1.061)	lr 0.04999
Warmup Train [1][1130/3239]	Time 0.646 (0.546)	Data 0.001 (0.020)	Loss 6.6938 (6.6694)	Top-1 acc 0.781 (0.220)	Top-5 acc 1.953 (1.062)	lr 0.04999
Warmup Train [1][1140/3239]	Time 0.170 (0.546)	Data 0.001 (0.019)	Loss 6.6641 (6.6692)	Top-1 acc 0.781 (0.220)	Top-5 acc 1.562 (1.061)	lr 0.04999
Warmup Train [1][1150/3239]	Time 0.434 (0.545)	Data 0.001 (0.019)	Loss 6.6159 (6.6689)	Top-1 acc 0.391 (0.221)	Top-5 acc 0.781 (1.062)	lr 0.04999
Warmup Train [1][1160/3239]	Time 0.628 (0.545)	Data 0.001 (0.019)	Loss 6.6302 (6.6686)	Top-1 acc 0.391 (0.222)	Top-5 acc 0.781 (1.063)	lr 0.04999
Warmup Train [1][1170/3239]	Time 0.477 (0.544)	Data 0.001 (0.019)	Loss 6.5892 (6.6682)	Top-1 acc 0.391 (0.222)	Top-5 acc 1.953 (1.066)	lr 0.04999
Warmup Train [1][1180/3239]	Time 0.665 (0.543)	Data 0.001 (0.019)	Loss 6.6934 (6.6681)	Top-1 acc 0.000 (0.223)	Top-5 acc 1.172 (1.065)	lr 0.04999
Warmup Train [1][1190/3239]	Time 0.527 (0.543)	Data 0.001 (0.019)	Loss 6.6408 (6.6679)	Top-1 acc 0.000 (0.222)	Top-5 acc 1.562 (1.067)	lr 0.04999
Warmup Train [1][1200/3239]	Time 0.605 (0.543)	Data 0.001 (0.019)	Loss 6.6758 (6.6676)	Top-1 acc 0.391 (0.221)	Top-5 acc 1.172 (1.069)	lr 0.04999
Warmup Train [1][1210/3239]	Time 0.448 (0.542)	Data 0.001 (0.019)	Loss 6.5983 (6.6673)	Top-1 acc 0.391 (0.221)	Top-5 acc 0.391 (1.070)	lr 0.04999
Warmup Train [1][1220/3239]	Time 0.641 (0.542)	Data 0.001 (0.019)	Loss 6.6558 (6.6670)	Top-1 acc 0.391 (0.222)	Top-5 acc 1.953 (1.074)	lr 0.04999
Warmup Train [1][1230/3239]	Time 0.733 (0.542)	Data 0.002 (0.018)	Loss 6.6086 (6.6666)	Top-1 acc 0.781 (0.223)	Top-5 acc 1.172 (1.075)	lr 0.04999
Warmup Train [1][1240/3239]	Time 0.605 (0.542)	Data 0.003 (0.018)	Loss 6.6101 (6.6663)	Top-1 acc 0.781 (0.222)	Top-5 acc 1.562 (1.074)	lr 0.04999
Warmup Train [1][1250/3239]	Time 0.504 (0.541)	Data 0.001 (0.018)	Loss 6.6460 (6.6661)	Top-1 acc 0.000 (0.223)	Top-5 acc 0.391 (1.075)	lr 0.04999
Warmup Train [1][1260/3239]	Time 0.446 (0.541)	Data 0.001 (0.018)	Loss 6.6126 (6.6659)	Top-1 acc 0.391 (0.223)	Top-5 acc 1.562 (1.080)	lr 0.04999
Warmup Train [1][1270/3239]	Time 0.584 (0.541)	Data 0.001 (0.018)	Loss 6.6514 (6.6657)	Top-1 acc 0.000 (0.224)	Top-5 acc 1.172 (1.082)	lr 0.04999
Warmup Train [1][1280/3239]	Time 0.528 (0.541)	Data 0.001 (0.018)	Loss 6.6531 (6.6654)	Top-1 acc 0.000 (0.225)	Top-5 acc 0.781 (1.084)	lr 0.04999
Warmup Train [1][1290/3239]	Time 0.374 (0.540)	Data 0.001 (0.018)	Loss 6.5852 (6.6651)	Top-1 acc 0.391 (0.225)	Top-5 acc 2.344 (1.085)	lr 0.04999
Warmup Train [1][1300/3239]	Time 0.485 (0.540)	Data 0.002 (0.018)	Loss 6.5903 (6.6648)	Top-1 acc 1.172 (0.225)	Top-5 acc 2.734 (1.088)	lr 0.04999
Warmup Train [1][1310/3239]	Time 0.512 (0.540)	Data 0.001 (0.018)	Loss 6.6457 (6.6647)	Top-1 acc 0.781 (0.227)	Top-5 acc 0.781 (1.088)	lr 0.04999
Warmup Train [1][1320/3239]	Time 0.599 (0.540)	Data 0.001 (0.018)	Loss 6.6545 (6.6644)	Top-1 acc 0.781 (0.227)	Top-5 acc 1.562 (1.088)	lr 0.04999
Warmup Train [1][1330/3239]	Time 0.333 (0.540)	Data 0.001 (0.017)	Loss 6.6287 (6.6641)	Top-1 acc 0.000 (0.227)	Top-5 acc 0.781 (1.089)	lr 0.04999
Warmup Train [1][1340/3239]	Time 0.595 (0.540)	Data 0.001 (0.017)	Loss 6.6186 (6.6637)	Top-1 acc 0.391 (0.228)	Top-5 acc 0.781 (1.093)	lr 0.04999
Warmup Train [1][1350/3239]	Time 0.460 (0.540)	Data 0.001 (0.017)	Loss 6.6599 (6.6636)	Top-1 acc 0.391 (0.228)	Top-5 acc 1.172 (1.092)	lr 0.04999
Warmup Train [1][1360/3239]	Time 0.351 (0.539)	Data 0.001 (0.017)	Loss 6.6434 (6.6633)	Top-1 acc 0.781 (0.230)	Top-5 acc 1.562 (1.093)	lr 0.04999
Warmup Train [1][1370/3239]	Time 0.557 (0.539)	Data 0.001 (0.017)	Loss 6.6476 (6.6632)	Top-1 acc 0.000 (0.229)	Top-5 acc 1.172 (1.092)	lr 0.04999
Warmup Train [1][1380/3239]	Time 0.201 (0.539)	Data 0.001 (0.017)	Loss 6.6131 (6.6629)	Top-1 acc 0.000 (0.229)	Top-5 acc 0.391 (1.094)	lr 0.04999
Warmup Train [1][1390/3239]	Time 0.664 (0.539)	Data 0.001 (0.017)	Loss 6.6120 (6.6627)	Top-1 acc 0.391 (0.230)	Top-5 acc 1.562 (1.094)	lr 0.04999
Warmup Train [1][1400/3239]	Time 0.437 (0.538)	Data 0.001 (0.017)	Loss 6.6676 (6.6624)	Top-1 acc 0.391 (0.231)	Top-5 acc 1.562 (1.095)	lr 0.04999
Warmup Train [1][1410/3239]	Time 0.458 (0.538)	Data 0.001 (0.017)	Loss 6.6527 (6.6622)	Top-1 acc 0.000 (0.230)	Top-5 acc 0.781 (1.094)	lr 0.04999
Warmup Train [1][1420/3239]	Time 0.369 (0.538)	Data 0.001 (0.017)	Loss 6.6108 (6.6619)	Top-1 acc 0.781 (0.231)	Top-5 acc 1.562 (1.097)	lr 0.04999
Warmup Train [1][1430/3239]	Time 0.482 (0.538)	Data 0.001 (0.017)	Loss 6.6344 (6.6617)	Top-1 acc 0.000 (0.231)	Top-5 acc 0.391 (1.096)	lr 0.04998
Warmup Train [1][1440/3239]	Time 0.432 (0.537)	Data 0.002 (0.017)	Loss 6.6313 (6.6614)	Top-1 acc 0.391 (0.231)	Top-5 acc 1.562 (1.097)	lr 0.04998
Warmup Train [1][1450/3239]	Time 0.485 (0.537)	Data 0.001 (0.017)	Loss 6.6169 (6.6611)	Top-1 acc 0.391 (0.232)	Top-5 acc 1.562 (1.098)	lr 0.04998
Warmup Train [1][1460/3239]	Time 0.276 (0.537)	Data 0.001 (0.017)	Loss 6.6158 (6.6609)	Top-1 acc 0.000 (0.232)	Top-5 acc 1.172 (1.100)	lr 0.04998
Warmup Train [1][1470/3239]	Time 0.564 (0.537)	Data 0.001 (0.017)	Loss 6.6461 (6.6607)	Top-1 acc 0.000 (0.231)	Top-5 acc 1.172 (1.100)	lr 0.04998
Warmup Train [1][1480/3239]	Time 0.608 (0.536)	Data 0.001 (0.016)	Loss 6.6005 (6.6605)	Top-1 acc 0.000 (0.231)	Top-5 acc 1.562 (1.101)	lr 0.04998
Warmup Train [1][1490/3239]	Time 0.547 (0.536)	Data 0.001 (0.016)	Loss 6.6868 (6.6601)	Top-1 acc 0.000 (0.231)	Top-5 acc 0.391 (1.102)	lr 0.04998
Warmup Train [1][1500/3239]	Time 0.493 (0.536)	Data 0.001 (0.016)	Loss 6.5971 (6.6599)	Top-1 acc 0.000 (0.232)	Top-5 acc 1.562 (1.105)	lr 0.04998
Warmup Train [1][1510/3239]	Time 0.603 (0.536)	Data 0.001 (0.016)	Loss 6.6114 (6.6596)	Top-1 acc 0.000 (0.232)	Top-5 acc 0.391 (1.104)	lr 0.04998
Warmup Train [1][1520/3239]	Time 0.543 (0.536)	Data 0.001 (0.016)	Loss 6.6052 (6.6594)	Top-1 acc 0.000 (0.232)	Top-5 acc 0.781 (1.103)	lr 0.04998
Warmup Train [1][1530/3239]	Time 0.503 (0.536)	Data 0.001 (0.016)	Loss 6.6627 (6.6592)	Top-1 acc 0.000 (0.233)	Top-5 acc 1.172 (1.107)	lr 0.04998
Warmup Train [1][1540/3239]	Time 0.504 (0.536)	Data 0.001 (0.016)	Loss 6.6323 (6.6589)	Top-1 acc 0.391 (0.233)	Top-5 acc 0.781 (1.109)	lr 0.04998
Warmup Train [1][1550/3239]	Time 0.541 (0.536)	Data 0.001 (0.016)	Loss 6.6173 (6.6587)	Top-1 acc 0.000 (0.233)	Top-5 acc 2.344 (1.112)	lr 0.04998
Warmup Train [1][1560/3239]	Time 0.581 (0.535)	Data 0.002 (0.016)	Loss 6.6172 (6.6585)	Top-1 acc 0.781 (0.234)	Top-5 acc 1.172 (1.111)	lr 0.04998
Warmup Train [1][1570/3239]	Time 0.545 (0.535)	Data 0.001 (0.016)	Loss 6.5939 (6.6582)	Top-1 acc 0.000 (0.235)	Top-5 acc 0.391 (1.112)	lr 0.04998
Warmup Train [1][1580/3239]	Time 0.548 (0.535)	Data 0.001 (0.016)	Loss 6.6156 (6.6581)	Top-1 acc 0.000 (0.236)	Top-5 acc 0.781 (1.114)	lr 0.04998
Warmup Train [1][1590/3239]	Time 0.352 (0.535)	Data 0.001 (0.016)	Loss 6.6494 (6.6578)	Top-1 acc 0.000 (0.236)	Top-5 acc 1.172 (1.116)	lr 0.04998
Warmup Train [1][1600/3239]	Time 0.452 (0.535)	Data 0.001 (0.016)	Loss 6.6114 (6.6575)	Top-1 acc 0.000 (0.236)	Top-5 acc 0.781 (1.117)	lr 0.04998
Warmup Train [1][1610/3239]	Time 0.591 (0.535)	Data 0.001 (0.015)	Loss 6.6305 (6.6573)	Top-1 acc 0.781 (0.237)	Top-5 acc 1.172 (1.119)	lr 0.04998
Warmup Train [1][1620/3239]	Time 0.559 (0.534)	Data 0.001 (0.015)	Loss 6.6167 (6.6570)	Top-1 acc 0.391 (0.237)	Top-5 acc 1.172 (1.121)	lr 0.04998
Warmup Train [1][1630/3239]	Time 0.521 (0.534)	Data 0.001 (0.015)	Loss 6.6186 (6.6567)	Top-1 acc 0.000 (0.238)	Top-5 acc 0.781 (1.124)	lr 0.04998
Warmup Train [1][1640/3239]	Time 0.628 (0.534)	Data 0.001 (0.015)	Loss 6.6055 (6.6566)	Top-1 acc 0.391 (0.238)	Top-5 acc 0.781 (1.124)	lr 0.04998
Warmup Train [1][1650/3239]	Time 0.543 (0.534)	Data 0.001 (0.015)	Loss 6.5960 (6.6562)	Top-1 acc 0.781 (0.238)	Top-5 acc 1.172 (1.127)	lr 0.04998
Warmup Train [1][1660/3239]	Time 0.450 (0.533)	Data 0.001 (0.015)	Loss 6.5947 (6.6560)	Top-1 acc 0.391 (0.239)	Top-5 acc 1.172 (1.129)	lr 0.04998
Warmup Train [1][1670/3239]	Time 0.575 (0.533)	Data 0.001 (0.015)	Loss 6.5837 (6.6558)	Top-1 acc 0.781 (0.239)	Top-5 acc 2.344 (1.131)	lr 0.04998
Warmup Train [1][1680/3239]	Time 0.192 (0.533)	Data 0.002 (0.015)	Loss 6.6041 (6.6555)	Top-1 acc 0.000 (0.239)	Top-5 acc 1.172 (1.133)	lr 0.04998
Warmup Train [1][1690/3239]	Time 0.502 (0.532)	Data 0.001 (0.015)	Loss 6.6209 (6.6553)	Top-1 acc 0.000 (0.240)	Top-5 acc 0.391 (1.134)	lr 0.04998
Warmup Train [1][1700/3239]	Time 0.546 (0.532)	Data 0.001 (0.015)	Loss 6.5967 (6.6550)	Top-1 acc 0.781 (0.240)	Top-5 acc 1.562 (1.132)	lr 0.04998
Warmup Train [1][1710/3239]	Time 0.581 (0.532)	Data 0.001 (0.015)	Loss 6.6225 (6.6548)	Top-1 acc 0.391 (0.240)	Top-5 acc 2.344 (1.133)	lr 0.04998
Warmup Train [1][1720/3239]	Time 0.566 (0.532)	Data 0.001 (0.015)	Loss 6.6182 (6.6545)	Top-1 acc 0.391 (0.242)	Top-5 acc 1.953 (1.135)	lr 0.04998
Warmup Train [1][1730/3239]	Time 0.571 (0.532)	Data 0.001 (0.015)	Loss 6.6062 (6.6542)	Top-1 acc 0.391 (0.242)	Top-5 acc 1.562 (1.138)	lr 0.04998
Warmup Train [1][1740/3239]	Time 0.472 (0.532)	Data 0.001 (0.015)	Loss 6.6001 (6.6540)	Top-1 acc 0.391 (0.243)	Top-5 acc 0.781 (1.139)	lr 0.04998
Warmup Train [1][1750/3239]	Time 0.609 (0.532)	Data 0.001 (0.015)	Loss 6.5769 (6.6537)	Top-1 acc 0.781 (0.243)	Top-5 acc 1.562 (1.139)	lr 0.04998
Warmup Train [1][1760/3239]	Time 0.558 (0.532)	Data 0.001 (0.015)	Loss 6.6243 (6.6535)	Top-1 acc 0.391 (0.243)	Top-5 acc 1.172 (1.141)	lr 0.04998
Warmup Train [1][1770/3239]	Time 0.525 (0.532)	Data 0.002 (0.014)	Loss 6.6173 (6.6533)	Top-1 acc 0.391 (0.244)	Top-5 acc 1.562 (1.144)	lr 0.04998
Warmup Train [1][1780/3239]	Time 0.495 (0.532)	Data 0.001 (0.014)	Loss 6.6320 (6.6529)	Top-1 acc 0.391 (0.245)	Top-5 acc 1.953 (1.148)	lr 0.04998
Warmup Train [1][1790/3239]	Time 0.484 (0.532)	Data 0.001 (0.014)	Loss 6.6208 (6.6527)	Top-1 acc 0.000 (0.244)	Top-5 acc 1.953 (1.147)	lr 0.04998
Warmup Train [1][1800/3239]	Time 0.547 (0.531)	Data 0.001 (0.014)	Loss 6.5734 (6.6524)	Top-1 acc 0.000 (0.244)	Top-5 acc 1.562 (1.148)	lr 0.04998
Warmup Train [1][1810/3239]	Time 0.513 (0.531)	Data 0.002 (0.014)	Loss 6.5773 (6.6522)	Top-1 acc 0.781 (0.245)	Top-5 acc 0.781 (1.149)	lr 0.04998
Warmup Train [1][1820/3239]	Time 0.479 (0.531)	Data 0.001 (0.014)	Loss 6.6067 (6.6520)	Top-1 acc 0.781 (0.246)	Top-5 acc 1.172 (1.150)	lr 0.04998
Warmup Train [1][1830/3239]	Time 0.411 (0.531)	Data 0.001 (0.014)	Loss 6.6647 (6.6518)	Top-1 acc 0.000 (0.246)	Top-5 acc 1.172 (1.152)	lr 0.04998
Warmup Train [1][1840/3239]	Time 0.589 (0.531)	Data 0.001 (0.014)	Loss 6.5904 (6.6516)	Top-1 acc 0.000 (0.245)	Top-5 acc 0.391 (1.153)	lr 0.04998
Warmup Train [1][1850/3239]	Time 0.355 (0.531)	Data 0.001 (0.014)	Loss 6.6217 (6.6514)	Top-1 acc 0.391 (0.245)	Top-5 acc 0.391 (1.152)	lr 0.04997
Warmup Train [1][1860/3239]	Time 0.486 (0.531)	Data 0.001 (0.014)	Loss 6.6091 (6.6511)	Top-1 acc 0.000 (0.245)	Top-5 acc 1.172 (1.154)	lr 0.04997
Warmup Train [1][1870/3239]	Time 0.506 (0.531)	Data 0.001 (0.014)	Loss 6.5853 (6.6509)	Top-1 acc 0.391 (0.246)	Top-5 acc 1.562 (1.155)	lr 0.04997
Warmup Train [1][1880/3239]	Time 0.514 (0.530)	Data 0.001 (0.014)	Loss 6.6132 (6.6508)	Top-1 acc 0.391 (0.247)	Top-5 acc 0.781 (1.156)	lr 0.04997
Warmup Train [1][1890/3239]	Time 0.564 (0.530)	Data 0.001 (0.014)	Loss 6.6062 (6.6505)	Top-1 acc 0.000 (0.247)	Top-5 acc 0.391 (1.157)	lr 0.04997
Warmup Train [1][1900/3239]	Time 0.515 (0.530)	Data 0.001 (0.014)	Loss 6.6082 (6.6503)	Top-1 acc 0.000 (0.248)	Top-5 acc 1.172 (1.157)	lr 0.04997
Warmup Train [1][1910/3239]	Time 0.312 (0.530)	Data 0.001 (0.014)	Loss 6.6101 (6.6500)	Top-1 acc 0.391 (0.248)	Top-5 acc 1.953 (1.156)	lr 0.04997
Warmup Train [1][1920/3239]	Time 0.577 (0.530)	Data 0.001 (0.014)	Loss 6.6121 (6.6498)	Top-1 acc 0.391 (0.248)	Top-5 acc 0.781 (1.158)	lr 0.04997
Warmup Train [1][1930/3239]	Time 0.567 (0.530)	Data 0.001 (0.014)	Loss 6.5767 (6.6496)	Top-1 acc 0.391 (0.248)	Top-5 acc 0.781 (1.157)	lr 0.04997
Warmup Train [1][1940/3239]	Time 0.580 (0.530)	Data 0.001 (0.014)	Loss 6.5683 (6.6494)	Top-1 acc 0.781 (0.248)	Top-5 acc 1.953 (1.157)	lr 0.04997
Warmup Train [1][1950/3239]	Time 0.631 (0.529)	Data 0.001 (0.014)	Loss 6.5826 (6.6492)	Top-1 acc 0.000 (0.249)	Top-5 acc 1.172 (1.157)	lr 0.04997
Warmup Train [1][1960/3239]	Time 0.543 (0.529)	Data 0.001 (0.014)	Loss 6.6083 (6.6489)	Top-1 acc 0.391 (0.249)	Top-5 acc 1.562 (1.158)	lr 0.04997
Warmup Train [1][1970/3239]	Time 0.519 (0.529)	Data 0.002 (0.014)	Loss 6.5856 (6.6486)	Top-1 acc 0.391 (0.250)	Top-5 acc 0.781 (1.161)	lr 0.04997
Warmup Train [1][1980/3239]	Time 0.415 (0.529)	Data 0.001 (0.014)	Loss 6.5889 (6.6484)	Top-1 acc 0.781 (0.250)	Top-5 acc 2.344 (1.164)	lr 0.04997
Warmup Train [1][1990/3239]	Time 0.549 (0.529)	Data 0.001 (0.014)	Loss 6.6588 (6.6482)	Top-1 acc 0.000 (0.250)	Top-5 acc 0.781 (1.163)	lr 0.04997
Warmup Train [1][2000/3239]	Time 0.529 (0.529)	Data 0.001 (0.014)	Loss 6.6238 (6.6480)	Top-1 acc 0.000 (0.249)	Top-5 acc 0.000 (1.165)	lr 0.04997
Warmup Train [1][2010/3239]	Time 0.468 (0.529)	Data 0.001 (0.013)	Loss 6.5937 (6.6478)	Top-1 acc 0.000 (0.249)	Top-5 acc 0.391 (1.166)	lr 0.04997
Warmup Train [1][2020/3239]	Time 0.582 (0.529)	Data 0.001 (0.013)	Loss 6.6059 (6.6476)	Top-1 acc 1.172 (0.249)	Top-5 acc 2.734 (1.167)	lr 0.04997
Warmup Train [1][2030/3239]	Time 0.498 (0.529)	Data 0.001 (0.013)	Loss 6.5801 (6.6473)	Top-1 acc 0.000 (0.248)	Top-5 acc 1.953 (1.167)	lr 0.04997
Warmup Train [1][2040/3239]	Time 0.557 (0.529)	Data 0.001 (0.013)	Loss 6.6228 (6.6472)	Top-1 acc 0.781 (0.248)	Top-5 acc 3.125 (1.169)	lr 0.04997
Warmup Train [1][2050/3239]	Time 0.685 (0.529)	Data 0.001 (0.013)	Loss 6.6300 (6.6469)	Top-1 acc 0.000 (0.249)	Top-5 acc 0.781 (1.170)	lr 0.04997
Warmup Train [1][2060/3239]	Time 0.345 (0.528)	Data 0.001 (0.013)	Loss 6.5863 (6.6467)	Top-1 acc 0.000 (0.249)	Top-5 acc 1.172 (1.172)	lr 0.04997
Warmup Train [1][2070/3239]	Time 0.504 (0.528)	Data 0.002 (0.013)	Loss 6.6363 (6.6465)	Top-1 acc 0.000 (0.249)	Top-5 acc 1.562 (1.173)	lr 0.04997
Warmup Train [1][2080/3239]	Time 0.378 (0.528)	Data 0.001 (0.013)	Loss 6.5878 (6.6463)	Top-1 acc 0.781 (0.250)	Top-5 acc 1.172 (1.175)	lr 0.04997
Warmup Train [1][2090/3239]	Time 0.419 (0.528)	Data 0.001 (0.013)	Loss 6.6007 (6.6461)	Top-1 acc 0.000 (0.250)	Top-5 acc 0.781 (1.176)	lr 0.04997
Warmup Train [1][2100/3239]	Time 0.530 (0.528)	Data 0.001 (0.013)	Loss 6.6080 (6.6460)	Top-1 acc 0.000 (0.250)	Top-5 acc 1.172 (1.178)	lr 0.04997
Warmup Train [1][2110/3239]	Time 0.597 (0.528)	Data 0.001 (0.013)	Loss 6.5771 (6.6457)	Top-1 acc 0.000 (0.250)	Top-5 acc 0.391 (1.179)	lr 0.04997
Warmup Train [1][2120/3239]	Time 0.443 (0.528)	Data 0.001 (0.013)	Loss 6.6072 (6.6455)	Top-1 acc 0.781 (0.251)	Top-5 acc 1.562 (1.182)	lr 0.04997
Warmup Train [1][2130/3239]	Time 0.482 (0.528)	Data 0.001 (0.013)	Loss 6.5856 (6.6452)	Top-1 acc 0.000 (0.251)	Top-5 acc 1.953 (1.183)	lr 0.04997
Warmup Train [1][2140/3239]	Time 0.539 (0.528)	Data 0.001 (0.013)	Loss 6.6393 (6.6450)	Top-1 acc 0.000 (0.251)	Top-5 acc 0.781 (1.184)	lr 0.04997
Warmup Train [1][2150/3239]	Time 0.575 (0.528)	Data 0.001 (0.013)	Loss 6.5820 (6.6449)	Top-1 acc 0.391 (0.251)	Top-5 acc 2.734 (1.185)	lr 0.04997
Warmup Train [1][2160/3239]	Time 0.478 (0.528)	Data 0.001 (0.013)	Loss 6.6016 (6.6447)	Top-1 acc 0.000 (0.252)	Top-5 acc 0.391 (1.185)	lr 0.04997
Warmup Train [1][2170/3239]	Time 0.565 (0.528)	Data 0.001 (0.013)	Loss 6.5998 (6.6444)	Top-1 acc 0.000 (0.251)	Top-5 acc 0.781 (1.185)	lr 0.04997
Warmup Train [1][2180/3239]	Time 0.449 (0.528)	Data 0.001 (0.013)	Loss 6.5979 (6.6442)	Top-1 acc 1.172 (0.251)	Top-5 acc 2.344 (1.187)	lr 0.04997
Warmup Train [1][2190/3239]	Time 0.572 (0.527)	Data 0.001 (0.013)	Loss 6.6825 (6.6440)	Top-1 acc 0.000 (0.252)	Top-5 acc 1.562 (1.189)	lr 0.04996
Warmup Train [1][2200/3239]	Time 0.514 (0.527)	Data 0.001 (0.013)	Loss 6.6071 (6.6438)	Top-1 acc 0.000 (0.252)	Top-5 acc 1.562 (1.191)	lr 0.04996
Warmup Train [1][2210/3239]	Time 0.647 (0.527)	Data 0.001 (0.013)	Loss 6.5980 (6.6435)	Top-1 acc 0.000 (0.252)	Top-5 acc 1.172 (1.194)	lr 0.04996
Warmup Train [1][2220/3239]	Time 0.597 (0.527)	Data 0.001 (0.013)	Loss 6.6496 (6.6434)	Top-1 acc 0.391 (0.253)	Top-5 acc 0.781 (1.195)	lr 0.04996
Warmup Train [1][2230/3239]	Time 0.554 (0.527)	Data 0.001 (0.013)	Loss 6.6031 (6.6432)	Top-1 acc 0.391 (0.253)	Top-5 acc 1.953 (1.196)	lr 0.04996
Warmup Train [1][2240/3239]	Time 0.634 (0.527)	Data 0.001 (0.013)	Loss 6.5688 (6.6429)	Top-1 acc 0.391 (0.253)	Top-5 acc 1.562 (1.199)	lr 0.04996
Warmup Train [1][2250/3239]	Time 0.564 (0.527)	Data 0.001 (0.013)	Loss 6.5954 (6.6427)	Top-1 acc 0.000 (0.253)	Top-5 acc 2.734 (1.199)	lr 0.04996
Warmup Train [1][2260/3239]	Time 0.509 (0.527)	Data 0.001 (0.013)	Loss 6.5885 (6.6425)	Top-1 acc 0.391 (0.253)	Top-5 acc 2.344 (1.200)	lr 0.04996
Warmup Train [1][2270/3239]	Time 0.449 (0.527)	Data 0.001 (0.013)	Loss 6.6100 (6.6424)	Top-1 acc 0.391 (0.253)	Top-5 acc 0.391 (1.200)	lr 0.04996
Warmup Train [1][2280/3239]	Time 0.549 (0.527)	Data 0.001 (0.013)	Loss 6.5927 (6.6421)	Top-1 acc 0.000 (0.253)	Top-5 acc 0.391 (1.200)	lr 0.04996
Warmup Train [1][2290/3239]	Time 0.375 (0.527)	Data 0.001 (0.012)	Loss 6.5703 (6.6419)	Top-1 acc 0.000 (0.253)	Top-5 acc 1.172 (1.202)	lr 0.04996
Warmup Train [1][2300/3239]	Time 0.510 (0.527)	Data 0.001 (0.012)	Loss 6.5983 (6.6416)	Top-1 acc 0.000 (0.253)	Top-5 acc 0.781 (1.202)	lr 0.04996
Warmup Train [1][2310/3239]	Time 0.348 (0.526)	Data 0.001 (0.012)	Loss 6.5912 (6.6414)	Top-1 acc 0.000 (0.254)	Top-5 acc 1.953 (1.203)	lr 0.04996
Warmup Train [1][2320/3239]	Time 0.566 (0.526)	Data 0.001 (0.012)	Loss 6.5741 (6.6412)	Top-1 acc 0.000 (0.254)	Top-5 acc 1.172 (1.205)	lr 0.04996
Warmup Train [1][2330/3239]	Time 0.616 (0.526)	Data 0.001 (0.012)	Loss 6.5910 (6.6410)	Top-1 acc 0.000 (0.254)	Top-5 acc 1.172 (1.204)	lr 0.04996
Warmup Train [1][2340/3239]	Time 0.612 (0.526)	Data 0.001 (0.012)	Loss 6.5647 (6.6408)	Top-1 acc 0.000 (0.254)	Top-5 acc 1.953 (1.205)	lr 0.04996
Warmup Train [1][2350/3239]	Time 0.642 (0.526)	Data 0.001 (0.012)	Loss 6.6165 (6.6406)	Top-1 acc 0.000 (0.254)	Top-5 acc 0.781 (1.205)	lr 0.04996
Warmup Train [1][2360/3239]	Time 0.466 (0.526)	Data 0.001 (0.012)	Loss 6.6223 (6.6404)	Top-1 acc 0.000 (0.254)	Top-5 acc 0.000 (1.205)	lr 0.04996
Warmup Train [1][2370/3239]	Time 0.436 (0.526)	Data 0.001 (0.012)	Loss 6.5769 (6.6402)	Top-1 acc 0.000 (0.254)	Top-5 acc 1.172 (1.204)	lr 0.04996
Warmup Train [1][2380/3239]	Time 0.516 (0.526)	Data 0.001 (0.012)	Loss 6.5706 (6.6399)	Top-1 acc 0.391 (0.255)	Top-5 acc 1.172 (1.206)	lr 0.04996
Warmup Train [1][2390/3239]	Time 0.540 (0.526)	Data 0.001 (0.012)	Loss 6.5920 (6.6397)	Top-1 acc 0.391 (0.255)	Top-5 acc 0.781 (1.208)	lr 0.04996
Warmup Train [1][2400/3239]	Time 0.589 (0.526)	Data 0.002 (0.012)	Loss 6.5428 (6.6395)	Top-1 acc 0.781 (0.255)	Top-5 acc 1.953 (1.208)	lr 0.04996
Warmup Train [1][2410/3239]	Time 0.432 (0.526)	Data 0.002 (0.012)	Loss 6.5207 (6.6392)	Top-1 acc 0.781 (0.256)	Top-5 acc 2.734 (1.210)	lr 0.04996
Warmup Train [1][2420/3239]	Time 0.386 (0.526)	Data 0.001 (0.012)	Loss 6.5784 (6.6389)	Top-1 acc 0.391 (0.256)	Top-5 acc 1.953 (1.211)	lr 0.04996
Warmup Train [1][2430/3239]	Time 0.381 (0.526)	Data 0.001 (0.012)	Loss 6.5354 (6.6387)	Top-1 acc 0.391 (0.257)	Top-5 acc 2.344 (1.212)	lr 0.04996
Warmup Train [1][2440/3239]	Time 0.552 (0.525)	Data 0.001 (0.012)	Loss 6.5706 (6.6386)	Top-1 acc 0.000 (0.257)	Top-5 acc 1.172 (1.212)	lr 0.04996
Warmup Train [1][2450/3239]	Time 0.559 (0.525)	Data 0.001 (0.012)	Loss 6.6118 (6.6383)	Top-1 acc 0.391 (0.258)	Top-5 acc 1.172 (1.215)	lr 0.04996
Warmup Train [1][2460/3239]	Time 0.526 (0.525)	Data 0.001 (0.012)	Loss 6.5696 (6.6381)	Top-1 acc 0.391 (0.257)	Top-5 acc 2.344 (1.216)	lr 0.04996
Warmup Train [1][2470/3239]	Time 0.530 (0.525)	Data 0.002 (0.012)	Loss 6.6058 (6.6379)	Top-1 acc 0.391 (0.257)	Top-5 acc 0.391 (1.218)	lr 0.04996
Warmup Train [1][2480/3239]	Time 0.521 (0.525)	Data 0.002 (0.012)	Loss 6.5747 (6.6377)	Top-1 acc 0.391 (0.258)	Top-5 acc 1.953 (1.220)	lr 0.04995
Warmup Train [1][2490/3239]	Time 0.353 (0.525)	Data 0.001 (0.012)	Loss 6.6371 (6.6375)	Top-1 acc 0.391 (0.258)	Top-5 acc 1.953 (1.221)	lr 0.04995
Warmup Train [1][2500/3239]	Time 0.490 (0.525)	Data 0.001 (0.012)	Loss 6.5588 (6.6372)	Top-1 acc 0.781 (0.259)	Top-5 acc 1.562 (1.222)	lr 0.04995
Warmup Train [1][2510/3239]	Time 0.520 (0.525)	Data 0.001 (0.012)	Loss 6.6172 (6.6370)	Top-1 acc 0.000 (0.258)	Top-5 acc 1.172 (1.224)	lr 0.04995
Warmup Train [1][2520/3239]	Time 0.533 (0.525)	Data 0.001 (0.012)	Loss 6.5539 (6.6367)	Top-1 acc 0.391 (0.260)	Top-5 acc 0.781 (1.225)	lr 0.04995
Warmup Train [1][2530/3239]	Time 0.503 (0.524)	Data 0.002 (0.012)	Loss 6.5640 (6.6365)	Top-1 acc 0.781 (0.260)	Top-5 acc 3.906 (1.228)	lr 0.04995
Warmup Train [1][2540/3239]	Time 0.474 (0.524)	Data 0.001 (0.012)	Loss 6.5853 (6.6363)	Top-1 acc 0.391 (0.260)	Top-5 acc 1.953 (1.228)	lr 0.04995
Warmup Train [1][2550/3239]	Time 0.653 (0.524)	Data 0.001 (0.012)	Loss 6.6099 (6.6361)	Top-1 acc 0.000 (0.260)	Top-5 acc 1.172 (1.229)	lr 0.04995
Warmup Train [1][2560/3239]	Time 0.626 (0.524)	Data 0.001 (0.012)	Loss 6.5837 (6.6359)	Top-1 acc 0.781 (0.261)	Top-5 acc 1.953 (1.232)	lr 0.04995
Warmup Train [1][2570/3239]	Time 0.502 (0.524)	Data 0.001 (0.012)	Loss 6.5936 (6.6358)	Top-1 acc 0.391 (0.261)	Top-5 acc 1.562 (1.232)	lr 0.04995
Warmup Train [1][2580/3239]	Time 0.597 (0.524)	Data 0.001 (0.012)	Loss 6.5945 (6.6355)	Top-1 acc 0.781 (0.261)	Top-5 acc 1.562 (1.233)	lr 0.04995
Warmup Train [1][2590/3239]	Time 0.434 (0.524)	Data 0.001 (0.012)	Loss 6.5635 (6.6353)	Top-1 acc 0.391 (0.261)	Top-5 acc 1.562 (1.234)	lr 0.04995
Warmup Train [1][2600/3239]	Time 0.536 (0.524)	Data 0.001 (0.012)	Loss 6.5800 (6.6351)	Top-1 acc 0.000 (0.261)	Top-5 acc 1.172 (1.235)	lr 0.04995
Warmup Train [1][2610/3239]	Time 0.509 (0.524)	Data 0.001 (0.012)	Loss 6.5927 (6.6349)	Top-1 acc 0.000 (0.260)	Top-5 acc 0.391 (1.235)	lr 0.04995
Warmup Train [1][2620/3239]	Time 0.363 (0.524)	Data 0.001 (0.012)	Loss 6.5754 (6.6347)	Top-1 acc 0.000 (0.260)	Top-5 acc 1.562 (1.236)	lr 0.04995
Warmup Train [1][2630/3239]	Time 0.344 (0.524)	Data 0.001 (0.012)	Loss 6.5684 (6.6345)	Top-1 acc 1.172 (0.261)	Top-5 acc 2.734 (1.238)	lr 0.04995
Warmup Train [1][2640/3239]	Time 0.528 (0.524)	Data 0.001 (0.012)	Loss 6.5899 (6.6343)	Top-1 acc 0.781 (0.260)	Top-5 acc 0.781 (1.237)	lr 0.04995
Warmup Train [1][2650/3239]	Time 0.563 (0.524)	Data 0.001 (0.012)	Loss 6.5659 (6.6340)	Top-1 acc 0.000 (0.260)	Top-5 acc 1.172 (1.239)	lr 0.04995
Warmup Train [1][2660/3239]	Time 0.406 (0.523)	Data 0.001 (0.012)	Loss 6.5838 (6.6339)	Top-1 acc 0.391 (0.261)	Top-5 acc 1.172 (1.240)	lr 0.04995
Warmup Train [1][2670/3239]	Time 0.525 (0.523)	Data 0.002 (0.012)	Loss 6.5563 (6.6337)	Top-1 acc 0.391 (0.261)	Top-5 acc 0.781 (1.241)	lr 0.04995
Warmup Train [1][2680/3239]	Time 0.579 (0.523)	Data 0.002 (0.012)	Loss 6.6099 (6.6334)	Top-1 acc 0.000 (0.261)	Top-5 acc 0.000 (1.241)	lr 0.04995
Warmup Train [1][2690/3239]	Time 0.589 (0.523)	Data 0.001 (0.012)	Loss 6.5698 (6.6332)	Top-1 acc 0.000 (0.261)	Top-5 acc 1.953 (1.242)	lr 0.04995
Warmup Train [1][2700/3239]	Time 0.579 (0.523)	Data 0.001 (0.012)	Loss 6.5748 (6.6329)	Top-1 acc 0.391 (0.262)	Top-5 acc 1.562 (1.246)	lr 0.04995
Warmup Train [1][2710/3239]	Time 0.567 (0.523)	Data 0.001 (0.012)	Loss 6.5831 (6.6327)	Top-1 acc 0.391 (0.262)	Top-5 acc 0.391 (1.247)	lr 0.04995
Warmup Train [1][2720/3239]	Time 0.521 (0.523)	Data 0.001 (0.012)	Loss 6.5853 (6.6325)	Top-1 acc 0.391 (0.262)	Top-5 acc 1.172 (1.247)	lr 0.04995
Warmup Train [1][2730/3239]	Time 0.653 (0.522)	Data 0.001 (0.012)	Loss 6.5778 (6.6323)	Top-1 acc 0.000 (0.262)	Top-5 acc 0.781 (1.247)	lr 0.04995
Warmup Train [1][2740/3239]	Time 0.544 (0.522)	Data 0.001 (0.012)	Loss 6.5520 (6.6321)	Top-1 acc 0.391 (0.262)	Top-5 acc 1.953 (1.247)	lr 0.04994
Warmup Train [1][2750/3239]	Time 0.514 (0.522)	Data 0.001 (0.012)	Loss 6.5735 (6.6319)	Top-1 acc 0.000 (0.263)	Top-5 acc 1.562 (1.249)	lr 0.04994
Warmup Train [1][2760/3239]	Time 0.543 (0.522)	Data 0.001 (0.012)	Loss 6.5461 (6.6317)	Top-1 acc 0.781 (0.263)	Top-5 acc 1.562 (1.249)	lr 0.04994
Warmup Train [1][2770/3239]	Time 0.547 (0.522)	Data 0.001 (0.011)	Loss 6.5537 (6.6315)	Top-1 acc 0.000 (0.264)	Top-5 acc 0.391 (1.251)	lr 0.04994
Warmup Train [1][2780/3239]	Time 0.421 (0.522)	Data 0.001 (0.011)	Loss 6.5950 (6.6313)	Top-1 acc 0.000 (0.263)	Top-5 acc 1.172 (1.251)	lr 0.04994
Warmup Train [1][2790/3239]	Time 0.423 (0.522)	Data 0.001 (0.011)	Loss 6.5693 (6.6311)	Top-1 acc 0.000 (0.263)	Top-5 acc 0.781 (1.251)	lr 0.04994
Warmup Train [1][2800/3239]	Time 0.665 (0.522)	Data 0.001 (0.011)	Loss 6.6003 (6.6309)	Top-1 acc 0.000 (0.263)	Top-5 acc 1.562 (1.251)	lr 0.04994
Warmup Train [1][2810/3239]	Time 0.420 (0.522)	Data 0.002 (0.011)	Loss 6.5636 (6.6308)	Top-1 acc 0.781 (0.263)	Top-5 acc 1.953 (1.252)	lr 0.04994
Warmup Train [1][2820/3239]	Time 0.368 (0.522)	Data 0.001 (0.011)	Loss 6.5449 (6.6306)	Top-1 acc 0.781 (0.263)	Top-5 acc 1.953 (1.252)	lr 0.04994
Warmup Train [1][2830/3239]	Time 0.424 (0.522)	Data 0.001 (0.011)	Loss 6.5812 (6.6304)	Top-1 acc 0.000 (0.263)	Top-5 acc 3.125 (1.255)	lr 0.04994
Warmup Train [1][2840/3239]	Time 0.382 (0.522)	Data 0.001 (0.011)	Loss 6.5997 (6.6302)	Top-1 acc 0.000 (0.264)	Top-5 acc 0.781 (1.256)	lr 0.04994
Warmup Train [1][2850/3239]	Time 0.544 (0.522)	Data 0.001 (0.011)	Loss 6.6099 (6.6300)	Top-1 acc 0.391 (0.263)	Top-5 acc 2.734 (1.257)	lr 0.04994
Warmup Train [1][2860/3239]	Time 0.465 (0.522)	Data 0.001 (0.011)	Loss 6.5757 (6.6298)	Top-1 acc 0.391 (0.263)	Top-5 acc 2.344 (1.257)	lr 0.04994
Warmup Train [1][2870/3239]	Time 0.573 (0.522)	Data 0.001 (0.011)	Loss 6.5859 (6.6296)	Top-1 acc 0.000 (0.263)	Top-5 acc 0.781 (1.259)	lr 0.04994
Warmup Train [1][2880/3239]	Time 0.651 (0.522)	Data 0.001 (0.011)	Loss 6.6090 (6.6295)	Top-1 acc 0.000 (0.263)	Top-5 acc 0.000 (1.259)	lr 0.04994
Warmup Train [1][2890/3239]	Time 0.306 (0.522)	Data 0.001 (0.011)	Loss 6.5547 (6.6293)	Top-1 acc 0.000 (0.263)	Top-5 acc 2.344 (1.261)	lr 0.04994
Warmup Train [1][2900/3239]	Time 0.489 (0.522)	Data 0.001 (0.011)	Loss 6.5610 (6.6291)	Top-1 acc 0.391 (0.263)	Top-5 acc 1.562 (1.262)	lr 0.04994
Warmup Train [1][2910/3239]	Time 0.464 (0.522)	Data 0.001 (0.011)	Loss 6.5479 (6.6289)	Top-1 acc 0.000 (0.263)	Top-5 acc 0.781 (1.262)	lr 0.04994
Warmup Train [1][2920/3239]	Time 0.464 (0.522)	Data 0.001 (0.011)	Loss 6.5653 (6.6288)	Top-1 acc 0.000 (0.263)	Top-5 acc 1.562 (1.263)	lr 0.04994
Warmup Train [1][2930/3239]	Time 0.517 (0.522)	Data 0.001 (0.011)	Loss 6.5378 (6.6286)	Top-1 acc 0.391 (0.263)	Top-5 acc 0.781 (1.262)	lr 0.04994
Warmup Train [1][2940/3239]	Time 0.681 (0.521)	Data 0.001 (0.011)	Loss 6.5850 (6.6284)	Top-1 acc 0.391 (0.263)	Top-5 acc 1.172 (1.262)	lr 0.04994
Warmup Train [1][2950/3239]	Time 0.617 (0.521)	Data 0.001 (0.011)	Loss 6.6075 (6.6283)	Top-1 acc 0.391 (0.263)	Top-5 acc 0.781 (1.262)	lr 0.04994
Warmup Train [1][2960/3239]	Time 0.480 (0.521)	Data 0.002 (0.011)	Loss 6.5680 (6.6281)	Top-1 acc 0.781 (0.263)	Top-5 acc 4.297 (1.263)	lr 0.04994
Warmup Train [1][2970/3239]	Time 0.454 (0.521)	Data 0.001 (0.011)	Loss 6.5011 (6.6279)	Top-1 acc 0.781 (0.263)	Top-5 acc 3.516 (1.264)	lr 0.04994
Warmup Train [1][2980/3239]	Time 0.526 (0.521)	Data 0.001 (0.011)	Loss 6.5644 (6.6276)	Top-1 acc 0.391 (0.264)	Top-5 acc 0.781 (1.265)	lr 0.04993
Warmup Train [1][2990/3239]	Time 0.559 (0.521)	Data 0.001 (0.011)	Loss 6.6224 (6.6275)	Top-1 acc 0.000 (0.263)	Top-5 acc 0.000 (1.265)	lr 0.04993
Warmup Train [1][3000/3239]	Time 0.520 (0.521)	Data 0.001 (0.011)	Loss 6.5631 (6.6273)	Top-1 acc 0.391 (0.263)	Top-5 acc 1.172 (1.265)	lr 0.04993
Warmup Train [1][3010/3239]	Time 0.327 (0.521)	Data 0.001 (0.011)	Loss 6.5583 (6.6270)	Top-1 acc 0.391 (0.263)	Top-5 acc 1.953 (1.265)	lr 0.04993
Warmup Train [1][3020/3239]	Time 0.491 (0.521)	Data 0.001 (0.011)	Loss 6.5386 (6.6269)	Top-1 acc 0.000 (0.263)	Top-5 acc 2.344 (1.265)	lr 0.04993
Warmup Train [1][3030/3239]	Time 0.567 (0.521)	Data 0.001 (0.011)	Loss 6.5169 (6.6267)	Top-1 acc 0.781 (0.263)	Top-5 acc 1.562 (1.266)	lr 0.04993
Warmup Train [1][3040/3239]	Time 0.454 (0.521)	Data 0.001 (0.011)	Loss 6.5499 (6.6265)	Top-1 acc 1.562 (0.264)	Top-5 acc 2.344 (1.268)	lr 0.04993
Warmup Train [1][3050/3239]	Time 0.463 (0.521)	Data 0.001 (0.011)	Loss 6.5283 (6.6263)	Top-1 acc 1.953 (0.265)	Top-5 acc 4.297 (1.269)	lr 0.04993
Warmup Train [1][3060/3239]	Time 0.402 (0.521)	Data 0.001 (0.011)	Loss 6.5519 (6.6261)	Top-1 acc 0.000 (0.265)	Top-5 acc 1.172 (1.270)	lr 0.04993
Warmup Train [1][3070/3239]	Time 0.457 (0.521)	Data 0.001 (0.011)	Loss 6.5933 (6.6259)	Top-1 acc 0.000 (0.265)	Top-5 acc 0.781 (1.272)	lr 0.04993
Warmup Train [1][3080/3239]	Time 0.492 (0.521)	Data 0.001 (0.011)	Loss 6.5502 (6.6257)	Top-1 acc 0.391 (0.265)	Top-5 acc 0.391 (1.272)	lr 0.04993
Warmup Train [1][3090/3239]	Time 0.330 (0.521)	Data 0.001 (0.011)	Loss 6.5829 (6.6255)	Top-1 acc 0.000 (0.266)	Top-5 acc 0.781 (1.273)	lr 0.04993
Warmup Train [1][3100/3239]	Time 0.687 (0.521)	Data 0.001 (0.011)	Loss 6.5371 (6.6253)	Top-1 acc 0.391 (0.266)	Top-5 acc 3.125 (1.274)	lr 0.04993
Warmup Train [1][3110/3239]	Time 0.434 (0.521)	Data 0.001 (0.011)	Loss 6.5647 (6.6252)	Top-1 acc 0.391 (0.266)	Top-5 acc 1.562 (1.275)	lr 0.04993
Warmup Train [1][3120/3239]	Time 0.485 (0.520)	Data 0.001 (0.011)	Loss 6.5598 (6.6250)	Top-1 acc 0.000 (0.266)	Top-5 acc 0.000 (1.275)	lr 0.04993
Warmup Train [1][3130/3239]	Time 0.619 (0.520)	Data 0.001 (0.011)	Loss 6.5832 (6.6248)	Top-1 acc 0.000 (0.266)	Top-5 acc 1.953 (1.275)	lr 0.04993
Warmup Train [1][3140/3239]	Time 0.336 (0.520)	Data 0.001 (0.011)	Loss 6.5491 (6.6246)	Top-1 acc 0.391 (0.266)	Top-5 acc 2.344 (1.277)	lr 0.04993
Warmup Train [1][3150/3239]	Time 0.560 (0.520)	Data 0.001 (0.011)	Loss 6.5276 (6.6244)	Top-1 acc 0.000 (0.266)	Top-5 acc 0.781 (1.278)	lr 0.04993
Warmup Train [1][3160/3239]	Time 0.386 (0.520)	Data 0.001 (0.011)	Loss 6.5475 (6.6242)	Top-1 acc 0.000 (0.266)	Top-5 acc 2.734 (1.280)	lr 0.04993
Warmup Train [1][3170/3239]	Time 0.620 (0.520)	Data 0.001 (0.011)	Loss 6.5540 (6.6240)	Top-1 acc 0.000 (0.267)	Top-5 acc 1.562 (1.280)	lr 0.04993
Warmup Train [1][3180/3239]	Time 0.561 (0.520)	Data 0.000 (0.011)	Loss 6.5563 (6.6238)	Top-1 acc 0.781 (0.267)	Top-5 acc 1.562 (1.282)	lr 0.04993
Warmup Train [1][3190/3239]	Time 0.525 (0.520)	Data 0.000 (0.011)	Loss 6.5956 (6.6237)	Top-1 acc 0.391 (0.267)	Top-5 acc 0.391 (1.282)	lr 0.04993
Warmup Train [1][3200/3239]	Time 0.583 (0.520)	Data 0.000 (0.011)	Loss 6.5794 (6.6235)	Top-1 acc 0.000 (0.267)	Top-5 acc 0.781 (1.283)	lr 0.04992
Warmup Train [1][3210/3239]	Time 0.515 (0.520)	Data 0.000 (0.011)	Loss 6.5604 (6.6233)	Top-1 acc 1.172 (0.268)	Top-5 acc 1.562 (1.283)	lr 0.04992
Warmup Train [1][3220/3239]	Time 0.421 (0.520)	Data 0.000 (0.011)	Loss 6.5507 (6.6231)	Top-1 acc 0.000 (0.268)	Top-5 acc 1.562 (1.284)	lr 0.04992
Warmup Train [1][3230/3239]	Time 0.393 (0.520)	Data 0.000 (0.011)	Loss 6.5837 (6.6230)	Top-1 acc 0.391 (0.268)	Top-5 acc 0.781 (1.284)	lr 0.04992
Warmup Train [1][3239/3239]	Time 2.110 (0.520)	Data 0.000 (0.011)	Loss 6.5695 (6.6228)	Top-1 acc 1.235 (0.269)	Top-5 acc 3.704 (1.286)	lr 0.04992
==========Warmup Valid [1/40]	loss 6.443	top-1 acc 0.409	top-5 acc 1.659	Train top-1 0.269	top-5 1.286	flops: 442.4M
Warmup Train [2][0/3239]	Time 8.185 (8.185)	Data 6.495 (6.495)	Loss 6.5368 (6.5368)	Top-1 acc 0.781 (0.781)	Top-5 acc 2.734 (2.734)	lr 0.04992
Warmup Train [2][10/3239]	Time 0.471 (1.259)	Data 0.001 (0.598)	Loss 6.5422 (6.5535)	Top-1 acc 0.000 (0.213)	Top-5 acc 1.953 (1.385)	lr 0.04992
Warmup Train [2][20/3239]	Time 0.456 (0.907)	Data 0.001 (0.314)	Loss 6.5323 (6.5583)	Top-1 acc 0.781 (0.242)	Top-5 acc 2.734 (1.544)	lr 0.04992
Warmup Train [2][30/3239]	Time 0.505 (0.781)	Data 0.001 (0.214)	Loss 6.6009 (6.5633)	Top-1 acc 0.000 (0.239)	Top-5 acc 0.781 (1.525)	lr 0.04992
Warmup Train [2][40/3239]	Time 0.379 (0.712)	Data 0.001 (0.163)	Loss 6.5695 (6.5644)	Top-1 acc 0.781 (0.286)	Top-5 acc 1.953 (1.543)	lr 0.04992
Warmup Train [2][50/3239]	Time 0.718 (0.676)	Data 0.001 (0.133)	Loss 6.5398 (6.5657)	Top-1 acc 0.391 (0.299)	Top-5 acc 1.172 (1.524)	lr 0.04992
Warmup Train [2][60/3239]	Time 0.366 (0.650)	Data 0.001 (0.112)	Loss 6.5608 (6.5641)	Top-1 acc 0.000 (0.295)	Top-5 acc 0.781 (1.511)	lr 0.04992
Warmup Train [2][70/3239]	Time 0.482 (0.631)	Data 0.001 (0.098)	Loss 6.5828 (6.5648)	Top-1 acc 0.391 (0.297)	Top-5 acc 0.781 (1.452)	lr 0.04992
Warmup Train [2][80/3239]	Time 0.595 (0.615)	Data 0.001 (0.086)	Loss 6.5522 (6.5645)	Top-1 acc 0.391 (0.304)	Top-5 acc 1.953 (1.471)	lr 0.04992
Warmup Train [2][90/3239]	Time 0.694 (0.603)	Data 0.001 (0.077)	Loss 6.5800 (6.5641)	Top-1 acc 0.391 (0.313)	Top-5 acc 1.172 (1.494)	lr 0.04992
Warmup Train [2][100/3239]	Time 0.485 (0.595)	Data 0.001 (0.070)	Loss 6.5406 (6.5626)	Top-1 acc 0.781 (0.325)	Top-5 acc 1.172 (1.520)	lr 0.04992
Warmup Train [2][110/3239]	Time 0.549 (0.589)	Data 0.001 (0.065)	Loss 6.5435 (6.5622)	Top-1 acc 0.391 (0.338)	Top-5 acc 1.562 (1.562)	lr 0.04992
Warmup Train [2][120/3239]	Time 0.515 (0.583)	Data 0.001 (0.059)	Loss 6.5373 (6.5614)	Top-1 acc 1.172 (0.362)	Top-5 acc 1.953 (1.579)	lr 0.04992
Warmup Train [2][130/3239]	Time 0.578 (0.578)	Data 0.001 (0.055)	Loss 6.5895 (6.5603)	Top-1 acc 0.781 (0.358)	Top-5 acc 1.562 (1.607)	lr 0.04992
Warmup Train [2][140/3239]	Time 0.424 (0.573)	Data 0.001 (0.052)	Loss 6.5536 (6.5600)	Top-1 acc 0.000 (0.363)	Top-5 acc 1.953 (1.632)	lr 0.04992
Warmup Train [2][150/3239]	Time 0.548 (0.571)	Data 0.001 (0.049)	Loss 6.5493 (6.5593)	Top-1 acc 0.391 (0.362)	Top-5 acc 1.172 (1.612)	lr 0.04992
Warmup Train [2][160/3239]	Time 0.363 (0.567)	Data 0.001 (0.047)	Loss 6.5511 (6.5590)	Top-1 acc 0.391 (0.357)	Top-5 acc 1.953 (1.630)	lr 0.04992
Warmup Train [2][170/3239]	Time 0.623 (0.564)	Data 0.001 (0.045)	Loss 6.5789 (6.5591)	Top-1 acc 0.781 (0.359)	Top-5 acc 2.344 (1.647)	lr 0.04991
Warmup Train [2][180/3239]	Time 0.472 (0.560)	Data 0.001 (0.043)	Loss 6.5460 (6.5591)	Top-1 acc 0.000 (0.352)	Top-5 acc 0.781 (1.616)	lr 0.04991
Warmup Train [2][190/3239]	Time 0.632 (0.558)	Data 0.001 (0.041)	Loss 6.5539 (6.5585)	Top-1 acc 0.781 (0.356)	Top-5 acc 1.562 (1.618)	lr 0.04991
Warmup Train [2][200/3239]	Time 0.598 (0.554)	Data 0.001 (0.039)	Loss 6.5684 (6.5587)	Top-1 acc 0.000 (0.344)	Top-5 acc 0.000 (1.599)	lr 0.04991
Warmup Train [2][210/3239]	Time 0.501 (0.551)	Data 0.001 (0.037)	Loss 6.5231 (6.5580)	Top-1 acc 0.000 (0.348)	Top-5 acc 1.562 (1.624)	lr 0.04991
Warmup Train [2][220/3239]	Time 0.587 (0.547)	Data 0.001 (0.036)	Loss 6.5825 (6.5576)	Top-1 acc 0.781 (0.354)	Top-5 acc 2.344 (1.624)	lr 0.04991
Warmup Train [2][230/3239]	Time 0.599 (0.546)	Data 0.001 (0.034)	Loss 6.5697 (6.5574)	Top-1 acc 1.562 (0.357)	Top-5 acc 2.344 (1.620)	lr 0.04991
Warmup Train [2][240/3239]	Time 0.491 (0.544)	Data 0.001 (0.033)	Loss 6.5440 (6.5573)	Top-1 acc 0.391 (0.370)	Top-5 acc 1.953 (1.635)	lr 0.04991
Warmup Train [2][250/3239]	Time 0.394 (0.543)	Data 0.001 (0.032)	Loss 6.5421 (6.5567)	Top-1 acc 0.000 (0.369)	Top-5 acc 1.172 (1.628)	lr 0.04991
Warmup Train [2][260/3239]	Time 0.542 (0.541)	Data 0.001 (0.031)	Loss 6.5822 (6.5567)	Top-1 acc 0.000 (0.373)	Top-5 acc 1.172 (1.643)	lr 0.04991
Warmup Train [2][270/3239]	Time 0.439 (0.540)	Data 0.001 (0.030)	Loss 6.5530 (6.5568)	Top-1 acc 0.000 (0.369)	Top-5 acc 0.391 (1.656)	lr 0.04991
Warmup Train [2][280/3239]	Time 0.465 (0.538)	Data 0.001 (0.030)	Loss 6.5109 (6.5566)	Top-1 acc 0.391 (0.361)	Top-5 acc 1.172 (1.645)	lr 0.04991
Warmup Train [2][290/3239]	Time 0.442 (0.537)	Data 0.001 (0.029)	Loss 6.5901 (6.5566)	Top-1 acc 0.781 (0.362)	Top-5 acc 0.781 (1.647)	lr 0.04991
Warmup Train [2][300/3239]	Time 0.605 (0.537)	Data 0.002 (0.028)	Loss 6.5231 (6.5563)	Top-1 acc 0.000 (0.362)	Top-5 acc 2.734 (1.670)	lr 0.04991
Warmup Train [2][310/3239]	Time 0.522 (0.537)	Data 0.001 (0.028)	Loss 6.5431 (6.5565)	Top-1 acc 0.391 (0.360)	Top-5 acc 2.344 (1.665)	lr 0.04991
Warmup Train [2][320/3239]	Time 0.574 (0.536)	Data 0.033 (0.027)	Loss 6.5709 (6.5568)	Top-1 acc 0.000 (0.360)	Top-5 acc 1.172 (1.665)	lr 0.04991
Warmup Train [2][330/3239]	Time 0.430 (0.535)	Data 0.001 (0.026)	Loss 6.5529 (6.5563)	Top-1 acc 0.391 (0.358)	Top-5 acc 1.953 (1.669)	lr 0.04991
Warmup Train [2][340/3239]	Time 0.684 (0.534)	Data 0.001 (0.026)	Loss 6.5851 (6.5561)	Top-1 acc 1.562 (0.363)	Top-5 acc 1.953 (1.678)	lr 0.04991
Warmup Train [2][350/3239]	Time 0.482 (0.534)	Data 0.001 (0.025)	Loss 6.5501 (6.5560)	Top-1 acc 0.391 (0.357)	Top-5 acc 1.172 (1.684)	lr 0.04991
Warmup Train [2][360/3239]	Time 0.471 (0.533)	Data 0.001 (0.025)	Loss 6.5577 (6.5562)	Top-1 acc 0.391 (0.357)	Top-5 acc 1.562 (1.677)	lr 0.04990
Warmup Train [2][370/3239]	Time 0.424 (0.532)	Data 0.001 (0.024)	Loss 6.5256 (6.5558)	Top-1 acc 0.391 (0.363)	Top-5 acc 2.344 (1.683)	lr 0.04990
Warmup Train [2][380/3239]	Time 0.489 (0.532)	Data 0.001 (0.024)	Loss 6.5381 (6.5561)	Top-1 acc 0.391 (0.360)	Top-5 acc 1.953 (1.677)	lr 0.04990
Warmup Train [2][390/3239]	Time 0.306 (0.531)	Data 0.001 (0.023)	Loss 6.5382 (6.5560)	Top-1 acc 1.172 (0.361)	Top-5 acc 1.953 (1.680)	lr 0.04990
Warmup Train [2][400/3239]	Time 0.552 (0.531)	Data 0.001 (0.023)	Loss 6.5662 (6.5559)	Top-1 acc 0.781 (0.361)	Top-5 acc 2.344 (1.678)	lr 0.04990
Warmup Train [2][410/3239]	Time 0.332 (0.531)	Data 0.001 (0.023)	Loss 6.5149 (6.5560)	Top-1 acc 0.781 (0.364)	Top-5 acc 2.734 (1.680)	lr 0.04990
Warmup Train [2][420/3239]	Time 0.641 (0.531)	Data 0.001 (0.022)	Loss 6.6088 (6.5560)	Top-1 acc 0.000 (0.361)	Top-5 acc 0.391 (1.674)	lr 0.04990
Warmup Train [2][430/3239]	Time 0.514 (0.530)	Data 0.001 (0.022)	Loss 6.5570 (6.5556)	Top-1 acc 0.000 (0.359)	Top-5 acc 3.906 (1.676)	lr 0.04990
Warmup Train [2][440/3239]	Time 0.490 (0.529)	Data 0.001 (0.021)	Loss 6.5784 (6.5554)	Top-1 acc 0.000 (0.357)	Top-5 acc 1.562 (1.677)	lr 0.04990
Warmup Train [2][450/3239]	Time 0.561 (0.529)	Data 0.001 (0.021)	Loss 6.4850 (6.5552)	Top-1 acc 0.391 (0.357)	Top-5 acc 1.953 (1.670)	lr 0.04990
Warmup Train [2][460/3239]	Time 0.344 (0.527)	Data 0.002 (0.021)	Loss 6.5217 (6.5550)	Top-1 acc 0.781 (0.357)	Top-5 acc 1.953 (1.668)	lr 0.04990
Warmup Train [2][470/3239]	Time 0.612 (0.526)	Data 0.001 (0.020)	Loss 6.5312 (6.5549)	Top-1 acc 0.391 (0.357)	Top-5 acc 2.734 (1.665)	lr 0.04990
Warmup Train [2][480/3239]	Time 0.323 (0.524)	Data 0.001 (0.020)	Loss 6.5332 (6.5546)	Top-1 acc 0.000 (0.359)	Top-5 acc 0.781 (1.666)	lr 0.04990
Warmup Train [2][490/3239]	Time 0.594 (0.524)	Data 0.001 (0.020)	Loss 6.5311 (6.5544)	Top-1 acc 0.000 (0.361)	Top-5 acc 1.953 (1.672)	lr 0.04990
Warmup Train [2][500/3239]	Time 0.469 (0.524)	Data 0.001 (0.020)	Loss 6.5697 (6.5538)	Top-1 acc 0.000 (0.361)	Top-5 acc 1.562 (1.680)	lr 0.04990
Warmup Train [2][510/3239]	Time 0.758 (0.524)	Data 0.001 (0.020)	Loss 6.4653 (6.5537)	Top-1 acc 0.391 (0.360)	Top-5 acc 2.734 (1.688)	lr 0.04990
Warmup Train [2][520/3239]	Time 0.541 (0.523)	Data 0.001 (0.019)	Loss 6.5781 (6.5538)	Top-1 acc 0.000 (0.358)	Top-5 acc 1.562 (1.681)	lr 0.04990
Warmup Train [2][530/3239]	Time 0.479 (0.523)	Data 0.001 (0.019)	Loss 6.5318 (6.5536)	Top-1 acc 0.391 (0.355)	Top-5 acc 2.734 (1.680)	lr 0.04990
Warmup Train [2][540/3239]	Time 0.526 (0.523)	Data 0.001 (0.019)	Loss 6.5841 (6.5535)	Top-1 acc 0.000 (0.353)	Top-5 acc 1.953 (1.683)	lr 0.04990
Warmup Train [2][550/3239]	Time 0.562 (0.523)	Data 0.001 (0.019)	Loss 6.5411 (6.5532)	Top-1 acc 0.391 (0.352)	Top-5 acc 2.734 (1.681)	lr 0.04989
Warmup Train [2][560/3239]	Time 0.556 (0.523)	Data 0.001 (0.018)	Loss 6.5071 (6.5529)	Top-1 acc 1.172 (0.354)	Top-5 acc 3.125 (1.679)	lr 0.04989
Warmup Train [2][570/3239]	Time 0.504 (0.523)	Data 0.001 (0.018)	Loss 6.5218 (6.5524)	Top-1 acc 1.172 (0.353)	Top-5 acc 2.734 (1.686)	lr 0.04989
Warmup Train [2][580/3239]	Time 0.563 (0.522)	Data 0.001 (0.018)	Loss 6.4826 (6.5520)	Top-1 acc 0.781 (0.354)	Top-5 acc 3.125 (1.686)	lr 0.04989
Warmup Train [2][590/3239]	Time 0.419 (0.522)	Data 0.001 (0.018)	Loss 6.5785 (6.5518)	Top-1 acc 0.000 (0.354)	Top-5 acc 1.562 (1.689)	lr 0.04989
Warmup Train [2][600/3239]	Time 0.397 (0.522)	Data 0.001 (0.017)	Loss 6.5191 (6.5516)	Top-1 acc 0.000 (0.352)	Top-5 acc 1.172 (1.697)	lr 0.04989
Warmup Train [2][610/3239]	Time 0.368 (0.522)	Data 0.001 (0.017)	Loss 6.5101 (6.5514)	Top-1 acc 0.391 (0.353)	Top-5 acc 2.734 (1.697)	lr 0.04989
Warmup Train [2][620/3239]	Time 0.507 (0.522)	Data 0.001 (0.017)	Loss 6.5242 (6.5513)	Top-1 acc 0.000 (0.354)	Top-5 acc 1.562 (1.700)	lr 0.04989
Warmup Train [2][630/3239]	Time 0.456 (0.522)	Data 0.001 (0.017)	Loss 6.5268 (6.5510)	Top-1 acc 1.562 (0.355)	Top-5 acc 3.516 (1.706)	lr 0.04989
Warmup Train [2][640/3239]	Time 0.532 (0.522)	Data 0.001 (0.017)	Loss 6.5368 (6.5506)	Top-1 acc 0.000 (0.354)	Top-5 acc 1.562 (1.707)	lr 0.04989
Warmup Train [2][650/3239]	Time 0.545 (0.522)	Data 0.001 (0.017)	Loss 6.4874 (6.5504)	Top-1 acc 0.781 (0.356)	Top-5 acc 2.734 (1.710)	lr 0.04989
Warmup Train [2][660/3239]	Time 0.678 (0.522)	Data 0.001 (0.017)	Loss 6.5349 (6.5502)	Top-1 acc 0.000 (0.354)	Top-5 acc 1.172 (1.711)	lr 0.04989
Warmup Train [2][670/3239]	Time 0.423 (0.522)	Data 0.002 (0.017)	Loss 6.5524 (6.5500)	Top-1 acc 0.000 (0.357)	Top-5 acc 0.391 (1.716)	lr 0.04989
Warmup Train [2][680/3239]	Time 0.526 (0.522)	Data 0.001 (0.017)	Loss 6.5567 (6.5497)	Top-1 acc 0.000 (0.359)	Top-5 acc 1.562 (1.721)	lr 0.04989
Warmup Train [2][690/3239]	Time 0.280 (0.521)	Data 0.001 (0.016)	Loss 6.5177 (6.5493)	Top-1 acc 1.172 (0.363)	Top-5 acc 2.734 (1.722)	lr 0.04989
Warmup Train [2][700/3239]	Time 0.562 (0.521)	Data 0.001 (0.016)	Loss 6.4914 (6.5491)	Top-1 acc 0.781 (0.361)	Top-5 acc 1.953 (1.716)	lr 0.04989
Warmup Train [2][710/3239]	Time 0.391 (0.521)	Data 0.001 (0.016)	Loss 6.5190 (6.5489)	Top-1 acc 0.781 (0.362)	Top-5 acc 3.125 (1.719)	lr 0.04989
Warmup Train [2][720/3239]	Time 0.522 (0.520)	Data 0.002 (0.016)	Loss 6.5100 (6.5487)	Top-1 acc 1.172 (0.362)	Top-5 acc 2.344 (1.713)	lr 0.04988
Warmup Train [2][730/3239]	Time 0.219 (0.519)	Data 0.001 (0.016)	Loss 6.4686 (6.5484)	Top-1 acc 0.000 (0.362)	Top-5 acc 1.172 (1.713)	lr 0.04988
Warmup Train [2][740/3239]	Time 0.557 (0.519)	Data 0.001 (0.016)	Loss 6.5233 (6.5482)	Top-1 acc 0.000 (0.364)	Top-5 acc 2.344 (1.717)	lr 0.04988
Warmup Train [2][750/3239]	Time 0.421 (0.519)	Data 0.001 (0.016)	Loss 6.6056 (6.5480)	Top-1 acc 0.000 (0.364)	Top-5 acc 0.781 (1.721)	lr 0.04988
Warmup Train [2][760/3239]	Time 0.582 (0.519)	Data 0.001 (0.016)	Loss 6.5362 (6.5479)	Top-1 acc 0.391 (0.365)	Top-5 acc 1.172 (1.728)	lr 0.04988
Warmup Train [2][770/3239]	Time 0.469 (0.519)	Data 0.001 (0.016)	Loss 6.5673 (6.5475)	Top-1 acc 0.000 (0.367)	Top-5 acc 2.344 (1.734)	lr 0.04988
Warmup Train [2][780/3239]	Time 0.426 (0.519)	Data 0.001 (0.015)	Loss 6.4926 (6.5470)	Top-1 acc 0.391 (0.368)	Top-5 acc 1.953 (1.739)	lr 0.04988
Warmup Train [2][790/3239]	Time 0.539 (0.519)	Data 0.001 (0.015)	Loss 6.5501 (6.5470)	Top-1 acc 0.391 (0.366)	Top-5 acc 0.781 (1.738)	lr 0.04988
Warmup Train [2][800/3239]	Time 0.489 (0.519)	Data 0.001 (0.015)	Loss 6.5316 (6.5467)	Top-1 acc 0.781 (0.368)	Top-5 acc 1.953 (1.740)	lr 0.04988
Warmup Train [2][810/3239]	Time 0.659 (0.519)	Data 0.001 (0.015)	Loss 6.5285 (6.5466)	Top-1 acc 0.391 (0.368)	Top-5 acc 2.344 (1.739)	lr 0.04988
Warmup Train [2][820/3239]	Time 0.511 (0.519)	Data 0.001 (0.015)	Loss 6.5566 (6.5465)	Top-1 acc 0.000 (0.366)	Top-5 acc 1.562 (1.737)	lr 0.04988
Warmup Train [2][830/3239]	Time 0.513 (0.518)	Data 0.001 (0.015)	Loss 6.5337 (6.5462)	Top-1 acc 0.391 (0.367)	Top-5 acc 1.562 (1.738)	lr 0.04988
Warmup Train [2][840/3239]	Time 0.549 (0.519)	Data 0.001 (0.015)	Loss 6.5663 (6.5461)	Top-1 acc 0.000 (0.367)	Top-5 acc 1.562 (1.739)	lr 0.04988
Warmup Train [2][850/3239]	Time 0.571 (0.518)	Data 0.001 (0.014)	Loss 6.5711 (6.5457)	Top-1 acc 0.391 (0.369)	Top-5 acc 1.562 (1.742)	lr 0.04988
Warmup Train [2][860/3239]	Time 0.534 (0.518)	Data 0.001 (0.014)	Loss 6.4749 (6.5455)	Top-1 acc 1.172 (0.371)	Top-5 acc 2.734 (1.744)	lr 0.04988
Warmup Train [2][870/3239]	Time 0.512 (0.519)	Data 0.001 (0.014)	Loss 6.5052 (6.5453)	Top-1 acc 0.391 (0.371)	Top-5 acc 1.172 (1.751)	lr 0.04988
Warmup Train [2][880/3239]	Time 0.621 (0.518)	Data 0.001 (0.014)	Loss 6.5172 (6.5450)	Top-1 acc 0.391 (0.372)	Top-5 acc 1.953 (1.750)	lr 0.04988
Warmup Train [2][890/3239]	Time 0.460 (0.518)	Data 0.001 (0.014)	Loss 6.5233 (6.5449)	Top-1 acc 1.172 (0.374)	Top-5 acc 3.516 (1.753)	lr 0.04987
Warmup Train [2][900/3239]	Time 0.542 (0.518)	Data 0.001 (0.014)	Loss 6.4477 (6.5446)	Top-1 acc 0.781 (0.375)	Top-5 acc 1.953 (1.756)	lr 0.04987
Warmup Train [2][910/3239]	Time 0.514 (0.518)	Data 0.001 (0.014)	Loss 6.5258 (6.5444)	Top-1 acc 0.000 (0.374)	Top-5 acc 1.172 (1.756)	lr 0.04987
Warmup Train [2][920/3239]	Time 0.538 (0.518)	Data 0.001 (0.014)	Loss 6.5528 (6.5441)	Top-1 acc 0.391 (0.376)	Top-5 acc 0.391 (1.755)	lr 0.04987
Warmup Train [2][930/3239]	Time 0.602 (0.518)	Data 0.001 (0.014)	Loss 6.6013 (6.5441)	Top-1 acc 0.000 (0.377)	Top-5 acc 1.172 (1.758)	lr 0.04987
Warmup Train [2][940/3239]	Time 0.466 (0.518)	Data 0.001 (0.014)	Loss 6.5461 (6.5441)	Top-1 acc 0.000 (0.377)	Top-5 acc 1.562 (1.761)	lr 0.04987
Warmup Train [2][950/3239]	Time 0.393 (0.518)	Data 0.001 (0.014)	Loss 6.5258 (6.5442)	Top-1 acc 0.000 (0.375)	Top-5 acc 1.562 (1.760)	lr 0.04987
Warmup Train [2][960/3239]	Time 0.550 (0.518)	Data 0.001 (0.014)	Loss 6.5007 (6.5441)	Top-1 acc 0.000 (0.376)	Top-5 acc 1.172 (1.758)	lr 0.04987
Warmup Train [2][970/3239]	Time 0.470 (0.517)	Data 0.001 (0.013)	Loss 6.5608 (6.5439)	Top-1 acc 0.391 (0.378)	Top-5 acc 1.953 (1.763)	lr 0.04987
Warmup Train [2][980/3239]	Time 0.487 (0.517)	Data 0.001 (0.013)	Loss 6.5419 (6.5437)	Top-1 acc 0.000 (0.376)	Top-5 acc 1.172 (1.766)	lr 0.04987
Warmup Train [2][990/3239]	Time 0.307 (0.516)	Data 0.001 (0.013)	Loss 6.5452 (6.5435)	Top-1 acc 0.000 (0.376)	Top-5 acc 0.781 (1.769)	lr 0.04987
Warmup Train [2][1000/3239]	Time 0.411 (0.516)	Data 0.001 (0.013)	Loss 6.5071 (6.5433)	Top-1 acc 0.391 (0.377)	Top-5 acc 3.125 (1.772)	lr 0.04987
Warmup Train [2][1010/3239]	Time 0.486 (0.516)	Data 0.001 (0.013)	Loss 6.5553 (6.5430)	Top-1 acc 0.000 (0.377)	Top-5 acc 0.000 (1.776)	lr 0.04987
Warmup Train [2][1020/3239]	Time 0.512 (0.516)	Data 0.001 (0.013)	Loss 6.5302 (6.5427)	Top-1 acc 1.562 (0.379)	Top-5 acc 2.344 (1.783)	lr 0.04987
Warmup Train [2][1030/3239]	Time 0.630 (0.516)	Data 0.001 (0.013)	Loss 6.4694 (6.5424)	Top-1 acc 0.781 (0.380)	Top-5 acc 2.344 (1.784)	lr 0.04987
Warmup Train [2][1040/3239]	Time 0.376 (0.516)	Data 0.001 (0.013)	Loss 6.4616 (6.5419)	Top-1 acc 0.391 (0.382)	Top-5 acc 4.297 (1.792)	lr 0.04987
Warmup Train [2][1050/3239]	Time 0.489 (0.516)	Data 0.001 (0.013)	Loss 6.4886 (6.5416)	Top-1 acc 0.781 (0.384)	Top-5 acc 2.344 (1.797)	lr 0.04986
Warmup Train [2][1060/3239]	Time 0.497 (0.516)	Data 0.001 (0.013)	Loss 6.4838 (6.5415)	Top-1 acc 1.172 (0.384)	Top-5 acc 1.953 (1.798)	lr 0.04986
Warmup Train [2][1070/3239]	Time 0.558 (0.516)	Data 0.001 (0.013)	Loss 6.6286 (6.5414)	Top-1 acc 0.781 (0.383)	Top-5 acc 1.562 (1.796)	lr 0.04986
Warmup Train [2][1080/3239]	Time 0.531 (0.516)	Data 0.001 (0.013)	Loss 6.5252 (6.5411)	Top-1 acc 0.781 (0.384)	Top-5 acc 2.344 (1.804)	lr 0.04986
Warmup Train [2][1090/3239]	Time 0.430 (0.516)	Data 0.001 (0.013)	Loss 6.5214 (6.5408)	Top-1 acc 0.781 (0.387)	Top-5 acc 2.734 (1.811)	lr 0.04986
Warmup Train [2][1100/3239]	Time 0.496 (0.516)	Data 0.001 (0.013)	Loss 6.4771 (6.5405)	Top-1 acc 0.781 (0.389)	Top-5 acc 3.125 (1.813)	lr 0.04986
Warmup Train [2][1110/3239]	Time 0.527 (0.516)	Data 0.001 (0.013)	Loss 6.5208 (6.5401)	Top-1 acc 0.781 (0.389)	Top-5 acc 3.906 (1.818)	lr 0.04986
Warmup Train [2][1120/3239]	Time 0.607 (0.516)	Data 0.001 (0.013)	Loss 6.5294 (6.5398)	Top-1 acc 0.391 (0.390)	Top-5 acc 2.344 (1.825)	lr 0.04986
Warmup Train [2][1130/3239]	Time 0.646 (0.516)	Data 0.001 (0.013)	Loss 6.5438 (6.5396)	Top-1 acc 0.391 (0.391)	Top-5 acc 3.516 (1.831)	lr 0.04986
Warmup Train [2][1140/3239]	Time 0.544 (0.516)	Data 0.001 (0.012)	Loss 6.5343 (6.5394)	Top-1 acc 0.781 (0.391)	Top-5 acc 2.344 (1.837)	lr 0.04986
Warmup Train [2][1150/3239]	Time 0.386 (0.516)	Data 0.001 (0.012)	Loss 6.4941 (6.5391)	Top-1 acc 0.781 (0.393)	Top-5 acc 3.516 (1.840)	lr 0.04986
Warmup Train [2][1160/3239]	Time 0.307 (0.516)	Data 0.001 (0.012)	Loss 6.5436 (6.5389)	Top-1 acc 0.000 (0.393)	Top-5 acc 1.562 (1.839)	lr 0.04986
Warmup Train [2][1170/3239]	Time 0.565 (0.516)	Data 0.001 (0.013)	Loss 6.5352 (6.5388)	Top-1 acc 0.391 (0.393)	Top-5 acc 0.391 (1.840)	lr 0.04986
Warmup Train [2][1180/3239]	Time 0.511 (0.516)	Data 0.001 (0.012)	Loss 6.4864 (6.5386)	Top-1 acc 1.172 (0.395)	Top-5 acc 3.125 (1.846)	lr 0.04986
Warmup Train [2][1190/3239]	Time 0.464 (0.516)	Data 0.001 (0.012)	Loss 6.5241 (6.5385)	Top-1 acc 0.391 (0.395)	Top-5 acc 1.953 (1.847)	lr 0.04986
Warmup Train [2][1200/3239]	Time 0.475 (0.516)	Data 0.001 (0.012)	Loss 6.4702 (6.5381)	Top-1 acc 0.781 (0.396)	Top-5 acc 3.516 (1.847)	lr 0.04986
Warmup Train [2][1210/3239]	Time 0.523 (0.515)	Data 0.001 (0.012)	Loss 6.5185 (6.5380)	Top-1 acc 0.391 (0.396)	Top-5 acc 2.734 (1.849)	lr 0.04985
Warmup Train [2][1220/3239]	Time 0.527 (0.515)	Data 0.001 (0.012)	Loss 6.5098 (6.5379)	Top-1 acc 0.391 (0.398)	Top-5 acc 2.344 (1.853)	lr 0.04985
Warmup Train [2][1230/3239]	Time 0.415 (0.515)	Data 0.001 (0.012)	Loss 6.5181 (6.5376)	Top-1 acc 1.953 (0.400)	Top-5 acc 3.516 (1.857)	lr 0.04985
Warmup Train [2][1240/3239]	Time 0.508 (0.515)	Data 0.001 (0.012)	Loss 6.6040 (6.5376)	Top-1 acc 0.000 (0.399)	Top-5 acc 1.172 (1.858)	lr 0.04985
Warmup Train [2][1250/3239]	Time 0.743 (0.515)	Data 0.001 (0.012)	Loss 6.4978 (6.5374)	Top-1 acc 0.781 (0.402)	Top-5 acc 2.344 (1.862)	lr 0.04985
Warmup Train [2][1260/3239]	Time 0.610 (0.515)	Data 0.001 (0.012)	Loss 6.5594 (6.5372)	Top-1 acc 0.391 (0.401)	Top-5 acc 3.125 (1.864)	lr 0.04985
Warmup Train [2][1270/3239]	Time 0.515 (0.515)	Data 0.001 (0.012)	Loss 6.5931 (6.5370)	Top-1 acc 0.000 (0.401)	Top-5 acc 1.953 (1.866)	lr 0.04985
Warmup Train [2][1280/3239]	Time 0.584 (0.515)	Data 0.001 (0.012)	Loss 6.5078 (6.5369)	Top-1 acc 0.781 (0.400)	Top-5 acc 2.344 (1.867)	lr 0.04985
Warmup Train [2][1290/3239]	Time 0.393 (0.515)	Data 0.001 (0.012)	Loss 6.4620 (6.5366)	Top-1 acc 1.172 (0.401)	Top-5 acc 3.906 (1.871)	lr 0.04985
Warmup Train [2][1300/3239]	Time 0.620 (0.515)	Data 0.001 (0.012)	Loss 6.4938 (6.5363)	Top-1 acc 0.391 (0.405)	Top-5 acc 1.953 (1.876)	lr 0.04985
Warmup Train [2][1310/3239]	Time 0.488 (0.515)	Data 0.001 (0.012)	Loss 6.4732 (6.5360)	Top-1 acc 0.781 (0.407)	Top-5 acc 2.344 (1.879)	lr 0.04985
Warmup Train [2][1320/3239]	Time 0.625 (0.515)	Data 0.001 (0.012)	Loss 6.5165 (6.5358)	Top-1 acc 0.000 (0.408)	Top-5 acc 1.953 (1.876)	lr 0.04985
Warmup Train [2][1330/3239]	Time 0.523 (0.515)	Data 0.001 (0.012)	Loss 6.4701 (6.5355)	Top-1 acc 0.781 (0.410)	Top-5 acc 2.344 (1.879)	lr 0.04985
Warmup Train [2][1340/3239]	Time 0.503 (0.515)	Data 0.001 (0.012)	Loss 6.5145 (6.5354)	Top-1 acc 0.000 (0.411)	Top-5 acc 1.953 (1.880)	lr 0.04985
Warmup Train [2][1350/3239]	Time 0.467 (0.515)	Data 0.001 (0.012)	Loss 6.4659 (6.5351)	Top-1 acc 0.391 (0.412)	Top-5 acc 1.953 (1.882)	lr 0.04985
Warmup Train [2][1360/3239]	Time 0.552 (0.515)	Data 0.001 (0.012)	Loss 6.5209 (6.5351)	Top-1 acc 0.000 (0.412)	Top-5 acc 1.562 (1.884)	lr 0.04984
Warmup Train [2][1370/3239]	Time 0.415 (0.515)	Data 0.001 (0.012)	Loss 6.4983 (6.5349)	Top-1 acc 0.781 (0.411)	Top-5 acc 2.344 (1.883)	lr 0.04984
Warmup Train [2][1380/3239]	Time 0.394 (0.515)	Data 0.001 (0.012)	Loss 6.4970 (6.5348)	Top-1 acc 0.000 (0.410)	Top-5 acc 3.516 (1.887)	lr 0.04984
Warmup Train [2][1390/3239]	Time 0.538 (0.515)	Data 0.001 (0.012)	Loss 6.5465 (6.5347)	Top-1 acc 0.391 (0.409)	Top-5 acc 2.344 (1.886)	lr 0.04984
Warmup Train [2][1400/3239]	Time 0.515 (0.515)	Data 0.001 (0.012)	Loss 6.5643 (6.5346)	Top-1 acc 0.000 (0.411)	Top-5 acc 1.172 (1.888)	lr 0.04984
Warmup Train [2][1410/3239]	Time 0.454 (0.515)	Data 0.001 (0.012)	Loss 6.5129 (6.5344)	Top-1 acc 0.000 (0.412)	Top-5 acc 2.734 (1.895)	lr 0.04984
Warmup Train [2][1420/3239]	Time 0.364 (0.515)	Data 0.001 (0.012)	Loss 6.4854 (6.5343)	Top-1 acc 0.000 (0.415)	Top-5 acc 3.125 (1.899)	lr 0.04984
Warmup Train [2][1430/3239]	Time 0.507 (0.515)	Data 0.001 (0.012)	Loss 6.4822 (6.5342)	Top-1 acc 0.000 (0.415)	Top-5 acc 1.953 (1.903)	lr 0.04984
Warmup Train [2][1440/3239]	Time 0.424 (0.515)	Data 0.001 (0.012)	Loss 6.5058 (6.5340)	Top-1 acc 0.000 (0.417)	Top-5 acc 1.953 (1.906)	lr 0.04984
Warmup Train [2][1450/3239]	Time 0.506 (0.515)	Data 0.001 (0.012)	Loss 6.4902 (6.5338)	Top-1 acc 0.391 (0.418)	Top-5 acc 1.953 (1.910)	lr 0.04984
Warmup Train [2][1460/3239]	Time 0.639 (0.515)	Data 0.001 (0.012)	Loss 6.4741 (6.5335)	Top-1 acc 0.391 (0.420)	Top-5 acc 2.734 (1.914)	lr 0.04984
Warmup Train [2][1470/3239]	Time 0.644 (0.515)	Data 0.001 (0.011)	Loss 6.4949 (6.5332)	Top-1 acc 0.391 (0.419)	Top-5 acc 2.344 (1.916)	lr 0.04984
Warmup Train [2][1480/3239]	Time 0.322 (0.514)	Data 0.001 (0.011)	Loss 6.4786 (6.5330)	Top-1 acc 0.391 (0.420)	Top-5 acc 1.172 (1.919)	lr 0.04984
Warmup Train [2][1490/3239]	Time 0.495 (0.514)	Data 0.001 (0.011)	Loss 6.5298 (6.5328)	Top-1 acc 0.391 (0.419)	Top-5 acc 0.781 (1.919)	lr 0.04984
Warmup Train [2][1500/3239]	Time 0.384 (0.514)	Data 0.001 (0.011)	Loss 6.4419 (6.5327)	Top-1 acc 0.781 (0.418)	Top-5 acc 3.125 (1.921)	lr 0.04984
Warmup Train [2][1510/3239]	Time 0.597 (0.514)	Data 0.001 (0.011)	Loss 6.5237 (6.5325)	Top-1 acc 0.391 (0.419)	Top-5 acc 1.562 (1.922)	lr 0.04983
Warmup Train [2][1520/3239]	Time 0.342 (0.514)	Data 0.001 (0.011)	Loss 6.5542 (6.5324)	Top-1 acc 0.000 (0.418)	Top-5 acc 1.562 (1.924)	lr 0.04983
Warmup Train [2][1530/3239]	Time 0.340 (0.514)	Data 0.001 (0.011)	Loss 6.4903 (6.5321)	Top-1 acc 0.391 (0.418)	Top-5 acc 3.516 (1.926)	lr 0.04983
Warmup Train [2][1540/3239]	Time 0.483 (0.514)	Data 0.001 (0.011)	Loss 6.4627 (6.5320)	Top-1 acc 0.781 (0.418)	Top-5 acc 2.734 (1.928)	lr 0.04983
Warmup Train [2][1550/3239]	Time 0.580 (0.514)	Data 0.001 (0.011)	Loss 6.5375 (6.5320)	Top-1 acc 0.391 (0.418)	Top-5 acc 0.781 (1.927)	lr 0.04983
Warmup Train [2][1560/3239]	Time 0.502 (0.514)	Data 0.002 (0.011)	Loss 6.5047 (6.5318)	Top-1 acc 0.000 (0.419)	Top-5 acc 1.172 (1.930)	lr 0.04983
Warmup Train [2][1570/3239]	Time 0.668 (0.514)	Data 0.001 (0.011)	Loss 6.5016 (6.5316)	Top-1 acc 0.781 (0.419)	Top-5 acc 2.734 (1.933)	lr 0.04983
Warmup Train [2][1580/3239]	Time 0.479 (0.514)	Data 0.001 (0.011)	Loss 6.5637 (6.5315)	Top-1 acc 0.000 (0.420)	Top-5 acc 1.172 (1.932)	lr 0.04983
Warmup Train [2][1590/3239]	Time 0.366 (0.514)	Data 0.002 (0.011)	Loss 6.5117 (6.5311)	Top-1 acc 0.000 (0.420)	Top-5 acc 1.953 (1.934)	lr 0.04983
Warmup Train [2][1600/3239]	Time 0.602 (0.514)	Data 0.001 (0.011)	Loss 6.5115 (6.5310)	Top-1 acc 0.391 (0.421)	Top-5 acc 1.172 (1.935)	lr 0.04983
Warmup Train [2][1610/3239]	Time 0.577 (0.514)	Data 0.001 (0.011)	Loss 6.5364 (6.5308)	Top-1 acc 0.391 (0.422)	Top-5 acc 1.562 (1.939)	lr 0.04983
Warmup Train [2][1620/3239]	Time 0.468 (0.514)	Data 0.001 (0.011)	Loss 6.4592 (6.5306)	Top-1 acc 1.172 (0.423)	Top-5 acc 3.906 (1.939)	lr 0.04983
Warmup Train [2][1630/3239]	Time 0.492 (0.514)	Data 0.001 (0.011)	Loss 6.5190 (6.5305)	Top-1 acc 0.391 (0.422)	Top-5 acc 1.172 (1.941)	lr 0.04983
Warmup Train [2][1640/3239]	Time 0.513 (0.514)	Data 0.001 (0.011)	Loss 6.4989 (6.5302)	Top-1 acc 0.781 (0.424)	Top-5 acc 2.734 (1.944)	lr 0.04983
Warmup Train [2][1650/3239]	Time 0.540 (0.514)	Data 0.001 (0.011)	Loss 6.4978 (6.5301)	Top-1 acc 0.391 (0.424)	Top-5 acc 1.172 (1.945)	lr 0.04982
Warmup Train [2][1660/3239]	Time 0.431 (0.514)	Data 0.001 (0.011)	Loss 6.5360 (6.5299)	Top-1 acc 0.391 (0.425)	Top-5 acc 2.344 (1.947)	lr 0.04982
Warmup Train [2][1670/3239]	Time 0.423 (0.514)	Data 0.001 (0.011)	Loss 6.4866 (6.5297)	Top-1 acc 1.172 (0.425)	Top-5 acc 2.734 (1.948)	lr 0.04982
Warmup Train [2][1680/3239]	Time 0.580 (0.514)	Data 0.001 (0.011)	Loss 6.4808 (6.5295)	Top-1 acc 0.391 (0.424)	Top-5 acc 2.344 (1.948)	lr 0.04982
Warmup Train [2][1690/3239]	Time 0.566 (0.514)	Data 0.001 (0.011)	Loss 6.5211 (6.5293)	Top-1 acc 0.781 (0.427)	Top-5 acc 1.562 (1.952)	lr 0.04982
Warmup Train [2][1700/3239]	Time 0.622 (0.514)	Data 0.001 (0.011)	Loss 6.5206 (6.5292)	Top-1 acc 0.781 (0.427)	Top-5 acc 2.734 (1.957)	lr 0.04982
Warmup Train [2][1710/3239]	Time 0.409 (0.514)	Data 0.001 (0.011)	Loss 6.5296 (6.5290)	Top-1 acc 1.172 (0.427)	Top-5 acc 1.953 (1.958)	lr 0.04982
Warmup Train [2][1720/3239]	Time 0.381 (0.513)	Data 0.001 (0.011)	Loss 6.5010 (6.5289)	Top-1 acc 0.391 (0.427)	Top-5 acc 3.906 (1.959)	lr 0.04982
Warmup Train [2][1730/3239]	Time 0.503 (0.513)	Data 0.001 (0.011)	Loss 6.5403 (6.5287)	Top-1 acc 0.391 (0.429)	Top-5 acc 1.562 (1.961)	lr 0.04982
Warmup Train [2][1740/3239]	Time 0.679 (0.513)	Data 0.001 (0.011)	Loss 6.5191 (6.5286)	Top-1 acc 1.562 (0.430)	Top-5 acc 3.516 (1.963)	lr 0.04982
Warmup Train [2][1750/3239]	Time 0.456 (0.513)	Data 0.001 (0.011)	Loss 6.4631 (6.5284)	Top-1 acc 0.391 (0.432)	Top-5 acc 2.734 (1.969)	lr 0.04982
Warmup Train [2][1760/3239]	Time 0.303 (0.513)	Data 0.001 (0.011)	Loss 6.4674 (6.5281)	Top-1 acc 0.391 (0.434)	Top-5 acc 3.906 (1.973)	lr 0.04982
Warmup Train [2][1770/3239]	Time 0.482 (0.513)	Data 0.001 (0.011)	Loss 6.5034 (6.5280)	Top-1 acc 0.391 (0.434)	Top-5 acc 2.344 (1.978)	lr 0.04982
Warmup Train [2][1780/3239]	Time 0.500 (0.513)	Data 0.001 (0.011)	Loss 6.4527 (6.5277)	Top-1 acc 1.172 (0.436)	Top-5 acc 3.125 (1.979)	lr 0.04982
Warmup Train [2][1790/3239]	Time 0.504 (0.513)	Data 0.001 (0.011)	Loss 6.4708 (6.5274)	Top-1 acc 0.781 (0.437)	Top-5 acc 2.734 (1.983)	lr 0.04981
Warmup Train [2][1800/3239]	Time 0.487 (0.513)	Data 0.001 (0.011)	Loss 6.5393 (6.5272)	Top-1 acc 0.000 (0.437)	Top-5 acc 1.172 (1.985)	lr 0.04981
Warmup Train [2][1810/3239]	Time 0.551 (0.513)	Data 0.001 (0.011)	Loss 6.5067 (6.5270)	Top-1 acc 1.953 (0.440)	Top-5 acc 4.297 (1.987)	lr 0.04981
Warmup Train [2][1820/3239]	Time 0.438 (0.513)	Data 0.001 (0.011)	Loss 6.4749 (6.5268)	Top-1 acc 0.391 (0.441)	Top-5 acc 1.953 (1.989)	lr 0.04981
Warmup Train [2][1830/3239]	Time 0.557 (0.513)	Data 0.001 (0.011)	Loss 6.5802 (6.5267)	Top-1 acc 0.391 (0.441)	Top-5 acc 3.516 (1.992)	lr 0.04981
Warmup Train [2][1840/3239]	Time 0.652 (0.513)	Data 0.001 (0.010)	Loss 6.4902 (6.5266)	Top-1 acc 0.000 (0.440)	Top-5 acc 2.734 (1.994)	lr 0.04981
Warmup Train [2][1850/3239]	Time 0.354 (0.513)	Data 0.001 (0.010)	Loss 6.5136 (6.5264)	Top-1 acc 0.391 (0.441)	Top-5 acc 1.172 (1.996)	lr 0.04981
Warmup Train [2][1860/3239]	Time 0.489 (0.513)	Data 0.001 (0.010)	Loss 6.4371 (6.5261)	Top-1 acc 0.781 (0.444)	Top-5 acc 3.906 (2.002)	lr 0.04981
Warmup Train [2][1870/3239]	Time 0.410 (0.513)	Data 0.001 (0.010)	Loss 6.4246 (6.5260)	Top-1 acc 0.000 (0.445)	Top-5 acc 3.906 (2.006)	lr 0.04981
Warmup Train [2][1880/3239]	Time 0.565 (0.513)	Data 0.001 (0.010)	Loss 6.4431 (6.5258)	Top-1 acc 1.172 (0.446)	Top-5 acc 2.734 (2.008)	lr 0.04981
Warmup Train [2][1890/3239]	Time 0.533 (0.513)	Data 0.001 (0.010)	Loss 6.5129 (6.5258)	Top-1 acc 0.000 (0.445)	Top-5 acc 0.391 (2.005)	lr 0.04981
Warmup Train [2][1900/3239]	Time 0.425 (0.513)	Data 0.001 (0.010)	Loss 6.5476 (6.5255)	Top-1 acc 0.000 (0.445)	Top-5 acc 2.344 (2.010)	lr 0.04981
Warmup Train [2][1910/3239]	Time 0.305 (0.513)	Data 0.001 (0.010)	Loss 6.4292 (6.5253)	Top-1 acc 1.562 (0.447)	Top-5 acc 4.297 (2.015)	lr 0.04981
Warmup Train [2][1920/3239]	Time 0.483 (0.513)	Data 0.001 (0.010)	Loss 6.4627 (6.5250)	Top-1 acc 0.781 (0.447)	Top-5 acc 3.125 (2.017)	lr 0.04980
Warmup Train [2][1930/3239]	Time 0.572 (0.513)	Data 0.001 (0.010)	Loss 6.5179 (6.5249)	Top-1 acc 0.391 (0.446)	Top-5 acc 0.391 (2.016)	lr 0.04980
Warmup Train [2][1940/3239]	Time 0.484 (0.513)	Data 0.001 (0.010)	Loss 6.4559 (6.5247)	Top-1 acc 0.391 (0.446)	Top-5 acc 2.734 (2.019)	lr 0.04980
Warmup Train [2][1950/3239]	Time 0.423 (0.513)	Data 0.001 (0.010)	Loss 6.5024 (6.5245)	Top-1 acc 0.781 (0.447)	Top-5 acc 2.734 (2.020)	lr 0.04980
Warmup Train [2][1960/3239]	Time 0.472 (0.513)	Data 0.001 (0.010)	Loss 6.5078 (6.5243)	Top-1 acc 0.781 (0.449)	Top-5 acc 2.734 (2.023)	lr 0.04980
Warmup Train [2][1970/3239]	Time 0.571 (0.513)	Data 0.002 (0.010)	Loss 6.4973 (6.5242)	Top-1 acc 0.000 (0.448)	Top-5 acc 2.344 (2.023)	lr 0.04980
Warmup Train [2][1980/3239]	Time 0.529 (0.513)	Data 0.001 (0.010)	Loss 6.4922 (6.5238)	Top-1 acc 0.781 (0.449)	Top-5 acc 1.562 (2.028)	lr 0.04980
Warmup Train [2][1990/3239]	Time 0.695 (0.513)	Data 0.001 (0.010)	Loss 6.5185 (6.5236)	Top-1 acc 0.000 (0.449)	Top-5 acc 1.172 (2.029)	lr 0.04980
Warmup Train [2][2000/3239]	Time 0.538 (0.513)	Data 0.001 (0.010)	Loss 6.4917 (6.5234)	Top-1 acc 0.000 (0.451)	Top-5 acc 2.344 (2.032)	lr 0.04980
Warmup Train [2][2010/3239]	Time 0.374 (0.512)	Data 0.001 (0.010)	Loss 6.4652 (6.5233)	Top-1 acc 0.781 (0.451)	Top-5 acc 3.125 (2.033)	lr 0.04980
Warmup Train [2][2020/3239]	Time 0.331 (0.512)	Data 0.001 (0.010)	Loss 6.4940 (6.5231)	Top-1 acc 0.781 (0.452)	Top-5 acc 2.734 (2.034)	lr 0.04980
Warmup Train [2][2030/3239]	Time 0.505 (0.512)	Data 0.001 (0.010)	Loss 6.4512 (6.5229)	Top-1 acc 1.562 (0.452)	Top-5 acc 3.516 (2.034)	lr 0.04980
Warmup Train [2][2040/3239]	Time 0.332 (0.512)	Data 0.001 (0.010)	Loss 6.4889 (6.5227)	Top-1 acc 0.391 (0.452)	Top-5 acc 1.562 (2.035)	lr 0.04980
Warmup Train [2][2050/3239]	Time 0.525 (0.512)	Data 0.001 (0.010)	Loss 6.5075 (6.5225)	Top-1 acc 1.953 (0.454)	Top-5 acc 3.516 (2.038)	lr 0.04979
Warmup Train [2][2060/3239]	Time 0.687 (0.512)	Data 0.002 (0.010)	Loss 6.5207 (6.5223)	Top-1 acc 0.781 (0.455)	Top-5 acc 1.562 (2.042)	lr 0.04979
Warmup Train [2][2070/3239]	Time 0.368 (0.512)	Data 0.001 (0.010)	Loss 6.4823 (6.5221)	Top-1 acc 0.391 (0.455)	Top-5 acc 1.172 (2.042)	lr 0.04979
Warmup Train [2][2080/3239]	Time 0.552 (0.512)	Data 0.001 (0.010)	Loss 6.4592 (6.5219)	Top-1 acc 0.781 (0.455)	Top-5 acc 3.516 (2.045)	lr 0.04979
Warmup Train [2][2090/3239]	Time 0.532 (0.512)	Data 0.001 (0.010)	Loss 6.5082 (6.5217)	Top-1 acc 0.000 (0.455)	Top-5 acc 2.734 (2.046)	lr 0.04979
Warmup Train [2][2100/3239]	Time 0.591 (0.512)	Data 0.001 (0.010)	Loss 6.5278 (6.5216)	Top-1 acc 0.000 (0.455)	Top-5 acc 1.562 (2.049)	lr 0.04979
Warmup Train [2][2110/3239]	Time 0.571 (0.512)	Data 0.001 (0.010)	Loss 6.4633 (6.5214)	Top-1 acc 0.391 (0.455)	Top-5 acc 2.344 (2.050)	lr 0.04979
Warmup Train [2][2120/3239]	Time 0.539 (0.512)	Data 0.001 (0.010)	Loss 6.5894 (6.5213)	Top-1 acc 0.000 (0.455)	Top-5 acc 1.953 (2.052)	lr 0.04979
Warmup Train [2][2130/3239]	Time 0.537 (0.512)	Data 0.001 (0.010)	Loss 6.5246 (6.5212)	Top-1 acc 0.391 (0.455)	Top-5 acc 1.562 (2.054)	lr 0.04979
Warmup Train [2][2140/3239]	Time 0.517 (0.512)	Data 0.001 (0.010)	Loss 6.5650 (6.5210)	Top-1 acc 0.391 (0.455)	Top-5 acc 2.344 (2.059)	lr 0.04979
Warmup Train [2][2150/3239]	Time 0.506 (0.512)	Data 0.001 (0.010)	Loss 6.5418 (6.5208)	Top-1 acc 0.391 (0.455)	Top-5 acc 1.562 (2.059)	lr 0.04979
Warmup Train [2][2160/3239]	Time 0.438 (0.512)	Data 0.001 (0.010)	Loss 6.4874 (6.5206)	Top-1 acc 0.391 (0.456)	Top-5 acc 3.516 (2.062)	lr 0.04979
Warmup Train [2][2170/3239]	Time 0.577 (0.512)	Data 0.001 (0.010)	Loss 6.4734 (6.5204)	Top-1 acc 1.562 (0.457)	Top-5 acc 4.688 (2.068)	lr 0.04979
Warmup Train [2][2180/3239]	Time 0.448 (0.512)	Data 0.001 (0.010)	Loss 6.5100 (6.5202)	Top-1 acc 0.000 (0.457)	Top-5 acc 1.562 (2.069)	lr 0.04978
Warmup Train [2][2190/3239]	Time 0.647 (0.512)	Data 0.001 (0.010)	Loss 6.4805 (6.5200)	Top-1 acc 0.781 (0.457)	Top-5 acc 2.344 (2.068)	lr 0.04978
Warmup Train [2][2200/3239]	Time 0.461 (0.512)	Data 0.001 (0.010)	Loss 6.5204 (6.5199)	Top-1 acc 0.000 (0.458)	Top-5 acc 1.953 (2.072)	lr 0.04978
Warmup Train [2][2210/3239]	Time 0.399 (0.512)	Data 0.001 (0.010)	Loss 6.4489 (6.5197)	Top-1 acc 0.781 (0.458)	Top-5 acc 3.516 (2.073)	lr 0.04978
Warmup Train [2][2220/3239]	Time 0.714 (0.512)	Data 0.001 (0.010)	Loss 6.4467 (6.5195)	Top-1 acc 0.000 (0.458)	Top-5 acc 1.953 (2.076)	lr 0.04978
Warmup Train [2][2230/3239]	Time 0.465 (0.512)	Data 0.001 (0.010)	Loss 6.5261 (6.5193)	Top-1 acc 0.391 (0.459)	Top-5 acc 2.344 (2.080)	lr 0.04978
Warmup Train [2][2240/3239]	Time 0.596 (0.511)	Data 0.001 (0.010)	Loss 6.4545 (6.5191)	Top-1 acc 0.391 (0.460)	Top-5 acc 3.125 (2.084)	lr 0.04978
Warmup Train [2][2250/3239]	Time 0.440 (0.511)	Data 0.001 (0.010)	Loss 6.5335 (6.5190)	Top-1 acc 0.391 (0.461)	Top-5 acc 2.344 (2.085)	lr 0.04978
Warmup Train [2][2260/3239]	Time 0.492 (0.511)	Data 0.001 (0.010)	Loss 6.4968 (6.5188)	Top-1 acc 0.781 (0.462)	Top-5 acc 1.172 (2.089)	lr 0.04978
Warmup Train [2][2270/3239]	Time 0.504 (0.511)	Data 0.001 (0.010)	Loss 6.5279 (6.5187)	Top-1 acc 0.000 (0.463)	Top-5 acc 2.734 (2.092)	lr 0.04978
Warmup Train [2][2280/3239]	Time 0.318 (0.511)	Data 0.001 (0.010)	Loss 6.4662 (6.5186)	Top-1 acc 0.391 (0.462)	Top-5 acc 1.562 (2.093)	lr 0.04978
Warmup Train [2][2290/3239]	Time 0.567 (0.511)	Data 0.001 (0.010)	Loss 6.4726 (6.5184)	Top-1 acc 0.000 (0.463)	Top-5 acc 1.172 (2.091)	lr 0.04978
Warmup Train [2][2300/3239]	Time 0.594 (0.511)	Data 0.001 (0.010)	Loss 6.5342 (6.5183)	Top-1 acc 0.000 (0.462)	Top-5 acc 1.562 (2.093)	lr 0.04977
Warmup Train [2][2310/3239]	Time 0.316 (0.511)	Data 0.001 (0.010)	Loss 6.4608 (6.5181)	Top-1 acc 0.391 (0.463)	Top-5 acc 1.562 (2.095)	lr 0.04977
Warmup Train [2][2320/3239]	Time 0.536 (0.511)	Data 0.001 (0.010)	Loss 6.4551 (6.5180)	Top-1 acc 1.172 (0.463)	Top-5 acc 3.906 (2.095)	lr 0.04977
Warmup Train [2][2330/3239]	Time 0.478 (0.511)	Data 0.001 (0.010)	Loss 6.4933 (6.5178)	Top-1 acc 0.000 (0.464)	Top-5 acc 2.344 (2.097)	lr 0.04977
Warmup Train [2][2340/3239]	Time 0.642 (0.511)	Data 0.001 (0.010)	Loss 6.4428 (6.5176)	Top-1 acc 0.000 (0.463)	Top-5 acc 2.344 (2.097)	lr 0.04977
Warmup Train [2][2350/3239]	Time 0.608 (0.511)	Data 0.001 (0.010)	Loss 6.4817 (6.5174)	Top-1 acc 1.172 (0.465)	Top-5 acc 1.953 (2.100)	lr 0.04977
Warmup Train [2][2360/3239]	Time 0.583 (0.511)	Data 0.001 (0.010)	Loss 6.4505 (6.5172)	Top-1 acc 0.391 (0.465)	Top-5 acc 3.516 (2.102)	lr 0.04977
Warmup Train [2][2370/3239]	Time 0.558 (0.511)	Data 0.001 (0.010)	Loss 6.4229 (6.5170)	Top-1 acc 0.781 (0.465)	Top-5 acc 4.688 (2.105)	lr 0.04977
Warmup Train [2][2380/3239]	Time 0.428 (0.511)	Data 0.001 (0.010)	Loss 6.4851 (6.5169)	Top-1 acc 0.391 (0.465)	Top-5 acc 2.344 (2.104)	lr 0.04977
Warmup Train [2][2390/3239]	Time 0.420 (0.511)	Data 0.001 (0.010)	Loss 6.4615 (6.5167)	Top-1 acc 0.000 (0.465)	Top-5 acc 0.781 (2.105)	lr 0.04977
Warmup Train [2][2400/3239]	Time 0.557 (0.511)	Data 0.001 (0.010)	Loss 6.4808 (6.5165)	Top-1 acc 0.781 (0.466)	Top-5 acc 3.516 (2.109)	lr 0.04977
Warmup Train [2][2410/3239]	Time 0.399 (0.511)	Data 0.001 (0.010)	Loss 6.4699 (6.5164)	Top-1 acc 0.781 (0.467)	Top-5 acc 1.562 (2.112)	lr 0.04977
Warmup Train [2][2420/3239]	Time 0.513 (0.511)	Data 0.001 (0.010)	Loss 6.5201 (6.5163)	Top-1 acc 0.391 (0.468)	Top-5 acc 1.953 (2.114)	lr 0.04977
Warmup Train [2][2430/3239]	Time 0.466 (0.511)	Data 0.001 (0.010)	Loss 6.4435 (6.5162)	Top-1 acc 1.172 (0.469)	Top-5 acc 2.734 (2.115)	lr 0.04976
Warmup Train [2][2440/3239]	Time 0.630 (0.511)	Data 0.001 (0.010)	Loss 6.4534 (6.5160)	Top-1 acc 0.781 (0.469)	Top-5 acc 3.125 (2.117)	lr 0.04976
Warmup Train [2][2450/3239]	Time 0.597 (0.511)	Data 0.001 (0.010)	Loss 6.4561 (6.5158)	Top-1 acc 0.391 (0.469)	Top-5 acc 2.734 (2.119)	lr 0.04976
Warmup Train [2][2460/3239]	Time 0.580 (0.511)	Data 0.001 (0.010)	Loss 6.4592 (6.5156)	Top-1 acc 0.391 (0.469)	Top-5 acc 1.562 (2.121)	lr 0.04976
Warmup Train [2][2470/3239]	Time 0.435 (0.511)	Data 0.001 (0.010)	Loss 6.4593 (6.5154)	Top-1 acc 0.781 (0.471)	Top-5 acc 2.344 (2.126)	lr 0.04976
Warmup Train [2][2480/3239]	Time 0.490 (0.511)	Data 0.001 (0.010)	Loss 6.5232 (6.5153)	Top-1 acc 0.000 (0.472)	Top-5 acc 3.125 (2.129)	lr 0.04976
Warmup Train [2][2490/3239]	Time 0.521 (0.511)	Data 0.001 (0.010)	Loss 6.4142 (6.5151)	Top-1 acc 0.781 (0.472)	Top-5 acc 5.078 (2.132)	lr 0.04976
Warmup Train [2][2500/3239]	Time 0.572 (0.511)	Data 0.001 (0.010)	Loss 6.5009 (6.5150)	Top-1 acc 0.391 (0.472)	Top-5 acc 1.562 (2.132)	lr 0.04976
Warmup Train [2][2510/3239]	Time 0.319 (0.511)	Data 0.001 (0.010)	Loss 6.4247 (6.5148)	Top-1 acc 0.391 (0.472)	Top-5 acc 3.906 (2.134)	lr 0.04976
Warmup Train [2][2520/3239]	Time 0.490 (0.511)	Data 0.001 (0.010)	Loss 6.4894 (6.5147)	Top-1 acc 0.391 (0.472)	Top-5 acc 1.172 (2.134)	lr 0.04976
Warmup Train [2][2530/3239]	Time 0.276 (0.511)	Data 0.001 (0.010)	Loss 6.4570 (6.5146)	Top-1 acc 0.391 (0.473)	Top-5 acc 1.562 (2.137)	lr 0.04976
Warmup Train [2][2540/3239]	Time 0.385 (0.511)	Data 0.001 (0.010)	Loss 6.4829 (6.5144)	Top-1 acc 0.781 (0.474)	Top-5 acc 1.953 (2.139)	lr 0.04976
Warmup Train [2][2550/3239]	Time 0.447 (0.511)	Data 0.001 (0.010)	Loss 6.4963 (6.5143)	Top-1 acc 0.391 (0.474)	Top-5 acc 2.344 (2.142)	lr 0.04975
Warmup Train [2][2560/3239]	Time 0.575 (0.511)	Data 0.001 (0.010)	Loss 6.5739 (6.5142)	Top-1 acc 0.000 (0.474)	Top-5 acc 1.562 (2.141)	lr 0.04975
Warmup Train [2][2570/3239]	Time 0.502 (0.511)	Data 0.001 (0.010)	Loss 6.4788 (6.5140)	Top-1 acc 1.172 (0.475)	Top-5 acc 2.734 (2.144)	lr 0.04975
Warmup Train [2][2580/3239]	Time 0.520 (0.511)	Data 0.001 (0.010)	Loss 6.4498 (6.5139)	Top-1 acc 0.391 (0.475)	Top-5 acc 2.344 (2.145)	lr 0.04975
Warmup Train [2][2590/3239]	Time 0.547 (0.511)	Data 0.001 (0.010)	Loss 6.4638 (6.5137)	Top-1 acc 0.781 (0.476)	Top-5 acc 3.906 (2.149)	lr 0.04975
Warmup Train [2][2600/3239]	Time 0.467 (0.511)	Data 0.001 (0.010)	Loss 6.5092 (6.5135)	Top-1 acc 0.000 (0.476)	Top-5 acc 1.562 (2.150)	lr 0.04975
Warmup Train [2][2610/3239]	Time 0.468 (0.511)	Data 0.001 (0.010)	Loss 6.4227 (6.5134)	Top-1 acc 0.000 (0.477)	Top-5 acc 1.562 (2.150)	lr 0.04975
Warmup Train [2][2620/3239]	Time 0.553 (0.511)	Data 0.001 (0.010)	Loss 6.5090 (6.5133)	Top-1 acc 0.781 (0.476)	Top-5 acc 1.172 (2.151)	lr 0.04975
Warmup Train [2][2630/3239]	Time 0.519 (0.511)	Data 0.001 (0.009)	Loss 6.5253 (6.5131)	Top-1 acc 0.391 (0.477)	Top-5 acc 2.344 (2.153)	lr 0.04975
Warmup Train [2][2640/3239]	Time 0.341 (0.511)	Data 0.001 (0.009)	Loss 6.5041 (6.5130)	Top-1 acc 0.391 (0.476)	Top-5 acc 1.953 (2.154)	lr 0.04975
Warmup Train [2][2650/3239]	Time 0.602 (0.511)	Data 0.001 (0.009)	Loss 6.4563 (6.5128)	Top-1 acc 0.781 (0.477)	Top-5 acc 2.734 (2.154)	lr 0.04975
Warmup Train [2][2660/3239]	Time 0.368 (0.511)	Data 0.001 (0.009)	Loss 6.5070 (6.5127)	Top-1 acc 0.391 (0.477)	Top-5 acc 1.953 (2.155)	lr 0.04974
Warmup Train [2][2670/3239]	Time 0.463 (0.511)	Data 0.001 (0.009)	Loss 6.5076 (6.5126)	Top-1 acc 0.391 (0.478)	Top-5 acc 2.344 (2.155)	lr 0.04974
Warmup Train [2][2680/3239]	Time 0.475 (0.511)	Data 0.001 (0.009)	Loss 6.4589 (6.5125)	Top-1 acc 0.391 (0.478)	Top-5 acc 3.516 (2.157)	lr 0.04974
Warmup Train [2][2690/3239]	Time 0.496 (0.511)	Data 0.001 (0.009)	Loss 6.4475 (6.5124)	Top-1 acc 0.781 (0.479)	Top-5 acc 2.734 (2.159)	lr 0.04974
Warmup Train [2][2700/3239]	Time 0.490 (0.511)	Data 0.001 (0.009)	Loss 6.4574 (6.5122)	Top-1 acc 0.781 (0.480)	Top-5 acc 2.734 (2.162)	lr 0.04974
Warmup Train [2][2710/3239]	Time 0.624 (0.511)	Data 0.001 (0.009)	Loss 6.4981 (6.5122)	Top-1 acc 0.000 (0.481)	Top-5 acc 2.344 (2.163)	lr 0.04974
Warmup Train [2][2720/3239]	Time 0.388 (0.511)	Data 0.001 (0.009)	Loss 6.4805 (6.5120)	Top-1 acc 0.391 (0.482)	Top-5 acc 1.953 (2.166)	lr 0.04974
Warmup Train [2][2730/3239]	Time 0.345 (0.511)	Data 0.001 (0.009)	Loss 6.4931 (6.5119)	Top-1 acc 0.391 (0.482)	Top-5 acc 2.344 (2.166)	lr 0.04974
Warmup Train [2][2740/3239]	Time 0.498 (0.511)	Data 0.001 (0.009)	Loss 6.4165 (6.5118)	Top-1 acc 1.562 (0.483)	Top-5 acc 3.125 (2.169)	lr 0.04974
Warmup Train [2][2750/3239]	Time 0.376 (0.511)	Data 0.001 (0.009)	Loss 6.5055 (6.5117)	Top-1 acc 0.391 (0.482)	Top-5 acc 2.734 (2.170)	lr 0.04974
Warmup Train [2][2760/3239]	Time 0.584 (0.511)	Data 0.002 (0.009)	Loss 6.4603 (6.5115)	Top-1 acc 0.391 (0.484)	Top-5 acc 2.344 (2.173)	lr 0.04974
Warmup Train [2][2770/3239]	Time 0.490 (0.511)	Data 0.001 (0.009)	Loss 6.4729 (6.5114)	Top-1 acc 0.781 (0.484)	Top-5 acc 2.344 (2.176)	lr 0.04974
Warmup Train [2][2780/3239]	Time 0.438 (0.510)	Data 0.001 (0.009)	Loss 6.5001 (6.5112)	Top-1 acc 0.391 (0.485)	Top-5 acc 3.125 (2.179)	lr 0.04973
Warmup Train [2][2790/3239]	Time 0.455 (0.510)	Data 0.001 (0.009)	Loss 6.4822 (6.5110)	Top-1 acc 0.391 (0.486)	Top-5 acc 1.562 (2.182)	lr 0.04973
Warmup Train [2][2800/3239]	Time 0.422 (0.510)	Data 0.001 (0.009)	Loss 6.5035 (6.5109)	Top-1 acc 0.781 (0.486)	Top-5 acc 2.344 (2.182)	lr 0.04973
Warmup Train [2][2810/3239]	Time 0.523 (0.510)	Data 0.002 (0.009)	Loss 6.5057 (6.5108)	Top-1 acc 0.391 (0.487)	Top-5 acc 2.344 (2.183)	lr 0.04973
Warmup Train [2][2820/3239]	Time 0.583 (0.510)	Data 0.001 (0.009)	Loss 6.4840 (6.5106)	Top-1 acc 0.391 (0.488)	Top-5 acc 1.953 (2.185)	lr 0.04973
Warmup Train [2][2830/3239]	Time 0.411 (0.510)	Data 0.001 (0.009)	Loss 6.5441 (6.5104)	Top-1 acc 0.000 (0.489)	Top-5 acc 1.562 (2.189)	lr 0.04973
Warmup Train [2][2840/3239]	Time 0.552 (0.510)	Data 0.001 (0.009)	Loss 6.4727 (6.5104)	Top-1 acc 0.781 (0.490)	Top-5 acc 3.906 (2.190)	lr 0.04973
Warmup Train [2][2850/3239]	Time 0.470 (0.510)	Data 0.001 (0.009)	Loss 6.4554 (6.5102)	Top-1 acc 0.391 (0.490)	Top-5 acc 3.125 (2.193)	lr 0.04973
Warmup Train [2][2860/3239]	Time 0.495 (0.510)	Data 0.001 (0.009)	Loss 6.4899 (6.5101)	Top-1 acc 0.391 (0.490)	Top-5 acc 2.734 (2.195)	lr 0.04973
Warmup Train [2][2870/3239]	Time 0.515 (0.510)	Data 0.001 (0.009)	Loss 6.4940 (6.5099)	Top-1 acc 0.000 (0.490)	Top-5 acc 0.781 (2.196)	lr 0.04973
Warmup Train [2][2880/3239]	Time 0.519 (0.510)	Data 0.001 (0.009)	Loss 6.4358 (6.5098)	Top-1 acc 0.391 (0.490)	Top-5 acc 1.562 (2.197)	lr 0.04973
Warmup Train [2][2890/3239]	Time 0.622 (0.510)	Data 0.001 (0.009)	Loss 6.4405 (6.5096)	Top-1 acc 1.172 (0.490)	Top-5 acc 2.734 (2.198)	lr 0.04972
Warmup Train [2][2900/3239]	Time 0.444 (0.510)	Data 0.001 (0.009)	Loss 6.4767 (6.5095)	Top-1 acc 0.391 (0.490)	Top-5 acc 1.953 (2.200)	lr 0.04972
Warmup Train [2][2910/3239]	Time 0.364 (0.510)	Data 0.001 (0.009)	Loss 6.4886 (6.5094)	Top-1 acc 0.000 (0.490)	Top-5 acc 2.344 (2.203)	lr 0.04972
Warmup Train [2][2920/3239]	Time 0.388 (0.510)	Data 0.001 (0.009)	Loss 6.4955 (6.5092)	Top-1 acc 0.781 (0.491)	Top-5 acc 3.125 (2.205)	lr 0.04972
Warmup Train [2][2930/3239]	Time 0.550 (0.510)	Data 0.001 (0.009)	Loss 6.4258 (6.5091)	Top-1 acc 1.172 (0.492)	Top-5 acc 3.125 (2.207)	lr 0.04972
Warmup Train [2][2940/3239]	Time 0.585 (0.510)	Data 0.001 (0.009)	Loss 6.4785 (6.5090)	Top-1 acc 1.172 (0.493)	Top-5 acc 3.125 (2.209)	lr 0.04972
Warmup Train [2][2950/3239]	Time 0.578 (0.510)	Data 0.001 (0.009)	Loss 6.5048 (6.5088)	Top-1 acc 0.391 (0.494)	Top-5 acc 3.906 (2.212)	lr 0.04972
Warmup Train [2][2960/3239]	Time 0.634 (0.510)	Data 0.001 (0.009)	Loss 6.4861 (6.5086)	Top-1 acc 0.781 (0.495)	Top-5 acc 2.734 (2.214)	lr 0.04972
Warmup Train [2][2970/3239]	Time 0.325 (0.510)	Data 0.001 (0.009)	Loss 6.5069 (6.5085)	Top-1 acc 1.562 (0.495)	Top-5 acc 1.953 (2.213)	lr 0.04972
Warmup Train [2][2980/3239]	Time 0.597 (0.510)	Data 0.001 (0.009)	Loss 6.4320 (6.5084)	Top-1 acc 1.172 (0.495)	Top-5 acc 3.125 (2.213)	lr 0.04972
Warmup Train [2][2990/3239]	Time 0.564 (0.510)	Data 0.001 (0.009)	Loss 6.4215 (6.5082)	Top-1 acc 0.000 (0.495)	Top-5 acc 1.953 (2.215)	lr 0.04972
Warmup Train [2][3000/3239]	Time 0.450 (0.510)	Data 0.001 (0.009)	Loss 6.4440 (6.5080)	Top-1 acc 1.172 (0.496)	Top-5 acc 2.344 (2.218)	lr 0.04971
Warmup Train [2][3010/3239]	Time 0.547 (0.510)	Data 0.001 (0.009)	Loss 6.4557 (6.5077)	Top-1 acc 0.391 (0.497)	Top-5 acc 3.125 (2.220)	lr 0.04971
Warmup Train [2][3020/3239]	Time 0.488 (0.510)	Data 0.001 (0.009)	Loss 6.4221 (6.5075)	Top-1 acc 0.781 (0.499)	Top-5 acc 3.125 (2.223)	lr 0.04971
Warmup Train [2][3030/3239]	Time 0.487 (0.510)	Data 0.001 (0.009)	Loss 6.4923 (6.5073)	Top-1 acc 0.781 (0.499)	Top-5 acc 2.734 (2.224)	lr 0.04971
Warmup Train [2][3040/3239]	Time 0.493 (0.510)	Data 0.001 (0.009)	Loss 6.5149 (6.5072)	Top-1 acc 0.781 (0.499)	Top-5 acc 2.344 (2.227)	lr 0.04971
Warmup Train [2][3050/3239]	Time 0.517 (0.510)	Data 0.001 (0.009)	Loss 6.4499 (6.5071)	Top-1 acc 0.391 (0.501)	Top-5 acc 3.906 (2.230)	lr 0.04971
Warmup Train [2][3060/3239]	Time 0.473 (0.510)	Data 0.001 (0.009)	Loss 6.4817 (6.5069)	Top-1 acc 0.781 (0.501)	Top-5 acc 2.344 (2.232)	lr 0.04971
Warmup Train [2][3070/3239]	Time 0.523 (0.510)	Data 0.001 (0.009)	Loss 6.4862 (6.5068)	Top-1 acc 0.000 (0.501)	Top-5 acc 1.562 (2.233)	lr 0.04971
Warmup Train [2][3080/3239]	Time 0.362 (0.510)	Data 0.001 (0.009)	Loss 6.4040 (6.5066)	Top-1 acc 0.781 (0.502)	Top-5 acc 3.125 (2.235)	lr 0.04971
Warmup Train [2][3090/3239]	Time 0.574 (0.510)	Data 0.001 (0.009)	Loss 6.4675 (6.5064)	Top-1 acc 0.391 (0.501)	Top-5 acc 1.953 (2.237)	lr 0.04971
Warmup Train [2][3100/3239]	Time 0.493 (0.510)	Data 0.001 (0.009)	Loss 6.4897 (6.5063)	Top-1 acc 0.000 (0.501)	Top-5 acc 3.125 (2.237)	lr 0.04971
Warmup Train [2][3110/3239]	Time 0.661 (0.510)	Data 0.001 (0.009)	Loss 6.4610 (6.5061)	Top-1 acc 0.781 (0.502)	Top-5 acc 0.781 (2.238)	lr 0.04970
Warmup Train [2][3120/3239]	Time 0.451 (0.510)	Data 0.001 (0.009)	Loss 6.4287 (6.5060)	Top-1 acc 0.391 (0.502)	Top-5 acc 1.953 (2.239)	lr 0.04970
Warmup Train [2][3130/3239]	Time 0.433 (0.510)	Data 0.001 (0.009)	Loss 6.5128 (6.5059)	Top-1 acc 0.391 (0.503)	Top-5 acc 2.344 (2.240)	lr 0.04970
Warmup Train [2][3140/3239]	Time 0.379 (0.510)	Data 0.001 (0.009)	Loss 6.4501 (6.5058)	Top-1 acc 1.172 (0.504)	Top-5 acc 4.297 (2.244)	lr 0.04970
Warmup Train [2][3150/3239]	Time 0.587 (0.510)	Data 0.001 (0.009)	Loss 6.3817 (6.5056)	Top-1 acc 0.391 (0.504)	Top-5 acc 5.078 (2.246)	lr 0.04970
Warmup Train [2][3160/3239]	Time 0.358 (0.510)	Data 0.001 (0.009)	Loss 6.4477 (6.5054)	Top-1 acc 1.562 (0.505)	Top-5 acc 4.688 (2.249)	lr 0.04970
Warmup Train [2][3170/3239]	Time 0.467 (0.510)	Data 0.001 (0.009)	Loss 6.4319 (6.5052)	Top-1 acc 0.000 (0.505)	Top-5 acc 2.734 (2.252)	lr 0.04970
Warmup Train [2][3180/3239]	Time 0.397 (0.510)	Data 0.000 (0.009)	Loss 6.4502 (6.5050)	Top-1 acc 1.172 (0.505)	Top-5 acc 3.516 (2.255)	lr 0.04970
Warmup Train [2][3190/3239]	Time 0.514 (0.510)	Data 0.000 (0.009)	Loss 6.4429 (6.5048)	Top-1 acc 0.000 (0.506)	Top-5 acc 1.562 (2.257)	lr 0.04970
Warmup Train [2][3200/3239]	Time 0.368 (0.510)	Data 0.000 (0.009)	Loss 6.4575 (6.5046)	Top-1 acc 0.000 (0.507)	Top-5 acc 1.562 (2.258)	lr 0.04970
Warmup Train [2][3210/3239]	Time 0.572 (0.510)	Data 0.000 (0.009)	Loss 6.4340 (6.5044)	Top-1 acc 0.781 (0.507)	Top-5 acc 4.297 (2.262)	lr 0.04970
Warmup Train [2][3220/3239]	Time 0.521 (0.510)	Data 0.000 (0.009)	Loss 6.4229 (6.5042)	Top-1 acc 1.562 (0.508)	Top-5 acc 5.078 (2.264)	lr 0.04969
Warmup Train [2][3230/3239]	Time 0.613 (0.510)	Data 0.000 (0.009)	Loss 6.4850 (6.5040)	Top-1 acc 0.781 (0.509)	Top-5 acc 5.859 (2.268)	lr 0.04969
Warmup Train [2][3239/3239]	Time 0.899 (0.510)	Data 0.000 (0.009)	Loss 6.5604 (6.5039)	Top-1 acc 0.000 (0.509)	Top-5 acc 0.000 (2.270)	lr 0.04969
==========Warmup Valid [2/40]	loss 6.278	top-1 acc 0.682	top-5 acc 3.270	Train top-1 0.509	top-5 2.270	flops: 442.4M
Warmup Train [3][0/3239]	Time 9.729 (9.729)	Data 9.015 (9.015)	Loss 6.4560 (6.4560)	Top-1 acc 0.391 (0.391)	Top-5 acc 2.734 (2.734)	lr 0.04969
Warmup Train [3][10/3239]	Time 0.620 (1.431)	Data 0.002 (0.838)	Loss 6.4009 (6.4405)	Top-1 acc 0.781 (1.065)	Top-5 acc 3.125 (3.303)	lr 0.04969
Warmup Train [3][20/3239]	Time 0.652 (0.996)	Data 0.001 (0.440)	Loss 6.3993 (6.4385)	Top-1 acc 0.000 (0.893)	Top-5 acc 3.516 (3.330)	lr 0.04969
Warmup Train [3][30/3239]	Time 0.625 (0.838)	Data 0.001 (0.301)	Loss 6.4614 (6.4371)	Top-1 acc 0.781 (0.743)	Top-5 acc 2.734 (3.125)	lr 0.04969
Warmup Train [3][40/3239]	Time 0.664 (0.761)	Data 0.001 (0.230)	Loss 6.4859 (6.4408)	Top-1 acc 0.391 (0.762)	Top-5 acc 2.734 (3.096)	lr 0.04969
Warmup Train [3][50/3239]	Time 0.503 (0.710)	Data 0.001 (0.185)	Loss 6.4209 (6.4426)	Top-1 acc 0.391 (0.751)	Top-5 acc 1.562 (2.926)	lr 0.04969
Warmup Train [3][60/3239]	Time 0.473 (0.677)	Data 0.001 (0.156)	Loss 6.4731 (6.4420)	Top-1 acc 0.391 (0.743)	Top-5 acc 1.562 (2.965)	lr 0.04969
Warmup Train [3][70/3239]	Time 0.435 (0.652)	Data 0.001 (0.134)	Loss 6.4974 (6.4451)	Top-1 acc 0.781 (0.721)	Top-5 acc 1.953 (2.888)	lr 0.04969
Warmup Train [3][80/3239]	Time 0.550 (0.634)	Data 0.001 (0.119)	Loss 6.4579 (6.4459)	Top-1 acc 0.781 (0.719)	Top-5 acc 3.125 (2.918)	lr 0.04968
Warmup Train [3][90/3239]	Time 0.477 (0.619)	Data 0.001 (0.106)	Loss 6.4393 (6.4462)	Top-1 acc 0.391 (0.730)	Top-5 acc 2.344 (2.902)	lr 0.04968
Warmup Train [3][100/3239]	Time 0.500 (0.608)	Data 0.001 (0.096)	Loss 6.4890 (6.4472)	Top-1 acc 1.172 (0.743)	Top-5 acc 3.125 (2.866)	lr 0.04968
Warmup Train [3][110/3239]	Time 0.514 (0.600)	Data 0.001 (0.088)	Loss 6.4072 (6.4469)	Top-1 acc 1.172 (0.736)	Top-5 acc 4.297 (2.872)	lr 0.04968
Warmup Train [3][120/3239]	Time 0.476 (0.594)	Data 0.001 (0.081)	Loss 6.4702 (6.4477)	Top-1 acc 0.391 (0.713)	Top-5 acc 2.344 (2.883)	lr 0.04968
Warmup Train [3][130/3239]	Time 0.518 (0.587)	Data 0.001 (0.075)	Loss 6.4368 (6.4473)	Top-1 acc 1.953 (0.722)	Top-5 acc 4.297 (2.907)	lr 0.04968
Warmup Train [3][140/3239]	Time 0.593 (0.582)	Data 0.001 (0.070)	Loss 6.4728 (6.4472)	Top-1 acc 0.781 (0.712)	Top-5 acc 3.125 (2.901)	lr 0.04968
Warmup Train [3][150/3239]	Time 0.588 (0.578)	Data 0.001 (0.066)	Loss 6.4186 (6.4475)	Top-1 acc 1.172 (0.714)	Top-5 acc 4.297 (2.913)	lr 0.04968
Warmup Train [3][160/3239]	Time 0.591 (0.571)	Data 0.001 (0.062)	Loss 6.4083 (6.4481)	Top-1 acc 1.172 (0.708)	Top-5 acc 5.078 (2.911)	lr 0.04968
Warmup Train [3][170/3239]	Time 0.515 (0.568)	Data 0.002 (0.059)	Loss 6.4621 (6.4479)	Top-1 acc 0.391 (0.688)	Top-5 acc 4.297 (2.929)	lr 0.04968
Warmup Train [3][180/3239]	Time 0.542 (0.563)	Data 0.001 (0.056)	Loss 6.4200 (6.4479)	Top-1 acc 1.562 (0.697)	Top-5 acc 3.906 (2.937)	lr 0.04967
Warmup Train [3][190/3239]	Time 0.505 (0.559)	Data 0.001 (0.053)	Loss 6.4487 (6.4481)	Top-1 acc 0.781 (0.697)	Top-5 acc 2.344 (2.931)	lr 0.04967
Warmup Train [3][200/3239]	Time 0.512 (0.553)	Data 0.001 (0.051)	Loss 6.4162 (6.4481)	Top-1 acc 0.781 (0.690)	Top-5 acc 3.516 (2.909)	lr 0.04967
Warmup Train [3][210/3239]	Time 0.446 (0.551)	Data 0.001 (0.048)	Loss 6.4715 (6.4479)	Top-1 acc 0.391 (0.685)	Top-5 acc 3.125 (2.912)	lr 0.04967
Warmup Train [3][220/3239]	Time 0.578 (0.550)	Data 0.001 (0.047)	Loss 6.4251 (6.4482)	Top-1 acc 0.781 (0.686)	Top-5 acc 3.125 (2.902)	lr 0.04967
Warmup Train [3][230/3239]	Time 0.559 (0.549)	Data 0.001 (0.045)	Loss 6.3997 (6.4479)	Top-1 acc 1.953 (0.683)	Top-5 acc 3.906 (2.876)	lr 0.04967
Warmup Train [3][240/3239]	Time 0.562 (0.547)	Data 0.001 (0.043)	Loss 6.4101 (6.4474)	Top-1 acc 0.391 (0.694)	Top-5 acc 3.125 (2.880)	lr 0.04967
Warmup Train [3][250/3239]	Time 0.651 (0.546)	Data 0.001 (0.041)	Loss 6.3285 (6.4469)	Top-1 acc 1.562 (0.691)	Top-5 acc 4.688 (2.873)	lr 0.04967
Warmup Train [3][260/3239]	Time 0.406 (0.544)	Data 0.001 (0.040)	Loss 6.5124 (6.4479)	Top-1 acc 0.000 (0.681)	Top-5 acc 0.391 (2.856)	lr 0.04967
Warmup Train [3][270/3239]	Time 0.623 (0.542)	Data 0.001 (0.039)	Loss 6.4016 (6.4480)	Top-1 acc 1.562 (0.688)	Top-5 acc 3.906 (2.861)	lr 0.04967
Warmup Train [3][280/3239]	Time 0.531 (0.541)	Data 0.001 (0.038)	Loss 6.4720 (6.4475)	Top-1 acc 0.781 (0.678)	Top-5 acc 3.125 (2.880)	lr 0.04967
Warmup Train [3][290/3239]	Time 0.573 (0.540)	Data 0.001 (0.036)	Loss 6.4108 (6.4475)	Top-1 acc 1.172 (0.677)	Top-5 acc 3.906 (2.902)	lr 0.04966
Warmup Train [3][300/3239]	Time 0.495 (0.539)	Data 0.001 (0.035)	Loss 6.4338 (6.4479)	Top-1 acc 0.000 (0.684)	Top-5 acc 0.781 (2.895)	lr 0.04966
Warmup Train [3][310/3239]	Time 0.402 (0.537)	Data 0.001 (0.034)	Loss 6.4304 (6.4473)	Top-1 acc 0.391 (0.682)	Top-5 acc 2.344 (2.903)	lr 0.04966
Warmup Train [3][320/3239]	Time 0.528 (0.536)	Data 0.001 (0.034)	Loss 6.4379 (6.4468)	Top-1 acc 0.391 (0.685)	Top-5 acc 3.125 (2.913)	lr 0.04966
Warmup Train [3][330/3239]	Time 0.547 (0.535)	Data 0.001 (0.033)	Loss 6.4815 (6.4470)	Top-1 acc 1.953 (0.693)	Top-5 acc 3.125 (2.936)	lr 0.04966
Warmup Train [3][340/3239]	Time 0.715 (0.534)	Data 0.001 (0.032)	Loss 6.4967 (6.4473)	Top-1 acc 1.172 (0.687)	Top-5 acc 2.734 (2.934)	lr 0.04966
Warmup Train [3][350/3239]	Time 0.674 (0.534)	Data 0.001 (0.031)	Loss 6.4363 (6.4472)	Top-1 acc 0.781 (0.690)	Top-5 acc 3.906 (2.939)	lr 0.04966
Warmup Train [3][360/3239]	Time 0.473 (0.533)	Data 0.001 (0.030)	Loss 6.3798 (6.4466)	Top-1 acc 1.172 (0.690)	Top-5 acc 6.250 (2.940)	lr 0.04966
Warmup Train [3][370/3239]	Time 0.490 (0.532)	Data 0.001 (0.029)	Loss 6.4522 (6.4467)	Top-1 acc 0.781 (0.689)	Top-5 acc 2.344 (2.931)	lr 0.04966
Warmup Train [3][380/3239]	Time 0.353 (0.531)	Data 0.001 (0.029)	Loss 6.4324 (6.4463)	Top-1 acc 0.781 (0.692)	Top-5 acc 4.297 (2.951)	lr 0.04966
Warmup Train [3][390/3239]	Time 0.482 (0.531)	Data 0.001 (0.029)	Loss 6.4129 (6.4464)	Top-1 acc 2.344 (0.696)	Top-5 acc 5.469 (2.959)	lr 0.04965
Warmup Train [3][400/3239]	Time 0.649 (0.531)	Data 0.001 (0.028)	Loss 6.4275 (6.4464)	Top-1 acc 1.172 (0.691)	Top-5 acc 3.125 (2.957)	lr 0.04965
Warmup Train [3][410/3239]	Time 0.437 (0.530)	Data 0.001 (0.027)	Loss 6.3723 (6.4458)	Top-1 acc 0.781 (0.686)	Top-5 acc 3.906 (2.954)	lr 0.04965
Warmup Train [3][420/3239]	Time 0.659 (0.529)	Data 0.001 (0.027)	Loss 6.5151 (6.4461)	Top-1 acc 0.391 (0.686)	Top-5 acc 1.562 (2.946)	lr 0.04965
Warmup Train [3][430/3239]	Time 0.458 (0.528)	Data 0.001 (0.027)	Loss 6.4280 (6.4464)	Top-1 acc 0.000 (0.683)	Top-5 acc 3.906 (2.947)	lr 0.04965
Warmup Train [3][440/3239]	Time 0.443 (0.527)	Data 0.001 (0.026)	Loss 6.4882 (6.4462)	Top-1 acc 1.172 (0.684)	Top-5 acc 1.953 (2.941)	lr 0.04965
Warmup Train [3][450/3239]	Time 0.512 (0.526)	Data 0.001 (0.026)	Loss 6.4297 (6.4460)	Top-1 acc 0.781 (0.683)	Top-5 acc 1.562 (2.938)	lr 0.04965
Warmup Train [3][460/3239]	Time 0.593 (0.525)	Data 0.001 (0.025)	Loss 6.4162 (6.4456)	Top-1 acc 0.781 (0.680)	Top-5 acc 3.906 (2.939)	lr 0.04965
Warmup Train [3][470/3239]	Time 0.504 (0.525)	Data 0.002 (0.025)	Loss 6.4782 (6.4451)	Top-1 acc 1.172 (0.683)	Top-5 acc 3.516 (2.952)	lr 0.04965
Warmup Train [3][480/3239]	Time 0.598 (0.525)	Data 0.001 (0.024)	Loss 6.4882 (6.4446)	Top-1 acc 0.391 (0.682)	Top-5 acc 3.125 (2.955)	lr 0.04965
Warmup Train [3][490/3239]	Time 0.535 (0.525)	Data 0.001 (0.024)	Loss 6.4542 (6.4445)	Top-1 acc 0.000 (0.679)	Top-5 acc 2.734 (2.960)	lr 0.04964
Warmup Train [3][500/3239]	Time 0.409 (0.524)	Data 0.001 (0.024)	Loss 6.4764 (6.4443)	Top-1 acc 0.781 (0.681)	Top-5 acc 1.562 (2.959)	lr 0.04964
Warmup Train [3][510/3239]	Time 0.492 (0.524)	Data 0.002 (0.023)	Loss 6.4595 (6.4442)	Top-1 acc 0.391 (0.683)	Top-5 acc 3.516 (2.964)	lr 0.04964
Warmup Train [3][520/3239]	Time 0.479 (0.524)	Data 0.001 (0.023)	Loss 6.4875 (6.4442)	Top-1 acc 0.391 (0.685)	Top-5 acc 1.953 (2.965)	lr 0.04964
Warmup Train [3][530/3239]	Time 0.446 (0.523)	Data 0.001 (0.022)	Loss 6.4687 (6.4443)	Top-1 acc 0.781 (0.682)	Top-5 acc 3.906 (2.962)	lr 0.04964
Warmup Train [3][540/3239]	Time 0.667 (0.523)	Data 0.001 (0.022)	Loss 6.4095 (6.4440)	Top-1 acc 1.172 (0.677)	Top-5 acc 4.688 (2.965)	lr 0.04964
Warmup Train [3][550/3239]	Time 0.374 (0.523)	Data 0.001 (0.022)	Loss 6.4776 (6.4437)	Top-1 acc 0.781 (0.677)	Top-5 acc 2.734 (2.970)	lr 0.04964
Warmup Train [3][560/3239]	Time 0.475 (0.523)	Data 0.001 (0.022)	Loss 6.4307 (6.4431)	Top-1 acc 1.172 (0.678)	Top-5 acc 1.953 (2.973)	lr 0.04964
Warmup Train [3][570/3239]	Time 0.551 (0.522)	Data 0.001 (0.021)	Loss 6.3893 (6.4429)	Top-1 acc 0.000 (0.677)	Top-5 acc 4.297 (2.973)	lr 0.04964
Warmup Train [3][580/3239]	Time 0.394 (0.522)	Data 0.001 (0.021)	Loss 6.4481 (6.4431)	Top-1 acc 0.391 (0.674)	Top-5 acc 2.734 (2.974)	lr 0.04963
Warmup Train [3][590/3239]	Time 0.448 (0.521)	Data 0.001 (0.021)	Loss 6.4403 (6.4428)	Top-1 acc 1.172 (0.674)	Top-5 acc 5.078 (2.977)	lr 0.04963
Warmup Train [3][600/3239]	Time 0.527 (0.521)	Data 0.001 (0.021)	Loss 6.4403 (6.4428)	Top-1 acc 1.172 (0.671)	Top-5 acc 3.125 (2.978)	lr 0.04963
Warmup Train [3][610/3239]	Time 0.637 (0.522)	Data 0.001 (0.020)	Loss 6.4073 (6.4429)	Top-1 acc 1.172 (0.670)	Top-5 acc 2.734 (2.967)	lr 0.04963
Warmup Train [3][620/3239]	Time 0.511 (0.522)	Data 0.001 (0.020)	Loss 6.4342 (6.4429)	Top-1 acc 0.391 (0.668)	Top-5 acc 5.469 (2.968)	lr 0.04963
Warmup Train [3][630/3239]	Time 0.616 (0.521)	Data 0.001 (0.020)	Loss 6.4322 (6.4426)	Top-1 acc 0.781 (0.674)	Top-5 acc 1.562 (2.978)	lr 0.04963
Warmup Train [3][640/3239]	Time 0.507 (0.521)	Data 0.001 (0.020)	Loss 6.4293 (6.4421)	Top-1 acc 0.391 (0.673)	Top-5 acc 2.344 (2.981)	lr 0.04963
Warmup Train [3][650/3239]	Time 0.355 (0.521)	Data 0.001 (0.019)	Loss 6.3976 (6.4418)	Top-1 acc 1.172 (0.677)	Top-5 acc 4.297 (2.981)	lr 0.04963
Warmup Train [3][660/3239]	Time 0.587 (0.521)	Data 0.001 (0.019)	Loss 6.3232 (6.4414)	Top-1 acc 1.562 (0.678)	Top-5 acc 3.516 (2.987)	lr 0.04963
Warmup Train [3][670/3239]	Time 0.674 (0.521)	Data 0.001 (0.019)	Loss 6.4722 (6.4416)	Top-1 acc 0.781 (0.679)	Top-5 acc 3.906 (2.982)	lr 0.04963
Warmup Train [3][680/3239]	Time 0.530 (0.520)	Data 0.001 (0.019)	Loss 6.4534 (6.4416)	Top-1 acc 0.781 (0.677)	Top-5 acc 2.344 (2.972)	lr 0.04962
Warmup Train [3][690/3239]	Time 0.376 (0.519)	Data 0.001 (0.019)	Loss 6.4275 (6.4416)	Top-1 acc 0.781 (0.675)	Top-5 acc 3.516 (2.970)	lr 0.04962
Warmup Train [3][700/3239]	Time 0.532 (0.518)	Data 0.001 (0.018)	Loss 6.4360 (6.4416)	Top-1 acc 0.781 (0.674)	Top-5 acc 3.125 (2.972)	lr 0.04962
Warmup Train [3][710/3239]	Time 0.500 (0.518)	Data 0.001 (0.018)	Loss 6.4805 (6.4415)	Top-1 acc 0.781 (0.671)	Top-5 acc 2.734 (2.970)	lr 0.04962
Warmup Train [3][720/3239]	Time 0.640 (0.517)	Data 0.001 (0.018)	Loss 6.5125 (6.4415)	Top-1 acc 0.000 (0.670)	Top-5 acc 1.172 (2.971)	lr 0.04962
Warmup Train [3][730/3239]	Time 0.526 (0.517)	Data 0.001 (0.018)	Loss 6.3907 (6.4411)	Top-1 acc 0.000 (0.672)	Top-5 acc 3.906 (2.978)	lr 0.04962
Warmup Train [3][740/3239]	Time 0.497 (0.516)	Data 0.001 (0.018)	Loss 6.4372 (6.4411)	Top-1 acc 1.172 (0.674)	Top-5 acc 4.297 (2.986)	lr 0.04962
Warmup Train [3][750/3239]	Time 0.491 (0.516)	Data 0.001 (0.017)	Loss 6.3824 (6.4409)	Top-1 acc 0.781 (0.677)	Top-5 acc 3.906 (2.992)	lr 0.04962
Warmup Train [3][760/3239]	Time 0.501 (0.516)	Data 0.001 (0.017)	Loss 6.3956 (6.4407)	Top-1 acc 0.391 (0.677)	Top-5 acc 2.344 (2.988)	lr 0.04962
Warmup Train [3][770/3239]	Time 0.582 (0.517)	Data 0.001 (0.017)	Loss 6.3954 (6.4404)	Top-1 acc 0.781 (0.680)	Top-5 acc 3.906 (2.993)	lr 0.04961
Warmup Train [3][780/3239]	Time 0.680 (0.517)	Data 0.001 (0.017)	Loss 6.3596 (6.4399)	Top-1 acc 0.391 (0.682)	Top-5 acc 2.734 (2.996)	lr 0.04961
Warmup Train [3][790/3239]	Time 0.626 (0.517)	Data 0.001 (0.017)	Loss 6.4179 (6.4395)	Top-1 acc 1.562 (0.681)	Top-5 acc 3.906 (2.996)	lr 0.04961
Warmup Train [3][800/3239]	Time 0.562 (0.517)	Data 0.001 (0.016)	Loss 6.4263 (6.4393)	Top-1 acc 0.000 (0.679)	Top-5 acc 3.516 (3.003)	lr 0.04961
Warmup Train [3][810/3239]	Time 0.569 (0.516)	Data 0.001 (0.016)	Loss 6.4433 (6.4390)	Top-1 acc 0.391 (0.681)	Top-5 acc 2.734 (3.008)	lr 0.04961
Warmup Train [3][820/3239]	Time 0.628 (0.516)	Data 0.001 (0.016)	Loss 6.3770 (6.4386)	Top-1 acc 0.391 (0.681)	Top-5 acc 1.953 (3.008)	lr 0.04961
Warmup Train [3][830/3239]	Time 0.529 (0.516)	Data 0.001 (0.016)	Loss 6.4823 (6.4385)	Top-1 acc 0.391 (0.680)	Top-5 acc 1.172 (3.003)	lr 0.04961
Warmup Train [3][840/3239]	Time 0.388 (0.516)	Data 0.001 (0.016)	Loss 6.4046 (6.4383)	Top-1 acc 1.562 (0.683)	Top-5 acc 3.125 (3.012)	lr 0.04961
Warmup Train [3][850/3239]	Time 0.574 (0.516)	Data 0.001 (0.016)	Loss 6.4786 (6.4383)	Top-1 acc 0.391 (0.682)	Top-5 acc 2.734 (3.010)	lr 0.04961
Warmup Train [3][860/3239]	Time 0.565 (0.516)	Data 0.001 (0.016)	Loss 6.4496 (6.4382)	Top-1 acc 0.391 (0.680)	Top-5 acc 3.125 (3.013)	lr 0.04961
Warmup Train [3][870/3239]	Time 0.470 (0.516)	Data 0.001 (0.016)	Loss 6.4143 (6.4380)	Top-1 acc 1.953 (0.680)	Top-5 acc 5.078 (3.016)	lr 0.04960
Warmup Train [3][880/3239]	Time 0.528 (0.516)	Data 0.001 (0.015)	Loss 6.3621 (6.4379)	Top-1 acc 1.172 (0.681)	Top-5 acc 2.734 (3.013)	lr 0.04960
Warmup Train [3][890/3239]	Time 0.596 (0.516)	Data 0.002 (0.015)	Loss 6.3681 (6.4378)	Top-1 acc 1.172 (0.684)	Top-5 acc 3.906 (3.021)	lr 0.04960
Warmup Train [3][900/3239]	Time 0.604 (0.515)	Data 0.001 (0.015)	Loss 6.4254 (6.4374)	Top-1 acc 0.781 (0.688)	Top-5 acc 3.516 (3.030)	lr 0.04960
Warmup Train [3][910/3239]	Time 0.549 (0.515)	Data 0.001 (0.015)	Loss 6.4554 (6.4374)	Top-1 acc 1.172 (0.691)	Top-5 acc 5.859 (3.033)	lr 0.04960
Warmup Train [3][920/3239]	Time 0.557 (0.515)	Data 0.001 (0.015)	Loss 6.4428 (6.4374)	Top-1 acc 0.391 (0.690)	Top-5 acc 1.562 (3.031)	lr 0.04960
Warmup Train [3][930/3239]	Time 0.333 (0.515)	Data 0.001 (0.015)	Loss 6.4023 (6.4372)	Top-1 acc 1.562 (0.691)	Top-5 acc 2.734 (3.033)	lr 0.04960
Warmup Train [3][940/3239]	Time 0.345 (0.515)	Data 0.001 (0.015)	Loss 6.3975 (6.4370)	Top-1 acc 0.391 (0.692)	Top-5 acc 3.125 (3.031)	lr 0.04960
Warmup Train [3][950/3239]	Time 0.585 (0.515)	Data 0.001 (0.015)	Loss 6.3448 (6.4370)	Top-1 acc 1.172 (0.693)	Top-5 acc 5.469 (3.035)	lr 0.04960
Warmup Train [3][960/3239]	Time 0.363 (0.514)	Data 0.001 (0.015)	Loss 6.3909 (6.4369)	Top-1 acc 0.000 (0.691)	Top-5 acc 3.906 (3.038)	lr 0.04959
Warmup Train [3][970/3239]	Time 0.485 (0.514)	Data 0.001 (0.015)	Loss 6.4545 (6.4368)	Top-1 acc 1.562 (0.692)	Top-5 acc 3.125 (3.042)	lr 0.04959
Warmup Train [3][980/3239]	Time 0.506 (0.513)	Data 0.001 (0.015)	Loss 6.3909 (6.4366)	Top-1 acc 0.781 (0.697)	Top-5 acc 3.125 (3.049)	lr 0.04959
Warmup Train [3][990/3239]	Time 0.569 (0.513)	Data 0.001 (0.014)	Loss 6.4030 (6.4366)	Top-1 acc 0.391 (0.696)	Top-5 acc 2.344 (3.049)	lr 0.04959
Warmup Train [3][1000/3239]	Time 0.565 (0.514)	Data 0.001 (0.014)	Loss 6.3960 (6.4364)	Top-1 acc 0.781 (0.695)	Top-5 acc 1.953 (3.046)	lr 0.04959
Warmup Train [3][1010/3239]	Time 0.655 (0.514)	Data 0.001 (0.014)	Loss 6.4278 (6.4363)	Top-1 acc 0.391 (0.695)	Top-5 acc 3.125 (3.046)	lr 0.04959
Warmup Train [3][1020/3239]	Time 0.452 (0.513)	Data 0.001 (0.014)	Loss 6.4290 (6.4360)	Top-1 acc 0.391 (0.697)	Top-5 acc 0.391 (3.044)	lr 0.04959
Warmup Train [3][1030/3239]	Time 0.455 (0.513)	Data 0.001 (0.014)	Loss 6.4403 (6.4358)	Top-1 acc 0.391 (0.700)	Top-5 acc 4.297 (3.048)	lr 0.04959
Warmup Train [3][1040/3239]	Time 0.516 (0.513)	Data 0.001 (0.014)	Loss 6.4360 (6.4356)	Top-1 acc 1.172 (0.704)	Top-5 acc 5.078 (3.053)	lr 0.04959
Warmup Train [3][1050/3239]	Time 0.417 (0.513)	Data 0.001 (0.014)	Loss 6.4339 (6.4354)	Top-1 acc 0.781 (0.705)	Top-5 acc 1.953 (3.055)	lr 0.04958
Warmup Train [3][1060/3239]	Time 0.535 (0.513)	Data 0.001 (0.014)	Loss 6.4563 (6.4355)	Top-1 acc 0.391 (0.704)	Top-5 acc 3.516 (3.054)	lr 0.04958
Warmup Train [3][1070/3239]	Time 0.506 (0.513)	Data 0.001 (0.014)	Loss 6.4513 (6.4351)	Top-1 acc 1.172 (0.707)	Top-5 acc 3.125 (3.061)	lr 0.04958
Warmup Train [3][1080/3239]	Time 0.526 (0.513)	Data 0.001 (0.014)	Loss 6.4556 (6.4351)	Top-1 acc 0.781 (0.710)	Top-5 acc 1.953 (3.061)	lr 0.04958
Warmup Train [3][1090/3239]	Time 0.406 (0.513)	Data 0.001 (0.014)	Loss 6.4616 (6.4349)	Top-1 acc 0.781 (0.710)	Top-5 acc 5.469 (3.061)	lr 0.04958
Warmup Train [3][1100/3239]	Time 0.757 (0.513)	Data 0.001 (0.014)	Loss 6.4432 (6.4347)	Top-1 acc 0.000 (0.711)	Top-5 acc 2.344 (3.063)	lr 0.04958
Warmup Train [3][1110/3239]	Time 0.544 (0.513)	Data 0.001 (0.014)	Loss 6.3740 (6.4345)	Top-1 acc 0.781 (0.712)	Top-5 acc 5.078 (3.068)	lr 0.04958
Warmup Train [3][1120/3239]	Time 0.525 (0.513)	Data 0.001 (0.013)	Loss 6.3375 (6.4342)	Top-1 acc 1.172 (0.715)	Top-5 acc 6.250 (3.074)	lr 0.04958
Warmup Train [3][1130/3239]	Time 0.443 (0.513)	Data 0.001 (0.013)	Loss 6.3824 (6.4340)	Top-1 acc 0.391 (0.716)	Top-5 acc 2.734 (3.080)	lr 0.04958
Warmup Train [3][1140/3239]	Time 0.553 (0.513)	Data 0.001 (0.013)	Loss 6.3671 (6.4338)	Top-1 acc 0.781 (0.718)	Top-5 acc 3.125 (3.083)	lr 0.04957
Warmup Train [3][1150/3239]	Time 0.524 (0.513)	Data 0.001 (0.013)	Loss 6.4315 (6.4334)	Top-1 acc 0.781 (0.719)	Top-5 acc 3.125 (3.087)	lr 0.04957
Warmup Train [3][1160/3239]	Time 0.625 (0.513)	Data 0.001 (0.013)	Loss 6.5059 (6.4332)	Top-1 acc 0.781 (0.718)	Top-5 acc 3.125 (3.091)	lr 0.04957
Warmup Train [3][1170/3239]	Time 0.498 (0.513)	Data 0.001 (0.013)	Loss 6.5004 (6.4330)	Top-1 acc 0.781 (0.719)	Top-5 acc 2.734 (3.097)	lr 0.04957
Warmup Train [3][1180/3239]	Time 0.510 (0.513)	Data 0.001 (0.013)	Loss 6.4567 (6.4331)	Top-1 acc 0.391 (0.717)	Top-5 acc 2.734 (3.094)	lr 0.04957
Warmup Train [3][1190/3239]	Time 0.496 (0.513)	Data 0.001 (0.013)	Loss 6.4394 (6.4329)	Top-1 acc 0.781 (0.717)	Top-5 acc 4.297 (3.094)	lr 0.04957
Warmup Train [3][1200/3239]	Time 0.358 (0.513)	Data 0.001 (0.013)	Loss 6.4057 (6.4327)	Top-1 acc 0.781 (0.718)	Top-5 acc 3.125 (3.097)	lr 0.04957
Warmup Train [3][1210/3239]	Time 0.487 (0.513)	Data 0.001 (0.013)	Loss 6.3607 (6.4324)	Top-1 acc 0.781 (0.718)	Top-5 acc 3.516 (3.100)	lr 0.04957
Warmup Train [3][1220/3239]	Time 0.328 (0.512)	Data 0.001 (0.013)	Loss 6.3865 (6.4322)	Top-1 acc 0.391 (0.717)	Top-5 acc 3.125 (3.105)	lr 0.04957
Warmup Train [3][1230/3239]	Time 0.377 (0.512)	Data 0.001 (0.013)	Loss 6.4507 (6.4318)	Top-1 acc 1.172 (0.716)	Top-5 acc 3.906 (3.112)	lr 0.04956
Warmup Train [3][1240/3239]	Time 0.488 (0.512)	Data 0.001 (0.013)	Loss 6.4408 (6.4317)	Top-1 acc 0.391 (0.715)	Top-5 acc 1.562 (3.110)	lr 0.04956
Warmup Train [3][1250/3239]	Time 0.675 (0.512)	Data 0.001 (0.013)	Loss 6.4523 (6.4316)	Top-1 acc 1.172 (0.718)	Top-5 acc 3.516 (3.112)	lr 0.04956
Warmup Train [3][1260/3239]	Time 0.468 (0.512)	Data 0.001 (0.013)	Loss 6.4179 (6.4315)	Top-1 acc 1.953 (0.720)	Top-5 acc 3.906 (3.115)	lr 0.04956
Warmup Train [3][1270/3239]	Time 0.386 (0.512)	Data 0.001 (0.013)	Loss 6.3833 (6.4313)	Top-1 acc 0.000 (0.719)	Top-5 acc 3.125 (3.114)	lr 0.04956
Warmup Train [3][1280/3239]	Time 0.587 (0.512)	Data 0.001 (0.013)	Loss 6.4191 (6.4311)	Top-1 acc 0.781 (0.721)	Top-5 acc 3.516 (3.116)	lr 0.04956
Warmup Train [3][1290/3239]	Time 0.497 (0.512)	Data 0.001 (0.013)	Loss 6.3977 (6.4310)	Top-1 acc 1.562 (0.721)	Top-5 acc 5.859 (3.117)	lr 0.04956
Warmup Train [3][1300/3239]	Time 0.511 (0.512)	Data 0.001 (0.013)	Loss 6.4597 (6.4309)	Top-1 acc 0.781 (0.721)	Top-5 acc 2.344 (3.117)	lr 0.04956
Warmup Train [3][1310/3239]	Time 0.686 (0.512)	Data 0.001 (0.013)	Loss 6.5073 (6.4309)	Top-1 acc 0.781 (0.723)	Top-5 acc 3.906 (3.121)	lr 0.04956
Warmup Train [3][1320/3239]	Time 0.356 (0.512)	Data 0.001 (0.013)	Loss 6.3876 (6.4308)	Top-1 acc 0.391 (0.722)	Top-5 acc 2.734 (3.120)	lr 0.04955
Warmup Train [3][1330/3239]	Time 0.621 (0.512)	Data 0.001 (0.013)	Loss 6.3377 (6.4308)	Top-1 acc 1.953 (0.725)	Top-5 acc 6.641 (3.126)	lr 0.04955
Warmup Train [3][1340/3239]	Time 0.333 (0.512)	Data 0.001 (0.012)	Loss 6.3643 (6.4307)	Top-1 acc 1.172 (0.726)	Top-5 acc 6.250 (3.134)	lr 0.04955
Warmup Train [3][1350/3239]	Time 0.519 (0.512)	Data 0.001 (0.012)	Loss 6.4354 (6.4305)	Top-1 acc 1.172 (0.726)	Top-5 acc 3.125 (3.135)	lr 0.04955
Warmup Train [3][1360/3239]	Time 0.499 (0.512)	Data 0.001 (0.012)	Loss 6.4040 (6.4305)	Top-1 acc 0.781 (0.728)	Top-5 acc 2.344 (3.135)	lr 0.04955
Warmup Train [3][1370/3239]	Time 0.536 (0.512)	Data 0.001 (0.012)	Loss 6.4377 (6.4302)	Top-1 acc 0.391 (0.730)	Top-5 acc 1.562 (3.140)	lr 0.04955
Warmup Train [3][1380/3239]	Time 0.454 (0.512)	Data 0.001 (0.012)	Loss 6.4555 (6.4301)	Top-1 acc 0.391 (0.730)	Top-5 acc 3.125 (3.141)	lr 0.04955
Warmup Train [3][1390/3239]	Time 0.679 (0.512)	Data 0.001 (0.012)	Loss 6.4575 (6.4302)	Top-1 acc 0.000 (0.730)	Top-5 acc 1.562 (3.140)	lr 0.04955
Warmup Train [3][1400/3239]	Time 0.503 (0.512)	Data 0.001 (0.012)	Loss 6.3535 (6.4300)	Top-1 acc 2.344 (0.732)	Top-5 acc 7.031 (3.145)	lr 0.04955
Warmup Train [3][1410/3239]	Time 0.468 (0.512)	Data 0.001 (0.012)	Loss 6.4406 (6.4300)	Top-1 acc 0.000 (0.731)	Top-5 acc 1.953 (3.142)	lr 0.04954
Warmup Train [3][1420/3239]	Time 0.738 (0.512)	Data 0.001 (0.012)	Loss 6.3321 (6.4297)	Top-1 acc 0.391 (0.732)	Top-5 acc 5.078 (3.145)	lr 0.04954
Warmup Train [3][1430/3239]	Time 0.602 (0.512)	Data 0.001 (0.012)	Loss 6.4272 (6.4298)	Top-1 acc 0.781 (0.732)	Top-5 acc 1.953 (3.146)	lr 0.04954
Warmup Train [3][1440/3239]	Time 0.500 (0.512)	Data 0.001 (0.012)	Loss 6.4408 (6.4297)	Top-1 acc 0.781 (0.734)	Top-5 acc 3.516 (3.149)	lr 0.04954
Warmup Train [3][1450/3239]	Time 0.615 (0.512)	Data 0.001 (0.012)	Loss 6.2991 (6.4294)	Top-1 acc 1.953 (0.735)	Top-5 acc 5.078 (3.154)	lr 0.04954
Warmup Train [3][1460/3239]	Time 0.468 (0.512)	Data 0.001 (0.012)	Loss 6.5106 (6.4293)	Top-1 acc 0.781 (0.736)	Top-5 acc 3.906 (3.160)	lr 0.04954
Warmup Train [3][1470/3239]	Time 0.409 (0.512)	Data 0.001 (0.012)	Loss 6.4157 (6.4291)	Top-1 acc 0.000 (0.735)	Top-5 acc 4.297 (3.161)	lr 0.04954
Warmup Train [3][1480/3239]	Time 0.496 (0.511)	Data 0.001 (0.012)	Loss 6.4116 (6.4289)	Top-1 acc 0.391 (0.735)	Top-5 acc 2.344 (3.164)	lr 0.04954
Warmup Train [3][1490/3239]	Time 0.400 (0.511)	Data 0.001 (0.012)	Loss 6.3698 (6.4287)	Top-1 acc 1.172 (0.737)	Top-5 acc 4.688 (3.171)	lr 0.04953
Warmup Train [3][1500/3239]	Time 0.423 (0.511)	Data 0.001 (0.012)	Loss 6.4520 (6.4285)	Top-1 acc 0.000 (0.738)	Top-5 acc 2.734 (3.175)	lr 0.04953
Warmup Train [3][1510/3239]	Time 0.635 (0.511)	Data 0.001 (0.012)	Loss 6.3549 (6.4283)	Top-1 acc 0.781 (0.739)	Top-5 acc 5.078 (3.182)	lr 0.04953
Warmup Train [3][1520/3239]	Time 0.582 (0.511)	Data 0.001 (0.012)	Loss 6.4577 (6.4281)	Top-1 acc 0.000 (0.739)	Top-5 acc 1.562 (3.181)	lr 0.04953
Warmup Train [3][1530/3239]	Time 0.508 (0.511)	Data 0.001 (0.011)	Loss 6.4599 (6.4280)	Top-1 acc 0.000 (0.738)	Top-5 acc 3.125 (3.181)	lr 0.04953
Warmup Train [3][1540/3239]	Time 0.580 (0.511)	Data 0.001 (0.011)	Loss 6.4168 (6.4277)	Top-1 acc 1.172 (0.739)	Top-5 acc 4.297 (3.184)	lr 0.04953
Warmup Train [3][1550/3239]	Time 0.580 (0.511)	Data 0.001 (0.011)	Loss 6.4097 (6.4275)	Top-1 acc 0.781 (0.740)	Top-5 acc 1.562 (3.184)	lr 0.04953
Warmup Train [3][1560/3239]	Time 0.572 (0.511)	Data 0.001 (0.011)	Loss 6.4311 (6.4274)	Top-1 acc 1.172 (0.740)	Top-5 acc 2.734 (3.186)	lr 0.04953
Warmup Train [3][1570/3239]	Time 0.541 (0.511)	Data 0.001 (0.011)	Loss 6.3726 (6.4273)	Top-1 acc 0.781 (0.740)	Top-5 acc 3.125 (3.187)	lr 0.04953
Warmup Train [3][1580/3239]	Time 0.400 (0.511)	Data 0.001 (0.011)	Loss 6.4605 (6.4270)	Top-1 acc 0.000 (0.742)	Top-5 acc 2.344 (3.191)	lr 0.04952
Warmup Train [3][1590/3239]	Time 0.627 (0.511)	Data 0.001 (0.011)	Loss 6.3618 (6.4267)	Top-1 acc 1.562 (0.742)	Top-5 acc 5.859 (3.196)	lr 0.04952
Warmup Train [3][1600/3239]	Time 0.629 (0.511)	Data 0.001 (0.011)	Loss 6.3618 (6.4265)	Top-1 acc 0.781 (0.746)	Top-5 acc 3.516 (3.201)	lr 0.04952
Warmup Train [3][1610/3239]	Time 0.473 (0.511)	Data 0.001 (0.011)	Loss 6.3971 (6.4263)	Top-1 acc 0.391 (0.747)	Top-5 acc 1.953 (3.204)	lr 0.04952
Warmup Train [3][1620/3239]	Time 0.544 (0.511)	Data 0.001 (0.011)	Loss 6.4582 (6.4261)	Top-1 acc 0.391 (0.746)	Top-5 acc 3.906 (3.206)	lr 0.04952
Warmup Train [3][1630/3239]	Time 0.396 (0.511)	Data 0.001 (0.011)	Loss 6.3652 (6.4260)	Top-1 acc 0.391 (0.744)	Top-5 acc 3.125 (3.204)	lr 0.04952
Warmup Train [3][1640/3239]	Time 0.498 (0.511)	Data 0.002 (0.011)	Loss 6.3645 (6.4258)	Top-1 acc 1.172 (0.744)	Top-5 acc 4.297 (3.206)	lr 0.04952
Warmup Train [3][1650/3239]	Time 0.767 (0.511)	Data 0.001 (0.011)	Loss 6.4031 (6.4257)	Top-1 acc 0.391 (0.744)	Top-5 acc 5.078 (3.207)	lr 0.04952
Warmup Train [3][1660/3239]	Time 0.488 (0.511)	Data 0.001 (0.011)	Loss 6.3979 (6.4255)	Top-1 acc 0.000 (0.745)	Top-5 acc 3.906 (3.214)	lr 0.04951
Warmup Train [3][1670/3239]	Time 0.516 (0.511)	Data 0.001 (0.011)	Loss 6.3857 (6.4253)	Top-1 acc 0.391 (0.745)	Top-5 acc 5.078 (3.215)	lr 0.04951
Warmup Train [3][1680/3239]	Time 0.452 (0.511)	Data 0.001 (0.011)	Loss 6.4821 (6.4252)	Top-1 acc 0.000 (0.745)	Top-5 acc 4.297 (3.214)	lr 0.04951
Warmup Train [3][1690/3239]	Time 0.534 (0.511)	Data 0.001 (0.011)	Loss 6.3837 (6.4253)	Top-1 acc 0.000 (0.745)	Top-5 acc 4.297 (3.216)	lr 0.04951
Warmup Train [3][1700/3239]	Time 0.465 (0.511)	Data 0.001 (0.011)	Loss 6.3952 (6.4251)	Top-1 acc 0.781 (0.747)	Top-5 acc 4.297 (3.215)	lr 0.04951
Warmup Train [3][1710/3239]	Time 0.374 (0.511)	Data 0.001 (0.011)	Loss 6.3931 (6.4248)	Top-1 acc 0.781 (0.748)	Top-5 acc 3.906 (3.220)	lr 0.04951
Warmup Train [3][1720/3239]	Time 0.349 (0.510)	Data 0.001 (0.011)	Loss 6.3496 (6.4246)	Top-1 acc 0.781 (0.749)	Top-5 acc 3.906 (3.219)	lr 0.04951
Warmup Train [3][1730/3239]	Time 0.346 (0.510)	Data 0.001 (0.011)	Loss 6.4144 (6.4245)	Top-1 acc 0.391 (0.751)	Top-5 acc 2.734 (3.223)	lr 0.04951
Warmup Train [3][1740/3239]	Time 0.570 (0.510)	Data 0.001 (0.011)	Loss 6.4001 (6.4243)	Top-1 acc 1.562 (0.751)	Top-5 acc 3.906 (3.225)	lr 0.04951
Warmup Train [3][1750/3239]	Time 0.372 (0.510)	Data 0.001 (0.011)	Loss 6.4001 (6.4242)	Top-1 acc 0.391 (0.751)	Top-5 acc 2.344 (3.224)	lr 0.04950
Warmup Train [3][1760/3239]	Time 0.461 (0.510)	Data 0.001 (0.011)	Loss 6.4329 (6.4242)	Top-1 acc 0.781 (0.753)	Top-5 acc 1.953 (3.224)	lr 0.04950
Warmup Train [3][1770/3239]	Time 0.437 (0.510)	Data 0.001 (0.011)	Loss 6.4450 (6.4242)	Top-1 acc 1.172 (0.753)	Top-5 acc 3.906 (3.224)	lr 0.04950
Warmup Train [3][1780/3239]	Time 0.384 (0.510)	Data 0.001 (0.011)	Loss 6.4247 (6.4242)	Top-1 acc 0.781 (0.753)	Top-5 acc 3.125 (3.225)	lr 0.04950
Warmup Train [3][1790/3239]	Time 0.510 (0.510)	Data 0.001 (0.011)	Loss 6.3931 (6.4239)	Top-1 acc 1.172 (0.754)	Top-5 acc 4.297 (3.229)	lr 0.04950
Warmup Train [3][1800/3239]	Time 0.707 (0.510)	Data 0.001 (0.011)	Loss 6.4152 (6.4239)	Top-1 acc 0.781 (0.754)	Top-5 acc 2.734 (3.227)	lr 0.04950
Warmup Train [3][1810/3239]	Time 0.373 (0.510)	Data 0.001 (0.011)	Loss 6.3946 (6.4238)	Top-1 acc 0.781 (0.755)	Top-5 acc 5.859 (3.232)	lr 0.04950
Warmup Train [3][1820/3239]	Time 0.337 (0.510)	Data 0.001 (0.011)	Loss 6.3413 (6.4235)	Top-1 acc 0.781 (0.754)	Top-5 acc 2.344 (3.231)	lr 0.04950
Warmup Train [3][1830/3239]	Time 0.501 (0.510)	Data 0.001 (0.011)	Loss 6.3993 (6.4234)	Top-1 acc 0.391 (0.756)	Top-5 acc 4.297 (3.234)	lr 0.04949
Warmup Train [3][1840/3239]	Time 0.739 (0.511)	Data 0.001 (0.011)	Loss 6.4195 (6.4232)	Top-1 acc 1.562 (0.758)	Top-5 acc 3.125 (3.238)	lr 0.04949
Warmup Train [3][1850/3239]	Time 0.606 (0.511)	Data 0.001 (0.011)	Loss 6.3907 (6.4230)	Top-1 acc 1.953 (0.760)	Top-5 acc 5.078 (3.241)	lr 0.04949
Warmup Train [3][1860/3239]	Time 0.497 (0.511)	Data 0.001 (0.011)	Loss 6.3828 (6.4229)	Top-1 acc 0.000 (0.761)	Top-5 acc 2.734 (3.244)	lr 0.04949
Warmup Train [3][1870/3239]	Time 0.501 (0.511)	Data 0.001 (0.011)	Loss 6.3890 (6.4228)	Top-1 acc 0.391 (0.760)	Top-5 acc 3.125 (3.244)	lr 0.04949
Warmup Train [3][1880/3239]	Time 0.510 (0.511)	Data 0.002 (0.011)	Loss 6.4354 (6.4227)	Top-1 acc 0.781 (0.759)	Top-5 acc 2.344 (3.243)	lr 0.04949
Warmup Train [3][1890/3239]	Time 0.505 (0.511)	Data 0.001 (0.011)	Loss 6.4020 (6.4226)	Top-1 acc 1.562 (0.761)	Top-5 acc 2.344 (3.243)	lr 0.04949
Warmup Train [3][1900/3239]	Time 0.519 (0.511)	Data 0.001 (0.011)	Loss 6.3751 (6.4224)	Top-1 acc 0.391 (0.761)	Top-5 acc 2.734 (3.246)	lr 0.04949
Warmup Train [3][1910/3239]	Time 0.511 (0.511)	Data 0.001 (0.011)	Loss 6.4018 (6.4223)	Top-1 acc 0.000 (0.760)	Top-5 acc 3.125 (3.246)	lr 0.04948
Warmup Train [3][1920/3239]	Time 0.421 (0.511)	Data 0.001 (0.011)	Loss 6.4341 (6.4222)	Top-1 acc 0.781 (0.760)	Top-5 acc 2.734 (3.246)	lr 0.04948
Warmup Train [3][1930/3239]	Time 0.540 (0.511)	Data 0.001 (0.011)	Loss 6.4041 (6.4222)	Top-1 acc 1.172 (0.761)	Top-5 acc 2.734 (3.246)	lr 0.04948
Warmup Train [3][1940/3239]	Time 0.606 (0.511)	Data 0.001 (0.011)	Loss 6.3443 (6.4220)	Top-1 acc 0.781 (0.762)	Top-5 acc 4.297 (3.249)	lr 0.04948
Warmup Train [3][1950/3239]	Time 0.339 (0.511)	Data 0.001 (0.011)	Loss 6.4285 (6.4219)	Top-1 acc 0.781 (0.763)	Top-5 acc 1.562 (3.250)	lr 0.04948
Warmup Train [3][1960/3239]	Time 0.518 (0.511)	Data 0.001 (0.011)	Loss 6.3678 (6.4216)	Top-1 acc 1.172 (0.765)	Top-5 acc 4.297 (3.256)	lr 0.04948
Warmup Train [3][1970/3239]	Time 0.509 (0.511)	Data 0.001 (0.011)	Loss 6.3441 (6.4214)	Top-1 acc 0.781 (0.763)	Top-5 acc 3.516 (3.256)	lr 0.04948
Warmup Train [3][1980/3239]	Time 0.341 (0.511)	Data 0.001 (0.010)	Loss 6.4138 (6.4213)	Top-1 acc 0.781 (0.763)	Top-5 acc 2.344 (3.255)	lr 0.04948
Warmup Train [3][1990/3239]	Time 0.506 (0.511)	Data 0.001 (0.010)	Loss 6.3934 (6.4212)	Top-1 acc 0.391 (0.764)	Top-5 acc 3.906 (3.258)	lr 0.04947
Warmup Train [3][2000/3239]	Time 0.436 (0.511)	Data 0.001 (0.010)	Loss 6.4034 (6.4211)	Top-1 acc 0.391 (0.763)	Top-5 acc 3.125 (3.257)	lr 0.04947
Warmup Train [3][2010/3239]	Time 0.488 (0.510)	Data 0.001 (0.010)	Loss 6.4622 (6.4210)	Top-1 acc 0.391 (0.764)	Top-5 acc 1.953 (3.259)	lr 0.04947
Warmup Train [3][2020/3239]	Time 0.585 (0.511)	Data 0.001 (0.010)	Loss 6.3999 (6.4209)	Top-1 acc 0.391 (0.763)	Top-5 acc 4.297 (3.260)	lr 0.04947
Warmup Train [3][2030/3239]	Time 0.374 (0.510)	Data 0.001 (0.010)	Loss 6.3457 (6.4207)	Top-1 acc 0.781 (0.765)	Top-5 acc 1.172 (3.260)	lr 0.04947
Warmup Train [3][2040/3239]	Time 0.508 (0.510)	Data 0.001 (0.010)	Loss 6.3509 (6.4205)	Top-1 acc 0.781 (0.767)	Top-5 acc 5.469 (3.261)	lr 0.04947
Warmup Train [3][2050/3239]	Time 0.569 (0.510)	Data 0.001 (0.010)	Loss 6.4114 (6.4204)	Top-1 acc 0.391 (0.767)	Top-5 acc 2.344 (3.263)	lr 0.04947
Warmup Train [3][2060/3239]	Time 0.541 (0.510)	Data 0.001 (0.010)	Loss 6.4201 (6.4204)	Top-1 acc 0.391 (0.768)	Top-5 acc 1.953 (3.264)	lr 0.04947
Warmup Train [3][2070/3239]	Time 0.522 (0.510)	Data 0.001 (0.010)	Loss 6.3384 (6.4202)	Top-1 acc 1.172 (0.768)	Top-5 acc 2.734 (3.264)	lr 0.04946
Warmup Train [3][2080/3239]	Time 0.548 (0.510)	Data 0.001 (0.010)	Loss 6.3984 (6.4201)	Top-1 acc 0.391 (0.768)	Top-5 acc 3.906 (3.265)	lr 0.04946
Warmup Train [3][2090/3239]	Time 0.528 (0.510)	Data 0.001 (0.010)	Loss 6.4194 (6.4200)	Top-1 acc 0.000 (0.770)	Top-5 acc 2.734 (3.267)	lr 0.04946
Warmup Train [3][2100/3239]	Time 0.439 (0.510)	Data 0.001 (0.010)	Loss 6.4331 (6.4200)	Top-1 acc 0.391 (0.771)	Top-5 acc 2.734 (3.269)	lr 0.04946
Warmup Train [3][2110/3239]	Time 0.458 (0.510)	Data 0.001 (0.010)	Loss 6.3767 (6.4198)	Top-1 acc 1.172 (0.770)	Top-5 acc 6.250 (3.272)	lr 0.04946
Warmup Train [3][2120/3239]	Time 0.601 (0.511)	Data 0.002 (0.010)	Loss 6.3738 (6.4196)	Top-1 acc 2.344 (0.771)	Top-5 acc 4.297 (3.273)	lr 0.04946
Warmup Train [3][2130/3239]	Time 0.445 (0.510)	Data 0.001 (0.010)	Loss 6.4258 (6.4195)	Top-1 acc 0.000 (0.770)	Top-5 acc 4.688 (3.275)	lr 0.04946
Warmup Train [3][2140/3239]	Time 0.593 (0.511)	Data 0.001 (0.010)	Loss 6.3933 (6.4193)	Top-1 acc 0.000 (0.770)	Top-5 acc 5.078 (3.276)	lr 0.04946
Warmup Train [3][2150/3239]	Time 0.464 (0.511)	Data 0.001 (0.010)	Loss 6.3828 (6.4192)	Top-1 acc 0.000 (0.769)	Top-5 acc 3.516 (3.276)	lr 0.04945
Warmup Train [3][2160/3239]	Time 0.458 (0.511)	Data 0.001 (0.010)	Loss 6.3652 (6.4191)	Top-1 acc 0.391 (0.769)	Top-5 acc 1.953 (3.277)	lr 0.04945
Warmup Train [3][2170/3239]	Time 0.469 (0.510)	Data 0.001 (0.010)	Loss 6.3368 (6.4189)	Top-1 acc 0.391 (0.771)	Top-5 acc 4.297 (3.281)	lr 0.04945
Warmup Train [3][2180/3239]	Time 0.489 (0.511)	Data 0.001 (0.010)	Loss 6.3669 (6.4188)	Top-1 acc 1.172 (0.772)	Top-5 acc 3.125 (3.281)	lr 0.04945
Warmup Train [3][2190/3239]	Time 0.528 (0.511)	Data 0.001 (0.010)	Loss 6.4129 (6.4187)	Top-1 acc 0.781 (0.771)	Top-5 acc 1.953 (3.280)	lr 0.04945
Warmup Train [3][2200/3239]	Time 0.472 (0.511)	Data 0.001 (0.010)	Loss 6.3574 (6.4185)	Top-1 acc 0.000 (0.772)	Top-5 acc 3.516 (3.280)	lr 0.04945
Warmup Train [3][2210/3239]	Time 0.479 (0.511)	Data 0.001 (0.010)	Loss 6.3985 (6.4184)	Top-1 acc 0.781 (0.772)	Top-5 acc 3.906 (3.281)	lr 0.04945
Warmup Train [3][2220/3239]	Time 0.495 (0.511)	Data 0.001 (0.010)	Loss 6.3967 (6.4182)	Top-1 acc 1.172 (0.773)	Top-5 acc 4.688 (3.285)	lr 0.04945
Warmup Train [3][2230/3239]	Time 0.651 (0.511)	Data 0.001 (0.010)	Loss 6.3626 (6.4180)	Top-1 acc 1.172 (0.775)	Top-5 acc 2.734 (3.288)	lr 0.04944
Warmup Train [3][2240/3239]	Time 0.547 (0.511)	Data 0.001 (0.010)	Loss 6.3493 (6.4179)	Top-1 acc 0.781 (0.776)	Top-5 acc 5.469 (3.291)	lr 0.04944
Warmup Train [3][2250/3239]	Time 0.545 (0.511)	Data 0.001 (0.010)	Loss 6.3823 (6.4177)	Top-1 acc 1.172 (0.778)	Top-5 acc 5.469 (3.295)	lr 0.04944
Warmup Train [3][2260/3239]	Time 0.533 (0.511)	Data 0.001 (0.010)	Loss 6.3339 (6.4177)	Top-1 acc 0.781 (0.778)	Top-5 acc 3.516 (3.296)	lr 0.04944
Warmup Train [3][2270/3239]	Time 0.568 (0.510)	Data 0.002 (0.010)	Loss 6.3858 (6.4176)	Top-1 acc 0.781 (0.780)	Top-5 acc 4.688 (3.300)	lr 0.04944
Warmup Train [3][2280/3239]	Time 0.499 (0.510)	Data 0.001 (0.010)	Loss 6.3030 (6.4173)	Top-1 acc 0.781 (0.780)	Top-5 acc 4.297 (3.302)	lr 0.04944
Warmup Train [3][2290/3239]	Time 0.493 (0.510)	Data 0.001 (0.010)	Loss 6.4014 (6.4171)	Top-1 acc 1.172 (0.780)	Top-5 acc 3.125 (3.302)	lr 0.04944
Warmup Train [3][2300/3239]	Time 0.521 (0.510)	Data 0.001 (0.010)	Loss 6.3670 (6.4169)	Top-1 acc 1.172 (0.779)	Top-5 acc 5.078 (3.304)	lr 0.04944
Warmup Train [3][2310/3239]	Time 0.594 (0.511)	Data 0.001 (0.010)	Loss 6.4034 (6.4168)	Top-1 acc 1.562 (0.779)	Top-5 acc 3.125 (3.306)	lr 0.04943
Warmup Train [3][2320/3239]	Time 0.618 (0.511)	Data 0.001 (0.010)	Loss 6.3946 (6.4167)	Top-1 acc 1.172 (0.779)	Top-5 acc 3.125 (3.305)	lr 0.04943
Warmup Train [3][2330/3239]	Time 0.677 (0.511)	Data 0.001 (0.010)	Loss 6.3883 (6.4167)	Top-1 acc 0.781 (0.779)	Top-5 acc 3.516 (3.303)	lr 0.04943
Warmup Train [3][2340/3239]	Time 0.550 (0.511)	Data 0.001 (0.010)	Loss 6.3868 (6.4165)	Top-1 acc 0.000 (0.780)	Top-5 acc 4.297 (3.307)	lr 0.04943
Warmup Train [3][2350/3239]	Time 0.532 (0.511)	Data 0.001 (0.010)	Loss 6.4004 (6.4163)	Top-1 acc 1.562 (0.782)	Top-5 acc 6.250 (3.311)	lr 0.04943
Warmup Train [3][2360/3239]	Time 0.382 (0.511)	Data 0.001 (0.010)	Loss 6.3829 (6.4162)	Top-1 acc 0.781 (0.780)	Top-5 acc 5.078 (3.310)	lr 0.04943
Warmup Train [3][2370/3239]	Time 0.418 (0.511)	Data 0.002 (0.010)	Loss 6.3726 (6.4161)	Top-1 acc 1.562 (0.781)	Top-5 acc 5.078 (3.312)	lr 0.04943
Warmup Train [3][2380/3239]	Time 0.549 (0.511)	Data 0.001 (0.010)	Loss 6.3032 (6.4159)	Top-1 acc 1.562 (0.782)	Top-5 acc 3.516 (3.314)	lr 0.04943
Warmup Train [3][2390/3239]	Time 0.494 (0.511)	Data 0.001 (0.010)	Loss 6.3223 (6.4157)	Top-1 acc 1.953 (0.783)	Top-5 acc 3.516 (3.316)	lr 0.04942
Warmup Train [3][2400/3239]	Time 0.592 (0.511)	Data 0.001 (0.010)	Loss 6.3042 (6.4154)	Top-1 acc 1.562 (0.785)	Top-5 acc 5.078 (3.320)	lr 0.04942
Warmup Train [3][2410/3239]	Time 0.478 (0.511)	Data 0.001 (0.010)	Loss 6.4082 (6.4153)	Top-1 acc 0.781 (0.785)	Top-5 acc 3.906 (3.322)	lr 0.04942
Warmup Train [3][2420/3239]	Time 0.495 (0.511)	Data 0.001 (0.010)	Loss 6.3291 (6.4152)	Top-1 acc 1.172 (0.785)	Top-5 acc 4.688 (3.322)	lr 0.04942
Warmup Train [3][2430/3239]	Time 0.425 (0.511)	Data 0.001 (0.010)	Loss 6.3673 (6.4150)	Top-1 acc 0.781 (0.785)	Top-5 acc 2.734 (3.324)	lr 0.04942
Warmup Train [3][2440/3239]	Time 0.562 (0.511)	Data 0.001 (0.010)	Loss 6.4221 (6.4148)	Top-1 acc 0.000 (0.785)	Top-5 acc 2.344 (3.326)	lr 0.04942
Warmup Train [3][2450/3239]	Time 0.453 (0.511)	Data 0.001 (0.010)	Loss 6.3966 (6.4147)	Top-1 acc 1.562 (0.786)	Top-5 acc 3.516 (3.328)	lr 0.04942
Warmup Train [3][2460/3239]	Time 0.459 (0.511)	Data 0.001 (0.010)	Loss 6.3582 (6.4145)	Top-1 acc 1.953 (0.787)	Top-5 acc 3.906 (3.329)	lr 0.04942
Warmup Train [3][2470/3239]	Time 0.522 (0.511)	Data 0.001 (0.010)	Loss 6.3156 (6.4144)	Top-1 acc 2.734 (0.788)	Top-5 acc 3.516 (3.330)	lr 0.04941
Warmup Train [3][2480/3239]	Time 0.495 (0.511)	Data 0.001 (0.010)	Loss 6.3604 (6.4141)	Top-1 acc 0.781 (0.789)	Top-5 acc 4.688 (3.336)	lr 0.04941
Warmup Train [3][2490/3239]	Time 0.333 (0.511)	Data 0.001 (0.010)	Loss 6.3714 (6.4139)	Top-1 acc 1.172 (0.789)	Top-5 acc 3.906 (3.338)	lr 0.04941
Warmup Train [3][2500/3239]	Time 0.375 (0.511)	Data 0.001 (0.010)	Loss 6.3316 (6.4137)	Top-1 acc 1.562 (0.789)	Top-5 acc 4.688 (3.340)	lr 0.04941
Warmup Train [3][2510/3239]	Time 0.403 (0.511)	Data 0.001 (0.010)	Loss 6.4031 (6.4136)	Top-1 acc 0.391 (0.789)	Top-5 acc 3.125 (3.344)	lr 0.04941
Warmup Train [3][2520/3239]	Time 0.214 (0.510)	Data 0.002 (0.010)	Loss 6.3297 (6.4134)	Top-1 acc 0.781 (0.788)	Top-5 acc 4.297 (3.343)	lr 0.04941
Warmup Train [3][2530/3239]	Time 0.581 (0.510)	Data 0.001 (0.010)	Loss 6.3725 (6.4131)	Top-1 acc 0.781 (0.788)	Top-5 acc 5.469 (3.346)	lr 0.04941
Warmup Train [3][2540/3239]	Time 0.566 (0.510)	Data 0.001 (0.010)	Loss 6.2782 (6.4130)	Top-1 acc 0.391 (0.788)	Top-5 acc 4.297 (3.347)	lr 0.04940
Warmup Train [3][2550/3239]	Time 0.479 (0.510)	Data 0.001 (0.010)	Loss 6.4028 (6.4128)	Top-1 acc 1.953 (0.789)	Top-5 acc 4.688 (3.349)	lr 0.04940
Warmup Train [3][2560/3239]	Time 0.549 (0.510)	Data 0.001 (0.010)	Loss 6.3413 (6.4127)	Top-1 acc 0.391 (0.789)	Top-5 acc 3.125 (3.349)	lr 0.04940
Warmup Train [3][2570/3239]	Time 0.517 (0.510)	Data 0.001 (0.010)	Loss 6.3392 (6.4125)	Top-1 acc 1.562 (0.790)	Top-5 acc 3.125 (3.353)	lr 0.04940
Warmup Train [3][2580/3239]	Time 0.261 (0.510)	Data 0.001 (0.010)	Loss 6.3104 (6.4123)	Top-1 acc 1.562 (0.790)	Top-5 acc 3.516 (3.351)	lr 0.04940
Warmup Train [3][2590/3239]	Time 0.620 (0.511)	Data 0.001 (0.010)	Loss 6.4101 (6.4122)	Top-1 acc 0.391 (0.790)	Top-5 acc 3.125 (3.353)	lr 0.04940
Warmup Train [3][2600/3239]	Time 0.655 (0.511)	Data 0.001 (0.009)	Loss 6.4333 (6.4120)	Top-1 acc 0.781 (0.791)	Top-5 acc 3.516 (3.354)	lr 0.04940
Warmup Train [3][2610/3239]	Time 0.593 (0.511)	Data 0.001 (0.009)	Loss 6.3613 (6.4118)	Top-1 acc 1.172 (0.792)	Top-5 acc 3.125 (3.356)	lr 0.04940
Warmup Train [3][2620/3239]	Time 0.630 (0.511)	Data 0.001 (0.009)	Loss 6.3857 (6.4116)	Top-1 acc 0.781 (0.793)	Top-5 acc 2.734 (3.357)	lr 0.04939
Warmup Train [3][2630/3239]	Time 0.550 (0.511)	Data 0.001 (0.009)	Loss 6.4213 (6.4114)	Top-1 acc 1.172 (0.793)	Top-5 acc 3.516 (3.359)	lr 0.04939
Warmup Train [3][2640/3239]	Time 0.726 (0.510)	Data 0.001 (0.009)	Loss 6.3293 (6.4113)	Top-1 acc 1.953 (0.794)	Top-5 acc 5.469 (3.361)	lr 0.04939
Warmup Train [3][2650/3239]	Time 0.584 (0.510)	Data 0.001 (0.009)	Loss 6.3496 (6.4110)	Top-1 acc 0.000 (0.795)	Top-5 acc 3.125 (3.366)	lr 0.04939
Warmup Train [3][2660/3239]	Time 0.386 (0.510)	Data 0.001 (0.009)	Loss 6.3217 (6.4109)	Top-1 acc 0.391 (0.794)	Top-5 acc 1.953 (3.368)	lr 0.04939
Warmup Train [3][2670/3239]	Time 0.584 (0.511)	Data 0.001 (0.009)	Loss 6.3915 (6.4107)	Top-1 acc 0.781 (0.796)	Top-5 acc 4.297 (3.369)	lr 0.04939
Warmup Train [3][2680/3239]	Time 0.490 (0.511)	Data 0.001 (0.009)	Loss 6.2878 (6.4104)	Top-1 acc 2.344 (0.796)	Top-5 acc 5.469 (3.371)	lr 0.04939
Warmup Train [3][2690/3239]	Time 0.282 (0.510)	Data 0.001 (0.009)	Loss 6.3911 (6.4103)	Top-1 acc 1.172 (0.797)	Top-5 acc 4.688 (3.372)	lr 0.04938
Warmup Train [3][2700/3239]	Time 0.573 (0.511)	Data 0.001 (0.009)	Loss 6.3963 (6.4102)	Top-1 acc 0.391 (0.797)	Top-5 acc 3.516 (3.374)	lr 0.04938
Warmup Train [3][2710/3239]	Time 0.369 (0.511)	Data 0.001 (0.009)	Loss 6.4157 (6.4101)	Top-1 acc 0.391 (0.798)	Top-5 acc 3.125 (3.375)	lr 0.04938
Warmup Train [3][2720/3239]	Time 0.546 (0.511)	Data 0.001 (0.009)	Loss 6.3347 (6.4099)	Top-1 acc 0.391 (0.798)	Top-5 acc 3.516 (3.378)	lr 0.04938
Warmup Train [3][2730/3239]	Time 0.476 (0.511)	Data 0.001 (0.009)	Loss 6.3895 (6.4097)	Top-1 acc 0.391 (0.799)	Top-5 acc 3.906 (3.381)	lr 0.04938
Warmup Train [3][2740/3239]	Time 0.350 (0.510)	Data 0.001 (0.009)	Loss 6.4058 (6.4096)	Top-1 acc 0.391 (0.800)	Top-5 acc 3.125 (3.384)	lr 0.04938
Warmup Train [3][2750/3239]	Time 0.591 (0.510)	Data 0.001 (0.009)	Loss 6.3214 (6.4093)	Top-1 acc 0.781 (0.800)	Top-5 acc 3.516 (3.388)	lr 0.04938
Warmup Train [3][2760/3239]	Time 0.473 (0.510)	Data 0.001 (0.009)	Loss 6.3485 (6.4090)	Top-1 acc 0.781 (0.802)	Top-5 acc 3.125 (3.393)	lr 0.04938
Warmup Train [3][2770/3239]	Time 0.587 (0.510)	Data 0.001 (0.009)	Loss 6.4579 (6.4089)	Top-1 acc 0.391 (0.803)	Top-5 acc 1.953 (3.394)	lr 0.04937
Warmup Train [3][2780/3239]	Time 0.263 (0.510)	Data 0.001 (0.009)	Loss 6.3632 (6.4088)	Top-1 acc 0.781 (0.803)	Top-5 acc 2.734 (3.397)	lr 0.04937
Warmup Train [3][2790/3239]	Time 0.522 (0.510)	Data 0.001 (0.009)	Loss 6.3840 (6.4086)	Top-1 acc 1.172 (0.804)	Top-5 acc 3.125 (3.398)	lr 0.04937
Warmup Train [3][2800/3239]	Time 0.528 (0.510)	Data 0.001 (0.009)	Loss 6.3550 (6.4084)	Top-1 acc 1.172 (0.805)	Top-5 acc 3.125 (3.401)	lr 0.04937
Warmup Train [3][2810/3239]	Time 0.542 (0.510)	Data 0.001 (0.009)	Loss 6.3598 (6.4083)	Top-1 acc 0.781 (0.805)	Top-5 acc 3.906 (3.401)	lr 0.04937
Warmup Train [3][2820/3239]	Time 0.493 (0.510)	Data 0.001 (0.009)	Loss 6.4049 (6.4082)	Top-1 acc 0.000 (0.806)	Top-5 acc 2.344 (3.402)	lr 0.04937
Warmup Train [3][2830/3239]	Time 0.517 (0.510)	Data 0.001 (0.009)	Loss 6.3809 (6.4080)	Top-1 acc 1.172 (0.806)	Top-5 acc 5.859 (3.403)	lr 0.04937
Warmup Train [3][2840/3239]	Time 0.542 (0.510)	Data 0.001 (0.009)	Loss 6.3125 (6.4077)	Top-1 acc 1.953 (0.807)	Top-5 acc 4.688 (3.407)	lr 0.04936
Warmup Train [3][2850/3239]	Time 0.639 (0.510)	Data 0.001 (0.009)	Loss 6.3113 (6.4077)	Top-1 acc 0.781 (0.806)	Top-5 acc 4.688 (3.407)	lr 0.04936
Warmup Train [3][2860/3239]	Time 0.521 (0.510)	Data 0.001 (0.009)	Loss 6.3693 (6.4075)	Top-1 acc 0.000 (0.807)	Top-5 acc 2.344 (3.410)	lr 0.04936
Warmup Train [3][2870/3239]	Time 0.524 (0.510)	Data 0.001 (0.009)	Loss 6.3515 (6.4073)	Top-1 acc 0.781 (0.807)	Top-5 acc 3.516 (3.412)	lr 0.04936
Warmup Train [3][2880/3239]	Time 0.497 (0.510)	Data 0.001 (0.009)	Loss 6.3631 (6.4071)	Top-1 acc 0.781 (0.808)	Top-5 acc 3.906 (3.415)	lr 0.04936
Warmup Train [3][2890/3239]	Time 0.509 (0.510)	Data 0.001 (0.009)	Loss 6.4227 (6.4069)	Top-1 acc 1.172 (0.810)	Top-5 acc 5.859 (3.421)	lr 0.04936
Warmup Train [3][2900/3239]	Time 0.501 (0.510)	Data 0.001 (0.009)	Loss 6.3612 (6.4067)	Top-1 acc 0.000 (0.810)	Top-5 acc 2.344 (3.423)	lr 0.04936
Warmup Train [3][2910/3239]	Time 0.584 (0.510)	Data 0.001 (0.009)	Loss 6.3891 (6.4065)	Top-1 acc 1.172 (0.811)	Top-5 acc 3.125 (3.425)	lr 0.04936
Warmup Train [3][2920/3239]	Time 0.463 (0.510)	Data 0.001 (0.009)	Loss 6.2363 (6.4064)	Top-1 acc 1.562 (0.810)	Top-5 acc 2.734 (3.423)	lr 0.04935
Warmup Train [3][2930/3239]	Time 0.624 (0.510)	Data 0.001 (0.009)	Loss 6.2771 (6.4061)	Top-1 acc 1.172 (0.810)	Top-5 acc 5.078 (3.424)	lr 0.04935
Warmup Train [3][2940/3239]	Time 0.283 (0.510)	Data 0.001 (0.009)	Loss 6.3986 (6.4060)	Top-1 acc 1.953 (0.810)	Top-5 acc 3.906 (3.425)	lr 0.04935
Warmup Train [3][2950/3239]	Time 0.527 (0.510)	Data 0.001 (0.009)	Loss 6.3859 (6.4059)	Top-1 acc 0.391 (0.810)	Top-5 acc 2.734 (3.426)	lr 0.04935
Warmup Train [3][2960/3239]	Time 0.582 (0.510)	Data 0.001 (0.009)	Loss 6.3785 (6.4057)	Top-1 acc 0.781 (0.811)	Top-5 acc 4.688 (3.430)	lr 0.04935
Warmup Train [3][2970/3239]	Time 0.485 (0.510)	Data 0.002 (0.009)	Loss 6.3485 (6.4056)	Top-1 acc 1.172 (0.811)	Top-5 acc 5.078 (3.430)	lr 0.04935
Warmup Train [3][2980/3239]	Time 0.374 (0.510)	Data 0.001 (0.009)	Loss 6.4099 (6.4055)	Top-1 acc 0.781 (0.812)	Top-5 acc 2.734 (3.433)	lr 0.04935
Warmup Train [3][2990/3239]	Time 0.458 (0.510)	Data 0.001 (0.009)	Loss 6.4079 (6.4053)	Top-1 acc 0.391 (0.812)	Top-5 acc 1.953 (3.435)	lr 0.04934
Warmup Train [3][3000/3239]	Time 0.474 (0.510)	Data 0.001 (0.009)	Loss 6.2598 (6.4051)	Top-1 acc 0.781 (0.814)	Top-5 acc 4.297 (3.438)	lr 0.04934
Warmup Train [3][3010/3239]	Time 0.521 (0.510)	Data 0.001 (0.009)	Loss 6.3233 (6.4049)	Top-1 acc 0.781 (0.813)	Top-5 acc 6.250 (3.440)	lr 0.04934
Warmup Train [3][3020/3239]	Time 0.497 (0.510)	Data 0.001 (0.009)	Loss 6.3561 (6.4047)	Top-1 acc 1.172 (0.814)	Top-5 acc 3.516 (3.441)	lr 0.04934
Warmup Train [3][3030/3239]	Time 0.469 (0.510)	Data 0.001 (0.009)	Loss 6.3926 (6.4046)	Top-1 acc 0.391 (0.815)	Top-5 acc 2.344 (3.441)	lr 0.04934
Warmup Train [3][3040/3239]	Time 0.455 (0.510)	Data 0.001 (0.009)	Loss 6.3706 (6.4047)	Top-1 acc 0.391 (0.815)	Top-5 acc 3.125 (3.441)	lr 0.04934
Warmup Train [3][3050/3239]	Time 0.452 (0.510)	Data 0.001 (0.009)	Loss 6.3230 (6.4045)	Top-1 acc 2.344 (0.816)	Top-5 acc 5.469 (3.444)	lr 0.04934
Warmup Train [3][3060/3239]	Time 0.644 (0.510)	Data 0.001 (0.009)	Loss 6.4357 (6.4044)	Top-1 acc 2.344 (0.816)	Top-5 acc 4.297 (3.445)	lr 0.04933
Warmup Train [3][3070/3239]	Time 0.368 (0.510)	Data 0.001 (0.009)	Loss 6.3357 (6.4042)	Top-1 acc 0.391 (0.817)	Top-5 acc 2.734 (3.448)	lr 0.04933
Warmup Train [3][3080/3239]	Time 0.528 (0.510)	Data 0.001 (0.009)	Loss 6.3254 (6.4040)	Top-1 acc 1.172 (0.818)	Top-5 acc 5.078 (3.452)	lr 0.04933
Warmup Train [3][3090/3239]	Time 0.385 (0.509)	Data 0.001 (0.009)	Loss 6.3245 (6.4038)	Top-1 acc 1.172 (0.819)	Top-5 acc 3.906 (3.452)	lr 0.04933
Warmup Train [3][3100/3239]	Time 0.567 (0.510)	Data 0.001 (0.009)	Loss 6.3798 (6.4036)	Top-1 acc 1.172 (0.820)	Top-5 acc 4.688 (3.453)	lr 0.04933
Warmup Train [3][3110/3239]	Time 0.435 (0.510)	Data 0.001 (0.009)	Loss 6.4116 (6.4035)	Top-1 acc 0.391 (0.820)	Top-5 acc 3.125 (3.455)	lr 0.04933
Warmup Train [3][3120/3239]	Time 0.578 (0.510)	Data 0.001 (0.009)	Loss 6.4100 (6.4033)	Top-1 acc 0.391 (0.820)	Top-5 acc 3.125 (3.458)	lr 0.04933
Warmup Train [3][3130/3239]	Time 0.648 (0.510)	Data 0.002 (0.009)	Loss 6.3176 (6.4031)	Top-1 acc 1.172 (0.821)	Top-5 acc 4.688 (3.461)	lr 0.04932
Warmup Train [3][3140/3239]	Time 0.472 (0.510)	Data 0.001 (0.009)	Loss 6.3465 (6.4030)	Top-1 acc 1.172 (0.821)	Top-5 acc 2.734 (3.463)	lr 0.04932
Warmup Train [3][3150/3239]	Time 0.522 (0.510)	Data 0.001 (0.009)	Loss 6.3119 (6.4028)	Top-1 acc 0.391 (0.822)	Top-5 acc 4.688 (3.464)	lr 0.04932
Warmup Train [3][3160/3239]	Time 0.578 (0.510)	Data 0.001 (0.009)	Loss 6.3991 (6.4027)	Top-1 acc 0.391 (0.821)	Top-5 acc 2.734 (3.466)	lr 0.04932
Warmup Train [3][3170/3239]	Time 0.627 (0.510)	Data 0.001 (0.009)	Loss 6.4146 (6.4026)	Top-1 acc 1.953 (0.822)	Top-5 acc 6.250 (3.467)	lr 0.04932
Warmup Train [3][3180/3239]	Time 0.453 (0.510)	Data 0.000 (0.009)	Loss 6.3323 (6.4024)	Top-1 acc 1.172 (0.823)	Top-5 acc 4.297 (3.469)	lr 0.04932
Warmup Train [3][3190/3239]	Time 0.523 (0.510)	Data 0.000 (0.009)	Loss 6.3514 (6.4023)	Top-1 acc 0.000 (0.823)	Top-5 acc 2.344 (3.469)	lr 0.04932
Warmup Train [3][3200/3239]	Time 0.574 (0.510)	Data 0.000 (0.009)	Loss 6.3355 (6.4021)	Top-1 acc 1.562 (0.825)	Top-5 acc 3.516 (3.473)	lr 0.04931
Warmup Train [3][3210/3239]	Time 0.373 (0.510)	Data 0.000 (0.009)	Loss 6.3082 (6.4019)	Top-1 acc 1.172 (0.826)	Top-5 acc 5.859 (3.476)	lr 0.04931
Warmup Train [3][3220/3239]	Time 0.508 (0.509)	Data 0.000 (0.009)	Loss 6.2544 (6.4017)	Top-1 acc 3.125 (0.827)	Top-5 acc 6.250 (3.479)	lr 0.04931
Warmup Train [3][3230/3239]	Time 0.543 (0.509)	Data 0.000 (0.009)	Loss 6.3707 (6.4015)	Top-1 acc 0.000 (0.828)	Top-5 acc 1.562 (3.480)	lr 0.04931
Warmup Train [3][3239/3239]	Time 0.437 (0.509)	Data 0.000 (0.009)	Loss 6.3398 (6.4014)	Top-1 acc 0.000 (0.828)	Top-5 acc 3.704 (3.480)	lr 0.04931
==========Warmup Valid [3/40]	loss 6.131	top-1 acc 1.184	top-5 acc 4.950	Train top-1 0.828	top-5 3.480	flops: 442.4M
Warmup Train [4][0/3239]	Time 8.218 (8.218)	Data 7.546 (7.546)	Loss 6.3693 (6.3693)	Top-1 acc 0.781 (0.781)	Top-5 acc 4.688 (4.688)	lr 0.04931
Warmup Train [4][10/3239]	Time 0.364 (1.289)	Data 0.001 (0.700)	Loss 6.2973 (6.3271)	Top-1 acc 1.953 (1.030)	Top-5 acc 5.469 (4.332)	lr 0.04931
Warmup Train [4][20/3239]	Time 0.330 (0.914)	Data 0.001 (0.372)	Loss 6.3641 (6.3329)	Top-1 acc 0.000 (0.911)	Top-5 acc 3.125 (4.297)	lr 0.04931
Warmup Train [4][30/3239]	Time 0.584 (0.786)	Data 0.001 (0.257)	Loss 6.3362 (6.3380)	Top-1 acc 2.344 (0.958)	Top-5 acc 5.078 (4.272)	lr 0.04930
Warmup Train [4][40/3239]	Time 0.505 (0.720)	Data 0.001 (0.194)	Loss 6.2331 (6.3422)	Top-1 acc 1.172 (0.857)	Top-5 acc 5.859 (4.154)	lr 0.04930
Warmup Train [4][50/3239]	Time 0.358 (0.676)	Data 0.002 (0.157)	Loss 6.3132 (6.3429)	Top-1 acc 0.000 (0.835)	Top-5 acc 3.906 (4.098)	lr 0.04930
Warmup Train [4][60/3239]	Time 0.513 (0.657)	Data 0.002 (0.134)	Loss 6.3489 (6.3409)	Top-1 acc 0.781 (0.884)	Top-5 acc 3.906 (4.118)	lr 0.04930
Warmup Train [4][70/3239]	Time 0.531 (0.636)	Data 0.001 (0.115)	Loss 6.3989 (6.3425)	Top-1 acc 0.000 (0.869)	Top-5 acc 2.734 (4.055)	lr 0.04930
Warmup Train [4][80/3239]	Time 0.569 (0.624)	Data 0.001 (0.101)	Loss 6.3232 (6.3406)	Top-1 acc 0.781 (0.883)	Top-5 acc 4.688 (4.114)	lr 0.04930
Warmup Train [4][90/3239]	Time 0.543 (0.609)	Data 0.001 (0.091)	Loss 6.3760 (6.3414)	Top-1 acc 0.781 (0.859)	Top-5 acc 2.734 (4.065)	lr 0.04930
Warmup Train [4][100/3239]	Time 0.572 (0.600)	Data 0.001 (0.082)	Loss 6.3610 (6.3416)	Top-1 acc 0.391 (0.847)	Top-5 acc 3.516 (4.080)	lr 0.04930
Warmup Train [4][110/3239]	Time 0.593 (0.593)	Data 0.001 (0.075)	Loss 6.3120 (6.3426)	Top-1 acc 1.172 (0.866)	Top-5 acc 3.906 (4.082)	lr 0.04929
Warmup Train [4][120/3239]	Time 0.632 (0.587)	Data 0.001 (0.069)	Loss 6.3684 (6.3415)	Top-1 acc 0.000 (0.852)	Top-5 acc 1.953 (4.026)	lr 0.04929
Warmup Train [4][130/3239]	Time 0.517 (0.582)	Data 0.001 (0.064)	Loss 6.3479 (6.3422)	Top-1 acc 0.391 (0.847)	Top-5 acc 1.953 (3.978)	lr 0.04929
Warmup Train [4][140/3239]	Time 0.384 (0.573)	Data 0.001 (0.059)	Loss 6.3645 (6.3428)	Top-1 acc 0.781 (0.878)	Top-5 acc 5.078 (3.995)	lr 0.04929
Warmup Train [4][150/3239]	Time 0.597 (0.570)	Data 0.001 (0.056)	Loss 6.3205 (6.3415)	Top-1 acc 2.344 (0.926)	Top-5 acc 5.078 (4.010)	lr 0.04929
Warmup Train [4][160/3239]	Time 0.488 (0.564)	Data 0.001 (0.053)	Loss 6.3133 (6.3410)	Top-1 acc 0.391 (0.920)	Top-5 acc 3.906 (4.006)	lr 0.04929
Warmup Train [4][170/3239]	Time 0.518 (0.561)	Data 0.001 (0.050)	Loss 6.2624 (6.3395)	Top-1 acc 0.781 (0.930)	Top-5 acc 4.297 (4.014)	lr 0.04928
Warmup Train [4][180/3239]	Time 0.603 (0.556)	Data 0.001 (0.048)	Loss 6.3715 (6.3385)	Top-1 acc 1.953 (0.937)	Top-5 acc 3.516 (4.031)	lr 0.04928
Warmup Train [4][190/3239]	Time 0.595 (0.554)	Data 0.001 (0.046)	Loss 6.3242 (6.3387)	Top-1 acc 1.172 (0.945)	Top-5 acc 4.297 (4.023)	lr 0.04928
Warmup Train [4][200/3239]	Time 0.614 (0.552)	Data 0.001 (0.043)	Loss 6.4031 (6.3399)	Top-1 acc 0.781 (0.948)	Top-5 acc 1.953 (4.023)	lr 0.04928
Warmup Train [4][210/3239]	Time 0.695 (0.551)	Data 0.001 (0.042)	Loss 6.2987 (6.3397)	Top-1 acc 3.516 (0.972)	Top-5 acc 7.422 (4.028)	lr 0.04928
Warmup Train [4][220/3239]	Time 0.503 (0.549)	Data 0.001 (0.040)	Loss 6.2476 (6.3398)	Top-1 acc 1.562 (0.981)	Top-5 acc 6.250 (4.023)	lr 0.04928
Warmup Train [4][230/3239]	Time 0.488 (0.548)	Data 0.002 (0.038)	Loss 6.3316 (6.3400)	Top-1 acc 0.391 (0.974)	Top-5 acc 3.516 (4.025)	lr 0.04928
Warmup Train [4][240/3239]	Time 0.552 (0.546)	Data 0.001 (0.037)	Loss 6.3559 (6.3396)	Top-1 acc 1.953 (0.974)	Top-5 acc 6.250 (4.026)	lr 0.04927
Warmup Train [4][250/3239]	Time 0.421 (0.544)	Data 0.001 (0.036)	Loss 6.3480 (6.3395)	Top-1 acc 0.391 (0.965)	Top-5 acc 2.734 (4.021)	lr 0.04927
Warmup Train [4][260/3239]	Time 0.592 (0.543)	Data 0.001 (0.035)	Loss 6.3502 (6.3397)	Top-1 acc 1.172 (0.970)	Top-5 acc 3.516 (4.033)	lr 0.04927
Warmup Train [4][270/3239]	Time 0.576 (0.543)	Data 0.001 (0.033)	Loss 6.3751 (6.3398)	Top-1 acc 0.781 (0.973)	Top-5 acc 3.516 (4.039)	lr 0.04927
Warmup Train [4][280/3239]	Time 0.497 (0.542)	Data 0.001 (0.032)	Loss 6.3223 (6.3391)	Top-1 acc 1.172 (0.986)	Top-5 acc 6.250 (4.062)	lr 0.04927
Warmup Train [4][290/3239]	Time 0.662 (0.542)	Data 0.002 (0.032)	Loss 6.3172 (6.3390)	Top-1 acc 1.172 (0.991)	Top-5 acc 3.906 (4.085)	lr 0.04927
Warmup Train [4][300/3239]	Time 0.395 (0.541)	Data 0.001 (0.031)	Loss 6.2908 (6.3387)	Top-1 acc 0.781 (0.982)	Top-5 acc 3.516 (4.083)	lr 0.04927
Warmup Train [4][310/3239]	Time 0.564 (0.541)	Data 0.001 (0.030)	Loss 6.3801 (6.3383)	Top-1 acc 1.562 (0.991)	Top-5 acc 2.344 (4.098)	lr 0.04926
Warmup Train [4][320/3239]	Time 0.677 (0.540)	Data 0.001 (0.029)	Loss 6.3629 (6.3385)	Top-1 acc 0.391 (0.995)	Top-5 acc 2.344 (4.102)	lr 0.04926
Warmup Train [4][330/3239]	Time 0.498 (0.539)	Data 0.001 (0.028)	Loss 6.2929 (6.3386)	Top-1 acc 0.781 (0.997)	Top-5 acc 2.734 (4.105)	lr 0.04926
Warmup Train [4][340/3239]	Time 0.692 (0.538)	Data 0.001 (0.028)	Loss 6.3523 (6.3379)	Top-1 acc 0.000 (0.989)	Top-5 acc 2.344 (4.092)	lr 0.04926
Warmup Train [4][350/3239]	Time 0.598 (0.537)	Data 0.001 (0.027)	Loss 6.3808 (6.3387)	Top-1 acc 0.781 (0.987)	Top-5 acc 3.125 (4.080)	lr 0.04926
Warmup Train [4][360/3239]	Time 0.421 (0.536)	Data 0.001 (0.026)	Loss 6.3557 (6.3386)	Top-1 acc 0.391 (0.983)	Top-5 acc 3.906 (4.075)	lr 0.04926
Warmup Train [4][370/3239]	Time 0.569 (0.536)	Data 0.001 (0.026)	Loss 6.3526 (6.3385)	Top-1 acc 0.391 (0.974)	Top-5 acc 2.734 (4.063)	lr 0.04926
Warmup Train [4][380/3239]	Time 0.467 (0.535)	Data 0.001 (0.025)	Loss 6.3509 (6.3384)	Top-1 acc 0.000 (0.969)	Top-5 acc 1.953 (4.052)	lr 0.04925
Warmup Train [4][390/3239]	Time 0.293 (0.534)	Data 0.001 (0.025)	Loss 6.3349 (6.3387)	Top-1 acc 1.562 (0.962)	Top-5 acc 5.859 (4.048)	lr 0.04925
Warmup Train [4][400/3239]	Time 0.568 (0.533)	Data 0.001 (0.025)	Loss 6.3745 (6.3387)	Top-1 acc 1.172 (0.966)	Top-5 acc 2.344 (4.038)	lr 0.04925
Warmup Train [4][410/3239]	Time 0.355 (0.532)	Data 0.001 (0.024)	Loss 6.3382 (6.3383)	Top-1 acc 0.391 (0.962)	Top-5 acc 3.125 (4.036)	lr 0.04925
Warmup Train [4][420/3239]	Time 0.492 (0.531)	Data 0.001 (0.024)	Loss 6.3157 (6.3380)	Top-1 acc 0.781 (0.963)	Top-5 acc 4.297 (4.042)	lr 0.04925
Warmup Train [4][430/3239]	Time 0.330 (0.530)	Data 0.001 (0.023)	Loss 6.2749 (6.3378)	Top-1 acc 1.172 (0.964)	Top-5 acc 5.469 (4.054)	lr 0.04925
Warmup Train [4][440/3239]	Time 0.448 (0.529)	Data 0.001 (0.024)	Loss 6.4180 (6.3376)	Top-1 acc 0.391 (0.965)	Top-5 acc 3.516 (4.048)	lr 0.04925
Warmup Train [4][450/3239]	Time 0.661 (0.529)	Data 0.001 (0.023)	Loss 6.2256 (6.3364)	Top-1 acc 1.562 (0.967)	Top-5 acc 7.031 (4.057)	lr 0.04924
Warmup Train [4][460/3239]	Time 0.414 (0.529)	Data 0.001 (0.023)	Loss 6.3379 (6.3366)	Top-1 acc 0.000 (0.969)	Top-5 acc 3.906 (4.052)	lr 0.04924
Warmup Train [4][470/3239]	Time 0.481 (0.528)	Data 0.001 (0.022)	Loss 6.2899 (6.3358)	Top-1 acc 3.125 (0.967)	Top-5 acc 6.250 (4.073)	lr 0.04924
Warmup Train [4][480/3239]	Time 0.503 (0.528)	Data 0.001 (0.022)	Loss 6.3351 (6.3356)	Top-1 acc 1.562 (0.966)	Top-5 acc 6.641 (4.073)	lr 0.04924
Warmup Train [4][490/3239]	Time 0.562 (0.528)	Data 0.002 (0.022)	Loss 6.3044 (6.3350)	Top-1 acc 0.781 (0.963)	Top-5 acc 6.250 (4.079)	lr 0.04924
Warmup Train [4][500/3239]	Time 0.564 (0.528)	Data 0.001 (0.022)	Loss 6.3539 (6.3356)	Top-1 acc 0.391 (0.955)	Top-5 acc 3.516 (4.065)	lr 0.04924
Warmup Train [4][510/3239]	Time 0.513 (0.528)	Data 0.001 (0.021)	Loss 6.3207 (6.3358)	Top-1 acc 1.953 (0.960)	Top-5 acc 5.469 (4.071)	lr 0.04924
Warmup Train [4][520/3239]	Time 0.662 (0.528)	Data 0.001 (0.021)	Loss 6.3859 (6.3359)	Top-1 acc 1.562 (0.961)	Top-5 acc 3.125 (4.064)	lr 0.04923
Warmup Train [4][530/3239]	Time 0.540 (0.527)	Data 0.001 (0.021)	Loss 6.3347 (6.3357)	Top-1 acc 0.000 (0.956)	Top-5 acc 3.125 (4.068)	lr 0.04923
Warmup Train [4][540/3239]	Time 0.629 (0.527)	Data 0.001 (0.020)	Loss 6.2636 (6.3358)	Top-1 acc 2.344 (0.961)	Top-5 acc 7.422 (4.068)	lr 0.04923
Warmup Train [4][550/3239]	Time 0.479 (0.527)	Data 0.001 (0.020)	Loss 6.3577 (6.3358)	Top-1 acc 2.344 (0.962)	Top-5 acc 5.859 (4.081)	lr 0.04923
Warmup Train [4][560/3239]	Time 0.462 (0.526)	Data 0.001 (0.020)	Loss 6.2991 (6.3360)	Top-1 acc 1.172 (0.962)	Top-5 acc 5.859 (4.077)	lr 0.04923
Warmup Train [4][570/3239]	Time 0.545 (0.526)	Data 0.001 (0.020)	Loss 6.3656 (6.3359)	Top-1 acc 0.781 (0.966)	Top-5 acc 3.906 (4.084)	lr 0.04923
Warmup Train [4][580/3239]	Time 0.506 (0.526)	Data 0.001 (0.019)	Loss 6.3305 (6.3359)	Top-1 acc 1.172 (0.965)	Top-5 acc 5.078 (4.076)	lr 0.04922
Warmup Train [4][590/3239]	Time 0.507 (0.525)	Data 0.001 (0.019)	Loss 6.3267 (6.3357)	Top-1 acc 1.953 (0.966)	Top-5 acc 2.734 (4.077)	lr 0.04922
Warmup Train [4][600/3239]	Time 0.618 (0.525)	Data 0.001 (0.019)	Loss 6.4232 (6.3356)	Top-1 acc 0.391 (0.968)	Top-5 acc 3.125 (4.078)	lr 0.04922
Warmup Train [4][610/3239]	Time 0.592 (0.525)	Data 0.001 (0.019)	Loss 6.3283 (6.3355)	Top-1 acc 1.172 (0.969)	Top-5 acc 3.516 (4.078)	lr 0.04922
Warmup Train [4][620/3239]	Time 0.639 (0.525)	Data 0.001 (0.019)	Loss 6.3174 (6.3352)	Top-1 acc 1.562 (0.974)	Top-5 acc 5.078 (4.082)	lr 0.04922
Warmup Train [4][630/3239]	Time 0.468 (0.525)	Data 0.001 (0.018)	Loss 6.3058 (6.3353)	Top-1 acc 0.781 (0.977)	Top-5 acc 4.688 (4.084)	lr 0.04922
Warmup Train [4][640/3239]	Time 0.454 (0.524)	Data 0.001 (0.018)	Loss 6.4083 (6.3349)	Top-1 acc 0.781 (0.977)	Top-5 acc 2.734 (4.082)	lr 0.04922
Warmup Train [4][650/3239]	Time 0.501 (0.524)	Data 0.001 (0.018)	Loss 6.3050 (6.3345)	Top-1 acc 1.172 (0.978)	Top-5 acc 4.297 (4.093)	lr 0.04921
Warmup Train [4][660/3239]	Time 0.326 (0.523)	Data 0.001 (0.018)	Loss 6.3296 (6.3346)	Top-1 acc 0.781 (0.981)	Top-5 acc 5.078 (4.102)	lr 0.04921
Warmup Train [4][670/3239]	Time 0.474 (0.523)	Data 0.001 (0.018)	Loss 6.3018 (6.3341)	Top-1 acc 0.781 (0.980)	Top-5 acc 2.734 (4.110)	lr 0.04921
Warmup Train [4][680/3239]	Time 0.278 (0.522)	Data 0.001 (0.018)	Loss 6.3429 (6.3338)	Top-1 acc 0.781 (0.981)	Top-5 acc 4.688 (4.107)	lr 0.04921
Warmup Train [4][690/3239]	Time 0.644 (0.522)	Data 0.001 (0.018)	Loss 6.2962 (6.3330)	Top-1 acc 0.391 (0.979)	Top-5 acc 4.297 (4.107)	lr 0.04921
Warmup Train [4][700/3239]	Time 0.453 (0.521)	Data 0.001 (0.017)	Loss 6.2408 (6.3326)	Top-1 acc 1.562 (0.982)	Top-5 acc 5.078 (4.116)	lr 0.04921
Warmup Train [4][710/3239]	Time 0.536 (0.521)	Data 0.002 (0.017)	Loss 6.2777 (6.3323)	Top-1 acc 1.953 (0.983)	Top-5 acc 4.688 (4.122)	lr 0.04921
Warmup Train [4][720/3239]	Time 0.576 (0.521)	Data 0.001 (0.017)	Loss 6.3316 (6.3322)	Top-1 acc 1.562 (0.982)	Top-5 acc 3.516 (4.118)	lr 0.04920
Warmup Train [4][730/3239]	Time 0.608 (0.520)	Data 0.001 (0.017)	Loss 6.2798 (6.3316)	Top-1 acc 1.953 (0.985)	Top-5 acc 4.688 (4.121)	lr 0.04920
Warmup Train [4][740/3239]	Time 0.585 (0.520)	Data 0.001 (0.017)	Loss 6.3873 (6.3311)	Top-1 acc 1.562 (0.986)	Top-5 acc 4.688 (4.136)	lr 0.04920
Warmup Train [4][750/3239]	Time 0.645 (0.520)	Data 0.001 (0.017)	Loss 6.3785 (6.3308)	Top-1 acc 0.391 (0.988)	Top-5 acc 3.516 (4.141)	lr 0.04920
Warmup Train [4][760/3239]	Time 0.387 (0.520)	Data 0.001 (0.016)	Loss 6.2662 (6.3306)	Top-1 acc 3.125 (0.990)	Top-5 acc 5.859 (4.142)	lr 0.04920
Warmup Train [4][770/3239]	Time 0.463 (0.520)	Data 0.001 (0.016)	Loss 6.2998 (6.3304)	Top-1 acc 1.562 (0.993)	Top-5 acc 5.078 (4.151)	lr 0.04920
Warmup Train [4][780/3239]	Time 0.483 (0.520)	Data 0.001 (0.016)	Loss 6.3788 (6.3304)	Top-1 acc 0.391 (0.992)	Top-5 acc 1.172 (4.153)	lr 0.04919
Warmup Train [4][790/3239]	Time 0.408 (0.520)	Data 0.001 (0.016)	Loss 6.2572 (6.3301)	Top-1 acc 0.781 (0.991)	Top-5 acc 4.688 (4.151)	lr 0.04919
Warmup Train [4][800/3239]	Time 0.756 (0.520)	Data 0.001 (0.016)	Loss 6.3238 (6.3300)	Top-1 acc 0.391 (0.989)	Top-5 acc 3.906 (4.154)	lr 0.04919
Warmup Train [4][810/3239]	Time 0.328 (0.520)	Data 0.001 (0.016)	Loss 6.3325 (6.3297)	Top-1 acc 0.391 (0.988)	Top-5 acc 5.078 (4.160)	lr 0.04919
Warmup Train [4][820/3239]	Time 0.429 (0.519)	Data 0.001 (0.016)	Loss 6.3380 (6.3298)	Top-1 acc 0.781 (0.988)	Top-5 acc 3.516 (4.157)	lr 0.04919
Warmup Train [4][830/3239]	Time 0.569 (0.519)	Data 0.001 (0.016)	Loss 6.3402 (6.3297)	Top-1 acc 1.562 (0.990)	Top-5 acc 5.859 (4.164)	lr 0.04919
Warmup Train [4][840/3239]	Time 0.589 (0.520)	Data 0.001 (0.016)	Loss 6.2424 (6.3295)	Top-1 acc 0.781 (0.994)	Top-5 acc 6.250 (4.175)	lr 0.04919
Warmup Train [4][850/3239]	Time 0.628 (0.520)	Data 0.001 (0.016)	Loss 6.3007 (6.3294)	Top-1 acc 1.953 (0.993)	Top-5 acc 5.469 (4.171)	lr 0.04918
Warmup Train [4][860/3239]	Time 0.460 (0.519)	Data 0.001 (0.015)	Loss 6.2601 (6.3292)	Top-1 acc 1.562 (0.994)	Top-5 acc 4.297 (4.171)	lr 0.04918
Warmup Train [4][870/3239]	Time 0.688 (0.519)	Data 0.001 (0.015)	Loss 6.2394 (6.3293)	Top-1 acc 0.391 (0.994)	Top-5 acc 4.688 (4.170)	lr 0.04918
Warmup Train [4][880/3239]	Time 0.444 (0.519)	Data 0.001 (0.015)	Loss 6.3351 (6.3292)	Top-1 acc 1.172 (0.994)	Top-5 acc 4.688 (4.171)	lr 0.04918
Warmup Train [4][890/3239]	Time 0.565 (0.519)	Data 0.001 (0.015)	Loss 6.2982 (6.3288)	Top-1 acc 1.172 (0.997)	Top-5 acc 4.297 (4.176)	lr 0.04918
Warmup Train [4][900/3239]	Time 0.514 (0.519)	Data 0.001 (0.015)	Loss 6.2667 (6.3287)	Top-1 acc 1.562 (0.999)	Top-5 acc 5.078 (4.184)	lr 0.04918
Warmup Train [4][910/3239]	Time 0.630 (0.519)	Data 0.001 (0.015)	Loss 6.3382 (6.3285)	Top-1 acc 0.781 (1.002)	Top-5 acc 4.297 (4.186)	lr 0.04917
Warmup Train [4][920/3239]	Time 0.579 (0.519)	Data 0.001 (0.015)	Loss 6.3701 (6.3282)	Top-1 acc 2.344 (1.003)	Top-5 acc 4.688 (4.187)	lr 0.04917
Warmup Train [4][930/3239]	Time 0.609 (0.518)	Data 0.002 (0.015)	Loss 6.2520 (6.3279)	Top-1 acc 0.781 (1.002)	Top-5 acc 4.297 (4.187)	lr 0.04917
Warmup Train [4][940/3239]	Time 0.349 (0.518)	Data 0.001 (0.014)	Loss 6.2888 (6.3276)	Top-1 acc 1.172 (1.003)	Top-5 acc 4.297 (4.197)	lr 0.04917
Warmup Train [4][950/3239]	Time 0.634 (0.517)	Data 0.001 (0.014)	Loss 6.2481 (6.3275)	Top-1 acc 2.734 (1.004)	Top-5 acc 8.984 (4.202)	lr 0.04917
Warmup Train [4][960/3239]	Time 0.164 (0.515)	Data 0.001 (0.014)	Loss 6.3174 (6.3273)	Top-1 acc 0.781 (1.006)	Top-5 acc 3.516 (4.201)	lr 0.04917
Warmup Train [4][970/3239]	Time 0.374 (0.513)	Data 0.001 (0.014)	Loss 6.2898 (6.3270)	Top-1 acc 0.781 (1.005)	Top-5 acc 4.297 (4.206)	lr 0.04917
Warmup Train [4][980/3239]	Time 0.396 (0.512)	Data 0.001 (0.014)	Loss 6.3469 (6.3269)	Top-1 acc 1.172 (1.004)	Top-5 acc 3.125 (4.207)	lr 0.04916
Warmup Train [4][990/3239]	Time 0.446 (0.512)	Data 0.001 (0.014)	Loss 6.2802 (6.3266)	Top-1 acc 2.344 (1.007)	Top-5 acc 4.688 (4.214)	lr 0.04916
Warmup Train [4][1000/3239]	Time 0.614 (0.512)	Data 0.001 (0.014)	Loss 6.3636 (6.3261)	Top-1 acc 0.391 (1.005)	Top-5 acc 5.469 (4.220)	lr 0.04916
Warmup Train [4][1010/3239]	Time 0.525 (0.512)	Data 0.001 (0.014)	Loss 6.4033 (6.3260)	Top-1 acc 0.391 (1.005)	Top-5 acc 1.953 (4.223)	lr 0.04916
Warmup Train [4][1020/3239]	Time 0.343 (0.512)	Data 0.001 (0.014)	Loss 6.2592 (6.3259)	Top-1 acc 1.562 (1.009)	Top-5 acc 4.297 (4.221)	lr 0.04916
Warmup Train [4][1030/3239]	Time 0.391 (0.512)	Data 0.001 (0.014)	Loss 6.3318 (6.3257)	Top-1 acc 0.000 (1.012)	Top-5 acc 4.297 (4.226)	lr 0.04916
Warmup Train [4][1040/3239]	Time 0.395 (0.512)	Data 0.001 (0.014)	Loss 6.3085 (6.3255)	Top-1 acc 1.562 (1.014)	Top-5 acc 2.344 (4.230)	lr 0.04915
Warmup Train [4][1050/3239]	Time 0.473 (0.512)	Data 0.001 (0.014)	Loss 6.3113 (6.3253)	Top-1 acc 0.781 (1.015)	Top-5 acc 4.297 (4.231)	lr 0.04915
Warmup Train [4][1060/3239]	Time 0.514 (0.512)	Data 0.001 (0.014)	Loss 6.2881 (6.3251)	Top-1 acc 0.781 (1.016)	Top-5 acc 3.906 (4.232)	lr 0.04915
Warmup Train [4][1070/3239]	Time 0.674 (0.512)	Data 0.001 (0.014)	Loss 6.3110 (6.3248)	Top-1 acc 1.953 (1.020)	Top-5 acc 6.641 (4.239)	lr 0.04915
Warmup Train [4][1080/3239]	Time 0.510 (0.512)	Data 0.001 (0.014)	Loss 6.2711 (6.3247)	Top-1 acc 1.172 (1.020)	Top-5 acc 5.469 (4.240)	lr 0.04915
Warmup Train [4][1090/3239]	Time 0.403 (0.512)	Data 0.002 (0.013)	Loss 6.3226 (6.3245)	Top-1 acc 1.172 (1.021)	Top-5 acc 4.688 (4.241)	lr 0.04915
Warmup Train [4][1100/3239]	Time 0.404 (0.512)	Data 0.001 (0.013)	Loss 6.3046 (6.3242)	Top-1 acc 1.172 (1.023)	Top-5 acc 6.250 (4.248)	lr 0.04915
Warmup Train [4][1110/3239]	Time 0.594 (0.512)	Data 0.001 (0.013)	Loss 6.3584 (6.3242)	Top-1 acc 1.172 (1.023)	Top-5 acc 5.078 (4.253)	lr 0.04914
Warmup Train [4][1120/3239]	Time 0.495 (0.512)	Data 0.001 (0.013)	Loss 6.2456 (6.3241)	Top-1 acc 1.172 (1.023)	Top-5 acc 2.734 (4.251)	lr 0.04914
Warmup Train [4][1130/3239]	Time 0.645 (0.513)	Data 0.001 (0.013)	Loss 6.2683 (6.3237)	Top-1 acc 1.562 (1.026)	Top-5 acc 6.250 (4.253)	lr 0.04914
Warmup Train [4][1140/3239]	Time 0.387 (0.513)	Data 0.002 (0.013)	Loss 6.2532 (6.3232)	Top-1 acc 1.953 (1.029)	Top-5 acc 4.688 (4.262)	lr 0.04914
Warmup Train [4][1150/3239]	Time 0.612 (0.513)	Data 0.001 (0.013)	Loss 6.2453 (6.3228)	Top-1 acc 1.172 (1.032)	Top-5 acc 5.078 (4.271)	lr 0.04914
Warmup Train [4][1160/3239]	Time 0.682 (0.513)	Data 0.001 (0.013)	Loss 6.2904 (6.3224)	Top-1 acc 0.781 (1.033)	Top-5 acc 2.734 (4.273)	lr 0.04914
Warmup Train [4][1170/3239]	Time 0.470 (0.513)	Data 0.001 (0.013)	Loss 6.2747 (6.3223)	Top-1 acc 0.781 (1.033)	Top-5 acc 3.516 (4.274)	lr 0.04913
Warmup Train [4][1180/3239]	Time 0.460 (0.513)	Data 0.001 (0.013)	Loss 6.3124 (6.3220)	Top-1 acc 0.781 (1.032)	Top-5 acc 3.906 (4.271)	lr 0.04913
Warmup Train [4][1190/3239]	Time 0.487 (0.513)	Data 0.001 (0.013)	Loss 6.3147 (6.3217)	Top-1 acc 1.953 (1.033)	Top-5 acc 6.250 (4.278)	lr 0.04913
Warmup Train [4][1200/3239]	Time 0.519 (0.513)	Data 0.001 (0.013)	Loss 6.2117 (6.3215)	Top-1 acc 1.562 (1.035)	Top-5 acc 5.859 (4.279)	lr 0.04913
Warmup Train [4][1210/3239]	Time 0.531 (0.513)	Data 0.001 (0.013)	Loss 6.3794 (6.3215)	Top-1 acc 0.781 (1.035)	Top-5 acc 2.734 (4.278)	lr 0.04913
Warmup Train [4][1220/3239]	Time 0.570 (0.512)	Data 0.001 (0.013)	Loss 6.3116 (6.3212)	Top-1 acc 0.781 (1.036)	Top-5 acc 3.906 (4.280)	lr 0.04913
Warmup Train [4][1230/3239]	Time 0.583 (0.512)	Data 0.001 (0.013)	Loss 6.2733 (6.3209)	Top-1 acc 0.391 (1.039)	Top-5 acc 3.516 (4.283)	lr 0.04912
Warmup Train [4][1240/3239]	Time 0.599 (0.512)	Data 0.001 (0.013)	Loss 6.2682 (6.3207)	Top-1 acc 0.391 (1.039)	Top-5 acc 7.031 (4.283)	lr 0.04912
Warmup Train [4][1250/3239]	Time 0.499 (0.512)	Data 0.001 (0.013)	Loss 6.2800 (6.3203)	Top-1 acc 1.172 (1.040)	Top-5 acc 5.078 (4.285)	lr 0.04912
Warmup Train [4][1260/3239]	Time 0.557 (0.512)	Data 0.001 (0.013)	Loss 6.2594 (6.3199)	Top-1 acc 0.781 (1.040)	Top-5 acc 4.297 (4.290)	lr 0.04912
Warmup Train [4][1270/3239]	Time 0.646 (0.512)	Data 0.001 (0.013)	Loss 6.2083 (6.3195)	Top-1 acc 0.781 (1.043)	Top-5 acc 5.469 (4.294)	lr 0.04912
Warmup Train [4][1280/3239]	Time 0.564 (0.512)	Data 0.001 (0.013)	Loss 6.3428 (6.3192)	Top-1 acc 1.172 (1.048)	Top-5 acc 3.906 (4.302)	lr 0.04912
Warmup Train [4][1290/3239]	Time 0.576 (0.512)	Data 0.001 (0.013)	Loss 6.2295 (6.3188)	Top-1 acc 0.781 (1.050)	Top-5 acc 3.906 (4.308)	lr 0.04911
Warmup Train [4][1300/3239]	Time 0.553 (0.512)	Data 0.001 (0.012)	Loss 6.2910 (6.3184)	Top-1 acc 1.562 (1.050)	Top-5 acc 5.078 (4.311)	lr 0.04911
Warmup Train [4][1310/3239]	Time 0.505 (0.512)	Data 0.001 (0.012)	Loss 6.2715 (6.3180)	Top-1 acc 0.781 (1.050)	Top-5 acc 3.906 (4.314)	lr 0.04911
Warmup Train [4][1320/3239]	Time 0.549 (0.512)	Data 0.001 (0.012)	Loss 6.1966 (6.3174)	Top-1 acc 2.734 (1.052)	Top-5 acc 5.469 (4.316)	lr 0.04911
Warmup Train [4][1330/3239]	Time 0.586 (0.512)	Data 0.001 (0.012)	Loss 6.3359 (6.3170)	Top-1 acc 0.391 (1.053)	Top-5 acc 3.125 (4.322)	lr 0.04911
Warmup Train [4][1340/3239]	Time 0.576 (0.512)	Data 0.001 (0.012)	Loss 6.3564 (6.3165)	Top-1 acc 1.172 (1.053)	Top-5 acc 2.734 (4.326)	lr 0.04911
Warmup Train [4][1350/3239]	Time 0.534 (0.512)	Data 0.001 (0.012)	Loss 6.3044 (6.3164)	Top-1 acc 0.391 (1.052)	Top-5 acc 3.516 (4.321)	lr 0.04911
Warmup Train [4][1360/3239]	Time 0.575 (0.512)	Data 0.001 (0.012)	Loss 6.2700 (6.3161)	Top-1 acc 1.172 (1.054)	Top-5 acc 4.688 (4.328)	lr 0.04910
Warmup Train [4][1370/3239]	Time 0.533 (0.512)	Data 0.001 (0.012)	Loss 6.2895 (6.3158)	Top-1 acc 0.781 (1.054)	Top-5 acc 4.297 (4.329)	lr 0.04910
Warmup Train [4][1380/3239]	Time 0.803 (0.512)	Data 0.001 (0.012)	Loss 6.3458 (6.3155)	Top-1 acc 0.391 (1.054)	Top-5 acc 3.516 (4.330)	lr 0.04910
Warmup Train [4][1390/3239]	Time 0.482 (0.512)	Data 0.001 (0.012)	Loss 6.2623 (6.3152)	Top-1 acc 0.000 (1.053)	Top-5 acc 3.125 (4.331)	lr 0.04910
Warmup Train [4][1400/3239]	Time 0.395 (0.512)	Data 0.001 (0.012)	Loss 6.3266 (6.3150)	Top-1 acc 1.172 (1.056)	Top-5 acc 4.688 (4.332)	lr 0.04910
Warmup Train [4][1410/3239]	Time 0.656 (0.512)	Data 0.001 (0.012)	Loss 6.2953 (6.3147)	Top-1 acc 0.391 (1.054)	Top-5 acc 5.078 (4.337)	lr 0.04910
Warmup Train [4][1420/3239]	Time 0.485 (0.512)	Data 0.001 (0.012)	Loss 6.3383 (6.3146)	Top-1 acc 1.172 (1.055)	Top-5 acc 4.297 (4.340)	lr 0.04909
Warmup Train [4][1430/3239]	Time 0.568 (0.513)	Data 0.001 (0.012)	Loss 6.2760 (6.3143)	Top-1 acc 1.172 (1.057)	Top-5 acc 5.469 (4.345)	lr 0.04909
Warmup Train [4][1440/3239]	Time 0.608 (0.513)	Data 0.001 (0.012)	Loss 6.2626 (6.3141)	Top-1 acc 1.562 (1.057)	Top-5 acc 3.906 (4.348)	lr 0.04909
Warmup Train [4][1450/3239]	Time 0.522 (0.512)	Data 0.001 (0.012)	Loss 6.2660 (6.3138)	Top-1 acc 0.781 (1.059)	Top-5 acc 5.859 (4.354)	lr 0.04909
Warmup Train [4][1460/3239]	Time 0.526 (0.512)	Data 0.001 (0.011)	Loss 6.2777 (6.3136)	Top-1 acc 0.781 (1.063)	Top-5 acc 6.641 (4.365)	lr 0.04909
Warmup Train [4][1470/3239]	Time 0.575 (0.512)	Data 0.001 (0.011)	Loss 6.2204 (6.3132)	Top-1 acc 0.781 (1.064)	Top-5 acc 5.859 (4.371)	lr 0.04909
Warmup Train [4][1480/3239]	Time 0.522 (0.512)	Data 0.001 (0.011)	Loss 6.2864 (6.3131)	Top-1 acc 1.172 (1.064)	Top-5 acc 3.906 (4.374)	lr 0.04908
Warmup Train [4][1490/3239]	Time 0.182 (0.512)	Data 0.001 (0.011)	Loss 6.2967 (6.3130)	Top-1 acc 1.562 (1.065)	Top-5 acc 6.250 (4.381)	lr 0.04908
Warmup Train [4][1500/3239]	Time 0.576 (0.512)	Data 0.001 (0.011)	Loss 6.2177 (6.3128)	Top-1 acc 0.781 (1.067)	Top-5 acc 5.859 (4.380)	lr 0.04908
Warmup Train [4][1510/3239]	Time 0.359 (0.512)	Data 0.001 (0.011)	Loss 6.2040 (6.3127)	Top-1 acc 2.344 (1.067)	Top-5 acc 5.469 (4.378)	lr 0.04908
Warmup Train [4][1520/3239]	Time 0.527 (0.512)	Data 0.001 (0.011)	Loss 6.2892 (6.3126)	Top-1 acc 1.172 (1.066)	Top-5 acc 4.688 (4.376)	lr 0.04908
Warmup Train [4][1530/3239]	Time 0.603 (0.512)	Data 0.001 (0.011)	Loss 6.2202 (6.3123)	Top-1 acc 1.562 (1.069)	Top-5 acc 4.688 (4.383)	lr 0.04908
Warmup Train [4][1540/3239]	Time 0.389 (0.512)	Data 0.001 (0.011)	Loss 6.3214 (6.3122)	Top-1 acc 1.172 (1.071)	Top-5 acc 2.734 (4.387)	lr 0.04907
Warmup Train [4][1550/3239]	Time 0.493 (0.512)	Data 0.001 (0.011)	Loss 6.2858 (6.3120)	Top-1 acc 1.172 (1.072)	Top-5 acc 5.469 (4.391)	lr 0.04907
Warmup Train [4][1560/3239]	Time 0.505 (0.512)	Data 0.001 (0.011)	Loss 6.2417 (6.3117)	Top-1 acc 0.781 (1.073)	Top-5 acc 4.297 (4.398)	lr 0.04907
Warmup Train [4][1570/3239]	Time 0.488 (0.512)	Data 0.001 (0.011)	Loss 6.2302 (6.3114)	Top-1 acc 0.781 (1.072)	Top-5 acc 5.469 (4.399)	lr 0.04907
Warmup Train [4][1580/3239]	Time 0.658 (0.512)	Data 0.001 (0.011)	Loss 6.1939 (6.3110)	Top-1 acc 2.344 (1.075)	Top-5 acc 5.859 (4.404)	lr 0.04907
Warmup Train [4][1590/3239]	Time 0.581 (0.512)	Data 0.001 (0.011)	Loss 6.3337 (6.3109)	Top-1 acc 0.391 (1.074)	Top-5 acc 5.078 (4.406)	lr 0.04907
Warmup Train [4][1600/3239]	Time 0.405 (0.512)	Data 0.001 (0.011)	Loss 6.2261 (6.3106)	Top-1 acc 0.391 (1.076)	Top-5 acc 5.078 (4.413)	lr 0.04906
Warmup Train [4][1610/3239]	Time 0.562 (0.512)	Data 0.001 (0.011)	Loss 6.2512 (6.3103)	Top-1 acc 0.781 (1.078)	Top-5 acc 4.688 (4.417)	lr 0.04906
Warmup Train [4][1620/3239]	Time 0.475 (0.512)	Data 0.001 (0.011)	Loss 6.2725 (6.3101)	Top-1 acc 2.734 (1.079)	Top-5 acc 6.641 (4.423)	lr 0.04906
Warmup Train [4][1630/3239]	Time 0.534 (0.512)	Data 0.001 (0.011)	Loss 6.2429 (6.3098)	Top-1 acc 1.172 (1.080)	Top-5 acc 4.297 (4.425)	lr 0.04906
Warmup Train [4][1640/3239]	Time 0.550 (0.512)	Data 0.001 (0.011)	Loss 6.2811 (6.3097)	Top-1 acc 1.562 (1.079)	Top-5 acc 2.734 (4.424)	lr 0.04906
Warmup Train [4][1650/3239]	Time 0.509 (0.512)	Data 0.001 (0.011)	Loss 6.3212 (6.3094)	Top-1 acc 1.172 (1.078)	Top-5 acc 3.906 (4.425)	lr 0.04906
Warmup Train [4][1660/3239]	Time 0.631 (0.512)	Data 0.001 (0.011)	Loss 6.2116 (6.3090)	Top-1 acc 1.562 (1.079)	Top-5 acc 5.078 (4.424)	lr 0.04905
Warmup Train [4][1670/3239]	Time 0.593 (0.512)	Data 0.001 (0.011)	Loss 6.2783 (6.3087)	Top-1 acc 2.344 (1.082)	Top-5 acc 3.516 (4.428)	lr 0.04905
Warmup Train [4][1680/3239]	Time 0.609 (0.512)	Data 0.001 (0.011)	Loss 6.2363 (6.3084)	Top-1 acc 2.734 (1.084)	Top-5 acc 5.859 (4.430)	lr 0.04905
Warmup Train [4][1690/3239]	Time 0.596 (0.512)	Data 0.001 (0.011)	Loss 6.2311 (6.3082)	Top-1 acc 0.000 (1.083)	Top-5 acc 4.688 (4.434)	lr 0.04905
Warmup Train [4][1700/3239]	Time 0.551 (0.512)	Data 0.001 (0.011)	Loss 6.2938 (6.3079)	Top-1 acc 1.172 (1.086)	Top-5 acc 4.688 (4.439)	lr 0.04905
Warmup Train [4][1710/3239]	Time 0.527 (0.512)	Data 0.001 (0.011)	Loss 6.3015 (6.3077)	Top-1 acc 1.172 (1.085)	Top-5 acc 3.906 (4.438)	lr 0.04905
Warmup Train [4][1720/3239]	Time 0.626 (0.512)	Data 0.001 (0.011)	Loss 6.1763 (6.3074)	Top-1 acc 0.781 (1.084)	Top-5 acc 6.250 (4.436)	lr 0.04904
Warmup Train [4][1730/3239]	Time 0.556 (0.512)	Data 0.001 (0.010)	Loss 6.2158 (6.3071)	Top-1 acc 0.781 (1.085)	Top-5 acc 3.516 (4.438)	lr 0.04904
Warmup Train [4][1740/3239]	Time 0.602 (0.512)	Data 0.001 (0.010)	Loss 6.3285 (6.3069)	Top-1 acc 1.172 (1.089)	Top-5 acc 4.688 (4.440)	lr 0.04904
Warmup Train [4][1750/3239]	Time 0.485 (0.512)	Data 0.001 (0.010)	Loss 6.2553 (6.3064)	Top-1 acc 1.172 (1.090)	Top-5 acc 3.125 (4.445)	lr 0.04904
Warmup Train [4][1760/3239]	Time 0.366 (0.511)	Data 0.001 (0.010)	Loss 6.2610 (6.3061)	Top-1 acc 0.781 (1.092)	Top-5 acc 5.469 (4.452)	lr 0.04904
Warmup Train [4][1770/3239]	Time 0.492 (0.511)	Data 0.001 (0.010)	Loss 6.2821 (6.3058)	Top-1 acc 1.172 (1.092)	Top-5 acc 5.078 (4.457)	lr 0.04904
Warmup Train [4][1780/3239]	Time 0.348 (0.511)	Data 0.001 (0.010)	Loss 6.2437 (6.3054)	Top-1 acc 1.953 (1.097)	Top-5 acc 7.031 (4.462)	lr 0.04903
Warmup Train [4][1790/3239]	Time 0.501 (0.511)	Data 0.001 (0.010)	Loss 6.3428 (6.3052)	Top-1 acc 0.391 (1.099)	Top-5 acc 3.906 (4.470)	lr 0.04903
Warmup Train [4][1800/3239]	Time 0.557 (0.511)	Data 0.001 (0.010)	Loss 6.2419 (6.3050)	Top-1 acc 1.953 (1.101)	Top-5 acc 6.250 (4.474)	lr 0.04903
Warmup Train [4][1810/3239]	Time 0.602 (0.511)	Data 0.001 (0.010)	Loss 6.1924 (6.3047)	Top-1 acc 2.344 (1.103)	Top-5 acc 6.250 (4.479)	lr 0.04903
Warmup Train [4][1820/3239]	Time 0.367 (0.511)	Data 0.001 (0.010)	Loss 6.2590 (6.3044)	Top-1 acc 0.000 (1.103)	Top-5 acc 4.688 (4.482)	lr 0.04903
Warmup Train [4][1830/3239]	Time 0.615 (0.511)	Data 0.001 (0.010)	Loss 6.1689 (6.3042)	Top-1 acc 3.125 (1.103)	Top-5 acc 5.469 (4.483)	lr 0.04903
Warmup Train [4][1840/3239]	Time 0.576 (0.511)	Data 0.001 (0.010)	Loss 6.2620 (6.3039)	Top-1 acc 1.953 (1.107)	Top-5 acc 5.859 (4.490)	lr 0.04902
Warmup Train [4][1850/3239]	Time 0.541 (0.511)	Data 0.001 (0.010)	Loss 6.2558 (6.3036)	Top-1 acc 1.172 (1.110)	Top-5 acc 5.859 (4.496)	lr 0.04902
Warmup Train [4][1860/3239]	Time 0.520 (0.511)	Data 0.001 (0.010)	Loss 6.3326 (6.3034)	Top-1 acc 2.344 (1.110)	Top-5 acc 5.859 (4.497)	lr 0.04902
Warmup Train [4][1870/3239]	Time 0.470 (0.511)	Data 0.001 (0.010)	Loss 6.2643 (6.3031)	Top-1 acc 0.391 (1.110)	Top-5 acc 4.688 (4.501)	lr 0.04902
Warmup Train [4][1880/3239]	Time 0.420 (0.511)	Data 0.001 (0.010)	Loss 6.1985 (6.3027)	Top-1 acc 1.953 (1.112)	Top-5 acc 5.078 (4.504)	lr 0.04902
Warmup Train [4][1890/3239]	Time 0.422 (0.511)	Data 0.001 (0.010)	Loss 6.2716 (6.3025)	Top-1 acc 1.562 (1.113)	Top-5 acc 5.859 (4.507)	lr 0.04902
Warmup Train [4][1900/3239]	Time 0.501 (0.511)	Data 0.001 (0.010)	Loss 6.2049 (6.3021)	Top-1 acc 1.172 (1.115)	Top-5 acc 5.078 (4.512)	lr 0.04901
Warmup Train [4][1910/3239]	Time 0.571 (0.511)	Data 0.001 (0.010)	Loss 6.2412 (6.3018)	Top-1 acc 1.172 (1.118)	Top-5 acc 2.344 (4.518)	lr 0.04901
Warmup Train [4][1920/3239]	Time 0.510 (0.511)	Data 0.001 (0.010)	Loss 6.2799 (6.3015)	Top-1 acc 1.172 (1.120)	Top-5 acc 4.297 (4.524)	lr 0.04901
Warmup Train [4][1930/3239]	Time 0.563 (0.511)	Data 0.001 (0.010)	Loss 6.3128 (6.3012)	Top-1 acc 0.781 (1.123)	Top-5 acc 3.906 (4.527)	lr 0.04901
Warmup Train [4][1940/3239]	Time 0.640 (0.511)	Data 0.001 (0.010)	Loss 6.2456 (6.3008)	Top-1 acc 1.172 (1.125)	Top-5 acc 7.031 (4.534)	lr 0.04901
Warmup Train [4][1950/3239]	Time 0.441 (0.511)	Data 0.001 (0.010)	Loss 6.2870 (6.3006)	Top-1 acc 1.953 (1.127)	Top-5 acc 4.688 (4.538)	lr 0.04901
Warmup Train [4][1960/3239]	Time 0.346 (0.511)	Data 0.001 (0.010)	Loss 6.2772 (6.3003)	Top-1 acc 1.172 (1.129)	Top-5 acc 3.906 (4.541)	lr 0.04900
Warmup Train [4][1970/3239]	Time 0.620 (0.511)	Data 0.001 (0.010)	Loss 6.2179 (6.3001)	Top-1 acc 0.391 (1.130)	Top-5 acc 7.422 (4.547)	lr 0.04900
Warmup Train [4][1980/3239]	Time 0.578 (0.511)	Data 0.001 (0.010)	Loss 6.1883 (6.2997)	Top-1 acc 1.172 (1.131)	Top-5 acc 4.688 (4.550)	lr 0.04900
Warmup Train [4][1990/3239]	Time 0.365 (0.511)	Data 0.001 (0.010)	Loss 6.1697 (6.2993)	Top-1 acc 2.344 (1.134)	Top-5 acc 6.641 (4.557)	lr 0.04900
Warmup Train [4][2000/3239]	Time 0.711 (0.511)	Data 0.001 (0.010)	Loss 6.3173 (6.2990)	Top-1 acc 0.391 (1.132)	Top-5 acc 3.906 (4.559)	lr 0.04900
Warmup Train [4][2010/3239]	Time 0.379 (0.511)	Data 0.001 (0.010)	Loss 6.1458 (6.2987)	Top-1 acc 1.562 (1.132)	Top-5 acc 6.250 (4.562)	lr 0.04900
Warmup Train [4][2020/3239]	Time 0.533 (0.511)	Data 0.001 (0.010)	Loss 6.2445 (6.2985)	Top-1 acc 3.516 (1.132)	Top-5 acc 7.812 (4.568)	lr 0.04899
Warmup Train [4][2030/3239]	Time 0.424 (0.511)	Data 0.001 (0.010)	Loss 6.2915 (6.2982)	Top-1 acc 1.953 (1.132)	Top-5 acc 5.859 (4.572)	lr 0.04899
Warmup Train [4][2040/3239]	Time 0.497 (0.511)	Data 0.001 (0.010)	Loss 6.2275 (6.2979)	Top-1 acc 0.391 (1.133)	Top-5 acc 3.906 (4.577)	lr 0.04899
Warmup Train [4][2050/3239]	Time 0.561 (0.511)	Data 0.001 (0.010)	Loss 6.2345 (6.2976)	Top-1 acc 1.562 (1.133)	Top-5 acc 4.297 (4.580)	lr 0.04899
Warmup Train [4][2060/3239]	Time 0.677 (0.511)	Data 0.002 (0.010)	Loss 6.2429 (6.2973)	Top-1 acc 0.781 (1.133)	Top-5 acc 2.734 (4.582)	lr 0.04899
Warmup Train [4][2070/3239]	Time 0.528 (0.511)	Data 0.001 (0.010)	Loss 6.2351 (6.2970)	Top-1 acc 1.953 (1.135)	Top-5 acc 4.688 (4.590)	lr 0.04899
Warmup Train [4][2080/3239]	Time 0.391 (0.511)	Data 0.001 (0.010)	Loss 6.0709 (6.2966)	Top-1 acc 1.562 (1.136)	Top-5 acc 8.203 (4.592)	lr 0.04898
Warmup Train [4][2090/3239]	Time 0.553 (0.511)	Data 0.001 (0.010)	Loss 6.2939 (6.2962)	Top-1 acc 0.391 (1.135)	Top-5 acc 5.859 (4.592)	lr 0.04898
Warmup Train [4][2100/3239]	Time 0.462 (0.511)	Data 0.001 (0.010)	Loss 6.3518 (6.2961)	Top-1 acc 1.562 (1.135)	Top-5 acc 6.641 (4.598)	lr 0.04898
Warmup Train [4][2110/3239]	Time 0.564 (0.511)	Data 0.001 (0.010)	Loss 6.2228 (6.2959)	Top-1 acc 1.953 (1.136)	Top-5 acc 5.469 (4.599)	lr 0.04898
Warmup Train [4][2120/3239]	Time 0.619 (0.511)	Data 0.001 (0.010)	Loss 6.2455 (6.2956)	Top-1 acc 0.781 (1.137)	Top-5 acc 2.734 (4.602)	lr 0.04898
Warmup Train [4][2130/3239]	Time 0.428 (0.511)	Data 0.001 (0.010)	Loss 6.2540 (6.2953)	Top-1 acc 0.000 (1.137)	Top-5 acc 4.297 (4.606)	lr 0.04898
Warmup Train [4][2140/3239]	Time 0.514 (0.511)	Data 0.001 (0.010)	Loss 6.2194 (6.2951)	Top-1 acc 2.344 (1.140)	Top-5 acc 4.688 (4.608)	lr 0.04897
Warmup Train [4][2150/3239]	Time 0.560 (0.511)	Data 0.001 (0.010)	Loss 6.2648 (6.2948)	Top-1 acc 1.562 (1.140)	Top-5 acc 5.859 (4.611)	lr 0.04897
Warmup Train [4][2160/3239]	Time 0.448 (0.511)	Data 0.001 (0.010)	Loss 6.3079 (6.2946)	Top-1 acc 0.781 (1.142)	Top-5 acc 4.297 (4.612)	lr 0.04897
Warmup Train [4][2170/3239]	Time 0.564 (0.511)	Data 0.002 (0.010)	Loss 6.2341 (6.2942)	Top-1 acc 1.172 (1.144)	Top-5 acc 4.297 (4.617)	lr 0.04897
Warmup Train [4][2180/3239]	Time 0.560 (0.511)	Data 0.001 (0.010)	Loss 6.1611 (6.2939)	Top-1 acc 2.344 (1.144)	Top-5 acc 4.297 (4.617)	lr 0.04897
Warmup Train [4][2190/3239]	Time 0.545 (0.511)	Data 0.001 (0.010)	Loss 6.2591 (6.2936)	Top-1 acc 0.781 (1.146)	Top-5 acc 5.078 (4.620)	lr 0.04897
Warmup Train [4][2200/3239]	Time 0.658 (0.511)	Data 0.001 (0.010)	Loss 6.1896 (6.2932)	Top-1 acc 1.172 (1.146)	Top-5 acc 5.078 (4.623)	lr 0.04896
Warmup Train [4][2210/3239]	Time 0.547 (0.511)	Data 0.001 (0.010)	Loss 6.2897 (6.2929)	Top-1 acc 0.391 (1.147)	Top-5 acc 3.516 (4.627)	lr 0.04896
Warmup Train [4][2220/3239]	Time 0.409 (0.511)	Data 0.001 (0.010)	Loss 6.2190 (6.2926)	Top-1 acc 1.562 (1.148)	Top-5 acc 4.297 (4.629)	lr 0.04896
Warmup Train [4][2230/3239]	Time 0.582 (0.511)	Data 0.001 (0.010)	Loss 6.1996 (6.2924)	Top-1 acc 1.172 (1.147)	Top-5 acc 4.688 (4.631)	lr 0.04896
Warmup Train [4][2240/3239]	Time 0.622 (0.511)	Data 0.001 (0.010)	Loss 6.1646 (6.2921)	Top-1 acc 1.172 (1.149)	Top-5 acc 6.250 (4.632)	lr 0.04896
Warmup Train [4][2250/3239]	Time 0.517 (0.511)	Data 0.001 (0.009)	Loss 6.0881 (6.2918)	Top-1 acc 0.000 (1.148)	Top-5 acc 6.641 (4.632)	lr 0.04895
Warmup Train [4][2260/3239]	Time 0.417 (0.511)	Data 0.001 (0.009)	Loss 6.1959 (6.2914)	Top-1 acc 1.953 (1.150)	Top-5 acc 10.156 (4.639)	lr 0.04895
Warmup Train [4][2270/3239]	Time 0.595 (0.511)	Data 0.001 (0.009)	Loss 6.1613 (6.2911)	Top-1 acc 1.953 (1.152)	Top-5 acc 5.859 (4.645)	lr 0.04895
Warmup Train [4][2280/3239]	Time 0.426 (0.511)	Data 0.001 (0.009)	Loss 6.2504 (6.2908)	Top-1 acc 1.172 (1.152)	Top-5 acc 4.297 (4.645)	lr 0.04895
Warmup Train [4][2290/3239]	Time 0.410 (0.511)	Data 0.001 (0.009)	Loss 6.2348 (6.2905)	Top-1 acc 0.781 (1.154)	Top-5 acc 5.469 (4.650)	lr 0.04895
Warmup Train [4][2300/3239]	Time 0.481 (0.511)	Data 0.001 (0.009)	Loss 6.1201 (6.2901)	Top-1 acc 3.125 (1.156)	Top-5 acc 10.156 (4.659)	lr 0.04895
Warmup Train [4][2310/3239]	Time 0.557 (0.511)	Data 0.001 (0.009)	Loss 6.2864 (6.2897)	Top-1 acc 1.172 (1.157)	Top-5 acc 3.516 (4.665)	lr 0.04894
Warmup Train [4][2320/3239]	Time 0.673 (0.510)	Data 0.001 (0.009)	Loss 6.2213 (6.2894)	Top-1 acc 1.953 (1.160)	Top-5 acc 5.078 (4.669)	lr 0.04894
Warmup Train [4][2330/3239]	Time 0.742 (0.510)	Data 0.001 (0.009)	Loss 6.2678 (6.2890)	Top-1 acc 1.562 (1.161)	Top-5 acc 5.078 (4.673)	lr 0.04894
Warmup Train [4][2340/3239]	Time 0.385 (0.510)	Data 0.001 (0.009)	Loss 6.2910 (6.2888)	Top-1 acc 1.562 (1.161)	Top-5 acc 3.516 (4.673)	lr 0.04894
Warmup Train [4][2350/3239]	Time 0.467 (0.510)	Data 0.001 (0.009)	Loss 6.1500 (6.2886)	Top-1 acc 1.172 (1.161)	Top-5 acc 7.031 (4.675)	lr 0.04894
Warmup Train [4][2360/3239]	Time 0.497 (0.510)	Data 0.001 (0.009)	Loss 6.1675 (6.2882)	Top-1 acc 1.172 (1.162)	Top-5 acc 4.688 (4.677)	lr 0.04894
Warmup Train [4][2370/3239]	Time 0.384 (0.510)	Data 0.001 (0.009)	Loss 6.1938 (6.2880)	Top-1 acc 0.781 (1.161)	Top-5 acc 5.078 (4.678)	lr 0.04893
Warmup Train [4][2380/3239]	Time 0.483 (0.511)	Data 0.002 (0.009)	Loss 6.2825 (6.2877)	Top-1 acc 0.781 (1.161)	Top-5 acc 4.688 (4.682)	lr 0.04893
Warmup Train [4][2390/3239]	Time 0.556 (0.511)	Data 0.001 (0.009)	Loss 6.2157 (6.2873)	Top-1 acc 1.953 (1.162)	Top-5 acc 4.297 (4.687)	lr 0.04893
Warmup Train [4][2400/3239]	Time 0.550 (0.511)	Data 0.001 (0.009)	Loss 6.1464 (6.2871)	Top-1 acc 2.344 (1.164)	Top-5 acc 8.594 (4.689)	lr 0.04893
Warmup Train [4][2410/3239]	Time 0.436 (0.511)	Data 0.001 (0.009)	Loss 6.1587 (6.2867)	Top-1 acc 2.344 (1.165)	Top-5 acc 4.688 (4.691)	lr 0.04893
Warmup Train [4][2420/3239]	Time 0.578 (0.511)	Data 0.001 (0.009)	Loss 6.1954 (6.2863)	Top-1 acc 1.172 (1.167)	Top-5 acc 6.250 (4.700)	lr 0.04893
Warmup Train [4][2430/3239]	Time 0.676 (0.511)	Data 0.001 (0.009)	Loss 6.1335 (6.2860)	Top-1 acc 1.562 (1.167)	Top-5 acc 5.469 (4.704)	lr 0.04892
Warmup Train [4][2440/3239]	Time 0.760 (0.511)	Data 0.001 (0.009)	Loss 6.2063 (6.2858)	Top-1 acc 1.172 (1.167)	Top-5 acc 4.688 (4.708)	lr 0.04892
Warmup Train [4][2450/3239]	Time 0.633 (0.511)	Data 0.001 (0.009)	Loss 6.1741 (6.2854)	Top-1 acc 1.172 (1.167)	Top-5 acc 5.859 (4.710)	lr 0.04892
Warmup Train [4][2460/3239]	Time 0.547 (0.511)	Data 0.001 (0.009)	Loss 6.2197 (6.2851)	Top-1 acc 1.172 (1.169)	Top-5 acc 5.078 (4.711)	lr 0.04892
Warmup Train [4][2470/3239]	Time 0.381 (0.511)	Data 0.001 (0.009)	Loss 6.2202 (6.2847)	Top-1 acc 1.953 (1.171)	Top-5 acc 5.469 (4.715)	lr 0.04892
Warmup Train [4][2480/3239]	Time 0.397 (0.511)	Data 0.001 (0.009)	Loss 6.2237 (6.2843)	Top-1 acc 0.391 (1.171)	Top-5 acc 4.297 (4.718)	lr 0.04891
Warmup Train [4][2490/3239]	Time 0.457 (0.511)	Data 0.001 (0.009)	Loss 6.1400 (6.2840)	Top-1 acc 2.344 (1.172)	Top-5 acc 5.859 (4.719)	lr 0.04891
Warmup Train [4][2500/3239]	Time 0.516 (0.511)	Data 0.001 (0.009)	Loss 6.2588 (6.2837)	Top-1 acc 1.172 (1.172)	Top-5 acc 5.078 (4.722)	lr 0.04891
Warmup Train [4][2510/3239]	Time 0.585 (0.511)	Data 0.001 (0.009)	Loss 6.1843 (6.2834)	Top-1 acc 2.734 (1.175)	Top-5 acc 7.422 (4.727)	lr 0.04891
Warmup Train [4][2520/3239]	Time 0.678 (0.511)	Data 0.001 (0.009)	Loss 6.2855 (6.2831)	Top-1 acc 1.953 (1.178)	Top-5 acc 4.297 (4.731)	lr 0.04891
Warmup Train [4][2530/3239]	Time 0.518 (0.511)	Data 0.001 (0.009)	Loss 6.2084 (6.2828)	Top-1 acc 0.781 (1.179)	Top-5 acc 2.734 (4.736)	lr 0.04891
Warmup Train [4][2540/3239]	Time 0.414 (0.511)	Data 0.001 (0.009)	Loss 6.2630 (6.2826)	Top-1 acc 2.734 (1.180)	Top-5 acc 4.688 (4.735)	lr 0.04890
Warmup Train [4][2550/3239]	Time 0.472 (0.511)	Data 0.001 (0.009)	Loss 6.1904 (6.2822)	Top-1 acc 2.734 (1.181)	Top-5 acc 8.203 (4.739)	lr 0.04890
Warmup Train [4][2560/3239]	Time 0.560 (0.511)	Data 0.001 (0.009)	Loss 6.1731 (6.2819)	Top-1 acc 1.562 (1.181)	Top-5 acc 7.031 (4.744)	lr 0.04890
Warmup Train [4][2570/3239]	Time 0.378 (0.511)	Data 0.001 (0.009)	Loss 6.1175 (6.2815)	Top-1 acc 3.516 (1.182)	Top-5 acc 8.594 (4.751)	lr 0.04890
Warmup Train [4][2580/3239]	Time 0.363 (0.510)	Data 0.001 (0.009)	Loss 6.2112 (6.2811)	Top-1 acc 1.172 (1.183)	Top-5 acc 4.297 (4.753)	lr 0.04890
Warmup Train [4][2590/3239]	Time 0.288 (0.510)	Data 0.001 (0.009)	Loss 6.1686 (6.2808)	Top-1 acc 2.344 (1.186)	Top-5 acc 7.422 (4.762)	lr 0.04890
Warmup Train [4][2600/3239]	Time 0.507 (0.510)	Data 0.001 (0.009)	Loss 6.1298 (6.2804)	Top-1 acc 2.344 (1.188)	Top-5 acc 7.031 (4.768)	lr 0.04889
Warmup Train [4][2610/3239]	Time 0.438 (0.510)	Data 0.001 (0.009)	Loss 6.1957 (6.2800)	Top-1 acc 1.562 (1.188)	Top-5 acc 6.641 (4.772)	lr 0.04889
Warmup Train [4][2620/3239]	Time 0.567 (0.510)	Data 0.001 (0.009)	Loss 6.1940 (6.2796)	Top-1 acc 1.172 (1.189)	Top-5 acc 7.812 (4.778)	lr 0.04889
Warmup Train [4][2630/3239]	Time 0.456 (0.510)	Data 0.001 (0.009)	Loss 6.2739 (6.2793)	Top-1 acc 0.391 (1.189)	Top-5 acc 5.078 (4.780)	lr 0.04889
Warmup Train [4][2640/3239]	Time 0.519 (0.511)	Data 0.001 (0.009)	Loss 6.2722 (6.2790)	Top-1 acc 1.172 (1.191)	Top-5 acc 3.516 (4.782)	lr 0.04889
Warmup Train [4][2650/3239]	Time 0.481 (0.511)	Data 0.001 (0.009)	Loss 6.2653 (6.2787)	Top-1 acc 0.391 (1.192)	Top-5 acc 5.078 (4.784)	lr 0.04888
Warmup Train [4][2660/3239]	Time 0.529 (0.511)	Data 0.001 (0.009)	Loss 6.1619 (6.2784)	Top-1 acc 1.562 (1.192)	Top-5 acc 8.203 (4.787)	lr 0.04888
Warmup Train [4][2670/3239]	Time 0.484 (0.511)	Data 0.001 (0.009)	Loss 6.2261 (6.2781)	Top-1 acc 0.781 (1.193)	Top-5 acc 5.469 (4.790)	lr 0.04888
Warmup Train [4][2680/3239]	Time 0.641 (0.511)	Data 0.001 (0.009)	Loss 6.2030 (6.2777)	Top-1 acc 1.172 (1.195)	Top-5 acc 4.297 (4.795)	lr 0.04888
Warmup Train [4][2690/3239]	Time 0.636 (0.511)	Data 0.001 (0.009)	Loss 6.1372 (6.2773)	Top-1 acc 1.172 (1.196)	Top-5 acc 7.812 (4.798)	lr 0.04888
Warmup Train [4][2700/3239]	Time 0.611 (0.511)	Data 0.001 (0.009)	Loss 6.1227 (6.2770)	Top-1 acc 1.172 (1.197)	Top-5 acc 6.641 (4.802)	lr 0.04888
Warmup Train [4][2710/3239]	Time 0.640 (0.511)	Data 0.001 (0.009)	Loss 6.1598 (6.2766)	Top-1 acc 1.953 (1.199)	Top-5 acc 7.812 (4.806)	lr 0.04887
Warmup Train [4][2720/3239]	Time 0.487 (0.511)	Data 0.001 (0.009)	Loss 6.1889 (6.2763)	Top-1 acc 1.562 (1.199)	Top-5 acc 3.906 (4.808)	lr 0.04887
Warmup Train [4][2730/3239]	Time 0.527 (0.511)	Data 0.001 (0.009)	Loss 6.1330 (6.2759)	Top-1 acc 1.953 (1.199)	Top-5 acc 7.422 (4.812)	lr 0.04887
Warmup Train [4][2740/3239]	Time 0.455 (0.511)	Data 0.001 (0.009)	Loss 6.2263 (6.2755)	Top-1 acc 1.562 (1.200)	Top-5 acc 5.469 (4.817)	lr 0.04887
Warmup Train [4][2750/3239]	Time 0.601 (0.511)	Data 0.001 (0.009)	Loss 6.1195 (6.2752)	Top-1 acc 1.953 (1.200)	Top-5 acc 6.641 (4.821)	lr 0.04887
Warmup Train [4][2760/3239]	Time 0.439 (0.511)	Data 0.001 (0.009)	Loss 6.1955 (6.2749)	Top-1 acc 0.781 (1.200)	Top-5 acc 4.297 (4.823)	lr 0.04886
Warmup Train [4][2770/3239]	Time 0.510 (0.511)	Data 0.002 (0.009)	Loss 6.2237 (6.2747)	Top-1 acc 0.781 (1.202)	Top-5 acc 3.906 (4.826)	lr 0.04886
Warmup Train [4][2780/3239]	Time 0.483 (0.511)	Data 0.001 (0.009)	Loss 6.2501 (6.2744)	Top-1 acc 1.172 (1.203)	Top-5 acc 3.906 (4.830)	lr 0.04886
Warmup Train [4][2790/3239]	Time 0.500 (0.511)	Data 0.001 (0.009)	Loss 6.1250 (6.2740)	Top-1 acc 2.344 (1.204)	Top-5 acc 5.859 (4.834)	lr 0.04886
Warmup Train [4][2800/3239]	Time 0.384 (0.511)	Data 0.001 (0.009)	Loss 6.1113 (6.2737)	Top-1 acc 3.125 (1.206)	Top-5 acc 7.812 (4.836)	lr 0.04886
Warmup Train [4][2810/3239]	Time 0.362 (0.511)	Data 0.001 (0.009)	Loss 6.1877 (6.2734)	Top-1 acc 0.781 (1.207)	Top-5 acc 4.688 (4.842)	lr 0.04886
Warmup Train [4][2820/3239]	Time 0.467 (0.511)	Data 0.001 (0.009)	Loss 6.1502 (6.2730)	Top-1 acc 0.391 (1.208)	Top-5 acc 5.469 (4.845)	lr 0.04885
Warmup Train [4][2830/3239]	Time 0.552 (0.511)	Data 0.001 (0.009)	Loss 6.2401 (6.2727)	Top-1 acc 0.000 (1.208)	Top-5 acc 3.906 (4.850)	lr 0.04885
Warmup Train [4][2840/3239]	Time 0.699 (0.511)	Data 0.001 (0.009)	Loss 6.1559 (6.2724)	Top-1 acc 1.953 (1.210)	Top-5 acc 6.250 (4.855)	lr 0.04885
Warmup Train [4][2850/3239]	Time 0.603 (0.510)	Data 0.001 (0.009)	Loss 6.1423 (6.2721)	Top-1 acc 3.516 (1.211)	Top-5 acc 8.203 (4.859)	lr 0.04885
Warmup Train [4][2860/3239]	Time 0.528 (0.510)	Data 0.001 (0.009)	Loss 6.2615 (6.2718)	Top-1 acc 0.781 (1.212)	Top-5 acc 5.469 (4.863)	lr 0.04885
Warmup Train [4][2870/3239]	Time 0.457 (0.510)	Data 0.001 (0.009)	Loss 6.1895 (6.2715)	Top-1 acc 1.172 (1.213)	Top-5 acc 8.203 (4.869)	lr 0.04884
Warmup Train [4][2880/3239]	Time 0.614 (0.510)	Data 0.001 (0.009)	Loss 6.0827 (6.2712)	Top-1 acc 1.953 (1.214)	Top-5 acc 8.594 (4.874)	lr 0.04884
Warmup Train [4][2890/3239]	Time 0.585 (0.510)	Data 0.001 (0.009)	Loss 6.2682 (6.2710)	Top-1 acc 0.391 (1.215)	Top-5 acc 4.688 (4.876)	lr 0.04884
Warmup Train [4][2900/3239]	Time 0.530 (0.510)	Data 0.001 (0.009)	Loss 6.1573 (6.2707)	Top-1 acc 1.562 (1.215)	Top-5 acc 7.031 (4.877)	lr 0.04884
Warmup Train [4][2910/3239]	Time 0.407 (0.510)	Data 0.001 (0.009)	Loss 6.1448 (6.2704)	Top-1 acc 1.172 (1.216)	Top-5 acc 4.688 (4.879)	lr 0.04884
Warmup Train [4][2920/3239]	Time 0.368 (0.510)	Data 0.001 (0.009)	Loss 6.2494 (6.2701)	Top-1 acc 1.562 (1.218)	Top-5 acc 5.859 (4.882)	lr 0.04884
Warmup Train [4][2930/3239]	Time 0.641 (0.510)	Data 0.001 (0.009)	Loss 6.1330 (6.2698)	Top-1 acc 0.000 (1.218)	Top-5 acc 4.688 (4.886)	lr 0.04883
Warmup Train [4][2940/3239]	Time 0.424 (0.510)	Data 0.001 (0.009)	Loss 6.2302 (6.2695)	Top-1 acc 0.000 (1.219)	Top-5 acc 2.734 (4.889)	lr 0.04883
Warmup Train [4][2950/3239]	Time 0.400 (0.510)	Data 0.001 (0.009)	Loss 6.2042 (6.2693)	Top-1 acc 1.953 (1.219)	Top-5 acc 5.859 (4.891)	lr 0.04883
Warmup Train [4][2960/3239]	Time 0.490 (0.510)	Data 0.001 (0.009)	Loss 6.2395 (6.2690)	Top-1 acc 1.953 (1.221)	Top-5 acc 5.469 (4.897)	lr 0.04883
Warmup Train [4][2970/3239]	Time 0.536 (0.510)	Data 0.001 (0.009)	Loss 6.1878 (6.2686)	Top-1 acc 0.391 (1.222)	Top-5 acc 5.078 (4.901)	lr 0.04883
Warmup Train [4][2980/3239]	Time 0.492 (0.510)	Data 0.001 (0.009)	Loss 6.2010 (6.2683)	Top-1 acc 2.344 (1.222)	Top-5 acc 7.812 (4.905)	lr 0.04882
Warmup Train [4][2990/3239]	Time 0.529 (0.510)	Data 0.001 (0.009)	Loss 6.1015 (6.2680)	Top-1 acc 0.391 (1.223)	Top-5 acc 5.469 (4.910)	lr 0.04882
Warmup Train [4][3000/3239]	Time 0.400 (0.510)	Data 0.001 (0.009)	Loss 6.1322 (6.2677)	Top-1 acc 0.391 (1.222)	Top-5 acc 6.641 (4.915)	lr 0.04882
Warmup Train [4][3010/3239]	Time 0.567 (0.510)	Data 0.001 (0.009)	Loss 6.1418 (6.2673)	Top-1 acc 0.781 (1.223)	Top-5 acc 6.641 (4.920)	lr 0.04882
Warmup Train [4][3020/3239]	Time 0.483 (0.510)	Data 0.001 (0.009)	Loss 6.2503 (6.2670)	Top-1 acc 1.953 (1.224)	Top-5 acc 7.422 (4.923)	lr 0.04882
Warmup Train [4][3030/3239]	Time 0.521 (0.510)	Data 0.001 (0.009)	Loss 6.1585 (6.2667)	Top-1 acc 2.344 (1.225)	Top-5 acc 7.812 (4.926)	lr 0.04882
Warmup Train [4][3040/3239]	Time 0.567 (0.510)	Data 0.001 (0.009)	Loss 6.1579 (6.2664)	Top-1 acc 1.953 (1.226)	Top-5 acc 5.078 (4.928)	lr 0.04881
Warmup Train [4][3050/3239]	Time 0.586 (0.511)	Data 0.001 (0.009)	Loss 6.1992 (6.2661)	Top-1 acc 2.344 (1.227)	Top-5 acc 5.469 (4.931)	lr 0.04881
Warmup Train [4][3060/3239]	Time 0.697 (0.511)	Data 0.002 (0.009)	Loss 6.1888 (6.2659)	Top-1 acc 1.562 (1.226)	Top-5 acc 4.688 (4.934)	lr 0.04881
Warmup Train [4][3070/3239]	Time 0.194 (0.510)	Data 0.001 (0.009)	Loss 6.1811 (6.2655)	Top-1 acc 0.781 (1.227)	Top-5 acc 4.297 (4.936)	lr 0.04881
Warmup Train [4][3080/3239]	Time 0.354 (0.510)	Data 0.001 (0.009)	Loss 6.1517 (6.2652)	Top-1 acc 1.953 (1.227)	Top-5 acc 3.906 (4.936)	lr 0.04881
Warmup Train [4][3090/3239]	Time 0.220 (0.510)	Data 0.001 (0.009)	Loss 6.2586 (6.2649)	Top-1 acc 1.562 (1.230)	Top-5 acc 4.688 (4.941)	lr 0.04880
Warmup Train [4][3100/3239]	Time 0.502 (0.510)	Data 0.001 (0.009)	Loss 6.1658 (6.2645)	Top-1 acc 0.391 (1.232)	Top-5 acc 5.078 (4.946)	lr 0.04880
Warmup Train [4][3110/3239]	Time 0.556 (0.510)	Data 0.001 (0.009)	Loss 6.1898 (6.2641)	Top-1 acc 0.781 (1.233)	Top-5 acc 5.078 (4.948)	lr 0.04880
Warmup Train [4][3120/3239]	Time 0.473 (0.510)	Data 0.001 (0.009)	Loss 6.1991 (6.2639)	Top-1 acc 1.172 (1.233)	Top-5 acc 6.641 (4.951)	lr 0.04880
Warmup Train [4][3130/3239]	Time 0.404 (0.510)	Data 0.001 (0.009)	Loss 6.1304 (6.2636)	Top-1 acc 1.953 (1.233)	Top-5 acc 5.469 (4.953)	lr 0.04880
Warmup Train [4][3140/3239]	Time 0.559 (0.510)	Data 0.001 (0.009)	Loss 6.0546 (6.2632)	Top-1 acc 0.781 (1.234)	Top-5 acc 6.641 (4.956)	lr 0.04880
Warmup Train [4][3150/3239]	Time 0.680 (0.510)	Data 0.001 (0.009)	Loss 6.1962 (6.2629)	Top-1 acc 0.391 (1.234)	Top-5 acc 4.297 (4.958)	lr 0.04879
Warmup Train [4][3160/3239]	Time 0.566 (0.510)	Data 0.001 (0.009)	Loss 6.1844 (6.2626)	Top-1 acc 2.344 (1.236)	Top-5 acc 6.250 (4.960)	lr 0.04879
Warmup Train [4][3170/3239]	Time 0.650 (0.510)	Data 0.001 (0.009)	Loss 6.1668 (6.2624)	Top-1 acc 0.781 (1.236)	Top-5 acc 5.078 (4.960)	lr 0.04879
Warmup Train [4][3180/3239]	Time 0.520 (0.510)	Data 0.000 (0.009)	Loss 6.0988 (6.2620)	Top-1 acc 2.734 (1.236)	Top-5 acc 7.812 (4.964)	lr 0.04879
Warmup Train [4][3190/3239]	Time 0.421 (0.510)	Data 0.000 (0.008)	Loss 6.1276 (6.2617)	Top-1 acc 1.562 (1.238)	Top-5 acc 6.250 (4.968)	lr 0.04879
Warmup Train [4][3200/3239]	Time 0.383 (0.510)	Data 0.000 (0.008)	Loss 6.1056 (6.2614)	Top-1 acc 2.344 (1.239)	Top-5 acc 6.641 (4.973)	lr 0.04878
Warmup Train [4][3210/3239]	Time 0.615 (0.510)	Data 0.000 (0.009)	Loss 6.1485 (6.2611)	Top-1 acc 1.562 (1.241)	Top-5 acc 7.031 (4.975)	lr 0.04878
Warmup Train [4][3220/3239]	Time 0.380 (0.510)	Data 0.000 (0.008)	Loss 6.2338 (6.2608)	Top-1 acc 0.781 (1.241)	Top-5 acc 5.469 (4.981)	lr 0.04878
Warmup Train [4][3230/3239]	Time 0.492 (0.510)	Data 0.000 (0.008)	Loss 6.1221 (6.2605)	Top-1 acc 2.734 (1.243)	Top-5 acc 8.984 (4.986)	lr 0.04878
Warmup Train [4][3239/3239]	Time 0.983 (0.510)	Data 0.000 (0.008)	Loss 6.2244 (6.2602)	Top-1 acc 2.469 (1.244)	Top-5 acc 7.407 (4.992)	lr 0.04878
==========Warmup Valid [4/40]	loss 5.889	top-1 acc 1.950	top-5 acc 7.211	Train top-1 1.244	top-5 4.992	flops: 442.4M
Warmup Train [5][0/3239]	Time 9.315 (9.315)	Data 8.850 (8.850)	Loss 6.0997 (6.0997)	Top-1 acc 1.953 (1.953)	Top-5 acc 7.031 (7.031)	lr 0.04878
Warmup Train [5][10/3239]	Time 0.543 (1.444)	Data 0.002 (0.867)	Loss 6.1122 (6.1598)	Top-1 acc 1.562 (1.989)	Top-5 acc 5.859 (6.072)	lr 0.04877
Warmup Train [5][20/3239]	Time 0.482 (1.004)	Data 0.001 (0.456)	Loss 6.0832 (6.1528)	Top-1 acc 1.172 (1.562)	Top-5 acc 8.203 (5.934)	lr 0.04877
Warmup Train [5][30/3239]	Time 0.389 (0.844)	Data 0.001 (0.309)	Loss 6.1135 (6.1562)	Top-1 acc 1.562 (1.600)	Top-5 acc 8.984 (5.948)	lr 0.04877
Warmup Train [5][40/3239]	Time 0.673 (0.768)	Data 0.001 (0.238)	Loss 6.1103 (6.1528)	Top-1 acc 1.172 (1.677)	Top-5 acc 6.641 (6.298)	lr 0.04877
Warmup Train [5][50/3239]	Time 0.394 (0.715)	Data 0.001 (0.191)	Loss 6.1905 (6.1532)	Top-1 acc 0.781 (1.647)	Top-5 acc 7.422 (6.327)	lr 0.04877
Warmup Train [5][60/3239]	Time 0.554 (0.683)	Data 0.001 (0.161)	Loss 6.0872 (6.1518)	Top-1 acc 1.172 (1.633)	Top-5 acc 7.812 (6.333)	lr 0.04877
Warmup Train [5][70/3239]	Time 0.706 (0.660)	Data 0.001 (0.139)	Loss 6.1603 (6.1476)	Top-1 acc 2.344 (1.651)	Top-5 acc 7.422 (6.448)	lr 0.04876
Warmup Train [5][80/3239]	Time 0.495 (0.640)	Data 0.001 (0.122)	Loss 6.1155 (6.1458)	Top-1 acc 0.781 (1.611)	Top-5 acc 8.594 (6.506)	lr 0.04876
Warmup Train [5][90/3239]	Time 0.494 (0.626)	Data 0.001 (0.109)	Loss 6.0616 (6.1459)	Top-1 acc 3.125 (1.601)	Top-5 acc 9.375 (6.456)	lr 0.04876
Warmup Train [5][100/3239]	Time 0.521 (0.617)	Data 0.001 (0.098)	Loss 6.1332 (6.1410)	Top-1 acc 0.000 (1.609)	Top-5 acc 7.031 (6.548)	lr 0.04876
Warmup Train [5][110/3239]	Time 0.359 (0.607)	Data 0.001 (0.090)	Loss 6.2639 (6.1453)	Top-1 acc 1.172 (1.587)	Top-5 acc 3.906 (6.542)	lr 0.04876
Warmup Train [5][120/3239]	Time 0.514 (0.599)	Data 0.001 (0.083)	Loss 6.0824 (6.1458)	Top-1 acc 0.781 (1.611)	Top-5 acc 7.031 (6.486)	lr 0.04875
Warmup Train [5][130/3239]	Time 0.584 (0.593)	Data 0.001 (0.077)	Loss 6.2178 (6.1495)	Top-1 acc 1.953 (1.601)	Top-5 acc 6.641 (6.408)	lr 0.04875
Warmup Train [5][140/3239]	Time 0.424 (0.588)	Data 0.001 (0.071)	Loss 6.1650 (6.1495)	Top-1 acc 1.562 (1.612)	Top-5 acc 8.594 (6.411)	lr 0.04875
Warmup Train [5][150/3239]	Time 0.521 (0.583)	Data 0.001 (0.068)	Loss 6.2144 (6.1495)	Top-1 acc 0.781 (1.604)	Top-5 acc 4.297 (6.405)	lr 0.04875
Warmup Train [5][160/3239]	Time 0.489 (0.580)	Data 0.002 (0.064)	Loss 6.1463 (6.1486)	Top-1 acc 2.344 (1.601)	Top-5 acc 7.812 (6.434)	lr 0.04875
Warmup Train [5][170/3239]	Time 0.550 (0.576)	Data 0.001 (0.060)	Loss 6.1428 (6.1484)	Top-1 acc 1.953 (1.590)	Top-5 acc 5.859 (6.424)	lr 0.04874
Warmup Train [5][180/3239]	Time 0.651 (0.573)	Data 0.001 (0.057)	Loss 6.1404 (6.1486)	Top-1 acc 1.172 (1.586)	Top-5 acc 7.422 (6.468)	lr 0.04874
Warmup Train [5][190/3239]	Time 0.425 (0.569)	Data 0.001 (0.055)	Loss 6.1593 (6.1484)	Top-1 acc 1.953 (1.595)	Top-5 acc 6.641 (6.477)	lr 0.04874
Warmup Train [5][200/3239]	Time 0.401 (0.567)	Data 0.001 (0.052)	Loss 6.1575 (6.1476)	Top-1 acc 2.344 (1.607)	Top-5 acc 6.250 (6.507)	lr 0.04874
Warmup Train [5][210/3239]	Time 0.504 (0.565)	Data 0.001 (0.050)	Loss 6.1538 (6.1472)	Top-1 acc 0.781 (1.585)	Top-5 acc 3.516 (6.454)	lr 0.04874
Warmup Train [5][220/3239]	Time 0.667 (0.562)	Data 0.001 (0.048)	Loss 6.2456 (6.1481)	Top-1 acc 0.391 (1.564)	Top-5 acc 2.344 (6.404)	lr 0.04873
Warmup Train [5][230/3239]	Time 0.545 (0.559)	Data 0.001 (0.046)	Loss 6.1204 (6.1491)	Top-1 acc 3.125 (1.564)	Top-5 acc 9.766 (6.382)	lr 0.04873
Warmup Train [5][240/3239]	Time 0.521 (0.555)	Data 0.001 (0.045)	Loss 6.0578 (6.1492)	Top-1 acc 1.562 (1.579)	Top-5 acc 6.250 (6.393)	lr 0.04873
Warmup Train [5][250/3239]	Time 0.472 (0.553)	Data 0.001 (0.043)	Loss 6.0949 (6.1486)	Top-1 acc 0.781 (1.573)	Top-5 acc 7.031 (6.401)	lr 0.04873
Warmup Train [5][260/3239]	Time 0.591 (0.551)	Data 0.002 (0.041)	Loss 6.2279 (6.1481)	Top-1 acc 1.172 (1.576)	Top-5 acc 4.688 (6.386)	lr 0.04873
Warmup Train [5][270/3239]	Time 0.580 (0.549)	Data 0.001 (0.040)	Loss 6.1242 (6.1478)	Top-1 acc 1.953 (1.570)	Top-5 acc 7.422 (6.370)	lr 0.04873
Warmup Train [5][280/3239]	Time 0.419 (0.547)	Data 0.001 (0.039)	Loss 6.0921 (6.1482)	Top-1 acc 1.953 (1.571)	Top-5 acc 6.641 (6.368)	lr 0.04872
Warmup Train [5][290/3239]	Time 0.481 (0.545)	Data 0.001 (0.038)	Loss 6.1331 (6.1482)	Top-1 acc 3.516 (1.577)	Top-5 acc 8.203 (6.371)	lr 0.04872
Warmup Train [5][300/3239]	Time 0.467 (0.544)	Data 0.001 (0.036)	Loss 6.1515 (6.1476)	Top-1 acc 1.562 (1.579)	Top-5 acc 7.031 (6.399)	lr 0.04872
Warmup Train [5][310/3239]	Time 0.479 (0.543)	Data 0.001 (0.035)	Loss 6.1525 (6.1468)	Top-1 acc 1.953 (1.581)	Top-5 acc 7.031 (6.423)	lr 0.04872
Warmup Train [5][320/3239]	Time 0.565 (0.542)	Data 0.001 (0.034)	Loss 6.0527 (6.1465)	Top-1 acc 1.562 (1.581)	Top-5 acc 8.594 (6.446)	lr 0.04872
Warmup Train [5][330/3239]	Time 0.472 (0.540)	Data 0.001 (0.034)	Loss 6.1895 (6.1465)	Top-1 acc 1.953 (1.586)	Top-5 acc 4.688 (6.447)	lr 0.04871
Warmup Train [5][340/3239]	Time 0.533 (0.539)	Data 0.001 (0.033)	Loss 6.2202 (6.1463)	Top-1 acc 1.562 (1.589)	Top-5 acc 6.641 (6.454)	lr 0.04871
Warmup Train [5][350/3239]	Time 0.438 (0.539)	Data 0.001 (0.032)	Loss 6.1653 (6.1457)	Top-1 acc 1.953 (1.598)	Top-5 acc 4.688 (6.455)	lr 0.04871
Warmup Train [5][360/3239]	Time 0.602 (0.538)	Data 0.001 (0.032)	Loss 6.1728 (6.1452)	Top-1 acc 1.562 (1.586)	Top-5 acc 8.203 (6.449)	lr 0.04871
Warmup Train [5][370/3239]	Time 0.469 (0.538)	Data 0.001 (0.031)	Loss 6.0527 (6.1446)	Top-1 acc 2.344 (1.584)	Top-5 acc 6.250 (6.437)	lr 0.04871
Warmup Train [5][380/3239]	Time 0.470 (0.537)	Data 0.001 (0.030)	Loss 6.1425 (6.1447)	Top-1 acc 1.172 (1.575)	Top-5 acc 5.078 (6.423)	lr 0.04870
Warmup Train [5][390/3239]	Time 0.505 (0.536)	Data 0.001 (0.030)	Loss 6.1500 (6.1444)	Top-1 acc 1.172 (1.571)	Top-5 acc 3.906 (6.417)	lr 0.04870
Warmup Train [5][400/3239]	Time 0.433 (0.535)	Data 0.001 (0.029)	Loss 6.0942 (6.1438)	Top-1 acc 1.562 (1.575)	Top-5 acc 5.469 (6.420)	lr 0.04870
Warmup Train [5][410/3239]	Time 0.586 (0.535)	Data 0.001 (0.028)	Loss 6.0886 (6.1434)	Top-1 acc 1.562 (1.592)	Top-5 acc 8.203 (6.432)	lr 0.04870
Warmup Train [5][420/3239]	Time 0.397 (0.534)	Data 0.001 (0.028)	Loss 6.1287 (6.1430)	Top-1 acc 2.344 (1.605)	Top-5 acc 8.203 (6.448)	lr 0.04870
Warmup Train [5][430/3239]	Time 0.583 (0.533)	Data 0.001 (0.027)	Loss 6.1869 (6.1428)	Top-1 acc 0.781 (1.609)	Top-5 acc 5.859 (6.457)	lr 0.04869
Warmup Train [5][440/3239]	Time 0.516 (0.533)	Data 0.002 (0.027)	Loss 6.1716 (6.1414)	Top-1 acc 1.172 (1.617)	Top-5 acc 6.641 (6.479)	lr 0.04869
Warmup Train [5][450/3239]	Time 0.573 (0.533)	Data 0.001 (0.027)	Loss 6.1185 (6.1411)	Top-1 acc 1.562 (1.606)	Top-5 acc 7.812 (6.467)	lr 0.04869
Warmup Train [5][460/3239]	Time 0.438 (0.532)	Data 0.001 (0.026)	Loss 6.1651 (6.1409)	Top-1 acc 2.344 (1.609)	Top-5 acc 5.078 (6.454)	lr 0.04869
Warmup Train [5][470/3239]	Time 0.514 (0.532)	Data 0.001 (0.026)	Loss 6.1862 (6.1408)	Top-1 acc 0.781 (1.610)	Top-5 acc 5.859 (6.458)	lr 0.04869
Warmup Train [5][480/3239]	Time 0.531 (0.531)	Data 0.001 (0.025)	Loss 6.1157 (6.1401)	Top-1 acc 1.562 (1.613)	Top-5 acc 7.812 (6.484)	lr 0.04868
Warmup Train [5][490/3239]	Time 0.485 (0.530)	Data 0.001 (0.025)	Loss 6.0667 (6.1396)	Top-1 acc 0.781 (1.617)	Top-5 acc 8.203 (6.497)	lr 0.04868
Warmup Train [5][500/3239]	Time 0.541 (0.530)	Data 0.001 (0.024)	Loss 6.0345 (6.1392)	Top-1 acc 2.734 (1.627)	Top-5 acc 8.984 (6.513)	lr 0.04868
Warmup Train [5][510/3239]	Time 0.635 (0.529)	Data 0.001 (0.024)	Loss 6.0832 (6.1389)	Top-1 acc 1.172 (1.634)	Top-5 acc 4.688 (6.518)	lr 0.04868
Warmup Train [5][520/3239]	Time 0.542 (0.529)	Data 0.001 (0.024)	Loss 6.2003 (6.1387)	Top-1 acc 1.172 (1.632)	Top-5 acc 6.250 (6.521)	lr 0.04868
Warmup Train [5][530/3239]	Time 0.297 (0.527)	Data 0.003 (0.023)	Loss 6.1461 (6.1388)	Top-1 acc 1.172 (1.632)	Top-5 acc 7.422 (6.515)	lr 0.04868
Warmup Train [5][540/3239]	Time 0.541 (0.527)	Data 0.001 (0.023)	Loss 6.0976 (6.1381)	Top-1 acc 0.781 (1.634)	Top-5 acc 6.641 (6.517)	lr 0.04867
Warmup Train [5][550/3239]	Time 0.516 (0.527)	Data 0.001 (0.023)	Loss 6.0904 (6.1382)	Top-1 acc 2.734 (1.636)	Top-5 acc 7.422 (6.509)	lr 0.04867
Warmup Train [5][560/3239]	Time 0.654 (0.527)	Data 0.001 (0.023)	Loss 6.1303 (6.1383)	Top-1 acc 1.562 (1.628)	Top-5 acc 6.250 (6.493)	lr 0.04867
Warmup Train [5][570/3239]	Time 0.350 (0.526)	Data 0.001 (0.022)	Loss 6.1152 (6.1374)	Top-1 acc 2.344 (1.629)	Top-5 acc 7.812 (6.509)	lr 0.04867
Warmup Train [5][580/3239]	Time 0.535 (0.526)	Data 0.001 (0.022)	Loss 6.1033 (6.1371)	Top-1 acc 1.172 (1.628)	Top-5 acc 7.031 (6.497)	lr 0.04867
Warmup Train [5][590/3239]	Time 0.412 (0.526)	Data 0.001 (0.022)	Loss 6.0539 (6.1369)	Top-1 acc 2.734 (1.626)	Top-5 acc 8.594 (6.505)	lr 0.04866
Warmup Train [5][600/3239]	Time 0.568 (0.526)	Data 0.001 (0.022)	Loss 6.1025 (6.1366)	Top-1 acc 1.172 (1.624)	Top-5 acc 4.297 (6.509)	lr 0.04866
Warmup Train [5][610/3239]	Time 0.423 (0.525)	Data 0.001 (0.021)	Loss 5.9120 (6.1355)	Top-1 acc 2.734 (1.630)	Top-5 acc 8.984 (6.527)	lr 0.04866
Warmup Train [5][620/3239]	Time 0.432 (0.525)	Data 0.001 (0.021)	Loss 6.1308 (6.1354)	Top-1 acc 1.172 (1.633)	Top-5 acc 6.641 (6.529)	lr 0.04866
Warmup Train [5][630/3239]	Time 0.542 (0.525)	Data 0.001 (0.021)	Loss 6.0257 (6.1350)	Top-1 acc 4.688 (1.642)	Top-5 acc 9.766 (6.547)	lr 0.04866
Warmup Train [5][640/3239]	Time 0.341 (0.525)	Data 0.001 (0.021)	Loss 6.1125 (6.1352)	Top-1 acc 1.172 (1.644)	Top-5 acc 4.688 (6.547)	lr 0.04865
Warmup Train [5][650/3239]	Time 0.492 (0.524)	Data 0.001 (0.021)	Loss 6.0978 (6.1350)	Top-1 acc 2.344 (1.642)	Top-5 acc 9.375 (6.546)	lr 0.04865
Warmup Train [5][660/3239]	Time 0.624 (0.524)	Data 0.001 (0.021)	Loss 6.1818 (6.1350)	Top-1 acc 1.562 (1.643)	Top-5 acc 6.641 (6.534)	lr 0.04865
Warmup Train [5][670/3239]	Time 0.597 (0.524)	Data 0.001 (0.020)	Loss 5.9886 (6.1342)	Top-1 acc 4.688 (1.653)	Top-5 acc 8.984 (6.544)	lr 0.04865
Warmup Train [5][680/3239]	Time 0.645 (0.524)	Data 0.001 (0.020)	Loss 6.2032 (6.1339)	Top-1 acc 1.562 (1.655)	Top-5 acc 5.078 (6.553)	lr 0.04865
Warmup Train [5][690/3239]	Time 0.476 (0.524)	Data 0.001 (0.020)	Loss 6.0546 (6.1335)	Top-1 acc 1.953 (1.655)	Top-5 acc 7.422 (6.558)	lr 0.04864
Warmup Train [5][700/3239]	Time 0.521 (0.524)	Data 0.001 (0.020)	Loss 6.0277 (6.1328)	Top-1 acc 1.562 (1.655)	Top-5 acc 7.422 (6.566)	lr 0.04864
Warmup Train [5][710/3239]	Time 0.669 (0.524)	Data 0.001 (0.020)	Loss 6.0620 (6.1324)	Top-1 acc 2.344 (1.652)	Top-5 acc 7.812 (6.570)	lr 0.04864
Warmup Train [5][720/3239]	Time 0.636 (0.524)	Data 0.001 (0.019)	Loss 6.1349 (6.1322)	Top-1 acc 3.516 (1.659)	Top-5 acc 7.422 (6.572)	lr 0.04864
Warmup Train [5][730/3239]	Time 0.717 (0.524)	Data 0.001 (0.019)	Loss 6.1610 (6.1316)	Top-1 acc 1.172 (1.661)	Top-5 acc 7.422 (6.584)	lr 0.04864
Warmup Train [5][740/3239]	Time 0.536 (0.524)	Data 0.001 (0.019)	Loss 6.1651 (6.1313)	Top-1 acc 1.172 (1.667)	Top-5 acc 3.906 (6.589)	lr 0.04863
Warmup Train [5][750/3239]	Time 0.593 (0.524)	Data 0.001 (0.019)	Loss 6.1563 (6.1310)	Top-1 acc 1.953 (1.672)	Top-5 acc 7.031 (6.601)	lr 0.04863
Warmup Train [5][760/3239]	Time 0.480 (0.523)	Data 0.001 (0.019)	Loss 6.1152 (6.1312)	Top-1 acc 2.344 (1.674)	Top-5 acc 7.812 (6.610)	lr 0.04863
Warmup Train [5][770/3239]	Time 0.625 (0.523)	Data 0.001 (0.018)	Loss 6.1132 (6.1309)	Top-1 acc 0.781 (1.679)	Top-5 acc 6.250 (6.616)	lr 0.04863
Warmup Train [5][780/3239]	Time 0.554 (0.523)	Data 0.001 (0.018)	Loss 6.0837 (6.1308)	Top-1 acc 0.391 (1.681)	Top-5 acc 8.203 (6.621)	lr 0.04863
Warmup Train [5][790/3239]	Time 0.512 (0.523)	Data 0.001 (0.018)	Loss 5.9782 (6.1303)	Top-1 acc 2.734 (1.681)	Top-5 acc 10.938 (6.633)	lr 0.04862
Warmup Train [5][800/3239]	Time 0.515 (0.521)	Data 0.001 (0.018)	Loss 6.0548 (6.1299)	Top-1 acc 3.125 (1.687)	Top-5 acc 8.594 (6.646)	lr 0.04862
Warmup Train [5][810/3239]	Time 0.564 (0.521)	Data 0.001 (0.018)	Loss 6.1270 (6.1297)	Top-1 acc 2.344 (1.685)	Top-5 acc 9.766 (6.648)	lr 0.04862
Warmup Train [5][820/3239]	Time 0.350 (0.521)	Data 0.001 (0.018)	Loss 6.1421 (6.1295)	Top-1 acc 2.734 (1.690)	Top-5 acc 5.469 (6.652)	lr 0.04862
Warmup Train [5][830/3239]	Time 0.640 (0.522)	Data 0.001 (0.018)	Loss 6.0790 (6.1292)	Top-1 acc 1.172 (1.691)	Top-5 acc 5.859 (6.656)	lr 0.04862
Warmup Train [5][840/3239]	Time 0.407 (0.522)	Data 0.001 (0.017)	Loss 6.0642 (6.1286)	Top-1 acc 2.734 (1.695)	Top-5 acc 7.812 (6.668)	lr 0.04861
Warmup Train [5][850/3239]	Time 0.525 (0.521)	Data 0.002 (0.017)	Loss 6.2110 (6.1286)	Top-1 acc 1.953 (1.696)	Top-5 acc 6.641 (6.668)	lr 0.04861
Warmup Train [5][860/3239]	Time 0.425 (0.521)	Data 0.001 (0.017)	Loss 6.0912 (6.1284)	Top-1 acc 1.953 (1.691)	Top-5 acc 7.812 (6.664)	lr 0.04861
Warmup Train [5][870/3239]	Time 0.610 (0.521)	Data 0.001 (0.017)	Loss 6.1728 (6.1279)	Top-1 acc 1.562 (1.693)	Top-5 acc 5.469 (6.672)	lr 0.04861
Warmup Train [5][880/3239]	Time 0.593 (0.521)	Data 0.001 (0.017)	Loss 6.1183 (6.1278)	Top-1 acc 1.953 (1.693)	Top-5 acc 7.422 (6.667)	lr 0.04861
Warmup Train [5][890/3239]	Time 0.414 (0.521)	Data 0.001 (0.017)	Loss 6.1246 (6.1269)	Top-1 acc 0.781 (1.692)	Top-5 acc 5.078 (6.676)	lr 0.04860
Warmup Train [5][900/3239]	Time 0.349 (0.521)	Data 0.022 (0.017)	Loss 6.1125 (6.1267)	Top-1 acc 2.344 (1.693)	Top-5 acc 8.594 (6.685)	lr 0.04860
Warmup Train [5][910/3239]	Time 0.390 (0.521)	Data 0.001 (0.017)	Loss 6.0958 (6.1263)	Top-1 acc 2.344 (1.696)	Top-5 acc 7.812 (6.686)	lr 0.04860
Warmup Train [5][920/3239]	Time 0.541 (0.521)	Data 0.001 (0.017)	Loss 6.0674 (6.1256)	Top-1 acc 1.953 (1.703)	Top-5 acc 7.812 (6.694)	lr 0.04860
Warmup Train [5][930/3239]	Time 0.522 (0.521)	Data 0.001 (0.016)	Loss 6.0410 (6.1252)	Top-1 acc 2.734 (1.705)	Top-5 acc 8.984 (6.699)	lr 0.04860
Warmup Train [5][940/3239]	Time 0.622 (0.521)	Data 0.002 (0.016)	Loss 6.1096 (6.1248)	Top-1 acc 0.781 (1.706)	Top-5 acc 3.906 (6.697)	lr 0.04859
Warmup Train [5][950/3239]	Time 0.446 (0.520)	Data 0.001 (0.016)	Loss 6.1145 (6.1245)	Top-1 acc 1.562 (1.706)	Top-5 acc 7.812 (6.710)	lr 0.04859
Warmup Train [5][960/3239]	Time 0.629 (0.520)	Data 0.001 (0.016)	Loss 6.0540 (6.1243)	Top-1 acc 1.562 (1.706)	Top-5 acc 8.984 (6.713)	lr 0.04859
Warmup Train [5][970/3239]	Time 0.612 (0.520)	Data 0.001 (0.016)	Loss 6.0503 (6.1244)	Top-1 acc 1.562 (1.709)	Top-5 acc 7.812 (6.717)	lr 0.04859
Warmup Train [5][980/3239]	Time 0.556 (0.520)	Data 0.001 (0.016)	Loss 6.1106 (6.1241)	Top-1 acc 1.172 (1.709)	Top-5 acc 7.422 (6.727)	lr 0.04859
Warmup Train [5][990/3239]	Time 0.409 (0.520)	Data 0.001 (0.016)	Loss 6.1483 (6.1240)	Top-1 acc 1.562 (1.708)	Top-5 acc 6.641 (6.723)	lr 0.04858
Warmup Train [5][1000/3239]	Time 0.510 (0.520)	Data 0.001 (0.016)	Loss 6.0636 (6.1237)	Top-1 acc 1.562 (1.712)	Top-5 acc 8.594 (6.733)	lr 0.04858
Warmup Train [5][1010/3239]	Time 0.555 (0.520)	Data 0.001 (0.016)	Loss 6.0720 (6.1231)	Top-1 acc 3.125 (1.717)	Top-5 acc 6.641 (6.733)	lr 0.04858
Warmup Train [5][1020/3239]	Time 0.724 (0.520)	Data 0.001 (0.016)	Loss 6.1836 (6.1229)	Top-1 acc 0.781 (1.716)	Top-5 acc 4.688 (6.734)	lr 0.04858
Warmup Train [5][1030/3239]	Time 0.638 (0.520)	Data 0.001 (0.015)	Loss 6.0795 (6.1226)	Top-1 acc 1.172 (1.725)	Top-5 acc 6.641 (6.747)	lr 0.04858
Warmup Train [5][1040/3239]	Time 0.530 (0.520)	Data 0.001 (0.015)	Loss 6.1003 (6.1223)	Top-1 acc 1.172 (1.728)	Top-5 acc 7.031 (6.754)	lr 0.04857
Warmup Train [5][1050/3239]	Time 0.423 (0.519)	Data 0.001 (0.015)	Loss 6.1729 (6.1223)	Top-1 acc 0.781 (1.731)	Top-5 acc 6.250 (6.754)	lr 0.04857
Warmup Train [5][1060/3239]	Time 0.360 (0.519)	Data 0.001 (0.015)	Loss 6.0418 (6.1219)	Top-1 acc 3.125 (1.733)	Top-5 acc 12.109 (6.764)	lr 0.04857
Warmup Train [5][1070/3239]	Time 0.615 (0.519)	Data 0.001 (0.015)	Loss 6.0381 (6.1215)	Top-1 acc 2.734 (1.735)	Top-5 acc 8.203 (6.774)	lr 0.04857
Warmup Train [5][1080/3239]	Time 0.541 (0.519)	Data 0.001 (0.015)	Loss 6.0873 (6.1212)	Top-1 acc 3.516 (1.732)	Top-5 acc 6.250 (6.770)	lr 0.04857
Warmup Train [5][1090/3239]	Time 0.509 (0.519)	Data 0.001 (0.015)	Loss 6.0075 (6.1208)	Top-1 acc 1.172 (1.730)	Top-5 acc 7.422 (6.771)	lr 0.04856
Warmup Train [5][1100/3239]	Time 0.473 (0.519)	Data 0.001 (0.015)	Loss 6.0698 (6.1205)	Top-1 acc 2.344 (1.730)	Top-5 acc 8.203 (6.778)	lr 0.04856
Warmup Train [5][1110/3239]	Time 0.590 (0.519)	Data 0.002 (0.015)	Loss 6.0096 (6.1200)	Top-1 acc 3.516 (1.735)	Top-5 acc 8.984 (6.790)	lr 0.04856
Warmup Train [5][1120/3239]	Time 0.618 (0.519)	Data 0.001 (0.015)	Loss 6.1497 (6.1199)	Top-1 acc 1.562 (1.733)	Top-5 acc 4.297 (6.792)	lr 0.04856
Warmup Train [5][1130/3239]	Time 0.522 (0.519)	Data 0.001 (0.015)	Loss 6.0333 (6.1195)	Top-1 acc 2.734 (1.737)	Top-5 acc 6.641 (6.794)	lr 0.04856
Warmup Train [5][1140/3239]	Time 0.516 (0.519)	Data 0.001 (0.014)	Loss 6.0940 (6.1193)	Top-1 acc 2.344 (1.740)	Top-5 acc 7.422 (6.801)	lr 0.04855
Warmup Train [5][1150/3239]	Time 0.543 (0.519)	Data 0.001 (0.014)	Loss 6.1385 (6.1190)	Top-1 acc 1.172 (1.742)	Top-5 acc 4.688 (6.803)	lr 0.04855
Warmup Train [5][1160/3239]	Time 0.714 (0.519)	Data 0.001 (0.014)	Loss 6.1596 (6.1191)	Top-1 acc 0.781 (1.742)	Top-5 acc 7.812 (6.800)	lr 0.04855
Warmup Train [5][1170/3239]	Time 0.314 (0.519)	Data 0.001 (0.014)	Loss 6.0757 (6.1188)	Top-1 acc 1.562 (1.744)	Top-5 acc 7.812 (6.807)	lr 0.04855
Warmup Train [5][1180/3239]	Time 0.621 (0.519)	Data 0.001 (0.014)	Loss 6.0715 (6.1186)	Top-1 acc 1.562 (1.744)	Top-5 acc 6.641 (6.807)	lr 0.04855
Warmup Train [5][1190/3239]	Time 0.391 (0.519)	Data 0.001 (0.014)	Loss 6.0576 (6.1183)	Top-1 acc 1.562 (1.745)	Top-5 acc 6.641 (6.812)	lr 0.04854
Warmup Train [5][1200/3239]	Time 0.492 (0.519)	Data 0.001 (0.014)	Loss 6.0987 (6.1181)	Top-1 acc 2.344 (1.747)	Top-5 acc 7.422 (6.820)	lr 0.04854
Warmup Train [5][1210/3239]	Time 0.444 (0.518)	Data 0.001 (0.014)	Loss 6.0383 (6.1178)	Top-1 acc 3.125 (1.749)	Top-5 acc 7.812 (6.824)	lr 0.04854
Warmup Train [5][1220/3239]	Time 0.542 (0.518)	Data 0.001 (0.014)	Loss 6.0701 (6.1177)	Top-1 acc 2.734 (1.754)	Top-5 acc 5.859 (6.823)	lr 0.04854
Warmup Train [5][1230/3239]	Time 0.424 (0.518)	Data 0.001 (0.014)	Loss 6.0271 (6.1176)	Top-1 acc 2.344 (1.753)	Top-5 acc 8.984 (6.824)	lr 0.04854
Warmup Train [5][1240/3239]	Time 0.671 (0.518)	Data 0.001 (0.014)	Loss 6.2102 (6.1176)	Top-1 acc 0.781 (1.756)	Top-5 acc 5.859 (6.824)	lr 0.04853
Warmup Train [5][1250/3239]	Time 0.662 (0.518)	Data 0.001 (0.014)	Loss 6.0621 (6.1174)	Top-1 acc 1.562 (1.758)	Top-5 acc 7.422 (6.828)	lr 0.04853
Warmup Train [5][1260/3239]	Time 0.638 (0.518)	Data 0.001 (0.014)	Loss 6.0990 (6.1172)	Top-1 acc 1.562 (1.758)	Top-5 acc 7.422 (6.825)	lr 0.04853
Warmup Train [5][1270/3239]	Time 0.494 (0.518)	Data 0.001 (0.014)	Loss 6.1153 (6.1171)	Top-1 acc 1.172 (1.760)	Top-5 acc 8.594 (6.824)	lr 0.04853
Warmup Train [5][1280/3239]	Time 0.497 (0.518)	Data 0.001 (0.013)	Loss 6.0912 (6.1167)	Top-1 acc 0.781 (1.761)	Top-5 acc 7.812 (6.832)	lr 0.04853
Warmup Train [5][1290/3239]	Time 0.563 (0.518)	Data 0.001 (0.013)	Loss 6.1097 (6.1164)	Top-1 acc 2.344 (1.767)	Top-5 acc 6.641 (6.837)	lr 0.04852
Warmup Train [5][1300/3239]	Time 0.349 (0.518)	Data 0.001 (0.013)	Loss 6.0586 (6.1162)	Top-1 acc 1.562 (1.769)	Top-5 acc 7.812 (6.841)	lr 0.04852
Warmup Train [5][1310/3239]	Time 0.555 (0.518)	Data 0.001 (0.013)	Loss 6.1442 (6.1159)	Top-1 acc 0.781 (1.771)	Top-5 acc 5.469 (6.844)	lr 0.04852
Warmup Train [5][1320/3239]	Time 0.461 (0.517)	Data 0.001 (0.013)	Loss 6.0563 (6.1154)	Top-1 acc 1.172 (1.772)	Top-5 acc 9.375 (6.859)	lr 0.04852
Warmup Train [5][1330/3239]	Time 0.580 (0.517)	Data 0.001 (0.013)	Loss 6.1020 (6.1150)	Top-1 acc 2.734 (1.777)	Top-5 acc 7.422 (6.870)	lr 0.04852
Warmup Train [5][1340/3239]	Time 0.549 (0.517)	Data 0.001 (0.013)	Loss 6.0531 (6.1144)	Top-1 acc 1.953 (1.782)	Top-5 acc 7.422 (6.881)	lr 0.04851
Warmup Train [5][1350/3239]	Time 0.402 (0.517)	Data 0.001 (0.013)	Loss 5.9963 (6.1141)	Top-1 acc 2.734 (1.783)	Top-5 acc 10.156 (6.879)	lr 0.04851
Warmup Train [5][1360/3239]	Time 0.684 (0.517)	Data 0.001 (0.013)	Loss 5.9735 (6.1136)	Top-1 acc 1.953 (1.782)	Top-5 acc 10.547 (6.877)	lr 0.04851
Warmup Train [5][1370/3239]	Time 0.411 (0.517)	Data 0.001 (0.013)	Loss 6.0373 (6.1136)	Top-1 acc 3.906 (1.785)	Top-5 acc 11.328 (6.883)	lr 0.04851
Warmup Train [5][1380/3239]	Time 0.382 (0.517)	Data 0.001 (0.013)	Loss 6.1203 (6.1134)	Top-1 acc 1.562 (1.788)	Top-5 acc 6.250 (6.887)	lr 0.04850
Warmup Train [5][1390/3239]	Time 0.486 (0.517)	Data 0.001 (0.013)	Loss 6.1219 (6.1132)	Top-1 acc 2.734 (1.789)	Top-5 acc 10.547 (6.889)	lr 0.04850
Warmup Train [5][1400/3239]	Time 0.406 (0.517)	Data 0.001 (0.013)	Loss 6.2000 (6.1131)	Top-1 acc 0.781 (1.789)	Top-5 acc 4.297 (6.896)	lr 0.04850
Warmup Train [5][1410/3239]	Time 0.516 (0.517)	Data 0.001 (0.013)	Loss 5.9812 (6.1126)	Top-1 acc 2.734 (1.793)	Top-5 acc 8.984 (6.902)	lr 0.04850
Warmup Train [5][1420/3239]	Time 0.340 (0.516)	Data 0.001 (0.013)	Loss 6.1062 (6.1122)	Top-1 acc 0.781 (1.792)	Top-5 acc 4.688 (6.904)	lr 0.04850
Warmup Train [5][1430/3239]	Time 0.430 (0.516)	Data 0.001 (0.013)	Loss 6.1043 (6.1119)	Top-1 acc 2.734 (1.795)	Top-5 acc 8.594 (6.910)	lr 0.04849
Warmup Train [5][1440/3239]	Time 0.357 (0.516)	Data 0.001 (0.013)	Loss 6.0774 (6.1115)	Top-1 acc 1.172 (1.796)	Top-5 acc 7.812 (6.921)	lr 0.04849
Warmup Train [5][1450/3239]	Time 0.405 (0.516)	Data 0.001 (0.013)	Loss 6.0592 (6.1112)	Top-1 acc 1.562 (1.799)	Top-5 acc 8.203 (6.932)	lr 0.04849
Warmup Train [5][1460/3239]	Time 0.549 (0.516)	Data 0.001 (0.013)	Loss 6.0970 (6.1108)	Top-1 acc 2.734 (1.800)	Top-5 acc 7.812 (6.942)	lr 0.04849
Warmup Train [5][1470/3239]	Time 0.537 (0.516)	Data 0.001 (0.013)	Loss 5.9888 (6.1105)	Top-1 acc 1.562 (1.804)	Top-5 acc 7.422 (6.949)	lr 0.04849
Warmup Train [5][1480/3239]	Time 0.621 (0.516)	Data 0.001 (0.013)	Loss 6.0213 (6.1102)	Top-1 acc 2.734 (1.806)	Top-5 acc 7.812 (6.952)	lr 0.04848
Warmup Train [5][1490/3239]	Time 0.506 (0.516)	Data 0.001 (0.013)	Loss 5.9740 (6.1098)	Top-1 acc 3.125 (1.812)	Top-5 acc 8.203 (6.957)	lr 0.04848
Warmup Train [5][1500/3239]	Time 0.478 (0.516)	Data 0.001 (0.013)	Loss 6.1671 (6.1096)	Top-1 acc 1.172 (1.814)	Top-5 acc 5.469 (6.960)	lr 0.04848
Warmup Train [5][1510/3239]	Time 0.492 (0.516)	Data 0.001 (0.013)	Loss 6.1049 (6.1091)	Top-1 acc 1.172 (1.815)	Top-5 acc 8.203 (6.966)	lr 0.04848
Warmup Train [5][1520/3239]	Time 0.519 (0.516)	Data 0.001 (0.013)	Loss 6.0105 (6.1088)	Top-1 acc 1.172 (1.816)	Top-5 acc 8.984 (6.972)	lr 0.04848
Warmup Train [5][1530/3239]	Time 0.604 (0.516)	Data 0.001 (0.013)	Loss 6.0422 (6.1084)	Top-1 acc 2.344 (1.817)	Top-5 acc 6.641 (6.977)	lr 0.04847
Warmup Train [5][1540/3239]	Time 0.417 (0.516)	Data 0.001 (0.013)	Loss 6.0111 (6.1081)	Top-1 acc 3.516 (1.821)	Top-5 acc 11.719 (6.983)	lr 0.04847
Warmup Train [5][1550/3239]	Time 0.563 (0.516)	Data 0.001 (0.013)	Loss 6.0197 (6.1078)	Top-1 acc 2.344 (1.819)	Top-5 acc 6.641 (6.986)	lr 0.04847
Warmup Train [5][1560/3239]	Time 0.607 (0.516)	Data 0.001 (0.012)	Loss 5.9541 (6.1073)	Top-1 acc 3.125 (1.821)	Top-5 acc 9.375 (6.990)	lr 0.04847
Warmup Train [5][1570/3239]	Time 0.345 (0.516)	Data 0.001 (0.012)	Loss 6.0574 (6.1069)	Top-1 acc 1.953 (1.823)	Top-5 acc 8.203 (6.994)	lr 0.04847
Warmup Train [5][1580/3239]	Time 0.496 (0.515)	Data 0.001 (0.012)	Loss 6.0919 (6.1066)	Top-1 acc 2.734 (1.824)	Top-5 acc 8.594 (7.003)	lr 0.04846
Warmup Train [5][1590/3239]	Time 0.609 (0.515)	Data 0.001 (0.012)	Loss 5.9764 (6.1063)	Top-1 acc 4.297 (1.829)	Top-5 acc 11.328 (7.011)	lr 0.04846
Warmup Train [5][1600/3239]	Time 0.611 (0.515)	Data 0.001 (0.012)	Loss 6.0467 (6.1059)	Top-1 acc 1.953 (1.833)	Top-5 acc 8.203 (7.018)	lr 0.04846
Warmup Train [5][1610/3239]	Time 0.629 (0.515)	Data 0.001 (0.012)	Loss 6.0627 (6.1057)	Top-1 acc 2.344 (1.833)	Top-5 acc 9.766 (7.024)	lr 0.04846
Warmup Train [5][1620/3239]	Time 0.552 (0.515)	Data 0.001 (0.012)	Loss 5.9105 (6.1055)	Top-1 acc 2.734 (1.834)	Top-5 acc 8.984 (7.029)	lr 0.04845
Warmup Train [5][1630/3239]	Time 0.629 (0.515)	Data 0.001 (0.012)	Loss 6.0494 (6.1052)	Top-1 acc 1.953 (1.833)	Top-5 acc 6.250 (7.029)	lr 0.04845
Warmup Train [5][1640/3239]	Time 0.574 (0.515)	Data 0.001 (0.012)	Loss 6.0300 (6.1049)	Top-1 acc 3.516 (1.837)	Top-5 acc 11.328 (7.036)	lr 0.04845
Warmup Train [5][1650/3239]	Time 0.546 (0.515)	Data 0.001 (0.012)	Loss 6.0792 (6.1047)	Top-1 acc 1.562 (1.836)	Top-5 acc 8.203 (7.038)	lr 0.04845
Warmup Train [5][1660/3239]	Time 0.523 (0.515)	Data 0.001 (0.012)	Loss 6.0296 (6.1043)	Top-1 acc 1.953 (1.838)	Top-5 acc 8.984 (7.049)	lr 0.04845
Warmup Train [5][1670/3239]	Time 0.423 (0.515)	Data 0.001 (0.012)	Loss 6.1382 (6.1040)	Top-1 acc 2.734 (1.839)	Top-5 acc 7.422 (7.053)	lr 0.04844
Warmup Train [5][1680/3239]	Time 0.437 (0.515)	Data 0.001 (0.012)	Loss 6.0751 (6.1038)	Top-1 acc 1.562 (1.840)	Top-5 acc 7.422 (7.054)	lr 0.04844
Warmup Train [5][1690/3239]	Time 0.578 (0.515)	Data 0.001 (0.012)	Loss 6.0530 (6.1035)	Top-1 acc 2.344 (1.843)	Top-5 acc 8.203 (7.059)	lr 0.04844
Warmup Train [5][1700/3239]	Time 0.438 (0.515)	Data 0.001 (0.012)	Loss 6.0821 (6.1034)	Top-1 acc 1.953 (1.844)	Top-5 acc 6.250 (7.059)	lr 0.04844
Warmup Train [5][1710/3239]	Time 0.517 (0.515)	Data 0.002 (0.012)	Loss 6.0552 (6.1030)	Top-1 acc 3.516 (1.848)	Top-5 acc 8.594 (7.064)	lr 0.04844
Warmup Train [5][1720/3239]	Time 0.408 (0.515)	Data 0.001 (0.012)	Loss 6.0333 (6.1026)	Top-1 acc 0.781 (1.849)	Top-5 acc 11.328 (7.075)	lr 0.04843
Warmup Train [5][1730/3239]	Time 0.510 (0.515)	Data 0.001 (0.012)	Loss 6.0447 (6.1022)	Top-1 acc 1.953 (1.851)	Top-5 acc 8.594 (7.080)	lr 0.04843
Warmup Train [5][1740/3239]	Time 0.563 (0.515)	Data 0.001 (0.012)	Loss 5.9921 (6.1020)	Top-1 acc 3.516 (1.854)	Top-5 acc 10.156 (7.084)	lr 0.04843
Warmup Train [5][1750/3239]	Time 0.656 (0.515)	Data 0.001 (0.012)	Loss 6.1123 (6.1018)	Top-1 acc 1.172 (1.853)	Top-5 acc 7.812 (7.089)	lr 0.04843
Warmup Train [5][1760/3239]	Time 0.634 (0.515)	Data 0.001 (0.012)	Loss 5.9913 (6.1014)	Top-1 acc 2.734 (1.854)	Top-5 acc 7.031 (7.093)	lr 0.04843
Warmup Train [5][1770/3239]	Time 0.539 (0.515)	Data 0.001 (0.012)	Loss 6.0538 (6.1010)	Top-1 acc 1.172 (1.857)	Top-5 acc 8.203 (7.098)	lr 0.04842
Warmup Train [5][1780/3239]	Time 0.545 (0.515)	Data 0.001 (0.012)	Loss 5.9940 (6.1007)	Top-1 acc 3.906 (1.862)	Top-5 acc 10.547 (7.106)	lr 0.04842
Warmup Train [5][1790/3239]	Time 0.360 (0.515)	Data 0.001 (0.012)	Loss 6.0646 (6.1004)	Top-1 acc 1.562 (1.862)	Top-5 acc 5.859 (7.111)	lr 0.04842
Warmup Train [5][1800/3239]	Time 0.568 (0.515)	Data 0.001 (0.012)	Loss 6.0194 (6.1002)	Top-1 acc 3.125 (1.862)	Top-5 acc 10.156 (7.114)	lr 0.04842
Warmup Train [5][1810/3239]	Time 0.645 (0.515)	Data 0.001 (0.012)	Loss 6.1385 (6.0999)	Top-1 acc 1.562 (1.865)	Top-5 acc 7.031 (7.120)	lr 0.04841
Warmup Train [5][1820/3239]	Time 0.371 (0.515)	Data 0.001 (0.012)	Loss 6.0973 (6.0996)	Top-1 acc 0.781 (1.866)	Top-5 acc 7.422 (7.126)	lr 0.04841
Warmup Train [5][1830/3239]	Time 0.392 (0.515)	Data 0.001 (0.012)	Loss 6.1625 (6.0993)	Top-1 acc 1.172 (1.870)	Top-5 acc 5.078 (7.132)	lr 0.04841
Warmup Train [5][1840/3239]	Time 0.418 (0.515)	Data 0.001 (0.012)	Loss 6.0148 (6.0990)	Top-1 acc 0.781 (1.868)	Top-5 acc 6.250 (7.135)	lr 0.04841
Warmup Train [5][1850/3239]	Time 0.423 (0.515)	Data 0.001 (0.012)	Loss 6.0394 (6.0988)	Top-1 acc 2.734 (1.870)	Top-5 acc 9.375 (7.138)	lr 0.04841
Warmup Train [5][1860/3239]	Time 0.437 (0.514)	Data 0.001 (0.012)	Loss 5.9641 (6.0984)	Top-1 acc 0.781 (1.873)	Top-5 acc 7.422 (7.142)	lr 0.04840
Warmup Train [5][1870/3239]	Time 0.511 (0.514)	Data 0.001 (0.012)	Loss 5.9893 (6.0981)	Top-1 acc 1.172 (1.873)	Top-5 acc 7.422 (7.148)	lr 0.04840
Warmup Train [5][1880/3239]	Time 0.449 (0.514)	Data 0.001 (0.012)	Loss 6.0527 (6.0978)	Top-1 acc 1.562 (1.875)	Top-5 acc 7.422 (7.152)	lr 0.04840
Warmup Train [5][1890/3239]	Time 0.557 (0.514)	Data 0.001 (0.012)	Loss 5.9697 (6.0975)	Top-1 acc 1.953 (1.878)	Top-5 acc 8.984 (7.160)	lr 0.04840
Warmup Train [5][1900/3239]	Time 0.555 (0.514)	Data 0.001 (0.012)	Loss 5.9031 (6.0971)	Top-1 acc 3.516 (1.879)	Top-5 acc 10.156 (7.167)	lr 0.04840
Warmup Train [5][1910/3239]	Time 0.727 (0.515)	Data 0.001 (0.012)	Loss 6.1089 (6.0969)	Top-1 acc 2.344 (1.881)	Top-5 acc 7.422 (7.173)	lr 0.04839
Warmup Train [5][1920/3239]	Time 0.564 (0.515)	Data 0.001 (0.011)	Loss 6.0787 (6.0965)	Top-1 acc 1.172 (1.883)	Top-5 acc 7.812 (7.179)	lr 0.04839
Warmup Train [5][1930/3239]	Time 0.508 (0.514)	Data 0.001 (0.011)	Loss 6.0934 (6.0963)	Top-1 acc 1.172 (1.882)	Top-5 acc 8.594 (7.180)	lr 0.04839
Warmup Train [5][1940/3239]	Time 0.376 (0.514)	Data 0.001 (0.011)	Loss 6.0473 (6.0960)	Top-1 acc 3.516 (1.884)	Top-5 acc 10.547 (7.186)	lr 0.04839
Warmup Train [5][1950/3239]	Time 0.493 (0.514)	Data 0.001 (0.011)	Loss 6.1091 (6.0957)	Top-1 acc 1.172 (1.882)	Top-5 acc 5.469 (7.189)	lr 0.04838
Warmup Train [5][1960/3239]	Time 0.600 (0.514)	Data 0.001 (0.011)	Loss 6.0098 (6.0954)	Top-1 acc 3.125 (1.883)	Top-5 acc 8.594 (7.199)	lr 0.04838
Warmup Train [5][1970/3239]	Time 0.431 (0.514)	Data 0.001 (0.011)	Loss 6.0589 (6.0951)	Top-1 acc 1.172 (1.884)	Top-5 acc 7.422 (7.204)	lr 0.04838
Warmup Train [5][1980/3239]	Time 0.528 (0.514)	Data 0.001 (0.011)	Loss 5.9620 (6.0948)	Top-1 acc 2.344 (1.885)	Top-5 acc 9.375 (7.207)	lr 0.04838
Warmup Train [5][1990/3239]	Time 0.568 (0.514)	Data 0.001 (0.011)	Loss 6.0512 (6.0944)	Top-1 acc 1.953 (1.886)	Top-5 acc 6.641 (7.212)	lr 0.04838
Warmup Train [5][2000/3239]	Time 0.469 (0.515)	Data 0.001 (0.011)	Loss 6.0877 (6.0942)	Top-1 acc 2.734 (1.888)	Top-5 acc 8.203 (7.213)	lr 0.04837
Warmup Train [5][2010/3239]	Time 0.590 (0.515)	Data 0.001 (0.011)	Loss 5.8950 (6.0938)	Top-1 acc 4.688 (1.891)	Top-5 acc 11.719 (7.219)	lr 0.04837
Warmup Train [5][2020/3239]	Time 0.493 (0.515)	Data 0.001 (0.011)	Loss 6.0506 (6.0935)	Top-1 acc 1.953 (1.891)	Top-5 acc 7.422 (7.222)	lr 0.04837
Warmup Train [5][2030/3239]	Time 0.428 (0.515)	Data 0.001 (0.011)	Loss 6.0091 (6.0932)	Top-1 acc 1.953 (1.891)	Top-5 acc 7.812 (7.224)	lr 0.04837
Warmup Train [5][2040/3239]	Time 0.435 (0.515)	Data 0.001 (0.011)	Loss 6.0628 (6.0929)	Top-1 acc 3.516 (1.892)	Top-5 acc 7.422 (7.228)	lr 0.04837
Warmup Train [5][2050/3239]	Time 0.540 (0.515)	Data 0.001 (0.011)	Loss 6.0278 (6.0925)	Top-1 acc 2.344 (1.896)	Top-5 acc 10.547 (7.240)	lr 0.04836
Warmup Train [5][2060/3239]	Time 0.401 (0.515)	Data 0.001 (0.011)	Loss 6.1598 (6.0921)	Top-1 acc 1.172 (1.897)	Top-5 acc 8.203 (7.244)	lr 0.04836
Warmup Train [5][2070/3239]	Time 0.492 (0.515)	Data 0.001 (0.011)	Loss 6.0755 (6.0918)	Top-1 acc 1.953 (1.898)	Top-5 acc 6.641 (7.252)	lr 0.04836
Warmup Train [5][2080/3239]	Time 0.572 (0.515)	Data 0.002 (0.011)	Loss 6.1132 (6.0917)	Top-1 acc 1.562 (1.898)	Top-5 acc 7.812 (7.253)	lr 0.04836
Warmup Train [5][2090/3239]	Time 0.401 (0.515)	Data 0.001 (0.011)	Loss 6.0612 (6.0914)	Top-1 acc 1.562 (1.899)	Top-5 acc 6.641 (7.259)	lr 0.04835
Warmup Train [5][2100/3239]	Time 0.520 (0.515)	Data 0.001 (0.011)	Loss 6.0351 (6.0910)	Top-1 acc 1.953 (1.898)	Top-5 acc 8.984 (7.264)	lr 0.04835
Warmup Train [5][2110/3239]	Time 0.626 (0.515)	Data 0.001 (0.011)	Loss 6.1158 (6.0908)	Top-1 acc 1.172 (1.899)	Top-5 acc 8.203 (7.269)	lr 0.04835
Warmup Train [5][2120/3239]	Time 0.402 (0.515)	Data 0.001 (0.011)	Loss 6.0380 (6.0906)	Top-1 acc 2.734 (1.899)	Top-5 acc 9.375 (7.271)	lr 0.04835
Warmup Train [5][2130/3239]	Time 0.453 (0.514)	Data 0.001 (0.011)	Loss 6.0230 (6.0902)	Top-1 acc 3.516 (1.902)	Top-5 acc 10.547 (7.280)	lr 0.04835
Warmup Train [5][2140/3239]	Time 0.548 (0.514)	Data 0.001 (0.011)	Loss 6.0237 (6.0900)	Top-1 acc 3.906 (1.902)	Top-5 acc 10.547 (7.281)	lr 0.04834
Warmup Train [5][2150/3239]	Time 0.521 (0.515)	Data 0.001 (0.011)	Loss 6.0162 (6.0898)	Top-1 acc 2.734 (1.904)	Top-5 acc 11.328 (7.287)	lr 0.04834
Warmup Train [5][2160/3239]	Time 0.424 (0.514)	Data 0.001 (0.011)	Loss 6.1547 (6.0898)	Top-1 acc 1.953 (1.904)	Top-5 acc 7.812 (7.292)	lr 0.04834
Warmup Train [5][2170/3239]	Time 0.554 (0.514)	Data 0.001 (0.011)	Loss 6.0090 (6.0894)	Top-1 acc 1.562 (1.907)	Top-5 acc 10.156 (7.297)	lr 0.04834
Warmup Train [5][2180/3239]	Time 0.541 (0.514)	Data 0.001 (0.011)	Loss 5.9688 (6.0892)	Top-1 acc 2.344 (1.908)	Top-5 acc 8.203 (7.296)	lr 0.04834
Warmup Train [5][2190/3239]	Time 0.484 (0.514)	Data 0.001 (0.011)	Loss 6.1575 (6.0890)	Top-1 acc 0.391 (1.908)	Top-5 acc 6.250 (7.298)	lr 0.04833
Warmup Train [5][2200/3239]	Time 0.598 (0.514)	Data 0.001 (0.011)	Loss 6.0438 (6.0886)	Top-1 acc 1.562 (1.910)	Top-5 acc 5.469 (7.303)	lr 0.04833
Warmup Train [5][2210/3239]	Time 0.560 (0.514)	Data 0.001 (0.011)	Loss 6.0882 (6.0884)	Top-1 acc 1.562 (1.910)	Top-5 acc 8.984 (7.310)	lr 0.04833
Warmup Train [5][2220/3239]	Time 0.459 (0.514)	Data 0.001 (0.011)	Loss 6.0576 (6.0881)	Top-1 acc 3.125 (1.913)	Top-5 acc 8.203 (7.315)	lr 0.04833
Warmup Train [5][2230/3239]	Time 0.471 (0.514)	Data 0.001 (0.011)	Loss 6.0247 (6.0878)	Top-1 acc 2.344 (1.916)	Top-5 acc 7.031 (7.321)	lr 0.04832
Warmup Train [5][2240/3239]	Time 0.610 (0.514)	Data 0.001 (0.011)	Loss 6.0698 (6.0875)	Top-1 acc 1.953 (1.917)	Top-5 acc 10.547 (7.327)	lr 0.04832
Warmup Train [5][2250/3239]	Time 0.535 (0.514)	Data 0.001 (0.011)	Loss 6.0146 (6.0872)	Top-1 acc 1.953 (1.918)	Top-5 acc 10.547 (7.333)	lr 0.04832
Warmup Train [5][2260/3239]	Time 0.467 (0.514)	Data 0.001 (0.011)	Loss 6.0385 (6.0869)	Top-1 acc 2.344 (1.921)	Top-5 acc 7.812 (7.339)	lr 0.04832
Warmup Train [5][2270/3239]	Time 0.458 (0.514)	Data 0.001 (0.011)	Loss 5.9305 (6.0865)	Top-1 acc 2.734 (1.924)	Top-5 acc 11.328 (7.346)	lr 0.04832
Warmup Train [5][2280/3239]	Time 0.336 (0.514)	Data 0.001 (0.011)	Loss 5.9739 (6.0862)	Top-1 acc 2.344 (1.925)	Top-5 acc 7.422 (7.348)	lr 0.04831
Warmup Train [5][2290/3239]	Time 0.429 (0.514)	Data 0.001 (0.011)	Loss 6.1030 (6.0859)	Top-1 acc 3.906 (1.927)	Top-5 acc 9.375 (7.354)	lr 0.04831
Warmup Train [5][2300/3239]	Time 0.467 (0.514)	Data 0.001 (0.011)	Loss 6.0262 (6.0855)	Top-1 acc 1.953 (1.930)	Top-5 acc 7.422 (7.358)	lr 0.04831
Warmup Train [5][2310/3239]	Time 0.421 (0.514)	Data 0.001 (0.011)	Loss 5.9356 (6.0854)	Top-1 acc 1.562 (1.932)	Top-5 acc 10.547 (7.360)	lr 0.04831
Warmup Train [5][2320/3239]	Time 0.606 (0.514)	Data 0.001 (0.011)	Loss 6.0876 (6.0851)	Top-1 acc 2.734 (1.934)	Top-5 acc 7.422 (7.364)	lr 0.04830
Warmup Train [5][2330/3239]	Time 0.492 (0.514)	Data 0.001 (0.011)	Loss 6.0427 (6.0848)	Top-1 acc 3.906 (1.938)	Top-5 acc 7.812 (7.371)	lr 0.04830
Warmup Train [5][2340/3239]	Time 0.457 (0.514)	Data 0.001 (0.011)	Loss 6.0232 (6.0845)	Top-1 acc 2.344 (1.941)	Top-5 acc 7.422 (7.376)	lr 0.04830
Warmup Train [5][2350/3239]	Time 0.596 (0.514)	Data 0.001 (0.011)	Loss 6.0555 (6.0843)	Top-1 acc 3.125 (1.942)	Top-5 acc 8.203 (7.379)	lr 0.04830
Warmup Train [5][2360/3239]	Time 0.565 (0.514)	Data 0.001 (0.011)	Loss 6.0251 (6.0840)	Top-1 acc 3.125 (1.946)	Top-5 acc 7.812 (7.385)	lr 0.04830
Warmup Train [5][2370/3239]	Time 0.449 (0.514)	Data 0.001 (0.011)	Loss 5.9703 (6.0837)	Top-1 acc 1.953 (1.945)	Top-5 acc 10.156 (7.385)	lr 0.04829
Warmup Train [5][2380/3239]	Time 0.633 (0.514)	Data 0.001 (0.011)	Loss 5.9682 (6.0832)	Top-1 acc 2.734 (1.946)	Top-5 acc 7.422 (7.393)	lr 0.04829
Warmup Train [5][2390/3239]	Time 0.569 (0.514)	Data 0.001 (0.011)	Loss 6.1570 (6.0830)	Top-1 acc 2.734 (1.948)	Top-5 acc 9.766 (7.403)	lr 0.04829
Warmup Train [5][2400/3239]	Time 0.515 (0.514)	Data 0.001 (0.011)	Loss 5.9703 (6.0828)	Top-1 acc 0.781 (1.948)	Top-5 acc 5.469 (7.407)	lr 0.04829
Warmup Train [5][2410/3239]	Time 0.483 (0.514)	Data 0.001 (0.011)	Loss 5.9633 (6.0824)	Top-1 acc 4.297 (1.954)	Top-5 acc 10.938 (7.417)	lr 0.04828
Warmup Train [5][2420/3239]	Time 0.490 (0.514)	Data 0.001 (0.011)	Loss 5.9672 (6.0821)	Top-1 acc 1.953 (1.956)	Top-5 acc 12.109 (7.423)	lr 0.04828
Warmup Train [5][2430/3239]	Time 0.491 (0.514)	Data 0.001 (0.011)	Loss 6.1699 (6.0819)	Top-1 acc 1.953 (1.957)	Top-5 acc 5.469 (7.425)	lr 0.04828
Warmup Train [5][2440/3239]	Time 0.530 (0.514)	Data 0.001 (0.011)	Loss 6.0913 (6.0816)	Top-1 acc 3.125 (1.960)	Top-5 acc 5.859 (7.430)	lr 0.04828
Warmup Train [5][2450/3239]	Time 0.312 (0.513)	Data 0.002 (0.011)	Loss 6.0782 (6.0813)	Top-1 acc 1.562 (1.960)	Top-5 acc 5.859 (7.435)	lr 0.04828
Warmup Train [5][2460/3239]	Time 0.629 (0.514)	Data 0.001 (0.011)	Loss 5.9753 (6.0810)	Top-1 acc 3.125 (1.964)	Top-5 acc 9.766 (7.442)	lr 0.04827
Warmup Train [5][2470/3239]	Time 0.415 (0.513)	Data 0.001 (0.011)	Loss 5.9044 (6.0807)	Top-1 acc 4.297 (1.966)	Top-5 acc 11.328 (7.449)	lr 0.04827
Warmup Train [5][2480/3239]	Time 0.636 (0.513)	Data 0.001 (0.011)	Loss 6.0087 (6.0804)	Top-1 acc 3.516 (1.968)	Top-5 acc 12.109 (7.457)	lr 0.04827
Warmup Train [5][2490/3239]	Time 0.516 (0.513)	Data 0.001 (0.011)	Loss 5.9030 (6.0800)	Top-1 acc 4.688 (1.970)	Top-5 acc 10.938 (7.464)	lr 0.04827
Warmup Train [5][2500/3239]	Time 0.464 (0.513)	Data 0.001 (0.010)	Loss 5.9980 (6.0797)	Top-1 acc 1.953 (1.972)	Top-5 acc 7.812 (7.469)	lr 0.04826
Warmup Train [5][2510/3239]	Time 0.621 (0.513)	Data 0.001 (0.010)	Loss 5.9588 (6.0793)	Top-1 acc 4.688 (1.974)	Top-5 acc 10.156 (7.473)	lr 0.04826
Warmup Train [5][2520/3239]	Time 0.591 (0.513)	Data 0.001 (0.010)	Loss 5.9957 (6.0790)	Top-1 acc 3.516 (1.978)	Top-5 acc 8.594 (7.481)	lr 0.04826
Warmup Train [5][2530/3239]	Time 0.533 (0.513)	Data 0.001 (0.010)	Loss 5.9190 (6.0788)	Top-1 acc 2.734 (1.979)	Top-5 acc 10.938 (7.482)	lr 0.04826
Warmup Train [5][2540/3239]	Time 0.477 (0.513)	Data 0.001 (0.010)	Loss 5.9874 (6.0784)	Top-1 acc 4.297 (1.982)	Top-5 acc 10.156 (7.489)	lr 0.04826
Warmup Train [5][2550/3239]	Time 0.470 (0.513)	Data 0.001 (0.010)	Loss 6.1286 (6.0781)	Top-1 acc 0.781 (1.984)	Top-5 acc 6.641 (7.497)	lr 0.04825
Warmup Train [5][2560/3239]	Time 0.384 (0.513)	Data 0.001 (0.010)	Loss 6.0364 (6.0779)	Top-1 acc 1.953 (1.985)	Top-5 acc 7.812 (7.502)	lr 0.04825
Warmup Train [5][2570/3239]	Time 0.758 (0.513)	Data 0.001 (0.010)	Loss 5.9600 (6.0775)	Top-1 acc 4.688 (1.985)	Top-5 acc 10.156 (7.504)	lr 0.04825
Warmup Train [5][2580/3239]	Time 0.391 (0.513)	Data 0.001 (0.010)	Loss 5.9596 (6.0772)	Top-1 acc 3.906 (1.988)	Top-5 acc 9.375 (7.509)	lr 0.04825
Warmup Train [5][2590/3239]	Time 0.500 (0.514)	Data 0.001 (0.010)	Loss 6.0600 (6.0768)	Top-1 acc 3.125 (1.992)	Top-5 acc 7.422 (7.516)	lr 0.04824
Warmup Train [5][2600/3239]	Time 0.477 (0.514)	Data 0.002 (0.010)	Loss 5.9545 (6.0765)	Top-1 acc 3.906 (1.995)	Top-5 acc 8.984 (7.522)	lr 0.04824
Warmup Train [5][2610/3239]	Time 0.542 (0.514)	Data 0.002 (0.010)	Loss 5.9590 (6.0762)	Top-1 acc 1.953 (1.997)	Top-5 acc 6.641 (7.525)	lr 0.04824
Warmup Train [5][2620/3239]	Time 0.428 (0.513)	Data 0.001 (0.010)	Loss 5.9623 (6.0759)	Top-1 acc 3.125 (1.998)	Top-5 acc 9.766 (7.529)	lr 0.04824
Warmup Train [5][2630/3239]	Time 0.480 (0.514)	Data 0.001 (0.010)	Loss 6.0847 (6.0756)	Top-1 acc 3.906 (1.999)	Top-5 acc 11.328 (7.536)	lr 0.04824
Warmup Train [5][2640/3239]	Time 0.575 (0.513)	Data 0.001 (0.010)	Loss 5.9211 (6.0753)	Top-1 acc 2.344 (2.000)	Top-5 acc 9.766 (7.538)	lr 0.04823
Warmup Train [5][2650/3239]	Time 0.370 (0.513)	Data 0.001 (0.010)	Loss 5.9491 (6.0750)	Top-1 acc 1.953 (2.001)	Top-5 acc 7.812 (7.540)	lr 0.04823
Warmup Train [5][2660/3239]	Time 0.360 (0.513)	Data 0.001 (0.010)	Loss 6.0305 (6.0747)	Top-1 acc 0.391 (2.001)	Top-5 acc 7.812 (7.546)	lr 0.04823
Warmup Train [5][2670/3239]	Time 0.663 (0.513)	Data 0.001 (0.010)	Loss 6.0073 (6.0744)	Top-1 acc 2.734 (2.003)	Top-5 acc 7.422 (7.552)	lr 0.04823
Warmup Train [5][2680/3239]	Time 0.404 (0.513)	Data 0.001 (0.010)	Loss 6.0105 (6.0740)	Top-1 acc 0.391 (2.004)	Top-5 acc 6.250 (7.557)	lr 0.04822
Warmup Train [5][2690/3239]	Time 0.638 (0.513)	Data 0.001 (0.010)	Loss 6.0372 (6.0738)	Top-1 acc 1.953 (2.006)	Top-5 acc 7.812 (7.560)	lr 0.04822
Warmup Train [5][2700/3239]	Time 0.590 (0.513)	Data 0.001 (0.010)	Loss 6.0099 (6.0735)	Top-1 acc 3.125 (2.009)	Top-5 acc 10.547 (7.569)	lr 0.04822
Warmup Train [5][2710/3239]	Time 0.506 (0.513)	Data 0.001 (0.010)	Loss 6.0273 (6.0731)	Top-1 acc 1.953 (2.014)	Top-5 acc 6.250 (7.576)	lr 0.04822
Warmup Train [5][2720/3239]	Time 0.510 (0.513)	Data 0.001 (0.010)	Loss 5.9237 (6.0729)	Top-1 acc 1.953 (2.014)	Top-5 acc 8.203 (7.579)	lr 0.04822
Warmup Train [5][2730/3239]	Time 0.583 (0.513)	Data 0.001 (0.010)	Loss 5.9924 (6.0727)	Top-1 acc 4.688 (2.015)	Top-5 acc 12.109 (7.586)	lr 0.04821
Warmup Train [5][2740/3239]	Time 0.394 (0.513)	Data 0.001 (0.010)	Loss 5.9468 (6.0724)	Top-1 acc 2.734 (2.017)	Top-5 acc 12.500 (7.592)	lr 0.04821
Warmup Train [5][2750/3239]	Time 0.372 (0.513)	Data 0.001 (0.010)	Loss 5.9373 (6.0721)	Top-1 acc 3.125 (2.018)	Top-5 acc 10.938 (7.594)	lr 0.04821
Warmup Train [5][2760/3239]	Time 0.430 (0.513)	Data 0.001 (0.010)	Loss 5.9668 (6.0718)	Top-1 acc 2.734 (2.020)	Top-5 acc 8.594 (7.600)	lr 0.04821
Warmup Train [5][2770/3239]	Time 0.642 (0.513)	Data 0.002 (0.010)	Loss 5.8839 (6.0715)	Top-1 acc 1.562 (2.022)	Top-5 acc 9.375 (7.607)	lr 0.04820
Warmup Train [5][2780/3239]	Time 0.552 (0.513)	Data 0.001 (0.010)	Loss 5.9607 (6.0711)	Top-1 acc 1.953 (2.025)	Top-5 acc 8.203 (7.616)	lr 0.04820
Warmup Train [5][2790/3239]	Time 0.553 (0.513)	Data 0.001 (0.010)	Loss 5.9579 (6.0708)	Top-1 acc 1.172 (2.026)	Top-5 acc 8.984 (7.622)	lr 0.04820
Warmup Train [5][2800/3239]	Time 0.375 (0.513)	Data 0.001 (0.010)	Loss 5.9615 (6.0703)	Top-1 acc 1.562 (2.029)	Top-5 acc 6.250 (7.633)	lr 0.04820
Warmup Train [5][2810/3239]	Time 0.519 (0.513)	Data 0.001 (0.010)	Loss 6.0132 (6.0700)	Top-1 acc 2.344 (2.030)	Top-5 acc 8.984 (7.635)	lr 0.04820
Warmup Train [5][2820/3239]	Time 0.530 (0.513)	Data 0.001 (0.010)	Loss 5.9768 (6.0696)	Top-1 acc 2.344 (2.034)	Top-5 acc 10.938 (7.643)	lr 0.04819
Warmup Train [5][2830/3239]	Time 0.483 (0.513)	Data 0.001 (0.010)	Loss 6.0002 (6.0693)	Top-1 acc 2.344 (2.036)	Top-5 acc 10.938 (7.650)	lr 0.04819
Warmup Train [5][2840/3239]	Time 0.662 (0.513)	Data 0.001 (0.010)	Loss 5.9709 (6.0690)	Top-1 acc 3.906 (2.039)	Top-5 acc 11.328 (7.656)	lr 0.04819
Warmup Train [5][2850/3239]	Time 0.462 (0.513)	Data 0.001 (0.010)	Loss 5.9787 (6.0687)	Top-1 acc 3.516 (2.041)	Top-5 acc 7.031 (7.662)	lr 0.04819
Warmup Train [5][2860/3239]	Time 0.443 (0.513)	Data 0.001 (0.010)	Loss 5.9872 (6.0684)	Top-1 acc 1.953 (2.043)	Top-5 acc 7.422 (7.667)	lr 0.04818
Warmup Train [5][2870/3239]	Time 0.459 (0.513)	Data 0.002 (0.010)	Loss 5.9667 (6.0681)	Top-1 acc 2.344 (2.043)	Top-5 acc 7.422 (7.672)	lr 0.04818
Warmup Train [5][2880/3239]	Time 0.718 (0.513)	Data 0.001 (0.010)	Loss 5.8899 (6.0677)	Top-1 acc 2.734 (2.045)	Top-5 acc 9.375 (7.680)	lr 0.04818
Warmup Train [5][2890/3239]	Time 0.617 (0.513)	Data 0.001 (0.010)	Loss 6.0024 (6.0673)	Top-1 acc 1.562 (2.047)	Top-5 acc 7.812 (7.688)	lr 0.04818
Warmup Train [5][2900/3239]	Time 0.528 (0.513)	Data 0.001 (0.010)	Loss 6.0198 (6.0670)	Top-1 acc 3.125 (2.050)	Top-5 acc 9.766 (7.692)	lr 0.04818
Warmup Train [5][2910/3239]	Time 0.675 (0.513)	Data 0.001 (0.010)	Loss 5.9516 (6.0666)	Top-1 acc 1.953 (2.053)	Top-5 acc 8.203 (7.697)	lr 0.04817
Warmup Train [5][2920/3239]	Time 0.499 (0.513)	Data 0.001 (0.010)	Loss 6.0045 (6.0663)	Top-1 acc 2.734 (2.055)	Top-5 acc 10.156 (7.703)	lr 0.04817
Warmup Train [5][2930/3239]	Time 0.403 (0.513)	Data 0.001 (0.010)	Loss 5.9543 (6.0659)	Top-1 acc 1.562 (2.056)	Top-5 acc 7.812 (7.708)	lr 0.04817
Warmup Train [5][2940/3239]	Time 0.353 (0.513)	Data 0.001 (0.010)	Loss 5.8215 (6.0655)	Top-1 acc 3.906 (2.058)	Top-5 acc 13.672 (7.718)	lr 0.04817
Warmup Train [5][2950/3239]	Time 0.497 (0.513)	Data 0.001 (0.010)	Loss 5.8555 (6.0651)	Top-1 acc 3.906 (2.062)	Top-5 acc 10.938 (7.725)	lr 0.04816
Warmup Train [5][2960/3239]	Time 0.445 (0.513)	Data 0.001 (0.010)	Loss 5.9566 (6.0649)	Top-1 acc 1.562 (2.063)	Top-5 acc 10.547 (7.731)	lr 0.04816
Warmup Train [5][2970/3239]	Time 0.513 (0.513)	Data 0.001 (0.010)	Loss 6.0465 (6.0647)	Top-1 acc 4.688 (2.064)	Top-5 acc 9.766 (7.735)	lr 0.04816
Warmup Train [5][2980/3239]	Time 0.694 (0.513)	Data 0.001 (0.010)	Loss 6.0011 (6.0644)	Top-1 acc 0.781 (2.066)	Top-5 acc 9.375 (7.743)	lr 0.04816
Warmup Train [5][2990/3239]	Time 0.485 (0.513)	Data 0.001 (0.010)	Loss 5.8997 (6.0640)	Top-1 acc 3.125 (2.067)	Top-5 acc 10.938 (7.748)	lr 0.04815
Warmup Train [5][3000/3239]	Time 0.505 (0.513)	Data 0.001 (0.010)	Loss 6.0214 (6.0637)	Top-1 acc 1.562 (2.068)	Top-5 acc 8.594 (7.751)	lr 0.04815
Warmup Train [5][3010/3239]	Time 0.564 (0.513)	Data 0.001 (0.010)	Loss 5.9508 (6.0634)	Top-1 acc 2.344 (2.069)	Top-5 acc 9.766 (7.756)	lr 0.04815
Warmup Train [5][3020/3239]	Time 0.599 (0.513)	Data 0.001 (0.010)	Loss 6.0565 (6.0632)	Top-1 acc 2.734 (2.071)	Top-5 acc 8.203 (7.761)	lr 0.04815
Warmup Train [5][3030/3239]	Time 0.471 (0.513)	Data 0.001 (0.010)	Loss 6.1473 (6.0630)	Top-1 acc 1.953 (2.072)	Top-5 acc 5.078 (7.765)	lr 0.04815
Warmup Train [5][3040/3239]	Time 0.374 (0.513)	Data 0.001 (0.010)	Loss 5.9061 (6.0626)	Top-1 acc 1.562 (2.073)	Top-5 acc 10.938 (7.774)	lr 0.04814
Warmup Train [5][3050/3239]	Time 0.412 (0.513)	Data 0.001 (0.010)	Loss 5.9511 (6.0623)	Top-1 acc 2.734 (2.073)	Top-5 acc 13.281 (7.779)	lr 0.04814
Warmup Train [5][3060/3239]	Time 0.552 (0.513)	Data 0.001 (0.010)	Loss 5.9328 (6.0619)	Top-1 acc 3.125 (2.076)	Top-5 acc 8.203 (7.784)	lr 0.04814
Warmup Train [5][3070/3239]	Time 0.447 (0.513)	Data 0.001 (0.010)	Loss 6.0586 (6.0616)	Top-1 acc 1.562 (2.077)	Top-5 acc 5.078 (7.789)	lr 0.04814
Warmup Train [5][3080/3239]	Time 0.449 (0.513)	Data 0.001 (0.010)	Loss 5.9614 (6.0614)	Top-1 acc 2.344 (2.078)	Top-5 acc 8.984 (7.793)	lr 0.04813
Warmup Train [5][3090/3239]	Time 0.700 (0.513)	Data 0.001 (0.010)	Loss 5.8949 (6.0610)	Top-1 acc 3.125 (2.080)	Top-5 acc 14.062 (7.800)	lr 0.04813
Warmup Train [5][3100/3239]	Time 0.610 (0.513)	Data 0.001 (0.010)	Loss 5.8548 (6.0606)	Top-1 acc 2.734 (2.082)	Top-5 acc 10.156 (7.807)	lr 0.04813
Warmup Train [5][3110/3239]	Time 0.678 (0.513)	Data 0.001 (0.010)	Loss 6.0000 (6.0603)	Top-1 acc 2.734 (2.084)	Top-5 acc 10.156 (7.816)	lr 0.04813
Warmup Train [5][3120/3239]	Time 0.545 (0.513)	Data 0.001 (0.010)	Loss 5.9343 (6.0600)	Top-1 acc 3.125 (2.088)	Top-5 acc 10.547 (7.824)	lr 0.04812
Warmup Train [5][3130/3239]	Time 0.558 (0.513)	Data 0.001 (0.010)	Loss 5.9694 (6.0597)	Top-1 acc 1.562 (2.089)	Top-5 acc 8.594 (7.829)	lr 0.04812
Warmup Train [5][3140/3239]	Time 0.649 (0.513)	Data 0.001 (0.010)	Loss 6.0331 (6.0595)	Top-1 acc 2.344 (2.090)	Top-5 acc 9.375 (7.833)	lr 0.04812
Warmup Train [5][3150/3239]	Time 0.474 (0.513)	Data 0.001 (0.010)	Loss 5.9896 (6.0591)	Top-1 acc 2.734 (2.092)	Top-5 acc 8.203 (7.840)	lr 0.04812
Warmup Train [5][3160/3239]	Time 0.534 (0.513)	Data 0.001 (0.010)	Loss 6.0578 (6.0588)	Top-1 acc 2.344 (2.093)	Top-5 acc 10.156 (7.845)	lr 0.04812
Warmup Train [5][3170/3239]	Time 0.564 (0.513)	Data 0.001 (0.009)	Loss 5.9874 (6.0585)	Top-1 acc 0.391 (2.094)	Top-5 acc 7.031 (7.850)	lr 0.04811
Warmup Train [5][3180/3239]	Time 0.506 (0.513)	Data 0.000 (0.009)	Loss 6.0198 (6.0581)	Top-1 acc 1.953 (2.097)	Top-5 acc 8.594 (7.856)	lr 0.04811
Warmup Train [5][3190/3239]	Time 0.643 (0.513)	Data 0.000 (0.009)	Loss 5.9908 (6.0578)	Top-1 acc 3.516 (2.101)	Top-5 acc 10.156 (7.863)	lr 0.04811
Warmup Train [5][3200/3239]	Time 0.505 (0.513)	Data 0.000 (0.009)	Loss 5.8922 (6.0575)	Top-1 acc 3.125 (2.102)	Top-5 acc 10.938 (7.867)	lr 0.04811
Warmup Train [5][3210/3239]	Time 0.304 (0.513)	Data 0.000 (0.009)	Loss 5.9193 (6.0572)	Top-1 acc 3.125 (2.105)	Top-5 acc 12.891 (7.872)	lr 0.04810
Warmup Train [5][3220/3239]	Time 0.478 (0.513)	Data 0.000 (0.009)	Loss 5.9933 (6.0570)	Top-1 acc 5.078 (2.107)	Top-5 acc 8.594 (7.877)	lr 0.04810
Warmup Train [5][3230/3239]	Time 0.470 (0.513)	Data 0.000 (0.009)	Loss 5.8190 (6.0566)	Top-1 acc 4.688 (2.112)	Top-5 acc 14.453 (7.885)	lr 0.04810
Warmup Train [5][3239/3239]	Time 0.327 (0.512)	Data 0.000 (0.009)	Loss 6.2286 (6.0564)	Top-1 acc 1.235 (2.115)	Top-5 acc 6.173 (7.889)	lr 0.04810
==========Warmup Valid [5/40]	loss 5.570	top-1 acc 3.591	top-5 acc 12.184	Train top-1 2.115	top-5 7.889	flops: 442.4M
Warmup Train [6][0/3239]	Time 13.127 (13.127)	Data 12.077 (12.077)	Loss 6.0066 (6.0066)	Top-1 acc 1.953 (1.953)	Top-5 acc 9.375 (9.375)	lr 0.04810
Warmup Train [6][10/3239]	Time 0.575 (1.684)	Data 0.001 (1.100)	Loss 5.9791 (5.9483)	Top-1 acc 2.344 (3.196)	Top-5 acc 10.938 (10.121)	lr 0.04809
Warmup Train [6][20/3239]	Time 0.430 (1.118)	Data 0.002 (0.578)	Loss 5.8955 (5.9380)	Top-1 acc 4.297 (3.311)	Top-5 acc 11.328 (9.803)	lr 0.04809
Warmup Train [6][30/3239]	Time 0.384 (0.914)	Data 0.001 (0.396)	Loss 6.0580 (5.9444)	Top-1 acc 1.172 (2.923)	Top-5 acc 5.469 (9.778)	lr 0.04809
Warmup Train [6][40/3239]	Time 0.195 (0.816)	Data 0.001 (0.303)	Loss 6.0005 (5.9554)	Top-1 acc 2.344 (2.725)	Top-5 acc 8.594 (9.518)	lr 0.04809
Warmup Train [6][50/3239]	Time 0.559 (0.749)	Data 0.001 (0.246)	Loss 6.0290 (5.9631)	Top-1 acc 1.953 (2.650)	Top-5 acc 9.375 (9.367)	lr 0.04809
Warmup Train [6][60/3239]	Time 0.625 (0.706)	Data 0.001 (0.206)	Loss 5.9325 (5.9580)	Top-1 acc 3.125 (2.798)	Top-5 acc 10.547 (9.503)	lr 0.04808
Warmup Train [6][70/3239]	Time 0.753 (0.671)	Data 0.001 (0.178)	Loss 6.0461 (5.9579)	Top-1 acc 0.781 (2.789)	Top-5 acc 7.031 (9.524)	lr 0.04808
Warmup Train [6][80/3239]	Time 0.462 (0.651)	Data 0.001 (0.156)	Loss 5.8651 (5.9538)	Top-1 acc 3.906 (2.826)	Top-5 acc 12.500 (9.578)	lr 0.04808
Warmup Train [6][90/3239]	Time 0.543 (0.637)	Data 0.001 (0.139)	Loss 6.0502 (5.9546)	Top-1 acc 1.562 (2.842)	Top-5 acc 7.812 (9.594)	lr 0.04808
Warmup Train [6][100/3239]	Time 0.654 (0.623)	Data 0.001 (0.126)	Loss 5.9253 (5.9497)	Top-1 acc 3.516 (2.854)	Top-5 acc 7.812 (9.619)	lr 0.04807
Warmup Train [6][110/3239]	Time 0.437 (0.613)	Data 0.001 (0.114)	Loss 5.9823 (5.9487)	Top-1 acc 2.734 (2.847)	Top-5 acc 8.984 (9.579)	lr 0.04807
Warmup Train [6][120/3239]	Time 0.358 (0.606)	Data 0.001 (0.106)	Loss 6.0715 (5.9506)	Top-1 acc 2.344 (2.847)	Top-5 acc 9.375 (9.585)	lr 0.04807
Warmup Train [6][130/3239]	Time 0.575 (0.599)	Data 0.001 (0.099)	Loss 5.8966 (5.9482)	Top-1 acc 2.734 (2.857)	Top-5 acc 12.109 (9.652)	lr 0.04807
Warmup Train [6][140/3239]	Time 0.437 (0.592)	Data 0.001 (0.092)	Loss 5.9523 (5.9495)	Top-1 acc 1.953 (2.798)	Top-5 acc 8.203 (9.619)	lr 0.04806
Warmup Train [6][150/3239]	Time 0.535 (0.588)	Data 0.002 (0.087)	Loss 5.9914 (5.9504)	Top-1 acc 1.172 (2.778)	Top-5 acc 7.812 (9.592)	lr 0.04806
Warmup Train [6][160/3239]	Time 0.348 (0.582)	Data 0.001 (0.081)	Loss 6.0801 (5.9514)	Top-1 acc 1.172 (2.747)	Top-5 acc 7.422 (9.605)	lr 0.04806
Warmup Train [6][170/3239]	Time 0.612 (0.580)	Data 0.001 (0.078)	Loss 5.9296 (5.9515)	Top-1 acc 2.734 (2.748)	Top-5 acc 8.594 (9.613)	lr 0.04806
Warmup Train [6][180/3239]	Time 0.648 (0.576)	Data 0.001 (0.074)	Loss 5.9536 (5.9501)	Top-1 acc 1.562 (2.762)	Top-5 acc 7.422 (9.630)	lr 0.04806
Warmup Train [6][190/3239]	Time 0.605 (0.572)	Data 0.001 (0.070)	Loss 5.9538 (5.9500)	Top-1 acc 3.516 (2.781)	Top-5 acc 8.594 (9.670)	lr 0.04805
Warmup Train [6][200/3239]	Time 0.509 (0.569)	Data 0.001 (0.067)	Loss 5.8459 (5.9501)	Top-1 acc 3.516 (2.799)	Top-5 acc 11.719 (9.657)	lr 0.04805
Warmup Train [6][210/3239]	Time 0.552 (0.566)	Data 0.001 (0.064)	Loss 5.8702 (5.9496)	Top-1 acc 2.344 (2.786)	Top-5 acc 9.766 (9.642)	lr 0.04805
Warmup Train [6][220/3239]	Time 0.534 (0.564)	Data 0.001 (0.061)	Loss 5.9904 (5.9494)	Top-1 acc 1.953 (2.768)	Top-5 acc 9.375 (9.647)	lr 0.04805
Warmup Train [6][230/3239]	Time 0.531 (0.562)	Data 0.001 (0.059)	Loss 6.0106 (5.9497)	Top-1 acc 3.125 (2.775)	Top-5 acc 8.203 (9.649)	lr 0.04804
Warmup Train [6][240/3239]	Time 0.436 (0.558)	Data 0.001 (0.056)	Loss 5.9702 (5.9483)	Top-1 acc 1.562 (2.780)	Top-5 acc 8.203 (9.672)	lr 0.04804
Warmup Train [6][250/3239]	Time 0.378 (0.557)	Data 0.002 (0.055)	Loss 5.9519 (5.9490)	Top-1 acc 3.516 (2.759)	Top-5 acc 12.500 (9.663)	lr 0.04804
Warmup Train [6][260/3239]	Time 0.469 (0.556)	Data 0.001 (0.053)	Loss 5.8886 (5.9494)	Top-1 acc 2.734 (2.778)	Top-5 acc 14.062 (9.659)	lr 0.04804
Warmup Train [6][270/3239]	Time 0.487 (0.554)	Data 0.001 (0.052)	Loss 5.9949 (5.9495)	Top-1 acc 2.344 (2.768)	Top-5 acc 8.984 (9.611)	lr 0.04803
Warmup Train [6][280/3239]	Time 0.657 (0.553)	Data 0.001 (0.050)	Loss 5.8710 (5.9475)	Top-1 acc 5.469 (2.784)	Top-5 acc 16.406 (9.654)	lr 0.04803
Warmup Train [6][290/3239]	Time 0.397 (0.551)	Data 0.002 (0.048)	Loss 5.9430 (5.9468)	Top-1 acc 4.297 (2.792)	Top-5 acc 11.328 (9.685)	lr 0.04803
Warmup Train [6][300/3239]	Time 0.478 (0.549)	Data 0.001 (0.047)	Loss 6.0473 (5.9463)	Top-1 acc 1.172 (2.794)	Top-5 acc 5.078 (9.690)	lr 0.04803
Warmup Train [6][310/3239]	Time 0.543 (0.547)	Data 0.001 (0.045)	Loss 6.0013 (5.9469)	Top-1 acc 2.734 (2.792)	Top-5 acc 7.812 (9.688)	lr 0.04802
Warmup Train [6][320/3239]	Time 0.437 (0.545)	Data 0.001 (0.044)	Loss 5.8972 (5.9465)	Top-1 acc 3.906 (2.793)	Top-5 acc 12.109 (9.680)	lr 0.04802
Warmup Train [6][330/3239]	Time 0.353 (0.543)	Data 0.001 (0.043)	Loss 5.9492 (5.9466)	Top-1 acc 2.734 (2.789)	Top-5 acc 10.547 (9.665)	lr 0.04802
Warmup Train [6][340/3239]	Time 0.449 (0.542)	Data 0.001 (0.042)	Loss 5.9143 (5.9466)	Top-1 acc 3.516 (2.789)	Top-5 acc 11.328 (9.681)	lr 0.04802
Warmup Train [6][350/3239]	Time 0.539 (0.541)	Data 0.001 (0.041)	Loss 5.8821 (5.9462)	Top-1 acc 1.953 (2.790)	Top-5 acc 10.938 (9.684)	lr 0.04801
Warmup Train [6][360/3239]	Time 0.487 (0.540)	Data 0.001 (0.040)	Loss 5.9925 (5.9459)	Top-1 acc 2.734 (2.786)	Top-5 acc 8.594 (9.674)	lr 0.04801
Warmup Train [6][370/3239]	Time 0.455 (0.540)	Data 0.001 (0.039)	Loss 5.9554 (5.9457)	Top-1 acc 3.516 (2.788)	Top-5 acc 10.938 (9.715)	lr 0.04801
Warmup Train [6][380/3239]	Time 0.495 (0.539)	Data 0.001 (0.039)	Loss 5.9432 (5.9462)	Top-1 acc 3.906 (2.782)	Top-5 acc 12.109 (9.703)	lr 0.04801
Warmup Train [6][390/3239]	Time 0.699 (0.539)	Data 0.001 (0.038)	Loss 5.9082 (5.9466)	Top-1 acc 3.906 (2.781)	Top-5 acc 10.938 (9.686)	lr 0.04801
Warmup Train [6][400/3239]	Time 0.607 (0.538)	Data 0.001 (0.037)	Loss 5.9520 (5.9467)	Top-1 acc 1.953 (2.780)	Top-5 acc 7.031 (9.673)	lr 0.04800
Warmup Train [6][410/3239]	Time 0.504 (0.537)	Data 0.001 (0.036)	Loss 5.8811 (5.9466)	Top-1 acc 2.734 (2.780)	Top-5 acc 9.766 (9.685)	lr 0.04800
Warmup Train [6][420/3239]	Time 0.606 (0.537)	Data 0.001 (0.035)	Loss 5.9751 (5.9468)	Top-1 acc 3.125 (2.778)	Top-5 acc 7.422 (9.671)	lr 0.04800
Warmup Train [6][430/3239]	Time 0.516 (0.536)	Data 0.001 (0.035)	Loss 5.9564 (5.9470)	Top-1 acc 3.906 (2.788)	Top-5 acc 8.984 (9.684)	lr 0.04800
Warmup Train [6][440/3239]	Time 0.647 (0.536)	Data 0.001 (0.034)	Loss 5.8972 (5.9460)	Top-1 acc 5.078 (2.795)	Top-5 acc 12.109 (9.712)	lr 0.04799
Warmup Train [6][450/3239]	Time 0.404 (0.535)	Data 0.001 (0.033)	Loss 5.9421 (5.9467)	Top-1 acc 3.516 (2.792)	Top-5 acc 10.156 (9.710)	lr 0.04799
Warmup Train [6][460/3239]	Time 0.344 (0.535)	Data 0.001 (0.033)	Loss 5.9643 (5.9465)	Top-1 acc 3.906 (2.794)	Top-5 acc 11.719 (9.716)	lr 0.04799
Warmup Train [6][470/3239]	Time 0.383 (0.533)	Data 0.001 (0.032)	Loss 5.9088 (5.9465)	Top-1 acc 1.562 (2.787)	Top-5 acc 14.062 (9.725)	lr 0.04799
Warmup Train [6][480/3239]	Time 0.373 (0.533)	Data 0.001 (0.032)	Loss 5.9569 (5.9465)	Top-1 acc 4.297 (2.791)	Top-5 acc 8.203 (9.718)	lr 0.04798
Warmup Train [6][490/3239]	Time 0.517 (0.532)	Data 0.001 (0.032)	Loss 5.9614 (5.9458)	Top-1 acc 2.734 (2.791)	Top-5 acc 8.594 (9.733)	lr 0.04798
Warmup Train [6][500/3239]	Time 0.483 (0.531)	Data 0.001 (0.031)	Loss 5.8337 (5.9450)	Top-1 acc 1.172 (2.793)	Top-5 acc 9.766 (9.753)	lr 0.04798
Warmup Train [6][510/3239]	Time 0.713 (0.531)	Data 0.001 (0.031)	Loss 5.9792 (5.9447)	Top-1 acc 3.516 (2.796)	Top-5 acc 9.375 (9.775)	lr 0.04798
Warmup Train [6][520/3239]	Time 0.600 (0.531)	Data 0.001 (0.030)	Loss 6.0035 (5.9445)	Top-1 acc 1.953 (2.797)	Top-5 acc 8.594 (9.787)	lr 0.04797
Warmup Train [6][530/3239]	Time 0.450 (0.530)	Data 0.001 (0.030)	Loss 5.9960 (5.9444)	Top-1 acc 2.344 (2.804)	Top-5 acc 10.547 (9.799)	lr 0.04797
Warmup Train [6][540/3239]	Time 0.472 (0.530)	Data 0.001 (0.029)	Loss 5.9000 (5.9444)	Top-1 acc 3.125 (2.809)	Top-5 acc 11.328 (9.805)	lr 0.04797
Warmup Train [6][550/3239]	Time 0.541 (0.530)	Data 0.001 (0.029)	Loss 5.8937 (5.9439)	Top-1 acc 2.734 (2.822)	Top-5 acc 10.156 (9.819)	lr 0.04797
Warmup Train [6][560/3239]	Time 0.425 (0.529)	Data 0.001 (0.028)	Loss 6.0028 (5.9443)	Top-1 acc 1.172 (2.814)	Top-5 acc 5.859 (9.801)	lr 0.04796
Warmup Train [6][570/3239]	Time 0.497 (0.529)	Data 0.001 (0.028)	Loss 5.8030 (5.9442)	Top-1 acc 4.297 (2.814)	Top-5 acc 12.891 (9.802)	lr 0.04796
Warmup Train [6][580/3239]	Time 0.389 (0.527)	Data 0.001 (0.028)	Loss 5.9601 (5.9440)	Top-1 acc 2.734 (2.815)	Top-5 acc 10.938 (9.818)	lr 0.04796
Warmup Train [6][590/3239]	Time 0.595 (0.527)	Data 0.001 (0.027)	Loss 5.9971 (5.9437)	Top-1 acc 3.516 (2.817)	Top-5 acc 12.109 (9.822)	lr 0.04796
Warmup Train [6][600/3239]	Time 0.174 (0.525)	Data 0.001 (0.027)	Loss 5.8833 (5.9439)	Top-1 acc 1.562 (2.821)	Top-5 acc 11.328 (9.820)	lr 0.04796
Warmup Train [6][610/3239]	Time 0.553 (0.526)	Data 0.001 (0.027)	Loss 5.8324 (5.9433)	Top-1 acc 4.297 (2.822)	Top-5 acc 12.109 (9.833)	lr 0.04795
Warmup Train [6][620/3239]	Time 0.742 (0.525)	Data 0.001 (0.026)	Loss 5.8556 (5.9429)	Top-1 acc 3.125 (2.829)	Top-5 acc 11.328 (9.834)	lr 0.04795
Warmup Train [6][630/3239]	Time 0.526 (0.525)	Data 0.001 (0.026)	Loss 6.0380 (5.9427)	Top-1 acc 0.391 (2.825)	Top-5 acc 7.031 (9.839)	lr 0.04795
Warmup Train [6][640/3239]	Time 0.499 (0.525)	Data 0.001 (0.026)	Loss 5.8295 (5.9422)	Top-1 acc 3.516 (2.822)	Top-5 acc 12.891 (9.845)	lr 0.04795
Warmup Train [6][650/3239]	Time 0.526 (0.524)	Data 0.001 (0.025)	Loss 5.7874 (5.9416)	Top-1 acc 5.078 (2.829)	Top-5 acc 10.938 (9.858)	lr 0.04794
Warmup Train [6][660/3239]	Time 0.639 (0.524)	Data 0.001 (0.025)	Loss 5.9872 (5.9410)	Top-1 acc 3.516 (2.837)	Top-5 acc 7.422 (9.874)	lr 0.04794
Warmup Train [6][670/3239]	Time 0.498 (0.524)	Data 0.001 (0.025)	Loss 5.9821 (5.9403)	Top-1 acc 2.734 (2.841)	Top-5 acc 10.156 (9.893)	lr 0.04794
Warmup Train [6][680/3239]	Time 0.580 (0.524)	Data 0.001 (0.024)	Loss 5.8404 (5.9398)	Top-1 acc 4.297 (2.846)	Top-5 acc 13.281 (9.908)	lr 0.04794
Warmup Train [6][690/3239]	Time 0.494 (0.524)	Data 0.003 (0.024)	Loss 5.8564 (5.9393)	Top-1 acc 4.297 (2.851)	Top-5 acc 12.891 (9.930)	lr 0.04793
Warmup Train [6][700/3239]	Time 0.601 (0.524)	Data 0.001 (0.024)	Loss 5.8162 (5.9388)	Top-1 acc 3.906 (2.854)	Top-5 acc 11.719 (9.939)	lr 0.04793
Warmup Train [6][710/3239]	Time 0.526 (0.524)	Data 0.001 (0.023)	Loss 5.9137 (5.9386)	Top-1 acc 3.125 (2.860)	Top-5 acc 9.766 (9.946)	lr 0.04793
Warmup Train [6][720/3239]	Time 0.301 (0.523)	Data 0.001 (0.023)	Loss 5.9493 (5.9382)	Top-1 acc 2.734 (2.861)	Top-5 acc 9.766 (9.964)	lr 0.04793
Warmup Train [6][730/3239]	Time 0.719 (0.524)	Data 0.001 (0.023)	Loss 5.9240 (5.9375)	Top-1 acc 3.516 (2.866)	Top-5 acc 9.766 (9.975)	lr 0.04792
Warmup Train [6][740/3239]	Time 0.534 (0.524)	Data 0.001 (0.023)	Loss 5.9731 (5.9374)	Top-1 acc 3.516 (2.865)	Top-5 acc 9.375 (9.984)	lr 0.04792
Warmup Train [6][750/3239]	Time 0.420 (0.524)	Data 0.002 (0.022)	Loss 5.8533 (5.9369)	Top-1 acc 4.297 (2.870)	Top-5 acc 13.281 (10.001)	lr 0.04792
Warmup Train [6][760/3239]	Time 0.465 (0.524)	Data 0.001 (0.022)	Loss 5.8573 (5.9368)	Top-1 acc 3.125 (2.873)	Top-5 acc 10.938 (10.000)	lr 0.04792
Warmup Train [6][770/3239]	Time 0.561 (0.524)	Data 0.001 (0.022)	Loss 6.0093 (5.9365)	Top-1 acc 1.172 (2.875)	Top-5 acc 5.078 (10.014)	lr 0.04791
Warmup Train [6][780/3239]	Time 0.632 (0.524)	Data 0.001 (0.022)	Loss 5.9450 (5.9357)	Top-1 acc 1.562 (2.873)	Top-5 acc 10.547 (10.028)	lr 0.04791
Warmup Train [6][790/3239]	Time 0.522 (0.524)	Data 0.001 (0.022)	Loss 5.8969 (5.9349)	Top-1 acc 2.344 (2.876)	Top-5 acc 12.500 (10.044)	lr 0.04791
Warmup Train [6][800/3239]	Time 0.401 (0.523)	Data 0.001 (0.021)	Loss 5.9396 (5.9347)	Top-1 acc 1.562 (2.878)	Top-5 acc 8.984 (10.047)	lr 0.04791
Warmup Train [6][810/3239]	Time 0.617 (0.523)	Data 0.001 (0.021)	Loss 5.9190 (5.9340)	Top-1 acc 4.297 (2.886)	Top-5 acc 9.375 (10.061)	lr 0.04790
Warmup Train [6][820/3239]	Time 0.415 (0.523)	Data 0.001 (0.021)	Loss 5.9270 (5.9338)	Top-1 acc 2.344 (2.879)	Top-5 acc 9.766 (10.058)	lr 0.04790
Warmup Train [6][830/3239]	Time 0.542 (0.523)	Data 0.001 (0.021)	Loss 6.0580 (5.9336)	Top-1 acc 5.078 (2.885)	Top-5 acc 10.547 (10.064)	lr 0.04790
Warmup Train [6][840/3239]	Time 0.605 (0.522)	Data 0.001 (0.021)	Loss 5.9180 (5.9331)	Top-1 acc 1.172 (2.892)	Top-5 acc 8.203 (10.078)	lr 0.04790
Warmup Train [6][850/3239]	Time 0.365 (0.521)	Data 0.001 (0.021)	Loss 5.8836 (5.9325)	Top-1 acc 2.734 (2.894)	Top-5 acc 8.984 (10.077)	lr 0.04789
Warmup Train [6][860/3239]	Time 0.625 (0.521)	Data 0.023 (0.020)	Loss 5.9452 (5.9325)	Top-1 acc 3.516 (2.899)	Top-5 acc 12.500 (10.085)	lr 0.04789
Warmup Train [6][870/3239]	Time 0.518 (0.521)	Data 0.001 (0.020)	Loss 5.8871 (5.9324)	Top-1 acc 2.734 (2.904)	Top-5 acc 11.719 (10.089)	lr 0.04789
Warmup Train [6][880/3239]	Time 0.501 (0.521)	Data 0.001 (0.020)	Loss 5.9109 (5.9321)	Top-1 acc 1.562 (2.899)	Top-5 acc 10.938 (10.093)	lr 0.04789
Warmup Train [6][890/3239]	Time 0.617 (0.521)	Data 0.001 (0.020)	Loss 5.9033 (5.9320)	Top-1 acc 3.516 (2.899)	Top-5 acc 12.891 (10.094)	lr 0.04789
Warmup Train [6][900/3239]	Time 0.619 (0.521)	Data 0.001 (0.020)	Loss 5.8603 (5.9318)	Top-1 acc 1.953 (2.896)	Top-5 acc 12.109 (10.106)	lr 0.04788
Warmup Train [6][910/3239]	Time 0.609 (0.521)	Data 0.001 (0.020)	Loss 5.8586 (5.9313)	Top-1 acc 2.734 (2.900)	Top-5 acc 13.672 (10.116)	lr 0.04788
Warmup Train [6][920/3239]	Time 0.555 (0.521)	Data 0.001 (0.019)	Loss 5.7804 (5.9312)	Top-1 acc 3.906 (2.902)	Top-5 acc 14.453 (10.122)	lr 0.04788
Warmup Train [6][930/3239]	Time 0.610 (0.521)	Data 0.001 (0.019)	Loss 5.9823 (5.9310)	Top-1 acc 3.906 (2.906)	Top-5 acc 11.719 (10.131)	lr 0.04788
Warmup Train [6][940/3239]	Time 0.438 (0.521)	Data 0.001 (0.019)	Loss 5.7053 (5.9308)	Top-1 acc 4.297 (2.907)	Top-5 acc 15.625 (10.138)	lr 0.04787
Warmup Train [6][950/3239]	Time 0.578 (0.520)	Data 0.001 (0.019)	Loss 5.8852 (5.9308)	Top-1 acc 4.688 (2.908)	Top-5 acc 12.500 (10.140)	lr 0.04787
Warmup Train [6][960/3239]	Time 0.533 (0.520)	Data 0.001 (0.019)	Loss 6.0149 (5.9307)	Top-1 acc 3.516 (2.910)	Top-5 acc 7.422 (10.141)	lr 0.04787
Warmup Train [6][970/3239]	Time 0.577 (0.520)	Data 0.001 (0.019)	Loss 5.9226 (5.9304)	Top-1 acc 4.688 (2.914)	Top-5 acc 14.062 (10.148)	lr 0.04787
Warmup Train [6][980/3239]	Time 0.494 (0.520)	Data 0.001 (0.018)	Loss 5.9842 (5.9301)	Top-1 acc 3.125 (2.911)	Top-5 acc 11.719 (10.153)	lr 0.04786
Warmup Train [6][990/3239]	Time 0.617 (0.520)	Data 0.001 (0.018)	Loss 6.0020 (5.9300)	Top-1 acc 1.562 (2.913)	Top-5 acc 10.156 (10.157)	lr 0.04786
Warmup Train [6][1000/3239]	Time 0.598 (0.520)	Data 0.001 (0.018)	Loss 5.8908 (5.9297)	Top-1 acc 3.125 (2.912)	Top-5 acc 12.109 (10.153)	lr 0.04786
Warmup Train [6][1010/3239]	Time 0.505 (0.520)	Data 0.001 (0.018)	Loss 5.8692 (5.9293)	Top-1 acc 2.734 (2.906)	Top-5 acc 10.156 (10.149)	lr 0.04786
Warmup Train [6][1020/3239]	Time 0.592 (0.519)	Data 0.001 (0.018)	Loss 5.8851 (5.9288)	Top-1 acc 2.734 (2.915)	Top-5 acc 10.156 (10.162)	lr 0.04785
Warmup Train [6][1030/3239]	Time 0.459 (0.519)	Data 0.001 (0.018)	Loss 5.8985 (5.9285)	Top-1 acc 5.078 (2.917)	Top-5 acc 10.156 (10.164)	lr 0.04785
Warmup Train [6][1040/3239]	Time 0.664 (0.520)	Data 0.001 (0.018)	Loss 5.8372 (5.9282)	Top-1 acc 3.516 (2.913)	Top-5 acc 11.328 (10.166)	lr 0.04785
Warmup Train [6][1050/3239]	Time 0.482 (0.519)	Data 0.001 (0.018)	Loss 5.9280 (5.9284)	Top-1 acc 5.078 (2.912)	Top-5 acc 11.719 (10.166)	lr 0.04785
Warmup Train [6][1060/3239]	Time 0.435 (0.519)	Data 0.001 (0.017)	Loss 5.9606 (5.9279)	Top-1 acc 2.734 (2.916)	Top-5 acc 11.328 (10.174)	lr 0.04784
Warmup Train [6][1070/3239]	Time 0.514 (0.519)	Data 0.001 (0.017)	Loss 6.0272 (5.9278)	Top-1 acc 2.734 (2.919)	Top-5 acc 6.250 (10.180)	lr 0.04784
Warmup Train [6][1080/3239]	Time 0.494 (0.519)	Data 0.001 (0.017)	Loss 5.8370 (5.9277)	Top-1 acc 1.953 (2.919)	Top-5 acc 12.109 (10.179)	lr 0.04784
Warmup Train [6][1090/3239]	Time 0.530 (0.519)	Data 0.001 (0.017)	Loss 5.9372 (5.9274)	Top-1 acc 1.562 (2.919)	Top-5 acc 10.156 (10.190)	lr 0.04784
Warmup Train [6][1100/3239]	Time 0.455 (0.519)	Data 0.001 (0.017)	Loss 5.8737 (5.9269)	Top-1 acc 3.906 (2.919)	Top-5 acc 11.719 (10.197)	lr 0.04783
Warmup Train [6][1110/3239]	Time 0.412 (0.518)	Data 0.001 (0.017)	Loss 5.8904 (5.9266)	Top-1 acc 3.906 (2.923)	Top-5 acc 11.719 (10.206)	lr 0.04783
Warmup Train [6][1120/3239]	Time 0.338 (0.518)	Data 0.001 (0.017)	Loss 5.8801 (5.9261)	Top-1 acc 2.344 (2.926)	Top-5 acc 12.891 (10.222)	lr 0.04783
Warmup Train [6][1130/3239]	Time 0.384 (0.518)	Data 0.001 (0.017)	Loss 5.8989 (5.9259)	Top-1 acc 1.953 (2.925)	Top-5 acc 12.500 (10.228)	lr 0.04783
Warmup Train [6][1140/3239]	Time 0.656 (0.518)	Data 0.001 (0.017)	Loss 5.9050 (5.9258)	Top-1 acc 3.516 (2.927)	Top-5 acc 10.938 (10.238)	lr 0.04782
Warmup Train [6][1150/3239]	Time 0.618 (0.517)	Data 0.001 (0.017)	Loss 5.9101 (5.9257)	Top-1 acc 1.953 (2.930)	Top-5 acc 10.156 (10.239)	lr 0.04782
Warmup Train [6][1160/3239]	Time 0.411 (0.517)	Data 0.001 (0.017)	Loss 5.8374 (5.9253)	Top-1 acc 6.641 (2.933)	Top-5 acc 16.016 (10.248)	lr 0.04782
Warmup Train [6][1170/3239]	Time 0.429 (0.517)	Data 0.001 (0.016)	Loss 5.7986 (5.9251)	Top-1 acc 5.078 (2.938)	Top-5 acc 14.453 (10.253)	lr 0.04782
Warmup Train [6][1180/3239]	Time 0.447 (0.517)	Data 0.001 (0.016)	Loss 5.9093 (5.9250)	Top-1 acc 2.734 (2.941)	Top-5 acc 10.156 (10.254)	lr 0.04781
Warmup Train [6][1190/3239]	Time 0.458 (0.517)	Data 0.001 (0.016)	Loss 5.9447 (5.9249)	Top-1 acc 2.344 (2.940)	Top-5 acc 8.984 (10.258)	lr 0.04781
Warmup Train [6][1200/3239]	Time 0.477 (0.517)	Data 0.001 (0.016)	Loss 5.8866 (5.9245)	Top-1 acc 0.781 (2.940)	Top-5 acc 10.156 (10.265)	lr 0.04781
Warmup Train [6][1210/3239]	Time 0.377 (0.517)	Data 0.001 (0.016)	Loss 5.8874 (5.9243)	Top-1 acc 3.516 (2.947)	Top-5 acc 9.766 (10.282)	lr 0.04781
Warmup Train [6][1220/3239]	Time 0.637 (0.517)	Data 0.001 (0.016)	Loss 5.8795 (5.9240)	Top-1 acc 3.516 (2.948)	Top-5 acc 10.938 (10.290)	lr 0.04780
Warmup Train [6][1230/3239]	Time 0.387 (0.517)	Data 0.001 (0.016)	Loss 5.8627 (5.9239)	Top-1 acc 3.125 (2.947)	Top-5 acc 12.500 (10.289)	lr 0.04780
Warmup Train [6][1240/3239]	Time 0.432 (0.517)	Data 0.001 (0.016)	Loss 5.9200 (5.9237)	Top-1 acc 1.953 (2.947)	Top-5 acc 10.156 (10.294)	lr 0.04780
Warmup Train [6][1250/3239]	Time 0.494 (0.517)	Data 0.001 (0.016)	Loss 5.8992 (5.9235)	Top-1 acc 3.906 (2.945)	Top-5 acc 11.328 (10.294)	lr 0.04780
Warmup Train [6][1260/3239]	Time 0.524 (0.517)	Data 0.001 (0.016)	Loss 5.8621 (5.9233)	Top-1 acc 3.516 (2.948)	Top-5 acc 12.109 (10.301)	lr 0.04779
Warmup Train [6][1270/3239]	Time 0.505 (0.517)	Data 0.001 (0.016)	Loss 5.9134 (5.9233)	Top-1 acc 4.297 (2.946)	Top-5 acc 9.766 (10.299)	lr 0.04779
Warmup Train [6][1280/3239]	Time 0.403 (0.517)	Data 0.001 (0.016)	Loss 6.0018 (5.9233)	Top-1 acc 3.906 (2.952)	Top-5 acc 10.156 (10.305)	lr 0.04779
Warmup Train [6][1290/3239]	Time 0.407 (0.517)	Data 0.001 (0.016)	Loss 5.8246 (5.9230)	Top-1 acc 3.906 (2.954)	Top-5 acc 14.062 (10.313)	lr 0.04779
Warmup Train [6][1300/3239]	Time 0.638 (0.517)	Data 0.001 (0.016)	Loss 5.9547 (5.9227)	Top-1 acc 2.344 (2.958)	Top-5 acc 9.766 (10.323)	lr 0.04778
Warmup Train [6][1310/3239]	Time 0.373 (0.517)	Data 0.001 (0.016)	Loss 5.9777 (5.9225)	Top-1 acc 2.344 (2.957)	Top-5 acc 7.812 (10.325)	lr 0.04778
Warmup Train [6][1320/3239]	Time 0.564 (0.517)	Data 0.001 (0.016)	Loss 6.0028 (5.9223)	Top-1 acc 4.297 (2.961)	Top-5 acc 7.031 (10.323)	lr 0.04778
Warmup Train [6][1330/3239]	Time 0.417 (0.517)	Data 0.001 (0.016)	Loss 5.8708 (5.9218)	Top-1 acc 3.516 (2.966)	Top-5 acc 12.500 (10.343)	lr 0.04778
Warmup Train [6][1340/3239]	Time 0.565 (0.517)	Data 0.001 (0.016)	Loss 5.8832 (5.9214)	Top-1 acc 1.562 (2.969)	Top-5 acc 10.156 (10.350)	lr 0.04777
Warmup Train [6][1350/3239]	Time 0.516 (0.517)	Data 0.001 (0.016)	Loss 5.7832 (5.9209)	Top-1 acc 1.172 (2.970)	Top-5 acc 8.984 (10.353)	lr 0.04777
Warmup Train [6][1360/3239]	Time 0.660 (0.517)	Data 0.001 (0.015)	Loss 5.8367 (5.9205)	Top-1 acc 5.859 (2.978)	Top-5 acc 10.938 (10.358)	lr 0.04777
Warmup Train [6][1370/3239]	Time 0.483 (0.517)	Data 0.001 (0.015)	Loss 5.8779 (5.9202)	Top-1 acc 2.734 (2.980)	Top-5 acc 10.547 (10.360)	lr 0.04777
Warmup Train [6][1380/3239]	Time 0.454 (0.517)	Data 0.001 (0.015)	Loss 5.8886 (5.9200)	Top-1 acc 2.734 (2.983)	Top-5 acc 11.719 (10.363)	lr 0.04776
Warmup Train [6][1390/3239]	Time 0.404 (0.516)	Data 0.001 (0.015)	Loss 5.9698 (5.9196)	Top-1 acc 3.906 (2.987)	Top-5 acc 11.328 (10.369)	lr 0.04776
Warmup Train [6][1400/3239]	Time 0.497 (0.516)	Data 0.002 (0.015)	Loss 5.8505 (5.9194)	Top-1 acc 3.906 (2.989)	Top-5 acc 14.453 (10.377)	lr 0.04776
Warmup Train [6][1410/3239]	Time 0.561 (0.516)	Data 0.001 (0.015)	Loss 5.8852 (5.9194)	Top-1 acc 1.562 (2.989)	Top-5 acc 11.328 (10.379)	lr 0.04776
Warmup Train [6][1420/3239]	Time 0.440 (0.516)	Data 0.001 (0.015)	Loss 5.8927 (5.9190)	Top-1 acc 3.516 (2.994)	Top-5 acc 9.375 (10.384)	lr 0.04775
Warmup Train [6][1430/3239]	Time 0.461 (0.516)	Data 0.001 (0.015)	Loss 5.8903 (5.9188)	Top-1 acc 5.469 (2.999)	Top-5 acc 10.156 (10.383)	lr 0.04775
Warmup Train [6][1440/3239]	Time 0.475 (0.516)	Data 0.001 (0.015)	Loss 5.9323 (5.9186)	Top-1 acc 1.562 (2.999)	Top-5 acc 8.203 (10.386)	lr 0.04775
Warmup Train [6][1450/3239]	Time 0.358 (0.516)	Data 0.001 (0.015)	Loss 5.9172 (5.9183)	Top-1 acc 3.125 (3.001)	Top-5 acc 10.156 (10.387)	lr 0.04775
Warmup Train [6][1460/3239]	Time 0.523 (0.516)	Data 0.001 (0.015)	Loss 5.8620 (5.9180)	Top-1 acc 2.734 (3.004)	Top-5 acc 12.109 (10.394)	lr 0.04774
Warmup Train [6][1470/3239]	Time 0.365 (0.516)	Data 0.001 (0.015)	Loss 5.7894 (5.9176)	Top-1 acc 3.906 (3.009)	Top-5 acc 9.375 (10.411)	lr 0.04774
Warmup Train [6][1480/3239]	Time 0.611 (0.516)	Data 0.001 (0.015)	Loss 5.7935 (5.9171)	Top-1 acc 4.297 (3.012)	Top-5 acc 12.109 (10.423)	lr 0.04774
Warmup Train [6][1490/3239]	Time 0.574 (0.516)	Data 0.001 (0.015)	Loss 5.8850 (5.9169)	Top-1 acc 4.297 (3.019)	Top-5 acc 10.547 (10.432)	lr 0.04774
Warmup Train [6][1500/3239]	Time 0.666 (0.516)	Data 0.001 (0.015)	Loss 6.0159 (5.9167)	Top-1 acc 0.781 (3.016)	Top-5 acc 7.031 (10.436)	lr 0.04773
Warmup Train [6][1510/3239]	Time 0.604 (0.516)	Data 0.001 (0.015)	Loss 5.7728 (5.9161)	Top-1 acc 3.516 (3.020)	Top-5 acc 17.188 (10.449)	lr 0.04773
Warmup Train [6][1520/3239]	Time 0.413 (0.516)	Data 0.002 (0.015)	Loss 5.9418 (5.9158)	Top-1 acc 1.953 (3.020)	Top-5 acc 12.109 (10.454)	lr 0.04773
Warmup Train [6][1530/3239]	Time 0.449 (0.516)	Data 0.001 (0.015)	Loss 5.8632 (5.9156)	Top-1 acc 3.516 (3.018)	Top-5 acc 9.766 (10.457)	lr 0.04773
Warmup Train [6][1540/3239]	Time 0.566 (0.516)	Data 0.001 (0.014)	Loss 5.8204 (5.9150)	Top-1 acc 3.516 (3.024)	Top-5 acc 8.984 (10.462)	lr 0.04772
Warmup Train [6][1550/3239]	Time 0.518 (0.516)	Data 0.001 (0.014)	Loss 5.9978 (5.9151)	Top-1 acc 2.344 (3.029)	Top-5 acc 7.812 (10.465)	lr 0.04772
Warmup Train [6][1560/3239]	Time 0.372 (0.516)	Data 0.001 (0.014)	Loss 5.9279 (5.9149)	Top-1 acc 1.953 (3.034)	Top-5 acc 7.812 (10.466)	lr 0.04772
Warmup Train [6][1570/3239]	Time 0.537 (0.516)	Data 0.001 (0.014)	Loss 6.0947 (5.9148)	Top-1 acc 2.344 (3.042)	Top-5 acc 7.422 (10.475)	lr 0.04772
Warmup Train [6][1580/3239]	Time 0.455 (0.516)	Data 0.001 (0.014)	Loss 5.8665 (5.9145)	Top-1 acc 5.859 (3.047)	Top-5 acc 10.547 (10.476)	lr 0.04771
Warmup Train [6][1590/3239]	Time 0.599 (0.516)	Data 0.001 (0.014)	Loss 5.8959 (5.9142)	Top-1 acc 5.078 (3.051)	Top-5 acc 12.109 (10.480)	lr 0.04771
Warmup Train [6][1600/3239]	Time 0.286 (0.516)	Data 0.001 (0.014)	Loss 5.8400 (5.9140)	Top-1 acc 3.906 (3.053)	Top-5 acc 9.766 (10.483)	lr 0.04771
Warmup Train [6][1610/3239]	Time 0.516 (0.516)	Data 0.002 (0.014)	Loss 5.8687 (5.9136)	Top-1 acc 4.297 (3.053)	Top-5 acc 13.672 (10.490)	lr 0.04771
Warmup Train [6][1620/3239]	Time 0.393 (0.516)	Data 0.001 (0.014)	Loss 6.0042 (5.9135)	Top-1 acc 3.906 (3.054)	Top-5 acc 11.719 (10.500)	lr 0.04770
Warmup Train [6][1630/3239]	Time 0.584 (0.516)	Data 0.001 (0.014)	Loss 5.8004 (5.9133)	Top-1 acc 2.344 (3.056)	Top-5 acc 10.547 (10.498)	lr 0.04770
Warmup Train [6][1640/3239]	Time 0.470 (0.516)	Data 0.001 (0.014)	Loss 5.8227 (5.9130)	Top-1 acc 5.859 (3.059)	Top-5 acc 12.500 (10.500)	lr 0.04770
Warmup Train [6][1650/3239]	Time 0.463 (0.515)	Data 0.001 (0.014)	Loss 5.8769 (5.9130)	Top-1 acc 2.344 (3.060)	Top-5 acc 10.547 (10.501)	lr 0.04770
Warmup Train [6][1660/3239]	Time 0.475 (0.515)	Data 0.001 (0.014)	Loss 5.9187 (5.9127)	Top-1 acc 3.125 (3.064)	Top-5 acc 9.766 (10.506)	lr 0.04769
Warmup Train [6][1670/3239]	Time 0.419 (0.515)	Data 0.002 (0.014)	Loss 5.7129 (5.9126)	Top-1 acc 5.078 (3.063)	Top-5 acc 14.062 (10.505)	lr 0.04769
Warmup Train [6][1680/3239]	Time 0.523 (0.515)	Data 0.001 (0.014)	Loss 5.8043 (5.9123)	Top-1 acc 3.906 (3.064)	Top-5 acc 14.453 (10.512)	lr 0.04769
Warmup Train [6][1690/3239]	Time 0.637 (0.515)	Data 0.001 (0.014)	Loss 5.8697 (5.9121)	Top-1 acc 3.906 (3.067)	Top-5 acc 13.672 (10.515)	lr 0.04769
Warmup Train [6][1700/3239]	Time 0.510 (0.515)	Data 0.001 (0.014)	Loss 5.8600 (5.9119)	Top-1 acc 5.078 (3.071)	Top-5 acc 12.109 (10.520)	lr 0.04768
Warmup Train [6][1710/3239]	Time 0.525 (0.515)	Data 0.001 (0.014)	Loss 5.8633 (5.9114)	Top-1 acc 1.953 (3.076)	Top-5 acc 7.031 (10.532)	lr 0.04768
Warmup Train [6][1720/3239]	Time 0.455 (0.515)	Data 0.001 (0.014)	Loss 5.8785 (5.9113)	Top-1 acc 5.078 (3.077)	Top-5 acc 12.500 (10.532)	lr 0.04768
Warmup Train [6][1730/3239]	Time 0.383 (0.515)	Data 0.001 (0.014)	Loss 5.7717 (5.9110)	Top-1 acc 5.469 (3.076)	Top-5 acc 14.844 (10.534)	lr 0.04768
Warmup Train [6][1740/3239]	Time 0.490 (0.515)	Data 0.001 (0.014)	Loss 5.8949 (5.9107)	Top-1 acc 3.516 (3.079)	Top-5 acc 11.719 (10.535)	lr 0.04767
Warmup Train [6][1750/3239]	Time 0.461 (0.515)	Data 0.001 (0.013)	Loss 5.8672 (5.9106)	Top-1 acc 3.125 (3.081)	Top-5 acc 12.109 (10.543)	lr 0.04767
Warmup Train [6][1760/3239]	Time 0.423 (0.515)	Data 0.001 (0.013)	Loss 5.8862 (5.9102)	Top-1 acc 2.344 (3.085)	Top-5 acc 9.766 (10.550)	lr 0.04767
Warmup Train [6][1770/3239]	Time 0.626 (0.515)	Data 0.001 (0.013)	Loss 5.9653 (5.9102)	Top-1 acc 2.734 (3.087)	Top-5 acc 8.984 (10.552)	lr 0.04767
Warmup Train [6][1780/3239]	Time 0.494 (0.515)	Data 0.001 (0.013)	Loss 5.8689 (5.9099)	Top-1 acc 1.953 (3.089)	Top-5 acc 8.203 (10.555)	lr 0.04766
Warmup Train [6][1790/3239]	Time 0.590 (0.515)	Data 0.001 (0.013)	Loss 5.8749 (5.9099)	Top-1 acc 3.906 (3.089)	Top-5 acc 10.156 (10.556)	lr 0.04766
Warmup Train [6][1800/3239]	Time 0.529 (0.515)	Data 0.001 (0.013)	Loss 5.9007 (5.9097)	Top-1 acc 3.906 (3.091)	Top-5 acc 10.938 (10.564)	lr 0.04766
Warmup Train [6][1810/3239]	Time 0.476 (0.515)	Data 0.001 (0.013)	Loss 6.0049 (5.9095)	Top-1 acc 2.734 (3.093)	Top-5 acc 9.375 (10.571)	lr 0.04766
Warmup Train [6][1820/3239]	Time 0.518 (0.515)	Data 0.001 (0.013)	Loss 5.8092 (5.9093)	Top-1 acc 4.688 (3.098)	Top-5 acc 14.844 (10.574)	lr 0.04765
Warmup Train [6][1830/3239]	Time 0.575 (0.515)	Data 0.002 (0.013)	Loss 5.8784 (5.9092)	Top-1 acc 3.125 (3.103)	Top-5 acc 14.453 (10.577)	lr 0.04765
Warmup Train [6][1840/3239]	Time 0.524 (0.515)	Data 0.001 (0.013)	Loss 5.9511 (5.9091)	Top-1 acc 1.562 (3.103)	Top-5 acc 9.375 (10.583)	lr 0.04765
Warmup Train [6][1850/3239]	Time 0.420 (0.515)	Data 0.001 (0.013)	Loss 5.7842 (5.9088)	Top-1 acc 3.516 (3.105)	Top-5 acc 15.234 (10.590)	lr 0.04764
Warmup Train [6][1860/3239]	Time 0.502 (0.515)	Data 0.001 (0.013)	Loss 5.7355 (5.9085)	Top-1 acc 5.469 (3.108)	Top-5 acc 15.625 (10.598)	lr 0.04764
Warmup Train [6][1870/3239]	Time 0.410 (0.515)	Data 0.001 (0.013)	Loss 5.8585 (5.9082)	Top-1 acc 5.469 (3.116)	Top-5 acc 11.328 (10.609)	lr 0.04764
Warmup Train [6][1880/3239]	Time 0.606 (0.515)	Data 0.001 (0.013)	Loss 5.8404 (5.9079)	Top-1 acc 3.125 (3.119)	Top-5 acc 7.812 (10.613)	lr 0.04764
Warmup Train [6][1890/3239]	Time 0.599 (0.515)	Data 0.001 (0.013)	Loss 6.0636 (5.9077)	Top-1 acc 1.953 (3.119)	Top-5 acc 8.203 (10.617)	lr 0.04763
Warmup Train [6][1900/3239]	Time 0.495 (0.515)	Data 0.001 (0.013)	Loss 5.8141 (5.9074)	Top-1 acc 5.469 (3.123)	Top-5 acc 11.719 (10.626)	lr 0.04763
Warmup Train [6][1910/3239]	Time 0.467 (0.515)	Data 0.001 (0.013)	Loss 5.8576 (5.9072)	Top-1 acc 0.781 (3.124)	Top-5 acc 10.547 (10.630)	lr 0.04763
Warmup Train [6][1920/3239]	Time 0.590 (0.514)	Data 0.001 (0.013)	Loss 5.8647 (5.9071)	Top-1 acc 2.344 (3.125)	Top-5 acc 10.547 (10.632)	lr 0.04763
Warmup Train [6][1930/3239]	Time 0.408 (0.514)	Data 0.029 (0.013)	Loss 5.7658 (5.9067)	Top-1 acc 5.469 (3.127)	Top-5 acc 16.016 (10.643)	lr 0.04762
Warmup Train [6][1940/3239]	Time 0.515 (0.514)	Data 0.001 (0.013)	Loss 5.8899 (5.9062)	Top-1 acc 2.734 (3.132)	Top-5 acc 12.500 (10.655)	lr 0.04762
Warmup Train [6][1950/3239]	Time 0.497 (0.514)	Data 0.001 (0.013)	Loss 5.8386 (5.9060)	Top-1 acc 1.953 (3.131)	Top-5 acc 10.156 (10.660)	lr 0.04762
Warmup Train [6][1960/3239]	Time 0.424 (0.514)	Data 0.001 (0.013)	Loss 5.9106 (5.9060)	Top-1 acc 3.906 (3.131)	Top-5 acc 10.156 (10.665)	lr 0.04762
Warmup Train [6][1970/3239]	Time 0.495 (0.514)	Data 0.001 (0.013)	Loss 5.9993 (5.9058)	Top-1 acc 3.125 (3.134)	Top-5 acc 8.984 (10.670)	lr 0.04761
Warmup Train [6][1980/3239]	Time 0.519 (0.514)	Data 0.001 (0.013)	Loss 5.8715 (5.9055)	Top-1 acc 0.781 (3.134)	Top-5 acc 8.984 (10.673)	lr 0.04761
Warmup Train [6][1990/3239]	Time 0.590 (0.514)	Data 0.001 (0.012)	Loss 5.8590 (5.9053)	Top-1 acc 1.562 (3.138)	Top-5 acc 10.938 (10.680)	lr 0.04761
Warmup Train [6][2000/3239]	Time 0.618 (0.514)	Data 0.001 (0.012)	Loss 5.7501 (5.9050)	Top-1 acc 3.906 (3.141)	Top-5 acc 14.062 (10.684)	lr 0.04761
Warmup Train [6][2010/3239]	Time 0.522 (0.514)	Data 0.001 (0.012)	Loss 5.8361 (5.9046)	Top-1 acc 1.953 (3.144)	Top-5 acc 8.594 (10.690)	lr 0.04760
Warmup Train [6][2020/3239]	Time 0.497 (0.514)	Data 0.001 (0.012)	Loss 5.8248 (5.9045)	Top-1 acc 5.078 (3.145)	Top-5 acc 11.719 (10.693)	lr 0.04760
Warmup Train [6][2030/3239]	Time 0.663 (0.514)	Data 0.001 (0.012)	Loss 5.7783 (5.9043)	Top-1 acc 2.344 (3.148)	Top-5 acc 14.453 (10.699)	lr 0.04760
Warmup Train [6][2040/3239]	Time 0.425 (0.514)	Data 0.001 (0.012)	Loss 5.8668 (5.9042)	Top-1 acc 4.297 (3.150)	Top-5 acc 12.109 (10.702)	lr 0.04760
Warmup Train [6][2050/3239]	Time 0.425 (0.514)	Data 0.001 (0.012)	Loss 5.8506 (5.9039)	Top-1 acc 3.906 (3.153)	Top-5 acc 15.234 (10.715)	lr 0.04759
Warmup Train [6][2060/3239]	Time 0.514 (0.514)	Data 0.001 (0.012)	Loss 5.8108 (5.9037)	Top-1 acc 2.734 (3.154)	Top-5 acc 10.938 (10.720)	lr 0.04759
Warmup Train [6][2070/3239]	Time 0.459 (0.514)	Data 0.001 (0.012)	Loss 5.9328 (5.9034)	Top-1 acc 4.297 (3.156)	Top-5 acc 9.375 (10.727)	lr 0.04759
Warmup Train [6][2080/3239]	Time 0.387 (0.514)	Data 0.001 (0.012)	Loss 5.8850 (5.9032)	Top-1 acc 2.734 (3.156)	Top-5 acc 8.594 (10.731)	lr 0.04759
Warmup Train [6][2090/3239]	Time 0.423 (0.514)	Data 0.001 (0.012)	Loss 5.9186 (5.9028)	Top-1 acc 3.906 (3.162)	Top-5 acc 13.281 (10.738)	lr 0.04758
Warmup Train [6][2100/3239]	Time 0.691 (0.514)	Data 0.001 (0.012)	Loss 5.8787 (5.9025)	Top-1 acc 3.516 (3.164)	Top-5 acc 10.547 (10.744)	lr 0.04758
Warmup Train [6][2110/3239]	Time 0.478 (0.514)	Data 0.001 (0.012)	Loss 5.7898 (5.9021)	Top-1 acc 3.125 (3.166)	Top-5 acc 10.938 (10.753)	lr 0.04758
Warmup Train [6][2120/3239]	Time 0.549 (0.514)	Data 0.002 (0.012)	Loss 5.8460 (5.9017)	Top-1 acc 4.297 (3.171)	Top-5 acc 12.109 (10.766)	lr 0.04758
Warmup Train [6][2130/3239]	Time 0.496 (0.514)	Data 0.001 (0.012)	Loss 5.8272 (5.9014)	Top-1 acc 1.953 (3.170)	Top-5 acc 11.328 (10.768)	lr 0.04757
Warmup Train [6][2140/3239]	Time 0.455 (0.514)	Data 0.001 (0.012)	Loss 5.9846 (5.9012)	Top-1 acc 1.562 (3.172)	Top-5 acc 8.594 (10.773)	lr 0.04757
Warmup Train [6][2150/3239]	Time 0.555 (0.514)	Data 0.001 (0.012)	Loss 5.9238 (5.9011)	Top-1 acc 2.734 (3.174)	Top-5 acc 13.281 (10.777)	lr 0.04757
Warmup Train [6][2160/3239]	Time 0.506 (0.514)	Data 0.001 (0.012)	Loss 5.8483 (5.9010)	Top-1 acc 5.078 (3.175)	Top-5 acc 12.891 (10.776)	lr 0.04756
Warmup Train [6][2170/3239]	Time 0.417 (0.514)	Data 0.001 (0.012)	Loss 5.8669 (5.9005)	Top-1 acc 5.859 (3.179)	Top-5 acc 14.062 (10.784)	lr 0.04756
Warmup Train [6][2180/3239]	Time 0.330 (0.513)	Data 0.001 (0.012)	Loss 5.7457 (5.9002)	Top-1 acc 2.734 (3.182)	Top-5 acc 11.328 (10.791)	lr 0.04756
Warmup Train [6][2190/3239]	Time 0.550 (0.513)	Data 0.002 (0.012)	Loss 5.8814 (5.9000)	Top-1 acc 2.344 (3.181)	Top-5 acc 12.109 (10.795)	lr 0.04756
Warmup Train [6][2200/3239]	Time 0.716 (0.513)	Data 0.001 (0.012)	Loss 5.8969 (5.8996)	Top-1 acc 4.297 (3.184)	Top-5 acc 7.422 (10.800)	lr 0.04755
Warmup Train [6][2210/3239]	Time 0.633 (0.513)	Data 0.001 (0.012)	Loss 5.6907 (5.8995)	Top-1 acc 5.859 (3.187)	Top-5 acc 16.406 (10.809)	lr 0.04755
Warmup Train [6][2220/3239]	Time 0.626 (0.513)	Data 0.001 (0.012)	Loss 5.8766 (5.8992)	Top-1 acc 3.906 (3.190)	Top-5 acc 13.281 (10.814)	lr 0.04755
Warmup Train [6][2230/3239]	Time 0.466 (0.513)	Data 0.001 (0.012)	Loss 5.8045 (5.8989)	Top-1 acc 3.906 (3.192)	Top-5 acc 15.234 (10.822)	lr 0.04755
Warmup Train [6][2240/3239]	Time 0.550 (0.513)	Data 0.001 (0.012)	Loss 5.9868 (5.8988)	Top-1 acc 3.125 (3.195)	Top-5 acc 7.422 (10.825)	lr 0.04754
Warmup Train [6][2250/3239]	Time 0.436 (0.513)	Data 0.001 (0.012)	Loss 5.8602 (5.8985)	Top-1 acc 3.906 (3.197)	Top-5 acc 12.500 (10.836)	lr 0.04754
Warmup Train [6][2260/3239]	Time 0.542 (0.513)	Data 0.001 (0.012)	Loss 5.9016 (5.8984)	Top-1 acc 7.031 (3.200)	Top-5 acc 10.938 (10.840)	lr 0.04754
Warmup Train [6][2270/3239]	Time 0.576 (0.513)	Data 0.001 (0.012)	Loss 5.8531 (5.8980)	Top-1 acc 4.688 (3.208)	Top-5 acc 12.500 (10.850)	lr 0.04754
Warmup Train [6][2280/3239]	Time 0.489 (0.513)	Data 0.001 (0.012)	Loss 5.7828 (5.8978)	Top-1 acc 2.734 (3.211)	Top-5 acc 14.062 (10.855)	lr 0.04753
Warmup Train [6][2290/3239]	Time 0.509 (0.513)	Data 0.001 (0.012)	Loss 5.9493 (5.8977)	Top-1 acc 4.297 (3.213)	Top-5 acc 11.328 (10.860)	lr 0.04753
Warmup Train [6][2300/3239]	Time 0.381 (0.513)	Data 0.001 (0.012)	Loss 5.9001 (5.8975)	Top-1 acc 2.734 (3.215)	Top-5 acc 10.156 (10.868)	lr 0.04753
Warmup Train [6][2310/3239]	Time 0.618 (0.513)	Data 0.001 (0.012)	Loss 5.9092 (5.8973)	Top-1 acc 5.078 (3.221)	Top-5 acc 12.109 (10.875)	lr 0.04753
Warmup Train [6][2320/3239]	Time 0.350 (0.513)	Data 0.001 (0.012)	Loss 5.7809 (5.8971)	Top-1 acc 4.297 (3.224)	Top-5 acc 12.891 (10.879)	lr 0.04752
Warmup Train [6][2330/3239]	Time 0.593 (0.513)	Data 0.001 (0.012)	Loss 5.8003 (5.8968)	Top-1 acc 3.125 (3.227)	Top-5 acc 12.109 (10.886)	lr 0.04752
Warmup Train [6][2340/3239]	Time 0.396 (0.513)	Data 0.001 (0.012)	Loss 5.8208 (5.8965)	Top-1 acc 2.344 (3.227)	Top-5 acc 14.062 (10.890)	lr 0.04752
Warmup Train [6][2350/3239]	Time 0.642 (0.513)	Data 0.001 (0.012)	Loss 5.9397 (5.8962)	Top-1 acc 1.953 (3.229)	Top-5 acc 8.203 (10.892)	lr 0.04751
Warmup Train [6][2360/3239]	Time 0.645 (0.513)	Data 0.001 (0.012)	Loss 5.9630 (5.8960)	Top-1 acc 3.906 (3.231)	Top-5 acc 10.547 (10.897)	lr 0.04751
Warmup Train [6][2370/3239]	Time 0.543 (0.513)	Data 0.001 (0.012)	Loss 5.7172 (5.8956)	Top-1 acc 3.906 (3.237)	Top-5 acc 17.188 (10.909)	lr 0.04751
Warmup Train [6][2380/3239]	Time 0.538 (0.513)	Data 0.001 (0.012)	Loss 5.7930 (5.8954)	Top-1 acc 4.688 (3.237)	Top-5 acc 10.547 (10.915)	lr 0.04751
Warmup Train [6][2390/3239]	Time 0.512 (0.513)	Data 0.001 (0.012)	Loss 5.7343 (5.8951)	Top-1 acc 4.688 (3.241)	Top-5 acc 10.547 (10.917)	lr 0.04750
Warmup Train [6][2400/3239]	Time 0.298 (0.513)	Data 0.001 (0.012)	Loss 5.8180 (5.8948)	Top-1 acc 5.078 (3.247)	Top-5 acc 15.234 (10.928)	lr 0.04750
Warmup Train [6][2410/3239]	Time 0.573 (0.513)	Data 0.001 (0.012)	Loss 5.8161 (5.8945)	Top-1 acc 3.516 (3.249)	Top-5 acc 11.328 (10.934)	lr 0.04750
Warmup Train [6][2420/3239]	Time 0.579 (0.513)	Data 0.001 (0.012)	Loss 5.7665 (5.8944)	Top-1 acc 6.641 (3.252)	Top-5 acc 14.844 (10.937)	lr 0.04750
Warmup Train [6][2430/3239]	Time 0.502 (0.513)	Data 0.001 (0.011)	Loss 5.8492 (5.8941)	Top-1 acc 3.906 (3.255)	Top-5 acc 11.328 (10.945)	lr 0.04749
Warmup Train [6][2440/3239]	Time 0.507 (0.513)	Data 0.001 (0.011)	Loss 5.9169 (5.8939)	Top-1 acc 2.734 (3.256)	Top-5 acc 9.375 (10.952)	lr 0.04749
Warmup Train [6][2450/3239]	Time 0.650 (0.513)	Data 0.001 (0.011)	Loss 5.8460 (5.8935)	Top-1 acc 4.297 (3.262)	Top-5 acc 8.984 (10.958)	lr 0.04749
Warmup Train [6][2460/3239]	Time 0.386 (0.513)	Data 0.001 (0.011)	Loss 5.6919 (5.8933)	Top-1 acc 3.906 (3.263)	Top-5 acc 15.234 (10.962)	lr 0.04749
Warmup Train [6][2470/3239]	Time 0.496 (0.512)	Data 0.001 (0.011)	Loss 5.7483 (5.8929)	Top-1 acc 6.250 (3.268)	Top-5 acc 14.062 (10.970)	lr 0.04748
Warmup Train [6][2480/3239]	Time 0.516 (0.512)	Data 0.001 (0.011)	Loss 5.8756 (5.8928)	Top-1 acc 3.125 (3.268)	Top-5 acc 10.938 (10.973)	lr 0.04748
Warmup Train [6][2490/3239]	Time 0.361 (0.512)	Data 0.001 (0.011)	Loss 5.8815 (5.8925)	Top-1 acc 1.172 (3.269)	Top-5 acc 11.328 (10.980)	lr 0.04748
Warmup Train [6][2500/3239]	Time 0.416 (0.512)	Data 0.001 (0.011)	Loss 5.9114 (5.8923)	Top-1 acc 4.297 (3.271)	Top-5 acc 12.500 (10.986)	lr 0.04748
Warmup Train [6][2510/3239]	Time 0.505 (0.512)	Data 0.001 (0.011)	Loss 5.7955 (5.8921)	Top-1 acc 5.469 (3.272)	Top-5 acc 13.672 (10.988)	lr 0.04747
Warmup Train [6][2520/3239]	Time 0.584 (0.512)	Data 0.001 (0.011)	Loss 5.8480 (5.8918)	Top-1 acc 2.734 (3.274)	Top-5 acc 10.156 (10.991)	lr 0.04747
Warmup Train [6][2530/3239]	Time 0.552 (0.512)	Data 0.001 (0.011)	Loss 5.6782 (5.8916)	Top-1 acc 3.906 (3.275)	Top-5 acc 14.062 (10.992)	lr 0.04747
Warmup Train [6][2540/3239]	Time 0.542 (0.512)	Data 0.001 (0.011)	Loss 5.8609 (5.8915)	Top-1 acc 2.734 (3.277)	Top-5 acc 11.328 (10.991)	lr 0.04746
Warmup Train [6][2550/3239]	Time 0.454 (0.512)	Data 0.001 (0.011)	Loss 5.7694 (5.8912)	Top-1 acc 3.516 (3.278)	Top-5 acc 12.500 (10.994)	lr 0.04746
Warmup Train [6][2560/3239]	Time 0.465 (0.512)	Data 0.001 (0.011)	Loss 5.8505 (5.8910)	Top-1 acc 2.734 (3.279)	Top-5 acc 11.328 (10.997)	lr 0.04746
Warmup Train [6][2570/3239]	Time 0.324 (0.512)	Data 0.001 (0.011)	Loss 5.8468 (5.8906)	Top-1 acc 5.078 (3.283)	Top-5 acc 11.719 (11.004)	lr 0.04746
Warmup Train [6][2580/3239]	Time 0.482 (0.512)	Data 0.001 (0.011)	Loss 5.8578 (5.8904)	Top-1 acc 4.297 (3.285)	Top-5 acc 11.719 (11.008)	lr 0.04745
Warmup Train [6][2590/3239]	Time 0.597 (0.512)	Data 0.001 (0.011)	Loss 5.8650 (5.8901)	Top-1 acc 2.734 (3.288)	Top-5 acc 10.156 (11.016)	lr 0.04745
Warmup Train [6][2600/3239]	Time 0.611 (0.513)	Data 0.001 (0.011)	Loss 5.8622 (5.8899)	Top-1 acc 2.734 (3.290)	Top-5 acc 10.547 (11.021)	lr 0.04745
Warmup Train [6][2610/3239]	Time 0.605 (0.512)	Data 0.001 (0.011)	Loss 5.9030 (5.8897)	Top-1 acc 3.516 (3.290)	Top-5 acc 10.156 (11.025)	lr 0.04745
Warmup Train [6][2620/3239]	Time 0.395 (0.513)	Data 0.001 (0.011)	Loss 5.7735 (5.8894)	Top-1 acc 4.688 (3.291)	Top-5 acc 10.938 (11.033)	lr 0.04744
Warmup Train [6][2630/3239]	Time 0.592 (0.513)	Data 0.001 (0.011)	Loss 5.7940 (5.8890)	Top-1 acc 3.516 (3.292)	Top-5 acc 10.547 (11.038)	lr 0.04744
Warmup Train [6][2640/3239]	Time 0.482 (0.513)	Data 0.001 (0.011)	Loss 5.7775 (5.8886)	Top-1 acc 6.641 (3.298)	Top-5 acc 17.188 (11.049)	lr 0.04744
Warmup Train [6][2650/3239]	Time 0.417 (0.513)	Data 0.001 (0.011)	Loss 5.7706 (5.8884)	Top-1 acc 5.078 (3.301)	Top-5 acc 11.328 (11.055)	lr 0.04744
Warmup Train [6][2660/3239]	Time 0.608 (0.513)	Data 0.001 (0.011)	Loss 5.7483 (5.8882)	Top-1 acc 5.859 (3.302)	Top-5 acc 12.891 (11.058)	lr 0.04743
Warmup Train [6][2670/3239]	Time 0.685 (0.513)	Data 0.001 (0.011)	Loss 5.8516 (5.8881)	Top-1 acc 6.250 (3.302)	Top-5 acc 14.453 (11.058)	lr 0.04743
Warmup Train [6][2680/3239]	Time 0.417 (0.513)	Data 0.001 (0.011)	Loss 5.7608 (5.8878)	Top-1 acc 3.906 (3.304)	Top-5 acc 8.594 (11.060)	lr 0.04743
Warmup Train [6][2690/3239]	Time 0.285 (0.513)	Data 0.001 (0.011)	Loss 5.8662 (5.8875)	Top-1 acc 2.344 (3.306)	Top-5 acc 13.281 (11.066)	lr 0.04742
Warmup Train [6][2700/3239]	Time 0.508 (0.513)	Data 0.001 (0.011)	Loss 5.7926 (5.8873)	Top-1 acc 5.469 (3.310)	Top-5 acc 13.672 (11.073)	lr 0.04742
Warmup Train [6][2710/3239]	Time 0.442 (0.513)	Data 0.001 (0.011)	Loss 5.7126 (5.8872)	Top-1 acc 4.297 (3.312)	Top-5 acc 15.234 (11.078)	lr 0.04742
Warmup Train [6][2720/3239]	Time 0.487 (0.512)	Data 0.001 (0.011)	Loss 5.7883 (5.8869)	Top-1 acc 1.562 (3.313)	Top-5 acc 11.328 (11.084)	lr 0.04742
Warmup Train [6][2730/3239]	Time 0.437 (0.512)	Data 0.001 (0.011)	Loss 5.7675 (5.8866)	Top-1 acc 3.516 (3.313)	Top-5 acc 14.844 (11.091)	lr 0.04741
Warmup Train [6][2740/3239]	Time 0.426 (0.512)	Data 0.001 (0.011)	Loss 5.7094 (5.8864)	Top-1 acc 2.734 (3.312)	Top-5 acc 15.234 (11.094)	lr 0.04741
Warmup Train [6][2750/3239]	Time 0.561 (0.512)	Data 0.001 (0.011)	Loss 5.8713 (5.8862)	Top-1 acc 2.734 (3.316)	Top-5 acc 9.375 (11.098)	lr 0.04741
Warmup Train [6][2760/3239]	Time 0.511 (0.512)	Data 0.001 (0.011)	Loss 5.8416 (5.8860)	Top-1 acc 3.125 (3.319)	Top-5 acc 9.375 (11.103)	lr 0.04741
Warmup Train [6][2770/3239]	Time 0.528 (0.512)	Data 0.001 (0.011)	Loss 5.8083 (5.8856)	Top-1 acc 3.906 (3.320)	Top-5 acc 12.500 (11.110)	lr 0.04740
Warmup Train [6][2780/3239]	Time 0.669 (0.512)	Data 0.001 (0.011)	Loss 5.7364 (5.8855)	Top-1 acc 3.125 (3.321)	Top-5 acc 16.797 (11.116)	lr 0.04740
Warmup Train [6][2790/3239]	Time 0.457 (0.512)	Data 0.001 (0.011)	Loss 5.7054 (5.8852)	Top-1 acc 5.469 (3.324)	Top-5 acc 16.406 (11.123)	lr 0.04740
Warmup Train [6][2800/3239]	Time 0.446 (0.512)	Data 0.001 (0.011)	Loss 5.7140 (5.8849)	Top-1 acc 7.031 (3.327)	Top-5 acc 14.453 (11.128)	lr 0.04739
Warmup Train [6][2810/3239]	Time 0.576 (0.512)	Data 0.001 (0.011)	Loss 5.7822 (5.8848)	Top-1 acc 5.469 (3.329)	Top-5 acc 14.844 (11.132)	lr 0.04739
Warmup Train [6][2820/3239]	Time 0.495 (0.512)	Data 0.001 (0.011)	Loss 5.8516 (5.8846)	Top-1 acc 4.297 (3.331)	Top-5 acc 10.156 (11.136)	lr 0.04739
Warmup Train [6][2830/3239]	Time 0.474 (0.512)	Data 0.001 (0.011)	Loss 5.8641 (5.8845)	Top-1 acc 0.781 (3.330)	Top-5 acc 8.984 (11.136)	lr 0.04739
Warmup Train [6][2840/3239]	Time 0.383 (0.512)	Data 0.001 (0.011)	Loss 5.8467 (5.8843)	Top-1 acc 3.516 (3.332)	Top-5 acc 12.500 (11.137)	lr 0.04738
Warmup Train [6][2850/3239]	Time 0.525 (0.512)	Data 0.001 (0.011)	Loss 5.7080 (5.8841)	Top-1 acc 5.859 (3.336)	Top-5 acc 15.625 (11.141)	lr 0.04738
Warmup Train [6][2860/3239]	Time 0.601 (0.512)	Data 0.002 (0.011)	Loss 5.7861 (5.8838)	Top-1 acc 6.641 (3.338)	Top-5 acc 16.406 (11.149)	lr 0.04738
Warmup Train [6][2870/3239]	Time 0.640 (0.512)	Data 0.001 (0.011)	Loss 5.7680 (5.8835)	Top-1 acc 2.734 (3.340)	Top-5 acc 9.766 (11.152)	lr 0.04738
Warmup Train [6][2880/3239]	Time 0.610 (0.512)	Data 0.001 (0.011)	Loss 5.9009 (5.8832)	Top-1 acc 4.688 (3.342)	Top-5 acc 11.719 (11.160)	lr 0.04737
Warmup Train [6][2890/3239]	Time 0.459 (0.512)	Data 0.001 (0.011)	Loss 5.7154 (5.8829)	Top-1 acc 4.297 (3.341)	Top-5 acc 15.234 (11.165)	lr 0.04737
Warmup Train [6][2900/3239]	Time 0.614 (0.512)	Data 0.001 (0.011)	Loss 5.8448 (5.8826)	Top-1 acc 3.906 (3.345)	Top-5 acc 9.766 (11.171)	lr 0.04737
Warmup Train [6][2910/3239]	Time 0.468 (0.512)	Data 0.001 (0.011)	Loss 5.8490 (5.8824)	Top-1 acc 4.688 (3.347)	Top-5 acc 11.719 (11.176)	lr 0.04737
Warmup Train [6][2920/3239]	Time 0.499 (0.512)	Data 0.001 (0.011)	Loss 5.8870 (5.8822)	Top-1 acc 4.688 (3.348)	Top-5 acc 12.891 (11.179)	lr 0.04736
Warmup Train [6][2930/3239]	Time 0.513 (0.512)	Data 0.001 (0.011)	Loss 5.7871 (5.8821)	Top-1 acc 3.125 (3.349)	Top-5 acc 10.938 (11.182)	lr 0.04736
Warmup Train [6][2940/3239]	Time 0.623 (0.512)	Data 0.001 (0.011)	Loss 5.7981 (5.8818)	Top-1 acc 3.516 (3.352)	Top-5 acc 13.672 (11.191)	lr 0.04736
Warmup Train [6][2950/3239]	Time 0.585 (0.512)	Data 0.001 (0.011)	Loss 5.8743 (5.8816)	Top-1 acc 2.734 (3.351)	Top-5 acc 11.719 (11.195)	lr 0.04735
Warmup Train [6][2960/3239]	Time 0.752 (0.512)	Data 0.001 (0.011)	Loss 5.7978 (5.8813)	Top-1 acc 3.906 (3.353)	Top-5 acc 13.672 (11.203)	lr 0.04735
Warmup Train [6][2970/3239]	Time 0.525 (0.512)	Data 0.001 (0.011)	Loss 5.6768 (5.8810)	Top-1 acc 7.422 (3.359)	Top-5 acc 19.531 (11.209)	lr 0.04735
Warmup Train [6][2980/3239]	Time 0.466 (0.512)	Data 0.001 (0.011)	Loss 5.9144 (5.8807)	Top-1 acc 5.078 (3.363)	Top-5 acc 12.109 (11.216)	lr 0.04735
Warmup Train [6][2990/3239]	Time 0.507 (0.512)	Data 0.001 (0.011)	Loss 5.7426 (5.8803)	Top-1 acc 4.688 (3.365)	Top-5 acc 12.891 (11.225)	lr 0.04734
Warmup Train [6][3000/3239]	Time 0.354 (0.512)	Data 0.001 (0.011)	Loss 5.7699 (5.8801)	Top-1 acc 4.297 (3.366)	Top-5 acc 17.969 (11.229)	lr 0.04734
Warmup Train [6][3010/3239]	Time 0.498 (0.512)	Data 0.001 (0.011)	Loss 5.7635 (5.8799)	Top-1 acc 5.078 (3.370)	Top-5 acc 12.500 (11.231)	lr 0.04734
Warmup Train [6][3020/3239]	Time 0.538 (0.512)	Data 0.001 (0.011)	Loss 5.7255 (5.8796)	Top-1 acc 7.422 (3.374)	Top-5 acc 16.406 (11.238)	lr 0.04734
Warmup Train [6][3030/3239]	Time 0.495 (0.512)	Data 0.001 (0.011)	Loss 5.7758 (5.8793)	Top-1 acc 4.297 (3.378)	Top-5 acc 12.891 (11.244)	lr 0.04733
Warmup Train [6][3040/3239]	Time 0.403 (0.512)	Data 0.001 (0.011)	Loss 5.7369 (5.8789)	Top-1 acc 6.250 (3.380)	Top-5 acc 16.797 (11.251)	lr 0.04733
Warmup Train [6][3050/3239]	Time 0.545 (0.512)	Data 0.001 (0.011)	Loss 5.8262 (5.8788)	Top-1 acc 2.734 (3.381)	Top-5 acc 11.719 (11.253)	lr 0.04733
Warmup Train [6][3060/3239]	Time 0.554 (0.512)	Data 0.001 (0.011)	Loss 5.7017 (5.8786)	Top-1 acc 4.688 (3.385)	Top-5 acc 16.016 (11.261)	lr 0.04732
Warmup Train [6][3070/3239]	Time 0.515 (0.512)	Data 0.001 (0.010)	Loss 5.8763 (5.8783)	Top-1 acc 2.734 (3.387)	Top-5 acc 12.500 (11.265)	lr 0.04732
Warmup Train [6][3080/3239]	Time 0.586 (0.512)	Data 0.001 (0.010)	Loss 5.8759 (5.8781)	Top-1 acc 2.344 (3.388)	Top-5 acc 7.812 (11.268)	lr 0.04732
Warmup Train [6][3090/3239]	Time 0.618 (0.512)	Data 0.001 (0.010)	Loss 5.8316 (5.8778)	Top-1 acc 3.906 (3.391)	Top-5 acc 12.500 (11.274)	lr 0.04732
Warmup Train [6][3100/3239]	Time 0.556 (0.512)	Data 0.001 (0.010)	Loss 5.8049 (5.8775)	Top-1 acc 2.734 (3.393)	Top-5 acc 14.453 (11.281)	lr 0.04731
Warmup Train [6][3110/3239]	Time 0.458 (0.512)	Data 0.001 (0.010)	Loss 5.8828 (5.8774)	Top-1 acc 3.516 (3.394)	Top-5 acc 9.375 (11.285)	lr 0.04731
Warmup Train [6][3120/3239]	Time 0.445 (0.512)	Data 0.001 (0.010)	Loss 5.8507 (5.8772)	Top-1 acc 2.344 (3.397)	Top-5 acc 12.109 (11.290)	lr 0.04731
Warmup Train [6][3130/3239]	Time 0.541 (0.512)	Data 0.001 (0.010)	Loss 5.7838 (5.8769)	Top-1 acc 4.688 (3.398)	Top-5 acc 13.281 (11.297)	lr 0.04731
Warmup Train [6][3140/3239]	Time 0.389 (0.512)	Data 0.001 (0.010)	Loss 5.7713 (5.8766)	Top-1 acc 2.734 (3.402)	Top-5 acc 9.375 (11.304)	lr 0.04730
Warmup Train [6][3150/3239]	Time 0.497 (0.512)	Data 0.001 (0.010)	Loss 5.7472 (5.8765)	Top-1 acc 7.031 (3.405)	Top-5 acc 14.844 (11.308)	lr 0.04730
Warmup Train [6][3160/3239]	Time 0.533 (0.512)	Data 0.001 (0.010)	Loss 5.7464 (5.8763)	Top-1 acc 3.125 (3.407)	Top-5 acc 13.281 (11.311)	lr 0.04730
Warmup Train [6][3170/3239]	Time 0.648 (0.512)	Data 0.001 (0.010)	Loss 5.8320 (5.8760)	Top-1 acc 4.297 (3.410)	Top-5 acc 12.109 (11.319)	lr 0.04729
Warmup Train [6][3180/3239]	Time 0.505 (0.512)	Data 0.000 (0.010)	Loss 5.6948 (5.8758)	Top-1 acc 5.859 (3.413)	Top-5 acc 15.625 (11.324)	lr 0.04729
Warmup Train [6][3190/3239]	Time 0.456 (0.512)	Data 0.000 (0.010)	Loss 5.7360 (5.8755)	Top-1 acc 5.859 (3.416)	Top-5 acc 15.234 (11.330)	lr 0.04729
Warmup Train [6][3200/3239]	Time 0.659 (0.512)	Data 0.000 (0.010)	Loss 5.7989 (5.8752)	Top-1 acc 4.297 (3.421)	Top-5 acc 12.891 (11.336)	lr 0.04729
Warmup Train [6][3210/3239]	Time 0.544 (0.512)	Data 0.000 (0.010)	Loss 5.8321 (5.8752)	Top-1 acc 4.297 (3.424)	Top-5 acc 12.891 (11.338)	lr 0.04728
Warmup Train [6][3220/3239]	Time 0.369 (0.512)	Data 0.000 (0.010)	Loss 5.8961 (5.8751)	Top-1 acc 5.078 (3.426)	Top-5 acc 13.281 (11.344)	lr 0.04728
Warmup Train [6][3230/3239]	Time 0.516 (0.512)	Data 0.000 (0.010)	Loss 5.7453 (5.8749)	Top-1 acc 6.641 (3.428)	Top-5 acc 16.797 (11.350)	lr 0.04728
Warmup Train [6][3239/3239]	Time 0.400 (0.511)	Data 0.000 (0.010)	Loss 5.7325 (5.8748)	Top-1 acc 6.173 (3.430)	Top-5 acc 17.284 (11.353)	lr 0.04728
==========Warmup Valid [6/40]	loss 5.355	top-1 acc 5.312	top-5 acc 16.139	Train top-1 3.430	top-5 11.353	flops: 442.4M
Warmup Train [7][0/3239]	Time 9.086 (9.086)	Data 8.427 (8.427)	Loss 5.8082 (5.8082)	Top-1 acc 3.516 (3.516)	Top-5 acc 10.938 (10.938)	lr 0.04728
Warmup Train [7][10/3239]	Time 0.434 (1.393)	Data 0.001 (0.791)	Loss 5.7583 (5.7827)	Top-1 acc 3.125 (4.616)	Top-5 acc 12.891 (14.062)	lr 0.04727
Warmup Train [7][20/3239]	Time 0.481 (0.972)	Data 0.001 (0.419)	Loss 5.8544 (5.7826)	Top-1 acc 5.469 (4.762)	Top-5 acc 12.109 (13.858)	lr 0.04727
Warmup Train [7][30/3239]	Time 0.538 (0.824)	Data 0.001 (0.284)	Loss 5.7005 (5.7834)	Top-1 acc 5.469 (4.662)	Top-5 acc 14.062 (13.659)	lr 0.04727
Warmup Train [7][40/3239]	Time 0.531 (0.744)	Data 0.001 (0.215)	Loss 5.8043 (5.7860)	Top-1 acc 1.953 (4.421)	Top-5 acc 11.328 (13.386)	lr 0.04726
Warmup Train [7][50/3239]	Time 0.654 (0.696)	Data 0.001 (0.174)	Loss 5.8000 (5.7901)	Top-1 acc 4.297 (4.389)	Top-5 acc 11.719 (13.228)	lr 0.04726
Warmup Train [7][60/3239]	Time 0.481 (0.661)	Data 0.001 (0.145)	Loss 5.8402 (5.7906)	Top-1 acc 4.688 (4.470)	Top-5 acc 13.281 (13.300)	lr 0.04726
Warmup Train [7][70/3239]	Time 0.633 (0.640)	Data 0.001 (0.127)	Loss 5.7588 (5.7899)	Top-1 acc 4.688 (4.451)	Top-5 acc 14.062 (13.215)	lr 0.04726
Warmup Train [7][80/3239]	Time 0.536 (0.624)	Data 0.001 (0.111)	Loss 5.7488 (5.7896)	Top-1 acc 4.297 (4.369)	Top-5 acc 11.719 (13.228)	lr 0.04725
Warmup Train [7][90/3239]	Time 0.574 (0.612)	Data 0.001 (0.100)	Loss 5.7858 (5.7911)	Top-1 acc 5.469 (4.344)	Top-5 acc 11.719 (13.075)	lr 0.04725
Warmup Train [7][100/3239]	Time 0.630 (0.605)	Data 0.002 (0.091)	Loss 5.7425 (5.7937)	Top-1 acc 2.734 (4.285)	Top-5 acc 16.406 (13.161)	lr 0.04725
Warmup Train [7][110/3239]	Time 0.556 (0.596)	Data 0.001 (0.083)	Loss 5.7460 (5.7936)	Top-1 acc 5.469 (4.311)	Top-5 acc 13.281 (13.183)	lr 0.04724
Warmup Train [7][120/3239]	Time 0.510 (0.585)	Data 0.001 (0.076)	Loss 5.6814 (5.7937)	Top-1 acc 5.469 (4.245)	Top-5 acc 14.062 (13.084)	lr 0.04724
Warmup Train [7][130/3239]	Time 0.601 (0.581)	Data 0.001 (0.071)	Loss 5.9060 (5.7938)	Top-1 acc 3.125 (4.219)	Top-5 acc 10.938 (13.076)	lr 0.04724
Warmup Train [7][140/3239]	Time 0.528 (0.572)	Data 0.001 (0.066)	Loss 5.8370 (5.7932)	Top-1 acc 3.125 (4.217)	Top-5 acc 14.062 (13.132)	lr 0.04724
Warmup Train [7][150/3239]	Time 0.548 (0.567)	Data 0.001 (0.062)	Loss 5.7465 (5.7929)	Top-1 acc 4.688 (4.178)	Top-5 acc 14.062 (13.144)	lr 0.04723
Warmup Train [7][160/3239]	Time 0.426 (0.560)	Data 0.001 (0.058)	Loss 5.7879 (5.7932)	Top-1 acc 2.344 (4.185)	Top-5 acc 12.109 (13.155)	lr 0.04723
Warmup Train [7][170/3239]	Time 0.556 (0.560)	Data 0.001 (0.055)	Loss 5.8003 (5.7917)	Top-1 acc 3.906 (4.235)	Top-5 acc 13.672 (13.245)	lr 0.04723
Warmup Train [7][180/3239]	Time 0.585 (0.556)	Data 0.001 (0.053)	Loss 5.6635 (5.7901)	Top-1 acc 4.297 (4.260)	Top-5 acc 12.500 (13.260)	lr 0.04723
Warmup Train [7][190/3239]	Time 0.356 (0.552)	Data 0.001 (0.050)	Loss 5.8015 (5.7910)	Top-1 acc 4.297 (4.276)	Top-5 acc 10.938 (13.271)	lr 0.04722
Warmup Train [7][200/3239]	Time 0.408 (0.551)	Data 0.001 (0.048)	Loss 5.8456 (5.7916)	Top-1 acc 5.078 (4.287)	Top-5 acc 11.719 (13.305)	lr 0.04722
Warmup Train [7][210/3239]	Time 0.482 (0.549)	Data 0.001 (0.046)	Loss 5.8194 (5.7918)	Top-1 acc 5.469 (4.295)	Top-5 acc 12.891 (13.265)	lr 0.04722
Warmup Train [7][220/3239]	Time 0.673 (0.547)	Data 0.001 (0.045)	Loss 5.8696 (5.7928)	Top-1 acc 5.469 (4.315)	Top-5 acc 11.719 (13.258)	lr 0.04721
Warmup Train [7][230/3239]	Time 0.609 (0.546)	Data 0.001 (0.043)	Loss 5.7120 (5.7904)	Top-1 acc 4.297 (4.312)	Top-5 acc 14.844 (13.266)	lr 0.04721
Warmup Train [7][240/3239]	Time 0.568 (0.545)	Data 0.001 (0.041)	Loss 5.7182 (5.7897)	Top-1 acc 3.125 (4.295)	Top-5 acc 14.062 (13.262)	lr 0.04721
Warmup Train [7][250/3239]	Time 0.651 (0.544)	Data 0.001 (0.040)	Loss 5.8678 (5.7895)	Top-1 acc 5.078 (4.297)	Top-5 acc 11.719 (13.249)	lr 0.04721
Warmup Train [7][260/3239]	Time 0.347 (0.542)	Data 0.001 (0.038)	Loss 5.6740 (5.7890)	Top-1 acc 4.297 (4.280)	Top-5 acc 16.797 (13.256)	lr 0.04720
Warmup Train [7][270/3239]	Time 0.516 (0.542)	Data 0.001 (0.037)	Loss 5.8704 (5.7895)	Top-1 acc 3.125 (4.249)	Top-5 acc 12.891 (13.241)	lr 0.04720
Warmup Train [7][280/3239]	Time 0.496 (0.541)	Data 0.001 (0.037)	Loss 5.7498 (5.7899)	Top-1 acc 6.250 (4.244)	Top-5 acc 16.406 (13.246)	lr 0.04720
Warmup Train [7][290/3239]	Time 0.505 (0.540)	Data 0.001 (0.035)	Loss 5.7704 (5.7907)	Top-1 acc 3.906 (4.228)	Top-5 acc 16.406 (13.236)	lr 0.04719
Warmup Train [7][300/3239]	Time 0.378 (0.540)	Data 0.001 (0.035)	Loss 5.8776 (5.7910)	Top-1 acc 3.125 (4.214)	Top-5 acc 10.938 (13.194)	lr 0.04719
Warmup Train [7][310/3239]	Time 0.523 (0.540)	Data 0.001 (0.034)	Loss 5.6918 (5.7901)	Top-1 acc 6.641 (4.225)	Top-5 acc 14.062 (13.197)	lr 0.04719
Warmup Train [7][320/3239]	Time 0.367 (0.538)	Data 0.001 (0.033)	Loss 5.7283 (5.7899)	Top-1 acc 5.078 (4.237)	Top-5 acc 12.109 (13.223)	lr 0.04719
Warmup Train [7][330/3239]	Time 0.562 (0.537)	Data 0.001 (0.033)	Loss 5.8315 (5.7905)	Top-1 acc 2.734 (4.251)	Top-5 acc 9.375 (13.205)	lr 0.04718
Warmup Train [7][340/3239]	Time 0.586 (0.536)	Data 0.001 (0.032)	Loss 5.8108 (5.7901)	Top-1 acc 4.688 (4.263)	Top-5 acc 13.281 (13.224)	lr 0.04718
Warmup Train [7][350/3239]	Time 0.609 (0.535)	Data 0.001 (0.031)	Loss 5.6952 (5.7897)	Top-1 acc 5.859 (4.267)	Top-5 acc 14.844 (13.226)	lr 0.04718
Warmup Train [7][360/3239]	Time 0.677 (0.535)	Data 0.001 (0.030)	Loss 5.7319 (5.7898)	Top-1 acc 6.250 (4.273)	Top-5 acc 13.672 (13.213)	lr 0.04718
Warmup Train [7][370/3239]	Time 0.639 (0.534)	Data 0.001 (0.030)	Loss 5.7013 (5.7894)	Top-1 acc 3.516 (4.280)	Top-5 acc 10.547 (13.202)	lr 0.04717
Warmup Train [7][380/3239]	Time 0.327 (0.532)	Data 0.001 (0.029)	Loss 5.7476 (5.7893)	Top-1 acc 3.906 (4.277)	Top-5 acc 13.281 (13.209)	lr 0.04717
Warmup Train [7][390/3239]	Time 0.570 (0.532)	Data 0.001 (0.029)	Loss 5.8046 (5.7893)	Top-1 acc 5.859 (4.286)	Top-5 acc 12.891 (13.241)	lr 0.04717
Warmup Train [7][400/3239]	Time 0.492 (0.530)	Data 0.001 (0.028)	Loss 5.7764 (5.7885)	Top-1 acc 4.297 (4.296)	Top-5 acc 11.719 (13.246)	lr 0.04716
Warmup Train [7][410/3239]	Time 0.436 (0.529)	Data 0.001 (0.027)	Loss 5.7520 (5.7882)	Top-1 acc 3.906 (4.279)	Top-5 acc 13.672 (13.259)	lr 0.04716
Warmup Train [7][420/3239]	Time 0.483 (0.527)	Data 0.001 (0.027)	Loss 5.7610 (5.7881)	Top-1 acc 4.688 (4.282)	Top-5 acc 11.719 (13.265)	lr 0.04716
Warmup Train [7][430/3239]	Time 0.478 (0.526)	Data 0.001 (0.026)	Loss 5.8367 (5.7884)	Top-1 acc 3.906 (4.283)	Top-5 acc 12.500 (13.236)	lr 0.04716
Warmup Train [7][440/3239]	Time 0.523 (0.526)	Data 0.001 (0.026)	Loss 5.7796 (5.7881)	Top-1 acc 3.125 (4.283)	Top-5 acc 10.938 (13.230)	lr 0.04715
Warmup Train [7][450/3239]	Time 0.350 (0.526)	Data 0.040 (0.025)	Loss 5.7575 (5.7875)	Top-1 acc 4.297 (4.286)	Top-5 acc 11.328 (13.235)	lr 0.04715
Warmup Train [7][460/3239]	Time 0.555 (0.526)	Data 0.001 (0.025)	Loss 5.8740 (5.7876)	Top-1 acc 4.297 (4.286)	Top-5 acc 13.672 (13.235)	lr 0.04715
Warmup Train [7][470/3239]	Time 0.483 (0.526)	Data 0.001 (0.025)	Loss 5.7168 (5.7871)	Top-1 acc 5.078 (4.284)	Top-5 acc 13.281 (13.241)	lr 0.04714
Warmup Train [7][480/3239]	Time 0.640 (0.526)	Data 0.001 (0.025)	Loss 5.7238 (5.7860)	Top-1 acc 3.516 (4.290)	Top-5 acc 17.578 (13.242)	lr 0.04714
Warmup Train [7][490/3239]	Time 0.422 (0.526)	Data 0.001 (0.024)	Loss 5.7075 (5.7859)	Top-1 acc 4.297 (4.295)	Top-5 acc 14.844 (13.244)	lr 0.04714
Warmup Train [7][500/3239]	Time 0.480 (0.526)	Data 0.001 (0.024)	Loss 5.8448 (5.7855)	Top-1 acc 3.516 (4.289)	Top-5 acc 12.891 (13.247)	lr 0.04714
Warmup Train [7][510/3239]	Time 0.446 (0.526)	Data 0.001 (0.023)	Loss 5.7853 (5.7850)	Top-1 acc 4.297 (4.285)	Top-5 acc 14.453 (13.256)	lr 0.04713
Warmup Train [7][520/3239]	Time 0.446 (0.526)	Data 0.001 (0.023)	Loss 5.8511 (5.7851)	Top-1 acc 3.125 (4.282)	Top-5 acc 12.109 (13.261)	lr 0.04713
Warmup Train [7][530/3239]	Time 0.415 (0.525)	Data 0.001 (0.023)	Loss 5.8151 (5.7864)	Top-1 acc 3.125 (4.278)	Top-5 acc 14.062 (13.236)	lr 0.04713
Warmup Train [7][540/3239]	Time 0.507 (0.525)	Data 0.001 (0.023)	Loss 5.8240 (5.7862)	Top-1 acc 3.125 (4.274)	Top-5 acc 12.891 (13.248)	lr 0.04712
Warmup Train [7][550/3239]	Time 0.541 (0.525)	Data 0.001 (0.023)	Loss 5.7076 (5.7862)	Top-1 acc 4.688 (4.262)	Top-5 acc 14.453 (13.239)	lr 0.04712
Warmup Train [7][560/3239]	Time 0.446 (0.524)	Data 0.001 (0.022)	Loss 5.7009 (5.7862)	Top-1 acc 5.078 (4.266)	Top-5 acc 15.234 (13.251)	lr 0.04712
Warmup Train [7][570/3239]	Time 0.439 (0.524)	Data 0.001 (0.022)	Loss 5.8088 (5.7856)	Top-1 acc 3.906 (4.263)	Top-5 acc 14.844 (13.268)	lr 0.04712
Warmup Train [7][580/3239]	Time 0.543 (0.524)	Data 0.001 (0.022)	Loss 5.7562 (5.7855)	Top-1 acc 3.906 (4.255)	Top-5 acc 10.547 (13.262)	lr 0.04711
Warmup Train [7][590/3239]	Time 0.735 (0.524)	Data 0.001 (0.021)	Loss 5.7689 (5.7852)	Top-1 acc 4.297 (4.259)	Top-5 acc 12.109 (13.262)	lr 0.04711
Warmup Train [7][600/3239]	Time 0.542 (0.524)	Data 0.001 (0.021)	Loss 5.8752 (5.7855)	Top-1 acc 3.906 (4.267)	Top-5 acc 11.719 (13.266)	lr 0.04711
Warmup Train [7][610/3239]	Time 0.511 (0.524)	Data 0.001 (0.021)	Loss 5.7898 (5.7853)	Top-1 acc 3.516 (4.266)	Top-5 acc 14.062 (13.261)	lr 0.04710
Warmup Train [7][620/3239]	Time 0.384 (0.524)	Data 0.001 (0.021)	Loss 5.7711 (5.7847)	Top-1 acc 4.297 (4.268)	Top-5 acc 14.453 (13.278)	lr 0.04710
Warmup Train [7][630/3239]	Time 0.485 (0.524)	Data 0.001 (0.020)	Loss 5.8057 (5.7845)	Top-1 acc 4.297 (4.262)	Top-5 acc 12.500 (13.267)	lr 0.04710
Warmup Train [7][640/3239]	Time 0.334 (0.523)	Data 0.001 (0.020)	Loss 5.8079 (5.7846)	Top-1 acc 3.906 (4.258)	Top-5 acc 11.719 (13.266)	lr 0.04710
Warmup Train [7][650/3239]	Time 0.534 (0.523)	Data 0.001 (0.020)	Loss 5.8061 (5.7847)	Top-1 acc 4.688 (4.257)	Top-5 acc 10.938 (13.264)	lr 0.04709
Warmup Train [7][660/3239]	Time 0.449 (0.523)	Data 0.001 (0.020)	Loss 5.6676 (5.7847)	Top-1 acc 4.688 (4.258)	Top-5 acc 14.844 (13.266)	lr 0.04709
Warmup Train [7][670/3239]	Time 0.478 (0.522)	Data 0.001 (0.020)	Loss 5.7621 (5.7844)	Top-1 acc 4.688 (4.257)	Top-5 acc 14.844 (13.268)	lr 0.04709
Warmup Train [7][680/3239]	Time 0.508 (0.522)	Data 0.001 (0.019)	Loss 5.7211 (5.7846)	Top-1 acc 5.469 (4.255)	Top-5 acc 16.406 (13.261)	lr 0.04709
Warmup Train [7][690/3239]	Time 0.557 (0.521)	Data 0.001 (0.019)	Loss 5.8287 (5.7839)	Top-1 acc 3.516 (4.250)	Top-5 acc 10.938 (13.271)	lr 0.04708
Warmup Train [7][700/3239]	Time 0.478 (0.521)	Data 0.001 (0.019)	Loss 5.8483 (5.7832)	Top-1 acc 2.734 (4.255)	Top-5 acc 14.844 (13.293)	lr 0.04708
Warmup Train [7][710/3239]	Time 0.592 (0.521)	Data 0.001 (0.019)	Loss 5.5998 (5.7827)	Top-1 acc 8.203 (4.267)	Top-5 acc 17.969 (13.300)	lr 0.04708
Warmup Train [7][720/3239]	Time 0.521 (0.520)	Data 0.001 (0.019)	Loss 5.8901 (5.7831)	Top-1 acc 3.125 (4.261)	Top-5 acc 10.547 (13.299)	lr 0.04707
Warmup Train [7][730/3239]	Time 0.354 (0.520)	Data 0.001 (0.019)	Loss 5.8902 (5.7833)	Top-1 acc 6.250 (4.277)	Top-5 acc 12.109 (13.306)	lr 0.04707
Warmup Train [7][740/3239]	Time 0.497 (0.521)	Data 0.001 (0.019)	Loss 5.9449 (5.7832)	Top-1 acc 5.078 (4.278)	Top-5 acc 12.500 (13.308)	lr 0.04707
Warmup Train [7][750/3239]	Time 0.604 (0.521)	Data 0.001 (0.018)	Loss 5.6756 (5.7823)	Top-1 acc 6.641 (4.288)	Top-5 acc 15.234 (13.324)	lr 0.04707
Warmup Train [7][760/3239]	Time 0.543 (0.521)	Data 0.001 (0.018)	Loss 5.8405 (5.7824)	Top-1 acc 3.516 (4.288)	Top-5 acc 10.547 (13.312)	lr 0.04706
Warmup Train [7][770/3239]	Time 0.512 (0.521)	Data 0.001 (0.018)	Loss 5.8408 (5.7818)	Top-1 acc 4.297 (4.281)	Top-5 acc 13.281 (13.325)	lr 0.04706
Warmup Train [7][780/3239]	Time 0.425 (0.520)	Data 0.001 (0.018)	Loss 5.7262 (5.7814)	Top-1 acc 5.078 (4.283)	Top-5 acc 14.062 (13.329)	lr 0.04706
Warmup Train [7][790/3239]	Time 0.403 (0.520)	Data 0.001 (0.018)	Loss 5.7899 (5.7810)	Top-1 acc 2.734 (4.283)	Top-5 acc 15.625 (13.335)	lr 0.04705
Warmup Train [7][800/3239]	Time 0.573 (0.520)	Data 0.001 (0.018)	Loss 5.6634 (5.7805)	Top-1 acc 2.734 (4.278)	Top-5 acc 16.797 (13.347)	lr 0.04705
Warmup Train [7][810/3239]	Time 0.424 (0.520)	Data 0.001 (0.018)	Loss 5.7896 (5.7798)	Top-1 acc 3.906 (4.273)	Top-5 acc 11.719 (13.360)	lr 0.04705
Warmup Train [7][820/3239]	Time 0.606 (0.520)	Data 0.001 (0.017)	Loss 5.6966 (5.7797)	Top-1 acc 2.734 (4.277)	Top-5 acc 12.109 (13.363)	lr 0.04705
Warmup Train [7][830/3239]	Time 0.490 (0.520)	Data 0.001 (0.017)	Loss 5.7988 (5.7793)	Top-1 acc 2.344 (4.278)	Top-5 acc 11.328 (13.367)	lr 0.04704
Warmup Train [7][840/3239]	Time 0.359 (0.520)	Data 0.002 (0.017)	Loss 5.7328 (5.7790)	Top-1 acc 3.516 (4.285)	Top-5 acc 12.500 (13.372)	lr 0.04704
Warmup Train [7][850/3239]	Time 0.355 (0.519)	Data 0.001 (0.017)	Loss 5.7375 (5.7785)	Top-1 acc 4.297 (4.292)	Top-5 acc 17.578 (13.390)	lr 0.04704
Warmup Train [7][860/3239]	Time 0.609 (0.520)	Data 0.001 (0.017)	Loss 5.8469 (5.7781)	Top-1 acc 5.859 (4.296)	Top-5 acc 13.672 (13.401)	lr 0.04703
Warmup Train [7][870/3239]	Time 0.504 (0.519)	Data 0.001 (0.017)	Loss 5.7533 (5.7774)	Top-1 acc 3.906 (4.302)	Top-5 acc 12.109 (13.411)	lr 0.04703
Warmup Train [7][880/3239]	Time 0.372 (0.519)	Data 0.001 (0.017)	Loss 5.6773 (5.7773)	Top-1 acc 5.078 (4.315)	Top-5 acc 16.016 (13.424)	lr 0.04703
Warmup Train [7][890/3239]	Time 0.588 (0.519)	Data 0.001 (0.017)	Loss 5.7122 (5.7773)	Top-1 acc 6.250 (4.310)	Top-5 acc 16.406 (13.424)	lr 0.04703
Warmup Train [7][900/3239]	Time 0.625 (0.520)	Data 0.001 (0.017)	Loss 5.6791 (5.7770)	Top-1 acc 3.906 (4.309)	Top-5 acc 18.750 (13.437)	lr 0.04702
Warmup Train [7][910/3239]	Time 0.271 (0.519)	Data 0.001 (0.016)	Loss 5.6110 (5.7763)	Top-1 acc 6.641 (4.313)	Top-5 acc 17.969 (13.451)	lr 0.04702
Warmup Train [7][920/3239]	Time 0.519 (0.519)	Data 0.001 (0.016)	Loss 5.7896 (5.7757)	Top-1 acc 3.516 (4.320)	Top-5 acc 13.672 (13.465)	lr 0.04702
Warmup Train [7][930/3239]	Time 0.392 (0.519)	Data 0.001 (0.016)	Loss 5.7168 (5.7750)	Top-1 acc 5.078 (4.325)	Top-5 acc 11.719 (13.475)	lr 0.04701
Warmup Train [7][940/3239]	Time 0.511 (0.518)	Data 0.001 (0.016)	Loss 5.7594 (5.7748)	Top-1 acc 3.516 (4.330)	Top-5 acc 13.281 (13.485)	lr 0.04701
Warmup Train [7][950/3239]	Time 0.331 (0.518)	Data 0.001 (0.016)	Loss 5.8028 (5.7746)	Top-1 acc 2.734 (4.331)	Top-5 acc 12.109 (13.487)	lr 0.04701
Warmup Train [7][960/3239]	Time 0.464 (0.517)	Data 0.001 (0.016)	Loss 5.8100 (5.7749)	Top-1 acc 3.906 (4.331)	Top-5 acc 14.062 (13.488)	lr 0.04701
Warmup Train [7][970/3239]	Time 0.493 (0.517)	Data 0.001 (0.016)	Loss 5.8198 (5.7748)	Top-1 acc 5.078 (4.327)	Top-5 acc 13.672 (13.477)	lr 0.04700
Warmup Train [7][980/3239]	Time 0.474 (0.517)	Data 0.001 (0.016)	Loss 5.7176 (5.7747)	Top-1 acc 5.469 (4.332)	Top-5 acc 13.672 (13.478)	lr 0.04700
Warmup Train [7][990/3239]	Time 0.492 (0.517)	Data 0.001 (0.016)	Loss 5.5630 (5.7743)	Top-1 acc 7.422 (4.335)	Top-5 acc 18.750 (13.483)	lr 0.04700
Warmup Train [7][1000/3239]	Time 0.607 (0.518)	Data 0.001 (0.016)	Loss 5.8110 (5.7741)	Top-1 acc 3.516 (4.329)	Top-5 acc 12.500 (13.484)	lr 0.04699
Warmup Train [7][1010/3239]	Time 0.552 (0.517)	Data 0.001 (0.016)	Loss 5.8061 (5.7737)	Top-1 acc 1.953 (4.324)	Top-5 acc 10.156 (13.481)	lr 0.04699
Warmup Train [7][1020/3239]	Time 0.526 (0.517)	Data 0.001 (0.016)	Loss 5.8389 (5.7736)	Top-1 acc 3.906 (4.331)	Top-5 acc 12.500 (13.491)	lr 0.04699
Warmup Train [7][1030/3239]	Time 0.624 (0.517)	Data 0.001 (0.016)	Loss 5.8443 (5.7731)	Top-1 acc 3.906 (4.332)	Top-5 acc 13.672 (13.495)	lr 0.04698
Warmup Train [7][1040/3239]	Time 0.573 (0.517)	Data 0.001 (0.015)	Loss 5.6965 (5.7728)	Top-1 acc 5.859 (4.333)	Top-5 acc 13.672 (13.504)	lr 0.04698
Warmup Train [7][1050/3239]	Time 0.609 (0.517)	Data 0.001 (0.015)	Loss 5.7265 (5.7722)	Top-1 acc 3.906 (4.336)	Top-5 acc 14.453 (13.515)	lr 0.04698
Warmup Train [7][1060/3239]	Time 0.595 (0.517)	Data 0.001 (0.015)	Loss 5.6432 (5.7718)	Top-1 acc 7.812 (4.335)	Top-5 acc 17.188 (13.521)	lr 0.04698
Warmup Train [7][1070/3239]	Time 0.597 (0.517)	Data 0.001 (0.015)	Loss 5.8052 (5.7716)	Top-1 acc 6.641 (4.337)	Top-5 acc 15.234 (13.525)	lr 0.04697
Warmup Train [7][1080/3239]	Time 0.563 (0.517)	Data 0.001 (0.015)	Loss 5.7412 (5.7715)	Top-1 acc 3.516 (4.334)	Top-5 acc 14.062 (13.519)	lr 0.04697
Warmup Train [7][1090/3239]	Time 0.590 (0.518)	Data 0.001 (0.015)	Loss 5.8226 (5.7716)	Top-1 acc 3.125 (4.338)	Top-5 acc 12.500 (13.523)	lr 0.04697
Warmup Train [7][1100/3239]	Time 0.456 (0.517)	Data 0.001 (0.015)	Loss 5.6648 (5.7717)	Top-1 acc 5.469 (4.339)	Top-5 acc 17.969 (13.524)	lr 0.04696
Warmup Train [7][1110/3239]	Time 0.640 (0.517)	Data 0.001 (0.015)	Loss 5.8382 (5.7717)	Top-1 acc 3.125 (4.343)	Top-5 acc 12.500 (13.532)	lr 0.04696
Warmup Train [7][1120/3239]	Time 0.657 (0.518)	Data 0.001 (0.015)	Loss 5.7134 (5.7713)	Top-1 acc 6.250 (4.346)	Top-5 acc 15.625 (13.543)	lr 0.04696
Warmup Train [7][1130/3239]	Time 0.579 (0.517)	Data 0.001 (0.014)	Loss 5.7211 (5.7709)	Top-1 acc 3.906 (4.349)	Top-5 acc 16.016 (13.551)	lr 0.04696
Warmup Train [7][1140/3239]	Time 0.625 (0.517)	Data 0.002 (0.014)	Loss 5.7295 (5.7709)	Top-1 acc 3.516 (4.347)	Top-5 acc 13.281 (13.554)	lr 0.04695
Warmup Train [7][1150/3239]	Time 0.702 (0.518)	Data 0.001 (0.014)	Loss 5.7182 (5.7705)	Top-1 acc 5.859 (4.353)	Top-5 acc 14.844 (13.573)	lr 0.04695
Warmup Train [7][1160/3239]	Time 0.559 (0.517)	Data 0.001 (0.014)	Loss 5.6975 (5.7699)	Top-1 acc 2.344 (4.352)	Top-5 acc 14.453 (13.594)	lr 0.04695
Warmup Train [7][1170/3239]	Time 0.661 (0.517)	Data 0.001 (0.014)	Loss 5.7195 (5.7699)	Top-1 acc 6.250 (4.352)	Top-5 acc 16.016 (13.594)	lr 0.04694
Warmup Train [7][1180/3239]	Time 0.608 (0.517)	Data 0.001 (0.014)	Loss 5.7650 (5.7700)	Top-1 acc 4.297 (4.354)	Top-5 acc 12.891 (13.595)	lr 0.04694
Warmup Train [7][1190/3239]	Time 0.539 (0.517)	Data 0.001 (0.014)	Loss 5.7283 (5.7699)	Top-1 acc 4.688 (4.353)	Top-5 acc 12.500 (13.595)	lr 0.04694
Warmup Train [7][1200/3239]	Time 0.530 (0.517)	Data 0.001 (0.014)	Loss 5.6993 (5.7698)	Top-1 acc 5.078 (4.352)	Top-5 acc 15.625 (13.600)	lr 0.04694
Warmup Train [7][1210/3239]	Time 0.442 (0.517)	Data 0.001 (0.014)	Loss 5.6868 (5.7694)	Top-1 acc 5.469 (4.358)	Top-5 acc 16.016 (13.608)	lr 0.04693
Warmup Train [7][1220/3239]	Time 0.396 (0.516)	Data 0.001 (0.014)	Loss 5.9140 (5.7690)	Top-1 acc 1.953 (4.356)	Top-5 acc 10.547 (13.612)	lr 0.04693
Warmup Train [7][1230/3239]	Time 0.461 (0.516)	Data 0.001 (0.014)	Loss 5.7866 (5.7689)	Top-1 acc 5.859 (4.352)	Top-5 acc 11.719 (13.615)	lr 0.04693
Warmup Train [7][1240/3239]	Time 0.570 (0.516)	Data 0.001 (0.014)	Loss 5.7448 (5.7686)	Top-1 acc 6.250 (4.359)	Top-5 acc 15.234 (13.625)	lr 0.04692
Warmup Train [7][1250/3239]	Time 0.395 (0.516)	Data 0.001 (0.013)	Loss 5.7286 (5.7683)	Top-1 acc 5.078 (4.361)	Top-5 acc 18.359 (13.631)	lr 0.04692
Warmup Train [7][1260/3239]	Time 0.598 (0.516)	Data 0.001 (0.013)	Loss 5.7591 (5.7680)	Top-1 acc 3.125 (4.361)	Top-5 acc 8.594 (13.637)	lr 0.04692
Warmup Train [7][1270/3239]	Time 0.556 (0.516)	Data 0.001 (0.013)	Loss 5.7862 (5.7676)	Top-1 acc 3.516 (4.368)	Top-5 acc 13.281 (13.654)	lr 0.04692
Warmup Train [7][1280/3239]	Time 0.530 (0.516)	Data 0.001 (0.013)	Loss 5.6817 (5.7675)	Top-1 acc 5.078 (4.368)	Top-5 acc 12.891 (13.655)	lr 0.04691
Warmup Train [7][1290/3239]	Time 0.503 (0.516)	Data 0.001 (0.013)	Loss 5.6662 (5.7672)	Top-1 acc 4.297 (4.369)	Top-5 acc 13.281 (13.657)	lr 0.04691
Warmup Train [7][1300/3239]	Time 0.695 (0.516)	Data 0.001 (0.013)	Loss 5.6747 (5.7671)	Top-1 acc 3.125 (4.367)	Top-5 acc 15.625 (13.653)	lr 0.04691
Warmup Train [7][1310/3239]	Time 0.549 (0.516)	Data 0.001 (0.013)	Loss 5.8715 (5.7667)	Top-1 acc 2.344 (4.364)	Top-5 acc 7.422 (13.655)	lr 0.04690
Warmup Train [7][1320/3239]	Time 0.545 (0.516)	Data 0.001 (0.013)	Loss 5.6505 (5.7664)	Top-1 acc 6.250 (4.371)	Top-5 acc 12.891 (13.657)	lr 0.04690
Warmup Train [7][1330/3239]	Time 0.648 (0.516)	Data 0.001 (0.013)	Loss 5.7295 (5.7661)	Top-1 acc 2.734 (4.372)	Top-5 acc 12.500 (13.662)	lr 0.04690
Warmup Train [7][1340/3239]	Time 0.550 (0.516)	Data 0.001 (0.013)	Loss 5.6586 (5.7659)	Top-1 acc 4.688 (4.371)	Top-5 acc 14.453 (13.668)	lr 0.04689
Warmup Train [7][1350/3239]	Time 0.489 (0.516)	Data 0.001 (0.013)	Loss 5.8845 (5.7656)	Top-1 acc 3.906 (4.378)	Top-5 acc 12.891 (13.670)	lr 0.04689
Warmup Train [7][1360/3239]	Time 0.610 (0.516)	Data 0.001 (0.013)	Loss 5.7765 (5.7650)	Top-1 acc 3.906 (4.386)	Top-5 acc 13.672 (13.680)	lr 0.04689
Warmup Train [7][1370/3239]	Time 0.421 (0.516)	Data 0.001 (0.013)	Loss 5.7243 (5.7649)	Top-1 acc 7.031 (4.387)	Top-5 acc 15.625 (13.680)	lr 0.04689
Warmup Train [7][1380/3239]	Time 0.484 (0.516)	Data 0.001 (0.013)	Loss 5.8201 (5.7648)	Top-1 acc 2.734 (4.386)	Top-5 acc 10.547 (13.684)	lr 0.04688
Warmup Train [7][1390/3239]	Time 0.519 (0.516)	Data 0.001 (0.013)	Loss 5.6594 (5.7647)	Top-1 acc 5.859 (4.387)	Top-5 acc 14.062 (13.690)	lr 0.04688
Warmup Train [7][1400/3239]	Time 0.511 (0.516)	Data 0.001 (0.013)	Loss 5.6261 (5.7641)	Top-1 acc 6.250 (4.389)	Top-5 acc 15.625 (13.696)	lr 0.04688
Warmup Train [7][1410/3239]	Time 0.547 (0.516)	Data 0.001 (0.012)	Loss 5.7682 (5.7638)	Top-1 acc 5.859 (4.393)	Top-5 acc 14.453 (13.701)	lr 0.04687
Warmup Train [7][1420/3239]	Time 0.608 (0.515)	Data 0.001 (0.012)	Loss 5.7342 (5.7635)	Top-1 acc 5.859 (4.397)	Top-5 acc 14.453 (13.710)	lr 0.04687
Warmup Train [7][1430/3239]	Time 0.443 (0.515)	Data 0.001 (0.012)	Loss 5.7732 (5.7628)	Top-1 acc 7.422 (4.400)	Top-5 acc 16.016 (13.721)	lr 0.04687
Warmup Train [7][1440/3239]	Time 0.465 (0.515)	Data 0.001 (0.012)	Loss 5.7386 (5.7625)	Top-1 acc 7.031 (4.405)	Top-5 acc 16.406 (13.731)	lr 0.04687
Warmup Train [7][1450/3239]	Time 0.577 (0.515)	Data 0.001 (0.012)	Loss 5.7169 (5.7622)	Top-1 acc 5.469 (4.412)	Top-5 acc 14.453 (13.745)	lr 0.04686
Warmup Train [7][1460/3239]	Time 0.492 (0.515)	Data 0.001 (0.012)	Loss 5.6886 (5.7619)	Top-1 acc 3.125 (4.411)	Top-5 acc 13.672 (13.750)	lr 0.04686
Warmup Train [7][1470/3239]	Time 0.475 (0.515)	Data 0.001 (0.012)	Loss 5.6866 (5.7616)	Top-1 acc 5.469 (4.415)	Top-5 acc 16.797 (13.754)	lr 0.04686
Warmup Train [7][1480/3239]	Time 0.620 (0.515)	Data 0.001 (0.012)	Loss 5.6696 (5.7613)	Top-1 acc 7.422 (4.416)	Top-5 acc 16.797 (13.759)	lr 0.04685
Warmup Train [7][1490/3239]	Time 0.564 (0.515)	Data 0.001 (0.012)	Loss 5.6902 (5.7609)	Top-1 acc 5.469 (4.426)	Top-5 acc 17.188 (13.771)	lr 0.04685
Warmup Train [7][1500/3239]	Time 0.533 (0.515)	Data 0.001 (0.012)	Loss 5.8504 (5.7608)	Top-1 acc 2.344 (4.427)	Top-5 acc 11.328 (13.774)	lr 0.04685
Warmup Train [7][1510/3239]	Time 0.408 (0.515)	Data 0.001 (0.012)	Loss 5.7139 (5.7606)	Top-1 acc 4.297 (4.431)	Top-5 acc 14.844 (13.782)	lr 0.04684
Warmup Train [7][1520/3239]	Time 0.436 (0.515)	Data 0.001 (0.012)	Loss 5.7317 (5.7604)	Top-1 acc 5.469 (4.432)	Top-5 acc 13.281 (13.786)	lr 0.04684
Warmup Train [7][1530/3239]	Time 0.532 (0.515)	Data 0.001 (0.012)	Loss 5.7305 (5.7602)	Top-1 acc 7.031 (4.436)	Top-5 acc 16.406 (13.793)	lr 0.04684
Warmup Train [7][1540/3239]	Time 0.614 (0.515)	Data 0.001 (0.012)	Loss 5.7647 (5.7600)	Top-1 acc 4.297 (4.437)	Top-5 acc 15.234 (13.801)	lr 0.04684
Warmup Train [7][1550/3239]	Time 0.527 (0.515)	Data 0.001 (0.012)	Loss 5.7406 (5.7595)	Top-1 acc 2.734 (4.443)	Top-5 acc 12.109 (13.810)	lr 0.04683
Warmup Train [7][1560/3239]	Time 0.575 (0.515)	Data 0.001 (0.012)	Loss 5.6940 (5.7590)	Top-1 acc 7.031 (4.444)	Top-5 acc 17.188 (13.820)	lr 0.04683
Warmup Train [7][1570/3239]	Time 0.528 (0.515)	Data 0.001 (0.012)	Loss 5.6867 (5.7589)	Top-1 acc 6.641 (4.444)	Top-5 acc 17.969 (13.822)	lr 0.04683
Warmup Train [7][1580/3239]	Time 0.474 (0.515)	Data 0.001 (0.012)	Loss 5.7755 (5.7588)	Top-1 acc 3.516 (4.446)	Top-5 acc 13.672 (13.824)	lr 0.04682
Warmup Train [7][1590/3239]	Time 0.346 (0.515)	Data 0.001 (0.012)	Loss 5.7802 (5.7587)	Top-1 acc 3.125 (4.450)	Top-5 acc 12.109 (13.825)	lr 0.04682
Warmup Train [7][1600/3239]	Time 0.530 (0.515)	Data 0.001 (0.012)	Loss 5.8226 (5.7585)	Top-1 acc 3.516 (4.454)	Top-5 acc 12.109 (13.829)	lr 0.04682
Warmup Train [7][1610/3239]	Time 0.534 (0.515)	Data 0.001 (0.012)	Loss 5.7275 (5.7583)	Top-1 acc 4.297 (4.456)	Top-5 acc 14.844 (13.831)	lr 0.04682
Warmup Train [7][1620/3239]	Time 0.687 (0.515)	Data 0.001 (0.012)	Loss 5.6631 (5.7579)	Top-1 acc 5.469 (4.458)	Top-5 acc 11.719 (13.835)	lr 0.04681
Warmup Train [7][1630/3239]	Time 0.565 (0.515)	Data 0.001 (0.012)	Loss 5.6861 (5.7578)	Top-1 acc 5.078 (4.458)	Top-5 acc 16.406 (13.840)	lr 0.04681
Warmup Train [7][1640/3239]	Time 0.655 (0.515)	Data 0.001 (0.012)	Loss 5.6610 (5.7574)	Top-1 acc 6.641 (4.463)	Top-5 acc 19.531 (13.854)	lr 0.04681
Warmup Train [7][1650/3239]	Time 0.418 (0.515)	Data 0.001 (0.012)	Loss 5.6667 (5.7572)	Top-1 acc 5.078 (4.463)	Top-5 acc 16.016 (13.858)	lr 0.04680
Warmup Train [7][1660/3239]	Time 0.507 (0.515)	Data 0.001 (0.012)	Loss 5.7574 (5.7569)	Top-1 acc 2.344 (4.463)	Top-5 acc 13.672 (13.863)	lr 0.04680
Warmup Train [7][1670/3239]	Time 0.637 (0.515)	Data 0.001 (0.012)	Loss 5.8082 (5.7569)	Top-1 acc 4.688 (4.461)	Top-5 acc 15.625 (13.867)	lr 0.04680
Warmup Train [7][1680/3239]	Time 0.556 (0.515)	Data 0.001 (0.011)	Loss 5.7528 (5.7565)	Top-1 acc 4.297 (4.467)	Top-5 acc 13.281 (13.878)	lr 0.04679
Warmup Train [7][1690/3239]	Time 0.553 (0.515)	Data 0.001 (0.011)	Loss 5.7133 (5.7561)	Top-1 acc 3.906 (4.473)	Top-5 acc 16.797 (13.886)	lr 0.04679
Warmup Train [7][1700/3239]	Time 0.514 (0.515)	Data 0.001 (0.011)	Loss 5.7963 (5.7562)	Top-1 acc 3.125 (4.470)	Top-5 acc 11.328 (13.885)	lr 0.04679
Warmup Train [7][1710/3239]	Time 0.300 (0.515)	Data 0.001 (0.011)	Loss 5.7733 (5.7559)	Top-1 acc 3.125 (4.471)	Top-5 acc 11.719 (13.884)	lr 0.04679
Warmup Train [7][1720/3239]	Time 0.535 (0.515)	Data 0.001 (0.011)	Loss 5.7265 (5.7556)	Top-1 acc 5.078 (4.474)	Top-5 acc 12.891 (13.890)	lr 0.04678
Warmup Train [7][1730/3239]	Time 0.485 (0.515)	Data 0.001 (0.011)	Loss 5.6629 (5.7554)	Top-1 acc 3.125 (4.470)	Top-5 acc 14.844 (13.888)	lr 0.04678
Warmup Train [7][1740/3239]	Time 0.263 (0.515)	Data 0.001 (0.011)	Loss 5.8238 (5.7553)	Top-1 acc 2.344 (4.468)	Top-5 acc 11.719 (13.890)	lr 0.04678
Warmup Train [7][1750/3239]	Time 0.353 (0.514)	Data 0.001 (0.011)	Loss 5.7345 (5.7553)	Top-1 acc 6.250 (4.470)	Top-5 acc 12.500 (13.889)	lr 0.04677
Warmup Train [7][1760/3239]	Time 0.427 (0.514)	Data 0.001 (0.011)	Loss 5.6674 (5.7552)	Top-1 acc 5.078 (4.469)	Top-5 acc 14.453 (13.887)	lr 0.04677
Warmup Train [7][1770/3239]	Time 0.540 (0.514)	Data 0.001 (0.011)	Loss 5.7536 (5.7549)	Top-1 acc 7.031 (4.472)	Top-5 acc 17.188 (13.898)	lr 0.04677
Warmup Train [7][1780/3239]	Time 0.478 (0.514)	Data 0.001 (0.011)	Loss 5.7635 (5.7547)	Top-1 acc 5.078 (4.475)	Top-5 acc 14.453 (13.903)	lr 0.04676
Warmup Train [7][1790/3239]	Time 0.429 (0.514)	Data 0.001 (0.011)	Loss 5.7791 (5.7545)	Top-1 acc 3.516 (4.473)	Top-5 acc 12.500 (13.907)	lr 0.04676
Warmup Train [7][1800/3239]	Time 0.641 (0.514)	Data 0.001 (0.011)	Loss 5.7337 (5.7542)	Top-1 acc 3.906 (4.475)	Top-5 acc 12.891 (13.913)	lr 0.04676
Warmup Train [7][1810/3239]	Time 0.424 (0.514)	Data 0.001 (0.011)	Loss 5.7815 (5.7540)	Top-1 acc 5.078 (4.475)	Top-5 acc 12.500 (13.917)	lr 0.04676
Warmup Train [7][1820/3239]	Time 0.486 (0.514)	Data 0.001 (0.011)	Loss 5.6653 (5.7536)	Top-1 acc 5.469 (4.482)	Top-5 acc 15.625 (13.927)	lr 0.04675
Warmup Train [7][1830/3239]	Time 0.611 (0.514)	Data 0.001 (0.011)	Loss 5.8037 (5.7533)	Top-1 acc 3.516 (4.484)	Top-5 acc 16.797 (13.936)	lr 0.04675
Warmup Train [7][1840/3239]	Time 0.513 (0.514)	Data 0.001 (0.011)	Loss 5.7360 (5.7530)	Top-1 acc 1.562 (4.482)	Top-5 acc 13.672 (13.939)	lr 0.04675
Warmup Train [7][1850/3239]	Time 0.560 (0.514)	Data 0.001 (0.011)	Loss 5.6673 (5.7527)	Top-1 acc 3.906 (4.485)	Top-5 acc 14.062 (13.941)	lr 0.04674
Warmup Train [7][1860/3239]	Time 0.700 (0.514)	Data 0.001 (0.011)	Loss 5.6429 (5.7525)	Top-1 acc 3.906 (4.487)	Top-5 acc 17.969 (13.945)	lr 0.04674
Warmup Train [7][1870/3239]	Time 0.511 (0.515)	Data 0.001 (0.011)	Loss 5.5948 (5.7523)	Top-1 acc 6.250 (4.490)	Top-5 acc 18.359 (13.950)	lr 0.04674
Warmup Train [7][1880/3239]	Time 0.500 (0.515)	Data 0.001 (0.011)	Loss 5.8507 (5.7522)	Top-1 acc 6.641 (4.492)	Top-5 acc 10.547 (13.947)	lr 0.04673
Warmup Train [7][1890/3239]	Time 0.585 (0.515)	Data 0.001 (0.011)	Loss 5.7011 (5.7519)	Top-1 acc 4.297 (4.497)	Top-5 acc 12.891 (13.948)	lr 0.04673
Warmup Train [7][1900/3239]	Time 0.523 (0.515)	Data 0.001 (0.011)	Loss 5.6278 (5.7516)	Top-1 acc 4.688 (4.502)	Top-5 acc 19.922 (13.957)	lr 0.04673
Warmup Train [7][1910/3239]	Time 0.485 (0.514)	Data 0.001 (0.011)	Loss 5.7594 (5.7515)	Top-1 acc 5.859 (4.503)	Top-5 acc 14.453 (13.964)	lr 0.04673
Warmup Train [7][1920/3239]	Time 0.599 (0.515)	Data 0.001 (0.011)	Loss 5.6715 (5.7513)	Top-1 acc 4.297 (4.506)	Top-5 acc 15.625 (13.969)	lr 0.04672
Warmup Train [7][1930/3239]	Time 0.534 (0.515)	Data 0.001 (0.011)	Loss 5.6316 (5.7511)	Top-1 acc 4.297 (4.507)	Top-5 acc 16.406 (13.971)	lr 0.04672
Warmup Train [7][1940/3239]	Time 0.406 (0.515)	Data 0.001 (0.011)	Loss 5.7007 (5.7511)	Top-1 acc 4.688 (4.510)	Top-5 acc 17.188 (13.977)	lr 0.04672
Warmup Train [7][1950/3239]	Time 0.508 (0.515)	Data 0.002 (0.011)	Loss 5.7327 (5.7510)	Top-1 acc 6.641 (4.513)	Top-5 acc 17.188 (13.978)	lr 0.04671
Warmup Train [7][1960/3239]	Time 0.421 (0.515)	Data 0.001 (0.011)	Loss 5.6835 (5.7508)	Top-1 acc 6.250 (4.516)	Top-5 acc 15.625 (13.983)	lr 0.04671
Warmup Train [7][1970/3239]	Time 0.634 (0.515)	Data 0.001 (0.011)	Loss 5.8813 (5.7509)	Top-1 acc 2.734 (4.515)	Top-5 acc 10.547 (13.982)	lr 0.04671
Warmup Train [7][1980/3239]	Time 0.355 (0.515)	Data 0.001 (0.011)	Loss 5.7601 (5.7507)	Top-1 acc 4.688 (4.515)	Top-5 acc 12.109 (13.985)	lr 0.04670
Warmup Train [7][1990/3239]	Time 0.414 (0.515)	Data 0.001 (0.011)	Loss 5.7541 (5.7506)	Top-1 acc 4.688 (4.514)	Top-5 acc 13.672 (13.987)	lr 0.04670
Warmup Train [7][2000/3239]	Time 0.494 (0.515)	Data 0.001 (0.011)	Loss 5.7908 (5.7504)	Top-1 acc 4.688 (4.516)	Top-5 acc 10.547 (13.987)	lr 0.04670
Warmup Train [7][2010/3239]	Time 0.471 (0.515)	Data 0.001 (0.011)	Loss 5.8629 (5.7504)	Top-1 acc 3.516 (4.516)	Top-5 acc 12.891 (13.986)	lr 0.04670
Warmup Train [7][2020/3239]	Time 0.759 (0.514)	Data 0.001 (0.011)	Loss 5.7377 (5.7502)	Top-1 acc 4.297 (4.517)	Top-5 acc 12.891 (13.988)	lr 0.04669
Warmup Train [7][2030/3239]	Time 0.581 (0.514)	Data 0.001 (0.011)	Loss 5.6128 (5.7501)	Top-1 acc 6.250 (4.518)	Top-5 acc 14.062 (13.991)	lr 0.04669
Warmup Train [7][2040/3239]	Time 0.461 (0.514)	Data 0.001 (0.011)	Loss 5.7652 (5.7499)	Top-1 acc 3.125 (4.518)	Top-5 acc 14.453 (13.998)	lr 0.04669
Warmup Train [7][2050/3239]	Time 0.411 (0.514)	Data 0.001 (0.011)	Loss 5.6944 (5.7497)	Top-1 acc 5.078 (4.520)	Top-5 acc 15.625 (14.003)	lr 0.04668
Warmup Train [7][2060/3239]	Time 0.484 (0.514)	Data 0.001 (0.011)	Loss 5.7919 (5.7495)	Top-1 acc 5.469 (4.521)	Top-5 acc 13.281 (14.004)	lr 0.04668
Warmup Train [7][2070/3239]	Time 0.368 (0.514)	Data 0.001 (0.011)	Loss 5.6949 (5.7492)	Top-1 acc 6.250 (4.524)	Top-5 acc 14.453 (14.006)	lr 0.04668
Warmup Train [7][2080/3239]	Time 0.380 (0.514)	Data 0.001 (0.011)	Loss 5.6068 (5.7489)	Top-1 acc 7.422 (4.529)	Top-5 acc 16.016 (14.009)	lr 0.04667
Warmup Train [7][2090/3239]	Time 0.337 (0.514)	Data 0.001 (0.011)	Loss 5.7787 (5.7487)	Top-1 acc 5.078 (4.529)	Top-5 acc 12.500 (14.011)	lr 0.04667
Warmup Train [7][2100/3239]	Time 0.608 (0.515)	Data 0.001 (0.011)	Loss 5.5583 (5.7485)	Top-1 acc 7.031 (4.529)	Top-5 acc 17.578 (14.011)	lr 0.04667
Warmup Train [7][2110/3239]	Time 0.465 (0.514)	Data 0.001 (0.011)	Loss 5.7301 (5.7481)	Top-1 acc 4.688 (4.530)	Top-5 acc 12.109 (14.014)	lr 0.04667
Warmup Train [7][2120/3239]	Time 0.520 (0.515)	Data 0.001 (0.011)	Loss 5.6655 (5.7479)	Top-1 acc 3.906 (4.535)	Top-5 acc 15.234 (14.022)	lr 0.04666
Warmup Train [7][2130/3239]	Time 0.551 (0.515)	Data 0.001 (0.011)	Loss 5.6998 (5.7475)	Top-1 acc 4.297 (4.538)	Top-5 acc 16.406 (14.030)	lr 0.04666
Warmup Train [7][2140/3239]	Time 0.506 (0.515)	Data 0.001 (0.011)	Loss 5.5789 (5.7473)	Top-1 acc 7.031 (4.540)	Top-5 acc 19.531 (14.033)	lr 0.04666
Warmup Train [7][2150/3239]	Time 0.610 (0.515)	Data 0.001 (0.011)	Loss 5.6402 (5.7472)	Top-1 acc 5.078 (4.544)	Top-5 acc 14.062 (14.033)	lr 0.04665
Warmup Train [7][2160/3239]	Time 0.689 (0.515)	Data 0.001 (0.011)	Loss 5.7818 (5.7470)	Top-1 acc 5.469 (4.548)	Top-5 acc 14.062 (14.045)	lr 0.04665
Warmup Train [7][2170/3239]	Time 0.380 (0.515)	Data 0.001 (0.011)	Loss 5.7168 (5.7469)	Top-1 acc 5.078 (4.552)	Top-5 acc 16.016 (14.048)	lr 0.04665
Warmup Train [7][2180/3239]	Time 0.586 (0.515)	Data 0.001 (0.011)	Loss 5.7387 (5.7467)	Top-1 acc 4.688 (4.552)	Top-5 acc 14.453 (14.052)	lr 0.04664
Warmup Train [7][2190/3239]	Time 0.422 (0.515)	Data 0.001 (0.011)	Loss 5.6426 (5.7465)	Top-1 acc 4.297 (4.554)	Top-5 acc 18.750 (14.058)	lr 0.04664
Warmup Train [7][2200/3239]	Time 0.511 (0.515)	Data 0.001 (0.011)	Loss 5.6970 (5.7461)	Top-1 acc 3.516 (4.557)	Top-5 acc 17.188 (14.067)	lr 0.04664
Warmup Train [7][2210/3239]	Time 0.478 (0.515)	Data 0.001 (0.011)	Loss 5.6749 (5.7458)	Top-1 acc 7.031 (4.558)	Top-5 acc 17.578 (14.072)	lr 0.04664
Warmup Train [7][2220/3239]	Time 0.474 (0.515)	Data 0.001 (0.011)	Loss 5.8563 (5.7456)	Top-1 acc 5.859 (4.561)	Top-5 acc 14.453 (14.080)	lr 0.04663
Warmup Train [7][2230/3239]	Time 0.586 (0.515)	Data 0.001 (0.011)	Loss 5.7411 (5.7456)	Top-1 acc 5.469 (4.560)	Top-5 acc 16.797 (14.082)	lr 0.04663
Warmup Train [7][2240/3239]	Time 0.464 (0.515)	Data 0.001 (0.011)	Loss 5.6934 (5.7454)	Top-1 acc 5.078 (4.560)	Top-5 acc 13.672 (14.080)	lr 0.04663
Warmup Train [7][2250/3239]	Time 0.478 (0.515)	Data 0.001 (0.011)	Loss 5.6836 (5.7452)	Top-1 acc 5.078 (4.562)	Top-5 acc 12.109 (14.087)	lr 0.04662
Warmup Train [7][2260/3239]	Time 0.401 (0.515)	Data 0.001 (0.011)	Loss 5.5933 (5.7448)	Top-1 acc 3.906 (4.562)	Top-5 acc 13.672 (14.090)	lr 0.04662
Warmup Train [7][2270/3239]	Time 0.512 (0.515)	Data 0.001 (0.011)	Loss 5.6393 (5.7446)	Top-1 acc 4.297 (4.564)	Top-5 acc 19.922 (14.100)	lr 0.04662
Warmup Train [7][2280/3239]	Time 0.585 (0.514)	Data 0.001 (0.010)	Loss 5.6728 (5.7443)	Top-1 acc 2.734 (4.568)	Top-5 acc 12.891 (14.106)	lr 0.04661
Warmup Train [7][2290/3239]	Time 0.474 (0.514)	Data 0.001 (0.010)	Loss 5.6960 (5.7442)	Top-1 acc 6.250 (4.569)	Top-5 acc 15.625 (14.112)	lr 0.04661
Warmup Train [7][2300/3239]	Time 0.606 (0.514)	Data 0.001 (0.010)	Loss 5.6558 (5.7437)	Top-1 acc 4.688 (4.575)	Top-5 acc 17.188 (14.130)	lr 0.04661
Warmup Train [7][2310/3239]	Time 0.459 (0.514)	Data 0.001 (0.010)	Loss 5.7466 (5.7434)	Top-1 acc 3.125 (4.580)	Top-5 acc 11.328 (14.139)	lr 0.04661
Warmup Train [7][2320/3239]	Time 0.477 (0.514)	Data 0.001 (0.010)	Loss 5.7361 (5.7430)	Top-1 acc 5.469 (4.583)	Top-5 acc 17.188 (14.146)	lr 0.04660
Warmup Train [7][2330/3239]	Time 0.555 (0.514)	Data 0.001 (0.010)	Loss 5.6797 (5.7427)	Top-1 acc 5.859 (4.589)	Top-5 acc 14.844 (14.151)	lr 0.04660
Warmup Train [7][2340/3239]	Time 0.741 (0.514)	Data 0.001 (0.010)	Loss 5.7857 (5.7426)	Top-1 acc 4.297 (4.591)	Top-5 acc 12.500 (14.153)	lr 0.04660
Warmup Train [7][2350/3239]	Time 0.500 (0.514)	Data 0.001 (0.010)	Loss 5.6598 (5.7424)	Top-1 acc 2.734 (4.589)	Top-5 acc 13.672 (14.153)	lr 0.04659
Warmup Train [7][2360/3239]	Time 0.488 (0.514)	Data 0.001 (0.010)	Loss 5.6583 (5.7421)	Top-1 acc 4.297 (4.591)	Top-5 acc 12.109 (14.154)	lr 0.04659
Warmup Train [7][2370/3239]	Time 0.514 (0.515)	Data 0.001 (0.010)	Loss 5.6443 (5.7419)	Top-1 acc 4.688 (4.591)	Top-5 acc 12.500 (14.155)	lr 0.04659
Warmup Train [7][2380/3239]	Time 0.458 (0.514)	Data 0.001 (0.010)	Loss 5.7914 (5.7417)	Top-1 acc 5.078 (4.593)	Top-5 acc 12.109 (14.157)	lr 0.04658
Warmup Train [7][2390/3239]	Time 0.715 (0.515)	Data 0.001 (0.010)	Loss 5.5792 (5.7415)	Top-1 acc 3.906 (4.596)	Top-5 acc 17.578 (14.165)	lr 0.04658
Warmup Train [7][2400/3239]	Time 0.310 (0.514)	Data 0.001 (0.010)	Loss 5.7182 (5.7413)	Top-1 acc 5.078 (4.599)	Top-5 acc 13.672 (14.166)	lr 0.04658
Warmup Train [7][2410/3239]	Time 0.557 (0.515)	Data 0.001 (0.010)	Loss 5.7603 (5.7410)	Top-1 acc 5.859 (4.602)	Top-5 acc 12.500 (14.172)	lr 0.04657
Warmup Train [7][2420/3239]	Time 0.564 (0.515)	Data 0.001 (0.010)	Loss 5.6900 (5.7408)	Top-1 acc 5.078 (4.606)	Top-5 acc 15.625 (14.173)	lr 0.04657
Warmup Train [7][2430/3239]	Time 0.545 (0.515)	Data 0.001 (0.010)	Loss 5.6899 (5.7408)	Top-1 acc 5.859 (4.606)	Top-5 acc 13.281 (14.171)	lr 0.04657
Warmup Train [7][2440/3239]	Time 0.407 (0.515)	Data 0.001 (0.010)	Loss 5.7475 (5.7409)	Top-1 acc 6.641 (4.608)	Top-5 acc 17.188 (14.171)	lr 0.04657
Warmup Train [7][2450/3239]	Time 0.503 (0.515)	Data 0.001 (0.010)	Loss 5.6764 (5.7407)	Top-1 acc 5.078 (4.610)	Top-5 acc 13.672 (14.173)	lr 0.04656
Warmup Train [7][2460/3239]	Time 0.542 (0.515)	Data 0.002 (0.010)	Loss 5.4847 (5.7401)	Top-1 acc 8.594 (4.618)	Top-5 acc 21.094 (14.185)	lr 0.04656
Warmup Train [7][2470/3239]	Time 0.616 (0.515)	Data 0.001 (0.010)	Loss 5.6228 (5.7400)	Top-1 acc 4.688 (4.618)	Top-5 acc 16.797 (14.188)	lr 0.04656
Warmup Train [7][2480/3239]	Time 0.689 (0.515)	Data 0.001 (0.010)	Loss 5.6414 (5.7397)	Top-1 acc 7.812 (4.620)	Top-5 acc 17.578 (14.192)	lr 0.04655
Warmup Train [7][2490/3239]	Time 0.497 (0.515)	Data 0.001 (0.010)	Loss 5.6494 (5.7394)	Top-1 acc 5.078 (4.621)	Top-5 acc 17.188 (14.196)	lr 0.04655
Warmup Train [7][2500/3239]	Time 0.472 (0.515)	Data 0.001 (0.010)	Loss 5.6145 (5.7391)	Top-1 acc 4.688 (4.621)	Top-5 acc 15.234 (14.201)	lr 0.04655
Warmup Train [7][2510/3239]	Time 0.383 (0.515)	Data 0.001 (0.010)	Loss 5.7196 (5.7388)	Top-1 acc 4.688 (4.625)	Top-5 acc 15.234 (14.204)	lr 0.04654
Warmup Train [7][2520/3239]	Time 0.368 (0.514)	Data 0.001 (0.010)	Loss 5.7299 (5.7386)	Top-1 acc 2.344 (4.625)	Top-5 acc 12.109 (14.209)	lr 0.04654
Warmup Train [7][2530/3239]	Time 0.491 (0.514)	Data 0.029 (0.010)	Loss 5.7763 (5.7384)	Top-1 acc 4.688 (4.625)	Top-5 acc 12.891 (14.211)	lr 0.04654
Warmup Train [7][2540/3239]	Time 0.680 (0.514)	Data 0.001 (0.010)	Loss 5.6876 (5.7382)	Top-1 acc 5.859 (4.628)	Top-5 acc 20.312 (14.215)	lr 0.04653
Warmup Train [7][2550/3239]	Time 0.475 (0.514)	Data 0.001 (0.010)	Loss 5.7700 (5.7381)	Top-1 acc 5.469 (4.628)	Top-5 acc 13.281 (14.217)	lr 0.04653
Warmup Train [7][2560/3239]	Time 0.363 (0.514)	Data 0.001 (0.010)	Loss 5.5452 (5.7378)	Top-1 acc 6.641 (4.630)	Top-5 acc 17.969 (14.225)	lr 0.04653
Warmup Train [7][2570/3239]	Time 0.626 (0.514)	Data 0.001 (0.010)	Loss 5.6641 (5.7374)	Top-1 acc 5.078 (4.634)	Top-5 acc 15.625 (14.231)	lr 0.04653
Warmup Train [7][2580/3239]	Time 0.708 (0.514)	Data 0.001 (0.010)	Loss 5.6526 (5.7370)	Top-1 acc 4.688 (4.638)	Top-5 acc 17.578 (14.239)	lr 0.04652
Warmup Train [7][2590/3239]	Time 0.605 (0.514)	Data 0.001 (0.010)	Loss 5.6767 (5.7368)	Top-1 acc 7.031 (4.641)	Top-5 acc 14.844 (14.242)	lr 0.04652
Warmup Train [7][2600/3239]	Time 0.364 (0.514)	Data 0.001 (0.010)	Loss 5.6345 (5.7366)	Top-1 acc 7.422 (4.644)	Top-5 acc 17.969 (14.253)	lr 0.04652
Warmup Train [7][2610/3239]	Time 0.657 (0.514)	Data 0.001 (0.010)	Loss 5.7241 (5.7363)	Top-1 acc 4.297 (4.644)	Top-5 acc 15.625 (14.256)	lr 0.04651
Warmup Train [7][2620/3239]	Time 0.394 (0.514)	Data 0.001 (0.010)	Loss 5.7433 (5.7361)	Top-1 acc 4.297 (4.646)	Top-5 acc 15.234 (14.264)	lr 0.04651
Warmup Train [7][2630/3239]	Time 0.642 (0.514)	Data 0.001 (0.010)	Loss 5.5615 (5.7359)	Top-1 acc 6.250 (4.646)	Top-5 acc 16.797 (14.268)	lr 0.04651
Warmup Train [7][2640/3239]	Time 0.430 (0.514)	Data 0.001 (0.010)	Loss 5.6613 (5.7356)	Top-1 acc 3.125 (4.647)	Top-5 acc 14.844 (14.269)	lr 0.04650
Warmup Train [7][2650/3239]	Time 0.505 (0.514)	Data 0.001 (0.010)	Loss 5.6214 (5.7353)	Top-1 acc 6.250 (4.650)	Top-5 acc 14.062 (14.274)	lr 0.04650
Warmup Train [7][2660/3239]	Time 0.559 (0.514)	Data 0.002 (0.010)	Loss 5.6715 (5.7351)	Top-1 acc 6.250 (4.651)	Top-5 acc 14.844 (14.280)	lr 0.04650
Warmup Train [7][2670/3239]	Time 0.440 (0.514)	Data 0.001 (0.010)	Loss 5.7091 (5.7349)	Top-1 acc 5.078 (4.652)	Top-5 acc 14.062 (14.283)	lr 0.04649
Warmup Train [7][2680/3239]	Time 0.529 (0.515)	Data 0.001 (0.010)	Loss 5.5689 (5.7346)	Top-1 acc 8.984 (4.655)	Top-5 acc 16.406 (14.287)	lr 0.04649
Warmup Train [7][2690/3239]	Time 0.524 (0.515)	Data 0.001 (0.010)	Loss 5.7121 (5.7345)	Top-1 acc 3.516 (4.655)	Top-5 acc 11.719 (14.288)	lr 0.04649
Warmup Train [7][2700/3239]	Time 0.598 (0.515)	Data 0.001 (0.010)	Loss 5.6733 (5.7344)	Top-1 acc 6.641 (4.656)	Top-5 acc 16.016 (14.292)	lr 0.04649
Warmup Train [7][2710/3239]	Time 0.448 (0.515)	Data 0.001 (0.010)	Loss 5.6812 (5.7342)	Top-1 acc 3.906 (4.657)	Top-5 acc 17.188 (14.296)	lr 0.04648
Warmup Train [7][2720/3239]	Time 0.489 (0.515)	Data 0.001 (0.010)	Loss 5.6536 (5.7340)	Top-1 acc 3.906 (4.660)	Top-5 acc 17.969 (14.299)	lr 0.04648
Warmup Train [7][2730/3239]	Time 0.564 (0.515)	Data 0.001 (0.010)	Loss 5.7382 (5.7339)	Top-1 acc 7.812 (4.661)	Top-5 acc 13.672 (14.302)	lr 0.04648
Warmup Train [7][2740/3239]	Time 0.650 (0.515)	Data 0.001 (0.010)	Loss 5.8168 (5.7338)	Top-1 acc 3.906 (4.663)	Top-5 acc 13.281 (14.301)	lr 0.04647
Warmup Train [7][2750/3239]	Time 0.514 (0.515)	Data 0.001 (0.010)	Loss 5.6246 (5.7336)	Top-1 acc 4.688 (4.664)	Top-5 acc 17.969 (14.305)	lr 0.04647
Warmup Train [7][2760/3239]	Time 0.498 (0.514)	Data 0.001 (0.010)	Loss 5.5925 (5.7333)	Top-1 acc 3.516 (4.666)	Top-5 acc 16.406 (14.310)	lr 0.04647
Warmup Train [7][2770/3239]	Time 0.583 (0.514)	Data 0.001 (0.010)	Loss 5.6921 (5.7329)	Top-1 acc 4.688 (4.668)	Top-5 acc 14.844 (14.317)	lr 0.04646
Warmup Train [7][2780/3239]	Time 0.564 (0.514)	Data 0.001 (0.010)	Loss 5.5845 (5.7325)	Top-1 acc 5.469 (4.669)	Top-5 acc 19.141 (14.322)	lr 0.04646
Warmup Train [7][2790/3239]	Time 0.398 (0.514)	Data 0.001 (0.010)	Loss 5.7790 (5.7324)	Top-1 acc 3.516 (4.670)	Top-5 acc 11.328 (14.322)	lr 0.04646
Warmup Train [7][2800/3239]	Time 0.530 (0.514)	Data 0.001 (0.010)	Loss 5.7399 (5.7322)	Top-1 acc 5.078 (4.671)	Top-5 acc 14.062 (14.323)	lr 0.04645
Warmup Train [7][2810/3239]	Time 0.413 (0.514)	Data 0.001 (0.010)	Loss 5.5065 (5.7319)	Top-1 acc 8.203 (4.675)	Top-5 acc 19.531 (14.334)	lr 0.04645
Warmup Train [7][2820/3239]	Time 0.665 (0.514)	Data 0.001 (0.010)	Loss 5.6210 (5.7317)	Top-1 acc 3.125 (4.675)	Top-5 acc 13.672 (14.338)	lr 0.04645
Warmup Train [7][2830/3239]	Time 0.465 (0.514)	Data 0.001 (0.010)	Loss 5.7129 (5.7315)	Top-1 acc 3.906 (4.676)	Top-5 acc 12.500 (14.343)	lr 0.04644
Warmup Train [7][2840/3239]	Time 0.552 (0.514)	Data 0.001 (0.010)	Loss 5.6298 (5.7313)	Top-1 acc 4.297 (4.675)	Top-5 acc 12.500 (14.346)	lr 0.04644
Warmup Train [7][2850/3239]	Time 0.526 (0.514)	Data 0.001 (0.010)	Loss 5.6102 (5.7311)	Top-1 acc 5.469 (4.677)	Top-5 acc 17.969 (14.353)	lr 0.04644
Warmup Train [7][2860/3239]	Time 0.629 (0.514)	Data 0.001 (0.010)	Loss 5.7087 (5.7308)	Top-1 acc 4.688 (4.678)	Top-5 acc 15.234 (14.362)	lr 0.04644
Warmup Train [7][2870/3239]	Time 0.661 (0.514)	Data 0.001 (0.010)	Loss 5.7161 (5.7307)	Top-1 acc 3.125 (4.678)	Top-5 acc 15.234 (14.364)	lr 0.04643
Warmup Train [7][2880/3239]	Time 0.603 (0.514)	Data 0.001 (0.010)	Loss 5.6502 (5.7305)	Top-1 acc 6.250 (4.680)	Top-5 acc 17.578 (14.367)	lr 0.04643
Warmup Train [7][2890/3239]	Time 0.497 (0.514)	Data 0.001 (0.010)	Loss 5.6641 (5.7303)	Top-1 acc 4.688 (4.681)	Top-5 acc 14.062 (14.371)	lr 0.04643
Warmup Train [7][2900/3239]	Time 0.532 (0.514)	Data 0.001 (0.010)	Loss 5.7981 (5.7300)	Top-1 acc 5.078 (4.685)	Top-5 acc 16.797 (14.382)	lr 0.04642
Warmup Train [7][2910/3239]	Time 0.394 (0.514)	Data 0.001 (0.010)	Loss 5.6590 (5.7297)	Top-1 acc 4.297 (4.688)	Top-5 acc 14.844 (14.388)	lr 0.04642
Warmup Train [7][2920/3239]	Time 0.635 (0.514)	Data 0.001 (0.010)	Loss 5.7210 (5.7295)	Top-1 acc 5.469 (4.690)	Top-5 acc 13.281 (14.393)	lr 0.04642
Warmup Train [7][2930/3239]	Time 0.714 (0.514)	Data 0.001 (0.010)	Loss 5.6798 (5.7292)	Top-1 acc 4.688 (4.694)	Top-5 acc 14.062 (14.400)	lr 0.04641
Warmup Train [7][2940/3239]	Time 0.442 (0.514)	Data 0.001 (0.009)	Loss 5.6251 (5.7290)	Top-1 acc 4.297 (4.695)	Top-5 acc 18.750 (14.401)	lr 0.04641
Warmup Train [7][2950/3239]	Time 0.522 (0.514)	Data 0.001 (0.010)	Loss 5.6192 (5.7287)	Top-1 acc 4.688 (4.698)	Top-5 acc 15.234 (14.408)	lr 0.04641
Warmup Train [7][2960/3239]	Time 0.510 (0.514)	Data 0.001 (0.009)	Loss 5.7364 (5.7285)	Top-1 acc 4.297 (4.699)	Top-5 acc 15.234 (14.412)	lr 0.04640
Warmup Train [7][2970/3239]	Time 0.526 (0.514)	Data 0.001 (0.009)	Loss 5.6192 (5.7282)	Top-1 acc 5.469 (4.702)	Top-5 acc 19.141 (14.421)	lr 0.04640
Warmup Train [7][2980/3239]	Time 0.550 (0.514)	Data 0.001 (0.009)	Loss 5.7600 (5.7280)	Top-1 acc 3.516 (4.706)	Top-5 acc 11.328 (14.424)	lr 0.04640
Warmup Train [7][2990/3239]	Time 0.422 (0.514)	Data 0.001 (0.009)	Loss 5.6251 (5.7276)	Top-1 acc 5.859 (4.710)	Top-5 acc 15.234 (14.432)	lr 0.04639
Warmup Train [7][3000/3239]	Time 0.530 (0.514)	Data 0.001 (0.009)	Loss 5.5360 (5.7273)	Top-1 acc 7.031 (4.714)	Top-5 acc 17.578 (14.442)	lr 0.04639
Warmup Train [7][3010/3239]	Time 0.454 (0.514)	Data 0.001 (0.009)	Loss 5.6455 (5.7271)	Top-1 acc 7.031 (4.718)	Top-5 acc 18.359 (14.448)	lr 0.04639
Warmup Train [7][3020/3239]	Time 0.602 (0.514)	Data 0.001 (0.009)	Loss 5.6793 (5.7268)	Top-1 acc 7.422 (4.719)	Top-5 acc 17.578 (14.453)	lr 0.04639
Warmup Train [7][3030/3239]	Time 0.420 (0.514)	Data 0.001 (0.009)	Loss 5.6105 (5.7267)	Top-1 acc 4.688 (4.721)	Top-5 acc 15.234 (14.458)	lr 0.04638
Warmup Train [7][3040/3239]	Time 0.484 (0.514)	Data 0.001 (0.009)	Loss 5.6949 (5.7264)	Top-1 acc 5.469 (4.724)	Top-5 acc 17.969 (14.465)	lr 0.04638
Warmup Train [7][3050/3239]	Time 0.534 (0.514)	Data 0.001 (0.009)	Loss 5.6978 (5.7262)	Top-1 acc 5.859 (4.726)	Top-5 acc 17.188 (14.470)	lr 0.04638
Warmup Train [7][3060/3239]	Time 0.428 (0.514)	Data 0.001 (0.009)	Loss 5.5548 (5.7260)	Top-1 acc 4.688 (4.728)	Top-5 acc 18.750 (14.475)	lr 0.04637
Warmup Train [7][3070/3239]	Time 0.167 (0.514)	Data 0.001 (0.009)	Loss 5.7815 (5.7256)	Top-1 acc 4.297 (4.733)	Top-5 acc 16.016 (14.483)	lr 0.04637
Warmup Train [7][3080/3239]	Time 0.475 (0.514)	Data 0.001 (0.009)	Loss 5.6126 (5.7254)	Top-1 acc 4.688 (4.735)	Top-5 acc 16.797 (14.489)	lr 0.04637
Warmup Train [7][3090/3239]	Time 0.469 (0.514)	Data 0.001 (0.009)	Loss 5.7366 (5.7252)	Top-1 acc 5.078 (4.738)	Top-5 acc 14.453 (14.493)	lr 0.04636
Warmup Train [7][3100/3239]	Time 0.527 (0.514)	Data 0.001 (0.009)	Loss 5.6686 (5.7249)	Top-1 acc 4.688 (4.740)	Top-5 acc 15.234 (14.496)	lr 0.04636
Warmup Train [7][3110/3239]	Time 0.379 (0.514)	Data 0.001 (0.009)	Loss 5.6294 (5.7247)	Top-1 acc 5.469 (4.741)	Top-5 acc 18.359 (14.502)	lr 0.04636
Warmup Train [7][3120/3239]	Time 0.598 (0.514)	Data 0.002 (0.009)	Loss 5.7479 (5.7245)	Top-1 acc 7.422 (4.745)	Top-5 acc 15.234 (14.507)	lr 0.04635
Warmup Train [7][3130/3239]	Time 0.466 (0.514)	Data 0.001 (0.009)	Loss 5.7119 (5.7244)	Top-1 acc 5.469 (4.745)	Top-5 acc 15.234 (14.510)	lr 0.04635
Warmup Train [7][3140/3239]	Time 0.565 (0.514)	Data 0.001 (0.009)	Loss 5.6352 (5.7243)	Top-1 acc 3.906 (4.746)	Top-5 acc 16.797 (14.513)	lr 0.04635
Warmup Train [7][3150/3239]	Time 0.664 (0.514)	Data 0.001 (0.009)	Loss 5.6628 (5.7243)	Top-1 acc 6.250 (4.746)	Top-5 acc 16.797 (14.511)	lr 0.04634
Warmup Train [7][3160/3239]	Time 0.577 (0.514)	Data 0.001 (0.009)	Loss 5.6921 (5.7239)	Top-1 acc 6.250 (4.751)	Top-5 acc 14.062 (14.520)	lr 0.04634
Warmup Train [7][3170/3239]	Time 0.530 (0.514)	Data 0.001 (0.009)	Loss 5.6311 (5.7236)	Top-1 acc 7.031 (4.754)	Top-5 acc 17.188 (14.528)	lr 0.04634
Warmup Train [7][3180/3239]	Time 0.603 (0.514)	Data 0.000 (0.009)	Loss 5.5815 (5.7233)	Top-1 acc 5.469 (4.759)	Top-5 acc 18.359 (14.539)	lr 0.04633
Warmup Train [7][3190/3239]	Time 0.633 (0.514)	Data 0.000 (0.009)	Loss 5.6003 (5.7231)	Top-1 acc 3.906 (4.759)	Top-5 acc 14.062 (14.543)	lr 0.04633
Warmup Train [7][3200/3239]	Time 0.501 (0.514)	Data 0.000 (0.009)	Loss 5.6940 (5.7228)	Top-1 acc 7.031 (4.763)	Top-5 acc 14.844 (14.547)	lr 0.04633
Warmup Train [7][3210/3239]	Time 0.504 (0.514)	Data 0.000 (0.009)	Loss 5.6107 (5.7225)	Top-1 acc 5.859 (4.764)	Top-5 acc 18.359 (14.552)	lr 0.04633
Warmup Train [7][3220/3239]	Time 0.702 (0.514)	Data 0.000 (0.009)	Loss 5.6562 (5.7223)	Top-1 acc 5.078 (4.766)	Top-5 acc 16.797 (14.553)	lr 0.04632
Warmup Train [7][3230/3239]	Time 0.624 (0.514)	Data 0.000 (0.009)	Loss 5.5888 (5.7221)	Top-1 acc 3.906 (4.766)	Top-5 acc 14.062 (14.554)	lr 0.04632
Warmup Train [7][3239/3239]	Time 0.267 (0.514)	Data 0.000 (0.009)	Loss 5.9043 (5.7219)	Top-1 acc 6.173 (4.767)	Top-5 acc 9.877 (14.556)	lr 0.04632
==========Warmup Valid [7/40]	loss 5.112	top-1 acc 7.377	top-5 acc 20.852	Train top-1 4.767	top-5 14.556	flops: 442.4M
Warmup Train [8][0/3239]	Time 11.041 (11.041)	Data 9.334 (9.334)	Loss 5.5902 (5.5902)	Top-1 acc 4.688 (4.688)	Top-5 acc 15.625 (15.625)	lr 0.04632
Warmup Train [8][10/3239]	Time 0.308 (1.553)	Data 0.001 (0.859)	Loss 5.5836 (5.6411)	Top-1 acc 3.125 (5.114)	Top-5 acc 18.359 (16.051)	lr 0.04631
Warmup Train [8][20/3239]	Time 0.477 (1.058)	Data 0.001 (0.459)	Loss 5.7177 (5.6460)	Top-1 acc 5.078 (5.469)	Top-5 acc 12.891 (16.053)	lr 0.04631
Warmup Train [8][30/3239]	Time 0.578 (0.881)	Data 0.001 (0.312)	Loss 5.7847 (5.6517)	Top-1 acc 8.594 (5.696)	Top-5 acc 15.625 (16.079)	lr 0.04631
Warmup Train [8][40/3239]	Time 0.528 (0.789)	Data 0.001 (0.237)	Loss 5.5762 (5.6474)	Top-1 acc 8.594 (5.802)	Top-5 acc 19.141 (16.244)	lr 0.04630
Warmup Train [8][50/3239]	Time 0.632 (0.736)	Data 0.001 (0.191)	Loss 5.6706 (5.6424)	Top-1 acc 6.250 (5.890)	Top-5 acc 16.016 (16.314)	lr 0.04630
Warmup Train [8][60/3239]	Time 0.618 (0.700)	Data 0.001 (0.160)	Loss 5.6111 (5.6473)	Top-1 acc 3.906 (5.680)	Top-5 acc 13.281 (16.214)	lr 0.04630
Warmup Train [8][70/3239]	Time 0.637 (0.674)	Data 0.001 (0.138)	Loss 5.5817 (5.6444)	Top-1 acc 5.078 (5.645)	Top-5 acc 19.531 (16.131)	lr 0.04629
Warmup Train [8][80/3239]	Time 0.566 (0.653)	Data 0.001 (0.121)	Loss 5.6624 (5.6458)	Top-1 acc 5.078 (5.618)	Top-5 acc 15.234 (16.146)	lr 0.04629
Warmup Train [8][90/3239]	Time 0.342 (0.637)	Data 0.001 (0.108)	Loss 5.6269 (5.6444)	Top-1 acc 4.297 (5.546)	Top-5 acc 16.016 (16.144)	lr 0.04629
Warmup Train [8][100/3239]	Time 0.525 (0.627)	Data 0.001 (0.099)	Loss 5.6277 (5.6440)	Top-1 acc 3.516 (5.434)	Top-5 acc 14.844 (16.085)	lr 0.04628
Warmup Train [8][110/3239]	Time 0.602 (0.616)	Data 0.001 (0.090)	Loss 5.5675 (5.6422)	Top-1 acc 4.297 (5.427)	Top-5 acc 17.578 (16.114)	lr 0.04628
Warmup Train [8][120/3239]	Time 0.606 (0.606)	Data 0.001 (0.083)	Loss 5.6502 (5.6379)	Top-1 acc 5.859 (5.446)	Top-5 acc 18.359 (16.261)	lr 0.04628
Warmup Train [8][130/3239]	Time 0.570 (0.599)	Data 0.001 (0.077)	Loss 5.6622 (5.6389)	Top-1 acc 4.297 (5.412)	Top-5 acc 15.234 (16.224)	lr 0.04627
Warmup Train [8][140/3239]	Time 0.505 (0.593)	Data 0.001 (0.072)	Loss 5.5637 (5.6401)	Top-1 acc 6.250 (5.402)	Top-5 acc 16.797 (16.221)	lr 0.04627
Warmup Train [8][150/3239]	Time 0.491 (0.589)	Data 0.001 (0.067)	Loss 5.5230 (5.6406)	Top-1 acc 6.641 (5.389)	Top-5 acc 18.359 (16.153)	lr 0.04627
Warmup Train [8][160/3239]	Time 0.671 (0.583)	Data 0.001 (0.063)	Loss 5.6582 (5.6432)	Top-1 acc 5.469 (5.394)	Top-5 acc 16.406 (16.074)	lr 0.04627
Warmup Train [8][170/3239]	Time 0.613 (0.579)	Data 0.001 (0.060)	Loss 5.6231 (5.6459)	Top-1 acc 5.859 (5.412)	Top-5 acc 18.359 (16.036)	lr 0.04626
Warmup Train [8][180/3239]	Time 0.574 (0.575)	Data 0.001 (0.057)	Loss 5.6368 (5.6453)	Top-1 acc 4.297 (5.417)	Top-5 acc 12.500 (16.061)	lr 0.04626
Warmup Train [8][190/3239]	Time 0.471 (0.571)	Data 0.001 (0.054)	Loss 5.7206 (5.6449)	Top-1 acc 5.078 (5.385)	Top-5 acc 13.281 (16.061)	lr 0.04626
Warmup Train [8][200/3239]	Time 0.637 (0.567)	Data 0.001 (0.051)	Loss 5.6563 (5.6448)	Top-1 acc 7.031 (5.377)	Top-5 acc 16.406 (16.054)	lr 0.04625
Warmup Train [8][210/3239]	Time 0.510 (0.562)	Data 0.001 (0.049)	Loss 5.5880 (5.6432)	Top-1 acc 8.594 (5.434)	Top-5 acc 19.141 (16.125)	lr 0.04625
Warmup Train [8][220/3239]	Time 0.454 (0.559)	Data 0.001 (0.047)	Loss 5.6274 (5.6431)	Top-1 acc 7.031 (5.453)	Top-5 acc 17.969 (16.131)	lr 0.04625
Warmup Train [8][230/3239]	Time 0.583 (0.556)	Data 0.001 (0.045)	Loss 5.5313 (5.6422)	Top-1 acc 6.641 (5.491)	Top-5 acc 17.969 (16.144)	lr 0.04624
Warmup Train [8][240/3239]	Time 0.428 (0.553)	Data 0.001 (0.044)	Loss 5.7044 (5.6417)	Top-1 acc 3.516 (5.498)	Top-5 acc 9.766 (16.144)	lr 0.04624
Warmup Train [8][250/3239]	Time 0.416 (0.552)	Data 0.001 (0.043)	Loss 5.6751 (5.6420)	Top-1 acc 3.516 (5.515)	Top-5 acc 15.234 (16.134)	lr 0.04624
Warmup Train [8][260/3239]	Time 0.535 (0.551)	Data 0.001 (0.041)	Loss 5.7286 (5.6403)	Top-1 acc 3.125 (5.524)	Top-5 acc 16.016 (16.165)	lr 0.04623
Warmup Train [8][270/3239]	Time 0.516 (0.550)	Data 0.001 (0.040)	Loss 5.6809 (5.6395)	Top-1 acc 3.125 (5.541)	Top-5 acc 14.062 (16.167)	lr 0.04623
Warmup Train [8][280/3239]	Time 0.501 (0.548)	Data 0.001 (0.039)	Loss 5.4946 (5.6388)	Top-1 acc 6.641 (5.541)	Top-5 acc 20.703 (16.189)	lr 0.04623
Warmup Train [8][290/3239]	Time 0.417 (0.546)	Data 0.001 (0.037)	Loss 5.6927 (5.6395)	Top-1 acc 5.078 (5.552)	Top-5 acc 14.453 (16.177)	lr 0.04622
Warmup Train [8][300/3239]	Time 0.529 (0.545)	Data 0.001 (0.037)	Loss 5.6575 (5.6399)	Top-1 acc 4.297 (5.539)	Top-5 acc 15.625 (16.151)	lr 0.04622
Warmup Train [8][310/3239]	Time 0.369 (0.544)	Data 0.001 (0.036)	Loss 5.6541 (5.6406)	Top-1 acc 5.469 (5.519)	Top-5 acc 16.016 (16.135)	lr 0.04622
Warmup Train [8][320/3239]	Time 0.583 (0.543)	Data 0.001 (0.035)	Loss 5.5633 (5.6406)	Top-1 acc 7.422 (5.550)	Top-5 acc 18.359 (16.148)	lr 0.04621
Warmup Train [8][330/3239]	Time 0.568 (0.543)	Data 0.001 (0.034)	Loss 5.8228 (5.6413)	Top-1 acc 4.688 (5.544)	Top-5 acc 12.500 (16.123)	lr 0.04621
Warmup Train [8][340/3239]	Time 0.515 (0.542)	Data 0.001 (0.033)	Loss 5.6748 (5.6418)	Top-1 acc 4.688 (5.529)	Top-5 acc 12.891 (16.096)	lr 0.04621
Warmup Train [8][350/3239]	Time 0.597 (0.541)	Data 0.001 (0.032)	Loss 5.6166 (5.6423)	Top-1 acc 7.812 (5.539)	Top-5 acc 15.234 (16.091)	lr 0.04620
Warmup Train [8][360/3239]	Time 0.531 (0.541)	Data 0.001 (0.031)	Loss 5.6025 (5.6411)	Top-1 acc 5.859 (5.554)	Top-5 acc 17.969 (16.128)	lr 0.04620
Warmup Train [8][370/3239]	Time 0.519 (0.541)	Data 0.001 (0.031)	Loss 5.7241 (5.6405)	Top-1 acc 5.078 (5.568)	Top-5 acc 11.719 (16.136)	lr 0.04620
Warmup Train [8][380/3239]	Time 0.617 (0.540)	Data 0.001 (0.030)	Loss 5.6470 (5.6405)	Top-1 acc 5.859 (5.574)	Top-5 acc 18.750 (16.129)	lr 0.04619
Warmup Train [8][390/3239]	Time 0.534 (0.539)	Data 0.001 (0.029)	Loss 5.6071 (5.6410)	Top-1 acc 5.859 (5.566)	Top-5 acc 19.141 (16.138)	lr 0.04619
Warmup Train [8][400/3239]	Time 0.503 (0.539)	Data 0.002 (0.029)	Loss 5.5377 (5.6409)	Top-1 acc 3.125 (5.535)	Top-5 acc 17.188 (16.123)	lr 0.04619
Warmup Train [8][410/3239]	Time 0.492 (0.538)	Data 0.001 (0.028)	Loss 5.6188 (5.6406)	Top-1 acc 5.469 (5.548)	Top-5 acc 17.578 (16.148)	lr 0.04619
Warmup Train [8][420/3239]	Time 0.415 (0.537)	Data 0.001 (0.028)	Loss 5.5631 (5.6398)	Top-1 acc 8.203 (5.560)	Top-5 acc 19.531 (16.178)	lr 0.04618
Warmup Train [8][430/3239]	Time 0.509 (0.537)	Data 0.001 (0.027)	Loss 5.5606 (5.6397)	Top-1 acc 4.688 (5.554)	Top-5 acc 16.406 (16.201)	lr 0.04618
Warmup Train [8][440/3239]	Time 0.523 (0.537)	Data 0.001 (0.027)	Loss 5.6593 (5.6388)	Top-1 acc 5.469 (5.551)	Top-5 acc 19.141 (16.221)	lr 0.04618
Warmup Train [8][450/3239]	Time 0.470 (0.536)	Data 0.001 (0.026)	Loss 5.6814 (5.6394)	Top-1 acc 3.125 (5.527)	Top-5 acc 13.672 (16.191)	lr 0.04617
Warmup Train [8][460/3239]	Time 0.665 (0.536)	Data 0.001 (0.026)	Loss 5.4943 (5.6380)	Top-1 acc 6.641 (5.542)	Top-5 acc 17.578 (16.208)	lr 0.04617
Warmup Train [8][470/3239]	Time 0.596 (0.535)	Data 0.001 (0.026)	Loss 5.7113 (5.6380)	Top-1 acc 5.469 (5.535)	Top-5 acc 14.844 (16.211)	lr 0.04617
Warmup Train [8][480/3239]	Time 0.396 (0.532)	Data 0.001 (0.025)	Loss 5.6245 (5.6373)	Top-1 acc 5.078 (5.534)	Top-5 acc 16.797 (16.223)	lr 0.04616
Warmup Train [8][490/3239]	Time 0.507 (0.532)	Data 0.001 (0.025)	Loss 5.6693 (5.6369)	Top-1 acc 5.078 (5.549)	Top-5 acc 14.062 (16.241)	lr 0.04616
Warmup Train [8][500/3239]	Time 0.497 (0.531)	Data 0.001 (0.024)	Loss 5.6430 (5.6367)	Top-1 acc 5.078 (5.547)	Top-5 acc 15.625 (16.246)	lr 0.04616
Warmup Train [8][510/3239]	Time 0.506 (0.531)	Data 0.001 (0.024)	Loss 5.7049 (5.6362)	Top-1 acc 1.562 (5.538)	Top-5 acc 12.891 (16.250)	lr 0.04615
Warmup Train [8][520/3239]	Time 0.357 (0.530)	Data 0.001 (0.024)	Loss 5.6239 (5.6357)	Top-1 acc 4.297 (5.548)	Top-5 acc 14.062 (16.241)	lr 0.04615
Warmup Train [8][530/3239]	Time 0.350 (0.530)	Data 0.001 (0.023)	Loss 5.6110 (5.6350)	Top-1 acc 5.078 (5.558)	Top-5 acc 15.625 (16.256)	lr 0.04615
Warmup Train [8][540/3239]	Time 0.599 (0.529)	Data 0.001 (0.023)	Loss 5.5764 (5.6348)	Top-1 acc 4.688 (5.558)	Top-5 acc 15.234 (16.249)	lr 0.04614
Warmup Train [8][550/3239]	Time 0.536 (0.529)	Data 0.001 (0.023)	Loss 5.6958 (5.6344)	Top-1 acc 5.078 (5.560)	Top-5 acc 12.109 (16.265)	lr 0.04614
Warmup Train [8][560/3239]	Time 0.597 (0.529)	Data 0.001 (0.023)	Loss 5.7206 (5.6350)	Top-1 acc 4.688 (5.544)	Top-5 acc 13.281 (16.259)	lr 0.04614
Warmup Train [8][570/3239]	Time 0.371 (0.528)	Data 0.001 (0.022)	Loss 5.7291 (5.6345)	Top-1 acc 4.297 (5.565)	Top-5 acc 13.672 (16.283)	lr 0.04613
Warmup Train [8][580/3239]	Time 0.331 (0.528)	Data 0.001 (0.022)	Loss 5.5821 (5.6347)	Top-1 acc 6.250 (5.560)	Top-5 acc 16.797 (16.279)	lr 0.04613
Warmup Train [8][590/3239]	Time 0.511 (0.528)	Data 0.001 (0.022)	Loss 5.5937 (5.6353)	Top-1 acc 3.906 (5.553)	Top-5 acc 16.016 (16.275)	lr 0.04613
Warmup Train [8][600/3239]	Time 0.485 (0.528)	Data 0.001 (0.022)	Loss 5.6190 (5.6354)	Top-1 acc 7.812 (5.553)	Top-5 acc 17.188 (16.286)	lr 0.04612
Warmup Train [8][610/3239]	Time 0.381 (0.527)	Data 0.001 (0.022)	Loss 5.5840 (5.6350)	Top-1 acc 5.469 (5.557)	Top-5 acc 15.625 (16.303)	lr 0.04612
Warmup Train [8][620/3239]	Time 0.287 (0.527)	Data 0.001 (0.021)	Loss 5.6832 (5.6346)	Top-1 acc 3.125 (5.558)	Top-5 acc 15.625 (16.301)	lr 0.04612
Warmup Train [8][630/3239]	Time 0.532 (0.527)	Data 0.001 (0.021)	Loss 5.6169 (5.6344)	Top-1 acc 5.859 (5.558)	Top-5 acc 17.188 (16.293)	lr 0.04611
Warmup Train [8][640/3239]	Time 0.545 (0.527)	Data 0.001 (0.021)	Loss 5.6633 (5.6338)	Top-1 acc 5.469 (5.569)	Top-5 acc 16.406 (16.302)	lr 0.04611
Warmup Train [8][650/3239]	Time 0.544 (0.526)	Data 0.001 (0.021)	Loss 5.6416 (5.6333)	Top-1 acc 6.641 (5.568)	Top-5 acc 15.234 (16.314)	lr 0.04611
Warmup Train [8][660/3239]	Time 0.490 (0.526)	Data 0.001 (0.020)	Loss 5.6017 (5.6327)	Top-1 acc 5.859 (5.580)	Top-5 acc 17.969 (16.332)	lr 0.04610
Warmup Train [8][670/3239]	Time 0.648 (0.526)	Data 0.001 (0.020)	Loss 5.6247 (5.6329)	Top-1 acc 6.641 (5.582)	Top-5 acc 16.406 (16.334)	lr 0.04610
Warmup Train [8][680/3239]	Time 0.478 (0.526)	Data 0.001 (0.020)	Loss 5.4273 (5.6323)	Top-1 acc 8.594 (5.589)	Top-5 acc 21.484 (16.358)	lr 0.04610
Warmup Train [8][690/3239]	Time 0.618 (0.526)	Data 0.001 (0.020)	Loss 5.5185 (5.6315)	Top-1 acc 6.641 (5.590)	Top-5 acc 15.234 (16.363)	lr 0.04609
Warmup Train [8][700/3239]	Time 0.590 (0.525)	Data 0.002 (0.019)	Loss 5.6519 (5.6317)	Top-1 acc 5.469 (5.580)	Top-5 acc 14.844 (16.352)	lr 0.04609
Warmup Train [8][710/3239]	Time 0.633 (0.525)	Data 0.001 (0.019)	Loss 5.5956 (5.6320)	Top-1 acc 3.906 (5.585)	Top-5 acc 14.844 (16.350)	lr 0.04609
Warmup Train [8][720/3239]	Time 0.605 (0.524)	Data 0.001 (0.019)	Loss 5.6212 (5.6317)	Top-1 acc 5.469 (5.593)	Top-5 acc 16.016 (16.374)	lr 0.04608
Warmup Train [8][730/3239]	Time 0.435 (0.523)	Data 0.001 (0.019)	Loss 5.5343 (5.6312)	Top-1 acc 7.422 (5.599)	Top-5 acc 21.094 (16.391)	lr 0.04608
Warmup Train [8][740/3239]	Time 0.531 (0.523)	Data 0.001 (0.019)	Loss 5.6971 (5.6309)	Top-1 acc 3.516 (5.606)	Top-5 acc 11.719 (16.386)	lr 0.04608
Warmup Train [8][750/3239]	Time 0.526 (0.522)	Data 0.001 (0.018)	Loss 5.7732 (5.6306)	Top-1 acc 4.688 (5.623)	Top-5 acc 14.062 (16.399)	lr 0.04608
Warmup Train [8][760/3239]	Time 0.498 (0.522)	Data 0.001 (0.018)	Loss 5.5619 (5.6302)	Top-1 acc 7.422 (5.630)	Top-5 acc 16.016 (16.401)	lr 0.04607
Warmup Train [8][770/3239]	Time 0.515 (0.522)	Data 0.001 (0.018)	Loss 5.5568 (5.6303)	Top-1 acc 8.203 (5.636)	Top-5 acc 17.969 (16.392)	lr 0.04607
Warmup Train [8][780/3239]	Time 0.492 (0.522)	Data 0.001 (0.018)	Loss 5.8357 (5.6302)	Top-1 acc 4.297 (5.633)	Top-5 acc 13.281 (16.402)	lr 0.04607
Warmup Train [8][790/3239]	Time 0.723 (0.522)	Data 0.001 (0.018)	Loss 5.6141 (5.6303)	Top-1 acc 4.297 (5.628)	Top-5 acc 17.188 (16.401)	lr 0.04606
Warmup Train [8][800/3239]	Time 0.573 (0.522)	Data 0.001 (0.018)	Loss 5.4968 (5.6294)	Top-1 acc 5.859 (5.633)	Top-5 acc 21.484 (16.429)	lr 0.04606
Warmup Train [8][810/3239]	Time 0.653 (0.522)	Data 0.001 (0.017)	Loss 5.7058 (5.6293)	Top-1 acc 3.516 (5.633)	Top-5 acc 12.891 (16.436)	lr 0.04606
Warmup Train [8][820/3239]	Time 0.471 (0.522)	Data 0.001 (0.017)	Loss 5.5194 (5.6284)	Top-1 acc 7.812 (5.656)	Top-5 acc 20.312 (16.475)	lr 0.04605
Warmup Train [8][830/3239]	Time 0.449 (0.521)	Data 0.001 (0.017)	Loss 5.5864 (5.6281)	Top-1 acc 6.641 (5.657)	Top-5 acc 16.406 (16.478)	lr 0.04605
Warmup Train [8][840/3239]	Time 0.560 (0.522)	Data 0.001 (0.017)	Loss 5.4874 (5.6276)	Top-1 acc 5.469 (5.652)	Top-5 acc 19.531 (16.487)	lr 0.04605
Warmup Train [8][850/3239]	Time 0.421 (0.521)	Data 0.001 (0.017)	Loss 5.5759 (5.6268)	Top-1 acc 3.125 (5.656)	Top-5 acc 16.016 (16.500)	lr 0.04604
Warmup Train [8][860/3239]	Time 0.498 (0.521)	Data 0.002 (0.017)	Loss 5.6104 (5.6263)	Top-1 acc 5.469 (5.657)	Top-5 acc 16.016 (16.512)	lr 0.04604
Warmup Train [8][870/3239]	Time 0.382 (0.521)	Data 0.001 (0.017)	Loss 5.5117 (5.6259)	Top-1 acc 5.469 (5.653)	Top-5 acc 19.531 (16.512)	lr 0.04604
Warmup Train [8][880/3239]	Time 0.316 (0.520)	Data 0.001 (0.017)	Loss 5.7428 (5.6259)	Top-1 acc 7.812 (5.646)	Top-5 acc 17.969 (16.514)	lr 0.04603
Warmup Train [8][890/3239]	Time 0.595 (0.521)	Data 0.001 (0.017)	Loss 5.5244 (5.6254)	Top-1 acc 6.641 (5.652)	Top-5 acc 21.484 (16.521)	lr 0.04603
Warmup Train [8][900/3239]	Time 0.398 (0.521)	Data 0.001 (0.017)	Loss 5.6319 (5.6253)	Top-1 acc 6.250 (5.661)	Top-5 acc 18.359 (16.523)	lr 0.04603
Warmup Train [8][910/3239]	Time 0.522 (0.521)	Data 0.001 (0.017)	Loss 5.5769 (5.6248)	Top-1 acc 5.078 (5.660)	Top-5 acc 18.750 (16.540)	lr 0.04602
Warmup Train [8][920/3239]	Time 0.574 (0.521)	Data 0.001 (0.017)	Loss 5.6625 (5.6245)	Top-1 acc 5.859 (5.662)	Top-5 acc 16.406 (16.545)	lr 0.04602
Warmup Train [8][930/3239]	Time 0.499 (0.521)	Data 0.001 (0.016)	Loss 5.5341 (5.6240)	Top-1 acc 6.641 (5.664)	Top-5 acc 20.312 (16.566)	lr 0.04602
Warmup Train [8][940/3239]	Time 0.525 (0.521)	Data 0.001 (0.016)	Loss 5.5553 (5.6238)	Top-1 acc 6.250 (5.664)	Top-5 acc 18.359 (16.575)	lr 0.04601
Warmup Train [8][950/3239]	Time 0.550 (0.521)	Data 0.001 (0.016)	Loss 5.6706 (5.6234)	Top-1 acc 5.078 (5.665)	Top-5 acc 16.406 (16.586)	lr 0.04601
Warmup Train [8][960/3239]	Time 0.574 (0.520)	Data 0.001 (0.016)	Loss 5.5556 (5.6236)	Top-1 acc 6.250 (5.661)	Top-5 acc 20.312 (16.581)	lr 0.04601
Warmup Train [8][970/3239]	Time 0.566 (0.520)	Data 0.001 (0.016)	Loss 5.4743 (5.6233)	Top-1 acc 6.250 (5.662)	Top-5 acc 22.656 (16.592)	lr 0.04600
Warmup Train [8][980/3239]	Time 0.682 (0.520)	Data 0.001 (0.016)	Loss 5.6423 (5.6233)	Top-1 acc 5.859 (5.662)	Top-5 acc 15.234 (16.588)	lr 0.04600
Warmup Train [8][990/3239]	Time 0.564 (0.520)	Data 0.001 (0.015)	Loss 5.5881 (5.6234)	Top-1 acc 6.250 (5.662)	Top-5 acc 18.750 (16.589)	lr 0.04600
Warmup Train [8][1000/3239]	Time 0.468 (0.519)	Data 0.001 (0.015)	Loss 5.5464 (5.6232)	Top-1 acc 7.422 (5.671)	Top-5 acc 16.016 (16.594)	lr 0.04599
Warmup Train [8][1010/3239]	Time 0.561 (0.519)	Data 0.001 (0.015)	Loss 5.6344 (5.6229)	Top-1 acc 4.297 (5.671)	Top-5 acc 14.844 (16.595)	lr 0.04599
Warmup Train [8][1020/3239]	Time 0.460 (0.518)	Data 0.001 (0.015)	Loss 5.5970 (5.6227)	Top-1 acc 7.422 (5.674)	Top-5 acc 18.359 (16.607)	lr 0.04599
Warmup Train [8][1030/3239]	Time 0.628 (0.518)	Data 0.001 (0.015)	Loss 5.4291 (5.6224)	Top-1 acc 8.203 (5.676)	Top-5 acc 19.922 (16.610)	lr 0.04598
Warmup Train [8][1040/3239]	Time 0.375 (0.518)	Data 0.001 (0.015)	Loss 5.5419 (5.6227)	Top-1 acc 6.641 (5.675)	Top-5 acc 17.188 (16.601)	lr 0.04598
Warmup Train [8][1050/3239]	Time 0.641 (0.518)	Data 0.001 (0.015)	Loss 5.5258 (5.6229)	Top-1 acc 4.297 (5.670)	Top-5 acc 16.406 (16.592)	lr 0.04598
Warmup Train [8][1060/3239]	Time 0.593 (0.518)	Data 0.002 (0.015)	Loss 5.6052 (5.6225)	Top-1 acc 4.688 (5.678)	Top-5 acc 14.844 (16.604)	lr 0.04597
Warmup Train [8][1070/3239]	Time 0.529 (0.518)	Data 0.001 (0.015)	Loss 5.4279 (5.6219)	Top-1 acc 5.469 (5.685)	Top-5 acc 17.969 (16.616)	lr 0.04597
Warmup Train [8][1080/3239]	Time 0.456 (0.518)	Data 0.001 (0.015)	Loss 5.5592 (5.6211)	Top-1 acc 7.031 (5.681)	Top-5 acc 20.703 (16.630)	lr 0.04597
Warmup Train [8][1090/3239]	Time 0.461 (0.518)	Data 0.001 (0.015)	Loss 5.7912 (5.6209)	Top-1 acc 5.078 (5.682)	Top-5 acc 12.500 (16.631)	lr 0.04596
Warmup Train [8][1100/3239]	Time 0.637 (0.518)	Data 0.001 (0.015)	Loss 5.5470 (5.6206)	Top-1 acc 7.422 (5.683)	Top-5 acc 21.094 (16.636)	lr 0.04596
Warmup Train [8][1110/3239]	Time 0.592 (0.518)	Data 0.001 (0.015)	Loss 5.5990 (5.6205)	Top-1 acc 5.859 (5.684)	Top-5 acc 18.359 (16.651)	lr 0.04596
Warmup Train [8][1120/3239]	Time 0.459 (0.518)	Data 0.001 (0.014)	Loss 5.6375 (5.6203)	Top-1 acc 3.516 (5.684)	Top-5 acc 14.844 (16.659)	lr 0.04595
Warmup Train [8][1130/3239]	Time 0.371 (0.518)	Data 0.001 (0.014)	Loss 5.7551 (5.6205)	Top-1 acc 5.078 (5.689)	Top-5 acc 16.797 (16.656)	lr 0.04595
Warmup Train [8][1140/3239]	Time 0.366 (0.518)	Data 0.029 (0.014)	Loss 5.4869 (5.6202)	Top-1 acc 8.594 (5.696)	Top-5 acc 17.578 (16.669)	lr 0.04595
Warmup Train [8][1150/3239]	Time 0.584 (0.518)	Data 0.001 (0.014)	Loss 5.6845 (5.6201)	Top-1 acc 3.906 (5.696)	Top-5 acc 15.625 (16.671)	lr 0.04594
Warmup Train [8][1160/3239]	Time 0.509 (0.518)	Data 0.001 (0.014)	Loss 5.6374 (5.6202)	Top-1 acc 4.297 (5.695)	Top-5 acc 13.672 (16.669)	lr 0.04594
Warmup Train [8][1170/3239]	Time 0.491 (0.518)	Data 0.002 (0.014)	Loss 5.5979 (5.6200)	Top-1 acc 8.984 (5.700)	Top-5 acc 18.359 (16.669)	lr 0.04594
Warmup Train [8][1180/3239]	Time 0.434 (0.518)	Data 0.001 (0.014)	Loss 5.5703 (5.6199)	Top-1 acc 5.859 (5.696)	Top-5 acc 16.406 (16.672)	lr 0.04593
Warmup Train [8][1190/3239]	Time 0.643 (0.518)	Data 0.001 (0.014)	Loss 5.5961 (5.6195)	Top-1 acc 5.469 (5.701)	Top-5 acc 17.969 (16.677)	lr 0.04593
Warmup Train [8][1200/3239]	Time 0.509 (0.518)	Data 0.001 (0.014)	Loss 5.4316 (5.6193)	Top-1 acc 6.641 (5.704)	Top-5 acc 19.531 (16.689)	lr 0.04593
Warmup Train [8][1210/3239]	Time 0.493 (0.518)	Data 0.001 (0.014)	Loss 5.6710 (5.6190)	Top-1 acc 7.031 (5.706)	Top-5 acc 15.234 (16.688)	lr 0.04592
Warmup Train [8][1220/3239]	Time 0.478 (0.518)	Data 0.021 (0.014)	Loss 5.6695 (5.6188)	Top-1 acc 4.688 (5.702)	Top-5 acc 13.672 (16.686)	lr 0.04592
Warmup Train [8][1230/3239]	Time 0.483 (0.518)	Data 0.001 (0.014)	Loss 5.5001 (5.6186)	Top-1 acc 4.688 (5.699)	Top-5 acc 16.016 (16.681)	lr 0.04592
Warmup Train [8][1240/3239]	Time 0.656 (0.518)	Data 0.001 (0.014)	Loss 5.4366 (5.6184)	Top-1 acc 12.500 (5.702)	Top-5 acc 22.656 (16.694)	lr 0.04591
Warmup Train [8][1250/3239]	Time 0.472 (0.518)	Data 0.002 (0.014)	Loss 5.5932 (5.6182)	Top-1 acc 5.078 (5.700)	Top-5 acc 15.625 (16.693)	lr 0.04591
Warmup Train [8][1260/3239]	Time 0.306 (0.517)	Data 0.001 (0.014)	Loss 5.6372 (5.6176)	Top-1 acc 5.469 (5.703)	Top-5 acc 19.141 (16.702)	lr 0.04591
Warmup Train [8][1270/3239]	Time 0.291 (0.517)	Data 0.001 (0.014)	Loss 5.7359 (5.6177)	Top-1 acc 7.422 (5.707)	Top-5 acc 16.406 (16.697)	lr 0.04590
Warmup Train [8][1280/3239]	Time 0.488 (0.517)	Data 0.001 (0.014)	Loss 5.3742 (5.6172)	Top-1 acc 8.984 (5.717)	Top-5 acc 24.609 (16.711)	lr 0.04590
Warmup Train [8][1290/3239]	Time 0.596 (0.517)	Data 0.001 (0.014)	Loss 5.4210 (5.6167)	Top-1 acc 7.031 (5.721)	Top-5 acc 23.438 (16.725)	lr 0.04590
Warmup Train [8][1300/3239]	Time 0.566 (0.517)	Data 0.001 (0.014)	Loss 5.6044 (5.6165)	Top-1 acc 7.422 (5.728)	Top-5 acc 14.062 (16.717)	lr 0.04589
Warmup Train [8][1310/3239]	Time 0.493 (0.517)	Data 0.001 (0.014)	Loss 5.6612 (5.6164)	Top-1 acc 5.078 (5.726)	Top-5 acc 17.188 (16.720)	lr 0.04589
Warmup Train [8][1320/3239]	Time 0.483 (0.517)	Data 0.001 (0.013)	Loss 5.6941 (5.6164)	Top-1 acc 5.078 (5.727)	Top-5 acc 16.406 (16.723)	lr 0.04589
Warmup Train [8][1330/3239]	Time 0.701 (0.517)	Data 0.001 (0.013)	Loss 5.5818 (5.6161)	Top-1 acc 4.688 (5.731)	Top-5 acc 14.062 (16.721)	lr 0.04588
Warmup Train [8][1340/3239]	Time 0.446 (0.517)	Data 0.001 (0.013)	Loss 5.5857 (5.6159)	Top-1 acc 5.859 (5.732)	Top-5 acc 18.359 (16.731)	lr 0.04588
Warmup Train [8][1350/3239]	Time 0.468 (0.517)	Data 0.001 (0.013)	Loss 5.4717 (5.6156)	Top-1 acc 4.688 (5.731)	Top-5 acc 14.844 (16.734)	lr 0.04588
Warmup Train [8][1360/3239]	Time 0.564 (0.517)	Data 0.001 (0.013)	Loss 5.6042 (5.6152)	Top-1 acc 5.078 (5.734)	Top-5 acc 12.891 (16.739)	lr 0.04587
Warmup Train [8][1370/3239]	Time 0.517 (0.517)	Data 0.001 (0.013)	Loss 5.6854 (5.6150)	Top-1 acc 2.734 (5.735)	Top-5 acc 14.453 (16.744)	lr 0.04587
Warmup Train [8][1380/3239]	Time 0.428 (0.517)	Data 0.001 (0.013)	Loss 5.5699 (5.6145)	Top-1 acc 6.250 (5.741)	Top-5 acc 18.359 (16.759)	lr 0.04587
Warmup Train [8][1390/3239]	Time 0.514 (0.517)	Data 0.001 (0.013)	Loss 5.6344 (5.6145)	Top-1 acc 3.516 (5.740)	Top-5 acc 15.234 (16.759)	lr 0.04586
Warmup Train [8][1400/3239]	Time 0.560 (0.517)	Data 0.001 (0.013)	Loss 5.5710 (5.6142)	Top-1 acc 6.641 (5.741)	Top-5 acc 16.797 (16.767)	lr 0.04586
Warmup Train [8][1410/3239]	Time 0.433 (0.517)	Data 0.001 (0.013)	Loss 5.5776 (5.6136)	Top-1 acc 5.859 (5.743)	Top-5 acc 16.016 (16.776)	lr 0.04586
Warmup Train [8][1420/3239]	Time 0.546 (0.517)	Data 0.001 (0.013)	Loss 5.4779 (5.6132)	Top-1 acc 6.641 (5.743)	Top-5 acc 17.188 (16.784)	lr 0.04585
Warmup Train [8][1430/3239]	Time 0.429 (0.517)	Data 0.001 (0.013)	Loss 5.6636 (5.6132)	Top-1 acc 5.469 (5.748)	Top-5 acc 17.188 (16.791)	lr 0.04585
Warmup Train [8][1440/3239]	Time 0.443 (0.516)	Data 0.001 (0.013)	Loss 5.6009 (5.6130)	Top-1 acc 3.906 (5.750)	Top-5 acc 14.453 (16.795)	lr 0.04585
Warmup Train [8][1450/3239]	Time 0.398 (0.516)	Data 0.001 (0.013)	Loss 5.6107 (5.6126)	Top-1 acc 5.469 (5.757)	Top-5 acc 17.188 (16.805)	lr 0.04584
Warmup Train [8][1460/3239]	Time 0.490 (0.516)	Data 0.001 (0.013)	Loss 5.6786 (5.6122)	Top-1 acc 5.469 (5.760)	Top-5 acc 17.578 (16.815)	lr 0.04584
Warmup Train [8][1470/3239]	Time 0.514 (0.516)	Data 0.001 (0.013)	Loss 5.5060 (5.6120)	Top-1 acc 7.031 (5.762)	Top-5 acc 16.797 (16.819)	lr 0.04584
Warmup Train [8][1480/3239]	Time 0.633 (0.516)	Data 0.001 (0.013)	Loss 5.6488 (5.6119)	Top-1 acc 5.078 (5.761)	Top-5 acc 16.016 (16.822)	lr 0.04583
Warmup Train [8][1490/3239]	Time 0.568 (0.517)	Data 0.001 (0.013)	Loss 5.5138 (5.6117)	Top-1 acc 7.422 (5.761)	Top-5 acc 17.969 (16.822)	lr 0.04583
Warmup Train [8][1500/3239]	Time 0.679 (0.516)	Data 0.001 (0.012)	Loss 5.5963 (5.6114)	Top-1 acc 7.422 (5.768)	Top-5 acc 17.188 (16.830)	lr 0.04583
Warmup Train [8][1510/3239]	Time 0.575 (0.516)	Data 0.001 (0.012)	Loss 5.5490 (5.6111)	Top-1 acc 6.641 (5.773)	Top-5 acc 16.797 (16.841)	lr 0.04582
Warmup Train [8][1520/3239]	Time 0.587 (0.516)	Data 0.001 (0.012)	Loss 5.5217 (5.6112)	Top-1 acc 7.422 (5.771)	Top-5 acc 20.312 (16.838)	lr 0.04582
Warmup Train [8][1530/3239]	Time 0.369 (0.516)	Data 0.024 (0.012)	Loss 5.3932 (5.6109)	Top-1 acc 9.766 (5.777)	Top-5 acc 23.828 (16.846)	lr 0.04582
Warmup Train [8][1540/3239]	Time 0.459 (0.516)	Data 0.001 (0.012)	Loss 5.5937 (5.6108)	Top-1 acc 5.469 (5.778)	Top-5 acc 16.797 (16.848)	lr 0.04581
Warmup Train [8][1550/3239]	Time 0.377 (0.515)	Data 0.001 (0.012)	Loss 5.6548 (5.6109)	Top-1 acc 3.906 (5.778)	Top-5 acc 16.016 (16.851)	lr 0.04581
Warmup Train [8][1560/3239]	Time 0.391 (0.516)	Data 0.001 (0.012)	Loss 5.6362 (5.6105)	Top-1 acc 7.812 (5.782)	Top-5 acc 18.359 (16.855)	lr 0.04581
Warmup Train [8][1570/3239]	Time 0.412 (0.516)	Data 0.001 (0.012)	Loss 5.5512 (5.6101)	Top-1 acc 5.078 (5.783)	Top-5 acc 17.578 (16.863)	lr 0.04580
Warmup Train [8][1580/3239]	Time 0.521 (0.516)	Data 0.001 (0.012)	Loss 5.7018 (5.6100)	Top-1 acc 5.078 (5.783)	Top-5 acc 12.891 (16.860)	lr 0.04580
Warmup Train [8][1590/3239]	Time 0.366 (0.516)	Data 0.001 (0.012)	Loss 5.6109 (5.6097)	Top-1 acc 5.859 (5.789)	Top-5 acc 16.406 (16.868)	lr 0.04580
Warmup Train [8][1600/3239]	Time 0.472 (0.516)	Data 0.001 (0.012)	Loss 5.5916 (5.6096)	Top-1 acc 5.078 (5.788)	Top-5 acc 14.844 (16.868)	lr 0.04579
Warmup Train [8][1610/3239]	Time 0.670 (0.516)	Data 0.001 (0.012)	Loss 5.5624 (5.6095)	Top-1 acc 7.031 (5.789)	Top-5 acc 16.016 (16.867)	lr 0.04579
Warmup Train [8][1620/3239]	Time 0.352 (0.516)	Data 0.001 (0.012)	Loss 5.7192 (5.6093)	Top-1 acc 2.734 (5.790)	Top-5 acc 12.109 (16.875)	lr 0.04579
Warmup Train [8][1630/3239]	Time 0.553 (0.516)	Data 0.001 (0.012)	Loss 5.6216 (5.6092)	Top-1 acc 6.250 (5.791)	Top-5 acc 16.406 (16.881)	lr 0.04578
Warmup Train [8][1640/3239]	Time 0.724 (0.516)	Data 0.001 (0.012)	Loss 5.4580 (5.6090)	Top-1 acc 4.688 (5.790)	Top-5 acc 18.359 (16.887)	lr 0.04578
Warmup Train [8][1650/3239]	Time 0.557 (0.516)	Data 0.001 (0.012)	Loss 5.5186 (5.6089)	Top-1 acc 5.078 (5.791)	Top-5 acc 16.406 (16.886)	lr 0.04578
Warmup Train [8][1660/3239]	Time 0.453 (0.516)	Data 0.001 (0.012)	Loss 5.4108 (5.6087)	Top-1 acc 7.422 (5.794)	Top-5 acc 21.484 (16.901)	lr 0.04577
Warmup Train [8][1670/3239]	Time 0.519 (0.516)	Data 0.001 (0.012)	Loss 5.5161 (5.6085)	Top-1 acc 6.250 (5.796)	Top-5 acc 20.703 (16.908)	lr 0.04577
Warmup Train [8][1680/3239]	Time 0.541 (0.516)	Data 0.001 (0.012)	Loss 5.6335 (5.6085)	Top-1 acc 4.297 (5.799)	Top-5 acc 18.750 (16.912)	lr 0.04577
Warmup Train [8][1690/3239]	Time 0.587 (0.516)	Data 0.001 (0.012)	Loss 5.6380 (5.6082)	Top-1 acc 6.250 (5.798)	Top-5 acc 17.188 (16.922)	lr 0.04576
Warmup Train [8][1700/3239]	Time 0.695 (0.516)	Data 0.001 (0.012)	Loss 5.6250 (5.6081)	Top-1 acc 3.125 (5.795)	Top-5 acc 16.797 (16.930)	lr 0.04576
Warmup Train [8][1710/3239]	Time 0.611 (0.516)	Data 0.002 (0.012)	Loss 5.5091 (5.6082)	Top-1 acc 8.203 (5.798)	Top-5 acc 20.703 (16.927)	lr 0.04576
Warmup Train [8][1720/3239]	Time 0.515 (0.516)	Data 0.001 (0.012)	Loss 5.5401 (5.6083)	Top-1 acc 5.859 (5.796)	Top-5 acc 15.625 (16.925)	lr 0.04575
Warmup Train [8][1730/3239]	Time 0.473 (0.516)	Data 0.001 (0.012)	Loss 5.5695 (5.6080)	Top-1 acc 3.906 (5.792)	Top-5 acc 14.062 (16.925)	lr 0.04575
Warmup Train [8][1740/3239]	Time 0.470 (0.516)	Data 0.001 (0.012)	Loss 5.6169 (5.6077)	Top-1 acc 5.859 (5.793)	Top-5 acc 17.578 (16.931)	lr 0.04575
Warmup Train [8][1750/3239]	Time 0.620 (0.516)	Data 0.001 (0.012)	Loss 5.5846 (5.6076)	Top-1 acc 6.250 (5.795)	Top-5 acc 16.797 (16.931)	lr 0.04574
Warmup Train [8][1760/3239]	Time 0.408 (0.516)	Data 0.001 (0.012)	Loss 5.5028 (5.6075)	Top-1 acc 8.203 (5.794)	Top-5 acc 19.531 (16.932)	lr 0.04574
Warmup Train [8][1770/3239]	Time 0.580 (0.516)	Data 0.001 (0.012)	Loss 5.6856 (5.6072)	Top-1 acc 4.297 (5.800)	Top-5 acc 12.500 (16.936)	lr 0.04574
Warmup Train [8][1780/3239]	Time 0.562 (0.516)	Data 0.001 (0.011)	Loss 5.4660 (5.6070)	Top-1 acc 6.641 (5.802)	Top-5 acc 20.703 (16.943)	lr 0.04573
Warmup Train [8][1790/3239]	Time 0.369 (0.515)	Data 0.001 (0.011)	Loss 5.5071 (5.6067)	Top-1 acc 8.594 (5.805)	Top-5 acc 21.094 (16.951)	lr 0.04573
Warmup Train [8][1800/3239]	Time 0.481 (0.515)	Data 0.001 (0.011)	Loss 5.5290 (5.6065)	Top-1 acc 9.375 (5.807)	Top-5 acc 19.141 (16.955)	lr 0.04573
Warmup Train [8][1810/3239]	Time 0.376 (0.515)	Data 0.001 (0.011)	Loss 5.5285 (5.6063)	Top-1 acc 2.734 (5.808)	Top-5 acc 20.703 (16.962)	lr 0.04572
Warmup Train [8][1820/3239]	Time 0.525 (0.515)	Data 0.001 (0.011)	Loss 5.5418 (5.6061)	Top-1 acc 7.422 (5.813)	Top-5 acc 19.531 (16.968)	lr 0.04572
Warmup Train [8][1830/3239]	Time 0.636 (0.515)	Data 0.001 (0.011)	Loss 5.5798 (5.6059)	Top-1 acc 8.984 (5.819)	Top-5 acc 17.578 (16.972)	lr 0.04572
Warmup Train [8][1840/3239]	Time 0.476 (0.515)	Data 0.001 (0.011)	Loss 5.5863 (5.6056)	Top-1 acc 7.422 (5.827)	Top-5 acc 17.188 (16.981)	lr 0.04571
Warmup Train [8][1850/3239]	Time 0.628 (0.515)	Data 0.001 (0.011)	Loss 5.5367 (5.6053)	Top-1 acc 5.469 (5.832)	Top-5 acc 19.922 (16.988)	lr 0.04571
Warmup Train [8][1860/3239]	Time 0.454 (0.515)	Data 0.001 (0.011)	Loss 5.4585 (5.6052)	Top-1 acc 5.078 (5.831)	Top-5 acc 20.703 (16.986)	lr 0.04571
Warmup Train [8][1870/3239]	Time 0.349 (0.515)	Data 0.001 (0.011)	Loss 5.7425 (5.6051)	Top-1 acc 5.859 (5.831)	Top-5 acc 17.188 (16.988)	lr 0.04570
Warmup Train [8][1880/3239]	Time 0.517 (0.515)	Data 0.001 (0.011)	Loss 5.6880 (5.6046)	Top-1 acc 3.906 (5.833)	Top-5 acc 11.719 (17.001)	lr 0.04570
Warmup Train [8][1890/3239]	Time 0.516 (0.515)	Data 0.001 (0.011)	Loss 5.4859 (5.6045)	Top-1 acc 9.766 (5.837)	Top-5 acc 20.312 (17.005)	lr 0.04570
Warmup Train [8][1900/3239]	Time 0.405 (0.515)	Data 0.001 (0.011)	Loss 5.6117 (5.6043)	Top-1 acc 7.031 (5.843)	Top-5 acc 17.969 (17.010)	lr 0.04569
Warmup Train [8][1910/3239]	Time 0.501 (0.515)	Data 0.001 (0.011)	Loss 5.5745 (5.6042)	Top-1 acc 8.203 (5.843)	Top-5 acc 20.703 (17.011)	lr 0.04569
Warmup Train [8][1920/3239]	Time 0.645 (0.515)	Data 0.001 (0.011)	Loss 5.4244 (5.6039)	Top-1 acc 8.594 (5.841)	Top-5 acc 21.094 (17.009)	lr 0.04569
Warmup Train [8][1930/3239]	Time 0.393 (0.515)	Data 0.002 (0.011)	Loss 5.5494 (5.6035)	Top-1 acc 6.641 (5.846)	Top-5 acc 14.844 (17.015)	lr 0.04568
Warmup Train [8][1940/3239]	Time 0.425 (0.515)	Data 0.001 (0.011)	Loss 5.6187 (5.6034)	Top-1 acc 3.906 (5.846)	Top-5 acc 14.062 (17.010)	lr 0.04568
Warmup Train [8][1950/3239]	Time 0.423 (0.515)	Data 0.001 (0.011)	Loss 5.5362 (5.6034)	Top-1 acc 7.031 (5.847)	Top-5 acc 17.578 (17.016)	lr 0.04567
Warmup Train [8][1960/3239]	Time 0.593 (0.515)	Data 0.001 (0.011)	Loss 5.6067 (5.6032)	Top-1 acc 4.297 (5.847)	Top-5 acc 17.969 (17.020)	lr 0.04567
Warmup Train [8][1970/3239]	Time 0.567 (0.515)	Data 0.001 (0.011)	Loss 5.5356 (5.6028)	Top-1 acc 5.859 (5.848)	Top-5 acc 14.844 (17.024)	lr 0.04567
Warmup Train [8][1980/3239]	Time 0.510 (0.515)	Data 0.001 (0.011)	Loss 5.6316 (5.6024)	Top-1 acc 7.812 (5.853)	Top-5 acc 18.750 (17.035)	lr 0.04566
Warmup Train [8][1990/3239]	Time 0.583 (0.515)	Data 0.001 (0.011)	Loss 5.5665 (5.6023)	Top-1 acc 7.031 (5.853)	Top-5 acc 19.141 (17.039)	lr 0.04566
Warmup Train [8][2000/3239]	Time 0.544 (0.515)	Data 0.001 (0.011)	Loss 5.4902 (5.6022)	Top-1 acc 7.031 (5.852)	Top-5 acc 21.094 (17.043)	lr 0.04566
Warmup Train [8][2010/3239]	Time 0.683 (0.515)	Data 0.001 (0.011)	Loss 5.4730 (5.6019)	Top-1 acc 5.859 (5.855)	Top-5 acc 22.656 (17.054)	lr 0.04565
Warmup Train [8][2020/3239]	Time 0.678 (0.515)	Data 0.001 (0.011)	Loss 5.5524 (5.6018)	Top-1 acc 7.422 (5.858)	Top-5 acc 15.234 (17.055)	lr 0.04565
Warmup Train [8][2030/3239]	Time 0.550 (0.515)	Data 0.001 (0.011)	Loss 5.4951 (5.6015)	Top-1 acc 5.469 (5.860)	Top-5 acc 18.750 (17.060)	lr 0.04565
Warmup Train [8][2040/3239]	Time 0.536 (0.515)	Data 0.001 (0.011)	Loss 5.5274 (5.6014)	Top-1 acc 5.469 (5.861)	Top-5 acc 21.484 (17.065)	lr 0.04564
Warmup Train [8][2050/3239]	Time 0.376 (0.515)	Data 0.001 (0.011)	Loss 5.4794 (5.6014)	Top-1 acc 4.688 (5.859)	Top-5 acc 17.188 (17.064)	lr 0.04564
Warmup Train [8][2060/3239]	Time 0.595 (0.514)	Data 0.001 (0.011)	Loss 5.6105 (5.6011)	Top-1 acc 5.469 (5.861)	Top-5 acc 16.406 (17.072)	lr 0.04564
Warmup Train [8][2070/3239]	Time 0.502 (0.514)	Data 0.001 (0.011)	Loss 5.5517 (5.6008)	Top-1 acc 4.297 (5.866)	Top-5 acc 15.625 (17.083)	lr 0.04563
Warmup Train [8][2080/3239]	Time 0.515 (0.514)	Data 0.001 (0.011)	Loss 5.5052 (5.6007)	Top-1 acc 7.812 (5.869)	Top-5 acc 17.188 (17.090)	lr 0.04563
Warmup Train [8][2090/3239]	Time 0.577 (0.514)	Data 0.001 (0.011)	Loss 5.5701 (5.6006)	Top-1 acc 6.250 (5.869)	Top-5 acc 14.453 (17.090)	lr 0.04563
Warmup Train [8][2100/3239]	Time 0.588 (0.514)	Data 0.001 (0.010)	Loss 5.4352 (5.6003)	Top-1 acc 8.984 (5.875)	Top-5 acc 22.656 (17.097)	lr 0.04562
Warmup Train [8][2110/3239]	Time 0.486 (0.514)	Data 0.001 (0.010)	Loss 5.6697 (5.6000)	Top-1 acc 6.250 (5.876)	Top-5 acc 14.453 (17.097)	lr 0.04562
Warmup Train [8][2120/3239]	Time 0.636 (0.514)	Data 0.001 (0.010)	Loss 5.5544 (5.5998)	Top-1 acc 7.812 (5.880)	Top-5 acc 18.750 (17.107)	lr 0.04562
Warmup Train [8][2130/3239]	Time 0.673 (0.514)	Data 0.001 (0.010)	Loss 5.7044 (5.5997)	Top-1 acc 5.859 (5.883)	Top-5 acc 16.797 (17.115)	lr 0.04561
Warmup Train [8][2140/3239]	Time 0.712 (0.514)	Data 0.001 (0.010)	Loss 5.5513 (5.5998)	Top-1 acc 6.250 (5.884)	Top-5 acc 16.016 (17.114)	lr 0.04561
Warmup Train [8][2150/3239]	Time 0.621 (0.514)	Data 0.001 (0.010)	Loss 5.5662 (5.5999)	Top-1 acc 3.906 (5.882)	Top-5 acc 16.016 (17.111)	lr 0.04561
Warmup Train [8][2160/3239]	Time 0.537 (0.514)	Data 0.001 (0.010)	Loss 5.5816 (5.5996)	Top-1 acc 4.688 (5.882)	Top-5 acc 17.969 (17.114)	lr 0.04560
Warmup Train [8][2170/3239]	Time 0.473 (0.514)	Data 0.001 (0.010)	Loss 5.5684 (5.5996)	Top-1 acc 5.859 (5.883)	Top-5 acc 19.141 (17.115)	lr 0.04560
Warmup Train [8][2180/3239]	Time 0.506 (0.514)	Data 0.001 (0.010)	Loss 5.6278 (5.5996)	Top-1 acc 2.734 (5.879)	Top-5 acc 16.797 (17.111)	lr 0.04560
Warmup Train [8][2190/3239]	Time 0.542 (0.514)	Data 0.001 (0.010)	Loss 5.4873 (5.5994)	Top-1 acc 8.984 (5.880)	Top-5 acc 19.141 (17.116)	lr 0.04559
Warmup Train [8][2200/3239]	Time 0.611 (0.514)	Data 0.001 (0.010)	Loss 5.4993 (5.5992)	Top-1 acc 6.641 (5.882)	Top-5 acc 19.922 (17.120)	lr 0.04559
Warmup Train [8][2210/3239]	Time 0.415 (0.514)	Data 0.001 (0.010)	Loss 5.6269 (5.5990)	Top-1 acc 3.906 (5.884)	Top-5 acc 14.844 (17.130)	lr 0.04559
Warmup Train [8][2220/3239]	Time 0.658 (0.514)	Data 0.002 (0.010)	Loss 5.6198 (5.5988)	Top-1 acc 5.078 (5.885)	Top-5 acc 14.844 (17.134)	lr 0.04558
Warmup Train [8][2230/3239]	Time 0.534 (0.514)	Data 0.001 (0.010)	Loss 5.6466 (5.5987)	Top-1 acc 3.906 (5.883)	Top-5 acc 14.062 (17.138)	lr 0.04558
Warmup Train [8][2240/3239]	Time 0.414 (0.514)	Data 0.001 (0.010)	Loss 5.4861 (5.5984)	Top-1 acc 6.641 (5.886)	Top-5 acc 21.484 (17.144)	lr 0.04558
Warmup Train [8][2250/3239]	Time 0.502 (0.514)	Data 0.001 (0.010)	Loss 5.6309 (5.5983)	Top-1 acc 3.516 (5.888)	Top-5 acc 15.625 (17.148)	lr 0.04557
Warmup Train [8][2260/3239]	Time 0.697 (0.514)	Data 0.001 (0.010)	Loss 5.5570 (5.5981)	Top-1 acc 6.250 (5.890)	Top-5 acc 17.969 (17.155)	lr 0.04557
Warmup Train [8][2270/3239]	Time 0.451 (0.514)	Data 0.001 (0.010)	Loss 5.4625 (5.5979)	Top-1 acc 5.859 (5.891)	Top-5 acc 17.969 (17.158)	lr 0.04557
Warmup Train [8][2280/3239]	Time 0.412 (0.514)	Data 0.001 (0.010)	Loss 5.6485 (5.5977)	Top-1 acc 5.078 (5.890)	Top-5 acc 15.625 (17.157)	lr 0.04556
Warmup Train [8][2290/3239]	Time 0.438 (0.514)	Data 0.001 (0.010)	Loss 5.4581 (5.5974)	Top-1 acc 7.422 (5.895)	Top-5 acc 18.359 (17.166)	lr 0.04556
Warmup Train [8][2300/3239]	Time 0.377 (0.514)	Data 0.001 (0.010)	Loss 5.4426 (5.5973)	Top-1 acc 8.984 (5.897)	Top-5 acc 20.703 (17.168)	lr 0.04555
Warmup Train [8][2310/3239]	Time 0.487 (0.514)	Data 0.001 (0.010)	Loss 5.6550 (5.5972)	Top-1 acc 6.250 (5.896)	Top-5 acc 15.234 (17.166)	lr 0.04555
Warmup Train [8][2320/3239]	Time 0.670 (0.514)	Data 0.001 (0.010)	Loss 5.5798 (5.5972)	Top-1 acc 5.469 (5.896)	Top-5 acc 18.359 (17.166)	lr 0.04555
Warmup Train [8][2330/3239]	Time 0.589 (0.514)	Data 0.001 (0.010)	Loss 5.5242 (5.5972)	Top-1 acc 6.641 (5.897)	Top-5 acc 16.406 (17.168)	lr 0.04554
Warmup Train [8][2340/3239]	Time 0.451 (0.513)	Data 0.001 (0.010)	Loss 5.5192 (5.5969)	Top-1 acc 6.250 (5.901)	Top-5 acc 17.969 (17.170)	lr 0.04554
Warmup Train [8][2350/3239]	Time 0.463 (0.513)	Data 0.001 (0.010)	Loss 5.4838 (5.5967)	Top-1 acc 7.812 (5.907)	Top-5 acc 20.703 (17.176)	lr 0.04554
Warmup Train [8][2360/3239]	Time 0.347 (0.513)	Data 0.001 (0.010)	Loss 5.5617 (5.5964)	Top-1 acc 6.250 (5.908)	Top-5 acc 20.312 (17.180)	lr 0.04553
Warmup Train [8][2370/3239]	Time 0.349 (0.513)	Data 0.001 (0.010)	Loss 5.5077 (5.5963)	Top-1 acc 8.203 (5.910)	Top-5 acc 21.484 (17.183)	lr 0.04553
Warmup Train [8][2380/3239]	Time 0.376 (0.513)	Data 0.001 (0.010)	Loss 5.5406 (5.5961)	Top-1 acc 7.422 (5.913)	Top-5 acc 19.141 (17.190)	lr 0.04553
Warmup Train [8][2390/3239]	Time 0.396 (0.513)	Data 0.001 (0.010)	Loss 5.6169 (5.5959)	Top-1 acc 8.203 (5.916)	Top-5 acc 17.969 (17.196)	lr 0.04552
Warmup Train [8][2400/3239]	Time 0.450 (0.513)	Data 0.001 (0.010)	Loss 5.5069 (5.5958)	Top-1 acc 7.422 (5.919)	Top-5 acc 19.922 (17.202)	lr 0.04552
Warmup Train [8][2410/3239]	Time 0.556 (0.513)	Data 0.001 (0.010)	Loss 5.6117 (5.5957)	Top-1 acc 6.641 (5.919)	Top-5 acc 16.016 (17.201)	lr 0.04552
Warmup Train [8][2420/3239]	Time 0.429 (0.514)	Data 0.001 (0.010)	Loss 5.5226 (5.5955)	Top-1 acc 6.641 (5.926)	Top-5 acc 19.531 (17.207)	lr 0.04551
Warmup Train [8][2430/3239]	Time 0.456 (0.514)	Data 0.001 (0.010)	Loss 5.4077 (5.5952)	Top-1 acc 8.594 (5.927)	Top-5 acc 19.922 (17.213)	lr 0.04551
Warmup Train [8][2440/3239]	Time 0.546 (0.514)	Data 0.001 (0.010)	Loss 5.6401 (5.5951)	Top-1 acc 5.859 (5.932)	Top-5 acc 15.625 (17.218)	lr 0.04551
Warmup Train [8][2450/3239]	Time 0.451 (0.514)	Data 0.001 (0.010)	Loss 5.5088 (5.5949)	Top-1 acc 5.859 (5.933)	Top-5 acc 19.922 (17.226)	lr 0.04550
Warmup Train [8][2460/3239]	Time 0.522 (0.514)	Data 0.001 (0.010)	Loss 5.5505 (5.5945)	Top-1 acc 8.203 (5.935)	Top-5 acc 16.797 (17.231)	lr 0.04550
Warmup Train [8][2470/3239]	Time 0.390 (0.514)	Data 0.002 (0.010)	Loss 5.4922 (5.5943)	Top-1 acc 7.031 (5.937)	Top-5 acc 23.438 (17.240)	lr 0.04550
Warmup Train [8][2480/3239]	Time 0.478 (0.514)	Data 0.001 (0.010)	Loss 5.6044 (5.5941)	Top-1 acc 5.469 (5.938)	Top-5 acc 15.234 (17.243)	lr 0.04549
Warmup Train [8][2490/3239]	Time 0.681 (0.514)	Data 0.001 (0.010)	Loss 5.5820 (5.5941)	Top-1 acc 6.641 (5.937)	Top-5 acc 18.750 (17.240)	lr 0.04549
Warmup Train [8][2500/3239]	Time 0.521 (0.514)	Data 0.001 (0.010)	Loss 5.4168 (5.5939)	Top-1 acc 5.859 (5.937)	Top-5 acc 17.578 (17.240)	lr 0.04549
Warmup Train [8][2510/3239]	Time 0.453 (0.513)	Data 0.001 (0.010)	Loss 5.6068 (5.5940)	Top-1 acc 6.641 (5.935)	Top-5 acc 16.016 (17.237)	lr 0.04548
Warmup Train [8][2520/3239]	Time 0.466 (0.514)	Data 0.001 (0.010)	Loss 5.5094 (5.5937)	Top-1 acc 5.078 (5.936)	Top-5 acc 19.141 (17.245)	lr 0.04548
Warmup Train [8][2530/3239]	Time 0.574 (0.513)	Data 0.001 (0.010)	Loss 5.5102 (5.5936)	Top-1 acc 6.250 (5.935)	Top-5 acc 17.578 (17.249)	lr 0.04548
Warmup Train [8][2540/3239]	Time 0.508 (0.513)	Data 0.001 (0.010)	Loss 5.5889 (5.5934)	Top-1 acc 4.297 (5.937)	Top-5 acc 18.359 (17.254)	lr 0.04547
Warmup Train [8][2550/3239]	Time 0.562 (0.513)	Data 0.001 (0.010)	Loss 5.5278 (5.5933)	Top-1 acc 4.297 (5.938)	Top-5 acc 18.359 (17.256)	lr 0.04547
Warmup Train [8][2560/3239]	Time 0.424 (0.513)	Data 0.001 (0.010)	Loss 5.4868 (5.5930)	Top-1 acc 6.641 (5.941)	Top-5 acc 21.094 (17.264)	lr 0.04546
Warmup Train [8][2570/3239]	Time 0.635 (0.513)	Data 0.002 (0.010)	Loss 5.6941 (5.5928)	Top-1 acc 3.906 (5.944)	Top-5 acc 15.625 (17.267)	lr 0.04546
Warmup Train [8][2580/3239]	Time 0.452 (0.513)	Data 0.001 (0.010)	Loss 5.4297 (5.5926)	Top-1 acc 8.984 (5.945)	Top-5 acc 19.531 (17.270)	lr 0.04546
Warmup Train [8][2590/3239]	Time 0.482 (0.513)	Data 0.001 (0.010)	Loss 5.4641 (5.5925)	Top-1 acc 8.984 (5.945)	Top-5 acc 18.750 (17.268)	lr 0.04545
Warmup Train [8][2600/3239]	Time 0.475 (0.513)	Data 0.003 (0.010)	Loss 5.4889 (5.5924)	Top-1 acc 7.422 (5.948)	Top-5 acc 17.969 (17.271)	lr 0.04545
Warmup Train [8][2610/3239]	Time 0.180 (0.513)	Data 0.001 (0.010)	Loss 5.5413 (5.5922)	Top-1 acc 8.594 (5.950)	Top-5 acc 19.141 (17.276)	lr 0.04545
Warmup Train [8][2620/3239]	Time 0.528 (0.513)	Data 0.001 (0.010)	Loss 5.5820 (5.5919)	Top-1 acc 6.250 (5.953)	Top-5 acc 19.531 (17.282)	lr 0.04544
Warmup Train [8][2630/3239]	Time 0.634 (0.513)	Data 0.001 (0.010)	Loss 5.5103 (5.5916)	Top-1 acc 6.250 (5.957)	Top-5 acc 22.266 (17.289)	lr 0.04544
Warmup Train [8][2640/3239]	Time 0.430 (0.513)	Data 0.001 (0.010)	Loss 5.5725 (5.5914)	Top-1 acc 4.688 (5.957)	Top-5 acc 15.234 (17.285)	lr 0.04544
Warmup Train [8][2650/3239]	Time 0.594 (0.513)	Data 0.001 (0.010)	Loss 5.3775 (5.5912)	Top-1 acc 7.422 (5.959)	Top-5 acc 19.531 (17.289)	lr 0.04543
Warmup Train [8][2660/3239]	Time 0.582 (0.513)	Data 0.001 (0.010)	Loss 5.5340 (5.5911)	Top-1 acc 8.203 (5.962)	Top-5 acc 19.141 (17.290)	lr 0.04543
Warmup Train [8][2670/3239]	Time 0.578 (0.513)	Data 0.001 (0.010)	Loss 5.6018 (5.5912)	Top-1 acc 5.078 (5.961)	Top-5 acc 18.359 (17.287)	lr 0.04543
Warmup Train [8][2680/3239]	Time 0.555 (0.513)	Data 0.001 (0.010)	Loss 5.4407 (5.5911)	Top-1 acc 6.641 (5.962)	Top-5 acc 18.359 (17.290)	lr 0.04542
Warmup Train [8][2690/3239]	Time 0.408 (0.513)	Data 0.001 (0.010)	Loss 5.4518 (5.5907)	Top-1 acc 5.859 (5.965)	Top-5 acc 21.094 (17.295)	lr 0.04542
Warmup Train [8][2700/3239]	Time 0.626 (0.513)	Data 0.001 (0.010)	Loss 5.5108 (5.5905)	Top-1 acc 6.641 (5.971)	Top-5 acc 17.188 (17.303)	lr 0.04542
Warmup Train [8][2710/3239]	Time 0.515 (0.513)	Data 0.001 (0.010)	Loss 5.6090 (5.5905)	Top-1 acc 4.688 (5.969)	Top-5 acc 16.797 (17.300)	lr 0.04541
Warmup Train [8][2720/3239]	Time 0.622 (0.513)	Data 0.001 (0.010)	Loss 5.5378 (5.5902)	Top-1 acc 5.078 (5.970)	Top-5 acc 21.094 (17.305)	lr 0.04541
Warmup Train [8][2730/3239]	Time 0.552 (0.513)	Data 0.001 (0.010)	Loss 5.5543 (5.5900)	Top-1 acc 5.859 (5.974)	Top-5 acc 19.531 (17.312)	lr 0.04541
Warmup Train [8][2740/3239]	Time 0.529 (0.513)	Data 0.001 (0.010)	Loss 5.6649 (5.5898)	Top-1 acc 3.125 (5.976)	Top-5 acc 17.188 (17.319)	lr 0.04540
Warmup Train [8][2750/3239]	Time 0.659 (0.513)	Data 0.001 (0.010)	Loss 5.6358 (5.5898)	Top-1 acc 5.859 (5.975)	Top-5 acc 15.625 (17.318)	lr 0.04540
Warmup Train [8][2760/3239]	Time 0.534 (0.513)	Data 0.001 (0.009)	Loss 5.5883 (5.5896)	Top-1 acc 6.250 (5.977)	Top-5 acc 16.016 (17.324)	lr 0.04540
Warmup Train [8][2770/3239]	Time 0.358 (0.513)	Data 0.001 (0.009)	Loss 5.4777 (5.5894)	Top-1 acc 10.156 (5.981)	Top-5 acc 24.609 (17.331)	lr 0.04539
Warmup Train [8][2780/3239]	Time 0.675 (0.513)	Data 0.001 (0.009)	Loss 5.4072 (5.5891)	Top-1 acc 3.516 (5.981)	Top-5 acc 19.922 (17.337)	lr 0.04539
Warmup Train [8][2790/3239]	Time 0.472 (0.513)	Data 0.001 (0.009)	Loss 5.5803 (5.5889)	Top-1 acc 4.688 (5.982)	Top-5 acc 15.234 (17.335)	lr 0.04538
Warmup Train [8][2800/3239]	Time 0.305 (0.513)	Data 0.001 (0.009)	Loss 5.5621 (5.5886)	Top-1 acc 4.688 (5.985)	Top-5 acc 18.750 (17.340)	lr 0.04538
Warmup Train [8][2810/3239]	Time 0.494 (0.513)	Data 0.001 (0.009)	Loss 5.4376 (5.5883)	Top-1 acc 9.766 (5.987)	Top-5 acc 18.750 (17.349)	lr 0.04538
Warmup Train [8][2820/3239]	Time 0.522 (0.513)	Data 0.001 (0.009)	Loss 5.4990 (5.5881)	Top-1 acc 6.250 (5.989)	Top-5 acc 19.922 (17.355)	lr 0.04537
Warmup Train [8][2830/3239]	Time 0.586 (0.513)	Data 0.001 (0.009)	Loss 5.4578 (5.5878)	Top-1 acc 8.203 (5.992)	Top-5 acc 19.141 (17.359)	lr 0.04537
Warmup Train [8][2840/3239]	Time 0.479 (0.513)	Data 0.001 (0.009)	Loss 5.5486 (5.5877)	Top-1 acc 6.250 (5.995)	Top-5 acc 19.141 (17.363)	lr 0.04537
Warmup Train [8][2850/3239]	Time 0.537 (0.513)	Data 0.001 (0.009)	Loss 5.4851 (5.5875)	Top-1 acc 12.500 (5.996)	Top-5 acc 25.391 (17.369)	lr 0.04536
Warmup Train [8][2860/3239]	Time 0.644 (0.513)	Data 0.001 (0.009)	Loss 5.4789 (5.5874)	Top-1 acc 5.078 (6.000)	Top-5 acc 16.406 (17.372)	lr 0.04536
Warmup Train [8][2870/3239]	Time 0.482 (0.513)	Data 0.001 (0.009)	Loss 5.5227 (5.5871)	Top-1 acc 5.469 (6.003)	Top-5 acc 17.578 (17.377)	lr 0.04536
Warmup Train [8][2880/3239]	Time 0.601 (0.513)	Data 0.001 (0.009)	Loss 5.4486 (5.5868)	Top-1 acc 6.250 (6.006)	Top-5 acc 19.922 (17.381)	lr 0.04535
Warmup Train [8][2890/3239]	Time 0.573 (0.513)	Data 0.001 (0.009)	Loss 5.4436 (5.5866)	Top-1 acc 8.594 (6.007)	Top-5 acc 20.703 (17.386)	lr 0.04535
Warmup Train [8][2900/3239]	Time 0.492 (0.513)	Data 0.001 (0.009)	Loss 5.5533 (5.5863)	Top-1 acc 5.078 (6.008)	Top-5 acc 16.406 (17.388)	lr 0.04535
Warmup Train [8][2910/3239]	Time 0.343 (0.512)	Data 0.001 (0.009)	Loss 5.4793 (5.5861)	Top-1 acc 5.859 (6.007)	Top-5 acc 19.531 (17.387)	lr 0.04534
Warmup Train [8][2920/3239]	Time 0.495 (0.512)	Data 0.001 (0.009)	Loss 5.5257 (5.5860)	Top-1 acc 7.422 (6.011)	Top-5 acc 16.016 (17.391)	lr 0.04534
Warmup Train [8][2930/3239]	Time 0.523 (0.512)	Data 0.001 (0.009)	Loss 5.5178 (5.5858)	Top-1 acc 6.641 (6.015)	Top-5 acc 18.359 (17.396)	lr 0.04534
Warmup Train [8][2940/3239]	Time 0.366 (0.512)	Data 0.001 (0.009)	Loss 5.4686 (5.5856)	Top-1 acc 6.641 (6.016)	Top-5 acc 17.188 (17.402)	lr 0.04533
Warmup Train [8][2950/3239]	Time 0.607 (0.512)	Data 0.001 (0.009)	Loss 5.5662 (5.5852)	Top-1 acc 7.812 (6.021)	Top-5 acc 19.141 (17.410)	lr 0.04533
Warmup Train [8][2960/3239]	Time 0.591 (0.512)	Data 0.001 (0.009)	Loss 5.6172 (5.5851)	Top-1 acc 5.859 (6.022)	Top-5 acc 16.797 (17.413)	lr 0.04532
Warmup Train [8][2970/3239]	Time 0.763 (0.512)	Data 0.001 (0.009)	Loss 5.5987 (5.5848)	Top-1 acc 4.297 (6.024)	Top-5 acc 16.406 (17.416)	lr 0.04532
Warmup Train [8][2980/3239]	Time 0.530 (0.512)	Data 0.001 (0.009)	Loss 5.5626 (5.5846)	Top-1 acc 5.469 (6.026)	Top-5 acc 17.188 (17.421)	lr 0.04532
Warmup Train [8][2990/3239]	Time 0.472 (0.512)	Data 0.001 (0.009)	Loss 5.5261 (5.5843)	Top-1 acc 5.859 (6.030)	Top-5 acc 18.750 (17.426)	lr 0.04531
Warmup Train [8][3000/3239]	Time 0.531 (0.512)	Data 0.001 (0.009)	Loss 5.6134 (5.5841)	Top-1 acc 5.859 (6.030)	Top-5 acc 16.797 (17.433)	lr 0.04531
Warmup Train [8][3010/3239]	Time 0.479 (0.512)	Data 0.001 (0.009)	Loss 5.5523 (5.5839)	Top-1 acc 4.297 (6.030)	Top-5 acc 14.844 (17.434)	lr 0.04531
Warmup Train [8][3020/3239]	Time 0.526 (0.512)	Data 0.001 (0.009)	Loss 5.5344 (5.5837)	Top-1 acc 8.203 (6.034)	Top-5 acc 21.094 (17.440)	lr 0.04530
Warmup Train [8][3030/3239]	Time 0.531 (0.512)	Data 0.001 (0.009)	Loss 5.5990 (5.5836)	Top-1 acc 4.297 (6.034)	Top-5 acc 15.625 (17.440)	lr 0.04530
Warmup Train [8][3040/3239]	Time 0.437 (0.512)	Data 0.001 (0.009)	Loss 5.5571 (5.5833)	Top-1 acc 5.469 (6.037)	Top-5 acc 14.453 (17.446)	lr 0.04530
Warmup Train [8][3050/3239]	Time 0.513 (0.512)	Data 0.001 (0.009)	Loss 5.5842 (5.5831)	Top-1 acc 3.516 (6.035)	Top-5 acc 18.750 (17.450)	lr 0.04529
Warmup Train [8][3060/3239]	Time 0.395 (0.512)	Data 0.001 (0.009)	Loss 5.4954 (5.5830)	Top-1 acc 5.469 (6.034)	Top-5 acc 17.578 (17.450)	lr 0.04529
Warmup Train [8][3070/3239]	Time 0.676 (0.512)	Data 0.001 (0.009)	Loss 5.6489 (5.5828)	Top-1 acc 4.297 (6.035)	Top-5 acc 16.016 (17.450)	lr 0.04529
Warmup Train [8][3080/3239]	Time 0.539 (0.512)	Data 0.001 (0.009)	Loss 5.5864 (5.5828)	Top-1 acc 5.859 (6.038)	Top-5 acc 16.797 (17.450)	lr 0.04528
Warmup Train [8][3090/3239]	Time 0.503 (0.513)	Data 0.001 (0.009)	Loss 5.3297 (5.5826)	Top-1 acc 8.594 (6.038)	Top-5 acc 23.438 (17.455)	lr 0.04528
Warmup Train [8][3100/3239]	Time 0.445 (0.513)	Data 0.002 (0.009)	Loss 5.6450 (5.5824)	Top-1 acc 4.297 (6.039)	Top-5 acc 16.797 (17.460)	lr 0.04528
Warmup Train [8][3110/3239]	Time 0.399 (0.512)	Data 0.001 (0.009)	Loss 5.3834 (5.5820)	Top-1 acc 9.766 (6.046)	Top-5 acc 21.094 (17.465)	lr 0.04527
Warmup Train [8][3120/3239]	Time 0.488 (0.512)	Data 0.001 (0.009)	Loss 5.4877 (5.5819)	Top-1 acc 5.859 (6.047)	Top-5 acc 22.266 (17.468)	lr 0.04527
Warmup Train [8][3130/3239]	Time 0.434 (0.512)	Data 0.001 (0.009)	Loss 5.4504 (5.5818)	Top-1 acc 6.250 (6.047)	Top-5 acc 17.578 (17.469)	lr 0.04526
Warmup Train [8][3140/3239]	Time 0.522 (0.512)	Data 0.001 (0.009)	Loss 5.5303 (5.5816)	Top-1 acc 6.250 (6.048)	Top-5 acc 18.359 (17.474)	lr 0.04526
Warmup Train [8][3150/3239]	Time 0.388 (0.512)	Data 0.001 (0.009)	Loss 5.4187 (5.5813)	Top-1 acc 8.984 (6.053)	Top-5 acc 25.000 (17.482)	lr 0.04526
Warmup Train [8][3160/3239]	Time 0.611 (0.512)	Data 0.001 (0.009)	Loss 5.6472 (5.5810)	Top-1 acc 4.297 (6.052)	Top-5 acc 16.406 (17.483)	lr 0.04525
Warmup Train [8][3170/3239]	Time 0.516 (0.512)	Data 0.001 (0.009)	Loss 5.4700 (5.5807)	Top-1 acc 7.422 (6.055)	Top-5 acc 17.578 (17.488)	lr 0.04525
Warmup Train [8][3180/3239]	Time 0.526 (0.512)	Data 0.000 (0.009)	Loss 5.5174 (5.5806)	Top-1 acc 6.641 (6.057)	Top-5 acc 17.578 (17.490)	lr 0.04525
Warmup Train [8][3190/3239]	Time 0.488 (0.512)	Data 0.000 (0.009)	Loss 5.6411 (5.5805)	Top-1 acc 6.250 (6.059)	Top-5 acc 11.719 (17.490)	lr 0.04524
Warmup Train [8][3200/3239]	Time 0.513 (0.512)	Data 0.000 (0.009)	Loss 5.5131 (5.5802)	Top-1 acc 5.859 (6.062)	Top-5 acc 17.188 (17.494)	lr 0.04524
Warmup Train [8][3210/3239]	Time 0.420 (0.512)	Data 0.000 (0.009)	Loss 5.4923 (5.5801)	Top-1 acc 5.469 (6.060)	Top-5 acc 19.141 (17.496)	lr 0.04524
Warmup Train [8][3220/3239]	Time 0.480 (0.512)	Data 0.000 (0.009)	Loss 5.5921 (5.5799)	Top-1 acc 5.469 (6.059)	Top-5 acc 17.578 (17.499)	lr 0.04523
Warmup Train [8][3230/3239]	Time 0.501 (0.512)	Data 0.000 (0.009)	Loss 5.4578 (5.5797)	Top-1 acc 7.422 (6.060)	Top-5 acc 21.875 (17.503)	lr 0.04523
Warmup Train [8][3239/3239]	Time 0.356 (0.512)	Data 0.000 (0.009)	Loss 5.7432 (5.5797)	Top-1 acc 3.704 (6.061)	Top-5 acc 13.580 (17.505)	lr 0.04523
==========Warmup Valid [8/40]	loss 4.920	top-1 acc 9.380	top-5 acc 24.347	Train top-1 6.061	top-5 17.505	flops: 442.4M
Warmup Train [9][0/3239]	Time 11.793 (11.793)	Data 10.274 (10.274)	Loss 5.5456 (5.5456)	Top-1 acc 4.297 (4.297)	Top-5 acc 16.797 (16.797)	lr 0.04523
Warmup Train [9][10/3239]	Time 0.454 (1.662)	Data 0.001 (1.044)	Loss 5.4943 (5.5541)	Top-1 acc 7.812 (6.143)	Top-5 acc 23.047 (18.572)	lr 0.04522
Warmup Train [9][20/3239]	Time 0.206 (1.088)	Data 0.001 (0.549)	Loss 5.4718 (5.5288)	Top-1 acc 5.469 (6.343)	Top-5 acc 16.797 (18.750)	lr 0.04522
Warmup Train [9][30/3239]	Time 0.537 (0.899)	Data 0.001 (0.377)	Loss 5.3861 (5.5164)	Top-1 acc 6.641 (6.552)	Top-5 acc 20.703 (18.838)	lr 0.04521
Warmup Train [9][40/3239]	Time 0.514 (0.811)	Data 0.001 (0.286)	Loss 5.6923 (5.5246)	Top-1 acc 6.250 (6.679)	Top-5 acc 15.625 (18.740)	lr 0.04521
Warmup Train [9][50/3239]	Time 0.622 (0.753)	Data 0.001 (0.230)	Loss 5.6165 (5.5269)	Top-1 acc 3.906 (6.641)	Top-5 acc 14.062 (18.543)	lr 0.04521
Warmup Train [9][60/3239]	Time 0.473 (0.712)	Data 0.001 (0.193)	Loss 5.4989 (5.5315)	Top-1 acc 6.641 (6.641)	Top-5 acc 20.703 (18.398)	lr 0.04520
Warmup Train [9][70/3239]	Time 0.564 (0.684)	Data 0.001 (0.166)	Loss 5.5586 (5.5311)	Top-1 acc 5.859 (6.701)	Top-5 acc 18.750 (18.458)	lr 0.04520
Warmup Train [9][80/3239]	Time 0.515 (0.663)	Data 0.001 (0.147)	Loss 5.3243 (5.5276)	Top-1 acc 9.766 (6.708)	Top-5 acc 24.219 (18.581)	lr 0.04520
Warmup Train [9][90/3239]	Time 0.355 (0.647)	Data 0.001 (0.131)	Loss 5.5005 (5.5229)	Top-1 acc 8.203 (6.735)	Top-5 acc 20.703 (18.707)	lr 0.04519
Warmup Train [9][100/3239]	Time 0.490 (0.635)	Data 0.001 (0.120)	Loss 5.4472 (5.5231)	Top-1 acc 6.250 (6.726)	Top-5 acc 18.359 (18.692)	lr 0.04519
Warmup Train [9][110/3239]	Time 0.496 (0.624)	Data 0.001 (0.109)	Loss 5.3456 (5.5197)	Top-1 acc 10.156 (6.725)	Top-5 acc 21.484 (18.673)	lr 0.04519
Warmup Train [9][120/3239]	Time 0.396 (0.616)	Data 0.001 (0.102)	Loss 5.6157 (5.5180)	Top-1 acc 5.469 (6.750)	Top-5 acc 12.891 (18.805)	lr 0.04518
Warmup Train [9][130/3239]	Time 0.563 (0.609)	Data 0.001 (0.095)	Loss 5.3695 (5.5133)	Top-1 acc 10.547 (6.808)	Top-5 acc 24.219 (19.006)	lr 0.04518
Warmup Train [9][140/3239]	Time 0.474 (0.602)	Data 0.001 (0.088)	Loss 5.4545 (5.5142)	Top-1 acc 7.422 (6.779)	Top-5 acc 20.312 (18.983)	lr 0.04518
Warmup Train [9][150/3239]	Time 0.373 (0.596)	Data 0.001 (0.083)	Loss 5.5000 (5.5125)	Top-1 acc 7.031 (6.850)	Top-5 acc 16.797 (18.965)	lr 0.04517
Warmup Train [9][160/3239]	Time 0.529 (0.591)	Data 0.001 (0.078)	Loss 5.5153 (5.5095)	Top-1 acc 8.594 (6.910)	Top-5 acc 20.703 (19.080)	lr 0.04517
Warmup Train [9][170/3239]	Time 0.656 (0.586)	Data 0.001 (0.074)	Loss 5.3715 (5.5082)	Top-1 acc 5.859 (6.926)	Top-5 acc 20.312 (19.088)	lr 0.04516
Warmup Train [9][180/3239]	Time 0.548 (0.581)	Data 0.002 (0.070)	Loss 5.4722 (5.5105)	Top-1 acc 7.031 (6.902)	Top-5 acc 19.531 (19.078)	lr 0.04516
Warmup Train [9][190/3239]	Time 0.336 (0.576)	Data 0.001 (0.066)	Loss 5.6883 (5.5121)	Top-1 acc 3.906 (6.876)	Top-5 acc 14.844 (19.016)	lr 0.04516
Warmup Train [9][200/3239]	Time 0.498 (0.573)	Data 0.001 (0.064)	Loss 5.5281 (5.5115)	Top-1 acc 7.031 (6.864)	Top-5 acc 17.969 (19.040)	lr 0.04515
Warmup Train [9][210/3239]	Time 0.530 (0.571)	Data 0.001 (0.061)	Loss 5.5754 (5.5097)	Top-1 acc 8.203 (6.881)	Top-5 acc 19.922 (19.078)	lr 0.04515
Warmup Train [9][220/3239]	Time 0.494 (0.568)	Data 0.002 (0.059)	Loss 5.4989 (5.5107)	Top-1 acc 7.031 (6.892)	Top-5 acc 18.750 (19.077)	lr 0.04515
Warmup Train [9][230/3239]	Time 0.510 (0.566)	Data 0.001 (0.056)	Loss 5.5761 (5.5121)	Top-1 acc 7.031 (6.852)	Top-5 acc 20.703 (19.043)	lr 0.04514
Warmup Train [9][240/3239]	Time 0.481 (0.565)	Data 0.001 (0.054)	Loss 5.5931 (5.5124)	Top-1 acc 7.031 (6.830)	Top-5 acc 15.234 (19.011)	lr 0.04514
Warmup Train [9][250/3239]	Time 0.559 (0.561)	Data 0.001 (0.052)	Loss 5.4542 (5.5117)	Top-1 acc 7.031 (6.844)	Top-5 acc 16.406 (18.979)	lr 0.04514
Warmup Train [9][260/3239]	Time 0.642 (0.560)	Data 0.001 (0.050)	Loss 5.5646 (5.5127)	Top-1 acc 8.203 (6.843)	Top-5 acc 18.359 (18.949)	lr 0.04513
Warmup Train [9][270/3239]	Time 0.481 (0.557)	Data 0.001 (0.049)	Loss 5.3782 (5.5136)	Top-1 acc 5.469 (6.801)	Top-5 acc 16.016 (18.922)	lr 0.04513
Warmup Train [9][280/3239]	Time 0.669 (0.555)	Data 0.001 (0.047)	Loss 5.4356 (5.5112)	Top-1 acc 7.812 (6.834)	Top-5 acc 22.656 (18.995)	lr 0.04513
Warmup Train [9][290/3239]	Time 0.605 (0.551)	Data 0.001 (0.045)	Loss 5.4011 (5.5121)	Top-1 acc 10.156 (6.850)	Top-5 acc 23.828 (18.984)	lr 0.04512
Warmup Train [9][300/3239]	Time 0.513 (0.550)	Data 0.001 (0.044)	Loss 5.6503 (5.5126)	Top-1 acc 6.641 (6.860)	Top-5 acc 19.531 (19.008)	lr 0.04512
Warmup Train [9][310/3239]	Time 0.510 (0.550)	Data 0.001 (0.043)	Loss 5.4792 (5.5132)	Top-1 acc 7.422 (6.833)	Top-5 acc 17.578 (18.971)	lr 0.04511
Warmup Train [9][320/3239]	Time 0.543 (0.549)	Data 0.001 (0.042)	Loss 5.5299 (5.5135)	Top-1 acc 4.297 (6.826)	Top-5 acc 14.453 (18.942)	lr 0.04511
Warmup Train [9][330/3239]	Time 0.601 (0.547)	Data 0.001 (0.041)	Loss 5.4471 (5.5127)	Top-1 acc 6.641 (6.832)	Top-5 acc 18.750 (18.946)	lr 0.04511
Warmup Train [9][340/3239]	Time 0.498 (0.546)	Data 0.001 (0.039)	Loss 5.5593 (5.5115)	Top-1 acc 8.203 (6.840)	Top-5 acc 16.406 (18.986)	lr 0.04510
Warmup Train [9][350/3239]	Time 0.394 (0.545)	Data 0.001 (0.039)	Loss 5.5226 (5.5107)	Top-1 acc 7.422 (6.840)	Top-5 acc 19.922 (19.010)	lr 0.04510
Warmup Train [9][360/3239]	Time 0.674 (0.545)	Data 0.001 (0.038)	Loss 5.5113 (5.5097)	Top-1 acc 5.469 (6.838)	Top-5 acc 21.094 (19.022)	lr 0.04510
Warmup Train [9][370/3239]	Time 0.433 (0.544)	Data 0.001 (0.037)	Loss 5.4614 (5.5091)	Top-1 acc 6.250 (6.853)	Top-5 acc 23.047 (19.033)	lr 0.04509
Warmup Train [9][380/3239]	Time 0.658 (0.543)	Data 0.001 (0.037)	Loss 5.5337 (5.5095)	Top-1 acc 5.469 (6.855)	Top-5 acc 18.359 (19.050)	lr 0.04509
Warmup Train [9][390/3239]	Time 0.606 (0.543)	Data 0.001 (0.036)	Loss 5.7115 (5.5097)	Top-1 acc 8.594 (6.887)	Top-5 acc 17.969 (19.075)	lr 0.04509
Warmup Train [9][400/3239]	Time 0.474 (0.542)	Data 0.001 (0.035)	Loss 5.4298 (5.5088)	Top-1 acc 8.594 (6.900)	Top-5 acc 21.484 (19.099)	lr 0.04508
Warmup Train [9][410/3239]	Time 0.526 (0.542)	Data 0.002 (0.034)	Loss 5.4892 (5.5087)	Top-1 acc 7.422 (6.871)	Top-5 acc 21.875 (19.105)	lr 0.04508
Warmup Train [9][420/3239]	Time 0.512 (0.541)	Data 0.001 (0.033)	Loss 5.5127 (5.5072)	Top-1 acc 6.641 (6.878)	Top-5 acc 18.750 (19.124)	lr 0.04507
Warmup Train [9][430/3239]	Time 0.592 (0.541)	Data 0.001 (0.033)	Loss 5.4939 (5.5062)	Top-1 acc 7.812 (6.884)	Top-5 acc 17.578 (19.145)	lr 0.04507
Warmup Train [9][440/3239]	Time 0.359 (0.540)	Data 0.001 (0.032)	Loss 5.4169 (5.5061)	Top-1 acc 9.766 (6.898)	Top-5 acc 20.703 (19.155)	lr 0.04507
Warmup Train [9][450/3239]	Time 0.397 (0.539)	Data 0.001 (0.031)	Loss 5.4277 (5.5058)	Top-1 acc 8.203 (6.896)	Top-5 acc 21.094 (19.151)	lr 0.04506
Warmup Train [9][460/3239]	Time 0.486 (0.538)	Data 0.001 (0.031)	Loss 5.5424 (5.5060)	Top-1 acc 8.203 (6.889)	Top-5 acc 19.531 (19.147)	lr 0.04506
Warmup Train [9][470/3239]	Time 0.632 (0.538)	Data 0.001 (0.030)	Loss 5.4779 (5.5056)	Top-1 acc 8.594 (6.894)	Top-5 acc 19.922 (19.151)	lr 0.04506
Warmup Train [9][480/3239]	Time 0.299 (0.537)	Data 0.001 (0.030)	Loss 5.4956 (5.5055)	Top-1 acc 6.250 (6.907)	Top-5 acc 19.922 (19.171)	lr 0.04505
Warmup Train [9][490/3239]	Time 0.537 (0.537)	Data 0.001 (0.030)	Loss 5.5922 (5.5059)	Top-1 acc 5.469 (6.907)	Top-5 acc 17.188 (19.160)	lr 0.04505
Warmup Train [9][500/3239]	Time 0.553 (0.537)	Data 0.001 (0.029)	Loss 5.5225 (5.5059)	Top-1 acc 7.031 (6.910)	Top-5 acc 18.750 (19.169)	lr 0.04505
Warmup Train [9][510/3239]	Time 0.714 (0.536)	Data 0.001 (0.029)	Loss 5.6025 (5.5058)	Top-1 acc 5.078 (6.905)	Top-5 acc 18.750 (19.194)	lr 0.04504
Warmup Train [9][520/3239]	Time 0.406 (0.535)	Data 0.001 (0.028)	Loss 5.5552 (5.5053)	Top-1 acc 5.469 (6.893)	Top-5 acc 18.750 (19.210)	lr 0.04504
Warmup Train [9][530/3239]	Time 0.302 (0.534)	Data 0.001 (0.028)	Loss 5.4704 (5.5053)	Top-1 acc 10.547 (6.891)	Top-5 acc 21.094 (19.216)	lr 0.04503
Warmup Train [9][540/3239]	Time 0.392 (0.533)	Data 0.001 (0.028)	Loss 5.4722 (5.5054)	Top-1 acc 6.250 (6.883)	Top-5 acc 18.359 (19.216)	lr 0.04503
Warmup Train [9][550/3239]	Time 0.441 (0.532)	Data 0.001 (0.027)	Loss 5.4743 (5.5052)	Top-1 acc 7.031 (6.884)	Top-5 acc 18.359 (19.207)	lr 0.04503
Warmup Train [9][560/3239]	Time 0.457 (0.530)	Data 0.001 (0.027)	Loss 5.5128 (5.5047)	Top-1 acc 8.594 (6.885)	Top-5 acc 19.922 (19.217)	lr 0.04502
Warmup Train [9][570/3239]	Time 0.452 (0.530)	Data 0.001 (0.027)	Loss 5.4609 (5.5042)	Top-1 acc 7.031 (6.879)	Top-5 acc 17.578 (19.211)	lr 0.04502
Warmup Train [9][580/3239]	Time 0.520 (0.530)	Data 0.001 (0.026)	Loss 5.4164 (5.5032)	Top-1 acc 6.641 (6.886)	Top-5 acc 20.312 (19.223)	lr 0.04502
Warmup Train [9][590/3239]	Time 0.598 (0.529)	Data 0.001 (0.026)	Loss 5.3736 (5.5022)	Top-1 acc 6.250 (6.899)	Top-5 acc 20.312 (19.242)	lr 0.04501
Warmup Train [9][600/3239]	Time 0.530 (0.529)	Data 0.001 (0.026)	Loss 5.5447 (5.5022)	Top-1 acc 6.641 (6.894)	Top-5 acc 16.406 (19.250)	lr 0.04501
Warmup Train [9][610/3239]	Time 0.513 (0.529)	Data 0.002 (0.025)	Loss 5.5077 (5.5020)	Top-1 acc 9.375 (6.896)	Top-5 acc 20.312 (19.260)	lr 0.04501
Warmup Train [9][620/3239]	Time 0.548 (0.529)	Data 0.001 (0.025)	Loss 5.4802 (5.5019)	Top-1 acc 7.422 (6.896)	Top-5 acc 21.484 (19.252)	lr 0.04500
Warmup Train [9][630/3239]	Time 0.337 (0.528)	Data 0.001 (0.025)	Loss 5.3795 (5.5018)	Top-1 acc 6.641 (6.899)	Top-5 acc 23.047 (19.256)	lr 0.04500
Warmup Train [9][640/3239]	Time 0.405 (0.528)	Data 0.001 (0.025)	Loss 5.4664 (5.5016)	Top-1 acc 6.641 (6.892)	Top-5 acc 21.094 (19.247)	lr 0.04500
Warmup Train [9][650/3239]	Time 0.425 (0.527)	Data 0.001 (0.024)	Loss 5.5139 (5.5014)	Top-1 acc 6.641 (6.897)	Top-5 acc 18.750 (19.252)	lr 0.04499
Warmup Train [9][660/3239]	Time 0.402 (0.527)	Data 0.001 (0.024)	Loss 5.4198 (5.5006)	Top-1 acc 7.422 (6.904)	Top-5 acc 21.875 (19.278)	lr 0.04499
Warmup Train [9][670/3239]	Time 0.530 (0.527)	Data 0.001 (0.024)	Loss 5.6523 (5.5007)	Top-1 acc 4.688 (6.903)	Top-5 acc 18.359 (19.270)	lr 0.04498
Warmup Train [9][680/3239]	Time 0.601 (0.527)	Data 0.001 (0.024)	Loss 5.5204 (5.5008)	Top-1 acc 7.031 (6.908)	Top-5 acc 16.406 (19.259)	lr 0.04498
Warmup Train [9][690/3239]	Time 0.507 (0.527)	Data 0.001 (0.023)	Loss 5.5683 (5.4999)	Top-1 acc 7.031 (6.916)	Top-5 acc 16.797 (19.275)	lr 0.04498
Warmup Train [9][700/3239]	Time 0.572 (0.527)	Data 0.001 (0.023)	Loss 5.4417 (5.4995)	Top-1 acc 6.250 (6.913)	Top-5 acc 22.656 (19.280)	lr 0.04497
Warmup Train [9][710/3239]	Time 0.423 (0.527)	Data 0.001 (0.023)	Loss 5.4517 (5.4994)	Top-1 acc 7.812 (6.927)	Top-5 acc 23.047 (19.298)	lr 0.04497
Warmup Train [9][720/3239]	Time 0.618 (0.527)	Data 0.001 (0.023)	Loss 5.3758 (5.4986)	Top-1 acc 7.031 (6.941)	Top-5 acc 20.703 (19.319)	lr 0.04497
Warmup Train [9][730/3239]	Time 0.611 (0.527)	Data 0.001 (0.022)	Loss 5.6314 (5.4982)	Top-1 acc 7.031 (6.941)	Top-5 acc 15.234 (19.328)	lr 0.04496
Warmup Train [9][740/3239]	Time 0.592 (0.526)	Data 0.002 (0.022)	Loss 5.5498 (5.4980)	Top-1 acc 7.812 (6.948)	Top-5 acc 16.016 (19.341)	lr 0.04496
Warmup Train [9][750/3239]	Time 0.408 (0.526)	Data 0.001 (0.022)	Loss 5.4001 (5.4978)	Top-1 acc 9.375 (6.950)	Top-5 acc 23.438 (19.338)	lr 0.04495
Warmup Train [9][760/3239]	Time 0.560 (0.526)	Data 0.001 (0.022)	Loss 5.5220 (5.4982)	Top-1 acc 3.125 (6.935)	Top-5 acc 14.844 (19.319)	lr 0.04495
Warmup Train [9][770/3239]	Time 0.551 (0.526)	Data 0.001 (0.022)	Loss 5.5364 (5.4984)	Top-1 acc 5.859 (6.939)	Top-5 acc 19.922 (19.316)	lr 0.04495
Warmup Train [9][780/3239]	Time 0.550 (0.525)	Data 0.001 (0.021)	Loss 5.5460 (5.4979)	Top-1 acc 7.422 (6.953)	Top-5 acc 19.141 (19.337)	lr 0.04494
Warmup Train [9][790/3239]	Time 0.592 (0.525)	Data 0.001 (0.021)	Loss 5.5522 (5.4976)	Top-1 acc 7.031 (6.957)	Top-5 acc 19.922 (19.346)	lr 0.04494
Warmup Train [9][800/3239]	Time 0.362 (0.524)	Data 0.001 (0.021)	Loss 5.5177 (5.4970)	Top-1 acc 7.031 (6.964)	Top-5 acc 16.016 (19.360)	lr 0.04494
Warmup Train [9][810/3239]	Time 0.466 (0.524)	Data 0.001 (0.021)	Loss 5.4821 (5.4972)	Top-1 acc 6.641 (6.963)	Top-5 acc 17.188 (19.357)	lr 0.04493
Warmup Train [9][820/3239]	Time 0.260 (0.523)	Data 0.001 (0.021)	Loss 5.3918 (5.4974)	Top-1 acc 10.156 (6.968)	Top-5 acc 22.266 (19.350)	lr 0.04493
Warmup Train [9][830/3239]	Time 0.717 (0.523)	Data 0.001 (0.021)	Loss 5.4765 (5.4974)	Top-1 acc 8.203 (6.980)	Top-5 acc 21.875 (19.362)	lr 0.04493
Warmup Train [9][840/3239]	Time 0.512 (0.523)	Data 0.001 (0.020)	Loss 5.4028 (5.4973)	Top-1 acc 5.078 (6.983)	Top-5 acc 19.531 (19.368)	lr 0.04492
Warmup Train [9][850/3239]	Time 0.582 (0.523)	Data 0.001 (0.020)	Loss 5.5080 (5.4973)	Top-1 acc 5.859 (6.982)	Top-5 acc 18.750 (19.370)	lr 0.04492
Warmup Train [9][860/3239]	Time 0.706 (0.523)	Data 0.001 (0.020)	Loss 5.4915 (5.4976)	Top-1 acc 7.812 (6.975)	Top-5 acc 22.656 (19.370)	lr 0.04491
Warmup Train [9][870/3239]	Time 0.585 (0.523)	Data 0.001 (0.020)	Loss 5.4532 (5.4974)	Top-1 acc 7.422 (6.975)	Top-5 acc 22.266 (19.373)	lr 0.04491
Warmup Train [9][880/3239]	Time 0.417 (0.523)	Data 0.001 (0.020)	Loss 5.5778 (5.4971)	Top-1 acc 5.078 (6.978)	Top-5 acc 15.234 (19.379)	lr 0.04491
Warmup Train [9][890/3239]	Time 0.443 (0.523)	Data 0.001 (0.020)	Loss 5.4029 (5.4974)	Top-1 acc 7.422 (6.982)	Top-5 acc 22.266 (19.369)	lr 0.04490
Warmup Train [9][900/3239]	Time 0.608 (0.523)	Data 0.001 (0.020)	Loss 5.5033 (5.4975)	Top-1 acc 8.203 (6.974)	Top-5 acc 19.531 (19.364)	lr 0.04490
Warmup Train [9][910/3239]	Time 0.540 (0.523)	Data 0.001 (0.020)	Loss 5.6068 (5.4976)	Top-1 acc 6.250 (6.985)	Top-5 acc 18.359 (19.381)	lr 0.04490
Warmup Train [9][920/3239]	Time 0.547 (0.523)	Data 0.001 (0.020)	Loss 5.5597 (5.4973)	Top-1 acc 7.031 (6.981)	Top-5 acc 17.188 (19.383)	lr 0.04489
Warmup Train [9][930/3239]	Time 0.513 (0.523)	Data 0.001 (0.019)	Loss 5.4895 (5.4974)	Top-1 acc 9.375 (6.980)	Top-5 acc 22.656 (19.384)	lr 0.04489
Warmup Train [9][940/3239]	Time 0.673 (0.523)	Data 0.001 (0.019)	Loss 5.5093 (5.4969)	Top-1 acc 6.641 (6.984)	Top-5 acc 21.875 (19.385)	lr 0.04489
Warmup Train [9][950/3239]	Time 0.585 (0.523)	Data 0.001 (0.019)	Loss 5.5413 (5.4970)	Top-1 acc 5.859 (6.979)	Top-5 acc 19.922 (19.387)	lr 0.04488
Warmup Train [9][960/3239]	Time 0.561 (0.523)	Data 0.001 (0.019)	Loss 5.4140 (5.4968)	Top-1 acc 7.812 (6.987)	Top-5 acc 21.875 (19.393)	lr 0.04488
Warmup Train [9][970/3239]	Time 0.537 (0.523)	Data 0.001 (0.019)	Loss 5.4407 (5.4963)	Top-1 acc 7.031 (6.987)	Top-5 acc 22.656 (19.401)	lr 0.04487
Warmup Train [9][980/3239]	Time 0.520 (0.523)	Data 0.001 (0.019)	Loss 5.5100 (5.4962)	Top-1 acc 7.422 (6.991)	Top-5 acc 18.750 (19.404)	lr 0.04487
Warmup Train [9][990/3239]	Time 0.585 (0.522)	Data 0.001 (0.019)	Loss 5.4758 (5.4959)	Top-1 acc 7.422 (6.995)	Top-5 acc 21.094 (19.416)	lr 0.04487
Warmup Train [9][1000/3239]	Time 0.400 (0.522)	Data 0.001 (0.018)	Loss 5.4770 (5.4956)	Top-1 acc 7.031 (6.992)	Top-5 acc 17.188 (19.425)	lr 0.04486
Warmup Train [9][1010/3239]	Time 0.354 (0.522)	Data 0.001 (0.018)	Loss 5.4634 (5.4954)	Top-1 acc 10.156 (7.003)	Top-5 acc 20.312 (19.426)	lr 0.04486
Warmup Train [9][1020/3239]	Time 0.485 (0.522)	Data 0.001 (0.018)	Loss 5.3492 (5.4956)	Top-1 acc 6.641 (6.996)	Top-5 acc 21.484 (19.432)	lr 0.04486
Warmup Train [9][1030/3239]	Time 0.300 (0.522)	Data 0.001 (0.018)	Loss 5.3677 (5.4954)	Top-1 acc 8.984 (7.002)	Top-5 acc 23.047 (19.433)	lr 0.04485
Warmup Train [9][1040/3239]	Time 0.611 (0.522)	Data 0.001 (0.018)	Loss 5.5643 (5.4948)	Top-1 acc 6.641 (7.009)	Top-5 acc 17.969 (19.437)	lr 0.04485
Warmup Train [9][1050/3239]	Time 0.597 (0.521)	Data 0.001 (0.018)	Loss 5.4085 (5.4944)	Top-1 acc 10.938 (7.023)	Top-5 acc 24.609 (19.450)	lr 0.04484
Warmup Train [9][1060/3239]	Time 0.733 (0.521)	Data 0.001 (0.018)	Loss 5.5132 (5.4942)	Top-1 acc 5.859 (7.019)	Top-5 acc 21.484 (19.450)	lr 0.04484
Warmup Train [9][1070/3239]	Time 0.564 (0.521)	Data 0.001 (0.018)	Loss 5.6016 (5.4943)	Top-1 acc 6.250 (7.019)	Top-5 acc 16.016 (19.443)	lr 0.04484
Warmup Train [9][1080/3239]	Time 0.430 (0.521)	Data 0.001 (0.018)	Loss 5.4492 (5.4941)	Top-1 acc 5.469 (7.014)	Top-5 acc 15.625 (19.448)	lr 0.04483
Warmup Train [9][1090/3239]	Time 0.490 (0.520)	Data 0.001 (0.018)	Loss 5.4323 (5.4939)	Top-1 acc 8.203 (7.008)	Top-5 acc 24.219 (19.446)	lr 0.04483
Warmup Train [9][1100/3239]	Time 0.587 (0.519)	Data 0.001 (0.018)	Loss 5.4861 (5.4935)	Top-1 acc 7.422 (7.011)	Top-5 acc 17.578 (19.454)	lr 0.04483
Warmup Train [9][1110/3239]	Time 0.524 (0.520)	Data 0.001 (0.017)	Loss 5.2947 (5.4933)	Top-1 acc 10.156 (7.021)	Top-5 acc 25.391 (19.461)	lr 0.04482
Warmup Train [9][1120/3239]	Time 0.597 (0.520)	Data 0.001 (0.017)	Loss 5.4258 (5.4930)	Top-1 acc 8.203 (7.029)	Top-5 acc 22.656 (19.471)	lr 0.04482
Warmup Train [9][1130/3239]	Time 0.413 (0.520)	Data 0.001 (0.017)	Loss 5.5075 (5.4928)	Top-1 acc 8.203 (7.027)	Top-5 acc 21.875 (19.478)	lr 0.04482
Warmup Train [9][1140/3239]	Time 0.554 (0.520)	Data 0.001 (0.017)	Loss 5.3960 (5.4926)	Top-1 acc 7.812 (7.031)	Top-5 acc 21.484 (19.482)	lr 0.04481
Warmup Train [9][1150/3239]	Time 0.340 (0.519)	Data 0.001 (0.017)	Loss 5.5586 (5.4926)	Top-1 acc 5.469 (7.025)	Top-5 acc 17.969 (19.484)	lr 0.04481
Warmup Train [9][1160/3239]	Time 0.570 (0.519)	Data 0.001 (0.017)	Loss 5.3456 (5.4926)	Top-1 acc 7.422 (7.018)	Top-5 acc 22.656 (19.481)	lr 0.04480
Warmup Train [9][1170/3239]	Time 0.375 (0.519)	Data 0.001 (0.017)	Loss 5.5169 (5.4924)	Top-1 acc 7.031 (7.027)	Top-5 acc 18.359 (19.487)	lr 0.04480
Warmup Train [9][1180/3239]	Time 0.566 (0.519)	Data 0.001 (0.017)	Loss 5.2968 (5.4921)	Top-1 acc 8.203 (7.025)	Top-5 acc 24.609 (19.493)	lr 0.04480
Warmup Train [9][1190/3239]	Time 0.431 (0.519)	Data 0.001 (0.017)	Loss 5.5224 (5.4921)	Top-1 acc 8.203 (7.030)	Top-5 acc 19.531 (19.500)	lr 0.04479
Warmup Train [9][1200/3239]	Time 0.536 (0.519)	Data 0.001 (0.017)	Loss 5.4293 (5.4918)	Top-1 acc 5.859 (7.032)	Top-5 acc 20.312 (19.504)	lr 0.04479
Warmup Train [9][1210/3239]	Time 0.632 (0.519)	Data 0.001 (0.017)	Loss 5.5946 (5.4924)	Top-1 acc 5.469 (7.024)	Top-5 acc 19.141 (19.495)	lr 0.04479
Warmup Train [9][1220/3239]	Time 0.712 (0.519)	Data 0.001 (0.016)	Loss 5.3954 (5.4921)	Top-1 acc 7.422 (7.024)	Top-5 acc 20.312 (19.490)	lr 0.04478
Warmup Train [9][1230/3239]	Time 0.426 (0.519)	Data 0.001 (0.016)	Loss 5.5187 (5.4919)	Top-1 acc 6.250 (7.020)	Top-5 acc 19.141 (19.491)	lr 0.04478
Warmup Train [9][1240/3239]	Time 0.593 (0.519)	Data 0.001 (0.016)	Loss 5.6591 (5.4922)	Top-1 acc 3.125 (7.022)	Top-5 acc 16.016 (19.491)	lr 0.04477
Warmup Train [9][1250/3239]	Time 0.638 (0.519)	Data 0.001 (0.016)	Loss 5.4538 (5.4922)	Top-1 acc 6.641 (7.027)	Top-5 acc 19.141 (19.496)	lr 0.04477
Warmup Train [9][1260/3239]	Time 0.761 (0.519)	Data 0.001 (0.016)	Loss 5.6230 (5.4920)	Top-1 acc 5.078 (7.031)	Top-5 acc 19.922 (19.500)	lr 0.04477
Warmup Train [9][1270/3239]	Time 0.582 (0.519)	Data 0.001 (0.016)	Loss 5.3598 (5.4916)	Top-1 acc 9.375 (7.043)	Top-5 acc 25.000 (19.510)	lr 0.04476
Warmup Train [9][1280/3239]	Time 0.479 (0.519)	Data 0.001 (0.016)	Loss 5.5061 (5.4915)	Top-1 acc 5.469 (7.042)	Top-5 acc 19.141 (19.509)	lr 0.04476
Warmup Train [9][1290/3239]	Time 0.519 (0.519)	Data 0.001 (0.016)	Loss 5.4137 (5.4914)	Top-1 acc 7.812 (7.039)	Top-5 acc 23.438 (19.509)	lr 0.04476
Warmup Train [9][1300/3239]	Time 0.550 (0.519)	Data 0.001 (0.016)	Loss 5.3780 (5.4914)	Top-1 acc 7.422 (7.039)	Top-5 acc 21.094 (19.503)	lr 0.04475
Warmup Train [9][1310/3239]	Time 0.317 (0.519)	Data 0.001 (0.016)	Loss 5.4856 (5.4913)	Top-1 acc 6.250 (7.040)	Top-5 acc 20.312 (19.502)	lr 0.04475
Warmup Train [9][1320/3239]	Time 0.469 (0.519)	Data 0.001 (0.016)	Loss 5.4672 (5.4911)	Top-1 acc 5.469 (7.045)	Top-5 acc 18.359 (19.508)	lr 0.04474
Warmup Train [9][1330/3239]	Time 0.599 (0.519)	Data 0.001 (0.016)	Loss 5.4854 (5.4915)	Top-1 acc 5.469 (7.040)	Top-5 acc 19.141 (19.504)	lr 0.04474
Warmup Train [9][1340/3239]	Time 0.534 (0.518)	Data 0.001 (0.015)	Loss 5.3711 (5.4911)	Top-1 acc 10.547 (7.045)	Top-5 acc 23.047 (19.516)	lr 0.04474
Warmup Train [9][1350/3239]	Time 0.536 (0.518)	Data 0.001 (0.015)	Loss 5.5065 (5.4908)	Top-1 acc 6.641 (7.052)	Top-5 acc 19.141 (19.530)	lr 0.04473
Warmup Train [9][1360/3239]	Time 0.582 (0.518)	Data 0.001 (0.015)	Loss 5.4825 (5.4914)	Top-1 acc 6.641 (7.047)	Top-5 acc 20.703 (19.522)	lr 0.04473
Warmup Train [9][1370/3239]	Time 0.578 (0.518)	Data 0.002 (0.015)	Loss 5.5285 (5.4913)	Top-1 acc 5.469 (7.044)	Top-5 acc 17.969 (19.525)	lr 0.04473
Warmup Train [9][1380/3239]	Time 0.690 (0.518)	Data 0.001 (0.015)	Loss 5.5159 (5.4911)	Top-1 acc 6.641 (7.049)	Top-5 acc 18.359 (19.536)	lr 0.04472
Warmup Train [9][1390/3239]	Time 0.508 (0.518)	Data 0.001 (0.015)	Loss 5.5530 (5.4908)	Top-1 acc 6.641 (7.055)	Top-5 acc 22.656 (19.545)	lr 0.04472
Warmup Train [9][1400/3239]	Time 0.558 (0.518)	Data 0.001 (0.015)	Loss 5.5248 (5.4911)	Top-1 acc 5.078 (7.053)	Top-5 acc 19.141 (19.540)	lr 0.04472
Warmup Train [9][1410/3239]	Time 0.549 (0.517)	Data 0.001 (0.015)	Loss 5.6134 (5.4907)	Top-1 acc 5.859 (7.057)	Top-5 acc 16.406 (19.552)	lr 0.04471
Warmup Train [9][1420/3239]	Time 0.643 (0.517)	Data 0.001 (0.015)	Loss 5.6423 (5.4907)	Top-1 acc 3.906 (7.054)	Top-5 acc 15.625 (19.551)	lr 0.04471
Warmup Train [9][1430/3239]	Time 0.426 (0.517)	Data 0.001 (0.015)	Loss 5.3793 (5.4904)	Top-1 acc 8.594 (7.058)	Top-5 acc 23.047 (19.552)	lr 0.04470
Warmup Train [9][1440/3239]	Time 0.350 (0.517)	Data 0.001 (0.015)	Loss 5.5795 (5.4904)	Top-1 acc 5.469 (7.057)	Top-5 acc 18.359 (19.551)	lr 0.04470
Warmup Train [9][1450/3239]	Time 0.388 (0.517)	Data 0.001 (0.015)	Loss 5.6084 (5.4905)	Top-1 acc 5.469 (7.061)	Top-5 acc 15.625 (19.553)	lr 0.04470
Warmup Train [9][1460/3239]	Time 0.364 (0.517)	Data 0.001 (0.015)	Loss 5.4652 (5.4904)	Top-1 acc 8.594 (7.063)	Top-5 acc 21.875 (19.559)	lr 0.04469
Warmup Train [9][1470/3239]	Time 0.487 (0.517)	Data 0.001 (0.015)	Loss 5.4265 (5.4905)	Top-1 acc 8.984 (7.063)	Top-5 acc 21.094 (19.557)	lr 0.04469
Warmup Train [9][1480/3239]	Time 0.442 (0.517)	Data 0.001 (0.015)	Loss 5.4053 (5.4901)	Top-1 acc 6.250 (7.065)	Top-5 acc 22.266 (19.564)	lr 0.04469
Warmup Train [9][1490/3239]	Time 0.782 (0.517)	Data 0.001 (0.015)	Loss 5.4283 (5.4899)	Top-1 acc 6.250 (7.067)	Top-5 acc 20.703 (19.565)	lr 0.04468
Warmup Train [9][1500/3239]	Time 0.490 (0.517)	Data 0.001 (0.015)	Loss 5.4598 (5.4897)	Top-1 acc 7.422 (7.070)	Top-5 acc 19.141 (19.566)	lr 0.04468
Warmup Train [9][1510/3239]	Time 0.444 (0.517)	Data 0.001 (0.014)	Loss 5.5170 (5.4896)	Top-1 acc 6.250 (7.072)	Top-5 acc 19.531 (19.574)	lr 0.04467
Warmup Train [9][1520/3239]	Time 0.437 (0.517)	Data 0.001 (0.014)	Loss 5.3524 (5.4894)	Top-1 acc 10.156 (7.075)	Top-5 acc 21.484 (19.578)	lr 0.04467
Warmup Train [9][1530/3239]	Time 0.684 (0.517)	Data 0.001 (0.014)	Loss 5.3732 (5.4893)	Top-1 acc 10.547 (7.083)	Top-5 acc 24.609 (19.591)	lr 0.04467
Warmup Train [9][1540/3239]	Time 0.519 (0.517)	Data 0.001 (0.014)	Loss 5.4900 (5.4891)	Top-1 acc 9.375 (7.089)	Top-5 acc 19.141 (19.596)	lr 0.04466
Warmup Train [9][1550/3239]	Time 0.380 (0.517)	Data 0.001 (0.014)	Loss 5.3961 (5.4888)	Top-1 acc 8.203 (7.099)	Top-5 acc 21.875 (19.602)	lr 0.04466
Warmup Train [9][1560/3239]	Time 0.559 (0.517)	Data 0.001 (0.014)	Loss 5.5540 (5.4888)	Top-1 acc 7.031 (7.098)	Top-5 acc 16.406 (19.598)	lr 0.04466
Warmup Train [9][1570/3239]	Time 0.416 (0.517)	Data 0.001 (0.014)	Loss 5.6089 (5.4887)	Top-1 acc 4.688 (7.098)	Top-5 acc 18.359 (19.601)	lr 0.04465
Warmup Train [9][1580/3239]	Time 0.393 (0.516)	Data 0.001 (0.014)	Loss 5.4435 (5.4883)	Top-1 acc 7.812 (7.101)	Top-5 acc 18.750 (19.603)	lr 0.04465
Warmup Train [9][1590/3239]	Time 0.529 (0.516)	Data 0.001 (0.014)	Loss 5.3562 (5.4882)	Top-1 acc 6.250 (7.103)	Top-5 acc 21.875 (19.604)	lr 0.04464
Warmup Train [9][1600/3239]	Time 0.213 (0.516)	Data 0.001 (0.014)	Loss 5.3028 (5.4879)	Top-1 acc 8.203 (7.112)	Top-5 acc 20.703 (19.612)	lr 0.04464
Warmup Train [9][1610/3239]	Time 0.603 (0.516)	Data 0.001 (0.014)	Loss 5.3022 (5.4875)	Top-1 acc 7.031 (7.110)	Top-5 acc 26.562 (19.624)	lr 0.04464
Warmup Train [9][1620/3239]	Time 0.371 (0.516)	Data 0.001 (0.014)	Loss 5.4831 (5.4872)	Top-1 acc 5.859 (7.106)	Top-5 acc 19.922 (19.627)	lr 0.04463
Warmup Train [9][1630/3239]	Time 0.592 (0.516)	Data 0.001 (0.014)	Loss 5.3688 (5.4869)	Top-1 acc 7.812 (7.108)	Top-5 acc 19.922 (19.627)	lr 0.04463
Warmup Train [9][1640/3239]	Time 0.504 (0.516)	Data 0.001 (0.014)	Loss 5.6606 (5.4869)	Top-1 acc 1.953 (7.103)	Top-5 acc 17.969 (19.630)	lr 0.04463
Warmup Train [9][1650/3239]	Time 0.349 (0.515)	Data 0.001 (0.014)	Loss 5.5253 (5.4868)	Top-1 acc 7.031 (7.105)	Top-5 acc 19.922 (19.633)	lr 0.04462
Warmup Train [9][1660/3239]	Time 0.506 (0.515)	Data 0.001 (0.014)	Loss 5.3950 (5.4868)	Top-1 acc 7.031 (7.105)	Top-5 acc 22.266 (19.637)	lr 0.04462
Warmup Train [9][1670/3239]	Time 0.470 (0.516)	Data 0.001 (0.014)	Loss 5.4994 (5.4867)	Top-1 acc 6.641 (7.104)	Top-5 acc 21.875 (19.639)	lr 0.04461
Warmup Train [9][1680/3239]	Time 0.730 (0.516)	Data 0.001 (0.014)	Loss 5.4955 (5.4865)	Top-1 acc 7.031 (7.107)	Top-5 acc 16.797 (19.641)	lr 0.04461
Warmup Train [9][1690/3239]	Time 0.622 (0.516)	Data 0.001 (0.014)	Loss 5.5607 (5.4866)	Top-1 acc 8.203 (7.109)	Top-5 acc 17.578 (19.635)	lr 0.04461
Warmup Train [9][1700/3239]	Time 0.365 (0.515)	Data 0.001 (0.014)	Loss 5.3279 (5.4863)	Top-1 acc 10.156 (7.112)	Top-5 acc 22.266 (19.638)	lr 0.04460
Warmup Train [9][1710/3239]	Time 0.496 (0.515)	Data 0.001 (0.014)	Loss 5.3168 (5.4862)	Top-1 acc 8.594 (7.110)	Top-5 acc 22.266 (19.641)	lr 0.04460
Warmup Train [9][1720/3239]	Time 0.592 (0.515)	Data 0.001 (0.014)	Loss 5.3584 (5.4857)	Top-1 acc 7.422 (7.116)	Top-5 acc 21.484 (19.652)	lr 0.04460
Warmup Train [9][1730/3239]	Time 0.651 (0.515)	Data 0.001 (0.014)	Loss 5.3749 (5.4856)	Top-1 acc 8.594 (7.121)	Top-5 acc 22.266 (19.659)	lr 0.04459
Warmup Train [9][1740/3239]	Time 0.609 (0.515)	Data 0.001 (0.014)	Loss 5.4469 (5.4853)	Top-1 acc 7.031 (7.123)	Top-5 acc 18.359 (19.664)	lr 0.04459
Warmup Train [9][1750/3239]	Time 0.522 (0.515)	Data 0.001 (0.014)	Loss 5.3100 (5.4848)	Top-1 acc 9.375 (7.126)	Top-5 acc 23.047 (19.670)	lr 0.04458
Warmup Train [9][1760/3239]	Time 0.517 (0.515)	Data 0.001 (0.014)	Loss 5.3958 (5.4847)	Top-1 acc 6.641 (7.126)	Top-5 acc 23.047 (19.669)	lr 0.04458
Warmup Train [9][1770/3239]	Time 0.487 (0.515)	Data 0.001 (0.013)	Loss 5.3701 (5.4844)	Top-1 acc 8.203 (7.127)	Top-5 acc 23.047 (19.675)	lr 0.04458
Warmup Train [9][1780/3239]	Time 0.627 (0.515)	Data 0.001 (0.013)	Loss 5.3974 (5.4841)	Top-1 acc 10.547 (7.130)	Top-5 acc 23.438 (19.682)	lr 0.04457
Warmup Train [9][1790/3239]	Time 0.476 (0.515)	Data 0.001 (0.013)	Loss 5.5903 (5.4840)	Top-1 acc 3.906 (7.128)	Top-5 acc 17.969 (19.686)	lr 0.04457
Warmup Train [9][1800/3239]	Time 0.418 (0.515)	Data 0.001 (0.013)	Loss 5.3022 (5.4836)	Top-1 acc 12.109 (7.133)	Top-5 acc 27.734 (19.699)	lr 0.04457
Warmup Train [9][1810/3239]	Time 0.426 (0.515)	Data 0.001 (0.013)	Loss 5.4776 (5.4834)	Top-1 acc 8.203 (7.141)	Top-5 acc 20.312 (19.705)	lr 0.04456
Warmup Train [9][1820/3239]	Time 0.469 (0.515)	Data 0.001 (0.013)	Loss 5.4880 (5.4831)	Top-1 acc 9.766 (7.145)	Top-5 acc 19.922 (19.710)	lr 0.04456
Warmup Train [9][1830/3239]	Time 0.445 (0.515)	Data 0.001 (0.013)	Loss 5.4195 (5.4827)	Top-1 acc 8.594 (7.151)	Top-5 acc 21.875 (19.719)	lr 0.04455
Warmup Train [9][1840/3239]	Time 0.611 (0.515)	Data 0.001 (0.013)	Loss 5.5477 (5.4825)	Top-1 acc 4.688 (7.153)	Top-5 acc 18.359 (19.722)	lr 0.04455
Warmup Train [9][1850/3239]	Time 0.411 (0.515)	Data 0.003 (0.013)	Loss 5.5756 (5.4826)	Top-1 acc 5.469 (7.153)	Top-5 acc 17.969 (19.723)	lr 0.04455
Warmup Train [9][1860/3239]	Time 0.617 (0.515)	Data 0.001 (0.013)	Loss 5.4318 (5.4822)	Top-1 acc 8.203 (7.161)	Top-5 acc 19.531 (19.732)	lr 0.04454
Warmup Train [9][1870/3239]	Time 0.411 (0.515)	Data 0.001 (0.013)	Loss 5.2383 (5.4819)	Top-1 acc 9.375 (7.165)	Top-5 acc 21.484 (19.736)	lr 0.04454
Warmup Train [9][1880/3239]	Time 0.578 (0.515)	Data 0.001 (0.013)	Loss 5.4364 (5.4816)	Top-1 acc 5.859 (7.171)	Top-5 acc 19.531 (19.745)	lr 0.04453
Warmup Train [9][1890/3239]	Time 0.428 (0.515)	Data 0.001 (0.013)	Loss 5.2900 (5.4812)	Top-1 acc 9.766 (7.176)	Top-5 acc 22.266 (19.757)	lr 0.04453
Warmup Train [9][1900/3239]	Time 0.421 (0.515)	Data 0.001 (0.013)	Loss 5.5345 (5.4813)	Top-1 acc 7.422 (7.172)	Top-5 acc 18.359 (19.755)	lr 0.04453
Warmup Train [9][1910/3239]	Time 0.628 (0.515)	Data 0.001 (0.013)	Loss 5.4805 (5.4812)	Top-1 acc 4.688 (7.169)	Top-5 acc 18.750 (19.759)	lr 0.04452
Warmup Train [9][1920/3239]	Time 0.453 (0.515)	Data 0.001 (0.013)	Loss 5.5883 (5.4811)	Top-1 acc 5.469 (7.169)	Top-5 acc 19.922 (19.762)	lr 0.04452
Warmup Train [9][1930/3239]	Time 0.481 (0.515)	Data 0.001 (0.013)	Loss 5.3273 (5.4809)	Top-1 acc 8.203 (7.169)	Top-5 acc 21.484 (19.766)	lr 0.04452
Warmup Train [9][1940/3239]	Time 0.516 (0.515)	Data 0.001 (0.013)	Loss 5.3926 (5.4807)	Top-1 acc 5.078 (7.171)	Top-5 acc 17.578 (19.766)	lr 0.04451
Warmup Train [9][1950/3239]	Time 0.443 (0.515)	Data 0.001 (0.013)	Loss 5.3529 (5.4806)	Top-1 acc 5.469 (7.168)	Top-5 acc 20.312 (19.768)	lr 0.04451
Warmup Train [9][1960/3239]	Time 0.451 (0.515)	Data 0.002 (0.013)	Loss 5.4892 (5.4806)	Top-1 acc 7.031 (7.171)	Top-5 acc 18.359 (19.770)	lr 0.04450
Warmup Train [9][1970/3239]	Time 0.598 (0.515)	Data 0.001 (0.013)	Loss 5.3785 (5.4802)	Top-1 acc 6.250 (7.174)	Top-5 acc 20.703 (19.777)	lr 0.04450
Warmup Train [9][1980/3239]	Time 0.613 (0.515)	Data 0.001 (0.013)	Loss 5.5118 (5.4801)	Top-1 acc 7.422 (7.177)	Top-5 acc 21.484 (19.780)	lr 0.04450
Warmup Train [9][1990/3239]	Time 0.504 (0.515)	Data 0.001 (0.013)	Loss 5.4031 (5.4798)	Top-1 acc 4.688 (7.181)	Top-5 acc 16.797 (19.786)	lr 0.04449
Warmup Train [9][2000/3239]	Time 0.683 (0.515)	Data 0.002 (0.013)	Loss 5.5821 (5.4798)	Top-1 acc 4.688 (7.177)	Top-5 acc 14.844 (19.788)	lr 0.04449
Warmup Train [9][2010/3239]	Time 0.605 (0.515)	Data 0.001 (0.013)	Loss 5.5264 (5.4795)	Top-1 acc 7.422 (7.181)	Top-5 acc 19.531 (19.798)	lr 0.04449
Warmup Train [9][2020/3239]	Time 0.500 (0.515)	Data 0.001 (0.013)	Loss 5.5234 (5.4796)	Top-1 acc 8.203 (7.182)	Top-5 acc 18.359 (19.794)	lr 0.04448
Warmup Train [9][2030/3239]	Time 0.602 (0.515)	Data 0.002 (0.013)	Loss 5.5859 (5.4794)	Top-1 acc 7.031 (7.185)	Top-5 acc 16.797 (19.793)	lr 0.04448
Warmup Train [9][2040/3239]	Time 0.470 (0.515)	Data 0.001 (0.013)	Loss 5.2352 (5.4793)	Top-1 acc 10.547 (7.184)	Top-5 acc 22.266 (19.797)	lr 0.04447
Warmup Train [9][2050/3239]	Time 0.477 (0.515)	Data 0.001 (0.013)	Loss 5.4634 (5.4790)	Top-1 acc 7.812 (7.183)	Top-5 acc 20.312 (19.792)	lr 0.04447
Warmup Train [9][2060/3239]	Time 0.527 (0.515)	Data 0.001 (0.013)	Loss 5.5020 (5.4788)	Top-1 acc 8.984 (7.185)	Top-5 acc 22.656 (19.796)	lr 0.04447
Warmup Train [9][2070/3239]	Time 0.378 (0.515)	Data 0.001 (0.013)	Loss 5.5289 (5.4786)	Top-1 acc 7.422 (7.188)	Top-5 acc 18.359 (19.802)	lr 0.04446
Warmup Train [9][2080/3239]	Time 0.520 (0.515)	Data 0.001 (0.013)	Loss 5.4697 (5.4785)	Top-1 acc 6.250 (7.189)	Top-5 acc 18.750 (19.808)	lr 0.04446
Warmup Train [9][2090/3239]	Time 0.527 (0.515)	Data 0.001 (0.013)	Loss 5.3422 (5.4785)	Top-1 acc 6.641 (7.188)	Top-5 acc 24.609 (19.812)	lr 0.04446
Warmup Train [9][2100/3239]	Time 0.505 (0.515)	Data 0.001 (0.013)	Loss 5.4561 (5.4782)	Top-1 acc 7.812 (7.189)	Top-5 acc 19.531 (19.813)	lr 0.04445
Warmup Train [9][2110/3239]	Time 0.537 (0.515)	Data 0.001 (0.012)	Loss 5.5740 (5.4780)	Top-1 acc 6.250 (7.191)	Top-5 acc 16.797 (19.816)	lr 0.04445
Warmup Train [9][2120/3239]	Time 0.620 (0.514)	Data 0.001 (0.012)	Loss 5.3071 (5.4779)	Top-1 acc 8.594 (7.191)	Top-5 acc 22.266 (19.815)	lr 0.04444
Warmup Train [9][2130/3239]	Time 0.553 (0.515)	Data 0.001 (0.012)	Loss 5.3584 (5.4779)	Top-1 acc 8.203 (7.191)	Top-5 acc 21.875 (19.818)	lr 0.04444
Warmup Train [9][2140/3239]	Time 0.617 (0.514)	Data 0.001 (0.012)	Loss 5.2817 (5.4777)	Top-1 acc 9.766 (7.195)	Top-5 acc 22.266 (19.821)	lr 0.04444
Warmup Train [9][2150/3239]	Time 0.472 (0.514)	Data 0.001 (0.012)	Loss 5.4915 (5.4774)	Top-1 acc 8.984 (7.199)	Top-5 acc 21.875 (19.831)	lr 0.04443
Warmup Train [9][2160/3239]	Time 0.663 (0.514)	Data 0.001 (0.012)	Loss 5.5288 (5.4770)	Top-1 acc 5.078 (7.202)	Top-5 acc 17.578 (19.837)	lr 0.04443
Warmup Train [9][2170/3239]	Time 0.526 (0.514)	Data 0.001 (0.012)	Loss 5.3807 (5.4768)	Top-1 acc 6.641 (7.202)	Top-5 acc 20.312 (19.837)	lr 0.04442
Warmup Train [9][2180/3239]	Time 0.543 (0.514)	Data 0.001 (0.012)	Loss 5.5084 (5.4765)	Top-1 acc 8.203 (7.205)	Top-5 acc 17.969 (19.844)	lr 0.04442
Warmup Train [9][2190/3239]	Time 0.533 (0.514)	Data 0.001 (0.012)	Loss 5.4189 (5.4764)	Top-1 acc 6.250 (7.207)	Top-5 acc 19.141 (19.848)	lr 0.04442
Warmup Train [9][2200/3239]	Time 0.538 (0.514)	Data 0.001 (0.012)	Loss 5.2928 (5.4760)	Top-1 acc 10.547 (7.215)	Top-5 acc 26.172 (19.858)	lr 0.04441
Warmup Train [9][2210/3239]	Time 0.518 (0.514)	Data 0.001 (0.012)	Loss 5.2843 (5.4757)	Top-1 acc 8.594 (7.216)	Top-5 acc 24.219 (19.865)	lr 0.04441
Warmup Train [9][2220/3239]	Time 0.414 (0.514)	Data 0.002 (0.012)	Loss 5.5370 (5.4755)	Top-1 acc 5.469 (7.212)	Top-5 acc 16.406 (19.865)	lr 0.04441
Warmup Train [9][2230/3239]	Time 0.648 (0.514)	Data 0.001 (0.012)	Loss 5.4669 (5.4756)	Top-1 acc 5.859 (7.212)	Top-5 acc 19.922 (19.863)	lr 0.04440
Warmup Train [9][2240/3239]	Time 0.487 (0.514)	Data 0.001 (0.012)	Loss 5.4049 (5.4756)	Top-1 acc 7.422 (7.210)	Top-5 acc 20.312 (19.865)	lr 0.04440
Warmup Train [9][2250/3239]	Time 0.563 (0.514)	Data 0.001 (0.012)	Loss 5.6495 (5.4756)	Top-1 acc 3.125 (7.208)	Top-5 acc 14.062 (19.870)	lr 0.04439
Warmup Train [9][2260/3239]	Time 0.631 (0.514)	Data 0.001 (0.012)	Loss 5.4238 (5.4753)	Top-1 acc 5.859 (7.210)	Top-5 acc 21.484 (19.877)	lr 0.04439
Warmup Train [9][2270/3239]	Time 0.503 (0.514)	Data 0.001 (0.012)	Loss 5.4877 (5.4753)	Top-1 acc 6.641 (7.208)	Top-5 acc 17.188 (19.873)	lr 0.04439
Warmup Train [9][2280/3239]	Time 0.356 (0.514)	Data 0.001 (0.012)	Loss 5.5889 (5.4752)	Top-1 acc 7.422 (7.209)	Top-5 acc 18.359 (19.876)	lr 0.04438
Warmup Train [9][2290/3239]	Time 0.512 (0.514)	Data 0.001 (0.012)	Loss 5.4095 (5.4749)	Top-1 acc 8.984 (7.210)	Top-5 acc 21.875 (19.885)	lr 0.04438
Warmup Train [9][2300/3239]	Time 0.409 (0.514)	Data 0.002 (0.012)	Loss 5.3941 (5.4748)	Top-1 acc 8.984 (7.210)	Top-5 acc 23.047 (19.891)	lr 0.04438
Warmup Train [9][2310/3239]	Time 0.473 (0.514)	Data 0.001 (0.012)	Loss 5.3576 (5.4746)	Top-1 acc 8.594 (7.211)	Top-5 acc 21.875 (19.892)	lr 0.04437
Warmup Train [9][2320/3239]	Time 0.589 (0.514)	Data 0.001 (0.012)	Loss 5.4231 (5.4745)	Top-1 acc 7.812 (7.214)	Top-5 acc 19.531 (19.896)	lr 0.04437
Warmup Train [9][2330/3239]	Time 0.432 (0.514)	Data 0.001 (0.012)	Loss 5.3200 (5.4742)	Top-1 acc 9.375 (7.216)	Top-5 acc 24.219 (19.902)	lr 0.04436
Warmup Train [9][2340/3239]	Time 0.411 (0.514)	Data 0.001 (0.012)	Loss 5.3783 (5.4740)	Top-1 acc 9.766 (7.217)	Top-5 acc 23.047 (19.904)	lr 0.04436
Warmup Train [9][2350/3239]	Time 0.488 (0.514)	Data 0.001 (0.012)	Loss 5.4310 (5.4738)	Top-1 acc 8.594 (7.219)	Top-5 acc 23.438 (19.906)	lr 0.04436
Warmup Train [9][2360/3239]	Time 0.585 (0.514)	Data 0.001 (0.012)	Loss 5.3216 (5.4736)	Top-1 acc 8.203 (7.219)	Top-5 acc 21.094 (19.910)	lr 0.04435
Warmup Train [9][2370/3239]	Time 0.542 (0.514)	Data 0.001 (0.012)	Loss 5.4162 (5.4732)	Top-1 acc 7.031 (7.222)	Top-5 acc 20.703 (19.916)	lr 0.04435
Warmup Train [9][2380/3239]	Time 0.377 (0.514)	Data 0.001 (0.012)	Loss 5.4184 (5.4731)	Top-1 acc 11.328 (7.223)	Top-5 acc 23.828 (19.920)	lr 0.04434
Warmup Train [9][2390/3239]	Time 0.484 (0.514)	Data 0.001 (0.012)	Loss 5.4681 (5.4730)	Top-1 acc 5.859 (7.223)	Top-5 acc 17.578 (19.924)	lr 0.04434
Warmup Train [9][2400/3239]	Time 0.422 (0.514)	Data 0.001 (0.012)	Loss 5.3647 (5.4727)	Top-1 acc 8.203 (7.227)	Top-5 acc 21.094 (19.930)	lr 0.04434
Warmup Train [9][2410/3239]	Time 0.539 (0.513)	Data 0.001 (0.012)	Loss 5.4207 (5.4727)	Top-1 acc 7.031 (7.231)	Top-5 acc 20.703 (19.927)	lr 0.04433
Warmup Train [9][2420/3239]	Time 0.488 (0.513)	Data 0.001 (0.012)	Loss 5.3836 (5.4724)	Top-1 acc 7.422 (7.232)	Top-5 acc 23.047 (19.934)	lr 0.04433
Warmup Train [9][2430/3239]	Time 0.414 (0.513)	Data 0.001 (0.012)	Loss 5.5078 (5.4723)	Top-1 acc 7.031 (7.232)	Top-5 acc 19.141 (19.936)	lr 0.04433
Warmup Train [9][2440/3239]	Time 0.540 (0.513)	Data 0.001 (0.012)	Loss 5.3946 (5.4721)	Top-1 acc 10.156 (7.237)	Top-5 acc 25.000 (19.939)	lr 0.04432
Warmup Train [9][2450/3239]	Time 0.378 (0.513)	Data 0.001 (0.012)	Loss 5.3252 (5.4719)	Top-1 acc 7.031 (7.237)	Top-5 acc 21.094 (19.941)	lr 0.04432
Warmup Train [9][2460/3239]	Time 0.567 (0.513)	Data 0.001 (0.012)	Loss 5.3698 (5.4718)	Top-1 acc 5.469 (7.237)	Top-5 acc 23.047 (19.944)	lr 0.04431
Warmup Train [9][2470/3239]	Time 0.494 (0.513)	Data 0.001 (0.012)	Loss 5.3749 (5.4716)	Top-1 acc 7.031 (7.239)	Top-5 acc 20.703 (19.948)	lr 0.04431
Warmup Train [9][2480/3239]	Time 0.549 (0.513)	Data 0.001 (0.012)	Loss 5.4684 (5.4714)	Top-1 acc 7.812 (7.242)	Top-5 acc 17.969 (19.949)	lr 0.04431
Warmup Train [9][2490/3239]	Time 0.645 (0.513)	Data 0.001 (0.012)	Loss 5.4303 (5.4713)	Top-1 acc 7.812 (7.242)	Top-5 acc 23.047 (19.952)	lr 0.04430
Warmup Train [9][2500/3239]	Time 0.567 (0.513)	Data 0.001 (0.012)	Loss 5.3666 (5.4710)	Top-1 acc 9.375 (7.243)	Top-5 acc 22.656 (19.956)	lr 0.04430
Warmup Train [9][2510/3239]	Time 0.536 (0.513)	Data 0.001 (0.012)	Loss 5.4152 (5.4709)	Top-1 acc 8.984 (7.245)	Top-5 acc 23.438 (19.960)	lr 0.04429
Warmup Train [9][2520/3239]	Time 0.508 (0.513)	Data 0.001 (0.011)	Loss 5.3898 (5.4708)	Top-1 acc 7.031 (7.243)	Top-5 acc 22.266 (19.964)	lr 0.04429
Warmup Train [9][2530/3239]	Time 0.440 (0.513)	Data 0.001 (0.011)	Loss 5.4959 (5.4708)	Top-1 acc 8.984 (7.248)	Top-5 acc 20.312 (19.967)	lr 0.04429
Warmup Train [9][2540/3239]	Time 0.534 (0.513)	Data 0.001 (0.011)	Loss 5.3552 (5.4705)	Top-1 acc 8.984 (7.251)	Top-5 acc 21.484 (19.972)	lr 0.04428
Warmup Train [9][2550/3239]	Time 0.625 (0.513)	Data 0.001 (0.011)	Loss 5.4854 (5.4705)	Top-1 acc 6.641 (7.250)	Top-5 acc 16.797 (19.971)	lr 0.04428
Warmup Train [9][2560/3239]	Time 0.530 (0.513)	Data 0.001 (0.011)	Loss 5.4637 (5.4703)	Top-1 acc 7.422 (7.253)	Top-5 acc 20.703 (19.975)	lr 0.04428
Warmup Train [9][2570/3239]	Time 0.612 (0.513)	Data 0.001 (0.011)	Loss 5.4355 (5.4701)	Top-1 acc 8.984 (7.256)	Top-5 acc 22.266 (19.983)	lr 0.04427
Warmup Train [9][2580/3239]	Time 0.646 (0.513)	Data 0.001 (0.011)	Loss 5.3793 (5.4700)	Top-1 acc 8.984 (7.259)	Top-5 acc 23.047 (19.988)	lr 0.04427
Warmup Train [9][2590/3239]	Time 0.648 (0.513)	Data 0.001 (0.011)	Loss 5.4507 (5.4697)	Top-1 acc 7.422 (7.263)	Top-5 acc 22.656 (19.991)	lr 0.04426
Warmup Train [9][2600/3239]	Time 0.616 (0.513)	Data 0.001 (0.011)	Loss 5.4524 (5.4698)	Top-1 acc 8.984 (7.265)	Top-5 acc 18.750 (19.989)	lr 0.04426
Warmup Train [9][2610/3239]	Time 0.625 (0.513)	Data 0.001 (0.011)	Loss 5.2794 (5.4696)	Top-1 acc 8.594 (7.267)	Top-5 acc 26.953 (19.994)	lr 0.04426
Warmup Train [9][2620/3239]	Time 0.565 (0.513)	Data 0.001 (0.011)	Loss 5.4759 (5.4694)	Top-1 acc 7.422 (7.268)	Top-5 acc 19.531 (19.997)	lr 0.04425
Warmup Train [9][2630/3239]	Time 0.450 (0.513)	Data 0.001 (0.011)	Loss 5.4310 (5.4692)	Top-1 acc 5.859 (7.273)	Top-5 acc 18.750 (20.001)	lr 0.04425
Warmup Train [9][2640/3239]	Time 0.527 (0.513)	Data 0.001 (0.011)	Loss 5.4464 (5.4690)	Top-1 acc 6.250 (7.275)	Top-5 acc 20.312 (20.005)	lr 0.04424
Warmup Train [9][2650/3239]	Time 0.451 (0.513)	Data 0.001 (0.011)	Loss 5.4846 (5.4688)	Top-1 acc 6.250 (7.274)	Top-5 acc 22.266 (20.012)	lr 0.04424
Warmup Train [9][2660/3239]	Time 0.636 (0.513)	Data 0.001 (0.011)	Loss 5.3671 (5.4686)	Top-1 acc 6.641 (7.274)	Top-5 acc 22.656 (20.013)	lr 0.04424
Warmup Train [9][2670/3239]	Time 0.461 (0.513)	Data 0.001 (0.011)	Loss 5.3977 (5.4684)	Top-1 acc 6.641 (7.272)	Top-5 acc 22.266 (20.013)	lr 0.04423
Warmup Train [9][2680/3239]	Time 0.535 (0.513)	Data 0.002 (0.011)	Loss 5.4461 (5.4682)	Top-1 acc 7.422 (7.273)	Top-5 acc 20.312 (20.015)	lr 0.04423
Warmup Train [9][2690/3239]	Time 0.595 (0.513)	Data 0.001 (0.011)	Loss 5.4976 (5.4682)	Top-1 acc 7.422 (7.273)	Top-5 acc 18.750 (20.014)	lr 0.04422
Warmup Train [9][2700/3239]	Time 0.518 (0.513)	Data 0.001 (0.011)	Loss 5.5485 (5.4680)	Top-1 acc 6.641 (7.274)	Top-5 acc 17.188 (20.018)	lr 0.04422
Warmup Train [9][2710/3239]	Time 0.486 (0.513)	Data 0.001 (0.011)	Loss 5.4552 (5.4677)	Top-1 acc 7.031 (7.277)	Top-5 acc 19.141 (20.022)	lr 0.04422
Warmup Train [9][2720/3239]	Time 0.454 (0.513)	Data 0.001 (0.011)	Loss 5.4162 (5.4676)	Top-1 acc 8.203 (7.277)	Top-5 acc 24.219 (20.025)	lr 0.04421
Warmup Train [9][2730/3239]	Time 0.501 (0.513)	Data 0.001 (0.011)	Loss 5.4210 (5.4674)	Top-1 acc 5.469 (7.279)	Top-5 acc 17.969 (20.032)	lr 0.04421
Warmup Train [9][2740/3239]	Time 0.496 (0.513)	Data 0.001 (0.011)	Loss 5.3602 (5.4672)	Top-1 acc 7.812 (7.282)	Top-5 acc 21.484 (20.035)	lr 0.04421
Warmup Train [9][2750/3239]	Time 0.479 (0.513)	Data 0.001 (0.011)	Loss 5.6239 (5.4671)	Top-1 acc 9.375 (7.285)	Top-5 acc 21.875 (20.039)	lr 0.04420
Warmup Train [9][2760/3239]	Time 0.503 (0.513)	Data 0.001 (0.011)	Loss 5.5717 (5.4670)	Top-1 acc 3.906 (7.286)	Top-5 acc 17.188 (20.046)	lr 0.04420
Warmup Train [9][2770/3239]	Time 0.553 (0.513)	Data 0.002 (0.011)	Loss 5.3898 (5.4667)	Top-1 acc 7.812 (7.289)	Top-5 acc 20.703 (20.049)	lr 0.04419
Warmup Train [9][2780/3239]	Time 0.573 (0.513)	Data 0.001 (0.011)	Loss 5.2879 (5.4665)	Top-1 acc 7.422 (7.291)	Top-5 acc 21.484 (20.052)	lr 0.04419
Warmup Train [9][2790/3239]	Time 0.669 (0.513)	Data 0.001 (0.011)	Loss 5.3036 (5.4663)	Top-1 acc 10.547 (7.294)	Top-5 acc 24.219 (20.057)	lr 0.04419
Warmup Train [9][2800/3239]	Time 0.389 (0.513)	Data 0.001 (0.011)	Loss 5.3992 (5.4660)	Top-1 acc 7.422 (7.296)	Top-5 acc 22.656 (20.062)	lr 0.04418
Warmup Train [9][2810/3239]	Time 0.567 (0.513)	Data 0.001 (0.011)	Loss 5.4443 (5.4659)	Top-1 acc 7.812 (7.299)	Top-5 acc 21.094 (20.068)	lr 0.04418
Warmup Train [9][2820/3239]	Time 0.524 (0.513)	Data 0.001 (0.011)	Loss 5.3956 (5.4657)	Top-1 acc 8.594 (7.302)	Top-5 acc 24.219 (20.073)	lr 0.04417
Warmup Train [9][2830/3239]	Time 0.519 (0.513)	Data 0.001 (0.011)	Loss 5.5060 (5.4656)	Top-1 acc 8.984 (7.304)	Top-5 acc 18.750 (20.075)	lr 0.04417
Warmup Train [9][2840/3239]	Time 0.357 (0.513)	Data 0.001 (0.011)	Loss 5.3871 (5.4654)	Top-1 acc 5.078 (7.302)	Top-5 acc 19.922 (20.074)	lr 0.04417
Warmup Train [9][2850/3239]	Time 0.677 (0.513)	Data 0.001 (0.011)	Loss 5.4519 (5.4653)	Top-1 acc 7.812 (7.303)	Top-5 acc 24.219 (20.077)	lr 0.04416
Warmup Train [9][2860/3239]	Time 0.521 (0.513)	Data 0.001 (0.011)	Loss 5.3822 (5.4652)	Top-1 acc 11.719 (7.305)	Top-5 acc 24.609 (20.081)	lr 0.04416
Warmup Train [9][2870/3239]	Time 0.375 (0.513)	Data 0.001 (0.011)	Loss 5.4608 (5.4651)	Top-1 acc 6.250 (7.304)	Top-5 acc 18.359 (20.087)	lr 0.04416
Warmup Train [9][2880/3239]	Time 0.349 (0.513)	Data 0.001 (0.011)	Loss 5.2754 (5.4648)	Top-1 acc 10.938 (7.307)	Top-5 acc 24.609 (20.092)	lr 0.04415
Warmup Train [9][2890/3239]	Time 0.441 (0.513)	Data 0.001 (0.011)	Loss 5.3799 (5.4647)	Top-1 acc 8.594 (7.309)	Top-5 acc 19.141 (20.095)	lr 0.04415
Warmup Train [9][2900/3239]	Time 0.414 (0.513)	Data 0.001 (0.011)	Loss 5.4393 (5.4645)	Top-1 acc 7.812 (7.311)	Top-5 acc 19.141 (20.099)	lr 0.04414
Warmup Train [9][2910/3239]	Time 0.581 (0.513)	Data 0.001 (0.011)	Loss 5.5677 (5.4644)	Top-1 acc 8.594 (7.310)	Top-5 acc 19.922 (20.098)	lr 0.04414
Warmup Train [9][2920/3239]	Time 0.635 (0.513)	Data 0.001 (0.011)	Loss 5.4418 (5.4645)	Top-1 acc 5.859 (7.309)	Top-5 acc 18.359 (20.098)	lr 0.04414
Warmup Train [9][2930/3239]	Time 0.419 (0.513)	Data 0.001 (0.011)	Loss 5.4966 (5.4644)	Top-1 acc 8.203 (7.312)	Top-5 acc 19.922 (20.100)	lr 0.04413
Warmup Train [9][2940/3239]	Time 0.573 (0.512)	Data 0.001 (0.011)	Loss 5.3541 (5.4643)	Top-1 acc 7.422 (7.315)	Top-5 acc 23.438 (20.104)	lr 0.04413
Warmup Train [9][2950/3239]	Time 0.495 (0.512)	Data 0.001 (0.011)	Loss 5.3934 (5.4642)	Top-1 acc 7.812 (7.316)	Top-5 acc 16.797 (20.106)	lr 0.04412
Warmup Train [9][2960/3239]	Time 0.401 (0.512)	Data 0.001 (0.011)	Loss 5.5351 (5.4642)	Top-1 acc 7.422 (7.316)	Top-5 acc 18.750 (20.107)	lr 0.04412
Warmup Train [9][2970/3239]	Time 0.395 (0.512)	Data 0.001 (0.011)	Loss 5.3307 (5.4640)	Top-1 acc 9.766 (7.320)	Top-5 acc 23.438 (20.112)	lr 0.04412
Warmup Train [9][2980/3239]	Time 0.362 (0.512)	Data 0.001 (0.011)	Loss 5.4999 (5.4639)	Top-1 acc 7.422 (7.320)	Top-5 acc 19.141 (20.115)	lr 0.04411
Warmup Train [9][2990/3239]	Time 0.492 (0.512)	Data 0.001 (0.011)	Loss 5.4921 (5.4638)	Top-1 acc 7.031 (7.321)	Top-5 acc 17.578 (20.113)	lr 0.04411
Warmup Train [9][3000/3239]	Time 0.552 (0.512)	Data 0.001 (0.011)	Loss 5.2969 (5.4636)	Top-1 acc 9.766 (7.321)	Top-5 acc 23.047 (20.116)	lr 0.04410
Warmup Train [9][3010/3239]	Time 0.655 (0.512)	Data 0.001 (0.011)	Loss 5.3813 (5.4634)	Top-1 acc 7.422 (7.322)	Top-5 acc 21.875 (20.119)	lr 0.04410
Warmup Train [9][3020/3239]	Time 0.501 (0.512)	Data 0.002 (0.011)	Loss 5.4011 (5.4633)	Top-1 acc 5.078 (7.322)	Top-5 acc 20.703 (20.120)	lr 0.04410
Warmup Train [9][3030/3239]	Time 0.405 (0.512)	Data 0.001 (0.011)	Loss 5.3752 (5.4632)	Top-1 acc 11.328 (7.324)	Top-5 acc 25.000 (20.124)	lr 0.04409
Warmup Train [9][3040/3239]	Time 0.631 (0.512)	Data 0.001 (0.011)	Loss 5.5330 (5.4632)	Top-1 acc 8.594 (7.328)	Top-5 acc 17.578 (20.128)	lr 0.04409
Warmup Train [9][3050/3239]	Time 0.468 (0.512)	Data 0.001 (0.011)	Loss 5.4803 (5.4631)	Top-1 acc 7.031 (7.331)	Top-5 acc 20.312 (20.132)	lr 0.04408
Warmup Train [9][3060/3239]	Time 0.518 (0.513)	Data 0.001 (0.011)	Loss 5.3628 (5.4629)	Top-1 acc 10.547 (7.333)	Top-5 acc 23.047 (20.138)	lr 0.04408
Warmup Train [9][3070/3239]	Time 0.448 (0.512)	Data 0.001 (0.011)	Loss 5.3829 (5.4629)	Top-1 acc 7.031 (7.333)	Top-5 acc 19.141 (20.140)	lr 0.04408
Warmup Train [9][3080/3239]	Time 0.625 (0.512)	Data 0.001 (0.011)	Loss 5.5133 (5.4627)	Top-1 acc 6.641 (7.330)	Top-5 acc 21.875 (20.145)	lr 0.04407
Warmup Train [9][3090/3239]	Time 0.413 (0.512)	Data 0.001 (0.011)	Loss 5.4358 (5.4626)	Top-1 acc 5.859 (7.334)	Top-5 acc 22.656 (20.151)	lr 0.04407
Warmup Train [9][3100/3239]	Time 0.498 (0.512)	Data 0.001 (0.011)	Loss 5.4289 (5.4625)	Top-1 acc 6.641 (7.336)	Top-5 acc 18.750 (20.156)	lr 0.04407
Warmup Train [9][3110/3239]	Time 0.507 (0.513)	Data 0.001 (0.011)	Loss 5.3755 (5.4622)	Top-1 acc 8.594 (7.339)	Top-5 acc 23.438 (20.163)	lr 0.04406
Warmup Train [9][3120/3239]	Time 0.586 (0.513)	Data 0.001 (0.011)	Loss 5.3805 (5.4621)	Top-1 acc 6.250 (7.338)	Top-5 acc 23.047 (20.169)	lr 0.04406
Warmup Train [9][3130/3239]	Time 0.517 (0.513)	Data 0.001 (0.011)	Loss 5.4938 (5.4621)	Top-1 acc 5.469 (7.338)	Top-5 acc 20.312 (20.170)	lr 0.04405
Warmup Train [9][3140/3239]	Time 0.465 (0.513)	Data 0.001 (0.011)	Loss 5.5807 (5.4621)	Top-1 acc 6.641 (7.337)	Top-5 acc 16.797 (20.169)	lr 0.04405
Warmup Train [9][3150/3239]	Time 0.380 (0.512)	Data 0.001 (0.011)	Loss 5.4552 (5.4618)	Top-1 acc 9.766 (7.341)	Top-5 acc 21.875 (20.176)	lr 0.04405
Warmup Train [9][3160/3239]	Time 0.541 (0.513)	Data 0.001 (0.011)	Loss 5.4541 (5.4616)	Top-1 acc 8.984 (7.344)	Top-5 acc 19.531 (20.176)	lr 0.04404
Warmup Train [9][3170/3239]	Time 0.377 (0.512)	Data 0.001 (0.011)	Loss 5.6315 (5.4615)	Top-1 acc 5.078 (7.346)	Top-5 acc 16.016 (20.180)	lr 0.04404
Warmup Train [9][3180/3239]	Time 0.556 (0.512)	Data 0.000 (0.011)	Loss 5.2873 (5.4612)	Top-1 acc 9.375 (7.349)	Top-5 acc 21.875 (20.185)	lr 0.04403
Warmup Train [9][3190/3239]	Time 0.517 (0.512)	Data 0.000 (0.011)	Loss 5.4048 (5.4611)	Top-1 acc 8.984 (7.353)	Top-5 acc 22.656 (20.189)	lr 0.04403
Warmup Train [9][3200/3239]	Time 0.344 (0.512)	Data 0.000 (0.011)	Loss 5.5049 (5.4609)	Top-1 acc 4.688 (7.355)	Top-5 acc 16.016 (20.193)	lr 0.04403
Warmup Train [9][3210/3239]	Time 0.408 (0.512)	Data 0.000 (0.011)	Loss 5.4122 (5.4607)	Top-1 acc 5.859 (7.357)	Top-5 acc 19.141 (20.201)	lr 0.04402
Warmup Train [9][3220/3239]	Time 0.672 (0.512)	Data 0.000 (0.011)	Loss 5.3921 (5.4606)	Top-1 acc 9.375 (7.358)	Top-5 acc 25.391 (20.203)	lr 0.04402
Warmup Train [9][3230/3239]	Time 0.466 (0.512)	Data 0.000 (0.010)	Loss 5.3554 (5.4604)	Top-1 acc 7.422 (7.360)	Top-5 acc 22.266 (20.206)	lr 0.04401
Warmup Train [9][3239/3239]	Time 0.363 (0.512)	Data 0.000 (0.010)	Loss 5.0882 (5.4603)	Top-1 acc 6.173 (7.359)	Top-5 acc 35.802 (20.205)	lr 0.04401
==========Warmup Valid [9/40]	loss 4.772	top-1 acc 10.866	top-5 acc 27.484	Train top-1 7.359	top-5 20.205	flops: 442.4M
Warmup Train [10][0/3239]	Time 11.681 (11.681)	Data 11.095 (11.095)	Loss 5.3787 (5.3787)	Top-1 acc 7.422 (7.422)	Top-5 acc 21.094 (21.094)	lr 0.04401
Warmup Train [10][10/3239]	Time 0.462 (1.647)	Data 0.001 (1.019)	Loss 5.3466 (5.3759)	Top-1 acc 8.203 (8.310)	Top-5 acc 23.438 (21.626)	lr 0.04401
Warmup Train [10][20/3239]	Time 0.487 (1.101)	Data 0.001 (0.535)	Loss 5.4271 (5.3882)	Top-1 acc 8.203 (8.557)	Top-5 acc 22.656 (21.801)	lr 0.04400
Warmup Train [10][30/3239]	Time 0.556 (0.916)	Data 0.001 (0.365)	Loss 5.5312 (5.4004)	Top-1 acc 7.812 (8.228)	Top-5 acc 18.750 (21.333)	lr 0.04400
Warmup Train [10][40/3239]	Time 0.535 (0.821)	Data 0.001 (0.277)	Loss 5.3202 (5.3864)	Top-1 acc 7.031 (8.289)	Top-5 acc 22.266 (21.542)	lr 0.04399
Warmup Train [10][50/3239]	Time 0.429 (0.754)	Data 0.001 (0.223)	Loss 5.3066 (5.3905)	Top-1 acc 7.031 (8.218)	Top-5 acc 23.047 (21.461)	lr 0.04399
Warmup Train [10][60/3239]	Time 0.336 (0.712)	Data 0.001 (0.189)	Loss 5.4554 (5.3908)	Top-1 acc 7.812 (8.075)	Top-5 acc 21.094 (21.542)	lr 0.04399
Warmup Train [10][70/3239]	Time 0.487 (0.686)	Data 0.001 (0.165)	Loss 5.3960 (5.3914)	Top-1 acc 8.203 (8.022)	Top-5 acc 25.781 (21.699)	lr 0.04398
Warmup Train [10][80/3239]	Time 0.651 (0.662)	Data 0.001 (0.145)	Loss 5.3950 (5.3907)	Top-1 acc 8.984 (7.991)	Top-5 acc 19.922 (21.562)	lr 0.04398
Warmup Train [10][90/3239]	Time 0.616 (0.642)	Data 0.001 (0.129)	Loss 5.4546 (5.3912)	Top-1 acc 7.422 (8.001)	Top-5 acc 21.875 (21.699)	lr 0.04397
Warmup Train [10][100/3239]	Time 0.359 (0.625)	Data 0.001 (0.117)	Loss 5.4211 (5.3949)	Top-1 acc 5.469 (7.917)	Top-5 acc 18.359 (21.631)	lr 0.04397
Warmup Train [10][110/3239]	Time 0.357 (0.612)	Data 0.001 (0.108)	Loss 5.3725 (5.3942)	Top-1 acc 7.422 (7.936)	Top-5 acc 23.047 (21.762)	lr 0.04397
Warmup Train [10][120/3239]	Time 0.588 (0.605)	Data 0.001 (0.100)	Loss 5.4579 (5.3952)	Top-1 acc 5.859 (7.961)	Top-5 acc 22.656 (21.778)	lr 0.04396
Warmup Train [10][130/3239]	Time 0.368 (0.597)	Data 0.001 (0.093)	Loss 5.3040 (5.3936)	Top-1 acc 9.766 (8.021)	Top-5 acc 24.219 (21.756)	lr 0.04396
Warmup Train [10][140/3239]	Time 0.483 (0.592)	Data 0.001 (0.087)	Loss 5.3045 (5.3927)	Top-1 acc 8.594 (8.112)	Top-5 acc 28.125 (21.878)	lr 0.04395
Warmup Train [10][150/3239]	Time 0.437 (0.585)	Data 0.001 (0.082)	Loss 5.3566 (5.3942)	Top-1 acc 7.812 (8.082)	Top-5 acc 17.969 (21.751)	lr 0.04395
Warmup Train [10][160/3239]	Time 0.433 (0.580)	Data 0.001 (0.077)	Loss 5.2456 (5.3956)	Top-1 acc 9.766 (8.094)	Top-5 acc 23.438 (21.691)	lr 0.04395
Warmup Train [10][170/3239]	Time 0.463 (0.577)	Data 0.001 (0.073)	Loss 5.3463 (5.3980)	Top-1 acc 8.594 (8.100)	Top-5 acc 21.875 (21.658)	lr 0.04394
Warmup Train [10][180/3239]	Time 0.360 (0.571)	Data 0.001 (0.069)	Loss 5.4340 (5.3982)	Top-1 acc 7.031 (8.136)	Top-5 acc 19.531 (21.702)	lr 0.04394
Warmup Train [10][190/3239]	Time 0.365 (0.568)	Data 0.001 (0.066)	Loss 5.3401 (5.3983)	Top-1 acc 11.719 (8.144)	Top-5 acc 24.609 (21.664)	lr 0.04394
Warmup Train [10][200/3239]	Time 0.652 (0.567)	Data 0.001 (0.063)	Loss 5.3672 (5.4003)	Top-1 acc 8.984 (8.155)	Top-5 acc 21.094 (21.617)	lr 0.04393
Warmup Train [10][210/3239]	Time 0.461 (0.564)	Data 0.001 (0.060)	Loss 5.4654 (5.3998)	Top-1 acc 8.594 (8.168)	Top-5 acc 20.703 (21.595)	lr 0.04393
Warmup Train [10][220/3239]	Time 0.490 (0.561)	Data 0.001 (0.058)	Loss 5.4629 (5.4011)	Top-1 acc 5.469 (8.134)	Top-5 acc 21.875 (21.537)	lr 0.04392
Warmup Train [10][230/3239]	Time 0.569 (0.559)	Data 0.001 (0.056)	Loss 5.3561 (5.3968)	Top-1 acc 9.766 (8.168)	Top-5 acc 25.781 (21.635)	lr 0.04392
Warmup Train [10][240/3239]	Time 0.705 (0.558)	Data 0.001 (0.054)	Loss 5.2067 (5.3957)	Top-1 acc 8.984 (8.187)	Top-5 acc 25.391 (21.664)	lr 0.04392
Warmup Train [10][250/3239]	Time 0.534 (0.557)	Data 0.001 (0.052)	Loss 5.3508 (5.3939)	Top-1 acc 6.250 (8.194)	Top-5 acc 25.391 (21.724)	lr 0.04391
Warmup Train [10][260/3239]	Time 0.385 (0.555)	Data 0.001 (0.050)	Loss 5.4201 (5.3931)	Top-1 acc 7.031 (8.179)	Top-5 acc 19.531 (21.701)	lr 0.04391
Warmup Train [10][270/3239]	Time 0.533 (0.554)	Data 0.001 (0.049)	Loss 5.4253 (5.3933)	Top-1 acc 7.422 (8.197)	Top-5 acc 21.484 (21.701)	lr 0.04390
Warmup Train [10][280/3239]	Time 0.603 (0.553)	Data 0.001 (0.047)	Loss 5.5606 (5.3940)	Top-1 acc 6.250 (8.178)	Top-5 acc 18.750 (21.669)	lr 0.04390
Warmup Train [10][290/3239]	Time 0.409 (0.551)	Data 0.001 (0.046)	Loss 5.4374 (5.3946)	Top-1 acc 8.984 (8.164)	Top-5 acc 21.875 (21.648)	lr 0.04390
Warmup Train [10][300/3239]	Time 0.445 (0.549)	Data 0.001 (0.045)	Loss 5.4047 (5.3940)	Top-1 acc 10.156 (8.169)	Top-5 acc 20.312 (21.641)	lr 0.04389
Warmup Train [10][310/3239]	Time 0.489 (0.548)	Data 0.001 (0.044)	Loss 5.2060 (5.3918)	Top-1 acc 9.375 (8.177)	Top-5 acc 23.438 (21.688)	lr 0.04389
Warmup Train [10][320/3239]	Time 0.416 (0.548)	Data 0.001 (0.043)	Loss 5.4470 (5.3930)	Top-1 acc 8.594 (8.170)	Top-5 acc 23.828 (21.662)	lr 0.04388
Warmup Train [10][330/3239]	Time 0.483 (0.545)	Data 0.001 (0.042)	Loss 5.3704 (5.3917)	Top-1 acc 6.641 (8.156)	Top-5 acc 21.094 (21.680)	lr 0.04388
Warmup Train [10][340/3239]	Time 0.566 (0.545)	Data 0.001 (0.041)	Loss 5.2344 (5.3917)	Top-1 acc 11.328 (8.180)	Top-5 acc 20.703 (21.684)	lr 0.04388
Warmup Train [10][350/3239]	Time 0.410 (0.542)	Data 0.001 (0.040)	Loss 5.4457 (5.3923)	Top-1 acc 6.250 (8.182)	Top-5 acc 16.797 (21.681)	lr 0.04387
Warmup Train [10][360/3239]	Time 0.465 (0.541)	Data 0.001 (0.039)	Loss 5.5191 (5.3927)	Top-1 acc 5.469 (8.161)	Top-5 acc 16.016 (21.672)	lr 0.04387
Warmup Train [10][370/3239]	Time 0.345 (0.539)	Data 0.001 (0.038)	Loss 5.4682 (5.3920)	Top-1 acc 8.203 (8.163)	Top-5 acc 23.438 (21.703)	lr 0.04386
Warmup Train [10][380/3239]	Time 0.425 (0.538)	Data 0.001 (0.037)	Loss 5.5060 (5.3927)	Top-1 acc 5.859 (8.148)	Top-5 acc 16.406 (21.672)	lr 0.04386
Warmup Train [10][390/3239]	Time 0.470 (0.537)	Data 0.001 (0.037)	Loss 5.3859 (5.3937)	Top-1 acc 7.031 (8.128)	Top-5 acc 21.484 (21.643)	lr 0.04386
Warmup Train [10][400/3239]	Time 0.429 (0.536)	Data 0.001 (0.036)	Loss 5.2858 (5.3934)	Top-1 acc 11.328 (8.155)	Top-5 acc 26.562 (21.643)	lr 0.04385
Warmup Train [10][410/3239]	Time 0.515 (0.536)	Data 0.001 (0.036)	Loss 5.3769 (5.3925)	Top-1 acc 8.203 (8.158)	Top-5 acc 21.484 (21.673)	lr 0.04385
Warmup Train [10][420/3239]	Time 0.518 (0.535)	Data 0.001 (0.035)	Loss 5.4022 (5.3922)	Top-1 acc 8.203 (8.137)	Top-5 acc 24.219 (21.673)	lr 0.04384
Warmup Train [10][430/3239]	Time 0.561 (0.535)	Data 0.001 (0.034)	Loss 5.4035 (5.3930)	Top-1 acc 7.422 (8.143)	Top-5 acc 17.578 (21.660)	lr 0.04384
Warmup Train [10][440/3239]	Time 0.480 (0.534)	Data 0.001 (0.033)	Loss 5.3189 (5.3922)	Top-1 acc 7.812 (8.152)	Top-5 acc 21.484 (21.674)	lr 0.04384
Warmup Train [10][450/3239]	Time 0.540 (0.534)	Data 0.001 (0.033)	Loss 5.4920 (5.3921)	Top-1 acc 9.375 (8.166)	Top-5 acc 19.922 (21.684)	lr 0.04383
Warmup Train [10][460/3239]	Time 0.475 (0.534)	Data 0.001 (0.032)	Loss 5.4978 (5.3932)	Top-1 acc 5.078 (8.160)	Top-5 acc 19.141 (21.645)	lr 0.04383
Warmup Train [10][470/3239]	Time 0.423 (0.533)	Data 0.001 (0.032)	Loss 5.5610 (5.3938)	Top-1 acc 4.688 (8.157)	Top-5 acc 16.797 (21.625)	lr 0.04382
Warmup Train [10][480/3239]	Time 0.342 (0.533)	Data 0.001 (0.031)	Loss 5.3603 (5.3933)	Top-1 acc 7.812 (8.154)	Top-5 acc 19.531 (21.626)	lr 0.04382
Warmup Train [10][490/3239]	Time 0.478 (0.532)	Data 0.001 (0.031)	Loss 5.5626 (5.3932)	Top-1 acc 9.766 (8.168)	Top-5 acc 21.875 (21.640)	lr 0.04382
Warmup Train [10][500/3239]	Time 0.394 (0.532)	Data 0.001 (0.031)	Loss 5.3894 (5.3935)	Top-1 acc 8.594 (8.158)	Top-5 acc 22.656 (21.621)	lr 0.04381
Warmup Train [10][510/3239]	Time 0.595 (0.532)	Data 0.001 (0.030)	Loss 5.4402 (5.3936)	Top-1 acc 9.375 (8.166)	Top-5 acc 23.828 (21.641)	lr 0.04381
Warmup Train [10][520/3239]	Time 0.422 (0.530)	Data 0.001 (0.030)	Loss 5.3874 (5.3931)	Top-1 acc 5.859 (8.184)	Top-5 acc 23.828 (21.661)	lr 0.04380
Warmup Train [10][530/3239]	Time 0.502 (0.530)	Data 0.001 (0.029)	Loss 5.4917 (5.3939)	Top-1 acc 5.469 (8.165)	Top-5 acc 19.922 (21.633)	lr 0.04380
Warmup Train [10][540/3239]	Time 0.653 (0.530)	Data 0.001 (0.029)	Loss 5.2442 (5.3923)	Top-1 acc 10.938 (8.169)	Top-5 acc 22.656 (21.666)	lr 0.04380
Warmup Train [10][550/3239]	Time 0.581 (0.529)	Data 0.001 (0.028)	Loss 5.3075 (5.3925)	Top-1 acc 7.812 (8.161)	Top-5 acc 24.609 (21.659)	lr 0.04379
Warmup Train [10][560/3239]	Time 0.690 (0.529)	Data 0.001 (0.028)	Loss 5.4673 (5.3920)	Top-1 acc 8.594 (8.168)	Top-5 acc 21.875 (21.688)	lr 0.04379
Warmup Train [10][570/3239]	Time 0.541 (0.529)	Data 0.001 (0.028)	Loss 5.4660 (5.3920)	Top-1 acc 6.641 (8.161)	Top-5 acc 21.484 (21.673)	lr 0.04378
Warmup Train [10][580/3239]	Time 0.608 (0.529)	Data 0.001 (0.027)	Loss 5.4794 (5.3919)	Top-1 acc 8.203 (8.156)	Top-5 acc 20.312 (21.665)	lr 0.04378
Warmup Train [10][590/3239]	Time 0.401 (0.528)	Data 0.001 (0.027)	Loss 5.4298 (5.3915)	Top-1 acc 9.766 (8.156)	Top-5 acc 21.484 (21.665)	lr 0.04378
Warmup Train [10][600/3239]	Time 0.368 (0.527)	Data 0.001 (0.027)	Loss 5.2949 (5.3906)	Top-1 acc 12.109 (8.186)	Top-5 acc 26.172 (21.707)	lr 0.04377
Warmup Train [10][610/3239]	Time 0.360 (0.527)	Data 0.001 (0.026)	Loss 5.3900 (5.3907)	Top-1 acc 8.203 (8.198)	Top-5 acc 24.219 (21.714)	lr 0.04377
Warmup Train [10][620/3239]	Time 0.472 (0.526)	Data 0.001 (0.026)	Loss 5.3498 (5.3908)	Top-1 acc 6.641 (8.194)	Top-5 acc 25.000 (21.713)	lr 0.04376
Warmup Train [10][630/3239]	Time 0.460 (0.525)	Data 0.001 (0.026)	Loss 5.5789 (5.3913)	Top-1 acc 7.422 (8.179)	Top-5 acc 17.188 (21.691)	lr 0.04376
Warmup Train [10][640/3239]	Time 0.622 (0.524)	Data 0.001 (0.025)	Loss 5.4523 (5.3913)	Top-1 acc 5.859 (8.168)	Top-5 acc 19.531 (21.696)	lr 0.04376
Warmup Train [10][650/3239]	Time 0.467 (0.524)	Data 0.001 (0.025)	Loss 5.1989 (5.3910)	Top-1 acc 8.984 (8.154)	Top-5 acc 25.781 (21.693)	lr 0.04375
Warmup Train [10][660/3239]	Time 0.550 (0.524)	Data 0.001 (0.025)	Loss 5.2014 (5.3909)	Top-1 acc 11.328 (8.160)	Top-5 acc 22.266 (21.697)	lr 0.04375
Warmup Train [10][670/3239]	Time 0.532 (0.524)	Data 0.001 (0.024)	Loss 5.3711 (5.3910)	Top-1 acc 8.594 (8.157)	Top-5 acc 21.094 (21.685)	lr 0.04374
Warmup Train [10][680/3239]	Time 0.615 (0.523)	Data 0.001 (0.024)	Loss 5.3234 (5.3910)	Top-1 acc 9.375 (8.153)	Top-5 acc 23.828 (21.673)	lr 0.04374
Warmup Train [10][690/3239]	Time 0.594 (0.523)	Data 0.001 (0.024)	Loss 5.4660 (5.3906)	Top-1 acc 5.859 (8.150)	Top-5 acc 18.359 (21.691)	lr 0.04374
Warmup Train [10][700/3239]	Time 0.491 (0.523)	Data 0.001 (0.023)	Loss 5.4099 (5.3902)	Top-1 acc 5.469 (8.147)	Top-5 acc 17.578 (21.701)	lr 0.04373
Warmup Train [10][710/3239]	Time 0.475 (0.523)	Data 0.001 (0.023)	Loss 5.3532 (5.3901)	Top-1 acc 9.375 (8.144)	Top-5 acc 24.219 (21.699)	lr 0.04373
Warmup Train [10][720/3239]	Time 0.536 (0.523)	Data 0.001 (0.023)	Loss 5.2934 (5.3897)	Top-1 acc 7.812 (8.158)	Top-5 acc 19.922 (21.702)	lr 0.04372
Warmup Train [10][730/3239]	Time 0.369 (0.522)	Data 0.001 (0.023)	Loss 5.5368 (5.3897)	Top-1 acc 7.422 (8.164)	Top-5 acc 18.750 (21.702)	lr 0.04372
Warmup Train [10][740/3239]	Time 0.441 (0.522)	Data 0.001 (0.023)	Loss 5.3266 (5.3893)	Top-1 acc 8.203 (8.169)	Top-5 acc 23.828 (21.715)	lr 0.04372
Warmup Train [10][750/3239]	Time 0.585 (0.522)	Data 0.001 (0.022)	Loss 5.3195 (5.3892)	Top-1 acc 8.203 (8.170)	Top-5 acc 24.609 (21.712)	lr 0.04371
Warmup Train [10][760/3239]	Time 0.492 (0.522)	Data 0.001 (0.022)	Loss 5.3007 (5.3887)	Top-1 acc 10.938 (8.176)	Top-5 acc 27.344 (21.733)	lr 0.04371
Warmup Train [10][770/3239]	Time 0.527 (0.522)	Data 0.001 (0.022)	Loss 5.3343 (5.3890)	Top-1 acc 5.859 (8.166)	Top-5 acc 20.703 (21.736)	lr 0.04370
Warmup Train [10][780/3239]	Time 0.510 (0.522)	Data 0.001 (0.022)	Loss 5.5449 (5.3892)	Top-1 acc 5.469 (8.166)	Top-5 acc 16.797 (21.730)	lr 0.04370
Warmup Train [10][790/3239]	Time 0.485 (0.522)	Data 0.001 (0.021)	Loss 5.3876 (5.3894)	Top-1 acc 7.031 (8.164)	Top-5 acc 20.312 (21.717)	lr 0.04370
Warmup Train [10][800/3239]	Time 0.557 (0.522)	Data 0.001 (0.021)	Loss 5.4518 (5.3895)	Top-1 acc 3.906 (8.161)	Top-5 acc 15.625 (21.710)	lr 0.04369
Warmup Train [10][810/3239]	Time 0.589 (0.522)	Data 0.001 (0.021)	Loss 5.3511 (5.3900)	Top-1 acc 8.203 (8.158)	Top-5 acc 20.703 (21.702)	lr 0.04369
Warmup Train [10][820/3239]	Time 0.329 (0.522)	Data 0.001 (0.021)	Loss 5.2272 (5.3895)	Top-1 acc 6.250 (8.163)	Top-5 acc 25.391 (21.720)	lr 0.04368
Warmup Train [10][830/3239]	Time 0.376 (0.522)	Data 0.002 (0.021)	Loss 5.2817 (5.3895)	Top-1 acc 7.031 (8.158)	Top-5 acc 23.047 (21.727)	lr 0.04368
Warmup Train [10][840/3239]	Time 0.515 (0.522)	Data 0.001 (0.021)	Loss 5.3799 (5.3894)	Top-1 acc 8.594 (8.165)	Top-5 acc 22.656 (21.727)	lr 0.04368
Warmup Train [10][850/3239]	Time 0.386 (0.522)	Data 0.001 (0.020)	Loss 5.5222 (5.3897)	Top-1 acc 6.641 (8.165)	Top-5 acc 16.797 (21.721)	lr 0.04367
Warmup Train [10][860/3239]	Time 0.559 (0.522)	Data 0.001 (0.020)	Loss 5.3429 (5.3898)	Top-1 acc 10.547 (8.173)	Top-5 acc 21.484 (21.728)	lr 0.04367
Warmup Train [10][870/3239]	Time 0.531 (0.522)	Data 0.001 (0.020)	Loss 5.3426 (5.3897)	Top-1 acc 7.031 (8.176)	Top-5 acc 21.875 (21.727)	lr 0.04366
Warmup Train [10][880/3239]	Time 0.544 (0.522)	Data 0.001 (0.020)	Loss 5.4397 (5.3892)	Top-1 acc 5.078 (8.180)	Top-5 acc 17.188 (21.734)	lr 0.04366
Warmup Train [10][890/3239]	Time 0.528 (0.521)	Data 0.001 (0.020)	Loss 5.3739 (5.3892)	Top-1 acc 7.031 (8.176)	Top-5 acc 20.312 (21.738)	lr 0.04366
Warmup Train [10][900/3239]	Time 0.536 (0.521)	Data 0.001 (0.020)	Loss 5.3457 (5.3890)	Top-1 acc 9.375 (8.173)	Top-5 acc 21.094 (21.738)	lr 0.04365
Warmup Train [10][910/3239]	Time 0.543 (0.521)	Data 0.001 (0.019)	Loss 5.3255 (5.3886)	Top-1 acc 7.031 (8.179)	Top-5 acc 21.875 (21.755)	lr 0.04365
Warmup Train [10][920/3239]	Time 0.436 (0.520)	Data 0.001 (0.019)	Loss 5.3977 (5.3888)	Top-1 acc 7.812 (8.181)	Top-5 acc 22.656 (21.756)	lr 0.04364
Warmup Train [10][930/3239]	Time 0.391 (0.521)	Data 0.001 (0.019)	Loss 5.5344 (5.3884)	Top-1 acc 7.422 (8.179)	Top-5 acc 20.703 (21.761)	lr 0.04364
Warmup Train [10][940/3239]	Time 0.550 (0.521)	Data 0.001 (0.019)	Loss 5.4552 (5.3888)	Top-1 acc 7.812 (8.178)	Top-5 acc 21.094 (21.759)	lr 0.04364
Warmup Train [10][950/3239]	Time 0.483 (0.520)	Data 0.001 (0.019)	Loss 5.4592 (5.3888)	Top-1 acc 7.812 (8.182)	Top-5 acc 21.484 (21.764)	lr 0.04363
Warmup Train [10][960/3239]	Time 0.687 (0.520)	Data 0.001 (0.019)	Loss 5.2756 (5.3883)	Top-1 acc 7.812 (8.187)	Top-5 acc 22.656 (21.774)	lr 0.04363
Warmup Train [10][970/3239]	Time 0.437 (0.520)	Data 0.001 (0.019)	Loss 5.2267 (5.3877)	Top-1 acc 7.422 (8.192)	Top-5 acc 21.484 (21.774)	lr 0.04362
Warmup Train [10][980/3239]	Time 0.495 (0.520)	Data 0.002 (0.019)	Loss 5.3336 (5.3873)	Top-1 acc 11.719 (8.198)	Top-5 acc 22.266 (21.781)	lr 0.04362
Warmup Train [10][990/3239]	Time 0.513 (0.520)	Data 0.001 (0.018)	Loss 5.3805 (5.3870)	Top-1 acc 6.641 (8.204)	Top-5 acc 21.875 (21.785)	lr 0.04362
Warmup Train [10][1000/3239]	Time 0.368 (0.520)	Data 0.001 (0.018)	Loss 5.3810 (5.3867)	Top-1 acc 10.547 (8.216)	Top-5 acc 23.047 (21.809)	lr 0.04361
Warmup Train [10][1010/3239]	Time 0.545 (0.520)	Data 0.001 (0.018)	Loss 5.4007 (5.3863)	Top-1 acc 11.719 (8.228)	Top-5 acc 26.562 (21.826)	lr 0.04361
Warmup Train [10][1020/3239]	Time 0.539 (0.521)	Data 0.001 (0.018)	Loss 5.4708 (5.3857)	Top-1 acc 6.641 (8.227)	Top-5 acc 20.703 (21.840)	lr 0.04360
Warmup Train [10][1030/3239]	Time 0.541 (0.520)	Data 0.001 (0.018)	Loss 5.2734 (5.3854)	Top-1 acc 10.938 (8.238)	Top-5 acc 25.781 (21.847)	lr 0.04360
Warmup Train [10][1040/3239]	Time 0.445 (0.520)	Data 0.001 (0.018)	Loss 5.3494 (5.3851)	Top-1 acc 8.594 (8.243)	Top-5 acc 21.094 (21.858)	lr 0.04359
Warmup Train [10][1050/3239]	Time 0.331 (0.520)	Data 0.001 (0.018)	Loss 5.4577 (5.3850)	Top-1 acc 7.422 (8.245)	Top-5 acc 21.094 (21.863)	lr 0.04359
Warmup Train [10][1060/3239]	Time 0.725 (0.520)	Data 0.001 (0.018)	Loss 5.3529 (5.3845)	Top-1 acc 7.422 (8.258)	Top-5 acc 22.266 (21.879)	lr 0.04359
Warmup Train [10][1070/3239]	Time 0.514 (0.520)	Data 0.001 (0.018)	Loss 5.4450 (5.3845)	Top-1 acc 6.250 (8.258)	Top-5 acc 20.703 (21.879)	lr 0.04358
Warmup Train [10][1080/3239]	Time 0.499 (0.520)	Data 0.001 (0.017)	Loss 5.4792 (5.3841)	Top-1 acc 7.812 (8.261)	Top-5 acc 18.359 (21.893)	lr 0.04358
Warmup Train [10][1090/3239]	Time 0.696 (0.520)	Data 0.001 (0.017)	Loss 5.4263 (5.3840)	Top-1 acc 5.859 (8.263)	Top-5 acc 20.703 (21.901)	lr 0.04357
Warmup Train [10][1100/3239]	Time 0.563 (0.520)	Data 0.001 (0.017)	Loss 5.3653 (5.3839)	Top-1 acc 10.156 (8.267)	Top-5 acc 27.344 (21.915)	lr 0.04357
Warmup Train [10][1110/3239]	Time 0.601 (0.520)	Data 0.001 (0.017)	Loss 5.3951 (5.3836)	Top-1 acc 7.031 (8.269)	Top-5 acc 23.047 (21.923)	lr 0.04357
Warmup Train [10][1120/3239]	Time 0.691 (0.520)	Data 0.001 (0.017)	Loss 5.3633 (5.3834)	Top-1 acc 5.859 (8.268)	Top-5 acc 19.922 (21.927)	lr 0.04356
Warmup Train [10][1130/3239]	Time 0.339 (0.520)	Data 0.001 (0.017)	Loss 5.3390 (5.3833)	Top-1 acc 7.422 (8.275)	Top-5 acc 21.484 (21.943)	lr 0.04356
Warmup Train [10][1140/3239]	Time 0.441 (0.520)	Data 0.001 (0.017)	Loss 5.2803 (5.3832)	Top-1 acc 10.938 (8.276)	Top-5 acc 26.953 (21.951)	lr 0.04355
Warmup Train [10][1150/3239]	Time 0.477 (0.519)	Data 0.001 (0.017)	Loss 5.3172 (5.3831)	Top-1 acc 7.422 (8.279)	Top-5 acc 19.531 (21.956)	lr 0.04355
Warmup Train [10][1160/3239]	Time 0.639 (0.520)	Data 0.001 (0.017)	Loss 5.3000 (5.3827)	Top-1 acc 10.156 (8.281)	Top-5 acc 22.266 (21.956)	lr 0.04355
Warmup Train [10][1170/3239]	Time 0.373 (0.519)	Data 0.002 (0.017)	Loss 5.4733 (5.3826)	Top-1 acc 6.641 (8.282)	Top-5 acc 18.359 (21.958)	lr 0.04354
Warmup Train [10][1180/3239]	Time 0.437 (0.519)	Data 0.001 (0.017)	Loss 5.3672 (5.3830)	Top-1 acc 6.641 (8.280)	Top-5 acc 18.359 (21.951)	lr 0.04354
Warmup Train [10][1190/3239]	Time 0.563 (0.519)	Data 0.001 (0.017)	Loss 5.4137 (5.3828)	Top-1 acc 8.984 (8.285)	Top-5 acc 19.922 (21.962)	lr 0.04353
Warmup Train [10][1200/3239]	Time 0.565 (0.519)	Data 0.001 (0.016)	Loss 5.3119 (5.3827)	Top-1 acc 10.547 (8.297)	Top-5 acc 26.172 (21.970)	lr 0.04353
Warmup Train [10][1210/3239]	Time 0.515 (0.519)	Data 0.001 (0.016)	Loss 5.3030 (5.3823)	Top-1 acc 10.938 (8.307)	Top-5 acc 23.828 (21.983)	lr 0.04353
Warmup Train [10][1220/3239]	Time 0.472 (0.519)	Data 0.001 (0.016)	Loss 5.3939 (5.3820)	Top-1 acc 8.594 (8.305)	Top-5 acc 22.266 (21.986)	lr 0.04352
Warmup Train [10][1230/3239]	Time 0.560 (0.519)	Data 0.001 (0.016)	Loss 5.4613 (5.3818)	Top-1 acc 7.812 (8.310)	Top-5 acc 22.656 (21.991)	lr 0.04352
Warmup Train [10][1240/3239]	Time 0.664 (0.518)	Data 0.001 (0.016)	Loss 5.3777 (5.3815)	Top-1 acc 7.812 (8.313)	Top-5 acc 22.266 (22.000)	lr 0.04351
Warmup Train [10][1250/3239]	Time 0.438 (0.518)	Data 0.001 (0.016)	Loss 5.3475 (5.3810)	Top-1 acc 9.375 (8.320)	Top-5 acc 22.656 (22.014)	lr 0.04351
Warmup Train [10][1260/3239]	Time 0.753 (0.518)	Data 0.001 (0.016)	Loss 5.3847 (5.3806)	Top-1 acc 8.984 (8.322)	Top-5 acc 22.266 (22.019)	lr 0.04351
Warmup Train [10][1270/3239]	Time 0.681 (0.518)	Data 0.001 (0.016)	Loss 5.3925 (5.3809)	Top-1 acc 8.203 (8.319)	Top-5 acc 19.531 (22.013)	lr 0.04350
Warmup Train [10][1280/3239]	Time 0.592 (0.518)	Data 0.001 (0.016)	Loss 5.3056 (5.3806)	Top-1 acc 10.156 (8.324)	Top-5 acc 26.172 (22.027)	lr 0.04350
Warmup Train [10][1290/3239]	Time 0.609 (0.518)	Data 0.001 (0.016)	Loss 5.2450 (5.3806)	Top-1 acc 11.719 (8.324)	Top-5 acc 26.562 (22.031)	lr 0.04349
Warmup Train [10][1300/3239]	Time 0.468 (0.518)	Data 0.001 (0.016)	Loss 5.4061 (5.3804)	Top-1 acc 8.203 (8.329)	Top-5 acc 22.266 (22.038)	lr 0.04349
Warmup Train [10][1310/3239]	Time 0.513 (0.518)	Data 0.001 (0.015)	Loss 5.4398 (5.3803)	Top-1 acc 6.250 (8.329)	Top-5 acc 18.750 (22.033)	lr 0.04349
Warmup Train [10][1320/3239]	Time 0.508 (0.518)	Data 0.001 (0.015)	Loss 5.4540 (5.3802)	Top-1 acc 7.812 (8.332)	Top-5 acc 22.266 (22.049)	lr 0.04348
Warmup Train [10][1330/3239]	Time 0.570 (0.518)	Data 0.001 (0.015)	Loss 5.3456 (5.3805)	Top-1 acc 6.250 (8.322)	Top-5 acc 20.703 (22.045)	lr 0.04348
Warmup Train [10][1340/3239]	Time 0.575 (0.518)	Data 0.001 (0.015)	Loss 5.3021 (5.3803)	Top-1 acc 10.547 (8.323)	Top-5 acc 25.000 (22.055)	lr 0.04347
Warmup Train [10][1350/3239]	Time 0.386 (0.518)	Data 0.001 (0.015)	Loss 5.3866 (5.3801)	Top-1 acc 6.641 (8.320)	Top-5 acc 21.875 (22.059)	lr 0.04347
Warmup Train [10][1360/3239]	Time 0.574 (0.518)	Data 0.001 (0.015)	Loss 5.3969 (5.3800)	Top-1 acc 8.594 (8.320)	Top-5 acc 23.047 (22.059)	lr 0.04346
Warmup Train [10][1370/3239]	Time 0.449 (0.518)	Data 0.001 (0.015)	Loss 5.2932 (5.3800)	Top-1 acc 10.938 (8.322)	Top-5 acc 25.391 (22.064)	lr 0.04346
Warmup Train [10][1380/3239]	Time 0.523 (0.517)	Data 0.001 (0.015)	Loss 5.2291 (5.3798)	Top-1 acc 11.328 (8.328)	Top-5 acc 24.609 (22.068)	lr 0.04346
Warmup Train [10][1390/3239]	Time 0.601 (0.518)	Data 0.001 (0.015)	Loss 5.4253 (5.3795)	Top-1 acc 6.641 (8.331)	Top-5 acc 22.266 (22.077)	lr 0.04345
Warmup Train [10][1400/3239]	Time 0.441 (0.517)	Data 0.001 (0.015)	Loss 5.4961 (5.3795)	Top-1 acc 8.594 (8.334)	Top-5 acc 20.312 (22.080)	lr 0.04345
Warmup Train [10][1410/3239]	Time 0.511 (0.517)	Data 0.001 (0.015)	Loss 5.2378 (5.3794)	Top-1 acc 11.719 (8.339)	Top-5 acc 25.000 (22.082)	lr 0.04344
Warmup Train [10][1420/3239]	Time 0.506 (0.517)	Data 0.001 (0.015)	Loss 5.3689 (5.3792)	Top-1 acc 8.203 (8.339)	Top-5 acc 20.312 (22.080)	lr 0.04344
Warmup Train [10][1430/3239]	Time 0.546 (0.517)	Data 0.001 (0.015)	Loss 5.3316 (5.3798)	Top-1 acc 12.109 (8.339)	Top-5 acc 24.609 (22.070)	lr 0.04344
Warmup Train [10][1440/3239]	Time 0.465 (0.516)	Data 0.001 (0.015)	Loss 5.2885 (5.3796)	Top-1 acc 10.156 (8.336)	Top-5 acc 24.609 (22.078)	lr 0.04343
Warmup Train [10][1450/3239]	Time 0.334 (0.516)	Data 0.001 (0.015)	Loss 5.4827 (5.3796)	Top-1 acc 7.031 (8.336)	Top-5 acc 21.094 (22.073)	lr 0.04343
Warmup Train [10][1460/3239]	Time 0.532 (0.517)	Data 0.001 (0.015)	Loss 5.5533 (5.3795)	Top-1 acc 6.641 (8.340)	Top-5 acc 17.578 (22.081)	lr 0.04342
Warmup Train [10][1470/3239]	Time 0.482 (0.517)	Data 0.001 (0.014)	Loss 5.4486 (5.3794)	Top-1 acc 7.031 (8.345)	Top-5 acc 18.359 (22.080)	lr 0.04342
Warmup Train [10][1480/3239]	Time 0.751 (0.517)	Data 0.001 (0.014)	Loss 5.3648 (5.3793)	Top-1 acc 9.766 (8.345)	Top-5 acc 21.875 (22.080)	lr 0.04342
Warmup Train [10][1490/3239]	Time 0.430 (0.517)	Data 0.001 (0.014)	Loss 5.3227 (5.3792)	Top-1 acc 9.375 (8.346)	Top-5 acc 20.703 (22.070)	lr 0.04341
Warmup Train [10][1500/3239]	Time 0.487 (0.517)	Data 0.001 (0.014)	Loss 5.3801 (5.3791)	Top-1 acc 9.766 (8.346)	Top-5 acc 24.609 (22.075)	lr 0.04341
Warmup Train [10][1510/3239]	Time 0.586 (0.516)	Data 0.001 (0.014)	Loss 5.3003 (5.3792)	Top-1 acc 11.328 (8.346)	Top-5 acc 23.438 (22.070)	lr 0.04340
Warmup Train [10][1520/3239]	Time 0.447 (0.516)	Data 0.001 (0.014)	Loss 5.2743 (5.3787)	Top-1 acc 9.375 (8.348)	Top-5 acc 23.438 (22.073)	lr 0.04340
Warmup Train [10][1530/3239]	Time 0.318 (0.516)	Data 0.001 (0.014)	Loss 5.3052 (5.3786)	Top-1 acc 11.719 (8.358)	Top-5 acc 27.734 (22.078)	lr 0.04340
Warmup Train [10][1540/3239]	Time 0.407 (0.516)	Data 0.001 (0.014)	Loss 5.1827 (5.3783)	Top-1 acc 10.547 (8.362)	Top-5 acc 25.781 (22.086)	lr 0.04339
Warmup Train [10][1550/3239]	Time 0.373 (0.516)	Data 0.001 (0.014)	Loss 5.3830 (5.3784)	Top-1 acc 8.594 (8.362)	Top-5 acc 22.266 (22.084)	lr 0.04339
Warmup Train [10][1560/3239]	Time 0.485 (0.516)	Data 0.001 (0.014)	Loss 5.3556 (5.3780)	Top-1 acc 9.766 (8.366)	Top-5 acc 24.609 (22.087)	lr 0.04338
Warmup Train [10][1570/3239]	Time 0.429 (0.516)	Data 0.001 (0.014)	Loss 5.2062 (5.3776)	Top-1 acc 10.938 (8.371)	Top-5 acc 29.297 (22.097)	lr 0.04338
Warmup Train [10][1580/3239]	Time 0.688 (0.516)	Data 0.001 (0.014)	Loss 5.3788 (5.3775)	Top-1 acc 7.812 (8.373)	Top-5 acc 21.875 (22.104)	lr 0.04337
Warmup Train [10][1590/3239]	Time 0.477 (0.516)	Data 0.001 (0.014)	Loss 5.4117 (5.3774)	Top-1 acc 6.250 (8.369)	Top-5 acc 17.578 (22.102)	lr 0.04337
Warmup Train [10][1600/3239]	Time 0.603 (0.516)	Data 0.001 (0.014)	Loss 5.3713 (5.3770)	Top-1 acc 7.422 (8.371)	Top-5 acc 24.219 (22.111)	lr 0.04337
Warmup Train [10][1610/3239]	Time 0.535 (0.516)	Data 0.001 (0.014)	Loss 5.3950 (5.3767)	Top-1 acc 10.547 (8.375)	Top-5 acc 25.391 (22.115)	lr 0.04336
Warmup Train [10][1620/3239]	Time 0.474 (0.516)	Data 0.001 (0.014)	Loss 5.4087 (5.3764)	Top-1 acc 8.203 (8.374)	Top-5 acc 23.828 (22.124)	lr 0.04336
Warmup Train [10][1630/3239]	Time 0.550 (0.516)	Data 0.001 (0.014)	Loss 5.4373 (5.3762)	Top-1 acc 9.766 (8.379)	Top-5 acc 21.875 (22.133)	lr 0.04335
Warmup Train [10][1640/3239]	Time 0.519 (0.516)	Data 0.001 (0.014)	Loss 5.2697 (5.3763)	Top-1 acc 10.547 (8.376)	Top-5 acc 25.000 (22.129)	lr 0.04335
Warmup Train [10][1650/3239]	Time 0.516 (0.516)	Data 0.025 (0.014)	Loss 5.3387 (5.3760)	Top-1 acc 9.375 (8.381)	Top-5 acc 22.266 (22.134)	lr 0.04335
Warmup Train [10][1660/3239]	Time 0.324 (0.516)	Data 0.001 (0.014)	Loss 5.3722 (5.3761)	Top-1 acc 7.422 (8.378)	Top-5 acc 23.438 (22.128)	lr 0.04334
Warmup Train [10][1670/3239]	Time 0.527 (0.516)	Data 0.001 (0.014)	Loss 5.2476 (5.3761)	Top-1 acc 11.328 (8.379)	Top-5 acc 26.172 (22.130)	lr 0.04334
Warmup Train [10][1680/3239]	Time 0.644 (0.516)	Data 0.001 (0.014)	Loss 5.2604 (5.3759)	Top-1 acc 10.156 (8.380)	Top-5 acc 23.438 (22.134)	lr 0.04333
Warmup Train [10][1690/3239]	Time 0.528 (0.516)	Data 0.001 (0.014)	Loss 5.4343 (5.3759)	Top-1 acc 6.641 (8.379)	Top-5 acc 21.484 (22.132)	lr 0.04333
Warmup Train [10][1700/3239]	Time 0.356 (0.516)	Data 0.001 (0.014)	Loss 5.4431 (5.3759)	Top-1 acc 5.469 (8.378)	Top-5 acc 20.312 (22.134)	lr 0.04333
Warmup Train [10][1710/3239]	Time 0.632 (0.516)	Data 0.001 (0.014)	Loss 5.3042 (5.3757)	Top-1 acc 9.766 (8.384)	Top-5 acc 27.344 (22.146)	lr 0.04332
Warmup Train [10][1720/3239]	Time 0.585 (0.516)	Data 0.001 (0.013)	Loss 5.2522 (5.3754)	Top-1 acc 9.766 (8.387)	Top-5 acc 25.391 (22.154)	lr 0.04332
Warmup Train [10][1730/3239]	Time 0.643 (0.516)	Data 0.001 (0.013)	Loss 5.2649 (5.3753)	Top-1 acc 7.812 (8.388)	Top-5 acc 25.781 (22.156)	lr 0.04331
Warmup Train [10][1740/3239]	Time 0.427 (0.516)	Data 0.001 (0.013)	Loss 5.4004 (5.3751)	Top-1 acc 7.422 (8.392)	Top-5 acc 19.922 (22.157)	lr 0.04331
Warmup Train [10][1750/3239]	Time 0.554 (0.516)	Data 0.001 (0.013)	Loss 5.4352 (5.3750)	Top-1 acc 8.203 (8.395)	Top-5 acc 21.484 (22.161)	lr 0.04330
Warmup Train [10][1760/3239]	Time 0.573 (0.516)	Data 0.001 (0.013)	Loss 5.3484 (5.3749)	Top-1 acc 10.547 (8.401)	Top-5 acc 21.875 (22.166)	lr 0.04330
Warmup Train [10][1770/3239]	Time 0.421 (0.516)	Data 0.001 (0.013)	Loss 5.5314 (5.3749)	Top-1 acc 6.641 (8.405)	Top-5 acc 22.266 (22.177)	lr 0.04330
Warmup Train [10][1780/3239]	Time 0.355 (0.516)	Data 0.001 (0.013)	Loss 5.4349 (5.3749)	Top-1 acc 6.250 (8.408)	Top-5 acc 22.266 (22.175)	lr 0.04329
Warmup Train [10][1790/3239]	Time 0.644 (0.516)	Data 0.001 (0.013)	Loss 5.2250 (5.3746)	Top-1 acc 8.203 (8.413)	Top-5 acc 26.953 (22.186)	lr 0.04329
Warmup Train [10][1800/3239]	Time 0.594 (0.516)	Data 0.001 (0.013)	Loss 5.4262 (5.3747)	Top-1 acc 6.641 (8.414)	Top-5 acc 19.922 (22.185)	lr 0.04328
Warmup Train [10][1810/3239]	Time 0.612 (0.516)	Data 0.001 (0.013)	Loss 5.3623 (5.3747)	Top-1 acc 8.594 (8.410)	Top-5 acc 19.531 (22.184)	lr 0.04328
Warmup Train [10][1820/3239]	Time 0.379 (0.516)	Data 0.001 (0.013)	Loss 5.2936 (5.3746)	Top-1 acc 10.547 (8.411)	Top-5 acc 24.219 (22.181)	lr 0.04328
Warmup Train [10][1830/3239]	Time 0.462 (0.516)	Data 0.001 (0.013)	Loss 5.4424 (5.3747)	Top-1 acc 6.250 (8.409)	Top-5 acc 19.141 (22.180)	lr 0.04327
Warmup Train [10][1840/3239]	Time 0.677 (0.516)	Data 0.001 (0.013)	Loss 5.5824 (5.3748)	Top-1 acc 8.984 (8.409)	Top-5 acc 17.969 (22.179)	lr 0.04327
Warmup Train [10][1850/3239]	Time 0.538 (0.516)	Data 0.001 (0.013)	Loss 5.5471 (5.3745)	Top-1 acc 8.594 (8.414)	Top-5 acc 21.875 (22.186)	lr 0.04326
Warmup Train [10][1860/3239]	Time 0.443 (0.516)	Data 0.001 (0.013)	Loss 5.4979 (5.3743)	Top-1 acc 7.812 (8.417)	Top-5 acc 19.141 (22.194)	lr 0.04326
Warmup Train [10][1870/3239]	Time 0.665 (0.516)	Data 0.001 (0.013)	Loss 5.4325 (5.3746)	Top-1 acc 7.031 (8.411)	Top-5 acc 18.359 (22.190)	lr 0.04325
Warmup Train [10][1880/3239]	Time 0.401 (0.516)	Data 0.001 (0.013)	Loss 5.3736 (5.3744)	Top-1 acc 5.469 (8.415)	Top-5 acc 21.484 (22.198)	lr 0.04325
Warmup Train [10][1890/3239]	Time 0.383 (0.515)	Data 0.001 (0.013)	Loss 5.4876 (5.3745)	Top-1 acc 7.812 (8.415)	Top-5 acc 19.531 (22.197)	lr 0.04325
Warmup Train [10][1900/3239]	Time 0.558 (0.516)	Data 0.001 (0.013)	Loss 5.3167 (5.3744)	Top-1 acc 10.156 (8.416)	Top-5 acc 22.656 (22.196)	lr 0.04324
Warmup Train [10][1910/3239]	Time 0.635 (0.516)	Data 0.001 (0.013)	Loss 5.1842 (5.3738)	Top-1 acc 10.547 (8.421)	Top-5 acc 25.391 (22.210)	lr 0.04324
Warmup Train [10][1920/3239]	Time 0.554 (0.516)	Data 0.001 (0.013)	Loss 5.1096 (5.3734)	Top-1 acc 10.156 (8.427)	Top-5 acc 29.688 (22.222)	lr 0.04323
Warmup Train [10][1930/3239]	Time 0.487 (0.515)	Data 0.001 (0.013)	Loss 5.2415 (5.3733)	Top-1 acc 6.250 (8.424)	Top-5 acc 22.656 (22.224)	lr 0.04323
Warmup Train [10][1940/3239]	Time 0.635 (0.515)	Data 0.001 (0.013)	Loss 5.2454 (5.3732)	Top-1 acc 10.547 (8.427)	Top-5 acc 27.344 (22.231)	lr 0.04323
Warmup Train [10][1950/3239]	Time 0.347 (0.515)	Data 0.001 (0.013)	Loss 5.3107 (5.3728)	Top-1 acc 10.938 (8.431)	Top-5 acc 26.172 (22.241)	lr 0.04322
Warmup Train [10][1960/3239]	Time 0.565 (0.515)	Data 0.001 (0.013)	Loss 5.3305 (5.3727)	Top-1 acc 10.547 (8.434)	Top-5 acc 23.438 (22.247)	lr 0.04322
Warmup Train [10][1970/3239]	Time 0.494 (0.515)	Data 0.001 (0.013)	Loss 5.2993 (5.3726)	Top-1 acc 10.547 (8.435)	Top-5 acc 23.828 (22.249)	lr 0.04321
Warmup Train [10][1980/3239]	Time 0.510 (0.515)	Data 0.001 (0.013)	Loss 5.3080 (5.3725)	Top-1 acc 10.156 (8.436)	Top-5 acc 23.828 (22.253)	lr 0.04321
Warmup Train [10][1990/3239]	Time 0.447 (0.515)	Data 0.001 (0.012)	Loss 5.3409 (5.3725)	Top-1 acc 7.422 (8.438)	Top-5 acc 20.312 (22.247)	lr 0.04321
Warmup Train [10][2000/3239]	Time 0.451 (0.515)	Data 0.001 (0.012)	Loss 5.3507 (5.3722)	Top-1 acc 7.031 (8.440)	Top-5 acc 25.391 (22.258)	lr 0.04320
Warmup Train [10][2010/3239]	Time 0.526 (0.515)	Data 0.001 (0.012)	Loss 5.2361 (5.3721)	Top-1 acc 12.109 (8.445)	Top-5 acc 27.734 (22.265)	lr 0.04320
Warmup Train [10][2020/3239]	Time 0.384 (0.515)	Data 0.001 (0.012)	Loss 5.5836 (5.3721)	Top-1 acc 7.422 (8.444)	Top-5 acc 14.844 (22.259)	lr 0.04319
Warmup Train [10][2030/3239]	Time 0.440 (0.515)	Data 0.001 (0.012)	Loss 5.3295 (5.3718)	Top-1 acc 10.938 (8.448)	Top-5 acc 24.219 (22.262)	lr 0.04319
Warmup Train [10][2040/3239]	Time 0.540 (0.515)	Data 0.001 (0.012)	Loss 5.2583 (5.3718)	Top-1 acc 9.766 (8.450)	Top-5 acc 21.484 (22.262)	lr 0.04318
Warmup Train [10][2050/3239]	Time 0.569 (0.515)	Data 0.001 (0.012)	Loss 5.3080 (5.3717)	Top-1 acc 8.203 (8.453)	Top-5 acc 25.000 (22.266)	lr 0.04318
Warmup Train [10][2060/3239]	Time 0.342 (0.515)	Data 0.001 (0.012)	Loss 5.2549 (5.3716)	Top-1 acc 11.719 (8.454)	Top-5 acc 28.906 (22.268)	lr 0.04318
Warmup Train [10][2070/3239]	Time 0.502 (0.515)	Data 0.001 (0.012)	Loss 5.3210 (5.3712)	Top-1 acc 8.203 (8.455)	Top-5 acc 24.609 (22.271)	lr 0.04317
Warmup Train [10][2080/3239]	Time 0.379 (0.515)	Data 0.001 (0.012)	Loss 5.3926 (5.3714)	Top-1 acc 6.641 (8.454)	Top-5 acc 22.266 (22.269)	lr 0.04317
Warmup Train [10][2090/3239]	Time 0.470 (0.515)	Data 0.001 (0.012)	Loss 5.2932 (5.3711)	Top-1 acc 9.375 (8.456)	Top-5 acc 25.781 (22.275)	lr 0.04316
Warmup Train [10][2100/3239]	Time 0.594 (0.515)	Data 0.001 (0.012)	Loss 5.4308 (5.3713)	Top-1 acc 6.250 (8.455)	Top-5 acc 23.828 (22.276)	lr 0.04316
Warmup Train [10][2110/3239]	Time 0.761 (0.515)	Data 0.001 (0.012)	Loss 5.3769 (5.3711)	Top-1 acc 8.594 (8.459)	Top-5 acc 19.922 (22.282)	lr 0.04316
Warmup Train [10][2120/3239]	Time 0.561 (0.515)	Data 0.001 (0.012)	Loss 5.3755 (5.3710)	Top-1 acc 9.375 (8.464)	Top-5 acc 20.703 (22.287)	lr 0.04315
Warmup Train [10][2130/3239]	Time 0.521 (0.515)	Data 0.001 (0.012)	Loss 5.2037 (5.3707)	Top-1 acc 10.156 (8.468)	Top-5 acc 21.875 (22.293)	lr 0.04315
Warmup Train [10][2140/3239]	Time 0.562 (0.515)	Data 0.001 (0.012)	Loss 5.2438 (5.3705)	Top-1 acc 8.203 (8.470)	Top-5 acc 26.953 (22.305)	lr 0.04314
Warmup Train [10][2150/3239]	Time 0.511 (0.515)	Data 0.001 (0.012)	Loss 5.1275 (5.3701)	Top-1 acc 13.281 (8.477)	Top-5 acc 28.516 (22.314)	lr 0.04314
Warmup Train [10][2160/3239]	Time 0.368 (0.515)	Data 0.001 (0.012)	Loss 5.3370 (5.3699)	Top-1 acc 8.594 (8.480)	Top-5 acc 23.828 (22.318)	lr 0.04313
Warmup Train [10][2170/3239]	Time 0.346 (0.515)	Data 0.001 (0.012)	Loss 5.2995 (5.3697)	Top-1 acc 9.375 (8.482)	Top-5 acc 23.047 (22.320)	lr 0.04313
Warmup Train [10][2180/3239]	Time 0.517 (0.515)	Data 0.001 (0.012)	Loss 5.3861 (5.3692)	Top-1 acc 7.422 (8.487)	Top-5 acc 22.266 (22.332)	lr 0.04313
Warmup Train [10][2190/3239]	Time 0.463 (0.515)	Data 0.001 (0.012)	Loss 5.2987 (5.3688)	Top-1 acc 8.203 (8.493)	Top-5 acc 24.219 (22.340)	lr 0.04312
Warmup Train [10][2200/3239]	Time 0.585 (0.515)	Data 0.001 (0.012)	Loss 5.4564 (5.3687)	Top-1 acc 7.031 (8.495)	Top-5 acc 19.922 (22.344)	lr 0.04312
Warmup Train [10][2210/3239]	Time 0.615 (0.515)	Data 0.001 (0.012)	Loss 5.3506 (5.3685)	Top-1 acc 7.422 (8.497)	Top-5 acc 21.875 (22.351)	lr 0.04311
Warmup Train [10][2220/3239]	Time 0.676 (0.515)	Data 0.001 (0.012)	Loss 5.2782 (5.3684)	Top-1 acc 12.109 (8.497)	Top-5 acc 23.828 (22.350)	lr 0.04311
Warmup Train [10][2230/3239]	Time 0.506 (0.514)	Data 0.001 (0.012)	Loss 5.4084 (5.3684)	Top-1 acc 7.812 (8.496)	Top-5 acc 21.094 (22.348)	lr 0.04311
Warmup Train [10][2240/3239]	Time 0.525 (0.514)	Data 0.001 (0.012)	Loss 5.3954 (5.3683)	Top-1 acc 10.156 (8.497)	Top-5 acc 23.047 (22.352)	lr 0.04310
Warmup Train [10][2250/3239]	Time 0.508 (0.514)	Data 0.001 (0.012)	Loss 5.2378 (5.3680)	Top-1 acc 9.375 (8.497)	Top-5 acc 28.516 (22.357)	lr 0.04310
Warmup Train [10][2260/3239]	Time 0.391 (0.514)	Data 0.001 (0.012)	Loss 5.3431 (5.3679)	Top-1 acc 6.250 (8.495)	Top-5 acc 19.531 (22.354)	lr 0.04309
Warmup Train [10][2270/3239]	Time 0.522 (0.514)	Data 0.001 (0.012)	Loss 5.2282 (5.3677)	Top-1 acc 10.547 (8.497)	Top-5 acc 24.609 (22.358)	lr 0.04309
Warmup Train [10][2280/3239]	Time 0.364 (0.514)	Data 0.001 (0.012)	Loss 5.2157 (5.3676)	Top-1 acc 10.547 (8.501)	Top-5 acc 27.344 (22.360)	lr 0.04308
Warmup Train [10][2290/3239]	Time 0.387 (0.514)	Data 0.001 (0.012)	Loss 5.3691 (5.3677)	Top-1 acc 5.469 (8.500)	Top-5 acc 23.047 (22.360)	lr 0.04308
Warmup Train [10][2300/3239]	Time 0.592 (0.514)	Data 0.001 (0.012)	Loss 5.3157 (5.3677)	Top-1 acc 12.109 (8.501)	Top-5 acc 24.219 (22.363)	lr 0.04308
Warmup Train [10][2310/3239]	Time 0.623 (0.514)	Data 0.001 (0.012)	Loss 5.3214 (5.3676)	Top-1 acc 11.719 (8.505)	Top-5 acc 25.391 (22.365)	lr 0.04307
Warmup Train [10][2320/3239]	Time 0.507 (0.514)	Data 0.001 (0.012)	Loss 5.3744 (5.3673)	Top-1 acc 9.375 (8.507)	Top-5 acc 24.609 (22.371)	lr 0.04307
Warmup Train [10][2330/3239]	Time 0.454 (0.514)	Data 0.001 (0.012)	Loss 5.4444 (5.3672)	Top-1 acc 6.641 (8.507)	Top-5 acc 20.312 (22.377)	lr 0.04306
Warmup Train [10][2340/3239]	Time 0.501 (0.515)	Data 0.001 (0.012)	Loss 5.3884 (5.3670)	Top-1 acc 7.422 (8.509)	Top-5 acc 18.750 (22.382)	lr 0.04306
Warmup Train [10][2350/3239]	Time 0.432 (0.514)	Data 0.002 (0.012)	Loss 5.2438 (5.3669)	Top-1 acc 12.891 (8.513)	Top-5 acc 28.516 (22.389)	lr 0.04305
Warmup Train [10][2360/3239]	Time 0.458 (0.515)	Data 0.001 (0.012)	Loss 5.3024 (5.3666)	Top-1 acc 7.031 (8.515)	Top-5 acc 20.703 (22.393)	lr 0.04305
Warmup Train [10][2370/3239]	Time 0.663 (0.514)	Data 0.001 (0.012)	Loss 5.3302 (5.3664)	Top-1 acc 8.984 (8.517)	Top-5 acc 18.750 (22.397)	lr 0.04305
Warmup Train [10][2380/3239]	Time 0.501 (0.514)	Data 0.001 (0.012)	Loss 5.3693 (5.3662)	Top-1 acc 8.984 (8.517)	Top-5 acc 20.312 (22.405)	lr 0.04304
Warmup Train [10][2390/3239]	Time 0.518 (0.514)	Data 0.001 (0.011)	Loss 5.4240 (5.3662)	Top-1 acc 7.422 (8.517)	Top-5 acc 20.312 (22.410)	lr 0.04304
Warmup Train [10][2400/3239]	Time 0.493 (0.515)	Data 0.001 (0.011)	Loss 5.4127 (5.3662)	Top-1 acc 8.203 (8.515)	Top-5 acc 22.266 (22.408)	lr 0.04303
Warmup Train [10][2410/3239]	Time 0.627 (0.515)	Data 0.001 (0.011)	Loss 5.2681 (5.3661)	Top-1 acc 10.156 (8.517)	Top-5 acc 24.609 (22.405)	lr 0.04303
Warmup Train [10][2420/3239]	Time 0.488 (0.515)	Data 0.001 (0.011)	Loss 5.4080 (5.3659)	Top-1 acc 7.812 (8.515)	Top-5 acc 17.578 (22.407)	lr 0.04303
Warmup Train [10][2430/3239]	Time 0.374 (0.514)	Data 0.001 (0.011)	Loss 5.3668 (5.3657)	Top-1 acc 8.594 (8.515)	Top-5 acc 21.094 (22.408)	lr 0.04302
Warmup Train [10][2440/3239]	Time 0.423 (0.515)	Data 0.001 (0.011)	Loss 5.2792 (5.3657)	Top-1 acc 11.328 (8.516)	Top-5 acc 24.609 (22.405)	lr 0.04302
Warmup Train [10][2450/3239]	Time 0.502 (0.515)	Data 0.001 (0.011)	Loss 5.4078 (5.3659)	Top-1 acc 7.422 (8.515)	Top-5 acc 18.359 (22.404)	lr 0.04301
Warmup Train [10][2460/3239]	Time 0.517 (0.514)	Data 0.001 (0.011)	Loss 5.1874 (5.3659)	Top-1 acc 12.109 (8.517)	Top-5 acc 26.953 (22.405)	lr 0.04301
Warmup Train [10][2470/3239]	Time 0.477 (0.514)	Data 0.001 (0.011)	Loss 5.2491 (5.3657)	Top-1 acc 12.109 (8.519)	Top-5 acc 27.344 (22.414)	lr 0.04300
Warmup Train [10][2480/3239]	Time 0.437 (0.514)	Data 0.001 (0.011)	Loss 5.2707 (5.3655)	Top-1 acc 7.812 (8.520)	Top-5 acc 25.000 (22.420)	lr 0.04300
Warmup Train [10][2490/3239]	Time 0.451 (0.514)	Data 0.001 (0.011)	Loss 5.2249 (5.3651)	Top-1 acc 11.328 (8.527)	Top-5 acc 26.562 (22.432)	lr 0.04300
Warmup Train [10][2500/3239]	Time 0.494 (0.514)	Data 0.001 (0.011)	Loss 5.4014 (5.3653)	Top-1 acc 5.469 (8.523)	Top-5 acc 18.359 (22.431)	lr 0.04299
Warmup Train [10][2510/3239]	Time 0.625 (0.514)	Data 0.001 (0.011)	Loss 5.4261 (5.3650)	Top-1 acc 7.422 (8.528)	Top-5 acc 19.141 (22.438)	lr 0.04299
Warmup Train [10][2520/3239]	Time 0.519 (0.514)	Data 0.001 (0.011)	Loss 5.2977 (5.3649)	Top-1 acc 9.766 (8.528)	Top-5 acc 25.000 (22.439)	lr 0.04298
Warmup Train [10][2530/3239]	Time 0.578 (0.514)	Data 0.001 (0.011)	Loss 5.1511 (5.3645)	Top-1 acc 10.156 (8.531)	Top-5 acc 23.828 (22.447)	lr 0.04298
Warmup Train [10][2540/3239]	Time 0.380 (0.514)	Data 0.001 (0.011)	Loss 5.2275 (5.3644)	Top-1 acc 8.984 (8.532)	Top-5 acc 29.297 (22.451)	lr 0.04298
Warmup Train [10][2550/3239]	Time 0.368 (0.514)	Data 0.001 (0.011)	Loss 5.4202 (5.3642)	Top-1 acc 8.594 (8.533)	Top-5 acc 21.094 (22.452)	lr 0.04297
Warmup Train [10][2560/3239]	Time 0.523 (0.514)	Data 0.001 (0.011)	Loss 5.4891 (5.3642)	Top-1 acc 7.031 (8.538)	Top-5 acc 19.141 (22.457)	lr 0.04297
Warmup Train [10][2570/3239]	Time 0.507 (0.514)	Data 0.001 (0.011)	Loss 5.2597 (5.3640)	Top-1 acc 10.547 (8.543)	Top-5 acc 26.172 (22.463)	lr 0.04296
Warmup Train [10][2580/3239]	Time 0.540 (0.514)	Data 0.001 (0.011)	Loss 5.2917 (5.3638)	Top-1 acc 8.203 (8.549)	Top-5 acc 21.094 (22.470)	lr 0.04296
Warmup Train [10][2590/3239]	Time 0.502 (0.514)	Data 0.001 (0.011)	Loss 5.3668 (5.3636)	Top-1 acc 7.031 (8.550)	Top-5 acc 19.922 (22.476)	lr 0.04295
Warmup Train [10][2600/3239]	Time 0.535 (0.514)	Data 0.001 (0.011)	Loss 5.3589 (5.3636)	Top-1 acc 6.250 (8.551)	Top-5 acc 18.359 (22.476)	lr 0.04295
Warmup Train [10][2610/3239]	Time 0.604 (0.514)	Data 0.001 (0.011)	Loss 5.3050 (5.3634)	Top-1 acc 10.938 (8.558)	Top-5 acc 26.562 (22.483)	lr 0.04295
Warmup Train [10][2620/3239]	Time 0.563 (0.514)	Data 0.001 (0.011)	Loss 5.3178 (5.3631)	Top-1 acc 12.109 (8.562)	Top-5 acc 23.828 (22.489)	lr 0.04294
Warmup Train [10][2630/3239]	Time 0.534 (0.514)	Data 0.001 (0.011)	Loss 5.2605 (5.3629)	Top-1 acc 11.719 (8.568)	Top-5 acc 25.391 (22.497)	lr 0.04294
Warmup Train [10][2640/3239]	Time 0.735 (0.514)	Data 0.001 (0.011)	Loss 5.3727 (5.3627)	Top-1 acc 7.812 (8.568)	Top-5 acc 21.875 (22.498)	lr 0.04293
Warmup Train [10][2650/3239]	Time 0.412 (0.514)	Data 0.001 (0.011)	Loss 5.4941 (5.3625)	Top-1 acc 6.641 (8.573)	Top-5 acc 19.531 (22.505)	lr 0.04293
Warmup Train [10][2660/3239]	Time 0.639 (0.514)	Data 0.001 (0.011)	Loss 5.3793 (5.3623)	Top-1 acc 11.719 (8.575)	Top-5 acc 26.172 (22.508)	lr 0.04292
Warmup Train [10][2670/3239]	Time 0.533 (0.514)	Data 0.001 (0.011)	Loss 5.3532 (5.3621)	Top-1 acc 7.422 (8.578)	Top-5 acc 26.562 (22.515)	lr 0.04292
Warmup Train [10][2680/3239]	Time 0.626 (0.514)	Data 0.001 (0.011)	Loss 5.3564 (5.3622)	Top-1 acc 7.812 (8.578)	Top-5 acc 19.922 (22.513)	lr 0.04292
Warmup Train [10][2690/3239]	Time 0.442 (0.514)	Data 0.001 (0.011)	Loss 5.2142 (5.3621)	Top-1 acc 9.766 (8.579)	Top-5 acc 25.000 (22.517)	lr 0.04291
Warmup Train [10][2700/3239]	Time 0.535 (0.514)	Data 0.001 (0.011)	Loss 5.4350 (5.3618)	Top-1 acc 8.984 (8.581)	Top-5 acc 20.703 (22.528)	lr 0.04291
Warmup Train [10][2710/3239]	Time 0.411 (0.514)	Data 0.001 (0.011)	Loss 5.4403 (5.3618)	Top-1 acc 10.156 (8.584)	Top-5 acc 23.438 (22.527)	lr 0.04290
Warmup Train [10][2720/3239]	Time 0.677 (0.514)	Data 0.001 (0.011)	Loss 5.2909 (5.3618)	Top-1 acc 8.594 (8.583)	Top-5 acc 21.484 (22.528)	lr 0.04290
Warmup Train [10][2730/3239]	Time 0.367 (0.514)	Data 0.001 (0.011)	Loss 5.1876 (5.3616)	Top-1 acc 7.422 (8.584)	Top-5 acc 21.875 (22.530)	lr 0.04289
Warmup Train [10][2740/3239]	Time 0.349 (0.514)	Data 0.001 (0.011)	Loss 5.3810 (5.3615)	Top-1 acc 6.250 (8.585)	Top-5 acc 22.656 (22.534)	lr 0.04289
Warmup Train [10][2750/3239]	Time 0.321 (0.514)	Data 0.001 (0.011)	Loss 5.2976 (5.3614)	Top-1 acc 14.062 (8.588)	Top-5 acc 28.906 (22.541)	lr 0.04289
Warmup Train [10][2760/3239]	Time 0.295 (0.514)	Data 0.001 (0.011)	Loss 5.2713 (5.3613)	Top-1 acc 7.031 (8.589)	Top-5 acc 25.000 (22.547)	lr 0.04288
Warmup Train [10][2770/3239]	Time 0.602 (0.514)	Data 0.001 (0.011)	Loss 5.4738 (5.3613)	Top-1 acc 7.031 (8.590)	Top-5 acc 19.531 (22.547)	lr 0.04288
Warmup Train [10][2780/3239]	Time 0.446 (0.514)	Data 0.001 (0.011)	Loss 5.2884 (5.3611)	Top-1 acc 10.156 (8.593)	Top-5 acc 23.828 (22.552)	lr 0.04287
Warmup Train [10][2790/3239]	Time 0.539 (0.514)	Data 0.001 (0.011)	Loss 5.3328 (5.3610)	Top-1 acc 10.547 (8.598)	Top-5 acc 26.172 (22.559)	lr 0.04287
Warmup Train [10][2800/3239]	Time 0.484 (0.514)	Data 0.001 (0.011)	Loss 5.3368 (5.3607)	Top-1 acc 5.078 (8.594)	Top-5 acc 21.875 (22.562)	lr 0.04287
Warmup Train [10][2810/3239]	Time 0.502 (0.514)	Data 0.001 (0.011)	Loss 5.3624 (5.3608)	Top-1 acc 8.203 (8.595)	Top-5 acc 21.875 (22.562)	lr 0.04286
Warmup Train [10][2820/3239]	Time 0.574 (0.514)	Data 0.001 (0.011)	Loss 5.2613 (5.3606)	Top-1 acc 12.500 (8.600)	Top-5 acc 25.391 (22.567)	lr 0.04286
Warmup Train [10][2830/3239]	Time 0.625 (0.514)	Data 0.001 (0.011)	Loss 5.3990 (5.3604)	Top-1 acc 9.375 (8.601)	Top-5 acc 20.703 (22.573)	lr 0.04285
Warmup Train [10][2840/3239]	Time 0.727 (0.514)	Data 0.001 (0.011)	Loss 5.3662 (5.3602)	Top-1 acc 11.328 (8.604)	Top-5 acc 24.609 (22.579)	lr 0.04285
Warmup Train [10][2850/3239]	Time 0.548 (0.514)	Data 0.001 (0.011)	Loss 5.1931 (5.3599)	Top-1 acc 9.375 (8.605)	Top-5 acc 28.125 (22.583)	lr 0.04284
Warmup Train [10][2860/3239]	Time 0.538 (0.514)	Data 0.001 (0.011)	Loss 5.0656 (5.3596)	Top-1 acc 11.328 (8.608)	Top-5 acc 28.516 (22.593)	lr 0.04284
Warmup Train [10][2870/3239]	Time 0.579 (0.514)	Data 0.001 (0.011)	Loss 5.3238 (5.3593)	Top-1 acc 11.719 (8.609)	Top-5 acc 20.703 (22.599)	lr 0.04284
Warmup Train [10][2880/3239]	Time 0.483 (0.514)	Data 0.001 (0.011)	Loss 5.4108 (5.3593)	Top-1 acc 9.766 (8.612)	Top-5 acc 21.094 (22.597)	lr 0.04283
Warmup Train [10][2890/3239]	Time 0.471 (0.514)	Data 0.001 (0.011)	Loss 5.3761 (5.3592)	Top-1 acc 7.812 (8.612)	Top-5 acc 22.656 (22.600)	lr 0.04283
Warmup Train [10][2900/3239]	Time 0.476 (0.514)	Data 0.001 (0.011)	Loss 5.3377 (5.3590)	Top-1 acc 9.375 (8.615)	Top-5 acc 23.438 (22.605)	lr 0.04282
Warmup Train [10][2910/3239]	Time 0.351 (0.514)	Data 0.001 (0.011)	Loss 5.5026 (5.3588)	Top-1 acc 7.422 (8.619)	Top-5 acc 19.922 (22.609)	lr 0.04282
Warmup Train [10][2920/3239]	Time 0.733 (0.514)	Data 0.001 (0.011)	Loss 5.3781 (5.3587)	Top-1 acc 7.812 (8.619)	Top-5 acc 19.922 (22.610)	lr 0.04281
Warmup Train [10][2930/3239]	Time 0.513 (0.514)	Data 0.001 (0.011)	Loss 5.2638 (5.3585)	Top-1 acc 10.547 (8.621)	Top-5 acc 28.125 (22.615)	lr 0.04281
Warmup Train [10][2940/3239]	Time 0.538 (0.514)	Data 0.001 (0.011)	Loss 5.3280 (5.3584)	Top-1 acc 8.203 (8.621)	Top-5 acc 23.047 (22.619)	lr 0.04281
Warmup Train [10][2950/3239]	Time 0.517 (0.514)	Data 0.001 (0.011)	Loss 5.3314 (5.3582)	Top-1 acc 11.328 (8.626)	Top-5 acc 24.219 (22.622)	lr 0.04280
Warmup Train [10][2960/3239]	Time 0.543 (0.514)	Data 0.001 (0.011)	Loss 5.4517 (5.3581)	Top-1 acc 7.031 (8.625)	Top-5 acc 21.484 (22.623)	lr 0.04280
Warmup Train [10][2970/3239]	Time 0.590 (0.514)	Data 0.001 (0.011)	Loss 5.2178 (5.3579)	Top-1 acc 8.203 (8.629)	Top-5 acc 26.953 (22.629)	lr 0.04279
Warmup Train [10][2980/3239]	Time 0.418 (0.514)	Data 0.001 (0.010)	Loss 5.3350 (5.3579)	Top-1 acc 8.984 (8.630)	Top-5 acc 25.781 (22.633)	lr 0.04279
Warmup Train [10][2990/3239]	Time 0.490 (0.514)	Data 0.001 (0.010)	Loss 5.5522 (5.3578)	Top-1 acc 6.250 (8.632)	Top-5 acc 21.875 (22.636)	lr 0.04278
Warmup Train [10][3000/3239]	Time 0.402 (0.514)	Data 0.001 (0.010)	Loss 5.3941 (5.3577)	Top-1 acc 5.859 (8.633)	Top-5 acc 21.875 (22.636)	lr 0.04278
Warmup Train [10][3010/3239]	Time 0.419 (0.514)	Data 0.001 (0.010)	Loss 5.2396 (5.3575)	Top-1 acc 10.156 (8.636)	Top-5 acc 27.734 (22.641)	lr 0.04278
Warmup Train [10][3020/3239]	Time 0.447 (0.514)	Data 0.001 (0.010)	Loss 5.2637 (5.3575)	Top-1 acc 9.375 (8.637)	Top-5 acc 23.828 (22.640)	lr 0.04277
Warmup Train [10][3030/3239]	Time 0.512 (0.514)	Data 0.001 (0.010)	Loss 5.3202 (5.3572)	Top-1 acc 9.766 (8.640)	Top-5 acc 28.125 (22.647)	lr 0.04277
Warmup Train [10][3040/3239]	Time 0.576 (0.514)	Data 0.001 (0.010)	Loss 5.3684 (5.3571)	Top-1 acc 8.984 (8.644)	Top-5 acc 24.219 (22.652)	lr 0.04276
Warmup Train [10][3050/3239]	Time 0.606 (0.514)	Data 0.001 (0.010)	Loss 5.4351 (5.3568)	Top-1 acc 7.031 (8.650)	Top-5 acc 14.453 (22.659)	lr 0.04276
Warmup Train [10][3060/3239]	Time 0.393 (0.514)	Data 0.001 (0.010)	Loss 5.3593 (5.3567)	Top-1 acc 10.547 (8.652)	Top-5 acc 23.828 (22.664)	lr 0.04275
Warmup Train [10][3070/3239]	Time 0.453 (0.514)	Data 0.001 (0.010)	Loss 5.3011 (5.3564)	Top-1 acc 8.203 (8.653)	Top-5 acc 23.047 (22.668)	lr 0.04275
Warmup Train [10][3080/3239]	Time 0.600 (0.514)	Data 0.001 (0.010)	Loss 5.3216 (5.3563)	Top-1 acc 6.250 (8.654)	Top-5 acc 23.047 (22.672)	lr 0.04275
Warmup Train [10][3090/3239]	Time 0.578 (0.514)	Data 0.001 (0.010)	Loss 5.3227 (5.3562)	Top-1 acc 8.203 (8.657)	Top-5 acc 23.828 (22.677)	lr 0.04274
Warmup Train [10][3100/3239]	Time 0.491 (0.514)	Data 0.001 (0.010)	Loss 5.2486 (5.3562)	Top-1 acc 9.766 (8.660)	Top-5 acc 25.000 (22.679)	lr 0.04274
Warmup Train [10][3110/3239]	Time 0.512 (0.514)	Data 0.001 (0.010)	Loss 5.5018 (5.3562)	Top-1 acc 8.203 (8.661)	Top-5 acc 21.094 (22.679)	lr 0.04273
Warmup Train [10][3120/3239]	Time 0.554 (0.514)	Data 0.001 (0.010)	Loss 5.3368 (5.3560)	Top-1 acc 7.031 (8.661)	Top-5 acc 23.047 (22.682)	lr 0.04273
Warmup Train [10][3130/3239]	Time 0.620 (0.514)	Data 0.001 (0.010)	Loss 5.2738 (5.3558)	Top-1 acc 10.938 (8.664)	Top-5 acc 22.266 (22.687)	lr 0.04272
Warmup Train [10][3140/3239]	Time 0.316 (0.514)	Data 0.001 (0.010)	Loss 5.2040 (5.3556)	Top-1 acc 10.938 (8.668)	Top-5 acc 25.391 (22.693)	lr 0.04272
Warmup Train [10][3150/3239]	Time 0.547 (0.514)	Data 0.001 (0.010)	Loss 5.1882 (5.3555)	Top-1 acc 12.109 (8.671)	Top-5 acc 25.000 (22.695)	lr 0.04272
Warmup Train [10][3160/3239]	Time 0.482 (0.514)	Data 0.001 (0.010)	Loss 5.3711 (5.3554)	Top-1 acc 7.812 (8.673)	Top-5 acc 23.047 (22.697)	lr 0.04271
Warmup Train [10][3170/3239]	Time 0.515 (0.514)	Data 0.001 (0.010)	Loss 5.2527 (5.3552)	Top-1 acc 9.766 (8.674)	Top-5 acc 25.391 (22.701)	lr 0.04271
Warmup Train [10][3180/3239]	Time 0.597 (0.514)	Data 0.000 (0.010)	Loss 5.2914 (5.3551)	Top-1 acc 7.031 (8.676)	Top-5 acc 26.562 (22.704)	lr 0.04270
Warmup Train [10][3190/3239]	Time 0.497 (0.514)	Data 0.000 (0.010)	Loss 5.2936 (5.3547)	Top-1 acc 8.203 (8.677)	Top-5 acc 23.047 (22.712)	lr 0.04270
Warmup Train [10][3200/3239]	Time 0.491 (0.514)	Data 0.000 (0.010)	Loss 5.5665 (5.3547)	Top-1 acc 10.156 (8.679)	Top-5 acc 22.656 (22.714)	lr 0.04269
Warmup Train [10][3210/3239]	Time 0.485 (0.514)	Data 0.000 (0.010)	Loss 5.4225 (5.3544)	Top-1 acc 7.422 (8.684)	Top-5 acc 23.047 (22.720)	lr 0.04269
Warmup Train [10][3220/3239]	Time 0.559 (0.514)	Data 0.000 (0.010)	Loss 5.3687 (5.3543)	Top-1 acc 7.031 (8.682)	Top-5 acc 21.094 (22.719)	lr 0.04269
Warmup Train [10][3230/3239]	Time 0.527 (0.514)	Data 0.000 (0.010)	Loss 5.2368 (5.3540)	Top-1 acc 8.594 (8.689)	Top-5 acc 24.219 (22.729)	lr 0.04268
Warmup Train [10][3239/3239]	Time 0.292 (0.514)	Data 0.000 (0.010)	Loss 5.1062 (5.3537)	Top-1 acc 8.642 (8.693)	Top-5 acc 28.395 (22.735)	lr 0.04268
==========Warmup Valid [10/40]	loss 4.614	top-1 acc 12.697	top-5 acc 30.291	Train top-1 8.693	top-5 22.735	flops: 442.4M
Warmup Train [11][0/3239]	Time 12.381 (12.381)	Data 10.434 (10.434)	Loss 5.3065 (5.3065)	Top-1 acc 11.328 (11.328)	Top-5 acc 22.656 (22.656)	lr 0.04268
Warmup Train [11][10/3239]	Time 0.492 (1.661)	Data 0.001 (0.953)	Loss 5.2067 (5.3067)	Top-1 acc 11.328 (9.588)	Top-5 acc 28.516 (23.757)	lr 0.04267
Warmup Train [11][20/3239]	Time 0.474 (1.110)	Data 0.001 (0.502)	Loss 5.2435 (5.3050)	Top-1 acc 10.938 (9.431)	Top-5 acc 23.828 (23.270)	lr 0.04267
Warmup Train [11][30/3239]	Time 0.586 (0.917)	Data 0.002 (0.344)	Loss 5.3170 (5.3139)	Top-1 acc 8.594 (9.413)	Top-5 acc 25.391 (23.400)	lr 0.04266
Warmup Train [11][40/3239]	Time 0.578 (0.819)	Data 0.002 (0.262)	Loss 5.3633 (5.3171)	Top-1 acc 9.766 (9.108)	Top-5 acc 26.953 (23.628)	lr 0.04266
Warmup Train [11][50/3239]	Time 0.613 (0.762)	Data 0.001 (0.211)	Loss 5.2285 (5.3113)	Top-1 acc 8.594 (9.069)	Top-5 acc 25.000 (23.453)	lr 0.04266
Warmup Train [11][60/3239]	Time 0.602 (0.721)	Data 0.001 (0.178)	Loss 5.3855 (5.3075)	Top-1 acc 8.203 (9.189)	Top-5 acc 25.000 (23.687)	lr 0.04265
Warmup Train [11][70/3239]	Time 0.596 (0.691)	Data 0.001 (0.153)	Loss 5.2724 (5.3017)	Top-1 acc 10.547 (9.259)	Top-5 acc 23.828 (23.845)	lr 0.04265
Warmup Train [11][80/3239]	Time 0.581 (0.667)	Data 0.001 (0.135)	Loss 5.2964 (5.2962)	Top-1 acc 7.812 (9.144)	Top-5 acc 22.656 (23.968)	lr 0.04264
Warmup Train [11][90/3239]	Time 0.404 (0.648)	Data 0.001 (0.120)	Loss 5.3270 (5.2956)	Top-1 acc 7.422 (9.182)	Top-5 acc 25.781 (23.983)	lr 0.04264
Warmup Train [11][100/3239]	Time 0.521 (0.637)	Data 0.001 (0.109)	Loss 5.3385 (5.2945)	Top-1 acc 7.422 (9.097)	Top-5 acc 22.656 (23.991)	lr 0.04263
Warmup Train [11][110/3239]	Time 0.430 (0.626)	Data 0.001 (0.100)	Loss 5.2679 (5.2904)	Top-1 acc 4.297 (9.129)	Top-5 acc 24.609 (24.050)	lr 0.04263
Warmup Train [11][120/3239]	Time 0.480 (0.613)	Data 0.001 (0.092)	Loss 5.5099 (5.2899)	Top-1 acc 6.641 (9.155)	Top-5 acc 24.219 (24.048)	lr 0.04263
Warmup Train [11][130/3239]	Time 0.551 (0.604)	Data 0.001 (0.085)	Loss 5.2452 (5.2889)	Top-1 acc 9.375 (9.199)	Top-5 acc 25.391 (24.117)	lr 0.04262
Warmup Train [11][140/3239]	Time 0.315 (0.594)	Data 0.001 (0.080)	Loss 5.2183 (5.2872)	Top-1 acc 10.938 (9.239)	Top-5 acc 26.562 (24.161)	lr 0.04262
Warmup Train [11][150/3239]	Time 0.590 (0.588)	Data 0.001 (0.075)	Loss 5.2126 (5.2899)	Top-1 acc 10.938 (9.248)	Top-5 acc 24.219 (24.108)	lr 0.04261
Warmup Train [11][160/3239]	Time 0.443 (0.580)	Data 0.001 (0.072)	Loss 5.2385 (5.2925)	Top-1 acc 9.766 (9.234)	Top-5 acc 25.781 (24.010)	lr 0.04261
Warmup Train [11][170/3239]	Time 0.417 (0.576)	Data 0.001 (0.068)	Loss 5.3681 (5.2925)	Top-1 acc 8.594 (9.220)	Top-5 acc 20.703 (24.020)	lr 0.04260
Warmup Train [11][180/3239]	Time 0.602 (0.573)	Data 0.001 (0.065)	Loss 5.2483 (5.2923)	Top-1 acc 10.547 (9.207)	Top-5 acc 22.656 (24.012)	lr 0.04260
Warmup Train [11][190/3239]	Time 0.617 (0.570)	Data 0.001 (0.062)	Loss 5.3176 (5.2932)	Top-1 acc 7.031 (9.205)	Top-5 acc 22.266 (24.000)	lr 0.04260
Warmup Train [11][200/3239]	Time 0.605 (0.567)	Data 0.001 (0.059)	Loss 5.2023 (5.2909)	Top-1 acc 10.156 (9.255)	Top-5 acc 23.047 (24.024)	lr 0.04259
Warmup Train [11][210/3239]	Time 0.536 (0.565)	Data 0.001 (0.057)	Loss 5.2745 (5.2906)	Top-1 acc 12.891 (9.281)	Top-5 acc 25.781 (24.098)	lr 0.04259
Warmup Train [11][220/3239]	Time 0.522 (0.562)	Data 0.002 (0.054)	Loss 5.4254 (5.2909)	Top-1 acc 10.156 (9.320)	Top-5 acc 21.484 (24.093)	lr 0.04258
Warmup Train [11][230/3239]	Time 0.374 (0.559)	Data 0.001 (0.052)	Loss 5.4016 (5.2919)	Top-1 acc 10.547 (9.319)	Top-5 acc 25.391 (24.094)	lr 0.04258
Warmup Train [11][240/3239]	Time 0.606 (0.558)	Data 0.001 (0.050)	Loss 5.3449 (5.2927)	Top-1 acc 7.422 (9.304)	Top-5 acc 22.656 (24.100)	lr 0.04257
Warmup Train [11][250/3239]	Time 0.598 (0.556)	Data 0.001 (0.048)	Loss 5.2022 (5.2930)	Top-1 acc 8.203 (9.300)	Top-5 acc 23.828 (24.091)	lr 0.04257
Warmup Train [11][260/3239]	Time 0.470 (0.554)	Data 0.001 (0.047)	Loss 5.1518 (5.2920)	Top-1 acc 11.328 (9.338)	Top-5 acc 25.391 (24.090)	lr 0.04257
Warmup Train [11][270/3239]	Time 0.584 (0.552)	Data 0.001 (0.045)	Loss 5.2914 (5.2913)	Top-1 acc 9.766 (9.379)	Top-5 acc 24.219 (24.096)	lr 0.04256
Warmup Train [11][280/3239]	Time 0.371 (0.551)	Data 0.001 (0.044)	Loss 5.3392 (5.2904)	Top-1 acc 7.422 (9.401)	Top-5 acc 24.219 (24.152)	lr 0.04256
Warmup Train [11][290/3239]	Time 0.466 (0.549)	Data 0.001 (0.043)	Loss 5.4010 (5.2906)	Top-1 acc 7.422 (9.402)	Top-5 acc 19.531 (24.146)	lr 0.04255
Warmup Train [11][300/3239]	Time 0.480 (0.548)	Data 0.001 (0.042)	Loss 5.2063 (5.2917)	Top-1 acc 9.766 (9.396)	Top-5 acc 21.875 (24.114)	lr 0.04255
Warmup Train [11][310/3239]	Time 0.346 (0.547)	Data 0.001 (0.041)	Loss 5.2565 (5.2922)	Top-1 acc 10.156 (9.371)	Top-5 acc 26.172 (24.088)	lr 0.04254
Warmup Train [11][320/3239]	Time 0.404 (0.545)	Data 0.001 (0.040)	Loss 5.2280 (5.2914)	Top-1 acc 9.766 (9.386)	Top-5 acc 23.828 (24.076)	lr 0.04254
Warmup Train [11][330/3239]	Time 0.584 (0.544)	Data 0.001 (0.039)	Loss 5.3121 (5.2918)	Top-1 acc 8.984 (9.422)	Top-5 acc 24.609 (24.059)	lr 0.04254
Warmup Train [11][340/3239]	Time 0.320 (0.543)	Data 0.001 (0.038)	Loss 5.3061 (5.2923)	Top-1 acc 10.156 (9.404)	Top-5 acc 23.438 (24.043)	lr 0.04253
Warmup Train [11][350/3239]	Time 0.518 (0.542)	Data 0.001 (0.037)	Loss 5.4240 (5.2928)	Top-1 acc 8.984 (9.399)	Top-5 acc 20.703 (24.011)	lr 0.04253
Warmup Train [11][360/3239]	Time 0.485 (0.541)	Data 0.001 (0.036)	Loss 5.2872 (5.2928)	Top-1 acc 10.156 (9.401)	Top-5 acc 21.875 (23.990)	lr 0.04252
Warmup Train [11][370/3239]	Time 0.491 (0.540)	Data 0.001 (0.036)	Loss 5.3343 (5.2929)	Top-1 acc 9.766 (9.388)	Top-5 acc 24.609 (23.979)	lr 0.04252
Warmup Train [11][380/3239]	Time 0.610 (0.540)	Data 0.001 (0.035)	Loss 5.2365 (5.2928)	Top-1 acc 8.203 (9.398)	Top-5 acc 25.000 (23.989)	lr 0.04251
Warmup Train [11][390/3239]	Time 0.557 (0.538)	Data 0.001 (0.034)	Loss 5.2571 (5.2931)	Top-1 acc 10.547 (9.375)	Top-5 acc 22.266 (23.978)	lr 0.04251
Warmup Train [11][400/3239]	Time 0.338 (0.537)	Data 0.001 (0.033)	Loss 5.2537 (5.2930)	Top-1 acc 8.984 (9.385)	Top-5 acc 23.047 (23.965)	lr 0.04251
Warmup Train [11][410/3239]	Time 0.499 (0.536)	Data 0.001 (0.033)	Loss 5.2394 (5.2929)	Top-1 acc 8.203 (9.386)	Top-5 acc 23.828 (23.935)	lr 0.04250
Warmup Train [11][420/3239]	Time 0.438 (0.535)	Data 0.001 (0.032)	Loss 5.5028 (5.2939)	Top-1 acc 5.859 (9.407)	Top-5 acc 19.141 (23.934)	lr 0.04250
Warmup Train [11][430/3239]	Time 0.524 (0.533)	Data 0.001 (0.032)	Loss 5.1829 (5.2930)	Top-1 acc 10.547 (9.418)	Top-5 acc 27.344 (23.942)	lr 0.04249
Warmup Train [11][440/3239]	Time 0.375 (0.532)	Data 0.001 (0.031)	Loss 5.2229 (5.2928)	Top-1 acc 10.547 (9.418)	Top-5 acc 23.828 (23.938)	lr 0.04249
Warmup Train [11][450/3239]	Time 0.414 (0.532)	Data 0.001 (0.031)	Loss 5.3170 (5.2924)	Top-1 acc 11.328 (9.414)	Top-5 acc 24.609 (23.945)	lr 0.04248
Warmup Train [11][460/3239]	Time 0.580 (0.532)	Data 0.001 (0.030)	Loss 5.4120 (5.2918)	Top-1 acc 8.594 (9.421)	Top-5 acc 19.141 (23.970)	lr 0.04248
Warmup Train [11][470/3239]	Time 0.516 (0.532)	Data 0.001 (0.030)	Loss 5.3435 (5.2914)	Top-1 acc 8.203 (9.447)	Top-5 acc 24.609 (23.991)	lr 0.04248
Warmup Train [11][480/3239]	Time 0.639 (0.531)	Data 0.001 (0.029)	Loss 5.4480 (5.2922)	Top-1 acc 7.031 (9.438)	Top-5 acc 18.359 (23.955)	lr 0.04247
Warmup Train [11][490/3239]	Time 0.510 (0.530)	Data 0.001 (0.029)	Loss 5.2558 (5.2922)	Top-1 acc 9.766 (9.455)	Top-5 acc 23.828 (23.972)	lr 0.04247
Warmup Train [11][500/3239]	Time 0.655 (0.530)	Data 0.001 (0.028)	Loss 5.1766 (5.2912)	Top-1 acc 13.672 (9.469)	Top-5 acc 27.344 (24.008)	lr 0.04246
Warmup Train [11][510/3239]	Time 0.554 (0.529)	Data 0.001 (0.028)	Loss 5.2393 (5.2915)	Top-1 acc 8.984 (9.468)	Top-5 acc 24.219 (24.010)	lr 0.04246
Warmup Train [11][520/3239]	Time 0.610 (0.528)	Data 0.001 (0.027)	Loss 5.2644 (5.2918)	Top-1 acc 10.938 (9.466)	Top-5 acc 24.609 (24.007)	lr 0.04245
Warmup Train [11][530/3239]	Time 0.493 (0.528)	Data 0.001 (0.027)	Loss 5.1984 (5.2917)	Top-1 acc 11.719 (9.457)	Top-5 acc 27.734 (24.004)	lr 0.04245
Warmup Train [11][540/3239]	Time 0.497 (0.528)	Data 0.001 (0.027)	Loss 5.4175 (5.2916)	Top-1 acc 7.812 (9.458)	Top-5 acc 20.312 (24.016)	lr 0.04244
Warmup Train [11][550/3239]	Time 0.593 (0.528)	Data 0.001 (0.026)	Loss 5.1335 (5.2914)	Top-1 acc 11.719 (9.444)	Top-5 acc 28.516 (24.010)	lr 0.04244
Warmup Train [11][560/3239]	Time 0.549 (0.528)	Data 0.020 (0.026)	Loss 5.1843 (5.2906)	Top-1 acc 10.547 (9.440)	Top-5 acc 26.562 (24.018)	lr 0.04244
Warmup Train [11][570/3239]	Time 0.540 (0.527)	Data 0.001 (0.025)	Loss 5.1768 (5.2896)	Top-1 acc 9.766 (9.458)	Top-5 acc 26.953 (24.054)	lr 0.04243
Warmup Train [11][580/3239]	Time 0.480 (0.528)	Data 0.001 (0.025)	Loss 5.2667 (5.2899)	Top-1 acc 12.109 (9.446)	Top-5 acc 26.953 (24.049)	lr 0.04243
Warmup Train [11][590/3239]	Time 0.445 (0.527)	Data 0.001 (0.025)	Loss 5.2368 (5.2906)	Top-1 acc 11.328 (9.440)	Top-5 acc 23.828 (24.034)	lr 0.04242
Warmup Train [11][600/3239]	Time 0.589 (0.527)	Data 0.001 (0.025)	Loss 5.1884 (5.2904)	Top-1 acc 8.984 (9.439)	Top-5 acc 24.609 (24.040)	lr 0.04242
Warmup Train [11][610/3239]	Time 0.583 (0.527)	Data 0.001 (0.024)	Loss 5.3108 (5.2903)	Top-1 acc 12.500 (9.440)	Top-5 acc 26.953 (24.045)	lr 0.04241
Warmup Train [11][620/3239]	Time 0.559 (0.527)	Data 0.001 (0.024)	Loss 5.4458 (5.2902)	Top-1 acc 8.594 (9.427)	Top-5 acc 23.828 (24.046)	lr 0.04241
Warmup Train [11][630/3239]	Time 0.583 (0.527)	Data 0.001 (0.024)	Loss 5.1738 (5.2909)	Top-1 acc 12.109 (9.423)	Top-5 acc 29.688 (24.039)	lr 0.04241
Warmup Train [11][640/3239]	Time 0.526 (0.527)	Data 0.001 (0.023)	Loss 5.1833 (5.2906)	Top-1 acc 14.453 (9.442)	Top-5 acc 32.031 (24.052)	lr 0.04240
Warmup Train [11][650/3239]	Time 0.308 (0.526)	Data 0.001 (0.023)	Loss 5.4211 (5.2905)	Top-1 acc 7.031 (9.436)	Top-5 acc 19.531 (24.044)	lr 0.04240
Warmup Train [11][660/3239]	Time 0.508 (0.526)	Data 0.001 (0.023)	Loss 5.2998 (5.2899)	Top-1 acc 8.984 (9.439)	Top-5 acc 22.266 (24.061)	lr 0.04239
Warmup Train [11][670/3239]	Time 0.367 (0.525)	Data 0.001 (0.022)	Loss 5.2485 (5.2907)	Top-1 acc 9.766 (9.412)	Top-5 acc 25.000 (24.044)	lr 0.04239
Warmup Train [11][680/3239]	Time 0.656 (0.524)	Data 0.001 (0.022)	Loss 5.1674 (5.2905)	Top-1 acc 9.375 (9.425)	Top-5 acc 25.391 (24.054)	lr 0.04238
Warmup Train [11][690/3239]	Time 0.644 (0.524)	Data 0.001 (0.022)	Loss 5.2100 (5.2901)	Top-1 acc 10.156 (9.437)	Top-5 acc 25.781 (24.074)	lr 0.04238
Warmup Train [11][700/3239]	Time 0.562 (0.523)	Data 0.001 (0.022)	Loss 5.2713 (5.2901)	Top-1 acc 10.156 (9.435)	Top-5 acc 25.000 (24.074)	lr 0.04238
Warmup Train [11][710/3239]	Time 0.562 (0.523)	Data 0.001 (0.021)	Loss 5.3371 (5.2898)	Top-1 acc 8.594 (9.432)	Top-5 acc 23.047 (24.081)	lr 0.04237
Warmup Train [11][720/3239]	Time 0.358 (0.523)	Data 0.001 (0.021)	Loss 5.2655 (5.2900)	Top-1 acc 11.328 (9.424)	Top-5 acc 26.953 (24.076)	lr 0.04237
Warmup Train [11][730/3239]	Time 0.580 (0.523)	Data 0.001 (0.021)	Loss 5.2177 (5.2896)	Top-1 acc 12.109 (9.435)	Top-5 acc 25.781 (24.086)	lr 0.04236
Warmup Train [11][740/3239]	Time 0.413 (0.523)	Data 0.001 (0.021)	Loss 5.3078 (5.2899)	Top-1 acc 9.375 (9.429)	Top-5 acc 22.266 (24.082)	lr 0.04236
Warmup Train [11][750/3239]	Time 0.429 (0.523)	Data 0.001 (0.021)	Loss 5.2236 (5.2900)	Top-1 acc 10.156 (9.426)	Top-5 acc 25.000 (24.078)	lr 0.04235
Warmup Train [11][760/3239]	Time 0.342 (0.523)	Data 0.001 (0.021)	Loss 5.4330 (5.2897)	Top-1 acc 9.375 (9.431)	Top-5 acc 20.312 (24.085)	lr 0.04235
Warmup Train [11][770/3239]	Time 0.439 (0.522)	Data 0.001 (0.021)	Loss 5.2865 (5.2891)	Top-1 acc 9.766 (9.443)	Top-5 acc 22.266 (24.105)	lr 0.04234
Warmup Train [11][780/3239]	Time 0.432 (0.522)	Data 0.001 (0.021)	Loss 5.2634 (5.2890)	Top-1 acc 10.547 (9.437)	Top-5 acc 26.953 (24.109)	lr 0.04234
Warmup Train [11][790/3239]	Time 0.494 (0.522)	Data 0.001 (0.021)	Loss 5.2383 (5.2884)	Top-1 acc 10.938 (9.449)	Top-5 acc 24.219 (24.123)	lr 0.04234
Warmup Train [11][800/3239]	Time 0.626 (0.522)	Data 0.002 (0.020)	Loss 5.2279 (5.2883)	Top-1 acc 12.109 (9.453)	Top-5 acc 26.172 (24.128)	lr 0.04233
Warmup Train [11][810/3239]	Time 0.394 (0.522)	Data 0.001 (0.020)	Loss 5.4084 (5.2886)	Top-1 acc 7.422 (9.445)	Top-5 acc 19.922 (24.116)	lr 0.04233
Warmup Train [11][820/3239]	Time 0.568 (0.522)	Data 0.001 (0.020)	Loss 5.2499 (5.2888)	Top-1 acc 11.719 (9.447)	Top-5 acc 26.562 (24.110)	lr 0.04232
Warmup Train [11][830/3239]	Time 0.545 (0.522)	Data 0.001 (0.020)	Loss 5.2470 (5.2887)	Top-1 acc 8.984 (9.438)	Top-5 acc 24.219 (24.099)	lr 0.04232
Warmup Train [11][840/3239]	Time 0.496 (0.522)	Data 0.001 (0.020)	Loss 5.1728 (5.2884)	Top-1 acc 9.375 (9.442)	Top-5 acc 26.562 (24.114)	lr 0.04231
Warmup Train [11][850/3239]	Time 0.497 (0.522)	Data 0.001 (0.020)	Loss 5.2071 (5.2878)	Top-1 acc 11.719 (9.462)	Top-5 acc 26.562 (24.134)	lr 0.04231
Warmup Train [11][860/3239]	Time 0.550 (0.522)	Data 0.001 (0.019)	Loss 5.3461 (5.2874)	Top-1 acc 11.328 (9.470)	Top-5 acc 25.391 (24.140)	lr 0.04231
Warmup Train [11][870/3239]	Time 0.518 (0.522)	Data 0.001 (0.019)	Loss 5.2953 (5.2871)	Top-1 acc 8.984 (9.484)	Top-5 acc 24.219 (24.140)	lr 0.04230
Warmup Train [11][880/3239]	Time 0.468 (0.521)	Data 0.001 (0.019)	Loss 5.1805 (5.2865)	Top-1 acc 9.766 (9.496)	Top-5 acc 25.391 (24.164)	lr 0.04230
Warmup Train [11][890/3239]	Time 0.595 (0.521)	Data 0.001 (0.019)	Loss 5.0636 (5.2863)	Top-1 acc 10.938 (9.497)	Top-5 acc 27.344 (24.163)	lr 0.04229
Warmup Train [11][900/3239]	Time 0.523 (0.522)	Data 0.001 (0.019)	Loss 5.3758 (5.2864)	Top-1 acc 7.422 (9.502)	Top-5 acc 19.922 (24.169)	lr 0.04229
Warmup Train [11][910/3239]	Time 0.572 (0.522)	Data 0.001 (0.018)	Loss 5.2165 (5.2865)	Top-1 acc 12.109 (9.504)	Top-5 acc 25.781 (24.166)	lr 0.04228
Warmup Train [11][920/3239]	Time 0.648 (0.521)	Data 0.001 (0.018)	Loss 5.3601 (5.2862)	Top-1 acc 8.203 (9.507)	Top-5 acc 23.828 (24.165)	lr 0.04228
Warmup Train [11][930/3239]	Time 0.574 (0.521)	Data 0.001 (0.018)	Loss 5.3553 (5.2862)	Top-1 acc 9.766 (9.515)	Top-5 acc 22.266 (24.169)	lr 0.04227
Warmup Train [11][940/3239]	Time 0.523 (0.521)	Data 0.001 (0.018)	Loss 5.1923 (5.2861)	Top-1 acc 11.719 (9.513)	Top-5 acc 26.562 (24.165)	lr 0.04227
Warmup Train [11][950/3239]	Time 0.517 (0.521)	Data 0.001 (0.018)	Loss 5.3603 (5.2860)	Top-1 acc 9.766 (9.514)	Top-5 acc 20.312 (24.158)	lr 0.04227
Warmup Train [11][960/3239]	Time 0.540 (0.520)	Data 0.001 (0.018)	Loss 5.3079 (5.2859)	Top-1 acc 8.594 (9.522)	Top-5 acc 24.609 (24.174)	lr 0.04226
Warmup Train [11][970/3239]	Time 0.306 (0.520)	Data 0.001 (0.018)	Loss 5.1904 (5.2857)	Top-1 acc 11.328 (9.519)	Top-5 acc 26.953 (24.187)	lr 0.04226
Warmup Train [11][980/3239]	Time 0.540 (0.520)	Data 0.001 (0.018)	Loss 5.1970 (5.2856)	Top-1 acc 11.328 (9.517)	Top-5 acc 30.078 (24.193)	lr 0.04225
Warmup Train [11][990/3239]	Time 0.560 (0.520)	Data 0.001 (0.017)	Loss 5.2582 (5.2858)	Top-1 acc 8.594 (9.516)	Top-5 acc 25.000 (24.185)	lr 0.04225
Warmup Train [11][1000/3239]	Time 0.568 (0.520)	Data 0.001 (0.017)	Loss 5.3266 (5.2859)	Top-1 acc 10.938 (9.508)	Top-5 acc 24.609 (24.180)	lr 0.04224
Warmup Train [11][1010/3239]	Time 0.381 (0.520)	Data 0.001 (0.017)	Loss 5.3066 (5.2861)	Top-1 acc 7.812 (9.503)	Top-5 acc 21.094 (24.190)	lr 0.04224
Warmup Train [11][1020/3239]	Time 0.534 (0.520)	Data 0.001 (0.017)	Loss 5.3698 (5.2861)	Top-1 acc 5.469 (9.499)	Top-5 acc 19.531 (24.190)	lr 0.04224
Warmup Train [11][1030/3239]	Time 0.524 (0.520)	Data 0.001 (0.017)	Loss 5.2182 (5.2862)	Top-1 acc 10.938 (9.494)	Top-5 acc 25.000 (24.195)	lr 0.04223
Warmup Train [11][1040/3239]	Time 0.549 (0.519)	Data 0.001 (0.017)	Loss 5.2447 (5.2856)	Top-1 acc 6.641 (9.495)	Top-5 acc 22.656 (24.201)	lr 0.04223
Warmup Train [11][1050/3239]	Time 0.530 (0.519)	Data 0.001 (0.017)	Loss 5.2336 (5.2856)	Top-1 acc 9.766 (9.492)	Top-5 acc 25.391 (24.206)	lr 0.04222
Warmup Train [11][1060/3239]	Time 0.486 (0.519)	Data 0.001 (0.017)	Loss 5.3254 (5.2851)	Top-1 acc 8.984 (9.500)	Top-5 acc 26.172 (24.224)	lr 0.04222
Warmup Train [11][1070/3239]	Time 0.436 (0.519)	Data 0.001 (0.016)	Loss 5.2233 (5.2847)	Top-1 acc 13.281 (9.506)	Top-5 acc 28.125 (24.236)	lr 0.04221
Warmup Train [11][1080/3239]	Time 0.452 (0.519)	Data 0.001 (0.016)	Loss 5.2003 (5.2844)	Top-1 acc 10.938 (9.510)	Top-5 acc 28.125 (24.247)	lr 0.04221
Warmup Train [11][1090/3239]	Time 0.344 (0.519)	Data 0.001 (0.016)	Loss 5.3780 (5.2845)	Top-1 acc 8.203 (9.506)	Top-5 acc 21.875 (24.246)	lr 0.04220
Warmup Train [11][1100/3239]	Time 0.308 (0.519)	Data 0.001 (0.016)	Loss 5.3733 (5.2845)	Top-1 acc 6.250 (9.499)	Top-5 acc 21.875 (24.243)	lr 0.04220
Warmup Train [11][1110/3239]	Time 0.398 (0.519)	Data 0.001 (0.016)	Loss 5.3727 (5.2850)	Top-1 acc 7.422 (9.488)	Top-5 acc 21.484 (24.227)	lr 0.04220
Warmup Train [11][1120/3239]	Time 0.588 (0.519)	Data 0.001 (0.016)	Loss 5.2113 (5.2846)	Top-1 acc 9.766 (9.489)	Top-5 acc 24.609 (24.231)	lr 0.04219
Warmup Train [11][1130/3239]	Time 0.540 (0.519)	Data 0.001 (0.016)	Loss 5.3186 (5.2848)	Top-1 acc 7.422 (9.495)	Top-5 acc 23.047 (24.230)	lr 0.04219
Warmup Train [11][1140/3239]	Time 0.540 (0.519)	Data 0.001 (0.016)	Loss 5.3627 (5.2852)	Top-1 acc 8.984 (9.497)	Top-5 acc 22.656 (24.228)	lr 0.04218
Warmup Train [11][1150/3239]	Time 0.585 (0.519)	Data 0.001 (0.016)	Loss 5.2160 (5.2852)	Top-1 acc 8.984 (9.492)	Top-5 acc 23.438 (24.220)	lr 0.04218
Warmup Train [11][1160/3239]	Time 0.605 (0.519)	Data 0.001 (0.016)	Loss 5.1788 (5.2853)	Top-1 acc 8.594 (9.494)	Top-5 acc 24.609 (24.230)	lr 0.04217
Warmup Train [11][1170/3239]	Time 0.387 (0.519)	Data 0.001 (0.016)	Loss 5.2200 (5.2853)	Top-1 acc 9.766 (9.488)	Top-5 acc 23.438 (24.230)	lr 0.04217
Warmup Train [11][1180/3239]	Time 0.472 (0.519)	Data 0.001 (0.016)	Loss 5.2964 (5.2850)	Top-1 acc 10.156 (9.489)	Top-5 acc 25.391 (24.251)	lr 0.04216
Warmup Train [11][1190/3239]	Time 0.386 (0.519)	Data 0.001 (0.016)	Loss 5.2198 (5.2847)	Top-1 acc 11.328 (9.494)	Top-5 acc 30.469 (24.267)	lr 0.04216
Warmup Train [11][1200/3239]	Time 0.397 (0.518)	Data 0.001 (0.016)	Loss 5.3758 (5.2846)	Top-1 acc 8.984 (9.497)	Top-5 acc 22.656 (24.270)	lr 0.04216
Warmup Train [11][1210/3239]	Time 0.473 (0.518)	Data 0.001 (0.016)	Loss 5.2608 (5.2845)	Top-1 acc 7.812 (9.500)	Top-5 acc 22.266 (24.278)	lr 0.04215
Warmup Train [11][1220/3239]	Time 0.306 (0.518)	Data 0.001 (0.016)	Loss 5.0634 (5.2845)	Top-1 acc 13.672 (9.499)	Top-5 acc 29.297 (24.281)	lr 0.04215
Warmup Train [11][1230/3239]	Time 0.416 (0.517)	Data 0.001 (0.016)	Loss 5.3594 (5.2844)	Top-1 acc 10.547 (9.508)	Top-5 acc 24.609 (24.286)	lr 0.04214
Warmup Train [11][1240/3239]	Time 0.647 (0.517)	Data 0.001 (0.016)	Loss 5.1629 (5.2841)	Top-1 acc 12.500 (9.506)	Top-5 acc 29.688 (24.301)	lr 0.04214
Warmup Train [11][1250/3239]	Time 0.429 (0.517)	Data 0.001 (0.016)	Loss 5.4281 (5.2841)	Top-1 acc 7.031 (9.506)	Top-5 acc 21.875 (24.302)	lr 0.04213
Warmup Train [11][1260/3239]	Time 0.558 (0.517)	Data 0.001 (0.016)	Loss 5.2857 (5.2842)	Top-1 acc 10.156 (9.505)	Top-5 acc 26.953 (24.303)	lr 0.04213
Warmup Train [11][1270/3239]	Time 0.522 (0.517)	Data 0.001 (0.015)	Loss 5.2451 (5.2839)	Top-1 acc 10.156 (9.508)	Top-5 acc 25.391 (24.307)	lr 0.04213
Warmup Train [11][1280/3239]	Time 0.595 (0.517)	Data 0.001 (0.015)	Loss 5.3576 (5.2838)	Top-1 acc 7.031 (9.505)	Top-5 acc 18.750 (24.310)	lr 0.04212
Warmup Train [11][1290/3239]	Time 0.548 (0.517)	Data 0.001 (0.015)	Loss 5.2889 (5.2837)	Top-1 acc 10.547 (9.504)	Top-5 acc 24.219 (24.313)	lr 0.04212
Warmup Train [11][1300/3239]	Time 0.565 (0.517)	Data 0.001 (0.015)	Loss 5.1065 (5.2836)	Top-1 acc 13.672 (9.510)	Top-5 acc 27.734 (24.323)	lr 0.04211
Warmup Train [11][1310/3239]	Time 0.426 (0.517)	Data 0.001 (0.015)	Loss 5.2126 (5.2836)	Top-1 acc 7.422 (9.515)	Top-5 acc 22.266 (24.314)	lr 0.04211
Warmup Train [11][1320/3239]	Time 0.399 (0.517)	Data 0.001 (0.015)	Loss 5.3288 (5.2829)	Top-1 acc 9.375 (9.524)	Top-5 acc 20.703 (24.326)	lr 0.04210
Warmup Train [11][1330/3239]	Time 0.511 (0.517)	Data 0.001 (0.015)	Loss 5.2407 (5.2827)	Top-1 acc 10.156 (9.530)	Top-5 acc 24.219 (24.330)	lr 0.04210
Warmup Train [11][1340/3239]	Time 0.542 (0.517)	Data 0.001 (0.015)	Loss 5.1464 (5.2824)	Top-1 acc 7.422 (9.533)	Top-5 acc 23.438 (24.335)	lr 0.04209
Warmup Train [11][1350/3239]	Time 0.505 (0.517)	Data 0.001 (0.015)	Loss 5.4419 (5.2824)	Top-1 acc 10.547 (9.536)	Top-5 acc 21.875 (24.344)	lr 0.04209
Warmup Train [11][1360/3239]	Time 0.586 (0.517)	Data 0.001 (0.015)	Loss 5.4111 (5.2823)	Top-1 acc 7.812 (9.540)	Top-5 acc 19.531 (24.343)	lr 0.04209
Warmup Train [11][1370/3239]	Time 0.595 (0.517)	Data 0.001 (0.015)	Loss 5.4007 (5.2828)	Top-1 acc 9.766 (9.539)	Top-5 acc 21.094 (24.336)	lr 0.04208
Warmup Train [11][1380/3239]	Time 0.530 (0.517)	Data 0.001 (0.015)	Loss 5.3726 (5.2828)	Top-1 acc 9.766 (9.539)	Top-5 acc 21.484 (24.336)	lr 0.04208
Warmup Train [11][1390/3239]	Time 0.368 (0.517)	Data 0.001 (0.015)	Loss 5.4865 (5.2833)	Top-1 acc 5.859 (9.530)	Top-5 acc 17.188 (24.321)	lr 0.04207
Warmup Train [11][1400/3239]	Time 0.575 (0.517)	Data 0.001 (0.015)	Loss 5.1762 (5.2832)	Top-1 acc 11.328 (9.530)	Top-5 acc 31.250 (24.327)	lr 0.04207
Warmup Train [11][1410/3239]	Time 0.498 (0.517)	Data 0.001 (0.015)	Loss 5.2633 (5.2832)	Top-1 acc 12.500 (9.537)	Top-5 acc 24.219 (24.328)	lr 0.04206
Warmup Train [11][1420/3239]	Time 0.345 (0.516)	Data 0.001 (0.014)	Loss 5.3032 (5.2833)	Top-1 acc 11.719 (9.543)	Top-5 acc 23.438 (24.325)	lr 0.04206
Warmup Train [11][1430/3239]	Time 0.571 (0.517)	Data 0.001 (0.014)	Loss 5.2229 (5.2830)	Top-1 acc 10.547 (9.544)	Top-5 acc 25.781 (24.328)	lr 0.04205
Warmup Train [11][1440/3239]	Time 0.520 (0.517)	Data 0.001 (0.014)	Loss 5.2297 (5.2831)	Top-1 acc 13.281 (9.543)	Top-5 acc 26.953 (24.326)	lr 0.04205
Warmup Train [11][1450/3239]	Time 0.301 (0.517)	Data 0.001 (0.014)	Loss 5.1763 (5.2828)	Top-1 acc 11.719 (9.554)	Top-5 acc 30.859 (24.333)	lr 0.04205
Warmup Train [11][1460/3239]	Time 0.523 (0.517)	Data 0.001 (0.014)	Loss 5.2488 (5.2825)	Top-1 acc 9.766 (9.555)	Top-5 acc 23.438 (24.341)	lr 0.04204
Warmup Train [11][1470/3239]	Time 0.326 (0.516)	Data 0.001 (0.014)	Loss 5.1554 (5.2824)	Top-1 acc 12.109 (9.554)	Top-5 acc 27.344 (24.342)	lr 0.04204
Warmup Train [11][1480/3239]	Time 0.561 (0.516)	Data 0.001 (0.014)	Loss 5.0623 (5.2821)	Top-1 acc 10.938 (9.556)	Top-5 acc 31.250 (24.350)	lr 0.04203
Warmup Train [11][1490/3239]	Time 0.446 (0.516)	Data 0.001 (0.014)	Loss 5.3209 (5.2819)	Top-1 acc 9.375 (9.560)	Top-5 acc 23.828 (24.354)	lr 0.04203
Warmup Train [11][1500/3239]	Time 0.495 (0.516)	Data 0.001 (0.014)	Loss 5.1338 (5.2814)	Top-1 acc 11.719 (9.567)	Top-5 acc 28.125 (24.366)	lr 0.04202
Warmup Train [11][1510/3239]	Time 0.664 (0.516)	Data 0.001 (0.014)	Loss 5.2422 (5.2815)	Top-1 acc 8.203 (9.565)	Top-5 acc 23.438 (24.361)	lr 0.04202
Warmup Train [11][1520/3239]	Time 0.440 (0.516)	Data 0.001 (0.014)	Loss 5.3588 (5.2814)	Top-1 acc 7.812 (9.565)	Top-5 acc 22.266 (24.367)	lr 0.04201
Warmup Train [11][1530/3239]	Time 0.561 (0.516)	Data 0.001 (0.014)	Loss 5.3219 (5.2811)	Top-1 acc 9.375 (9.573)	Top-5 acc 24.609 (24.372)	lr 0.04201
Warmup Train [11][1540/3239]	Time 0.509 (0.516)	Data 0.001 (0.014)	Loss 5.3594 (5.2810)	Top-1 acc 8.203 (9.573)	Top-5 acc 24.219 (24.376)	lr 0.04201
Warmup Train [11][1550/3239]	Time 0.568 (0.516)	Data 0.001 (0.014)	Loss 5.2998 (5.2809)	Top-1 acc 12.109 (9.580)	Top-5 acc 21.875 (24.377)	lr 0.04200
Warmup Train [11][1560/3239]	Time 0.387 (0.516)	Data 0.001 (0.014)	Loss 5.2449 (5.2809)	Top-1 acc 13.281 (9.584)	Top-5 acc 24.609 (24.375)	lr 0.04200
Warmup Train [11][1570/3239]	Time 0.347 (0.516)	Data 0.001 (0.014)	Loss 5.4520 (5.2809)	Top-1 acc 8.594 (9.587)	Top-5 acc 21.484 (24.373)	lr 0.04199
Warmup Train [11][1580/3239]	Time 0.626 (0.516)	Data 0.001 (0.014)	Loss 5.2238 (5.2811)	Top-1 acc 12.109 (9.590)	Top-5 acc 26.172 (24.375)	lr 0.04199
Warmup Train [11][1590/3239]	Time 0.553 (0.515)	Data 0.001 (0.014)	Loss 5.2000 (5.2807)	Top-1 acc 9.766 (9.601)	Top-5 acc 26.172 (24.387)	lr 0.04198
Warmup Train [11][1600/3239]	Time 0.424 (0.515)	Data 0.001 (0.014)	Loss 5.2030 (5.2804)	Top-1 acc 10.938 (9.606)	Top-5 acc 25.781 (24.389)	lr 0.04198
Warmup Train [11][1610/3239]	Time 0.523 (0.516)	Data 0.001 (0.014)	Loss 5.1078 (5.2802)	Top-1 acc 14.062 (9.607)	Top-5 acc 30.078 (24.392)	lr 0.04197
Warmup Train [11][1620/3239]	Time 0.456 (0.516)	Data 0.001 (0.014)	Loss 5.2018 (5.2801)	Top-1 acc 10.156 (9.608)	Top-5 acc 26.953 (24.390)	lr 0.04197
Warmup Train [11][1630/3239]	Time 0.523 (0.516)	Data 0.001 (0.014)	Loss 5.2311 (5.2799)	Top-1 acc 12.109 (9.608)	Top-5 acc 26.172 (24.392)	lr 0.04197
Warmup Train [11][1640/3239]	Time 0.354 (0.516)	Data 0.001 (0.014)	Loss 5.3559 (5.2800)	Top-1 acc 8.594 (9.605)	Top-5 acc 21.484 (24.392)	lr 0.04196
Warmup Train [11][1650/3239]	Time 0.542 (0.516)	Data 0.001 (0.014)	Loss 5.1428 (5.2794)	Top-1 acc 12.891 (9.617)	Top-5 acc 29.688 (24.409)	lr 0.04196
Warmup Train [11][1660/3239]	Time 0.539 (0.516)	Data 0.001 (0.014)	Loss 5.3855 (5.2792)	Top-1 acc 7.422 (9.621)	Top-5 acc 25.000 (24.416)	lr 0.04195
Warmup Train [11][1670/3239]	Time 0.550 (0.516)	Data 0.001 (0.013)	Loss 5.1612 (5.2791)	Top-1 acc 10.938 (9.627)	Top-5 acc 29.297 (24.420)	lr 0.04195
Warmup Train [11][1680/3239]	Time 0.359 (0.516)	Data 0.001 (0.013)	Loss 5.2310 (5.2785)	Top-1 acc 10.938 (9.632)	Top-5 acc 29.297 (24.439)	lr 0.04194
Warmup Train [11][1690/3239]	Time 0.604 (0.516)	Data 0.001 (0.013)	Loss 5.1836 (5.2784)	Top-1 acc 11.328 (9.630)	Top-5 acc 27.344 (24.440)	lr 0.04194
Warmup Train [11][1700/3239]	Time 0.569 (0.516)	Data 0.001 (0.013)	Loss 5.3254 (5.2784)	Top-1 acc 8.984 (9.636)	Top-5 acc 22.266 (24.440)	lr 0.04193
Warmup Train [11][1710/3239]	Time 0.430 (0.516)	Data 0.001 (0.013)	Loss 5.2199 (5.2783)	Top-1 acc 10.938 (9.634)	Top-5 acc 28.516 (24.447)	lr 0.04193
Warmup Train [11][1720/3239]	Time 0.459 (0.515)	Data 0.001 (0.013)	Loss 5.3768 (5.2781)	Top-1 acc 7.812 (9.639)	Top-5 acc 23.047 (24.448)	lr 0.04193
Warmup Train [11][1730/3239]	Time 0.490 (0.515)	Data 0.001 (0.013)	Loss 5.2834 (5.2778)	Top-1 acc 7.812 (9.637)	Top-5 acc 25.781 (24.454)	lr 0.04192
Warmup Train [11][1740/3239]	Time 0.552 (0.515)	Data 0.001 (0.013)	Loss 5.2689 (5.2777)	Top-1 acc 5.859 (9.639)	Top-5 acc 23.828 (24.461)	lr 0.04192
Warmup Train [11][1750/3239]	Time 0.471 (0.515)	Data 0.001 (0.013)	Loss 5.2329 (5.2773)	Top-1 acc 9.375 (9.642)	Top-5 acc 23.828 (24.464)	lr 0.04191
Warmup Train [11][1760/3239]	Time 0.357 (0.514)	Data 0.001 (0.013)	Loss 5.2715 (5.2773)	Top-1 acc 7.031 (9.643)	Top-5 acc 20.312 (24.463)	lr 0.04191
Warmup Train [11][1770/3239]	Time 0.590 (0.514)	Data 0.001 (0.013)	Loss 5.2666 (5.2771)	Top-1 acc 9.766 (9.647)	Top-5 acc 20.312 (24.456)	lr 0.04190
Warmup Train [11][1780/3239]	Time 0.602 (0.514)	Data 0.001 (0.013)	Loss 5.4630 (5.2771)	Top-1 acc 7.031 (9.647)	Top-5 acc 20.703 (24.454)	lr 0.04190
Warmup Train [11][1790/3239]	Time 0.367 (0.514)	Data 0.001 (0.013)	Loss 5.2413 (5.2768)	Top-1 acc 6.641 (9.650)	Top-5 acc 23.438 (24.466)	lr 0.04189
Warmup Train [11][1800/3239]	Time 0.397 (0.514)	Data 0.001 (0.013)	Loss 5.3196 (5.2766)	Top-1 acc 7.812 (9.651)	Top-5 acc 25.391 (24.477)	lr 0.04189
Warmup Train [11][1810/3239]	Time 0.711 (0.514)	Data 0.001 (0.013)	Loss 5.2247 (5.2764)	Top-1 acc 10.547 (9.653)	Top-5 acc 26.953 (24.484)	lr 0.04189
Warmup Train [11][1820/3239]	Time 0.475 (0.514)	Data 0.001 (0.013)	Loss 5.2155 (5.2759)	Top-1 acc 11.719 (9.661)	Top-5 acc 25.000 (24.499)	lr 0.04188
Warmup Train [11][1830/3239]	Time 0.486 (0.514)	Data 0.001 (0.013)	Loss 5.1900 (5.2755)	Top-1 acc 13.281 (9.669)	Top-5 acc 28.906 (24.502)	lr 0.04188
Warmup Train [11][1840/3239]	Time 0.353 (0.514)	Data 0.001 (0.013)	Loss 5.2041 (5.2754)	Top-1 acc 10.156 (9.668)	Top-5 acc 22.266 (24.509)	lr 0.04187
Warmup Train [11][1850/3239]	Time 0.568 (0.514)	Data 0.001 (0.013)	Loss 5.2799 (5.2754)	Top-1 acc 7.422 (9.670)	Top-5 acc 24.219 (24.510)	lr 0.04187
Warmup Train [11][1860/3239]	Time 0.566 (0.514)	Data 0.001 (0.013)	Loss 5.2872 (5.2753)	Top-1 acc 9.375 (9.676)	Top-5 acc 23.047 (24.516)	lr 0.04186
Warmup Train [11][1870/3239]	Time 0.529 (0.514)	Data 0.001 (0.013)	Loss 5.4864 (5.2752)	Top-1 acc 11.719 (9.677)	Top-5 acc 21.875 (24.516)	lr 0.04186
Warmup Train [11][1880/3239]	Time 0.544 (0.514)	Data 0.001 (0.013)	Loss 5.1982 (5.2748)	Top-1 acc 11.328 (9.687)	Top-5 acc 28.516 (24.527)	lr 0.04185
Warmup Train [11][1890/3239]	Time 0.483 (0.514)	Data 0.001 (0.013)	Loss 5.1148 (5.2747)	Top-1 acc 11.328 (9.689)	Top-5 acc 27.734 (24.532)	lr 0.04185
Warmup Train [11][1900/3239]	Time 0.532 (0.514)	Data 0.001 (0.012)	Loss 5.1714 (5.2747)	Top-1 acc 10.938 (9.692)	Top-5 acc 25.000 (24.533)	lr 0.04185
Warmup Train [11][1910/3239]	Time 0.367 (0.513)	Data 0.001 (0.012)	Loss 5.2775 (5.2747)	Top-1 acc 10.547 (9.694)	Top-5 acc 26.953 (24.529)	lr 0.04184
Warmup Train [11][1920/3239]	Time 0.477 (0.514)	Data 0.001 (0.012)	Loss 5.5026 (5.2748)	Top-1 acc 7.422 (9.695)	Top-5 acc 21.094 (24.526)	lr 0.04184
Warmup Train [11][1930/3239]	Time 0.683 (0.514)	Data 0.001 (0.012)	Loss 5.3445 (5.2751)	Top-1 acc 8.203 (9.698)	Top-5 acc 20.703 (24.523)	lr 0.04183
Warmup Train [11][1940/3239]	Time 0.625 (0.514)	Data 0.001 (0.012)	Loss 5.2870 (5.2750)	Top-1 acc 7.812 (9.697)	Top-5 acc 24.219 (24.529)	lr 0.04183
Warmup Train [11][1950/3239]	Time 0.381 (0.514)	Data 0.001 (0.012)	Loss 5.2571 (5.2748)	Top-1 acc 12.109 (9.701)	Top-5 acc 25.391 (24.538)	lr 0.04182
Warmup Train [11][1960/3239]	Time 0.427 (0.514)	Data 0.001 (0.012)	Loss 5.1797 (5.2748)	Top-1 acc 10.938 (9.702)	Top-5 acc 23.438 (24.538)	lr 0.04182
Warmup Train [11][1970/3239]	Time 0.425 (0.514)	Data 0.001 (0.012)	Loss 5.1017 (5.2746)	Top-1 acc 9.766 (9.704)	Top-5 acc 26.562 (24.542)	lr 0.04181
Warmup Train [11][1980/3239]	Time 0.605 (0.514)	Data 0.001 (0.012)	Loss 5.1925 (5.2743)	Top-1 acc 10.547 (9.712)	Top-5 acc 26.562 (24.555)	lr 0.04181
Warmup Train [11][1990/3239]	Time 0.536 (0.513)	Data 0.001 (0.012)	Loss 5.3447 (5.2742)	Top-1 acc 9.375 (9.713)	Top-5 acc 22.266 (24.551)	lr 0.04180
Warmup Train [11][2000/3239]	Time 0.509 (0.513)	Data 0.001 (0.012)	Loss 5.2344 (5.2742)	Top-1 acc 8.594 (9.712)	Top-5 acc 27.344 (24.555)	lr 0.04180
Warmup Train [11][2010/3239]	Time 0.516 (0.513)	Data 0.001 (0.012)	Loss 5.3339 (5.2740)	Top-1 acc 10.156 (9.710)	Top-5 acc 21.875 (24.555)	lr 0.04180
Warmup Train [11][2020/3239]	Time 0.619 (0.513)	Data 0.001 (0.012)	Loss 5.4394 (5.2740)	Top-1 acc 7.812 (9.710)	Top-5 acc 25.391 (24.554)	lr 0.04179
Warmup Train [11][2030/3239]	Time 0.430 (0.513)	Data 0.001 (0.012)	Loss 5.1300 (5.2738)	Top-1 acc 10.938 (9.712)	Top-5 acc 27.344 (24.561)	lr 0.04179
Warmup Train [11][2040/3239]	Time 0.466 (0.513)	Data 0.001 (0.012)	Loss 5.0559 (5.2736)	Top-1 acc 12.891 (9.715)	Top-5 acc 32.422 (24.568)	lr 0.04178
Warmup Train [11][2050/3239]	Time 0.541 (0.513)	Data 0.001 (0.012)	Loss 5.3325 (5.2735)	Top-1 acc 6.250 (9.716)	Top-5 acc 20.312 (24.572)	lr 0.04178
Warmup Train [11][2060/3239]	Time 0.299 (0.513)	Data 0.001 (0.012)	Loss 5.1922 (5.2735)	Top-1 acc 10.156 (9.717)	Top-5 acc 26.953 (24.573)	lr 0.04177
Warmup Train [11][2070/3239]	Time 0.477 (0.513)	Data 0.001 (0.012)	Loss 5.0537 (5.2733)	Top-1 acc 12.109 (9.717)	Top-5 acc 30.078 (24.581)	lr 0.04177
Warmup Train [11][2080/3239]	Time 0.428 (0.513)	Data 0.001 (0.012)	Loss 5.2140 (5.2730)	Top-1 acc 12.109 (9.722)	Top-5 acc 26.953 (24.587)	lr 0.04176
Warmup Train [11][2090/3239]	Time 0.528 (0.513)	Data 0.001 (0.012)	Loss 5.2445 (5.2730)	Top-1 acc 10.547 (9.729)	Top-5 acc 27.734 (24.595)	lr 0.04176
Warmup Train [11][2100/3239]	Time 0.520 (0.513)	Data 0.001 (0.012)	Loss 5.2045 (5.2726)	Top-1 acc 10.547 (9.735)	Top-5 acc 26.953 (24.603)	lr 0.04176
Warmup Train [11][2110/3239]	Time 0.438 (0.513)	Data 0.001 (0.012)	Loss 5.1720 (5.2724)	Top-1 acc 13.281 (9.738)	Top-5 acc 28.906 (24.610)	lr 0.04175
Warmup Train [11][2120/3239]	Time 0.443 (0.513)	Data 0.001 (0.012)	Loss 5.1716 (5.2722)	Top-1 acc 12.500 (9.739)	Top-5 acc 25.000 (24.615)	lr 0.04175
Warmup Train [11][2130/3239]	Time 0.394 (0.513)	Data 0.001 (0.012)	Loss 5.3568 (5.2721)	Top-1 acc 9.766 (9.740)	Top-5 acc 25.781 (24.622)	lr 0.04174
Warmup Train [11][2140/3239]	Time 0.576 (0.513)	Data 0.001 (0.012)	Loss 5.2886 (5.2720)	Top-1 acc 10.547 (9.742)	Top-5 acc 24.609 (24.625)	lr 0.04174
Warmup Train [11][2150/3239]	Time 0.611 (0.513)	Data 0.001 (0.012)	Loss 5.1236 (5.2718)	Top-1 acc 10.547 (9.739)	Top-5 acc 25.781 (24.626)	lr 0.04173
Warmup Train [11][2160/3239]	Time 0.465 (0.513)	Data 0.001 (0.012)	Loss 5.2316 (5.2714)	Top-1 acc 11.719 (9.743)	Top-5 acc 27.344 (24.632)	lr 0.04173
Warmup Train [11][2170/3239]	Time 0.550 (0.513)	Data 0.001 (0.012)	Loss 5.4658 (5.2713)	Top-1 acc 7.031 (9.742)	Top-5 acc 21.875 (24.632)	lr 0.04172
Warmup Train [11][2180/3239]	Time 0.457 (0.513)	Data 0.001 (0.012)	Loss 5.2481 (5.2711)	Top-1 acc 8.984 (9.741)	Top-5 acc 25.000 (24.638)	lr 0.04172
Warmup Train [11][2190/3239]	Time 0.606 (0.513)	Data 0.001 (0.012)	Loss 5.3577 (5.2710)	Top-1 acc 10.547 (9.743)	Top-5 acc 20.703 (24.640)	lr 0.04171
Warmup Train [11][2200/3239]	Time 0.695 (0.513)	Data 0.001 (0.012)	Loss 5.2899 (5.2709)	Top-1 acc 12.500 (9.747)	Top-5 acc 26.172 (24.641)	lr 0.04171
Warmup Train [11][2210/3239]	Time 0.702 (0.513)	Data 0.001 (0.012)	Loss 5.1685 (5.2708)	Top-1 acc 5.859 (9.747)	Top-5 acc 25.000 (24.645)	lr 0.04171
Warmup Train [11][2220/3239]	Time 0.348 (0.513)	Data 0.001 (0.012)	Loss 5.3412 (5.2708)	Top-1 acc 9.375 (9.747)	Top-5 acc 23.047 (24.644)	lr 0.04170
Warmup Train [11][2230/3239]	Time 0.380 (0.513)	Data 0.001 (0.012)	Loss 5.1664 (5.2707)	Top-1 acc 14.062 (9.752)	Top-5 acc 28.516 (24.654)	lr 0.04170
Warmup Train [11][2240/3239]	Time 0.527 (0.513)	Data 0.001 (0.012)	Loss 5.0908 (5.2704)	Top-1 acc 13.672 (9.754)	Top-5 acc 29.688 (24.663)	lr 0.04169
Warmup Train [11][2250/3239]	Time 0.575 (0.513)	Data 0.001 (0.012)	Loss 4.9766 (5.2703)	Top-1 acc 14.453 (9.760)	Top-5 acc 35.938 (24.669)	lr 0.04169
Warmup Train [11][2260/3239]	Time 0.640 (0.513)	Data 0.001 (0.012)	Loss 5.0752 (5.2701)	Top-1 acc 12.891 (9.761)	Top-5 acc 27.734 (24.667)	lr 0.04168
Warmup Train [11][2270/3239]	Time 0.530 (0.513)	Data 0.001 (0.012)	Loss 5.1913 (5.2700)	Top-1 acc 9.766 (9.763)	Top-5 acc 27.344 (24.676)	lr 0.04168
Warmup Train [11][2280/3239]	Time 0.520 (0.513)	Data 0.001 (0.012)	Loss 5.2238 (5.2700)	Top-1 acc 10.547 (9.761)	Top-5 acc 23.438 (24.678)	lr 0.04167
Warmup Train [11][2290/3239]	Time 0.499 (0.513)	Data 0.001 (0.012)	Loss 5.3518 (5.2697)	Top-1 acc 8.594 (9.766)	Top-5 acc 24.219 (24.688)	lr 0.04167
Warmup Train [11][2300/3239]	Time 0.383 (0.513)	Data 0.001 (0.012)	Loss 5.2426 (5.2695)	Top-1 acc 9.375 (9.768)	Top-5 acc 24.609 (24.691)	lr 0.04167
Warmup Train [11][2310/3239]	Time 0.517 (0.513)	Data 0.001 (0.012)	Loss 5.2954 (5.2694)	Top-1 acc 10.156 (9.770)	Top-5 acc 25.391 (24.694)	lr 0.04166
Warmup Train [11][2320/3239]	Time 0.473 (0.512)	Data 0.001 (0.012)	Loss 5.3025 (5.2693)	Top-1 acc 8.203 (9.772)	Top-5 acc 21.484 (24.698)	lr 0.04166
Warmup Train [11][2330/3239]	Time 0.473 (0.513)	Data 0.001 (0.012)	Loss 5.3687 (5.2692)	Top-1 acc 7.031 (9.769)	Top-5 acc 21.484 (24.698)	lr 0.04165
Warmup Train [11][2340/3239]	Time 0.299 (0.513)	Data 0.001 (0.012)	Loss 5.1965 (5.2692)	Top-1 acc 11.719 (9.772)	Top-5 acc 26.562 (24.701)	lr 0.04165
Warmup Train [11][2350/3239]	Time 0.632 (0.513)	Data 0.001 (0.012)	Loss 5.1319 (5.2690)	Top-1 acc 9.766 (9.775)	Top-5 acc 30.469 (24.705)	lr 0.04164
Warmup Train [11][2360/3239]	Time 0.374 (0.513)	Data 0.001 (0.012)	Loss 5.2678 (5.2688)	Top-1 acc 11.328 (9.780)	Top-5 acc 25.000 (24.705)	lr 0.04164
Warmup Train [11][2370/3239]	Time 0.648 (0.513)	Data 0.001 (0.012)	Loss 5.3299 (5.2687)	Top-1 acc 10.938 (9.779)	Top-5 acc 23.438 (24.703)	lr 0.04163
Warmup Train [11][2380/3239]	Time 0.505 (0.513)	Data 0.001 (0.012)	Loss 5.2375 (5.2686)	Top-1 acc 10.156 (9.779)	Top-5 acc 22.656 (24.707)	lr 0.04163
Warmup Train [11][2390/3239]	Time 0.377 (0.513)	Data 0.001 (0.011)	Loss 5.2006 (5.2686)	Top-1 acc 10.547 (9.785)	Top-5 acc 26.172 (24.708)	lr 0.04162
Warmup Train [11][2400/3239]	Time 0.363 (0.513)	Data 0.001 (0.011)	Loss 5.2212 (5.2684)	Top-1 acc 9.766 (9.787)	Top-5 acc 21.094 (24.714)	lr 0.04162
Warmup Train [11][2410/3239]	Time 0.627 (0.513)	Data 0.001 (0.012)	Loss 5.3696 (5.2683)	Top-1 acc 7.422 (9.785)	Top-5 acc 22.656 (24.716)	lr 0.04162
Warmup Train [11][2420/3239]	Time 0.611 (0.513)	Data 0.001 (0.011)	Loss 5.2766 (5.2680)	Top-1 acc 12.109 (9.792)	Top-5 acc 25.000 (24.724)	lr 0.04161
Warmup Train [11][2430/3239]	Time 0.528 (0.513)	Data 0.001 (0.011)	Loss 5.1600 (5.2681)	Top-1 acc 14.062 (9.792)	Top-5 acc 29.297 (24.726)	lr 0.04161
Warmup Train [11][2440/3239]	Time 0.494 (0.513)	Data 0.001 (0.011)	Loss 5.2141 (5.2678)	Top-1 acc 10.156 (9.796)	Top-5 acc 24.609 (24.734)	lr 0.04160
Warmup Train [11][2450/3239]	Time 0.530 (0.513)	Data 0.001 (0.011)	Loss 5.1417 (5.2674)	Top-1 acc 12.891 (9.801)	Top-5 acc 29.297 (24.746)	lr 0.04160
Warmup Train [11][2460/3239]	Time 0.615 (0.513)	Data 0.001 (0.011)	Loss 5.2476 (5.2672)	Top-1 acc 8.594 (9.802)	Top-5 acc 25.000 (24.753)	lr 0.04159
Warmup Train [11][2470/3239]	Time 0.514 (0.513)	Data 0.001 (0.011)	Loss 5.3561 (5.2673)	Top-1 acc 7.812 (9.802)	Top-5 acc 21.484 (24.747)	lr 0.04159
Warmup Train [11][2480/3239]	Time 0.540 (0.513)	Data 0.001 (0.011)	Loss 5.2962 (5.2672)	Top-1 acc 10.938 (9.805)	Top-5 acc 22.656 (24.750)	lr 0.04158
Warmup Train [11][2490/3239]	Time 0.507 (0.513)	Data 0.001 (0.011)	Loss 5.0847 (5.2668)	Top-1 acc 10.547 (9.809)	Top-5 acc 26.562 (24.761)	lr 0.04158
Warmup Train [11][2500/3239]	Time 0.482 (0.513)	Data 0.001 (0.011)	Loss 5.2130 (5.2667)	Top-1 acc 11.328 (9.810)	Top-5 acc 26.953 (24.769)	lr 0.04157
Warmup Train [11][2510/3239]	Time 0.405 (0.513)	Data 0.001 (0.011)	Loss 5.2085 (5.2665)	Top-1 acc 13.281 (9.814)	Top-5 acc 29.297 (24.776)	lr 0.04157
Warmup Train [11][2520/3239]	Time 0.456 (0.513)	Data 0.001 (0.011)	Loss 5.1893 (5.2663)	Top-1 acc 12.109 (9.817)	Top-5 acc 26.953 (24.777)	lr 0.04157
Warmup Train [11][2530/3239]	Time 0.489 (0.513)	Data 0.001 (0.011)	Loss 5.4360 (5.2662)	Top-1 acc 9.375 (9.818)	Top-5 acc 22.266 (24.777)	lr 0.04156
Warmup Train [11][2540/3239]	Time 0.579 (0.513)	Data 0.001 (0.011)	Loss 5.1402 (5.2661)	Top-1 acc 12.109 (9.821)	Top-5 acc 26.562 (24.780)	lr 0.04156
Warmup Train [11][2550/3239]	Time 0.638 (0.513)	Data 0.001 (0.011)	Loss 5.3716 (5.2659)	Top-1 acc 8.984 (9.822)	Top-5 acc 25.391 (24.788)	lr 0.04155
Warmup Train [11][2560/3239]	Time 0.693 (0.513)	Data 0.001 (0.011)	Loss 5.1011 (5.2656)	Top-1 acc 10.156 (9.824)	Top-5 acc 28.516 (24.792)	lr 0.04155
Warmup Train [11][2570/3239]	Time 0.354 (0.513)	Data 0.001 (0.011)	Loss 5.3565 (5.2656)	Top-1 acc 9.766 (9.824)	Top-5 acc 25.781 (24.793)	lr 0.04154
Warmup Train [11][2580/3239]	Time 0.552 (0.513)	Data 0.002 (0.011)	Loss 5.2035 (5.2651)	Top-1 acc 10.547 (9.829)	Top-5 acc 27.344 (24.810)	lr 0.04154
Warmup Train [11][2590/3239]	Time 0.524 (0.513)	Data 0.001 (0.011)	Loss 5.1572 (5.2651)	Top-1 acc 10.938 (9.827)	Top-5 acc 25.781 (24.812)	lr 0.04153
Warmup Train [11][2600/3239]	Time 0.529 (0.513)	Data 0.001 (0.011)	Loss 5.3375 (5.2652)	Top-1 acc 11.328 (9.828)	Top-5 acc 23.828 (24.809)	lr 0.04153
Warmup Train [11][2610/3239]	Time 0.515 (0.513)	Data 0.001 (0.011)	Loss 5.1743 (5.2650)	Top-1 acc 15.625 (9.832)	Top-5 acc 28.906 (24.814)	lr 0.04152
Warmup Train [11][2620/3239]	Time 0.493 (0.513)	Data 0.001 (0.011)	Loss 5.2657 (5.2649)	Top-1 acc 10.547 (9.832)	Top-5 acc 25.781 (24.817)	lr 0.04152
Warmup Train [11][2630/3239]	Time 0.498 (0.513)	Data 0.001 (0.011)	Loss 5.1291 (5.2647)	Top-1 acc 10.547 (9.831)	Top-5 acc 27.344 (24.821)	lr 0.04152
Warmup Train [11][2640/3239]	Time 0.608 (0.513)	Data 0.001 (0.011)	Loss 5.2041 (5.2647)	Top-1 acc 10.938 (9.831)	Top-5 acc 28.125 (24.821)	lr 0.04151
Warmup Train [11][2650/3239]	Time 0.567 (0.513)	Data 0.001 (0.011)	Loss 5.2830 (5.2647)	Top-1 acc 9.375 (9.831)	Top-5 acc 22.266 (24.818)	lr 0.04151
Warmup Train [11][2660/3239]	Time 0.631 (0.513)	Data 0.001 (0.011)	Loss 5.2109 (5.2646)	Top-1 acc 10.938 (9.834)	Top-5 acc 27.344 (24.821)	lr 0.04150
Warmup Train [11][2670/3239]	Time 0.477 (0.513)	Data 0.001 (0.011)	Loss 5.1149 (5.2645)	Top-1 acc 11.328 (9.832)	Top-5 acc 27.344 (24.824)	lr 0.04150
Warmup Train [11][2680/3239]	Time 0.449 (0.513)	Data 0.001 (0.011)	Loss 5.2199 (5.2642)	Top-1 acc 10.938 (9.836)	Top-5 acc 23.438 (24.831)	lr 0.04149
Warmup Train [11][2690/3239]	Time 0.503 (0.513)	Data 0.001 (0.011)	Loss 5.1352 (5.2641)	Top-1 acc 11.328 (9.836)	Top-5 acc 25.391 (24.832)	lr 0.04149
Warmup Train [11][2700/3239]	Time 0.566 (0.513)	Data 0.001 (0.011)	Loss 5.2728 (5.2640)	Top-1 acc 13.281 (9.836)	Top-5 acc 32.031 (24.838)	lr 0.04148
Warmup Train [11][2710/3239]	Time 0.303 (0.513)	Data 0.001 (0.011)	Loss 5.3263 (5.2638)	Top-1 acc 8.203 (9.839)	Top-5 acc 21.875 (24.843)	lr 0.04148
Warmup Train [11][2720/3239]	Time 0.510 (0.513)	Data 0.001 (0.011)	Loss 5.2198 (5.2637)	Top-1 acc 8.594 (9.841)	Top-5 acc 23.047 (24.845)	lr 0.04147
Warmup Train [11][2730/3239]	Time 0.636 (0.513)	Data 0.001 (0.011)	Loss 5.2220 (5.2636)	Top-1 acc 10.156 (9.841)	Top-5 acc 24.609 (24.846)	lr 0.04147
Warmup Train [11][2740/3239]	Time 0.581 (0.513)	Data 0.001 (0.011)	Loss 5.2177 (5.2634)	Top-1 acc 10.156 (9.849)	Top-5 acc 25.000 (24.851)	lr 0.04147
Warmup Train [11][2750/3239]	Time 0.446 (0.513)	Data 0.001 (0.011)	Loss 5.1363 (5.2635)	Top-1 acc 14.844 (9.846)	Top-5 acc 29.688 (24.847)	lr 0.04146
Warmup Train [11][2760/3239]	Time 0.389 (0.513)	Data 0.001 (0.011)	Loss 5.1487 (5.2634)	Top-1 acc 10.938 (9.847)	Top-5 acc 24.219 (24.849)	lr 0.04146
Warmup Train [11][2770/3239]	Time 0.752 (0.513)	Data 0.001 (0.011)	Loss 5.2505 (5.2632)	Top-1 acc 10.156 (9.847)	Top-5 acc 21.484 (24.856)	lr 0.04145
Warmup Train [11][2780/3239]	Time 0.526 (0.513)	Data 0.001 (0.011)	Loss 5.2019 (5.2630)	Top-1 acc 7.031 (9.849)	Top-5 acc 25.000 (24.859)	lr 0.04145
Warmup Train [11][2790/3239]	Time 0.381 (0.513)	Data 0.001 (0.011)	Loss 5.2356 (5.2628)	Top-1 acc 11.328 (9.852)	Top-5 acc 21.484 (24.861)	lr 0.04144
Warmup Train [11][2800/3239]	Time 0.512 (0.513)	Data 0.001 (0.011)	Loss 5.2280 (5.2625)	Top-1 acc 10.547 (9.857)	Top-5 acc 22.656 (24.868)	lr 0.04144
Warmup Train [11][2810/3239]	Time 0.508 (0.513)	Data 0.001 (0.011)	Loss 5.3561 (5.2624)	Top-1 acc 7.812 (9.859)	Top-5 acc 18.359 (24.872)	lr 0.04143
Warmup Train [11][2820/3239]	Time 0.560 (0.513)	Data 0.001 (0.011)	Loss 5.1649 (5.2623)	Top-1 acc 8.984 (9.859)	Top-5 acc 28.125 (24.874)	lr 0.04143
Warmup Train [11][2830/3239]	Time 0.410 (0.512)	Data 0.001 (0.011)	Loss 5.2580 (5.2620)	Top-1 acc 9.375 (9.863)	Top-5 acc 25.000 (24.879)	lr 0.04142
Warmup Train [11][2840/3239]	Time 0.430 (0.512)	Data 0.001 (0.011)	Loss 5.1896 (5.2617)	Top-1 acc 12.500 (9.866)	Top-5 acc 28.516 (24.885)	lr 0.04142
Warmup Train [11][2850/3239]	Time 0.592 (0.513)	Data 0.001 (0.011)	Loss 5.0612 (5.2614)	Top-1 acc 12.500 (9.870)	Top-5 acc 26.953 (24.890)	lr 0.04142
Warmup Train [11][2860/3239]	Time 0.350 (0.513)	Data 0.001 (0.011)	Loss 5.3753 (5.2616)	Top-1 acc 8.203 (9.868)	Top-5 acc 23.047 (24.891)	lr 0.04141
Warmup Train [11][2870/3239]	Time 0.520 (0.512)	Data 0.001 (0.011)	Loss 5.2702 (5.2614)	Top-1 acc 7.422 (9.872)	Top-5 acc 24.219 (24.895)	lr 0.04141
Warmup Train [11][2880/3239]	Time 0.642 (0.512)	Data 0.001 (0.011)	Loss 5.2805 (5.2614)	Top-1 acc 9.766 (9.873)	Top-5 acc 19.922 (24.892)	lr 0.04140
Warmup Train [11][2890/3239]	Time 0.683 (0.513)	Data 0.001 (0.011)	Loss 5.2137 (5.2612)	Top-1 acc 14.844 (9.876)	Top-5 acc 27.344 (24.899)	lr 0.04140
Warmup Train [11][2900/3239]	Time 0.564 (0.513)	Data 0.001 (0.011)	Loss 5.2719 (5.2609)	Top-1 acc 12.109 (9.881)	Top-5 acc 26.953 (24.904)	lr 0.04139
Warmup Train [11][2910/3239]	Time 0.479 (0.513)	Data 0.001 (0.011)	Loss 5.1536 (5.2608)	Top-1 acc 10.547 (9.882)	Top-5 acc 27.344 (24.907)	lr 0.04139
Warmup Train [11][2920/3239]	Time 0.505 (0.513)	Data 0.001 (0.011)	Loss 5.1451 (5.2606)	Top-1 acc 10.938 (9.883)	Top-5 acc 27.344 (24.911)	lr 0.04138
Warmup Train [11][2930/3239]	Time 0.465 (0.513)	Data 0.001 (0.011)	Loss 5.3998 (5.2604)	Top-1 acc 8.984 (9.884)	Top-5 acc 21.875 (24.917)	lr 0.04138
Warmup Train [11][2940/3239]	Time 0.397 (0.513)	Data 0.001 (0.011)	Loss 5.1351 (5.2603)	Top-1 acc 9.766 (9.888)	Top-5 acc 23.828 (24.923)	lr 0.04137
Warmup Train [11][2950/3239]	Time 0.505 (0.513)	Data 0.001 (0.011)	Loss 5.2153 (5.2600)	Top-1 acc 10.938 (9.892)	Top-5 acc 25.781 (24.930)	lr 0.04137
Warmup Train [11][2960/3239]	Time 0.628 (0.513)	Data 0.001 (0.011)	Loss 5.1575 (5.2599)	Top-1 acc 8.984 (9.895)	Top-5 acc 26.172 (24.931)	lr 0.04136
Warmup Train [11][2970/3239]	Time 0.500 (0.513)	Data 0.001 (0.011)	Loss 5.2478 (5.2598)	Top-1 acc 9.766 (9.897)	Top-5 acc 23.438 (24.936)	lr 0.04136
Warmup Train [11][2980/3239]	Time 0.554 (0.513)	Data 0.001 (0.011)	Loss 5.2400 (5.2595)	Top-1 acc 10.938 (9.900)	Top-5 acc 23.047 (24.940)	lr 0.04136
Warmup Train [11][2990/3239]	Time 0.403 (0.512)	Data 0.001 (0.010)	Loss 5.2274 (5.2593)	Top-1 acc 12.109 (9.904)	Top-5 acc 25.000 (24.945)	lr 0.04135
Warmup Train [11][3000/3239]	Time 0.576 (0.513)	Data 0.001 (0.011)	Loss 5.2200 (5.2592)	Top-1 acc 9.766 (9.904)	Top-5 acc 26.953 (24.949)	lr 0.04135
Warmup Train [11][3010/3239]	Time 0.344 (0.512)	Data 0.001 (0.010)	Loss 5.1755 (5.2590)	Top-1 acc 9.375 (9.907)	Top-5 acc 28.516 (24.954)	lr 0.04134
Warmup Train [11][3020/3239]	Time 0.557 (0.512)	Data 0.001 (0.011)	Loss 5.2846 (5.2589)	Top-1 acc 8.594 (9.906)	Top-5 acc 23.828 (24.957)	lr 0.04134
Warmup Train [11][3030/3239]	Time 0.464 (0.512)	Data 0.001 (0.011)	Loss 5.3843 (5.2588)	Top-1 acc 5.078 (9.904)	Top-5 acc 21.094 (24.958)	lr 0.04133
Warmup Train [11][3040/3239]	Time 0.522 (0.512)	Data 0.001 (0.010)	Loss 5.0329 (5.2588)	Top-1 acc 15.234 (9.905)	Top-5 acc 32.812 (24.959)	lr 0.04133
Warmup Train [11][3050/3239]	Time 0.555 (0.512)	Data 0.001 (0.010)	Loss 5.2347 (5.2586)	Top-1 acc 12.891 (9.908)	Top-5 acc 26.172 (24.965)	lr 0.04132
Warmup Train [11][3060/3239]	Time 0.414 (0.512)	Data 0.001 (0.010)	Loss 5.1446 (5.2585)	Top-1 acc 11.328 (9.912)	Top-5 acc 28.125 (24.965)	lr 0.04132
Warmup Train [11][3070/3239]	Time 0.584 (0.512)	Data 0.001 (0.010)	Loss 5.2853 (5.2583)	Top-1 acc 12.500 (9.913)	Top-5 acc 25.781 (24.967)	lr 0.04131
Warmup Train [11][3080/3239]	Time 0.598 (0.512)	Data 0.001 (0.010)	Loss 5.2475 (5.2581)	Top-1 acc 10.547 (9.916)	Top-5 acc 23.438 (24.972)	lr 0.04131
Warmup Train [11][3090/3239]	Time 0.582 (0.512)	Data 0.001 (0.010)	Loss 5.3429 (5.2578)	Top-1 acc 8.594 (9.922)	Top-5 acc 26.953 (24.981)	lr 0.04131
Warmup Train [11][3100/3239]	Time 0.658 (0.512)	Data 0.001 (0.010)	Loss 5.0509 (5.2574)	Top-1 acc 12.109 (9.927)	Top-5 acc 27.734 (24.987)	lr 0.04130
Warmup Train [11][3110/3239]	Time 0.527 (0.512)	Data 0.001 (0.010)	Loss 5.1302 (5.2571)	Top-1 acc 16.797 (9.933)	Top-5 acc 31.641 (24.996)	lr 0.04130
Warmup Train [11][3120/3239]	Time 0.362 (0.512)	Data 0.020 (0.010)	Loss 5.2009 (5.2569)	Top-1 acc 11.328 (9.938)	Top-5 acc 26.953 (25.002)	lr 0.04129
Warmup Train [11][3130/3239]	Time 0.600 (0.512)	Data 0.001 (0.010)	Loss 4.9964 (5.2566)	Top-1 acc 15.234 (9.943)	Top-5 acc 29.688 (25.011)	lr 0.04129
Warmup Train [11][3140/3239]	Time 0.499 (0.512)	Data 0.001 (0.010)	Loss 5.2547 (5.2565)	Top-1 acc 7.031 (9.942)	Top-5 acc 25.000 (25.013)	lr 0.04128
Warmup Train [11][3150/3239]	Time 0.482 (0.512)	Data 0.001 (0.010)	Loss 5.1298 (5.2563)	Top-1 acc 12.500 (9.944)	Top-5 acc 28.125 (25.017)	lr 0.04128
Warmup Train [11][3160/3239]	Time 0.339 (0.512)	Data 0.001 (0.010)	Loss 5.2944 (5.2562)	Top-1 acc 7.031 (9.946)	Top-5 acc 22.656 (25.020)	lr 0.04127
Warmup Train [11][3170/3239]	Time 0.300 (0.512)	Data 0.001 (0.010)	Loss 5.1185 (5.2559)	Top-1 acc 11.328 (9.948)	Top-5 acc 31.250 (25.026)	lr 0.04127
Warmup Train [11][3180/3239]	Time 0.583 (0.512)	Data 0.000 (0.010)	Loss 5.2014 (5.2558)	Top-1 acc 11.328 (9.952)	Top-5 acc 26.562 (25.028)	lr 0.04126
Warmup Train [11][3190/3239]	Time 0.614 (0.512)	Data 0.000 (0.010)	Loss 5.2894 (5.2557)	Top-1 acc 8.594 (9.953)	Top-5 acc 23.047 (25.031)	lr 0.04126
Warmup Train [11][3200/3239]	Time 0.510 (0.512)	Data 0.000 (0.010)	Loss 5.1907 (5.2554)	Top-1 acc 12.891 (9.958)	Top-5 acc 26.172 (25.038)	lr 0.04125
Warmup Train [11][3210/3239]	Time 0.561 (0.512)	Data 0.000 (0.010)	Loss 5.1820 (5.2553)	Top-1 acc 13.281 (9.960)	Top-5 acc 31.641 (25.043)	lr 0.04125
Warmup Train [11][3220/3239]	Time 0.683 (0.512)	Data 0.000 (0.010)	Loss 5.1247 (5.2551)	Top-1 acc 10.547 (9.964)	Top-5 acc 31.641 (25.050)	lr 0.04125
Warmup Train [11][3230/3239]	Time 0.419 (0.512)	Data 0.000 (0.010)	Loss 5.2522 (5.2549)	Top-1 acc 11.719 (9.965)	Top-5 acc 26.562 (25.054)	lr 0.04124
Warmup Train [11][3239/3239]	Time 0.323 (0.512)	Data 0.000 (0.010)	Loss 5.4177 (5.2549)	Top-1 acc 6.173 (9.965)	Top-5 acc 17.284 (25.053)	lr 0.04124
==========Warmup Valid [11/40]	loss 4.485	top-1 acc 14.825	top-5 acc 33.315	Train top-1 9.965	top-5 25.053	flops: 442.4M
Warmup Train [12][0/3239]	Time 14.019 (14.019)	Data 11.739 (11.739)	Loss 5.2638 (5.2638)	Top-1 acc 7.812 (7.812)	Top-5 acc 26.562 (26.562)	lr 0.04124
Warmup Train [12][10/3239]	Time 0.531 (1.782)	Data 0.001 (1.077)	Loss 5.2280 (5.2477)	Top-1 acc 9.375 (9.837)	Top-5 acc 24.609 (25.604)	lr 0.04123
Warmup Train [12][20/3239]	Time 0.413 (1.171)	Data 0.001 (0.565)	Loss 5.2660 (5.2489)	Top-1 acc 7.422 (9.487)	Top-5 acc 23.438 (25.205)	lr 0.04123
Warmup Train [12][30/3239]	Time 0.493 (0.968)	Data 0.001 (0.388)	Loss 5.1652 (5.2349)	Top-1 acc 12.500 (9.967)	Top-5 acc 29.688 (25.794)	lr 0.04122
Warmup Train [12][40/3239]	Time 0.421 (0.848)	Data 0.001 (0.294)	Loss 5.1871 (5.2314)	Top-1 acc 12.891 (9.918)	Top-5 acc 26.562 (25.743)	lr 0.04122
Warmup Train [12][50/3239]	Time 0.552 (0.786)	Data 0.001 (0.239)	Loss 5.3149 (5.2238)	Top-1 acc 6.641 (10.003)	Top-5 acc 25.000 (25.843)	lr 0.04121
Warmup Train [12][60/3239]	Time 0.570 (0.743)	Data 0.001 (0.201)	Loss 5.1746 (5.2215)	Top-1 acc 12.500 (10.188)	Top-5 acc 28.516 (26.025)	lr 0.04121
Warmup Train [12][70/3239]	Time 0.558 (0.709)	Data 0.001 (0.173)	Loss 5.1881 (5.2224)	Top-1 acc 12.891 (10.255)	Top-5 acc 26.172 (25.952)	lr 0.04120
Warmup Train [12][80/3239]	Time 0.461 (0.685)	Data 0.001 (0.152)	Loss 5.0888 (5.2217)	Top-1 acc 12.891 (10.335)	Top-5 acc 28.516 (26.013)	lr 0.04120
Warmup Train [12][90/3239]	Time 0.417 (0.663)	Data 0.001 (0.135)	Loss 5.3375 (5.2201)	Top-1 acc 10.938 (10.375)	Top-5 acc 22.266 (26.090)	lr 0.04119
Warmup Train [12][100/3239]	Time 0.325 (0.648)	Data 0.001 (0.123)	Loss 5.2636 (5.2213)	Top-1 acc 9.766 (10.319)	Top-5 acc 25.391 (26.017)	lr 0.04119
Warmup Train [12][110/3239]	Time 0.601 (0.637)	Data 0.001 (0.113)	Loss 5.2226 (5.2197)	Top-1 acc 8.984 (10.248)	Top-5 acc 26.172 (25.929)	lr 0.04119
Warmup Train [12][120/3239]	Time 0.405 (0.626)	Data 0.001 (0.104)	Loss 5.1533 (5.2147)	Top-1 acc 10.156 (10.282)	Top-5 acc 31.641 (26.007)	lr 0.04118
Warmup Train [12][130/3239]	Time 0.446 (0.616)	Data 0.001 (0.097)	Loss 5.1771 (5.2120)	Top-1 acc 9.375 (10.296)	Top-5 acc 25.781 (26.035)	lr 0.04118
Warmup Train [12][140/3239]	Time 0.543 (0.609)	Data 0.001 (0.091)	Loss 5.1622 (5.2108)	Top-1 acc 11.719 (10.336)	Top-5 acc 27.344 (26.080)	lr 0.04117
Warmup Train [12][150/3239]	Time 0.635 (0.601)	Data 0.001 (0.085)	Loss 5.0629 (5.2070)	Top-1 acc 11.328 (10.386)	Top-5 acc 29.688 (26.162)	lr 0.04117
Warmup Train [12][160/3239]	Time 0.469 (0.595)	Data 0.001 (0.080)	Loss 5.3522 (5.2088)	Top-1 acc 8.984 (10.360)	Top-5 acc 21.484 (26.063)	lr 0.04116
Warmup Train [12][170/3239]	Time 0.531 (0.591)	Data 0.001 (0.075)	Loss 5.0878 (5.2077)	Top-1 acc 13.281 (10.433)	Top-5 acc 29.688 (26.108)	lr 0.04116
Warmup Train [12][180/3239]	Time 0.571 (0.585)	Data 0.001 (0.071)	Loss 5.0231 (5.2066)	Top-1 acc 12.109 (10.432)	Top-5 acc 33.984 (26.118)	lr 0.04115
Warmup Train [12][190/3239]	Time 0.358 (0.581)	Data 0.001 (0.068)	Loss 5.2586 (5.2065)	Top-1 acc 10.547 (10.477)	Top-5 acc 21.875 (26.162)	lr 0.04115
Warmup Train [12][200/3239]	Time 0.490 (0.578)	Data 0.001 (0.065)	Loss 4.9894 (5.2036)	Top-1 acc 15.625 (10.529)	Top-5 acc 31.641 (26.209)	lr 0.04114
Warmup Train [12][210/3239]	Time 0.347 (0.574)	Data 0.001 (0.062)	Loss 5.3469 (5.2023)	Top-1 acc 6.250 (10.549)	Top-5 acc 23.438 (26.281)	lr 0.04114
Warmup Train [12][220/3239]	Time 0.459 (0.571)	Data 0.001 (0.060)	Loss 5.3874 (5.2016)	Top-1 acc 7.031 (10.540)	Top-5 acc 23.438 (26.304)	lr 0.04113
Warmup Train [12][230/3239]	Time 0.507 (0.567)	Data 0.001 (0.057)	Loss 5.2091 (5.2018)	Top-1 acc 9.766 (10.547)	Top-5 acc 29.297 (26.336)	lr 0.04113
Warmup Train [12][240/3239]	Time 0.532 (0.566)	Data 0.025 (0.055)	Loss 5.2261 (5.2011)	Top-1 acc 12.891 (10.587)	Top-5 acc 25.781 (26.347)	lr 0.04113
Warmup Train [12][250/3239]	Time 0.562 (0.564)	Data 0.001 (0.053)	Loss 5.2106 (5.2025)	Top-1 acc 10.547 (10.576)	Top-5 acc 24.609 (26.320)	lr 0.04112
Warmup Train [12][260/3239]	Time 0.381 (0.562)	Data 0.001 (0.051)	Loss 5.1974 (5.2024)	Top-1 acc 12.109 (10.562)	Top-5 acc 27.344 (26.326)	lr 0.04112
Warmup Train [12][270/3239]	Time 0.389 (0.560)	Data 0.001 (0.050)	Loss 5.1438 (5.2037)	Top-1 acc 14.453 (10.558)	Top-5 acc 30.078 (26.312)	lr 0.04111
Warmup Train [12][280/3239]	Time 0.471 (0.559)	Data 0.001 (0.049)	Loss 5.1966 (5.2037)	Top-1 acc 10.938 (10.586)	Top-5 acc 27.344 (26.323)	lr 0.04111
Warmup Train [12][290/3239]	Time 0.411 (0.558)	Data 0.001 (0.047)	Loss 5.2074 (5.2035)	Top-1 acc 13.281 (10.602)	Top-5 acc 28.125 (26.368)	lr 0.04110
Warmup Train [12][300/3239]	Time 0.549 (0.556)	Data 0.001 (0.046)	Loss 5.2303 (5.2031)	Top-1 acc 10.938 (10.638)	Top-5 acc 25.781 (26.377)	lr 0.04110
Warmup Train [12][310/3239]	Time 0.450 (0.554)	Data 0.001 (0.044)	Loss 5.1146 (5.2032)	Top-1 acc 11.328 (10.656)	Top-5 acc 26.562 (26.388)	lr 0.04109
Warmup Train [12][320/3239]	Time 0.527 (0.553)	Data 0.001 (0.043)	Loss 5.3671 (5.2038)	Top-1 acc 7.422 (10.639)	Top-5 acc 23.438 (26.351)	lr 0.04109
Warmup Train [12][330/3239]	Time 0.554 (0.551)	Data 0.001 (0.042)	Loss 5.2146 (5.2055)	Top-1 acc 8.984 (10.608)	Top-5 acc 24.609 (26.308)	lr 0.04108
Warmup Train [12][340/3239]	Time 0.623 (0.550)	Data 0.001 (0.041)	Loss 5.2284 (5.2047)	Top-1 acc 10.938 (10.597)	Top-5 acc 21.875 (26.309)	lr 0.04108
Warmup Train [12][350/3239]	Time 0.518 (0.550)	Data 0.001 (0.040)	Loss 5.0823 (5.2035)	Top-1 acc 9.766 (10.616)	Top-5 acc 27.734 (26.356)	lr 0.04107
Warmup Train [12][360/3239]	Time 0.516 (0.548)	Data 0.001 (0.039)	Loss 5.1912 (5.2018)	Top-1 acc 10.156 (10.659)	Top-5 acc 24.219 (26.384)	lr 0.04107
Warmup Train [12][370/3239]	Time 0.464 (0.547)	Data 0.001 (0.038)	Loss 5.2486 (5.2016)	Top-1 acc 7.031 (10.652)	Top-5 acc 21.875 (26.345)	lr 0.04107
Warmup Train [12][380/3239]	Time 0.402 (0.546)	Data 0.001 (0.037)	Loss 5.1668 (5.2006)	Top-1 acc 8.594 (10.660)	Top-5 acc 26.953 (26.376)	lr 0.04106
Warmup Train [12][390/3239]	Time 0.551 (0.546)	Data 0.001 (0.036)	Loss 5.0896 (5.2000)	Top-1 acc 12.500 (10.678)	Top-5 acc 27.734 (26.399)	lr 0.04106
Warmup Train [12][400/3239]	Time 0.599 (0.545)	Data 0.001 (0.036)	Loss 5.2287 (5.2000)	Top-1 acc 8.594 (10.652)	Top-5 acc 22.266 (26.385)	lr 0.04105
Warmup Train [12][410/3239]	Time 0.608 (0.545)	Data 0.001 (0.035)	Loss 5.1845 (5.1998)	Top-1 acc 9.375 (10.650)	Top-5 acc 25.781 (26.382)	lr 0.04105
Warmup Train [12][420/3239]	Time 0.557 (0.544)	Data 0.001 (0.034)	Loss 5.1070 (5.2005)	Top-1 acc 14.453 (10.659)	Top-5 acc 29.688 (26.376)	lr 0.04104
Warmup Train [12][430/3239]	Time 0.534 (0.544)	Data 0.001 (0.033)	Loss 5.1066 (5.2010)	Top-1 acc 9.766 (10.649)	Top-5 acc 28.906 (26.378)	lr 0.04104
Warmup Train [12][440/3239]	Time 0.425 (0.543)	Data 0.001 (0.033)	Loss 5.2294 (5.2011)	Top-1 acc 12.109 (10.670)	Top-5 acc 27.734 (26.384)	lr 0.04103
Warmup Train [12][450/3239]	Time 0.311 (0.542)	Data 0.001 (0.032)	Loss 5.0901 (5.2006)	Top-1 acc 15.234 (10.679)	Top-5 acc 30.078 (26.404)	lr 0.04103
Warmup Train [12][460/3239]	Time 0.586 (0.541)	Data 0.001 (0.032)	Loss 5.1874 (5.2009)	Top-1 acc 10.156 (10.686)	Top-5 acc 21.484 (26.390)	lr 0.04102
Warmup Train [12][470/3239]	Time 0.398 (0.539)	Data 0.001 (0.031)	Loss 5.3244 (5.2006)	Top-1 acc 8.203 (10.697)	Top-5 acc 22.656 (26.385)	lr 0.04102
Warmup Train [12][480/3239]	Time 0.621 (0.539)	Data 0.001 (0.031)	Loss 5.1903 (5.2003)	Top-1 acc 13.281 (10.691)	Top-5 acc 24.219 (26.393)	lr 0.04101
Warmup Train [12][490/3239]	Time 0.513 (0.537)	Data 0.001 (0.030)	Loss 5.1693 (5.1986)	Top-1 acc 16.406 (10.724)	Top-5 acc 31.641 (26.436)	lr 0.04101
Warmup Train [12][500/3239]	Time 0.511 (0.537)	Data 0.001 (0.030)	Loss 5.0606 (5.1978)	Top-1 acc 13.672 (10.732)	Top-5 acc 28.125 (26.446)	lr 0.04100
Warmup Train [12][510/3239]	Time 0.536 (0.536)	Data 0.001 (0.029)	Loss 5.1628 (5.1984)	Top-1 acc 10.938 (10.723)	Top-5 acc 28.125 (26.424)	lr 0.04100
Warmup Train [12][520/3239]	Time 0.350 (0.536)	Data 0.001 (0.029)	Loss 5.2324 (5.1978)	Top-1 acc 10.938 (10.731)	Top-5 acc 24.609 (26.424)	lr 0.04100
Warmup Train [12][530/3239]	Time 0.446 (0.535)	Data 0.001 (0.029)	Loss 5.1480 (5.1967)	Top-1 acc 13.281 (10.745)	Top-5 acc 26.953 (26.436)	lr 0.04099
Warmup Train [12][540/3239]	Time 0.468 (0.535)	Data 0.001 (0.028)	Loss 5.2748 (5.1966)	Top-1 acc 9.766 (10.750)	Top-5 acc 25.391 (26.429)	lr 0.04099
Warmup Train [12][550/3239]	Time 0.601 (0.535)	Data 0.001 (0.028)	Loss 4.9980 (5.1957)	Top-1 acc 13.281 (10.770)	Top-5 acc 27.734 (26.426)	lr 0.04098
Warmup Train [12][560/3239]	Time 0.639 (0.535)	Data 0.001 (0.027)	Loss 5.4996 (5.1967)	Top-1 acc 8.594 (10.759)	Top-5 acc 18.750 (26.395)	lr 0.04098
Warmup Train [12][570/3239]	Time 0.594 (0.534)	Data 0.001 (0.027)	Loss 5.2077 (5.1973)	Top-1 acc 10.156 (10.740)	Top-5 acc 26.953 (26.359)	lr 0.04097
Warmup Train [12][580/3239]	Time 0.442 (0.534)	Data 0.001 (0.027)	Loss 5.1969 (5.1969)	Top-1 acc 12.109 (10.748)	Top-5 acc 23.047 (26.366)	lr 0.04097
Warmup Train [12][590/3239]	Time 0.493 (0.534)	Data 0.001 (0.026)	Loss 5.2193 (5.1963)	Top-1 acc 10.156 (10.770)	Top-5 acc 25.000 (26.389)	lr 0.04096
Warmup Train [12][600/3239]	Time 0.513 (0.533)	Data 0.002 (0.026)	Loss 5.2419 (5.1961)	Top-1 acc 12.109 (10.776)	Top-5 acc 26.172 (26.386)	lr 0.04096
Warmup Train [12][610/3239]	Time 0.607 (0.533)	Data 0.001 (0.026)	Loss 5.0705 (5.1957)	Top-1 acc 10.547 (10.783)	Top-5 acc 28.516 (26.412)	lr 0.04095
Warmup Train [12][620/3239]	Time 0.568 (0.532)	Data 0.001 (0.025)	Loss 5.0644 (5.1950)	Top-1 acc 10.938 (10.797)	Top-5 acc 27.734 (26.434)	lr 0.04095
Warmup Train [12][630/3239]	Time 0.546 (0.532)	Data 0.001 (0.025)	Loss 5.1726 (5.1950)	Top-1 acc 12.500 (10.788)	Top-5 acc 26.562 (26.439)	lr 0.04094
Warmup Train [12][640/3239]	Time 0.487 (0.532)	Data 0.001 (0.025)	Loss 5.1155 (5.1946)	Top-1 acc 9.766 (10.794)	Top-5 acc 27.344 (26.454)	lr 0.04094
Warmup Train [12][650/3239]	Time 0.556 (0.532)	Data 0.001 (0.024)	Loss 5.1390 (5.1941)	Top-1 acc 12.109 (10.792)	Top-5 acc 25.391 (26.454)	lr 0.04093
Warmup Train [12][660/3239]	Time 0.486 (0.532)	Data 0.001 (0.024)	Loss 4.9824 (5.1940)	Top-1 acc 13.281 (10.799)	Top-5 acc 33.984 (26.467)	lr 0.04093
Warmup Train [12][670/3239]	Time 0.612 (0.532)	Data 0.001 (0.024)	Loss 5.1368 (5.1936)	Top-1 acc 12.500 (10.797)	Top-5 acc 28.516 (26.478)	lr 0.04093
Warmup Train [12][680/3239]	Time 0.447 (0.531)	Data 0.001 (0.023)	Loss 5.3100 (5.1931)	Top-1 acc 12.500 (10.808)	Top-5 acc 25.000 (26.491)	lr 0.04092
Warmup Train [12][690/3239]	Time 0.572 (0.531)	Data 0.001 (0.023)	Loss 5.3055 (5.1936)	Top-1 acc 9.375 (10.810)	Top-5 acc 24.609 (26.487)	lr 0.04092
Warmup Train [12][700/3239]	Time 0.393 (0.531)	Data 0.001 (0.023)	Loss 5.1134 (5.1936)	Top-1 acc 10.938 (10.807)	Top-5 acc 26.562 (26.492)	lr 0.04091
Warmup Train [12][710/3239]	Time 0.507 (0.530)	Data 0.001 (0.023)	Loss 5.0670 (5.1934)	Top-1 acc 14.844 (10.813)	Top-5 acc 33.203 (26.514)	lr 0.04091
Warmup Train [12][720/3239]	Time 0.644 (0.530)	Data 0.001 (0.023)	Loss 5.1144 (5.1932)	Top-1 acc 14.062 (10.824)	Top-5 acc 28.906 (26.535)	lr 0.04090
Warmup Train [12][730/3239]	Time 0.474 (0.529)	Data 0.002 (0.022)	Loss 5.1230 (5.1925)	Top-1 acc 11.328 (10.828)	Top-5 acc 26.172 (26.558)	lr 0.04090
Warmup Train [12][740/3239]	Time 0.318 (0.528)	Data 0.001 (0.022)	Loss 5.1756 (5.1922)	Top-1 acc 12.891 (10.842)	Top-5 acc 29.297 (26.566)	lr 0.04089
Warmup Train [12][750/3239]	Time 0.463 (0.528)	Data 0.001 (0.022)	Loss 5.2684 (5.1920)	Top-1 acc 10.547 (10.854)	Top-5 acc 23.047 (26.577)	lr 0.04089
Warmup Train [12][760/3239]	Time 0.638 (0.527)	Data 0.001 (0.022)	Loss 5.2035 (5.1919)	Top-1 acc 10.547 (10.852)	Top-5 acc 22.656 (26.561)	lr 0.04088
Warmup Train [12][770/3239]	Time 0.507 (0.527)	Data 0.001 (0.022)	Loss 5.2738 (5.1925)	Top-1 acc 11.328 (10.853)	Top-5 acc 23.828 (26.535)	lr 0.04088
Warmup Train [12][780/3239]	Time 0.525 (0.527)	Data 0.001 (0.021)	Loss 5.1824 (5.1923)	Top-1 acc 13.672 (10.861)	Top-5 acc 28.906 (26.546)	lr 0.04087
Warmup Train [12][790/3239]	Time 0.447 (0.527)	Data 0.001 (0.021)	Loss 5.2467 (5.1915)	Top-1 acc 8.203 (10.860)	Top-5 acc 26.172 (26.556)	lr 0.04087
Warmup Train [12][800/3239]	Time 0.345 (0.527)	Data 0.001 (0.021)	Loss 5.3218 (5.1912)	Top-1 acc 10.547 (10.862)	Top-5 acc 23.047 (26.555)	lr 0.04086
Warmup Train [12][810/3239]	Time 0.614 (0.527)	Data 0.001 (0.021)	Loss 5.1888 (5.1909)	Top-1 acc 10.938 (10.860)	Top-5 acc 26.562 (26.564)	lr 0.04086
Warmup Train [12][820/3239]	Time 0.586 (0.527)	Data 0.001 (0.021)	Loss 5.1498 (5.1909)	Top-1 acc 12.500 (10.855)	Top-5 acc 26.953 (26.550)	lr 0.04086
Warmup Train [12][830/3239]	Time 0.434 (0.526)	Data 0.001 (0.021)	Loss 5.1443 (5.1905)	Top-1 acc 12.891 (10.851)	Top-5 acc 30.469 (26.562)	lr 0.04085
Warmup Train [12][840/3239]	Time 0.517 (0.526)	Data 0.001 (0.021)	Loss 5.2710 (5.1907)	Top-1 acc 7.812 (10.853)	Top-5 acc 25.000 (26.557)	lr 0.04085
Warmup Train [12][850/3239]	Time 0.520 (0.526)	Data 0.001 (0.020)	Loss 5.2043 (5.1900)	Top-1 acc 13.281 (10.868)	Top-5 acc 26.953 (26.581)	lr 0.04084
Warmup Train [12][860/3239]	Time 0.469 (0.526)	Data 0.001 (0.020)	Loss 5.0481 (5.1897)	Top-1 acc 13.672 (10.879)	Top-5 acc 31.250 (26.597)	lr 0.04084
Warmup Train [12][870/3239]	Time 0.618 (0.526)	Data 0.001 (0.020)	Loss 5.2531 (5.1894)	Top-1 acc 8.594 (10.885)	Top-5 acc 26.172 (26.602)	lr 0.04083
Warmup Train [12][880/3239]	Time 0.609 (0.526)	Data 0.001 (0.020)	Loss 5.2108 (5.1891)	Top-1 acc 10.156 (10.881)	Top-5 acc 26.172 (26.602)	lr 0.04083
Warmup Train [12][890/3239]	Time 0.651 (0.526)	Data 0.001 (0.020)	Loss 5.0500 (5.1892)	Top-1 acc 10.547 (10.887)	Top-5 acc 29.297 (26.609)	lr 0.04082
Warmup Train [12][900/3239]	Time 0.418 (0.526)	Data 0.001 (0.020)	Loss 5.1379 (5.1886)	Top-1 acc 11.328 (10.894)	Top-5 acc 26.953 (26.611)	lr 0.04082
Warmup Train [12][910/3239]	Time 0.648 (0.526)	Data 0.001 (0.019)	Loss 5.2951 (5.1884)	Top-1 acc 7.031 (10.885)	Top-5 acc 23.047 (26.608)	lr 0.04081
Warmup Train [12][920/3239]	Time 0.540 (0.526)	Data 0.001 (0.019)	Loss 5.0825 (5.1879)	Top-1 acc 12.500 (10.896)	Top-5 acc 29.297 (26.624)	lr 0.04081
Warmup Train [12][930/3239]	Time 0.600 (0.526)	Data 0.001 (0.019)	Loss 5.2254 (5.1878)	Top-1 acc 14.453 (10.906)	Top-5 acc 27.734 (26.625)	lr 0.04080
Warmup Train [12][940/3239]	Time 0.552 (0.526)	Data 0.001 (0.019)	Loss 5.2006 (5.1876)	Top-1 acc 13.672 (10.911)	Top-5 acc 27.734 (26.632)	lr 0.04080
Warmup Train [12][950/3239]	Time 0.554 (0.526)	Data 0.001 (0.019)	Loss 5.0560 (5.1878)	Top-1 acc 12.500 (10.894)	Top-5 acc 30.469 (26.624)	lr 0.04079
Warmup Train [12][960/3239]	Time 0.513 (0.526)	Data 0.001 (0.019)	Loss 5.3288 (5.1877)	Top-1 acc 9.766 (10.900)	Top-5 acc 24.219 (26.623)	lr 0.04079
Warmup Train [12][970/3239]	Time 0.371 (0.525)	Data 0.001 (0.018)	Loss 5.1798 (5.1877)	Top-1 acc 11.328 (10.904)	Top-5 acc 25.000 (26.622)	lr 0.04078
Warmup Train [12][980/3239]	Time 0.569 (0.525)	Data 0.001 (0.018)	Loss 5.2134 (5.1870)	Top-1 acc 7.812 (10.908)	Top-5 acc 23.438 (26.638)	lr 0.04078
Warmup Train [12][990/3239]	Time 0.404 (0.525)	Data 0.001 (0.018)	Loss 5.3290 (5.1868)	Top-1 acc 7.812 (10.914)	Top-5 acc 22.656 (26.637)	lr 0.04078
Warmup Train [12][1000/3239]	Time 0.657 (0.525)	Data 0.001 (0.018)	Loss 5.2777 (5.1865)	Top-1 acc 10.938 (10.914)	Top-5 acc 25.391 (26.650)	lr 0.04077
Warmup Train [12][1010/3239]	Time 0.571 (0.524)	Data 0.001 (0.018)	Loss 5.1871 (5.1866)	Top-1 acc 8.203 (10.917)	Top-5 acc 26.562 (26.651)	lr 0.04077
Warmup Train [12][1020/3239]	Time 0.530 (0.524)	Data 0.001 (0.018)	Loss 5.2485 (5.1865)	Top-1 acc 8.984 (10.918)	Top-5 acc 26.953 (26.655)	lr 0.04076
Warmup Train [12][1030/3239]	Time 0.398 (0.523)	Data 0.001 (0.018)	Loss 5.2977 (5.1861)	Top-1 acc 8.984 (10.919)	Top-5 acc 24.609 (26.663)	lr 0.04076
Warmup Train [12][1040/3239]	Time 0.534 (0.523)	Data 0.001 (0.018)	Loss 5.2705 (5.1864)	Top-1 acc 8.203 (10.913)	Top-5 acc 24.609 (26.657)	lr 0.04075
Warmup Train [12][1050/3239]	Time 0.493 (0.523)	Data 0.001 (0.018)	Loss 5.0175 (5.1864)	Top-1 acc 12.891 (10.917)	Top-5 acc 30.859 (26.664)	lr 0.04075
Warmup Train [12][1060/3239]	Time 0.498 (0.523)	Data 0.001 (0.017)	Loss 5.1790 (5.1869)	Top-1 acc 10.938 (10.904)	Top-5 acc 28.906 (26.654)	lr 0.04074
Warmup Train [12][1070/3239]	Time 0.659 (0.523)	Data 0.001 (0.017)	Loss 5.1557 (5.1867)	Top-1 acc 10.938 (10.904)	Top-5 acc 27.344 (26.661)	lr 0.04074
Warmup Train [12][1080/3239]	Time 0.572 (0.523)	Data 0.001 (0.017)	Loss 5.2308 (5.1871)	Top-1 acc 9.375 (10.903)	Top-5 acc 23.828 (26.656)	lr 0.04073
Warmup Train [12][1090/3239]	Time 0.568 (0.523)	Data 0.001 (0.017)	Loss 5.2844 (5.1869)	Top-1 acc 12.109 (10.905)	Top-5 acc 26.562 (26.667)	lr 0.04073
Warmup Train [12][1100/3239]	Time 0.482 (0.523)	Data 0.001 (0.017)	Loss 5.1196 (5.1864)	Top-1 acc 11.719 (10.917)	Top-5 acc 26.953 (26.676)	lr 0.04072
Warmup Train [12][1110/3239]	Time 0.652 (0.523)	Data 0.001 (0.017)	Loss 5.1727 (5.1861)	Top-1 acc 11.719 (10.922)	Top-5 acc 30.078 (26.695)	lr 0.04072
Warmup Train [12][1120/3239]	Time 0.723 (0.523)	Data 0.001 (0.017)	Loss 5.0735 (5.1857)	Top-1 acc 11.719 (10.924)	Top-5 acc 30.469 (26.698)	lr 0.04071
Warmup Train [12][1130/3239]	Time 0.668 (0.523)	Data 0.001 (0.017)	Loss 5.2089 (5.1857)	Top-1 acc 12.109 (10.922)	Top-5 acc 27.734 (26.697)	lr 0.04071
Warmup Train [12][1140/3239]	Time 0.491 (0.523)	Data 0.001 (0.017)	Loss 5.1475 (5.1852)	Top-1 acc 11.719 (10.926)	Top-5 acc 25.781 (26.708)	lr 0.04070
Warmup Train [12][1150/3239]	Time 0.379 (0.523)	Data 0.001 (0.016)	Loss 5.2692 (5.1852)	Top-1 acc 9.766 (10.929)	Top-5 acc 25.391 (26.708)	lr 0.04070
Warmup Train [12][1160/3239]	Time 0.484 (0.523)	Data 0.001 (0.016)	Loss 5.1831 (5.1851)	Top-1 acc 10.938 (10.934)	Top-5 acc 24.219 (26.697)	lr 0.04070
Warmup Train [12][1170/3239]	Time 0.574 (0.523)	Data 0.003 (0.016)	Loss 5.1269 (5.1848)	Top-1 acc 12.891 (10.935)	Top-5 acc 28.125 (26.704)	lr 0.04069
Warmup Train [12][1180/3239]	Time 0.525 (0.523)	Data 0.001 (0.016)	Loss 5.1646 (5.1845)	Top-1 acc 14.844 (10.934)	Top-5 acc 26.562 (26.701)	lr 0.04069
Warmup Train [12][1190/3239]	Time 0.467 (0.523)	Data 0.001 (0.016)	Loss 5.1712 (5.1842)	Top-1 acc 12.500 (10.944)	Top-5 acc 28.125 (26.718)	lr 0.04068
Warmup Train [12][1200/3239]	Time 0.426 (0.523)	Data 0.001 (0.016)	Loss 5.2241 (5.1842)	Top-1 acc 12.109 (10.942)	Top-5 acc 25.781 (26.713)	lr 0.04068
Warmup Train [12][1210/3239]	Time 0.479 (0.522)	Data 0.001 (0.016)	Loss 5.2858 (5.1842)	Top-1 acc 9.766 (10.948)	Top-5 acc 24.609 (26.717)	lr 0.04067
Warmup Train [12][1220/3239]	Time 0.619 (0.523)	Data 0.001 (0.016)	Loss 5.0564 (5.1836)	Top-1 acc 11.328 (10.953)	Top-5 acc 28.125 (26.730)	lr 0.04067
Warmup Train [12][1230/3239]	Time 0.541 (0.522)	Data 0.001 (0.016)	Loss 5.0913 (5.1833)	Top-1 acc 12.109 (10.955)	Top-5 acc 27.734 (26.748)	lr 0.04066
Warmup Train [12][1240/3239]	Time 0.528 (0.522)	Data 0.001 (0.016)	Loss 5.2193 (5.1828)	Top-1 acc 10.156 (10.962)	Top-5 acc 26.172 (26.762)	lr 0.04066
Warmup Train [12][1250/3239]	Time 0.558 (0.522)	Data 0.001 (0.016)	Loss 5.2378 (5.1829)	Top-1 acc 13.672 (10.960)	Top-5 acc 28.516 (26.760)	lr 0.04065
Warmup Train [12][1260/3239]	Time 0.238 (0.522)	Data 0.001 (0.016)	Loss 5.2533 (5.1830)	Top-1 acc 13.281 (10.958)	Top-5 acc 28.516 (26.763)	lr 0.04065
Warmup Train [12][1270/3239]	Time 0.556 (0.521)	Data 0.001 (0.016)	Loss 5.1107 (5.1829)	Top-1 acc 11.719 (10.964)	Top-5 acc 23.828 (26.760)	lr 0.04064
Warmup Train [12][1280/3239]	Time 0.284 (0.521)	Data 0.001 (0.016)	Loss 5.0716 (5.1826)	Top-1 acc 12.109 (10.971)	Top-5 acc 31.641 (26.768)	lr 0.04064
Warmup Train [12][1290/3239]	Time 0.511 (0.521)	Data 0.001 (0.016)	Loss 5.2809 (5.1830)	Top-1 acc 8.594 (10.965)	Top-5 acc 24.609 (26.759)	lr 0.04063
Warmup Train [12][1300/3239]	Time 0.498 (0.521)	Data 0.001 (0.015)	Loss 5.2249 (5.1830)	Top-1 acc 10.938 (10.960)	Top-5 acc 24.219 (26.757)	lr 0.04063
Warmup Train [12][1310/3239]	Time 0.537 (0.520)	Data 0.001 (0.015)	Loss 5.1599 (5.1831)	Top-1 acc 11.719 (10.965)	Top-5 acc 27.344 (26.759)	lr 0.04062
Warmup Train [12][1320/3239]	Time 0.603 (0.520)	Data 0.001 (0.015)	Loss 5.1712 (5.1832)	Top-1 acc 9.375 (10.961)	Top-5 acc 26.562 (26.759)	lr 0.04062
Warmup Train [12][1330/3239]	Time 0.571 (0.520)	Data 0.001 (0.015)	Loss 4.9923 (5.1829)	Top-1 acc 12.891 (10.959)	Top-5 acc 32.422 (26.759)	lr 0.04061
Warmup Train [12][1340/3239]	Time 0.514 (0.521)	Data 0.001 (0.015)	Loss 5.1770 (5.1827)	Top-1 acc 13.281 (10.963)	Top-5 acc 30.469 (26.764)	lr 0.04061
Warmup Train [12][1350/3239]	Time 0.500 (0.520)	Data 0.001 (0.015)	Loss 5.2468 (5.1827)	Top-1 acc 8.984 (10.960)	Top-5 acc 27.734 (26.761)	lr 0.04061
Warmup Train [12][1360/3239]	Time 0.411 (0.520)	Data 0.001 (0.015)	Loss 5.2016 (5.1827)	Top-1 acc 9.375 (10.955)	Top-5 acc 26.172 (26.762)	lr 0.04060
Warmup Train [12][1370/3239]	Time 0.394 (0.520)	Data 0.001 (0.015)	Loss 5.1954 (5.1826)	Top-1 acc 7.812 (10.947)	Top-5 acc 25.000 (26.758)	lr 0.04060
Warmup Train [12][1380/3239]	Time 0.365 (0.520)	Data 0.001 (0.015)	Loss 5.1831 (5.1824)	Top-1 acc 12.891 (10.952)	Top-5 acc 27.344 (26.763)	lr 0.04059
Warmup Train [12][1390/3239]	Time 0.510 (0.520)	Data 0.001 (0.015)	Loss 5.1789 (5.1823)	Top-1 acc 13.672 (10.959)	Top-5 acc 28.906 (26.769)	lr 0.04059
Warmup Train [12][1400/3239]	Time 0.393 (0.520)	Data 0.001 (0.015)	Loss 5.3663 (5.1823)	Top-1 acc 10.156 (10.960)	Top-5 acc 26.562 (26.768)	lr 0.04058
Warmup Train [12][1410/3239]	Time 0.681 (0.520)	Data 0.001 (0.015)	Loss 5.1869 (5.1822)	Top-1 acc 8.594 (10.963)	Top-5 acc 27.734 (26.772)	lr 0.04058
Warmup Train [12][1420/3239]	Time 0.342 (0.520)	Data 0.001 (0.015)	Loss 5.1327 (5.1820)	Top-1 acc 8.984 (10.962)	Top-5 acc 24.219 (26.769)	lr 0.04057
Warmup Train [12][1430/3239]	Time 0.506 (0.520)	Data 0.001 (0.015)	Loss 5.0686 (5.1820)	Top-1 acc 12.891 (10.964)	Top-5 acc 30.469 (26.772)	lr 0.04057
Warmup Train [12][1440/3239]	Time 0.408 (0.520)	Data 0.001 (0.015)	Loss 5.1797 (5.1820)	Top-1 acc 10.938 (10.971)	Top-5 acc 25.781 (26.774)	lr 0.04056
Warmup Train [12][1450/3239]	Time 0.506 (0.520)	Data 0.001 (0.015)	Loss 5.1582 (5.1819)	Top-1 acc 12.891 (10.975)	Top-5 acc 27.734 (26.782)	lr 0.04056
Warmup Train [12][1460/3239]	Time 0.401 (0.520)	Data 0.001 (0.015)	Loss 5.2791 (5.1818)	Top-1 acc 8.203 (10.973)	Top-5 acc 26.562 (26.783)	lr 0.04055
Warmup Train [12][1470/3239]	Time 0.578 (0.520)	Data 0.001 (0.015)	Loss 5.1211 (5.1816)	Top-1 acc 12.891 (10.978)	Top-5 acc 27.344 (26.777)	lr 0.04055
Warmup Train [12][1480/3239]	Time 0.378 (0.520)	Data 0.001 (0.014)	Loss 5.1343 (5.1818)	Top-1 acc 9.375 (10.969)	Top-5 acc 25.000 (26.771)	lr 0.04054
Warmup Train [12][1490/3239]	Time 0.381 (0.520)	Data 0.001 (0.014)	Loss 5.3588 (5.1819)	Top-1 acc 7.422 (10.972)	Top-5 acc 21.875 (26.768)	lr 0.04054
Warmup Train [12][1500/3239]	Time 0.362 (0.520)	Data 0.001 (0.014)	Loss 5.0436 (5.1817)	Top-1 acc 14.062 (10.975)	Top-5 acc 31.641 (26.771)	lr 0.04053
Warmup Train [12][1510/3239]	Time 0.481 (0.519)	Data 0.001 (0.014)	Loss 5.0541 (5.1816)	Top-1 acc 14.062 (10.972)	Top-5 acc 31.250 (26.768)	lr 0.04053
Warmup Train [12][1520/3239]	Time 0.489 (0.519)	Data 0.001 (0.014)	Loss 4.9717 (5.1815)	Top-1 acc 12.109 (10.975)	Top-5 acc 32.422 (26.774)	lr 0.04052
Warmup Train [12][1530/3239]	Time 0.629 (0.519)	Data 0.001 (0.014)	Loss 5.0875 (5.1813)	Top-1 acc 11.328 (10.967)	Top-5 acc 30.078 (26.781)	lr 0.04052
Warmup Train [12][1540/3239]	Time 0.367 (0.519)	Data 0.001 (0.014)	Loss 5.1555 (5.1809)	Top-1 acc 9.766 (10.971)	Top-5 acc 26.953 (26.795)	lr 0.04052
Warmup Train [12][1550/3239]	Time 0.618 (0.519)	Data 0.001 (0.014)	Loss 5.1917 (5.1810)	Top-1 acc 12.500 (10.969)	Top-5 acc 23.828 (26.794)	lr 0.04051
Warmup Train [12][1560/3239]	Time 0.437 (0.519)	Data 0.001 (0.014)	Loss 5.2154 (5.1810)	Top-1 acc 11.719 (10.964)	Top-5 acc 26.562 (26.798)	lr 0.04051
Warmup Train [12][1570/3239]	Time 0.451 (0.519)	Data 0.001 (0.014)	Loss 5.1140 (5.1807)	Top-1 acc 12.109 (10.969)	Top-5 acc 26.172 (26.804)	lr 0.04050
Warmup Train [12][1580/3239]	Time 0.490 (0.519)	Data 0.001 (0.014)	Loss 5.1411 (5.1807)	Top-1 acc 8.984 (10.969)	Top-5 acc 26.562 (26.801)	lr 0.04050
Warmup Train [12][1590/3239]	Time 0.567 (0.519)	Data 0.001 (0.014)	Loss 5.2491 (5.1807)	Top-1 acc 9.766 (10.971)	Top-5 acc 25.000 (26.799)	lr 0.04049
Warmup Train [12][1600/3239]	Time 0.611 (0.519)	Data 0.001 (0.014)	Loss 5.2764 (5.1806)	Top-1 acc 12.891 (10.973)	Top-5 acc 26.953 (26.800)	lr 0.04049
Warmup Train [12][1610/3239]	Time 0.492 (0.519)	Data 0.001 (0.014)	Loss 5.0455 (5.1807)	Top-1 acc 12.891 (10.970)	Top-5 acc 30.078 (26.796)	lr 0.04048
Warmup Train [12][1620/3239]	Time 0.509 (0.519)	Data 0.001 (0.014)	Loss 5.1048 (5.1808)	Top-1 acc 12.500 (10.969)	Top-5 acc 29.688 (26.796)	lr 0.04048
Warmup Train [12][1630/3239]	Time 0.635 (0.519)	Data 0.001 (0.014)	Loss 5.1847 (5.1809)	Top-1 acc 8.594 (10.973)	Top-5 acc 22.266 (26.794)	lr 0.04047
Warmup Train [12][1640/3239]	Time 0.767 (0.519)	Data 0.001 (0.014)	Loss 5.3621 (5.1811)	Top-1 acc 9.375 (10.973)	Top-5 acc 22.656 (26.796)	lr 0.04047
Warmup Train [12][1650/3239]	Time 0.541 (0.519)	Data 0.001 (0.014)	Loss 5.0498 (5.1810)	Top-1 acc 13.281 (10.977)	Top-5 acc 29.688 (26.794)	lr 0.04046
Warmup Train [12][1660/3239]	Time 0.433 (0.519)	Data 0.001 (0.014)	Loss 5.1504 (5.1811)	Top-1 acc 11.328 (10.978)	Top-5 acc 26.562 (26.795)	lr 0.04046
Warmup Train [12][1670/3239]	Time 0.576 (0.519)	Data 0.001 (0.014)	Loss 5.3138 (5.1810)	Top-1 acc 9.375 (10.981)	Top-5 acc 25.391 (26.801)	lr 0.04045
Warmup Train [12][1680/3239]	Time 0.431 (0.519)	Data 0.001 (0.014)	Loss 4.9972 (5.1809)	Top-1 acc 12.500 (10.979)	Top-5 acc 31.250 (26.812)	lr 0.04045
Warmup Train [12][1690/3239]	Time 0.493 (0.519)	Data 0.001 (0.014)	Loss 5.0928 (5.1806)	Top-1 acc 11.328 (10.984)	Top-5 acc 29.297 (26.820)	lr 0.04044
Warmup Train [12][1700/3239]	Time 0.588 (0.519)	Data 0.001 (0.013)	Loss 5.1107 (5.1804)	Top-1 acc 13.281 (10.992)	Top-5 acc 30.859 (26.831)	lr 0.04044
Warmup Train [12][1710/3239]	Time 0.568 (0.519)	Data 0.001 (0.013)	Loss 5.1898 (5.1805)	Top-1 acc 11.328 (10.989)	Top-5 acc 29.297 (26.833)	lr 0.04043
Warmup Train [12][1720/3239]	Time 0.517 (0.519)	Data 0.001 (0.013)	Loss 5.1223 (5.1804)	Top-1 acc 13.281 (10.990)	Top-5 acc 27.734 (26.836)	lr 0.04043
Warmup Train [12][1730/3239]	Time 0.635 (0.519)	Data 0.001 (0.013)	Loss 5.1619 (5.1801)	Top-1 acc 12.891 (10.999)	Top-5 acc 27.734 (26.845)	lr 0.04042
Warmup Train [12][1740/3239]	Time 0.577 (0.518)	Data 0.001 (0.013)	Loss 5.4888 (5.1801)	Top-1 acc 7.812 (10.996)	Top-5 acc 19.922 (26.841)	lr 0.04042
Warmup Train [12][1750/3239]	Time 0.702 (0.519)	Data 0.001 (0.013)	Loss 5.0622 (5.1797)	Top-1 acc 14.844 (10.997)	Top-5 acc 35.156 (26.849)	lr 0.04042
Warmup Train [12][1760/3239]	Time 0.442 (0.518)	Data 0.001 (0.013)	Loss 5.0827 (5.1798)	Top-1 acc 14.062 (10.999)	Top-5 acc 26.172 (26.846)	lr 0.04041
Warmup Train [12][1770/3239]	Time 0.316 (0.518)	Data 0.001 (0.013)	Loss 5.1021 (5.1797)	Top-1 acc 11.719 (10.995)	Top-5 acc 29.297 (26.851)	lr 0.04041
Warmup Train [12][1780/3239]	Time 0.553 (0.518)	Data 0.001 (0.013)	Loss 5.2039 (5.1795)	Top-1 acc 12.109 (10.997)	Top-5 acc 29.297 (26.856)	lr 0.04040
Warmup Train [12][1790/3239]	Time 0.458 (0.518)	Data 0.001 (0.013)	Loss 5.2232 (5.1795)	Top-1 acc 12.109 (11.001)	Top-5 acc 27.344 (26.863)	lr 0.04040
Warmup Train [12][1800/3239]	Time 0.268 (0.518)	Data 0.001 (0.013)	Loss 5.0469 (5.1790)	Top-1 acc 10.547 (11.002)	Top-5 acc 25.781 (26.869)	lr 0.04039
Warmup Train [12][1810/3239]	Time 0.475 (0.518)	Data 0.001 (0.013)	Loss 5.1726 (5.1788)	Top-1 acc 11.328 (11.010)	Top-5 acc 30.469 (26.882)	lr 0.04039
Warmup Train [12][1820/3239]	Time 0.510 (0.518)	Data 0.001 (0.013)	Loss 5.0085 (5.1786)	Top-1 acc 13.281 (11.012)	Top-5 acc 31.250 (26.881)	lr 0.04038
Warmup Train [12][1830/3239]	Time 0.464 (0.518)	Data 0.001 (0.013)	Loss 5.2154 (5.1783)	Top-1 acc 10.547 (11.019)	Top-5 acc 26.562 (26.896)	lr 0.04038
Warmup Train [12][1840/3239]	Time 0.350 (0.518)	Data 0.001 (0.013)	Loss 5.1983 (5.1784)	Top-1 acc 8.203 (11.016)	Top-5 acc 23.438 (26.893)	lr 0.04037
Warmup Train [12][1850/3239]	Time 0.515 (0.518)	Data 0.001 (0.013)	Loss 5.0312 (5.1781)	Top-1 acc 11.719 (11.017)	Top-5 acc 29.688 (26.902)	lr 0.04037
Warmup Train [12][1860/3239]	Time 0.584 (0.518)	Data 0.001 (0.013)	Loss 5.2839 (5.1781)	Top-1 acc 11.328 (11.019)	Top-5 acc 23.438 (26.903)	lr 0.04036
Warmup Train [12][1870/3239]	Time 0.381 (0.518)	Data 0.001 (0.013)	Loss 5.1406 (5.1779)	Top-1 acc 11.328 (11.018)	Top-5 acc 30.469 (26.905)	lr 0.04036
Warmup Train [12][1880/3239]	Time 0.449 (0.518)	Data 0.001 (0.013)	Loss 5.0905 (5.1779)	Top-1 acc 12.891 (11.023)	Top-5 acc 28.516 (26.909)	lr 0.04035
Warmup Train [12][1890/3239]	Time 0.506 (0.518)	Data 0.001 (0.013)	Loss 5.2614 (5.1776)	Top-1 acc 9.375 (11.027)	Top-5 acc 24.609 (26.911)	lr 0.04035
Warmup Train [12][1900/3239]	Time 0.491 (0.518)	Data 0.001 (0.013)	Loss 5.1641 (5.1774)	Top-1 acc 10.938 (11.034)	Top-5 acc 27.344 (26.919)	lr 0.04034
Warmup Train [12][1910/3239]	Time 0.474 (0.518)	Data 0.001 (0.013)	Loss 5.1682 (5.1770)	Top-1 acc 11.719 (11.040)	Top-5 acc 29.297 (26.932)	lr 0.04034
Warmup Train [12][1920/3239]	Time 0.596 (0.518)	Data 0.001 (0.013)	Loss 5.1779 (5.1769)	Top-1 acc 10.938 (11.042)	Top-5 acc 27.344 (26.939)	lr 0.04033
Warmup Train [12][1930/3239]	Time 0.335 (0.518)	Data 0.001 (0.013)	Loss 5.2876 (5.1769)	Top-1 acc 10.156 (11.042)	Top-5 acc 23.047 (26.937)	lr 0.04033
Warmup Train [12][1940/3239]	Time 0.332 (0.517)	Data 0.001 (0.013)	Loss 5.1819 (5.1767)	Top-1 acc 11.719 (11.048)	Top-5 acc 28.906 (26.947)	lr 0.04032
Warmup Train [12][1950/3239]	Time 0.444 (0.517)	Data 0.001 (0.013)	Loss 5.1219 (5.1764)	Top-1 acc 14.062 (11.050)	Top-5 acc 30.859 (26.955)	lr 0.04032
Warmup Train [12][1960/3239]	Time 0.600 (0.518)	Data 0.005 (0.013)	Loss 5.2458 (5.1762)	Top-1 acc 9.375 (11.056)	Top-5 acc 25.391 (26.962)	lr 0.04032
Warmup Train [12][1970/3239]	Time 0.559 (0.518)	Data 0.001 (0.013)	Loss 5.1590 (5.1761)	Top-1 acc 12.109 (11.058)	Top-5 acc 29.297 (26.966)	lr 0.04031
Warmup Train [12][1980/3239]	Time 0.481 (0.518)	Data 0.001 (0.013)	Loss 5.0736 (5.1761)	Top-1 acc 12.891 (11.062)	Top-5 acc 30.078 (26.973)	lr 0.04031
Warmup Train [12][1990/3239]	Time 0.518 (0.518)	Data 0.001 (0.013)	Loss 5.2191 (5.1762)	Top-1 acc 12.109 (11.061)	Top-5 acc 28.906 (26.973)	lr 0.04030
Warmup Train [12][2000/3239]	Time 0.468 (0.518)	Data 0.001 (0.013)	Loss 5.0271 (5.1757)	Top-1 acc 13.281 (11.071)	Top-5 acc 29.688 (26.985)	lr 0.04030
Warmup Train [12][2010/3239]	Time 0.413 (0.518)	Data 0.001 (0.013)	Loss 5.2196 (5.1756)	Top-1 acc 12.109 (11.073)	Top-5 acc 27.734 (26.993)	lr 0.04029
Warmup Train [12][2020/3239]	Time 0.393 (0.518)	Data 0.001 (0.013)	Loss 5.3161 (5.1754)	Top-1 acc 8.203 (11.074)	Top-5 acc 20.312 (26.996)	lr 0.04029
Warmup Train [12][2030/3239]	Time 0.404 (0.518)	Data 0.001 (0.013)	Loss 4.9404 (5.1750)	Top-1 acc 15.234 (11.079)	Top-5 acc 32.812 (27.008)	lr 0.04028
Warmup Train [12][2040/3239]	Time 0.494 (0.517)	Data 0.001 (0.012)	Loss 5.2425 (5.1749)	Top-1 acc 6.250 (11.079)	Top-5 acc 25.000 (27.010)	lr 0.04028
Warmup Train [12][2050/3239]	Time 0.385 (0.517)	Data 0.001 (0.012)	Loss 5.1170 (5.1747)	Top-1 acc 8.203 (11.078)	Top-5 acc 26.562 (27.017)	lr 0.04027
Warmup Train [12][2060/3239]	Time 0.350 (0.517)	Data 0.001 (0.012)	Loss 5.0979 (5.1744)	Top-1 acc 10.547 (11.083)	Top-5 acc 28.125 (27.022)	lr 0.04027
Warmup Train [12][2070/3239]	Time 0.402 (0.517)	Data 0.001 (0.012)	Loss 5.0433 (5.1742)	Top-1 acc 15.234 (11.084)	Top-5 acc 28.516 (27.020)	lr 0.04026
Warmup Train [12][2080/3239]	Time 0.614 (0.517)	Data 0.001 (0.012)	Loss 4.9684 (5.1741)	Top-1 acc 14.062 (11.087)	Top-5 acc 32.422 (27.021)	lr 0.04026
Warmup Train [12][2090/3239]	Time 0.494 (0.517)	Data 0.001 (0.012)	Loss 4.9721 (5.1739)	Top-1 acc 15.234 (11.085)	Top-5 acc 33.984 (27.023)	lr 0.04025
Warmup Train [12][2100/3239]	Time 0.531 (0.517)	Data 0.001 (0.012)	Loss 5.2224 (5.1739)	Top-1 acc 9.766 (11.085)	Top-5 acc 23.828 (27.022)	lr 0.04025
Warmup Train [12][2110/3239]	Time 0.517 (0.517)	Data 0.001 (0.012)	Loss 5.3060 (5.1737)	Top-1 acc 10.547 (11.088)	Top-5 acc 25.391 (27.027)	lr 0.04024
Warmup Train [12][2120/3239]	Time 0.450 (0.517)	Data 0.001 (0.012)	Loss 4.9808 (5.1733)	Top-1 acc 17.188 (11.097)	Top-5 acc 33.203 (27.039)	lr 0.04024
Warmup Train [12][2130/3239]	Time 0.586 (0.517)	Data 0.001 (0.012)	Loss 5.2139 (5.1731)	Top-1 acc 8.594 (11.098)	Top-5 acc 28.125 (27.046)	lr 0.04023
Warmup Train [12][2140/3239]	Time 0.650 (0.517)	Data 0.001 (0.012)	Loss 5.0430 (5.1728)	Top-1 acc 11.328 (11.100)	Top-5 acc 26.562 (27.051)	lr 0.04023
Warmup Train [12][2150/3239]	Time 0.582 (0.517)	Data 0.001 (0.012)	Loss 5.1621 (5.1727)	Top-1 acc 11.719 (11.102)	Top-5 acc 29.688 (27.056)	lr 0.04022
Warmup Train [12][2160/3239]	Time 0.486 (0.517)	Data 0.001 (0.012)	Loss 5.1618 (5.1724)	Top-1 acc 10.156 (11.105)	Top-5 acc 26.562 (27.063)	lr 0.04022
Warmup Train [12][2170/3239]	Time 0.615 (0.517)	Data 0.001 (0.012)	Loss 5.0535 (5.1723)	Top-1 acc 9.375 (11.102)	Top-5 acc 26.953 (27.066)	lr 0.04021
Warmup Train [12][2180/3239]	Time 0.516 (0.517)	Data 0.001 (0.012)	Loss 5.1974 (5.1721)	Top-1 acc 10.547 (11.105)	Top-5 acc 26.953 (27.069)	lr 0.04021
Warmup Train [12][2190/3239]	Time 0.601 (0.517)	Data 0.001 (0.012)	Loss 5.1157 (5.1720)	Top-1 acc 13.281 (11.109)	Top-5 acc 28.516 (27.073)	lr 0.04020
Warmup Train [12][2200/3239]	Time 0.605 (0.517)	Data 0.001 (0.012)	Loss 5.3099 (5.1719)	Top-1 acc 9.375 (11.108)	Top-5 acc 24.219 (27.077)	lr 0.04020
Warmup Train [12][2210/3239]	Time 0.573 (0.517)	Data 0.001 (0.012)	Loss 5.1860 (5.1717)	Top-1 acc 8.984 (11.108)	Top-5 acc 28.125 (27.084)	lr 0.04019
Warmup Train [12][2220/3239]	Time 0.354 (0.516)	Data 0.001 (0.012)	Loss 5.1725 (5.1718)	Top-1 acc 13.672 (11.106)	Top-5 acc 29.297 (27.083)	lr 0.04019
Warmup Train [12][2230/3239]	Time 0.518 (0.517)	Data 0.001 (0.012)	Loss 5.0796 (5.1717)	Top-1 acc 12.109 (11.109)	Top-5 acc 25.391 (27.082)	lr 0.04019
Warmup Train [12][2240/3239]	Time 0.458 (0.517)	Data 0.001 (0.012)	Loss 5.1603 (5.1714)	Top-1 acc 14.453 (11.115)	Top-5 acc 28.516 (27.090)	lr 0.04018
Warmup Train [12][2250/3239]	Time 0.505 (0.517)	Data 0.001 (0.012)	Loss 5.0956 (5.1711)	Top-1 acc 12.500 (11.122)	Top-5 acc 32.422 (27.102)	lr 0.04018
Warmup Train [12][2260/3239]	Time 0.659 (0.517)	Data 0.001 (0.012)	Loss 5.1059 (5.1710)	Top-1 acc 14.453 (11.123)	Top-5 acc 29.688 (27.103)	lr 0.04017
Warmup Train [12][2270/3239]	Time 0.362 (0.516)	Data 0.001 (0.012)	Loss 5.1267 (5.1710)	Top-1 acc 10.938 (11.122)	Top-5 acc 26.562 (27.100)	lr 0.04017
Warmup Train [12][2280/3239]	Time 0.378 (0.516)	Data 0.001 (0.012)	Loss 5.3417 (5.1710)	Top-1 acc 8.594 (11.122)	Top-5 acc 21.094 (27.100)	lr 0.04016
Warmup Train [12][2290/3239]	Time 0.524 (0.516)	Data 0.001 (0.012)	Loss 5.0758 (5.1707)	Top-1 acc 13.281 (11.123)	Top-5 acc 29.297 (27.108)	lr 0.04016
Warmup Train [12][2300/3239]	Time 0.630 (0.516)	Data 0.001 (0.012)	Loss 5.2096 (5.1704)	Top-1 acc 10.547 (11.131)	Top-5 acc 24.219 (27.115)	lr 0.04015
Warmup Train [12][2310/3239]	Time 0.487 (0.516)	Data 0.001 (0.012)	Loss 5.1408 (5.1701)	Top-1 acc 10.156 (11.136)	Top-5 acc 27.344 (27.123)	lr 0.04015
Warmup Train [12][2320/3239]	Time 0.527 (0.516)	Data 0.026 (0.012)	Loss 4.9461 (5.1699)	Top-1 acc 13.672 (11.139)	Top-5 acc 33.594 (27.126)	lr 0.04014
Warmup Train [12][2330/3239]	Time 0.330 (0.516)	Data 0.001 (0.012)	Loss 5.1035 (5.1698)	Top-1 acc 11.328 (11.140)	Top-5 acc 29.688 (27.131)	lr 0.04014
Warmup Train [12][2340/3239]	Time 0.474 (0.516)	Data 0.001 (0.012)	Loss 5.2351 (5.1694)	Top-1 acc 10.547 (11.141)	Top-5 acc 20.703 (27.138)	lr 0.04013
Warmup Train [12][2350/3239]	Time 0.537 (0.516)	Data 0.001 (0.012)	Loss 5.3719 (5.1694)	Top-1 acc 9.766 (11.143)	Top-5 acc 27.734 (27.142)	lr 0.04013
Warmup Train [12][2360/3239]	Time 0.480 (0.516)	Data 0.001 (0.012)	Loss 4.9299 (5.1692)	Top-1 acc 14.062 (11.144)	Top-5 acc 27.734 (27.144)	lr 0.04012
Warmup Train [12][2370/3239]	Time 0.346 (0.516)	Data 0.001 (0.012)	Loss 5.2969 (5.1692)	Top-1 acc 10.156 (11.144)	Top-5 acc 26.562 (27.144)	lr 0.04012
Warmup Train [12][2380/3239]	Time 0.510 (0.516)	Data 0.001 (0.012)	Loss 5.1503 (5.1690)	Top-1 acc 12.891 (11.147)	Top-5 acc 31.250 (27.154)	lr 0.04011
Warmup Train [12][2390/3239]	Time 0.514 (0.516)	Data 0.001 (0.012)	Loss 5.2121 (5.1691)	Top-1 acc 10.547 (11.146)	Top-5 acc 26.172 (27.153)	lr 0.04011
Warmup Train [12][2400/3239]	Time 0.540 (0.516)	Data 0.001 (0.012)	Loss 5.1495 (5.1688)	Top-1 acc 13.281 (11.152)	Top-5 acc 28.125 (27.162)	lr 0.04010
Warmup Train [12][2410/3239]	Time 0.647 (0.516)	Data 0.001 (0.012)	Loss 5.1994 (5.1688)	Top-1 acc 13.672 (11.155)	Top-5 acc 27.344 (27.166)	lr 0.04010
Warmup Train [12][2420/3239]	Time 0.501 (0.516)	Data 0.001 (0.012)	Loss 5.0169 (5.1685)	Top-1 acc 12.109 (11.160)	Top-5 acc 30.859 (27.174)	lr 0.04009
Warmup Train [12][2430/3239]	Time 0.439 (0.516)	Data 0.001 (0.012)	Loss 5.1229 (5.1684)	Top-1 acc 10.156 (11.164)	Top-5 acc 27.734 (27.175)	lr 0.04009
Warmup Train [12][2440/3239]	Time 0.354 (0.516)	Data 0.001 (0.012)	Loss 4.9979 (5.1682)	Top-1 acc 16.797 (11.167)	Top-5 acc 33.984 (27.188)	lr 0.04008
Warmup Train [12][2450/3239]	Time 0.600 (0.516)	Data 0.001 (0.012)	Loss 5.0189 (5.1678)	Top-1 acc 14.844 (11.173)	Top-5 acc 32.812 (27.199)	lr 0.04008
Warmup Train [12][2460/3239]	Time 0.587 (0.516)	Data 0.001 (0.011)	Loss 5.1396 (5.1678)	Top-1 acc 10.547 (11.173)	Top-5 acc 25.391 (27.200)	lr 0.04007
Warmup Train [12][2470/3239]	Time 0.596 (0.516)	Data 0.001 (0.011)	Loss 5.1496 (5.1675)	Top-1 acc 14.062 (11.176)	Top-5 acc 30.859 (27.207)	lr 0.04007
Warmup Train [12][2480/3239]	Time 0.316 (0.516)	Data 0.001 (0.011)	Loss 5.1558 (5.1674)	Top-1 acc 10.547 (11.176)	Top-5 acc 25.391 (27.209)	lr 0.04006
Warmup Train [12][2490/3239]	Time 0.479 (0.516)	Data 0.001 (0.011)	Loss 5.0273 (5.1674)	Top-1 acc 13.672 (11.177)	Top-5 acc 28.906 (27.208)	lr 0.04006
Warmup Train [12][2500/3239]	Time 0.520 (0.516)	Data 0.001 (0.011)	Loss 5.0797 (5.1674)	Top-1 acc 12.891 (11.177)	Top-5 acc 26.953 (27.209)	lr 0.04006
Warmup Train [12][2510/3239]	Time 0.569 (0.516)	Data 0.001 (0.011)	Loss 5.0737 (5.1671)	Top-1 acc 15.625 (11.182)	Top-5 acc 27.734 (27.211)	lr 0.04005
Warmup Train [12][2520/3239]	Time 0.485 (0.516)	Data 0.001 (0.011)	Loss 5.1394 (5.1670)	Top-1 acc 13.672 (11.184)	Top-5 acc 30.469 (27.212)	lr 0.04005
Warmup Train [12][2530/3239]	Time 0.496 (0.516)	Data 0.001 (0.011)	Loss 5.1545 (5.1668)	Top-1 acc 10.547 (11.186)	Top-5 acc 28.516 (27.217)	lr 0.04004
Warmup Train [12][2540/3239]	Time 0.635 (0.516)	Data 0.001 (0.011)	Loss 5.2444 (5.1666)	Top-1 acc 8.984 (11.187)	Top-5 acc 21.875 (27.222)	lr 0.04004
Warmup Train [12][2550/3239]	Time 0.512 (0.516)	Data 0.001 (0.011)	Loss 5.1074 (5.1665)	Top-1 acc 12.891 (11.187)	Top-5 acc 28.125 (27.221)	lr 0.04003
Warmup Train [12][2560/3239]	Time 0.359 (0.516)	Data 0.001 (0.011)	Loss 5.3241 (5.1664)	Top-1 acc 7.422 (11.186)	Top-5 acc 21.094 (27.222)	lr 0.04003
Warmup Train [12][2570/3239]	Time 0.352 (0.516)	Data 0.001 (0.011)	Loss 5.2901 (5.1661)	Top-1 acc 9.766 (11.188)	Top-5 acc 25.000 (27.230)	lr 0.04002
Warmup Train [12][2580/3239]	Time 0.474 (0.516)	Data 0.001 (0.011)	Loss 4.9507 (5.1658)	Top-1 acc 14.844 (11.191)	Top-5 acc 32.812 (27.242)	lr 0.04002
Warmup Train [12][2590/3239]	Time 0.357 (0.515)	Data 0.001 (0.011)	Loss 5.1949 (5.1657)	Top-1 acc 11.719 (11.191)	Top-5 acc 28.906 (27.245)	lr 0.04001
Warmup Train [12][2600/3239]	Time 0.400 (0.515)	Data 0.001 (0.011)	Loss 4.9134 (5.1655)	Top-1 acc 15.625 (11.197)	Top-5 acc 35.547 (27.254)	lr 0.04001
Warmup Train [12][2610/3239]	Time 0.382 (0.515)	Data 0.002 (0.011)	Loss 5.1101 (5.1651)	Top-1 acc 11.719 (11.207)	Top-5 acc 31.250 (27.261)	lr 0.04000
Warmup Train [12][2620/3239]	Time 0.304 (0.515)	Data 0.001 (0.011)	Loss 5.2521 (5.1649)	Top-1 acc 9.766 (11.211)	Top-5 acc 25.781 (27.270)	lr 0.04000
Warmup Train [12][2630/3239]	Time 0.221 (0.514)	Data 0.001 (0.011)	Loss 5.1826 (5.1646)	Top-1 acc 16.016 (11.218)	Top-5 acc 29.688 (27.277)	lr 0.03999
Warmup Train [12][2640/3239]	Time 0.446 (0.514)	Data 0.001 (0.011)	Loss 5.2673 (5.1647)	Top-1 acc 8.984 (11.218)	Top-5 acc 26.953 (27.275)	lr 0.03999
Warmup Train [12][2650/3239]	Time 0.563 (0.514)	Data 0.001 (0.011)	Loss 5.1113 (5.1647)	Top-1 acc 12.500 (11.216)	Top-5 acc 28.906 (27.273)	lr 0.03998
Warmup Train [12][2660/3239]	Time 0.498 (0.514)	Data 0.001 (0.011)	Loss 5.0754 (5.1645)	Top-1 acc 11.719 (11.220)	Top-5 acc 30.078 (27.275)	lr 0.03998
Warmup Train [12][2670/3239]	Time 0.529 (0.514)	Data 0.001 (0.011)	Loss 5.0096 (5.1644)	Top-1 acc 14.062 (11.222)	Top-5 acc 30.078 (27.273)	lr 0.03997
Warmup Train [12][2680/3239]	Time 0.407 (0.514)	Data 0.001 (0.011)	Loss 5.1315 (5.1642)	Top-1 acc 12.891 (11.226)	Top-5 acc 26.953 (27.275)	lr 0.03997
Warmup Train [12][2690/3239]	Time 0.545 (0.514)	Data 0.001 (0.011)	Loss 4.8920 (5.1638)	Top-1 acc 17.188 (11.232)	Top-5 acc 33.984 (27.284)	lr 0.03996
Warmup Train [12][2700/3239]	Time 0.612 (0.514)	Data 0.001 (0.011)	Loss 5.0711 (5.1637)	Top-1 acc 9.766 (11.232)	Top-5 acc 28.125 (27.288)	lr 0.03996
Warmup Train [12][2710/3239]	Time 0.549 (0.514)	Data 0.001 (0.011)	Loss 4.9477 (5.1635)	Top-1 acc 15.625 (11.234)	Top-5 acc 32.031 (27.297)	lr 0.03995
Warmup Train [12][2720/3239]	Time 0.707 (0.514)	Data 0.001 (0.011)	Loss 5.1673 (5.1633)	Top-1 acc 9.766 (11.236)	Top-5 acc 29.297 (27.302)	lr 0.03995
Warmup Train [12][2730/3239]	Time 0.445 (0.514)	Data 0.001 (0.011)	Loss 5.0980 (5.1631)	Top-1 acc 11.719 (11.238)	Top-5 acc 30.859 (27.305)	lr 0.03994
Warmup Train [12][2740/3239]	Time 0.436 (0.514)	Data 0.001 (0.011)	Loss 5.2228 (5.1631)	Top-1 acc 13.281 (11.237)	Top-5 acc 28.125 (27.307)	lr 0.03994
Warmup Train [12][2750/3239]	Time 0.516 (0.514)	Data 0.001 (0.011)	Loss 5.0118 (5.1629)	Top-1 acc 11.719 (11.238)	Top-5 acc 29.688 (27.312)	lr 0.03993
Warmup Train [12][2760/3239]	Time 0.519 (0.514)	Data 0.001 (0.011)	Loss 4.9828 (5.1627)	Top-1 acc 12.891 (11.242)	Top-5 acc 32.031 (27.317)	lr 0.03993
Warmup Train [12][2770/3239]	Time 0.497 (0.514)	Data 0.001 (0.011)	Loss 5.0987 (5.1625)	Top-1 acc 11.328 (11.245)	Top-5 acc 32.422 (27.329)	lr 0.03992
Warmup Train [12][2780/3239]	Time 0.504 (0.514)	Data 0.001 (0.011)	Loss 5.1634 (5.1623)	Top-1 acc 9.766 (11.248)	Top-5 acc 24.609 (27.331)	lr 0.03992
Warmup Train [12][2790/3239]	Time 0.347 (0.513)	Data 0.001 (0.011)	Loss 5.3598 (5.1624)	Top-1 acc 7.812 (11.245)	Top-5 acc 25.000 (27.329)	lr 0.03991
Warmup Train [12][2800/3239]	Time 0.517 (0.514)	Data 0.001 (0.011)	Loss 5.1174 (5.1623)	Top-1 acc 15.234 (11.248)	Top-5 acc 29.688 (27.332)	lr 0.03991
Warmup Train [12][2810/3239]	Time 0.478 (0.514)	Data 0.001 (0.011)	Loss 5.1862 (5.1620)	Top-1 acc 10.547 (11.248)	Top-5 acc 25.391 (27.338)	lr 0.03990
Warmup Train [12][2820/3239]	Time 0.553 (0.513)	Data 0.001 (0.011)	Loss 5.0484 (5.1621)	Top-1 acc 13.672 (11.249)	Top-5 acc 31.641 (27.339)	lr 0.03990
Warmup Train [12][2830/3239]	Time 0.561 (0.513)	Data 0.001 (0.011)	Loss 5.1075 (5.1618)	Top-1 acc 11.719 (11.253)	Top-5 acc 29.688 (27.349)	lr 0.03989
Warmup Train [12][2840/3239]	Time 0.534 (0.513)	Data 0.001 (0.011)	Loss 5.0906 (5.1617)	Top-1 acc 10.938 (11.252)	Top-5 acc 28.516 (27.350)	lr 0.03989
Warmup Train [12][2850/3239]	Time 0.630 (0.513)	Data 0.001 (0.011)	Loss 5.0477 (5.1615)	Top-1 acc 14.062 (11.256)	Top-5 acc 31.641 (27.357)	lr 0.03989
Warmup Train [12][2860/3239]	Time 0.362 (0.513)	Data 0.001 (0.011)	Loss 5.2018 (5.1614)	Top-1 acc 10.156 (11.258)	Top-5 acc 26.562 (27.362)	lr 0.03988
Warmup Train [12][2870/3239]	Time 0.710 (0.514)	Data 0.001 (0.011)	Loss 5.0104 (5.1612)	Top-1 acc 9.375 (11.259)	Top-5 acc 28.906 (27.365)	lr 0.03988
Warmup Train [12][2880/3239]	Time 0.460 (0.513)	Data 0.001 (0.011)	Loss 5.2788 (5.1612)	Top-1 acc 9.766 (11.261)	Top-5 acc 24.219 (27.365)	lr 0.03987
Warmup Train [12][2890/3239]	Time 0.518 (0.513)	Data 0.001 (0.011)	Loss 5.0954 (5.1610)	Top-1 acc 8.203 (11.263)	Top-5 acc 27.344 (27.370)	lr 0.03987
Warmup Train [12][2900/3239]	Time 0.488 (0.513)	Data 0.001 (0.011)	Loss 5.1696 (5.1609)	Top-1 acc 10.938 (11.265)	Top-5 acc 26.562 (27.373)	lr 0.03986
Warmup Train [12][2910/3239]	Time 0.361 (0.513)	Data 0.001 (0.011)	Loss 5.2516 (5.1606)	Top-1 acc 6.641 (11.265)	Top-5 acc 23.828 (27.377)	lr 0.03986
Warmup Train [12][2920/3239]	Time 0.403 (0.513)	Data 0.001 (0.011)	Loss 5.0065 (5.1604)	Top-1 acc 13.672 (11.270)	Top-5 acc 28.125 (27.381)	lr 0.03985
Warmup Train [12][2930/3239]	Time 0.461 (0.513)	Data 0.001 (0.011)	Loss 4.9450 (5.1603)	Top-1 acc 13.281 (11.269)	Top-5 acc 29.688 (27.382)	lr 0.03985
Warmup Train [12][2940/3239]	Time 0.527 (0.513)	Data 0.001 (0.011)	Loss 5.1012 (5.1600)	Top-1 acc 9.375 (11.272)	Top-5 acc 28.516 (27.389)	lr 0.03984
Warmup Train [12][2950/3239]	Time 0.521 (0.513)	Data 0.001 (0.011)	Loss 5.2741 (5.1600)	Top-1 acc 10.547 (11.273)	Top-5 acc 23.828 (27.391)	lr 0.03984
Warmup Train [12][2960/3239]	Time 0.512 (0.513)	Data 0.001 (0.011)	Loss 4.8931 (5.1599)	Top-1 acc 10.938 (11.273)	Top-5 acc 34.766 (27.392)	lr 0.03983
Warmup Train [12][2970/3239]	Time 0.499 (0.513)	Data 0.001 (0.011)	Loss 5.1727 (5.1598)	Top-1 acc 10.547 (11.274)	Top-5 acc 28.516 (27.392)	lr 0.03983
Warmup Train [12][2980/3239]	Time 0.533 (0.513)	Data 0.001 (0.011)	Loss 5.3848 (5.1596)	Top-1 acc 9.375 (11.279)	Top-5 acc 20.312 (27.401)	lr 0.03982
Warmup Train [12][2990/3239]	Time 0.300 (0.513)	Data 0.001 (0.011)	Loss 5.3092 (5.1596)	Top-1 acc 8.984 (11.277)	Top-5 acc 26.953 (27.401)	lr 0.03982
Warmup Train [12][3000/3239]	Time 0.561 (0.513)	Data 0.001 (0.011)	Loss 5.1669 (5.1594)	Top-1 acc 8.984 (11.280)	Top-5 acc 30.078 (27.409)	lr 0.03981
Warmup Train [12][3010/3239]	Time 0.491 (0.513)	Data 0.001 (0.011)	Loss 5.0424 (5.1593)	Top-1 acc 13.281 (11.280)	Top-5 acc 29.297 (27.407)	lr 0.03981
Warmup Train [12][3020/3239]	Time 0.580 (0.513)	Data 0.001 (0.011)	Loss 5.1324 (5.1591)	Top-1 acc 9.375 (11.282)	Top-5 acc 31.641 (27.414)	lr 0.03980
Warmup Train [12][3030/3239]	Time 0.431 (0.513)	Data 0.001 (0.011)	Loss 5.1715 (5.1589)	Top-1 acc 13.281 (11.287)	Top-5 acc 24.219 (27.419)	lr 0.03980
Warmup Train [12][3040/3239]	Time 0.569 (0.513)	Data 0.001 (0.011)	Loss 5.1440 (5.1587)	Top-1 acc 10.547 (11.288)	Top-5 acc 28.125 (27.425)	lr 0.03979
Warmup Train [12][3050/3239]	Time 0.417 (0.513)	Data 0.001 (0.011)	Loss 5.1165 (5.1587)	Top-1 acc 14.062 (11.290)	Top-5 acc 31.641 (27.426)	lr 0.03979
Warmup Train [12][3060/3239]	Time 0.540 (0.513)	Data 0.001 (0.011)	Loss 5.1295 (5.1585)	Top-1 acc 15.625 (11.293)	Top-5 acc 27.344 (27.428)	lr 0.03978
Warmup Train [12][3070/3239]	Time 0.550 (0.513)	Data 0.001 (0.011)	Loss 5.2733 (5.1584)	Top-1 acc 10.156 (11.297)	Top-5 acc 22.266 (27.428)	lr 0.03978
Warmup Train [12][3080/3239]	Time 0.402 (0.513)	Data 0.001 (0.011)	Loss 5.1067 (5.1583)	Top-1 acc 9.766 (11.295)	Top-5 acc 26.953 (27.431)	lr 0.03977
Warmup Train [12][3090/3239]	Time 0.525 (0.513)	Data 0.001 (0.011)	Loss 5.0751 (5.1582)	Top-1 acc 13.281 (11.297)	Top-5 acc 27.344 (27.434)	lr 0.03977
Warmup Train [12][3100/3239]	Time 0.504 (0.513)	Data 0.001 (0.011)	Loss 5.1742 (5.1581)	Top-1 acc 11.328 (11.299)	Top-5 acc 25.000 (27.439)	lr 0.03976
Warmup Train [12][3110/3239]	Time 0.578 (0.513)	Data 0.001 (0.011)	Loss 5.1769 (5.1581)	Top-1 acc 12.891 (11.298)	Top-5 acc 28.906 (27.438)	lr 0.03976
Warmup Train [12][3120/3239]	Time 0.617 (0.513)	Data 0.001 (0.011)	Loss 5.0113 (5.1580)	Top-1 acc 17.188 (11.299)	Top-5 acc 33.984 (27.440)	lr 0.03975
Warmup Train [12][3130/3239]	Time 0.634 (0.513)	Data 0.001 (0.011)	Loss 5.1437 (5.1579)	Top-1 acc 11.719 (11.302)	Top-5 acc 30.469 (27.449)	lr 0.03975
Warmup Train [12][3140/3239]	Time 0.579 (0.513)	Data 0.001 (0.011)	Loss 4.9691 (5.1576)	Top-1 acc 17.188 (11.305)	Top-5 acc 32.812 (27.456)	lr 0.03974
Warmup Train [12][3150/3239]	Time 0.660 (0.513)	Data 0.001 (0.011)	Loss 5.0826 (5.1575)	Top-1 acc 12.891 (11.306)	Top-5 acc 28.125 (27.457)	lr 0.03974
Warmup Train [12][3160/3239]	Time 0.385 (0.513)	Data 0.001 (0.011)	Loss 5.0299 (5.1573)	Top-1 acc 12.500 (11.307)	Top-5 acc 31.250 (27.462)	lr 0.03973
Warmup Train [12][3170/3239]	Time 0.423 (0.513)	Data 0.001 (0.011)	Loss 5.0855 (5.1572)	Top-1 acc 10.547 (11.308)	Top-5 acc 28.125 (27.464)	lr 0.03973
Warmup Train [12][3180/3239]	Time 0.382 (0.513)	Data 0.000 (0.011)	Loss 5.2818 (5.1570)	Top-1 acc 10.156 (11.310)	Top-5 acc 24.219 (27.468)	lr 0.03972
Warmup Train [12][3190/3239]	Time 0.490 (0.513)	Data 0.000 (0.011)	Loss 5.2628 (5.1568)	Top-1 acc 10.938 (11.316)	Top-5 acc 26.562 (27.473)	lr 0.03972
Warmup Train [12][3200/3239]	Time 0.539 (0.512)	Data 0.000 (0.011)	Loss 5.1374 (5.1567)	Top-1 acc 11.719 (11.321)	Top-5 acc 27.734 (27.474)	lr 0.03971
Warmup Train [12][3210/3239]	Time 0.610 (0.512)	Data 0.000 (0.011)	Loss 5.0737 (5.1565)	Top-1 acc 12.500 (11.323)	Top-5 acc 28.516 (27.478)	lr 0.03971
Warmup Train [12][3220/3239]	Time 0.503 (0.512)	Data 0.000 (0.010)	Loss 5.0925 (5.1564)	Top-1 acc 11.719 (11.323)	Top-5 acc 27.734 (27.482)	lr 0.03970
Warmup Train [12][3230/3239]	Time 0.523 (0.512)	Data 0.000 (0.010)	Loss 5.0656 (5.1563)	Top-1 acc 13.281 (11.327)	Top-5 acc 28.516 (27.484)	lr 0.03970
Warmup Train [12][3239/3239]	Time 0.439 (0.512)	Data 0.000 (0.010)	Loss 5.1261 (5.1562)	Top-1 acc 8.642 (11.328)	Top-5 acc 27.160 (27.484)	lr 0.03970
==========Warmup Valid [12/40]	loss 4.367	top-1 acc 16.110	top-5 acc 35.899	Train top-1 11.328	top-5 27.484	flops: 442.4M
Warmup Train [13][0/3239]	Time 12.505 (12.505)	Data 9.410 (9.410)	Loss 5.0524 (5.0524)	Top-1 acc 12.891 (12.891)	Top-5 acc 32.812 (32.812)	lr 0.03969
Warmup Train [13][10/3239]	Time 0.631 (1.759)	Data 0.002 (0.946)	Loss 5.0938 (5.1005)	Top-1 acc 11.328 (11.861)	Top-5 acc 26.953 (28.942)	lr 0.03969
Warmup Train [13][20/3239]	Time 0.489 (1.157)	Data 0.001 (0.497)	Loss 5.2540 (5.0977)	Top-1 acc 7.812 (11.942)	Top-5 acc 24.219 (28.720)	lr 0.03968
Warmup Train [13][30/3239]	Time 0.537 (0.949)	Data 0.001 (0.337)	Loss 5.0995 (5.1130)	Top-1 acc 8.984 (12.147)	Top-5 acc 25.781 (28.314)	lr 0.03968
Warmup Train [13][40/3239]	Time 0.429 (0.832)	Data 0.001 (0.255)	Loss 5.1685 (5.1233)	Top-1 acc 10.547 (11.976)	Top-5 acc 26.172 (28.039)	lr 0.03968
Warmup Train [13][50/3239]	Time 0.441 (0.767)	Data 0.001 (0.207)	Loss 5.1433 (5.1112)	Top-1 acc 12.891 (12.224)	Top-5 acc 25.000 (28.240)	lr 0.03967
Warmup Train [13][60/3239]	Time 0.636 (0.721)	Data 0.001 (0.175)	Loss 5.0933 (5.1081)	Top-1 acc 8.594 (12.257)	Top-5 acc 28.125 (28.464)	lr 0.03967
Warmup Train [13][70/3239]	Time 0.389 (0.685)	Data 0.001 (0.150)	Loss 5.0837 (5.1032)	Top-1 acc 12.500 (12.230)	Top-5 acc 27.344 (28.576)	lr 0.03966
Warmup Train [13][80/3239]	Time 0.346 (0.657)	Data 0.001 (0.133)	Loss 4.9983 (5.1018)	Top-1 acc 9.766 (12.191)	Top-5 acc 31.250 (28.593)	lr 0.03966
Warmup Train [13][90/3239]	Time 0.515 (0.640)	Data 0.001 (0.121)	Loss 5.1528 (5.1040)	Top-1 acc 14.453 (12.092)	Top-5 acc 30.859 (28.674)	lr 0.03965
Warmup Train [13][100/3239]	Time 0.461 (0.628)	Data 0.001 (0.110)	Loss 5.1908 (5.1041)	Top-1 acc 14.062 (12.148)	Top-5 acc 29.297 (28.682)	lr 0.03965
Warmup Train [13][110/3239]	Time 0.508 (0.618)	Data 0.001 (0.101)	Loss 5.3032 (5.1017)	Top-1 acc 9.766 (12.211)	Top-5 acc 23.438 (28.776)	lr 0.03964
Warmup Train [13][120/3239]	Time 0.681 (0.609)	Data 0.001 (0.093)	Loss 5.0722 (5.0994)	Top-1 acc 11.328 (12.213)	Top-5 acc 26.172 (28.813)	lr 0.03964
Warmup Train [13][130/3239]	Time 0.459 (0.601)	Data 0.001 (0.086)	Loss 4.9868 (5.1009)	Top-1 acc 14.453 (12.211)	Top-5 acc 31.250 (28.799)	lr 0.03963
Warmup Train [13][140/3239]	Time 0.431 (0.595)	Data 0.001 (0.081)	Loss 4.9093 (5.0984)	Top-1 acc 11.328 (12.204)	Top-5 acc 32.422 (28.768)	lr 0.03963
Warmup Train [13][150/3239]	Time 0.469 (0.590)	Data 0.001 (0.076)	Loss 5.0667 (5.0968)	Top-1 acc 14.453 (12.257)	Top-5 acc 30.469 (28.818)	lr 0.03962
Warmup Train [13][160/3239]	Time 0.469 (0.585)	Data 0.001 (0.072)	Loss 5.0608 (5.0936)	Top-1 acc 11.328 (12.318)	Top-5 acc 27.344 (28.933)	lr 0.03962
Warmup Train [13][170/3239]	Time 0.554 (0.581)	Data 0.001 (0.069)	Loss 5.3020 (5.0939)	Top-1 acc 12.109 (12.285)	Top-5 acc 26.562 (28.936)	lr 0.03961
Warmup Train [13][180/3239]	Time 0.555 (0.578)	Data 0.001 (0.065)	Loss 5.1625 (5.0952)	Top-1 acc 12.891 (12.304)	Top-5 acc 30.469 (28.973)	lr 0.03961
Warmup Train [13][190/3239]	Time 0.470 (0.575)	Data 0.002 (0.062)	Loss 4.9820 (5.0946)	Top-1 acc 12.109 (12.310)	Top-5 acc 28.906 (28.980)	lr 0.03960
Warmup Train [13][200/3239]	Time 0.332 (0.572)	Data 0.001 (0.060)	Loss 5.1325 (5.0952)	Top-1 acc 10.938 (12.286)	Top-5 acc 27.734 (28.965)	lr 0.03960
Warmup Train [13][210/3239]	Time 0.536 (0.570)	Data 0.001 (0.058)	Loss 5.0999 (5.0947)	Top-1 acc 14.062 (12.296)	Top-5 acc 29.688 (28.962)	lr 0.03959
Warmup Train [13][220/3239]	Time 0.553 (0.568)	Data 0.002 (0.055)	Loss 4.8801 (5.0955)	Top-1 acc 15.234 (12.295)	Top-5 acc 36.719 (28.938)	lr 0.03959
Warmup Train [13][230/3239]	Time 0.337 (0.564)	Data 0.001 (0.053)	Loss 5.0783 (5.0968)	Top-1 acc 10.156 (12.284)	Top-5 acc 27.734 (28.913)	lr 0.03958
Warmup Train [13][240/3239]	Time 0.328 (0.562)	Data 0.002 (0.051)	Loss 5.0965 (5.0976)	Top-1 acc 12.500 (12.275)	Top-5 acc 28.906 (28.916)	lr 0.03958
Warmup Train [13][250/3239]	Time 0.318 (0.560)	Data 0.001 (0.050)	Loss 5.1402 (5.0982)	Top-1 acc 8.984 (12.248)	Top-5 acc 28.906 (28.898)	lr 0.03957
Warmup Train [13][260/3239]	Time 0.646 (0.559)	Data 0.001 (0.049)	Loss 4.9181 (5.0991)	Top-1 acc 16.797 (12.229)	Top-5 acc 33.984 (28.858)	lr 0.03957
Warmup Train [13][270/3239]	Time 0.505 (0.557)	Data 0.001 (0.047)	Loss 5.1672 (5.0997)	Top-1 acc 8.594 (12.205)	Top-5 acc 21.875 (28.826)	lr 0.03956
Warmup Train [13][280/3239]	Time 0.497 (0.555)	Data 0.001 (0.045)	Loss 5.2419 (5.1015)	Top-1 acc 11.719 (12.175)	Top-5 acc 27.734 (28.792)	lr 0.03956
Warmup Train [13][290/3239]	Time 0.584 (0.554)	Data 0.001 (0.044)	Loss 5.2773 (5.1010)	Top-1 acc 12.500 (12.170)	Top-5 acc 27.344 (28.785)	lr 0.03955
Warmup Train [13][300/3239]	Time 0.572 (0.553)	Data 0.001 (0.043)	Loss 5.0867 (5.1023)	Top-1 acc 11.719 (12.147)	Top-5 acc 30.078 (28.754)	lr 0.03955
Warmup Train [13][310/3239]	Time 0.388 (0.552)	Data 0.001 (0.041)	Loss 4.9869 (5.0999)	Top-1 acc 10.938 (12.151)	Top-5 acc 31.641 (28.802)	lr 0.03954
Warmup Train [13][320/3239]	Time 0.497 (0.549)	Data 0.001 (0.040)	Loss 4.8793 (5.0966)	Top-1 acc 14.453 (12.165)	Top-5 acc 32.812 (28.887)	lr 0.03954
Warmup Train [13][330/3239]	Time 0.465 (0.548)	Data 0.001 (0.039)	Loss 5.0948 (5.0971)	Top-1 acc 11.328 (12.146)	Top-5 acc 28.516 (28.847)	lr 0.03953
Warmup Train [13][340/3239]	Time 0.281 (0.545)	Data 0.001 (0.038)	Loss 5.1544 (5.0966)	Top-1 acc 10.156 (12.123)	Top-5 acc 26.172 (28.851)	lr 0.03953
Warmup Train [13][350/3239]	Time 0.469 (0.544)	Data 0.001 (0.038)	Loss 5.1271 (5.0958)	Top-1 acc 13.281 (12.139)	Top-5 acc 29.688 (28.896)	lr 0.03952
Warmup Train [13][360/3239]	Time 0.367 (0.542)	Data 0.001 (0.037)	Loss 5.0620 (5.0952)	Top-1 acc 9.375 (12.136)	Top-5 acc 28.125 (28.892)	lr 0.03952
Warmup Train [13][370/3239]	Time 0.323 (0.539)	Data 0.001 (0.036)	Loss 5.0982 (5.0950)	Top-1 acc 13.672 (12.153)	Top-5 acc 28.516 (28.917)	lr 0.03951
Warmup Train [13][380/3239]	Time 0.291 (0.538)	Data 0.001 (0.036)	Loss 5.1700 (5.0952)	Top-1 acc 11.719 (12.147)	Top-5 acc 25.781 (28.932)	lr 0.03951
Warmup Train [13][390/3239]	Time 0.435 (0.537)	Data 0.001 (0.035)	Loss 5.0265 (5.0952)	Top-1 acc 12.109 (12.114)	Top-5 acc 32.812 (28.942)	lr 0.03950
Warmup Train [13][400/3239]	Time 0.396 (0.537)	Data 0.001 (0.035)	Loss 5.2960 (5.0964)	Top-1 acc 8.984 (12.090)	Top-5 acc 23.047 (28.890)	lr 0.03950
Warmup Train [13][410/3239]	Time 0.575 (0.535)	Data 0.001 (0.034)	Loss 5.0734 (5.0970)	Top-1 acc 14.453 (12.095)	Top-5 acc 26.953 (28.882)	lr 0.03949
Warmup Train [13][420/3239]	Time 0.498 (0.535)	Data 0.001 (0.034)	Loss 5.1334 (5.0971)	Top-1 acc 10.938 (12.088)	Top-5 acc 28.125 (28.875)	lr 0.03949
Warmup Train [13][430/3239]	Time 0.645 (0.534)	Data 0.001 (0.033)	Loss 5.2215 (5.0973)	Top-1 acc 10.938 (12.089)	Top-5 acc 25.781 (28.882)	lr 0.03948
Warmup Train [13][440/3239]	Time 0.510 (0.534)	Data 0.001 (0.032)	Loss 4.8730 (5.0959)	Top-1 acc 14.844 (12.101)	Top-5 acc 34.375 (28.905)	lr 0.03948
Warmup Train [13][450/3239]	Time 0.481 (0.534)	Data 0.001 (0.032)	Loss 5.1377 (5.0955)	Top-1 acc 12.109 (12.121)	Top-5 acc 30.469 (28.924)	lr 0.03947
Warmup Train [13][460/3239]	Time 0.506 (0.533)	Data 0.002 (0.031)	Loss 5.1939 (5.0952)	Top-1 acc 11.719 (12.132)	Top-5 acc 26.953 (28.941)	lr 0.03947
Warmup Train [13][470/3239]	Time 0.445 (0.532)	Data 0.001 (0.030)	Loss 5.1390 (5.0953)	Top-1 acc 8.984 (12.138)	Top-5 acc 25.391 (28.938)	lr 0.03946
Warmup Train [13][480/3239]	Time 0.637 (0.532)	Data 0.001 (0.030)	Loss 5.2324 (5.0949)	Top-1 acc 11.328 (12.143)	Top-5 acc 23.047 (28.926)	lr 0.03946
Warmup Train [13][490/3239]	Time 0.462 (0.532)	Data 0.001 (0.029)	Loss 5.0151 (5.0942)	Top-1 acc 12.891 (12.162)	Top-5 acc 28.125 (28.929)	lr 0.03945
Warmup Train [13][500/3239]	Time 0.400 (0.531)	Data 0.001 (0.029)	Loss 5.0262 (5.0942)	Top-1 acc 9.766 (12.149)	Top-5 acc 31.250 (28.933)	lr 0.03945
Warmup Train [13][510/3239]	Time 0.649 (0.531)	Data 0.001 (0.028)	Loss 5.0047 (5.0948)	Top-1 acc 13.672 (12.152)	Top-5 acc 29.688 (28.930)	lr 0.03944
Warmup Train [13][520/3239]	Time 0.467 (0.530)	Data 0.001 (0.028)	Loss 5.0569 (5.0951)	Top-1 acc 12.891 (12.141)	Top-5 acc 29.688 (28.917)	lr 0.03944
Warmup Train [13][530/3239]	Time 0.624 (0.530)	Data 0.001 (0.028)	Loss 5.0954 (5.0957)	Top-1 acc 11.328 (12.123)	Top-5 acc 30.078 (28.893)	lr 0.03943
Warmup Train [13][540/3239]	Time 0.571 (0.530)	Data 0.001 (0.027)	Loss 5.0442 (5.0963)	Top-1 acc 12.891 (12.128)	Top-5 acc 28.516 (28.876)	lr 0.03943
Warmup Train [13][550/3239]	Time 0.549 (0.530)	Data 0.001 (0.027)	Loss 4.9549 (5.0955)	Top-1 acc 14.453 (12.158)	Top-5 acc 31.250 (28.894)	lr 0.03942
Warmup Train [13][560/3239]	Time 0.519 (0.530)	Data 0.001 (0.026)	Loss 5.0228 (5.0955)	Top-1 acc 14.062 (12.156)	Top-5 acc 31.641 (28.899)	lr 0.03942
Warmup Train [13][570/3239]	Time 0.569 (0.530)	Data 0.001 (0.026)	Loss 5.1314 (5.0956)	Top-1 acc 13.281 (12.158)	Top-5 acc 28.516 (28.883)	lr 0.03941
Warmup Train [13][580/3239]	Time 0.644 (0.530)	Data 0.001 (0.025)	Loss 5.0325 (5.0950)	Top-1 acc 16.016 (12.159)	Top-5 acc 32.422 (28.883)	lr 0.03941
Warmup Train [13][590/3239]	Time 0.649 (0.529)	Data 0.001 (0.025)	Loss 5.0779 (5.0939)	Top-1 acc 14.062 (12.186)	Top-5 acc 31.641 (28.910)	lr 0.03940
Warmup Train [13][600/3239]	Time 0.519 (0.529)	Data 0.001 (0.025)	Loss 5.2017 (5.0945)	Top-1 acc 10.156 (12.189)	Top-5 acc 24.219 (28.898)	lr 0.03940
Warmup Train [13][610/3239]	Time 0.602 (0.528)	Data 0.001 (0.024)	Loss 5.1757 (5.0953)	Top-1 acc 10.547 (12.188)	Top-5 acc 27.344 (28.882)	lr 0.03939
Warmup Train [13][620/3239]	Time 0.538 (0.528)	Data 0.001 (0.024)	Loss 5.0024 (5.0950)	Top-1 acc 12.891 (12.187)	Top-5 acc 29.297 (28.893)	lr 0.03939
Warmup Train [13][630/3239]	Time 0.538 (0.527)	Data 0.001 (0.024)	Loss 4.9869 (5.0945)	Top-1 acc 16.016 (12.190)	Top-5 acc 34.766 (28.920)	lr 0.03938
Warmup Train [13][640/3239]	Time 0.626 (0.527)	Data 0.001 (0.023)	Loss 5.1372 (5.0944)	Top-1 acc 15.625 (12.201)	Top-5 acc 30.859 (28.939)	lr 0.03938
Warmup Train [13][650/3239]	Time 0.549 (0.526)	Data 0.001 (0.023)	Loss 5.2007 (5.0944)	Top-1 acc 10.938 (12.201)	Top-5 acc 25.781 (28.934)	lr 0.03937
Warmup Train [13][660/3239]	Time 0.523 (0.526)	Data 0.001 (0.023)	Loss 5.0553 (5.0936)	Top-1 acc 17.188 (12.220)	Top-5 acc 30.859 (28.944)	lr 0.03937
Warmup Train [13][670/3239]	Time 0.617 (0.525)	Data 0.001 (0.022)	Loss 5.0103 (5.0937)	Top-1 acc 12.109 (12.214)	Top-5 acc 27.734 (28.928)	lr 0.03936
Warmup Train [13][680/3239]	Time 0.488 (0.525)	Data 0.001 (0.022)	Loss 5.2328 (5.0942)	Top-1 acc 8.984 (12.214)	Top-5 acc 26.172 (28.907)	lr 0.03936
Warmup Train [13][690/3239]	Time 0.534 (0.525)	Data 0.001 (0.022)	Loss 5.0549 (5.0938)	Top-1 acc 10.938 (12.217)	Top-5 acc 27.734 (28.927)	lr 0.03935
Warmup Train [13][700/3239]	Time 0.599 (0.525)	Data 0.001 (0.021)	Loss 5.0569 (5.0936)	Top-1 acc 12.109 (12.209)	Top-5 acc 30.469 (28.921)	lr 0.03935
Warmup Train [13][710/3239]	Time 0.654 (0.525)	Data 0.001 (0.021)	Loss 4.9872 (5.0928)	Top-1 acc 13.281 (12.226)	Top-5 acc 32.422 (28.943)	lr 0.03934
Warmup Train [13][720/3239]	Time 0.511 (0.525)	Data 0.001 (0.021)	Loss 5.0999 (5.0924)	Top-1 acc 12.500 (12.224)	Top-5 acc 28.125 (28.949)	lr 0.03934
Warmup Train [13][730/3239]	Time 0.539 (0.525)	Data 0.001 (0.021)	Loss 5.0883 (5.0933)	Top-1 acc 15.234 (12.204)	Top-5 acc 32.812 (28.927)	lr 0.03933
Warmup Train [13][740/3239]	Time 0.570 (0.525)	Data 0.001 (0.021)	Loss 5.1365 (5.0936)	Top-1 acc 9.375 (12.188)	Top-5 acc 27.344 (28.917)	lr 0.03933
Warmup Train [13][750/3239]	Time 0.444 (0.525)	Data 0.001 (0.020)	Loss 5.0087 (5.0934)	Top-1 acc 11.719 (12.189)	Top-5 acc 27.344 (28.924)	lr 0.03932
Warmup Train [13][760/3239]	Time 0.528 (0.525)	Data 0.001 (0.020)	Loss 4.9567 (5.0932)	Top-1 acc 11.719 (12.192)	Top-5 acc 29.297 (28.933)	lr 0.03932
Warmup Train [13][770/3239]	Time 0.464 (0.525)	Data 0.001 (0.020)	Loss 5.2332 (5.0941)	Top-1 acc 10.938 (12.183)	Top-5 acc 25.000 (28.919)	lr 0.03931
Warmup Train [13][780/3239]	Time 0.491 (0.524)	Data 0.001 (0.020)	Loss 5.1488 (5.0940)	Top-1 acc 12.109 (12.188)	Top-5 acc 24.609 (28.920)	lr 0.03931
Warmup Train [13][790/3239]	Time 0.628 (0.524)	Data 0.001 (0.020)	Loss 5.0254 (5.0933)	Top-1 acc 15.234 (12.205)	Top-5 acc 31.250 (28.941)	lr 0.03930
Warmup Train [13][800/3239]	Time 0.517 (0.524)	Data 0.001 (0.019)	Loss 4.9777 (5.0934)	Top-1 acc 13.672 (12.208)	Top-5 acc 30.859 (28.949)	lr 0.03930
Warmup Train [13][810/3239]	Time 0.416 (0.524)	Data 0.001 (0.019)	Loss 5.0585 (5.0930)	Top-1 acc 12.891 (12.213)	Top-5 acc 30.078 (28.968)	lr 0.03929
Warmup Train [13][820/3239]	Time 0.525 (0.524)	Data 0.001 (0.019)	Loss 5.1522 (5.0928)	Top-1 acc 10.156 (12.218)	Top-5 acc 26.172 (28.969)	lr 0.03929
Warmup Train [13][830/3239]	Time 0.306 (0.524)	Data 0.001 (0.019)	Loss 5.2312 (5.0931)	Top-1 acc 9.766 (12.213)	Top-5 acc 28.125 (28.968)	lr 0.03928
Warmup Train [13][840/3239]	Time 0.544 (0.524)	Data 0.001 (0.019)	Loss 4.9363 (5.0934)	Top-1 acc 14.844 (12.217)	Top-5 acc 34.766 (28.955)	lr 0.03928
Warmup Train [13][850/3239]	Time 0.447 (0.524)	Data 0.001 (0.019)	Loss 4.9296 (5.0925)	Top-1 acc 14.453 (12.226)	Top-5 acc 31.250 (28.981)	lr 0.03927
Warmup Train [13][860/3239]	Time 0.453 (0.524)	Data 0.001 (0.019)	Loss 4.9387 (5.0922)	Top-1 acc 13.672 (12.225)	Top-5 acc 32.031 (28.988)	lr 0.03927
Warmup Train [13][870/3239]	Time 0.372 (0.524)	Data 0.001 (0.018)	Loss 5.1012 (5.0919)	Top-1 acc 11.719 (12.226)	Top-5 acc 31.250 (28.992)	lr 0.03926
Warmup Train [13][880/3239]	Time 0.476 (0.523)	Data 0.001 (0.018)	Loss 5.1085 (5.0918)	Top-1 acc 9.766 (12.222)	Top-5 acc 31.641 (29.002)	lr 0.03926
Warmup Train [13][890/3239]	Time 0.542 (0.523)	Data 0.002 (0.018)	Loss 5.0989 (5.0916)	Top-1 acc 11.719 (12.219)	Top-5 acc 27.344 (29.004)	lr 0.03925
Warmup Train [13][900/3239]	Time 0.339 (0.523)	Data 0.001 (0.018)	Loss 5.2197 (5.0922)	Top-1 acc 11.328 (12.224)	Top-5 acc 30.078 (29.005)	lr 0.03925
Warmup Train [13][910/3239]	Time 0.287 (0.522)	Data 0.001 (0.018)	Loss 5.2195 (5.0922)	Top-1 acc 14.453 (12.237)	Top-5 acc 28.125 (29.010)	lr 0.03924
Warmup Train [13][920/3239]	Time 0.199 (0.522)	Data 0.001 (0.018)	Loss 5.0571 (5.0918)	Top-1 acc 9.375 (12.237)	Top-5 acc 30.469 (29.026)	lr 0.03924
Warmup Train [13][930/3239]	Time 0.670 (0.522)	Data 0.001 (0.018)	Loss 5.0997 (5.0915)	Top-1 acc 11.328 (12.238)	Top-5 acc 28.516 (29.023)	lr 0.03923
Warmup Train [13][940/3239]	Time 0.475 (0.522)	Data 0.001 (0.018)	Loss 4.8566 (5.0913)	Top-1 acc 17.578 (12.240)	Top-5 acc 34.766 (29.032)	lr 0.03923
Warmup Train [13][950/3239]	Time 0.660 (0.522)	Data 0.001 (0.018)	Loss 5.0310 (5.0915)	Top-1 acc 12.109 (12.239)	Top-5 acc 33.203 (29.033)	lr 0.03923
Warmup Train [13][960/3239]	Time 0.526 (0.522)	Data 0.001 (0.018)	Loss 5.1029 (5.0914)	Top-1 acc 10.938 (12.232)	Top-5 acc 29.688 (29.037)	lr 0.03922
Warmup Train [13][970/3239]	Time 0.562 (0.522)	Data 0.001 (0.017)	Loss 4.8699 (5.0912)	Top-1 acc 16.016 (12.224)	Top-5 acc 34.766 (29.030)	lr 0.03922
Warmup Train [13][980/3239]	Time 0.364 (0.521)	Data 0.001 (0.017)	Loss 5.1417 (5.0907)	Top-1 acc 8.984 (12.229)	Top-5 acc 29.688 (29.036)	lr 0.03921
Warmup Train [13][990/3239]	Time 0.503 (0.522)	Data 0.001 (0.017)	Loss 5.2196 (5.0908)	Top-1 acc 8.203 (12.230)	Top-5 acc 26.562 (29.047)	lr 0.03921
Warmup Train [13][1000/3239]	Time 0.546 (0.522)	Data 0.001 (0.017)	Loss 5.2135 (5.0904)	Top-1 acc 10.547 (12.242)	Top-5 acc 26.172 (29.056)	lr 0.03920
Warmup Train [13][1010/3239]	Time 0.514 (0.522)	Data 0.001 (0.017)	Loss 4.9902 (5.0898)	Top-1 acc 12.500 (12.249)	Top-5 acc 32.031 (29.071)	lr 0.03920
Warmup Train [13][1020/3239]	Time 0.607 (0.522)	Data 0.001 (0.017)	Loss 5.1081 (5.0898)	Top-1 acc 8.984 (12.254)	Top-5 acc 26.562 (29.072)	lr 0.03919
Warmup Train [13][1030/3239]	Time 0.460 (0.521)	Data 0.001 (0.017)	Loss 5.0284 (5.0895)	Top-1 acc 9.375 (12.251)	Top-5 acc 28.516 (29.086)	lr 0.03919
Warmup Train [13][1040/3239]	Time 0.645 (0.521)	Data 0.001 (0.017)	Loss 5.0264 (5.0896)	Top-1 acc 15.234 (12.253)	Top-5 acc 30.469 (29.089)	lr 0.03918
Warmup Train [13][1050/3239]	Time 0.567 (0.521)	Data 0.002 (0.017)	Loss 5.0941 (5.0896)	Top-1 acc 14.062 (12.256)	Top-5 acc 29.297 (29.094)	lr 0.03918
Warmup Train [13][1060/3239]	Time 0.660 (0.521)	Data 0.002 (0.016)	Loss 4.9738 (5.0891)	Top-1 acc 13.672 (12.256)	Top-5 acc 28.906 (29.104)	lr 0.03917
Warmup Train [13][1070/3239]	Time 0.571 (0.521)	Data 0.001 (0.016)	Loss 5.0031 (5.0888)	Top-1 acc 10.156 (12.254)	Top-5 acc 30.078 (29.110)	lr 0.03917
Warmup Train [13][1080/3239]	Time 0.416 (0.521)	Data 0.001 (0.016)	Loss 5.1406 (5.0888)	Top-1 acc 10.156 (12.252)	Top-5 acc 27.344 (29.109)	lr 0.03916
Warmup Train [13][1090/3239]	Time 0.515 (0.521)	Data 0.001 (0.016)	Loss 5.0986 (5.0886)	Top-1 acc 8.203 (12.249)	Top-5 acc 30.859 (29.114)	lr 0.03916
Warmup Train [13][1100/3239]	Time 0.357 (0.521)	Data 0.001 (0.016)	Loss 5.3039 (5.0881)	Top-1 acc 8.203 (12.253)	Top-5 acc 23.828 (29.123)	lr 0.03915
Warmup Train [13][1110/3239]	Time 0.557 (0.521)	Data 0.001 (0.016)	Loss 5.2221 (5.0877)	Top-1 acc 11.328 (12.254)	Top-5 acc 28.516 (29.135)	lr 0.03915
Warmup Train [13][1120/3239]	Time 0.703 (0.521)	Data 0.001 (0.016)	Loss 5.0345 (5.0876)	Top-1 acc 11.328 (12.252)	Top-5 acc 30.859 (29.140)	lr 0.03914
Warmup Train [13][1130/3239]	Time 0.415 (0.521)	Data 0.001 (0.016)	Loss 5.1152 (5.0873)	Top-1 acc 15.234 (12.265)	Top-5 acc 25.781 (29.149)	lr 0.03914
Warmup Train [13][1140/3239]	Time 0.572 (0.521)	Data 0.001 (0.016)	Loss 5.0775 (5.0874)	Top-1 acc 13.281 (12.263)	Top-5 acc 28.906 (29.151)	lr 0.03913
Warmup Train [13][1150/3239]	Time 0.741 (0.521)	Data 0.001 (0.016)	Loss 5.0872 (5.0873)	Top-1 acc 12.109 (12.267)	Top-5 acc 28.906 (29.159)	lr 0.03913
Warmup Train [13][1160/3239]	Time 0.588 (0.520)	Data 0.001 (0.016)	Loss 4.9314 (5.0870)	Top-1 acc 14.844 (12.274)	Top-5 acc 31.641 (29.178)	lr 0.03912
Warmup Train [13][1170/3239]	Time 0.545 (0.520)	Data 0.001 (0.015)	Loss 5.0960 (5.0868)	Top-1 acc 12.891 (12.285)	Top-5 acc 29.297 (29.181)	lr 0.03912
Warmup Train [13][1180/3239]	Time 0.514 (0.520)	Data 0.001 (0.015)	Loss 4.9634 (5.0861)	Top-1 acc 10.547 (12.288)	Top-5 acc 30.469 (29.207)	lr 0.03911
Warmup Train [13][1190/3239]	Time 0.593 (0.520)	Data 0.001 (0.015)	Loss 5.1289 (5.0858)	Top-1 acc 12.891 (12.295)	Top-5 acc 28.906 (29.210)	lr 0.03911
Warmup Train [13][1200/3239]	Time 0.434 (0.519)	Data 0.001 (0.015)	Loss 5.1058 (5.0852)	Top-1 acc 11.719 (12.297)	Top-5 acc 29.297 (29.226)	lr 0.03910
Warmup Train [13][1210/3239]	Time 0.511 (0.519)	Data 0.001 (0.015)	Loss 4.8331 (5.0848)	Top-1 acc 16.797 (12.296)	Top-5 acc 34.766 (29.229)	lr 0.03910
Warmup Train [13][1220/3239]	Time 0.580 (0.519)	Data 0.001 (0.015)	Loss 5.1301 (5.0846)	Top-1 acc 14.844 (12.306)	Top-5 acc 28.516 (29.237)	lr 0.03909
Warmup Train [13][1230/3239]	Time 0.521 (0.519)	Data 0.001 (0.015)	Loss 5.1170 (5.0847)	Top-1 acc 14.453 (12.310)	Top-5 acc 31.250 (29.237)	lr 0.03909
Warmup Train [13][1240/3239]	Time 0.310 (0.519)	Data 0.001 (0.015)	Loss 5.0553 (5.0844)	Top-1 acc 15.234 (12.316)	Top-5 acc 30.469 (29.242)	lr 0.03908
Warmup Train [13][1250/3239]	Time 0.746 (0.519)	Data 0.001 (0.015)	Loss 5.0079 (5.0847)	Top-1 acc 11.719 (12.307)	Top-5 acc 28.516 (29.232)	lr 0.03908
Warmup Train [13][1260/3239]	Time 0.537 (0.519)	Data 0.001 (0.015)	Loss 5.1336 (5.0848)	Top-1 acc 9.766 (12.304)	Top-5 acc 27.344 (29.237)	lr 0.03907
Warmup Train [13][1270/3239]	Time 0.409 (0.519)	Data 0.002 (0.015)	Loss 5.1505 (5.0846)	Top-1 acc 10.938 (12.309)	Top-5 acc 26.953 (29.238)	lr 0.03907
Warmup Train [13][1280/3239]	Time 0.455 (0.519)	Data 0.001 (0.015)	Loss 5.0349 (5.0846)	Top-1 acc 12.891 (12.308)	Top-5 acc 28.906 (29.244)	lr 0.03906
Warmup Train [13][1290/3239]	Time 0.575 (0.519)	Data 0.001 (0.015)	Loss 5.0807 (5.0847)	Top-1 acc 15.234 (12.311)	Top-5 acc 28.516 (29.239)	lr 0.03906
Warmup Train [13][1300/3239]	Time 0.635 (0.519)	Data 0.001 (0.014)	Loss 5.0372 (5.0844)	Top-1 acc 14.844 (12.325)	Top-5 acc 32.031 (29.242)	lr 0.03905
Warmup Train [13][1310/3239]	Time 0.569 (0.519)	Data 0.001 (0.014)	Loss 5.0234 (5.0845)	Top-1 acc 12.109 (12.319)	Top-5 acc 32.812 (29.244)	lr 0.03905
Warmup Train [13][1320/3239]	Time 0.409 (0.519)	Data 0.001 (0.014)	Loss 4.9347 (5.0844)	Top-1 acc 15.625 (12.317)	Top-5 acc 31.250 (29.247)	lr 0.03904
Warmup Train [13][1330/3239]	Time 0.511 (0.519)	Data 0.001 (0.014)	Loss 5.1831 (5.0844)	Top-1 acc 12.500 (12.320)	Top-5 acc 28.906 (29.252)	lr 0.03904
Warmup Train [13][1340/3239]	Time 0.551 (0.519)	Data 0.001 (0.014)	Loss 5.2122 (5.0846)	Top-1 acc 12.891 (12.316)	Top-5 acc 28.516 (29.245)	lr 0.03903
Warmup Train [13][1350/3239]	Time 0.574 (0.519)	Data 0.002 (0.014)	Loss 5.2282 (5.0848)	Top-1 acc 6.250 (12.307)	Top-5 acc 26.172 (29.241)	lr 0.03903
Warmup Train [13][1360/3239]	Time 0.536 (0.519)	Data 0.001 (0.014)	Loss 5.0636 (5.0845)	Top-1 acc 11.328 (12.307)	Top-5 acc 31.250 (29.246)	lr 0.03902
Warmup Train [13][1370/3239]	Time 0.504 (0.519)	Data 0.001 (0.014)	Loss 5.1546 (5.0846)	Top-1 acc 10.547 (12.306)	Top-5 acc 26.172 (29.238)	lr 0.03901
Warmup Train [13][1380/3239]	Time 0.540 (0.519)	Data 0.001 (0.014)	Loss 5.0130 (5.0846)	Top-1 acc 12.891 (12.306)	Top-5 acc 28.516 (29.239)	lr 0.03901
Warmup Train [13][1390/3239]	Time 0.593 (0.518)	Data 0.001 (0.014)	Loss 5.1425 (5.0849)	Top-1 acc 12.891 (12.298)	Top-5 acc 28.906 (29.231)	lr 0.03900
Warmup Train [13][1400/3239]	Time 0.485 (0.518)	Data 0.001 (0.014)	Loss 4.9713 (5.0848)	Top-1 acc 14.062 (12.303)	Top-5 acc 32.031 (29.230)	lr 0.03900
Warmup Train [13][1410/3239]	Time 0.623 (0.518)	Data 0.001 (0.014)	Loss 5.0530 (5.0846)	Top-1 acc 10.156 (12.309)	Top-5 acc 30.469 (29.237)	lr 0.03899
Warmup Train [13][1420/3239]	Time 0.529 (0.518)	Data 0.002 (0.014)	Loss 4.9436 (5.0846)	Top-1 acc 14.453 (12.313)	Top-5 acc 33.203 (29.237)	lr 0.03899
Warmup Train [13][1430/3239]	Time 0.507 (0.518)	Data 0.001 (0.014)	Loss 5.1263 (5.0845)	Top-1 acc 12.500 (12.316)	Top-5 acc 29.297 (29.235)	lr 0.03898
Warmup Train [13][1440/3239]	Time 0.421 (0.518)	Data 0.002 (0.014)	Loss 5.0536 (5.0842)	Top-1 acc 13.672 (12.327)	Top-5 acc 31.250 (29.243)	lr 0.03898
Warmup Train [13][1450/3239]	Time 0.420 (0.518)	Data 0.001 (0.014)	Loss 5.0319 (5.0842)	Top-1 acc 13.672 (12.330)	Top-5 acc 31.250 (29.250)	lr 0.03897
Warmup Train [13][1460/3239]	Time 0.654 (0.518)	Data 0.001 (0.014)	Loss 4.8634 (5.0838)	Top-1 acc 16.797 (12.335)	Top-5 acc 38.281 (29.267)	lr 0.03897
Warmup Train [13][1470/3239]	Time 0.553 (0.518)	Data 0.001 (0.014)	Loss 4.9556 (5.0835)	Top-1 acc 11.719 (12.335)	Top-5 acc 32.422 (29.266)	lr 0.03896
Warmup Train [13][1480/3239]	Time 0.560 (0.517)	Data 0.001 (0.013)	Loss 5.2380 (5.0836)	Top-1 acc 10.156 (12.332)	Top-5 acc 25.781 (29.266)	lr 0.03896
Warmup Train [13][1490/3239]	Time 0.436 (0.517)	Data 0.001 (0.013)	Loss 5.1063 (5.0833)	Top-1 acc 11.719 (12.343)	Top-5 acc 31.250 (29.276)	lr 0.03895
Warmup Train [13][1500/3239]	Time 0.607 (0.517)	Data 0.001 (0.013)	Loss 5.1474 (5.0831)	Top-1 acc 12.891 (12.353)	Top-5 acc 26.953 (29.278)	lr 0.03895
Warmup Train [13][1510/3239]	Time 0.488 (0.517)	Data 0.001 (0.013)	Loss 5.0858 (5.0832)	Top-1 acc 12.500 (12.357)	Top-5 acc 31.641 (29.280)	lr 0.03894
Warmup Train [13][1520/3239]	Time 0.342 (0.517)	Data 0.001 (0.013)	Loss 5.1915 (5.0833)	Top-1 acc 12.500 (12.361)	Top-5 acc 27.344 (29.282)	lr 0.03894
Warmup Train [13][1530/3239]	Time 0.519 (0.517)	Data 0.001 (0.013)	Loss 5.0538 (5.0829)	Top-1 acc 12.109 (12.368)	Top-5 acc 30.078 (29.292)	lr 0.03893
Warmup Train [13][1540/3239]	Time 0.437 (0.517)	Data 0.001 (0.013)	Loss 5.0273 (5.0825)	Top-1 acc 16.797 (12.382)	Top-5 acc 31.641 (29.297)	lr 0.03893
Warmup Train [13][1550/3239]	Time 0.516 (0.517)	Data 0.001 (0.013)	Loss 5.0827 (5.0821)	Top-1 acc 12.109 (12.390)	Top-5 acc 29.297 (29.301)	lr 0.03892
Warmup Train [13][1560/3239]	Time 0.552 (0.517)	Data 0.001 (0.013)	Loss 4.9055 (5.0818)	Top-1 acc 15.234 (12.391)	Top-5 acc 33.984 (29.301)	lr 0.03892
Warmup Train [13][1570/3239]	Time 0.624 (0.517)	Data 0.001 (0.013)	Loss 5.0457 (5.0818)	Top-1 acc 13.281 (12.388)	Top-5 acc 30.078 (29.300)	lr 0.03891
Warmup Train [13][1580/3239]	Time 0.452 (0.517)	Data 0.001 (0.013)	Loss 5.0567 (5.0818)	Top-1 acc 11.719 (12.383)	Top-5 acc 29.688 (29.302)	lr 0.03891
Warmup Train [13][1590/3239]	Time 0.578 (0.517)	Data 0.001 (0.013)	Loss 5.0372 (5.0815)	Top-1 acc 11.328 (12.384)	Top-5 acc 28.906 (29.306)	lr 0.03890
Warmup Train [13][1600/3239]	Time 0.515 (0.517)	Data 0.001 (0.013)	Loss 5.1885 (5.0814)	Top-1 acc 8.203 (12.387)	Top-5 acc 22.266 (29.311)	lr 0.03890
Warmup Train [13][1610/3239]	Time 0.333 (0.517)	Data 0.001 (0.013)	Loss 5.0463 (5.0809)	Top-1 acc 13.672 (12.396)	Top-5 acc 28.516 (29.327)	lr 0.03889
Warmup Train [13][1620/3239]	Time 0.638 (0.517)	Data 0.001 (0.013)	Loss 5.0586 (5.0809)	Top-1 acc 14.062 (12.402)	Top-5 acc 28.906 (29.329)	lr 0.03889
Warmup Train [13][1630/3239]	Time 0.581 (0.517)	Data 0.001 (0.013)	Loss 5.1731 (5.0808)	Top-1 acc 8.594 (12.403)	Top-5 acc 26.172 (29.329)	lr 0.03888
Warmup Train [13][1640/3239]	Time 0.578 (0.517)	Data 0.001 (0.013)	Loss 4.9565 (5.0807)	Top-1 acc 14.844 (12.405)	Top-5 acc 30.859 (29.334)	lr 0.03888
Warmup Train [13][1650/3239]	Time 0.503 (0.517)	Data 0.001 (0.013)	Loss 5.0857 (5.0802)	Top-1 acc 15.625 (12.410)	Top-5 acc 32.031 (29.348)	lr 0.03887
Warmup Train [13][1660/3239]	Time 0.392 (0.517)	Data 0.001 (0.013)	Loss 5.0480 (5.0802)	Top-1 acc 12.891 (12.411)	Top-5 acc 26.953 (29.345)	lr 0.03887
Warmup Train [13][1670/3239]	Time 0.560 (0.517)	Data 0.001 (0.013)	Loss 5.1501 (5.0803)	Top-1 acc 8.984 (12.410)	Top-5 acc 24.609 (29.338)	lr 0.03886
Warmup Train [13][1680/3239]	Time 0.795 (0.517)	Data 0.001 (0.013)	Loss 5.0798 (5.0798)	Top-1 acc 13.281 (12.414)	Top-5 acc 30.859 (29.350)	lr 0.03886
Warmup Train [13][1690/3239]	Time 0.622 (0.517)	Data 0.001 (0.013)	Loss 4.9812 (5.0797)	Top-1 acc 10.938 (12.414)	Top-5 acc 29.297 (29.344)	lr 0.03885
Warmup Train [13][1700/3239]	Time 0.604 (0.517)	Data 0.001 (0.012)	Loss 5.0976 (5.0796)	Top-1 acc 13.672 (12.416)	Top-5 acc 32.031 (29.352)	lr 0.03885
Warmup Train [13][1710/3239]	Time 0.205 (0.517)	Data 0.001 (0.012)	Loss 4.9288 (5.0794)	Top-1 acc 14.062 (12.418)	Top-5 acc 31.250 (29.357)	lr 0.03884
Warmup Train [13][1720/3239]	Time 0.581 (0.517)	Data 0.001 (0.012)	Loss 5.0606 (5.0791)	Top-1 acc 13.672 (12.422)	Top-5 acc 30.469 (29.364)	lr 0.03884
Warmup Train [13][1730/3239]	Time 0.449 (0.517)	Data 0.001 (0.012)	Loss 5.0434 (5.0789)	Top-1 acc 11.719 (12.423)	Top-5 acc 25.781 (29.362)	lr 0.03883
Warmup Train [13][1740/3239]	Time 0.482 (0.516)	Data 0.002 (0.012)	Loss 5.0201 (5.0786)	Top-1 acc 14.844 (12.428)	Top-5 acc 29.688 (29.368)	lr 0.03883
Warmup Train [13][1750/3239]	Time 0.320 (0.516)	Data 0.001 (0.012)	Loss 5.0111 (5.0784)	Top-1 acc 15.234 (12.435)	Top-5 acc 33.203 (29.375)	lr 0.03882
Warmup Train [13][1760/3239]	Time 0.467 (0.516)	Data 0.001 (0.012)	Loss 5.0264 (5.0786)	Top-1 acc 15.234 (12.432)	Top-5 acc 32.422 (29.371)	lr 0.03882
Warmup Train [13][1770/3239]	Time 0.383 (0.516)	Data 0.001 (0.012)	Loss 5.0228 (5.0783)	Top-1 acc 13.672 (12.438)	Top-5 acc 30.078 (29.379)	lr 0.03881
Warmup Train [13][1780/3239]	Time 0.480 (0.516)	Data 0.001 (0.012)	Loss 5.0270 (5.0781)	Top-1 acc 11.328 (12.439)	Top-5 acc 29.297 (29.377)	lr 0.03881
Warmup Train [13][1790/3239]	Time 0.525 (0.516)	Data 0.001 (0.012)	Loss 5.0109 (5.0778)	Top-1 acc 13.281 (12.440)	Top-5 acc 30.859 (29.378)	lr 0.03880
Warmup Train [13][1800/3239]	Time 0.672 (0.516)	Data 0.001 (0.012)	Loss 4.8938 (5.0775)	Top-1 acc 16.406 (12.446)	Top-5 acc 36.328 (29.385)	lr 0.03880
Warmup Train [13][1810/3239]	Time 0.336 (0.516)	Data 0.001 (0.012)	Loss 5.1537 (5.0771)	Top-1 acc 13.281 (12.452)	Top-5 acc 29.688 (29.396)	lr 0.03879
Warmup Train [13][1820/3239]	Time 0.476 (0.516)	Data 0.001 (0.012)	Loss 4.9797 (5.0771)	Top-1 acc 13.281 (12.455)	Top-5 acc 27.734 (29.398)	lr 0.03879
Warmup Train [13][1830/3239]	Time 0.411 (0.516)	Data 0.001 (0.012)	Loss 5.0759 (5.0769)	Top-1 acc 13.672 (12.456)	Top-5 acc 32.031 (29.403)	lr 0.03878
Warmup Train [13][1840/3239]	Time 0.551 (0.516)	Data 0.001 (0.012)	Loss 5.0230 (5.0767)	Top-1 acc 14.453 (12.461)	Top-5 acc 31.641 (29.410)	lr 0.03878
Warmup Train [13][1850/3239]	Time 0.381 (0.516)	Data 0.001 (0.012)	Loss 5.1068 (5.0765)	Top-1 acc 9.766 (12.460)	Top-5 acc 28.516 (29.415)	lr 0.03877
Warmup Train [13][1860/3239]	Time 0.569 (0.516)	Data 0.001 (0.012)	Loss 5.1605 (5.0764)	Top-1 acc 10.938 (12.459)	Top-5 acc 28.906 (29.417)	lr 0.03877
Warmup Train [13][1870/3239]	Time 0.460 (0.516)	Data 0.001 (0.012)	Loss 5.1731 (5.0763)	Top-1 acc 10.156 (12.465)	Top-5 acc 25.391 (29.419)	lr 0.03876
Warmup Train [13][1880/3239]	Time 0.563 (0.516)	Data 0.001 (0.012)	Loss 5.0223 (5.0762)	Top-1 acc 13.281 (12.469)	Top-5 acc 28.906 (29.425)	lr 0.03876
Warmup Train [13][1890/3239]	Time 0.396 (0.516)	Data 0.001 (0.012)	Loss 5.0801 (5.0761)	Top-1 acc 15.234 (12.470)	Top-5 acc 28.125 (29.424)	lr 0.03875
Warmup Train [13][1900/3239]	Time 0.523 (0.516)	Data 0.001 (0.012)	Loss 5.1278 (5.0759)	Top-1 acc 13.672 (12.474)	Top-5 acc 27.344 (29.432)	lr 0.03875
Warmup Train [13][1910/3239]	Time 0.485 (0.516)	Data 0.001 (0.012)	Loss 5.1179 (5.0758)	Top-1 acc 11.719 (12.475)	Top-5 acc 27.734 (29.429)	lr 0.03874
Warmup Train [13][1920/3239]	Time 0.330 (0.516)	Data 0.001 (0.012)	Loss 5.0323 (5.0757)	Top-1 acc 15.234 (12.483)	Top-5 acc 32.031 (29.437)	lr 0.03874
Warmup Train [13][1930/3239]	Time 0.491 (0.516)	Data 0.001 (0.012)	Loss 5.0456 (5.0755)	Top-1 acc 12.500 (12.488)	Top-5 acc 32.031 (29.444)	lr 0.03873
Warmup Train [13][1940/3239]	Time 0.301 (0.516)	Data 0.001 (0.012)	Loss 5.0314 (5.0751)	Top-1 acc 12.891 (12.494)	Top-5 acc 33.203 (29.455)	lr 0.03873
Warmup Train [13][1950/3239]	Time 0.463 (0.516)	Data 0.001 (0.012)	Loss 4.7842 (5.0750)	Top-1 acc 16.406 (12.497)	Top-5 acc 32.812 (29.455)	lr 0.03872
Warmup Train [13][1960/3239]	Time 0.648 (0.516)	Data 0.001 (0.012)	Loss 5.0264 (5.0748)	Top-1 acc 13.281 (12.502)	Top-5 acc 28.516 (29.458)	lr 0.03872
Warmup Train [13][1970/3239]	Time 0.575 (0.517)	Data 0.001 (0.012)	Loss 5.0007 (5.0746)	Top-1 acc 13.672 (12.509)	Top-5 acc 32.812 (29.467)	lr 0.03871
Warmup Train [13][1980/3239]	Time 0.535 (0.517)	Data 0.001 (0.012)	Loss 5.0635 (5.0746)	Top-1 acc 12.109 (12.510)	Top-5 acc 29.688 (29.467)	lr 0.03871
Warmup Train [13][1990/3239]	Time 0.396 (0.516)	Data 0.001 (0.012)	Loss 4.8782 (5.0741)	Top-1 acc 15.625 (12.518)	Top-5 acc 33.984 (29.481)	lr 0.03870
Warmup Train [13][2000/3239]	Time 0.523 (0.516)	Data 0.001 (0.012)	Loss 4.9937 (5.0738)	Top-1 acc 14.062 (12.524)	Top-5 acc 31.641 (29.486)	lr 0.03870
Warmup Train [13][2010/3239]	Time 0.392 (0.516)	Data 0.001 (0.012)	Loss 4.7561 (5.0735)	Top-1 acc 17.969 (12.530)	Top-5 acc 37.500 (29.499)	lr 0.03869
Warmup Train [13][2020/3239]	Time 0.311 (0.516)	Data 0.001 (0.012)	Loss 5.0755 (5.0734)	Top-1 acc 12.109 (12.531)	Top-5 acc 26.562 (29.498)	lr 0.03869
Warmup Train [13][2030/3239]	Time 0.279 (0.516)	Data 0.001 (0.012)	Loss 5.0509 (5.0730)	Top-1 acc 13.281 (12.535)	Top-5 acc 29.688 (29.510)	lr 0.03868
Warmup Train [13][2040/3239]	Time 0.609 (0.516)	Data 0.001 (0.012)	Loss 4.8734 (5.0726)	Top-1 acc 14.844 (12.531)	Top-5 acc 33.984 (29.514)	lr 0.03868
Warmup Train [13][2050/3239]	Time 0.402 (0.516)	Data 0.001 (0.012)	Loss 5.0046 (5.0723)	Top-1 acc 14.453 (12.542)	Top-5 acc 29.297 (29.529)	lr 0.03867
Warmup Train [13][2060/3239]	Time 0.522 (0.516)	Data 0.001 (0.012)	Loss 5.0925 (5.0723)	Top-1 acc 11.719 (12.540)	Top-5 acc 29.688 (29.531)	lr 0.03867
Warmup Train [13][2070/3239]	Time 0.589 (0.516)	Data 0.001 (0.012)	Loss 5.2637 (5.0724)	Top-1 acc 8.203 (12.534)	Top-5 acc 25.781 (29.526)	lr 0.03866
Warmup Train [13][2080/3239]	Time 0.578 (0.516)	Data 0.001 (0.012)	Loss 4.9474 (5.0724)	Top-1 acc 13.672 (12.533)	Top-5 acc 34.766 (29.525)	lr 0.03866
Warmup Train [13][2090/3239]	Time 0.502 (0.516)	Data 0.001 (0.012)	Loss 5.1224 (5.0719)	Top-1 acc 10.156 (12.535)	Top-5 acc 31.641 (29.539)	lr 0.03865
Warmup Train [13][2100/3239]	Time 0.448 (0.516)	Data 0.001 (0.012)	Loss 4.8860 (5.0716)	Top-1 acc 14.062 (12.539)	Top-5 acc 33.594 (29.544)	lr 0.03865
Warmup Train [13][2110/3239]	Time 0.589 (0.516)	Data 0.001 (0.012)	Loss 4.8885 (5.0716)	Top-1 acc 13.672 (12.538)	Top-5 acc 34.375 (29.552)	lr 0.03864
Warmup Train [13][2120/3239]	Time 0.621 (0.516)	Data 0.001 (0.012)	Loss 5.0600 (5.0713)	Top-1 acc 11.328 (12.539)	Top-5 acc 26.953 (29.561)	lr 0.03864
Warmup Train [13][2130/3239]	Time 0.397 (0.516)	Data 0.001 (0.011)	Loss 5.1641 (5.0710)	Top-1 acc 11.719 (12.546)	Top-5 acc 24.609 (29.564)	lr 0.03863
Warmup Train [13][2140/3239]	Time 0.565 (0.516)	Data 0.001 (0.012)	Loss 5.0749 (5.0708)	Top-1 acc 12.500 (12.547)	Top-5 acc 30.859 (29.571)	lr 0.03863
Warmup Train [13][2150/3239]	Time 0.583 (0.516)	Data 0.001 (0.011)	Loss 4.9465 (5.0705)	Top-1 acc 14.844 (12.549)	Top-5 acc 34.375 (29.578)	lr 0.03862
Warmup Train [13][2160/3239]	Time 0.389 (0.516)	Data 0.001 (0.011)	Loss 5.0726 (5.0703)	Top-1 acc 10.156 (12.544)	Top-5 acc 25.000 (29.576)	lr 0.03862
Warmup Train [13][2170/3239]	Time 0.704 (0.516)	Data 0.001 (0.011)	Loss 5.0884 (5.0703)	Top-1 acc 12.109 (12.546)	Top-5 acc 25.781 (29.573)	lr 0.03861
Warmup Train [13][2180/3239]	Time 0.552 (0.516)	Data 0.001 (0.011)	Loss 5.0932 (5.0702)	Top-1 acc 13.672 (12.548)	Top-5 acc 31.641 (29.575)	lr 0.03861
Warmup Train [13][2190/3239]	Time 0.549 (0.516)	Data 0.001 (0.011)	Loss 5.0198 (5.0698)	Top-1 acc 11.719 (12.552)	Top-5 acc 34.375 (29.585)	lr 0.03860
Warmup Train [13][2200/3239]	Time 0.440 (0.516)	Data 0.001 (0.011)	Loss 5.1566 (5.0700)	Top-1 acc 12.891 (12.547)	Top-5 acc 25.781 (29.580)	lr 0.03860
Warmup Train [13][2210/3239]	Time 0.558 (0.516)	Data 0.001 (0.011)	Loss 4.9330 (5.0700)	Top-1 acc 18.359 (12.550)	Top-5 acc 39.453 (29.587)	lr 0.03859
Warmup Train [13][2220/3239]	Time 0.530 (0.516)	Data 0.001 (0.011)	Loss 4.9174 (5.0698)	Top-1 acc 15.234 (12.556)	Top-5 acc 35.156 (29.590)	lr 0.03859
Warmup Train [13][2230/3239]	Time 0.528 (0.516)	Data 0.001 (0.011)	Loss 5.2435 (5.0698)	Top-1 acc 10.156 (12.563)	Top-5 acc 31.641 (29.596)	lr 0.03858
Warmup Train [13][2240/3239]	Time 0.617 (0.516)	Data 0.001 (0.011)	Loss 5.0503 (5.0696)	Top-1 acc 13.281 (12.566)	Top-5 acc 30.078 (29.601)	lr 0.03858
Warmup Train [13][2250/3239]	Time 0.561 (0.516)	Data 0.001 (0.011)	Loss 5.1131 (5.0695)	Top-1 acc 10.938 (12.564)	Top-5 acc 26.172 (29.598)	lr 0.03857
Warmup Train [13][2260/3239]	Time 0.523 (0.516)	Data 0.001 (0.011)	Loss 5.0474 (5.0695)	Top-1 acc 17.578 (12.561)	Top-5 acc 31.641 (29.595)	lr 0.03857
Warmup Train [13][2270/3239]	Time 0.520 (0.516)	Data 0.001 (0.011)	Loss 4.8478 (5.0692)	Top-1 acc 19.531 (12.566)	Top-5 acc 35.547 (29.605)	lr 0.03856
Warmup Train [13][2280/3239]	Time 0.620 (0.516)	Data 0.001 (0.011)	Loss 4.9390 (5.0688)	Top-1 acc 12.109 (12.573)	Top-5 acc 36.328 (29.614)	lr 0.03855
Warmup Train [13][2290/3239]	Time 0.355 (0.516)	Data 0.001 (0.011)	Loss 4.9482 (5.0687)	Top-1 acc 16.797 (12.576)	Top-5 acc 33.984 (29.616)	lr 0.03855
Warmup Train [13][2300/3239]	Time 0.516 (0.516)	Data 0.001 (0.011)	Loss 5.0864 (5.0683)	Top-1 acc 10.547 (12.579)	Top-5 acc 32.031 (29.625)	lr 0.03854
Warmup Train [13][2310/3239]	Time 0.485 (0.515)	Data 0.001 (0.011)	Loss 5.0584 (5.0685)	Top-1 acc 10.938 (12.575)	Top-5 acc 28.125 (29.619)	lr 0.03854
Warmup Train [13][2320/3239]	Time 0.669 (0.515)	Data 0.001 (0.011)	Loss 5.1515 (5.0683)	Top-1 acc 13.672 (12.581)	Top-5 acc 26.953 (29.624)	lr 0.03853
Warmup Train [13][2330/3239]	Time 0.415 (0.515)	Data 0.001 (0.011)	Loss 4.9021 (5.0682)	Top-1 acc 15.234 (12.583)	Top-5 acc 33.594 (29.629)	lr 0.03853
Warmup Train [13][2340/3239]	Time 0.604 (0.515)	Data 0.001 (0.011)	Loss 5.0729 (5.0681)	Top-1 acc 13.281 (12.583)	Top-5 acc 29.688 (29.626)	lr 0.03852
Warmup Train [13][2350/3239]	Time 0.490 (0.515)	Data 0.001 (0.011)	Loss 4.8927 (5.0679)	Top-1 acc 14.453 (12.588)	Top-5 acc 29.688 (29.628)	lr 0.03852
Warmup Train [13][2360/3239]	Time 0.491 (0.515)	Data 0.001 (0.011)	Loss 5.0885 (5.0679)	Top-1 acc 13.672 (12.588)	Top-5 acc 28.516 (29.626)	lr 0.03851
Warmup Train [13][2370/3239]	Time 0.503 (0.515)	Data 0.001 (0.011)	Loss 5.0056 (5.0678)	Top-1 acc 18.750 (12.594)	Top-5 acc 27.734 (29.627)	lr 0.03851
Warmup Train [13][2380/3239]	Time 0.598 (0.515)	Data 0.001 (0.011)	Loss 5.1457 (5.0677)	Top-1 acc 10.547 (12.595)	Top-5 acc 23.828 (29.629)	lr 0.03850
Warmup Train [13][2390/3239]	Time 0.695 (0.515)	Data 0.001 (0.011)	Loss 5.1721 (5.0676)	Top-1 acc 11.719 (12.595)	Top-5 acc 26.953 (29.629)	lr 0.03850
Warmup Train [13][2400/3239]	Time 0.365 (0.515)	Data 0.001 (0.011)	Loss 4.8601 (5.0672)	Top-1 acc 14.844 (12.600)	Top-5 acc 32.031 (29.639)	lr 0.03849
Warmup Train [13][2410/3239]	Time 0.627 (0.515)	Data 0.001 (0.011)	Loss 5.0275 (5.0670)	Top-1 acc 13.672 (12.602)	Top-5 acc 31.250 (29.641)	lr 0.03849
Warmup Train [13][2420/3239]	Time 0.594 (0.515)	Data 0.001 (0.011)	Loss 4.9748 (5.0669)	Top-1 acc 13.672 (12.604)	Top-5 acc 33.203 (29.644)	lr 0.03848
Warmup Train [13][2430/3239]	Time 0.479 (0.515)	Data 0.001 (0.011)	Loss 5.0013 (5.0667)	Top-1 acc 16.797 (12.612)	Top-5 acc 33.203 (29.650)	lr 0.03848
Warmup Train [13][2440/3239]	Time 0.530 (0.515)	Data 0.001 (0.011)	Loss 4.8733 (5.0665)	Top-1 acc 16.406 (12.610)	Top-5 acc 33.594 (29.651)	lr 0.03847
Warmup Train [13][2450/3239]	Time 0.629 (0.515)	Data 0.001 (0.011)	Loss 5.0558 (5.0663)	Top-1 acc 14.453 (12.609)	Top-5 acc 29.688 (29.650)	lr 0.03847
Warmup Train [13][2460/3239]	Time 0.568 (0.515)	Data 0.001 (0.011)	Loss 5.1536 (5.0660)	Top-1 acc 12.109 (12.612)	Top-5 acc 27.344 (29.651)	lr 0.03846
Warmup Train [13][2470/3239]	Time 0.505 (0.515)	Data 0.001 (0.011)	Loss 4.9663 (5.0660)	Top-1 acc 12.500 (12.613)	Top-5 acc 33.594 (29.655)	lr 0.03846
Warmup Train [13][2480/3239]	Time 0.548 (0.515)	Data 0.001 (0.011)	Loss 4.9399 (5.0658)	Top-1 acc 10.938 (12.613)	Top-5 acc 32.422 (29.658)	lr 0.03845
Warmup Train [13][2490/3239]	Time 0.676 (0.515)	Data 0.002 (0.011)	Loss 4.9889 (5.0657)	Top-1 acc 12.500 (12.615)	Top-5 acc 30.078 (29.664)	lr 0.03845
Warmup Train [13][2500/3239]	Time 0.558 (0.515)	Data 0.001 (0.011)	Loss 4.9912 (5.0655)	Top-1 acc 16.016 (12.621)	Top-5 acc 31.250 (29.669)	lr 0.03844
Warmup Train [13][2510/3239]	Time 0.508 (0.515)	Data 0.001 (0.010)	Loss 5.0500 (5.0652)	Top-1 acc 11.719 (12.624)	Top-5 acc 32.422 (29.681)	lr 0.03844
Warmup Train [13][2520/3239]	Time 0.476 (0.515)	Data 0.001 (0.010)	Loss 5.0171 (5.0650)	Top-1 acc 13.281 (12.628)	Top-5 acc 28.906 (29.685)	lr 0.03843
Warmup Train [13][2530/3239]	Time 0.470 (0.515)	Data 0.001 (0.010)	Loss 4.9775 (5.0649)	Top-1 acc 12.891 (12.630)	Top-5 acc 29.688 (29.684)	lr 0.03843
Warmup Train [13][2540/3239]	Time 0.555 (0.515)	Data 0.001 (0.010)	Loss 5.0064 (5.0647)	Top-1 acc 13.672 (12.637)	Top-5 acc 30.859 (29.693)	lr 0.03842
Warmup Train [13][2550/3239]	Time 0.384 (0.515)	Data 0.002 (0.010)	Loss 4.9727 (5.0644)	Top-1 acc 13.672 (12.637)	Top-5 acc 32.031 (29.699)	lr 0.03842
Warmup Train [13][2560/3239]	Time 0.536 (0.515)	Data 0.001 (0.010)	Loss 4.9438 (5.0645)	Top-1 acc 15.234 (12.640)	Top-5 acc 35.156 (29.704)	lr 0.03841
Warmup Train [13][2570/3239]	Time 0.601 (0.515)	Data 0.001 (0.010)	Loss 5.1823 (5.0645)	Top-1 acc 12.109 (12.642)	Top-5 acc 27.734 (29.701)	lr 0.03841
Warmup Train [13][2580/3239]	Time 0.384 (0.515)	Data 0.020 (0.010)	Loss 4.9098 (5.0643)	Top-1 acc 13.281 (12.644)	Top-5 acc 31.250 (29.706)	lr 0.03840
Warmup Train [13][2590/3239]	Time 0.749 (0.515)	Data 0.001 (0.010)	Loss 5.0531 (5.0643)	Top-1 acc 12.891 (12.641)	Top-5 acc 30.469 (29.706)	lr 0.03840
Warmup Train [13][2600/3239]	Time 0.507 (0.515)	Data 0.001 (0.010)	Loss 5.0946 (5.0640)	Top-1 acc 11.719 (12.646)	Top-5 acc 26.953 (29.710)	lr 0.03839
Warmup Train [13][2610/3239]	Time 0.440 (0.515)	Data 0.001 (0.010)	Loss 4.9517 (5.0638)	Top-1 acc 15.234 (12.647)	Top-5 acc 31.641 (29.713)	lr 0.03839
Warmup Train [13][2620/3239]	Time 0.569 (0.515)	Data 0.001 (0.010)	Loss 5.1939 (5.0638)	Top-1 acc 12.500 (12.650)	Top-5 acc 25.000 (29.713)	lr 0.03838
Warmup Train [13][2630/3239]	Time 0.590 (0.515)	Data 0.001 (0.010)	Loss 5.0015 (5.0636)	Top-1 acc 16.406 (12.653)	Top-5 acc 35.156 (29.719)	lr 0.03838
Warmup Train [13][2640/3239]	Time 0.558 (0.515)	Data 0.001 (0.010)	Loss 5.0627 (5.0635)	Top-1 acc 12.109 (12.658)	Top-5 acc 33.203 (29.728)	lr 0.03837
Warmup Train [13][2650/3239]	Time 0.515 (0.515)	Data 0.001 (0.010)	Loss 4.8318 (5.0633)	Top-1 acc 13.672 (12.660)	Top-5 acc 33.984 (29.730)	lr 0.03837
Warmup Train [13][2660/3239]	Time 0.518 (0.515)	Data 0.001 (0.010)	Loss 5.1790 (5.0631)	Top-1 acc 10.938 (12.664)	Top-5 acc 30.469 (29.736)	lr 0.03836
Warmup Train [13][2670/3239]	Time 0.572 (0.515)	Data 0.001 (0.010)	Loss 4.9763 (5.0629)	Top-1 acc 11.719 (12.665)	Top-5 acc 30.078 (29.739)	lr 0.03836
Warmup Train [13][2680/3239]	Time 0.495 (0.515)	Data 0.001 (0.010)	Loss 4.9691 (5.0628)	Top-1 acc 15.625 (12.664)	Top-5 acc 35.156 (29.740)	lr 0.03835
Warmup Train [13][2690/3239]	Time 0.614 (0.515)	Data 0.001 (0.010)	Loss 5.0804 (5.0627)	Top-1 acc 10.938 (12.665)	Top-5 acc 28.125 (29.738)	lr 0.03835
Warmup Train [13][2700/3239]	Time 0.589 (0.515)	Data 0.001 (0.010)	Loss 4.9514 (5.0626)	Top-1 acc 12.891 (12.669)	Top-5 acc 32.031 (29.744)	lr 0.03834
Warmup Train [13][2710/3239]	Time 0.487 (0.515)	Data 0.001 (0.010)	Loss 4.8704 (5.0624)	Top-1 acc 15.234 (12.667)	Top-5 acc 30.469 (29.747)	lr 0.03834
Warmup Train [13][2720/3239]	Time 0.501 (0.515)	Data 0.001 (0.010)	Loss 5.1402 (5.0623)	Top-1 acc 12.891 (12.666)	Top-5 acc 29.688 (29.748)	lr 0.03833
Warmup Train [13][2730/3239]	Time 0.527 (0.515)	Data 0.001 (0.010)	Loss 5.1220 (5.0623)	Top-1 acc 10.156 (12.665)	Top-5 acc 30.469 (29.749)	lr 0.03832
Warmup Train [13][2740/3239]	Time 0.525 (0.515)	Data 0.002 (0.010)	Loss 5.2115 (5.0621)	Top-1 acc 11.328 (12.667)	Top-5 acc 24.609 (29.754)	lr 0.03832
Warmup Train [13][2750/3239]	Time 0.486 (0.515)	Data 0.001 (0.010)	Loss 5.1594 (5.0619)	Top-1 acc 11.719 (12.671)	Top-5 acc 22.656 (29.757)	lr 0.03831
Warmup Train [13][2760/3239]	Time 0.451 (0.515)	Data 0.001 (0.010)	Loss 4.9888 (5.0617)	Top-1 acc 16.797 (12.678)	Top-5 acc 28.906 (29.763)	lr 0.03831
Warmup Train [13][2770/3239]	Time 0.439 (0.515)	Data 0.001 (0.010)	Loss 4.9236 (5.0613)	Top-1 acc 17.188 (12.684)	Top-5 acc 32.812 (29.773)	lr 0.03830
Warmup Train [13][2780/3239]	Time 0.488 (0.515)	Data 0.001 (0.010)	Loss 5.1772 (5.0611)	Top-1 acc 9.375 (12.685)	Top-5 acc 29.297 (29.776)	lr 0.03830
Warmup Train [13][2790/3239]	Time 0.464 (0.515)	Data 0.001 (0.010)	Loss 5.0408 (5.0610)	Top-1 acc 14.062 (12.689)	Top-5 acc 33.594 (29.781)	lr 0.03829
Warmup Train [13][2800/3239]	Time 0.698 (0.515)	Data 0.001 (0.010)	Loss 5.0064 (5.0609)	Top-1 acc 13.672 (12.693)	Top-5 acc 28.906 (29.785)	lr 0.03829
Warmup Train [13][2810/3239]	Time 0.377 (0.515)	Data 0.001 (0.010)	Loss 5.2488 (5.0607)	Top-1 acc 13.281 (12.692)	Top-5 acc 26.562 (29.787)	lr 0.03828
Warmup Train [13][2820/3239]	Time 0.382 (0.515)	Data 0.001 (0.010)	Loss 4.9065 (5.0603)	Top-1 acc 16.016 (12.696)	Top-5 acc 33.594 (29.797)	lr 0.03828
Warmup Train [13][2830/3239]	Time 0.548 (0.515)	Data 0.001 (0.010)	Loss 5.0072 (5.0602)	Top-1 acc 14.844 (12.701)	Top-5 acc 32.031 (29.802)	lr 0.03827
Warmup Train [13][2840/3239]	Time 0.538 (0.515)	Data 0.001 (0.010)	Loss 5.0300 (5.0600)	Top-1 acc 14.062 (12.703)	Top-5 acc 30.078 (29.807)	lr 0.03827
Warmup Train [13][2850/3239]	Time 0.480 (0.515)	Data 0.001 (0.010)	Loss 4.9578 (5.0599)	Top-1 acc 15.234 (12.705)	Top-5 acc 31.250 (29.807)	lr 0.03826
Warmup Train [13][2860/3239]	Time 0.500 (0.515)	Data 0.001 (0.010)	Loss 5.0046 (5.0599)	Top-1 acc 14.453 (12.707)	Top-5 acc 28.906 (29.809)	lr 0.03826
Warmup Train [13][2870/3239]	Time 0.536 (0.514)	Data 0.001 (0.010)	Loss 5.1388 (5.0597)	Top-1 acc 10.547 (12.707)	Top-5 acc 27.734 (29.805)	lr 0.03825
Warmup Train [13][2880/3239]	Time 0.556 (0.514)	Data 0.001 (0.010)	Loss 4.9778 (5.0595)	Top-1 acc 11.328 (12.709)	Top-5 acc 28.906 (29.808)	lr 0.03825
Warmup Train [13][2890/3239]	Time 0.453 (0.514)	Data 0.001 (0.010)	Loss 4.9004 (5.0593)	Top-1 acc 14.844 (12.712)	Top-5 acc 33.203 (29.813)	lr 0.03824
Warmup Train [13][2900/3239]	Time 0.672 (0.515)	Data 0.001 (0.010)	Loss 4.9622 (5.0592)	Top-1 acc 11.328 (12.714)	Top-5 acc 32.812 (29.817)	lr 0.03824
Warmup Train [13][2910/3239]	Time 0.598 (0.515)	Data 0.001 (0.010)	Loss 5.1229 (5.0591)	Top-1 acc 14.844 (12.715)	Top-5 acc 32.422 (29.818)	lr 0.03823
Warmup Train [13][2920/3239]	Time 0.646 (0.515)	Data 0.001 (0.010)	Loss 4.9739 (5.0590)	Top-1 acc 12.109 (12.717)	Top-5 acc 28.516 (29.821)	lr 0.03823
Warmup Train [13][2930/3239]	Time 0.418 (0.515)	Data 0.001 (0.010)	Loss 4.9593 (5.0588)	Top-1 acc 15.234 (12.721)	Top-5 acc 29.297 (29.828)	lr 0.03822
Warmup Train [13][2940/3239]	Time 0.298 (0.514)	Data 0.001 (0.010)	Loss 5.0410 (5.0585)	Top-1 acc 14.453 (12.728)	Top-5 acc 30.469 (29.836)	lr 0.03822
Warmup Train [13][2950/3239]	Time 0.628 (0.514)	Data 0.001 (0.010)	Loss 4.9490 (5.0582)	Top-1 acc 14.844 (12.733)	Top-5 acc 31.250 (29.844)	lr 0.03821
Warmup Train [13][2960/3239]	Time 0.565 (0.514)	Data 0.001 (0.010)	Loss 4.7794 (5.0580)	Top-1 acc 17.188 (12.734)	Top-5 acc 37.500 (29.850)	lr 0.03821
Warmup Train [13][2970/3239]	Time 0.554 (0.514)	Data 0.001 (0.010)	Loss 5.0427 (5.0579)	Top-1 acc 14.844 (12.736)	Top-5 acc 33.203 (29.853)	lr 0.03820
Warmup Train [13][2980/3239]	Time 0.505 (0.514)	Data 0.002 (0.010)	Loss 4.9243 (5.0579)	Top-1 acc 14.453 (12.737)	Top-5 acc 32.031 (29.854)	lr 0.03820
Warmup Train [13][2990/3239]	Time 0.411 (0.514)	Data 0.001 (0.010)	Loss 5.0942 (5.0580)	Top-1 acc 12.891 (12.736)	Top-5 acc 27.734 (29.855)	lr 0.03819
Warmup Train [13][3000/3239]	Time 0.502 (0.514)	Data 0.001 (0.010)	Loss 4.9419 (5.0581)	Top-1 acc 13.672 (12.734)	Top-5 acc 31.641 (29.848)	lr 0.03819
Warmup Train [13][3010/3239]	Time 0.490 (0.514)	Data 0.001 (0.010)	Loss 5.1510 (5.0578)	Top-1 acc 11.719 (12.734)	Top-5 acc 26.953 (29.851)	lr 0.03818
Warmup Train [13][3020/3239]	Time 0.658 (0.514)	Data 0.001 (0.010)	Loss 5.0445 (5.0577)	Top-1 acc 15.234 (12.736)	Top-5 acc 32.812 (29.856)	lr 0.03818
Warmup Train [13][3030/3239]	Time 0.527 (0.514)	Data 0.001 (0.010)	Loss 5.0485 (5.0575)	Top-1 acc 13.672 (12.740)	Top-5 acc 28.516 (29.860)	lr 0.03817
Warmup Train [13][3040/3239]	Time 0.689 (0.514)	Data 0.001 (0.010)	Loss 4.9966 (5.0574)	Top-1 acc 16.016 (12.741)	Top-5 acc 32.031 (29.860)	lr 0.03817
Warmup Train [13][3050/3239]	Time 0.399 (0.514)	Data 0.001 (0.010)	Loss 4.7973 (5.0572)	Top-1 acc 15.234 (12.747)	Top-5 acc 36.719 (29.868)	lr 0.03816
Warmup Train [13][3060/3239]	Time 0.355 (0.514)	Data 0.001 (0.010)	Loss 4.9011 (5.0570)	Top-1 acc 16.406 (12.750)	Top-5 acc 31.250 (29.869)	lr 0.03816
Warmup Train [13][3070/3239]	Time 0.525 (0.514)	Data 0.001 (0.010)	Loss 5.1253 (5.0569)	Top-1 acc 10.938 (12.748)	Top-5 acc 27.344 (29.872)	lr 0.03815
Warmup Train [13][3080/3239]	Time 0.407 (0.514)	Data 0.001 (0.010)	Loss 5.0703 (5.0568)	Top-1 acc 11.328 (12.753)	Top-5 acc 26.172 (29.878)	lr 0.03815
Warmup Train [13][3090/3239]	Time 0.406 (0.514)	Data 0.001 (0.010)	Loss 5.2553 (5.0567)	Top-1 acc 7.422 (12.752)	Top-5 acc 25.391 (29.878)	lr 0.03814
Warmup Train [13][3100/3239]	Time 0.517 (0.514)	Data 0.027 (0.010)	Loss 4.8302 (5.0566)	Top-1 acc 18.359 (12.758)	Top-5 acc 39.062 (29.882)	lr 0.03813
Warmup Train [13][3110/3239]	Time 0.664 (0.514)	Data 0.001 (0.010)	Loss 5.0416 (5.0564)	Top-1 acc 14.453 (12.760)	Top-5 acc 30.078 (29.887)	lr 0.03813
Warmup Train [13][3120/3239]	Time 0.531 (0.514)	Data 0.001 (0.010)	Loss 5.0612 (5.0563)	Top-1 acc 12.891 (12.765)	Top-5 acc 31.250 (29.891)	lr 0.03812
Warmup Train [13][3130/3239]	Time 0.501 (0.514)	Data 0.001 (0.010)	Loss 5.1236 (5.0561)	Top-1 acc 14.062 (12.767)	Top-5 acc 27.344 (29.894)	lr 0.03812
Warmup Train [13][3140/3239]	Time 0.375 (0.514)	Data 0.001 (0.010)	Loss 5.0470 (5.0562)	Top-1 acc 12.109 (12.766)	Top-5 acc 28.516 (29.890)	lr 0.03811
Warmup Train [13][3150/3239]	Time 0.500 (0.514)	Data 0.001 (0.010)	Loss 5.1364 (5.0561)	Top-1 acc 9.375 (12.767)	Top-5 acc 27.344 (29.893)	lr 0.03811
Warmup Train [13][3160/3239]	Time 0.552 (0.514)	Data 0.001 (0.009)	Loss 5.0465 (5.0559)	Top-1 acc 10.547 (12.768)	Top-5 acc 30.078 (29.896)	lr 0.03810
Warmup Train [13][3170/3239]	Time 0.492 (0.514)	Data 0.001 (0.009)	Loss 4.9229 (5.0557)	Top-1 acc 17.188 (12.770)	Top-5 acc 33.594 (29.899)	lr 0.03810
Warmup Train [13][3180/3239]	Time 0.491 (0.514)	Data 0.000 (0.009)	Loss 4.8414 (5.0554)	Top-1 acc 15.625 (12.775)	Top-5 acc 33.594 (29.907)	lr 0.03809
Warmup Train [13][3190/3239]	Time 0.319 (0.514)	Data 0.000 (0.009)	Loss 4.8692 (5.0553)	Top-1 acc 14.844 (12.782)	Top-5 acc 33.594 (29.913)	lr 0.03809
Warmup Train [13][3200/3239]	Time 0.532 (0.514)	Data 0.000 (0.009)	Loss 4.9835 (5.0552)	Top-1 acc 16.797 (12.782)	Top-5 acc 32.422 (29.916)	lr 0.03808
Warmup Train [13][3210/3239]	Time 0.346 (0.514)	Data 0.000 (0.009)	Loss 4.9380 (5.0550)	Top-1 acc 16.406 (12.786)	Top-5 acc 34.766 (29.922)	lr 0.03808
Warmup Train [13][3220/3239]	Time 0.532 (0.514)	Data 0.000 (0.009)	Loss 4.9479 (5.0549)	Top-1 acc 13.672 (12.785)	Top-5 acc 29.688 (29.925)	lr 0.03807
Warmup Train [13][3230/3239]	Time 0.407 (0.514)	Data 0.000 (0.009)	Loss 5.1945 (5.0547)	Top-1 acc 13.672 (12.789)	Top-5 acc 30.078 (29.933)	lr 0.03807
Warmup Train [13][3239/3239]	Time 0.338 (0.513)	Data 0.000 (0.009)	Loss 4.9060 (5.0545)	Top-1 acc 12.346 (12.792)	Top-5 acc 35.802 (29.938)	lr 0.03806
==========Warmup Valid [13/40]	loss 4.203	top-1 acc 18.490	top-5 acc 39.395	Train top-1 12.792	top-5 29.938	flops: 442.4M
Warmup Train [14][0/3239]	Time 12.610 (12.610)	Data 11.239 (11.239)	Loss 5.2142 (5.2142)	Top-1 acc 13.281 (13.281)	Top-5 acc 28.906 (28.906)	lr 0.03806
Warmup Train [14][10/3239]	Time 0.572 (1.756)	Data 0.001 (1.128)	Loss 5.0730 (5.0056)	Top-1 acc 10.938 (14.205)	Top-5 acc 32.031 (31.143)	lr 0.03806
Warmup Train [14][20/3239]	Time 0.513 (1.142)	Data 0.001 (0.592)	Loss 5.0206 (4.9894)	Top-1 acc 18.359 (14.416)	Top-5 acc 35.156 (31.957)	lr 0.03805
Warmup Train [14][30/3239]	Time 0.530 (0.915)	Data 0.001 (0.401)	Loss 4.8702 (4.9876)	Top-1 acc 14.453 (14.100)	Top-5 acc 37.891 (31.653)	lr 0.03805
Warmup Train [14][40/3239]	Time 0.520 (0.820)	Data 0.001 (0.304)	Loss 5.0536 (4.9810)	Top-1 acc 12.500 (14.005)	Top-5 acc 30.469 (31.812)	lr 0.03804
Warmup Train [14][50/3239]	Time 0.612 (0.759)	Data 0.001 (0.245)	Loss 5.0713 (4.9924)	Top-1 acc 13.672 (13.863)	Top-5 acc 25.781 (31.419)	lr 0.03804
Warmup Train [14][60/3239]	Time 0.484 (0.717)	Data 0.001 (0.205)	Loss 5.0638 (4.9893)	Top-1 acc 13.672 (13.922)	Top-5 acc 27.734 (31.397)	lr 0.03803
Warmup Train [14][70/3239]	Time 0.509 (0.689)	Data 0.001 (0.177)	Loss 5.0518 (4.9804)	Top-1 acc 15.234 (14.029)	Top-5 acc 28.906 (31.613)	lr 0.03803
Warmup Train [14][80/3239]	Time 0.515 (0.669)	Data 0.001 (0.156)	Loss 5.0861 (4.9799)	Top-1 acc 12.109 (14.029)	Top-5 acc 30.078 (31.737)	lr 0.03802
Warmup Train [14][90/3239]	Time 0.572 (0.651)	Data 0.001 (0.139)	Loss 5.0447 (4.9787)	Top-1 acc 15.234 (14.127)	Top-5 acc 30.469 (31.739)	lr 0.03802
Warmup Train [14][100/3239]	Time 0.527 (0.637)	Data 0.001 (0.126)	Loss 4.9949 (4.9802)	Top-1 acc 12.500 (14.001)	Top-5 acc 30.859 (31.679)	lr 0.03801
Warmup Train [14][110/3239]	Time 0.520 (0.625)	Data 0.001 (0.115)	Loss 5.0883 (4.9831)	Top-1 acc 12.109 (13.922)	Top-5 acc 28.516 (31.627)	lr 0.03801
Warmup Train [14][120/3239]	Time 0.551 (0.618)	Data 0.001 (0.106)	Loss 5.0000 (4.9862)	Top-1 acc 14.062 (13.898)	Top-5 acc 33.203 (31.573)	lr 0.03800
Warmup Train [14][130/3239]	Time 0.378 (0.607)	Data 0.001 (0.098)	Loss 4.9819 (4.9891)	Top-1 acc 16.016 (13.809)	Top-5 acc 31.250 (31.515)	lr 0.03800
Warmup Train [14][140/3239]	Time 0.320 (0.600)	Data 0.001 (0.092)	Loss 5.0692 (4.9895)	Top-1 acc 13.672 (13.838)	Top-5 acc 30.078 (31.483)	lr 0.03799
Warmup Train [14][150/3239]	Time 0.676 (0.596)	Data 0.001 (0.087)	Loss 4.9934 (4.9905)	Top-1 acc 12.109 (13.749)	Top-5 acc 30.078 (31.395)	lr 0.03798
Warmup Train [14][160/3239]	Time 0.482 (0.590)	Data 0.001 (0.082)	Loss 4.9516 (4.9904)	Top-1 acc 13.672 (13.742)	Top-5 acc 32.812 (31.422)	lr 0.03798
Warmup Train [14][170/3239]	Time 0.521 (0.586)	Data 0.002 (0.077)	Loss 4.9740 (4.9926)	Top-1 acc 12.891 (13.699)	Top-5 acc 30.078 (31.351)	lr 0.03797
Warmup Train [14][180/3239]	Time 0.514 (0.583)	Data 0.001 (0.073)	Loss 4.9233 (4.9947)	Top-1 acc 13.672 (13.691)	Top-5 acc 32.031 (31.297)	lr 0.03797
Warmup Train [14][190/3239]	Time 0.469 (0.580)	Data 0.001 (0.069)	Loss 5.0041 (4.9957)	Top-1 acc 13.672 (13.684)	Top-5 acc 32.812 (31.313)	lr 0.03796
Warmup Train [14][200/3239]	Time 0.477 (0.577)	Data 0.001 (0.066)	Loss 4.8038 (4.9924)	Top-1 acc 16.016 (13.724)	Top-5 acc 35.938 (31.359)	lr 0.03796
Warmup Train [14][210/3239]	Time 0.511 (0.574)	Data 0.001 (0.063)	Loss 4.9352 (4.9900)	Top-1 acc 14.453 (13.714)	Top-5 acc 30.859 (31.376)	lr 0.03795
Warmup Train [14][220/3239]	Time 0.552 (0.572)	Data 0.001 (0.061)	Loss 5.0808 (4.9895)	Top-1 acc 11.328 (13.727)	Top-5 acc 30.469 (31.404)	lr 0.03795
Warmup Train [14][230/3239]	Time 0.698 (0.571)	Data 0.001 (0.058)	Loss 5.0178 (4.9895)	Top-1 acc 14.453 (13.704)	Top-5 acc 32.812 (31.444)	lr 0.03794
Warmup Train [14][240/3239]	Time 0.621 (0.568)	Data 0.001 (0.056)	Loss 5.0145 (4.9898)	Top-1 acc 12.500 (13.677)	Top-5 acc 33.203 (31.430)	lr 0.03794
Warmup Train [14][250/3239]	Time 0.362 (0.565)	Data 0.001 (0.054)	Loss 4.9026 (4.9876)	Top-1 acc 10.938 (13.703)	Top-5 acc 32.812 (31.510)	lr 0.03793
Warmup Train [14][260/3239]	Time 0.388 (0.562)	Data 0.001 (0.052)	Loss 5.0729 (4.9865)	Top-1 acc 11.328 (13.721)	Top-5 acc 26.172 (31.546)	lr 0.03793
Warmup Train [14][270/3239]	Time 0.601 (0.561)	Data 0.001 (0.051)	Loss 5.0225 (4.9862)	Top-1 acc 14.453 (13.730)	Top-5 acc 31.250 (31.556)	lr 0.03792
Warmup Train [14][280/3239]	Time 0.318 (0.558)	Data 0.001 (0.049)	Loss 4.8163 (4.9869)	Top-1 acc 17.969 (13.684)	Top-5 acc 35.938 (31.485)	lr 0.03792
Warmup Train [14][290/3239]	Time 0.575 (0.555)	Data 0.002 (0.048)	Loss 4.9758 (4.9868)	Top-1 acc 14.062 (13.665)	Top-5 acc 30.469 (31.450)	lr 0.03791
Warmup Train [14][300/3239]	Time 0.623 (0.552)	Data 0.001 (0.046)	Loss 4.9396 (4.9887)	Top-1 acc 12.500 (13.641)	Top-5 acc 31.641 (31.391)	lr 0.03791
Warmup Train [14][310/3239]	Time 0.423 (0.549)	Data 0.001 (0.045)	Loss 4.9269 (4.9894)	Top-1 acc 12.891 (13.645)	Top-5 acc 32.812 (31.376)	lr 0.03790
Warmup Train [14][320/3239]	Time 0.474 (0.548)	Data 0.001 (0.044)	Loss 5.1870 (4.9885)	Top-1 acc 8.984 (13.645)	Top-5 acc 25.391 (31.394)	lr 0.03790
Warmup Train [14][330/3239]	Time 0.520 (0.547)	Data 0.001 (0.043)	Loss 4.9511 (4.9877)	Top-1 acc 13.672 (13.674)	Top-5 acc 34.375 (31.440)	lr 0.03789
Warmup Train [14][340/3239]	Time 0.534 (0.547)	Data 0.001 (0.042)	Loss 4.7813 (4.9879)	Top-1 acc 17.969 (13.684)	Top-5 acc 34.766 (31.428)	lr 0.03789
Warmup Train [14][350/3239]	Time 0.554 (0.545)	Data 0.001 (0.041)	Loss 5.0906 (4.9883)	Top-1 acc 11.719 (13.701)	Top-5 acc 28.516 (31.459)	lr 0.03788
Warmup Train [14][360/3239]	Time 0.601 (0.545)	Data 0.001 (0.040)	Loss 4.9166 (4.9883)	Top-1 acc 14.062 (13.692)	Top-5 acc 32.812 (31.474)	lr 0.03788
Warmup Train [14][370/3239]	Time 0.507 (0.544)	Data 0.001 (0.039)	Loss 5.0896 (4.9886)	Top-1 acc 11.719 (13.716)	Top-5 acc 27.734 (31.441)	lr 0.03787
Warmup Train [14][380/3239]	Time 0.408 (0.543)	Data 0.001 (0.038)	Loss 4.9232 (4.9870)	Top-1 acc 16.016 (13.757)	Top-5 acc 32.812 (31.496)	lr 0.03787
Warmup Train [14][390/3239]	Time 0.343 (0.542)	Data 0.001 (0.037)	Loss 4.9995 (4.9860)	Top-1 acc 10.156 (13.766)	Top-5 acc 29.688 (31.509)	lr 0.03786
Warmup Train [14][400/3239]	Time 0.545 (0.542)	Data 0.001 (0.037)	Loss 4.9854 (4.9850)	Top-1 acc 13.672 (13.793)	Top-5 acc 30.078 (31.528)	lr 0.03786
Warmup Train [14][410/3239]	Time 0.577 (0.542)	Data 0.001 (0.036)	Loss 5.0769 (4.9849)	Top-1 acc 13.672 (13.783)	Top-5 acc 27.734 (31.506)	lr 0.03785
Warmup Train [14][420/3239]	Time 0.586 (0.541)	Data 0.001 (0.035)	Loss 5.0439 (4.9847)	Top-1 acc 15.625 (13.792)	Top-5 acc 31.250 (31.530)	lr 0.03784
Warmup Train [14][430/3239]	Time 0.552 (0.541)	Data 0.001 (0.035)	Loss 5.0331 (4.9854)	Top-1 acc 13.672 (13.789)	Top-5 acc 32.812 (31.539)	lr 0.03784
Warmup Train [14][440/3239]	Time 0.460 (0.540)	Data 0.001 (0.034)	Loss 5.0754 (4.9865)	Top-1 acc 9.766 (13.766)	Top-5 acc 30.078 (31.499)	lr 0.03783
Warmup Train [14][450/3239]	Time 0.609 (0.540)	Data 0.001 (0.033)	Loss 5.0772 (4.9867)	Top-1 acc 13.281 (13.745)	Top-5 acc 28.516 (31.484)	lr 0.03783
Warmup Train [14][460/3239]	Time 0.429 (0.538)	Data 0.001 (0.033)	Loss 5.0527 (4.9874)	Top-1 acc 10.156 (13.725)	Top-5 acc 30.859 (31.465)	lr 0.03782
Warmup Train [14][470/3239]	Time 0.488 (0.538)	Data 0.001 (0.032)	Loss 4.9106 (4.9872)	Top-1 acc 13.281 (13.725)	Top-5 acc 36.719 (31.487)	lr 0.03782
Warmup Train [14][480/3239]	Time 0.397 (0.537)	Data 0.001 (0.032)	Loss 4.8609 (4.9875)	Top-1 acc 16.406 (13.735)	Top-5 acc 33.984 (31.496)	lr 0.03781
Warmup Train [14][490/3239]	Time 0.388 (0.537)	Data 0.001 (0.031)	Loss 4.9920 (4.9870)	Top-1 acc 16.016 (13.756)	Top-5 acc 32.422 (31.509)	lr 0.03781
Warmup Train [14][500/3239]	Time 0.369 (0.536)	Data 0.001 (0.031)	Loss 5.0880 (4.9874)	Top-1 acc 8.984 (13.737)	Top-5 acc 31.250 (31.507)	lr 0.03780
Warmup Train [14][510/3239]	Time 0.607 (0.536)	Data 0.001 (0.030)	Loss 5.0744 (4.9880)	Top-1 acc 13.672 (13.725)	Top-5 acc 30.469 (31.498)	lr 0.03780
Warmup Train [14][520/3239]	Time 0.551 (0.536)	Data 0.002 (0.030)	Loss 5.0621 (4.9892)	Top-1 acc 13.672 (13.709)	Top-5 acc 30.078 (31.470)	lr 0.03779
Warmup Train [14][530/3239]	Time 0.628 (0.535)	Data 0.001 (0.029)	Loss 4.8213 (4.9886)	Top-1 acc 14.062 (13.707)	Top-5 acc 36.328 (31.481)	lr 0.03779
Warmup Train [14][540/3239]	Time 0.410 (0.534)	Data 0.001 (0.029)	Loss 5.0462 (4.9885)	Top-1 acc 14.844 (13.730)	Top-5 acc 29.297 (31.497)	lr 0.03778
Warmup Train [14][550/3239]	Time 0.410 (0.534)	Data 0.002 (0.029)	Loss 5.1096 (4.9890)	Top-1 acc 11.328 (13.724)	Top-5 acc 29.688 (31.503)	lr 0.03778
Warmup Train [14][560/3239]	Time 0.318 (0.532)	Data 0.001 (0.028)	Loss 5.1008 (4.9893)	Top-1 acc 9.766 (13.720)	Top-5 acc 30.469 (31.492)	lr 0.03777
Warmup Train [14][570/3239]	Time 0.520 (0.532)	Data 0.001 (0.028)	Loss 5.0746 (4.9884)	Top-1 acc 11.719 (13.733)	Top-5 acc 31.641 (31.512)	lr 0.03777
Warmup Train [14][580/3239]	Time 0.509 (0.531)	Data 0.001 (0.028)	Loss 5.1110 (4.9885)	Top-1 acc 11.719 (13.726)	Top-5 acc 28.516 (31.514)	lr 0.03776
Warmup Train [14][590/3239]	Time 0.683 (0.529)	Data 0.001 (0.027)	Loss 5.1399 (4.9879)	Top-1 acc 10.547 (13.731)	Top-5 acc 25.000 (31.501)	lr 0.03776
Warmup Train [14][600/3239]	Time 0.311 (0.529)	Data 0.002 (0.027)	Loss 5.0242 (4.9873)	Top-1 acc 13.281 (13.732)	Top-5 acc 32.422 (31.518)	lr 0.03775
Warmup Train [14][610/3239]	Time 0.470 (0.529)	Data 0.001 (0.027)	Loss 4.9592 (4.9869)	Top-1 acc 13.672 (13.742)	Top-5 acc 31.641 (31.517)	lr 0.03775
Warmup Train [14][620/3239]	Time 0.514 (0.529)	Data 0.001 (0.026)	Loss 5.1000 (4.9860)	Top-1 acc 12.109 (13.762)	Top-5 acc 24.219 (31.529)	lr 0.03774
Warmup Train [14][630/3239]	Time 0.455 (0.528)	Data 0.001 (0.026)	Loss 4.9710 (4.9864)	Top-1 acc 14.453 (13.761)	Top-5 acc 30.859 (31.533)	lr 0.03774
Warmup Train [14][640/3239]	Time 0.629 (0.528)	Data 0.001 (0.026)	Loss 5.1466 (4.9861)	Top-1 acc 14.453 (13.767)	Top-5 acc 28.906 (31.547)	lr 0.03773
Warmup Train [14][650/3239]	Time 0.384 (0.528)	Data 0.001 (0.025)	Loss 5.0168 (4.9861)	Top-1 acc 14.453 (13.763)	Top-5 acc 32.422 (31.554)	lr 0.03772
Warmup Train [14][660/3239]	Time 0.423 (0.527)	Data 0.001 (0.025)	Loss 4.9434 (4.9866)	Top-1 acc 11.328 (13.762)	Top-5 acc 30.469 (31.548)	lr 0.03772
Warmup Train [14][670/3239]	Time 0.580 (0.527)	Data 0.001 (0.025)	Loss 4.8220 (4.9866)	Top-1 acc 17.969 (13.773)	Top-5 acc 35.547 (31.552)	lr 0.03771
Warmup Train [14][680/3239]	Time 0.456 (0.527)	Data 0.001 (0.024)	Loss 4.9206 (4.9867)	Top-1 acc 14.453 (13.774)	Top-5 acc 34.766 (31.548)	lr 0.03771
Warmup Train [14][690/3239]	Time 0.542 (0.527)	Data 0.001 (0.024)	Loss 4.9619 (4.9858)	Top-1 acc 13.672 (13.796)	Top-5 acc 35.938 (31.575)	lr 0.03770
Warmup Train [14][700/3239]	Time 0.622 (0.527)	Data 0.001 (0.024)	Loss 5.0086 (4.9854)	Top-1 acc 10.938 (13.781)	Top-5 acc 32.031 (31.581)	lr 0.03770
Warmup Train [14][710/3239]	Time 0.543 (0.527)	Data 0.002 (0.024)	Loss 4.9810 (4.9850)	Top-1 acc 12.109 (13.787)	Top-5 acc 30.469 (31.599)	lr 0.03769
Warmup Train [14][720/3239]	Time 0.425 (0.526)	Data 0.001 (0.023)	Loss 5.0300 (4.9847)	Top-1 acc 13.672 (13.779)	Top-5 acc 32.031 (31.601)	lr 0.03769
Warmup Train [14][730/3239]	Time 0.592 (0.526)	Data 0.001 (0.023)	Loss 4.8898 (4.9844)	Top-1 acc 11.328 (13.775)	Top-5 acc 33.984 (31.602)	lr 0.03768
Warmup Train [14][740/3239]	Time 0.520 (0.526)	Data 0.001 (0.023)	Loss 4.9721 (4.9845)	Top-1 acc 13.672 (13.776)	Top-5 acc 27.344 (31.594)	lr 0.03768
Warmup Train [14][750/3239]	Time 0.451 (0.525)	Data 0.001 (0.023)	Loss 4.9484 (4.9842)	Top-1 acc 15.234 (13.777)	Top-5 acc 32.031 (31.605)	lr 0.03767
Warmup Train [14][760/3239]	Time 0.465 (0.525)	Data 0.001 (0.022)	Loss 4.9687 (4.9841)	Top-1 acc 14.062 (13.785)	Top-5 acc 31.641 (31.607)	lr 0.03767
Warmup Train [14][770/3239]	Time 0.537 (0.525)	Data 0.001 (0.022)	Loss 4.8421 (4.9840)	Top-1 acc 15.234 (13.793)	Top-5 acc 36.328 (31.610)	lr 0.03766
Warmup Train [14][780/3239]	Time 0.598 (0.525)	Data 0.001 (0.022)	Loss 5.0662 (4.9840)	Top-1 acc 9.766 (13.785)	Top-5 acc 26.953 (31.605)	lr 0.03766
Warmup Train [14][790/3239]	Time 0.416 (0.525)	Data 0.001 (0.022)	Loss 4.7798 (4.9838)	Top-1 acc 17.578 (13.786)	Top-5 acc 36.719 (31.607)	lr 0.03765
Warmup Train [14][800/3239]	Time 0.560 (0.525)	Data 0.001 (0.022)	Loss 4.9312 (4.9838)	Top-1 acc 15.234 (13.785)	Top-5 acc 33.203 (31.602)	lr 0.03765
Warmup Train [14][810/3239]	Time 0.550 (0.525)	Data 0.001 (0.021)	Loss 4.8584 (4.9833)	Top-1 acc 14.844 (13.797)	Top-5 acc 36.719 (31.604)	lr 0.03764
Warmup Train [14][820/3239]	Time 0.673 (0.525)	Data 0.001 (0.021)	Loss 4.9172 (4.9831)	Top-1 acc 18.359 (13.809)	Top-5 acc 35.938 (31.606)	lr 0.03764
Warmup Train [14][830/3239]	Time 0.479 (0.524)	Data 0.001 (0.021)	Loss 4.8918 (4.9832)	Top-1 acc 17.188 (13.807)	Top-5 acc 33.984 (31.611)	lr 0.03763
Warmup Train [14][840/3239]	Time 0.299 (0.524)	Data 0.001 (0.021)	Loss 4.9358 (4.9832)	Top-1 acc 13.281 (13.808)	Top-5 acc 31.250 (31.596)	lr 0.03763
Warmup Train [14][850/3239]	Time 0.619 (0.523)	Data 0.002 (0.021)	Loss 5.0424 (4.9837)	Top-1 acc 11.719 (13.796)	Top-5 acc 29.688 (31.583)	lr 0.03762
Warmup Train [14][860/3239]	Time 0.460 (0.523)	Data 0.001 (0.020)	Loss 4.9653 (4.9835)	Top-1 acc 14.453 (13.798)	Top-5 acc 32.422 (31.587)	lr 0.03762
Warmup Train [14][870/3239]	Time 0.633 (0.522)	Data 0.001 (0.020)	Loss 4.9997 (4.9838)	Top-1 acc 12.891 (13.791)	Top-5 acc 32.031 (31.577)	lr 0.03761
Warmup Train [14][880/3239]	Time 0.466 (0.522)	Data 0.001 (0.020)	Loss 5.0969 (4.9838)	Top-1 acc 14.453 (13.803)	Top-5 acc 32.031 (31.595)	lr 0.03760
Warmup Train [14][890/3239]	Time 0.526 (0.522)	Data 0.001 (0.020)	Loss 5.0506 (4.9838)	Top-1 acc 12.891 (13.810)	Top-5 acc 27.734 (31.598)	lr 0.03760
Warmup Train [14][900/3239]	Time 0.437 (0.522)	Data 0.001 (0.020)	Loss 5.0825 (4.9831)	Top-1 acc 13.281 (13.813)	Top-5 acc 29.297 (31.607)	lr 0.03759
Warmup Train [14][910/3239]	Time 0.585 (0.522)	Data 0.001 (0.020)	Loss 4.8994 (4.9827)	Top-1 acc 14.844 (13.834)	Top-5 acc 34.375 (31.613)	lr 0.03759
Warmup Train [14][920/3239]	Time 0.581 (0.521)	Data 0.001 (0.019)	Loss 4.9730 (4.9827)	Top-1 acc 16.016 (13.835)	Top-5 acc 32.031 (31.616)	lr 0.03758
Warmup Train [14][930/3239]	Time 0.700 (0.521)	Data 0.001 (0.019)	Loss 5.0245 (4.9827)	Top-1 acc 14.062 (13.833)	Top-5 acc 33.984 (31.623)	lr 0.03758
Warmup Train [14][940/3239]	Time 0.501 (0.521)	Data 0.001 (0.019)	Loss 5.0274 (4.9832)	Top-1 acc 12.891 (13.820)	Top-5 acc 32.031 (31.618)	lr 0.03757
Warmup Train [14][950/3239]	Time 0.344 (0.521)	Data 0.001 (0.019)	Loss 5.0116 (4.9832)	Top-1 acc 11.328 (13.827)	Top-5 acc 32.812 (31.614)	lr 0.03757
Warmup Train [14][960/3239]	Time 0.378 (0.521)	Data 0.001 (0.019)	Loss 4.9262 (4.9829)	Top-1 acc 16.406 (13.822)	Top-5 acc 34.766 (31.624)	lr 0.03756
Warmup Train [14][970/3239]	Time 0.383 (0.521)	Data 0.001 (0.019)	Loss 5.0458 (4.9829)	Top-1 acc 14.844 (13.829)	Top-5 acc 30.469 (31.634)	lr 0.03756
Warmup Train [14][980/3239]	Time 0.508 (0.521)	Data 0.001 (0.019)	Loss 4.8925 (4.9828)	Top-1 acc 13.672 (13.832)	Top-5 acc 32.812 (31.639)	lr 0.03755
Warmup Train [14][990/3239]	Time 0.476 (0.521)	Data 0.001 (0.019)	Loss 4.9280 (4.9826)	Top-1 acc 14.062 (13.843)	Top-5 acc 33.203 (31.649)	lr 0.03755
Warmup Train [14][1000/3239]	Time 0.447 (0.521)	Data 0.001 (0.019)	Loss 5.0711 (4.9825)	Top-1 acc 12.891 (13.850)	Top-5 acc 30.078 (31.649)	lr 0.03754
Warmup Train [14][1010/3239]	Time 0.673 (0.521)	Data 0.001 (0.018)	Loss 4.9346 (4.9826)	Top-1 acc 14.062 (13.841)	Top-5 acc 36.719 (31.647)	lr 0.03754
Warmup Train [14][1020/3239]	Time 0.520 (0.521)	Data 0.001 (0.018)	Loss 4.9543 (4.9826)	Top-1 acc 12.500 (13.839)	Top-5 acc 32.422 (31.656)	lr 0.03753
Warmup Train [14][1030/3239]	Time 0.529 (0.521)	Data 0.001 (0.018)	Loss 4.9215 (4.9825)	Top-1 acc 13.672 (13.839)	Top-5 acc 35.547 (31.664)	lr 0.03753
Warmup Train [14][1040/3239]	Time 0.401 (0.521)	Data 0.001 (0.018)	Loss 4.9743 (4.9823)	Top-1 acc 16.797 (13.845)	Top-5 acc 33.203 (31.668)	lr 0.03752
Warmup Train [14][1050/3239]	Time 0.435 (0.521)	Data 0.001 (0.018)	Loss 5.2689 (4.9826)	Top-1 acc 10.938 (13.846)	Top-5 acc 26.953 (31.666)	lr 0.03752
Warmup Train [14][1060/3239]	Time 0.475 (0.521)	Data 0.001 (0.018)	Loss 4.8268 (4.9828)	Top-1 acc 15.625 (13.848)	Top-5 acc 34.375 (31.664)	lr 0.03751
Warmup Train [14][1070/3239]	Time 0.614 (0.521)	Data 0.001 (0.018)	Loss 4.9344 (4.9832)	Top-1 acc 13.281 (13.837)	Top-5 acc 33.203 (31.654)	lr 0.03751
Warmup Train [14][1080/3239]	Time 0.505 (0.521)	Data 0.001 (0.018)	Loss 4.9819 (4.9832)	Top-1 acc 12.500 (13.832)	Top-5 acc 33.594 (31.661)	lr 0.03750
Warmup Train [14][1090/3239]	Time 0.720 (0.521)	Data 0.001 (0.018)	Loss 4.9717 (4.9833)	Top-1 acc 14.453 (13.838)	Top-5 acc 30.078 (31.656)	lr 0.03749
Warmup Train [14][1100/3239]	Time 0.380 (0.520)	Data 0.001 (0.017)	Loss 4.9586 (4.9830)	Top-1 acc 13.281 (13.842)	Top-5 acc 33.984 (31.663)	lr 0.03749
Warmup Train [14][1110/3239]	Time 0.582 (0.520)	Data 0.001 (0.017)	Loss 5.0190 (4.9834)	Top-1 acc 9.766 (13.837)	Top-5 acc 29.297 (31.647)	lr 0.03748
Warmup Train [14][1120/3239]	Time 0.213 (0.520)	Data 0.001 (0.017)	Loss 4.8221 (4.9836)	Top-1 acc 17.969 (13.834)	Top-5 acc 35.547 (31.649)	lr 0.03748
Warmup Train [14][1130/3239]	Time 0.470 (0.520)	Data 0.001 (0.017)	Loss 4.9735 (4.9834)	Top-1 acc 12.891 (13.849)	Top-5 acc 35.547 (31.670)	lr 0.03747
Warmup Train [14][1140/3239]	Time 0.685 (0.520)	Data 0.001 (0.017)	Loss 4.8432 (4.9831)	Top-1 acc 14.844 (13.841)	Top-5 acc 36.719 (31.673)	lr 0.03747
Warmup Train [14][1150/3239]	Time 0.588 (0.519)	Data 0.001 (0.017)	Loss 4.9266 (4.9829)	Top-1 acc 13.281 (13.847)	Top-5 acc 32.422 (31.676)	lr 0.03746
Warmup Train [14][1160/3239]	Time 0.451 (0.519)	Data 0.001 (0.017)	Loss 4.9153 (4.9829)	Top-1 acc 12.891 (13.840)	Top-5 acc 35.938 (31.683)	lr 0.03746
Warmup Train [14][1170/3239]	Time 0.536 (0.519)	Data 0.001 (0.017)	Loss 4.9106 (4.9830)	Top-1 acc 12.109 (13.832)	Top-5 acc 30.469 (31.669)	lr 0.03745
Warmup Train [14][1180/3239]	Time 0.479 (0.519)	Data 0.001 (0.017)	Loss 4.9958 (4.9830)	Top-1 acc 11.719 (13.838)	Top-5 acc 32.422 (31.670)	lr 0.03745
Warmup Train [14][1190/3239]	Time 0.590 (0.519)	Data 0.001 (0.017)	Loss 4.8365 (4.9825)	Top-1 acc 17.578 (13.852)	Top-5 acc 34.375 (31.684)	lr 0.03744
Warmup Train [14][1200/3239]	Time 0.644 (0.519)	Data 0.001 (0.017)	Loss 4.8053 (4.9826)	Top-1 acc 19.922 (13.858)	Top-5 acc 36.328 (31.697)	lr 0.03744
Warmup Train [14][1210/3239]	Time 0.508 (0.519)	Data 0.001 (0.016)	Loss 5.0628 (4.9823)	Top-1 acc 13.281 (13.857)	Top-5 acc 27.344 (31.697)	lr 0.03743
Warmup Train [14][1220/3239]	Time 0.484 (0.519)	Data 0.002 (0.016)	Loss 5.0015 (4.9823)	Top-1 acc 10.547 (13.856)	Top-5 acc 30.078 (31.696)	lr 0.03743
Warmup Train [14][1230/3239]	Time 0.518 (0.519)	Data 0.001 (0.016)	Loss 4.8762 (4.9822)	Top-1 acc 15.625 (13.858)	Top-5 acc 32.031 (31.701)	lr 0.03742
Warmup Train [14][1240/3239]	Time 0.402 (0.519)	Data 0.001 (0.016)	Loss 4.9621 (4.9814)	Top-1 acc 16.016 (13.863)	Top-5 acc 30.469 (31.706)	lr 0.03742
Warmup Train [14][1250/3239]	Time 0.560 (0.519)	Data 0.001 (0.016)	Loss 4.7849 (4.9816)	Top-1 acc 18.359 (13.863)	Top-5 acc 35.938 (31.711)	lr 0.03741
Warmup Train [14][1260/3239]	Time 0.563 (0.519)	Data 0.001 (0.016)	Loss 5.1814 (4.9816)	Top-1 acc 13.672 (13.859)	Top-5 acc 32.422 (31.713)	lr 0.03741
Warmup Train [14][1270/3239]	Time 0.526 (0.519)	Data 0.001 (0.016)	Loss 4.9236 (4.9814)	Top-1 acc 15.234 (13.854)	Top-5 acc 33.594 (31.711)	lr 0.03740
Warmup Train [14][1280/3239]	Time 0.373 (0.519)	Data 0.001 (0.016)	Loss 4.9893 (4.9813)	Top-1 acc 12.500 (13.856)	Top-5 acc 30.859 (31.708)	lr 0.03739
Warmup Train [14][1290/3239]	Time 0.517 (0.519)	Data 0.001 (0.016)	Loss 4.8925 (4.9814)	Top-1 acc 16.016 (13.864)	Top-5 acc 32.422 (31.709)	lr 0.03739
Warmup Train [14][1300/3239]	Time 0.546 (0.519)	Data 0.001 (0.016)	Loss 4.8679 (4.9811)	Top-1 acc 16.016 (13.877)	Top-5 acc 33.203 (31.720)	lr 0.03738
Warmup Train [14][1310/3239]	Time 0.606 (0.519)	Data 0.001 (0.016)	Loss 4.9331 (4.9807)	Top-1 acc 14.453 (13.883)	Top-5 acc 34.766 (31.736)	lr 0.03738
Warmup Train [14][1320/3239]	Time 0.647 (0.519)	Data 0.001 (0.016)	Loss 4.8617 (4.9802)	Top-1 acc 14.453 (13.878)	Top-5 acc 33.594 (31.749)	lr 0.03737
Warmup Train [14][1330/3239]	Time 0.426 (0.519)	Data 0.001 (0.016)	Loss 5.0350 (4.9800)	Top-1 acc 10.938 (13.879)	Top-5 acc 29.688 (31.754)	lr 0.03737
Warmup Train [14][1340/3239]	Time 0.662 (0.519)	Data 0.001 (0.016)	Loss 5.0413 (4.9802)	Top-1 acc 13.281 (13.883)	Top-5 acc 31.250 (31.749)	lr 0.03736
Warmup Train [14][1350/3239]	Time 0.482 (0.519)	Data 0.001 (0.015)	Loss 5.0476 (4.9803)	Top-1 acc 16.797 (13.885)	Top-5 acc 30.859 (31.755)	lr 0.03736
Warmup Train [14][1360/3239]	Time 0.521 (0.519)	Data 0.001 (0.015)	Loss 5.0276 (4.9799)	Top-1 acc 12.500 (13.896)	Top-5 acc 31.250 (31.760)	lr 0.03735
Warmup Train [14][1370/3239]	Time 0.585 (0.519)	Data 0.001 (0.015)	Loss 5.1357 (4.9798)	Top-1 acc 11.328 (13.894)	Top-5 acc 24.609 (31.759)	lr 0.03735
Warmup Train [14][1380/3239]	Time 0.440 (0.519)	Data 0.001 (0.015)	Loss 4.9242 (4.9798)	Top-1 acc 16.406 (13.894)	Top-5 acc 32.031 (31.760)	lr 0.03734
Warmup Train [14][1390/3239]	Time 0.345 (0.519)	Data 0.001 (0.015)	Loss 4.8975 (4.9799)	Top-1 acc 14.844 (13.901)	Top-5 acc 33.203 (31.764)	lr 0.03734
Warmup Train [14][1400/3239]	Time 0.489 (0.518)	Data 0.001 (0.015)	Loss 4.9564 (4.9800)	Top-1 acc 12.500 (13.900)	Top-5 acc 30.078 (31.762)	lr 0.03733
Warmup Train [14][1410/3239]	Time 0.616 (0.518)	Data 0.001 (0.015)	Loss 4.8828 (4.9796)	Top-1 acc 12.109 (13.902)	Top-5 acc 32.812 (31.765)	lr 0.03733
Warmup Train [14][1420/3239]	Time 0.184 (0.518)	Data 0.001 (0.015)	Loss 4.9448 (4.9794)	Top-1 acc 13.281 (13.904)	Top-5 acc 33.594 (31.768)	lr 0.03732
Warmup Train [14][1430/3239]	Time 0.577 (0.518)	Data 0.001 (0.015)	Loss 4.9573 (4.9794)	Top-1 acc 14.062 (13.906)	Top-5 acc 30.859 (31.769)	lr 0.03732
Warmup Train [14][1440/3239]	Time 0.597 (0.518)	Data 0.001 (0.015)	Loss 4.7300 (4.9792)	Top-1 acc 20.312 (13.908)	Top-5 acc 37.891 (31.769)	lr 0.03731
Warmup Train [14][1450/3239]	Time 0.442 (0.518)	Data 0.001 (0.015)	Loss 5.1114 (4.9791)	Top-1 acc 14.062 (13.907)	Top-5 acc 27.734 (31.769)	lr 0.03731
Warmup Train [14][1460/3239]	Time 0.451 (0.518)	Data 0.001 (0.015)	Loss 5.0409 (4.9793)	Top-1 acc 15.625 (13.904)	Top-5 acc 33.594 (31.772)	lr 0.03730
Warmup Train [14][1470/3239]	Time 0.523 (0.517)	Data 0.001 (0.015)	Loss 5.0191 (4.9792)	Top-1 acc 12.891 (13.908)	Top-5 acc 31.641 (31.783)	lr 0.03729
Warmup Train [14][1480/3239]	Time 0.494 (0.517)	Data 0.001 (0.015)	Loss 5.0349 (4.9790)	Top-1 acc 14.453 (13.913)	Top-5 acc 30.078 (31.789)	lr 0.03729
Warmup Train [14][1490/3239]	Time 0.611 (0.517)	Data 0.001 (0.015)	Loss 4.9703 (4.9795)	Top-1 acc 16.016 (13.903)	Top-5 acc 35.156 (31.777)	lr 0.03728
Warmup Train [14][1500/3239]	Time 0.394 (0.517)	Data 0.001 (0.015)	Loss 5.0897 (4.9798)	Top-1 acc 14.062 (13.897)	Top-5 acc 29.688 (31.770)	lr 0.03728
Warmup Train [14][1510/3239]	Time 0.343 (0.517)	Data 0.001 (0.015)	Loss 4.9486 (4.9797)	Top-1 acc 12.109 (13.901)	Top-5 acc 32.812 (31.772)	lr 0.03727
Warmup Train [14][1520/3239]	Time 0.452 (0.517)	Data 0.001 (0.015)	Loss 4.9232 (4.9796)	Top-1 acc 15.625 (13.905)	Top-5 acc 31.641 (31.776)	lr 0.03727
Warmup Train [14][1530/3239]	Time 0.538 (0.517)	Data 0.003 (0.014)	Loss 4.7416 (4.9797)	Top-1 acc 15.625 (13.892)	Top-5 acc 39.453 (31.773)	lr 0.03726
Warmup Train [14][1540/3239]	Time 0.533 (0.517)	Data 0.002 (0.014)	Loss 4.9375 (4.9795)	Top-1 acc 14.453 (13.894)	Top-5 acc 33.594 (31.774)	lr 0.03726
Warmup Train [14][1550/3239]	Time 0.617 (0.517)	Data 0.001 (0.014)	Loss 4.9301 (4.9797)	Top-1 acc 16.016 (13.890)	Top-5 acc 33.203 (31.766)	lr 0.03725
Warmup Train [14][1560/3239]	Time 0.524 (0.517)	Data 0.001 (0.014)	Loss 4.8063 (4.9797)	Top-1 acc 17.578 (13.893)	Top-5 acc 35.547 (31.767)	lr 0.03725
Warmup Train [14][1570/3239]	Time 0.550 (0.517)	Data 0.001 (0.014)	Loss 4.8843 (4.9794)	Top-1 acc 13.672 (13.888)	Top-5 acc 29.297 (31.770)	lr 0.03724
Warmup Train [14][1580/3239]	Time 0.482 (0.517)	Data 0.004 (0.014)	Loss 4.8720 (4.9792)	Top-1 acc 12.891 (13.892)	Top-5 acc 35.156 (31.768)	lr 0.03724
Warmup Train [14][1590/3239]	Time 0.605 (0.517)	Data 0.001 (0.014)	Loss 4.8377 (4.9792)	Top-1 acc 12.500 (13.892)	Top-5 acc 34.375 (31.770)	lr 0.03723
Warmup Train [14][1600/3239]	Time 0.328 (0.517)	Data 0.001 (0.014)	Loss 4.8431 (4.9790)	Top-1 acc 18.359 (13.899)	Top-5 acc 36.719 (31.777)	lr 0.03723
Warmup Train [14][1610/3239]	Time 0.375 (0.517)	Data 0.001 (0.014)	Loss 5.0525 (4.9791)	Top-1 acc 11.719 (13.898)	Top-5 acc 30.469 (31.773)	lr 0.03722
Warmup Train [14][1620/3239]	Time 0.369 (0.517)	Data 0.001 (0.014)	Loss 5.0351 (4.9787)	Top-1 acc 12.109 (13.905)	Top-5 acc 31.250 (31.787)	lr 0.03722
Warmup Train [14][1630/3239]	Time 0.448 (0.517)	Data 0.001 (0.014)	Loss 5.1021 (4.9786)	Top-1 acc 12.500 (13.907)	Top-5 acc 26.953 (31.787)	lr 0.03721
Warmup Train [14][1640/3239]	Time 0.486 (0.517)	Data 0.001 (0.014)	Loss 4.8308 (4.9785)	Top-1 acc 17.969 (13.909)	Top-5 acc 35.938 (31.793)	lr 0.03720
Warmup Train [14][1650/3239]	Time 0.537 (0.517)	Data 0.001 (0.014)	Loss 4.8607 (4.9784)	Top-1 acc 12.500 (13.908)	Top-5 acc 34.375 (31.794)	lr 0.03720
Warmup Train [14][1660/3239]	Time 0.395 (0.517)	Data 0.001 (0.014)	Loss 5.0516 (4.9785)	Top-1 acc 15.234 (13.913)	Top-5 acc 33.594 (31.794)	lr 0.03719
Warmup Train [14][1670/3239]	Time 0.641 (0.517)	Data 0.001 (0.014)	Loss 5.1096 (4.9786)	Top-1 acc 11.328 (13.911)	Top-5 acc 30.469 (31.792)	lr 0.03719
Warmup Train [14][1680/3239]	Time 0.295 (0.517)	Data 0.001 (0.014)	Loss 4.9562 (4.9784)	Top-1 acc 15.234 (13.907)	Top-5 acc 32.031 (31.790)	lr 0.03718
Warmup Train [14][1690/3239]	Time 0.505 (0.517)	Data 0.001 (0.014)	Loss 5.1350 (4.9783)	Top-1 acc 12.109 (13.907)	Top-5 acc 31.250 (31.790)	lr 0.03718
Warmup Train [14][1700/3239]	Time 0.325 (0.516)	Data 0.001 (0.014)	Loss 4.8007 (4.9781)	Top-1 acc 14.062 (13.910)	Top-5 acc 34.375 (31.792)	lr 0.03717
Warmup Train [14][1710/3239]	Time 0.724 (0.516)	Data 0.001 (0.014)	Loss 4.9226 (4.9782)	Top-1 acc 12.500 (13.906)	Top-5 acc 33.203 (31.784)	lr 0.03717
Warmup Train [14][1720/3239]	Time 0.399 (0.516)	Data 0.001 (0.014)	Loss 4.9713 (4.9779)	Top-1 acc 15.234 (13.912)	Top-5 acc 34.766 (31.794)	lr 0.03716
Warmup Train [14][1730/3239]	Time 0.476 (0.516)	Data 0.001 (0.014)	Loss 4.8988 (4.9777)	Top-1 acc 14.062 (13.914)	Top-5 acc 32.422 (31.791)	lr 0.03716
Warmup Train [14][1740/3239]	Time 0.535 (0.516)	Data 0.001 (0.014)	Loss 5.0543 (4.9774)	Top-1 acc 14.844 (13.918)	Top-5 acc 29.688 (31.797)	lr 0.03715
Warmup Train [14][1750/3239]	Time 0.633 (0.516)	Data 0.001 (0.014)	Loss 5.0319 (4.9774)	Top-1 acc 16.016 (13.922)	Top-5 acc 32.031 (31.797)	lr 0.03715
Warmup Train [14][1760/3239]	Time 0.399 (0.516)	Data 0.001 (0.014)	Loss 4.8499 (4.9772)	Top-1 acc 14.453 (13.920)	Top-5 acc 33.594 (31.801)	lr 0.03714
Warmup Train [14][1770/3239]	Time 0.406 (0.516)	Data 0.001 (0.014)	Loss 4.9264 (4.9769)	Top-1 acc 12.500 (13.920)	Top-5 acc 29.688 (31.808)	lr 0.03714
Warmup Train [14][1780/3239]	Time 0.624 (0.516)	Data 0.002 (0.014)	Loss 5.0059 (4.9767)	Top-1 acc 12.109 (13.921)	Top-5 acc 30.078 (31.809)	lr 0.03713
Warmup Train [14][1790/3239]	Time 0.487 (0.516)	Data 0.001 (0.014)	Loss 5.0025 (4.9766)	Top-1 acc 14.453 (13.923)	Top-5 acc 30.078 (31.812)	lr 0.03713
Warmup Train [14][1800/3239]	Time 0.512 (0.516)	Data 0.001 (0.014)	Loss 4.7762 (4.9763)	Top-1 acc 14.844 (13.933)	Top-5 acc 35.156 (31.821)	lr 0.03712
Warmup Train [14][1810/3239]	Time 0.388 (0.516)	Data 0.001 (0.014)	Loss 4.9932 (4.9761)	Top-1 acc 17.578 (13.940)	Top-5 acc 33.203 (31.821)	lr 0.03711
Warmup Train [14][1820/3239]	Time 0.494 (0.516)	Data 0.001 (0.014)	Loss 5.0570 (4.9760)	Top-1 acc 14.453 (13.941)	Top-5 acc 32.031 (31.824)	lr 0.03711
Warmup Train [14][1830/3239]	Time 0.478 (0.516)	Data 0.001 (0.013)	Loss 5.0604 (4.9760)	Top-1 acc 11.719 (13.941)	Top-5 acc 28.906 (31.822)	lr 0.03710
Warmup Train [14][1840/3239]	Time 0.597 (0.516)	Data 0.002 (0.013)	Loss 4.8080 (4.9760)	Top-1 acc 14.062 (13.940)	Top-5 acc 36.328 (31.823)	lr 0.03710
Warmup Train [14][1850/3239]	Time 0.387 (0.516)	Data 0.001 (0.013)	Loss 4.9935 (4.9758)	Top-1 acc 15.625 (13.942)	Top-5 acc 32.422 (31.830)	lr 0.03709
Warmup Train [14][1860/3239]	Time 0.483 (0.516)	Data 0.001 (0.013)	Loss 4.9184 (4.9756)	Top-1 acc 15.234 (13.942)	Top-5 acc 33.203 (31.834)	lr 0.03709
Warmup Train [14][1870/3239]	Time 0.484 (0.516)	Data 0.001 (0.013)	Loss 5.0821 (4.9759)	Top-1 acc 12.500 (13.940)	Top-5 acc 30.469 (31.830)	lr 0.03708
Warmup Train [14][1880/3239]	Time 0.557 (0.516)	Data 0.001 (0.013)	Loss 5.0282 (4.9758)	Top-1 acc 13.672 (13.939)	Top-5 acc 32.031 (31.834)	lr 0.03708
Warmup Train [14][1890/3239]	Time 0.605 (0.516)	Data 0.001 (0.013)	Loss 4.9157 (4.9754)	Top-1 acc 14.844 (13.943)	Top-5 acc 29.688 (31.841)	lr 0.03707
Warmup Train [14][1900/3239]	Time 0.503 (0.516)	Data 0.001 (0.013)	Loss 5.0031 (4.9751)	Top-1 acc 11.328 (13.948)	Top-5 acc 28.516 (31.849)	lr 0.03707
Warmup Train [14][1910/3239]	Time 0.365 (0.516)	Data 0.001 (0.013)	Loss 5.0993 (4.9752)	Top-1 acc 12.500 (13.945)	Top-5 acc 28.906 (31.851)	lr 0.03706
Warmup Train [14][1920/3239]	Time 0.574 (0.516)	Data 0.001 (0.013)	Loss 4.9892 (4.9749)	Top-1 acc 17.188 (13.955)	Top-5 acc 33.594 (31.860)	lr 0.03706
Warmup Train [14][1930/3239]	Time 0.502 (0.516)	Data 0.001 (0.013)	Loss 4.8528 (4.9746)	Top-1 acc 16.016 (13.959)	Top-5 acc 33.594 (31.871)	lr 0.03705
Warmup Train [14][1940/3239]	Time 0.432 (0.516)	Data 0.001 (0.013)	Loss 4.9331 (4.9743)	Top-1 acc 13.281 (13.963)	Top-5 acc 35.938 (31.877)	lr 0.03705
Warmup Train [14][1950/3239]	Time 0.599 (0.516)	Data 0.001 (0.013)	Loss 4.9592 (4.9744)	Top-1 acc 11.719 (13.956)	Top-5 acc 31.641 (31.874)	lr 0.03704
Warmup Train [14][1960/3239]	Time 0.392 (0.515)	Data 0.002 (0.013)	Loss 5.0866 (4.9745)	Top-1 acc 12.109 (13.957)	Top-5 acc 26.562 (31.876)	lr 0.03704
Warmup Train [14][1970/3239]	Time 0.479 (0.515)	Data 0.001 (0.013)	Loss 4.8791 (4.9744)	Top-1 acc 16.016 (13.957)	Top-5 acc 33.203 (31.874)	lr 0.03703
Warmup Train [14][1980/3239]	Time 0.281 (0.515)	Data 0.001 (0.013)	Loss 4.9813 (4.9743)	Top-1 acc 13.281 (13.958)	Top-5 acc 33.594 (31.878)	lr 0.03702
Warmup Train [14][1990/3239]	Time 0.623 (0.515)	Data 0.001 (0.013)	Loss 5.0136 (4.9739)	Top-1 acc 14.062 (13.960)	Top-5 acc 33.594 (31.885)	lr 0.03702
Warmup Train [14][2000/3239]	Time 0.606 (0.515)	Data 0.001 (0.013)	Loss 4.9926 (4.9739)	Top-1 acc 12.500 (13.961)	Top-5 acc 34.375 (31.893)	lr 0.03701
Warmup Train [14][2010/3239]	Time 0.497 (0.515)	Data 0.001 (0.013)	Loss 4.8256 (4.9741)	Top-1 acc 15.625 (13.958)	Top-5 acc 35.547 (31.889)	lr 0.03701
Warmup Train [14][2020/3239]	Time 0.372 (0.515)	Data 0.001 (0.013)	Loss 5.1391 (4.9738)	Top-1 acc 14.062 (13.962)	Top-5 acc 26.172 (31.892)	lr 0.03700
Warmup Train [14][2030/3239]	Time 0.469 (0.515)	Data 0.001 (0.013)	Loss 4.9010 (4.9737)	Top-1 acc 12.500 (13.961)	Top-5 acc 36.719 (31.895)	lr 0.03700
Warmup Train [14][2040/3239]	Time 0.482 (0.515)	Data 0.001 (0.013)	Loss 4.9175 (4.9736)	Top-1 acc 13.672 (13.957)	Top-5 acc 30.859 (31.893)	lr 0.03699
Warmup Train [14][2050/3239]	Time 0.671 (0.515)	Data 0.001 (0.013)	Loss 5.0645 (4.9735)	Top-1 acc 12.109 (13.960)	Top-5 acc 30.078 (31.896)	lr 0.03699
Warmup Train [14][2060/3239]	Time 0.533 (0.515)	Data 0.001 (0.013)	Loss 5.0059 (4.9734)	Top-1 acc 15.234 (13.960)	Top-5 acc 31.250 (31.893)	lr 0.03698
Warmup Train [14][2070/3239]	Time 0.337 (0.515)	Data 0.001 (0.013)	Loss 4.8863 (4.9729)	Top-1 acc 16.016 (13.962)	Top-5 acc 32.812 (31.900)	lr 0.03698
Warmup Train [14][2080/3239]	Time 0.504 (0.515)	Data 0.001 (0.013)	Loss 4.7529 (4.9726)	Top-1 acc 15.234 (13.969)	Top-5 acc 36.328 (31.905)	lr 0.03697
Warmup Train [14][2090/3239]	Time 0.529 (0.515)	Data 0.032 (0.013)	Loss 4.9731 (4.9726)	Top-1 acc 11.719 (13.970)	Top-5 acc 34.766 (31.906)	lr 0.03697
Warmup Train [14][2100/3239]	Time 0.559 (0.515)	Data 0.001 (0.013)	Loss 5.0310 (4.9728)	Top-1 acc 11.328 (13.968)	Top-5 acc 29.297 (31.901)	lr 0.03696
Warmup Train [14][2110/3239]	Time 0.571 (0.515)	Data 0.001 (0.013)	Loss 4.8943 (4.9726)	Top-1 acc 17.188 (13.972)	Top-5 acc 32.422 (31.906)	lr 0.03696
Warmup Train [14][2120/3239]	Time 0.425 (0.515)	Data 0.001 (0.013)	Loss 5.2167 (4.9725)	Top-1 acc 9.766 (13.973)	Top-5 acc 24.219 (31.902)	lr 0.03695
Warmup Train [14][2130/3239]	Time 0.394 (0.515)	Data 0.001 (0.013)	Loss 4.9180 (4.9725)	Top-1 acc 15.234 (13.974)	Top-5 acc 32.812 (31.903)	lr 0.03694
Warmup Train [14][2140/3239]	Time 0.568 (0.515)	Data 0.003 (0.013)	Loss 4.9652 (4.9724)	Top-1 acc 14.062 (13.981)	Top-5 acc 32.422 (31.905)	lr 0.03694
Warmup Train [14][2150/3239]	Time 0.566 (0.515)	Data 0.001 (0.013)	Loss 4.9733 (4.9722)	Top-1 acc 14.062 (13.988)	Top-5 acc 31.641 (31.915)	lr 0.03693
Warmup Train [14][2160/3239]	Time 0.533 (0.515)	Data 0.001 (0.013)	Loss 4.9967 (4.9719)	Top-1 acc 12.109 (13.987)	Top-5 acc 28.516 (31.918)	lr 0.03693
Warmup Train [14][2170/3239]	Time 0.527 (0.515)	Data 0.001 (0.013)	Loss 4.8426 (4.9718)	Top-1 acc 19.141 (13.987)	Top-5 acc 35.547 (31.920)	lr 0.03692
Warmup Train [14][2180/3239]	Time 0.582 (0.515)	Data 0.001 (0.013)	Loss 4.9942 (4.9717)	Top-1 acc 13.281 (13.987)	Top-5 acc 32.031 (31.925)	lr 0.03692
Warmup Train [14][2190/3239]	Time 0.643 (0.515)	Data 0.001 (0.012)	Loss 4.8842 (4.9714)	Top-1 acc 13.281 (13.993)	Top-5 acc 35.938 (31.932)	lr 0.03691
Warmup Train [14][2200/3239]	Time 0.506 (0.515)	Data 0.001 (0.012)	Loss 4.9150 (4.9711)	Top-1 acc 12.891 (13.995)	Top-5 acc 32.031 (31.936)	lr 0.03691
Warmup Train [14][2210/3239]	Time 0.723 (0.515)	Data 0.001 (0.012)	Loss 4.8222 (4.9707)	Top-1 acc 15.625 (13.999)	Top-5 acc 34.766 (31.947)	lr 0.03690
Warmup Train [14][2220/3239]	Time 0.550 (0.515)	Data 0.001 (0.012)	Loss 5.0831 (4.9708)	Top-1 acc 14.453 (13.998)	Top-5 acc 29.688 (31.946)	lr 0.03690
Warmup Train [14][2230/3239]	Time 0.496 (0.515)	Data 0.001 (0.012)	Loss 4.9597 (4.9707)	Top-1 acc 12.891 (14.001)	Top-5 acc 33.984 (31.953)	lr 0.03689
Warmup Train [14][2240/3239]	Time 0.604 (0.514)	Data 0.001 (0.012)	Loss 4.9664 (4.9703)	Top-1 acc 13.281 (14.008)	Top-5 acc 30.078 (31.962)	lr 0.03689
Warmup Train [14][2250/3239]	Time 0.638 (0.514)	Data 0.001 (0.012)	Loss 4.9819 (4.9701)	Top-1 acc 15.625 (14.010)	Top-5 acc 34.375 (31.967)	lr 0.03688
Warmup Train [14][2260/3239]	Time 0.350 (0.514)	Data 0.001 (0.012)	Loss 4.9082 (4.9700)	Top-1 acc 15.234 (14.012)	Top-5 acc 36.719 (31.974)	lr 0.03688
Warmup Train [14][2270/3239]	Time 0.508 (0.514)	Data 0.001 (0.012)	Loss 4.9785 (4.9699)	Top-1 acc 11.719 (14.011)	Top-5 acc 29.688 (31.973)	lr 0.03687
Warmup Train [14][2280/3239]	Time 0.586 (0.514)	Data 0.001 (0.012)	Loss 5.0074 (4.9697)	Top-1 acc 13.672 (14.013)	Top-5 acc 30.469 (31.977)	lr 0.03687
Warmup Train [14][2290/3239]	Time 0.470 (0.514)	Data 0.002 (0.012)	Loss 4.8599 (4.9696)	Top-1 acc 13.672 (14.017)	Top-5 acc 37.500 (31.982)	lr 0.03686
Warmup Train [14][2300/3239]	Time 0.553 (0.514)	Data 0.001 (0.012)	Loss 4.8668 (4.9694)	Top-1 acc 16.406 (14.022)	Top-5 acc 34.766 (31.988)	lr 0.03685
Warmup Train [14][2310/3239]	Time 0.575 (0.514)	Data 0.001 (0.012)	Loss 4.8496 (4.9693)	Top-1 acc 19.531 (14.023)	Top-5 acc 38.672 (31.992)	lr 0.03685
Warmup Train [14][2320/3239]	Time 0.594 (0.514)	Data 0.001 (0.012)	Loss 4.7894 (4.9691)	Top-1 acc 14.844 (14.024)	Top-5 acc 35.547 (31.996)	lr 0.03684
Warmup Train [14][2330/3239]	Time 0.431 (0.514)	Data 0.001 (0.012)	Loss 4.9623 (4.9691)	Top-1 acc 15.234 (14.025)	Top-5 acc 33.203 (32.001)	lr 0.03684
Warmup Train [14][2340/3239]	Time 0.480 (0.514)	Data 0.001 (0.012)	Loss 4.9714 (4.9690)	Top-1 acc 13.672 (14.028)	Top-5 acc 30.469 (32.000)	lr 0.03683
Warmup Train [14][2350/3239]	Time 0.633 (0.514)	Data 0.001 (0.012)	Loss 5.0599 (4.9688)	Top-1 acc 14.844 (14.037)	Top-5 acc 32.031 (32.008)	lr 0.03683
Warmup Train [14][2360/3239]	Time 0.515 (0.514)	Data 0.001 (0.012)	Loss 5.0489 (4.9688)	Top-1 acc 11.328 (14.034)	Top-5 acc 27.734 (32.005)	lr 0.03682
Warmup Train [14][2370/3239]	Time 0.410 (0.514)	Data 0.001 (0.012)	Loss 4.9309 (4.9686)	Top-1 acc 15.625 (14.039)	Top-5 acc 33.984 (32.011)	lr 0.03682
Warmup Train [14][2380/3239]	Time 0.523 (0.514)	Data 0.001 (0.012)	Loss 4.9502 (4.9685)	Top-1 acc 12.891 (14.039)	Top-5 acc 32.422 (32.015)	lr 0.03681
Warmup Train [14][2390/3239]	Time 0.678 (0.514)	Data 0.001 (0.012)	Loss 4.8224 (4.9685)	Top-1 acc 12.500 (14.036)	Top-5 acc 32.812 (32.012)	lr 0.03681
Warmup Train [14][2400/3239]	Time 0.503 (0.514)	Data 0.001 (0.012)	Loss 4.9198 (4.9686)	Top-1 acc 13.672 (14.033)	Top-5 acc 30.078 (32.006)	lr 0.03680
Warmup Train [14][2410/3239]	Time 0.581 (0.514)	Data 0.001 (0.012)	Loss 5.0568 (4.9685)	Top-1 acc 14.844 (14.040)	Top-5 acc 31.641 (32.012)	lr 0.03680
Warmup Train [14][2420/3239]	Time 0.597 (0.514)	Data 0.001 (0.012)	Loss 5.0597 (4.9683)	Top-1 acc 11.719 (14.044)	Top-5 acc 32.031 (32.019)	lr 0.03679
Warmup Train [14][2430/3239]	Time 0.435 (0.514)	Data 0.001 (0.012)	Loss 4.7526 (4.9683)	Top-1 acc 12.500 (14.038)	Top-5 acc 34.375 (32.017)	lr 0.03678
Warmup Train [14][2440/3239]	Time 0.493 (0.514)	Data 0.001 (0.012)	Loss 4.8719 (4.9680)	Top-1 acc 16.797 (14.044)	Top-5 acc 36.328 (32.025)	lr 0.03678
Warmup Train [14][2450/3239]	Time 0.513 (0.514)	Data 0.001 (0.012)	Loss 4.9969 (4.9679)	Top-1 acc 12.891 (14.050)	Top-5 acc 30.859 (32.030)	lr 0.03677
Warmup Train [14][2460/3239]	Time 0.509 (0.514)	Data 0.001 (0.012)	Loss 4.8793 (4.9675)	Top-1 acc 12.500 (14.055)	Top-5 acc 34.375 (32.040)	lr 0.03677
Warmup Train [14][2470/3239]	Time 0.494 (0.514)	Data 0.001 (0.012)	Loss 5.0125 (4.9672)	Top-1 acc 14.062 (14.060)	Top-5 acc 33.203 (32.045)	lr 0.03676
Warmup Train [14][2480/3239]	Time 0.616 (0.514)	Data 0.001 (0.012)	Loss 4.8086 (4.9669)	Top-1 acc 15.625 (14.066)	Top-5 acc 36.719 (32.057)	lr 0.03676
Warmup Train [14][2490/3239]	Time 0.514 (0.514)	Data 0.001 (0.011)	Loss 4.8840 (4.9667)	Top-1 acc 17.578 (14.070)	Top-5 acc 34.375 (32.062)	lr 0.03675
Warmup Train [14][2500/3239]	Time 0.675 (0.514)	Data 0.001 (0.011)	Loss 4.9426 (4.9666)	Top-1 acc 14.453 (14.073)	Top-5 acc 33.984 (32.064)	lr 0.03675
Warmup Train [14][2510/3239]	Time 0.579 (0.514)	Data 0.001 (0.011)	Loss 5.1422 (4.9666)	Top-1 acc 10.156 (14.072)	Top-5 acc 28.125 (32.061)	lr 0.03674
Warmup Train [14][2520/3239]	Time 0.561 (0.514)	Data 0.001 (0.011)	Loss 4.9811 (4.9664)	Top-1 acc 12.891 (14.078)	Top-5 acc 32.031 (32.070)	lr 0.03674
Warmup Train [14][2530/3239]	Time 0.389 (0.514)	Data 0.001 (0.011)	Loss 4.7715 (4.9661)	Top-1 acc 16.797 (14.083)	Top-5 acc 37.891 (32.081)	lr 0.03673
Warmup Train [14][2540/3239]	Time 0.698 (0.514)	Data 0.002 (0.011)	Loss 4.8836 (4.9657)	Top-1 acc 15.625 (14.088)	Top-5 acc 31.641 (32.091)	lr 0.03673
Warmup Train [14][2550/3239]	Time 0.515 (0.514)	Data 0.001 (0.011)	Loss 4.8030 (4.9655)	Top-1 acc 17.188 (14.089)	Top-5 acc 35.547 (32.093)	lr 0.03672
Warmup Train [14][2560/3239]	Time 0.520 (0.514)	Data 0.001 (0.011)	Loss 4.9749 (4.9654)	Top-1 acc 13.672 (14.088)	Top-5 acc 34.375 (32.099)	lr 0.03672
Warmup Train [14][2570/3239]	Time 0.516 (0.514)	Data 0.001 (0.011)	Loss 4.9433 (4.9654)	Top-1 acc 13.672 (14.085)	Top-5 acc 33.203 (32.098)	lr 0.03671
Warmup Train [14][2580/3239]	Time 0.617 (0.514)	Data 0.001 (0.011)	Loss 4.9950 (4.9654)	Top-1 acc 16.016 (14.085)	Top-5 acc 32.812 (32.097)	lr 0.03670
Warmup Train [14][2590/3239]	Time 0.533 (0.514)	Data 0.001 (0.011)	Loss 4.8021 (4.9653)	Top-1 acc 18.750 (14.089)	Top-5 acc 36.328 (32.101)	lr 0.03670
Warmup Train [14][2600/3239]	Time 0.371 (0.514)	Data 0.001 (0.011)	Loss 5.0879 (4.9652)	Top-1 acc 10.938 (14.086)	Top-5 acc 29.297 (32.098)	lr 0.03669
Warmup Train [14][2610/3239]	Time 0.611 (0.514)	Data 0.001 (0.011)	Loss 4.8663 (4.9652)	Top-1 acc 14.453 (14.091)	Top-5 acc 36.719 (32.102)	lr 0.03669
Warmup Train [14][2620/3239]	Time 0.541 (0.514)	Data 0.001 (0.011)	Loss 4.7937 (4.9651)	Top-1 acc 19.922 (14.093)	Top-5 acc 35.547 (32.101)	lr 0.03668
Warmup Train [14][2630/3239]	Time 0.343 (0.514)	Data 0.001 (0.011)	Loss 4.8975 (4.9648)	Top-1 acc 14.453 (14.095)	Top-5 acc 30.469 (32.107)	lr 0.03668
Warmup Train [14][2640/3239]	Time 0.523 (0.513)	Data 0.001 (0.011)	Loss 5.0056 (4.9647)	Top-1 acc 12.891 (14.097)	Top-5 acc 31.250 (32.110)	lr 0.03667
Warmup Train [14][2650/3239]	Time 0.578 (0.514)	Data 0.001 (0.011)	Loss 4.8685 (4.9646)	Top-1 acc 17.188 (14.097)	Top-5 acc 35.547 (32.110)	lr 0.03667
Warmup Train [14][2660/3239]	Time 0.371 (0.513)	Data 0.001 (0.011)	Loss 4.8682 (4.9643)	Top-1 acc 17.188 (14.101)	Top-5 acc 33.203 (32.114)	lr 0.03666
Warmup Train [14][2670/3239]	Time 0.499 (0.514)	Data 0.001 (0.011)	Loss 4.7802 (4.9641)	Top-1 acc 16.797 (14.104)	Top-5 acc 35.938 (32.121)	lr 0.03666
Warmup Train [14][2680/3239]	Time 0.425 (0.514)	Data 0.001 (0.011)	Loss 4.8506 (4.9640)	Top-1 acc 14.453 (14.105)	Top-5 acc 35.547 (32.122)	lr 0.03665
Warmup Train [14][2690/3239]	Time 0.725 (0.514)	Data 0.001 (0.011)	Loss 4.9523 (4.9639)	Top-1 acc 12.500 (14.105)	Top-5 acc 32.812 (32.122)	lr 0.03665
Warmup Train [14][2700/3239]	Time 0.603 (0.514)	Data 0.001 (0.011)	Loss 4.9644 (4.9637)	Top-1 acc 16.406 (14.111)	Top-5 acc 31.250 (32.130)	lr 0.03664
Warmup Train [14][2710/3239]	Time 0.553 (0.514)	Data 0.001 (0.011)	Loss 4.9905 (4.9635)	Top-1 acc 16.797 (14.116)	Top-5 acc 33.594 (32.136)	lr 0.03663
Warmup Train [14][2720/3239]	Time 0.594 (0.514)	Data 0.001 (0.011)	Loss 4.9326 (4.9634)	Top-1 acc 15.625 (14.116)	Top-5 acc 33.203 (32.133)	lr 0.03663
Warmup Train [14][2730/3239]	Time 0.586 (0.514)	Data 0.001 (0.011)	Loss 4.8342 (4.9630)	Top-1 acc 15.234 (14.121)	Top-5 acc 37.500 (32.141)	lr 0.03662
Warmup Train [14][2740/3239]	Time 0.352 (0.514)	Data 0.001 (0.011)	Loss 4.8832 (4.9628)	Top-1 acc 15.625 (14.123)	Top-5 acc 36.328 (32.146)	lr 0.03662
Warmup Train [14][2750/3239]	Time 0.338 (0.514)	Data 0.001 (0.011)	Loss 5.0206 (4.9627)	Top-1 acc 12.500 (14.124)	Top-5 acc 30.859 (32.149)	lr 0.03661
Warmup Train [14][2760/3239]	Time 0.601 (0.514)	Data 0.001 (0.011)	Loss 4.9341 (4.9625)	Top-1 acc 13.672 (14.126)	Top-5 acc 31.641 (32.151)	lr 0.03661
Warmup Train [14][2770/3239]	Time 0.540 (0.514)	Data 0.001 (0.011)	Loss 5.0743 (4.9623)	Top-1 acc 13.672 (14.132)	Top-5 acc 28.906 (32.160)	lr 0.03660
Warmup Train [14][2780/3239]	Time 0.492 (0.513)	Data 0.001 (0.011)	Loss 4.7878 (4.9623)	Top-1 acc 19.922 (14.132)	Top-5 acc 34.766 (32.161)	lr 0.03660
Warmup Train [14][2790/3239]	Time 0.508 (0.513)	Data 0.001 (0.011)	Loss 4.8591 (4.9624)	Top-1 acc 12.109 (14.130)	Top-5 acc 30.859 (32.158)	lr 0.03659
Warmup Train [14][2800/3239]	Time 0.422 (0.513)	Data 0.001 (0.011)	Loss 4.9542 (4.9625)	Top-1 acc 10.547 (14.126)	Top-5 acc 30.859 (32.159)	lr 0.03659
Warmup Train [14][2810/3239]	Time 0.668 (0.513)	Data 0.001 (0.011)	Loss 5.0450 (4.9624)	Top-1 acc 10.547 (14.127)	Top-5 acc 29.688 (32.159)	lr 0.03658
Warmup Train [14][2820/3239]	Time 0.540 (0.513)	Data 0.001 (0.011)	Loss 4.9229 (4.9621)	Top-1 acc 16.016 (14.130)	Top-5 acc 32.812 (32.164)	lr 0.03658
Warmup Train [14][2830/3239]	Time 0.520 (0.513)	Data 0.001 (0.011)	Loss 4.9096 (4.9621)	Top-1 acc 15.234 (14.131)	Top-5 acc 33.594 (32.166)	lr 0.03657
Warmup Train [14][2840/3239]	Time 0.490 (0.513)	Data 0.001 (0.011)	Loss 4.8877 (4.9618)	Top-1 acc 14.844 (14.135)	Top-5 acc 35.547 (32.174)	lr 0.03657
Warmup Train [14][2850/3239]	Time 0.524 (0.513)	Data 0.001 (0.011)	Loss 4.7769 (4.9615)	Top-1 acc 19.531 (14.140)	Top-5 acc 39.453 (32.178)	lr 0.03656
Warmup Train [14][2860/3239]	Time 0.377 (0.513)	Data 0.001 (0.011)	Loss 4.9136 (4.9614)	Top-1 acc 14.844 (14.140)	Top-5 acc 32.031 (32.182)	lr 0.03655
Warmup Train [14][2870/3239]	Time 0.600 (0.513)	Data 0.001 (0.011)	Loss 4.9493 (4.9613)	Top-1 acc 14.453 (14.141)	Top-5 acc 31.641 (32.185)	lr 0.03655
Warmup Train [14][2880/3239]	Time 0.418 (0.513)	Data 0.001 (0.011)	Loss 4.9647 (4.9610)	Top-1 acc 16.797 (14.146)	Top-5 acc 34.375 (32.190)	lr 0.03654
Warmup Train [14][2890/3239]	Time 0.455 (0.513)	Data 0.001 (0.011)	Loss 4.9361 (4.9608)	Top-1 acc 12.109 (14.154)	Top-5 acc 26.953 (32.196)	lr 0.03654
Warmup Train [14][2900/3239]	Time 0.485 (0.513)	Data 0.001 (0.011)	Loss 5.0061 (4.9608)	Top-1 acc 16.016 (14.156)	Top-5 acc 36.719 (32.197)	lr 0.03653
Warmup Train [14][2910/3239]	Time 0.427 (0.513)	Data 0.001 (0.011)	Loss 4.9444 (4.9606)	Top-1 acc 12.500 (14.161)	Top-5 acc 32.031 (32.204)	lr 0.03653
Warmup Train [14][2920/3239]	Time 0.583 (0.513)	Data 0.001 (0.011)	Loss 5.0675 (4.9605)	Top-1 acc 12.109 (14.166)	Top-5 acc 32.812 (32.207)	lr 0.03652
Warmup Train [14][2930/3239]	Time 0.515 (0.513)	Data 0.001 (0.011)	Loss 4.8833 (4.9604)	Top-1 acc 16.016 (14.165)	Top-5 acc 34.375 (32.211)	lr 0.03652
Warmup Train [14][2940/3239]	Time 0.556 (0.513)	Data 0.001 (0.011)	Loss 4.7797 (4.9601)	Top-1 acc 12.500 (14.169)	Top-5 acc 35.156 (32.215)	lr 0.03651
Warmup Train [14][2950/3239]	Time 0.547 (0.513)	Data 0.001 (0.011)	Loss 4.9301 (4.9599)	Top-1 acc 15.625 (14.175)	Top-5 acc 28.125 (32.220)	lr 0.03651
Warmup Train [14][2960/3239]	Time 0.665 (0.513)	Data 0.001 (0.011)	Loss 4.7771 (4.9597)	Top-1 acc 20.312 (14.179)	Top-5 acc 37.891 (32.221)	lr 0.03650
Warmup Train [14][2970/3239]	Time 0.544 (0.513)	Data 0.001 (0.011)	Loss 5.1078 (4.9596)	Top-1 acc 13.672 (14.180)	Top-5 acc 28.125 (32.224)	lr 0.03650
Warmup Train [14][2980/3239]	Time 0.574 (0.513)	Data 0.001 (0.011)	Loss 4.9334 (4.9595)	Top-1 acc 14.453 (14.181)	Top-5 acc 31.641 (32.229)	lr 0.03649
Warmup Train [14][2990/3239]	Time 0.566 (0.513)	Data 0.001 (0.011)	Loss 5.0002 (4.9595)	Top-1 acc 12.891 (14.185)	Top-5 acc 30.078 (32.231)	lr 0.03648
Warmup Train [14][3000/3239]	Time 0.760 (0.513)	Data 0.002 (0.011)	Loss 4.8867 (4.9593)	Top-1 acc 17.188 (14.189)	Top-5 acc 34.766 (32.234)	lr 0.03648
Warmup Train [14][3010/3239]	Time 0.522 (0.513)	Data 0.001 (0.011)	Loss 4.9374 (4.9591)	Top-1 acc 14.062 (14.189)	Top-5 acc 31.641 (32.237)	lr 0.03647
Warmup Train [14][3020/3239]	Time 0.457 (0.513)	Data 0.001 (0.011)	Loss 4.9868 (4.9592)	Top-1 acc 13.672 (14.189)	Top-5 acc 30.859 (32.234)	lr 0.03647
Warmup Train [14][3030/3239]	Time 0.445 (0.513)	Data 0.001 (0.011)	Loss 4.8370 (4.9590)	Top-1 acc 16.797 (14.190)	Top-5 acc 36.719 (32.242)	lr 0.03646
Warmup Train [14][3040/3239]	Time 0.540 (0.513)	Data 0.001 (0.011)	Loss 5.0271 (4.9589)	Top-1 acc 13.281 (14.191)	Top-5 acc 28.906 (32.246)	lr 0.03646
Warmup Train [14][3050/3239]	Time 0.416 (0.513)	Data 0.001 (0.011)	Loss 5.0877 (4.9589)	Top-1 acc 11.328 (14.192)	Top-5 acc 32.422 (32.247)	lr 0.03645
Warmup Train [14][3060/3239]	Time 0.336 (0.513)	Data 0.001 (0.011)	Loss 4.8633 (4.9587)	Top-1 acc 14.062 (14.192)	Top-5 acc 34.375 (32.250)	lr 0.03645
Warmup Train [14][3070/3239]	Time 0.571 (0.513)	Data 0.001 (0.011)	Loss 5.0154 (4.9586)	Top-1 acc 10.547 (14.195)	Top-5 acc 32.812 (32.255)	lr 0.03644
Warmup Train [14][3080/3239]	Time 0.756 (0.512)	Data 0.002 (0.011)	Loss 4.8772 (4.9584)	Top-1 acc 14.844 (14.201)	Top-5 acc 34.375 (32.261)	lr 0.03644
Warmup Train [14][3090/3239]	Time 0.714 (0.512)	Data 0.001 (0.011)	Loss 5.0015 (4.9584)	Top-1 acc 16.797 (14.204)	Top-5 acc 33.203 (32.263)	lr 0.03643
Warmup Train [14][3100/3239]	Time 0.361 (0.512)	Data 0.001 (0.011)	Loss 4.9650 (4.9583)	Top-1 acc 13.672 (14.205)	Top-5 acc 33.594 (32.264)	lr 0.03643
Warmup Train [14][3110/3239]	Time 0.566 (0.512)	Data 0.001 (0.011)	Loss 5.1342 (4.9583)	Top-1 acc 13.672 (14.206)	Top-5 acc 26.172 (32.265)	lr 0.03642
Warmup Train [14][3120/3239]	Time 0.643 (0.512)	Data 0.001 (0.011)	Loss 4.8289 (4.9582)	Top-1 acc 19.922 (14.209)	Top-5 acc 32.422 (32.267)	lr 0.03641
Warmup Train [14][3130/3239]	Time 0.557 (0.512)	Data 0.001 (0.011)	Loss 4.9793 (4.9581)	Top-1 acc 15.234 (14.213)	Top-5 acc 32.812 (32.275)	lr 0.03641
Warmup Train [14][3140/3239]	Time 0.527 (0.512)	Data 0.001 (0.010)	Loss 4.8975 (4.9580)	Top-1 acc 16.406 (14.212)	Top-5 acc 36.719 (32.277)	lr 0.03640
Warmup Train [14][3150/3239]	Time 0.458 (0.512)	Data 0.001 (0.010)	Loss 4.9293 (4.9580)	Top-1 acc 16.406 (14.212)	Top-5 acc 33.594 (32.276)	lr 0.03640
Warmup Train [14][3160/3239]	Time 0.389 (0.512)	Data 0.001 (0.010)	Loss 4.7891 (4.9578)	Top-1 acc 16.797 (14.214)	Top-5 acc 33.203 (32.277)	lr 0.03639
Warmup Train [14][3170/3239]	Time 0.509 (0.512)	Data 0.001 (0.010)	Loss 5.0340 (4.9578)	Top-1 acc 13.672 (14.214)	Top-5 acc 28.516 (32.276)	lr 0.03639
Warmup Train [14][3180/3239]	Time 0.465 (0.512)	Data 0.000 (0.010)	Loss 4.9784 (4.9578)	Top-1 acc 15.625 (14.218)	Top-5 acc 30.859 (32.277)	lr 0.03638
Warmup Train [14][3190/3239]	Time 0.719 (0.512)	Data 0.000 (0.010)	Loss 4.8142 (4.9577)	Top-1 acc 17.969 (14.221)	Top-5 acc 35.547 (32.278)	lr 0.03638
Warmup Train [14][3200/3239]	Time 0.485 (0.512)	Data 0.000 (0.010)	Loss 4.9054 (4.9576)	Top-1 acc 17.578 (14.224)	Top-5 acc 30.859 (32.281)	lr 0.03637
Warmup Train [14][3210/3239]	Time 0.439 (0.512)	Data 0.000 (0.010)	Loss 4.9167 (4.9575)	Top-1 acc 12.891 (14.225)	Top-5 acc 34.375 (32.286)	lr 0.03637
Warmup Train [14][3220/3239]	Time 0.412 (0.512)	Data 0.000 (0.010)	Loss 4.8878 (4.9572)	Top-1 acc 14.844 (14.233)	Top-5 acc 33.984 (32.296)	lr 0.03636
Warmup Train [14][3230/3239]	Time 0.432 (0.512)	Data 0.000 (0.010)	Loss 4.8842 (4.9568)	Top-1 acc 13.672 (14.235)	Top-5 acc 33.984 (32.304)	lr 0.03636
Warmup Train [14][3239/3239]	Time 0.292 (0.512)	Data 0.000 (0.010)	Loss 5.0134 (4.9568)	Top-1 acc 12.346 (14.233)	Top-5 acc 32.099 (32.308)	lr 0.03635
==========Warmup Valid [14/40]	loss 4.077	top-1 acc 20.080	top-5 acc 42.074	Train top-1 14.233	top-5 32.308	flops: 442.4M
Warmup Train [15][0/3239]	Time 12.215 (12.215)	Data 10.686 (10.686)	Loss 4.9295 (4.9295)	Top-1 acc 16.016 (16.016)	Top-5 acc 32.422 (32.422)	lr 0.03635
Warmup Train [15][10/3239]	Time 0.458 (1.697)	Data 0.001 (1.048)	Loss 4.8861 (4.9283)	Top-1 acc 12.891 (15.021)	Top-5 acc 34.375 (32.884)	lr 0.03634
Warmup Train [15][20/3239]	Time 0.554 (1.134)	Data 0.001 (0.554)	Loss 4.8412 (4.9116)	Top-1 acc 16.016 (14.993)	Top-5 acc 32.422 (32.999)	lr 0.03634
Warmup Train [15][30/3239]	Time 0.488 (0.935)	Data 0.001 (0.377)	Loss 4.8047 (4.8990)	Top-1 acc 18.750 (15.360)	Top-5 acc 39.844 (33.430)	lr 0.03633
Warmup Train [15][40/3239]	Time 0.509 (0.832)	Data 0.001 (0.285)	Loss 4.8589 (4.8958)	Top-1 acc 15.625 (15.444)	Top-5 acc 34.766 (33.527)	lr 0.03633
Warmup Train [15][50/3239]	Time 0.552 (0.770)	Data 0.001 (0.230)	Loss 5.0570 (4.9007)	Top-1 acc 14.453 (15.418)	Top-5 acc 31.641 (33.678)	lr 0.03632
Warmup Train [15][60/3239]	Time 0.523 (0.732)	Data 0.001 (0.192)	Loss 4.9402 (4.8952)	Top-1 acc 12.891 (15.497)	Top-5 acc 31.641 (33.863)	lr 0.03632
Warmup Train [15][70/3239]	Time 0.451 (0.700)	Data 0.001 (0.166)	Loss 4.7186 (4.8991)	Top-1 acc 16.797 (15.427)	Top-5 acc 35.547 (33.775)	lr 0.03631
Warmup Train [15][80/3239]	Time 0.442 (0.672)	Data 0.001 (0.146)	Loss 4.8035 (4.8936)	Top-1 acc 18.750 (15.471)	Top-5 acc 33.203 (33.883)	lr 0.03631
Warmup Train [15][90/3239]	Time 0.712 (0.658)	Data 0.002 (0.132)	Loss 4.9056 (4.8956)	Top-1 acc 14.062 (15.346)	Top-5 acc 32.422 (33.804)	lr 0.03630
Warmup Train [15][100/3239]	Time 0.634 (0.645)	Data 0.001 (0.119)	Loss 4.8169 (4.8947)	Top-1 acc 17.188 (15.339)	Top-5 acc 35.547 (33.892)	lr 0.03630
Warmup Train [15][110/3239]	Time 0.594 (0.635)	Data 0.001 (0.108)	Loss 5.0192 (4.8944)	Top-1 acc 14.062 (15.227)	Top-5 acc 31.250 (33.752)	lr 0.03629
Warmup Train [15][120/3239]	Time 0.536 (0.623)	Data 0.001 (0.100)	Loss 4.9361 (4.8954)	Top-1 acc 14.453 (15.183)	Top-5 acc 30.859 (33.678)	lr 0.03628
Warmup Train [15][130/3239]	Time 0.536 (0.614)	Data 0.001 (0.092)	Loss 4.8902 (4.8942)	Top-1 acc 15.625 (15.246)	Top-5 acc 32.031 (33.737)	lr 0.03628
Warmup Train [15][140/3239]	Time 0.580 (0.610)	Data 0.001 (0.086)	Loss 4.8594 (4.8942)	Top-1 acc 15.234 (15.207)	Top-5 acc 32.812 (33.774)	lr 0.03627
Warmup Train [15][150/3239]	Time 0.542 (0.603)	Data 0.001 (0.081)	Loss 4.8399 (4.8917)	Top-1 acc 19.531 (15.242)	Top-5 acc 37.109 (33.824)	lr 0.03627
Warmup Train [15][160/3239]	Time 0.466 (0.598)	Data 0.001 (0.076)	Loss 4.8300 (4.8913)	Top-1 acc 18.359 (15.288)	Top-5 acc 33.594 (33.827)	lr 0.03626
Warmup Train [15][170/3239]	Time 0.627 (0.593)	Data 0.001 (0.072)	Loss 4.9460 (4.8911)	Top-1 acc 13.672 (15.319)	Top-5 acc 34.766 (33.847)	lr 0.03626
Warmup Train [15][180/3239]	Time 0.548 (0.590)	Data 0.001 (0.068)	Loss 5.0019 (4.8908)	Top-1 acc 15.625 (15.338)	Top-5 acc 33.594 (33.874)	lr 0.03625
Warmup Train [15][190/3239]	Time 0.670 (0.586)	Data 0.001 (0.064)	Loss 4.7827 (4.8884)	Top-1 acc 16.797 (15.357)	Top-5 acc 38.672 (33.911)	lr 0.03625
Warmup Train [15][200/3239]	Time 0.594 (0.582)	Data 0.001 (0.061)	Loss 4.8439 (4.8840)	Top-1 acc 17.188 (15.411)	Top-5 acc 35.547 (34.033)	lr 0.03624
Warmup Train [15][210/3239]	Time 0.468 (0.580)	Data 0.001 (0.059)	Loss 4.9026 (4.8844)	Top-1 acc 14.453 (15.379)	Top-5 acc 36.328 (34.031)	lr 0.03624
Warmup Train [15][220/3239]	Time 0.532 (0.575)	Data 0.001 (0.056)	Loss 4.8910 (4.8870)	Top-1 acc 12.500 (15.312)	Top-5 acc 34.375 (33.976)	lr 0.03623
Warmup Train [15][230/3239]	Time 0.525 (0.573)	Data 0.001 (0.054)	Loss 4.9531 (4.8903)	Top-1 acc 14.453 (15.260)	Top-5 acc 33.594 (33.893)	lr 0.03623
Warmup Train [15][240/3239]	Time 0.580 (0.569)	Data 0.001 (0.052)	Loss 4.9809 (4.8900)	Top-1 acc 14.844 (15.298)	Top-5 acc 34.375 (33.890)	lr 0.03622
Warmup Train [15][250/3239]	Time 0.527 (0.567)	Data 0.001 (0.050)	Loss 4.9575 (4.8906)	Top-1 acc 16.797 (15.304)	Top-5 acc 34.375 (33.899)	lr 0.03621
Warmup Train [15][260/3239]	Time 0.552 (0.563)	Data 0.001 (0.048)	Loss 4.7644 (4.8891)	Top-1 acc 17.188 (15.317)	Top-5 acc 36.328 (33.905)	lr 0.03621
Warmup Train [15][270/3239]	Time 0.387 (0.561)	Data 0.001 (0.046)	Loss 4.8580 (4.8888)	Top-1 acc 14.844 (15.324)	Top-5 acc 37.891 (33.922)	lr 0.03620
Warmup Train [15][280/3239]	Time 0.594 (0.559)	Data 0.001 (0.045)	Loss 4.9362 (4.8901)	Top-1 acc 14.453 (15.334)	Top-5 acc 33.984 (33.886)	lr 0.03620
Warmup Train [15][290/3239]	Time 0.610 (0.558)	Data 0.001 (0.044)	Loss 4.8196 (4.8899)	Top-1 acc 14.844 (15.338)	Top-5 acc 35.938 (33.928)	lr 0.03619
Warmup Train [15][300/3239]	Time 0.433 (0.556)	Data 0.001 (0.042)	Loss 4.8144 (4.8912)	Top-1 acc 16.797 (15.327)	Top-5 acc 34.375 (33.938)	lr 0.03619
Warmup Train [15][310/3239]	Time 0.388 (0.554)	Data 0.001 (0.041)	Loss 4.8499 (4.8945)	Top-1 acc 14.062 (15.272)	Top-5 acc 36.719 (33.839)	lr 0.03618
Warmup Train [15][320/3239]	Time 0.509 (0.553)	Data 0.001 (0.041)	Loss 4.7989 (4.8962)	Top-1 acc 17.188 (15.234)	Top-5 acc 38.672 (33.801)	lr 0.03618
Warmup Train [15][330/3239]	Time 0.591 (0.552)	Data 0.001 (0.039)	Loss 4.8707 (4.8971)	Top-1 acc 15.234 (15.221)	Top-5 acc 33.203 (33.778)	lr 0.03617
Warmup Train [15][340/3239]	Time 0.607 (0.551)	Data 0.001 (0.038)	Loss 4.9034 (4.8970)	Top-1 acc 16.797 (15.240)	Top-5 acc 35.156 (33.795)	lr 0.03617
Warmup Train [15][350/3239]	Time 0.604 (0.549)	Data 0.001 (0.037)	Loss 4.7815 (4.8965)	Top-1 acc 19.141 (15.240)	Top-5 acc 37.500 (33.804)	lr 0.03616
Warmup Train [15][360/3239]	Time 0.655 (0.548)	Data 0.001 (0.036)	Loss 4.9350 (4.8964)	Top-1 acc 16.406 (15.230)	Top-5 acc 35.547 (33.805)	lr 0.03615
Warmup Train [15][370/3239]	Time 0.516 (0.547)	Data 0.001 (0.035)	Loss 4.9346 (4.8961)	Top-1 acc 16.406 (15.242)	Top-5 acc 33.984 (33.825)	lr 0.03615
Warmup Train [15][380/3239]	Time 0.561 (0.547)	Data 0.001 (0.035)	Loss 4.8147 (4.8965)	Top-1 acc 14.453 (15.223)	Top-5 acc 35.156 (33.833)	lr 0.03614
Warmup Train [15][390/3239]	Time 0.504 (0.546)	Data 0.001 (0.034)	Loss 5.0009 (4.8966)	Top-1 acc 12.891 (15.237)	Top-5 acc 29.297 (33.832)	lr 0.03614
Warmup Train [15][400/3239]	Time 0.543 (0.545)	Data 0.001 (0.033)	Loss 4.7513 (4.8968)	Top-1 acc 16.406 (15.248)	Top-5 acc 38.281 (33.822)	lr 0.03613
Warmup Train [15][410/3239]	Time 0.372 (0.544)	Data 0.001 (0.033)	Loss 4.9060 (4.8973)	Top-1 acc 15.234 (15.229)	Top-5 acc 32.812 (33.816)	lr 0.03613
Warmup Train [15][420/3239]	Time 0.641 (0.544)	Data 0.001 (0.032)	Loss 4.8519 (4.8974)	Top-1 acc 16.016 (15.222)	Top-5 acc 36.719 (33.809)	lr 0.03612
Warmup Train [15][430/3239]	Time 0.687 (0.543)	Data 0.001 (0.032)	Loss 4.8345 (4.8969)	Top-1 acc 16.797 (15.232)	Top-5 acc 37.891 (33.830)	lr 0.03612
Warmup Train [15][440/3239]	Time 0.401 (0.542)	Data 0.001 (0.031)	Loss 4.8201 (4.8962)	Top-1 acc 17.578 (15.235)	Top-5 acc 35.156 (33.839)	lr 0.03611
Warmup Train [15][450/3239]	Time 0.409 (0.542)	Data 0.001 (0.030)	Loss 5.0049 (4.8952)	Top-1 acc 13.672 (15.282)	Top-5 acc 29.297 (33.879)	lr 0.03611
Warmup Train [15][460/3239]	Time 0.559 (0.541)	Data 0.001 (0.030)	Loss 4.8170 (4.8948)	Top-1 acc 13.281 (15.250)	Top-5 acc 33.594 (33.880)	lr 0.03610
Warmup Train [15][470/3239]	Time 0.465 (0.541)	Data 0.001 (0.029)	Loss 4.8884 (4.8945)	Top-1 acc 14.453 (15.268)	Top-5 acc 34.766 (33.899)	lr 0.03610
Warmup Train [15][480/3239]	Time 0.559 (0.541)	Data 0.001 (0.029)	Loss 4.8541 (4.8943)	Top-1 acc 14.844 (15.278)	Top-5 acc 32.812 (33.884)	lr 0.03609
Warmup Train [15][490/3239]	Time 0.291 (0.540)	Data 0.001 (0.028)	Loss 4.9680 (4.8944)	Top-1 acc 16.016 (15.277)	Top-5 acc 35.547 (33.898)	lr 0.03608
Warmup Train [15][500/3239]	Time 0.574 (0.539)	Data 0.001 (0.028)	Loss 4.8324 (4.8930)	Top-1 acc 15.234 (15.271)	Top-5 acc 37.109 (33.915)	lr 0.03608
Warmup Train [15][510/3239]	Time 0.176 (0.538)	Data 0.001 (0.028)	Loss 4.8377 (4.8933)	Top-1 acc 13.672 (15.251)	Top-5 acc 33.594 (33.900)	lr 0.03607
Warmup Train [15][520/3239]	Time 0.473 (0.537)	Data 0.001 (0.028)	Loss 4.8986 (4.8932)	Top-1 acc 14.453 (15.263)	Top-5 acc 35.938 (33.909)	lr 0.03607
Warmup Train [15][530/3239]	Time 0.532 (0.536)	Data 0.001 (0.027)	Loss 5.0029 (4.8929)	Top-1 acc 13.281 (15.265)	Top-5 acc 28.516 (33.912)	lr 0.03606
Warmup Train [15][540/3239]	Time 0.390 (0.535)	Data 0.001 (0.027)	Loss 4.8165 (4.8926)	Top-1 acc 17.188 (15.263)	Top-5 acc 35.938 (33.906)	lr 0.03606
Warmup Train [15][550/3239]	Time 0.354 (0.534)	Data 0.001 (0.026)	Loss 4.6374 (4.8914)	Top-1 acc 19.141 (15.284)	Top-5 acc 38.281 (33.918)	lr 0.03605
Warmup Train [15][560/3239]	Time 0.392 (0.533)	Data 0.001 (0.026)	Loss 5.0075 (4.8915)	Top-1 acc 14.062 (15.284)	Top-5 acc 30.469 (33.910)	lr 0.03605
Warmup Train [15][570/3239]	Time 0.452 (0.533)	Data 0.001 (0.026)	Loss 4.6999 (4.8906)	Top-1 acc 18.359 (15.306)	Top-5 acc 38.281 (33.933)	lr 0.03604
Warmup Train [15][580/3239]	Time 0.528 (0.532)	Data 0.001 (0.026)	Loss 4.9474 (4.8911)	Top-1 acc 15.234 (15.301)	Top-5 acc 33.203 (33.908)	lr 0.03604
Warmup Train [15][590/3239]	Time 0.479 (0.532)	Data 0.001 (0.025)	Loss 4.8865 (4.8912)	Top-1 acc 13.672 (15.289)	Top-5 acc 33.203 (33.901)	lr 0.03603
Warmup Train [15][600/3239]	Time 0.548 (0.532)	Data 0.001 (0.025)	Loss 4.8619 (4.8909)	Top-1 acc 15.234 (15.303)	Top-5 acc 37.500 (33.907)	lr 0.03602
Warmup Train [15][610/3239]	Time 0.543 (0.531)	Data 0.001 (0.025)	Loss 5.0977 (4.8910)	Top-1 acc 13.672 (15.292)	Top-5 acc 30.859 (33.906)	lr 0.03602
Warmup Train [15][620/3239]	Time 0.779 (0.531)	Data 0.001 (0.024)	Loss 4.8678 (4.8914)	Top-1 acc 11.719 (15.283)	Top-5 acc 33.203 (33.897)	lr 0.03601
Warmup Train [15][630/3239]	Time 0.657 (0.530)	Data 0.001 (0.024)	Loss 4.8740 (4.8916)	Top-1 acc 16.016 (15.277)	Top-5 acc 33.594 (33.909)	lr 0.03601
Warmup Train [15][640/3239]	Time 0.521 (0.530)	Data 0.001 (0.024)	Loss 4.9673 (4.8914)	Top-1 acc 14.453 (15.276)	Top-5 acc 32.031 (33.905)	lr 0.03600
Warmup Train [15][650/3239]	Time 0.558 (0.530)	Data 0.001 (0.023)	Loss 4.9312 (4.8905)	Top-1 acc 14.453 (15.290)	Top-5 acc 33.594 (33.941)	lr 0.03600
Warmup Train [15][660/3239]	Time 0.431 (0.529)	Data 0.001 (0.023)	Loss 4.9490 (4.8903)	Top-1 acc 16.016 (15.286)	Top-5 acc 33.203 (33.947)	lr 0.03599
Warmup Train [15][670/3239]	Time 0.461 (0.529)	Data 0.002 (0.023)	Loss 4.9073 (4.8906)	Top-1 acc 16.016 (15.288)	Top-5 acc 32.031 (33.946)	lr 0.03599
Warmup Train [15][680/3239]	Time 0.432 (0.529)	Data 0.001 (0.023)	Loss 4.8879 (4.8904)	Top-1 acc 14.062 (15.276)	Top-5 acc 35.547 (33.948)	lr 0.03598
Warmup Train [15][690/3239]	Time 0.428 (0.529)	Data 0.001 (0.022)	Loss 5.0018 (4.8909)	Top-1 acc 12.891 (15.263)	Top-5 acc 28.516 (33.925)	lr 0.03598
Warmup Train [15][700/3239]	Time 0.451 (0.528)	Data 0.001 (0.022)	Loss 4.8841 (4.8907)	Top-1 acc 12.891 (15.259)	Top-5 acc 35.156 (33.936)	lr 0.03597
Warmup Train [15][710/3239]	Time 0.490 (0.528)	Data 0.001 (0.022)	Loss 4.8338 (4.8903)	Top-1 acc 13.672 (15.259)	Top-5 acc 32.812 (33.929)	lr 0.03596
Warmup Train [15][720/3239]	Time 0.485 (0.528)	Data 0.001 (0.022)	Loss 5.0446 (4.8910)	Top-1 acc 8.594 (15.247)	Top-5 acc 27.734 (33.918)	lr 0.03596
Warmup Train [15][730/3239]	Time 0.598 (0.528)	Data 0.001 (0.022)	Loss 4.9456 (4.8914)	Top-1 acc 12.109 (15.239)	Top-5 acc 31.250 (33.907)	lr 0.03595
Warmup Train [15][740/3239]	Time 0.360 (0.527)	Data 0.001 (0.021)	Loss 4.9768 (4.8917)	Top-1 acc 12.109 (15.226)	Top-5 acc 29.688 (33.897)	lr 0.03595
Warmup Train [15][750/3239]	Time 0.558 (0.527)	Data 0.001 (0.021)	Loss 4.8698 (4.8918)	Top-1 acc 12.109 (15.220)	Top-5 acc 35.547 (33.896)	lr 0.03594
Warmup Train [15][760/3239]	Time 0.512 (0.527)	Data 0.001 (0.021)	Loss 4.8452 (4.8916)	Top-1 acc 16.016 (15.223)	Top-5 acc 31.641 (33.899)	lr 0.03594
Warmup Train [15][770/3239]	Time 0.423 (0.526)	Data 0.001 (0.021)	Loss 4.7130 (4.8916)	Top-1 acc 19.141 (15.223)	Top-5 acc 40.625 (33.911)	lr 0.03593
Warmup Train [15][780/3239]	Time 0.371 (0.525)	Data 0.001 (0.021)	Loss 4.9111 (4.8921)	Top-1 acc 16.406 (15.225)	Top-5 acc 32.422 (33.898)	lr 0.03593
Warmup Train [15][790/3239]	Time 0.539 (0.525)	Data 0.001 (0.020)	Loss 4.7987 (4.8923)	Top-1 acc 16.406 (15.211)	Top-5 acc 37.500 (33.890)	lr 0.03592
Warmup Train [15][800/3239]	Time 0.352 (0.524)	Data 0.001 (0.020)	Loss 4.7003 (4.8918)	Top-1 acc 16.406 (15.207)	Top-5 acc 35.938 (33.899)	lr 0.03592
Warmup Train [15][810/3239]	Time 0.454 (0.524)	Data 0.001 (0.020)	Loss 4.9594 (4.8922)	Top-1 acc 12.500 (15.193)	Top-5 acc 35.156 (33.892)	lr 0.03591
Warmup Train [15][820/3239]	Time 0.575 (0.523)	Data 0.001 (0.020)	Loss 4.9172 (4.8926)	Top-1 acc 15.234 (15.188)	Top-5 acc 31.641 (33.888)	lr 0.03590
Warmup Train [15][830/3239]	Time 0.664 (0.523)	Data 0.001 (0.020)	Loss 5.0465 (4.8918)	Top-1 acc 12.500 (15.209)	Top-5 acc 31.250 (33.912)	lr 0.03590
Warmup Train [15][840/3239]	Time 0.492 (0.523)	Data 0.001 (0.020)	Loss 5.0169 (4.8914)	Top-1 acc 12.891 (15.208)	Top-5 acc 32.031 (33.911)	lr 0.03589
Warmup Train [15][850/3239]	Time 0.504 (0.523)	Data 0.001 (0.019)	Loss 4.7884 (4.8905)	Top-1 acc 12.891 (15.222)	Top-5 acc 35.547 (33.931)	lr 0.03589
Warmup Train [15][860/3239]	Time 0.503 (0.522)	Data 0.001 (0.019)	Loss 5.1423 (4.8906)	Top-1 acc 12.891 (15.218)	Top-5 acc 30.469 (33.937)	lr 0.03588
Warmup Train [15][870/3239]	Time 0.606 (0.522)	Data 0.001 (0.019)	Loss 4.7054 (4.8903)	Top-1 acc 20.312 (15.228)	Top-5 acc 37.109 (33.941)	lr 0.03588
Warmup Train [15][880/3239]	Time 0.515 (0.522)	Data 0.001 (0.019)	Loss 4.9589 (4.8905)	Top-1 acc 15.234 (15.222)	Top-5 acc 35.547 (33.944)	lr 0.03587
Warmup Train [15][890/3239]	Time 0.403 (0.522)	Data 0.001 (0.019)	Loss 4.8579 (4.8902)	Top-1 acc 16.406 (15.223)	Top-5 acc 37.500 (33.941)	lr 0.03587
Warmup Train [15][900/3239]	Time 0.491 (0.521)	Data 0.001 (0.019)	Loss 4.7915 (4.8902)	Top-1 acc 19.922 (15.230)	Top-5 acc 38.672 (33.932)	lr 0.03586
Warmup Train [15][910/3239]	Time 0.553 (0.521)	Data 0.001 (0.019)	Loss 5.0349 (4.8900)	Top-1 acc 10.938 (15.236)	Top-5 acc 28.906 (33.926)	lr 0.03586
Warmup Train [15][920/3239]	Time 0.515 (0.521)	Data 0.001 (0.018)	Loss 4.8819 (4.8901)	Top-1 acc 16.797 (15.233)	Top-5 acc 31.250 (33.930)	lr 0.03585
Warmup Train [15][930/3239]	Time 0.567 (0.521)	Data 0.001 (0.018)	Loss 4.8081 (4.8905)	Top-1 acc 18.359 (15.233)	Top-5 acc 37.500 (33.926)	lr 0.03584
Warmup Train [15][940/3239]	Time 0.721 (0.521)	Data 0.001 (0.018)	Loss 4.8883 (4.8902)	Top-1 acc 14.062 (15.235)	Top-5 acc 32.812 (33.921)	lr 0.03584
Warmup Train [15][950/3239]	Time 0.775 (0.521)	Data 0.001 (0.018)	Loss 4.9854 (4.8898)	Top-1 acc 15.625 (15.246)	Top-5 acc 30.859 (33.922)	lr 0.03583
Warmup Train [15][960/3239]	Time 0.342 (0.521)	Data 0.001 (0.018)	Loss 4.7369 (4.8892)	Top-1 acc 17.969 (15.251)	Top-5 acc 38.672 (33.936)	lr 0.03583
Warmup Train [15][970/3239]	Time 0.315 (0.521)	Data 0.001 (0.018)	Loss 4.8239 (4.8892)	Top-1 acc 18.359 (15.255)	Top-5 acc 38.281 (33.938)	lr 0.03582
Warmup Train [15][980/3239]	Time 0.357 (0.520)	Data 0.001 (0.018)	Loss 5.0452 (4.8889)	Top-1 acc 15.234 (15.259)	Top-5 acc 30.859 (33.933)	lr 0.03582
Warmup Train [15][990/3239]	Time 0.544 (0.520)	Data 0.001 (0.018)	Loss 5.0600 (4.8891)	Top-1 acc 14.844 (15.261)	Top-5 acc 29.688 (33.925)	lr 0.03581
Warmup Train [15][1000/3239]	Time 0.617 (0.520)	Data 0.001 (0.018)	Loss 4.9225 (4.8889)	Top-1 acc 14.062 (15.275)	Top-5 acc 34.375 (33.929)	lr 0.03581
Warmup Train [15][1010/3239]	Time 0.462 (0.520)	Data 0.001 (0.018)	Loss 4.7805 (4.8888)	Top-1 acc 17.969 (15.271)	Top-5 acc 35.547 (33.923)	lr 0.03580
Warmup Train [15][1020/3239]	Time 0.395 (0.520)	Data 0.001 (0.017)	Loss 4.7570 (4.8888)	Top-1 acc 17.969 (15.272)	Top-5 acc 36.719 (33.930)	lr 0.03580
Warmup Train [15][1030/3239]	Time 0.527 (0.520)	Data 0.001 (0.017)	Loss 4.8714 (4.8889)	Top-1 acc 17.578 (15.273)	Top-5 acc 34.766 (33.933)	lr 0.03579
Warmup Train [15][1040/3239]	Time 0.500 (0.520)	Data 0.001 (0.017)	Loss 4.8691 (4.8890)	Top-1 acc 14.844 (15.270)	Top-5 acc 36.328 (33.930)	lr 0.03578
Warmup Train [15][1050/3239]	Time 0.323 (0.520)	Data 0.001 (0.017)	Loss 5.0807 (4.8893)	Top-1 acc 10.938 (15.264)	Top-5 acc 28.906 (33.923)	lr 0.03578
Warmup Train [15][1060/3239]	Time 0.533 (0.519)	Data 0.001 (0.017)	Loss 4.8028 (4.8892)	Top-1 acc 18.750 (15.269)	Top-5 acc 37.891 (33.927)	lr 0.03577
Warmup Train [15][1070/3239]	Time 0.491 (0.519)	Data 0.001 (0.017)	Loss 4.9225 (4.8890)	Top-1 acc 14.844 (15.277)	Top-5 acc 33.203 (33.939)	lr 0.03577
Warmup Train [15][1080/3239]	Time 0.416 (0.519)	Data 0.002 (0.017)	Loss 4.9763 (4.8894)	Top-1 acc 13.672 (15.272)	Top-5 acc 30.078 (33.932)	lr 0.03576
Warmup Train [15][1090/3239]	Time 0.462 (0.519)	Data 0.001 (0.017)	Loss 5.0388 (4.8898)	Top-1 acc 12.109 (15.278)	Top-5 acc 29.688 (33.924)	lr 0.03576
Warmup Train [15][1100/3239]	Time 0.255 (0.518)	Data 0.001 (0.017)	Loss 4.9598 (4.8894)	Top-1 acc 14.062 (15.283)	Top-5 acc 31.641 (33.927)	lr 0.03575
Warmup Train [15][1110/3239]	Time 0.484 (0.518)	Data 0.001 (0.017)	Loss 5.0080 (4.8896)	Top-1 acc 12.891 (15.275)	Top-5 acc 32.031 (33.920)	lr 0.03575
Warmup Train [15][1120/3239]	Time 0.521 (0.518)	Data 0.001 (0.017)	Loss 4.9198 (4.8902)	Top-1 acc 14.844 (15.270)	Top-5 acc 36.719 (33.913)	lr 0.03574
Warmup Train [15][1130/3239]	Time 0.532 (0.518)	Data 0.001 (0.017)	Loss 4.8338 (4.8903)	Top-1 acc 15.625 (15.267)	Top-5 acc 34.766 (33.918)	lr 0.03574
Warmup Train [15][1140/3239]	Time 0.449 (0.518)	Data 0.001 (0.017)	Loss 4.9531 (4.8902)	Top-1 acc 16.406 (15.278)	Top-5 acc 35.938 (33.931)	lr 0.03573
Warmup Train [15][1150/3239]	Time 0.574 (0.518)	Data 0.001 (0.017)	Loss 4.9014 (4.8897)	Top-1 acc 14.844 (15.292)	Top-5 acc 33.594 (33.944)	lr 0.03572
Warmup Train [15][1160/3239]	Time 0.477 (0.518)	Data 0.001 (0.016)	Loss 4.9047 (4.8898)	Top-1 acc 13.672 (15.288)	Top-5 acc 33.594 (33.938)	lr 0.03572
Warmup Train [15][1170/3239]	Time 0.514 (0.518)	Data 0.001 (0.016)	Loss 4.8113 (4.8895)	Top-1 acc 14.453 (15.289)	Top-5 acc 33.203 (33.941)	lr 0.03571
Warmup Train [15][1180/3239]	Time 0.570 (0.518)	Data 0.001 (0.016)	Loss 5.0514 (4.8893)	Top-1 acc 13.281 (15.294)	Top-5 acc 30.859 (33.947)	lr 0.03571
Warmup Train [15][1190/3239]	Time 0.551 (0.518)	Data 0.001 (0.016)	Loss 4.9172 (4.8893)	Top-1 acc 15.234 (15.289)	Top-5 acc 30.078 (33.945)	lr 0.03570
Warmup Train [15][1200/3239]	Time 0.552 (0.517)	Data 0.001 (0.016)	Loss 4.8087 (4.8891)	Top-1 acc 13.281 (15.281)	Top-5 acc 34.766 (33.945)	lr 0.03570
Warmup Train [15][1210/3239]	Time 0.506 (0.517)	Data 0.001 (0.016)	Loss 4.7881 (4.8892)	Top-1 acc 15.625 (15.280)	Top-5 acc 35.547 (33.948)	lr 0.03569
Warmup Train [15][1220/3239]	Time 0.491 (0.518)	Data 0.001 (0.016)	Loss 4.8295 (4.8891)	Top-1 acc 15.625 (15.288)	Top-5 acc 34.766 (33.948)	lr 0.03569
Warmup Train [15][1230/3239]	Time 0.630 (0.518)	Data 0.001 (0.016)	Loss 4.6272 (4.8891)	Top-1 acc 19.141 (15.291)	Top-5 acc 39.844 (33.954)	lr 0.03568
Warmup Train [15][1240/3239]	Time 0.556 (0.517)	Data 0.001 (0.016)	Loss 4.8999 (4.8892)	Top-1 acc 15.625 (15.289)	Top-5 acc 35.938 (33.956)	lr 0.03568
Warmup Train [15][1250/3239]	Time 0.448 (0.517)	Data 0.001 (0.016)	Loss 4.8274 (4.8889)	Top-1 acc 13.281 (15.297)	Top-5 acc 33.984 (33.960)	lr 0.03567
Warmup Train [15][1260/3239]	Time 0.478 (0.517)	Data 0.001 (0.016)	Loss 4.8097 (4.8889)	Top-1 acc 17.188 (15.305)	Top-5 acc 36.719 (33.957)	lr 0.03566
Warmup Train [15][1270/3239]	Time 0.605 (0.517)	Data 0.001 (0.016)	Loss 4.8187 (4.8884)	Top-1 acc 16.016 (15.310)	Top-5 acc 33.984 (33.976)	lr 0.03566
Warmup Train [15][1280/3239]	Time 0.393 (0.517)	Data 0.001 (0.015)	Loss 5.0223 (4.8886)	Top-1 acc 16.016 (15.312)	Top-5 acc 28.125 (33.970)	lr 0.03565
Warmup Train [15][1290/3239]	Time 0.743 (0.517)	Data 0.001 (0.015)	Loss 4.8762 (4.8887)	Top-1 acc 16.406 (15.309)	Top-5 acc 37.109 (33.978)	lr 0.03565
Warmup Train [15][1300/3239]	Time 0.767 (0.517)	Data 0.001 (0.015)	Loss 4.8366 (4.8884)	Top-1 acc 17.578 (15.319)	Top-5 acc 34.375 (33.984)	lr 0.03564
Warmup Train [15][1310/3239]	Time 0.433 (0.517)	Data 0.001 (0.015)	Loss 5.0239 (4.8883)	Top-1 acc 12.500 (15.307)	Top-5 acc 31.641 (33.973)	lr 0.03564
Warmup Train [15][1320/3239]	Time 0.465 (0.517)	Data 0.001 (0.015)	Loss 4.7359 (4.8883)	Top-1 acc 17.578 (15.305)	Top-5 acc 36.328 (33.977)	lr 0.03563
Warmup Train [15][1330/3239]	Time 0.443 (0.517)	Data 0.001 (0.015)	Loss 4.8594 (4.8881)	Top-1 acc 14.844 (15.307)	Top-5 acc 35.547 (33.986)	lr 0.03563
Warmup Train [15][1340/3239]	Time 0.507 (0.517)	Data 0.001 (0.015)	Loss 4.9662 (4.8880)	Top-1 acc 10.156 (15.300)	Top-5 acc 30.469 (33.989)	lr 0.03562
Warmup Train [15][1350/3239]	Time 0.495 (0.516)	Data 0.001 (0.015)	Loss 5.1112 (4.8881)	Top-1 acc 14.453 (15.302)	Top-5 acc 28.125 (33.987)	lr 0.03561
Warmup Train [15][1360/3239]	Time 0.505 (0.516)	Data 0.001 (0.015)	Loss 5.0496 (4.8879)	Top-1 acc 16.016 (15.304)	Top-5 acc 32.031 (33.988)	lr 0.03561
Warmup Train [15][1370/3239]	Time 0.382 (0.516)	Data 0.001 (0.015)	Loss 4.7047 (4.8877)	Top-1 acc 17.578 (15.308)	Top-5 acc 39.453 (33.988)	lr 0.03560
Warmup Train [15][1380/3239]	Time 0.359 (0.516)	Data 0.001 (0.015)	Loss 4.8316 (4.8882)	Top-1 acc 15.234 (15.305)	Top-5 acc 34.766 (33.978)	lr 0.03560
Warmup Train [15][1390/3239]	Time 0.462 (0.515)	Data 0.001 (0.015)	Loss 4.7743 (4.8883)	Top-1 acc 16.016 (15.310)	Top-5 acc 33.984 (33.973)	lr 0.03559
Warmup Train [15][1400/3239]	Time 0.690 (0.516)	Data 0.003 (0.015)	Loss 4.8609 (4.8879)	Top-1 acc 15.625 (15.319)	Top-5 acc 33.203 (33.985)	lr 0.03559
Warmup Train [15][1410/3239]	Time 0.473 (0.516)	Data 0.002 (0.015)	Loss 4.7514 (4.8873)	Top-1 acc 19.141 (15.325)	Top-5 acc 35.156 (33.996)	lr 0.03558
Warmup Train [15][1420/3239]	Time 0.498 (0.515)	Data 0.001 (0.015)	Loss 4.7146 (4.8873)	Top-1 acc 17.969 (15.330)	Top-5 acc 39.453 (33.996)	lr 0.03558
Warmup Train [15][1430/3239]	Time 0.362 (0.515)	Data 0.001 (0.014)	Loss 4.9072 (4.8873)	Top-1 acc 13.672 (15.333)	Top-5 acc 32.031 (34.000)	lr 0.03557
Warmup Train [15][1440/3239]	Time 0.480 (0.515)	Data 0.001 (0.014)	Loss 4.9391 (4.8874)	Top-1 acc 14.062 (15.332)	Top-5 acc 33.203 (33.994)	lr 0.03557
Warmup Train [15][1450/3239]	Time 0.521 (0.515)	Data 0.001 (0.014)	Loss 5.0940 (4.8876)	Top-1 acc 9.766 (15.332)	Top-5 acc 28.125 (33.996)	lr 0.03556
Warmup Train [15][1460/3239]	Time 0.346 (0.515)	Data 0.002 (0.014)	Loss 4.9648 (4.8874)	Top-1 acc 12.109 (15.334)	Top-5 acc 33.203 (33.999)	lr 0.03555
Warmup Train [15][1470/3239]	Time 0.621 (0.515)	Data 0.001 (0.014)	Loss 4.9755 (4.8874)	Top-1 acc 13.672 (15.328)	Top-5 acc 32.422 (33.992)	lr 0.03555
Warmup Train [15][1480/3239]	Time 0.424 (0.515)	Data 0.001 (0.014)	Loss 4.9941 (4.8872)	Top-1 acc 10.156 (15.331)	Top-5 acc 30.469 (33.998)	lr 0.03554
Warmup Train [15][1490/3239]	Time 0.579 (0.515)	Data 0.001 (0.014)	Loss 4.9535 (4.8875)	Top-1 acc 13.672 (15.321)	Top-5 acc 32.422 (33.985)	lr 0.03554
Warmup Train [15][1500/3239]	Time 0.596 (0.515)	Data 0.001 (0.014)	Loss 5.1018 (4.8878)	Top-1 acc 12.500 (15.321)	Top-5 acc 28.516 (33.974)	lr 0.03553
Warmup Train [15][1510/3239]	Time 0.497 (0.515)	Data 0.001 (0.014)	Loss 4.7265 (4.8874)	Top-1 acc 19.531 (15.333)	Top-5 acc 39.844 (33.986)	lr 0.03553
Warmup Train [15][1520/3239]	Time 0.593 (0.515)	Data 0.001 (0.014)	Loss 4.9804 (4.8871)	Top-1 acc 11.719 (15.340)	Top-5 acc 32.031 (33.988)	lr 0.03552
Warmup Train [15][1530/3239]	Time 0.413 (0.515)	Data 0.001 (0.014)	Loss 4.8202 (4.8872)	Top-1 acc 18.359 (15.337)	Top-5 acc 35.547 (33.982)	lr 0.03552
Warmup Train [15][1540/3239]	Time 0.561 (0.515)	Data 0.001 (0.014)	Loss 4.9045 (4.8873)	Top-1 acc 13.672 (15.330)	Top-5 acc 35.156 (33.985)	lr 0.03551
Warmup Train [15][1550/3239]	Time 0.591 (0.515)	Data 0.002 (0.014)	Loss 4.9502 (4.8872)	Top-1 acc 15.625 (15.332)	Top-5 acc 33.203 (33.995)	lr 0.03551
Warmup Train [15][1560/3239]	Time 0.530 (0.515)	Data 0.001 (0.014)	Loss 4.8318 (4.8870)	Top-1 acc 14.844 (15.333)	Top-5 acc 34.766 (33.997)	lr 0.03550
Warmup Train [15][1570/3239]	Time 0.507 (0.515)	Data 0.001 (0.014)	Loss 4.7145 (4.8872)	Top-1 acc 14.453 (15.324)	Top-5 acc 38.281 (33.992)	lr 0.03549
Warmup Train [15][1580/3239]	Time 0.340 (0.515)	Data 0.001 (0.014)	Loss 4.7456 (4.8869)	Top-1 acc 17.188 (15.325)	Top-5 acc 36.328 (33.999)	lr 0.03549
Warmup Train [15][1590/3239]	Time 0.343 (0.515)	Data 0.001 (0.014)	Loss 4.9054 (4.8871)	Top-1 acc 15.625 (15.327)	Top-5 acc 32.422 (33.996)	lr 0.03548
Warmup Train [15][1600/3239]	Time 0.495 (0.515)	Data 0.001 (0.014)	Loss 4.7360 (4.8867)	Top-1 acc 17.969 (15.331)	Top-5 acc 40.234 (34.007)	lr 0.03548
Warmup Train [15][1610/3239]	Time 0.511 (0.515)	Data 0.001 (0.014)	Loss 5.0353 (4.8868)	Top-1 acc 12.109 (15.329)	Top-5 acc 31.641 (34.003)	lr 0.03547
Warmup Train [15][1620/3239]	Time 0.692 (0.515)	Data 0.001 (0.014)	Loss 4.7271 (4.8866)	Top-1 acc 18.750 (15.328)	Top-5 acc 38.281 (34.006)	lr 0.03547
Warmup Train [15][1630/3239]	Time 0.653 (0.515)	Data 0.001 (0.014)	Loss 4.6074 (4.8861)	Top-1 acc 26.172 (15.344)	Top-5 acc 41.406 (34.022)	lr 0.03546
Warmup Train [15][1640/3239]	Time 0.596 (0.514)	Data 0.001 (0.013)	Loss 4.8640 (4.8861)	Top-1 acc 16.406 (15.346)	Top-5 acc 34.375 (34.024)	lr 0.03546
Warmup Train [15][1650/3239]	Time 0.532 (0.514)	Data 0.001 (0.013)	Loss 4.9228 (4.8860)	Top-1 acc 16.016 (15.353)	Top-5 acc 30.078 (34.023)	lr 0.03545
Warmup Train [15][1660/3239]	Time 0.180 (0.514)	Data 0.001 (0.013)	Loss 4.9088 (4.8862)	Top-1 acc 16.406 (15.354)	Top-5 acc 34.766 (34.020)	lr 0.03544
Warmup Train [15][1670/3239]	Time 0.505 (0.514)	Data 0.001 (0.013)	Loss 4.8309 (4.8862)	Top-1 acc 16.406 (15.359)	Top-5 acc 33.984 (34.024)	lr 0.03544
Warmup Train [15][1680/3239]	Time 0.591 (0.514)	Data 0.001 (0.013)	Loss 4.9932 (4.8864)	Top-1 acc 13.672 (15.353)	Top-5 acc 34.766 (34.020)	lr 0.03543
Warmup Train [15][1690/3239]	Time 0.405 (0.513)	Data 0.003 (0.013)	Loss 4.7182 (4.8864)	Top-1 acc 19.922 (15.353)	Top-5 acc 36.328 (34.018)	lr 0.03543
Warmup Train [15][1700/3239]	Time 0.494 (0.513)	Data 0.001 (0.013)	Loss 4.7968 (4.8861)	Top-1 acc 18.750 (15.366)	Top-5 acc 37.500 (34.028)	lr 0.03542
Warmup Train [15][1710/3239]	Time 0.328 (0.513)	Data 0.001 (0.013)	Loss 5.0591 (4.8859)	Top-1 acc 15.625 (15.368)	Top-5 acc 28.516 (34.026)	lr 0.03542
Warmup Train [15][1720/3239]	Time 0.361 (0.513)	Data 0.001 (0.013)	Loss 4.7781 (4.8859)	Top-1 acc 14.844 (15.366)	Top-5 acc 37.109 (34.027)	lr 0.03541
Warmup Train [15][1730/3239]	Time 0.477 (0.513)	Data 0.001 (0.013)	Loss 4.8234 (4.8859)	Top-1 acc 16.016 (15.364)	Top-5 acc 36.719 (34.026)	lr 0.03541
Warmup Train [15][1740/3239]	Time 0.453 (0.513)	Data 0.001 (0.013)	Loss 5.0654 (4.8861)	Top-1 acc 10.156 (15.360)	Top-5 acc 30.469 (34.028)	lr 0.03540
Warmup Train [15][1750/3239]	Time 0.407 (0.513)	Data 0.001 (0.013)	Loss 4.8608 (4.8860)	Top-1 acc 14.453 (15.359)	Top-5 acc 31.641 (34.034)	lr 0.03539
Warmup Train [15][1760/3239]	Time 0.716 (0.513)	Data 0.001 (0.013)	Loss 4.8204 (4.8856)	Top-1 acc 18.750 (15.371)	Top-5 acc 32.031 (34.038)	lr 0.03539
Warmup Train [15][1770/3239]	Time 0.515 (0.513)	Data 0.001 (0.013)	Loss 4.8660 (4.8853)	Top-1 acc 13.672 (15.371)	Top-5 acc 32.031 (34.037)	lr 0.03538
Warmup Train [15][1780/3239]	Time 0.587 (0.513)	Data 0.001 (0.013)	Loss 4.7580 (4.8851)	Top-1 acc 21.875 (15.383)	Top-5 acc 41.016 (34.041)	lr 0.03538
Warmup Train [15][1790/3239]	Time 0.539 (0.513)	Data 0.001 (0.013)	Loss 5.0617 (4.8850)	Top-1 acc 15.234 (15.383)	Top-5 acc 28.125 (34.035)	lr 0.03537
Warmup Train [15][1800/3239]	Time 0.514 (0.513)	Data 0.001 (0.013)	Loss 4.8266 (4.8849)	Top-1 acc 14.453 (15.383)	Top-5 acc 34.375 (34.038)	lr 0.03537
Warmup Train [15][1810/3239]	Time 0.510 (0.513)	Data 0.001 (0.013)	Loss 4.7964 (4.8848)	Top-1 acc 16.406 (15.383)	Top-5 acc 36.328 (34.041)	lr 0.03536
Warmup Train [15][1820/3239]	Time 0.524 (0.513)	Data 0.001 (0.013)	Loss 5.0609 (4.8850)	Top-1 acc 12.109 (15.380)	Top-5 acc 26.953 (34.035)	lr 0.03536
Warmup Train [15][1830/3239]	Time 0.421 (0.513)	Data 0.001 (0.013)	Loss 4.8938 (4.8849)	Top-1 acc 14.062 (15.384)	Top-5 acc 34.375 (34.041)	lr 0.03535
Warmup Train [15][1840/3239]	Time 0.394 (0.513)	Data 0.001 (0.013)	Loss 4.6549 (4.8846)	Top-1 acc 20.312 (15.391)	Top-5 acc 39.062 (34.048)	lr 0.03535
Warmup Train [15][1850/3239]	Time 0.358 (0.513)	Data 0.001 (0.013)	Loss 4.9478 (4.8847)	Top-1 acc 13.672 (15.392)	Top-5 acc 34.766 (34.046)	lr 0.03534
Warmup Train [15][1860/3239]	Time 0.673 (0.513)	Data 0.001 (0.013)	Loss 4.9095 (4.8845)	Top-1 acc 12.500 (15.390)	Top-5 acc 32.031 (34.053)	lr 0.03533
Warmup Train [15][1870/3239]	Time 0.473 (0.513)	Data 0.001 (0.013)	Loss 4.9642 (4.8845)	Top-1 acc 15.625 (15.395)	Top-5 acc 33.203 (34.054)	lr 0.03533
Warmup Train [15][1880/3239]	Time 0.331 (0.513)	Data 0.001 (0.013)	Loss 4.7288 (4.8844)	Top-1 acc 15.234 (15.391)	Top-5 acc 39.844 (34.056)	lr 0.03532
Warmup Train [15][1890/3239]	Time 0.492 (0.513)	Data 0.001 (0.013)	Loss 4.7887 (4.8842)	Top-1 acc 15.234 (15.392)	Top-5 acc 34.766 (34.063)	lr 0.03532
Warmup Train [15][1900/3239]	Time 0.548 (0.513)	Data 0.001 (0.013)	Loss 4.7823 (4.8840)	Top-1 acc 14.844 (15.391)	Top-5 acc 38.281 (34.063)	lr 0.03531
Warmup Train [15][1910/3239]	Time 0.404 (0.513)	Data 0.001 (0.013)	Loss 4.8000 (4.8838)	Top-1 acc 16.016 (15.393)	Top-5 acc 37.500 (34.070)	lr 0.03531
Warmup Train [15][1920/3239]	Time 0.490 (0.513)	Data 0.001 (0.013)	Loss 4.8056 (4.8839)	Top-1 acc 17.969 (15.391)	Top-5 acc 35.938 (34.062)	lr 0.03530
Warmup Train [15][1930/3239]	Time 0.487 (0.513)	Data 0.001 (0.013)	Loss 4.8012 (4.8839)	Top-1 acc 16.797 (15.391)	Top-5 acc 34.375 (34.063)	lr 0.03530
Warmup Train [15][1940/3239]	Time 0.350 (0.513)	Data 0.001 (0.013)	Loss 4.9870 (4.8836)	Top-1 acc 13.281 (15.394)	Top-5 acc 31.250 (34.073)	lr 0.03529
Warmup Train [15][1950/3239]	Time 0.541 (0.513)	Data 0.001 (0.013)	Loss 5.0424 (4.8834)	Top-1 acc 10.938 (15.396)	Top-5 acc 27.734 (34.075)	lr 0.03528
Warmup Train [15][1960/3239]	Time 0.590 (0.513)	Data 0.001 (0.013)	Loss 4.7626 (4.8828)	Top-1 acc 16.406 (15.406)	Top-5 acc 37.891 (34.092)	lr 0.03528
Warmup Train [15][1970/3239]	Time 0.496 (0.513)	Data 0.001 (0.013)	Loss 4.8797 (4.8826)	Top-1 acc 17.578 (15.410)	Top-5 acc 37.109 (34.098)	lr 0.03527
Warmup Train [15][1980/3239]	Time 0.545 (0.513)	Data 0.001 (0.013)	Loss 4.8350 (4.8824)	Top-1 acc 16.406 (15.414)	Top-5 acc 33.594 (34.102)	lr 0.03527
Warmup Train [15][1990/3239]	Time 0.457 (0.513)	Data 0.001 (0.012)	Loss 5.1471 (4.8825)	Top-1 acc 12.109 (15.417)	Top-5 acc 29.297 (34.096)	lr 0.03526
Warmup Train [15][2000/3239]	Time 0.390 (0.513)	Data 0.001 (0.012)	Loss 4.9802 (4.8824)	Top-1 acc 16.016 (15.417)	Top-5 acc 33.594 (34.100)	lr 0.03526
Warmup Train [15][2010/3239]	Time 0.593 (0.513)	Data 0.001 (0.012)	Loss 4.9855 (4.8822)	Top-1 acc 11.328 (15.416)	Top-5 acc 29.297 (34.105)	lr 0.03525
Warmup Train [15][2020/3239]	Time 0.608 (0.513)	Data 0.001 (0.012)	Loss 4.7272 (4.8819)	Top-1 acc 18.359 (15.417)	Top-5 acc 37.891 (34.115)	lr 0.03525
Warmup Train [15][2030/3239]	Time 0.453 (0.513)	Data 0.001 (0.012)	Loss 4.9041 (4.8822)	Top-1 acc 14.844 (15.412)	Top-5 acc 34.375 (34.111)	lr 0.03524
Warmup Train [15][2040/3239]	Time 0.632 (0.513)	Data 0.001 (0.012)	Loss 4.9024 (4.8821)	Top-1 acc 11.719 (15.408)	Top-5 acc 34.375 (34.109)	lr 0.03523
Warmup Train [15][2050/3239]	Time 0.549 (0.513)	Data 0.001 (0.012)	Loss 4.9038 (4.8816)	Top-1 acc 12.500 (15.411)	Top-5 acc 31.250 (34.124)	lr 0.03523
Warmup Train [15][2060/3239]	Time 0.607 (0.513)	Data 0.001 (0.012)	Loss 4.9813 (4.8814)	Top-1 acc 14.453 (15.412)	Top-5 acc 30.078 (34.127)	lr 0.03522
Warmup Train [15][2070/3239]	Time 0.522 (0.513)	Data 0.001 (0.012)	Loss 4.9662 (4.8812)	Top-1 acc 12.891 (15.410)	Top-5 acc 33.594 (34.133)	lr 0.03522
Warmup Train [15][2080/3239]	Time 0.525 (0.513)	Data 0.001 (0.012)	Loss 4.8205 (4.8809)	Top-1 acc 16.016 (15.409)	Top-5 acc 33.203 (34.135)	lr 0.03521
Warmup Train [15][2090/3239]	Time 0.523 (0.513)	Data 0.001 (0.012)	Loss 4.9939 (4.8810)	Top-1 acc 10.938 (15.412)	Top-5 acc 32.031 (34.135)	lr 0.03521
Warmup Train [15][2100/3239]	Time 0.444 (0.513)	Data 0.001 (0.012)	Loss 4.9213 (4.8809)	Top-1 acc 14.453 (15.415)	Top-5 acc 28.125 (34.136)	lr 0.03520
Warmup Train [15][2110/3239]	Time 0.616 (0.513)	Data 0.001 (0.012)	Loss 4.8199 (4.8808)	Top-1 acc 14.062 (15.415)	Top-5 acc 34.375 (34.139)	lr 0.03520
Warmup Train [15][2120/3239]	Time 0.634 (0.513)	Data 0.001 (0.012)	Loss 5.0019 (4.8807)	Top-1 acc 11.328 (15.420)	Top-5 acc 31.250 (34.143)	lr 0.03519
Warmup Train [15][2130/3239]	Time 0.522 (0.513)	Data 0.001 (0.012)	Loss 4.8156 (4.8805)	Top-1 acc 14.844 (15.422)	Top-5 acc 34.766 (34.146)	lr 0.03519
Warmup Train [15][2140/3239]	Time 0.503 (0.513)	Data 0.001 (0.012)	Loss 4.8718 (4.8803)	Top-1 acc 17.188 (15.425)	Top-5 acc 33.984 (34.151)	lr 0.03518
Warmup Train [15][2150/3239]	Time 0.463 (0.513)	Data 0.001 (0.012)	Loss 4.9865 (4.8802)	Top-1 acc 13.281 (15.425)	Top-5 acc 32.031 (34.157)	lr 0.03517
Warmup Train [15][2160/3239]	Time 0.556 (0.513)	Data 0.001 (0.012)	Loss 4.8934 (4.8800)	Top-1 acc 16.797 (15.429)	Top-5 acc 33.203 (34.157)	lr 0.03517
Warmup Train [15][2170/3239]	Time 0.316 (0.513)	Data 0.001 (0.012)	Loss 4.8517 (4.8798)	Top-1 acc 14.453 (15.429)	Top-5 acc 33.203 (34.162)	lr 0.03516
Warmup Train [15][2180/3239]	Time 0.498 (0.513)	Data 0.001 (0.012)	Loss 5.0227 (4.8797)	Top-1 acc 14.062 (15.427)	Top-5 acc 28.906 (34.162)	lr 0.03516
Warmup Train [15][2190/3239]	Time 0.602 (0.513)	Data 0.001 (0.012)	Loss 4.9495 (4.8798)	Top-1 acc 14.062 (15.431)	Top-5 acc 34.375 (34.165)	lr 0.03515
Warmup Train [15][2200/3239]	Time 0.242 (0.512)	Data 0.001 (0.012)	Loss 4.8758 (4.8798)	Top-1 acc 13.281 (15.430)	Top-5 acc 33.203 (34.160)	lr 0.03515
Warmup Train [15][2210/3239]	Time 0.395 (0.512)	Data 0.001 (0.012)	Loss 4.7638 (4.8796)	Top-1 acc 18.750 (15.435)	Top-5 acc 40.625 (34.164)	lr 0.03514
Warmup Train [15][2220/3239]	Time 0.486 (0.512)	Data 0.001 (0.012)	Loss 4.9572 (4.8798)	Top-1 acc 16.016 (15.436)	Top-5 acc 32.812 (34.159)	lr 0.03514
Warmup Train [15][2230/3239]	Time 0.430 (0.512)	Data 0.001 (0.012)	Loss 4.9319 (4.8797)	Top-1 acc 15.234 (15.440)	Top-5 acc 30.859 (34.163)	lr 0.03513
Warmup Train [15][2240/3239]	Time 0.622 (0.512)	Data 0.001 (0.012)	Loss 5.0369 (4.8797)	Top-1 acc 14.453 (15.438)	Top-5 acc 30.859 (34.161)	lr 0.03512
Warmup Train [15][2250/3239]	Time 0.348 (0.512)	Data 0.001 (0.012)	Loss 4.7825 (4.8794)	Top-1 acc 12.891 (15.439)	Top-5 acc 33.203 (34.170)	lr 0.03512
Warmup Train [15][2260/3239]	Time 0.665 (0.512)	Data 0.001 (0.012)	Loss 4.8189 (4.8793)	Top-1 acc 18.359 (15.440)	Top-5 acc 39.453 (34.171)	lr 0.03511
Warmup Train [15][2270/3239]	Time 0.551 (0.512)	Data 0.001 (0.012)	Loss 4.9412 (4.8793)	Top-1 acc 17.188 (15.443)	Top-5 acc 34.766 (34.179)	lr 0.03511
Warmup Train [15][2280/3239]	Time 0.470 (0.512)	Data 0.001 (0.012)	Loss 4.9627 (4.8794)	Top-1 acc 16.016 (15.442)	Top-5 acc 31.250 (34.177)	lr 0.03510
Warmup Train [15][2290/3239]	Time 0.341 (0.512)	Data 0.001 (0.012)	Loss 4.9632 (4.8796)	Top-1 acc 13.672 (15.437)	Top-5 acc 31.250 (34.167)	lr 0.03510
Warmup Train [15][2300/3239]	Time 0.529 (0.512)	Data 0.001 (0.012)	Loss 4.7971 (4.8794)	Top-1 acc 16.016 (15.442)	Top-5 acc 38.281 (34.173)	lr 0.03509
Warmup Train [15][2310/3239]	Time 0.543 (0.512)	Data 0.001 (0.012)	Loss 4.7451 (4.8790)	Top-1 acc 13.281 (15.450)	Top-5 acc 32.812 (34.183)	lr 0.03509
Warmup Train [15][2320/3239]	Time 0.425 (0.512)	Data 0.001 (0.012)	Loss 4.9540 (4.8790)	Top-1 acc 15.625 (15.453)	Top-5 acc 33.594 (34.183)	lr 0.03508
Warmup Train [15][2330/3239]	Time 0.430 (0.512)	Data 0.001 (0.012)	Loss 4.8656 (4.8788)	Top-1 acc 17.969 (15.456)	Top-5 acc 35.938 (34.187)	lr 0.03507
Warmup Train [15][2340/3239]	Time 0.454 (0.512)	Data 0.001 (0.012)	Loss 5.0195 (4.8786)	Top-1 acc 16.797 (15.458)	Top-5 acc 32.031 (34.191)	lr 0.03507
Warmup Train [15][2350/3239]	Time 0.684 (0.512)	Data 0.001 (0.012)	Loss 4.8747 (4.8786)	Top-1 acc 14.844 (15.458)	Top-5 acc 32.031 (34.190)	lr 0.03506
Warmup Train [15][2360/3239]	Time 0.521 (0.512)	Data 0.001 (0.012)	Loss 4.7191 (4.8784)	Top-1 acc 17.188 (15.459)	Top-5 acc 38.281 (34.190)	lr 0.03506
Warmup Train [15][2370/3239]	Time 0.623 (0.512)	Data 0.002 (0.012)	Loss 4.8595 (4.8782)	Top-1 acc 14.453 (15.461)	Top-5 acc 34.375 (34.197)	lr 0.03505
Warmup Train [15][2380/3239]	Time 0.541 (0.512)	Data 0.001 (0.011)	Loss 4.8285 (4.8781)	Top-1 acc 17.969 (15.460)	Top-5 acc 33.203 (34.196)	lr 0.03505
Warmup Train [15][2390/3239]	Time 0.507 (0.512)	Data 0.001 (0.011)	Loss 4.9535 (4.8781)	Top-1 acc 12.500 (15.460)	Top-5 acc 32.812 (34.198)	lr 0.03504
Warmup Train [15][2400/3239]	Time 0.506 (0.512)	Data 0.001 (0.011)	Loss 4.8265 (4.8777)	Top-1 acc 19.922 (15.464)	Top-5 acc 34.766 (34.208)	lr 0.03504
Warmup Train [15][2410/3239]	Time 0.536 (0.512)	Data 0.001 (0.011)	Loss 4.9086 (4.8775)	Top-1 acc 12.500 (15.466)	Top-5 acc 31.250 (34.214)	lr 0.03503
Warmup Train [15][2420/3239]	Time 0.504 (0.512)	Data 0.001 (0.011)	Loss 4.9814 (4.8772)	Top-1 acc 16.797 (15.476)	Top-5 acc 35.156 (34.228)	lr 0.03502
Warmup Train [15][2430/3239]	Time 0.401 (0.512)	Data 0.001 (0.011)	Loss 4.8085 (4.8771)	Top-1 acc 16.797 (15.476)	Top-5 acc 35.547 (34.233)	lr 0.03502
Warmup Train [15][2440/3239]	Time 0.552 (0.512)	Data 0.001 (0.011)	Loss 4.9764 (4.8769)	Top-1 acc 15.625 (15.478)	Top-5 acc 35.547 (34.235)	lr 0.03501
Warmup Train [15][2450/3239]	Time 0.474 (0.512)	Data 0.001 (0.011)	Loss 4.6963 (4.8766)	Top-1 acc 18.750 (15.482)	Top-5 acc 38.672 (34.237)	lr 0.03501
Warmup Train [15][2460/3239]	Time 0.395 (0.512)	Data 0.001 (0.011)	Loss 4.7830 (4.8763)	Top-1 acc 15.625 (15.484)	Top-5 acc 37.500 (34.244)	lr 0.03500
Warmup Train [15][2470/3239]	Time 0.416 (0.512)	Data 0.001 (0.011)	Loss 4.6642 (4.8763)	Top-1 acc 19.141 (15.486)	Top-5 acc 34.766 (34.244)	lr 0.03500
Warmup Train [15][2480/3239]	Time 0.338 (0.512)	Data 0.001 (0.011)	Loss 4.7109 (4.8760)	Top-1 acc 16.016 (15.488)	Top-5 acc 40.234 (34.252)	lr 0.03499
Warmup Train [15][2490/3239]	Time 0.515 (0.512)	Data 0.001 (0.011)	Loss 4.8761 (4.8759)	Top-1 acc 19.922 (15.489)	Top-5 acc 37.109 (34.251)	lr 0.03499
Warmup Train [15][2500/3239]	Time 0.201 (0.512)	Data 0.002 (0.011)	Loss 4.8365 (4.8756)	Top-1 acc 14.453 (15.491)	Top-5 acc 33.594 (34.255)	lr 0.03498
Warmup Train [15][2510/3239]	Time 0.616 (0.512)	Data 0.001 (0.011)	Loss 4.8214 (4.8756)	Top-1 acc 17.969 (15.494)	Top-5 acc 35.156 (34.251)	lr 0.03497
Warmup Train [15][2520/3239]	Time 0.339 (0.512)	Data 0.001 (0.011)	Loss 4.9310 (4.8758)	Top-1 acc 12.500 (15.491)	Top-5 acc 30.469 (34.242)	lr 0.03497
Warmup Train [15][2530/3239]	Time 0.375 (0.512)	Data 0.001 (0.011)	Loss 4.9269 (4.8756)	Top-1 acc 16.016 (15.494)	Top-5 acc 33.203 (34.249)	lr 0.03496
Warmup Train [15][2540/3239]	Time 0.532 (0.512)	Data 0.001 (0.011)	Loss 4.7658 (4.8756)	Top-1 acc 14.844 (15.491)	Top-5 acc 37.500 (34.252)	lr 0.03496
Warmup Train [15][2550/3239]	Time 0.472 (0.512)	Data 0.001 (0.011)	Loss 5.0880 (4.8755)	Top-1 acc 12.109 (15.492)	Top-5 acc 28.125 (34.254)	lr 0.03495
Warmup Train [15][2560/3239]	Time 0.543 (0.512)	Data 0.001 (0.011)	Loss 4.8225 (4.8754)	Top-1 acc 17.188 (15.499)	Top-5 acc 37.109 (34.257)	lr 0.03495
Warmup Train [15][2570/3239]	Time 0.657 (0.512)	Data 0.001 (0.011)	Loss 4.9736 (4.8755)	Top-1 acc 17.188 (15.497)	Top-5 acc 33.984 (34.257)	lr 0.03494
Warmup Train [15][2580/3239]	Time 0.394 (0.511)	Data 0.001 (0.011)	Loss 4.8171 (4.8755)	Top-1 acc 16.406 (15.497)	Top-5 acc 35.547 (34.258)	lr 0.03494
Warmup Train [15][2590/3239]	Time 0.520 (0.512)	Data 0.001 (0.011)	Loss 4.9010 (4.8753)	Top-1 acc 13.672 (15.500)	Top-5 acc 32.812 (34.262)	lr 0.03493
Warmup Train [15][2600/3239]	Time 0.582 (0.512)	Data 0.001 (0.011)	Loss 4.7954 (4.8752)	Top-1 acc 17.969 (15.501)	Top-5 acc 37.500 (34.263)	lr 0.03492
Warmup Train [15][2610/3239]	Time 0.498 (0.512)	Data 0.001 (0.011)	Loss 4.9191 (4.8753)	Top-1 acc 17.188 (15.501)	Top-5 acc 29.688 (34.258)	lr 0.03492
Warmup Train [15][2620/3239]	Time 0.590 (0.512)	Data 0.001 (0.011)	Loss 4.6754 (4.8751)	Top-1 acc 21.094 (15.504)	Top-5 acc 39.453 (34.262)	lr 0.03491
Warmup Train [15][2630/3239]	Time 0.508 (0.512)	Data 0.001 (0.011)	Loss 4.7056 (4.8747)	Top-1 acc 15.625 (15.509)	Top-5 acc 39.062 (34.265)	lr 0.03491
Warmup Train [15][2640/3239]	Time 0.426 (0.511)	Data 0.001 (0.011)	Loss 4.9230 (4.8747)	Top-1 acc 15.234 (15.509)	Top-5 acc 33.594 (34.266)	lr 0.03490
Warmup Train [15][2650/3239]	Time 0.397 (0.511)	Data 0.001 (0.011)	Loss 4.8133 (4.8747)	Top-1 acc 16.797 (15.509)	Top-5 acc 35.938 (34.267)	lr 0.03490
Warmup Train [15][2660/3239]	Time 0.515 (0.512)	Data 0.001 (0.011)	Loss 4.8590 (4.8746)	Top-1 acc 17.188 (15.513)	Top-5 acc 33.203 (34.267)	lr 0.03489
Warmup Train [15][2670/3239]	Time 0.439 (0.512)	Data 0.001 (0.011)	Loss 4.7104 (4.8742)	Top-1 acc 12.891 (15.514)	Top-5 acc 37.891 (34.275)	lr 0.03489
Warmup Train [15][2680/3239]	Time 0.422 (0.512)	Data 0.001 (0.011)	Loss 4.9455 (4.8742)	Top-1 acc 17.188 (15.514)	Top-5 acc 30.469 (34.273)	lr 0.03488
Warmup Train [15][2690/3239]	Time 0.445 (0.512)	Data 0.001 (0.011)	Loss 4.7895 (4.8741)	Top-1 acc 19.141 (15.516)	Top-5 acc 37.109 (34.276)	lr 0.03487
Warmup Train [15][2700/3239]	Time 0.566 (0.512)	Data 0.001 (0.011)	Loss 4.9570 (4.8740)	Top-1 acc 14.844 (15.516)	Top-5 acc 33.594 (34.281)	lr 0.03487
Warmup Train [15][2710/3239]	Time 0.457 (0.511)	Data 0.001 (0.011)	Loss 4.8937 (4.8739)	Top-1 acc 15.234 (15.516)	Top-5 acc 31.250 (34.281)	lr 0.03486
Warmup Train [15][2720/3239]	Time 0.466 (0.511)	Data 0.001 (0.011)	Loss 4.7943 (4.8738)	Top-1 acc 18.359 (15.520)	Top-5 acc 35.938 (34.285)	lr 0.03486
Warmup Train [15][2730/3239]	Time 0.378 (0.511)	Data 0.001 (0.011)	Loss 4.9880 (4.8736)	Top-1 acc 14.844 (15.525)	Top-5 acc 33.594 (34.287)	lr 0.03485
Warmup Train [15][2740/3239]	Time 0.605 (0.511)	Data 0.001 (0.011)	Loss 4.7450 (4.8734)	Top-1 acc 18.359 (15.528)	Top-5 acc 36.719 (34.293)	lr 0.03485
Warmup Train [15][2750/3239]	Time 0.595 (0.511)	Data 0.001 (0.011)	Loss 4.9140 (4.8733)	Top-1 acc 15.234 (15.531)	Top-5 acc 35.156 (34.297)	lr 0.03484
Warmup Train [15][2760/3239]	Time 0.464 (0.511)	Data 0.001 (0.011)	Loss 4.6432 (4.8731)	Top-1 acc 20.703 (15.535)	Top-5 acc 43.359 (34.300)	lr 0.03484
Warmup Train [15][2770/3239]	Time 0.369 (0.511)	Data 0.001 (0.011)	Loss 4.9715 (4.8730)	Top-1 acc 13.281 (15.538)	Top-5 acc 30.859 (34.306)	lr 0.03483
Warmup Train [15][2780/3239]	Time 0.453 (0.511)	Data 0.001 (0.011)	Loss 4.6132 (4.8728)	Top-1 acc 19.922 (15.537)	Top-5 acc 40.625 (34.314)	lr 0.03482
Warmup Train [15][2790/3239]	Time 0.632 (0.511)	Data 0.001 (0.011)	Loss 4.8655 (4.8727)	Top-1 acc 16.016 (15.539)	Top-5 acc 34.766 (34.320)	lr 0.03482
Warmup Train [15][2800/3239]	Time 0.621 (0.511)	Data 0.001 (0.011)	Loss 4.5995 (4.8725)	Top-1 acc 17.578 (15.541)	Top-5 acc 42.188 (34.324)	lr 0.03481
Warmup Train [15][2810/3239]	Time 0.549 (0.511)	Data 0.001 (0.011)	Loss 4.9307 (4.8725)	Top-1 acc 17.578 (15.542)	Top-5 acc 35.547 (34.328)	lr 0.03481
Warmup Train [15][2820/3239]	Time 0.514 (0.511)	Data 0.001 (0.011)	Loss 4.8017 (4.8724)	Top-1 acc 16.406 (15.547)	Top-5 acc 32.031 (34.332)	lr 0.03480
Warmup Train [15][2830/3239]	Time 0.502 (0.511)	Data 0.001 (0.011)	Loss 4.6366 (4.8723)	Top-1 acc 20.703 (15.551)	Top-5 acc 40.625 (34.336)	lr 0.03480
Warmup Train [15][2840/3239]	Time 0.503 (0.511)	Data 0.001 (0.011)	Loss 4.9962 (4.8723)	Top-1 acc 17.188 (15.554)	Top-5 acc 32.031 (34.337)	lr 0.03479
Warmup Train [15][2850/3239]	Time 0.702 (0.511)	Data 0.001 (0.011)	Loss 4.7825 (4.8720)	Top-1 acc 17.188 (15.554)	Top-5 acc 37.891 (34.343)	lr 0.03479
Warmup Train [15][2860/3239]	Time 0.492 (0.511)	Data 0.001 (0.011)	Loss 4.9495 (4.8720)	Top-1 acc 16.016 (15.554)	Top-5 acc 33.203 (34.347)	lr 0.03478
Warmup Train [15][2870/3239]	Time 0.567 (0.511)	Data 0.001 (0.011)	Loss 4.8267 (4.8720)	Top-1 acc 14.844 (15.551)	Top-5 acc 35.938 (34.351)	lr 0.03477
Warmup Train [15][2880/3239]	Time 0.573 (0.511)	Data 0.001 (0.011)	Loss 4.6743 (4.8718)	Top-1 acc 17.188 (15.554)	Top-5 acc 40.234 (34.355)	lr 0.03477
Warmup Train [15][2890/3239]	Time 0.549 (0.511)	Data 0.001 (0.011)	Loss 4.9517 (4.8717)	Top-1 acc 13.672 (15.557)	Top-5 acc 29.688 (34.359)	lr 0.03476
Warmup Train [15][2900/3239]	Time 0.637 (0.511)	Data 0.001 (0.011)	Loss 4.7429 (4.8715)	Top-1 acc 13.672 (15.558)	Top-5 acc 36.328 (34.359)	lr 0.03476
Warmup Train [15][2910/3239]	Time 0.397 (0.511)	Data 0.001 (0.011)	Loss 4.8405 (4.8714)	Top-1 acc 16.406 (15.559)	Top-5 acc 34.375 (34.363)	lr 0.03475
Warmup Train [15][2920/3239]	Time 0.518 (0.511)	Data 0.001 (0.011)	Loss 4.7898 (4.8712)	Top-1 acc 15.625 (15.563)	Top-5 acc 35.938 (34.367)	lr 0.03475
Warmup Train [15][2930/3239]	Time 0.572 (0.511)	Data 0.001 (0.011)	Loss 4.8379 (4.8712)	Top-1 acc 17.969 (15.565)	Top-5 acc 37.500 (34.369)	lr 0.03474
Warmup Train [15][2940/3239]	Time 0.402 (0.511)	Data 0.002 (0.011)	Loss 4.7068 (4.8709)	Top-1 acc 18.750 (15.571)	Top-5 acc 42.578 (34.378)	lr 0.03473
Warmup Train [15][2950/3239]	Time 0.504 (0.511)	Data 0.001 (0.011)	Loss 4.8460 (4.8707)	Top-1 acc 16.797 (15.574)	Top-5 acc 35.938 (34.385)	lr 0.03473
Warmup Train [15][2960/3239]	Time 0.536 (0.511)	Data 0.001 (0.011)	Loss 4.7541 (4.8705)	Top-1 acc 16.797 (15.572)	Top-5 acc 41.016 (34.390)	lr 0.03472
Warmup Train [15][2970/3239]	Time 0.558 (0.511)	Data 0.001 (0.011)	Loss 4.6399 (4.8702)	Top-1 acc 18.750 (15.573)	Top-5 acc 37.109 (34.395)	lr 0.03472
Warmup Train [15][2980/3239]	Time 0.484 (0.511)	Data 0.001 (0.011)	Loss 4.8201 (4.8701)	Top-1 acc 18.359 (15.573)	Top-5 acc 35.156 (34.396)	lr 0.03471
Warmup Train [15][2990/3239]	Time 0.516 (0.511)	Data 0.001 (0.011)	Loss 4.8327 (4.8700)	Top-1 acc 17.188 (15.575)	Top-5 acc 38.672 (34.398)	lr 0.03471
Warmup Train [15][3000/3239]	Time 0.533 (0.511)	Data 0.001 (0.011)	Loss 5.1249 (4.8700)	Top-1 acc 9.375 (15.578)	Top-5 acc 28.906 (34.399)	lr 0.03470
Warmup Train [15][3010/3239]	Time 0.508 (0.511)	Data 0.001 (0.011)	Loss 4.8467 (4.8698)	Top-1 acc 19.531 (15.580)	Top-5 acc 34.766 (34.401)	lr 0.03470
Warmup Train [15][3020/3239]	Time 0.609 (0.511)	Data 0.001 (0.010)	Loss 5.0313 (4.8698)	Top-1 acc 15.234 (15.581)	Top-5 acc 33.984 (34.403)	lr 0.03469
Warmup Train [15][3030/3239]	Time 0.580 (0.511)	Data 0.001 (0.010)	Loss 5.0313 (4.8698)	Top-1 acc 11.328 (15.581)	Top-5 acc 31.250 (34.406)	lr 0.03468
Warmup Train [15][3040/3239]	Time 0.418 (0.511)	Data 0.001 (0.010)	Loss 4.8705 (4.8697)	Top-1 acc 17.188 (15.584)	Top-5 acc 36.328 (34.409)	lr 0.03468
Warmup Train [15][3050/3239]	Time 0.474 (0.511)	Data 0.001 (0.010)	Loss 4.7088 (4.8694)	Top-1 acc 15.234 (15.588)	Top-5 acc 33.594 (34.414)	lr 0.03467
Warmup Train [15][3060/3239]	Time 0.316 (0.511)	Data 0.001 (0.010)	Loss 4.7078 (4.8693)	Top-1 acc 17.578 (15.592)	Top-5 acc 39.453 (34.421)	lr 0.03467
Warmup Train [15][3070/3239]	Time 0.488 (0.511)	Data 0.001 (0.010)	Loss 4.8267 (4.8693)	Top-1 acc 19.922 (15.596)	Top-5 acc 38.672 (34.424)	lr 0.03466
Warmup Train [15][3080/3239]	Time 0.567 (0.511)	Data 0.001 (0.010)	Loss 4.8604 (4.8693)	Top-1 acc 16.797 (15.593)	Top-5 acc 34.766 (34.424)	lr 0.03466
Warmup Train [15][3090/3239]	Time 0.452 (0.511)	Data 0.001 (0.010)	Loss 4.8663 (4.8692)	Top-1 acc 12.891 (15.593)	Top-5 acc 32.031 (34.426)	lr 0.03465
Warmup Train [15][3100/3239]	Time 0.335 (0.511)	Data 0.001 (0.010)	Loss 4.9449 (4.8690)	Top-1 acc 14.844 (15.594)	Top-5 acc 37.109 (34.433)	lr 0.03465
Warmup Train [15][3110/3239]	Time 0.500 (0.511)	Data 0.001 (0.010)	Loss 4.8016 (4.8689)	Top-1 acc 17.578 (15.596)	Top-5 acc 38.281 (34.434)	lr 0.03464
Warmup Train [15][3120/3239]	Time 0.512 (0.511)	Data 0.001 (0.010)	Loss 4.9208 (4.8687)	Top-1 acc 15.625 (15.597)	Top-5 acc 33.594 (34.435)	lr 0.03463
Warmup Train [15][3130/3239]	Time 0.466 (0.511)	Data 0.001 (0.010)	Loss 4.8836 (4.8686)	Top-1 acc 19.531 (15.600)	Top-5 acc 35.156 (34.439)	lr 0.03463
Warmup Train [15][3140/3239]	Time 0.458 (0.511)	Data 0.002 (0.010)	Loss 5.0000 (4.8686)	Top-1 acc 12.500 (15.601)	Top-5 acc 31.250 (34.438)	lr 0.03462
Warmup Train [15][3150/3239]	Time 0.519 (0.511)	Data 0.001 (0.010)	Loss 4.9730 (4.8684)	Top-1 acc 10.547 (15.601)	Top-5 acc 28.516 (34.443)	lr 0.03462
Warmup Train [15][3160/3239]	Time 0.432 (0.511)	Data 0.001 (0.010)	Loss 4.6545 (4.8683)	Top-1 acc 17.578 (15.600)	Top-5 acc 38.672 (34.441)	lr 0.03461
Warmup Train [15][3170/3239]	Time 0.537 (0.511)	Data 0.001 (0.010)	Loss 4.7513 (4.8681)	Top-1 acc 15.234 (15.601)	Top-5 acc 37.109 (34.447)	lr 0.03461
Warmup Train [15][3180/3239]	Time 0.471 (0.511)	Data 0.000 (0.010)	Loss 4.6896 (4.8680)	Top-1 acc 17.188 (15.603)	Top-5 acc 39.453 (34.448)	lr 0.03460
Warmup Train [15][3190/3239]	Time 0.701 (0.511)	Data 0.000 (0.010)	Loss 4.6654 (4.8678)	Top-1 acc 15.234 (15.603)	Top-5 acc 37.500 (34.451)	lr 0.03460
Warmup Train [15][3200/3239]	Time 0.342 (0.511)	Data 0.000 (0.010)	Loss 4.9483 (4.8678)	Top-1 acc 13.281 (15.605)	Top-5 acc 33.203 (34.453)	lr 0.03459
Warmup Train [15][3210/3239]	Time 0.541 (0.511)	Data 0.000 (0.010)	Loss 4.8323 (4.8677)	Top-1 acc 18.359 (15.609)	Top-5 acc 33.203 (34.457)	lr 0.03458
Warmup Train [15][3220/3239]	Time 0.650 (0.511)	Data 0.000 (0.010)	Loss 4.7532 (4.8676)	Top-1 acc 18.750 (15.608)	Top-5 acc 38.281 (34.462)	lr 0.03458
Warmup Train [15][3230/3239]	Time 0.628 (0.511)	Data 0.000 (0.010)	Loss 4.8296 (4.8675)	Top-1 acc 16.797 (15.612)	Top-5 acc 34.375 (34.466)	lr 0.03457
Warmup Train [15][3239/3239]	Time 0.310 (0.511)	Data 0.000 (0.010)	Loss 4.8196 (4.8674)	Top-1 acc 16.049 (15.614)	Top-5 acc 38.272 (34.472)	lr 0.03457
==========Warmup Valid [15/40]	loss 3.962	top-1 acc 21.911	top-5 acc 44.445	Train top-1 15.614	top-5 34.472	flops: 442.4M
Warmup Train [16][0/3239]	Time 17.138 (17.138)	Data 15.869 (15.869)	Loss 4.7293 (4.7293)	Top-1 acc 17.969 (17.969)	Top-5 acc 39.062 (39.062)	lr 0.03457
Warmup Train [16][10/3239]	Time 0.518 (2.066)	Data 0.001 (1.455)	Loss 4.7397 (4.7957)	Top-1 acc 19.531 (17.543)	Top-5 acc 37.500 (37.216)	lr 0.03456
Warmup Train [16][20/3239]	Time 0.552 (1.331)	Data 0.001 (0.767)	Loss 4.9295 (4.8194)	Top-1 acc 14.844 (16.722)	Top-5 acc 33.203 (36.198)	lr 0.03456
Warmup Train [16][30/3239]	Time 0.531 (1.059)	Data 0.001 (0.520)	Loss 4.8868 (4.8284)	Top-1 acc 14.844 (16.696)	Top-5 acc 33.984 (35.988)	lr 0.03455
Warmup Train [16][40/3239]	Time 0.573 (0.925)	Data 0.003 (0.395)	Loss 4.7660 (4.8206)	Top-1 acc 14.062 (16.683)	Top-5 acc 33.203 (35.880)	lr 0.03454
Warmup Train [16][50/3239]	Time 0.577 (0.841)	Data 0.001 (0.319)	Loss 4.5879 (4.8217)	Top-1 acc 18.750 (16.544)	Top-5 acc 42.578 (35.685)	lr 0.03454
Warmup Train [16][60/3239]	Time 0.425 (0.786)	Data 0.001 (0.269)	Loss 4.9536 (4.8197)	Top-1 acc 15.234 (16.643)	Top-5 acc 33.594 (35.701)	lr 0.03453
Warmup Train [16][70/3239]	Time 0.574 (0.748)	Data 0.001 (0.233)	Loss 4.8422 (4.8141)	Top-1 acc 15.234 (16.769)	Top-5 acc 34.766 (35.734)	lr 0.03453
Warmup Train [16][80/3239]	Time 0.505 (0.719)	Data 0.001 (0.204)	Loss 4.8699 (4.8133)	Top-1 acc 18.750 (16.797)	Top-5 acc 38.672 (35.778)	lr 0.03452
Warmup Train [16][90/3239]	Time 0.389 (0.695)	Data 0.001 (0.182)	Loss 4.6598 (4.8053)	Top-1 acc 21.484 (16.883)	Top-5 acc 39.844 (35.998)	lr 0.03452
Warmup Train [16][100/3239]	Time 0.637 (0.678)	Data 0.001 (0.165)	Loss 4.7924 (4.8021)	Top-1 acc 13.672 (16.747)	Top-5 acc 37.891 (36.003)	lr 0.03451
Warmup Train [16][110/3239]	Time 0.500 (0.664)	Data 0.001 (0.150)	Loss 4.9352 (4.8027)	Top-1 acc 11.719 (16.667)	Top-5 acc 31.250 (36.036)	lr 0.03451
Warmup Train [16][120/3239]	Time 0.516 (0.651)	Data 0.001 (0.139)	Loss 4.8878 (4.8021)	Top-1 acc 12.109 (16.584)	Top-5 acc 32.812 (36.002)	lr 0.03450
Warmup Train [16][130/3239]	Time 0.451 (0.641)	Data 0.001 (0.128)	Loss 4.7698 (4.8004)	Top-1 acc 17.188 (16.618)	Top-5 acc 35.156 (36.009)	lr 0.03449
Warmup Train [16][140/3239]	Time 0.558 (0.634)	Data 0.001 (0.120)	Loss 4.7816 (4.7987)	Top-1 acc 16.797 (16.595)	Top-5 acc 37.500 (36.015)	lr 0.03449
Warmup Train [16][150/3239]	Time 0.541 (0.626)	Data 0.001 (0.112)	Loss 4.8361 (4.8002)	Top-1 acc 16.016 (16.605)	Top-5 acc 37.500 (36.049)	lr 0.03448
Warmup Train [16][160/3239]	Time 0.568 (0.619)	Data 0.001 (0.105)	Loss 4.7932 (4.8007)	Top-1 acc 18.359 (16.583)	Top-5 acc 39.062 (36.032)	lr 0.03448
Warmup Train [16][170/3239]	Time 0.324 (0.611)	Data 0.001 (0.100)	Loss 4.6395 (4.8017)	Top-1 acc 23.828 (16.653)	Top-5 acc 39.844 (36.033)	lr 0.03447
Warmup Train [16][180/3239]	Time 0.461 (0.606)	Data 0.001 (0.095)	Loss 4.8685 (4.7998)	Top-1 acc 15.625 (16.687)	Top-5 acc 33.984 (36.048)	lr 0.03447
Warmup Train [16][190/3239]	Time 0.533 (0.599)	Data 0.001 (0.091)	Loss 4.8592 (4.7993)	Top-1 acc 16.406 (16.668)	Top-5 acc 32.812 (35.987)	lr 0.03446
Warmup Train [16][200/3239]	Time 0.586 (0.593)	Data 0.001 (0.086)	Loss 4.8550 (4.7999)	Top-1 acc 16.016 (16.620)	Top-5 acc 34.766 (36.019)	lr 0.03445
Warmup Train [16][210/3239]	Time 0.162 (0.587)	Data 0.001 (0.082)	Loss 4.9384 (4.8028)	Top-1 acc 13.672 (16.528)	Top-5 acc 33.984 (36.004)	lr 0.03445
Warmup Train [16][220/3239]	Time 0.624 (0.584)	Data 0.001 (0.080)	Loss 4.8211 (4.8026)	Top-1 acc 12.500 (16.535)	Top-5 acc 37.109 (36.028)	lr 0.03444
Warmup Train [16][230/3239]	Time 0.502 (0.581)	Data 0.001 (0.076)	Loss 4.8392 (4.8044)	Top-1 acc 14.062 (16.492)	Top-5 acc 32.812 (35.990)	lr 0.03444
Warmup Train [16][240/3239]	Time 0.582 (0.578)	Data 0.001 (0.073)	Loss 4.9400 (4.8058)	Top-1 acc 13.281 (16.469)	Top-5 acc 32.031 (35.980)	lr 0.03443
Warmup Train [16][250/3239]	Time 0.533 (0.575)	Data 0.001 (0.070)	Loss 4.7800 (4.8079)	Top-1 acc 14.453 (16.437)	Top-5 acc 36.719 (35.967)	lr 0.03443
Warmup Train [16][260/3239]	Time 0.341 (0.571)	Data 0.001 (0.068)	Loss 4.8544 (4.8074)	Top-1 acc 13.672 (16.483)	Top-5 acc 32.031 (35.981)	lr 0.03442
Warmup Train [16][270/3239]	Time 0.589 (0.570)	Data 0.001 (0.066)	Loss 4.8907 (4.8091)	Top-1 acc 16.797 (16.514)	Top-5 acc 33.203 (35.932)	lr 0.03442
Warmup Train [16][280/3239]	Time 0.452 (0.567)	Data 0.001 (0.064)	Loss 4.6576 (4.8096)	Top-1 acc 17.969 (16.517)	Top-5 acc 41.016 (35.950)	lr 0.03441
Warmup Train [16][290/3239]	Time 0.355 (0.565)	Data 0.038 (0.062)	Loss 4.7676 (4.8082)	Top-1 acc 18.750 (16.565)	Top-5 acc 37.109 (35.971)	lr 0.03440
Warmup Train [16][300/3239]	Time 0.436 (0.564)	Data 0.001 (0.060)	Loss 4.9568 (4.8084)	Top-1 acc 15.234 (16.541)	Top-5 acc 30.859 (35.992)	lr 0.03440
Warmup Train [16][310/3239]	Time 0.531 (0.562)	Data 0.001 (0.059)	Loss 4.7715 (4.8087)	Top-1 acc 19.141 (16.534)	Top-5 acc 35.156 (35.979)	lr 0.03439
Warmup Train [16][320/3239]	Time 0.645 (0.562)	Data 0.001 (0.057)	Loss 4.8042 (4.8078)	Top-1 acc 16.016 (16.555)	Top-5 acc 39.062 (36.003)	lr 0.03439
Warmup Train [16][330/3239]	Time 0.501 (0.559)	Data 0.001 (0.055)	Loss 4.7877 (4.8064)	Top-1 acc 16.797 (16.590)	Top-5 acc 34.766 (36.027)	lr 0.03438
Warmup Train [16][340/3239]	Time 0.283 (0.557)	Data 0.001 (0.054)	Loss 5.0396 (4.8081)	Top-1 acc 12.500 (16.546)	Top-5 acc 32.422 (35.979)	lr 0.03438
Warmup Train [16][350/3239]	Time 0.511 (0.556)	Data 0.001 (0.053)	Loss 4.9523 (4.8107)	Top-1 acc 17.578 (16.511)	Top-5 acc 33.594 (35.902)	lr 0.03437
Warmup Train [16][360/3239]	Time 0.329 (0.554)	Data 0.001 (0.051)	Loss 4.8915 (4.8103)	Top-1 acc 17.578 (16.538)	Top-5 acc 31.250 (35.878)	lr 0.03437
Warmup Train [16][370/3239]	Time 0.437 (0.553)	Data 0.001 (0.050)	Loss 4.6575 (4.8099)	Top-1 acc 23.828 (16.546)	Top-5 acc 39.844 (35.882)	lr 0.03436
Warmup Train [16][380/3239]	Time 0.521 (0.552)	Data 0.001 (0.050)	Loss 4.6895 (4.8094)	Top-1 acc 16.406 (16.555)	Top-5 acc 37.109 (35.881)	lr 0.03435
Warmup Train [16][390/3239]	Time 0.508 (0.551)	Data 0.001 (0.048)	Loss 4.6130 (4.8085)	Top-1 acc 20.703 (16.584)	Top-5 acc 42.188 (35.901)	lr 0.03435
Warmup Train [16][400/3239]	Time 0.454 (0.549)	Data 0.001 (0.047)	Loss 4.8014 (4.8100)	Top-1 acc 13.281 (16.559)	Top-5 acc 35.156 (35.863)	lr 0.03434
Warmup Train [16][410/3239]	Time 0.562 (0.549)	Data 0.001 (0.046)	Loss 4.8114 (4.8102)	Top-1 acc 17.578 (16.580)	Top-5 acc 36.719 (35.881)	lr 0.03434
Warmup Train [16][420/3239]	Time 0.348 (0.547)	Data 0.001 (0.045)	Loss 5.0275 (4.8123)	Top-1 acc 10.938 (16.540)	Top-5 acc 32.031 (35.849)	lr 0.03433
Warmup Train [16][430/3239]	Time 0.521 (0.547)	Data 0.001 (0.045)	Loss 4.8578 (4.8122)	Top-1 acc 16.406 (16.544)	Top-5 acc 34.375 (35.845)	lr 0.03433
Warmup Train [16][440/3239]	Time 0.580 (0.547)	Data 0.001 (0.044)	Loss 4.6757 (4.8105)	Top-1 acc 19.531 (16.570)	Top-5 acc 38.672 (35.879)	lr 0.03432
Warmup Train [16][450/3239]	Time 0.468 (0.545)	Data 0.001 (0.043)	Loss 4.7451 (4.8105)	Top-1 acc 18.750 (16.573)	Top-5 acc 35.547 (35.891)	lr 0.03431
Warmup Train [16][460/3239]	Time 0.612 (0.545)	Data 0.001 (0.042)	Loss 4.6929 (4.8100)	Top-1 acc 21.094 (16.587)	Top-5 acc 37.891 (35.893)	lr 0.03431
Warmup Train [16][470/3239]	Time 0.474 (0.543)	Data 0.001 (0.041)	Loss 4.7455 (4.8113)	Top-1 acc 18.750 (16.550)	Top-5 acc 39.844 (35.870)	lr 0.03430
Warmup Train [16][480/3239]	Time 0.532 (0.541)	Data 0.001 (0.040)	Loss 4.7681 (4.8119)	Top-1 acc 17.188 (16.553)	Top-5 acc 37.109 (35.847)	lr 0.03430
Warmup Train [16][490/3239]	Time 0.321 (0.540)	Data 0.001 (0.040)	Loss 4.8064 (4.8124)	Top-1 acc 17.969 (16.552)	Top-5 acc 36.328 (35.837)	lr 0.03429
Warmup Train [16][500/3239]	Time 0.490 (0.539)	Data 0.001 (0.039)	Loss 4.8215 (4.8125)	Top-1 acc 17.969 (16.560)	Top-5 acc 35.938 (35.837)	lr 0.03429
Warmup Train [16][510/3239]	Time 0.347 (0.538)	Data 0.001 (0.039)	Loss 4.7429 (4.8122)	Top-1 acc 17.578 (16.552)	Top-5 acc 37.500 (35.850)	lr 0.03428
Warmup Train [16][520/3239]	Time 0.529 (0.538)	Data 0.024 (0.038)	Loss 4.7696 (4.8122)	Top-1 acc 18.359 (16.553)	Top-5 acc 38.281 (35.839)	lr 0.03428
Warmup Train [16][530/3239]	Time 0.560 (0.537)	Data 0.001 (0.038)	Loss 4.7619 (4.8122)	Top-1 acc 16.406 (16.577)	Top-5 acc 34.375 (35.848)	lr 0.03427
Warmup Train [16][540/3239]	Time 0.481 (0.537)	Data 0.001 (0.037)	Loss 4.8087 (4.8110)	Top-1 acc 17.969 (16.599)	Top-5 acc 38.281 (35.885)	lr 0.03426
Warmup Train [16][550/3239]	Time 0.564 (0.537)	Data 0.001 (0.036)	Loss 4.8493 (4.8113)	Top-1 acc 13.672 (16.604)	Top-5 acc 36.719 (35.894)	lr 0.03426
Warmup Train [16][560/3239]	Time 0.604 (0.537)	Data 0.001 (0.036)	Loss 4.8065 (4.8115)	Top-1 acc 12.500 (16.579)	Top-5 acc 36.719 (35.893)	lr 0.03425
Warmup Train [16][570/3239]	Time 0.410 (0.536)	Data 0.001 (0.035)	Loss 4.6409 (4.8109)	Top-1 acc 20.312 (16.593)	Top-5 acc 36.719 (35.900)	lr 0.03425
Warmup Train [16][580/3239]	Time 0.398 (0.536)	Data 0.001 (0.035)	Loss 4.8475 (4.8098)	Top-1 acc 15.234 (16.608)	Top-5 acc 33.594 (35.924)	lr 0.03424
Warmup Train [16][590/3239]	Time 0.442 (0.536)	Data 0.001 (0.034)	Loss 4.8404 (4.8098)	Top-1 acc 16.797 (16.620)	Top-5 acc 34.766 (35.918)	lr 0.03424
Warmup Train [16][600/3239]	Time 0.394 (0.536)	Data 0.001 (0.034)	Loss 4.7119 (4.8095)	Top-1 acc 16.797 (16.618)	Top-5 acc 39.062 (35.928)	lr 0.03423
Warmup Train [16][610/3239]	Time 0.558 (0.536)	Data 0.001 (0.033)	Loss 4.8238 (4.8096)	Top-1 acc 16.016 (16.613)	Top-5 acc 36.719 (35.916)	lr 0.03422
Warmup Train [16][620/3239]	Time 0.393 (0.535)	Data 0.001 (0.033)	Loss 4.6653 (4.8091)	Top-1 acc 17.188 (16.621)	Top-5 acc 35.547 (35.937)	lr 0.03422
Warmup Train [16][630/3239]	Time 0.342 (0.535)	Data 0.001 (0.033)	Loss 4.8359 (4.8092)	Top-1 acc 12.500 (16.602)	Top-5 acc 31.641 (35.936)	lr 0.03421
Warmup Train [16][640/3239]	Time 0.566 (0.535)	Data 0.001 (0.032)	Loss 4.7658 (4.8097)	Top-1 acc 16.016 (16.598)	Top-5 acc 36.719 (35.923)	lr 0.03421
Warmup Train [16][650/3239]	Time 0.519 (0.534)	Data 0.001 (0.032)	Loss 4.7708 (4.8099)	Top-1 acc 16.797 (16.609)	Top-5 acc 35.938 (35.912)	lr 0.03420
Warmup Train [16][660/3239]	Time 0.728 (0.534)	Data 0.001 (0.032)	Loss 4.6415 (4.8095)	Top-1 acc 18.359 (16.625)	Top-5 acc 38.281 (35.919)	lr 0.03420
Warmup Train [16][670/3239]	Time 0.504 (0.533)	Data 0.001 (0.031)	Loss 4.6806 (4.8090)	Top-1 acc 21.875 (16.654)	Top-5 acc 41.016 (35.938)	lr 0.03419
Warmup Train [16][680/3239]	Time 0.440 (0.533)	Data 0.001 (0.031)	Loss 4.9834 (4.8088)	Top-1 acc 12.109 (16.640)	Top-5 acc 30.078 (35.933)	lr 0.03419
Warmup Train [16][690/3239]	Time 0.388 (0.532)	Data 0.002 (0.030)	Loss 4.8837 (4.8085)	Top-1 acc 14.062 (16.637)	Top-5 acc 35.156 (35.937)	lr 0.03418
Warmup Train [16][700/3239]	Time 0.598 (0.532)	Data 0.001 (0.030)	Loss 4.6580 (4.8082)	Top-1 acc 16.797 (16.634)	Top-5 acc 38.672 (35.945)	lr 0.03417
Warmup Train [16][710/3239]	Time 0.508 (0.532)	Data 0.001 (0.030)	Loss 4.7008 (4.8081)	Top-1 acc 18.359 (16.641)	Top-5 acc 39.062 (35.948)	lr 0.03417
Warmup Train [16][720/3239]	Time 0.498 (0.532)	Data 0.001 (0.029)	Loss 4.7479 (4.8081)	Top-1 acc 17.188 (16.659)	Top-5 acc 37.891 (35.959)	lr 0.03416
Warmup Train [16][730/3239]	Time 0.576 (0.532)	Data 0.001 (0.029)	Loss 4.7960 (4.8077)	Top-1 acc 20.703 (16.668)	Top-5 acc 39.453 (35.978)	lr 0.03416
Warmup Train [16][740/3239]	Time 0.654 (0.531)	Data 0.001 (0.029)	Loss 4.7045 (4.8071)	Top-1 acc 19.141 (16.685)	Top-5 acc 41.016 (35.999)	lr 0.03415
Warmup Train [16][750/3239]	Time 0.775 (0.531)	Data 0.001 (0.028)	Loss 4.8252 (4.8066)	Top-1 acc 19.141 (16.689)	Top-5 acc 35.156 (36.012)	lr 0.03415
Warmup Train [16][760/3239]	Time 0.614 (0.530)	Data 0.001 (0.028)	Loss 4.6504 (4.8071)	Top-1 acc 15.234 (16.687)	Top-5 acc 40.625 (36.000)	lr 0.03414
Warmup Train [16][770/3239]	Time 0.327 (0.529)	Data 0.001 (0.028)	Loss 4.7098 (4.8063)	Top-1 acc 19.141 (16.699)	Top-5 acc 40.625 (36.012)	lr 0.03413
Warmup Train [16][780/3239]	Time 0.500 (0.529)	Data 0.001 (0.027)	Loss 4.7926 (4.8065)	Top-1 acc 16.797 (16.689)	Top-5 acc 32.422 (35.997)	lr 0.03413
Warmup Train [16][790/3239]	Time 0.655 (0.529)	Data 0.001 (0.027)	Loss 4.9119 (4.8071)	Top-1 acc 19.922 (16.686)	Top-5 acc 35.547 (35.984)	lr 0.03412
Warmup Train [16][800/3239]	Time 0.660 (0.529)	Data 0.001 (0.027)	Loss 4.8608 (4.8065)	Top-1 acc 18.359 (16.705)	Top-5 acc 36.719 (36.009)	lr 0.03412
Warmup Train [16][810/3239]	Time 0.360 (0.528)	Data 0.001 (0.027)	Loss 4.6519 (4.8058)	Top-1 acc 18.750 (16.712)	Top-5 acc 39.453 (36.028)	lr 0.03411
Warmup Train [16][820/3239]	Time 0.496 (0.528)	Data 0.001 (0.026)	Loss 4.7535 (4.8056)	Top-1 acc 17.578 (16.714)	Top-5 acc 38.672 (36.041)	lr 0.03411
Warmup Train [16][830/3239]	Time 0.524 (0.528)	Data 0.001 (0.026)	Loss 4.7056 (4.8057)	Top-1 acc 18.750 (16.720)	Top-5 acc 36.719 (36.054)	lr 0.03410
Warmup Train [16][840/3239]	Time 0.505 (0.528)	Data 0.001 (0.026)	Loss 4.7789 (4.8062)	Top-1 acc 15.234 (16.711)	Top-5 acc 36.328 (36.038)	lr 0.03409
Warmup Train [16][850/3239]	Time 0.451 (0.527)	Data 0.001 (0.026)	Loss 4.6748 (4.8062)	Top-1 acc 21.875 (16.711)	Top-5 acc 40.625 (36.039)	lr 0.03409
Warmup Train [16][860/3239]	Time 0.345 (0.527)	Data 0.001 (0.026)	Loss 4.9737 (4.8058)	Top-1 acc 16.016 (16.730)	Top-5 acc 35.156 (36.049)	lr 0.03408
Warmup Train [16][870/3239]	Time 0.595 (0.527)	Data 0.001 (0.026)	Loss 4.7418 (4.8058)	Top-1 acc 18.750 (16.737)	Top-5 acc 37.891 (36.040)	lr 0.03408
Warmup Train [16][880/3239]	Time 0.531 (0.527)	Data 0.001 (0.025)	Loss 4.9181 (4.8059)	Top-1 acc 16.406 (16.734)	Top-5 acc 31.641 (36.025)	lr 0.03407
Warmup Train [16][890/3239]	Time 0.477 (0.527)	Data 0.001 (0.025)	Loss 4.8690 (4.8063)	Top-1 acc 13.672 (16.723)	Top-5 acc 35.547 (36.015)	lr 0.03407
Warmup Train [16][900/3239]	Time 0.567 (0.526)	Data 0.001 (0.025)	Loss 4.7383 (4.8063)	Top-1 acc 18.750 (16.725)	Top-5 acc 39.453 (36.008)	lr 0.03406
Warmup Train [16][910/3239]	Time 0.566 (0.526)	Data 0.001 (0.025)	Loss 4.7595 (4.8061)	Top-1 acc 17.188 (16.732)	Top-5 acc 37.109 (36.003)	lr 0.03406
Warmup Train [16][920/3239]	Time 0.486 (0.526)	Data 0.001 (0.024)	Loss 4.8469 (4.8068)	Top-1 acc 17.188 (16.718)	Top-5 acc 33.594 (35.989)	lr 0.03405
Warmup Train [16][930/3239]	Time 0.678 (0.526)	Data 0.001 (0.024)	Loss 4.6753 (4.8067)	Top-1 acc 17.188 (16.720)	Top-5 acc 38.672 (35.985)	lr 0.03404
Warmup Train [16][940/3239]	Time 0.493 (0.526)	Data 0.001 (0.024)	Loss 4.9249 (4.8070)	Top-1 acc 16.016 (16.715)	Top-5 acc 30.859 (35.975)	lr 0.03404
Warmup Train [16][950/3239]	Time 0.524 (0.526)	Data 0.001 (0.024)	Loss 4.6948 (4.8067)	Top-1 acc 16.797 (16.714)	Top-5 acc 39.453 (35.981)	lr 0.03403
Warmup Train [16][960/3239]	Time 0.357 (0.525)	Data 0.001 (0.024)	Loss 4.8487 (4.8069)	Top-1 acc 13.281 (16.707)	Top-5 acc 34.766 (35.974)	lr 0.03403
Warmup Train [16][970/3239]	Time 0.620 (0.525)	Data 0.001 (0.024)	Loss 4.7216 (4.8072)	Top-1 acc 14.453 (16.698)	Top-5 acc 38.672 (35.954)	lr 0.03402
Warmup Train [16][980/3239]	Time 0.592 (0.525)	Data 0.001 (0.023)	Loss 4.7287 (4.8069)	Top-1 acc 18.359 (16.694)	Top-5 acc 42.188 (35.967)	lr 0.03402
Warmup Train [16][990/3239]	Time 0.508 (0.525)	Data 0.001 (0.023)	Loss 4.6850 (4.8068)	Top-1 acc 17.188 (16.694)	Top-5 acc 37.891 (35.973)	lr 0.03401
Warmup Train [16][1000/3239]	Time 0.570 (0.525)	Data 0.001 (0.023)	Loss 4.7482 (4.8068)	Top-1 acc 18.750 (16.692)	Top-5 acc 41.016 (35.972)	lr 0.03400
Warmup Train [16][1010/3239]	Time 0.537 (0.524)	Data 0.001 (0.023)	Loss 4.7983 (4.8068)	Top-1 acc 16.406 (16.692)	Top-5 acc 37.109 (35.978)	lr 0.03400
Warmup Train [16][1020/3239]	Time 0.596 (0.524)	Data 0.001 (0.023)	Loss 4.8253 (4.8067)	Top-1 acc 15.625 (16.684)	Top-5 acc 35.547 (35.988)	lr 0.03399
Warmup Train [16][1030/3239]	Time 0.516 (0.524)	Data 0.002 (0.022)	Loss 4.7184 (4.8067)	Top-1 acc 18.359 (16.685)	Top-5 acc 36.328 (35.985)	lr 0.03399
Warmup Train [16][1040/3239]	Time 0.344 (0.524)	Data 0.001 (0.022)	Loss 4.6087 (4.8062)	Top-1 acc 23.438 (16.697)	Top-5 acc 43.750 (35.993)	lr 0.03398
Warmup Train [16][1050/3239]	Time 0.400 (0.523)	Data 0.001 (0.022)	Loss 4.7936 (4.8058)	Top-1 acc 18.750 (16.707)	Top-5 acc 37.500 (36.002)	lr 0.03398
Warmup Train [16][1060/3239]	Time 0.468 (0.523)	Data 0.002 (0.022)	Loss 4.8071 (4.8054)	Top-1 acc 17.188 (16.709)	Top-5 acc 35.156 (36.003)	lr 0.03397
Warmup Train [16][1070/3239]	Time 0.399 (0.523)	Data 0.001 (0.022)	Loss 4.8745 (4.8057)	Top-1 acc 16.016 (16.701)	Top-5 acc 36.328 (36.005)	lr 0.03396
Warmup Train [16][1080/3239]	Time 0.660 (0.523)	Data 0.001 (0.022)	Loss 4.7519 (4.8058)	Top-1 acc 17.578 (16.701)	Top-5 acc 34.766 (35.999)	lr 0.03396
Warmup Train [16][1090/3239]	Time 0.625 (0.523)	Data 0.001 (0.022)	Loss 4.7177 (4.8060)	Top-1 acc 16.016 (16.694)	Top-5 acc 39.062 (35.982)	lr 0.03395
Warmup Train [16][1100/3239]	Time 0.477 (0.523)	Data 0.001 (0.021)	Loss 4.6736 (4.8063)	Top-1 acc 16.406 (16.688)	Top-5 acc 41.406 (35.980)	lr 0.03395
Warmup Train [16][1110/3239]	Time 0.445 (0.522)	Data 0.027 (0.021)	Loss 4.9620 (4.8060)	Top-1 acc 13.672 (16.685)	Top-5 acc 29.688 (35.973)	lr 0.03394
Warmup Train [16][1120/3239]	Time 0.323 (0.522)	Data 0.001 (0.021)	Loss 4.6223 (4.8061)	Top-1 acc 20.703 (16.677)	Top-5 acc 46.484 (35.977)	lr 0.03394
Warmup Train [16][1130/3239]	Time 0.723 (0.523)	Data 0.001 (0.021)	Loss 4.8411 (4.8063)	Top-1 acc 15.234 (16.686)	Top-5 acc 34.766 (35.983)	lr 0.03393
Warmup Train [16][1140/3239]	Time 0.595 (0.523)	Data 0.001 (0.021)	Loss 4.8444 (4.8065)	Top-1 acc 14.844 (16.677)	Top-5 acc 32.812 (35.984)	lr 0.03393
Warmup Train [16][1150/3239]	Time 0.615 (0.522)	Data 0.001 (0.021)	Loss 4.7129 (4.8064)	Top-1 acc 22.266 (16.678)	Top-5 acc 37.891 (35.984)	lr 0.03392
Warmup Train [16][1160/3239]	Time 0.491 (0.522)	Data 0.001 (0.021)	Loss 4.5516 (4.8058)	Top-1 acc 21.094 (16.688)	Top-5 acc 39.844 (35.996)	lr 0.03391
Warmup Train [16][1170/3239]	Time 0.547 (0.522)	Data 0.002 (0.020)	Loss 4.8305 (4.8056)	Top-1 acc 14.844 (16.689)	Top-5 acc 35.547 (35.996)	lr 0.03391
Warmup Train [16][1180/3239]	Time 0.583 (0.522)	Data 0.001 (0.020)	Loss 4.8211 (4.8057)	Top-1 acc 16.406 (16.690)	Top-5 acc 34.766 (35.993)	lr 0.03390
Warmup Train [16][1190/3239]	Time 0.681 (0.522)	Data 0.001 (0.020)	Loss 4.8272 (4.8055)	Top-1 acc 15.625 (16.687)	Top-5 acc 32.422 (35.999)	lr 0.03390
Warmup Train [16][1200/3239]	Time 0.564 (0.522)	Data 0.001 (0.020)	Loss 4.8353 (4.8053)	Top-1 acc 15.234 (16.690)	Top-5 acc 34.375 (36.002)	lr 0.03389
Warmup Train [16][1210/3239]	Time 0.433 (0.522)	Data 0.001 (0.020)	Loss 4.6126 (4.8050)	Top-1 acc 22.266 (16.698)	Top-5 acc 37.500 (36.006)	lr 0.03389
Warmup Train [16][1220/3239]	Time 0.488 (0.522)	Data 0.001 (0.020)	Loss 4.8718 (4.8052)	Top-1 acc 16.016 (16.694)	Top-5 acc 34.375 (35.997)	lr 0.03388
Warmup Train [16][1230/3239]	Time 0.530 (0.522)	Data 0.001 (0.020)	Loss 4.8534 (4.8050)	Top-1 acc 17.969 (16.703)	Top-5 acc 37.500 (36.005)	lr 0.03387
Warmup Train [16][1240/3239]	Time 0.518 (0.522)	Data 0.001 (0.020)	Loss 4.8428 (4.8050)	Top-1 acc 18.359 (16.705)	Top-5 acc 33.984 (36.003)	lr 0.03387
Warmup Train [16][1250/3239]	Time 0.357 (0.521)	Data 0.001 (0.019)	Loss 4.8704 (4.8051)	Top-1 acc 15.234 (16.707)	Top-5 acc 32.812 (35.996)	lr 0.03386
Warmup Train [16][1260/3239]	Time 0.470 (0.521)	Data 0.001 (0.019)	Loss 4.7949 (4.8048)	Top-1 acc 19.531 (16.712)	Top-5 acc 40.625 (36.010)	lr 0.03386
Warmup Train [16][1270/3239]	Time 0.474 (0.521)	Data 0.001 (0.019)	Loss 5.0304 (4.8049)	Top-1 acc 12.109 (16.706)	Top-5 acc 29.688 (36.001)	lr 0.03385
Warmup Train [16][1280/3239]	Time 0.496 (0.521)	Data 0.001 (0.019)	Loss 4.8181 (4.8046)	Top-1 acc 16.406 (16.712)	Top-5 acc 33.984 (36.013)	lr 0.03385
Warmup Train [16][1290/3239]	Time 0.506 (0.521)	Data 0.002 (0.019)	Loss 4.7358 (4.8041)	Top-1 acc 16.016 (16.717)	Top-5 acc 36.328 (36.024)	lr 0.03384
Warmup Train [16][1300/3239]	Time 0.574 (0.521)	Data 0.001 (0.019)	Loss 4.7820 (4.8044)	Top-1 acc 13.281 (16.713)	Top-5 acc 33.594 (36.017)	lr 0.03383
Warmup Train [16][1310/3239]	Time 0.670 (0.521)	Data 0.001 (0.019)	Loss 4.9230 (4.8048)	Top-1 acc 15.625 (16.700)	Top-5 acc 30.859 (36.000)	lr 0.03383
Warmup Train [16][1320/3239]	Time 0.352 (0.520)	Data 0.002 (0.019)	Loss 4.9301 (4.8047)	Top-1 acc 12.500 (16.701)	Top-5 acc 32.812 (36.007)	lr 0.03382
Warmup Train [16][1330/3239]	Time 0.506 (0.520)	Data 0.002 (0.019)	Loss 4.8350 (4.8045)	Top-1 acc 16.016 (16.705)	Top-5 acc 34.766 (36.009)	lr 0.03382
Warmup Train [16][1340/3239]	Time 0.336 (0.520)	Data 0.001 (0.019)	Loss 4.7820 (4.8046)	Top-1 acc 16.016 (16.700)	Top-5 acc 38.281 (36.011)	lr 0.03381
Warmup Train [16][1350/3239]	Time 0.560 (0.520)	Data 0.001 (0.019)	Loss 4.7821 (4.8046)	Top-1 acc 18.750 (16.706)	Top-5 acc 39.062 (36.012)	lr 0.03381
Warmup Train [16][1360/3239]	Time 0.573 (0.520)	Data 0.001 (0.019)	Loss 4.8453 (4.8046)	Top-1 acc 14.844 (16.706)	Top-5 acc 33.594 (36.012)	lr 0.03380
Warmup Train [16][1370/3239]	Time 0.446 (0.520)	Data 0.001 (0.018)	Loss 4.9593 (4.8043)	Top-1 acc 14.844 (16.705)	Top-5 acc 32.812 (36.019)	lr 0.03379
Warmup Train [16][1380/3239]	Time 0.611 (0.520)	Data 0.001 (0.018)	Loss 4.7200 (4.8040)	Top-1 acc 20.703 (16.719)	Top-5 acc 39.062 (36.030)	lr 0.03379
Warmup Train [16][1390/3239]	Time 0.601 (0.520)	Data 0.001 (0.018)	Loss 4.5447 (4.8035)	Top-1 acc 17.578 (16.721)	Top-5 acc 43.750 (36.050)	lr 0.03378
Warmup Train [16][1400/3239]	Time 0.713 (0.520)	Data 0.001 (0.018)	Loss 4.6118 (4.8028)	Top-1 acc 18.750 (16.729)	Top-5 acc 42.578 (36.063)	lr 0.03378
Warmup Train [16][1410/3239]	Time 0.546 (0.520)	Data 0.001 (0.018)	Loss 4.7192 (4.8028)	Top-1 acc 17.188 (16.727)	Top-5 acc 39.453 (36.069)	lr 0.03377
Warmup Train [16][1420/3239]	Time 0.321 (0.520)	Data 0.001 (0.018)	Loss 4.9800 (4.8027)	Top-1 acc 14.844 (16.731)	Top-5 acc 28.906 (36.069)	lr 0.03377
Warmup Train [16][1430/3239]	Time 0.515 (0.520)	Data 0.001 (0.018)	Loss 4.6620 (4.8024)	Top-1 acc 17.578 (16.734)	Top-5 acc 38.672 (36.079)	lr 0.03376
Warmup Train [16][1440/3239]	Time 0.531 (0.520)	Data 0.001 (0.018)	Loss 4.6890 (4.8023)	Top-1 acc 20.312 (16.739)	Top-5 acc 35.938 (36.083)	lr 0.03376
Warmup Train [16][1450/3239]	Time 0.522 (0.519)	Data 0.001 (0.018)	Loss 4.7162 (4.8023)	Top-1 acc 16.797 (16.739)	Top-5 acc 35.156 (36.076)	lr 0.03375
Warmup Train [16][1460/3239]	Time 0.411 (0.519)	Data 0.001 (0.018)	Loss 4.7085 (4.8021)	Top-1 acc 19.922 (16.742)	Top-5 acc 40.625 (36.083)	lr 0.03374
Warmup Train [16][1470/3239]	Time 0.591 (0.519)	Data 0.001 (0.018)	Loss 4.7704 (4.8023)	Top-1 acc 16.797 (16.735)	Top-5 acc 35.547 (36.074)	lr 0.03374
Warmup Train [16][1480/3239]	Time 0.563 (0.519)	Data 0.001 (0.018)	Loss 4.7950 (4.8018)	Top-1 acc 17.578 (16.749)	Top-5 acc 36.719 (36.085)	lr 0.03373
Warmup Train [16][1490/3239]	Time 0.502 (0.519)	Data 0.001 (0.018)	Loss 4.9540 (4.8018)	Top-1 acc 13.672 (16.742)	Top-5 acc 32.422 (36.082)	lr 0.03373
Warmup Train [16][1500/3239]	Time 0.481 (0.519)	Data 0.001 (0.017)	Loss 4.8733 (4.8015)	Top-1 acc 15.234 (16.754)	Top-5 acc 33.984 (36.090)	lr 0.03372
Warmup Train [16][1510/3239]	Time 0.617 (0.519)	Data 0.001 (0.017)	Loss 4.9488 (4.8017)	Top-1 acc 14.062 (16.748)	Top-5 acc 32.812 (36.085)	lr 0.03372
Warmup Train [16][1520/3239]	Time 0.666 (0.519)	Data 0.001 (0.017)	Loss 4.8385 (4.8017)	Top-1 acc 17.188 (16.747)	Top-5 acc 37.891 (36.086)	lr 0.03371
Warmup Train [16][1530/3239]	Time 0.694 (0.519)	Data 0.001 (0.017)	Loss 4.7704 (4.8014)	Top-1 acc 17.188 (16.751)	Top-5 acc 39.453 (36.094)	lr 0.03370
Warmup Train [16][1540/3239]	Time 0.523 (0.519)	Data 0.001 (0.017)	Loss 4.7904 (4.8013)	Top-1 acc 16.406 (16.754)	Top-5 acc 36.328 (36.090)	lr 0.03370
Warmup Train [16][1550/3239]	Time 0.648 (0.519)	Data 0.001 (0.017)	Loss 4.7159 (4.8011)	Top-1 acc 19.922 (16.756)	Top-5 acc 38.672 (36.092)	lr 0.03369
Warmup Train [16][1560/3239]	Time 0.488 (0.519)	Data 0.001 (0.017)	Loss 4.8702 (4.8011)	Top-1 acc 16.016 (16.753)	Top-5 acc 33.984 (36.098)	lr 0.03369
Warmup Train [16][1570/3239]	Time 0.435 (0.519)	Data 0.001 (0.017)	Loss 4.8744 (4.8014)	Top-1 acc 15.625 (16.747)	Top-5 acc 34.375 (36.090)	lr 0.03368
Warmup Train [16][1580/3239]	Time 0.616 (0.519)	Data 0.001 (0.017)	Loss 4.7650 (4.8010)	Top-1 acc 19.141 (16.764)	Top-5 acc 37.891 (36.101)	lr 0.03368
Warmup Train [16][1590/3239]	Time 0.454 (0.519)	Data 0.001 (0.017)	Loss 4.6837 (4.8007)	Top-1 acc 16.406 (16.764)	Top-5 acc 37.891 (36.103)	lr 0.03367
Warmup Train [16][1600/3239]	Time 0.516 (0.519)	Data 0.001 (0.017)	Loss 4.7306 (4.8006)	Top-1 acc 17.969 (16.764)	Top-5 acc 35.547 (36.104)	lr 0.03366
Warmup Train [16][1610/3239]	Time 0.601 (0.518)	Data 0.001 (0.017)	Loss 4.7575 (4.8004)	Top-1 acc 19.922 (16.773)	Top-5 acc 37.891 (36.104)	lr 0.03366
Warmup Train [16][1620/3239]	Time 0.552 (0.518)	Data 0.001 (0.016)	Loss 4.9482 (4.8004)	Top-1 acc 16.406 (16.774)	Top-5 acc 37.500 (36.109)	lr 0.03365
Warmup Train [16][1630/3239]	Time 0.461 (0.518)	Data 0.001 (0.016)	Loss 4.7180 (4.8005)	Top-1 acc 17.969 (16.770)	Top-5 acc 37.891 (36.104)	lr 0.03365
Warmup Train [16][1640/3239]	Time 0.477 (0.518)	Data 0.001 (0.016)	Loss 4.8254 (4.8009)	Top-1 acc 15.625 (16.768)	Top-5 acc 37.500 (36.098)	lr 0.03364
Warmup Train [16][1650/3239]	Time 0.635 (0.518)	Data 0.001 (0.016)	Loss 4.6457 (4.8007)	Top-1 acc 20.312 (16.767)	Top-5 acc 41.016 (36.104)	lr 0.03364
Warmup Train [16][1660/3239]	Time 0.308 (0.518)	Data 0.002 (0.016)	Loss 4.8923 (4.8005)	Top-1 acc 14.062 (16.774)	Top-5 acc 33.594 (36.110)	lr 0.03363
Warmup Train [16][1670/3239]	Time 0.617 (0.518)	Data 0.001 (0.016)	Loss 4.9146 (4.8005)	Top-1 acc 12.891 (16.773)	Top-5 acc 35.547 (36.110)	lr 0.03362
Warmup Train [16][1680/3239]	Time 0.547 (0.518)	Data 0.001 (0.016)	Loss 4.6106 (4.8004)	Top-1 acc 19.531 (16.773)	Top-5 acc 42.188 (36.113)	lr 0.03362
Warmup Train [16][1690/3239]	Time 0.621 (0.518)	Data 0.001 (0.016)	Loss 4.7273 (4.8002)	Top-1 acc 20.312 (16.778)	Top-5 acc 37.891 (36.119)	lr 0.03361
Warmup Train [16][1700/3239]	Time 0.603 (0.518)	Data 0.001 (0.016)	Loss 4.8061 (4.8000)	Top-1 acc 14.062 (16.774)	Top-5 acc 36.328 (36.118)	lr 0.03361
Warmup Train [16][1710/3239]	Time 0.479 (0.518)	Data 0.001 (0.016)	Loss 4.8166 (4.8001)	Top-1 acc 14.062 (16.764)	Top-5 acc 33.984 (36.114)	lr 0.03360
Warmup Train [16][1720/3239]	Time 0.837 (0.518)	Data 0.001 (0.016)	Loss 4.8086 (4.7998)	Top-1 acc 19.141 (16.766)	Top-5 acc 33.984 (36.117)	lr 0.03360
Warmup Train [16][1730/3239]	Time 0.528 (0.518)	Data 0.002 (0.016)	Loss 4.7029 (4.7995)	Top-1 acc 17.578 (16.766)	Top-5 acc 34.375 (36.121)	lr 0.03359
Warmup Train [16][1740/3239]	Time 0.389 (0.518)	Data 0.001 (0.016)	Loss 4.6094 (4.7992)	Top-1 acc 22.266 (16.765)	Top-5 acc 40.234 (36.122)	lr 0.03358
Warmup Train [16][1750/3239]	Time 0.540 (0.518)	Data 0.001 (0.016)	Loss 4.7381 (4.7990)	Top-1 acc 17.969 (16.763)	Top-5 acc 37.500 (36.128)	lr 0.03358
Warmup Train [16][1760/3239]	Time 0.431 (0.518)	Data 0.001 (0.016)	Loss 4.7828 (4.7988)	Top-1 acc 16.406 (16.769)	Top-5 acc 38.281 (36.131)	lr 0.03357
Warmup Train [16][1770/3239]	Time 0.469 (0.518)	Data 0.001 (0.016)	Loss 4.6506 (4.7987)	Top-1 acc 24.219 (16.776)	Top-5 acc 42.578 (36.136)	lr 0.03357
Warmup Train [16][1780/3239]	Time 0.642 (0.518)	Data 0.001 (0.016)	Loss 4.8737 (4.7988)	Top-1 acc 17.578 (16.777)	Top-5 acc 35.547 (36.140)	lr 0.03356
Warmup Train [16][1790/3239]	Time 0.449 (0.518)	Data 0.001 (0.015)	Loss 4.6627 (4.7988)	Top-1 acc 17.969 (16.781)	Top-5 acc 39.453 (36.137)	lr 0.03356
Warmup Train [16][1800/3239]	Time 0.472 (0.518)	Data 0.001 (0.015)	Loss 4.6985 (4.7985)	Top-1 acc 19.531 (16.783)	Top-5 acc 40.625 (36.139)	lr 0.03355
Warmup Train [16][1810/3239]	Time 0.747 (0.519)	Data 0.001 (0.015)	Loss 4.7315 (4.7984)	Top-1 acc 17.578 (16.782)	Top-5 acc 33.203 (36.138)	lr 0.03354
Warmup Train [16][1820/3239]	Time 0.632 (0.518)	Data 0.001 (0.015)	Loss 4.8880 (4.7984)	Top-1 acc 14.062 (16.788)	Top-5 acc 32.422 (36.145)	lr 0.03354
Warmup Train [16][1830/3239]	Time 0.556 (0.518)	Data 0.001 (0.015)	Loss 4.7565 (4.7981)	Top-1 acc 16.406 (16.787)	Top-5 acc 36.719 (36.147)	lr 0.03353
Warmup Train [16][1840/3239]	Time 0.638 (0.518)	Data 0.001 (0.015)	Loss 4.8139 (4.7981)	Top-1 acc 16.797 (16.789)	Top-5 acc 32.812 (36.143)	lr 0.03353
Warmup Train [16][1850/3239]	Time 0.581 (0.518)	Data 0.001 (0.015)	Loss 4.6817 (4.7979)	Top-1 acc 15.234 (16.794)	Top-5 acc 35.156 (36.145)	lr 0.03352
Warmup Train [16][1860/3239]	Time 0.160 (0.518)	Data 0.001 (0.015)	Loss 4.7394 (4.7976)	Top-1 acc 19.531 (16.799)	Top-5 acc 37.891 (36.148)	lr 0.03352
Warmup Train [16][1870/3239]	Time 0.430 (0.518)	Data 0.001 (0.015)	Loss 4.8824 (4.7974)	Top-1 acc 19.141 (16.801)	Top-5 acc 34.375 (36.154)	lr 0.03351
Warmup Train [16][1880/3239]	Time 0.579 (0.518)	Data 0.001 (0.015)	Loss 4.7041 (4.7974)	Top-1 acc 18.359 (16.794)	Top-5 acc 39.844 (36.150)	lr 0.03350
Warmup Train [16][1890/3239]	Time 0.568 (0.517)	Data 0.001 (0.015)	Loss 4.6606 (4.7973)	Top-1 acc 18.359 (16.792)	Top-5 acc 37.500 (36.155)	lr 0.03350
Warmup Train [16][1900/3239]	Time 0.512 (0.517)	Data 0.001 (0.015)	Loss 4.8256 (4.7971)	Top-1 acc 14.453 (16.787)	Top-5 acc 32.422 (36.158)	lr 0.03349
Warmup Train [16][1910/3239]	Time 0.459 (0.517)	Data 0.001 (0.015)	Loss 4.9690 (4.7970)	Top-1 acc 12.891 (16.787)	Top-5 acc 33.203 (36.158)	lr 0.03349
Warmup Train [16][1920/3239]	Time 0.495 (0.517)	Data 0.001 (0.015)	Loss 4.8293 (4.7968)	Top-1 acc 17.578 (16.790)	Top-5 acc 38.672 (36.159)	lr 0.03348
Warmup Train [16][1930/3239]	Time 0.397 (0.517)	Data 0.001 (0.015)	Loss 4.7348 (4.7969)	Top-1 acc 16.016 (16.787)	Top-5 acc 38.281 (36.158)	lr 0.03348
Warmup Train [16][1940/3239]	Time 0.547 (0.517)	Data 0.001 (0.015)	Loss 4.8941 (4.7967)	Top-1 acc 14.844 (16.792)	Top-5 acc 29.688 (36.159)	lr 0.03347
Warmup Train [16][1950/3239]	Time 0.521 (0.517)	Data 0.001 (0.015)	Loss 4.6371 (4.7965)	Top-1 acc 20.703 (16.796)	Top-5 acc 39.062 (36.166)	lr 0.03347
Warmup Train [16][1960/3239]	Time 0.499 (0.517)	Data 0.001 (0.015)	Loss 4.9692 (4.7963)	Top-1 acc 16.406 (16.798)	Top-5 acc 33.594 (36.177)	lr 0.03346
Warmup Train [16][1970/3239]	Time 0.378 (0.517)	Data 0.001 (0.014)	Loss 4.8838 (4.7961)	Top-1 acc 13.281 (16.804)	Top-5 acc 31.250 (36.179)	lr 0.03345
Warmup Train [16][1980/3239]	Time 0.442 (0.517)	Data 0.001 (0.014)	Loss 4.8608 (4.7961)	Top-1 acc 17.188 (16.803)	Top-5 acc 36.328 (36.174)	lr 0.03345
Warmup Train [16][1990/3239]	Time 0.597 (0.517)	Data 0.001 (0.014)	Loss 4.6490 (4.7958)	Top-1 acc 19.922 (16.809)	Top-5 acc 41.406 (36.179)	lr 0.03344
Warmup Train [16][2000/3239]	Time 0.327 (0.517)	Data 0.001 (0.014)	Loss 4.7073 (4.7956)	Top-1 acc 17.578 (16.811)	Top-5 acc 37.891 (36.177)	lr 0.03344
Warmup Train [16][2010/3239]	Time 0.579 (0.517)	Data 0.001 (0.014)	Loss 4.5608 (4.7955)	Top-1 acc 18.359 (16.815)	Top-5 acc 39.844 (36.178)	lr 0.03343
Warmup Train [16][2020/3239]	Time 0.614 (0.517)	Data 0.001 (0.014)	Loss 4.8881 (4.7953)	Top-1 acc 17.969 (16.817)	Top-5 acc 32.812 (36.177)	lr 0.03343
Warmup Train [16][2030/3239]	Time 0.502 (0.517)	Data 0.001 (0.014)	Loss 4.5497 (4.7949)	Top-1 acc 19.922 (16.823)	Top-5 acc 43.359 (36.180)	lr 0.03342
Warmup Train [16][2040/3239]	Time 0.529 (0.517)	Data 0.001 (0.014)	Loss 4.7533 (4.7949)	Top-1 acc 14.844 (16.817)	Top-5 acc 36.719 (36.176)	lr 0.03341
Warmup Train [16][2050/3239]	Time 0.389 (0.517)	Data 0.001 (0.014)	Loss 4.7488 (4.7949)	Top-1 acc 16.016 (16.820)	Top-5 acc 38.672 (36.181)	lr 0.03341
Warmup Train [16][2060/3239]	Time 0.368 (0.517)	Data 0.001 (0.014)	Loss 4.6834 (4.7949)	Top-1 acc 19.922 (16.824)	Top-5 acc 39.844 (36.182)	lr 0.03340
Warmup Train [16][2070/3239]	Time 0.542 (0.517)	Data 0.001 (0.014)	Loss 4.6168 (4.7948)	Top-1 acc 18.359 (16.825)	Top-5 acc 42.578 (36.183)	lr 0.03340
Warmup Train [16][2080/3239]	Time 0.429 (0.517)	Data 0.001 (0.014)	Loss 4.7670 (4.7945)	Top-1 acc 14.453 (16.825)	Top-5 acc 37.109 (36.190)	lr 0.03339
Warmup Train [16][2090/3239]	Time 0.525 (0.517)	Data 0.001 (0.014)	Loss 4.9448 (4.7949)	Top-1 acc 14.844 (16.819)	Top-5 acc 31.641 (36.178)	lr 0.03339
Warmup Train [16][2100/3239]	Time 0.436 (0.517)	Data 0.001 (0.014)	Loss 4.7203 (4.7950)	Top-1 acc 19.922 (16.824)	Top-5 acc 36.719 (36.183)	lr 0.03338
Warmup Train [16][2110/3239]	Time 0.497 (0.517)	Data 0.001 (0.014)	Loss 4.7096 (4.7950)	Top-1 acc 18.750 (16.824)	Top-5 acc 39.062 (36.186)	lr 0.03337
Warmup Train [16][2120/3239]	Time 0.581 (0.517)	Data 0.001 (0.014)	Loss 4.7788 (4.7951)	Top-1 acc 16.016 (16.819)	Top-5 acc 37.109 (36.180)	lr 0.03337
Warmup Train [16][2130/3239]	Time 0.505 (0.517)	Data 0.001 (0.014)	Loss 4.6528 (4.7951)	Top-1 acc 19.531 (16.823)	Top-5 acc 39.062 (36.180)	lr 0.03336
Warmup Train [16][2140/3239]	Time 0.444 (0.517)	Data 0.001 (0.014)	Loss 4.6392 (4.7951)	Top-1 acc 17.578 (16.825)	Top-5 acc 37.109 (36.179)	lr 0.03336
Warmup Train [16][2150/3239]	Time 0.408 (0.517)	Data 0.001 (0.014)	Loss 4.8646 (4.7954)	Top-1 acc 16.016 (16.818)	Top-5 acc 32.422 (36.174)	lr 0.03335
Warmup Train [16][2160/3239]	Time 0.387 (0.517)	Data 0.001 (0.014)	Loss 4.8361 (4.7955)	Top-1 acc 15.625 (16.817)	Top-5 acc 36.719 (36.170)	lr 0.03335
Warmup Train [16][2170/3239]	Time 0.441 (0.517)	Data 0.001 (0.014)	Loss 4.9618 (4.7957)	Top-1 acc 16.406 (16.816)	Top-5 acc 31.250 (36.162)	lr 0.03334
Warmup Train [16][2180/3239]	Time 0.524 (0.517)	Data 0.001 (0.014)	Loss 4.6960 (4.7956)	Top-1 acc 20.703 (16.823)	Top-5 acc 37.500 (36.168)	lr 0.03333
Warmup Train [16][2190/3239]	Time 0.688 (0.517)	Data 0.001 (0.014)	Loss 4.8137 (4.7952)	Top-1 acc 19.531 (16.833)	Top-5 acc 35.938 (36.176)	lr 0.03333
Warmup Train [16][2200/3239]	Time 0.635 (0.517)	Data 0.001 (0.014)	Loss 4.7739 (4.7950)	Top-1 acc 20.312 (16.839)	Top-5 acc 41.406 (36.186)	lr 0.03332
Warmup Train [16][2210/3239]	Time 0.451 (0.517)	Data 0.001 (0.014)	Loss 4.7794 (4.7951)	Top-1 acc 14.844 (16.834)	Top-5 acc 36.328 (36.183)	lr 0.03332
Warmup Train [16][2220/3239]	Time 0.618 (0.517)	Data 0.001 (0.014)	Loss 4.8204 (4.7950)	Top-1 acc 17.578 (16.835)	Top-5 acc 35.547 (36.182)	lr 0.03331
Warmup Train [16][2230/3239]	Time 0.521 (0.517)	Data 0.001 (0.013)	Loss 4.6688 (4.7948)	Top-1 acc 16.406 (16.841)	Top-5 acc 39.062 (36.186)	lr 0.03331
Warmup Train [16][2240/3239]	Time 0.464 (0.517)	Data 0.001 (0.013)	Loss 4.8336 (4.7949)	Top-1 acc 15.625 (16.839)	Top-5 acc 35.156 (36.187)	lr 0.03330
Warmup Train [16][2250/3239]	Time 0.497 (0.517)	Data 0.001 (0.013)	Loss 4.8125 (4.7949)	Top-1 acc 15.625 (16.837)	Top-5 acc 35.547 (36.187)	lr 0.03329
Warmup Train [16][2260/3239]	Time 0.421 (0.517)	Data 0.001 (0.013)	Loss 4.6778 (4.7948)	Top-1 acc 19.922 (16.837)	Top-5 acc 39.453 (36.185)	lr 0.03329
Warmup Train [16][2270/3239]	Time 0.614 (0.517)	Data 0.001 (0.013)	Loss 4.7238 (4.7948)	Top-1 acc 17.969 (16.843)	Top-5 acc 37.109 (36.189)	lr 0.03328
Warmup Train [16][2280/3239]	Time 0.415 (0.517)	Data 0.001 (0.013)	Loss 4.8280 (4.7949)	Top-1 acc 21.484 (16.845)	Top-5 acc 37.109 (36.186)	lr 0.03328
Warmup Train [16][2290/3239]	Time 0.604 (0.517)	Data 0.001 (0.013)	Loss 4.8993 (4.7950)	Top-1 acc 14.844 (16.839)	Top-5 acc 35.156 (36.183)	lr 0.03327
Warmup Train [16][2300/3239]	Time 0.531 (0.517)	Data 0.001 (0.013)	Loss 4.7417 (4.7949)	Top-1 acc 19.531 (16.845)	Top-5 acc 37.891 (36.181)	lr 0.03327
Warmup Train [16][2310/3239]	Time 0.782 (0.517)	Data 0.001 (0.013)	Loss 4.7265 (4.7949)	Top-1 acc 20.703 (16.847)	Top-5 acc 40.625 (36.184)	lr 0.03326
Warmup Train [16][2320/3239]	Time 0.632 (0.517)	Data 0.001 (0.013)	Loss 4.8574 (4.7947)	Top-1 acc 15.234 (16.849)	Top-5 acc 34.766 (36.188)	lr 0.03325
Warmup Train [16][2330/3239]	Time 0.577 (0.516)	Data 0.001 (0.013)	Loss 4.7756 (4.7946)	Top-1 acc 14.453 (16.847)	Top-5 acc 32.812 (36.186)	lr 0.03325
Warmup Train [16][2340/3239]	Time 0.489 (0.516)	Data 0.001 (0.013)	Loss 4.8026 (4.7945)	Top-1 acc 17.578 (16.850)	Top-5 acc 32.422 (36.190)	lr 0.03324
Warmup Train [16][2350/3239]	Time 0.508 (0.517)	Data 0.001 (0.013)	Loss 4.8015 (4.7944)	Top-1 acc 17.578 (16.855)	Top-5 acc 34.766 (36.193)	lr 0.03324
Warmup Train [16][2360/3239]	Time 0.354 (0.516)	Data 0.001 (0.013)	Loss 4.9663 (4.7944)	Top-1 acc 10.938 (16.854)	Top-5 acc 29.688 (36.191)	lr 0.03323
Warmup Train [16][2370/3239]	Time 0.402 (0.516)	Data 0.001 (0.013)	Loss 4.7121 (4.7942)	Top-1 acc 18.750 (16.854)	Top-5 acc 35.938 (36.195)	lr 0.03323
Warmup Train [16][2380/3239]	Time 0.430 (0.516)	Data 0.001 (0.013)	Loss 4.7208 (4.7941)	Top-1 acc 16.406 (16.851)	Top-5 acc 42.188 (36.199)	lr 0.03322
Warmup Train [16][2390/3239]	Time 0.547 (0.516)	Data 0.001 (0.013)	Loss 4.6588 (4.7941)	Top-1 acc 19.922 (16.851)	Top-5 acc 42.969 (36.201)	lr 0.03321
Warmup Train [16][2400/3239]	Time 0.535 (0.516)	Data 0.001 (0.013)	Loss 4.7913 (4.7939)	Top-1 acc 14.453 (16.852)	Top-5 acc 35.547 (36.206)	lr 0.03321
Warmup Train [16][2410/3239]	Time 0.638 (0.516)	Data 0.001 (0.013)	Loss 4.8424 (4.7939)	Top-1 acc 15.625 (16.850)	Top-5 acc 33.203 (36.206)	lr 0.03320
Warmup Train [16][2420/3239]	Time 0.503 (0.516)	Data 0.001 (0.013)	Loss 4.9543 (4.7937)	Top-1 acc 14.453 (16.851)	Top-5 acc 29.688 (36.205)	lr 0.03320
Warmup Train [16][2430/3239]	Time 0.519 (0.516)	Data 0.001 (0.013)	Loss 4.6959 (4.7934)	Top-1 acc 15.625 (16.854)	Top-5 acc 39.844 (36.216)	lr 0.03319
Warmup Train [16][2440/3239]	Time 0.516 (0.516)	Data 0.001 (0.013)	Loss 4.7174 (4.7935)	Top-1 acc 18.359 (16.850)	Top-5 acc 35.938 (36.210)	lr 0.03319
Warmup Train [16][2450/3239]	Time 0.529 (0.516)	Data 0.001 (0.013)	Loss 4.6422 (4.7932)	Top-1 acc 19.141 (16.852)	Top-5 acc 41.797 (36.211)	lr 0.03318
Warmup Train [16][2460/3239]	Time 0.510 (0.516)	Data 0.001 (0.013)	Loss 4.9157 (4.7934)	Top-1 acc 18.750 (16.852)	Top-5 acc 32.812 (36.212)	lr 0.03317
Warmup Train [16][2470/3239]	Time 0.503 (0.516)	Data 0.002 (0.013)	Loss 4.7217 (4.7934)	Top-1 acc 17.578 (16.851)	Top-5 acc 35.547 (36.215)	lr 0.03317
Warmup Train [16][2480/3239]	Time 0.481 (0.516)	Data 0.001 (0.013)	Loss 4.8992 (4.7932)	Top-1 acc 16.797 (16.850)	Top-5 acc 35.156 (36.217)	lr 0.03316
Warmup Train [16][2490/3239]	Time 0.607 (0.516)	Data 0.001 (0.013)	Loss 4.6987 (4.7931)	Top-1 acc 17.969 (16.851)	Top-5 acc 40.234 (36.223)	lr 0.03316
Warmup Train [16][2500/3239]	Time 0.497 (0.516)	Data 0.001 (0.013)	Loss 4.7836 (4.7928)	Top-1 acc 14.844 (16.854)	Top-5 acc 35.547 (36.230)	lr 0.03315
Warmup Train [16][2510/3239]	Time 0.723 (0.516)	Data 0.001 (0.013)	Loss 4.7272 (4.7925)	Top-1 acc 16.797 (16.859)	Top-5 acc 38.281 (36.239)	lr 0.03314
Warmup Train [16][2520/3239]	Time 0.397 (0.516)	Data 0.002 (0.012)	Loss 4.6214 (4.7923)	Top-1 acc 18.359 (16.864)	Top-5 acc 37.891 (36.246)	lr 0.03314
Warmup Train [16][2530/3239]	Time 0.562 (0.516)	Data 0.001 (0.012)	Loss 4.8615 (4.7923)	Top-1 acc 11.328 (16.859)	Top-5 acc 33.594 (36.245)	lr 0.03313
Warmup Train [16][2540/3239]	Time 0.577 (0.516)	Data 0.001 (0.012)	Loss 4.7193 (4.7926)	Top-1 acc 20.703 (16.853)	Top-5 acc 38.281 (36.238)	lr 0.03313
Warmup Train [16][2550/3239]	Time 0.488 (0.516)	Data 0.001 (0.012)	Loss 4.9740 (4.7925)	Top-1 acc 15.625 (16.856)	Top-5 acc 34.766 (36.237)	lr 0.03312
Warmup Train [16][2560/3239]	Time 0.517 (0.516)	Data 0.001 (0.012)	Loss 4.7008 (4.7922)	Top-1 acc 17.969 (16.863)	Top-5 acc 40.234 (36.248)	lr 0.03312
Warmup Train [16][2570/3239]	Time 0.471 (0.516)	Data 0.001 (0.012)	Loss 4.6860 (4.7920)	Top-1 acc 19.922 (16.870)	Top-5 acc 38.672 (36.255)	lr 0.03311
Warmup Train [16][2580/3239]	Time 0.488 (0.516)	Data 0.001 (0.012)	Loss 4.6910 (4.7918)	Top-1 acc 17.969 (16.869)	Top-5 acc 37.891 (36.258)	lr 0.03310
Warmup Train [16][2590/3239]	Time 0.487 (0.516)	Data 0.001 (0.012)	Loss 4.6123 (4.7915)	Top-1 acc 19.922 (16.872)	Top-5 acc 44.531 (36.266)	lr 0.03310
Warmup Train [16][2600/3239]	Time 0.503 (0.516)	Data 0.001 (0.012)	Loss 4.7200 (4.7916)	Top-1 acc 17.969 (16.873)	Top-5 acc 38.672 (36.267)	lr 0.03309
Warmup Train [16][2610/3239]	Time 0.595 (0.516)	Data 0.001 (0.012)	Loss 4.8131 (4.7915)	Top-1 acc 17.578 (16.874)	Top-5 acc 36.719 (36.272)	lr 0.03309
Warmup Train [16][2620/3239]	Time 0.563 (0.516)	Data 0.001 (0.012)	Loss 4.8542 (4.7914)	Top-1 acc 16.016 (16.878)	Top-5 acc 34.375 (36.277)	lr 0.03308
Warmup Train [16][2630/3239]	Time 0.483 (0.516)	Data 0.001 (0.012)	Loss 4.8545 (4.7913)	Top-1 acc 15.234 (16.878)	Top-5 acc 34.766 (36.278)	lr 0.03308
Warmup Train [16][2640/3239]	Time 0.551 (0.516)	Data 0.001 (0.012)	Loss 4.8088 (4.7912)	Top-1 acc 16.016 (16.880)	Top-5 acc 37.109 (36.280)	lr 0.03307
Warmup Train [16][2650/3239]	Time 0.462 (0.516)	Data 0.001 (0.012)	Loss 4.6614 (4.7910)	Top-1 acc 14.844 (16.881)	Top-5 acc 39.844 (36.285)	lr 0.03306
Warmup Train [16][2660/3239]	Time 0.496 (0.516)	Data 0.001 (0.012)	Loss 4.7678 (4.7909)	Top-1 acc 16.406 (16.884)	Top-5 acc 37.500 (36.289)	lr 0.03306
Warmup Train [16][2670/3239]	Time 0.464 (0.516)	Data 0.001 (0.012)	Loss 4.9109 (4.7907)	Top-1 acc 15.625 (16.887)	Top-5 acc 32.031 (36.293)	lr 0.03305
Warmup Train [16][2680/3239]	Time 0.606 (0.516)	Data 0.001 (0.012)	Loss 5.0803 (4.7907)	Top-1 acc 13.281 (16.886)	Top-5 acc 30.859 (36.295)	lr 0.03305
Warmup Train [16][2690/3239]	Time 0.360 (0.516)	Data 0.001 (0.012)	Loss 4.8422 (4.7907)	Top-1 acc 18.359 (16.888)	Top-5 acc 38.672 (36.293)	lr 0.03304
Warmup Train [16][2700/3239]	Time 0.573 (0.516)	Data 0.001 (0.012)	Loss 4.6800 (4.7906)	Top-1 acc 17.969 (16.891)	Top-5 acc 41.016 (36.296)	lr 0.03304
Warmup Train [16][2710/3239]	Time 0.545 (0.516)	Data 0.005 (0.012)	Loss 4.7418 (4.7905)	Top-1 acc 15.625 (16.888)	Top-5 acc 37.500 (36.295)	lr 0.03303
Warmup Train [16][2720/3239]	Time 0.623 (0.516)	Data 0.001 (0.012)	Loss 4.9270 (4.7905)	Top-1 acc 14.062 (16.888)	Top-5 acc 32.031 (36.292)	lr 0.03302
Warmup Train [16][2730/3239]	Time 0.591 (0.516)	Data 0.001 (0.012)	Loss 4.7554 (4.7904)	Top-1 acc 15.234 (16.888)	Top-5 acc 34.766 (36.293)	lr 0.03302
Warmup Train [16][2740/3239]	Time 0.619 (0.516)	Data 0.001 (0.012)	Loss 4.6663 (4.7903)	Top-1 acc 15.234 (16.887)	Top-5 acc 38.281 (36.291)	lr 0.03301
Warmup Train [16][2750/3239]	Time 0.354 (0.516)	Data 0.001 (0.012)	Loss 5.0079 (4.7903)	Top-1 acc 13.281 (16.889)	Top-5 acc 29.297 (36.293)	lr 0.03301
Warmup Train [16][2760/3239]	Time 0.300 (0.515)	Data 0.001 (0.012)	Loss 4.7860 (4.7903)	Top-1 acc 19.531 (16.888)	Top-5 acc 37.109 (36.294)	lr 0.03300
Warmup Train [16][2770/3239]	Time 0.451 (0.515)	Data 0.001 (0.012)	Loss 4.7744 (4.7902)	Top-1 acc 16.797 (16.888)	Top-5 acc 35.156 (36.295)	lr 0.03300
Warmup Train [16][2780/3239]	Time 0.535 (0.516)	Data 0.001 (0.012)	Loss 4.6605 (4.7901)	Top-1 acc 16.406 (16.888)	Top-5 acc 39.453 (36.294)	lr 0.03299
Warmup Train [16][2790/3239]	Time 0.588 (0.516)	Data 0.001 (0.012)	Loss 4.6976 (4.7900)	Top-1 acc 21.094 (16.886)	Top-5 acc 38.281 (36.297)	lr 0.03298
Warmup Train [16][2800/3239]	Time 0.460 (0.516)	Data 0.001 (0.012)	Loss 4.7169 (4.7900)	Top-1 acc 19.531 (16.884)	Top-5 acc 35.547 (36.298)	lr 0.03298
Warmup Train [16][2810/3239]	Time 0.496 (0.516)	Data 0.002 (0.012)	Loss 4.9680 (4.7899)	Top-1 acc 16.016 (16.891)	Top-5 acc 34.375 (36.302)	lr 0.03297
Warmup Train [16][2820/3239]	Time 0.418 (0.516)	Data 0.001 (0.012)	Loss 4.7319 (4.7895)	Top-1 acc 17.578 (16.899)	Top-5 acc 35.547 (36.313)	lr 0.03297
Warmup Train [16][2830/3239]	Time 0.549 (0.516)	Data 0.003 (0.012)	Loss 4.6204 (4.7891)	Top-1 acc 14.062 (16.904)	Top-5 acc 41.797 (36.325)	lr 0.03296
Warmup Train [16][2840/3239]	Time 0.364 (0.516)	Data 0.001 (0.012)	Loss 4.9341 (4.7891)	Top-1 acc 14.844 (16.902)	Top-5 acc 34.375 (36.322)	lr 0.03296
Warmup Train [16][2850/3239]	Time 0.530 (0.516)	Data 0.001 (0.012)	Loss 4.7667 (4.7891)	Top-1 acc 21.875 (16.904)	Top-5 acc 36.328 (36.316)	lr 0.03295
Warmup Train [16][2860/3239]	Time 0.332 (0.515)	Data 0.001 (0.012)	Loss 4.6876 (4.7891)	Top-1 acc 15.625 (16.906)	Top-5 acc 39.453 (36.318)	lr 0.03294
Warmup Train [16][2870/3239]	Time 0.539 (0.516)	Data 0.001 (0.012)	Loss 4.8189 (4.7890)	Top-1 acc 15.625 (16.907)	Top-5 acc 35.156 (36.319)	lr 0.03294
Warmup Train [16][2880/3239]	Time 0.443 (0.515)	Data 0.001 (0.012)	Loss 4.7554 (4.7888)	Top-1 acc 17.188 (16.907)	Top-5 acc 37.500 (36.325)	lr 0.03293
Warmup Train [16][2890/3239]	Time 0.575 (0.516)	Data 0.001 (0.012)	Loss 4.5640 (4.7887)	Top-1 acc 20.312 (16.911)	Top-5 acc 41.016 (36.327)	lr 0.03293
Warmup Train [16][2900/3239]	Time 0.520 (0.515)	Data 0.001 (0.012)	Loss 4.8183 (4.7888)	Top-1 acc 17.188 (16.908)	Top-5 acc 33.984 (36.324)	lr 0.03292
Warmup Train [16][2910/3239]	Time 0.579 (0.515)	Data 0.001 (0.012)	Loss 4.6657 (4.7889)	Top-1 acc 20.703 (16.904)	Top-5 acc 41.797 (36.324)	lr 0.03292
Warmup Train [16][2920/3239]	Time 0.333 (0.515)	Data 0.001 (0.012)	Loss 4.7282 (4.7888)	Top-1 acc 23.047 (16.905)	Top-5 acc 38.672 (36.325)	lr 0.03291
Warmup Train [16][2930/3239]	Time 0.452 (0.515)	Data 0.001 (0.012)	Loss 4.8996 (4.7888)	Top-1 acc 16.016 (16.908)	Top-5 acc 32.812 (36.326)	lr 0.03290
Warmup Train [16][2940/3239]	Time 0.413 (0.515)	Data 0.001 (0.012)	Loss 4.5828 (4.7888)	Top-1 acc 23.828 (16.910)	Top-5 acc 42.969 (36.329)	lr 0.03290
Warmup Train [16][2950/3239]	Time 0.521 (0.515)	Data 0.001 (0.012)	Loss 4.7651 (4.7888)	Top-1 acc 16.406 (16.909)	Top-5 acc 35.156 (36.329)	lr 0.03289
Warmup Train [16][2960/3239]	Time 0.605 (0.515)	Data 0.034 (0.012)	Loss 4.9423 (4.7886)	Top-1 acc 12.500 (16.913)	Top-5 acc 34.375 (36.335)	lr 0.03289
Warmup Train [16][2970/3239]	Time 0.386 (0.515)	Data 0.001 (0.012)	Loss 4.7819 (4.7884)	Top-1 acc 17.578 (16.916)	Top-5 acc 35.938 (36.338)	lr 0.03288
Warmup Train [16][2980/3239]	Time 0.455 (0.515)	Data 0.001 (0.012)	Loss 4.6257 (4.7883)	Top-1 acc 23.438 (16.919)	Top-5 acc 40.625 (36.342)	lr 0.03288
Warmup Train [16][2990/3239]	Time 0.610 (0.515)	Data 0.001 (0.012)	Loss 4.7884 (4.7883)	Top-1 acc 19.531 (16.923)	Top-5 acc 35.547 (36.344)	lr 0.03287
Warmup Train [16][3000/3239]	Time 0.491 (0.515)	Data 0.001 (0.012)	Loss 4.7194 (4.7880)	Top-1 acc 18.750 (16.928)	Top-5 acc 38.281 (36.350)	lr 0.03286
Warmup Train [16][3010/3239]	Time 0.630 (0.515)	Data 0.001 (0.012)	Loss 4.6957 (4.7879)	Top-1 acc 15.625 (16.926)	Top-5 acc 37.891 (36.351)	lr 0.03286
Warmup Train [16][3020/3239]	Time 0.524 (0.515)	Data 0.001 (0.012)	Loss 4.6405 (4.7878)	Top-1 acc 18.359 (16.928)	Top-5 acc 37.500 (36.351)	lr 0.03285
Warmup Train [16][3030/3239]	Time 0.593 (0.515)	Data 0.001 (0.012)	Loss 4.7160 (4.7880)	Top-1 acc 17.578 (16.919)	Top-5 acc 39.062 (36.345)	lr 0.03285
Warmup Train [16][3040/3239]	Time 0.541 (0.515)	Data 0.001 (0.012)	Loss 4.6365 (4.7880)	Top-1 acc 18.359 (16.920)	Top-5 acc 36.328 (36.343)	lr 0.03284
Warmup Train [16][3050/3239]	Time 0.449 (0.515)	Data 0.001 (0.012)	Loss 4.8842 (4.7878)	Top-1 acc 16.797 (16.921)	Top-5 acc 34.375 (36.348)	lr 0.03283
Warmup Train [16][3060/3239]	Time 0.371 (0.515)	Data 0.001 (0.012)	Loss 4.9962 (4.7877)	Top-1 acc 13.281 (16.922)	Top-5 acc 31.250 (36.351)	lr 0.03283
Warmup Train [16][3070/3239]	Time 0.616 (0.515)	Data 0.001 (0.012)	Loss 4.8284 (4.7877)	Top-1 acc 18.750 (16.924)	Top-5 acc 37.891 (36.353)	lr 0.03282
Warmup Train [16][3080/3239]	Time 0.424 (0.515)	Data 0.001 (0.012)	Loss 4.8713 (4.7876)	Top-1 acc 16.797 (16.929)	Top-5 acc 38.672 (36.358)	lr 0.03282
Warmup Train [16][3090/3239]	Time 0.520 (0.515)	Data 0.001 (0.012)	Loss 4.6877 (4.7874)	Top-1 acc 18.359 (16.932)	Top-5 acc 39.453 (36.361)	lr 0.03281
Warmup Train [16][3100/3239]	Time 0.517 (0.515)	Data 0.001 (0.012)	Loss 4.8949 (4.7875)	Top-1 acc 16.406 (16.930)	Top-5 acc 35.547 (36.360)	lr 0.03281
Warmup Train [16][3110/3239]	Time 0.367 (0.515)	Data 0.001 (0.012)	Loss 4.8064 (4.7874)	Top-1 acc 16.406 (16.931)	Top-5 acc 35.547 (36.360)	lr 0.03280
Warmup Train [16][3120/3239]	Time 0.509 (0.515)	Data 0.001 (0.012)	Loss 4.7420 (4.7874)	Top-1 acc 15.234 (16.928)	Top-5 acc 39.453 (36.359)	lr 0.03279
Warmup Train [16][3130/3239]	Time 0.455 (0.515)	Data 0.001 (0.012)	Loss 4.7059 (4.7875)	Top-1 acc 16.797 (16.926)	Top-5 acc 37.891 (36.359)	lr 0.03279
Warmup Train [16][3140/3239]	Time 0.501 (0.515)	Data 0.001 (0.012)	Loss 4.6797 (4.7874)	Top-1 acc 17.578 (16.923)	Top-5 acc 39.062 (36.358)	lr 0.03278
Warmup Train [16][3150/3239]	Time 0.435 (0.515)	Data 0.001 (0.011)	Loss 4.8320 (4.7874)	Top-1 acc 16.016 (16.925)	Top-5 acc 31.641 (36.357)	lr 0.03278
Warmup Train [16][3160/3239]	Time 0.492 (0.515)	Data 0.001 (0.011)	Loss 4.7567 (4.7873)	Top-1 acc 18.359 (16.927)	Top-5 acc 35.156 (36.356)	lr 0.03277
Warmup Train [16][3170/3239]	Time 0.723 (0.515)	Data 0.001 (0.011)	Loss 4.8043 (4.7875)	Top-1 acc 12.109 (16.925)	Top-5 acc 35.156 (36.356)	lr 0.03277
Warmup Train [16][3180/3239]	Time 0.545 (0.515)	Data 0.000 (0.011)	Loss 4.6363 (4.7873)	Top-1 acc 18.359 (16.923)	Top-5 acc 39.844 (36.363)	lr 0.03276
Warmup Train [16][3190/3239]	Time 0.445 (0.515)	Data 0.000 (0.011)	Loss 4.7679 (4.7870)	Top-1 acc 17.969 (16.926)	Top-5 acc 36.328 (36.368)	lr 0.03275
Warmup Train [16][3200/3239]	Time 0.446 (0.515)	Data 0.000 (0.011)	Loss 4.8541 (4.7868)	Top-1 acc 16.406 (16.928)	Top-5 acc 35.938 (36.371)	lr 0.03275
Warmup Train [16][3210/3239]	Time 0.472 (0.515)	Data 0.000 (0.011)	Loss 4.5117 (4.7867)	Top-1 acc 19.531 (16.929)	Top-5 acc 40.234 (36.374)	lr 0.03274
Warmup Train [16][3220/3239]	Time 0.395 (0.515)	Data 0.000 (0.011)	Loss 4.8189 (4.7867)	Top-1 acc 14.844 (16.928)	Top-5 acc 36.719 (36.375)	lr 0.03274
Warmup Train [16][3230/3239]	Time 0.618 (0.515)	Data 0.000 (0.011)	Loss 4.7920 (4.7867)	Top-1 acc 16.797 (16.929)	Top-5 acc 36.719 (36.374)	lr 0.03273
Warmup Train [16][3239/3239]	Time 0.337 (0.514)	Data 0.000 (0.011)	Loss 4.7017 (4.7865)	Top-1 acc 19.753 (16.935)	Top-5 acc 29.630 (36.381)	lr 0.03273
==========Warmup Valid [16/40]	loss 3.863	top-1 acc 23.591	top-5 acc 46.288	Train top-1 16.935	top-5 36.381	flops: 442.4M
Warmup Train [17][0/3239]	Time 14.788 (14.788)	Data 11.660 (11.660)	Loss 4.6949 (4.6949)	Top-1 acc 20.703 (20.703)	Top-5 acc 37.109 (37.109)	lr 0.03273
Warmup Train [17][10/3239]	Time 0.540 (1.860)	Data 0.001 (1.072)	Loss 4.7884 (4.7470)	Top-1 acc 16.797 (18.075)	Top-5 acc 33.984 (36.825)	lr 0.03272
Warmup Train [17][20/3239]	Time 0.447 (1.215)	Data 0.001 (0.563)	Loss 4.6649 (4.7635)	Top-1 acc 21.875 (17.671)	Top-5 acc 36.328 (36.737)	lr 0.03271
Warmup Train [17][30/3239]	Time 0.482 (0.988)	Data 0.001 (0.384)	Loss 4.4945 (4.7438)	Top-1 acc 20.703 (17.704)	Top-5 acc 39.453 (37.286)	lr 0.03271
Warmup Train [17][40/3239]	Time 0.554 (0.869)	Data 0.002 (0.291)	Loss 4.8036 (4.7581)	Top-1 acc 15.625 (17.207)	Top-5 acc 32.812 (36.747)	lr 0.03270
Warmup Train [17][50/3239]	Time 0.514 (0.800)	Data 0.001 (0.235)	Loss 4.9335 (4.7549)	Top-1 acc 14.062 (17.233)	Top-5 acc 35.156 (36.941)	lr 0.03270
Warmup Train [17][60/3239]	Time 0.528 (0.755)	Data 0.001 (0.196)	Loss 4.7681 (4.7494)	Top-1 acc 16.797 (17.386)	Top-5 acc 35.156 (37.071)	lr 0.03269
Warmup Train [17][70/3239]	Time 0.521 (0.719)	Data 0.001 (0.169)	Loss 4.6624 (4.7499)	Top-1 acc 18.750 (17.375)	Top-5 acc 38.672 (36.911)	lr 0.03269
Warmup Train [17][80/3239]	Time 0.740 (0.697)	Data 0.001 (0.149)	Loss 4.8620 (4.7498)	Top-1 acc 12.891 (17.313)	Top-5 acc 32.812 (36.984)	lr 0.03268
Warmup Train [17][90/3239]	Time 0.530 (0.678)	Data 0.001 (0.133)	Loss 4.9980 (4.7497)	Top-1 acc 12.500 (17.162)	Top-5 acc 32.422 (36.998)	lr 0.03267
Warmup Train [17][100/3239]	Time 0.484 (0.660)	Data 0.030 (0.120)	Loss 4.6664 (4.7487)	Top-1 acc 17.969 (17.300)	Top-5 acc 41.016 (37.140)	lr 0.03267
Warmup Train [17][110/3239]	Time 0.587 (0.642)	Data 0.001 (0.109)	Loss 4.7727 (4.7443)	Top-1 acc 17.578 (17.399)	Top-5 acc 38.281 (37.271)	lr 0.03266
Warmup Train [17][120/3239]	Time 0.553 (0.631)	Data 0.001 (0.101)	Loss 4.7499 (4.7423)	Top-1 acc 14.844 (17.462)	Top-5 acc 34.766 (37.306)	lr 0.03266
Warmup Train [17][130/3239]	Time 0.548 (0.620)	Data 0.001 (0.093)	Loss 4.7384 (4.7361)	Top-1 acc 16.797 (17.563)	Top-5 acc 35.938 (37.419)	lr 0.03265
Warmup Train [17][140/3239]	Time 0.573 (0.613)	Data 0.001 (0.087)	Loss 4.6735 (4.7330)	Top-1 acc 19.531 (17.670)	Top-5 acc 37.500 (37.458)	lr 0.03264
Warmup Train [17][150/3239]	Time 0.459 (0.602)	Data 0.001 (0.081)	Loss 4.5559 (4.7334)	Top-1 acc 19.141 (17.651)	Top-5 acc 42.188 (37.461)	lr 0.03264
Warmup Train [17][160/3239]	Time 0.408 (0.598)	Data 0.001 (0.076)	Loss 4.7076 (4.7334)	Top-1 acc 17.188 (17.661)	Top-5 acc 36.719 (37.425)	lr 0.03263
Warmup Train [17][170/3239]	Time 0.370 (0.592)	Data 0.001 (0.073)	Loss 4.5272 (4.7312)	Top-1 acc 19.141 (17.667)	Top-5 acc 40.625 (37.457)	lr 0.03263
Warmup Train [17][180/3239]	Time 0.480 (0.587)	Data 0.001 (0.069)	Loss 4.7619 (4.7317)	Top-1 acc 14.062 (17.606)	Top-5 acc 37.891 (37.446)	lr 0.03262
Warmup Train [17][190/3239]	Time 0.683 (0.585)	Data 0.001 (0.067)	Loss 4.5186 (4.7307)	Top-1 acc 19.922 (17.635)	Top-5 acc 41.016 (37.461)	lr 0.03262
Warmup Train [17][200/3239]	Time 0.537 (0.581)	Data 0.001 (0.063)	Loss 4.8590 (4.7295)	Top-1 acc 18.359 (17.691)	Top-5 acc 35.547 (37.552)	lr 0.03261
Warmup Train [17][210/3239]	Time 0.502 (0.577)	Data 0.001 (0.060)	Loss 4.6368 (4.7288)	Top-1 acc 19.531 (17.771)	Top-5 acc 39.453 (37.613)	lr 0.03260
Warmup Train [17][220/3239]	Time 0.476 (0.573)	Data 0.001 (0.058)	Loss 4.9253 (4.7306)	Top-1 acc 12.891 (17.765)	Top-5 acc 32.422 (37.603)	lr 0.03260
Warmup Train [17][230/3239]	Time 0.374 (0.570)	Data 0.001 (0.055)	Loss 5.0094 (4.7325)	Top-1 acc 14.062 (17.702)	Top-5 acc 31.641 (37.598)	lr 0.03259
Warmup Train [17][240/3239]	Time 0.459 (0.568)	Data 0.001 (0.054)	Loss 4.6446 (4.7317)	Top-1 acc 15.625 (17.747)	Top-5 acc 41.016 (37.623)	lr 0.03259
Warmup Train [17][250/3239]	Time 0.472 (0.567)	Data 0.001 (0.052)	Loss 4.5741 (4.7298)	Top-1 acc 21.094 (17.766)	Top-5 acc 43.750 (37.648)	lr 0.03258
Warmup Train [17][260/3239]	Time 0.439 (0.565)	Data 0.001 (0.051)	Loss 4.6471 (4.7274)	Top-1 acc 17.969 (17.798)	Top-5 acc 39.062 (37.698)	lr 0.03258
Warmup Train [17][270/3239]	Time 0.409 (0.564)	Data 0.001 (0.049)	Loss 4.6645 (4.7273)	Top-1 acc 14.844 (17.816)	Top-5 acc 35.547 (37.713)	lr 0.03257
Warmup Train [17][280/3239]	Time 0.582 (0.563)	Data 0.001 (0.048)	Loss 4.7067 (4.7269)	Top-1 acc 20.703 (17.824)	Top-5 acc 38.672 (37.743)	lr 0.03256
Warmup Train [17][290/3239]	Time 0.643 (0.561)	Data 0.001 (0.046)	Loss 5.0468 (4.7267)	Top-1 acc 12.109 (17.814)	Top-5 acc 33.203 (37.723)	lr 0.03256
Warmup Train [17][300/3239]	Time 0.744 (0.559)	Data 0.001 (0.045)	Loss 4.7174 (4.7281)	Top-1 acc 17.578 (17.794)	Top-5 acc 39.062 (37.684)	lr 0.03255
Warmup Train [17][310/3239]	Time 0.569 (0.558)	Data 0.002 (0.043)	Loss 4.7889 (4.7292)	Top-1 acc 18.750 (17.777)	Top-5 acc 34.766 (37.642)	lr 0.03255
Warmup Train [17][320/3239]	Time 0.543 (0.557)	Data 0.001 (0.042)	Loss 4.8958 (4.7313)	Top-1 acc 17.969 (17.748)	Top-5 acc 37.109 (37.630)	lr 0.03254
Warmup Train [17][330/3239]	Time 0.566 (0.555)	Data 0.001 (0.041)	Loss 4.7699 (4.7309)	Top-1 acc 15.625 (17.747)	Top-5 acc 37.500 (37.666)	lr 0.03253
Warmup Train [17][340/3239]	Time 0.475 (0.554)	Data 0.001 (0.040)	Loss 4.6173 (4.7321)	Top-1 acc 17.188 (17.713)	Top-5 acc 39.453 (37.636)	lr 0.03253
Warmup Train [17][350/3239]	Time 0.595 (0.553)	Data 0.001 (0.039)	Loss 4.6515 (4.7322)	Top-1 acc 19.141 (17.721)	Top-5 acc 39.453 (37.634)	lr 0.03252
Warmup Train [17][360/3239]	Time 0.542 (0.552)	Data 0.001 (0.038)	Loss 4.6407 (4.7336)	Top-1 acc 22.266 (17.705)	Top-5 acc 39.453 (37.595)	lr 0.03252
Warmup Train [17][370/3239]	Time 0.449 (0.550)	Data 0.002 (0.037)	Loss 4.7744 (4.7340)	Top-1 acc 16.016 (17.712)	Top-5 acc 33.984 (37.595)	lr 0.03251
Warmup Train [17][380/3239]	Time 0.609 (0.549)	Data 0.001 (0.037)	Loss 4.8515 (4.7336)	Top-1 acc 13.672 (17.742)	Top-5 acc 33.984 (37.610)	lr 0.03251
Warmup Train [17][390/3239]	Time 0.604 (0.548)	Data 0.001 (0.036)	Loss 4.7723 (4.7339)	Top-1 acc 17.188 (17.774)	Top-5 acc 35.547 (37.620)	lr 0.03250
Warmup Train [17][400/3239]	Time 0.298 (0.547)	Data 0.001 (0.035)	Loss 4.5084 (4.7314)	Top-1 acc 20.703 (17.806)	Top-5 acc 45.312 (37.687)	lr 0.03249
Warmup Train [17][410/3239]	Time 0.389 (0.545)	Data 0.001 (0.035)	Loss 4.8506 (4.7299)	Top-1 acc 14.453 (17.853)	Top-5 acc 35.547 (37.721)	lr 0.03249
Warmup Train [17][420/3239]	Time 0.417 (0.544)	Data 0.001 (0.034)	Loss 4.8744 (4.7301)	Top-1 acc 14.453 (17.866)	Top-5 acc 34.766 (37.731)	lr 0.03248
Warmup Train [17][430/3239]	Time 0.429 (0.542)	Data 0.001 (0.034)	Loss 4.8194 (4.7295)	Top-1 acc 14.844 (17.891)	Top-5 acc 40.234 (37.776)	lr 0.03248
Warmup Train [17][440/3239]	Time 0.438 (0.542)	Data 0.001 (0.033)	Loss 4.7258 (4.7302)	Top-1 acc 19.531 (17.879)	Top-5 acc 41.797 (37.783)	lr 0.03247
Warmup Train [17][450/3239]	Time 0.413 (0.541)	Data 0.001 (0.033)	Loss 4.6791 (4.7296)	Top-1 acc 18.750 (17.902)	Top-5 acc 37.891 (37.781)	lr 0.03247
Warmup Train [17][460/3239]	Time 0.397 (0.541)	Data 0.001 (0.032)	Loss 4.7258 (4.7301)	Top-1 acc 18.750 (17.890)	Top-5 acc 36.328 (37.766)	lr 0.03246
Warmup Train [17][470/3239]	Time 0.349 (0.540)	Data 0.001 (0.032)	Loss 4.7323 (4.7303)	Top-1 acc 17.188 (17.876)	Top-5 acc 37.500 (37.760)	lr 0.03245
Warmup Train [17][480/3239]	Time 0.532 (0.540)	Data 0.001 (0.031)	Loss 4.5646 (4.7298)	Top-1 acc 22.656 (17.881)	Top-5 acc 41.406 (37.757)	lr 0.03245
Warmup Train [17][490/3239]	Time 0.497 (0.539)	Data 0.001 (0.031)	Loss 4.7556 (4.7300)	Top-1 acc 17.969 (17.882)	Top-5 acc 39.062 (37.727)	lr 0.03244
Warmup Train [17][500/3239]	Time 0.629 (0.538)	Data 0.001 (0.031)	Loss 4.6818 (4.7294)	Top-1 acc 18.359 (17.875)	Top-5 acc 37.109 (37.742)	lr 0.03244
Warmup Train [17][510/3239]	Time 0.495 (0.538)	Data 0.002 (0.030)	Loss 4.6956 (4.7302)	Top-1 acc 15.625 (17.866)	Top-5 acc 33.594 (37.726)	lr 0.03243
Warmup Train [17][520/3239]	Time 0.596 (0.537)	Data 0.002 (0.030)	Loss 4.8003 (4.7305)	Top-1 acc 11.719 (17.859)	Top-5 acc 36.328 (37.738)	lr 0.03243
Warmup Train [17][530/3239]	Time 0.557 (0.537)	Data 0.002 (0.029)	Loss 4.5736 (4.7298)	Top-1 acc 17.969 (17.864)	Top-5 acc 41.406 (37.761)	lr 0.03242
Warmup Train [17][540/3239]	Time 0.610 (0.537)	Data 0.001 (0.029)	Loss 4.5704 (4.7293)	Top-1 acc 17.969 (17.876)	Top-5 acc 43.750 (37.782)	lr 0.03241
Warmup Train [17][550/3239]	Time 0.450 (0.536)	Data 0.001 (0.028)	Loss 4.7077 (4.7304)	Top-1 acc 18.750 (17.863)	Top-5 acc 37.500 (37.753)	lr 0.03241
Warmup Train [17][560/3239]	Time 0.547 (0.536)	Data 0.001 (0.028)	Loss 4.5221 (4.7305)	Top-1 acc 21.875 (17.865)	Top-5 acc 42.578 (37.756)	lr 0.03240
Warmup Train [17][570/3239]	Time 0.316 (0.535)	Data 0.001 (0.027)	Loss 4.6522 (4.7307)	Top-1 acc 15.625 (17.842)	Top-5 acc 38.672 (37.744)	lr 0.03240
Warmup Train [17][580/3239]	Time 0.343 (0.535)	Data 0.001 (0.027)	Loss 4.9270 (4.7307)	Top-1 acc 15.625 (17.866)	Top-5 acc 33.984 (37.735)	lr 0.03239
Warmup Train [17][590/3239]	Time 0.636 (0.535)	Data 0.001 (0.027)	Loss 4.8807 (4.7312)	Top-1 acc 16.016 (17.867)	Top-5 acc 34.766 (37.724)	lr 0.03238
Warmup Train [17][600/3239]	Time 0.461 (0.534)	Data 0.001 (0.027)	Loss 4.9179 (4.7310)	Top-1 acc 13.672 (17.888)	Top-5 acc 32.812 (37.723)	lr 0.03238
Warmup Train [17][610/3239]	Time 0.444 (0.534)	Data 0.001 (0.026)	Loss 5.0482 (4.7308)	Top-1 acc 11.328 (17.893)	Top-5 acc 33.594 (37.722)	lr 0.03237
Warmup Train [17][620/3239]	Time 0.515 (0.534)	Data 0.001 (0.026)	Loss 4.7248 (4.7299)	Top-1 acc 16.406 (17.908)	Top-5 acc 34.766 (37.747)	lr 0.03237
Warmup Train [17][630/3239]	Time 0.524 (0.534)	Data 0.001 (0.026)	Loss 4.8000 (4.7296)	Top-1 acc 14.844 (17.907)	Top-5 acc 33.594 (37.735)	lr 0.03236
Warmup Train [17][640/3239]	Time 0.481 (0.533)	Data 0.001 (0.025)	Loss 4.6581 (4.7291)	Top-1 acc 18.750 (17.905)	Top-5 acc 40.234 (37.746)	lr 0.03236
Warmup Train [17][650/3239]	Time 0.554 (0.533)	Data 0.001 (0.025)	Loss 4.7413 (4.7288)	Top-1 acc 16.406 (17.905)	Top-5 acc 41.016 (37.751)	lr 0.03235
Warmup Train [17][660/3239]	Time 0.441 (0.532)	Data 0.001 (0.025)	Loss 4.9026 (4.7279)	Top-1 acc 15.625 (17.915)	Top-5 acc 34.375 (37.786)	lr 0.03234
Warmup Train [17][670/3239]	Time 0.574 (0.532)	Data 0.001 (0.025)	Loss 4.6854 (4.7277)	Top-1 acc 16.406 (17.908)	Top-5 acc 36.328 (37.780)	lr 0.03234
Warmup Train [17][680/3239]	Time 0.578 (0.531)	Data 0.001 (0.024)	Loss 4.6251 (4.7279)	Top-1 acc 19.141 (17.905)	Top-5 acc 38.672 (37.780)	lr 0.03233
Warmup Train [17][690/3239]	Time 0.419 (0.531)	Data 0.001 (0.024)	Loss 4.5399 (4.7270)	Top-1 acc 21.875 (17.918)	Top-5 acc 42.188 (37.810)	lr 0.03233
Warmup Train [17][700/3239]	Time 0.311 (0.530)	Data 0.001 (0.024)	Loss 4.7292 (4.7269)	Top-1 acc 16.016 (17.920)	Top-5 acc 35.938 (37.806)	lr 0.03232
Warmup Train [17][710/3239]	Time 0.519 (0.529)	Data 0.001 (0.024)	Loss 4.7231 (4.7276)	Top-1 acc 17.969 (17.902)	Top-5 acc 39.844 (37.790)	lr 0.03232
Warmup Train [17][720/3239]	Time 0.623 (0.529)	Data 0.001 (0.023)	Loss 4.6613 (4.7277)	Top-1 acc 17.969 (17.917)	Top-5 acc 40.625 (37.806)	lr 0.03231
Warmup Train [17][730/3239]	Time 0.300 (0.528)	Data 0.002 (0.023)	Loss 4.7335 (4.7275)	Top-1 acc 16.797 (17.925)	Top-5 acc 32.031 (37.817)	lr 0.03230
Warmup Train [17][740/3239]	Time 0.503 (0.528)	Data 0.022 (0.023)	Loss 4.9314 (4.7277)	Top-1 acc 13.672 (17.910)	Top-5 acc 35.547 (37.814)	lr 0.03230
Warmup Train [17][750/3239]	Time 0.684 (0.528)	Data 0.001 (0.023)	Loss 4.6152 (4.7270)	Top-1 acc 20.312 (17.921)	Top-5 acc 40.625 (37.843)	lr 0.03229
Warmup Train [17][760/3239]	Time 0.665 (0.528)	Data 0.001 (0.023)	Loss 4.7162 (4.7268)	Top-1 acc 19.141 (17.926)	Top-5 acc 37.500 (37.842)	lr 0.03229
Warmup Train [17][770/3239]	Time 0.549 (0.528)	Data 0.001 (0.022)	Loss 4.7482 (4.7276)	Top-1 acc 19.922 (17.918)	Top-5 acc 37.109 (37.817)	lr 0.03228
Warmup Train [17][780/3239]	Time 0.578 (0.527)	Data 0.001 (0.022)	Loss 4.5711 (4.7271)	Top-1 acc 19.531 (17.916)	Top-5 acc 42.969 (37.820)	lr 0.03227
Warmup Train [17][790/3239]	Time 0.601 (0.527)	Data 0.001 (0.022)	Loss 4.7224 (4.7273)	Top-1 acc 23.438 (17.930)	Top-5 acc 40.234 (37.820)	lr 0.03227
Warmup Train [17][800/3239]	Time 0.474 (0.527)	Data 0.001 (0.022)	Loss 4.6711 (4.7272)	Top-1 acc 19.141 (17.928)	Top-5 acc 38.672 (37.816)	lr 0.03226
Warmup Train [17][810/3239]	Time 0.591 (0.527)	Data 0.001 (0.022)	Loss 4.7621 (4.7279)	Top-1 acc 17.578 (17.917)	Top-5 acc 40.234 (37.797)	lr 0.03226
Warmup Train [17][820/3239]	Time 0.438 (0.527)	Data 0.001 (0.021)	Loss 4.7846 (4.7277)	Top-1 acc 13.672 (17.907)	Top-5 acc 33.984 (37.797)	lr 0.03225
Warmup Train [17][830/3239]	Time 0.709 (0.526)	Data 0.001 (0.021)	Loss 4.6697 (4.7275)	Top-1 acc 19.922 (17.916)	Top-5 acc 39.453 (37.813)	lr 0.03225
Warmup Train [17][840/3239]	Time 0.538 (0.526)	Data 0.001 (0.021)	Loss 4.6401 (4.7273)	Top-1 acc 18.359 (17.920)	Top-5 acc 41.406 (37.813)	lr 0.03224
Warmup Train [17][850/3239]	Time 0.523 (0.526)	Data 0.001 (0.021)	Loss 4.8437 (4.7273)	Top-1 acc 17.188 (17.914)	Top-5 acc 32.031 (37.799)	lr 0.03223
Warmup Train [17][860/3239]	Time 0.498 (0.526)	Data 0.001 (0.020)	Loss 4.8150 (4.7277)	Top-1 acc 17.188 (17.915)	Top-5 acc 37.500 (37.790)	lr 0.03223
Warmup Train [17][870/3239]	Time 0.605 (0.526)	Data 0.001 (0.020)	Loss 4.8955 (4.7279)	Top-1 acc 14.844 (17.915)	Top-5 acc 35.156 (37.793)	lr 0.03222
Warmup Train [17][880/3239]	Time 0.394 (0.526)	Data 0.001 (0.020)	Loss 4.7593 (4.7276)	Top-1 acc 14.453 (17.925)	Top-5 acc 37.500 (37.803)	lr 0.03222
Warmup Train [17][890/3239]	Time 0.486 (0.526)	Data 0.001 (0.020)	Loss 4.6164 (4.7277)	Top-1 acc 21.484 (17.924)	Top-5 acc 38.281 (37.796)	lr 0.03221
Warmup Train [17][900/3239]	Time 0.458 (0.525)	Data 0.001 (0.020)	Loss 4.7757 (4.7280)	Top-1 acc 17.188 (17.920)	Top-5 acc 37.109 (37.783)	lr 0.03220
Warmup Train [17][910/3239]	Time 0.511 (0.525)	Data 0.001 (0.020)	Loss 4.5864 (4.7276)	Top-1 acc 16.797 (17.925)	Top-5 acc 41.406 (37.787)	lr 0.03220
Warmup Train [17][920/3239]	Time 0.549 (0.525)	Data 0.001 (0.019)	Loss 4.5948 (4.7272)	Top-1 acc 19.922 (17.922)	Top-5 acc 40.234 (37.781)	lr 0.03219
Warmup Train [17][930/3239]	Time 0.682 (0.525)	Data 0.001 (0.019)	Loss 4.9203 (4.7272)	Top-1 acc 17.578 (17.915)	Top-5 acc 31.641 (37.781)	lr 0.03219
Warmup Train [17][940/3239]	Time 0.550 (0.525)	Data 0.001 (0.019)	Loss 4.7722 (4.7275)	Top-1 acc 16.797 (17.913)	Top-5 acc 38.672 (37.769)	lr 0.03218
Warmup Train [17][950/3239]	Time 0.384 (0.525)	Data 0.002 (0.019)	Loss 4.5413 (4.7273)	Top-1 acc 21.875 (17.924)	Top-5 acc 45.312 (37.795)	lr 0.03218
Warmup Train [17][960/3239]	Time 0.471 (0.524)	Data 0.001 (0.019)	Loss 4.9365 (4.7276)	Top-1 acc 10.938 (17.914)	Top-5 acc 34.375 (37.787)	lr 0.03217
Warmup Train [17][970/3239]	Time 0.724 (0.524)	Data 0.001 (0.019)	Loss 4.5953 (4.7269)	Top-1 acc 19.531 (17.927)	Top-5 acc 42.188 (37.809)	lr 0.03216
Warmup Train [17][980/3239]	Time 0.259 (0.523)	Data 0.001 (0.019)	Loss 4.8169 (4.7271)	Top-1 acc 14.453 (17.919)	Top-5 acc 35.938 (37.801)	lr 0.03216
Warmup Train [17][990/3239]	Time 0.554 (0.523)	Data 0.001 (0.019)	Loss 4.7583 (4.7270)	Top-1 acc 17.188 (17.928)	Top-5 acc 34.766 (37.799)	lr 0.03215
Warmup Train [17][1000/3239]	Time 0.573 (0.523)	Data 0.001 (0.019)	Loss 4.9037 (4.7269)	Top-1 acc 15.234 (17.929)	Top-5 acc 32.031 (37.799)	lr 0.03215
Warmup Train [17][1010/3239]	Time 0.564 (0.523)	Data 0.001 (0.018)	Loss 4.7145 (4.7267)	Top-1 acc 20.703 (17.941)	Top-5 acc 39.844 (37.813)	lr 0.03214
Warmup Train [17][1020/3239]	Time 0.600 (0.523)	Data 0.002 (0.018)	Loss 4.7592 (4.7264)	Top-1 acc 19.531 (17.955)	Top-5 acc 34.766 (37.820)	lr 0.03214
Warmup Train [17][1030/3239]	Time 0.544 (0.523)	Data 0.001 (0.018)	Loss 4.5549 (4.7259)	Top-1 acc 21.875 (17.964)	Top-5 acc 44.531 (37.843)	lr 0.03213
Warmup Train [17][1040/3239]	Time 0.519 (0.523)	Data 0.001 (0.018)	Loss 4.6576 (4.7255)	Top-1 acc 20.703 (17.971)	Top-5 acc 41.797 (37.859)	lr 0.03212
Warmup Train [17][1050/3239]	Time 0.524 (0.523)	Data 0.001 (0.018)	Loss 4.6399 (4.7253)	Top-1 acc 22.266 (17.977)	Top-5 acc 44.141 (37.860)	lr 0.03212
Warmup Train [17][1060/3239]	Time 0.608 (0.522)	Data 0.001 (0.018)	Loss 4.6685 (4.7252)	Top-1 acc 15.234 (17.974)	Top-5 acc 39.844 (37.862)	lr 0.03211
Warmup Train [17][1070/3239]	Time 0.476 (0.522)	Data 0.001 (0.018)	Loss 4.6142 (4.7253)	Top-1 acc 22.266 (17.973)	Top-5 acc 37.500 (37.861)	lr 0.03211
Warmup Train [17][1080/3239]	Time 0.447 (0.522)	Data 0.022 (0.018)	Loss 4.6459 (4.7250)	Top-1 acc 21.875 (17.990)	Top-5 acc 38.672 (37.874)	lr 0.03210
Warmup Train [17][1090/3239]	Time 0.495 (0.522)	Data 0.001 (0.017)	Loss 4.8124 (4.7247)	Top-1 acc 19.922 (17.993)	Top-5 acc 38.281 (37.880)	lr 0.03209
Warmup Train [17][1100/3239]	Time 0.428 (0.522)	Data 0.001 (0.017)	Loss 4.5720 (4.7246)	Top-1 acc 20.703 (17.994)	Top-5 acc 39.453 (37.885)	lr 0.03209
Warmup Train [17][1110/3239]	Time 0.360 (0.522)	Data 0.001 (0.017)	Loss 4.4761 (4.7245)	Top-1 acc 21.875 (17.992)	Top-5 acc 46.094 (37.881)	lr 0.03208
Warmup Train [17][1120/3239]	Time 0.464 (0.522)	Data 0.001 (0.017)	Loss 4.7682 (4.7243)	Top-1 acc 16.016 (17.997)	Top-5 acc 40.234 (37.889)	lr 0.03208
Warmup Train [17][1130/3239]	Time 0.479 (0.522)	Data 0.001 (0.017)	Loss 4.5531 (4.7239)	Top-1 acc 23.047 (18.009)	Top-5 acc 42.578 (37.902)	lr 0.03207
Warmup Train [17][1140/3239]	Time 0.491 (0.522)	Data 0.001 (0.017)	Loss 4.7693 (4.7238)	Top-1 acc 20.312 (18.016)	Top-5 acc 40.234 (37.905)	lr 0.03207
Warmup Train [17][1150/3239]	Time 0.509 (0.522)	Data 0.001 (0.017)	Loss 4.4988 (4.7231)	Top-1 acc 19.922 (18.025)	Top-5 acc 41.016 (37.915)	lr 0.03206
Warmup Train [17][1160/3239]	Time 0.558 (0.522)	Data 0.001 (0.017)	Loss 4.6480 (4.7229)	Top-1 acc 19.922 (18.030)	Top-5 acc 37.891 (37.915)	lr 0.03205
Warmup Train [17][1170/3239]	Time 0.423 (0.522)	Data 0.001 (0.017)	Loss 4.8880 (4.7229)	Top-1 acc 13.672 (18.023)	Top-5 acc 33.203 (37.902)	lr 0.03205
Warmup Train [17][1180/3239]	Time 0.545 (0.522)	Data 0.001 (0.017)	Loss 4.5604 (4.7231)	Top-1 acc 21.094 (18.015)	Top-5 acc 42.578 (37.892)	lr 0.03204
Warmup Train [17][1190/3239]	Time 0.370 (0.522)	Data 0.001 (0.017)	Loss 4.7641 (4.7232)	Top-1 acc 14.453 (18.005)	Top-5 acc 38.281 (37.892)	lr 0.03204
Warmup Train [17][1200/3239]	Time 0.379 (0.522)	Data 0.001 (0.017)	Loss 4.7379 (4.7233)	Top-1 acc 17.578 (18.008)	Top-5 acc 38.672 (37.902)	lr 0.03203
Warmup Train [17][1210/3239]	Time 0.458 (0.522)	Data 0.001 (0.017)	Loss 4.6858 (4.7234)	Top-1 acc 18.750 (18.007)	Top-5 acc 37.500 (37.899)	lr 0.03202
Warmup Train [17][1220/3239]	Time 0.489 (0.522)	Data 0.001 (0.017)	Loss 4.5326 (4.7235)	Top-1 acc 19.531 (18.005)	Top-5 acc 39.844 (37.900)	lr 0.03202
Warmup Train [17][1230/3239]	Time 0.507 (0.522)	Data 0.001 (0.017)	Loss 4.8043 (4.7231)	Top-1 acc 19.141 (18.015)	Top-5 acc 37.891 (37.913)	lr 0.03201
Warmup Train [17][1240/3239]	Time 0.336 (0.521)	Data 0.001 (0.016)	Loss 4.7509 (4.7229)	Top-1 acc 18.359 (18.016)	Top-5 acc 37.891 (37.911)	lr 0.03201
Warmup Train [17][1250/3239]	Time 0.349 (0.521)	Data 0.001 (0.016)	Loss 4.6224 (4.7223)	Top-1 acc 20.703 (18.021)	Top-5 acc 38.672 (37.927)	lr 0.03200
Warmup Train [17][1260/3239]	Time 0.537 (0.521)	Data 0.001 (0.016)	Loss 4.7345 (4.7223)	Top-1 acc 18.359 (18.020)	Top-5 acc 37.891 (37.926)	lr 0.03200
Warmup Train [17][1270/3239]	Time 0.529 (0.520)	Data 0.001 (0.016)	Loss 4.8482 (4.7223)	Top-1 acc 15.625 (18.023)	Top-5 acc 37.500 (37.932)	lr 0.03199
Warmup Train [17][1280/3239]	Time 0.645 (0.520)	Data 0.001 (0.016)	Loss 4.6181 (4.7223)	Top-1 acc 21.484 (18.021)	Top-5 acc 43.359 (37.932)	lr 0.03198
Warmup Train [17][1290/3239]	Time 0.395 (0.520)	Data 0.001 (0.016)	Loss 4.7472 (4.7227)	Top-1 acc 15.625 (18.010)	Top-5 acc 37.109 (37.927)	lr 0.03198
Warmup Train [17][1300/3239]	Time 0.471 (0.520)	Data 0.001 (0.016)	Loss 4.8433 (4.7228)	Top-1 acc 15.625 (18.004)	Top-5 acc 34.766 (37.929)	lr 0.03197
Warmup Train [17][1310/3239]	Time 0.535 (0.520)	Data 0.001 (0.016)	Loss 4.6264 (4.7227)	Top-1 acc 20.312 (18.006)	Top-5 acc 41.016 (37.931)	lr 0.03197
Warmup Train [17][1320/3239]	Time 0.384 (0.520)	Data 0.001 (0.016)	Loss 4.7554 (4.7226)	Top-1 acc 17.188 (17.999)	Top-5 acc 38.672 (37.935)	lr 0.03196
Warmup Train [17][1330/3239]	Time 0.553 (0.520)	Data 0.001 (0.016)	Loss 4.7589 (4.7226)	Top-1 acc 16.797 (17.997)	Top-5 acc 37.109 (37.936)	lr 0.03195
Warmup Train [17][1340/3239]	Time 0.572 (0.520)	Data 0.001 (0.016)	Loss 4.8961 (4.7226)	Top-1 acc 14.062 (17.991)	Top-5 acc 31.250 (37.935)	lr 0.03195
Warmup Train [17][1350/3239]	Time 0.540 (0.520)	Data 0.001 (0.016)	Loss 4.7277 (4.7225)	Top-1 acc 17.969 (17.995)	Top-5 acc 39.062 (37.935)	lr 0.03194
Warmup Train [17][1360/3239]	Time 0.531 (0.520)	Data 0.001 (0.016)	Loss 4.6844 (4.7228)	Top-1 acc 15.625 (17.990)	Top-5 acc 37.891 (37.930)	lr 0.03194
Warmup Train [17][1370/3239]	Time 0.592 (0.520)	Data 0.001 (0.016)	Loss 4.6396 (4.7226)	Top-1 acc 16.406 (17.981)	Top-5 acc 39.062 (37.928)	lr 0.03193
Warmup Train [17][1380/3239]	Time 0.576 (0.519)	Data 0.001 (0.016)	Loss 4.5862 (4.7226)	Top-1 acc 19.531 (17.979)	Top-5 acc 42.969 (37.934)	lr 0.03193
Warmup Train [17][1390/3239]	Time 0.597 (0.519)	Data 0.001 (0.015)	Loss 4.9009 (4.7224)	Top-1 acc 16.016 (17.983)	Top-5 acc 35.938 (37.943)	lr 0.03192
Warmup Train [17][1400/3239]	Time 0.638 (0.519)	Data 0.001 (0.015)	Loss 4.7627 (4.7225)	Top-1 acc 17.969 (17.988)	Top-5 acc 37.109 (37.948)	lr 0.03191
Warmup Train [17][1410/3239]	Time 0.532 (0.520)	Data 0.001 (0.015)	Loss 4.7323 (4.7223)	Top-1 acc 16.797 (17.989)	Top-5 acc 39.453 (37.962)	lr 0.03191
Warmup Train [17][1420/3239]	Time 0.551 (0.520)	Data 0.001 (0.015)	Loss 4.4550 (4.7218)	Top-1 acc 22.656 (17.993)	Top-5 acc 44.531 (37.973)	lr 0.03190
Warmup Train [17][1430/3239]	Time 0.448 (0.519)	Data 0.001 (0.015)	Loss 4.7240 (4.7215)	Top-1 acc 20.312 (17.998)	Top-5 acc 36.328 (37.982)	lr 0.03190
Warmup Train [17][1440/3239]	Time 0.645 (0.520)	Data 0.001 (0.015)	Loss 4.6259 (4.7212)	Top-1 acc 18.750 (18.002)	Top-5 acc 41.406 (37.983)	lr 0.03189
Warmup Train [17][1450/3239]	Time 0.589 (0.519)	Data 0.001 (0.015)	Loss 4.7684 (4.7215)	Top-1 acc 17.188 (17.994)	Top-5 acc 34.766 (37.978)	lr 0.03189
Warmup Train [17][1460/3239]	Time 0.547 (0.519)	Data 0.001 (0.015)	Loss 4.6873 (4.7212)	Top-1 acc 18.359 (17.997)	Top-5 acc 39.453 (37.988)	lr 0.03188
Warmup Train [17][1470/3239]	Time 0.605 (0.519)	Data 0.001 (0.015)	Loss 4.7751 (4.7213)	Top-1 acc 16.016 (18.001)	Top-5 acc 39.062 (37.988)	lr 0.03187
Warmup Train [17][1480/3239]	Time 0.603 (0.519)	Data 0.001 (0.015)	Loss 4.7236 (4.7210)	Top-1 acc 17.969 (18.002)	Top-5 acc 38.281 (37.997)	lr 0.03187
Warmup Train [17][1490/3239]	Time 0.365 (0.519)	Data 0.002 (0.015)	Loss 4.8794 (4.7210)	Top-1 acc 14.453 (18.006)	Top-5 acc 33.203 (37.993)	lr 0.03186
Warmup Train [17][1500/3239]	Time 0.402 (0.519)	Data 0.001 (0.015)	Loss 4.6843 (4.7210)	Top-1 acc 19.922 (18.002)	Top-5 acc 36.719 (37.989)	lr 0.03186
Warmup Train [17][1510/3239]	Time 0.608 (0.519)	Data 0.001 (0.015)	Loss 4.7700 (4.7212)	Top-1 acc 18.750 (18.000)	Top-5 acc 38.672 (37.982)	lr 0.03185
Warmup Train [17][1520/3239]	Time 0.340 (0.518)	Data 0.001 (0.015)	Loss 4.6756 (4.7213)	Top-1 acc 18.750 (17.999)	Top-5 acc 39.062 (37.982)	lr 0.03184
Warmup Train [17][1530/3239]	Time 0.383 (0.518)	Data 0.001 (0.015)	Loss 4.7916 (4.7216)	Top-1 acc 19.531 (18.000)	Top-5 acc 38.281 (37.972)	lr 0.03184
Warmup Train [17][1540/3239]	Time 0.616 (0.518)	Data 0.001 (0.015)	Loss 4.5317 (4.7218)	Top-1 acc 22.266 (17.993)	Top-5 acc 42.969 (37.971)	lr 0.03183
Warmup Train [17][1550/3239]	Time 0.501 (0.518)	Data 0.002 (0.014)	Loss 4.6976 (4.7216)	Top-1 acc 17.188 (17.998)	Top-5 acc 37.500 (37.975)	lr 0.03183
Warmup Train [17][1560/3239]	Time 0.613 (0.518)	Data 0.001 (0.014)	Loss 4.5690 (4.7214)	Top-1 acc 19.531 (18.003)	Top-5 acc 39.844 (37.983)	lr 0.03182
Warmup Train [17][1570/3239]	Time 0.499 (0.518)	Data 0.001 (0.014)	Loss 4.7597 (4.7215)	Top-1 acc 16.406 (18.000)	Top-5 acc 36.328 (37.973)	lr 0.03182
Warmup Train [17][1580/3239]	Time 0.609 (0.518)	Data 0.001 (0.014)	Loss 4.8037 (4.7216)	Top-1 acc 17.578 (18.000)	Top-5 acc 35.938 (37.972)	lr 0.03181
Warmup Train [17][1590/3239]	Time 0.616 (0.518)	Data 0.001 (0.014)	Loss 4.7255 (4.7214)	Top-1 acc 19.531 (18.006)	Top-5 acc 36.719 (37.976)	lr 0.03180
Warmup Train [17][1600/3239]	Time 0.647 (0.518)	Data 0.001 (0.014)	Loss 4.7209 (4.7212)	Top-1 acc 15.234 (18.010)	Top-5 acc 33.984 (37.984)	lr 0.03180
Warmup Train [17][1610/3239]	Time 0.343 (0.518)	Data 0.001 (0.014)	Loss 4.5698 (4.7208)	Top-1 acc 19.531 (18.015)	Top-5 acc 39.062 (37.990)	lr 0.03179
Warmup Train [17][1620/3239]	Time 0.534 (0.518)	Data 0.001 (0.014)	Loss 4.8031 (4.7207)	Top-1 acc 20.312 (18.022)	Top-5 acc 35.938 (37.983)	lr 0.03179
Warmup Train [17][1630/3239]	Time 0.558 (0.518)	Data 0.001 (0.014)	Loss 4.5004 (4.7206)	Top-1 acc 28.125 (18.027)	Top-5 acc 48.828 (37.989)	lr 0.03178
Warmup Train [17][1640/3239]	Time 0.512 (0.518)	Data 0.001 (0.014)	Loss 4.7636 (4.7206)	Top-1 acc 16.797 (18.024)	Top-5 acc 36.328 (37.980)	lr 0.03177
Warmup Train [17][1650/3239]	Time 0.439 (0.518)	Data 0.001 (0.014)	Loss 4.6353 (4.7206)	Top-1 acc 19.141 (18.024)	Top-5 acc 40.234 (37.982)	lr 0.03177
Warmup Train [17][1660/3239]	Time 0.595 (0.518)	Data 0.001 (0.014)	Loss 4.7006 (4.7205)	Top-1 acc 17.578 (18.024)	Top-5 acc 37.109 (37.981)	lr 0.03176
Warmup Train [17][1670/3239]	Time 0.483 (0.518)	Data 0.001 (0.014)	Loss 4.8412 (4.7207)	Top-1 acc 14.844 (18.022)	Top-5 acc 32.812 (37.976)	lr 0.03176
Warmup Train [17][1680/3239]	Time 0.694 (0.518)	Data 0.001 (0.014)	Loss 4.6857 (4.7211)	Top-1 acc 21.484 (18.019)	Top-5 acc 38.281 (37.969)	lr 0.03175
Warmup Train [17][1690/3239]	Time 0.465 (0.518)	Data 0.001 (0.014)	Loss 4.6968 (4.7211)	Top-1 acc 16.406 (18.018)	Top-5 acc 36.719 (37.957)	lr 0.03175
Warmup Train [17][1700/3239]	Time 0.580 (0.518)	Data 0.001 (0.014)	Loss 4.7589 (4.7209)	Top-1 acc 16.797 (18.025)	Top-5 acc 35.156 (37.964)	lr 0.03174
Warmup Train [17][1710/3239]	Time 0.603 (0.518)	Data 0.001 (0.014)	Loss 4.7219 (4.7210)	Top-1 acc 20.703 (18.026)	Top-5 acc 39.062 (37.960)	lr 0.03173
Warmup Train [17][1720/3239]	Time 0.448 (0.518)	Data 0.001 (0.014)	Loss 4.6363 (4.7212)	Top-1 acc 17.969 (18.026)	Top-5 acc 41.406 (37.954)	lr 0.03173
Warmup Train [17][1730/3239]	Time 0.354 (0.518)	Data 0.001 (0.014)	Loss 4.7336 (4.7210)	Top-1 acc 16.406 (18.029)	Top-5 acc 36.719 (37.957)	lr 0.03172
Warmup Train [17][1740/3239]	Time 0.531 (0.518)	Data 0.001 (0.014)	Loss 4.7890 (4.7208)	Top-1 acc 19.141 (18.032)	Top-5 acc 36.719 (37.963)	lr 0.03172
Warmup Train [17][1750/3239]	Time 0.468 (0.518)	Data 0.001 (0.014)	Loss 4.7905 (4.7208)	Top-1 acc 18.359 (18.035)	Top-5 acc 37.500 (37.966)	lr 0.03171
Warmup Train [17][1760/3239]	Time 0.456 (0.518)	Data 0.005 (0.014)	Loss 4.8186 (4.7209)	Top-1 acc 16.406 (18.034)	Top-5 acc 37.500 (37.967)	lr 0.03170
Warmup Train [17][1770/3239]	Time 0.554 (0.518)	Data 0.002 (0.014)	Loss 4.5591 (4.7209)	Top-1 acc 18.359 (18.035)	Top-5 acc 43.750 (37.965)	lr 0.03170
Warmup Train [17][1780/3239]	Time 0.491 (0.517)	Data 0.001 (0.014)	Loss 4.7970 (4.7210)	Top-1 acc 14.453 (18.033)	Top-5 acc 37.109 (37.970)	lr 0.03169
Warmup Train [17][1790/3239]	Time 0.422 (0.517)	Data 0.001 (0.013)	Loss 4.5473 (4.7207)	Top-1 acc 21.875 (18.036)	Top-5 acc 42.578 (37.980)	lr 0.03169
Warmup Train [17][1800/3239]	Time 0.559 (0.517)	Data 0.001 (0.013)	Loss 4.7766 (4.7208)	Top-1 acc 14.062 (18.036)	Top-5 acc 37.109 (37.986)	lr 0.03168
Warmup Train [17][1810/3239]	Time 0.478 (0.517)	Data 0.001 (0.013)	Loss 4.8664 (4.7204)	Top-1 acc 15.234 (18.040)	Top-5 acc 35.547 (37.999)	lr 0.03168
Warmup Train [17][1820/3239]	Time 0.481 (0.517)	Data 0.002 (0.013)	Loss 4.6100 (4.7205)	Top-1 acc 21.094 (18.040)	Top-5 acc 43.359 (38.002)	lr 0.03167
Warmup Train [17][1830/3239]	Time 0.582 (0.517)	Data 0.001 (0.013)	Loss 4.8077 (4.7204)	Top-1 acc 17.188 (18.038)	Top-5 acc 35.938 (38.002)	lr 0.03166
Warmup Train [17][1840/3239]	Time 0.561 (0.517)	Data 0.001 (0.013)	Loss 4.8559 (4.7205)	Top-1 acc 16.797 (18.036)	Top-5 acc 31.641 (37.998)	lr 0.03166
Warmup Train [17][1850/3239]	Time 0.590 (0.517)	Data 0.001 (0.013)	Loss 4.6864 (4.7205)	Top-1 acc 21.094 (18.038)	Top-5 acc 40.625 (37.996)	lr 0.03165
Warmup Train [17][1860/3239]	Time 0.571 (0.517)	Data 0.001 (0.013)	Loss 4.6346 (4.7206)	Top-1 acc 16.797 (18.032)	Top-5 acc 42.578 (37.991)	lr 0.03165
Warmup Train [17][1870/3239]	Time 0.447 (0.517)	Data 0.001 (0.013)	Loss 4.6276 (4.7206)	Top-1 acc 17.188 (18.031)	Top-5 acc 41.016 (37.992)	lr 0.03164
Warmup Train [17][1880/3239]	Time 0.419 (0.517)	Data 0.001 (0.013)	Loss 4.6390 (4.7205)	Top-1 acc 22.656 (18.033)	Top-5 acc 42.969 (37.994)	lr 0.03163
Warmup Train [17][1890/3239]	Time 0.575 (0.517)	Data 0.001 (0.013)	Loss 4.6398 (4.7203)	Top-1 acc 22.266 (18.040)	Top-5 acc 41.797 (37.999)	lr 0.03163
Warmup Train [17][1900/3239]	Time 0.468 (0.517)	Data 0.001 (0.013)	Loss 4.7893 (4.7200)	Top-1 acc 16.797 (18.041)	Top-5 acc 37.109 (38.006)	lr 0.03162
Warmup Train [17][1910/3239]	Time 0.602 (0.517)	Data 0.001 (0.013)	Loss 4.7239 (4.7198)	Top-1 acc 16.797 (18.046)	Top-5 acc 39.062 (38.013)	lr 0.03162
Warmup Train [17][1920/3239]	Time 0.510 (0.517)	Data 0.001 (0.013)	Loss 4.9316 (4.7199)	Top-1 acc 12.891 (18.044)	Top-5 acc 32.812 (38.013)	lr 0.03161
Warmup Train [17][1930/3239]	Time 0.444 (0.517)	Data 0.001 (0.013)	Loss 4.6623 (4.7196)	Top-1 acc 18.750 (18.049)	Top-5 acc 39.844 (38.025)	lr 0.03161
Warmup Train [17][1940/3239]	Time 0.562 (0.517)	Data 0.001 (0.013)	Loss 4.7699 (4.7192)	Top-1 acc 17.578 (18.053)	Top-5 acc 37.500 (38.031)	lr 0.03160
Warmup Train [17][1950/3239]	Time 0.409 (0.517)	Data 0.001 (0.013)	Loss 4.7158 (4.7190)	Top-1 acc 16.406 (18.051)	Top-5 acc 39.062 (38.034)	lr 0.03159
Warmup Train [17][1960/3239]	Time 0.649 (0.517)	Data 0.001 (0.013)	Loss 4.6456 (4.7190)	Top-1 acc 21.094 (18.054)	Top-5 acc 42.188 (38.028)	lr 0.03159
Warmup Train [17][1970/3239]	Time 0.564 (0.517)	Data 0.001 (0.013)	Loss 4.5112 (4.7189)	Top-1 acc 20.312 (18.052)	Top-5 acc 43.750 (38.036)	lr 0.03158
Warmup Train [17][1980/3239]	Time 0.573 (0.517)	Data 0.001 (0.013)	Loss 4.8414 (4.7189)	Top-1 acc 18.750 (18.060)	Top-5 acc 38.672 (38.043)	lr 0.03158
Warmup Train [17][1990/3239]	Time 0.490 (0.517)	Data 0.001 (0.013)	Loss 4.9128 (4.7190)	Top-1 acc 16.016 (18.063)	Top-5 acc 32.031 (38.039)	lr 0.03157
Warmup Train [17][2000/3239]	Time 0.504 (0.517)	Data 0.001 (0.013)	Loss 4.6696 (4.7190)	Top-1 acc 18.750 (18.063)	Top-5 acc 37.500 (38.040)	lr 0.03156
Warmup Train [17][2010/3239]	Time 0.383 (0.517)	Data 0.001 (0.013)	Loss 4.7842 (4.7191)	Top-1 acc 18.750 (18.066)	Top-5 acc 37.109 (38.035)	lr 0.03156
Warmup Train [17][2020/3239]	Time 0.487 (0.517)	Data 0.001 (0.013)	Loss 4.7291 (4.7191)	Top-1 acc 14.062 (18.065)	Top-5 acc 35.547 (38.036)	lr 0.03155
Warmup Train [17][2030/3239]	Time 0.493 (0.517)	Data 0.001 (0.013)	Loss 4.6969 (4.7191)	Top-1 acc 15.625 (18.062)	Top-5 acc 37.109 (38.031)	lr 0.03155
Warmup Train [17][2040/3239]	Time 0.553 (0.517)	Data 0.001 (0.013)	Loss 4.8107 (4.7192)	Top-1 acc 17.188 (18.060)	Top-5 acc 37.500 (38.032)	lr 0.03154
Warmup Train [17][2050/3239]	Time 0.507 (0.517)	Data 0.001 (0.013)	Loss 4.7252 (4.7193)	Top-1 acc 18.359 (18.062)	Top-5 acc 37.500 (38.029)	lr 0.03153
Warmup Train [17][2060/3239]	Time 0.531 (0.517)	Data 0.001 (0.013)	Loss 4.8409 (4.7194)	Top-1 acc 20.312 (18.062)	Top-5 acc 35.547 (38.024)	lr 0.03153
Warmup Train [17][2070/3239]	Time 0.393 (0.517)	Data 0.001 (0.013)	Loss 4.6592 (4.7194)	Top-1 acc 19.922 (18.062)	Top-5 acc 39.453 (38.030)	lr 0.03152
Warmup Train [17][2080/3239]	Time 0.580 (0.517)	Data 0.001 (0.013)	Loss 4.7856 (4.7195)	Top-1 acc 18.750 (18.062)	Top-5 acc 37.891 (38.029)	lr 0.03152
Warmup Train [17][2090/3239]	Time 0.511 (0.517)	Data 0.002 (0.012)	Loss 4.6974 (4.7193)	Top-1 acc 19.922 (18.070)	Top-5 acc 39.453 (38.034)	lr 0.03151
Warmup Train [17][2100/3239]	Time 0.307 (0.517)	Data 0.001 (0.012)	Loss 4.6754 (4.7191)	Top-1 acc 18.750 (18.069)	Top-5 acc 38.281 (38.038)	lr 0.03151
Warmup Train [17][2110/3239]	Time 0.541 (0.517)	Data 0.001 (0.012)	Loss 4.5930 (4.7189)	Top-1 acc 17.578 (18.073)	Top-5 acc 40.625 (38.041)	lr 0.03150
Warmup Train [17][2120/3239]	Time 0.499 (0.517)	Data 0.001 (0.012)	Loss 4.6768 (4.7186)	Top-1 acc 20.312 (18.074)	Top-5 acc 37.109 (38.040)	lr 0.03149
Warmup Train [17][2130/3239]	Time 0.312 (0.517)	Data 0.002 (0.012)	Loss 4.6290 (4.7186)	Top-1 acc 19.922 (18.076)	Top-5 acc 37.109 (38.040)	lr 0.03149
Warmup Train [17][2140/3239]	Time 0.528 (0.517)	Data 0.001 (0.012)	Loss 4.6414 (4.7182)	Top-1 acc 19.531 (18.083)	Top-5 acc 40.625 (38.046)	lr 0.03148
Warmup Train [17][2150/3239]	Time 0.328 (0.517)	Data 0.001 (0.012)	Loss 4.6757 (4.7184)	Top-1 acc 14.844 (18.077)	Top-5 acc 39.844 (38.043)	lr 0.03148
Warmup Train [17][2160/3239]	Time 0.691 (0.517)	Data 0.001 (0.012)	Loss 4.7189 (4.7181)	Top-1 acc 18.750 (18.081)	Top-5 acc 36.328 (38.045)	lr 0.03147
Warmup Train [17][2170/3239]	Time 0.359 (0.517)	Data 0.001 (0.012)	Loss 4.8857 (4.7181)	Top-1 acc 17.188 (18.083)	Top-5 acc 37.500 (38.048)	lr 0.03146
Warmup Train [17][2180/3239]	Time 0.483 (0.517)	Data 0.001 (0.012)	Loss 4.5551 (4.7178)	Top-1 acc 19.922 (18.083)	Top-5 acc 39.062 (38.050)	lr 0.03146
Warmup Train [17][2190/3239]	Time 0.677 (0.517)	Data 0.001 (0.012)	Loss 4.7887 (4.7175)	Top-1 acc 19.141 (18.084)	Top-5 acc 37.109 (38.055)	lr 0.03145
Warmup Train [17][2200/3239]	Time 0.599 (0.517)	Data 0.001 (0.012)	Loss 4.7239 (4.7178)	Top-1 acc 18.750 (18.084)	Top-5 acc 37.109 (38.054)	lr 0.03145
Warmup Train [17][2210/3239]	Time 0.528 (0.517)	Data 0.001 (0.012)	Loss 4.7055 (4.7175)	Top-1 acc 17.578 (18.086)	Top-5 acc 38.281 (38.059)	lr 0.03144
Warmup Train [17][2220/3239]	Time 0.591 (0.517)	Data 0.001 (0.012)	Loss 4.7106 (4.7173)	Top-1 acc 16.406 (18.092)	Top-5 acc 39.062 (38.069)	lr 0.03144
Warmup Train [17][2230/3239]	Time 0.654 (0.517)	Data 0.001 (0.012)	Loss 4.6747 (4.7171)	Top-1 acc 16.406 (18.094)	Top-5 acc 39.453 (38.076)	lr 0.03143
Warmup Train [17][2240/3239]	Time 0.562 (0.517)	Data 0.001 (0.012)	Loss 4.8333 (4.7170)	Top-1 acc 13.672 (18.095)	Top-5 acc 34.766 (38.079)	lr 0.03142
Warmup Train [17][2250/3239]	Time 0.452 (0.517)	Data 0.001 (0.012)	Loss 4.6967 (4.7167)	Top-1 acc 17.188 (18.095)	Top-5 acc 39.062 (38.086)	lr 0.03142
Warmup Train [17][2260/3239]	Time 0.617 (0.517)	Data 0.001 (0.012)	Loss 4.6942 (4.7167)	Top-1 acc 16.797 (18.098)	Top-5 acc 39.453 (38.089)	lr 0.03141
Warmup Train [17][2270/3239]	Time 0.599 (0.517)	Data 0.001 (0.012)	Loss 4.5310 (4.7165)	Top-1 acc 22.266 (18.103)	Top-5 acc 41.406 (38.093)	lr 0.03141
Warmup Train [17][2280/3239]	Time 0.392 (0.517)	Data 0.001 (0.012)	Loss 4.5845 (4.7165)	Top-1 acc 20.312 (18.102)	Top-5 acc 40.234 (38.093)	lr 0.03140
Warmup Train [17][2290/3239]	Time 0.505 (0.517)	Data 0.001 (0.012)	Loss 4.7024 (4.7165)	Top-1 acc 21.484 (18.104)	Top-5 acc 37.109 (38.096)	lr 0.03139
Warmup Train [17][2300/3239]	Time 0.482 (0.517)	Data 0.001 (0.012)	Loss 4.6103 (4.7165)	Top-1 acc 18.750 (18.105)	Top-5 acc 39.453 (38.098)	lr 0.03139
Warmup Train [17][2310/3239]	Time 0.757 (0.517)	Data 0.001 (0.012)	Loss 4.7438 (4.7165)	Top-1 acc 16.016 (18.106)	Top-5 acc 35.938 (38.101)	lr 0.03138
Warmup Train [17][2320/3239]	Time 0.312 (0.516)	Data 0.001 (0.012)	Loss 4.8624 (4.7163)	Top-1 acc 13.281 (18.107)	Top-5 acc 33.984 (38.110)	lr 0.03138
Warmup Train [17][2330/3239]	Time 0.566 (0.516)	Data 0.001 (0.012)	Loss 4.4044 (4.7161)	Top-1 acc 22.656 (18.112)	Top-5 acc 44.531 (38.114)	lr 0.03137
Warmup Train [17][2340/3239]	Time 0.259 (0.516)	Data 0.001 (0.012)	Loss 4.7496 (4.7161)	Top-1 acc 19.141 (18.114)	Top-5 acc 37.891 (38.114)	lr 0.03137
Warmup Train [17][2350/3239]	Time 0.370 (0.516)	Data 0.001 (0.012)	Loss 4.8628 (4.7161)	Top-1 acc 15.234 (18.115)	Top-5 acc 33.594 (38.117)	lr 0.03136
Warmup Train [17][2360/3239]	Time 0.363 (0.516)	Data 0.001 (0.012)	Loss 4.6764 (4.7158)	Top-1 acc 17.578 (18.120)	Top-5 acc 37.891 (38.121)	lr 0.03135
Warmup Train [17][2370/3239]	Time 0.381 (0.516)	Data 0.001 (0.012)	Loss 4.6863 (4.7159)	Top-1 acc 18.750 (18.116)	Top-5 acc 36.328 (38.119)	lr 0.03135
Warmup Train [17][2380/3239]	Time 0.353 (0.516)	Data 0.001 (0.012)	Loss 4.6090 (4.7155)	Top-1 acc 21.094 (18.125)	Top-5 acc 37.500 (38.126)	lr 0.03134
Warmup Train [17][2390/3239]	Time 0.460 (0.516)	Data 0.001 (0.012)	Loss 4.6671 (4.7155)	Top-1 acc 16.797 (18.123)	Top-5 acc 39.844 (38.126)	lr 0.03134
Warmup Train [17][2400/3239]	Time 0.373 (0.516)	Data 0.001 (0.012)	Loss 4.7266 (4.7153)	Top-1 acc 19.141 (18.127)	Top-5 acc 40.625 (38.125)	lr 0.03133
Warmup Train [17][2410/3239]	Time 0.571 (0.516)	Data 0.001 (0.012)	Loss 4.7135 (4.7154)	Top-1 acc 21.094 (18.126)	Top-5 acc 41.016 (38.125)	lr 0.03132
Warmup Train [17][2420/3239]	Time 0.476 (0.516)	Data 0.001 (0.012)	Loss 4.5657 (4.7152)	Top-1 acc 15.234 (18.126)	Top-5 acc 41.016 (38.130)	lr 0.03132
Warmup Train [17][2430/3239]	Time 0.551 (0.516)	Data 0.001 (0.012)	Loss 4.6919 (4.7150)	Top-1 acc 21.484 (18.132)	Top-5 acc 39.844 (38.136)	lr 0.03131
Warmup Train [17][2440/3239]	Time 0.470 (0.516)	Data 0.001 (0.012)	Loss 4.7990 (4.7150)	Top-1 acc 19.141 (18.135)	Top-5 acc 37.891 (38.142)	lr 0.03131
Warmup Train [17][2450/3239]	Time 0.479 (0.516)	Data 0.001 (0.012)	Loss 4.7383 (4.7150)	Top-1 acc 16.016 (18.136)	Top-5 acc 36.328 (38.137)	lr 0.03130
Warmup Train [17][2460/3239]	Time 0.433 (0.516)	Data 0.001 (0.012)	Loss 4.7300 (4.7152)	Top-1 acc 18.750 (18.142)	Top-5 acc 39.062 (38.136)	lr 0.03129
Warmup Train [17][2470/3239]	Time 0.594 (0.516)	Data 0.001 (0.012)	Loss 4.6128 (4.7149)	Top-1 acc 18.359 (18.147)	Top-5 acc 39.844 (38.141)	lr 0.03129
Warmup Train [17][2480/3239]	Time 0.589 (0.516)	Data 0.002 (0.012)	Loss 4.6914 (4.7149)	Top-1 acc 18.359 (18.143)	Top-5 acc 39.062 (38.135)	lr 0.03128
Warmup Train [17][2490/3239]	Time 0.595 (0.516)	Data 0.001 (0.012)	Loss 4.5964 (4.7147)	Top-1 acc 23.047 (18.147)	Top-5 acc 42.188 (38.137)	lr 0.03128
Warmup Train [17][2500/3239]	Time 0.583 (0.516)	Data 0.001 (0.012)	Loss 4.6344 (4.7145)	Top-1 acc 18.359 (18.146)	Top-5 acc 39.844 (38.139)	lr 0.03127
Warmup Train [17][2510/3239]	Time 0.548 (0.516)	Data 0.001 (0.012)	Loss 4.6221 (4.7143)	Top-1 acc 22.266 (18.151)	Top-5 acc 42.578 (38.144)	lr 0.03127
Warmup Train [17][2520/3239]	Time 0.476 (0.516)	Data 0.001 (0.012)	Loss 4.6424 (4.7141)	Top-1 acc 17.969 (18.155)	Top-5 acc 41.797 (38.150)	lr 0.03126
Warmup Train [17][2530/3239]	Time 0.425 (0.516)	Data 0.001 (0.012)	Loss 4.5785 (4.7139)	Top-1 acc 15.234 (18.158)	Top-5 acc 34.766 (38.151)	lr 0.03125
Warmup Train [17][2540/3239]	Time 0.389 (0.516)	Data 0.001 (0.012)	Loss 4.6391 (4.7137)	Top-1 acc 18.359 (18.158)	Top-5 acc 38.672 (38.150)	lr 0.03125
Warmup Train [17][2550/3239]	Time 0.516 (0.516)	Data 0.001 (0.012)	Loss 4.8188 (4.7137)	Top-1 acc 13.672 (18.156)	Top-5 acc 39.453 (38.149)	lr 0.03124
Warmup Train [17][2560/3239]	Time 0.563 (0.516)	Data 0.001 (0.012)	Loss 4.8450 (4.7137)	Top-1 acc 17.578 (18.155)	Top-5 acc 35.156 (38.151)	lr 0.03124
Warmup Train [17][2570/3239]	Time 0.373 (0.516)	Data 0.001 (0.012)	Loss 4.8314 (4.7138)	Top-1 acc 17.969 (18.154)	Top-5 acc 38.672 (38.152)	lr 0.03123
Warmup Train [17][2580/3239]	Time 0.490 (0.516)	Data 0.001 (0.012)	Loss 4.6869 (4.7139)	Top-1 acc 16.797 (18.153)	Top-5 acc 39.844 (38.150)	lr 0.03122
Warmup Train [17][2590/3239]	Time 0.413 (0.516)	Data 0.001 (0.012)	Loss 4.7525 (4.7139)	Top-1 acc 19.531 (18.156)	Top-5 acc 38.281 (38.151)	lr 0.03122
Warmup Train [17][2600/3239]	Time 0.705 (0.516)	Data 0.001 (0.012)	Loss 4.7714 (4.7140)	Top-1 acc 15.625 (18.155)	Top-5 acc 37.891 (38.150)	lr 0.03121
Warmup Train [17][2610/3239]	Time 0.651 (0.516)	Data 0.001 (0.012)	Loss 4.5656 (4.7138)	Top-1 acc 19.922 (18.158)	Top-5 acc 40.234 (38.156)	lr 0.03121
Warmup Train [17][2620/3239]	Time 0.576 (0.516)	Data 0.001 (0.012)	Loss 4.8044 (4.7137)	Top-1 acc 15.234 (18.155)	Top-5 acc 35.547 (38.158)	lr 0.03120
Warmup Train [17][2630/3239]	Time 0.545 (0.516)	Data 0.001 (0.012)	Loss 4.7141 (4.7136)	Top-1 acc 17.188 (18.157)	Top-5 acc 41.016 (38.162)	lr 0.03119
Warmup Train [17][2640/3239]	Time 0.166 (0.516)	Data 0.001 (0.012)	Loss 4.5447 (4.7135)	Top-1 acc 23.047 (18.163)	Top-5 acc 44.531 (38.161)	lr 0.03119
Warmup Train [17][2650/3239]	Time 0.264 (0.516)	Data 0.001 (0.012)	Loss 4.7171 (4.7134)	Top-1 acc 17.969 (18.165)	Top-5 acc 37.109 (38.161)	lr 0.03118
Warmup Train [17][2660/3239]	Time 0.590 (0.516)	Data 0.001 (0.012)	Loss 4.6309 (4.7132)	Top-1 acc 17.188 (18.167)	Top-5 acc 39.844 (38.165)	lr 0.03118
Warmup Train [17][2670/3239]	Time 0.774 (0.516)	Data 0.002 (0.012)	Loss 4.7079 (4.7130)	Top-1 acc 16.797 (18.165)	Top-5 acc 39.453 (38.167)	lr 0.03117
Warmup Train [17][2680/3239]	Time 0.447 (0.516)	Data 0.001 (0.012)	Loss 4.7495 (4.7131)	Top-1 acc 16.016 (18.165)	Top-5 acc 37.500 (38.164)	lr 0.03117
Warmup Train [17][2690/3239]	Time 0.455 (0.516)	Data 0.001 (0.012)	Loss 4.8261 (4.7131)	Top-1 acc 13.281 (18.164)	Top-5 acc 33.594 (38.165)	lr 0.03116
Warmup Train [17][2700/3239]	Time 0.598 (0.516)	Data 0.001 (0.011)	Loss 4.6983 (4.7130)	Top-1 acc 21.484 (18.165)	Top-5 acc 42.188 (38.166)	lr 0.03115
Warmup Train [17][2710/3239]	Time 0.515 (0.516)	Data 0.001 (0.011)	Loss 4.7551 (4.7130)	Top-1 acc 17.188 (18.164)	Top-5 acc 36.328 (38.168)	lr 0.03115
Warmup Train [17][2720/3239]	Time 0.571 (0.516)	Data 0.001 (0.011)	Loss 4.8258 (4.7130)	Top-1 acc 17.578 (18.165)	Top-5 acc 36.328 (38.171)	lr 0.03114
Warmup Train [17][2730/3239]	Time 0.499 (0.516)	Data 0.001 (0.011)	Loss 4.6864 (4.7128)	Top-1 acc 21.875 (18.168)	Top-5 acc 39.062 (38.176)	lr 0.03114
Warmup Train [17][2740/3239]	Time 0.400 (0.516)	Data 0.001 (0.011)	Loss 4.6643 (4.7126)	Top-1 acc 16.797 (18.172)	Top-5 acc 39.062 (38.180)	lr 0.03113
Warmup Train [17][2750/3239]	Time 0.390 (0.516)	Data 0.001 (0.011)	Loss 4.5152 (4.7126)	Top-1 acc 20.312 (18.174)	Top-5 acc 43.359 (38.184)	lr 0.03112
Warmup Train [17][2760/3239]	Time 0.473 (0.516)	Data 0.001 (0.011)	Loss 4.8127 (4.7124)	Top-1 acc 17.969 (18.178)	Top-5 acc 33.594 (38.186)	lr 0.03112
Warmup Train [17][2770/3239]	Time 0.449 (0.516)	Data 0.001 (0.011)	Loss 4.7189 (4.7123)	Top-1 acc 20.312 (18.175)	Top-5 acc 36.719 (38.187)	lr 0.03111
Warmup Train [17][2780/3239]	Time 0.457 (0.516)	Data 0.001 (0.011)	Loss 4.5878 (4.7123)	Top-1 acc 17.188 (18.176)	Top-5 acc 39.844 (38.191)	lr 0.03111
Warmup Train [17][2790/3239]	Time 0.400 (0.516)	Data 0.001 (0.011)	Loss 4.4765 (4.7122)	Top-1 acc 19.531 (18.177)	Top-5 acc 42.969 (38.190)	lr 0.03110
Warmup Train [17][2800/3239]	Time 0.382 (0.516)	Data 0.001 (0.011)	Loss 4.5214 (4.7122)	Top-1 acc 21.875 (18.177)	Top-5 acc 42.578 (38.190)	lr 0.03110
Warmup Train [17][2810/3239]	Time 0.532 (0.516)	Data 0.001 (0.011)	Loss 4.7707 (4.7122)	Top-1 acc 18.359 (18.179)	Top-5 acc 35.938 (38.191)	lr 0.03109
Warmup Train [17][2820/3239]	Time 0.633 (0.516)	Data 0.001 (0.011)	Loss 4.7466 (4.7121)	Top-1 acc 16.016 (18.180)	Top-5 acc 36.719 (38.195)	lr 0.03108
Warmup Train [17][2830/3239]	Time 0.352 (0.516)	Data 0.001 (0.011)	Loss 4.8216 (4.7120)	Top-1 acc 16.797 (18.180)	Top-5 acc 34.375 (38.195)	lr 0.03108
Warmup Train [17][2840/3239]	Time 0.433 (0.516)	Data 0.001 (0.011)	Loss 4.7085 (4.7120)	Top-1 acc 17.969 (18.176)	Top-5 acc 35.156 (38.192)	lr 0.03107
Warmup Train [17][2850/3239]	Time 0.465 (0.516)	Data 0.001 (0.011)	Loss 4.5818 (4.7121)	Top-1 acc 19.141 (18.176)	Top-5 acc 44.141 (38.191)	lr 0.03107
Warmup Train [17][2860/3239]	Time 0.570 (0.516)	Data 0.001 (0.011)	Loss 4.7900 (4.7118)	Top-1 acc 16.016 (18.181)	Top-5 acc 37.891 (38.198)	lr 0.03106
Warmup Train [17][2870/3239]	Time 0.511 (0.516)	Data 0.001 (0.011)	Loss 4.8331 (4.7117)	Top-1 acc 18.750 (18.183)	Top-5 acc 33.594 (38.199)	lr 0.03105
Warmup Train [17][2880/3239]	Time 0.362 (0.516)	Data 0.002 (0.011)	Loss 4.7717 (4.7117)	Top-1 acc 16.406 (18.184)	Top-5 acc 35.938 (38.198)	lr 0.03105
Warmup Train [17][2890/3239]	Time 0.502 (0.515)	Data 0.001 (0.011)	Loss 4.5209 (4.7116)	Top-1 acc 24.219 (18.187)	Top-5 acc 45.703 (38.201)	lr 0.03104
Warmup Train [17][2900/3239]	Time 0.466 (0.515)	Data 0.001 (0.011)	Loss 4.5978 (4.7115)	Top-1 acc 19.141 (18.188)	Top-5 acc 41.406 (38.204)	lr 0.03104
Warmup Train [17][2910/3239]	Time 0.547 (0.515)	Data 0.001 (0.011)	Loss 4.5691 (4.7113)	Top-1 acc 18.750 (18.189)	Top-5 acc 43.750 (38.212)	lr 0.03103
Warmup Train [17][2920/3239]	Time 0.330 (0.515)	Data 0.001 (0.011)	Loss 4.6901 (4.7115)	Top-1 acc 22.266 (18.188)	Top-5 acc 41.797 (38.210)	lr 0.03102
Warmup Train [17][2930/3239]	Time 0.526 (0.515)	Data 0.001 (0.011)	Loss 4.6349 (4.7113)	Top-1 acc 20.703 (18.190)	Top-5 acc 37.891 (38.215)	lr 0.03102
Warmup Train [17][2940/3239]	Time 0.533 (0.515)	Data 0.001 (0.011)	Loss 4.6726 (4.7111)	Top-1 acc 19.922 (18.194)	Top-5 acc 35.938 (38.217)	lr 0.03101
Warmup Train [17][2950/3239]	Time 0.528 (0.515)	Data 0.001 (0.011)	Loss 4.7794 (4.7109)	Top-1 acc 14.453 (18.194)	Top-5 acc 34.375 (38.221)	lr 0.03101
Warmup Train [17][2960/3239]	Time 0.481 (0.515)	Data 0.001 (0.011)	Loss 4.5727 (4.7107)	Top-1 acc 21.875 (18.197)	Top-5 acc 42.578 (38.223)	lr 0.03100
Warmup Train [17][2970/3239]	Time 0.647 (0.515)	Data 0.001 (0.011)	Loss 4.5862 (4.7106)	Top-1 acc 19.922 (18.195)	Top-5 acc 42.578 (38.222)	lr 0.03100
Warmup Train [17][2980/3239]	Time 0.489 (0.515)	Data 0.001 (0.011)	Loss 4.8730 (4.7106)	Top-1 acc 18.359 (18.197)	Top-5 acc 33.984 (38.221)	lr 0.03099
Warmup Train [17][2990/3239]	Time 0.416 (0.515)	Data 0.001 (0.011)	Loss 4.7564 (4.7107)	Top-1 acc 19.531 (18.199)	Top-5 acc 37.891 (38.216)	lr 0.03098
Warmup Train [17][3000/3239]	Time 0.390 (0.515)	Data 0.001 (0.011)	Loss 4.5899 (4.7106)	Top-1 acc 19.141 (18.203)	Top-5 acc 37.500 (38.221)	lr 0.03098
Warmup Train [17][3010/3239]	Time 0.433 (0.515)	Data 0.001 (0.011)	Loss 4.7342 (4.7105)	Top-1 acc 18.359 (18.203)	Top-5 acc 36.719 (38.226)	lr 0.03097
Warmup Train [17][3020/3239]	Time 0.536 (0.515)	Data 0.001 (0.011)	Loss 4.7348 (4.7105)	Top-1 acc 17.969 (18.203)	Top-5 acc 34.766 (38.225)	lr 0.03097
Warmup Train [17][3030/3239]	Time 0.605 (0.515)	Data 0.002 (0.011)	Loss 4.7178 (4.7105)	Top-1 acc 19.922 (18.201)	Top-5 acc 37.500 (38.224)	lr 0.03096
Warmup Train [17][3040/3239]	Time 0.486 (0.515)	Data 0.001 (0.011)	Loss 4.6295 (4.7107)	Top-1 acc 19.531 (18.196)	Top-5 acc 37.891 (38.220)	lr 0.03095
Warmup Train [17][3050/3239]	Time 0.566 (0.515)	Data 0.001 (0.011)	Loss 4.6985 (4.7106)	Top-1 acc 18.750 (18.195)	Top-5 acc 37.891 (38.220)	lr 0.03095
Warmup Train [17][3060/3239]	Time 0.580 (0.515)	Data 0.001 (0.011)	Loss 4.5395 (4.7106)	Top-1 acc 19.922 (18.195)	Top-5 acc 38.672 (38.219)	lr 0.03094
Warmup Train [17][3070/3239]	Time 0.497 (0.515)	Data 0.002 (0.011)	Loss 4.7453 (4.7105)	Top-1 acc 17.578 (18.196)	Top-5 acc 33.984 (38.222)	lr 0.03094
Warmup Train [17][3080/3239]	Time 0.457 (0.515)	Data 0.001 (0.011)	Loss 4.8419 (4.7104)	Top-1 acc 15.625 (18.197)	Top-5 acc 33.594 (38.227)	lr 0.03093
Warmup Train [17][3090/3239]	Time 0.586 (0.515)	Data 0.001 (0.011)	Loss 4.6672 (4.7104)	Top-1 acc 19.141 (18.196)	Top-5 acc 38.281 (38.226)	lr 0.03092
Warmup Train [17][3100/3239]	Time 0.416 (0.515)	Data 0.001 (0.011)	Loss 4.7021 (4.7103)	Top-1 acc 18.359 (18.198)	Top-5 acc 35.938 (38.231)	lr 0.03092
Warmup Train [17][3110/3239]	Time 0.317 (0.515)	Data 0.001 (0.011)	Loss 4.7209 (4.7101)	Top-1 acc 17.969 (18.202)	Top-5 acc 34.766 (38.235)	lr 0.03091
Warmup Train [17][3120/3239]	Time 0.417 (0.515)	Data 0.001 (0.011)	Loss 4.5509 (4.7100)	Top-1 acc 18.750 (18.199)	Top-5 acc 41.797 (38.238)	lr 0.03091
Warmup Train [17][3130/3239]	Time 0.463 (0.515)	Data 0.001 (0.011)	Loss 4.7361 (4.7099)	Top-1 acc 17.969 (18.201)	Top-5 acc 36.328 (38.241)	lr 0.03090
Warmup Train [17][3140/3239]	Time 0.394 (0.515)	Data 0.001 (0.011)	Loss 4.9117 (4.7098)	Top-1 acc 15.234 (18.201)	Top-5 acc 31.641 (38.245)	lr 0.03090
Warmup Train [17][3150/3239]	Time 0.681 (0.515)	Data 0.001 (0.011)	Loss 4.6670 (4.7096)	Top-1 acc 19.141 (18.204)	Top-5 acc 42.969 (38.252)	lr 0.03089
Warmup Train [17][3160/3239]	Time 0.452 (0.515)	Data 0.001 (0.011)	Loss 4.6441 (4.7095)	Top-1 acc 21.875 (18.206)	Top-5 acc 42.578 (38.252)	lr 0.03088
Warmup Train [17][3170/3239]	Time 0.660 (0.515)	Data 0.001 (0.011)	Loss 4.6321 (4.7095)	Top-1 acc 15.625 (18.208)	Top-5 acc 39.844 (38.255)	lr 0.03088
Warmup Train [17][3180/3239]	Time 0.549 (0.514)	Data 0.000 (0.011)	Loss 4.5310 (4.7094)	Top-1 acc 17.969 (18.208)	Top-5 acc 42.969 (38.255)	lr 0.03087
Warmup Train [17][3190/3239]	Time 0.339 (0.514)	Data 0.000 (0.011)	Loss 4.7236 (4.7094)	Top-1 acc 19.141 (18.209)	Top-5 acc 36.328 (38.256)	lr 0.03087
Warmup Train [17][3200/3239]	Time 0.491 (0.514)	Data 0.000 (0.011)	Loss 4.8478 (4.7093)	Top-1 acc 16.797 (18.211)	Top-5 acc 37.500 (38.261)	lr 0.03086
Warmup Train [17][3210/3239]	Time 0.474 (0.514)	Data 0.000 (0.011)	Loss 4.6311 (4.7093)	Top-1 acc 20.703 (18.215)	Top-5 acc 43.359 (38.266)	lr 0.03085
Warmup Train [17][3220/3239]	Time 0.379 (0.514)	Data 0.000 (0.011)	Loss 4.8893 (4.7093)	Top-1 acc 15.234 (18.215)	Top-5 acc 32.422 (38.263)	lr 0.03085
Warmup Train [17][3230/3239]	Time 0.408 (0.514)	Data 0.000 (0.011)	Loss 4.8208 (4.7091)	Top-1 acc 16.406 (18.223)	Top-5 acc 35.938 (38.270)	lr 0.03084
Warmup Train [17][3239/3239]	Time 0.352 (0.514)	Data 0.000 (0.011)	Loss 4.6616 (4.7090)	Top-1 acc 22.222 (18.229)	Top-5 acc 40.741 (38.273)	lr 0.03084
==========Warmup Valid [17/40]	loss 3.777	top-1 acc 24.733	top-5 acc 47.754	Train top-1 18.229	top-5 38.273	flops: 442.4M
Warmup Train [18][0/3239]	Time 12.147 (12.147)	Data 10.936 (10.936)	Loss 4.5194 (4.5194)	Top-1 acc 22.656 (22.656)	Top-5 acc 43.750 (43.750)	lr 0.03084
Warmup Train [18][10/3239]	Time 0.534 (1.669)	Data 0.001 (1.034)	Loss 4.6569 (4.6314)	Top-1 acc 19.531 (19.744)	Top-5 acc 39.844 (40.483)	lr 0.03083
Warmup Train [18][20/3239]	Time 0.531 (1.120)	Data 0.001 (0.542)	Loss 4.6505 (4.6660)	Top-1 acc 16.797 (18.564)	Top-5 acc 35.938 (39.062)	lr 0.03082
Warmup Train [18][30/3239]	Time 0.583 (0.921)	Data 0.001 (0.369)	Loss 4.6693 (4.6583)	Top-1 acc 18.359 (18.712)	Top-5 acc 38.672 (39.239)	lr 0.03082
Warmup Train [18][40/3239]	Time 0.475 (0.815)	Data 0.001 (0.279)	Loss 4.6527 (4.6577)	Top-1 acc 18.750 (18.836)	Top-5 acc 39.844 (39.367)	lr 0.03081
Warmup Train [18][50/3239]	Time 0.625 (0.754)	Data 0.001 (0.225)	Loss 4.6327 (4.6654)	Top-1 acc 21.094 (18.681)	Top-5 acc 40.625 (39.116)	lr 0.03081
Warmup Train [18][60/3239]	Time 0.538 (0.707)	Data 0.001 (0.189)	Loss 4.5718 (4.6629)	Top-1 acc 20.703 (18.769)	Top-5 acc 39.453 (39.248)	lr 0.03080
Warmup Train [18][70/3239]	Time 0.535 (0.678)	Data 0.001 (0.163)	Loss 4.4139 (4.6596)	Top-1 acc 24.609 (18.899)	Top-5 acc 47.266 (39.453)	lr 0.03079
Warmup Train [18][80/3239]	Time 0.451 (0.655)	Data 0.001 (0.145)	Loss 4.8072 (4.6588)	Top-1 acc 19.531 (19.025)	Top-5 acc 36.719 (39.525)	lr 0.03079
Warmup Train [18][90/3239]	Time 0.611 (0.642)	Data 0.001 (0.130)	Loss 4.4667 (4.6520)	Top-1 acc 22.266 (19.235)	Top-5 acc 42.969 (39.706)	lr 0.03078
Warmup Train [18][100/3239]	Time 0.472 (0.627)	Data 0.001 (0.117)	Loss 4.7567 (4.6551)	Top-1 acc 17.188 (19.056)	Top-5 acc 37.500 (39.739)	lr 0.03078
Warmup Train [18][110/3239]	Time 0.520 (0.616)	Data 0.001 (0.108)	Loss 4.4909 (4.6608)	Top-1 acc 24.219 (19.053)	Top-5 acc 44.141 (39.590)	lr 0.03077
Warmup Train [18][120/3239]	Time 0.568 (0.607)	Data 0.001 (0.099)	Loss 4.8056 (4.6607)	Top-1 acc 15.234 (19.047)	Top-5 acc 31.641 (39.447)	lr 0.03077
Warmup Train [18][130/3239]	Time 0.347 (0.599)	Data 0.001 (0.092)	Loss 4.4954 (4.6607)	Top-1 acc 25.781 (19.096)	Top-5 acc 43.750 (39.355)	lr 0.03076
Warmup Train [18][140/3239]	Time 0.402 (0.592)	Data 0.001 (0.087)	Loss 4.9566 (4.6642)	Top-1 acc 16.016 (19.035)	Top-5 acc 31.250 (39.284)	lr 0.03075
Warmup Train [18][150/3239]	Time 0.346 (0.587)	Data 0.002 (0.082)	Loss 4.8090 (4.6678)	Top-1 acc 14.453 (18.944)	Top-5 acc 33.203 (39.205)	lr 0.03075
Warmup Train [18][160/3239]	Time 0.507 (0.584)	Data 0.001 (0.078)	Loss 4.6920 (4.6666)	Top-1 acc 19.922 (18.951)	Top-5 acc 40.625 (39.276)	lr 0.03074
Warmup Train [18][170/3239]	Time 0.487 (0.579)	Data 0.001 (0.074)	Loss 4.5487 (4.6653)	Top-1 acc 17.578 (18.967)	Top-5 acc 42.969 (39.273)	lr 0.03074
Warmup Train [18][180/3239]	Time 0.480 (0.575)	Data 0.001 (0.070)	Loss 4.7637 (4.6679)	Top-1 acc 17.578 (18.933)	Top-5 acc 36.328 (39.214)	lr 0.03073
Warmup Train [18][190/3239]	Time 0.527 (0.572)	Data 0.002 (0.067)	Loss 4.7404 (4.6643)	Top-1 acc 17.188 (18.942)	Top-5 acc 39.453 (39.263)	lr 0.03072
Warmup Train [18][200/3239]	Time 0.560 (0.569)	Data 0.002 (0.064)	Loss 4.8005 (4.6624)	Top-1 acc 18.359 (18.989)	Top-5 acc 38.281 (39.356)	lr 0.03072
Warmup Train [18][210/3239]	Time 0.489 (0.565)	Data 0.001 (0.061)	Loss 4.7106 (4.6635)	Top-1 acc 17.188 (18.987)	Top-5 acc 41.016 (39.333)	lr 0.03071
Warmup Train [18][220/3239]	Time 0.426 (0.562)	Data 0.001 (0.059)	Loss 4.9597 (4.6657)	Top-1 acc 13.672 (19.008)	Top-5 acc 33.203 (39.319)	lr 0.03071
Warmup Train [18][230/3239]	Time 0.590 (0.561)	Data 0.001 (0.057)	Loss 4.6648 (4.6668)	Top-1 acc 18.750 (18.980)	Top-5 acc 38.281 (39.279)	lr 0.03070
Warmup Train [18][240/3239]	Time 0.511 (0.560)	Data 0.001 (0.055)	Loss 4.5480 (4.6679)	Top-1 acc 17.969 (18.956)	Top-5 acc 39.453 (39.239)	lr 0.03069
Warmup Train [18][250/3239]	Time 0.535 (0.558)	Data 0.002 (0.053)	Loss 4.5377 (4.6670)	Top-1 acc 21.094 (18.960)	Top-5 acc 39.453 (39.221)	lr 0.03069
Warmup Train [18][260/3239]	Time 0.405 (0.556)	Data 0.001 (0.051)	Loss 4.5886 (4.6666)	Top-1 acc 16.797 (18.952)	Top-5 acc 37.891 (39.221)	lr 0.03068
Warmup Train [18][270/3239]	Time 0.738 (0.555)	Data 0.001 (0.049)	Loss 4.7115 (4.6668)	Top-1 acc 18.359 (18.936)	Top-5 acc 39.453 (39.241)	lr 0.03068
Warmup Train [18][280/3239]	Time 0.738 (0.554)	Data 0.001 (0.048)	Loss 4.8116 (4.6694)	Top-1 acc 17.188 (18.911)	Top-5 acc 37.891 (39.178)	lr 0.03067
Warmup Train [18][290/3239]	Time 0.679 (0.553)	Data 0.001 (0.046)	Loss 4.5570 (4.6696)	Top-1 acc 23.438 (18.880)	Top-5 acc 41.797 (39.178)	lr 0.03067
Warmup Train [18][300/3239]	Time 0.479 (0.552)	Data 0.001 (0.045)	Loss 4.7120 (4.6703)	Top-1 acc 19.141 (18.911)	Top-5 acc 37.109 (39.164)	lr 0.03066
Warmup Train [18][310/3239]	Time 0.671 (0.550)	Data 0.001 (0.043)	Loss 4.5943 (4.6690)	Top-1 acc 22.656 (18.950)	Top-5 acc 39.844 (39.186)	lr 0.03065
Warmup Train [18][320/3239]	Time 0.479 (0.547)	Data 0.001 (0.042)	Loss 4.8371 (4.6691)	Top-1 acc 15.234 (18.936)	Top-5 acc 33.203 (39.184)	lr 0.03065
Warmup Train [18][330/3239]	Time 0.519 (0.547)	Data 0.002 (0.041)	Loss 4.7060 (4.6695)	Top-1 acc 16.797 (18.914)	Top-5 acc 40.625 (39.173)	lr 0.03064
Warmup Train [18][340/3239]	Time 0.381 (0.544)	Data 0.001 (0.040)	Loss 4.6976 (4.6693)	Top-1 acc 16.797 (18.905)	Top-5 acc 39.844 (39.197)	lr 0.03064
Warmup Train [18][350/3239]	Time 0.504 (0.543)	Data 0.001 (0.039)	Loss 4.8595 (4.6701)	Top-1 acc 15.234 (18.882)	Top-5 acc 33.594 (39.178)	lr 0.03063
Warmup Train [18][360/3239]	Time 0.518 (0.541)	Data 0.001 (0.038)	Loss 4.7755 (4.6701)	Top-1 acc 15.625 (18.861)	Top-5 acc 37.109 (39.201)	lr 0.03062
Warmup Train [18][370/3239]	Time 0.542 (0.541)	Data 0.001 (0.037)	Loss 4.8314 (4.6708)	Top-1 acc 14.453 (18.834)	Top-5 acc 37.500 (39.175)	lr 0.03062
Warmup Train [18][380/3239]	Time 0.359 (0.540)	Data 0.001 (0.037)	Loss 4.6038 (4.6700)	Top-1 acc 21.094 (18.856)	Top-5 acc 39.844 (39.197)	lr 0.03061
Warmup Train [18][390/3239]	Time 0.656 (0.539)	Data 0.001 (0.036)	Loss 4.6576 (4.6698)	Top-1 acc 17.188 (18.831)	Top-5 acc 41.016 (39.167)	lr 0.03061
Warmup Train [18][400/3239]	Time 0.545 (0.538)	Data 0.001 (0.035)	Loss 4.5446 (4.6704)	Top-1 acc 24.219 (18.845)	Top-5 acc 44.922 (39.159)	lr 0.03060
Warmup Train [18][410/3239]	Time 0.536 (0.538)	Data 0.001 (0.034)	Loss 4.7078 (4.6702)	Top-1 acc 19.141 (18.852)	Top-5 acc 38.672 (39.149)	lr 0.03059
Warmup Train [18][420/3239]	Time 0.488 (0.537)	Data 0.001 (0.033)	Loss 4.6714 (4.6703)	Top-1 acc 20.703 (18.851)	Top-5 acc 37.500 (39.128)	lr 0.03059
Warmup Train [18][430/3239]	Time 0.648 (0.537)	Data 0.001 (0.033)	Loss 4.5876 (4.6701)	Top-1 acc 21.875 (18.874)	Top-5 acc 43.750 (39.145)	lr 0.03058
Warmup Train [18][440/3239]	Time 0.465 (0.535)	Data 0.001 (0.032)	Loss 4.7041 (4.6703)	Top-1 acc 15.234 (18.867)	Top-5 acc 39.453 (39.132)	lr 0.03058
Warmup Train [18][450/3239]	Time 0.413 (0.535)	Data 0.001 (0.031)	Loss 4.8077 (4.6697)	Top-1 acc 15.625 (18.869)	Top-5 acc 33.203 (39.125)	lr 0.03057
Warmup Train [18][460/3239]	Time 0.548 (0.534)	Data 0.001 (0.031)	Loss 4.5214 (4.6695)	Top-1 acc 19.531 (18.878)	Top-5 acc 42.969 (39.128)	lr 0.03056
Warmup Train [18][470/3239]	Time 0.691 (0.534)	Data 0.001 (0.030)	Loss 4.7285 (4.6691)	Top-1 acc 21.484 (18.905)	Top-5 acc 41.406 (39.152)	lr 0.03056
Warmup Train [18][480/3239]	Time 0.756 (0.534)	Data 0.001 (0.030)	Loss 4.5976 (4.6699)	Top-1 acc 19.922 (18.871)	Top-5 acc 42.188 (39.121)	lr 0.03055
Warmup Train [18][490/3239]	Time 0.520 (0.534)	Data 0.001 (0.029)	Loss 4.6657 (4.6700)	Top-1 acc 20.703 (18.876)	Top-5 acc 42.578 (39.133)	lr 0.03055
Warmup Train [18][500/3239]	Time 0.391 (0.533)	Data 0.001 (0.029)	Loss 4.6610 (4.6693)	Top-1 acc 20.312 (18.878)	Top-5 acc 41.016 (39.151)	lr 0.03054
Warmup Train [18][510/3239]	Time 0.461 (0.533)	Data 0.001 (0.029)	Loss 4.6042 (4.6688)	Top-1 acc 19.531 (18.888)	Top-5 acc 42.969 (39.173)	lr 0.03054
Warmup Train [18][520/3239]	Time 0.411 (0.532)	Data 0.001 (0.028)	Loss 4.6342 (4.6705)	Top-1 acc 19.141 (18.851)	Top-5 acc 39.453 (39.135)	lr 0.03053
Warmup Train [18][530/3239]	Time 0.457 (0.531)	Data 0.001 (0.028)	Loss 4.7024 (4.6711)	Top-1 acc 20.312 (18.851)	Top-5 acc 37.891 (39.140)	lr 0.03052
Warmup Train [18][540/3239]	Time 0.546 (0.531)	Data 0.001 (0.027)	Loss 4.5531 (4.6708)	Top-1 acc 23.047 (18.855)	Top-5 acc 43.359 (39.151)	lr 0.03052
Warmup Train [18][550/3239]	Time 0.618 (0.530)	Data 0.001 (0.027)	Loss 4.5784 (4.6707)	Top-1 acc 21.094 (18.852)	Top-5 acc 37.500 (39.148)	lr 0.03051
Warmup Train [18][560/3239]	Time 0.384 (0.529)	Data 0.001 (0.027)	Loss 4.6626 (4.6710)	Top-1 acc 19.531 (18.874)	Top-5 acc 39.453 (39.161)	lr 0.03051
Warmup Train [18][570/3239]	Time 0.644 (0.530)	Data 0.001 (0.026)	Loss 4.6819 (4.6705)	Top-1 acc 17.188 (18.888)	Top-5 acc 39.062 (39.177)	lr 0.03050
Warmup Train [18][580/3239]	Time 0.427 (0.530)	Data 0.001 (0.026)	Loss 4.6097 (4.6697)	Top-1 acc 16.406 (18.895)	Top-5 acc 39.062 (39.184)	lr 0.03049
Warmup Train [18][590/3239]	Time 0.551 (0.530)	Data 0.001 (0.026)	Loss 4.7128 (4.6697)	Top-1 acc 18.359 (18.877)	Top-5 acc 37.109 (39.178)	lr 0.03049
Warmup Train [18][600/3239]	Time 0.616 (0.529)	Data 0.001 (0.026)	Loss 4.9441 (4.6703)	Top-1 acc 10.547 (18.846)	Top-5 acc 32.422 (39.168)	lr 0.03048
Warmup Train [18][610/3239]	Time 0.375 (0.529)	Data 0.001 (0.025)	Loss 4.6687 (4.6694)	Top-1 acc 20.703 (18.857)	Top-5 acc 40.625 (39.191)	lr 0.03048
Warmup Train [18][620/3239]	Time 0.395 (0.529)	Data 0.002 (0.025)	Loss 4.3848 (4.6693)	Top-1 acc 25.781 (18.874)	Top-5 acc 47.266 (39.197)	lr 0.03047
Warmup Train [18][630/3239]	Time 0.460 (0.528)	Data 0.001 (0.025)	Loss 4.6734 (4.6686)	Top-1 acc 19.922 (18.869)	Top-5 acc 39.844 (39.206)	lr 0.03046
Warmup Train [18][640/3239]	Time 0.487 (0.527)	Data 0.001 (0.024)	Loss 4.8107 (4.6692)	Top-1 acc 16.797 (18.861)	Top-5 acc 32.812 (39.184)	lr 0.03046
Warmup Train [18][650/3239]	Time 0.558 (0.527)	Data 0.001 (0.024)	Loss 4.8394 (4.6691)	Top-1 acc 17.188 (18.869)	Top-5 acc 35.547 (39.190)	lr 0.03045
Warmup Train [18][660/3239]	Time 0.537 (0.527)	Data 0.001 (0.024)	Loss 4.5696 (4.6691)	Top-1 acc 19.922 (18.889)	Top-5 acc 39.453 (39.223)	lr 0.03045
Warmup Train [18][670/3239]	Time 0.519 (0.526)	Data 0.001 (0.023)	Loss 4.5417 (4.6687)	Top-1 acc 21.484 (18.904)	Top-5 acc 42.578 (39.228)	lr 0.03044
Warmup Train [18][680/3239]	Time 0.426 (0.526)	Data 0.001 (0.023)	Loss 4.5842 (4.6684)	Top-1 acc 17.969 (18.913)	Top-5 acc 38.281 (39.245)	lr 0.03043
Warmup Train [18][690/3239]	Time 0.485 (0.526)	Data 0.001 (0.023)	Loss 4.6150 (4.6675)	Top-1 acc 19.531 (18.936)	Top-5 acc 40.234 (39.268)	lr 0.03043
Warmup Train [18][700/3239]	Time 0.341 (0.525)	Data 0.001 (0.023)	Loss 4.5292 (4.6675)	Top-1 acc 21.484 (18.922)	Top-5 acc 41.016 (39.262)	lr 0.03042
Warmup Train [18][710/3239]	Time 0.490 (0.525)	Data 0.001 (0.022)	Loss 4.5700 (4.6674)	Top-1 acc 23.438 (18.941)	Top-5 acc 38.672 (39.249)	lr 0.03042
Warmup Train [18][720/3239]	Time 0.629 (0.526)	Data 0.001 (0.022)	Loss 4.5813 (4.6666)	Top-1 acc 17.188 (18.939)	Top-5 acc 42.969 (39.287)	lr 0.03041
Warmup Train [18][730/3239]	Time 0.421 (0.525)	Data 0.001 (0.022)	Loss 4.5761 (4.6664)	Top-1 acc 21.094 (18.946)	Top-5 acc 39.844 (39.295)	lr 0.03041
Warmup Train [18][740/3239]	Time 0.673 (0.525)	Data 0.001 (0.022)	Loss 4.8342 (4.6669)	Top-1 acc 14.453 (18.930)	Top-5 acc 35.156 (39.278)	lr 0.03040
Warmup Train [18][750/3239]	Time 0.430 (0.525)	Data 0.001 (0.022)	Loss 4.5811 (4.6665)	Top-1 acc 17.578 (18.924)	Top-5 acc 41.797 (39.281)	lr 0.03039
Warmup Train [18][760/3239]	Time 0.601 (0.525)	Data 0.001 (0.022)	Loss 4.7702 (4.6656)	Top-1 acc 17.969 (18.942)	Top-5 acc 39.453 (39.303)	lr 0.03039
Warmup Train [18][770/3239]	Time 0.348 (0.525)	Data 0.001 (0.021)	Loss 4.6309 (4.6654)	Top-1 acc 19.531 (18.942)	Top-5 acc 40.625 (39.305)	lr 0.03038
Warmup Train [18][780/3239]	Time 0.484 (0.525)	Data 0.001 (0.021)	Loss 4.7221 (4.6654)	Top-1 acc 14.844 (18.938)	Top-5 acc 37.109 (39.300)	lr 0.03038
Warmup Train [18][790/3239]	Time 0.597 (0.525)	Data 0.001 (0.021)	Loss 4.7523 (4.6658)	Top-1 acc 20.703 (18.933)	Top-5 acc 37.891 (39.309)	lr 0.03037
Warmup Train [18][800/3239]	Time 0.336 (0.525)	Data 0.001 (0.021)	Loss 4.6979 (4.6650)	Top-1 acc 17.578 (18.952)	Top-5 acc 40.234 (39.311)	lr 0.03036
Warmup Train [18][810/3239]	Time 0.519 (0.525)	Data 0.001 (0.021)	Loss 4.7244 (4.6646)	Top-1 acc 15.625 (18.960)	Top-5 acc 37.109 (39.334)	lr 0.03036
Warmup Train [18][820/3239]	Time 0.495 (0.524)	Data 0.001 (0.021)	Loss 4.7311 (4.6647)	Top-1 acc 20.703 (18.971)	Top-5 acc 39.453 (39.335)	lr 0.03035
Warmup Train [18][830/3239]	Time 0.499 (0.525)	Data 0.001 (0.021)	Loss 4.6839 (4.6647)	Top-1 acc 19.141 (18.958)	Top-5 acc 36.719 (39.325)	lr 0.03035
Warmup Train [18][840/3239]	Time 0.493 (0.524)	Data 0.001 (0.020)	Loss 4.6767 (4.6647)	Top-1 acc 21.094 (18.955)	Top-5 acc 40.234 (39.336)	lr 0.03034
Warmup Train [18][850/3239]	Time 0.372 (0.524)	Data 0.001 (0.020)	Loss 4.7765 (4.6647)	Top-1 acc 16.797 (18.954)	Top-5 acc 37.500 (39.337)	lr 0.03033
Warmup Train [18][860/3239]	Time 0.573 (0.524)	Data 0.001 (0.020)	Loss 4.7980 (4.6652)	Top-1 acc 15.625 (18.936)	Top-5 acc 33.984 (39.325)	lr 0.03033
Warmup Train [18][870/3239]	Time 0.544 (0.524)	Data 0.002 (0.020)	Loss 4.5278 (4.6651)	Top-1 acc 20.703 (18.938)	Top-5 acc 41.797 (39.316)	lr 0.03032
Warmup Train [18][880/3239]	Time 0.458 (0.523)	Data 0.001 (0.020)	Loss 4.7530 (4.6656)	Top-1 acc 20.703 (18.939)	Top-5 acc 37.109 (39.308)	lr 0.03032
Warmup Train [18][890/3239]	Time 0.181 (0.523)	Data 0.001 (0.020)	Loss 4.6925 (4.6653)	Top-1 acc 21.094 (18.936)	Top-5 acc 39.453 (39.306)	lr 0.03031
Warmup Train [18][900/3239]	Time 0.354 (0.523)	Data 0.001 (0.020)	Loss 4.8233 (4.6654)	Top-1 acc 13.672 (18.946)	Top-5 acc 38.672 (39.318)	lr 0.03030
Warmup Train [18][910/3239]	Time 0.432 (0.522)	Data 0.002 (0.020)	Loss 4.6363 (4.6654)	Top-1 acc 21.094 (18.948)	Top-5 acc 37.891 (39.320)	lr 0.03030
Warmup Train [18][920/3239]	Time 0.592 (0.522)	Data 0.001 (0.020)	Loss 4.6736 (4.6648)	Top-1 acc 22.266 (18.955)	Top-5 acc 40.625 (39.337)	lr 0.03029
Warmup Train [18][930/3239]	Time 0.516 (0.522)	Data 0.001 (0.020)	Loss 4.6386 (4.6649)	Top-1 acc 16.406 (18.955)	Top-5 acc 40.234 (39.328)	lr 0.03029
Warmup Train [18][940/3239]	Time 0.622 (0.522)	Data 0.001 (0.019)	Loss 4.4638 (4.6650)	Top-1 acc 21.875 (18.953)	Top-5 acc 45.703 (39.327)	lr 0.03028
Warmup Train [18][950/3239]	Time 0.527 (0.522)	Data 0.001 (0.019)	Loss 4.7283 (4.6651)	Top-1 acc 17.969 (18.950)	Top-5 acc 37.109 (39.334)	lr 0.03027
Warmup Train [18][960/3239]	Time 0.599 (0.522)	Data 0.001 (0.019)	Loss 4.6147 (4.6649)	Top-1 acc 19.141 (18.946)	Top-5 acc 41.406 (39.339)	lr 0.03027
Warmup Train [18][970/3239]	Time 0.398 (0.521)	Data 0.001 (0.019)	Loss 4.7565 (4.6650)	Top-1 acc 18.750 (18.939)	Top-5 acc 38.672 (39.345)	lr 0.03026
Warmup Train [18][980/3239]	Time 0.421 (0.521)	Data 0.001 (0.019)	Loss 4.5318 (4.6648)	Top-1 acc 21.094 (18.928)	Top-5 acc 43.750 (39.352)	lr 0.03026
Warmup Train [18][990/3239]	Time 0.358 (0.521)	Data 0.001 (0.019)	Loss 4.6784 (4.6643)	Top-1 acc 19.141 (18.953)	Top-5 acc 37.891 (39.373)	lr 0.03025
Warmup Train [18][1000/3239]	Time 0.389 (0.521)	Data 0.001 (0.019)	Loss 4.9217 (4.6643)	Top-1 acc 19.141 (18.949)	Top-5 acc 36.328 (39.367)	lr 0.03025
Warmup Train [18][1010/3239]	Time 0.514 (0.521)	Data 0.001 (0.019)	Loss 4.6902 (4.6637)	Top-1 acc 14.844 (18.940)	Top-5 acc 38.672 (39.375)	lr 0.03024
Warmup Train [18][1020/3239]	Time 0.676 (0.521)	Data 0.001 (0.019)	Loss 4.6927 (4.6636)	Top-1 acc 20.312 (18.949)	Top-5 acc 38.281 (39.382)	lr 0.03023
Warmup Train [18][1030/3239]	Time 0.471 (0.521)	Data 0.001 (0.018)	Loss 4.5437 (4.6637)	Top-1 acc 22.656 (18.944)	Top-5 acc 44.531 (39.382)	lr 0.03023
Warmup Train [18][1040/3239]	Time 0.493 (0.521)	Data 0.001 (0.018)	Loss 4.7253 (4.6637)	Top-1 acc 17.188 (18.944)	Top-5 acc 36.719 (39.380)	lr 0.03022
Warmup Train [18][1050/3239]	Time 0.521 (0.521)	Data 0.001 (0.018)	Loss 4.5350 (4.6633)	Top-1 acc 23.438 (18.952)	Top-5 acc 45.312 (39.380)	lr 0.03022
Warmup Train [18][1060/3239]	Time 0.475 (0.521)	Data 0.001 (0.018)	Loss 4.6463 (4.6630)	Top-1 acc 21.094 (18.958)	Top-5 acc 41.406 (39.387)	lr 0.03021
Warmup Train [18][1070/3239]	Time 0.523 (0.521)	Data 0.001 (0.018)	Loss 4.8711 (4.6631)	Top-1 acc 13.281 (18.947)	Top-5 acc 31.641 (39.372)	lr 0.03020
Warmup Train [18][1080/3239]	Time 0.462 (0.521)	Data 0.001 (0.018)	Loss 4.6808 (4.6632)	Top-1 acc 18.359 (18.951)	Top-5 acc 40.234 (39.373)	lr 0.03020
Warmup Train [18][1090/3239]	Time 0.445 (0.520)	Data 0.001 (0.018)	Loss 4.7255 (4.6635)	Top-1 acc 20.312 (18.954)	Top-5 acc 39.453 (39.367)	lr 0.03019
Warmup Train [18][1100/3239]	Time 0.650 (0.520)	Data 0.001 (0.018)	Loss 4.5559 (4.6640)	Top-1 acc 18.750 (18.944)	Top-5 acc 44.141 (39.370)	lr 0.03019
Warmup Train [18][1110/3239]	Time 0.483 (0.520)	Data 0.001 (0.018)	Loss 4.7375 (4.6634)	Top-1 acc 17.969 (18.947)	Top-5 acc 39.453 (39.382)	lr 0.03018
Warmup Train [18][1120/3239]	Time 0.554 (0.520)	Data 0.001 (0.018)	Loss 4.6214 (4.6629)	Top-1 acc 18.750 (18.949)	Top-5 acc 41.016 (39.394)	lr 0.03017
Warmup Train [18][1130/3239]	Time 0.691 (0.520)	Data 0.001 (0.017)	Loss 4.6112 (4.6622)	Top-1 acc 19.922 (18.969)	Top-5 acc 42.969 (39.409)	lr 0.03017
Warmup Train [18][1140/3239]	Time 0.431 (0.520)	Data 0.001 (0.017)	Loss 4.8503 (4.6622)	Top-1 acc 17.578 (18.970)	Top-5 acc 30.859 (39.400)	lr 0.03016
Warmup Train [18][1150/3239]	Time 0.596 (0.520)	Data 0.001 (0.017)	Loss 4.5645 (4.6621)	Top-1 acc 19.141 (18.970)	Top-5 acc 39.062 (39.401)	lr 0.03016
Warmup Train [18][1160/3239]	Time 0.665 (0.520)	Data 0.001 (0.017)	Loss 4.9362 (4.6616)	Top-1 acc 16.797 (18.988)	Top-5 acc 36.328 (39.419)	lr 0.03015
Warmup Train [18][1170/3239]	Time 0.448 (0.519)	Data 0.001 (0.017)	Loss 4.7425 (4.6615)	Top-1 acc 21.875 (18.997)	Top-5 acc 37.109 (39.417)	lr 0.03014
Warmup Train [18][1180/3239]	Time 0.477 (0.519)	Data 0.001 (0.017)	Loss 4.8067 (4.6615)	Top-1 acc 16.797 (18.993)	Top-5 acc 37.500 (39.413)	lr 0.03014
Warmup Train [18][1190/3239]	Time 0.292 (0.518)	Data 0.001 (0.017)	Loss 4.6508 (4.6615)	Top-1 acc 20.312 (18.991)	Top-5 acc 38.672 (39.416)	lr 0.03013
Warmup Train [18][1200/3239]	Time 0.572 (0.518)	Data 0.001 (0.017)	Loss 4.5780 (4.6617)	Top-1 acc 25.000 (18.993)	Top-5 acc 43.359 (39.412)	lr 0.03013
Warmup Train [18][1210/3239]	Time 0.629 (0.518)	Data 0.001 (0.017)	Loss 4.5451 (4.6613)	Top-1 acc 19.922 (19.002)	Top-5 acc 43.750 (39.422)	lr 0.03012
Warmup Train [18][1220/3239]	Time 0.531 (0.519)	Data 0.001 (0.017)	Loss 4.5236 (4.6606)	Top-1 acc 20.312 (19.013)	Top-5 acc 44.922 (39.432)	lr 0.03011
Warmup Train [18][1230/3239]	Time 0.537 (0.518)	Data 0.001 (0.016)	Loss 4.5919 (4.6604)	Top-1 acc 16.797 (19.014)	Top-5 acc 43.359 (39.439)	lr 0.03011
Warmup Train [18][1240/3239]	Time 0.528 (0.518)	Data 0.001 (0.016)	Loss 4.7680 (4.6608)	Top-1 acc 17.578 (19.010)	Top-5 acc 35.938 (39.426)	lr 0.03010
Warmup Train [18][1250/3239]	Time 0.559 (0.518)	Data 0.001 (0.016)	Loss 4.5299 (4.6607)	Top-1 acc 19.531 (19.017)	Top-5 acc 44.922 (39.428)	lr 0.03010
Warmup Train [18][1260/3239]	Time 0.628 (0.518)	Data 0.001 (0.016)	Loss 4.6391 (4.6604)	Top-1 acc 19.141 (19.015)	Top-5 acc 42.969 (39.433)	lr 0.03009
Warmup Train [18][1270/3239]	Time 0.600 (0.518)	Data 0.001 (0.016)	Loss 4.6756 (4.6603)	Top-1 acc 17.969 (19.009)	Top-5 acc 38.281 (39.433)	lr 0.03009
Warmup Train [18][1280/3239]	Time 0.464 (0.518)	Data 0.001 (0.016)	Loss 4.5322 (4.6606)	Top-1 acc 21.094 (19.008)	Top-5 acc 45.703 (39.432)	lr 0.03008
Warmup Train [18][1290/3239]	Time 0.582 (0.518)	Data 0.001 (0.016)	Loss 4.4269 (4.6600)	Top-1 acc 24.609 (19.018)	Top-5 acc 45.312 (39.456)	lr 0.03007
Warmup Train [18][1300/3239]	Time 0.353 (0.518)	Data 0.001 (0.016)	Loss 4.6749 (4.6603)	Top-1 acc 17.188 (19.013)	Top-5 acc 39.844 (39.450)	lr 0.03007
Warmup Train [18][1310/3239]	Time 0.429 (0.518)	Data 0.001 (0.016)	Loss 4.7573 (4.6603)	Top-1 acc 18.359 (19.016)	Top-5 acc 35.156 (39.444)	lr 0.03006
Warmup Train [18][1320/3239]	Time 0.347 (0.518)	Data 0.001 (0.016)	Loss 4.7827 (4.6598)	Top-1 acc 17.578 (19.012)	Top-5 acc 34.766 (39.453)	lr 0.03006
Warmup Train [18][1330/3239]	Time 0.412 (0.518)	Data 0.001 (0.016)	Loss 4.6346 (4.6593)	Top-1 acc 21.094 (19.025)	Top-5 acc 39.062 (39.465)	lr 0.03005
Warmup Train [18][1340/3239]	Time 0.540 (0.518)	Data 0.001 (0.016)	Loss 4.5361 (4.6595)	Top-1 acc 21.094 (19.030)	Top-5 acc 40.625 (39.464)	lr 0.03004
Warmup Train [18][1350/3239]	Time 0.548 (0.518)	Data 0.001 (0.016)	Loss 4.6835 (4.6595)	Top-1 acc 19.141 (19.023)	Top-5 acc 36.719 (39.457)	lr 0.03004
Warmup Train [18][1360/3239]	Time 0.571 (0.518)	Data 0.001 (0.016)	Loss 4.6707 (4.6596)	Top-1 acc 20.312 (19.019)	Top-5 acc 36.328 (39.454)	lr 0.03003
Warmup Train [18][1370/3239]	Time 0.392 (0.518)	Data 0.001 (0.016)	Loss 4.6605 (4.6592)	Top-1 acc 17.578 (19.020)	Top-5 acc 39.844 (39.470)	lr 0.03003
Warmup Train [18][1380/3239]	Time 0.526 (0.518)	Data 0.002 (0.016)	Loss 4.6612 (4.6592)	Top-1 acc 16.797 (19.016)	Top-5 acc 37.109 (39.469)	lr 0.03002
Warmup Train [18][1390/3239]	Time 0.485 (0.518)	Data 0.001 (0.015)	Loss 4.7942 (4.6594)	Top-1 acc 15.625 (19.011)	Top-5 acc 32.031 (39.463)	lr 0.03001
Warmup Train [18][1400/3239]	Time 0.558 (0.517)	Data 0.001 (0.015)	Loss 4.2962 (4.6589)	Top-1 acc 25.391 (19.017)	Top-5 acc 51.562 (39.471)	lr 0.03001
Warmup Train [18][1410/3239]	Time 0.561 (0.517)	Data 0.001 (0.015)	Loss 4.7334 (4.6591)	Top-1 acc 16.797 (19.014)	Top-5 acc 37.109 (39.464)	lr 0.03000
Warmup Train [18][1420/3239]	Time 0.526 (0.517)	Data 0.001 (0.015)	Loss 4.3856 (4.6585)	Top-1 acc 22.266 (19.027)	Top-5 acc 41.797 (39.469)	lr 0.03000
Warmup Train [18][1430/3239]	Time 0.459 (0.517)	Data 0.001 (0.015)	Loss 4.6686 (4.6586)	Top-1 acc 15.625 (19.015)	Top-5 acc 39.844 (39.471)	lr 0.02999
Warmup Train [18][1440/3239]	Time 0.486 (0.517)	Data 0.001 (0.015)	Loss 4.5689 (4.6582)	Top-1 acc 20.312 (19.021)	Top-5 acc 39.844 (39.476)	lr 0.02998
Warmup Train [18][1450/3239]	Time 0.566 (0.517)	Data 0.002 (0.015)	Loss 4.5624 (4.6578)	Top-1 acc 19.531 (19.033)	Top-5 acc 40.625 (39.484)	lr 0.02998
Warmup Train [18][1460/3239]	Time 0.691 (0.517)	Data 0.001 (0.015)	Loss 4.8498 (4.6575)	Top-1 acc 14.844 (19.036)	Top-5 acc 34.375 (39.491)	lr 0.02997
Warmup Train [18][1470/3239]	Time 0.206 (0.516)	Data 0.001 (0.015)	Loss 4.7059 (4.6573)	Top-1 acc 17.969 (19.041)	Top-5 acc 39.453 (39.498)	lr 0.02997
Warmup Train [18][1480/3239]	Time 0.488 (0.516)	Data 0.001 (0.015)	Loss 4.6083 (4.6572)	Top-1 acc 19.141 (19.048)	Top-5 acc 42.578 (39.501)	lr 0.02996
Warmup Train [18][1490/3239]	Time 0.366 (0.516)	Data 0.001 (0.015)	Loss 4.7202 (4.6571)	Top-1 acc 18.359 (19.052)	Top-5 acc 36.328 (39.500)	lr 0.02995
Warmup Train [18][1500/3239]	Time 0.584 (0.516)	Data 0.001 (0.015)	Loss 4.7468 (4.6567)	Top-1 acc 17.969 (19.054)	Top-5 acc 37.891 (39.506)	lr 0.02995
Warmup Train [18][1510/3239]	Time 0.381 (0.516)	Data 0.001 (0.015)	Loss 4.6068 (4.6566)	Top-1 acc 21.094 (19.062)	Top-5 acc 42.578 (39.505)	lr 0.02994
Warmup Train [18][1520/3239]	Time 0.601 (0.516)	Data 0.001 (0.015)	Loss 4.6899 (4.6565)	Top-1 acc 18.359 (19.057)	Top-5 acc 36.719 (39.500)	lr 0.02994
Warmup Train [18][1530/3239]	Time 0.428 (0.516)	Data 0.001 (0.015)	Loss 4.6027 (4.6563)	Top-1 acc 20.703 (19.057)	Top-5 acc 42.578 (39.508)	lr 0.02993
Warmup Train [18][1540/3239]	Time 0.363 (0.516)	Data 0.001 (0.015)	Loss 4.5964 (4.6563)	Top-1 acc 19.531 (19.057)	Top-5 acc 39.453 (39.510)	lr 0.02992
Warmup Train [18][1550/3239]	Time 0.504 (0.516)	Data 0.001 (0.015)	Loss 4.4204 (4.6558)	Top-1 acc 21.484 (19.058)	Top-5 acc 42.969 (39.520)	lr 0.02992
Warmup Train [18][1560/3239]	Time 0.455 (0.516)	Data 0.001 (0.014)	Loss 4.6107 (4.6560)	Top-1 acc 21.484 (19.055)	Top-5 acc 42.578 (39.512)	lr 0.02991
Warmup Train [18][1570/3239]	Time 0.405 (0.516)	Data 0.035 (0.014)	Loss 4.7343 (4.6559)	Top-1 acc 17.969 (19.054)	Top-5 acc 37.891 (39.517)	lr 0.02991
Warmup Train [18][1580/3239]	Time 0.604 (0.516)	Data 0.001 (0.014)	Loss 4.5230 (4.6555)	Top-1 acc 20.703 (19.057)	Top-5 acc 42.188 (39.527)	lr 0.02990
Warmup Train [18][1590/3239]	Time 0.567 (0.516)	Data 0.001 (0.014)	Loss 4.6359 (4.6553)	Top-1 acc 18.359 (19.063)	Top-5 acc 40.234 (39.527)	lr 0.02990
Warmup Train [18][1600/3239]	Time 0.540 (0.516)	Data 0.001 (0.014)	Loss 4.6384 (4.6549)	Top-1 acc 17.578 (19.068)	Top-5 acc 36.719 (39.529)	lr 0.02989
Warmup Train [18][1610/3239]	Time 0.527 (0.516)	Data 0.001 (0.014)	Loss 4.7173 (4.6550)	Top-1 acc 20.703 (19.072)	Top-5 acc 37.500 (39.526)	lr 0.02988
Warmup Train [18][1620/3239]	Time 0.639 (0.516)	Data 0.001 (0.014)	Loss 4.7938 (4.6552)	Top-1 acc 17.578 (19.079)	Top-5 acc 40.625 (39.527)	lr 0.02988
Warmup Train [18][1630/3239]	Time 0.564 (0.516)	Data 0.001 (0.014)	Loss 4.8103 (4.6552)	Top-1 acc 14.844 (19.069)	Top-5 acc 36.328 (39.522)	lr 0.02987
Warmup Train [18][1640/3239]	Time 0.521 (0.516)	Data 0.001 (0.014)	Loss 4.8577 (4.6553)	Top-1 acc 14.844 (19.062)	Top-5 acc 38.672 (39.519)	lr 0.02987
Warmup Train [18][1650/3239]	Time 0.598 (0.515)	Data 0.001 (0.014)	Loss 4.6853 (4.6552)	Top-1 acc 17.188 (19.059)	Top-5 acc 42.578 (39.520)	lr 0.02986
Warmup Train [18][1660/3239]	Time 0.677 (0.515)	Data 0.001 (0.014)	Loss 4.6244 (4.6552)	Top-1 acc 19.531 (19.052)	Top-5 acc 37.891 (39.517)	lr 0.02985
Warmup Train [18][1670/3239]	Time 0.425 (0.515)	Data 0.001 (0.014)	Loss 4.6478 (4.6552)	Top-1 acc 21.484 (19.051)	Top-5 acc 35.938 (39.517)	lr 0.02985
Warmup Train [18][1680/3239]	Time 0.599 (0.515)	Data 0.001 (0.014)	Loss 4.6737 (4.6551)	Top-1 acc 21.875 (19.047)	Top-5 acc 35.938 (39.509)	lr 0.02984
Warmup Train [18][1690/3239]	Time 0.394 (0.515)	Data 0.001 (0.014)	Loss 4.7502 (4.6554)	Top-1 acc 21.484 (19.043)	Top-5 acc 37.109 (39.502)	lr 0.02984
Warmup Train [18][1700/3239]	Time 0.521 (0.516)	Data 0.001 (0.014)	Loss 4.5990 (4.6553)	Top-1 acc 17.969 (19.039)	Top-5 acc 43.750 (39.507)	lr 0.02983
Warmup Train [18][1710/3239]	Time 0.429 (0.515)	Data 0.001 (0.014)	Loss 4.7143 (4.6549)	Top-1 acc 15.625 (19.043)	Top-5 acc 33.984 (39.512)	lr 0.02982
Warmup Train [18][1720/3239]	Time 0.537 (0.515)	Data 0.001 (0.014)	Loss 4.6118 (4.6547)	Top-1 acc 21.484 (19.049)	Top-5 acc 38.672 (39.521)	lr 0.02982
Warmup Train [18][1730/3239]	Time 0.364 (0.515)	Data 0.001 (0.013)	Loss 4.6145 (4.6547)	Top-1 acc 21.484 (19.049)	Top-5 acc 40.234 (39.530)	lr 0.02981
Warmup Train [18][1740/3239]	Time 0.514 (0.515)	Data 0.001 (0.013)	Loss 4.7231 (4.6545)	Top-1 acc 14.062 (19.051)	Top-5 acc 32.812 (39.529)	lr 0.02981
Warmup Train [18][1750/3239]	Time 0.350 (0.515)	Data 0.001 (0.013)	Loss 4.4686 (4.6542)	Top-1 acc 24.609 (19.057)	Top-5 acc 41.016 (39.537)	lr 0.02980
Warmup Train [18][1760/3239]	Time 0.675 (0.515)	Data 0.001 (0.013)	Loss 4.6820 (4.6541)	Top-1 acc 17.578 (19.055)	Top-5 acc 37.500 (39.539)	lr 0.02979
Warmup Train [18][1770/3239]	Time 0.625 (0.515)	Data 0.001 (0.013)	Loss 4.6085 (4.6540)	Top-1 acc 19.531 (19.059)	Top-5 acc 42.188 (39.546)	lr 0.02979
Warmup Train [18][1780/3239]	Time 0.694 (0.515)	Data 0.002 (0.013)	Loss 4.4738 (4.6541)	Top-1 acc 21.094 (19.051)	Top-5 acc 40.234 (39.535)	lr 0.02978
Warmup Train [18][1790/3239]	Time 0.556 (0.515)	Data 0.001 (0.013)	Loss 4.8041 (4.6538)	Top-1 acc 17.188 (19.056)	Top-5 acc 39.844 (39.545)	lr 0.02978
Warmup Train [18][1800/3239]	Time 0.509 (0.515)	Data 0.001 (0.013)	Loss 4.8766 (4.6539)	Top-1 acc 16.406 (19.054)	Top-5 acc 33.594 (39.545)	lr 0.02977
Warmup Train [18][1810/3239]	Time 0.427 (0.515)	Data 0.001 (0.013)	Loss 4.7717 (4.6535)	Top-1 acc 15.625 (19.058)	Top-5 acc 33.984 (39.550)	lr 0.02976
Warmup Train [18][1820/3239]	Time 0.546 (0.515)	Data 0.001 (0.013)	Loss 4.6924 (4.6535)	Top-1 acc 18.359 (19.062)	Top-5 acc 37.500 (39.551)	lr 0.02976
Warmup Train [18][1830/3239]	Time 0.421 (0.515)	Data 0.001 (0.013)	Loss 4.4710 (4.6532)	Top-1 acc 21.484 (19.070)	Top-5 acc 44.141 (39.560)	lr 0.02975
Warmup Train [18][1840/3239]	Time 0.651 (0.515)	Data 0.001 (0.013)	Loss 4.7012 (4.6535)	Top-1 acc 19.922 (19.066)	Top-5 acc 37.109 (39.552)	lr 0.02975
Warmup Train [18][1850/3239]	Time 0.458 (0.515)	Data 0.001 (0.013)	Loss 4.5050 (4.6535)	Top-1 acc 21.875 (19.068)	Top-5 acc 43.359 (39.552)	lr 0.02974
Warmup Train [18][1860/3239]	Time 0.542 (0.515)	Data 0.001 (0.013)	Loss 4.5674 (4.6533)	Top-1 acc 21.875 (19.074)	Top-5 acc 42.969 (39.558)	lr 0.02973
Warmup Train [18][1870/3239]	Time 0.397 (0.515)	Data 0.001 (0.013)	Loss 4.5237 (4.6535)	Top-1 acc 24.609 (19.074)	Top-5 acc 39.844 (39.556)	lr 0.02973
Warmup Train [18][1880/3239]	Time 0.501 (0.515)	Data 0.001 (0.013)	Loss 4.7573 (4.6533)	Top-1 acc 17.578 (19.073)	Top-5 acc 39.453 (39.557)	lr 0.02972
Warmup Train [18][1890/3239]	Time 0.587 (0.515)	Data 0.001 (0.013)	Loss 4.8215 (4.6532)	Top-1 acc 18.750 (19.069)	Top-5 acc 37.109 (39.559)	lr 0.02972
Warmup Train [18][1900/3239]	Time 0.522 (0.515)	Data 0.001 (0.013)	Loss 4.4502 (4.6532)	Top-1 acc 19.141 (19.067)	Top-5 acc 46.875 (39.557)	lr 0.02971
Warmup Train [18][1910/3239]	Time 0.508 (0.515)	Data 0.001 (0.013)	Loss 4.7575 (4.6533)	Top-1 acc 17.969 (19.072)	Top-5 acc 37.109 (39.554)	lr 0.02970
Warmup Train [18][1920/3239]	Time 0.427 (0.515)	Data 0.001 (0.013)	Loss 4.6938 (4.6531)	Top-1 acc 18.359 (19.072)	Top-5 acc 39.844 (39.552)	lr 0.02970
Warmup Train [18][1930/3239]	Time 0.536 (0.515)	Data 0.001 (0.013)	Loss 4.6023 (4.6530)	Top-1 acc 18.750 (19.082)	Top-5 acc 37.109 (39.558)	lr 0.02969
Warmup Train [18][1940/3239]	Time 0.393 (0.515)	Data 0.002 (0.013)	Loss 4.7159 (4.6532)	Top-1 acc 19.141 (19.084)	Top-5 acc 37.109 (39.556)	lr 0.02969
Warmup Train [18][1950/3239]	Time 0.423 (0.515)	Data 0.001 (0.013)	Loss 4.7458 (4.6533)	Top-1 acc 16.406 (19.085)	Top-5 acc 39.062 (39.558)	lr 0.02968
Warmup Train [18][1960/3239]	Time 0.442 (0.515)	Data 0.001 (0.013)	Loss 4.9185 (4.6534)	Top-1 acc 14.453 (19.078)	Top-5 acc 34.766 (39.553)	lr 0.02968
Warmup Train [18][1970/3239]	Time 0.508 (0.515)	Data 0.001 (0.013)	Loss 4.5165 (4.6532)	Top-1 acc 21.484 (19.081)	Top-5 acc 45.703 (39.563)	lr 0.02967
Warmup Train [18][1980/3239]	Time 0.419 (0.515)	Data 0.001 (0.013)	Loss 4.6615 (4.6531)	Top-1 acc 20.312 (19.085)	Top-5 acc 40.625 (39.574)	lr 0.02966
Warmup Train [18][1990/3239]	Time 0.513 (0.515)	Data 0.001 (0.013)	Loss 4.7394 (4.6532)	Top-1 acc 19.141 (19.089)	Top-5 acc 42.578 (39.574)	lr 0.02966
Warmup Train [18][2000/3239]	Time 0.384 (0.514)	Data 0.001 (0.013)	Loss 4.3630 (4.6530)	Top-1 acc 25.000 (19.094)	Top-5 acc 47.266 (39.575)	lr 0.02965
Warmup Train [18][2010/3239]	Time 0.440 (0.514)	Data 0.001 (0.013)	Loss 4.7780 (4.6530)	Top-1 acc 14.062 (19.087)	Top-5 acc 36.328 (39.578)	lr 0.02965
Warmup Train [18][2020/3239]	Time 0.394 (0.514)	Data 0.001 (0.013)	Loss 4.6340 (4.6526)	Top-1 acc 19.141 (19.091)	Top-5 acc 39.844 (39.587)	lr 0.02964
Warmup Train [18][2030/3239]	Time 0.311 (0.514)	Data 0.002 (0.013)	Loss 4.8284 (4.6525)	Top-1 acc 18.359 (19.094)	Top-5 acc 36.719 (39.590)	lr 0.02963
Warmup Train [18][2040/3239]	Time 0.534 (0.514)	Data 0.001 (0.013)	Loss 4.6017 (4.6524)	Top-1 acc 19.531 (19.094)	Top-5 acc 41.797 (39.594)	lr 0.02963
Warmup Train [18][2050/3239]	Time 0.409 (0.514)	Data 0.001 (0.013)	Loss 4.7899 (4.6524)	Top-1 acc 17.969 (19.092)	Top-5 acc 36.719 (39.597)	lr 0.02962
Warmup Train [18][2060/3239]	Time 0.459 (0.514)	Data 0.002 (0.013)	Loss 4.5538 (4.6523)	Top-1 acc 22.266 (19.100)	Top-5 acc 42.188 (39.600)	lr 0.02962
Warmup Train [18][2070/3239]	Time 0.467 (0.514)	Data 0.002 (0.013)	Loss 4.5947 (4.6520)	Top-1 acc 22.266 (19.105)	Top-5 acc 41.406 (39.605)	lr 0.02961
Warmup Train [18][2080/3239]	Time 0.548 (0.514)	Data 0.001 (0.013)	Loss 4.7733 (4.6521)	Top-1 acc 14.844 (19.104)	Top-5 acc 37.500 (39.603)	lr 0.02960
Warmup Train [18][2090/3239]	Time 0.605 (0.514)	Data 0.001 (0.013)	Loss 4.6504 (4.6522)	Top-1 acc 19.141 (19.101)	Top-5 acc 39.844 (39.601)	lr 0.02960
Warmup Train [18][2100/3239]	Time 0.417 (0.514)	Data 0.001 (0.012)	Loss 4.5348 (4.6519)	Top-1 acc 21.484 (19.108)	Top-5 acc 42.578 (39.606)	lr 0.02959
Warmup Train [18][2110/3239]	Time 0.526 (0.514)	Data 0.001 (0.012)	Loss 4.4409 (4.6518)	Top-1 acc 22.266 (19.109)	Top-5 acc 46.875 (39.608)	lr 0.02959
Warmup Train [18][2120/3239]	Time 0.586 (0.514)	Data 0.001 (0.012)	Loss 4.7113 (4.6518)	Top-1 acc 12.500 (19.109)	Top-5 acc 39.062 (39.610)	lr 0.02958
Warmup Train [18][2130/3239]	Time 0.577 (0.514)	Data 0.001 (0.012)	Loss 4.4669 (4.6517)	Top-1 acc 19.922 (19.108)	Top-5 acc 45.312 (39.612)	lr 0.02957
Warmup Train [18][2140/3239]	Time 0.580 (0.514)	Data 0.001 (0.012)	Loss 4.6223 (4.6515)	Top-1 acc 19.922 (19.108)	Top-5 acc 41.406 (39.619)	lr 0.02957
Warmup Train [18][2150/3239]	Time 0.598 (0.514)	Data 0.001 (0.012)	Loss 4.7713 (4.6513)	Top-1 acc 20.312 (19.115)	Top-5 acc 37.891 (39.628)	lr 0.02956
Warmup Train [18][2160/3239]	Time 0.484 (0.514)	Data 0.001 (0.012)	Loss 4.4301 (4.6511)	Top-1 acc 25.000 (19.124)	Top-5 acc 44.922 (39.632)	lr 0.02956
Warmup Train [18][2170/3239]	Time 0.465 (0.514)	Data 0.001 (0.012)	Loss 4.7001 (4.6511)	Top-1 acc 17.188 (19.125)	Top-5 acc 40.625 (39.634)	lr 0.02955
Warmup Train [18][2180/3239]	Time 0.556 (0.514)	Data 0.001 (0.012)	Loss 4.6834 (4.6509)	Top-1 acc 19.922 (19.127)	Top-5 acc 39.453 (39.636)	lr 0.02954
Warmup Train [18][2190/3239]	Time 0.788 (0.514)	Data 0.001 (0.012)	Loss 4.7175 (4.6508)	Top-1 acc 16.406 (19.129)	Top-5 acc 38.281 (39.641)	lr 0.02954
Warmup Train [18][2200/3239]	Time 0.452 (0.514)	Data 0.001 (0.012)	Loss 4.4399 (4.6508)	Top-1 acc 23.047 (19.129)	Top-5 acc 41.016 (39.642)	lr 0.02953
Warmup Train [18][2210/3239]	Time 0.548 (0.514)	Data 0.001 (0.012)	Loss 4.4791 (4.6512)	Top-1 acc 22.656 (19.120)	Top-5 acc 42.188 (39.634)	lr 0.02953
Warmup Train [18][2220/3239]	Time 0.360 (0.514)	Data 0.001 (0.012)	Loss 4.6960 (4.6512)	Top-1 acc 16.406 (19.124)	Top-5 acc 36.719 (39.635)	lr 0.02952
Warmup Train [18][2230/3239]	Time 0.380 (0.514)	Data 0.001 (0.012)	Loss 4.4923 (4.6508)	Top-1 acc 19.141 (19.132)	Top-5 acc 41.797 (39.642)	lr 0.02951
Warmup Train [18][2240/3239]	Time 0.477 (0.514)	Data 0.001 (0.012)	Loss 4.4726 (4.6506)	Top-1 acc 27.344 (19.140)	Top-5 acc 48.438 (39.646)	lr 0.02951
Warmup Train [18][2250/3239]	Time 0.387 (0.514)	Data 0.001 (0.012)	Loss 4.8087 (4.6507)	Top-1 acc 18.359 (19.140)	Top-5 acc 35.156 (39.646)	lr 0.02950
Warmup Train [18][2260/3239]	Time 0.502 (0.514)	Data 0.001 (0.012)	Loss 4.5980 (4.6506)	Top-1 acc 19.141 (19.142)	Top-5 acc 40.234 (39.644)	lr 0.02950
Warmup Train [18][2270/3239]	Time 0.456 (0.514)	Data 0.001 (0.012)	Loss 4.6527 (4.6506)	Top-1 acc 17.969 (19.144)	Top-5 acc 40.625 (39.649)	lr 0.02949
Warmup Train [18][2280/3239]	Time 0.324 (0.514)	Data 0.001 (0.012)	Loss 4.6803 (4.6506)	Top-1 acc 15.625 (19.141)	Top-5 acc 38.672 (39.647)	lr 0.02948
Warmup Train [18][2290/3239]	Time 0.714 (0.513)	Data 0.001 (0.012)	Loss 4.6930 (4.6502)	Top-1 acc 17.188 (19.145)	Top-5 acc 37.109 (39.657)	lr 0.02948
Warmup Train [18][2300/3239]	Time 0.448 (0.513)	Data 0.001 (0.012)	Loss 4.6060 (4.6502)	Top-1 acc 20.703 (19.149)	Top-5 acc 40.234 (39.656)	lr 0.02947
Warmup Train [18][2310/3239]	Time 0.364 (0.513)	Data 0.001 (0.012)	Loss 4.4338 (4.6499)	Top-1 acc 22.656 (19.156)	Top-5 acc 44.141 (39.664)	lr 0.02947
Warmup Train [18][2320/3239]	Time 0.489 (0.513)	Data 0.001 (0.012)	Loss 4.7627 (4.6499)	Top-1 acc 16.406 (19.157)	Top-5 acc 35.938 (39.667)	lr 0.02946
Warmup Train [18][2330/3239]	Time 0.649 (0.513)	Data 0.001 (0.012)	Loss 4.6546 (4.6497)	Top-1 acc 21.094 (19.163)	Top-5 acc 39.062 (39.673)	lr 0.02945
Warmup Train [18][2340/3239]	Time 0.303 (0.513)	Data 0.001 (0.012)	Loss 4.6168 (4.6496)	Top-1 acc 17.969 (19.168)	Top-5 acc 37.109 (39.678)	lr 0.02945
Warmup Train [18][2350/3239]	Time 0.492 (0.513)	Data 0.001 (0.012)	Loss 4.4636 (4.6494)	Top-1 acc 21.094 (19.172)	Top-5 acc 45.312 (39.682)	lr 0.02944
Warmup Train [18][2360/3239]	Time 0.359 (0.513)	Data 0.001 (0.012)	Loss 4.7009 (4.6493)	Top-1 acc 18.750 (19.172)	Top-5 acc 38.672 (39.682)	lr 0.02944
Warmup Train [18][2370/3239]	Time 0.536 (0.513)	Data 0.001 (0.012)	Loss 4.7970 (4.6496)	Top-1 acc 19.922 (19.167)	Top-5 acc 38.281 (39.680)	lr 0.02943
Warmup Train [18][2380/3239]	Time 0.544 (0.513)	Data 0.001 (0.012)	Loss 4.7649 (4.6498)	Top-1 acc 16.406 (19.167)	Top-5 acc 36.719 (39.678)	lr 0.02942
Warmup Train [18][2390/3239]	Time 0.432 (0.513)	Data 0.001 (0.012)	Loss 4.5241 (4.6497)	Top-1 acc 17.188 (19.168)	Top-5 acc 42.188 (39.678)	lr 0.02942
Warmup Train [18][2400/3239]	Time 0.370 (0.513)	Data 0.001 (0.012)	Loss 4.5854 (4.6497)	Top-1 acc 19.531 (19.169)	Top-5 acc 40.625 (39.683)	lr 0.02941
Warmup Train [18][2410/3239]	Time 0.760 (0.513)	Data 0.001 (0.012)	Loss 4.6325 (4.6498)	Top-1 acc 21.484 (19.166)	Top-5 acc 39.062 (39.676)	lr 0.02941
Warmup Train [18][2420/3239]	Time 0.606 (0.513)	Data 0.001 (0.012)	Loss 4.8765 (4.6497)	Top-1 acc 16.406 (19.164)	Top-5 acc 35.938 (39.678)	lr 0.02940
Warmup Train [18][2430/3239]	Time 0.353 (0.513)	Data 0.001 (0.012)	Loss 4.6365 (4.6496)	Top-1 acc 20.703 (19.167)	Top-5 acc 41.406 (39.680)	lr 0.02939
Warmup Train [18][2440/3239]	Time 0.438 (0.513)	Data 0.001 (0.012)	Loss 4.7249 (4.6494)	Top-1 acc 16.797 (19.173)	Top-5 acc 41.406 (39.692)	lr 0.02939
Warmup Train [18][2450/3239]	Time 0.530 (0.513)	Data 0.001 (0.012)	Loss 4.4539 (4.6493)	Top-1 acc 20.703 (19.176)	Top-5 acc 44.141 (39.698)	lr 0.02938
Warmup Train [18][2460/3239]	Time 0.517 (0.513)	Data 0.001 (0.012)	Loss 4.4936 (4.6490)	Top-1 acc 21.094 (19.181)	Top-5 acc 42.578 (39.706)	lr 0.02938
Warmup Train [18][2470/3239]	Time 0.461 (0.513)	Data 0.001 (0.012)	Loss 4.7217 (4.6488)	Top-1 acc 18.750 (19.184)	Top-5 acc 36.719 (39.710)	lr 0.02937
Warmup Train [18][2480/3239]	Time 0.536 (0.513)	Data 0.001 (0.012)	Loss 4.6861 (4.6488)	Top-1 acc 19.531 (19.183)	Top-5 acc 37.500 (39.714)	lr 0.02937
Warmup Train [18][2490/3239]	Time 0.427 (0.513)	Data 0.001 (0.012)	Loss 4.7916 (4.6487)	Top-1 acc 15.625 (19.186)	Top-5 acc 35.938 (39.717)	lr 0.02936
Warmup Train [18][2500/3239]	Time 0.405 (0.513)	Data 0.001 (0.012)	Loss 4.7012 (4.6488)	Top-1 acc 20.312 (19.188)	Top-5 acc 37.500 (39.715)	lr 0.02935
Warmup Train [18][2510/3239]	Time 0.560 (0.513)	Data 0.001 (0.012)	Loss 4.2960 (4.6485)	Top-1 acc 21.094 (19.188)	Top-5 acc 46.875 (39.721)	lr 0.02935
Warmup Train [18][2520/3239]	Time 0.421 (0.513)	Data 0.001 (0.012)	Loss 4.8469 (4.6481)	Top-1 acc 16.406 (19.194)	Top-5 acc 32.422 (39.730)	lr 0.02934
Warmup Train [18][2530/3239]	Time 0.485 (0.513)	Data 0.001 (0.012)	Loss 4.6356 (4.6481)	Top-1 acc 19.141 (19.192)	Top-5 acc 36.719 (39.730)	lr 0.02934
Warmup Train [18][2540/3239]	Time 0.557 (0.513)	Data 0.001 (0.012)	Loss 4.6437 (4.6482)	Top-1 acc 15.625 (19.181)	Top-5 acc 39.844 (39.723)	lr 0.02933
Warmup Train [18][2550/3239]	Time 0.440 (0.513)	Data 0.002 (0.011)	Loss 4.5752 (4.6480)	Top-1 acc 20.312 (19.182)	Top-5 acc 46.875 (39.732)	lr 0.02932
Warmup Train [18][2560/3239]	Time 0.381 (0.513)	Data 0.001 (0.011)	Loss 4.7264 (4.6478)	Top-1 acc 20.703 (19.185)	Top-5 acc 38.672 (39.735)	lr 0.02932
Warmup Train [18][2570/3239]	Time 0.601 (0.513)	Data 0.001 (0.012)	Loss 4.5364 (4.6475)	Top-1 acc 20.312 (19.186)	Top-5 acc 42.188 (39.744)	lr 0.02931
Warmup Train [18][2580/3239]	Time 0.443 (0.513)	Data 0.001 (0.011)	Loss 4.6554 (4.6474)	Top-1 acc 20.703 (19.187)	Top-5 acc 36.328 (39.743)	lr 0.02931
Warmup Train [18][2590/3239]	Time 0.698 (0.513)	Data 0.001 (0.011)	Loss 4.8341 (4.6476)	Top-1 acc 15.625 (19.185)	Top-5 acc 35.547 (39.738)	lr 0.02930
Warmup Train [18][2600/3239]	Time 0.577 (0.513)	Data 0.001 (0.011)	Loss 4.5153 (4.6474)	Top-1 acc 21.094 (19.192)	Top-5 acc 42.578 (39.738)	lr 0.02929
Warmup Train [18][2610/3239]	Time 0.536 (0.513)	Data 0.001 (0.011)	Loss 4.7359 (4.6474)	Top-1 acc 19.141 (19.190)	Top-5 acc 34.375 (39.736)	lr 0.02929
Warmup Train [18][2620/3239]	Time 0.385 (0.513)	Data 0.001 (0.011)	Loss 4.5631 (4.6472)	Top-1 acc 19.531 (19.191)	Top-5 acc 37.500 (39.740)	lr 0.02928
Warmup Train [18][2630/3239]	Time 0.565 (0.513)	Data 0.001 (0.011)	Loss 4.6237 (4.6470)	Top-1 acc 19.141 (19.191)	Top-5 acc 41.797 (39.743)	lr 0.02928
Warmup Train [18][2640/3239]	Time 0.493 (0.513)	Data 0.001 (0.011)	Loss 4.5079 (4.6469)	Top-1 acc 18.359 (19.190)	Top-5 acc 42.188 (39.744)	lr 0.02927
Warmup Train [18][2650/3239]	Time 0.587 (0.513)	Data 0.001 (0.011)	Loss 4.5749 (4.6469)	Top-1 acc 23.828 (19.190)	Top-5 acc 45.312 (39.747)	lr 0.02926
Warmup Train [18][2660/3239]	Time 0.525 (0.513)	Data 0.001 (0.011)	Loss 4.6184 (4.6470)	Top-1 acc 20.312 (19.187)	Top-5 acc 42.969 (39.745)	lr 0.02926
Warmup Train [18][2670/3239]	Time 0.292 (0.513)	Data 0.001 (0.011)	Loss 4.4274 (4.6467)	Top-1 acc 22.656 (19.190)	Top-5 acc 43.750 (39.752)	lr 0.02925
Warmup Train [18][2680/3239]	Time 0.317 (0.513)	Data 0.001 (0.011)	Loss 4.5608 (4.6466)	Top-1 acc 21.094 (19.192)	Top-5 acc 42.578 (39.754)	lr 0.02925
Warmup Train [18][2690/3239]	Time 0.465 (0.513)	Data 0.001 (0.011)	Loss 4.6499 (4.6466)	Top-1 acc 17.969 (19.192)	Top-5 acc 41.016 (39.754)	lr 0.02924
Warmup Train [18][2700/3239]	Time 0.651 (0.513)	Data 0.001 (0.011)	Loss 4.6767 (4.6465)	Top-1 acc 20.703 (19.195)	Top-5 acc 39.844 (39.759)	lr 0.02923
Warmup Train [18][2710/3239]	Time 0.457 (0.513)	Data 0.001 (0.011)	Loss 4.7617 (4.6466)	Top-1 acc 19.141 (19.196)	Top-5 acc 37.891 (39.758)	lr 0.02923
Warmup Train [18][2720/3239]	Time 0.437 (0.513)	Data 0.001 (0.011)	Loss 4.6936 (4.6464)	Top-1 acc 20.312 (19.201)	Top-5 acc 41.406 (39.763)	lr 0.02922
Warmup Train [18][2730/3239]	Time 0.358 (0.513)	Data 0.003 (0.011)	Loss 4.6769 (4.6465)	Top-1 acc 16.797 (19.200)	Top-5 acc 39.453 (39.763)	lr 0.02922
Warmup Train [18][2740/3239]	Time 0.504 (0.513)	Data 0.001 (0.011)	Loss 4.7291 (4.6465)	Top-1 acc 17.188 (19.199)	Top-5 acc 37.109 (39.763)	lr 0.02921
Warmup Train [18][2750/3239]	Time 0.360 (0.513)	Data 0.001 (0.011)	Loss 4.5962 (4.6467)	Top-1 acc 20.312 (19.198)	Top-5 acc 40.234 (39.757)	lr 0.02920
Warmup Train [18][2760/3239]	Time 0.575 (0.513)	Data 0.001 (0.011)	Loss 4.6541 (4.6466)	Top-1 acc 22.266 (19.204)	Top-5 acc 39.062 (39.761)	lr 0.02920
Warmup Train [18][2770/3239]	Time 0.570 (0.513)	Data 0.001 (0.011)	Loss 4.6103 (4.6466)	Top-1 acc 20.312 (19.204)	Top-5 acc 39.453 (39.758)	lr 0.02919
Warmup Train [18][2780/3239]	Time 0.347 (0.513)	Data 0.001 (0.011)	Loss 4.4169 (4.6465)	Top-1 acc 19.141 (19.205)	Top-5 acc 47.266 (39.763)	lr 0.02919
Warmup Train [18][2790/3239]	Time 0.396 (0.513)	Data 0.001 (0.011)	Loss 4.8653 (4.6465)	Top-1 acc 13.672 (19.206)	Top-5 acc 37.109 (39.766)	lr 0.02918
Warmup Train [18][2800/3239]	Time 0.663 (0.513)	Data 0.001 (0.011)	Loss 4.7403 (4.6465)	Top-1 acc 17.969 (19.207)	Top-5 acc 38.281 (39.769)	lr 0.02917
Warmup Train [18][2810/3239]	Time 0.407 (0.513)	Data 0.001 (0.011)	Loss 4.5477 (4.6466)	Top-1 acc 22.656 (19.206)	Top-5 acc 42.188 (39.768)	lr 0.02917
Warmup Train [18][2820/3239]	Time 0.487 (0.513)	Data 0.001 (0.011)	Loss 4.5163 (4.6465)	Top-1 acc 21.094 (19.207)	Top-5 acc 42.578 (39.772)	lr 0.02916
Warmup Train [18][2830/3239]	Time 0.541 (0.513)	Data 0.001 (0.011)	Loss 4.4513 (4.6463)	Top-1 acc 23.438 (19.209)	Top-5 acc 45.312 (39.777)	lr 0.02916
Warmup Train [18][2840/3239]	Time 0.552 (0.513)	Data 0.001 (0.011)	Loss 4.4640 (4.6461)	Top-1 acc 19.922 (19.208)	Top-5 acc 44.531 (39.783)	lr 0.02915
Warmup Train [18][2850/3239]	Time 0.616 (0.513)	Data 0.001 (0.011)	Loss 4.5903 (4.6459)	Top-1 acc 19.922 (19.207)	Top-5 acc 41.016 (39.789)	lr 0.02914
Warmup Train [18][2860/3239]	Time 0.225 (0.513)	Data 0.027 (0.011)	Loss 4.5541 (4.6458)	Top-1 acc 19.141 (19.208)	Top-5 acc 42.188 (39.788)	lr 0.02914
Warmup Train [18][2870/3239]	Time 0.515 (0.513)	Data 0.001 (0.011)	Loss 4.5630 (4.6457)	Top-1 acc 18.359 (19.208)	Top-5 acc 39.062 (39.788)	lr 0.02913
Warmup Train [18][2880/3239]	Time 0.503 (0.513)	Data 0.001 (0.011)	Loss 4.6096 (4.6456)	Top-1 acc 19.922 (19.207)	Top-5 acc 40.234 (39.791)	lr 0.02913
Warmup Train [18][2890/3239]	Time 0.620 (0.513)	Data 0.001 (0.011)	Loss 4.6397 (4.6457)	Top-1 acc 21.094 (19.207)	Top-5 acc 39.453 (39.789)	lr 0.02912
Warmup Train [18][2900/3239]	Time 0.497 (0.513)	Data 0.001 (0.011)	Loss 4.8427 (4.6456)	Top-1 acc 16.797 (19.207)	Top-5 acc 37.500 (39.791)	lr 0.02911
Warmup Train [18][2910/3239]	Time 0.537 (0.513)	Data 0.001 (0.011)	Loss 4.5174 (4.6455)	Top-1 acc 21.875 (19.209)	Top-5 acc 44.141 (39.793)	lr 0.02911
Warmup Train [18][2920/3239]	Time 0.406 (0.513)	Data 0.001 (0.011)	Loss 4.8279 (4.6454)	Top-1 acc 15.234 (19.208)	Top-5 acc 37.109 (39.797)	lr 0.02910
Warmup Train [18][2930/3239]	Time 0.549 (0.513)	Data 0.001 (0.011)	Loss 4.6172 (4.6453)	Top-1 acc 16.406 (19.206)	Top-5 acc 37.109 (39.798)	lr 0.02910
Warmup Train [18][2940/3239]	Time 0.555 (0.513)	Data 0.001 (0.011)	Loss 4.5701 (4.6451)	Top-1 acc 21.094 (19.209)	Top-5 acc 43.359 (39.800)	lr 0.02909
Warmup Train [18][2950/3239]	Time 0.497 (0.513)	Data 0.001 (0.011)	Loss 4.5549 (4.6451)	Top-1 acc 18.750 (19.211)	Top-5 acc 38.281 (39.797)	lr 0.02908
Warmup Train [18][2960/3239]	Time 0.558 (0.513)	Data 0.001 (0.011)	Loss 4.5510 (4.6451)	Top-1 acc 26.172 (19.215)	Top-5 acc 44.531 (39.799)	lr 0.02908
Warmup Train [18][2970/3239]	Time 0.501 (0.513)	Data 0.001 (0.011)	Loss 4.5322 (4.6453)	Top-1 acc 21.094 (19.213)	Top-5 acc 40.625 (39.794)	lr 0.02907
Warmup Train [18][2980/3239]	Time 0.521 (0.513)	Data 0.001 (0.011)	Loss 4.6314 (4.6453)	Top-1 acc 21.875 (19.216)	Top-5 acc 39.453 (39.792)	lr 0.02907
Warmup Train [18][2990/3239]	Time 0.583 (0.513)	Data 0.001 (0.011)	Loss 4.5844 (4.6453)	Top-1 acc 20.312 (19.218)	Top-5 acc 43.359 (39.795)	lr 0.02906
Warmup Train [18][3000/3239]	Time 0.519 (0.513)	Data 0.001 (0.011)	Loss 4.5265 (4.6452)	Top-1 acc 21.484 (19.218)	Top-5 acc 44.922 (39.798)	lr 0.02905
Warmup Train [18][3010/3239]	Time 0.540 (0.513)	Data 0.001 (0.011)	Loss 4.7145 (4.6451)	Top-1 acc 12.109 (19.212)	Top-5 acc 39.062 (39.799)	lr 0.02905
Warmup Train [18][3020/3239]	Time 0.576 (0.513)	Data 0.001 (0.011)	Loss 4.5544 (4.6450)	Top-1 acc 19.531 (19.212)	Top-5 acc 45.703 (39.808)	lr 0.02904
Warmup Train [18][3030/3239]	Time 0.487 (0.513)	Data 0.001 (0.011)	Loss 4.6146 (4.6449)	Top-1 acc 17.188 (19.216)	Top-5 acc 40.234 (39.811)	lr 0.02904
Warmup Train [18][3040/3239]	Time 0.367 (0.513)	Data 0.001 (0.011)	Loss 4.6924 (4.6447)	Top-1 acc 20.312 (19.218)	Top-5 acc 39.062 (39.816)	lr 0.02903
Warmup Train [18][3050/3239]	Time 0.584 (0.513)	Data 0.001 (0.011)	Loss 4.5758 (4.6447)	Top-1 acc 19.531 (19.218)	Top-5 acc 39.453 (39.816)	lr 0.02902
Warmup Train [18][3060/3239]	Time 0.522 (0.513)	Data 0.001 (0.011)	Loss 4.6575 (4.6444)	Top-1 acc 17.969 (19.225)	Top-5 acc 37.109 (39.822)	lr 0.02902
Warmup Train [18][3070/3239]	Time 0.534 (0.513)	Data 0.001 (0.011)	Loss 4.4887 (4.6441)	Top-1 acc 19.531 (19.226)	Top-5 acc 40.234 (39.826)	lr 0.02901
Warmup Train [18][3080/3239]	Time 0.511 (0.513)	Data 0.001 (0.011)	Loss 4.7457 (4.6442)	Top-1 acc 20.703 (19.228)	Top-5 acc 39.844 (39.822)	lr 0.02901
Warmup Train [18][3090/3239]	Time 0.477 (0.513)	Data 0.001 (0.011)	Loss 4.7796 (4.6440)	Top-1 acc 19.141 (19.234)	Top-5 acc 36.328 (39.828)	lr 0.02900
Warmup Train [18][3100/3239]	Time 0.484 (0.513)	Data 0.001 (0.011)	Loss 4.4745 (4.6437)	Top-1 acc 21.484 (19.237)	Top-5 acc 41.797 (39.836)	lr 0.02899
Warmup Train [18][3110/3239]	Time 0.421 (0.513)	Data 0.002 (0.011)	Loss 4.4640 (4.6436)	Top-1 acc 21.094 (19.240)	Top-5 acc 42.578 (39.837)	lr 0.02899
Warmup Train [18][3120/3239]	Time 0.399 (0.513)	Data 0.001 (0.011)	Loss 4.4977 (4.6436)	Top-1 acc 25.000 (19.236)	Top-5 acc 43.750 (39.836)	lr 0.02898
Warmup Train [18][3130/3239]	Time 0.564 (0.513)	Data 0.001 (0.011)	Loss 4.6878 (4.6434)	Top-1 acc 18.750 (19.238)	Top-5 acc 38.672 (39.838)	lr 0.02898
Warmup Train [18][3140/3239]	Time 0.503 (0.513)	Data 0.001 (0.011)	Loss 4.6834 (4.6434)	Top-1 acc 18.750 (19.237)	Top-5 acc 39.062 (39.838)	lr 0.02897
Warmup Train [18][3150/3239]	Time 0.399 (0.512)	Data 0.001 (0.011)	Loss 4.6878 (4.6433)	Top-1 acc 19.531 (19.241)	Top-5 acc 39.062 (39.837)	lr 0.02896
Warmup Train [18][3160/3239]	Time 0.611 (0.512)	Data 0.001 (0.011)	Loss 4.5014 (4.6433)	Top-1 acc 23.047 (19.240)	Top-5 acc 44.922 (39.838)	lr 0.02896
Warmup Train [18][3170/3239]	Time 0.488 (0.512)	Data 0.001 (0.011)	Loss 4.5634 (4.6431)	Top-1 acc 19.141 (19.243)	Top-5 acc 44.141 (39.844)	lr 0.02895
Warmup Train [18][3180/3239]	Time 0.539 (0.512)	Data 0.000 (0.011)	Loss 4.5602 (4.6429)	Top-1 acc 22.656 (19.248)	Top-5 acc 41.406 (39.849)	lr 0.02895
Warmup Train [18][3190/3239]	Time 0.509 (0.512)	Data 0.000 (0.011)	Loss 4.5920 (4.6428)	Top-1 acc 20.312 (19.254)	Top-5 acc 38.672 (39.852)	lr 0.02894
Warmup Train [18][3200/3239]	Time 0.583 (0.512)	Data 0.000 (0.011)	Loss 4.5703 (4.6425)	Top-1 acc 19.531 (19.254)	Top-5 acc 41.797 (39.855)	lr 0.02893
Warmup Train [18][3210/3239]	Time 0.517 (0.512)	Data 0.000 (0.011)	Loss 4.5594 (4.6425)	Top-1 acc 25.000 (19.255)	Top-5 acc 40.625 (39.854)	lr 0.02893
Warmup Train [18][3220/3239]	Time 0.566 (0.512)	Data 0.000 (0.010)	Loss 4.6756 (4.6423)	Top-1 acc 22.266 (19.256)	Top-5 acc 38.672 (39.858)	lr 0.02892
Warmup Train [18][3230/3239]	Time 0.590 (0.512)	Data 0.000 (0.010)	Loss 4.5525 (4.6421)	Top-1 acc 23.047 (19.257)	Top-5 acc 40.625 (39.859)	lr 0.02892
Warmup Train [18][3239/3239]	Time 0.509 (0.512)	Data 0.000 (0.010)	Loss 4.6896 (4.6422)	Top-1 acc 22.222 (19.256)	Top-5 acc 37.037 (39.859)	lr 0.02891
==========Warmup Valid [18/40]	loss 3.673	top-1 acc 26.303	top-5 acc 49.869	Train top-1 19.256	top-5 39.859	flops: 442.4M
Warmup Train [19][0/3239]	Time 13.930 (13.930)	Data 12.193 (12.193)	Loss 4.6753 (4.6753)	Top-1 acc 22.266 (22.266)	Top-5 acc 42.578 (42.578)	lr 0.02891
Warmup Train [19][10/3239]	Time 0.463 (1.767)	Data 0.001 (1.111)	Loss 4.6867 (4.6470)	Top-1 acc 17.188 (20.028)	Top-5 acc 37.891 (39.027)	lr 0.02890
Warmup Train [19][20/3239]	Time 0.629 (1.177)	Data 0.001 (0.589)	Loss 4.4362 (4.6222)	Top-1 acc 25.000 (20.424)	Top-5 acc 46.875 (39.881)	lr 0.02890
Warmup Train [19][30/3239]	Time 0.585 (0.967)	Data 0.001 (0.400)	Loss 4.4962 (4.6213)	Top-1 acc 20.703 (20.161)	Top-5 acc 42.969 (39.806)	lr 0.02889
Warmup Train [19][40/3239]	Time 0.535 (0.853)	Data 0.001 (0.303)	Loss 4.5533 (4.6150)	Top-1 acc 21.875 (20.255)	Top-5 acc 40.234 (39.891)	lr 0.02889
Warmup Train [19][50/3239]	Time 0.523 (0.789)	Data 0.001 (0.245)	Loss 4.6805 (4.6141)	Top-1 acc 20.312 (20.259)	Top-5 acc 39.062 (39.936)	lr 0.02888
Warmup Train [19][60/3239]	Time 0.513 (0.742)	Data 0.001 (0.205)	Loss 4.8251 (4.6212)	Top-1 acc 14.453 (19.864)	Top-5 acc 35.547 (39.818)	lr 0.02887
Warmup Train [19][70/3239]	Time 0.499 (0.711)	Data 0.001 (0.177)	Loss 4.5526 (4.6128)	Top-1 acc 23.828 (20.059)	Top-5 acc 39.844 (40.086)	lr 0.02887
Warmup Train [19][80/3239]	Time 0.383 (0.683)	Data 0.001 (0.155)	Loss 4.5436 (4.6089)	Top-1 acc 16.797 (20.062)	Top-5 acc 39.453 (40.210)	lr 0.02886
Warmup Train [19][90/3239]	Time 0.474 (0.665)	Data 0.001 (0.140)	Loss 4.6191 (4.6085)	Top-1 acc 19.531 (20.046)	Top-5 acc 40.625 (40.217)	lr 0.02886
Warmup Train [19][100/3239]	Time 0.542 (0.651)	Data 0.001 (0.127)	Loss 4.5484 (4.6114)	Top-1 acc 21.094 (19.964)	Top-5 acc 38.281 (40.107)	lr 0.02885
Warmup Train [19][110/3239]	Time 0.751 (0.640)	Data 0.001 (0.116)	Loss 4.6928 (4.6139)	Top-1 acc 18.359 (19.869)	Top-5 acc 36.328 (40.182)	lr 0.02885
Warmup Train [19][120/3239]	Time 0.554 (0.630)	Data 0.001 (0.107)	Loss 4.3034 (4.6149)	Top-1 acc 24.219 (19.877)	Top-5 acc 46.094 (40.231)	lr 0.02884
Warmup Train [19][130/3239]	Time 0.655 (0.623)	Data 0.001 (0.099)	Loss 4.6655 (4.6179)	Top-1 acc 19.531 (19.806)	Top-5 acc 37.500 (40.222)	lr 0.02883
Warmup Train [19][140/3239]	Time 0.523 (0.615)	Data 0.001 (0.092)	Loss 4.5446 (4.6163)	Top-1 acc 23.438 (19.844)	Top-5 acc 42.578 (40.287)	lr 0.02883
Warmup Train [19][150/3239]	Time 0.530 (0.610)	Data 0.001 (0.086)	Loss 4.5862 (4.6170)	Top-1 acc 17.188 (19.728)	Top-5 acc 39.844 (40.141)	lr 0.02882
Warmup Train [19][160/3239]	Time 0.571 (0.605)	Data 0.001 (0.081)	Loss 4.4663 (4.6134)	Top-1 acc 19.922 (19.822)	Top-5 acc 43.359 (40.181)	lr 0.02882
Warmup Train [19][170/3239]	Time 0.628 (0.599)	Data 0.001 (0.076)	Loss 4.5811 (4.6160)	Top-1 acc 22.266 (19.792)	Top-5 acc 43.359 (40.141)	lr 0.02881
Warmup Train [19][180/3239]	Time 0.670 (0.594)	Data 0.001 (0.072)	Loss 4.6020 (4.6179)	Top-1 acc 19.141 (19.700)	Top-5 acc 43.750 (40.073)	lr 0.02880
Warmup Train [19][190/3239]	Time 0.476 (0.589)	Data 0.001 (0.069)	Loss 4.6570 (4.6161)	Top-1 acc 19.141 (19.711)	Top-5 acc 41.016 (40.126)	lr 0.02880
Warmup Train [19][200/3239]	Time 0.704 (0.585)	Data 0.001 (0.065)	Loss 4.5429 (4.6132)	Top-1 acc 18.359 (19.728)	Top-5 acc 42.969 (40.182)	lr 0.02879
Warmup Train [19][210/3239]	Time 0.349 (0.580)	Data 0.001 (0.062)	Loss 4.7641 (4.6145)	Top-1 acc 17.578 (19.726)	Top-5 acc 39.062 (40.195)	lr 0.02879
Warmup Train [19][220/3239]	Time 0.506 (0.578)	Data 0.001 (0.060)	Loss 4.6213 (4.6137)	Top-1 acc 18.750 (19.752)	Top-5 acc 45.703 (40.241)	lr 0.02878
Warmup Train [19][230/3239]	Time 0.466 (0.575)	Data 0.001 (0.057)	Loss 4.6372 (4.6131)	Top-1 acc 18.750 (19.771)	Top-5 acc 40.234 (40.267)	lr 0.02877
Warmup Train [19][240/3239]	Time 0.139 (0.571)	Data 0.001 (0.055)	Loss 4.5543 (4.6147)	Top-1 acc 19.531 (19.750)	Top-5 acc 39.062 (40.207)	lr 0.02877
Warmup Train [19][250/3239]	Time 0.459 (0.568)	Data 0.001 (0.054)	Loss 4.5164 (4.6133)	Top-1 acc 20.703 (19.769)	Top-5 acc 43.750 (40.266)	lr 0.02876
Warmup Train [19][260/3239]	Time 0.509 (0.566)	Data 0.001 (0.052)	Loss 4.5738 (4.6099)	Top-1 acc 21.484 (19.804)	Top-5 acc 42.188 (40.327)	lr 0.02876
Warmup Train [19][270/3239]	Time 0.496 (0.563)	Data 0.001 (0.050)	Loss 4.6498 (4.6071)	Top-1 acc 17.578 (19.841)	Top-5 acc 36.328 (40.417)	lr 0.02875
Warmup Train [19][280/3239]	Time 0.485 (0.560)	Data 0.001 (0.048)	Loss 4.7187 (4.6083)	Top-1 acc 20.312 (19.869)	Top-5 acc 41.016 (40.405)	lr 0.02874
Warmup Train [19][290/3239]	Time 0.460 (0.557)	Data 0.001 (0.047)	Loss 4.7316 (4.6070)	Top-1 acc 16.406 (19.878)	Top-5 acc 37.109 (40.437)	lr 0.02874
Warmup Train [19][300/3239]	Time 0.523 (0.556)	Data 0.001 (0.046)	Loss 4.6927 (4.6066)	Top-1 acc 17.969 (19.886)	Top-5 acc 39.844 (40.454)	lr 0.02873
Warmup Train [19][310/3239]	Time 0.431 (0.554)	Data 0.001 (0.045)	Loss 4.5966 (4.6041)	Top-1 acc 17.578 (19.929)	Top-5 acc 39.453 (40.535)	lr 0.02873
Warmup Train [19][320/3239]	Time 0.537 (0.553)	Data 0.001 (0.043)	Loss 4.6986 (4.6040)	Top-1 acc 20.312 (19.913)	Top-5 acc 37.500 (40.520)	lr 0.02872
Warmup Train [19][330/3239]	Time 0.503 (0.553)	Data 0.001 (0.042)	Loss 4.4860 (4.6037)	Top-1 acc 26.172 (19.943)	Top-5 acc 44.531 (40.548)	lr 0.02871
Warmup Train [19][340/3239]	Time 0.535 (0.552)	Data 0.001 (0.041)	Loss 4.6479 (4.6023)	Top-1 acc 19.922 (19.959)	Top-5 acc 37.109 (40.576)	lr 0.02871
Warmup Train [19][350/3239]	Time 0.473 (0.550)	Data 0.001 (0.040)	Loss 4.4347 (4.6029)	Top-1 acc 22.266 (19.920)	Top-5 acc 45.703 (40.572)	lr 0.02870
Warmup Train [19][360/3239]	Time 0.517 (0.549)	Data 0.001 (0.039)	Loss 4.5575 (4.6033)	Top-1 acc 21.875 (19.913)	Top-5 acc 43.359 (40.598)	lr 0.02870
Warmup Train [19][370/3239]	Time 0.453 (0.548)	Data 0.001 (0.038)	Loss 4.8449 (4.6053)	Top-1 acc 18.750 (19.898)	Top-5 acc 37.109 (40.563)	lr 0.02869
Warmup Train [19][380/3239]	Time 0.514 (0.547)	Data 0.001 (0.037)	Loss 4.5610 (4.6060)	Top-1 acc 20.312 (19.909)	Top-5 acc 40.234 (40.541)	lr 0.02868
Warmup Train [19][390/3239]	Time 0.335 (0.544)	Data 0.001 (0.036)	Loss 4.6621 (4.6079)	Top-1 acc 17.578 (19.880)	Top-5 acc 39.062 (40.527)	lr 0.02868
Warmup Train [19][400/3239]	Time 0.512 (0.544)	Data 0.001 (0.036)	Loss 4.5168 (4.6072)	Top-1 acc 18.750 (19.874)	Top-5 acc 42.188 (40.574)	lr 0.02867
Warmup Train [19][410/3239]	Time 0.447 (0.543)	Data 0.001 (0.035)	Loss 4.4008 (4.6062)	Top-1 acc 24.609 (19.905)	Top-5 acc 45.312 (40.586)	lr 0.02867
Warmup Train [19][420/3239]	Time 0.639 (0.542)	Data 0.001 (0.034)	Loss 4.7241 (4.6055)	Top-1 acc 17.188 (19.931)	Top-5 acc 37.500 (40.589)	lr 0.02866
Warmup Train [19][430/3239]	Time 0.658 (0.541)	Data 0.001 (0.033)	Loss 4.4779 (4.6043)	Top-1 acc 24.219 (19.928)	Top-5 acc 48.047 (40.631)	lr 0.02865
Warmup Train [19][440/3239]	Time 0.356 (0.540)	Data 0.001 (0.033)	Loss 4.5941 (4.6039)	Top-1 acc 18.359 (19.926)	Top-5 acc 39.062 (40.660)	lr 0.02865
Warmup Train [19][450/3239]	Time 0.661 (0.540)	Data 0.003 (0.032)	Loss 4.7767 (4.6035)	Top-1 acc 16.797 (19.931)	Top-5 acc 37.500 (40.676)	lr 0.02864
Warmup Train [19][460/3239]	Time 0.531 (0.539)	Data 0.001 (0.032)	Loss 4.5188 (4.6030)	Top-1 acc 17.578 (19.942)	Top-5 acc 41.406 (40.667)	lr 0.02864
Warmup Train [19][470/3239]	Time 0.561 (0.538)	Data 0.001 (0.031)	Loss 4.6573 (4.6030)	Top-1 acc 19.922 (19.953)	Top-5 acc 39.453 (40.681)	lr 0.02863
Warmup Train [19][480/3239]	Time 0.421 (0.537)	Data 0.001 (0.030)	Loss 4.5327 (4.6024)	Top-1 acc 23.047 (19.967)	Top-5 acc 40.234 (40.676)	lr 0.02862
Warmup Train [19][490/3239]	Time 0.558 (0.537)	Data 0.001 (0.030)	Loss 4.4811 (4.6020)	Top-1 acc 22.266 (19.985)	Top-5 acc 44.922 (40.696)	lr 0.02862
Warmup Train [19][500/3239]	Time 0.593 (0.537)	Data 0.002 (0.030)	Loss 4.3915 (4.6008)	Top-1 acc 25.391 (20.019)	Top-5 acc 44.922 (40.707)	lr 0.02861
Warmup Train [19][510/3239]	Time 0.484 (0.537)	Data 0.001 (0.029)	Loss 4.4549 (4.6005)	Top-1 acc 25.000 (20.027)	Top-5 acc 41.016 (40.710)	lr 0.02861
Warmup Train [19][520/3239]	Time 0.285 (0.536)	Data 0.001 (0.028)	Loss 4.8243 (4.6003)	Top-1 acc 16.797 (20.031)	Top-5 acc 37.500 (40.696)	lr 0.02860
Warmup Train [19][530/3239]	Time 0.444 (0.535)	Data 0.001 (0.028)	Loss 4.5547 (4.5996)	Top-1 acc 20.312 (20.029)	Top-5 acc 42.578 (40.722)	lr 0.02859
Warmup Train [19][540/3239]	Time 0.524 (0.535)	Data 0.049 (0.028)	Loss 4.4954 (4.5997)	Top-1 acc 21.875 (20.025)	Top-5 acc 46.094 (40.720)	lr 0.02859
Warmup Train [19][550/3239]	Time 0.277 (0.533)	Data 0.001 (0.027)	Loss 4.5006 (4.5988)	Top-1 acc 21.484 (20.045)	Top-5 acc 44.141 (40.748)	lr 0.02858
Warmup Train [19][560/3239]	Time 0.454 (0.533)	Data 0.001 (0.027)	Loss 4.7665 (4.5985)	Top-1 acc 19.531 (20.052)	Top-5 acc 39.453 (40.754)	lr 0.02858
Warmup Train [19][570/3239]	Time 0.518 (0.531)	Data 0.001 (0.027)	Loss 4.5334 (4.5982)	Top-1 acc 19.141 (20.046)	Top-5 acc 40.625 (40.771)	lr 0.02857
Warmup Train [19][580/3239]	Time 0.437 (0.531)	Data 0.001 (0.027)	Loss 4.6127 (4.5978)	Top-1 acc 19.141 (20.063)	Top-5 acc 41.797 (40.788)	lr 0.02856
Warmup Train [19][590/3239]	Time 0.559 (0.531)	Data 0.001 (0.026)	Loss 4.7033 (4.5979)	Top-1 acc 18.750 (20.073)	Top-5 acc 37.109 (40.803)	lr 0.02856
Warmup Train [19][600/3239]	Time 0.387 (0.530)	Data 0.002 (0.026)	Loss 4.6544 (4.5987)	Top-1 acc 19.141 (20.064)	Top-5 acc 39.062 (40.774)	lr 0.02855
Warmup Train [19][610/3239]	Time 0.473 (0.530)	Data 0.001 (0.026)	Loss 4.6244 (4.5983)	Top-1 acc 17.578 (20.080)	Top-5 acc 41.406 (40.778)	lr 0.02855
Warmup Train [19][620/3239]	Time 0.632 (0.530)	Data 0.001 (0.025)	Loss 4.6118 (4.5985)	Top-1 acc 19.531 (20.055)	Top-5 acc 37.891 (40.760)	lr 0.02854
Warmup Train [19][630/3239]	Time 0.542 (0.530)	Data 0.001 (0.025)	Loss 4.4982 (4.5981)	Top-1 acc 23.438 (20.057)	Top-5 acc 42.578 (40.775)	lr 0.02853
Warmup Train [19][640/3239]	Time 0.396 (0.530)	Data 0.002 (0.025)	Loss 4.6935 (4.5986)	Top-1 acc 19.922 (20.064)	Top-5 acc 36.328 (40.764)	lr 0.02853
Warmup Train [19][650/3239]	Time 0.784 (0.530)	Data 0.001 (0.025)	Loss 4.4990 (4.5988)	Top-1 acc 21.094 (20.045)	Top-5 acc 41.406 (40.771)	lr 0.02852
Warmup Train [19][660/3239]	Time 0.617 (0.530)	Data 0.001 (0.024)	Loss 4.4731 (4.5990)	Top-1 acc 20.703 (20.031)	Top-5 acc 44.141 (40.768)	lr 0.02852
Warmup Train [19][670/3239]	Time 0.491 (0.530)	Data 0.001 (0.024)	Loss 4.7634 (4.5996)	Top-1 acc 15.234 (20.020)	Top-5 acc 37.500 (40.755)	lr 0.02851
Warmup Train [19][680/3239]	Time 0.507 (0.530)	Data 0.001 (0.024)	Loss 4.6423 (4.5994)	Top-1 acc 19.531 (20.029)	Top-5 acc 39.453 (40.770)	lr 0.02850
Warmup Train [19][690/3239]	Time 0.466 (0.529)	Data 0.001 (0.023)	Loss 4.4847 (4.5991)	Top-1 acc 17.578 (20.017)	Top-5 acc 45.312 (40.778)	lr 0.02850
Warmup Train [19][700/3239]	Time 0.388 (0.529)	Data 0.001 (0.023)	Loss 4.4853 (4.6000)	Top-1 acc 22.656 (19.998)	Top-5 acc 44.141 (40.751)	lr 0.02849
Warmup Train [19][710/3239]	Time 0.550 (0.529)	Data 0.001 (0.023)	Loss 4.6606 (4.6000)	Top-1 acc 16.797 (19.996)	Top-5 acc 40.234 (40.754)	lr 0.02849
Warmup Train [19][720/3239]	Time 0.525 (0.529)	Data 0.001 (0.023)	Loss 4.5024 (4.5995)	Top-1 acc 25.391 (20.014)	Top-5 acc 42.188 (40.759)	lr 0.02848
Warmup Train [19][730/3239]	Time 0.453 (0.529)	Data 0.001 (0.022)	Loss 4.7586 (4.5990)	Top-1 acc 17.188 (20.011)	Top-5 acc 36.328 (40.764)	lr 0.02847
Warmup Train [19][740/3239]	Time 0.596 (0.529)	Data 0.001 (0.022)	Loss 4.3242 (4.5980)	Top-1 acc 21.484 (20.032)	Top-5 acc 47.656 (40.792)	lr 0.02847
Warmup Train [19][750/3239]	Time 0.657 (0.529)	Data 0.001 (0.022)	Loss 4.5307 (4.5979)	Top-1 acc 24.219 (20.039)	Top-5 acc 43.359 (40.792)	lr 0.02846
Warmup Train [19][760/3239]	Time 0.542 (0.529)	Data 0.001 (0.022)	Loss 4.7341 (4.5981)	Top-1 acc 16.797 (20.045)	Top-5 acc 39.062 (40.796)	lr 0.02846
Warmup Train [19][770/3239]	Time 0.420 (0.528)	Data 0.001 (0.022)	Loss 4.5791 (4.5983)	Top-1 acc 21.484 (20.059)	Top-5 acc 41.016 (40.790)	lr 0.02845
Warmup Train [19][780/3239]	Time 0.555 (0.528)	Data 0.001 (0.021)	Loss 4.5344 (4.5981)	Top-1 acc 21.875 (20.070)	Top-5 acc 39.453 (40.811)	lr 0.02844
Warmup Train [19][790/3239]	Time 0.512 (0.528)	Data 0.001 (0.021)	Loss 4.5918 (4.5978)	Top-1 acc 19.531 (20.072)	Top-5 acc 39.844 (40.823)	lr 0.02844
Warmup Train [19][800/3239]	Time 0.436 (0.528)	Data 0.001 (0.021)	Loss 4.5781 (4.5966)	Top-1 acc 19.922 (20.084)	Top-5 acc 43.750 (40.861)	lr 0.02843
Warmup Train [19][810/3239]	Time 0.456 (0.528)	Data 0.001 (0.021)	Loss 4.8998 (4.5970)	Top-1 acc 16.797 (20.086)	Top-5 acc 37.109 (40.861)	lr 0.02843
Warmup Train [19][820/3239]	Time 0.461 (0.527)	Data 0.001 (0.020)	Loss 4.5421 (4.5966)	Top-1 acc 19.922 (20.097)	Top-5 acc 40.234 (40.865)	lr 0.02842
Warmup Train [19][830/3239]	Time 0.454 (0.527)	Data 0.001 (0.020)	Loss 4.6195 (4.5965)	Top-1 acc 21.094 (20.098)	Top-5 acc 39.062 (40.868)	lr 0.02841
Warmup Train [19][840/3239]	Time 0.267 (0.526)	Data 0.001 (0.020)	Loss 4.7415 (4.5965)	Top-1 acc 15.625 (20.096)	Top-5 acc 37.109 (40.879)	lr 0.02841
Warmup Train [19][850/3239]	Time 0.449 (0.525)	Data 0.001 (0.020)	Loss 4.6390 (4.5961)	Top-1 acc 19.922 (20.104)	Top-5 acc 36.719 (40.878)	lr 0.02840
Warmup Train [19][860/3239]	Time 0.549 (0.525)	Data 0.001 (0.020)	Loss 4.7325 (4.5962)	Top-1 acc 16.406 (20.095)	Top-5 acc 39.453 (40.875)	lr 0.02840
Warmup Train [19][870/3239]	Time 0.446 (0.525)	Data 0.001 (0.020)	Loss 4.4458 (4.5953)	Top-1 acc 21.875 (20.099)	Top-5 acc 46.875 (40.899)	lr 0.02839
Warmup Train [19][880/3239]	Time 0.726 (0.525)	Data 0.001 (0.020)	Loss 4.6882 (4.5951)	Top-1 acc 17.578 (20.104)	Top-5 acc 39.062 (40.903)	lr 0.02838
Warmup Train [19][890/3239]	Time 0.543 (0.525)	Data 0.001 (0.019)	Loss 4.5279 (4.5945)	Top-1 acc 23.438 (20.106)	Top-5 acc 44.141 (40.917)	lr 0.02838
Warmup Train [19][900/3239]	Time 0.692 (0.525)	Data 0.001 (0.019)	Loss 4.6185 (4.5944)	Top-1 acc 21.484 (20.117)	Top-5 acc 42.578 (40.927)	lr 0.02837
Warmup Train [19][910/3239]	Time 0.438 (0.524)	Data 0.001 (0.019)	Loss 4.6028 (4.5944)	Top-1 acc 19.531 (20.114)	Top-5 acc 41.797 (40.938)	lr 0.02837
Warmup Train [19][920/3239]	Time 0.507 (0.524)	Data 0.001 (0.019)	Loss 4.5962 (4.5946)	Top-1 acc 23.828 (20.120)	Top-5 acc 38.281 (40.928)	lr 0.02836
Warmup Train [19][930/3239]	Time 0.530 (0.524)	Data 0.001 (0.019)	Loss 4.5006 (4.5947)	Top-1 acc 25.000 (20.123)	Top-5 acc 42.188 (40.922)	lr 0.02835
Warmup Train [19][940/3239]	Time 0.534 (0.524)	Data 0.001 (0.019)	Loss 4.7057 (4.5948)	Top-1 acc 16.406 (20.117)	Top-5 acc 37.109 (40.915)	lr 0.02835
Warmup Train [19][950/3239]	Time 0.505 (0.524)	Data 0.001 (0.019)	Loss 4.6069 (4.5945)	Top-1 acc 18.359 (20.120)	Top-5 acc 38.281 (40.920)	lr 0.02834
Warmup Train [19][960/3239]	Time 0.515 (0.524)	Data 0.001 (0.018)	Loss 4.3371 (4.5935)	Top-1 acc 21.875 (20.143)	Top-5 acc 46.484 (40.938)	lr 0.02834
Warmup Train [19][970/3239]	Time 0.450 (0.524)	Data 0.001 (0.018)	Loss 4.6855 (4.5929)	Top-1 acc 19.141 (20.150)	Top-5 acc 38.672 (40.957)	lr 0.02833
Warmup Train [19][980/3239]	Time 0.648 (0.524)	Data 0.001 (0.018)	Loss 4.5734 (4.5927)	Top-1 acc 19.922 (20.145)	Top-5 acc 43.359 (40.970)	lr 0.02832
Warmup Train [19][990/3239]	Time 0.659 (0.523)	Data 0.001 (0.018)	Loss 4.6763 (4.5929)	Top-1 acc 22.266 (20.159)	Top-5 acc 40.234 (40.965)	lr 0.02832
Warmup Train [19][1000/3239]	Time 0.540 (0.523)	Data 0.001 (0.018)	Loss 4.7044 (4.5933)	Top-1 acc 18.750 (20.153)	Top-5 acc 35.547 (40.959)	lr 0.02831
Warmup Train [19][1010/3239]	Time 0.547 (0.524)	Data 0.001 (0.018)	Loss 4.3597 (4.5924)	Top-1 acc 23.438 (20.161)	Top-5 acc 47.656 (40.984)	lr 0.02831
Warmup Train [19][1020/3239]	Time 0.530 (0.523)	Data 0.001 (0.017)	Loss 4.6266 (4.5922)	Top-1 acc 21.094 (20.156)	Top-5 acc 37.891 (40.984)	lr 0.02830
Warmup Train [19][1030/3239]	Time 0.513 (0.523)	Data 0.001 (0.017)	Loss 4.7629 (4.5919)	Top-1 acc 17.969 (20.167)	Top-5 acc 36.719 (40.994)	lr 0.02829
Warmup Train [19][1040/3239]	Time 0.515 (0.523)	Data 0.001 (0.017)	Loss 4.3753 (4.5919)	Top-1 acc 23.047 (20.163)	Top-5 acc 49.219 (40.993)	lr 0.02829
Warmup Train [19][1050/3239]	Time 0.685 (0.523)	Data 0.001 (0.017)	Loss 4.6199 (4.5916)	Top-1 acc 19.531 (20.167)	Top-5 acc 40.625 (41.004)	lr 0.02828
Warmup Train [19][1060/3239]	Time 0.571 (0.523)	Data 0.001 (0.017)	Loss 4.6396 (4.5910)	Top-1 acc 19.141 (20.178)	Top-5 acc 41.406 (41.023)	lr 0.02828
Warmup Train [19][1070/3239]	Time 0.564 (0.523)	Data 0.001 (0.017)	Loss 4.5876 (4.5908)	Top-1 acc 21.875 (20.193)	Top-5 acc 38.672 (41.036)	lr 0.02827
Warmup Train [19][1080/3239]	Time 0.462 (0.523)	Data 0.001 (0.017)	Loss 4.5538 (4.5908)	Top-1 acc 21.875 (20.186)	Top-5 acc 38.281 (41.033)	lr 0.02826
Warmup Train [19][1090/3239]	Time 0.471 (0.523)	Data 0.001 (0.017)	Loss 4.4249 (4.5908)	Top-1 acc 23.438 (20.193)	Top-5 acc 48.828 (41.036)	lr 0.02826
Warmup Train [19][1100/3239]	Time 0.480 (0.522)	Data 0.001 (0.016)	Loss 4.5613 (4.5904)	Top-1 acc 20.312 (20.194)	Top-5 acc 41.406 (41.043)	lr 0.02825
Warmup Train [19][1110/3239]	Time 0.448 (0.522)	Data 0.001 (0.016)	Loss 4.5139 (4.5907)	Top-1 acc 21.875 (20.192)	Top-5 acc 44.141 (41.035)	lr 0.02825
Warmup Train [19][1120/3239]	Time 0.363 (0.521)	Data 0.001 (0.016)	Loss 4.5379 (4.5910)	Top-1 acc 22.266 (20.182)	Top-5 acc 42.969 (41.032)	lr 0.02824
Warmup Train [19][1130/3239]	Time 0.444 (0.521)	Data 0.001 (0.016)	Loss 4.8303 (4.5913)	Top-1 acc 16.406 (20.174)	Top-5 acc 35.156 (41.019)	lr 0.02823
Warmup Train [19][1140/3239]	Time 0.470 (0.521)	Data 0.001 (0.016)	Loss 4.5662 (4.5912)	Top-1 acc 17.188 (20.170)	Top-5 acc 42.969 (41.016)	lr 0.02823
Warmup Train [19][1150/3239]	Time 0.422 (0.521)	Data 0.001 (0.016)	Loss 4.7570 (4.5910)	Top-1 acc 18.750 (20.172)	Top-5 acc 34.766 (41.010)	lr 0.02822
Warmup Train [19][1160/3239]	Time 0.376 (0.521)	Data 0.001 (0.016)	Loss 4.7743 (4.5912)	Top-1 acc 19.141 (20.172)	Top-5 acc 35.547 (41.005)	lr 0.02822
Warmup Train [19][1170/3239]	Time 0.530 (0.521)	Data 0.001 (0.016)	Loss 4.4580 (4.5913)	Top-1 acc 22.656 (20.171)	Top-5 acc 44.531 (41.001)	lr 0.02821
Warmup Train [19][1180/3239]	Time 0.545 (0.521)	Data 0.001 (0.016)	Loss 4.6538 (4.5908)	Top-1 acc 18.359 (20.176)	Top-5 acc 38.672 (41.014)	lr 0.02820
Warmup Train [19][1190/3239]	Time 0.635 (0.521)	Data 0.001 (0.016)	Loss 4.8422 (4.5915)	Top-1 acc 14.062 (20.161)	Top-5 acc 33.984 (40.999)	lr 0.02820
Warmup Train [19][1200/3239]	Time 0.569 (0.521)	Data 0.001 (0.016)	Loss 4.4127 (4.5914)	Top-1 acc 19.141 (20.157)	Top-5 acc 42.578 (40.996)	lr 0.02819
Warmup Train [19][1210/3239]	Time 0.463 (0.521)	Data 0.001 (0.016)	Loss 4.5083 (4.5911)	Top-1 acc 21.875 (20.164)	Top-5 acc 45.312 (41.014)	lr 0.02819
Warmup Train [19][1220/3239]	Time 0.391 (0.520)	Data 0.001 (0.015)	Loss 4.6796 (4.5913)	Top-1 acc 21.484 (20.159)	Top-5 acc 38.281 (41.014)	lr 0.02818
Warmup Train [19][1230/3239]	Time 0.473 (0.520)	Data 0.001 (0.015)	Loss 4.7947 (4.5915)	Top-1 acc 20.312 (20.163)	Top-5 acc 37.109 (41.012)	lr 0.02817
Warmup Train [19][1240/3239]	Time 0.456 (0.520)	Data 0.001 (0.015)	Loss 4.7963 (4.5915)	Top-1 acc 21.875 (20.162)	Top-5 acc 35.547 (41.016)	lr 0.02817
Warmup Train [19][1250/3239]	Time 0.555 (0.520)	Data 0.001 (0.015)	Loss 4.3382 (4.5911)	Top-1 acc 29.297 (20.171)	Top-5 acc 47.266 (41.027)	lr 0.02816
Warmup Train [19][1260/3239]	Time 0.509 (0.519)	Data 0.001 (0.015)	Loss 4.5971 (4.5914)	Top-1 acc 22.266 (20.160)	Top-5 acc 42.188 (41.019)	lr 0.02815
Warmup Train [19][1270/3239]	Time 0.443 (0.519)	Data 0.001 (0.015)	Loss 4.6622 (4.5913)	Top-1 acc 16.797 (20.154)	Top-5 acc 41.016 (41.018)	lr 0.02815
Warmup Train [19][1280/3239]	Time 0.420 (0.519)	Data 0.001 (0.015)	Loss 4.5520 (4.5913)	Top-1 acc 18.359 (20.148)	Top-5 acc 43.750 (41.021)	lr 0.02814
Warmup Train [19][1290/3239]	Time 0.390 (0.519)	Data 0.001 (0.015)	Loss 4.4321 (4.5909)	Top-1 acc 23.828 (20.151)	Top-5 acc 41.016 (41.028)	lr 0.02814
Warmup Train [19][1300/3239]	Time 0.487 (0.519)	Data 0.001 (0.015)	Loss 4.5372 (4.5907)	Top-1 acc 21.094 (20.157)	Top-5 acc 42.188 (41.026)	lr 0.02813
Warmup Train [19][1310/3239]	Time 0.519 (0.519)	Data 0.001 (0.015)	Loss 4.7556 (4.5908)	Top-1 acc 18.359 (20.149)	Top-5 acc 39.062 (41.026)	lr 0.02812
Warmup Train [19][1320/3239]	Time 0.549 (0.519)	Data 0.001 (0.015)	Loss 4.6293 (4.5909)	Top-1 acc 17.969 (20.145)	Top-5 acc 41.016 (41.030)	lr 0.02812
Warmup Train [19][1330/3239]	Time 0.559 (0.519)	Data 0.001 (0.015)	Loss 4.3922 (4.5906)	Top-1 acc 26.172 (20.149)	Top-5 acc 45.312 (41.038)	lr 0.02811
Warmup Train [19][1340/3239]	Time 0.479 (0.519)	Data 0.001 (0.015)	Loss 4.6982 (4.5907)	Top-1 acc 15.625 (20.144)	Top-5 acc 36.719 (41.033)	lr 0.02811
Warmup Train [19][1350/3239]	Time 0.499 (0.519)	Data 0.001 (0.015)	Loss 4.4495 (4.5905)	Top-1 acc 21.094 (20.143)	Top-5 acc 44.922 (41.047)	lr 0.02810
Warmup Train [19][1360/3239]	Time 0.503 (0.519)	Data 0.001 (0.015)	Loss 4.6093 (4.5901)	Top-1 acc 17.188 (20.149)	Top-5 acc 42.578 (41.058)	lr 0.02809
Warmup Train [19][1370/3239]	Time 0.470 (0.519)	Data 0.001 (0.015)	Loss 4.5152 (4.5900)	Top-1 acc 18.750 (20.150)	Top-5 acc 42.578 (41.060)	lr 0.02809
Warmup Train [19][1380/3239]	Time 0.552 (0.518)	Data 0.001 (0.014)	Loss 4.4190 (4.5898)	Top-1 acc 22.656 (20.147)	Top-5 acc 45.703 (41.066)	lr 0.02808
Warmup Train [19][1390/3239]	Time 0.493 (0.518)	Data 0.001 (0.014)	Loss 4.6265 (4.5897)	Top-1 acc 19.922 (20.148)	Top-5 acc 39.062 (41.070)	lr 0.02808
Warmup Train [19][1400/3239]	Time 0.171 (0.518)	Data 0.001 (0.014)	Loss 4.5173 (4.5893)	Top-1 acc 21.875 (20.150)	Top-5 acc 45.312 (41.083)	lr 0.02807
Warmup Train [19][1410/3239]	Time 0.532 (0.518)	Data 0.001 (0.014)	Loss 4.4651 (4.5888)	Top-1 acc 21.094 (20.150)	Top-5 acc 46.484 (41.096)	lr 0.02806
Warmup Train [19][1420/3239]	Time 0.566 (0.518)	Data 0.001 (0.014)	Loss 4.5485 (4.5889)	Top-1 acc 18.359 (20.149)	Top-5 acc 42.188 (41.090)	lr 0.02806
Warmup Train [19][1430/3239]	Time 0.590 (0.517)	Data 0.001 (0.014)	Loss 4.4414 (4.5886)	Top-1 acc 23.047 (20.151)	Top-5 acc 44.531 (41.093)	lr 0.02805
Warmup Train [19][1440/3239]	Time 0.518 (0.518)	Data 0.001 (0.014)	Loss 4.4943 (4.5886)	Top-1 acc 20.703 (20.142)	Top-5 acc 46.484 (41.095)	lr 0.02805
Warmup Train [19][1450/3239]	Time 0.537 (0.517)	Data 0.001 (0.014)	Loss 4.4823 (4.5881)	Top-1 acc 21.875 (20.152)	Top-5 acc 46.875 (41.104)	lr 0.02804
Warmup Train [19][1460/3239]	Time 0.451 (0.517)	Data 0.001 (0.014)	Loss 4.7247 (4.5882)	Top-1 acc 14.844 (20.137)	Top-5 acc 37.500 (41.104)	lr 0.02803
Warmup Train [19][1470/3239]	Time 0.334 (0.518)	Data 0.001 (0.014)	Loss 4.5831 (4.5880)	Top-1 acc 19.141 (20.143)	Top-5 acc 40.625 (41.108)	lr 0.02803
Warmup Train [19][1480/3239]	Time 0.499 (0.518)	Data 0.001 (0.014)	Loss 4.5226 (4.5881)	Top-1 acc 22.266 (20.138)	Top-5 acc 43.359 (41.105)	lr 0.02802
Warmup Train [19][1490/3239]	Time 0.339 (0.518)	Data 0.001 (0.014)	Loss 4.4505 (4.5881)	Top-1 acc 26.172 (20.142)	Top-5 acc 45.312 (41.108)	lr 0.02802
Warmup Train [19][1500/3239]	Time 0.499 (0.518)	Data 0.001 (0.014)	Loss 4.7502 (4.5881)	Top-1 acc 17.969 (20.139)	Top-5 acc 41.016 (41.104)	lr 0.02801
Warmup Train [19][1510/3239]	Time 0.562 (0.518)	Data 0.001 (0.014)	Loss 4.6803 (4.5878)	Top-1 acc 19.922 (20.151)	Top-5 acc 37.500 (41.112)	lr 0.02800
Warmup Train [19][1520/3239]	Time 0.576 (0.518)	Data 0.001 (0.014)	Loss 4.5437 (4.5877)	Top-1 acc 21.484 (20.153)	Top-5 acc 42.969 (41.121)	lr 0.02800
Warmup Train [19][1530/3239]	Time 0.522 (0.518)	Data 0.001 (0.014)	Loss 4.5458 (4.5875)	Top-1 acc 20.703 (20.161)	Top-5 acc 43.750 (41.129)	lr 0.02799
Warmup Train [19][1540/3239]	Time 0.591 (0.518)	Data 0.001 (0.014)	Loss 4.6130 (4.5874)	Top-1 acc 21.484 (20.161)	Top-5 acc 44.531 (41.134)	lr 0.02799
Warmup Train [19][1550/3239]	Time 0.469 (0.518)	Data 0.001 (0.014)	Loss 4.6184 (4.5873)	Top-1 acc 18.359 (20.169)	Top-5 acc 41.016 (41.141)	lr 0.02798
Warmup Train [19][1560/3239]	Time 0.543 (0.518)	Data 0.001 (0.014)	Loss 4.6700 (4.5871)	Top-1 acc 17.188 (20.176)	Top-5 acc 39.844 (41.149)	lr 0.02797
Warmup Train [19][1570/3239]	Time 0.647 (0.518)	Data 0.001 (0.014)	Loss 4.6770 (4.5870)	Top-1 acc 19.531 (20.178)	Top-5 acc 40.625 (41.155)	lr 0.02797
Warmup Train [19][1580/3239]	Time 0.491 (0.518)	Data 0.001 (0.014)	Loss 4.5135 (4.5871)	Top-1 acc 19.922 (20.174)	Top-5 acc 44.922 (41.154)	lr 0.02796
Warmup Train [19][1590/3239]	Time 0.395 (0.518)	Data 0.001 (0.014)	Loss 4.4820 (4.5871)	Top-1 acc 20.312 (20.174)	Top-5 acc 41.406 (41.150)	lr 0.02796
Warmup Train [19][1600/3239]	Time 0.630 (0.518)	Data 0.001 (0.014)	Loss 4.5693 (4.5871)	Top-1 acc 24.219 (20.176)	Top-5 acc 43.750 (41.153)	lr 0.02795
Warmup Train [19][1610/3239]	Time 0.545 (0.518)	Data 0.002 (0.014)	Loss 4.3934 (4.5870)	Top-1 acc 25.781 (20.179)	Top-5 acc 45.312 (41.154)	lr 0.02794
Warmup Train [19][1620/3239]	Time 0.687 (0.518)	Data 0.001 (0.013)	Loss 4.6339 (4.5867)	Top-1 acc 17.188 (20.183)	Top-5 acc 38.672 (41.159)	lr 0.02794
Warmup Train [19][1630/3239]	Time 0.528 (0.518)	Data 0.001 (0.013)	Loss 4.6395 (4.5868)	Top-1 acc 16.016 (20.182)	Top-5 acc 38.672 (41.162)	lr 0.02793
Warmup Train [19][1640/3239]	Time 0.469 (0.518)	Data 0.001 (0.013)	Loss 4.5110 (4.5866)	Top-1 acc 23.438 (20.191)	Top-5 acc 43.750 (41.165)	lr 0.02793
Warmup Train [19][1650/3239]	Time 0.588 (0.518)	Data 0.001 (0.013)	Loss 4.5584 (4.5870)	Top-1 acc 21.484 (20.184)	Top-5 acc 43.359 (41.163)	lr 0.02792
Warmup Train [19][1660/3239]	Time 0.582 (0.517)	Data 0.001 (0.013)	Loss 4.6668 (4.5869)	Top-1 acc 19.531 (20.188)	Top-5 acc 39.844 (41.161)	lr 0.02791
Warmup Train [19][1670/3239]	Time 0.536 (0.517)	Data 0.001 (0.013)	Loss 4.5309 (4.5869)	Top-1 acc 19.922 (20.191)	Top-5 acc 40.625 (41.166)	lr 0.02791
Warmup Train [19][1680/3239]	Time 0.437 (0.517)	Data 0.001 (0.013)	Loss 4.5373 (4.5866)	Top-1 acc 21.484 (20.192)	Top-5 acc 44.141 (41.169)	lr 0.02790
Warmup Train [19][1690/3239]	Time 0.536 (0.517)	Data 0.001 (0.013)	Loss 4.4421 (4.5865)	Top-1 acc 24.219 (20.191)	Top-5 acc 41.797 (41.171)	lr 0.02790
Warmup Train [19][1700/3239]	Time 0.561 (0.517)	Data 0.001 (0.013)	Loss 4.5326 (4.5866)	Top-1 acc 21.875 (20.197)	Top-5 acc 42.969 (41.175)	lr 0.02789
Warmup Train [19][1710/3239]	Time 0.612 (0.517)	Data 0.001 (0.013)	Loss 4.7568 (4.5867)	Top-1 acc 19.531 (20.191)	Top-5 acc 35.938 (41.170)	lr 0.02788
Warmup Train [19][1720/3239]	Time 0.655 (0.517)	Data 0.001 (0.013)	Loss 4.4578 (4.5865)	Top-1 acc 21.875 (20.198)	Top-5 acc 45.312 (41.175)	lr 0.02788
Warmup Train [19][1730/3239]	Time 0.428 (0.517)	Data 0.001 (0.013)	Loss 4.6855 (4.5865)	Top-1 acc 18.750 (20.194)	Top-5 acc 37.500 (41.172)	lr 0.02787
Warmup Train [19][1740/3239]	Time 0.503 (0.517)	Data 0.001 (0.013)	Loss 4.6659 (4.5867)	Top-1 acc 20.312 (20.192)	Top-5 acc 39.844 (41.164)	lr 0.02787
Warmup Train [19][1750/3239]	Time 0.591 (0.517)	Data 0.001 (0.013)	Loss 4.6357 (4.5866)	Top-1 acc 22.656 (20.198)	Top-5 acc 46.094 (41.171)	lr 0.02786
Warmup Train [19][1760/3239]	Time 0.527 (0.517)	Data 0.001 (0.013)	Loss 4.5805 (4.5864)	Top-1 acc 19.141 (20.195)	Top-5 acc 39.844 (41.171)	lr 0.02785
Warmup Train [19][1770/3239]	Time 0.470 (0.517)	Data 0.001 (0.013)	Loss 4.5622 (4.5862)	Top-1 acc 21.484 (20.198)	Top-5 acc 37.891 (41.172)	lr 0.02785
Warmup Train [19][1780/3239]	Time 0.568 (0.517)	Data 0.001 (0.013)	Loss 4.7807 (4.5861)	Top-1 acc 15.234 (20.194)	Top-5 acc 36.328 (41.169)	lr 0.02784
Warmup Train [19][1790/3239]	Time 0.510 (0.517)	Data 0.001 (0.013)	Loss 4.7943 (4.5862)	Top-1 acc 20.703 (20.201)	Top-5 acc 36.719 (41.167)	lr 0.02784
Warmup Train [19][1800/3239]	Time 0.544 (0.517)	Data 0.001 (0.013)	Loss 4.6562 (4.5861)	Top-1 acc 17.969 (20.206)	Top-5 acc 37.500 (41.171)	lr 0.02783
Warmup Train [19][1810/3239]	Time 0.592 (0.517)	Data 0.001 (0.012)	Loss 4.6774 (4.5858)	Top-1 acc 15.625 (20.207)	Top-5 acc 39.844 (41.176)	lr 0.02782
Warmup Train [19][1820/3239]	Time 0.376 (0.517)	Data 0.002 (0.012)	Loss 4.6390 (4.5857)	Top-1 acc 18.359 (20.208)	Top-5 acc 39.453 (41.187)	lr 0.02782
Warmup Train [19][1830/3239]	Time 0.509 (0.517)	Data 0.001 (0.012)	Loss 4.5332 (4.5858)	Top-1 acc 21.484 (20.203)	Top-5 acc 43.359 (41.181)	lr 0.02781
Warmup Train [19][1840/3239]	Time 0.481 (0.517)	Data 0.001 (0.012)	Loss 4.6920 (4.5859)	Top-1 acc 18.750 (20.201)	Top-5 acc 39.844 (41.181)	lr 0.02781
Warmup Train [19][1850/3239]	Time 0.586 (0.517)	Data 0.001 (0.012)	Loss 4.7533 (4.5857)	Top-1 acc 19.141 (20.200)	Top-5 acc 38.672 (41.185)	lr 0.02780
Warmup Train [19][1860/3239]	Time 0.525 (0.517)	Data 0.001 (0.012)	Loss 4.6425 (4.5858)	Top-1 acc 23.438 (20.206)	Top-5 acc 40.625 (41.189)	lr 0.02779
Warmup Train [19][1870/3239]	Time 0.353 (0.517)	Data 0.001 (0.012)	Loss 4.7978 (4.5859)	Top-1 acc 17.188 (20.201)	Top-5 acc 38.281 (41.187)	lr 0.02779
Warmup Train [19][1880/3239]	Time 0.374 (0.517)	Data 0.001 (0.012)	Loss 4.2865 (4.5860)	Top-1 acc 24.219 (20.204)	Top-5 acc 46.875 (41.192)	lr 0.02778
Warmup Train [19][1890/3239]	Time 0.485 (0.517)	Data 0.001 (0.012)	Loss 4.3972 (4.5857)	Top-1 acc 21.484 (20.206)	Top-5 acc 47.266 (41.194)	lr 0.02778
Warmup Train [19][1900/3239]	Time 0.311 (0.517)	Data 0.001 (0.012)	Loss 4.7230 (4.5859)	Top-1 acc 19.531 (20.205)	Top-5 acc 39.453 (41.196)	lr 0.02777
Warmup Train [19][1910/3239]	Time 0.378 (0.517)	Data 0.001 (0.012)	Loss 4.5919 (4.5859)	Top-1 acc 21.094 (20.206)	Top-5 acc 41.406 (41.195)	lr 0.02776
Warmup Train [19][1920/3239]	Time 0.689 (0.517)	Data 0.001 (0.012)	Loss 4.5935 (4.5859)	Top-1 acc 21.094 (20.205)	Top-5 acc 37.891 (41.191)	lr 0.02776
Warmup Train [19][1930/3239]	Time 0.245 (0.517)	Data 0.001 (0.012)	Loss 4.6261 (4.5856)	Top-1 acc 19.531 (20.209)	Top-5 acc 41.406 (41.198)	lr 0.02775
Warmup Train [19][1940/3239]	Time 0.345 (0.516)	Data 0.001 (0.012)	Loss 4.5444 (4.5855)	Top-1 acc 19.141 (20.214)	Top-5 acc 43.750 (41.199)	lr 0.02775
Warmup Train [19][1950/3239]	Time 0.468 (0.516)	Data 0.001 (0.012)	Loss 4.6278 (4.5858)	Top-1 acc 20.703 (20.216)	Top-5 acc 42.188 (41.189)	lr 0.02774
Warmup Train [19][1960/3239]	Time 0.312 (0.516)	Data 0.002 (0.012)	Loss 4.7972 (4.5859)	Top-1 acc 17.578 (20.209)	Top-5 acc 37.109 (41.182)	lr 0.02773
Warmup Train [19][1970/3239]	Time 0.435 (0.516)	Data 0.001 (0.012)	Loss 4.4642 (4.5860)	Top-1 acc 21.094 (20.213)	Top-5 acc 44.922 (41.186)	lr 0.02773
Warmup Train [19][1980/3239]	Time 0.443 (0.516)	Data 0.001 (0.012)	Loss 4.5910 (4.5857)	Top-1 acc 22.266 (20.213)	Top-5 acc 40.234 (41.196)	lr 0.02772
Warmup Train [19][1990/3239]	Time 0.484 (0.516)	Data 0.001 (0.012)	Loss 4.3536 (4.5857)	Top-1 acc 24.609 (20.211)	Top-5 acc 45.703 (41.189)	lr 0.02772
Warmup Train [19][2000/3239]	Time 0.405 (0.516)	Data 0.001 (0.012)	Loss 4.3858 (4.5854)	Top-1 acc 22.656 (20.219)	Top-5 acc 45.312 (41.199)	lr 0.02771
Warmup Train [19][2010/3239]	Time 0.506 (0.516)	Data 0.002 (0.012)	Loss 4.4141 (4.5853)	Top-1 acc 18.750 (20.218)	Top-5 acc 44.922 (41.201)	lr 0.02770
Warmup Train [19][2020/3239]	Time 0.461 (0.516)	Data 0.001 (0.012)	Loss 4.6284 (4.5853)	Top-1 acc 20.312 (20.220)	Top-5 acc 41.016 (41.205)	lr 0.02770
Warmup Train [19][2030/3239]	Time 0.447 (0.516)	Data 0.001 (0.012)	Loss 4.4687 (4.5850)	Top-1 acc 17.969 (20.220)	Top-5 acc 39.453 (41.207)	lr 0.02769
Warmup Train [19][2040/3239]	Time 0.613 (0.516)	Data 0.001 (0.012)	Loss 4.6515 (4.5852)	Top-1 acc 18.750 (20.217)	Top-5 acc 39.453 (41.203)	lr 0.02769
Warmup Train [19][2050/3239]	Time 0.581 (0.516)	Data 0.001 (0.012)	Loss 4.6079 (4.5853)	Top-1 acc 23.438 (20.217)	Top-5 acc 41.406 (41.201)	lr 0.02768
Warmup Train [19][2060/3239]	Time 0.482 (0.516)	Data 0.001 (0.012)	Loss 4.6463 (4.5854)	Top-1 acc 18.359 (20.210)	Top-5 acc 41.406 (41.201)	lr 0.02767
Warmup Train [19][2070/3239]	Time 0.474 (0.516)	Data 0.001 (0.012)	Loss 4.4689 (4.5853)	Top-1 acc 21.875 (20.213)	Top-5 acc 43.359 (41.203)	lr 0.02767
Warmup Train [19][2080/3239]	Time 0.529 (0.516)	Data 0.001 (0.012)	Loss 4.5202 (4.5852)	Top-1 acc 21.094 (20.211)	Top-5 acc 43.750 (41.201)	lr 0.02766
Warmup Train [19][2090/3239]	Time 0.547 (0.516)	Data 0.002 (0.012)	Loss 4.7227 (4.5852)	Top-1 acc 19.922 (20.210)	Top-5 acc 37.109 (41.202)	lr 0.02766
Warmup Train [19][2100/3239]	Time 0.495 (0.516)	Data 0.001 (0.012)	Loss 4.4885 (4.5853)	Top-1 acc 20.703 (20.209)	Top-5 acc 40.625 (41.193)	lr 0.02765
Warmup Train [19][2110/3239]	Time 0.546 (0.516)	Data 0.001 (0.012)	Loss 4.5308 (4.5853)	Top-1 acc 21.484 (20.208)	Top-5 acc 39.844 (41.186)	lr 0.02764
Warmup Train [19][2120/3239]	Time 0.486 (0.516)	Data 0.001 (0.012)	Loss 4.5488 (4.5850)	Top-1 acc 20.312 (20.213)	Top-5 acc 41.016 (41.192)	lr 0.02764
Warmup Train [19][2130/3239]	Time 0.571 (0.516)	Data 0.001 (0.012)	Loss 4.4490 (4.5852)	Top-1 acc 23.828 (20.209)	Top-5 acc 42.578 (41.188)	lr 0.02763
Warmup Train [19][2140/3239]	Time 0.518 (0.516)	Data 0.001 (0.012)	Loss 4.7728 (4.5852)	Top-1 acc 17.188 (20.212)	Top-5 acc 35.156 (41.188)	lr 0.02763
Warmup Train [19][2150/3239]	Time 0.673 (0.516)	Data 0.001 (0.012)	Loss 4.7035 (4.5854)	Top-1 acc 13.281 (20.210)	Top-5 acc 35.547 (41.181)	lr 0.02762
Warmup Train [19][2160/3239]	Time 0.498 (0.516)	Data 0.001 (0.012)	Loss 4.7627 (4.5857)	Top-1 acc 17.578 (20.205)	Top-5 acc 37.109 (41.178)	lr 0.02761
Warmup Train [19][2170/3239]	Time 0.646 (0.516)	Data 0.001 (0.012)	Loss 4.5153 (4.5859)	Top-1 acc 20.312 (20.201)	Top-5 acc 41.406 (41.175)	lr 0.02761
Warmup Train [19][2180/3239]	Time 0.517 (0.516)	Data 0.001 (0.012)	Loss 4.4055 (4.5859)	Top-1 acc 21.484 (20.202)	Top-5 acc 46.875 (41.178)	lr 0.02760
Warmup Train [19][2190/3239]	Time 0.559 (0.516)	Data 0.001 (0.012)	Loss 4.7412 (4.5861)	Top-1 acc 15.625 (20.201)	Top-5 acc 36.719 (41.176)	lr 0.02760
Warmup Train [19][2200/3239]	Time 0.537 (0.516)	Data 0.001 (0.012)	Loss 4.6098 (4.5859)	Top-1 acc 21.484 (20.206)	Top-5 acc 39.844 (41.177)	lr 0.02759
Warmup Train [19][2210/3239]	Time 0.461 (0.515)	Data 0.001 (0.012)	Loss 4.4517 (4.5858)	Top-1 acc 22.266 (20.208)	Top-5 acc 43.750 (41.183)	lr 0.02758
Warmup Train [19][2220/3239]	Time 0.506 (0.515)	Data 0.001 (0.012)	Loss 4.5851 (4.5857)	Top-1 acc 22.656 (20.208)	Top-5 acc 42.188 (41.191)	lr 0.02758
Warmup Train [19][2230/3239]	Time 0.514 (0.515)	Data 0.001 (0.012)	Loss 4.5730 (4.5857)	Top-1 acc 18.750 (20.209)	Top-5 acc 35.938 (41.189)	lr 0.02757
Warmup Train [19][2240/3239]	Time 0.325 (0.515)	Data 0.001 (0.012)	Loss 4.5437 (4.5857)	Top-1 acc 18.750 (20.209)	Top-5 acc 41.797 (41.194)	lr 0.02756
Warmup Train [19][2250/3239]	Time 0.485 (0.515)	Data 0.002 (0.012)	Loss 4.6694 (4.5855)	Top-1 acc 20.703 (20.212)	Top-5 acc 41.406 (41.199)	lr 0.02756
Warmup Train [19][2260/3239]	Time 0.518 (0.515)	Data 0.001 (0.012)	Loss 4.6476 (4.5853)	Top-1 acc 18.750 (20.217)	Top-5 acc 39.062 (41.204)	lr 0.02755
Warmup Train [19][2270/3239]	Time 0.595 (0.515)	Data 0.001 (0.012)	Loss 4.6113 (4.5853)	Top-1 acc 16.797 (20.216)	Top-5 acc 40.625 (41.208)	lr 0.02755
Warmup Train [19][2280/3239]	Time 0.672 (0.515)	Data 0.001 (0.011)	Loss 4.5497 (4.5852)	Top-1 acc 19.141 (20.214)	Top-5 acc 40.625 (41.208)	lr 0.02754
Warmup Train [19][2290/3239]	Time 0.554 (0.515)	Data 0.001 (0.011)	Loss 4.7094 (4.5852)	Top-1 acc 21.484 (20.211)	Top-5 acc 38.281 (41.205)	lr 0.02753
Warmup Train [19][2300/3239]	Time 0.411 (0.515)	Data 0.001 (0.011)	Loss 4.7402 (4.5852)	Top-1 acc 20.312 (20.213)	Top-5 acc 38.672 (41.205)	lr 0.02753
Warmup Train [19][2310/3239]	Time 0.502 (0.515)	Data 0.001 (0.011)	Loss 4.6679 (4.5850)	Top-1 acc 19.531 (20.217)	Top-5 acc 38.281 (41.210)	lr 0.02752
Warmup Train [19][2320/3239]	Time 0.516 (0.515)	Data 0.001 (0.011)	Loss 4.6043 (4.5849)	Top-1 acc 19.531 (20.217)	Top-5 acc 41.797 (41.215)	lr 0.02752
Warmup Train [19][2330/3239]	Time 0.541 (0.515)	Data 0.001 (0.011)	Loss 4.6852 (4.5847)	Top-1 acc 22.266 (20.224)	Top-5 acc 38.672 (41.221)	lr 0.02751
Warmup Train [19][2340/3239]	Time 0.581 (0.515)	Data 0.001 (0.011)	Loss 4.6563 (4.5846)	Top-1 acc 19.922 (20.232)	Top-5 acc 37.109 (41.223)	lr 0.02750
Warmup Train [19][2350/3239]	Time 0.545 (0.515)	Data 0.001 (0.011)	Loss 4.6445 (4.5846)	Top-1 acc 17.578 (20.230)	Top-5 acc 39.844 (41.220)	lr 0.02750
Warmup Train [19][2360/3239]	Time 0.506 (0.515)	Data 0.001 (0.011)	Loss 4.5026 (4.5845)	Top-1 acc 22.656 (20.237)	Top-5 acc 42.578 (41.220)	lr 0.02749
Warmup Train [19][2370/3239]	Time 0.543 (0.515)	Data 0.001 (0.011)	Loss 4.7907 (4.5844)	Top-1 acc 14.062 (20.237)	Top-5 acc 36.719 (41.226)	lr 0.02749
Warmup Train [19][2380/3239]	Time 0.462 (0.515)	Data 0.001 (0.011)	Loss 4.6066 (4.5845)	Top-1 acc 18.359 (20.234)	Top-5 acc 41.406 (41.221)	lr 0.02748
Warmup Train [19][2390/3239]	Time 0.405 (0.515)	Data 0.001 (0.011)	Loss 4.4153 (4.5843)	Top-1 acc 23.047 (20.239)	Top-5 acc 45.703 (41.231)	lr 0.02747
Warmup Train [19][2400/3239]	Time 0.652 (0.515)	Data 0.002 (0.011)	Loss 4.7267 (4.5841)	Top-1 acc 18.750 (20.244)	Top-5 acc 38.281 (41.238)	lr 0.02747
Warmup Train [19][2410/3239]	Time 0.501 (0.515)	Data 0.001 (0.011)	Loss 4.5950 (4.5841)	Top-1 acc 17.578 (20.244)	Top-5 acc 39.453 (41.238)	lr 0.02746
Warmup Train [19][2420/3239]	Time 0.539 (0.515)	Data 0.001 (0.011)	Loss 4.4503 (4.5836)	Top-1 acc 21.875 (20.255)	Top-5 acc 47.656 (41.251)	lr 0.02746
Warmup Train [19][2430/3239]	Time 0.655 (0.515)	Data 0.001 (0.011)	Loss 4.6242 (4.5835)	Top-1 acc 19.531 (20.255)	Top-5 acc 41.016 (41.255)	lr 0.02745
Warmup Train [19][2440/3239]	Time 0.518 (0.515)	Data 0.001 (0.011)	Loss 4.6431 (4.5836)	Top-1 acc 19.922 (20.257)	Top-5 acc 41.406 (41.256)	lr 0.02744
Warmup Train [19][2450/3239]	Time 0.477 (0.515)	Data 0.001 (0.011)	Loss 4.4747 (4.5835)	Top-1 acc 20.703 (20.254)	Top-5 acc 42.188 (41.254)	lr 0.02744
Warmup Train [19][2460/3239]	Time 0.485 (0.515)	Data 0.001 (0.011)	Loss 4.3903 (4.5834)	Top-1 acc 25.781 (20.258)	Top-5 acc 43.750 (41.259)	lr 0.02743
Warmup Train [19][2470/3239]	Time 0.666 (0.515)	Data 0.001 (0.011)	Loss 4.5737 (4.5832)	Top-1 acc 21.484 (20.260)	Top-5 acc 40.625 (41.264)	lr 0.02743
Warmup Train [19][2480/3239]	Time 0.518 (0.515)	Data 0.001 (0.011)	Loss 4.5409 (4.5830)	Top-1 acc 19.531 (20.262)	Top-5 acc 43.359 (41.267)	lr 0.02742
Warmup Train [19][2490/3239]	Time 0.530 (0.515)	Data 0.001 (0.011)	Loss 4.5362 (4.5829)	Top-1 acc 21.484 (20.265)	Top-5 acc 42.578 (41.272)	lr 0.02741
Warmup Train [19][2500/3239]	Time 0.488 (0.515)	Data 0.026 (0.011)	Loss 4.5646 (4.5828)	Top-1 acc 21.094 (20.267)	Top-5 acc 38.672 (41.274)	lr 0.02741
Warmup Train [19][2510/3239]	Time 0.173 (0.514)	Data 0.001 (0.011)	Loss 4.7918 (4.5828)	Top-1 acc 19.531 (20.268)	Top-5 acc 37.500 (41.276)	lr 0.02740
Warmup Train [19][2520/3239]	Time 0.436 (0.514)	Data 0.001 (0.011)	Loss 4.5309 (4.5825)	Top-1 acc 19.531 (20.275)	Top-5 acc 42.188 (41.281)	lr 0.02740
Warmup Train [19][2530/3239]	Time 0.513 (0.514)	Data 0.001 (0.011)	Loss 4.5835 (4.5822)	Top-1 acc 21.875 (20.282)	Top-5 acc 44.531 (41.291)	lr 0.02739
Warmup Train [19][2540/3239]	Time 0.680 (0.514)	Data 0.001 (0.011)	Loss 4.5728 (4.5822)	Top-1 acc 16.406 (20.278)	Top-5 acc 41.406 (41.288)	lr 0.02738
Warmup Train [19][2550/3239]	Time 0.529 (0.515)	Data 0.001 (0.011)	Loss 4.7437 (4.5821)	Top-1 acc 22.266 (20.284)	Top-5 acc 37.109 (41.293)	lr 0.02738
Warmup Train [19][2560/3239]	Time 0.452 (0.514)	Data 0.001 (0.011)	Loss 4.6839 (4.5821)	Top-1 acc 17.188 (20.285)	Top-5 acc 39.844 (41.293)	lr 0.02737
Warmup Train [19][2570/3239]	Time 0.500 (0.515)	Data 0.001 (0.011)	Loss 4.3844 (4.5818)	Top-1 acc 24.219 (20.288)	Top-5 acc 45.703 (41.303)	lr 0.02737
Warmup Train [19][2580/3239]	Time 0.459 (0.514)	Data 0.002 (0.011)	Loss 4.3544 (4.5817)	Top-1 acc 19.922 (20.289)	Top-5 acc 44.531 (41.305)	lr 0.02736
Warmup Train [19][2590/3239]	Time 0.469 (0.514)	Data 0.004 (0.011)	Loss 4.4718 (4.5816)	Top-1 acc 23.438 (20.289)	Top-5 acc 43.359 (41.310)	lr 0.02735
Warmup Train [19][2600/3239]	Time 0.486 (0.514)	Data 0.001 (0.011)	Loss 4.7302 (4.5815)	Top-1 acc 16.797 (20.290)	Top-5 acc 39.062 (41.308)	lr 0.02735
Warmup Train [19][2610/3239]	Time 0.355 (0.514)	Data 0.001 (0.011)	Loss 4.6258 (4.5816)	Top-1 acc 21.484 (20.291)	Top-5 acc 42.969 (41.306)	lr 0.02734
Warmup Train [19][2620/3239]	Time 0.496 (0.514)	Data 0.001 (0.011)	Loss 4.4958 (4.5814)	Top-1 acc 20.312 (20.293)	Top-5 acc 42.578 (41.308)	lr 0.02734
Warmup Train [19][2630/3239]	Time 0.636 (0.514)	Data 0.001 (0.011)	Loss 4.7216 (4.5816)	Top-1 acc 17.578 (20.292)	Top-5 acc 37.891 (41.301)	lr 0.02733
Warmup Train [19][2640/3239]	Time 0.525 (0.514)	Data 0.001 (0.011)	Loss 4.4724 (4.5814)	Top-1 acc 22.266 (20.297)	Top-5 acc 42.969 (41.303)	lr 0.02732
Warmup Train [19][2650/3239]	Time 0.520 (0.514)	Data 0.001 (0.011)	Loss 4.6074 (4.5813)	Top-1 acc 21.094 (20.300)	Top-5 acc 42.578 (41.305)	lr 0.02732
Warmup Train [19][2660/3239]	Time 0.602 (0.514)	Data 0.001 (0.011)	Loss 4.5923 (4.5813)	Top-1 acc 17.578 (20.301)	Top-5 acc 44.141 (41.312)	lr 0.02731
Warmup Train [19][2670/3239]	Time 0.397 (0.514)	Data 0.001 (0.011)	Loss 4.5844 (4.5812)	Top-1 acc 21.094 (20.300)	Top-5 acc 41.406 (41.311)	lr 0.02731
Warmup Train [19][2680/3239]	Time 0.520 (0.514)	Data 0.001 (0.011)	Loss 4.4393 (4.5812)	Top-1 acc 20.312 (20.301)	Top-5 acc 44.922 (41.311)	lr 0.02730
Warmup Train [19][2690/3239]	Time 0.456 (0.514)	Data 0.001 (0.011)	Loss 4.5381 (4.5809)	Top-1 acc 21.094 (20.308)	Top-5 acc 41.406 (41.318)	lr 0.02729
Warmup Train [19][2700/3239]	Time 0.450 (0.514)	Data 0.002 (0.011)	Loss 4.5995 (4.5809)	Top-1 acc 23.047 (20.308)	Top-5 acc 43.359 (41.322)	lr 0.02729
Warmup Train [19][2710/3239]	Time 0.439 (0.514)	Data 0.001 (0.011)	Loss 4.8066 (4.5809)	Top-1 acc 14.844 (20.307)	Top-5 acc 38.281 (41.323)	lr 0.02728
Warmup Train [19][2720/3239]	Time 0.491 (0.514)	Data 0.001 (0.011)	Loss 4.5896 (4.5809)	Top-1 acc 22.656 (20.312)	Top-5 acc 39.844 (41.324)	lr 0.02728
Warmup Train [19][2730/3239]	Time 0.531 (0.514)	Data 0.001 (0.011)	Loss 4.5602 (4.5806)	Top-1 acc 18.359 (20.318)	Top-5 acc 41.797 (41.333)	lr 0.02727
Warmup Train [19][2740/3239]	Time 0.428 (0.514)	Data 0.001 (0.011)	Loss 4.6176 (4.5805)	Top-1 acc 19.141 (20.321)	Top-5 acc 41.406 (41.335)	lr 0.02726
Warmup Train [19][2750/3239]	Time 0.427 (0.514)	Data 0.001 (0.011)	Loss 4.6026 (4.5804)	Top-1 acc 17.578 (20.322)	Top-5 acc 40.625 (41.339)	lr 0.02726
Warmup Train [19][2760/3239]	Time 0.632 (0.514)	Data 0.001 (0.011)	Loss 4.4488 (4.5803)	Top-1 acc 20.312 (20.321)	Top-5 acc 46.484 (41.338)	lr 0.02725
Warmup Train [19][2770/3239]	Time 0.485 (0.514)	Data 0.001 (0.010)	Loss 4.4184 (4.5801)	Top-1 acc 26.172 (20.330)	Top-5 acc 46.094 (41.348)	lr 0.02725
Warmup Train [19][2780/3239]	Time 0.576 (0.514)	Data 0.001 (0.010)	Loss 4.5916 (4.5800)	Top-1 acc 21.484 (20.329)	Top-5 acc 41.406 (41.346)	lr 0.02724
Warmup Train [19][2790/3239]	Time 0.580 (0.514)	Data 0.001 (0.010)	Loss 4.6895 (4.5799)	Top-1 acc 18.750 (20.335)	Top-5 acc 43.750 (41.349)	lr 0.02723
Warmup Train [19][2800/3239]	Time 0.618 (0.514)	Data 0.001 (0.010)	Loss 4.5108 (4.5799)	Top-1 acc 22.266 (20.335)	Top-5 acc 41.797 (41.345)	lr 0.02723
Warmup Train [19][2810/3239]	Time 0.638 (0.514)	Data 0.001 (0.010)	Loss 4.6697 (4.5799)	Top-1 acc 18.359 (20.335)	Top-5 acc 37.500 (41.345)	lr 0.02722
Warmup Train [19][2820/3239]	Time 0.513 (0.514)	Data 0.001 (0.010)	Loss 4.5996 (4.5799)	Top-1 acc 19.531 (20.335)	Top-5 acc 40.234 (41.345)	lr 0.02722
Warmup Train [19][2830/3239]	Time 0.493 (0.514)	Data 0.001 (0.010)	Loss 4.4616 (4.5799)	Top-1 acc 24.219 (20.339)	Top-5 acc 42.188 (41.343)	lr 0.02721
Warmup Train [19][2840/3239]	Time 0.433 (0.514)	Data 0.001 (0.010)	Loss 4.6832 (4.5799)	Top-1 acc 20.312 (20.338)	Top-5 acc 40.234 (41.342)	lr 0.02720
Warmup Train [19][2850/3239]	Time 0.479 (0.514)	Data 0.001 (0.010)	Loss 4.5781 (4.5797)	Top-1 acc 19.922 (20.340)	Top-5 acc 41.797 (41.347)	lr 0.02720
Warmup Train [19][2860/3239]	Time 0.521 (0.514)	Data 0.001 (0.010)	Loss 4.3981 (4.5793)	Top-1 acc 23.828 (20.348)	Top-5 acc 48.438 (41.356)	lr 0.02719
Warmup Train [19][2870/3239]	Time 0.554 (0.514)	Data 0.030 (0.010)	Loss 4.6266 (4.5792)	Top-1 acc 16.406 (20.347)	Top-5 acc 38.672 (41.356)	lr 0.02718
Warmup Train [19][2880/3239]	Time 0.452 (0.514)	Data 0.001 (0.010)	Loss 4.5974 (4.5792)	Top-1 acc 21.094 (20.348)	Top-5 acc 41.016 (41.358)	lr 0.02718
Warmup Train [19][2890/3239]	Time 0.569 (0.514)	Data 0.001 (0.010)	Loss 4.6281 (4.5791)	Top-1 acc 22.656 (20.354)	Top-5 acc 40.625 (41.360)	lr 0.02717
Warmup Train [19][2900/3239]	Time 0.552 (0.514)	Data 0.001 (0.010)	Loss 4.6942 (4.5788)	Top-1 acc 14.062 (20.356)	Top-5 acc 35.938 (41.365)	lr 0.02717
Warmup Train [19][2910/3239]	Time 0.520 (0.514)	Data 0.001 (0.010)	Loss 4.5428 (4.5787)	Top-1 acc 23.828 (20.356)	Top-5 acc 42.969 (41.365)	lr 0.02716
Warmup Train [19][2920/3239]	Time 0.508 (0.514)	Data 0.001 (0.010)	Loss 4.6259 (4.5786)	Top-1 acc 19.922 (20.358)	Top-5 acc 42.188 (41.370)	lr 0.02715
Warmup Train [19][2930/3239]	Time 0.328 (0.514)	Data 0.001 (0.010)	Loss 4.6794 (4.5787)	Top-1 acc 17.969 (20.358)	Top-5 acc 40.625 (41.371)	lr 0.02715
Warmup Train [19][2940/3239]	Time 0.537 (0.514)	Data 0.001 (0.010)	Loss 4.5441 (4.5784)	Top-1 acc 17.578 (20.361)	Top-5 acc 42.188 (41.378)	lr 0.02714
Warmup Train [19][2950/3239]	Time 0.631 (0.514)	Data 0.001 (0.010)	Loss 4.5594 (4.5781)	Top-1 acc 21.094 (20.366)	Top-5 acc 42.578 (41.386)	lr 0.02714
Warmup Train [19][2960/3239]	Time 0.577 (0.514)	Data 0.001 (0.010)	Loss 4.5527 (4.5779)	Top-1 acc 23.828 (20.373)	Top-5 acc 44.141 (41.390)	lr 0.02713
Warmup Train [19][2970/3239]	Time 0.668 (0.514)	Data 0.001 (0.010)	Loss 4.4510 (4.5778)	Top-1 acc 23.047 (20.376)	Top-5 acc 42.578 (41.392)	lr 0.02712
Warmup Train [19][2980/3239]	Time 0.346 (0.514)	Data 0.001 (0.010)	Loss 4.6247 (4.5777)	Top-1 acc 19.141 (20.379)	Top-5 acc 39.844 (41.396)	lr 0.02712
Warmup Train [19][2990/3239]	Time 0.527 (0.514)	Data 0.002 (0.010)	Loss 4.4310 (4.5775)	Top-1 acc 19.922 (20.383)	Top-5 acc 44.922 (41.401)	lr 0.02711
Warmup Train [19][3000/3239]	Time 0.565 (0.514)	Data 0.001 (0.010)	Loss 4.6433 (4.5775)	Top-1 acc 19.531 (20.382)	Top-5 acc 39.453 (41.400)	lr 0.02711
Warmup Train [19][3010/3239]	Time 0.496 (0.514)	Data 0.001 (0.010)	Loss 4.5986 (4.5774)	Top-1 acc 21.875 (20.383)	Top-5 acc 38.672 (41.400)	lr 0.02710
Warmup Train [19][3020/3239]	Time 0.308 (0.514)	Data 0.001 (0.010)	Loss 4.6189 (4.5774)	Top-1 acc 22.656 (20.384)	Top-5 acc 41.797 (41.400)	lr 0.02709
Warmup Train [19][3030/3239]	Time 0.501 (0.514)	Data 0.001 (0.010)	Loss 4.3304 (4.5773)	Top-1 acc 22.656 (20.382)	Top-5 acc 47.266 (41.399)	lr 0.02709
Warmup Train [19][3040/3239]	Time 0.381 (0.514)	Data 0.001 (0.010)	Loss 4.6482 (4.5773)	Top-1 acc 19.141 (20.385)	Top-5 acc 39.062 (41.398)	lr 0.02708
Warmup Train [19][3050/3239]	Time 0.569 (0.514)	Data 0.001 (0.010)	Loss 4.4237 (4.5772)	Top-1 acc 21.484 (20.390)	Top-5 acc 43.750 (41.400)	lr 0.02708
Warmup Train [19][3060/3239]	Time 0.650 (0.514)	Data 0.001 (0.010)	Loss 4.3428 (4.5768)	Top-1 acc 24.219 (20.396)	Top-5 acc 45.703 (41.409)	lr 0.02707
Warmup Train [19][3070/3239]	Time 0.476 (0.514)	Data 0.001 (0.010)	Loss 4.8234 (4.5767)	Top-1 acc 16.406 (20.397)	Top-5 acc 38.672 (41.412)	lr 0.02706
Warmup Train [19][3080/3239]	Time 0.350 (0.514)	Data 0.001 (0.010)	Loss 4.4878 (4.5766)	Top-1 acc 24.219 (20.400)	Top-5 acc 43.359 (41.415)	lr 0.02706
Warmup Train [19][3090/3239]	Time 0.555 (0.514)	Data 0.001 (0.010)	Loss 4.6928 (4.5766)	Top-1 acc 17.969 (20.403)	Top-5 acc 40.234 (41.419)	lr 0.02705
Warmup Train [19][3100/3239]	Time 0.569 (0.514)	Data 0.001 (0.010)	Loss 4.3966 (4.5764)	Top-1 acc 23.047 (20.407)	Top-5 acc 42.969 (41.423)	lr 0.02705
Warmup Train [19][3110/3239]	Time 0.457 (0.514)	Data 0.001 (0.010)	Loss 4.5209 (4.5765)	Top-1 acc 17.969 (20.405)	Top-5 acc 43.750 (41.421)	lr 0.02704
Warmup Train [19][3120/3239]	Time 0.544 (0.514)	Data 0.001 (0.010)	Loss 4.5119 (4.5762)	Top-1 acc 23.047 (20.411)	Top-5 acc 41.406 (41.427)	lr 0.02703
Warmup Train [19][3130/3239]	Time 0.579 (0.514)	Data 0.001 (0.010)	Loss 4.2925 (4.5758)	Top-1 acc 25.391 (20.419)	Top-5 acc 47.266 (41.437)	lr 0.02703
Warmup Train [19][3140/3239]	Time 0.538 (0.514)	Data 0.001 (0.010)	Loss 4.7005 (4.5757)	Top-1 acc 19.531 (20.422)	Top-5 acc 38.672 (41.439)	lr 0.02702
Warmup Train [19][3150/3239]	Time 0.496 (0.514)	Data 0.001 (0.010)	Loss 4.5112 (4.5756)	Top-1 acc 22.266 (20.427)	Top-5 acc 43.750 (41.441)	lr 0.02702
Warmup Train [19][3160/3239]	Time 0.644 (0.514)	Data 0.001 (0.010)	Loss 4.5259 (4.5756)	Top-1 acc 23.047 (20.430)	Top-5 acc 42.578 (41.442)	lr 0.02701
Warmup Train [19][3170/3239]	Time 0.489 (0.514)	Data 0.001 (0.010)	Loss 4.6164 (4.5754)	Top-1 acc 20.312 (20.431)	Top-5 acc 41.016 (41.448)	lr 0.02700
Warmup Train [19][3180/3239]	Time 0.460 (0.514)	Data 0.000 (0.010)	Loss 4.5670 (4.5753)	Top-1 acc 19.531 (20.432)	Top-5 acc 39.844 (41.449)	lr 0.02700
Warmup Train [19][3190/3239]	Time 0.398 (0.514)	Data 0.000 (0.010)	Loss 4.5996 (4.5752)	Top-1 acc 23.438 (20.436)	Top-5 acc 43.750 (41.452)	lr 0.02699
Warmup Train [19][3200/3239]	Time 0.364 (0.514)	Data 0.000 (0.010)	Loss 4.5010 (4.5750)	Top-1 acc 21.094 (20.441)	Top-5 acc 43.359 (41.457)	lr 0.02699
Warmup Train [19][3210/3239]	Time 0.483 (0.514)	Data 0.000 (0.010)	Loss 4.5038 (4.5751)	Top-1 acc 22.266 (20.437)	Top-5 acc 42.969 (41.453)	lr 0.02698
Warmup Train [19][3220/3239]	Time 0.709 (0.514)	Data 0.000 (0.010)	Loss 4.4218 (4.5750)	Top-1 acc 21.875 (20.436)	Top-5 acc 49.219 (41.455)	lr 0.02697
Warmup Train [19][3230/3239]	Time 0.670 (0.514)	Data 0.000 (0.010)	Loss 4.5861 (4.5750)	Top-1 acc 21.875 (20.437)	Top-5 acc 38.672 (41.455)	lr 0.02697
Warmup Train [19][3239/3239]	Time 0.278 (0.514)	Data 0.000 (0.010)	Loss 4.5692 (4.5749)	Top-1 acc 29.630 (20.441)	Top-5 acc 41.975 (41.458)	lr 0.02696
==========Warmup Valid [19/40]	loss 3.599	top-1 acc 27.469	top-5 acc 51.190	Train top-1 20.441	top-5 41.458	flops: 442.4M
Warmup Train [20][0/3239]	Time 11.318 (11.318)	Data 10.612 (10.612)	Loss 4.6238 (4.6238)	Top-1 acc 18.750 (18.750)	Top-5 acc 39.453 (39.453)	lr 0.02696
Warmup Train [20][10/3239]	Time 0.469 (1.640)	Data 0.001 (0.994)	Loss 4.5902 (4.5893)	Top-1 acc 23.828 (20.241)	Top-5 acc 39.062 (41.584)	lr 0.02696
Warmup Train [20][20/3239]	Time 0.355 (1.106)	Data 0.001 (0.524)	Loss 4.5432 (4.5829)	Top-1 acc 25.781 (20.610)	Top-5 acc 43.359 (41.295)	lr 0.02695
Warmup Train [20][30/3239]	Time 0.524 (0.926)	Data 0.001 (0.362)	Loss 4.7852 (4.5917)	Top-1 acc 19.922 (20.514)	Top-5 acc 39.453 (41.242)	lr 0.02694
Warmup Train [20][40/3239]	Time 0.575 (0.828)	Data 0.001 (0.274)	Loss 4.5976 (4.5707)	Top-1 acc 19.141 (20.617)	Top-5 acc 41.016 (41.711)	lr 0.02694
Warmup Train [20][50/3239]	Time 0.522 (0.765)	Data 0.001 (0.221)	Loss 4.5111 (4.5610)	Top-1 acc 18.750 (20.519)	Top-5 acc 43.750 (41.873)	lr 0.02693
Warmup Train [20][60/3239]	Time 0.492 (0.726)	Data 0.001 (0.185)	Loss 4.3645 (4.5457)	Top-1 acc 22.656 (20.857)	Top-5 acc 44.141 (42.220)	lr 0.02693
Warmup Train [20][70/3239]	Time 0.612 (0.696)	Data 0.002 (0.159)	Loss 4.4386 (4.5359)	Top-1 acc 22.266 (20.929)	Top-5 acc 43.750 (42.501)	lr 0.02692
Warmup Train [20][80/3239]	Time 0.535 (0.676)	Data 0.001 (0.140)	Loss 4.3308 (4.5279)	Top-1 acc 26.172 (21.147)	Top-5 acc 48.047 (42.593)	lr 0.02691
Warmup Train [20][90/3239]	Time 0.482 (0.655)	Data 0.001 (0.124)	Loss 4.4438 (4.5238)	Top-1 acc 20.703 (21.171)	Top-5 acc 44.531 (42.737)	lr 0.02691
Warmup Train [20][100/3239]	Time 0.350 (0.640)	Data 0.001 (0.112)	Loss 4.9023 (4.5255)	Top-1 acc 15.234 (21.152)	Top-5 acc 33.984 (42.601)	lr 0.02690
Warmup Train [20][110/3239]	Time 0.504 (0.629)	Data 0.001 (0.103)	Loss 4.7199 (4.5247)	Top-1 acc 19.922 (21.111)	Top-5 acc 37.891 (42.543)	lr 0.02690
Warmup Train [20][120/3239]	Time 0.513 (0.620)	Data 0.001 (0.095)	Loss 4.7369 (4.5278)	Top-1 acc 17.578 (21.087)	Top-5 acc 37.500 (42.384)	lr 0.02689
Warmup Train [20][130/3239]	Time 0.658 (0.612)	Data 0.001 (0.088)	Loss 4.5116 (4.5263)	Top-1 acc 20.703 (21.028)	Top-5 acc 42.578 (42.417)	lr 0.02688
Warmup Train [20][140/3239]	Time 0.410 (0.602)	Data 0.001 (0.082)	Loss 4.6067 (4.5283)	Top-1 acc 25.000 (21.080)	Top-5 acc 40.625 (42.376)	lr 0.02688
Warmup Train [20][150/3239]	Time 0.650 (0.597)	Data 0.001 (0.077)	Loss 4.6164 (4.5297)	Top-1 acc 19.141 (21.096)	Top-5 acc 38.672 (42.366)	lr 0.02687
Warmup Train [20][160/3239]	Time 0.503 (0.591)	Data 0.002 (0.072)	Loss 4.8263 (4.5297)	Top-1 acc 16.406 (21.074)	Top-5 acc 37.109 (42.382)	lr 0.02686
Warmup Train [20][170/3239]	Time 0.545 (0.588)	Data 0.001 (0.069)	Loss 4.4890 (4.5313)	Top-1 acc 23.047 (21.032)	Top-5 acc 43.359 (42.258)	lr 0.02686
Warmup Train [20][180/3239]	Time 0.447 (0.583)	Data 0.001 (0.065)	Loss 4.4423 (4.5295)	Top-1 acc 25.000 (21.109)	Top-5 acc 43.359 (42.306)	lr 0.02685
Warmup Train [20][190/3239]	Time 0.508 (0.579)	Data 0.001 (0.062)	Loss 4.4831 (4.5297)	Top-1 acc 25.781 (21.102)	Top-5 acc 46.875 (42.331)	lr 0.02685
Warmup Train [20][200/3239]	Time 0.547 (0.575)	Data 0.001 (0.059)	Loss 4.4561 (4.5288)	Top-1 acc 22.656 (21.076)	Top-5 acc 43.750 (42.312)	lr 0.02684
Warmup Train [20][210/3239]	Time 0.485 (0.570)	Data 0.001 (0.056)	Loss 4.4825 (4.5307)	Top-1 acc 21.875 (21.051)	Top-5 acc 42.578 (42.249)	lr 0.02683
Warmup Train [20][220/3239]	Time 0.403 (0.565)	Data 0.001 (0.054)	Loss 4.5320 (4.5319)	Top-1 acc 19.922 (20.991)	Top-5 acc 43.750 (42.218)	lr 0.02683
Warmup Train [20][230/3239]	Time 0.494 (0.563)	Data 0.001 (0.052)	Loss 4.5013 (4.5328)	Top-1 acc 19.531 (21.014)	Top-5 acc 40.625 (42.248)	lr 0.02682
Warmup Train [20][240/3239]	Time 0.486 (0.561)	Data 0.001 (0.050)	Loss 4.6009 (4.5322)	Top-1 acc 21.484 (21.039)	Top-5 acc 39.844 (42.282)	lr 0.02682
Warmup Train [20][250/3239]	Time 0.537 (0.559)	Data 0.001 (0.048)	Loss 4.5030 (4.5328)	Top-1 acc 20.312 (21.010)	Top-5 acc 41.797 (42.267)	lr 0.02681
Warmup Train [20][260/3239]	Time 0.563 (0.558)	Data 0.001 (0.046)	Loss 4.4857 (4.5315)	Top-1 acc 25.000 (21.028)	Top-5 acc 45.312 (42.336)	lr 0.02680
Warmup Train [20][270/3239]	Time 0.633 (0.557)	Data 0.002 (0.045)	Loss 4.3049 (4.5300)	Top-1 acc 25.781 (21.074)	Top-5 acc 45.703 (42.335)	lr 0.02680
Warmup Train [20][280/3239]	Time 0.534 (0.556)	Data 0.001 (0.043)	Loss 4.5218 (4.5303)	Top-1 acc 20.312 (21.045)	Top-5 acc 41.797 (42.311)	lr 0.02679
Warmup Train [20][290/3239]	Time 0.549 (0.554)	Data 0.001 (0.042)	Loss 4.5823 (4.5308)	Top-1 acc 22.656 (21.047)	Top-5 acc 37.891 (42.299)	lr 0.02679
Warmup Train [20][300/3239]	Time 0.396 (0.554)	Data 0.001 (0.041)	Loss 4.3524 (4.5278)	Top-1 acc 24.219 (21.103)	Top-5 acc 48.438 (42.381)	lr 0.02678
Warmup Train [20][310/3239]	Time 0.443 (0.552)	Data 0.001 (0.040)	Loss 4.4113 (4.5259)	Top-1 acc 22.656 (21.130)	Top-5 acc 43.359 (42.412)	lr 0.02677
Warmup Train [20][320/3239]	Time 0.584 (0.551)	Data 0.001 (0.039)	Loss 4.4872 (4.5271)	Top-1 acc 23.828 (21.093)	Top-5 acc 44.141 (42.376)	lr 0.02677
Warmup Train [20][330/3239]	Time 0.506 (0.550)	Data 0.001 (0.038)	Loss 4.6367 (4.5297)	Top-1 acc 22.656 (21.048)	Top-5 acc 41.797 (42.314)	lr 0.02676
Warmup Train [20][340/3239]	Time 0.415 (0.549)	Data 0.001 (0.037)	Loss 4.7375 (4.5316)	Top-1 acc 17.188 (21.027)	Top-5 acc 40.234 (42.245)	lr 0.02676
Warmup Train [20][350/3239]	Time 0.568 (0.548)	Data 0.001 (0.036)	Loss 4.5775 (4.5311)	Top-1 acc 17.188 (21.037)	Top-5 acc 41.797 (42.252)	lr 0.02675
Warmup Train [20][360/3239]	Time 0.343 (0.546)	Data 0.001 (0.035)	Loss 4.6751 (4.5340)	Top-1 acc 16.797 (20.989)	Top-5 acc 39.062 (42.173)	lr 0.02674
Warmup Train [20][370/3239]	Time 0.553 (0.545)	Data 0.001 (0.035)	Loss 4.5796 (4.5340)	Top-1 acc 21.484 (20.980)	Top-5 acc 39.062 (42.170)	lr 0.02674
Warmup Train [20][380/3239]	Time 0.564 (0.544)	Data 0.037 (0.034)	Loss 4.5989 (4.5337)	Top-1 acc 20.703 (20.989)	Top-5 acc 39.844 (42.195)	lr 0.02673
Warmup Train [20][390/3239]	Time 0.563 (0.543)	Data 0.001 (0.033)	Loss 4.5869 (4.5344)	Top-1 acc 20.312 (20.992)	Top-5 acc 40.625 (42.212)	lr 0.02673
Warmup Train [20][400/3239]	Time 0.338 (0.543)	Data 0.001 (0.033)	Loss 4.4834 (4.5346)	Top-1 acc 22.266 (20.979)	Top-5 acc 42.969 (42.209)	lr 0.02672
Warmup Train [20][410/3239]	Time 0.614 (0.542)	Data 0.001 (0.032)	Loss 4.4215 (4.5344)	Top-1 acc 22.656 (20.990)	Top-5 acc 40.625 (42.203)	lr 0.02671
Warmup Train [20][420/3239]	Time 0.613 (0.541)	Data 0.001 (0.032)	Loss 4.6788 (4.5347)	Top-1 acc 17.578 (20.997)	Top-5 acc 38.672 (42.201)	lr 0.02671
Warmup Train [20][430/3239]	Time 0.593 (0.540)	Data 0.002 (0.031)	Loss 4.6118 (4.5338)	Top-1 acc 19.531 (21.020)	Top-5 acc 42.188 (42.247)	lr 0.02670
Warmup Train [20][440/3239]	Time 0.345 (0.539)	Data 0.001 (0.030)	Loss 4.4592 (4.5342)	Top-1 acc 21.484 (21.026)	Top-5 acc 41.797 (42.239)	lr 0.02670
Warmup Train [20][450/3239]	Time 0.372 (0.539)	Data 0.001 (0.030)	Loss 4.4016 (4.5337)	Top-1 acc 23.047 (21.051)	Top-5 acc 43.750 (42.268)	lr 0.02669
Warmup Train [20][460/3239]	Time 0.503 (0.538)	Data 0.001 (0.030)	Loss 4.4686 (4.5333)	Top-1 acc 23.438 (21.058)	Top-5 acc 46.094 (42.275)	lr 0.02668
Warmup Train [20][470/3239]	Time 0.532 (0.537)	Data 0.001 (0.029)	Loss 4.4078 (4.5313)	Top-1 acc 21.094 (21.078)	Top-5 acc 45.312 (42.328)	lr 0.02668
Warmup Train [20][480/3239]	Time 0.624 (0.536)	Data 0.001 (0.029)	Loss 4.5899 (4.5316)	Top-1 acc 19.922 (21.073)	Top-5 acc 40.234 (42.317)	lr 0.02667
Warmup Train [20][490/3239]	Time 0.605 (0.535)	Data 0.001 (0.028)	Loss 4.5012 (4.5326)	Top-1 acc 21.094 (21.056)	Top-5 acc 46.875 (42.293)	lr 0.02667
Warmup Train [20][500/3239]	Time 0.465 (0.534)	Data 0.001 (0.028)	Loss 4.3077 (4.5306)	Top-1 acc 25.781 (21.102)	Top-5 acc 46.484 (42.343)	lr 0.02666
Warmup Train [20][510/3239]	Time 0.353 (0.533)	Data 0.001 (0.028)	Loss 4.3977 (4.5308)	Top-1 acc 23.828 (21.105)	Top-5 acc 46.875 (42.339)	lr 0.02665
Warmup Train [20][520/3239]	Time 0.513 (0.533)	Data 0.001 (0.027)	Loss 4.4939 (4.5304)	Top-1 acc 25.781 (21.130)	Top-5 acc 43.359 (42.349)	lr 0.02665
Warmup Train [20][530/3239]	Time 0.607 (0.533)	Data 0.001 (0.027)	Loss 4.3068 (4.5300)	Top-1 acc 26.953 (21.145)	Top-5 acc 47.266 (42.368)	lr 0.02664
Warmup Train [20][540/3239]	Time 0.566 (0.533)	Data 0.001 (0.026)	Loss 4.2845 (4.5300)	Top-1 acc 25.781 (21.155)	Top-5 acc 46.484 (42.381)	lr 0.02664
Warmup Train [20][550/3239]	Time 0.743 (0.533)	Data 0.001 (0.026)	Loss 4.4847 (4.5299)	Top-1 acc 20.703 (21.157)	Top-5 acc 46.484 (42.387)	lr 0.02663
Warmup Train [20][560/3239]	Time 0.558 (0.533)	Data 0.001 (0.026)	Loss 4.4294 (4.5301)	Top-1 acc 23.047 (21.144)	Top-5 acc 44.922 (42.380)	lr 0.02662
Warmup Train [20][570/3239]	Time 0.493 (0.532)	Data 0.001 (0.025)	Loss 4.4289 (4.5291)	Top-1 acc 24.219 (21.159)	Top-5 acc 44.922 (42.415)	lr 0.02662
Warmup Train [20][580/3239]	Time 0.539 (0.532)	Data 0.001 (0.025)	Loss 4.4173 (4.5284)	Top-1 acc 21.094 (21.161)	Top-5 acc 45.703 (42.436)	lr 0.02661
Warmup Train [20][590/3239]	Time 0.544 (0.531)	Data 0.001 (0.024)	Loss 4.5808 (4.5287)	Top-1 acc 18.359 (21.154)	Top-5 acc 40.625 (42.437)	lr 0.02660
Warmup Train [20][600/3239]	Time 0.521 (0.531)	Data 0.001 (0.024)	Loss 4.5334 (4.5289)	Top-1 acc 19.922 (21.158)	Top-5 acc 40.625 (42.436)	lr 0.02660
Warmup Train [20][610/3239]	Time 0.577 (0.531)	Data 0.001 (0.024)	Loss 4.6005 (4.5291)	Top-1 acc 18.750 (21.170)	Top-5 acc 40.234 (42.430)	lr 0.02659
Warmup Train [20][620/3239]	Time 0.552 (0.530)	Data 0.001 (0.023)	Loss 4.5088 (4.5285)	Top-1 acc 22.266 (21.186)	Top-5 acc 39.453 (42.435)	lr 0.02659
Warmup Train [20][630/3239]	Time 0.373 (0.529)	Data 0.001 (0.023)	Loss 4.5517 (4.5286)	Top-1 acc 20.312 (21.168)	Top-5 acc 41.406 (42.438)	lr 0.02658
Warmup Train [20][640/3239]	Time 0.484 (0.529)	Data 0.001 (0.023)	Loss 4.5308 (4.5285)	Top-1 acc 21.875 (21.186)	Top-5 acc 41.797 (42.434)	lr 0.02657
Warmup Train [20][650/3239]	Time 0.541 (0.529)	Data 0.002 (0.023)	Loss 4.5949 (4.5282)	Top-1 acc 19.922 (21.179)	Top-5 acc 41.406 (42.440)	lr 0.02657
Warmup Train [20][660/3239]	Time 0.551 (0.529)	Data 0.001 (0.022)	Loss 4.3522 (4.5279)	Top-1 acc 23.047 (21.173)	Top-5 acc 47.266 (42.439)	lr 0.02656
Warmup Train [20][670/3239]	Time 0.500 (0.529)	Data 0.001 (0.022)	Loss 4.4983 (4.5274)	Top-1 acc 19.922 (21.174)	Top-5 acc 42.188 (42.459)	lr 0.02656
Warmup Train [20][680/3239]	Time 0.332 (0.528)	Data 0.001 (0.022)	Loss 4.4622 (4.5267)	Top-1 acc 20.312 (21.179)	Top-5 acc 45.312 (42.476)	lr 0.02655
Warmup Train [20][690/3239]	Time 0.628 (0.528)	Data 0.001 (0.022)	Loss 4.5300 (4.5264)	Top-1 acc 18.359 (21.178)	Top-5 acc 43.750 (42.476)	lr 0.02654
Warmup Train [20][700/3239]	Time 0.383 (0.528)	Data 0.001 (0.021)	Loss 4.5150 (4.5265)	Top-1 acc 17.578 (21.177)	Top-5 acc 42.188 (42.477)	lr 0.02654
Warmup Train [20][710/3239]	Time 0.576 (0.528)	Data 0.001 (0.021)	Loss 4.7052 (4.5265)	Top-1 acc 19.531 (21.188)	Top-5 acc 38.281 (42.485)	lr 0.02653
Warmup Train [20][720/3239]	Time 0.575 (0.528)	Data 0.001 (0.021)	Loss 4.5703 (4.5270)	Top-1 acc 15.234 (21.185)	Top-5 acc 42.188 (42.481)	lr 0.02653
Warmup Train [20][730/3239]	Time 0.442 (0.527)	Data 0.001 (0.021)	Loss 4.6190 (4.5270)	Top-1 acc 18.359 (21.184)	Top-5 acc 41.406 (42.482)	lr 0.02652
Warmup Train [20][740/3239]	Time 0.624 (0.527)	Data 0.001 (0.020)	Loss 4.3487 (4.5274)	Top-1 acc 25.391 (21.186)	Top-5 acc 47.266 (42.473)	lr 0.02651
Warmup Train [20][750/3239]	Time 0.364 (0.527)	Data 0.001 (0.020)	Loss 4.6490 (4.5275)	Top-1 acc 17.188 (21.186)	Top-5 acc 41.406 (42.471)	lr 0.02651
Warmup Train [20][760/3239]	Time 0.591 (0.526)	Data 0.001 (0.020)	Loss 4.2434 (4.5268)	Top-1 acc 25.000 (21.203)	Top-5 acc 51.953 (42.491)	lr 0.02650
Warmup Train [20][770/3239]	Time 0.472 (0.526)	Data 0.001 (0.020)	Loss 4.3647 (4.5268)	Top-1 acc 19.531 (21.203)	Top-5 acc 46.484 (42.493)	lr 0.02650
Warmup Train [20][780/3239]	Time 0.628 (0.525)	Data 0.001 (0.020)	Loss 4.5151 (4.5279)	Top-1 acc 21.094 (21.194)	Top-5 acc 42.969 (42.468)	lr 0.02649
Warmup Train [20][790/3239]	Time 0.552 (0.525)	Data 0.001 (0.020)	Loss 4.5294 (4.5281)	Top-1 acc 17.969 (21.202)	Top-5 acc 39.453 (42.463)	lr 0.02648
Warmup Train [20][800/3239]	Time 0.518 (0.525)	Data 0.001 (0.019)	Loss 4.5616 (4.5283)	Top-1 acc 21.094 (21.196)	Top-5 acc 40.625 (42.444)	lr 0.02648
Warmup Train [20][810/3239]	Time 0.460 (0.525)	Data 0.001 (0.019)	Loss 4.7066 (4.5286)	Top-1 acc 20.312 (21.191)	Top-5 acc 37.109 (42.435)	lr 0.02647
Warmup Train [20][820/3239]	Time 0.507 (0.524)	Data 0.001 (0.019)	Loss 4.5908 (4.5294)	Top-1 acc 21.484 (21.180)	Top-5 acc 38.672 (42.413)	lr 0.02647
Warmup Train [20][830/3239]	Time 0.528 (0.524)	Data 0.001 (0.019)	Loss 4.4090 (4.5293)	Top-1 acc 23.438 (21.199)	Top-5 acc 45.312 (42.416)	lr 0.02646
Warmup Train [20][840/3239]	Time 0.557 (0.524)	Data 0.001 (0.019)	Loss 4.5250 (4.5292)	Top-1 acc 22.266 (21.195)	Top-5 acc 45.312 (42.422)	lr 0.02645
Warmup Train [20][850/3239]	Time 0.344 (0.524)	Data 0.001 (0.019)	Loss 4.6042 (4.5293)	Top-1 acc 19.141 (21.190)	Top-5 acc 39.062 (42.414)	lr 0.02645
Warmup Train [20][860/3239]	Time 0.669 (0.524)	Data 0.002 (0.019)	Loss 4.3858 (4.5299)	Top-1 acc 20.703 (21.178)	Top-5 acc 46.484 (42.396)	lr 0.02644
Warmup Train [20][870/3239]	Time 0.401 (0.524)	Data 0.001 (0.018)	Loss 4.4970 (4.5302)	Top-1 acc 22.266 (21.174)	Top-5 acc 42.969 (42.384)	lr 0.02644
Warmup Train [20][880/3239]	Time 0.388 (0.523)	Data 0.001 (0.018)	Loss 4.4895 (4.5306)	Top-1 acc 23.047 (21.176)	Top-5 acc 45.703 (42.383)	lr 0.02643
Warmup Train [20][890/3239]	Time 0.353 (0.523)	Data 0.001 (0.018)	Loss 4.7383 (4.5306)	Top-1 acc 17.969 (21.185)	Top-5 acc 37.891 (42.382)	lr 0.02642
Warmup Train [20][900/3239]	Time 0.468 (0.523)	Data 0.001 (0.018)	Loss 4.7246 (4.5303)	Top-1 acc 17.578 (21.180)	Top-5 acc 40.234 (42.396)	lr 0.02642
Warmup Train [20][910/3239]	Time 0.584 (0.523)	Data 0.001 (0.018)	Loss 4.3037 (4.5303)	Top-1 acc 26.953 (21.192)	Top-5 acc 51.562 (42.398)	lr 0.02641
Warmup Train [20][920/3239]	Time 0.513 (0.523)	Data 0.001 (0.018)	Loss 4.5162 (4.5302)	Top-1 acc 22.656 (21.199)	Top-5 acc 42.578 (42.411)	lr 0.02641
Warmup Train [20][930/3239]	Time 0.640 (0.523)	Data 0.001 (0.018)	Loss 4.4344 (4.5300)	Top-1 acc 23.828 (21.204)	Top-5 acc 45.312 (42.430)	lr 0.02640
Warmup Train [20][940/3239]	Time 0.419 (0.523)	Data 0.001 (0.018)	Loss 4.5505 (4.5305)	Top-1 acc 18.750 (21.195)	Top-5 acc 44.531 (42.412)	lr 0.02639
Warmup Train [20][950/3239]	Time 0.639 (0.523)	Data 0.002 (0.017)	Loss 4.4100 (4.5303)	Top-1 acc 24.609 (21.204)	Top-5 acc 45.312 (42.415)	lr 0.02639
Warmup Train [20][960/3239]	Time 0.414 (0.523)	Data 0.001 (0.017)	Loss 4.4713 (4.5302)	Top-1 acc 21.875 (21.201)	Top-5 acc 42.188 (42.424)	lr 0.02638
Warmup Train [20][970/3239]	Time 0.439 (0.523)	Data 0.001 (0.017)	Loss 4.4318 (4.5303)	Top-1 acc 22.656 (21.196)	Top-5 acc 43.750 (42.423)	lr 0.02637
Warmup Train [20][980/3239]	Time 0.603 (0.523)	Data 0.001 (0.017)	Loss 4.6185 (4.5305)	Top-1 acc 15.234 (21.190)	Top-5 acc 42.969 (42.430)	lr 0.02637
Warmup Train [20][990/3239]	Time 0.522 (0.522)	Data 0.001 (0.017)	Loss 4.4646 (4.5302)	Top-1 acc 19.922 (21.193)	Top-5 acc 43.359 (42.439)	lr 0.02636
Warmup Train [20][1000/3239]	Time 0.395 (0.522)	Data 0.001 (0.017)	Loss 4.4455 (4.5296)	Top-1 acc 23.438 (21.198)	Top-5 acc 44.922 (42.458)	lr 0.02636
Warmup Train [20][1010/3239]	Time 0.635 (0.522)	Data 0.002 (0.017)	Loss 4.4635 (4.5293)	Top-1 acc 23.047 (21.211)	Top-5 acc 42.188 (42.467)	lr 0.02635
Warmup Train [20][1020/3239]	Time 0.512 (0.522)	Data 0.001 (0.017)	Loss 4.5692 (4.5291)	Top-1 acc 23.047 (21.210)	Top-5 acc 43.359 (42.471)	lr 0.02634
Warmup Train [20][1030/3239]	Time 0.376 (0.522)	Data 0.001 (0.017)	Loss 4.4203 (4.5298)	Top-1 acc 21.484 (21.207)	Top-5 acc 43.750 (42.450)	lr 0.02634
Warmup Train [20][1040/3239]	Time 0.539 (0.521)	Data 0.001 (0.017)	Loss 4.4470 (4.5289)	Top-1 acc 21.875 (21.213)	Top-5 acc 48.047 (42.466)	lr 0.02633
Warmup Train [20][1050/3239]	Time 0.360 (0.521)	Data 0.001 (0.017)	Loss 4.3505 (4.5292)	Top-1 acc 25.781 (21.203)	Top-5 acc 46.484 (42.453)	lr 0.02633
Warmup Train [20][1060/3239]	Time 0.663 (0.521)	Data 0.002 (0.017)	Loss 4.6667 (4.5285)	Top-1 acc 21.484 (21.212)	Top-5 acc 41.406 (42.481)	lr 0.02632
Warmup Train [20][1070/3239]	Time 0.712 (0.521)	Data 0.001 (0.017)	Loss 4.4225 (4.5283)	Top-1 acc 21.875 (21.219)	Top-5 acc 42.188 (42.484)	lr 0.02631
Warmup Train [20][1080/3239]	Time 0.337 (0.521)	Data 0.001 (0.016)	Loss 4.5768 (4.5281)	Top-1 acc 17.578 (21.207)	Top-5 acc 37.891 (42.486)	lr 0.02631
Warmup Train [20][1090/3239]	Time 0.662 (0.521)	Data 0.001 (0.016)	Loss 4.5220 (4.5280)	Top-1 acc 23.047 (21.212)	Top-5 acc 44.141 (42.499)	lr 0.02630
Warmup Train [20][1100/3239]	Time 0.536 (0.520)	Data 0.001 (0.016)	Loss 4.2713 (4.5278)	Top-1 acc 25.781 (21.219)	Top-5 acc 44.531 (42.504)	lr 0.02630
Warmup Train [20][1110/3239]	Time 0.636 (0.520)	Data 0.001 (0.016)	Loss 4.4363 (4.5279)	Top-1 acc 21.875 (21.223)	Top-5 acc 44.141 (42.504)	lr 0.02629
Warmup Train [20][1120/3239]	Time 0.563 (0.520)	Data 0.001 (0.016)	Loss 4.7672 (4.5271)	Top-1 acc 19.141 (21.240)	Top-5 acc 35.938 (42.521)	lr 0.02628
Warmup Train [20][1130/3239]	Time 0.534 (0.520)	Data 0.001 (0.016)	Loss 4.6101 (4.5273)	Top-1 acc 19.531 (21.247)	Top-5 acc 41.797 (42.528)	lr 0.02628
Warmup Train [20][1140/3239]	Time 0.361 (0.520)	Data 0.002 (0.016)	Loss 4.5666 (4.5274)	Top-1 acc 19.922 (21.244)	Top-5 acc 41.016 (42.538)	lr 0.02627
Warmup Train [20][1150/3239]	Time 0.314 (0.520)	Data 0.001 (0.016)	Loss 4.4486 (4.5273)	Top-1 acc 19.922 (21.236)	Top-5 acc 44.141 (42.541)	lr 0.02627
Warmup Train [20][1160/3239]	Time 0.545 (0.520)	Data 0.001 (0.016)	Loss 4.5149 (4.5270)	Top-1 acc 22.656 (21.239)	Top-5 acc 43.750 (42.549)	lr 0.02626
Warmup Train [20][1170/3239]	Time 0.376 (0.520)	Data 0.001 (0.016)	Loss 4.5777 (4.5276)	Top-1 acc 19.922 (21.230)	Top-5 acc 41.406 (42.537)	lr 0.02625
Warmup Train [20][1180/3239]	Time 0.495 (0.520)	Data 0.001 (0.016)	Loss 4.5806 (4.5275)	Top-1 acc 20.703 (21.224)	Top-5 acc 38.672 (42.541)	lr 0.02625
Warmup Train [20][1190/3239]	Time 0.455 (0.520)	Data 0.001 (0.016)	Loss 4.4420 (4.5273)	Top-1 acc 22.656 (21.230)	Top-5 acc 41.406 (42.545)	lr 0.02624
Warmup Train [20][1200/3239]	Time 0.437 (0.520)	Data 0.001 (0.016)	Loss 4.3261 (4.5269)	Top-1 acc 25.781 (21.246)	Top-5 acc 46.484 (42.557)	lr 0.02624
Warmup Train [20][1210/3239]	Time 0.458 (0.521)	Data 0.001 (0.016)	Loss 4.4932 (4.5265)	Top-1 acc 18.359 (21.252)	Top-5 acc 43.750 (42.571)	lr 0.02623
Warmup Train [20][1220/3239]	Time 0.504 (0.520)	Data 0.001 (0.016)	Loss 4.4374 (4.5266)	Top-1 acc 21.094 (21.250)	Top-5 acc 46.094 (42.569)	lr 0.02622
Warmup Train [20][1230/3239]	Time 0.492 (0.520)	Data 0.001 (0.015)	Loss 4.6513 (4.5264)	Top-1 acc 20.703 (21.257)	Top-5 acc 40.625 (42.573)	lr 0.02622
Warmup Train [20][1240/3239]	Time 0.485 (0.520)	Data 0.001 (0.015)	Loss 4.5097 (4.5258)	Top-1 acc 21.484 (21.267)	Top-5 acc 39.062 (42.586)	lr 0.02621
Warmup Train [20][1250/3239]	Time 0.390 (0.520)	Data 0.001 (0.015)	Loss 4.4346 (4.5262)	Top-1 acc 20.703 (21.260)	Top-5 acc 43.359 (42.575)	lr 0.02621
Warmup Train [20][1260/3239]	Time 0.484 (0.520)	Data 0.001 (0.015)	Loss 4.4435 (4.5260)	Top-1 acc 24.219 (21.268)	Top-5 acc 45.312 (42.581)	lr 0.02620
Warmup Train [20][1270/3239]	Time 0.489 (0.520)	Data 0.001 (0.015)	Loss 4.5343 (4.5260)	Top-1 acc 23.828 (21.265)	Top-5 acc 46.094 (42.585)	lr 0.02619
Warmup Train [20][1280/3239]	Time 0.360 (0.520)	Data 0.001 (0.015)	Loss 4.5914 (4.5255)	Top-1 acc 21.484 (21.276)	Top-5 acc 42.969 (42.599)	lr 0.02619
Warmup Train [20][1290/3239]	Time 0.504 (0.520)	Data 0.001 (0.015)	Loss 4.6437 (4.5255)	Top-1 acc 17.578 (21.279)	Top-5 acc 36.719 (42.601)	lr 0.02618
Warmup Train [20][1300/3239]	Time 0.516 (0.520)	Data 0.001 (0.015)	Loss 4.5842 (4.5257)	Top-1 acc 21.484 (21.281)	Top-5 acc 39.453 (42.592)	lr 0.02618
Warmup Train [20][1310/3239]	Time 0.614 (0.520)	Data 0.001 (0.015)	Loss 4.7712 (4.5256)	Top-1 acc 16.406 (21.278)	Top-5 acc 39.453 (42.591)	lr 0.02617
Warmup Train [20][1320/3239]	Time 0.486 (0.519)	Data 0.001 (0.015)	Loss 4.5037 (4.5254)	Top-1 acc 20.703 (21.272)	Top-5 acc 42.188 (42.597)	lr 0.02616
Warmup Train [20][1330/3239]	Time 0.375 (0.519)	Data 0.001 (0.015)	Loss 4.5556 (4.5251)	Top-1 acc 20.312 (21.280)	Top-5 acc 42.969 (42.604)	lr 0.02616
Warmup Train [20][1340/3239]	Time 0.560 (0.519)	Data 0.001 (0.015)	Loss 4.4867 (4.5248)	Top-1 acc 19.922 (21.291)	Top-5 acc 42.578 (42.614)	lr 0.02615
Warmup Train [20][1350/3239]	Time 0.516 (0.519)	Data 0.001 (0.015)	Loss 4.6138 (4.5256)	Top-1 acc 19.922 (21.279)	Top-5 acc 39.453 (42.597)	lr 0.02614
Warmup Train [20][1360/3239]	Time 0.585 (0.519)	Data 0.001 (0.015)	Loss 4.6506 (4.5258)	Top-1 acc 19.531 (21.276)	Top-5 acc 39.062 (42.590)	lr 0.02614
Warmup Train [20][1370/3239]	Time 0.506 (0.519)	Data 0.001 (0.015)	Loss 4.6318 (4.5256)	Top-1 acc 20.312 (21.286)	Top-5 acc 39.453 (42.597)	lr 0.02613
Warmup Train [20][1380/3239]	Time 0.559 (0.519)	Data 0.001 (0.015)	Loss 4.4692 (4.5257)	Top-1 acc 21.484 (21.286)	Top-5 acc 42.969 (42.593)	lr 0.02613
Warmup Train [20][1390/3239]	Time 0.335 (0.519)	Data 0.001 (0.015)	Loss 4.7052 (4.5256)	Top-1 acc 17.578 (21.281)	Top-5 acc 39.844 (42.593)	lr 0.02612
Warmup Train [20][1400/3239]	Time 0.354 (0.519)	Data 0.001 (0.015)	Loss 4.3640 (4.5256)	Top-1 acc 27.344 (21.289)	Top-5 acc 43.359 (42.598)	lr 0.02611
Warmup Train [20][1410/3239]	Time 0.551 (0.519)	Data 0.001 (0.015)	Loss 4.3376 (4.5254)	Top-1 acc 24.609 (21.292)	Top-5 acc 49.609 (42.606)	lr 0.02611
Warmup Train [20][1420/3239]	Time 0.501 (0.519)	Data 0.001 (0.014)	Loss 4.3678 (4.5251)	Top-1 acc 21.484 (21.295)	Top-5 acc 44.531 (42.623)	lr 0.02610
Warmup Train [20][1430/3239]	Time 0.611 (0.519)	Data 0.001 (0.014)	Loss 4.4982 (4.5248)	Top-1 acc 26.953 (21.304)	Top-5 acc 42.578 (42.634)	lr 0.02610
Warmup Train [20][1440/3239]	Time 0.594 (0.519)	Data 0.001 (0.014)	Loss 4.6240 (4.5250)	Top-1 acc 18.359 (21.296)	Top-5 acc 39.453 (42.625)	lr 0.02609
Warmup Train [20][1450/3239]	Time 0.502 (0.519)	Data 0.001 (0.014)	Loss 4.5586 (4.5244)	Top-1 acc 20.312 (21.312)	Top-5 acc 42.188 (42.636)	lr 0.02608
Warmup Train [20][1460/3239]	Time 0.364 (0.519)	Data 0.001 (0.014)	Loss 4.6163 (4.5248)	Top-1 acc 20.312 (21.301)	Top-5 acc 43.750 (42.627)	lr 0.02608
Warmup Train [20][1470/3239]	Time 0.589 (0.519)	Data 0.001 (0.014)	Loss 4.5398 (4.5249)	Top-1 acc 21.094 (21.297)	Top-5 acc 40.625 (42.618)	lr 0.02607
Warmup Train [20][1480/3239]	Time 0.567 (0.519)	Data 0.001 (0.014)	Loss 4.7218 (4.5250)	Top-1 acc 16.406 (21.297)	Top-5 acc 39.844 (42.623)	lr 0.02607
Warmup Train [20][1490/3239]	Time 0.393 (0.518)	Data 0.001 (0.014)	Loss 4.5352 (4.5251)	Top-1 acc 23.438 (21.303)	Top-5 acc 39.062 (42.616)	lr 0.02606
Warmup Train [20][1500/3239]	Time 0.413 (0.518)	Data 0.001 (0.014)	Loss 4.4920 (4.5254)	Top-1 acc 21.875 (21.300)	Top-5 acc 44.141 (42.614)	lr 0.02605
Warmup Train [20][1510/3239]	Time 0.444 (0.518)	Data 0.001 (0.014)	Loss 4.4730 (4.5250)	Top-1 acc 25.000 (21.304)	Top-5 acc 44.922 (42.630)	lr 0.02605
Warmup Train [20][1520/3239]	Time 0.357 (0.519)	Data 0.001 (0.014)	Loss 4.5737 (4.5248)	Top-1 acc 19.922 (21.300)	Top-5 acc 40.234 (42.633)	lr 0.02604
Warmup Train [20][1530/3239]	Time 0.518 (0.519)	Data 0.001 (0.014)	Loss 4.4665 (4.5248)	Top-1 acc 19.922 (21.294)	Top-5 acc 39.062 (42.632)	lr 0.02604
Warmup Train [20][1540/3239]	Time 0.637 (0.519)	Data 0.001 (0.014)	Loss 4.4573 (4.5242)	Top-1 acc 23.047 (21.298)	Top-5 acc 44.141 (42.638)	lr 0.02603
Warmup Train [20][1550/3239]	Time 0.531 (0.519)	Data 0.001 (0.014)	Loss 4.4108 (4.5239)	Top-1 acc 22.266 (21.295)	Top-5 acc 44.922 (42.646)	lr 0.02602
Warmup Train [20][1560/3239]	Time 0.627 (0.519)	Data 0.001 (0.014)	Loss 4.4983 (4.5238)	Top-1 acc 22.656 (21.295)	Top-5 acc 44.922 (42.649)	lr 0.02602
Warmup Train [20][1570/3239]	Time 0.581 (0.518)	Data 0.001 (0.014)	Loss 4.5025 (4.5235)	Top-1 acc 21.875 (21.304)	Top-5 acc 40.625 (42.655)	lr 0.02601
Warmup Train [20][1580/3239]	Time 0.507 (0.518)	Data 0.001 (0.014)	Loss 4.5368 (4.5235)	Top-1 acc 21.094 (21.306)	Top-5 acc 40.625 (42.658)	lr 0.02601
Warmup Train [20][1590/3239]	Time 0.481 (0.518)	Data 0.001 (0.014)	Loss 4.5091 (4.5238)	Top-1 acc 21.484 (21.310)	Top-5 acc 40.625 (42.653)	lr 0.02600
Warmup Train [20][1600/3239]	Time 0.513 (0.518)	Data 0.001 (0.014)	Loss 4.6412 (4.5235)	Top-1 acc 18.359 (21.314)	Top-5 acc 35.938 (42.660)	lr 0.02599
Warmup Train [20][1610/3239]	Time 0.529 (0.517)	Data 0.001 (0.013)	Loss 4.4557 (4.5235)	Top-1 acc 24.609 (21.316)	Top-5 acc 46.094 (42.665)	lr 0.02599
Warmup Train [20][1620/3239]	Time 0.551 (0.517)	Data 0.001 (0.013)	Loss 4.4523 (4.5235)	Top-1 acc 21.875 (21.322)	Top-5 acc 46.094 (42.659)	lr 0.02598
Warmup Train [20][1630/3239]	Time 0.479 (0.517)	Data 0.002 (0.013)	Loss 4.5196 (4.5234)	Top-1 acc 21.094 (21.317)	Top-5 acc 39.062 (42.657)	lr 0.02598
Warmup Train [20][1640/3239]	Time 0.676 (0.517)	Data 0.001 (0.013)	Loss 4.5607 (4.5233)	Top-1 acc 20.703 (21.320)	Top-5 acc 42.578 (42.658)	lr 0.02597
Warmup Train [20][1650/3239]	Time 0.532 (0.517)	Data 0.001 (0.013)	Loss 4.7010 (4.5234)	Top-1 acc 19.141 (21.312)	Top-5 acc 37.109 (42.653)	lr 0.02596
Warmup Train [20][1660/3239]	Time 0.497 (0.517)	Data 0.001 (0.013)	Loss 4.6551 (4.5235)	Top-1 acc 18.359 (21.312)	Top-5 acc 38.281 (42.652)	lr 0.02596
Warmup Train [20][1670/3239]	Time 0.321 (0.517)	Data 0.001 (0.013)	Loss 4.7357 (4.5234)	Top-1 acc 17.969 (21.322)	Top-5 acc 39.844 (42.656)	lr 0.02595
Warmup Train [20][1680/3239]	Time 0.403 (0.517)	Data 0.001 (0.013)	Loss 4.2819 (4.5232)	Top-1 acc 24.219 (21.326)	Top-5 acc 48.828 (42.660)	lr 0.02595
Warmup Train [20][1690/3239]	Time 0.537 (0.517)	Data 0.001 (0.013)	Loss 4.4782 (4.5231)	Top-1 acc 22.656 (21.332)	Top-5 acc 44.141 (42.662)	lr 0.02594
Warmup Train [20][1700/3239]	Time 0.656 (0.517)	Data 0.001 (0.013)	Loss 4.4963 (4.5232)	Top-1 acc 21.484 (21.332)	Top-5 acc 43.750 (42.656)	lr 0.02593
Warmup Train [20][1710/3239]	Time 0.518 (0.517)	Data 0.002 (0.013)	Loss 4.6025 (4.5231)	Top-1 acc 18.359 (21.340)	Top-5 acc 39.062 (42.660)	lr 0.02593
Warmup Train [20][1720/3239]	Time 0.521 (0.517)	Data 0.001 (0.013)	Loss 4.4299 (4.5230)	Top-1 acc 17.578 (21.338)	Top-5 acc 42.578 (42.661)	lr 0.02592
Warmup Train [20][1730/3239]	Time 0.438 (0.517)	Data 0.001 (0.013)	Loss 4.3841 (4.5229)	Top-1 acc 25.391 (21.344)	Top-5 acc 47.266 (42.664)	lr 0.02591
Warmup Train [20][1740/3239]	Time 0.365 (0.517)	Data 0.002 (0.013)	Loss 4.6067 (4.5232)	Top-1 acc 21.484 (21.346)	Top-5 acc 39.844 (42.657)	lr 0.02591
Warmup Train [20][1750/3239]	Time 0.381 (0.517)	Data 0.001 (0.013)	Loss 4.5157 (4.5228)	Top-1 acc 21.484 (21.351)	Top-5 acc 45.312 (42.669)	lr 0.02590
Warmup Train [20][1760/3239]	Time 0.669 (0.517)	Data 0.001 (0.013)	Loss 4.5318 (4.5227)	Top-1 acc 18.359 (21.348)	Top-5 acc 40.625 (42.673)	lr 0.02590
Warmup Train [20][1770/3239]	Time 0.742 (0.517)	Data 0.001 (0.013)	Loss 4.3461 (4.5225)	Top-1 acc 22.656 (21.353)	Top-5 acc 49.219 (42.682)	lr 0.02589
Warmup Train [20][1780/3239]	Time 0.364 (0.517)	Data 0.001 (0.013)	Loss 4.5499 (4.5223)	Top-1 acc 21.094 (21.357)	Top-5 acc 42.188 (42.683)	lr 0.02588
Warmup Train [20][1790/3239]	Time 0.450 (0.517)	Data 0.001 (0.013)	Loss 4.4537 (4.5223)	Top-1 acc 21.094 (21.360)	Top-5 acc 43.750 (42.688)	lr 0.02588
Warmup Train [20][1800/3239]	Time 0.450 (0.517)	Data 0.001 (0.013)	Loss 4.5124 (4.5224)	Top-1 acc 20.703 (21.357)	Top-5 acc 41.797 (42.680)	lr 0.02587
Warmup Train [20][1810/3239]	Time 0.647 (0.517)	Data 0.001 (0.013)	Loss 4.6279 (4.5220)	Top-1 acc 20.312 (21.363)	Top-5 acc 38.281 (42.683)	lr 0.02587
Warmup Train [20][1820/3239]	Time 0.512 (0.517)	Data 0.001 (0.013)	Loss 4.3763 (4.5220)	Top-1 acc 22.266 (21.359)	Top-5 acc 48.047 (42.689)	lr 0.02586
Warmup Train [20][1830/3239]	Time 0.484 (0.517)	Data 0.002 (0.012)	Loss 4.5840 (4.5221)	Top-1 acc 17.969 (21.352)	Top-5 acc 41.016 (42.683)	lr 0.02585
Warmup Train [20][1840/3239]	Time 0.283 (0.516)	Data 0.001 (0.012)	Loss 4.3235 (4.5220)	Top-1 acc 24.219 (21.349)	Top-5 acc 46.094 (42.685)	lr 0.02585
Warmup Train [20][1850/3239]	Time 0.342 (0.516)	Data 0.001 (0.012)	Loss 4.4807 (4.5218)	Top-1 acc 20.703 (21.351)	Top-5 acc 42.969 (42.686)	lr 0.02584
Warmup Train [20][1860/3239]	Time 0.357 (0.516)	Data 0.001 (0.012)	Loss 4.6053 (4.5218)	Top-1 acc 22.656 (21.355)	Top-5 acc 39.062 (42.685)	lr 0.02584
Warmup Train [20][1870/3239]	Time 0.485 (0.516)	Data 0.001 (0.013)	Loss 4.7678 (4.5220)	Top-1 acc 18.359 (21.351)	Top-5 acc 36.719 (42.684)	lr 0.02583
Warmup Train [20][1880/3239]	Time 0.503 (0.516)	Data 0.001 (0.012)	Loss 4.3426 (4.5217)	Top-1 acc 23.828 (21.357)	Top-5 acc 48.047 (42.690)	lr 0.02582
Warmup Train [20][1890/3239]	Time 0.483 (0.516)	Data 0.001 (0.012)	Loss 4.4522 (4.5217)	Top-1 acc 20.312 (21.357)	Top-5 acc 43.359 (42.685)	lr 0.02582
Warmup Train [20][1900/3239]	Time 0.439 (0.516)	Data 0.001 (0.012)	Loss 4.4404 (4.5214)	Top-1 acc 20.703 (21.356)	Top-5 acc 43.750 (42.685)	lr 0.02581
Warmup Train [20][1910/3239]	Time 0.644 (0.516)	Data 0.001 (0.012)	Loss 4.3306 (4.5216)	Top-1 acc 25.781 (21.347)	Top-5 acc 47.656 (42.680)	lr 0.02581
Warmup Train [20][1920/3239]	Time 0.441 (0.516)	Data 0.001 (0.012)	Loss 4.6220 (4.5216)	Top-1 acc 19.141 (21.355)	Top-5 acc 39.453 (42.685)	lr 0.02580
Warmup Train [20][1930/3239]	Time 0.487 (0.516)	Data 0.001 (0.012)	Loss 4.4782 (4.5213)	Top-1 acc 21.875 (21.360)	Top-5 acc 42.969 (42.692)	lr 0.02579
Warmup Train [20][1940/3239]	Time 0.681 (0.516)	Data 0.001 (0.012)	Loss 4.4198 (4.5212)	Top-1 acc 24.219 (21.363)	Top-5 acc 45.703 (42.695)	lr 0.02579
Warmup Train [20][1950/3239]	Time 0.489 (0.516)	Data 0.002 (0.012)	Loss 4.7572 (4.5212)	Top-1 acc 18.359 (21.361)	Top-5 acc 36.719 (42.692)	lr 0.02578
Warmup Train [20][1960/3239]	Time 0.578 (0.516)	Data 0.001 (0.012)	Loss 4.6860 (4.5213)	Top-1 acc 19.531 (21.361)	Top-5 acc 42.188 (42.688)	lr 0.02578
Warmup Train [20][1970/3239]	Time 0.550 (0.516)	Data 0.001 (0.012)	Loss 4.5522 (4.5212)	Top-1 acc 22.266 (21.360)	Top-5 acc 41.406 (42.686)	lr 0.02577
Warmup Train [20][1980/3239]	Time 0.517 (0.516)	Data 0.001 (0.012)	Loss 4.4335 (4.5214)	Top-1 acc 25.000 (21.363)	Top-5 acc 44.141 (42.684)	lr 0.02576
Warmup Train [20][1990/3239]	Time 0.602 (0.516)	Data 0.001 (0.012)	Loss 4.7248 (4.5214)	Top-1 acc 19.531 (21.369)	Top-5 acc 38.281 (42.690)	lr 0.02576
Warmup Train [20][2000/3239]	Time 0.575 (0.516)	Data 0.001 (0.012)	Loss 4.6960 (4.5215)	Top-1 acc 19.141 (21.371)	Top-5 acc 39.453 (42.686)	lr 0.02575
Warmup Train [20][2010/3239]	Time 0.671 (0.516)	Data 0.001 (0.012)	Loss 4.5526 (4.5216)	Top-1 acc 22.266 (21.375)	Top-5 acc 43.359 (42.685)	lr 0.02575
Warmup Train [20][2020/3239]	Time 0.562 (0.516)	Data 0.001 (0.012)	Loss 4.8324 (4.5214)	Top-1 acc 18.750 (21.382)	Top-5 acc 36.328 (42.692)	lr 0.02574
Warmup Train [20][2030/3239]	Time 0.552 (0.516)	Data 0.001 (0.012)	Loss 4.5472 (4.5210)	Top-1 acc 22.266 (21.382)	Top-5 acc 41.406 (42.698)	lr 0.02573
Warmup Train [20][2040/3239]	Time 0.577 (0.516)	Data 0.001 (0.012)	Loss 4.5690 (4.5208)	Top-1 acc 21.484 (21.383)	Top-5 acc 44.141 (42.704)	lr 0.02573
Warmup Train [20][2050/3239]	Time 0.428 (0.516)	Data 0.001 (0.012)	Loss 4.5115 (4.5207)	Top-1 acc 18.359 (21.382)	Top-5 acc 39.844 (42.709)	lr 0.02572
Warmup Train [20][2060/3239]	Time 0.555 (0.516)	Data 0.001 (0.012)	Loss 4.2418 (4.5204)	Top-1 acc 25.781 (21.391)	Top-5 acc 47.656 (42.713)	lr 0.02572
Warmup Train [20][2070/3239]	Time 0.520 (0.516)	Data 0.001 (0.012)	Loss 4.4314 (4.5202)	Top-1 acc 24.219 (21.393)	Top-5 acc 44.531 (42.717)	lr 0.02571
Warmup Train [20][2080/3239]	Time 0.571 (0.516)	Data 0.001 (0.012)	Loss 4.5127 (4.5204)	Top-1 acc 19.141 (21.392)	Top-5 acc 41.406 (42.718)	lr 0.02570
Warmup Train [20][2090/3239]	Time 0.558 (0.516)	Data 0.001 (0.012)	Loss 4.5436 (4.5203)	Top-1 acc 20.703 (21.394)	Top-5 acc 42.188 (42.717)	lr 0.02570
Warmup Train [20][2100/3239]	Time 0.725 (0.516)	Data 0.001 (0.012)	Loss 4.3965 (4.5202)	Top-1 acc 25.000 (21.396)	Top-5 acc 43.750 (42.721)	lr 0.02569
Warmup Train [20][2110/3239]	Time 0.428 (0.516)	Data 0.001 (0.012)	Loss 4.5379 (4.5204)	Top-1 acc 18.750 (21.391)	Top-5 acc 44.141 (42.714)	lr 0.02568
Warmup Train [20][2120/3239]	Time 0.517 (0.516)	Data 0.001 (0.012)	Loss 4.4563 (4.5202)	Top-1 acc 20.312 (21.393)	Top-5 acc 41.016 (42.714)	lr 0.02568
Warmup Train [20][2130/3239]	Time 0.567 (0.516)	Data 0.001 (0.012)	Loss 4.3377 (4.5201)	Top-1 acc 25.000 (21.389)	Top-5 acc 46.875 (42.714)	lr 0.02567
Warmup Train [20][2140/3239]	Time 0.513 (0.516)	Data 0.001 (0.012)	Loss 4.3919 (4.5200)	Top-1 acc 25.781 (21.386)	Top-5 acc 43.750 (42.714)	lr 0.02567
Warmup Train [20][2150/3239]	Time 0.577 (0.516)	Data 0.001 (0.012)	Loss 4.7532 (4.5201)	Top-1 acc 15.234 (21.380)	Top-5 acc 39.844 (42.716)	lr 0.02566
Warmup Train [20][2160/3239]	Time 0.398 (0.515)	Data 0.001 (0.012)	Loss 4.4619 (4.5197)	Top-1 acc 22.266 (21.381)	Top-5 acc 42.578 (42.723)	lr 0.02565
Warmup Train [20][2170/3239]	Time 0.386 (0.515)	Data 0.001 (0.012)	Loss 4.5263 (4.5196)	Top-1 acc 21.484 (21.382)	Top-5 acc 40.625 (42.722)	lr 0.02565
Warmup Train [20][2180/3239]	Time 0.343 (0.515)	Data 0.001 (0.012)	Loss 4.6176 (4.5196)	Top-1 acc 19.141 (21.384)	Top-5 acc 41.406 (42.724)	lr 0.02564
Warmup Train [20][2190/3239]	Time 0.545 (0.515)	Data 0.002 (0.012)	Loss 4.4295 (4.5196)	Top-1 acc 24.219 (21.382)	Top-5 acc 42.578 (42.726)	lr 0.02564
Warmup Train [20][2200/3239]	Time 0.430 (0.515)	Data 0.001 (0.012)	Loss 4.5936 (4.5194)	Top-1 acc 19.141 (21.387)	Top-5 acc 37.109 (42.728)	lr 0.02563
Warmup Train [20][2210/3239]	Time 0.271 (0.515)	Data 0.001 (0.012)	Loss 4.6770 (4.5195)	Top-1 acc 21.875 (21.390)	Top-5 acc 38.281 (42.728)	lr 0.02562
Warmup Train [20][2220/3239]	Time 0.694 (0.515)	Data 0.001 (0.012)	Loss 4.5390 (4.5192)	Top-1 acc 21.484 (21.394)	Top-5 acc 42.969 (42.736)	lr 0.02562
Warmup Train [20][2230/3239]	Time 0.460 (0.515)	Data 0.001 (0.012)	Loss 4.5789 (4.5191)	Top-1 acc 18.359 (21.393)	Top-5 acc 40.625 (42.736)	lr 0.02561
Warmup Train [20][2240/3239]	Time 0.584 (0.515)	Data 0.001 (0.012)	Loss 4.4973 (4.5193)	Top-1 acc 21.484 (21.389)	Top-5 acc 43.750 (42.733)	lr 0.02561
Warmup Train [20][2250/3239]	Time 0.432 (0.515)	Data 0.001 (0.012)	Loss 4.6690 (4.5192)	Top-1 acc 22.266 (21.390)	Top-5 acc 37.891 (42.735)	lr 0.02560
Warmup Train [20][2260/3239]	Time 0.610 (0.515)	Data 0.001 (0.012)	Loss 4.5495 (4.5191)	Top-1 acc 19.141 (21.394)	Top-5 acc 44.531 (42.735)	lr 0.02559
Warmup Train [20][2270/3239]	Time 0.509 (0.515)	Data 0.001 (0.012)	Loss 4.4606 (4.5188)	Top-1 acc 21.875 (21.399)	Top-5 acc 42.969 (42.742)	lr 0.02559
Warmup Train [20][2280/3239]	Time 0.415 (0.515)	Data 0.001 (0.012)	Loss 4.6323 (4.5188)	Top-1 acc 19.141 (21.393)	Top-5 acc 39.844 (42.738)	lr 0.02558
Warmup Train [20][2290/3239]	Time 0.560 (0.515)	Data 0.001 (0.012)	Loss 4.5800 (4.5190)	Top-1 acc 18.359 (21.387)	Top-5 acc 41.016 (42.734)	lr 0.02558
Warmup Train [20][2300/3239]	Time 0.304 (0.515)	Data 0.001 (0.012)	Loss 4.5235 (4.5189)	Top-1 acc 21.094 (21.391)	Top-5 acc 43.750 (42.735)	lr 0.02557
Warmup Train [20][2310/3239]	Time 0.412 (0.515)	Data 0.001 (0.012)	Loss 4.6091 (4.5187)	Top-1 acc 21.875 (21.399)	Top-5 acc 42.578 (42.746)	lr 0.02556
Warmup Train [20][2320/3239]	Time 0.380 (0.515)	Data 0.001 (0.012)	Loss 4.6339 (4.5185)	Top-1 acc 19.531 (21.404)	Top-5 acc 41.406 (42.751)	lr 0.02556
Warmup Train [20][2330/3239]	Time 0.717 (0.515)	Data 0.001 (0.012)	Loss 4.3138 (4.5180)	Top-1 acc 26.953 (21.413)	Top-5 acc 48.828 (42.765)	lr 0.02555
Warmup Train [20][2340/3239]	Time 0.633 (0.515)	Data 0.001 (0.012)	Loss 4.4261 (4.5180)	Top-1 acc 25.781 (21.414)	Top-5 acc 42.969 (42.765)	lr 0.02555
Warmup Train [20][2350/3239]	Time 0.480 (0.515)	Data 0.001 (0.011)	Loss 4.5402 (4.5180)	Top-1 acc 22.266 (21.411)	Top-5 acc 39.453 (42.762)	lr 0.02554
Warmup Train [20][2360/3239]	Time 0.384 (0.515)	Data 0.001 (0.011)	Loss 4.5750 (4.5180)	Top-1 acc 23.047 (21.415)	Top-5 acc 44.141 (42.764)	lr 0.02553
Warmup Train [20][2370/3239]	Time 0.308 (0.515)	Data 0.001 (0.011)	Loss 4.4962 (4.5176)	Top-1 acc 21.094 (21.424)	Top-5 acc 45.312 (42.775)	lr 0.02553
Warmup Train [20][2380/3239]	Time 0.551 (0.515)	Data 0.001 (0.011)	Loss 4.4906 (4.5176)	Top-1 acc 17.969 (21.418)	Top-5 acc 42.578 (42.774)	lr 0.02552
Warmup Train [20][2390/3239]	Time 0.411 (0.515)	Data 0.001 (0.011)	Loss 4.5312 (4.5177)	Top-1 acc 21.484 (21.420)	Top-5 acc 41.406 (42.772)	lr 0.02552
Warmup Train [20][2400/3239]	Time 0.608 (0.515)	Data 0.001 (0.011)	Loss 4.3977 (4.5175)	Top-1 acc 25.000 (21.423)	Top-5 acc 44.531 (42.775)	lr 0.02551
Warmup Train [20][2410/3239]	Time 0.454 (0.515)	Data 0.001 (0.011)	Loss 4.4357 (4.5175)	Top-1 acc 21.875 (21.419)	Top-5 acc 43.750 (42.779)	lr 0.02550
Warmup Train [20][2420/3239]	Time 0.483 (0.515)	Data 0.001 (0.011)	Loss 4.6911 (4.5174)	Top-1 acc 19.141 (21.421)	Top-5 acc 38.281 (42.782)	lr 0.02550
Warmup Train [20][2430/3239]	Time 0.439 (0.515)	Data 0.001 (0.011)	Loss 4.5930 (4.5176)	Top-1 acc 19.922 (21.413)	Top-5 acc 43.750 (42.779)	lr 0.02549
Warmup Train [20][2440/3239]	Time 0.410 (0.515)	Data 0.001 (0.011)	Loss 4.4569 (4.5178)	Top-1 acc 21.484 (21.409)	Top-5 acc 41.016 (42.775)	lr 0.02548
Warmup Train [20][2450/3239]	Time 0.660 (0.515)	Data 0.001 (0.011)	Loss 4.4386 (4.5175)	Top-1 acc 22.266 (21.415)	Top-5 acc 48.047 (42.783)	lr 0.02548
Warmup Train [20][2460/3239]	Time 0.333 (0.514)	Data 0.001 (0.011)	Loss 4.7819 (4.5177)	Top-1 acc 15.234 (21.411)	Top-5 acc 33.594 (42.773)	lr 0.02547
Warmup Train [20][2470/3239]	Time 0.609 (0.514)	Data 0.001 (0.011)	Loss 4.7250 (4.5178)	Top-1 acc 19.531 (21.409)	Top-5 acc 39.062 (42.771)	lr 0.02547
Warmup Train [20][2480/3239]	Time 0.369 (0.514)	Data 0.001 (0.011)	Loss 4.3184 (4.5175)	Top-1 acc 21.875 (21.414)	Top-5 acc 44.531 (42.780)	lr 0.02546
Warmup Train [20][2490/3239]	Time 0.569 (0.514)	Data 0.001 (0.011)	Loss 4.5308 (4.5175)	Top-1 acc 16.797 (21.413)	Top-5 acc 41.016 (42.780)	lr 0.02545
Warmup Train [20][2500/3239]	Time 0.430 (0.514)	Data 0.001 (0.011)	Loss 4.5606 (4.5178)	Top-1 acc 20.312 (21.406)	Top-5 acc 41.797 (42.772)	lr 0.02545
Warmup Train [20][2510/3239]	Time 0.500 (0.514)	Data 0.001 (0.011)	Loss 4.6639 (4.5176)	Top-1 acc 19.922 (21.410)	Top-5 acc 41.016 (42.773)	lr 0.02544
Warmup Train [20][2520/3239]	Time 0.573 (0.514)	Data 0.001 (0.011)	Loss 4.6307 (4.5177)	Top-1 acc 22.266 (21.412)	Top-5 acc 39.062 (42.772)	lr 0.02544
Warmup Train [20][2530/3239]	Time 0.581 (0.514)	Data 0.001 (0.011)	Loss 4.5960 (4.5176)	Top-1 acc 18.750 (21.416)	Top-5 acc 38.672 (42.773)	lr 0.02543
Warmup Train [20][2540/3239]	Time 0.365 (0.514)	Data 0.002 (0.011)	Loss 4.5147 (4.5176)	Top-1 acc 21.484 (21.417)	Top-5 acc 41.016 (42.772)	lr 0.02542
Warmup Train [20][2550/3239]	Time 0.521 (0.514)	Data 0.001 (0.011)	Loss 4.4052 (4.5175)	Top-1 acc 25.391 (21.423)	Top-5 acc 45.312 (42.776)	lr 0.02542
Warmup Train [20][2560/3239]	Time 0.610 (0.515)	Data 0.001 (0.011)	Loss 4.5246 (4.5174)	Top-1 acc 17.578 (21.426)	Top-5 acc 41.406 (42.777)	lr 0.02541
Warmup Train [20][2570/3239]	Time 0.309 (0.515)	Data 0.001 (0.011)	Loss 4.5165 (4.5175)	Top-1 acc 25.391 (21.425)	Top-5 acc 43.359 (42.776)	lr 0.02541
Warmup Train [20][2580/3239]	Time 0.501 (0.515)	Data 0.001 (0.011)	Loss 4.5208 (4.5174)	Top-1 acc 21.875 (21.428)	Top-5 acc 46.484 (42.779)	lr 0.02540
Warmup Train [20][2590/3239]	Time 0.354 (0.515)	Data 0.001 (0.011)	Loss 4.6676 (4.5173)	Top-1 acc 19.922 (21.432)	Top-5 acc 42.188 (42.786)	lr 0.02539
Warmup Train [20][2600/3239]	Time 0.525 (0.515)	Data 0.001 (0.011)	Loss 4.5954 (4.5172)	Top-1 acc 20.312 (21.430)	Top-5 acc 42.188 (42.787)	lr 0.02539
Warmup Train [20][2610/3239]	Time 0.618 (0.515)	Data 0.001 (0.011)	Loss 4.5605 (4.5172)	Top-1 acc 20.312 (21.432)	Top-5 acc 44.531 (42.791)	lr 0.02538
Warmup Train [20][2620/3239]	Time 0.496 (0.515)	Data 0.001 (0.011)	Loss 4.4369 (4.5172)	Top-1 acc 23.438 (21.431)	Top-5 acc 44.531 (42.790)	lr 0.02538
Warmup Train [20][2630/3239]	Time 0.601 (0.515)	Data 0.001 (0.011)	Loss 4.6220 (4.5169)	Top-1 acc 16.406 (21.437)	Top-5 acc 39.453 (42.799)	lr 0.02537
Warmup Train [20][2640/3239]	Time 0.480 (0.515)	Data 0.001 (0.011)	Loss 4.3722 (4.5169)	Top-1 acc 26.562 (21.440)	Top-5 acc 46.484 (42.796)	lr 0.02536
Warmup Train [20][2650/3239]	Time 0.671 (0.515)	Data 0.002 (0.011)	Loss 4.3082 (4.5167)	Top-1 acc 24.219 (21.443)	Top-5 acc 47.656 (42.800)	lr 0.02536
Warmup Train [20][2660/3239]	Time 0.601 (0.515)	Data 0.001 (0.011)	Loss 4.6198 (4.5166)	Top-1 acc 16.016 (21.446)	Top-5 acc 38.672 (42.803)	lr 0.02535
Warmup Train [20][2670/3239]	Time 0.385 (0.515)	Data 0.001 (0.011)	Loss 4.4565 (4.5165)	Top-1 acc 21.875 (21.448)	Top-5 acc 42.578 (42.807)	lr 0.02535
Warmup Train [20][2680/3239]	Time 0.472 (0.514)	Data 0.001 (0.011)	Loss 4.5660 (4.5165)	Top-1 acc 17.969 (21.449)	Top-5 acc 44.531 (42.809)	lr 0.02534
Warmup Train [20][2690/3239]	Time 0.604 (0.515)	Data 0.001 (0.011)	Loss 4.5535 (4.5164)	Top-1 acc 19.141 (21.453)	Top-5 acc 43.750 (42.814)	lr 0.02533
Warmup Train [20][2700/3239]	Time 0.340 (0.514)	Data 0.001 (0.011)	Loss 4.4224 (4.5162)	Top-1 acc 24.219 (21.458)	Top-5 acc 46.484 (42.822)	lr 0.02533
Warmup Train [20][2710/3239]	Time 0.609 (0.514)	Data 0.001 (0.011)	Loss 4.4214 (4.5160)	Top-1 acc 23.047 (21.466)	Top-5 acc 44.531 (42.828)	lr 0.02532
Warmup Train [20][2720/3239]	Time 0.603 (0.514)	Data 0.001 (0.011)	Loss 4.4829 (4.5160)	Top-1 acc 22.266 (21.461)	Top-5 acc 41.016 (42.829)	lr 0.02532
Warmup Train [20][2730/3239]	Time 0.624 (0.514)	Data 0.001 (0.011)	Loss 4.2169 (4.5157)	Top-1 acc 25.781 (21.464)	Top-5 acc 48.828 (42.839)	lr 0.02531
Warmup Train [20][2740/3239]	Time 0.540 (0.514)	Data 0.001 (0.011)	Loss 4.5077 (4.5155)	Top-1 acc 19.531 (21.468)	Top-5 acc 43.359 (42.845)	lr 0.02530
Warmup Train [20][2750/3239]	Time 0.508 (0.514)	Data 0.001 (0.011)	Loss 4.4300 (4.5152)	Top-1 acc 23.828 (21.474)	Top-5 acc 44.141 (42.848)	lr 0.02530
Warmup Train [20][2760/3239]	Time 0.778 (0.514)	Data 0.001 (0.011)	Loss 4.4912 (4.5155)	Top-1 acc 23.438 (21.472)	Top-5 acc 45.703 (42.841)	lr 0.02529
Warmup Train [20][2770/3239]	Time 0.641 (0.514)	Data 0.001 (0.011)	Loss 4.3831 (4.5156)	Top-1 acc 23.828 (21.471)	Top-5 acc 46.875 (42.840)	lr 0.02528
Warmup Train [20][2780/3239]	Time 0.395 (0.514)	Data 0.001 (0.011)	Loss 4.4721 (4.5155)	Top-1 acc 23.828 (21.476)	Top-5 acc 45.312 (42.847)	lr 0.02528
Warmup Train [20][2790/3239]	Time 0.417 (0.514)	Data 0.001 (0.011)	Loss 4.5675 (4.5152)	Top-1 acc 20.312 (21.482)	Top-5 acc 44.141 (42.852)	lr 0.02527
Warmup Train [20][2800/3239]	Time 0.345 (0.514)	Data 0.001 (0.011)	Loss 4.5218 (4.5150)	Top-1 acc 21.875 (21.482)	Top-5 acc 40.625 (42.854)	lr 0.02527
Warmup Train [20][2810/3239]	Time 0.604 (0.514)	Data 0.001 (0.011)	Loss 4.7004 (4.5151)	Top-1 acc 16.797 (21.481)	Top-5 acc 40.234 (42.855)	lr 0.02526
Warmup Train [20][2820/3239]	Time 0.665 (0.514)	Data 0.001 (0.011)	Loss 4.2332 (4.5151)	Top-1 acc 27.344 (21.485)	Top-5 acc 51.953 (42.860)	lr 0.02525
Warmup Train [20][2830/3239]	Time 0.533 (0.514)	Data 0.001 (0.011)	Loss 4.6712 (4.5150)	Top-1 acc 19.922 (21.490)	Top-5 acc 37.109 (42.863)	lr 0.02525
Warmup Train [20][2840/3239]	Time 0.331 (0.514)	Data 0.001 (0.011)	Loss 4.4742 (4.5148)	Top-1 acc 23.047 (21.493)	Top-5 acc 42.188 (42.866)	lr 0.02524
Warmup Train [20][2850/3239]	Time 0.532 (0.514)	Data 0.001 (0.011)	Loss 4.3198 (4.5147)	Top-1 acc 26.172 (21.494)	Top-5 acc 49.609 (42.869)	lr 0.02524
Warmup Train [20][2860/3239]	Time 0.522 (0.514)	Data 0.001 (0.011)	Loss 4.4492 (4.5148)	Top-1 acc 25.000 (21.494)	Top-5 acc 44.531 (42.868)	lr 0.02523
Warmup Train [20][2870/3239]	Time 0.410 (0.514)	Data 0.001 (0.011)	Loss 4.6151 (4.5147)	Top-1 acc 19.922 (21.496)	Top-5 acc 39.844 (42.867)	lr 0.02522
Warmup Train [20][2880/3239]	Time 0.692 (0.514)	Data 0.001 (0.011)	Loss 4.4124 (4.5148)	Top-1 acc 22.656 (21.496)	Top-5 acc 47.656 (42.869)	lr 0.02522
Warmup Train [20][2890/3239]	Time 0.566 (0.514)	Data 0.001 (0.011)	Loss 4.4864 (4.5146)	Top-1 acc 21.875 (21.501)	Top-5 acc 42.188 (42.869)	lr 0.02521
Warmup Train [20][2900/3239]	Time 0.659 (0.514)	Data 0.001 (0.011)	Loss 4.4229 (4.5146)	Top-1 acc 26.172 (21.505)	Top-5 acc 45.703 (42.866)	lr 0.02521
Warmup Train [20][2910/3239]	Time 0.506 (0.514)	Data 0.001 (0.011)	Loss 4.5747 (4.5145)	Top-1 acc 20.703 (21.501)	Top-5 acc 41.406 (42.867)	lr 0.02520
Warmup Train [20][2920/3239]	Time 0.611 (0.514)	Data 0.001 (0.011)	Loss 4.5783 (4.5146)	Top-1 acc 21.484 (21.499)	Top-5 acc 44.531 (42.864)	lr 0.02519
Warmup Train [20][2930/3239]	Time 0.634 (0.514)	Data 0.001 (0.011)	Loss 4.3072 (4.5143)	Top-1 acc 27.734 (21.506)	Top-5 acc 50.781 (42.874)	lr 0.02519
Warmup Train [20][2940/3239]	Time 0.542 (0.514)	Data 0.001 (0.011)	Loss 4.6183 (4.5142)	Top-1 acc 20.312 (21.513)	Top-5 acc 40.234 (42.877)	lr 0.02518
Warmup Train [20][2950/3239]	Time 0.564 (0.514)	Data 0.002 (0.011)	Loss 4.3950 (4.5140)	Top-1 acc 21.875 (21.514)	Top-5 acc 45.703 (42.881)	lr 0.02518
Warmup Train [20][2960/3239]	Time 0.288 (0.514)	Data 0.001 (0.011)	Loss 4.6185 (4.5141)	Top-1 acc 17.578 (21.514)	Top-5 acc 36.328 (42.881)	lr 0.02517
Warmup Train [20][2970/3239]	Time 0.671 (0.514)	Data 0.001 (0.011)	Loss 4.5495 (4.5140)	Top-1 acc 19.141 (21.515)	Top-5 acc 42.188 (42.883)	lr 0.02516
Warmup Train [20][2980/3239]	Time 0.371 (0.514)	Data 0.001 (0.011)	Loss 4.2968 (4.5138)	Top-1 acc 25.000 (21.519)	Top-5 acc 47.656 (42.889)	lr 0.02516
Warmup Train [20][2990/3239]	Time 0.491 (0.514)	Data 0.001 (0.011)	Loss 4.5127 (4.5139)	Top-1 acc 25.000 (21.518)	Top-5 acc 43.750 (42.888)	lr 0.02515
Warmup Train [20][3000/3239]	Time 0.549 (0.514)	Data 0.001 (0.011)	Loss 4.5146 (4.5140)	Top-1 acc 25.000 (21.517)	Top-5 acc 44.922 (42.886)	lr 0.02515
Warmup Train [20][3010/3239]	Time 0.569 (0.514)	Data 0.001 (0.011)	Loss 4.6094 (4.5139)	Top-1 acc 20.703 (21.516)	Top-5 acc 37.891 (42.888)	lr 0.02514
Warmup Train [20][3020/3239]	Time 0.693 (0.514)	Data 0.001 (0.010)	Loss 4.3323 (4.5138)	Top-1 acc 23.438 (21.518)	Top-5 acc 46.484 (42.895)	lr 0.02513
Warmup Train [20][3030/3239]	Time 0.398 (0.514)	Data 0.001 (0.010)	Loss 4.5284 (4.5136)	Top-1 acc 22.266 (21.515)	Top-5 acc 41.406 (42.900)	lr 0.02513
Warmup Train [20][3040/3239]	Time 0.525 (0.514)	Data 0.001 (0.010)	Loss 4.5362 (4.5135)	Top-1 acc 17.578 (21.516)	Top-5 acc 44.141 (42.904)	lr 0.02512
Warmup Train [20][3050/3239]	Time 0.516 (0.514)	Data 0.001 (0.010)	Loss 4.6407 (4.5134)	Top-1 acc 20.312 (21.516)	Top-5 acc 39.453 (42.905)	lr 0.02512
Warmup Train [20][3060/3239]	Time 0.527 (0.514)	Data 0.001 (0.010)	Loss 4.4745 (4.5133)	Top-1 acc 21.484 (21.518)	Top-5 acc 46.484 (42.902)	lr 0.02511
Warmup Train [20][3070/3239]	Time 0.383 (0.514)	Data 0.001 (0.010)	Loss 4.5797 (4.5131)	Top-1 acc 22.656 (21.523)	Top-5 acc 43.750 (42.908)	lr 0.02510
Warmup Train [20][3080/3239]	Time 0.413 (0.514)	Data 0.001 (0.010)	Loss 4.5879 (4.5132)	Top-1 acc 21.875 (21.521)	Top-5 acc 41.406 (42.907)	lr 0.02510
Warmup Train [20][3090/3239]	Time 0.689 (0.514)	Data 0.001 (0.010)	Loss 4.4504 (4.5130)	Top-1 acc 27.344 (21.525)	Top-5 acc 44.531 (42.911)	lr 0.02509
Warmup Train [20][3100/3239]	Time 0.651 (0.514)	Data 0.001 (0.010)	Loss 4.6459 (4.5129)	Top-1 acc 20.312 (21.525)	Top-5 acc 38.281 (42.911)	lr 0.02508
Warmup Train [20][3110/3239]	Time 0.557 (0.514)	Data 0.001 (0.010)	Loss 4.5804 (4.5128)	Top-1 acc 23.828 (21.528)	Top-5 acc 42.188 (42.914)	lr 0.02508
Warmup Train [20][3120/3239]	Time 0.490 (0.514)	Data 0.001 (0.010)	Loss 4.5821 (4.5128)	Top-1 acc 20.312 (21.529)	Top-5 acc 42.969 (42.913)	lr 0.02507
Warmup Train [20][3130/3239]	Time 0.410 (0.514)	Data 0.001 (0.010)	Loss 4.4983 (4.5129)	Top-1 acc 26.172 (21.531)	Top-5 acc 47.266 (42.914)	lr 0.02507
Warmup Train [20][3140/3239]	Time 0.551 (0.514)	Data 0.001 (0.010)	Loss 4.3520 (4.5127)	Top-1 acc 26.562 (21.535)	Top-5 acc 46.875 (42.917)	lr 0.02506
Warmup Train [20][3150/3239]	Time 0.482 (0.514)	Data 0.001 (0.010)	Loss 4.6104 (4.5127)	Top-1 acc 19.141 (21.533)	Top-5 acc 39.062 (42.914)	lr 0.02505
Warmup Train [20][3160/3239]	Time 0.628 (0.514)	Data 0.001 (0.010)	Loss 4.4759 (4.5126)	Top-1 acc 21.094 (21.531)	Top-5 acc 42.578 (42.913)	lr 0.02505
Warmup Train [20][3170/3239]	Time 0.474 (0.514)	Data 0.001 (0.010)	Loss 4.6799 (4.5126)	Top-1 acc 18.359 (21.533)	Top-5 acc 42.578 (42.914)	lr 0.02504
Warmup Train [20][3180/3239]	Time 0.726 (0.514)	Data 0.000 (0.010)	Loss 4.6232 (4.5125)	Top-1 acc 22.266 (21.537)	Top-5 acc 38.672 (42.916)	lr 0.02504
Warmup Train [20][3190/3239]	Time 0.493 (0.514)	Data 0.000 (0.010)	Loss 4.3303 (4.5124)	Top-1 acc 23.047 (21.542)	Top-5 acc 46.484 (42.917)	lr 0.02503
Warmup Train [20][3200/3239]	Time 0.466 (0.514)	Data 0.000 (0.010)	Loss 4.5016 (4.5123)	Top-1 acc 20.703 (21.543)	Top-5 acc 42.969 (42.920)	lr 0.02502
Warmup Train [20][3210/3239]	Time 0.460 (0.513)	Data 0.000 (0.010)	Loss 4.2580 (4.5123)	Top-1 acc 24.609 (21.546)	Top-5 acc 52.734 (42.925)	lr 0.02502
Warmup Train [20][3220/3239]	Time 0.395 (0.513)	Data 0.000 (0.010)	Loss 4.4071 (4.5122)	Top-1 acc 25.000 (21.549)	Top-5 acc 45.703 (42.927)	lr 0.02501
Warmup Train [20][3230/3239]	Time 0.427 (0.513)	Data 0.000 (0.010)	Loss 4.2301 (4.5121)	Top-1 acc 26.172 (21.547)	Top-5 acc 48.828 (42.929)	lr 0.02501
Warmup Train [20][3239/3239]	Time 0.311 (0.513)	Data 0.000 (0.010)	Loss 4.2376 (4.5120)	Top-1 acc 32.099 (21.550)	Top-5 acc 50.617 (42.931)	lr 0.02500
==========Warmup Valid [20/40]	loss 3.518	top-1 acc 28.757	top-5 acc 52.748	Train top-1 21.550	top-5 42.931	flops: 442.4M
Warmup Train [21][0/3239]	Time 15.619 (15.619)	Data 13.720 (13.720)	Loss 4.4404 (4.4404)	Top-1 acc 21.875 (21.875)	Top-5 acc 42.578 (42.578)	lr 0.02500
Warmup Train [21][10/3239]	Time 0.683 (1.915)	Data 0.001 (1.249)	Loss 4.4516 (4.4569)	Top-1 acc 21.875 (21.626)	Top-5 acc 46.484 (44.141)	lr 0.02499
Warmup Train [21][20/3239]	Time 0.636 (1.247)	Data 0.001 (0.655)	Loss 4.3655 (4.4747)	Top-1 acc 23.047 (21.875)	Top-5 acc 49.609 (43.862)	lr 0.02499
Warmup Train [21][30/3239]	Time 0.596 (1.007)	Data 0.001 (0.444)	Loss 4.3304 (4.4728)	Top-1 acc 26.172 (21.825)	Top-5 acc 44.141 (43.700)	lr 0.02498
Warmup Train [21][40/3239]	Time 0.598 (0.887)	Data 0.001 (0.337)	Loss 4.5338 (4.4752)	Top-1 acc 19.141 (21.494)	Top-5 acc 40.625 (43.493)	lr 0.02498
Warmup Train [21][50/3239]	Time 0.355 (0.813)	Data 0.001 (0.271)	Loss 4.4876 (4.4842)	Top-1 acc 21.094 (21.469)	Top-5 acc 42.188 (43.329)	lr 0.02497
Warmup Train [21][60/3239]	Time 0.610 (0.762)	Data 0.001 (0.229)	Loss 4.4142 (4.4798)	Top-1 acc 21.484 (21.491)	Top-5 acc 44.922 (43.577)	lr 0.02496
Warmup Train [21][70/3239]	Time 0.385 (0.725)	Data 0.001 (0.197)	Loss 4.5835 (4.4833)	Top-1 acc 19.531 (21.501)	Top-5 acc 40.625 (43.508)	lr 0.02496
Warmup Train [21][80/3239]	Time 0.604 (0.701)	Data 0.001 (0.174)	Loss 4.6407 (4.4808)	Top-1 acc 21.875 (21.774)	Top-5 acc 40.625 (43.465)	lr 0.02495
Warmup Train [21][90/3239]	Time 0.507 (0.679)	Data 0.001 (0.155)	Loss 4.4642 (4.4824)	Top-1 acc 23.047 (21.862)	Top-5 acc 46.484 (43.544)	lr 0.02495
Warmup Train [21][100/3239]	Time 0.181 (0.660)	Data 0.001 (0.140)	Loss 4.4590 (4.4838)	Top-1 acc 22.266 (21.972)	Top-5 acc 44.531 (43.564)	lr 0.02494
Warmup Train [21][110/3239]	Time 0.512 (0.648)	Data 0.001 (0.129)	Loss 4.5052 (4.4830)	Top-1 acc 23.047 (22.104)	Top-5 acc 43.750 (43.651)	lr 0.02493
Warmup Train [21][120/3239]	Time 0.396 (0.636)	Data 0.001 (0.119)	Loss 4.4029 (4.4778)	Top-1 acc 22.266 (22.185)	Top-5 acc 47.656 (43.760)	lr 0.02493
Warmup Train [21][130/3239]	Time 0.527 (0.624)	Data 0.001 (0.110)	Loss 4.5417 (4.4761)	Top-1 acc 23.438 (22.304)	Top-5 acc 41.797 (43.836)	lr 0.02492
Warmup Train [21][140/3239]	Time 0.468 (0.614)	Data 0.001 (0.103)	Loss 4.6709 (4.4780)	Top-1 acc 17.578 (22.329)	Top-5 acc 37.109 (43.819)	lr 0.02492
Warmup Train [21][150/3239]	Time 0.456 (0.604)	Data 0.002 (0.097)	Loss 4.6655 (4.4813)	Top-1 acc 18.750 (22.248)	Top-5 acc 35.547 (43.665)	lr 0.02491
Warmup Train [21][160/3239]	Time 0.522 (0.599)	Data 0.001 (0.091)	Loss 4.5870 (4.4832)	Top-1 acc 20.703 (22.178)	Top-5 acc 40.234 (43.638)	lr 0.02490
Warmup Train [21][170/3239]	Time 0.501 (0.595)	Data 0.001 (0.086)	Loss 4.5597 (4.4852)	Top-1 acc 23.828 (22.190)	Top-5 acc 41.406 (43.620)	lr 0.02490
Warmup Train [21][180/3239]	Time 0.385 (0.591)	Data 0.001 (0.082)	Loss 4.3775 (4.4825)	Top-1 acc 24.609 (22.203)	Top-5 acc 44.922 (43.709)	lr 0.02489
Warmup Train [21][190/3239]	Time 0.636 (0.586)	Data 0.001 (0.078)	Loss 4.3852 (4.4833)	Top-1 acc 23.438 (22.212)	Top-5 acc 45.312 (43.715)	lr 0.02488
Warmup Train [21][200/3239]	Time 0.681 (0.583)	Data 0.001 (0.074)	Loss 4.4687 (4.4849)	Top-1 acc 22.656 (22.192)	Top-5 acc 48.047 (43.738)	lr 0.02488
Warmup Train [21][210/3239]	Time 0.519 (0.579)	Data 0.001 (0.071)	Loss 4.5031 (4.4847)	Top-1 acc 19.922 (22.199)	Top-5 acc 46.094 (43.730)	lr 0.02487
Warmup Train [21][220/3239]	Time 0.506 (0.576)	Data 0.001 (0.068)	Loss 4.4734 (4.4812)	Top-1 acc 20.312 (22.223)	Top-5 acc 44.922 (43.796)	lr 0.02487
Warmup Train [21][230/3239]	Time 0.397 (0.574)	Data 0.001 (0.066)	Loss 4.5694 (4.4795)	Top-1 acc 18.359 (22.157)	Top-5 acc 39.844 (43.833)	lr 0.02486
Warmup Train [21][240/3239]	Time 0.515 (0.570)	Data 0.001 (0.063)	Loss 4.5046 (4.4809)	Top-1 acc 21.875 (22.117)	Top-5 acc 43.750 (43.781)	lr 0.02485
Warmup Train [21][250/3239]	Time 0.510 (0.568)	Data 0.001 (0.061)	Loss 4.3376 (4.4821)	Top-1 acc 23.047 (22.087)	Top-5 acc 46.094 (43.748)	lr 0.02485
Warmup Train [21][260/3239]	Time 0.385 (0.566)	Data 0.001 (0.059)	Loss 4.5930 (4.4806)	Top-1 acc 15.625 (22.107)	Top-5 acc 41.016 (43.757)	lr 0.02484
Warmup Train [21][270/3239]	Time 0.687 (0.564)	Data 0.001 (0.057)	Loss 4.5999 (4.4807)	Top-1 acc 25.391 (22.106)	Top-5 acc 42.188 (43.757)	lr 0.02484
Warmup Train [21][280/3239]	Time 0.475 (0.561)	Data 0.001 (0.055)	Loss 4.6722 (4.4808)	Top-1 acc 20.312 (22.099)	Top-5 acc 41.406 (43.756)	lr 0.02483
Warmup Train [21][290/3239]	Time 0.589 (0.560)	Data 0.001 (0.053)	Loss 4.4491 (4.4788)	Top-1 acc 21.875 (22.125)	Top-5 acc 41.406 (43.785)	lr 0.02482
Warmup Train [21][300/3239]	Time 0.545 (0.558)	Data 0.001 (0.051)	Loss 4.3626 (4.4786)	Top-1 acc 21.484 (22.115)	Top-5 acc 46.094 (43.802)	lr 0.02482
Warmup Train [21][310/3239]	Time 0.478 (0.556)	Data 0.001 (0.050)	Loss 4.3456 (4.4775)	Top-1 acc 22.656 (22.110)	Top-5 acc 48.047 (43.824)	lr 0.02481
Warmup Train [21][320/3239]	Time 0.495 (0.555)	Data 0.001 (0.048)	Loss 4.5210 (4.4753)	Top-1 acc 19.922 (22.167)	Top-5 acc 44.922 (43.866)	lr 0.02481
Warmup Train [21][330/3239]	Time 0.360 (0.553)	Data 0.002 (0.047)	Loss 4.3506 (4.4746)	Top-1 acc 25.781 (22.181)	Top-5 acc 46.094 (43.910)	lr 0.02480
Warmup Train [21][340/3239]	Time 0.524 (0.552)	Data 0.001 (0.046)	Loss 4.3005 (4.4749)	Top-1 acc 23.047 (22.176)	Top-5 acc 50.000 (43.903)	lr 0.02479
Warmup Train [21][350/3239]	Time 0.613 (0.551)	Data 0.002 (0.045)	Loss 4.2749 (4.4739)	Top-1 acc 21.484 (22.204)	Top-5 acc 46.875 (43.929)	lr 0.02479
Warmup Train [21][360/3239]	Time 0.479 (0.550)	Data 0.001 (0.044)	Loss 4.3253 (4.4724)	Top-1 acc 25.781 (22.235)	Top-5 acc 48.047 (43.962)	lr 0.02478
Warmup Train [21][370/3239]	Time 0.614 (0.549)	Data 0.001 (0.043)	Loss 4.5203 (4.4723)	Top-1 acc 23.828 (22.241)	Top-5 acc 43.750 (43.948)	lr 0.02478
Warmup Train [21][380/3239]	Time 0.239 (0.547)	Data 0.001 (0.042)	Loss 4.4296 (4.4721)	Top-1 acc 24.219 (22.229)	Top-5 acc 48.047 (43.936)	lr 0.02477
Warmup Train [21][390/3239]	Time 0.385 (0.546)	Data 0.001 (0.041)	Loss 4.4546 (4.4708)	Top-1 acc 24.609 (22.252)	Top-5 acc 47.266 (43.973)	lr 0.02476
Warmup Train [21][400/3239]	Time 0.511 (0.545)	Data 0.001 (0.040)	Loss 4.5930 (4.4706)	Top-1 acc 20.312 (22.271)	Top-5 acc 42.188 (43.962)	lr 0.02476
Warmup Train [21][410/3239]	Time 0.547 (0.543)	Data 0.001 (0.040)	Loss 4.2355 (4.4690)	Top-1 acc 28.125 (22.303)	Top-5 acc 46.875 (43.976)	lr 0.02475
Warmup Train [21][420/3239]	Time 0.462 (0.542)	Data 0.001 (0.039)	Loss 4.4945 (4.4690)	Top-1 acc 18.359 (22.270)	Top-5 acc 40.234 (43.950)	lr 0.02475
Warmup Train [21][430/3239]	Time 0.390 (0.540)	Data 0.001 (0.038)	Loss 4.3804 (4.4700)	Top-1 acc 23.047 (22.263)	Top-5 acc 46.875 (43.939)	lr 0.02474
Warmup Train [21][440/3239]	Time 0.444 (0.539)	Data 0.001 (0.037)	Loss 4.4159 (4.4699)	Top-1 acc 21.094 (22.259)	Top-5 acc 43.359 (43.930)	lr 0.02473
Warmup Train [21][450/3239]	Time 0.432 (0.538)	Data 0.002 (0.037)	Loss 4.3580 (4.4693)	Top-1 acc 25.391 (22.273)	Top-5 acc 48.828 (43.947)	lr 0.02473
Warmup Train [21][460/3239]	Time 0.509 (0.537)	Data 0.001 (0.036)	Loss 4.6708 (4.4703)	Top-1 acc 19.141 (22.258)	Top-5 acc 41.406 (43.919)	lr 0.02472
Warmup Train [21][470/3239]	Time 0.509 (0.537)	Data 0.001 (0.036)	Loss 4.4868 (4.4720)	Top-1 acc 21.875 (22.232)	Top-5 acc 44.922 (43.888)	lr 0.02472
Warmup Train [21][480/3239]	Time 0.518 (0.537)	Data 0.001 (0.035)	Loss 4.5022 (4.4726)	Top-1 acc 19.531 (22.201)	Top-5 acc 43.359 (43.874)	lr 0.02471
Warmup Train [21][490/3239]	Time 0.515 (0.536)	Data 0.001 (0.035)	Loss 4.6339 (4.4718)	Top-1 acc 19.922 (22.227)	Top-5 acc 39.844 (43.888)	lr 0.02470
Warmup Train [21][500/3239]	Time 0.466 (0.535)	Data 0.001 (0.034)	Loss 4.4500 (4.4719)	Top-1 acc 23.438 (22.227)	Top-5 acc 47.656 (43.913)	lr 0.02470
Warmup Train [21][510/3239]	Time 0.608 (0.535)	Data 0.001 (0.034)	Loss 4.4109 (4.4709)	Top-1 acc 23.438 (22.258)	Top-5 acc 42.188 (43.914)	lr 0.02469
Warmup Train [21][520/3239]	Time 0.554 (0.535)	Data 0.001 (0.033)	Loss 4.2892 (4.4703)	Top-1 acc 25.781 (22.274)	Top-5 acc 47.656 (43.916)	lr 0.02468
Warmup Train [21][530/3239]	Time 0.587 (0.535)	Data 0.001 (0.032)	Loss 4.5353 (4.4704)	Top-1 acc 20.703 (22.269)	Top-5 acc 43.359 (43.921)	lr 0.02468
Warmup Train [21][540/3239]	Time 0.491 (0.534)	Data 0.001 (0.032)	Loss 4.7828 (4.4716)	Top-1 acc 16.016 (22.253)	Top-5 acc 35.547 (43.891)	lr 0.02467
Warmup Train [21][550/3239]	Time 0.503 (0.534)	Data 0.001 (0.032)	Loss 4.4850 (4.4719)	Top-1 acc 18.750 (22.255)	Top-5 acc 41.797 (43.878)	lr 0.02467
Warmup Train [21][560/3239]	Time 0.470 (0.533)	Data 0.001 (0.031)	Loss 4.7285 (4.4723)	Top-1 acc 18.359 (22.250)	Top-5 acc 37.109 (43.875)	lr 0.02466
Warmup Train [21][570/3239]	Time 0.588 (0.533)	Data 0.001 (0.031)	Loss 4.6007 (4.4721)	Top-1 acc 19.141 (22.254)	Top-5 acc 40.234 (43.878)	lr 0.02465
Warmup Train [21][580/3239]	Time 0.545 (0.533)	Data 0.001 (0.030)	Loss 4.5924 (4.4718)	Top-1 acc 20.703 (22.252)	Top-5 acc 41.797 (43.881)	lr 0.02465
Warmup Train [21][590/3239]	Time 0.464 (0.532)	Data 0.001 (0.030)	Loss 4.5760 (4.4718)	Top-1 acc 19.922 (22.247)	Top-5 acc 41.016 (43.872)	lr 0.02464
Warmup Train [21][600/3239]	Time 0.419 (0.532)	Data 0.001 (0.029)	Loss 4.5055 (4.4717)	Top-1 acc 23.438 (22.259)	Top-5 acc 42.969 (43.869)	lr 0.02464
Warmup Train [21][610/3239]	Time 0.562 (0.532)	Data 0.026 (0.029)	Loss 4.6189 (4.4720)	Top-1 acc 22.266 (22.252)	Top-5 acc 41.016 (43.861)	lr 0.02463
Warmup Train [21][620/3239]	Time 0.661 (0.531)	Data 0.001 (0.028)	Loss 4.3402 (4.4715)	Top-1 acc 24.609 (22.257)	Top-5 acc 44.141 (43.882)	lr 0.02462
Warmup Train [21][630/3239]	Time 0.406 (0.531)	Data 0.002 (0.028)	Loss 4.4550 (4.4713)	Top-1 acc 23.828 (22.262)	Top-5 acc 48.047 (43.899)	lr 0.02462
Warmup Train [21][640/3239]	Time 0.482 (0.531)	Data 0.001 (0.028)	Loss 4.5777 (4.4714)	Top-1 acc 23.047 (22.258)	Top-5 acc 38.672 (43.890)	lr 0.02461
Warmup Train [21][650/3239]	Time 0.531 (0.530)	Data 0.001 (0.028)	Loss 4.5033 (4.4718)	Top-1 acc 21.875 (22.251)	Top-5 acc 46.094 (43.886)	lr 0.02461
Warmup Train [21][660/3239]	Time 0.546 (0.529)	Data 0.002 (0.027)	Loss 4.3983 (4.4716)	Top-1 acc 23.047 (22.244)	Top-5 acc 46.875 (43.900)	lr 0.02460
Warmup Train [21][670/3239]	Time 0.562 (0.529)	Data 0.001 (0.027)	Loss 4.3683 (4.4716)	Top-1 acc 24.219 (22.255)	Top-5 acc 48.047 (43.903)	lr 0.02459
Warmup Train [21][680/3239]	Time 0.335 (0.529)	Data 0.001 (0.026)	Loss 4.3133 (4.4719)	Top-1 acc 26.172 (22.231)	Top-5 acc 45.703 (43.891)	lr 0.02459
Warmup Train [21][690/3239]	Time 0.389 (0.528)	Data 0.001 (0.026)	Loss 4.3181 (4.4718)	Top-1 acc 28.125 (22.243)	Top-5 acc 51.562 (43.892)	lr 0.02458
Warmup Train [21][700/3239]	Time 0.461 (0.527)	Data 0.001 (0.026)	Loss 4.3631 (4.4714)	Top-1 acc 22.266 (22.238)	Top-5 acc 46.094 (43.898)	lr 0.02458
Warmup Train [21][710/3239]	Time 0.533 (0.527)	Data 0.001 (0.026)	Loss 4.5069 (4.4717)	Top-1 acc 22.656 (22.238)	Top-5 acc 42.188 (43.879)	lr 0.02457
Warmup Train [21][720/3239]	Time 0.662 (0.527)	Data 0.001 (0.026)	Loss 4.4819 (4.4706)	Top-1 acc 23.438 (22.255)	Top-5 acc 43.359 (43.896)	lr 0.02456
Warmup Train [21][730/3239]	Time 0.393 (0.526)	Data 0.001 (0.025)	Loss 4.4073 (4.4708)	Top-1 acc 23.047 (22.246)	Top-5 acc 44.922 (43.888)	lr 0.02456
Warmup Train [21][740/3239]	Time 0.429 (0.526)	Data 0.001 (0.025)	Loss 4.2983 (4.4700)	Top-1 acc 26.953 (22.262)	Top-5 acc 46.875 (43.908)	lr 0.02455
Warmup Train [21][750/3239]	Time 0.524 (0.526)	Data 0.001 (0.025)	Loss 4.6041 (4.4705)	Top-1 acc 16.406 (22.264)	Top-5 acc 37.109 (43.891)	lr 0.02455
Warmup Train [21][760/3239]	Time 0.638 (0.526)	Data 0.001 (0.025)	Loss 4.3701 (4.4709)	Top-1 acc 23.438 (22.260)	Top-5 acc 45.312 (43.867)	lr 0.02454
Warmup Train [21][770/3239]	Time 0.592 (0.526)	Data 0.001 (0.024)	Loss 4.4661 (4.4705)	Top-1 acc 25.391 (22.261)	Top-5 acc 47.266 (43.877)	lr 0.02453
Warmup Train [21][780/3239]	Time 0.659 (0.526)	Data 0.001 (0.024)	Loss 4.3392 (4.4699)	Top-1 acc 23.828 (22.272)	Top-5 acc 49.609 (43.887)	lr 0.02453
Warmup Train [21][790/3239]	Time 0.516 (0.526)	Data 0.001 (0.024)	Loss 4.7071 (4.4703)	Top-1 acc 20.312 (22.274)	Top-5 acc 42.188 (43.886)	lr 0.02452
Warmup Train [21][800/3239]	Time 0.555 (0.525)	Data 0.001 (0.024)	Loss 4.5722 (4.4702)	Top-1 acc 22.266 (22.278)	Top-5 acc 39.844 (43.887)	lr 0.02452
Warmup Train [21][810/3239]	Time 0.438 (0.525)	Data 0.001 (0.023)	Loss 4.2248 (4.4697)	Top-1 acc 26.172 (22.271)	Top-5 acc 49.219 (43.893)	lr 0.02451
Warmup Train [21][820/3239]	Time 0.489 (0.525)	Data 0.001 (0.023)	Loss 4.3230 (4.4698)	Top-1 acc 26.172 (22.276)	Top-5 acc 45.703 (43.886)	lr 0.02450
Warmup Train [21][830/3239]	Time 0.493 (0.525)	Data 0.001 (0.023)	Loss 4.5877 (4.4705)	Top-1 acc 18.750 (22.264)	Top-5 acc 39.844 (43.862)	lr 0.02450
Warmup Train [21][840/3239]	Time 0.601 (0.525)	Data 0.001 (0.023)	Loss 4.3277 (4.4700)	Top-1 acc 28.125 (22.262)	Top-5 acc 49.219 (43.881)	lr 0.02449
Warmup Train [21][850/3239]	Time 0.459 (0.524)	Data 0.001 (0.023)	Loss 4.5429 (4.4702)	Top-1 acc 21.094 (22.245)	Top-5 acc 43.359 (43.878)	lr 0.02448
Warmup Train [21][860/3239]	Time 0.480 (0.524)	Data 0.001 (0.023)	Loss 4.3856 (4.4704)	Top-1 acc 27.344 (22.243)	Top-5 acc 51.172 (43.879)	lr 0.02448
Warmup Train [21][870/3239]	Time 0.570 (0.524)	Data 0.001 (0.022)	Loss 4.4395 (4.4709)	Top-1 acc 24.219 (22.236)	Top-5 acc 42.188 (43.870)	lr 0.02447
Warmup Train [21][880/3239]	Time 0.418 (0.523)	Data 0.001 (0.022)	Loss 4.7324 (4.4712)	Top-1 acc 19.141 (22.228)	Top-5 acc 39.844 (43.859)	lr 0.02447
Warmup Train [21][890/3239]	Time 0.540 (0.524)	Data 0.001 (0.022)	Loss 4.4916 (4.4711)	Top-1 acc 17.969 (22.235)	Top-5 acc 46.875 (43.852)	lr 0.02446
Warmup Train [21][900/3239]	Time 0.544 (0.523)	Data 0.001 (0.022)	Loss 4.3537 (4.4705)	Top-1 acc 23.047 (22.231)	Top-5 acc 47.266 (43.862)	lr 0.02445
Warmup Train [21][910/3239]	Time 0.344 (0.523)	Data 0.001 (0.022)	Loss 4.6011 (4.4712)	Top-1 acc 23.438 (22.226)	Top-5 acc 41.797 (43.847)	lr 0.02445
Warmup Train [21][920/3239]	Time 0.612 (0.523)	Data 0.001 (0.022)	Loss 4.2913 (4.4711)	Top-1 acc 30.469 (22.233)	Top-5 acc 48.438 (43.841)	lr 0.02444
Warmup Train [21][930/3239]	Time 0.412 (0.523)	Data 0.001 (0.021)	Loss 4.4277 (4.4708)	Top-1 acc 22.266 (22.255)	Top-5 acc 48.828 (43.853)	lr 0.02444
Warmup Train [21][940/3239]	Time 0.650 (0.523)	Data 0.001 (0.021)	Loss 4.2803 (4.4709)	Top-1 acc 24.609 (22.242)	Top-5 acc 46.875 (43.833)	lr 0.02443
Warmup Train [21][950/3239]	Time 0.403 (0.522)	Data 0.001 (0.021)	Loss 4.5955 (4.4707)	Top-1 acc 20.312 (22.246)	Top-5 acc 37.109 (43.838)	lr 0.02442
Warmup Train [21][960/3239]	Time 0.559 (0.522)	Data 0.001 (0.021)	Loss 4.4457 (4.4702)	Top-1 acc 23.047 (22.254)	Top-5 acc 45.703 (43.856)	lr 0.02442
Warmup Train [21][970/3239]	Time 0.480 (0.522)	Data 0.001 (0.021)	Loss 4.4248 (4.4704)	Top-1 acc 21.875 (22.249)	Top-5 acc 41.797 (43.841)	lr 0.02441
Warmup Train [21][980/3239]	Time 0.479 (0.522)	Data 0.001 (0.021)	Loss 4.4221 (4.4705)	Top-1 acc 22.266 (22.236)	Top-5 acc 46.094 (43.842)	lr 0.02441
Warmup Train [21][990/3239]	Time 0.746 (0.521)	Data 0.001 (0.020)	Loss 4.3604 (4.4703)	Top-1 acc 26.172 (22.237)	Top-5 acc 44.531 (43.852)	lr 0.02440
Warmup Train [21][1000/3239]	Time 0.541 (0.521)	Data 0.001 (0.020)	Loss 4.4654 (4.4706)	Top-1 acc 23.828 (22.237)	Top-5 acc 46.875 (43.852)	lr 0.02439
Warmup Train [21][1010/3239]	Time 0.588 (0.521)	Data 0.001 (0.020)	Loss 4.5019 (4.4709)	Top-1 acc 19.922 (22.236)	Top-5 acc 44.922 (43.845)	lr 0.02439
Warmup Train [21][1020/3239]	Time 0.608 (0.521)	Data 0.001 (0.020)	Loss 4.4711 (4.4711)	Top-1 acc 23.047 (22.240)	Top-5 acc 41.797 (43.841)	lr 0.02438
Warmup Train [21][1030/3239]	Time 0.671 (0.520)	Data 0.001 (0.020)	Loss 4.2663 (4.4706)	Top-1 acc 25.000 (22.254)	Top-5 acc 49.219 (43.859)	lr 0.02438
Warmup Train [21][1040/3239]	Time 0.410 (0.520)	Data 0.001 (0.020)	Loss 4.5380 (4.4704)	Top-1 acc 22.266 (22.267)	Top-5 acc 41.406 (43.863)	lr 0.02437
Warmup Train [21][1050/3239]	Time 0.538 (0.520)	Data 0.001 (0.020)	Loss 4.3866 (4.4702)	Top-1 acc 23.047 (22.269)	Top-5 acc 46.875 (43.876)	lr 0.02436
Warmup Train [21][1060/3239]	Time 0.632 (0.520)	Data 0.001 (0.019)	Loss 4.4942 (4.4699)	Top-1 acc 20.312 (22.275)	Top-5 acc 41.797 (43.880)	lr 0.02436
Warmup Train [21][1070/3239]	Time 0.503 (0.520)	Data 0.001 (0.019)	Loss 4.4422 (4.4700)	Top-1 acc 24.219 (22.274)	Top-5 acc 46.094 (43.877)	lr 0.02435
Warmup Train [21][1080/3239]	Time 0.566 (0.520)	Data 0.001 (0.019)	Loss 4.4578 (4.4698)	Top-1 acc 21.484 (22.282)	Top-5 acc 46.875 (43.884)	lr 0.02435
Warmup Train [21][1090/3239]	Time 0.628 (0.520)	Data 0.001 (0.019)	Loss 4.4627 (4.4699)	Top-1 acc 21.875 (22.282)	Top-5 acc 46.094 (43.890)	lr 0.02434
Warmup Train [21][1100/3239]	Time 0.464 (0.520)	Data 0.001 (0.019)	Loss 4.4672 (4.4697)	Top-1 acc 20.312 (22.282)	Top-5 acc 42.188 (43.885)	lr 0.02433
Warmup Train [21][1110/3239]	Time 0.528 (0.520)	Data 0.001 (0.019)	Loss 4.5183 (4.4695)	Top-1 acc 22.266 (22.284)	Top-5 acc 42.188 (43.887)	lr 0.02433
Warmup Train [21][1120/3239]	Time 0.574 (0.520)	Data 0.001 (0.019)	Loss 4.4046 (4.4692)	Top-1 acc 20.312 (22.280)	Top-5 acc 44.922 (43.899)	lr 0.02432
Warmup Train [21][1130/3239]	Time 0.598 (0.520)	Data 0.001 (0.019)	Loss 4.3943 (4.4699)	Top-1 acc 23.828 (22.274)	Top-5 acc 45.312 (43.872)	lr 0.02432
Warmup Train [21][1140/3239]	Time 0.489 (0.520)	Data 0.001 (0.018)	Loss 4.4494 (4.4700)	Top-1 acc 23.828 (22.265)	Top-5 acc 44.531 (43.869)	lr 0.02431
Warmup Train [21][1150/3239]	Time 0.448 (0.520)	Data 0.001 (0.018)	Loss 4.6464 (4.4698)	Top-1 acc 20.703 (22.272)	Top-5 acc 39.844 (43.879)	lr 0.02430
Warmup Train [21][1160/3239]	Time 0.542 (0.520)	Data 0.001 (0.018)	Loss 4.4067 (4.4699)	Top-1 acc 25.391 (22.274)	Top-5 acc 48.828 (43.870)	lr 0.02430
Warmup Train [21][1170/3239]	Time 0.582 (0.520)	Data 0.001 (0.018)	Loss 4.5918 (4.4699)	Top-1 acc 22.656 (22.281)	Top-5 acc 44.922 (43.868)	lr 0.02429
Warmup Train [21][1180/3239]	Time 0.508 (0.520)	Data 0.001 (0.018)	Loss 4.3805 (4.4695)	Top-1 acc 28.125 (22.291)	Top-5 acc 48.438 (43.891)	lr 0.02428
Warmup Train [21][1190/3239]	Time 0.328 (0.520)	Data 0.001 (0.018)	Loss 4.4758 (4.4695)	Top-1 acc 19.922 (22.284)	Top-5 acc 44.531 (43.896)	lr 0.02428
Warmup Train [21][1200/3239]	Time 0.835 (0.520)	Data 0.001 (0.018)	Loss 4.2791 (4.4688)	Top-1 acc 27.734 (22.301)	Top-5 acc 48.828 (43.913)	lr 0.02427
Warmup Train [21][1210/3239]	Time 0.662 (0.520)	Data 0.001 (0.018)	Loss 4.4374 (4.4685)	Top-1 acc 26.562 (22.306)	Top-5 acc 44.922 (43.908)	lr 0.02427
Warmup Train [21][1220/3239]	Time 0.481 (0.519)	Data 0.001 (0.017)	Loss 4.4479 (4.4684)	Top-1 acc 23.047 (22.306)	Top-5 acc 47.656 (43.912)	lr 0.02426
Warmup Train [21][1230/3239]	Time 0.571 (0.519)	Data 0.001 (0.017)	Loss 4.3168 (4.4687)	Top-1 acc 21.875 (22.293)	Top-5 acc 48.047 (43.904)	lr 0.02425
Warmup Train [21][1240/3239]	Time 0.465 (0.519)	Data 0.001 (0.017)	Loss 4.2742 (4.4683)	Top-1 acc 28.906 (22.300)	Top-5 acc 47.266 (43.912)	lr 0.02425
Warmup Train [21][1250/3239]	Time 0.589 (0.519)	Data 0.001 (0.017)	Loss 4.4552 (4.4684)	Top-1 acc 22.266 (22.294)	Top-5 acc 42.969 (43.911)	lr 0.02424
Warmup Train [21][1260/3239]	Time 0.392 (0.519)	Data 0.001 (0.017)	Loss 4.4416 (4.4680)	Top-1 acc 20.703 (22.298)	Top-5 acc 42.578 (43.918)	lr 0.02424
Warmup Train [21][1270/3239]	Time 0.546 (0.519)	Data 0.001 (0.017)	Loss 4.3765 (4.4680)	Top-1 acc 22.656 (22.295)	Top-5 acc 46.094 (43.918)	lr 0.02423
Warmup Train [21][1280/3239]	Time 0.445 (0.518)	Data 0.002 (0.017)	Loss 4.4697 (4.4678)	Top-1 acc 23.047 (22.296)	Top-5 acc 42.969 (43.918)	lr 0.02422
Warmup Train [21][1290/3239]	Time 0.310 (0.518)	Data 0.001 (0.017)	Loss 4.2718 (4.4674)	Top-1 acc 25.391 (22.295)	Top-5 acc 49.609 (43.925)	lr 0.02422
Warmup Train [21][1300/3239]	Time 0.440 (0.518)	Data 0.001 (0.017)	Loss 4.3343 (4.4674)	Top-1 acc 26.562 (22.305)	Top-5 acc 46.875 (43.928)	lr 0.02421
Warmup Train [21][1310/3239]	Time 0.477 (0.518)	Data 0.001 (0.017)	Loss 4.4372 (4.4669)	Top-1 acc 22.266 (22.316)	Top-5 acc 44.141 (43.933)	lr 0.02421
Warmup Train [21][1320/3239]	Time 0.447 (0.518)	Data 0.001 (0.017)	Loss 4.3931 (4.4666)	Top-1 acc 21.484 (22.319)	Top-5 acc 45.703 (43.936)	lr 0.02420
Warmup Train [21][1330/3239]	Time 0.422 (0.518)	Data 0.001 (0.017)	Loss 4.5315 (4.4666)	Top-1 acc 19.922 (22.315)	Top-5 acc 42.969 (43.935)	lr 0.02419
Warmup Train [21][1340/3239]	Time 0.499 (0.519)	Data 0.001 (0.017)	Loss 4.3212 (4.4661)	Top-1 acc 23.438 (22.317)	Top-5 acc 48.438 (43.944)	lr 0.02419
Warmup Train [21][1350/3239]	Time 0.364 (0.518)	Data 0.001 (0.017)	Loss 4.4947 (4.4660)	Top-1 acc 21.484 (22.323)	Top-5 acc 42.969 (43.948)	lr 0.02418
Warmup Train [21][1360/3239]	Time 0.393 (0.518)	Data 0.001 (0.017)	Loss 4.6771 (4.4662)	Top-1 acc 16.016 (22.329)	Top-5 acc 37.891 (43.952)	lr 0.02418
Warmup Train [21][1370/3239]	Time 0.571 (0.518)	Data 0.001 (0.017)	Loss 4.5505 (4.4661)	Top-1 acc 21.875 (22.335)	Top-5 acc 40.625 (43.959)	lr 0.02417
Warmup Train [21][1380/3239]	Time 0.649 (0.518)	Data 0.001 (0.016)	Loss 4.5582 (4.4660)	Top-1 acc 20.312 (22.334)	Top-5 acc 42.188 (43.960)	lr 0.02416
Warmup Train [21][1390/3239]	Time 0.654 (0.518)	Data 0.001 (0.016)	Loss 4.4542 (4.4659)	Top-1 acc 23.047 (22.334)	Top-5 acc 46.094 (43.958)	lr 0.02416
Warmup Train [21][1400/3239]	Time 0.592 (0.518)	Data 0.001 (0.016)	Loss 4.2264 (4.4654)	Top-1 acc 28.516 (22.343)	Top-5 acc 50.391 (43.970)	lr 0.02415
Warmup Train [21][1410/3239]	Time 0.570 (0.518)	Data 0.001 (0.016)	Loss 4.4255 (4.4651)	Top-1 acc 18.750 (22.340)	Top-5 acc 42.188 (43.975)	lr 0.02415
Warmup Train [21][1420/3239]	Time 0.532 (0.518)	Data 0.001 (0.016)	Loss 4.4247 (4.4653)	Top-1 acc 23.828 (22.341)	Top-5 acc 46.875 (43.975)	lr 0.02414
Warmup Train [21][1430/3239]	Time 0.533 (0.518)	Data 0.001 (0.016)	Loss 4.4373 (4.4653)	Top-1 acc 18.359 (22.339)	Top-5 acc 46.484 (43.974)	lr 0.02413
Warmup Train [21][1440/3239]	Time 0.562 (0.518)	Data 0.001 (0.016)	Loss 4.2923 (4.4652)	Top-1 acc 24.219 (22.338)	Top-5 acc 48.047 (43.978)	lr 0.02413
Warmup Train [21][1450/3239]	Time 0.583 (0.518)	Data 0.001 (0.016)	Loss 4.4238 (4.4651)	Top-1 acc 21.875 (22.344)	Top-5 acc 44.141 (43.982)	lr 0.02412
Warmup Train [21][1460/3239]	Time 0.569 (0.518)	Data 0.001 (0.016)	Loss 4.4942 (4.4655)	Top-1 acc 25.000 (22.341)	Top-5 acc 42.969 (43.977)	lr 0.02412
Warmup Train [21][1470/3239]	Time 0.495 (0.518)	Data 0.001 (0.016)	Loss 4.4316 (4.4655)	Top-1 acc 24.219 (22.343)	Top-5 acc 48.047 (43.978)	lr 0.02411
Warmup Train [21][1480/3239]	Time 0.383 (0.518)	Data 0.001 (0.016)	Loss 4.3945 (4.4652)	Top-1 acc 25.000 (22.355)	Top-5 acc 48.047 (43.989)	lr 0.02410
Warmup Train [21][1490/3239]	Time 0.344 (0.518)	Data 0.001 (0.016)	Loss 4.5340 (4.4654)	Top-1 acc 16.797 (22.353)	Top-5 acc 39.453 (43.976)	lr 0.02410
Warmup Train [21][1500/3239]	Time 0.500 (0.518)	Data 0.001 (0.016)	Loss 4.3903 (4.4653)	Top-1 acc 23.828 (22.353)	Top-5 acc 46.875 (43.976)	lr 0.02409
Warmup Train [21][1510/3239]	Time 0.467 (0.518)	Data 0.001 (0.016)	Loss 4.3509 (4.4652)	Top-1 acc 24.609 (22.356)	Top-5 acc 46.094 (43.977)	lr 0.02409
Warmup Train [21][1520/3239]	Time 0.598 (0.518)	Data 0.001 (0.015)	Loss 4.2091 (4.4650)	Top-1 acc 28.125 (22.358)	Top-5 acc 48.438 (43.981)	lr 0.02408
Warmup Train [21][1530/3239]	Time 0.459 (0.518)	Data 0.001 (0.015)	Loss 4.6463 (4.4648)	Top-1 acc 20.312 (22.365)	Top-5 acc 40.625 (43.989)	lr 0.02407
Warmup Train [21][1540/3239]	Time 0.309 (0.517)	Data 0.001 (0.015)	Loss 4.5522 (4.4649)	Top-1 acc 22.266 (22.369)	Top-5 acc 44.141 (43.988)	lr 0.02407
Warmup Train [21][1550/3239]	Time 0.532 (0.517)	Data 0.001 (0.015)	Loss 4.3971 (4.4652)	Top-1 acc 22.656 (22.362)	Top-5 acc 44.141 (43.978)	lr 0.02406
Warmup Train [21][1560/3239]	Time 0.427 (0.517)	Data 0.001 (0.015)	Loss 4.5351 (4.4654)	Top-1 acc 17.188 (22.354)	Top-5 acc 39.062 (43.971)	lr 0.02405
Warmup Train [21][1570/3239]	Time 0.393 (0.517)	Data 0.001 (0.015)	Loss 4.2858 (4.4653)	Top-1 acc 25.391 (22.355)	Top-5 acc 49.609 (43.974)	lr 0.02405
Warmup Train [21][1580/3239]	Time 0.523 (0.517)	Data 0.001 (0.015)	Loss 4.6459 (4.4652)	Top-1 acc 21.094 (22.363)	Top-5 acc 41.016 (43.977)	lr 0.02404
Warmup Train [21][1590/3239]	Time 0.510 (0.517)	Data 0.001 (0.015)	Loss 4.2727 (4.4651)	Top-1 acc 28.125 (22.364)	Top-5 acc 53.125 (43.984)	lr 0.02404
Warmup Train [21][1600/3239]	Time 0.535 (0.517)	Data 0.001 (0.015)	Loss 4.4745 (4.4648)	Top-1 acc 19.922 (22.368)	Top-5 acc 43.750 (43.992)	lr 0.02403
Warmup Train [21][1610/3239]	Time 0.518 (0.517)	Data 0.001 (0.015)	Loss 4.6028 (4.4647)	Top-1 acc 18.750 (22.370)	Top-5 acc 38.281 (43.995)	lr 0.02402
Warmup Train [21][1620/3239]	Time 0.353 (0.517)	Data 0.002 (0.015)	Loss 4.4602 (4.4645)	Top-1 acc 21.484 (22.376)	Top-5 acc 40.234 (43.995)	lr 0.02402
Warmup Train [21][1630/3239]	Time 0.498 (0.517)	Data 0.001 (0.015)	Loss 4.5498 (4.4646)	Top-1 acc 20.312 (22.372)	Top-5 acc 41.016 (43.985)	lr 0.02401
Warmup Train [21][1640/3239]	Time 0.644 (0.517)	Data 0.001 (0.015)	Loss 4.6106 (4.4648)	Top-1 acc 18.750 (22.371)	Top-5 acc 41.797 (43.984)	lr 0.02401
Warmup Train [21][1650/3239]	Time 0.629 (0.517)	Data 0.001 (0.015)	Loss 4.1865 (4.4645)	Top-1 acc 24.609 (22.378)	Top-5 acc 51.562 (44.000)	lr 0.02400
Warmup Train [21][1660/3239]	Time 0.335 (0.517)	Data 0.001 (0.015)	Loss 4.4423 (4.4646)	Top-1 acc 23.047 (22.379)	Top-5 acc 45.312 (43.997)	lr 0.02399
Warmup Train [21][1670/3239]	Time 0.506 (0.517)	Data 0.001 (0.015)	Loss 4.4944 (4.4645)	Top-1 acc 25.000 (22.389)	Top-5 acc 45.312 (44.002)	lr 0.02399
Warmup Train [21][1680/3239]	Time 0.511 (0.517)	Data 0.001 (0.015)	Loss 4.3763 (4.4645)	Top-1 acc 21.094 (22.389)	Top-5 acc 42.578 (43.998)	lr 0.02398
Warmup Train [21][1690/3239]	Time 0.601 (0.517)	Data 0.001 (0.015)	Loss 4.5517 (4.4644)	Top-1 acc 19.141 (22.387)	Top-5 acc 42.969 (43.999)	lr 0.02398
Warmup Train [21][1700/3239]	Time 0.567 (0.518)	Data 0.001 (0.015)	Loss 4.3243 (4.4645)	Top-1 acc 27.344 (22.389)	Top-5 acc 47.656 (43.999)	lr 0.02397
Warmup Train [21][1710/3239]	Time 0.431 (0.517)	Data 0.001 (0.015)	Loss 4.5255 (4.4644)	Top-1 acc 21.484 (22.393)	Top-5 acc 43.359 (44.001)	lr 0.02396
Warmup Train [21][1720/3239]	Time 0.411 (0.517)	Data 0.001 (0.015)	Loss 4.2603 (4.4643)	Top-1 acc 24.219 (22.395)	Top-5 acc 46.094 (44.001)	lr 0.02396
Warmup Train [21][1730/3239]	Time 0.612 (0.517)	Data 0.001 (0.015)	Loss 4.5639 (4.4645)	Top-1 acc 21.875 (22.396)	Top-5 acc 44.531 (43.997)	lr 0.02395
Warmup Train [21][1740/3239]	Time 0.386 (0.517)	Data 0.001 (0.015)	Loss 4.3912 (4.4639)	Top-1 acc 25.391 (22.407)	Top-5 acc 42.969 (44.008)	lr 0.02395
Warmup Train [21][1750/3239]	Time 0.511 (0.518)	Data 0.001 (0.014)	Loss 4.4296 (4.4631)	Top-1 acc 26.172 (22.425)	Top-5 acc 45.703 (44.029)	lr 0.02394
Warmup Train [21][1760/3239]	Time 0.588 (0.518)	Data 0.001 (0.014)	Loss 4.4720 (4.4632)	Top-1 acc 22.656 (22.423)	Top-5 acc 42.969 (44.026)	lr 0.02393
Warmup Train [21][1770/3239]	Time 0.524 (0.517)	Data 0.001 (0.014)	Loss 4.4949 (4.4630)	Top-1 acc 22.656 (22.425)	Top-5 acc 40.625 (44.030)	lr 0.02393
Warmup Train [21][1780/3239]	Time 0.428 (0.517)	Data 0.001 (0.014)	Loss 4.3972 (4.4626)	Top-1 acc 25.000 (22.432)	Top-5 acc 46.875 (44.041)	lr 0.02392
Warmup Train [21][1790/3239]	Time 0.195 (0.517)	Data 0.001 (0.014)	Loss 4.3700 (4.4625)	Top-1 acc 26.953 (22.437)	Top-5 acc 47.266 (44.043)	lr 0.02392
Warmup Train [21][1800/3239]	Time 0.509 (0.517)	Data 0.001 (0.014)	Loss 4.4760 (4.4623)	Top-1 acc 17.578 (22.439)	Top-5 acc 42.188 (44.052)	lr 0.02391
Warmup Train [21][1810/3239]	Time 0.736 (0.517)	Data 0.001 (0.014)	Loss 4.4078 (4.4622)	Top-1 acc 26.953 (22.441)	Top-5 acc 47.656 (44.053)	lr 0.02390
Warmup Train [21][1820/3239]	Time 0.704 (0.517)	Data 0.001 (0.014)	Loss 4.6201 (4.4622)	Top-1 acc 19.141 (22.439)	Top-5 acc 41.406 (44.061)	lr 0.02390
Warmup Train [21][1830/3239]	Time 0.688 (0.516)	Data 0.001 (0.014)	Loss 4.3522 (4.4623)	Top-1 acc 21.094 (22.435)	Top-5 acc 42.578 (44.060)	lr 0.02389
Warmup Train [21][1840/3239]	Time 0.500 (0.517)	Data 0.001 (0.014)	Loss 4.3696 (4.4622)	Top-1 acc 24.609 (22.442)	Top-5 acc 45.312 (44.066)	lr 0.02389
Warmup Train [21][1850/3239]	Time 0.575 (0.517)	Data 0.001 (0.014)	Loss 4.2701 (4.4620)	Top-1 acc 23.828 (22.441)	Top-5 acc 49.219 (44.065)	lr 0.02388
Warmup Train [21][1860/3239]	Time 0.518 (0.517)	Data 0.001 (0.014)	Loss 4.5238 (4.4619)	Top-1 acc 20.312 (22.440)	Top-5 acc 40.234 (44.064)	lr 0.02387
Warmup Train [21][1870/3239]	Time 0.547 (0.517)	Data 0.001 (0.014)	Loss 4.5600 (4.4619)	Top-1 acc 22.266 (22.440)	Top-5 acc 41.406 (44.061)	lr 0.02387
Warmup Train [21][1880/3239]	Time 0.529 (0.517)	Data 0.001 (0.014)	Loss 4.5610 (4.4619)	Top-1 acc 22.656 (22.442)	Top-5 acc 39.062 (44.061)	lr 0.02386
Warmup Train [21][1890/3239]	Time 0.576 (0.516)	Data 0.001 (0.014)	Loss 4.3693 (4.4618)	Top-1 acc 25.391 (22.447)	Top-5 acc 45.703 (44.059)	lr 0.02386
Warmup Train [21][1900/3239]	Time 0.534 (0.517)	Data 0.001 (0.014)	Loss 4.2708 (4.4620)	Top-1 acc 24.609 (22.443)	Top-5 acc 48.438 (44.055)	lr 0.02385
Warmup Train [21][1910/3239]	Time 0.628 (0.517)	Data 0.001 (0.014)	Loss 4.3347 (4.4620)	Top-1 acc 26.172 (22.443)	Top-5 acc 47.266 (44.054)	lr 0.02384
Warmup Train [21][1920/3239]	Time 0.527 (0.517)	Data 0.001 (0.014)	Loss 4.4269 (4.4617)	Top-1 acc 21.875 (22.450)	Top-5 acc 46.094 (44.062)	lr 0.02384
Warmup Train [21][1930/3239]	Time 0.570 (0.517)	Data 0.002 (0.014)	Loss 4.3920 (4.4617)	Top-1 acc 24.219 (22.450)	Top-5 acc 47.266 (44.062)	lr 0.02383
Warmup Train [21][1940/3239]	Time 0.595 (0.517)	Data 0.001 (0.014)	Loss 4.5728 (4.4617)	Top-1 acc 21.875 (22.450)	Top-5 acc 44.531 (44.066)	lr 0.02382
Warmup Train [21][1950/3239]	Time 0.450 (0.517)	Data 0.001 (0.013)	Loss 4.3680 (4.4616)	Top-1 acc 21.484 (22.452)	Top-5 acc 44.141 (44.067)	lr 0.02382
Warmup Train [21][1960/3239]	Time 0.638 (0.517)	Data 0.001 (0.013)	Loss 4.1928 (4.4616)	Top-1 acc 25.781 (22.452)	Top-5 acc 50.391 (44.068)	lr 0.02381
Warmup Train [21][1970/3239]	Time 0.390 (0.516)	Data 0.001 (0.013)	Loss 4.4597 (4.4614)	Top-1 acc 20.703 (22.452)	Top-5 acc 45.312 (44.068)	lr 0.02381
Warmup Train [21][1980/3239]	Time 0.664 (0.517)	Data 0.001 (0.013)	Loss 4.2873 (4.4614)	Top-1 acc 28.125 (22.453)	Top-5 acc 46.484 (44.070)	lr 0.02380
Warmup Train [21][1990/3239]	Time 0.594 (0.517)	Data 0.001 (0.013)	Loss 4.5482 (4.4615)	Top-1 acc 21.484 (22.448)	Top-5 acc 41.406 (44.066)	lr 0.02379
Warmup Train [21][2000/3239]	Time 0.587 (0.517)	Data 0.001 (0.013)	Loss 4.4272 (4.4617)	Top-1 acc 23.438 (22.447)	Top-5 acc 42.578 (44.058)	lr 0.02379
Warmup Train [21][2010/3239]	Time 0.494 (0.517)	Data 0.001 (0.013)	Loss 4.3630 (4.4617)	Top-1 acc 26.172 (22.452)	Top-5 acc 47.266 (44.062)	lr 0.02378
Warmup Train [21][2020/3239]	Time 0.399 (0.517)	Data 0.001 (0.013)	Loss 4.3951 (4.4615)	Top-1 acc 21.484 (22.452)	Top-5 acc 44.531 (44.066)	lr 0.02378
Warmup Train [21][2030/3239]	Time 0.523 (0.517)	Data 0.001 (0.013)	Loss 4.3508 (4.4611)	Top-1 acc 26.953 (22.459)	Top-5 acc 49.219 (44.077)	lr 0.02377
Warmup Train [21][2040/3239]	Time 0.472 (0.517)	Data 0.001 (0.013)	Loss 4.2937 (4.4611)	Top-1 acc 25.781 (22.457)	Top-5 acc 49.219 (44.072)	lr 0.02376
Warmup Train [21][2050/3239]	Time 0.438 (0.517)	Data 0.001 (0.013)	Loss 4.3383 (4.4609)	Top-1 acc 21.875 (22.458)	Top-5 acc 51.562 (44.075)	lr 0.02376
Warmup Train [21][2060/3239]	Time 0.537 (0.517)	Data 0.001 (0.013)	Loss 4.5149 (4.4610)	Top-1 acc 20.703 (22.446)	Top-5 acc 43.750 (44.073)	lr 0.02375
Warmup Train [21][2070/3239]	Time 0.248 (0.517)	Data 0.001 (0.013)	Loss 4.3195 (4.4608)	Top-1 acc 25.000 (22.447)	Top-5 acc 46.875 (44.083)	lr 0.02375
Warmup Train [21][2080/3239]	Time 0.452 (0.517)	Data 0.001 (0.013)	Loss 4.5372 (4.4609)	Top-1 acc 21.484 (22.450)	Top-5 acc 43.359 (44.081)	lr 0.02374
Warmup Train [21][2090/3239]	Time 0.339 (0.516)	Data 0.001 (0.013)	Loss 4.5738 (4.4607)	Top-1 acc 24.219 (22.454)	Top-5 acc 42.188 (44.083)	lr 0.02373
Warmup Train [21][2100/3239]	Time 0.441 (0.516)	Data 0.002 (0.013)	Loss 4.3486 (4.4603)	Top-1 acc 23.828 (22.459)	Top-5 acc 47.266 (44.087)	lr 0.02373
Warmup Train [21][2110/3239]	Time 0.355 (0.515)	Data 0.001 (0.013)	Loss 4.4621 (4.4602)	Top-1 acc 22.266 (22.461)	Top-5 acc 45.312 (44.093)	lr 0.02372
Warmup Train [21][2120/3239]	Time 0.275 (0.514)	Data 0.001 (0.013)	Loss 4.5955 (4.4601)	Top-1 acc 18.359 (22.460)	Top-5 acc 39.844 (44.097)	lr 0.02372
Warmup Train [21][2130/3239]	Time 0.517 (0.514)	Data 0.001 (0.013)	Loss 4.4451 (4.4600)	Top-1 acc 19.531 (22.463)	Top-5 acc 42.188 (44.098)	lr 0.02371
Warmup Train [21][2140/3239]	Time 0.581 (0.514)	Data 0.001 (0.013)	Loss 4.4941 (4.4599)	Top-1 acc 21.094 (22.468)	Top-5 acc 43.359 (44.101)	lr 0.02370
Warmup Train [21][2150/3239]	Time 0.638 (0.514)	Data 0.001 (0.013)	Loss 4.5077 (4.4602)	Top-1 acc 23.438 (22.465)	Top-5 acc 42.969 (44.097)	lr 0.02370
Warmup Train [21][2160/3239]	Time 0.535 (0.514)	Data 0.001 (0.013)	Loss 4.5039 (4.4603)	Top-1 acc 23.828 (22.468)	Top-5 acc 43.359 (44.103)	lr 0.02369
Warmup Train [21][2170/3239]	Time 0.518 (0.514)	Data 0.001 (0.013)	Loss 4.4842 (4.4599)	Top-1 acc 20.312 (22.468)	Top-5 acc 44.531 (44.108)	lr 0.02369
Warmup Train [21][2180/3239]	Time 0.396 (0.514)	Data 0.001 (0.013)	Loss 4.4645 (4.4600)	Top-1 acc 21.875 (22.470)	Top-5 acc 48.047 (44.108)	lr 0.02368
Warmup Train [21][2190/3239]	Time 0.417 (0.514)	Data 0.001 (0.013)	Loss 4.2584 (4.4599)	Top-1 acc 26.562 (22.473)	Top-5 acc 50.781 (44.112)	lr 0.02367
Warmup Train [21][2200/3239]	Time 0.433 (0.514)	Data 0.001 (0.013)	Loss 4.3060 (4.4600)	Top-1 acc 26.953 (22.473)	Top-5 acc 46.875 (44.107)	lr 0.02367
Warmup Train [21][2210/3239]	Time 0.470 (0.514)	Data 0.001 (0.013)	Loss 4.5383 (4.4596)	Top-1 acc 20.312 (22.485)	Top-5 acc 41.797 (44.114)	lr 0.02366
Warmup Train [21][2220/3239]	Time 0.476 (0.514)	Data 0.001 (0.013)	Loss 4.4590 (4.4594)	Top-1 acc 25.391 (22.493)	Top-5 acc 45.312 (44.122)	lr 0.02366
Warmup Train [21][2230/3239]	Time 0.490 (0.514)	Data 0.001 (0.013)	Loss 4.5910 (4.4591)	Top-1 acc 21.875 (22.501)	Top-5 acc 42.578 (44.130)	lr 0.02365
Warmup Train [21][2240/3239]	Time 0.574 (0.514)	Data 0.001 (0.013)	Loss 4.2872 (4.4593)	Top-1 acc 26.172 (22.496)	Top-5 acc 48.438 (44.131)	lr 0.02364
Warmup Train [21][2250/3239]	Time 0.653 (0.515)	Data 0.001 (0.013)	Loss 4.2587 (4.4593)	Top-1 acc 24.219 (22.495)	Top-5 acc 51.953 (44.131)	lr 0.02364
Warmup Train [21][2260/3239]	Time 0.423 (0.515)	Data 0.001 (0.013)	Loss 4.3321 (4.4594)	Top-1 acc 25.000 (22.492)	Top-5 acc 45.703 (44.129)	lr 0.02363
Warmup Train [21][2270/3239]	Time 0.553 (0.515)	Data 0.001 (0.013)	Loss 4.5021 (4.4594)	Top-1 acc 21.875 (22.491)	Top-5 acc 41.797 (44.128)	lr 0.02363
Warmup Train [21][2280/3239]	Time 0.397 (0.514)	Data 0.001 (0.013)	Loss 4.3359 (4.4591)	Top-1 acc 27.344 (22.494)	Top-5 acc 47.266 (44.135)	lr 0.02362
Warmup Train [21][2290/3239]	Time 0.396 (0.514)	Data 0.001 (0.013)	Loss 4.5168 (4.4587)	Top-1 acc 22.266 (22.499)	Top-5 acc 41.016 (44.141)	lr 0.02361
Warmup Train [21][2300/3239]	Time 0.467 (0.514)	Data 0.001 (0.013)	Loss 4.3111 (4.4585)	Top-1 acc 26.172 (22.501)	Top-5 acc 49.219 (44.146)	lr 0.02361
Warmup Train [21][2310/3239]	Time 0.591 (0.514)	Data 0.001 (0.013)	Loss 4.3784 (4.4584)	Top-1 acc 23.828 (22.502)	Top-5 acc 44.531 (44.146)	lr 0.02360
Warmup Train [21][2320/3239]	Time 0.491 (0.514)	Data 0.001 (0.013)	Loss 4.2896 (4.4582)	Top-1 acc 25.391 (22.503)	Top-5 acc 46.875 (44.153)	lr 0.02359
Warmup Train [21][2330/3239]	Time 0.634 (0.514)	Data 0.001 (0.013)	Loss 4.3305 (4.4582)	Top-1 acc 22.656 (22.500)	Top-5 acc 45.312 (44.154)	lr 0.02359
Warmup Train [21][2340/3239]	Time 0.517 (0.514)	Data 0.001 (0.012)	Loss 4.4583 (4.4581)	Top-1 acc 20.312 (22.499)	Top-5 acc 45.312 (44.159)	lr 0.02358
Warmup Train [21][2350/3239]	Time 0.547 (0.514)	Data 0.001 (0.012)	Loss 4.2927 (4.4584)	Top-1 acc 25.391 (22.494)	Top-5 acc 50.391 (44.156)	lr 0.02358
Warmup Train [21][2360/3239]	Time 0.579 (0.514)	Data 0.001 (0.012)	Loss 4.5017 (4.4583)	Top-1 acc 20.703 (22.495)	Top-5 acc 41.406 (44.161)	lr 0.02357
Warmup Train [21][2370/3239]	Time 0.537 (0.514)	Data 0.001 (0.012)	Loss 4.5559 (4.4583)	Top-1 acc 21.875 (22.497)	Top-5 acc 42.578 (44.161)	lr 0.02356
Warmup Train [21][2380/3239]	Time 0.460 (0.514)	Data 0.001 (0.012)	Loss 4.4899 (4.4582)	Top-1 acc 23.047 (22.501)	Top-5 acc 41.797 (44.162)	lr 0.02356
Warmup Train [21][2390/3239]	Time 0.506 (0.514)	Data 0.001 (0.012)	Loss 4.5645 (4.4580)	Top-1 acc 22.266 (22.503)	Top-5 acc 39.844 (44.164)	lr 0.02355
Warmup Train [21][2400/3239]	Time 0.632 (0.514)	Data 0.001 (0.012)	Loss 4.1948 (4.4579)	Top-1 acc 28.906 (22.508)	Top-5 acc 50.000 (44.166)	lr 0.02355
Warmup Train [21][2410/3239]	Time 0.533 (0.514)	Data 0.001 (0.012)	Loss 4.1972 (4.4580)	Top-1 acc 28.125 (22.507)	Top-5 acc 51.172 (44.163)	lr 0.02354
Warmup Train [21][2420/3239]	Time 0.573 (0.514)	Data 0.001 (0.012)	Loss 4.3152 (4.4582)	Top-1 acc 22.656 (22.502)	Top-5 acc 49.219 (44.159)	lr 0.02353
Warmup Train [21][2430/3239]	Time 0.315 (0.514)	Data 0.001 (0.012)	Loss 4.5324 (4.4582)	Top-1 acc 18.750 (22.496)	Top-5 acc 41.797 (44.156)	lr 0.02353
Warmup Train [21][2440/3239]	Time 0.533 (0.514)	Data 0.001 (0.012)	Loss 4.4781 (4.4582)	Top-1 acc 25.391 (22.499)	Top-5 acc 44.531 (44.160)	lr 0.02352
Warmup Train [21][2450/3239]	Time 0.708 (0.514)	Data 0.001 (0.012)	Loss 4.3719 (4.4581)	Top-1 acc 20.703 (22.495)	Top-5 acc 46.094 (44.162)	lr 0.02352
Warmup Train [21][2460/3239]	Time 0.608 (0.514)	Data 0.001 (0.012)	Loss 4.5153 (4.4580)	Top-1 acc 23.438 (22.492)	Top-5 acc 44.141 (44.166)	lr 0.02351
Warmup Train [21][2470/3239]	Time 0.516 (0.514)	Data 0.001 (0.012)	Loss 4.4696 (4.4579)	Top-1 acc 23.047 (22.491)	Top-5 acc 45.703 (44.164)	lr 0.02350
Warmup Train [21][2480/3239]	Time 0.397 (0.514)	Data 0.001 (0.012)	Loss 4.5420 (4.4580)	Top-1 acc 21.094 (22.490)	Top-5 acc 41.406 (44.159)	lr 0.02350
Warmup Train [21][2490/3239]	Time 0.430 (0.514)	Data 0.001 (0.012)	Loss 4.4217 (4.4579)	Top-1 acc 22.266 (22.489)	Top-5 acc 44.531 (44.161)	lr 0.02349
Warmup Train [21][2500/3239]	Time 0.478 (0.514)	Data 0.001 (0.012)	Loss 4.3755 (4.4580)	Top-1 acc 23.047 (22.491)	Top-5 acc 45.312 (44.160)	lr 0.02349
Warmup Train [21][2510/3239]	Time 0.361 (0.514)	Data 0.001 (0.012)	Loss 4.3799 (4.4576)	Top-1 acc 22.656 (22.496)	Top-5 acc 44.141 (44.170)	lr 0.02348
Warmup Train [21][2520/3239]	Time 0.672 (0.514)	Data 0.002 (0.012)	Loss 4.3962 (4.4575)	Top-1 acc 27.344 (22.498)	Top-5 acc 44.531 (44.171)	lr 0.02347
Warmup Train [21][2530/3239]	Time 0.375 (0.514)	Data 0.002 (0.012)	Loss 4.6159 (4.4575)	Top-1 acc 17.969 (22.496)	Top-5 acc 42.969 (44.167)	lr 0.02347
Warmup Train [21][2540/3239]	Time 0.669 (0.514)	Data 0.001 (0.012)	Loss 4.4650 (4.4575)	Top-1 acc 22.266 (22.498)	Top-5 acc 41.797 (44.166)	lr 0.02346
Warmup Train [21][2550/3239]	Time 0.481 (0.514)	Data 0.001 (0.012)	Loss 4.4013 (4.4574)	Top-1 acc 19.922 (22.497)	Top-5 acc 42.188 (44.166)	lr 0.02346
Warmup Train [21][2560/3239]	Time 0.475 (0.514)	Data 0.001 (0.012)	Loss 4.5138 (4.4575)	Top-1 acc 20.312 (22.498)	Top-5 acc 40.234 (44.167)	lr 0.02345
Warmup Train [21][2570/3239]	Time 0.580 (0.514)	Data 0.001 (0.012)	Loss 4.3818 (4.4575)	Top-1 acc 23.828 (22.498)	Top-5 acc 47.656 (44.169)	lr 0.02344
Warmup Train [21][2580/3239]	Time 0.521 (0.514)	Data 0.001 (0.012)	Loss 4.6049 (4.4574)	Top-1 acc 19.141 (22.498)	Top-5 acc 39.453 (44.171)	lr 0.02344
Warmup Train [21][2590/3239]	Time 0.643 (0.514)	Data 0.001 (0.012)	Loss 4.4892 (4.4572)	Top-1 acc 20.703 (22.499)	Top-5 acc 45.703 (44.175)	lr 0.02343
Warmup Train [21][2600/3239]	Time 0.382 (0.514)	Data 0.001 (0.012)	Loss 4.5017 (4.4573)	Top-1 acc 21.484 (22.497)	Top-5 acc 42.969 (44.175)	lr 0.02343
Warmup Train [21][2610/3239]	Time 0.524 (0.513)	Data 0.001 (0.012)	Loss 4.4510 (4.4571)	Top-1 acc 22.266 (22.498)	Top-5 acc 41.406 (44.175)	lr 0.02342
Warmup Train [21][2620/3239]	Time 0.621 (0.514)	Data 0.001 (0.012)	Loss 4.5174 (4.4570)	Top-1 acc 21.484 (22.503)	Top-5 acc 43.359 (44.177)	lr 0.02341
Warmup Train [21][2630/3239]	Time 0.617 (0.514)	Data 0.001 (0.012)	Loss 4.4082 (4.4568)	Top-1 acc 23.828 (22.505)	Top-5 acc 46.875 (44.180)	lr 0.02341
Warmup Train [21][2640/3239]	Time 0.456 (0.513)	Data 0.001 (0.012)	Loss 4.4452 (4.4568)	Top-1 acc 23.438 (22.504)	Top-5 acc 42.969 (44.180)	lr 0.02340
Warmup Train [21][2650/3239]	Time 0.532 (0.513)	Data 0.001 (0.012)	Loss 4.3005 (4.4565)	Top-1 acc 27.344 (22.509)	Top-5 acc 48.438 (44.183)	lr 0.02340
Warmup Train [21][2660/3239]	Time 0.521 (0.513)	Data 0.001 (0.012)	Loss 4.2887 (4.4565)	Top-1 acc 25.781 (22.511)	Top-5 acc 51.562 (44.184)	lr 0.02339
Warmup Train [21][2670/3239]	Time 0.541 (0.513)	Data 0.001 (0.012)	Loss 4.4530 (4.4567)	Top-1 acc 22.266 (22.508)	Top-5 acc 44.531 (44.179)	lr 0.02338
Warmup Train [21][2680/3239]	Time 0.607 (0.513)	Data 0.001 (0.012)	Loss 4.3379 (4.4565)	Top-1 acc 21.094 (22.511)	Top-5 acc 47.656 (44.184)	lr 0.02338
Warmup Train [21][2690/3239]	Time 0.517 (0.513)	Data 0.001 (0.012)	Loss 4.3496 (4.4564)	Top-1 acc 25.781 (22.513)	Top-5 acc 50.391 (44.189)	lr 0.02337
Warmup Train [21][2700/3239]	Time 0.460 (0.513)	Data 0.001 (0.012)	Loss 4.3841 (4.4566)	Top-1 acc 23.047 (22.508)	Top-5 acc 45.312 (44.184)	lr 0.02336
Warmup Train [21][2710/3239]	Time 0.427 (0.513)	Data 0.003 (0.012)	Loss 4.2504 (4.4562)	Top-1 acc 26.562 (22.513)	Top-5 acc 46.875 (44.189)	lr 0.02336
Warmup Train [21][2720/3239]	Time 0.422 (0.513)	Data 0.001 (0.012)	Loss 4.2280 (4.4562)	Top-1 acc 23.828 (22.515)	Top-5 acc 45.703 (44.188)	lr 0.02335
Warmup Train [21][2730/3239]	Time 0.530 (0.513)	Data 0.001 (0.012)	Loss 4.3318 (4.4562)	Top-1 acc 23.047 (22.515)	Top-5 acc 46.875 (44.190)	lr 0.02335
Warmup Train [21][2740/3239]	Time 0.509 (0.513)	Data 0.001 (0.012)	Loss 4.4674 (4.4561)	Top-1 acc 23.047 (22.520)	Top-5 acc 47.266 (44.195)	lr 0.02334
Warmup Train [21][2750/3239]	Time 0.516 (0.513)	Data 0.001 (0.012)	Loss 4.5419 (4.4561)	Top-1 acc 21.484 (22.519)	Top-5 acc 40.625 (44.192)	lr 0.02333
Warmup Train [21][2760/3239]	Time 0.546 (0.513)	Data 0.001 (0.011)	Loss 4.4770 (4.4560)	Top-1 acc 21.875 (22.519)	Top-5 acc 42.969 (44.195)	lr 0.02333
Warmup Train [21][2770/3239]	Time 0.777 (0.513)	Data 0.001 (0.011)	Loss 4.4443 (4.4559)	Top-1 acc 23.047 (22.525)	Top-5 acc 42.188 (44.197)	lr 0.02332
Warmup Train [21][2780/3239]	Time 0.526 (0.513)	Data 0.001 (0.011)	Loss 4.3929 (4.4557)	Top-1 acc 21.875 (22.527)	Top-5 acc 45.312 (44.198)	lr 0.02332
Warmup Train [21][2790/3239]	Time 0.473 (0.513)	Data 0.001 (0.011)	Loss 4.2725 (4.4558)	Top-1 acc 25.781 (22.525)	Top-5 acc 51.172 (44.200)	lr 0.02331
Warmup Train [21][2800/3239]	Time 0.451 (0.513)	Data 0.001 (0.011)	Loss 4.2880 (4.4557)	Top-1 acc 25.391 (22.525)	Top-5 acc 48.438 (44.203)	lr 0.02330
Warmup Train [21][2810/3239]	Time 0.437 (0.513)	Data 0.001 (0.011)	Loss 4.5489 (4.4558)	Top-1 acc 23.438 (22.524)	Top-5 acc 42.188 (44.198)	lr 0.02330
Warmup Train [21][2820/3239]	Time 0.538 (0.513)	Data 0.001 (0.011)	Loss 4.6987 (4.4559)	Top-1 acc 18.359 (22.527)	Top-5 acc 37.891 (44.197)	lr 0.02329
Warmup Train [21][2830/3239]	Time 0.357 (0.513)	Data 0.001 (0.011)	Loss 4.3399 (4.4556)	Top-1 acc 27.344 (22.530)	Top-5 acc 47.656 (44.206)	lr 0.02329
Warmup Train [21][2840/3239]	Time 0.317 (0.513)	Data 0.001 (0.011)	Loss 4.4405 (4.4555)	Top-1 acc 21.484 (22.532)	Top-5 acc 44.922 (44.208)	lr 0.02328
Warmup Train [21][2850/3239]	Time 0.479 (0.513)	Data 0.001 (0.011)	Loss 4.4568 (4.4553)	Top-1 acc 26.562 (22.536)	Top-5 acc 45.312 (44.214)	lr 0.02327
Warmup Train [21][2860/3239]	Time 0.576 (0.513)	Data 0.001 (0.011)	Loss 4.4766 (4.4552)	Top-1 acc 18.750 (22.540)	Top-5 acc 41.797 (44.220)	lr 0.02327
Warmup Train [21][2870/3239]	Time 0.589 (0.513)	Data 0.001 (0.011)	Loss 4.5718 (4.4552)	Top-1 acc 24.609 (22.543)	Top-5 acc 41.016 (44.220)	lr 0.02326
Warmup Train [21][2880/3239]	Time 0.618 (0.513)	Data 0.001 (0.011)	Loss 4.4469 (4.4550)	Top-1 acc 21.875 (22.543)	Top-5 acc 46.484 (44.225)	lr 0.02326
Warmup Train [21][2890/3239]	Time 0.702 (0.513)	Data 0.001 (0.011)	Loss 4.5753 (4.4551)	Top-1 acc 22.656 (22.541)	Top-5 acc 42.188 (44.223)	lr 0.02325
Warmup Train [21][2900/3239]	Time 0.379 (0.513)	Data 0.001 (0.011)	Loss 4.5055 (4.4551)	Top-1 acc 20.312 (22.539)	Top-5 acc 38.672 (44.224)	lr 0.02324
Warmup Train [21][2910/3239]	Time 0.555 (0.513)	Data 0.001 (0.011)	Loss 4.3072 (4.4550)	Top-1 acc 25.781 (22.543)	Top-5 acc 49.219 (44.228)	lr 0.02324
Warmup Train [21][2920/3239]	Time 0.480 (0.513)	Data 0.001 (0.011)	Loss 4.6162 (4.4548)	Top-1 acc 18.359 (22.548)	Top-5 acc 40.625 (44.234)	lr 0.02323
Warmup Train [21][2930/3239]	Time 0.463 (0.513)	Data 0.001 (0.011)	Loss 4.5374 (4.4546)	Top-1 acc 18.359 (22.552)	Top-5 acc 41.406 (44.237)	lr 0.02323
Warmup Train [21][2940/3239]	Time 0.467 (0.513)	Data 0.001 (0.011)	Loss 4.4430 (4.4545)	Top-1 acc 23.828 (22.557)	Top-5 acc 44.922 (44.242)	lr 0.02322
Warmup Train [21][2950/3239]	Time 0.499 (0.513)	Data 0.001 (0.011)	Loss 4.4600 (4.4545)	Top-1 acc 24.219 (22.557)	Top-5 acc 43.359 (44.242)	lr 0.02321
Warmup Train [21][2960/3239]	Time 0.663 (0.513)	Data 0.001 (0.011)	Loss 4.3848 (4.4545)	Top-1 acc 23.438 (22.559)	Top-5 acc 46.094 (44.244)	lr 0.02321
Warmup Train [21][2970/3239]	Time 0.599 (0.513)	Data 0.001 (0.011)	Loss 4.4166 (4.4543)	Top-1 acc 25.781 (22.562)	Top-5 acc 46.875 (44.247)	lr 0.02320
Warmup Train [21][2980/3239]	Time 0.453 (0.513)	Data 0.001 (0.011)	Loss 4.1593 (4.4539)	Top-1 acc 28.125 (22.571)	Top-5 acc 49.609 (44.260)	lr 0.02320
Warmup Train [21][2990/3239]	Time 0.434 (0.513)	Data 0.001 (0.011)	Loss 4.5190 (4.4539)	Top-1 acc 21.094 (22.571)	Top-5 acc 44.141 (44.258)	lr 0.02319
Warmup Train [21][3000/3239]	Time 0.371 (0.513)	Data 0.001 (0.011)	Loss 4.3924 (4.4539)	Top-1 acc 24.219 (22.577)	Top-5 acc 44.922 (44.261)	lr 0.02318
Warmup Train [21][3010/3239]	Time 0.334 (0.513)	Data 0.001 (0.011)	Loss 4.3679 (4.4537)	Top-1 acc 21.484 (22.584)	Top-5 acc 47.266 (44.266)	lr 0.02318
Warmup Train [21][3020/3239]	Time 0.450 (0.513)	Data 0.001 (0.011)	Loss 4.3921 (4.4536)	Top-1 acc 23.047 (22.579)	Top-5 acc 45.312 (44.266)	lr 0.02317
Warmup Train [21][3030/3239]	Time 0.472 (0.513)	Data 0.001 (0.011)	Loss 4.2031 (4.4536)	Top-1 acc 25.781 (22.576)	Top-5 acc 47.656 (44.265)	lr 0.02317
Warmup Train [21][3040/3239]	Time 0.543 (0.513)	Data 0.001 (0.011)	Loss 4.3848 (4.4535)	Top-1 acc 25.000 (22.574)	Top-5 acc 46.094 (44.263)	lr 0.02316
Warmup Train [21][3050/3239]	Time 0.464 (0.513)	Data 0.001 (0.011)	Loss 4.5047 (4.4537)	Top-1 acc 22.266 (22.572)	Top-5 acc 44.531 (44.259)	lr 0.02315
Warmup Train [21][3060/3239]	Time 0.505 (0.513)	Data 0.001 (0.011)	Loss 4.4629 (4.4536)	Top-1 acc 24.609 (22.576)	Top-5 acc 46.094 (44.264)	lr 0.02315
Warmup Train [21][3070/3239]	Time 0.423 (0.513)	Data 0.001 (0.011)	Loss 4.3703 (4.4536)	Top-1 acc 23.438 (22.579)	Top-5 acc 48.438 (44.265)	lr 0.02314
Warmup Train [21][3080/3239]	Time 0.545 (0.513)	Data 0.001 (0.011)	Loss 4.3981 (4.4537)	Top-1 acc 23.438 (22.578)	Top-5 acc 44.922 (44.260)	lr 0.02314
Warmup Train [21][3090/3239]	Time 0.525 (0.513)	Data 0.001 (0.011)	Loss 4.5419 (4.4537)	Top-1 acc 20.312 (22.577)	Top-5 acc 40.234 (44.260)	lr 0.02313
Warmup Train [21][3100/3239]	Time 0.594 (0.513)	Data 0.001 (0.011)	Loss 4.5007 (4.4535)	Top-1 acc 20.312 (22.578)	Top-5 acc 41.406 (44.262)	lr 0.02312
Warmup Train [21][3110/3239]	Time 0.648 (0.513)	Data 0.001 (0.011)	Loss 4.6371 (4.4536)	Top-1 acc 21.875 (22.579)	Top-5 acc 39.844 (44.262)	lr 0.02312
Warmup Train [21][3120/3239]	Time 0.499 (0.513)	Data 0.001 (0.011)	Loss 4.6418 (4.4537)	Top-1 acc 18.359 (22.576)	Top-5 acc 41.797 (44.262)	lr 0.02311
Warmup Train [21][3130/3239]	Time 0.546 (0.513)	Data 0.001 (0.011)	Loss 4.3715 (4.4536)	Top-1 acc 22.656 (22.577)	Top-5 acc 47.656 (44.266)	lr 0.02310
Warmup Train [21][3140/3239]	Time 0.546 (0.513)	Data 0.002 (0.011)	Loss 4.4651 (4.4534)	Top-1 acc 23.047 (22.581)	Top-5 acc 44.141 (44.269)	lr 0.02310
Warmup Train [21][3150/3239]	Time 0.427 (0.513)	Data 0.001 (0.011)	Loss 4.5324 (4.4534)	Top-1 acc 25.391 (22.583)	Top-5 acc 43.750 (44.271)	lr 0.02309
Warmup Train [21][3160/3239]	Time 0.507 (0.513)	Data 0.001 (0.011)	Loss 4.3880 (4.4534)	Top-1 acc 22.656 (22.585)	Top-5 acc 42.969 (44.271)	lr 0.02309
Warmup Train [21][3170/3239]	Time 0.506 (0.513)	Data 0.001 (0.011)	Loss 4.4362 (4.4534)	Top-1 acc 23.047 (22.583)	Top-5 acc 45.312 (44.270)	lr 0.02308
Warmup Train [21][3180/3239]	Time 0.540 (0.513)	Data 0.000 (0.011)	Loss 4.5143 (4.4533)	Top-1 acc 25.391 (22.587)	Top-5 acc 41.797 (44.274)	lr 0.02307
Warmup Train [21][3190/3239]	Time 0.512 (0.513)	Data 0.000 (0.011)	Loss 4.2292 (4.4530)	Top-1 acc 29.688 (22.594)	Top-5 acc 51.172 (44.280)	lr 0.02307
Warmup Train [21][3200/3239]	Time 0.653 (0.513)	Data 0.000 (0.011)	Loss 4.4096 (4.4531)	Top-1 acc 22.656 (22.594)	Top-5 acc 46.094 (44.283)	lr 0.02306
Warmup Train [21][3210/3239]	Time 0.347 (0.513)	Data 0.000 (0.011)	Loss 4.4837 (4.4531)	Top-1 acc 21.484 (22.593)	Top-5 acc 45.703 (44.285)	lr 0.02306
Warmup Train [21][3220/3239]	Time 0.483 (0.513)	Data 0.000 (0.011)	Loss 4.4971 (4.4529)	Top-1 acc 19.922 (22.597)	Top-5 acc 40.625 (44.288)	lr 0.02305
Warmup Train [21][3230/3239]	Time 0.564 (0.513)	Data 0.000 (0.011)	Loss 4.3506 (4.4527)	Top-1 acc 25.781 (22.602)	Top-5 acc 46.875 (44.295)	lr 0.02304
Warmup Train [21][3239/3239]	Time 0.361 (0.513)	Data 0.000 (0.011)	Loss 4.2298 (4.4526)	Top-1 acc 30.864 (22.601)	Top-5 acc 54.321 (44.294)	lr 0.02304
==========Warmup Valid [21/40]	loss 3.448	top-1 acc 29.858	top-5 acc 54.181	Train top-1 22.601	top-5 44.294	flops: 442.4M
Warmup Train [22][0/3239]	Time 15.385 (15.385)	Data 12.975 (12.975)	Loss 4.3286 (4.3286)	Top-1 acc 25.391 (25.391)	Top-5 acc 48.828 (48.828)	lr 0.02304
Warmup Train [22][10/3239]	Time 0.597 (1.927)	Data 0.001 (1.183)	Loss 4.5018 (4.4646)	Top-1 acc 23.438 (22.940)	Top-5 acc 42.188 (44.070)	lr 0.02303
Warmup Train [22][20/3239]	Time 0.484 (1.248)	Data 0.001 (0.621)	Loss 4.3992 (4.4299)	Top-1 acc 23.438 (23.084)	Top-5 acc 43.750 (44.792)	lr 0.02303
Warmup Train [22][30/3239]	Time 0.592 (1.005)	Data 0.001 (0.421)	Loss 4.3543 (4.4396)	Top-1 acc 23.828 (22.732)	Top-5 acc 50.781 (44.695)	lr 0.02302
Warmup Train [22][40/3239]	Time 0.437 (0.886)	Data 0.001 (0.319)	Loss 4.5884 (4.4341)	Top-1 acc 21.094 (22.942)	Top-5 acc 40.625 (44.798)	lr 0.02301
Warmup Train [22][50/3239]	Time 0.371 (0.812)	Data 0.001 (0.259)	Loss 4.6186 (4.4333)	Top-1 acc 14.062 (22.924)	Top-5 acc 38.672 (44.914)	lr 0.02301
Warmup Train [22][60/3239]	Time 0.557 (0.767)	Data 0.001 (0.218)	Loss 4.3536 (4.4254)	Top-1 acc 25.391 (23.181)	Top-5 acc 47.656 (45.120)	lr 0.02300
Warmup Train [22][70/3239]	Time 0.509 (0.729)	Data 0.001 (0.188)	Loss 4.2720 (4.4224)	Top-1 acc 21.875 (23.140)	Top-5 acc 46.094 (45.092)	lr 0.02300
Warmup Train [22][80/3239]	Time 0.587 (0.702)	Data 0.001 (0.165)	Loss 4.2349 (4.4211)	Top-1 acc 28.516 (23.283)	Top-5 acc 49.609 (45.081)	lr 0.02299
Warmup Train [22][90/3239]	Time 0.618 (0.682)	Data 0.001 (0.147)	Loss 4.5869 (4.4216)	Top-1 acc 22.266 (23.197)	Top-5 acc 42.578 (44.986)	lr 0.02298
Warmup Train [22][100/3239]	Time 0.710 (0.668)	Data 0.001 (0.133)	Loss 4.4894 (4.4268)	Top-1 acc 21.484 (23.109)	Top-5 acc 41.797 (44.868)	lr 0.02298
Warmup Train [22][110/3239]	Time 0.522 (0.652)	Data 0.001 (0.121)	Loss 4.4324 (4.4278)	Top-1 acc 19.922 (23.128)	Top-5 acc 42.578 (44.880)	lr 0.02297
Warmup Train [22][120/3239]	Time 0.545 (0.640)	Data 0.001 (0.112)	Loss 4.5377 (4.4308)	Top-1 acc 22.266 (23.047)	Top-5 acc 43.750 (44.841)	lr 0.02297
Warmup Train [22][130/3239]	Time 0.518 (0.632)	Data 0.001 (0.104)	Loss 4.4169 (4.4308)	Top-1 acc 21.484 (23.035)	Top-5 acc 43.359 (44.800)	lr 0.02296
Warmup Train [22][140/3239]	Time 0.396 (0.619)	Data 0.001 (0.097)	Loss 4.4499 (4.4285)	Top-1 acc 23.828 (23.011)	Top-5 acc 45.703 (44.797)	lr 0.02295
Warmup Train [22][150/3239]	Time 0.604 (0.612)	Data 0.001 (0.091)	Loss 4.3830 (4.4267)	Top-1 acc 23.047 (23.000)	Top-5 acc 43.359 (44.769)	lr 0.02295
Warmup Train [22][160/3239]	Time 0.491 (0.603)	Data 0.001 (0.086)	Loss 4.3494 (4.4259)	Top-1 acc 24.609 (23.006)	Top-5 acc 48.438 (44.750)	lr 0.02294
Warmup Train [22][170/3239]	Time 0.543 (0.595)	Data 0.001 (0.081)	Loss 4.5366 (4.4287)	Top-1 acc 22.266 (22.994)	Top-5 acc 43.750 (44.728)	lr 0.02294
Warmup Train [22][180/3239]	Time 0.472 (0.587)	Data 0.002 (0.077)	Loss 4.6944 (4.4306)	Top-1 acc 18.359 (22.943)	Top-5 acc 39.062 (44.734)	lr 0.02293
Warmup Train [22][190/3239]	Time 0.374 (0.582)	Data 0.001 (0.073)	Loss 4.6901 (4.4306)	Top-1 acc 14.062 (22.900)	Top-5 acc 37.891 (44.734)	lr 0.02292
Warmup Train [22][200/3239]	Time 0.627 (0.579)	Data 0.001 (0.070)	Loss 4.4194 (4.4293)	Top-1 acc 20.703 (22.954)	Top-5 acc 45.703 (44.801)	lr 0.02292
Warmup Train [22][210/3239]	Time 0.444 (0.576)	Data 0.001 (0.067)	Loss 4.3909 (4.4278)	Top-1 acc 19.922 (23.010)	Top-5 acc 46.875 (44.887)	lr 0.02291
Warmup Train [22][220/3239]	Time 0.357 (0.573)	Data 0.001 (0.064)	Loss 4.2967 (4.4263)	Top-1 acc 26.172 (22.983)	Top-5 acc 47.266 (44.904)	lr 0.02291
Warmup Train [22][230/3239]	Time 0.602 (0.572)	Data 0.001 (0.062)	Loss 4.3883 (4.4235)	Top-1 acc 22.656 (23.040)	Top-5 acc 46.094 (44.937)	lr 0.02290
Warmup Train [22][240/3239]	Time 0.526 (0.570)	Data 0.001 (0.059)	Loss 4.5332 (4.4228)	Top-1 acc 22.266 (23.087)	Top-5 acc 43.359 (44.948)	lr 0.02289
Warmup Train [22][250/3239]	Time 0.545 (0.568)	Data 0.002 (0.057)	Loss 4.5285 (4.4240)	Top-1 acc 20.312 (23.104)	Top-5 acc 40.234 (44.925)	lr 0.02289
Warmup Train [22][260/3239]	Time 0.531 (0.566)	Data 0.001 (0.055)	Loss 4.3271 (4.4228)	Top-1 acc 22.656 (23.131)	Top-5 acc 44.531 (44.940)	lr 0.02288
Warmup Train [22][270/3239]	Time 0.441 (0.564)	Data 0.001 (0.053)	Loss 4.2887 (4.4216)	Top-1 acc 25.000 (23.167)	Top-5 acc 45.703 (44.941)	lr 0.02288
Warmup Train [22][280/3239]	Time 0.488 (0.562)	Data 0.001 (0.052)	Loss 4.4298 (4.4205)	Top-1 acc 17.969 (23.137)	Top-5 acc 44.922 (44.941)	lr 0.02287
Warmup Train [22][290/3239]	Time 0.493 (0.560)	Data 0.001 (0.050)	Loss 4.4148 (4.4198)	Top-1 acc 27.344 (23.146)	Top-5 acc 48.047 (44.990)	lr 0.02286
Warmup Train [22][300/3239]	Time 0.471 (0.558)	Data 0.001 (0.048)	Loss 4.4580 (4.4193)	Top-1 acc 23.828 (23.151)	Top-5 acc 45.312 (45.022)	lr 0.02286
Warmup Train [22][310/3239]	Time 0.591 (0.557)	Data 0.001 (0.047)	Loss 4.3939 (4.4199)	Top-1 acc 25.781 (23.118)	Top-5 acc 49.609 (45.022)	lr 0.02285
Warmup Train [22][320/3239]	Time 0.403 (0.555)	Data 0.001 (0.046)	Loss 4.6025 (4.4209)	Top-1 acc 19.531 (23.081)	Top-5 acc 39.844 (45.023)	lr 0.02285
Warmup Train [22][330/3239]	Time 0.399 (0.555)	Data 0.001 (0.045)	Loss 4.5023 (4.4207)	Top-1 acc 23.047 (23.111)	Top-5 acc 40.234 (45.023)	lr 0.02284
Warmup Train [22][340/3239]	Time 0.505 (0.554)	Data 0.001 (0.043)	Loss 4.4811 (4.4195)	Top-1 acc 18.359 (23.114)	Top-5 acc 41.016 (45.056)	lr 0.02283
Warmup Train [22][350/3239]	Time 0.486 (0.553)	Data 0.001 (0.042)	Loss 4.2072 (4.4183)	Top-1 acc 27.734 (23.178)	Top-5 acc 48.828 (45.094)	lr 0.02283
Warmup Train [22][360/3239]	Time 0.529 (0.552)	Data 0.001 (0.041)	Loss 4.5606 (4.4186)	Top-1 acc 22.656 (23.179)	Top-5 acc 44.531 (45.087)	lr 0.02282
Warmup Train [22][370/3239]	Time 0.547 (0.551)	Data 0.001 (0.040)	Loss 4.4854 (4.4176)	Top-1 acc 21.094 (23.191)	Top-5 acc 42.578 (45.102)	lr 0.02282
Warmup Train [22][380/3239]	Time 0.562 (0.550)	Data 0.001 (0.039)	Loss 4.4098 (4.4177)	Top-1 acc 25.391 (23.175)	Top-5 acc 43.750 (45.066)	lr 0.02281
Warmup Train [22][390/3239]	Time 0.363 (0.548)	Data 0.001 (0.038)	Loss 4.3624 (4.4182)	Top-1 acc 23.828 (23.167)	Top-5 acc 43.750 (45.052)	lr 0.02280
Warmup Train [22][400/3239]	Time 0.395 (0.546)	Data 0.001 (0.038)	Loss 4.3968 (4.4176)	Top-1 acc 24.609 (23.193)	Top-5 acc 42.578 (45.056)	lr 0.02280
Warmup Train [22][410/3239]	Time 0.581 (0.545)	Data 0.001 (0.037)	Loss 4.4919 (4.4171)	Top-1 acc 21.094 (23.186)	Top-5 acc 45.703 (45.051)	lr 0.02279
Warmup Train [22][420/3239]	Time 0.422 (0.544)	Data 0.001 (0.036)	Loss 4.5466 (4.4179)	Top-1 acc 20.703 (23.190)	Top-5 acc 39.844 (44.994)	lr 0.02278
Warmup Train [22][430/3239]	Time 0.554 (0.542)	Data 0.001 (0.036)	Loss 4.7043 (4.4177)	Top-1 acc 16.016 (23.192)	Top-5 acc 37.891 (45.027)	lr 0.02278
Warmup Train [22][440/3239]	Time 0.475 (0.541)	Data 0.001 (0.035)	Loss 4.5960 (4.4182)	Top-1 acc 16.016 (23.184)	Top-5 acc 42.969 (45.041)	lr 0.02277
Warmup Train [22][450/3239]	Time 0.617 (0.541)	Data 0.001 (0.035)	Loss 4.2824 (4.4184)	Top-1 acc 28.125 (23.185)	Top-5 acc 48.438 (45.048)	lr 0.02277
Warmup Train [22][460/3239]	Time 0.407 (0.540)	Data 0.001 (0.034)	Loss 4.2515 (4.4181)	Top-1 acc 25.391 (23.171)	Top-5 acc 50.391 (45.056)	lr 0.02276
Warmup Train [22][470/3239]	Time 0.579 (0.540)	Data 0.001 (0.033)	Loss 4.2678 (4.4176)	Top-1 acc 24.219 (23.165)	Top-5 acc 47.656 (45.065)	lr 0.02275
Warmup Train [22][480/3239]	Time 0.520 (0.540)	Data 0.001 (0.033)	Loss 4.5343 (4.4173)	Top-1 acc 22.656 (23.195)	Top-5 acc 42.188 (45.072)	lr 0.02275
Warmup Train [22][490/3239]	Time 0.499 (0.540)	Data 0.001 (0.032)	Loss 4.3819 (4.4164)	Top-1 acc 24.219 (23.184)	Top-5 acc 44.531 (45.104)	lr 0.02274
Warmup Train [22][500/3239]	Time 0.469 (0.540)	Data 0.001 (0.032)	Loss 4.1807 (4.4160)	Top-1 acc 28.906 (23.180)	Top-5 acc 53.516 (45.100)	lr 0.02274
Warmup Train [22][510/3239]	Time 0.511 (0.539)	Data 0.001 (0.031)	Loss 4.2686 (4.4167)	Top-1 acc 21.875 (23.180)	Top-5 acc 47.656 (45.072)	lr 0.02273
Warmup Train [22][520/3239]	Time 0.498 (0.539)	Data 0.001 (0.031)	Loss 4.4339 (4.4171)	Top-1 acc 22.266 (23.185)	Top-5 acc 45.312 (45.061)	lr 0.02272
Warmup Train [22][530/3239]	Time 0.549 (0.538)	Data 0.001 (0.030)	Loss 4.5096 (4.4166)	Top-1 acc 18.750 (23.181)	Top-5 acc 42.969 (45.076)	lr 0.02272
Warmup Train [22][540/3239]	Time 0.404 (0.538)	Data 0.001 (0.030)	Loss 4.7248 (4.4170)	Top-1 acc 15.625 (23.170)	Top-5 acc 38.672 (45.071)	lr 0.02271
Warmup Train [22][550/3239]	Time 0.404 (0.538)	Data 0.001 (0.030)	Loss 4.4136 (4.4173)	Top-1 acc 23.047 (23.186)	Top-5 acc 44.141 (45.047)	lr 0.02271
Warmup Train [22][560/3239]	Time 0.562 (0.537)	Data 0.001 (0.029)	Loss 4.5231 (4.4177)	Top-1 acc 24.609 (23.188)	Top-5 acc 42.578 (45.037)	lr 0.02270
Warmup Train [22][570/3239]	Time 0.475 (0.537)	Data 0.001 (0.029)	Loss 4.4375 (4.4182)	Top-1 acc 23.828 (23.188)	Top-5 acc 43.359 (45.028)	lr 0.02269
Warmup Train [22][580/3239]	Time 0.655 (0.537)	Data 0.001 (0.028)	Loss 4.5479 (4.4179)	Top-1 acc 21.875 (23.204)	Top-5 acc 41.797 (45.021)	lr 0.02269
Warmup Train [22][590/3239]	Time 0.610 (0.536)	Data 0.002 (0.028)	Loss 4.3097 (4.4179)	Top-1 acc 26.562 (23.186)	Top-5 acc 50.391 (45.013)	lr 0.02268
Warmup Train [22][600/3239]	Time 0.550 (0.536)	Data 0.001 (0.028)	Loss 4.3324 (4.4183)	Top-1 acc 26.562 (23.184)	Top-5 acc 46.094 (45.003)	lr 0.02268
Warmup Train [22][610/3239]	Time 0.584 (0.536)	Data 0.001 (0.027)	Loss 4.5437 (4.4179)	Top-1 acc 20.312 (23.191)	Top-5 acc 40.625 (45.004)	lr 0.02267
Warmup Train [22][620/3239]	Time 0.712 (0.536)	Data 0.001 (0.027)	Loss 4.4391 (4.4175)	Top-1 acc 25.781 (23.202)	Top-5 acc 44.531 (44.999)	lr 0.02266
Warmup Train [22][630/3239]	Time 0.614 (0.535)	Data 0.001 (0.026)	Loss 4.5495 (4.4176)	Top-1 acc 17.969 (23.190)	Top-5 acc 40.625 (44.989)	lr 0.02266
Warmup Train [22][640/3239]	Time 0.421 (0.534)	Data 0.001 (0.026)	Loss 4.3394 (4.4181)	Top-1 acc 28.125 (23.204)	Top-5 acc 48.047 (45.002)	lr 0.02265
Warmup Train [22][650/3239]	Time 0.356 (0.533)	Data 0.001 (0.026)	Loss 4.5323 (4.4188)	Top-1 acc 27.344 (23.191)	Top-5 acc 44.141 (44.984)	lr 0.02265
Warmup Train [22][660/3239]	Time 0.561 (0.532)	Data 0.001 (0.026)	Loss 4.5700 (4.4190)	Top-1 acc 20.703 (23.176)	Top-5 acc 43.359 (44.993)	lr 0.02264
Warmup Train [22][670/3239]	Time 0.520 (0.531)	Data 0.001 (0.025)	Loss 4.2527 (4.4193)	Top-1 acc 25.000 (23.167)	Top-5 acc 48.438 (44.992)	lr 0.02263
Warmup Train [22][680/3239]	Time 0.494 (0.530)	Data 0.001 (0.025)	Loss 4.4037 (4.4184)	Top-1 acc 23.828 (23.185)	Top-5 acc 44.922 (45.014)	lr 0.02263
Warmup Train [22][690/3239]	Time 0.628 (0.530)	Data 0.001 (0.025)	Loss 4.3892 (4.4190)	Top-1 acc 24.219 (23.189)	Top-5 acc 43.359 (45.005)	lr 0.02262
Warmup Train [22][700/3239]	Time 0.474 (0.530)	Data 0.001 (0.024)	Loss 4.6221 (4.4196)	Top-1 acc 21.875 (23.177)	Top-5 acc 43.359 (44.993)	lr 0.02262
Warmup Train [22][710/3239]	Time 0.392 (0.529)	Data 0.001 (0.024)	Loss 4.4220 (4.4196)	Top-1 acc 22.266 (23.178)	Top-5 acc 46.484 (44.988)	lr 0.02261
Warmup Train [22][720/3239]	Time 0.516 (0.529)	Data 0.001 (0.024)	Loss 4.3684 (4.4194)	Top-1 acc 24.219 (23.183)	Top-5 acc 44.922 (44.972)	lr 0.02260
Warmup Train [22][730/3239]	Time 0.298 (0.529)	Data 0.002 (0.024)	Loss 4.3774 (4.4192)	Top-1 acc 21.875 (23.194)	Top-5 acc 45.312 (44.982)	lr 0.02260
Warmup Train [22][740/3239]	Time 0.485 (0.529)	Data 0.001 (0.024)	Loss 4.3502 (4.4191)	Top-1 acc 25.000 (23.203)	Top-5 acc 44.922 (44.990)	lr 0.02259
Warmup Train [22][750/3239]	Time 0.718 (0.528)	Data 0.001 (0.024)	Loss 4.4545 (4.4195)	Top-1 acc 19.531 (23.186)	Top-5 acc 48.438 (44.984)	lr 0.02259
Warmup Train [22][760/3239]	Time 0.396 (0.528)	Data 0.021 (0.023)	Loss 4.4449 (4.4196)	Top-1 acc 24.609 (23.185)	Top-5 acc 48.828 (44.976)	lr 0.02258
Warmup Train [22][770/3239]	Time 0.617 (0.528)	Data 0.001 (0.023)	Loss 4.3135 (4.4188)	Top-1 acc 27.344 (23.197)	Top-5 acc 45.703 (44.995)	lr 0.02257
Warmup Train [22][780/3239]	Time 0.505 (0.528)	Data 0.001 (0.023)	Loss 4.3335 (4.4188)	Top-1 acc 25.000 (23.189)	Top-5 acc 44.922 (44.999)	lr 0.02257
Warmup Train [22][790/3239]	Time 0.609 (0.527)	Data 0.001 (0.023)	Loss 4.5355 (4.4192)	Top-1 acc 23.828 (23.185)	Top-5 acc 42.188 (44.995)	lr 0.02256
Warmup Train [22][800/3239]	Time 0.513 (0.527)	Data 0.001 (0.022)	Loss 4.6042 (4.4189)	Top-1 acc 16.406 (23.190)	Top-5 acc 38.672 (45.025)	lr 0.02256
Warmup Train [22][810/3239]	Time 0.481 (0.527)	Data 0.001 (0.022)	Loss 4.5346 (4.4196)	Top-1 acc 22.266 (23.175)	Top-5 acc 42.578 (45.011)	lr 0.02255
Warmup Train [22][820/3239]	Time 0.343 (0.527)	Data 0.001 (0.022)	Loss 4.3718 (4.4194)	Top-1 acc 23.438 (23.188)	Top-5 acc 46.094 (45.020)	lr 0.02254
Warmup Train [22][830/3239]	Time 0.561 (0.526)	Data 0.001 (0.022)	Loss 4.3400 (4.4193)	Top-1 acc 26.172 (23.199)	Top-5 acc 48.828 (45.030)	lr 0.02254
Warmup Train [22][840/3239]	Time 0.513 (0.526)	Data 0.002 (0.022)	Loss 4.5516 (4.4194)	Top-1 acc 20.312 (23.202)	Top-5 acc 44.531 (45.032)	lr 0.02253
Warmup Train [22][850/3239]	Time 0.432 (0.526)	Data 0.002 (0.021)	Loss 4.1684 (4.4193)	Top-1 acc 27.344 (23.202)	Top-5 acc 53.906 (45.043)	lr 0.02253
Warmup Train [22][860/3239]	Time 0.380 (0.526)	Data 0.001 (0.021)	Loss 4.4003 (4.4195)	Top-1 acc 21.484 (23.182)	Top-5 acc 46.094 (45.037)	lr 0.02252
Warmup Train [22][870/3239]	Time 0.522 (0.526)	Data 0.001 (0.021)	Loss 4.5468 (4.4198)	Top-1 acc 16.016 (23.164)	Top-5 acc 40.234 (45.038)	lr 0.02251
Warmup Train [22][880/3239]	Time 0.457 (0.526)	Data 0.002 (0.021)	Loss 4.4890 (4.4197)	Top-1 acc 24.609 (23.157)	Top-5 acc 44.531 (45.034)	lr 0.02251
Warmup Train [22][890/3239]	Time 0.500 (0.525)	Data 0.001 (0.021)	Loss 4.4747 (4.4200)	Top-1 acc 22.266 (23.156)	Top-5 acc 45.703 (45.032)	lr 0.02250
Warmup Train [22][900/3239]	Time 0.419 (0.525)	Data 0.001 (0.021)	Loss 4.3630 (4.4193)	Top-1 acc 24.609 (23.170)	Top-5 acc 48.828 (45.042)	lr 0.02250
Warmup Train [22][910/3239]	Time 0.173 (0.524)	Data 0.001 (0.021)	Loss 4.5184 (4.4191)	Top-1 acc 26.172 (23.185)	Top-5 acc 44.922 (45.040)	lr 0.02249
Warmup Train [22][920/3239]	Time 0.507 (0.524)	Data 0.001 (0.021)	Loss 4.1959 (4.4185)	Top-1 acc 29.297 (23.187)	Top-5 acc 48.438 (45.039)	lr 0.02248
Warmup Train [22][930/3239]	Time 0.494 (0.524)	Data 0.001 (0.020)	Loss 4.5567 (4.4184)	Top-1 acc 19.531 (23.184)	Top-5 acc 41.406 (45.041)	lr 0.02248
Warmup Train [22][940/3239]	Time 0.532 (0.524)	Data 0.001 (0.020)	Loss 4.4952 (4.4184)	Top-1 acc 19.531 (23.195)	Top-5 acc 43.750 (45.046)	lr 0.02247
Warmup Train [22][950/3239]	Time 0.483 (0.524)	Data 0.001 (0.020)	Loss 4.4536 (4.4184)	Top-1 acc 24.609 (23.202)	Top-5 acc 46.484 (45.050)	lr 0.02247
Warmup Train [22][960/3239]	Time 0.542 (0.524)	Data 0.001 (0.020)	Loss 4.2182 (4.4180)	Top-1 acc 23.047 (23.198)	Top-5 acc 52.734 (45.059)	lr 0.02246
Warmup Train [22][970/3239]	Time 0.435 (0.524)	Data 0.001 (0.020)	Loss 4.2916 (4.4176)	Top-1 acc 25.391 (23.207)	Top-5 acc 48.438 (45.063)	lr 0.02245
Warmup Train [22][980/3239]	Time 0.340 (0.523)	Data 0.001 (0.020)	Loss 4.4429 (4.4181)	Top-1 acc 21.484 (23.206)	Top-5 acc 43.750 (45.054)	lr 0.02245
Warmup Train [22][990/3239]	Time 0.506 (0.523)	Data 0.001 (0.020)	Loss 4.5431 (4.4181)	Top-1 acc 20.312 (23.199)	Top-5 acc 41.406 (45.057)	lr 0.02244
Warmup Train [22][1000/3239]	Time 0.646 (0.523)	Data 0.001 (0.019)	Loss 4.3809 (4.4181)	Top-1 acc 26.562 (23.205)	Top-5 acc 46.094 (45.066)	lr 0.02244
Warmup Train [22][1010/3239]	Time 0.507 (0.523)	Data 0.001 (0.019)	Loss 4.3261 (4.4176)	Top-1 acc 25.781 (23.220)	Top-5 acc 48.828 (45.078)	lr 0.02243
Warmup Train [22][1020/3239]	Time 0.358 (0.523)	Data 0.001 (0.019)	Loss 4.7394 (4.4169)	Top-1 acc 16.406 (23.213)	Top-5 acc 39.062 (45.103)	lr 0.02242
Warmup Train [22][1030/3239]	Time 0.280 (0.523)	Data 0.001 (0.019)	Loss 4.4240 (4.4167)	Top-1 acc 21.484 (23.219)	Top-5 acc 39.062 (45.108)	lr 0.02242
Warmup Train [22][1040/3239]	Time 0.416 (0.523)	Data 0.001 (0.019)	Loss 4.4838 (4.4161)	Top-1 acc 22.266 (23.236)	Top-5 acc 41.797 (45.125)	lr 0.02241
Warmup Train [22][1050/3239]	Time 0.357 (0.523)	Data 0.001 (0.019)	Loss 4.3423 (4.4161)	Top-1 acc 26.562 (23.227)	Top-5 acc 45.703 (45.124)	lr 0.02240
Warmup Train [22][1060/3239]	Time 0.538 (0.523)	Data 0.001 (0.019)	Loss 4.2679 (4.4158)	Top-1 acc 28.906 (23.241)	Top-5 acc 46.875 (45.131)	lr 0.02240
Warmup Train [22][1070/3239]	Time 0.624 (0.523)	Data 0.001 (0.019)	Loss 4.3301 (4.4160)	Top-1 acc 23.047 (23.238)	Top-5 acc 48.047 (45.132)	lr 0.02239
Warmup Train [22][1080/3239]	Time 0.405 (0.523)	Data 0.001 (0.019)	Loss 4.3288 (4.4159)	Top-1 acc 25.781 (23.239)	Top-5 acc 46.484 (45.125)	lr 0.02239
Warmup Train [22][1090/3239]	Time 0.502 (0.523)	Data 0.001 (0.019)	Loss 4.4411 (4.4160)	Top-1 acc 26.172 (23.233)	Top-5 acc 43.750 (45.113)	lr 0.02238
Warmup Train [22][1100/3239]	Time 0.497 (0.523)	Data 0.001 (0.018)	Loss 4.3017 (4.4156)	Top-1 acc 23.828 (23.232)	Top-5 acc 46.875 (45.128)	lr 0.02237
Warmup Train [22][1110/3239]	Time 0.446 (0.522)	Data 0.001 (0.018)	Loss 4.4491 (4.4159)	Top-1 acc 21.094 (23.233)	Top-5 acc 44.141 (45.121)	lr 0.02237
Warmup Train [22][1120/3239]	Time 0.402 (0.522)	Data 0.001 (0.018)	Loss 4.5057 (4.4163)	Top-1 acc 19.922 (23.220)	Top-5 acc 44.922 (45.121)	lr 0.02236
Warmup Train [22][1130/3239]	Time 0.470 (0.522)	Data 0.001 (0.018)	Loss 4.5876 (4.4161)	Top-1 acc 20.312 (23.231)	Top-5 acc 40.234 (45.126)	lr 0.02236
Warmup Train [22][1140/3239]	Time 0.623 (0.522)	Data 0.001 (0.018)	Loss 4.3872 (4.4162)	Top-1 acc 23.828 (23.233)	Top-5 acc 46.094 (45.118)	lr 0.02235
Warmup Train [22][1150/3239]	Time 0.399 (0.521)	Data 0.001 (0.018)	Loss 4.4122 (4.4161)	Top-1 acc 24.609 (23.237)	Top-5 acc 46.484 (45.126)	lr 0.02234
Warmup Train [22][1160/3239]	Time 0.636 (0.521)	Data 0.001 (0.018)	Loss 4.2983 (4.4163)	Top-1 acc 25.000 (23.237)	Top-5 acc 47.656 (45.121)	lr 0.02234
Warmup Train [22][1170/3239]	Time 0.534 (0.521)	Data 0.001 (0.018)	Loss 4.3900 (4.4161)	Top-1 acc 24.609 (23.245)	Top-5 acc 46.094 (45.132)	lr 0.02233
Warmup Train [22][1180/3239]	Time 0.445 (0.520)	Data 0.001 (0.018)	Loss 4.4985 (4.4163)	Top-1 acc 23.438 (23.251)	Top-5 acc 42.578 (45.127)	lr 0.02233
Warmup Train [22][1190/3239]	Time 0.568 (0.521)	Data 0.001 (0.018)	Loss 4.4258 (4.4160)	Top-1 acc 23.047 (23.258)	Top-5 acc 46.484 (45.133)	lr 0.02232
Warmup Train [22][1200/3239]	Time 0.470 (0.520)	Data 0.001 (0.017)	Loss 4.4486 (4.4159)	Top-1 acc 17.969 (23.258)	Top-5 acc 42.578 (45.133)	lr 0.02231
Warmup Train [22][1210/3239]	Time 0.467 (0.520)	Data 0.001 (0.017)	Loss 4.6487 (4.4159)	Top-1 acc 20.703 (23.264)	Top-5 acc 40.234 (45.142)	lr 0.02231
Warmup Train [22][1220/3239]	Time 0.580 (0.520)	Data 0.003 (0.017)	Loss 4.4337 (4.4152)	Top-1 acc 21.484 (23.273)	Top-5 acc 41.016 (45.154)	lr 0.02230
Warmup Train [22][1230/3239]	Time 0.569 (0.520)	Data 0.001 (0.017)	Loss 4.1418 (4.4148)	Top-1 acc 23.828 (23.276)	Top-5 acc 51.562 (45.166)	lr 0.02230
Warmup Train [22][1240/3239]	Time 0.545 (0.520)	Data 0.001 (0.017)	Loss 4.5291 (4.4150)	Top-1 acc 20.703 (23.266)	Top-5 acc 41.797 (45.165)	lr 0.02229
Warmup Train [22][1250/3239]	Time 0.557 (0.520)	Data 0.001 (0.017)	Loss 4.3890 (4.4150)	Top-1 acc 25.000 (23.269)	Top-5 acc 47.656 (45.169)	lr 0.02228
Warmup Train [22][1260/3239]	Time 0.404 (0.520)	Data 0.001 (0.017)	Loss 4.3373 (4.4150)	Top-1 acc 25.391 (23.276)	Top-5 acc 48.828 (45.172)	lr 0.02228
Warmup Train [22][1270/3239]	Time 0.476 (0.520)	Data 0.001 (0.017)	Loss 4.3901 (4.4149)	Top-1 acc 24.609 (23.277)	Top-5 acc 45.703 (45.175)	lr 0.02227
Warmup Train [22][1280/3239]	Time 0.567 (0.520)	Data 0.001 (0.017)	Loss 4.2486 (4.4149)	Top-1 acc 23.828 (23.276)	Top-5 acc 51.172 (45.177)	lr 0.02227
Warmup Train [22][1290/3239]	Time 0.358 (0.520)	Data 0.001 (0.016)	Loss 4.3002 (4.4148)	Top-1 acc 27.344 (23.273)	Top-5 acc 51.953 (45.190)	lr 0.02226
Warmup Train [22][1300/3239]	Time 0.367 (0.519)	Data 0.001 (0.016)	Loss 4.5024 (4.4150)	Top-1 acc 21.875 (23.272)	Top-5 acc 40.625 (45.184)	lr 0.02225
Warmup Train [22][1310/3239]	Time 0.491 (0.520)	Data 0.001 (0.016)	Loss 4.5013 (4.4152)	Top-1 acc 20.703 (23.264)	Top-5 acc 46.875 (45.190)	lr 0.02225
Warmup Train [22][1320/3239]	Time 0.416 (0.520)	Data 0.002 (0.016)	Loss 4.4221 (4.4153)	Top-1 acc 21.094 (23.260)	Top-5 acc 43.750 (45.189)	lr 0.02224
Warmup Train [22][1330/3239]	Time 0.502 (0.520)	Data 0.001 (0.016)	Loss 4.3556 (4.4153)	Top-1 acc 24.609 (23.260)	Top-5 acc 44.141 (45.179)	lr 0.02224
Warmup Train [22][1340/3239]	Time 0.543 (0.520)	Data 0.002 (0.016)	Loss 4.3002 (4.4153)	Top-1 acc 23.047 (23.249)	Top-5 acc 48.828 (45.170)	lr 0.02223
Warmup Train [22][1350/3239]	Time 0.322 (0.520)	Data 0.001 (0.016)	Loss 4.3980 (4.4152)	Top-1 acc 25.391 (23.251)	Top-5 acc 46.484 (45.168)	lr 0.02222
Warmup Train [22][1360/3239]	Time 0.709 (0.520)	Data 0.001 (0.016)	Loss 4.4466 (4.4144)	Top-1 acc 28.125 (23.273)	Top-5 acc 44.531 (45.185)	lr 0.02222
Warmup Train [22][1370/3239]	Time 0.576 (0.520)	Data 0.001 (0.016)	Loss 4.4100 (4.4137)	Top-1 acc 25.781 (23.286)	Top-5 acc 44.531 (45.198)	lr 0.02221
Warmup Train [22][1380/3239]	Time 0.487 (0.519)	Data 0.001 (0.016)	Loss 4.3445 (4.4138)	Top-1 acc 26.953 (23.293)	Top-5 acc 44.141 (45.192)	lr 0.02221
Warmup Train [22][1390/3239]	Time 0.622 (0.519)	Data 0.001 (0.016)	Loss 4.4200 (4.4133)	Top-1 acc 28.125 (23.306)	Top-5 acc 46.094 (45.201)	lr 0.02220
Warmup Train [22][1400/3239]	Time 0.513 (0.519)	Data 0.002 (0.016)	Loss 4.4163 (4.4126)	Top-1 acc 23.828 (23.321)	Top-5 acc 42.969 (45.213)	lr 0.02219
Warmup Train [22][1410/3239]	Time 0.392 (0.519)	Data 0.001 (0.016)	Loss 4.3636 (4.4127)	Top-1 acc 23.438 (23.323)	Top-5 acc 46.094 (45.211)	lr 0.02219
Warmup Train [22][1420/3239]	Time 0.358 (0.518)	Data 0.001 (0.016)	Loss 4.2788 (4.4125)	Top-1 acc 23.828 (23.314)	Top-5 acc 49.219 (45.218)	lr 0.02218
Warmup Train [22][1430/3239]	Time 0.489 (0.519)	Data 0.001 (0.016)	Loss 4.4198 (4.4126)	Top-1 acc 21.875 (23.314)	Top-5 acc 48.828 (45.214)	lr 0.02218
Warmup Train [22][1440/3239]	Time 0.419 (0.519)	Data 0.001 (0.016)	Loss 4.5859 (4.4124)	Top-1 acc 21.484 (23.321)	Top-5 acc 41.016 (45.218)	lr 0.02217
Warmup Train [22][1450/3239]	Time 0.492 (0.519)	Data 0.001 (0.016)	Loss 4.4412 (4.4125)	Top-1 acc 22.266 (23.316)	Top-5 acc 45.312 (45.212)	lr 0.02216
Warmup Train [22][1460/3239]	Time 0.634 (0.519)	Data 0.001 (0.016)	Loss 4.3777 (4.4124)	Top-1 acc 21.484 (23.315)	Top-5 acc 46.484 (45.207)	lr 0.02216
Warmup Train [22][1470/3239]	Time 0.297 (0.519)	Data 0.001 (0.015)	Loss 4.2655 (4.4120)	Top-1 acc 26.953 (23.321)	Top-5 acc 51.953 (45.220)	lr 0.02215
Warmup Train [22][1480/3239]	Time 0.536 (0.518)	Data 0.001 (0.015)	Loss 4.3762 (4.4119)	Top-1 acc 27.734 (23.324)	Top-5 acc 45.703 (45.218)	lr 0.02215
Warmup Train [22][1490/3239]	Time 0.521 (0.518)	Data 0.002 (0.015)	Loss 4.2439 (4.4118)	Top-1 acc 31.250 (23.322)	Top-5 acc 49.219 (45.219)	lr 0.02214
Warmup Train [22][1500/3239]	Time 0.510 (0.518)	Data 0.001 (0.015)	Loss 4.4078 (4.4117)	Top-1 acc 23.828 (23.323)	Top-5 acc 43.750 (45.221)	lr 0.02213
Warmup Train [22][1510/3239]	Time 0.527 (0.518)	Data 0.001 (0.015)	Loss 4.4119 (4.4118)	Top-1 acc 23.828 (23.319)	Top-5 acc 46.484 (45.220)	lr 0.02213
Warmup Train [22][1520/3239]	Time 0.399 (0.518)	Data 0.001 (0.015)	Loss 4.4879 (4.4115)	Top-1 acc 21.484 (23.322)	Top-5 acc 41.406 (45.219)	lr 0.02212
Warmup Train [22][1530/3239]	Time 0.336 (0.518)	Data 0.001 (0.015)	Loss 4.4544 (4.4115)	Top-1 acc 25.000 (23.321)	Top-5 acc 44.141 (45.216)	lr 0.02212
Warmup Train [22][1540/3239]	Time 0.624 (0.518)	Data 0.001 (0.015)	Loss 4.4487 (4.4113)	Top-1 acc 21.094 (23.320)	Top-5 acc 42.578 (45.218)	lr 0.02211
Warmup Train [22][1550/3239]	Time 0.367 (0.518)	Data 0.001 (0.015)	Loss 4.3552 (4.4113)	Top-1 acc 27.734 (23.317)	Top-5 acc 45.703 (45.220)	lr 0.02210
Warmup Train [22][1560/3239]	Time 0.508 (0.518)	Data 0.001 (0.015)	Loss 4.3567 (4.4115)	Top-1 acc 26.172 (23.312)	Top-5 acc 47.266 (45.213)	lr 0.02210
Warmup Train [22][1570/3239]	Time 0.485 (0.518)	Data 0.001 (0.015)	Loss 4.4998 (4.4110)	Top-1 acc 22.656 (23.314)	Top-5 acc 39.062 (45.229)	lr 0.02209
Warmup Train [22][1580/3239]	Time 0.362 (0.518)	Data 0.001 (0.015)	Loss 4.5142 (4.4112)	Top-1 acc 20.703 (23.309)	Top-5 acc 40.625 (45.224)	lr 0.02209
Warmup Train [22][1590/3239]	Time 0.428 (0.518)	Data 0.001 (0.015)	Loss 4.1967 (4.4112)	Top-1 acc 22.266 (23.310)	Top-5 acc 50.391 (45.228)	lr 0.02208
Warmup Train [22][1600/3239]	Time 0.476 (0.518)	Data 0.001 (0.015)	Loss 4.2305 (4.4113)	Top-1 acc 24.609 (23.302)	Top-5 acc 51.172 (45.230)	lr 0.02207
Warmup Train [22][1610/3239]	Time 0.493 (0.518)	Data 0.001 (0.015)	Loss 4.4457 (4.4112)	Top-1 acc 21.484 (23.303)	Top-5 acc 44.141 (45.236)	lr 0.02207
Warmup Train [22][1620/3239]	Time 0.394 (0.518)	Data 0.001 (0.015)	Loss 4.4595 (4.4113)	Top-1 acc 22.656 (23.301)	Top-5 acc 45.703 (45.236)	lr 0.02206
Warmup Train [22][1630/3239]	Time 0.458 (0.518)	Data 0.001 (0.015)	Loss 4.2492 (4.4110)	Top-1 acc 29.297 (23.306)	Top-5 acc 48.828 (45.242)	lr 0.02206
Warmup Train [22][1640/3239]	Time 0.425 (0.517)	Data 0.001 (0.015)	Loss 4.4140 (4.4108)	Top-1 acc 23.828 (23.311)	Top-5 acc 46.094 (45.246)	lr 0.02205
Warmup Train [22][1650/3239]	Time 0.387 (0.517)	Data 0.001 (0.015)	Loss 4.4988 (4.4109)	Top-1 acc 20.703 (23.306)	Top-5 acc 41.016 (45.247)	lr 0.02204
Warmup Train [22][1660/3239]	Time 0.490 (0.517)	Data 0.002 (0.015)	Loss 4.3165 (4.4104)	Top-1 acc 23.828 (23.313)	Top-5 acc 47.656 (45.252)	lr 0.02204
Warmup Train [22][1670/3239]	Time 0.561 (0.517)	Data 0.001 (0.015)	Loss 4.3658 (4.4103)	Top-1 acc 19.531 (23.308)	Top-5 acc 43.359 (45.251)	lr 0.02203
Warmup Train [22][1680/3239]	Time 0.652 (0.517)	Data 0.001 (0.015)	Loss 4.3891 (4.4103)	Top-1 acc 25.000 (23.308)	Top-5 acc 44.141 (45.247)	lr 0.02203
Warmup Train [22][1690/3239]	Time 0.488 (0.517)	Data 0.001 (0.015)	Loss 4.4843 (4.4107)	Top-1 acc 23.828 (23.297)	Top-5 acc 45.312 (45.238)	lr 0.02202
Warmup Train [22][1700/3239]	Time 0.512 (0.517)	Data 0.001 (0.015)	Loss 4.5153 (4.4108)	Top-1 acc 25.781 (23.298)	Top-5 acc 43.750 (45.236)	lr 0.02201
Warmup Train [22][1710/3239]	Time 0.502 (0.517)	Data 0.001 (0.015)	Loss 4.3989 (4.4109)	Top-1 acc 21.484 (23.297)	Top-5 acc 44.141 (45.239)	lr 0.02201
Warmup Train [22][1720/3239]	Time 0.493 (0.517)	Data 0.001 (0.015)	Loss 4.3933 (4.4111)	Top-1 acc 21.484 (23.293)	Top-5 acc 47.266 (45.236)	lr 0.02200
Warmup Train [22][1730/3239]	Time 0.526 (0.517)	Data 0.001 (0.014)	Loss 4.1098 (4.4106)	Top-1 acc 30.469 (23.306)	Top-5 acc 51.562 (45.248)	lr 0.02200
Warmup Train [22][1740/3239]	Time 0.465 (0.517)	Data 0.001 (0.014)	Loss 4.2607 (4.4100)	Top-1 acc 21.484 (23.316)	Top-5 acc 48.438 (45.258)	lr 0.02199
Warmup Train [22][1750/3239]	Time 0.608 (0.517)	Data 0.001 (0.014)	Loss 4.1360 (4.4093)	Top-1 acc 28.516 (23.331)	Top-5 acc 50.391 (45.279)	lr 0.02198
Warmup Train [22][1760/3239]	Time 0.539 (0.517)	Data 0.031 (0.014)	Loss 4.3394 (4.4086)	Top-1 acc 25.781 (23.339)	Top-5 acc 48.438 (45.295)	lr 0.02198
Warmup Train [22][1770/3239]	Time 0.531 (0.517)	Data 0.001 (0.014)	Loss 4.2435 (4.4084)	Top-1 acc 23.047 (23.343)	Top-5 acc 49.219 (45.300)	lr 0.02197
Warmup Train [22][1780/3239]	Time 0.531 (0.517)	Data 0.001 (0.014)	Loss 4.2350 (4.4082)	Top-1 acc 28.125 (23.349)	Top-5 acc 49.219 (45.305)	lr 0.02197
Warmup Train [22][1790/3239]	Time 0.581 (0.517)	Data 0.001 (0.014)	Loss 4.3895 (4.4084)	Top-1 acc 23.438 (23.343)	Top-5 acc 47.656 (45.300)	lr 0.02196
Warmup Train [22][1800/3239]	Time 0.472 (0.517)	Data 0.001 (0.014)	Loss 4.3616 (4.4083)	Top-1 acc 22.656 (23.348)	Top-5 acc 44.531 (45.301)	lr 0.02195
Warmup Train [22][1810/3239]	Time 0.431 (0.517)	Data 0.001 (0.014)	Loss 4.4742 (4.4084)	Top-1 acc 19.531 (23.347)	Top-5 acc 43.750 (45.297)	lr 0.02195
Warmup Train [22][1820/3239]	Time 0.625 (0.517)	Data 0.001 (0.014)	Loss 4.3333 (4.4083)	Top-1 acc 21.094 (23.350)	Top-5 acc 47.266 (45.301)	lr 0.02194
Warmup Train [22][1830/3239]	Time 0.476 (0.517)	Data 0.001 (0.014)	Loss 4.3824 (4.4080)	Top-1 acc 23.828 (23.355)	Top-5 acc 48.047 (45.312)	lr 0.02194
Warmup Train [22][1840/3239]	Time 0.487 (0.517)	Data 0.001 (0.014)	Loss 4.4111 (4.4079)	Top-1 acc 25.000 (23.353)	Top-5 acc 45.703 (45.318)	lr 0.02193
Warmup Train [22][1850/3239]	Time 0.616 (0.517)	Data 0.001 (0.014)	Loss 4.4270 (4.4080)	Top-1 acc 20.312 (23.349)	Top-5 acc 44.141 (45.314)	lr 0.02192
Warmup Train [22][1860/3239]	Time 0.652 (0.517)	Data 0.003 (0.014)	Loss 4.3083 (4.4077)	Top-1 acc 22.656 (23.350)	Top-5 acc 45.312 (45.318)	lr 0.02192
Warmup Train [22][1870/3239]	Time 0.348 (0.517)	Data 0.001 (0.014)	Loss 4.4152 (4.4072)	Top-1 acc 24.219 (23.356)	Top-5 acc 43.359 (45.328)	lr 0.02191
Warmup Train [22][1880/3239]	Time 0.393 (0.517)	Data 0.001 (0.014)	Loss 4.5140 (4.4073)	Top-1 acc 22.266 (23.356)	Top-5 acc 42.188 (45.332)	lr 0.02191
Warmup Train [22][1890/3239]	Time 0.598 (0.516)	Data 0.025 (0.014)	Loss 4.3010 (4.4072)	Top-1 acc 26.172 (23.355)	Top-5 acc 49.609 (45.336)	lr 0.02190
Warmup Train [22][1900/3239]	Time 0.503 (0.516)	Data 0.001 (0.014)	Loss 4.4834 (4.4071)	Top-1 acc 23.047 (23.359)	Top-5 acc 39.062 (45.340)	lr 0.02189
Warmup Train [22][1910/3239]	Time 0.343 (0.516)	Data 0.001 (0.014)	Loss 4.2161 (4.4067)	Top-1 acc 25.781 (23.364)	Top-5 acc 46.484 (45.354)	lr 0.02189
Warmup Train [22][1920/3239]	Time 0.433 (0.516)	Data 0.001 (0.014)	Loss 4.3760 (4.4064)	Top-1 acc 21.484 (23.371)	Top-5 acc 46.484 (45.360)	lr 0.02188
Warmup Train [22][1930/3239]	Time 0.514 (0.516)	Data 0.001 (0.014)	Loss 4.3104 (4.4061)	Top-1 acc 26.562 (23.369)	Top-5 acc 46.484 (45.369)	lr 0.02188
Warmup Train [22][1940/3239]	Time 0.610 (0.516)	Data 0.001 (0.014)	Loss 4.1869 (4.4060)	Top-1 acc 27.734 (23.366)	Top-5 acc 51.562 (45.365)	lr 0.02187
Warmup Train [22][1950/3239]	Time 0.421 (0.516)	Data 0.001 (0.014)	Loss 4.3077 (4.4060)	Top-1 acc 24.609 (23.366)	Top-5 acc 46.875 (45.364)	lr 0.02186
Warmup Train [22][1960/3239]	Time 0.637 (0.516)	Data 0.001 (0.014)	Loss 4.3140 (4.4060)	Top-1 acc 25.000 (23.368)	Top-5 acc 46.094 (45.361)	lr 0.02186
Warmup Train [22][1970/3239]	Time 0.536 (0.516)	Data 0.001 (0.014)	Loss 4.3595 (4.4058)	Top-1 acc 22.656 (23.363)	Top-5 acc 43.750 (45.366)	lr 0.02185
Warmup Train [22][1980/3239]	Time 0.607 (0.516)	Data 0.001 (0.013)	Loss 4.2816 (4.4058)	Top-1 acc 28.125 (23.365)	Top-5 acc 48.828 (45.372)	lr 0.02185
Warmup Train [22][1990/3239]	Time 0.529 (0.516)	Data 0.001 (0.013)	Loss 4.4320 (4.4059)	Top-1 acc 22.266 (23.365)	Top-5 acc 46.094 (45.370)	lr 0.02184
Warmup Train [22][2000/3239]	Time 0.437 (0.516)	Data 0.001 (0.013)	Loss 4.5578 (4.4058)	Top-1 acc 19.531 (23.369)	Top-5 acc 42.578 (45.379)	lr 0.02183
Warmup Train [22][2010/3239]	Time 0.554 (0.516)	Data 0.001 (0.013)	Loss 4.4366 (4.4057)	Top-1 acc 20.703 (23.368)	Top-5 acc 44.531 (45.385)	lr 0.02183
Warmup Train [22][2020/3239]	Time 0.508 (0.516)	Data 0.001 (0.013)	Loss 4.2546 (4.4055)	Top-1 acc 29.297 (23.375)	Top-5 acc 51.172 (45.391)	lr 0.02182
Warmup Train [22][2030/3239]	Time 0.458 (0.516)	Data 0.001 (0.013)	Loss 4.3495 (4.4052)	Top-1 acc 24.219 (23.380)	Top-5 acc 46.484 (45.400)	lr 0.02181
Warmup Train [22][2040/3239]	Time 0.503 (0.516)	Data 0.001 (0.013)	Loss 4.4151 (4.4052)	Top-1 acc 19.922 (23.379)	Top-5 acc 44.141 (45.401)	lr 0.02181
Warmup Train [22][2050/3239]	Time 0.630 (0.516)	Data 0.001 (0.013)	Loss 4.4186 (4.4048)	Top-1 acc 25.000 (23.383)	Top-5 acc 49.219 (45.409)	lr 0.02180
Warmup Train [22][2060/3239]	Time 0.562 (0.516)	Data 0.002 (0.013)	Loss 4.2842 (4.4047)	Top-1 acc 27.344 (23.384)	Top-5 acc 47.266 (45.413)	lr 0.02180
Warmup Train [22][2070/3239]	Time 0.534 (0.516)	Data 0.002 (0.013)	Loss 4.3982 (4.4047)	Top-1 acc 23.438 (23.387)	Top-5 acc 44.922 (45.416)	lr 0.02179
Warmup Train [22][2080/3239]	Time 0.412 (0.516)	Data 0.001 (0.013)	Loss 4.6424 (4.4047)	Top-1 acc 18.750 (23.387)	Top-5 acc 37.109 (45.415)	lr 0.02178
Warmup Train [22][2090/3239]	Time 0.681 (0.516)	Data 0.001 (0.013)	Loss 4.4454 (4.4046)	Top-1 acc 23.438 (23.391)	Top-5 acc 44.922 (45.418)	lr 0.02178
Warmup Train [22][2100/3239]	Time 0.467 (0.516)	Data 0.002 (0.013)	Loss 4.4503 (4.4045)	Top-1 acc 24.219 (23.397)	Top-5 acc 43.750 (45.418)	lr 0.02177
Warmup Train [22][2110/3239]	Time 0.651 (0.515)	Data 0.001 (0.013)	Loss 4.3865 (4.4045)	Top-1 acc 26.172 (23.399)	Top-5 acc 45.703 (45.420)	lr 0.02177
Warmup Train [22][2120/3239]	Time 0.519 (0.515)	Data 0.001 (0.013)	Loss 4.4822 (4.4042)	Top-1 acc 22.656 (23.404)	Top-5 acc 44.922 (45.424)	lr 0.02176
Warmup Train [22][2130/3239]	Time 0.363 (0.515)	Data 0.001 (0.013)	Loss 4.3887 (4.4040)	Top-1 acc 24.219 (23.405)	Top-5 acc 46.484 (45.424)	lr 0.02175
Warmup Train [22][2140/3239]	Time 0.571 (0.515)	Data 0.001 (0.013)	Loss 4.2272 (4.4040)	Top-1 acc 26.172 (23.406)	Top-5 acc 48.438 (45.428)	lr 0.02175
Warmup Train [22][2150/3239]	Time 0.500 (0.515)	Data 0.001 (0.013)	Loss 4.2842 (4.4040)	Top-1 acc 28.906 (23.402)	Top-5 acc 48.828 (45.425)	lr 0.02174
Warmup Train [22][2160/3239]	Time 0.620 (0.515)	Data 0.001 (0.013)	Loss 4.4065 (4.4039)	Top-1 acc 20.703 (23.402)	Top-5 acc 44.922 (45.423)	lr 0.02174
Warmup Train [22][2170/3239]	Time 0.503 (0.515)	Data 0.001 (0.013)	Loss 4.5383 (4.4040)	Top-1 acc 21.875 (23.400)	Top-5 acc 44.141 (45.421)	lr 0.02173
Warmup Train [22][2180/3239]	Time 0.470 (0.515)	Data 0.001 (0.013)	Loss 4.6913 (4.4038)	Top-1 acc 18.359 (23.401)	Top-5 acc 39.062 (45.428)	lr 0.02172
Warmup Train [22][2190/3239]	Time 0.432 (0.515)	Data 0.001 (0.013)	Loss 4.6086 (4.4041)	Top-1 acc 22.266 (23.398)	Top-5 acc 41.016 (45.420)	lr 0.02172
Warmup Train [22][2200/3239]	Time 0.347 (0.515)	Data 0.001 (0.013)	Loss 4.2910 (4.4037)	Top-1 acc 28.516 (23.407)	Top-5 acc 48.047 (45.428)	lr 0.02171
Warmup Train [22][2210/3239]	Time 0.412 (0.515)	Data 0.001 (0.013)	Loss 4.3582 (4.4037)	Top-1 acc 24.609 (23.408)	Top-5 acc 44.922 (45.428)	lr 0.02171
Warmup Train [22][2220/3239]	Time 0.436 (0.515)	Data 0.001 (0.013)	Loss 4.4085 (4.4038)	Top-1 acc 25.000 (23.411)	Top-5 acc 46.484 (45.426)	lr 0.02170
Warmup Train [22][2230/3239]	Time 0.521 (0.515)	Data 0.001 (0.013)	Loss 4.3314 (4.4037)	Top-1 acc 26.953 (23.413)	Top-5 acc 49.219 (45.428)	lr 0.02169
Warmup Train [22][2240/3239]	Time 0.423 (0.515)	Data 0.001 (0.013)	Loss 4.3435 (4.4037)	Top-1 acc 25.000 (23.419)	Top-5 acc 49.219 (45.430)	lr 0.02169
Warmup Train [22][2250/3239]	Time 0.540 (0.515)	Data 0.001 (0.012)	Loss 4.5333 (4.4032)	Top-1 acc 20.703 (23.428)	Top-5 acc 45.703 (45.444)	lr 0.02168
Warmup Train [22][2260/3239]	Time 0.707 (0.515)	Data 0.001 (0.012)	Loss 4.5305 (4.4032)	Top-1 acc 19.141 (23.425)	Top-5 acc 43.359 (45.444)	lr 0.02168
Warmup Train [22][2270/3239]	Time 0.477 (0.515)	Data 0.001 (0.012)	Loss 4.5159 (4.4032)	Top-1 acc 17.578 (23.423)	Top-5 acc 40.625 (45.443)	lr 0.02167
Warmup Train [22][2280/3239]	Time 0.660 (0.515)	Data 0.001 (0.012)	Loss 4.3062 (4.4031)	Top-1 acc 23.828 (23.424)	Top-5 acc 50.000 (45.445)	lr 0.02166
Warmup Train [22][2290/3239]	Time 0.474 (0.515)	Data 0.001 (0.012)	Loss 4.5572 (4.4030)	Top-1 acc 20.703 (23.428)	Top-5 acc 40.625 (45.445)	lr 0.02166
Warmup Train [22][2300/3239]	Time 0.513 (0.515)	Data 0.001 (0.012)	Loss 4.4421 (4.4029)	Top-1 acc 20.312 (23.424)	Top-5 acc 44.531 (45.451)	lr 0.02165
Warmup Train [22][2310/3239]	Time 0.555 (0.515)	Data 0.001 (0.012)	Loss 4.4104 (4.4028)	Top-1 acc 21.094 (23.425)	Top-5 acc 44.141 (45.451)	lr 0.02165
Warmup Train [22][2320/3239]	Time 0.526 (0.515)	Data 0.001 (0.012)	Loss 4.4528 (4.4028)	Top-1 acc 21.094 (23.419)	Top-5 acc 39.844 (45.452)	lr 0.02164
Warmup Train [22][2330/3239]	Time 0.501 (0.515)	Data 0.001 (0.012)	Loss 4.5817 (4.4029)	Top-1 acc 20.312 (23.418)	Top-5 acc 42.188 (45.448)	lr 0.02163
Warmup Train [22][2340/3239]	Time 0.349 (0.515)	Data 0.001 (0.012)	Loss 4.5198 (4.4029)	Top-1 acc 23.438 (23.417)	Top-5 acc 40.234 (45.443)	lr 0.02163
Warmup Train [22][2350/3239]	Time 0.662 (0.515)	Data 0.001 (0.012)	Loss 4.2446 (4.4028)	Top-1 acc 23.828 (23.417)	Top-5 acc 45.703 (45.444)	lr 0.02162
Warmup Train [22][2360/3239]	Time 0.578 (0.515)	Data 0.001 (0.012)	Loss 4.3387 (4.4030)	Top-1 acc 23.828 (23.413)	Top-5 acc 46.094 (45.441)	lr 0.02162
Warmup Train [22][2370/3239]	Time 0.264 (0.515)	Data 0.001 (0.012)	Loss 4.2785 (4.4029)	Top-1 acc 26.172 (23.415)	Top-5 acc 49.219 (45.445)	lr 0.02161
Warmup Train [22][2380/3239]	Time 0.517 (0.514)	Data 0.001 (0.012)	Loss 4.4328 (4.4030)	Top-1 acc 22.656 (23.414)	Top-5 acc 45.312 (45.443)	lr 0.02160
Warmup Train [22][2390/3239]	Time 0.524 (0.514)	Data 0.001 (0.012)	Loss 4.3746 (4.4030)	Top-1 acc 24.219 (23.413)	Top-5 acc 48.438 (45.444)	lr 0.02160
Warmup Train [22][2400/3239]	Time 0.515 (0.514)	Data 0.001 (0.012)	Loss 4.4073 (4.4031)	Top-1 acc 24.609 (23.410)	Top-5 acc 45.312 (45.438)	lr 0.02159
Warmup Train [22][2410/3239]	Time 0.427 (0.514)	Data 0.001 (0.012)	Loss 4.5178 (4.4033)	Top-1 acc 20.312 (23.409)	Top-5 acc 45.312 (45.438)	lr 0.02159
Warmup Train [22][2420/3239]	Time 0.598 (0.514)	Data 0.001 (0.012)	Loss 4.3812 (4.4030)	Top-1 acc 19.141 (23.412)	Top-5 acc 45.312 (45.446)	lr 0.02158
Warmup Train [22][2430/3239]	Time 0.553 (0.514)	Data 0.001 (0.012)	Loss 4.4419 (4.4031)	Top-1 acc 24.609 (23.409)	Top-5 acc 44.141 (45.443)	lr 0.02157
Warmup Train [22][2440/3239]	Time 0.425 (0.514)	Data 0.001 (0.012)	Loss 4.7205 (4.4030)	Top-1 acc 16.406 (23.412)	Top-5 acc 37.891 (45.449)	lr 0.02157
Warmup Train [22][2450/3239]	Time 0.627 (0.514)	Data 0.001 (0.012)	Loss 4.3793 (4.4031)	Top-1 acc 23.828 (23.416)	Top-5 acc 44.922 (45.441)	lr 0.02156
Warmup Train [22][2460/3239]	Time 0.499 (0.514)	Data 0.001 (0.012)	Loss 4.2657 (4.4030)	Top-1 acc 25.000 (23.415)	Top-5 acc 49.609 (45.446)	lr 0.02156
Warmup Train [22][2470/3239]	Time 0.717 (0.514)	Data 0.001 (0.012)	Loss 4.4915 (4.4031)	Top-1 acc 21.875 (23.416)	Top-5 acc 44.141 (45.444)	lr 0.02155
Warmup Train [22][2480/3239]	Time 0.481 (0.514)	Data 0.001 (0.012)	Loss 4.4026 (4.4033)	Top-1 acc 25.000 (23.411)	Top-5 acc 49.609 (45.442)	lr 0.02154
Warmup Train [22][2490/3239]	Time 0.608 (0.514)	Data 0.001 (0.012)	Loss 4.3775 (4.4033)	Top-1 acc 23.438 (23.413)	Top-5 acc 43.750 (45.441)	lr 0.02154
Warmup Train [22][2500/3239]	Time 0.538 (0.514)	Data 0.001 (0.012)	Loss 4.6128 (4.4032)	Top-1 acc 20.312 (23.419)	Top-5 acc 36.719 (45.439)	lr 0.02153
Warmup Train [22][2510/3239]	Time 0.594 (0.514)	Data 0.001 (0.012)	Loss 4.3473 (4.4029)	Top-1 acc 25.000 (23.423)	Top-5 acc 46.875 (45.450)	lr 0.02153
Warmup Train [22][2520/3239]	Time 0.339 (0.514)	Data 0.001 (0.012)	Loss 4.3440 (4.4028)	Top-1 acc 25.000 (23.424)	Top-5 acc 46.094 (45.455)	lr 0.02152
Warmup Train [22][2530/3239]	Time 0.595 (0.514)	Data 0.001 (0.012)	Loss 4.3158 (4.4025)	Top-1 acc 27.734 (23.432)	Top-5 acc 46.094 (45.457)	lr 0.02151
Warmup Train [22][2540/3239]	Time 0.392 (0.514)	Data 0.001 (0.012)	Loss 4.4550 (4.4024)	Top-1 acc 20.312 (23.435)	Top-5 acc 42.969 (45.460)	lr 0.02151
Warmup Train [22][2550/3239]	Time 0.536 (0.514)	Data 0.002 (0.012)	Loss 4.5291 (4.4025)	Top-1 acc 19.531 (23.436)	Top-5 acc 45.312 (45.457)	lr 0.02150
Warmup Train [22][2560/3239]	Time 0.475 (0.514)	Data 0.001 (0.012)	Loss 4.3903 (4.4027)	Top-1 acc 20.703 (23.439)	Top-5 acc 44.531 (45.454)	lr 0.02150
Warmup Train [22][2570/3239]	Time 0.556 (0.514)	Data 0.001 (0.012)	Loss 4.4241 (4.4028)	Top-1 acc 23.438 (23.435)	Top-5 acc 41.797 (45.447)	lr 0.02149
Warmup Train [22][2580/3239]	Time 0.525 (0.514)	Data 0.001 (0.012)	Loss 4.4151 (4.4027)	Top-1 acc 24.609 (23.440)	Top-5 acc 48.828 (45.455)	lr 0.02148
Warmup Train [22][2590/3239]	Time 0.670 (0.514)	Data 0.001 (0.012)	Loss 4.1583 (4.4026)	Top-1 acc 24.609 (23.441)	Top-5 acc 51.953 (45.453)	lr 0.02148
Warmup Train [22][2600/3239]	Time 0.613 (0.514)	Data 0.001 (0.012)	Loss 4.4935 (4.4030)	Top-1 acc 23.047 (23.437)	Top-5 acc 44.531 (45.444)	lr 0.02147
Warmup Train [22][2610/3239]	Time 0.671 (0.514)	Data 0.001 (0.012)	Loss 4.1977 (4.4029)	Top-1 acc 26.172 (23.438)	Top-5 acc 49.219 (45.447)	lr 0.02147
Warmup Train [22][2620/3239]	Time 0.396 (0.514)	Data 0.001 (0.012)	Loss 4.3427 (4.4030)	Top-1 acc 23.438 (23.430)	Top-5 acc 50.000 (45.446)	lr 0.02146
Warmup Train [22][2630/3239]	Time 0.440 (0.514)	Data 0.001 (0.012)	Loss 4.3211 (4.4028)	Top-1 acc 26.562 (23.437)	Top-5 acc 48.828 (45.451)	lr 0.02145
Warmup Train [22][2640/3239]	Time 0.535 (0.514)	Data 0.001 (0.012)	Loss 4.5270 (4.4029)	Top-1 acc 25.781 (23.438)	Top-5 acc 45.312 (45.453)	lr 0.02145
Warmup Train [22][2650/3239]	Time 0.659 (0.514)	Data 0.001 (0.012)	Loss 4.4159 (4.4028)	Top-1 acc 22.266 (23.442)	Top-5 acc 44.922 (45.461)	lr 0.02144
Warmup Train [22][2660/3239]	Time 0.656 (0.514)	Data 0.001 (0.011)	Loss 4.3199 (4.4027)	Top-1 acc 26.562 (23.446)	Top-5 acc 44.922 (45.462)	lr 0.02144
Warmup Train [22][2670/3239]	Time 0.661 (0.514)	Data 0.001 (0.011)	Loss 4.4384 (4.4027)	Top-1 acc 24.609 (23.451)	Top-5 acc 44.922 (45.463)	lr 0.02143
Warmup Train [22][2680/3239]	Time 0.538 (0.514)	Data 0.001 (0.011)	Loss 4.1798 (4.4027)	Top-1 acc 31.641 (23.454)	Top-5 acc 49.219 (45.462)	lr 0.02142
Warmup Train [22][2690/3239]	Time 0.513 (0.514)	Data 0.001 (0.011)	Loss 4.5083 (4.4027)	Top-1 acc 22.266 (23.454)	Top-5 acc 45.312 (45.462)	lr 0.02142
Warmup Train [22][2700/3239]	Time 0.441 (0.514)	Data 0.001 (0.011)	Loss 4.3967 (4.4024)	Top-1 acc 23.438 (23.458)	Top-5 acc 43.750 (45.471)	lr 0.02141
Warmup Train [22][2710/3239]	Time 0.524 (0.514)	Data 0.001 (0.011)	Loss 4.2955 (4.4020)	Top-1 acc 23.828 (23.466)	Top-5 acc 47.656 (45.481)	lr 0.02141
Warmup Train [22][2720/3239]	Time 0.567 (0.514)	Data 0.001 (0.011)	Loss 4.4607 (4.4019)	Top-1 acc 21.484 (23.471)	Top-5 acc 44.922 (45.484)	lr 0.02140
Warmup Train [22][2730/3239]	Time 0.504 (0.514)	Data 0.001 (0.011)	Loss 4.2627 (4.4020)	Top-1 acc 26.562 (23.467)	Top-5 acc 46.875 (45.481)	lr 0.02139
Warmup Train [22][2740/3239]	Time 0.438 (0.514)	Data 0.001 (0.011)	Loss 4.4951 (4.4021)	Top-1 acc 19.922 (23.466)	Top-5 acc 42.188 (45.479)	lr 0.02139
Warmup Train [22][2750/3239]	Time 0.574 (0.514)	Data 0.001 (0.011)	Loss 4.2745 (4.4019)	Top-1 acc 27.734 (23.469)	Top-5 acc 50.781 (45.480)	lr 0.02138
Warmup Train [22][2760/3239]	Time 0.495 (0.514)	Data 0.001 (0.011)	Loss 4.2133 (4.4018)	Top-1 acc 29.297 (23.470)	Top-5 acc 48.047 (45.483)	lr 0.02138
Warmup Train [22][2770/3239]	Time 0.373 (0.514)	Data 0.001 (0.011)	Loss 4.3625 (4.4017)	Top-1 acc 23.828 (23.469)	Top-5 acc 44.922 (45.486)	lr 0.02137
Warmup Train [22][2780/3239]	Time 0.529 (0.514)	Data 0.001 (0.011)	Loss 4.3250 (4.4015)	Top-1 acc 24.219 (23.475)	Top-5 acc 48.438 (45.491)	lr 0.02136
Warmup Train [22][2790/3239]	Time 0.434 (0.514)	Data 0.001 (0.011)	Loss 4.1131 (4.4012)	Top-1 acc 28.516 (23.482)	Top-5 acc 48.828 (45.498)	lr 0.02136
Warmup Train [22][2800/3239]	Time 0.528 (0.514)	Data 0.001 (0.011)	Loss 4.3954 (4.4010)	Top-1 acc 19.531 (23.485)	Top-5 acc 45.703 (45.503)	lr 0.02135
Warmup Train [22][2810/3239]	Time 0.468 (0.514)	Data 0.001 (0.011)	Loss 4.3591 (4.4009)	Top-1 acc 29.297 (23.489)	Top-5 acc 48.828 (45.507)	lr 0.02135
Warmup Train [22][2820/3239]	Time 0.367 (0.514)	Data 0.001 (0.011)	Loss 4.3874 (4.4010)	Top-1 acc 23.047 (23.490)	Top-5 acc 46.484 (45.507)	lr 0.02134
Warmup Train [22][2830/3239]	Time 0.412 (0.514)	Data 0.001 (0.011)	Loss 4.3228 (4.4008)	Top-1 acc 25.781 (23.493)	Top-5 acc 48.047 (45.511)	lr 0.02133
Warmup Train [22][2840/3239]	Time 0.247 (0.514)	Data 0.001 (0.011)	Loss 4.4089 (4.4007)	Top-1 acc 24.609 (23.496)	Top-5 acc 48.047 (45.514)	lr 0.02133
Warmup Train [22][2850/3239]	Time 0.525 (0.514)	Data 0.001 (0.011)	Loss 4.3479 (4.4004)	Top-1 acc 24.219 (23.498)	Top-5 acc 46.484 (45.519)	lr 0.02132
Warmup Train [22][2860/3239]	Time 0.731 (0.513)	Data 0.001 (0.011)	Loss 4.1118 (4.4003)	Top-1 acc 28.906 (23.496)	Top-5 acc 52.734 (45.519)	lr 0.02132
Warmup Train [22][2870/3239]	Time 0.431 (0.513)	Data 0.001 (0.011)	Loss 4.3255 (4.4002)	Top-1 acc 24.219 (23.502)	Top-5 acc 45.703 (45.523)	lr 0.02131
Warmup Train [22][2880/3239]	Time 0.425 (0.513)	Data 0.001 (0.011)	Loss 4.1879 (4.4000)	Top-1 acc 28.125 (23.508)	Top-5 acc 52.734 (45.529)	lr 0.02130
Warmup Train [22][2890/3239]	Time 0.623 (0.513)	Data 0.001 (0.011)	Loss 4.3491 (4.3998)	Top-1 acc 23.828 (23.513)	Top-5 acc 48.047 (45.534)	lr 0.02130
Warmup Train [22][2900/3239]	Time 0.376 (0.513)	Data 0.002 (0.011)	Loss 4.5194 (4.3998)	Top-1 acc 20.703 (23.515)	Top-5 acc 41.406 (45.535)	lr 0.02129
Warmup Train [22][2910/3239]	Time 0.542 (0.513)	Data 0.001 (0.011)	Loss 4.1271 (4.3997)	Top-1 acc 28.516 (23.515)	Top-5 acc 52.344 (45.539)	lr 0.02129
Warmup Train [22][2920/3239]	Time 0.411 (0.513)	Data 0.001 (0.011)	Loss 4.3719 (4.3994)	Top-1 acc 25.781 (23.517)	Top-5 acc 44.141 (45.544)	lr 0.02128
Warmup Train [22][2930/3239]	Time 0.558 (0.513)	Data 0.001 (0.011)	Loss 4.2605 (4.3994)	Top-1 acc 26.172 (23.518)	Top-5 acc 49.609 (45.546)	lr 0.02127
Warmup Train [22][2940/3239]	Time 0.501 (0.513)	Data 0.001 (0.011)	Loss 4.4334 (4.3994)	Top-1 acc 23.047 (23.515)	Top-5 acc 44.531 (45.543)	lr 0.02127
Warmup Train [22][2950/3239]	Time 0.593 (0.513)	Data 0.001 (0.011)	Loss 4.2569 (4.3993)	Top-1 acc 24.219 (23.515)	Top-5 acc 48.047 (45.545)	lr 0.02126
Warmup Train [22][2960/3239]	Time 0.540 (0.513)	Data 0.001 (0.011)	Loss 4.5583 (4.3993)	Top-1 acc 21.094 (23.521)	Top-5 acc 46.094 (45.546)	lr 0.02126
Warmup Train [22][2970/3239]	Time 0.405 (0.513)	Data 0.001 (0.011)	Loss 4.2922 (4.3992)	Top-1 acc 25.000 (23.525)	Top-5 acc 46.484 (45.547)	lr 0.02125
Warmup Train [22][2980/3239]	Time 0.525 (0.514)	Data 0.001 (0.011)	Loss 4.6442 (4.3994)	Top-1 acc 20.312 (23.524)	Top-5 acc 37.500 (45.539)	lr 0.02124
Warmup Train [22][2990/3239]	Time 0.470 (0.513)	Data 0.001 (0.011)	Loss 4.3557 (4.3993)	Top-1 acc 23.438 (23.526)	Top-5 acc 50.000 (45.544)	lr 0.02124
Warmup Train [22][3000/3239]	Time 0.565 (0.513)	Data 0.029 (0.011)	Loss 4.3528 (4.3993)	Top-1 acc 27.344 (23.526)	Top-5 acc 44.141 (45.542)	lr 0.02123
Warmup Train [22][3010/3239]	Time 0.434 (0.513)	Data 0.001 (0.011)	Loss 4.3329 (4.3994)	Top-1 acc 21.484 (23.525)	Top-5 acc 44.531 (45.541)	lr 0.02123
Warmup Train [22][3020/3239]	Time 0.553 (0.513)	Data 0.001 (0.011)	Loss 4.2924 (4.3994)	Top-1 acc 25.391 (23.526)	Top-5 acc 48.438 (45.542)	lr 0.02122
Warmup Train [22][3030/3239]	Time 0.416 (0.513)	Data 0.001 (0.011)	Loss 4.4884 (4.3993)	Top-1 acc 22.266 (23.528)	Top-5 acc 45.312 (45.545)	lr 0.02121
Warmup Train [22][3040/3239]	Time 0.566 (0.513)	Data 0.001 (0.011)	Loss 4.3397 (4.3992)	Top-1 acc 24.219 (23.532)	Top-5 acc 45.703 (45.547)	lr 0.02121
Warmup Train [22][3050/3239]	Time 0.550 (0.513)	Data 0.001 (0.011)	Loss 4.5331 (4.3992)	Top-1 acc 23.828 (23.534)	Top-5 acc 43.750 (45.547)	lr 0.02120
Warmup Train [22][3060/3239]	Time 0.530 (0.513)	Data 0.001 (0.011)	Loss 4.3499 (4.3991)	Top-1 acc 27.344 (23.542)	Top-5 acc 46.484 (45.550)	lr 0.02120
Warmup Train [22][3070/3239]	Time 0.514 (0.513)	Data 0.001 (0.011)	Loss 4.4534 (4.3990)	Top-1 acc 21.094 (23.544)	Top-5 acc 44.531 (45.549)	lr 0.02119
Warmup Train [22][3080/3239]	Time 0.382 (0.513)	Data 0.001 (0.011)	Loss 4.5209 (4.3989)	Top-1 acc 21.484 (23.546)	Top-5 acc 42.188 (45.553)	lr 0.02118
Warmup Train [22][3090/3239]	Time 0.481 (0.513)	Data 0.001 (0.011)	Loss 4.3295 (4.3988)	Top-1 acc 23.828 (23.544)	Top-5 acc 45.703 (45.553)	lr 0.02118
Warmup Train [22][3100/3239]	Time 0.351 (0.513)	Data 0.001 (0.011)	Loss 4.3594 (4.3987)	Top-1 acc 23.438 (23.545)	Top-5 acc 46.094 (45.552)	lr 0.02117
Warmup Train [22][3110/3239]	Time 0.601 (0.513)	Data 0.001 (0.011)	Loss 4.4322 (4.3985)	Top-1 acc 24.219 (23.552)	Top-5 acc 45.312 (45.559)	lr 0.02117
Warmup Train [22][3120/3239]	Time 0.609 (0.513)	Data 0.001 (0.011)	Loss 4.3082 (4.3984)	Top-1 acc 25.000 (23.557)	Top-5 acc 42.578 (45.562)	lr 0.02116
Warmup Train [22][3130/3239]	Time 0.602 (0.513)	Data 0.001 (0.011)	Loss 4.4537 (4.3983)	Top-1 acc 26.562 (23.558)	Top-5 acc 43.359 (45.566)	lr 0.02115
Warmup Train [22][3140/3239]	Time 0.491 (0.513)	Data 0.001 (0.011)	Loss 4.4395 (4.3982)	Top-1 acc 26.562 (23.559)	Top-5 acc 43.359 (45.569)	lr 0.02115
Warmup Train [22][3150/3239]	Time 0.512 (0.513)	Data 0.001 (0.011)	Loss 4.4193 (4.3980)	Top-1 acc 20.703 (23.559)	Top-5 acc 45.703 (45.572)	lr 0.02114
Warmup Train [22][3160/3239]	Time 0.585 (0.513)	Data 0.001 (0.011)	Loss 4.3801 (4.3980)	Top-1 acc 25.391 (23.557)	Top-5 acc 45.312 (45.571)	lr 0.02114
Warmup Train [22][3170/3239]	Time 0.354 (0.513)	Data 0.001 (0.011)	Loss 4.4575 (4.3982)	Top-1 acc 21.875 (23.559)	Top-5 acc 46.875 (45.566)	lr 0.02113
Warmup Train [22][3180/3239]	Time 0.545 (0.513)	Data 0.000 (0.011)	Loss 4.4271 (4.3982)	Top-1 acc 24.219 (23.561)	Top-5 acc 42.188 (45.564)	lr 0.02113
Warmup Train [22][3190/3239]	Time 0.518 (0.513)	Data 0.000 (0.011)	Loss 4.2565 (4.3983)	Top-1 acc 26.562 (23.558)	Top-5 acc 48.828 (45.564)	lr 0.02112
Warmup Train [22][3200/3239]	Time 0.584 (0.513)	Data 0.000 (0.011)	Loss 4.4100 (4.3979)	Top-1 acc 24.609 (23.568)	Top-5 acc 45.703 (45.574)	lr 0.02111
Warmup Train [22][3210/3239]	Time 0.427 (0.513)	Data 0.000 (0.011)	Loss 4.2771 (4.3979)	Top-1 acc 24.219 (23.567)	Top-5 acc 50.391 (45.576)	lr 0.02111
Warmup Train [22][3220/3239]	Time 0.465 (0.513)	Data 0.000 (0.011)	Loss 4.4940 (4.3980)	Top-1 acc 24.219 (23.566)	Top-5 acc 44.141 (45.572)	lr 0.02110
Warmup Train [22][3230/3239]	Time 0.469 (0.513)	Data 0.000 (0.011)	Loss 4.3964 (4.3978)	Top-1 acc 22.656 (23.568)	Top-5 acc 42.188 (45.576)	lr 0.02110
Warmup Train [22][3239/3239]	Time 0.404 (0.513)	Data 0.000 (0.011)	Loss 4.5252 (4.3978)	Top-1 acc 23.457 (23.568)	Top-5 acc 40.741 (45.577)	lr 0.02109
==========Warmup Valid [22/40]	loss 3.402	top-1 acc 30.522	top-5 acc 54.804	Train top-1 23.568	top-5 45.577	flops: 442.4M
Warmup Train [23][0/3239]	Time 13.265 (13.265)	Data 11.624 (11.624)	Loss 4.5189 (4.5189)	Top-1 acc 21.875 (21.875)	Top-5 acc 41.016 (41.016)	lr 0.02109
Warmup Train [23][10/3239]	Time 0.588 (1.731)	Data 0.001 (1.059)	Loss 4.2907 (4.3962)	Top-1 acc 25.391 (24.290)	Top-5 acc 45.703 (45.241)	lr 0.02108
Warmup Train [23][20/3239]	Time 0.441 (1.151)	Data 0.001 (0.559)	Loss 4.3435 (4.3859)	Top-1 acc 26.562 (24.628)	Top-5 acc 46.094 (45.964)	lr 0.02108
Warmup Train [23][30/3239]	Time 0.451 (0.947)	Data 0.001 (0.383)	Loss 4.4106 (4.3869)	Top-1 acc 25.000 (24.458)	Top-5 acc 43.750 (45.804)	lr 0.02107
Warmup Train [23][40/3239]	Time 0.529 (0.849)	Data 0.001 (0.293)	Loss 4.3791 (4.3718)	Top-1 acc 21.094 (24.705)	Top-5 acc 45.312 (46.151)	lr 0.02107
Warmup Train [23][50/3239]	Time 0.575 (0.785)	Data 0.001 (0.237)	Loss 4.3429 (4.3614)	Top-1 acc 26.172 (24.778)	Top-5 acc 44.922 (46.247)	lr 0.02106
Warmup Train [23][60/3239]	Time 0.646 (0.741)	Data 0.001 (0.198)	Loss 4.4335 (4.3506)	Top-1 acc 21.094 (24.981)	Top-5 acc 46.484 (46.536)	lr 0.02105
Warmup Train [23][70/3239]	Time 0.395 (0.709)	Data 0.001 (0.170)	Loss 4.5135 (4.3549)	Top-1 acc 17.969 (24.769)	Top-5 acc 41.797 (46.396)	lr 0.02105
Warmup Train [23][80/3239]	Time 0.506 (0.688)	Data 0.001 (0.152)	Loss 4.3234 (4.3532)	Top-1 acc 26.562 (24.619)	Top-5 acc 46.094 (46.504)	lr 0.02104
Warmup Train [23][90/3239]	Time 0.472 (0.668)	Data 0.001 (0.135)	Loss 4.3874 (4.3570)	Top-1 acc 25.000 (24.575)	Top-5 acc 43.750 (46.373)	lr 0.02104
Warmup Train [23][100/3239]	Time 0.502 (0.652)	Data 0.001 (0.122)	Loss 4.2305 (4.3507)	Top-1 acc 27.734 (24.698)	Top-5 acc 52.734 (46.539)	lr 0.02103
Warmup Train [23][110/3239]	Time 0.689 (0.642)	Data 0.001 (0.111)	Loss 4.3550 (4.3492)	Top-1 acc 25.781 (24.729)	Top-5 acc 46.875 (46.530)	lr 0.02102
Warmup Train [23][120/3239]	Time 0.512 (0.630)	Data 0.001 (0.102)	Loss 4.4545 (4.3535)	Top-1 acc 24.219 (24.606)	Top-5 acc 42.578 (46.449)	lr 0.02102
Warmup Train [23][130/3239]	Time 0.476 (0.617)	Data 0.001 (0.095)	Loss 4.2810 (4.3575)	Top-1 acc 23.828 (24.541)	Top-5 acc 49.219 (46.416)	lr 0.02101
Warmup Train [23][140/3239]	Time 0.409 (0.611)	Data 0.001 (0.089)	Loss 4.4266 (4.3564)	Top-1 acc 21.875 (24.576)	Top-5 acc 45.312 (46.473)	lr 0.02101
Warmup Train [23][150/3239]	Time 0.515 (0.604)	Data 0.001 (0.084)	Loss 4.3383 (4.3541)	Top-1 acc 23.047 (24.596)	Top-5 acc 48.438 (46.523)	lr 0.02100
Warmup Train [23][160/3239]	Time 0.423 (0.598)	Data 0.001 (0.079)	Loss 4.3684 (4.3571)	Top-1 acc 25.781 (24.529)	Top-5 acc 47.656 (46.436)	lr 0.02099
Warmup Train [23][170/3239]	Time 0.537 (0.591)	Data 0.001 (0.075)	Loss 4.3802 (4.3584)	Top-1 acc 22.656 (24.493)	Top-5 acc 44.531 (46.441)	lr 0.02099
Warmup Train [23][180/3239]	Time 0.534 (0.587)	Data 0.002 (0.071)	Loss 4.5238 (4.3590)	Top-1 acc 19.141 (24.422)	Top-5 acc 42.188 (46.463)	lr 0.02098
Warmup Train [23][190/3239]	Time 0.425 (0.580)	Data 0.001 (0.067)	Loss 4.5006 (4.3589)	Top-1 acc 19.922 (24.391)	Top-5 acc 43.359 (46.519)	lr 0.02098
Warmup Train [23][200/3239]	Time 0.673 (0.578)	Data 0.001 (0.064)	Loss 4.3287 (4.3594)	Top-1 acc 25.781 (24.384)	Top-5 acc 49.609 (46.537)	lr 0.02097
Warmup Train [23][210/3239]	Time 0.584 (0.576)	Data 0.001 (0.061)	Loss 4.2802 (4.3588)	Top-1 acc 24.609 (24.324)	Top-5 acc 50.391 (46.562)	lr 0.02096
Warmup Train [23][220/3239]	Time 0.512 (0.573)	Data 0.001 (0.059)	Loss 4.3482 (4.3596)	Top-1 acc 23.438 (24.291)	Top-5 acc 45.312 (46.514)	lr 0.02096
Warmup Train [23][230/3239]	Time 0.486 (0.571)	Data 0.001 (0.056)	Loss 4.2988 (4.3592)	Top-1 acc 25.000 (24.285)	Top-5 acc 48.047 (46.491)	lr 0.02095
Warmup Train [23][240/3239]	Time 0.478 (0.568)	Data 0.001 (0.054)	Loss 4.4835 (4.3613)	Top-1 acc 20.703 (24.264)	Top-5 acc 43.359 (46.476)	lr 0.02095
Warmup Train [23][250/3239]	Time 0.436 (0.565)	Data 0.001 (0.052)	Loss 4.5840 (4.3630)	Top-1 acc 21.484 (24.264)	Top-5 acc 42.578 (46.455)	lr 0.02094
Warmup Train [23][260/3239]	Time 0.585 (0.564)	Data 0.001 (0.051)	Loss 4.2188 (4.3616)	Top-1 acc 26.953 (24.298)	Top-5 acc 46.484 (46.466)	lr 0.02093
Warmup Train [23][270/3239]	Time 0.459 (0.562)	Data 0.001 (0.049)	Loss 4.4104 (4.3618)	Top-1 acc 21.484 (24.272)	Top-5 acc 44.922 (46.464)	lr 0.02093
Warmup Train [23][280/3239]	Time 0.501 (0.560)	Data 0.001 (0.047)	Loss 4.3726 (4.3602)	Top-1 acc 23.828 (24.299)	Top-5 acc 48.828 (46.497)	lr 0.02092
Warmup Train [23][290/3239]	Time 0.474 (0.560)	Data 0.001 (0.046)	Loss 4.3471 (4.3599)	Top-1 acc 25.391 (24.318)	Top-5 acc 46.875 (46.507)	lr 0.02092
Warmup Train [23][300/3239]	Time 0.637 (0.558)	Data 0.001 (0.045)	Loss 4.3645 (4.3610)	Top-1 acc 25.781 (24.313)	Top-5 acc 48.438 (46.486)	lr 0.02091
Warmup Train [23][310/3239]	Time 0.505 (0.556)	Data 0.001 (0.043)	Loss 4.2566 (4.3610)	Top-1 acc 26.562 (24.315)	Top-5 acc 50.000 (46.459)	lr 0.02090
Warmup Train [23][320/3239]	Time 0.582 (0.555)	Data 0.001 (0.042)	Loss 4.3320 (4.3602)	Top-1 acc 28.516 (24.329)	Top-5 acc 46.094 (46.465)	lr 0.02090
Warmup Train [23][330/3239]	Time 0.353 (0.554)	Data 0.001 (0.041)	Loss 4.3643 (4.3613)	Top-1 acc 25.391 (24.323)	Top-5 acc 46.094 (46.424)	lr 0.02089
Warmup Train [23][340/3239]	Time 0.526 (0.553)	Data 0.001 (0.040)	Loss 4.3990 (4.3621)	Top-1 acc 23.047 (24.312)	Top-5 acc 46.484 (46.403)	lr 0.02089
Warmup Train [23][350/3239]	Time 0.507 (0.552)	Data 0.001 (0.039)	Loss 4.4415 (4.3639)	Top-1 acc 23.438 (24.272)	Top-5 acc 42.969 (46.358)	lr 0.02088
Warmup Train [23][360/3239]	Time 0.550 (0.551)	Data 0.001 (0.038)	Loss 4.4140 (4.3630)	Top-1 acc 23.047 (24.290)	Top-5 acc 45.312 (46.409)	lr 0.02087
Warmup Train [23][370/3239]	Time 0.552 (0.550)	Data 0.001 (0.037)	Loss 4.4467 (4.3631)	Top-1 acc 24.219 (24.285)	Top-5 acc 44.141 (46.383)	lr 0.02087
Warmup Train [23][380/3239]	Time 0.655 (0.549)	Data 0.001 (0.036)	Loss 4.2798 (4.3642)	Top-1 acc 28.125 (24.252)	Top-5 acc 48.047 (46.346)	lr 0.02086
Warmup Train [23][390/3239]	Time 0.651 (0.548)	Data 0.001 (0.035)	Loss 4.3776 (4.3645)	Top-1 acc 26.953 (24.251)	Top-5 acc 49.609 (46.357)	lr 0.02086
Warmup Train [23][400/3239]	Time 0.509 (0.546)	Data 0.001 (0.035)	Loss 4.2903 (4.3634)	Top-1 acc 23.828 (24.298)	Top-5 acc 47.656 (46.388)	lr 0.02085
Warmup Train [23][410/3239]	Time 0.524 (0.545)	Data 0.001 (0.034)	Loss 4.3004 (4.3620)	Top-1 acc 30.469 (24.307)	Top-5 acc 44.922 (46.432)	lr 0.02084
Warmup Train [23][420/3239]	Time 0.435 (0.545)	Data 0.001 (0.033)	Loss 4.2570 (4.3616)	Top-1 acc 26.953 (24.271)	Top-5 acc 49.609 (46.430)	lr 0.02084
Warmup Train [23][430/3239]	Time 0.407 (0.542)	Data 0.002 (0.033)	Loss 4.3937 (4.3616)	Top-1 acc 20.703 (24.256)	Top-5 acc 45.703 (46.428)	lr 0.02083
Warmup Train [23][440/3239]	Time 0.380 (0.542)	Data 0.002 (0.032)	Loss 4.3246 (4.3606)	Top-1 acc 26.172 (24.277)	Top-5 acc 50.000 (46.473)	lr 0.02083
Warmup Train [23][450/3239]	Time 0.490 (0.541)	Data 0.001 (0.032)	Loss 4.2102 (4.3601)	Top-1 acc 28.516 (24.299)	Top-5 acc 49.609 (46.493)	lr 0.02082
Warmup Train [23][460/3239]	Time 0.500 (0.541)	Data 0.001 (0.031)	Loss 4.5403 (4.3600)	Top-1 acc 19.141 (24.292)	Top-5 acc 39.453 (46.501)	lr 0.02081
Warmup Train [23][470/3239]	Time 0.415 (0.540)	Data 0.001 (0.031)	Loss 4.4606 (4.3603)	Top-1 acc 24.219 (24.310)	Top-5 acc 41.797 (46.461)	lr 0.02081
Warmup Train [23][480/3239]	Time 0.512 (0.539)	Data 0.001 (0.030)	Loss 4.4876 (4.3610)	Top-1 acc 20.703 (24.289)	Top-5 acc 41.797 (46.452)	lr 0.02080
Warmup Train [23][490/3239]	Time 0.486 (0.539)	Data 0.001 (0.030)	Loss 4.4517 (4.3607)	Top-1 acc 22.656 (24.295)	Top-5 acc 48.047 (46.470)	lr 0.02080
Warmup Train [23][500/3239]	Time 0.541 (0.538)	Data 0.001 (0.029)	Loss 4.5037 (4.3617)	Top-1 acc 24.219 (24.276)	Top-5 acc 43.359 (46.448)	lr 0.02079
Warmup Train [23][510/3239]	Time 0.664 (0.538)	Data 0.001 (0.029)	Loss 4.2599 (4.3613)	Top-1 acc 23.438 (24.268)	Top-5 acc 48.828 (46.460)	lr 0.02078
Warmup Train [23][520/3239]	Time 0.559 (0.537)	Data 0.001 (0.029)	Loss 4.3667 (4.3618)	Top-1 acc 25.000 (24.259)	Top-5 acc 46.484 (46.467)	lr 0.02078
Warmup Train [23][530/3239]	Time 0.500 (0.537)	Data 0.001 (0.028)	Loss 4.3285 (4.3615)	Top-1 acc 24.219 (24.263)	Top-5 acc 46.875 (46.474)	lr 0.02077
Warmup Train [23][540/3239]	Time 0.485 (0.536)	Data 0.001 (0.028)	Loss 4.5703 (4.3614)	Top-1 acc 21.484 (24.268)	Top-5 acc 41.797 (46.480)	lr 0.02077
Warmup Train [23][550/3239]	Time 0.526 (0.535)	Data 0.001 (0.027)	Loss 4.2371 (4.3613)	Top-1 acc 27.344 (24.290)	Top-5 acc 48.047 (46.501)	lr 0.02076
Warmup Train [23][560/3239]	Time 0.536 (0.535)	Data 0.001 (0.027)	Loss 4.3126 (4.3613)	Top-1 acc 22.266 (24.266)	Top-5 acc 48.047 (46.505)	lr 0.02075
Warmup Train [23][570/3239]	Time 0.526 (0.534)	Data 0.001 (0.026)	Loss 4.5691 (4.3612)	Top-1 acc 23.438 (24.265)	Top-5 acc 40.625 (46.504)	lr 0.02075
Warmup Train [23][580/3239]	Time 0.410 (0.533)	Data 0.001 (0.026)	Loss 4.2757 (4.3614)	Top-1 acc 24.609 (24.271)	Top-5 acc 46.484 (46.491)	lr 0.02074
Warmup Train [23][590/3239]	Time 0.434 (0.533)	Data 0.001 (0.026)	Loss 4.2826 (4.3616)	Top-1 acc 24.219 (24.296)	Top-5 acc 46.094 (46.482)	lr 0.02074
Warmup Train [23][600/3239]	Time 0.595 (0.533)	Data 0.001 (0.025)	Loss 4.3898 (4.3602)	Top-1 acc 21.875 (24.318)	Top-5 acc 48.828 (46.511)	lr 0.02073
Warmup Train [23][610/3239]	Time 0.505 (0.533)	Data 0.001 (0.025)	Loss 4.1902 (4.3605)	Top-1 acc 26.953 (24.300)	Top-5 acc 52.344 (46.505)	lr 0.02072
Warmup Train [23][620/3239]	Time 0.667 (0.533)	Data 0.001 (0.025)	Loss 4.5266 (4.3611)	Top-1 acc 26.172 (24.270)	Top-5 acc 38.281 (46.463)	lr 0.02072
Warmup Train [23][630/3239]	Time 0.345 (0.532)	Data 0.001 (0.024)	Loss 4.4113 (4.3615)	Top-1 acc 21.484 (24.267)	Top-5 acc 44.531 (46.461)	lr 0.02071
Warmup Train [23][640/3239]	Time 0.549 (0.531)	Data 0.001 (0.024)	Loss 4.2955 (4.3621)	Top-1 acc 21.875 (24.239)	Top-5 acc 48.438 (46.434)	lr 0.02071
Warmup Train [23][650/3239]	Time 0.306 (0.531)	Data 0.001 (0.024)	Loss 4.4305 (4.3619)	Top-1 acc 23.828 (24.239)	Top-5 acc 46.484 (46.448)	lr 0.02070
Warmup Train [23][660/3239]	Time 0.545 (0.530)	Data 0.001 (0.024)	Loss 4.2020 (4.3612)	Top-1 acc 25.391 (24.242)	Top-5 acc 50.781 (46.453)	lr 0.02069
Warmup Train [23][670/3239]	Time 0.257 (0.529)	Data 0.001 (0.023)	Loss 4.1660 (4.3611)	Top-1 acc 29.688 (24.237)	Top-5 acc 51.953 (46.466)	lr 0.02069
Warmup Train [23][680/3239]	Time 0.612 (0.528)	Data 0.001 (0.023)	Loss 4.3434 (4.3615)	Top-1 acc 22.656 (24.233)	Top-5 acc 50.781 (46.465)	lr 0.02068
Warmup Train [23][690/3239]	Time 0.516 (0.528)	Data 0.001 (0.023)	Loss 4.3804 (4.3615)	Top-1 acc 22.266 (24.223)	Top-5 acc 48.438 (46.457)	lr 0.02068
Warmup Train [23][700/3239]	Time 0.599 (0.528)	Data 0.001 (0.023)	Loss 4.4965 (4.3617)	Top-1 acc 24.219 (24.218)	Top-5 acc 43.750 (46.455)	lr 0.02067
Warmup Train [23][710/3239]	Time 0.608 (0.528)	Data 0.001 (0.022)	Loss 4.2666 (4.3615)	Top-1 acc 25.391 (24.220)	Top-5 acc 44.922 (46.454)	lr 0.02066
Warmup Train [23][720/3239]	Time 0.425 (0.527)	Data 0.001 (0.022)	Loss 4.3315 (4.3612)	Top-1 acc 28.516 (24.238)	Top-5 acc 47.266 (46.472)	lr 0.02066
Warmup Train [23][730/3239]	Time 0.449 (0.527)	Data 0.001 (0.022)	Loss 4.4767 (4.3613)	Top-1 acc 22.266 (24.244)	Top-5 acc 45.312 (46.468)	lr 0.02065
Warmup Train [23][740/3239]	Time 0.360 (0.526)	Data 0.001 (0.022)	Loss 4.2637 (4.3604)	Top-1 acc 23.047 (24.252)	Top-5 acc 47.266 (46.476)	lr 0.02065
Warmup Train [23][750/3239]	Time 0.633 (0.526)	Data 0.001 (0.022)	Loss 4.6099 (4.3612)	Top-1 acc 24.219 (24.239)	Top-5 acc 42.188 (46.466)	lr 0.02064
Warmup Train [23][760/3239]	Time 0.537 (0.526)	Data 0.001 (0.021)	Loss 4.1976 (4.3610)	Top-1 acc 24.609 (24.235)	Top-5 acc 51.172 (46.465)	lr 0.02063
Warmup Train [23][770/3239]	Time 0.540 (0.526)	Data 0.001 (0.021)	Loss 4.4505 (4.3609)	Top-1 acc 22.656 (24.234)	Top-5 acc 45.703 (46.450)	lr 0.02063
Warmup Train [23][780/3239]	Time 0.543 (0.526)	Data 0.001 (0.021)	Loss 4.2078 (4.3610)	Top-1 acc 27.734 (24.230)	Top-5 acc 46.484 (46.436)	lr 0.02062
Warmup Train [23][790/3239]	Time 0.378 (0.526)	Data 0.001 (0.021)	Loss 4.1924 (4.3617)	Top-1 acc 25.781 (24.215)	Top-5 acc 46.484 (46.416)	lr 0.02062
Warmup Train [23][800/3239]	Time 0.560 (0.526)	Data 0.001 (0.020)	Loss 4.2313 (4.3610)	Top-1 acc 26.562 (24.233)	Top-5 acc 46.484 (46.430)	lr 0.02061
Warmup Train [23][810/3239]	Time 0.550 (0.526)	Data 0.001 (0.020)	Loss 4.1740 (4.3602)	Top-1 acc 26.953 (24.248)	Top-5 acc 53.125 (46.450)	lr 0.02061
Warmup Train [23][820/3239]	Time 0.461 (0.526)	Data 0.001 (0.020)	Loss 4.3103 (4.3612)	Top-1 acc 23.438 (24.237)	Top-5 acc 46.484 (46.419)	lr 0.02060
Warmup Train [23][830/3239]	Time 0.515 (0.526)	Data 0.001 (0.020)	Loss 4.3571 (4.3607)	Top-1 acc 22.266 (24.249)	Top-5 acc 44.531 (46.415)	lr 0.02059
Warmup Train [23][840/3239]	Time 0.372 (0.526)	Data 0.001 (0.020)	Loss 4.4310 (4.3605)	Top-1 acc 17.969 (24.234)	Top-5 acc 44.922 (46.417)	lr 0.02059
Warmup Train [23][850/3239]	Time 0.553 (0.526)	Data 0.001 (0.020)	Loss 4.4290 (4.3605)	Top-1 acc 25.391 (24.238)	Top-5 acc 46.094 (46.417)	lr 0.02058
Warmup Train [23][860/3239]	Time 0.501 (0.526)	Data 0.001 (0.019)	Loss 4.5307 (4.3609)	Top-1 acc 19.922 (24.237)	Top-5 acc 45.703 (46.424)	lr 0.02058
Warmup Train [23][870/3239]	Time 0.351 (0.525)	Data 0.001 (0.019)	Loss 4.3347 (4.3611)	Top-1 acc 24.609 (24.245)	Top-5 acc 43.750 (46.429)	lr 0.02057
Warmup Train [23][880/3239]	Time 0.498 (0.525)	Data 0.001 (0.019)	Loss 4.2709 (4.3612)	Top-1 acc 26.172 (24.249)	Top-5 acc 44.922 (46.422)	lr 0.02056
Warmup Train [23][890/3239]	Time 0.561 (0.525)	Data 0.001 (0.019)	Loss 4.1372 (4.3614)	Top-1 acc 27.344 (24.260)	Top-5 acc 52.734 (46.426)	lr 0.02056
Warmup Train [23][900/3239]	Time 0.362 (0.524)	Data 0.001 (0.019)	Loss 4.4180 (4.3607)	Top-1 acc 23.828 (24.278)	Top-5 acc 46.875 (46.441)	lr 0.02055
Warmup Train [23][910/3239]	Time 0.333 (0.524)	Data 0.001 (0.019)	Loss 4.4458 (4.3612)	Top-1 acc 23.828 (24.271)	Top-5 acc 45.703 (46.431)	lr 0.02055
Warmup Train [23][920/3239]	Time 0.442 (0.523)	Data 0.001 (0.019)	Loss 4.4065 (4.3613)	Top-1 acc 26.562 (24.273)	Top-5 acc 45.312 (46.440)	lr 0.02054
Warmup Train [23][930/3239]	Time 0.588 (0.523)	Data 0.001 (0.019)	Loss 4.2232 (4.3608)	Top-1 acc 25.000 (24.268)	Top-5 acc 47.656 (46.443)	lr 0.02053
Warmup Train [23][940/3239]	Time 0.533 (0.523)	Data 0.001 (0.019)	Loss 4.7995 (4.3615)	Top-1 acc 21.484 (24.261)	Top-5 acc 39.844 (46.431)	lr 0.02053
Warmup Train [23][950/3239]	Time 0.481 (0.523)	Data 0.001 (0.019)	Loss 4.3691 (4.3612)	Top-1 acc 22.656 (24.267)	Top-5 acc 46.875 (46.438)	lr 0.02052
Warmup Train [23][960/3239]	Time 0.425 (0.523)	Data 0.001 (0.019)	Loss 4.4908 (4.3612)	Top-1 acc 20.703 (24.272)	Top-5 acc 43.359 (46.443)	lr 0.02052
Warmup Train [23][970/3239]	Time 0.549 (0.523)	Data 0.001 (0.019)	Loss 4.2687 (4.3608)	Top-1 acc 25.391 (24.269)	Top-5 acc 48.828 (46.453)	lr 0.02051
Warmup Train [23][980/3239]	Time 0.466 (0.523)	Data 0.002 (0.019)	Loss 4.4708 (4.3607)	Top-1 acc 19.141 (24.250)	Top-5 acc 44.922 (46.438)	lr 0.02050
Warmup Train [23][990/3239]	Time 0.560 (0.523)	Data 0.001 (0.019)	Loss 4.3724 (4.3603)	Top-1 acc 25.781 (24.253)	Top-5 acc 43.359 (46.445)	lr 0.02050
Warmup Train [23][1000/3239]	Time 0.547 (0.523)	Data 0.001 (0.018)	Loss 4.4362 (4.3599)	Top-1 acc 20.703 (24.257)	Top-5 acc 42.969 (46.459)	lr 0.02049
Warmup Train [23][1010/3239]	Time 0.510 (0.523)	Data 0.001 (0.018)	Loss 4.2652 (4.3598)	Top-1 acc 25.000 (24.266)	Top-5 acc 48.828 (46.476)	lr 0.02049
Warmup Train [23][1020/3239]	Time 0.531 (0.522)	Data 0.001 (0.018)	Loss 4.4338 (4.3599)	Top-1 acc 26.562 (24.264)	Top-5 acc 45.312 (46.479)	lr 0.02048
Warmup Train [23][1030/3239]	Time 0.433 (0.522)	Data 0.001 (0.018)	Loss 4.3429 (4.3596)	Top-1 acc 25.781 (24.277)	Top-5 acc 48.438 (46.486)	lr 0.02047
Warmup Train [23][1040/3239]	Time 0.654 (0.522)	Data 0.001 (0.018)	Loss 4.5831 (4.3605)	Top-1 acc 21.094 (24.273)	Top-5 acc 38.672 (46.468)	lr 0.02047
Warmup Train [23][1050/3239]	Time 0.543 (0.522)	Data 0.001 (0.018)	Loss 4.3692 (4.3600)	Top-1 acc 23.047 (24.278)	Top-5 acc 45.312 (46.473)	lr 0.02046
Warmup Train [23][1060/3239]	Time 0.420 (0.522)	Data 0.001 (0.018)	Loss 4.4348 (4.3599)	Top-1 acc 22.656 (24.273)	Top-5 acc 45.703 (46.483)	lr 0.02046
Warmup Train [23][1070/3239]	Time 0.562 (0.522)	Data 0.001 (0.017)	Loss 4.3138 (4.3596)	Top-1 acc 25.781 (24.277)	Top-5 acc 48.828 (46.496)	lr 0.02045
Warmup Train [23][1080/3239]	Time 0.420 (0.522)	Data 0.001 (0.017)	Loss 4.2920 (4.3594)	Top-1 acc 25.000 (24.285)	Top-5 acc 42.578 (46.483)	lr 0.02044
Warmup Train [23][1090/3239]	Time 0.525 (0.522)	Data 0.001 (0.017)	Loss 4.3503 (4.3597)	Top-1 acc 26.172 (24.282)	Top-5 acc 44.922 (46.485)	lr 0.02044
Warmup Train [23][1100/3239]	Time 0.499 (0.522)	Data 0.001 (0.017)	Loss 4.3826 (4.3600)	Top-1 acc 21.875 (24.273)	Top-5 acc 48.828 (46.492)	lr 0.02043
Warmup Train [23][1110/3239]	Time 0.556 (0.522)	Data 0.001 (0.017)	Loss 4.1115 (4.3597)	Top-1 acc 28.516 (24.277)	Top-5 acc 49.219 (46.491)	lr 0.02043
Warmup Train [23][1120/3239]	Time 0.200 (0.521)	Data 0.001 (0.017)	Loss 4.4624 (4.3596)	Top-1 acc 20.703 (24.284)	Top-5 acc 44.141 (46.499)	lr 0.02042
Warmup Train [23][1130/3239]	Time 0.583 (0.521)	Data 0.001 (0.017)	Loss 4.3180 (4.3599)	Top-1 acc 27.344 (24.278)	Top-5 acc 46.875 (46.486)	lr 0.02041
Warmup Train [23][1140/3239]	Time 0.404 (0.521)	Data 0.001 (0.017)	Loss 4.2387 (4.3600)	Top-1 acc 29.297 (24.279)	Top-5 acc 51.953 (46.482)	lr 0.02041
Warmup Train [23][1150/3239]	Time 0.534 (0.520)	Data 0.001 (0.017)	Loss 4.3120 (4.3598)	Top-1 acc 26.562 (24.288)	Top-5 acc 46.484 (46.481)	lr 0.02040
Warmup Train [23][1160/3239]	Time 0.560 (0.520)	Data 0.001 (0.017)	Loss 4.3019 (4.3595)	Top-1 acc 24.609 (24.295)	Top-5 acc 45.703 (46.489)	lr 0.02040
Warmup Train [23][1170/3239]	Time 0.628 (0.520)	Data 0.001 (0.017)	Loss 4.2525 (4.3593)	Top-1 acc 28.516 (24.304)	Top-5 acc 48.047 (46.500)	lr 0.02039
Warmup Train [23][1180/3239]	Time 0.578 (0.520)	Data 0.001 (0.016)	Loss 4.3521 (4.3596)	Top-1 acc 23.828 (24.294)	Top-5 acc 43.750 (46.486)	lr 0.02038
Warmup Train [23][1190/3239]	Time 0.583 (0.520)	Data 0.001 (0.016)	Loss 4.1625 (4.3595)	Top-1 acc 29.688 (24.295)	Top-5 acc 48.047 (46.485)	lr 0.02038
Warmup Train [23][1200/3239]	Time 0.476 (0.520)	Data 0.001 (0.016)	Loss 4.2956 (4.3595)	Top-1 acc 22.656 (24.296)	Top-5 acc 47.266 (46.479)	lr 0.02037
Warmup Train [23][1210/3239]	Time 0.494 (0.520)	Data 0.001 (0.016)	Loss 4.3091 (4.3595)	Top-1 acc 25.781 (24.298)	Top-5 acc 48.047 (46.482)	lr 0.02037
Warmup Train [23][1220/3239]	Time 0.472 (0.520)	Data 0.001 (0.016)	Loss 4.5195 (4.3598)	Top-1 acc 20.312 (24.293)	Top-5 acc 42.578 (46.472)	lr 0.02036
Warmup Train [23][1230/3239]	Time 0.606 (0.520)	Data 0.001 (0.016)	Loss 4.2407 (4.3597)	Top-1 acc 26.562 (24.306)	Top-5 acc 46.484 (46.474)	lr 0.02035
Warmup Train [23][1240/3239]	Time 0.490 (0.520)	Data 0.001 (0.016)	Loss 4.3812 (4.3594)	Top-1 acc 23.438 (24.317)	Top-5 acc 46.875 (46.477)	lr 0.02035
Warmup Train [23][1250/3239]	Time 0.323 (0.520)	Data 0.001 (0.016)	Loss 4.4768 (4.3597)	Top-1 acc 23.438 (24.314)	Top-5 acc 43.750 (46.482)	lr 0.02034
Warmup Train [23][1260/3239]	Time 0.511 (0.520)	Data 0.001 (0.016)	Loss 4.3062 (4.3594)	Top-1 acc 23.047 (24.316)	Top-5 acc 44.141 (46.486)	lr 0.02034
Warmup Train [23][1270/3239]	Time 0.470 (0.520)	Data 0.001 (0.016)	Loss 4.3077 (4.3592)	Top-1 acc 20.703 (24.316)	Top-5 acc 48.438 (46.487)	lr 0.02033
Warmup Train [23][1280/3239]	Time 0.467 (0.519)	Data 0.001 (0.016)	Loss 4.2840 (4.3588)	Top-1 acc 21.484 (24.318)	Top-5 acc 45.703 (46.492)	lr 0.02032
Warmup Train [23][1290/3239]	Time 0.444 (0.519)	Data 0.001 (0.016)	Loss 4.2702 (4.3584)	Top-1 acc 24.609 (24.318)	Top-5 acc 48.438 (46.503)	lr 0.02032
Warmup Train [23][1300/3239]	Time 0.543 (0.519)	Data 0.001 (0.016)	Loss 4.3115 (4.3582)	Top-1 acc 27.734 (24.326)	Top-5 acc 49.219 (46.509)	lr 0.02031
Warmup Train [23][1310/3239]	Time 0.622 (0.519)	Data 0.001 (0.015)	Loss 4.3662 (4.3581)	Top-1 acc 21.484 (24.324)	Top-5 acc 44.531 (46.516)	lr 0.02031
Warmup Train [23][1320/3239]	Time 0.590 (0.519)	Data 0.001 (0.015)	Loss 4.3356 (4.3584)	Top-1 acc 24.609 (24.317)	Top-5 acc 48.828 (46.512)	lr 0.02030
Warmup Train [23][1330/3239]	Time 0.566 (0.519)	Data 0.001 (0.015)	Loss 4.2043 (4.3583)	Top-1 acc 28.516 (24.315)	Top-5 acc 51.953 (46.517)	lr 0.02030
Warmup Train [23][1340/3239]	Time 0.376 (0.519)	Data 0.001 (0.015)	Loss 4.2206 (4.3581)	Top-1 acc 25.000 (24.320)	Top-5 acc 47.656 (46.521)	lr 0.02029
Warmup Train [23][1350/3239]	Time 0.443 (0.519)	Data 0.001 (0.015)	Loss 4.3150 (4.3581)	Top-1 acc 25.391 (24.321)	Top-5 acc 46.875 (46.516)	lr 0.02028
Warmup Train [23][1360/3239]	Time 0.632 (0.519)	Data 0.001 (0.015)	Loss 4.3118 (4.3576)	Top-1 acc 24.219 (24.326)	Top-5 acc 47.656 (46.524)	lr 0.02028
Warmup Train [23][1370/3239]	Time 0.668 (0.519)	Data 0.001 (0.015)	Loss 4.4341 (4.3575)	Top-1 acc 24.609 (24.326)	Top-5 acc 45.312 (46.525)	lr 0.02027
Warmup Train [23][1380/3239]	Time 0.226 (0.518)	Data 0.001 (0.015)	Loss 4.4692 (4.3577)	Top-1 acc 22.656 (24.321)	Top-5 acc 43.750 (46.519)	lr 0.02027
Warmup Train [23][1390/3239]	Time 0.546 (0.518)	Data 0.001 (0.015)	Loss 4.4253 (4.3578)	Top-1 acc 17.578 (24.318)	Top-5 acc 45.312 (46.518)	lr 0.02026
Warmup Train [23][1400/3239]	Time 0.307 (0.518)	Data 0.001 (0.015)	Loss 4.1274 (4.3574)	Top-1 acc 27.734 (24.322)	Top-5 acc 52.344 (46.526)	lr 0.02025
Warmup Train [23][1410/3239]	Time 0.432 (0.517)	Data 0.002 (0.015)	Loss 4.2747 (4.3564)	Top-1 acc 25.781 (24.342)	Top-5 acc 46.875 (46.549)	lr 0.02025
Warmup Train [23][1420/3239]	Time 0.453 (0.518)	Data 0.001 (0.015)	Loss 4.3020 (4.3559)	Top-1 acc 22.656 (24.350)	Top-5 acc 49.609 (46.560)	lr 0.02024
Warmup Train [23][1430/3239]	Time 0.682 (0.518)	Data 0.001 (0.015)	Loss 4.3980 (4.3559)	Top-1 acc 22.266 (24.354)	Top-5 acc 44.531 (46.559)	lr 0.02024
Warmup Train [23][1440/3239]	Time 0.718 (0.518)	Data 0.001 (0.015)	Loss 4.2645 (4.3553)	Top-1 acc 27.344 (24.372)	Top-5 acc 46.484 (46.578)	lr 0.02023
Warmup Train [23][1450/3239]	Time 0.399 (0.518)	Data 0.001 (0.015)	Loss 4.3270 (4.3551)	Top-1 acc 26.562 (24.377)	Top-5 acc 47.656 (46.581)	lr 0.02022
Warmup Train [23][1460/3239]	Time 0.480 (0.518)	Data 0.001 (0.015)	Loss 4.2431 (4.3547)	Top-1 acc 28.906 (24.384)	Top-5 acc 50.391 (46.592)	lr 0.02022
Warmup Train [23][1470/3239]	Time 0.515 (0.518)	Data 0.001 (0.015)	Loss 4.1780 (4.3544)	Top-1 acc 25.391 (24.385)	Top-5 acc 50.391 (46.608)	lr 0.02021
Warmup Train [23][1480/3239]	Time 0.527 (0.517)	Data 0.001 (0.014)	Loss 4.4427 (4.3552)	Top-1 acc 23.828 (24.372)	Top-5 acc 45.703 (46.591)	lr 0.02021
Warmup Train [23][1490/3239]	Time 0.729 (0.517)	Data 0.001 (0.014)	Loss 4.3392 (4.3552)	Top-1 acc 24.219 (24.374)	Top-5 acc 42.969 (46.588)	lr 0.02020
Warmup Train [23][1500/3239]	Time 0.335 (0.517)	Data 0.001 (0.014)	Loss 4.5178 (4.3554)	Top-1 acc 20.312 (24.370)	Top-5 acc 42.969 (46.585)	lr 0.02019
Warmup Train [23][1510/3239]	Time 0.497 (0.517)	Data 0.001 (0.014)	Loss 4.5367 (4.3555)	Top-1 acc 20.312 (24.371)	Top-5 acc 46.094 (46.586)	lr 0.02019
Warmup Train [23][1520/3239]	Time 0.504 (0.517)	Data 0.001 (0.014)	Loss 4.2051 (4.3557)	Top-1 acc 25.391 (24.370)	Top-5 acc 48.438 (46.579)	lr 0.02018
Warmup Train [23][1530/3239]	Time 0.491 (0.517)	Data 0.001 (0.014)	Loss 4.3204 (4.3558)	Top-1 acc 25.391 (24.376)	Top-5 acc 47.266 (46.571)	lr 0.02018
Warmup Train [23][1540/3239]	Time 0.372 (0.517)	Data 0.001 (0.014)	Loss 4.4096 (4.3560)	Top-1 acc 23.828 (24.375)	Top-5 acc 45.312 (46.567)	lr 0.02017
Warmup Train [23][1550/3239]	Time 0.480 (0.517)	Data 0.001 (0.014)	Loss 4.3541 (4.3562)	Top-1 acc 22.266 (24.372)	Top-5 acc 47.266 (46.566)	lr 0.02016
Warmup Train [23][1560/3239]	Time 0.539 (0.517)	Data 0.003 (0.014)	Loss 4.4462 (4.3559)	Top-1 acc 24.219 (24.380)	Top-5 acc 44.922 (46.573)	lr 0.02016
Warmup Train [23][1570/3239]	Time 0.431 (0.517)	Data 0.001 (0.014)	Loss 4.3336 (4.3558)	Top-1 acc 23.438 (24.378)	Top-5 acc 49.219 (46.580)	lr 0.02015
Warmup Train [23][1580/3239]	Time 0.537 (0.517)	Data 0.001 (0.014)	Loss 4.3200 (4.3557)	Top-1 acc 26.172 (24.377)	Top-5 acc 46.094 (46.580)	lr 0.02015
Warmup Train [23][1590/3239]	Time 0.561 (0.517)	Data 0.001 (0.014)	Loss 4.2156 (4.3558)	Top-1 acc 24.219 (24.367)	Top-5 acc 50.000 (46.572)	lr 0.02014
Warmup Train [23][1600/3239]	Time 0.505 (0.517)	Data 0.001 (0.014)	Loss 4.2970 (4.3559)	Top-1 acc 26.953 (24.365)	Top-5 acc 47.266 (46.574)	lr 0.02013
Warmup Train [23][1610/3239]	Time 0.521 (0.517)	Data 0.001 (0.014)	Loss 4.5078 (4.3560)	Top-1 acc 23.828 (24.359)	Top-5 acc 48.047 (46.573)	lr 0.02013
Warmup Train [23][1620/3239]	Time 0.548 (0.517)	Data 0.001 (0.014)	Loss 4.2199 (4.3560)	Top-1 acc 26.172 (24.359)	Top-5 acc 46.094 (46.571)	lr 0.02012
Warmup Train [23][1630/3239]	Time 0.471 (0.517)	Data 0.001 (0.014)	Loss 4.5361 (4.3565)	Top-1 acc 23.828 (24.355)	Top-5 acc 42.188 (46.561)	lr 0.02012
Warmup Train [23][1640/3239]	Time 0.638 (0.516)	Data 0.001 (0.014)	Loss 4.3761 (4.3569)	Top-1 acc 23.828 (24.352)	Top-5 acc 44.922 (46.556)	lr 0.02011
Warmup Train [23][1650/3239]	Time 0.491 (0.516)	Data 0.001 (0.013)	Loss 4.1372 (4.3565)	Top-1 acc 25.781 (24.363)	Top-5 acc 51.562 (46.565)	lr 0.02010
Warmup Train [23][1660/3239]	Time 0.695 (0.516)	Data 0.001 (0.013)	Loss 4.3484 (4.3563)	Top-1 acc 23.828 (24.361)	Top-5 acc 46.484 (46.570)	lr 0.02010
Warmup Train [23][1670/3239]	Time 0.600 (0.516)	Data 0.001 (0.013)	Loss 4.1771 (4.3563)	Top-1 acc 24.219 (24.355)	Top-5 acc 48.828 (46.568)	lr 0.02009
Warmup Train [23][1680/3239]	Time 0.540 (0.516)	Data 0.001 (0.013)	Loss 4.3747 (4.3565)	Top-1 acc 25.391 (24.353)	Top-5 acc 46.094 (46.565)	lr 0.02009
Warmup Train [23][1690/3239]	Time 0.752 (0.516)	Data 0.001 (0.013)	Loss 4.4537 (4.3563)	Top-1 acc 23.047 (24.360)	Top-5 acc 44.141 (46.566)	lr 0.02008
Warmup Train [23][1700/3239]	Time 0.598 (0.516)	Data 0.001 (0.013)	Loss 4.1629 (4.3561)	Top-1 acc 25.781 (24.359)	Top-5 acc 51.562 (46.571)	lr 0.02008
Warmup Train [23][1710/3239]	Time 0.505 (0.516)	Data 0.001 (0.013)	Loss 4.5097 (4.3559)	Top-1 acc 22.266 (24.361)	Top-5 acc 44.922 (46.573)	lr 0.02007
Warmup Train [23][1720/3239]	Time 0.406 (0.516)	Data 0.001 (0.013)	Loss 4.3732 (4.3561)	Top-1 acc 23.047 (24.364)	Top-5 acc 49.219 (46.571)	lr 0.02006
Warmup Train [23][1730/3239]	Time 0.486 (0.516)	Data 0.001 (0.013)	Loss 4.3244 (4.3560)	Top-1 acc 23.438 (24.365)	Top-5 acc 50.000 (46.575)	lr 0.02006
Warmup Train [23][1740/3239]	Time 0.358 (0.516)	Data 0.001 (0.013)	Loss 4.3550 (4.3558)	Top-1 acc 25.000 (24.363)	Top-5 acc 45.312 (46.577)	lr 0.02005
Warmup Train [23][1750/3239]	Time 0.423 (0.516)	Data 0.001 (0.013)	Loss 4.3891 (4.3557)	Top-1 acc 22.656 (24.364)	Top-5 acc 45.703 (46.580)	lr 0.02005
Warmup Train [23][1760/3239]	Time 0.524 (0.516)	Data 0.001 (0.013)	Loss 4.1628 (4.3559)	Top-1 acc 26.953 (24.361)	Top-5 acc 48.828 (46.570)	lr 0.02004
Warmup Train [23][1770/3239]	Time 0.537 (0.516)	Data 0.002 (0.013)	Loss 4.4566 (4.3560)	Top-1 acc 25.781 (24.362)	Top-5 acc 43.750 (46.567)	lr 0.02003
Warmup Train [23][1780/3239]	Time 0.568 (0.516)	Data 0.001 (0.013)	Loss 4.5658 (4.3561)	Top-1 acc 20.312 (24.362)	Top-5 acc 35.938 (46.558)	lr 0.02003
Warmup Train [23][1790/3239]	Time 0.545 (0.516)	Data 0.027 (0.013)	Loss 4.2359 (4.3562)	Top-1 acc 25.391 (24.360)	Top-5 acc 50.000 (46.554)	lr 0.02002
Warmup Train [23][1800/3239]	Time 0.328 (0.516)	Data 0.001 (0.013)	Loss 4.3432 (4.3561)	Top-1 acc 28.516 (24.368)	Top-5 acc 45.703 (46.556)	lr 0.02002
Warmup Train [23][1810/3239]	Time 0.354 (0.516)	Data 0.002 (0.013)	Loss 4.2051 (4.3559)	Top-1 acc 27.344 (24.371)	Top-5 acc 49.609 (46.561)	lr 0.02001
Warmup Train [23][1820/3239]	Time 0.600 (0.516)	Data 0.001 (0.013)	Loss 4.3346 (4.3558)	Top-1 acc 24.219 (24.377)	Top-5 acc 46.484 (46.565)	lr 0.02000
Warmup Train [23][1830/3239]	Time 0.638 (0.516)	Data 0.001 (0.013)	Loss 4.2980 (4.3556)	Top-1 acc 21.875 (24.380)	Top-5 acc 45.703 (46.566)	lr 0.02000
Warmup Train [23][1840/3239]	Time 0.382 (0.516)	Data 0.001 (0.013)	Loss 4.3356 (4.3554)	Top-1 acc 20.703 (24.381)	Top-5 acc 46.094 (46.572)	lr 0.01999
Warmup Train [23][1850/3239]	Time 0.320 (0.516)	Data 0.001 (0.013)	Loss 4.4641 (4.3554)	Top-1 acc 23.438 (24.381)	Top-5 acc 44.531 (46.574)	lr 0.01999
Warmup Train [23][1860/3239]	Time 0.570 (0.516)	Data 0.001 (0.013)	Loss 4.3642 (4.3554)	Top-1 acc 25.000 (24.381)	Top-5 acc 43.750 (46.567)	lr 0.01998
Warmup Train [23][1870/3239]	Time 0.380 (0.516)	Data 0.001 (0.013)	Loss 4.3164 (4.3556)	Top-1 acc 24.219 (24.377)	Top-5 acc 48.438 (46.566)	lr 0.01997
Warmup Train [23][1880/3239]	Time 0.394 (0.516)	Data 0.001 (0.013)	Loss 4.5229 (4.3555)	Top-1 acc 23.828 (24.383)	Top-5 acc 46.484 (46.566)	lr 0.01997
Warmup Train [23][1890/3239]	Time 0.714 (0.516)	Data 0.001 (0.013)	Loss 4.2567 (4.3555)	Top-1 acc 24.219 (24.383)	Top-5 acc 48.828 (46.565)	lr 0.01996
Warmup Train [23][1900/3239]	Time 0.502 (0.516)	Data 0.002 (0.013)	Loss 4.1218 (4.3550)	Top-1 acc 25.391 (24.394)	Top-5 acc 47.656 (46.571)	lr 0.01996
Warmup Train [23][1910/3239]	Time 0.411 (0.516)	Data 0.002 (0.013)	Loss 4.3644 (4.3551)	Top-1 acc 24.219 (24.391)	Top-5 acc 48.828 (46.571)	lr 0.01995
Warmup Train [23][1920/3239]	Time 0.442 (0.516)	Data 0.001 (0.013)	Loss 4.3068 (4.3553)	Top-1 acc 26.562 (24.391)	Top-5 acc 50.391 (46.572)	lr 0.01994
Warmup Train [23][1930/3239]	Time 0.509 (0.516)	Data 0.001 (0.013)	Loss 4.3567 (4.3554)	Top-1 acc 23.438 (24.387)	Top-5 acc 45.312 (46.572)	lr 0.01994
Warmup Train [23][1940/3239]	Time 0.422 (0.516)	Data 0.001 (0.012)	Loss 4.4475 (4.3555)	Top-1 acc 23.438 (24.395)	Top-5 acc 42.969 (46.575)	lr 0.01993
Warmup Train [23][1950/3239]	Time 0.365 (0.516)	Data 0.001 (0.012)	Loss 4.3983 (4.3556)	Top-1 acc 24.609 (24.391)	Top-5 acc 50.391 (46.574)	lr 0.01993
Warmup Train [23][1960/3239]	Time 0.507 (0.516)	Data 0.001 (0.012)	Loss 4.3938 (4.3555)	Top-1 acc 21.484 (24.393)	Top-5 acc 42.969 (46.573)	lr 0.01992
Warmup Train [23][1970/3239]	Time 0.510 (0.516)	Data 0.001 (0.012)	Loss 4.3253 (4.3551)	Top-1 acc 23.438 (24.395)	Top-5 acc 49.219 (46.584)	lr 0.01991
Warmup Train [23][1980/3239]	Time 0.440 (0.516)	Data 0.001 (0.012)	Loss 4.5085 (4.3550)	Top-1 acc 19.141 (24.397)	Top-5 acc 41.406 (46.584)	lr 0.01991
Warmup Train [23][1990/3239]	Time 0.515 (0.516)	Data 0.001 (0.012)	Loss 4.1060 (4.3547)	Top-1 acc 28.906 (24.398)	Top-5 acc 53.125 (46.584)	lr 0.01990
Warmup Train [23][2000/3239]	Time 0.393 (0.516)	Data 0.001 (0.012)	Loss 4.4229 (4.3544)	Top-1 acc 20.312 (24.396)	Top-5 acc 43.359 (46.587)	lr 0.01990
Warmup Train [23][2010/3239]	Time 0.552 (0.516)	Data 0.001 (0.012)	Loss 4.3432 (4.3544)	Top-1 acc 20.703 (24.399)	Top-5 acc 46.094 (46.588)	lr 0.01989
Warmup Train [23][2020/3239]	Time 0.597 (0.516)	Data 0.001 (0.012)	Loss 4.5072 (4.3546)	Top-1 acc 21.484 (24.388)	Top-5 acc 44.922 (46.588)	lr 0.01989
Warmup Train [23][2030/3239]	Time 0.381 (0.516)	Data 0.001 (0.012)	Loss 4.4336 (4.3543)	Top-1 acc 21.094 (24.387)	Top-5 acc 45.312 (46.597)	lr 0.01988
Warmup Train [23][2040/3239]	Time 0.561 (0.516)	Data 0.001 (0.012)	Loss 4.3969 (4.3540)	Top-1 acc 19.531 (24.392)	Top-5 acc 46.094 (46.604)	lr 0.01987
Warmup Train [23][2050/3239]	Time 0.583 (0.516)	Data 0.001 (0.012)	Loss 4.2165 (4.3540)	Top-1 acc 24.609 (24.389)	Top-5 acc 47.656 (46.601)	lr 0.01987
Warmup Train [23][2060/3239]	Time 0.376 (0.516)	Data 0.001 (0.012)	Loss 4.1783 (4.3541)	Top-1 acc 27.734 (24.388)	Top-5 acc 50.000 (46.602)	lr 0.01986
Warmup Train [23][2070/3239]	Time 0.648 (0.516)	Data 0.001 (0.012)	Loss 4.2897 (4.3538)	Top-1 acc 27.344 (24.392)	Top-5 acc 46.875 (46.607)	lr 0.01986
Warmup Train [23][2080/3239]	Time 0.378 (0.516)	Data 0.001 (0.012)	Loss 4.4262 (4.3536)	Top-1 acc 25.000 (24.395)	Top-5 acc 46.094 (46.611)	lr 0.01985
Warmup Train [23][2090/3239]	Time 0.491 (0.516)	Data 0.001 (0.012)	Loss 4.3351 (4.3538)	Top-1 acc 22.656 (24.389)	Top-5 acc 44.531 (46.607)	lr 0.01984
Warmup Train [23][2100/3239]	Time 0.695 (0.516)	Data 0.001 (0.012)	Loss 4.3058 (4.3539)	Top-1 acc 24.609 (24.389)	Top-5 acc 48.828 (46.606)	lr 0.01984
Warmup Train [23][2110/3239]	Time 0.550 (0.516)	Data 0.001 (0.012)	Loss 4.2680 (4.3537)	Top-1 acc 25.000 (24.396)	Top-5 acc 48.438 (46.613)	lr 0.01983
Warmup Train [23][2120/3239]	Time 0.469 (0.516)	Data 0.001 (0.012)	Loss 4.3820 (4.3536)	Top-1 acc 23.828 (24.397)	Top-5 acc 47.656 (46.612)	lr 0.01983
Warmup Train [23][2130/3239]	Time 0.623 (0.515)	Data 0.001 (0.012)	Loss 4.1963 (4.3532)	Top-1 acc 26.172 (24.402)	Top-5 acc 51.172 (46.619)	lr 0.01982
Warmup Train [23][2140/3239]	Time 0.538 (0.515)	Data 0.001 (0.012)	Loss 4.1591 (4.3532)	Top-1 acc 26.172 (24.402)	Top-5 acc 50.781 (46.617)	lr 0.01981
Warmup Train [23][2150/3239]	Time 0.506 (0.515)	Data 0.001 (0.012)	Loss 4.3200 (4.3531)	Top-1 acc 25.391 (24.412)	Top-5 acc 44.141 (46.618)	lr 0.01981
Warmup Train [23][2160/3239]	Time 0.364 (0.515)	Data 0.001 (0.012)	Loss 4.5217 (4.3532)	Top-1 acc 19.531 (24.410)	Top-5 acc 41.797 (46.618)	lr 0.01980
Warmup Train [23][2170/3239]	Time 0.340 (0.515)	Data 0.001 (0.012)	Loss 4.3619 (4.3533)	Top-1 acc 20.703 (24.410)	Top-5 acc 45.312 (46.617)	lr 0.01980
Warmup Train [23][2180/3239]	Time 0.331 (0.515)	Data 0.001 (0.012)	Loss 4.1729 (4.3533)	Top-1 acc 25.391 (24.406)	Top-5 acc 49.609 (46.616)	lr 0.01979
Warmup Train [23][2190/3239]	Time 0.366 (0.515)	Data 0.001 (0.012)	Loss 4.3777 (4.3536)	Top-1 acc 26.172 (24.398)	Top-5 acc 47.266 (46.611)	lr 0.01978
Warmup Train [23][2200/3239]	Time 0.464 (0.515)	Data 0.001 (0.012)	Loss 4.5755 (4.3538)	Top-1 acc 20.703 (24.396)	Top-5 acc 38.672 (46.604)	lr 0.01978
Warmup Train [23][2210/3239]	Time 0.313 (0.515)	Data 0.001 (0.012)	Loss 4.3402 (4.3539)	Top-1 acc 25.781 (24.395)	Top-5 acc 48.047 (46.600)	lr 0.01977
Warmup Train [23][2220/3239]	Time 0.648 (0.515)	Data 0.001 (0.012)	Loss 4.3148 (4.3535)	Top-1 acc 25.391 (24.403)	Top-5 acc 44.141 (46.606)	lr 0.01977
Warmup Train [23][2230/3239]	Time 0.434 (0.515)	Data 0.001 (0.012)	Loss 4.3797 (4.3533)	Top-1 acc 23.828 (24.404)	Top-5 acc 44.141 (46.612)	lr 0.01976
Warmup Train [23][2240/3239]	Time 0.531 (0.515)	Data 0.002 (0.012)	Loss 4.4468 (4.3531)	Top-1 acc 21.094 (24.408)	Top-5 acc 46.875 (46.617)	lr 0.01975
Warmup Train [23][2250/3239]	Time 0.614 (0.515)	Data 0.001 (0.012)	Loss 4.4214 (4.3531)	Top-1 acc 25.391 (24.409)	Top-5 acc 45.312 (46.618)	lr 0.01975
Warmup Train [23][2260/3239]	Time 0.383 (0.515)	Data 0.001 (0.012)	Loss 4.2992 (4.3530)	Top-1 acc 24.219 (24.412)	Top-5 acc 51.172 (46.619)	lr 0.01974
Warmup Train [23][2270/3239]	Time 0.585 (0.515)	Data 0.001 (0.012)	Loss 4.2030 (4.3530)	Top-1 acc 25.781 (24.415)	Top-5 acc 48.438 (46.616)	lr 0.01974
Warmup Train [23][2280/3239]	Time 0.673 (0.515)	Data 0.001 (0.012)	Loss 4.4340 (4.3530)	Top-1 acc 17.578 (24.415)	Top-5 acc 44.531 (46.617)	lr 0.01973
Warmup Train [23][2290/3239]	Time 0.576 (0.515)	Data 0.001 (0.012)	Loss 4.3816 (4.3529)	Top-1 acc 24.219 (24.415)	Top-5 acc 48.438 (46.622)	lr 0.01973
Warmup Train [23][2300/3239]	Time 0.526 (0.515)	Data 0.001 (0.012)	Loss 4.4232 (4.3528)	Top-1 acc 21.484 (24.416)	Top-5 acc 42.969 (46.627)	lr 0.01972
Warmup Train [23][2310/3239]	Time 0.384 (0.515)	Data 0.001 (0.012)	Loss 4.4183 (4.3528)	Top-1 acc 20.312 (24.417)	Top-5 acc 46.875 (46.627)	lr 0.01971
Warmup Train [23][2320/3239]	Time 0.500 (0.515)	Data 0.001 (0.012)	Loss 4.2162 (4.3528)	Top-1 acc 25.000 (24.417)	Top-5 acc 44.922 (46.621)	lr 0.01971
Warmup Train [23][2330/3239]	Time 0.420 (0.515)	Data 0.001 (0.012)	Loss 4.2689 (4.3527)	Top-1 acc 24.609 (24.417)	Top-5 acc 48.438 (46.621)	lr 0.01970
Warmup Train [23][2340/3239]	Time 0.465 (0.515)	Data 0.001 (0.012)	Loss 4.2872 (4.3528)	Top-1 acc 25.000 (24.416)	Top-5 acc 49.609 (46.617)	lr 0.01970
Warmup Train [23][2350/3239]	Time 0.614 (0.515)	Data 0.001 (0.012)	Loss 4.2254 (4.3529)	Top-1 acc 23.828 (24.416)	Top-5 acc 47.656 (46.613)	lr 0.01969
Warmup Train [23][2360/3239]	Time 0.513 (0.515)	Data 0.001 (0.012)	Loss 4.3073 (4.3529)	Top-1 acc 29.297 (24.418)	Top-5 acc 47.266 (46.617)	lr 0.01968
Warmup Train [23][2370/3239]	Time 0.210 (0.514)	Data 0.001 (0.012)	Loss 4.3056 (4.3531)	Top-1 acc 25.391 (24.410)	Top-5 acc 44.922 (46.611)	lr 0.01968
Warmup Train [23][2380/3239]	Time 0.711 (0.514)	Data 0.002 (0.012)	Loss 4.1959 (4.3529)	Top-1 acc 29.297 (24.413)	Top-5 acc 50.000 (46.616)	lr 0.01967
Warmup Train [23][2390/3239]	Time 0.475 (0.514)	Data 0.001 (0.012)	Loss 4.2359 (4.3528)	Top-1 acc 28.516 (24.412)	Top-5 acc 49.609 (46.617)	lr 0.01967
Warmup Train [23][2400/3239]	Time 0.350 (0.514)	Data 0.001 (0.012)	Loss 4.3603 (4.3525)	Top-1 acc 22.266 (24.415)	Top-5 acc 43.750 (46.623)	lr 0.01966
Warmup Train [23][2410/3239]	Time 0.476 (0.514)	Data 0.001 (0.012)	Loss 4.3334 (4.3524)	Top-1 acc 24.219 (24.414)	Top-5 acc 47.656 (46.630)	lr 0.01965
Warmup Train [23][2420/3239]	Time 0.327 (0.514)	Data 0.001 (0.012)	Loss 4.3124 (4.3523)	Top-1 acc 24.609 (24.418)	Top-5 acc 44.531 (46.632)	lr 0.01965
Warmup Train [23][2430/3239]	Time 0.533 (0.514)	Data 0.001 (0.012)	Loss 4.2741 (4.3523)	Top-1 acc 23.828 (24.411)	Top-5 acc 49.609 (46.628)	lr 0.01964
Warmup Train [23][2440/3239]	Time 0.745 (0.514)	Data 0.001 (0.012)	Loss 4.4001 (4.3522)	Top-1 acc 25.391 (24.413)	Top-5 acc 45.703 (46.628)	lr 0.01964
Warmup Train [23][2450/3239]	Time 0.552 (0.514)	Data 0.001 (0.012)	Loss 4.3877 (4.3523)	Top-1 acc 23.438 (24.414)	Top-5 acc 45.312 (46.624)	lr 0.01963
Warmup Train [23][2460/3239]	Time 0.300 (0.514)	Data 0.001 (0.011)	Loss 4.2397 (4.3520)	Top-1 acc 28.516 (24.419)	Top-5 acc 47.266 (46.630)	lr 0.01962
Warmup Train [23][2470/3239]	Time 0.494 (0.514)	Data 0.001 (0.011)	Loss 4.3835 (4.3521)	Top-1 acc 25.391 (24.420)	Top-5 acc 46.094 (46.628)	lr 0.01962
Warmup Train [23][2480/3239]	Time 0.363 (0.514)	Data 0.001 (0.011)	Loss 4.3425 (4.3519)	Top-1 acc 21.484 (24.419)	Top-5 acc 44.922 (46.633)	lr 0.01961
Warmup Train [23][2490/3239]	Time 0.437 (0.514)	Data 0.001 (0.011)	Loss 4.3886 (4.3520)	Top-1 acc 22.656 (24.420)	Top-5 acc 47.266 (46.634)	lr 0.01961
Warmup Train [23][2500/3239]	Time 0.533 (0.514)	Data 0.001 (0.011)	Loss 4.1655 (4.3519)	Top-1 acc 30.078 (24.420)	Top-5 acc 52.734 (46.641)	lr 0.01960
Warmup Train [23][2510/3239]	Time 0.543 (0.514)	Data 0.001 (0.011)	Loss 4.3986 (4.3519)	Top-1 acc 19.141 (24.419)	Top-5 acc 48.047 (46.645)	lr 0.01959
Warmup Train [23][2520/3239]	Time 0.475 (0.514)	Data 0.001 (0.011)	Loss 4.3074 (4.3519)	Top-1 acc 22.656 (24.417)	Top-5 acc 49.219 (46.648)	lr 0.01959
Warmup Train [23][2530/3239]	Time 0.452 (0.514)	Data 0.001 (0.011)	Loss 4.3807 (4.3520)	Top-1 acc 21.094 (24.415)	Top-5 acc 49.219 (46.648)	lr 0.01958
Warmup Train [23][2540/3239]	Time 0.579 (0.514)	Data 0.001 (0.011)	Loss 4.0931 (4.3517)	Top-1 acc 29.688 (24.424)	Top-5 acc 55.859 (46.654)	lr 0.01958
Warmup Train [23][2550/3239]	Time 0.436 (0.514)	Data 0.001 (0.011)	Loss 4.4073 (4.3519)	Top-1 acc 22.656 (24.418)	Top-5 acc 43.750 (46.647)	lr 0.01957
Warmup Train [23][2560/3239]	Time 0.632 (0.514)	Data 0.001 (0.011)	Loss 4.3169 (4.3518)	Top-1 acc 28.125 (24.423)	Top-5 acc 49.609 (46.647)	lr 0.01957
Warmup Train [23][2570/3239]	Time 0.341 (0.514)	Data 0.001 (0.011)	Loss 4.4985 (4.3517)	Top-1 acc 17.578 (24.424)	Top-5 acc 42.188 (46.649)	lr 0.01956
Warmup Train [23][2580/3239]	Time 0.509 (0.514)	Data 0.001 (0.011)	Loss 4.4529 (4.3516)	Top-1 acc 21.875 (24.427)	Top-5 acc 41.016 (46.654)	lr 0.01955
Warmup Train [23][2590/3239]	Time 0.462 (0.514)	Data 0.001 (0.011)	Loss 4.3794 (4.3515)	Top-1 acc 26.172 (24.431)	Top-5 acc 45.312 (46.657)	lr 0.01955
Warmup Train [23][2600/3239]	Time 0.526 (0.514)	Data 0.030 (0.011)	Loss 4.3481 (4.3516)	Top-1 acc 24.609 (24.427)	Top-5 acc 50.000 (46.657)	lr 0.01954
Warmup Train [23][2610/3239]	Time 0.573 (0.514)	Data 0.001 (0.011)	Loss 4.4095 (4.3516)	Top-1 acc 22.266 (24.424)	Top-5 acc 45.703 (46.656)	lr 0.01954
Warmup Train [23][2620/3239]	Time 0.603 (0.514)	Data 0.001 (0.011)	Loss 4.5217 (4.3516)	Top-1 acc 23.438 (24.424)	Top-5 acc 39.844 (46.652)	lr 0.01953
Warmup Train [23][2630/3239]	Time 0.370 (0.514)	Data 0.001 (0.011)	Loss 4.2974 (4.3515)	Top-1 acc 24.219 (24.428)	Top-5 acc 45.703 (46.652)	lr 0.01952
Warmup Train [23][2640/3239]	Time 0.432 (0.514)	Data 0.001 (0.011)	Loss 4.2402 (4.3513)	Top-1 acc 27.344 (24.432)	Top-5 acc 50.000 (46.655)	lr 0.01952
Warmup Train [23][2650/3239]	Time 0.594 (0.514)	Data 0.002 (0.011)	Loss 4.2899 (4.3513)	Top-1 acc 26.562 (24.432)	Top-5 acc 50.000 (46.655)	lr 0.01951
Warmup Train [23][2660/3239]	Time 0.599 (0.514)	Data 0.001 (0.011)	Loss 4.3244 (4.3510)	Top-1 acc 25.781 (24.436)	Top-5 acc 45.703 (46.660)	lr 0.01951
Warmup Train [23][2670/3239]	Time 0.581 (0.514)	Data 0.001 (0.011)	Loss 4.1235 (4.3509)	Top-1 acc 30.078 (24.439)	Top-5 acc 51.953 (46.663)	lr 0.01950
Warmup Train [23][2680/3239]	Time 0.512 (0.514)	Data 0.001 (0.011)	Loss 4.4309 (4.3510)	Top-1 acc 23.438 (24.435)	Top-5 acc 43.750 (46.659)	lr 0.01949
Warmup Train [23][2690/3239]	Time 0.522 (0.514)	Data 0.001 (0.011)	Loss 4.4442 (4.3510)	Top-1 acc 23.828 (24.436)	Top-5 acc 46.094 (46.659)	lr 0.01949
Warmup Train [23][2700/3239]	Time 0.683 (0.514)	Data 0.026 (0.011)	Loss 4.1863 (4.3508)	Top-1 acc 26.172 (24.436)	Top-5 acc 50.391 (46.663)	lr 0.01948
Warmup Train [23][2710/3239]	Time 0.534 (0.514)	Data 0.001 (0.011)	Loss 4.4087 (4.3510)	Top-1 acc 21.484 (24.435)	Top-5 acc 45.312 (46.656)	lr 0.01948
Warmup Train [23][2720/3239]	Time 0.506 (0.514)	Data 0.001 (0.011)	Loss 4.3952 (4.3509)	Top-1 acc 23.828 (24.436)	Top-5 acc 47.656 (46.658)	lr 0.01947
Warmup Train [23][2730/3239]	Time 0.589 (0.514)	Data 0.001 (0.011)	Loss 4.2709 (4.3507)	Top-1 acc 25.391 (24.441)	Top-5 acc 50.391 (46.661)	lr 0.01946
Warmup Train [23][2740/3239]	Time 0.461 (0.514)	Data 0.001 (0.011)	Loss 4.4611 (4.3507)	Top-1 acc 19.922 (24.440)	Top-5 acc 44.531 (46.665)	lr 0.01946
Warmup Train [23][2750/3239]	Time 0.510 (0.514)	Data 0.001 (0.011)	Loss 4.3136 (4.3508)	Top-1 acc 21.875 (24.440)	Top-5 acc 50.391 (46.666)	lr 0.01945
Warmup Train [23][2760/3239]	Time 0.468 (0.514)	Data 0.001 (0.011)	Loss 4.4698 (4.3507)	Top-1 acc 21.484 (24.442)	Top-5 acc 43.750 (46.668)	lr 0.01945
Warmup Train [23][2770/3239]	Time 0.736 (0.514)	Data 0.001 (0.011)	Loss 4.4656 (4.3505)	Top-1 acc 21.094 (24.441)	Top-5 acc 45.312 (46.674)	lr 0.01944
Warmup Train [23][2780/3239]	Time 0.447 (0.514)	Data 0.001 (0.011)	Loss 4.5181 (4.3504)	Top-1 acc 25.391 (24.447)	Top-5 acc 44.531 (46.677)	lr 0.01944
Warmup Train [23][2790/3239]	Time 0.555 (0.514)	Data 0.001 (0.011)	Loss 4.2056 (4.3503)	Top-1 acc 24.219 (24.450)	Top-5 acc 48.438 (46.681)	lr 0.01943
Warmup Train [23][2800/3239]	Time 0.501 (0.514)	Data 0.001 (0.011)	Loss 4.3473 (4.3506)	Top-1 acc 23.047 (24.444)	Top-5 acc 47.656 (46.672)	lr 0.01942
Warmup Train [23][2810/3239]	Time 0.463 (0.514)	Data 0.001 (0.011)	Loss 4.1932 (4.3504)	Top-1 acc 28.125 (24.450)	Top-5 acc 52.734 (46.678)	lr 0.01942
Warmup Train [23][2820/3239]	Time 0.387 (0.514)	Data 0.001 (0.011)	Loss 4.1762 (4.3504)	Top-1 acc 27.344 (24.451)	Top-5 acc 54.688 (46.679)	lr 0.01941
Warmup Train [23][2830/3239]	Time 0.513 (0.514)	Data 0.001 (0.011)	Loss 4.2815 (4.3504)	Top-1 acc 29.688 (24.453)	Top-5 acc 51.562 (46.681)	lr 0.01941
Warmup Train [23][2840/3239]	Time 0.553 (0.514)	Data 0.001 (0.011)	Loss 4.4665 (4.3507)	Top-1 acc 24.219 (24.449)	Top-5 acc 43.750 (46.671)	lr 0.01940
Warmup Train [23][2850/3239]	Time 0.405 (0.514)	Data 0.001 (0.011)	Loss 4.1216 (4.3506)	Top-1 acc 27.734 (24.451)	Top-5 acc 51.172 (46.673)	lr 0.01939
Warmup Train [23][2860/3239]	Time 0.575 (0.514)	Data 0.001 (0.011)	Loss 4.1219 (4.3503)	Top-1 acc 28.125 (24.458)	Top-5 acc 49.219 (46.676)	lr 0.01939
Warmup Train [23][2870/3239]	Time 0.433 (0.514)	Data 0.001 (0.011)	Loss 4.2127 (4.3504)	Top-1 acc 25.781 (24.456)	Top-5 acc 48.828 (46.672)	lr 0.01938
Warmup Train [23][2880/3239]	Time 0.339 (0.514)	Data 0.001 (0.011)	Loss 4.3775 (4.3503)	Top-1 acc 25.000 (24.458)	Top-5 acc 46.094 (46.677)	lr 0.01938
Warmup Train [23][2890/3239]	Time 0.519 (0.514)	Data 0.001 (0.011)	Loss 4.2493 (4.3502)	Top-1 acc 25.000 (24.462)	Top-5 acc 48.047 (46.678)	lr 0.01937
Warmup Train [23][2900/3239]	Time 0.534 (0.514)	Data 0.001 (0.011)	Loss 4.3049 (4.3503)	Top-1 acc 25.391 (24.461)	Top-5 acc 51.562 (46.681)	lr 0.01936
Warmup Train [23][2910/3239]	Time 0.369 (0.514)	Data 0.001 (0.011)	Loss 4.5179 (4.3502)	Top-1 acc 22.656 (24.466)	Top-5 acc 43.359 (46.681)	lr 0.01936
Warmup Train [23][2920/3239]	Time 0.381 (0.513)	Data 0.001 (0.011)	Loss 4.4172 (4.3502)	Top-1 acc 24.219 (24.466)	Top-5 acc 45.703 (46.681)	lr 0.01935
Warmup Train [23][2930/3239]	Time 0.439 (0.513)	Data 0.001 (0.011)	Loss 4.5242 (4.3500)	Top-1 acc 23.828 (24.469)	Top-5 acc 39.844 (46.686)	lr 0.01935
Warmup Train [23][2940/3239]	Time 0.356 (0.513)	Data 0.001 (0.011)	Loss 4.2227 (4.3498)	Top-1 acc 26.953 (24.471)	Top-5 acc 51.953 (46.692)	lr 0.01934
Warmup Train [23][2950/3239]	Time 0.566 (0.513)	Data 0.001 (0.011)	Loss 4.2394 (4.3496)	Top-1 acc 26.172 (24.474)	Top-5 acc 51.172 (46.700)	lr 0.01933
Warmup Train [23][2960/3239]	Time 0.417 (0.514)	Data 0.001 (0.011)	Loss 4.1822 (4.3495)	Top-1 acc 28.516 (24.479)	Top-5 acc 50.781 (46.703)	lr 0.01933
Warmup Train [23][2970/3239]	Time 0.477 (0.514)	Data 0.001 (0.011)	Loss 4.3173 (4.3494)	Top-1 acc 21.875 (24.478)	Top-5 acc 42.578 (46.703)	lr 0.01932
Warmup Train [23][2980/3239]	Time 0.640 (0.514)	Data 0.001 (0.011)	Loss 4.4486 (4.3492)	Top-1 acc 23.047 (24.481)	Top-5 acc 49.219 (46.713)	lr 0.01932
Warmup Train [23][2990/3239]	Time 0.574 (0.514)	Data 0.001 (0.011)	Loss 4.3491 (4.3490)	Top-1 acc 23.047 (24.479)	Top-5 acc 46.875 (46.716)	lr 0.01931
Warmup Train [23][3000/3239]	Time 0.524 (0.514)	Data 0.002 (0.011)	Loss 4.1903 (4.3487)	Top-1 acc 28.516 (24.485)	Top-5 acc 48.828 (46.723)	lr 0.01931
Warmup Train [23][3010/3239]	Time 0.536 (0.514)	Data 0.001 (0.011)	Loss 4.3345 (4.3485)	Top-1 acc 28.516 (24.490)	Top-5 acc 48.438 (46.726)	lr 0.01930
Warmup Train [23][3020/3239]	Time 0.693 (0.514)	Data 0.001 (0.011)	Loss 4.4706 (4.3484)	Top-1 acc 24.219 (24.492)	Top-5 acc 44.922 (46.730)	lr 0.01929
Warmup Train [23][3030/3239]	Time 0.653 (0.514)	Data 0.001 (0.011)	Loss 4.2744 (4.3485)	Top-1 acc 27.734 (24.493)	Top-5 acc 46.484 (46.727)	lr 0.01929
Warmup Train [23][3040/3239]	Time 0.409 (0.514)	Data 0.001 (0.011)	Loss 4.3641 (4.3484)	Top-1 acc 25.391 (24.492)	Top-5 acc 48.828 (46.726)	lr 0.01928
Warmup Train [23][3050/3239]	Time 0.596 (0.514)	Data 0.001 (0.011)	Loss 4.3798 (4.3484)	Top-1 acc 21.484 (24.488)	Top-5 acc 48.828 (46.730)	lr 0.01928
Warmup Train [23][3060/3239]	Time 0.677 (0.514)	Data 0.001 (0.011)	Loss 4.1527 (4.3483)	Top-1 acc 26.562 (24.491)	Top-5 acc 47.656 (46.731)	lr 0.01927
Warmup Train [23][3070/3239]	Time 0.337 (0.514)	Data 0.001 (0.011)	Loss 4.2550 (4.3484)	Top-1 acc 26.172 (24.497)	Top-5 acc 50.391 (46.730)	lr 0.01926
Warmup Train [23][3080/3239]	Time 0.467 (0.514)	Data 0.001 (0.011)	Loss 4.3677 (4.3483)	Top-1 acc 25.000 (24.497)	Top-5 acc 47.266 (46.731)	lr 0.01926
Warmup Train [23][3090/3239]	Time 0.483 (0.514)	Data 0.001 (0.011)	Loss 4.3626 (4.3482)	Top-1 acc 21.875 (24.500)	Top-5 acc 46.875 (46.733)	lr 0.01925
Warmup Train [23][3100/3239]	Time 0.613 (0.513)	Data 0.001 (0.011)	Loss 4.3048 (4.3480)	Top-1 acc 25.391 (24.501)	Top-5 acc 49.609 (46.737)	lr 0.01925
Warmup Train [23][3110/3239]	Time 0.538 (0.513)	Data 0.001 (0.011)	Loss 4.2578 (4.3479)	Top-1 acc 27.344 (24.504)	Top-5 acc 48.438 (46.736)	lr 0.01924
Warmup Train [23][3120/3239]	Time 0.461 (0.513)	Data 0.001 (0.011)	Loss 4.3838 (4.3480)	Top-1 acc 21.875 (24.502)	Top-5 acc 43.750 (46.735)	lr 0.01923
Warmup Train [23][3130/3239]	Time 0.627 (0.513)	Data 0.001 (0.010)	Loss 4.4281 (4.3479)	Top-1 acc 21.875 (24.503)	Top-5 acc 43.750 (46.736)	lr 0.01923
Warmup Train [23][3140/3239]	Time 0.536 (0.513)	Data 0.001 (0.010)	Loss 4.3812 (4.3480)	Top-1 acc 21.875 (24.498)	Top-5 acc 46.094 (46.734)	lr 0.01922
Warmup Train [23][3150/3239]	Time 0.619 (0.513)	Data 0.001 (0.010)	Loss 4.4511 (4.3480)	Top-1 acc 25.391 (24.500)	Top-5 acc 44.141 (46.734)	lr 0.01922
Warmup Train [23][3160/3239]	Time 0.733 (0.513)	Data 0.001 (0.010)	Loss 4.0612 (4.3477)	Top-1 acc 30.859 (24.503)	Top-5 acc 56.641 (46.738)	lr 0.01921
Warmup Train [23][3170/3239]	Time 0.606 (0.513)	Data 0.001 (0.010)	Loss 4.2265 (4.3476)	Top-1 acc 26.562 (24.504)	Top-5 acc 49.609 (46.738)	lr 0.01921
Warmup Train [23][3180/3239]	Time 0.449 (0.513)	Data 0.000 (0.010)	Loss 4.4921 (4.3476)	Top-1 acc 21.484 (24.500)	Top-5 acc 41.016 (46.736)	lr 0.01920
Warmup Train [23][3190/3239]	Time 0.501 (0.513)	Data 0.000 (0.010)	Loss 4.3136 (4.3477)	Top-1 acc 23.828 (24.497)	Top-5 acc 49.609 (46.734)	lr 0.01919
Warmup Train [23][3200/3239]	Time 0.641 (0.513)	Data 0.000 (0.010)	Loss 4.1801 (4.3476)	Top-1 acc 28.125 (24.498)	Top-5 acc 50.391 (46.734)	lr 0.01919
Warmup Train [23][3210/3239]	Time 0.334 (0.513)	Data 0.000 (0.010)	Loss 4.3013 (4.3475)	Top-1 acc 28.125 (24.502)	Top-5 acc 46.484 (46.736)	lr 0.01918
Warmup Train [23][3220/3239]	Time 0.401 (0.513)	Data 0.000 (0.010)	Loss 4.4473 (4.3475)	Top-1 acc 21.484 (24.504)	Top-5 acc 41.797 (46.736)	lr 0.01918
Warmup Train [23][3230/3239]	Time 0.483 (0.513)	Data 0.000 (0.010)	Loss 4.2494 (4.3476)	Top-1 acc 26.562 (24.500)	Top-5 acc 47.656 (46.731)	lr 0.01917
Warmup Train [23][3239/3239]	Time 0.286 (0.513)	Data 0.000 (0.010)	Loss 4.1984 (4.3475)	Top-1 acc 25.926 (24.498)	Top-5 acc 49.383 (46.735)	lr 0.01916
==========Warmup Valid [23/40]	loss 3.331	top-1 acc 31.703	top-5 acc 56.294	Train top-1 24.498	top-5 46.735	flops: 442.4M
Warmup Train [24][0/3239]	Time 15.456 (15.456)	Data 13.867 (13.867)	Loss 4.3507 (4.3507)	Top-1 acc 25.781 (25.781)	Top-5 acc 48.047 (48.047)	lr 0.01916
Warmup Train [24][10/3239]	Time 0.698 (1.928)	Data 0.001 (1.266)	Loss 4.2917 (4.2747)	Top-1 acc 25.391 (26.030)	Top-5 acc 45.703 (47.692)	lr 0.01916
Warmup Train [24][20/3239]	Time 0.466 (1.254)	Data 0.001 (0.664)	Loss 4.2755 (4.3037)	Top-1 acc 22.656 (25.465)	Top-5 acc 43.359 (46.726)	lr 0.01915
Warmup Train [24][30/3239]	Time 0.514 (1.010)	Data 0.001 (0.451)	Loss 4.2442 (4.2969)	Top-1 acc 23.438 (25.328)	Top-5 acc 51.953 (47.127)	lr 0.01915
Warmup Train [24][40/3239]	Time 0.567 (0.888)	Data 0.001 (0.341)	Loss 4.3450 (4.2948)	Top-1 acc 25.000 (25.600)	Top-5 acc 48.047 (47.599)	lr 0.01914
Warmup Train [24][50/3239]	Time 0.694 (0.814)	Data 0.001 (0.275)	Loss 4.2786 (4.3057)	Top-1 acc 25.000 (25.506)	Top-5 acc 48.047 (47.350)	lr 0.01913
Warmup Train [24][60/3239]	Time 0.707 (0.766)	Data 0.001 (0.230)	Loss 4.4175 (4.3103)	Top-1 acc 23.828 (25.224)	Top-5 acc 46.875 (47.246)	lr 0.01913
Warmup Train [24][70/3239]	Time 0.358 (0.728)	Data 0.001 (0.198)	Loss 4.4843 (4.3103)	Top-1 acc 19.922 (25.253)	Top-5 acc 42.188 (47.315)	lr 0.01912
Warmup Train [24][80/3239]	Time 0.526 (0.704)	Data 0.001 (0.176)	Loss 4.3374 (4.3104)	Top-1 acc 26.953 (25.227)	Top-5 acc 47.656 (47.352)	lr 0.01912
Warmup Train [24][90/3239]	Time 0.589 (0.686)	Data 0.001 (0.157)	Loss 4.3206 (4.3035)	Top-1 acc 25.391 (25.245)	Top-5 acc 50.391 (47.549)	lr 0.01911
Warmup Train [24][100/3239]	Time 0.628 (0.668)	Data 0.001 (0.141)	Loss 4.3126 (4.3093)	Top-1 acc 24.219 (25.166)	Top-5 acc 50.391 (47.486)	lr 0.01910
Warmup Train [24][110/3239]	Time 0.511 (0.651)	Data 0.001 (0.129)	Loss 4.3368 (4.3121)	Top-1 acc 22.266 (25.032)	Top-5 acc 48.828 (47.515)	lr 0.01910
Warmup Train [24][120/3239]	Time 0.496 (0.640)	Data 0.001 (0.119)	Loss 4.2323 (4.3145)	Top-1 acc 27.344 (25.023)	Top-5 acc 49.219 (47.404)	lr 0.01909
Warmup Train [24][130/3239]	Time 0.398 (0.631)	Data 0.029 (0.111)	Loss 4.3504 (4.3133)	Top-1 acc 25.781 (25.128)	Top-5 acc 46.094 (47.400)	lr 0.01909
Warmup Train [24][140/3239]	Time 0.651 (0.623)	Data 0.001 (0.103)	Loss 4.1663 (4.3109)	Top-1 acc 30.859 (25.205)	Top-5 acc 50.000 (47.462)	lr 0.01908
Warmup Train [24][150/3239]	Time 0.429 (0.615)	Data 0.001 (0.097)	Loss 4.2601 (4.3105)	Top-1 acc 24.609 (25.178)	Top-5 acc 46.094 (47.444)	lr 0.01908
Warmup Train [24][160/3239]	Time 0.444 (0.607)	Data 0.001 (0.091)	Loss 4.2405 (4.3111)	Top-1 acc 25.781 (25.209)	Top-5 acc 47.266 (47.494)	lr 0.01907
Warmup Train [24][170/3239]	Time 0.490 (0.600)	Data 0.002 (0.087)	Loss 4.5983 (4.3126)	Top-1 acc 20.312 (25.206)	Top-5 acc 40.625 (47.442)	lr 0.01906
Warmup Train [24][180/3239]	Time 0.325 (0.594)	Data 0.001 (0.082)	Loss 4.1011 (4.3141)	Top-1 acc 31.250 (25.220)	Top-5 acc 52.344 (47.430)	lr 0.01906
Warmup Train [24][190/3239]	Time 0.571 (0.590)	Data 0.001 (0.079)	Loss 4.3459 (4.3121)	Top-1 acc 27.344 (25.223)	Top-5 acc 50.781 (47.513)	lr 0.01905
Warmup Train [24][200/3239]	Time 0.410 (0.585)	Data 0.001 (0.075)	Loss 4.4474 (4.3128)	Top-1 acc 26.562 (25.183)	Top-5 acc 43.750 (47.501)	lr 0.01905
Warmup Train [24][210/3239]	Time 0.640 (0.582)	Data 0.001 (0.072)	Loss 4.2678 (4.3125)	Top-1 acc 28.516 (25.193)	Top-5 acc 49.219 (47.482)	lr 0.01904
Warmup Train [24][220/3239]	Time 0.449 (0.578)	Data 0.001 (0.069)	Loss 4.4559 (4.3144)	Top-1 acc 19.531 (25.122)	Top-5 acc 42.578 (47.418)	lr 0.01903
Warmup Train [24][230/3239]	Time 0.542 (0.575)	Data 0.001 (0.066)	Loss 4.5431 (4.3174)	Top-1 acc 20.312 (25.108)	Top-5 acc 41.016 (47.328)	lr 0.01903
Warmup Train [24][240/3239]	Time 0.502 (0.573)	Data 0.001 (0.063)	Loss 4.2493 (4.3164)	Top-1 acc 25.391 (25.115)	Top-5 acc 48.828 (47.350)	lr 0.01902
Warmup Train [24][250/3239]	Time 0.497 (0.571)	Data 0.001 (0.061)	Loss 4.2957 (4.3176)	Top-1 acc 27.344 (25.104)	Top-5 acc 48.438 (47.303)	lr 0.01902
Warmup Train [24][260/3239]	Time 0.487 (0.569)	Data 0.001 (0.059)	Loss 4.3005 (4.3189)	Top-1 acc 24.219 (25.094)	Top-5 acc 48.828 (47.264)	lr 0.01901
Warmup Train [24][270/3239]	Time 0.587 (0.567)	Data 0.001 (0.057)	Loss 4.4001 (4.3182)	Top-1 acc 26.953 (25.123)	Top-5 acc 45.703 (47.312)	lr 0.01900
Warmup Train [24][280/3239]	Time 0.448 (0.565)	Data 0.001 (0.055)	Loss 4.3642 (4.3164)	Top-1 acc 27.734 (25.147)	Top-5 acc 43.359 (47.338)	lr 0.01900
Warmup Train [24][290/3239]	Time 0.445 (0.563)	Data 0.001 (0.054)	Loss 4.3552 (4.3149)	Top-1 acc 29.297 (25.176)	Top-5 acc 42.969 (47.380)	lr 0.01899
Warmup Train [24][300/3239]	Time 0.378 (0.561)	Data 0.001 (0.052)	Loss 4.3438 (4.3156)	Top-1 acc 26.172 (25.174)	Top-5 acc 46.484 (47.332)	lr 0.01899
Warmup Train [24][310/3239]	Time 0.519 (0.560)	Data 0.001 (0.051)	Loss 4.2950 (4.3139)	Top-1 acc 26.172 (25.166)	Top-5 acc 44.531 (47.335)	lr 0.01898
Warmup Train [24][320/3239]	Time 0.473 (0.559)	Data 0.001 (0.050)	Loss 4.2384 (4.3135)	Top-1 acc 26.562 (25.173)	Top-5 acc 48.047 (47.373)	lr 0.01898
Warmup Train [24][330/3239]	Time 0.594 (0.558)	Data 0.001 (0.048)	Loss 4.2772 (4.3125)	Top-1 acc 26.562 (25.173)	Top-5 acc 43.359 (47.404)	lr 0.01897
Warmup Train [24][340/3239]	Time 0.599 (0.556)	Data 0.001 (0.047)	Loss 4.3288 (4.3124)	Top-1 acc 23.828 (25.117)	Top-5 acc 48.047 (47.373)	lr 0.01896
Warmup Train [24][350/3239]	Time 0.516 (0.555)	Data 0.001 (0.046)	Loss 4.2579 (4.3115)	Top-1 acc 26.953 (25.140)	Top-5 acc 50.781 (47.410)	lr 0.01896
Warmup Train [24][360/3239]	Time 0.484 (0.554)	Data 0.001 (0.044)	Loss 4.4264 (4.3122)	Top-1 acc 24.609 (25.110)	Top-5 acc 43.359 (47.391)	lr 0.01895
Warmup Train [24][370/3239]	Time 0.517 (0.553)	Data 0.001 (0.044)	Loss 4.2970 (4.3120)	Top-1 acc 25.391 (25.137)	Top-5 acc 51.953 (47.414)	lr 0.01895
Warmup Train [24][380/3239]	Time 0.556 (0.552)	Data 0.001 (0.042)	Loss 4.2088 (4.3129)	Top-1 acc 27.734 (25.140)	Top-5 acc 47.656 (47.410)	lr 0.01894
Warmup Train [24][390/3239]	Time 0.474 (0.550)	Data 0.001 (0.041)	Loss 4.3984 (4.3139)	Top-1 acc 21.484 (25.092)	Top-5 acc 47.266 (47.397)	lr 0.01893
Warmup Train [24][400/3239]	Time 0.587 (0.549)	Data 0.001 (0.040)	Loss 4.1659 (4.3154)	Top-1 acc 26.172 (25.094)	Top-5 acc 51.953 (47.391)	lr 0.01893
Warmup Train [24][410/3239]	Time 0.436 (0.547)	Data 0.001 (0.040)	Loss 4.2765 (4.3150)	Top-1 acc 25.000 (25.088)	Top-5 acc 47.656 (47.406)	lr 0.01892
Warmup Train [24][420/3239]	Time 0.469 (0.545)	Data 0.001 (0.039)	Loss 4.3699 (4.3147)	Top-1 acc 23.438 (25.073)	Top-5 acc 47.656 (47.396)	lr 0.01892
Warmup Train [24][430/3239]	Time 0.518 (0.544)	Data 0.001 (0.038)	Loss 4.4519 (4.3162)	Top-1 acc 23.828 (25.062)	Top-5 acc 44.922 (47.384)	lr 0.01891
Warmup Train [24][440/3239]	Time 0.626 (0.544)	Data 0.001 (0.037)	Loss 4.1775 (4.3168)	Top-1 acc 30.469 (25.051)	Top-5 acc 55.469 (47.383)	lr 0.01890
Warmup Train [24][450/3239]	Time 0.394 (0.543)	Data 0.001 (0.037)	Loss 4.5166 (4.3165)	Top-1 acc 21.484 (25.055)	Top-5 acc 43.359 (47.386)	lr 0.01890
Warmup Train [24][460/3239]	Time 0.526 (0.543)	Data 0.001 (0.036)	Loss 4.4056 (4.3155)	Top-1 acc 20.312 (25.070)	Top-5 acc 45.312 (47.398)	lr 0.01889
Warmup Train [24][470/3239]	Time 0.363 (0.542)	Data 0.001 (0.035)	Loss 4.4424 (4.3162)	Top-1 acc 20.703 (25.075)	Top-5 acc 43.750 (47.398)	lr 0.01889
Warmup Train [24][480/3239]	Time 0.412 (0.541)	Data 0.001 (0.035)	Loss 4.3147 (4.3150)	Top-1 acc 23.438 (25.099)	Top-5 acc 48.828 (47.446)	lr 0.01888
Warmup Train [24][490/3239]	Time 0.539 (0.541)	Data 0.001 (0.034)	Loss 4.3030 (4.3143)	Top-1 acc 26.172 (25.107)	Top-5 acc 48.828 (47.453)	lr 0.01888
Warmup Train [24][500/3239]	Time 0.505 (0.540)	Data 0.001 (0.034)	Loss 4.3720 (4.3141)	Top-1 acc 23.047 (25.097)	Top-5 acc 47.656 (47.468)	lr 0.01887
Warmup Train [24][510/3239]	Time 0.371 (0.539)	Data 0.001 (0.033)	Loss 4.1713 (4.3141)	Top-1 acc 23.438 (25.086)	Top-5 acc 49.219 (47.442)	lr 0.01886
Warmup Train [24][520/3239]	Time 0.375 (0.539)	Data 0.001 (0.033)	Loss 4.3384 (4.3142)	Top-1 acc 25.391 (25.088)	Top-5 acc 44.922 (47.433)	lr 0.01886
Warmup Train [24][530/3239]	Time 0.435 (0.539)	Data 0.001 (0.033)	Loss 4.1583 (4.3135)	Top-1 acc 31.250 (25.090)	Top-5 acc 53.125 (47.438)	lr 0.01885
Warmup Train [24][540/3239]	Time 0.495 (0.539)	Data 0.001 (0.032)	Loss 4.1597 (4.3133)	Top-1 acc 27.734 (25.103)	Top-5 acc 50.391 (47.459)	lr 0.01885
Warmup Train [24][550/3239]	Time 0.545 (0.538)	Data 0.001 (0.032)	Loss 4.3467 (4.3145)	Top-1 acc 25.781 (25.091)	Top-5 acc 47.266 (47.428)	lr 0.01884
Warmup Train [24][560/3239]	Time 0.543 (0.538)	Data 0.001 (0.031)	Loss 4.2033 (4.3144)	Top-1 acc 26.953 (25.086)	Top-5 acc 50.000 (47.421)	lr 0.01883
Warmup Train [24][570/3239]	Time 0.499 (0.538)	Data 0.002 (0.031)	Loss 4.2874 (4.3142)	Top-1 acc 22.656 (25.077)	Top-5 acc 49.609 (47.417)	lr 0.01883
Warmup Train [24][580/3239]	Time 0.499 (0.537)	Data 0.001 (0.030)	Loss 4.2210 (4.3151)	Top-1 acc 30.859 (25.069)	Top-5 acc 50.781 (47.403)	lr 0.01882
Warmup Train [24][590/3239]	Time 0.511 (0.537)	Data 0.001 (0.030)	Loss 4.1552 (4.3141)	Top-1 acc 28.906 (25.096)	Top-5 acc 50.781 (47.438)	lr 0.01882
Warmup Train [24][600/3239]	Time 0.477 (0.536)	Data 0.001 (0.029)	Loss 4.4083 (4.3139)	Top-1 acc 21.484 (25.084)	Top-5 acc 46.875 (47.440)	lr 0.01881
Warmup Train [24][610/3239]	Time 0.569 (0.536)	Data 0.001 (0.029)	Loss 4.4587 (4.3131)	Top-1 acc 21.094 (25.091)	Top-5 acc 45.312 (47.472)	lr 0.01881
Warmup Train [24][620/3239]	Time 0.631 (0.535)	Data 0.001 (0.029)	Loss 4.3621 (4.3130)	Top-1 acc 26.562 (25.107)	Top-5 acc 46.094 (47.474)	lr 0.01880
Warmup Train [24][630/3239]	Time 0.514 (0.535)	Data 0.001 (0.028)	Loss 4.2624 (4.3127)	Top-1 acc 26.562 (25.111)	Top-5 acc 47.656 (47.475)	lr 0.01879
Warmup Train [24][640/3239]	Time 0.594 (0.534)	Data 0.001 (0.028)	Loss 4.3416 (4.3133)	Top-1 acc 25.000 (25.099)	Top-5 acc 46.875 (47.461)	lr 0.01879
Warmup Train [24][650/3239]	Time 0.481 (0.533)	Data 0.001 (0.027)	Loss 4.2236 (4.3128)	Top-1 acc 25.000 (25.100)	Top-5 acc 49.219 (47.462)	lr 0.01878
Warmup Train [24][660/3239]	Time 0.691 (0.532)	Data 0.001 (0.027)	Loss 4.3806 (4.3134)	Top-1 acc 26.562 (25.095)	Top-5 acc 47.656 (47.436)	lr 0.01878
Warmup Train [24][670/3239]	Time 0.450 (0.532)	Data 0.001 (0.027)	Loss 4.4052 (4.3127)	Top-1 acc 21.484 (25.099)	Top-5 acc 46.484 (47.436)	lr 0.01877
Warmup Train [24][680/3239]	Time 0.552 (0.532)	Data 0.001 (0.027)	Loss 4.3573 (4.3125)	Top-1 acc 24.219 (25.089)	Top-5 acc 45.703 (47.445)	lr 0.01876
Warmup Train [24][690/3239]	Time 0.552 (0.532)	Data 0.001 (0.026)	Loss 4.3151 (4.3135)	Top-1 acc 26.953 (25.084)	Top-5 acc 50.000 (47.430)	lr 0.01876
Warmup Train [24][700/3239]	Time 0.514 (0.531)	Data 0.001 (0.026)	Loss 4.3361 (4.3138)	Top-1 acc 25.781 (25.091)	Top-5 acc 45.703 (47.438)	lr 0.01875
Warmup Train [24][710/3239]	Time 0.673 (0.531)	Data 0.001 (0.026)	Loss 4.3816 (4.3141)	Top-1 acc 23.828 (25.086)	Top-5 acc 48.047 (47.445)	lr 0.01875
Warmup Train [24][720/3239]	Time 0.553 (0.531)	Data 0.001 (0.025)	Loss 4.4133 (4.3143)	Top-1 acc 23.828 (25.076)	Top-5 acc 46.094 (47.445)	lr 0.01874
Warmup Train [24][730/3239]	Time 0.686 (0.531)	Data 0.001 (0.025)	Loss 4.5290 (4.3154)	Top-1 acc 21.484 (25.060)	Top-5 acc 44.922 (47.418)	lr 0.01873
Warmup Train [24][740/3239]	Time 0.544 (0.530)	Data 0.001 (0.025)	Loss 4.4685 (4.3164)	Top-1 acc 22.656 (25.051)	Top-5 acc 45.703 (47.397)	lr 0.01873
Warmup Train [24][750/3239]	Time 0.382 (0.530)	Data 0.002 (0.025)	Loss 4.2468 (4.3156)	Top-1 acc 26.172 (25.060)	Top-5 acc 48.828 (47.411)	lr 0.01872
Warmup Train [24][760/3239]	Time 0.543 (0.530)	Data 0.001 (0.024)	Loss 4.3511 (4.3162)	Top-1 acc 28.125 (25.063)	Top-5 acc 48.047 (47.404)	lr 0.01872
Warmup Train [24][770/3239]	Time 0.577 (0.530)	Data 0.001 (0.024)	Loss 4.3829 (4.3162)	Top-1 acc 24.609 (25.077)	Top-5 acc 45.312 (47.401)	lr 0.01871
Warmup Train [24][780/3239]	Time 0.590 (0.530)	Data 0.001 (0.024)	Loss 4.3359 (4.3166)	Top-1 acc 24.219 (25.082)	Top-5 acc 46.484 (47.394)	lr 0.01871
Warmup Train [24][790/3239]	Time 0.513 (0.530)	Data 0.001 (0.024)	Loss 4.2126 (4.3159)	Top-1 acc 28.906 (25.094)	Top-5 acc 54.688 (47.418)	lr 0.01870
Warmup Train [24][800/3239]	Time 0.566 (0.529)	Data 0.001 (0.023)	Loss 4.3800 (4.3160)	Top-1 acc 25.781 (25.114)	Top-5 acc 45.703 (47.426)	lr 0.01869
Warmup Train [24][810/3239]	Time 0.429 (0.529)	Data 0.001 (0.023)	Loss 4.3472 (4.3164)	Top-1 acc 24.609 (25.101)	Top-5 acc 44.531 (47.414)	lr 0.01869
Warmup Train [24][820/3239]	Time 0.665 (0.529)	Data 0.001 (0.023)	Loss 4.1874 (4.3161)	Top-1 acc 28.125 (25.124)	Top-5 acc 49.609 (47.417)	lr 0.01868
Warmup Train [24][830/3239]	Time 0.572 (0.529)	Data 0.001 (0.023)	Loss 4.2179 (4.3155)	Top-1 acc 26.953 (25.133)	Top-5 acc 48.828 (47.429)	lr 0.01868
Warmup Train [24][840/3239]	Time 0.550 (0.529)	Data 0.001 (0.023)	Loss 4.2923 (4.3148)	Top-1 acc 26.562 (25.153)	Top-5 acc 46.484 (47.441)	lr 0.01867
Warmup Train [24][850/3239]	Time 0.546 (0.529)	Data 0.001 (0.022)	Loss 4.2586 (4.3148)	Top-1 acc 27.734 (25.165)	Top-5 acc 51.562 (47.455)	lr 0.01866
Warmup Train [24][860/3239]	Time 0.430 (0.528)	Data 0.001 (0.022)	Loss 4.3437 (4.3147)	Top-1 acc 23.047 (25.162)	Top-5 acc 45.312 (47.465)	lr 0.01866
Warmup Train [24][870/3239]	Time 0.492 (0.528)	Data 0.001 (0.022)	Loss 4.1567 (4.3145)	Top-1 acc 28.906 (25.169)	Top-5 acc 50.000 (47.461)	lr 0.01865
Warmup Train [24][880/3239]	Time 0.396 (0.527)	Data 0.001 (0.022)	Loss 4.3877 (4.3142)	Top-1 acc 24.219 (25.168)	Top-5 acc 43.750 (47.466)	lr 0.01865
Warmup Train [24][890/3239]	Time 0.563 (0.527)	Data 0.001 (0.021)	Loss 4.1217 (4.3136)	Top-1 acc 26.172 (25.190)	Top-5 acc 51.172 (47.473)	lr 0.01864
Warmup Train [24][900/3239]	Time 0.320 (0.526)	Data 0.001 (0.021)	Loss 4.5429 (4.3142)	Top-1 acc 23.047 (25.157)	Top-5 acc 42.969 (47.452)	lr 0.01863
Warmup Train [24][910/3239]	Time 0.610 (0.526)	Data 0.001 (0.021)	Loss 4.2214 (4.3139)	Top-1 acc 26.172 (25.167)	Top-5 acc 49.219 (47.462)	lr 0.01863
Warmup Train [24][920/3239]	Time 0.369 (0.526)	Data 0.001 (0.021)	Loss 4.4903 (4.3138)	Top-1 acc 21.094 (25.162)	Top-5 acc 41.016 (47.473)	lr 0.01862
Warmup Train [24][930/3239]	Time 0.619 (0.526)	Data 0.001 (0.021)	Loss 4.4141 (4.3144)	Top-1 acc 24.219 (25.148)	Top-5 acc 48.047 (47.458)	lr 0.01862
Warmup Train [24][940/3239]	Time 0.558 (0.526)	Data 0.001 (0.021)	Loss 4.4647 (4.3137)	Top-1 acc 21.484 (25.161)	Top-5 acc 41.797 (47.474)	lr 0.01861
Warmup Train [24][950/3239]	Time 0.492 (0.526)	Data 0.001 (0.020)	Loss 4.2799 (4.3138)	Top-1 acc 26.953 (25.163)	Top-5 acc 48.047 (47.459)	lr 0.01861
Warmup Train [24][960/3239]	Time 0.547 (0.525)	Data 0.001 (0.020)	Loss 4.1616 (4.3136)	Top-1 acc 26.562 (25.157)	Top-5 acc 51.562 (47.469)	lr 0.01860
Warmup Train [24][970/3239]	Time 0.378 (0.525)	Data 0.001 (0.020)	Loss 4.0785 (4.3134)	Top-1 acc 32.422 (25.167)	Top-5 acc 54.688 (47.475)	lr 0.01859
Warmup Train [24][980/3239]	Time 0.565 (0.525)	Data 0.001 (0.020)	Loss 4.3482 (4.3133)	Top-1 acc 24.219 (25.162)	Top-5 acc 45.703 (47.474)	lr 0.01859
Warmup Train [24][990/3239]	Time 0.452 (0.525)	Data 0.001 (0.020)	Loss 4.2833 (4.3130)	Top-1 acc 26.562 (25.160)	Top-5 acc 47.266 (47.475)	lr 0.01858
Warmup Train [24][1000/3239]	Time 0.696 (0.525)	Data 0.001 (0.020)	Loss 4.3220 (4.3132)	Top-1 acc 26.953 (25.169)	Top-5 acc 46.875 (47.475)	lr 0.01858
Warmup Train [24][1010/3239]	Time 0.557 (0.525)	Data 0.001 (0.020)	Loss 4.2160 (4.3132)	Top-1 acc 28.516 (25.168)	Top-5 acc 50.391 (47.479)	lr 0.01857
Warmup Train [24][1020/3239]	Time 0.460 (0.525)	Data 0.001 (0.019)	Loss 4.2892 (4.3130)	Top-1 acc 25.391 (25.177)	Top-5 acc 51.562 (47.491)	lr 0.01856
Warmup Train [24][1030/3239]	Time 0.610 (0.525)	Data 0.001 (0.019)	Loss 4.3502 (4.3129)	Top-1 acc 23.438 (25.178)	Top-5 acc 46.094 (47.486)	lr 0.01856
Warmup Train [24][1040/3239]	Time 0.635 (0.525)	Data 0.001 (0.019)	Loss 4.3905 (4.3130)	Top-1 acc 22.266 (25.176)	Top-5 acc 47.656 (47.477)	lr 0.01855
Warmup Train [24][1050/3239]	Time 0.422 (0.524)	Data 0.001 (0.019)	Loss 4.2903 (4.3128)	Top-1 acc 21.875 (25.172)	Top-5 acc 48.828 (47.489)	lr 0.01855
Warmup Train [24][1060/3239]	Time 0.601 (0.524)	Data 0.001 (0.019)	Loss 4.2754 (4.3127)	Top-1 acc 28.906 (25.172)	Top-5 acc 51.562 (47.491)	lr 0.01854
Warmup Train [24][1070/3239]	Time 0.670 (0.525)	Data 0.001 (0.019)	Loss 4.2402 (4.3120)	Top-1 acc 26.172 (25.179)	Top-5 acc 48.828 (47.506)	lr 0.01854
Warmup Train [24][1080/3239]	Time 0.496 (0.525)	Data 0.001 (0.019)	Loss 4.1749 (4.3118)	Top-1 acc 28.516 (25.179)	Top-5 acc 50.781 (47.510)	lr 0.01853
Warmup Train [24][1090/3239]	Time 0.494 (0.524)	Data 0.001 (0.019)	Loss 4.4718 (4.3120)	Top-1 acc 23.047 (25.173)	Top-5 acc 44.922 (47.505)	lr 0.01852
Warmup Train [24][1100/3239]	Time 0.466 (0.524)	Data 0.001 (0.018)	Loss 4.6079 (4.3119)	Top-1 acc 21.875 (25.177)	Top-5 acc 39.062 (47.509)	lr 0.01852
Warmup Train [24][1110/3239]	Time 0.592 (0.524)	Data 0.003 (0.018)	Loss 4.3348 (4.3112)	Top-1 acc 24.609 (25.189)	Top-5 acc 49.219 (47.522)	lr 0.01851
Warmup Train [24][1120/3239]	Time 0.494 (0.524)	Data 0.001 (0.018)	Loss 4.2609 (4.3113)	Top-1 acc 25.000 (25.197)	Top-5 acc 47.266 (47.523)	lr 0.01851
Warmup Train [24][1130/3239]	Time 0.667 (0.523)	Data 0.001 (0.018)	Loss 4.2945 (4.3111)	Top-1 acc 24.609 (25.207)	Top-5 acc 47.656 (47.529)	lr 0.01850
Warmup Train [24][1140/3239]	Time 0.394 (0.523)	Data 0.001 (0.018)	Loss 4.2541 (4.3111)	Top-1 acc 25.000 (25.214)	Top-5 acc 53.125 (47.529)	lr 0.01849
Warmup Train [24][1150/3239]	Time 0.456 (0.522)	Data 0.001 (0.018)	Loss 4.3810 (4.3115)	Top-1 acc 22.656 (25.212)	Top-5 acc 43.750 (47.521)	lr 0.01849
Warmup Train [24][1160/3239]	Time 0.425 (0.523)	Data 0.001 (0.018)	Loss 4.3248 (4.3112)	Top-1 acc 23.828 (25.207)	Top-5 acc 44.531 (47.530)	lr 0.01848
Warmup Train [24][1170/3239]	Time 0.388 (0.522)	Data 0.001 (0.018)	Loss 4.1732 (4.3110)	Top-1 acc 26.953 (25.207)	Top-5 acc 51.562 (47.538)	lr 0.01848
Warmup Train [24][1180/3239]	Time 0.507 (0.522)	Data 0.001 (0.018)	Loss 4.2019 (4.3107)	Top-1 acc 25.000 (25.211)	Top-5 acc 47.266 (47.546)	lr 0.01847
Warmup Train [24][1190/3239]	Time 0.510 (0.522)	Data 0.027 (0.018)	Loss 4.3333 (4.3107)	Top-1 acc 21.484 (25.219)	Top-5 acc 49.219 (47.549)	lr 0.01847
Warmup Train [24][1200/3239]	Time 0.409 (0.522)	Data 0.001 (0.018)	Loss 4.2659 (4.3111)	Top-1 acc 26.953 (25.213)	Top-5 acc 47.656 (47.544)	lr 0.01846
Warmup Train [24][1210/3239]	Time 0.468 (0.522)	Data 0.001 (0.018)	Loss 4.3861 (4.3115)	Top-1 acc 23.047 (25.202)	Top-5 acc 43.359 (47.535)	lr 0.01845
Warmup Train [24][1220/3239]	Time 0.424 (0.522)	Data 0.001 (0.017)	Loss 4.4638 (4.3117)	Top-1 acc 19.531 (25.196)	Top-5 acc 40.625 (47.534)	lr 0.01845
Warmup Train [24][1230/3239]	Time 0.567 (0.522)	Data 0.001 (0.017)	Loss 4.3940 (4.3118)	Top-1 acc 22.656 (25.185)	Top-5 acc 44.141 (47.531)	lr 0.01844
Warmup Train [24][1240/3239]	Time 0.499 (0.522)	Data 0.001 (0.017)	Loss 4.1757 (4.3117)	Top-1 acc 26.953 (25.187)	Top-5 acc 50.391 (47.532)	lr 0.01844
Warmup Train [24][1250/3239]	Time 0.377 (0.522)	Data 0.001 (0.017)	Loss 4.3785 (4.3118)	Top-1 acc 26.172 (25.185)	Top-5 acc 46.875 (47.538)	lr 0.01843
Warmup Train [24][1260/3239]	Time 0.604 (0.522)	Data 0.001 (0.017)	Loss 4.4340 (4.3119)	Top-1 acc 22.656 (25.180)	Top-5 acc 43.750 (47.534)	lr 0.01842
Warmup Train [24][1270/3239]	Time 0.474 (0.522)	Data 0.001 (0.017)	Loss 4.4064 (4.3115)	Top-1 acc 19.531 (25.173)	Top-5 acc 42.188 (47.541)	lr 0.01842
Warmup Train [24][1280/3239]	Time 0.630 (0.521)	Data 0.001 (0.017)	Loss 4.2510 (4.3118)	Top-1 acc 28.516 (25.177)	Top-5 acc 52.344 (47.543)	lr 0.01841
Warmup Train [24][1290/3239]	Time 0.618 (0.521)	Data 0.001 (0.017)	Loss 4.3693 (4.3117)	Top-1 acc 23.828 (25.184)	Top-5 acc 46.875 (47.545)	lr 0.01841
Warmup Train [24][1300/3239]	Time 0.592 (0.521)	Data 0.001 (0.017)	Loss 4.5554 (4.3121)	Top-1 acc 23.438 (25.178)	Top-5 acc 40.234 (47.528)	lr 0.01840
Warmup Train [24][1310/3239]	Time 0.494 (0.521)	Data 0.001 (0.017)	Loss 4.2568 (4.3125)	Top-1 acc 25.000 (25.167)	Top-5 acc 50.000 (47.526)	lr 0.01839
Warmup Train [24][1320/3239]	Time 0.663 (0.521)	Data 0.001 (0.017)	Loss 4.3153 (4.3120)	Top-1 acc 28.125 (25.180)	Top-5 acc 48.047 (47.544)	lr 0.01839
Warmup Train [24][1330/3239]	Time 0.504 (0.521)	Data 0.001 (0.016)	Loss 4.3572 (4.3118)	Top-1 acc 29.297 (25.193)	Top-5 acc 47.656 (47.552)	lr 0.01838
Warmup Train [24][1340/3239]	Time 0.493 (0.521)	Data 0.001 (0.016)	Loss 4.5461 (4.3115)	Top-1 acc 21.875 (25.209)	Top-5 acc 39.062 (47.563)	lr 0.01838
Warmup Train [24][1350/3239]	Time 0.634 (0.521)	Data 0.001 (0.016)	Loss 4.2196 (4.3112)	Top-1 acc 26.172 (25.219)	Top-5 acc 50.781 (47.567)	lr 0.01837
Warmup Train [24][1360/3239]	Time 0.488 (0.521)	Data 0.001 (0.016)	Loss 4.2310 (4.3108)	Top-1 acc 26.562 (25.230)	Top-5 acc 49.219 (47.575)	lr 0.01837
Warmup Train [24][1370/3239]	Time 0.443 (0.520)	Data 0.001 (0.016)	Loss 4.1466 (4.3108)	Top-1 acc 24.609 (25.218)	Top-5 acc 49.219 (47.580)	lr 0.01836
Warmup Train [24][1380/3239]	Time 0.576 (0.520)	Data 0.001 (0.016)	Loss 4.3586 (4.3111)	Top-1 acc 22.656 (25.207)	Top-5 acc 46.484 (47.569)	lr 0.01835
Warmup Train [24][1390/3239]	Time 0.552 (0.520)	Data 0.001 (0.016)	Loss 4.3958 (4.3117)	Top-1 acc 23.047 (25.202)	Top-5 acc 44.141 (47.558)	lr 0.01835
Warmup Train [24][1400/3239]	Time 0.722 (0.520)	Data 0.001 (0.016)	Loss 4.4241 (4.3123)	Top-1 acc 22.656 (25.189)	Top-5 acc 44.141 (47.544)	lr 0.01834
Warmup Train [24][1410/3239]	Time 0.512 (0.520)	Data 0.001 (0.016)	Loss 4.3137 (4.3122)	Top-1 acc 23.828 (25.192)	Top-5 acc 47.266 (47.544)	lr 0.01834
Warmup Train [24][1420/3239]	Time 0.583 (0.520)	Data 0.001 (0.016)	Loss 4.2432 (4.3119)	Top-1 acc 26.953 (25.208)	Top-5 acc 50.391 (47.548)	lr 0.01833
Warmup Train [24][1430/3239]	Time 0.487 (0.520)	Data 0.001 (0.016)	Loss 4.2947 (4.3116)	Top-1 acc 25.781 (25.210)	Top-5 acc 46.094 (47.552)	lr 0.01832
Warmup Train [24][1440/3239]	Time 0.594 (0.520)	Data 0.001 (0.016)	Loss 4.2317 (4.3115)	Top-1 acc 26.953 (25.208)	Top-5 acc 51.172 (47.556)	lr 0.01832
Warmup Train [24][1450/3239]	Time 0.469 (0.520)	Data 0.001 (0.016)	Loss 4.1855 (4.3111)	Top-1 acc 30.078 (25.216)	Top-5 acc 50.391 (47.570)	lr 0.01831
Warmup Train [24][1460/3239]	Time 0.498 (0.520)	Data 0.001 (0.015)	Loss 4.1691 (4.3110)	Top-1 acc 32.031 (25.220)	Top-5 acc 50.781 (47.578)	lr 0.01831
Warmup Train [24][1470/3239]	Time 0.523 (0.520)	Data 0.001 (0.015)	Loss 4.4578 (4.3115)	Top-1 acc 23.438 (25.214)	Top-5 acc 47.266 (47.578)	lr 0.01830
Warmup Train [24][1480/3239]	Time 0.408 (0.520)	Data 0.001 (0.015)	Loss 4.2258 (4.3115)	Top-1 acc 24.609 (25.211)	Top-5 acc 49.219 (47.580)	lr 0.01830
Warmup Train [24][1490/3239]	Time 0.631 (0.520)	Data 0.001 (0.015)	Loss 4.3003 (4.3115)	Top-1 acc 29.688 (25.214)	Top-5 acc 50.391 (47.584)	lr 0.01829
Warmup Train [24][1500/3239]	Time 0.515 (0.520)	Data 0.001 (0.015)	Loss 4.3672 (4.3119)	Top-1 acc 22.656 (25.210)	Top-5 acc 48.828 (47.576)	lr 0.01828
Warmup Train [24][1510/3239]	Time 0.436 (0.520)	Data 0.001 (0.015)	Loss 4.2927 (4.3118)	Top-1 acc 25.781 (25.211)	Top-5 acc 49.609 (47.578)	lr 0.01828
Warmup Train [24][1520/3239]	Time 0.634 (0.520)	Data 0.001 (0.015)	Loss 4.2933 (4.3114)	Top-1 acc 25.781 (25.219)	Top-5 acc 47.656 (47.585)	lr 0.01827
Warmup Train [24][1530/3239]	Time 0.588 (0.520)	Data 0.001 (0.015)	Loss 4.3786 (4.3115)	Top-1 acc 25.781 (25.215)	Top-5 acc 48.047 (47.579)	lr 0.01827
Warmup Train [24][1540/3239]	Time 0.486 (0.520)	Data 0.001 (0.015)	Loss 4.4624 (4.3121)	Top-1 acc 22.266 (25.201)	Top-5 acc 48.438 (47.567)	lr 0.01826
Warmup Train [24][1550/3239]	Time 0.470 (0.520)	Data 0.001 (0.015)	Loss 4.1992 (4.3120)	Top-1 acc 24.609 (25.204)	Top-5 acc 51.953 (47.569)	lr 0.01825
Warmup Train [24][1560/3239]	Time 0.545 (0.520)	Data 0.001 (0.015)	Loss 4.2718 (4.3119)	Top-1 acc 25.000 (25.205)	Top-5 acc 48.047 (47.573)	lr 0.01825
Warmup Train [24][1570/3239]	Time 0.575 (0.520)	Data 0.001 (0.015)	Loss 4.0600 (4.3113)	Top-1 acc 28.906 (25.206)	Top-5 acc 54.297 (47.582)	lr 0.01824
Warmup Train [24][1580/3239]	Time 0.421 (0.519)	Data 0.001 (0.015)	Loss 4.4513 (4.3112)	Top-1 acc 22.266 (25.209)	Top-5 acc 44.141 (47.580)	lr 0.01824
Warmup Train [24][1590/3239]	Time 0.269 (0.519)	Data 0.001 (0.015)	Loss 4.3252 (4.3111)	Top-1 acc 24.219 (25.207)	Top-5 acc 46.484 (47.583)	lr 0.01823
Warmup Train [24][1600/3239]	Time 0.487 (0.520)	Data 0.001 (0.015)	Loss 4.3147 (4.3109)	Top-1 acc 23.438 (25.212)	Top-5 acc 45.703 (47.585)	lr 0.01823
Warmup Train [24][1610/3239]	Time 0.512 (0.519)	Data 0.001 (0.015)	Loss 4.4630 (4.3112)	Top-1 acc 25.000 (25.206)	Top-5 acc 47.656 (47.577)	lr 0.01822
Warmup Train [24][1620/3239]	Time 0.592 (0.519)	Data 0.001 (0.015)	Loss 4.4424 (4.3110)	Top-1 acc 22.266 (25.204)	Top-5 acc 43.359 (47.581)	lr 0.01821
Warmup Train [24][1630/3239]	Time 0.634 (0.519)	Data 0.001 (0.015)	Loss 4.1392 (4.3108)	Top-1 acc 27.734 (25.205)	Top-5 acc 50.781 (47.583)	lr 0.01821
Warmup Train [24][1640/3239]	Time 0.474 (0.519)	Data 0.001 (0.014)	Loss 4.4870 (4.3108)	Top-1 acc 21.875 (25.210)	Top-5 acc 42.188 (47.584)	lr 0.01820
Warmup Train [24][1650/3239]	Time 0.520 (0.519)	Data 0.001 (0.014)	Loss 4.3032 (4.3104)	Top-1 acc 24.609 (25.218)	Top-5 acc 45.703 (47.592)	lr 0.01820
Warmup Train [24][1660/3239]	Time 0.395 (0.519)	Data 0.001 (0.014)	Loss 4.3470 (4.3104)	Top-1 acc 29.688 (25.223)	Top-5 acc 48.438 (47.595)	lr 0.01819
Warmup Train [24][1670/3239]	Time 0.517 (0.519)	Data 0.001 (0.014)	Loss 4.2304 (4.3102)	Top-1 acc 23.828 (25.220)	Top-5 acc 50.781 (47.596)	lr 0.01818
Warmup Train [24][1680/3239]	Time 0.397 (0.519)	Data 0.001 (0.014)	Loss 4.1826 (4.3101)	Top-1 acc 25.781 (25.224)	Top-5 acc 51.953 (47.600)	lr 0.01818
Warmup Train [24][1690/3239]	Time 0.580 (0.519)	Data 0.001 (0.014)	Loss 4.2701 (4.3103)	Top-1 acc 23.047 (25.217)	Top-5 acc 48.047 (47.596)	lr 0.01817
Warmup Train [24][1700/3239]	Time 0.566 (0.519)	Data 0.001 (0.014)	Loss 4.3731 (4.3103)	Top-1 acc 25.781 (25.210)	Top-5 acc 51.562 (47.597)	lr 0.01817
Warmup Train [24][1710/3239]	Time 0.616 (0.519)	Data 0.001 (0.014)	Loss 4.0361 (4.3097)	Top-1 acc 29.688 (25.218)	Top-5 acc 51.953 (47.612)	lr 0.01816
Warmup Train [24][1720/3239]	Time 0.578 (0.519)	Data 0.001 (0.014)	Loss 4.1268 (4.3096)	Top-1 acc 24.609 (25.221)	Top-5 acc 51.172 (47.613)	lr 0.01816
Warmup Train [24][1730/3239]	Time 0.369 (0.519)	Data 0.001 (0.014)	Loss 4.4946 (4.3096)	Top-1 acc 21.094 (25.224)	Top-5 acc 44.141 (47.618)	lr 0.01815
Warmup Train [24][1740/3239]	Time 0.604 (0.519)	Data 0.001 (0.014)	Loss 4.3643 (4.3099)	Top-1 acc 22.266 (25.218)	Top-5 acc 44.141 (47.610)	lr 0.01814
Warmup Train [24][1750/3239]	Time 0.481 (0.519)	Data 0.001 (0.014)	Loss 4.3320 (4.3100)	Top-1 acc 22.266 (25.216)	Top-5 acc 48.828 (47.612)	lr 0.01814
Warmup Train [24][1760/3239]	Time 0.486 (0.519)	Data 0.001 (0.014)	Loss 4.4494 (4.3099)	Top-1 acc 22.266 (25.217)	Top-5 acc 41.406 (47.617)	lr 0.01813
Warmup Train [24][1770/3239]	Time 0.494 (0.519)	Data 0.001 (0.014)	Loss 4.3394 (4.3097)	Top-1 acc 26.172 (25.220)	Top-5 acc 46.484 (47.628)	lr 0.01813
Warmup Train [24][1780/3239]	Time 0.369 (0.519)	Data 0.001 (0.014)	Loss 4.3310 (4.3097)	Top-1 acc 25.781 (25.222)	Top-5 acc 47.266 (47.630)	lr 0.01812
Warmup Train [24][1790/3239]	Time 0.433 (0.519)	Data 0.001 (0.014)	Loss 4.5061 (4.3100)	Top-1 acc 19.531 (25.217)	Top-5 acc 41.016 (47.625)	lr 0.01811
Warmup Train [24][1800/3239]	Time 0.521 (0.519)	Data 0.001 (0.014)	Loss 4.2159 (4.3097)	Top-1 acc 25.391 (25.221)	Top-5 acc 46.094 (47.635)	lr 0.01811
Warmup Train [24][1810/3239]	Time 0.740 (0.519)	Data 0.001 (0.014)	Loss 4.4307 (4.3099)	Top-1 acc 24.219 (25.220)	Top-5 acc 42.188 (47.631)	lr 0.01810
Warmup Train [24][1820/3239]	Time 0.539 (0.519)	Data 0.001 (0.014)	Loss 4.2238 (4.3100)	Top-1 acc 24.609 (25.222)	Top-5 acc 50.391 (47.629)	lr 0.01810
Warmup Train [24][1830/3239]	Time 0.330 (0.519)	Data 0.001 (0.014)	Loss 4.4181 (4.3098)	Top-1 acc 23.438 (25.226)	Top-5 acc 43.359 (47.628)	lr 0.01809
Warmup Train [24][1840/3239]	Time 0.440 (0.519)	Data 0.001 (0.014)	Loss 4.3448 (4.3099)	Top-1 acc 24.609 (25.224)	Top-5 acc 45.703 (47.626)	lr 0.01809
Warmup Train [24][1850/3239]	Time 0.360 (0.519)	Data 0.001 (0.014)	Loss 4.2430 (4.3097)	Top-1 acc 23.438 (25.225)	Top-5 acc 49.219 (47.635)	lr 0.01808
Warmup Train [24][1860/3239]	Time 0.500 (0.519)	Data 0.001 (0.014)	Loss 4.4885 (4.3098)	Top-1 acc 21.094 (25.220)	Top-5 acc 44.141 (47.630)	lr 0.01807
Warmup Train [24][1870/3239]	Time 0.717 (0.518)	Data 0.001 (0.014)	Loss 4.2577 (4.3097)	Top-1 acc 25.000 (25.219)	Top-5 acc 45.312 (47.630)	lr 0.01807
Warmup Train [24][1880/3239]	Time 0.349 (0.518)	Data 0.001 (0.013)	Loss 4.4992 (4.3096)	Top-1 acc 23.438 (25.217)	Top-5 acc 43.359 (47.637)	lr 0.01806
Warmup Train [24][1890/3239]	Time 0.406 (0.518)	Data 0.001 (0.013)	Loss 4.2930 (4.3097)	Top-1 acc 25.781 (25.217)	Top-5 acc 47.656 (47.638)	lr 0.01806
Warmup Train [24][1900/3239]	Time 0.574 (0.518)	Data 0.001 (0.013)	Loss 4.4160 (4.3097)	Top-1 acc 22.266 (25.220)	Top-5 acc 44.922 (47.642)	lr 0.01805
Warmup Train [24][1910/3239]	Time 0.579 (0.518)	Data 0.001 (0.013)	Loss 4.1896 (4.3099)	Top-1 acc 27.344 (25.219)	Top-5 acc 49.609 (47.638)	lr 0.01805
Warmup Train [24][1920/3239]	Time 0.616 (0.518)	Data 0.001 (0.013)	Loss 4.2430 (4.3100)	Top-1 acc 24.609 (25.215)	Top-5 acc 47.266 (47.632)	lr 0.01804
Warmup Train [24][1930/3239]	Time 0.639 (0.518)	Data 0.001 (0.013)	Loss 4.3903 (4.3100)	Top-1 acc 25.391 (25.217)	Top-5 acc 46.875 (47.630)	lr 0.01803
Warmup Train [24][1940/3239]	Time 0.658 (0.518)	Data 0.001 (0.013)	Loss 4.2650 (4.3103)	Top-1 acc 22.266 (25.206)	Top-5 acc 46.484 (47.626)	lr 0.01803
Warmup Train [24][1950/3239]	Time 0.659 (0.518)	Data 0.001 (0.013)	Loss 4.2496 (4.3103)	Top-1 acc 25.000 (25.210)	Top-5 acc 48.438 (47.624)	lr 0.01802
Warmup Train [24][1960/3239]	Time 0.413 (0.518)	Data 0.001 (0.013)	Loss 4.1564 (4.3099)	Top-1 acc 26.562 (25.218)	Top-5 acc 51.562 (47.635)	lr 0.01802
Warmup Train [24][1970/3239]	Time 0.369 (0.518)	Data 0.001 (0.013)	Loss 4.0944 (4.3099)	Top-1 acc 28.906 (25.221)	Top-5 acc 52.734 (47.630)	lr 0.01801
Warmup Train [24][1980/3239]	Time 0.529 (0.518)	Data 0.001 (0.013)	Loss 4.2393 (4.3100)	Top-1 acc 27.344 (25.218)	Top-5 acc 49.609 (47.629)	lr 0.01800
Warmup Train [24][1990/3239]	Time 0.594 (0.518)	Data 0.001 (0.013)	Loss 4.2198 (4.3098)	Top-1 acc 25.781 (25.220)	Top-5 acc 46.484 (47.630)	lr 0.01800
Warmup Train [24][2000/3239]	Time 0.541 (0.518)	Data 0.001 (0.013)	Loss 4.4315 (4.3098)	Top-1 acc 21.484 (25.214)	Top-5 acc 41.797 (47.631)	lr 0.01799
Warmup Train [24][2010/3239]	Time 0.614 (0.519)	Data 0.001 (0.013)	Loss 4.2607 (4.3096)	Top-1 acc 23.438 (25.214)	Top-5 acc 49.219 (47.634)	lr 0.01799
Warmup Train [24][2020/3239]	Time 0.567 (0.519)	Data 0.001 (0.013)	Loss 4.3673 (4.3095)	Top-1 acc 23.438 (25.216)	Top-5 acc 48.438 (47.639)	lr 0.01798
Warmup Train [24][2030/3239]	Time 0.480 (0.519)	Data 0.001 (0.013)	Loss 4.2398 (4.3095)	Top-1 acc 26.953 (25.219)	Top-5 acc 50.781 (47.639)	lr 0.01798
Warmup Train [24][2040/3239]	Time 0.487 (0.518)	Data 0.001 (0.013)	Loss 4.5612 (4.3095)	Top-1 acc 19.922 (25.217)	Top-5 acc 41.406 (47.638)	lr 0.01797
Warmup Train [24][2050/3239]	Time 0.518 (0.518)	Data 0.001 (0.013)	Loss 4.3443 (4.3094)	Top-1 acc 25.000 (25.219)	Top-5 acc 47.656 (47.639)	lr 0.01796
Warmup Train [24][2060/3239]	Time 0.457 (0.518)	Data 0.001 (0.013)	Loss 4.1522 (4.3093)	Top-1 acc 27.734 (25.223)	Top-5 acc 51.172 (47.632)	lr 0.01796
Warmup Train [24][2070/3239]	Time 0.306 (0.518)	Data 0.001 (0.013)	Loss 4.3502 (4.3090)	Top-1 acc 25.391 (25.227)	Top-5 acc 48.438 (47.642)	lr 0.01795
Warmup Train [24][2080/3239]	Time 0.631 (0.518)	Data 0.001 (0.013)	Loss 4.3206 (4.3091)	Top-1 acc 26.562 (25.226)	Top-5 acc 47.266 (47.639)	lr 0.01795
Warmup Train [24][2090/3239]	Time 0.576 (0.518)	Data 0.001 (0.013)	Loss 4.4961 (4.3091)	Top-1 acc 19.141 (25.223)	Top-5 acc 42.969 (47.638)	lr 0.01794
Warmup Train [24][2100/3239]	Time 0.488 (0.518)	Data 0.001 (0.013)	Loss 3.8838 (4.3088)	Top-1 acc 33.984 (25.233)	Top-5 acc 57.812 (47.647)	lr 0.01793
Warmup Train [24][2110/3239]	Time 0.304 (0.518)	Data 0.001 (0.013)	Loss 4.4517 (4.3089)	Top-1 acc 23.828 (25.233)	Top-5 acc 46.484 (47.642)	lr 0.01793
Warmup Train [24][2120/3239]	Time 0.576 (0.518)	Data 0.001 (0.013)	Loss 4.4168 (4.3088)	Top-1 acc 23.047 (25.234)	Top-5 acc 43.359 (47.643)	lr 0.01792
Warmup Train [24][2130/3239]	Time 0.474 (0.518)	Data 0.001 (0.012)	Loss 4.2560 (4.3085)	Top-1 acc 27.734 (25.239)	Top-5 acc 51.562 (47.648)	lr 0.01792
Warmup Train [24][2140/3239]	Time 0.559 (0.518)	Data 0.001 (0.012)	Loss 4.2183 (4.3086)	Top-1 acc 26.172 (25.238)	Top-5 acc 49.219 (47.649)	lr 0.01791
Warmup Train [24][2150/3239]	Time 0.497 (0.518)	Data 0.001 (0.012)	Loss 4.3831 (4.3085)	Top-1 acc 22.656 (25.236)	Top-5 acc 48.828 (47.654)	lr 0.01791
Warmup Train [24][2160/3239]	Time 0.564 (0.518)	Data 0.001 (0.012)	Loss 4.1683 (4.3084)	Top-1 acc 30.078 (25.237)	Top-5 acc 48.438 (47.657)	lr 0.01790
Warmup Train [24][2170/3239]	Time 0.506 (0.518)	Data 0.001 (0.012)	Loss 4.4003 (4.3082)	Top-1 acc 23.828 (25.244)	Top-5 acc 44.141 (47.665)	lr 0.01789
Warmup Train [24][2180/3239]	Time 0.485 (0.518)	Data 0.001 (0.012)	Loss 4.2399 (4.3083)	Top-1 acc 30.078 (25.241)	Top-5 acc 49.609 (47.663)	lr 0.01789
Warmup Train [24][2190/3239]	Time 0.394 (0.518)	Data 0.001 (0.012)	Loss 4.2722 (4.3084)	Top-1 acc 27.344 (25.242)	Top-5 acc 48.438 (47.657)	lr 0.01788
Warmup Train [24][2200/3239]	Time 0.731 (0.518)	Data 0.001 (0.012)	Loss 4.3709 (4.3083)	Top-1 acc 21.875 (25.239)	Top-5 acc 47.266 (47.657)	lr 0.01788
Warmup Train [24][2210/3239]	Time 0.539 (0.518)	Data 0.001 (0.012)	Loss 4.3267 (4.3081)	Top-1 acc 29.688 (25.241)	Top-5 acc 48.047 (47.657)	lr 0.01787
Warmup Train [24][2220/3239]	Time 0.387 (0.518)	Data 0.001 (0.012)	Loss 4.1715 (4.3080)	Top-1 acc 30.078 (25.248)	Top-5 acc 50.391 (47.661)	lr 0.01786
Warmup Train [24][2230/3239]	Time 0.462 (0.518)	Data 0.001 (0.012)	Loss 4.3908 (4.3080)	Top-1 acc 24.219 (25.250)	Top-5 acc 44.922 (47.664)	lr 0.01786
Warmup Train [24][2240/3239]	Time 0.356 (0.518)	Data 0.001 (0.012)	Loss 4.2898 (4.3078)	Top-1 acc 25.000 (25.250)	Top-5 acc 49.609 (47.663)	lr 0.01785
Warmup Train [24][2250/3239]	Time 0.439 (0.518)	Data 0.001 (0.012)	Loss 4.2231 (4.3076)	Top-1 acc 29.688 (25.253)	Top-5 acc 48.828 (47.671)	lr 0.01785
Warmup Train [24][2260/3239]	Time 0.579 (0.518)	Data 0.001 (0.012)	Loss 4.1747 (4.3076)	Top-1 acc 30.078 (25.253)	Top-5 acc 50.391 (47.669)	lr 0.01784
Warmup Train [24][2270/3239]	Time 0.461 (0.518)	Data 0.002 (0.012)	Loss 4.4343 (4.3079)	Top-1 acc 26.562 (25.247)	Top-5 acc 43.750 (47.661)	lr 0.01784
Warmup Train [24][2280/3239]	Time 0.594 (0.518)	Data 0.001 (0.012)	Loss 4.1519 (4.3078)	Top-1 acc 30.859 (25.245)	Top-5 acc 50.781 (47.657)	lr 0.01783
Warmup Train [24][2290/3239]	Time 0.459 (0.518)	Data 0.001 (0.012)	Loss 4.2026 (4.3074)	Top-1 acc 23.828 (25.253)	Top-5 acc 47.656 (47.665)	lr 0.01782
Warmup Train [24][2300/3239]	Time 0.697 (0.518)	Data 0.001 (0.012)	Loss 4.4792 (4.3075)	Top-1 acc 20.312 (25.252)	Top-5 acc 42.969 (47.662)	lr 0.01782
Warmup Train [24][2310/3239]	Time 0.395 (0.518)	Data 0.001 (0.012)	Loss 4.2987 (4.3075)	Top-1 acc 24.609 (25.255)	Top-5 acc 45.703 (47.660)	lr 0.01781
Warmup Train [24][2320/3239]	Time 0.478 (0.518)	Data 0.001 (0.012)	Loss 4.3317 (4.3075)	Top-1 acc 23.047 (25.256)	Top-5 acc 42.969 (47.659)	lr 0.01781
Warmup Train [24][2330/3239]	Time 0.619 (0.518)	Data 0.001 (0.012)	Loss 4.2770 (4.3075)	Top-1 acc 23.438 (25.258)	Top-5 acc 46.094 (47.657)	lr 0.01780
Warmup Train [24][2340/3239]	Time 0.396 (0.517)	Data 0.001 (0.012)	Loss 4.1578 (4.3074)	Top-1 acc 24.609 (25.258)	Top-5 acc 50.781 (47.660)	lr 0.01780
Warmup Train [24][2350/3239]	Time 0.398 (0.517)	Data 0.001 (0.012)	Loss 4.4795 (4.3074)	Top-1 acc 19.531 (25.256)	Top-5 acc 41.797 (47.660)	lr 0.01779
Warmup Train [24][2360/3239]	Time 0.462 (0.517)	Data 0.001 (0.012)	Loss 4.5228 (4.3075)	Top-1 acc 21.875 (25.257)	Top-5 acc 41.406 (47.661)	lr 0.01778
Warmup Train [24][2370/3239]	Time 0.478 (0.517)	Data 0.001 (0.012)	Loss 4.1399 (4.3072)	Top-1 acc 26.562 (25.261)	Top-5 acc 54.297 (47.670)	lr 0.01778
Warmup Train [24][2380/3239]	Time 0.664 (0.517)	Data 0.001 (0.012)	Loss 4.2204 (4.3069)	Top-1 acc 25.000 (25.264)	Top-5 acc 48.438 (47.675)	lr 0.01777
Warmup Train [24][2390/3239]	Time 0.410 (0.517)	Data 0.001 (0.012)	Loss 4.1830 (4.3066)	Top-1 acc 27.734 (25.269)	Top-5 acc 48.047 (47.684)	lr 0.01777
Warmup Train [24][2400/3239]	Time 0.645 (0.517)	Data 0.001 (0.012)	Loss 4.3346 (4.3066)	Top-1 acc 23.828 (25.270)	Top-5 acc 44.531 (47.682)	lr 0.01776
Warmup Train [24][2410/3239]	Time 0.497 (0.517)	Data 0.001 (0.012)	Loss 4.3220 (4.3066)	Top-1 acc 22.656 (25.271)	Top-5 acc 48.828 (47.682)	lr 0.01775
Warmup Train [24][2420/3239]	Time 0.608 (0.517)	Data 0.001 (0.012)	Loss 4.2321 (4.3067)	Top-1 acc 28.125 (25.270)	Top-5 acc 48.438 (47.680)	lr 0.01775
Warmup Train [24][2430/3239]	Time 0.436 (0.517)	Data 0.001 (0.012)	Loss 4.4412 (4.3066)	Top-1 acc 23.047 (25.271)	Top-5 acc 44.922 (47.682)	lr 0.01774
Warmup Train [24][2440/3239]	Time 0.590 (0.517)	Data 0.001 (0.012)	Loss 4.1681 (4.3066)	Top-1 acc 26.562 (25.271)	Top-5 acc 51.562 (47.684)	lr 0.01774
Warmup Train [24][2450/3239]	Time 0.507 (0.517)	Data 0.001 (0.012)	Loss 4.2586 (4.3066)	Top-1 acc 25.000 (25.275)	Top-5 acc 48.438 (47.683)	lr 0.01773
Warmup Train [24][2460/3239]	Time 0.591 (0.517)	Data 0.001 (0.012)	Loss 4.2293 (4.3066)	Top-1 acc 25.000 (25.272)	Top-5 acc 44.922 (47.679)	lr 0.01773
Warmup Train [24][2470/3239]	Time 0.623 (0.517)	Data 0.001 (0.012)	Loss 4.1651 (4.3064)	Top-1 acc 27.734 (25.273)	Top-5 acc 49.609 (47.681)	lr 0.01772
Warmup Train [24][2480/3239]	Time 0.499 (0.517)	Data 0.001 (0.012)	Loss 4.3107 (4.3064)	Top-1 acc 21.875 (25.270)	Top-5 acc 45.703 (47.683)	lr 0.01771
Warmup Train [24][2490/3239]	Time 0.570 (0.517)	Data 0.001 (0.012)	Loss 4.3104 (4.3064)	Top-1 acc 22.656 (25.270)	Top-5 acc 48.828 (47.682)	lr 0.01771
Warmup Train [24][2500/3239]	Time 0.625 (0.517)	Data 0.001 (0.011)	Loss 4.2258 (4.3064)	Top-1 acc 23.828 (25.265)	Top-5 acc 54.297 (47.686)	lr 0.01770
Warmup Train [24][2510/3239]	Time 0.704 (0.517)	Data 0.001 (0.011)	Loss 4.2001 (4.3062)	Top-1 acc 27.344 (25.270)	Top-5 acc 53.906 (47.692)	lr 0.01770
Warmup Train [24][2520/3239]	Time 0.489 (0.517)	Data 0.001 (0.011)	Loss 4.2945 (4.3063)	Top-1 acc 26.562 (25.269)	Top-5 acc 49.609 (47.690)	lr 0.01769
Warmup Train [24][2530/3239]	Time 0.293 (0.517)	Data 0.001 (0.011)	Loss 4.2281 (4.3064)	Top-1 acc 26.172 (25.266)	Top-5 acc 49.609 (47.685)	lr 0.01768
Warmup Train [24][2540/3239]	Time 0.548 (0.517)	Data 0.001 (0.011)	Loss 4.0713 (4.3064)	Top-1 acc 27.344 (25.269)	Top-5 acc 51.953 (47.685)	lr 0.01768
Warmup Train [24][2550/3239]	Time 0.633 (0.517)	Data 0.001 (0.011)	Loss 4.2003 (4.3063)	Top-1 acc 25.391 (25.268)	Top-5 acc 45.703 (47.684)	lr 0.01767
Warmup Train [24][2560/3239]	Time 0.432 (0.517)	Data 0.001 (0.011)	Loss 4.4468 (4.3062)	Top-1 acc 23.438 (25.268)	Top-5 acc 40.234 (47.684)	lr 0.01767
Warmup Train [24][2570/3239]	Time 0.478 (0.517)	Data 0.001 (0.011)	Loss 4.3211 (4.3062)	Top-1 acc 24.219 (25.270)	Top-5 acc 43.359 (47.686)	lr 0.01766
Warmup Train [24][2580/3239]	Time 0.366 (0.517)	Data 0.001 (0.011)	Loss 4.1833 (4.3062)	Top-1 acc 29.297 (25.272)	Top-5 acc 52.344 (47.686)	lr 0.01766
Warmup Train [24][2590/3239]	Time 0.495 (0.516)	Data 0.001 (0.011)	Loss 4.6089 (4.3062)	Top-1 acc 19.922 (25.272)	Top-5 acc 45.312 (47.690)	lr 0.01765
Warmup Train [24][2600/3239]	Time 0.607 (0.516)	Data 0.001 (0.011)	Loss 4.0572 (4.3059)	Top-1 acc 28.125 (25.277)	Top-5 acc 54.688 (47.692)	lr 0.01764
Warmup Train [24][2610/3239]	Time 0.551 (0.516)	Data 0.001 (0.011)	Loss 4.3136 (4.3060)	Top-1 acc 23.438 (25.273)	Top-5 acc 48.047 (47.694)	lr 0.01764
Warmup Train [24][2620/3239]	Time 0.498 (0.516)	Data 0.001 (0.011)	Loss 4.3581 (4.3060)	Top-1 acc 24.219 (25.273)	Top-5 acc 47.266 (47.700)	lr 0.01763
Warmup Train [24][2630/3239]	Time 0.567 (0.516)	Data 0.001 (0.011)	Loss 4.2186 (4.3057)	Top-1 acc 25.000 (25.273)	Top-5 acc 50.000 (47.704)	lr 0.01763
Warmup Train [24][2640/3239]	Time 0.541 (0.516)	Data 0.001 (0.011)	Loss 4.2798 (4.3058)	Top-1 acc 26.562 (25.268)	Top-5 acc 43.750 (47.701)	lr 0.01762
Warmup Train [24][2650/3239]	Time 0.418 (0.516)	Data 0.001 (0.011)	Loss 4.4062 (4.3060)	Top-1 acc 26.562 (25.271)	Top-5 acc 47.656 (47.698)	lr 0.01762
Warmup Train [24][2660/3239]	Time 0.489 (0.516)	Data 0.001 (0.011)	Loss 4.0764 (4.3058)	Top-1 acc 32.422 (25.279)	Top-5 acc 55.078 (47.706)	lr 0.01761
Warmup Train [24][2670/3239]	Time 0.668 (0.516)	Data 0.001 (0.011)	Loss 4.2113 (4.3057)	Top-1 acc 25.000 (25.279)	Top-5 acc 50.000 (47.709)	lr 0.01760
Warmup Train [24][2680/3239]	Time 0.500 (0.516)	Data 0.001 (0.011)	Loss 4.2394 (4.3057)	Top-1 acc 27.734 (25.280)	Top-5 acc 50.391 (47.712)	lr 0.01760
Warmup Train [24][2690/3239]	Time 0.461 (0.516)	Data 0.001 (0.011)	Loss 4.5000 (4.3057)	Top-1 acc 19.922 (25.280)	Top-5 acc 40.234 (47.712)	lr 0.01759
Warmup Train [24][2700/3239]	Time 0.490 (0.516)	Data 0.001 (0.011)	Loss 4.3603 (4.3059)	Top-1 acc 22.656 (25.280)	Top-5 acc 46.484 (47.709)	lr 0.01759
Warmup Train [24][2710/3239]	Time 0.499 (0.516)	Data 0.001 (0.011)	Loss 4.1616 (4.3054)	Top-1 acc 27.344 (25.288)	Top-5 acc 50.781 (47.724)	lr 0.01758
Warmup Train [24][2720/3239]	Time 0.598 (0.516)	Data 0.001 (0.011)	Loss 4.2466 (4.3053)	Top-1 acc 20.703 (25.283)	Top-5 acc 44.531 (47.722)	lr 0.01757
Warmup Train [24][2730/3239]	Time 0.385 (0.516)	Data 0.001 (0.011)	Loss 4.2227 (4.3052)	Top-1 acc 30.469 (25.289)	Top-5 acc 48.828 (47.725)	lr 0.01757
Warmup Train [24][2740/3239]	Time 0.574 (0.516)	Data 0.001 (0.011)	Loss 4.3256 (4.3052)	Top-1 acc 21.484 (25.286)	Top-5 acc 46.484 (47.727)	lr 0.01756
Warmup Train [24][2750/3239]	Time 0.588 (0.516)	Data 0.001 (0.011)	Loss 4.2097 (4.3050)	Top-1 acc 26.172 (25.292)	Top-5 acc 49.609 (47.733)	lr 0.01756
Warmup Train [24][2760/3239]	Time 0.537 (0.516)	Data 0.001 (0.011)	Loss 4.3686 (4.3053)	Top-1 acc 23.828 (25.287)	Top-5 acc 46.484 (47.729)	lr 0.01755
Warmup Train [24][2770/3239]	Time 0.370 (0.516)	Data 0.001 (0.011)	Loss 4.4136 (4.3054)	Top-1 acc 24.609 (25.284)	Top-5 acc 43.750 (47.723)	lr 0.01755
Warmup Train [24][2780/3239]	Time 0.412 (0.516)	Data 0.001 (0.011)	Loss 4.1327 (4.3054)	Top-1 acc 25.391 (25.280)	Top-5 acc 51.953 (47.721)	lr 0.01754
Warmup Train [24][2790/3239]	Time 0.603 (0.516)	Data 0.001 (0.011)	Loss 4.3616 (4.3055)	Top-1 acc 26.562 (25.283)	Top-5 acc 46.484 (47.721)	lr 0.01753
Warmup Train [24][2800/3239]	Time 0.389 (0.516)	Data 0.001 (0.011)	Loss 4.3489 (4.3053)	Top-1 acc 23.047 (25.285)	Top-5 acc 45.703 (47.723)	lr 0.01753
Warmup Train [24][2810/3239]	Time 0.510 (0.516)	Data 0.001 (0.011)	Loss 4.1708 (4.3052)	Top-1 acc 25.000 (25.284)	Top-5 acc 50.391 (47.731)	lr 0.01752
Warmup Train [24][2820/3239]	Time 0.513 (0.516)	Data 0.001 (0.011)	Loss 4.1768 (4.3051)	Top-1 acc 23.047 (25.286)	Top-5 acc 51.953 (47.735)	lr 0.01752
Warmup Train [24][2830/3239]	Time 0.464 (0.516)	Data 0.001 (0.011)	Loss 4.4687 (4.3050)	Top-1 acc 21.875 (25.286)	Top-5 acc 42.188 (47.732)	lr 0.01751
Warmup Train [24][2840/3239]	Time 0.466 (0.515)	Data 0.001 (0.011)	Loss 4.3419 (4.3050)	Top-1 acc 25.391 (25.289)	Top-5 acc 46.484 (47.733)	lr 0.01751
Warmup Train [24][2850/3239]	Time 0.579 (0.515)	Data 0.001 (0.011)	Loss 4.3332 (4.3051)	Top-1 acc 26.562 (25.283)	Top-5 acc 46.094 (47.727)	lr 0.01750
Warmup Train [24][2860/3239]	Time 0.464 (0.515)	Data 0.001 (0.011)	Loss 4.3532 (4.3050)	Top-1 acc 25.000 (25.285)	Top-5 acc 49.609 (47.733)	lr 0.01749
Warmup Train [24][2870/3239]	Time 0.488 (0.515)	Data 0.001 (0.011)	Loss 4.2812 (4.3048)	Top-1 acc 22.266 (25.287)	Top-5 acc 49.219 (47.738)	lr 0.01749
Warmup Train [24][2880/3239]	Time 0.592 (0.515)	Data 0.001 (0.011)	Loss 4.3108 (4.3047)	Top-1 acc 25.781 (25.286)	Top-5 acc 49.609 (47.736)	lr 0.01748
Warmup Train [24][2890/3239]	Time 0.355 (0.515)	Data 0.001 (0.011)	Loss 4.3834 (4.3047)	Top-1 acc 26.172 (25.286)	Top-5 acc 44.531 (47.733)	lr 0.01748
Warmup Train [24][2900/3239]	Time 0.572 (0.515)	Data 0.001 (0.011)	Loss 4.2890 (4.3044)	Top-1 acc 20.703 (25.291)	Top-5 acc 47.656 (47.740)	lr 0.01747
Warmup Train [24][2910/3239]	Time 0.432 (0.515)	Data 0.001 (0.011)	Loss 4.3758 (4.3044)	Top-1 acc 25.391 (25.288)	Top-5 acc 47.656 (47.743)	lr 0.01747
Warmup Train [24][2920/3239]	Time 0.518 (0.515)	Data 0.001 (0.011)	Loss 4.2576 (4.3044)	Top-1 acc 22.266 (25.289)	Top-5 acc 51.172 (47.745)	lr 0.01746
Warmup Train [24][2930/3239]	Time 0.576 (0.515)	Data 0.001 (0.011)	Loss 4.0820 (4.3041)	Top-1 acc 29.297 (25.296)	Top-5 acc 54.297 (47.750)	lr 0.01745
Warmup Train [24][2940/3239]	Time 0.478 (0.516)	Data 0.028 (0.011)	Loss 4.3834 (4.3041)	Top-1 acc 24.609 (25.297)	Top-5 acc 47.266 (47.749)	lr 0.01745
Warmup Train [24][2950/3239]	Time 0.497 (0.515)	Data 0.001 (0.011)	Loss 4.3696 (4.3042)	Top-1 acc 30.078 (25.300)	Top-5 acc 48.047 (47.744)	lr 0.01744
Warmup Train [24][2960/3239]	Time 0.485 (0.515)	Data 0.001 (0.011)	Loss 4.3679 (4.3039)	Top-1 acc 23.828 (25.304)	Top-5 acc 44.141 (47.750)	lr 0.01744
Warmup Train [24][2970/3239]	Time 0.670 (0.516)	Data 0.001 (0.011)	Loss 4.2780 (4.3039)	Top-1 acc 24.219 (25.304)	Top-5 acc 49.219 (47.752)	lr 0.01743
Warmup Train [24][2980/3239]	Time 0.547 (0.515)	Data 0.001 (0.011)	Loss 4.2823 (4.3040)	Top-1 acc 26.953 (25.300)	Top-5 acc 48.047 (47.749)	lr 0.01742
Warmup Train [24][2990/3239]	Time 0.652 (0.515)	Data 0.001 (0.011)	Loss 4.4911 (4.3043)	Top-1 acc 23.047 (25.292)	Top-5 acc 45.703 (47.742)	lr 0.01742
Warmup Train [24][3000/3239]	Time 0.524 (0.516)	Data 0.001 (0.011)	Loss 4.3564 (4.3041)	Top-1 acc 24.609 (25.295)	Top-5 acc 45.703 (47.748)	lr 0.01741
Warmup Train [24][3010/3239]	Time 0.561 (0.516)	Data 0.001 (0.011)	Loss 4.1655 (4.3040)	Top-1 acc 26.172 (25.295)	Top-5 acc 54.297 (47.755)	lr 0.01741
Warmup Train [24][3020/3239]	Time 0.542 (0.516)	Data 0.020 (0.011)	Loss 4.2944 (4.3039)	Top-1 acc 27.344 (25.297)	Top-5 acc 48.438 (47.757)	lr 0.01740
Warmup Train [24][3030/3239]	Time 0.414 (0.516)	Data 0.001 (0.011)	Loss 4.0008 (4.3037)	Top-1 acc 30.469 (25.299)	Top-5 acc 53.125 (47.760)	lr 0.01740
Warmup Train [24][3040/3239]	Time 0.382 (0.516)	Data 0.002 (0.010)	Loss 4.2662 (4.3037)	Top-1 acc 26.172 (25.301)	Top-5 acc 44.531 (47.760)	lr 0.01739
Warmup Train [24][3050/3239]	Time 0.470 (0.515)	Data 0.001 (0.011)	Loss 4.1790 (4.3036)	Top-1 acc 25.781 (25.300)	Top-5 acc 51.172 (47.763)	lr 0.01738
Warmup Train [24][3060/3239]	Time 0.410 (0.515)	Data 0.001 (0.010)	Loss 4.4463 (4.3035)	Top-1 acc 21.875 (25.305)	Top-5 acc 48.438 (47.765)	lr 0.01738
Warmup Train [24][3070/3239]	Time 0.551 (0.515)	Data 0.001 (0.010)	Loss 4.2534 (4.3035)	Top-1 acc 27.344 (25.307)	Top-5 acc 48.828 (47.763)	lr 0.01737
Warmup Train [24][3080/3239]	Time 0.438 (0.515)	Data 0.001 (0.010)	Loss 4.3650 (4.3034)	Top-1 acc 21.484 (25.305)	Top-5 acc 49.609 (47.764)	lr 0.01737
Warmup Train [24][3090/3239]	Time 0.575 (0.515)	Data 0.001 (0.010)	Loss 4.1600 (4.3032)	Top-1 acc 27.734 (25.308)	Top-5 acc 50.391 (47.768)	lr 0.01736
Warmup Train [24][3100/3239]	Time 0.607 (0.515)	Data 0.001 (0.010)	Loss 4.3161 (4.3030)	Top-1 acc 22.656 (25.309)	Top-5 acc 46.875 (47.772)	lr 0.01736
Warmup Train [24][3110/3239]	Time 0.572 (0.515)	Data 0.001 (0.010)	Loss 4.2903 (4.3030)	Top-1 acc 23.047 (25.309)	Top-5 acc 51.172 (47.776)	lr 0.01735
Warmup Train [24][3120/3239]	Time 0.389 (0.515)	Data 0.001 (0.010)	Loss 4.2348 (4.3029)	Top-1 acc 26.562 (25.309)	Top-5 acc 49.609 (47.776)	lr 0.01734
Warmup Train [24][3130/3239]	Time 0.527 (0.515)	Data 0.001 (0.010)	Loss 4.4986 (4.3030)	Top-1 acc 21.094 (25.300)	Top-5 acc 46.094 (47.772)	lr 0.01734
Warmup Train [24][3140/3239]	Time 0.486 (0.515)	Data 0.001 (0.010)	Loss 4.2681 (4.3029)	Top-1 acc 27.344 (25.302)	Top-5 acc 49.219 (47.774)	lr 0.01733
Warmup Train [24][3150/3239]	Time 0.592 (0.515)	Data 0.001 (0.010)	Loss 4.3026 (4.3029)	Top-1 acc 27.734 (25.301)	Top-5 acc 50.000 (47.775)	lr 0.01733
Warmup Train [24][3160/3239]	Time 0.570 (0.515)	Data 0.001 (0.010)	Loss 4.2481 (4.3029)	Top-1 acc 30.469 (25.301)	Top-5 acc 48.828 (47.774)	lr 0.01732
Warmup Train [24][3170/3239]	Time 0.660 (0.515)	Data 0.001 (0.010)	Loss 4.4949 (4.3030)	Top-1 acc 19.141 (25.298)	Top-5 acc 41.406 (47.771)	lr 0.01731
Warmup Train [24][3180/3239]	Time 0.535 (0.515)	Data 0.000 (0.010)	Loss 4.1424 (4.3029)	Top-1 acc 25.000 (25.297)	Top-5 acc 48.828 (47.774)	lr 0.01731
Warmup Train [24][3190/3239]	Time 0.462 (0.515)	Data 0.000 (0.010)	Loss 4.5916 (4.3029)	Top-1 acc 20.312 (25.294)	Top-5 acc 42.188 (47.775)	lr 0.01730
Warmup Train [24][3200/3239]	Time 0.585 (0.515)	Data 0.000 (0.010)	Loss 4.4025 (4.3029)	Top-1 acc 21.094 (25.293)	Top-5 acc 46.875 (47.776)	lr 0.01730
Warmup Train [24][3210/3239]	Time 0.559 (0.515)	Data 0.000 (0.010)	Loss 4.4431 (4.3029)	Top-1 acc 21.484 (25.293)	Top-5 acc 44.922 (47.781)	lr 0.01729
Warmup Train [24][3220/3239]	Time 0.496 (0.515)	Data 0.000 (0.010)	Loss 4.0766 (4.3029)	Top-1 acc 29.297 (25.294)	Top-5 acc 54.688 (47.783)	lr 0.01729
Warmup Train [24][3230/3239]	Time 0.550 (0.515)	Data 0.000 (0.010)	Loss 4.1735 (4.3027)	Top-1 acc 27.734 (25.298)	Top-5 acc 49.609 (47.788)	lr 0.01728
Warmup Train [24][3239/3239]	Time 0.333 (0.515)	Data 0.000 (0.010)	Loss 4.5163 (4.3029)	Top-1 acc 29.630 (25.297)	Top-5 acc 45.679 (47.782)	lr 0.01728
==========Warmup Valid [24/40]	loss 3.283	top-1 acc 32.668	top-5 acc 57.047	Train top-1 25.297	top-5 47.782	flops: 442.4M
Warmup Train [25][0/3239]	Time 15.433 (15.433)	Data 13.816 (13.816)	Loss 4.3740 (4.3740)	Top-1 acc 23.047 (23.047)	Top-5 acc 43.359 (43.359)	lr 0.01727
Warmup Train [25][10/3239]	Time 0.416 (1.881)	Data 0.001 (1.261)	Loss 4.2458 (4.2616)	Top-1 acc 26.172 (25.284)	Top-5 acc 50.000 (49.077)	lr 0.01727
Warmup Train [25][20/3239]	Time 0.323 (1.230)	Data 0.001 (0.665)	Loss 4.3182 (4.2821)	Top-1 acc 23.828 (25.037)	Top-5 acc 51.562 (48.772)	lr 0.01726
Warmup Train [25][30/3239]	Time 0.485 (1.004)	Data 0.001 (0.457)	Loss 4.3272 (4.2845)	Top-1 acc 24.609 (25.088)	Top-5 acc 42.969 (48.412)	lr 0.01726
Warmup Train [25][40/3239]	Time 0.474 (0.881)	Data 0.001 (0.346)	Loss 4.2701 (4.2816)	Top-1 acc 26.562 (25.314)	Top-5 acc 49.219 (48.428)	lr 0.01725
Warmup Train [25][50/3239]	Time 0.421 (0.806)	Data 0.001 (0.279)	Loss 4.4096 (4.2934)	Top-1 acc 20.703 (25.169)	Top-5 acc 46.484 (48.284)	lr 0.01725
Warmup Train [25][60/3239]	Time 0.521 (0.762)	Data 0.001 (0.235)	Loss 4.2863 (4.2874)	Top-1 acc 26.562 (25.339)	Top-5 acc 47.656 (48.386)	lr 0.01724
Warmup Train [25][70/3239]	Time 0.492 (0.727)	Data 0.001 (0.202)	Loss 4.3778 (4.2894)	Top-1 acc 22.656 (25.396)	Top-5 acc 48.047 (48.239)	lr 0.01723
Warmup Train [25][80/3239]	Time 0.609 (0.705)	Data 0.001 (0.178)	Loss 4.3125 (4.2884)	Top-1 acc 26.953 (25.463)	Top-5 acc 48.047 (48.336)	lr 0.01723
Warmup Train [25][90/3239]	Time 0.434 (0.683)	Data 0.001 (0.159)	Loss 4.2104 (4.2859)	Top-1 acc 28.906 (25.562)	Top-5 acc 48.828 (48.326)	lr 0.01722
Warmup Train [25][100/3239]	Time 0.434 (0.665)	Data 0.001 (0.144)	Loss 4.1797 (4.2823)	Top-1 acc 27.344 (25.735)	Top-5 acc 45.312 (48.298)	lr 0.01722
Warmup Train [25][110/3239]	Time 0.559 (0.653)	Data 0.001 (0.133)	Loss 4.1892 (4.2817)	Top-1 acc 27.344 (25.693)	Top-5 acc 48.828 (48.304)	lr 0.01721
Warmup Train [25][120/3239]	Time 0.556 (0.642)	Data 0.001 (0.123)	Loss 4.3895 (4.2793)	Top-1 acc 23.047 (25.697)	Top-5 acc 45.703 (48.386)	lr 0.01721
Warmup Train [25][130/3239]	Time 0.291 (0.631)	Data 0.001 (0.114)	Loss 4.3138 (4.2730)	Top-1 acc 25.000 (25.844)	Top-5 acc 47.656 (48.515)	lr 0.01720
Warmup Train [25][140/3239]	Time 0.303 (0.621)	Data 0.001 (0.107)	Loss 4.4547 (4.2768)	Top-1 acc 21.875 (25.745)	Top-5 acc 45.312 (48.413)	lr 0.01719
Warmup Train [25][150/3239]	Time 0.528 (0.615)	Data 0.001 (0.101)	Loss 4.3276 (4.2754)	Top-1 acc 27.734 (25.830)	Top-5 acc 44.531 (48.435)	lr 0.01719
Warmup Train [25][160/3239]	Time 0.508 (0.605)	Data 0.001 (0.095)	Loss 4.2508 (4.2749)	Top-1 acc 28.516 (25.944)	Top-5 acc 47.656 (48.418)	lr 0.01718
Warmup Train [25][170/3239]	Time 0.605 (0.601)	Data 0.001 (0.090)	Loss 4.2554 (4.2742)	Top-1 acc 27.734 (25.930)	Top-5 acc 50.781 (48.449)	lr 0.01718
Warmup Train [25][180/3239]	Time 0.581 (0.597)	Data 0.001 (0.085)	Loss 4.1502 (4.2765)	Top-1 acc 27.734 (25.915)	Top-5 acc 49.219 (48.401)	lr 0.01717
Warmup Train [25][190/3239]	Time 0.713 (0.592)	Data 0.001 (0.080)	Loss 4.0748 (4.2760)	Top-1 acc 26.562 (25.871)	Top-5 acc 54.297 (48.435)	lr 0.01717
Warmup Train [25][200/3239]	Time 0.359 (0.587)	Data 0.001 (0.077)	Loss 4.1863 (4.2743)	Top-1 acc 25.781 (25.869)	Top-5 acc 48.047 (48.434)	lr 0.01716
Warmup Train [25][210/3239]	Time 0.505 (0.585)	Data 0.001 (0.074)	Loss 4.1634 (4.2749)	Top-1 acc 26.562 (25.865)	Top-5 acc 50.391 (48.415)	lr 0.01715
Warmup Train [25][220/3239]	Time 0.440 (0.581)	Data 0.001 (0.070)	Loss 4.1978 (4.2746)	Top-1 acc 31.250 (25.933)	Top-5 acc 50.781 (48.452)	lr 0.01715
Warmup Train [25][230/3239]	Time 0.544 (0.580)	Data 0.001 (0.068)	Loss 4.3090 (4.2766)	Top-1 acc 27.734 (25.903)	Top-5 acc 50.781 (48.400)	lr 0.01714
Warmup Train [25][240/3239]	Time 0.490 (0.577)	Data 0.001 (0.065)	Loss 4.1630 (4.2745)	Top-1 acc 29.297 (25.898)	Top-5 acc 55.078 (48.478)	lr 0.01714
Warmup Train [25][250/3239]	Time 0.551 (0.574)	Data 0.001 (0.063)	Loss 4.2709 (4.2724)	Top-1 acc 24.219 (25.937)	Top-5 acc 45.703 (48.515)	lr 0.01713
Warmup Train [25][260/3239]	Time 0.426 (0.571)	Data 0.001 (0.061)	Loss 4.4356 (4.2704)	Top-1 acc 19.531 (25.941)	Top-5 acc 40.234 (48.523)	lr 0.01712
Warmup Train [25][270/3239]	Time 0.479 (0.569)	Data 0.001 (0.059)	Loss 4.4291 (4.2708)	Top-1 acc 25.000 (25.943)	Top-5 acc 45.312 (48.550)	lr 0.01712
Warmup Train [25][280/3239]	Time 0.631 (0.567)	Data 0.001 (0.057)	Loss 4.2005 (4.2700)	Top-1 acc 26.953 (25.969)	Top-5 acc 51.172 (48.540)	lr 0.01711
Warmup Train [25][290/3239]	Time 0.538 (0.565)	Data 0.001 (0.055)	Loss 4.1627 (4.2713)	Top-1 acc 30.859 (25.966)	Top-5 acc 52.344 (48.499)	lr 0.01711
Warmup Train [25][300/3239]	Time 0.553 (0.563)	Data 0.001 (0.053)	Loss 4.3788 (4.2736)	Top-1 acc 23.047 (25.918)	Top-5 acc 43.750 (48.482)	lr 0.01710
Warmup Train [25][310/3239]	Time 0.443 (0.561)	Data 0.001 (0.052)	Loss 4.3931 (4.2744)	Top-1 acc 24.219 (25.914)	Top-5 acc 43.359 (48.417)	lr 0.01710
Warmup Train [25][320/3239]	Time 0.558 (0.560)	Data 0.001 (0.051)	Loss 4.2193 (4.2728)	Top-1 acc 26.562 (25.952)	Top-5 acc 48.438 (48.464)	lr 0.01709
Warmup Train [25][330/3239]	Time 0.659 (0.559)	Data 0.001 (0.049)	Loss 4.2302 (4.2741)	Top-1 acc 25.000 (25.898)	Top-5 acc 46.484 (48.399)	lr 0.01708
Warmup Train [25][340/3239]	Time 0.458 (0.558)	Data 0.001 (0.048)	Loss 4.2131 (4.2724)	Top-1 acc 28.125 (25.938)	Top-5 acc 46.875 (48.393)	lr 0.01708
Warmup Train [25][350/3239]	Time 0.505 (0.557)	Data 0.001 (0.047)	Loss 4.3230 (4.2740)	Top-1 acc 24.219 (25.908)	Top-5 acc 47.266 (48.346)	lr 0.01707
Warmup Train [25][360/3239]	Time 0.580 (0.555)	Data 0.001 (0.045)	Loss 4.4875 (4.2748)	Top-1 acc 20.703 (25.895)	Top-5 acc 47.266 (48.337)	lr 0.01707
Warmup Train [25][370/3239]	Time 0.535 (0.553)	Data 0.001 (0.044)	Loss 4.3561 (4.2739)	Top-1 acc 27.734 (25.924)	Top-5 acc 48.438 (48.380)	lr 0.01706
Warmup Train [25][380/3239]	Time 0.672 (0.552)	Data 0.001 (0.043)	Loss 4.3456 (4.2753)	Top-1 acc 23.047 (25.928)	Top-5 acc 47.656 (48.328)	lr 0.01706
Warmup Train [25][390/3239]	Time 0.416 (0.551)	Data 0.001 (0.042)	Loss 4.1085 (4.2760)	Top-1 acc 27.734 (25.907)	Top-5 acc 53.125 (48.307)	lr 0.01705
Warmup Train [25][400/3239]	Time 0.580 (0.549)	Data 0.001 (0.041)	Loss 4.2810 (4.2762)	Top-1 acc 28.516 (25.908)	Top-5 acc 47.656 (48.303)	lr 0.01704
Warmup Train [25][410/3239]	Time 0.408 (0.548)	Data 0.001 (0.040)	Loss 4.1683 (4.2758)	Top-1 acc 27.344 (25.947)	Top-5 acc 47.266 (48.327)	lr 0.01704
Warmup Train [25][420/3239]	Time 0.387 (0.547)	Data 0.001 (0.040)	Loss 4.3165 (4.2756)	Top-1 acc 26.562 (25.920)	Top-5 acc 50.781 (48.347)	lr 0.01703
Warmup Train [25][430/3239]	Time 0.484 (0.547)	Data 0.001 (0.039)	Loss 4.1067 (4.2752)	Top-1 acc 27.734 (25.938)	Top-5 acc 50.781 (48.360)	lr 0.01703
Warmup Train [25][440/3239]	Time 0.426 (0.546)	Data 0.028 (0.038)	Loss 4.2746 (4.2758)	Top-1 acc 24.219 (25.918)	Top-5 acc 48.438 (48.354)	lr 0.01702
Warmup Train [25][450/3239]	Time 0.503 (0.545)	Data 0.001 (0.038)	Loss 4.4274 (4.2758)	Top-1 acc 22.266 (25.935)	Top-5 acc 46.094 (48.347)	lr 0.01702
Warmup Train [25][460/3239]	Time 0.406 (0.545)	Data 0.001 (0.037)	Loss 4.3605 (4.2755)	Top-1 acc 23.438 (25.933)	Top-5 acc 48.047 (48.394)	lr 0.01701
Warmup Train [25][470/3239]	Time 0.526 (0.544)	Data 0.001 (0.037)	Loss 4.1792 (4.2746)	Top-1 acc 25.391 (25.931)	Top-5 acc 52.344 (48.419)	lr 0.01700
Warmup Train [25][480/3239]	Time 0.518 (0.544)	Data 0.001 (0.036)	Loss 4.3018 (4.2748)	Top-1 acc 24.219 (25.912)	Top-5 acc 48.047 (48.405)	lr 0.01700
Warmup Train [25][490/3239]	Time 0.399 (0.543)	Data 0.001 (0.035)	Loss 4.1048 (4.2749)	Top-1 acc 26.562 (25.898)	Top-5 acc 52.344 (48.423)	lr 0.01699
Warmup Train [25][500/3239]	Time 0.729 (0.543)	Data 0.001 (0.035)	Loss 4.3688 (4.2736)	Top-1 acc 22.656 (25.911)	Top-5 acc 42.969 (48.432)	lr 0.01699
Warmup Train [25][510/3239]	Time 0.545 (0.542)	Data 0.001 (0.034)	Loss 4.3516 (4.2728)	Top-1 acc 27.344 (25.939)	Top-5 acc 46.094 (48.459)	lr 0.01698
Warmup Train [25][520/3239]	Time 0.591 (0.542)	Data 0.001 (0.034)	Loss 4.1132 (4.2718)	Top-1 acc 29.297 (25.942)	Top-5 acc 49.609 (48.465)	lr 0.01698
Warmup Train [25][530/3239]	Time 0.385 (0.540)	Data 0.001 (0.033)	Loss 4.1290 (4.2728)	Top-1 acc 24.609 (25.924)	Top-5 acc 53.906 (48.471)	lr 0.01697
Warmup Train [25][540/3239]	Time 0.514 (0.540)	Data 0.001 (0.033)	Loss 4.1669 (4.2726)	Top-1 acc 25.391 (25.930)	Top-5 acc 51.562 (48.479)	lr 0.01696
Warmup Train [25][550/3239]	Time 0.471 (0.539)	Data 0.001 (0.032)	Loss 4.2099 (4.2708)	Top-1 acc 26.953 (25.951)	Top-5 acc 49.609 (48.539)	lr 0.01696
Warmup Train [25][560/3239]	Time 0.535 (0.539)	Data 0.001 (0.032)	Loss 4.3418 (4.2704)	Top-1 acc 25.391 (25.967)	Top-5 acc 45.703 (48.534)	lr 0.01695
Warmup Train [25][570/3239]	Time 0.666 (0.539)	Data 0.001 (0.031)	Loss 4.2179 (4.2707)	Top-1 acc 25.391 (25.971)	Top-5 acc 48.828 (48.507)	lr 0.01695
Warmup Train [25][580/3239]	Time 0.572 (0.539)	Data 0.001 (0.031)	Loss 4.2039 (4.2705)	Top-1 acc 26.562 (25.964)	Top-5 acc 51.562 (48.514)	lr 0.01694
Warmup Train [25][590/3239]	Time 0.337 (0.538)	Data 0.001 (0.030)	Loss 4.2481 (4.2710)	Top-1 acc 27.734 (25.955)	Top-5 acc 50.781 (48.512)	lr 0.01694
Warmup Train [25][600/3239]	Time 0.372 (0.538)	Data 0.001 (0.030)	Loss 4.2315 (4.2711)	Top-1 acc 26.562 (25.952)	Top-5 acc 49.219 (48.501)	lr 0.01693
Warmup Train [25][610/3239]	Time 0.627 (0.538)	Data 0.001 (0.030)	Loss 4.3758 (4.2714)	Top-1 acc 23.828 (25.949)	Top-5 acc 45.703 (48.482)	lr 0.01692
Warmup Train [25][620/3239]	Time 0.350 (0.536)	Data 0.001 (0.029)	Loss 4.2813 (4.2722)	Top-1 acc 26.562 (25.952)	Top-5 acc 50.391 (48.466)	lr 0.01692
Warmup Train [25][630/3239]	Time 0.455 (0.536)	Data 0.001 (0.029)	Loss 4.4222 (4.2733)	Top-1 acc 23.047 (25.940)	Top-5 acc 44.141 (48.451)	lr 0.01691
Warmup Train [25][640/3239]	Time 0.207 (0.534)	Data 0.001 (0.029)	Loss 4.2137 (4.2727)	Top-1 acc 25.391 (25.940)	Top-5 acc 50.391 (48.474)	lr 0.01691
Warmup Train [25][650/3239]	Time 0.572 (0.534)	Data 0.001 (0.029)	Loss 4.3078 (4.2727)	Top-1 acc 23.047 (25.949)	Top-5 acc 46.484 (48.487)	lr 0.01690
Warmup Train [25][660/3239]	Time 0.606 (0.534)	Data 0.001 (0.028)	Loss 4.2372 (4.2728)	Top-1 acc 31.641 (25.937)	Top-5 acc 44.531 (48.469)	lr 0.01690
Warmup Train [25][670/3239]	Time 0.367 (0.533)	Data 0.002 (0.028)	Loss 4.2374 (4.2723)	Top-1 acc 28.516 (25.936)	Top-5 acc 46.484 (48.467)	lr 0.01689
Warmup Train [25][680/3239]	Time 0.526 (0.533)	Data 0.001 (0.028)	Loss 4.0901 (4.2724)	Top-1 acc 31.641 (25.927)	Top-5 acc 51.953 (48.455)	lr 0.01688
Warmup Train [25][690/3239]	Time 0.497 (0.533)	Data 0.001 (0.027)	Loss 4.2224 (4.2717)	Top-1 acc 25.000 (25.927)	Top-5 acc 51.953 (48.481)	lr 0.01688
Warmup Train [25][700/3239]	Time 0.528 (0.532)	Data 0.001 (0.027)	Loss 4.2554 (4.2716)	Top-1 acc 28.906 (25.935)	Top-5 acc 44.922 (48.484)	lr 0.01687
Warmup Train [25][710/3239]	Time 0.582 (0.532)	Data 0.001 (0.027)	Loss 4.4010 (4.2726)	Top-1 acc 21.875 (25.914)	Top-5 acc 46.875 (48.482)	lr 0.01687
Warmup Train [25][720/3239]	Time 0.524 (0.532)	Data 0.001 (0.026)	Loss 4.3318 (4.2726)	Top-1 acc 23.438 (25.922)	Top-5 acc 48.438 (48.480)	lr 0.01686
Warmup Train [25][730/3239]	Time 0.579 (0.532)	Data 0.001 (0.026)	Loss 4.2917 (4.2734)	Top-1 acc 21.875 (25.891)	Top-5 acc 45.703 (48.458)	lr 0.01686
Warmup Train [25][740/3239]	Time 0.543 (0.531)	Data 0.001 (0.026)	Loss 4.2980 (4.2733)	Top-1 acc 22.656 (25.895)	Top-5 acc 46.484 (48.470)	lr 0.01685
Warmup Train [25][750/3239]	Time 0.480 (0.531)	Data 0.002 (0.025)	Loss 4.1617 (4.2737)	Top-1 acc 28.906 (25.896)	Top-5 acc 50.391 (48.462)	lr 0.01684
Warmup Train [25][760/3239]	Time 0.396 (0.530)	Data 0.001 (0.025)	Loss 4.2855 (4.2735)	Top-1 acc 30.469 (25.904)	Top-5 acc 47.266 (48.472)	lr 0.01684
Warmup Train [25][770/3239]	Time 0.656 (0.530)	Data 0.001 (0.025)	Loss 4.2746 (4.2739)	Top-1 acc 24.609 (25.880)	Top-5 acc 47.266 (48.467)	lr 0.01683
Warmup Train [25][780/3239]	Time 0.492 (0.530)	Data 0.001 (0.025)	Loss 4.1873 (4.2737)	Top-1 acc 22.656 (25.884)	Top-5 acc 47.656 (48.456)	lr 0.01683
Warmup Train [25][790/3239]	Time 0.623 (0.530)	Data 0.001 (0.025)	Loss 4.1295 (4.2732)	Top-1 acc 31.641 (25.894)	Top-5 acc 50.000 (48.461)	lr 0.01682
Warmup Train [25][800/3239]	Time 0.418 (0.530)	Data 0.001 (0.024)	Loss 4.2530 (4.2731)	Top-1 acc 25.781 (25.891)	Top-5 acc 47.266 (48.456)	lr 0.01681
Warmup Train [25][810/3239]	Time 0.380 (0.530)	Data 0.001 (0.024)	Loss 4.2253 (4.2730)	Top-1 acc 30.859 (25.891)	Top-5 acc 48.047 (48.455)	lr 0.01681
Warmup Train [25][820/3239]	Time 0.576 (0.530)	Data 0.001 (0.024)	Loss 4.3639 (4.2728)	Top-1 acc 22.266 (25.894)	Top-5 acc 42.578 (48.445)	lr 0.01680
Warmup Train [25][830/3239]	Time 0.568 (0.529)	Data 0.001 (0.024)	Loss 4.4069 (4.2725)	Top-1 acc 20.703 (25.894)	Top-5 acc 42.969 (48.447)	lr 0.01680
Warmup Train [25][840/3239]	Time 0.552 (0.529)	Data 0.001 (0.024)	Loss 4.1108 (4.2723)	Top-1 acc 28.125 (25.897)	Top-5 acc 53.125 (48.453)	lr 0.01679
Warmup Train [25][850/3239]	Time 0.357 (0.529)	Data 0.001 (0.024)	Loss 3.9653 (4.2719)	Top-1 acc 30.859 (25.891)	Top-5 acc 57.031 (48.467)	lr 0.01679
Warmup Train [25][860/3239]	Time 0.497 (0.529)	Data 0.001 (0.024)	Loss 4.3272 (4.2720)	Top-1 acc 25.781 (25.887)	Top-5 acc 50.000 (48.467)	lr 0.01678
Warmup Train [25][870/3239]	Time 0.647 (0.528)	Data 0.001 (0.023)	Loss 4.3717 (4.2720)	Top-1 acc 28.906 (25.893)	Top-5 acc 48.438 (48.472)	lr 0.01677
Warmup Train [25][880/3239]	Time 0.322 (0.527)	Data 0.001 (0.023)	Loss 4.2346 (4.2715)	Top-1 acc 28.906 (25.904)	Top-5 acc 54.688 (48.484)	lr 0.01677
Warmup Train [25][890/3239]	Time 0.424 (0.527)	Data 0.001 (0.023)	Loss 4.3236 (4.2713)	Top-1 acc 28.906 (25.904)	Top-5 acc 47.656 (48.484)	lr 0.01676
Warmup Train [25][900/3239]	Time 0.401 (0.526)	Data 0.001 (0.023)	Loss 4.1310 (4.2707)	Top-1 acc 25.391 (25.909)	Top-5 acc 51.562 (48.497)	lr 0.01676
Warmup Train [25][910/3239]	Time 0.528 (0.526)	Data 0.001 (0.023)	Loss 4.4818 (4.2706)	Top-1 acc 23.047 (25.909)	Top-5 acc 45.703 (48.496)	lr 0.01675
Warmup Train [25][920/3239]	Time 0.611 (0.526)	Data 0.001 (0.022)	Loss 4.3015 (4.2702)	Top-1 acc 26.562 (25.919)	Top-5 acc 46.875 (48.510)	lr 0.01675
Warmup Train [25][930/3239]	Time 0.578 (0.526)	Data 0.002 (0.022)	Loss 4.2873 (4.2703)	Top-1 acc 25.391 (25.921)	Top-5 acc 50.781 (48.513)	lr 0.01674
Warmup Train [25][940/3239]	Time 0.492 (0.526)	Data 0.001 (0.022)	Loss 4.3711 (4.2700)	Top-1 acc 20.703 (25.929)	Top-5 acc 47.656 (48.536)	lr 0.01673
Warmup Train [25][950/3239]	Time 0.343 (0.526)	Data 0.001 (0.022)	Loss 4.4274 (4.2700)	Top-1 acc 23.438 (25.932)	Top-5 acc 45.312 (48.535)	lr 0.01673
Warmup Train [25][960/3239]	Time 0.627 (0.526)	Data 0.037 (0.022)	Loss 4.2868 (4.2693)	Top-1 acc 23.828 (25.937)	Top-5 acc 49.219 (48.549)	lr 0.01672
Warmup Train [25][970/3239]	Time 0.688 (0.526)	Data 0.002 (0.022)	Loss 4.1095 (4.2689)	Top-1 acc 25.391 (25.942)	Top-5 acc 50.391 (48.561)	lr 0.01672
Warmup Train [25][980/3239]	Time 0.525 (0.526)	Data 0.001 (0.021)	Loss 4.1626 (4.2688)	Top-1 acc 27.344 (25.943)	Top-5 acc 48.047 (48.559)	lr 0.01671
Warmup Train [25][990/3239]	Time 0.495 (0.526)	Data 0.001 (0.021)	Loss 4.0746 (4.2678)	Top-1 acc 30.078 (25.961)	Top-5 acc 48.438 (48.576)	lr 0.01671
Warmup Train [25][1000/3239]	Time 0.362 (0.525)	Data 0.001 (0.021)	Loss 4.2529 (4.2679)	Top-1 acc 28.516 (25.957)	Top-5 acc 50.000 (48.581)	lr 0.01670
Warmup Train [25][1010/3239]	Time 0.662 (0.525)	Data 0.001 (0.021)	Loss 4.2401 (4.2682)	Top-1 acc 26.562 (25.953)	Top-5 acc 49.609 (48.571)	lr 0.01669
Warmup Train [25][1020/3239]	Time 0.720 (0.525)	Data 0.001 (0.021)	Loss 4.0556 (4.2679)	Top-1 acc 30.469 (25.952)	Top-5 acc 52.344 (48.580)	lr 0.01669
Warmup Train [25][1030/3239]	Time 0.514 (0.525)	Data 0.001 (0.021)	Loss 3.9964 (4.2681)	Top-1 acc 31.641 (25.952)	Top-5 acc 53.516 (48.570)	lr 0.01668
Warmup Train [25][1040/3239]	Time 0.460 (0.525)	Data 0.001 (0.021)	Loss 4.4494 (4.2684)	Top-1 acc 26.172 (25.953)	Top-5 acc 46.094 (48.574)	lr 0.01668
Warmup Train [25][1050/3239]	Time 0.585 (0.525)	Data 0.001 (0.020)	Loss 4.4438 (4.2685)	Top-1 acc 21.094 (25.951)	Top-5 acc 41.406 (48.566)	lr 0.01667
Warmup Train [25][1060/3239]	Time 0.616 (0.524)	Data 0.001 (0.020)	Loss 4.3801 (4.2681)	Top-1 acc 20.703 (25.948)	Top-5 acc 46.094 (48.580)	lr 0.01667
Warmup Train [25][1070/3239]	Time 0.573 (0.524)	Data 0.001 (0.020)	Loss 4.4294 (4.2687)	Top-1 acc 21.484 (25.928)	Top-5 acc 44.922 (48.567)	lr 0.01666
Warmup Train [25][1080/3239]	Time 0.418 (0.524)	Data 0.001 (0.020)	Loss 4.2664 (4.2685)	Top-1 acc 25.000 (25.938)	Top-5 acc 50.000 (48.569)	lr 0.01665
Warmup Train [25][1090/3239]	Time 0.676 (0.523)	Data 0.001 (0.020)	Loss 4.2652 (4.2691)	Top-1 acc 26.562 (25.935)	Top-5 acc 46.875 (48.560)	lr 0.01665
Warmup Train [25][1100/3239]	Time 0.674 (0.523)	Data 0.001 (0.020)	Loss 4.3064 (4.2692)	Top-1 acc 26.172 (25.938)	Top-5 acc 46.094 (48.560)	lr 0.01664
Warmup Train [25][1110/3239]	Time 0.308 (0.523)	Data 0.001 (0.020)	Loss 4.1578 (4.2689)	Top-1 acc 25.000 (25.935)	Top-5 acc 47.266 (48.563)	lr 0.01664
Warmup Train [25][1120/3239]	Time 0.516 (0.523)	Data 0.001 (0.020)	Loss 4.2139 (4.2684)	Top-1 acc 27.344 (25.937)	Top-5 acc 51.562 (48.570)	lr 0.01663
Warmup Train [25][1130/3239]	Time 0.303 (0.522)	Data 0.001 (0.019)	Loss 4.3832 (4.2686)	Top-1 acc 25.391 (25.933)	Top-5 acc 44.141 (48.563)	lr 0.01663
Warmup Train [25][1140/3239]	Time 0.597 (0.522)	Data 0.001 (0.019)	Loss 4.2967 (4.2688)	Top-1 acc 25.000 (25.925)	Top-5 acc 46.484 (48.556)	lr 0.01662
Warmup Train [25][1150/3239]	Time 0.448 (0.522)	Data 0.001 (0.019)	Loss 4.2417 (4.2685)	Top-1 acc 26.953 (25.944)	Top-5 acc 49.219 (48.565)	lr 0.01661
Warmup Train [25][1160/3239]	Time 0.551 (0.522)	Data 0.001 (0.019)	Loss 4.1355 (4.2683)	Top-1 acc 28.516 (25.943)	Top-5 acc 50.391 (48.566)	lr 0.01661
Warmup Train [25][1170/3239]	Time 0.516 (0.522)	Data 0.001 (0.019)	Loss 4.4032 (4.2683)	Top-1 acc 23.047 (25.946)	Top-5 acc 46.875 (48.566)	lr 0.01660
Warmup Train [25][1180/3239]	Time 0.312 (0.522)	Data 0.001 (0.019)	Loss 4.5176 (4.2681)	Top-1 acc 23.047 (25.945)	Top-5 acc 38.672 (48.561)	lr 0.01660
Warmup Train [25][1190/3239]	Time 0.494 (0.522)	Data 0.001 (0.019)	Loss 4.1758 (4.2683)	Top-1 acc 27.734 (25.932)	Top-5 acc 50.781 (48.561)	lr 0.01659
Warmup Train [25][1200/3239]	Time 0.513 (0.522)	Data 0.002 (0.019)	Loss 4.2440 (4.2681)	Top-1 acc 26.953 (25.940)	Top-5 acc 49.609 (48.567)	lr 0.01659
Warmup Train [25][1210/3239]	Time 0.655 (0.522)	Data 0.001 (0.019)	Loss 4.3318 (4.2678)	Top-1 acc 25.000 (25.936)	Top-5 acc 45.312 (48.571)	lr 0.01658
Warmup Train [25][1220/3239]	Time 0.570 (0.522)	Data 0.001 (0.018)	Loss 4.3303 (4.2678)	Top-1 acc 25.781 (25.941)	Top-5 acc 49.219 (48.580)	lr 0.01657
Warmup Train [25][1230/3239]	Time 0.575 (0.522)	Data 0.001 (0.018)	Loss 4.2108 (4.2675)	Top-1 acc 27.344 (25.948)	Top-5 acc 48.438 (48.592)	lr 0.01657
Warmup Train [25][1240/3239]	Time 0.562 (0.522)	Data 0.001 (0.018)	Loss 4.3271 (4.2671)	Top-1 acc 23.828 (25.953)	Top-5 acc 45.312 (48.605)	lr 0.01656
Warmup Train [25][1250/3239]	Time 0.439 (0.522)	Data 0.001 (0.018)	Loss 4.1704 (4.2668)	Top-1 acc 31.250 (25.954)	Top-5 acc 52.734 (48.610)	lr 0.01656
Warmup Train [25][1260/3239]	Time 0.535 (0.522)	Data 0.001 (0.018)	Loss 4.3444 (4.2668)	Top-1 acc 25.781 (25.957)	Top-5 acc 48.828 (48.605)	lr 0.01655
Warmup Train [25][1270/3239]	Time 0.495 (0.522)	Data 0.001 (0.018)	Loss 4.4774 (4.2672)	Top-1 acc 23.438 (25.961)	Top-5 acc 42.969 (48.599)	lr 0.01655
Warmup Train [25][1280/3239]	Time 0.533 (0.522)	Data 0.001 (0.018)	Loss 4.1835 (4.2673)	Top-1 acc 27.344 (25.968)	Top-5 acc 51.172 (48.599)	lr 0.01654
Warmup Train [25][1290/3239]	Time 0.515 (0.522)	Data 0.001 (0.018)	Loss 4.2358 (4.2671)	Top-1 acc 24.609 (25.967)	Top-5 acc 51.172 (48.605)	lr 0.01653
Warmup Train [25][1300/3239]	Time 0.508 (0.522)	Data 0.001 (0.018)	Loss 4.5385 (4.2675)	Top-1 acc 21.484 (25.966)	Top-5 acc 41.406 (48.599)	lr 0.01653
Warmup Train [25][1310/3239]	Time 0.603 (0.522)	Data 0.001 (0.018)	Loss 4.3700 (4.2675)	Top-1 acc 22.656 (25.963)	Top-5 acc 46.875 (48.597)	lr 0.01652
Warmup Train [25][1320/3239]	Time 0.574 (0.522)	Data 0.001 (0.018)	Loss 4.1178 (4.2673)	Top-1 acc 30.078 (25.966)	Top-5 acc 53.516 (48.608)	lr 0.01652
Warmup Train [25][1330/3239]	Time 0.413 (0.522)	Data 0.001 (0.017)	Loss 4.3769 (4.2673)	Top-1 acc 25.000 (25.968)	Top-5 acc 48.438 (48.611)	lr 0.01651
Warmup Train [25][1340/3239]	Time 0.429 (0.522)	Data 0.001 (0.017)	Loss 4.2032 (4.2668)	Top-1 acc 27.344 (25.975)	Top-5 acc 50.391 (48.612)	lr 0.01651
Warmup Train [25][1350/3239]	Time 0.643 (0.521)	Data 0.001 (0.017)	Loss 4.3162 (4.2664)	Top-1 acc 24.219 (25.988)	Top-5 acc 45.703 (48.625)	lr 0.01650
Warmup Train [25][1360/3239]	Time 0.574 (0.521)	Data 0.001 (0.017)	Loss 4.3976 (4.2659)	Top-1 acc 25.000 (25.987)	Top-5 acc 44.531 (48.636)	lr 0.01650
Warmup Train [25][1370/3239]	Time 0.554 (0.521)	Data 0.001 (0.017)	Loss 4.2768 (4.2663)	Top-1 acc 23.828 (25.985)	Top-5 acc 50.391 (48.624)	lr 0.01649
Warmup Train [25][1380/3239]	Time 0.398 (0.520)	Data 0.001 (0.017)	Loss 4.3200 (4.2663)	Top-1 acc 26.172 (25.984)	Top-5 acc 48.047 (48.619)	lr 0.01648
Warmup Train [25][1390/3239]	Time 0.565 (0.520)	Data 0.001 (0.017)	Loss 4.1726 (4.2666)	Top-1 acc 27.734 (25.978)	Top-5 acc 50.781 (48.611)	lr 0.01648
Warmup Train [25][1400/3239]	Time 0.408 (0.520)	Data 0.001 (0.017)	Loss 4.1484 (4.2666)	Top-1 acc 29.297 (25.976)	Top-5 acc 50.000 (48.614)	lr 0.01647
Warmup Train [25][1410/3239]	Time 0.450 (0.521)	Data 0.001 (0.017)	Loss 4.3768 (4.2666)	Top-1 acc 25.000 (25.974)	Top-5 acc 45.312 (48.614)	lr 0.01647
Warmup Train [25][1420/3239]	Time 0.629 (0.520)	Data 0.001 (0.017)	Loss 4.2726 (4.2660)	Top-1 acc 28.125 (25.985)	Top-5 acc 47.656 (48.622)	lr 0.01646
Warmup Train [25][1430/3239]	Time 0.670 (0.521)	Data 0.001 (0.017)	Loss 4.3604 (4.2658)	Top-1 acc 25.391 (25.989)	Top-5 acc 46.094 (48.624)	lr 0.01646
Warmup Train [25][1440/3239]	Time 0.426 (0.521)	Data 0.001 (0.017)	Loss 4.3510 (4.2655)	Top-1 acc 26.562 (25.999)	Top-5 acc 45.703 (48.629)	lr 0.01645
Warmup Train [25][1450/3239]	Time 0.433 (0.520)	Data 0.001 (0.017)	Loss 4.3032 (4.2657)	Top-1 acc 25.391 (25.996)	Top-5 acc 47.656 (48.620)	lr 0.01644
Warmup Train [25][1460/3239]	Time 0.551 (0.520)	Data 0.001 (0.017)	Loss 4.1973 (4.2655)	Top-1 acc 24.609 (26.001)	Top-5 acc 47.656 (48.621)	lr 0.01644
Warmup Train [25][1470/3239]	Time 0.578 (0.520)	Data 0.001 (0.016)	Loss 4.3144 (4.2657)	Top-1 acc 23.828 (26.002)	Top-5 acc 46.094 (48.614)	lr 0.01643
Warmup Train [25][1480/3239]	Time 0.504 (0.520)	Data 0.001 (0.016)	Loss 4.3191 (4.2657)	Top-1 acc 24.609 (26.008)	Top-5 acc 45.703 (48.620)	lr 0.01643
Warmup Train [25][1490/3239]	Time 0.492 (0.520)	Data 0.001 (0.016)	Loss 4.2235 (4.2659)	Top-1 acc 28.906 (25.999)	Top-5 acc 48.438 (48.615)	lr 0.01642
Warmup Train [25][1500/3239]	Time 0.534 (0.520)	Data 0.001 (0.016)	Loss 4.3383 (4.2662)	Top-1 acc 22.266 (25.994)	Top-5 acc 47.266 (48.596)	lr 0.01642
Warmup Train [25][1510/3239]	Time 0.573 (0.520)	Data 0.001 (0.016)	Loss 4.2624 (4.2663)	Top-1 acc 23.828 (25.982)	Top-5 acc 47.656 (48.591)	lr 0.01641
Warmup Train [25][1520/3239]	Time 0.510 (0.520)	Data 0.001 (0.016)	Loss 4.2381 (4.2660)	Top-1 acc 30.078 (25.992)	Top-5 acc 47.656 (48.597)	lr 0.01640
Warmup Train [25][1530/3239]	Time 0.578 (0.520)	Data 0.001 (0.016)	Loss 4.2301 (4.2661)	Top-1 acc 26.953 (25.985)	Top-5 acc 52.734 (48.594)	lr 0.01640
Warmup Train [25][1540/3239]	Time 0.620 (0.520)	Data 0.001 (0.016)	Loss 4.3118 (4.2663)	Top-1 acc 26.562 (25.988)	Top-5 acc 47.656 (48.592)	lr 0.01639
Warmup Train [25][1550/3239]	Time 0.613 (0.520)	Data 0.001 (0.016)	Loss 4.4127 (4.2663)	Top-1 acc 23.828 (25.986)	Top-5 acc 47.266 (48.593)	lr 0.01639
Warmup Train [25][1560/3239]	Time 0.328 (0.520)	Data 0.001 (0.016)	Loss 4.3753 (4.2665)	Top-1 acc 23.438 (25.985)	Top-5 acc 42.578 (48.579)	lr 0.01638
Warmup Train [25][1570/3239]	Time 0.416 (0.520)	Data 0.001 (0.016)	Loss 4.0869 (4.2664)	Top-1 acc 27.734 (25.983)	Top-5 acc 51.562 (48.580)	lr 0.01638
Warmup Train [25][1580/3239]	Time 0.483 (0.520)	Data 0.001 (0.016)	Loss 4.2725 (4.2668)	Top-1 acc 26.172 (25.969)	Top-5 acc 45.703 (48.569)	lr 0.01637
Warmup Train [25][1590/3239]	Time 0.346 (0.520)	Data 0.001 (0.016)	Loss 4.5094 (4.2670)	Top-1 acc 20.312 (25.965)	Top-5 acc 40.625 (48.569)	lr 0.01636
Warmup Train [25][1600/3239]	Time 0.462 (0.520)	Data 0.001 (0.016)	Loss 4.0831 (4.2669)	Top-1 acc 28.516 (25.965)	Top-5 acc 55.469 (48.575)	lr 0.01636
Warmup Train [25][1610/3239]	Time 0.671 (0.519)	Data 0.001 (0.016)	Loss 4.2695 (4.2671)	Top-1 acc 25.391 (25.963)	Top-5 acc 47.656 (48.564)	lr 0.01635
Warmup Train [25][1620/3239]	Time 0.649 (0.519)	Data 0.001 (0.016)	Loss 4.3467 (4.2669)	Top-1 acc 25.781 (25.970)	Top-5 acc 47.656 (48.566)	lr 0.01635
Warmup Train [25][1630/3239]	Time 0.424 (0.519)	Data 0.001 (0.016)	Loss 4.1817 (4.2668)	Top-1 acc 30.859 (25.975)	Top-5 acc 51.562 (48.577)	lr 0.01634
Warmup Train [25][1640/3239]	Time 0.471 (0.519)	Data 0.001 (0.016)	Loss 4.2305 (4.2666)	Top-1 acc 28.125 (25.977)	Top-5 acc 50.000 (48.583)	lr 0.01634
Warmup Train [25][1650/3239]	Time 0.605 (0.519)	Data 0.001 (0.015)	Loss 4.2244 (4.2667)	Top-1 acc 24.219 (25.978)	Top-5 acc 46.875 (48.582)	lr 0.01633
Warmup Train [25][1660/3239]	Time 0.462 (0.519)	Data 0.001 (0.015)	Loss 4.0872 (4.2667)	Top-1 acc 28.125 (25.975)	Top-5 acc 53.125 (48.584)	lr 0.01632
Warmup Train [25][1670/3239]	Time 0.508 (0.519)	Data 0.001 (0.015)	Loss 4.2875 (4.2666)	Top-1 acc 24.609 (25.974)	Top-5 acc 49.219 (48.590)	lr 0.01632
Warmup Train [25][1680/3239]	Time 0.582 (0.519)	Data 0.001 (0.015)	Loss 4.3494 (4.2664)	Top-1 acc 25.781 (25.975)	Top-5 acc 47.266 (48.597)	lr 0.01631
Warmup Train [25][1690/3239]	Time 0.754 (0.519)	Data 0.001 (0.015)	Loss 3.9108 (4.2667)	Top-1 acc 34.375 (25.973)	Top-5 acc 54.688 (48.587)	lr 0.01631
Warmup Train [25][1700/3239]	Time 0.458 (0.519)	Data 0.001 (0.015)	Loss 4.1342 (4.2667)	Top-1 acc 25.000 (25.975)	Top-5 acc 54.297 (48.591)	lr 0.01630
Warmup Train [25][1710/3239]	Time 0.517 (0.519)	Data 0.001 (0.015)	Loss 4.1314 (4.2666)	Top-1 acc 28.906 (25.975)	Top-5 acc 53.906 (48.588)	lr 0.01630
Warmup Train [25][1720/3239]	Time 0.671 (0.519)	Data 0.001 (0.015)	Loss 4.3334 (4.2663)	Top-1 acc 23.438 (25.975)	Top-5 acc 49.219 (48.600)	lr 0.01629
Warmup Train [25][1730/3239]	Time 0.570 (0.519)	Data 0.001 (0.015)	Loss 4.2224 (4.2662)	Top-1 acc 23.438 (25.975)	Top-5 acc 46.484 (48.605)	lr 0.01628
Warmup Train [25][1740/3239]	Time 0.635 (0.519)	Data 0.001 (0.015)	Loss 4.3202 (4.2661)	Top-1 acc 29.688 (25.978)	Top-5 acc 45.703 (48.605)	lr 0.01628
Warmup Train [25][1750/3239]	Time 0.551 (0.519)	Data 0.001 (0.015)	Loss 4.2884 (4.2664)	Top-1 acc 23.828 (25.971)	Top-5 acc 49.219 (48.605)	lr 0.01627
Warmup Train [25][1760/3239]	Time 0.511 (0.519)	Data 0.001 (0.015)	Loss 4.4375 (4.2665)	Top-1 acc 21.094 (25.966)	Top-5 acc 45.703 (48.604)	lr 0.01627
Warmup Train [25][1770/3239]	Time 0.494 (0.519)	Data 0.001 (0.015)	Loss 4.2666 (4.2666)	Top-1 acc 26.172 (25.967)	Top-5 acc 48.438 (48.601)	lr 0.01626
Warmup Train [25][1780/3239]	Time 0.438 (0.519)	Data 0.001 (0.015)	Loss 4.2311 (4.2666)	Top-1 acc 27.734 (25.968)	Top-5 acc 50.391 (48.601)	lr 0.01626
Warmup Train [25][1790/3239]	Time 0.629 (0.519)	Data 0.001 (0.015)	Loss 4.2644 (4.2663)	Top-1 acc 23.828 (25.973)	Top-5 acc 50.781 (48.606)	lr 0.01625
Warmup Train [25][1800/3239]	Time 0.479 (0.519)	Data 0.001 (0.015)	Loss 4.2410 (4.2660)	Top-1 acc 29.297 (25.975)	Top-5 acc 46.875 (48.611)	lr 0.01624
Warmup Train [25][1810/3239]	Time 0.451 (0.519)	Data 0.001 (0.015)	Loss 3.9912 (4.2655)	Top-1 acc 29.688 (25.987)	Top-5 acc 53.125 (48.619)	lr 0.01624
Warmup Train [25][1820/3239]	Time 0.403 (0.518)	Data 0.001 (0.014)	Loss 4.3530 (4.2657)	Top-1 acc 23.828 (25.988)	Top-5 acc 47.266 (48.616)	lr 0.01623
Warmup Train [25][1830/3239]	Time 0.552 (0.518)	Data 0.001 (0.014)	Loss 4.0464 (4.2659)	Top-1 acc 32.812 (25.989)	Top-5 acc 55.469 (48.612)	lr 0.01623
Warmup Train [25][1840/3239]	Time 0.297 (0.518)	Data 0.001 (0.014)	Loss 4.4184 (4.2662)	Top-1 acc 24.609 (25.984)	Top-5 acc 45.703 (48.609)	lr 0.01622
Warmup Train [25][1850/3239]	Time 0.363 (0.518)	Data 0.001 (0.014)	Loss 4.2369 (4.2662)	Top-1 acc 26.953 (25.983)	Top-5 acc 50.000 (48.611)	lr 0.01622
Warmup Train [25][1860/3239]	Time 0.418 (0.517)	Data 0.001 (0.014)	Loss 4.2219 (4.2662)	Top-1 acc 27.344 (25.979)	Top-5 acc 48.047 (48.608)	lr 0.01621
Warmup Train [25][1870/3239]	Time 0.509 (0.518)	Data 0.001 (0.014)	Loss 4.3792 (4.2662)	Top-1 acc 27.344 (25.984)	Top-5 acc 46.484 (48.610)	lr 0.01621
Warmup Train [25][1880/3239]	Time 0.459 (0.517)	Data 0.001 (0.014)	Loss 4.3329 (4.2662)	Top-1 acc 21.094 (25.983)	Top-5 acc 43.750 (48.607)	lr 0.01620
Warmup Train [25][1890/3239]	Time 0.619 (0.517)	Data 0.001 (0.014)	Loss 4.3668 (4.2663)	Top-1 acc 24.219 (25.975)	Top-5 acc 44.531 (48.602)	lr 0.01619
Warmup Train [25][1900/3239]	Time 0.438 (0.517)	Data 0.001 (0.014)	Loss 4.4626 (4.2662)	Top-1 acc 23.438 (25.972)	Top-5 acc 41.406 (48.596)	lr 0.01619
Warmup Train [25][1910/3239]	Time 0.376 (0.517)	Data 0.001 (0.014)	Loss 4.2207 (4.2660)	Top-1 acc 26.953 (25.978)	Top-5 acc 53.906 (48.600)	lr 0.01618
Warmup Train [25][1920/3239]	Time 0.561 (0.518)	Data 0.001 (0.014)	Loss 4.0832 (4.2662)	Top-1 acc 31.641 (25.978)	Top-5 acc 55.859 (48.600)	lr 0.01618
Warmup Train [25][1930/3239]	Time 0.563 (0.518)	Data 0.001 (0.014)	Loss 4.2734 (4.2660)	Top-1 acc 24.219 (25.983)	Top-5 acc 50.000 (48.605)	lr 0.01617
Warmup Train [25][1940/3239]	Time 0.463 (0.518)	Data 0.001 (0.014)	Loss 4.1435 (4.2659)	Top-1 acc 29.688 (25.985)	Top-5 acc 53.906 (48.609)	lr 0.01617
Warmup Train [25][1950/3239]	Time 0.590 (0.518)	Data 0.001 (0.014)	Loss 4.2088 (4.2659)	Top-1 acc 26.562 (25.984)	Top-5 acc 49.219 (48.604)	lr 0.01616
Warmup Train [25][1960/3239]	Time 0.437 (0.518)	Data 0.001 (0.014)	Loss 4.3235 (4.2656)	Top-1 acc 23.438 (25.991)	Top-5 acc 44.922 (48.614)	lr 0.01615
Warmup Train [25][1970/3239]	Time 0.606 (0.518)	Data 0.001 (0.014)	Loss 4.3701 (4.2659)	Top-1 acc 25.000 (25.995)	Top-5 acc 47.266 (48.608)	lr 0.01615
Warmup Train [25][1980/3239]	Time 0.480 (0.518)	Data 0.001 (0.014)	Loss 4.2501 (4.2659)	Top-1 acc 26.172 (25.995)	Top-5 acc 47.656 (48.605)	lr 0.01614
Warmup Train [25][1990/3239]	Time 0.486 (0.518)	Data 0.001 (0.014)	Loss 4.3165 (4.2661)	Top-1 acc 28.906 (25.992)	Top-5 acc 46.875 (48.599)	lr 0.01614
Warmup Train [25][2000/3239]	Time 0.515 (0.518)	Data 0.001 (0.014)	Loss 4.4397 (4.2663)	Top-1 acc 21.484 (25.991)	Top-5 acc 43.359 (48.593)	lr 0.01613
Warmup Train [25][2010/3239]	Time 0.549 (0.518)	Data 0.001 (0.014)	Loss 4.4278 (4.2664)	Top-1 acc 24.219 (25.987)	Top-5 acc 46.484 (48.591)	lr 0.01613
Warmup Train [25][2020/3239]	Time 0.485 (0.518)	Data 0.001 (0.014)	Loss 4.3620 (4.2666)	Top-1 acc 24.219 (25.982)	Top-5 acc 48.438 (48.588)	lr 0.01612
Warmup Train [25][2030/3239]	Time 0.393 (0.517)	Data 0.001 (0.014)	Loss 4.1833 (4.2668)	Top-1 acc 27.344 (25.981)	Top-5 acc 49.219 (48.583)	lr 0.01611
Warmup Train [25][2040/3239]	Time 0.484 (0.518)	Data 0.001 (0.014)	Loss 4.2843 (4.2668)	Top-1 acc 25.391 (25.986)	Top-5 acc 45.312 (48.584)	lr 0.01611
Warmup Train [25][2050/3239]	Time 0.509 (0.517)	Data 0.001 (0.014)	Loss 4.1617 (4.2667)	Top-1 acc 27.344 (25.987)	Top-5 acc 50.000 (48.587)	lr 0.01610
Warmup Train [25][2060/3239]	Time 0.663 (0.517)	Data 0.001 (0.013)	Loss 4.3568 (4.2668)	Top-1 acc 23.828 (25.988)	Top-5 acc 46.875 (48.587)	lr 0.01610
Warmup Train [25][2070/3239]	Time 0.605 (0.517)	Data 0.001 (0.013)	Loss 4.0919 (4.2665)	Top-1 acc 27.344 (25.995)	Top-5 acc 51.953 (48.593)	lr 0.01609
Warmup Train [25][2080/3239]	Time 0.621 (0.517)	Data 0.001 (0.013)	Loss 4.1928 (4.2666)	Top-1 acc 28.906 (25.997)	Top-5 acc 49.609 (48.588)	lr 0.01609
Warmup Train [25][2090/3239]	Time 0.536 (0.517)	Data 0.001 (0.013)	Loss 4.3291 (4.2666)	Top-1 acc 26.953 (26.000)	Top-5 acc 47.656 (48.590)	lr 0.01608
Warmup Train [25][2100/3239]	Time 0.479 (0.517)	Data 0.001 (0.013)	Loss 4.3294 (4.2667)	Top-1 acc 24.609 (26.001)	Top-5 acc 45.312 (48.590)	lr 0.01607
Warmup Train [25][2110/3239]	Time 0.633 (0.517)	Data 0.001 (0.013)	Loss 4.3699 (4.2668)	Top-1 acc 23.828 (25.998)	Top-5 acc 49.219 (48.591)	lr 0.01607
Warmup Train [25][2120/3239]	Time 0.673 (0.517)	Data 0.001 (0.013)	Loss 4.1929 (4.2665)	Top-1 acc 27.344 (26.006)	Top-5 acc 50.000 (48.596)	lr 0.01606
Warmup Train [25][2130/3239]	Time 0.502 (0.517)	Data 0.001 (0.013)	Loss 4.2926 (4.2664)	Top-1 acc 26.172 (26.007)	Top-5 acc 48.828 (48.600)	lr 0.01606
Warmup Train [25][2140/3239]	Time 0.466 (0.517)	Data 0.001 (0.013)	Loss 4.0954 (4.2663)	Top-1 acc 32.031 (26.013)	Top-5 acc 53.125 (48.607)	lr 0.01605
Warmup Train [25][2150/3239]	Time 0.535 (0.517)	Data 0.001 (0.013)	Loss 4.2568 (4.2662)	Top-1 acc 28.516 (26.018)	Top-5 acc 50.781 (48.615)	lr 0.01605
Warmup Train [25][2160/3239]	Time 0.659 (0.517)	Data 0.001 (0.013)	Loss 4.2683 (4.2663)	Top-1 acc 26.953 (26.016)	Top-5 acc 48.047 (48.613)	lr 0.01604
Warmup Train [25][2170/3239]	Time 0.552 (0.517)	Data 0.001 (0.013)	Loss 4.2566 (4.2662)	Top-1 acc 27.734 (26.019)	Top-5 acc 48.047 (48.613)	lr 0.01604
Warmup Train [25][2180/3239]	Time 0.400 (0.517)	Data 0.001 (0.013)	Loss 4.0242 (4.2662)	Top-1 acc 32.812 (26.021)	Top-5 acc 51.562 (48.614)	lr 0.01603
Warmup Train [25][2190/3239]	Time 0.484 (0.517)	Data 0.001 (0.013)	Loss 4.2809 (4.2666)	Top-1 acc 26.562 (26.018)	Top-5 acc 47.656 (48.604)	lr 0.01602
Warmup Train [25][2200/3239]	Time 0.336 (0.517)	Data 0.001 (0.013)	Loss 4.0081 (4.2663)	Top-1 acc 26.562 (26.014)	Top-5 acc 54.297 (48.615)	lr 0.01602
Warmup Train [25][2210/3239]	Time 0.631 (0.517)	Data 0.001 (0.013)	Loss 4.2965 (4.2663)	Top-1 acc 25.391 (26.015)	Top-5 acc 48.438 (48.617)	lr 0.01601
Warmup Train [25][2220/3239]	Time 0.529 (0.517)	Data 0.001 (0.013)	Loss 4.1447 (4.2663)	Top-1 acc 30.469 (26.015)	Top-5 acc 53.906 (48.617)	lr 0.01601
Warmup Train [25][2230/3239]	Time 0.305 (0.517)	Data 0.003 (0.013)	Loss 4.2779 (4.2662)	Top-1 acc 24.219 (26.016)	Top-5 acc 48.047 (48.616)	lr 0.01600
Warmup Train [25][2240/3239]	Time 0.514 (0.517)	Data 0.001 (0.013)	Loss 4.5263 (4.2665)	Top-1 acc 21.875 (26.015)	Top-5 acc 46.484 (48.612)	lr 0.01600
Warmup Train [25][2250/3239]	Time 0.535 (0.517)	Data 0.001 (0.013)	Loss 4.1922 (4.2665)	Top-1 acc 28.125 (26.014)	Top-5 acc 48.438 (48.610)	lr 0.01599
Warmup Train [25][2260/3239]	Time 0.441 (0.517)	Data 0.002 (0.013)	Loss 4.1968 (4.2666)	Top-1 acc 26.562 (26.013)	Top-5 acc 50.000 (48.608)	lr 0.01598
Warmup Train [25][2270/3239]	Time 0.511 (0.517)	Data 0.002 (0.013)	Loss 4.1522 (4.2665)	Top-1 acc 24.609 (26.011)	Top-5 acc 48.047 (48.609)	lr 0.01598
Warmup Train [25][2280/3239]	Time 0.368 (0.517)	Data 0.001 (0.013)	Loss 4.1427 (4.2666)	Top-1 acc 30.859 (26.011)	Top-5 acc 50.000 (48.607)	lr 0.01597
Warmup Train [25][2290/3239]	Time 0.286 (0.517)	Data 0.001 (0.013)	Loss 4.2395 (4.2665)	Top-1 acc 27.344 (26.008)	Top-5 acc 50.391 (48.605)	lr 0.01597
Warmup Train [25][2300/3239]	Time 0.492 (0.517)	Data 0.001 (0.013)	Loss 4.2923 (4.2667)	Top-1 acc 30.078 (26.007)	Top-5 acc 45.703 (48.605)	lr 0.01596
Warmup Train [25][2310/3239]	Time 0.452 (0.517)	Data 0.001 (0.013)	Loss 4.1213 (4.2666)	Top-1 acc 29.297 (26.008)	Top-5 acc 49.609 (48.605)	lr 0.01596
Warmup Train [25][2320/3239]	Time 0.385 (0.517)	Data 0.001 (0.013)	Loss 4.3063 (4.2664)	Top-1 acc 24.609 (26.009)	Top-5 acc 49.219 (48.608)	lr 0.01595
Warmup Train [25][2330/3239]	Time 0.534 (0.517)	Data 0.001 (0.013)	Loss 4.3367 (4.2663)	Top-1 acc 26.172 (26.010)	Top-5 acc 48.047 (48.609)	lr 0.01594
Warmup Train [25][2340/3239]	Time 0.430 (0.516)	Data 0.001 (0.013)	Loss 4.4090 (4.2665)	Top-1 acc 25.391 (26.010)	Top-5 acc 45.312 (48.608)	lr 0.01594
Warmup Train [25][2350/3239]	Time 0.532 (0.516)	Data 0.001 (0.013)	Loss 4.2152 (4.2665)	Top-1 acc 26.562 (26.009)	Top-5 acc 50.781 (48.605)	lr 0.01593
Warmup Train [25][2360/3239]	Time 0.616 (0.516)	Data 0.001 (0.013)	Loss 4.1391 (4.2666)	Top-1 acc 23.828 (26.005)	Top-5 acc 50.781 (48.598)	lr 0.01593
Warmup Train [25][2370/3239]	Time 0.633 (0.516)	Data 0.001 (0.013)	Loss 4.2494 (4.2668)	Top-1 acc 26.953 (26.001)	Top-5 acc 48.047 (48.593)	lr 0.01592
Warmup Train [25][2380/3239]	Time 0.684 (0.516)	Data 0.001 (0.013)	Loss 4.2647 (4.2666)	Top-1 acc 30.469 (26.010)	Top-5 acc 48.047 (48.598)	lr 0.01592
Warmup Train [25][2390/3239]	Time 0.642 (0.516)	Data 0.001 (0.013)	Loss 4.1733 (4.2666)	Top-1 acc 27.344 (26.010)	Top-5 acc 48.828 (48.596)	lr 0.01591
Warmup Train [25][2400/3239]	Time 0.506 (0.516)	Data 0.001 (0.013)	Loss 4.3949 (4.2668)	Top-1 acc 24.609 (26.008)	Top-5 acc 47.266 (48.589)	lr 0.01591
Warmup Train [25][2410/3239]	Time 0.477 (0.516)	Data 0.001 (0.013)	Loss 4.2912 (4.2666)	Top-1 acc 28.516 (26.012)	Top-5 acc 48.828 (48.594)	lr 0.01590
Warmup Train [25][2420/3239]	Time 0.488 (0.516)	Data 0.001 (0.013)	Loss 4.1606 (4.2666)	Top-1 acc 30.078 (26.013)	Top-5 acc 50.781 (48.589)	lr 0.01589
Warmup Train [25][2430/3239]	Time 0.392 (0.516)	Data 0.001 (0.013)	Loss 4.2173 (4.2664)	Top-1 acc 23.047 (26.013)	Top-5 acc 50.391 (48.592)	lr 0.01589
Warmup Train [25][2440/3239]	Time 0.496 (0.516)	Data 0.001 (0.013)	Loss 4.4013 (4.2664)	Top-1 acc 23.047 (26.015)	Top-5 acc 46.875 (48.598)	lr 0.01588
Warmup Train [25][2450/3239]	Time 0.432 (0.516)	Data 0.001 (0.013)	Loss 4.3372 (4.2662)	Top-1 acc 23.438 (26.019)	Top-5 acc 50.781 (48.604)	lr 0.01588
Warmup Train [25][2460/3239]	Time 0.628 (0.516)	Data 0.001 (0.012)	Loss 4.1899 (4.2662)	Top-1 acc 25.391 (26.016)	Top-5 acc 49.219 (48.603)	lr 0.01587
Warmup Train [25][2470/3239]	Time 0.443 (0.516)	Data 0.001 (0.012)	Loss 4.3910 (4.2662)	Top-1 acc 21.875 (26.015)	Top-5 acc 45.703 (48.601)	lr 0.01587
Warmup Train [25][2480/3239]	Time 0.630 (0.516)	Data 0.001 (0.012)	Loss 4.4009 (4.2662)	Top-1 acc 23.438 (26.014)	Top-5 acc 43.750 (48.604)	lr 0.01586
Warmup Train [25][2490/3239]	Time 0.515 (0.516)	Data 0.001 (0.012)	Loss 4.3179 (4.2664)	Top-1 acc 23.438 (26.011)	Top-5 acc 45.312 (48.597)	lr 0.01585
Warmup Train [25][2500/3239]	Time 0.420 (0.516)	Data 0.001 (0.012)	Loss 4.2050 (4.2661)	Top-1 acc 30.078 (26.017)	Top-5 acc 50.000 (48.604)	lr 0.01585
Warmup Train [25][2510/3239]	Time 0.466 (0.516)	Data 0.001 (0.012)	Loss 4.3048 (4.2660)	Top-1 acc 26.172 (26.022)	Top-5 acc 47.656 (48.606)	lr 0.01584
Warmup Train [25][2520/3239]	Time 0.530 (0.516)	Data 0.001 (0.012)	Loss 4.3017 (4.2658)	Top-1 acc 23.047 (26.025)	Top-5 acc 46.875 (48.612)	lr 0.01584
Warmup Train [25][2530/3239]	Time 0.512 (0.516)	Data 0.001 (0.012)	Loss 4.4094 (4.2657)	Top-1 acc 25.781 (26.024)	Top-5 acc 46.875 (48.610)	lr 0.01583
Warmup Train [25][2540/3239]	Time 0.144 (0.516)	Data 0.001 (0.012)	Loss 4.2787 (4.2656)	Top-1 acc 26.172 (26.027)	Top-5 acc 49.609 (48.612)	lr 0.01583
Warmup Train [25][2550/3239]	Time 0.579 (0.516)	Data 0.001 (0.012)	Loss 4.2163 (4.2658)	Top-1 acc 25.781 (26.020)	Top-5 acc 51.172 (48.605)	lr 0.01582
Warmup Train [25][2560/3239]	Time 0.510 (0.516)	Data 0.001 (0.012)	Loss 4.1998 (4.2657)	Top-1 acc 28.906 (26.025)	Top-5 acc 51.172 (48.607)	lr 0.01581
Warmup Train [25][2570/3239]	Time 0.458 (0.516)	Data 0.001 (0.012)	Loss 4.1845 (4.2657)	Top-1 acc 27.734 (26.024)	Top-5 acc 50.391 (48.609)	lr 0.01581
Warmup Train [25][2580/3239]	Time 0.427 (0.516)	Data 0.001 (0.012)	Loss 4.3149 (4.2657)	Top-1 acc 25.000 (26.027)	Top-5 acc 47.266 (48.609)	lr 0.01580
Warmup Train [25][2590/3239]	Time 0.370 (0.516)	Data 0.001 (0.012)	Loss 4.1061 (4.2655)	Top-1 acc 25.781 (26.024)	Top-5 acc 53.125 (48.612)	lr 0.01580
Warmup Train [25][2600/3239]	Time 0.536 (0.516)	Data 0.001 (0.012)	Loss 4.1618 (4.2654)	Top-1 acc 26.953 (26.027)	Top-5 acc 48.047 (48.611)	lr 0.01579
Warmup Train [25][2610/3239]	Time 0.410 (0.516)	Data 0.001 (0.012)	Loss 4.4014 (4.2653)	Top-1 acc 23.438 (26.024)	Top-5 acc 46.094 (48.613)	lr 0.01579
Warmup Train [25][2620/3239]	Time 0.447 (0.516)	Data 0.001 (0.012)	Loss 4.1659 (4.2651)	Top-1 acc 29.688 (26.024)	Top-5 acc 51.562 (48.616)	lr 0.01578
Warmup Train [25][2630/3239]	Time 0.566 (0.516)	Data 0.001 (0.012)	Loss 4.1592 (4.2651)	Top-1 acc 24.609 (26.025)	Top-5 acc 47.656 (48.618)	lr 0.01578
Warmup Train [25][2640/3239]	Time 0.642 (0.516)	Data 0.001 (0.012)	Loss 4.3753 (4.2652)	Top-1 acc 26.562 (26.024)	Top-5 acc 47.266 (48.618)	lr 0.01577
Warmup Train [25][2650/3239]	Time 0.383 (0.516)	Data 0.001 (0.012)	Loss 4.4087 (4.2653)	Top-1 acc 24.219 (26.025)	Top-5 acc 43.359 (48.612)	lr 0.01576
Warmup Train [25][2660/3239]	Time 0.604 (0.516)	Data 0.001 (0.012)	Loss 4.2344 (4.2652)	Top-1 acc 27.344 (26.028)	Top-5 acc 49.609 (48.615)	lr 0.01576
Warmup Train [25][2670/3239]	Time 0.509 (0.516)	Data 0.001 (0.012)	Loss 4.0719 (4.2652)	Top-1 acc 26.172 (26.027)	Top-5 acc 52.734 (48.614)	lr 0.01575
Warmup Train [25][2680/3239]	Time 0.442 (0.516)	Data 0.001 (0.012)	Loss 4.3748 (4.2652)	Top-1 acc 26.953 (26.034)	Top-5 acc 44.141 (48.614)	lr 0.01575
Warmup Train [25][2690/3239]	Time 0.466 (0.516)	Data 0.001 (0.012)	Loss 4.0727 (4.2650)	Top-1 acc 26.172 (26.036)	Top-5 acc 55.078 (48.617)	lr 0.01574
Warmup Train [25][2700/3239]	Time 0.683 (0.516)	Data 0.001 (0.012)	Loss 4.2442 (4.2652)	Top-1 acc 28.125 (26.035)	Top-5 acc 48.438 (48.611)	lr 0.01574
Warmup Train [25][2710/3239]	Time 0.587 (0.516)	Data 0.001 (0.012)	Loss 4.2741 (4.2652)	Top-1 acc 23.438 (26.035)	Top-5 acc 51.172 (48.616)	lr 0.01573
Warmup Train [25][2720/3239]	Time 0.638 (0.516)	Data 0.001 (0.012)	Loss 4.4641 (4.2651)	Top-1 acc 24.219 (26.038)	Top-5 acc 44.922 (48.616)	lr 0.01572
Warmup Train [25][2730/3239]	Time 0.502 (0.516)	Data 0.001 (0.012)	Loss 4.1844 (4.2652)	Top-1 acc 26.953 (26.035)	Top-5 acc 50.781 (48.616)	lr 0.01572
Warmup Train [25][2740/3239]	Time 0.522 (0.516)	Data 0.001 (0.012)	Loss 4.2098 (4.2651)	Top-1 acc 25.000 (26.037)	Top-5 acc 46.875 (48.621)	lr 0.01571
Warmup Train [25][2750/3239]	Time 0.642 (0.516)	Data 0.001 (0.012)	Loss 4.2987 (4.2649)	Top-1 acc 28.516 (26.041)	Top-5 acc 45.703 (48.625)	lr 0.01571
Warmup Train [25][2760/3239]	Time 0.494 (0.516)	Data 0.001 (0.012)	Loss 4.2725 (4.2650)	Top-1 acc 25.781 (26.040)	Top-5 acc 53.125 (48.627)	lr 0.01570
Warmup Train [25][2770/3239]	Time 0.487 (0.516)	Data 0.001 (0.012)	Loss 4.2570 (4.2650)	Top-1 acc 27.734 (26.042)	Top-5 acc 50.781 (48.627)	lr 0.01570
Warmup Train [25][2780/3239]	Time 0.358 (0.516)	Data 0.001 (0.012)	Loss 4.3933 (4.2649)	Top-1 acc 22.266 (26.042)	Top-5 acc 46.875 (48.629)	lr 0.01569
Warmup Train [25][2790/3239]	Time 0.478 (0.515)	Data 0.001 (0.012)	Loss 4.3200 (4.2647)	Top-1 acc 28.125 (26.044)	Top-5 acc 48.438 (48.632)	lr 0.01569
Warmup Train [25][2800/3239]	Time 0.412 (0.515)	Data 0.001 (0.012)	Loss 4.2890 (4.2649)	Top-1 acc 27.734 (26.042)	Top-5 acc 50.781 (48.626)	lr 0.01568
Warmup Train [25][2810/3239]	Time 0.301 (0.515)	Data 0.001 (0.012)	Loss 4.0812 (4.2648)	Top-1 acc 27.734 (26.045)	Top-5 acc 52.344 (48.629)	lr 0.01567
Warmup Train [25][2820/3239]	Time 0.413 (0.515)	Data 0.001 (0.012)	Loss 4.2463 (4.2648)	Top-1 acc 25.000 (26.043)	Top-5 acc 47.266 (48.625)	lr 0.01567
Warmup Train [25][2830/3239]	Time 0.663 (0.515)	Data 0.001 (0.012)	Loss 4.1694 (4.2651)	Top-1 acc 33.984 (26.041)	Top-5 acc 52.734 (48.619)	lr 0.01566
Warmup Train [25][2840/3239]	Time 0.415 (0.515)	Data 0.001 (0.012)	Loss 4.1411 (4.2650)	Top-1 acc 27.344 (26.043)	Top-5 acc 52.344 (48.621)	lr 0.01566
Warmup Train [25][2850/3239]	Time 0.574 (0.515)	Data 0.001 (0.012)	Loss 4.3272 (4.2652)	Top-1 acc 25.391 (26.035)	Top-5 acc 46.484 (48.615)	lr 0.01565
Warmup Train [25][2860/3239]	Time 0.551 (0.515)	Data 0.001 (0.012)	Loss 4.0802 (4.2651)	Top-1 acc 27.344 (26.036)	Top-5 acc 49.609 (48.616)	lr 0.01565
Warmup Train [25][2870/3239]	Time 0.505 (0.515)	Data 0.001 (0.012)	Loss 4.0810 (4.2647)	Top-1 acc 26.172 (26.042)	Top-5 acc 53.906 (48.627)	lr 0.01564
Warmup Train [25][2880/3239]	Time 0.507 (0.515)	Data 0.001 (0.012)	Loss 4.2097 (4.2645)	Top-1 acc 26.562 (26.046)	Top-5 acc 46.875 (48.636)	lr 0.01563
Warmup Train [25][2890/3239]	Time 0.486 (0.515)	Data 0.001 (0.012)	Loss 4.1962 (4.2643)	Top-1 acc 25.391 (26.051)	Top-5 acc 48.828 (48.642)	lr 0.01563
Warmup Train [25][2900/3239]	Time 0.690 (0.515)	Data 0.001 (0.012)	Loss 4.1872 (4.2641)	Top-1 acc 26.953 (26.050)	Top-5 acc 49.219 (48.645)	lr 0.01562
Warmup Train [25][2910/3239]	Time 0.564 (0.515)	Data 0.001 (0.012)	Loss 4.2782 (4.2637)	Top-1 acc 26.172 (26.060)	Top-5 acc 47.266 (48.652)	lr 0.01562
Warmup Train [25][2920/3239]	Time 0.482 (0.515)	Data 0.002 (0.012)	Loss 4.3843 (4.2638)	Top-1 acc 28.906 (26.064)	Top-5 acc 46.484 (48.649)	lr 0.01561
Warmup Train [25][2930/3239]	Time 0.368 (0.515)	Data 0.001 (0.012)	Loss 4.1378 (4.2637)	Top-1 acc 25.781 (26.063)	Top-5 acc 49.219 (48.651)	lr 0.01561
Warmup Train [25][2940/3239]	Time 0.635 (0.515)	Data 0.001 (0.012)	Loss 4.2265 (4.2637)	Top-1 acc 27.344 (26.066)	Top-5 acc 50.781 (48.653)	lr 0.01560
Warmup Train [25][2950/3239]	Time 0.373 (0.515)	Data 0.001 (0.012)	Loss 4.2521 (4.2638)	Top-1 acc 24.219 (26.061)	Top-5 acc 48.828 (48.648)	lr 0.01560
Warmup Train [25][2960/3239]	Time 0.592 (0.515)	Data 0.001 (0.012)	Loss 4.2369 (4.2637)	Top-1 acc 24.219 (26.059)	Top-5 acc 49.609 (48.649)	lr 0.01559
Warmup Train [25][2970/3239]	Time 0.448 (0.515)	Data 0.001 (0.012)	Loss 3.9847 (4.2637)	Top-1 acc 30.859 (26.059)	Top-5 acc 56.250 (48.650)	lr 0.01558
Warmup Train [25][2980/3239]	Time 0.565 (0.515)	Data 0.001 (0.012)	Loss 4.2214 (4.2635)	Top-1 acc 27.734 (26.060)	Top-5 acc 51.953 (48.652)	lr 0.01558
Warmup Train [25][2990/3239]	Time 0.544 (0.515)	Data 0.001 (0.012)	Loss 4.2786 (4.2636)	Top-1 acc 24.609 (26.058)	Top-5 acc 44.531 (48.648)	lr 0.01557
Warmup Train [25][3000/3239]	Time 0.567 (0.515)	Data 0.001 (0.012)	Loss 4.4966 (4.2637)	Top-1 acc 20.312 (26.055)	Top-5 acc 44.141 (48.647)	lr 0.01557
Warmup Train [25][3010/3239]	Time 0.579 (0.515)	Data 0.001 (0.012)	Loss 4.0839 (4.2638)	Top-1 acc 29.688 (26.053)	Top-5 acc 54.688 (48.643)	lr 0.01556
Warmup Train [25][3020/3239]	Time 0.505 (0.515)	Data 0.001 (0.012)	Loss 4.1764 (4.2638)	Top-1 acc 27.344 (26.053)	Top-5 acc 48.047 (48.642)	lr 0.01556
Warmup Train [25][3030/3239]	Time 0.605 (0.515)	Data 0.001 (0.012)	Loss 4.1988 (4.2636)	Top-1 acc 27.344 (26.054)	Top-5 acc 50.000 (48.648)	lr 0.01555
Warmup Train [25][3040/3239]	Time 0.496 (0.515)	Data 0.001 (0.011)	Loss 4.3298 (4.2635)	Top-1 acc 26.562 (26.061)	Top-5 acc 47.266 (48.654)	lr 0.01555
Warmup Train [25][3050/3239]	Time 0.506 (0.515)	Data 0.001 (0.011)	Loss 4.2077 (4.2637)	Top-1 acc 30.078 (26.057)	Top-5 acc 49.609 (48.648)	lr 0.01554
Warmup Train [25][3060/3239]	Time 0.446 (0.515)	Data 0.001 (0.011)	Loss 4.2400 (4.2636)	Top-1 acc 26.953 (26.058)	Top-5 acc 52.344 (48.652)	lr 0.01553
Warmup Train [25][3070/3239]	Time 0.548 (0.515)	Data 0.001 (0.011)	Loss 4.2372 (4.2635)	Top-1 acc 26.562 (26.061)	Top-5 acc 50.781 (48.654)	lr 0.01553
Warmup Train [25][3080/3239]	Time 0.554 (0.515)	Data 0.001 (0.011)	Loss 4.1231 (4.2633)	Top-1 acc 28.516 (26.067)	Top-5 acc 53.516 (48.660)	lr 0.01552
Warmup Train [25][3090/3239]	Time 0.531 (0.515)	Data 0.001 (0.011)	Loss 4.3680 (4.2633)	Top-1 acc 23.438 (26.066)	Top-5 acc 45.703 (48.659)	lr 0.01552
Warmup Train [25][3100/3239]	Time 0.558 (0.515)	Data 0.001 (0.011)	Loss 4.3739 (4.2631)	Top-1 acc 26.562 (26.075)	Top-5 acc 46.875 (48.662)	lr 0.01551
Warmup Train [25][3110/3239]	Time 0.542 (0.515)	Data 0.001 (0.011)	Loss 4.1668 (4.2630)	Top-1 acc 26.562 (26.082)	Top-5 acc 52.344 (48.666)	lr 0.01551
Warmup Train [25][3120/3239]	Time 0.510 (0.515)	Data 0.001 (0.011)	Loss 4.3854 (4.2631)	Top-1 acc 24.219 (26.082)	Top-5 acc 46.875 (48.663)	lr 0.01550
Warmup Train [25][3130/3239]	Time 0.596 (0.515)	Data 0.001 (0.011)	Loss 4.1736 (4.2631)	Top-1 acc 31.250 (26.081)	Top-5 acc 50.391 (48.663)	lr 0.01549
Warmup Train [25][3140/3239]	Time 0.494 (0.515)	Data 0.001 (0.011)	Loss 4.3251 (4.2632)	Top-1 acc 24.219 (26.083)	Top-5 acc 45.312 (48.663)	lr 0.01549
Warmup Train [25][3150/3239]	Time 0.490 (0.515)	Data 0.001 (0.011)	Loss 4.4021 (4.2631)	Top-1 acc 23.828 (26.081)	Top-5 acc 42.578 (48.660)	lr 0.01548
Warmup Train [25][3160/3239]	Time 0.529 (0.515)	Data 0.001 (0.011)	Loss 4.1195 (4.2633)	Top-1 acc 32.422 (26.079)	Top-5 acc 49.219 (48.658)	lr 0.01548
Warmup Train [25][3170/3239]	Time 0.482 (0.515)	Data 0.001 (0.011)	Loss 4.3334 (4.2632)	Top-1 acc 28.125 (26.082)	Top-5 acc 48.438 (48.657)	lr 0.01547
Warmup Train [25][3180/3239]	Time 0.327 (0.515)	Data 0.000 (0.011)	Loss 4.3925 (4.2630)	Top-1 acc 25.000 (26.086)	Top-5 acc 44.531 (48.664)	lr 0.01547
Warmup Train [25][3190/3239]	Time 0.485 (0.515)	Data 0.000 (0.011)	Loss 4.1406 (4.2628)	Top-1 acc 30.078 (26.095)	Top-5 acc 49.609 (48.667)	lr 0.01546
Warmup Train [25][3200/3239]	Time 0.564 (0.514)	Data 0.000 (0.011)	Loss 4.2291 (4.2628)	Top-1 acc 28.125 (26.096)	Top-5 acc 50.000 (48.669)	lr 0.01546
Warmup Train [25][3210/3239]	Time 0.663 (0.514)	Data 0.000 (0.011)	Loss 4.1422 (4.2625)	Top-1 acc 28.125 (26.102)	Top-5 acc 51.562 (48.674)	lr 0.01545
Warmup Train [25][3220/3239]	Time 0.489 (0.514)	Data 0.000 (0.011)	Loss 4.1975 (4.2623)	Top-1 acc 28.516 (26.106)	Top-5 acc 50.391 (48.677)	lr 0.01544
Warmup Train [25][3230/3239]	Time 0.481 (0.514)	Data 0.000 (0.011)	Loss 4.1301 (4.2622)	Top-1 acc 29.688 (26.108)	Top-5 acc 51.562 (48.677)	lr 0.01544
Warmup Train [25][3239/3239]	Time 0.320 (0.514)	Data 0.000 (0.011)	Loss 4.3514 (4.2622)	Top-1 acc 28.395 (26.108)	Top-5 acc 43.210 (48.677)	lr 0.01543
==========Warmup Valid [25/40]	loss 3.215	top-1 acc 33.831	top-5 acc 58.409	Train top-1 26.108	top-5 48.677	flops: 442.4M
Warmup Train [26][0/3239]	Time 12.693 (12.693)	Data 11.198 (11.198)	Loss 4.0851 (4.0851)	Top-1 acc 30.859 (30.859)	Top-5 acc 53.906 (53.906)	lr 0.01543
Warmup Train [26][10/3239]	Time 0.535 (1.737)	Data 0.001 (1.064)	Loss 4.0426 (4.1750)	Top-1 acc 30.859 (27.273)	Top-5 acc 52.734 (50.497)	lr 0.01543
Warmup Train [26][20/3239]	Time 0.418 (1.152)	Data 0.004 (0.558)	Loss 4.2124 (4.2119)	Top-1 acc 27.344 (26.581)	Top-5 acc 47.266 (49.814)	lr 0.01542
Warmup Train [26][30/3239]	Time 0.655 (0.955)	Data 0.001 (0.385)	Loss 4.2518 (4.2226)	Top-1 acc 29.297 (26.865)	Top-5 acc 51.172 (49.622)	lr 0.01542
Warmup Train [26][40/3239]	Time 0.518 (0.841)	Data 0.001 (0.292)	Loss 4.3388 (4.2372)	Top-1 acc 25.781 (26.267)	Top-5 acc 46.094 (49.352)	lr 0.01541
Warmup Train [26][50/3239]	Time 0.489 (0.778)	Data 0.001 (0.237)	Loss 4.1582 (4.2318)	Top-1 acc 28.125 (26.517)	Top-5 acc 52.344 (49.609)	lr 0.01540
Warmup Train [26][60/3239]	Time 0.584 (0.736)	Data 0.027 (0.199)	Loss 4.0568 (4.2252)	Top-1 acc 30.469 (26.684)	Top-5 acc 55.078 (49.782)	lr 0.01540
Warmup Train [26][70/3239]	Time 0.648 (0.707)	Data 0.001 (0.171)	Loss 4.2836 (4.2254)	Top-1 acc 23.047 (26.596)	Top-5 acc 51.172 (49.758)	lr 0.01539
Warmup Train [26][80/3239]	Time 0.568 (0.683)	Data 0.001 (0.150)	Loss 4.3355 (4.2221)	Top-1 acc 23.828 (26.673)	Top-5 acc 50.391 (49.904)	lr 0.01539
Warmup Train [26][90/3239]	Time 0.509 (0.664)	Data 0.001 (0.134)	Loss 4.2980 (4.2270)	Top-1 acc 23.828 (26.627)	Top-5 acc 48.047 (49.764)	lr 0.01538
Warmup Train [26][100/3239]	Time 0.531 (0.647)	Data 0.001 (0.121)	Loss 4.1204 (4.2201)	Top-1 acc 27.344 (26.698)	Top-5 acc 51.172 (49.818)	lr 0.01538
Warmup Train [26][110/3239]	Time 0.438 (0.635)	Data 0.001 (0.111)	Loss 4.2459 (4.2189)	Top-1 acc 23.047 (26.612)	Top-5 acc 50.391 (49.799)	lr 0.01537
Warmup Train [26][120/3239]	Time 0.309 (0.622)	Data 0.001 (0.102)	Loss 4.1458 (4.2177)	Top-1 acc 28.906 (26.701)	Top-5 acc 53.906 (49.806)	lr 0.01537
Warmup Train [26][130/3239]	Time 0.565 (0.613)	Data 0.001 (0.096)	Loss 4.1081 (4.2224)	Top-1 acc 34.375 (26.673)	Top-5 acc 52.734 (49.645)	lr 0.01536
Warmup Train [26][140/3239]	Time 0.505 (0.605)	Data 0.001 (0.089)	Loss 4.0656 (4.2201)	Top-1 acc 27.734 (26.684)	Top-5 acc 55.469 (49.692)	lr 0.01535
Warmup Train [26][150/3239]	Time 0.497 (0.596)	Data 0.001 (0.083)	Loss 4.0770 (4.2193)	Top-1 acc 32.031 (26.713)	Top-5 acc 53.125 (49.687)	lr 0.01535
Warmup Train [26][160/3239]	Time 0.507 (0.591)	Data 0.001 (0.079)	Loss 4.2332 (4.2215)	Top-1 acc 24.219 (26.664)	Top-5 acc 48.828 (49.624)	lr 0.01534
Warmup Train [26][170/3239]	Time 0.607 (0.586)	Data 0.001 (0.074)	Loss 4.2782 (4.2210)	Top-1 acc 28.125 (26.764)	Top-5 acc 47.656 (49.614)	lr 0.01534
Warmup Train [26][180/3239]	Time 0.664 (0.583)	Data 0.001 (0.070)	Loss 4.2877 (4.2206)	Top-1 acc 26.953 (26.817)	Top-5 acc 48.828 (49.650)	lr 0.01533
Warmup Train [26][190/3239]	Time 0.496 (0.579)	Data 0.001 (0.067)	Loss 4.2267 (4.2231)	Top-1 acc 27.734 (26.787)	Top-5 acc 51.172 (49.575)	lr 0.01533
Warmup Train [26][200/3239]	Time 0.571 (0.577)	Data 0.001 (0.064)	Loss 4.3236 (4.2205)	Top-1 acc 24.609 (26.846)	Top-5 acc 41.406 (49.567)	lr 0.01532
Warmup Train [26][210/3239]	Time 0.542 (0.573)	Data 0.001 (0.061)	Loss 4.1037 (4.2210)	Top-1 acc 28.906 (26.827)	Top-5 acc 51.953 (49.576)	lr 0.01532
Warmup Train [26][220/3239]	Time 0.489 (0.570)	Data 0.001 (0.058)	Loss 4.0488 (4.2200)	Top-1 acc 27.344 (26.831)	Top-5 acc 53.125 (49.595)	lr 0.01531
Warmup Train [26][230/3239]	Time 0.422 (0.568)	Data 0.001 (0.056)	Loss 4.3413 (4.2219)	Top-1 acc 23.047 (26.789)	Top-5 acc 47.266 (49.530)	lr 0.01530
Warmup Train [26][240/3239]	Time 0.356 (0.566)	Data 0.001 (0.054)	Loss 4.1820 (4.2231)	Top-1 acc 29.688 (26.809)	Top-5 acc 53.516 (49.523)	lr 0.01530
Warmup Train [26][250/3239]	Time 0.419 (0.563)	Data 0.001 (0.052)	Loss 4.3489 (4.2264)	Top-1 acc 26.172 (26.734)	Top-5 acc 50.391 (49.499)	lr 0.01529
Warmup Train [26][260/3239]	Time 0.462 (0.561)	Data 0.001 (0.051)	Loss 4.2619 (4.2263)	Top-1 acc 26.562 (26.718)	Top-5 acc 46.484 (49.457)	lr 0.01529
Warmup Train [26][270/3239]	Time 0.413 (0.560)	Data 0.001 (0.049)	Loss 4.3165 (4.2280)	Top-1 acc 25.391 (26.675)	Top-5 acc 50.000 (49.406)	lr 0.01528
Warmup Train [26][280/3239]	Time 0.515 (0.559)	Data 0.001 (0.048)	Loss 4.2002 (4.2266)	Top-1 acc 25.781 (26.704)	Top-5 acc 52.344 (49.448)	lr 0.01528
Warmup Train [26][290/3239]	Time 0.690 (0.558)	Data 0.001 (0.046)	Loss 4.1316 (4.2274)	Top-1 acc 32.422 (26.710)	Top-5 acc 50.000 (49.403)	lr 0.01527
Warmup Train [26][300/3239]	Time 0.406 (0.556)	Data 0.001 (0.045)	Loss 4.2796 (4.2274)	Top-1 acc 24.219 (26.723)	Top-5 acc 48.438 (49.435)	lr 0.01527
Warmup Train [26][310/3239]	Time 0.484 (0.555)	Data 0.001 (0.043)	Loss 4.3723 (4.2257)	Top-1 acc 21.094 (26.747)	Top-5 acc 46.484 (49.461)	lr 0.01526
Warmup Train [26][320/3239]	Time 0.552 (0.554)	Data 0.001 (0.042)	Loss 4.3725 (4.2243)	Top-1 acc 24.219 (26.758)	Top-5 acc 46.484 (49.500)	lr 0.01525
Warmup Train [26][330/3239]	Time 0.444 (0.553)	Data 0.001 (0.041)	Loss 4.2582 (4.2226)	Top-1 acc 23.828 (26.788)	Top-5 acc 48.047 (49.517)	lr 0.01525
Warmup Train [26][340/3239]	Time 0.603 (0.553)	Data 0.001 (0.040)	Loss 4.2837 (4.2234)	Top-1 acc 24.609 (26.771)	Top-5 acc 49.609 (49.507)	lr 0.01524
Warmup Train [26][350/3239]	Time 0.825 (0.552)	Data 0.001 (0.039)	Loss 4.3126 (4.2263)	Top-1 acc 26.172 (26.707)	Top-5 acc 49.609 (49.460)	lr 0.01524
Warmup Train [26][360/3239]	Time 0.533 (0.551)	Data 0.001 (0.038)	Loss 4.2917 (4.2261)	Top-1 acc 28.906 (26.695)	Top-5 acc 49.219 (49.470)	lr 0.01523
Warmup Train [26][370/3239]	Time 0.710 (0.549)	Data 0.001 (0.037)	Loss 4.3156 (4.2270)	Top-1 acc 22.266 (26.657)	Top-5 acc 45.703 (49.451)	lr 0.01523
Warmup Train [26][380/3239]	Time 0.545 (0.548)	Data 0.001 (0.036)	Loss 4.2560 (4.2281)	Top-1 acc 32.422 (26.671)	Top-5 acc 55.469 (49.432)	lr 0.01522
Warmup Train [26][390/3239]	Time 0.183 (0.545)	Data 0.002 (0.035)	Loss 4.3726 (4.2295)	Top-1 acc 24.609 (26.629)	Top-5 acc 46.094 (49.389)	lr 0.01521
Warmup Train [26][400/3239]	Time 0.587 (0.545)	Data 0.001 (0.035)	Loss 4.2329 (4.2286)	Top-1 acc 25.391 (26.634)	Top-5 acc 47.266 (49.419)	lr 0.01521
Warmup Train [26][410/3239]	Time 0.556 (0.544)	Data 0.001 (0.034)	Loss 4.1814 (4.2276)	Top-1 acc 25.000 (26.647)	Top-5 acc 50.781 (49.416)	lr 0.01520
Warmup Train [26][420/3239]	Time 0.547 (0.543)	Data 0.001 (0.033)	Loss 4.1008 (4.2280)	Top-1 acc 25.781 (26.637)	Top-5 acc 54.297 (49.420)	lr 0.01520
Warmup Train [26][430/3239]	Time 0.575 (0.543)	Data 0.002 (0.033)	Loss 4.3199 (4.2283)	Top-1 acc 24.609 (26.641)	Top-5 acc 46.875 (49.430)	lr 0.01519
Warmup Train [26][440/3239]	Time 0.545 (0.542)	Data 0.001 (0.032)	Loss 4.2842 (4.2287)	Top-1 acc 23.828 (26.620)	Top-5 acc 50.000 (49.431)	lr 0.01519
Warmup Train [26][450/3239]	Time 0.568 (0.541)	Data 0.001 (0.031)	Loss 4.1970 (4.2290)	Top-1 acc 28.125 (26.602)	Top-5 acc 49.609 (49.404)	lr 0.01518
Warmup Train [26][460/3239]	Time 0.438 (0.540)	Data 0.001 (0.031)	Loss 4.0692 (4.2300)	Top-1 acc 28.516 (26.561)	Top-5 acc 52.734 (49.389)	lr 0.01518
Warmup Train [26][470/3239]	Time 0.404 (0.540)	Data 0.001 (0.030)	Loss 4.2105 (4.2290)	Top-1 acc 26.953 (26.587)	Top-5 acc 47.656 (49.411)	lr 0.01517
Warmup Train [26][480/3239]	Time 0.418 (0.539)	Data 0.001 (0.030)	Loss 4.1706 (4.2297)	Top-1 acc 30.469 (26.598)	Top-5 acc 53.906 (49.407)	lr 0.01516
Warmup Train [26][490/3239]	Time 0.430 (0.538)	Data 0.001 (0.029)	Loss 4.3558 (4.2295)	Top-1 acc 21.094 (26.598)	Top-5 acc 44.141 (49.428)	lr 0.01516
Warmup Train [26][500/3239]	Time 0.400 (0.538)	Data 0.001 (0.029)	Loss 4.0020 (4.2289)	Top-1 acc 30.469 (26.612)	Top-5 acc 53.125 (49.446)	lr 0.01515
Warmup Train [26][510/3239]	Time 0.642 (0.538)	Data 0.001 (0.029)	Loss 4.1585 (4.2296)	Top-1 acc 28.125 (26.611)	Top-5 acc 51.953 (49.435)	lr 0.01515
Warmup Train [26][520/3239]	Time 0.610 (0.537)	Data 0.001 (0.028)	Loss 4.1333 (4.2299)	Top-1 acc 27.344 (26.614)	Top-5 acc 51.562 (49.442)	lr 0.01514
Warmup Train [26][530/3239]	Time 0.480 (0.537)	Data 0.001 (0.028)	Loss 4.2871 (4.2291)	Top-1 acc 26.562 (26.624)	Top-5 acc 51.562 (49.477)	lr 0.01514
Warmup Train [26][540/3239]	Time 0.428 (0.536)	Data 0.001 (0.027)	Loss 4.1923 (4.2294)	Top-1 acc 25.781 (26.616)	Top-5 acc 52.344 (49.464)	lr 0.01513
Warmup Train [26][550/3239]	Time 0.505 (0.536)	Data 0.001 (0.027)	Loss 4.1094 (4.2292)	Top-1 acc 28.125 (26.647)	Top-5 acc 51.562 (49.483)	lr 0.01513
Warmup Train [26][560/3239]	Time 0.459 (0.536)	Data 0.001 (0.027)	Loss 4.2492 (4.2293)	Top-1 acc 28.516 (26.640)	Top-5 acc 50.000 (49.506)	lr 0.01512
Warmup Train [26][570/3239]	Time 0.533 (0.535)	Data 0.001 (0.026)	Loss 4.0723 (4.2292)	Top-1 acc 29.297 (26.643)	Top-5 acc 55.469 (49.512)	lr 0.01511
Warmup Train [26][580/3239]	Time 0.548 (0.535)	Data 0.001 (0.026)	Loss 4.0960 (4.2286)	Top-1 acc 33.203 (26.657)	Top-5 acc 51.562 (49.527)	lr 0.01511
Warmup Train [26][590/3239]	Time 0.536 (0.534)	Data 0.001 (0.025)	Loss 4.2103 (4.2287)	Top-1 acc 28.125 (26.650)	Top-5 acc 48.438 (49.499)	lr 0.01510
Warmup Train [26][600/3239]	Time 0.570 (0.534)	Data 0.001 (0.025)	Loss 4.1319 (4.2295)	Top-1 acc 28.906 (26.641)	Top-5 acc 51.172 (49.475)	lr 0.01510
Warmup Train [26][610/3239]	Time 0.341 (0.533)	Data 0.001 (0.025)	Loss 4.1820 (4.2298)	Top-1 acc 29.297 (26.650)	Top-5 acc 50.000 (49.476)	lr 0.01509
Warmup Train [26][620/3239]	Time 0.449 (0.532)	Data 0.001 (0.024)	Loss 4.1394 (4.2301)	Top-1 acc 28.125 (26.645)	Top-5 acc 53.125 (49.463)	lr 0.01509
Warmup Train [26][630/3239]	Time 0.408 (0.532)	Data 0.001 (0.024)	Loss 4.1676 (4.2294)	Top-1 acc 24.219 (26.650)	Top-5 acc 49.219 (49.481)	lr 0.01508
Warmup Train [26][640/3239]	Time 0.554 (0.531)	Data 0.002 (0.024)	Loss 4.2156 (4.2295)	Top-1 acc 30.078 (26.664)	Top-5 acc 51.172 (49.472)	lr 0.01508
Warmup Train [26][650/3239]	Time 0.556 (0.531)	Data 0.001 (0.024)	Loss 4.1955 (4.2294)	Top-1 acc 25.000 (26.670)	Top-5 acc 50.391 (49.470)	lr 0.01507
Warmup Train [26][660/3239]	Time 0.590 (0.531)	Data 0.004 (0.023)	Loss 4.1329 (4.2297)	Top-1 acc 29.297 (26.670)	Top-5 acc 49.609 (49.455)	lr 0.01506
Warmup Train [26][670/3239]	Time 0.451 (0.531)	Data 0.001 (0.023)	Loss 4.2400 (4.2285)	Top-1 acc 25.391 (26.703)	Top-5 acc 46.484 (49.470)	lr 0.01506
Warmup Train [26][680/3239]	Time 0.529 (0.531)	Data 0.001 (0.023)	Loss 4.4193 (4.2282)	Top-1 acc 21.484 (26.697)	Top-5 acc 46.484 (49.489)	lr 0.01505
Warmup Train [26][690/3239]	Time 0.525 (0.531)	Data 0.001 (0.023)	Loss 4.0750 (4.2285)	Top-1 acc 31.641 (26.692)	Top-5 acc 52.734 (49.489)	lr 0.01505
Warmup Train [26][700/3239]	Time 0.641 (0.531)	Data 0.001 (0.022)	Loss 4.1475 (4.2291)	Top-1 acc 25.391 (26.673)	Top-5 acc 53.906 (49.472)	lr 0.01504
Warmup Train [26][710/3239]	Time 0.566 (0.531)	Data 0.001 (0.022)	Loss 4.4550 (4.2289)	Top-1 acc 23.047 (26.669)	Top-5 acc 41.797 (49.481)	lr 0.01504
Warmup Train [26][720/3239]	Time 0.327 (0.530)	Data 0.002 (0.022)	Loss 4.1478 (4.2291)	Top-1 acc 29.297 (26.662)	Top-5 acc 51.172 (49.482)	lr 0.01503
Warmup Train [26][730/3239]	Time 0.446 (0.530)	Data 0.001 (0.022)	Loss 4.3447 (4.2287)	Top-1 acc 26.172 (26.675)	Top-5 acc 46.875 (49.493)	lr 0.01503
Warmup Train [26][740/3239]	Time 0.574 (0.530)	Data 0.001 (0.022)	Loss 4.3453 (4.2300)	Top-1 acc 21.094 (26.639)	Top-5 acc 46.484 (49.460)	lr 0.01502
Warmup Train [26][750/3239]	Time 0.468 (0.530)	Data 0.001 (0.021)	Loss 4.1505 (4.2309)	Top-1 acc 26.953 (26.629)	Top-5 acc 53.125 (49.439)	lr 0.01501
Warmup Train [26][760/3239]	Time 0.778 (0.530)	Data 0.003 (0.021)	Loss 4.3424 (4.2307)	Top-1 acc 21.875 (26.619)	Top-5 acc 45.703 (49.439)	lr 0.01501
Warmup Train [26][770/3239]	Time 0.605 (0.530)	Data 0.001 (0.021)	Loss 4.0103 (4.2310)	Top-1 acc 31.641 (26.607)	Top-5 acc 53.906 (49.439)	lr 0.01500
Warmup Train [26][780/3239]	Time 0.466 (0.530)	Data 0.001 (0.021)	Loss 4.1895 (4.2315)	Top-1 acc 28.125 (26.597)	Top-5 acc 50.391 (49.428)	lr 0.01500
Warmup Train [26][790/3239]	Time 0.496 (0.530)	Data 0.002 (0.021)	Loss 4.1509 (4.2315)	Top-1 acc 30.078 (26.606)	Top-5 acc 52.344 (49.426)	lr 0.01499
Warmup Train [26][800/3239]	Time 0.657 (0.530)	Data 0.002 (0.020)	Loss 4.3179 (4.2320)	Top-1 acc 25.781 (26.600)	Top-5 acc 47.266 (49.424)	lr 0.01499
Warmup Train [26][810/3239]	Time 0.560 (0.530)	Data 0.001 (0.020)	Loss 4.1303 (4.2321)	Top-1 acc 26.172 (26.605)	Top-5 acc 54.688 (49.418)	lr 0.01498
Warmup Train [26][820/3239]	Time 0.528 (0.529)	Data 0.002 (0.020)	Loss 4.2064 (4.2322)	Top-1 acc 25.000 (26.608)	Top-5 acc 48.828 (49.403)	lr 0.01498
Warmup Train [26][830/3239]	Time 0.324 (0.529)	Data 0.001 (0.020)	Loss 4.1944 (4.2325)	Top-1 acc 28.516 (26.604)	Top-5 acc 48.047 (49.407)	lr 0.01497
Warmup Train [26][840/3239]	Time 0.551 (0.529)	Data 0.001 (0.020)	Loss 4.3191 (4.2324)	Top-1 acc 23.438 (26.600)	Top-5 acc 47.266 (49.423)	lr 0.01496
Warmup Train [26][850/3239]	Time 0.420 (0.528)	Data 0.001 (0.020)	Loss 4.2102 (4.2329)	Top-1 acc 30.078 (26.592)	Top-5 acc 49.219 (49.408)	lr 0.01496
Warmup Train [26][860/3239]	Time 0.564 (0.528)	Data 0.001 (0.020)	Loss 4.2942 (4.2330)	Top-1 acc 22.656 (26.597)	Top-5 acc 48.438 (49.410)	lr 0.01495
Warmup Train [26][870/3239]	Time 0.203 (0.527)	Data 0.001 (0.019)	Loss 4.0554 (4.2321)	Top-1 acc 27.734 (26.614)	Top-5 acc 54.688 (49.429)	lr 0.01495
Warmup Train [26][880/3239]	Time 0.539 (0.527)	Data 0.001 (0.019)	Loss 4.3904 (4.2321)	Top-1 acc 25.781 (26.610)	Top-5 acc 44.922 (49.436)	lr 0.01494
Warmup Train [26][890/3239]	Time 0.613 (0.527)	Data 0.001 (0.019)	Loss 4.0110 (4.2320)	Top-1 acc 35.156 (26.621)	Top-5 acc 55.469 (49.445)	lr 0.01494
Warmup Train [26][900/3239]	Time 0.598 (0.527)	Data 0.001 (0.019)	Loss 4.1726 (4.2315)	Top-1 acc 25.781 (26.610)	Top-5 acc 48.047 (49.445)	lr 0.01493
Warmup Train [26][910/3239]	Time 0.544 (0.527)	Data 0.001 (0.019)	Loss 4.1642 (4.2316)	Top-1 acc 28.516 (26.608)	Top-5 acc 54.297 (49.442)	lr 0.01493
Warmup Train [26][920/3239]	Time 0.504 (0.526)	Data 0.001 (0.019)	Loss 4.3371 (4.2314)	Top-1 acc 21.875 (26.601)	Top-5 acc 46.875 (49.450)	lr 0.01492
Warmup Train [26][930/3239]	Time 0.482 (0.526)	Data 0.001 (0.019)	Loss 4.1822 (4.2312)	Top-1 acc 30.078 (26.624)	Top-5 acc 51.953 (49.450)	lr 0.01491
Warmup Train [26][940/3239]	Time 0.435 (0.526)	Data 0.001 (0.019)	Loss 4.3108 (4.2313)	Top-1 acc 25.391 (26.621)	Top-5 acc 51.172 (49.447)	lr 0.01491
Warmup Train [26][950/3239]	Time 0.491 (0.526)	Data 0.001 (0.018)	Loss 4.3349 (4.2321)	Top-1 acc 23.047 (26.613)	Top-5 acc 43.750 (49.429)	lr 0.01490
Warmup Train [26][960/3239]	Time 0.596 (0.526)	Data 0.002 (0.018)	Loss 4.3048 (4.2323)	Top-1 acc 22.266 (26.602)	Top-5 acc 49.219 (49.427)	lr 0.01490
Warmup Train [26][970/3239]	Time 0.626 (0.526)	Data 0.001 (0.018)	Loss 4.3342 (4.2326)	Top-1 acc 22.266 (26.592)	Top-5 acc 49.219 (49.427)	lr 0.01489
Warmup Train [26][980/3239]	Time 0.362 (0.525)	Data 0.001 (0.018)	Loss 4.4075 (4.2327)	Top-1 acc 27.344 (26.590)	Top-5 acc 48.047 (49.424)	lr 0.01489
Warmup Train [26][990/3239]	Time 0.692 (0.526)	Data 0.001 (0.018)	Loss 4.0347 (4.2331)	Top-1 acc 27.344 (26.578)	Top-5 acc 54.688 (49.412)	lr 0.01488
Warmup Train [26][1000/3239]	Time 0.587 (0.525)	Data 0.001 (0.018)	Loss 4.1304 (4.2333)	Top-1 acc 26.562 (26.566)	Top-5 acc 53.125 (49.403)	lr 0.01488
Warmup Train [26][1010/3239]	Time 0.617 (0.525)	Data 0.001 (0.018)	Loss 4.4042 (4.2335)	Top-1 acc 24.219 (26.562)	Top-5 acc 46.875 (49.401)	lr 0.01487
Warmup Train [26][1020/3239]	Time 0.470 (0.525)	Data 0.001 (0.018)	Loss 4.1387 (4.2341)	Top-1 acc 27.344 (26.549)	Top-5 acc 50.781 (49.384)	lr 0.01486
Warmup Train [26][1030/3239]	Time 0.531 (0.525)	Data 0.001 (0.017)	Loss 4.0118 (4.2342)	Top-1 acc 28.906 (26.551)	Top-5 acc 53.906 (49.374)	lr 0.01486
Warmup Train [26][1040/3239]	Time 0.601 (0.525)	Data 0.001 (0.017)	Loss 4.2965 (4.2345)	Top-1 acc 27.344 (26.555)	Top-5 acc 48.438 (49.365)	lr 0.01485
Warmup Train [26][1050/3239]	Time 0.429 (0.525)	Data 0.001 (0.017)	Loss 4.2640 (4.2346)	Top-1 acc 25.391 (26.549)	Top-5 acc 48.047 (49.370)	lr 0.01485
Warmup Train [26][1060/3239]	Time 0.613 (0.525)	Data 0.001 (0.017)	Loss 4.3997 (4.2344)	Top-1 acc 23.828 (26.550)	Top-5 acc 42.969 (49.383)	lr 0.01484
Warmup Train [26][1070/3239]	Time 0.540 (0.525)	Data 0.001 (0.017)	Loss 4.0307 (4.2340)	Top-1 acc 32.422 (26.559)	Top-5 acc 53.125 (49.391)	lr 0.01484
Warmup Train [26][1080/3239]	Time 0.562 (0.524)	Data 0.001 (0.017)	Loss 4.0262 (4.2331)	Top-1 acc 28.516 (26.577)	Top-5 acc 53.906 (49.413)	lr 0.01483
Warmup Train [26][1090/3239]	Time 0.543 (0.524)	Data 0.001 (0.017)	Loss 3.9509 (4.2328)	Top-1 acc 30.469 (26.587)	Top-5 acc 52.344 (49.416)	lr 0.01483
Warmup Train [26][1100/3239]	Time 0.412 (0.523)	Data 0.001 (0.017)	Loss 4.1053 (4.2324)	Top-1 acc 28.516 (26.585)	Top-5 acc 53.906 (49.433)	lr 0.01482
Warmup Train [26][1110/3239]	Time 0.598 (0.523)	Data 0.001 (0.017)	Loss 4.2541 (4.2325)	Top-1 acc 31.641 (26.597)	Top-5 acc 51.562 (49.430)	lr 0.01481
Warmup Train [26][1120/3239]	Time 0.493 (0.522)	Data 0.001 (0.016)	Loss 4.2101 (4.2325)	Top-1 acc 26.953 (26.610)	Top-5 acc 49.219 (49.432)	lr 0.01481
Warmup Train [26][1130/3239]	Time 0.491 (0.522)	Data 0.001 (0.016)	Loss 4.1845 (4.2323)	Top-1 acc 28.906 (26.615)	Top-5 acc 50.391 (49.440)	lr 0.01480
Warmup Train [26][1140/3239]	Time 0.517 (0.522)	Data 0.001 (0.016)	Loss 4.2084 (4.2325)	Top-1 acc 32.422 (26.619)	Top-5 acc 53.516 (49.440)	lr 0.01480
Warmup Train [26][1150/3239]	Time 0.529 (0.522)	Data 0.001 (0.016)	Loss 4.3578 (4.2324)	Top-1 acc 22.266 (26.622)	Top-5 acc 46.875 (49.448)	lr 0.01479
Warmup Train [26][1160/3239]	Time 0.328 (0.522)	Data 0.001 (0.016)	Loss 4.1656 (4.2325)	Top-1 acc 30.469 (26.622)	Top-5 acc 48.828 (49.430)	lr 0.01479
Warmup Train [26][1170/3239]	Time 0.377 (0.522)	Data 0.001 (0.016)	Loss 4.1275 (4.2322)	Top-1 acc 29.688 (26.632)	Top-5 acc 48.828 (49.437)	lr 0.01478
Warmup Train [26][1180/3239]	Time 0.492 (0.522)	Data 0.001 (0.016)	Loss 4.1864 (4.2325)	Top-1 acc 25.391 (26.612)	Top-5 acc 48.047 (49.429)	lr 0.01478
Warmup Train [26][1190/3239]	Time 0.525 (0.522)	Data 0.001 (0.016)	Loss 4.3046 (4.2329)	Top-1 acc 25.781 (26.617)	Top-5 acc 44.922 (49.422)	lr 0.01477
Warmup Train [26][1200/3239]	Time 0.379 (0.522)	Data 0.030 (0.016)	Loss 4.1148 (4.2327)	Top-1 acc 30.078 (26.622)	Top-5 acc 53.516 (49.429)	lr 0.01477
Warmup Train [26][1210/3239]	Time 0.688 (0.522)	Data 0.001 (0.016)	Loss 4.1685 (4.2324)	Top-1 acc 26.172 (26.620)	Top-5 acc 48.828 (49.430)	lr 0.01476
Warmup Train [26][1220/3239]	Time 0.532 (0.522)	Data 0.001 (0.016)	Loss 4.1800 (4.2320)	Top-1 acc 27.734 (26.627)	Top-5 acc 46.875 (49.432)	lr 0.01475
Warmup Train [26][1230/3239]	Time 0.432 (0.522)	Data 0.001 (0.016)	Loss 4.3832 (4.2319)	Top-1 acc 23.438 (26.627)	Top-5 acc 44.531 (49.437)	lr 0.01475
Warmup Train [26][1240/3239]	Time 0.597 (0.522)	Data 0.001 (0.016)	Loss 4.1652 (4.2321)	Top-1 acc 27.734 (26.619)	Top-5 acc 48.438 (49.429)	lr 0.01474
Warmup Train [26][1250/3239]	Time 0.511 (0.522)	Data 0.001 (0.016)	Loss 4.2958 (4.2321)	Top-1 acc 28.125 (26.622)	Top-5 acc 45.312 (49.431)	lr 0.01474
Warmup Train [26][1260/3239]	Time 0.532 (0.522)	Data 0.001 (0.015)	Loss 4.1663 (4.2324)	Top-1 acc 25.781 (26.621)	Top-5 acc 51.172 (49.423)	lr 0.01473
Warmup Train [26][1270/3239]	Time 0.346 (0.521)	Data 0.001 (0.015)	Loss 4.2768 (4.2323)	Top-1 acc 28.516 (26.626)	Top-5 acc 48.438 (49.421)	lr 0.01473
Warmup Train [26][1280/3239]	Time 0.625 (0.522)	Data 0.001 (0.015)	Loss 4.5346 (4.2328)	Top-1 acc 21.875 (26.627)	Top-5 acc 42.188 (49.412)	lr 0.01472
Warmup Train [26][1290/3239]	Time 0.525 (0.522)	Data 0.001 (0.015)	Loss 4.2238 (4.2325)	Top-1 acc 22.266 (26.621)	Top-5 acc 46.484 (49.413)	lr 0.01472
Warmup Train [26][1300/3239]	Time 0.675 (0.522)	Data 0.001 (0.015)	Loss 4.0241 (4.2325)	Top-1 acc 31.641 (26.618)	Top-5 acc 53.906 (49.416)	lr 0.01471
Warmup Train [26][1310/3239]	Time 0.544 (0.521)	Data 0.001 (0.015)	Loss 4.2837 (4.2323)	Top-1 acc 19.922 (26.609)	Top-5 acc 48.438 (49.415)	lr 0.01470
Warmup Train [26][1320/3239]	Time 0.590 (0.521)	Data 0.001 (0.015)	Loss 4.4561 (4.2327)	Top-1 acc 19.531 (26.598)	Top-5 acc 43.750 (49.405)	lr 0.01470
Warmup Train [26][1330/3239]	Time 0.618 (0.521)	Data 0.001 (0.015)	Loss 4.2580 (4.2326)	Top-1 acc 26.172 (26.598)	Top-5 acc 46.484 (49.406)	lr 0.01469
Warmup Train [26][1340/3239]	Time 0.487 (0.521)	Data 0.002 (0.015)	Loss 3.9828 (4.2327)	Top-1 acc 28.125 (26.597)	Top-5 acc 55.469 (49.404)	lr 0.01469
Warmup Train [26][1350/3239]	Time 0.316 (0.521)	Data 0.001 (0.015)	Loss 4.1267 (4.2331)	Top-1 acc 30.469 (26.588)	Top-5 acc 53.125 (49.396)	lr 0.01468
Warmup Train [26][1360/3239]	Time 0.636 (0.520)	Data 0.001 (0.015)	Loss 4.1323 (4.2330)	Top-1 acc 28.125 (26.592)	Top-5 acc 52.734 (49.396)	lr 0.01468
Warmup Train [26][1370/3239]	Time 0.627 (0.520)	Data 0.001 (0.015)	Loss 4.2364 (4.2335)	Top-1 acc 25.391 (26.586)	Top-5 acc 53.516 (49.383)	lr 0.01467
Warmup Train [26][1380/3239]	Time 0.518 (0.520)	Data 0.001 (0.015)	Loss 4.5569 (4.2341)	Top-1 acc 21.875 (26.583)	Top-5 acc 42.969 (49.364)	lr 0.01467
Warmup Train [26][1390/3239]	Time 0.382 (0.520)	Data 0.001 (0.014)	Loss 4.3326 (4.2340)	Top-1 acc 24.609 (26.591)	Top-5 acc 50.000 (49.365)	lr 0.01466
Warmup Train [26][1400/3239]	Time 0.406 (0.520)	Data 0.001 (0.014)	Loss 4.3450 (4.2339)	Top-1 acc 24.219 (26.593)	Top-5 acc 47.656 (49.373)	lr 0.01465
Warmup Train [26][1410/3239]	Time 0.380 (0.520)	Data 0.002 (0.014)	Loss 4.0473 (4.2339)	Top-1 acc 26.172 (26.589)	Top-5 acc 52.344 (49.367)	lr 0.01465
Warmup Train [26][1420/3239]	Time 0.594 (0.520)	Data 0.001 (0.014)	Loss 4.2074 (4.2336)	Top-1 acc 25.781 (26.598)	Top-5 acc 49.219 (49.367)	lr 0.01464
Warmup Train [26][1430/3239]	Time 0.629 (0.520)	Data 0.001 (0.014)	Loss 4.1882 (4.2333)	Top-1 acc 26.953 (26.590)	Top-5 acc 50.781 (49.375)	lr 0.01464
Warmup Train [26][1440/3239]	Time 0.481 (0.520)	Data 0.001 (0.014)	Loss 4.2723 (4.2341)	Top-1 acc 26.172 (26.573)	Top-5 acc 42.578 (49.347)	lr 0.01463
Warmup Train [26][1450/3239]	Time 0.626 (0.520)	Data 0.001 (0.014)	Loss 4.5524 (4.2343)	Top-1 acc 21.484 (26.573)	Top-5 acc 43.359 (49.340)	lr 0.01463
Warmup Train [26][1460/3239]	Time 0.338 (0.520)	Data 0.001 (0.014)	Loss 4.4488 (4.2348)	Top-1 acc 23.047 (26.564)	Top-5 acc 46.094 (49.329)	lr 0.01462
Warmup Train [26][1470/3239]	Time 0.652 (0.520)	Data 0.001 (0.014)	Loss 4.2350 (4.2345)	Top-1 acc 26.562 (26.574)	Top-5 acc 49.609 (49.338)	lr 0.01462
Warmup Train [26][1480/3239]	Time 0.535 (0.519)	Data 0.002 (0.014)	Loss 4.1899 (4.2342)	Top-1 acc 26.562 (26.580)	Top-5 acc 51.562 (49.339)	lr 0.01461
Warmup Train [26][1490/3239]	Time 0.596 (0.520)	Data 0.001 (0.014)	Loss 4.3751 (4.2337)	Top-1 acc 22.656 (26.597)	Top-5 acc 44.922 (49.352)	lr 0.01461
Warmup Train [26][1500/3239]	Time 0.526 (0.520)	Data 0.001 (0.014)	Loss 4.0845 (4.2335)	Top-1 acc 28.906 (26.598)	Top-5 acc 49.609 (49.351)	lr 0.01460
Warmup Train [26][1510/3239]	Time 0.503 (0.520)	Data 0.001 (0.014)	Loss 4.1900 (4.2339)	Top-1 acc 26.172 (26.590)	Top-5 acc 51.562 (49.341)	lr 0.01459
Warmup Train [26][1520/3239]	Time 0.599 (0.520)	Data 0.001 (0.014)	Loss 4.2763 (4.2342)	Top-1 acc 27.344 (26.587)	Top-5 acc 48.828 (49.334)	lr 0.01459
Warmup Train [26][1530/3239]	Time 0.511 (0.520)	Data 0.001 (0.014)	Loss 4.0858 (4.2339)	Top-1 acc 30.078 (26.595)	Top-5 acc 52.734 (49.340)	lr 0.01458
Warmup Train [26][1540/3239]	Time 0.380 (0.520)	Data 0.001 (0.014)	Loss 4.2472 (4.2338)	Top-1 acc 24.609 (26.591)	Top-5 acc 48.438 (49.338)	lr 0.01458
Warmup Train [26][1550/3239]	Time 0.571 (0.520)	Data 0.001 (0.014)	Loss 4.2181 (4.2339)	Top-1 acc 28.125 (26.592)	Top-5 acc 49.219 (49.338)	lr 0.01457
Warmup Train [26][1560/3239]	Time 0.165 (0.519)	Data 0.001 (0.014)	Loss 4.2528 (4.2336)	Top-1 acc 22.656 (26.596)	Top-5 acc 48.438 (49.350)	lr 0.01457
Warmup Train [26][1570/3239]	Time 0.544 (0.519)	Data 0.001 (0.014)	Loss 4.3870 (4.2336)	Top-1 acc 23.047 (26.593)	Top-5 acc 42.969 (49.344)	lr 0.01456
Warmup Train [26][1580/3239]	Time 0.511 (0.519)	Data 0.001 (0.014)	Loss 4.1772 (4.2337)	Top-1 acc 30.859 (26.594)	Top-5 acc 52.344 (49.346)	lr 0.01456
Warmup Train [26][1590/3239]	Time 0.513 (0.519)	Data 0.001 (0.014)	Loss 4.1076 (4.2334)	Top-1 acc 26.953 (26.596)	Top-5 acc 53.906 (49.356)	lr 0.01455
Warmup Train [26][1600/3239]	Time 0.348 (0.519)	Data 0.001 (0.014)	Loss 4.1894 (4.2334)	Top-1 acc 30.859 (26.599)	Top-5 acc 49.609 (49.352)	lr 0.01454
Warmup Train [26][1610/3239]	Time 0.542 (0.519)	Data 0.001 (0.014)	Loss 4.1984 (4.2332)	Top-1 acc 30.469 (26.607)	Top-5 acc 51.562 (49.362)	lr 0.01454
Warmup Train [26][1620/3239]	Time 0.567 (0.519)	Data 0.001 (0.014)	Loss 4.3222 (4.2331)	Top-1 acc 22.266 (26.600)	Top-5 acc 44.922 (49.357)	lr 0.01453
Warmup Train [26][1630/3239]	Time 0.553 (0.519)	Data 0.001 (0.014)	Loss 4.1306 (4.2331)	Top-1 acc 27.344 (26.600)	Top-5 acc 51.562 (49.356)	lr 0.01453
Warmup Train [26][1640/3239]	Time 0.561 (0.519)	Data 0.001 (0.014)	Loss 4.1485 (4.2333)	Top-1 acc 29.297 (26.595)	Top-5 acc 48.438 (49.351)	lr 0.01452
Warmup Train [26][1650/3239]	Time 0.437 (0.519)	Data 0.001 (0.013)	Loss 4.2596 (4.2335)	Top-1 acc 26.172 (26.591)	Top-5 acc 50.391 (49.347)	lr 0.01452
Warmup Train [26][1660/3239]	Time 0.545 (0.519)	Data 0.001 (0.013)	Loss 4.3062 (4.2334)	Top-1 acc 25.391 (26.590)	Top-5 acc 43.359 (49.347)	lr 0.01451
Warmup Train [26][1670/3239]	Time 0.693 (0.519)	Data 0.001 (0.013)	Loss 4.0054 (4.2334)	Top-1 acc 32.031 (26.591)	Top-5 acc 55.078 (49.347)	lr 0.01451
Warmup Train [26][1680/3239]	Time 0.566 (0.519)	Data 0.001 (0.013)	Loss 4.0149 (4.2331)	Top-1 acc 25.000 (26.596)	Top-5 acc 57.422 (49.356)	lr 0.01450
Warmup Train [26][1690/3239]	Time 0.381 (0.519)	Data 0.001 (0.013)	Loss 4.2989 (4.2333)	Top-1 acc 26.172 (26.591)	Top-5 acc 48.828 (49.351)	lr 0.01449
Warmup Train [26][1700/3239]	Time 0.408 (0.519)	Data 0.001 (0.013)	Loss 4.1811 (4.2333)	Top-1 acc 27.344 (26.594)	Top-5 acc 53.516 (49.354)	lr 0.01449
Warmup Train [26][1710/3239]	Time 0.459 (0.519)	Data 0.001 (0.013)	Loss 4.2010 (4.2333)	Top-1 acc 26.172 (26.596)	Top-5 acc 48.047 (49.353)	lr 0.01448
Warmup Train [26][1720/3239]	Time 0.488 (0.519)	Data 0.001 (0.013)	Loss 4.0863 (4.2332)	Top-1 acc 30.078 (26.596)	Top-5 acc 54.688 (49.362)	lr 0.01448
Warmup Train [26][1730/3239]	Time 0.533 (0.519)	Data 0.001 (0.013)	Loss 4.1327 (4.2332)	Top-1 acc 30.469 (26.597)	Top-5 acc 51.562 (49.363)	lr 0.01447
Warmup Train [26][1740/3239]	Time 0.563 (0.519)	Data 0.001 (0.013)	Loss 4.0518 (4.2329)	Top-1 acc 27.344 (26.603)	Top-5 acc 54.688 (49.369)	lr 0.01447
Warmup Train [26][1750/3239]	Time 0.728 (0.519)	Data 0.001 (0.013)	Loss 4.4468 (4.2328)	Top-1 acc 22.266 (26.607)	Top-5 acc 41.797 (49.372)	lr 0.01446
Warmup Train [26][1760/3239]	Time 0.560 (0.519)	Data 0.001 (0.013)	Loss 4.3847 (4.2330)	Top-1 acc 24.219 (26.608)	Top-5 acc 44.922 (49.369)	lr 0.01446
Warmup Train [26][1770/3239]	Time 0.452 (0.519)	Data 0.001 (0.013)	Loss 4.0487 (4.2327)	Top-1 acc 31.250 (26.604)	Top-5 acc 52.344 (49.371)	lr 0.01445
Warmup Train [26][1780/3239]	Time 0.366 (0.519)	Data 0.001 (0.013)	Loss 4.1271 (4.2328)	Top-1 acc 30.078 (26.606)	Top-5 acc 55.078 (49.379)	lr 0.01445
Warmup Train [26][1790/3239]	Time 0.360 (0.519)	Data 0.001 (0.013)	Loss 4.2362 (4.2329)	Top-1 acc 28.516 (26.607)	Top-5 acc 48.438 (49.372)	lr 0.01444
Warmup Train [26][1800/3239]	Time 0.230 (0.519)	Data 0.001 (0.013)	Loss 4.1778 (4.2329)	Top-1 acc 30.469 (26.603)	Top-5 acc 50.781 (49.374)	lr 0.01443
Warmup Train [26][1810/3239]	Time 0.469 (0.519)	Data 0.001 (0.013)	Loss 4.3727 (4.2332)	Top-1 acc 24.219 (26.604)	Top-5 acc 44.531 (49.367)	lr 0.01443
Warmup Train [26][1820/3239]	Time 0.571 (0.519)	Data 0.001 (0.013)	Loss 4.4507 (4.2335)	Top-1 acc 21.484 (26.599)	Top-5 acc 45.312 (49.366)	lr 0.01442
Warmup Train [26][1830/3239]	Time 0.446 (0.518)	Data 0.001 (0.013)	Loss 4.2658 (4.2331)	Top-1 acc 25.000 (26.609)	Top-5 acc 48.438 (49.373)	lr 0.01442
Warmup Train [26][1840/3239]	Time 0.294 (0.518)	Data 0.001 (0.013)	Loss 4.6359 (4.2332)	Top-1 acc 20.703 (26.604)	Top-5 acc 41.797 (49.371)	lr 0.01441
Warmup Train [26][1850/3239]	Time 0.611 (0.518)	Data 0.001 (0.013)	Loss 4.1931 (4.2332)	Top-1 acc 25.391 (26.598)	Top-5 acc 50.391 (49.368)	lr 0.01441
Warmup Train [26][1860/3239]	Time 0.494 (0.518)	Data 0.001 (0.013)	Loss 4.1944 (4.2331)	Top-1 acc 28.125 (26.595)	Top-5 acc 48.438 (49.369)	lr 0.01440
Warmup Train [26][1870/3239]	Time 0.408 (0.518)	Data 0.001 (0.013)	Loss 4.0285 (4.2329)	Top-1 acc 26.953 (26.597)	Top-5 acc 54.297 (49.375)	lr 0.01440
Warmup Train [26][1880/3239]	Time 0.632 (0.518)	Data 0.001 (0.013)	Loss 4.2338 (4.2329)	Top-1 acc 26.562 (26.600)	Top-5 acc 49.219 (49.371)	lr 0.01439
Warmup Train [26][1890/3239]	Time 0.472 (0.518)	Data 0.001 (0.013)	Loss 4.3112 (4.2329)	Top-1 acc 27.734 (26.597)	Top-5 acc 46.875 (49.366)	lr 0.01439
Warmup Train [26][1900/3239]	Time 0.540 (0.518)	Data 0.001 (0.013)	Loss 4.2644 (4.2327)	Top-1 acc 25.000 (26.607)	Top-5 acc 45.312 (49.369)	lr 0.01438
Warmup Train [26][1910/3239]	Time 0.392 (0.517)	Data 0.001 (0.013)	Loss 4.2535 (4.2327)	Top-1 acc 26.172 (26.606)	Top-5 acc 50.781 (49.367)	lr 0.01437
Warmup Train [26][1920/3239]	Time 0.468 (0.517)	Data 0.001 (0.013)	Loss 4.1603 (4.2331)	Top-1 acc 25.000 (26.596)	Top-5 acc 52.344 (49.358)	lr 0.01437
Warmup Train [26][1930/3239]	Time 0.422 (0.517)	Data 0.001 (0.013)	Loss 4.0916 (4.2330)	Top-1 acc 30.859 (26.600)	Top-5 acc 51.172 (49.363)	lr 0.01436
Warmup Train [26][1940/3239]	Time 0.544 (0.517)	Data 0.001 (0.013)	Loss 4.2845 (4.2330)	Top-1 acc 26.172 (26.598)	Top-5 acc 49.219 (49.360)	lr 0.01436
Warmup Train [26][1950/3239]	Time 0.464 (0.517)	Data 0.001 (0.013)	Loss 4.3242 (4.2329)	Top-1 acc 22.656 (26.607)	Top-5 acc 45.703 (49.362)	lr 0.01435
Warmup Train [26][1960/3239]	Time 0.613 (0.517)	Data 0.001 (0.013)	Loss 4.1452 (4.2328)	Top-1 acc 29.297 (26.610)	Top-5 acc 51.953 (49.361)	lr 0.01435
Warmup Train [26][1970/3239]	Time 0.651 (0.517)	Data 0.001 (0.012)	Loss 4.2348 (4.2328)	Top-1 acc 28.125 (26.612)	Top-5 acc 48.438 (49.361)	lr 0.01434
Warmup Train [26][1980/3239]	Time 0.520 (0.517)	Data 0.001 (0.012)	Loss 4.3595 (4.2327)	Top-1 acc 21.484 (26.611)	Top-5 acc 48.828 (49.365)	lr 0.01434
Warmup Train [26][1990/3239]	Time 0.355 (0.518)	Data 0.001 (0.012)	Loss 4.0540 (4.2326)	Top-1 acc 29.688 (26.608)	Top-5 acc 55.469 (49.375)	lr 0.01433
Warmup Train [26][2000/3239]	Time 0.445 (0.518)	Data 0.001 (0.012)	Loss 4.0994 (4.2326)	Top-1 acc 30.078 (26.610)	Top-5 acc 52.344 (49.373)	lr 0.01432
Warmup Train [26][2010/3239]	Time 0.502 (0.518)	Data 0.001 (0.012)	Loss 4.1485 (4.2327)	Top-1 acc 29.297 (26.609)	Top-5 acc 50.000 (49.369)	lr 0.01432
Warmup Train [26][2020/3239]	Time 0.543 (0.517)	Data 0.001 (0.012)	Loss 4.1819 (4.2326)	Top-1 acc 28.125 (26.609)	Top-5 acc 51.953 (49.368)	lr 0.01431
Warmup Train [26][2030/3239]	Time 0.533 (0.518)	Data 0.001 (0.012)	Loss 4.1548 (4.2326)	Top-1 acc 26.562 (26.611)	Top-5 acc 52.344 (49.370)	lr 0.01431
Warmup Train [26][2040/3239]	Time 0.450 (0.517)	Data 0.001 (0.012)	Loss 4.3690 (4.2327)	Top-1 acc 24.609 (26.616)	Top-5 acc 43.359 (49.370)	lr 0.01430
Warmup Train [26][2050/3239]	Time 0.456 (0.517)	Data 0.001 (0.012)	Loss 4.1511 (4.2326)	Top-1 acc 30.078 (26.617)	Top-5 acc 50.000 (49.369)	lr 0.01430
Warmup Train [26][2060/3239]	Time 0.376 (0.517)	Data 0.001 (0.012)	Loss 4.1609 (4.2325)	Top-1 acc 28.906 (26.625)	Top-5 acc 50.781 (49.371)	lr 0.01429
Warmup Train [26][2070/3239]	Time 0.530 (0.517)	Data 0.001 (0.012)	Loss 4.3681 (4.2325)	Top-1 acc 24.219 (26.625)	Top-5 acc 49.219 (49.375)	lr 0.01429
Warmup Train [26][2080/3239]	Time 0.355 (0.517)	Data 0.001 (0.012)	Loss 4.2733 (4.2325)	Top-1 acc 26.172 (26.627)	Top-5 acc 47.656 (49.375)	lr 0.01428
Warmup Train [26][2090/3239]	Time 0.436 (0.517)	Data 0.001 (0.012)	Loss 4.2930 (4.2329)	Top-1 acc 25.391 (26.615)	Top-5 acc 48.438 (49.367)	lr 0.01428
Warmup Train [26][2100/3239]	Time 0.362 (0.517)	Data 0.001 (0.012)	Loss 4.0335 (4.2330)	Top-1 acc 25.781 (26.610)	Top-5 acc 53.516 (49.365)	lr 0.01427
Warmup Train [26][2110/3239]	Time 0.555 (0.517)	Data 0.001 (0.012)	Loss 4.2535 (4.2326)	Top-1 acc 26.172 (26.619)	Top-5 acc 46.094 (49.373)	lr 0.01426
Warmup Train [26][2120/3239]	Time 0.412 (0.517)	Data 0.001 (0.012)	Loss 4.4759 (4.2328)	Top-1 acc 23.438 (26.611)	Top-5 acc 45.312 (49.370)	lr 0.01426
Warmup Train [26][2130/3239]	Time 0.500 (0.517)	Data 0.001 (0.012)	Loss 4.3640 (4.2329)	Top-1 acc 24.609 (26.606)	Top-5 acc 46.484 (49.364)	lr 0.01425
Warmup Train [26][2140/3239]	Time 0.393 (0.517)	Data 0.001 (0.012)	Loss 4.0886 (4.2327)	Top-1 acc 29.688 (26.609)	Top-5 acc 54.297 (49.374)	lr 0.01425
Warmup Train [26][2150/3239]	Time 0.337 (0.517)	Data 0.001 (0.012)	Loss 4.3616 (4.2326)	Top-1 acc 23.828 (26.612)	Top-5 acc 44.531 (49.381)	lr 0.01424
Warmup Train [26][2160/3239]	Time 0.514 (0.517)	Data 0.001 (0.012)	Loss 4.2098 (4.2326)	Top-1 acc 26.953 (26.607)	Top-5 acc 49.609 (49.380)	lr 0.01424
Warmup Train [26][2170/3239]	Time 0.502 (0.517)	Data 0.001 (0.012)	Loss 4.0546 (4.2324)	Top-1 acc 23.438 (26.607)	Top-5 acc 54.297 (49.385)	lr 0.01423
Warmup Train [26][2180/3239]	Time 0.580 (0.517)	Data 0.001 (0.012)	Loss 4.2441 (4.2325)	Top-1 acc 25.781 (26.601)	Top-5 acc 50.000 (49.382)	lr 0.01423
Warmup Train [26][2190/3239]	Time 0.653 (0.517)	Data 0.001 (0.012)	Loss 4.1211 (4.2323)	Top-1 acc 28.516 (26.606)	Top-5 acc 49.219 (49.392)	lr 0.01422
Warmup Train [26][2200/3239]	Time 0.503 (0.517)	Data 0.001 (0.012)	Loss 4.4961 (4.2324)	Top-1 acc 21.875 (26.604)	Top-5 acc 41.797 (49.388)	lr 0.01422
Warmup Train [26][2210/3239]	Time 0.560 (0.517)	Data 0.001 (0.012)	Loss 4.1760 (4.2324)	Top-1 acc 27.344 (26.607)	Top-5 acc 50.391 (49.391)	lr 0.01421
Warmup Train [26][2220/3239]	Time 0.545 (0.517)	Data 0.001 (0.012)	Loss 4.1244 (4.2323)	Top-1 acc 28.125 (26.605)	Top-5 acc 53.125 (49.388)	lr 0.01420
Warmup Train [26][2230/3239]	Time 0.443 (0.517)	Data 0.001 (0.012)	Loss 4.4373 (4.2322)	Top-1 acc 24.219 (26.611)	Top-5 acc 46.875 (49.389)	lr 0.01420
Warmup Train [26][2240/3239]	Time 0.401 (0.517)	Data 0.001 (0.012)	Loss 4.2875 (4.2321)	Top-1 acc 27.344 (26.613)	Top-5 acc 49.609 (49.388)	lr 0.01419
Warmup Train [26][2250/3239]	Time 0.502 (0.517)	Data 0.001 (0.012)	Loss 4.2903 (4.2320)	Top-1 acc 25.391 (26.612)	Top-5 acc 48.828 (49.392)	lr 0.01419
Warmup Train [26][2260/3239]	Time 0.586 (0.517)	Data 0.001 (0.012)	Loss 3.9562 (4.2318)	Top-1 acc 31.250 (26.616)	Top-5 acc 55.859 (49.394)	lr 0.01418
Warmup Train [26][2270/3239]	Time 0.505 (0.517)	Data 0.001 (0.012)	Loss 4.2843 (4.2319)	Top-1 acc 25.000 (26.614)	Top-5 acc 47.656 (49.396)	lr 0.01418
Warmup Train [26][2280/3239]	Time 0.653 (0.517)	Data 0.001 (0.012)	Loss 4.3405 (4.2321)	Top-1 acc 23.438 (26.610)	Top-5 acc 44.922 (49.390)	lr 0.01417
Warmup Train [26][2290/3239]	Time 0.667 (0.516)	Data 0.001 (0.012)	Loss 4.0476 (4.2321)	Top-1 acc 33.594 (26.611)	Top-5 acc 54.297 (49.392)	lr 0.01417
Warmup Train [26][2300/3239]	Time 0.504 (0.516)	Data 0.001 (0.012)	Loss 4.2375 (4.2322)	Top-1 acc 28.906 (26.610)	Top-5 acc 48.047 (49.388)	lr 0.01416
Warmup Train [26][2310/3239]	Time 0.559 (0.516)	Data 0.001 (0.012)	Loss 4.2528 (4.2322)	Top-1 acc 25.781 (26.612)	Top-5 acc 51.172 (49.391)	lr 0.01416
Warmup Train [26][2320/3239]	Time 0.475 (0.516)	Data 0.001 (0.012)	Loss 4.1836 (4.2322)	Top-1 acc 28.125 (26.613)	Top-5 acc 51.953 (49.392)	lr 0.01415
Warmup Train [26][2330/3239]	Time 0.528 (0.516)	Data 0.001 (0.012)	Loss 4.1730 (4.2320)	Top-1 acc 29.688 (26.615)	Top-5 acc 51.953 (49.394)	lr 0.01414
Warmup Train [26][2340/3239]	Time 0.499 (0.516)	Data 0.001 (0.012)	Loss 4.1622 (4.2320)	Top-1 acc 26.172 (26.618)	Top-5 acc 51.953 (49.397)	lr 0.01414
Warmup Train [26][2350/3239]	Time 0.444 (0.516)	Data 0.001 (0.012)	Loss 4.2501 (4.2320)	Top-1 acc 26.562 (26.617)	Top-5 acc 51.172 (49.399)	lr 0.01413
Warmup Train [26][2360/3239]	Time 0.583 (0.516)	Data 0.001 (0.012)	Loss 4.1167 (4.2316)	Top-1 acc 29.297 (26.630)	Top-5 acc 48.828 (49.404)	lr 0.01413
Warmup Train [26][2370/3239]	Time 0.599 (0.516)	Data 0.001 (0.012)	Loss 4.1437 (4.2314)	Top-1 acc 30.859 (26.630)	Top-5 acc 51.562 (49.411)	lr 0.01412
Warmup Train [26][2380/3239]	Time 0.431 (0.516)	Data 0.001 (0.012)	Loss 4.1971 (4.2314)	Top-1 acc 28.906 (26.630)	Top-5 acc 51.562 (49.417)	lr 0.01412
Warmup Train [26][2390/3239]	Time 0.683 (0.516)	Data 0.001 (0.012)	Loss 4.0929 (4.2314)	Top-1 acc 27.344 (26.629)	Top-5 acc 51.953 (49.416)	lr 0.01411
Warmup Train [26][2400/3239]	Time 0.549 (0.516)	Data 0.001 (0.012)	Loss 4.1753 (4.2314)	Top-1 acc 27.344 (26.628)	Top-5 acc 50.781 (49.416)	lr 0.01411
Warmup Train [26][2410/3239]	Time 0.457 (0.516)	Data 0.001 (0.012)	Loss 4.3865 (4.2314)	Top-1 acc 28.125 (26.630)	Top-5 acc 47.266 (49.419)	lr 0.01410
Warmup Train [26][2420/3239]	Time 0.557 (0.516)	Data 0.001 (0.012)	Loss 4.5553 (4.2313)	Top-1 acc 17.578 (26.629)	Top-5 acc 40.625 (49.418)	lr 0.01410
Warmup Train [26][2430/3239]	Time 0.530 (0.516)	Data 0.001 (0.012)	Loss 4.3645 (4.2314)	Top-1 acc 27.344 (26.627)	Top-5 acc 45.312 (49.414)	lr 0.01409
Warmup Train [26][2440/3239]	Time 0.331 (0.516)	Data 0.001 (0.012)	Loss 4.1473 (4.2313)	Top-1 acc 26.953 (26.626)	Top-5 acc 51.172 (49.415)	lr 0.01408
Warmup Train [26][2450/3239]	Time 0.515 (0.516)	Data 0.001 (0.012)	Loss 4.2755 (4.2311)	Top-1 acc 25.391 (26.627)	Top-5 acc 50.000 (49.416)	lr 0.01408
Warmup Train [26][2460/3239]	Time 0.493 (0.516)	Data 0.001 (0.012)	Loss 4.0431 (4.2308)	Top-1 acc 30.078 (26.635)	Top-5 acc 53.516 (49.425)	lr 0.01407
Warmup Train [26][2470/3239]	Time 0.376 (0.516)	Data 0.001 (0.011)	Loss 4.3370 (4.2310)	Top-1 acc 25.000 (26.634)	Top-5 acc 45.312 (49.419)	lr 0.01407
Warmup Train [26][2480/3239]	Time 0.364 (0.516)	Data 0.001 (0.011)	Loss 4.5240 (4.2309)	Top-1 acc 22.266 (26.634)	Top-5 acc 44.922 (49.418)	lr 0.01406
Warmup Train [26][2490/3239]	Time 0.634 (0.516)	Data 0.001 (0.011)	Loss 4.1974 (4.2306)	Top-1 acc 26.562 (26.633)	Top-5 acc 50.781 (49.423)	lr 0.01406
Warmup Train [26][2500/3239]	Time 0.485 (0.516)	Data 0.001 (0.011)	Loss 4.2029 (4.2306)	Top-1 acc 24.609 (26.631)	Top-5 acc 49.609 (49.422)	lr 0.01405
Warmup Train [26][2510/3239]	Time 0.547 (0.516)	Data 0.001 (0.011)	Loss 4.3059 (4.2302)	Top-1 acc 24.219 (26.637)	Top-5 acc 47.656 (49.428)	lr 0.01405
Warmup Train [26][2520/3239]	Time 0.461 (0.516)	Data 0.001 (0.011)	Loss 4.2552 (4.2300)	Top-1 acc 27.344 (26.640)	Top-5 acc 48.047 (49.429)	lr 0.01404
Warmup Train [26][2530/3239]	Time 0.527 (0.516)	Data 0.001 (0.011)	Loss 4.3735 (4.2302)	Top-1 acc 28.906 (26.640)	Top-5 acc 48.828 (49.428)	lr 0.01404
Warmup Train [26][2540/3239]	Time 0.409 (0.516)	Data 0.001 (0.011)	Loss 4.3010 (4.2308)	Top-1 acc 26.562 (26.627)	Top-5 acc 46.094 (49.413)	lr 0.01403
Warmup Train [26][2550/3239]	Time 0.476 (0.515)	Data 0.001 (0.011)	Loss 4.2992 (4.2307)	Top-1 acc 20.312 (26.628)	Top-5 acc 48.047 (49.421)	lr 0.01402
Warmup Train [26][2560/3239]	Time 0.556 (0.515)	Data 0.001 (0.011)	Loss 4.2835 (4.2308)	Top-1 acc 25.781 (26.627)	Top-5 acc 47.656 (49.420)	lr 0.01402
Warmup Train [26][2570/3239]	Time 0.470 (0.515)	Data 0.001 (0.011)	Loss 4.0907 (4.2307)	Top-1 acc 28.906 (26.629)	Top-5 acc 53.125 (49.422)	lr 0.01401
Warmup Train [26][2580/3239]	Time 0.555 (0.515)	Data 0.001 (0.011)	Loss 4.3093 (4.2308)	Top-1 acc 25.391 (26.625)	Top-5 acc 49.609 (49.421)	lr 0.01401
Warmup Train [26][2590/3239]	Time 0.662 (0.515)	Data 0.001 (0.011)	Loss 4.0990 (4.2308)	Top-1 acc 26.172 (26.626)	Top-5 acc 48.828 (49.422)	lr 0.01400
Warmup Train [26][2600/3239]	Time 0.491 (0.515)	Data 0.001 (0.011)	Loss 4.1593 (4.2307)	Top-1 acc 28.516 (26.631)	Top-5 acc 49.609 (49.424)	lr 0.01400
Warmup Train [26][2610/3239]	Time 0.491 (0.515)	Data 0.001 (0.011)	Loss 4.2365 (4.2306)	Top-1 acc 23.438 (26.632)	Top-5 acc 46.484 (49.424)	lr 0.01399
Warmup Train [26][2620/3239]	Time 0.634 (0.515)	Data 0.003 (0.011)	Loss 4.1858 (4.2304)	Top-1 acc 26.172 (26.630)	Top-5 acc 49.609 (49.426)	lr 0.01399
Warmup Train [26][2630/3239]	Time 0.407 (0.515)	Data 0.001 (0.011)	Loss 4.3250 (4.2305)	Top-1 acc 24.609 (26.629)	Top-5 acc 50.781 (49.428)	lr 0.01398
Warmup Train [26][2640/3239]	Time 0.407 (0.515)	Data 0.001 (0.011)	Loss 4.2208 (4.2305)	Top-1 acc 27.734 (26.631)	Top-5 acc 49.609 (49.424)	lr 0.01398
Warmup Train [26][2650/3239]	Time 0.628 (0.515)	Data 0.001 (0.011)	Loss 4.1853 (4.2304)	Top-1 acc 27.344 (26.631)	Top-5 acc 48.047 (49.425)	lr 0.01397
Warmup Train [26][2660/3239]	Time 0.481 (0.515)	Data 0.001 (0.011)	Loss 4.3428 (4.2302)	Top-1 acc 26.953 (26.633)	Top-5 acc 45.312 (49.425)	lr 0.01396
Warmup Train [26][2670/3239]	Time 0.516 (0.515)	Data 0.001 (0.011)	Loss 4.2466 (4.2300)	Top-1 acc 27.344 (26.639)	Top-5 acc 49.219 (49.434)	lr 0.01396
Warmup Train [26][2680/3239]	Time 0.780 (0.515)	Data 0.001 (0.011)	Loss 4.2312 (4.2298)	Top-1 acc 28.906 (26.642)	Top-5 acc 50.000 (49.441)	lr 0.01395
Warmup Train [26][2690/3239]	Time 0.356 (0.515)	Data 0.001 (0.011)	Loss 4.2761 (4.2299)	Top-1 acc 25.781 (26.638)	Top-5 acc 48.828 (49.440)	lr 0.01395
Warmup Train [26][2700/3239]	Time 0.380 (0.515)	Data 0.001 (0.011)	Loss 4.3447 (4.2302)	Top-1 acc 23.828 (26.637)	Top-5 acc 47.266 (49.437)	lr 0.01394
Warmup Train [26][2710/3239]	Time 0.560 (0.515)	Data 0.001 (0.011)	Loss 4.2850 (4.2302)	Top-1 acc 26.562 (26.633)	Top-5 acc 47.266 (49.437)	lr 0.01394
Warmup Train [26][2720/3239]	Time 0.356 (0.515)	Data 0.001 (0.011)	Loss 4.1592 (4.2302)	Top-1 acc 27.344 (26.631)	Top-5 acc 50.781 (49.442)	lr 0.01393
Warmup Train [26][2730/3239]	Time 0.540 (0.515)	Data 0.001 (0.011)	Loss 4.3381 (4.2300)	Top-1 acc 23.438 (26.634)	Top-5 acc 46.875 (49.444)	lr 0.01393
Warmup Train [26][2740/3239]	Time 0.556 (0.515)	Data 0.001 (0.011)	Loss 4.4038 (4.2299)	Top-1 acc 19.922 (26.633)	Top-5 acc 44.922 (49.446)	lr 0.01392
Warmup Train [26][2750/3239]	Time 0.400 (0.515)	Data 0.001 (0.011)	Loss 4.0635 (4.2296)	Top-1 acc 29.297 (26.641)	Top-5 acc 51.953 (49.449)	lr 0.01392
Warmup Train [26][2760/3239]	Time 0.474 (0.515)	Data 0.001 (0.011)	Loss 4.0298 (4.2292)	Top-1 acc 30.469 (26.648)	Top-5 acc 55.078 (49.455)	lr 0.01391
Warmup Train [26][2770/3239]	Time 0.517 (0.515)	Data 0.001 (0.011)	Loss 4.1630 (4.2292)	Top-1 acc 28.125 (26.652)	Top-5 acc 50.391 (49.460)	lr 0.01390
Warmup Train [26][2780/3239]	Time 0.540 (0.515)	Data 0.001 (0.011)	Loss 4.3470 (4.2295)	Top-1 acc 23.438 (26.643)	Top-5 acc 47.656 (49.451)	lr 0.01390
Warmup Train [26][2790/3239]	Time 0.483 (0.515)	Data 0.001 (0.011)	Loss 4.2009 (4.2293)	Top-1 acc 24.219 (26.641)	Top-5 acc 51.172 (49.458)	lr 0.01389
Warmup Train [26][2800/3239]	Time 0.531 (0.515)	Data 0.003 (0.011)	Loss 4.0819 (4.2295)	Top-1 acc 31.641 (26.635)	Top-5 acc 53.125 (49.452)	lr 0.01389
Warmup Train [26][2810/3239]	Time 0.501 (0.515)	Data 0.001 (0.011)	Loss 4.2463 (4.2297)	Top-1 acc 26.562 (26.634)	Top-5 acc 49.609 (49.447)	lr 0.01388
Warmup Train [26][2820/3239]	Time 0.590 (0.515)	Data 0.001 (0.011)	Loss 4.1105 (4.2295)	Top-1 acc 25.391 (26.636)	Top-5 acc 51.172 (49.454)	lr 0.01388
Warmup Train [26][2830/3239]	Time 0.529 (0.515)	Data 0.001 (0.011)	Loss 4.2794 (4.2295)	Top-1 acc 22.656 (26.636)	Top-5 acc 50.000 (49.453)	lr 0.01387
Warmup Train [26][2840/3239]	Time 0.363 (0.514)	Data 0.001 (0.011)	Loss 4.2797 (4.2293)	Top-1 acc 28.125 (26.644)	Top-5 acc 48.438 (49.457)	lr 0.01387
Warmup Train [26][2850/3239]	Time 0.516 (0.515)	Data 0.001 (0.011)	Loss 4.1479 (4.2293)	Top-1 acc 27.344 (26.644)	Top-5 acc 48.438 (49.457)	lr 0.01386
Warmup Train [26][2860/3239]	Time 0.499 (0.515)	Data 0.001 (0.011)	Loss 4.2170 (4.2291)	Top-1 acc 28.125 (26.644)	Top-5 acc 48.438 (49.460)	lr 0.01386
Warmup Train [26][2870/3239]	Time 0.637 (0.515)	Data 0.001 (0.011)	Loss 4.1695 (4.2292)	Top-1 acc 27.734 (26.639)	Top-5 acc 51.953 (49.460)	lr 0.01385
Warmup Train [26][2880/3239]	Time 0.662 (0.515)	Data 0.001 (0.011)	Loss 4.2214 (4.2291)	Top-1 acc 26.172 (26.640)	Top-5 acc 48.047 (49.465)	lr 0.01385
Warmup Train [26][2890/3239]	Time 0.610 (0.515)	Data 0.001 (0.011)	Loss 4.1657 (4.2291)	Top-1 acc 30.078 (26.639)	Top-5 acc 51.562 (49.460)	lr 0.01384
Warmup Train [26][2900/3239]	Time 0.533 (0.515)	Data 0.001 (0.011)	Loss 4.2813 (4.2290)	Top-1 acc 24.219 (26.642)	Top-5 acc 47.656 (49.462)	lr 0.01383
Warmup Train [26][2910/3239]	Time 0.623 (0.515)	Data 0.001 (0.011)	Loss 4.3435 (4.2292)	Top-1 acc 23.438 (26.639)	Top-5 acc 46.875 (49.458)	lr 0.01383
Warmup Train [26][2920/3239]	Time 0.595 (0.515)	Data 0.001 (0.011)	Loss 4.3382 (4.2293)	Top-1 acc 22.656 (26.637)	Top-5 acc 47.266 (49.455)	lr 0.01382
Warmup Train [26][2930/3239]	Time 0.626 (0.515)	Data 0.001 (0.011)	Loss 4.1172 (4.2292)	Top-1 acc 29.688 (26.637)	Top-5 acc 54.297 (49.455)	lr 0.01382
Warmup Train [26][2940/3239]	Time 0.483 (0.515)	Data 0.001 (0.011)	Loss 4.2791 (4.2292)	Top-1 acc 26.172 (26.637)	Top-5 acc 45.312 (49.452)	lr 0.01381
Warmup Train [26][2950/3239]	Time 0.598 (0.515)	Data 0.001 (0.011)	Loss 4.1249 (4.2292)	Top-1 acc 26.953 (26.635)	Top-5 acc 52.344 (49.453)	lr 0.01381
Warmup Train [26][2960/3239]	Time 0.411 (0.515)	Data 0.001 (0.011)	Loss 4.0250 (4.2290)	Top-1 acc 34.375 (26.639)	Top-5 acc 56.641 (49.459)	lr 0.01380
Warmup Train [26][2970/3239]	Time 0.429 (0.515)	Data 0.002 (0.011)	Loss 4.2777 (4.2290)	Top-1 acc 28.125 (26.638)	Top-5 acc 50.000 (49.459)	lr 0.01380
Warmup Train [26][2980/3239]	Time 0.556 (0.515)	Data 0.001 (0.011)	Loss 4.1513 (4.2290)	Top-1 acc 26.562 (26.637)	Top-5 acc 51.562 (49.458)	lr 0.01379
Warmup Train [26][2990/3239]	Time 0.535 (0.515)	Data 0.001 (0.010)	Loss 4.2391 (4.2288)	Top-1 acc 31.250 (26.644)	Top-5 acc 51.953 (49.460)	lr 0.01379
Warmup Train [26][3000/3239]	Time 0.514 (0.515)	Data 0.001 (0.011)	Loss 4.0250 (4.2286)	Top-1 acc 29.688 (26.650)	Top-5 acc 54.297 (49.467)	lr 0.01378
Warmup Train [26][3010/3239]	Time 0.464 (0.515)	Data 0.001 (0.010)	Loss 4.1009 (4.2283)	Top-1 acc 28.516 (26.652)	Top-5 acc 50.391 (49.474)	lr 0.01377
Warmup Train [26][3020/3239]	Time 0.617 (0.514)	Data 0.001 (0.010)	Loss 4.1971 (4.2281)	Top-1 acc 25.391 (26.655)	Top-5 acc 50.000 (49.476)	lr 0.01377
Warmup Train [26][3030/3239]	Time 0.508 (0.514)	Data 0.001 (0.010)	Loss 4.1089 (4.2280)	Top-1 acc 30.859 (26.656)	Top-5 acc 51.953 (49.479)	lr 0.01376
Warmup Train [26][3040/3239]	Time 0.527 (0.514)	Data 0.001 (0.010)	Loss 4.2854 (4.2282)	Top-1 acc 26.172 (26.650)	Top-5 acc 50.391 (49.476)	lr 0.01376
Warmup Train [26][3050/3239]	Time 0.350 (0.514)	Data 0.001 (0.010)	Loss 4.2717 (4.2283)	Top-1 acc 25.781 (26.649)	Top-5 acc 48.828 (49.475)	lr 0.01375
Warmup Train [26][3060/3239]	Time 0.517 (0.514)	Data 0.001 (0.010)	Loss 4.2262 (4.2281)	Top-1 acc 26.562 (26.651)	Top-5 acc 49.609 (49.477)	lr 0.01375
Warmup Train [26][3070/3239]	Time 0.496 (0.514)	Data 0.001 (0.010)	Loss 4.2134 (4.2281)	Top-1 acc 27.344 (26.653)	Top-5 acc 50.000 (49.477)	lr 0.01374
Warmup Train [26][3080/3239]	Time 0.496 (0.514)	Data 0.001 (0.010)	Loss 4.3226 (4.2280)	Top-1 acc 23.438 (26.657)	Top-5 acc 50.781 (49.483)	lr 0.01374
Warmup Train [26][3090/3239]	Time 0.593 (0.514)	Data 0.001 (0.010)	Loss 4.2326 (4.2280)	Top-1 acc 25.781 (26.659)	Top-5 acc 49.609 (49.485)	lr 0.01373
Warmup Train [26][3100/3239]	Time 0.359 (0.514)	Data 0.001 (0.010)	Loss 4.2403 (4.2278)	Top-1 acc 27.734 (26.664)	Top-5 acc 48.438 (49.489)	lr 0.01373
Warmup Train [26][3110/3239]	Time 0.677 (0.514)	Data 0.001 (0.010)	Loss 4.2843 (4.2278)	Top-1 acc 25.000 (26.666)	Top-5 acc 47.656 (49.489)	lr 0.01372
Warmup Train [26][3120/3239]	Time 0.642 (0.514)	Data 0.001 (0.010)	Loss 4.1775 (4.2277)	Top-1 acc 28.125 (26.672)	Top-5 acc 50.391 (49.492)	lr 0.01372
Warmup Train [26][3130/3239]	Time 0.682 (0.514)	Data 0.001 (0.010)	Loss 4.2116 (4.2275)	Top-1 acc 26.562 (26.676)	Top-5 acc 48.047 (49.494)	lr 0.01371
Warmup Train [26][3140/3239]	Time 0.479 (0.514)	Data 0.001 (0.010)	Loss 4.0525 (4.2273)	Top-1 acc 30.859 (26.681)	Top-5 acc 53.906 (49.503)	lr 0.01370
Warmup Train [26][3150/3239]	Time 0.400 (0.514)	Data 0.001 (0.010)	Loss 4.0429 (4.2273)	Top-1 acc 32.422 (26.685)	Top-5 acc 54.297 (49.506)	lr 0.01370
Warmup Train [26][3160/3239]	Time 0.729 (0.514)	Data 0.001 (0.010)	Loss 4.1250 (4.2273)	Top-1 acc 28.125 (26.688)	Top-5 acc 55.469 (49.511)	lr 0.01369
Warmup Train [26][3170/3239]	Time 0.657 (0.514)	Data 0.001 (0.010)	Loss 4.1711 (4.2273)	Top-1 acc 26.172 (26.686)	Top-5 acc 48.828 (49.511)	lr 0.01369
Warmup Train [26][3180/3239]	Time 0.560 (0.514)	Data 0.000 (0.010)	Loss 4.4827 (4.2273)	Top-1 acc 23.438 (26.687)	Top-5 acc 45.703 (49.512)	lr 0.01368
Warmup Train [26][3190/3239]	Time 0.545 (0.514)	Data 0.000 (0.010)	Loss 4.1292 (4.2270)	Top-1 acc 27.344 (26.693)	Top-5 acc 50.781 (49.516)	lr 0.01368
Warmup Train [26][3200/3239]	Time 0.496 (0.514)	Data 0.000 (0.010)	Loss 4.2418 (4.2269)	Top-1 acc 27.344 (26.695)	Top-5 acc 47.266 (49.515)	lr 0.01367
Warmup Train [26][3210/3239]	Time 0.378 (0.514)	Data 0.000 (0.010)	Loss 4.2210 (4.2271)	Top-1 acc 25.781 (26.694)	Top-5 acc 46.094 (49.511)	lr 0.01367
Warmup Train [26][3220/3239]	Time 0.579 (0.514)	Data 0.000 (0.010)	Loss 4.1672 (4.2270)	Top-1 acc 25.000 (26.696)	Top-5 acc 51.562 (49.514)	lr 0.01366
Warmup Train [26][3230/3239]	Time 0.511 (0.514)	Data 0.000 (0.010)	Loss 4.3089 (4.2269)	Top-1 acc 26.562 (26.700)	Top-5 acc 50.781 (49.517)	lr 0.01366
Warmup Train [26][3239/3239]	Time 0.372 (0.514)	Data 0.000 (0.010)	Loss 4.1464 (4.2268)	Top-1 acc 29.630 (26.697)	Top-5 acc 49.383 (49.514)	lr 0.01365
==========Warmup Valid [26/40]	loss 3.169	top-1 acc 34.362	top-5 acc 59.374	Train top-1 26.697	top-5 49.514	flops: 442.4M
Warmup Train [27][0/3239]	Time 14.495 (14.495)	Data 11.842 (11.842)	Loss 3.9085 (3.9085)	Top-1 acc 33.203 (33.203)	Top-5 acc 59.766 (59.766)	lr 0.01365
Warmup Train [27][10/3239]	Time 0.434 (1.828)	Data 0.001 (1.100)	Loss 4.1522 (4.1501)	Top-1 acc 28.906 (28.871)	Top-5 acc 53.516 (51.634)	lr 0.01364
Warmup Train [27][20/3239]	Time 0.551 (1.217)	Data 0.001 (0.583)	Loss 4.1770 (4.1779)	Top-1 acc 30.078 (27.697)	Top-5 acc 52.344 (50.763)	lr 0.01364
Warmup Train [27][30/3239]	Time 0.642 (0.995)	Data 0.001 (0.395)	Loss 4.0300 (4.1768)	Top-1 acc 30.469 (27.646)	Top-5 acc 55.078 (50.466)	lr 0.01363
Warmup Train [27][40/3239]	Time 0.422 (0.875)	Data 0.001 (0.299)	Loss 4.4733 (4.1913)	Top-1 acc 28.125 (27.563)	Top-5 acc 45.312 (50.124)	lr 0.01363
Warmup Train [27][50/3239]	Time 0.510 (0.802)	Data 0.001 (0.243)	Loss 4.3139 (4.1927)	Top-1 acc 26.172 (27.443)	Top-5 acc 50.391 (50.329)	lr 0.01362
Warmup Train [27][60/3239]	Time 0.577 (0.758)	Data 0.002 (0.205)	Loss 4.1463 (4.1892)	Top-1 acc 26.562 (27.517)	Top-5 acc 51.953 (50.301)	lr 0.01362
Warmup Train [27][70/3239]	Time 0.398 (0.721)	Data 0.001 (0.176)	Loss 4.2870 (4.1941)	Top-1 acc 26.172 (27.421)	Top-5 acc 49.609 (50.088)	lr 0.01361
Warmup Train [27][80/3239]	Time 0.523 (0.695)	Data 0.001 (0.157)	Loss 4.2900 (4.1975)	Top-1 acc 27.734 (27.387)	Top-5 acc 51.953 (50.034)	lr 0.01361
Warmup Train [27][90/3239]	Time 0.345 (0.674)	Data 0.001 (0.141)	Loss 4.2185 (4.2001)	Top-1 acc 28.906 (27.485)	Top-5 acc 52.344 (50.043)	lr 0.01360
Warmup Train [27][100/3239]	Time 0.481 (0.659)	Data 0.001 (0.129)	Loss 4.2520 (4.1944)	Top-1 acc 25.781 (27.533)	Top-5 acc 48.828 (50.197)	lr 0.01360
Warmup Train [27][110/3239]	Time 0.540 (0.645)	Data 0.002 (0.118)	Loss 4.2219 (4.1948)	Top-1 acc 25.781 (27.530)	Top-5 acc 50.391 (50.229)	lr 0.01359
Warmup Train [27][120/3239]	Time 0.489 (0.631)	Data 0.001 (0.108)	Loss 4.2729 (4.1993)	Top-1 acc 24.219 (27.515)	Top-5 acc 47.266 (50.148)	lr 0.01359
Warmup Train [27][130/3239]	Time 0.188 (0.617)	Data 0.001 (0.100)	Loss 4.2640 (4.1978)	Top-1 acc 28.125 (27.549)	Top-5 acc 47.266 (50.194)	lr 0.01358
Warmup Train [27][140/3239]	Time 0.384 (0.610)	Data 0.001 (0.095)	Loss 4.1810 (4.1943)	Top-1 acc 25.391 (27.516)	Top-5 acc 46.094 (50.197)	lr 0.01357
Warmup Train [27][150/3239]	Time 0.497 (0.605)	Data 0.001 (0.089)	Loss 4.1369 (4.1987)	Top-1 acc 26.172 (27.395)	Top-5 acc 55.078 (50.129)	lr 0.01357
Warmup Train [27][160/3239]	Time 0.563 (0.598)	Data 0.001 (0.084)	Loss 4.2051 (4.2022)	Top-1 acc 28.906 (27.339)	Top-5 acc 48.828 (50.039)	lr 0.01356
Warmup Train [27][170/3239]	Time 0.472 (0.594)	Data 0.001 (0.079)	Loss 4.0938 (4.2039)	Top-1 acc 33.203 (27.262)	Top-5 acc 51.562 (50.041)	lr 0.01356
Warmup Train [27][180/3239]	Time 0.546 (0.590)	Data 0.001 (0.075)	Loss 4.0005 (4.2023)	Top-1 acc 32.031 (27.329)	Top-5 acc 55.078 (50.043)	lr 0.01355
Warmup Train [27][190/3239]	Time 0.591 (0.588)	Data 0.001 (0.071)	Loss 4.2373 (4.2015)	Top-1 acc 24.609 (27.362)	Top-5 acc 49.219 (50.076)	lr 0.01355
Warmup Train [27][200/3239]	Time 0.566 (0.584)	Data 0.001 (0.068)	Loss 4.1569 (4.1990)	Top-1 acc 28.906 (27.398)	Top-5 acc 49.609 (50.177)	lr 0.01354
Warmup Train [27][210/3239]	Time 0.583 (0.580)	Data 0.001 (0.065)	Loss 4.1834 (4.2026)	Top-1 acc 28.906 (27.309)	Top-5 acc 51.562 (50.117)	lr 0.01354
Warmup Train [27][220/3239]	Time 0.562 (0.578)	Data 0.001 (0.062)	Loss 4.3730 (4.2013)	Top-1 acc 23.438 (27.303)	Top-5 acc 48.438 (50.166)	lr 0.01353
Warmup Train [27][230/3239]	Time 0.311 (0.575)	Data 0.001 (0.059)	Loss 4.4067 (4.2004)	Top-1 acc 21.484 (27.320)	Top-5 acc 44.922 (50.161)	lr 0.01353
Warmup Train [27][240/3239]	Time 0.537 (0.573)	Data 0.001 (0.058)	Loss 4.3708 (4.2028)	Top-1 acc 21.875 (27.259)	Top-5 acc 42.578 (50.099)	lr 0.01352
Warmup Train [27][250/3239]	Time 0.517 (0.571)	Data 0.001 (0.055)	Loss 4.0478 (4.2031)	Top-1 acc 28.125 (27.294)	Top-5 acc 53.125 (50.100)	lr 0.01352
Warmup Train [27][260/3239]	Time 0.560 (0.569)	Data 0.001 (0.054)	Loss 4.3522 (4.2050)	Top-1 acc 25.000 (27.306)	Top-5 acc 49.609 (50.064)	lr 0.01351
Warmup Train [27][270/3239]	Time 0.360 (0.567)	Data 0.001 (0.052)	Loss 4.2544 (4.2041)	Top-1 acc 24.609 (27.306)	Top-5 acc 47.656 (50.095)	lr 0.01350
Warmup Train [27][280/3239]	Time 0.615 (0.566)	Data 0.001 (0.051)	Loss 4.2501 (4.2018)	Top-1 acc 26.562 (27.334)	Top-5 acc 48.438 (50.182)	lr 0.01350
Warmup Train [27][290/3239]	Time 0.642 (0.564)	Data 0.001 (0.049)	Loss 4.2596 (4.2029)	Top-1 acc 25.781 (27.281)	Top-5 acc 50.000 (50.141)	lr 0.01349
Warmup Train [27][300/3239]	Time 0.518 (0.563)	Data 0.002 (0.047)	Loss 4.1372 (4.2027)	Top-1 acc 30.469 (27.257)	Top-5 acc 50.000 (50.114)	lr 0.01349
Warmup Train [27][310/3239]	Time 0.557 (0.561)	Data 0.001 (0.046)	Loss 4.1140 (4.2004)	Top-1 acc 29.297 (27.285)	Top-5 acc 49.609 (50.156)	lr 0.01348
Warmup Train [27][320/3239]	Time 0.497 (0.560)	Data 0.001 (0.045)	Loss 4.2017 (4.2020)	Top-1 acc 26.562 (27.252)	Top-5 acc 51.172 (50.117)	lr 0.01348
Warmup Train [27][330/3239]	Time 0.374 (0.558)	Data 0.001 (0.043)	Loss 4.2790 (4.2031)	Top-1 acc 26.562 (27.264)	Top-5 acc 50.781 (50.114)	lr 0.01347
Warmup Train [27][340/3239]	Time 0.500 (0.556)	Data 0.001 (0.042)	Loss 4.2913 (4.2033)	Top-1 acc 25.781 (27.256)	Top-5 acc 50.000 (50.150)	lr 0.01347
Warmup Train [27][350/3239]	Time 0.218 (0.554)	Data 0.001 (0.041)	Loss 4.2222 (4.2023)	Top-1 acc 27.344 (27.274)	Top-5 acc 50.781 (50.188)	lr 0.01346
Warmup Train [27][360/3239]	Time 0.513 (0.552)	Data 0.001 (0.041)	Loss 4.1713 (4.2028)	Top-1 acc 29.297 (27.257)	Top-5 acc 52.734 (50.161)	lr 0.01346
Warmup Train [27][370/3239]	Time 0.321 (0.550)	Data 0.001 (0.040)	Loss 3.8074 (4.2006)	Top-1 acc 33.984 (27.283)	Top-5 acc 56.641 (50.201)	lr 0.01345
Warmup Train [27][380/3239]	Time 0.515 (0.548)	Data 0.001 (0.039)	Loss 4.4689 (4.2013)	Top-1 acc 25.781 (27.274)	Top-5 acc 44.531 (50.185)	lr 0.01345
Warmup Train [27][390/3239]	Time 0.544 (0.547)	Data 0.001 (0.039)	Loss 4.2630 (4.2005)	Top-1 acc 22.266 (27.289)	Top-5 acc 47.266 (50.195)	lr 0.01344
Warmup Train [27][400/3239]	Time 0.476 (0.546)	Data 0.001 (0.038)	Loss 4.5092 (4.2018)	Top-1 acc 21.875 (27.245)	Top-5 acc 41.797 (50.144)	lr 0.01343
Warmup Train [27][410/3239]	Time 0.434 (0.545)	Data 0.001 (0.037)	Loss 4.0643 (4.2020)	Top-1 acc 32.031 (27.239)	Top-5 acc 53.516 (50.149)	lr 0.01343
Warmup Train [27][420/3239]	Time 0.406 (0.544)	Data 0.001 (0.036)	Loss 4.4197 (4.2016)	Top-1 acc 27.344 (27.233)	Top-5 acc 47.266 (50.143)	lr 0.01342
Warmup Train [27][430/3239]	Time 0.476 (0.543)	Data 0.001 (0.036)	Loss 4.1452 (4.2013)	Top-1 acc 27.344 (27.219)	Top-5 acc 51.562 (50.143)	lr 0.01342
Warmup Train [27][440/3239]	Time 0.484 (0.542)	Data 0.001 (0.035)	Loss 4.0428 (4.2030)	Top-1 acc 30.469 (27.183)	Top-5 acc 51.953 (50.110)	lr 0.01341
Warmup Train [27][450/3239]	Time 0.635 (0.542)	Data 0.001 (0.034)	Loss 4.0755 (4.2018)	Top-1 acc 28.516 (27.207)	Top-5 acc 51.562 (50.123)	lr 0.01341
Warmup Train [27][460/3239]	Time 0.527 (0.542)	Data 0.001 (0.033)	Loss 4.2987 (4.2023)	Top-1 acc 25.000 (27.188)	Top-5 acc 48.438 (50.097)	lr 0.01340
Warmup Train [27][470/3239]	Time 0.345 (0.540)	Data 0.001 (0.033)	Loss 4.3596 (4.2032)	Top-1 acc 25.781 (27.165)	Top-5 acc 47.656 (50.074)	lr 0.01340
Warmup Train [27][480/3239]	Time 0.514 (0.540)	Data 0.002 (0.032)	Loss 4.1252 (4.2027)	Top-1 acc 29.688 (27.181)	Top-5 acc 53.125 (50.097)	lr 0.01339
Warmup Train [27][490/3239]	Time 0.571 (0.540)	Data 0.001 (0.032)	Loss 4.1868 (4.2032)	Top-1 acc 31.250 (27.176)	Top-5 acc 48.828 (50.082)	lr 0.01339
Warmup Train [27][500/3239]	Time 0.584 (0.539)	Data 0.001 (0.031)	Loss 4.1789 (4.2021)	Top-1 acc 25.781 (27.221)	Top-5 acc 48.047 (50.110)	lr 0.01338
Warmup Train [27][510/3239]	Time 0.552 (0.538)	Data 0.001 (0.031)	Loss 4.3297 (4.2023)	Top-1 acc 26.953 (27.222)	Top-5 acc 49.219 (50.105)	lr 0.01338
Warmup Train [27][520/3239]	Time 0.496 (0.538)	Data 0.001 (0.030)	Loss 4.0789 (4.2023)	Top-1 acc 27.344 (27.202)	Top-5 acc 52.344 (50.112)	lr 0.01337
Warmup Train [27][530/3239]	Time 0.597 (0.538)	Data 0.001 (0.030)	Loss 4.4232 (4.2024)	Top-1 acc 22.266 (27.208)	Top-5 acc 45.312 (50.104)	lr 0.01337
Warmup Train [27][540/3239]	Time 0.457 (0.537)	Data 0.001 (0.029)	Loss 4.2301 (4.2032)	Top-1 acc 26.953 (27.189)	Top-5 acc 50.781 (50.079)	lr 0.01336
Warmup Train [27][550/3239]	Time 0.498 (0.536)	Data 0.001 (0.029)	Loss 3.8864 (4.2017)	Top-1 acc 32.812 (27.215)	Top-5 acc 55.078 (50.111)	lr 0.01335
Warmup Train [27][560/3239]	Time 0.570 (0.535)	Data 0.001 (0.028)	Loss 4.1556 (4.2022)	Top-1 acc 26.953 (27.216)	Top-5 acc 51.172 (50.091)	lr 0.01335
Warmup Train [27][570/3239]	Time 0.455 (0.535)	Data 0.001 (0.028)	Loss 4.1178 (4.2021)	Top-1 acc 30.078 (27.229)	Top-5 acc 49.609 (50.084)	lr 0.01334
Warmup Train [27][580/3239]	Time 0.286 (0.533)	Data 0.001 (0.027)	Loss 4.1706 (4.2023)	Top-1 acc 28.906 (27.219)	Top-5 acc 50.000 (50.084)	lr 0.01334
Warmup Train [27][590/3239]	Time 0.492 (0.533)	Data 0.001 (0.027)	Loss 4.0618 (4.2012)	Top-1 acc 27.734 (27.226)	Top-5 acc 56.641 (50.120)	lr 0.01333
Warmup Train [27][600/3239]	Time 0.628 (0.532)	Data 0.001 (0.027)	Loss 4.1040 (4.2014)	Top-1 acc 28.516 (27.222)	Top-5 acc 51.953 (50.107)	lr 0.01333
Warmup Train [27][610/3239]	Time 0.509 (0.532)	Data 0.001 (0.026)	Loss 4.1765 (4.2014)	Top-1 acc 28.906 (27.210)	Top-5 acc 53.516 (50.098)	lr 0.01332
Warmup Train [27][620/3239]	Time 0.491 (0.530)	Data 0.002 (0.026)	Loss 3.9172 (4.2009)	Top-1 acc 32.422 (27.212)	Top-5 acc 57.031 (50.126)	lr 0.01332
Warmup Train [27][630/3239]	Time 0.506 (0.530)	Data 0.001 (0.026)	Loss 4.3253 (4.2008)	Top-1 acc 27.344 (27.216)	Top-5 acc 50.391 (50.136)	lr 0.01331
Warmup Train [27][640/3239]	Time 0.500 (0.530)	Data 0.001 (0.025)	Loss 4.2134 (4.2006)	Top-1 acc 26.562 (27.224)	Top-5 acc 52.344 (50.150)	lr 0.01331
Warmup Train [27][650/3239]	Time 0.447 (0.529)	Data 0.001 (0.025)	Loss 4.1008 (4.1998)	Top-1 acc 32.031 (27.248)	Top-5 acc 51.562 (50.173)	lr 0.01330
Warmup Train [27][660/3239]	Time 0.500 (0.529)	Data 0.001 (0.025)	Loss 4.1682 (4.2000)	Top-1 acc 26.172 (27.247)	Top-5 acc 50.000 (50.162)	lr 0.01330
Warmup Train [27][670/3239]	Time 0.498 (0.529)	Data 0.001 (0.025)	Loss 4.3079 (4.2003)	Top-1 acc 26.562 (27.249)	Top-5 acc 51.172 (50.152)	lr 0.01329
Warmup Train [27][680/3239]	Time 0.579 (0.529)	Data 0.001 (0.024)	Loss 4.0564 (4.1999)	Top-1 acc 31.250 (27.259)	Top-5 acc 53.125 (50.151)	lr 0.01328
Warmup Train [27][690/3239]	Time 0.357 (0.528)	Data 0.001 (0.024)	Loss 4.2418 (4.1999)	Top-1 acc 27.344 (27.256)	Top-5 acc 50.391 (50.165)	lr 0.01328
Warmup Train [27][700/3239]	Time 0.435 (0.528)	Data 0.003 (0.024)	Loss 4.3056 (4.2001)	Top-1 acc 25.781 (27.260)	Top-5 acc 49.219 (50.168)	lr 0.01327
Warmup Train [27][710/3239]	Time 0.510 (0.528)	Data 0.001 (0.024)	Loss 4.1666 (4.1992)	Top-1 acc 30.078 (27.262)	Top-5 acc 51.562 (50.191)	lr 0.01327
Warmup Train [27][720/3239]	Time 0.605 (0.528)	Data 0.001 (0.023)	Loss 4.2232 (4.1988)	Top-1 acc 25.781 (27.259)	Top-5 acc 51.562 (50.192)	lr 0.01326
Warmup Train [27][730/3239]	Time 0.558 (0.528)	Data 0.001 (0.023)	Loss 4.1906 (4.1983)	Top-1 acc 27.734 (27.271)	Top-5 acc 51.562 (50.196)	lr 0.01326
Warmup Train [27][740/3239]	Time 0.588 (0.528)	Data 0.001 (0.023)	Loss 4.2411 (4.1969)	Top-1 acc 27.734 (27.311)	Top-5 acc 48.438 (50.234)	lr 0.01325
Warmup Train [27][750/3239]	Time 0.556 (0.528)	Data 0.026 (0.023)	Loss 3.9566 (4.1967)	Top-1 acc 30.078 (27.319)	Top-5 acc 56.250 (50.231)	lr 0.01325
Warmup Train [27][760/3239]	Time 0.441 (0.528)	Data 0.001 (0.022)	Loss 4.2477 (4.1966)	Top-1 acc 27.344 (27.322)	Top-5 acc 48.828 (50.234)	lr 0.01324
Warmup Train [27][770/3239]	Time 0.486 (0.528)	Data 0.002 (0.022)	Loss 4.3343 (4.1972)	Top-1 acc 27.734 (27.314)	Top-5 acc 50.391 (50.220)	lr 0.01324
Warmup Train [27][780/3239]	Time 0.429 (0.528)	Data 0.001 (0.022)	Loss 4.4475 (4.1976)	Top-1 acc 19.922 (27.297)	Top-5 acc 45.312 (50.204)	lr 0.01323
Warmup Train [27][790/3239]	Time 0.532 (0.527)	Data 0.001 (0.022)	Loss 4.2027 (4.1979)	Top-1 acc 26.562 (27.300)	Top-5 acc 48.047 (50.204)	lr 0.01323
Warmup Train [27][800/3239]	Time 0.565 (0.528)	Data 0.001 (0.022)	Loss 4.3221 (4.1978)	Top-1 acc 22.266 (27.309)	Top-5 acc 49.219 (50.208)	lr 0.01322
Warmup Train [27][810/3239]	Time 0.557 (0.527)	Data 0.002 (0.021)	Loss 4.0824 (4.1979)	Top-1 acc 26.953 (27.307)	Top-5 acc 51.562 (50.212)	lr 0.01322
Warmup Train [27][820/3239]	Time 0.442 (0.527)	Data 0.001 (0.021)	Loss 4.0493 (4.1976)	Top-1 acc 29.297 (27.319)	Top-5 acc 47.656 (50.217)	lr 0.01321
Warmup Train [27][830/3239]	Time 0.457 (0.526)	Data 0.001 (0.021)	Loss 4.3952 (4.1979)	Top-1 acc 23.828 (27.324)	Top-5 acc 43.359 (50.202)	lr 0.01320
Warmup Train [27][840/3239]	Time 0.379 (0.526)	Data 0.001 (0.021)	Loss 4.3857 (4.1990)	Top-1 acc 23.828 (27.297)	Top-5 acc 46.484 (50.165)	lr 0.01320
Warmup Train [27][850/3239]	Time 0.480 (0.525)	Data 0.001 (0.021)	Loss 4.1206 (4.1988)	Top-1 acc 30.078 (27.306)	Top-5 acc 50.000 (50.171)	lr 0.01319
Warmup Train [27][860/3239]	Time 0.376 (0.525)	Data 0.001 (0.021)	Loss 4.1564 (4.1981)	Top-1 acc 25.000 (27.305)	Top-5 acc 51.562 (50.192)	lr 0.01319
Warmup Train [27][870/3239]	Time 0.577 (0.525)	Data 0.001 (0.021)	Loss 4.0643 (4.1981)	Top-1 acc 30.078 (27.298)	Top-5 acc 53.125 (50.188)	lr 0.01318
Warmup Train [27][880/3239]	Time 0.697 (0.525)	Data 0.001 (0.021)	Loss 4.0517 (4.1977)	Top-1 acc 31.250 (27.307)	Top-5 acc 54.688 (50.201)	lr 0.01318
Warmup Train [27][890/3239]	Time 0.571 (0.525)	Data 0.001 (0.020)	Loss 4.2430 (4.1973)	Top-1 acc 26.172 (27.314)	Top-5 acc 46.875 (50.203)	lr 0.01317
Warmup Train [27][900/3239]	Time 0.510 (0.525)	Data 0.001 (0.020)	Loss 4.1766 (4.1972)	Top-1 acc 26.953 (27.320)	Top-5 acc 51.562 (50.202)	lr 0.01317
Warmup Train [27][910/3239]	Time 0.587 (0.525)	Data 0.001 (0.020)	Loss 4.3182 (4.1972)	Top-1 acc 26.172 (27.327)	Top-5 acc 44.922 (50.192)	lr 0.01316
Warmup Train [27][920/3239]	Time 0.489 (0.525)	Data 0.001 (0.020)	Loss 4.1823 (4.1974)	Top-1 acc 24.609 (27.322)	Top-5 acc 48.828 (50.189)	lr 0.01316
Warmup Train [27][930/3239]	Time 0.478 (0.524)	Data 0.001 (0.020)	Loss 3.9914 (4.1966)	Top-1 acc 31.641 (27.339)	Top-5 acc 52.344 (50.207)	lr 0.01315
Warmup Train [27][940/3239]	Time 0.452 (0.524)	Data 0.001 (0.019)	Loss 4.0161 (4.1963)	Top-1 acc 29.688 (27.351)	Top-5 acc 55.859 (50.217)	lr 0.01315
Warmup Train [27][950/3239]	Time 0.524 (0.524)	Data 0.001 (0.019)	Loss 4.2273 (4.1963)	Top-1 acc 23.828 (27.341)	Top-5 acc 48.438 (50.214)	lr 0.01314
Warmup Train [27][960/3239]	Time 0.500 (0.524)	Data 0.001 (0.019)	Loss 4.2691 (4.1970)	Top-1 acc 24.219 (27.325)	Top-5 acc 48.438 (50.197)	lr 0.01313
Warmup Train [27][970/3239]	Time 0.620 (0.524)	Data 0.001 (0.019)	Loss 4.1856 (4.1969)	Top-1 acc 25.000 (27.326)	Top-5 acc 51.953 (50.197)	lr 0.01313
Warmup Train [27][980/3239]	Time 0.505 (0.524)	Data 0.001 (0.019)	Loss 4.2183 (4.1974)	Top-1 acc 25.781 (27.318)	Top-5 acc 51.953 (50.182)	lr 0.01312
Warmup Train [27][990/3239]	Time 0.308 (0.524)	Data 0.001 (0.019)	Loss 4.3192 (4.1972)	Top-1 acc 28.906 (27.321)	Top-5 acc 49.609 (50.181)	lr 0.01312
Warmup Train [27][1000/3239]	Time 0.552 (0.524)	Data 0.001 (0.019)	Loss 4.3959 (4.1970)	Top-1 acc 23.828 (27.320)	Top-5 acc 48.047 (50.179)	lr 0.01311
Warmup Train [27][1010/3239]	Time 0.522 (0.524)	Data 0.001 (0.019)	Loss 4.5192 (4.1972)	Top-1 acc 23.047 (27.309)	Top-5 acc 41.797 (50.168)	lr 0.01311
Warmup Train [27][1020/3239]	Time 0.370 (0.524)	Data 0.001 (0.018)	Loss 4.1247 (4.1970)	Top-1 acc 28.906 (27.315)	Top-5 acc 49.609 (50.166)	lr 0.01310
Warmup Train [27][1030/3239]	Time 0.475 (0.524)	Data 0.001 (0.018)	Loss 4.3641 (4.1969)	Top-1 acc 23.828 (27.309)	Top-5 acc 44.531 (50.167)	lr 0.01310
Warmup Train [27][1040/3239]	Time 0.565 (0.524)	Data 0.001 (0.018)	Loss 4.3779 (4.1967)	Top-1 acc 23.047 (27.316)	Top-5 acc 46.484 (50.172)	lr 0.01309
Warmup Train [27][1050/3239]	Time 0.485 (0.524)	Data 0.001 (0.018)	Loss 4.1871 (4.1971)	Top-1 acc 25.781 (27.307)	Top-5 acc 51.172 (50.165)	lr 0.01309
Warmup Train [27][1060/3239]	Time 0.568 (0.524)	Data 0.001 (0.018)	Loss 4.3041 (4.1973)	Top-1 acc 26.953 (27.312)	Top-5 acc 52.344 (50.158)	lr 0.01308
Warmup Train [27][1070/3239]	Time 0.630 (0.523)	Data 0.001 (0.018)	Loss 4.1484 (4.1979)	Top-1 acc 25.781 (27.287)	Top-5 acc 53.906 (50.147)	lr 0.01308
Warmup Train [27][1080/3239]	Time 0.555 (0.523)	Data 0.001 (0.018)	Loss 4.1449 (4.1978)	Top-1 acc 29.688 (27.298)	Top-5 acc 52.344 (50.156)	lr 0.01307
Warmup Train [27][1090/3239]	Time 0.428 (0.523)	Data 0.001 (0.018)	Loss 4.2433 (4.1973)	Top-1 acc 28.516 (27.300)	Top-5 acc 48.047 (50.174)	lr 0.01307
Warmup Train [27][1100/3239]	Time 0.520 (0.522)	Data 0.001 (0.018)	Loss 4.1737 (4.1977)	Top-1 acc 28.125 (27.294)	Top-5 acc 46.875 (50.162)	lr 0.01306
Warmup Train [27][1110/3239]	Time 0.580 (0.522)	Data 0.001 (0.017)	Loss 4.1970 (4.1979)	Top-1 acc 25.781 (27.287)	Top-5 acc 47.656 (50.153)	lr 0.01306
Warmup Train [27][1120/3239]	Time 0.599 (0.522)	Data 0.001 (0.017)	Loss 4.1944 (4.1981)	Top-1 acc 26.953 (27.291)	Top-5 acc 53.125 (50.163)	lr 0.01305
Warmup Train [27][1130/3239]	Time 0.619 (0.522)	Data 0.001 (0.017)	Loss 4.1324 (4.1980)	Top-1 acc 26.562 (27.295)	Top-5 acc 51.953 (50.172)	lr 0.01304
Warmup Train [27][1140/3239]	Time 0.624 (0.522)	Data 0.001 (0.017)	Loss 4.2113 (4.1980)	Top-1 acc 26.953 (27.294)	Top-5 acc 52.344 (50.172)	lr 0.01304
Warmup Train [27][1150/3239]	Time 0.484 (0.522)	Data 0.001 (0.017)	Loss 4.0119 (4.1979)	Top-1 acc 33.594 (27.298)	Top-5 acc 55.078 (50.187)	lr 0.01303
Warmup Train [27][1160/3239]	Time 0.621 (0.522)	Data 0.001 (0.017)	Loss 4.0633 (4.1979)	Top-1 acc 30.859 (27.299)	Top-5 acc 54.688 (50.192)	lr 0.01303
Warmup Train [27][1170/3239]	Time 0.551 (0.522)	Data 0.001 (0.017)	Loss 4.2654 (4.1983)	Top-1 acc 28.906 (27.289)	Top-5 acc 49.609 (50.188)	lr 0.01302
Warmup Train [27][1180/3239]	Time 0.504 (0.522)	Data 0.001 (0.017)	Loss 4.2752 (4.1986)	Top-1 acc 27.344 (27.293)	Top-5 acc 47.266 (50.183)	lr 0.01302
Warmup Train [27][1190/3239]	Time 0.522 (0.522)	Data 0.001 (0.016)	Loss 4.2494 (4.1993)	Top-1 acc 26.562 (27.281)	Top-5 acc 49.609 (50.168)	lr 0.01301
Warmup Train [27][1200/3239]	Time 0.587 (0.522)	Data 0.001 (0.016)	Loss 4.2651 (4.1996)	Top-1 acc 24.609 (27.283)	Top-5 acc 46.875 (50.166)	lr 0.01301
Warmup Train [27][1210/3239]	Time 0.720 (0.522)	Data 0.001 (0.016)	Loss 4.3746 (4.1990)	Top-1 acc 24.609 (27.294)	Top-5 acc 44.922 (50.180)	lr 0.01300
Warmup Train [27][1220/3239]	Time 0.470 (0.522)	Data 0.001 (0.016)	Loss 4.4057 (4.1993)	Top-1 acc 24.219 (27.291)	Top-5 acc 43.750 (50.172)	lr 0.01300
Warmup Train [27][1230/3239]	Time 0.644 (0.522)	Data 0.001 (0.016)	Loss 4.2290 (4.1991)	Top-1 acc 25.000 (27.292)	Top-5 acc 46.484 (50.176)	lr 0.01299
Warmup Train [27][1240/3239]	Time 0.503 (0.522)	Data 0.001 (0.016)	Loss 4.1119 (4.1994)	Top-1 acc 27.344 (27.283)	Top-5 acc 50.000 (50.166)	lr 0.01299
Warmup Train [27][1250/3239]	Time 0.509 (0.522)	Data 0.001 (0.016)	Loss 4.3710 (4.1992)	Top-1 acc 22.266 (27.284)	Top-5 acc 46.484 (50.166)	lr 0.01298
Warmup Train [27][1260/3239]	Time 0.522 (0.522)	Data 0.001 (0.016)	Loss 4.1310 (4.1988)	Top-1 acc 25.000 (27.290)	Top-5 acc 49.219 (50.174)	lr 0.01298
Warmup Train [27][1270/3239]	Time 0.561 (0.522)	Data 0.001 (0.016)	Loss 4.2458 (4.1988)	Top-1 acc 26.562 (27.290)	Top-5 acc 48.438 (50.170)	lr 0.01297
Warmup Train [27][1280/3239]	Time 0.523 (0.522)	Data 0.001 (0.016)	Loss 4.3125 (4.1988)	Top-1 acc 25.781 (27.292)	Top-5 acc 49.219 (50.177)	lr 0.01296
Warmup Train [27][1290/3239]	Time 0.510 (0.522)	Data 0.001 (0.016)	Loss 4.3856 (4.1990)	Top-1 acc 25.781 (27.284)	Top-5 acc 44.531 (50.175)	lr 0.01296
Warmup Train [27][1300/3239]	Time 0.359 (0.522)	Data 0.001 (0.015)	Loss 4.0996 (4.1988)	Top-1 acc 24.609 (27.289)	Top-5 acc 51.172 (50.177)	lr 0.01295
Warmup Train [27][1310/3239]	Time 0.490 (0.521)	Data 0.001 (0.015)	Loss 4.1577 (4.1986)	Top-1 acc 25.781 (27.297)	Top-5 acc 49.609 (50.178)	lr 0.01295
Warmup Train [27][1320/3239]	Time 0.530 (0.521)	Data 0.001 (0.015)	Loss 4.1025 (4.1983)	Top-1 acc 28.516 (27.301)	Top-5 acc 50.391 (50.182)	lr 0.01294
Warmup Train [27][1330/3239]	Time 0.455 (0.521)	Data 0.001 (0.015)	Loss 4.1561 (4.1986)	Top-1 acc 29.688 (27.305)	Top-5 acc 50.781 (50.175)	lr 0.01294
Warmup Train [27][1340/3239]	Time 0.309 (0.521)	Data 0.001 (0.015)	Loss 4.1423 (4.1984)	Top-1 acc 27.344 (27.316)	Top-5 acc 51.172 (50.186)	lr 0.01293
Warmup Train [27][1350/3239]	Time 0.586 (0.520)	Data 0.001 (0.015)	Loss 4.1444 (4.1981)	Top-1 acc 29.688 (27.333)	Top-5 acc 53.125 (50.191)	lr 0.01293
Warmup Train [27][1360/3239]	Time 0.525 (0.520)	Data 0.001 (0.015)	Loss 4.3058 (4.1981)	Top-1 acc 20.703 (27.327)	Top-5 acc 46.484 (50.189)	lr 0.01292
Warmup Train [27][1370/3239]	Time 0.533 (0.520)	Data 0.001 (0.015)	Loss 4.1514 (4.1980)	Top-1 acc 27.734 (27.330)	Top-5 acc 48.828 (50.186)	lr 0.01292
Warmup Train [27][1380/3239]	Time 0.676 (0.520)	Data 0.001 (0.015)	Loss 4.3713 (4.1976)	Top-1 acc 20.703 (27.332)	Top-5 acc 47.656 (50.194)	lr 0.01291
Warmup Train [27][1390/3239]	Time 0.531 (0.520)	Data 0.001 (0.015)	Loss 4.0212 (4.1973)	Top-1 acc 33.203 (27.336)	Top-5 acc 52.734 (50.198)	lr 0.01291
Warmup Train [27][1400/3239]	Time 0.679 (0.520)	Data 0.001 (0.015)	Loss 4.0422 (4.1970)	Top-1 acc 28.125 (27.340)	Top-5 acc 51.172 (50.201)	lr 0.01290
Warmup Train [27][1410/3239]	Time 0.456 (0.520)	Data 0.001 (0.015)	Loss 4.0150 (4.1971)	Top-1 acc 27.344 (27.325)	Top-5 acc 54.688 (50.200)	lr 0.01290
Warmup Train [27][1420/3239]	Time 0.523 (0.520)	Data 0.001 (0.015)	Loss 4.2051 (4.1967)	Top-1 acc 25.000 (27.331)	Top-5 acc 50.000 (50.214)	lr 0.01289
Warmup Train [27][1430/3239]	Time 0.501 (0.520)	Data 0.001 (0.015)	Loss 4.0655 (4.1966)	Top-1 acc 31.250 (27.331)	Top-5 acc 55.469 (50.216)	lr 0.01289
Warmup Train [27][1440/3239]	Time 0.490 (0.520)	Data 0.001 (0.015)	Loss 4.1996 (4.1964)	Top-1 acc 26.172 (27.331)	Top-5 acc 46.875 (50.219)	lr 0.01288
Warmup Train [27][1450/3239]	Time 0.501 (0.520)	Data 0.001 (0.015)	Loss 4.1427 (4.1962)	Top-1 acc 25.781 (27.334)	Top-5 acc 54.297 (50.219)	lr 0.01287
Warmup Train [27][1460/3239]	Time 0.462 (0.520)	Data 0.001 (0.014)	Loss 4.2704 (4.1962)	Top-1 acc 21.094 (27.327)	Top-5 acc 46.484 (50.219)	lr 0.01287
Warmup Train [27][1470/3239]	Time 0.526 (0.520)	Data 0.001 (0.014)	Loss 4.0552 (4.1957)	Top-1 acc 29.297 (27.333)	Top-5 acc 53.516 (50.227)	lr 0.01286
Warmup Train [27][1480/3239]	Time 0.507 (0.520)	Data 0.001 (0.014)	Loss 4.2646 (4.1960)	Top-1 acc 27.734 (27.333)	Top-5 acc 48.438 (50.223)	lr 0.01286
Warmup Train [27][1490/3239]	Time 0.488 (0.519)	Data 0.001 (0.014)	Loss 4.1763 (4.1960)	Top-1 acc 30.078 (27.334)	Top-5 acc 50.781 (50.218)	lr 0.01285
Warmup Train [27][1500/3239]	Time 0.619 (0.519)	Data 0.001 (0.014)	Loss 4.2532 (4.1960)	Top-1 acc 27.344 (27.331)	Top-5 acc 51.953 (50.220)	lr 0.01285
Warmup Train [27][1510/3239]	Time 0.342 (0.519)	Data 0.001 (0.014)	Loss 4.3451 (4.1966)	Top-1 acc 22.656 (27.320)	Top-5 acc 48.438 (50.211)	lr 0.01284
Warmup Train [27][1520/3239]	Time 0.569 (0.519)	Data 0.001 (0.014)	Loss 4.0410 (4.1961)	Top-1 acc 31.641 (27.331)	Top-5 acc 51.562 (50.221)	lr 0.01284
Warmup Train [27][1530/3239]	Time 0.648 (0.519)	Data 0.001 (0.014)	Loss 4.1873 (4.1959)	Top-1 acc 27.734 (27.338)	Top-5 acc 53.516 (50.224)	lr 0.01283
Warmup Train [27][1540/3239]	Time 0.335 (0.519)	Data 0.001 (0.014)	Loss 4.0279 (4.1958)	Top-1 acc 29.688 (27.344)	Top-5 acc 55.859 (50.227)	lr 0.01283
Warmup Train [27][1550/3239]	Time 0.463 (0.519)	Data 0.001 (0.014)	Loss 4.2593 (4.1960)	Top-1 acc 26.562 (27.339)	Top-5 acc 51.172 (50.223)	lr 0.01282
Warmup Train [27][1560/3239]	Time 0.457 (0.519)	Data 0.001 (0.014)	Loss 4.0658 (4.1960)	Top-1 acc 30.859 (27.334)	Top-5 acc 54.297 (50.219)	lr 0.01282
Warmup Train [27][1570/3239]	Time 0.511 (0.519)	Data 0.001 (0.014)	Loss 4.3482 (4.1961)	Top-1 acc 21.094 (27.323)	Top-5 acc 44.531 (50.221)	lr 0.01281
Warmup Train [27][1580/3239]	Time 0.347 (0.519)	Data 0.001 (0.014)	Loss 4.2944 (4.1962)	Top-1 acc 26.172 (27.322)	Top-5 acc 48.828 (50.213)	lr 0.01281
Warmup Train [27][1590/3239]	Time 0.490 (0.518)	Data 0.001 (0.014)	Loss 4.0949 (4.1963)	Top-1 acc 30.859 (27.323)	Top-5 acc 53.906 (50.213)	lr 0.01280
Warmup Train [27][1600/3239]	Time 0.518 (0.518)	Data 0.001 (0.014)	Loss 4.1572 (4.1965)	Top-1 acc 29.297 (27.316)	Top-5 acc 52.734 (50.214)	lr 0.01280
Warmup Train [27][1610/3239]	Time 0.622 (0.519)	Data 0.001 (0.014)	Loss 4.3551 (4.1965)	Top-1 acc 27.344 (27.320)	Top-5 acc 44.531 (50.218)	lr 0.01279
Warmup Train [27][1620/3239]	Time 0.601 (0.519)	Data 0.002 (0.014)	Loss 4.1857 (4.1962)	Top-1 acc 28.906 (27.322)	Top-5 acc 48.828 (50.224)	lr 0.01278
Warmup Train [27][1630/3239]	Time 0.675 (0.519)	Data 0.001 (0.014)	Loss 4.3289 (4.1963)	Top-1 acc 24.609 (27.323)	Top-5 acc 48.047 (50.226)	lr 0.01278
Warmup Train [27][1640/3239]	Time 0.588 (0.519)	Data 0.001 (0.014)	Loss 4.3079 (4.1964)	Top-1 acc 24.609 (27.320)	Top-5 acc 48.047 (50.225)	lr 0.01277
Warmup Train [27][1650/3239]	Time 0.547 (0.519)	Data 0.001 (0.014)	Loss 4.1534 (4.1963)	Top-1 acc 25.391 (27.322)	Top-5 acc 51.172 (50.229)	lr 0.01277
Warmup Train [27][1660/3239]	Time 0.622 (0.519)	Data 0.001 (0.014)	Loss 4.4011 (4.1965)	Top-1 acc 26.562 (27.322)	Top-5 acc 48.438 (50.231)	lr 0.01276
Warmup Train [27][1670/3239]	Time 0.403 (0.519)	Data 0.001 (0.013)	Loss 4.3228 (4.1969)	Top-1 acc 24.609 (27.319)	Top-5 acc 45.703 (50.227)	lr 0.01276
Warmup Train [27][1680/3239]	Time 0.546 (0.518)	Data 0.001 (0.013)	Loss 4.1763 (4.1972)	Top-1 acc 26.953 (27.314)	Top-5 acc 49.219 (50.213)	lr 0.01275
Warmup Train [27][1690/3239]	Time 0.433 (0.519)	Data 0.001 (0.013)	Loss 4.1888 (4.1968)	Top-1 acc 27.734 (27.322)	Top-5 acc 49.609 (50.224)	lr 0.01275
Warmup Train [27][1700/3239]	Time 0.590 (0.519)	Data 0.001 (0.013)	Loss 4.0400 (4.1966)	Top-1 acc 34.375 (27.334)	Top-5 acc 53.125 (50.230)	lr 0.01274
Warmup Train [27][1710/3239]	Time 0.536 (0.519)	Data 0.001 (0.013)	Loss 4.3586 (4.1968)	Top-1 acc 19.531 (27.331)	Top-5 acc 45.703 (50.225)	lr 0.01274
Warmup Train [27][1720/3239]	Time 0.539 (0.519)	Data 0.001 (0.013)	Loss 3.8819 (4.1966)	Top-1 acc 31.641 (27.334)	Top-5 acc 55.078 (50.225)	lr 0.01273
Warmup Train [27][1730/3239]	Time 0.660 (0.518)	Data 0.001 (0.013)	Loss 4.0597 (4.1965)	Top-1 acc 30.078 (27.328)	Top-5 acc 53.516 (50.219)	lr 0.01273
Warmup Train [27][1740/3239]	Time 0.503 (0.518)	Data 0.001 (0.013)	Loss 4.1463 (4.1967)	Top-1 acc 27.734 (27.331)	Top-5 acc 53.125 (50.214)	lr 0.01272
Warmup Train [27][1750/3239]	Time 0.494 (0.518)	Data 0.001 (0.013)	Loss 4.2767 (4.1964)	Top-1 acc 28.516 (27.332)	Top-5 acc 47.266 (50.223)	lr 0.01272
Warmup Train [27][1760/3239]	Time 0.541 (0.518)	Data 0.001 (0.013)	Loss 4.2852 (4.1963)	Top-1 acc 27.344 (27.335)	Top-5 acc 49.609 (50.233)	lr 0.01271
Warmup Train [27][1770/3239]	Time 0.637 (0.518)	Data 0.001 (0.013)	Loss 4.1464 (4.1963)	Top-1 acc 31.641 (27.334)	Top-5 acc 53.516 (50.230)	lr 0.01271
Warmup Train [27][1780/3239]	Time 0.500 (0.518)	Data 0.001 (0.013)	Loss 4.3093 (4.1966)	Top-1 acc 25.000 (27.329)	Top-5 acc 47.656 (50.224)	lr 0.01270
Warmup Train [27][1790/3239]	Time 0.377 (0.518)	Data 0.027 (0.013)	Loss 4.3261 (4.1964)	Top-1 acc 27.344 (27.339)	Top-5 acc 47.656 (50.231)	lr 0.01269
Warmup Train [27][1800/3239]	Time 0.575 (0.518)	Data 0.001 (0.013)	Loss 4.0833 (4.1962)	Top-1 acc 31.250 (27.341)	Top-5 acc 49.609 (50.234)	lr 0.01269
Warmup Train [27][1810/3239]	Time 0.392 (0.518)	Data 0.001 (0.013)	Loss 4.0586 (4.1961)	Top-1 acc 30.078 (27.347)	Top-5 acc 55.078 (50.237)	lr 0.01268
Warmup Train [27][1820/3239]	Time 0.470 (0.518)	Data 0.001 (0.013)	Loss 4.1604 (4.1960)	Top-1 acc 26.953 (27.351)	Top-5 acc 48.438 (50.234)	lr 0.01268
Warmup Train [27][1830/3239]	Time 0.633 (0.518)	Data 0.001 (0.013)	Loss 4.2174 (4.1958)	Top-1 acc 25.391 (27.354)	Top-5 acc 46.094 (50.236)	lr 0.01267
Warmup Train [27][1840/3239]	Time 0.534 (0.518)	Data 0.001 (0.013)	Loss 4.3417 (4.1959)	Top-1 acc 23.438 (27.351)	Top-5 acc 46.484 (50.229)	lr 0.01267
Warmup Train [27][1850/3239]	Time 0.510 (0.518)	Data 0.001 (0.013)	Loss 4.4100 (4.1960)	Top-1 acc 24.219 (27.343)	Top-5 acc 41.797 (50.226)	lr 0.01266
Warmup Train [27][1860/3239]	Time 0.529 (0.518)	Data 0.001 (0.013)	Loss 3.9981 (4.1961)	Top-1 acc 27.344 (27.340)	Top-5 acc 55.859 (50.225)	lr 0.01266
Warmup Train [27][1870/3239]	Time 0.640 (0.518)	Data 0.001 (0.013)	Loss 4.2462 (4.1962)	Top-1 acc 23.438 (27.337)	Top-5 acc 42.969 (50.220)	lr 0.01265
Warmup Train [27][1880/3239]	Time 0.434 (0.518)	Data 0.001 (0.013)	Loss 4.3172 (4.1965)	Top-1 acc 25.781 (27.329)	Top-5 acc 45.312 (50.212)	lr 0.01265
Warmup Train [27][1890/3239]	Time 0.485 (0.517)	Data 0.001 (0.013)	Loss 4.1410 (4.1965)	Top-1 acc 26.953 (27.331)	Top-5 acc 53.125 (50.215)	lr 0.01264
Warmup Train [27][1900/3239]	Time 0.362 (0.517)	Data 0.001 (0.012)	Loss 4.1499 (4.1962)	Top-1 acc 28.906 (27.335)	Top-5 acc 50.781 (50.216)	lr 0.01264
Warmup Train [27][1910/3239]	Time 0.595 (0.517)	Data 0.001 (0.012)	Loss 4.0125 (4.1962)	Top-1 acc 28.516 (27.334)	Top-5 acc 51.953 (50.216)	lr 0.01263
Warmup Train [27][1920/3239]	Time 0.443 (0.517)	Data 0.001 (0.012)	Loss 4.2768 (4.1964)	Top-1 acc 27.344 (27.330)	Top-5 acc 49.219 (50.215)	lr 0.01263
Warmup Train [27][1930/3239]	Time 0.614 (0.518)	Data 0.001 (0.012)	Loss 4.2214 (4.1962)	Top-1 acc 26.172 (27.333)	Top-5 acc 49.609 (50.219)	lr 0.01262
Warmup Train [27][1940/3239]	Time 0.599 (0.518)	Data 0.001 (0.012)	Loss 4.1852 (4.1961)	Top-1 acc 25.781 (27.333)	Top-5 acc 52.344 (50.220)	lr 0.01262
Warmup Train [27][1950/3239]	Time 0.520 (0.517)	Data 0.001 (0.012)	Loss 4.3145 (4.1961)	Top-1 acc 26.953 (27.334)	Top-5 acc 48.047 (50.222)	lr 0.01261
Warmup Train [27][1960/3239]	Time 0.499 (0.517)	Data 0.001 (0.012)	Loss 4.2724 (4.1962)	Top-1 acc 29.688 (27.339)	Top-5 acc 47.266 (50.216)	lr 0.01261
Warmup Train [27][1970/3239]	Time 0.527 (0.517)	Data 0.001 (0.012)	Loss 4.0830 (4.1959)	Top-1 acc 26.172 (27.345)	Top-5 acc 53.125 (50.223)	lr 0.01260
Warmup Train [27][1980/3239]	Time 0.639 (0.517)	Data 0.001 (0.012)	Loss 4.2008 (4.1960)	Top-1 acc 30.078 (27.344)	Top-5 acc 51.172 (50.217)	lr 0.01259
Warmup Train [27][1990/3239]	Time 0.679 (0.517)	Data 0.001 (0.012)	Loss 4.2330 (4.1962)	Top-1 acc 25.000 (27.340)	Top-5 acc 50.000 (50.213)	lr 0.01259
Warmup Train [27][2000/3239]	Time 0.489 (0.517)	Data 0.001 (0.012)	Loss 4.0942 (4.1959)	Top-1 acc 26.953 (27.338)	Top-5 acc 51.562 (50.217)	lr 0.01258
Warmup Train [27][2010/3239]	Time 0.483 (0.517)	Data 0.001 (0.012)	Loss 4.1693 (4.1962)	Top-1 acc 27.344 (27.339)	Top-5 acc 53.906 (50.208)	lr 0.01258
Warmup Train [27][2020/3239]	Time 0.706 (0.517)	Data 0.001 (0.012)	Loss 4.2825 (4.1962)	Top-1 acc 26.562 (27.336)	Top-5 acc 46.875 (50.212)	lr 0.01257
Warmup Train [27][2030/3239]	Time 0.439 (0.517)	Data 0.001 (0.012)	Loss 4.2069 (4.1961)	Top-1 acc 30.078 (27.340)	Top-5 acc 50.391 (50.213)	lr 0.01257
Warmup Train [27][2040/3239]	Time 0.454 (0.517)	Data 0.001 (0.012)	Loss 4.2058 (4.1960)	Top-1 acc 23.047 (27.339)	Top-5 acc 47.266 (50.214)	lr 0.01256
Warmup Train [27][2050/3239]	Time 0.345 (0.517)	Data 0.001 (0.012)	Loss 4.1513 (4.1960)	Top-1 acc 26.953 (27.340)	Top-5 acc 52.734 (50.216)	lr 0.01256
Warmup Train [27][2060/3239]	Time 0.427 (0.517)	Data 0.001 (0.012)	Loss 4.3918 (4.1961)	Top-1 acc 22.266 (27.334)	Top-5 acc 43.750 (50.207)	lr 0.01255
Warmup Train [27][2070/3239]	Time 0.182 (0.516)	Data 0.001 (0.012)	Loss 4.1568 (4.1959)	Top-1 acc 26.172 (27.339)	Top-5 acc 50.391 (50.212)	lr 0.01255
Warmup Train [27][2080/3239]	Time 0.517 (0.516)	Data 0.001 (0.012)	Loss 4.3712 (4.1963)	Top-1 acc 23.047 (27.332)	Top-5 acc 47.656 (50.201)	lr 0.01254
Warmup Train [27][2090/3239]	Time 0.534 (0.516)	Data 0.001 (0.012)	Loss 4.4710 (4.1963)	Top-1 acc 25.000 (27.335)	Top-5 acc 48.047 (50.200)	lr 0.01254
Warmup Train [27][2100/3239]	Time 0.346 (0.516)	Data 0.001 (0.012)	Loss 4.0560 (4.1961)	Top-1 acc 29.297 (27.337)	Top-5 acc 53.516 (50.206)	lr 0.01253
Warmup Train [27][2110/3239]	Time 0.633 (0.516)	Data 0.001 (0.012)	Loss 3.9793 (4.1959)	Top-1 acc 33.203 (27.337)	Top-5 acc 56.641 (50.213)	lr 0.01253
Warmup Train [27][2120/3239]	Time 0.503 (0.516)	Data 0.001 (0.012)	Loss 4.2401 (4.1960)	Top-1 acc 26.953 (27.333)	Top-5 acc 49.609 (50.214)	lr 0.01252
Warmup Train [27][2130/3239]	Time 0.543 (0.516)	Data 0.001 (0.012)	Loss 4.1780 (4.1958)	Top-1 acc 27.344 (27.334)	Top-5 acc 48.438 (50.216)	lr 0.01252
Warmup Train [27][2140/3239]	Time 0.647 (0.516)	Data 0.001 (0.012)	Loss 4.1693 (4.1959)	Top-1 acc 27.344 (27.326)	Top-5 acc 50.391 (50.215)	lr 0.01251
Warmup Train [27][2150/3239]	Time 0.322 (0.516)	Data 0.001 (0.012)	Loss 4.4477 (4.1956)	Top-1 acc 23.047 (27.331)	Top-5 acc 43.359 (50.219)	lr 0.01251
Warmup Train [27][2160/3239]	Time 0.535 (0.516)	Data 0.001 (0.012)	Loss 4.0171 (4.1956)	Top-1 acc 33.594 (27.334)	Top-5 acc 55.859 (50.221)	lr 0.01250
Warmup Train [27][2170/3239]	Time 0.488 (0.516)	Data 0.001 (0.012)	Loss 4.1689 (4.1955)	Top-1 acc 29.688 (27.336)	Top-5 acc 51.953 (50.224)	lr 0.01249
Warmup Train [27][2180/3239]	Time 0.622 (0.516)	Data 0.001 (0.012)	Loss 4.3337 (4.1954)	Top-1 acc 26.562 (27.336)	Top-5 acc 44.922 (50.225)	lr 0.01249
Warmup Train [27][2190/3239]	Time 0.537 (0.516)	Data 0.001 (0.012)	Loss 4.1377 (4.1954)	Top-1 acc 26.953 (27.333)	Top-5 acc 52.344 (50.225)	lr 0.01248
Warmup Train [27][2200/3239]	Time 0.426 (0.516)	Data 0.001 (0.012)	Loss 4.2166 (4.1955)	Top-1 acc 25.781 (27.336)	Top-5 acc 50.000 (50.226)	lr 0.01248
Warmup Train [27][2210/3239]	Time 0.545 (0.516)	Data 0.001 (0.012)	Loss 4.1082 (4.1953)	Top-1 acc 32.812 (27.339)	Top-5 acc 50.000 (50.226)	lr 0.01247
Warmup Train [27][2220/3239]	Time 0.550 (0.516)	Data 0.001 (0.012)	Loss 4.1029 (4.1953)	Top-1 acc 28.516 (27.343)	Top-5 acc 48.047 (50.227)	lr 0.01247
Warmup Train [27][2230/3239]	Time 0.600 (0.516)	Data 0.001 (0.012)	Loss 4.3902 (4.1952)	Top-1 acc 26.172 (27.341)	Top-5 acc 43.750 (50.226)	lr 0.01246
Warmup Train [27][2240/3239]	Time 0.474 (0.516)	Data 0.001 (0.012)	Loss 4.3186 (4.1953)	Top-1 acc 26.953 (27.340)	Top-5 acc 47.656 (50.225)	lr 0.01246
Warmup Train [27][2250/3239]	Time 0.674 (0.516)	Data 0.002 (0.012)	Loss 4.1729 (4.1952)	Top-1 acc 25.391 (27.339)	Top-5 acc 48.828 (50.225)	lr 0.01245
Warmup Train [27][2260/3239]	Time 0.566 (0.516)	Data 0.001 (0.012)	Loss 4.3561 (4.1955)	Top-1 acc 23.828 (27.336)	Top-5 acc 48.047 (50.218)	lr 0.01245
Warmup Train [27][2270/3239]	Time 0.491 (0.516)	Data 0.001 (0.011)	Loss 4.1908 (4.1952)	Top-1 acc 25.000 (27.338)	Top-5 acc 53.906 (50.224)	lr 0.01244
Warmup Train [27][2280/3239]	Time 0.464 (0.516)	Data 0.001 (0.011)	Loss 4.3269 (4.1953)	Top-1 acc 25.000 (27.336)	Top-5 acc 48.047 (50.222)	lr 0.01244
Warmup Train [27][2290/3239]	Time 0.599 (0.516)	Data 0.001 (0.011)	Loss 4.1498 (4.1955)	Top-1 acc 29.297 (27.333)	Top-5 acc 50.781 (50.218)	lr 0.01243
Warmup Train [27][2300/3239]	Time 0.330 (0.516)	Data 0.001 (0.011)	Loss 4.2207 (4.1958)	Top-1 acc 29.297 (27.324)	Top-5 acc 50.781 (50.214)	lr 0.01243
Warmup Train [27][2310/3239]	Time 0.362 (0.516)	Data 0.001 (0.011)	Loss 4.3184 (4.1958)	Top-1 acc 23.438 (27.323)	Top-5 acc 45.312 (50.209)	lr 0.01242
Warmup Train [27][2320/3239]	Time 0.335 (0.516)	Data 0.001 (0.011)	Loss 4.2121 (4.1955)	Top-1 acc 25.391 (27.325)	Top-5 acc 49.219 (50.212)	lr 0.01242
Warmup Train [27][2330/3239]	Time 0.588 (0.516)	Data 0.001 (0.011)	Loss 4.0689 (4.1956)	Top-1 acc 29.297 (27.323)	Top-5 acc 51.953 (50.210)	lr 0.01241
Warmup Train [27][2340/3239]	Time 0.399 (0.516)	Data 0.001 (0.011)	Loss 4.1898 (4.1954)	Top-1 acc 25.781 (27.323)	Top-5 acc 50.781 (50.212)	lr 0.01241
Warmup Train [27][2350/3239]	Time 0.516 (0.516)	Data 0.001 (0.011)	Loss 4.1301 (4.1954)	Top-1 acc 26.953 (27.323)	Top-5 acc 48.047 (50.213)	lr 0.01240
Warmup Train [27][2360/3239]	Time 0.622 (0.516)	Data 0.001 (0.011)	Loss 4.1975 (4.1953)	Top-1 acc 25.000 (27.322)	Top-5 acc 55.078 (50.217)	lr 0.01240
Warmup Train [27][2370/3239]	Time 0.435 (0.516)	Data 0.001 (0.011)	Loss 4.3314 (4.1951)	Top-1 acc 23.438 (27.323)	Top-5 acc 47.266 (50.220)	lr 0.01239
Warmup Train [27][2380/3239]	Time 0.442 (0.516)	Data 0.001 (0.011)	Loss 4.0622 (4.1950)	Top-1 acc 26.953 (27.324)	Top-5 acc 50.391 (50.220)	lr 0.01238
Warmup Train [27][2390/3239]	Time 0.538 (0.515)	Data 0.001 (0.011)	Loss 4.1746 (4.1949)	Top-1 acc 28.906 (27.325)	Top-5 acc 50.000 (50.218)	lr 0.01238
Warmup Train [27][2400/3239]	Time 0.495 (0.515)	Data 0.001 (0.011)	Loss 4.3170 (4.1949)	Top-1 acc 25.781 (27.325)	Top-5 acc 45.703 (50.219)	lr 0.01237
Warmup Train [27][2410/3239]	Time 0.380 (0.515)	Data 0.001 (0.011)	Loss 4.2924 (4.1950)	Top-1 acc 24.219 (27.323)	Top-5 acc 46.094 (50.212)	lr 0.01237
Warmup Train [27][2420/3239]	Time 0.295 (0.515)	Data 0.001 (0.011)	Loss 4.3669 (4.1949)	Top-1 acc 24.219 (27.320)	Top-5 acc 47.266 (50.217)	lr 0.01236
Warmup Train [27][2430/3239]	Time 0.686 (0.516)	Data 0.001 (0.011)	Loss 4.0200 (4.1949)	Top-1 acc 26.562 (27.314)	Top-5 acc 51.953 (50.216)	lr 0.01236
Warmup Train [27][2440/3239]	Time 0.601 (0.516)	Data 0.001 (0.011)	Loss 4.1552 (4.1947)	Top-1 acc 30.078 (27.316)	Top-5 acc 52.734 (50.222)	lr 0.01235
Warmup Train [27][2450/3239]	Time 0.467 (0.516)	Data 0.001 (0.011)	Loss 4.0066 (4.1945)	Top-1 acc 33.594 (27.324)	Top-5 acc 53.906 (50.228)	lr 0.01235
Warmup Train [27][2460/3239]	Time 0.509 (0.516)	Data 0.001 (0.011)	Loss 4.2611 (4.1945)	Top-1 acc 21.484 (27.321)	Top-5 acc 50.391 (50.228)	lr 0.01234
Warmup Train [27][2470/3239]	Time 0.617 (0.516)	Data 0.002 (0.011)	Loss 4.0911 (4.1942)	Top-1 acc 27.344 (27.324)	Top-5 acc 53.516 (50.238)	lr 0.01234
Warmup Train [27][2480/3239]	Time 0.602 (0.516)	Data 0.001 (0.011)	Loss 4.3647 (4.1946)	Top-1 acc 23.047 (27.319)	Top-5 acc 45.312 (50.234)	lr 0.01233
Warmup Train [27][2490/3239]	Time 0.555 (0.516)	Data 0.001 (0.011)	Loss 4.0524 (4.1947)	Top-1 acc 28.906 (27.317)	Top-5 acc 53.516 (50.232)	lr 0.01233
Warmup Train [27][2500/3239]	Time 0.564 (0.516)	Data 0.001 (0.011)	Loss 4.2535 (4.1947)	Top-1 acc 27.344 (27.317)	Top-5 acc 49.609 (50.233)	lr 0.01232
Warmup Train [27][2510/3239]	Time 0.535 (0.516)	Data 0.001 (0.011)	Loss 4.1066 (4.1949)	Top-1 acc 28.125 (27.313)	Top-5 acc 50.391 (50.229)	lr 0.01232
Warmup Train [27][2520/3239]	Time 0.658 (0.516)	Data 0.001 (0.011)	Loss 4.0737 (4.1949)	Top-1 acc 26.562 (27.314)	Top-5 acc 52.734 (50.230)	lr 0.01231
Warmup Train [27][2530/3239]	Time 0.521 (0.516)	Data 0.001 (0.011)	Loss 4.1554 (4.1946)	Top-1 acc 32.422 (27.321)	Top-5 acc 50.000 (50.235)	lr 0.01231
Warmup Train [27][2540/3239]	Time 0.516 (0.515)	Data 0.001 (0.011)	Loss 3.9685 (4.1944)	Top-1 acc 26.953 (27.326)	Top-5 acc 56.641 (50.242)	lr 0.01230
Warmup Train [27][2550/3239]	Time 0.450 (0.515)	Data 0.001 (0.011)	Loss 4.1567 (4.1944)	Top-1 acc 26.172 (27.326)	Top-5 acc 50.781 (50.244)	lr 0.01230
Warmup Train [27][2560/3239]	Time 0.514 (0.515)	Data 0.001 (0.011)	Loss 4.1218 (4.1942)	Top-1 acc 29.297 (27.330)	Top-5 acc 51.562 (50.247)	lr 0.01229
Warmup Train [27][2570/3239]	Time 0.576 (0.515)	Data 0.001 (0.011)	Loss 4.1486 (4.1942)	Top-1 acc 26.953 (27.332)	Top-5 acc 50.391 (50.246)	lr 0.01229
Warmup Train [27][2580/3239]	Time 0.606 (0.515)	Data 0.001 (0.011)	Loss 4.2424 (4.1939)	Top-1 acc 25.000 (27.337)	Top-5 acc 49.219 (50.254)	lr 0.01228
Warmup Train [27][2590/3239]	Time 0.676 (0.515)	Data 0.001 (0.011)	Loss 4.0257 (4.1938)	Top-1 acc 32.422 (27.340)	Top-5 acc 54.688 (50.258)	lr 0.01228
Warmup Train [27][2600/3239]	Time 0.495 (0.515)	Data 0.001 (0.011)	Loss 4.2858 (4.1937)	Top-1 acc 28.125 (27.343)	Top-5 acc 45.703 (50.260)	lr 0.01227
Warmup Train [27][2610/3239]	Time 0.576 (0.515)	Data 0.001 (0.011)	Loss 4.2410 (4.1937)	Top-1 acc 23.438 (27.344)	Top-5 acc 49.219 (50.260)	lr 0.01226
Warmup Train [27][2620/3239]	Time 0.613 (0.515)	Data 0.001 (0.011)	Loss 4.0800 (4.1937)	Top-1 acc 27.734 (27.339)	Top-5 acc 53.125 (50.257)	lr 0.01226
Warmup Train [27][2630/3239]	Time 0.321 (0.515)	Data 0.001 (0.011)	Loss 4.1852 (4.1936)	Top-1 acc 29.297 (27.341)	Top-5 acc 51.562 (50.257)	lr 0.01225
Warmup Train [27][2640/3239]	Time 0.493 (0.515)	Data 0.001 (0.011)	Loss 4.1160 (4.1935)	Top-1 acc 28.125 (27.340)	Top-5 acc 50.391 (50.254)	lr 0.01225
Warmup Train [27][2650/3239]	Time 0.425 (0.515)	Data 0.001 (0.011)	Loss 4.2382 (4.1936)	Top-1 acc 26.953 (27.339)	Top-5 acc 48.828 (50.253)	lr 0.01224
Warmup Train [27][2660/3239]	Time 0.468 (0.515)	Data 0.001 (0.011)	Loss 4.0980 (4.1934)	Top-1 acc 29.688 (27.340)	Top-5 acc 57.031 (50.260)	lr 0.01224
Warmup Train [27][2670/3239]	Time 0.392 (0.515)	Data 0.001 (0.011)	Loss 4.3317 (4.1935)	Top-1 acc 26.953 (27.335)	Top-5 acc 49.219 (50.261)	lr 0.01223
Warmup Train [27][2680/3239]	Time 0.433 (0.515)	Data 0.001 (0.011)	Loss 4.3827 (4.1935)	Top-1 acc 23.047 (27.331)	Top-5 acc 45.312 (50.260)	lr 0.01223
Warmup Train [27][2690/3239]	Time 0.582 (0.515)	Data 0.001 (0.011)	Loss 4.2990 (4.1935)	Top-1 acc 23.828 (27.334)	Top-5 acc 47.656 (50.259)	lr 0.01222
Warmup Train [27][2700/3239]	Time 0.546 (0.515)	Data 0.001 (0.011)	Loss 4.1072 (4.1934)	Top-1 acc 28.125 (27.335)	Top-5 acc 51.953 (50.266)	lr 0.01222
Warmup Train [27][2710/3239]	Time 0.439 (0.515)	Data 0.001 (0.011)	Loss 4.1031 (4.1932)	Top-1 acc 26.953 (27.341)	Top-5 acc 54.688 (50.273)	lr 0.01221
Warmup Train [27][2720/3239]	Time 0.345 (0.515)	Data 0.001 (0.011)	Loss 4.2948 (4.1933)	Top-1 acc 25.781 (27.341)	Top-5 acc 45.312 (50.273)	lr 0.01221
Warmup Train [27][2730/3239]	Time 0.544 (0.515)	Data 0.001 (0.011)	Loss 4.0809 (4.1930)	Top-1 acc 29.297 (27.346)	Top-5 acc 51.172 (50.282)	lr 0.01220
Warmup Train [27][2740/3239]	Time 0.530 (0.515)	Data 0.001 (0.011)	Loss 3.9402 (4.1930)	Top-1 acc 30.078 (27.346)	Top-5 acc 55.078 (50.283)	lr 0.01220
Warmup Train [27][2750/3239]	Time 0.436 (0.515)	Data 0.001 (0.011)	Loss 4.2185 (4.1931)	Top-1 acc 26.172 (27.346)	Top-5 acc 48.047 (50.285)	lr 0.01219
Warmup Train [27][2760/3239]	Time 0.312 (0.515)	Data 0.001 (0.011)	Loss 4.2197 (4.1929)	Top-1 acc 26.172 (27.352)	Top-5 acc 44.922 (50.289)	lr 0.01219
Warmup Train [27][2770/3239]	Time 0.578 (0.515)	Data 0.001 (0.011)	Loss 4.2886 (4.1930)	Top-1 acc 26.562 (27.353)	Top-5 acc 49.219 (50.290)	lr 0.01218
Warmup Train [27][2780/3239]	Time 0.382 (0.515)	Data 0.001 (0.011)	Loss 4.3693 (4.1933)	Top-1 acc 23.438 (27.345)	Top-5 acc 45.703 (50.284)	lr 0.01218
Warmup Train [27][2790/3239]	Time 0.432 (0.515)	Data 0.001 (0.011)	Loss 4.0569 (4.1932)	Top-1 acc 28.125 (27.346)	Top-5 acc 54.688 (50.289)	lr 0.01217
Warmup Train [27][2800/3239]	Time 0.492 (0.515)	Data 0.001 (0.011)	Loss 4.2811 (4.1930)	Top-1 acc 26.172 (27.348)	Top-5 acc 48.438 (50.292)	lr 0.01217
Warmup Train [27][2810/3239]	Time 0.736 (0.515)	Data 0.001 (0.011)	Loss 4.3422 (4.1931)	Top-1 acc 26.953 (27.350)	Top-5 acc 46.484 (50.292)	lr 0.01216
Warmup Train [27][2820/3239]	Time 0.496 (0.515)	Data 0.001 (0.011)	Loss 4.1520 (4.1932)	Top-1 acc 29.297 (27.349)	Top-5 acc 52.344 (50.292)	lr 0.01216
Warmup Train [27][2830/3239]	Time 0.341 (0.515)	Data 0.001 (0.011)	Loss 4.1743 (4.1931)	Top-1 acc 26.562 (27.350)	Top-5 acc 48.438 (50.291)	lr 0.01215
Warmup Train [27][2840/3239]	Time 0.468 (0.515)	Data 0.001 (0.011)	Loss 4.0378 (4.1931)	Top-1 acc 28.906 (27.352)	Top-5 acc 54.297 (50.291)	lr 0.01214
Warmup Train [27][2850/3239]	Time 0.560 (0.515)	Data 0.001 (0.011)	Loss 3.9514 (4.1928)	Top-1 acc 30.078 (27.358)	Top-5 acc 59.375 (50.297)	lr 0.01214
Warmup Train [27][2860/3239]	Time 0.637 (0.515)	Data 0.001 (0.011)	Loss 4.3259 (4.1929)	Top-1 acc 24.609 (27.355)	Top-5 acc 44.922 (50.297)	lr 0.01213
Warmup Train [27][2870/3239]	Time 0.541 (0.515)	Data 0.001 (0.011)	Loss 4.1275 (4.1929)	Top-1 acc 29.297 (27.359)	Top-5 acc 50.000 (50.299)	lr 0.01213
Warmup Train [27][2880/3239]	Time 0.343 (0.515)	Data 0.001 (0.011)	Loss 4.0380 (4.1930)	Top-1 acc 30.078 (27.358)	Top-5 acc 49.609 (50.293)	lr 0.01212
Warmup Train [27][2890/3239]	Time 0.835 (0.515)	Data 0.001 (0.011)	Loss 4.0342 (4.1931)	Top-1 acc 32.812 (27.361)	Top-5 acc 53.906 (50.292)	lr 0.01212
Warmup Train [27][2900/3239]	Time 0.538 (0.515)	Data 0.001 (0.010)	Loss 4.1681 (4.1929)	Top-1 acc 29.297 (27.364)	Top-5 acc 52.734 (50.296)	lr 0.01211
Warmup Train [27][2910/3239]	Time 0.512 (0.515)	Data 0.001 (0.010)	Loss 4.2080 (4.1928)	Top-1 acc 26.562 (27.365)	Top-5 acc 47.266 (50.297)	lr 0.01211
Warmup Train [27][2920/3239]	Time 0.519 (0.515)	Data 0.001 (0.010)	Loss 4.1345 (4.1928)	Top-1 acc 26.562 (27.363)	Top-5 acc 50.391 (50.294)	lr 0.01210
Warmup Train [27][2930/3239]	Time 0.509 (0.515)	Data 0.001 (0.010)	Loss 4.3215 (4.1930)	Top-1 acc 29.297 (27.363)	Top-5 acc 46.484 (50.290)	lr 0.01210
Warmup Train [27][2940/3239]	Time 0.460 (0.515)	Data 0.001 (0.010)	Loss 4.2260 (4.1932)	Top-1 acc 24.609 (27.361)	Top-5 acc 49.609 (50.289)	lr 0.01209
Warmup Train [27][2950/3239]	Time 0.590 (0.515)	Data 0.001 (0.010)	Loss 4.0887 (4.1931)	Top-1 acc 29.297 (27.363)	Top-5 acc 55.859 (50.292)	lr 0.01209
Warmup Train [27][2960/3239]	Time 0.487 (0.515)	Data 0.001 (0.010)	Loss 4.3302 (4.1931)	Top-1 acc 23.047 (27.362)	Top-5 acc 47.266 (50.293)	lr 0.01208
Warmup Train [27][2970/3239]	Time 0.449 (0.515)	Data 0.001 (0.010)	Loss 4.2185 (4.1930)	Top-1 acc 27.344 (27.366)	Top-5 acc 52.344 (50.296)	lr 0.01208
Warmup Train [27][2980/3239]	Time 0.510 (0.515)	Data 0.001 (0.010)	Loss 4.2784 (4.1929)	Top-1 acc 26.172 (27.370)	Top-5 acc 48.047 (50.298)	lr 0.01207
Warmup Train [27][2990/3239]	Time 0.471 (0.515)	Data 0.001 (0.010)	Loss 4.3670 (4.1927)	Top-1 acc 25.391 (27.373)	Top-5 acc 44.141 (50.298)	lr 0.01207
Warmup Train [27][3000/3239]	Time 0.555 (0.515)	Data 0.001 (0.010)	Loss 4.1459 (4.1927)	Top-1 acc 32.812 (27.374)	Top-5 acc 53.906 (50.297)	lr 0.01206
Warmup Train [27][3010/3239]	Time 0.394 (0.515)	Data 0.001 (0.010)	Loss 4.3566 (4.1925)	Top-1 acc 26.562 (27.379)	Top-5 acc 48.828 (50.303)	lr 0.01206
Warmup Train [27][3020/3239]	Time 0.536 (0.515)	Data 0.001 (0.010)	Loss 4.1184 (4.1924)	Top-1 acc 30.469 (27.386)	Top-5 acc 53.125 (50.306)	lr 0.01205
Warmup Train [27][3030/3239]	Time 0.562 (0.515)	Data 0.001 (0.010)	Loss 4.0608 (4.1923)	Top-1 acc 31.250 (27.386)	Top-5 acc 51.172 (50.306)	lr 0.01205
Warmup Train [27][3040/3239]	Time 0.456 (0.515)	Data 0.001 (0.010)	Loss 4.0310 (4.1920)	Top-1 acc 28.125 (27.392)	Top-5 acc 51.953 (50.313)	lr 0.01204
Warmup Train [27][3050/3239]	Time 0.498 (0.515)	Data 0.001 (0.010)	Loss 4.1226 (4.1917)	Top-1 acc 30.078 (27.397)	Top-5 acc 53.516 (50.319)	lr 0.01204
Warmup Train [27][3060/3239]	Time 0.557 (0.515)	Data 0.001 (0.010)	Loss 4.2413 (4.1917)	Top-1 acc 26.172 (27.397)	Top-5 acc 53.906 (50.317)	lr 0.01203
Warmup Train [27][3070/3239]	Time 0.432 (0.514)	Data 0.001 (0.010)	Loss 3.9698 (4.1918)	Top-1 acc 27.734 (27.395)	Top-5 acc 54.297 (50.314)	lr 0.01203
Warmup Train [27][3080/3239]	Time 0.475 (0.515)	Data 0.001 (0.010)	Loss 4.1018 (4.1918)	Top-1 acc 30.078 (27.395)	Top-5 acc 48.438 (50.314)	lr 0.01202
Warmup Train [27][3090/3239]	Time 0.499 (0.515)	Data 0.001 (0.010)	Loss 4.3106 (4.1920)	Top-1 acc 28.516 (27.391)	Top-5 acc 47.656 (50.307)	lr 0.01202
Warmup Train [27][3100/3239]	Time 0.651 (0.515)	Data 0.001 (0.010)	Loss 4.1378 (4.1919)	Top-1 acc 27.734 (27.389)	Top-5 acc 50.000 (50.307)	lr 0.01201
Warmup Train [27][3110/3239]	Time 0.515 (0.515)	Data 0.001 (0.010)	Loss 4.4248 (4.1919)	Top-1 acc 21.875 (27.388)	Top-5 acc 42.188 (50.305)	lr 0.01200
Warmup Train [27][3120/3239]	Time 0.465 (0.515)	Data 0.001 (0.010)	Loss 4.2444 (4.1920)	Top-1 acc 26.562 (27.386)	Top-5 acc 51.172 (50.302)	lr 0.01200
Warmup Train [27][3130/3239]	Time 0.501 (0.515)	Data 0.001 (0.010)	Loss 4.1735 (4.1918)	Top-1 acc 27.344 (27.391)	Top-5 acc 51.562 (50.307)	lr 0.01199
Warmup Train [27][3140/3239]	Time 0.513 (0.515)	Data 0.001 (0.010)	Loss 4.3820 (4.1918)	Top-1 acc 23.047 (27.389)	Top-5 acc 44.531 (50.308)	lr 0.01199
Warmup Train [27][3150/3239]	Time 0.571 (0.515)	Data 0.001 (0.010)	Loss 4.2040 (4.1916)	Top-1 acc 28.906 (27.394)	Top-5 acc 46.094 (50.311)	lr 0.01198
Warmup Train [27][3160/3239]	Time 0.506 (0.515)	Data 0.001 (0.010)	Loss 4.3628 (4.1916)	Top-1 acc 26.953 (27.397)	Top-5 acc 48.047 (50.313)	lr 0.01198
Warmup Train [27][3170/3239]	Time 0.473 (0.515)	Data 0.001 (0.010)	Loss 4.1390 (4.1915)	Top-1 acc 26.562 (27.399)	Top-5 acc 51.562 (50.315)	lr 0.01197
Warmup Train [27][3180/3239]	Time 0.398 (0.515)	Data 0.000 (0.010)	Loss 4.2991 (4.1915)	Top-1 acc 26.172 (27.395)	Top-5 acc 50.781 (50.315)	lr 0.01197
Warmup Train [27][3190/3239]	Time 0.501 (0.515)	Data 0.000 (0.010)	Loss 4.1343 (4.1913)	Top-1 acc 28.516 (27.399)	Top-5 acc 53.125 (50.320)	lr 0.01196
Warmup Train [27][3200/3239]	Time 0.682 (0.514)	Data 0.000 (0.010)	Loss 4.2163 (4.1912)	Top-1 acc 30.078 (27.404)	Top-5 acc 44.922 (50.321)	lr 0.01196
Warmup Train [27][3210/3239]	Time 0.550 (0.514)	Data 0.000 (0.010)	Loss 4.2289 (4.1911)	Top-1 acc 31.250 (27.412)	Top-5 acc 51.562 (50.326)	lr 0.01195
Warmup Train [27][3220/3239]	Time 0.456 (0.514)	Data 0.000 (0.010)	Loss 4.1663 (4.1912)	Top-1 acc 26.953 (27.408)	Top-5 acc 48.047 (50.324)	lr 0.01195
Warmup Train [27][3230/3239]	Time 0.336 (0.514)	Data 0.000 (0.010)	Loss 4.1806 (4.1910)	Top-1 acc 28.125 (27.414)	Top-5 acc 48.828 (50.330)	lr 0.01194
Warmup Train [27][3239/3239]	Time 0.305 (0.514)	Data 0.000 (0.010)	Loss 4.9294 (4.1909)	Top-1 acc 16.049 (27.415)	Top-5 acc 29.630 (50.330)	lr 0.01194
==========Warmup Valid [27/40]	loss 3.151	top-1 acc 34.772	top-5 acc 59.507	Train top-1 27.415	top-5 50.330	flops: 442.4M
Warmup Train [28][0/3239]	Time 16.458 (16.458)	Data 14.210 (14.210)	Loss 4.0029 (4.0029)	Top-1 acc 32.422 (32.422)	Top-5 acc 55.078 (55.078)	lr 0.01194
Warmup Train [28][10/3239]	Time 0.536 (2.040)	Data 0.001 (1.297)	Loss 4.1226 (4.0670)	Top-1 acc 25.000 (28.764)	Top-5 acc 53.125 (52.557)	lr 0.01193
Warmup Train [28][20/3239]	Time 0.667 (1.318)	Data 0.001 (0.681)	Loss 3.9682 (4.1053)	Top-1 acc 31.250 (28.013)	Top-5 acc 56.250 (51.935)	lr 0.01193
Warmup Train [28][30/3239]	Time 0.429 (1.054)	Data 0.001 (0.462)	Loss 4.1841 (4.1236)	Top-1 acc 25.000 (27.734)	Top-5 acc 52.344 (51.499)	lr 0.01192
Warmup Train [28][40/3239]	Time 0.550 (0.921)	Data 0.001 (0.351)	Loss 4.0082 (4.1149)	Top-1 acc 30.078 (27.944)	Top-5 acc 50.781 (51.686)	lr 0.01192
Warmup Train [28][50/3239]	Time 0.590 (0.842)	Data 0.001 (0.285)	Loss 4.0987 (4.1204)	Top-1 acc 25.781 (27.926)	Top-5 acc 52.734 (51.800)	lr 0.01191
Warmup Train [28][60/3239]	Time 0.514 (0.786)	Data 0.001 (0.238)	Loss 4.1993 (4.1300)	Top-1 acc 26.562 (27.869)	Top-5 acc 51.953 (51.614)	lr 0.01191
Warmup Train [28][70/3239]	Time 0.419 (0.747)	Data 0.001 (0.205)	Loss 3.9680 (4.1281)	Top-1 acc 32.031 (28.031)	Top-5 acc 57.812 (51.733)	lr 0.01190
Warmup Train [28][80/3239]	Time 0.557 (0.719)	Data 0.001 (0.181)	Loss 4.1743 (4.1356)	Top-1 acc 27.734 (27.812)	Top-5 acc 46.875 (51.514)	lr 0.01190
Warmup Train [28][90/3239]	Time 0.582 (0.696)	Data 0.001 (0.162)	Loss 4.1571 (4.1349)	Top-1 acc 27.344 (27.803)	Top-5 acc 52.344 (51.584)	lr 0.01189
Warmup Train [28][100/3239]	Time 0.449 (0.676)	Data 0.001 (0.147)	Loss 4.2077 (4.1330)	Top-1 acc 30.469 (27.963)	Top-5 acc 50.391 (51.559)	lr 0.01189
Warmup Train [28][110/3239]	Time 0.584 (0.657)	Data 0.001 (0.134)	Loss 4.2097 (4.1385)	Top-1 acc 26.953 (27.981)	Top-5 acc 47.266 (51.418)	lr 0.01188
Warmup Train [28][120/3239]	Time 0.617 (0.647)	Data 0.001 (0.123)	Loss 4.2441 (4.1391)	Top-1 acc 26.172 (27.947)	Top-5 acc 47.266 (51.388)	lr 0.01188
Warmup Train [28][130/3239]	Time 0.494 (0.638)	Data 0.002 (0.114)	Loss 3.9805 (4.1358)	Top-1 acc 30.859 (28.053)	Top-5 acc 51.172 (51.461)	lr 0.01187
Warmup Train [28][140/3239]	Time 0.466 (0.629)	Data 0.001 (0.106)	Loss 4.0224 (4.1367)	Top-1 acc 26.953 (28.081)	Top-5 acc 56.641 (51.460)	lr 0.01187
Warmup Train [28][150/3239]	Time 0.527 (0.621)	Data 0.001 (0.100)	Loss 3.9810 (4.1355)	Top-1 acc 33.594 (28.128)	Top-5 acc 56.250 (51.498)	lr 0.01186
Warmup Train [28][160/3239]	Time 0.524 (0.614)	Data 0.001 (0.094)	Loss 4.1745 (4.1367)	Top-1 acc 30.078 (28.123)	Top-5 acc 51.562 (51.560)	lr 0.01185
Warmup Train [28][170/3239]	Time 0.416 (0.608)	Data 0.001 (0.088)	Loss 4.2266 (4.1371)	Top-1 acc 25.781 (28.120)	Top-5 acc 47.266 (51.503)	lr 0.01185
Warmup Train [28][180/3239]	Time 0.597 (0.602)	Data 0.001 (0.084)	Loss 4.2463 (4.1411)	Top-1 acc 30.469 (28.054)	Top-5 acc 51.562 (51.405)	lr 0.01184
Warmup Train [28][190/3239]	Time 0.619 (0.597)	Data 0.001 (0.080)	Loss 4.1187 (4.1426)	Top-1 acc 28.516 (28.041)	Top-5 acc 51.172 (51.391)	lr 0.01184
Warmup Train [28][200/3239]	Time 0.635 (0.593)	Data 0.001 (0.076)	Loss 3.8990 (4.1414)	Top-1 acc 35.156 (28.117)	Top-5 acc 55.859 (51.411)	lr 0.01183
Warmup Train [28][210/3239]	Time 0.417 (0.589)	Data 0.001 (0.072)	Loss 4.0083 (4.1412)	Top-1 acc 29.297 (28.147)	Top-5 acc 55.469 (51.503)	lr 0.01183
Warmup Train [28][220/3239]	Time 0.486 (0.586)	Data 0.001 (0.070)	Loss 3.9337 (4.1409)	Top-1 acc 33.984 (28.157)	Top-5 acc 56.250 (51.522)	lr 0.01182
Warmup Train [28][230/3239]	Time 0.488 (0.583)	Data 0.001 (0.067)	Loss 4.0563 (4.1412)	Top-1 acc 30.078 (28.181)	Top-5 acc 53.125 (51.471)	lr 0.01182
Warmup Train [28][240/3239]	Time 0.490 (0.580)	Data 0.001 (0.065)	Loss 4.1380 (4.1414)	Top-1 acc 26.562 (28.222)	Top-5 acc 50.391 (51.506)	lr 0.01181
Warmup Train [28][250/3239]	Time 0.478 (0.578)	Data 0.001 (0.062)	Loss 4.1701 (4.1417)	Top-1 acc 24.219 (28.184)	Top-5 acc 47.656 (51.472)	lr 0.01181
Warmup Train [28][260/3239]	Time 0.524 (0.576)	Data 0.001 (0.060)	Loss 4.2002 (4.1439)	Top-1 acc 30.078 (28.174)	Top-5 acc 51.953 (51.435)	lr 0.01180
Warmup Train [28][270/3239]	Time 0.645 (0.574)	Data 0.001 (0.058)	Loss 4.1659 (4.1450)	Top-1 acc 30.859 (28.167)	Top-5 acc 50.391 (51.436)	lr 0.01180
Warmup Train [28][280/3239]	Time 0.406 (0.572)	Data 0.001 (0.056)	Loss 4.0599 (4.1457)	Top-1 acc 27.734 (28.163)	Top-5 acc 53.906 (51.437)	lr 0.01179
Warmup Train [28][290/3239]	Time 0.459 (0.570)	Data 0.001 (0.054)	Loss 4.1574 (4.1457)	Top-1 acc 28.516 (28.151)	Top-5 acc 51.562 (51.462)	lr 0.01179
Warmup Train [28][300/3239]	Time 0.453 (0.568)	Data 0.001 (0.053)	Loss 4.1717 (4.1452)	Top-1 acc 26.562 (28.155)	Top-5 acc 51.172 (51.464)	lr 0.01178
Warmup Train [28][310/3239]	Time 0.559 (0.566)	Data 0.001 (0.051)	Loss 4.4570 (4.1463)	Top-1 acc 25.000 (28.130)	Top-5 acc 44.141 (51.439)	lr 0.01178
Warmup Train [28][320/3239]	Time 0.500 (0.565)	Data 0.001 (0.049)	Loss 4.1111 (4.1471)	Top-1 acc 27.344 (28.076)	Top-5 acc 50.000 (51.398)	lr 0.01177
Warmup Train [28][330/3239]	Time 0.584 (0.562)	Data 0.001 (0.048)	Loss 4.1573 (4.1477)	Top-1 acc 28.906 (28.105)	Top-5 acc 54.688 (51.397)	lr 0.01177
Warmup Train [28][340/3239]	Time 0.401 (0.559)	Data 0.001 (0.047)	Loss 4.1147 (4.1471)	Top-1 acc 28.906 (28.139)	Top-5 acc 52.734 (51.422)	lr 0.01176
Warmup Train [28][350/3239]	Time 0.243 (0.556)	Data 0.001 (0.046)	Loss 4.2804 (4.1488)	Top-1 acc 26.953 (28.132)	Top-5 acc 50.000 (51.392)	lr 0.01176
Warmup Train [28][360/3239]	Time 0.393 (0.555)	Data 0.001 (0.045)	Loss 4.0830 (4.1478)	Top-1 acc 30.469 (28.166)	Top-5 acc 53.125 (51.400)	lr 0.01175
Warmup Train [28][370/3239]	Time 0.375 (0.553)	Data 0.001 (0.044)	Loss 4.5266 (4.1492)	Top-1 acc 19.922 (28.133)	Top-5 acc 41.406 (51.382)	lr 0.01175
Warmup Train [28][380/3239]	Time 0.562 (0.552)	Data 0.001 (0.043)	Loss 4.1521 (4.1495)	Top-1 acc 28.516 (28.123)	Top-5 acc 53.516 (51.354)	lr 0.01174
Warmup Train [28][390/3239]	Time 0.344 (0.552)	Data 0.001 (0.042)	Loss 4.2466 (4.1510)	Top-1 acc 29.688 (28.090)	Top-5 acc 46.875 (51.313)	lr 0.01174
Warmup Train [28][400/3239]	Time 0.540 (0.551)	Data 0.001 (0.041)	Loss 4.0461 (4.1501)	Top-1 acc 28.516 (28.119)	Top-5 acc 55.859 (51.356)	lr 0.01173
Warmup Train [28][410/3239]	Time 0.626 (0.550)	Data 0.001 (0.041)	Loss 4.0116 (4.1501)	Top-1 acc 26.562 (28.096)	Top-5 acc 54.688 (51.345)	lr 0.01173
Warmup Train [28][420/3239]	Time 0.522 (0.549)	Data 0.001 (0.040)	Loss 4.2977 (4.1508)	Top-1 acc 27.734 (28.086)	Top-5 acc 49.219 (51.335)	lr 0.01172
Warmup Train [28][430/3239]	Time 0.409 (0.548)	Data 0.001 (0.039)	Loss 4.3366 (4.1513)	Top-1 acc 26.953 (28.085)	Top-5 acc 45.312 (51.309)	lr 0.01172
Warmup Train [28][440/3239]	Time 0.461 (0.548)	Data 0.001 (0.038)	Loss 4.4606 (4.1527)	Top-1 acc 23.438 (28.074)	Top-5 acc 42.188 (51.261)	lr 0.01171
Warmup Train [28][450/3239]	Time 0.488 (0.547)	Data 0.002 (0.038)	Loss 4.4112 (4.1554)	Top-1 acc 22.266 (28.014)	Top-5 acc 45.703 (51.183)	lr 0.01171
Warmup Train [28][460/3239]	Time 0.636 (0.546)	Data 0.001 (0.037)	Loss 4.2181 (4.1552)	Top-1 acc 23.828 (28.022)	Top-5 acc 49.219 (51.182)	lr 0.01170
Warmup Train [28][470/3239]	Time 0.548 (0.545)	Data 0.001 (0.036)	Loss 4.1427 (4.1559)	Top-1 acc 28.516 (28.006)	Top-5 acc 49.609 (51.161)	lr 0.01170
Warmup Train [28][480/3239]	Time 0.540 (0.545)	Data 0.001 (0.035)	Loss 4.3104 (4.1555)	Top-1 acc 25.000 (28.021)	Top-5 acc 45.312 (51.167)	lr 0.01169
Warmup Train [28][490/3239]	Time 0.549 (0.544)	Data 0.001 (0.035)	Loss 4.0323 (4.1556)	Top-1 acc 36.328 (28.017)	Top-5 acc 55.078 (51.156)	lr 0.01169
Warmup Train [28][500/3239]	Time 0.636 (0.544)	Data 0.001 (0.034)	Loss 4.1714 (4.1562)	Top-1 acc 29.297 (28.015)	Top-5 acc 51.953 (51.156)	lr 0.01168
Warmup Train [28][510/3239]	Time 0.488 (0.543)	Data 0.001 (0.033)	Loss 4.1449 (4.1558)	Top-1 acc 27.734 (28.032)	Top-5 acc 50.000 (51.144)	lr 0.01168
Warmup Train [28][520/3239]	Time 0.523 (0.543)	Data 0.001 (0.033)	Loss 4.1093 (4.1569)	Top-1 acc 32.422 (28.043)	Top-5 acc 48.438 (51.102)	lr 0.01167
Warmup Train [28][530/3239]	Time 0.551 (0.542)	Data 0.001 (0.033)	Loss 4.1115 (4.1578)	Top-1 acc 30.859 (28.060)	Top-5 acc 55.859 (51.090)	lr 0.01166
Warmup Train [28][540/3239]	Time 0.504 (0.542)	Data 0.001 (0.032)	Loss 3.9726 (4.1581)	Top-1 acc 31.250 (28.038)	Top-5 acc 58.203 (51.084)	lr 0.01166
Warmup Train [28][550/3239]	Time 0.576 (0.542)	Data 0.001 (0.032)	Loss 4.2646 (4.1579)	Top-1 acc 27.344 (28.044)	Top-5 acc 50.391 (51.091)	lr 0.01165
Warmup Train [28][560/3239]	Time 0.710 (0.541)	Data 0.001 (0.031)	Loss 4.0587 (4.1574)	Top-1 acc 31.641 (28.050)	Top-5 acc 53.906 (51.104)	lr 0.01165
Warmup Train [28][570/3239]	Time 0.397 (0.540)	Data 0.001 (0.031)	Loss 4.1675 (4.1578)	Top-1 acc 27.734 (28.039)	Top-5 acc 51.172 (51.097)	lr 0.01164
Warmup Train [28][580/3239]	Time 0.521 (0.540)	Data 0.001 (0.030)	Loss 4.1639 (4.1578)	Top-1 acc 26.172 (28.042)	Top-5 acc 46.484 (51.083)	lr 0.01164
Warmup Train [28][590/3239]	Time 0.545 (0.539)	Data 0.001 (0.030)	Loss 4.1550 (4.1575)	Top-1 acc 29.297 (28.048)	Top-5 acc 54.297 (51.110)	lr 0.01163
Warmup Train [28][600/3239]	Time 0.571 (0.538)	Data 0.001 (0.030)	Loss 4.1055 (4.1577)	Top-1 acc 28.516 (28.045)	Top-5 acc 53.125 (51.118)	lr 0.01163
Warmup Train [28][610/3239]	Time 0.668 (0.537)	Data 0.002 (0.029)	Loss 3.9052 (4.1577)	Top-1 acc 34.766 (28.058)	Top-5 acc 57.031 (51.116)	lr 0.01162
Warmup Train [28][620/3239]	Time 0.361 (0.537)	Data 0.001 (0.029)	Loss 4.3486 (4.1588)	Top-1 acc 24.609 (28.034)	Top-5 acc 45.703 (51.084)	lr 0.01162
Warmup Train [28][630/3239]	Time 0.551 (0.537)	Data 0.001 (0.029)	Loss 4.1202 (4.1593)	Top-1 acc 26.562 (28.015)	Top-5 acc 50.000 (51.071)	lr 0.01161
Warmup Train [28][640/3239]	Time 0.480 (0.537)	Data 0.001 (0.028)	Loss 3.9510 (4.1597)	Top-1 acc 32.422 (28.004)	Top-5 acc 55.078 (51.054)	lr 0.01161
Warmup Train [28][650/3239]	Time 0.400 (0.536)	Data 0.001 (0.028)	Loss 4.2832 (4.1585)	Top-1 acc 20.703 (28.006)	Top-5 acc 48.828 (51.096)	lr 0.01160
Warmup Train [28][660/3239]	Time 0.498 (0.536)	Data 0.001 (0.027)	Loss 4.2557 (4.1594)	Top-1 acc 26.172 (28.003)	Top-5 acc 48.438 (51.085)	lr 0.01160
Warmup Train [28][670/3239]	Time 0.618 (0.535)	Data 0.001 (0.027)	Loss 4.1233 (4.1598)	Top-1 acc 29.297 (28.005)	Top-5 acc 54.297 (51.093)	lr 0.01159
Warmup Train [28][680/3239]	Time 0.476 (0.535)	Data 0.001 (0.027)	Loss 4.3022 (4.1598)	Top-1 acc 28.125 (27.994)	Top-5 acc 49.219 (51.099)	lr 0.01159
Warmup Train [28][690/3239]	Time 0.448 (0.534)	Data 0.001 (0.026)	Loss 4.1844 (4.1595)	Top-1 acc 24.219 (27.997)	Top-5 acc 50.391 (51.107)	lr 0.01158
Warmup Train [28][700/3239]	Time 0.536 (0.534)	Data 0.001 (0.026)	Loss 4.1268 (4.1594)	Top-1 acc 32.031 (28.006)	Top-5 acc 52.734 (51.109)	lr 0.01158
Warmup Train [28][710/3239]	Time 0.585 (0.534)	Data 0.002 (0.026)	Loss 4.2502 (4.1606)	Top-1 acc 21.484 (27.984)	Top-5 acc 48.047 (51.083)	lr 0.01157
Warmup Train [28][720/3239]	Time 0.478 (0.534)	Data 0.001 (0.025)	Loss 4.2144 (4.1606)	Top-1 acc 28.516 (27.975)	Top-5 acc 45.312 (51.072)	lr 0.01157
Warmup Train [28][730/3239]	Time 0.626 (0.533)	Data 0.001 (0.025)	Loss 4.2621 (4.1606)	Top-1 acc 26.953 (27.989)	Top-5 acc 48.438 (51.081)	lr 0.01156
Warmup Train [28][740/3239]	Time 0.570 (0.533)	Data 0.001 (0.025)	Loss 4.2667 (4.1608)	Top-1 acc 23.438 (27.969)	Top-5 acc 48.438 (51.070)	lr 0.01156
Warmup Train [28][750/3239]	Time 0.515 (0.533)	Data 0.001 (0.025)	Loss 4.3990 (4.1615)	Top-1 acc 23.438 (27.959)	Top-5 acc 44.141 (51.049)	lr 0.01155
Warmup Train [28][760/3239]	Time 0.496 (0.532)	Data 0.001 (0.024)	Loss 4.0773 (4.1617)	Top-1 acc 31.641 (27.949)	Top-5 acc 55.469 (51.047)	lr 0.01155
Warmup Train [28][770/3239]	Time 0.559 (0.533)	Data 0.001 (0.024)	Loss 4.3368 (4.1617)	Top-1 acc 26.172 (27.950)	Top-5 acc 44.922 (51.040)	lr 0.01154
Warmup Train [28][780/3239]	Time 0.560 (0.532)	Data 0.001 (0.024)	Loss 4.1692 (4.1616)	Top-1 acc 29.688 (27.960)	Top-5 acc 48.438 (51.029)	lr 0.01154
Warmup Train [28][790/3239]	Time 0.564 (0.532)	Data 0.001 (0.024)	Loss 3.9672 (4.1610)	Top-1 acc 28.516 (27.967)	Top-5 acc 52.734 (51.036)	lr 0.01153
Warmup Train [28][800/3239]	Time 0.540 (0.531)	Data 0.001 (0.023)	Loss 4.2894 (4.1621)	Top-1 acc 27.344 (27.947)	Top-5 acc 48.438 (51.018)	lr 0.01153
Warmup Train [28][810/3239]	Time 0.496 (0.531)	Data 0.001 (0.023)	Loss 4.1303 (4.1623)	Top-1 acc 26.562 (27.939)	Top-5 acc 50.000 (51.016)	lr 0.01152
Warmup Train [28][820/3239]	Time 0.504 (0.531)	Data 0.001 (0.023)	Loss 3.8287 (4.1618)	Top-1 acc 34.766 (27.953)	Top-5 acc 62.109 (51.028)	lr 0.01152
Warmup Train [28][830/3239]	Time 0.469 (0.530)	Data 0.001 (0.023)	Loss 4.2714 (4.1626)	Top-1 acc 29.688 (27.948)	Top-5 acc 49.609 (51.012)	lr 0.01151
Warmup Train [28][840/3239]	Time 0.491 (0.529)	Data 0.001 (0.023)	Loss 4.1842 (4.1618)	Top-1 acc 26.172 (27.956)	Top-5 acc 51.562 (51.038)	lr 0.01151
Warmup Train [28][850/3239]	Time 0.453 (0.529)	Data 0.001 (0.022)	Loss 4.3227 (4.1627)	Top-1 acc 23.828 (27.929)	Top-5 acc 49.219 (51.021)	lr 0.01150
Warmup Train [28][860/3239]	Time 0.476 (0.529)	Data 0.001 (0.022)	Loss 4.3341 (4.1630)	Top-1 acc 23.828 (27.917)	Top-5 acc 51.172 (51.027)	lr 0.01150
Warmup Train [28][870/3239]	Time 0.462 (0.529)	Data 0.001 (0.022)	Loss 4.0515 (4.1633)	Top-1 acc 24.609 (27.900)	Top-5 acc 50.781 (51.010)	lr 0.01149
Warmup Train [28][880/3239]	Time 0.427 (0.529)	Data 0.001 (0.022)	Loss 4.1654 (4.1634)	Top-1 acc 29.688 (27.898)	Top-5 acc 50.000 (51.003)	lr 0.01149
Warmup Train [28][890/3239]	Time 0.352 (0.528)	Data 0.001 (0.022)	Loss 4.1461 (4.1632)	Top-1 acc 30.859 (27.905)	Top-5 acc 50.781 (51.002)	lr 0.01148
Warmup Train [28][900/3239]	Time 0.549 (0.528)	Data 0.001 (0.022)	Loss 4.3663 (4.1635)	Top-1 acc 25.000 (27.904)	Top-5 acc 45.703 (50.988)	lr 0.01148
Warmup Train [28][910/3239]	Time 0.576 (0.528)	Data 0.002 (0.021)	Loss 4.2649 (4.1634)	Top-1 acc 23.828 (27.890)	Top-5 acc 48.438 (50.973)	lr 0.01147
Warmup Train [28][920/3239]	Time 0.630 (0.528)	Data 0.001 (0.021)	Loss 4.0833 (4.1634)	Top-1 acc 29.688 (27.892)	Top-5 acc 57.031 (50.976)	lr 0.01147
Warmup Train [28][930/3239]	Time 0.569 (0.529)	Data 0.001 (0.021)	Loss 4.2046 (4.1638)	Top-1 acc 29.297 (27.889)	Top-5 acc 51.562 (50.967)	lr 0.01146
Warmup Train [28][940/3239]	Time 0.537 (0.528)	Data 0.001 (0.021)	Loss 4.2071 (4.1636)	Top-1 acc 25.391 (27.899)	Top-5 acc 48.047 (50.968)	lr 0.01146
Warmup Train [28][950/3239]	Time 0.372 (0.528)	Data 0.001 (0.021)	Loss 4.2386 (4.1627)	Top-1 acc 24.609 (27.915)	Top-5 acc 48.047 (50.991)	lr 0.01145
Warmup Train [28][960/3239]	Time 0.623 (0.528)	Data 0.002 (0.021)	Loss 4.2603 (4.1630)	Top-1 acc 27.734 (27.908)	Top-5 acc 47.656 (50.987)	lr 0.01145
Warmup Train [28][970/3239]	Time 0.527 (0.528)	Data 0.001 (0.020)	Loss 3.9714 (4.1629)	Top-1 acc 34.766 (27.913)	Top-5 acc 57.422 (50.983)	lr 0.01144
Warmup Train [28][980/3239]	Time 0.540 (0.528)	Data 0.001 (0.020)	Loss 4.1107 (4.1634)	Top-1 acc 31.250 (27.912)	Top-5 acc 52.734 (50.972)	lr 0.01143
Warmup Train [28][990/3239]	Time 0.583 (0.527)	Data 0.001 (0.020)	Loss 4.1073 (4.1637)	Top-1 acc 26.172 (27.900)	Top-5 acc 55.859 (50.962)	lr 0.01143
Warmup Train [28][1000/3239]	Time 0.493 (0.527)	Data 0.001 (0.020)	Loss 4.0690 (4.1641)	Top-1 acc 30.078 (27.894)	Top-5 acc 52.344 (50.955)	lr 0.01142
Warmup Train [28][1010/3239]	Time 0.580 (0.527)	Data 0.001 (0.020)	Loss 4.0137 (4.1637)	Top-1 acc 29.297 (27.894)	Top-5 acc 53.125 (50.963)	lr 0.01142
Warmup Train [28][1020/3239]	Time 0.523 (0.527)	Data 0.001 (0.020)	Loss 4.1483 (4.1644)	Top-1 acc 30.469 (27.888)	Top-5 acc 50.391 (50.940)	lr 0.01141
Warmup Train [28][1030/3239]	Time 0.376 (0.527)	Data 0.001 (0.020)	Loss 4.1307 (4.1645)	Top-1 acc 28.516 (27.884)	Top-5 acc 53.125 (50.943)	lr 0.01141
Warmup Train [28][1040/3239]	Time 0.506 (0.526)	Data 0.001 (0.020)	Loss 4.2698 (4.1641)	Top-1 acc 24.219 (27.882)	Top-5 acc 47.266 (50.944)	lr 0.01140
Warmup Train [28][1050/3239]	Time 0.433 (0.526)	Data 0.001 (0.019)	Loss 4.1963 (4.1636)	Top-1 acc 28.125 (27.885)	Top-5 acc 51.953 (50.961)	lr 0.01140
Warmup Train [28][1060/3239]	Time 0.478 (0.526)	Data 0.001 (0.019)	Loss 4.2575 (4.1636)	Top-1 acc 26.953 (27.888)	Top-5 acc 48.828 (50.965)	lr 0.01139
Warmup Train [28][1070/3239]	Time 0.527 (0.525)	Data 0.002 (0.019)	Loss 4.2320 (4.1639)	Top-1 acc 32.031 (27.882)	Top-5 acc 48.047 (50.957)	lr 0.01139
Warmup Train [28][1080/3239]	Time 0.528 (0.525)	Data 0.001 (0.019)	Loss 4.2112 (4.1636)	Top-1 acc 25.391 (27.898)	Top-5 acc 50.391 (50.964)	lr 0.01138
Warmup Train [28][1090/3239]	Time 0.550 (0.524)	Data 0.001 (0.019)	Loss 4.1481 (4.1634)	Top-1 acc 30.859 (27.903)	Top-5 acc 53.125 (50.979)	lr 0.01138
Warmup Train [28][1100/3239]	Time 0.639 (0.524)	Data 0.001 (0.019)	Loss 4.2188 (4.1638)	Top-1 acc 29.688 (27.896)	Top-5 acc 51.562 (50.973)	lr 0.01137
Warmup Train [28][1110/3239]	Time 0.494 (0.524)	Data 0.001 (0.019)	Loss 4.1990 (4.1638)	Top-1 acc 24.219 (27.900)	Top-5 acc 50.391 (50.980)	lr 0.01137
Warmup Train [28][1120/3239]	Time 0.673 (0.524)	Data 0.001 (0.019)	Loss 4.1889 (4.1641)	Top-1 acc 28.125 (27.893)	Top-5 acc 51.562 (50.978)	lr 0.01136
Warmup Train [28][1130/3239]	Time 0.473 (0.524)	Data 0.001 (0.018)	Loss 4.0574 (4.1640)	Top-1 acc 31.250 (27.892)	Top-5 acc 53.906 (50.969)	lr 0.01136
Warmup Train [28][1140/3239]	Time 0.511 (0.524)	Data 0.001 (0.018)	Loss 4.1410 (4.1639)	Top-1 acc 32.031 (27.895)	Top-5 acc 53.906 (50.978)	lr 0.01135
Warmup Train [28][1150/3239]	Time 0.404 (0.524)	Data 0.001 (0.018)	Loss 4.0839 (4.1637)	Top-1 acc 25.781 (27.901)	Top-5 acc 50.391 (50.973)	lr 0.01135
Warmup Train [28][1160/3239]	Time 0.603 (0.524)	Data 0.001 (0.018)	Loss 4.1334 (4.1635)	Top-1 acc 30.078 (27.915)	Top-5 acc 51.172 (50.984)	lr 0.01134
Warmup Train [28][1170/3239]	Time 0.472 (0.524)	Data 0.001 (0.018)	Loss 4.1032 (4.1636)	Top-1 acc 27.734 (27.919)	Top-5 acc 53.125 (50.972)	lr 0.01134
Warmup Train [28][1180/3239]	Time 0.631 (0.524)	Data 0.001 (0.018)	Loss 3.9624 (4.1638)	Top-1 acc 30.078 (27.916)	Top-5 acc 58.203 (50.965)	lr 0.01133
Warmup Train [28][1190/3239]	Time 0.521 (0.524)	Data 0.001 (0.018)	Loss 4.2528 (4.1637)	Top-1 acc 31.250 (27.929)	Top-5 acc 49.219 (50.971)	lr 0.01133
Warmup Train [28][1200/3239]	Time 0.467 (0.524)	Data 0.001 (0.018)	Loss 4.1884 (4.1641)	Top-1 acc 28.125 (27.920)	Top-5 acc 50.000 (50.959)	lr 0.01132
Warmup Train [28][1210/3239]	Time 0.600 (0.524)	Data 0.001 (0.018)	Loss 4.3103 (4.1641)	Top-1 acc 25.391 (27.910)	Top-5 acc 49.609 (50.963)	lr 0.01132
Warmup Train [28][1220/3239]	Time 0.649 (0.524)	Data 0.001 (0.017)	Loss 4.2320 (4.1644)	Top-1 acc 26.172 (27.905)	Top-5 acc 49.609 (50.960)	lr 0.01131
Warmup Train [28][1230/3239]	Time 0.639 (0.524)	Data 0.001 (0.017)	Loss 4.1591 (4.1638)	Top-1 acc 25.000 (27.911)	Top-5 acc 50.000 (50.972)	lr 0.01131
Warmup Train [28][1240/3239]	Time 0.396 (0.524)	Data 0.001 (0.017)	Loss 4.3334 (4.1642)	Top-1 acc 22.656 (27.889)	Top-5 acc 48.047 (50.962)	lr 0.01130
Warmup Train [28][1250/3239]	Time 0.537 (0.524)	Data 0.001 (0.017)	Loss 3.8500 (4.1640)	Top-1 acc 33.203 (27.884)	Top-5 acc 61.719 (50.972)	lr 0.01130
Warmup Train [28][1260/3239]	Time 0.330 (0.524)	Data 0.001 (0.017)	Loss 4.1157 (4.1638)	Top-1 acc 30.859 (27.890)	Top-5 acc 51.562 (50.966)	lr 0.01129
Warmup Train [28][1270/3239]	Time 0.397 (0.524)	Data 0.001 (0.017)	Loss 4.0400 (4.1641)	Top-1 acc 28.906 (27.885)	Top-5 acc 55.859 (50.962)	lr 0.01129
Warmup Train [28][1280/3239]	Time 0.629 (0.524)	Data 0.001 (0.017)	Loss 4.3445 (4.1645)	Top-1 acc 24.219 (27.872)	Top-5 acc 43.750 (50.950)	lr 0.01128
Warmup Train [28][1290/3239]	Time 0.508 (0.523)	Data 0.001 (0.017)	Loss 4.1761 (4.1649)	Top-1 acc 28.516 (27.871)	Top-5 acc 48.438 (50.952)	lr 0.01128
Warmup Train [28][1300/3239]	Time 0.500 (0.523)	Data 0.001 (0.017)	Loss 4.1396 (4.1646)	Top-1 acc 26.562 (27.875)	Top-5 acc 48.828 (50.960)	lr 0.01127
Warmup Train [28][1310/3239]	Time 0.466 (0.523)	Data 0.001 (0.017)	Loss 4.3692 (4.1650)	Top-1 acc 25.391 (27.870)	Top-5 acc 43.359 (50.949)	lr 0.01127
Warmup Train [28][1320/3239]	Time 0.395 (0.523)	Data 0.001 (0.017)	Loss 4.1545 (4.1649)	Top-1 acc 30.078 (27.868)	Top-5 acc 56.250 (50.954)	lr 0.01126
Warmup Train [28][1330/3239]	Time 0.493 (0.522)	Data 0.001 (0.017)	Loss 4.1973 (4.1648)	Top-1 acc 26.562 (27.870)	Top-5 acc 50.781 (50.953)	lr 0.01126
Warmup Train [28][1340/3239]	Time 0.502 (0.522)	Data 0.001 (0.017)	Loss 4.0073 (4.1646)	Top-1 acc 28.125 (27.873)	Top-5 acc 55.469 (50.958)	lr 0.01125
Warmup Train [28][1350/3239]	Time 0.474 (0.522)	Data 0.001 (0.016)	Loss 4.0558 (4.1649)	Top-1 acc 29.688 (27.862)	Top-5 acc 53.125 (50.955)	lr 0.01125
Warmup Train [28][1360/3239]	Time 0.356 (0.522)	Data 0.001 (0.016)	Loss 4.1347 (4.1647)	Top-1 acc 30.859 (27.867)	Top-5 acc 53.906 (50.969)	lr 0.01124
Warmup Train [28][1370/3239]	Time 0.616 (0.522)	Data 0.001 (0.016)	Loss 4.0342 (4.1644)	Top-1 acc 32.422 (27.869)	Top-5 acc 53.516 (50.968)	lr 0.01124
Warmup Train [28][1380/3239]	Time 0.522 (0.522)	Data 0.001 (0.016)	Loss 4.2339 (4.1645)	Top-1 acc 25.781 (27.861)	Top-5 acc 51.172 (50.967)	lr 0.01123
Warmup Train [28][1390/3239]	Time 0.433 (0.522)	Data 0.001 (0.016)	Loss 4.2373 (4.1642)	Top-1 acc 24.219 (27.866)	Top-5 acc 47.656 (50.972)	lr 0.01123
Warmup Train [28][1400/3239]	Time 0.430 (0.521)	Data 0.001 (0.016)	Loss 4.2213 (4.1638)	Top-1 acc 25.000 (27.863)	Top-5 acc 46.875 (50.976)	lr 0.01122
Warmup Train [28][1410/3239]	Time 0.355 (0.521)	Data 0.001 (0.016)	Loss 4.1227 (4.1638)	Top-1 acc 25.000 (27.859)	Top-5 acc 51.172 (50.979)	lr 0.01122
Warmup Train [28][1420/3239]	Time 0.387 (0.521)	Data 0.001 (0.016)	Loss 4.2439 (4.1640)	Top-1 acc 28.906 (27.859)	Top-5 acc 49.609 (50.972)	lr 0.01121
Warmup Train [28][1430/3239]	Time 0.745 (0.521)	Data 0.001 (0.016)	Loss 4.1121 (4.1639)	Top-1 acc 29.688 (27.863)	Top-5 acc 52.344 (50.983)	lr 0.01121
Warmup Train [28][1440/3239]	Time 0.463 (0.521)	Data 0.001 (0.016)	Loss 4.2239 (4.1639)	Top-1 acc 27.344 (27.869)	Top-5 acc 48.828 (50.980)	lr 0.01120
Warmup Train [28][1450/3239]	Time 0.481 (0.521)	Data 0.001 (0.016)	Loss 4.1036 (4.1636)	Top-1 acc 24.219 (27.867)	Top-5 acc 49.219 (50.985)	lr 0.01120
Warmup Train [28][1460/3239]	Time 0.521 (0.521)	Data 0.001 (0.016)	Loss 4.3302 (4.1642)	Top-1 acc 25.000 (27.852)	Top-5 acc 47.266 (50.968)	lr 0.01119
Warmup Train [28][1470/3239]	Time 0.430 (0.521)	Data 0.001 (0.016)	Loss 4.1499 (4.1639)	Top-1 acc 29.688 (27.864)	Top-5 acc 51.172 (50.976)	lr 0.01119
Warmup Train [28][1480/3239]	Time 0.542 (0.521)	Data 0.001 (0.016)	Loss 3.9352 (4.1635)	Top-1 acc 33.594 (27.883)	Top-5 acc 57.031 (50.986)	lr 0.01118
Warmup Train [28][1490/3239]	Time 0.490 (0.521)	Data 0.001 (0.016)	Loss 4.2005 (4.1634)	Top-1 acc 28.906 (27.892)	Top-5 acc 52.734 (50.993)	lr 0.01118
Warmup Train [28][1500/3239]	Time 0.483 (0.520)	Data 0.001 (0.015)	Loss 4.2978 (4.1634)	Top-1 acc 25.781 (27.892)	Top-5 acc 48.047 (50.998)	lr 0.01117
Warmup Train [28][1510/3239]	Time 0.499 (0.521)	Data 0.001 (0.015)	Loss 4.0678 (4.1633)	Top-1 acc 32.422 (27.893)	Top-5 acc 52.734 (50.995)	lr 0.01117
Warmup Train [28][1520/3239]	Time 0.489 (0.521)	Data 0.001 (0.015)	Loss 4.3209 (4.1637)	Top-1 acc 24.609 (27.880)	Top-5 acc 51.172 (50.991)	lr 0.01116
Warmup Train [28][1530/3239]	Time 0.641 (0.520)	Data 0.002 (0.015)	Loss 4.0380 (4.1635)	Top-1 acc 32.031 (27.885)	Top-5 acc 49.609 (50.994)	lr 0.01116
Warmup Train [28][1540/3239]	Time 0.462 (0.520)	Data 0.002 (0.015)	Loss 4.1594 (4.1634)	Top-1 acc 28.516 (27.892)	Top-5 acc 49.219 (50.994)	lr 0.01115
Warmup Train [28][1550/3239]	Time 0.554 (0.520)	Data 0.001 (0.015)	Loss 4.0840 (4.1635)	Top-1 acc 30.859 (27.889)	Top-5 acc 53.125 (50.996)	lr 0.01115
Warmup Train [28][1560/3239]	Time 0.463 (0.520)	Data 0.001 (0.015)	Loss 4.2953 (4.1633)	Top-1 acc 24.219 (27.893)	Top-5 acc 45.703 (51.001)	lr 0.01114
Warmup Train [28][1570/3239]	Time 0.570 (0.519)	Data 0.001 (0.015)	Loss 4.1766 (4.1637)	Top-1 acc 28.125 (27.893)	Top-5 acc 52.344 (50.993)	lr 0.01114
Warmup Train [28][1580/3239]	Time 0.541 (0.519)	Data 0.001 (0.015)	Loss 4.1841 (4.1635)	Top-1 acc 28.516 (27.899)	Top-5 acc 51.562 (50.996)	lr 0.01113
Warmup Train [28][1590/3239]	Time 0.671 (0.519)	Data 0.001 (0.015)	Loss 4.1322 (4.1637)	Top-1 acc 31.250 (27.907)	Top-5 acc 51.953 (50.998)	lr 0.01113
Warmup Train [28][1600/3239]	Time 0.538 (0.519)	Data 0.001 (0.015)	Loss 4.3283 (4.1638)	Top-1 acc 21.484 (27.900)	Top-5 acc 47.656 (50.992)	lr 0.01112
Warmup Train [28][1610/3239]	Time 0.677 (0.519)	Data 0.001 (0.015)	Loss 4.0492 (4.1635)	Top-1 acc 32.031 (27.905)	Top-5 acc 55.469 (50.999)	lr 0.01112
Warmup Train [28][1620/3239]	Time 0.544 (0.519)	Data 0.001 (0.015)	Loss 4.0593 (4.1634)	Top-1 acc 32.422 (27.910)	Top-5 acc 53.906 (51.003)	lr 0.01111
Warmup Train [28][1630/3239]	Time 0.438 (0.519)	Data 0.001 (0.015)	Loss 4.2686 (4.1634)	Top-1 acc 25.781 (27.914)	Top-5 acc 49.609 (51.009)	lr 0.01111
Warmup Train [28][1640/3239]	Time 0.560 (0.519)	Data 0.001 (0.015)	Loss 3.9241 (4.1634)	Top-1 acc 32.422 (27.915)	Top-5 acc 62.109 (51.017)	lr 0.01110
Warmup Train [28][1650/3239]	Time 0.386 (0.519)	Data 0.001 (0.015)	Loss 3.9442 (4.1632)	Top-1 acc 30.859 (27.916)	Top-5 acc 57.812 (51.023)	lr 0.01110
Warmup Train [28][1660/3239]	Time 0.500 (0.519)	Data 0.001 (0.015)	Loss 4.1280 (4.1637)	Top-1 acc 32.812 (27.912)	Top-5 acc 51.562 (51.016)	lr 0.01109
Warmup Train [28][1670/3239]	Time 0.561 (0.519)	Data 0.001 (0.014)	Loss 4.3067 (4.1640)	Top-1 acc 27.344 (27.903)	Top-5 acc 47.656 (51.010)	lr 0.01109
Warmup Train [28][1680/3239]	Time 0.553 (0.519)	Data 0.002 (0.014)	Loss 4.1747 (4.1642)	Top-1 acc 28.125 (27.904)	Top-5 acc 52.734 (51.011)	lr 0.01108
Warmup Train [28][1690/3239]	Time 0.485 (0.519)	Data 0.001 (0.014)	Loss 4.1978 (4.1641)	Top-1 acc 28.125 (27.903)	Top-5 acc 51.172 (51.014)	lr 0.01108
Warmup Train [28][1700/3239]	Time 0.481 (0.519)	Data 0.001 (0.014)	Loss 4.2366 (4.1644)	Top-1 acc 24.609 (27.901)	Top-5 acc 51.953 (51.014)	lr 0.01107
Warmup Train [28][1710/3239]	Time 0.407 (0.518)	Data 0.001 (0.014)	Loss 4.1817 (4.1645)	Top-1 acc 26.172 (27.897)	Top-5 acc 50.781 (51.020)	lr 0.01107
Warmup Train [28][1720/3239]	Time 0.659 (0.518)	Data 0.002 (0.014)	Loss 4.1041 (4.1645)	Top-1 acc 25.781 (27.899)	Top-5 acc 51.562 (51.020)	lr 0.01106
Warmup Train [28][1730/3239]	Time 0.544 (0.518)	Data 0.001 (0.014)	Loss 4.0287 (4.1647)	Top-1 acc 32.422 (27.899)	Top-5 acc 51.953 (51.014)	lr 0.01106
Warmup Train [28][1740/3239]	Time 0.509 (0.518)	Data 0.001 (0.014)	Loss 4.2636 (4.1645)	Top-1 acc 26.172 (27.906)	Top-5 acc 48.828 (51.023)	lr 0.01105
Warmup Train [28][1750/3239]	Time 0.601 (0.518)	Data 0.001 (0.014)	Loss 3.9820 (4.1643)	Top-1 acc 27.734 (27.910)	Top-5 acc 55.469 (51.031)	lr 0.01105
Warmup Train [28][1760/3239]	Time 0.495 (0.518)	Data 0.001 (0.014)	Loss 4.0166 (4.1643)	Top-1 acc 29.297 (27.909)	Top-5 acc 55.078 (51.033)	lr 0.01104
Warmup Train [28][1770/3239]	Time 0.367 (0.518)	Data 0.001 (0.014)	Loss 4.1568 (4.1643)	Top-1 acc 25.391 (27.911)	Top-5 acc 51.953 (51.033)	lr 0.01104
Warmup Train [28][1780/3239]	Time 0.553 (0.518)	Data 0.001 (0.014)	Loss 4.1786 (4.1642)	Top-1 acc 30.469 (27.918)	Top-5 acc 49.609 (51.036)	lr 0.01103
Warmup Train [28][1790/3239]	Time 0.162 (0.518)	Data 0.001 (0.014)	Loss 4.3133 (4.1640)	Top-1 acc 23.828 (27.926)	Top-5 acc 44.922 (51.043)	lr 0.01103
Warmup Train [28][1800/3239]	Time 0.609 (0.518)	Data 0.001 (0.014)	Loss 4.0150 (4.1635)	Top-1 acc 28.125 (27.933)	Top-5 acc 56.250 (51.057)	lr 0.01102
Warmup Train [28][1810/3239]	Time 0.237 (0.518)	Data 0.035 (0.014)	Loss 4.0067 (4.1638)	Top-1 acc 27.344 (27.926)	Top-5 acc 51.172 (51.046)	lr 0.01102
Warmup Train [28][1820/3239]	Time 0.522 (0.518)	Data 0.001 (0.014)	Loss 3.9811 (4.1634)	Top-1 acc 27.344 (27.929)	Top-5 acc 55.859 (51.053)	lr 0.01101
Warmup Train [28][1830/3239]	Time 0.513 (0.518)	Data 0.001 (0.014)	Loss 4.2539 (4.1631)	Top-1 acc 26.172 (27.931)	Top-5 acc 51.172 (51.057)	lr 0.01101
Warmup Train [28][1840/3239]	Time 0.599 (0.518)	Data 0.001 (0.014)	Loss 4.3880 (4.1633)	Top-1 acc 22.266 (27.928)	Top-5 acc 46.484 (51.050)	lr 0.01100
Warmup Train [28][1850/3239]	Time 0.536 (0.518)	Data 0.001 (0.014)	Loss 4.2693 (4.1631)	Top-1 acc 24.219 (27.934)	Top-5 acc 50.000 (51.056)	lr 0.01100
Warmup Train [28][1860/3239]	Time 0.507 (0.518)	Data 0.001 (0.014)	Loss 4.3968 (4.1631)	Top-1 acc 24.609 (27.929)	Top-5 acc 43.750 (51.055)	lr 0.01099
Warmup Train [28][1870/3239]	Time 0.463 (0.518)	Data 0.001 (0.014)	Loss 4.2495 (4.1630)	Top-1 acc 26.562 (27.931)	Top-5 acc 49.609 (51.051)	lr 0.01099
Warmup Train [28][1880/3239]	Time 0.397 (0.518)	Data 0.001 (0.013)	Loss 4.1159 (4.1627)	Top-1 acc 29.688 (27.943)	Top-5 acc 51.172 (51.060)	lr 0.01098
Warmup Train [28][1890/3239]	Time 0.492 (0.518)	Data 0.001 (0.013)	Loss 4.2954 (4.1632)	Top-1 acc 22.656 (27.932)	Top-5 acc 46.484 (51.049)	lr 0.01097
Warmup Train [28][1900/3239]	Time 0.526 (0.518)	Data 0.001 (0.013)	Loss 4.1055 (4.1633)	Top-1 acc 30.078 (27.932)	Top-5 acc 49.219 (51.047)	lr 0.01097
Warmup Train [28][1910/3239]	Time 0.464 (0.518)	Data 0.001 (0.013)	Loss 4.1822 (4.1629)	Top-1 acc 26.953 (27.938)	Top-5 acc 51.172 (51.053)	lr 0.01096
Warmup Train [28][1920/3239]	Time 0.564 (0.517)	Data 0.002 (0.013)	Loss 4.2253 (4.1626)	Top-1 acc 30.078 (27.942)	Top-5 acc 51.562 (51.059)	lr 0.01096
Warmup Train [28][1930/3239]	Time 0.446 (0.517)	Data 0.001 (0.013)	Loss 4.2399 (4.1624)	Top-1 acc 26.172 (27.942)	Top-5 acc 45.703 (51.063)	lr 0.01095
Warmup Train [28][1940/3239]	Time 0.578 (0.517)	Data 0.001 (0.013)	Loss 4.0727 (4.1623)	Top-1 acc 28.516 (27.943)	Top-5 acc 54.688 (51.065)	lr 0.01095
Warmup Train [28][1950/3239]	Time 0.566 (0.517)	Data 0.001 (0.013)	Loss 4.2281 (4.1622)	Top-1 acc 30.078 (27.943)	Top-5 acc 48.438 (51.063)	lr 0.01094
Warmup Train [28][1960/3239]	Time 0.723 (0.517)	Data 0.002 (0.013)	Loss 4.2454 (4.1622)	Top-1 acc 25.391 (27.942)	Top-5 acc 48.828 (51.066)	lr 0.01094
Warmup Train [28][1970/3239]	Time 0.504 (0.517)	Data 0.001 (0.013)	Loss 4.2259 (4.1623)	Top-1 acc 27.734 (27.940)	Top-5 acc 47.656 (51.064)	lr 0.01093
Warmup Train [28][1980/3239]	Time 0.581 (0.517)	Data 0.001 (0.013)	Loss 4.0625 (4.1619)	Top-1 acc 27.344 (27.943)	Top-5 acc 54.297 (51.073)	lr 0.01093
Warmup Train [28][1990/3239]	Time 0.506 (0.517)	Data 0.001 (0.013)	Loss 4.2808 (4.1619)	Top-1 acc 32.031 (27.950)	Top-5 acc 48.438 (51.076)	lr 0.01092
Warmup Train [28][2000/3239]	Time 0.619 (0.517)	Data 0.001 (0.013)	Loss 4.0994 (4.1618)	Top-1 acc 30.859 (27.953)	Top-5 acc 52.734 (51.073)	lr 0.01092
Warmup Train [28][2010/3239]	Time 0.554 (0.517)	Data 0.001 (0.013)	Loss 4.0131 (4.1618)	Top-1 acc 32.812 (27.950)	Top-5 acc 54.688 (51.070)	lr 0.01091
Warmup Train [28][2020/3239]	Time 0.515 (0.517)	Data 0.001 (0.013)	Loss 4.1876 (4.1621)	Top-1 acc 32.031 (27.949)	Top-5 acc 51.562 (51.066)	lr 0.01091
Warmup Train [28][2030/3239]	Time 0.441 (0.517)	Data 0.001 (0.013)	Loss 4.1696 (4.1621)	Top-1 acc 29.688 (27.948)	Top-5 acc 51.562 (51.068)	lr 0.01090
Warmup Train [28][2040/3239]	Time 0.526 (0.517)	Data 0.001 (0.013)	Loss 4.3206 (4.1621)	Top-1 acc 28.516 (27.947)	Top-5 acc 47.656 (51.069)	lr 0.01090
Warmup Train [28][2050/3239]	Time 0.487 (0.517)	Data 0.001 (0.013)	Loss 4.1777 (4.1618)	Top-1 acc 28.125 (27.952)	Top-5 acc 51.953 (51.070)	lr 0.01089
Warmup Train [28][2060/3239]	Time 0.470 (0.517)	Data 0.001 (0.013)	Loss 4.2005 (4.1620)	Top-1 acc 26.172 (27.948)	Top-5 acc 50.000 (51.062)	lr 0.01089
Warmup Train [28][2070/3239]	Time 0.463 (0.517)	Data 0.001 (0.013)	Loss 4.2123 (4.1619)	Top-1 acc 28.906 (27.953)	Top-5 acc 51.562 (51.070)	lr 0.01088
Warmup Train [28][2080/3239]	Time 0.398 (0.516)	Data 0.001 (0.013)	Loss 4.3116 (4.1619)	Top-1 acc 24.219 (27.957)	Top-5 acc 45.312 (51.069)	lr 0.01088
Warmup Train [28][2090/3239]	Time 0.538 (0.517)	Data 0.001 (0.013)	Loss 4.2474 (4.1620)	Top-1 acc 26.953 (27.950)	Top-5 acc 51.172 (51.067)	lr 0.01087
Warmup Train [28][2100/3239]	Time 0.468 (0.517)	Data 0.001 (0.013)	Loss 4.2156 (4.1621)	Top-1 acc 24.609 (27.947)	Top-5 acc 51.172 (51.067)	lr 0.01087
Warmup Train [28][2110/3239]	Time 0.567 (0.517)	Data 0.001 (0.013)	Loss 4.2543 (4.1624)	Top-1 acc 28.906 (27.941)	Top-5 acc 47.266 (51.057)	lr 0.01086
Warmup Train [28][2120/3239]	Time 0.445 (0.517)	Data 0.001 (0.012)	Loss 4.1397 (4.1621)	Top-1 acc 29.297 (27.941)	Top-5 acc 50.781 (51.063)	lr 0.01086
Warmup Train [28][2130/3239]	Time 0.422 (0.516)	Data 0.001 (0.012)	Loss 4.1053 (4.1618)	Top-1 acc 32.422 (27.947)	Top-5 acc 56.250 (51.075)	lr 0.01085
Warmup Train [28][2140/3239]	Time 0.533 (0.516)	Data 0.001 (0.012)	Loss 4.0831 (4.1617)	Top-1 acc 28.125 (27.948)	Top-5 acc 51.562 (51.076)	lr 0.01085
Warmup Train [28][2150/3239]	Time 0.625 (0.516)	Data 0.001 (0.012)	Loss 4.3589 (4.1617)	Top-1 acc 25.781 (27.945)	Top-5 acc 47.266 (51.077)	lr 0.01084
Warmup Train [28][2160/3239]	Time 0.466 (0.516)	Data 0.001 (0.012)	Loss 4.1364 (4.1616)	Top-1 acc 30.859 (27.949)	Top-5 acc 48.828 (51.083)	lr 0.01084
Warmup Train [28][2170/3239]	Time 0.506 (0.516)	Data 0.001 (0.012)	Loss 4.1752 (4.1619)	Top-1 acc 26.172 (27.943)	Top-5 acc 49.609 (51.078)	lr 0.01083
Warmup Train [28][2180/3239]	Time 0.469 (0.516)	Data 0.001 (0.012)	Loss 4.0701 (4.1612)	Top-1 acc 28.125 (27.957)	Top-5 acc 51.562 (51.093)	lr 0.01083
Warmup Train [28][2190/3239]	Time 0.519 (0.516)	Data 0.001 (0.012)	Loss 3.9837 (4.1613)	Top-1 acc 34.375 (27.960)	Top-5 acc 53.125 (51.091)	lr 0.01082
Warmup Train [28][2200/3239]	Time 0.581 (0.516)	Data 0.001 (0.012)	Loss 4.2058 (4.1616)	Top-1 acc 26.562 (27.951)	Top-5 acc 48.438 (51.082)	lr 0.01082
Warmup Train [28][2210/3239]	Time 0.486 (0.516)	Data 0.001 (0.012)	Loss 4.1136 (4.1616)	Top-1 acc 31.250 (27.956)	Top-5 acc 51.172 (51.084)	lr 0.01081
Warmup Train [28][2220/3239]	Time 0.543 (0.516)	Data 0.001 (0.012)	Loss 4.0989 (4.1617)	Top-1 acc 30.859 (27.956)	Top-5 acc 53.125 (51.081)	lr 0.01081
Warmup Train [28][2230/3239]	Time 0.639 (0.516)	Data 0.001 (0.012)	Loss 4.0195 (4.1617)	Top-1 acc 27.344 (27.958)	Top-5 acc 52.344 (51.079)	lr 0.01080
Warmup Train [28][2240/3239]	Time 0.507 (0.516)	Data 0.001 (0.012)	Loss 4.1093 (4.1617)	Top-1 acc 31.641 (27.957)	Top-5 acc 53.125 (51.080)	lr 0.01080
Warmup Train [28][2250/3239]	Time 0.611 (0.516)	Data 0.001 (0.012)	Loss 4.0341 (4.1616)	Top-1 acc 28.906 (27.954)	Top-5 acc 53.906 (51.083)	lr 0.01079
Warmup Train [28][2260/3239]	Time 0.535 (0.516)	Data 0.001 (0.012)	Loss 4.4332 (4.1619)	Top-1 acc 22.656 (27.952)	Top-5 acc 43.359 (51.078)	lr 0.01079
Warmup Train [28][2270/3239]	Time 0.513 (0.516)	Data 0.001 (0.012)	Loss 4.0900 (4.1619)	Top-1 acc 33.203 (27.954)	Top-5 acc 50.781 (51.071)	lr 0.01078
Warmup Train [28][2280/3239]	Time 0.660 (0.516)	Data 0.001 (0.012)	Loss 3.9365 (4.1617)	Top-1 acc 30.469 (27.960)	Top-5 acc 56.641 (51.078)	lr 0.01078
Warmup Train [28][2290/3239]	Time 0.495 (0.516)	Data 0.001 (0.012)	Loss 4.1874 (4.1618)	Top-1 acc 27.734 (27.951)	Top-5 acc 52.344 (51.076)	lr 0.01077
Warmup Train [28][2300/3239]	Time 0.465 (0.515)	Data 0.001 (0.012)	Loss 4.1157 (4.1616)	Top-1 acc 29.297 (27.955)	Top-5 acc 49.609 (51.078)	lr 0.01077
Warmup Train [28][2310/3239]	Time 0.508 (0.515)	Data 0.001 (0.012)	Loss 4.2888 (4.1614)	Top-1 acc 23.047 (27.955)	Top-5 acc 47.656 (51.080)	lr 0.01077
Warmup Train [28][2320/3239]	Time 0.583 (0.515)	Data 0.001 (0.012)	Loss 4.1854 (4.1614)	Top-1 acc 26.953 (27.957)	Top-5 acc 53.906 (51.083)	lr 0.01076
Warmup Train [28][2330/3239]	Time 0.411 (0.515)	Data 0.001 (0.012)	Loss 4.3219 (4.1619)	Top-1 acc 23.828 (27.944)	Top-5 acc 45.312 (51.066)	lr 0.01076
Warmup Train [28][2340/3239]	Time 0.322 (0.515)	Data 0.001 (0.012)	Loss 3.9820 (4.1618)	Top-1 acc 33.203 (27.942)	Top-5 acc 57.422 (51.069)	lr 0.01075
Warmup Train [28][2350/3239]	Time 0.455 (0.515)	Data 0.001 (0.012)	Loss 4.1765 (4.1616)	Top-1 acc 25.781 (27.946)	Top-5 acc 48.438 (51.071)	lr 0.01075
Warmup Train [28][2360/3239]	Time 0.650 (0.515)	Data 0.001 (0.012)	Loss 4.1226 (4.1616)	Top-1 acc 24.609 (27.944)	Top-5 acc 53.906 (51.074)	lr 0.01074
Warmup Train [28][2370/3239]	Time 0.542 (0.515)	Data 0.001 (0.012)	Loss 4.1393 (4.1617)	Top-1 acc 25.391 (27.940)	Top-5 acc 48.047 (51.073)	lr 0.01074
Warmup Train [28][2380/3239]	Time 0.558 (0.516)	Data 0.001 (0.012)	Loss 4.2158 (4.1620)	Top-1 acc 25.391 (27.938)	Top-5 acc 48.047 (51.063)	lr 0.01073
Warmup Train [28][2390/3239]	Time 0.475 (0.516)	Data 0.001 (0.012)	Loss 4.0325 (4.1617)	Top-1 acc 33.594 (27.945)	Top-5 acc 53.906 (51.071)	lr 0.01073
Warmup Train [28][2400/3239]	Time 0.432 (0.515)	Data 0.001 (0.012)	Loss 4.1050 (4.1617)	Top-1 acc 28.516 (27.944)	Top-5 acc 51.172 (51.070)	lr 0.01072
Warmup Train [28][2410/3239]	Time 0.546 (0.515)	Data 0.001 (0.012)	Loss 4.1655 (4.1616)	Top-1 acc 28.125 (27.944)	Top-5 acc 51.172 (51.074)	lr 0.01072
Warmup Train [28][2420/3239]	Time 0.476 (0.515)	Data 0.001 (0.012)	Loss 4.1441 (4.1617)	Top-1 acc 27.344 (27.941)	Top-5 acc 48.828 (51.069)	lr 0.01071
Warmup Train [28][2430/3239]	Time 0.433 (0.515)	Data 0.001 (0.012)	Loss 4.2800 (4.1618)	Top-1 acc 23.047 (27.939)	Top-5 acc 52.734 (51.070)	lr 0.01071
Warmup Train [28][2440/3239]	Time 0.612 (0.515)	Data 0.001 (0.012)	Loss 3.9917 (4.1618)	Top-1 acc 30.469 (27.936)	Top-5 acc 57.812 (51.067)	lr 0.01070
Warmup Train [28][2450/3239]	Time 0.541 (0.515)	Data 0.001 (0.011)	Loss 4.2433 (4.1621)	Top-1 acc 27.344 (27.937)	Top-5 acc 48.828 (51.059)	lr 0.01070
Warmup Train [28][2460/3239]	Time 0.494 (0.515)	Data 0.001 (0.011)	Loss 4.3133 (4.1623)	Top-1 acc 26.953 (27.934)	Top-5 acc 48.828 (51.056)	lr 0.01069
Warmup Train [28][2470/3239]	Time 0.521 (0.515)	Data 0.001 (0.011)	Loss 4.1013 (4.1622)	Top-1 acc 27.734 (27.935)	Top-5 acc 50.781 (51.054)	lr 0.01069
Warmup Train [28][2480/3239]	Time 0.517 (0.515)	Data 0.001 (0.011)	Loss 4.3615 (4.1623)	Top-1 acc 24.609 (27.938)	Top-5 acc 44.141 (51.054)	lr 0.01068
Warmup Train [28][2490/3239]	Time 0.537 (0.515)	Data 0.001 (0.011)	Loss 4.2252 (4.1623)	Top-1 acc 26.953 (27.937)	Top-5 acc 47.266 (51.054)	lr 0.01068
Warmup Train [28][2500/3239]	Time 0.381 (0.515)	Data 0.001 (0.011)	Loss 4.0785 (4.1622)	Top-1 acc 27.344 (27.938)	Top-5 acc 49.609 (51.055)	lr 0.01067
Warmup Train [28][2510/3239]	Time 0.462 (0.515)	Data 0.001 (0.011)	Loss 4.3552 (4.1622)	Top-1 acc 24.219 (27.937)	Top-5 acc 43.750 (51.055)	lr 0.01067
Warmup Train [28][2520/3239]	Time 0.375 (0.515)	Data 0.001 (0.011)	Loss 4.2757 (4.1621)	Top-1 acc 23.438 (27.938)	Top-5 acc 44.922 (51.052)	lr 0.01066
Warmup Train [28][2530/3239]	Time 0.524 (0.515)	Data 0.001 (0.011)	Loss 4.1489 (4.1620)	Top-1 acc 27.344 (27.941)	Top-5 acc 52.734 (51.058)	lr 0.01066
Warmup Train [28][2540/3239]	Time 0.508 (0.515)	Data 0.001 (0.011)	Loss 4.0315 (4.1620)	Top-1 acc 30.859 (27.941)	Top-5 acc 55.078 (51.058)	lr 0.01065
Warmup Train [28][2550/3239]	Time 0.581 (0.515)	Data 0.001 (0.011)	Loss 4.2318 (4.1620)	Top-1 acc 25.391 (27.941)	Top-5 acc 49.609 (51.058)	lr 0.01065
Warmup Train [28][2560/3239]	Time 0.596 (0.515)	Data 0.001 (0.011)	Loss 4.1157 (4.1621)	Top-1 acc 29.688 (27.939)	Top-5 acc 50.781 (51.052)	lr 0.01064
Warmup Train [28][2570/3239]	Time 0.585 (0.515)	Data 0.001 (0.011)	Loss 4.2069 (4.1619)	Top-1 acc 28.906 (27.941)	Top-5 acc 46.875 (51.057)	lr 0.01064
Warmup Train [28][2580/3239]	Time 0.447 (0.515)	Data 0.001 (0.011)	Loss 4.2002 (4.1619)	Top-1 acc 26.172 (27.942)	Top-5 acc 47.656 (51.055)	lr 0.01063
Warmup Train [28][2590/3239]	Time 0.406 (0.515)	Data 0.001 (0.011)	Loss 4.2746 (4.1620)	Top-1 acc 25.000 (27.941)	Top-5 acc 48.438 (51.052)	lr 0.01063
Warmup Train [28][2600/3239]	Time 0.525 (0.515)	Data 0.001 (0.011)	Loss 4.2336 (4.1620)	Top-1 acc 24.219 (27.945)	Top-5 acc 50.000 (51.052)	lr 0.01062
Warmup Train [28][2610/3239]	Time 0.410 (0.515)	Data 0.001 (0.011)	Loss 4.2575 (4.1618)	Top-1 acc 28.125 (27.948)	Top-5 acc 48.828 (51.055)	lr 0.01062
Warmup Train [28][2620/3239]	Time 0.485 (0.515)	Data 0.001 (0.011)	Loss 3.8467 (4.1616)	Top-1 acc 36.328 (27.954)	Top-5 acc 60.938 (51.059)	lr 0.01061
Warmup Train [28][2630/3239]	Time 0.558 (0.515)	Data 0.001 (0.011)	Loss 4.3152 (4.1617)	Top-1 acc 22.266 (27.951)	Top-5 acc 45.703 (51.053)	lr 0.01061
Warmup Train [28][2640/3239]	Time 0.390 (0.515)	Data 0.001 (0.011)	Loss 4.2905 (4.1617)	Top-1 acc 23.828 (27.952)	Top-5 acc 44.922 (51.053)	lr 0.01060
Warmup Train [28][2650/3239]	Time 0.492 (0.515)	Data 0.001 (0.011)	Loss 4.1814 (4.1617)	Top-1 acc 25.781 (27.949)	Top-5 acc 49.219 (51.052)	lr 0.01060
Warmup Train [28][2660/3239]	Time 0.691 (0.515)	Data 0.001 (0.011)	Loss 4.2908 (4.1618)	Top-1 acc 25.391 (27.951)	Top-5 acc 50.000 (51.052)	lr 0.01059
Warmup Train [28][2670/3239]	Time 0.405 (0.515)	Data 0.001 (0.011)	Loss 4.1451 (4.1617)	Top-1 acc 28.906 (27.954)	Top-5 acc 50.391 (51.052)	lr 0.01059
Warmup Train [28][2680/3239]	Time 0.534 (0.515)	Data 0.001 (0.011)	Loss 3.9605 (4.1618)	Top-1 acc 31.250 (27.954)	Top-5 acc 54.297 (51.050)	lr 0.01058
Warmup Train [28][2690/3239]	Time 0.544 (0.515)	Data 0.001 (0.011)	Loss 4.0957 (4.1614)	Top-1 acc 26.562 (27.957)	Top-5 acc 53.125 (51.062)	lr 0.01058
Warmup Train [28][2700/3239]	Time 0.556 (0.515)	Data 0.001 (0.011)	Loss 4.1963 (4.1614)	Top-1 acc 26.172 (27.957)	Top-5 acc 48.438 (51.059)	lr 0.01057
Warmup Train [28][2710/3239]	Time 0.538 (0.515)	Data 0.001 (0.011)	Loss 4.2572 (4.1613)	Top-1 acc 27.344 (27.957)	Top-5 acc 50.781 (51.061)	lr 0.01057
Warmup Train [28][2720/3239]	Time 0.392 (0.515)	Data 0.001 (0.011)	Loss 4.0177 (4.1611)	Top-1 acc 30.469 (27.957)	Top-5 acc 56.641 (51.060)	lr 0.01056
Warmup Train [28][2730/3239]	Time 0.489 (0.515)	Data 0.001 (0.011)	Loss 4.1765 (4.1614)	Top-1 acc 30.859 (27.953)	Top-5 acc 49.609 (51.057)	lr 0.01056
Warmup Train [28][2740/3239]	Time 0.370 (0.515)	Data 0.001 (0.011)	Loss 4.3457 (4.1613)	Top-1 acc 23.047 (27.954)	Top-5 acc 49.219 (51.056)	lr 0.01055
Warmup Train [28][2750/3239]	Time 0.445 (0.515)	Data 0.001 (0.011)	Loss 3.9733 (4.1613)	Top-1 acc 30.078 (27.956)	Top-5 acc 55.859 (51.059)	lr 0.01055
Warmup Train [28][2760/3239]	Time 0.711 (0.515)	Data 0.001 (0.011)	Loss 3.9968 (4.1613)	Top-1 acc 28.516 (27.955)	Top-5 acc 54.297 (51.059)	lr 0.01054
Warmup Train [28][2770/3239]	Time 0.479 (0.515)	Data 0.001 (0.011)	Loss 4.2958 (4.1613)	Top-1 acc 27.734 (27.959)	Top-5 acc 49.219 (51.059)	lr 0.01054
Warmup Train [28][2780/3239]	Time 0.534 (0.515)	Data 0.001 (0.011)	Loss 4.2762 (4.1613)	Top-1 acc 25.391 (27.959)	Top-5 acc 47.656 (51.060)	lr 0.01053
Warmup Train [28][2790/3239]	Time 0.646 (0.515)	Data 0.001 (0.011)	Loss 4.0722 (4.1613)	Top-1 acc 30.859 (27.959)	Top-5 acc 56.641 (51.062)	lr 0.01053
Warmup Train [28][2800/3239]	Time 0.545 (0.515)	Data 0.001 (0.011)	Loss 4.0009 (4.1615)	Top-1 acc 30.859 (27.959)	Top-5 acc 53.125 (51.057)	lr 0.01052
Warmup Train [28][2810/3239]	Time 0.398 (0.515)	Data 0.001 (0.011)	Loss 4.1679 (4.1616)	Top-1 acc 26.562 (27.953)	Top-5 acc 51.953 (51.056)	lr 0.01052
Warmup Train [28][2820/3239]	Time 0.470 (0.515)	Data 0.001 (0.011)	Loss 4.2281 (4.1616)	Top-1 acc 23.828 (27.950)	Top-5 acc 50.781 (51.059)	lr 0.01051
Warmup Train [28][2830/3239]	Time 0.589 (0.515)	Data 0.001 (0.011)	Loss 4.3829 (4.1616)	Top-1 acc 18.359 (27.945)	Top-5 acc 44.531 (51.060)	lr 0.01051
Warmup Train [28][2840/3239]	Time 0.538 (0.515)	Data 0.001 (0.011)	Loss 4.3011 (4.1615)	Top-1 acc 23.438 (27.943)	Top-5 acc 47.656 (51.062)	lr 0.01050
Warmup Train [28][2850/3239]	Time 0.535 (0.515)	Data 0.001 (0.011)	Loss 4.1755 (4.1614)	Top-1 acc 25.781 (27.949)	Top-5 acc 52.734 (51.067)	lr 0.01050
Warmup Train [28][2860/3239]	Time 0.474 (0.515)	Data 0.001 (0.011)	Loss 4.2262 (4.1614)	Top-1 acc 28.125 (27.950)	Top-5 acc 50.781 (51.066)	lr 0.01049
Warmup Train [28][2870/3239]	Time 0.392 (0.515)	Data 0.001 (0.011)	Loss 4.3023 (4.1614)	Top-1 acc 27.734 (27.948)	Top-5 acc 47.656 (51.063)	lr 0.01049
Warmup Train [28][2880/3239]	Time 0.491 (0.515)	Data 0.001 (0.011)	Loss 4.1367 (4.1615)	Top-1 acc 28.125 (27.946)	Top-5 acc 53.125 (51.061)	lr 0.01048
Warmup Train [28][2890/3239]	Time 0.580 (0.515)	Data 0.001 (0.011)	Loss 4.1259 (4.1615)	Top-1 acc 24.609 (27.947)	Top-5 acc 55.469 (51.063)	lr 0.01048
Warmup Train [28][2900/3239]	Time 0.596 (0.515)	Data 0.001 (0.011)	Loss 4.1412 (4.1613)	Top-1 acc 28.125 (27.951)	Top-5 acc 50.391 (51.065)	lr 0.01047
Warmup Train [28][2910/3239]	Time 0.516 (0.515)	Data 0.001 (0.011)	Loss 4.1329 (4.1613)	Top-1 acc 31.250 (27.951)	Top-5 acc 53.125 (51.064)	lr 0.01047
Warmup Train [28][2920/3239]	Time 0.573 (0.515)	Data 0.001 (0.011)	Loss 4.2172 (4.1611)	Top-1 acc 23.828 (27.955)	Top-5 acc 50.000 (51.068)	lr 0.01046
Warmup Train [28][2930/3239]	Time 0.470 (0.515)	Data 0.001 (0.011)	Loss 4.0601 (4.1610)	Top-1 acc 32.812 (27.958)	Top-5 acc 58.594 (51.075)	lr 0.01046
Warmup Train [28][2940/3239]	Time 0.640 (0.515)	Data 0.001 (0.011)	Loss 4.3088 (4.1611)	Top-1 acc 24.219 (27.957)	Top-5 acc 43.359 (51.074)	lr 0.01045
Warmup Train [28][2950/3239]	Time 0.618 (0.515)	Data 0.001 (0.011)	Loss 4.2460 (4.1611)	Top-1 acc 26.953 (27.956)	Top-5 acc 48.438 (51.071)	lr 0.01045
Warmup Train [28][2960/3239]	Time 0.499 (0.515)	Data 0.001 (0.011)	Loss 4.1333 (4.1611)	Top-1 acc 25.781 (27.959)	Top-5 acc 47.266 (51.071)	lr 0.01044
Warmup Train [28][2970/3239]	Time 0.403 (0.515)	Data 0.023 (0.011)	Loss 4.1425 (4.1611)	Top-1 acc 30.078 (27.962)	Top-5 acc 53.516 (51.075)	lr 0.01044
Warmup Train [28][2980/3239]	Time 0.503 (0.515)	Data 0.001 (0.011)	Loss 4.1377 (4.1612)	Top-1 acc 26.562 (27.962)	Top-5 acc 52.344 (51.072)	lr 0.01043
Warmup Train [28][2990/3239]	Time 0.446 (0.515)	Data 0.001 (0.011)	Loss 4.2149 (4.1610)	Top-1 acc 22.656 (27.965)	Top-5 acc 48.828 (51.076)	lr 0.01043
Warmup Train [28][3000/3239]	Time 0.608 (0.515)	Data 0.001 (0.011)	Loss 4.1798 (4.1610)	Top-1 acc 27.734 (27.962)	Top-5 acc 46.094 (51.073)	lr 0.01042
Warmup Train [28][3010/3239]	Time 0.473 (0.515)	Data 0.001 (0.010)	Loss 4.1674 (4.1607)	Top-1 acc 27.344 (27.968)	Top-5 acc 53.125 (51.076)	lr 0.01042
Warmup Train [28][3020/3239]	Time 0.463 (0.515)	Data 0.001 (0.010)	Loss 4.1828 (4.1606)	Top-1 acc 23.828 (27.967)	Top-5 acc 50.000 (51.078)	lr 0.01041
Warmup Train [28][3030/3239]	Time 0.517 (0.514)	Data 0.001 (0.010)	Loss 4.2077 (4.1606)	Top-1 acc 27.344 (27.965)	Top-5 acc 50.391 (51.081)	lr 0.01041
Warmup Train [28][3040/3239]	Time 0.508 (0.514)	Data 0.001 (0.010)	Loss 3.9825 (4.1604)	Top-1 acc 29.297 (27.969)	Top-5 acc 53.906 (51.084)	lr 0.01040
Warmup Train [28][3050/3239]	Time 0.630 (0.514)	Data 0.001 (0.010)	Loss 4.1954 (4.1605)	Top-1 acc 24.609 (27.970)	Top-5 acc 47.656 (51.081)	lr 0.01040
Warmup Train [28][3060/3239]	Time 0.591 (0.514)	Data 0.001 (0.010)	Loss 4.1521 (4.1607)	Top-1 acc 32.031 (27.968)	Top-5 acc 53.125 (51.079)	lr 0.01039
Warmup Train [28][3070/3239]	Time 0.399 (0.514)	Data 0.001 (0.010)	Loss 4.2289 (4.1606)	Top-1 acc 28.516 (27.971)	Top-5 acc 47.266 (51.080)	lr 0.01039
Warmup Train [28][3080/3239]	Time 0.404 (0.514)	Data 0.001 (0.010)	Loss 4.1255 (4.1606)	Top-1 acc 27.734 (27.970)	Top-5 acc 52.734 (51.079)	lr 0.01038
Warmup Train [28][3090/3239]	Time 0.576 (0.514)	Data 0.001 (0.010)	Loss 4.3064 (4.1607)	Top-1 acc 25.391 (27.968)	Top-5 acc 46.875 (51.076)	lr 0.01038
Warmup Train [28][3100/3239]	Time 0.431 (0.514)	Data 0.001 (0.010)	Loss 4.1188 (4.1605)	Top-1 acc 29.688 (27.973)	Top-5 acc 49.219 (51.077)	lr 0.01037
Warmup Train [28][3110/3239]	Time 0.462 (0.514)	Data 0.001 (0.010)	Loss 4.2892 (4.1604)	Top-1 acc 26.172 (27.975)	Top-5 acc 50.781 (51.078)	lr 0.01037
Warmup Train [28][3120/3239]	Time 0.529 (0.514)	Data 0.002 (0.010)	Loss 4.0374 (4.1605)	Top-1 acc 25.391 (27.968)	Top-5 acc 53.125 (51.071)	lr 0.01036
Warmup Train [28][3130/3239]	Time 0.573 (0.514)	Data 0.001 (0.010)	Loss 4.0976 (4.1604)	Top-1 acc 26.562 (27.969)	Top-5 acc 51.172 (51.072)	lr 0.01036
Warmup Train [28][3140/3239]	Time 0.404 (0.514)	Data 0.001 (0.010)	Loss 4.0017 (4.1602)	Top-1 acc 32.812 (27.974)	Top-5 acc 55.078 (51.077)	lr 0.01035
Warmup Train [28][3150/3239]	Time 0.460 (0.514)	Data 0.001 (0.010)	Loss 4.2209 (4.1603)	Top-1 acc 26.172 (27.972)	Top-5 acc 50.000 (51.076)	lr 0.01035
Warmup Train [28][3160/3239]	Time 0.759 (0.514)	Data 0.001 (0.010)	Loss 4.1425 (4.1602)	Top-1 acc 28.516 (27.973)	Top-5 acc 54.297 (51.077)	lr 0.01034
Warmup Train [28][3170/3239]	Time 0.564 (0.514)	Data 0.001 (0.010)	Loss 4.0737 (4.1599)	Top-1 acc 28.516 (27.982)	Top-5 acc 51.562 (51.080)	lr 0.01034
Warmup Train [28][3180/3239]	Time 0.695 (0.514)	Data 0.000 (0.010)	Loss 4.3774 (4.1600)	Top-1 acc 23.828 (27.980)	Top-5 acc 44.922 (51.077)	lr 0.01033
Warmup Train [28][3190/3239]	Time 0.367 (0.514)	Data 0.000 (0.010)	Loss 3.9429 (4.1600)	Top-1 acc 33.203 (27.982)	Top-5 acc 57.812 (51.077)	lr 0.01033
Warmup Train [28][3200/3239]	Time 0.556 (0.514)	Data 0.000 (0.010)	Loss 4.0702 (4.1600)	Top-1 acc 29.688 (27.984)	Top-5 acc 54.297 (51.080)	lr 0.01032
Warmup Train [28][3210/3239]	Time 0.315 (0.514)	Data 0.000 (0.010)	Loss 4.0687 (4.1599)	Top-1 acc 31.250 (27.984)	Top-5 acc 53.125 (51.083)	lr 0.01032
Warmup Train [28][3220/3239]	Time 0.458 (0.514)	Data 0.000 (0.010)	Loss 4.2201 (4.1599)	Top-1 acc 24.219 (27.981)	Top-5 acc 48.828 (51.084)	lr 0.01032
Warmup Train [28][3230/3239]	Time 0.282 (0.514)	Data 0.000 (0.010)	Loss 4.0643 (4.1599)	Top-1 acc 30.078 (27.984)	Top-5 acc 51.562 (51.085)	lr 0.01031
Warmup Train [28][3239/3239]	Time 0.410 (0.514)	Data 0.000 (0.010)	Loss 4.2428 (4.1599)	Top-1 acc 25.926 (27.982)	Top-5 acc 48.148 (51.081)	lr 0.01031
==========Warmup Valid [28/40]	loss 3.119	top-1 acc 35.593	top-5 acc 60.243	Train top-1 27.982	top-5 51.081	flops: 442.4M
Warmup Train [29][0/3239]	Time 16.048 (16.048)	Data 14.657 (14.657)	Loss 4.2961 (4.2961)	Top-1 acc 26.953 (26.953)	Top-5 acc 48.047 (48.047)	lr 0.01031
Warmup Train [29][10/3239]	Time 0.475 (1.960)	Data 0.001 (1.335)	Loss 4.0820 (4.1215)	Top-1 acc 29.297 (28.587)	Top-5 acc 54.297 (51.634)	lr 0.01030
Warmup Train [29][20/3239]	Time 0.437 (1.274)	Data 0.001 (0.703)	Loss 3.9664 (4.1502)	Top-1 acc 32.031 (28.757)	Top-5 acc 53.516 (50.986)	lr 0.01030
Warmup Train [29][30/3239]	Time 0.516 (1.032)	Data 0.001 (0.479)	Loss 4.2247 (4.1487)	Top-1 acc 28.516 (28.591)	Top-5 acc 50.391 (51.008)	lr 0.01029
Warmup Train [29][40/3239]	Time 0.404 (0.901)	Data 0.001 (0.363)	Loss 4.0656 (4.1308)	Top-1 acc 27.344 (28.620)	Top-5 acc 54.688 (51.562)	lr 0.01029
Warmup Train [29][50/3239]	Time 0.175 (0.824)	Data 0.001 (0.294)	Loss 4.3031 (4.1414)	Top-1 acc 25.000 (28.370)	Top-5 acc 49.219 (51.294)	lr 0.01028
Warmup Train [29][60/3239]	Time 0.448 (0.769)	Data 0.002 (0.249)	Loss 4.0162 (4.1431)	Top-1 acc 28.906 (28.330)	Top-5 acc 51.953 (51.197)	lr 0.01028
Warmup Train [29][70/3239]	Time 0.350 (0.726)	Data 0.001 (0.216)	Loss 4.1444 (4.1423)	Top-1 acc 29.297 (28.279)	Top-5 acc 52.734 (51.381)	lr 0.01027
Warmup Train [29][80/3239]	Time 0.497 (0.698)	Data 0.001 (0.191)	Loss 4.1325 (4.1390)	Top-1 acc 25.781 (28.323)	Top-5 acc 50.000 (51.408)	lr 0.01027
Warmup Train [29][90/3239]	Time 0.564 (0.675)	Data 0.001 (0.171)	Loss 4.1368 (4.1379)	Top-1 acc 29.297 (28.331)	Top-5 acc 53.125 (51.511)	lr 0.01026
Warmup Train [29][100/3239]	Time 0.599 (0.659)	Data 0.001 (0.154)	Loss 4.1007 (4.1416)	Top-1 acc 28.906 (28.210)	Top-5 acc 48.438 (51.404)	lr 0.01026
Warmup Train [29][110/3239]	Time 0.712 (0.646)	Data 0.001 (0.140)	Loss 4.0341 (4.1409)	Top-1 acc 28.906 (28.322)	Top-5 acc 51.953 (51.401)	lr 0.01025
Warmup Train [29][120/3239]	Time 0.549 (0.636)	Data 0.001 (0.129)	Loss 4.0149 (4.1422)	Top-1 acc 32.422 (28.364)	Top-5 acc 52.734 (51.327)	lr 0.01025
Warmup Train [29][130/3239]	Time 0.660 (0.626)	Data 0.001 (0.120)	Loss 4.1756 (4.1442)	Top-1 acc 25.000 (28.259)	Top-5 acc 50.000 (51.363)	lr 0.01024
Warmup Train [29][140/3239]	Time 0.667 (0.620)	Data 0.001 (0.112)	Loss 4.1475 (4.1451)	Top-1 acc 28.125 (28.261)	Top-5 acc 53.125 (51.321)	lr 0.01024
Warmup Train [29][150/3239]	Time 0.542 (0.613)	Data 0.001 (0.104)	Loss 4.0272 (4.1435)	Top-1 acc 31.250 (28.249)	Top-5 acc 56.641 (51.381)	lr 0.01023
Warmup Train [29][160/3239]	Time 0.487 (0.608)	Data 0.001 (0.098)	Loss 4.0552 (4.1431)	Top-1 acc 26.562 (28.244)	Top-5 acc 53.906 (51.356)	lr 0.01023
Warmup Train [29][170/3239]	Time 0.604 (0.604)	Data 0.001 (0.093)	Loss 4.2062 (4.1429)	Top-1 acc 28.125 (28.223)	Top-5 acc 48.438 (51.357)	lr 0.01022
Warmup Train [29][180/3239]	Time 0.565 (0.598)	Data 0.001 (0.088)	Loss 3.9941 (4.1417)	Top-1 acc 33.594 (28.267)	Top-5 acc 53.516 (51.370)	lr 0.01022
Warmup Train [29][190/3239]	Time 0.571 (0.596)	Data 0.001 (0.083)	Loss 4.0086 (4.1392)	Top-1 acc 26.953 (28.295)	Top-5 acc 55.859 (51.428)	lr 0.01021
Warmup Train [29][200/3239]	Time 0.593 (0.592)	Data 0.001 (0.079)	Loss 4.1050 (4.1387)	Top-1 acc 30.469 (28.271)	Top-5 acc 53.125 (51.413)	lr 0.01021
Warmup Train [29][210/3239]	Time 0.569 (0.589)	Data 0.001 (0.076)	Loss 3.9919 (4.1377)	Top-1 acc 29.688 (28.290)	Top-5 acc 55.469 (51.483)	lr 0.01020
Warmup Train [29][220/3239]	Time 0.501 (0.585)	Data 0.001 (0.072)	Loss 4.1642 (4.1359)	Top-1 acc 28.516 (28.348)	Top-5 acc 51.953 (51.555)	lr 0.01020
Warmup Train [29][230/3239]	Time 0.542 (0.582)	Data 0.001 (0.069)	Loss 4.0902 (4.1357)	Top-1 acc 27.734 (28.367)	Top-5 acc 50.391 (51.564)	lr 0.01019
Warmup Train [29][240/3239]	Time 0.531 (0.580)	Data 0.001 (0.067)	Loss 4.0300 (4.1350)	Top-1 acc 32.031 (28.386)	Top-5 acc 53.125 (51.553)	lr 0.01019
Warmup Train [29][250/3239]	Time 0.501 (0.577)	Data 0.001 (0.064)	Loss 4.0531 (4.1339)	Top-1 acc 30.859 (28.427)	Top-5 acc 55.469 (51.601)	lr 0.01018
Warmup Train [29][260/3239]	Time 0.492 (0.575)	Data 0.001 (0.062)	Loss 4.0657 (4.1348)	Top-1 acc 33.984 (28.417)	Top-5 acc 54.297 (51.585)	lr 0.01018
Warmup Train [29][270/3239]	Time 0.495 (0.572)	Data 0.001 (0.059)	Loss 4.2791 (4.1329)	Top-1 acc 28.125 (28.454)	Top-5 acc 50.781 (51.610)	lr 0.01017
Warmup Train [29][280/3239]	Time 0.475 (0.570)	Data 0.001 (0.058)	Loss 4.0604 (4.1333)	Top-1 acc 30.078 (28.454)	Top-5 acc 51.562 (51.622)	lr 0.01017
Warmup Train [29][290/3239]	Time 0.540 (0.568)	Data 0.001 (0.056)	Loss 4.1837 (4.1345)	Top-1 acc 24.609 (28.414)	Top-5 acc 51.172 (51.628)	lr 0.01016
Warmup Train [29][300/3239]	Time 0.485 (0.566)	Data 0.001 (0.055)	Loss 4.2713 (4.1350)	Top-1 acc 30.078 (28.431)	Top-5 acc 50.391 (51.627)	lr 0.01016
Warmup Train [29][310/3239]	Time 0.427 (0.563)	Data 0.001 (0.053)	Loss 4.3086 (4.1359)	Top-1 acc 27.344 (28.435)	Top-5 acc 50.000 (51.605)	lr 0.01015
Warmup Train [29][320/3239]	Time 0.447 (0.561)	Data 0.001 (0.052)	Loss 4.1481 (4.1373)	Top-1 acc 26.953 (28.411)	Top-5 acc 53.906 (51.577)	lr 0.01015
Warmup Train [29][330/3239]	Time 0.426 (0.559)	Data 0.001 (0.050)	Loss 4.1480 (4.1379)	Top-1 acc 28.125 (28.435)	Top-5 acc 53.906 (51.593)	lr 0.01014
Warmup Train [29][340/3239]	Time 0.546 (0.556)	Data 0.001 (0.049)	Loss 3.9760 (4.1365)	Top-1 acc 31.250 (28.469)	Top-5 acc 52.734 (51.597)	lr 0.01014
Warmup Train [29][350/3239]	Time 0.506 (0.554)	Data 0.001 (0.048)	Loss 4.1792 (4.1371)	Top-1 acc 30.078 (28.473)	Top-5 acc 50.391 (51.557)	lr 0.01013
Warmup Train [29][360/3239]	Time 0.502 (0.553)	Data 0.001 (0.046)	Loss 4.3767 (4.1381)	Top-1 acc 24.609 (28.464)	Top-5 acc 47.656 (51.514)	lr 0.01013
Warmup Train [29][370/3239]	Time 0.532 (0.551)	Data 0.001 (0.045)	Loss 4.0349 (4.1387)	Top-1 acc 30.859 (28.440)	Top-5 acc 55.078 (51.495)	lr 0.01012
Warmup Train [29][380/3239]	Time 0.457 (0.550)	Data 0.001 (0.044)	Loss 4.2927 (4.1374)	Top-1 acc 28.125 (28.459)	Top-5 acc 50.781 (51.550)	lr 0.01012
Warmup Train [29][390/3239]	Time 0.618 (0.550)	Data 0.001 (0.043)	Loss 3.9724 (4.1378)	Top-1 acc 33.203 (28.477)	Top-5 acc 55.469 (51.546)	lr 0.01011
Warmup Train [29][400/3239]	Time 0.497 (0.550)	Data 0.001 (0.042)	Loss 4.1677 (4.1374)	Top-1 acc 28.125 (28.496)	Top-5 acc 51.172 (51.578)	lr 0.01011
Warmup Train [29][410/3239]	Time 0.567 (0.550)	Data 0.001 (0.042)	Loss 4.1710 (4.1365)	Top-1 acc 31.250 (28.511)	Top-5 acc 52.734 (51.608)	lr 0.01011
Warmup Train [29][420/3239]	Time 0.427 (0.549)	Data 0.001 (0.041)	Loss 4.2013 (4.1360)	Top-1 acc 25.391 (28.543)	Top-5 acc 52.344 (51.624)	lr 0.01010
Warmup Train [29][430/3239]	Time 0.510 (0.549)	Data 0.001 (0.040)	Loss 4.1182 (4.1361)	Top-1 acc 31.641 (28.547)	Top-5 acc 51.953 (51.623)	lr 0.01010
Warmup Train [29][440/3239]	Time 0.349 (0.547)	Data 0.001 (0.039)	Loss 4.1179 (4.1364)	Top-1 acc 28.906 (28.535)	Top-5 acc 48.828 (51.627)	lr 0.01009
Warmup Train [29][450/3239]	Time 0.673 (0.547)	Data 0.001 (0.039)	Loss 4.1398 (4.1371)	Top-1 acc 25.781 (28.478)	Top-5 acc 53.516 (51.608)	lr 0.01009
Warmup Train [29][460/3239]	Time 0.555 (0.546)	Data 0.001 (0.038)	Loss 4.0928 (4.1366)	Top-1 acc 31.250 (28.515)	Top-5 acc 52.344 (51.610)	lr 0.01008
Warmup Train [29][470/3239]	Time 0.609 (0.546)	Data 0.001 (0.037)	Loss 4.0399 (4.1360)	Top-1 acc 32.422 (28.543)	Top-5 acc 52.344 (51.619)	lr 0.01008
Warmup Train [29][480/3239]	Time 0.529 (0.545)	Data 0.001 (0.036)	Loss 4.2822 (4.1358)	Top-1 acc 21.875 (28.525)	Top-5 acc 45.703 (51.636)	lr 0.01007
Warmup Train [29][490/3239]	Time 0.636 (0.544)	Data 0.001 (0.036)	Loss 4.2472 (4.1373)	Top-1 acc 28.125 (28.489)	Top-5 acc 48.438 (51.596)	lr 0.01007
Warmup Train [29][500/3239]	Time 0.604 (0.543)	Data 0.001 (0.035)	Loss 4.0877 (4.1371)	Top-1 acc 28.125 (28.476)	Top-5 acc 53.125 (51.610)	lr 0.01006
Warmup Train [29][510/3239]	Time 0.507 (0.543)	Data 0.001 (0.034)	Loss 4.1826 (4.1375)	Top-1 acc 26.562 (28.464)	Top-5 acc 50.781 (51.620)	lr 0.01006
Warmup Train [29][520/3239]	Time 0.552 (0.543)	Data 0.001 (0.034)	Loss 4.0993 (4.1367)	Top-1 acc 29.688 (28.480)	Top-5 acc 55.078 (51.647)	lr 0.01005
Warmup Train [29][530/3239]	Time 0.369 (0.542)	Data 0.001 (0.033)	Loss 4.1633 (4.1358)	Top-1 acc 27.734 (28.500)	Top-5 acc 48.438 (51.682)	lr 0.01005
Warmup Train [29][540/3239]	Time 0.525 (0.542)	Data 0.001 (0.033)	Loss 4.0738 (4.1351)	Top-1 acc 30.469 (28.512)	Top-5 acc 55.469 (51.698)	lr 0.01004
Warmup Train [29][550/3239]	Time 0.654 (0.541)	Data 0.001 (0.032)	Loss 4.2380 (4.1361)	Top-1 acc 27.344 (28.490)	Top-5 acc 50.391 (51.679)	lr 0.01004
Warmup Train [29][560/3239]	Time 0.503 (0.540)	Data 0.001 (0.032)	Loss 4.2922 (4.1368)	Top-1 acc 28.516 (28.492)	Top-5 acc 49.219 (51.666)	lr 0.01003
Warmup Train [29][570/3239]	Time 0.551 (0.539)	Data 0.001 (0.031)	Loss 4.1700 (4.1356)	Top-1 acc 27.344 (28.520)	Top-5 acc 47.266 (51.702)	lr 0.01003
Warmup Train [29][580/3239]	Time 0.469 (0.538)	Data 0.001 (0.031)	Loss 4.1876 (4.1358)	Top-1 acc 28.906 (28.514)	Top-5 acc 51.953 (51.687)	lr 0.01002
Warmup Train [29][590/3239]	Time 0.571 (0.537)	Data 0.001 (0.031)	Loss 4.1952 (4.1361)	Top-1 acc 25.781 (28.481)	Top-5 acc 50.000 (51.676)	lr 0.01002
Warmup Train [29][600/3239]	Time 0.509 (0.537)	Data 0.001 (0.030)	Loss 4.1595 (4.1350)	Top-1 acc 27.734 (28.509)	Top-5 acc 49.219 (51.696)	lr 0.01001
Warmup Train [29][610/3239]	Time 0.384 (0.536)	Data 0.001 (0.030)	Loss 4.3305 (4.1345)	Top-1 acc 21.484 (28.519)	Top-5 acc 47.656 (51.710)	lr 0.01001
Warmup Train [29][620/3239]	Time 0.546 (0.536)	Data 0.001 (0.029)	Loss 4.0767 (4.1351)	Top-1 acc 30.469 (28.475)	Top-5 acc 53.125 (51.675)	lr 0.01000
Warmup Train [29][630/3239]	Time 0.532 (0.535)	Data 0.002 (0.029)	Loss 4.3931 (4.1356)	Top-1 acc 24.219 (28.475)	Top-5 acc 47.656 (51.655)	lr 0.01000
Warmup Train [29][640/3239]	Time 0.456 (0.534)	Data 0.001 (0.029)	Loss 4.1095 (4.1353)	Top-1 acc 29.297 (28.483)	Top-5 acc 53.906 (51.651)	lr 0.00999
Warmup Train [29][650/3239]	Time 0.387 (0.534)	Data 0.001 (0.028)	Loss 4.3528 (4.1356)	Top-1 acc 22.656 (28.468)	Top-5 acc 42.969 (51.660)	lr 0.00999
Warmup Train [29][660/3239]	Time 0.460 (0.533)	Data 0.001 (0.028)	Loss 4.0584 (4.1358)	Top-1 acc 29.297 (28.470)	Top-5 acc 57.031 (51.652)	lr 0.00998
Warmup Train [29][670/3239]	Time 0.577 (0.533)	Data 0.001 (0.028)	Loss 4.1408 (4.1367)	Top-1 acc 29.688 (28.447)	Top-5 acc 50.391 (51.636)	lr 0.00998
Warmup Train [29][680/3239]	Time 0.557 (0.533)	Data 0.001 (0.027)	Loss 3.9990 (4.1359)	Top-1 acc 29.688 (28.449)	Top-5 acc 55.078 (51.642)	lr 0.00997
Warmup Train [29][690/3239]	Time 0.555 (0.533)	Data 0.001 (0.027)	Loss 4.2590 (4.1360)	Top-1 acc 28.125 (28.436)	Top-5 acc 46.094 (51.627)	lr 0.00997
Warmup Train [29][700/3239]	Time 0.500 (0.533)	Data 0.001 (0.027)	Loss 4.1505 (4.1360)	Top-1 acc 28.906 (28.443)	Top-5 acc 52.734 (51.635)	lr 0.00996
Warmup Train [29][710/3239]	Time 0.467 (0.532)	Data 0.001 (0.027)	Loss 4.0592 (4.1357)	Top-1 acc 28.906 (28.451)	Top-5 acc 55.469 (51.651)	lr 0.00996
Warmup Train [29][720/3239]	Time 0.538 (0.532)	Data 0.001 (0.026)	Loss 4.2133 (4.1351)	Top-1 acc 28.125 (28.453)	Top-5 acc 53.125 (51.665)	lr 0.00995
Warmup Train [29][730/3239]	Time 0.518 (0.532)	Data 0.001 (0.026)	Loss 4.1544 (4.1352)	Top-1 acc 29.688 (28.464)	Top-5 acc 50.781 (51.672)	lr 0.00995
Warmup Train [29][740/3239]	Time 0.352 (0.532)	Data 0.001 (0.026)	Loss 4.1493 (4.1348)	Top-1 acc 26.953 (28.469)	Top-5 acc 52.734 (51.675)	lr 0.00994
Warmup Train [29][750/3239]	Time 0.600 (0.532)	Data 0.001 (0.026)	Loss 4.0486 (4.1348)	Top-1 acc 28.125 (28.440)	Top-5 acc 54.688 (51.681)	lr 0.00994
Warmup Train [29][760/3239]	Time 0.437 (0.532)	Data 0.001 (0.025)	Loss 4.1388 (4.1350)	Top-1 acc 31.641 (28.451)	Top-5 acc 50.781 (51.677)	lr 0.00994
Warmup Train [29][770/3239]	Time 0.488 (0.531)	Data 0.001 (0.025)	Loss 3.8396 (4.1350)	Top-1 acc 33.203 (28.456)	Top-5 acc 59.766 (51.678)	lr 0.00993
Warmup Train [29][780/3239]	Time 0.541 (0.531)	Data 0.001 (0.025)	Loss 4.0741 (4.1353)	Top-1 acc 29.297 (28.448)	Top-5 acc 55.859 (51.671)	lr 0.00993
Warmup Train [29][790/3239]	Time 0.597 (0.531)	Data 0.001 (0.024)	Loss 4.1734 (4.1358)	Top-1 acc 28.906 (28.435)	Top-5 acc 52.734 (51.650)	lr 0.00992
Warmup Train [29][800/3239]	Time 0.782 (0.530)	Data 0.001 (0.024)	Loss 4.1553 (4.1352)	Top-1 acc 26.562 (28.450)	Top-5 acc 50.391 (51.660)	lr 0.00992
Warmup Train [29][810/3239]	Time 0.558 (0.529)	Data 0.001 (0.024)	Loss 3.9858 (4.1356)	Top-1 acc 34.766 (28.436)	Top-5 acc 53.906 (51.652)	lr 0.00991
Warmup Train [29][820/3239]	Time 0.226 (0.528)	Data 0.001 (0.024)	Loss 4.1191 (4.1362)	Top-1 acc 25.000 (28.417)	Top-5 acc 51.172 (51.641)	lr 0.00991
Warmup Train [29][830/3239]	Time 0.402 (0.528)	Data 0.001 (0.023)	Loss 4.1046 (4.1361)	Top-1 acc 30.078 (28.422)	Top-5 acc 52.344 (51.652)	lr 0.00990
Warmup Train [29][840/3239]	Time 0.551 (0.528)	Data 0.001 (0.023)	Loss 4.0077 (4.1363)	Top-1 acc 30.469 (28.404)	Top-5 acc 56.641 (51.638)	lr 0.00990
Warmup Train [29][850/3239]	Time 0.521 (0.528)	Data 0.001 (0.023)	Loss 4.0304 (4.1367)	Top-1 acc 29.297 (28.389)	Top-5 acc 51.953 (51.623)	lr 0.00989
Warmup Train [29][860/3239]	Time 0.492 (0.527)	Data 0.001 (0.023)	Loss 4.0840 (4.1370)	Top-1 acc 28.906 (28.375)	Top-5 acc 51.953 (51.600)	lr 0.00989
Warmup Train [29][870/3239]	Time 0.566 (0.527)	Data 0.001 (0.023)	Loss 3.9841 (4.1372)	Top-1 acc 28.516 (28.372)	Top-5 acc 55.859 (51.605)	lr 0.00988
Warmup Train [29][880/3239]	Time 0.453 (0.527)	Data 0.001 (0.022)	Loss 4.2455 (4.1380)	Top-1 acc 26.562 (28.347)	Top-5 acc 53.906 (51.594)	lr 0.00988
Warmup Train [29][890/3239]	Time 0.639 (0.527)	Data 0.001 (0.022)	Loss 4.0541 (4.1378)	Top-1 acc 31.641 (28.347)	Top-5 acc 53.125 (51.594)	lr 0.00987
Warmup Train [29][900/3239]	Time 0.594 (0.527)	Data 0.001 (0.022)	Loss 4.1088 (4.1379)	Top-1 acc 27.344 (28.357)	Top-5 acc 51.562 (51.601)	lr 0.00987
Warmup Train [29][910/3239]	Time 0.583 (0.527)	Data 0.001 (0.022)	Loss 3.9192 (4.1368)	Top-1 acc 34.375 (28.377)	Top-5 acc 55.469 (51.627)	lr 0.00986
Warmup Train [29][920/3239]	Time 0.549 (0.526)	Data 0.001 (0.022)	Loss 4.2446 (4.1371)	Top-1 acc 26.953 (28.368)	Top-5 acc 50.391 (51.620)	lr 0.00986
Warmup Train [29][930/3239]	Time 0.462 (0.526)	Data 0.024 (0.022)	Loss 3.8739 (4.1368)	Top-1 acc 33.594 (28.375)	Top-5 acc 58.203 (51.630)	lr 0.00985
Warmup Train [29][940/3239]	Time 0.358 (0.526)	Data 0.001 (0.021)	Loss 4.1713 (4.1363)	Top-1 acc 27.734 (28.384)	Top-5 acc 51.172 (51.637)	lr 0.00985
Warmup Train [29][950/3239]	Time 0.553 (0.525)	Data 0.001 (0.021)	Loss 4.0026 (4.1360)	Top-1 acc 31.250 (28.390)	Top-5 acc 52.344 (51.635)	lr 0.00984
Warmup Train [29][960/3239]	Time 0.522 (0.525)	Data 0.001 (0.021)	Loss 4.2516 (4.1358)	Top-1 acc 26.172 (28.396)	Top-5 acc 50.391 (51.643)	lr 0.00984
Warmup Train [29][970/3239]	Time 0.334 (0.525)	Data 0.001 (0.021)	Loss 3.9910 (4.1353)	Top-1 acc 30.859 (28.405)	Top-5 acc 52.734 (51.649)	lr 0.00983
Warmup Train [29][980/3239]	Time 0.563 (0.525)	Data 0.001 (0.021)	Loss 4.0974 (4.1356)	Top-1 acc 23.828 (28.406)	Top-5 acc 52.344 (51.640)	lr 0.00983
Warmup Train [29][990/3239]	Time 0.521 (0.525)	Data 0.001 (0.021)	Loss 4.1302 (4.1352)	Top-1 acc 27.344 (28.412)	Top-5 acc 51.562 (51.650)	lr 0.00982
Warmup Train [29][1000/3239]	Time 0.537 (0.525)	Data 0.001 (0.020)	Loss 3.9683 (4.1351)	Top-1 acc 30.469 (28.408)	Top-5 acc 54.688 (51.653)	lr 0.00982
Warmup Train [29][1010/3239]	Time 0.521 (0.525)	Data 0.001 (0.020)	Loss 4.2604 (4.1348)	Top-1 acc 25.000 (28.418)	Top-5 acc 49.219 (51.661)	lr 0.00981
Warmup Train [29][1020/3239]	Time 0.463 (0.525)	Data 0.002 (0.020)	Loss 4.4024 (4.1350)	Top-1 acc 23.438 (28.413)	Top-5 acc 42.969 (51.641)	lr 0.00981
Warmup Train [29][1030/3239]	Time 0.503 (0.525)	Data 0.001 (0.020)	Loss 4.2353 (4.1353)	Top-1 acc 25.391 (28.400)	Top-5 acc 47.656 (51.630)	lr 0.00981
Warmup Train [29][1040/3239]	Time 0.529 (0.525)	Data 0.001 (0.020)	Loss 4.2996 (4.1356)	Top-1 acc 28.516 (28.403)	Top-5 acc 51.562 (51.635)	lr 0.00980
Warmup Train [29][1050/3239]	Time 0.482 (0.524)	Data 0.001 (0.020)	Loss 4.2544 (4.1361)	Top-1 acc 25.000 (28.389)	Top-5 acc 50.781 (51.625)	lr 0.00980
Warmup Train [29][1060/3239]	Time 0.439 (0.524)	Data 0.001 (0.020)	Loss 4.3442 (4.1356)	Top-1 acc 22.266 (28.406)	Top-5 acc 44.531 (51.632)	lr 0.00979
Warmup Train [29][1070/3239]	Time 0.207 (0.522)	Data 0.001 (0.019)	Loss 4.0764 (4.1354)	Top-1 acc 29.688 (28.409)	Top-5 acc 55.859 (51.645)	lr 0.00979
Warmup Train [29][1080/3239]	Time 0.276 (0.521)	Data 0.001 (0.019)	Loss 3.9572 (4.1355)	Top-1 acc 33.594 (28.402)	Top-5 acc 53.906 (51.633)	lr 0.00978
Warmup Train [29][1090/3239]	Time 0.378 (0.520)	Data 0.001 (0.019)	Loss 4.2300 (4.1356)	Top-1 acc 21.094 (28.393)	Top-5 acc 50.781 (51.635)	lr 0.00978
Warmup Train [29][1100/3239]	Time 0.537 (0.519)	Data 0.001 (0.019)	Loss 4.0723 (4.1353)	Top-1 acc 27.734 (28.395)	Top-5 acc 51.172 (51.637)	lr 0.00977
Warmup Train [29][1110/3239]	Time 0.516 (0.519)	Data 0.001 (0.019)	Loss 3.9984 (4.1351)	Top-1 acc 32.031 (28.402)	Top-5 acc 51.953 (51.637)	lr 0.00977
Warmup Train [29][1120/3239]	Time 0.635 (0.519)	Data 0.001 (0.019)	Loss 4.2016 (4.1349)	Top-1 acc 26.172 (28.405)	Top-5 acc 46.875 (51.638)	lr 0.00976
Warmup Train [29][1130/3239]	Time 0.621 (0.519)	Data 0.001 (0.019)	Loss 4.2663 (4.1354)	Top-1 acc 28.516 (28.400)	Top-5 acc 49.609 (51.626)	lr 0.00976
Warmup Train [29][1140/3239]	Time 0.664 (0.519)	Data 0.001 (0.019)	Loss 4.1521 (4.1357)	Top-1 acc 30.078 (28.404)	Top-5 acc 50.391 (51.619)	lr 0.00975
Warmup Train [29][1150/3239]	Time 0.472 (0.519)	Data 0.001 (0.019)	Loss 4.2708 (4.1362)	Top-1 acc 30.078 (28.395)	Top-5 acc 49.219 (51.602)	lr 0.00975
Warmup Train [29][1160/3239]	Time 0.322 (0.519)	Data 0.001 (0.019)	Loss 4.1060 (4.1365)	Top-1 acc 25.781 (28.384)	Top-5 acc 54.297 (51.592)	lr 0.00974
Warmup Train [29][1170/3239]	Time 0.421 (0.519)	Data 0.001 (0.019)	Loss 3.9999 (4.1365)	Top-1 acc 30.469 (28.394)	Top-5 acc 51.172 (51.584)	lr 0.00974
Warmup Train [29][1180/3239]	Time 0.547 (0.519)	Data 0.001 (0.018)	Loss 4.2038 (4.1360)	Top-1 acc 23.047 (28.394)	Top-5 acc 50.781 (51.601)	lr 0.00973
Warmup Train [29][1190/3239]	Time 0.615 (0.519)	Data 0.001 (0.018)	Loss 4.1851 (4.1355)	Top-1 acc 27.344 (28.402)	Top-5 acc 51.953 (51.622)	lr 0.00973
Warmup Train [29][1200/3239]	Time 0.510 (0.519)	Data 0.001 (0.018)	Loss 4.2048 (4.1358)	Top-1 acc 25.781 (28.400)	Top-5 acc 46.484 (51.607)	lr 0.00972
Warmup Train [29][1210/3239]	Time 0.664 (0.519)	Data 0.001 (0.018)	Loss 4.2779 (4.1363)	Top-1 acc 26.562 (28.389)	Top-5 acc 48.828 (51.590)	lr 0.00972
Warmup Train [29][1220/3239]	Time 0.421 (0.519)	Data 0.001 (0.018)	Loss 4.1388 (4.1357)	Top-1 acc 30.469 (28.402)	Top-5 acc 50.391 (51.602)	lr 0.00971
Warmup Train [29][1230/3239]	Time 0.626 (0.518)	Data 0.001 (0.018)	Loss 4.0861 (4.1360)	Top-1 acc 27.734 (28.397)	Top-5 acc 51.953 (51.597)	lr 0.00971
Warmup Train [29][1240/3239]	Time 0.555 (0.518)	Data 0.002 (0.018)	Loss 3.9843 (4.1359)	Top-1 acc 30.859 (28.395)	Top-5 acc 56.250 (51.602)	lr 0.00970
Warmup Train [29][1250/3239]	Time 0.606 (0.518)	Data 0.002 (0.018)	Loss 3.8853 (4.1355)	Top-1 acc 31.250 (28.402)	Top-5 acc 57.031 (51.621)	lr 0.00970
Warmup Train [29][1260/3239]	Time 0.428 (0.518)	Data 0.001 (0.018)	Loss 4.0808 (4.1354)	Top-1 acc 32.422 (28.411)	Top-5 acc 51.562 (51.620)	lr 0.00969
Warmup Train [29][1270/3239]	Time 0.623 (0.518)	Data 0.001 (0.018)	Loss 4.0184 (4.1353)	Top-1 acc 28.906 (28.416)	Top-5 acc 54.688 (51.619)	lr 0.00969
Warmup Train [29][1280/3239]	Time 0.481 (0.518)	Data 0.001 (0.017)	Loss 4.1325 (4.1349)	Top-1 acc 26.172 (28.422)	Top-5 acc 52.734 (51.631)	lr 0.00968
Warmup Train [29][1290/3239]	Time 0.544 (0.518)	Data 0.001 (0.017)	Loss 4.1952 (4.1355)	Top-1 acc 24.609 (28.411)	Top-5 acc 51.172 (51.626)	lr 0.00968
Warmup Train [29][1300/3239]	Time 0.494 (0.518)	Data 0.001 (0.017)	Loss 4.1907 (4.1354)	Top-1 acc 25.000 (28.409)	Top-5 acc 50.391 (51.630)	lr 0.00968
Warmup Train [29][1310/3239]	Time 0.336 (0.518)	Data 0.001 (0.017)	Loss 4.2888 (4.1357)	Top-1 acc 25.000 (28.406)	Top-5 acc 49.219 (51.624)	lr 0.00967
Warmup Train [29][1320/3239]	Time 0.374 (0.518)	Data 0.001 (0.017)	Loss 4.2916 (4.1360)	Top-1 acc 23.047 (28.404)	Top-5 acc 45.312 (51.621)	lr 0.00967
Warmup Train [29][1330/3239]	Time 0.497 (0.517)	Data 0.001 (0.017)	Loss 4.1273 (4.1366)	Top-1 acc 26.953 (28.403)	Top-5 acc 50.781 (51.606)	lr 0.00966
Warmup Train [29][1340/3239]	Time 0.461 (0.517)	Data 0.001 (0.017)	Loss 4.0759 (4.1368)	Top-1 acc 26.562 (28.405)	Top-5 acc 53.516 (51.602)	lr 0.00966
Warmup Train [29][1350/3239]	Time 0.655 (0.517)	Data 0.001 (0.017)	Loss 4.1172 (4.1369)	Top-1 acc 32.422 (28.409)	Top-5 acc 50.000 (51.599)	lr 0.00965
Warmup Train [29][1360/3239]	Time 0.645 (0.517)	Data 0.001 (0.017)	Loss 4.0628 (4.1368)	Top-1 acc 31.250 (28.421)	Top-5 acc 52.344 (51.599)	lr 0.00965
Warmup Train [29][1370/3239]	Time 0.643 (0.517)	Data 0.001 (0.017)	Loss 3.8682 (4.1369)	Top-1 acc 32.812 (28.418)	Top-5 acc 57.422 (51.596)	lr 0.00964
Warmup Train [29][1380/3239]	Time 0.480 (0.516)	Data 0.001 (0.017)	Loss 4.2245 (4.1371)	Top-1 acc 25.000 (28.413)	Top-5 acc 49.609 (51.589)	lr 0.00964
Warmup Train [29][1390/3239]	Time 0.566 (0.516)	Data 0.001 (0.016)	Loss 4.0145 (4.1369)	Top-1 acc 30.469 (28.415)	Top-5 acc 55.469 (51.601)	lr 0.00963
Warmup Train [29][1400/3239]	Time 0.562 (0.516)	Data 0.001 (0.016)	Loss 4.2255 (4.1366)	Top-1 acc 28.125 (28.421)	Top-5 acc 54.297 (51.610)	lr 0.00963
Warmup Train [29][1410/3239]	Time 0.554 (0.516)	Data 0.001 (0.016)	Loss 4.2783 (4.1366)	Top-1 acc 25.391 (28.419)	Top-5 acc 48.438 (51.597)	lr 0.00962
Warmup Train [29][1420/3239]	Time 0.512 (0.516)	Data 0.001 (0.016)	Loss 4.0482 (4.1367)	Top-1 acc 27.344 (28.407)	Top-5 acc 53.906 (51.592)	lr 0.00962
Warmup Train [29][1430/3239]	Time 0.367 (0.516)	Data 0.023 (0.016)	Loss 4.0184 (4.1366)	Top-1 acc 30.469 (28.405)	Top-5 acc 51.953 (51.590)	lr 0.00961
Warmup Train [29][1440/3239]	Time 0.360 (0.516)	Data 0.001 (0.016)	Loss 4.2477 (4.1366)	Top-1 acc 30.078 (28.409)	Top-5 acc 49.609 (51.591)	lr 0.00961
Warmup Train [29][1450/3239]	Time 0.564 (0.516)	Data 0.001 (0.016)	Loss 4.0939 (4.1365)	Top-1 acc 28.906 (28.414)	Top-5 acc 53.516 (51.597)	lr 0.00960
Warmup Train [29][1460/3239]	Time 0.545 (0.516)	Data 0.001 (0.016)	Loss 4.0270 (4.1366)	Top-1 acc 31.641 (28.409)	Top-5 acc 54.688 (51.595)	lr 0.00960
Warmup Train [29][1470/3239]	Time 0.617 (0.516)	Data 0.001 (0.016)	Loss 4.1434 (4.1368)	Top-1 acc 30.859 (28.414)	Top-5 acc 52.344 (51.588)	lr 0.00959
Warmup Train [29][1480/3239]	Time 0.464 (0.516)	Data 0.001 (0.016)	Loss 4.0415 (4.1366)	Top-1 acc 27.734 (28.405)	Top-5 acc 55.469 (51.591)	lr 0.00959
Warmup Train [29][1490/3239]	Time 0.488 (0.516)	Data 0.001 (0.016)	Loss 4.1937 (4.1373)	Top-1 acc 30.078 (28.395)	Top-5 acc 50.781 (51.579)	lr 0.00958
Warmup Train [29][1500/3239]	Time 0.584 (0.516)	Data 0.001 (0.016)	Loss 4.0696 (4.1373)	Top-1 acc 30.078 (28.394)	Top-5 acc 51.953 (51.576)	lr 0.00958
Warmup Train [29][1510/3239]	Time 0.346 (0.516)	Data 0.001 (0.016)	Loss 4.2401 (4.1375)	Top-1 acc 26.172 (28.394)	Top-5 acc 47.656 (51.569)	lr 0.00958
Warmup Train [29][1520/3239]	Time 0.611 (0.516)	Data 0.001 (0.016)	Loss 4.4648 (4.1377)	Top-1 acc 25.000 (28.395)	Top-5 acc 42.969 (51.567)	lr 0.00957
Warmup Train [29][1530/3239]	Time 0.577 (0.516)	Data 0.001 (0.015)	Loss 3.9706 (4.1375)	Top-1 acc 33.984 (28.404)	Top-5 acc 56.250 (51.573)	lr 0.00957
Warmup Train [29][1540/3239]	Time 0.588 (0.516)	Data 0.001 (0.015)	Loss 3.9311 (4.1370)	Top-1 acc 33.594 (28.417)	Top-5 acc 54.688 (51.588)	lr 0.00956
Warmup Train [29][1550/3239]	Time 0.369 (0.516)	Data 0.001 (0.015)	Loss 4.5170 (4.1375)	Top-1 acc 23.047 (28.405)	Top-5 acc 40.625 (51.577)	lr 0.00956
Warmup Train [29][1560/3239]	Time 0.452 (0.516)	Data 0.001 (0.015)	Loss 4.3845 (4.1383)	Top-1 acc 26.172 (28.391)	Top-5 acc 42.578 (51.560)	lr 0.00955
Warmup Train [29][1570/3239]	Time 0.638 (0.516)	Data 0.001 (0.015)	Loss 4.0394 (4.1381)	Top-1 acc 26.172 (28.401)	Top-5 acc 55.469 (51.564)	lr 0.00955
Warmup Train [29][1580/3239]	Time 0.623 (0.516)	Data 0.001 (0.015)	Loss 4.1218 (4.1383)	Top-1 acc 27.344 (28.403)	Top-5 acc 56.250 (51.564)	lr 0.00954
Warmup Train [29][1590/3239]	Time 0.536 (0.516)	Data 0.001 (0.015)	Loss 4.0803 (4.1383)	Top-1 acc 32.422 (28.406)	Top-5 acc 55.859 (51.561)	lr 0.00954
Warmup Train [29][1600/3239]	Time 0.339 (0.516)	Data 0.001 (0.015)	Loss 4.2402 (4.1382)	Top-1 acc 29.297 (28.403)	Top-5 acc 50.781 (51.564)	lr 0.00953
Warmup Train [29][1610/3239]	Time 0.547 (0.516)	Data 0.001 (0.015)	Loss 4.1089 (4.1382)	Top-1 acc 27.344 (28.405)	Top-5 acc 53.125 (51.560)	lr 0.00953
Warmup Train [29][1620/3239]	Time 0.624 (0.516)	Data 0.001 (0.015)	Loss 3.9971 (4.1377)	Top-1 acc 30.469 (28.412)	Top-5 acc 57.031 (51.572)	lr 0.00952
Warmup Train [29][1630/3239]	Time 0.466 (0.516)	Data 0.001 (0.015)	Loss 4.2577 (4.1380)	Top-1 acc 28.906 (28.406)	Top-5 acc 48.047 (51.562)	lr 0.00952
Warmup Train [29][1640/3239]	Time 0.381 (0.515)	Data 0.001 (0.015)	Loss 4.1816 (4.1378)	Top-1 acc 30.469 (28.414)	Top-5 acc 49.609 (51.562)	lr 0.00951
Warmup Train [29][1650/3239]	Time 0.402 (0.515)	Data 0.001 (0.015)	Loss 4.2815 (4.1379)	Top-1 acc 23.438 (28.410)	Top-5 acc 48.438 (51.558)	lr 0.00951
Warmup Train [29][1660/3239]	Time 0.305 (0.515)	Data 0.001 (0.015)	Loss 4.0540 (4.1375)	Top-1 acc 31.250 (28.418)	Top-5 acc 53.125 (51.567)	lr 0.00950
Warmup Train [29][1670/3239]	Time 0.506 (0.515)	Data 0.001 (0.015)	Loss 4.2722 (4.1373)	Top-1 acc 26.172 (28.421)	Top-5 acc 49.609 (51.576)	lr 0.00950
Warmup Train [29][1680/3239]	Time 0.598 (0.515)	Data 0.001 (0.015)	Loss 4.1398 (4.1373)	Top-1 acc 24.609 (28.422)	Top-5 acc 50.000 (51.571)	lr 0.00949
Warmup Train [29][1690/3239]	Time 0.515 (0.515)	Data 0.001 (0.015)	Loss 4.1760 (4.1375)	Top-1 acc 29.688 (28.421)	Top-5 acc 50.000 (51.566)	lr 0.00949
Warmup Train [29][1700/3239]	Time 0.677 (0.515)	Data 0.001 (0.015)	Loss 4.1120 (4.1374)	Top-1 acc 29.688 (28.424)	Top-5 acc 52.734 (51.569)	lr 0.00948
Warmup Train [29][1710/3239]	Time 0.553 (0.515)	Data 0.001 (0.014)	Loss 4.1363 (4.1374)	Top-1 acc 27.734 (28.425)	Top-5 acc 49.219 (51.572)	lr 0.00948
Warmup Train [29][1720/3239]	Time 0.345 (0.515)	Data 0.001 (0.014)	Loss 3.8683 (4.1373)	Top-1 acc 34.375 (28.429)	Top-5 acc 54.688 (51.566)	lr 0.00948
Warmup Train [29][1730/3239]	Time 0.456 (0.515)	Data 0.001 (0.014)	Loss 4.2795 (4.1373)	Top-1 acc 27.344 (28.433)	Top-5 acc 46.875 (51.569)	lr 0.00947
Warmup Train [29][1740/3239]	Time 0.311 (0.515)	Data 0.001 (0.014)	Loss 4.3219 (4.1376)	Top-1 acc 24.219 (28.427)	Top-5 acc 45.312 (51.565)	lr 0.00947
Warmup Train [29][1750/3239]	Time 0.385 (0.515)	Data 0.001 (0.014)	Loss 4.0308 (4.1375)	Top-1 acc 32.812 (28.425)	Top-5 acc 51.562 (51.565)	lr 0.00946
Warmup Train [29][1760/3239]	Time 0.529 (0.515)	Data 0.001 (0.014)	Loss 4.0903 (4.1375)	Top-1 acc 32.422 (28.431)	Top-5 acc 55.078 (51.568)	lr 0.00946
Warmup Train [29][1770/3239]	Time 0.367 (0.515)	Data 0.001 (0.014)	Loss 4.1620 (4.1373)	Top-1 acc 26.953 (28.437)	Top-5 acc 48.047 (51.564)	lr 0.00945
Warmup Train [29][1780/3239]	Time 0.541 (0.515)	Data 0.001 (0.014)	Loss 4.1922 (4.1373)	Top-1 acc 28.906 (28.436)	Top-5 acc 54.297 (51.565)	lr 0.00945
Warmup Train [29][1790/3239]	Time 0.433 (0.515)	Data 0.001 (0.014)	Loss 4.2767 (4.1374)	Top-1 acc 25.781 (28.435)	Top-5 acc 47.656 (51.559)	lr 0.00944
Warmup Train [29][1800/3239]	Time 0.415 (0.515)	Data 0.001 (0.014)	Loss 4.0884 (4.1373)	Top-1 acc 31.250 (28.442)	Top-5 acc 53.906 (51.556)	lr 0.00944
Warmup Train [29][1810/3239]	Time 0.482 (0.515)	Data 0.001 (0.014)	Loss 4.1986 (4.1372)	Top-1 acc 27.734 (28.445)	Top-5 acc 51.953 (51.564)	lr 0.00943
Warmup Train [29][1820/3239]	Time 0.380 (0.515)	Data 0.001 (0.014)	Loss 4.2659 (4.1370)	Top-1 acc 27.344 (28.448)	Top-5 acc 47.266 (51.569)	lr 0.00943
Warmup Train [29][1830/3239]	Time 0.523 (0.515)	Data 0.001 (0.014)	Loss 4.0367 (4.1367)	Top-1 acc 30.469 (28.456)	Top-5 acc 53.125 (51.571)	lr 0.00942
Warmup Train [29][1840/3239]	Time 0.430 (0.515)	Data 0.001 (0.014)	Loss 4.1362 (4.1364)	Top-1 acc 27.344 (28.460)	Top-5 acc 50.781 (51.574)	lr 0.00942
Warmup Train [29][1850/3239]	Time 0.623 (0.515)	Data 0.001 (0.014)	Loss 4.2861 (4.1367)	Top-1 acc 23.047 (28.448)	Top-5 acc 44.531 (51.562)	lr 0.00941
Warmup Train [29][1860/3239]	Time 0.676 (0.515)	Data 0.001 (0.014)	Loss 4.0565 (4.1364)	Top-1 acc 30.469 (28.452)	Top-5 acc 55.078 (51.571)	lr 0.00941
Warmup Train [29][1870/3239]	Time 0.514 (0.515)	Data 0.001 (0.014)	Loss 4.1889 (4.1363)	Top-1 acc 29.688 (28.455)	Top-5 acc 48.828 (51.566)	lr 0.00940
Warmup Train [29][1880/3239]	Time 0.526 (0.515)	Data 0.001 (0.014)	Loss 4.2363 (4.1360)	Top-1 acc 26.172 (28.461)	Top-5 acc 47.656 (51.573)	lr 0.00940
Warmup Train [29][1890/3239]	Time 0.409 (0.515)	Data 0.001 (0.014)	Loss 4.1592 (4.1361)	Top-1 acc 29.688 (28.457)	Top-5 acc 51.172 (51.572)	lr 0.00939
Warmup Train [29][1900/3239]	Time 0.663 (0.515)	Data 0.001 (0.014)	Loss 4.0450 (4.1361)	Top-1 acc 29.688 (28.457)	Top-5 acc 57.031 (51.573)	lr 0.00939
Warmup Train [29][1910/3239]	Time 0.635 (0.515)	Data 0.001 (0.014)	Loss 4.2284 (4.1360)	Top-1 acc 25.781 (28.457)	Top-5 acc 48.828 (51.576)	lr 0.00939
Warmup Train [29][1920/3239]	Time 0.518 (0.514)	Data 0.001 (0.014)	Loss 4.2955 (4.1358)	Top-1 acc 25.000 (28.460)	Top-5 acc 49.609 (51.582)	lr 0.00938
Warmup Train [29][1930/3239]	Time 0.500 (0.514)	Data 0.002 (0.014)	Loss 4.1944 (4.1356)	Top-1 acc 25.391 (28.463)	Top-5 acc 50.000 (51.589)	lr 0.00938
Warmup Train [29][1940/3239]	Time 0.362 (0.514)	Data 0.001 (0.014)	Loss 4.4446 (4.1360)	Top-1 acc 23.828 (28.451)	Top-5 acc 47.266 (51.577)	lr 0.00937
Warmup Train [29][1950/3239]	Time 0.472 (0.514)	Data 0.001 (0.014)	Loss 4.0997 (4.1360)	Top-1 acc 25.781 (28.445)	Top-5 acc 50.391 (51.573)	lr 0.00937
Warmup Train [29][1960/3239]	Time 0.710 (0.514)	Data 0.002 (0.014)	Loss 4.0509 (4.1359)	Top-1 acc 35.156 (28.450)	Top-5 acc 53.516 (51.575)	lr 0.00936
Warmup Train [29][1970/3239]	Time 0.477 (0.514)	Data 0.001 (0.014)	Loss 4.2424 (4.1358)	Top-1 acc 26.562 (28.452)	Top-5 acc 51.172 (51.577)	lr 0.00936
Warmup Train [29][1980/3239]	Time 0.623 (0.514)	Data 0.001 (0.014)	Loss 4.1865 (4.1358)	Top-1 acc 26.953 (28.451)	Top-5 acc 50.391 (51.580)	lr 0.00935
Warmup Train [29][1990/3239]	Time 0.586 (0.514)	Data 0.001 (0.013)	Loss 4.0252 (4.1354)	Top-1 acc 32.422 (28.459)	Top-5 acc 51.172 (51.589)	lr 0.00935
Warmup Train [29][2000/3239]	Time 0.647 (0.514)	Data 0.001 (0.013)	Loss 4.1625 (4.1356)	Top-1 acc 28.125 (28.456)	Top-5 acc 53.125 (51.584)	lr 0.00934
Warmup Train [29][2010/3239]	Time 0.480 (0.514)	Data 0.001 (0.013)	Loss 4.2141 (4.1359)	Top-1 acc 26.953 (28.448)	Top-5 acc 52.734 (51.579)	lr 0.00934
Warmup Train [29][2020/3239]	Time 0.552 (0.514)	Data 0.001 (0.013)	Loss 3.7508 (4.1359)	Top-1 acc 39.062 (28.460)	Top-5 acc 59.766 (51.583)	lr 0.00933
Warmup Train [29][2030/3239]	Time 0.384 (0.514)	Data 0.001 (0.013)	Loss 4.3646 (4.1358)	Top-1 acc 25.391 (28.460)	Top-5 acc 46.484 (51.581)	lr 0.00933
Warmup Train [29][2040/3239]	Time 0.600 (0.514)	Data 0.001 (0.013)	Loss 4.0400 (4.1356)	Top-1 acc 30.078 (28.457)	Top-5 acc 55.859 (51.589)	lr 0.00932
Warmup Train [29][2050/3239]	Time 0.611 (0.514)	Data 0.001 (0.013)	Loss 4.2157 (4.1357)	Top-1 acc 28.516 (28.461)	Top-5 acc 51.562 (51.593)	lr 0.00932
Warmup Train [29][2060/3239]	Time 0.644 (0.514)	Data 0.001 (0.013)	Loss 4.0912 (4.1357)	Top-1 acc 30.469 (28.460)	Top-5 acc 48.438 (51.591)	lr 0.00931
Warmup Train [29][2070/3239]	Time 0.621 (0.514)	Data 0.001 (0.013)	Loss 3.9795 (4.1358)	Top-1 acc 28.906 (28.456)	Top-5 acc 52.344 (51.586)	lr 0.00931
Warmup Train [29][2080/3239]	Time 0.512 (0.514)	Data 0.001 (0.013)	Loss 3.9540 (4.1358)	Top-1 acc 34.375 (28.458)	Top-5 acc 58.594 (51.588)	lr 0.00930
Warmup Train [29][2090/3239]	Time 0.532 (0.514)	Data 0.001 (0.013)	Loss 4.2965 (4.1358)	Top-1 acc 26.172 (28.459)	Top-5 acc 47.266 (51.589)	lr 0.00930
Warmup Train [29][2100/3239]	Time 0.417 (0.514)	Data 0.001 (0.013)	Loss 4.1502 (4.1357)	Top-1 acc 25.391 (28.458)	Top-5 acc 53.516 (51.594)	lr 0.00930
Warmup Train [29][2110/3239]	Time 0.399 (0.514)	Data 0.001 (0.013)	Loss 4.0377 (4.1354)	Top-1 acc 33.203 (28.462)	Top-5 acc 54.688 (51.601)	lr 0.00929
Warmup Train [29][2120/3239]	Time 0.594 (0.514)	Data 0.001 (0.013)	Loss 4.1548 (4.1354)	Top-1 acc 28.906 (28.461)	Top-5 acc 51.953 (51.600)	lr 0.00929
Warmup Train [29][2130/3239]	Time 0.616 (0.514)	Data 0.001 (0.013)	Loss 4.0655 (4.1352)	Top-1 acc 28.906 (28.466)	Top-5 acc 51.953 (51.605)	lr 0.00928
Warmup Train [29][2140/3239]	Time 0.517 (0.514)	Data 0.001 (0.013)	Loss 4.0168 (4.1351)	Top-1 acc 30.859 (28.467)	Top-5 acc 51.953 (51.601)	lr 0.00928
Warmup Train [29][2150/3239]	Time 0.643 (0.514)	Data 0.001 (0.013)	Loss 4.0102 (4.1352)	Top-1 acc 30.469 (28.462)	Top-5 acc 57.422 (51.600)	lr 0.00927
Warmup Train [29][2160/3239]	Time 0.472 (0.514)	Data 0.001 (0.013)	Loss 4.2438 (4.1352)	Top-1 acc 24.219 (28.461)	Top-5 acc 48.828 (51.603)	lr 0.00927
Warmup Train [29][2170/3239]	Time 0.307 (0.514)	Data 0.001 (0.013)	Loss 4.2674 (4.1349)	Top-1 acc 25.000 (28.470)	Top-5 acc 46.484 (51.607)	lr 0.00926
Warmup Train [29][2180/3239]	Time 0.376 (0.513)	Data 0.001 (0.013)	Loss 4.1894 (4.1348)	Top-1 acc 26.172 (28.465)	Top-5 acc 49.219 (51.608)	lr 0.00926
Warmup Train [29][2190/3239]	Time 0.461 (0.513)	Data 0.001 (0.013)	Loss 4.1916 (4.1351)	Top-1 acc 26.953 (28.459)	Top-5 acc 47.656 (51.601)	lr 0.00925
Warmup Train [29][2200/3239]	Time 0.588 (0.513)	Data 0.001 (0.013)	Loss 4.0304 (4.1350)	Top-1 acc 31.641 (28.467)	Top-5 acc 54.688 (51.609)	lr 0.00925
Warmup Train [29][2210/3239]	Time 0.358 (0.513)	Data 0.001 (0.013)	Loss 4.0949 (4.1348)	Top-1 acc 28.125 (28.470)	Top-5 acc 52.734 (51.614)	lr 0.00924
Warmup Train [29][2220/3239]	Time 0.445 (0.513)	Data 0.001 (0.013)	Loss 4.0920 (4.1347)	Top-1 acc 26.562 (28.472)	Top-5 acc 52.344 (51.617)	lr 0.00924
Warmup Train [29][2230/3239]	Time 0.417 (0.513)	Data 0.001 (0.013)	Loss 4.2994 (4.1346)	Top-1 acc 26.172 (28.469)	Top-5 acc 48.438 (51.618)	lr 0.00923
Warmup Train [29][2240/3239]	Time 0.517 (0.513)	Data 0.001 (0.013)	Loss 4.2896 (4.1349)	Top-1 acc 23.828 (28.462)	Top-5 acc 48.828 (51.609)	lr 0.00923
Warmup Train [29][2250/3239]	Time 0.608 (0.513)	Data 0.001 (0.013)	Loss 4.1295 (4.1347)	Top-1 acc 29.297 (28.467)	Top-5 acc 54.688 (51.614)	lr 0.00922
Warmup Train [29][2260/3239]	Time 0.575 (0.513)	Data 0.001 (0.013)	Loss 4.0154 (4.1345)	Top-1 acc 29.688 (28.475)	Top-5 acc 53.516 (51.617)	lr 0.00922
Warmup Train [29][2270/3239]	Time 0.398 (0.513)	Data 0.001 (0.013)	Loss 3.9390 (4.1342)	Top-1 acc 32.422 (28.473)	Top-5 acc 58.203 (51.625)	lr 0.00922
Warmup Train [29][2280/3239]	Time 0.439 (0.513)	Data 0.001 (0.013)	Loss 4.1617 (4.1343)	Top-1 acc 27.344 (28.474)	Top-5 acc 50.391 (51.620)	lr 0.00921
Warmup Train [29][2290/3239]	Time 0.513 (0.513)	Data 0.001 (0.013)	Loss 4.1554 (4.1341)	Top-1 acc 31.641 (28.482)	Top-5 acc 53.906 (51.629)	lr 0.00921
Warmup Train [29][2300/3239]	Time 0.670 (0.513)	Data 0.001 (0.013)	Loss 3.9937 (4.1344)	Top-1 acc 31.641 (28.482)	Top-5 acc 52.734 (51.621)	lr 0.00920
Warmup Train [29][2310/3239]	Time 0.598 (0.513)	Data 0.001 (0.013)	Loss 4.0675 (4.1343)	Top-1 acc 28.516 (28.490)	Top-5 acc 52.344 (51.624)	lr 0.00920
Warmup Train [29][2320/3239]	Time 0.402 (0.513)	Data 0.001 (0.013)	Loss 4.2702 (4.1344)	Top-1 acc 28.125 (28.488)	Top-5 acc 48.828 (51.617)	lr 0.00919
Warmup Train [29][2330/3239]	Time 0.382 (0.513)	Data 0.001 (0.013)	Loss 4.1574 (4.1342)	Top-1 acc 26.953 (28.492)	Top-5 acc 50.000 (51.623)	lr 0.00919
Warmup Train [29][2340/3239]	Time 0.617 (0.513)	Data 0.001 (0.013)	Loss 4.2065 (4.1338)	Top-1 acc 24.609 (28.493)	Top-5 acc 51.172 (51.635)	lr 0.00918
Warmup Train [29][2350/3239]	Time 0.289 (0.513)	Data 0.001 (0.013)	Loss 4.3289 (4.1338)	Top-1 acc 27.344 (28.488)	Top-5 acc 49.609 (51.634)	lr 0.00918
Warmup Train [29][2360/3239]	Time 0.653 (0.513)	Data 0.001 (0.013)	Loss 4.1418 (4.1339)	Top-1 acc 28.906 (28.488)	Top-5 acc 49.609 (51.631)	lr 0.00917
Warmup Train [29][2370/3239]	Time 0.653 (0.513)	Data 0.001 (0.012)	Loss 4.0477 (4.1339)	Top-1 acc 31.250 (28.489)	Top-5 acc 57.031 (51.636)	lr 0.00917
Warmup Train [29][2380/3239]	Time 0.549 (0.513)	Data 0.001 (0.012)	Loss 4.1064 (4.1339)	Top-1 acc 31.641 (28.492)	Top-5 acc 51.562 (51.633)	lr 0.00916
Warmup Train [29][2390/3239]	Time 0.498 (0.513)	Data 0.001 (0.012)	Loss 4.1144 (4.1339)	Top-1 acc 30.078 (28.488)	Top-5 acc 51.172 (51.632)	lr 0.00916
Warmup Train [29][2400/3239]	Time 0.488 (0.513)	Data 0.001 (0.012)	Loss 4.0893 (4.1337)	Top-1 acc 28.906 (28.488)	Top-5 acc 50.781 (51.632)	lr 0.00915
Warmup Train [29][2410/3239]	Time 0.609 (0.513)	Data 0.001 (0.012)	Loss 3.8600 (4.1337)	Top-1 acc 33.984 (28.493)	Top-5 acc 55.469 (51.635)	lr 0.00915
Warmup Train [29][2420/3239]	Time 0.372 (0.513)	Data 0.001 (0.012)	Loss 4.0023 (4.1335)	Top-1 acc 34.766 (28.500)	Top-5 acc 55.859 (51.639)	lr 0.00914
Warmup Train [29][2430/3239]	Time 0.292 (0.513)	Data 0.001 (0.012)	Loss 4.1718 (4.1334)	Top-1 acc 26.562 (28.503)	Top-5 acc 48.438 (51.641)	lr 0.00914
Warmup Train [29][2440/3239]	Time 0.636 (0.513)	Data 0.001 (0.012)	Loss 4.0929 (4.1335)	Top-1 acc 30.078 (28.496)	Top-5 acc 50.391 (51.638)	lr 0.00914
Warmup Train [29][2450/3239]	Time 0.514 (0.513)	Data 0.001 (0.012)	Loss 4.0658 (4.1336)	Top-1 acc 33.203 (28.494)	Top-5 acc 53.125 (51.636)	lr 0.00913
Warmup Train [29][2460/3239]	Time 0.593 (0.513)	Data 0.001 (0.012)	Loss 4.1570 (4.1335)	Top-1 acc 27.344 (28.496)	Top-5 acc 49.609 (51.634)	lr 0.00913
Warmup Train [29][2470/3239]	Time 0.313 (0.513)	Data 0.001 (0.012)	Loss 4.2861 (4.1334)	Top-1 acc 26.562 (28.499)	Top-5 acc 46.094 (51.634)	lr 0.00912
Warmup Train [29][2480/3239]	Time 0.414 (0.513)	Data 0.001 (0.012)	Loss 4.1055 (4.1335)	Top-1 acc 30.078 (28.500)	Top-5 acc 55.078 (51.638)	lr 0.00912
Warmup Train [29][2490/3239]	Time 0.508 (0.513)	Data 0.001 (0.012)	Loss 4.2849 (4.1335)	Top-1 acc 26.953 (28.493)	Top-5 acc 51.172 (51.638)	lr 0.00911
Warmup Train [29][2500/3239]	Time 0.481 (0.513)	Data 0.001 (0.012)	Loss 4.0645 (4.1337)	Top-1 acc 27.734 (28.487)	Top-5 acc 51.562 (51.631)	lr 0.00911
Warmup Train [29][2510/3239]	Time 0.669 (0.513)	Data 0.001 (0.012)	Loss 3.9638 (4.1338)	Top-1 acc 32.422 (28.488)	Top-5 acc 58.203 (51.632)	lr 0.00910
Warmup Train [29][2520/3239]	Time 0.505 (0.513)	Data 0.001 (0.012)	Loss 4.2943 (4.1339)	Top-1 acc 24.219 (28.487)	Top-5 acc 44.922 (51.631)	lr 0.00910
Warmup Train [29][2530/3239]	Time 0.415 (0.513)	Data 0.001 (0.012)	Loss 4.0138 (4.1339)	Top-1 acc 32.031 (28.482)	Top-5 acc 55.078 (51.630)	lr 0.00909
Warmup Train [29][2540/3239]	Time 0.470 (0.513)	Data 0.001 (0.012)	Loss 3.9865 (4.1340)	Top-1 acc 34.375 (28.477)	Top-5 acc 57.031 (51.623)	lr 0.00909
Warmup Train [29][2550/3239]	Time 0.353 (0.512)	Data 0.002 (0.012)	Loss 4.0816 (4.1339)	Top-1 acc 28.906 (28.484)	Top-5 acc 52.344 (51.626)	lr 0.00908
Warmup Train [29][2560/3239]	Time 0.461 (0.512)	Data 0.001 (0.012)	Loss 4.0161 (4.1339)	Top-1 acc 30.859 (28.487)	Top-5 acc 54.688 (51.625)	lr 0.00908
Warmup Train [29][2570/3239]	Time 0.477 (0.512)	Data 0.001 (0.012)	Loss 4.3759 (4.1341)	Top-1 acc 25.391 (28.485)	Top-5 acc 46.875 (51.620)	lr 0.00907
Warmup Train [29][2580/3239]	Time 0.651 (0.512)	Data 0.001 (0.012)	Loss 4.0447 (4.1343)	Top-1 acc 34.766 (28.477)	Top-5 acc 58.594 (51.614)	lr 0.00907
Warmup Train [29][2590/3239]	Time 0.499 (0.512)	Data 0.001 (0.012)	Loss 4.0323 (4.1343)	Top-1 acc 32.031 (28.481)	Top-5 acc 52.734 (51.611)	lr 0.00907
Warmup Train [29][2600/3239]	Time 0.498 (0.513)	Data 0.001 (0.012)	Loss 4.1762 (4.1346)	Top-1 acc 26.562 (28.477)	Top-5 acc 50.000 (51.606)	lr 0.00906
Warmup Train [29][2610/3239]	Time 0.538 (0.513)	Data 0.001 (0.012)	Loss 4.0804 (4.1347)	Top-1 acc 26.562 (28.474)	Top-5 acc 52.734 (51.603)	lr 0.00906
Warmup Train [29][2620/3239]	Time 0.576 (0.512)	Data 0.001 (0.012)	Loss 4.1367 (4.1347)	Top-1 acc 26.953 (28.474)	Top-5 acc 51.172 (51.605)	lr 0.00905
Warmup Train [29][2630/3239]	Time 0.527 (0.513)	Data 0.001 (0.012)	Loss 4.1551 (4.1347)	Top-1 acc 28.906 (28.474)	Top-5 acc 47.656 (51.603)	lr 0.00905
Warmup Train [29][2640/3239]	Time 0.651 (0.513)	Data 0.001 (0.012)	Loss 4.0134 (4.1348)	Top-1 acc 28.125 (28.478)	Top-5 acc 53.125 (51.601)	lr 0.00904
Warmup Train [29][2650/3239]	Time 0.434 (0.513)	Data 0.001 (0.012)	Loss 4.1420 (4.1349)	Top-1 acc 30.469 (28.476)	Top-5 acc 50.000 (51.598)	lr 0.00904
Warmup Train [29][2660/3239]	Time 0.491 (0.512)	Data 0.001 (0.012)	Loss 4.0210 (4.1348)	Top-1 acc 32.422 (28.478)	Top-5 acc 55.078 (51.606)	lr 0.00903
Warmup Train [29][2670/3239]	Time 0.372 (0.513)	Data 0.001 (0.012)	Loss 4.0177 (4.1347)	Top-1 acc 33.594 (28.479)	Top-5 acc 54.688 (51.607)	lr 0.00903
Warmup Train [29][2680/3239]	Time 0.355 (0.513)	Data 0.001 (0.012)	Loss 4.0600 (4.1346)	Top-1 acc 31.641 (28.484)	Top-5 acc 51.172 (51.605)	lr 0.00902
Warmup Train [29][2690/3239]	Time 0.537 (0.513)	Data 0.001 (0.012)	Loss 3.9597 (4.1344)	Top-1 acc 32.422 (28.488)	Top-5 acc 55.469 (51.609)	lr 0.00902
Warmup Train [29][2700/3239]	Time 0.672 (0.513)	Data 0.001 (0.012)	Loss 3.9535 (4.1343)	Top-1 acc 33.594 (28.494)	Top-5 acc 57.422 (51.614)	lr 0.00901
Warmup Train [29][2710/3239]	Time 0.488 (0.513)	Data 0.001 (0.012)	Loss 3.9419 (4.1341)	Top-1 acc 32.812 (28.498)	Top-5 acc 54.688 (51.620)	lr 0.00901
Warmup Train [29][2720/3239]	Time 0.607 (0.513)	Data 0.001 (0.012)	Loss 4.0632 (4.1341)	Top-1 acc 33.203 (28.499)	Top-5 acc 57.422 (51.620)	lr 0.00900
Warmup Train [29][2730/3239]	Time 0.395 (0.513)	Data 0.001 (0.012)	Loss 4.2471 (4.1340)	Top-1 acc 26.953 (28.500)	Top-5 acc 48.828 (51.621)	lr 0.00900
Warmup Train [29][2740/3239]	Time 0.514 (0.513)	Data 0.001 (0.012)	Loss 4.2393 (4.1342)	Top-1 acc 28.516 (28.496)	Top-5 acc 50.000 (51.616)	lr 0.00900
Warmup Train [29][2750/3239]	Time 0.603 (0.513)	Data 0.001 (0.012)	Loss 3.9820 (4.1341)	Top-1 acc 28.906 (28.495)	Top-5 acc 51.172 (51.617)	lr 0.00899
Warmup Train [29][2760/3239]	Time 0.519 (0.513)	Data 0.001 (0.012)	Loss 4.0421 (4.1341)	Top-1 acc 33.984 (28.503)	Top-5 acc 54.297 (51.613)	lr 0.00899
Warmup Train [29][2770/3239]	Time 0.542 (0.512)	Data 0.001 (0.012)	Loss 4.1715 (4.1340)	Top-1 acc 29.297 (28.509)	Top-5 acc 49.219 (51.617)	lr 0.00898
Warmup Train [29][2780/3239]	Time 0.506 (0.512)	Data 0.001 (0.012)	Loss 4.1337 (4.1341)	Top-1 acc 27.344 (28.509)	Top-5 acc 51.172 (51.614)	lr 0.00898
Warmup Train [29][2790/3239]	Time 0.550 (0.512)	Data 0.001 (0.012)	Loss 4.1480 (4.1340)	Top-1 acc 29.688 (28.511)	Top-5 acc 50.000 (51.612)	lr 0.00897
Warmup Train [29][2800/3239]	Time 0.712 (0.512)	Data 0.001 (0.012)	Loss 4.0973 (4.1342)	Top-1 acc 30.859 (28.510)	Top-5 acc 53.906 (51.607)	lr 0.00897
Warmup Train [29][2810/3239]	Time 0.529 (0.513)	Data 0.002 (0.012)	Loss 4.1509 (4.1339)	Top-1 acc 28.516 (28.515)	Top-5 acc 50.391 (51.611)	lr 0.00896
Warmup Train [29][2820/3239]	Time 0.388 (0.512)	Data 0.001 (0.012)	Loss 4.1499 (4.1340)	Top-1 acc 25.781 (28.513)	Top-5 acc 51.562 (51.612)	lr 0.00896
Warmup Train [29][2830/3239]	Time 0.398 (0.513)	Data 0.001 (0.012)	Loss 4.2265 (4.1340)	Top-1 acc 29.688 (28.514)	Top-5 acc 50.000 (51.611)	lr 0.00895
Warmup Train [29][2840/3239]	Time 0.458 (0.513)	Data 0.001 (0.012)	Loss 4.0508 (4.1339)	Top-1 acc 28.906 (28.515)	Top-5 acc 50.781 (51.608)	lr 0.00895
Warmup Train [29][2850/3239]	Time 0.539 (0.513)	Data 0.001 (0.012)	Loss 4.0763 (4.1339)	Top-1 acc 28.906 (28.515)	Top-5 acc 55.469 (51.609)	lr 0.00894
Warmup Train [29][2860/3239]	Time 0.481 (0.512)	Data 0.001 (0.012)	Loss 4.0954 (4.1339)	Top-1 acc 28.906 (28.515)	Top-5 acc 55.469 (51.606)	lr 0.00894
Warmup Train [29][2870/3239]	Time 0.535 (0.513)	Data 0.001 (0.012)	Loss 4.1071 (4.1336)	Top-1 acc 32.422 (28.521)	Top-5 acc 51.562 (51.612)	lr 0.00893
Warmup Train [29][2880/3239]	Time 0.517 (0.513)	Data 0.001 (0.011)	Loss 4.1824 (4.1337)	Top-1 acc 28.125 (28.521)	Top-5 acc 50.391 (51.609)	lr 0.00893
Warmup Train [29][2890/3239]	Time 0.688 (0.513)	Data 0.001 (0.011)	Loss 4.1170 (4.1336)	Top-1 acc 32.031 (28.523)	Top-5 acc 52.734 (51.608)	lr 0.00893
Warmup Train [29][2900/3239]	Time 0.336 (0.513)	Data 0.001 (0.011)	Loss 4.1494 (4.1339)	Top-1 acc 27.344 (28.516)	Top-5 acc 49.609 (51.604)	lr 0.00892
Warmup Train [29][2910/3239]	Time 0.590 (0.513)	Data 0.001 (0.011)	Loss 4.1798 (4.1340)	Top-1 acc 30.859 (28.519)	Top-5 acc 50.391 (51.602)	lr 0.00892
Warmup Train [29][2920/3239]	Time 0.618 (0.513)	Data 0.001 (0.011)	Loss 3.9567 (4.1337)	Top-1 acc 32.422 (28.525)	Top-5 acc 58.984 (51.610)	lr 0.00891
Warmup Train [29][2930/3239]	Time 0.281 (0.513)	Data 0.001 (0.011)	Loss 3.9359 (4.1335)	Top-1 acc 32.422 (28.528)	Top-5 acc 56.641 (51.612)	lr 0.00891
Warmup Train [29][2940/3239]	Time 0.497 (0.513)	Data 0.001 (0.011)	Loss 4.4443 (4.1336)	Top-1 acc 22.656 (28.529)	Top-5 acc 47.266 (51.612)	lr 0.00890
Warmup Train [29][2950/3239]	Time 0.635 (0.513)	Data 0.001 (0.011)	Loss 4.0788 (4.1335)	Top-1 acc 28.125 (28.528)	Top-5 acc 51.562 (51.614)	lr 0.00890
Warmup Train [29][2960/3239]	Time 0.567 (0.513)	Data 0.001 (0.011)	Loss 4.1197 (4.1336)	Top-1 acc 32.812 (28.526)	Top-5 acc 50.781 (51.608)	lr 0.00889
Warmup Train [29][2970/3239]	Time 0.578 (0.513)	Data 0.001 (0.011)	Loss 4.0978 (4.1336)	Top-1 acc 30.469 (28.526)	Top-5 acc 51.172 (51.608)	lr 0.00889
Warmup Train [29][2980/3239]	Time 0.513 (0.512)	Data 0.001 (0.011)	Loss 3.9854 (4.1334)	Top-1 acc 31.641 (28.531)	Top-5 acc 56.250 (51.614)	lr 0.00888
Warmup Train [29][2990/3239]	Time 0.480 (0.512)	Data 0.001 (0.011)	Loss 4.2235 (4.1336)	Top-1 acc 29.297 (28.529)	Top-5 acc 51.172 (51.611)	lr 0.00888
Warmup Train [29][3000/3239]	Time 0.534 (0.513)	Data 0.001 (0.011)	Loss 4.0120 (4.1336)	Top-1 acc 30.469 (28.530)	Top-5 acc 57.031 (51.612)	lr 0.00887
Warmup Train [29][3010/3239]	Time 0.607 (0.512)	Data 0.001 (0.011)	Loss 4.1718 (4.1338)	Top-1 acc 28.125 (28.526)	Top-5 acc 52.734 (51.608)	lr 0.00887
Warmup Train [29][3020/3239]	Time 0.508 (0.512)	Data 0.001 (0.011)	Loss 4.4284 (4.1342)	Top-1 acc 21.875 (28.521)	Top-5 acc 48.828 (51.603)	lr 0.00887
Warmup Train [29][3030/3239]	Time 0.381 (0.512)	Data 0.001 (0.011)	Loss 4.2860 (4.1341)	Top-1 acc 26.562 (28.522)	Top-5 acc 46.094 (51.605)	lr 0.00886
Warmup Train [29][3040/3239]	Time 0.371 (0.512)	Data 0.001 (0.011)	Loss 4.0865 (4.1341)	Top-1 acc 28.516 (28.524)	Top-5 acc 48.828 (51.604)	lr 0.00886
Warmup Train [29][3050/3239]	Time 0.480 (0.512)	Data 0.001 (0.011)	Loss 4.2822 (4.1343)	Top-1 acc 24.219 (28.522)	Top-5 acc 49.609 (51.598)	lr 0.00885
Warmup Train [29][3060/3239]	Time 0.540 (0.512)	Data 0.001 (0.011)	Loss 3.9685 (4.1341)	Top-1 acc 30.078 (28.525)	Top-5 acc 53.906 (51.603)	lr 0.00885
Warmup Train [29][3070/3239]	Time 0.402 (0.512)	Data 0.001 (0.011)	Loss 4.2166 (4.1340)	Top-1 acc 31.641 (28.526)	Top-5 acc 47.656 (51.605)	lr 0.00884
Warmup Train [29][3080/3239]	Time 0.463 (0.512)	Data 0.001 (0.011)	Loss 4.2343 (4.1341)	Top-1 acc 26.562 (28.530)	Top-5 acc 48.438 (51.602)	lr 0.00884
Warmup Train [29][3090/3239]	Time 0.505 (0.512)	Data 0.001 (0.011)	Loss 4.2138 (4.1341)	Top-1 acc 26.172 (28.526)	Top-5 acc 51.172 (51.602)	lr 0.00883
Warmup Train [29][3100/3239]	Time 0.670 (0.512)	Data 0.001 (0.011)	Loss 4.2000 (4.1342)	Top-1 acc 25.391 (28.524)	Top-5 acc 49.219 (51.604)	lr 0.00883
Warmup Train [29][3110/3239]	Time 0.402 (0.512)	Data 0.001 (0.011)	Loss 4.0543 (4.1342)	Top-1 acc 29.297 (28.524)	Top-5 acc 51.562 (51.607)	lr 0.00882
Warmup Train [29][3120/3239]	Time 0.536 (0.512)	Data 0.001 (0.011)	Loss 4.0377 (4.1341)	Top-1 acc 28.906 (28.527)	Top-5 acc 50.781 (51.610)	lr 0.00882
Warmup Train [29][3130/3239]	Time 0.417 (0.512)	Data 0.001 (0.011)	Loss 3.9642 (4.1339)	Top-1 acc 33.984 (28.531)	Top-5 acc 55.859 (51.613)	lr 0.00881
Warmup Train [29][3140/3239]	Time 0.488 (0.512)	Data 0.001 (0.011)	Loss 3.9037 (4.1339)	Top-1 acc 30.078 (28.530)	Top-5 acc 56.250 (51.615)	lr 0.00881
Warmup Train [29][3150/3239]	Time 0.323 (0.512)	Data 0.001 (0.011)	Loss 4.3701 (4.1338)	Top-1 acc 25.000 (28.530)	Top-5 acc 45.703 (51.617)	lr 0.00881
Warmup Train [29][3160/3239]	Time 0.365 (0.512)	Data 0.001 (0.011)	Loss 4.0912 (4.1338)	Top-1 acc 28.125 (28.529)	Top-5 acc 54.297 (51.617)	lr 0.00880
Warmup Train [29][3170/3239]	Time 0.515 (0.512)	Data 0.001 (0.011)	Loss 4.2563 (4.1340)	Top-1 acc 29.297 (28.527)	Top-5 acc 50.391 (51.617)	lr 0.00880
Warmup Train [29][3180/3239]	Time 0.472 (0.512)	Data 0.000 (0.011)	Loss 4.2999 (4.1338)	Top-1 acc 25.391 (28.532)	Top-5 acc 49.219 (51.620)	lr 0.00879
Warmup Train [29][3190/3239]	Time 0.536 (0.512)	Data 0.000 (0.011)	Loss 4.1222 (4.1337)	Top-1 acc 32.422 (28.533)	Top-5 acc 48.828 (51.624)	lr 0.00879
Warmup Train [29][3200/3239]	Time 0.483 (0.512)	Data 0.000 (0.011)	Loss 4.2551 (4.1337)	Top-1 acc 25.781 (28.535)	Top-5 acc 48.438 (51.626)	lr 0.00878
Warmup Train [29][3210/3239]	Time 0.628 (0.512)	Data 0.000 (0.011)	Loss 4.3003 (4.1334)	Top-1 acc 27.344 (28.541)	Top-5 acc 48.828 (51.633)	lr 0.00878
Warmup Train [29][3220/3239]	Time 0.491 (0.512)	Data 0.000 (0.011)	Loss 4.2095 (4.1335)	Top-1 acc 28.516 (28.538)	Top-5 acc 50.000 (51.633)	lr 0.00877
Warmup Train [29][3230/3239]	Time 0.500 (0.512)	Data 0.000 (0.011)	Loss 4.1773 (4.1334)	Top-1 acc 23.438 (28.536)	Top-5 acc 51.953 (51.638)	lr 0.00877
Warmup Train [29][3239/3239]	Time 0.402 (0.512)	Data 0.000 (0.011)	Loss 4.0362 (4.1334)	Top-1 acc 33.333 (28.540)	Top-5 acc 53.086 (51.639)	lr 0.00876
==========Warmup Valid [29/40]	loss 3.072	top-1 acc 36.089	top-5 acc 61.104	Train top-1 28.540	top-5 51.639	flops: 442.4M
Warmup Train [30][0/3239]	Time 17.591 (17.591)	Data 14.236 (14.236)	Loss 4.2904 (4.2904)	Top-1 acc 26.172 (26.172)	Top-5 acc 50.000 (50.000)	lr 0.00876
Warmup Train [30][10/3239]	Time 0.337 (2.106)	Data 0.001 (1.300)	Loss 3.9396 (4.0887)	Top-1 acc 31.250 (29.652)	Top-5 acc 56.250 (52.486)	lr 0.00876
Warmup Train [30][20/3239]	Time 0.548 (1.341)	Data 0.002 (0.690)	Loss 4.2378 (4.1231)	Top-1 acc 27.734 (28.553)	Top-5 acc 48.047 (51.860)	lr 0.00875
Warmup Train [30][30/3239]	Time 0.714 (1.090)	Data 0.001 (0.468)	Loss 3.9748 (4.1050)	Top-1 acc 29.297 (29.020)	Top-5 acc 53.906 (52.243)	lr 0.00875
Warmup Train [30][40/3239]	Time 0.453 (0.947)	Data 0.001 (0.355)	Loss 3.9143 (4.0920)	Top-1 acc 31.250 (29.240)	Top-5 acc 58.203 (52.611)	lr 0.00875
Warmup Train [30][50/3239]	Time 0.553 (0.861)	Data 0.001 (0.285)	Loss 4.1278 (4.0962)	Top-1 acc 30.859 (29.082)	Top-5 acc 52.734 (52.436)	lr 0.00874
Warmup Train [30][60/3239]	Time 0.470 (0.801)	Data 0.001 (0.239)	Loss 3.8732 (4.0962)	Top-1 acc 35.547 (29.015)	Top-5 acc 58.984 (52.536)	lr 0.00874
Warmup Train [30][70/3239]	Time 0.469 (0.760)	Data 0.002 (0.208)	Loss 4.0326 (4.0899)	Top-1 acc 31.641 (29.198)	Top-5 acc 53.125 (52.602)	lr 0.00873
Warmup Train [30][80/3239]	Time 0.519 (0.729)	Data 0.001 (0.183)	Loss 4.0856 (4.0928)	Top-1 acc 29.688 (29.104)	Top-5 acc 52.344 (52.517)	lr 0.00873
Warmup Train [30][90/3239]	Time 0.459 (0.705)	Data 0.001 (0.163)	Loss 4.1486 (4.0967)	Top-1 acc 30.078 (29.108)	Top-5 acc 50.781 (52.524)	lr 0.00872
Warmup Train [30][100/3239]	Time 0.566 (0.686)	Data 0.001 (0.148)	Loss 4.0169 (4.0954)	Top-1 acc 33.594 (29.250)	Top-5 acc 56.641 (52.564)	lr 0.00872
Warmup Train [30][110/3239]	Time 0.425 (0.672)	Data 0.001 (0.135)	Loss 3.9724 (4.0932)	Top-1 acc 34.766 (29.350)	Top-5 acc 54.297 (52.689)	lr 0.00871
Warmup Train [30][120/3239]	Time 0.741 (0.662)	Data 0.001 (0.125)	Loss 4.3781 (4.0944)	Top-1 acc 24.219 (29.358)	Top-5 acc 42.969 (52.634)	lr 0.00871
Warmup Train [30][130/3239]	Time 0.560 (0.652)	Data 0.001 (0.115)	Loss 4.0882 (4.0949)	Top-1 acc 29.688 (29.300)	Top-5 acc 50.781 (52.606)	lr 0.00870
Warmup Train [30][140/3239]	Time 0.447 (0.639)	Data 0.001 (0.107)	Loss 4.0273 (4.0944)	Top-1 acc 30.078 (29.305)	Top-5 acc 53.516 (52.574)	lr 0.00870
Warmup Train [30][150/3239]	Time 0.384 (0.630)	Data 0.001 (0.101)	Loss 3.9951 (4.0954)	Top-1 acc 30.078 (29.271)	Top-5 acc 53.906 (52.564)	lr 0.00869
Warmup Train [30][160/3239]	Time 0.581 (0.620)	Data 0.001 (0.095)	Loss 4.1731 (4.0971)	Top-1 acc 25.391 (29.231)	Top-5 acc 53.125 (52.538)	lr 0.00869
Warmup Train [30][170/3239]	Time 0.364 (0.612)	Data 0.001 (0.089)	Loss 4.1133 (4.0980)	Top-1 acc 27.734 (29.201)	Top-5 acc 50.391 (52.479)	lr 0.00869
Warmup Train [30][180/3239]	Time 0.570 (0.606)	Data 0.001 (0.085)	Loss 4.1468 (4.0988)	Top-1 acc 30.469 (29.262)	Top-5 acc 51.172 (52.506)	lr 0.00868
Warmup Train [30][190/3239]	Time 0.577 (0.601)	Data 0.001 (0.081)	Loss 4.3349 (4.1028)	Top-1 acc 24.219 (29.180)	Top-5 acc 46.484 (52.444)	lr 0.00868
Warmup Train [30][200/3239]	Time 0.485 (0.596)	Data 0.001 (0.077)	Loss 4.2985 (4.1037)	Top-1 acc 25.391 (29.145)	Top-5 acc 49.609 (52.466)	lr 0.00867
Warmup Train [30][210/3239]	Time 0.638 (0.593)	Data 0.001 (0.074)	Loss 3.8885 (4.1042)	Top-1 acc 33.203 (29.119)	Top-5 acc 58.984 (52.470)	lr 0.00867
Warmup Train [30][220/3239]	Time 0.532 (0.589)	Data 0.001 (0.071)	Loss 4.0824 (4.1051)	Top-1 acc 30.469 (29.083)	Top-5 acc 52.344 (52.432)	lr 0.00866
Warmup Train [30][230/3239]	Time 0.620 (0.586)	Data 0.001 (0.068)	Loss 4.0073 (4.1055)	Top-1 acc 28.125 (29.016)	Top-5 acc 54.297 (52.422)	lr 0.00866
Warmup Train [30][240/3239]	Time 0.387 (0.582)	Data 0.001 (0.065)	Loss 4.2067 (4.1066)	Top-1 acc 26.562 (29.018)	Top-5 acc 48.438 (52.397)	lr 0.00865
Warmup Train [30][250/3239]	Time 0.539 (0.579)	Data 0.001 (0.063)	Loss 4.0655 (4.1058)	Top-1 acc 31.641 (29.034)	Top-5 acc 52.344 (52.428)	lr 0.00865
Warmup Train [30][260/3239]	Time 0.550 (0.576)	Data 0.001 (0.061)	Loss 4.1041 (4.1067)	Top-1 acc 26.172 (29.045)	Top-5 acc 50.781 (52.398)	lr 0.00864
Warmup Train [30][270/3239]	Time 0.628 (0.574)	Data 0.001 (0.059)	Loss 4.2013 (4.1068)	Top-1 acc 30.078 (29.060)	Top-5 acc 52.344 (52.378)	lr 0.00864
Warmup Train [30][280/3239]	Time 0.587 (0.572)	Data 0.001 (0.056)	Loss 4.0488 (4.1052)	Top-1 acc 33.984 (29.068)	Top-5 acc 51.953 (52.399)	lr 0.00864
Warmup Train [30][290/3239]	Time 0.579 (0.570)	Data 0.001 (0.055)	Loss 3.9792 (4.1038)	Top-1 acc 32.812 (29.094)	Top-5 acc 53.906 (52.397)	lr 0.00863
Warmup Train [30][300/3239]	Time 0.482 (0.568)	Data 0.001 (0.053)	Loss 4.0775 (4.1035)	Top-1 acc 28.125 (29.089)	Top-5 acc 57.031 (52.435)	lr 0.00863
Warmup Train [30][310/3239]	Time 0.457 (0.565)	Data 0.001 (0.051)	Loss 4.1893 (4.1045)	Top-1 acc 27.734 (29.047)	Top-5 acc 48.047 (52.388)	lr 0.00862
Warmup Train [30][320/3239]	Time 0.517 (0.563)	Data 0.001 (0.050)	Loss 4.0747 (4.1049)	Top-1 acc 28.906 (29.040)	Top-5 acc 52.344 (52.361)	lr 0.00862
Warmup Train [30][330/3239]	Time 0.615 (0.562)	Data 0.001 (0.048)	Loss 3.9849 (4.1067)	Top-1 acc 29.688 (29.001)	Top-5 acc 55.078 (52.301)	lr 0.00861
Warmup Train [30][340/3239]	Time 0.577 (0.561)	Data 0.001 (0.047)	Loss 4.0881 (4.1059)	Top-1 acc 32.031 (29.046)	Top-5 acc 53.125 (52.315)	lr 0.00861
Warmup Train [30][350/3239]	Time 0.504 (0.560)	Data 0.001 (0.046)	Loss 4.1017 (4.1043)	Top-1 acc 25.391 (29.081)	Top-5 acc 51.172 (52.362)	lr 0.00860
Warmup Train [30][360/3239]	Time 0.458 (0.559)	Data 0.001 (0.045)	Loss 3.9341 (4.1033)	Top-1 acc 33.594 (29.099)	Top-5 acc 57.422 (52.362)	lr 0.00860
Warmup Train [30][370/3239]	Time 0.402 (0.557)	Data 0.001 (0.044)	Loss 4.1560 (4.1047)	Top-1 acc 26.562 (29.097)	Top-5 acc 50.391 (52.335)	lr 0.00859
Warmup Train [30][380/3239]	Time 0.483 (0.556)	Data 0.001 (0.043)	Loss 4.1112 (4.1048)	Top-1 acc 29.688 (29.125)	Top-5 acc 49.609 (52.339)	lr 0.00859
Warmup Train [30][390/3239]	Time 0.543 (0.555)	Data 0.001 (0.042)	Loss 4.0409 (4.1040)	Top-1 acc 26.562 (29.143)	Top-5 acc 53.125 (52.346)	lr 0.00858
Warmup Train [30][400/3239]	Time 0.354 (0.554)	Data 0.001 (0.041)	Loss 4.0006 (4.1017)	Top-1 acc 30.469 (29.165)	Top-5 acc 53.125 (52.384)	lr 0.00858
Warmup Train [30][410/3239]	Time 0.400 (0.552)	Data 0.001 (0.040)	Loss 4.1766 (4.1035)	Top-1 acc 26.562 (29.139)	Top-5 acc 50.781 (52.356)	lr 0.00858
Warmup Train [30][420/3239]	Time 0.531 (0.551)	Data 0.001 (0.040)	Loss 4.0107 (4.1026)	Top-1 acc 28.516 (29.133)	Top-5 acc 53.906 (52.392)	lr 0.00857
Warmup Train [30][430/3239]	Time 0.478 (0.550)	Data 0.001 (0.039)	Loss 3.9243 (4.1014)	Top-1 acc 32.031 (29.150)	Top-5 acc 55.859 (52.387)	lr 0.00857
Warmup Train [30][440/3239]	Time 0.384 (0.548)	Data 0.001 (0.038)	Loss 4.3702 (4.1020)	Top-1 acc 24.219 (29.126)	Top-5 acc 44.531 (52.384)	lr 0.00856
Warmup Train [30][450/3239]	Time 0.481 (0.548)	Data 0.001 (0.038)	Loss 4.2579 (4.1025)	Top-1 acc 30.469 (29.144)	Top-5 acc 46.875 (52.383)	lr 0.00856
Warmup Train [30][460/3239]	Time 0.331 (0.545)	Data 0.001 (0.037)	Loss 4.1309 (4.1011)	Top-1 acc 23.828 (29.182)	Top-5 acc 47.656 (52.400)	lr 0.00855
Warmup Train [30][470/3239]	Time 0.613 (0.545)	Data 0.001 (0.036)	Loss 4.1616 (4.1008)	Top-1 acc 25.391 (29.177)	Top-5 acc 48.828 (52.423)	lr 0.00855
Warmup Train [30][480/3239]	Time 0.529 (0.544)	Data 0.001 (0.036)	Loss 4.2696 (4.1009)	Top-1 acc 26.172 (29.182)	Top-5 acc 47.656 (52.402)	lr 0.00854
Warmup Train [30][490/3239]	Time 0.475 (0.543)	Data 0.001 (0.035)	Loss 3.9815 (4.1008)	Top-1 acc 29.297 (29.209)	Top-5 acc 53.516 (52.410)	lr 0.00854
Warmup Train [30][500/3239]	Time 0.613 (0.543)	Data 0.001 (0.035)	Loss 4.0546 (4.1002)	Top-1 acc 29.297 (29.231)	Top-5 acc 50.391 (52.402)	lr 0.00853
Warmup Train [30][510/3239]	Time 0.620 (0.543)	Data 0.001 (0.034)	Loss 4.0424 (4.1002)	Top-1 acc 29.688 (29.221)	Top-5 acc 54.297 (52.406)	lr 0.00853
Warmup Train [30][520/3239]	Time 0.372 (0.542)	Data 0.001 (0.033)	Loss 4.1059 (4.1000)	Top-1 acc 25.781 (29.226)	Top-5 acc 51.562 (52.400)	lr 0.00853
Warmup Train [30][530/3239]	Time 0.439 (0.541)	Data 0.001 (0.033)	Loss 4.1132 (4.1003)	Top-1 acc 27.734 (29.206)	Top-5 acc 48.828 (52.386)	lr 0.00852
Warmup Train [30][540/3239]	Time 0.559 (0.541)	Data 0.001 (0.033)	Loss 3.8011 (4.1011)	Top-1 acc 33.984 (29.178)	Top-5 acc 60.156 (52.359)	lr 0.00852
Warmup Train [30][550/3239]	Time 0.411 (0.540)	Data 0.001 (0.032)	Loss 4.2504 (4.1021)	Top-1 acc 24.609 (29.154)	Top-5 acc 51.172 (52.329)	lr 0.00851
Warmup Train [30][560/3239]	Time 0.421 (0.539)	Data 0.001 (0.032)	Loss 4.0483 (4.1010)	Top-1 acc 31.641 (29.175)	Top-5 acc 53.516 (52.346)	lr 0.00851
Warmup Train [30][570/3239]	Time 0.520 (0.539)	Data 0.001 (0.031)	Loss 4.1791 (4.1012)	Top-1 acc 30.078 (29.166)	Top-5 acc 49.219 (52.340)	lr 0.00850
Warmup Train [30][580/3239]	Time 0.421 (0.539)	Data 0.001 (0.031)	Loss 4.0233 (4.1010)	Top-1 acc 30.078 (29.165)	Top-5 acc 55.469 (52.348)	lr 0.00850
Warmup Train [30][590/3239]	Time 0.379 (0.539)	Data 0.001 (0.030)	Loss 4.1452 (4.1012)	Top-1 acc 29.297 (29.155)	Top-5 acc 52.734 (52.361)	lr 0.00849
Warmup Train [30][600/3239]	Time 0.536 (0.538)	Data 0.001 (0.030)	Loss 4.0146 (4.1007)	Top-1 acc 30.859 (29.157)	Top-5 acc 55.859 (52.353)	lr 0.00849
Warmup Train [30][610/3239]	Time 0.422 (0.538)	Data 0.001 (0.030)	Loss 4.0718 (4.1009)	Top-1 acc 30.859 (29.142)	Top-5 acc 55.859 (52.341)	lr 0.00848
Warmup Train [30][620/3239]	Time 0.667 (0.538)	Data 0.001 (0.029)	Loss 3.9951 (4.1007)	Top-1 acc 29.688 (29.142)	Top-5 acc 56.641 (52.352)	lr 0.00848
Warmup Train [30][630/3239]	Time 0.429 (0.537)	Data 0.001 (0.029)	Loss 4.1312 (4.1017)	Top-1 acc 26.562 (29.110)	Top-5 acc 51.953 (52.332)	lr 0.00848
Warmup Train [30][640/3239]	Time 0.595 (0.537)	Data 0.001 (0.029)	Loss 4.3273 (4.1024)	Top-1 acc 22.266 (29.095)	Top-5 acc 46.094 (52.308)	lr 0.00847
Warmup Train [30][650/3239]	Time 0.512 (0.537)	Data 0.001 (0.028)	Loss 4.2667 (4.1018)	Top-1 acc 25.391 (29.096)	Top-5 acc 45.703 (52.306)	lr 0.00847
Warmup Train [30][660/3239]	Time 0.416 (0.537)	Data 0.001 (0.028)	Loss 4.0799 (4.1028)	Top-1 acc 30.859 (29.075)	Top-5 acc 56.250 (52.279)	lr 0.00846
Warmup Train [30][670/3239]	Time 0.555 (0.537)	Data 0.001 (0.028)	Loss 4.0683 (4.1034)	Top-1 acc 32.422 (29.080)	Top-5 acc 52.734 (52.279)	lr 0.00846
Warmup Train [30][680/3239]	Time 0.570 (0.537)	Data 0.001 (0.027)	Loss 4.1633 (4.1041)	Top-1 acc 29.688 (29.075)	Top-5 acc 51.172 (52.271)	lr 0.00845
Warmup Train [30][690/3239]	Time 0.502 (0.536)	Data 0.001 (0.027)	Loss 4.0276 (4.1032)	Top-1 acc 28.906 (29.091)	Top-5 acc 53.125 (52.287)	lr 0.00845
Warmup Train [30][700/3239]	Time 0.417 (0.535)	Data 0.001 (0.027)	Loss 4.1304 (4.1028)	Top-1 acc 31.641 (29.112)	Top-5 acc 48.438 (52.296)	lr 0.00844
Warmup Train [30][710/3239]	Time 0.349 (0.535)	Data 0.001 (0.026)	Loss 4.1624 (4.1029)	Top-1 acc 25.781 (29.098)	Top-5 acc 50.000 (52.279)	lr 0.00844
Warmup Train [30][720/3239]	Time 0.534 (0.534)	Data 0.001 (0.026)	Loss 4.2452 (4.1025)	Top-1 acc 28.125 (29.095)	Top-5 acc 48.438 (52.286)	lr 0.00843
Warmup Train [30][730/3239]	Time 0.638 (0.534)	Data 0.001 (0.026)	Loss 3.9566 (4.1032)	Top-1 acc 31.250 (29.082)	Top-5 acc 55.859 (52.263)	lr 0.00843
Warmup Train [30][740/3239]	Time 0.575 (0.533)	Data 0.001 (0.026)	Loss 4.2583 (4.1033)	Top-1 acc 27.734 (29.095)	Top-5 acc 48.438 (52.269)	lr 0.00843
Warmup Train [30][750/3239]	Time 0.524 (0.533)	Data 0.001 (0.025)	Loss 4.2075 (4.1033)	Top-1 acc 27.344 (29.099)	Top-5 acc 53.516 (52.279)	lr 0.00842
Warmup Train [30][760/3239]	Time 0.520 (0.532)	Data 0.001 (0.025)	Loss 4.1259 (4.1036)	Top-1 acc 25.781 (29.089)	Top-5 acc 51.562 (52.264)	lr 0.00842
Warmup Train [30][770/3239]	Time 0.412 (0.531)	Data 0.001 (0.025)	Loss 4.2861 (4.1036)	Top-1 acc 26.172 (29.104)	Top-5 acc 48.047 (52.260)	lr 0.00841
Warmup Train [30][780/3239]	Time 0.551 (0.531)	Data 0.001 (0.025)	Loss 4.1106 (4.1030)	Top-1 acc 27.344 (29.106)	Top-5 acc 50.391 (52.269)	lr 0.00841
Warmup Train [30][790/3239]	Time 0.416 (0.531)	Data 0.001 (0.024)	Loss 4.1081 (4.1032)	Top-1 acc 27.734 (29.105)	Top-5 acc 54.688 (52.282)	lr 0.00840
Warmup Train [30][800/3239]	Time 0.327 (0.531)	Data 0.001 (0.024)	Loss 4.0044 (4.1036)	Top-1 acc 26.562 (29.083)	Top-5 acc 51.953 (52.281)	lr 0.00840
Warmup Train [30][810/3239]	Time 0.466 (0.531)	Data 0.001 (0.024)	Loss 4.0528 (4.1034)	Top-1 acc 29.297 (29.092)	Top-5 acc 53.516 (52.292)	lr 0.00839
Warmup Train [30][820/3239]	Time 0.359 (0.530)	Data 0.001 (0.024)	Loss 4.0614 (4.1043)	Top-1 acc 30.469 (29.084)	Top-5 acc 53.906 (52.273)	lr 0.00839
Warmup Train [30][830/3239]	Time 0.391 (0.530)	Data 0.001 (0.024)	Loss 4.1624 (4.1047)	Top-1 acc 30.469 (29.084)	Top-5 acc 51.172 (52.265)	lr 0.00838
Warmup Train [30][840/3239]	Time 0.380 (0.530)	Data 0.001 (0.024)	Loss 4.2084 (4.1038)	Top-1 acc 23.828 (29.090)	Top-5 acc 48.438 (52.286)	lr 0.00838
Warmup Train [30][850/3239]	Time 0.594 (0.530)	Data 0.001 (0.023)	Loss 4.1639 (4.1039)	Top-1 acc 26.562 (29.086)	Top-5 acc 51.172 (52.286)	lr 0.00838
Warmup Train [30][860/3239]	Time 0.577 (0.530)	Data 0.002 (0.023)	Loss 3.9490 (4.1034)	Top-1 acc 32.422 (29.089)	Top-5 acc 52.734 (52.290)	lr 0.00837
Warmup Train [30][870/3239]	Time 0.599 (0.530)	Data 0.002 (0.023)	Loss 3.9709 (4.1029)	Top-1 acc 31.250 (29.093)	Top-5 acc 53.906 (52.295)	lr 0.00837
Warmup Train [30][880/3239]	Time 0.601 (0.530)	Data 0.001 (0.023)	Loss 3.8664 (4.1036)	Top-1 acc 34.375 (29.083)	Top-5 acc 59.766 (52.280)	lr 0.00836
Warmup Train [30][890/3239]	Time 0.361 (0.530)	Data 0.001 (0.022)	Loss 4.1426 (4.1034)	Top-1 acc 26.953 (29.084)	Top-5 acc 53.516 (52.279)	lr 0.00836
Warmup Train [30][900/3239]	Time 0.515 (0.530)	Data 0.001 (0.022)	Loss 4.1310 (4.1033)	Top-1 acc 28.906 (29.081)	Top-5 acc 53.906 (52.284)	lr 0.00835
Warmup Train [30][910/3239]	Time 0.588 (0.529)	Data 0.001 (0.022)	Loss 4.1539 (4.1032)	Top-1 acc 29.688 (29.080)	Top-5 acc 49.609 (52.275)	lr 0.00835
Warmup Train [30][920/3239]	Time 0.362 (0.529)	Data 0.001 (0.022)	Loss 4.0385 (4.1032)	Top-1 acc 27.734 (29.076)	Top-5 acc 53.516 (52.270)	lr 0.00834
Warmup Train [30][930/3239]	Time 0.569 (0.529)	Data 0.001 (0.022)	Loss 4.1481 (4.1038)	Top-1 acc 29.297 (29.060)	Top-5 acc 50.391 (52.247)	lr 0.00834
Warmup Train [30][940/3239]	Time 0.516 (0.529)	Data 0.001 (0.022)	Loss 4.2392 (4.1039)	Top-1 acc 27.344 (29.067)	Top-5 acc 50.391 (52.239)	lr 0.00833
Warmup Train [30][950/3239]	Time 0.464 (0.529)	Data 0.001 (0.021)	Loss 4.2624 (4.1042)	Top-1 acc 25.391 (29.058)	Top-5 acc 48.047 (52.237)	lr 0.00833
Warmup Train [30][960/3239]	Time 0.522 (0.529)	Data 0.001 (0.021)	Loss 4.0264 (4.1037)	Top-1 acc 28.125 (29.074)	Top-5 acc 51.172 (52.247)	lr 0.00833
Warmup Train [30][970/3239]	Time 0.773 (0.529)	Data 0.002 (0.021)	Loss 3.9925 (4.1037)	Top-1 acc 33.594 (29.084)	Top-5 acc 55.859 (52.253)	lr 0.00832
Warmup Train [30][980/3239]	Time 0.503 (0.529)	Data 0.001 (0.021)	Loss 4.2952 (4.1035)	Top-1 acc 24.609 (29.089)	Top-5 acc 48.438 (52.263)	lr 0.00832
Warmup Train [30][990/3239]	Time 0.378 (0.528)	Data 0.001 (0.021)	Loss 4.1853 (4.1030)	Top-1 acc 26.953 (29.088)	Top-5 acc 50.000 (52.267)	lr 0.00831
Warmup Train [30][1000/3239]	Time 0.389 (0.528)	Data 0.001 (0.021)	Loss 4.2572 (4.1037)	Top-1 acc 25.781 (29.072)	Top-5 acc 48.047 (52.252)	lr 0.00831
Warmup Train [30][1010/3239]	Time 0.628 (0.528)	Data 0.001 (0.021)	Loss 4.1393 (4.1043)	Top-1 acc 28.906 (29.070)	Top-5 acc 52.734 (52.240)	lr 0.00830
Warmup Train [30][1020/3239]	Time 0.559 (0.527)	Data 0.001 (0.020)	Loss 4.1257 (4.1042)	Top-1 acc 28.906 (29.076)	Top-5 acc 51.172 (52.234)	lr 0.00830
Warmup Train [30][1030/3239]	Time 0.474 (0.527)	Data 0.001 (0.020)	Loss 4.1049 (4.1041)	Top-1 acc 30.078 (29.074)	Top-5 acc 53.906 (52.237)	lr 0.00829
Warmup Train [30][1040/3239]	Time 0.535 (0.527)	Data 0.001 (0.020)	Loss 4.1766 (4.1039)	Top-1 acc 28.516 (29.083)	Top-5 acc 53.906 (52.238)	lr 0.00829
Warmup Train [30][1050/3239]	Time 0.411 (0.526)	Data 0.001 (0.020)	Loss 4.1266 (4.1039)	Top-1 acc 28.516 (29.077)	Top-5 acc 53.516 (52.244)	lr 0.00829
Warmup Train [30][1060/3239]	Time 0.573 (0.526)	Data 0.001 (0.020)	Loss 3.9112 (4.1033)	Top-1 acc 33.984 (29.088)	Top-5 acc 57.031 (52.255)	lr 0.00828
Warmup Train [30][1070/3239]	Time 0.616 (0.526)	Data 0.001 (0.020)	Loss 4.2803 (4.1034)	Top-1 acc 27.344 (29.093)	Top-5 acc 50.781 (52.251)	lr 0.00828
Warmup Train [30][1080/3239]	Time 0.536 (0.526)	Data 0.001 (0.019)	Loss 4.1777 (4.1037)	Top-1 acc 28.125 (29.097)	Top-5 acc 50.000 (52.246)	lr 0.00827
Warmup Train [30][1090/3239]	Time 0.360 (0.526)	Data 0.001 (0.019)	Loss 3.9452 (4.1037)	Top-1 acc 32.422 (29.097)	Top-5 acc 55.469 (52.254)	lr 0.00827
Warmup Train [30][1100/3239]	Time 0.315 (0.526)	Data 0.001 (0.019)	Loss 4.3321 (4.1043)	Top-1 acc 25.391 (29.081)	Top-5 acc 50.391 (52.245)	lr 0.00826
Warmup Train [30][1110/3239]	Time 0.370 (0.526)	Data 0.001 (0.019)	Loss 4.0511 (4.1041)	Top-1 acc 32.422 (29.094)	Top-5 acc 55.859 (52.258)	lr 0.00826
Warmup Train [30][1120/3239]	Time 0.701 (0.525)	Data 0.001 (0.019)	Loss 4.1959 (4.1044)	Top-1 acc 25.391 (29.090)	Top-5 acc 51.172 (52.250)	lr 0.00825
Warmup Train [30][1130/3239]	Time 0.376 (0.525)	Data 0.001 (0.019)	Loss 4.1062 (4.1044)	Top-1 acc 31.250 (29.084)	Top-5 acc 51.562 (52.251)	lr 0.00825
Warmup Train [30][1140/3239]	Time 0.485 (0.525)	Data 0.001 (0.019)	Loss 3.9033 (4.1043)	Top-1 acc 32.422 (29.072)	Top-5 acc 58.984 (52.243)	lr 0.00824
Warmup Train [30][1150/3239]	Time 0.554 (0.525)	Data 0.001 (0.019)	Loss 4.0772 (4.1044)	Top-1 acc 33.594 (29.072)	Top-5 acc 54.688 (52.236)	lr 0.00824
Warmup Train [30][1160/3239]	Time 0.554 (0.525)	Data 0.001 (0.019)	Loss 4.0323 (4.1046)	Top-1 acc 32.422 (29.067)	Top-5 acc 54.297 (52.237)	lr 0.00824
Warmup Train [30][1170/3239]	Time 0.513 (0.525)	Data 0.001 (0.019)	Loss 4.1446 (4.1046)	Top-1 acc 31.641 (29.065)	Top-5 acc 52.344 (52.243)	lr 0.00823
Warmup Train [30][1180/3239]	Time 0.522 (0.525)	Data 0.001 (0.019)	Loss 4.1062 (4.1042)	Top-1 acc 28.906 (29.069)	Top-5 acc 49.609 (52.249)	lr 0.00823
Warmup Train [30][1190/3239]	Time 0.576 (0.525)	Data 0.001 (0.018)	Loss 4.0682 (4.1040)	Top-1 acc 30.078 (29.076)	Top-5 acc 52.734 (52.257)	lr 0.00822
Warmup Train [30][1200/3239]	Time 0.502 (0.525)	Data 0.001 (0.018)	Loss 3.9655 (4.1043)	Top-1 acc 28.125 (29.061)	Top-5 acc 54.688 (52.243)	lr 0.00822
Warmup Train [30][1210/3239]	Time 0.448 (0.525)	Data 0.002 (0.018)	Loss 4.2440 (4.1046)	Top-1 acc 26.562 (29.060)	Top-5 acc 48.047 (52.237)	lr 0.00821
Warmup Train [30][1220/3239]	Time 0.426 (0.525)	Data 0.001 (0.018)	Loss 4.1416 (4.1042)	Top-1 acc 29.688 (29.069)	Top-5 acc 46.484 (52.244)	lr 0.00821
Warmup Train [30][1230/3239]	Time 0.657 (0.525)	Data 0.001 (0.018)	Loss 4.1759 (4.1034)	Top-1 acc 23.828 (29.083)	Top-5 acc 48.047 (52.267)	lr 0.00820
Warmup Train [30][1240/3239]	Time 0.514 (0.525)	Data 0.001 (0.018)	Loss 3.9817 (4.1028)	Top-1 acc 33.594 (29.100)	Top-5 acc 53.906 (52.280)	lr 0.00820
Warmup Train [30][1250/3239]	Time 0.560 (0.525)	Data 0.001 (0.018)	Loss 4.1770 (4.1027)	Top-1 acc 28.906 (29.110)	Top-5 acc 53.516 (52.280)	lr 0.00820
Warmup Train [30][1260/3239]	Time 0.551 (0.525)	Data 0.001 (0.018)	Loss 4.0527 (4.1027)	Top-1 acc 29.688 (29.114)	Top-5 acc 51.953 (52.276)	lr 0.00819
Warmup Train [30][1270/3239]	Time 0.266 (0.524)	Data 0.001 (0.018)	Loss 4.2957 (4.1034)	Top-1 acc 25.781 (29.100)	Top-5 acc 48.047 (52.271)	lr 0.00819
Warmup Train [30][1280/3239]	Time 0.369 (0.524)	Data 0.001 (0.018)	Loss 4.1126 (4.1033)	Top-1 acc 29.297 (29.104)	Top-5 acc 54.297 (52.279)	lr 0.00818
Warmup Train [30][1290/3239]	Time 0.190 (0.524)	Data 0.001 (0.018)	Loss 3.9542 (4.1030)	Top-1 acc 28.906 (29.111)	Top-5 acc 54.297 (52.284)	lr 0.00818
Warmup Train [30][1300/3239]	Time 0.397 (0.524)	Data 0.001 (0.018)	Loss 4.0013 (4.1031)	Top-1 acc 35.938 (29.111)	Top-5 acc 55.078 (52.284)	lr 0.00817
Warmup Train [30][1310/3239]	Time 0.572 (0.524)	Data 0.001 (0.018)	Loss 4.1257 (4.1037)	Top-1 acc 26.953 (29.097)	Top-5 acc 50.391 (52.270)	lr 0.00817
Warmup Train [30][1320/3239]	Time 0.629 (0.524)	Data 0.002 (0.017)	Loss 4.2486 (4.1040)	Top-1 acc 26.953 (29.088)	Top-5 acc 53.125 (52.269)	lr 0.00816
Warmup Train [30][1330/3239]	Time 0.578 (0.523)	Data 0.001 (0.017)	Loss 3.9314 (4.1034)	Top-1 acc 34.375 (29.089)	Top-5 acc 54.688 (52.280)	lr 0.00816
Warmup Train [30][1340/3239]	Time 0.494 (0.523)	Data 0.001 (0.017)	Loss 4.0406 (4.1035)	Top-1 acc 32.422 (29.094)	Top-5 acc 53.906 (52.274)	lr 0.00815
Warmup Train [30][1350/3239]	Time 0.574 (0.523)	Data 0.032 (0.017)	Loss 4.0476 (4.1039)	Top-1 acc 29.688 (29.082)	Top-5 acc 55.078 (52.266)	lr 0.00815
Warmup Train [30][1360/3239]	Time 0.563 (0.523)	Data 0.001 (0.017)	Loss 4.0165 (4.1039)	Top-1 acc 33.984 (29.091)	Top-5 acc 53.516 (52.262)	lr 0.00815
Warmup Train [30][1370/3239]	Time 0.627 (0.523)	Data 0.001 (0.017)	Loss 4.3864 (4.1041)	Top-1 acc 23.047 (29.085)	Top-5 acc 49.219 (52.263)	lr 0.00814
Warmup Train [30][1380/3239]	Time 0.368 (0.523)	Data 0.001 (0.017)	Loss 4.1248 (4.1038)	Top-1 acc 28.906 (29.088)	Top-5 acc 50.000 (52.260)	lr 0.00814
Warmup Train [30][1390/3239]	Time 0.645 (0.523)	Data 0.002 (0.017)	Loss 3.8587 (4.1040)	Top-1 acc 31.641 (29.088)	Top-5 acc 53.906 (52.254)	lr 0.00813
Warmup Train [30][1400/3239]	Time 0.448 (0.523)	Data 0.001 (0.017)	Loss 4.0250 (4.1039)	Top-1 acc 31.250 (29.086)	Top-5 acc 51.953 (52.255)	lr 0.00813
Warmup Train [30][1410/3239]	Time 0.604 (0.523)	Data 0.001 (0.017)	Loss 4.1287 (4.1037)	Top-1 acc 28.125 (29.088)	Top-5 acc 55.469 (52.267)	lr 0.00812
Warmup Train [30][1420/3239]	Time 0.581 (0.523)	Data 0.001 (0.017)	Loss 4.2057 (4.1042)	Top-1 acc 26.562 (29.076)	Top-5 acc 52.734 (52.258)	lr 0.00812
Warmup Train [30][1430/3239]	Time 0.657 (0.523)	Data 0.001 (0.017)	Loss 4.0055 (4.1040)	Top-1 acc 31.250 (29.083)	Top-5 acc 52.344 (52.260)	lr 0.00811
Warmup Train [30][1440/3239]	Time 0.626 (0.523)	Data 0.001 (0.016)	Loss 4.1431 (4.1040)	Top-1 acc 25.781 (29.078)	Top-5 acc 48.438 (52.265)	lr 0.00811
Warmup Train [30][1450/3239]	Time 0.570 (0.523)	Data 0.001 (0.016)	Loss 4.2615 (4.1044)	Top-1 acc 25.781 (29.072)	Top-5 acc 50.000 (52.258)	lr 0.00811
Warmup Train [30][1460/3239]	Time 0.682 (0.523)	Data 0.001 (0.016)	Loss 4.0481 (4.1049)	Top-1 acc 30.859 (29.064)	Top-5 acc 54.297 (52.249)	lr 0.00810
Warmup Train [30][1470/3239]	Time 0.463 (0.523)	Data 0.001 (0.016)	Loss 4.2205 (4.1052)	Top-1 acc 29.688 (29.058)	Top-5 acc 50.000 (52.241)	lr 0.00810
Warmup Train [30][1480/3239]	Time 0.456 (0.523)	Data 0.001 (0.016)	Loss 4.1297 (4.1056)	Top-1 acc 28.125 (29.047)	Top-5 acc 52.344 (52.230)	lr 0.00809
Warmup Train [30][1490/3239]	Time 0.537 (0.523)	Data 0.001 (0.016)	Loss 4.0138 (4.1059)	Top-1 acc 30.859 (29.046)	Top-5 acc 53.906 (52.224)	lr 0.00809
Warmup Train [30][1500/3239]	Time 0.362 (0.522)	Data 0.001 (0.016)	Loss 4.3080 (4.1061)	Top-1 acc 26.172 (29.046)	Top-5 acc 50.391 (52.219)	lr 0.00808
Warmup Train [30][1510/3239]	Time 0.357 (0.522)	Data 0.002 (0.016)	Loss 4.2450 (4.1063)	Top-1 acc 28.125 (29.045)	Top-5 acc 47.656 (52.210)	lr 0.00808
Warmup Train [30][1520/3239]	Time 0.589 (0.522)	Data 0.001 (0.016)	Loss 4.0131 (4.1053)	Top-1 acc 31.641 (29.059)	Top-5 acc 54.297 (52.233)	lr 0.00807
Warmup Train [30][1530/3239]	Time 0.538 (0.522)	Data 0.001 (0.016)	Loss 4.1037 (4.1054)	Top-1 acc 27.344 (29.060)	Top-5 acc 50.000 (52.230)	lr 0.00807
Warmup Train [30][1540/3239]	Time 0.361 (0.522)	Data 0.001 (0.016)	Loss 4.1017 (4.1054)	Top-1 acc 25.391 (29.058)	Top-5 acc 52.734 (52.227)	lr 0.00807
Warmup Train [30][1550/3239]	Time 0.668 (0.522)	Data 0.001 (0.016)	Loss 4.1143 (4.1053)	Top-1 acc 28.516 (29.060)	Top-5 acc 51.562 (52.228)	lr 0.00806
Warmup Train [30][1560/3239]	Time 0.383 (0.522)	Data 0.001 (0.016)	Loss 4.2010 (4.1059)	Top-1 acc 28.516 (29.048)	Top-5 acc 51.562 (52.216)	lr 0.00806
Warmup Train [30][1570/3239]	Time 0.407 (0.521)	Data 0.001 (0.016)	Loss 4.1738 (4.1061)	Top-1 acc 28.906 (29.042)	Top-5 acc 51.953 (52.211)	lr 0.00805
Warmup Train [30][1580/3239]	Time 0.621 (0.521)	Data 0.002 (0.016)	Loss 4.0820 (4.1064)	Top-1 acc 30.078 (29.037)	Top-5 acc 53.516 (52.210)	lr 0.00805
Warmup Train [30][1590/3239]	Time 0.499 (0.521)	Data 0.001 (0.016)	Loss 4.1727 (4.1061)	Top-1 acc 26.562 (29.046)	Top-5 acc 52.344 (52.219)	lr 0.00804
Warmup Train [30][1600/3239]	Time 0.543 (0.521)	Data 0.001 (0.016)	Loss 3.9821 (4.1057)	Top-1 acc 33.594 (29.058)	Top-5 acc 56.641 (52.232)	lr 0.00804
Warmup Train [30][1610/3239]	Time 0.644 (0.521)	Data 0.001 (0.016)	Loss 4.3043 (4.1058)	Top-1 acc 26.953 (29.055)	Top-5 acc 48.047 (52.222)	lr 0.00803
Warmup Train [30][1620/3239]	Time 0.454 (0.521)	Data 0.002 (0.015)	Loss 4.2561 (4.1061)	Top-1 acc 28.516 (29.055)	Top-5 acc 50.781 (52.218)	lr 0.00803
Warmup Train [30][1630/3239]	Time 0.423 (0.521)	Data 0.001 (0.015)	Loss 4.2960 (4.1065)	Top-1 acc 26.953 (29.047)	Top-5 acc 42.969 (52.208)	lr 0.00803
Warmup Train [30][1640/3239]	Time 0.528 (0.521)	Data 0.001 (0.015)	Loss 3.8885 (4.1062)	Top-1 acc 31.641 (29.051)	Top-5 acc 57.031 (52.215)	lr 0.00802
Warmup Train [30][1650/3239]	Time 0.463 (0.521)	Data 0.001 (0.015)	Loss 4.2151 (4.1059)	Top-1 acc 28.906 (29.062)	Top-5 acc 50.781 (52.227)	lr 0.00802
Warmup Train [30][1660/3239]	Time 0.415 (0.521)	Data 0.001 (0.015)	Loss 3.9870 (4.1057)	Top-1 acc 30.469 (29.069)	Top-5 acc 55.469 (52.231)	lr 0.00801
Warmup Train [30][1670/3239]	Time 0.518 (0.521)	Data 0.001 (0.015)	Loss 4.0850 (4.1057)	Top-1 acc 32.031 (29.078)	Top-5 acc 52.344 (52.233)	lr 0.00801
Warmup Train [30][1680/3239]	Time 0.383 (0.521)	Data 0.001 (0.015)	Loss 3.8307 (4.1054)	Top-1 acc 33.984 (29.086)	Top-5 acc 60.547 (52.241)	lr 0.00800
Warmup Train [30][1690/3239]	Time 0.482 (0.521)	Data 0.001 (0.015)	Loss 4.1208 (4.1055)	Top-1 acc 29.297 (29.082)	Top-5 acc 52.344 (52.238)	lr 0.00800
Warmup Train [30][1700/3239]	Time 0.655 (0.521)	Data 0.001 (0.015)	Loss 4.1163 (4.1058)	Top-1 acc 27.734 (29.078)	Top-5 acc 53.516 (52.231)	lr 0.00799
Warmup Train [30][1710/3239]	Time 0.553 (0.521)	Data 0.001 (0.015)	Loss 4.0499 (4.1058)	Top-1 acc 32.031 (29.076)	Top-5 acc 52.344 (52.228)	lr 0.00799
Warmup Train [30][1720/3239]	Time 0.516 (0.521)	Data 0.001 (0.015)	Loss 4.2074 (4.1055)	Top-1 acc 28.125 (29.084)	Top-5 acc 48.047 (52.238)	lr 0.00799
Warmup Train [30][1730/3239]	Time 0.513 (0.521)	Data 0.001 (0.015)	Loss 4.1279 (4.1053)	Top-1 acc 26.562 (29.080)	Top-5 acc 48.828 (52.241)	lr 0.00798
Warmup Train [30][1740/3239]	Time 0.459 (0.521)	Data 0.001 (0.015)	Loss 4.1855 (4.1055)	Top-1 acc 28.906 (29.079)	Top-5 acc 51.953 (52.238)	lr 0.00798
Warmup Train [30][1750/3239]	Time 0.571 (0.521)	Data 0.001 (0.015)	Loss 4.0696 (4.1057)	Top-1 acc 32.812 (29.073)	Top-5 acc 53.906 (52.236)	lr 0.00797
Warmup Train [30][1760/3239]	Time 0.472 (0.521)	Data 0.001 (0.015)	Loss 4.1626 (4.1059)	Top-1 acc 30.859 (29.074)	Top-5 acc 51.562 (52.235)	lr 0.00797
Warmup Train [30][1770/3239]	Time 0.490 (0.521)	Data 0.001 (0.015)	Loss 4.0825 (4.1062)	Top-1 acc 28.906 (29.071)	Top-5 acc 52.734 (52.230)	lr 0.00796
Warmup Train [30][1780/3239]	Time 0.403 (0.521)	Data 0.001 (0.015)	Loss 4.3571 (4.1064)	Top-1 acc 25.391 (29.064)	Top-5 acc 47.266 (52.229)	lr 0.00796
Warmup Train [30][1790/3239]	Time 0.545 (0.521)	Data 0.001 (0.015)	Loss 4.2894 (4.1066)	Top-1 acc 27.734 (29.059)	Top-5 acc 48.438 (52.226)	lr 0.00795
Warmup Train [30][1800/3239]	Time 0.321 (0.521)	Data 0.001 (0.015)	Loss 4.0401 (4.1066)	Top-1 acc 25.781 (29.054)	Top-5 acc 52.344 (52.227)	lr 0.00795
Warmup Train [30][1810/3239]	Time 0.427 (0.521)	Data 0.001 (0.014)	Loss 4.1052 (4.1063)	Top-1 acc 31.641 (29.059)	Top-5 acc 52.734 (52.229)	lr 0.00795
Warmup Train [30][1820/3239]	Time 0.287 (0.521)	Data 0.001 (0.014)	Loss 4.0893 (4.1061)	Top-1 acc 26.172 (29.063)	Top-5 acc 52.734 (52.237)	lr 0.00794
Warmup Train [30][1830/3239]	Time 0.536 (0.521)	Data 0.001 (0.014)	Loss 4.1817 (4.1061)	Top-1 acc 27.734 (29.062)	Top-5 acc 52.734 (52.237)	lr 0.00794
Warmup Train [30][1840/3239]	Time 0.348 (0.520)	Data 0.001 (0.014)	Loss 4.1648 (4.1062)	Top-1 acc 27.344 (29.060)	Top-5 acc 48.828 (52.232)	lr 0.00793
Warmup Train [30][1850/3239]	Time 0.480 (0.520)	Data 0.001 (0.014)	Loss 4.1159 (4.1059)	Top-1 acc 29.297 (29.061)	Top-5 acc 52.344 (52.239)	lr 0.00793
Warmup Train [30][1860/3239]	Time 0.552 (0.520)	Data 0.001 (0.014)	Loss 4.1795 (4.1060)	Top-1 acc 26.562 (29.055)	Top-5 acc 51.953 (52.237)	lr 0.00792
Warmup Train [30][1870/3239]	Time 0.457 (0.520)	Data 0.001 (0.014)	Loss 3.8744 (4.1058)	Top-1 acc 34.766 (29.060)	Top-5 acc 60.547 (52.245)	lr 0.00792
Warmup Train [30][1880/3239]	Time 0.596 (0.520)	Data 0.001 (0.014)	Loss 3.9852 (4.1056)	Top-1 acc 33.594 (29.065)	Top-5 acc 57.031 (52.247)	lr 0.00791
Warmup Train [30][1890/3239]	Time 0.389 (0.520)	Data 0.001 (0.014)	Loss 4.3737 (4.1055)	Top-1 acc 22.656 (29.063)	Top-5 acc 45.703 (52.252)	lr 0.00791
Warmup Train [30][1900/3239]	Time 0.483 (0.520)	Data 0.001 (0.014)	Loss 4.2342 (4.1059)	Top-1 acc 30.859 (29.056)	Top-5 acc 50.000 (52.245)	lr 0.00791
Warmup Train [30][1910/3239]	Time 0.530 (0.520)	Data 0.001 (0.014)	Loss 3.9193 (4.1057)	Top-1 acc 31.641 (29.062)	Top-5 acc 55.078 (52.255)	lr 0.00790
Warmup Train [30][1920/3239]	Time 0.525 (0.520)	Data 0.001 (0.014)	Loss 4.1142 (4.1058)	Top-1 acc 28.906 (29.065)	Top-5 acc 51.953 (52.251)	lr 0.00790
Warmup Train [30][1930/3239]	Time 0.514 (0.520)	Data 0.001 (0.014)	Loss 4.0783 (4.1060)	Top-1 acc 30.859 (29.059)	Top-5 acc 52.344 (52.247)	lr 0.00789
Warmup Train [30][1940/3239]	Time 0.547 (0.520)	Data 0.001 (0.014)	Loss 3.9556 (4.1062)	Top-1 acc 27.734 (29.053)	Top-5 acc 55.469 (52.242)	lr 0.00789
Warmup Train [30][1950/3239]	Time 0.576 (0.520)	Data 0.001 (0.014)	Loss 4.0963 (4.1063)	Top-1 acc 24.609 (29.051)	Top-5 acc 55.078 (52.242)	lr 0.00788
Warmup Train [30][1960/3239]	Time 0.556 (0.519)	Data 0.001 (0.014)	Loss 4.0441 (4.1062)	Top-1 acc 33.203 (29.055)	Top-5 acc 56.641 (52.247)	lr 0.00788
Warmup Train [30][1970/3239]	Time 0.513 (0.519)	Data 0.001 (0.014)	Loss 4.0362 (4.1059)	Top-1 acc 27.734 (29.057)	Top-5 acc 58.203 (52.256)	lr 0.00787
Warmup Train [30][1980/3239]	Time 0.524 (0.519)	Data 0.001 (0.014)	Loss 4.0298 (4.1059)	Top-1 acc 31.250 (29.059)	Top-5 acc 53.516 (52.256)	lr 0.00787
Warmup Train [30][1990/3239]	Time 0.518 (0.519)	Data 0.001 (0.014)	Loss 4.2782 (4.1064)	Top-1 acc 27.344 (29.050)	Top-5 acc 50.781 (52.246)	lr 0.00787
Warmup Train [30][2000/3239]	Time 0.557 (0.519)	Data 0.001 (0.014)	Loss 4.1847 (4.1065)	Top-1 acc 30.859 (29.051)	Top-5 acc 51.562 (52.249)	lr 0.00786
Warmup Train [30][2010/3239]	Time 0.385 (0.519)	Data 0.001 (0.014)	Loss 4.4927 (4.1064)	Top-1 acc 26.953 (29.051)	Top-5 acc 44.141 (52.246)	lr 0.00786
Warmup Train [30][2020/3239]	Time 0.497 (0.519)	Data 0.001 (0.014)	Loss 4.1807 (4.1064)	Top-1 acc 29.688 (29.050)	Top-5 acc 49.609 (52.245)	lr 0.00785
Warmup Train [30][2030/3239]	Time 0.678 (0.519)	Data 0.001 (0.014)	Loss 4.0828 (4.1062)	Top-1 acc 30.078 (29.048)	Top-5 acc 50.781 (52.247)	lr 0.00785
Warmup Train [30][2040/3239]	Time 0.640 (0.519)	Data 0.001 (0.014)	Loss 4.1729 (4.1065)	Top-1 acc 28.906 (29.045)	Top-5 acc 51.562 (52.241)	lr 0.00784
Warmup Train [30][2050/3239]	Time 0.507 (0.519)	Data 0.001 (0.014)	Loss 4.2313 (4.1064)	Top-1 acc 30.078 (29.050)	Top-5 acc 52.344 (52.240)	lr 0.00784
Warmup Train [30][2060/3239]	Time 0.373 (0.519)	Data 0.001 (0.014)	Loss 4.0568 (4.1063)	Top-1 acc 32.812 (29.058)	Top-5 acc 52.734 (52.237)	lr 0.00784
Warmup Train [30][2070/3239]	Time 0.497 (0.519)	Data 0.001 (0.014)	Loss 4.2816 (4.1063)	Top-1 acc 23.828 (29.056)	Top-5 acc 48.438 (52.236)	lr 0.00783
Warmup Train [30][2080/3239]	Time 0.522 (0.519)	Data 0.001 (0.014)	Loss 4.0393 (4.1064)	Top-1 acc 30.859 (29.055)	Top-5 acc 50.781 (52.234)	lr 0.00783
Warmup Train [30][2090/3239]	Time 0.540 (0.519)	Data 0.001 (0.014)	Loss 4.1434 (4.1064)	Top-1 acc 27.734 (29.049)	Top-5 acc 50.391 (52.235)	lr 0.00782
Warmup Train [30][2100/3239]	Time 0.630 (0.519)	Data 0.001 (0.013)	Loss 4.2327 (4.1064)	Top-1 acc 26.562 (29.053)	Top-5 acc 50.000 (52.235)	lr 0.00782
Warmup Train [30][2110/3239]	Time 0.427 (0.519)	Data 0.001 (0.013)	Loss 4.0531 (4.1062)	Top-1 acc 28.906 (29.053)	Top-5 acc 51.562 (52.231)	lr 0.00781
Warmup Train [30][2120/3239]	Time 0.490 (0.519)	Data 0.001 (0.013)	Loss 4.1044 (4.1065)	Top-1 acc 28.516 (29.048)	Top-5 acc 52.734 (52.227)	lr 0.00781
Warmup Train [30][2130/3239]	Time 0.419 (0.519)	Data 0.001 (0.013)	Loss 4.3965 (4.1070)	Top-1 acc 24.609 (29.037)	Top-5 acc 44.141 (52.214)	lr 0.00780
Warmup Train [30][2140/3239]	Time 0.743 (0.519)	Data 0.001 (0.013)	Loss 4.2270 (4.1073)	Top-1 acc 26.562 (29.030)	Top-5 acc 48.828 (52.210)	lr 0.00780
Warmup Train [30][2150/3239]	Time 0.407 (0.518)	Data 0.001 (0.013)	Loss 4.4410 (4.1074)	Top-1 acc 25.781 (29.032)	Top-5 acc 46.094 (52.207)	lr 0.00780
Warmup Train [30][2160/3239]	Time 0.691 (0.518)	Data 0.001 (0.013)	Loss 4.1367 (4.1074)	Top-1 acc 29.688 (29.030)	Top-5 acc 48.438 (52.209)	lr 0.00779
Warmup Train [30][2170/3239]	Time 0.456 (0.518)	Data 0.001 (0.013)	Loss 4.1602 (4.1073)	Top-1 acc 28.125 (29.036)	Top-5 acc 50.000 (52.207)	lr 0.00779
Warmup Train [30][2180/3239]	Time 0.456 (0.518)	Data 0.001 (0.013)	Loss 4.1387 (4.1074)	Top-1 acc 28.906 (29.034)	Top-5 acc 51.172 (52.198)	lr 0.00778
Warmup Train [30][2190/3239]	Time 0.486 (0.518)	Data 0.001 (0.013)	Loss 4.0095 (4.1076)	Top-1 acc 30.859 (29.029)	Top-5 acc 53.516 (52.193)	lr 0.00778
Warmup Train [30][2200/3239]	Time 0.611 (0.518)	Data 0.001 (0.013)	Loss 3.9981 (4.1076)	Top-1 acc 30.469 (29.028)	Top-5 acc 52.344 (52.194)	lr 0.00777
Warmup Train [30][2210/3239]	Time 0.452 (0.518)	Data 0.001 (0.013)	Loss 4.1757 (4.1074)	Top-1 acc 25.391 (29.028)	Top-5 acc 50.781 (52.199)	lr 0.00777
Warmup Train [30][2220/3239]	Time 0.480 (0.518)	Data 0.001 (0.013)	Loss 4.1573 (4.1075)	Top-1 acc 26.562 (29.022)	Top-5 acc 51.172 (52.195)	lr 0.00776
Warmup Train [30][2230/3239]	Time 0.446 (0.518)	Data 0.001 (0.013)	Loss 4.2508 (4.1074)	Top-1 acc 25.000 (29.026)	Top-5 acc 46.484 (52.202)	lr 0.00776
Warmup Train [30][2240/3239]	Time 0.668 (0.518)	Data 0.001 (0.013)	Loss 3.9853 (4.1073)	Top-1 acc 31.250 (29.030)	Top-5 acc 56.250 (52.202)	lr 0.00776
Warmup Train [30][2250/3239]	Time 0.496 (0.518)	Data 0.001 (0.013)	Loss 4.0303 (4.1072)	Top-1 acc 27.734 (29.028)	Top-5 acc 53.125 (52.200)	lr 0.00775
Warmup Train [30][2260/3239]	Time 0.450 (0.518)	Data 0.001 (0.013)	Loss 4.1210 (4.1076)	Top-1 acc 28.906 (29.025)	Top-5 acc 52.344 (52.190)	lr 0.00775
Warmup Train [30][2270/3239]	Time 0.562 (0.518)	Data 0.002 (0.013)	Loss 4.0832 (4.1076)	Top-1 acc 30.859 (29.033)	Top-5 acc 52.344 (52.192)	lr 0.00774
Warmup Train [30][2280/3239]	Time 0.516 (0.518)	Data 0.001 (0.013)	Loss 4.0310 (4.1077)	Top-1 acc 27.344 (29.030)	Top-5 acc 51.172 (52.188)	lr 0.00774
Warmup Train [30][2290/3239]	Time 0.473 (0.518)	Data 0.001 (0.013)	Loss 4.2447 (4.1079)	Top-1 acc 23.828 (29.026)	Top-5 acc 45.312 (52.182)	lr 0.00773
Warmup Train [30][2300/3239]	Time 0.395 (0.518)	Data 0.001 (0.013)	Loss 4.2184 (4.1079)	Top-1 acc 26.172 (29.025)	Top-5 acc 46.484 (52.181)	lr 0.00773
Warmup Train [30][2310/3239]	Time 0.537 (0.518)	Data 0.001 (0.013)	Loss 4.4445 (4.1082)	Top-1 acc 25.781 (29.024)	Top-5 acc 46.484 (52.175)	lr 0.00773
Warmup Train [30][2320/3239]	Time 0.494 (0.518)	Data 0.001 (0.013)	Loss 3.9972 (4.1080)	Top-1 acc 35.156 (29.031)	Top-5 acc 57.812 (52.179)	lr 0.00772
Warmup Train [30][2330/3239]	Time 0.583 (0.518)	Data 0.001 (0.013)	Loss 4.1382 (4.1082)	Top-1 acc 26.953 (29.028)	Top-5 acc 51.172 (52.178)	lr 0.00772
Warmup Train [30][2340/3239]	Time 0.472 (0.518)	Data 0.001 (0.013)	Loss 4.0153 (4.1082)	Top-1 acc 26.953 (29.024)	Top-5 acc 52.344 (52.177)	lr 0.00771
Warmup Train [30][2350/3239]	Time 0.514 (0.518)	Data 0.001 (0.013)	Loss 4.2041 (4.1082)	Top-1 acc 28.516 (29.023)	Top-5 acc 49.609 (52.178)	lr 0.00771
Warmup Train [30][2360/3239]	Time 0.467 (0.518)	Data 0.001 (0.013)	Loss 4.1631 (4.1083)	Top-1 acc 29.297 (29.023)	Top-5 acc 51.172 (52.175)	lr 0.00770
Warmup Train [30][2370/3239]	Time 0.398 (0.518)	Data 0.001 (0.013)	Loss 4.0529 (4.1086)	Top-1 acc 28.125 (29.018)	Top-5 acc 54.297 (52.170)	lr 0.00770
Warmup Train [30][2380/3239]	Time 0.363 (0.518)	Data 0.001 (0.013)	Loss 4.0362 (4.1084)	Top-1 acc 33.203 (29.024)	Top-5 acc 54.297 (52.172)	lr 0.00769
Warmup Train [30][2390/3239]	Time 0.462 (0.517)	Data 0.001 (0.013)	Loss 4.0769 (4.1085)	Top-1 acc 32.031 (29.023)	Top-5 acc 54.297 (52.169)	lr 0.00769
Warmup Train [30][2400/3239]	Time 0.404 (0.517)	Data 0.001 (0.013)	Loss 4.0449 (4.1084)	Top-1 acc 32.422 (29.023)	Top-5 acc 51.953 (52.166)	lr 0.00769
Warmup Train [30][2410/3239]	Time 0.414 (0.517)	Data 0.001 (0.013)	Loss 4.0656 (4.1085)	Top-1 acc 30.469 (29.023)	Top-5 acc 50.781 (52.165)	lr 0.00768
Warmup Train [30][2420/3239]	Time 0.496 (0.517)	Data 0.001 (0.013)	Loss 4.3149 (4.1088)	Top-1 acc 26.562 (29.018)	Top-5 acc 49.609 (52.157)	lr 0.00768
Warmup Train [30][2430/3239]	Time 0.509 (0.517)	Data 0.001 (0.013)	Loss 4.1849 (4.1088)	Top-1 acc 29.297 (29.018)	Top-5 acc 48.047 (52.157)	lr 0.00767
Warmup Train [30][2440/3239]	Time 0.406 (0.517)	Data 0.001 (0.012)	Loss 4.2037 (4.1087)	Top-1 acc 26.562 (29.016)	Top-5 acc 52.344 (52.158)	lr 0.00767
Warmup Train [30][2450/3239]	Time 0.425 (0.517)	Data 0.001 (0.012)	Loss 4.3937 (4.1086)	Top-1 acc 21.484 (29.018)	Top-5 acc 46.094 (52.160)	lr 0.00766
Warmup Train [30][2460/3239]	Time 0.625 (0.517)	Data 0.001 (0.012)	Loss 4.0892 (4.1086)	Top-1 acc 30.078 (29.015)	Top-5 acc 50.391 (52.163)	lr 0.00766
Warmup Train [30][2470/3239]	Time 0.435 (0.517)	Data 0.001 (0.012)	Loss 3.9782 (4.1084)	Top-1 acc 29.688 (29.021)	Top-5 acc 55.469 (52.167)	lr 0.00766
Warmup Train [30][2480/3239]	Time 0.543 (0.517)	Data 0.001 (0.012)	Loss 4.1189 (4.1086)	Top-1 acc 29.688 (29.017)	Top-5 acc 51.562 (52.162)	lr 0.00765
Warmup Train [30][2490/3239]	Time 0.544 (0.517)	Data 0.001 (0.012)	Loss 4.1087 (4.1085)	Top-1 acc 26.953 (29.020)	Top-5 acc 53.516 (52.163)	lr 0.00765
Warmup Train [30][2500/3239]	Time 0.618 (0.517)	Data 0.001 (0.012)	Loss 3.9607 (4.1082)	Top-1 acc 29.297 (29.026)	Top-5 acc 55.469 (52.169)	lr 0.00764
Warmup Train [30][2510/3239]	Time 0.342 (0.517)	Data 0.001 (0.012)	Loss 4.0122 (4.1080)	Top-1 acc 32.422 (29.029)	Top-5 acc 50.391 (52.178)	lr 0.00764
Warmup Train [30][2520/3239]	Time 0.525 (0.517)	Data 0.001 (0.012)	Loss 4.2413 (4.1080)	Top-1 acc 26.562 (29.029)	Top-5 acc 48.047 (52.175)	lr 0.00763
Warmup Train [30][2530/3239]	Time 0.441 (0.517)	Data 0.001 (0.012)	Loss 4.1180 (4.1080)	Top-1 acc 26.172 (29.023)	Top-5 acc 50.000 (52.172)	lr 0.00763
Warmup Train [30][2540/3239]	Time 0.454 (0.517)	Data 0.002 (0.012)	Loss 4.0609 (4.1080)	Top-1 acc 27.734 (29.019)	Top-5 acc 53.906 (52.172)	lr 0.00762
Warmup Train [30][2550/3239]	Time 0.536 (0.517)	Data 0.001 (0.012)	Loss 4.0635 (4.1079)	Top-1 acc 29.297 (29.020)	Top-5 acc 54.688 (52.176)	lr 0.00762
Warmup Train [30][2560/3239]	Time 0.522 (0.517)	Data 0.001 (0.012)	Loss 4.0446 (4.1077)	Top-1 acc 31.250 (29.026)	Top-5 acc 57.422 (52.179)	lr 0.00762
Warmup Train [30][2570/3239]	Time 0.390 (0.517)	Data 0.001 (0.012)	Loss 4.2056 (4.1078)	Top-1 acc 22.656 (29.021)	Top-5 acc 51.172 (52.172)	lr 0.00761
Warmup Train [30][2580/3239]	Time 0.346 (0.517)	Data 0.001 (0.012)	Loss 4.1982 (4.1077)	Top-1 acc 28.516 (29.025)	Top-5 acc 48.828 (52.177)	lr 0.00761
Warmup Train [30][2590/3239]	Time 0.556 (0.517)	Data 0.001 (0.012)	Loss 4.1074 (4.1079)	Top-1 acc 30.469 (29.022)	Top-5 acc 54.688 (52.174)	lr 0.00760
Warmup Train [30][2600/3239]	Time 0.542 (0.517)	Data 0.001 (0.012)	Loss 4.0514 (4.1079)	Top-1 acc 31.641 (29.021)	Top-5 acc 53.125 (52.173)	lr 0.00760
Warmup Train [30][2610/3239]	Time 0.573 (0.517)	Data 0.001 (0.012)	Loss 4.0177 (4.1078)	Top-1 acc 34.375 (29.024)	Top-5 acc 55.859 (52.175)	lr 0.00759
Warmup Train [30][2620/3239]	Time 0.579 (0.517)	Data 0.001 (0.012)	Loss 4.2017 (4.1077)	Top-1 acc 23.047 (29.021)	Top-5 acc 49.609 (52.174)	lr 0.00759
Warmup Train [30][2630/3239]	Time 0.457 (0.517)	Data 0.001 (0.012)	Loss 3.9960 (4.1079)	Top-1 acc 30.469 (29.017)	Top-5 acc 55.469 (52.171)	lr 0.00759
Warmup Train [30][2640/3239]	Time 0.610 (0.517)	Data 0.001 (0.012)	Loss 4.0964 (4.1078)	Top-1 acc 28.516 (29.020)	Top-5 acc 51.953 (52.175)	lr 0.00758
Warmup Train [30][2650/3239]	Time 0.527 (0.517)	Data 0.001 (0.012)	Loss 4.1436 (4.1076)	Top-1 acc 33.203 (29.026)	Top-5 acc 52.734 (52.181)	lr 0.00758
Warmup Train [30][2660/3239]	Time 0.265 (0.517)	Data 0.001 (0.012)	Loss 4.3542 (4.1077)	Top-1 acc 23.828 (29.021)	Top-5 acc 46.484 (52.178)	lr 0.00757
Warmup Train [30][2670/3239]	Time 0.567 (0.517)	Data 0.001 (0.012)	Loss 4.0817 (4.1076)	Top-1 acc 31.641 (29.020)	Top-5 acc 53.906 (52.181)	lr 0.00757
Warmup Train [30][2680/3239]	Time 0.716 (0.516)	Data 0.001 (0.012)	Loss 4.1930 (4.1074)	Top-1 acc 26.562 (29.025)	Top-5 acc 51.953 (52.186)	lr 0.00756
Warmup Train [30][2690/3239]	Time 0.573 (0.516)	Data 0.001 (0.012)	Loss 4.1192 (4.1074)	Top-1 acc 28.125 (29.030)	Top-5 acc 50.000 (52.185)	lr 0.00756
Warmup Train [30][2700/3239]	Time 0.557 (0.516)	Data 0.001 (0.012)	Loss 4.2166 (4.1074)	Top-1 acc 28.516 (29.028)	Top-5 acc 48.828 (52.181)	lr 0.00756
Warmup Train [30][2710/3239]	Time 0.447 (0.516)	Data 0.002 (0.012)	Loss 4.0227 (4.1075)	Top-1 acc 30.078 (29.028)	Top-5 acc 53.906 (52.176)	lr 0.00755
Warmup Train [30][2720/3239]	Time 0.541 (0.516)	Data 0.001 (0.012)	Loss 3.9924 (4.1075)	Top-1 acc 29.688 (29.027)	Top-5 acc 53.516 (52.179)	lr 0.00755
Warmup Train [30][2730/3239]	Time 0.631 (0.516)	Data 0.001 (0.012)	Loss 4.1011 (4.1076)	Top-1 acc 29.688 (29.022)	Top-5 acc 50.391 (52.180)	lr 0.00754
Warmup Train [30][2740/3239]	Time 0.291 (0.516)	Data 0.001 (0.012)	Loss 4.1459 (4.1077)	Top-1 acc 24.219 (29.017)	Top-5 acc 51.172 (52.176)	lr 0.00754
Warmup Train [30][2750/3239]	Time 0.521 (0.516)	Data 0.001 (0.012)	Loss 4.1550 (4.1077)	Top-1 acc 29.297 (29.017)	Top-5 acc 49.219 (52.179)	lr 0.00753
Warmup Train [30][2760/3239]	Time 0.484 (0.516)	Data 0.001 (0.012)	Loss 4.0507 (4.1076)	Top-1 acc 29.688 (29.017)	Top-5 acc 51.172 (52.179)	lr 0.00753
Warmup Train [30][2770/3239]	Time 0.505 (0.516)	Data 0.001 (0.012)	Loss 3.9021 (4.1073)	Top-1 acc 32.031 (29.020)	Top-5 acc 57.031 (52.183)	lr 0.00752
Warmup Train [30][2780/3239]	Time 0.669 (0.516)	Data 0.001 (0.012)	Loss 4.1766 (4.1074)	Top-1 acc 28.906 (29.018)	Top-5 acc 50.781 (52.184)	lr 0.00752
Warmup Train [30][2790/3239]	Time 0.579 (0.516)	Data 0.001 (0.012)	Loss 4.1602 (4.1076)	Top-1 acc 29.688 (29.017)	Top-5 acc 53.125 (52.181)	lr 0.00752
Warmup Train [30][2800/3239]	Time 0.415 (0.516)	Data 0.001 (0.012)	Loss 4.3388 (4.1076)	Top-1 acc 24.219 (29.013)	Top-5 acc 45.703 (52.174)	lr 0.00751
Warmup Train [30][2810/3239]	Time 0.510 (0.516)	Data 0.039 (0.012)	Loss 4.0368 (4.1073)	Top-1 acc 29.297 (29.019)	Top-5 acc 57.031 (52.182)	lr 0.00751
Warmup Train [30][2820/3239]	Time 0.576 (0.516)	Data 0.001 (0.012)	Loss 4.0204 (4.1073)	Top-1 acc 32.812 (29.023)	Top-5 acc 54.688 (52.182)	lr 0.00750
Warmup Train [30][2830/3239]	Time 0.508 (0.516)	Data 0.001 (0.012)	Loss 3.8671 (4.1073)	Top-1 acc 35.547 (29.027)	Top-5 acc 57.422 (52.181)	lr 0.00750
Warmup Train [30][2840/3239]	Time 0.526 (0.516)	Data 0.001 (0.012)	Loss 4.0435 (4.1074)	Top-1 acc 29.297 (29.025)	Top-5 acc 52.344 (52.179)	lr 0.00749
Warmup Train [30][2850/3239]	Time 0.581 (0.516)	Data 0.001 (0.012)	Loss 4.1624 (4.1072)	Top-1 acc 27.734 (29.033)	Top-5 acc 49.219 (52.184)	lr 0.00749
Warmup Train [30][2860/3239]	Time 0.343 (0.516)	Data 0.001 (0.012)	Loss 4.0859 (4.1072)	Top-1 acc 30.078 (29.034)	Top-5 acc 56.250 (52.186)	lr 0.00749
Warmup Train [30][2870/3239]	Time 0.524 (0.516)	Data 0.001 (0.012)	Loss 4.1705 (4.1074)	Top-1 acc 26.953 (29.032)	Top-5 acc 50.391 (52.183)	lr 0.00748
Warmup Train [30][2880/3239]	Time 0.622 (0.516)	Data 0.001 (0.012)	Loss 4.1693 (4.1073)	Top-1 acc 31.250 (29.034)	Top-5 acc 51.562 (52.181)	lr 0.00748
Warmup Train [30][2890/3239]	Time 0.427 (0.516)	Data 0.001 (0.012)	Loss 4.1160 (4.1072)	Top-1 acc 29.297 (29.036)	Top-5 acc 51.562 (52.182)	lr 0.00747
Warmup Train [30][2900/3239]	Time 0.637 (0.516)	Data 0.001 (0.012)	Loss 3.9745 (4.1072)	Top-1 acc 32.422 (29.035)	Top-5 acc 55.469 (52.185)	lr 0.00747
Warmup Train [30][2910/3239]	Time 0.659 (0.516)	Data 0.001 (0.011)	Loss 4.2184 (4.1074)	Top-1 acc 27.734 (29.030)	Top-5 acc 50.000 (52.181)	lr 0.00746
Warmup Train [30][2920/3239]	Time 0.369 (0.516)	Data 0.001 (0.011)	Loss 4.1100 (4.1074)	Top-1 acc 28.516 (29.026)	Top-5 acc 50.391 (52.179)	lr 0.00746
Warmup Train [30][2930/3239]	Time 0.512 (0.516)	Data 0.001 (0.011)	Loss 4.2205 (4.1072)	Top-1 acc 25.000 (29.033)	Top-5 acc 51.562 (52.184)	lr 0.00746
Warmup Train [30][2940/3239]	Time 0.430 (0.516)	Data 0.001 (0.011)	Loss 4.1943 (4.1071)	Top-1 acc 26.172 (29.032)	Top-5 acc 48.828 (52.182)	lr 0.00745
Warmup Train [30][2950/3239]	Time 0.476 (0.516)	Data 0.001 (0.011)	Loss 4.1514 (4.1071)	Top-1 acc 26.172 (29.032)	Top-5 acc 50.000 (52.180)	lr 0.00745
Warmup Train [30][2960/3239]	Time 0.506 (0.516)	Data 0.001 (0.011)	Loss 4.1962 (4.1072)	Top-1 acc 33.594 (29.034)	Top-5 acc 50.391 (52.178)	lr 0.00744
Warmup Train [30][2970/3239]	Time 0.372 (0.516)	Data 0.001 (0.011)	Loss 4.0603 (4.1071)	Top-1 acc 28.125 (29.042)	Top-5 acc 56.250 (52.182)	lr 0.00744
Warmup Train [30][2980/3239]	Time 0.485 (0.516)	Data 0.001 (0.011)	Loss 4.0571 (4.1072)	Top-1 acc 28.516 (29.041)	Top-5 acc 53.125 (52.179)	lr 0.00743
Warmup Train [30][2990/3239]	Time 0.584 (0.516)	Data 0.001 (0.011)	Loss 4.1867 (4.1072)	Top-1 acc 28.516 (29.038)	Top-5 acc 50.391 (52.177)	lr 0.00743
Warmup Train [30][3000/3239]	Time 0.636 (0.516)	Data 0.001 (0.011)	Loss 4.0858 (4.1074)	Top-1 acc 29.688 (29.032)	Top-5 acc 51.953 (52.176)	lr 0.00743
Warmup Train [30][3010/3239]	Time 0.476 (0.516)	Data 0.001 (0.011)	Loss 4.2802 (4.1074)	Top-1 acc 27.344 (29.035)	Top-5 acc 48.047 (52.177)	lr 0.00742
Warmup Train [30][3020/3239]	Time 0.519 (0.516)	Data 0.001 (0.011)	Loss 3.9392 (4.1071)	Top-1 acc 29.297 (29.038)	Top-5 acc 56.250 (52.182)	lr 0.00742
Warmup Train [30][3030/3239]	Time 0.471 (0.516)	Data 0.001 (0.011)	Loss 4.3133 (4.1073)	Top-1 acc 24.219 (29.036)	Top-5 acc 49.609 (52.177)	lr 0.00741
Warmup Train [30][3040/3239]	Time 0.492 (0.516)	Data 0.001 (0.011)	Loss 4.0523 (4.1073)	Top-1 acc 30.859 (29.037)	Top-5 acc 52.344 (52.174)	lr 0.00741
Warmup Train [30][3050/3239]	Time 0.465 (0.515)	Data 0.001 (0.011)	Loss 4.2214 (4.1072)	Top-1 acc 26.953 (29.042)	Top-5 acc 50.000 (52.176)	lr 0.00740
Warmup Train [30][3060/3239]	Time 0.471 (0.516)	Data 0.001 (0.011)	Loss 4.0808 (4.1075)	Top-1 acc 26.953 (29.033)	Top-5 acc 52.734 (52.170)	lr 0.00740
Warmup Train [30][3070/3239]	Time 0.475 (0.516)	Data 0.001 (0.011)	Loss 4.0640 (4.1075)	Top-1 acc 27.344 (29.032)	Top-5 acc 52.344 (52.170)	lr 0.00740
Warmup Train [30][3080/3239]	Time 0.358 (0.515)	Data 0.001 (0.011)	Loss 4.0623 (4.1074)	Top-1 acc 29.297 (29.037)	Top-5 acc 51.953 (52.168)	lr 0.00739
Warmup Train [30][3090/3239]	Time 0.522 (0.515)	Data 0.001 (0.011)	Loss 4.0439 (4.1073)	Top-1 acc 31.641 (29.040)	Top-5 acc 57.422 (52.169)	lr 0.00739
Warmup Train [30][3100/3239]	Time 0.352 (0.515)	Data 0.002 (0.011)	Loss 3.9867 (4.1071)	Top-1 acc 27.344 (29.045)	Top-5 acc 54.297 (52.174)	lr 0.00738
Warmup Train [30][3110/3239]	Time 0.504 (0.515)	Data 0.001 (0.011)	Loss 3.9813 (4.1070)	Top-1 acc 32.812 (29.049)	Top-5 acc 55.078 (52.179)	lr 0.00738
Warmup Train [30][3120/3239]	Time 0.444 (0.515)	Data 0.001 (0.011)	Loss 4.0193 (4.1070)	Top-1 acc 30.078 (29.047)	Top-5 acc 54.297 (52.179)	lr 0.00737
Warmup Train [30][3130/3239]	Time 0.690 (0.516)	Data 0.001 (0.011)	Loss 4.1460 (4.1069)	Top-1 acc 28.516 (29.049)	Top-5 acc 49.609 (52.178)	lr 0.00737
Warmup Train [30][3140/3239]	Time 0.570 (0.516)	Data 0.001 (0.011)	Loss 4.1370 (4.1070)	Top-1 acc 23.828 (29.045)	Top-5 acc 54.688 (52.175)	lr 0.00737
Warmup Train [30][3150/3239]	Time 0.534 (0.515)	Data 0.001 (0.011)	Loss 4.0737 (4.1069)	Top-1 acc 30.469 (29.044)	Top-5 acc 52.734 (52.180)	lr 0.00736
Warmup Train [30][3160/3239]	Time 0.549 (0.515)	Data 0.001 (0.011)	Loss 4.2330 (4.1068)	Top-1 acc 25.781 (29.050)	Top-5 acc 49.609 (52.185)	lr 0.00736
Warmup Train [30][3170/3239]	Time 0.519 (0.515)	Data 0.001 (0.011)	Loss 4.0290 (4.1069)	Top-1 acc 27.734 (29.047)	Top-5 acc 52.734 (52.183)	lr 0.00735
Warmup Train [30][3180/3239]	Time 0.478 (0.515)	Data 0.000 (0.011)	Loss 4.1891 (4.1070)	Top-1 acc 30.078 (29.047)	Top-5 acc 49.609 (52.178)	lr 0.00735
Warmup Train [30][3190/3239]	Time 0.450 (0.515)	Data 0.000 (0.011)	Loss 4.0899 (4.1070)	Top-1 acc 28.516 (29.046)	Top-5 acc 53.125 (52.179)	lr 0.00734
Warmup Train [30][3200/3239]	Time 0.378 (0.515)	Data 0.000 (0.011)	Loss 4.1554 (4.1070)	Top-1 acc 26.172 (29.044)	Top-5 acc 55.078 (52.179)	lr 0.00734
Warmup Train [30][3210/3239]	Time 0.373 (0.515)	Data 0.000 (0.011)	Loss 4.0446 (4.1070)	Top-1 acc 30.469 (29.048)	Top-5 acc 53.516 (52.177)	lr 0.00734
Warmup Train [30][3220/3239]	Time 0.406 (0.515)	Data 0.000 (0.011)	Loss 4.1112 (4.1071)	Top-1 acc 24.609 (29.047)	Top-5 acc 51.562 (52.174)	lr 0.00733
Warmup Train [30][3230/3239]	Time 0.563 (0.515)	Data 0.000 (0.011)	Loss 4.0835 (4.1071)	Top-1 acc 27.344 (29.047)	Top-5 acc 53.906 (52.174)	lr 0.00733
Warmup Train [30][3239/3239]	Time 0.364 (0.515)	Data 0.000 (0.011)	Loss 3.8005 (4.1070)	Top-1 acc 38.272 (29.054)	Top-5 acc 62.963 (52.178)	lr 0.00732
==========Warmup Valid [30/40]	loss 3.059	top-1 acc 36.501	top-5 acc 61.341	Train top-1 29.054	top-5 52.178	flops: 442.4M
Warmup Train [31][0/3239]	Time 21.702 (21.702)	Data 18.928 (18.928)	Loss 4.0449 (4.0449)	Top-1 acc 33.203 (33.203)	Top-5 acc 53.125 (53.125)	lr 0.00732
Warmup Train [31][10/3239]	Time 0.549 (2.466)	Data 0.001 (1.726)	Loss 4.1045 (4.0785)	Top-1 acc 27.344 (30.114)	Top-5 acc 55.078 (53.089)	lr 0.00732
Warmup Train [31][20/3239]	Time 0.498 (1.539)	Data 0.001 (0.905)	Loss 4.3344 (4.0883)	Top-1 acc 27.344 (30.022)	Top-5 acc 46.484 (52.976)	lr 0.00731
Warmup Train [31][30/3239]	Time 0.672 (1.207)	Data 0.001 (0.614)	Loss 4.1175 (4.0700)	Top-1 acc 28.125 (30.103)	Top-5 acc 53.125 (53.478)	lr 0.00731
Warmup Train [31][40/3239]	Time 0.547 (1.026)	Data 0.001 (0.465)	Loss 4.0555 (4.0739)	Top-1 acc 29.688 (29.859)	Top-5 acc 52.344 (53.249)	lr 0.00731
Warmup Train [31][50/3239]	Time 0.435 (0.921)	Data 0.001 (0.376)	Loss 4.0596 (4.0784)	Top-1 acc 30.859 (29.695)	Top-5 acc 56.250 (53.018)	lr 0.00730
Warmup Train [31][60/3239]	Time 0.439 (0.847)	Data 0.001 (0.317)	Loss 4.1215 (4.0842)	Top-1 acc 26.562 (29.553)	Top-5 acc 51.172 (53.087)	lr 0.00730
Warmup Train [31][70/3239]	Time 0.604 (0.797)	Data 0.001 (0.273)	Loss 4.2474 (4.0919)	Top-1 acc 27.344 (29.440)	Top-5 acc 46.875 (52.828)	lr 0.00729
Warmup Train [31][80/3239]	Time 0.455 (0.756)	Data 0.001 (0.241)	Loss 4.1152 (4.0876)	Top-1 acc 30.859 (29.543)	Top-5 acc 51.172 (53.009)	lr 0.00729
Warmup Train [31][90/3239]	Time 0.514 (0.731)	Data 0.001 (0.216)	Loss 4.0701 (4.0769)	Top-1 acc 29.297 (29.713)	Top-5 acc 51.953 (53.125)	lr 0.00728
Warmup Train [31][100/3239]	Time 0.476 (0.710)	Data 0.001 (0.195)	Loss 4.0023 (4.0771)	Top-1 acc 27.734 (29.668)	Top-5 acc 53.516 (53.048)	lr 0.00728
Warmup Train [31][110/3239]	Time 0.599 (0.692)	Data 0.001 (0.177)	Loss 3.9356 (4.0790)	Top-1 acc 30.469 (29.684)	Top-5 acc 55.078 (53.079)	lr 0.00728
Warmup Train [31][120/3239]	Time 0.555 (0.679)	Data 0.001 (0.163)	Loss 3.9289 (4.0755)	Top-1 acc 32.031 (29.749)	Top-5 acc 56.641 (53.170)	lr 0.00727
Warmup Train [31][130/3239]	Time 0.472 (0.667)	Data 0.001 (0.151)	Loss 3.7499 (4.0719)	Top-1 acc 37.500 (29.729)	Top-5 acc 63.281 (53.268)	lr 0.00727
Warmup Train [31][140/3239]	Time 0.575 (0.657)	Data 0.001 (0.140)	Loss 4.2212 (4.0764)	Top-1 acc 27.344 (29.629)	Top-5 acc 51.562 (53.119)	lr 0.00726
Warmup Train [31][150/3239]	Time 0.455 (0.648)	Data 0.001 (0.131)	Loss 3.9519 (4.0761)	Top-1 acc 30.078 (29.610)	Top-5 acc 51.562 (53.045)	lr 0.00726
Warmup Train [31][160/3239]	Time 0.465 (0.640)	Data 0.001 (0.123)	Loss 4.1404 (4.0808)	Top-1 acc 30.469 (29.571)	Top-5 acc 53.906 (53.009)	lr 0.00725
Warmup Train [31][170/3239]	Time 0.538 (0.632)	Data 0.001 (0.116)	Loss 4.1027 (4.0842)	Top-1 acc 29.297 (29.448)	Top-5 acc 51.953 (52.899)	lr 0.00725
Warmup Train [31][180/3239]	Time 0.411 (0.624)	Data 0.001 (0.110)	Loss 4.4096 (4.0874)	Top-1 acc 21.875 (29.372)	Top-5 acc 43.750 (52.855)	lr 0.00725
Warmup Train [31][190/3239]	Time 0.489 (0.618)	Data 0.001 (0.105)	Loss 3.9683 (4.0869)	Top-1 acc 30.859 (29.458)	Top-5 acc 53.906 (52.826)	lr 0.00724
Warmup Train [31][200/3239]	Time 0.333 (0.613)	Data 0.001 (0.100)	Loss 3.9059 (4.0859)	Top-1 acc 34.375 (29.480)	Top-5 acc 56.250 (52.841)	lr 0.00724
Warmup Train [31][210/3239]	Time 0.663 (0.608)	Data 0.001 (0.096)	Loss 4.2421 (4.0883)	Top-1 acc 29.297 (29.430)	Top-5 acc 49.219 (52.801)	lr 0.00723
Warmup Train [31][220/3239]	Time 0.646 (0.604)	Data 0.001 (0.091)	Loss 4.1848 (4.0886)	Top-1 acc 25.391 (29.391)	Top-5 acc 51.953 (52.770)	lr 0.00723
Warmup Train [31][230/3239]	Time 0.606 (0.601)	Data 0.001 (0.087)	Loss 4.1416 (4.0892)	Top-1 acc 27.734 (29.447)	Top-5 acc 50.781 (52.729)	lr 0.00722
Warmup Train [31][240/3239]	Time 0.621 (0.598)	Data 0.001 (0.084)	Loss 4.0277 (4.0885)	Top-1 acc 28.125 (29.423)	Top-5 acc 53.125 (52.741)	lr 0.00722
Warmup Train [31][250/3239]	Time 0.545 (0.594)	Data 0.001 (0.081)	Loss 4.0191 (4.0877)	Top-1 acc 29.297 (29.443)	Top-5 acc 51.953 (52.778)	lr 0.00722
Warmup Train [31][260/3239]	Time 0.474 (0.591)	Data 0.001 (0.078)	Loss 4.0030 (4.0894)	Top-1 acc 30.469 (29.408)	Top-5 acc 51.953 (52.698)	lr 0.00721
Warmup Train [31][270/3239]	Time 0.495 (0.588)	Data 0.001 (0.075)	Loss 4.0474 (4.0895)	Top-1 acc 30.469 (29.398)	Top-5 acc 53.125 (52.701)	lr 0.00721
Warmup Train [31][280/3239]	Time 0.575 (0.585)	Data 0.001 (0.072)	Loss 4.0745 (4.0917)	Top-1 acc 31.250 (29.352)	Top-5 acc 55.078 (52.661)	lr 0.00720
Warmup Train [31][290/3239]	Time 0.455 (0.583)	Data 0.001 (0.070)	Loss 4.1108 (4.0936)	Top-1 acc 28.906 (29.325)	Top-5 acc 50.781 (52.615)	lr 0.00720
Warmup Train [31][300/3239]	Time 0.383 (0.579)	Data 0.001 (0.068)	Loss 4.1270 (4.0904)	Top-1 acc 30.859 (29.403)	Top-5 acc 49.609 (52.702)	lr 0.00719
Warmup Train [31][310/3239]	Time 0.603 (0.577)	Data 0.001 (0.066)	Loss 4.3101 (4.0896)	Top-1 acc 25.391 (29.419)	Top-5 acc 46.875 (52.729)	lr 0.00719
Warmup Train [31][320/3239]	Time 0.417 (0.574)	Data 0.001 (0.064)	Loss 4.2101 (4.0887)	Top-1 acc 24.609 (29.425)	Top-5 acc 53.125 (52.755)	lr 0.00719
Warmup Train [31][330/3239]	Time 0.328 (0.572)	Data 0.001 (0.063)	Loss 3.8461 (4.0885)	Top-1 acc 32.422 (29.400)	Top-5 acc 55.469 (52.719)	lr 0.00718
Warmup Train [31][340/3239]	Time 0.521 (0.570)	Data 0.001 (0.061)	Loss 4.1127 (4.0862)	Top-1 acc 30.469 (29.423)	Top-5 acc 52.734 (52.754)	lr 0.00718
Warmup Train [31][350/3239]	Time 0.468 (0.568)	Data 0.001 (0.060)	Loss 4.0906 (4.0874)	Top-1 acc 29.297 (29.374)	Top-5 acc 51.172 (52.702)	lr 0.00717
Warmup Train [31][360/3239]	Time 0.682 (0.564)	Data 0.001 (0.058)	Loss 4.1942 (4.0903)	Top-1 acc 28.516 (29.323)	Top-5 acc 51.172 (52.627)	lr 0.00717
Warmup Train [31][370/3239]	Time 0.338 (0.562)	Data 0.001 (0.056)	Loss 4.2696 (4.0910)	Top-1 acc 27.344 (29.348)	Top-5 acc 50.391 (52.606)	lr 0.00716
Warmup Train [31][380/3239]	Time 0.506 (0.561)	Data 0.001 (0.055)	Loss 4.2699 (4.0922)	Top-1 acc 25.000 (29.316)	Top-5 acc 48.047 (52.572)	lr 0.00716
Warmup Train [31][390/3239]	Time 0.355 (0.560)	Data 0.001 (0.054)	Loss 3.9492 (4.0920)	Top-1 acc 33.203 (29.348)	Top-5 acc 57.031 (52.590)	lr 0.00716
Warmup Train [31][400/3239]	Time 0.654 (0.559)	Data 0.001 (0.053)	Loss 3.9549 (4.0916)	Top-1 acc 30.078 (29.355)	Top-5 acc 53.516 (52.585)	lr 0.00715
Warmup Train [31][410/3239]	Time 0.551 (0.559)	Data 0.001 (0.052)	Loss 4.1149 (4.0921)	Top-1 acc 29.297 (29.332)	Top-5 acc 50.000 (52.564)	lr 0.00715
Warmup Train [31][420/3239]	Time 0.605 (0.557)	Data 0.001 (0.051)	Loss 4.1520 (4.0928)	Top-1 acc 31.641 (29.334)	Top-5 acc 52.734 (52.556)	lr 0.00714
Warmup Train [31][430/3239]	Time 0.547 (0.557)	Data 0.001 (0.049)	Loss 4.0025 (4.0919)	Top-1 acc 32.812 (29.344)	Top-5 acc 52.344 (52.593)	lr 0.00714
Warmup Train [31][440/3239]	Time 0.728 (0.556)	Data 0.001 (0.048)	Loss 4.2112 (4.0919)	Top-1 acc 26.953 (29.339)	Top-5 acc 51.562 (52.583)	lr 0.00713
Warmup Train [31][450/3239]	Time 0.414 (0.555)	Data 0.001 (0.047)	Loss 4.1911 (4.0917)	Top-1 acc 27.344 (29.335)	Top-5 acc 51.172 (52.595)	lr 0.00713
Warmup Train [31][460/3239]	Time 0.456 (0.554)	Data 0.001 (0.047)	Loss 4.1652 (4.0916)	Top-1 acc 28.906 (29.366)	Top-5 acc 50.781 (52.589)	lr 0.00713
Warmup Train [31][470/3239]	Time 0.355 (0.553)	Data 0.001 (0.046)	Loss 4.2988 (4.0921)	Top-1 acc 26.562 (29.341)	Top-5 acc 48.828 (52.581)	lr 0.00712
Warmup Train [31][480/3239]	Time 0.443 (0.553)	Data 0.001 (0.045)	Loss 3.9874 (4.0929)	Top-1 acc 27.344 (29.328)	Top-5 acc 51.953 (52.577)	lr 0.00712
Warmup Train [31][490/3239]	Time 0.459 (0.552)	Data 0.001 (0.045)	Loss 3.9252 (4.0919)	Top-1 acc 35.156 (29.359)	Top-5 acc 55.078 (52.584)	lr 0.00711
Warmup Train [31][500/3239]	Time 0.340 (0.551)	Data 0.001 (0.044)	Loss 4.1656 (4.0931)	Top-1 acc 28.906 (29.348)	Top-5 acc 51.953 (52.574)	lr 0.00711
Warmup Train [31][510/3239]	Time 0.532 (0.551)	Data 0.001 (0.044)	Loss 4.0770 (4.0920)	Top-1 acc 30.078 (29.373)	Top-5 acc 55.859 (52.614)	lr 0.00711
Warmup Train [31][520/3239]	Time 0.527 (0.549)	Data 0.001 (0.043)	Loss 4.0730 (4.0915)	Top-1 acc 28.516 (29.383)	Top-5 acc 51.953 (52.615)	lr 0.00710
Warmup Train [31][530/3239]	Time 0.650 (0.549)	Data 0.001 (0.042)	Loss 4.1694 (4.0916)	Top-1 acc 31.641 (29.412)	Top-5 acc 53.516 (52.619)	lr 0.00710
Warmup Train [31][540/3239]	Time 0.641 (0.548)	Data 0.001 (0.042)	Loss 4.2724 (4.0920)	Top-1 acc 26.172 (29.391)	Top-5 acc 47.266 (52.600)	lr 0.00709
Warmup Train [31][550/3239]	Time 0.630 (0.547)	Data 0.001 (0.041)	Loss 4.1842 (4.0925)	Top-1 acc 29.688 (29.390)	Top-5 acc 49.609 (52.589)	lr 0.00709
Warmup Train [31][560/3239]	Time 0.394 (0.546)	Data 0.001 (0.040)	Loss 3.9031 (4.0924)	Top-1 acc 35.156 (29.380)	Top-5 acc 56.250 (52.596)	lr 0.00708
Warmup Train [31][570/3239]	Time 0.462 (0.546)	Data 0.002 (0.040)	Loss 4.1462 (4.0923)	Top-1 acc 28.125 (29.387)	Top-5 acc 50.391 (52.595)	lr 0.00708
Warmup Train [31][580/3239]	Time 0.532 (0.546)	Data 0.001 (0.039)	Loss 4.2210 (4.0923)	Top-1 acc 26.953 (29.376)	Top-5 acc 45.312 (52.574)	lr 0.00708
Warmup Train [31][590/3239]	Time 0.554 (0.545)	Data 0.001 (0.038)	Loss 4.0562 (4.0924)	Top-1 acc 32.031 (29.372)	Top-5 acc 54.688 (52.568)	lr 0.00707
Warmup Train [31][600/3239]	Time 0.550 (0.544)	Data 0.001 (0.038)	Loss 4.1453 (4.0919)	Top-1 acc 30.078 (29.380)	Top-5 acc 53.516 (52.587)	lr 0.00707
Warmup Train [31][610/3239]	Time 0.532 (0.543)	Data 0.001 (0.037)	Loss 4.0524 (4.0921)	Top-1 acc 28.516 (29.356)	Top-5 acc 51.953 (52.591)	lr 0.00706
Warmup Train [31][620/3239]	Time 0.370 (0.542)	Data 0.001 (0.037)	Loss 4.1056 (4.0926)	Top-1 acc 30.859 (29.334)	Top-5 acc 53.906 (52.582)	lr 0.00706
Warmup Train [31][630/3239]	Time 0.361 (0.541)	Data 0.001 (0.036)	Loss 3.9015 (4.0928)	Top-1 acc 33.203 (29.330)	Top-5 acc 57.031 (52.569)	lr 0.00705
Warmup Train [31][640/3239]	Time 0.610 (0.540)	Data 0.001 (0.036)	Loss 4.0261 (4.0924)	Top-1 acc 28.125 (29.334)	Top-5 acc 53.125 (52.579)	lr 0.00705
Warmup Train [31][650/3239]	Time 0.649 (0.540)	Data 0.001 (0.036)	Loss 4.1382 (4.0924)	Top-1 acc 26.562 (29.328)	Top-5 acc 50.391 (52.576)	lr 0.00705
Warmup Train [31][660/3239]	Time 0.542 (0.540)	Data 0.002 (0.035)	Loss 4.2298 (4.0920)	Top-1 acc 27.734 (29.339)	Top-5 acc 47.266 (52.574)	lr 0.00704
Warmup Train [31][670/3239]	Time 0.483 (0.540)	Data 0.001 (0.035)	Loss 4.2365 (4.0919)	Top-1 acc 26.172 (29.346)	Top-5 acc 47.656 (52.571)	lr 0.00704
Warmup Train [31][680/3239]	Time 0.423 (0.539)	Data 0.001 (0.034)	Loss 3.7990 (4.0904)	Top-1 acc 34.766 (29.369)	Top-5 acc 59.766 (52.597)	lr 0.00703
Warmup Train [31][690/3239]	Time 0.443 (0.539)	Data 0.001 (0.034)	Loss 4.1983 (4.0910)	Top-1 acc 29.688 (29.362)	Top-5 acc 52.734 (52.604)	lr 0.00703
Warmup Train [31][700/3239]	Time 0.498 (0.539)	Data 0.001 (0.034)	Loss 4.0619 (4.0904)	Top-1 acc 26.172 (29.367)	Top-5 acc 51.953 (52.601)	lr 0.00702
Warmup Train [31][710/3239]	Time 0.445 (0.539)	Data 0.001 (0.033)	Loss 4.2742 (4.0902)	Top-1 acc 28.125 (29.358)	Top-5 acc 47.656 (52.605)	lr 0.00702
Warmup Train [31][720/3239]	Time 0.445 (0.538)	Data 0.001 (0.033)	Loss 3.7681 (4.0897)	Top-1 acc 34.375 (29.356)	Top-5 acc 60.547 (52.615)	lr 0.00702
Warmup Train [31][730/3239]	Time 0.502 (0.538)	Data 0.001 (0.032)	Loss 3.9866 (4.0894)	Top-1 acc 30.859 (29.362)	Top-5 acc 56.250 (52.625)	lr 0.00701
Warmup Train [31][740/3239]	Time 0.504 (0.537)	Data 0.001 (0.032)	Loss 4.1664 (4.0897)	Top-1 acc 28.125 (29.357)	Top-5 acc 46.094 (52.616)	lr 0.00701
Warmup Train [31][750/3239]	Time 0.427 (0.537)	Data 0.001 (0.032)	Loss 4.1747 (4.0891)	Top-1 acc 27.734 (29.370)	Top-5 acc 46.875 (52.633)	lr 0.00700
Warmup Train [31][760/3239]	Time 0.385 (0.537)	Data 0.001 (0.031)	Loss 3.9437 (4.0890)	Top-1 acc 34.375 (29.388)	Top-5 acc 56.250 (52.627)	lr 0.00700
Warmup Train [31][770/3239]	Time 0.431 (0.537)	Data 0.001 (0.031)	Loss 3.9292 (4.0883)	Top-1 acc 32.031 (29.392)	Top-5 acc 56.250 (52.633)	lr 0.00700
Warmup Train [31][780/3239]	Time 0.555 (0.536)	Data 0.001 (0.031)	Loss 4.0879 (4.0882)	Top-1 acc 32.422 (29.394)	Top-5 acc 50.000 (52.630)	lr 0.00699
Warmup Train [31][790/3239]	Time 0.463 (0.536)	Data 0.001 (0.031)	Loss 4.1349 (4.0882)	Top-1 acc 26.172 (29.398)	Top-5 acc 50.391 (52.644)	lr 0.00699
Warmup Train [31][800/3239]	Time 0.607 (0.536)	Data 0.001 (0.030)	Loss 3.8827 (4.0878)	Top-1 acc 37.891 (29.421)	Top-5 acc 58.984 (52.654)	lr 0.00698
Warmup Train [31][810/3239]	Time 0.420 (0.535)	Data 0.002 (0.030)	Loss 4.1576 (4.0888)	Top-1 acc 25.000 (29.393)	Top-5 acc 53.516 (52.639)	lr 0.00698
Warmup Train [31][820/3239]	Time 0.478 (0.535)	Data 0.001 (0.030)	Loss 4.1215 (4.0888)	Top-1 acc 26.953 (29.400)	Top-5 acc 52.344 (52.640)	lr 0.00697
Warmup Train [31][830/3239]	Time 0.582 (0.535)	Data 0.001 (0.030)	Loss 4.0226 (4.0886)	Top-1 acc 33.203 (29.410)	Top-5 acc 55.078 (52.646)	lr 0.00697
Warmup Train [31][840/3239]	Time 0.714 (0.535)	Data 0.001 (0.029)	Loss 3.9999 (4.0884)	Top-1 acc 30.859 (29.426)	Top-5 acc 55.469 (52.661)	lr 0.00697
Warmup Train [31][850/3239]	Time 0.434 (0.535)	Data 0.001 (0.029)	Loss 4.1322 (4.0878)	Top-1 acc 32.422 (29.438)	Top-5 acc 52.344 (52.688)	lr 0.00696
Warmup Train [31][860/3239]	Time 0.349 (0.534)	Data 0.001 (0.029)	Loss 4.1345 (4.0880)	Top-1 acc 28.125 (29.433)	Top-5 acc 50.000 (52.679)	lr 0.00696
Warmup Train [31][870/3239]	Time 0.447 (0.534)	Data 0.001 (0.029)	Loss 4.0970 (4.0882)	Top-1 acc 27.734 (29.432)	Top-5 acc 50.391 (52.664)	lr 0.00695
Warmup Train [31][880/3239]	Time 0.405 (0.534)	Data 0.001 (0.028)	Loss 4.0041 (4.0883)	Top-1 acc 32.812 (29.425)	Top-5 acc 55.469 (52.667)	lr 0.00695
Warmup Train [31][890/3239]	Time 0.464 (0.534)	Data 0.001 (0.028)	Loss 4.0024 (4.0879)	Top-1 acc 27.344 (29.422)	Top-5 acc 57.031 (52.687)	lr 0.00695
Warmup Train [31][900/3239]	Time 0.477 (0.533)	Data 0.001 (0.028)	Loss 4.0413 (4.0880)	Top-1 acc 30.078 (29.414)	Top-5 acc 51.562 (52.684)	lr 0.00694
Warmup Train [31][910/3239]	Time 0.557 (0.533)	Data 0.001 (0.028)	Loss 3.9013 (4.0878)	Top-1 acc 35.547 (29.417)	Top-5 acc 57.422 (52.693)	lr 0.00694
Warmup Train [31][920/3239]	Time 0.615 (0.532)	Data 0.001 (0.028)	Loss 4.1291 (4.0878)	Top-1 acc 25.781 (29.423)	Top-5 acc 48.047 (52.692)	lr 0.00693
Warmup Train [31][930/3239]	Time 0.549 (0.532)	Data 0.002 (0.027)	Loss 4.3037 (4.0886)	Top-1 acc 23.828 (29.408)	Top-5 acc 50.391 (52.682)	lr 0.00693
Warmup Train [31][940/3239]	Time 0.676 (0.532)	Data 0.001 (0.027)	Loss 4.1157 (4.0890)	Top-1 acc 26.953 (29.404)	Top-5 acc 51.953 (52.670)	lr 0.00692
Warmup Train [31][950/3239]	Time 0.669 (0.532)	Data 0.002 (0.027)	Loss 3.9197 (4.0893)	Top-1 acc 33.594 (29.403)	Top-5 acc 60.938 (52.662)	lr 0.00692
Warmup Train [31][960/3239]	Time 0.522 (0.531)	Data 0.001 (0.027)	Loss 4.0935 (4.0896)	Top-1 acc 28.516 (29.403)	Top-5 acc 53.516 (52.661)	lr 0.00692
Warmup Train [31][970/3239]	Time 0.567 (0.532)	Data 0.001 (0.026)	Loss 4.1188 (4.0904)	Top-1 acc 26.172 (29.382)	Top-5 acc 49.219 (52.634)	lr 0.00691
Warmup Train [31][980/3239]	Time 0.383 (0.531)	Data 0.027 (0.026)	Loss 4.0607 (4.0901)	Top-1 acc 30.859 (29.384)	Top-5 acc 50.391 (52.640)	lr 0.00691
Warmup Train [31][990/3239]	Time 0.559 (0.531)	Data 0.001 (0.026)	Loss 4.0248 (4.0905)	Top-1 acc 34.375 (29.382)	Top-5 acc 52.734 (52.628)	lr 0.00690
Warmup Train [31][1000/3239]	Time 0.578 (0.531)	Data 0.001 (0.026)	Loss 3.9348 (4.0908)	Top-1 acc 30.469 (29.360)	Top-5 acc 57.812 (52.620)	lr 0.00690
Warmup Train [31][1010/3239]	Time 0.487 (0.531)	Data 0.001 (0.026)	Loss 4.0942 (4.0910)	Top-1 acc 28.125 (29.354)	Top-5 acc 51.562 (52.617)	lr 0.00689
Warmup Train [31][1020/3239]	Time 0.673 (0.531)	Data 0.001 (0.025)	Loss 4.1410 (4.0910)	Top-1 acc 28.906 (29.356)	Top-5 acc 48.828 (52.618)	lr 0.00689
Warmup Train [31][1030/3239]	Time 0.486 (0.531)	Data 0.001 (0.025)	Loss 4.1570 (4.0910)	Top-1 acc 30.859 (29.369)	Top-5 acc 51.562 (52.617)	lr 0.00689
Warmup Train [31][1040/3239]	Time 0.469 (0.531)	Data 0.001 (0.025)	Loss 3.9685 (4.0913)	Top-1 acc 31.641 (29.367)	Top-5 acc 57.031 (52.609)	lr 0.00688
Warmup Train [31][1050/3239]	Time 0.549 (0.530)	Data 0.001 (0.025)	Loss 3.9993 (4.0916)	Top-1 acc 30.469 (29.364)	Top-5 acc 53.125 (52.600)	lr 0.00688
Warmup Train [31][1060/3239]	Time 0.403 (0.530)	Data 0.001 (0.025)	Loss 4.1314 (4.0914)	Top-1 acc 29.297 (29.375)	Top-5 acc 52.734 (52.606)	lr 0.00687
Warmup Train [31][1070/3239]	Time 0.535 (0.530)	Data 0.002 (0.025)	Loss 3.9697 (4.0920)	Top-1 acc 33.594 (29.356)	Top-5 acc 54.688 (52.581)	lr 0.00687
Warmup Train [31][1080/3239]	Time 0.474 (0.530)	Data 0.001 (0.024)	Loss 3.9418 (4.0923)	Top-1 acc 32.422 (29.356)	Top-5 acc 56.641 (52.574)	lr 0.00687
Warmup Train [31][1090/3239]	Time 0.467 (0.530)	Data 0.001 (0.024)	Loss 3.9354 (4.0915)	Top-1 acc 27.734 (29.367)	Top-5 acc 55.078 (52.594)	lr 0.00686
Warmup Train [31][1100/3239]	Time 0.518 (0.530)	Data 0.002 (0.024)	Loss 4.2242 (4.0920)	Top-1 acc 24.609 (29.356)	Top-5 acc 46.875 (52.584)	lr 0.00686
Warmup Train [31][1110/3239]	Time 0.553 (0.530)	Data 0.001 (0.024)	Loss 3.8670 (4.0919)	Top-1 acc 35.938 (29.359)	Top-5 acc 57.031 (52.590)	lr 0.00685
Warmup Train [31][1120/3239]	Time 0.563 (0.530)	Data 0.001 (0.024)	Loss 4.1714 (4.0913)	Top-1 acc 28.906 (29.374)	Top-5 acc 46.875 (52.606)	lr 0.00685
Warmup Train [31][1130/3239]	Time 0.305 (0.529)	Data 0.001 (0.023)	Loss 4.0933 (4.0915)	Top-1 acc 31.641 (29.366)	Top-5 acc 53.906 (52.603)	lr 0.00684
Warmup Train [31][1140/3239]	Time 0.466 (0.529)	Data 0.001 (0.023)	Loss 3.9516 (4.0914)	Top-1 acc 30.469 (29.357)	Top-5 acc 57.812 (52.616)	lr 0.00684
Warmup Train [31][1150/3239]	Time 0.518 (0.529)	Data 0.001 (0.023)	Loss 4.0402 (4.0916)	Top-1 acc 27.344 (29.355)	Top-5 acc 52.344 (52.615)	lr 0.00684
Warmup Train [31][1160/3239]	Time 0.405 (0.529)	Data 0.001 (0.023)	Loss 3.9729 (4.0917)	Top-1 acc 33.984 (29.346)	Top-5 acc 58.984 (52.618)	lr 0.00683
Warmup Train [31][1170/3239]	Time 0.476 (0.529)	Data 0.001 (0.023)	Loss 3.9703 (4.0915)	Top-1 acc 31.641 (29.352)	Top-5 acc 53.906 (52.619)	lr 0.00683
Warmup Train [31][1180/3239]	Time 0.696 (0.528)	Data 0.001 (0.023)	Loss 4.1433 (4.0910)	Top-1 acc 29.297 (29.356)	Top-5 acc 50.781 (52.630)	lr 0.00682
Warmup Train [31][1190/3239]	Time 0.220 (0.528)	Data 0.002 (0.023)	Loss 4.1422 (4.0911)	Top-1 acc 30.078 (29.360)	Top-5 acc 50.781 (52.630)	lr 0.00682
Warmup Train [31][1200/3239]	Time 0.517 (0.528)	Data 0.001 (0.023)	Loss 4.2300 (4.0911)	Top-1 acc 28.125 (29.371)	Top-5 acc 48.047 (52.643)	lr 0.00682
Warmup Train [31][1210/3239]	Time 0.540 (0.528)	Data 0.001 (0.022)	Loss 4.0745 (4.0910)	Top-1 acc 31.250 (29.371)	Top-5 acc 53.906 (52.652)	lr 0.00681
Warmup Train [31][1220/3239]	Time 0.594 (0.528)	Data 0.001 (0.022)	Loss 4.2079 (4.0910)	Top-1 acc 26.562 (29.379)	Top-5 acc 50.781 (52.658)	lr 0.00681
Warmup Train [31][1230/3239]	Time 0.539 (0.528)	Data 0.001 (0.022)	Loss 4.0493 (4.0905)	Top-1 acc 30.078 (29.388)	Top-5 acc 52.734 (52.665)	lr 0.00680
Warmup Train [31][1240/3239]	Time 0.346 (0.527)	Data 0.001 (0.022)	Loss 4.2972 (4.0907)	Top-1 acc 25.000 (29.383)	Top-5 acc 49.219 (52.655)	lr 0.00680
Warmup Train [31][1250/3239]	Time 0.460 (0.527)	Data 0.001 (0.022)	Loss 4.0589 (4.0906)	Top-1 acc 31.641 (29.383)	Top-5 acc 55.078 (52.661)	lr 0.00679
Warmup Train [31][1260/3239]	Time 0.639 (0.527)	Data 0.001 (0.022)	Loss 4.2451 (4.0909)	Top-1 acc 26.953 (29.378)	Top-5 acc 50.000 (52.652)	lr 0.00679
Warmup Train [31][1270/3239]	Time 0.573 (0.527)	Data 0.001 (0.022)	Loss 4.0602 (4.0911)	Top-1 acc 30.078 (29.372)	Top-5 acc 54.688 (52.642)	lr 0.00679
Warmup Train [31][1280/3239]	Time 0.467 (0.527)	Data 0.001 (0.021)	Loss 4.2353 (4.0914)	Top-1 acc 28.125 (29.365)	Top-5 acc 47.656 (52.638)	lr 0.00678
Warmup Train [31][1290/3239]	Time 0.541 (0.527)	Data 0.001 (0.021)	Loss 4.1673 (4.0911)	Top-1 acc 26.172 (29.369)	Top-5 acc 51.562 (52.641)	lr 0.00678
Warmup Train [31][1300/3239]	Time 0.536 (0.527)	Data 0.001 (0.021)	Loss 4.0794 (4.0910)	Top-1 acc 33.984 (29.370)	Top-5 acc 55.469 (52.639)	lr 0.00677
Warmup Train [31][1310/3239]	Time 0.392 (0.527)	Data 0.001 (0.021)	Loss 4.2289 (4.0905)	Top-1 acc 26.172 (29.375)	Top-5 acc 49.609 (52.646)	lr 0.00677
Warmup Train [31][1320/3239]	Time 0.628 (0.527)	Data 0.001 (0.021)	Loss 3.9613 (4.0906)	Top-1 acc 32.031 (29.375)	Top-5 acc 53.516 (52.640)	lr 0.00677
Warmup Train [31][1330/3239]	Time 0.354 (0.527)	Data 0.002 (0.021)	Loss 3.9315 (4.0908)	Top-1 acc 32.422 (29.369)	Top-5 acc 55.078 (52.634)	lr 0.00676
Warmup Train [31][1340/3239]	Time 0.679 (0.527)	Data 0.001 (0.021)	Loss 4.0392 (4.0912)	Top-1 acc 30.078 (29.358)	Top-5 acc 55.859 (52.631)	lr 0.00676
Warmup Train [31][1350/3239]	Time 0.548 (0.527)	Data 0.001 (0.021)	Loss 3.9447 (4.0914)	Top-1 acc 34.766 (29.354)	Top-5 acc 54.297 (52.624)	lr 0.00675
Warmup Train [31][1360/3239]	Time 0.429 (0.526)	Data 0.001 (0.020)	Loss 3.9508 (4.0915)	Top-1 acc 34.766 (29.354)	Top-5 acc 54.297 (52.618)	lr 0.00675
Warmup Train [31][1370/3239]	Time 0.555 (0.526)	Data 0.001 (0.020)	Loss 4.1101 (4.0913)	Top-1 acc 29.688 (29.356)	Top-5 acc 52.344 (52.621)	lr 0.00675
Warmup Train [31][1380/3239]	Time 0.342 (0.526)	Data 0.001 (0.020)	Loss 4.3459 (4.0912)	Top-1 acc 26.172 (29.354)	Top-5 acc 49.609 (52.626)	lr 0.00674
Warmup Train [31][1390/3239]	Time 0.319 (0.526)	Data 0.001 (0.020)	Loss 4.1651 (4.0910)	Top-1 acc 29.297 (29.357)	Top-5 acc 49.219 (52.628)	lr 0.00674
Warmup Train [31][1400/3239]	Time 0.544 (0.526)	Data 0.002 (0.020)	Loss 4.0863 (4.0908)	Top-1 acc 29.688 (29.362)	Top-5 acc 53.516 (52.624)	lr 0.00673
Warmup Train [31][1410/3239]	Time 0.497 (0.526)	Data 0.001 (0.020)	Loss 4.1147 (4.0909)	Top-1 acc 26.172 (29.363)	Top-5 acc 50.391 (52.623)	lr 0.00673
Warmup Train [31][1420/3239]	Time 0.478 (0.526)	Data 0.001 (0.020)	Loss 4.1308 (4.0908)	Top-1 acc 28.906 (29.365)	Top-5 acc 53.906 (52.628)	lr 0.00672
Warmup Train [31][1430/3239]	Time 0.544 (0.525)	Data 0.001 (0.020)	Loss 3.8217 (4.0907)	Top-1 acc 34.375 (29.363)	Top-5 acc 59.766 (52.632)	lr 0.00672
Warmup Train [31][1440/3239]	Time 0.495 (0.525)	Data 0.001 (0.020)	Loss 4.1462 (4.0910)	Top-1 acc 27.734 (29.357)	Top-5 acc 50.000 (52.621)	lr 0.00672
Warmup Train [31][1450/3239]	Time 0.487 (0.525)	Data 0.001 (0.020)	Loss 4.2715 (4.0906)	Top-1 acc 25.781 (29.366)	Top-5 acc 49.609 (52.634)	lr 0.00671
Warmup Train [31][1460/3239]	Time 0.551 (0.525)	Data 0.001 (0.020)	Loss 4.1551 (4.0902)	Top-1 acc 28.516 (29.375)	Top-5 acc 51.172 (52.648)	lr 0.00671
Warmup Train [31][1470/3239]	Time 0.597 (0.524)	Data 0.001 (0.019)	Loss 4.3149 (4.0903)	Top-1 acc 26.562 (29.382)	Top-5 acc 47.266 (52.645)	lr 0.00670
Warmup Train [31][1480/3239]	Time 0.527 (0.524)	Data 0.001 (0.019)	Loss 3.9979 (4.0904)	Top-1 acc 27.734 (29.379)	Top-5 acc 56.641 (52.646)	lr 0.00670
Warmup Train [31][1490/3239]	Time 0.647 (0.524)	Data 0.001 (0.019)	Loss 4.1328 (4.0903)	Top-1 acc 29.297 (29.385)	Top-5 acc 51.562 (52.654)	lr 0.00670
Warmup Train [31][1500/3239]	Time 0.599 (0.524)	Data 0.001 (0.019)	Loss 4.0422 (4.0902)	Top-1 acc 30.078 (29.392)	Top-5 acc 54.688 (52.662)	lr 0.00669
Warmup Train [31][1510/3239]	Time 0.560 (0.524)	Data 0.001 (0.019)	Loss 4.3382 (4.0903)	Top-1 acc 25.000 (29.388)	Top-5 acc 46.094 (52.648)	lr 0.00669
Warmup Train [31][1520/3239]	Time 0.608 (0.523)	Data 0.001 (0.019)	Loss 4.0256 (4.0904)	Top-1 acc 32.422 (29.392)	Top-5 acc 56.641 (52.645)	lr 0.00668
Warmup Train [31][1530/3239]	Time 0.366 (0.523)	Data 0.001 (0.019)	Loss 4.0670 (4.0907)	Top-1 acc 33.984 (29.391)	Top-5 acc 53.516 (52.634)	lr 0.00668
Warmup Train [31][1540/3239]	Time 0.613 (0.523)	Data 0.001 (0.019)	Loss 4.1556 (4.0906)	Top-1 acc 25.781 (29.387)	Top-5 acc 51.172 (52.643)	lr 0.00667
Warmup Train [31][1550/3239]	Time 0.615 (0.523)	Data 0.001 (0.019)	Loss 4.0055 (4.0906)	Top-1 acc 29.297 (29.384)	Top-5 acc 52.344 (52.638)	lr 0.00667
Warmup Train [31][1560/3239]	Time 0.499 (0.523)	Data 0.001 (0.019)	Loss 3.8655 (4.0904)	Top-1 acc 34.375 (29.383)	Top-5 acc 57.812 (52.642)	lr 0.00667
Warmup Train [31][1570/3239]	Time 0.584 (0.523)	Data 0.001 (0.019)	Loss 4.0757 (4.0906)	Top-1 acc 29.688 (29.380)	Top-5 acc 55.469 (52.639)	lr 0.00666
Warmup Train [31][1580/3239]	Time 0.538 (0.523)	Data 0.002 (0.018)	Loss 4.1010 (4.0903)	Top-1 acc 28.906 (29.383)	Top-5 acc 51.953 (52.642)	lr 0.00666
Warmup Train [31][1590/3239]	Time 0.346 (0.522)	Data 0.001 (0.018)	Loss 4.1162 (4.0905)	Top-1 acc 30.078 (29.387)	Top-5 acc 52.344 (52.642)	lr 0.00665
Warmup Train [31][1600/3239]	Time 0.397 (0.522)	Data 0.001 (0.018)	Loss 4.1050 (4.0906)	Top-1 acc 29.297 (29.384)	Top-5 acc 50.000 (52.638)	lr 0.00665
Warmup Train [31][1610/3239]	Time 0.383 (0.522)	Data 0.001 (0.018)	Loss 4.1716 (4.0906)	Top-1 acc 29.688 (29.386)	Top-5 acc 49.609 (52.641)	lr 0.00665
Warmup Train [31][1620/3239]	Time 0.681 (0.522)	Data 0.001 (0.018)	Loss 3.9685 (4.0905)	Top-1 acc 30.078 (29.393)	Top-5 acc 55.078 (52.644)	lr 0.00664
Warmup Train [31][1630/3239]	Time 0.633 (0.522)	Data 0.001 (0.018)	Loss 3.9336 (4.0902)	Top-1 acc 33.594 (29.397)	Top-5 acc 55.859 (52.655)	lr 0.00664
Warmup Train [31][1640/3239]	Time 0.497 (0.522)	Data 0.001 (0.018)	Loss 4.0727 (4.0902)	Top-1 acc 30.078 (29.395)	Top-5 acc 52.344 (52.652)	lr 0.00663
Warmup Train [31][1650/3239]	Time 0.576 (0.522)	Data 0.001 (0.018)	Loss 3.9873 (4.0906)	Top-1 acc 31.641 (29.393)	Top-5 acc 55.469 (52.646)	lr 0.00663
Warmup Train [31][1660/3239]	Time 0.391 (0.522)	Data 0.001 (0.018)	Loss 4.1014 (4.0904)	Top-1 acc 28.125 (29.396)	Top-5 acc 51.953 (52.648)	lr 0.00663
Warmup Train [31][1670/3239]	Time 0.461 (0.522)	Data 0.001 (0.018)	Loss 4.1153 (4.0901)	Top-1 acc 28.125 (29.401)	Top-5 acc 52.344 (52.650)	lr 0.00662
Warmup Train [31][1680/3239]	Time 0.607 (0.522)	Data 0.001 (0.018)	Loss 4.0987 (4.0903)	Top-1 acc 27.734 (29.395)	Top-5 acc 51.172 (52.646)	lr 0.00662
Warmup Train [31][1690/3239]	Time 0.439 (0.522)	Data 0.001 (0.018)	Loss 3.9062 (4.0901)	Top-1 acc 34.766 (29.403)	Top-5 acc 55.078 (52.652)	lr 0.00661
Warmup Train [31][1700/3239]	Time 0.535 (0.522)	Data 0.001 (0.018)	Loss 4.3331 (4.0900)	Top-1 acc 23.047 (29.399)	Top-5 acc 46.875 (52.654)	lr 0.00661
Warmup Train [31][1710/3239]	Time 0.589 (0.522)	Data 0.001 (0.018)	Loss 4.0061 (4.0903)	Top-1 acc 29.688 (29.395)	Top-5 acc 52.344 (52.651)	lr 0.00660
Warmup Train [31][1720/3239]	Time 0.328 (0.522)	Data 0.001 (0.018)	Loss 4.1891 (4.0901)	Top-1 acc 25.391 (29.399)	Top-5 acc 53.125 (52.658)	lr 0.00660
Warmup Train [31][1730/3239]	Time 0.311 (0.521)	Data 0.001 (0.017)	Loss 4.0218 (4.0897)	Top-1 acc 33.203 (29.404)	Top-5 acc 55.078 (52.662)	lr 0.00660
Warmup Train [31][1740/3239]	Time 0.513 (0.521)	Data 0.001 (0.017)	Loss 4.2284 (4.0898)	Top-1 acc 26.562 (29.406)	Top-5 acc 49.219 (52.661)	lr 0.00659
Warmup Train [31][1750/3239]	Time 0.325 (0.521)	Data 0.002 (0.017)	Loss 4.1474 (4.0897)	Top-1 acc 26.953 (29.406)	Top-5 acc 48.438 (52.663)	lr 0.00659
Warmup Train [31][1760/3239]	Time 0.684 (0.521)	Data 0.001 (0.017)	Loss 3.9277 (4.0895)	Top-1 acc 30.859 (29.406)	Top-5 acc 55.469 (52.666)	lr 0.00658
Warmup Train [31][1770/3239]	Time 0.526 (0.521)	Data 0.001 (0.017)	Loss 4.2497 (4.0894)	Top-1 acc 23.828 (29.410)	Top-5 acc 48.047 (52.666)	lr 0.00658
Warmup Train [31][1780/3239]	Time 0.321 (0.521)	Data 0.002 (0.017)	Loss 3.9274 (4.0893)	Top-1 acc 32.031 (29.414)	Top-5 acc 57.422 (52.669)	lr 0.00658
Warmup Train [31][1790/3239]	Time 0.486 (0.521)	Data 0.001 (0.017)	Loss 4.2198 (4.0893)	Top-1 acc 28.906 (29.414)	Top-5 acc 51.953 (52.670)	lr 0.00657
Warmup Train [31][1800/3239]	Time 0.629 (0.521)	Data 0.001 (0.017)	Loss 4.0166 (4.0894)	Top-1 acc 29.297 (29.413)	Top-5 acc 55.078 (52.673)	lr 0.00657
Warmup Train [31][1810/3239]	Time 0.512 (0.521)	Data 0.001 (0.017)	Loss 3.8132 (4.0891)	Top-1 acc 35.547 (29.419)	Top-5 acc 57.422 (52.682)	lr 0.00656
Warmup Train [31][1820/3239]	Time 0.629 (0.521)	Data 0.001 (0.017)	Loss 4.1941 (4.0888)	Top-1 acc 29.297 (29.422)	Top-5 acc 49.219 (52.689)	lr 0.00656
Warmup Train [31][1830/3239]	Time 0.523 (0.521)	Data 0.001 (0.017)	Loss 4.1231 (4.0887)	Top-1 acc 28.125 (29.425)	Top-5 acc 50.781 (52.688)	lr 0.00656
Warmup Train [31][1840/3239]	Time 0.645 (0.520)	Data 0.001 (0.017)	Loss 3.9716 (4.0886)	Top-1 acc 28.906 (29.424)	Top-5 acc 56.250 (52.690)	lr 0.00655
Warmup Train [31][1850/3239]	Time 0.478 (0.520)	Data 0.001 (0.017)	Loss 4.0142 (4.0885)	Top-1 acc 30.469 (29.427)	Top-5 acc 53.516 (52.692)	lr 0.00655
Warmup Train [31][1860/3239]	Time 0.647 (0.520)	Data 0.001 (0.017)	Loss 4.0130 (4.0885)	Top-1 acc 32.422 (29.425)	Top-5 acc 50.391 (52.691)	lr 0.00654
Warmup Train [31][1870/3239]	Time 0.384 (0.520)	Data 0.001 (0.017)	Loss 4.4151 (4.0884)	Top-1 acc 25.000 (29.436)	Top-5 acc 48.438 (52.691)	lr 0.00654
Warmup Train [31][1880/3239]	Time 0.502 (0.520)	Data 0.001 (0.017)	Loss 4.3175 (4.0882)	Top-1 acc 25.391 (29.439)	Top-5 acc 48.828 (52.692)	lr 0.00654
Warmup Train [31][1890/3239]	Time 0.410 (0.520)	Data 0.001 (0.017)	Loss 4.0126 (4.0878)	Top-1 acc 31.641 (29.449)	Top-5 acc 53.516 (52.700)	lr 0.00653
Warmup Train [31][1900/3239]	Time 0.397 (0.520)	Data 0.001 (0.017)	Loss 4.4096 (4.0880)	Top-1 acc 25.781 (29.450)	Top-5 acc 50.000 (52.698)	lr 0.00653
Warmup Train [31][1910/3239]	Time 0.575 (0.520)	Data 0.001 (0.017)	Loss 4.1333 (4.0879)	Top-1 acc 33.594 (29.455)	Top-5 acc 52.344 (52.699)	lr 0.00652
Warmup Train [31][1920/3239]	Time 0.376 (0.520)	Data 0.001 (0.016)	Loss 4.1801 (4.0880)	Top-1 acc 26.562 (29.452)	Top-5 acc 48.828 (52.694)	lr 0.00652
Warmup Train [31][1930/3239]	Time 0.550 (0.520)	Data 0.001 (0.016)	Loss 4.0224 (4.0880)	Top-1 acc 32.422 (29.456)	Top-5 acc 55.469 (52.693)	lr 0.00651
Warmup Train [31][1940/3239]	Time 0.510 (0.520)	Data 0.001 (0.016)	Loss 3.9713 (4.0882)	Top-1 acc 30.469 (29.452)	Top-5 acc 56.250 (52.687)	lr 0.00651
Warmup Train [31][1950/3239]	Time 0.479 (0.520)	Data 0.001 (0.016)	Loss 4.2347 (4.0880)	Top-1 acc 23.828 (29.461)	Top-5 acc 46.875 (52.693)	lr 0.00651
Warmup Train [31][1960/3239]	Time 0.405 (0.520)	Data 0.001 (0.016)	Loss 4.2287 (4.0881)	Top-1 acc 29.297 (29.460)	Top-5 acc 51.562 (52.696)	lr 0.00650
Warmup Train [31][1970/3239]	Time 0.496 (0.520)	Data 0.001 (0.016)	Loss 3.9400 (4.0878)	Top-1 acc 31.641 (29.467)	Top-5 acc 55.859 (52.703)	lr 0.00650
Warmup Train [31][1980/3239]	Time 0.555 (0.520)	Data 0.001 (0.016)	Loss 4.1752 (4.0878)	Top-1 acc 27.344 (29.469)	Top-5 acc 50.000 (52.698)	lr 0.00649
Warmup Train [31][1990/3239]	Time 0.513 (0.520)	Data 0.001 (0.016)	Loss 4.1194 (4.0878)	Top-1 acc 32.031 (29.468)	Top-5 acc 52.734 (52.699)	lr 0.00649
Warmup Train [31][2000/3239]	Time 0.588 (0.520)	Data 0.001 (0.016)	Loss 4.0175 (4.0876)	Top-1 acc 29.297 (29.469)	Top-5 acc 55.859 (52.709)	lr 0.00649
Warmup Train [31][2010/3239]	Time 0.483 (0.520)	Data 0.001 (0.016)	Loss 3.9984 (4.0877)	Top-1 acc 32.422 (29.466)	Top-5 acc 56.250 (52.705)	lr 0.00648
Warmup Train [31][2020/3239]	Time 0.493 (0.520)	Data 0.001 (0.016)	Loss 4.1577 (4.0872)	Top-1 acc 27.734 (29.470)	Top-5 acc 52.734 (52.720)	lr 0.00648
Warmup Train [31][2030/3239]	Time 0.525 (0.519)	Data 0.001 (0.016)	Loss 4.1405 (4.0873)	Top-1 acc 30.469 (29.466)	Top-5 acc 51.562 (52.719)	lr 0.00647
Warmup Train [31][2040/3239]	Time 0.518 (0.519)	Data 0.001 (0.016)	Loss 4.0912 (4.0874)	Top-1 acc 29.297 (29.463)	Top-5 acc 50.000 (52.713)	lr 0.00647
Warmup Train [31][2050/3239]	Time 0.342 (0.519)	Data 0.001 (0.016)	Loss 4.2513 (4.0876)	Top-1 acc 26.172 (29.460)	Top-5 acc 47.656 (52.707)	lr 0.00647
Warmup Train [31][2060/3239]	Time 0.753 (0.519)	Data 0.001 (0.016)	Loss 4.1532 (4.0879)	Top-1 acc 28.125 (29.455)	Top-5 acc 51.562 (52.706)	lr 0.00646
Warmup Train [31][2070/3239]	Time 0.510 (0.519)	Data 0.001 (0.016)	Loss 4.1098 (4.0880)	Top-1 acc 32.031 (29.454)	Top-5 acc 50.781 (52.700)	lr 0.00646
Warmup Train [31][2080/3239]	Time 0.362 (0.519)	Data 0.001 (0.016)	Loss 4.0537 (4.0881)	Top-1 acc 31.250 (29.452)	Top-5 acc 53.125 (52.701)	lr 0.00645
Warmup Train [31][2090/3239]	Time 0.433 (0.519)	Data 0.001 (0.016)	Loss 4.0733 (4.0881)	Top-1 acc 31.250 (29.453)	Top-5 acc 52.344 (52.702)	lr 0.00645
Warmup Train [31][2100/3239]	Time 0.383 (0.519)	Data 0.001 (0.016)	Loss 4.2914 (4.0883)	Top-1 acc 25.000 (29.450)	Top-5 acc 48.828 (52.696)	lr 0.00645
Warmup Train [31][2110/3239]	Time 0.553 (0.519)	Data 0.001 (0.016)	Loss 4.0888 (4.0881)	Top-1 acc 26.953 (29.453)	Top-5 acc 52.734 (52.698)	lr 0.00644
Warmup Train [31][2120/3239]	Time 0.427 (0.519)	Data 0.001 (0.015)	Loss 4.1135 (4.0881)	Top-1 acc 30.469 (29.451)	Top-5 acc 53.125 (52.700)	lr 0.00644
Warmup Train [31][2130/3239]	Time 0.447 (0.519)	Data 0.001 (0.015)	Loss 3.9579 (4.0879)	Top-1 acc 35.938 (29.455)	Top-5 acc 57.812 (52.708)	lr 0.00643
Warmup Train [31][2140/3239]	Time 0.507 (0.519)	Data 0.001 (0.015)	Loss 4.0442 (4.0881)	Top-1 acc 37.500 (29.455)	Top-5 acc 54.688 (52.700)	lr 0.00643
Warmup Train [31][2150/3239]	Time 0.520 (0.519)	Data 0.001 (0.015)	Loss 4.0209 (4.0881)	Top-1 acc 29.688 (29.459)	Top-5 acc 53.906 (52.704)	lr 0.00643
Warmup Train [31][2160/3239]	Time 0.549 (0.519)	Data 0.001 (0.015)	Loss 3.9336 (4.0878)	Top-1 acc 30.859 (29.465)	Top-5 acc 57.812 (52.714)	lr 0.00642
Warmup Train [31][2170/3239]	Time 0.475 (0.519)	Data 0.001 (0.015)	Loss 4.3012 (4.0878)	Top-1 acc 23.047 (29.463)	Top-5 acc 48.047 (52.713)	lr 0.00642
Warmup Train [31][2180/3239]	Time 0.595 (0.519)	Data 0.001 (0.015)	Loss 3.9373 (4.0876)	Top-1 acc 33.594 (29.465)	Top-5 acc 55.469 (52.715)	lr 0.00641
Warmup Train [31][2190/3239]	Time 0.525 (0.519)	Data 0.001 (0.015)	Loss 4.0279 (4.0876)	Top-1 acc 31.641 (29.466)	Top-5 acc 55.469 (52.717)	lr 0.00641
Warmup Train [31][2200/3239]	Time 0.608 (0.519)	Data 0.001 (0.015)	Loss 3.8752 (4.0877)	Top-1 acc 33.984 (29.469)	Top-5 acc 56.250 (52.712)	lr 0.00641
Warmup Train [31][2210/3239]	Time 0.537 (0.519)	Data 0.001 (0.015)	Loss 4.0433 (4.0874)	Top-1 acc 30.469 (29.474)	Top-5 acc 53.906 (52.721)	lr 0.00640
Warmup Train [31][2220/3239]	Time 0.446 (0.519)	Data 0.001 (0.015)	Loss 4.0914 (4.0868)	Top-1 acc 27.734 (29.487)	Top-5 acc 52.344 (52.736)	lr 0.00640
Warmup Train [31][2230/3239]	Time 0.406 (0.519)	Data 0.001 (0.015)	Loss 3.9606 (4.0869)	Top-1 acc 32.422 (29.484)	Top-5 acc 57.031 (52.741)	lr 0.00639
Warmup Train [31][2240/3239]	Time 0.518 (0.519)	Data 0.001 (0.015)	Loss 3.9899 (4.0868)	Top-1 acc 28.516 (29.486)	Top-5 acc 53.125 (52.739)	lr 0.00639
Warmup Train [31][2250/3239]	Time 0.392 (0.519)	Data 0.001 (0.015)	Loss 3.9923 (4.0868)	Top-1 acc 30.078 (29.486)	Top-5 acc 56.641 (52.741)	lr 0.00638
Warmup Train [31][2260/3239]	Time 0.439 (0.519)	Data 0.001 (0.015)	Loss 4.0594 (4.0866)	Top-1 acc 22.266 (29.483)	Top-5 acc 57.031 (52.746)	lr 0.00638
Warmup Train [31][2270/3239]	Time 0.473 (0.519)	Data 0.001 (0.015)	Loss 4.1431 (4.0865)	Top-1 acc 26.953 (29.485)	Top-5 acc 50.391 (52.749)	lr 0.00638
Warmup Train [31][2280/3239]	Time 0.515 (0.519)	Data 0.001 (0.015)	Loss 4.1950 (4.0865)	Top-1 acc 27.344 (29.481)	Top-5 acc 46.875 (52.744)	lr 0.00637
Warmup Train [31][2290/3239]	Time 0.420 (0.518)	Data 0.001 (0.015)	Loss 3.9939 (4.0868)	Top-1 acc 31.250 (29.475)	Top-5 acc 56.250 (52.738)	lr 0.00637
Warmup Train [31][2300/3239]	Time 0.376 (0.518)	Data 0.001 (0.015)	Loss 3.9521 (4.0864)	Top-1 acc 35.938 (29.486)	Top-5 acc 55.859 (52.748)	lr 0.00636
Warmup Train [31][2310/3239]	Time 0.439 (0.518)	Data 0.001 (0.015)	Loss 4.1232 (4.0867)	Top-1 acc 27.734 (29.477)	Top-5 acc 54.297 (52.742)	lr 0.00636
Warmup Train [31][2320/3239]	Time 0.591 (0.518)	Data 0.001 (0.015)	Loss 4.0251 (4.0867)	Top-1 acc 30.469 (29.475)	Top-5 acc 54.297 (52.743)	lr 0.00636
Warmup Train [31][2330/3239]	Time 0.423 (0.518)	Data 0.001 (0.015)	Loss 3.9412 (4.0865)	Top-1 acc 32.812 (29.484)	Top-5 acc 54.688 (52.744)	lr 0.00635
Warmup Train [31][2340/3239]	Time 0.536 (0.518)	Data 0.001 (0.015)	Loss 4.3182 (4.0867)	Top-1 acc 27.344 (29.481)	Top-5 acc 49.609 (52.742)	lr 0.00635
Warmup Train [31][2350/3239]	Time 0.645 (0.518)	Data 0.001 (0.015)	Loss 3.8980 (4.0867)	Top-1 acc 33.203 (29.480)	Top-5 acc 57.812 (52.743)	lr 0.00634
Warmup Train [31][2360/3239]	Time 0.749 (0.518)	Data 0.001 (0.015)	Loss 4.0936 (4.0867)	Top-1 acc 30.078 (29.482)	Top-5 acc 52.344 (52.742)	lr 0.00634
Warmup Train [31][2370/3239]	Time 0.553 (0.518)	Data 0.001 (0.015)	Loss 4.1676 (4.0869)	Top-1 acc 28.516 (29.481)	Top-5 acc 48.047 (52.731)	lr 0.00634
Warmup Train [31][2380/3239]	Time 0.671 (0.518)	Data 0.001 (0.014)	Loss 4.1162 (4.0869)	Top-1 acc 32.031 (29.484)	Top-5 acc 53.906 (52.734)	lr 0.00633
Warmup Train [31][2390/3239]	Time 0.412 (0.518)	Data 0.001 (0.014)	Loss 4.0978 (4.0869)	Top-1 acc 31.641 (29.487)	Top-5 acc 50.000 (52.730)	lr 0.00633
Warmup Train [31][2400/3239]	Time 0.500 (0.518)	Data 0.003 (0.014)	Loss 4.0602 (4.0871)	Top-1 acc 29.297 (29.482)	Top-5 acc 52.344 (52.726)	lr 0.00632
Warmup Train [31][2410/3239]	Time 0.482 (0.518)	Data 0.001 (0.014)	Loss 3.9255 (4.0870)	Top-1 acc 32.812 (29.486)	Top-5 acc 58.203 (52.731)	lr 0.00632
Warmup Train [31][2420/3239]	Time 0.577 (0.518)	Data 0.001 (0.014)	Loss 4.0237 (4.0869)	Top-1 acc 30.078 (29.491)	Top-5 acc 53.125 (52.734)	lr 0.00632
Warmup Train [31][2430/3239]	Time 0.429 (0.518)	Data 0.001 (0.014)	Loss 4.1273 (4.0867)	Top-1 acc 26.953 (29.494)	Top-5 acc 50.391 (52.737)	lr 0.00631
Warmup Train [31][2440/3239]	Time 0.591 (0.518)	Data 0.001 (0.014)	Loss 4.0220 (4.0867)	Top-1 acc 29.297 (29.494)	Top-5 acc 55.078 (52.733)	lr 0.00631
Warmup Train [31][2450/3239]	Time 0.502 (0.518)	Data 0.001 (0.014)	Loss 3.9101 (4.0867)	Top-1 acc 33.984 (29.496)	Top-5 acc 57.031 (52.737)	lr 0.00630
Warmup Train [31][2460/3239]	Time 0.427 (0.518)	Data 0.001 (0.014)	Loss 4.1093 (4.0866)	Top-1 acc 28.125 (29.495)	Top-5 acc 50.391 (52.740)	lr 0.00630
Warmup Train [31][2470/3239]	Time 0.613 (0.518)	Data 0.001 (0.014)	Loss 3.9997 (4.0867)	Top-1 acc 32.031 (29.492)	Top-5 acc 55.469 (52.731)	lr 0.00630
Warmup Train [31][2480/3239]	Time 0.657 (0.518)	Data 0.001 (0.014)	Loss 4.1520 (4.0867)	Top-1 acc 26.172 (29.491)	Top-5 acc 50.000 (52.731)	lr 0.00629
Warmup Train [31][2490/3239]	Time 0.629 (0.518)	Data 0.001 (0.014)	Loss 4.0701 (4.0866)	Top-1 acc 29.688 (29.491)	Top-5 acc 51.562 (52.734)	lr 0.00629
Warmup Train [31][2500/3239]	Time 0.623 (0.518)	Data 0.001 (0.014)	Loss 4.0351 (4.0866)	Top-1 acc 29.688 (29.494)	Top-5 acc 51.172 (52.735)	lr 0.00628
Warmup Train [31][2510/3239]	Time 0.582 (0.518)	Data 0.001 (0.014)	Loss 4.1250 (4.0866)	Top-1 acc 27.734 (29.496)	Top-5 acc 51.562 (52.737)	lr 0.00628
Warmup Train [31][2520/3239]	Time 0.494 (0.518)	Data 0.001 (0.014)	Loss 4.1594 (4.0865)	Top-1 acc 28.906 (29.502)	Top-5 acc 50.781 (52.739)	lr 0.00628
Warmup Train [31][2530/3239]	Time 0.509 (0.518)	Data 0.001 (0.014)	Loss 3.9427 (4.0865)	Top-1 acc 33.984 (29.506)	Top-5 acc 51.172 (52.737)	lr 0.00627
Warmup Train [31][2540/3239]	Time 0.522 (0.518)	Data 0.001 (0.014)	Loss 4.0554 (4.0865)	Top-1 acc 28.906 (29.502)	Top-5 acc 53.906 (52.737)	lr 0.00627
Warmup Train [31][2550/3239]	Time 0.517 (0.518)	Data 0.001 (0.014)	Loss 4.3152 (4.0866)	Top-1 acc 26.562 (29.504)	Top-5 acc 47.266 (52.735)	lr 0.00626
Warmup Train [31][2560/3239]	Time 0.389 (0.518)	Data 0.001 (0.014)	Loss 4.0177 (4.0866)	Top-1 acc 34.375 (29.502)	Top-5 acc 52.344 (52.736)	lr 0.00626
Warmup Train [31][2570/3239]	Time 0.505 (0.518)	Data 0.001 (0.014)	Loss 3.9485 (4.0865)	Top-1 acc 27.344 (29.503)	Top-5 acc 53.906 (52.740)	lr 0.00626
Warmup Train [31][2580/3239]	Time 0.591 (0.518)	Data 0.001 (0.014)	Loss 4.0818 (4.0865)	Top-1 acc 26.172 (29.500)	Top-5 acc 53.516 (52.741)	lr 0.00625
Warmup Train [31][2590/3239]	Time 0.342 (0.517)	Data 0.001 (0.014)	Loss 4.0470 (4.0865)	Top-1 acc 31.250 (29.499)	Top-5 acc 55.078 (52.746)	lr 0.00625
Warmup Train [31][2600/3239]	Time 0.549 (0.517)	Data 0.001 (0.014)	Loss 4.1037 (4.0864)	Top-1 acc 27.734 (29.498)	Top-5 acc 52.344 (52.743)	lr 0.00624
Warmup Train [31][2610/3239]	Time 0.705 (0.517)	Data 0.001 (0.014)	Loss 4.2671 (4.0863)	Top-1 acc 28.125 (29.500)	Top-5 acc 47.266 (52.749)	lr 0.00624
Warmup Train [31][2620/3239]	Time 0.383 (0.517)	Data 0.001 (0.014)	Loss 3.9199 (4.0862)	Top-1 acc 30.469 (29.497)	Top-5 acc 54.297 (52.750)	lr 0.00624
Warmup Train [31][2630/3239]	Time 0.547 (0.517)	Data 0.001 (0.014)	Loss 4.1326 (4.0861)	Top-1 acc 28.516 (29.499)	Top-5 acc 52.734 (52.748)	lr 0.00623
Warmup Train [31][2640/3239]	Time 0.687 (0.517)	Data 0.001 (0.014)	Loss 4.0130 (4.0862)	Top-1 acc 27.734 (29.497)	Top-5 acc 53.516 (52.744)	lr 0.00623
Warmup Train [31][2650/3239]	Time 0.328 (0.517)	Data 0.001 (0.014)	Loss 4.2714 (4.0861)	Top-1 acc 27.344 (29.497)	Top-5 acc 45.703 (52.746)	lr 0.00622
Warmup Train [31][2660/3239]	Time 0.583 (0.517)	Data 0.001 (0.014)	Loss 4.0476 (4.0862)	Top-1 acc 29.297 (29.495)	Top-5 acc 49.609 (52.738)	lr 0.00622
Warmup Train [31][2670/3239]	Time 0.514 (0.517)	Data 0.001 (0.013)	Loss 4.0177 (4.0862)	Top-1 acc 33.984 (29.498)	Top-5 acc 51.172 (52.741)	lr 0.00622
Warmup Train [31][2680/3239]	Time 0.355 (0.517)	Data 0.001 (0.013)	Loss 4.1945 (4.0862)	Top-1 acc 27.734 (29.498)	Top-5 acc 47.656 (52.739)	lr 0.00621
Warmup Train [31][2690/3239]	Time 0.538 (0.517)	Data 0.001 (0.013)	Loss 3.9822 (4.0864)	Top-1 acc 31.250 (29.495)	Top-5 acc 54.688 (52.736)	lr 0.00621
Warmup Train [31][2700/3239]	Time 0.640 (0.517)	Data 0.001 (0.013)	Loss 4.0763 (4.0863)	Top-1 acc 29.688 (29.495)	Top-5 acc 53.906 (52.740)	lr 0.00620
Warmup Train [31][2710/3239]	Time 0.391 (0.517)	Data 0.001 (0.013)	Loss 4.1676 (4.0863)	Top-1 acc 25.000 (29.499)	Top-5 acc 47.656 (52.739)	lr 0.00620
Warmup Train [31][2720/3239]	Time 0.626 (0.517)	Data 0.001 (0.013)	Loss 4.2107 (4.0862)	Top-1 acc 29.688 (29.502)	Top-5 acc 48.828 (52.740)	lr 0.00620
Warmup Train [31][2730/3239]	Time 0.538 (0.517)	Data 0.001 (0.013)	Loss 3.8488 (4.0861)	Top-1 acc 35.547 (29.507)	Top-5 acc 56.250 (52.742)	lr 0.00619
Warmup Train [31][2740/3239]	Time 0.598 (0.517)	Data 0.001 (0.013)	Loss 4.1346 (4.0860)	Top-1 acc 27.344 (29.507)	Top-5 acc 48.438 (52.741)	lr 0.00619
Warmup Train [31][2750/3239]	Time 0.474 (0.517)	Data 0.001 (0.013)	Loss 3.8218 (4.0857)	Top-1 acc 35.938 (29.513)	Top-5 acc 59.766 (52.749)	lr 0.00618
Warmup Train [31][2760/3239]	Time 0.528 (0.517)	Data 0.001 (0.013)	Loss 4.3159 (4.0856)	Top-1 acc 27.734 (29.509)	Top-5 acc 46.484 (52.751)	lr 0.00618
Warmup Train [31][2770/3239]	Time 0.538 (0.517)	Data 0.001 (0.013)	Loss 4.0571 (4.0855)	Top-1 acc 30.859 (29.511)	Top-5 acc 51.562 (52.755)	lr 0.00618
Warmup Train [31][2780/3239]	Time 0.623 (0.517)	Data 0.001 (0.013)	Loss 4.1008 (4.0857)	Top-1 acc 26.562 (29.510)	Top-5 acc 50.391 (52.749)	lr 0.00617
Warmup Train [31][2790/3239]	Time 0.579 (0.517)	Data 0.001 (0.013)	Loss 4.0759 (4.0857)	Top-1 acc 28.906 (29.512)	Top-5 acc 55.078 (52.754)	lr 0.00617
Warmup Train [31][2800/3239]	Time 0.420 (0.517)	Data 0.001 (0.013)	Loss 4.2260 (4.0857)	Top-1 acc 32.031 (29.514)	Top-5 acc 50.000 (52.752)	lr 0.00616
Warmup Train [31][2810/3239]	Time 0.367 (0.517)	Data 0.001 (0.013)	Loss 4.0340 (4.0856)	Top-1 acc 30.469 (29.514)	Top-5 acc 53.125 (52.752)	lr 0.00616
Warmup Train [31][2820/3239]	Time 0.408 (0.517)	Data 0.001 (0.013)	Loss 3.9238 (4.0856)	Top-1 acc 34.375 (29.514)	Top-5 acc 57.031 (52.751)	lr 0.00616
Warmup Train [31][2830/3239]	Time 0.543 (0.517)	Data 0.001 (0.013)	Loss 4.1864 (4.0856)	Top-1 acc 26.953 (29.511)	Top-5 acc 50.781 (52.747)	lr 0.00615
Warmup Train [31][2840/3239]	Time 0.396 (0.517)	Data 0.001 (0.013)	Loss 4.1094 (4.0857)	Top-1 acc 28.125 (29.505)	Top-5 acc 54.688 (52.748)	lr 0.00615
Warmup Train [31][2850/3239]	Time 0.339 (0.517)	Data 0.001 (0.013)	Loss 4.1070 (4.0857)	Top-1 acc 28.906 (29.504)	Top-5 acc 52.734 (52.747)	lr 0.00614
Warmup Train [31][2860/3239]	Time 0.332 (0.517)	Data 0.001 (0.013)	Loss 4.2535 (4.0857)	Top-1 acc 28.125 (29.510)	Top-5 acc 44.922 (52.746)	lr 0.00614
Warmup Train [31][2870/3239]	Time 0.488 (0.517)	Data 0.001 (0.013)	Loss 3.9616 (4.0856)	Top-1 acc 27.344 (29.510)	Top-5 acc 56.250 (52.745)	lr 0.00614
Warmup Train [31][2880/3239]	Time 0.594 (0.517)	Data 0.002 (0.013)	Loss 4.1724 (4.0858)	Top-1 acc 26.172 (29.507)	Top-5 acc 50.781 (52.741)	lr 0.00613
Warmup Train [31][2890/3239]	Time 0.568 (0.517)	Data 0.001 (0.013)	Loss 3.9741 (4.0857)	Top-1 acc 30.859 (29.508)	Top-5 acc 55.078 (52.749)	lr 0.00613
Warmup Train [31][2900/3239]	Time 0.633 (0.517)	Data 0.001 (0.013)	Loss 3.9654 (4.0855)	Top-1 acc 31.641 (29.514)	Top-5 acc 58.984 (52.753)	lr 0.00612
Warmup Train [31][2910/3239]	Time 0.566 (0.517)	Data 0.001 (0.013)	Loss 4.0299 (4.0855)	Top-1 acc 31.250 (29.512)	Top-5 acc 54.297 (52.751)	lr 0.00612
Warmup Train [31][2920/3239]	Time 0.380 (0.517)	Data 0.001 (0.013)	Loss 3.9854 (4.0855)	Top-1 acc 28.906 (29.516)	Top-5 acc 50.781 (52.750)	lr 0.00612
Warmup Train [31][2930/3239]	Time 0.500 (0.517)	Data 0.001 (0.013)	Loss 4.0358 (4.0856)	Top-1 acc 30.078 (29.515)	Top-5 acc 53.516 (52.743)	lr 0.00611
Warmup Train [31][2940/3239]	Time 0.537 (0.517)	Data 0.001 (0.013)	Loss 4.1158 (4.0855)	Top-1 acc 27.734 (29.516)	Top-5 acc 50.781 (52.745)	lr 0.00611
Warmup Train [31][2950/3239]	Time 0.494 (0.517)	Data 0.001 (0.013)	Loss 4.0853 (4.0856)	Top-1 acc 26.562 (29.514)	Top-5 acc 53.516 (52.742)	lr 0.00610
Warmup Train [31][2960/3239]	Time 0.612 (0.517)	Data 0.001 (0.013)	Loss 3.9468 (4.0853)	Top-1 acc 30.469 (29.521)	Top-5 acc 53.906 (52.751)	lr 0.00610
Warmup Train [31][2970/3239]	Time 0.518 (0.517)	Data 0.001 (0.013)	Loss 4.0741 (4.0854)	Top-1 acc 30.469 (29.519)	Top-5 acc 55.469 (52.753)	lr 0.00610
Warmup Train [31][2980/3239]	Time 0.499 (0.517)	Data 0.001 (0.013)	Loss 3.9848 (4.0851)	Top-1 acc 29.297 (29.522)	Top-5 acc 58.594 (52.758)	lr 0.00609
Warmup Train [31][2990/3239]	Time 0.547 (0.517)	Data 0.001 (0.013)	Loss 4.1108 (4.0852)	Top-1 acc 25.781 (29.519)	Top-5 acc 50.391 (52.755)	lr 0.00609
Warmup Train [31][3000/3239]	Time 0.455 (0.517)	Data 0.001 (0.013)	Loss 4.1588 (4.0852)	Top-1 acc 28.906 (29.520)	Top-5 acc 48.047 (52.754)	lr 0.00608
Warmup Train [31][3010/3239]	Time 0.680 (0.517)	Data 0.003 (0.013)	Loss 4.1428 (4.0854)	Top-1 acc 29.297 (29.519)	Top-5 acc 50.781 (52.751)	lr 0.00608
Warmup Train [31][3020/3239]	Time 0.556 (0.517)	Data 0.001 (0.013)	Loss 4.2307 (4.0855)	Top-1 acc 29.297 (29.517)	Top-5 acc 48.047 (52.750)	lr 0.00608
Warmup Train [31][3030/3239]	Time 0.644 (0.517)	Data 0.001 (0.013)	Loss 4.1279 (4.0854)	Top-1 acc 28.906 (29.517)	Top-5 acc 49.219 (52.749)	lr 0.00607
Warmup Train [31][3040/3239]	Time 0.533 (0.517)	Data 0.001 (0.012)	Loss 4.0346 (4.0855)	Top-1 acc 29.297 (29.517)	Top-5 acc 54.297 (52.749)	lr 0.00607
Warmup Train [31][3050/3239]	Time 0.624 (0.517)	Data 0.001 (0.012)	Loss 3.9779 (4.0855)	Top-1 acc 36.719 (29.519)	Top-5 acc 57.422 (52.751)	lr 0.00606
Warmup Train [31][3060/3239]	Time 0.510 (0.517)	Data 0.001 (0.012)	Loss 4.1376 (4.0857)	Top-1 acc 31.250 (29.518)	Top-5 acc 54.688 (52.746)	lr 0.00606
Warmup Train [31][3070/3239]	Time 0.500 (0.517)	Data 0.001 (0.012)	Loss 4.1592 (4.0857)	Top-1 acc 28.906 (29.516)	Top-5 acc 51.562 (52.746)	lr 0.00606
Warmup Train [31][3080/3239]	Time 0.555 (0.517)	Data 0.001 (0.012)	Loss 4.2558 (4.0857)	Top-1 acc 28.516 (29.515)	Top-5 acc 46.875 (52.746)	lr 0.00605
Warmup Train [31][3090/3239]	Time 0.587 (0.517)	Data 0.001 (0.012)	Loss 4.0852 (4.0856)	Top-1 acc 30.469 (29.516)	Top-5 acc 50.781 (52.747)	lr 0.00605
Warmup Train [31][3100/3239]	Time 0.517 (0.517)	Data 0.001 (0.012)	Loss 3.9237 (4.0855)	Top-1 acc 33.594 (29.517)	Top-5 acc 53.906 (52.748)	lr 0.00605
Warmup Train [31][3110/3239]	Time 0.428 (0.517)	Data 0.001 (0.012)	Loss 4.1288 (4.0854)	Top-1 acc 29.688 (29.521)	Top-5 acc 53.125 (52.753)	lr 0.00604
Warmup Train [31][3120/3239]	Time 0.522 (0.517)	Data 0.001 (0.012)	Loss 4.0887 (4.0853)	Top-1 acc 30.078 (29.519)	Top-5 acc 51.953 (52.755)	lr 0.00604
Warmup Train [31][3130/3239]	Time 0.500 (0.517)	Data 0.001 (0.012)	Loss 4.0069 (4.0852)	Top-1 acc 30.078 (29.523)	Top-5 acc 54.688 (52.757)	lr 0.00603
Warmup Train [31][3140/3239]	Time 0.443 (0.516)	Data 0.001 (0.012)	Loss 3.9508 (4.0853)	Top-1 acc 31.250 (29.522)	Top-5 acc 55.078 (52.755)	lr 0.00603
Warmup Train [31][3150/3239]	Time 0.535 (0.516)	Data 0.001 (0.012)	Loss 4.0134 (4.0850)	Top-1 acc 25.391 (29.527)	Top-5 acc 53.906 (52.765)	lr 0.00603
Warmup Train [31][3160/3239]	Time 0.366 (0.516)	Data 0.002 (0.012)	Loss 4.0263 (4.0849)	Top-1 acc 33.203 (29.530)	Top-5 acc 55.469 (52.766)	lr 0.00602
Warmup Train [31][3170/3239]	Time 0.497 (0.516)	Data 0.001 (0.012)	Loss 4.1488 (4.0849)	Top-1 acc 29.688 (29.529)	Top-5 acc 49.609 (52.768)	lr 0.00602
Warmup Train [31][3180/3239]	Time 0.470 (0.516)	Data 0.000 (0.012)	Loss 3.9754 (4.0849)	Top-1 acc 32.422 (29.532)	Top-5 acc 51.172 (52.769)	lr 0.00601
Warmup Train [31][3190/3239]	Time 0.585 (0.516)	Data 0.000 (0.012)	Loss 4.1305 (4.0847)	Top-1 acc 26.172 (29.531)	Top-5 acc 52.344 (52.771)	lr 0.00601
Warmup Train [31][3200/3239]	Time 0.433 (0.516)	Data 0.000 (0.012)	Loss 4.0647 (4.0848)	Top-1 acc 29.297 (29.527)	Top-5 acc 55.469 (52.769)	lr 0.00601
Warmup Train [31][3210/3239]	Time 0.508 (0.516)	Data 0.000 (0.012)	Loss 4.1226 (4.0849)	Top-1 acc 26.562 (29.525)	Top-5 acc 50.781 (52.766)	lr 0.00600
Warmup Train [31][3220/3239]	Time 0.567 (0.516)	Data 0.000 (0.012)	Loss 4.0342 (4.0850)	Top-1 acc 29.688 (29.519)	Top-5 acc 55.078 (52.765)	lr 0.00600
Warmup Train [31][3230/3239]	Time 0.536 (0.516)	Data 0.000 (0.012)	Loss 4.0422 (4.0851)	Top-1 acc 33.984 (29.522)	Top-5 acc 54.688 (52.765)	lr 0.00599
Warmup Train [31][3239/3239]	Time 0.352 (0.516)	Data 0.000 (0.012)	Loss 4.0918 (4.0851)	Top-1 acc 22.222 (29.519)	Top-5 acc 56.790 (52.767)	lr 0.00599
==========Warmup Valid [31/40]	loss 3.028	top-1 acc 36.748	top-5 acc 61.843	Train top-1 29.519	top-5 52.767	flops: 442.4M
Warmup Train [32][0/3239]	Time 19.367 (19.367)	Data 16.530 (16.530)	Loss 4.3022 (4.3022)	Top-1 acc 24.609 (24.609)	Top-5 acc 47.656 (47.656)	lr 0.00599
Warmup Train [32][10/3239]	Time 0.573 (2.267)	Data 0.001 (1.511)	Loss 4.1646 (4.0577)	Top-1 acc 25.000 (30.043)	Top-5 acc 49.609 (52.663)	lr 0.00599
Warmup Train [32][20/3239]	Time 0.533 (1.439)	Data 0.002 (0.792)	Loss 4.1875 (4.0626)	Top-1 acc 30.469 (30.506)	Top-5 acc 51.562 (53.237)	lr 0.00598
Warmup Train [32][30/3239]	Time 0.522 (1.134)	Data 0.001 (0.537)	Loss 4.2071 (4.0833)	Top-1 acc 25.391 (29.751)	Top-5 acc 50.000 (52.747)	lr 0.00598
Warmup Train [32][40/3239]	Time 0.519 (0.979)	Data 0.001 (0.407)	Loss 4.1282 (4.0938)	Top-1 acc 26.562 (29.163)	Top-5 acc 55.078 (52.611)	lr 0.00597
Warmup Train [32][50/3239]	Time 0.463 (0.885)	Data 0.001 (0.327)	Loss 3.8648 (4.0753)	Top-1 acc 32.422 (29.596)	Top-5 acc 57.031 (53.002)	lr 0.00597
Warmup Train [32][60/3239]	Time 0.477 (0.823)	Data 0.001 (0.274)	Loss 4.4163 (4.0679)	Top-1 acc 26.172 (29.707)	Top-5 acc 42.578 (53.016)	lr 0.00597
Warmup Train [32][70/3239]	Time 0.452 (0.777)	Data 0.001 (0.236)	Loss 4.0169 (4.0694)	Top-1 acc 30.078 (29.770)	Top-5 acc 53.125 (53.081)	lr 0.00596
Warmup Train [32][80/3239]	Time 0.672 (0.746)	Data 0.001 (0.209)	Loss 3.8743 (4.0710)	Top-1 acc 32.812 (29.837)	Top-5 acc 58.594 (52.942)	lr 0.00596
Warmup Train [32][90/3239]	Time 0.572 (0.719)	Data 0.001 (0.186)	Loss 4.1429 (4.0743)	Top-1 acc 25.391 (29.683)	Top-5 acc 52.344 (52.825)	lr 0.00595
Warmup Train [32][100/3239]	Time 0.469 (0.696)	Data 0.001 (0.168)	Loss 4.0341 (4.0754)	Top-1 acc 31.641 (29.571)	Top-5 acc 51.953 (52.831)	lr 0.00595
Warmup Train [32][110/3239]	Time 0.402 (0.679)	Data 0.001 (0.154)	Loss 4.2089 (4.0724)	Top-1 acc 26.953 (29.603)	Top-5 acc 48.828 (52.910)	lr 0.00595
Warmup Train [32][120/3239]	Time 0.469 (0.664)	Data 0.001 (0.142)	Loss 4.1528 (4.0735)	Top-1 acc 28.125 (29.665)	Top-5 acc 52.734 (52.973)	lr 0.00594
Warmup Train [32][130/3239]	Time 0.393 (0.652)	Data 0.001 (0.132)	Loss 4.0552 (4.0733)	Top-1 acc 28.516 (29.702)	Top-5 acc 51.562 (52.940)	lr 0.00594
Warmup Train [32][140/3239]	Time 0.502 (0.645)	Data 0.001 (0.124)	Loss 3.9304 (4.0712)	Top-1 acc 32.031 (29.790)	Top-5 acc 57.031 (52.964)	lr 0.00593
Warmup Train [32][150/3239]	Time 0.451 (0.637)	Data 0.001 (0.116)	Loss 4.2164 (4.0722)	Top-1 acc 27.734 (29.786)	Top-5 acc 48.438 (52.993)	lr 0.00593
Warmup Train [32][160/3239]	Time 0.666 (0.630)	Data 0.001 (0.110)	Loss 4.2374 (4.0745)	Top-1 acc 26.953 (29.707)	Top-5 acc 50.391 (52.987)	lr 0.00593
Warmup Train [32][170/3239]	Time 0.638 (0.626)	Data 0.001 (0.103)	Loss 4.0486 (4.0715)	Top-1 acc 30.469 (29.793)	Top-5 acc 54.688 (53.029)	lr 0.00592
Warmup Train [32][180/3239]	Time 0.640 (0.619)	Data 0.001 (0.098)	Loss 4.1766 (4.0731)	Top-1 acc 29.688 (29.817)	Top-5 acc 51.953 (52.985)	lr 0.00592
Warmup Train [32][190/3239]	Time 0.652 (0.614)	Data 0.001 (0.093)	Loss 4.1467 (4.0772)	Top-1 acc 30.078 (29.728)	Top-5 acc 52.344 (52.941)	lr 0.00592
Warmup Train [32][200/3239]	Time 0.627 (0.609)	Data 0.001 (0.088)	Loss 4.1901 (4.0794)	Top-1 acc 29.297 (29.730)	Top-5 acc 52.344 (52.933)	lr 0.00591
Warmup Train [32][210/3239]	Time 0.408 (0.604)	Data 0.001 (0.084)	Loss 4.1346 (4.0814)	Top-1 acc 27.734 (29.682)	Top-5 acc 51.172 (52.879)	lr 0.00591
Warmup Train [32][220/3239]	Time 0.434 (0.599)	Data 0.001 (0.081)	Loss 4.1304 (4.0801)	Top-1 acc 29.688 (29.710)	Top-5 acc 51.172 (52.867)	lr 0.00590
Warmup Train [32][230/3239]	Time 0.418 (0.597)	Data 0.001 (0.078)	Loss 4.2410 (4.0801)	Top-1 acc 27.734 (29.764)	Top-5 acc 49.219 (52.849)	lr 0.00590
Warmup Train [32][240/3239]	Time 0.367 (0.592)	Data 0.001 (0.075)	Loss 4.0149 (4.0802)	Top-1 acc 31.250 (29.767)	Top-5 acc 54.297 (52.840)	lr 0.00590
Warmup Train [32][250/3239]	Time 0.604 (0.587)	Data 0.001 (0.073)	Loss 3.9688 (4.0808)	Top-1 acc 32.812 (29.737)	Top-5 acc 54.688 (52.846)	lr 0.00589
Warmup Train [32][260/3239]	Time 0.362 (0.582)	Data 0.001 (0.070)	Loss 4.1310 (4.0793)	Top-1 acc 30.859 (29.716)	Top-5 acc 52.734 (52.889)	lr 0.00589
Warmup Train [32][270/3239]	Time 0.420 (0.579)	Data 0.001 (0.068)	Loss 4.0520 (4.0770)	Top-1 acc 26.953 (29.757)	Top-5 acc 52.344 (52.913)	lr 0.00588
Warmup Train [32][280/3239]	Time 0.510 (0.577)	Data 0.001 (0.066)	Loss 3.8026 (4.0752)	Top-1 acc 38.672 (29.811)	Top-5 acc 60.547 (52.972)	lr 0.00588
Warmup Train [32][290/3239]	Time 0.591 (0.575)	Data 0.001 (0.064)	Loss 4.0298 (4.0752)	Top-1 acc 28.125 (29.792)	Top-5 acc 55.859 (52.973)	lr 0.00588
Warmup Train [32][300/3239]	Time 0.448 (0.573)	Data 0.001 (0.062)	Loss 4.0710 (4.0766)	Top-1 acc 26.562 (29.746)	Top-5 acc 54.688 (52.967)	lr 0.00587
Warmup Train [32][310/3239]	Time 0.563 (0.570)	Data 0.001 (0.060)	Loss 3.9224 (4.0772)	Top-1 acc 32.812 (29.750)	Top-5 acc 54.688 (52.929)	lr 0.00587
Warmup Train [32][320/3239]	Time 0.547 (0.568)	Data 0.001 (0.058)	Loss 4.0674 (4.0768)	Top-1 acc 30.469 (29.762)	Top-5 acc 52.734 (52.947)	lr 0.00586
Warmup Train [32][330/3239]	Time 0.563 (0.567)	Data 0.001 (0.057)	Loss 4.3380 (4.0786)	Top-1 acc 27.344 (29.713)	Top-5 acc 45.703 (52.900)	lr 0.00586
Warmup Train [32][340/3239]	Time 0.543 (0.565)	Data 0.001 (0.055)	Loss 3.9906 (4.0793)	Top-1 acc 26.562 (29.732)	Top-5 acc 49.219 (52.888)	lr 0.00586
Warmup Train [32][350/3239]	Time 0.471 (0.564)	Data 0.001 (0.054)	Loss 4.2359 (4.0793)	Top-1 acc 25.781 (29.733)	Top-5 acc 48.828 (52.884)	lr 0.00585
Warmup Train [32][360/3239]	Time 0.595 (0.562)	Data 0.001 (0.053)	Loss 4.1057 (4.0787)	Top-1 acc 27.344 (29.748)	Top-5 acc 51.953 (52.871)	lr 0.00585
Warmup Train [32][370/3239]	Time 0.352 (0.561)	Data 0.001 (0.052)	Loss 4.1862 (4.0786)	Top-1 acc 27.344 (29.734)	Top-5 acc 50.391 (52.884)	lr 0.00584
Warmup Train [32][380/3239]	Time 0.430 (0.560)	Data 0.001 (0.051)	Loss 4.2558 (4.0777)	Top-1 acc 24.219 (29.736)	Top-5 acc 47.656 (52.877)	lr 0.00584
Warmup Train [32][390/3239]	Time 0.455 (0.559)	Data 0.001 (0.050)	Loss 3.8162 (4.0767)	Top-1 acc 35.156 (29.769)	Top-5 acc 57.422 (52.910)	lr 0.00584
Warmup Train [32][400/3239]	Time 0.549 (0.558)	Data 0.001 (0.048)	Loss 4.0476 (4.0775)	Top-1 acc 30.859 (29.735)	Top-5 acc 51.172 (52.901)	lr 0.00583
Warmup Train [32][410/3239]	Time 0.462 (0.557)	Data 0.001 (0.047)	Loss 4.1037 (4.0767)	Top-1 acc 28.906 (29.730)	Top-5 acc 54.297 (52.924)	lr 0.00583
Warmup Train [32][420/3239]	Time 0.512 (0.556)	Data 0.001 (0.046)	Loss 4.1259 (4.0773)	Top-1 acc 26.953 (29.706)	Top-5 acc 55.078 (52.933)	lr 0.00583
Warmup Train [32][430/3239]	Time 0.624 (0.556)	Data 0.001 (0.046)	Loss 4.0969 (4.0763)	Top-1 acc 30.469 (29.734)	Top-5 acc 54.297 (52.947)	lr 0.00582
Warmup Train [32][440/3239]	Time 0.621 (0.555)	Data 0.001 (0.045)	Loss 4.0038 (4.0754)	Top-1 acc 29.688 (29.726)	Top-5 acc 55.078 (52.979)	lr 0.00582
Warmup Train [32][450/3239]	Time 0.506 (0.554)	Data 0.001 (0.044)	Loss 4.0708 (4.0764)	Top-1 acc 27.734 (29.702)	Top-5 acc 52.344 (52.962)	lr 0.00581
Warmup Train [32][460/3239]	Time 0.646 (0.553)	Data 0.001 (0.043)	Loss 3.9624 (4.0753)	Top-1 acc 32.422 (29.744)	Top-5 acc 51.172 (52.971)	lr 0.00581
Warmup Train [32][470/3239]	Time 0.614 (0.552)	Data 0.001 (0.042)	Loss 4.1157 (4.0761)	Top-1 acc 30.078 (29.743)	Top-5 acc 55.078 (52.973)	lr 0.00581
Warmup Train [32][480/3239]	Time 0.392 (0.552)	Data 0.001 (0.041)	Loss 4.0470 (4.0769)	Top-1 acc 30.078 (29.718)	Top-5 acc 53.125 (52.964)	lr 0.00580
Warmup Train [32][490/3239]	Time 0.575 (0.551)	Data 0.001 (0.041)	Loss 3.9585 (4.0774)	Top-1 acc 33.594 (29.688)	Top-5 acc 56.641 (52.944)	lr 0.00580
Warmup Train [32][500/3239]	Time 0.481 (0.549)	Data 0.001 (0.040)	Loss 4.1003 (4.0772)	Top-1 acc 30.859 (29.692)	Top-5 acc 51.172 (52.947)	lr 0.00579
Warmup Train [32][510/3239]	Time 0.543 (0.548)	Data 0.001 (0.039)	Loss 4.2074 (4.0774)	Top-1 acc 26.562 (29.697)	Top-5 acc 48.438 (52.954)	lr 0.00579
Warmup Train [32][520/3239]	Time 0.520 (0.547)	Data 0.001 (0.039)	Loss 3.9648 (4.0779)	Top-1 acc 30.859 (29.665)	Top-5 acc 53.516 (52.954)	lr 0.00579
Warmup Train [32][530/3239]	Time 0.499 (0.546)	Data 0.001 (0.038)	Loss 4.1274 (4.0772)	Top-1 acc 29.297 (29.686)	Top-5 acc 51.953 (52.976)	lr 0.00578
Warmup Train [32][540/3239]	Time 0.381 (0.544)	Data 0.001 (0.037)	Loss 4.1036 (4.0773)	Top-1 acc 27.734 (29.700)	Top-5 acc 51.172 (52.981)	lr 0.00578
Warmup Train [32][550/3239]	Time 0.543 (0.545)	Data 0.001 (0.037)	Loss 4.1241 (4.0772)	Top-1 acc 28.516 (29.705)	Top-5 acc 51.172 (52.990)	lr 0.00578
Warmup Train [32][560/3239]	Time 0.535 (0.544)	Data 0.023 (0.036)	Loss 4.1561 (4.0769)	Top-1 acc 28.516 (29.679)	Top-5 acc 48.438 (52.967)	lr 0.00577
Warmup Train [32][570/3239]	Time 0.477 (0.544)	Data 0.001 (0.036)	Loss 3.9978 (4.0764)	Top-1 acc 28.125 (29.690)	Top-5 acc 54.688 (52.974)	lr 0.00577
Warmup Train [32][580/3239]	Time 0.691 (0.543)	Data 0.001 (0.035)	Loss 4.0952 (4.0755)	Top-1 acc 27.734 (29.700)	Top-5 acc 53.125 (52.997)	lr 0.00576
Warmup Train [32][590/3239]	Time 0.589 (0.543)	Data 0.001 (0.035)	Loss 3.8212 (4.0742)	Top-1 acc 36.328 (29.704)	Top-5 acc 58.203 (53.016)	lr 0.00576
Warmup Train [32][600/3239]	Time 0.594 (0.542)	Data 0.001 (0.034)	Loss 4.0776 (4.0740)	Top-1 acc 30.859 (29.702)	Top-5 acc 56.641 (53.032)	lr 0.00576
Warmup Train [32][610/3239]	Time 0.570 (0.542)	Data 0.001 (0.034)	Loss 3.9994 (4.0732)	Top-1 acc 31.250 (29.719)	Top-5 acc 55.078 (53.050)	lr 0.00575
Warmup Train [32][620/3239]	Time 0.437 (0.541)	Data 0.001 (0.033)	Loss 3.9372 (4.0734)	Top-1 acc 32.422 (29.721)	Top-5 acc 55.469 (53.040)	lr 0.00575
Warmup Train [32][630/3239]	Time 0.410 (0.541)	Data 0.001 (0.033)	Loss 4.1550 (4.0733)	Top-1 acc 32.031 (29.726)	Top-5 acc 53.125 (53.054)	lr 0.00574
Warmup Train [32][640/3239]	Time 0.762 (0.541)	Data 0.001 (0.032)	Loss 3.9753 (4.0738)	Top-1 acc 33.203 (29.723)	Top-5 acc 54.297 (53.058)	lr 0.00574
Warmup Train [32][650/3239]	Time 0.507 (0.540)	Data 0.001 (0.032)	Loss 4.0022 (4.0742)	Top-1 acc 27.344 (29.724)	Top-5 acc 56.250 (53.067)	lr 0.00574
Warmup Train [32][660/3239]	Time 0.606 (0.540)	Data 0.001 (0.031)	Loss 3.7362 (4.0742)	Top-1 acc 37.891 (29.742)	Top-5 acc 60.547 (53.071)	lr 0.00573
Warmup Train [32][670/3239]	Time 0.343 (0.539)	Data 0.001 (0.031)	Loss 4.0518 (4.0747)	Top-1 acc 30.859 (29.748)	Top-5 acc 54.688 (53.077)	lr 0.00573
Warmup Train [32][680/3239]	Time 0.547 (0.539)	Data 0.001 (0.031)	Loss 4.0800 (4.0750)	Top-1 acc 25.000 (29.729)	Top-5 acc 50.781 (53.056)	lr 0.00572
Warmup Train [32][690/3239]	Time 0.350 (0.539)	Data 0.001 (0.030)	Loss 4.3278 (4.0753)	Top-1 acc 25.781 (29.723)	Top-5 acc 44.141 (53.032)	lr 0.00572
Warmup Train [32][700/3239]	Time 0.551 (0.538)	Data 0.001 (0.030)	Loss 3.9743 (4.0748)	Top-1 acc 30.859 (29.734)	Top-5 acc 55.469 (53.048)	lr 0.00572
Warmup Train [32][710/3239]	Time 0.572 (0.538)	Data 0.001 (0.030)	Loss 3.9166 (4.0747)	Top-1 acc 33.984 (29.738)	Top-5 acc 58.984 (53.057)	lr 0.00571
Warmup Train [32][720/3239]	Time 0.646 (0.537)	Data 0.001 (0.029)	Loss 4.0189 (4.0754)	Top-1 acc 29.688 (29.729)	Top-5 acc 52.734 (53.039)	lr 0.00571
Warmup Train [32][730/3239]	Time 0.538 (0.537)	Data 0.001 (0.029)	Loss 3.9778 (4.0749)	Top-1 acc 37.891 (29.739)	Top-5 acc 55.078 (53.058)	lr 0.00571
Warmup Train [32][740/3239]	Time 0.511 (0.537)	Data 0.001 (0.029)	Loss 3.9300 (4.0743)	Top-1 acc 37.109 (29.754)	Top-5 acc 58.203 (53.066)	lr 0.00570
Warmup Train [32][750/3239]	Time 0.507 (0.536)	Data 0.001 (0.028)	Loss 4.0559 (4.0743)	Top-1 acc 30.078 (29.754)	Top-5 acc 53.516 (53.053)	lr 0.00570
Warmup Train [32][760/3239]	Time 0.505 (0.536)	Data 0.001 (0.028)	Loss 3.8727 (4.0735)	Top-1 acc 30.859 (29.772)	Top-5 acc 55.469 (53.058)	lr 0.00569
Warmup Train [32][770/3239]	Time 0.600 (0.536)	Data 0.001 (0.028)	Loss 4.1978 (4.0731)	Top-1 acc 33.203 (29.786)	Top-5 acc 52.344 (53.063)	lr 0.00569
Warmup Train [32][780/3239]	Time 0.509 (0.535)	Data 0.001 (0.027)	Loss 4.1414 (4.0735)	Top-1 acc 28.906 (29.782)	Top-5 acc 50.391 (53.052)	lr 0.00569
Warmup Train [32][790/3239]	Time 0.465 (0.535)	Data 0.001 (0.027)	Loss 3.8837 (4.0736)	Top-1 acc 33.594 (29.773)	Top-5 acc 55.859 (53.038)	lr 0.00568
Warmup Train [32][800/3239]	Time 0.510 (0.534)	Data 0.001 (0.027)	Loss 4.1408 (4.0733)	Top-1 acc 28.125 (29.783)	Top-5 acc 52.344 (53.046)	lr 0.00568
Warmup Train [32][810/3239]	Time 0.596 (0.534)	Data 0.001 (0.027)	Loss 4.0230 (4.0735)	Top-1 acc 30.469 (29.767)	Top-5 acc 55.859 (53.048)	lr 0.00567
Warmup Train [32][820/3239]	Time 0.625 (0.533)	Data 0.001 (0.026)	Loss 4.1279 (4.0735)	Top-1 acc 32.422 (29.777)	Top-5 acc 55.859 (53.050)	lr 0.00567
Warmup Train [32][830/3239]	Time 0.409 (0.533)	Data 0.001 (0.026)	Loss 4.0972 (4.0735)	Top-1 acc 30.078 (29.779)	Top-5 acc 53.125 (53.043)	lr 0.00567
Warmup Train [32][840/3239]	Time 0.659 (0.533)	Data 0.001 (0.026)	Loss 4.1174 (4.0732)	Top-1 acc 30.078 (29.793)	Top-5 acc 55.078 (53.047)	lr 0.00566
Warmup Train [32][850/3239]	Time 0.371 (0.533)	Data 0.001 (0.026)	Loss 3.9251 (4.0728)	Top-1 acc 32.422 (29.824)	Top-5 acc 56.250 (53.060)	lr 0.00566
Warmup Train [32][860/3239]	Time 0.360 (0.532)	Data 0.001 (0.025)	Loss 4.1952 (4.0740)	Top-1 acc 30.859 (29.807)	Top-5 acc 49.219 (53.037)	lr 0.00566
Warmup Train [32][870/3239]	Time 0.463 (0.532)	Data 0.001 (0.025)	Loss 3.9341 (4.0747)	Top-1 acc 33.594 (29.800)	Top-5 acc 54.297 (53.021)	lr 0.00565
Warmup Train [32][880/3239]	Time 0.360 (0.532)	Data 0.001 (0.025)	Loss 4.1972 (4.0749)	Top-1 acc 28.516 (29.803)	Top-5 acc 47.266 (53.013)	lr 0.00565
Warmup Train [32][890/3239]	Time 0.433 (0.532)	Data 0.001 (0.025)	Loss 3.9900 (4.0745)	Top-1 acc 31.250 (29.823)	Top-5 acc 56.250 (53.024)	lr 0.00564
Warmup Train [32][900/3239]	Time 0.502 (0.532)	Data 0.001 (0.025)	Loss 3.9205 (4.0745)	Top-1 acc 33.594 (29.815)	Top-5 acc 55.859 (53.021)	lr 0.00564
Warmup Train [32][910/3239]	Time 0.701 (0.532)	Data 0.001 (0.025)	Loss 4.0405 (4.0742)	Top-1 acc 30.859 (29.815)	Top-5 acc 52.344 (53.026)	lr 0.00564
Warmup Train [32][920/3239]	Time 0.460 (0.531)	Data 0.001 (0.024)	Loss 4.2738 (4.0737)	Top-1 acc 28.125 (29.826)	Top-5 acc 50.781 (53.033)	lr 0.00563
Warmup Train [32][930/3239]	Time 0.624 (0.531)	Data 0.001 (0.024)	Loss 4.0915 (4.0743)	Top-1 acc 29.688 (29.810)	Top-5 acc 51.953 (53.013)	lr 0.00563
Warmup Train [32][940/3239]	Time 0.406 (0.531)	Data 0.001 (0.024)	Loss 4.0155 (4.0736)	Top-1 acc 30.078 (29.814)	Top-5 acc 50.000 (53.031)	lr 0.00562
Warmup Train [32][950/3239]	Time 0.515 (0.531)	Data 0.001 (0.024)	Loss 4.0141 (4.0732)	Top-1 acc 28.125 (29.821)	Top-5 acc 54.297 (53.039)	lr 0.00562
Warmup Train [32][960/3239]	Time 0.725 (0.531)	Data 0.001 (0.024)	Loss 4.1245 (4.0731)	Top-1 acc 30.078 (29.825)	Top-5 acc 52.734 (53.046)	lr 0.00562
Warmup Train [32][970/3239]	Time 0.620 (0.531)	Data 0.001 (0.023)	Loss 4.0080 (4.0729)	Top-1 acc 32.422 (29.822)	Top-5 acc 56.641 (53.048)	lr 0.00561
Warmup Train [32][980/3239]	Time 0.625 (0.531)	Data 0.001 (0.023)	Loss 3.9675 (4.0732)	Top-1 acc 29.688 (29.809)	Top-5 acc 54.297 (53.042)	lr 0.00561
Warmup Train [32][990/3239]	Time 0.622 (0.530)	Data 0.001 (0.023)	Loss 4.0665 (4.0727)	Top-1 acc 27.734 (29.815)	Top-5 acc 52.344 (53.058)	lr 0.00561
Warmup Train [32][1000/3239]	Time 0.488 (0.530)	Data 0.001 (0.023)	Loss 4.1269 (4.0728)	Top-1 acc 28.125 (29.802)	Top-5 acc 51.562 (53.051)	lr 0.00560
Warmup Train [32][1010/3239]	Time 0.624 (0.530)	Data 0.001 (0.023)	Loss 3.8489 (4.0732)	Top-1 acc 35.547 (29.781)	Top-5 acc 57.812 (53.041)	lr 0.00560
Warmup Train [32][1020/3239]	Time 0.725 (0.530)	Data 0.001 (0.022)	Loss 4.1020 (4.0735)	Top-1 acc 30.078 (29.775)	Top-5 acc 53.125 (53.044)	lr 0.00559
Warmup Train [32][1030/3239]	Time 0.643 (0.530)	Data 0.001 (0.022)	Loss 4.1533 (4.0735)	Top-1 acc 28.125 (29.784)	Top-5 acc 51.172 (53.033)	lr 0.00559
Warmup Train [32][1040/3239]	Time 0.532 (0.530)	Data 0.001 (0.022)	Loss 4.1342 (4.0735)	Top-1 acc 28.125 (29.790)	Top-5 acc 51.953 (53.030)	lr 0.00559
Warmup Train [32][1050/3239]	Time 0.552 (0.530)	Data 0.001 (0.022)	Loss 3.9040 (4.0736)	Top-1 acc 32.031 (29.787)	Top-5 acc 58.594 (53.024)	lr 0.00558
Warmup Train [32][1060/3239]	Time 0.461 (0.529)	Data 0.001 (0.022)	Loss 4.0321 (4.0731)	Top-1 acc 33.984 (29.800)	Top-5 acc 53.516 (53.026)	lr 0.00558
Warmup Train [32][1070/3239]	Time 0.157 (0.528)	Data 0.002 (0.021)	Loss 3.9534 (4.0734)	Top-1 acc 29.688 (29.791)	Top-5 acc 57.422 (53.019)	lr 0.00558
Warmup Train [32][1080/3239]	Time 0.615 (0.528)	Data 0.001 (0.021)	Loss 3.9724 (4.0733)	Top-1 acc 31.250 (29.789)	Top-5 acc 55.859 (53.015)	lr 0.00557
Warmup Train [32][1090/3239]	Time 0.225 (0.528)	Data 0.001 (0.021)	Loss 3.9839 (4.0735)	Top-1 acc 28.906 (29.790)	Top-5 acc 52.344 (53.012)	lr 0.00557
Warmup Train [32][1100/3239]	Time 0.508 (0.527)	Data 0.001 (0.021)	Loss 3.9546 (4.0737)	Top-1 acc 34.375 (29.795)	Top-5 acc 55.859 (53.013)	lr 0.00556
Warmup Train [32][1110/3239]	Time 0.463 (0.527)	Data 0.001 (0.021)	Loss 4.2158 (4.0737)	Top-1 acc 25.000 (29.797)	Top-5 acc 49.609 (53.013)	lr 0.00556
Warmup Train [32][1120/3239]	Time 0.392 (0.527)	Data 0.001 (0.021)	Loss 4.1068 (4.0739)	Top-1 acc 26.562 (29.791)	Top-5 acc 51.172 (53.003)	lr 0.00556
Warmup Train [32][1130/3239]	Time 0.489 (0.527)	Data 0.001 (0.021)	Loss 4.0318 (4.0741)	Top-1 acc 28.516 (29.782)	Top-5 acc 53.516 (52.999)	lr 0.00555
Warmup Train [32][1140/3239]	Time 0.743 (0.527)	Data 0.001 (0.021)	Loss 3.8162 (4.0735)	Top-1 acc 33.594 (29.794)	Top-5 acc 61.719 (53.023)	lr 0.00555
Warmup Train [32][1150/3239]	Time 0.500 (0.527)	Data 0.001 (0.020)	Loss 4.1909 (4.0735)	Top-1 acc 26.953 (29.788)	Top-5 acc 45.703 (53.013)	lr 0.00554
Warmup Train [32][1160/3239]	Time 0.547 (0.527)	Data 0.001 (0.020)	Loss 4.0093 (4.0733)	Top-1 acc 28.906 (29.792)	Top-5 acc 54.297 (53.023)	lr 0.00554
Warmup Train [32][1170/3239]	Time 0.520 (0.527)	Data 0.001 (0.020)	Loss 3.9540 (4.0726)	Top-1 acc 33.203 (29.805)	Top-5 acc 58.984 (53.036)	lr 0.00554
Warmup Train [32][1180/3239]	Time 0.609 (0.527)	Data 0.001 (0.020)	Loss 4.0746 (4.0719)	Top-1 acc 31.250 (29.814)	Top-5 acc 53.516 (53.051)	lr 0.00553
Warmup Train [32][1190/3239]	Time 0.406 (0.526)	Data 0.001 (0.020)	Loss 4.0333 (4.0716)	Top-1 acc 29.688 (29.817)	Top-5 acc 53.906 (53.061)	lr 0.00553
Warmup Train [32][1200/3239]	Time 0.358 (0.527)	Data 0.001 (0.020)	Loss 4.1780 (4.0713)	Top-1 acc 30.859 (29.821)	Top-5 acc 51.953 (53.064)	lr 0.00553
Warmup Train [32][1210/3239]	Time 0.702 (0.527)	Data 0.001 (0.020)	Loss 3.9656 (4.0717)	Top-1 acc 29.688 (29.812)	Top-5 acc 53.516 (53.062)	lr 0.00552
Warmup Train [32][1220/3239]	Time 0.615 (0.526)	Data 0.001 (0.020)	Loss 3.9730 (4.0717)	Top-1 acc 33.594 (29.814)	Top-5 acc 55.469 (53.067)	lr 0.00552
Warmup Train [32][1230/3239]	Time 0.675 (0.526)	Data 0.001 (0.020)	Loss 3.9202 (4.0714)	Top-1 acc 37.109 (29.820)	Top-5 acc 59.375 (53.075)	lr 0.00551
Warmup Train [32][1240/3239]	Time 0.674 (0.526)	Data 0.001 (0.019)	Loss 4.0920 (4.0712)	Top-1 acc 31.641 (29.823)	Top-5 acc 51.953 (53.085)	lr 0.00551
Warmup Train [32][1250/3239]	Time 0.383 (0.526)	Data 0.001 (0.019)	Loss 4.0943 (4.0716)	Top-1 acc 32.031 (29.825)	Top-5 acc 50.781 (53.072)	lr 0.00551
Warmup Train [32][1260/3239]	Time 0.643 (0.526)	Data 0.001 (0.019)	Loss 4.1513 (4.0721)	Top-1 acc 30.859 (29.817)	Top-5 acc 51.562 (53.066)	lr 0.00550
Warmup Train [32][1270/3239]	Time 0.529 (0.526)	Data 0.001 (0.019)	Loss 3.8831 (4.0719)	Top-1 acc 32.422 (29.828)	Top-5 acc 57.812 (53.074)	lr 0.00550
Warmup Train [32][1280/3239]	Time 0.671 (0.526)	Data 0.001 (0.019)	Loss 4.1321 (4.0716)	Top-1 acc 30.078 (29.835)	Top-5 acc 53.906 (53.087)	lr 0.00550
Warmup Train [32][1290/3239]	Time 0.574 (0.526)	Data 0.001 (0.019)	Loss 4.1336 (4.0718)	Top-1 acc 27.344 (29.823)	Top-5 acc 50.391 (53.084)	lr 0.00549
Warmup Train [32][1300/3239]	Time 0.422 (0.526)	Data 0.001 (0.019)	Loss 4.0263 (4.0716)	Top-1 acc 32.812 (29.830)	Top-5 acc 52.734 (53.089)	lr 0.00549
Warmup Train [32][1310/3239]	Time 0.512 (0.526)	Data 0.001 (0.019)	Loss 4.0906 (4.0720)	Top-1 acc 27.344 (29.821)	Top-5 acc 53.125 (53.074)	lr 0.00548
Warmup Train [32][1320/3239]	Time 0.352 (0.526)	Data 0.001 (0.019)	Loss 4.2933 (4.0716)	Top-1 acc 24.609 (29.832)	Top-5 acc 48.047 (53.088)	lr 0.00548
Warmup Train [32][1330/3239]	Time 0.372 (0.525)	Data 0.001 (0.019)	Loss 3.9746 (4.0714)	Top-1 acc 30.078 (29.838)	Top-5 acc 52.734 (53.084)	lr 0.00548
Warmup Train [32][1340/3239]	Time 0.748 (0.525)	Data 0.001 (0.019)	Loss 3.7447 (4.0712)	Top-1 acc 35.938 (29.849)	Top-5 acc 63.281 (53.092)	lr 0.00547
Warmup Train [32][1350/3239]	Time 0.417 (0.525)	Data 0.001 (0.018)	Loss 4.1812 (4.0709)	Top-1 acc 28.125 (29.854)	Top-5 acc 52.344 (53.104)	lr 0.00547
Warmup Train [32][1360/3239]	Time 0.455 (0.524)	Data 0.001 (0.018)	Loss 4.1398 (4.0714)	Top-1 acc 27.344 (29.842)	Top-5 acc 54.688 (53.096)	lr 0.00547
Warmup Train [32][1370/3239]	Time 0.384 (0.524)	Data 0.001 (0.018)	Loss 3.8373 (4.0709)	Top-1 acc 34.375 (29.848)	Top-5 acc 55.859 (53.112)	lr 0.00546
Warmup Train [32][1380/3239]	Time 0.430 (0.524)	Data 0.001 (0.018)	Loss 4.1724 (4.0708)	Top-1 acc 26.562 (29.845)	Top-5 acc 55.078 (53.119)	lr 0.00546
Warmup Train [32][1390/3239]	Time 0.645 (0.524)	Data 0.001 (0.018)	Loss 3.9487 (4.0708)	Top-1 acc 29.688 (29.842)	Top-5 acc 55.078 (53.106)	lr 0.00545
Warmup Train [32][1400/3239]	Time 0.605 (0.524)	Data 0.001 (0.018)	Loss 3.9924 (4.0708)	Top-1 acc 33.203 (29.844)	Top-5 acc 54.297 (53.101)	lr 0.00545
Warmup Train [32][1410/3239]	Time 0.346 (0.523)	Data 0.001 (0.018)	Loss 4.0658 (4.0709)	Top-1 acc 30.859 (29.844)	Top-5 acc 53.125 (53.103)	lr 0.00545
Warmup Train [32][1420/3239]	Time 0.478 (0.523)	Data 0.001 (0.018)	Loss 4.0007 (4.0709)	Top-1 acc 30.078 (29.851)	Top-5 acc 55.469 (53.107)	lr 0.00544
Warmup Train [32][1430/3239]	Time 0.568 (0.523)	Data 0.001 (0.018)	Loss 3.8682 (4.0706)	Top-1 acc 30.078 (29.860)	Top-5 acc 57.812 (53.111)	lr 0.00544
Warmup Train [32][1440/3239]	Time 0.473 (0.523)	Data 0.001 (0.018)	Loss 4.3107 (4.0706)	Top-1 acc 27.344 (29.867)	Top-5 acc 49.609 (53.108)	lr 0.00543
Warmup Train [32][1450/3239]	Time 0.355 (0.523)	Data 0.001 (0.018)	Loss 4.1885 (4.0705)	Top-1 acc 28.516 (29.874)	Top-5 acc 50.000 (53.112)	lr 0.00543
Warmup Train [32][1460/3239]	Time 0.391 (0.523)	Data 0.001 (0.018)	Loss 4.0168 (4.0704)	Top-1 acc 30.469 (29.878)	Top-5 acc 52.344 (53.118)	lr 0.00543
Warmup Train [32][1470/3239]	Time 0.496 (0.523)	Data 0.001 (0.018)	Loss 4.2297 (4.0703)	Top-1 acc 27.734 (29.875)	Top-5 acc 47.656 (53.124)	lr 0.00542
Warmup Train [32][1480/3239]	Time 0.514 (0.523)	Data 0.001 (0.018)	Loss 4.0698 (4.0704)	Top-1 acc 31.641 (29.881)	Top-5 acc 51.953 (53.121)	lr 0.00542
Warmup Train [32][1490/3239]	Time 0.420 (0.522)	Data 0.001 (0.017)	Loss 4.0493 (4.0705)	Top-1 acc 30.078 (29.885)	Top-5 acc 53.125 (53.121)	lr 0.00542
Warmup Train [32][1500/3239]	Time 0.357 (0.522)	Data 0.001 (0.017)	Loss 4.2464 (4.0707)	Top-1 acc 26.172 (29.881)	Top-5 acc 51.172 (53.115)	lr 0.00541
Warmup Train [32][1510/3239]	Time 0.624 (0.522)	Data 0.001 (0.017)	Loss 4.2074 (4.0707)	Top-1 acc 28.906 (29.883)	Top-5 acc 51.172 (53.118)	lr 0.00541
Warmup Train [32][1520/3239]	Time 0.414 (0.522)	Data 0.001 (0.017)	Loss 4.1320 (4.0709)	Top-1 acc 23.828 (29.878)	Top-5 acc 50.781 (53.106)	lr 0.00540
Warmup Train [32][1530/3239]	Time 0.595 (0.522)	Data 0.001 (0.017)	Loss 4.0285 (4.0710)	Top-1 acc 30.078 (29.868)	Top-5 acc 53.516 (53.097)	lr 0.00540
Warmup Train [32][1540/3239]	Time 0.508 (0.522)	Data 0.001 (0.017)	Loss 4.0396 (4.0711)	Top-1 acc 26.953 (29.861)	Top-5 acc 51.562 (53.093)	lr 0.00540
Warmup Train [32][1550/3239]	Time 0.473 (0.522)	Data 0.001 (0.017)	Loss 3.8789 (4.0709)	Top-1 acc 32.031 (29.855)	Top-5 acc 56.250 (53.094)	lr 0.00539
Warmup Train [32][1560/3239]	Time 0.435 (0.522)	Data 0.001 (0.017)	Loss 4.1328 (4.0709)	Top-1 acc 30.859 (29.852)	Top-5 acc 52.344 (53.092)	lr 0.00539
Warmup Train [32][1570/3239]	Time 0.613 (0.522)	Data 0.001 (0.017)	Loss 3.9880 (4.0708)	Top-1 acc 33.203 (29.851)	Top-5 acc 51.953 (53.088)	lr 0.00539
Warmup Train [32][1580/3239]	Time 0.578 (0.522)	Data 0.001 (0.017)	Loss 3.9876 (4.0710)	Top-1 acc 31.641 (29.849)	Top-5 acc 59.375 (53.090)	lr 0.00538
Warmup Train [32][1590/3239]	Time 0.442 (0.522)	Data 0.001 (0.017)	Loss 4.1169 (4.0709)	Top-1 acc 30.469 (29.850)	Top-5 acc 50.391 (53.092)	lr 0.00538
Warmup Train [32][1600/3239]	Time 0.528 (0.522)	Data 0.001 (0.017)	Loss 3.9379 (4.0706)	Top-1 acc 33.984 (29.852)	Top-5 acc 54.297 (53.095)	lr 0.00537
Warmup Train [32][1610/3239]	Time 0.559 (0.522)	Data 0.001 (0.017)	Loss 3.8804 (4.0699)	Top-1 acc 33.984 (29.869)	Top-5 acc 56.250 (53.113)	lr 0.00537
Warmup Train [32][1620/3239]	Time 0.488 (0.521)	Data 0.001 (0.017)	Loss 4.0813 (4.0697)	Top-1 acc 29.688 (29.874)	Top-5 acc 55.859 (53.115)	lr 0.00537
Warmup Train [32][1630/3239]	Time 0.581 (0.521)	Data 0.001 (0.017)	Loss 4.1031 (4.0698)	Top-1 acc 30.078 (29.871)	Top-5 acc 55.078 (53.124)	lr 0.00536
Warmup Train [32][1640/3239]	Time 0.487 (0.521)	Data 0.001 (0.017)	Loss 4.1927 (4.0701)	Top-1 acc 28.125 (29.873)	Top-5 acc 46.875 (53.112)	lr 0.00536
Warmup Train [32][1650/3239]	Time 0.681 (0.521)	Data 0.001 (0.017)	Loss 3.9835 (4.0697)	Top-1 acc 33.594 (29.881)	Top-5 acc 58.203 (53.119)	lr 0.00536
Warmup Train [32][1660/3239]	Time 0.593 (0.521)	Data 0.001 (0.016)	Loss 4.0549 (4.0696)	Top-1 acc 30.859 (29.889)	Top-5 acc 59.375 (53.125)	lr 0.00535
Warmup Train [32][1670/3239]	Time 0.388 (0.521)	Data 0.001 (0.016)	Loss 4.0351 (4.0697)	Top-1 acc 32.031 (29.889)	Top-5 acc 51.172 (53.115)	lr 0.00535
Warmup Train [32][1680/3239]	Time 0.585 (0.521)	Data 0.001 (0.016)	Loss 4.0949 (4.0696)	Top-1 acc 31.250 (29.894)	Top-5 acc 52.344 (53.115)	lr 0.00534
Warmup Train [32][1690/3239]	Time 0.442 (0.521)	Data 0.001 (0.016)	Loss 4.0004 (4.0698)	Top-1 acc 32.812 (29.887)	Top-5 acc 55.078 (53.103)	lr 0.00534
Warmup Train [32][1700/3239]	Time 0.497 (0.521)	Data 0.001 (0.016)	Loss 4.0872 (4.0696)	Top-1 acc 26.562 (29.887)	Top-5 acc 53.125 (53.106)	lr 0.00534
Warmup Train [32][1710/3239]	Time 0.624 (0.521)	Data 0.001 (0.016)	Loss 4.0398 (4.0696)	Top-1 acc 30.469 (29.891)	Top-5 acc 53.516 (53.107)	lr 0.00533
Warmup Train [32][1720/3239]	Time 0.460 (0.521)	Data 0.001 (0.016)	Loss 4.0266 (4.0695)	Top-1 acc 28.125 (29.890)	Top-5 acc 54.297 (53.111)	lr 0.00533
Warmup Train [32][1730/3239]	Time 0.533 (0.520)	Data 0.001 (0.016)	Loss 3.8540 (4.0695)	Top-1 acc 35.547 (29.892)	Top-5 acc 57.422 (53.112)	lr 0.00533
Warmup Train [32][1740/3239]	Time 0.343 (0.520)	Data 0.001 (0.016)	Loss 4.2281 (4.0698)	Top-1 acc 28.906 (29.886)	Top-5 acc 49.609 (53.108)	lr 0.00532
Warmup Train [32][1750/3239]	Time 0.563 (0.520)	Data 0.001 (0.016)	Loss 4.2170 (4.0700)	Top-1 acc 27.734 (29.882)	Top-5 acc 47.266 (53.102)	lr 0.00532
Warmup Train [32][1760/3239]	Time 0.527 (0.520)	Data 0.001 (0.016)	Loss 4.3984 (4.0703)	Top-1 acc 24.609 (29.875)	Top-5 acc 46.094 (53.105)	lr 0.00531
Warmup Train [32][1770/3239]	Time 0.544 (0.520)	Data 0.001 (0.016)	Loss 3.8931 (4.0703)	Top-1 acc 31.250 (29.873)	Top-5 acc 58.203 (53.107)	lr 0.00531
Warmup Train [32][1780/3239]	Time 0.494 (0.520)	Data 0.001 (0.016)	Loss 4.0138 (4.0700)	Top-1 acc 32.031 (29.881)	Top-5 acc 56.641 (53.112)	lr 0.00531
Warmup Train [32][1790/3239]	Time 0.550 (0.520)	Data 0.001 (0.016)	Loss 4.1062 (4.0701)	Top-1 acc 32.031 (29.873)	Top-5 acc 51.562 (53.110)	lr 0.00530
Warmup Train [32][1800/3239]	Time 0.796 (0.520)	Data 0.001 (0.016)	Loss 3.9020 (4.0699)	Top-1 acc 33.203 (29.876)	Top-5 acc 58.984 (53.118)	lr 0.00530
Warmup Train [32][1810/3239]	Time 0.378 (0.520)	Data 0.001 (0.016)	Loss 4.1798 (4.0696)	Top-1 acc 28.906 (29.878)	Top-5 acc 49.609 (53.124)	lr 0.00530
Warmup Train [32][1820/3239]	Time 0.469 (0.520)	Data 0.001 (0.016)	Loss 4.1111 (4.0698)	Top-1 acc 26.953 (29.878)	Top-5 acc 50.391 (53.117)	lr 0.00529
Warmup Train [32][1830/3239]	Time 0.506 (0.520)	Data 0.001 (0.016)	Loss 4.0367 (4.0697)	Top-1 acc 35.547 (29.879)	Top-5 acc 53.516 (53.123)	lr 0.00529
Warmup Train [32][1840/3239]	Time 0.546 (0.520)	Data 0.001 (0.015)	Loss 3.8072 (4.0695)	Top-1 acc 32.031 (29.879)	Top-5 acc 58.984 (53.126)	lr 0.00528
Warmup Train [32][1850/3239]	Time 0.407 (0.520)	Data 0.001 (0.015)	Loss 4.0873 (4.0696)	Top-1 acc 29.688 (29.874)	Top-5 acc 52.344 (53.122)	lr 0.00528
Warmup Train [32][1860/3239]	Time 0.419 (0.520)	Data 0.001 (0.015)	Loss 4.1979 (4.0699)	Top-1 acc 30.469 (29.868)	Top-5 acc 47.656 (53.109)	lr 0.00528
Warmup Train [32][1870/3239]	Time 0.640 (0.520)	Data 0.001 (0.015)	Loss 4.2872 (4.0697)	Top-1 acc 22.656 (29.873)	Top-5 acc 47.266 (53.114)	lr 0.00527
Warmup Train [32][1880/3239]	Time 0.659 (0.520)	Data 0.002 (0.015)	Loss 4.0296 (4.0696)	Top-1 acc 27.344 (29.871)	Top-5 acc 53.516 (53.114)	lr 0.00527
Warmup Train [32][1890/3239]	Time 0.612 (0.520)	Data 0.001 (0.015)	Loss 4.0295 (4.0692)	Top-1 acc 30.078 (29.882)	Top-5 acc 52.344 (53.121)	lr 0.00527
Warmup Train [32][1900/3239]	Time 0.554 (0.520)	Data 0.001 (0.015)	Loss 3.9445 (4.0689)	Top-1 acc 32.031 (29.880)	Top-5 acc 55.469 (53.127)	lr 0.00526
Warmup Train [32][1910/3239]	Time 0.563 (0.520)	Data 0.001 (0.015)	Loss 4.0244 (4.0690)	Top-1 acc 31.641 (29.879)	Top-5 acc 52.734 (53.120)	lr 0.00526
Warmup Train [32][1920/3239]	Time 0.487 (0.520)	Data 0.001 (0.015)	Loss 4.0182 (4.0689)	Top-1 acc 29.297 (29.886)	Top-5 acc 56.641 (53.121)	lr 0.00526
Warmup Train [32][1930/3239]	Time 0.589 (0.519)	Data 0.001 (0.015)	Loss 4.0225 (4.0688)	Top-1 acc 33.984 (29.892)	Top-5 acc 57.031 (53.128)	lr 0.00525
Warmup Train [32][1940/3239]	Time 0.475 (0.519)	Data 0.001 (0.015)	Loss 4.0987 (4.0688)	Top-1 acc 30.859 (29.899)	Top-5 acc 55.469 (53.127)	lr 0.00525
Warmup Train [32][1950/3239]	Time 0.428 (0.519)	Data 0.001 (0.015)	Loss 4.1690 (4.0688)	Top-1 acc 27.734 (29.900)	Top-5 acc 50.781 (53.130)	lr 0.00524
Warmup Train [32][1960/3239]	Time 0.532 (0.519)	Data 0.001 (0.015)	Loss 4.0224 (4.0686)	Top-1 acc 30.078 (29.898)	Top-5 acc 55.078 (53.133)	lr 0.00524
Warmup Train [32][1970/3239]	Time 0.515 (0.519)	Data 0.001 (0.015)	Loss 4.1699 (4.0687)	Top-1 acc 29.297 (29.898)	Top-5 acc 51.172 (53.133)	lr 0.00524
Warmup Train [32][1980/3239]	Time 0.455 (0.519)	Data 0.001 (0.015)	Loss 4.1173 (4.0686)	Top-1 acc 30.469 (29.896)	Top-5 acc 51.953 (53.133)	lr 0.00523
Warmup Train [32][1990/3239]	Time 0.559 (0.519)	Data 0.001 (0.015)	Loss 4.1476 (4.0686)	Top-1 acc 26.562 (29.895)	Top-5 acc 50.781 (53.133)	lr 0.00523
Warmup Train [32][2000/3239]	Time 0.601 (0.519)	Data 0.001 (0.015)	Loss 4.0460 (4.0684)	Top-1 acc 29.297 (29.896)	Top-5 acc 53.516 (53.135)	lr 0.00523
Warmup Train [32][2010/3239]	Time 0.486 (0.519)	Data 0.001 (0.015)	Loss 4.0150 (4.0681)	Top-1 acc 26.953 (29.897)	Top-5 acc 55.469 (53.139)	lr 0.00522
Warmup Train [32][2020/3239]	Time 0.366 (0.519)	Data 0.001 (0.015)	Loss 4.2133 (4.0679)	Top-1 acc 26.953 (29.900)	Top-5 acc 49.609 (53.146)	lr 0.00522
Warmup Train [32][2030/3239]	Time 0.450 (0.519)	Data 0.001 (0.015)	Loss 4.0683 (4.0679)	Top-1 acc 32.422 (29.899)	Top-5 acc 58.203 (53.145)	lr 0.00521
Warmup Train [32][2040/3239]	Time 0.464 (0.519)	Data 0.001 (0.014)	Loss 3.9604 (4.0679)	Top-1 acc 32.812 (29.900)	Top-5 acc 53.125 (53.143)	lr 0.00521
Warmup Train [32][2050/3239]	Time 0.508 (0.519)	Data 0.001 (0.014)	Loss 3.9546 (4.0679)	Top-1 acc 33.984 (29.901)	Top-5 acc 58.984 (53.143)	lr 0.00521
Warmup Train [32][2060/3239]	Time 0.606 (0.519)	Data 0.001 (0.014)	Loss 3.9537 (4.0679)	Top-1 acc 35.156 (29.900)	Top-5 acc 53.125 (53.146)	lr 0.00520
Warmup Train [32][2070/3239]	Time 0.671 (0.519)	Data 0.001 (0.014)	Loss 3.8057 (4.0674)	Top-1 acc 32.031 (29.909)	Top-5 acc 57.812 (53.158)	lr 0.00520
Warmup Train [32][2080/3239]	Time 0.573 (0.519)	Data 0.001 (0.014)	Loss 3.9886 (4.0672)	Top-1 acc 30.859 (29.912)	Top-5 acc 52.734 (53.165)	lr 0.00520
Warmup Train [32][2090/3239]	Time 0.527 (0.519)	Data 0.001 (0.014)	Loss 4.1500 (4.0672)	Top-1 acc 26.953 (29.907)	Top-5 acc 53.125 (53.169)	lr 0.00519
Warmup Train [32][2100/3239]	Time 0.378 (0.519)	Data 0.001 (0.014)	Loss 4.1530 (4.0669)	Top-1 acc 31.641 (29.915)	Top-5 acc 51.562 (53.173)	lr 0.00519
Warmup Train [32][2110/3239]	Time 0.572 (0.519)	Data 0.001 (0.014)	Loss 3.9804 (4.0669)	Top-1 acc 30.469 (29.914)	Top-5 acc 55.078 (53.177)	lr 0.00518
Warmup Train [32][2120/3239]	Time 0.423 (0.519)	Data 0.002 (0.014)	Loss 3.7640 (4.0667)	Top-1 acc 33.203 (29.918)	Top-5 acc 58.984 (53.178)	lr 0.00518
Warmup Train [32][2130/3239]	Time 0.481 (0.519)	Data 0.001 (0.014)	Loss 4.0720 (4.0668)	Top-1 acc 28.906 (29.911)	Top-5 acc 57.812 (53.174)	lr 0.00518
Warmup Train [32][2140/3239]	Time 0.401 (0.518)	Data 0.001 (0.014)	Loss 3.9696 (4.0668)	Top-1 acc 33.594 (29.918)	Top-5 acc 55.859 (53.175)	lr 0.00517
Warmup Train [32][2150/3239]	Time 0.520 (0.519)	Data 0.001 (0.014)	Loss 4.2244 (4.0669)	Top-1 acc 22.656 (29.915)	Top-5 acc 49.219 (53.172)	lr 0.00517
Warmup Train [32][2160/3239]	Time 0.323 (0.518)	Data 0.001 (0.014)	Loss 4.0396 (4.0669)	Top-1 acc 30.469 (29.920)	Top-5 acc 54.297 (53.169)	lr 0.00517
Warmup Train [32][2170/3239]	Time 0.551 (0.518)	Data 0.001 (0.014)	Loss 4.2635 (4.0673)	Top-1 acc 28.516 (29.914)	Top-5 acc 51.172 (53.163)	lr 0.00516
Warmup Train [32][2180/3239]	Time 0.215 (0.518)	Data 0.001 (0.014)	Loss 4.1086 (4.0674)	Top-1 acc 30.859 (29.909)	Top-5 acc 52.344 (53.157)	lr 0.00516
Warmup Train [32][2190/3239]	Time 0.539 (0.518)	Data 0.001 (0.014)	Loss 4.0726 (4.0674)	Top-1 acc 27.344 (29.911)	Top-5 acc 54.688 (53.153)	lr 0.00516
Warmup Train [32][2200/3239]	Time 0.266 (0.518)	Data 0.001 (0.014)	Loss 4.1332 (4.0673)	Top-1 acc 28.906 (29.911)	Top-5 acc 52.734 (53.152)	lr 0.00515
Warmup Train [32][2210/3239]	Time 0.609 (0.518)	Data 0.001 (0.014)	Loss 3.8370 (4.0673)	Top-1 acc 32.031 (29.912)	Top-5 acc 58.594 (53.151)	lr 0.00515
Warmup Train [32][2220/3239]	Time 0.390 (0.518)	Data 0.001 (0.014)	Loss 3.9012 (4.0669)	Top-1 acc 33.203 (29.921)	Top-5 acc 55.859 (53.156)	lr 0.00514
Warmup Train [32][2230/3239]	Time 0.646 (0.518)	Data 0.001 (0.014)	Loss 4.0117 (4.0669)	Top-1 acc 28.906 (29.924)	Top-5 acc 53.516 (53.154)	lr 0.00514
Warmup Train [32][2240/3239]	Time 0.397 (0.518)	Data 0.001 (0.014)	Loss 4.3007 (4.0672)	Top-1 acc 23.438 (29.913)	Top-5 acc 48.438 (53.149)	lr 0.00514
Warmup Train [32][2250/3239]	Time 0.711 (0.518)	Data 0.002 (0.014)	Loss 3.9508 (4.0670)	Top-1 acc 30.469 (29.916)	Top-5 acc 57.031 (53.155)	lr 0.00513
Warmup Train [32][2260/3239]	Time 0.495 (0.518)	Data 0.001 (0.014)	Loss 3.8929 (4.0667)	Top-1 acc 30.469 (29.919)	Top-5 acc 55.859 (53.159)	lr 0.00513
Warmup Train [32][2270/3239]	Time 0.456 (0.518)	Data 0.001 (0.014)	Loss 3.9448 (4.0669)	Top-1 acc 31.250 (29.915)	Top-5 acc 58.203 (53.153)	lr 0.00513
Warmup Train [32][2280/3239]	Time 0.551 (0.518)	Data 0.001 (0.014)	Loss 4.0589 (4.0670)	Top-1 acc 37.109 (29.921)	Top-5 acc 55.078 (53.149)	lr 0.00512
Warmup Train [32][2290/3239]	Time 0.548 (0.518)	Data 0.001 (0.014)	Loss 4.0294 (4.0668)	Top-1 acc 30.859 (29.926)	Top-5 acc 53.516 (53.156)	lr 0.00512
Warmup Train [32][2300/3239]	Time 0.497 (0.518)	Data 0.001 (0.014)	Loss 4.0671 (4.0672)	Top-1 acc 27.734 (29.919)	Top-5 acc 55.469 (53.149)	lr 0.00511
Warmup Train [32][2310/3239]	Time 0.403 (0.518)	Data 0.001 (0.014)	Loss 4.1315 (4.0671)	Top-1 acc 30.859 (29.914)	Top-5 acc 49.219 (53.145)	lr 0.00511
Warmup Train [32][2320/3239]	Time 0.574 (0.518)	Data 0.001 (0.014)	Loss 3.9914 (4.0670)	Top-1 acc 32.031 (29.919)	Top-5 acc 58.984 (53.145)	lr 0.00511
Warmup Train [32][2330/3239]	Time 0.578 (0.517)	Data 0.001 (0.014)	Loss 4.0965 (4.0670)	Top-1 acc 30.859 (29.920)	Top-5 acc 53.516 (53.146)	lr 0.00510
Warmup Train [32][2340/3239]	Time 0.494 (0.517)	Data 0.001 (0.014)	Loss 4.0902 (4.0668)	Top-1 acc 30.469 (29.930)	Top-5 acc 54.297 (53.153)	lr 0.00510
Warmup Train [32][2350/3239]	Time 0.621 (0.517)	Data 0.001 (0.014)	Loss 4.0789 (4.0667)	Top-1 acc 28.516 (29.933)	Top-5 acc 51.562 (53.157)	lr 0.00510
Warmup Train [32][2360/3239]	Time 0.619 (0.518)	Data 0.001 (0.013)	Loss 4.0207 (4.0667)	Top-1 acc 31.250 (29.930)	Top-5 acc 53.906 (53.155)	lr 0.00509
Warmup Train [32][2370/3239]	Time 0.450 (0.517)	Data 0.001 (0.013)	Loss 3.8926 (4.0667)	Top-1 acc 35.547 (29.928)	Top-5 acc 58.984 (53.155)	lr 0.00509
Warmup Train [32][2380/3239]	Time 0.418 (0.517)	Data 0.001 (0.013)	Loss 4.0531 (4.0668)	Top-1 acc 30.078 (29.928)	Top-5 acc 51.562 (53.151)	lr 0.00509
Warmup Train [32][2390/3239]	Time 0.548 (0.517)	Data 0.001 (0.013)	Loss 3.8968 (4.0665)	Top-1 acc 36.328 (29.937)	Top-5 acc 55.469 (53.157)	lr 0.00508
Warmup Train [32][2400/3239]	Time 0.451 (0.517)	Data 0.001 (0.013)	Loss 3.9920 (4.0668)	Top-1 acc 30.859 (29.926)	Top-5 acc 55.078 (53.146)	lr 0.00508
Warmup Train [32][2410/3239]	Time 0.310 (0.517)	Data 0.001 (0.013)	Loss 4.1576 (4.0669)	Top-1 acc 30.078 (29.925)	Top-5 acc 51.172 (53.142)	lr 0.00507
Warmup Train [32][2420/3239]	Time 0.490 (0.517)	Data 0.001 (0.013)	Loss 4.1224 (4.0671)	Top-1 acc 29.688 (29.920)	Top-5 acc 53.906 (53.142)	lr 0.00507
Warmup Train [32][2430/3239]	Time 0.490 (0.517)	Data 0.001 (0.013)	Loss 4.2144 (4.0668)	Top-1 acc 28.906 (29.922)	Top-5 acc 50.000 (53.145)	lr 0.00507
Warmup Train [32][2440/3239]	Time 0.642 (0.517)	Data 0.001 (0.013)	Loss 4.0636 (4.0667)	Top-1 acc 27.344 (29.921)	Top-5 acc 51.953 (53.145)	lr 0.00506
Warmup Train [32][2450/3239]	Time 0.519 (0.517)	Data 0.001 (0.013)	Loss 4.1583 (4.0666)	Top-1 acc 30.859 (29.919)	Top-5 acc 50.781 (53.148)	lr 0.00506
Warmup Train [32][2460/3239]	Time 0.459 (0.517)	Data 0.001 (0.013)	Loss 4.0615 (4.0666)	Top-1 acc 29.688 (29.920)	Top-5 acc 53.516 (53.147)	lr 0.00506
Warmup Train [32][2470/3239]	Time 0.557 (0.517)	Data 0.001 (0.013)	Loss 4.0406 (4.0664)	Top-1 acc 30.469 (29.922)	Top-5 acc 55.078 (53.153)	lr 0.00505
Warmup Train [32][2480/3239]	Time 0.657 (0.517)	Data 0.001 (0.013)	Loss 3.9521 (4.0664)	Top-1 acc 32.422 (29.919)	Top-5 acc 53.516 (53.153)	lr 0.00505
Warmup Train [32][2490/3239]	Time 0.649 (0.517)	Data 0.001 (0.013)	Loss 4.0603 (4.0665)	Top-1 acc 31.641 (29.917)	Top-5 acc 55.469 (53.153)	lr 0.00505
Warmup Train [32][2500/3239]	Time 0.446 (0.517)	Data 0.001 (0.013)	Loss 3.9835 (4.0665)	Top-1 acc 29.688 (29.908)	Top-5 acc 56.250 (53.146)	lr 0.00504
Warmup Train [32][2510/3239]	Time 0.493 (0.517)	Data 0.001 (0.013)	Loss 3.8842 (4.0666)	Top-1 acc 34.375 (29.903)	Top-5 acc 57.422 (53.142)	lr 0.00504
Warmup Train [32][2520/3239]	Time 0.682 (0.517)	Data 0.001 (0.013)	Loss 4.0359 (4.0667)	Top-1 acc 25.391 (29.903)	Top-5 acc 53.125 (53.142)	lr 0.00503
Warmup Train [32][2530/3239]	Time 0.563 (0.517)	Data 0.001 (0.013)	Loss 3.8935 (4.0664)	Top-1 acc 33.984 (29.911)	Top-5 acc 57.812 (53.152)	lr 0.00503
Warmup Train [32][2540/3239]	Time 0.365 (0.517)	Data 0.001 (0.013)	Loss 4.1342 (4.0663)	Top-1 acc 31.641 (29.913)	Top-5 acc 55.859 (53.155)	lr 0.00503
Warmup Train [32][2550/3239]	Time 0.515 (0.517)	Data 0.001 (0.013)	Loss 4.2393 (4.0661)	Top-1 acc 24.219 (29.912)	Top-5 acc 51.172 (53.159)	lr 0.00502
Warmup Train [32][2560/3239]	Time 0.482 (0.517)	Data 0.001 (0.013)	Loss 4.2223 (4.0663)	Top-1 acc 26.562 (29.907)	Top-5 acc 47.266 (53.154)	lr 0.00502
Warmup Train [32][2570/3239]	Time 0.526 (0.517)	Data 0.001 (0.013)	Loss 3.8069 (4.0660)	Top-1 acc 31.641 (29.912)	Top-5 acc 60.156 (53.161)	lr 0.00502
Warmup Train [32][2580/3239]	Time 0.387 (0.517)	Data 0.001 (0.013)	Loss 4.1595 (4.0661)	Top-1 acc 28.516 (29.913)	Top-5 acc 52.344 (53.156)	lr 0.00501
Warmup Train [32][2590/3239]	Time 0.465 (0.517)	Data 0.001 (0.013)	Loss 3.9491 (4.0659)	Top-1 acc 34.766 (29.922)	Top-5 acc 56.250 (53.160)	lr 0.00501
Warmup Train [32][2600/3239]	Time 0.507 (0.517)	Data 0.023 (0.013)	Loss 4.2298 (4.0659)	Top-1 acc 28.516 (29.923)	Top-5 acc 52.734 (53.161)	lr 0.00500
Warmup Train [32][2610/3239]	Time 0.554 (0.517)	Data 0.001 (0.013)	Loss 4.0388 (4.0658)	Top-1 acc 29.688 (29.919)	Top-5 acc 52.734 (53.164)	lr 0.00500
Warmup Train [32][2620/3239]	Time 0.529 (0.517)	Data 0.001 (0.013)	Loss 3.8942 (4.0656)	Top-1 acc 32.422 (29.926)	Top-5 acc 55.078 (53.170)	lr 0.00500
Warmup Train [32][2630/3239]	Time 0.492 (0.517)	Data 0.001 (0.013)	Loss 4.2488 (4.0657)	Top-1 acc 27.734 (29.925)	Top-5 acc 49.609 (53.169)	lr 0.00499
Warmup Train [32][2640/3239]	Time 0.485 (0.517)	Data 0.001 (0.013)	Loss 4.1175 (4.0656)	Top-1 acc 29.688 (29.929)	Top-5 acc 52.734 (53.178)	lr 0.00499
Warmup Train [32][2650/3239]	Time 0.339 (0.517)	Data 0.001 (0.013)	Loss 3.9922 (4.0653)	Top-1 acc 33.984 (29.933)	Top-5 acc 53.906 (53.181)	lr 0.00499
Warmup Train [32][2660/3239]	Time 0.437 (0.517)	Data 0.001 (0.013)	Loss 4.1075 (4.0654)	Top-1 acc 28.516 (29.930)	Top-5 acc 51.562 (53.180)	lr 0.00498
Warmup Train [32][2670/3239]	Time 0.358 (0.517)	Data 0.001 (0.013)	Loss 4.1044 (4.0656)	Top-1 acc 28.516 (29.929)	Top-5 acc 53.125 (53.177)	lr 0.00498
Warmup Train [32][2680/3239]	Time 0.588 (0.517)	Data 0.001 (0.013)	Loss 4.0119 (4.0658)	Top-1 acc 30.859 (29.921)	Top-5 acc 55.859 (53.171)	lr 0.00498
Warmup Train [32][2690/3239]	Time 0.445 (0.517)	Data 0.001 (0.013)	Loss 4.0933 (4.0655)	Top-1 acc 26.562 (29.926)	Top-5 acc 49.219 (53.175)	lr 0.00497
Warmup Train [32][2700/3239]	Time 0.463 (0.517)	Data 0.001 (0.013)	Loss 3.9629 (4.0650)	Top-1 acc 30.859 (29.934)	Top-5 acc 58.203 (53.187)	lr 0.00497
Warmup Train [32][2710/3239]	Time 0.540 (0.517)	Data 0.001 (0.013)	Loss 4.1536 (4.0651)	Top-1 acc 28.906 (29.934)	Top-5 acc 52.344 (53.182)	lr 0.00497
Warmup Train [32][2720/3239]	Time 0.587 (0.517)	Data 0.001 (0.013)	Loss 4.0759 (4.0652)	Top-1 acc 31.641 (29.928)	Top-5 acc 52.734 (53.178)	lr 0.00496
Warmup Train [32][2730/3239]	Time 0.467 (0.517)	Data 0.001 (0.013)	Loss 3.9081 (4.0651)	Top-1 acc 35.547 (29.929)	Top-5 acc 59.766 (53.182)	lr 0.00496
Warmup Train [32][2740/3239]	Time 0.695 (0.516)	Data 0.001 (0.013)	Loss 4.1152 (4.0651)	Top-1 acc 30.859 (29.929)	Top-5 acc 50.391 (53.182)	lr 0.00495
Warmup Train [32][2750/3239]	Time 0.594 (0.516)	Data 0.002 (0.013)	Loss 4.0294 (4.0653)	Top-1 acc 32.031 (29.925)	Top-5 acc 53.516 (53.184)	lr 0.00495
Warmup Train [32][2760/3239]	Time 0.630 (0.516)	Data 0.001 (0.013)	Loss 3.9785 (4.0654)	Top-1 acc 32.812 (29.928)	Top-5 acc 56.250 (53.181)	lr 0.00495
Warmup Train [32][2770/3239]	Time 0.547 (0.516)	Data 0.002 (0.012)	Loss 4.0879 (4.0652)	Top-1 acc 29.297 (29.931)	Top-5 acc 54.688 (53.190)	lr 0.00494
Warmup Train [32][2780/3239]	Time 0.772 (0.516)	Data 0.001 (0.012)	Loss 4.0075 (4.0652)	Top-1 acc 30.469 (29.932)	Top-5 acc 52.734 (53.192)	lr 0.00494
Warmup Train [32][2790/3239]	Time 0.596 (0.516)	Data 0.001 (0.012)	Loss 4.1026 (4.0649)	Top-1 acc 29.688 (29.936)	Top-5 acc 51.953 (53.195)	lr 0.00494
Warmup Train [32][2800/3239]	Time 0.559 (0.516)	Data 0.001 (0.012)	Loss 4.1711 (4.0648)	Top-1 acc 28.516 (29.939)	Top-5 acc 48.438 (53.197)	lr 0.00493
Warmup Train [32][2810/3239]	Time 0.369 (0.516)	Data 0.001 (0.012)	Loss 4.0157 (4.0649)	Top-1 acc 30.859 (29.934)	Top-5 acc 54.297 (53.198)	lr 0.00493
Warmup Train [32][2820/3239]	Time 0.432 (0.516)	Data 0.001 (0.012)	Loss 4.0180 (4.0648)	Top-1 acc 32.422 (29.935)	Top-5 acc 51.172 (53.197)	lr 0.00493
Warmup Train [32][2830/3239]	Time 0.387 (0.516)	Data 0.001 (0.012)	Loss 4.0368 (4.0649)	Top-1 acc 29.297 (29.938)	Top-5 acc 55.859 (53.200)	lr 0.00492
Warmup Train [32][2840/3239]	Time 0.436 (0.516)	Data 0.001 (0.012)	Loss 3.8555 (4.0649)	Top-1 acc 34.375 (29.932)	Top-5 acc 55.469 (53.199)	lr 0.00492
Warmup Train [32][2850/3239]	Time 0.676 (0.516)	Data 0.001 (0.012)	Loss 4.1964 (4.0651)	Top-1 acc 30.469 (29.930)	Top-5 acc 51.562 (53.194)	lr 0.00491
Warmup Train [32][2860/3239]	Time 0.555 (0.516)	Data 0.001 (0.012)	Loss 4.0982 (4.0649)	Top-1 acc 27.734 (29.933)	Top-5 acc 51.562 (53.198)	lr 0.00491
Warmup Train [32][2870/3239]	Time 0.537 (0.516)	Data 0.001 (0.012)	Loss 4.0882 (4.0650)	Top-1 acc 26.953 (29.934)	Top-5 acc 49.609 (53.192)	lr 0.00491
Warmup Train [32][2880/3239]	Time 0.611 (0.516)	Data 0.001 (0.012)	Loss 4.2156 (4.0652)	Top-1 acc 24.219 (29.928)	Top-5 acc 46.875 (53.183)	lr 0.00490
Warmup Train [32][2890/3239]	Time 0.739 (0.516)	Data 0.001 (0.012)	Loss 4.0424 (4.0653)	Top-1 acc 32.031 (29.926)	Top-5 acc 50.391 (53.177)	lr 0.00490
Warmup Train [32][2900/3239]	Time 0.516 (0.516)	Data 0.001 (0.012)	Loss 4.0583 (4.0653)	Top-1 acc 30.469 (29.924)	Top-5 acc 55.078 (53.178)	lr 0.00490
Warmup Train [32][2910/3239]	Time 0.409 (0.516)	Data 0.001 (0.012)	Loss 4.0343 (4.0653)	Top-1 acc 31.641 (29.926)	Top-5 acc 53.906 (53.178)	lr 0.00489
Warmup Train [32][2920/3239]	Time 0.408 (0.516)	Data 0.001 (0.012)	Loss 4.2370 (4.0654)	Top-1 acc 28.516 (29.923)	Top-5 acc 46.875 (53.179)	lr 0.00489
Warmup Train [32][2930/3239]	Time 0.346 (0.516)	Data 0.001 (0.012)	Loss 4.0880 (4.0652)	Top-1 acc 26.562 (29.923)	Top-5 acc 51.562 (53.179)	lr 0.00489
Warmup Train [32][2940/3239]	Time 0.551 (0.516)	Data 0.001 (0.012)	Loss 4.2004 (4.0651)	Top-1 acc 27.344 (29.921)	Top-5 acc 50.781 (53.180)	lr 0.00488
Warmup Train [32][2950/3239]	Time 0.527 (0.516)	Data 0.001 (0.012)	Loss 4.1228 (4.0652)	Top-1 acc 28.516 (29.920)	Top-5 acc 50.781 (53.178)	lr 0.00488
Warmup Train [32][2960/3239]	Time 0.481 (0.516)	Data 0.001 (0.012)	Loss 4.1962 (4.0653)	Top-1 acc 31.641 (29.920)	Top-5 acc 49.609 (53.174)	lr 0.00487
Warmup Train [32][2970/3239]	Time 0.563 (0.516)	Data 0.001 (0.012)	Loss 3.9705 (4.0651)	Top-1 acc 30.469 (29.922)	Top-5 acc 50.781 (53.176)	lr 0.00487
Warmup Train [32][2980/3239]	Time 0.622 (0.516)	Data 0.001 (0.012)	Loss 4.1458 (4.0649)	Top-1 acc 28.516 (29.924)	Top-5 acc 51.562 (53.177)	lr 0.00487
Warmup Train [32][2990/3239]	Time 0.501 (0.516)	Data 0.001 (0.012)	Loss 4.0960 (4.0647)	Top-1 acc 32.422 (29.929)	Top-5 acc 55.859 (53.183)	lr 0.00486
Warmup Train [32][3000/3239]	Time 0.723 (0.516)	Data 0.001 (0.012)	Loss 3.9585 (4.0646)	Top-1 acc 34.766 (29.931)	Top-5 acc 58.984 (53.187)	lr 0.00486
Warmup Train [32][3010/3239]	Time 0.412 (0.516)	Data 0.001 (0.012)	Loss 3.9586 (4.0647)	Top-1 acc 32.812 (29.936)	Top-5 acc 51.953 (53.187)	lr 0.00486
Warmup Train [32][3020/3239]	Time 0.478 (0.516)	Data 0.001 (0.012)	Loss 4.0262 (4.0647)	Top-1 acc 30.078 (29.934)	Top-5 acc 51.953 (53.184)	lr 0.00485
Warmup Train [32][3030/3239]	Time 0.319 (0.516)	Data 0.001 (0.012)	Loss 4.2110 (4.0648)	Top-1 acc 26.172 (29.936)	Top-5 acc 49.219 (53.180)	lr 0.00485
Warmup Train [32][3040/3239]	Time 0.617 (0.515)	Data 0.001 (0.012)	Loss 4.1209 (4.0648)	Top-1 acc 31.641 (29.940)	Top-5 acc 53.125 (53.182)	lr 0.00485
Warmup Train [32][3050/3239]	Time 0.676 (0.515)	Data 0.001 (0.012)	Loss 3.9544 (4.0649)	Top-1 acc 30.859 (29.938)	Top-5 acc 53.125 (53.178)	lr 0.00484
Warmup Train [32][3060/3239]	Time 0.516 (0.515)	Data 0.001 (0.012)	Loss 4.1816 (4.0650)	Top-1 acc 29.297 (29.938)	Top-5 acc 51.562 (53.175)	lr 0.00484
Warmup Train [32][3070/3239]	Time 0.423 (0.515)	Data 0.035 (0.012)	Loss 4.2235 (4.0651)	Top-1 acc 27.344 (29.936)	Top-5 acc 50.000 (53.176)	lr 0.00484
Warmup Train [32][3080/3239]	Time 0.320 (0.515)	Data 0.001 (0.012)	Loss 4.1566 (4.0650)	Top-1 acc 28.516 (29.937)	Top-5 acc 50.391 (53.176)	lr 0.00483
Warmup Train [32][3090/3239]	Time 0.398 (0.515)	Data 0.001 (0.012)	Loss 4.0392 (4.0648)	Top-1 acc 29.688 (29.938)	Top-5 acc 51.562 (53.180)	lr 0.00483
Warmup Train [32][3100/3239]	Time 0.589 (0.515)	Data 0.001 (0.012)	Loss 3.9219 (4.0647)	Top-1 acc 33.594 (29.939)	Top-5 acc 57.422 (53.180)	lr 0.00482
Warmup Train [32][3110/3239]	Time 0.462 (0.515)	Data 0.001 (0.012)	Loss 4.0746 (4.0648)	Top-1 acc 31.641 (29.940)	Top-5 acc 51.562 (53.180)	lr 0.00482
Warmup Train [32][3120/3239]	Time 0.455 (0.515)	Data 0.001 (0.012)	Loss 4.1360 (4.0648)	Top-1 acc 28.906 (29.940)	Top-5 acc 50.000 (53.177)	lr 0.00482
Warmup Train [32][3130/3239]	Time 0.427 (0.515)	Data 0.001 (0.012)	Loss 4.2176 (4.0647)	Top-1 acc 27.734 (29.940)	Top-5 acc 51.172 (53.177)	lr 0.00481
Warmup Train [32][3140/3239]	Time 0.428 (0.515)	Data 0.001 (0.012)	Loss 3.8630 (4.0647)	Top-1 acc 35.156 (29.939)	Top-5 acc 58.984 (53.176)	lr 0.00481
Warmup Train [32][3150/3239]	Time 0.426 (0.515)	Data 0.001 (0.012)	Loss 4.1453 (4.0648)	Top-1 acc 29.688 (29.938)	Top-5 acc 51.172 (53.176)	lr 0.00481
Warmup Train [32][3160/3239]	Time 0.502 (0.515)	Data 0.001 (0.012)	Loss 4.1475 (4.0646)	Top-1 acc 27.734 (29.937)	Top-5 acc 52.344 (53.176)	lr 0.00480
Warmup Train [32][3170/3239]	Time 0.579 (0.515)	Data 0.001 (0.012)	Loss 3.8912 (4.0647)	Top-1 acc 30.469 (29.934)	Top-5 acc 58.203 (53.176)	lr 0.00480
Warmup Train [32][3180/3239]	Time 0.429 (0.515)	Data 0.000 (0.012)	Loss 4.0196 (4.0647)	Top-1 acc 32.031 (29.936)	Top-5 acc 54.688 (53.178)	lr 0.00480
Warmup Train [32][3190/3239]	Time 0.516 (0.515)	Data 0.000 (0.012)	Loss 4.1799 (4.0648)	Top-1 acc 29.688 (29.933)	Top-5 acc 50.391 (53.173)	lr 0.00479
Warmup Train [32][3200/3239]	Time 0.326 (0.515)	Data 0.000 (0.012)	Loss 3.9870 (4.0647)	Top-1 acc 33.203 (29.935)	Top-5 acc 57.031 (53.175)	lr 0.00479
Warmup Train [32][3210/3239]	Time 0.421 (0.515)	Data 0.000 (0.012)	Loss 4.0422 (4.0647)	Top-1 acc 30.859 (29.937)	Top-5 acc 54.688 (53.174)	lr 0.00479
Warmup Train [32][3220/3239]	Time 0.747 (0.515)	Data 0.000 (0.012)	Loss 4.0233 (4.0645)	Top-1 acc 31.641 (29.941)	Top-5 acc 51.172 (53.176)	lr 0.00478
Warmup Train [32][3230/3239]	Time 0.493 (0.515)	Data 0.000 (0.012)	Loss 4.1134 (4.0643)	Top-1 acc 23.438 (29.939)	Top-5 acc 51.172 (53.182)	lr 0.00478
Warmup Train [32][3239/3239]	Time 0.317 (0.515)	Data 0.000 (0.012)	Loss 4.3890 (4.0644)	Top-1 acc 25.926 (29.942)	Top-5 acc 48.148 (53.180)	lr 0.00477
==========Warmup Valid [32/40]	loss 3.005	top-1 acc 37.279	top-5 acc 62.190	Train top-1 29.942	top-5 53.180	flops: 442.4M
Warmup Train [33][0/3239]	Time 13.636 (13.636)	Data 12.177 (12.177)	Loss 4.0457 (4.0457)	Top-1 acc 32.422 (32.422)	Top-5 acc 53.516 (53.516)	lr 0.00477
Warmup Train [33][10/3239]	Time 0.378 (1.870)	Data 0.001 (1.229)	Loss 3.8727 (4.0136)	Top-1 acc 30.469 (31.214)	Top-5 acc 58.594 (53.764)	lr 0.00477
Warmup Train [33][20/3239]	Time 0.489 (1.237)	Data 0.001 (0.651)	Loss 3.9901 (4.0192)	Top-1 acc 33.203 (31.008)	Top-5 acc 54.297 (54.036)	lr 0.00477
Warmup Train [33][30/3239]	Time 0.558 (1.007)	Data 0.001 (0.445)	Loss 3.8464 (4.0241)	Top-1 acc 35.156 (30.696)	Top-5 acc 60.938 (53.969)	lr 0.00476
Warmup Train [33][40/3239]	Time 0.557 (0.884)	Data 0.001 (0.337)	Loss 3.8471 (4.0302)	Top-1 acc 32.812 (30.488)	Top-5 acc 60.156 (54.011)	lr 0.00476
Warmup Train [33][50/3239]	Time 0.366 (0.810)	Data 0.001 (0.272)	Loss 4.1483 (4.0395)	Top-1 acc 25.781 (30.369)	Top-5 acc 50.000 (53.715)	lr 0.00476
Warmup Train [33][60/3239]	Time 0.501 (0.765)	Data 0.002 (0.230)	Loss 3.9942 (4.0438)	Top-1 acc 30.859 (30.296)	Top-5 acc 53.125 (53.535)	lr 0.00475
Warmup Train [33][70/3239]	Time 0.549 (0.731)	Data 0.001 (0.198)	Loss 4.0430 (4.0414)	Top-1 acc 29.297 (30.265)	Top-5 acc 53.125 (53.411)	lr 0.00475
Warmup Train [33][80/3239]	Time 0.463 (0.704)	Data 0.001 (0.173)	Loss 4.0293 (4.0491)	Top-1 acc 31.250 (30.175)	Top-5 acc 51.953 (53.289)	lr 0.00475
Warmup Train [33][90/3239]	Time 0.649 (0.682)	Data 0.001 (0.155)	Loss 3.9753 (4.0558)	Top-1 acc 31.250 (30.134)	Top-5 acc 55.078 (53.112)	lr 0.00474
Warmup Train [33][100/3239]	Time 0.561 (0.664)	Data 0.001 (0.140)	Loss 3.9704 (4.0585)	Top-1 acc 31.641 (29.989)	Top-5 acc 54.688 (53.164)	lr 0.00474
Warmup Train [33][110/3239]	Time 0.618 (0.651)	Data 0.001 (0.128)	Loss 3.9284 (4.0569)	Top-1 acc 30.859 (30.004)	Top-5 acc 56.250 (53.290)	lr 0.00474
Warmup Train [33][120/3239]	Time 0.496 (0.638)	Data 0.001 (0.117)	Loss 3.9602 (4.0561)	Top-1 acc 30.859 (30.068)	Top-5 acc 56.250 (53.296)	lr 0.00473
Warmup Train [33][130/3239]	Time 0.523 (0.630)	Data 0.001 (0.108)	Loss 4.2898 (4.0567)	Top-1 acc 24.219 (30.042)	Top-5 acc 47.266 (53.280)	lr 0.00473
Warmup Train [33][140/3239]	Time 0.458 (0.619)	Data 0.001 (0.101)	Loss 3.9873 (4.0557)	Top-1 acc 29.297 (29.984)	Top-5 acc 53.125 (53.286)	lr 0.00472
Warmup Train [33][150/3239]	Time 0.572 (0.612)	Data 0.001 (0.094)	Loss 4.1368 (4.0544)	Top-1 acc 28.906 (29.985)	Top-5 acc 53.125 (53.332)	lr 0.00472
Warmup Train [33][160/3239]	Time 0.513 (0.605)	Data 0.001 (0.089)	Loss 3.9123 (4.0558)	Top-1 acc 33.594 (30.025)	Top-5 acc 58.594 (53.358)	lr 0.00472
Warmup Train [33][170/3239]	Time 0.457 (0.597)	Data 0.001 (0.084)	Loss 4.0043 (4.0546)	Top-1 acc 30.078 (29.982)	Top-5 acc 55.469 (53.399)	lr 0.00471
Warmup Train [33][180/3239]	Time 0.475 (0.590)	Data 0.001 (0.080)	Loss 4.0189 (4.0575)	Top-1 acc 31.250 (29.938)	Top-5 acc 59.766 (53.406)	lr 0.00471
Warmup Train [33][190/3239]	Time 0.539 (0.586)	Data 0.002 (0.075)	Loss 4.3211 (4.0565)	Top-1 acc 22.656 (29.941)	Top-5 acc 48.828 (53.405)	lr 0.00471
Warmup Train [33][200/3239]	Time 0.336 (0.582)	Data 0.001 (0.072)	Loss 4.0011 (4.0559)	Top-1 acc 30.078 (30.000)	Top-5 acc 54.688 (53.450)	lr 0.00470
Warmup Train [33][210/3239]	Time 0.399 (0.579)	Data 0.001 (0.070)	Loss 3.8490 (4.0554)	Top-1 acc 32.422 (29.984)	Top-5 acc 59.375 (53.466)	lr 0.00470
Warmup Train [33][220/3239]	Time 0.588 (0.577)	Data 0.001 (0.067)	Loss 4.1789 (4.0547)	Top-1 acc 28.906 (29.921)	Top-5 acc 51.172 (53.491)	lr 0.00470
Warmup Train [33][230/3239]	Time 0.530 (0.574)	Data 0.001 (0.064)	Loss 4.2853 (4.0556)	Top-1 acc 26.953 (29.867)	Top-5 acc 50.391 (53.509)	lr 0.00469
Warmup Train [33][240/3239]	Time 0.493 (0.571)	Data 0.001 (0.062)	Loss 3.8139 (4.0540)	Top-1 acc 35.156 (29.892)	Top-5 acc 59.766 (53.535)	lr 0.00469
Warmup Train [33][250/3239]	Time 0.417 (0.569)	Data 0.001 (0.060)	Loss 4.0559 (4.0526)	Top-1 acc 32.031 (29.961)	Top-5 acc 53.906 (53.558)	lr 0.00469
Warmup Train [33][260/3239]	Time 0.349 (0.566)	Data 0.001 (0.058)	Loss 4.0940 (4.0535)	Top-1 acc 29.297 (29.919)	Top-5 acc 51.953 (53.532)	lr 0.00468
Warmup Train [33][270/3239]	Time 0.520 (0.565)	Data 0.001 (0.056)	Loss 4.0933 (4.0533)	Top-1 acc 29.688 (29.907)	Top-5 acc 50.391 (53.497)	lr 0.00468
Warmup Train [33][280/3239]	Time 0.677 (0.563)	Data 0.002 (0.054)	Loss 4.1319 (4.0521)	Top-1 acc 29.688 (29.922)	Top-5 acc 50.391 (53.538)	lr 0.00468
Warmup Train [33][290/3239]	Time 0.453 (0.561)	Data 0.001 (0.052)	Loss 4.2528 (4.0543)	Top-1 acc 26.172 (29.905)	Top-5 acc 50.000 (53.510)	lr 0.00467
Warmup Train [33][300/3239]	Time 0.558 (0.561)	Data 0.001 (0.051)	Loss 4.0709 (4.0551)	Top-1 acc 29.297 (29.899)	Top-5 acc 54.688 (53.516)	lr 0.00467
Warmup Train [33][310/3239]	Time 0.481 (0.559)	Data 0.001 (0.050)	Loss 4.1171 (4.0548)	Top-1 acc 28.125 (29.892)	Top-5 acc 49.219 (53.488)	lr 0.00466
Warmup Train [33][320/3239]	Time 0.587 (0.558)	Data 0.001 (0.048)	Loss 4.1282 (4.0549)	Top-1 acc 28.906 (29.900)	Top-5 acc 53.125 (53.499)	lr 0.00466
Warmup Train [33][330/3239]	Time 0.639 (0.557)	Data 0.001 (0.047)	Loss 4.2061 (4.0550)	Top-1 acc 28.906 (29.895)	Top-5 acc 51.562 (53.459)	lr 0.00466
Warmup Train [33][340/3239]	Time 0.510 (0.555)	Data 0.001 (0.045)	Loss 3.9832 (4.0550)	Top-1 acc 34.766 (29.902)	Top-5 acc 56.250 (53.454)	lr 0.00465
Warmup Train [33][350/3239]	Time 0.506 (0.554)	Data 0.001 (0.044)	Loss 4.0246 (4.0532)	Top-1 acc 31.250 (29.937)	Top-5 acc 55.859 (53.496)	lr 0.00465
Warmup Train [33][360/3239]	Time 0.506 (0.553)	Data 0.001 (0.043)	Loss 4.0248 (4.0539)	Top-1 acc 31.250 (29.922)	Top-5 acc 55.469 (53.480)	lr 0.00465
Warmup Train [33][370/3239]	Time 0.304 (0.552)	Data 0.001 (0.042)	Loss 4.0023 (4.0535)	Top-1 acc 32.031 (29.932)	Top-5 acc 53.516 (53.476)	lr 0.00464
Warmup Train [33][380/3239]	Time 0.570 (0.551)	Data 0.002 (0.041)	Loss 3.8191 (4.0521)	Top-1 acc 38.672 (29.986)	Top-5 acc 59.766 (53.503)	lr 0.00464
Warmup Train [33][390/3239]	Time 0.475 (0.550)	Data 0.001 (0.040)	Loss 4.1269 (4.0518)	Top-1 acc 28.125 (29.977)	Top-5 acc 47.266 (53.498)	lr 0.00464
Warmup Train [33][400/3239]	Time 0.474 (0.549)	Data 0.001 (0.040)	Loss 4.1501 (4.0521)	Top-1 acc 26.953 (29.959)	Top-5 acc 50.781 (53.483)	lr 0.00463
Warmup Train [33][410/3239]	Time 0.391 (0.548)	Data 0.001 (0.039)	Loss 4.0061 (4.0521)	Top-1 acc 31.641 (29.936)	Top-5 acc 55.078 (53.487)	lr 0.00463
Warmup Train [33][420/3239]	Time 0.532 (0.547)	Data 0.001 (0.038)	Loss 4.2238 (4.0519)	Top-1 acc 27.344 (29.947)	Top-5 acc 50.000 (53.481)	lr 0.00463
Warmup Train [33][430/3239]	Time 0.697 (0.547)	Data 0.001 (0.037)	Loss 3.9658 (4.0502)	Top-1 acc 31.641 (29.978)	Top-5 acc 56.641 (53.532)	lr 0.00462
Warmup Train [33][440/3239]	Time 0.367 (0.545)	Data 0.001 (0.037)	Loss 4.2387 (4.0508)	Top-1 acc 23.828 (29.993)	Top-5 acc 48.438 (53.521)	lr 0.00462
Warmup Train [33][450/3239]	Time 0.483 (0.545)	Data 0.001 (0.036)	Loss 4.1818 (4.0510)	Top-1 acc 25.781 (29.965)	Top-5 acc 48.438 (53.493)	lr 0.00462
Warmup Train [33][460/3239]	Time 0.591 (0.543)	Data 0.001 (0.035)	Loss 4.0744 (4.0507)	Top-1 acc 29.688 (29.945)	Top-5 acc 53.125 (53.500)	lr 0.00461
Warmup Train [33][470/3239]	Time 0.563 (0.542)	Data 0.001 (0.035)	Loss 4.1759 (4.0497)	Top-1 acc 25.781 (29.966)	Top-5 acc 50.391 (53.508)	lr 0.00461
Warmup Train [33][480/3239]	Time 0.497 (0.541)	Data 0.001 (0.034)	Loss 4.0140 (4.0496)	Top-1 acc 31.250 (29.990)	Top-5 acc 54.688 (53.512)	lr 0.00460
Warmup Train [33][490/3239]	Time 0.522 (0.541)	Data 0.001 (0.034)	Loss 3.8769 (4.0489)	Top-1 acc 33.984 (30.011)	Top-5 acc 57.812 (53.543)	lr 0.00460
Warmup Train [33][500/3239]	Time 0.477 (0.540)	Data 0.001 (0.033)	Loss 4.2287 (4.0492)	Top-1 acc 27.734 (30.007)	Top-5 acc 50.781 (53.539)	lr 0.00460
Warmup Train [33][510/3239]	Time 0.436 (0.540)	Data 0.002 (0.032)	Loss 4.0804 (4.0491)	Top-1 acc 28.125 (30.001)	Top-5 acc 57.422 (53.560)	lr 0.00459
Warmup Train [33][520/3239]	Time 0.503 (0.539)	Data 0.001 (0.032)	Loss 4.2142 (4.0500)	Top-1 acc 26.562 (29.973)	Top-5 acc 52.344 (53.567)	lr 0.00459
Warmup Train [33][530/3239]	Time 0.628 (0.539)	Data 0.001 (0.031)	Loss 3.8429 (4.0495)	Top-1 acc 35.938 (30.002)	Top-5 acc 58.594 (53.558)	lr 0.00459
Warmup Train [33][540/3239]	Time 0.567 (0.539)	Data 0.001 (0.031)	Loss 4.0824 (4.0499)	Top-1 acc 28.906 (30.016)	Top-5 acc 51.562 (53.549)	lr 0.00458
Warmup Train [33][550/3239]	Time 0.466 (0.538)	Data 0.001 (0.030)	Loss 4.0184 (4.0514)	Top-1 acc 28.906 (29.980)	Top-5 acc 50.781 (53.521)	lr 0.00458
Warmup Train [33][560/3239]	Time 0.504 (0.538)	Data 0.001 (0.030)	Loss 3.9660 (4.0507)	Top-1 acc 31.250 (29.992)	Top-5 acc 58.594 (53.551)	lr 0.00458
Warmup Train [33][570/3239]	Time 0.523 (0.537)	Data 0.001 (0.030)	Loss 4.2039 (4.0516)	Top-1 acc 27.734 (29.982)	Top-5 acc 46.094 (53.542)	lr 0.00457
Warmup Train [33][580/3239]	Time 0.661 (0.537)	Data 0.002 (0.029)	Loss 4.1563 (4.0515)	Top-1 acc 27.734 (29.985)	Top-5 acc 52.734 (53.543)	lr 0.00457
Warmup Train [33][590/3239]	Time 0.527 (0.537)	Data 0.001 (0.029)	Loss 3.9263 (4.0521)	Top-1 acc 33.203 (29.986)	Top-5 acc 60.156 (53.531)	lr 0.00457
Warmup Train [33][600/3239]	Time 0.577 (0.537)	Data 0.001 (0.028)	Loss 3.9943 (4.0526)	Top-1 acc 35.938 (30.001)	Top-5 acc 55.078 (53.498)	lr 0.00456
Warmup Train [33][610/3239]	Time 0.515 (0.536)	Data 0.001 (0.028)	Loss 3.9688 (4.0520)	Top-1 acc 27.734 (30.014)	Top-5 acc 54.297 (53.514)	lr 0.00456
Warmup Train [33][620/3239]	Time 0.632 (0.536)	Data 0.001 (0.028)	Loss 4.0411 (4.0528)	Top-1 acc 34.766 (30.017)	Top-5 acc 58.594 (53.502)	lr 0.00456
Warmup Train [33][630/3239]	Time 0.529 (0.535)	Data 0.001 (0.027)	Loss 4.1683 (4.0525)	Top-1 acc 27.344 (30.029)	Top-5 acc 51.562 (53.512)	lr 0.00455
Warmup Train [33][640/3239]	Time 0.503 (0.535)	Data 0.001 (0.027)	Loss 4.0348 (4.0521)	Top-1 acc 30.469 (30.045)	Top-5 acc 51.562 (53.508)	lr 0.00455
Warmup Train [33][650/3239]	Time 0.503 (0.535)	Data 0.001 (0.027)	Loss 3.9696 (4.0515)	Top-1 acc 30.859 (30.069)	Top-5 acc 57.422 (53.525)	lr 0.00455
Warmup Train [33][660/3239]	Time 0.302 (0.534)	Data 0.001 (0.026)	Loss 4.1833 (4.0519)	Top-1 acc 23.828 (30.077)	Top-5 acc 45.703 (53.509)	lr 0.00454
Warmup Train [33][670/3239]	Time 0.500 (0.533)	Data 0.001 (0.026)	Loss 4.2362 (4.0522)	Top-1 acc 29.297 (30.091)	Top-5 acc 50.391 (53.506)	lr 0.00454
Warmup Train [33][680/3239]	Time 0.458 (0.533)	Data 0.001 (0.026)	Loss 4.0828 (4.0514)	Top-1 acc 32.422 (30.121)	Top-5 acc 53.906 (53.518)	lr 0.00454
Warmup Train [33][690/3239]	Time 0.301 (0.533)	Data 0.001 (0.026)	Loss 3.9343 (4.0507)	Top-1 acc 31.250 (30.133)	Top-5 acc 55.859 (53.520)	lr 0.00453
Warmup Train [33][700/3239]	Time 0.536 (0.533)	Data 0.001 (0.025)	Loss 3.8542 (4.0509)	Top-1 acc 33.594 (30.130)	Top-5 acc 54.297 (53.520)	lr 0.00453
Warmup Train [33][710/3239]	Time 0.579 (0.532)	Data 0.001 (0.025)	Loss 3.9792 (4.0510)	Top-1 acc 30.469 (30.119)	Top-5 acc 54.688 (53.522)	lr 0.00452
Warmup Train [33][720/3239]	Time 0.461 (0.531)	Data 0.001 (0.025)	Loss 3.9830 (4.0512)	Top-1 acc 32.031 (30.109)	Top-5 acc 55.859 (53.529)	lr 0.00452
Warmup Train [33][730/3239]	Time 0.459 (0.531)	Data 0.001 (0.024)	Loss 4.1135 (4.0516)	Top-1 acc 31.641 (30.107)	Top-5 acc 52.734 (53.527)	lr 0.00452
Warmup Train [33][740/3239]	Time 0.534 (0.530)	Data 0.001 (0.024)	Loss 3.9571 (4.0521)	Top-1 acc 33.594 (30.104)	Top-5 acc 53.516 (53.498)	lr 0.00451
Warmup Train [33][750/3239]	Time 0.380 (0.530)	Data 0.001 (0.024)	Loss 3.9350 (4.0512)	Top-1 acc 30.469 (30.129)	Top-5 acc 56.641 (53.522)	lr 0.00451
Warmup Train [33][760/3239]	Time 0.588 (0.530)	Data 0.001 (0.024)	Loss 4.1007 (4.0508)	Top-1 acc 29.688 (30.125)	Top-5 acc 53.906 (53.523)	lr 0.00451
Warmup Train [33][770/3239]	Time 0.495 (0.530)	Data 0.001 (0.024)	Loss 3.9618 (4.0501)	Top-1 acc 30.859 (30.132)	Top-5 acc 51.562 (53.527)	lr 0.00450
Warmup Train [33][780/3239]	Time 0.374 (0.529)	Data 0.001 (0.023)	Loss 4.1263 (4.0499)	Top-1 acc 30.078 (30.140)	Top-5 acc 51.562 (53.534)	lr 0.00450
Warmup Train [33][790/3239]	Time 0.447 (0.529)	Data 0.001 (0.023)	Loss 4.0527 (4.0502)	Top-1 acc 28.125 (30.128)	Top-5 acc 51.172 (53.526)	lr 0.00450
Warmup Train [33][800/3239]	Time 0.533 (0.529)	Data 0.001 (0.023)	Loss 4.2503 (4.0501)	Top-1 acc 28.516 (30.120)	Top-5 acc 51.562 (53.527)	lr 0.00449
Warmup Train [33][810/3239]	Time 0.496 (0.529)	Data 0.001 (0.023)	Loss 3.9146 (4.0507)	Top-1 acc 31.641 (30.102)	Top-5 acc 55.078 (53.505)	lr 0.00449
Warmup Train [33][820/3239]	Time 0.568 (0.529)	Data 0.001 (0.022)	Loss 4.0574 (4.0511)	Top-1 acc 30.859 (30.100)	Top-5 acc 52.734 (53.511)	lr 0.00449
Warmup Train [33][830/3239]	Time 0.429 (0.529)	Data 0.001 (0.022)	Loss 3.9803 (4.0516)	Top-1 acc 32.031 (30.088)	Top-5 acc 54.688 (53.506)	lr 0.00448
Warmup Train [33][840/3239]	Time 0.662 (0.529)	Data 0.001 (0.022)	Loss 3.9834 (4.0512)	Top-1 acc 31.250 (30.097)	Top-5 acc 56.250 (53.520)	lr 0.00448
Warmup Train [33][850/3239]	Time 0.424 (0.528)	Data 0.001 (0.022)	Loss 4.1321 (4.0514)	Top-1 acc 29.297 (30.079)	Top-5 acc 51.172 (53.518)	lr 0.00448
Warmup Train [33][860/3239]	Time 0.576 (0.528)	Data 0.001 (0.022)	Loss 3.8895 (4.0516)	Top-1 acc 32.031 (30.066)	Top-5 acc 55.469 (53.501)	lr 0.00447
Warmup Train [33][870/3239]	Time 0.457 (0.528)	Data 0.001 (0.021)	Loss 3.9720 (4.0513)	Top-1 acc 34.375 (30.088)	Top-5 acc 55.859 (53.510)	lr 0.00447
Warmup Train [33][880/3239]	Time 0.494 (0.528)	Data 0.001 (0.022)	Loss 4.0817 (4.0513)	Top-1 acc 30.078 (30.083)	Top-5 acc 53.516 (53.509)	lr 0.00447
Warmup Train [33][890/3239]	Time 0.453 (0.528)	Data 0.001 (0.021)	Loss 4.0480 (4.0514)	Top-1 acc 31.641 (30.084)	Top-5 acc 54.688 (53.523)	lr 0.00446
Warmup Train [33][900/3239]	Time 0.446 (0.527)	Data 0.001 (0.021)	Loss 3.7535 (4.0508)	Top-1 acc 32.031 (30.088)	Top-5 acc 58.203 (53.530)	lr 0.00446
Warmup Train [33][910/3239]	Time 0.467 (0.527)	Data 0.001 (0.021)	Loss 4.0147 (4.0511)	Top-1 acc 33.203 (30.087)	Top-5 acc 53.125 (53.525)	lr 0.00446
Warmup Train [33][920/3239]	Time 0.553 (0.527)	Data 0.001 (0.021)	Loss 4.0712 (4.0512)	Top-1 acc 28.906 (30.093)	Top-5 acc 55.859 (53.521)	lr 0.00445
Warmup Train [33][930/3239]	Time 0.505 (0.527)	Data 0.001 (0.021)	Loss 4.3294 (4.0515)	Top-1 acc 28.906 (30.098)	Top-5 acc 48.438 (53.521)	lr 0.00445
Warmup Train [33][940/3239]	Time 0.663 (0.527)	Data 0.001 (0.020)	Loss 4.2990 (4.0514)	Top-1 acc 24.609 (30.096)	Top-5 acc 43.359 (53.523)	lr 0.00445
Warmup Train [33][950/3239]	Time 0.547 (0.527)	Data 0.001 (0.020)	Loss 4.1199 (4.0512)	Top-1 acc 27.734 (30.098)	Top-5 acc 54.297 (53.523)	lr 0.00444
Warmup Train [33][960/3239]	Time 0.416 (0.526)	Data 0.001 (0.020)	Loss 3.9694 (4.0510)	Top-1 acc 35.938 (30.110)	Top-5 acc 55.859 (53.531)	lr 0.00444
Warmup Train [33][970/3239]	Time 0.406 (0.526)	Data 0.001 (0.020)	Loss 4.0283 (4.0511)	Top-1 acc 28.516 (30.094)	Top-5 acc 52.344 (53.526)	lr 0.00443
Warmup Train [33][980/3239]	Time 0.543 (0.526)	Data 0.002 (0.020)	Loss 4.0264 (4.0508)	Top-1 acc 31.250 (30.092)	Top-5 acc 56.250 (53.532)	lr 0.00443
Warmup Train [33][990/3239]	Time 0.542 (0.525)	Data 0.001 (0.020)	Loss 4.0203 (4.0509)	Top-1 acc 32.812 (30.095)	Top-5 acc 53.906 (53.533)	lr 0.00443
Warmup Train [33][1000/3239]	Time 0.566 (0.525)	Data 0.001 (0.020)	Loss 4.0221 (4.0509)	Top-1 acc 32.812 (30.093)	Top-5 acc 52.344 (53.533)	lr 0.00442
Warmup Train [33][1010/3239]	Time 0.435 (0.524)	Data 0.001 (0.019)	Loss 4.1177 (4.0509)	Top-1 acc 30.469 (30.094)	Top-5 acc 53.516 (53.538)	lr 0.00442
Warmup Train [33][1020/3239]	Time 0.492 (0.524)	Data 0.001 (0.019)	Loss 4.1073 (4.0510)	Top-1 acc 29.297 (30.100)	Top-5 acc 54.688 (53.539)	lr 0.00442
Warmup Train [33][1030/3239]	Time 0.619 (0.524)	Data 0.001 (0.019)	Loss 4.1763 (4.0513)	Top-1 acc 28.906 (30.087)	Top-5 acc 50.000 (53.533)	lr 0.00441
Warmup Train [33][1040/3239]	Time 0.367 (0.524)	Data 0.001 (0.019)	Loss 4.2899 (4.0516)	Top-1 acc 25.781 (30.087)	Top-5 acc 48.047 (53.532)	lr 0.00441
Warmup Train [33][1050/3239]	Time 0.376 (0.524)	Data 0.001 (0.019)	Loss 4.0668 (4.0517)	Top-1 acc 27.344 (30.070)	Top-5 acc 53.516 (53.521)	lr 0.00441
Warmup Train [33][1060/3239]	Time 0.460 (0.524)	Data 0.003 (0.019)	Loss 4.1007 (4.0518)	Top-1 acc 30.859 (30.063)	Top-5 acc 51.172 (53.515)	lr 0.00440
Warmup Train [33][1070/3239]	Time 0.518 (0.524)	Data 0.001 (0.019)	Loss 4.1199 (4.0511)	Top-1 acc 28.906 (30.074)	Top-5 acc 51.953 (53.529)	lr 0.00440
Warmup Train [33][1080/3239]	Time 0.676 (0.524)	Data 0.001 (0.019)	Loss 3.8581 (4.0507)	Top-1 acc 32.422 (30.073)	Top-5 acc 57.031 (53.538)	lr 0.00440
Warmup Train [33][1090/3239]	Time 0.461 (0.524)	Data 0.001 (0.019)	Loss 4.2107 (4.0512)	Top-1 acc 27.344 (30.053)	Top-5 acc 47.266 (53.526)	lr 0.00439
Warmup Train [33][1100/3239]	Time 0.507 (0.524)	Data 0.001 (0.019)	Loss 4.0422 (4.0508)	Top-1 acc 34.375 (30.063)	Top-5 acc 53.906 (53.533)	lr 0.00439
Warmup Train [33][1110/3239]	Time 0.623 (0.523)	Data 0.001 (0.018)	Loss 4.3300 (4.0510)	Top-1 acc 28.906 (30.052)	Top-5 acc 49.219 (53.521)	lr 0.00439
Warmup Train [33][1120/3239]	Time 0.610 (0.523)	Data 0.001 (0.018)	Loss 4.1478 (4.0510)	Top-1 acc 25.391 (30.050)	Top-5 acc 51.172 (53.521)	lr 0.00438
Warmup Train [33][1130/3239]	Time 0.608 (0.523)	Data 0.001 (0.018)	Loss 3.8811 (4.0508)	Top-1 acc 33.594 (30.046)	Top-5 acc 56.250 (53.518)	lr 0.00438
Warmup Train [33][1140/3239]	Time 0.475 (0.523)	Data 0.001 (0.018)	Loss 4.1773 (4.0506)	Top-1 acc 30.078 (30.057)	Top-5 acc 49.219 (53.519)	lr 0.00438
Warmup Train [33][1150/3239]	Time 0.426 (0.523)	Data 0.001 (0.018)	Loss 4.1028 (4.0504)	Top-1 acc 28.906 (30.064)	Top-5 acc 53.906 (53.529)	lr 0.00437
Warmup Train [33][1160/3239]	Time 0.657 (0.523)	Data 0.001 (0.018)	Loss 4.0620 (4.0507)	Top-1 acc 26.172 (30.070)	Top-5 acc 51.172 (53.522)	lr 0.00437
Warmup Train [33][1170/3239]	Time 0.603 (0.523)	Data 0.001 (0.018)	Loss 3.9898 (4.0507)	Top-1 acc 34.375 (30.070)	Top-5 acc 57.812 (53.526)	lr 0.00437
Warmup Train [33][1180/3239]	Time 0.588 (0.523)	Data 0.001 (0.018)	Loss 4.0275 (4.0505)	Top-1 acc 32.422 (30.075)	Top-5 acc 55.078 (53.531)	lr 0.00436
Warmup Train [33][1190/3239]	Time 0.591 (0.523)	Data 0.001 (0.017)	Loss 4.0541 (4.0504)	Top-1 acc 28.125 (30.075)	Top-5 acc 53.125 (53.541)	lr 0.00436
Warmup Train [33][1200/3239]	Time 0.608 (0.522)	Data 0.001 (0.017)	Loss 4.1751 (4.0509)	Top-1 acc 26.953 (30.061)	Top-5 acc 54.297 (53.528)	lr 0.00436
Warmup Train [33][1210/3239]	Time 0.591 (0.522)	Data 0.001 (0.017)	Loss 4.1336 (4.0512)	Top-1 acc 32.812 (30.065)	Top-5 acc 50.781 (53.523)	lr 0.00435
Warmup Train [33][1220/3239]	Time 0.334 (0.522)	Data 0.001 (0.017)	Loss 4.2202 (4.0513)	Top-1 acc 23.047 (30.052)	Top-5 acc 49.219 (53.518)	lr 0.00435
Warmup Train [33][1230/3239]	Time 0.487 (0.522)	Data 0.001 (0.017)	Loss 4.0940 (4.0511)	Top-1 acc 31.250 (30.055)	Top-5 acc 51.562 (53.519)	lr 0.00435
Warmup Train [33][1240/3239]	Time 0.341 (0.522)	Data 0.001 (0.017)	Loss 4.0173 (4.0504)	Top-1 acc 29.688 (30.070)	Top-5 acc 53.516 (53.528)	lr 0.00434
Warmup Train [33][1250/3239]	Time 0.522 (0.522)	Data 0.001 (0.017)	Loss 4.1618 (4.0506)	Top-1 acc 30.078 (30.075)	Top-5 acc 51.562 (53.523)	lr 0.00434
Warmup Train [33][1260/3239]	Time 0.378 (0.522)	Data 0.001 (0.017)	Loss 4.0375 (4.0506)	Top-1 acc 30.859 (30.077)	Top-5 acc 52.344 (53.530)	lr 0.00434
Warmup Train [33][1270/3239]	Time 0.471 (0.521)	Data 0.001 (0.017)	Loss 4.0687 (4.0500)	Top-1 acc 31.641 (30.086)	Top-5 acc 57.422 (53.543)	lr 0.00433
Warmup Train [33][1280/3239]	Time 0.352 (0.521)	Data 0.001 (0.017)	Loss 4.2020 (4.0504)	Top-1 acc 30.078 (30.084)	Top-5 acc 51.172 (53.544)	lr 0.00433
Warmup Train [33][1290/3239]	Time 0.352 (0.521)	Data 0.001 (0.017)	Loss 4.0134 (4.0508)	Top-1 acc 28.906 (30.075)	Top-5 acc 55.859 (53.539)	lr 0.00433
Warmup Train [33][1300/3239]	Time 0.588 (0.521)	Data 0.001 (0.017)	Loss 3.8245 (4.0511)	Top-1 acc 35.938 (30.077)	Top-5 acc 59.375 (53.532)	lr 0.00432
Warmup Train [33][1310/3239]	Time 0.422 (0.520)	Data 0.001 (0.016)	Loss 4.2936 (4.0512)	Top-1 acc 25.781 (30.071)	Top-5 acc 45.703 (53.530)	lr 0.00432
Warmup Train [33][1320/3239]	Time 0.481 (0.520)	Data 0.001 (0.016)	Loss 3.9157 (4.0513)	Top-1 acc 35.938 (30.078)	Top-5 acc 56.641 (53.531)	lr 0.00431
Warmup Train [33][1330/3239]	Time 0.645 (0.520)	Data 0.001 (0.016)	Loss 3.7388 (4.0511)	Top-1 acc 33.984 (30.085)	Top-5 acc 61.328 (53.538)	lr 0.00431
Warmup Train [33][1340/3239]	Time 0.653 (0.520)	Data 0.001 (0.016)	Loss 4.2265 (4.0511)	Top-1 acc 25.391 (30.081)	Top-5 acc 45.312 (53.544)	lr 0.00431
Warmup Train [33][1350/3239]	Time 0.402 (0.520)	Data 0.001 (0.016)	Loss 4.3015 (4.0510)	Top-1 acc 25.391 (30.084)	Top-5 acc 45.312 (53.544)	lr 0.00430
Warmup Train [33][1360/3239]	Time 0.514 (0.520)	Data 0.001 (0.016)	Loss 3.9765 (4.0511)	Top-1 acc 32.812 (30.082)	Top-5 acc 52.734 (53.544)	lr 0.00430
Warmup Train [33][1370/3239]	Time 0.478 (0.520)	Data 0.001 (0.016)	Loss 4.0491 (4.0504)	Top-1 acc 30.078 (30.097)	Top-5 acc 51.172 (53.555)	lr 0.00430
Warmup Train [33][1380/3239]	Time 0.413 (0.519)	Data 0.001 (0.016)	Loss 3.9631 (4.0507)	Top-1 acc 30.469 (30.098)	Top-5 acc 57.812 (53.549)	lr 0.00429
Warmup Train [33][1390/3239]	Time 0.421 (0.519)	Data 0.001 (0.016)	Loss 4.0693 (4.0509)	Top-1 acc 33.984 (30.094)	Top-5 acc 55.469 (53.543)	lr 0.00429
Warmup Train [33][1400/3239]	Time 0.652 (0.519)	Data 0.001 (0.016)	Loss 4.2010 (4.0510)	Top-1 acc 23.438 (30.091)	Top-5 acc 49.609 (53.535)	lr 0.00429
Warmup Train [33][1410/3239]	Time 0.723 (0.519)	Data 0.001 (0.016)	Loss 4.0465 (4.0510)	Top-1 acc 29.297 (30.093)	Top-5 acc 56.641 (53.529)	lr 0.00428
Warmup Train [33][1420/3239]	Time 0.535 (0.519)	Data 0.002 (0.016)	Loss 3.8391 (4.0514)	Top-1 acc 38.672 (30.098)	Top-5 acc 57.422 (53.522)	lr 0.00428
Warmup Train [33][1430/3239]	Time 0.602 (0.519)	Data 0.001 (0.016)	Loss 4.0356 (4.0512)	Top-1 acc 31.250 (30.098)	Top-5 acc 54.688 (53.524)	lr 0.00428
Warmup Train [33][1440/3239]	Time 0.489 (0.519)	Data 0.001 (0.016)	Loss 4.0322 (4.0514)	Top-1 acc 35.547 (30.099)	Top-5 acc 53.125 (53.521)	lr 0.00427
Warmup Train [33][1450/3239]	Time 0.561 (0.519)	Data 0.001 (0.015)	Loss 4.0570 (4.0516)	Top-1 acc 28.906 (30.103)	Top-5 acc 52.344 (53.519)	lr 0.00427
Warmup Train [33][1460/3239]	Time 0.503 (0.519)	Data 0.001 (0.015)	Loss 4.0040 (4.0516)	Top-1 acc 29.688 (30.097)	Top-5 acc 54.297 (53.517)	lr 0.00427
Warmup Train [33][1470/3239]	Time 0.471 (0.519)	Data 0.001 (0.015)	Loss 4.0917 (4.0517)	Top-1 acc 31.250 (30.101)	Top-5 acc 56.250 (53.514)	lr 0.00426
Warmup Train [33][1480/3239]	Time 0.514 (0.519)	Data 0.001 (0.015)	Loss 3.9949 (4.0518)	Top-1 acc 30.078 (30.093)	Top-5 acc 56.250 (53.512)	lr 0.00426
Warmup Train [33][1490/3239]	Time 0.565 (0.519)	Data 0.001 (0.015)	Loss 4.0317 (4.0518)	Top-1 acc 28.125 (30.093)	Top-5 acc 54.297 (53.511)	lr 0.00426
Warmup Train [33][1500/3239]	Time 0.468 (0.519)	Data 0.001 (0.015)	Loss 4.1233 (4.0519)	Top-1 acc 27.344 (30.087)	Top-5 acc 50.781 (53.510)	lr 0.00425
Warmup Train [33][1510/3239]	Time 0.844 (0.519)	Data 0.001 (0.015)	Loss 4.2251 (4.0518)	Top-1 acc 26.562 (30.093)	Top-5 acc 48.828 (53.516)	lr 0.00425
Warmup Train [33][1520/3239]	Time 0.404 (0.519)	Data 0.002 (0.015)	Loss 4.2143 (4.0516)	Top-1 acc 25.781 (30.092)	Top-5 acc 55.469 (53.525)	lr 0.00425
Warmup Train [33][1530/3239]	Time 0.438 (0.519)	Data 0.001 (0.015)	Loss 4.0350 (4.0514)	Top-1 acc 31.250 (30.097)	Top-5 acc 53.906 (53.532)	lr 0.00424
Warmup Train [33][1540/3239]	Time 0.559 (0.519)	Data 0.001 (0.015)	Loss 3.9422 (4.0511)	Top-1 acc 31.250 (30.102)	Top-5 acc 60.156 (53.544)	lr 0.00424
Warmup Train [33][1550/3239]	Time 0.460 (0.518)	Data 0.001 (0.015)	Loss 3.9304 (4.0512)	Top-1 acc 31.641 (30.093)	Top-5 acc 54.688 (53.545)	lr 0.00424
Warmup Train [33][1560/3239]	Time 0.633 (0.518)	Data 0.001 (0.015)	Loss 4.3353 (4.0514)	Top-1 acc 24.219 (30.094)	Top-5 acc 48.828 (53.540)	lr 0.00423
Warmup Train [33][1570/3239]	Time 0.473 (0.518)	Data 0.001 (0.015)	Loss 4.0837 (4.0515)	Top-1 acc 28.125 (30.094)	Top-5 acc 55.469 (53.544)	lr 0.00423
Warmup Train [33][1580/3239]	Time 0.551 (0.518)	Data 0.001 (0.015)	Loss 4.0919 (4.0515)	Top-1 acc 30.859 (30.101)	Top-5 acc 48.828 (53.542)	lr 0.00423
Warmup Train [33][1590/3239]	Time 0.509 (0.517)	Data 0.001 (0.015)	Loss 4.0580 (4.0515)	Top-1 acc 26.172 (30.100)	Top-5 acc 51.953 (53.543)	lr 0.00422
Warmup Train [33][1600/3239]	Time 0.611 (0.517)	Data 0.001 (0.015)	Loss 3.9356 (4.0514)	Top-1 acc 32.031 (30.102)	Top-5 acc 57.422 (53.548)	lr 0.00422
Warmup Train [33][1610/3239]	Time 0.512 (0.517)	Data 0.001 (0.015)	Loss 3.9232 (4.0513)	Top-1 acc 33.203 (30.108)	Top-5 acc 58.594 (53.553)	lr 0.00422
Warmup Train [33][1620/3239]	Time 0.675 (0.517)	Data 0.001 (0.014)	Loss 4.0419 (4.0514)	Top-1 acc 33.594 (30.110)	Top-5 acc 55.078 (53.559)	lr 0.00421
Warmup Train [33][1630/3239]	Time 0.604 (0.517)	Data 0.001 (0.014)	Loss 4.0975 (4.0513)	Top-1 acc 31.250 (30.116)	Top-5 acc 48.828 (53.555)	lr 0.00421
Warmup Train [33][1640/3239]	Time 0.585 (0.517)	Data 0.001 (0.014)	Loss 4.0659 (4.0510)	Top-1 acc 29.297 (30.125)	Top-5 acc 53.516 (53.563)	lr 0.00421
Warmup Train [33][1650/3239]	Time 0.506 (0.517)	Data 0.001 (0.014)	Loss 3.9795 (4.0511)	Top-1 acc 31.250 (30.121)	Top-5 acc 55.078 (53.558)	lr 0.00420
Warmup Train [33][1660/3239]	Time 0.406 (0.517)	Data 0.001 (0.014)	Loss 4.1558 (4.0509)	Top-1 acc 30.078 (30.122)	Top-5 acc 51.953 (53.565)	lr 0.00420
Warmup Train [33][1670/3239]	Time 0.376 (0.517)	Data 0.001 (0.014)	Loss 3.8688 (4.0508)	Top-1 acc 30.078 (30.125)	Top-5 acc 59.766 (53.564)	lr 0.00420
Warmup Train [33][1680/3239]	Time 0.496 (0.517)	Data 0.001 (0.014)	Loss 4.2288 (4.0509)	Top-1 acc 27.734 (30.120)	Top-5 acc 51.172 (53.561)	lr 0.00419
Warmup Train [33][1690/3239]	Time 0.515 (0.517)	Data 0.001 (0.014)	Loss 3.9893 (4.0510)	Top-1 acc 31.250 (30.117)	Top-5 acc 55.078 (53.562)	lr 0.00419
Warmup Train [33][1700/3239]	Time 0.572 (0.517)	Data 0.001 (0.014)	Loss 4.0274 (4.0510)	Top-1 acc 31.641 (30.119)	Top-5 acc 51.953 (53.559)	lr 0.00419
Warmup Train [33][1710/3239]	Time 0.590 (0.517)	Data 0.002 (0.014)	Loss 4.0588 (4.0511)	Top-1 acc 27.344 (30.115)	Top-5 acc 51.172 (53.554)	lr 0.00418
Warmup Train [33][1720/3239]	Time 0.570 (0.517)	Data 0.001 (0.014)	Loss 4.1034 (4.0510)	Top-1 acc 29.297 (30.118)	Top-5 acc 51.953 (53.556)	lr 0.00418
Warmup Train [33][1730/3239]	Time 0.507 (0.517)	Data 0.001 (0.014)	Loss 4.0886 (4.0507)	Top-1 acc 33.984 (30.125)	Top-5 acc 52.734 (53.561)	lr 0.00418
Warmup Train [33][1740/3239]	Time 0.467 (0.517)	Data 0.001 (0.014)	Loss 4.1504 (4.0506)	Top-1 acc 25.391 (30.131)	Top-5 acc 48.828 (53.568)	lr 0.00417
Warmup Train [33][1750/3239]	Time 0.650 (0.517)	Data 0.001 (0.014)	Loss 4.0557 (4.0505)	Top-1 acc 30.859 (30.135)	Top-5 acc 56.250 (53.568)	lr 0.00417
Warmup Train [33][1760/3239]	Time 0.543 (0.517)	Data 0.001 (0.014)	Loss 4.1485 (4.0505)	Top-1 acc 27.734 (30.133)	Top-5 acc 51.172 (53.569)	lr 0.00417
Warmup Train [33][1770/3239]	Time 0.450 (0.517)	Data 0.001 (0.014)	Loss 4.0945 (4.0506)	Top-1 acc 27.734 (30.131)	Top-5 acc 51.562 (53.569)	lr 0.00416
Warmup Train [33][1780/3239]	Time 0.414 (0.517)	Data 0.001 (0.014)	Loss 3.8716 (4.0506)	Top-1 acc 36.328 (30.133)	Top-5 acc 57.031 (53.565)	lr 0.00416
Warmup Train [33][1790/3239]	Time 0.424 (0.517)	Data 0.001 (0.014)	Loss 4.1522 (4.0502)	Top-1 acc 25.391 (30.141)	Top-5 acc 53.516 (53.576)	lr 0.00416
Warmup Train [33][1800/3239]	Time 0.363 (0.517)	Data 0.001 (0.014)	Loss 4.0936 (4.0505)	Top-1 acc 31.641 (30.137)	Top-5 acc 52.734 (53.568)	lr 0.00415
Warmup Train [33][1810/3239]	Time 0.485 (0.517)	Data 0.001 (0.014)	Loss 4.1054 (4.0504)	Top-1 acc 26.562 (30.133)	Top-5 acc 52.734 (53.562)	lr 0.00415
Warmup Train [33][1820/3239]	Time 0.562 (0.517)	Data 0.001 (0.014)	Loss 3.9469 (4.0507)	Top-1 acc 33.594 (30.122)	Top-5 acc 56.641 (53.557)	lr 0.00415
Warmup Train [33][1830/3239]	Time 0.630 (0.516)	Data 0.001 (0.014)	Loss 4.2306 (4.0511)	Top-1 acc 31.641 (30.119)	Top-5 acc 50.000 (53.545)	lr 0.00414
Warmup Train [33][1840/3239]	Time 0.514 (0.516)	Data 0.001 (0.014)	Loss 4.0093 (4.0513)	Top-1 acc 31.641 (30.115)	Top-5 acc 52.344 (53.538)	lr 0.00414
Warmup Train [33][1850/3239]	Time 0.427 (0.516)	Data 0.001 (0.014)	Loss 4.0228 (4.0510)	Top-1 acc 33.594 (30.116)	Top-5 acc 54.688 (53.543)	lr 0.00414
Warmup Train [33][1860/3239]	Time 0.574 (0.516)	Data 0.001 (0.014)	Loss 4.0391 (4.0509)	Top-1 acc 31.250 (30.117)	Top-5 acc 54.688 (53.546)	lr 0.00413
Warmup Train [33][1870/3239]	Time 0.455 (0.516)	Data 0.001 (0.013)	Loss 4.0669 (4.0512)	Top-1 acc 31.641 (30.113)	Top-5 acc 51.562 (53.539)	lr 0.00413
Warmup Train [33][1880/3239]	Time 0.524 (0.516)	Data 0.001 (0.013)	Loss 3.8640 (4.0509)	Top-1 acc 33.203 (30.115)	Top-5 acc 57.031 (53.542)	lr 0.00413
Warmup Train [33][1890/3239]	Time 0.505 (0.516)	Data 0.001 (0.013)	Loss 4.0609 (4.0507)	Top-1 acc 32.812 (30.122)	Top-5 acc 54.297 (53.546)	lr 0.00412
Warmup Train [33][1900/3239]	Time 0.649 (0.516)	Data 0.001 (0.013)	Loss 4.0229 (4.0506)	Top-1 acc 32.422 (30.125)	Top-5 acc 54.297 (53.550)	lr 0.00412
Warmup Train [33][1910/3239]	Time 0.497 (0.516)	Data 0.001 (0.013)	Loss 4.2242 (4.0507)	Top-1 acc 27.344 (30.127)	Top-5 acc 50.391 (53.546)	lr 0.00412
Warmup Train [33][1920/3239]	Time 0.569 (0.516)	Data 0.001 (0.013)	Loss 4.0390 (4.0506)	Top-1 acc 30.078 (30.134)	Top-5 acc 55.859 (53.550)	lr 0.00411
Warmup Train [33][1930/3239]	Time 0.511 (0.516)	Data 0.002 (0.013)	Loss 3.9515 (4.0503)	Top-1 acc 34.375 (30.151)	Top-5 acc 54.688 (53.549)	lr 0.00411
Warmup Train [33][1940/3239]	Time 0.582 (0.516)	Data 0.001 (0.013)	Loss 4.0362 (4.0506)	Top-1 acc 27.344 (30.144)	Top-5 acc 54.297 (53.542)	lr 0.00411
Warmup Train [33][1950/3239]	Time 0.476 (0.516)	Data 0.001 (0.013)	Loss 3.9618 (4.0504)	Top-1 acc 30.078 (30.147)	Top-5 acc 52.734 (53.541)	lr 0.00410
Warmup Train [33][1960/3239]	Time 0.473 (0.516)	Data 0.001 (0.013)	Loss 3.9409 (4.0505)	Top-1 acc 37.891 (30.150)	Top-5 acc 55.859 (53.536)	lr 0.00410
Warmup Train [33][1970/3239]	Time 0.512 (0.516)	Data 0.001 (0.013)	Loss 4.0250 (4.0503)	Top-1 acc 31.641 (30.155)	Top-5 acc 53.516 (53.538)	lr 0.00410
Warmup Train [33][1980/3239]	Time 0.452 (0.515)	Data 0.001 (0.013)	Loss 4.0745 (4.0504)	Top-1 acc 29.688 (30.146)	Top-5 acc 53.125 (53.539)	lr 0.00409
Warmup Train [33][1990/3239]	Time 0.601 (0.516)	Data 0.001 (0.013)	Loss 3.9465 (4.0503)	Top-1 acc 33.984 (30.146)	Top-5 acc 55.078 (53.537)	lr 0.00409
Warmup Train [33][2000/3239]	Time 0.463 (0.516)	Data 0.001 (0.013)	Loss 4.1253 (4.0503)	Top-1 acc 25.391 (30.145)	Top-5 acc 51.953 (53.534)	lr 0.00409
Warmup Train [33][2010/3239]	Time 0.618 (0.516)	Data 0.001 (0.013)	Loss 4.1272 (4.0505)	Top-1 acc 31.641 (30.140)	Top-5 acc 51.172 (53.528)	lr 0.00408
Warmup Train [33][2020/3239]	Time 0.567 (0.516)	Data 0.001 (0.013)	Loss 4.0516 (4.0507)	Top-1 acc 28.906 (30.141)	Top-5 acc 49.609 (53.522)	lr 0.00408
Warmup Train [33][2030/3239]	Time 0.614 (0.516)	Data 0.001 (0.013)	Loss 4.0409 (4.0510)	Top-1 acc 28.125 (30.142)	Top-5 acc 53.906 (53.515)	lr 0.00408
Warmup Train [33][2040/3239]	Time 0.467 (0.516)	Data 0.001 (0.013)	Loss 3.8513 (4.0510)	Top-1 acc 33.984 (30.146)	Top-5 acc 57.812 (53.519)	lr 0.00407
Warmup Train [33][2050/3239]	Time 0.318 (0.515)	Data 0.001 (0.013)	Loss 3.9675 (4.0511)	Top-1 acc 35.156 (30.150)	Top-5 acc 55.859 (53.514)	lr 0.00407
Warmup Train [33][2060/3239]	Time 0.405 (0.515)	Data 0.001 (0.013)	Loss 4.0629 (4.0511)	Top-1 acc 28.906 (30.149)	Top-5 acc 53.516 (53.516)	lr 0.00407
Warmup Train [33][2070/3239]	Time 0.510 (0.515)	Data 0.001 (0.013)	Loss 3.9444 (4.0511)	Top-1 acc 31.641 (30.149)	Top-5 acc 56.641 (53.514)	lr 0.00406
Warmup Train [33][2080/3239]	Time 0.431 (0.515)	Data 0.001 (0.013)	Loss 3.8616 (4.0513)	Top-1 acc 33.594 (30.148)	Top-5 acc 56.250 (53.510)	lr 0.00406
Warmup Train [33][2090/3239]	Time 0.680 (0.515)	Data 0.001 (0.013)	Loss 3.8670 (4.0510)	Top-1 acc 34.375 (30.153)	Top-5 acc 59.766 (53.520)	lr 0.00406
Warmup Train [33][2100/3239]	Time 0.540 (0.515)	Data 0.001 (0.013)	Loss 3.9972 (4.0507)	Top-1 acc 32.422 (30.161)	Top-5 acc 54.688 (53.525)	lr 0.00405
Warmup Train [33][2110/3239]	Time 0.508 (0.515)	Data 0.001 (0.013)	Loss 4.0359 (4.0506)	Top-1 acc 30.859 (30.162)	Top-5 acc 54.297 (53.529)	lr 0.00405
Warmup Train [33][2120/3239]	Time 0.410 (0.515)	Data 0.001 (0.013)	Loss 4.0231 (4.0506)	Top-1 acc 33.203 (30.162)	Top-5 acc 55.078 (53.534)	lr 0.00405
Warmup Train [33][2130/3239]	Time 0.376 (0.515)	Data 0.001 (0.013)	Loss 3.9277 (4.0504)	Top-1 acc 33.203 (30.164)	Top-5 acc 52.344 (53.539)	lr 0.00404
Warmup Train [33][2140/3239]	Time 0.339 (0.515)	Data 0.001 (0.013)	Loss 3.9893 (4.0507)	Top-1 acc 28.906 (30.156)	Top-5 acc 52.344 (53.530)	lr 0.00404
Warmup Train [33][2150/3239]	Time 0.526 (0.515)	Data 0.001 (0.013)	Loss 3.8879 (4.0505)	Top-1 acc 32.812 (30.156)	Top-5 acc 58.984 (53.529)	lr 0.00404
Warmup Train [33][2160/3239]	Time 0.557 (0.515)	Data 0.001 (0.013)	Loss 4.0990 (4.0506)	Top-1 acc 31.250 (30.158)	Top-5 acc 52.344 (53.528)	lr 0.00403
Warmup Train [33][2170/3239]	Time 0.605 (0.515)	Data 0.001 (0.013)	Loss 4.0053 (4.0505)	Top-1 acc 26.953 (30.157)	Top-5 acc 53.516 (53.526)	lr 0.00403
Warmup Train [33][2180/3239]	Time 0.463 (0.515)	Data 0.001 (0.012)	Loss 4.0853 (4.0508)	Top-1 acc 28.516 (30.151)	Top-5 acc 52.344 (53.517)	lr 0.00403
Warmup Train [33][2190/3239]	Time 0.369 (0.515)	Data 0.001 (0.012)	Loss 4.0966 (4.0508)	Top-1 acc 28.906 (30.151)	Top-5 acc 53.516 (53.520)	lr 0.00402
Warmup Train [33][2200/3239]	Time 0.534 (0.515)	Data 0.001 (0.012)	Loss 4.0941 (4.0511)	Top-1 acc 32.422 (30.148)	Top-5 acc 50.391 (53.513)	lr 0.00402
Warmup Train [33][2210/3239]	Time 0.321 (0.515)	Data 0.002 (0.012)	Loss 3.9957 (4.0512)	Top-1 acc 32.812 (30.153)	Top-5 acc 51.172 (53.514)	lr 0.00402
Warmup Train [33][2220/3239]	Time 0.514 (0.515)	Data 0.001 (0.012)	Loss 4.2581 (4.0511)	Top-1 acc 24.219 (30.155)	Top-5 acc 48.828 (53.512)	lr 0.00401
Warmup Train [33][2230/3239]	Time 0.515 (0.515)	Data 0.001 (0.012)	Loss 4.2000 (4.0511)	Top-1 acc 23.828 (30.154)	Top-5 acc 46.875 (53.509)	lr 0.00401
Warmup Train [33][2240/3239]	Time 0.520 (0.515)	Data 0.001 (0.012)	Loss 4.0553 (4.0510)	Top-1 acc 30.469 (30.161)	Top-5 acc 52.344 (53.512)	lr 0.00401
Warmup Train [33][2250/3239]	Time 0.529 (0.515)	Data 0.001 (0.012)	Loss 4.1515 (4.0510)	Top-1 acc 30.078 (30.160)	Top-5 acc 48.438 (53.511)	lr 0.00400
Warmup Train [33][2260/3239]	Time 0.628 (0.515)	Data 0.001 (0.012)	Loss 4.1353 (4.0510)	Top-1 acc 31.641 (30.161)	Top-5 acc 50.781 (53.512)	lr 0.00400
Warmup Train [33][2270/3239]	Time 0.494 (0.515)	Data 0.001 (0.012)	Loss 4.0908 (4.0508)	Top-1 acc 30.078 (30.163)	Top-5 acc 52.734 (53.518)	lr 0.00400
Warmup Train [33][2280/3239]	Time 0.452 (0.515)	Data 0.001 (0.012)	Loss 4.1566 (4.0510)	Top-1 acc 28.516 (30.161)	Top-5 acc 52.344 (53.515)	lr 0.00399
Warmup Train [33][2290/3239]	Time 0.524 (0.515)	Data 0.001 (0.012)	Loss 4.0323 (4.0510)	Top-1 acc 32.031 (30.165)	Top-5 acc 51.172 (53.517)	lr 0.00399
Warmup Train [33][2300/3239]	Time 0.641 (0.515)	Data 0.001 (0.012)	Loss 4.0352 (4.0508)	Top-1 acc 32.812 (30.170)	Top-5 acc 58.594 (53.519)	lr 0.00399
Warmup Train [33][2310/3239]	Time 0.464 (0.515)	Data 0.001 (0.012)	Loss 3.9527 (4.0511)	Top-1 acc 31.250 (30.162)	Top-5 acc 58.594 (53.514)	lr 0.00398
Warmup Train [33][2320/3239]	Time 0.318 (0.515)	Data 0.001 (0.012)	Loss 3.9411 (4.0512)	Top-1 acc 31.641 (30.161)	Top-5 acc 52.734 (53.509)	lr 0.00398
Warmup Train [33][2330/3239]	Time 0.542 (0.515)	Data 0.001 (0.012)	Loss 4.0821 (4.0512)	Top-1 acc 27.734 (30.161)	Top-5 acc 50.781 (53.507)	lr 0.00398
Warmup Train [33][2340/3239]	Time 0.567 (0.515)	Data 0.001 (0.012)	Loss 4.1440 (4.0511)	Top-1 acc 26.172 (30.165)	Top-5 acc 54.297 (53.514)	lr 0.00397
Warmup Train [33][2350/3239]	Time 0.455 (0.515)	Data 0.001 (0.012)	Loss 4.1732 (4.0510)	Top-1 acc 31.641 (30.172)	Top-5 acc 47.656 (53.518)	lr 0.00397
Warmup Train [33][2360/3239]	Time 0.499 (0.515)	Data 0.001 (0.012)	Loss 4.0702 (4.0509)	Top-1 acc 31.641 (30.173)	Top-5 acc 55.078 (53.525)	lr 0.00397
Warmup Train [33][2370/3239]	Time 0.533 (0.515)	Data 0.001 (0.012)	Loss 3.9600 (4.0510)	Top-1 acc 32.812 (30.176)	Top-5 acc 53.906 (53.525)	lr 0.00396
Warmup Train [33][2380/3239]	Time 0.510 (0.515)	Data 0.001 (0.012)	Loss 4.0184 (4.0509)	Top-1 acc 33.984 (30.183)	Top-5 acc 57.812 (53.528)	lr 0.00396
Warmup Train [33][2390/3239]	Time 0.607 (0.515)	Data 0.001 (0.012)	Loss 3.9220 (4.0509)	Top-1 acc 32.422 (30.184)	Top-5 acc 56.641 (53.528)	lr 0.00396
Warmup Train [33][2400/3239]	Time 0.329 (0.515)	Data 0.001 (0.012)	Loss 4.2527 (4.0511)	Top-1 acc 30.078 (30.183)	Top-5 acc 50.391 (53.523)	lr 0.00395
Warmup Train [33][2410/3239]	Time 0.504 (0.515)	Data 0.001 (0.012)	Loss 4.0455 (4.0509)	Top-1 acc 32.031 (30.183)	Top-5 acc 53.906 (53.525)	lr 0.00395
Warmup Train [33][2420/3239]	Time 0.572 (0.515)	Data 0.001 (0.012)	Loss 3.8759 (4.0509)	Top-1 acc 35.156 (30.181)	Top-5 acc 58.594 (53.525)	lr 0.00395
Warmup Train [33][2430/3239]	Time 0.534 (0.515)	Data 0.001 (0.012)	Loss 4.1942 (4.0509)	Top-1 acc 29.688 (30.179)	Top-5 acc 47.266 (53.528)	lr 0.00394
Warmup Train [33][2440/3239]	Time 0.518 (0.515)	Data 0.001 (0.012)	Loss 3.9273 (4.0506)	Top-1 acc 29.297 (30.186)	Top-5 acc 53.125 (53.536)	lr 0.00394
Warmup Train [33][2450/3239]	Time 0.595 (0.515)	Data 0.001 (0.012)	Loss 3.8355 (4.0505)	Top-1 acc 32.422 (30.187)	Top-5 acc 57.422 (53.536)	lr 0.00394
Warmup Train [33][2460/3239]	Time 0.418 (0.515)	Data 0.001 (0.012)	Loss 4.0325 (4.0505)	Top-1 acc 28.125 (30.193)	Top-5 acc 53.906 (53.540)	lr 0.00393
Warmup Train [33][2470/3239]	Time 0.631 (0.515)	Data 0.001 (0.012)	Loss 4.3121 (4.0507)	Top-1 acc 26.953 (30.191)	Top-5 acc 48.047 (53.533)	lr 0.00393
Warmup Train [33][2480/3239]	Time 0.432 (0.515)	Data 0.001 (0.012)	Loss 3.9862 (4.0506)	Top-1 acc 33.203 (30.197)	Top-5 acc 53.906 (53.532)	lr 0.00393
Warmup Train [33][2490/3239]	Time 0.355 (0.515)	Data 0.001 (0.012)	Loss 4.1907 (4.0506)	Top-1 acc 31.641 (30.197)	Top-5 acc 53.906 (53.534)	lr 0.00392
Warmup Train [33][2500/3239]	Time 0.491 (0.514)	Data 0.001 (0.012)	Loss 4.1483 (4.0507)	Top-1 acc 26.562 (30.197)	Top-5 acc 51.562 (53.536)	lr 0.00392
Warmup Train [33][2510/3239]	Time 0.671 (0.515)	Data 0.001 (0.012)	Loss 4.0200 (4.0508)	Top-1 acc 30.078 (30.204)	Top-5 acc 56.250 (53.534)	lr 0.00392
Warmup Train [33][2520/3239]	Time 0.570 (0.515)	Data 0.001 (0.012)	Loss 3.9604 (4.0503)	Top-1 acc 33.203 (30.213)	Top-5 acc 55.859 (53.542)	lr 0.00392
Warmup Train [33][2530/3239]	Time 0.558 (0.515)	Data 0.001 (0.012)	Loss 3.8398 (4.0500)	Top-1 acc 33.594 (30.218)	Top-5 acc 55.859 (53.550)	lr 0.00391
Warmup Train [33][2540/3239]	Time 0.523 (0.515)	Data 0.002 (0.012)	Loss 3.9796 (4.0501)	Top-1 acc 34.375 (30.217)	Top-5 acc 55.469 (53.546)	lr 0.00391
Warmup Train [33][2550/3239]	Time 0.487 (0.515)	Data 0.001 (0.012)	Loss 3.8855 (4.0501)	Top-1 acc 31.641 (30.216)	Top-5 acc 61.328 (53.545)	lr 0.00391
Warmup Train [33][2560/3239]	Time 0.658 (0.515)	Data 0.001 (0.012)	Loss 4.1440 (4.0504)	Top-1 acc 26.562 (30.207)	Top-5 acc 50.000 (53.536)	lr 0.00390
Warmup Train [33][2570/3239]	Time 0.473 (0.515)	Data 0.001 (0.012)	Loss 3.7314 (4.0502)	Top-1 acc 35.547 (30.212)	Top-5 acc 58.984 (53.541)	lr 0.00390
Warmup Train [33][2580/3239]	Time 0.579 (0.515)	Data 0.001 (0.012)	Loss 3.9684 (4.0502)	Top-1 acc 34.375 (30.210)	Top-5 acc 53.906 (53.537)	lr 0.00390
Warmup Train [33][2590/3239]	Time 0.477 (0.515)	Data 0.001 (0.012)	Loss 4.0379 (4.0504)	Top-1 acc 29.297 (30.207)	Top-5 acc 55.469 (53.531)	lr 0.00389
Warmup Train [33][2600/3239]	Time 0.531 (0.515)	Data 0.001 (0.012)	Loss 3.9975 (4.0503)	Top-1 acc 30.859 (30.207)	Top-5 acc 54.688 (53.529)	lr 0.00389
Warmup Train [33][2610/3239]	Time 0.761 (0.514)	Data 0.001 (0.012)	Loss 3.9315 (4.0502)	Top-1 acc 31.641 (30.212)	Top-5 acc 58.984 (53.531)	lr 0.00389
Warmup Train [33][2620/3239]	Time 0.402 (0.514)	Data 0.001 (0.011)	Loss 3.9286 (4.0499)	Top-1 acc 33.984 (30.220)	Top-5 acc 54.297 (53.532)	lr 0.00388
Warmup Train [33][2630/3239]	Time 0.562 (0.514)	Data 0.001 (0.011)	Loss 4.0465 (4.0500)	Top-1 acc 34.375 (30.218)	Top-5 acc 54.297 (53.530)	lr 0.00388
Warmup Train [33][2640/3239]	Time 0.628 (0.515)	Data 0.001 (0.011)	Loss 4.3307 (4.0500)	Top-1 acc 25.391 (30.219)	Top-5 acc 43.750 (53.529)	lr 0.00388
Warmup Train [33][2650/3239]	Time 0.644 (0.514)	Data 0.001 (0.011)	Loss 4.2493 (4.0502)	Top-1 acc 24.219 (30.215)	Top-5 acc 46.484 (53.520)	lr 0.00387
Warmup Train [33][2660/3239]	Time 0.607 (0.514)	Data 0.001 (0.011)	Loss 4.2203 (4.0503)	Top-1 acc 28.906 (30.214)	Top-5 acc 50.391 (53.518)	lr 0.00387
Warmup Train [33][2670/3239]	Time 0.401 (0.514)	Data 0.001 (0.011)	Loss 3.9829 (4.0504)	Top-1 acc 29.297 (30.217)	Top-5 acc 52.734 (53.518)	lr 0.00387
Warmup Train [33][2680/3239]	Time 0.678 (0.514)	Data 0.001 (0.011)	Loss 4.2212 (4.0504)	Top-1 acc 29.688 (30.220)	Top-5 acc 48.047 (53.516)	lr 0.00386
Warmup Train [33][2690/3239]	Time 0.597 (0.514)	Data 0.001 (0.011)	Loss 4.0391 (4.0507)	Top-1 acc 31.250 (30.213)	Top-5 acc 54.688 (53.508)	lr 0.00386
Warmup Train [33][2700/3239]	Time 0.598 (0.514)	Data 0.001 (0.011)	Loss 4.0188 (4.0507)	Top-1 acc 29.688 (30.214)	Top-5 acc 51.172 (53.504)	lr 0.00386
Warmup Train [33][2710/3239]	Time 0.499 (0.514)	Data 0.001 (0.011)	Loss 4.2336 (4.0507)	Top-1 acc 28.125 (30.216)	Top-5 acc 48.047 (53.501)	lr 0.00385
Warmup Train [33][2720/3239]	Time 0.616 (0.514)	Data 0.001 (0.011)	Loss 3.9811 (4.0506)	Top-1 acc 29.297 (30.213)	Top-5 acc 55.469 (53.502)	lr 0.00385
Warmup Train [33][2730/3239]	Time 0.423 (0.514)	Data 0.001 (0.011)	Loss 4.1456 (4.0507)	Top-1 acc 23.828 (30.208)	Top-5 acc 50.000 (53.499)	lr 0.00385
Warmup Train [33][2740/3239]	Time 0.552 (0.514)	Data 0.001 (0.011)	Loss 3.7600 (4.0507)	Top-1 acc 34.766 (30.208)	Top-5 acc 56.641 (53.497)	lr 0.00384
Warmup Train [33][2750/3239]	Time 0.364 (0.514)	Data 0.001 (0.011)	Loss 4.0513 (4.0508)	Top-1 acc 30.469 (30.209)	Top-5 acc 54.688 (53.497)	lr 0.00384
Warmup Train [33][2760/3239]	Time 0.410 (0.514)	Data 0.001 (0.011)	Loss 4.1743 (4.0507)	Top-1 acc 26.953 (30.207)	Top-5 acc 53.125 (53.502)	lr 0.00384
Warmup Train [33][2770/3239]	Time 0.633 (0.514)	Data 0.001 (0.011)	Loss 3.9552 (4.0506)	Top-1 acc 35.547 (30.209)	Top-5 acc 54.688 (53.503)	lr 0.00383
Warmup Train [33][2780/3239]	Time 0.783 (0.514)	Data 0.001 (0.011)	Loss 4.0101 (4.0508)	Top-1 acc 33.594 (30.204)	Top-5 acc 54.297 (53.499)	lr 0.00383
Warmup Train [33][2790/3239]	Time 0.620 (0.514)	Data 0.001 (0.011)	Loss 3.9923 (4.0506)	Top-1 acc 32.422 (30.212)	Top-5 acc 53.516 (53.508)	lr 0.00383
Warmup Train [33][2800/3239]	Time 0.487 (0.514)	Data 0.001 (0.011)	Loss 4.1050 (4.0506)	Top-1 acc 30.078 (30.213)	Top-5 acc 53.906 (53.509)	lr 0.00382
Warmup Train [33][2810/3239]	Time 0.567 (0.514)	Data 0.001 (0.011)	Loss 4.2407 (4.0506)	Top-1 acc 25.000 (30.211)	Top-5 acc 48.438 (53.508)	lr 0.00382
Warmup Train [33][2820/3239]	Time 0.419 (0.514)	Data 0.001 (0.011)	Loss 3.8626 (4.0506)	Top-1 acc 34.375 (30.214)	Top-5 acc 57.422 (53.509)	lr 0.00382
Warmup Train [33][2830/3239]	Time 0.475 (0.514)	Data 0.001 (0.011)	Loss 3.8596 (4.0506)	Top-1 acc 35.156 (30.213)	Top-5 acc 58.203 (53.511)	lr 0.00381
Warmup Train [33][2840/3239]	Time 0.512 (0.514)	Data 0.001 (0.011)	Loss 4.1664 (4.0506)	Top-1 acc 30.859 (30.210)	Top-5 acc 52.734 (53.510)	lr 0.00381
Warmup Train [33][2850/3239]	Time 0.619 (0.514)	Data 0.028 (0.011)	Loss 4.0270 (4.0507)	Top-1 acc 31.641 (30.209)	Top-5 acc 53.906 (53.507)	lr 0.00381
Warmup Train [33][2860/3239]	Time 0.548 (0.514)	Data 0.001 (0.011)	Loss 3.9285 (4.0507)	Top-1 acc 33.594 (30.214)	Top-5 acc 57.031 (53.507)	lr 0.00381
Warmup Train [33][2870/3239]	Time 0.510 (0.514)	Data 0.001 (0.011)	Loss 4.1437 (4.0508)	Top-1 acc 29.688 (30.213)	Top-5 acc 55.859 (53.506)	lr 0.00380
Warmup Train [33][2880/3239]	Time 0.430 (0.514)	Data 0.001 (0.011)	Loss 4.1047 (4.0508)	Top-1 acc 28.516 (30.215)	Top-5 acc 50.391 (53.505)	lr 0.00380
Warmup Train [33][2890/3239]	Time 0.628 (0.514)	Data 0.001 (0.011)	Loss 4.1004 (4.0508)	Top-1 acc 30.859 (30.216)	Top-5 acc 54.297 (53.506)	lr 0.00380
Warmup Train [33][2900/3239]	Time 0.520 (0.514)	Data 0.001 (0.011)	Loss 3.9037 (4.0508)	Top-1 acc 34.375 (30.220)	Top-5 acc 55.859 (53.503)	lr 0.00379
Warmup Train [33][2910/3239]	Time 0.595 (0.514)	Data 0.001 (0.011)	Loss 4.1792 (4.0507)	Top-1 acc 25.391 (30.222)	Top-5 acc 50.391 (53.503)	lr 0.00379
Warmup Train [33][2920/3239]	Time 0.454 (0.514)	Data 0.001 (0.011)	Loss 4.1775 (4.0508)	Top-1 acc 25.000 (30.219)	Top-5 acc 51.562 (53.502)	lr 0.00379
Warmup Train [33][2930/3239]	Time 0.509 (0.514)	Data 0.001 (0.011)	Loss 4.2152 (4.0510)	Top-1 acc 26.172 (30.217)	Top-5 acc 51.562 (53.500)	lr 0.00378
Warmup Train [33][2940/3239]	Time 0.520 (0.514)	Data 0.001 (0.011)	Loss 4.1051 (4.0511)	Top-1 acc 28.906 (30.214)	Top-5 acc 51.953 (53.497)	lr 0.00378
Warmup Train [33][2950/3239]	Time 0.500 (0.513)	Data 0.001 (0.011)	Loss 4.0524 (4.0512)	Top-1 acc 33.203 (30.212)	Top-5 acc 53.125 (53.491)	lr 0.00378
Warmup Train [33][2960/3239]	Time 0.459 (0.513)	Data 0.001 (0.011)	Loss 4.1140 (4.0513)	Top-1 acc 29.297 (30.211)	Top-5 acc 53.125 (53.490)	lr 0.00377
Warmup Train [33][2970/3239]	Time 0.631 (0.513)	Data 0.001 (0.011)	Loss 4.0743 (4.0512)	Top-1 acc 29.297 (30.213)	Top-5 acc 51.562 (53.494)	lr 0.00377
Warmup Train [33][2980/3239]	Time 0.439 (0.513)	Data 0.001 (0.011)	Loss 3.7175 (4.0510)	Top-1 acc 35.547 (30.216)	Top-5 acc 58.594 (53.497)	lr 0.00377
Warmup Train [33][2990/3239]	Time 0.360 (0.513)	Data 0.001 (0.011)	Loss 4.0718 (4.0513)	Top-1 acc 26.562 (30.211)	Top-5 acc 51.953 (53.492)	lr 0.00376
Warmup Train [33][3000/3239]	Time 0.557 (0.513)	Data 0.001 (0.011)	Loss 4.0664 (4.0512)	Top-1 acc 31.641 (30.210)	Top-5 acc 52.734 (53.492)	lr 0.00376
Warmup Train [33][3010/3239]	Time 0.528 (0.513)	Data 0.001 (0.011)	Loss 4.0790 (4.0512)	Top-1 acc 28.906 (30.213)	Top-5 acc 53.906 (53.495)	lr 0.00376
Warmup Train [33][3020/3239]	Time 0.624 (0.513)	Data 0.001 (0.011)	Loss 4.0061 (4.0512)	Top-1 acc 30.859 (30.207)	Top-5 acc 54.688 (53.494)	lr 0.00375
Warmup Train [33][3030/3239]	Time 0.355 (0.513)	Data 0.001 (0.011)	Loss 4.1767 (4.0513)	Top-1 acc 25.000 (30.204)	Top-5 acc 50.391 (53.493)	lr 0.00375
Warmup Train [33][3040/3239]	Time 0.522 (0.513)	Data 0.001 (0.011)	Loss 4.0317 (4.0512)	Top-1 acc 32.422 (30.207)	Top-5 acc 52.344 (53.492)	lr 0.00375
Warmup Train [33][3050/3239]	Time 0.620 (0.513)	Data 0.001 (0.011)	Loss 4.0837 (4.0514)	Top-1 acc 30.469 (30.207)	Top-5 acc 49.609 (53.488)	lr 0.00374
Warmup Train [33][3060/3239]	Time 0.570 (0.513)	Data 0.001 (0.011)	Loss 4.0897 (4.0511)	Top-1 acc 29.297 (30.213)	Top-5 acc 52.734 (53.492)	lr 0.00374
Warmup Train [33][3070/3239]	Time 0.473 (0.513)	Data 0.001 (0.011)	Loss 4.0554 (4.0511)	Top-1 acc 29.297 (30.214)	Top-5 acc 53.125 (53.492)	lr 0.00374
Warmup Train [33][3080/3239]	Time 0.542 (0.513)	Data 0.001 (0.011)	Loss 3.8623 (4.0513)	Top-1 acc 32.812 (30.210)	Top-5 acc 57.422 (53.491)	lr 0.00373
Warmup Train [33][3090/3239]	Time 0.569 (0.513)	Data 0.001 (0.011)	Loss 4.1331 (4.0511)	Top-1 acc 30.859 (30.215)	Top-5 acc 49.609 (53.496)	lr 0.00373
Warmup Train [33][3100/3239]	Time 0.390 (0.513)	Data 0.001 (0.011)	Loss 3.9591 (4.0510)	Top-1 acc 30.078 (30.215)	Top-5 acc 54.297 (53.497)	lr 0.00373
Warmup Train [33][3110/3239]	Time 0.526 (0.513)	Data 0.001 (0.011)	Loss 4.0595 (4.0512)	Top-1 acc 34.375 (30.211)	Top-5 acc 55.859 (53.492)	lr 0.00373
Warmup Train [33][3120/3239]	Time 0.530 (0.513)	Data 0.001 (0.011)	Loss 4.1223 (4.0511)	Top-1 acc 30.469 (30.213)	Top-5 acc 51.562 (53.495)	lr 0.00372
Warmup Train [33][3130/3239]	Time 0.445 (0.513)	Data 0.001 (0.011)	Loss 4.0160 (4.0513)	Top-1 acc 31.250 (30.211)	Top-5 acc 53.516 (53.491)	lr 0.00372
Warmup Train [33][3140/3239]	Time 0.521 (0.513)	Data 0.001 (0.011)	Loss 3.9481 (4.0514)	Top-1 acc 29.688 (30.205)	Top-5 acc 58.203 (53.491)	lr 0.00372
Warmup Train [33][3150/3239]	Time 0.543 (0.513)	Data 0.001 (0.011)	Loss 4.0445 (4.0512)	Top-1 acc 31.641 (30.208)	Top-5 acc 51.562 (53.495)	lr 0.00371
Warmup Train [33][3160/3239]	Time 0.473 (0.513)	Data 0.001 (0.011)	Loss 3.8581 (4.0508)	Top-1 acc 34.375 (30.216)	Top-5 acc 60.156 (53.502)	lr 0.00371
Warmup Train [33][3170/3239]	Time 0.544 (0.513)	Data 0.001 (0.011)	Loss 3.9919 (4.0506)	Top-1 acc 33.203 (30.222)	Top-5 acc 54.688 (53.508)	lr 0.00371
Warmup Train [33][3180/3239]	Time 0.648 (0.513)	Data 0.000 (0.011)	Loss 3.9341 (4.0506)	Top-1 acc 33.594 (30.224)	Top-5 acc 56.641 (53.510)	lr 0.00370
Warmup Train [33][3190/3239]	Time 0.585 (0.513)	Data 0.000 (0.011)	Loss 4.1246 (4.0508)	Top-1 acc 28.125 (30.216)	Top-5 acc 52.344 (53.506)	lr 0.00370
Warmup Train [33][3200/3239]	Time 0.660 (0.513)	Data 0.000 (0.010)	Loss 4.0740 (4.0508)	Top-1 acc 28.125 (30.215)	Top-5 acc 50.000 (53.505)	lr 0.00370
Warmup Train [33][3210/3239]	Time 0.467 (0.513)	Data 0.000 (0.010)	Loss 4.1031 (4.0506)	Top-1 acc 28.516 (30.219)	Top-5 acc 51.562 (53.511)	lr 0.00369
Warmup Train [33][3220/3239]	Time 0.526 (0.513)	Data 0.000 (0.010)	Loss 3.9955 (4.0505)	Top-1 acc 30.078 (30.219)	Top-5 acc 52.344 (53.512)	lr 0.00369
Warmup Train [33][3230/3239]	Time 0.330 (0.513)	Data 0.000 (0.010)	Loss 3.9717 (4.0504)	Top-1 acc 30.078 (30.222)	Top-5 acc 56.641 (53.517)	lr 0.00369
Warmup Train [33][3239/3239]	Time 0.351 (0.513)	Data 0.000 (0.010)	Loss 4.5798 (4.0504)	Top-1 acc 19.753 (30.219)	Top-5 acc 39.506 (53.519)	lr 0.00368
==========Warmup Valid [33/40]	loss 2.994	top-1 acc 37.810	top-5 acc 62.588	Train top-1 30.219	top-5 53.519	flops: 442.4M
Warmup Train [34][0/3239]	Time 15.171 (15.171)	Data 12.065 (12.065)	Loss 4.1883 (4.1883)	Top-1 acc 23.047 (23.047)	Top-5 acc 49.219 (49.219)	lr 0.00368
Warmup Train [34][10/3239]	Time 0.516 (1.896)	Data 0.001 (1.099)	Loss 4.2335 (4.0834)	Top-1 acc 26.562 (29.368)	Top-5 acc 48.047 (53.161)	lr 0.00368
Warmup Train [34][20/3239]	Time 0.500 (1.236)	Data 0.001 (0.577)	Loss 4.0182 (4.0764)	Top-1 acc 33.203 (29.706)	Top-5 acc 55.469 (53.032)	lr 0.00368
Warmup Train [34][30/3239]	Time 0.426 (1.006)	Data 0.001 (0.392)	Loss 4.0579 (4.0781)	Top-1 acc 25.000 (29.335)	Top-5 acc 55.469 (52.785)	lr 0.00367
Warmup Train [34][40/3239]	Time 0.328 (0.889)	Data 0.001 (0.300)	Loss 3.9586 (4.0829)	Top-1 acc 31.641 (29.459)	Top-5 acc 57.812 (52.706)	lr 0.00367
Warmup Train [34][50/3239]	Time 0.482 (0.814)	Data 0.001 (0.244)	Loss 4.0405 (4.0814)	Top-1 acc 30.859 (29.496)	Top-5 acc 51.953 (52.903)	lr 0.00367
Warmup Train [34][60/3239]	Time 0.633 (0.760)	Data 0.001 (0.204)	Loss 3.8777 (4.0726)	Top-1 acc 34.766 (29.566)	Top-5 acc 58.594 (53.356)	lr 0.00367
Warmup Train [34][70/3239]	Time 0.624 (0.724)	Data 0.001 (0.175)	Loss 4.0547 (4.0703)	Top-1 acc 28.516 (29.693)	Top-5 acc 52.734 (53.428)	lr 0.00366
Warmup Train [34][80/3239]	Time 0.681 (0.692)	Data 0.001 (0.154)	Loss 3.9439 (4.0692)	Top-1 acc 34.375 (29.818)	Top-5 acc 55.078 (53.472)	lr 0.00366
Warmup Train [34][90/3239]	Time 0.686 (0.671)	Data 0.001 (0.137)	Loss 3.9981 (4.0552)	Top-1 acc 29.688 (30.198)	Top-5 acc 51.172 (53.687)	lr 0.00366
Warmup Train [34][100/3239]	Time 0.618 (0.651)	Data 0.001 (0.124)	Loss 4.3308 (4.0554)	Top-1 acc 25.000 (30.275)	Top-5 acc 50.391 (53.721)	lr 0.00365
Warmup Train [34][110/3239]	Time 0.590 (0.639)	Data 0.001 (0.113)	Loss 4.0347 (4.0538)	Top-1 acc 30.078 (30.251)	Top-5 acc 51.953 (53.635)	lr 0.00365
Warmup Train [34][120/3239]	Time 0.494 (0.624)	Data 0.001 (0.104)	Loss 4.1566 (4.0540)	Top-1 acc 28.516 (30.269)	Top-5 acc 51.953 (53.554)	lr 0.00365
Warmup Train [34][130/3239]	Time 0.391 (0.615)	Data 0.001 (0.097)	Loss 3.6865 (4.0441)	Top-1 acc 35.156 (30.454)	Top-5 acc 58.984 (53.745)	lr 0.00364
Warmup Train [34][140/3239]	Time 0.493 (0.609)	Data 0.001 (0.091)	Loss 3.9853 (4.0445)	Top-1 acc 29.297 (30.449)	Top-5 acc 54.297 (53.662)	lr 0.00364
Warmup Train [34][150/3239]	Time 0.604 (0.604)	Data 0.001 (0.085)	Loss 4.1236 (4.0463)	Top-1 acc 29.297 (30.350)	Top-5 acc 50.781 (53.601)	lr 0.00364
Warmup Train [34][160/3239]	Time 0.529 (0.598)	Data 0.001 (0.080)	Loss 4.0096 (4.0447)	Top-1 acc 30.859 (30.377)	Top-5 acc 54.688 (53.698)	lr 0.00363
Warmup Train [34][170/3239]	Time 0.496 (0.592)	Data 0.001 (0.075)	Loss 4.0025 (4.0461)	Top-1 acc 31.641 (30.345)	Top-5 acc 54.297 (53.682)	lr 0.00363
Warmup Train [34][180/3239]	Time 0.485 (0.587)	Data 0.001 (0.071)	Loss 3.9736 (4.0449)	Top-1 acc 34.375 (30.354)	Top-5 acc 53.906 (53.727)	lr 0.00363
Warmup Train [34][190/3239]	Time 0.476 (0.583)	Data 0.001 (0.068)	Loss 3.8989 (4.0423)	Top-1 acc 33.984 (30.369)	Top-5 acc 57.422 (53.722)	lr 0.00362
Warmup Train [34][200/3239]	Time 0.530 (0.580)	Data 0.001 (0.065)	Loss 3.7426 (4.0421)	Top-1 acc 35.156 (30.350)	Top-5 acc 61.328 (53.759)	lr 0.00362
Warmup Train [34][210/3239]	Time 0.413 (0.576)	Data 0.001 (0.062)	Loss 4.0375 (4.0420)	Top-1 acc 29.297 (30.308)	Top-5 acc 55.078 (53.767)	lr 0.00362
Warmup Train [34][220/3239]	Time 0.584 (0.574)	Data 0.001 (0.060)	Loss 3.9657 (4.0428)	Top-1 acc 33.203 (30.304)	Top-5 acc 56.250 (53.767)	lr 0.00361
Warmup Train [34][230/3239]	Time 0.395 (0.570)	Data 0.001 (0.057)	Loss 3.8995 (4.0424)	Top-1 acc 33.203 (30.330)	Top-5 acc 57.031 (53.796)	lr 0.00361
Warmup Train [34][240/3239]	Time 0.440 (0.569)	Data 0.001 (0.055)	Loss 4.0529 (4.0404)	Top-1 acc 33.203 (30.402)	Top-5 acc 54.297 (53.840)	lr 0.00361
Warmup Train [34][250/3239]	Time 0.622 (0.566)	Data 0.001 (0.053)	Loss 4.1646 (4.0411)	Top-1 acc 29.688 (30.414)	Top-5 acc 53.516 (53.828)	lr 0.00361
Warmup Train [34][260/3239]	Time 0.465 (0.564)	Data 0.001 (0.051)	Loss 3.9844 (4.0410)	Top-1 acc 29.688 (30.401)	Top-5 acc 52.344 (53.806)	lr 0.00360
Warmup Train [34][270/3239]	Time 0.342 (0.562)	Data 0.001 (0.050)	Loss 4.0499 (4.0431)	Top-1 acc 30.469 (30.345)	Top-5 acc 54.297 (53.762)	lr 0.00360
Warmup Train [34][280/3239]	Time 0.563 (0.560)	Data 0.001 (0.048)	Loss 4.1239 (4.0394)	Top-1 acc 28.125 (30.395)	Top-5 acc 49.609 (53.817)	lr 0.00360
Warmup Train [34][290/3239]	Time 0.430 (0.558)	Data 0.001 (0.047)	Loss 4.1356 (4.0387)	Top-1 acc 30.078 (30.414)	Top-5 acc 52.344 (53.858)	lr 0.00359
Warmup Train [34][300/3239]	Time 0.575 (0.557)	Data 0.001 (0.046)	Loss 4.1471 (4.0387)	Top-1 acc 31.641 (30.458)	Top-5 acc 57.812 (53.850)	lr 0.00359
Warmup Train [34][310/3239]	Time 0.472 (0.555)	Data 0.001 (0.044)	Loss 3.9457 (4.0376)	Top-1 acc 32.031 (30.498)	Top-5 acc 57.422 (53.875)	lr 0.00359
Warmup Train [34][320/3239]	Time 0.648 (0.554)	Data 0.001 (0.043)	Loss 4.0448 (4.0373)	Top-1 acc 26.562 (30.485)	Top-5 acc 52.344 (53.869)	lr 0.00358
Warmup Train [34][330/3239]	Time 0.550 (0.553)	Data 0.001 (0.042)	Loss 4.0096 (4.0381)	Top-1 acc 32.031 (30.471)	Top-5 acc 53.906 (53.826)	lr 0.00358
Warmup Train [34][340/3239]	Time 0.752 (0.553)	Data 0.001 (0.041)	Loss 4.0076 (4.0381)	Top-1 acc 31.250 (30.470)	Top-5 acc 55.469 (53.816)	lr 0.00358
Warmup Train [34][350/3239]	Time 0.573 (0.552)	Data 0.001 (0.040)	Loss 3.9339 (4.0372)	Top-1 acc 31.250 (30.450)	Top-5 acc 58.594 (53.809)	lr 0.00357
Warmup Train [34][360/3239]	Time 0.521 (0.549)	Data 0.001 (0.039)	Loss 4.0270 (4.0371)	Top-1 acc 32.031 (30.463)	Top-5 acc 50.391 (53.798)	lr 0.00357
Warmup Train [34][370/3239]	Time 0.519 (0.548)	Data 0.001 (0.038)	Loss 4.0868 (4.0378)	Top-1 acc 31.641 (30.462)	Top-5 acc 54.688 (53.799)	lr 0.00357
Warmup Train [34][380/3239]	Time 0.404 (0.546)	Data 0.001 (0.037)	Loss 3.9581 (4.0375)	Top-1 acc 33.203 (30.469)	Top-5 acc 57.422 (53.805)	lr 0.00356
Warmup Train [34][390/3239]	Time 0.475 (0.544)	Data 0.001 (0.036)	Loss 4.1036 (4.0374)	Top-1 acc 29.688 (30.465)	Top-5 acc 51.562 (53.812)	lr 0.00356
Warmup Train [34][400/3239]	Time 0.507 (0.541)	Data 0.001 (0.036)	Loss 3.9674 (4.0365)	Top-1 acc 29.688 (30.487)	Top-5 acc 54.297 (53.826)	lr 0.00356
Warmup Train [34][410/3239]	Time 0.360 (0.541)	Data 0.001 (0.035)	Loss 4.3084 (4.0376)	Top-1 acc 27.734 (30.463)	Top-5 acc 46.484 (53.789)	lr 0.00356
Warmup Train [34][420/3239]	Time 0.590 (0.540)	Data 0.001 (0.034)	Loss 3.8868 (4.0384)	Top-1 acc 32.812 (30.431)	Top-5 acc 55.469 (53.762)	lr 0.00355
Warmup Train [34][430/3239]	Time 0.373 (0.540)	Data 0.001 (0.033)	Loss 3.9429 (4.0375)	Top-1 acc 33.203 (30.459)	Top-5 acc 58.203 (53.767)	lr 0.00355
Warmup Train [34][440/3239]	Time 0.415 (0.539)	Data 0.001 (0.033)	Loss 3.9105 (4.0373)	Top-1 acc 30.078 (30.459)	Top-5 acc 57.422 (53.782)	lr 0.00355
Warmup Train [34][450/3239]	Time 0.539 (0.539)	Data 0.001 (0.032)	Loss 4.0003 (4.0386)	Top-1 acc 31.250 (30.427)	Top-5 acc 54.688 (53.746)	lr 0.00354
Warmup Train [34][460/3239]	Time 0.671 (0.538)	Data 0.001 (0.032)	Loss 4.0672 (4.0371)	Top-1 acc 31.250 (30.435)	Top-5 acc 54.688 (53.788)	lr 0.00354
Warmup Train [34][470/3239]	Time 0.299 (0.537)	Data 0.001 (0.031)	Loss 4.0270 (4.0370)	Top-1 acc 29.297 (30.431)	Top-5 acc 51.953 (53.789)	lr 0.00354
Warmup Train [34][480/3239]	Time 0.329 (0.537)	Data 0.002 (0.031)	Loss 4.1387 (4.0367)	Top-1 acc 28.906 (30.417)	Top-5 acc 52.344 (53.793)	lr 0.00353
Warmup Train [34][490/3239]	Time 0.458 (0.537)	Data 0.001 (0.030)	Loss 4.0553 (4.0364)	Top-1 acc 33.203 (30.466)	Top-5 acc 57.422 (53.800)	lr 0.00353
Warmup Train [34][500/3239]	Time 0.416 (0.536)	Data 0.001 (0.030)	Loss 4.0627 (4.0372)	Top-1 acc 30.078 (30.456)	Top-5 acc 51.953 (53.777)	lr 0.00353
Warmup Train [34][510/3239]	Time 0.359 (0.536)	Data 0.001 (0.030)	Loss 3.9398 (4.0367)	Top-1 acc 34.375 (30.468)	Top-5 acc 55.859 (53.788)	lr 0.00352
Warmup Train [34][520/3239]	Time 0.665 (0.535)	Data 0.001 (0.029)	Loss 3.9811 (4.0370)	Top-1 acc 30.469 (30.464)	Top-5 acc 57.422 (53.802)	lr 0.00352
Warmup Train [34][530/3239]	Time 0.354 (0.535)	Data 0.002 (0.029)	Loss 4.1435 (4.0369)	Top-1 acc 26.953 (30.472)	Top-5 acc 51.172 (53.809)	lr 0.00352
Warmup Train [34][540/3239]	Time 0.501 (0.535)	Data 0.001 (0.029)	Loss 4.1366 (4.0388)	Top-1 acc 26.562 (30.452)	Top-5 acc 47.656 (53.746)	lr 0.00351
Warmup Train [34][550/3239]	Time 0.428 (0.534)	Data 0.001 (0.028)	Loss 4.2731 (4.0409)	Top-1 acc 24.609 (30.426)	Top-5 acc 50.000 (53.712)	lr 0.00351
Warmup Train [34][560/3239]	Time 0.606 (0.534)	Data 0.001 (0.028)	Loss 4.2595 (4.0411)	Top-1 acc 24.609 (30.414)	Top-5 acc 50.781 (53.709)	lr 0.00351
Warmup Train [34][570/3239]	Time 0.375 (0.533)	Data 0.001 (0.027)	Loss 4.1351 (4.0409)	Top-1 acc 28.125 (30.409)	Top-5 acc 51.562 (53.709)	lr 0.00351
Warmup Train [34][580/3239]	Time 0.576 (0.533)	Data 0.001 (0.027)	Loss 4.0359 (4.0399)	Top-1 acc 27.344 (30.422)	Top-5 acc 53.125 (53.722)	lr 0.00350
Warmup Train [34][590/3239]	Time 0.486 (0.532)	Data 0.001 (0.027)	Loss 3.9215 (4.0400)	Top-1 acc 32.031 (30.413)	Top-5 acc 56.641 (53.710)	lr 0.00350
Warmup Train [34][600/3239]	Time 0.428 (0.532)	Data 0.001 (0.026)	Loss 4.1142 (4.0401)	Top-1 acc 28.125 (30.401)	Top-5 acc 51.953 (53.699)	lr 0.00350
Warmup Train [34][610/3239]	Time 0.607 (0.532)	Data 0.001 (0.026)	Loss 4.1129 (4.0391)	Top-1 acc 30.859 (30.433)	Top-5 acc 52.734 (53.711)	lr 0.00349
Warmup Train [34][620/3239]	Time 0.570 (0.532)	Data 0.001 (0.025)	Loss 4.0030 (4.0382)	Top-1 acc 31.250 (30.447)	Top-5 acc 53.516 (53.729)	lr 0.00349
Warmup Train [34][630/3239]	Time 0.570 (0.532)	Data 0.001 (0.025)	Loss 4.0676 (4.0388)	Top-1 acc 33.203 (30.429)	Top-5 acc 53.125 (53.706)	lr 0.00349
Warmup Train [34][640/3239]	Time 0.413 (0.531)	Data 0.001 (0.025)	Loss 4.2046 (4.0389)	Top-1 acc 25.391 (30.430)	Top-5 acc 50.000 (53.716)	lr 0.00348
Warmup Train [34][650/3239]	Time 0.335 (0.531)	Data 0.002 (0.025)	Loss 3.8899 (4.0391)	Top-1 acc 31.641 (30.427)	Top-5 acc 57.031 (53.716)	lr 0.00348
Warmup Train [34][660/3239]	Time 0.430 (0.530)	Data 0.001 (0.024)	Loss 4.0051 (4.0387)	Top-1 acc 29.297 (30.429)	Top-5 acc 55.078 (53.736)	lr 0.00348
Warmup Train [34][670/3239]	Time 0.632 (0.530)	Data 0.001 (0.024)	Loss 4.3357 (4.0391)	Top-1 acc 26.562 (30.440)	Top-5 acc 47.266 (53.729)	lr 0.00347
Warmup Train [34][680/3239]	Time 0.513 (0.529)	Data 0.001 (0.024)	Loss 3.8591 (4.0387)	Top-1 acc 34.766 (30.448)	Top-5 acc 57.031 (53.734)	lr 0.00347
Warmup Train [34][690/3239]	Time 0.469 (0.529)	Data 0.001 (0.024)	Loss 4.0276 (4.0385)	Top-1 acc 32.422 (30.457)	Top-5 acc 55.469 (53.740)	lr 0.00347
Warmup Train [34][700/3239]	Time 0.447 (0.528)	Data 0.001 (0.023)	Loss 4.0623 (4.0386)	Top-1 acc 32.422 (30.470)	Top-5 acc 53.906 (53.746)	lr 0.00347
Warmup Train [34][710/3239]	Time 0.478 (0.528)	Data 0.001 (0.023)	Loss 4.1439 (4.0398)	Top-1 acc 28.516 (30.474)	Top-5 acc 49.219 (53.714)	lr 0.00346
Warmup Train [34][720/3239]	Time 0.571 (0.528)	Data 0.001 (0.023)	Loss 3.9180 (4.0401)	Top-1 acc 33.594 (30.476)	Top-5 acc 53.906 (53.701)	lr 0.00346
Warmup Train [34][730/3239]	Time 0.606 (0.528)	Data 0.001 (0.023)	Loss 4.0567 (4.0396)	Top-1 acc 31.641 (30.477)	Top-5 acc 54.297 (53.704)	lr 0.00346
Warmup Train [34][740/3239]	Time 0.485 (0.528)	Data 0.001 (0.022)	Loss 4.2497 (4.0412)	Top-1 acc 28.516 (30.454)	Top-5 acc 45.312 (53.670)	lr 0.00345
Warmup Train [34][750/3239]	Time 0.354 (0.528)	Data 0.001 (0.022)	Loss 4.0555 (4.0411)	Top-1 acc 29.688 (30.453)	Top-5 acc 53.906 (53.664)	lr 0.00345
Warmup Train [34][760/3239]	Time 0.518 (0.528)	Data 0.001 (0.022)	Loss 4.0383 (4.0419)	Top-1 acc 28.906 (30.450)	Top-5 acc 53.516 (53.643)	lr 0.00345
Warmup Train [34][770/3239]	Time 0.393 (0.527)	Data 0.001 (0.022)	Loss 4.1370 (4.0422)	Top-1 acc 30.859 (30.451)	Top-5 acc 53.906 (53.644)	lr 0.00344
Warmup Train [34][780/3239]	Time 0.660 (0.527)	Data 0.001 (0.022)	Loss 4.0636 (4.0423)	Top-1 acc 30.859 (30.453)	Top-5 acc 53.125 (53.645)	lr 0.00344
Warmup Train [34][790/3239]	Time 0.540 (0.527)	Data 0.001 (0.021)	Loss 4.2501 (4.0431)	Top-1 acc 27.734 (30.438)	Top-5 acc 49.609 (53.618)	lr 0.00344
Warmup Train [34][800/3239]	Time 0.439 (0.527)	Data 0.001 (0.021)	Loss 4.1883 (4.0428)	Top-1 acc 24.219 (30.442)	Top-5 acc 50.781 (53.615)	lr 0.00343
Warmup Train [34][810/3239]	Time 0.476 (0.527)	Data 0.001 (0.021)	Loss 4.1013 (4.0427)	Top-1 acc 29.688 (30.432)	Top-5 acc 49.609 (53.617)	lr 0.00343
Warmup Train [34][820/3239]	Time 0.482 (0.526)	Data 0.001 (0.021)	Loss 4.0629 (4.0429)	Top-1 acc 32.812 (30.426)	Top-5 acc 52.734 (53.622)	lr 0.00343
Warmup Train [34][830/3239]	Time 0.486 (0.526)	Data 0.001 (0.020)	Loss 4.0832 (4.0420)	Top-1 acc 29.297 (30.440)	Top-5 acc 52.734 (53.640)	lr 0.00343
Warmup Train [34][840/3239]	Time 0.481 (0.526)	Data 0.001 (0.020)	Loss 3.9239 (4.0420)	Top-1 acc 33.203 (30.439)	Top-5 acc 56.641 (53.633)	lr 0.00342
Warmup Train [34][850/3239]	Time 0.602 (0.525)	Data 0.001 (0.020)	Loss 3.9869 (4.0415)	Top-1 acc 32.812 (30.462)	Top-5 acc 55.078 (53.645)	lr 0.00342
Warmup Train [34][860/3239]	Time 0.510 (0.525)	Data 0.001 (0.020)	Loss 4.1319 (4.0415)	Top-1 acc 28.125 (30.460)	Top-5 acc 52.344 (53.642)	lr 0.00342
Warmup Train [34][870/3239]	Time 0.485 (0.525)	Data 0.001 (0.020)	Loss 4.1877 (4.0414)	Top-1 acc 26.953 (30.459)	Top-5 acc 51.172 (53.652)	lr 0.00341
Warmup Train [34][880/3239]	Time 0.612 (0.525)	Data 0.001 (0.020)	Loss 3.9939 (4.0411)	Top-1 acc 30.859 (30.467)	Top-5 acc 53.125 (53.660)	lr 0.00341
Warmup Train [34][890/3239]	Time 0.535 (0.526)	Data 0.001 (0.019)	Loss 4.0799 (4.0412)	Top-1 acc 27.734 (30.467)	Top-5 acc 53.516 (53.659)	lr 0.00341
Warmup Train [34][900/3239]	Time 0.544 (0.525)	Data 0.001 (0.019)	Loss 3.9661 (4.0410)	Top-1 acc 30.469 (30.468)	Top-5 acc 54.297 (53.670)	lr 0.00340
Warmup Train [34][910/3239]	Time 0.498 (0.525)	Data 0.001 (0.019)	Loss 4.0092 (4.0414)	Top-1 acc 30.859 (30.469)	Top-5 acc 54.688 (53.667)	lr 0.00340
Warmup Train [34][920/3239]	Time 0.477 (0.525)	Data 0.001 (0.019)	Loss 3.9904 (4.0412)	Top-1 acc 26.953 (30.475)	Top-5 acc 53.906 (53.681)	lr 0.00340
Warmup Train [34][930/3239]	Time 0.447 (0.525)	Data 0.001 (0.019)	Loss 4.0546 (4.0410)	Top-1 acc 29.688 (30.474)	Top-5 acc 53.516 (53.683)	lr 0.00339
Warmup Train [34][940/3239]	Time 0.510 (0.524)	Data 0.001 (0.019)	Loss 3.8422 (4.0407)	Top-1 acc 31.641 (30.476)	Top-5 acc 58.594 (53.686)	lr 0.00339
Warmup Train [34][950/3239]	Time 0.388 (0.524)	Data 0.001 (0.018)	Loss 4.1501 (4.0413)	Top-1 acc 27.344 (30.461)	Top-5 acc 52.734 (53.673)	lr 0.00339
Warmup Train [34][960/3239]	Time 0.578 (0.523)	Data 0.001 (0.018)	Loss 4.1056 (4.0411)	Top-1 acc 30.859 (30.469)	Top-5 acc 53.516 (53.684)	lr 0.00339
Warmup Train [34][970/3239]	Time 0.601 (0.523)	Data 0.001 (0.018)	Loss 4.1709 (4.0410)	Top-1 acc 26.172 (30.472)	Top-5 acc 52.344 (53.685)	lr 0.00338
Warmup Train [34][980/3239]	Time 0.750 (0.523)	Data 0.001 (0.018)	Loss 3.9550 (4.0411)	Top-1 acc 31.250 (30.474)	Top-5 acc 52.734 (53.673)	lr 0.00338
Warmup Train [34][990/3239]	Time 0.552 (0.523)	Data 0.001 (0.018)	Loss 3.9510 (4.0412)	Top-1 acc 26.953 (30.460)	Top-5 acc 55.469 (53.667)	lr 0.00338
Warmup Train [34][1000/3239]	Time 0.413 (0.522)	Data 0.001 (0.018)	Loss 3.9046 (4.0401)	Top-1 acc 33.984 (30.495)	Top-5 acc 55.859 (53.692)	lr 0.00337
Warmup Train [34][1010/3239]	Time 0.460 (0.523)	Data 0.001 (0.018)	Loss 4.1258 (4.0402)	Top-1 acc 29.297 (30.493)	Top-5 acc 51.172 (53.692)	lr 0.00337
Warmup Train [34][1020/3239]	Time 0.515 (0.522)	Data 0.001 (0.018)	Loss 4.0740 (4.0400)	Top-1 acc 28.906 (30.497)	Top-5 acc 56.641 (53.703)	lr 0.00337
Warmup Train [34][1030/3239]	Time 0.486 (0.522)	Data 0.001 (0.017)	Loss 4.1229 (4.0402)	Top-1 acc 28.516 (30.492)	Top-5 acc 51.953 (53.696)	lr 0.00336
Warmup Train [34][1040/3239]	Time 0.440 (0.522)	Data 0.001 (0.017)	Loss 3.8966 (4.0394)	Top-1 acc 32.812 (30.500)	Top-5 acc 58.984 (53.711)	lr 0.00336
Warmup Train [34][1050/3239]	Time 0.543 (0.522)	Data 0.001 (0.017)	Loss 3.9985 (4.0390)	Top-1 acc 30.469 (30.511)	Top-5 acc 53.125 (53.728)	lr 0.00336
Warmup Train [34][1060/3239]	Time 0.332 (0.522)	Data 0.001 (0.017)	Loss 4.0029 (4.0386)	Top-1 acc 31.641 (30.517)	Top-5 acc 55.078 (53.741)	lr 0.00336
Warmup Train [34][1070/3239]	Time 0.506 (0.522)	Data 0.001 (0.017)	Loss 3.8975 (4.0380)	Top-1 acc 34.766 (30.525)	Top-5 acc 58.984 (53.754)	lr 0.00335
Warmup Train [34][1080/3239]	Time 0.515 (0.522)	Data 0.001 (0.017)	Loss 3.9817 (4.0377)	Top-1 acc 28.906 (30.527)	Top-5 acc 57.812 (53.769)	lr 0.00335
Warmup Train [34][1090/3239]	Time 0.401 (0.522)	Data 0.001 (0.017)	Loss 4.1858 (4.0378)	Top-1 acc 25.781 (30.522)	Top-5 acc 53.516 (53.772)	lr 0.00335
Warmup Train [34][1100/3239]	Time 0.488 (0.521)	Data 0.001 (0.017)	Loss 4.0477 (4.0380)	Top-1 acc 30.078 (30.513)	Top-5 acc 51.172 (53.757)	lr 0.00334
Warmup Train [34][1110/3239]	Time 0.623 (0.522)	Data 0.001 (0.017)	Loss 3.9332 (4.0378)	Top-1 acc 31.641 (30.513)	Top-5 acc 54.688 (53.758)	lr 0.00334
Warmup Train [34][1120/3239]	Time 0.531 (0.522)	Data 0.001 (0.017)	Loss 4.0403 (4.0378)	Top-1 acc 30.859 (30.509)	Top-5 acc 51.562 (53.761)	lr 0.00334
Warmup Train [34][1130/3239]	Time 0.468 (0.522)	Data 0.001 (0.017)	Loss 3.9900 (4.0378)	Top-1 acc 34.375 (30.520)	Top-5 acc 56.641 (53.760)	lr 0.00333
Warmup Train [34][1140/3239]	Time 0.422 (0.521)	Data 0.001 (0.016)	Loss 3.9246 (4.0375)	Top-1 acc 32.812 (30.528)	Top-5 acc 58.203 (53.768)	lr 0.00333
Warmup Train [34][1150/3239]	Time 0.387 (0.521)	Data 0.001 (0.016)	Loss 4.0414 (4.0378)	Top-1 acc 29.688 (30.526)	Top-5 acc 54.297 (53.768)	lr 0.00333
Warmup Train [34][1160/3239]	Time 0.561 (0.521)	Data 0.001 (0.016)	Loss 4.2115 (4.0378)	Top-1 acc 29.297 (30.523)	Top-5 acc 48.828 (53.766)	lr 0.00333
Warmup Train [34][1170/3239]	Time 0.565 (0.521)	Data 0.001 (0.016)	Loss 4.0226 (4.0375)	Top-1 acc 32.812 (30.536)	Top-5 acc 51.562 (53.777)	lr 0.00332
Warmup Train [34][1180/3239]	Time 0.513 (0.522)	Data 0.001 (0.016)	Loss 3.9243 (4.0375)	Top-1 acc 35.547 (30.545)	Top-5 acc 58.594 (53.774)	lr 0.00332
Warmup Train [34][1190/3239]	Time 0.775 (0.521)	Data 0.002 (0.016)	Loss 3.9833 (4.0377)	Top-1 acc 29.688 (30.543)	Top-5 acc 60.547 (53.777)	lr 0.00332
Warmup Train [34][1200/3239]	Time 0.644 (0.521)	Data 0.001 (0.016)	Loss 3.9945 (4.0375)	Top-1 acc 29.297 (30.557)	Top-5 acc 53.906 (53.780)	lr 0.00331
Warmup Train [34][1210/3239]	Time 0.557 (0.521)	Data 0.001 (0.016)	Loss 3.9380 (4.0372)	Top-1 acc 30.469 (30.554)	Top-5 acc 59.375 (53.791)	lr 0.00331
Warmup Train [34][1220/3239]	Time 0.577 (0.521)	Data 0.001 (0.016)	Loss 4.0599 (4.0367)	Top-1 acc 28.906 (30.558)	Top-5 acc 53.906 (53.804)	lr 0.00331
Warmup Train [34][1230/3239]	Time 0.387 (0.520)	Data 0.001 (0.016)	Loss 3.9766 (4.0369)	Top-1 acc 31.641 (30.550)	Top-5 acc 55.078 (53.799)	lr 0.00330
Warmup Train [34][1240/3239]	Time 0.518 (0.520)	Data 0.001 (0.016)	Loss 4.2491 (4.0373)	Top-1 acc 25.000 (30.546)	Top-5 acc 49.609 (53.795)	lr 0.00330
Warmup Train [34][1250/3239]	Time 0.595 (0.520)	Data 0.001 (0.015)	Loss 3.8604 (4.0370)	Top-1 acc 30.859 (30.553)	Top-5 acc 59.766 (53.803)	lr 0.00330
Warmup Train [34][1260/3239]	Time 0.570 (0.520)	Data 0.001 (0.015)	Loss 3.8586 (4.0376)	Top-1 acc 34.375 (30.544)	Top-5 acc 59.766 (53.800)	lr 0.00330
Warmup Train [34][1270/3239]	Time 0.514 (0.520)	Data 0.001 (0.015)	Loss 4.0064 (4.0375)	Top-1 acc 31.641 (30.542)	Top-5 acc 54.688 (53.802)	lr 0.00329
Warmup Train [34][1280/3239]	Time 0.471 (0.520)	Data 0.001 (0.015)	Loss 4.1864 (4.0370)	Top-1 acc 28.125 (30.545)	Top-5 acc 50.000 (53.810)	lr 0.00329
Warmup Train [34][1290/3239]	Time 0.325 (0.519)	Data 0.001 (0.015)	Loss 4.1856 (4.0371)	Top-1 acc 25.000 (30.540)	Top-5 acc 48.438 (53.799)	lr 0.00329
Warmup Train [34][1300/3239]	Time 0.589 (0.520)	Data 0.001 (0.015)	Loss 4.1193 (4.0374)	Top-1 acc 26.953 (30.532)	Top-5 acc 51.172 (53.790)	lr 0.00328
Warmup Train [34][1310/3239]	Time 0.615 (0.520)	Data 0.001 (0.015)	Loss 4.2267 (4.0372)	Top-1 acc 24.609 (30.532)	Top-5 acc 52.734 (53.796)	lr 0.00328
Warmup Train [34][1320/3239]	Time 0.498 (0.519)	Data 0.001 (0.015)	Loss 3.7741 (4.0370)	Top-1 acc 38.672 (30.539)	Top-5 acc 62.109 (53.806)	lr 0.00328
Warmup Train [34][1330/3239]	Time 0.505 (0.519)	Data 0.001 (0.015)	Loss 4.0557 (4.0369)	Top-1 acc 27.734 (30.532)	Top-5 acc 53.906 (53.812)	lr 0.00327
Warmup Train [34][1340/3239]	Time 0.595 (0.519)	Data 0.001 (0.015)	Loss 3.9542 (4.0370)	Top-1 acc 33.594 (30.528)	Top-5 acc 56.250 (53.809)	lr 0.00327
Warmup Train [34][1350/3239]	Time 0.509 (0.519)	Data 0.001 (0.015)	Loss 3.9078 (4.0368)	Top-1 acc 31.250 (30.534)	Top-5 acc 58.203 (53.814)	lr 0.00327
Warmup Train [34][1360/3239]	Time 0.579 (0.519)	Data 0.001 (0.015)	Loss 3.8422 (4.0364)	Top-1 acc 34.766 (30.543)	Top-5 acc 57.031 (53.828)	lr 0.00327
Warmup Train [34][1370/3239]	Time 0.459 (0.519)	Data 0.001 (0.014)	Loss 3.9653 (4.0366)	Top-1 acc 28.125 (30.532)	Top-5 acc 53.906 (53.822)	lr 0.00326
Warmup Train [34][1380/3239]	Time 0.386 (0.519)	Data 0.001 (0.014)	Loss 4.0547 (4.0364)	Top-1 acc 31.250 (30.537)	Top-5 acc 54.688 (53.832)	lr 0.00326
Warmup Train [34][1390/3239]	Time 0.653 (0.519)	Data 0.001 (0.014)	Loss 4.0555 (4.0366)	Top-1 acc 31.250 (30.537)	Top-5 acc 55.469 (53.830)	lr 0.00326
Warmup Train [34][1400/3239]	Time 0.681 (0.519)	Data 0.001 (0.014)	Loss 4.0659 (4.0369)	Top-1 acc 31.641 (30.540)	Top-5 acc 53.125 (53.823)	lr 0.00325
Warmup Train [34][1410/3239]	Time 0.628 (0.519)	Data 0.001 (0.014)	Loss 4.0347 (4.0368)	Top-1 acc 27.734 (30.547)	Top-5 acc 55.078 (53.829)	lr 0.00325
Warmup Train [34][1420/3239]	Time 0.555 (0.519)	Data 0.001 (0.014)	Loss 3.9251 (4.0365)	Top-1 acc 34.375 (30.549)	Top-5 acc 57.812 (53.831)	lr 0.00325
Warmup Train [34][1430/3239]	Time 0.523 (0.519)	Data 0.001 (0.014)	Loss 3.8069 (4.0366)	Top-1 acc 39.844 (30.540)	Top-5 acc 58.984 (53.825)	lr 0.00324
Warmup Train [34][1440/3239]	Time 0.489 (0.519)	Data 0.001 (0.014)	Loss 4.0314 (4.0367)	Top-1 acc 30.078 (30.532)	Top-5 acc 52.734 (53.823)	lr 0.00324
Warmup Train [34][1450/3239]	Time 0.637 (0.519)	Data 0.001 (0.014)	Loss 3.7146 (4.0366)	Top-1 acc 37.109 (30.543)	Top-5 acc 62.109 (53.819)	lr 0.00324
Warmup Train [34][1460/3239]	Time 0.381 (0.519)	Data 0.001 (0.014)	Loss 4.0717 (4.0365)	Top-1 acc 32.422 (30.554)	Top-5 acc 54.297 (53.826)	lr 0.00324
Warmup Train [34][1470/3239]	Time 0.543 (0.518)	Data 0.001 (0.014)	Loss 4.1549 (4.0364)	Top-1 acc 27.344 (30.553)	Top-5 acc 48.438 (53.829)	lr 0.00323
Warmup Train [34][1480/3239]	Time 0.480 (0.518)	Data 0.001 (0.014)	Loss 4.1907 (4.0361)	Top-1 acc 28.906 (30.564)	Top-5 acc 53.516 (53.839)	lr 0.00323
Warmup Train [34][1490/3239]	Time 0.512 (0.518)	Data 0.001 (0.014)	Loss 3.9916 (4.0361)	Top-1 acc 30.078 (30.564)	Top-5 acc 53.516 (53.840)	lr 0.00323
Warmup Train [34][1500/3239]	Time 0.406 (0.518)	Data 0.001 (0.014)	Loss 4.0848 (4.0364)	Top-1 acc 31.250 (30.556)	Top-5 acc 49.609 (53.835)	lr 0.00322
Warmup Train [34][1510/3239]	Time 0.624 (0.518)	Data 0.001 (0.014)	Loss 3.9754 (4.0364)	Top-1 acc 32.031 (30.543)	Top-5 acc 55.469 (53.840)	lr 0.00322
Warmup Train [34][1520/3239]	Time 0.520 (0.517)	Data 0.001 (0.013)	Loss 4.1164 (4.0361)	Top-1 acc 29.297 (30.549)	Top-5 acc 51.172 (53.845)	lr 0.00322
Warmup Train [34][1530/3239]	Time 0.490 (0.517)	Data 0.001 (0.013)	Loss 4.1262 (4.0363)	Top-1 acc 29.297 (30.549)	Top-5 acc 55.078 (53.844)	lr 0.00321
Warmup Train [34][1540/3239]	Time 0.513 (0.517)	Data 0.001 (0.013)	Loss 3.9630 (4.0366)	Top-1 acc 33.984 (30.537)	Top-5 acc 57.031 (53.839)	lr 0.00321
Warmup Train [34][1550/3239]	Time 0.514 (0.517)	Data 0.001 (0.013)	Loss 4.0166 (4.0364)	Top-1 acc 31.641 (30.547)	Top-5 acc 54.297 (53.841)	lr 0.00321
Warmup Train [34][1560/3239]	Time 0.467 (0.517)	Data 0.001 (0.013)	Loss 4.0895 (4.0363)	Top-1 acc 27.344 (30.541)	Top-5 acc 53.125 (53.844)	lr 0.00321
Warmup Train [34][1570/3239]	Time 0.425 (0.517)	Data 0.001 (0.013)	Loss 4.2038 (4.0363)	Top-1 acc 25.781 (30.543)	Top-5 acc 50.000 (53.850)	lr 0.00320
Warmup Train [34][1580/3239]	Time 0.596 (0.517)	Data 0.001 (0.013)	Loss 3.9178 (4.0359)	Top-1 acc 30.078 (30.545)	Top-5 acc 55.469 (53.857)	lr 0.00320
Warmup Train [34][1590/3239]	Time 0.682 (0.517)	Data 0.001 (0.013)	Loss 4.0893 (4.0356)	Top-1 acc 28.516 (30.544)	Top-5 acc 51.562 (53.864)	lr 0.00320
Warmup Train [34][1600/3239]	Time 0.485 (0.517)	Data 0.001 (0.013)	Loss 3.7678 (4.0357)	Top-1 acc 37.109 (30.544)	Top-5 acc 60.156 (53.861)	lr 0.00319
Warmup Train [34][1610/3239]	Time 0.735 (0.517)	Data 0.001 (0.013)	Loss 4.1763 (4.0360)	Top-1 acc 27.344 (30.536)	Top-5 acc 50.781 (53.861)	lr 0.00319
Warmup Train [34][1620/3239]	Time 0.440 (0.517)	Data 0.001 (0.013)	Loss 3.9376 (4.0361)	Top-1 acc 29.688 (30.538)	Top-5 acc 57.812 (53.860)	lr 0.00319
Warmup Train [34][1630/3239]	Time 0.555 (0.517)	Data 0.001 (0.013)	Loss 4.1965 (4.0362)	Top-1 acc 28.125 (30.528)	Top-5 acc 50.781 (53.856)	lr 0.00318
Warmup Train [34][1640/3239]	Time 0.365 (0.517)	Data 0.001 (0.013)	Loss 4.1015 (4.0360)	Top-1 acc 26.953 (30.526)	Top-5 acc 50.391 (53.860)	lr 0.00318
Warmup Train [34][1650/3239]	Time 0.542 (0.517)	Data 0.001 (0.013)	Loss 4.2089 (4.0361)	Top-1 acc 30.859 (30.532)	Top-5 acc 51.953 (53.861)	lr 0.00318
Warmup Train [34][1660/3239]	Time 0.329 (0.517)	Data 0.001 (0.013)	Loss 4.0394 (4.0359)	Top-1 acc 33.984 (30.543)	Top-5 acc 51.562 (53.868)	lr 0.00318
Warmup Train [34][1670/3239]	Time 0.493 (0.517)	Data 0.001 (0.013)	Loss 3.9208 (4.0353)	Top-1 acc 33.594 (30.562)	Top-5 acc 53.906 (53.875)	lr 0.00317
Warmup Train [34][1680/3239]	Time 0.536 (0.517)	Data 0.001 (0.013)	Loss 4.0258 (4.0357)	Top-1 acc 30.469 (30.552)	Top-5 acc 53.516 (53.868)	lr 0.00317
Warmup Train [34][1690/3239]	Time 0.425 (0.517)	Data 0.001 (0.013)	Loss 4.0666 (4.0357)	Top-1 acc 29.297 (30.548)	Top-5 acc 55.469 (53.870)	lr 0.00317
Warmup Train [34][1700/3239]	Time 0.509 (0.517)	Data 0.001 (0.013)	Loss 4.3208 (4.0363)	Top-1 acc 22.656 (30.537)	Top-5 acc 46.094 (53.855)	lr 0.00316
Warmup Train [34][1710/3239]	Time 0.607 (0.517)	Data 0.001 (0.013)	Loss 3.9247 (4.0361)	Top-1 acc 30.078 (30.541)	Top-5 acc 57.422 (53.859)	lr 0.00316
Warmup Train [34][1720/3239]	Time 0.552 (0.517)	Data 0.001 (0.013)	Loss 4.0300 (4.0362)	Top-1 acc 30.078 (30.536)	Top-5 acc 50.781 (53.853)	lr 0.00316
Warmup Train [34][1730/3239]	Time 0.503 (0.517)	Data 0.001 (0.013)	Loss 4.2433 (4.0364)	Top-1 acc 24.219 (30.534)	Top-5 acc 50.000 (53.847)	lr 0.00316
Warmup Train [34][1740/3239]	Time 0.675 (0.517)	Data 0.001 (0.013)	Loss 4.1075 (4.0365)	Top-1 acc 29.688 (30.536)	Top-5 acc 51.562 (53.845)	lr 0.00315
Warmup Train [34][1750/3239]	Time 0.598 (0.517)	Data 0.001 (0.012)	Loss 3.9276 (4.0366)	Top-1 acc 32.422 (30.531)	Top-5 acc 56.641 (53.844)	lr 0.00315
Warmup Train [34][1760/3239]	Time 0.505 (0.517)	Data 0.001 (0.012)	Loss 4.0386 (4.0368)	Top-1 acc 29.688 (30.520)	Top-5 acc 53.516 (53.834)	lr 0.00315
Warmup Train [34][1770/3239]	Time 0.335 (0.517)	Data 0.001 (0.012)	Loss 3.9569 (4.0366)	Top-1 acc 29.297 (30.523)	Top-5 acc 57.812 (53.839)	lr 0.00314
Warmup Train [34][1780/3239]	Time 0.528 (0.517)	Data 0.002 (0.012)	Loss 4.0826 (4.0366)	Top-1 acc 28.125 (30.518)	Top-5 acc 52.734 (53.837)	lr 0.00314
Warmup Train [34][1790/3239]	Time 0.216 (0.516)	Data 0.001 (0.012)	Loss 4.1430 (4.0366)	Top-1 acc 28.125 (30.520)	Top-5 acc 51.953 (53.836)	lr 0.00314
Warmup Train [34][1800/3239]	Time 0.726 (0.516)	Data 0.001 (0.012)	Loss 3.9100 (4.0367)	Top-1 acc 27.344 (30.517)	Top-5 acc 53.906 (53.834)	lr 0.00313
Warmup Train [34][1810/3239]	Time 0.539 (0.516)	Data 0.001 (0.012)	Loss 4.2187 (4.0369)	Top-1 acc 26.562 (30.516)	Top-5 acc 51.172 (53.835)	lr 0.00313
Warmup Train [34][1820/3239]	Time 0.388 (0.516)	Data 0.001 (0.012)	Loss 3.9879 (4.0366)	Top-1 acc 31.250 (30.522)	Top-5 acc 56.250 (53.843)	lr 0.00313
Warmup Train [34][1830/3239]	Time 0.385 (0.516)	Data 0.001 (0.012)	Loss 3.8921 (4.0365)	Top-1 acc 33.984 (30.523)	Top-5 acc 56.250 (53.847)	lr 0.00313
Warmup Train [34][1840/3239]	Time 0.529 (0.516)	Data 0.001 (0.012)	Loss 4.1070 (4.0365)	Top-1 acc 27.734 (30.523)	Top-5 acc 52.344 (53.849)	lr 0.00312
Warmup Train [34][1850/3239]	Time 0.340 (0.516)	Data 0.001 (0.012)	Loss 4.1905 (4.0368)	Top-1 acc 26.172 (30.518)	Top-5 acc 50.391 (53.842)	lr 0.00312
Warmup Train [34][1860/3239]	Time 0.565 (0.516)	Data 0.001 (0.012)	Loss 4.0190 (4.0369)	Top-1 acc 28.516 (30.514)	Top-5 acc 55.469 (53.840)	lr 0.00312
Warmup Train [34][1870/3239]	Time 0.540 (0.516)	Data 0.001 (0.012)	Loss 3.8534 (4.0367)	Top-1 acc 32.812 (30.515)	Top-5 acc 60.938 (53.850)	lr 0.00311
Warmup Train [34][1880/3239]	Time 0.564 (0.516)	Data 0.001 (0.012)	Loss 3.9747 (4.0366)	Top-1 acc 30.469 (30.513)	Top-5 acc 56.250 (53.849)	lr 0.00311
Warmup Train [34][1890/3239]	Time 0.464 (0.516)	Data 0.001 (0.012)	Loss 4.2207 (4.0369)	Top-1 acc 24.219 (30.509)	Top-5 acc 50.000 (53.844)	lr 0.00311
Warmup Train [34][1900/3239]	Time 0.542 (0.516)	Data 0.001 (0.012)	Loss 4.1310 (4.0369)	Top-1 acc 28.516 (30.511)	Top-5 acc 51.172 (53.843)	lr 0.00311
Warmup Train [34][1910/3239]	Time 0.339 (0.516)	Data 0.026 (0.012)	Loss 4.1647 (4.0369)	Top-1 acc 28.125 (30.508)	Top-5 acc 51.562 (53.840)	lr 0.00310
Warmup Train [34][1920/3239]	Time 0.459 (0.516)	Data 0.001 (0.012)	Loss 3.9806 (4.0370)	Top-1 acc 29.297 (30.504)	Top-5 acc 56.250 (53.838)	lr 0.00310
Warmup Train [34][1930/3239]	Time 0.525 (0.516)	Data 0.001 (0.012)	Loss 4.1051 (4.0369)	Top-1 acc 30.859 (30.509)	Top-5 acc 48.828 (53.843)	lr 0.00310
Warmup Train [34][1940/3239]	Time 0.337 (0.516)	Data 0.001 (0.012)	Loss 4.2247 (4.0372)	Top-1 acc 24.609 (30.502)	Top-5 acc 49.609 (53.836)	lr 0.00309
Warmup Train [34][1950/3239]	Time 0.562 (0.516)	Data 0.001 (0.012)	Loss 4.0103 (4.0370)	Top-1 acc 32.031 (30.505)	Top-5 acc 55.469 (53.843)	lr 0.00309
Warmup Train [34][1960/3239]	Time 0.612 (0.516)	Data 0.001 (0.012)	Loss 3.8797 (4.0371)	Top-1 acc 28.125 (30.503)	Top-5 acc 58.594 (53.845)	lr 0.00309
Warmup Train [34][1970/3239]	Time 0.528 (0.516)	Data 0.002 (0.012)	Loss 4.1311 (4.0373)	Top-1 acc 28.516 (30.498)	Top-5 acc 52.344 (53.838)	lr 0.00308
Warmup Train [34][1980/3239]	Time 0.529 (0.516)	Data 0.001 (0.012)	Loss 4.0097 (4.0374)	Top-1 acc 27.734 (30.493)	Top-5 acc 55.859 (53.836)	lr 0.00308
Warmup Train [34][1990/3239]	Time 0.350 (0.516)	Data 0.001 (0.012)	Loss 4.2827 (4.0374)	Top-1 acc 28.125 (30.496)	Top-5 acc 47.656 (53.839)	lr 0.00308
Warmup Train [34][2000/3239]	Time 0.427 (0.516)	Data 0.001 (0.012)	Loss 4.0343 (4.0374)	Top-1 acc 31.641 (30.493)	Top-5 acc 55.078 (53.839)	lr 0.00308
Warmup Train [34][2010/3239]	Time 0.613 (0.516)	Data 0.001 (0.012)	Loss 3.9613 (4.0378)	Top-1 acc 30.078 (30.485)	Top-5 acc 53.516 (53.829)	lr 0.00307
Warmup Train [34][2020/3239]	Time 0.526 (0.516)	Data 0.001 (0.012)	Loss 3.9501 (4.0377)	Top-1 acc 28.906 (30.484)	Top-5 acc 57.422 (53.824)	lr 0.00307
Warmup Train [34][2030/3239]	Time 0.524 (0.516)	Data 0.002 (0.012)	Loss 4.1485 (4.0375)	Top-1 acc 30.469 (30.492)	Top-5 acc 51.562 (53.827)	lr 0.00307
Warmup Train [34][2040/3239]	Time 0.549 (0.516)	Data 0.001 (0.012)	Loss 4.0457 (4.0375)	Top-1 acc 30.078 (30.495)	Top-5 acc 51.172 (53.824)	lr 0.00306
Warmup Train [34][2050/3239]	Time 0.386 (0.516)	Data 0.001 (0.012)	Loss 4.0955 (4.0374)	Top-1 acc 28.906 (30.495)	Top-5 acc 52.734 (53.825)	lr 0.00306
Warmup Train [34][2060/3239]	Time 0.510 (0.516)	Data 0.001 (0.012)	Loss 4.2068 (4.0373)	Top-1 acc 27.344 (30.499)	Top-5 acc 54.688 (53.829)	lr 0.00306
Warmup Train [34][2070/3239]	Time 0.288 (0.516)	Data 0.002 (0.012)	Loss 4.2383 (4.0373)	Top-1 acc 23.047 (30.498)	Top-5 acc 49.219 (53.829)	lr 0.00306
Warmup Train [34][2080/3239]	Time 0.616 (0.516)	Data 0.001 (0.012)	Loss 3.9418 (4.0371)	Top-1 acc 35.156 (30.503)	Top-5 acc 54.297 (53.831)	lr 0.00305
Warmup Train [34][2090/3239]	Time 0.541 (0.516)	Data 0.001 (0.012)	Loss 3.7708 (4.0370)	Top-1 acc 34.766 (30.507)	Top-5 acc 61.328 (53.832)	lr 0.00305
Warmup Train [34][2100/3239]	Time 0.470 (0.515)	Data 0.001 (0.012)	Loss 4.0343 (4.0370)	Top-1 acc 30.469 (30.507)	Top-5 acc 53.125 (53.833)	lr 0.00305
Warmup Train [34][2110/3239]	Time 0.538 (0.516)	Data 0.001 (0.012)	Loss 4.0536 (4.0371)	Top-1 acc 30.859 (30.506)	Top-5 acc 53.125 (53.832)	lr 0.00304
Warmup Train [34][2120/3239]	Time 0.604 (0.515)	Data 0.001 (0.012)	Loss 4.0162 (4.0371)	Top-1 acc 35.156 (30.505)	Top-5 acc 54.297 (53.829)	lr 0.00304
Warmup Train [34][2130/3239]	Time 0.577 (0.516)	Data 0.001 (0.012)	Loss 4.1825 (4.0372)	Top-1 acc 25.391 (30.506)	Top-5 acc 53.516 (53.835)	lr 0.00304
Warmup Train [34][2140/3239]	Time 0.522 (0.516)	Data 0.001 (0.012)	Loss 3.9563 (4.0371)	Top-1 acc 32.422 (30.505)	Top-5 acc 58.203 (53.837)	lr 0.00304
Warmup Train [34][2150/3239]	Time 0.622 (0.516)	Data 0.001 (0.012)	Loss 4.0724 (4.0375)	Top-1 acc 28.516 (30.495)	Top-5 acc 51.953 (53.832)	lr 0.00303
Warmup Train [34][2160/3239]	Time 0.505 (0.515)	Data 0.001 (0.012)	Loss 4.0008 (4.0377)	Top-1 acc 33.984 (30.493)	Top-5 acc 55.469 (53.827)	lr 0.00303
Warmup Train [34][2170/3239]	Time 0.530 (0.516)	Data 0.001 (0.012)	Loss 3.9350 (4.0374)	Top-1 acc 33.203 (30.500)	Top-5 acc 55.859 (53.838)	lr 0.00303
Warmup Train [34][2180/3239]	Time 0.548 (0.516)	Data 0.001 (0.011)	Loss 3.8549 (4.0372)	Top-1 acc 34.375 (30.503)	Top-5 acc 57.031 (53.848)	lr 0.00302
Warmup Train [34][2190/3239]	Time 0.569 (0.516)	Data 0.001 (0.011)	Loss 4.0481 (4.0372)	Top-1 acc 32.422 (30.507)	Top-5 acc 53.516 (53.852)	lr 0.00302
Warmup Train [34][2200/3239]	Time 0.509 (0.516)	Data 0.002 (0.011)	Loss 4.2161 (4.0373)	Top-1 acc 26.953 (30.501)	Top-5 acc 50.781 (53.851)	lr 0.00302
Warmup Train [34][2210/3239]	Time 0.582 (0.516)	Data 0.001 (0.011)	Loss 4.1483 (4.0370)	Top-1 acc 30.859 (30.506)	Top-5 acc 52.344 (53.855)	lr 0.00302
Warmup Train [34][2220/3239]	Time 0.562 (0.516)	Data 0.001 (0.011)	Loss 4.1213 (4.0372)	Top-1 acc 28.906 (30.500)	Top-5 acc 47.266 (53.852)	lr 0.00301
Warmup Train [34][2230/3239]	Time 0.607 (0.516)	Data 0.001 (0.011)	Loss 3.9957 (4.0371)	Top-1 acc 28.906 (30.501)	Top-5 acc 53.516 (53.851)	lr 0.00301
Warmup Train [34][2240/3239]	Time 0.561 (0.516)	Data 0.001 (0.011)	Loss 4.2220 (4.0371)	Top-1 acc 26.172 (30.496)	Top-5 acc 48.828 (53.853)	lr 0.00301
Warmup Train [34][2250/3239]	Time 0.574 (0.516)	Data 0.001 (0.011)	Loss 3.8706 (4.0369)	Top-1 acc 34.766 (30.501)	Top-5 acc 55.859 (53.862)	lr 0.00300
Warmup Train [34][2260/3239]	Time 0.460 (0.516)	Data 0.001 (0.011)	Loss 4.0313 (4.0372)	Top-1 acc 28.516 (30.494)	Top-5 acc 51.172 (53.854)	lr 0.00300
Warmup Train [34][2270/3239]	Time 0.528 (0.516)	Data 0.001 (0.011)	Loss 4.0788 (4.0371)	Top-1 acc 33.203 (30.498)	Top-5 acc 53.516 (53.854)	lr 0.00300
Warmup Train [34][2280/3239]	Time 0.442 (0.515)	Data 0.001 (0.011)	Loss 4.1154 (4.0371)	Top-1 acc 30.469 (30.498)	Top-5 acc 50.000 (53.851)	lr 0.00299
Warmup Train [34][2290/3239]	Time 0.352 (0.515)	Data 0.001 (0.011)	Loss 3.9561 (4.0368)	Top-1 acc 30.469 (30.497)	Top-5 acc 54.297 (53.855)	lr 0.00299
Warmup Train [34][2300/3239]	Time 0.583 (0.516)	Data 0.001 (0.011)	Loss 3.9030 (4.0368)	Top-1 acc 33.594 (30.500)	Top-5 acc 55.078 (53.856)	lr 0.00299
Warmup Train [34][2310/3239]	Time 0.305 (0.515)	Data 0.001 (0.011)	Loss 3.9241 (4.0368)	Top-1 acc 33.984 (30.497)	Top-5 acc 54.297 (53.856)	lr 0.00299
Warmup Train [34][2320/3239]	Time 0.433 (0.515)	Data 0.001 (0.011)	Loss 4.2927 (4.0371)	Top-1 acc 24.219 (30.488)	Top-5 acc 49.219 (53.846)	lr 0.00298
Warmup Train [34][2330/3239]	Time 0.490 (0.515)	Data 0.001 (0.011)	Loss 3.9800 (4.0369)	Top-1 acc 35.156 (30.491)	Top-5 acc 58.203 (53.853)	lr 0.00298
Warmup Train [34][2340/3239]	Time 0.394 (0.515)	Data 0.001 (0.011)	Loss 4.0940 (4.0369)	Top-1 acc 31.641 (30.490)	Top-5 acc 52.344 (53.852)	lr 0.00298
Warmup Train [34][2350/3239]	Time 0.359 (0.515)	Data 0.001 (0.011)	Loss 3.9736 (4.0368)	Top-1 acc 32.031 (30.493)	Top-5 acc 57.031 (53.853)	lr 0.00297
Warmup Train [34][2360/3239]	Time 0.366 (0.515)	Data 0.001 (0.011)	Loss 4.1871 (4.0369)	Top-1 acc 28.906 (30.492)	Top-5 acc 48.438 (53.850)	lr 0.00297
Warmup Train [34][2370/3239]	Time 0.495 (0.515)	Data 0.001 (0.011)	Loss 4.0531 (4.0370)	Top-1 acc 29.688 (30.490)	Top-5 acc 54.688 (53.847)	lr 0.00297
Warmup Train [34][2380/3239]	Time 0.622 (0.515)	Data 0.001 (0.011)	Loss 4.0032 (4.0367)	Top-1 acc 31.641 (30.496)	Top-5 acc 53.516 (53.854)	lr 0.00297
Warmup Train [34][2390/3239]	Time 0.334 (0.515)	Data 0.001 (0.011)	Loss 4.0824 (4.0366)	Top-1 acc 27.344 (30.499)	Top-5 acc 55.859 (53.858)	lr 0.00296
Warmup Train [34][2400/3239]	Time 0.476 (0.515)	Data 0.001 (0.011)	Loss 3.9929 (4.0366)	Top-1 acc 30.469 (30.501)	Top-5 acc 51.953 (53.856)	lr 0.00296
Warmup Train [34][2410/3239]	Time 0.359 (0.515)	Data 0.001 (0.011)	Loss 4.0370 (4.0366)	Top-1 acc 32.812 (30.501)	Top-5 acc 52.344 (53.857)	lr 0.00296
Warmup Train [34][2420/3239]	Time 0.627 (0.515)	Data 0.001 (0.011)	Loss 4.0465 (4.0366)	Top-1 acc 28.125 (30.503)	Top-5 acc 52.734 (53.857)	lr 0.00295
Warmup Train [34][2430/3239]	Time 0.701 (0.515)	Data 0.001 (0.011)	Loss 4.0338 (4.0368)	Top-1 acc 29.297 (30.502)	Top-5 acc 54.688 (53.851)	lr 0.00295
Warmup Train [34][2440/3239]	Time 0.362 (0.514)	Data 0.001 (0.011)	Loss 4.0380 (4.0366)	Top-1 acc 31.250 (30.508)	Top-5 acc 52.734 (53.853)	lr 0.00295
Warmup Train [34][2450/3239]	Time 0.569 (0.515)	Data 0.001 (0.011)	Loss 4.0149 (4.0367)	Top-1 acc 33.984 (30.503)	Top-5 acc 51.953 (53.851)	lr 0.00295
Warmup Train [34][2460/3239]	Time 0.639 (0.515)	Data 0.001 (0.011)	Loss 3.9757 (4.0370)	Top-1 acc 28.125 (30.499)	Top-5 acc 61.328 (53.852)	lr 0.00294
Warmup Train [34][2470/3239]	Time 0.451 (0.514)	Data 0.002 (0.011)	Loss 4.0166 (4.0370)	Top-1 acc 30.469 (30.500)	Top-5 acc 55.078 (53.853)	lr 0.00294
Warmup Train [34][2480/3239]	Time 0.593 (0.515)	Data 0.001 (0.011)	Loss 4.0723 (4.0373)	Top-1 acc 33.594 (30.500)	Top-5 acc 54.297 (53.849)	lr 0.00294
Warmup Train [34][2490/3239]	Time 0.552 (0.515)	Data 0.001 (0.011)	Loss 4.0588 (4.0372)	Top-1 acc 30.469 (30.501)	Top-5 acc 51.953 (53.849)	lr 0.00293
Warmup Train [34][2500/3239]	Time 0.328 (0.515)	Data 0.001 (0.011)	Loss 3.9329 (4.0373)	Top-1 acc 31.641 (30.499)	Top-5 acc 53.906 (53.842)	lr 0.00293
Warmup Train [34][2510/3239]	Time 0.486 (0.515)	Data 0.001 (0.011)	Loss 4.1114 (4.0375)	Top-1 acc 30.078 (30.500)	Top-5 acc 54.297 (53.839)	lr 0.00293
Warmup Train [34][2520/3239]	Time 0.581 (0.515)	Data 0.001 (0.011)	Loss 3.7863 (4.0374)	Top-1 acc 39.844 (30.506)	Top-5 acc 58.594 (53.842)	lr 0.00293
Warmup Train [34][2530/3239]	Time 0.572 (0.515)	Data 0.001 (0.011)	Loss 3.9796 (4.0372)	Top-1 acc 32.031 (30.510)	Top-5 acc 57.422 (53.843)	lr 0.00292
Warmup Train [34][2540/3239]	Time 0.785 (0.515)	Data 0.001 (0.011)	Loss 3.9605 (4.0370)	Top-1 acc 30.469 (30.513)	Top-5 acc 55.078 (53.848)	lr 0.00292
Warmup Train [34][2550/3239]	Time 0.455 (0.515)	Data 0.001 (0.011)	Loss 3.9220 (4.0372)	Top-1 acc 34.375 (30.510)	Top-5 acc 59.766 (53.843)	lr 0.00292
Warmup Train [34][2560/3239]	Time 0.483 (0.515)	Data 0.002 (0.011)	Loss 3.8961 (4.0374)	Top-1 acc 32.812 (30.502)	Top-5 acc 55.859 (53.838)	lr 0.00291
Warmup Train [34][2570/3239]	Time 0.429 (0.515)	Data 0.001 (0.011)	Loss 4.1121 (4.0372)	Top-1 acc 29.297 (30.506)	Top-5 acc 51.562 (53.840)	lr 0.00291
Warmup Train [34][2580/3239]	Time 0.505 (0.515)	Data 0.001 (0.011)	Loss 4.0039 (4.0370)	Top-1 acc 30.469 (30.510)	Top-5 acc 54.297 (53.843)	lr 0.00291
Warmup Train [34][2590/3239]	Time 0.511 (0.514)	Data 0.001 (0.011)	Loss 4.2196 (4.0369)	Top-1 acc 26.953 (30.511)	Top-5 acc 49.609 (53.842)	lr 0.00291
Warmup Train [34][2600/3239]	Time 0.519 (0.514)	Data 0.001 (0.011)	Loss 4.0255 (4.0370)	Top-1 acc 28.125 (30.509)	Top-5 acc 53.906 (53.838)	lr 0.00290
Warmup Train [34][2610/3239]	Time 0.728 (0.514)	Data 0.001 (0.011)	Loss 3.9321 (4.0369)	Top-1 acc 30.859 (30.512)	Top-5 acc 56.641 (53.843)	lr 0.00290
Warmup Train [34][2620/3239]	Time 0.484 (0.514)	Data 0.001 (0.011)	Loss 3.8919 (4.0367)	Top-1 acc 33.594 (30.517)	Top-5 acc 58.203 (53.845)	lr 0.00290
Warmup Train [34][2630/3239]	Time 0.552 (0.514)	Data 0.001 (0.011)	Loss 4.0350 (4.0368)	Top-1 acc 32.422 (30.515)	Top-5 acc 55.469 (53.844)	lr 0.00290
Warmup Train [34][2640/3239]	Time 0.623 (0.514)	Data 0.001 (0.011)	Loss 3.9853 (4.0370)	Top-1 acc 28.125 (30.515)	Top-5 acc 54.688 (53.840)	lr 0.00289
Warmup Train [34][2650/3239]	Time 0.533 (0.514)	Data 0.001 (0.011)	Loss 4.1328 (4.0367)	Top-1 acc 31.250 (30.522)	Top-5 acc 50.000 (53.848)	lr 0.00289
Warmup Train [34][2660/3239]	Time 0.591 (0.514)	Data 0.001 (0.011)	Loss 4.0834 (4.0365)	Top-1 acc 26.562 (30.520)	Top-5 acc 53.906 (53.856)	lr 0.00289
Warmup Train [34][2670/3239]	Time 0.416 (0.514)	Data 0.001 (0.010)	Loss 3.8600 (4.0365)	Top-1 acc 33.984 (30.521)	Top-5 acc 58.984 (53.858)	lr 0.00288
Warmup Train [34][2680/3239]	Time 0.620 (0.514)	Data 0.001 (0.011)	Loss 4.0272 (4.0365)	Top-1 acc 32.422 (30.521)	Top-5 acc 57.422 (53.861)	lr 0.00288
Warmup Train [34][2690/3239]	Time 0.581 (0.514)	Data 0.001 (0.010)	Loss 4.1768 (4.0364)	Top-1 acc 28.906 (30.524)	Top-5 acc 50.781 (53.862)	lr 0.00288
Warmup Train [34][2700/3239]	Time 0.322 (0.514)	Data 0.001 (0.010)	Loss 4.0319 (4.0364)	Top-1 acc 32.422 (30.524)	Top-5 acc 55.078 (53.862)	lr 0.00288
Warmup Train [34][2710/3239]	Time 0.560 (0.514)	Data 0.001 (0.010)	Loss 3.8861 (4.0360)	Top-1 acc 31.250 (30.531)	Top-5 acc 59.375 (53.873)	lr 0.00287
Warmup Train [34][2720/3239]	Time 0.559 (0.514)	Data 0.001 (0.010)	Loss 3.9138 (4.0361)	Top-1 acc 35.938 (30.531)	Top-5 acc 57.422 (53.872)	lr 0.00287
Warmup Train [34][2730/3239]	Time 0.611 (0.514)	Data 0.001 (0.010)	Loss 4.0228 (4.0362)	Top-1 acc 33.594 (30.527)	Top-5 acc 53.516 (53.867)	lr 0.00287
Warmup Train [34][2740/3239]	Time 0.508 (0.514)	Data 0.001 (0.010)	Loss 3.9148 (4.0363)	Top-1 acc 32.422 (30.525)	Top-5 acc 57.812 (53.864)	lr 0.00286
Warmup Train [34][2750/3239]	Time 0.561 (0.514)	Data 0.002 (0.010)	Loss 3.9251 (4.0363)	Top-1 acc 33.984 (30.526)	Top-5 acc 58.203 (53.864)	lr 0.00286
Warmup Train [34][2760/3239]	Time 0.367 (0.514)	Data 0.001 (0.010)	Loss 4.4031 (4.0364)	Top-1 acc 23.047 (30.523)	Top-5 acc 41.406 (53.856)	lr 0.00286
Warmup Train [34][2770/3239]	Time 0.335 (0.514)	Data 0.001 (0.010)	Loss 4.1654 (4.0364)	Top-1 acc 26.172 (30.525)	Top-5 acc 49.609 (53.859)	lr 0.00286
Warmup Train [34][2780/3239]	Time 0.601 (0.514)	Data 0.001 (0.010)	Loss 4.1126 (4.0364)	Top-1 acc 27.734 (30.523)	Top-5 acc 51.953 (53.860)	lr 0.00285
Warmup Train [34][2790/3239]	Time 0.393 (0.514)	Data 0.001 (0.010)	Loss 3.9596 (4.0364)	Top-1 acc 28.906 (30.523)	Top-5 acc 55.078 (53.863)	lr 0.00285
Warmup Train [34][2800/3239]	Time 0.549 (0.514)	Data 0.001 (0.010)	Loss 4.1738 (4.0363)	Top-1 acc 26.562 (30.522)	Top-5 acc 50.000 (53.863)	lr 0.00285
Warmup Train [34][2810/3239]	Time 0.536 (0.514)	Data 0.001 (0.010)	Loss 4.0758 (4.0364)	Top-1 acc 28.125 (30.522)	Top-5 acc 55.469 (53.865)	lr 0.00284
Warmup Train [34][2820/3239]	Time 0.642 (0.514)	Data 0.001 (0.010)	Loss 3.8710 (4.0365)	Top-1 acc 33.594 (30.521)	Top-5 acc 59.375 (53.863)	lr 0.00284
Warmup Train [34][2830/3239]	Time 0.659 (0.514)	Data 0.001 (0.010)	Loss 4.0509 (4.0366)	Top-1 acc 26.562 (30.516)	Top-5 acc 52.734 (53.858)	lr 0.00284
Warmup Train [34][2840/3239]	Time 0.530 (0.514)	Data 0.001 (0.010)	Loss 4.0746 (4.0365)	Top-1 acc 31.250 (30.523)	Top-5 acc 51.172 (53.863)	lr 0.00284
Warmup Train [34][2850/3239]	Time 0.371 (0.514)	Data 0.002 (0.010)	Loss 4.0277 (4.0365)	Top-1 acc 31.250 (30.521)	Top-5 acc 53.125 (53.866)	lr 0.00283
Warmup Train [34][2860/3239]	Time 0.560 (0.514)	Data 0.001 (0.010)	Loss 4.1525 (4.0368)	Top-1 acc 25.391 (30.511)	Top-5 acc 50.391 (53.860)	lr 0.00283
Warmup Train [34][2870/3239]	Time 0.596 (0.514)	Data 0.001 (0.010)	Loss 3.9549 (4.0366)	Top-1 acc 33.203 (30.515)	Top-5 acc 55.859 (53.864)	lr 0.00283
Warmup Train [34][2880/3239]	Time 0.425 (0.514)	Data 0.001 (0.010)	Loss 4.1011 (4.0368)	Top-1 acc 28.125 (30.510)	Top-5 acc 49.219 (53.859)	lr 0.00282
Warmup Train [34][2890/3239]	Time 0.532 (0.514)	Data 0.001 (0.010)	Loss 3.9554 (4.0367)	Top-1 acc 28.906 (30.511)	Top-5 acc 61.328 (53.862)	lr 0.00282
Warmup Train [34][2900/3239]	Time 0.328 (0.514)	Data 0.001 (0.010)	Loss 4.0153 (4.0366)	Top-1 acc 30.469 (30.512)	Top-5 acc 57.422 (53.865)	lr 0.00282
Warmup Train [34][2910/3239]	Time 0.477 (0.514)	Data 0.001 (0.010)	Loss 4.0174 (4.0368)	Top-1 acc 32.031 (30.509)	Top-5 acc 53.125 (53.858)	lr 0.00282
Warmup Train [34][2920/3239]	Time 0.550 (0.514)	Data 0.001 (0.010)	Loss 3.9934 (4.0367)	Top-1 acc 32.031 (30.512)	Top-5 acc 54.688 (53.861)	lr 0.00281
Warmup Train [34][2930/3239]	Time 0.498 (0.514)	Data 0.001 (0.010)	Loss 3.9793 (4.0367)	Top-1 acc 28.125 (30.510)	Top-5 acc 52.734 (53.861)	lr 0.00281
Warmup Train [34][2940/3239]	Time 0.483 (0.514)	Data 0.002 (0.010)	Loss 3.7074 (4.0365)	Top-1 acc 36.719 (30.514)	Top-5 acc 62.891 (53.864)	lr 0.00281
Warmup Train [34][2950/3239]	Time 0.642 (0.514)	Data 0.001 (0.010)	Loss 3.9985 (4.0361)	Top-1 acc 29.688 (30.522)	Top-5 acc 54.297 (53.871)	lr 0.00281
Warmup Train [34][2960/3239]	Time 0.376 (0.514)	Data 0.002 (0.010)	Loss 4.0384 (4.0360)	Top-1 acc 34.766 (30.524)	Top-5 acc 55.859 (53.871)	lr 0.00280
Warmup Train [34][2970/3239]	Time 0.440 (0.514)	Data 0.001 (0.010)	Loss 4.3106 (4.0360)	Top-1 acc 26.172 (30.527)	Top-5 acc 49.219 (53.872)	lr 0.00280
Warmup Train [34][2980/3239]	Time 0.552 (0.514)	Data 0.001 (0.010)	Loss 4.1435 (4.0362)	Top-1 acc 25.000 (30.519)	Top-5 acc 50.000 (53.866)	lr 0.00280
Warmup Train [34][2990/3239]	Time 0.561 (0.514)	Data 0.001 (0.010)	Loss 3.8932 (4.0361)	Top-1 acc 34.766 (30.524)	Top-5 acc 57.422 (53.864)	lr 0.00279
Warmup Train [34][3000/3239]	Time 0.625 (0.514)	Data 0.001 (0.010)	Loss 4.0612 (4.0363)	Top-1 acc 31.641 (30.519)	Top-5 acc 53.906 (53.865)	lr 0.00279
Warmup Train [34][3010/3239]	Time 0.336 (0.514)	Data 0.001 (0.010)	Loss 4.3263 (4.0363)	Top-1 acc 26.953 (30.522)	Top-5 acc 46.094 (53.865)	lr 0.00279
Warmup Train [34][3020/3239]	Time 0.508 (0.514)	Data 0.001 (0.010)	Loss 3.9601 (4.0363)	Top-1 acc 30.469 (30.517)	Top-5 acc 55.078 (53.862)	lr 0.00279
Warmup Train [34][3030/3239]	Time 0.541 (0.514)	Data 0.001 (0.010)	Loss 3.9485 (4.0364)	Top-1 acc 33.203 (30.519)	Top-5 acc 57.812 (53.859)	lr 0.00278
Warmup Train [34][3040/3239]	Time 0.591 (0.514)	Data 0.001 (0.010)	Loss 3.9564 (4.0363)	Top-1 acc 32.031 (30.522)	Top-5 acc 54.688 (53.861)	lr 0.00278
Warmup Train [34][3050/3239]	Time 0.470 (0.514)	Data 0.001 (0.010)	Loss 4.0905 (4.0363)	Top-1 acc 31.250 (30.520)	Top-5 acc 50.391 (53.860)	lr 0.00278
Warmup Train [34][3060/3239]	Time 0.462 (0.514)	Data 0.001 (0.010)	Loss 4.2051 (4.0363)	Top-1 acc 29.297 (30.521)	Top-5 acc 50.781 (53.860)	lr 0.00277
Warmup Train [34][3070/3239]	Time 0.499 (0.514)	Data 0.001 (0.010)	Loss 4.0627 (4.0364)	Top-1 acc 32.422 (30.520)	Top-5 acc 55.469 (53.859)	lr 0.00277
Warmup Train [34][3080/3239]	Time 0.590 (0.514)	Data 0.001 (0.010)	Loss 4.0051 (4.0366)	Top-1 acc 30.078 (30.518)	Top-5 acc 53.516 (53.857)	lr 0.00277
Warmup Train [34][3090/3239]	Time 0.541 (0.514)	Data 0.001 (0.010)	Loss 4.0135 (4.0365)	Top-1 acc 29.688 (30.517)	Top-5 acc 52.344 (53.857)	lr 0.00277
Warmup Train [34][3100/3239]	Time 0.533 (0.514)	Data 0.001 (0.010)	Loss 4.1245 (4.0366)	Top-1 acc 32.812 (30.517)	Top-5 acc 52.734 (53.855)	lr 0.00276
Warmup Train [34][3110/3239]	Time 0.558 (0.514)	Data 0.001 (0.010)	Loss 4.1221 (4.0366)	Top-1 acc 30.078 (30.518)	Top-5 acc 52.734 (53.858)	lr 0.00276
Warmup Train [34][3120/3239]	Time 0.478 (0.514)	Data 0.001 (0.010)	Loss 4.1909 (4.0366)	Top-1 acc 27.734 (30.520)	Top-5 acc 47.656 (53.856)	lr 0.00276
Warmup Train [34][3130/3239]	Time 0.637 (0.514)	Data 0.001 (0.010)	Loss 3.9335 (4.0365)	Top-1 acc 27.344 (30.521)	Top-5 acc 58.984 (53.858)	lr 0.00276
Warmup Train [34][3140/3239]	Time 0.504 (0.514)	Data 0.001 (0.010)	Loss 3.9848 (4.0366)	Top-1 acc 32.812 (30.521)	Top-5 acc 55.859 (53.860)	lr 0.00275
Warmup Train [34][3150/3239]	Time 0.492 (0.514)	Data 0.001 (0.010)	Loss 3.9199 (4.0366)	Top-1 acc 30.859 (30.522)	Top-5 acc 57.422 (53.860)	lr 0.00275
Warmup Train [34][3160/3239]	Time 0.524 (0.514)	Data 0.001 (0.010)	Loss 4.0616 (4.0367)	Top-1 acc 27.734 (30.516)	Top-5 acc 51.562 (53.857)	lr 0.00275
Warmup Train [34][3170/3239]	Time 0.525 (0.514)	Data 0.002 (0.010)	Loss 3.8362 (4.0368)	Top-1 acc 32.422 (30.514)	Top-5 acc 56.641 (53.855)	lr 0.00274
Warmup Train [34][3180/3239]	Time 0.404 (0.514)	Data 0.000 (0.010)	Loss 3.9567 (4.0368)	Top-1 acc 32.031 (30.514)	Top-5 acc 57.812 (53.855)	lr 0.00274
Warmup Train [34][3190/3239]	Time 0.340 (0.513)	Data 0.000 (0.010)	Loss 3.9542 (4.0367)	Top-1 acc 30.859 (30.512)	Top-5 acc 55.078 (53.859)	lr 0.00274
Warmup Train [34][3200/3239]	Time 0.526 (0.513)	Data 0.000 (0.010)	Loss 4.1882 (4.0367)	Top-1 acc 28.516 (30.512)	Top-5 acc 51.953 (53.859)	lr 0.00274
Warmup Train [34][3210/3239]	Time 0.389 (0.513)	Data 0.000 (0.010)	Loss 4.0581 (4.0369)	Top-1 acc 30.078 (30.510)	Top-5 acc 51.562 (53.855)	lr 0.00273
Warmup Train [34][3220/3239]	Time 0.472 (0.513)	Data 0.000 (0.010)	Loss 4.2542 (4.0370)	Top-1 acc 26.172 (30.509)	Top-5 acc 48.438 (53.856)	lr 0.00273
Warmup Train [34][3230/3239]	Time 0.508 (0.513)	Data 0.000 (0.010)	Loss 4.0570 (4.0371)	Top-1 acc 28.906 (30.506)	Top-5 acc 53.125 (53.853)	lr 0.00273
Warmup Train [34][3239/3239]	Time 0.286 (0.513)	Data 0.000 (0.010)	Loss 4.2492 (4.0371)	Top-1 acc 30.864 (30.509)	Top-5 acc 48.148 (53.852)	lr 0.00273
==========Warmup Valid [34/40]	loss 2.980	top-1 acc 38.015	top-5 acc 62.608	Train top-1 30.509	top-5 53.852	flops: 442.4M
Warmup Train [35][0/3239]	Time 15.110 (15.110)	Data 13.937 (13.937)	Loss 4.0228 (4.0228)	Top-1 acc 31.250 (31.250)	Top-5 acc 53.516 (53.516)	lr 0.00272
Warmup Train [35][10/3239]	Time 0.485 (1.890)	Data 0.002 (1.283)	Loss 4.0598 (4.0773)	Top-1 acc 28.516 (29.616)	Top-5 acc 51.953 (52.983)	lr 0.00272
Warmup Train [35][20/3239]	Time 0.523 (1.228)	Data 0.029 (0.678)	Loss 4.0519 (4.0553)	Top-1 acc 28.125 (30.060)	Top-5 acc 53.125 (53.478)	lr 0.00272
Warmup Train [35][30/3239]	Time 0.484 (0.991)	Data 0.002 (0.462)	Loss 4.0017 (4.0452)	Top-1 acc 31.250 (30.229)	Top-5 acc 56.250 (53.679)	lr 0.00272
Warmup Train [35][40/3239]	Time 0.578 (0.866)	Data 0.001 (0.350)	Loss 3.8955 (4.0466)	Top-1 acc 33.203 (30.040)	Top-5 acc 55.469 (53.763)	lr 0.00271
Warmup Train [35][50/3239]	Time 0.478 (0.785)	Data 0.001 (0.282)	Loss 4.0370 (4.0521)	Top-1 acc 30.078 (30.040)	Top-5 acc 53.125 (53.569)	lr 0.00271
Warmup Train [35][60/3239]	Time 0.452 (0.739)	Data 0.001 (0.237)	Loss 4.2611 (4.0524)	Top-1 acc 26.562 (30.091)	Top-5 acc 50.000 (53.522)	lr 0.00271
Warmup Train [35][70/3239]	Time 0.633 (0.711)	Data 0.001 (0.207)	Loss 3.9864 (4.0510)	Top-1 acc 30.078 (29.990)	Top-5 acc 53.906 (53.488)	lr 0.00271
Warmup Train [35][80/3239]	Time 0.490 (0.686)	Data 0.001 (0.181)	Loss 3.9415 (4.0491)	Top-1 acc 37.109 (30.064)	Top-5 acc 57.422 (53.549)	lr 0.00270
Warmup Train [35][90/3239]	Time 0.605 (0.665)	Data 0.001 (0.162)	Loss 4.0712 (4.0544)	Top-1 acc 26.172 (29.911)	Top-5 acc 49.609 (53.529)	lr 0.00270
Warmup Train [35][100/3239]	Time 0.474 (0.651)	Data 0.001 (0.146)	Loss 4.0266 (4.0458)	Top-1 acc 30.469 (30.132)	Top-5 acc 52.344 (53.779)	lr 0.00270
Warmup Train [35][110/3239]	Time 0.587 (0.637)	Data 0.001 (0.133)	Loss 3.7641 (4.0454)	Top-1 acc 39.453 (30.163)	Top-5 acc 57.812 (53.706)	lr 0.00269
Warmup Train [35][120/3239]	Time 0.499 (0.626)	Data 0.001 (0.122)	Loss 4.0815 (4.0438)	Top-1 acc 26.562 (30.091)	Top-5 acc 51.172 (53.661)	lr 0.00269
Warmup Train [35][130/3239]	Time 0.635 (0.615)	Data 0.001 (0.113)	Loss 3.9629 (4.0405)	Top-1 acc 29.688 (30.221)	Top-5 acc 57.031 (53.784)	lr 0.00269
Warmup Train [35][140/3239]	Time 0.594 (0.608)	Data 0.001 (0.105)	Loss 4.0129 (4.0361)	Top-1 acc 31.641 (30.422)	Top-5 acc 55.078 (53.867)	lr 0.00269
Warmup Train [35][150/3239]	Time 0.325 (0.600)	Data 0.001 (0.098)	Loss 4.0511 (4.0346)	Top-1 acc 27.734 (30.435)	Top-5 acc 54.297 (53.893)	lr 0.00268
Warmup Train [35][160/3239]	Time 0.516 (0.595)	Data 0.001 (0.093)	Loss 3.7455 (4.0324)	Top-1 acc 35.938 (30.522)	Top-5 acc 59.766 (53.962)	lr 0.00268
Warmup Train [35][170/3239]	Time 0.550 (0.590)	Data 0.001 (0.088)	Loss 3.9624 (4.0314)	Top-1 acc 34.375 (30.530)	Top-5 acc 56.250 (53.979)	lr 0.00268
Warmup Train [35][180/3239]	Time 0.474 (0.586)	Data 0.001 (0.084)	Loss 4.0242 (4.0326)	Top-1 acc 35.938 (30.542)	Top-5 acc 54.688 (53.956)	lr 0.00268
Warmup Train [35][190/3239]	Time 0.408 (0.582)	Data 0.001 (0.080)	Loss 4.0173 (4.0312)	Top-1 acc 32.422 (30.598)	Top-5 acc 56.641 (54.031)	lr 0.00267
Warmup Train [35][200/3239]	Time 0.416 (0.578)	Data 0.001 (0.076)	Loss 3.9189 (4.0297)	Top-1 acc 32.422 (30.661)	Top-5 acc 53.906 (54.056)	lr 0.00267
Warmup Train [35][210/3239]	Time 0.408 (0.575)	Data 0.001 (0.073)	Loss 3.8938 (4.0296)	Top-1 acc 32.422 (30.665)	Top-5 acc 58.203 (54.014)	lr 0.00267
Warmup Train [35][220/3239]	Time 0.496 (0.573)	Data 0.001 (0.070)	Loss 4.2010 (4.0286)	Top-1 acc 26.953 (30.706)	Top-5 acc 49.609 (54.041)	lr 0.00266
Warmup Train [35][230/3239]	Time 0.440 (0.569)	Data 0.001 (0.067)	Loss 3.9292 (4.0268)	Top-1 acc 33.203 (30.783)	Top-5 acc 59.375 (54.111)	lr 0.00266
Warmup Train [35][240/3239]	Time 0.618 (0.568)	Data 0.001 (0.065)	Loss 4.1539 (4.0266)	Top-1 acc 29.688 (30.832)	Top-5 acc 52.344 (54.094)	lr 0.00266
Warmup Train [35][250/3239]	Time 0.461 (0.566)	Data 0.001 (0.063)	Loss 3.8295 (4.0268)	Top-1 acc 31.641 (30.802)	Top-5 acc 58.203 (54.060)	lr 0.00266
Warmup Train [35][260/3239]	Time 0.562 (0.564)	Data 0.001 (0.060)	Loss 4.2607 (4.0274)	Top-1 acc 28.516 (30.804)	Top-5 acc 48.438 (54.081)	lr 0.00265
Warmup Train [35][270/3239]	Time 0.488 (0.562)	Data 0.001 (0.058)	Loss 4.2017 (4.0283)	Top-1 acc 28.906 (30.771)	Top-5 acc 46.094 (54.039)	lr 0.00265
Warmup Train [35][280/3239]	Time 0.652 (0.560)	Data 0.001 (0.056)	Loss 4.0732 (4.0267)	Top-1 acc 30.859 (30.815)	Top-5 acc 51.172 (54.048)	lr 0.00265
Warmup Train [35][290/3239]	Time 0.364 (0.558)	Data 0.001 (0.055)	Loss 3.9842 (4.0266)	Top-1 acc 31.641 (30.807)	Top-5 acc 55.078 (54.027)	lr 0.00265
Warmup Train [35][300/3239]	Time 0.354 (0.556)	Data 0.001 (0.053)	Loss 3.8871 (4.0268)	Top-1 acc 33.984 (30.793)	Top-5 acc 57.031 (54.052)	lr 0.00264
Warmup Train [35][310/3239]	Time 0.429 (0.554)	Data 0.001 (0.052)	Loss 4.1166 (4.0262)	Top-1 acc 26.953 (30.798)	Top-5 acc 50.781 (54.051)	lr 0.00264
Warmup Train [35][320/3239]	Time 0.341 (0.552)	Data 0.001 (0.051)	Loss 3.8106 (4.0248)	Top-1 acc 35.156 (30.820)	Top-5 acc 58.984 (54.096)	lr 0.00264
Warmup Train [35][330/3239]	Time 0.448 (0.550)	Data 0.001 (0.049)	Loss 3.8612 (4.0242)	Top-1 acc 31.250 (30.823)	Top-5 acc 58.984 (54.115)	lr 0.00263
Warmup Train [35][340/3239]	Time 0.544 (0.549)	Data 0.001 (0.048)	Loss 4.0674 (4.0225)	Top-1 acc 29.297 (30.879)	Top-5 acc 55.078 (54.167)	lr 0.00263
Warmup Train [35][350/3239]	Time 0.736 (0.547)	Data 0.001 (0.047)	Loss 3.6565 (4.0225)	Top-1 acc 38.281 (30.877)	Top-5 acc 64.062 (54.147)	lr 0.00263
Warmup Train [35][360/3239]	Time 0.357 (0.546)	Data 0.001 (0.046)	Loss 4.0663 (4.0222)	Top-1 acc 27.344 (30.864)	Top-5 acc 53.125 (54.139)	lr 0.00263
Warmup Train [35][370/3239]	Time 0.536 (0.546)	Data 0.001 (0.045)	Loss 4.0937 (4.0216)	Top-1 acc 28.906 (30.860)	Top-5 acc 51.953 (54.137)	lr 0.00262
Warmup Train [35][380/3239]	Time 0.469 (0.545)	Data 0.001 (0.044)	Loss 4.1506 (4.0223)	Top-1 acc 26.562 (30.853)	Top-5 acc 49.219 (54.115)	lr 0.00262
Warmup Train [35][390/3239]	Time 0.443 (0.544)	Data 0.001 (0.043)	Loss 3.9429 (4.0220)	Top-1 acc 32.812 (30.840)	Top-5 acc 59.766 (54.131)	lr 0.00262
Warmup Train [35][400/3239]	Time 0.485 (0.544)	Data 0.001 (0.042)	Loss 3.9784 (4.0218)	Top-1 acc 31.250 (30.826)	Top-5 acc 54.688 (54.142)	lr 0.00262
Warmup Train [35][410/3239]	Time 0.572 (0.543)	Data 0.001 (0.041)	Loss 4.2436 (4.0230)	Top-1 acc 28.125 (30.799)	Top-5 acc 49.609 (54.124)	lr 0.00261
Warmup Train [35][420/3239]	Time 0.573 (0.542)	Data 0.001 (0.040)	Loss 4.1827 (4.0244)	Top-1 acc 25.781 (30.776)	Top-5 acc 48.828 (54.083)	lr 0.00261
Warmup Train [35][430/3239]	Time 0.683 (0.541)	Data 0.001 (0.040)	Loss 4.0617 (4.0257)	Top-1 acc 26.953 (30.748)	Top-5 acc 51.562 (54.068)	lr 0.00261
Warmup Train [35][440/3239]	Time 0.498 (0.541)	Data 0.001 (0.039)	Loss 4.1315 (4.0261)	Top-1 acc 30.469 (30.719)	Top-5 acc 47.656 (54.059)	lr 0.00261
Warmup Train [35][450/3239]	Time 0.603 (0.540)	Data 0.001 (0.038)	Loss 4.0808 (4.0263)	Top-1 acc 30.859 (30.740)	Top-5 acc 53.125 (54.033)	lr 0.00260
Warmup Train [35][460/3239]	Time 0.644 (0.540)	Data 0.002 (0.037)	Loss 3.9401 (4.0258)	Top-1 acc 30.469 (30.731)	Top-5 acc 57.031 (54.029)	lr 0.00260
Warmup Train [35][470/3239]	Time 0.549 (0.540)	Data 0.001 (0.037)	Loss 4.0469 (4.0258)	Top-1 acc 33.594 (30.722)	Top-5 acc 57.422 (54.027)	lr 0.00260
Warmup Train [35][480/3239]	Time 0.529 (0.539)	Data 0.001 (0.036)	Loss 4.0577 (4.0263)	Top-1 acc 28.906 (30.716)	Top-5 acc 55.078 (54.028)	lr 0.00259
Warmup Train [35][490/3239]	Time 0.509 (0.538)	Data 0.001 (0.035)	Loss 4.1767 (4.0271)	Top-1 acc 23.828 (30.688)	Top-5 acc 49.219 (54.003)	lr 0.00259
Warmup Train [35][500/3239]	Time 0.454 (0.537)	Data 0.001 (0.034)	Loss 4.0427 (4.0263)	Top-1 acc 29.688 (30.686)	Top-5 acc 55.859 (54.037)	lr 0.00259
Warmup Train [35][510/3239]	Time 0.671 (0.538)	Data 0.002 (0.034)	Loss 4.0413 (4.0256)	Top-1 acc 32.422 (30.713)	Top-5 acc 54.688 (54.066)	lr 0.00259
Warmup Train [35][520/3239]	Time 0.613 (0.537)	Data 0.001 (0.034)	Loss 3.9865 (4.0268)	Top-1 acc 32.422 (30.688)	Top-5 acc 50.781 (54.024)	lr 0.00258
Warmup Train [35][530/3239]	Time 0.596 (0.537)	Data 0.001 (0.033)	Loss 3.9255 (4.0267)	Top-1 acc 28.906 (30.678)	Top-5 acc 57.031 (54.026)	lr 0.00258
Warmup Train [35][540/3239]	Time 0.618 (0.536)	Data 0.001 (0.032)	Loss 3.9165 (4.0260)	Top-1 acc 33.984 (30.698)	Top-5 acc 55.469 (54.040)	lr 0.00258
Warmup Train [35][550/3239]	Time 0.676 (0.536)	Data 0.001 (0.032)	Loss 3.8906 (4.0261)	Top-1 acc 32.031 (30.692)	Top-5 acc 55.859 (54.018)	lr 0.00258
Warmup Train [35][560/3239]	Time 0.458 (0.534)	Data 0.001 (0.031)	Loss 4.0509 (4.0259)	Top-1 acc 32.031 (30.710)	Top-5 acc 54.297 (54.009)	lr 0.00257
Warmup Train [35][570/3239]	Time 0.550 (0.534)	Data 0.001 (0.031)	Loss 4.0014 (4.0253)	Top-1 acc 30.078 (30.725)	Top-5 acc 55.859 (54.023)	lr 0.00257
Warmup Train [35][580/3239]	Time 0.411 (0.534)	Data 0.001 (0.031)	Loss 4.0435 (4.0261)	Top-1 acc 31.250 (30.703)	Top-5 acc 54.297 (54.012)	lr 0.00257
Warmup Train [35][590/3239]	Time 0.587 (0.533)	Data 0.001 (0.030)	Loss 3.8517 (4.0260)	Top-1 acc 32.031 (30.686)	Top-5 acc 57.812 (54.013)	lr 0.00256
Warmup Train [35][600/3239]	Time 0.208 (0.532)	Data 0.001 (0.030)	Loss 4.0531 (4.0265)	Top-1 acc 30.469 (30.704)	Top-5 acc 55.078 (54.005)	lr 0.00256
Warmup Train [35][610/3239]	Time 0.498 (0.531)	Data 0.001 (0.030)	Loss 4.0636 (4.0259)	Top-1 acc 30.859 (30.720)	Top-5 acc 53.516 (54.021)	lr 0.00256
Warmup Train [35][620/3239]	Time 0.533 (0.531)	Data 0.001 (0.029)	Loss 4.0802 (4.0268)	Top-1 acc 30.078 (30.706)	Top-5 acc 54.297 (53.993)	lr 0.00256
Warmup Train [35][630/3239]	Time 0.543 (0.530)	Data 0.001 (0.029)	Loss 3.7796 (4.0257)	Top-1 acc 33.594 (30.728)	Top-5 acc 58.984 (54.017)	lr 0.00255
Warmup Train [35][640/3239]	Time 0.455 (0.530)	Data 0.001 (0.029)	Loss 4.1748 (4.0253)	Top-1 acc 31.250 (30.747)	Top-5 acc 51.562 (54.035)	lr 0.00255
Warmup Train [35][650/3239]	Time 0.521 (0.530)	Data 0.001 (0.028)	Loss 4.0241 (4.0262)	Top-1 acc 30.469 (30.732)	Top-5 acc 51.953 (54.003)	lr 0.00255
Warmup Train [35][660/3239]	Time 0.747 (0.530)	Data 0.001 (0.028)	Loss 4.0292 (4.0266)	Top-1 acc 32.031 (30.740)	Top-5 acc 54.688 (54.003)	lr 0.00255
Warmup Train [35][670/3239]	Time 0.555 (0.530)	Data 0.001 (0.028)	Loss 4.0897 (4.0272)	Top-1 acc 33.594 (30.759)	Top-5 acc 52.344 (53.987)	lr 0.00254
Warmup Train [35][680/3239]	Time 0.465 (0.529)	Data 0.001 (0.027)	Loss 4.0150 (4.0272)	Top-1 acc 29.688 (30.743)	Top-5 acc 55.859 (53.989)	lr 0.00254
Warmup Train [35][690/3239]	Time 0.357 (0.529)	Data 0.002 (0.027)	Loss 4.1945 (4.0270)	Top-1 acc 28.516 (30.761)	Top-5 acc 51.953 (53.995)	lr 0.00254
Warmup Train [35][700/3239]	Time 0.413 (0.529)	Data 0.001 (0.027)	Loss 3.9182 (4.0269)	Top-1 acc 32.812 (30.761)	Top-5 acc 57.031 (53.995)	lr 0.00254
Warmup Train [35][710/3239]	Time 0.520 (0.529)	Data 0.001 (0.027)	Loss 3.8455 (4.0272)	Top-1 acc 30.078 (30.735)	Top-5 acc 59.766 (53.991)	lr 0.00253
Warmup Train [35][720/3239]	Time 0.413 (0.528)	Data 0.001 (0.026)	Loss 4.1747 (4.0263)	Top-1 acc 26.172 (30.731)	Top-5 acc 54.297 (54.009)	lr 0.00253
Warmup Train [35][730/3239]	Time 0.510 (0.528)	Data 0.001 (0.026)	Loss 4.1091 (4.0265)	Top-1 acc 31.250 (30.735)	Top-5 acc 53.516 (54.028)	lr 0.00253
Warmup Train [35][740/3239]	Time 0.503 (0.528)	Data 0.001 (0.026)	Loss 4.1284 (4.0266)	Top-1 acc 27.734 (30.740)	Top-5 acc 51.953 (54.024)	lr 0.00252
Warmup Train [35][750/3239]	Time 0.482 (0.527)	Data 0.001 (0.025)	Loss 4.1666 (4.0260)	Top-1 acc 26.953 (30.745)	Top-5 acc 53.906 (54.026)	lr 0.00252
Warmup Train [35][760/3239]	Time 0.479 (0.527)	Data 0.001 (0.025)	Loss 4.1216 (4.0267)	Top-1 acc 28.906 (30.722)	Top-5 acc 50.000 (54.017)	lr 0.00252
Warmup Train [35][770/3239]	Time 0.475 (0.527)	Data 0.001 (0.025)	Loss 4.2013 (4.0275)	Top-1 acc 28.516 (30.698)	Top-5 acc 52.734 (54.005)	lr 0.00252
Warmup Train [35][780/3239]	Time 0.568 (0.527)	Data 0.001 (0.025)	Loss 4.0429 (4.0272)	Top-1 acc 30.859 (30.693)	Top-5 acc 54.688 (54.016)	lr 0.00251
Warmup Train [35][790/3239]	Time 0.448 (0.527)	Data 0.001 (0.024)	Loss 3.8930 (4.0268)	Top-1 acc 30.469 (30.686)	Top-5 acc 55.078 (54.022)	lr 0.00251
Warmup Train [35][800/3239]	Time 0.529 (0.526)	Data 0.001 (0.024)	Loss 4.1177 (4.0269)	Top-1 acc 33.203 (30.679)	Top-5 acc 53.125 (54.016)	lr 0.00251
Warmup Train [35][810/3239]	Time 0.516 (0.526)	Data 0.001 (0.024)	Loss 3.9859 (4.0270)	Top-1 acc 30.469 (30.675)	Top-5 acc 54.688 (54.020)	lr 0.00251
Warmup Train [35][820/3239]	Time 0.630 (0.526)	Data 0.001 (0.024)	Loss 4.1417 (4.0271)	Top-1 acc 26.172 (30.678)	Top-5 acc 54.688 (54.015)	lr 0.00250
Warmup Train [35][830/3239]	Time 0.543 (0.526)	Data 0.001 (0.023)	Loss 3.9545 (4.0266)	Top-1 acc 32.812 (30.683)	Top-5 acc 55.469 (54.021)	lr 0.00250
Warmup Train [35][840/3239]	Time 0.393 (0.525)	Data 0.001 (0.023)	Loss 4.0389 (4.0274)	Top-1 acc 31.250 (30.658)	Top-5 acc 53.516 (53.985)	lr 0.00250
Warmup Train [35][850/3239]	Time 0.448 (0.525)	Data 0.001 (0.023)	Loss 4.2580 (4.0278)	Top-1 acc 28.906 (30.657)	Top-5 acc 52.344 (53.986)	lr 0.00250
Warmup Train [35][860/3239]	Time 0.298 (0.524)	Data 0.001 (0.023)	Loss 3.8523 (4.0275)	Top-1 acc 36.328 (30.673)	Top-5 acc 58.984 (53.984)	lr 0.00249
Warmup Train [35][870/3239]	Time 0.345 (0.524)	Data 0.001 (0.023)	Loss 3.8696 (4.0267)	Top-1 acc 31.641 (30.686)	Top-5 acc 59.766 (54.010)	lr 0.00249
Warmup Train [35][880/3239]	Time 0.426 (0.524)	Data 0.001 (0.023)	Loss 4.1302 (4.0271)	Top-1 acc 26.562 (30.669)	Top-5 acc 50.000 (54.005)	lr 0.00249
Warmup Train [35][890/3239]	Time 0.558 (0.524)	Data 0.001 (0.023)	Loss 4.0284 (4.0264)	Top-1 acc 30.078 (30.673)	Top-5 acc 51.172 (54.014)	lr 0.00249
Warmup Train [35][900/3239]	Time 0.349 (0.523)	Data 0.001 (0.022)	Loss 4.0831 (4.0263)	Top-1 acc 28.516 (30.661)	Top-5 acc 51.562 (54.010)	lr 0.00248
Warmup Train [35][910/3239]	Time 0.394 (0.523)	Data 0.002 (0.022)	Loss 3.9869 (4.0266)	Top-1 acc 32.422 (30.660)	Top-5 acc 55.469 (54.006)	lr 0.00248
Warmup Train [35][920/3239]	Time 0.663 (0.523)	Data 0.001 (0.022)	Loss 3.9707 (4.0269)	Top-1 acc 31.250 (30.652)	Top-5 acc 52.734 (53.992)	lr 0.00248
Warmup Train [35][930/3239]	Time 0.466 (0.523)	Data 0.001 (0.022)	Loss 4.0267 (4.0275)	Top-1 acc 32.812 (30.639)	Top-5 acc 57.812 (53.983)	lr 0.00247
Warmup Train [35][940/3239]	Time 0.553 (0.523)	Data 0.001 (0.022)	Loss 4.0966 (4.0277)	Top-1 acc 28.906 (30.629)	Top-5 acc 50.391 (53.970)	lr 0.00247
Warmup Train [35][950/3239]	Time 0.597 (0.523)	Data 0.001 (0.022)	Loss 4.0381 (4.0275)	Top-1 acc 27.734 (30.627)	Top-5 acc 54.688 (53.980)	lr 0.00247
Warmup Train [35][960/3239]	Time 0.481 (0.523)	Data 0.001 (0.021)	Loss 4.1294 (4.0274)	Top-1 acc 32.812 (30.636)	Top-5 acc 54.688 (53.979)	lr 0.00247
Warmup Train [35][970/3239]	Time 0.436 (0.523)	Data 0.001 (0.021)	Loss 4.0045 (4.0274)	Top-1 acc 29.688 (30.632)	Top-5 acc 51.562 (53.980)	lr 0.00246
Warmup Train [35][980/3239]	Time 0.522 (0.522)	Data 0.001 (0.021)	Loss 3.8278 (4.0273)	Top-1 acc 33.203 (30.636)	Top-5 acc 55.859 (53.981)	lr 0.00246
Warmup Train [35][990/3239]	Time 0.637 (0.523)	Data 0.001 (0.021)	Loss 4.0690 (4.0271)	Top-1 acc 32.422 (30.648)	Top-5 acc 52.734 (53.981)	lr 0.00246
Warmup Train [35][1000/3239]	Time 0.344 (0.522)	Data 0.001 (0.021)	Loss 4.0750 (4.0270)	Top-1 acc 31.250 (30.660)	Top-5 acc 53.125 (53.993)	lr 0.00246
Warmup Train [35][1010/3239]	Time 0.399 (0.522)	Data 0.001 (0.021)	Loss 3.7151 (4.0270)	Top-1 acc 35.156 (30.653)	Top-5 acc 62.891 (53.989)	lr 0.00245
Warmup Train [35][1020/3239]	Time 0.430 (0.522)	Data 0.001 (0.021)	Loss 3.8918 (4.0276)	Top-1 acc 34.375 (30.644)	Top-5 acc 57.422 (53.979)	lr 0.00245
Warmup Train [35][1030/3239]	Time 0.550 (0.522)	Data 0.001 (0.021)	Loss 4.1825 (4.0278)	Top-1 acc 25.000 (30.635)	Top-5 acc 51.172 (53.980)	lr 0.00245
Warmup Train [35][1040/3239]	Time 0.530 (0.522)	Data 0.001 (0.020)	Loss 3.9358 (4.0273)	Top-1 acc 33.594 (30.648)	Top-5 acc 56.250 (53.998)	lr 0.00245
Warmup Train [35][1050/3239]	Time 0.415 (0.522)	Data 0.001 (0.020)	Loss 4.0936 (4.0265)	Top-1 acc 25.391 (30.650)	Top-5 acc 56.641 (54.024)	lr 0.00244
Warmup Train [35][1060/3239]	Time 0.456 (0.522)	Data 0.001 (0.020)	Loss 3.7738 (4.0265)	Top-1 acc 41.016 (30.667)	Top-5 acc 60.938 (54.028)	lr 0.00244
Warmup Train [35][1070/3239]	Time 0.526 (0.522)	Data 0.001 (0.020)	Loss 4.2875 (4.0266)	Top-1 acc 25.000 (30.659)	Top-5 acc 48.438 (54.021)	lr 0.00244
Warmup Train [35][1080/3239]	Time 0.416 (0.522)	Data 0.001 (0.020)	Loss 4.2808 (4.0268)	Top-1 acc 26.172 (30.660)	Top-5 acc 47.656 (54.013)	lr 0.00244
Warmup Train [35][1090/3239]	Time 0.606 (0.522)	Data 0.001 (0.020)	Loss 4.0449 (4.0267)	Top-1 acc 29.297 (30.661)	Top-5 acc 49.609 (54.027)	lr 0.00243
Warmup Train [35][1100/3239]	Time 0.536 (0.522)	Data 0.001 (0.020)	Loss 3.9522 (4.0271)	Top-1 acc 33.984 (30.654)	Top-5 acc 52.734 (54.011)	lr 0.00243
Warmup Train [35][1110/3239]	Time 0.359 (0.522)	Data 0.001 (0.019)	Loss 4.0549 (4.0274)	Top-1 acc 33.594 (30.656)	Top-5 acc 54.688 (54.022)	lr 0.00243
Warmup Train [35][1120/3239]	Time 0.420 (0.521)	Data 0.001 (0.019)	Loss 3.9215 (4.0278)	Top-1 acc 28.516 (30.640)	Top-5 acc 56.641 (54.003)	lr 0.00242
Warmup Train [35][1130/3239]	Time 0.526 (0.521)	Data 0.001 (0.019)	Loss 4.1556 (4.0275)	Top-1 acc 33.203 (30.650)	Top-5 acc 49.219 (54.012)	lr 0.00242
Warmup Train [35][1140/3239]	Time 0.524 (0.520)	Data 0.001 (0.019)	Loss 4.0788 (4.0275)	Top-1 acc 30.078 (30.652)	Top-5 acc 52.734 (54.011)	lr 0.00242
Warmup Train [35][1150/3239]	Time 0.465 (0.520)	Data 0.001 (0.019)	Loss 3.9212 (4.0278)	Top-1 acc 32.031 (30.643)	Top-5 acc 55.078 (54.004)	lr 0.00242
Warmup Train [35][1160/3239]	Time 0.511 (0.520)	Data 0.001 (0.019)	Loss 3.7817 (4.0277)	Top-1 acc 39.453 (30.651)	Top-5 acc 57.422 (54.004)	lr 0.00241
Warmup Train [35][1170/3239]	Time 0.453 (0.520)	Data 0.001 (0.019)	Loss 3.9342 (4.0280)	Top-1 acc 35.156 (30.648)	Top-5 acc 55.078 (53.997)	lr 0.00241
Warmup Train [35][1180/3239]	Time 0.627 (0.520)	Data 0.001 (0.019)	Loss 4.0119 (4.0279)	Top-1 acc 32.812 (30.653)	Top-5 acc 55.469 (53.999)	lr 0.00241
Warmup Train [35][1190/3239]	Time 0.476 (0.520)	Data 0.001 (0.019)	Loss 4.0927 (4.0277)	Top-1 acc 31.250 (30.653)	Top-5 acc 52.344 (54.008)	lr 0.00241
Warmup Train [35][1200/3239]	Time 0.597 (0.520)	Data 0.001 (0.018)	Loss 3.9470 (4.0279)	Top-1 acc 29.297 (30.651)	Top-5 acc 55.859 (54.001)	lr 0.00240
Warmup Train [35][1210/3239]	Time 0.651 (0.520)	Data 0.001 (0.018)	Loss 3.9890 (4.0275)	Top-1 acc 29.688 (30.650)	Top-5 acc 53.516 (54.006)	lr 0.00240
Warmup Train [35][1220/3239]	Time 0.511 (0.520)	Data 0.001 (0.018)	Loss 4.0399 (4.0276)	Top-1 acc 29.688 (30.642)	Top-5 acc 55.469 (54.008)	lr 0.00240
Warmup Train [35][1230/3239]	Time 0.532 (0.519)	Data 0.001 (0.018)	Loss 4.0549 (4.0279)	Top-1 acc 31.250 (30.642)	Top-5 acc 52.734 (54.001)	lr 0.00240
Warmup Train [35][1240/3239]	Time 0.585 (0.519)	Data 0.001 (0.018)	Loss 4.0679 (4.0270)	Top-1 acc 30.469 (30.656)	Top-5 acc 52.344 (54.018)	lr 0.00239
Warmup Train [35][1250/3239]	Time 0.456 (0.519)	Data 0.001 (0.018)	Loss 4.1922 (4.0274)	Top-1 acc 30.469 (30.654)	Top-5 acc 49.219 (54.008)	lr 0.00239
Warmup Train [35][1260/3239]	Time 0.489 (0.519)	Data 0.001 (0.018)	Loss 3.9275 (4.0268)	Top-1 acc 31.641 (30.668)	Top-5 acc 57.031 (54.026)	lr 0.00239
Warmup Train [35][1270/3239]	Time 0.571 (0.519)	Data 0.001 (0.018)	Loss 4.1829 (4.0270)	Top-1 acc 26.562 (30.651)	Top-5 acc 48.438 (54.024)	lr 0.00239
Warmup Train [35][1280/3239]	Time 0.620 (0.519)	Data 0.001 (0.017)	Loss 3.9678 (4.0279)	Top-1 acc 33.984 (30.635)	Top-5 acc 55.078 (54.009)	lr 0.00238
Warmup Train [35][1290/3239]	Time 0.447 (0.519)	Data 0.001 (0.017)	Loss 3.9926 (4.0281)	Top-1 acc 30.469 (30.636)	Top-5 acc 57.031 (54.007)	lr 0.00238
Warmup Train [35][1300/3239]	Time 0.462 (0.519)	Data 0.001 (0.017)	Loss 3.9960 (4.0279)	Top-1 acc 29.297 (30.634)	Top-5 acc 55.078 (54.013)	lr 0.00238
Warmup Train [35][1310/3239]	Time 0.489 (0.519)	Data 0.001 (0.017)	Loss 4.1873 (4.0277)	Top-1 acc 26.172 (30.627)	Top-5 acc 51.953 (54.016)	lr 0.00238
Warmup Train [35][1320/3239]	Time 0.475 (0.519)	Data 0.001 (0.017)	Loss 4.1347 (4.0285)	Top-1 acc 28.516 (30.612)	Top-5 acc 50.781 (53.995)	lr 0.00237
Warmup Train [35][1330/3239]	Time 0.579 (0.519)	Data 0.001 (0.017)	Loss 3.9236 (4.0285)	Top-1 acc 30.469 (30.612)	Top-5 acc 56.250 (53.993)	lr 0.00237
Warmup Train [35][1340/3239]	Time 0.586 (0.520)	Data 0.001 (0.017)	Loss 4.0071 (4.0282)	Top-1 acc 27.344 (30.611)	Top-5 acc 55.859 (53.998)	lr 0.00237
Warmup Train [35][1350/3239]	Time 0.636 (0.519)	Data 0.001 (0.017)	Loss 4.0487 (4.0284)	Top-1 acc 31.250 (30.602)	Top-5 acc 53.125 (53.993)	lr 0.00237
Warmup Train [35][1360/3239]	Time 0.615 (0.519)	Data 0.001 (0.017)	Loss 3.9970 (4.0284)	Top-1 acc 33.203 (30.600)	Top-5 acc 56.250 (53.992)	lr 0.00236
Warmup Train [35][1370/3239]	Time 0.397 (0.519)	Data 0.001 (0.017)	Loss 4.0544 (4.0285)	Top-1 acc 29.688 (30.600)	Top-5 acc 55.859 (53.994)	lr 0.00236
Warmup Train [35][1380/3239]	Time 0.512 (0.519)	Data 0.001 (0.017)	Loss 4.0077 (4.0284)	Top-1 acc 27.734 (30.601)	Top-5 acc 54.297 (53.996)	lr 0.00236
Warmup Train [35][1390/3239]	Time 0.614 (0.519)	Data 0.001 (0.016)	Loss 3.9877 (4.0283)	Top-1 acc 32.031 (30.598)	Top-5 acc 58.203 (53.992)	lr 0.00236
Warmup Train [35][1400/3239]	Time 0.579 (0.519)	Data 0.001 (0.016)	Loss 3.9099 (4.0284)	Top-1 acc 31.641 (30.591)	Top-5 acc 54.688 (53.987)	lr 0.00235
Warmup Train [35][1410/3239]	Time 0.422 (0.519)	Data 0.001 (0.016)	Loss 3.8413 (4.0284)	Top-1 acc 33.594 (30.593)	Top-5 acc 58.203 (53.990)	lr 0.00235
Warmup Train [35][1420/3239]	Time 0.426 (0.518)	Data 0.001 (0.016)	Loss 4.1540 (4.0287)	Top-1 acc 28.516 (30.582)	Top-5 acc 52.344 (53.980)	lr 0.00235
Warmup Train [35][1430/3239]	Time 0.366 (0.518)	Data 0.001 (0.016)	Loss 3.9387 (4.0283)	Top-1 acc 33.984 (30.584)	Top-5 acc 55.469 (53.985)	lr 0.00234
Warmup Train [35][1440/3239]	Time 0.308 (0.517)	Data 0.001 (0.016)	Loss 3.9584 (4.0282)	Top-1 acc 30.078 (30.584)	Top-5 acc 57.422 (53.990)	lr 0.00234
Warmup Train [35][1450/3239]	Time 0.535 (0.517)	Data 0.001 (0.016)	Loss 4.1729 (4.0283)	Top-1 acc 28.125 (30.582)	Top-5 acc 50.781 (53.988)	lr 0.00234
Warmup Train [35][1460/3239]	Time 0.489 (0.517)	Data 0.001 (0.016)	Loss 3.9704 (4.0282)	Top-1 acc 31.641 (30.587)	Top-5 acc 55.469 (53.984)	lr 0.00234
Warmup Train [35][1470/3239]	Time 0.421 (0.517)	Data 0.001 (0.016)	Loss 3.9864 (4.0281)	Top-1 acc 33.594 (30.589)	Top-5 acc 54.297 (53.976)	lr 0.00233
Warmup Train [35][1480/3239]	Time 0.466 (0.517)	Data 0.001 (0.016)	Loss 3.9559 (4.0279)	Top-1 acc 34.766 (30.594)	Top-5 acc 55.078 (53.979)	lr 0.00233
Warmup Train [35][1490/3239]	Time 0.583 (0.517)	Data 0.001 (0.016)	Loss 4.1091 (4.0277)	Top-1 acc 28.906 (30.592)	Top-5 acc 51.172 (53.980)	lr 0.00233
Warmup Train [35][1500/3239]	Time 0.510 (0.517)	Data 0.001 (0.016)	Loss 3.9468 (4.0278)	Top-1 acc 35.547 (30.595)	Top-5 acc 57.812 (53.975)	lr 0.00233
Warmup Train [35][1510/3239]	Time 0.537 (0.517)	Data 0.001 (0.016)	Loss 3.9785 (4.0281)	Top-1 acc 28.906 (30.585)	Top-5 acc 58.984 (53.974)	lr 0.00232
Warmup Train [35][1520/3239]	Time 0.545 (0.517)	Data 0.001 (0.016)	Loss 4.1008 (4.0280)	Top-1 acc 31.250 (30.586)	Top-5 acc 50.391 (53.974)	lr 0.00232
Warmup Train [35][1530/3239]	Time 0.577 (0.517)	Data 0.001 (0.016)	Loss 3.9619 (4.0277)	Top-1 acc 34.375 (30.595)	Top-5 acc 55.078 (53.976)	lr 0.00232
Warmup Train [35][1540/3239]	Time 0.668 (0.517)	Data 0.001 (0.016)	Loss 4.0352 (4.0274)	Top-1 acc 32.422 (30.609)	Top-5 acc 55.469 (53.978)	lr 0.00232
Warmup Train [35][1550/3239]	Time 0.507 (0.517)	Data 0.001 (0.015)	Loss 3.9002 (4.0276)	Top-1 acc 34.766 (30.610)	Top-5 acc 55.469 (53.977)	lr 0.00231
Warmup Train [35][1560/3239]	Time 0.534 (0.517)	Data 0.001 (0.015)	Loss 3.7121 (4.0273)	Top-1 acc 37.500 (30.613)	Top-5 acc 62.891 (53.986)	lr 0.00231
Warmup Train [35][1570/3239]	Time 0.467 (0.517)	Data 0.001 (0.015)	Loss 4.1514 (4.0274)	Top-1 acc 29.297 (30.612)	Top-5 acc 54.297 (53.979)	lr 0.00231
Warmup Train [35][1580/3239]	Time 0.514 (0.516)	Data 0.001 (0.015)	Loss 3.8838 (4.0272)	Top-1 acc 35.156 (30.621)	Top-5 acc 58.984 (53.979)	lr 0.00231
Warmup Train [35][1590/3239]	Time 0.551 (0.517)	Data 0.001 (0.015)	Loss 3.8831 (4.0271)	Top-1 acc 33.594 (30.624)	Top-5 acc 60.156 (53.987)	lr 0.00230
Warmup Train [35][1600/3239]	Time 0.606 (0.517)	Data 0.001 (0.015)	Loss 4.0814 (4.0272)	Top-1 acc 27.734 (30.620)	Top-5 acc 54.688 (53.984)	lr 0.00230
Warmup Train [35][1610/3239]	Time 0.426 (0.517)	Data 0.001 (0.015)	Loss 4.0104 (4.0271)	Top-1 acc 28.906 (30.622)	Top-5 acc 52.344 (53.988)	lr 0.00230
Warmup Train [35][1620/3239]	Time 0.521 (0.517)	Data 0.001 (0.015)	Loss 3.7029 (4.0271)	Top-1 acc 33.594 (30.624)	Top-5 acc 61.328 (53.989)	lr 0.00230
Warmup Train [35][1630/3239]	Time 0.639 (0.517)	Data 0.001 (0.015)	Loss 4.1045 (4.0274)	Top-1 acc 30.078 (30.610)	Top-5 acc 50.781 (53.978)	lr 0.00229
Warmup Train [35][1640/3239]	Time 0.481 (0.517)	Data 0.001 (0.015)	Loss 3.8322 (4.0272)	Top-1 acc 33.984 (30.613)	Top-5 acc 58.594 (53.986)	lr 0.00229
Warmup Train [35][1650/3239]	Time 0.411 (0.516)	Data 0.001 (0.015)	Loss 4.1869 (4.0273)	Top-1 acc 27.734 (30.615)	Top-5 acc 50.781 (53.988)	lr 0.00229
Warmup Train [35][1660/3239]	Time 0.533 (0.517)	Data 0.001 (0.015)	Loss 3.9238 (4.0270)	Top-1 acc 29.688 (30.616)	Top-5 acc 51.562 (53.991)	lr 0.00229
Warmup Train [35][1670/3239]	Time 0.485 (0.517)	Data 0.001 (0.015)	Loss 4.0184 (4.0271)	Top-1 acc 30.078 (30.618)	Top-5 acc 53.125 (53.989)	lr 0.00228
Warmup Train [35][1680/3239]	Time 0.525 (0.516)	Data 0.001 (0.015)	Loss 3.8572 (4.0269)	Top-1 acc 35.938 (30.627)	Top-5 acc 58.594 (53.989)	lr 0.00228
Warmup Train [35][1690/3239]	Time 0.503 (0.516)	Data 0.001 (0.015)	Loss 3.9074 (4.0267)	Top-1 acc 32.031 (30.634)	Top-5 acc 56.250 (53.993)	lr 0.00228
Warmup Train [35][1700/3239]	Time 0.393 (0.516)	Data 0.001 (0.015)	Loss 4.1202 (4.0271)	Top-1 acc 29.688 (30.632)	Top-5 acc 52.734 (53.986)	lr 0.00228
Warmup Train [35][1710/3239]	Time 0.607 (0.516)	Data 0.001 (0.014)	Loss 4.1331 (4.0271)	Top-1 acc 27.344 (30.635)	Top-5 acc 46.094 (53.983)	lr 0.00227
Warmup Train [35][1720/3239]	Time 0.595 (0.516)	Data 0.001 (0.014)	Loss 4.1319 (4.0268)	Top-1 acc 26.953 (30.638)	Top-5 acc 52.344 (53.987)	lr 0.00227
Warmup Train [35][1730/3239]	Time 0.531 (0.516)	Data 0.001 (0.014)	Loss 3.8245 (4.0266)	Top-1 acc 33.203 (30.646)	Top-5 acc 58.594 (53.997)	lr 0.00227
Warmup Train [35][1740/3239]	Time 0.592 (0.515)	Data 0.001 (0.014)	Loss 3.9662 (4.0266)	Top-1 acc 32.812 (30.646)	Top-5 acc 57.812 (53.999)	lr 0.00227
Warmup Train [35][1750/3239]	Time 0.498 (0.515)	Data 0.001 (0.014)	Loss 3.9374 (4.0265)	Top-1 acc 35.938 (30.645)	Top-5 acc 58.203 (54.000)	lr 0.00226
Warmup Train [35][1760/3239]	Time 0.530 (0.515)	Data 0.001 (0.014)	Loss 4.0781 (4.0266)	Top-1 acc 29.297 (30.644)	Top-5 acc 55.078 (53.995)	lr 0.00226
Warmup Train [35][1770/3239]	Time 0.410 (0.515)	Data 0.001 (0.014)	Loss 3.8119 (4.0267)	Top-1 acc 32.031 (30.645)	Top-5 acc 56.641 (53.995)	lr 0.00226
Warmup Train [35][1780/3239]	Time 0.383 (0.516)	Data 0.001 (0.014)	Loss 4.0102 (4.0266)	Top-1 acc 32.031 (30.656)	Top-5 acc 58.203 (53.999)	lr 0.00226
Warmup Train [35][1790/3239]	Time 0.479 (0.516)	Data 0.001 (0.014)	Loss 3.9286 (4.0269)	Top-1 acc 33.203 (30.659)	Top-5 acc 53.125 (53.991)	lr 0.00225
Warmup Train [35][1800/3239]	Time 0.632 (0.516)	Data 0.001 (0.014)	Loss 3.8581 (4.0268)	Top-1 acc 36.719 (30.659)	Top-5 acc 58.984 (53.995)	lr 0.00225
Warmup Train [35][1810/3239]	Time 0.594 (0.516)	Data 0.001 (0.014)	Loss 3.8799 (4.0270)	Top-1 acc 30.859 (30.654)	Top-5 acc 57.031 (53.989)	lr 0.00225
Warmup Train [35][1820/3239]	Time 0.560 (0.516)	Data 0.001 (0.014)	Loss 4.0458 (4.0271)	Top-1 acc 31.641 (30.656)	Top-5 acc 52.734 (53.988)	lr 0.00225
Warmup Train [35][1830/3239]	Time 0.411 (0.516)	Data 0.001 (0.014)	Loss 4.1671 (4.0272)	Top-1 acc 26.562 (30.655)	Top-5 acc 50.000 (53.988)	lr 0.00224
Warmup Train [35][1840/3239]	Time 0.539 (0.516)	Data 0.001 (0.014)	Loss 3.8145 (4.0271)	Top-1 acc 32.422 (30.658)	Top-5 acc 56.250 (53.992)	lr 0.00224
Warmup Train [35][1850/3239]	Time 0.398 (0.516)	Data 0.001 (0.014)	Loss 4.0153 (4.0272)	Top-1 acc 30.859 (30.654)	Top-5 acc 53.516 (53.991)	lr 0.00224
Warmup Train [35][1860/3239]	Time 0.536 (0.516)	Data 0.001 (0.014)	Loss 3.8158 (4.0272)	Top-1 acc 33.594 (30.655)	Top-5 acc 57.031 (53.987)	lr 0.00224
Warmup Train [35][1870/3239]	Time 0.606 (0.516)	Data 0.001 (0.014)	Loss 3.9001 (4.0270)	Top-1 acc 31.250 (30.664)	Top-5 acc 59.375 (54.000)	lr 0.00223
Warmup Train [35][1880/3239]	Time 0.513 (0.516)	Data 0.001 (0.014)	Loss 3.7820 (4.0269)	Top-1 acc 35.547 (30.663)	Top-5 acc 60.547 (53.998)	lr 0.00223
Warmup Train [35][1890/3239]	Time 0.546 (0.516)	Data 0.001 (0.014)	Loss 4.1195 (4.0269)	Top-1 acc 30.859 (30.665)	Top-5 acc 53.516 (54.001)	lr 0.00223
Warmup Train [35][1900/3239]	Time 0.589 (0.516)	Data 0.001 (0.014)	Loss 4.0155 (4.0270)	Top-1 acc 27.344 (30.659)	Top-5 acc 55.078 (53.994)	lr 0.00223
Warmup Train [35][1910/3239]	Time 0.404 (0.516)	Data 0.001 (0.013)	Loss 4.1326 (4.0271)	Top-1 acc 31.641 (30.657)	Top-5 acc 53.516 (53.994)	lr 0.00222
Warmup Train [35][1920/3239]	Time 0.417 (0.516)	Data 0.001 (0.013)	Loss 4.1832 (4.0271)	Top-1 acc 28.516 (30.658)	Top-5 acc 51.172 (53.991)	lr 0.00222
Warmup Train [35][1930/3239]	Time 0.494 (0.516)	Data 0.001 (0.013)	Loss 4.0467 (4.0270)	Top-1 acc 30.469 (30.659)	Top-5 acc 52.344 (53.989)	lr 0.00222
Warmup Train [35][1940/3239]	Time 0.683 (0.516)	Data 0.001 (0.013)	Loss 3.9978 (4.0268)	Top-1 acc 32.031 (30.664)	Top-5 acc 54.688 (53.995)	lr 0.00222
Warmup Train [35][1950/3239]	Time 0.612 (0.516)	Data 0.001 (0.013)	Loss 3.8989 (4.0267)	Top-1 acc 37.500 (30.670)	Top-5 acc 59.375 (54.001)	lr 0.00221
Warmup Train [35][1960/3239]	Time 0.433 (0.516)	Data 0.001 (0.013)	Loss 3.8567 (4.0263)	Top-1 acc 33.594 (30.677)	Top-5 acc 57.422 (54.007)	lr 0.00221
Warmup Train [35][1970/3239]	Time 0.583 (0.516)	Data 0.001 (0.013)	Loss 3.8442 (4.0259)	Top-1 acc 33.984 (30.685)	Top-5 acc 55.078 (54.012)	lr 0.00221
Warmup Train [35][1980/3239]	Time 0.444 (0.515)	Data 0.001 (0.013)	Loss 4.2393 (4.0258)	Top-1 acc 29.297 (30.692)	Top-5 acc 50.391 (54.020)	lr 0.00221
Warmup Train [35][1990/3239]	Time 0.500 (0.515)	Data 0.001 (0.013)	Loss 3.9411 (4.0259)	Top-1 acc 32.422 (30.686)	Top-5 acc 56.250 (54.019)	lr 0.00220
Warmup Train [35][2000/3239]	Time 0.462 (0.515)	Data 0.001 (0.013)	Loss 4.1026 (4.0261)	Top-1 acc 30.859 (30.676)	Top-5 acc 53.906 (54.015)	lr 0.00220
Warmup Train [35][2010/3239]	Time 0.546 (0.515)	Data 0.001 (0.013)	Loss 4.0546 (4.0262)	Top-1 acc 33.984 (30.680)	Top-5 acc 53.516 (54.011)	lr 0.00220
Warmup Train [35][2020/3239]	Time 0.624 (0.515)	Data 0.001 (0.013)	Loss 3.9726 (4.0261)	Top-1 acc 31.641 (30.682)	Top-5 acc 55.469 (54.014)	lr 0.00220
Warmup Train [35][2030/3239]	Time 0.543 (0.515)	Data 0.001 (0.013)	Loss 4.0082 (4.0263)	Top-1 acc 31.250 (30.677)	Top-5 acc 53.906 (54.010)	lr 0.00219
Warmup Train [35][2040/3239]	Time 0.559 (0.515)	Data 0.001 (0.013)	Loss 4.0096 (4.0261)	Top-1 acc 29.297 (30.679)	Top-5 acc 57.812 (54.014)	lr 0.00219
Warmup Train [35][2050/3239]	Time 0.630 (0.515)	Data 0.001 (0.013)	Loss 4.0668 (4.0261)	Top-1 acc 28.906 (30.681)	Top-5 acc 53.125 (54.014)	lr 0.00219
Warmup Train [35][2060/3239]	Time 0.491 (0.515)	Data 0.001 (0.013)	Loss 3.8983 (4.0262)	Top-1 acc 30.859 (30.678)	Top-5 acc 56.250 (54.010)	lr 0.00219
Warmup Train [35][2070/3239]	Time 0.484 (0.515)	Data 0.001 (0.013)	Loss 4.0048 (4.0265)	Top-1 acc 28.516 (30.672)	Top-5 acc 55.078 (54.001)	lr 0.00218
Warmup Train [35][2080/3239]	Time 0.400 (0.515)	Data 0.001 (0.013)	Loss 3.9395 (4.0264)	Top-1 acc 32.812 (30.674)	Top-5 acc 52.734 (54.001)	lr 0.00218
Warmup Train [35][2090/3239]	Time 0.579 (0.515)	Data 0.001 (0.013)	Loss 4.1997 (4.0268)	Top-1 acc 25.781 (30.668)	Top-5 acc 50.391 (53.990)	lr 0.00218
Warmup Train [35][2100/3239]	Time 0.558 (0.515)	Data 0.001 (0.013)	Loss 3.9947 (4.0268)	Top-1 acc 31.250 (30.670)	Top-5 acc 54.688 (53.989)	lr 0.00218
Warmup Train [35][2110/3239]	Time 0.465 (0.515)	Data 0.001 (0.013)	Loss 3.9884 (4.0268)	Top-1 acc 29.688 (30.672)	Top-5 acc 54.688 (53.985)	lr 0.00217
Warmup Train [35][2120/3239]	Time 0.558 (0.515)	Data 0.001 (0.013)	Loss 3.8523 (4.0266)	Top-1 acc 35.156 (30.672)	Top-5 acc 57.031 (53.994)	lr 0.00217
Warmup Train [35][2130/3239]	Time 0.711 (0.515)	Data 0.001 (0.013)	Loss 3.8946 (4.0265)	Top-1 acc 34.375 (30.677)	Top-5 acc 59.375 (54.000)	lr 0.00217
Warmup Train [35][2140/3239]	Time 0.517 (0.515)	Data 0.001 (0.013)	Loss 4.0387 (4.0266)	Top-1 acc 26.953 (30.679)	Top-5 acc 54.297 (53.998)	lr 0.00217
Warmup Train [35][2150/3239]	Time 0.479 (0.515)	Data 0.001 (0.013)	Loss 3.9275 (4.0267)	Top-1 acc 32.031 (30.678)	Top-5 acc 59.766 (54.000)	lr 0.00216
Warmup Train [35][2160/3239]	Time 0.556 (0.515)	Data 0.002 (0.012)	Loss 4.0163 (4.0267)	Top-1 acc 32.031 (30.678)	Top-5 acc 51.953 (53.995)	lr 0.00216
Warmup Train [35][2170/3239]	Time 0.621 (0.515)	Data 0.001 (0.012)	Loss 4.1064 (4.0267)	Top-1 acc 29.297 (30.674)	Top-5 acc 51.953 (53.992)	lr 0.00216
Warmup Train [35][2180/3239]	Time 0.475 (0.515)	Data 0.001 (0.012)	Loss 3.9917 (4.0266)	Top-1 acc 34.766 (30.677)	Top-5 acc 52.734 (53.996)	lr 0.00216
Warmup Train [35][2190/3239]	Time 0.392 (0.515)	Data 0.001 (0.012)	Loss 4.0692 (4.0264)	Top-1 acc 32.422 (30.686)	Top-5 acc 58.594 (54.001)	lr 0.00215
Warmup Train [35][2200/3239]	Time 0.389 (0.515)	Data 0.001 (0.012)	Loss 4.1101 (4.0265)	Top-1 acc 23.828 (30.685)	Top-5 acc 50.000 (54.002)	lr 0.00215
Warmup Train [35][2210/3239]	Time 0.523 (0.515)	Data 0.001 (0.012)	Loss 4.0887 (4.0266)	Top-1 acc 33.594 (30.685)	Top-5 acc 53.125 (54.000)	lr 0.00215
Warmup Train [35][2220/3239]	Time 0.412 (0.515)	Data 0.001 (0.012)	Loss 4.2779 (4.0268)	Top-1 acc 26.172 (30.686)	Top-5 acc 48.047 (53.997)	lr 0.00215
Warmup Train [35][2230/3239]	Time 0.461 (0.515)	Data 0.001 (0.012)	Loss 4.2377 (4.0270)	Top-1 acc 26.953 (30.682)	Top-5 acc 50.391 (53.994)	lr 0.00214
Warmup Train [35][2240/3239]	Time 0.490 (0.515)	Data 0.001 (0.012)	Loss 3.7958 (4.0270)	Top-1 acc 35.547 (30.686)	Top-5 acc 62.500 (53.994)	lr 0.00214
Warmup Train [35][2250/3239]	Time 0.372 (0.515)	Data 0.001 (0.012)	Loss 4.0649 (4.0268)	Top-1 acc 25.781 (30.692)	Top-5 acc 53.906 (53.996)	lr 0.00214
Warmup Train [35][2260/3239]	Time 0.577 (0.515)	Data 0.001 (0.012)	Loss 3.9993 (4.0267)	Top-1 acc 37.109 (30.698)	Top-5 acc 55.469 (53.999)	lr 0.00214
Warmup Train [35][2270/3239]	Time 0.374 (0.515)	Data 0.001 (0.012)	Loss 3.9180 (4.0263)	Top-1 acc 33.203 (30.705)	Top-5 acc 61.328 (54.009)	lr 0.00213
Warmup Train [35][2280/3239]	Time 0.589 (0.514)	Data 0.001 (0.012)	Loss 3.9790 (4.0266)	Top-1 acc 34.375 (30.696)	Top-5 acc 53.516 (54.001)	lr 0.00213
Warmup Train [35][2290/3239]	Time 0.456 (0.514)	Data 0.001 (0.012)	Loss 4.2236 (4.0267)	Top-1 acc 26.953 (30.693)	Top-5 acc 48.047 (53.997)	lr 0.00213
Warmup Train [35][2300/3239]	Time 0.347 (0.514)	Data 0.001 (0.012)	Loss 3.9458 (4.0266)	Top-1 acc 32.031 (30.695)	Top-5 acc 55.859 (53.996)	lr 0.00213
Warmup Train [35][2310/3239]	Time 0.597 (0.514)	Data 0.001 (0.012)	Loss 3.8884 (4.0269)	Top-1 acc 33.203 (30.687)	Top-5 acc 59.766 (53.992)	lr 0.00212
Warmup Train [35][2320/3239]	Time 0.513 (0.514)	Data 0.001 (0.012)	Loss 3.9758 (4.0270)	Top-1 acc 32.422 (30.682)	Top-5 acc 55.078 (53.991)	lr 0.00212
Warmup Train [35][2330/3239]	Time 0.590 (0.515)	Data 0.001 (0.012)	Loss 4.0681 (4.0269)	Top-1 acc 29.688 (30.685)	Top-5 acc 57.812 (53.997)	lr 0.00212
Warmup Train [35][2340/3239]	Time 0.359 (0.515)	Data 0.001 (0.012)	Loss 4.4027 (4.0270)	Top-1 acc 21.484 (30.681)	Top-5 acc 44.922 (53.997)	lr 0.00212
Warmup Train [35][2350/3239]	Time 0.430 (0.515)	Data 0.001 (0.012)	Loss 3.9991 (4.0270)	Top-1 acc 30.859 (30.679)	Top-5 acc 55.469 (53.995)	lr 0.00211
Warmup Train [35][2360/3239]	Time 0.644 (0.515)	Data 0.001 (0.012)	Loss 4.1560 (4.0270)	Top-1 acc 30.859 (30.681)	Top-5 acc 53.125 (54.001)	lr 0.00211
Warmup Train [35][2370/3239]	Time 0.467 (0.515)	Data 0.001 (0.012)	Loss 3.9663 (4.0270)	Top-1 acc 29.297 (30.678)	Top-5 acc 55.859 (54.001)	lr 0.00211
Warmup Train [35][2380/3239]	Time 0.401 (0.515)	Data 0.001 (0.012)	Loss 4.1627 (4.0270)	Top-1 acc 24.609 (30.680)	Top-5 acc 51.562 (54.000)	lr 0.00211
Warmup Train [35][2390/3239]	Time 0.623 (0.515)	Data 0.001 (0.012)	Loss 4.1645 (4.0272)	Top-1 acc 24.609 (30.674)	Top-5 acc 51.172 (53.997)	lr 0.00211
Warmup Train [35][2400/3239]	Time 0.497 (0.515)	Data 0.001 (0.012)	Loss 3.9607 (4.0271)	Top-1 acc 35.156 (30.678)	Top-5 acc 57.031 (54.001)	lr 0.00210
Warmup Train [35][2410/3239]	Time 0.589 (0.515)	Data 0.001 (0.012)	Loss 3.9357 (4.0272)	Top-1 acc 31.641 (30.672)	Top-5 acc 57.812 (53.998)	lr 0.00210
Warmup Train [35][2420/3239]	Time 0.612 (0.515)	Data 0.002 (0.012)	Loss 3.9363 (4.0270)	Top-1 acc 32.031 (30.676)	Top-5 acc 57.812 (54.006)	lr 0.00210
Warmup Train [35][2430/3239]	Time 0.569 (0.515)	Data 0.001 (0.012)	Loss 4.0225 (4.0270)	Top-1 acc 29.297 (30.678)	Top-5 acc 54.297 (54.005)	lr 0.00210
Warmup Train [35][2440/3239]	Time 0.444 (0.515)	Data 0.001 (0.012)	Loss 4.1940 (4.0269)	Top-1 acc 26.953 (30.680)	Top-5 acc 53.906 (54.009)	lr 0.00209
Warmup Train [35][2450/3239]	Time 0.578 (0.515)	Data 0.001 (0.012)	Loss 4.0670 (4.0269)	Top-1 acc 31.250 (30.679)	Top-5 acc 52.734 (54.010)	lr 0.00209
Warmup Train [35][2460/3239]	Time 0.563 (0.515)	Data 0.001 (0.012)	Loss 3.9486 (4.0270)	Top-1 acc 28.125 (30.678)	Top-5 acc 57.031 (54.012)	lr 0.00209
Warmup Train [35][2470/3239]	Time 0.494 (0.515)	Data 0.001 (0.012)	Loss 3.9631 (4.0268)	Top-1 acc 29.297 (30.679)	Top-5 acc 57.031 (54.018)	lr 0.00209
Warmup Train [35][2480/3239]	Time 0.472 (0.515)	Data 0.001 (0.012)	Loss 3.9110 (4.0267)	Top-1 acc 32.812 (30.678)	Top-5 acc 57.422 (54.019)	lr 0.00208
Warmup Train [35][2490/3239]	Time 0.502 (0.515)	Data 0.001 (0.012)	Loss 4.0898 (4.0267)	Top-1 acc 28.516 (30.680)	Top-5 acc 53.125 (54.022)	lr 0.00208
Warmup Train [35][2500/3239]	Time 0.406 (0.515)	Data 0.001 (0.012)	Loss 4.0618 (4.0267)	Top-1 acc 30.469 (30.680)	Top-5 acc 52.734 (54.021)	lr 0.00208
Warmup Train [35][2510/3239]	Time 0.422 (0.515)	Data 0.002 (0.012)	Loss 4.0866 (4.0266)	Top-1 acc 30.859 (30.682)	Top-5 acc 51.562 (54.022)	lr 0.00208
Warmup Train [35][2520/3239]	Time 0.553 (0.514)	Data 0.001 (0.012)	Loss 4.1835 (4.0268)	Top-1 acc 24.219 (30.676)	Top-5 acc 51.953 (54.014)	lr 0.00207
Warmup Train [35][2530/3239]	Time 0.356 (0.514)	Data 0.001 (0.012)	Loss 3.9448 (4.0268)	Top-1 acc 30.469 (30.674)	Top-5 acc 55.859 (54.016)	lr 0.00207
Warmup Train [35][2540/3239]	Time 0.658 (0.514)	Data 0.001 (0.012)	Loss 3.9532 (4.0268)	Top-1 acc 31.641 (30.674)	Top-5 acc 56.250 (54.015)	lr 0.00207
Warmup Train [35][2550/3239]	Time 0.575 (0.514)	Data 0.001 (0.012)	Loss 3.9460 (4.0268)	Top-1 acc 33.984 (30.673)	Top-5 acc 55.078 (54.009)	lr 0.00207
Warmup Train [35][2560/3239]	Time 0.520 (0.514)	Data 0.001 (0.012)	Loss 4.1619 (4.0269)	Top-1 acc 29.688 (30.675)	Top-5 acc 50.000 (54.009)	lr 0.00206
Warmup Train [35][2570/3239]	Time 0.572 (0.514)	Data 0.001 (0.012)	Loss 4.0482 (4.0268)	Top-1 acc 30.078 (30.678)	Top-5 acc 53.906 (54.012)	lr 0.00206
Warmup Train [35][2580/3239]	Time 0.507 (0.514)	Data 0.001 (0.012)	Loss 4.0409 (4.0268)	Top-1 acc 32.031 (30.679)	Top-5 acc 53.516 (54.008)	lr 0.00206
Warmup Train [35][2590/3239]	Time 0.600 (0.514)	Data 0.001 (0.012)	Loss 4.0231 (4.0270)	Top-1 acc 30.078 (30.671)	Top-5 acc 55.078 (54.007)	lr 0.00206
Warmup Train [35][2600/3239]	Time 0.376 (0.514)	Data 0.001 (0.012)	Loss 4.1953 (4.0270)	Top-1 acc 32.812 (30.671)	Top-5 acc 52.734 (54.009)	lr 0.00205
Warmup Train [35][2610/3239]	Time 0.562 (0.514)	Data 0.001 (0.012)	Loss 3.9230 (4.0269)	Top-1 acc 34.375 (30.676)	Top-5 acc 59.766 (54.011)	lr 0.00205
Warmup Train [35][2620/3239]	Time 0.506 (0.514)	Data 0.001 (0.012)	Loss 3.9553 (4.0270)	Top-1 acc 31.641 (30.676)	Top-5 acc 56.250 (54.009)	lr 0.00205
Warmup Train [35][2630/3239]	Time 0.538 (0.514)	Data 0.001 (0.012)	Loss 3.8758 (4.0270)	Top-1 acc 33.594 (30.675)	Top-5 acc 58.594 (54.007)	lr 0.00205
Warmup Train [35][2640/3239]	Time 0.578 (0.514)	Data 0.001 (0.011)	Loss 3.9292 (4.0269)	Top-1 acc 30.859 (30.676)	Top-5 acc 58.203 (54.011)	lr 0.00204
Warmup Train [35][2650/3239]	Time 0.585 (0.514)	Data 0.001 (0.011)	Loss 3.8891 (4.0269)	Top-1 acc 31.250 (30.678)	Top-5 acc 57.422 (54.010)	lr 0.00204
Warmup Train [35][2660/3239]	Time 0.453 (0.514)	Data 0.001 (0.011)	Loss 3.9626 (4.0269)	Top-1 acc 30.859 (30.677)	Top-5 acc 53.906 (54.009)	lr 0.00204
Warmup Train [35][2670/3239]	Time 0.329 (0.514)	Data 0.001 (0.011)	Loss 3.9342 (4.0267)	Top-1 acc 32.422 (30.684)	Top-5 acc 58.594 (54.016)	lr 0.00204
Warmup Train [35][2680/3239]	Time 0.429 (0.514)	Data 0.001 (0.011)	Loss 3.7838 (4.0266)	Top-1 acc 33.594 (30.686)	Top-5 acc 58.203 (54.014)	lr 0.00204
Warmup Train [35][2690/3239]	Time 0.624 (0.514)	Data 0.001 (0.011)	Loss 4.1395 (4.0266)	Top-1 acc 27.344 (30.684)	Top-5 acc 49.609 (54.012)	lr 0.00203
Warmup Train [35][2700/3239]	Time 0.519 (0.514)	Data 0.001 (0.011)	Loss 4.0824 (4.0266)	Top-1 acc 30.859 (30.687)	Top-5 acc 52.344 (54.010)	lr 0.00203
Warmup Train [35][2710/3239]	Time 0.507 (0.514)	Data 0.001 (0.011)	Loss 4.0679 (4.0266)	Top-1 acc 30.469 (30.688)	Top-5 acc 54.297 (54.010)	lr 0.00203
Warmup Train [35][2720/3239]	Time 0.421 (0.514)	Data 0.001 (0.011)	Loss 4.0990 (4.0265)	Top-1 acc 27.734 (30.687)	Top-5 acc 52.344 (54.012)	lr 0.00203
Warmup Train [35][2730/3239]	Time 0.570 (0.514)	Data 0.001 (0.011)	Loss 3.9948 (4.0264)	Top-1 acc 34.766 (30.686)	Top-5 acc 53.906 (54.009)	lr 0.00202
Warmup Train [35][2740/3239]	Time 0.474 (0.514)	Data 0.001 (0.011)	Loss 4.1098 (4.0265)	Top-1 acc 27.344 (30.684)	Top-5 acc 50.391 (54.005)	lr 0.00202
Warmup Train [35][2750/3239]	Time 0.456 (0.514)	Data 0.001 (0.011)	Loss 3.9871 (4.0264)	Top-1 acc 29.688 (30.688)	Top-5 acc 53.516 (54.009)	lr 0.00202
Warmup Train [35][2760/3239]	Time 0.656 (0.514)	Data 0.001 (0.011)	Loss 4.0313 (4.0265)	Top-1 acc 30.469 (30.687)	Top-5 acc 54.688 (54.011)	lr 0.00202
Warmup Train [35][2770/3239]	Time 0.520 (0.514)	Data 0.001 (0.011)	Loss 3.9117 (4.0267)	Top-1 acc 33.594 (30.682)	Top-5 acc 53.125 (54.005)	lr 0.00201
Warmup Train [35][2780/3239]	Time 0.446 (0.514)	Data 0.001 (0.011)	Loss 4.0737 (4.0266)	Top-1 acc 29.297 (30.683)	Top-5 acc 50.391 (54.008)	lr 0.00201
Warmup Train [35][2790/3239]	Time 0.618 (0.514)	Data 0.001 (0.011)	Loss 3.9251 (4.0267)	Top-1 acc 32.031 (30.681)	Top-5 acc 54.688 (54.005)	lr 0.00201
Warmup Train [35][2800/3239]	Time 0.517 (0.514)	Data 0.001 (0.011)	Loss 4.0401 (4.0270)	Top-1 acc 28.516 (30.677)	Top-5 acc 53.516 (54.000)	lr 0.00201
Warmup Train [35][2810/3239]	Time 0.456 (0.514)	Data 0.001 (0.011)	Loss 4.0618 (4.0268)	Top-1 acc 28.906 (30.677)	Top-5 acc 53.516 (54.006)	lr 0.00200
Warmup Train [35][2820/3239]	Time 0.397 (0.514)	Data 0.001 (0.011)	Loss 3.9103 (4.0266)	Top-1 acc 28.906 (30.679)	Top-5 acc 51.562 (54.007)	lr 0.00200
Warmup Train [35][2830/3239]	Time 0.395 (0.514)	Data 0.001 (0.011)	Loss 4.0818 (4.0266)	Top-1 acc 26.172 (30.683)	Top-5 acc 60.547 (54.012)	lr 0.00200
Warmup Train [35][2840/3239]	Time 0.393 (0.514)	Data 0.001 (0.011)	Loss 3.9296 (4.0266)	Top-1 acc 29.297 (30.682)	Top-5 acc 56.641 (54.007)	lr 0.00200
Warmup Train [35][2850/3239]	Time 0.567 (0.514)	Data 0.001 (0.011)	Loss 3.7977 (4.0265)	Top-1 acc 36.328 (30.685)	Top-5 acc 58.594 (54.010)	lr 0.00199
Warmup Train [35][2860/3239]	Time 0.533 (0.514)	Data 0.001 (0.011)	Loss 4.1330 (4.0267)	Top-1 acc 26.172 (30.681)	Top-5 acc 45.703 (54.005)	lr 0.00199
Warmup Train [35][2870/3239]	Time 0.668 (0.514)	Data 0.001 (0.011)	Loss 4.1314 (4.0268)	Top-1 acc 28.125 (30.680)	Top-5 acc 50.391 (54.005)	lr 0.00199
Warmup Train [35][2880/3239]	Time 0.483 (0.514)	Data 0.001 (0.011)	Loss 4.0863 (4.0270)	Top-1 acc 27.734 (30.679)	Top-5 acc 52.344 (54.000)	lr 0.00199
Warmup Train [35][2890/3239]	Time 0.641 (0.514)	Data 0.001 (0.011)	Loss 3.8683 (4.0268)	Top-1 acc 34.375 (30.686)	Top-5 acc 60.156 (54.002)	lr 0.00199
Warmup Train [35][2900/3239]	Time 0.548 (0.514)	Data 0.001 (0.011)	Loss 3.9321 (4.0266)	Top-1 acc 28.516 (30.691)	Top-5 acc 53.516 (54.008)	lr 0.00198
Warmup Train [35][2910/3239]	Time 0.428 (0.514)	Data 0.001 (0.011)	Loss 4.1040 (4.0267)	Top-1 acc 31.641 (30.690)	Top-5 acc 55.078 (54.009)	lr 0.00198
Warmup Train [35][2920/3239]	Time 0.585 (0.514)	Data 0.001 (0.011)	Loss 3.8888 (4.0266)	Top-1 acc 34.375 (30.694)	Top-5 acc 58.203 (54.010)	lr 0.00198
Warmup Train [35][2930/3239]	Time 0.534 (0.514)	Data 0.001 (0.011)	Loss 3.7707 (4.0263)	Top-1 acc 33.984 (30.701)	Top-5 acc 60.547 (54.016)	lr 0.00198
Warmup Train [35][2940/3239]	Time 0.574 (0.514)	Data 0.001 (0.011)	Loss 3.9196 (4.0264)	Top-1 acc 32.812 (30.705)	Top-5 acc 57.422 (54.017)	lr 0.00197
Warmup Train [35][2950/3239]	Time 0.712 (0.514)	Data 0.001 (0.011)	Loss 4.1887 (4.0265)	Top-1 acc 32.031 (30.705)	Top-5 acc 52.344 (54.016)	lr 0.00197
Warmup Train [35][2960/3239]	Time 0.391 (0.514)	Data 0.001 (0.011)	Loss 4.2419 (4.0266)	Top-1 acc 28.125 (30.704)	Top-5 acc 52.344 (54.012)	lr 0.00197
Warmup Train [35][2970/3239]	Time 0.454 (0.514)	Data 0.001 (0.011)	Loss 4.1549 (4.0267)	Top-1 acc 31.641 (30.705)	Top-5 acc 54.297 (54.012)	lr 0.00197
Warmup Train [35][2980/3239]	Time 0.525 (0.514)	Data 0.001 (0.011)	Loss 4.1207 (4.0268)	Top-1 acc 29.297 (30.700)	Top-5 acc 50.391 (54.012)	lr 0.00196
Warmup Train [35][2990/3239]	Time 0.495 (0.514)	Data 0.001 (0.011)	Loss 4.0045 (4.0268)	Top-1 acc 29.688 (30.705)	Top-5 acc 55.859 (54.014)	lr 0.00196
Warmup Train [35][3000/3239]	Time 0.433 (0.514)	Data 0.001 (0.011)	Loss 4.0317 (4.0270)	Top-1 acc 31.641 (30.704)	Top-5 acc 52.344 (54.012)	lr 0.00196
Warmup Train [35][3010/3239]	Time 0.531 (0.514)	Data 0.001 (0.011)	Loss 4.1159 (4.0271)	Top-1 acc 31.641 (30.702)	Top-5 acc 53.516 (54.009)	lr 0.00196
Warmup Train [35][3020/3239]	Time 0.504 (0.514)	Data 0.001 (0.011)	Loss 4.0964 (4.0270)	Top-1 acc 28.125 (30.699)	Top-5 acc 50.391 (54.012)	lr 0.00195
Warmup Train [35][3030/3239]	Time 0.545 (0.514)	Data 0.001 (0.011)	Loss 3.9527 (4.0270)	Top-1 acc 32.031 (30.699)	Top-5 acc 54.297 (54.010)	lr 0.00195
Warmup Train [35][3040/3239]	Time 0.583 (0.514)	Data 0.001 (0.011)	Loss 3.9541 (4.0269)	Top-1 acc 28.906 (30.700)	Top-5 acc 57.031 (54.014)	lr 0.00195
Warmup Train [35][3050/3239]	Time 0.555 (0.514)	Data 0.001 (0.011)	Loss 3.8466 (4.0266)	Top-1 acc 35.156 (30.706)	Top-5 acc 57.422 (54.021)	lr 0.00195
Warmup Train [35][3060/3239]	Time 0.523 (0.514)	Data 0.001 (0.011)	Loss 3.9955 (4.0265)	Top-1 acc 30.078 (30.705)	Top-5 acc 54.297 (54.025)	lr 0.00194
Warmup Train [35][3070/3239]	Time 0.590 (0.514)	Data 0.001 (0.011)	Loss 4.1692 (4.0266)	Top-1 acc 28.125 (30.702)	Top-5 acc 51.953 (54.021)	lr 0.00194
Warmup Train [35][3080/3239]	Time 0.310 (0.514)	Data 0.001 (0.011)	Loss 4.1436 (4.0266)	Top-1 acc 29.688 (30.700)	Top-5 acc 50.781 (54.023)	lr 0.00194
Warmup Train [35][3090/3239]	Time 0.535 (0.514)	Data 0.001 (0.011)	Loss 4.0777 (4.0267)	Top-1 acc 32.422 (30.701)	Top-5 acc 51.953 (54.022)	lr 0.00194
Warmup Train [35][3100/3239]	Time 0.575 (0.513)	Data 0.001 (0.011)	Loss 4.0234 (4.0267)	Top-1 acc 34.375 (30.705)	Top-5 acc 54.688 (54.021)	lr 0.00194
Warmup Train [35][3110/3239]	Time 0.174 (0.513)	Data 0.001 (0.011)	Loss 4.2239 (4.0267)	Top-1 acc 28.906 (30.705)	Top-5 acc 52.734 (54.022)	lr 0.00193
Warmup Train [35][3120/3239]	Time 0.644 (0.513)	Data 0.001 (0.011)	Loss 4.0649 (4.0267)	Top-1 acc 33.984 (30.705)	Top-5 acc 53.125 (54.019)	lr 0.00193
Warmup Train [35][3130/3239]	Time 0.378 (0.513)	Data 0.001 (0.011)	Loss 4.1553 (4.0265)	Top-1 acc 25.391 (30.707)	Top-5 acc 52.734 (54.027)	lr 0.00193
Warmup Train [35][3140/3239]	Time 0.507 (0.513)	Data 0.001 (0.011)	Loss 4.1266 (4.0265)	Top-1 acc 31.641 (30.708)	Top-5 acc 52.344 (54.027)	lr 0.00193
Warmup Train [35][3150/3239]	Time 0.458 (0.513)	Data 0.001 (0.011)	Loss 4.0174 (4.0265)	Top-1 acc 33.203 (30.709)	Top-5 acc 57.812 (54.027)	lr 0.00192
Warmup Train [35][3160/3239]	Time 0.606 (0.513)	Data 0.001 (0.011)	Loss 4.0871 (4.0266)	Top-1 acc 30.859 (30.705)	Top-5 acc 55.078 (54.027)	lr 0.00192
Warmup Train [35][3170/3239]	Time 0.540 (0.513)	Data 0.001 (0.011)	Loss 3.9985 (4.0268)	Top-1 acc 30.859 (30.702)	Top-5 acc 53.906 (54.023)	lr 0.00192
Warmup Train [35][3180/3239]	Time 0.610 (0.513)	Data 0.000 (0.011)	Loss 3.9398 (4.0267)	Top-1 acc 29.297 (30.701)	Top-5 acc 55.078 (54.025)	lr 0.00192
Warmup Train [35][3190/3239]	Time 0.663 (0.513)	Data 0.000 (0.011)	Loss 3.9470 (4.0268)	Top-1 acc 34.375 (30.702)	Top-5 acc 55.859 (54.024)	lr 0.00191
Warmup Train [35][3200/3239]	Time 0.534 (0.513)	Data 0.000 (0.011)	Loss 4.1163 (4.0268)	Top-1 acc 30.859 (30.702)	Top-5 acc 53.906 (54.028)	lr 0.00191
Warmup Train [35][3210/3239]	Time 0.514 (0.513)	Data 0.000 (0.011)	Loss 3.9069 (4.0268)	Top-1 acc 30.078 (30.702)	Top-5 acc 55.859 (54.027)	lr 0.00191
Warmup Train [35][3220/3239]	Time 0.472 (0.513)	Data 0.000 (0.010)	Loss 3.9632 (4.0267)	Top-1 acc 33.203 (30.705)	Top-5 acc 55.469 (54.029)	lr 0.00191
Warmup Train [35][3230/3239]	Time 0.380 (0.513)	Data 0.000 (0.010)	Loss 4.1892 (4.0269)	Top-1 acc 24.219 (30.699)	Top-5 acc 51.172 (54.026)	lr 0.00191
Warmup Train [35][3239/3239]	Time 0.329 (0.513)	Data 0.000 (0.010)	Loss 4.2868 (4.0269)	Top-1 acc 30.864 (30.696)	Top-5 acc 45.679 (54.026)	lr 0.00190
==========Warmup Valid [35/40]	loss 2.969	top-1 acc 38.125	top-5 acc 62.958	Train top-1 30.696	top-5 54.026	flops: 442.4M
Warmup Train [36][0/3239]	Time 18.540 (18.540)	Data 16.376 (16.376)	Loss 4.0282 (4.0282)	Top-1 acc 30.859 (30.859)	Top-5 acc 54.297 (54.297)	lr 0.00190
Warmup Train [36][10/3239]	Time 0.643 (2.194)	Data 0.001 (1.490)	Loss 3.8756 (4.0060)	Top-1 acc 29.297 (29.616)	Top-5 acc 56.641 (54.119)	lr 0.00190
Warmup Train [36][20/3239]	Time 0.520 (1.395)	Data 0.001 (0.782)	Loss 4.2489 (4.0347)	Top-1 acc 25.781 (29.725)	Top-5 acc 47.266 (53.646)	lr 0.00190
Warmup Train [36][30/3239]	Time 0.596 (1.106)	Data 0.001 (0.530)	Loss 4.0416 (4.0209)	Top-1 acc 26.953 (30.217)	Top-5 acc 53.906 (54.070)	lr 0.00190
Warmup Train [36][40/3239]	Time 0.621 (0.958)	Data 0.001 (0.404)	Loss 3.9304 (4.0226)	Top-1 acc 32.422 (30.564)	Top-5 acc 58.203 (53.859)	lr 0.00189
Warmup Train [36][50/3239]	Time 0.564 (0.871)	Data 0.001 (0.325)	Loss 3.9280 (4.0233)	Top-1 acc 33.203 (30.507)	Top-5 acc 55.859 (53.960)	lr 0.00189
Warmup Train [36][60/3239]	Time 0.491 (0.810)	Data 0.001 (0.272)	Loss 4.0150 (4.0234)	Top-1 acc 30.859 (30.475)	Top-5 acc 50.781 (53.791)	lr 0.00189
Warmup Train [36][70/3239]	Time 0.574 (0.767)	Data 0.001 (0.234)	Loss 3.9304 (4.0186)	Top-1 acc 31.641 (30.568)	Top-5 acc 55.469 (53.945)	lr 0.00189
Warmup Train [36][80/3239]	Time 0.554 (0.734)	Data 0.001 (0.206)	Loss 4.0975 (4.0282)	Top-1 acc 32.031 (30.459)	Top-5 acc 51.172 (53.689)	lr 0.00188
Warmup Train [36][90/3239]	Time 0.409 (0.708)	Data 0.002 (0.183)	Loss 4.0297 (4.0352)	Top-1 acc 28.125 (30.336)	Top-5 acc 52.344 (53.554)	lr 0.00188
Warmup Train [36][100/3239]	Time 0.324 (0.686)	Data 0.001 (0.166)	Loss 4.3148 (4.0323)	Top-1 acc 25.781 (30.507)	Top-5 acc 46.484 (53.562)	lr 0.00188
Warmup Train [36][110/3239]	Time 0.825 (0.672)	Data 0.001 (0.153)	Loss 3.8005 (4.0340)	Top-1 acc 31.641 (30.455)	Top-5 acc 59.766 (53.554)	lr 0.00188
Warmup Train [36][120/3239]	Time 0.532 (0.660)	Data 0.001 (0.140)	Loss 3.8046 (4.0306)	Top-1 acc 33.594 (30.511)	Top-5 acc 60.156 (53.642)	lr 0.00188
Warmup Train [36][130/3239]	Time 0.653 (0.649)	Data 0.001 (0.130)	Loss 4.0880 (4.0298)	Top-1 acc 29.297 (30.576)	Top-5 acc 49.609 (53.656)	lr 0.00187
Warmup Train [36][140/3239]	Time 0.409 (0.640)	Data 0.001 (0.121)	Loss 3.9986 (4.0269)	Top-1 acc 31.641 (30.638)	Top-5 acc 55.469 (53.784)	lr 0.00187
Warmup Train [36][150/3239]	Time 0.623 (0.630)	Data 0.001 (0.113)	Loss 4.1363 (4.0241)	Top-1 acc 28.125 (30.637)	Top-5 acc 51.953 (53.878)	lr 0.00187
Warmup Train [36][160/3239]	Time 0.540 (0.623)	Data 0.001 (0.106)	Loss 4.0301 (4.0223)	Top-1 acc 27.734 (30.682)	Top-5 acc 51.953 (53.962)	lr 0.00187
Warmup Train [36][170/3239]	Time 0.408 (0.615)	Data 0.001 (0.100)	Loss 4.0131 (4.0221)	Top-1 acc 31.250 (30.729)	Top-5 acc 55.078 (53.970)	lr 0.00186
Warmup Train [36][180/3239]	Time 0.458 (0.610)	Data 0.001 (0.095)	Loss 3.9185 (4.0204)	Top-1 acc 35.547 (30.803)	Top-5 acc 56.250 (53.999)	lr 0.00186
Warmup Train [36][190/3239]	Time 0.525 (0.605)	Data 0.001 (0.091)	Loss 3.9230 (4.0204)	Top-1 acc 32.031 (30.845)	Top-5 acc 57.812 (54.013)	lr 0.00186
Warmup Train [36][200/3239]	Time 0.266 (0.599)	Data 0.001 (0.086)	Loss 4.0292 (4.0206)	Top-1 acc 30.078 (30.842)	Top-5 acc 51.953 (53.980)	lr 0.00186
Warmup Train [36][210/3239]	Time 0.546 (0.595)	Data 0.001 (0.083)	Loss 4.1301 (4.0206)	Top-1 acc 30.469 (30.798)	Top-5 acc 52.734 (54.003)	lr 0.00185
Warmup Train [36][220/3239]	Time 0.493 (0.591)	Data 0.001 (0.079)	Loss 4.0667 (4.0206)	Top-1 acc 31.641 (30.787)	Top-5 acc 53.516 (53.980)	lr 0.00185
Warmup Train [36][230/3239]	Time 0.451 (0.586)	Data 0.002 (0.076)	Loss 3.9985 (4.0195)	Top-1 acc 29.688 (30.839)	Top-5 acc 52.344 (54.033)	lr 0.00185
Warmup Train [36][240/3239]	Time 0.391 (0.582)	Data 0.001 (0.074)	Loss 3.9583 (4.0200)	Top-1 acc 30.859 (30.798)	Top-5 acc 55.078 (54.041)	lr 0.00185
Warmup Train [36][250/3239]	Time 0.580 (0.577)	Data 0.001 (0.071)	Loss 4.0013 (4.0200)	Top-1 acc 32.422 (30.791)	Top-5 acc 55.078 (54.015)	lr 0.00185
Warmup Train [36][260/3239]	Time 0.505 (0.574)	Data 0.001 (0.069)	Loss 3.9952 (4.0217)	Top-1 acc 28.906 (30.735)	Top-5 acc 54.297 (53.974)	lr 0.00184
Warmup Train [36][270/3239]	Time 0.517 (0.573)	Data 0.001 (0.066)	Loss 3.9246 (4.0230)	Top-1 acc 33.594 (30.725)	Top-5 acc 55.469 (53.939)	lr 0.00184
Warmup Train [36][280/3239]	Time 0.561 (0.570)	Data 0.001 (0.064)	Loss 3.9113 (4.0214)	Top-1 acc 32.422 (30.751)	Top-5 acc 60.156 (53.973)	lr 0.00184
Warmup Train [36][290/3239]	Time 0.391 (0.568)	Data 0.001 (0.062)	Loss 3.7251 (4.0207)	Top-1 acc 36.328 (30.776)	Top-5 acc 59.766 (53.984)	lr 0.00184
Warmup Train [36][300/3239]	Time 0.481 (0.566)	Data 0.001 (0.060)	Loss 3.9096 (4.0206)	Top-1 acc 31.641 (30.757)	Top-5 acc 57.031 (53.978)	lr 0.00183
Warmup Train [36][310/3239]	Time 0.696 (0.565)	Data 0.001 (0.058)	Loss 3.8004 (4.0221)	Top-1 acc 33.594 (30.741)	Top-5 acc 59.766 (53.924)	lr 0.00183
Warmup Train [36][320/3239]	Time 0.355 (0.562)	Data 0.001 (0.057)	Loss 4.1456 (4.0224)	Top-1 acc 29.297 (30.738)	Top-5 acc 51.172 (53.932)	lr 0.00183
Warmup Train [36][330/3239]	Time 0.410 (0.561)	Data 0.001 (0.055)	Loss 3.8498 (4.0223)	Top-1 acc 34.766 (30.717)	Top-5 acc 58.203 (53.953)	lr 0.00183
Warmup Train [36][340/3239]	Time 0.326 (0.559)	Data 0.001 (0.054)	Loss 3.9579 (4.0217)	Top-1 acc 30.859 (30.737)	Top-5 acc 55.469 (53.967)	lr 0.00182
Warmup Train [36][350/3239]	Time 0.527 (0.557)	Data 0.001 (0.053)	Loss 4.0031 (4.0207)	Top-1 acc 30.469 (30.737)	Top-5 acc 55.078 (53.996)	lr 0.00182
Warmup Train [36][360/3239]	Time 0.600 (0.555)	Data 0.001 (0.051)	Loss 3.9930 (4.0205)	Top-1 acc 30.859 (30.743)	Top-5 acc 53.125 (53.992)	lr 0.00182
Warmup Train [36][370/3239]	Time 0.360 (0.554)	Data 0.001 (0.050)	Loss 4.0194 (4.0203)	Top-1 acc 28.516 (30.733)	Top-5 acc 54.297 (53.995)	lr 0.00182
Warmup Train [36][380/3239]	Time 0.531 (0.553)	Data 0.001 (0.049)	Loss 4.0880 (4.0203)	Top-1 acc 30.078 (30.738)	Top-5 acc 52.734 (54.012)	lr 0.00182
Warmup Train [36][390/3239]	Time 0.479 (0.552)	Data 0.001 (0.048)	Loss 3.9998 (4.0219)	Top-1 acc 25.781 (30.725)	Top-5 acc 53.125 (54.018)	lr 0.00181
Warmup Train [36][400/3239]	Time 0.351 (0.551)	Data 0.001 (0.047)	Loss 3.9939 (4.0244)	Top-1 acc 30.859 (30.651)	Top-5 acc 52.734 (53.954)	lr 0.00181
Warmup Train [36][410/3239]	Time 0.516 (0.551)	Data 0.001 (0.046)	Loss 3.8988 (4.0241)	Top-1 acc 35.938 (30.646)	Top-5 acc 55.078 (53.958)	lr 0.00181
Warmup Train [36][420/3239]	Time 0.595 (0.550)	Data 0.001 (0.045)	Loss 3.8821 (4.0226)	Top-1 acc 33.984 (30.681)	Top-5 acc 55.859 (53.999)	lr 0.00181
Warmup Train [36][430/3239]	Time 0.567 (0.550)	Data 0.001 (0.044)	Loss 3.9772 (4.0224)	Top-1 acc 33.984 (30.694)	Top-5 acc 57.031 (54.010)	lr 0.00180
Warmup Train [36][440/3239]	Time 0.510 (0.549)	Data 0.001 (0.043)	Loss 4.0460 (4.0220)	Top-1 acc 29.688 (30.707)	Top-5 acc 52.344 (54.007)	lr 0.00180
Warmup Train [36][450/3239]	Time 0.547 (0.548)	Data 0.001 (0.042)	Loss 4.1058 (4.0217)	Top-1 acc 29.297 (30.698)	Top-5 acc 51.172 (54.008)	lr 0.00180
Warmup Train [36][460/3239]	Time 0.493 (0.548)	Data 0.001 (0.041)	Loss 3.9358 (4.0219)	Top-1 acc 36.328 (30.725)	Top-5 acc 57.422 (53.999)	lr 0.00180
Warmup Train [36][470/3239]	Time 0.709 (0.548)	Data 0.001 (0.041)	Loss 3.9970 (4.0214)	Top-1 acc 25.781 (30.713)	Top-5 acc 54.297 (54.012)	lr 0.00180
Warmup Train [36][480/3239]	Time 0.342 (0.547)	Data 0.002 (0.040)	Loss 3.9914 (4.0217)	Top-1 acc 28.125 (30.702)	Top-5 acc 57.812 (54.009)	lr 0.00179
Warmup Train [36][490/3239]	Time 0.437 (0.546)	Data 0.001 (0.040)	Loss 4.0289 (4.0212)	Top-1 acc 29.297 (30.711)	Top-5 acc 50.391 (54.024)	lr 0.00179
Warmup Train [36][500/3239]	Time 0.357 (0.545)	Data 0.001 (0.039)	Loss 4.1741 (4.0217)	Top-1 acc 25.391 (30.712)	Top-5 acc 49.219 (54.015)	lr 0.00179
Warmup Train [36][510/3239]	Time 0.608 (0.544)	Data 0.001 (0.039)	Loss 3.9747 (4.0216)	Top-1 acc 29.688 (30.709)	Top-5 acc 53.906 (54.015)	lr 0.00179
Warmup Train [36][520/3239]	Time 0.272 (0.543)	Data 0.001 (0.038)	Loss 4.0303 (4.0218)	Top-1 acc 31.250 (30.709)	Top-5 acc 49.609 (54.008)	lr 0.00178
Warmup Train [36][530/3239]	Time 0.389 (0.541)	Data 0.001 (0.037)	Loss 3.9266 (4.0209)	Top-1 acc 33.203 (30.709)	Top-5 acc 53.125 (54.006)	lr 0.00178
Warmup Train [36][540/3239]	Time 0.519 (0.541)	Data 0.001 (0.037)	Loss 4.1062 (4.0213)	Top-1 acc 30.078 (30.688)	Top-5 acc 52.344 (54.007)	lr 0.00178
Warmup Train [36][550/3239]	Time 0.529 (0.541)	Data 0.001 (0.036)	Loss 4.1760 (4.0215)	Top-1 acc 29.688 (30.683)	Top-5 acc 50.781 (54.025)	lr 0.00178
Warmup Train [36][560/3239]	Time 0.468 (0.540)	Data 0.001 (0.036)	Loss 3.9722 (4.0208)	Top-1 acc 29.297 (30.680)	Top-5 acc 52.344 (54.047)	lr 0.00178
Warmup Train [36][570/3239]	Time 0.605 (0.540)	Data 0.001 (0.035)	Loss 3.8881 (4.0201)	Top-1 acc 30.859 (30.686)	Top-5 acc 56.641 (54.046)	lr 0.00177
Warmup Train [36][580/3239]	Time 0.522 (0.540)	Data 0.001 (0.035)	Loss 4.0341 (4.0195)	Top-1 acc 28.516 (30.681)	Top-5 acc 52.734 (54.062)	lr 0.00177
Warmup Train [36][590/3239]	Time 0.476 (0.539)	Data 0.001 (0.034)	Loss 4.1234 (4.0189)	Top-1 acc 28.906 (30.693)	Top-5 acc 51.953 (54.071)	lr 0.00177
Warmup Train [36][600/3239]	Time 0.394 (0.538)	Data 0.001 (0.034)	Loss 4.0671 (4.0192)	Top-1 acc 27.734 (30.694)	Top-5 acc 52.734 (54.065)	lr 0.00177
Warmup Train [36][610/3239]	Time 0.798 (0.538)	Data 0.001 (0.033)	Loss 4.0815 (4.0189)	Top-1 acc 30.078 (30.685)	Top-5 acc 55.859 (54.069)	lr 0.00176
Warmup Train [36][620/3239]	Time 0.488 (0.538)	Data 0.001 (0.033)	Loss 3.9443 (4.0196)	Top-1 acc 30.859 (30.674)	Top-5 acc 55.859 (54.050)	lr 0.00176
Warmup Train [36][630/3239]	Time 0.634 (0.538)	Data 0.001 (0.032)	Loss 4.1592 (4.0204)	Top-1 acc 26.953 (30.658)	Top-5 acc 52.344 (54.047)	lr 0.00176
Warmup Train [36][640/3239]	Time 0.467 (0.537)	Data 0.001 (0.032)	Loss 3.9723 (4.0204)	Top-1 acc 31.641 (30.662)	Top-5 acc 54.688 (54.059)	lr 0.00176
Warmup Train [36][650/3239]	Time 0.621 (0.537)	Data 0.001 (0.031)	Loss 4.0389 (4.0207)	Top-1 acc 29.297 (30.655)	Top-5 acc 53.516 (54.056)	lr 0.00176
Warmup Train [36][660/3239]	Time 0.628 (0.537)	Data 0.001 (0.031)	Loss 3.9952 (4.0204)	Top-1 acc 30.859 (30.676)	Top-5 acc 53.906 (54.078)	lr 0.00175
Warmup Train [36][670/3239]	Time 0.460 (0.536)	Data 0.001 (0.031)	Loss 3.7965 (4.0211)	Top-1 acc 41.016 (30.681)	Top-5 acc 60.156 (54.063)	lr 0.00175
Warmup Train [36][680/3239]	Time 0.441 (0.536)	Data 0.001 (0.030)	Loss 4.1589 (4.0217)	Top-1 acc 29.297 (30.676)	Top-5 acc 50.781 (54.050)	lr 0.00175
Warmup Train [36][690/3239]	Time 0.506 (0.536)	Data 0.002 (0.030)	Loss 4.0606 (4.0216)	Top-1 acc 28.906 (30.678)	Top-5 acc 55.078 (54.056)	lr 0.00175
Warmup Train [36][700/3239]	Time 0.545 (0.535)	Data 0.001 (0.029)	Loss 3.9181 (4.0218)	Top-1 acc 32.422 (30.692)	Top-5 acc 54.688 (54.045)	lr 0.00174
Warmup Train [36][710/3239]	Time 0.411 (0.535)	Data 0.001 (0.029)	Loss 4.0452 (4.0211)	Top-1 acc 26.172 (30.713)	Top-5 acc 55.078 (54.066)	lr 0.00174
Warmup Train [36][720/3239]	Time 0.451 (0.535)	Data 0.001 (0.029)	Loss 4.2168 (4.0205)	Top-1 acc 30.469 (30.736)	Top-5 acc 51.172 (54.077)	lr 0.00174
Warmup Train [36][730/3239]	Time 0.601 (0.535)	Data 0.001 (0.029)	Loss 3.9325 (4.0200)	Top-1 acc 33.203 (30.745)	Top-5 acc 56.250 (54.086)	lr 0.00174
Warmup Train [36][740/3239]	Time 0.374 (0.534)	Data 0.001 (0.028)	Loss 4.0225 (4.0196)	Top-1 acc 32.812 (30.757)	Top-5 acc 54.297 (54.098)	lr 0.00174
Warmup Train [36][750/3239]	Time 0.390 (0.534)	Data 0.001 (0.028)	Loss 4.0457 (4.0202)	Top-1 acc 32.031 (30.752)	Top-5 acc 53.125 (54.098)	lr 0.00173
Warmup Train [36][760/3239]	Time 0.396 (0.534)	Data 0.001 (0.028)	Loss 4.0929 (4.0200)	Top-1 acc 31.250 (30.761)	Top-5 acc 52.734 (54.103)	lr 0.00173
Warmup Train [36][770/3239]	Time 0.500 (0.533)	Data 0.003 (0.027)	Loss 4.0058 (4.0198)	Top-1 acc 32.812 (30.767)	Top-5 acc 53.516 (54.115)	lr 0.00173
Warmup Train [36][780/3239]	Time 0.199 (0.532)	Data 0.001 (0.027)	Loss 4.2700 (4.0202)	Top-1 acc 28.125 (30.758)	Top-5 acc 48.438 (54.112)	lr 0.00173
Warmup Train [36][790/3239]	Time 0.599 (0.532)	Data 0.001 (0.027)	Loss 4.0926 (4.0198)	Top-1 acc 25.000 (30.765)	Top-5 acc 52.734 (54.119)	lr 0.00172
Warmup Train [36][800/3239]	Time 0.475 (0.531)	Data 0.001 (0.027)	Loss 3.9060 (4.0199)	Top-1 acc 33.594 (30.755)	Top-5 acc 58.594 (54.121)	lr 0.00172
Warmup Train [36][810/3239]	Time 0.678 (0.530)	Data 0.001 (0.026)	Loss 4.1498 (4.0200)	Top-1 acc 25.391 (30.756)	Top-5 acc 51.172 (54.113)	lr 0.00172
Warmup Train [36][820/3239]	Time 0.432 (0.530)	Data 0.001 (0.026)	Loss 4.1253 (4.0199)	Top-1 acc 28.516 (30.747)	Top-5 acc 49.609 (54.113)	lr 0.00172
Warmup Train [36][830/3239]	Time 0.468 (0.530)	Data 0.001 (0.026)	Loss 4.1034 (4.0200)	Top-1 acc 27.344 (30.744)	Top-5 acc 51.562 (54.107)	lr 0.00172
Warmup Train [36][840/3239]	Time 0.600 (0.530)	Data 0.001 (0.026)	Loss 4.1514 (4.0207)	Top-1 acc 28.516 (30.727)	Top-5 acc 52.344 (54.096)	lr 0.00171
Warmup Train [36][850/3239]	Time 0.476 (0.529)	Data 0.001 (0.026)	Loss 4.0392 (4.0206)	Top-1 acc 29.688 (30.724)	Top-5 acc 53.125 (54.094)	lr 0.00171
Warmup Train [36][860/3239]	Time 0.464 (0.529)	Data 0.001 (0.025)	Loss 3.9489 (4.0204)	Top-1 acc 34.766 (30.738)	Top-5 acc 55.078 (54.086)	lr 0.00171
Warmup Train [36][870/3239]	Time 0.375 (0.529)	Data 0.001 (0.025)	Loss 4.1212 (4.0204)	Top-1 acc 27.344 (30.731)	Top-5 acc 51.562 (54.090)	lr 0.00171
Warmup Train [36][880/3239]	Time 0.651 (0.529)	Data 0.001 (0.025)	Loss 4.0421 (4.0203)	Top-1 acc 28.906 (30.730)	Top-5 acc 55.078 (54.099)	lr 0.00170
Warmup Train [36][890/3239]	Time 0.541 (0.529)	Data 0.001 (0.025)	Loss 4.0917 (4.0204)	Top-1 acc 35.156 (30.730)	Top-5 acc 54.297 (54.092)	lr 0.00170
Warmup Train [36][900/3239]	Time 0.382 (0.529)	Data 0.001 (0.024)	Loss 4.2032 (4.0204)	Top-1 acc 28.516 (30.729)	Top-5 acc 51.562 (54.087)	lr 0.00170
Warmup Train [36][910/3239]	Time 0.530 (0.529)	Data 0.001 (0.024)	Loss 4.0779 (4.0208)	Top-1 acc 28.516 (30.721)	Top-5 acc 54.688 (54.082)	lr 0.00170
Warmup Train [36][920/3239]	Time 0.389 (0.528)	Data 0.001 (0.024)	Loss 3.9064 (4.0207)	Top-1 acc 31.641 (30.729)	Top-5 acc 57.422 (54.084)	lr 0.00170
Warmup Train [36][930/3239]	Time 0.471 (0.528)	Data 0.001 (0.024)	Loss 3.9865 (4.0201)	Top-1 acc 32.422 (30.746)	Top-5 acc 55.078 (54.089)	lr 0.00169
Warmup Train [36][940/3239]	Time 0.487 (0.528)	Data 0.001 (0.024)	Loss 3.9776 (4.0201)	Top-1 acc 30.469 (30.763)	Top-5 acc 52.734 (54.091)	lr 0.00169
Warmup Train [36][950/3239]	Time 0.451 (0.528)	Data 0.001 (0.024)	Loss 3.7969 (4.0196)	Top-1 acc 35.938 (30.774)	Top-5 acc 61.328 (54.107)	lr 0.00169
Warmup Train [36][960/3239]	Time 0.571 (0.528)	Data 0.001 (0.023)	Loss 4.0581 (4.0199)	Top-1 acc 27.734 (30.759)	Top-5 acc 52.734 (54.094)	lr 0.00169
Warmup Train [36][970/3239]	Time 0.488 (0.527)	Data 0.001 (0.023)	Loss 4.0161 (4.0198)	Top-1 acc 32.031 (30.753)	Top-5 acc 54.297 (54.090)	lr 0.00168
Warmup Train [36][980/3239]	Time 0.485 (0.527)	Data 0.001 (0.023)	Loss 3.9032 (4.0200)	Top-1 acc 33.984 (30.769)	Top-5 acc 57.422 (54.094)	lr 0.00168
Warmup Train [36][990/3239]	Time 0.429 (0.527)	Data 0.001 (0.023)	Loss 3.8719 (4.0192)	Top-1 acc 37.891 (30.790)	Top-5 acc 55.469 (54.106)	lr 0.00168
Warmup Train [36][1000/3239]	Time 0.535 (0.527)	Data 0.001 (0.023)	Loss 3.9516 (4.0190)	Top-1 acc 33.984 (30.793)	Top-5 acc 54.688 (54.111)	lr 0.00168
Warmup Train [36][1010/3239]	Time 0.563 (0.527)	Data 0.001 (0.023)	Loss 3.9957 (4.0190)	Top-1 acc 30.469 (30.789)	Top-5 acc 54.688 (54.112)	lr 0.00168
Warmup Train [36][1020/3239]	Time 0.703 (0.527)	Data 0.001 (0.022)	Loss 4.1170 (4.0188)	Top-1 acc 27.734 (30.781)	Top-5 acc 49.219 (54.117)	lr 0.00167
Warmup Train [36][1030/3239]	Time 0.477 (0.527)	Data 0.002 (0.022)	Loss 3.9229 (4.0186)	Top-1 acc 28.906 (30.776)	Top-5 acc 57.422 (54.129)	lr 0.00167
Warmup Train [36][1040/3239]	Time 0.520 (0.527)	Data 0.001 (0.022)	Loss 4.0471 (4.0179)	Top-1 acc 30.078 (30.789)	Top-5 acc 56.641 (54.153)	lr 0.00167
Warmup Train [36][1050/3239]	Time 0.541 (0.526)	Data 0.001 (0.022)	Loss 4.1449 (4.0179)	Top-1 acc 29.297 (30.796)	Top-5 acc 51.562 (54.157)	lr 0.00167
Warmup Train [36][1060/3239]	Time 0.358 (0.526)	Data 0.001 (0.022)	Loss 4.2721 (4.0182)	Top-1 acc 23.828 (30.784)	Top-5 acc 45.312 (54.158)	lr 0.00166
Warmup Train [36][1070/3239]	Time 0.581 (0.526)	Data 0.001 (0.021)	Loss 3.8530 (4.0185)	Top-1 acc 37.109 (30.784)	Top-5 acc 59.375 (54.155)	lr 0.00166
Warmup Train [36][1080/3239]	Time 0.446 (0.525)	Data 0.002 (0.021)	Loss 3.9724 (4.0184)	Top-1 acc 31.250 (30.791)	Top-5 acc 51.953 (54.153)	lr 0.00166
Warmup Train [36][1090/3239]	Time 0.425 (0.525)	Data 0.002 (0.021)	Loss 4.0202 (4.0180)	Top-1 acc 31.250 (30.790)	Top-5 acc 53.906 (54.159)	lr 0.00166
Warmup Train [36][1100/3239]	Time 0.477 (0.525)	Data 0.001 (0.021)	Loss 4.0105 (4.0171)	Top-1 acc 33.203 (30.798)	Top-5 acc 55.469 (54.185)	lr 0.00166
Warmup Train [36][1110/3239]	Time 0.577 (0.525)	Data 0.001 (0.021)	Loss 3.7058 (4.0168)	Top-1 acc 39.062 (30.809)	Top-5 acc 60.156 (54.195)	lr 0.00165
Warmup Train [36][1120/3239]	Time 0.428 (0.525)	Data 0.001 (0.021)	Loss 3.9300 (4.0166)	Top-1 acc 30.078 (30.813)	Top-5 acc 55.859 (54.194)	lr 0.00165
Warmup Train [36][1130/3239]	Time 0.369 (0.524)	Data 0.001 (0.021)	Loss 4.0501 (4.0167)	Top-1 acc 32.031 (30.808)	Top-5 acc 52.344 (54.189)	lr 0.00165
Warmup Train [36][1140/3239]	Time 0.505 (0.524)	Data 0.002 (0.020)	Loss 3.9730 (4.0169)	Top-1 acc 32.422 (30.801)	Top-5 acc 58.203 (54.193)	lr 0.00165
Warmup Train [36][1150/3239]	Time 0.505 (0.524)	Data 0.001 (0.020)	Loss 4.2843 (4.0174)	Top-1 acc 28.125 (30.802)	Top-5 acc 49.609 (54.186)	lr 0.00165
Warmup Train [36][1160/3239]	Time 0.637 (0.524)	Data 0.001 (0.020)	Loss 4.0439 (4.0173)	Top-1 acc 33.594 (30.815)	Top-5 acc 53.125 (54.194)	lr 0.00164
Warmup Train [36][1170/3239]	Time 0.444 (0.524)	Data 0.001 (0.020)	Loss 4.0309 (4.0168)	Top-1 acc 31.250 (30.817)	Top-5 acc 54.688 (54.208)	lr 0.00164
Warmup Train [36][1180/3239]	Time 0.363 (0.524)	Data 0.001 (0.020)	Loss 3.9695 (4.0173)	Top-1 acc 30.469 (30.797)	Top-5 acc 54.688 (54.202)	lr 0.00164
Warmup Train [36][1190/3239]	Time 0.616 (0.524)	Data 0.001 (0.020)	Loss 3.8081 (4.0174)	Top-1 acc 39.062 (30.791)	Top-5 acc 61.328 (54.202)	lr 0.00164
Warmup Train [36][1200/3239]	Time 0.373 (0.524)	Data 0.001 (0.020)	Loss 4.0274 (4.0174)	Top-1 acc 35.156 (30.800)	Top-5 acc 54.688 (54.197)	lr 0.00163
Warmup Train [36][1210/3239]	Time 0.409 (0.524)	Data 0.001 (0.020)	Loss 4.1932 (4.0174)	Top-1 acc 26.953 (30.801)	Top-5 acc 53.516 (54.208)	lr 0.00163
Warmup Train [36][1220/3239]	Time 0.740 (0.524)	Data 0.003 (0.020)	Loss 3.9252 (4.0172)	Top-1 acc 30.469 (30.808)	Top-5 acc 55.078 (54.214)	lr 0.00163
Warmup Train [36][1230/3239]	Time 0.601 (0.523)	Data 0.001 (0.020)	Loss 3.9652 (4.0166)	Top-1 acc 33.203 (30.818)	Top-5 acc 54.688 (54.232)	lr 0.00163
Warmup Train [36][1240/3239]	Time 0.321 (0.523)	Data 0.001 (0.019)	Loss 4.1295 (4.0167)	Top-1 acc 26.172 (30.815)	Top-5 acc 51.172 (54.227)	lr 0.00163
Warmup Train [36][1250/3239]	Time 0.434 (0.523)	Data 0.001 (0.019)	Loss 4.0221 (4.0163)	Top-1 acc 32.031 (30.825)	Top-5 acc 53.125 (54.233)	lr 0.00162
Warmup Train [36][1260/3239]	Time 0.323 (0.523)	Data 0.001 (0.019)	Loss 4.1879 (4.0166)	Top-1 acc 26.172 (30.815)	Top-5 acc 48.828 (54.219)	lr 0.00162
Warmup Train [36][1270/3239]	Time 0.470 (0.523)	Data 0.001 (0.019)	Loss 4.0548 (4.0167)	Top-1 acc 28.516 (30.802)	Top-5 acc 49.609 (54.219)	lr 0.00162
Warmup Train [36][1280/3239]	Time 0.499 (0.523)	Data 0.001 (0.019)	Loss 3.9776 (4.0173)	Top-1 acc 32.422 (30.797)	Top-5 acc 57.422 (54.208)	lr 0.00162
Warmup Train [36][1290/3239]	Time 0.552 (0.523)	Data 0.001 (0.019)	Loss 3.9525 (4.0173)	Top-1 acc 34.375 (30.805)	Top-5 acc 57.812 (54.216)	lr 0.00162
Warmup Train [36][1300/3239]	Time 0.517 (0.523)	Data 0.001 (0.019)	Loss 4.0978 (4.0175)	Top-1 acc 24.609 (30.800)	Top-5 acc 53.125 (54.210)	lr 0.00161
Warmup Train [36][1310/3239]	Time 0.505 (0.523)	Data 0.001 (0.019)	Loss 3.8579 (4.0176)	Top-1 acc 32.422 (30.793)	Top-5 acc 56.641 (54.204)	lr 0.00161
Warmup Train [36][1320/3239]	Time 0.574 (0.523)	Data 0.001 (0.019)	Loss 3.8585 (4.0174)	Top-1 acc 37.109 (30.797)	Top-5 acc 61.328 (54.214)	lr 0.00161
Warmup Train [36][1330/3239]	Time 0.657 (0.523)	Data 0.001 (0.019)	Loss 3.9198 (4.0174)	Top-1 acc 34.766 (30.800)	Top-5 acc 55.469 (54.211)	lr 0.00161
Warmup Train [36][1340/3239]	Time 0.338 (0.522)	Data 0.001 (0.019)	Loss 4.0379 (4.0171)	Top-1 acc 28.906 (30.807)	Top-5 acc 57.031 (54.218)	lr 0.00160
Warmup Train [36][1350/3239]	Time 0.404 (0.522)	Data 0.001 (0.018)	Loss 4.0986 (4.0172)	Top-1 acc 27.734 (30.804)	Top-5 acc 50.000 (54.210)	lr 0.00160
Warmup Train [36][1360/3239]	Time 0.365 (0.522)	Data 0.001 (0.018)	Loss 4.1828 (4.0175)	Top-1 acc 27.344 (30.797)	Top-5 acc 50.781 (54.204)	lr 0.00160
Warmup Train [36][1370/3239]	Time 0.388 (0.521)	Data 0.001 (0.018)	Loss 3.9668 (4.0174)	Top-1 acc 32.422 (30.803)	Top-5 acc 58.203 (54.218)	lr 0.00160
Warmup Train [36][1380/3239]	Time 0.389 (0.521)	Data 0.001 (0.018)	Loss 3.8503 (4.0170)	Top-1 acc 30.469 (30.808)	Top-5 acc 57.812 (54.219)	lr 0.00160
Warmup Train [36][1390/3239]	Time 0.547 (0.521)	Data 0.001 (0.018)	Loss 4.0755 (4.0170)	Top-1 acc 30.859 (30.813)	Top-5 acc 52.734 (54.219)	lr 0.00159
Warmup Train [36][1400/3239]	Time 0.697 (0.521)	Data 0.001 (0.018)	Loss 4.0379 (4.0171)	Top-1 acc 30.859 (30.815)	Top-5 acc 53.125 (54.217)	lr 0.00159
Warmup Train [36][1410/3239]	Time 0.356 (0.521)	Data 0.001 (0.018)	Loss 4.0008 (4.0173)	Top-1 acc 29.688 (30.812)	Top-5 acc 57.031 (54.205)	lr 0.00159
Warmup Train [36][1420/3239]	Time 0.581 (0.521)	Data 0.001 (0.018)	Loss 3.9389 (4.0169)	Top-1 acc 35.156 (30.821)	Top-5 acc 56.641 (54.219)	lr 0.00159
Warmup Train [36][1430/3239]	Time 0.489 (0.521)	Data 0.002 (0.018)	Loss 4.0439 (4.0171)	Top-1 acc 28.906 (30.819)	Top-5 acc 53.516 (54.213)	lr 0.00159
Warmup Train [36][1440/3239]	Time 0.413 (0.521)	Data 0.002 (0.018)	Loss 3.9368 (4.0167)	Top-1 acc 33.594 (30.825)	Top-5 acc 55.078 (54.219)	lr 0.00158
Warmup Train [36][1450/3239]	Time 0.429 (0.521)	Data 0.001 (0.018)	Loss 4.0660 (4.0170)	Top-1 acc 30.859 (30.812)	Top-5 acc 53.125 (54.213)	lr 0.00158
Warmup Train [36][1460/3239]	Time 0.589 (0.521)	Data 0.001 (0.018)	Loss 3.9783 (4.0169)	Top-1 acc 34.375 (30.819)	Top-5 acc 55.078 (54.214)	lr 0.00158
Warmup Train [36][1470/3239]	Time 0.600 (0.521)	Data 0.001 (0.018)	Loss 3.9047 (4.0171)	Top-1 acc 29.688 (30.813)	Top-5 acc 54.688 (54.205)	lr 0.00158
Warmup Train [36][1480/3239]	Time 0.347 (0.520)	Data 0.001 (0.018)	Loss 3.9088 (4.0172)	Top-1 acc 29.297 (30.814)	Top-5 acc 54.688 (54.193)	lr 0.00157
Warmup Train [36][1490/3239]	Time 0.635 (0.520)	Data 0.001 (0.018)	Loss 3.8200 (4.0174)	Top-1 acc 33.594 (30.810)	Top-5 acc 59.375 (54.193)	lr 0.00157
Warmup Train [36][1500/3239]	Time 0.527 (0.520)	Data 0.001 (0.017)	Loss 3.9900 (4.0177)	Top-1 acc 30.859 (30.807)	Top-5 acc 55.859 (54.182)	lr 0.00157
Warmup Train [36][1510/3239]	Time 0.400 (0.520)	Data 0.001 (0.017)	Loss 4.1474 (4.0180)	Top-1 acc 28.906 (30.800)	Top-5 acc 53.906 (54.178)	lr 0.00157
Warmup Train [36][1520/3239]	Time 0.452 (0.520)	Data 0.001 (0.017)	Loss 3.9568 (4.0182)	Top-1 acc 31.250 (30.792)	Top-5 acc 55.078 (54.177)	lr 0.00157
Warmup Train [36][1530/3239]	Time 0.310 (0.520)	Data 0.001 (0.017)	Loss 4.1602 (4.0182)	Top-1 acc 26.172 (30.803)	Top-5 acc 49.219 (54.175)	lr 0.00156
Warmup Train [36][1540/3239]	Time 0.495 (0.520)	Data 0.001 (0.017)	Loss 4.0933 (4.0183)	Top-1 acc 29.297 (30.802)	Top-5 acc 51.953 (54.172)	lr 0.00156
Warmup Train [36][1550/3239]	Time 0.495 (0.520)	Data 0.001 (0.017)	Loss 4.2229 (4.0185)	Top-1 acc 25.781 (30.801)	Top-5 acc 48.438 (54.166)	lr 0.00156
Warmup Train [36][1560/3239]	Time 0.485 (0.520)	Data 0.001 (0.017)	Loss 3.9140 (4.0185)	Top-1 acc 32.031 (30.812)	Top-5 acc 53.906 (54.171)	lr 0.00156
Warmup Train [36][1570/3239]	Time 0.591 (0.520)	Data 0.001 (0.017)	Loss 4.1642 (4.0185)	Top-1 acc 30.078 (30.817)	Top-5 acc 53.125 (54.169)	lr 0.00156
Warmup Train [36][1580/3239]	Time 0.534 (0.520)	Data 0.001 (0.017)	Loss 4.2226 (4.0185)	Top-1 acc 25.000 (30.813)	Top-5 acc 52.344 (54.176)	lr 0.00155
Warmup Train [36][1590/3239]	Time 0.371 (0.520)	Data 0.001 (0.017)	Loss 4.1554 (4.0186)	Top-1 acc 30.859 (30.816)	Top-5 acc 52.734 (54.181)	lr 0.00155
Warmup Train [36][1600/3239]	Time 0.430 (0.520)	Data 0.001 (0.017)	Loss 3.9086 (4.0182)	Top-1 acc 31.250 (30.815)	Top-5 acc 55.859 (54.185)	lr 0.00155
Warmup Train [36][1610/3239]	Time 0.503 (0.520)	Data 0.001 (0.017)	Loss 4.0718 (4.0180)	Top-1 acc 30.078 (30.826)	Top-5 acc 53.516 (54.193)	lr 0.00155
Warmup Train [36][1620/3239]	Time 0.356 (0.520)	Data 0.001 (0.017)	Loss 3.9167 (4.0179)	Top-1 acc 34.375 (30.824)	Top-5 acc 59.375 (54.194)	lr 0.00155
Warmup Train [36][1630/3239]	Time 0.474 (0.519)	Data 0.001 (0.017)	Loss 4.0279 (4.0182)	Top-1 acc 30.469 (30.820)	Top-5 acc 56.641 (54.194)	lr 0.00154
Warmup Train [36][1640/3239]	Time 0.764 (0.519)	Data 0.001 (0.016)	Loss 4.0775 (4.0182)	Top-1 acc 28.906 (30.824)	Top-5 acc 53.516 (54.195)	lr 0.00154
Warmup Train [36][1650/3239]	Time 0.376 (0.519)	Data 0.001 (0.016)	Loss 3.8832 (4.0181)	Top-1 acc 33.984 (30.827)	Top-5 acc 55.859 (54.195)	lr 0.00154
Warmup Train [36][1660/3239]	Time 0.520 (0.519)	Data 0.002 (0.016)	Loss 4.1830 (4.0182)	Top-1 acc 26.953 (30.829)	Top-5 acc 50.781 (54.199)	lr 0.00154
Warmup Train [36][1670/3239]	Time 0.507 (0.519)	Data 0.001 (0.016)	Loss 3.8778 (4.0177)	Top-1 acc 32.031 (30.842)	Top-5 acc 58.594 (54.215)	lr 0.00153
Warmup Train [36][1680/3239]	Time 0.492 (0.519)	Data 0.001 (0.016)	Loss 4.0253 (4.0177)	Top-1 acc 34.375 (30.838)	Top-5 acc 58.203 (54.221)	lr 0.00153
Warmup Train [36][1690/3239]	Time 0.538 (0.519)	Data 0.001 (0.016)	Loss 3.9000 (4.0176)	Top-1 acc 33.594 (30.840)	Top-5 acc 56.641 (54.223)	lr 0.00153
Warmup Train [36][1700/3239]	Time 0.502 (0.519)	Data 0.001 (0.016)	Loss 4.0899 (4.0177)	Top-1 acc 30.078 (30.833)	Top-5 acc 52.734 (54.225)	lr 0.00153
Warmup Train [36][1710/3239]	Time 0.613 (0.518)	Data 0.001 (0.016)	Loss 3.7973 (4.0175)	Top-1 acc 37.109 (30.838)	Top-5 acc 59.766 (54.234)	lr 0.00153
Warmup Train [36][1720/3239]	Time 0.601 (0.518)	Data 0.001 (0.016)	Loss 3.9319 (4.0174)	Top-1 acc 33.984 (30.841)	Top-5 acc 56.250 (54.238)	lr 0.00152
Warmup Train [36][1730/3239]	Time 0.610 (0.518)	Data 0.001 (0.016)	Loss 3.9145 (4.0175)	Top-1 acc 30.078 (30.835)	Top-5 acc 58.203 (54.235)	lr 0.00152
Warmup Train [36][1740/3239]	Time 0.410 (0.518)	Data 0.001 (0.016)	Loss 3.9525 (4.0173)	Top-1 acc 32.812 (30.837)	Top-5 acc 57.031 (54.242)	lr 0.00152
Warmup Train [36][1750/3239]	Time 0.565 (0.518)	Data 0.001 (0.016)	Loss 3.9726 (4.0169)	Top-1 acc 32.812 (30.842)	Top-5 acc 54.297 (54.250)	lr 0.00152
Warmup Train [36][1760/3239]	Time 0.555 (0.518)	Data 0.001 (0.016)	Loss 4.0008 (4.0170)	Top-1 acc 30.859 (30.837)	Top-5 acc 53.906 (54.248)	lr 0.00152
Warmup Train [36][1770/3239]	Time 0.616 (0.518)	Data 0.001 (0.016)	Loss 3.8317 (4.0167)	Top-1 acc 33.203 (30.843)	Top-5 acc 63.281 (54.262)	lr 0.00151
Warmup Train [36][1780/3239]	Time 0.655 (0.518)	Data 0.001 (0.016)	Loss 4.1279 (4.0168)	Top-1 acc 34.766 (30.848)	Top-5 acc 51.562 (54.262)	lr 0.00151
Warmup Train [36][1790/3239]	Time 0.531 (0.518)	Data 0.001 (0.016)	Loss 3.9406 (4.0164)	Top-1 acc 33.594 (30.854)	Top-5 acc 55.469 (54.271)	lr 0.00151
Warmup Train [36][1800/3239]	Time 0.529 (0.518)	Data 0.001 (0.015)	Loss 3.9993 (4.0163)	Top-1 acc 32.422 (30.856)	Top-5 acc 53.906 (54.276)	lr 0.00151
Warmup Train [36][1810/3239]	Time 0.611 (0.518)	Data 0.001 (0.015)	Loss 3.8779 (4.0159)	Top-1 acc 37.109 (30.858)	Top-5 acc 53.516 (54.282)	lr 0.00151
Warmup Train [36][1820/3239]	Time 0.374 (0.518)	Data 0.001 (0.015)	Loss 4.3010 (4.0162)	Top-1 acc 28.906 (30.859)	Top-5 acc 49.219 (54.275)	lr 0.00150
Warmup Train [36][1830/3239]	Time 0.386 (0.518)	Data 0.001 (0.015)	Loss 3.9817 (4.0162)	Top-1 acc 28.516 (30.862)	Top-5 acc 54.297 (54.276)	lr 0.00150
Warmup Train [36][1840/3239]	Time 0.502 (0.518)	Data 0.001 (0.015)	Loss 3.9145 (4.0166)	Top-1 acc 32.812 (30.849)	Top-5 acc 55.469 (54.267)	lr 0.00150
Warmup Train [36][1850/3239]	Time 0.468 (0.518)	Data 0.001 (0.015)	Loss 3.9192 (4.0162)	Top-1 acc 33.984 (30.859)	Top-5 acc 57.422 (54.274)	lr 0.00150
Warmup Train [36][1860/3239]	Time 0.508 (0.518)	Data 0.001 (0.015)	Loss 4.0861 (4.0161)	Top-1 acc 28.125 (30.859)	Top-5 acc 53.906 (54.283)	lr 0.00150
Warmup Train [36][1870/3239]	Time 0.525 (0.518)	Data 0.001 (0.015)	Loss 3.7142 (4.0158)	Top-1 acc 38.672 (30.869)	Top-5 acc 61.719 (54.290)	lr 0.00149
Warmup Train [36][1880/3239]	Time 0.571 (0.518)	Data 0.001 (0.015)	Loss 3.9787 (4.0160)	Top-1 acc 30.078 (30.862)	Top-5 acc 58.594 (54.286)	lr 0.00149
Warmup Train [36][1890/3239]	Time 0.533 (0.518)	Data 0.002 (0.015)	Loss 3.9621 (4.0159)	Top-1 acc 31.250 (30.866)	Top-5 acc 55.469 (54.287)	lr 0.00149
Warmup Train [36][1900/3239]	Time 0.343 (0.518)	Data 0.001 (0.015)	Loss 4.0510 (4.0156)	Top-1 acc 28.125 (30.866)	Top-5 acc 54.688 (54.294)	lr 0.00149
Warmup Train [36][1910/3239]	Time 0.605 (0.517)	Data 0.001 (0.015)	Loss 3.9393 (4.0158)	Top-1 acc 31.641 (30.863)	Top-5 acc 59.375 (54.290)	lr 0.00148
Warmup Train [36][1920/3239]	Time 0.464 (0.517)	Data 0.001 (0.015)	Loss 3.8913 (4.0157)	Top-1 acc 28.125 (30.859)	Top-5 acc 60.938 (54.294)	lr 0.00148
Warmup Train [36][1930/3239]	Time 0.479 (0.517)	Data 0.001 (0.015)	Loss 4.0621 (4.0153)	Top-1 acc 32.422 (30.870)	Top-5 acc 55.469 (54.302)	lr 0.00148
Warmup Train [36][1940/3239]	Time 0.522 (0.517)	Data 0.001 (0.015)	Loss 4.0062 (4.0153)	Top-1 acc 33.984 (30.871)	Top-5 acc 56.641 (54.302)	lr 0.00148
Warmup Train [36][1950/3239]	Time 0.511 (0.517)	Data 0.001 (0.015)	Loss 4.1604 (4.0155)	Top-1 acc 29.688 (30.859)	Top-5 acc 52.344 (54.298)	lr 0.00148
Warmup Train [36][1960/3239]	Time 0.427 (0.517)	Data 0.001 (0.015)	Loss 3.9965 (4.0153)	Top-1 acc 30.859 (30.865)	Top-5 acc 51.562 (54.305)	lr 0.00147
Warmup Train [36][1970/3239]	Time 0.477 (0.517)	Data 0.001 (0.015)	Loss 4.2235 (4.0151)	Top-1 acc 27.734 (30.871)	Top-5 acc 50.000 (54.314)	lr 0.00147
Warmup Train [36][1980/3239]	Time 0.546 (0.517)	Data 0.001 (0.015)	Loss 3.9524 (4.0151)	Top-1 acc 33.594 (30.868)	Top-5 acc 56.250 (54.314)	lr 0.00147
Warmup Train [36][1990/3239]	Time 0.552 (0.517)	Data 0.001 (0.015)	Loss 4.0309 (4.0150)	Top-1 acc 30.469 (30.869)	Top-5 acc 55.859 (54.312)	lr 0.00147
Warmup Train [36][2000/3239]	Time 0.618 (0.517)	Data 0.001 (0.015)	Loss 4.1463 (4.0152)	Top-1 acc 28.516 (30.871)	Top-5 acc 52.734 (54.307)	lr 0.00147
Warmup Train [36][2010/3239]	Time 0.558 (0.517)	Data 0.001 (0.014)	Loss 3.9202 (4.0151)	Top-1 acc 32.031 (30.873)	Top-5 acc 56.250 (54.311)	lr 0.00146
Warmup Train [36][2020/3239]	Time 0.502 (0.517)	Data 0.001 (0.014)	Loss 3.9665 (4.0153)	Top-1 acc 34.375 (30.873)	Top-5 acc 53.125 (54.305)	lr 0.00146
Warmup Train [36][2030/3239]	Time 0.596 (0.517)	Data 0.001 (0.014)	Loss 4.0406 (4.0155)	Top-1 acc 29.688 (30.866)	Top-5 acc 53.125 (54.299)	lr 0.00146
Warmup Train [36][2040/3239]	Time 0.538 (0.517)	Data 0.001 (0.014)	Loss 4.0896 (4.0155)	Top-1 acc 32.031 (30.868)	Top-5 acc 53.516 (54.299)	lr 0.00146
Warmup Train [36][2050/3239]	Time 0.352 (0.517)	Data 0.001 (0.014)	Loss 4.1905 (4.0158)	Top-1 acc 26.562 (30.862)	Top-5 acc 51.172 (54.290)	lr 0.00146
Warmup Train [36][2060/3239]	Time 0.492 (0.517)	Data 0.001 (0.014)	Loss 4.0913 (4.0157)	Top-1 acc 26.953 (30.861)	Top-5 acc 51.953 (54.295)	lr 0.00145
Warmup Train [36][2070/3239]	Time 0.455 (0.517)	Data 0.001 (0.014)	Loss 4.0896 (4.0157)	Top-1 acc 29.688 (30.866)	Top-5 acc 53.906 (54.294)	lr 0.00145
Warmup Train [36][2080/3239]	Time 0.349 (0.517)	Data 0.001 (0.014)	Loss 4.0997 (4.0159)	Top-1 acc 30.469 (30.862)	Top-5 acc 55.078 (54.287)	lr 0.00145
Warmup Train [36][2090/3239]	Time 0.497 (0.517)	Data 0.001 (0.014)	Loss 4.0070 (4.0157)	Top-1 acc 32.031 (30.866)	Top-5 acc 51.953 (54.291)	lr 0.00145
Warmup Train [36][2100/3239]	Time 0.451 (0.517)	Data 0.001 (0.014)	Loss 4.1059 (4.0155)	Top-1 acc 32.422 (30.871)	Top-5 acc 54.297 (54.298)	lr 0.00145
Warmup Train [36][2110/3239]	Time 0.481 (0.517)	Data 0.001 (0.014)	Loss 4.1315 (4.0155)	Top-1 acc 28.906 (30.873)	Top-5 acc 50.781 (54.300)	lr 0.00144
Warmup Train [36][2120/3239]	Time 0.538 (0.517)	Data 0.001 (0.014)	Loss 3.7344 (4.0154)	Top-1 acc 35.156 (30.871)	Top-5 acc 61.328 (54.300)	lr 0.00144
Warmup Train [36][2130/3239]	Time 0.358 (0.517)	Data 0.001 (0.014)	Loss 4.0165 (4.0154)	Top-1 acc 32.031 (30.870)	Top-5 acc 54.688 (54.303)	lr 0.00144
Warmup Train [36][2140/3239]	Time 0.472 (0.517)	Data 0.001 (0.014)	Loss 4.1698 (4.0153)	Top-1 acc 30.469 (30.872)	Top-5 acc 51.172 (54.302)	lr 0.00144
Warmup Train [36][2150/3239]	Time 0.585 (0.517)	Data 0.001 (0.014)	Loss 3.9474 (4.0155)	Top-1 acc 32.031 (30.868)	Top-5 acc 53.516 (54.299)	lr 0.00144
Warmup Train [36][2160/3239]	Time 0.666 (0.517)	Data 0.001 (0.014)	Loss 4.0222 (4.0155)	Top-1 acc 32.031 (30.861)	Top-5 acc 55.859 (54.306)	lr 0.00143
Warmup Train [36][2170/3239]	Time 0.549 (0.517)	Data 0.001 (0.014)	Loss 4.0308 (4.0154)	Top-1 acc 32.031 (30.865)	Top-5 acc 53.906 (54.307)	lr 0.00143
Warmup Train [36][2180/3239]	Time 0.553 (0.517)	Data 0.001 (0.014)	Loss 3.8981 (4.0158)	Top-1 acc 35.938 (30.860)	Top-5 acc 55.859 (54.297)	lr 0.00143
Warmup Train [36][2190/3239]	Time 0.615 (0.517)	Data 0.001 (0.014)	Loss 3.7990 (4.0156)	Top-1 acc 34.375 (30.859)	Top-5 acc 59.766 (54.303)	lr 0.00143
Warmup Train [36][2200/3239]	Time 0.230 (0.516)	Data 0.001 (0.014)	Loss 3.8940 (4.0154)	Top-1 acc 31.641 (30.866)	Top-5 acc 57.031 (54.307)	lr 0.00143
Warmup Train [36][2210/3239]	Time 0.626 (0.516)	Data 0.003 (0.014)	Loss 4.1570 (4.0154)	Top-1 acc 32.812 (30.870)	Top-5 acc 50.391 (54.308)	lr 0.00142
Warmup Train [36][2220/3239]	Time 0.503 (0.516)	Data 0.001 (0.014)	Loss 3.8475 (4.0151)	Top-1 acc 37.109 (30.880)	Top-5 acc 57.422 (54.316)	lr 0.00142
Warmup Train [36][2230/3239]	Time 0.620 (0.516)	Data 0.001 (0.014)	Loss 3.9578 (4.0148)	Top-1 acc 30.078 (30.879)	Top-5 acc 56.250 (54.323)	lr 0.00142
Warmup Train [36][2240/3239]	Time 0.447 (0.516)	Data 0.001 (0.014)	Loss 3.9273 (4.0147)	Top-1 acc 31.641 (30.876)	Top-5 acc 57.812 (54.326)	lr 0.00142
Warmup Train [36][2250/3239]	Time 0.529 (0.516)	Data 0.002 (0.014)	Loss 3.7557 (4.0146)	Top-1 acc 35.938 (30.879)	Top-5 acc 60.156 (54.329)	lr 0.00142
Warmup Train [36][2260/3239]	Time 0.686 (0.516)	Data 0.001 (0.014)	Loss 4.0312 (4.0147)	Top-1 acc 32.812 (30.879)	Top-5 acc 54.688 (54.327)	lr 0.00141
Warmup Train [36][2270/3239]	Time 0.421 (0.516)	Data 0.001 (0.014)	Loss 4.1268 (4.0147)	Top-1 acc 29.297 (30.883)	Top-5 acc 51.172 (54.321)	lr 0.00141
Warmup Train [36][2280/3239]	Time 0.511 (0.516)	Data 0.001 (0.014)	Loss 4.0099 (4.0146)	Top-1 acc 32.422 (30.885)	Top-5 acc 54.688 (54.324)	lr 0.00141
Warmup Train [36][2290/3239]	Time 0.590 (0.516)	Data 0.001 (0.013)	Loss 3.8888 (4.0147)	Top-1 acc 33.203 (30.883)	Top-5 acc 55.859 (54.319)	lr 0.00141
Warmup Train [36][2300/3239]	Time 0.586 (0.516)	Data 0.001 (0.013)	Loss 4.2414 (4.0150)	Top-1 acc 28.125 (30.881)	Top-5 acc 48.438 (54.315)	lr 0.00141
Warmup Train [36][2310/3239]	Time 0.517 (0.516)	Data 0.001 (0.013)	Loss 3.9499 (4.0150)	Top-1 acc 35.938 (30.883)	Top-5 acc 58.203 (54.313)	lr 0.00140
Warmup Train [36][2320/3239]	Time 0.322 (0.516)	Data 0.001 (0.013)	Loss 4.0280 (4.0150)	Top-1 acc 32.031 (30.885)	Top-5 acc 53.125 (54.314)	lr 0.00140
Warmup Train [36][2330/3239]	Time 0.616 (0.516)	Data 0.001 (0.013)	Loss 4.1936 (4.0155)	Top-1 acc 26.953 (30.877)	Top-5 acc 49.609 (54.301)	lr 0.00140
Warmup Train [36][2340/3239]	Time 0.285 (0.516)	Data 0.001 (0.013)	Loss 4.4188 (4.0155)	Top-1 acc 24.219 (30.878)	Top-5 acc 46.484 (54.300)	lr 0.00140
Warmup Train [36][2350/3239]	Time 0.527 (0.516)	Data 0.001 (0.013)	Loss 3.9071 (4.0154)	Top-1 acc 32.812 (30.880)	Top-5 acc 56.641 (54.302)	lr 0.00140
Warmup Train [36][2360/3239]	Time 0.588 (0.516)	Data 0.001 (0.013)	Loss 4.0806 (4.0152)	Top-1 acc 31.641 (30.886)	Top-5 acc 51.953 (54.307)	lr 0.00139
Warmup Train [36][2370/3239]	Time 0.369 (0.516)	Data 0.001 (0.013)	Loss 4.1182 (4.0153)	Top-1 acc 25.391 (30.881)	Top-5 acc 53.906 (54.306)	lr 0.00139
Warmup Train [36][2380/3239]	Time 0.531 (0.516)	Data 0.001 (0.013)	Loss 3.9745 (4.0154)	Top-1 acc 34.766 (30.877)	Top-5 acc 53.906 (54.302)	lr 0.00139
Warmup Train [36][2390/3239]	Time 0.672 (0.516)	Data 0.001 (0.013)	Loss 4.2273 (4.0157)	Top-1 acc 27.344 (30.872)	Top-5 acc 48.828 (54.297)	lr 0.00139
Warmup Train [36][2400/3239]	Time 0.308 (0.516)	Data 0.021 (0.013)	Loss 4.1394 (4.0156)	Top-1 acc 31.250 (30.872)	Top-5 acc 51.953 (54.296)	lr 0.00139
Warmup Train [36][2410/3239]	Time 0.554 (0.516)	Data 0.001 (0.013)	Loss 3.9455 (4.0158)	Top-1 acc 30.859 (30.868)	Top-5 acc 55.469 (54.288)	lr 0.00138
Warmup Train [36][2420/3239]	Time 0.356 (0.516)	Data 0.001 (0.013)	Loss 4.0761 (4.0158)	Top-1 acc 29.688 (30.866)	Top-5 acc 53.516 (54.286)	lr 0.00138
Warmup Train [36][2430/3239]	Time 0.297 (0.516)	Data 0.001 (0.013)	Loss 4.2598 (4.0158)	Top-1 acc 26.172 (30.871)	Top-5 acc 49.219 (54.293)	lr 0.00138
Warmup Train [36][2440/3239]	Time 0.492 (0.516)	Data 0.001 (0.013)	Loss 4.0060 (4.0158)	Top-1 acc 33.594 (30.874)	Top-5 acc 53.125 (54.291)	lr 0.00138
Warmup Train [36][2450/3239]	Time 0.350 (0.516)	Data 0.001 (0.013)	Loss 4.0092 (4.0157)	Top-1 acc 25.000 (30.873)	Top-5 acc 53.125 (54.298)	lr 0.00138
Warmup Train [36][2460/3239]	Time 0.196 (0.516)	Data 0.001 (0.013)	Loss 4.0932 (4.0155)	Top-1 acc 28.125 (30.872)	Top-5 acc 55.469 (54.303)	lr 0.00137
Warmup Train [36][2470/3239]	Time 0.482 (0.515)	Data 0.001 (0.013)	Loss 3.9914 (4.0156)	Top-1 acc 34.766 (30.864)	Top-5 acc 57.812 (54.305)	lr 0.00137
Warmup Train [36][2480/3239]	Time 0.360 (0.515)	Data 0.001 (0.013)	Loss 3.7823 (4.0158)	Top-1 acc 33.984 (30.857)	Top-5 acc 58.203 (54.296)	lr 0.00137
Warmup Train [36][2490/3239]	Time 0.508 (0.515)	Data 0.001 (0.013)	Loss 4.4419 (4.0160)	Top-1 acc 25.000 (30.861)	Top-5 acc 46.484 (54.295)	lr 0.00137
Warmup Train [36][2500/3239]	Time 0.559 (0.515)	Data 0.001 (0.013)	Loss 4.0230 (4.0161)	Top-1 acc 29.297 (30.860)	Top-5 acc 54.297 (54.295)	lr 0.00137
Warmup Train [36][2510/3239]	Time 0.562 (0.515)	Data 0.001 (0.013)	Loss 4.2405 (4.0163)	Top-1 acc 25.391 (30.854)	Top-5 acc 48.047 (54.287)	lr 0.00136
Warmup Train [36][2520/3239]	Time 0.534 (0.515)	Data 0.001 (0.013)	Loss 4.0005 (4.0161)	Top-1 acc 32.422 (30.853)	Top-5 acc 51.953 (54.292)	lr 0.00136
Warmup Train [36][2530/3239]	Time 0.530 (0.515)	Data 0.001 (0.013)	Loss 3.9647 (4.0161)	Top-1 acc 32.422 (30.852)	Top-5 acc 57.031 (54.293)	lr 0.00136
Warmup Train [36][2540/3239]	Time 0.524 (0.515)	Data 0.001 (0.013)	Loss 4.0210 (4.0165)	Top-1 acc 30.859 (30.847)	Top-5 acc 54.688 (54.283)	lr 0.00136
Warmup Train [36][2550/3239]	Time 0.498 (0.515)	Data 0.001 (0.013)	Loss 4.0457 (4.0166)	Top-1 acc 32.422 (30.847)	Top-5 acc 56.250 (54.283)	lr 0.00136
Warmup Train [36][2560/3239]	Time 0.407 (0.515)	Data 0.001 (0.013)	Loss 3.9321 (4.0164)	Top-1 acc 31.641 (30.850)	Top-5 acc 58.984 (54.287)	lr 0.00135
Warmup Train [36][2570/3239]	Time 0.523 (0.515)	Data 0.001 (0.013)	Loss 3.9516 (4.0163)	Top-1 acc 33.594 (30.851)	Top-5 acc 53.516 (54.287)	lr 0.00135
Warmup Train [36][2580/3239]	Time 0.708 (0.515)	Data 0.001 (0.013)	Loss 3.9643 (4.0169)	Top-1 acc 30.078 (30.844)	Top-5 acc 56.641 (54.274)	lr 0.00135
Warmup Train [36][2590/3239]	Time 0.698 (0.515)	Data 0.001 (0.013)	Loss 3.8907 (4.0169)	Top-1 acc 30.859 (30.845)	Top-5 acc 58.984 (54.277)	lr 0.00135
Warmup Train [36][2600/3239]	Time 0.526 (0.515)	Data 0.001 (0.013)	Loss 4.0515 (4.0169)	Top-1 acc 28.516 (30.843)	Top-5 acc 54.688 (54.276)	lr 0.00135
Warmup Train [36][2610/3239]	Time 0.505 (0.515)	Data 0.001 (0.013)	Loss 4.1748 (4.0169)	Top-1 acc 30.469 (30.846)	Top-5 acc 52.344 (54.276)	lr 0.00134
Warmup Train [36][2620/3239]	Time 0.553 (0.515)	Data 0.001 (0.013)	Loss 4.1380 (4.0171)	Top-1 acc 25.391 (30.841)	Top-5 acc 50.781 (54.271)	lr 0.00134
Warmup Train [36][2630/3239]	Time 0.420 (0.515)	Data 0.001 (0.013)	Loss 4.0804 (4.0171)	Top-1 acc 28.906 (30.837)	Top-5 acc 56.250 (54.268)	lr 0.00134
Warmup Train [36][2640/3239]	Time 0.507 (0.515)	Data 0.001 (0.013)	Loss 4.0915 (4.0174)	Top-1 acc 30.469 (30.832)	Top-5 acc 52.344 (54.266)	lr 0.00134
Warmup Train [36][2650/3239]	Time 0.533 (0.515)	Data 0.001 (0.013)	Loss 4.1558 (4.0175)	Top-1 acc 26.562 (30.828)	Top-5 acc 46.875 (54.262)	lr 0.00134
Warmup Train [36][2660/3239]	Time 0.354 (0.515)	Data 0.001 (0.013)	Loss 4.1832 (4.0175)	Top-1 acc 26.562 (30.825)	Top-5 acc 52.344 (54.267)	lr 0.00133
Warmup Train [36][2670/3239]	Time 0.548 (0.515)	Data 0.001 (0.013)	Loss 4.0424 (4.0175)	Top-1 acc 29.688 (30.827)	Top-5 acc 55.859 (54.270)	lr 0.00133
Warmup Train [36][2680/3239]	Time 0.614 (0.515)	Data 0.001 (0.013)	Loss 4.0420 (4.0176)	Top-1 acc 26.953 (30.821)	Top-5 acc 55.078 (54.267)	lr 0.00133
Warmup Train [36][2690/3239]	Time 0.540 (0.515)	Data 0.001 (0.013)	Loss 4.1481 (4.0176)	Top-1 acc 28.125 (30.824)	Top-5 acc 48.438 (54.270)	lr 0.00133
Warmup Train [36][2700/3239]	Time 0.480 (0.515)	Data 0.001 (0.012)	Loss 3.8700 (4.0176)	Top-1 acc 33.203 (30.820)	Top-5 acc 54.297 (54.264)	lr 0.00133
Warmup Train [36][2710/3239]	Time 0.522 (0.515)	Data 0.001 (0.012)	Loss 4.1196 (4.0177)	Top-1 acc 28.125 (30.822)	Top-5 acc 52.344 (54.262)	lr 0.00132
Warmup Train [36][2720/3239]	Time 0.584 (0.515)	Data 0.001 (0.012)	Loss 3.9737 (4.0179)	Top-1 acc 29.297 (30.815)	Top-5 acc 53.516 (54.254)	lr 0.00132
Warmup Train [36][2730/3239]	Time 0.496 (0.515)	Data 0.001 (0.012)	Loss 4.1415 (4.0180)	Top-1 acc 31.250 (30.813)	Top-5 acc 50.781 (54.251)	lr 0.00132
Warmup Train [36][2740/3239]	Time 0.481 (0.515)	Data 0.001 (0.012)	Loss 4.0223 (4.0178)	Top-1 acc 30.859 (30.814)	Top-5 acc 51.953 (54.254)	lr 0.00132
Warmup Train [36][2750/3239]	Time 0.547 (0.515)	Data 0.001 (0.012)	Loss 4.0128 (4.0180)	Top-1 acc 30.078 (30.812)	Top-5 acc 54.688 (54.251)	lr 0.00132
Warmup Train [36][2760/3239]	Time 0.417 (0.515)	Data 0.001 (0.012)	Loss 3.9129 (4.0180)	Top-1 acc 32.031 (30.814)	Top-5 acc 57.422 (54.248)	lr 0.00132
Warmup Train [36][2770/3239]	Time 0.732 (0.515)	Data 0.001 (0.012)	Loss 3.7404 (4.0177)	Top-1 acc 38.672 (30.821)	Top-5 acc 59.766 (54.255)	lr 0.00131
Warmup Train [36][2780/3239]	Time 0.666 (0.515)	Data 0.001 (0.012)	Loss 4.1537 (4.0177)	Top-1 acc 25.391 (30.822)	Top-5 acc 49.219 (54.254)	lr 0.00131
Warmup Train [36][2790/3239]	Time 0.613 (0.515)	Data 0.001 (0.012)	Loss 4.0100 (4.0175)	Top-1 acc 32.422 (30.826)	Top-5 acc 55.859 (54.260)	lr 0.00131
Warmup Train [36][2800/3239]	Time 0.512 (0.515)	Data 0.001 (0.012)	Loss 3.7860 (4.0173)	Top-1 acc 37.109 (30.834)	Top-5 acc 57.812 (54.263)	lr 0.00131
Warmup Train [36][2810/3239]	Time 0.648 (0.515)	Data 0.001 (0.012)	Loss 4.1093 (4.0173)	Top-1 acc 25.391 (30.839)	Top-5 acc 53.906 (54.265)	lr 0.00131
Warmup Train [36][2820/3239]	Time 0.505 (0.515)	Data 0.001 (0.012)	Loss 3.9407 (4.0174)	Top-1 acc 34.375 (30.840)	Top-5 acc 53.906 (54.263)	lr 0.00130
Warmup Train [36][2830/3239]	Time 0.581 (0.515)	Data 0.001 (0.012)	Loss 4.0885 (4.0174)	Top-1 acc 26.562 (30.839)	Top-5 acc 51.562 (54.265)	lr 0.00130
Warmup Train [36][2840/3239]	Time 0.591 (0.515)	Data 0.002 (0.012)	Loss 3.8914 (4.0172)	Top-1 acc 33.594 (30.843)	Top-5 acc 57.031 (54.264)	lr 0.00130
Warmup Train [36][2850/3239]	Time 0.489 (0.515)	Data 0.001 (0.012)	Loss 3.8526 (4.0173)	Top-1 acc 32.812 (30.840)	Top-5 acc 57.031 (54.264)	lr 0.00130
Warmup Train [36][2860/3239]	Time 0.583 (0.515)	Data 0.001 (0.012)	Loss 3.9648 (4.0173)	Top-1 acc 32.422 (30.841)	Top-5 acc 53.906 (54.259)	lr 0.00130
Warmup Train [36][2870/3239]	Time 0.460 (0.515)	Data 0.001 (0.012)	Loss 3.9970 (4.0171)	Top-1 acc 33.984 (30.843)	Top-5 acc 52.734 (54.265)	lr 0.00129
Warmup Train [36][2880/3239]	Time 0.548 (0.515)	Data 0.001 (0.012)	Loss 4.0380 (4.0170)	Top-1 acc 32.422 (30.848)	Top-5 acc 56.250 (54.267)	lr 0.00129
Warmup Train [36][2890/3239]	Time 0.559 (0.515)	Data 0.001 (0.012)	Loss 4.1200 (4.0167)	Top-1 acc 31.641 (30.855)	Top-5 acc 52.344 (54.273)	lr 0.00129
Warmup Train [36][2900/3239]	Time 0.509 (0.515)	Data 0.001 (0.012)	Loss 4.0192 (4.0167)	Top-1 acc 32.422 (30.858)	Top-5 acc 53.906 (54.274)	lr 0.00129
Warmup Train [36][2910/3239]	Time 0.388 (0.515)	Data 0.001 (0.012)	Loss 3.9344 (4.0168)	Top-1 acc 32.812 (30.854)	Top-5 acc 56.250 (54.272)	lr 0.00129
Warmup Train [36][2920/3239]	Time 0.525 (0.515)	Data 0.001 (0.012)	Loss 4.1114 (4.0167)	Top-1 acc 29.688 (30.858)	Top-5 acc 50.391 (54.273)	lr 0.00128
Warmup Train [36][2930/3239]	Time 0.552 (0.515)	Data 0.001 (0.012)	Loss 3.9747 (4.0168)	Top-1 acc 33.203 (30.858)	Top-5 acc 56.641 (54.274)	lr 0.00128
Warmup Train [36][2940/3239]	Time 0.534 (0.515)	Data 0.001 (0.012)	Loss 3.8423 (4.0167)	Top-1 acc 31.641 (30.860)	Top-5 acc 57.812 (54.277)	lr 0.00128
Warmup Train [36][2950/3239]	Time 0.546 (0.515)	Data 0.001 (0.012)	Loss 4.0042 (4.0168)	Top-1 acc 28.906 (30.860)	Top-5 acc 55.859 (54.277)	lr 0.00128
Warmup Train [36][2960/3239]	Time 0.398 (0.515)	Data 0.001 (0.012)	Loss 3.9940 (4.0169)	Top-1 acc 30.859 (30.859)	Top-5 acc 53.906 (54.274)	lr 0.00128
Warmup Train [36][2970/3239]	Time 0.642 (0.515)	Data 0.001 (0.012)	Loss 3.9452 (4.0169)	Top-1 acc 29.297 (30.863)	Top-5 acc 53.516 (54.275)	lr 0.00127
Warmup Train [36][2980/3239]	Time 0.500 (0.515)	Data 0.001 (0.012)	Loss 3.9862 (4.0168)	Top-1 acc 34.766 (30.866)	Top-5 acc 55.469 (54.275)	lr 0.00127
Warmup Train [36][2990/3239]	Time 0.491 (0.515)	Data 0.001 (0.012)	Loss 3.9974 (4.0168)	Top-1 acc 30.469 (30.865)	Top-5 acc 54.688 (54.276)	lr 0.00127
Warmup Train [36][3000/3239]	Time 0.474 (0.515)	Data 0.001 (0.012)	Loss 4.1030 (4.0166)	Top-1 acc 28.906 (30.869)	Top-5 acc 49.609 (54.278)	lr 0.00127
Warmup Train [36][3010/3239]	Time 0.408 (0.515)	Data 0.001 (0.012)	Loss 4.0895 (4.0167)	Top-1 acc 28.906 (30.865)	Top-5 acc 54.297 (54.275)	lr 0.00127
Warmup Train [36][3020/3239]	Time 0.459 (0.515)	Data 0.001 (0.012)	Loss 4.1687 (4.0168)	Top-1 acc 26.172 (30.865)	Top-5 acc 49.609 (54.274)	lr 0.00127
Warmup Train [36][3030/3239]	Time 0.439 (0.515)	Data 0.001 (0.012)	Loss 4.0211 (4.0168)	Top-1 acc 28.516 (30.861)	Top-5 acc 55.078 (54.274)	lr 0.00126
Warmup Train [36][3040/3239]	Time 0.528 (0.514)	Data 0.001 (0.012)	Loss 4.1328 (4.0170)	Top-1 acc 32.031 (30.861)	Top-5 acc 53.906 (54.272)	lr 0.00126
Warmup Train [36][3050/3239]	Time 0.525 (0.514)	Data 0.001 (0.012)	Loss 4.0940 (4.0170)	Top-1 acc 30.859 (30.860)	Top-5 acc 51.562 (54.273)	lr 0.00126
Warmup Train [36][3060/3239]	Time 0.604 (0.514)	Data 0.001 (0.012)	Loss 4.1634 (4.0172)	Top-1 acc 31.250 (30.857)	Top-5 acc 51.953 (54.271)	lr 0.00126
Warmup Train [36][3070/3239]	Time 0.353 (0.515)	Data 0.001 (0.012)	Loss 4.1076 (4.0174)	Top-1 acc 31.641 (30.853)	Top-5 acc 51.562 (54.266)	lr 0.00126
Warmup Train [36][3080/3239]	Time 0.565 (0.515)	Data 0.001 (0.012)	Loss 3.9386 (4.0174)	Top-1 acc 30.469 (30.853)	Top-5 acc 53.906 (54.265)	lr 0.00125
Warmup Train [36][3090/3239]	Time 0.607 (0.515)	Data 0.001 (0.012)	Loss 4.2133 (4.0174)	Top-1 acc 25.781 (30.853)	Top-5 acc 54.297 (54.269)	lr 0.00125
Warmup Train [36][3100/3239]	Time 0.365 (0.515)	Data 0.001 (0.012)	Loss 3.9778 (4.0173)	Top-1 acc 33.203 (30.855)	Top-5 acc 54.688 (54.269)	lr 0.00125
Warmup Train [36][3110/3239]	Time 0.449 (0.515)	Data 0.001 (0.011)	Loss 4.0720 (4.0171)	Top-1 acc 29.688 (30.860)	Top-5 acc 53.516 (54.275)	lr 0.00125
Warmup Train [36][3120/3239]	Time 0.525 (0.515)	Data 0.001 (0.011)	Loss 4.1467 (4.0171)	Top-1 acc 30.078 (30.864)	Top-5 acc 49.609 (54.274)	lr 0.00125
Warmup Train [36][3130/3239]	Time 0.473 (0.515)	Data 0.001 (0.011)	Loss 4.0406 (4.0169)	Top-1 acc 27.344 (30.870)	Top-5 acc 53.516 (54.279)	lr 0.00124
Warmup Train [36][3140/3239]	Time 0.360 (0.515)	Data 0.001 (0.011)	Loss 4.1818 (4.0168)	Top-1 acc 32.422 (30.873)	Top-5 acc 49.609 (54.281)	lr 0.00124
Warmup Train [36][3150/3239]	Time 0.517 (0.515)	Data 0.001 (0.011)	Loss 3.7501 (4.0168)	Top-1 acc 33.203 (30.869)	Top-5 acc 63.281 (54.283)	lr 0.00124
Warmup Train [36][3160/3239]	Time 0.461 (0.515)	Data 0.001 (0.011)	Loss 4.0103 (4.0169)	Top-1 acc 31.250 (30.870)	Top-5 acc 56.250 (54.283)	lr 0.00124
Warmup Train [36][3170/3239]	Time 0.334 (0.515)	Data 0.001 (0.011)	Loss 4.0063 (4.0168)	Top-1 acc 30.859 (30.869)	Top-5 acc 52.344 (54.282)	lr 0.00124
Warmup Train [36][3180/3239]	Time 0.426 (0.515)	Data 0.000 (0.011)	Loss 4.1593 (4.0168)	Top-1 acc 29.297 (30.866)	Top-5 acc 50.781 (54.283)	lr 0.00123
Warmup Train [36][3190/3239]	Time 0.527 (0.515)	Data 0.000 (0.011)	Loss 4.0024 (4.0167)	Top-1 acc 30.078 (30.870)	Top-5 acc 55.469 (54.285)	lr 0.00123
Warmup Train [36][3200/3239]	Time 0.518 (0.515)	Data 0.000 (0.011)	Loss 4.2936 (4.0169)	Top-1 acc 26.172 (30.867)	Top-5 acc 48.047 (54.284)	lr 0.00123
Warmup Train [36][3210/3239]	Time 0.492 (0.515)	Data 0.000 (0.011)	Loss 3.8529 (4.0167)	Top-1 acc 35.547 (30.870)	Top-5 acc 59.375 (54.289)	lr 0.00123
Warmup Train [36][3220/3239]	Time 0.300 (0.514)	Data 0.000 (0.011)	Loss 4.0362 (4.0170)	Top-1 acc 25.781 (30.867)	Top-5 acc 52.734 (54.283)	lr 0.00123
Warmup Train [36][3230/3239]	Time 0.537 (0.514)	Data 0.000 (0.011)	Loss 3.8378 (4.0169)	Top-1 acc 33.203 (30.868)	Top-5 acc 57.031 (54.284)	lr 0.00123
Warmup Train [36][3239/3239]	Time 0.426 (0.514)	Data 0.000 (0.011)	Loss 3.9702 (4.0167)	Top-1 acc 27.160 (30.872)	Top-5 acc 55.556 (54.290)	lr 0.00122
==========Warmup Valid [36/40]	loss 2.959	top-1 acc 38.261	top-5 acc 63.065	Train top-1 30.872	top-5 54.290	flops: 442.4M
Warmup Train [37][0/3239]	Time 16.612 (16.612)	Data 14.449 (14.449)	Loss 4.3182 (4.3182)	Top-1 acc 26.172 (26.172)	Top-5 acc 46.094 (46.094)	lr 0.00122
Warmup Train [37][10/3239]	Time 0.547 (2.035)	Data 0.001 (1.328)	Loss 3.9482 (4.0386)	Top-1 acc 35.156 (30.362)	Top-5 acc 58.594 (54.297)	lr 0.00122
Warmup Train [37][20/3239]	Time 0.466 (1.310)	Data 0.001 (0.696)	Loss 3.9266 (4.0266)	Top-1 acc 27.344 (29.855)	Top-5 acc 58.203 (54.539)	lr 0.00122
Warmup Train [37][30/3239]	Time 0.622 (1.054)	Data 0.001 (0.473)	Loss 4.0113 (4.0158)	Top-1 acc 33.984 (30.330)	Top-5 acc 57.031 (54.599)	lr 0.00122
Warmup Train [37][40/3239]	Time 0.570 (0.926)	Data 0.001 (0.361)	Loss 4.0027 (4.0039)	Top-1 acc 30.859 (30.974)	Top-5 acc 55.469 (54.821)	lr 0.00122
Warmup Train [37][50/3239]	Time 0.387 (0.844)	Data 0.001 (0.291)	Loss 4.0847 (4.0069)	Top-1 acc 28.125 (30.990)	Top-5 acc 52.344 (54.680)	lr 0.00121
Warmup Train [37][60/3239]	Time 0.709 (0.793)	Data 0.001 (0.244)	Loss 3.7216 (4.0035)	Top-1 acc 37.891 (30.981)	Top-5 acc 60.938 (54.745)	lr 0.00121
Warmup Train [37][70/3239]	Time 0.414 (0.753)	Data 0.001 (0.211)	Loss 4.0632 (4.0034)	Top-1 acc 27.344 (30.909)	Top-5 acc 51.562 (54.748)	lr 0.00121
Warmup Train [37][80/3239]	Time 0.493 (0.724)	Data 0.001 (0.186)	Loss 4.3545 (4.0051)	Top-1 acc 29.297 (30.985)	Top-5 acc 46.875 (54.726)	lr 0.00121
Warmup Train [37][90/3239]	Time 0.583 (0.700)	Data 0.001 (0.167)	Loss 4.0093 (4.0066)	Top-1 acc 31.250 (30.988)	Top-5 acc 56.250 (54.718)	lr 0.00121
Warmup Train [37][100/3239]	Time 0.419 (0.677)	Data 0.001 (0.151)	Loss 3.8849 (4.0122)	Top-1 acc 36.719 (30.906)	Top-5 acc 60.938 (54.649)	lr 0.00120
Warmup Train [37][110/3239]	Time 0.490 (0.663)	Data 0.001 (0.138)	Loss 4.0945 (4.0095)	Top-1 acc 26.953 (30.838)	Top-5 acc 52.344 (54.652)	lr 0.00120
Warmup Train [37][120/3239]	Time 0.469 (0.650)	Data 0.001 (0.127)	Loss 3.9753 (4.0128)	Top-1 acc 35.547 (30.827)	Top-5 acc 55.469 (54.516)	lr 0.00120
Warmup Train [37][130/3239]	Time 0.211 (0.636)	Data 0.035 (0.118)	Loss 4.0810 (4.0123)	Top-1 acc 29.688 (30.967)	Top-5 acc 53.516 (54.529)	lr 0.00120
Warmup Train [37][140/3239]	Time 0.614 (0.628)	Data 0.001 (0.111)	Loss 3.8589 (4.0104)	Top-1 acc 35.547 (30.937)	Top-5 acc 57.812 (54.577)	lr 0.00120
Warmup Train [37][150/3239]	Time 0.329 (0.620)	Data 0.001 (0.103)	Loss 3.9655 (4.0058)	Top-1 acc 30.859 (31.022)	Top-5 acc 53.125 (54.633)	lr 0.00120
Warmup Train [37][160/3239]	Time 0.569 (0.612)	Data 0.001 (0.098)	Loss 4.0392 (4.0089)	Top-1 acc 30.078 (30.978)	Top-5 acc 52.344 (54.535)	lr 0.00119
Warmup Train [37][170/3239]	Time 0.494 (0.606)	Data 0.001 (0.093)	Loss 4.0076 (4.0050)	Top-1 acc 33.984 (31.145)	Top-5 acc 55.859 (54.642)	lr 0.00119
Warmup Train [37][180/3239]	Time 0.514 (0.599)	Data 0.001 (0.089)	Loss 4.1545 (4.0022)	Top-1 acc 26.562 (31.151)	Top-5 acc 51.562 (54.735)	lr 0.00119
Warmup Train [37][190/3239]	Time 0.563 (0.595)	Data 0.001 (0.084)	Loss 4.0212 (4.0039)	Top-1 acc 34.375 (31.105)	Top-5 acc 55.078 (54.661)	lr 0.00119
Warmup Train [37][200/3239]	Time 0.718 (0.591)	Data 0.001 (0.080)	Loss 4.0259 (4.0031)	Top-1 acc 31.250 (31.042)	Top-5 acc 57.812 (54.658)	lr 0.00119
Warmup Train [37][210/3239]	Time 0.539 (0.587)	Data 0.002 (0.077)	Loss 4.0970 (4.0060)	Top-1 acc 31.250 (31.015)	Top-5 acc 52.344 (54.612)	lr 0.00118
Warmup Train [37][220/3239]	Time 0.524 (0.584)	Data 0.001 (0.073)	Loss 4.0292 (4.0065)	Top-1 acc 28.906 (31.036)	Top-5 acc 54.297 (54.619)	lr 0.00118
Warmup Train [37][230/3239]	Time 0.585 (0.581)	Data 0.001 (0.070)	Loss 3.9874 (4.0078)	Top-1 acc 28.516 (30.988)	Top-5 acc 57.812 (54.623)	lr 0.00118
Warmup Train [37][240/3239]	Time 0.422 (0.578)	Data 0.001 (0.068)	Loss 4.1306 (4.0094)	Top-1 acc 28.906 (30.937)	Top-5 acc 52.734 (54.629)	lr 0.00118
Warmup Train [37][250/3239]	Time 0.472 (0.575)	Data 0.001 (0.065)	Loss 4.0449 (4.0108)	Top-1 acc 31.250 (30.934)	Top-5 acc 51.953 (54.546)	lr 0.00118
Warmup Train [37][260/3239]	Time 0.498 (0.572)	Data 0.001 (0.063)	Loss 3.7618 (4.0128)	Top-1 acc 31.641 (30.834)	Top-5 acc 62.891 (54.491)	lr 0.00118
Warmup Train [37][270/3239]	Time 0.552 (0.570)	Data 0.001 (0.061)	Loss 4.0381 (4.0135)	Top-1 acc 33.203 (30.849)	Top-5 acc 56.641 (54.487)	lr 0.00117
Warmup Train [37][280/3239]	Time 0.580 (0.568)	Data 0.001 (0.059)	Loss 3.9206 (4.0166)	Top-1 acc 32.422 (30.809)	Top-5 acc 55.859 (54.394)	lr 0.00117
Warmup Train [37][290/3239]	Time 0.415 (0.566)	Data 0.001 (0.057)	Loss 3.8903 (4.0160)	Top-1 acc 32.422 (30.798)	Top-5 acc 58.203 (54.420)	lr 0.00117
Warmup Train [37][300/3239]	Time 0.491 (0.564)	Data 0.001 (0.056)	Loss 4.5048 (4.0160)	Top-1 acc 18.750 (30.794)	Top-5 acc 41.797 (54.424)	lr 0.00117
Warmup Train [37][310/3239]	Time 0.369 (0.562)	Data 0.001 (0.054)	Loss 4.1384 (4.0161)	Top-1 acc 24.609 (30.773)	Top-5 acc 51.172 (54.420)	lr 0.00117
Warmup Train [37][320/3239]	Time 0.593 (0.561)	Data 0.001 (0.053)	Loss 3.9940 (4.0168)	Top-1 acc 32.812 (30.756)	Top-5 acc 54.688 (54.432)	lr 0.00116
Warmup Train [37][330/3239]	Time 0.517 (0.560)	Data 0.001 (0.051)	Loss 3.8644 (4.0147)	Top-1 acc 30.859 (30.786)	Top-5 acc 56.641 (54.462)	lr 0.00116
Warmup Train [37][340/3239]	Time 0.369 (0.559)	Data 0.001 (0.050)	Loss 4.1321 (4.0124)	Top-1 acc 28.516 (30.826)	Top-5 acc 50.781 (54.521)	lr 0.00116
Warmup Train [37][350/3239]	Time 0.447 (0.557)	Data 0.002 (0.049)	Loss 4.1245 (4.0151)	Top-1 acc 26.953 (30.775)	Top-5 acc 53.125 (54.435)	lr 0.00116
Warmup Train [37][360/3239]	Time 0.564 (0.556)	Data 0.001 (0.048)	Loss 3.9528 (4.0150)	Top-1 acc 33.203 (30.776)	Top-5 acc 51.562 (54.412)	lr 0.00116
Warmup Train [37][370/3239]	Time 0.529 (0.554)	Data 0.001 (0.047)	Loss 3.8898 (4.0146)	Top-1 acc 32.812 (30.805)	Top-5 acc 57.812 (54.433)	lr 0.00116
Warmup Train [37][380/3239]	Time 0.601 (0.554)	Data 0.001 (0.046)	Loss 3.8848 (4.0130)	Top-1 acc 32.812 (30.849)	Top-5 acc 58.984 (54.474)	lr 0.00115
Warmup Train [37][390/3239]	Time 0.397 (0.553)	Data 0.001 (0.045)	Loss 4.0485 (4.0135)	Top-1 acc 27.734 (30.833)	Top-5 acc 52.344 (54.443)	lr 0.00115
Warmup Train [37][400/3239]	Time 0.667 (0.552)	Data 0.001 (0.044)	Loss 4.1833 (4.0136)	Top-1 acc 30.859 (30.855)	Top-5 acc 53.906 (54.447)	lr 0.00115
Warmup Train [37][410/3239]	Time 0.302 (0.549)	Data 0.001 (0.043)	Loss 3.9604 (4.0131)	Top-1 acc 31.641 (30.885)	Top-5 acc 59.375 (54.454)	lr 0.00115
Warmup Train [37][420/3239]	Time 0.656 (0.549)	Data 0.001 (0.042)	Loss 4.1188 (4.0136)	Top-1 acc 26.953 (30.856)	Top-5 acc 52.344 (54.453)	lr 0.00115
Warmup Train [37][430/3239]	Time 0.305 (0.547)	Data 0.002 (0.041)	Loss 3.9814 (4.0134)	Top-1 acc 33.984 (30.854)	Top-5 acc 56.250 (54.467)	lr 0.00114
Warmup Train [37][440/3239]	Time 0.308 (0.545)	Data 0.001 (0.041)	Loss 4.1088 (4.0137)	Top-1 acc 26.172 (30.849)	Top-5 acc 50.781 (54.469)	lr 0.00114
Warmup Train [37][450/3239]	Time 0.418 (0.544)	Data 0.001 (0.040)	Loss 4.0689 (4.0134)	Top-1 acc 29.688 (30.867)	Top-5 acc 55.078 (54.464)	lr 0.00114
Warmup Train [37][460/3239]	Time 0.482 (0.543)	Data 0.001 (0.040)	Loss 4.0188 (4.0140)	Top-1 acc 32.422 (30.848)	Top-5 acc 55.469 (54.462)	lr 0.00114
Warmup Train [37][470/3239]	Time 0.588 (0.542)	Data 0.001 (0.039)	Loss 4.0861 (4.0149)	Top-1 acc 28.125 (30.832)	Top-5 acc 54.688 (54.433)	lr 0.00114
Warmup Train [37][480/3239]	Time 0.547 (0.541)	Data 0.001 (0.038)	Loss 3.9275 (4.0136)	Top-1 acc 30.078 (30.855)	Top-5 acc 56.641 (54.458)	lr 0.00114
Warmup Train [37][490/3239]	Time 0.553 (0.541)	Data 0.002 (0.037)	Loss 4.0330 (4.0138)	Top-1 acc 32.031 (30.840)	Top-5 acc 53.906 (54.460)	lr 0.00113
Warmup Train [37][500/3239]	Time 0.657 (0.540)	Data 0.001 (0.037)	Loss 4.0523 (4.0134)	Top-1 acc 27.734 (30.827)	Top-5 acc 52.734 (54.479)	lr 0.00113
Warmup Train [37][510/3239]	Time 0.696 (0.540)	Data 0.001 (0.036)	Loss 4.1561 (4.0140)	Top-1 acc 28.516 (30.847)	Top-5 acc 51.562 (54.457)	lr 0.00113
Warmup Train [37][520/3239]	Time 0.547 (0.539)	Data 0.001 (0.035)	Loss 3.8746 (4.0123)	Top-1 acc 36.328 (30.896)	Top-5 acc 57.812 (54.497)	lr 0.00113
Warmup Train [37][530/3239]	Time 0.401 (0.539)	Data 0.001 (0.035)	Loss 3.7986 (4.0124)	Top-1 acc 32.031 (30.889)	Top-5 acc 58.984 (54.494)	lr 0.00113
Warmup Train [37][540/3239]	Time 0.519 (0.538)	Data 0.001 (0.034)	Loss 3.8503 (4.0116)	Top-1 acc 33.594 (30.903)	Top-5 acc 55.859 (54.494)	lr 0.00112
Warmup Train [37][550/3239]	Time 0.460 (0.537)	Data 0.001 (0.034)	Loss 4.1169 (4.0117)	Top-1 acc 30.078 (30.887)	Top-5 acc 51.172 (54.509)	lr 0.00112
Warmup Train [37][560/3239]	Time 0.548 (0.537)	Data 0.001 (0.033)	Loss 3.9555 (4.0109)	Top-1 acc 34.375 (30.919)	Top-5 acc 55.859 (54.509)	lr 0.00112
Warmup Train [37][570/3239]	Time 0.344 (0.536)	Data 0.001 (0.033)	Loss 4.0714 (4.0119)	Top-1 acc 29.688 (30.900)	Top-5 acc 51.953 (54.471)	lr 0.00112
Warmup Train [37][580/3239]	Time 0.350 (0.536)	Data 0.001 (0.033)	Loss 3.9124 (4.0112)	Top-1 acc 34.375 (30.913)	Top-5 acc 55.078 (54.482)	lr 0.00112
Warmup Train [37][590/3239]	Time 0.584 (0.536)	Data 0.001 (0.032)	Loss 3.9344 (4.0107)	Top-1 acc 29.688 (30.910)	Top-5 acc 57.422 (54.491)	lr 0.00112
Warmup Train [37][600/3239]	Time 0.538 (0.535)	Data 0.001 (0.032)	Loss 3.9711 (4.0115)	Top-1 acc 32.031 (30.892)	Top-5 acc 55.078 (54.472)	lr 0.00111
Warmup Train [37][610/3239]	Time 0.424 (0.534)	Data 0.001 (0.031)	Loss 3.9934 (4.0111)	Top-1 acc 33.594 (30.888)	Top-5 acc 53.906 (54.484)	lr 0.00111
Warmup Train [37][620/3239]	Time 0.415 (0.534)	Data 0.001 (0.031)	Loss 3.9180 (4.0116)	Top-1 acc 31.641 (30.874)	Top-5 acc 56.250 (54.470)	lr 0.00111
Warmup Train [37][630/3239]	Time 0.738 (0.534)	Data 0.001 (0.031)	Loss 3.9896 (4.0120)	Top-1 acc 32.031 (30.873)	Top-5 acc 53.125 (54.466)	lr 0.00111
Warmup Train [37][640/3239]	Time 0.621 (0.533)	Data 0.001 (0.030)	Loss 3.9429 (4.0116)	Top-1 acc 33.203 (30.881)	Top-5 acc 59.766 (54.482)	lr 0.00111
Warmup Train [37][650/3239]	Time 0.520 (0.533)	Data 0.001 (0.030)	Loss 3.9868 (4.0111)	Top-1 acc 32.031 (30.898)	Top-5 acc 56.250 (54.498)	lr 0.00110
Warmup Train [37][660/3239]	Time 0.500 (0.532)	Data 0.001 (0.030)	Loss 4.0302 (4.0116)	Top-1 acc 28.516 (30.895)	Top-5 acc 54.297 (54.486)	lr 0.00110
Warmup Train [37][670/3239]	Time 0.568 (0.532)	Data 0.001 (0.029)	Loss 4.1384 (4.0126)	Top-1 acc 29.688 (30.876)	Top-5 acc 51.172 (54.461)	lr 0.00110
Warmup Train [37][680/3239]	Time 0.670 (0.531)	Data 0.001 (0.029)	Loss 3.8241 (4.0119)	Top-1 acc 33.594 (30.884)	Top-5 acc 57.031 (54.476)	lr 0.00110
Warmup Train [37][690/3239]	Time 0.686 (0.531)	Data 0.001 (0.028)	Loss 3.8615 (4.0127)	Top-1 acc 34.375 (30.865)	Top-5 acc 58.594 (54.453)	lr 0.00110
Warmup Train [37][700/3239]	Time 0.483 (0.530)	Data 0.001 (0.028)	Loss 4.3219 (4.0136)	Top-1 acc 23.438 (30.858)	Top-5 acc 47.266 (54.438)	lr 0.00110
Warmup Train [37][710/3239]	Time 0.510 (0.530)	Data 0.001 (0.028)	Loss 4.2501 (4.0142)	Top-1 acc 29.688 (30.848)	Top-5 acc 51.172 (54.429)	lr 0.00109
Warmup Train [37][720/3239]	Time 0.551 (0.529)	Data 0.001 (0.027)	Loss 3.8354 (4.0143)	Top-1 acc 30.859 (30.837)	Top-5 acc 57.031 (54.421)	lr 0.00109
Warmup Train [37][730/3239]	Time 0.655 (0.529)	Data 0.001 (0.027)	Loss 4.0168 (4.0137)	Top-1 acc 31.250 (30.852)	Top-5 acc 50.781 (54.433)	lr 0.00109
Warmup Train [37][740/3239]	Time 0.375 (0.528)	Data 0.001 (0.027)	Loss 4.0136 (4.0135)	Top-1 acc 30.469 (30.869)	Top-5 acc 53.906 (54.434)	lr 0.00109
Warmup Train [37][750/3239]	Time 0.536 (0.528)	Data 0.001 (0.026)	Loss 3.9491 (4.0141)	Top-1 acc 30.859 (30.871)	Top-5 acc 57.422 (54.408)	lr 0.00109
Warmup Train [37][760/3239]	Time 0.595 (0.527)	Data 0.001 (0.026)	Loss 4.0048 (4.0149)	Top-1 acc 28.906 (30.856)	Top-5 acc 51.562 (54.396)	lr 0.00109
Warmup Train [37][770/3239]	Time 0.457 (0.527)	Data 0.001 (0.026)	Loss 3.8494 (4.0153)	Top-1 acc 37.891 (30.855)	Top-5 acc 58.594 (54.382)	lr 0.00108
Warmup Train [37][780/3239]	Time 0.340 (0.527)	Data 0.001 (0.026)	Loss 4.0693 (4.0150)	Top-1 acc 30.078 (30.847)	Top-5 acc 53.516 (54.391)	lr 0.00108
Warmup Train [37][790/3239]	Time 0.520 (0.526)	Data 0.001 (0.025)	Loss 3.9131 (4.0156)	Top-1 acc 28.125 (30.838)	Top-5 acc 58.203 (54.390)	lr 0.00108
Warmup Train [37][800/3239]	Time 0.499 (0.526)	Data 0.001 (0.025)	Loss 3.9983 (4.0159)	Top-1 acc 30.469 (30.822)	Top-5 acc 55.469 (54.374)	lr 0.00108
Warmup Train [37][810/3239]	Time 0.433 (0.525)	Data 0.001 (0.025)	Loss 4.0466 (4.0162)	Top-1 acc 29.688 (30.810)	Top-5 acc 51.172 (54.356)	lr 0.00108
Warmup Train [37][820/3239]	Time 0.464 (0.525)	Data 0.001 (0.025)	Loss 3.8395 (4.0163)	Top-1 acc 33.594 (30.810)	Top-5 acc 58.594 (54.363)	lr 0.00107
Warmup Train [37][830/3239]	Time 0.590 (0.525)	Data 0.001 (0.024)	Loss 4.1131 (4.0162)	Top-1 acc 28.906 (30.808)	Top-5 acc 55.859 (54.369)	lr 0.00107
Warmup Train [37][840/3239]	Time 0.517 (0.525)	Data 0.001 (0.024)	Loss 4.0166 (4.0164)	Top-1 acc 32.812 (30.806)	Top-5 acc 52.734 (54.367)	lr 0.00107
Warmup Train [37][850/3239]	Time 0.364 (0.525)	Data 0.001 (0.024)	Loss 4.0863 (4.0171)	Top-1 acc 27.734 (30.793)	Top-5 acc 54.297 (54.350)	lr 0.00107
Warmup Train [37][860/3239]	Time 0.336 (0.524)	Data 0.001 (0.024)	Loss 3.7664 (4.0164)	Top-1 acc 35.547 (30.806)	Top-5 acc 61.328 (54.359)	lr 0.00107
Warmup Train [37][870/3239]	Time 0.584 (0.524)	Data 0.001 (0.024)	Loss 4.0086 (4.0162)	Top-1 acc 31.250 (30.801)	Top-5 acc 55.859 (54.369)	lr 0.00107
Warmup Train [37][880/3239]	Time 0.502 (0.524)	Data 0.001 (0.023)	Loss 3.9147 (4.0158)	Top-1 acc 34.766 (30.823)	Top-5 acc 52.734 (54.372)	lr 0.00106
Warmup Train [37][890/3239]	Time 0.438 (0.524)	Data 0.001 (0.023)	Loss 4.2841 (4.0164)	Top-1 acc 25.781 (30.807)	Top-5 acc 49.609 (54.359)	lr 0.00106
Warmup Train [37][900/3239]	Time 0.547 (0.524)	Data 0.001 (0.023)	Loss 4.2289 (4.0174)	Top-1 acc 27.734 (30.797)	Top-5 acc 50.391 (54.346)	lr 0.00106
Warmup Train [37][910/3239]	Time 0.657 (0.524)	Data 0.001 (0.023)	Loss 3.8838 (4.0170)	Top-1 acc 35.547 (30.811)	Top-5 acc 56.250 (54.361)	lr 0.00106
Warmup Train [37][920/3239]	Time 0.645 (0.523)	Data 0.001 (0.023)	Loss 4.1101 (4.0171)	Top-1 acc 30.078 (30.822)	Top-5 acc 51.562 (54.355)	lr 0.00106
Warmup Train [37][930/3239]	Time 0.474 (0.523)	Data 0.001 (0.022)	Loss 3.8441 (4.0166)	Top-1 acc 33.984 (30.835)	Top-5 acc 56.641 (54.374)	lr 0.00106
Warmup Train [37][940/3239]	Time 0.593 (0.523)	Data 0.001 (0.022)	Loss 4.0504 (4.0164)	Top-1 acc 29.297 (30.836)	Top-5 acc 55.859 (54.379)	lr 0.00105
Warmup Train [37][950/3239]	Time 0.594 (0.523)	Data 0.001 (0.022)	Loss 4.1818 (4.0170)	Top-1 acc 26.953 (30.815)	Top-5 acc 50.781 (54.370)	lr 0.00105
Warmup Train [37][960/3239]	Time 0.403 (0.523)	Data 0.001 (0.022)	Loss 4.0585 (4.0168)	Top-1 acc 28.906 (30.808)	Top-5 acc 53.516 (54.371)	lr 0.00105
Warmup Train [37][970/3239]	Time 0.571 (0.523)	Data 0.001 (0.022)	Loss 3.7804 (4.0163)	Top-1 acc 33.594 (30.805)	Top-5 acc 56.641 (54.370)	lr 0.00105
Warmup Train [37][980/3239]	Time 0.633 (0.522)	Data 0.001 (0.022)	Loss 3.9639 (4.0164)	Top-1 acc 34.766 (30.799)	Top-5 acc 55.469 (54.373)	lr 0.00105
Warmup Train [37][990/3239]	Time 0.617 (0.522)	Data 0.001 (0.021)	Loss 3.8186 (4.0161)	Top-1 acc 33.984 (30.783)	Top-5 acc 60.547 (54.378)	lr 0.00105
Warmup Train [37][1000/3239]	Time 0.472 (0.522)	Data 0.001 (0.021)	Loss 4.0403 (4.0171)	Top-1 acc 27.344 (30.760)	Top-5 acc 54.688 (54.341)	lr 0.00104
Warmup Train [37][1010/3239]	Time 0.519 (0.521)	Data 0.001 (0.021)	Loss 4.1597 (4.0166)	Top-1 acc 30.859 (30.772)	Top-5 acc 52.734 (54.348)	lr 0.00104
Warmup Train [37][1020/3239]	Time 0.222 (0.520)	Data 0.002 (0.021)	Loss 3.9070 (4.0161)	Top-1 acc 32.812 (30.781)	Top-5 acc 54.297 (54.360)	lr 0.00104
Warmup Train [37][1030/3239]	Time 0.592 (0.521)	Data 0.001 (0.021)	Loss 3.8942 (4.0164)	Top-1 acc 32.422 (30.783)	Top-5 acc 58.594 (54.359)	lr 0.00104
Warmup Train [37][1040/3239]	Time 0.546 (0.520)	Data 0.001 (0.021)	Loss 4.1509 (4.0160)	Top-1 acc 25.391 (30.800)	Top-5 acc 48.438 (54.371)	lr 0.00104
Warmup Train [37][1050/3239]	Time 0.641 (0.520)	Data 0.001 (0.021)	Loss 3.9152 (4.0160)	Top-1 acc 35.547 (30.795)	Top-5 acc 56.641 (54.376)	lr 0.00103
Warmup Train [37][1060/3239]	Time 0.523 (0.520)	Data 0.001 (0.020)	Loss 4.0058 (4.0161)	Top-1 acc 30.859 (30.790)	Top-5 acc 54.688 (54.377)	lr 0.00103
Warmup Train [37][1070/3239]	Time 0.514 (0.520)	Data 0.001 (0.020)	Loss 4.0802 (4.0162)	Top-1 acc 28.906 (30.785)	Top-5 acc 53.516 (54.381)	lr 0.00103
Warmup Train [37][1080/3239]	Time 0.488 (0.520)	Data 0.001 (0.020)	Loss 3.9929 (4.0164)	Top-1 acc 31.250 (30.778)	Top-5 acc 54.688 (54.373)	lr 0.00103
Warmup Train [37][1090/3239]	Time 0.354 (0.520)	Data 0.001 (0.020)	Loss 3.7575 (4.0159)	Top-1 acc 33.984 (30.786)	Top-5 acc 59.766 (54.390)	lr 0.00103
Warmup Train [37][1100/3239]	Time 0.389 (0.520)	Data 0.001 (0.020)	Loss 3.8829 (4.0159)	Top-1 acc 30.078 (30.787)	Top-5 acc 57.422 (54.395)	lr 0.00103
Warmup Train [37][1110/3239]	Time 0.435 (0.519)	Data 0.001 (0.020)	Loss 4.0387 (4.0157)	Top-1 acc 34.766 (30.804)	Top-5 acc 53.906 (54.395)	lr 0.00102
Warmup Train [37][1120/3239]	Time 0.520 (0.519)	Data 0.002 (0.020)	Loss 4.0251 (4.0158)	Top-1 acc 33.203 (30.802)	Top-5 acc 56.250 (54.391)	lr 0.00102
Warmup Train [37][1130/3239]	Time 0.329 (0.519)	Data 0.001 (0.020)	Loss 4.1094 (4.0160)	Top-1 acc 26.953 (30.806)	Top-5 acc 50.781 (54.380)	lr 0.00102
Warmup Train [37][1140/3239]	Time 0.509 (0.519)	Data 0.001 (0.020)	Loss 3.8984 (4.0153)	Top-1 acc 34.766 (30.824)	Top-5 acc 60.547 (54.393)	lr 0.00102
Warmup Train [37][1150/3239]	Time 0.622 (0.519)	Data 0.001 (0.019)	Loss 3.9558 (4.0152)	Top-1 acc 33.984 (30.829)	Top-5 acc 55.469 (54.397)	lr 0.00102
Warmup Train [37][1160/3239]	Time 0.421 (0.519)	Data 0.001 (0.019)	Loss 3.9744 (4.0152)	Top-1 acc 32.031 (30.837)	Top-5 acc 56.250 (54.402)	lr 0.00102
Warmup Train [37][1170/3239]	Time 0.384 (0.519)	Data 0.001 (0.019)	Loss 3.9848 (4.0153)	Top-1 acc 30.859 (30.831)	Top-5 acc 54.297 (54.395)	lr 0.00101
Warmup Train [37][1180/3239]	Time 0.376 (0.519)	Data 0.001 (0.019)	Loss 4.1730 (4.0149)	Top-1 acc 26.562 (30.839)	Top-5 acc 50.000 (54.399)	lr 0.00101
Warmup Train [37][1190/3239]	Time 0.607 (0.519)	Data 0.001 (0.019)	Loss 4.1194 (4.0149)	Top-1 acc 28.125 (30.837)	Top-5 acc 54.297 (54.401)	lr 0.00101
Warmup Train [37][1200/3239]	Time 0.634 (0.519)	Data 0.001 (0.019)	Loss 4.0660 (4.0154)	Top-1 acc 29.297 (30.829)	Top-5 acc 50.000 (54.379)	lr 0.00101
Warmup Train [37][1210/3239]	Time 0.413 (0.519)	Data 0.001 (0.019)	Loss 4.2305 (4.0155)	Top-1 acc 23.047 (30.818)	Top-5 acc 50.000 (54.379)	lr 0.00101
Warmup Train [37][1220/3239]	Time 0.572 (0.519)	Data 0.001 (0.019)	Loss 4.0227 (4.0154)	Top-1 acc 30.859 (30.833)	Top-5 acc 53.516 (54.383)	lr 0.00101
Warmup Train [37][1230/3239]	Time 0.455 (0.519)	Data 0.001 (0.019)	Loss 4.0640 (4.0154)	Top-1 acc 32.422 (30.836)	Top-5 acc 56.250 (54.385)	lr 0.00100
Warmup Train [37][1240/3239]	Time 0.492 (0.519)	Data 0.001 (0.019)	Loss 4.1323 (4.0152)	Top-1 acc 29.297 (30.836)	Top-5 acc 52.344 (54.383)	lr 0.00100
Warmup Train [37][1250/3239]	Time 0.429 (0.519)	Data 0.001 (0.018)	Loss 4.1648 (4.0153)	Top-1 acc 25.000 (30.828)	Top-5 acc 52.344 (54.375)	lr 0.00100
Warmup Train [37][1260/3239]	Time 0.341 (0.518)	Data 0.001 (0.018)	Loss 4.0443 (4.0150)	Top-1 acc 29.688 (30.836)	Top-5 acc 53.125 (54.384)	lr 0.00100
Warmup Train [37][1270/3239]	Time 0.447 (0.518)	Data 0.001 (0.018)	Loss 3.9968 (4.0146)	Top-1 acc 33.594 (30.845)	Top-5 acc 53.516 (54.390)	lr 0.00100
Warmup Train [37][1280/3239]	Time 0.553 (0.518)	Data 0.001 (0.018)	Loss 3.9051 (4.0145)	Top-1 acc 33.984 (30.845)	Top-5 acc 58.594 (54.396)	lr 0.00100
Warmup Train [37][1290/3239]	Time 0.645 (0.518)	Data 0.001 (0.018)	Loss 3.9118 (4.0144)	Top-1 acc 33.984 (30.855)	Top-5 acc 57.031 (54.396)	lr 0.00099
Warmup Train [37][1300/3239]	Time 0.221 (0.517)	Data 0.001 (0.018)	Loss 3.9225 (4.0139)	Top-1 acc 33.984 (30.867)	Top-5 acc 55.469 (54.407)	lr 0.00099
Warmup Train [37][1310/3239]	Time 0.451 (0.517)	Data 0.001 (0.018)	Loss 3.9969 (4.0140)	Top-1 acc 30.078 (30.859)	Top-5 acc 56.250 (54.399)	lr 0.00099
Warmup Train [37][1320/3239]	Time 0.389 (0.517)	Data 0.001 (0.018)	Loss 3.9897 (4.0139)	Top-1 acc 30.078 (30.861)	Top-5 acc 54.688 (54.402)	lr 0.00099
Warmup Train [37][1330/3239]	Time 0.421 (0.517)	Data 0.001 (0.018)	Loss 4.0877 (4.0142)	Top-1 acc 25.781 (30.858)	Top-5 acc 48.047 (54.391)	lr 0.00099
Warmup Train [37][1340/3239]	Time 0.528 (0.517)	Data 0.001 (0.018)	Loss 4.1756 (4.0144)	Top-1 acc 28.906 (30.863)	Top-5 acc 49.609 (54.385)	lr 0.00099
Warmup Train [37][1350/3239]	Time 0.310 (0.517)	Data 0.001 (0.018)	Loss 4.1620 (4.0143)	Top-1 acc 27.344 (30.872)	Top-5 acc 51.172 (54.390)	lr 0.00098
Warmup Train [37][1360/3239]	Time 0.540 (0.517)	Data 0.001 (0.018)	Loss 4.0646 (4.0141)	Top-1 acc 30.859 (30.879)	Top-5 acc 57.031 (54.393)	lr 0.00098
Warmup Train [37][1370/3239]	Time 0.517 (0.517)	Data 0.001 (0.018)	Loss 3.8999 (4.0138)	Top-1 acc 35.156 (30.896)	Top-5 acc 54.688 (54.391)	lr 0.00098
Warmup Train [37][1380/3239]	Time 0.526 (0.518)	Data 0.001 (0.018)	Loss 3.9977 (4.0135)	Top-1 acc 30.469 (30.902)	Top-5 acc 51.562 (54.394)	lr 0.00098
Warmup Train [37][1390/3239]	Time 0.495 (0.517)	Data 0.001 (0.017)	Loss 3.8799 (4.0134)	Top-1 acc 33.203 (30.910)	Top-5 acc 57.812 (54.393)	lr 0.00098
Warmup Train [37][1400/3239]	Time 0.575 (0.518)	Data 0.001 (0.017)	Loss 3.9714 (4.0131)	Top-1 acc 31.250 (30.916)	Top-5 acc 55.078 (54.391)	lr 0.00098
Warmup Train [37][1410/3239]	Time 0.607 (0.518)	Data 0.001 (0.017)	Loss 3.9251 (4.0132)	Top-1 acc 32.031 (30.917)	Top-5 acc 55.469 (54.382)	lr 0.00097
Warmup Train [37][1420/3239]	Time 0.429 (0.518)	Data 0.001 (0.017)	Loss 4.1072 (4.0133)	Top-1 acc 29.688 (30.910)	Top-5 acc 51.172 (54.376)	lr 0.00097
Warmup Train [37][1430/3239]	Time 0.561 (0.518)	Data 0.001 (0.017)	Loss 3.9128 (4.0133)	Top-1 acc 32.422 (30.905)	Top-5 acc 55.859 (54.377)	lr 0.00097
Warmup Train [37][1440/3239]	Time 0.522 (0.518)	Data 0.001 (0.017)	Loss 4.0334 (4.0135)	Top-1 acc 28.516 (30.900)	Top-5 acc 52.734 (54.368)	lr 0.00097
Warmup Train [37][1450/3239]	Time 0.595 (0.518)	Data 0.001 (0.017)	Loss 3.9494 (4.0135)	Top-1 acc 33.203 (30.903)	Top-5 acc 55.859 (54.370)	lr 0.00097
Warmup Train [37][1460/3239]	Time 0.515 (0.518)	Data 0.001 (0.017)	Loss 3.8515 (4.0131)	Top-1 acc 33.984 (30.912)	Top-5 acc 57.422 (54.382)	lr 0.00097
Warmup Train [37][1470/3239]	Time 0.626 (0.518)	Data 0.001 (0.017)	Loss 3.9624 (4.0130)	Top-1 acc 33.203 (30.921)	Top-5 acc 56.641 (54.375)	lr 0.00096
Warmup Train [37][1480/3239]	Time 0.560 (0.518)	Data 0.001 (0.017)	Loss 4.0375 (4.0129)	Top-1 acc 30.078 (30.919)	Top-5 acc 53.125 (54.377)	lr 0.00096
Warmup Train [37][1490/3239]	Time 0.619 (0.517)	Data 0.001 (0.017)	Loss 3.8284 (4.0128)	Top-1 acc 34.766 (30.915)	Top-5 acc 55.469 (54.383)	lr 0.00096
Warmup Train [37][1500/3239]	Time 0.694 (0.518)	Data 0.001 (0.017)	Loss 3.8848 (4.0129)	Top-1 acc 32.422 (30.916)	Top-5 acc 60.547 (54.389)	lr 0.00096
Warmup Train [37][1510/3239]	Time 0.531 (0.518)	Data 0.001 (0.016)	Loss 3.9908 (4.0126)	Top-1 acc 31.641 (30.922)	Top-5 acc 54.688 (54.404)	lr 0.00096
Warmup Train [37][1520/3239]	Time 0.642 (0.518)	Data 0.001 (0.016)	Loss 4.0618 (4.0128)	Top-1 acc 30.859 (30.917)	Top-5 acc 50.391 (54.400)	lr 0.00096
Warmup Train [37][1530/3239]	Time 0.428 (0.518)	Data 0.001 (0.016)	Loss 3.9756 (4.0125)	Top-1 acc 30.078 (30.922)	Top-5 acc 51.562 (54.405)	lr 0.00095
Warmup Train [37][1540/3239]	Time 0.653 (0.517)	Data 0.001 (0.016)	Loss 3.9807 (4.0124)	Top-1 acc 30.078 (30.926)	Top-5 acc 54.297 (54.408)	lr 0.00095
Warmup Train [37][1550/3239]	Time 0.570 (0.517)	Data 0.001 (0.016)	Loss 3.9692 (4.0126)	Top-1 acc 31.250 (30.924)	Top-5 acc 55.469 (54.398)	lr 0.00095
Warmup Train [37][1560/3239]	Time 0.429 (0.517)	Data 0.001 (0.016)	Loss 3.9827 (4.0122)	Top-1 acc 33.203 (30.932)	Top-5 acc 54.297 (54.412)	lr 0.00095
Warmup Train [37][1570/3239]	Time 0.514 (0.517)	Data 0.001 (0.016)	Loss 3.9744 (4.0123)	Top-1 acc 32.422 (30.932)	Top-5 acc 57.422 (54.407)	lr 0.00095
Warmup Train [37][1580/3239]	Time 0.569 (0.517)	Data 0.001 (0.016)	Loss 3.9652 (4.0119)	Top-1 acc 30.859 (30.941)	Top-5 acc 54.688 (54.418)	lr 0.00095
Warmup Train [37][1590/3239]	Time 0.610 (0.517)	Data 0.001 (0.016)	Loss 4.1504 (4.0120)	Top-1 acc 28.516 (30.939)	Top-5 acc 51.562 (54.407)	lr 0.00094
Warmup Train [37][1600/3239]	Time 0.565 (0.517)	Data 0.001 (0.016)	Loss 3.9126 (4.0122)	Top-1 acc 32.812 (30.937)	Top-5 acc 56.641 (54.405)	lr 0.00094
Warmup Train [37][1610/3239]	Time 0.358 (0.517)	Data 0.001 (0.016)	Loss 3.9309 (4.0122)	Top-1 acc 28.906 (30.942)	Top-5 acc 56.641 (54.414)	lr 0.00094
Warmup Train [37][1620/3239]	Time 0.485 (0.517)	Data 0.001 (0.016)	Loss 4.2176 (4.0121)	Top-1 acc 24.609 (30.945)	Top-5 acc 50.000 (54.416)	lr 0.00094
Warmup Train [37][1630/3239]	Time 0.606 (0.517)	Data 0.001 (0.016)	Loss 4.1136 (4.0124)	Top-1 acc 26.562 (30.942)	Top-5 acc 51.172 (54.409)	lr 0.00094
Warmup Train [37][1640/3239]	Time 0.583 (0.517)	Data 0.002 (0.016)	Loss 3.9325 (4.0124)	Top-1 acc 30.469 (30.938)	Top-5 acc 57.031 (54.410)	lr 0.00094
Warmup Train [37][1650/3239]	Time 0.417 (0.517)	Data 0.001 (0.015)	Loss 4.0703 (4.0128)	Top-1 acc 34.375 (30.939)	Top-5 acc 53.906 (54.402)	lr 0.00093
Warmup Train [37][1660/3239]	Time 0.433 (0.517)	Data 0.001 (0.015)	Loss 4.0904 (4.0125)	Top-1 acc 27.734 (30.943)	Top-5 acc 51.172 (54.408)	lr 0.00093
Warmup Train [37][1670/3239]	Time 0.450 (0.517)	Data 0.001 (0.015)	Loss 3.9408 (4.0126)	Top-1 acc 33.203 (30.940)	Top-5 acc 56.250 (54.404)	lr 0.00093
Warmup Train [37][1680/3239]	Time 0.397 (0.517)	Data 0.001 (0.015)	Loss 3.7752 (4.0123)	Top-1 acc 37.109 (30.951)	Top-5 acc 58.984 (54.406)	lr 0.00093
Warmup Train [37][1690/3239]	Time 0.473 (0.517)	Data 0.001 (0.015)	Loss 4.1753 (4.0125)	Top-1 acc 28.125 (30.950)	Top-5 acc 50.000 (54.402)	lr 0.00093
Warmup Train [37][1700/3239]	Time 0.376 (0.517)	Data 0.001 (0.015)	Loss 4.1537 (4.0128)	Top-1 acc 25.781 (30.944)	Top-5 acc 51.953 (54.394)	lr 0.00093
Warmup Train [37][1710/3239]	Time 0.437 (0.517)	Data 0.001 (0.015)	Loss 3.7690 (4.0129)	Top-1 acc 38.672 (30.943)	Top-5 acc 62.500 (54.391)	lr 0.00092
Warmup Train [37][1720/3239]	Time 0.484 (0.517)	Data 0.003 (0.015)	Loss 3.9346 (4.0127)	Top-1 acc 33.203 (30.949)	Top-5 acc 59.375 (54.400)	lr 0.00092
Warmup Train [37][1730/3239]	Time 0.640 (0.517)	Data 0.001 (0.015)	Loss 3.9616 (4.0128)	Top-1 acc 35.156 (30.949)	Top-5 acc 58.203 (54.402)	lr 0.00092
Warmup Train [37][1740/3239]	Time 0.348 (0.517)	Data 0.001 (0.015)	Loss 4.0276 (4.0129)	Top-1 acc 31.250 (30.953)	Top-5 acc 55.859 (54.406)	lr 0.00092
Warmup Train [37][1750/3239]	Time 0.584 (0.517)	Data 0.001 (0.015)	Loss 4.0462 (4.0128)	Top-1 acc 28.125 (30.946)	Top-5 acc 54.688 (54.407)	lr 0.00092
Warmup Train [37][1760/3239]	Time 0.479 (0.517)	Data 0.001 (0.015)	Loss 4.0996 (4.0133)	Top-1 acc 28.516 (30.935)	Top-5 acc 53.516 (54.392)	lr 0.00092
Warmup Train [37][1770/3239]	Time 0.461 (0.517)	Data 0.001 (0.015)	Loss 3.9427 (4.0135)	Top-1 acc 32.422 (30.933)	Top-5 acc 57.422 (54.388)	lr 0.00091
Warmup Train [37][1780/3239]	Time 0.508 (0.517)	Data 0.001 (0.015)	Loss 4.2294 (4.0136)	Top-1 acc 28.125 (30.937)	Top-5 acc 49.609 (54.390)	lr 0.00091
Warmup Train [37][1790/3239]	Time 0.566 (0.517)	Data 0.001 (0.015)	Loss 3.8157 (4.0134)	Top-1 acc 33.594 (30.938)	Top-5 acc 57.812 (54.396)	lr 0.00091
Warmup Train [37][1800/3239]	Time 0.495 (0.517)	Data 0.001 (0.015)	Loss 3.8776 (4.0131)	Top-1 acc 32.031 (30.939)	Top-5 acc 57.812 (54.410)	lr 0.00091
Warmup Train [37][1810/3239]	Time 0.559 (0.516)	Data 0.001 (0.015)	Loss 4.1044 (4.0132)	Top-1 acc 27.734 (30.934)	Top-5 acc 54.688 (54.410)	lr 0.00091
Warmup Train [37][1820/3239]	Time 0.592 (0.516)	Data 0.001 (0.015)	Loss 3.9414 (4.0131)	Top-1 acc 33.594 (30.935)	Top-5 acc 55.078 (54.404)	lr 0.00091
Warmup Train [37][1830/3239]	Time 0.642 (0.516)	Data 0.001 (0.015)	Loss 3.9418 (4.0132)	Top-1 acc 33.984 (30.940)	Top-5 acc 56.250 (54.403)	lr 0.00090
Warmup Train [37][1840/3239]	Time 0.556 (0.516)	Data 0.001 (0.015)	Loss 4.0541 (4.0132)	Top-1 acc 32.812 (30.947)	Top-5 acc 52.734 (54.406)	lr 0.00090
Warmup Train [37][1850/3239]	Time 0.279 (0.516)	Data 0.001 (0.015)	Loss 4.0441 (4.0135)	Top-1 acc 30.078 (30.947)	Top-5 acc 53.906 (54.410)	lr 0.00090
Warmup Train [37][1860/3239]	Time 0.593 (0.516)	Data 0.002 (0.015)	Loss 3.9236 (4.0135)	Top-1 acc 31.250 (30.946)	Top-5 acc 59.375 (54.412)	lr 0.00090
Warmup Train [37][1870/3239]	Time 0.518 (0.516)	Data 0.001 (0.015)	Loss 3.9885 (4.0134)	Top-1 acc 33.984 (30.954)	Top-5 acc 56.250 (54.417)	lr 0.00090
Warmup Train [37][1880/3239]	Time 0.445 (0.516)	Data 0.029 (0.014)	Loss 4.0801 (4.0132)	Top-1 acc 29.297 (30.956)	Top-5 acc 52.734 (54.420)	lr 0.00090
Warmup Train [37][1890/3239]	Time 0.511 (0.516)	Data 0.001 (0.014)	Loss 3.8747 (4.0131)	Top-1 acc 33.203 (30.960)	Top-5 acc 57.812 (54.418)	lr 0.00089
Warmup Train [37][1900/3239]	Time 0.537 (0.516)	Data 0.001 (0.014)	Loss 4.0626 (4.0133)	Top-1 acc 29.688 (30.956)	Top-5 acc 51.953 (54.408)	lr 0.00089
Warmup Train [37][1910/3239]	Time 0.542 (0.516)	Data 0.001 (0.014)	Loss 3.8495 (4.0130)	Top-1 acc 37.109 (30.961)	Top-5 acc 58.594 (54.417)	lr 0.00089
Warmup Train [37][1920/3239]	Time 0.457 (0.516)	Data 0.001 (0.014)	Loss 4.0785 (4.0132)	Top-1 acc 32.031 (30.958)	Top-5 acc 53.125 (54.413)	lr 0.00089
Warmup Train [37][1930/3239]	Time 0.429 (0.516)	Data 0.001 (0.014)	Loss 4.0622 (4.0130)	Top-1 acc 28.516 (30.962)	Top-5 acc 52.734 (54.417)	lr 0.00089
Warmup Train [37][1940/3239]	Time 0.582 (0.516)	Data 0.001 (0.014)	Loss 4.0462 (4.0127)	Top-1 acc 26.172 (30.967)	Top-5 acc 53.516 (54.426)	lr 0.00089
Warmup Train [37][1950/3239]	Time 0.328 (0.516)	Data 0.001 (0.014)	Loss 4.1107 (4.0128)	Top-1 acc 28.906 (30.966)	Top-5 acc 53.516 (54.423)	lr 0.00089
Warmup Train [37][1960/3239]	Time 0.482 (0.516)	Data 0.001 (0.014)	Loss 4.1092 (4.0131)	Top-1 acc 27.734 (30.962)	Top-5 acc 53.906 (54.415)	lr 0.00088
Warmup Train [37][1970/3239]	Time 0.561 (0.516)	Data 0.001 (0.014)	Loss 3.8945 (4.0129)	Top-1 acc 33.203 (30.965)	Top-5 acc 57.812 (54.424)	lr 0.00088
Warmup Train [37][1980/3239]	Time 0.563 (0.516)	Data 0.001 (0.014)	Loss 3.8455 (4.0130)	Top-1 acc 32.422 (30.962)	Top-5 acc 55.859 (54.424)	lr 0.00088
Warmup Train [37][1990/3239]	Time 0.465 (0.516)	Data 0.001 (0.014)	Loss 4.0735 (4.0131)	Top-1 acc 29.297 (30.962)	Top-5 acc 53.125 (54.422)	lr 0.00088
Warmup Train [37][2000/3239]	Time 0.541 (0.516)	Data 0.001 (0.014)	Loss 3.9868 (4.0133)	Top-1 acc 32.812 (30.961)	Top-5 acc 53.516 (54.421)	lr 0.00088
Warmup Train [37][2010/3239]	Time 0.618 (0.516)	Data 0.001 (0.014)	Loss 4.0500 (4.0132)	Top-1 acc 29.688 (30.966)	Top-5 acc 54.688 (54.425)	lr 0.00088
Warmup Train [37][2020/3239]	Time 0.538 (0.516)	Data 0.001 (0.014)	Loss 3.8359 (4.0128)	Top-1 acc 33.203 (30.968)	Top-5 acc 57.422 (54.438)	lr 0.00087
Warmup Train [37][2030/3239]	Time 0.585 (0.516)	Data 0.001 (0.014)	Loss 4.0097 (4.0127)	Top-1 acc 30.469 (30.967)	Top-5 acc 54.297 (54.440)	lr 0.00087
Warmup Train [37][2040/3239]	Time 0.641 (0.516)	Data 0.001 (0.014)	Loss 3.9150 (4.0128)	Top-1 acc 31.250 (30.968)	Top-5 acc 51.562 (54.434)	lr 0.00087
Warmup Train [37][2050/3239]	Time 0.484 (0.516)	Data 0.002 (0.014)	Loss 3.8788 (4.0126)	Top-1 acc 32.812 (30.976)	Top-5 acc 57.031 (54.444)	lr 0.00087
Warmup Train [37][2060/3239]	Time 0.605 (0.516)	Data 0.001 (0.014)	Loss 3.9371 (4.0125)	Top-1 acc 31.641 (30.979)	Top-5 acc 57.422 (54.448)	lr 0.00087
Warmup Train [37][2070/3239]	Time 0.319 (0.516)	Data 0.001 (0.014)	Loss 4.0191 (4.0121)	Top-1 acc 30.859 (30.991)	Top-5 acc 53.125 (54.453)	lr 0.00087
Warmup Train [37][2080/3239]	Time 0.403 (0.516)	Data 0.001 (0.014)	Loss 4.0470 (4.0120)	Top-1 acc 30.469 (30.994)	Top-5 acc 55.859 (54.461)	lr 0.00086
Warmup Train [37][2090/3239]	Time 0.467 (0.516)	Data 0.001 (0.014)	Loss 4.0717 (4.0118)	Top-1 acc 26.562 (30.998)	Top-5 acc 52.344 (54.470)	lr 0.00086
Warmup Train [37][2100/3239]	Time 0.504 (0.516)	Data 0.001 (0.014)	Loss 3.8880 (4.0115)	Top-1 acc 33.594 (31.003)	Top-5 acc 60.547 (54.479)	lr 0.00086
Warmup Train [37][2110/3239]	Time 0.538 (0.516)	Data 0.001 (0.014)	Loss 3.9277 (4.0112)	Top-1 acc 31.250 (31.005)	Top-5 acc 58.203 (54.481)	lr 0.00086
Warmup Train [37][2120/3239]	Time 0.600 (0.516)	Data 0.001 (0.014)	Loss 3.8553 (4.0116)	Top-1 acc 34.375 (30.993)	Top-5 acc 53.516 (54.467)	lr 0.00086
Warmup Train [37][2130/3239]	Time 0.601 (0.516)	Data 0.001 (0.014)	Loss 3.8805 (4.0114)	Top-1 acc 35.938 (30.997)	Top-5 acc 58.594 (54.469)	lr 0.00086
Warmup Train [37][2140/3239]	Time 0.483 (0.516)	Data 0.001 (0.014)	Loss 3.9230 (4.0114)	Top-1 acc 32.031 (30.994)	Top-5 acc 53.906 (54.465)	lr 0.00085
Warmup Train [37][2150/3239]	Time 0.489 (0.516)	Data 0.001 (0.014)	Loss 4.1419 (4.0115)	Top-1 acc 27.734 (30.995)	Top-5 acc 49.609 (54.463)	lr 0.00085
Warmup Train [37][2160/3239]	Time 0.483 (0.516)	Data 0.001 (0.013)	Loss 3.9516 (4.0115)	Top-1 acc 34.375 (31.001)	Top-5 acc 60.547 (54.465)	lr 0.00085
Warmup Train [37][2170/3239]	Time 0.542 (0.516)	Data 0.001 (0.013)	Loss 3.9996 (4.0117)	Top-1 acc 31.641 (30.997)	Top-5 acc 53.906 (54.461)	lr 0.00085
Warmup Train [37][2180/3239]	Time 0.536 (0.516)	Data 0.001 (0.013)	Loss 3.8780 (4.0119)	Top-1 acc 34.766 (30.994)	Top-5 acc 57.031 (54.454)	lr 0.00085
Warmup Train [37][2190/3239]	Time 0.333 (0.516)	Data 0.001 (0.013)	Loss 4.1099 (4.0118)	Top-1 acc 28.516 (30.990)	Top-5 acc 53.516 (54.453)	lr 0.00085
Warmup Train [37][2200/3239]	Time 0.555 (0.516)	Data 0.029 (0.013)	Loss 4.0129 (4.0119)	Top-1 acc 32.422 (30.989)	Top-5 acc 53.516 (54.454)	lr 0.00085
Warmup Train [37][2210/3239]	Time 0.674 (0.516)	Data 0.001 (0.013)	Loss 4.0439 (4.0118)	Top-1 acc 28.125 (30.988)	Top-5 acc 54.688 (54.450)	lr 0.00084
Warmup Train [37][2220/3239]	Time 0.743 (0.516)	Data 0.002 (0.013)	Loss 3.9793 (4.0116)	Top-1 acc 30.469 (30.994)	Top-5 acc 51.172 (54.453)	lr 0.00084
Warmup Train [37][2230/3239]	Time 0.512 (0.516)	Data 0.001 (0.013)	Loss 3.9036 (4.0116)	Top-1 acc 31.641 (30.995)	Top-5 acc 55.469 (54.450)	lr 0.00084
Warmup Train [37][2240/3239]	Time 0.403 (0.516)	Data 0.001 (0.013)	Loss 4.1163 (4.0114)	Top-1 acc 28.125 (30.996)	Top-5 acc 53.516 (54.455)	lr 0.00084
Warmup Train [37][2250/3239]	Time 0.529 (0.516)	Data 0.001 (0.013)	Loss 3.9108 (4.0112)	Top-1 acc 31.641 (31.000)	Top-5 acc 56.250 (54.461)	lr 0.00084
Warmup Train [37][2260/3239]	Time 0.477 (0.516)	Data 0.001 (0.013)	Loss 3.8998 (4.0114)	Top-1 acc 30.859 (30.997)	Top-5 acc 58.594 (54.460)	lr 0.00084
Warmup Train [37][2270/3239]	Time 0.502 (0.516)	Data 0.001 (0.013)	Loss 4.2846 (4.0115)	Top-1 acc 25.000 (30.993)	Top-5 acc 46.094 (54.460)	lr 0.00083
Warmup Train [37][2280/3239]	Time 0.543 (0.516)	Data 0.001 (0.013)	Loss 4.0699 (4.0117)	Top-1 acc 29.688 (30.996)	Top-5 acc 52.734 (54.454)	lr 0.00083
Warmup Train [37][2290/3239]	Time 0.399 (0.516)	Data 0.001 (0.013)	Loss 4.0922 (4.0116)	Top-1 acc 30.859 (30.997)	Top-5 acc 53.906 (54.458)	lr 0.00083
Warmup Train [37][2300/3239]	Time 0.557 (0.516)	Data 0.001 (0.013)	Loss 3.8618 (4.0118)	Top-1 acc 35.938 (31.001)	Top-5 acc 57.812 (54.457)	lr 0.00083
Warmup Train [37][2310/3239]	Time 0.576 (0.516)	Data 0.001 (0.013)	Loss 4.1067 (4.0117)	Top-1 acc 31.641 (31.006)	Top-5 acc 50.391 (54.455)	lr 0.00083
Warmup Train [37][2320/3239]	Time 0.513 (0.516)	Data 0.001 (0.013)	Loss 3.7785 (4.0119)	Top-1 acc 37.109 (31.004)	Top-5 acc 58.984 (54.451)	lr 0.00083
Warmup Train [37][2330/3239]	Time 0.513 (0.516)	Data 0.002 (0.013)	Loss 4.3062 (4.0119)	Top-1 acc 23.828 (31.007)	Top-5 acc 48.828 (54.449)	lr 0.00083
Warmup Train [37][2340/3239]	Time 0.561 (0.516)	Data 0.001 (0.013)	Loss 3.9850 (4.0118)	Top-1 acc 34.766 (31.012)	Top-5 acc 58.203 (54.454)	lr 0.00082
Warmup Train [37][2350/3239]	Time 0.521 (0.516)	Data 0.001 (0.013)	Loss 4.0905 (4.0118)	Top-1 acc 28.906 (31.014)	Top-5 acc 53.906 (54.452)	lr 0.00082
Warmup Train [37][2360/3239]	Time 0.309 (0.516)	Data 0.001 (0.013)	Loss 4.3261 (4.0119)	Top-1 acc 25.781 (31.013)	Top-5 acc 48.438 (54.449)	lr 0.00082
Warmup Train [37][2370/3239]	Time 0.516 (0.516)	Data 0.001 (0.013)	Loss 4.0218 (4.0119)	Top-1 acc 31.641 (31.015)	Top-5 acc 53.125 (54.445)	lr 0.00082
Warmup Train [37][2380/3239]	Time 0.443 (0.516)	Data 0.001 (0.013)	Loss 4.0346 (4.0120)	Top-1 acc 35.547 (31.018)	Top-5 acc 55.078 (54.444)	lr 0.00082
Warmup Train [37][2390/3239]	Time 0.475 (0.515)	Data 0.001 (0.013)	Loss 3.9758 (4.0121)	Top-1 acc 32.031 (31.017)	Top-5 acc 55.469 (54.444)	lr 0.00082
Warmup Train [37][2400/3239]	Time 0.374 (0.515)	Data 0.001 (0.013)	Loss 3.9411 (4.0117)	Top-1 acc 33.203 (31.027)	Top-5 acc 56.250 (54.453)	lr 0.00081
Warmup Train [37][2410/3239]	Time 0.459 (0.515)	Data 0.001 (0.013)	Loss 4.1014 (4.0115)	Top-1 acc 29.688 (31.028)	Top-5 acc 56.250 (54.463)	lr 0.00081
Warmup Train [37][2420/3239]	Time 0.316 (0.515)	Data 0.001 (0.013)	Loss 4.1289 (4.0114)	Top-1 acc 30.078 (31.033)	Top-5 acc 52.734 (54.466)	lr 0.00081
Warmup Train [37][2430/3239]	Time 0.453 (0.515)	Data 0.001 (0.013)	Loss 4.1248 (4.0113)	Top-1 acc 32.031 (31.034)	Top-5 acc 55.078 (54.468)	lr 0.00081
Warmup Train [37][2440/3239]	Time 0.585 (0.515)	Data 0.002 (0.013)	Loss 4.0330 (4.0112)	Top-1 acc 28.516 (31.034)	Top-5 acc 51.562 (54.468)	lr 0.00081
Warmup Train [37][2450/3239]	Time 0.491 (0.515)	Data 0.001 (0.013)	Loss 3.9021 (4.0110)	Top-1 acc 33.594 (31.036)	Top-5 acc 57.422 (54.473)	lr 0.00081
Warmup Train [37][2460/3239]	Time 0.559 (0.515)	Data 0.001 (0.013)	Loss 3.8503 (4.0106)	Top-1 acc 35.547 (31.043)	Top-5 acc 58.594 (54.483)	lr 0.00081
Warmup Train [37][2470/3239]	Time 0.472 (0.515)	Data 0.001 (0.013)	Loss 4.1192 (4.0108)	Top-1 acc 29.297 (31.041)	Top-5 acc 52.344 (54.479)	lr 0.00080
Warmup Train [37][2480/3239]	Time 0.424 (0.515)	Data 0.001 (0.013)	Loss 4.0078 (4.0109)	Top-1 acc 30.078 (31.039)	Top-5 acc 55.469 (54.472)	lr 0.00080
Warmup Train [37][2490/3239]	Time 0.478 (0.515)	Data 0.001 (0.013)	Loss 4.0612 (4.0109)	Top-1 acc 27.344 (31.037)	Top-5 acc 51.562 (54.471)	lr 0.00080
Warmup Train [37][2500/3239]	Time 0.428 (0.515)	Data 0.001 (0.013)	Loss 3.9532 (4.0109)	Top-1 acc 30.859 (31.034)	Top-5 acc 55.469 (54.471)	lr 0.00080
Warmup Train [37][2510/3239]	Time 0.423 (0.515)	Data 0.001 (0.013)	Loss 4.1128 (4.0110)	Top-1 acc 31.641 (31.030)	Top-5 acc 54.297 (54.466)	lr 0.00080
Warmup Train [37][2520/3239]	Time 0.545 (0.515)	Data 0.001 (0.013)	Loss 3.8789 (4.0110)	Top-1 acc 33.594 (31.030)	Top-5 acc 58.203 (54.472)	lr 0.00080
Warmup Train [37][2530/3239]	Time 0.598 (0.515)	Data 0.001 (0.013)	Loss 3.9400 (4.0111)	Top-1 acc 31.250 (31.026)	Top-5 acc 55.859 (54.468)	lr 0.00079
Warmup Train [37][2540/3239]	Time 0.657 (0.515)	Data 0.001 (0.013)	Loss 3.8801 (4.0111)	Top-1 acc 32.422 (31.022)	Top-5 acc 58.594 (54.470)	lr 0.00079
Warmup Train [37][2550/3239]	Time 0.468 (0.515)	Data 0.001 (0.012)	Loss 4.0498 (4.0111)	Top-1 acc 30.859 (31.021)	Top-5 acc 53.516 (54.471)	lr 0.00079
Warmup Train [37][2560/3239]	Time 0.620 (0.515)	Data 0.001 (0.012)	Loss 4.2247 (4.0108)	Top-1 acc 24.219 (31.021)	Top-5 acc 50.781 (54.478)	lr 0.00079
Warmup Train [37][2570/3239]	Time 0.477 (0.515)	Data 0.001 (0.012)	Loss 4.0976 (4.0108)	Top-1 acc 30.469 (31.023)	Top-5 acc 53.516 (54.478)	lr 0.00079
Warmup Train [37][2580/3239]	Time 0.448 (0.515)	Data 0.001 (0.012)	Loss 4.1773 (4.0110)	Top-1 acc 26.953 (31.022)	Top-5 acc 46.094 (54.473)	lr 0.00079
Warmup Train [37][2590/3239]	Time 0.499 (0.515)	Data 0.001 (0.012)	Loss 3.9236 (4.0111)	Top-1 acc 31.250 (31.022)	Top-5 acc 54.688 (54.470)	lr 0.00079
Warmup Train [37][2600/3239]	Time 0.510 (0.515)	Data 0.001 (0.012)	Loss 4.0004 (4.0111)	Top-1 acc 29.688 (31.025)	Top-5 acc 56.250 (54.471)	lr 0.00078
Warmup Train [37][2610/3239]	Time 0.524 (0.515)	Data 0.001 (0.012)	Loss 3.8881 (4.0110)	Top-1 acc 33.203 (31.029)	Top-5 acc 57.422 (54.474)	lr 0.00078
Warmup Train [37][2620/3239]	Time 0.364 (0.515)	Data 0.001 (0.012)	Loss 4.1517 (4.0111)	Top-1 acc 29.688 (31.029)	Top-5 acc 53.125 (54.476)	lr 0.00078
Warmup Train [37][2630/3239]	Time 0.485 (0.515)	Data 0.001 (0.012)	Loss 4.0323 (4.0112)	Top-1 acc 30.078 (31.028)	Top-5 acc 53.906 (54.470)	lr 0.00078
Warmup Train [37][2640/3239]	Time 0.747 (0.515)	Data 0.001 (0.012)	Loss 3.8723 (4.0108)	Top-1 acc 35.156 (31.037)	Top-5 acc 52.344 (54.477)	lr 0.00078
Warmup Train [37][2650/3239]	Time 0.649 (0.515)	Data 0.001 (0.012)	Loss 4.0979 (4.0108)	Top-1 acc 32.422 (31.043)	Top-5 acc 50.781 (54.476)	lr 0.00078
Warmup Train [37][2660/3239]	Time 0.396 (0.515)	Data 0.001 (0.012)	Loss 4.2555 (4.0109)	Top-1 acc 30.469 (31.040)	Top-5 acc 49.609 (54.471)	lr 0.00078
Warmup Train [37][2670/3239]	Time 0.369 (0.514)	Data 0.001 (0.012)	Loss 4.1126 (4.0109)	Top-1 acc 30.469 (31.038)	Top-5 acc 52.344 (54.471)	lr 0.00077
Warmup Train [37][2680/3239]	Time 0.510 (0.514)	Data 0.001 (0.012)	Loss 3.9019 (4.0110)	Top-1 acc 32.031 (31.034)	Top-5 acc 56.641 (54.466)	lr 0.00077
Warmup Train [37][2690/3239]	Time 0.405 (0.514)	Data 0.001 (0.012)	Loss 4.0051 (4.0110)	Top-1 acc 28.125 (31.036)	Top-5 acc 55.078 (54.467)	lr 0.00077
Warmup Train [37][2700/3239]	Time 0.528 (0.514)	Data 0.001 (0.012)	Loss 3.9816 (4.0110)	Top-1 acc 28.516 (31.034)	Top-5 acc 55.469 (54.466)	lr 0.00077
Warmup Train [37][2710/3239]	Time 0.400 (0.514)	Data 0.001 (0.012)	Loss 4.2218 (4.0109)	Top-1 acc 25.391 (31.038)	Top-5 acc 48.047 (54.466)	lr 0.00077
Warmup Train [37][2720/3239]	Time 0.574 (0.514)	Data 0.001 (0.012)	Loss 3.9435 (4.0110)	Top-1 acc 31.250 (31.037)	Top-5 acc 55.469 (54.467)	lr 0.00077
Warmup Train [37][2730/3239]	Time 0.391 (0.514)	Data 0.001 (0.012)	Loss 3.9456 (4.0109)	Top-1 acc 30.078 (31.037)	Top-5 acc 59.766 (54.470)	lr 0.00076
Warmup Train [37][2740/3239]	Time 0.390 (0.514)	Data 0.001 (0.012)	Loss 3.8559 (4.0109)	Top-1 acc 31.641 (31.036)	Top-5 acc 55.469 (54.468)	lr 0.00076
Warmup Train [37][2750/3239]	Time 0.765 (0.514)	Data 0.001 (0.012)	Loss 4.0405 (4.0110)	Top-1 acc 30.859 (31.031)	Top-5 acc 55.078 (54.465)	lr 0.00076
Warmup Train [37][2760/3239]	Time 0.484 (0.514)	Data 0.001 (0.012)	Loss 3.9042 (4.0110)	Top-1 acc 30.078 (31.031)	Top-5 acc 57.031 (54.467)	lr 0.00076
Warmup Train [37][2770/3239]	Time 0.545 (0.514)	Data 0.001 (0.012)	Loss 4.1499 (4.0111)	Top-1 acc 27.344 (31.027)	Top-5 acc 46.484 (54.459)	lr 0.00076
Warmup Train [37][2780/3239]	Time 0.660 (0.514)	Data 0.001 (0.012)	Loss 4.1227 (4.0112)	Top-1 acc 33.594 (31.025)	Top-5 acc 53.906 (54.455)	lr 0.00076
Warmup Train [37][2790/3239]	Time 0.506 (0.514)	Data 0.003 (0.012)	Loss 3.9126 (4.0110)	Top-1 acc 34.375 (31.027)	Top-5 acc 55.078 (54.454)	lr 0.00076
Warmup Train [37][2800/3239]	Time 0.654 (0.514)	Data 0.001 (0.012)	Loss 3.8284 (4.0109)	Top-1 acc 35.938 (31.032)	Top-5 acc 60.938 (54.457)	lr 0.00075
Warmup Train [37][2810/3239]	Time 0.555 (0.514)	Data 0.001 (0.012)	Loss 4.0934 (4.0108)	Top-1 acc 29.688 (31.030)	Top-5 acc 51.562 (54.457)	lr 0.00075
Warmup Train [37][2820/3239]	Time 0.502 (0.514)	Data 0.001 (0.012)	Loss 4.0134 (4.0108)	Top-1 acc 30.078 (31.031)	Top-5 acc 53.125 (54.456)	lr 0.00075
Warmup Train [37][2830/3239]	Time 0.575 (0.514)	Data 0.001 (0.012)	Loss 3.9997 (4.0110)	Top-1 acc 28.125 (31.024)	Top-5 acc 54.297 (54.453)	lr 0.00075
Warmup Train [37][2840/3239]	Time 0.558 (0.514)	Data 0.001 (0.012)	Loss 4.0290 (4.0110)	Top-1 acc 30.469 (31.024)	Top-5 acc 51.562 (54.456)	lr 0.00075
Warmup Train [37][2850/3239]	Time 0.605 (0.514)	Data 0.002 (0.012)	Loss 4.2340 (4.0109)	Top-1 acc 27.734 (31.029)	Top-5 acc 51.172 (54.459)	lr 0.00075
Warmup Train [37][2860/3239]	Time 0.659 (0.514)	Data 0.001 (0.012)	Loss 4.0021 (4.0112)	Top-1 acc 34.766 (31.028)	Top-5 acc 55.859 (54.453)	lr 0.00075
Warmup Train [37][2870/3239]	Time 0.623 (0.514)	Data 0.001 (0.012)	Loss 4.0290 (4.0113)	Top-1 acc 29.688 (31.023)	Top-5 acc 55.078 (54.450)	lr 0.00074
Warmup Train [37][2880/3239]	Time 0.533 (0.514)	Data 0.001 (0.012)	Loss 3.9007 (4.0111)	Top-1 acc 33.203 (31.026)	Top-5 acc 57.031 (54.457)	lr 0.00074
Warmup Train [37][2890/3239]	Time 0.473 (0.514)	Data 0.001 (0.012)	Loss 4.0081 (4.0113)	Top-1 acc 29.297 (31.023)	Top-5 acc 53.906 (54.456)	lr 0.00074
Warmup Train [37][2900/3239]	Time 0.460 (0.514)	Data 0.001 (0.012)	Loss 4.0123 (4.0112)	Top-1 acc 29.297 (31.023)	Top-5 acc 51.953 (54.457)	lr 0.00074
Warmup Train [37][2910/3239]	Time 0.405 (0.514)	Data 0.002 (0.012)	Loss 4.2742 (4.0116)	Top-1 acc 27.344 (31.020)	Top-5 acc 49.609 (54.451)	lr 0.00074
Warmup Train [37][2920/3239]	Time 0.649 (0.514)	Data 0.001 (0.012)	Loss 3.9466 (4.0114)	Top-1 acc 33.984 (31.024)	Top-5 acc 52.734 (54.454)	lr 0.00074
Warmup Train [37][2930/3239]	Time 0.548 (0.514)	Data 0.001 (0.012)	Loss 4.0849 (4.0112)	Top-1 acc 30.859 (31.025)	Top-5 acc 50.781 (54.455)	lr 0.00074
Warmup Train [37][2940/3239]	Time 0.495 (0.514)	Data 0.001 (0.012)	Loss 3.9526 (4.0108)	Top-1 acc 32.031 (31.033)	Top-5 acc 55.078 (54.464)	lr 0.00073
Warmup Train [37][2950/3239]	Time 0.503 (0.514)	Data 0.001 (0.012)	Loss 3.9606 (4.0108)	Top-1 acc 33.594 (31.036)	Top-5 acc 57.031 (54.463)	lr 0.00073
Warmup Train [37][2960/3239]	Time 0.462 (0.514)	Data 0.001 (0.012)	Loss 3.8989 (4.0109)	Top-1 acc 32.031 (31.032)	Top-5 acc 55.469 (54.459)	lr 0.00073
Warmup Train [37][2970/3239]	Time 0.551 (0.514)	Data 0.001 (0.012)	Loss 4.0049 (4.0110)	Top-1 acc 33.594 (31.031)	Top-5 acc 54.688 (54.456)	lr 0.00073
Warmup Train [37][2980/3239]	Time 0.634 (0.514)	Data 0.001 (0.012)	Loss 4.0563 (4.0110)	Top-1 acc 30.078 (31.031)	Top-5 acc 54.297 (54.460)	lr 0.00073
Warmup Train [37][2990/3239]	Time 0.428 (0.514)	Data 0.001 (0.011)	Loss 3.7969 (4.0108)	Top-1 acc 38.672 (31.035)	Top-5 acc 60.547 (54.461)	lr 0.00073
Warmup Train [37][3000/3239]	Time 0.513 (0.514)	Data 0.001 (0.011)	Loss 3.9490 (4.0107)	Top-1 acc 32.422 (31.036)	Top-5 acc 57.031 (54.465)	lr 0.00073
Warmup Train [37][3010/3239]	Time 0.560 (0.514)	Data 0.001 (0.011)	Loss 4.1996 (4.0108)	Top-1 acc 30.469 (31.035)	Top-5 acc 47.656 (54.459)	lr 0.00072
Warmup Train [37][3020/3239]	Time 0.498 (0.514)	Data 0.001 (0.011)	Loss 3.9979 (4.0108)	Top-1 acc 33.594 (31.037)	Top-5 acc 50.781 (54.462)	lr 0.00072
Warmup Train [37][3030/3239]	Time 0.355 (0.514)	Data 0.001 (0.011)	Loss 3.9798 (4.0108)	Top-1 acc 29.688 (31.038)	Top-5 acc 55.078 (54.459)	lr 0.00072
Warmup Train [37][3040/3239]	Time 0.523 (0.514)	Data 0.001 (0.011)	Loss 3.9408 (4.0106)	Top-1 acc 33.203 (31.043)	Top-5 acc 55.469 (54.467)	lr 0.00072
Warmup Train [37][3050/3239]	Time 0.517 (0.514)	Data 0.001 (0.011)	Loss 3.9367 (4.0107)	Top-1 acc 37.109 (31.043)	Top-5 acc 55.469 (54.462)	lr 0.00072
Warmup Train [37][3060/3239]	Time 0.425 (0.514)	Data 0.001 (0.011)	Loss 4.3021 (4.0108)	Top-1 acc 23.438 (31.041)	Top-5 acc 47.656 (54.459)	lr 0.00072
Warmup Train [37][3070/3239]	Time 0.605 (0.514)	Data 0.001 (0.011)	Loss 4.1151 (4.0107)	Top-1 acc 30.078 (31.040)	Top-5 acc 51.953 (54.460)	lr 0.00072
Warmup Train [37][3080/3239]	Time 0.560 (0.514)	Data 0.001 (0.011)	Loss 4.1202 (4.0108)	Top-1 acc 28.906 (31.040)	Top-5 acc 55.469 (54.460)	lr 0.00071
Warmup Train [37][3090/3239]	Time 0.364 (0.514)	Data 0.001 (0.011)	Loss 3.9961 (4.0108)	Top-1 acc 33.203 (31.039)	Top-5 acc 51.953 (54.457)	lr 0.00071
Warmup Train [37][3100/3239]	Time 0.497 (0.514)	Data 0.001 (0.011)	Loss 3.9080 (4.0108)	Top-1 acc 32.812 (31.041)	Top-5 acc 53.906 (54.460)	lr 0.00071
Warmup Train [37][3110/3239]	Time 0.516 (0.514)	Data 0.001 (0.011)	Loss 4.1498 (4.0108)	Top-1 acc 30.469 (31.040)	Top-5 acc 49.219 (54.457)	lr 0.00071
Warmup Train [37][3120/3239]	Time 0.527 (0.514)	Data 0.001 (0.011)	Loss 3.7333 (4.0105)	Top-1 acc 33.984 (31.042)	Top-5 acc 55.469 (54.464)	lr 0.00071
Warmup Train [37][3130/3239]	Time 0.573 (0.514)	Data 0.001 (0.011)	Loss 4.2327 (4.0104)	Top-1 acc 23.438 (31.040)	Top-5 acc 50.781 (54.462)	lr 0.00071
Warmup Train [37][3140/3239]	Time 0.583 (0.514)	Data 0.001 (0.011)	Loss 3.8472 (4.0102)	Top-1 acc 32.031 (31.045)	Top-5 acc 59.766 (54.471)	lr 0.00070
Warmup Train [37][3150/3239]	Time 0.448 (0.514)	Data 0.001 (0.011)	Loss 4.0208 (4.0102)	Top-1 acc 30.469 (31.044)	Top-5 acc 56.250 (54.472)	lr 0.00070
Warmup Train [37][3160/3239]	Time 0.465 (0.514)	Data 0.001 (0.011)	Loss 4.0874 (4.0102)	Top-1 acc 29.297 (31.044)	Top-5 acc 53.516 (54.469)	lr 0.00070
Warmup Train [37][3170/3239]	Time 0.681 (0.514)	Data 0.001 (0.011)	Loss 3.9739 (4.0103)	Top-1 acc 32.422 (31.043)	Top-5 acc 56.250 (54.468)	lr 0.00070
Warmup Train [37][3180/3239]	Time 0.552 (0.514)	Data 0.000 (0.011)	Loss 4.0572 (4.0102)	Top-1 acc 24.219 (31.040)	Top-5 acc 54.297 (54.470)	lr 0.00070
Warmup Train [37][3190/3239]	Time 0.501 (0.514)	Data 0.000 (0.011)	Loss 4.0686 (4.0104)	Top-1 acc 30.078 (31.037)	Top-5 acc 50.000 (54.463)	lr 0.00070
Warmup Train [37][3200/3239]	Time 0.510 (0.514)	Data 0.000 (0.011)	Loss 3.7914 (4.0104)	Top-1 acc 37.891 (31.037)	Top-5 acc 60.938 (54.463)	lr 0.00070
Warmup Train [37][3210/3239]	Time 0.499 (0.514)	Data 0.000 (0.011)	Loss 3.8917 (4.0104)	Top-1 acc 31.641 (31.036)	Top-5 acc 57.422 (54.463)	lr 0.00070
Warmup Train [37][3220/3239]	Time 0.511 (0.513)	Data 0.000 (0.011)	Loss 4.0025 (4.0103)	Top-1 acc 29.688 (31.042)	Top-5 acc 53.125 (54.468)	lr 0.00069
Warmup Train [37][3230/3239]	Time 0.527 (0.513)	Data 0.000 (0.011)	Loss 4.0309 (4.0102)	Top-1 acc 30.469 (31.045)	Top-5 acc 54.688 (54.472)	lr 0.00069
Warmup Train [37][3239/3239]	Time 0.309 (0.513)	Data 0.000 (0.011)	Loss 4.1376 (4.0101)	Top-1 acc 27.160 (31.049)	Top-5 acc 53.086 (54.473)	lr 0.00069
==========Warmup Valid [37/40]	loss 2.957	top-1 acc 38.312	top-5 acc 63.270	Train top-1 31.049	top-5 54.473	flops: 442.4M
Warmup Train [38][0/3239]	Time 14.981 (14.981)	Data 11.879 (11.879)	Loss 4.0088 (4.0088)	Top-1 acc 32.031 (32.031)	Top-5 acc 57.031 (57.031)	lr 0.00069
Warmup Train [38][10/3239]	Time 0.663 (1.901)	Data 0.001 (1.084)	Loss 3.8483 (4.0542)	Top-1 acc 33.594 (30.504)	Top-5 acc 58.203 (53.977)	lr 0.00069
Warmup Train [38][20/3239]	Time 0.480 (1.225)	Data 0.001 (0.569)	Loss 3.7273 (4.0362)	Top-1 acc 38.281 (30.934)	Top-5 acc 62.891 (54.334)	lr 0.00069
Warmup Train [38][30/3239]	Time 0.481 (0.990)	Data 0.001 (0.386)	Loss 3.9377 (4.0274)	Top-1 acc 31.250 (30.721)	Top-5 acc 57.422 (54.410)	lr 0.00069
Warmup Train [38][40/3239]	Time 0.528 (0.876)	Data 0.001 (0.294)	Loss 3.7674 (4.0400)	Top-1 acc 35.938 (30.650)	Top-5 acc 61.719 (53.716)	lr 0.00069
Warmup Train [38][50/3239]	Time 0.515 (0.803)	Data 0.001 (0.237)	Loss 3.9344 (4.0335)	Top-1 acc 30.469 (30.584)	Top-5 acc 53.906 (53.868)	lr 0.00068
Warmup Train [38][60/3239]	Time 0.500 (0.754)	Data 0.001 (0.198)	Loss 3.9518 (4.0356)	Top-1 acc 30.469 (30.597)	Top-5 acc 55.859 (53.861)	lr 0.00068
Warmup Train [38][70/3239]	Time 0.425 (0.720)	Data 0.001 (0.171)	Loss 4.0688 (4.0323)	Top-1 acc 27.734 (30.612)	Top-5 acc 56.250 (53.884)	lr 0.00068
Warmup Train [38][80/3239]	Time 0.465 (0.695)	Data 0.001 (0.151)	Loss 3.8985 (4.0274)	Top-1 acc 33.594 (30.647)	Top-5 acc 58.203 (53.882)	lr 0.00068
Warmup Train [38][90/3239]	Time 0.583 (0.671)	Data 0.001 (0.135)	Loss 3.9645 (4.0315)	Top-1 acc 32.031 (30.658)	Top-5 acc 57.031 (53.850)	lr 0.00068
Warmup Train [38][100/3239]	Time 0.455 (0.655)	Data 0.001 (0.122)	Loss 4.1026 (4.0370)	Top-1 acc 31.641 (30.728)	Top-5 acc 50.000 (53.709)	lr 0.00068
Warmup Train [38][110/3239]	Time 0.701 (0.636)	Data 0.001 (0.111)	Loss 3.9925 (4.0330)	Top-1 acc 29.688 (30.736)	Top-5 acc 54.297 (53.825)	lr 0.00068
Warmup Train [38][120/3239]	Time 0.549 (0.626)	Data 0.001 (0.102)	Loss 4.1706 (4.0332)	Top-1 acc 26.953 (30.733)	Top-5 acc 49.609 (53.822)	lr 0.00067
Warmup Train [38][130/3239]	Time 0.635 (0.618)	Data 0.001 (0.094)	Loss 3.9553 (4.0333)	Top-1 acc 30.469 (30.710)	Top-5 acc 56.641 (53.808)	lr 0.00067
Warmup Train [38][140/3239]	Time 0.560 (0.610)	Data 0.001 (0.088)	Loss 3.8853 (4.0335)	Top-1 acc 29.688 (30.682)	Top-5 acc 58.984 (53.793)	lr 0.00067
Warmup Train [38][150/3239]	Time 0.541 (0.605)	Data 0.001 (0.083)	Loss 3.9956 (4.0281)	Top-1 acc 27.344 (30.699)	Top-5 acc 55.859 (53.901)	lr 0.00067
Warmup Train [38][160/3239]	Time 0.646 (0.601)	Data 0.001 (0.078)	Loss 3.7934 (4.0295)	Top-1 acc 33.594 (30.619)	Top-5 acc 59.375 (53.846)	lr 0.00067
Warmup Train [38][170/3239]	Time 0.596 (0.596)	Data 0.001 (0.073)	Loss 4.0031 (4.0275)	Top-1 acc 28.906 (30.636)	Top-5 acc 55.078 (53.897)	lr 0.00067
Warmup Train [38][180/3239]	Time 0.570 (0.591)	Data 0.001 (0.069)	Loss 3.8741 (4.0264)	Top-1 acc 34.766 (30.687)	Top-5 acc 57.422 (53.934)	lr 0.00067
Warmup Train [38][190/3239]	Time 0.512 (0.586)	Data 0.001 (0.066)	Loss 4.2396 (4.0298)	Top-1 acc 25.391 (30.638)	Top-5 acc 51.172 (53.906)	lr 0.00066
Warmup Train [38][200/3239]	Time 0.577 (0.583)	Data 0.001 (0.063)	Loss 3.9391 (4.0269)	Top-1 acc 33.594 (30.729)	Top-5 acc 53.125 (53.982)	lr 0.00066
Warmup Train [38][210/3239]	Time 0.516 (0.579)	Data 0.001 (0.060)	Loss 4.0774 (4.0272)	Top-1 acc 29.688 (30.728)	Top-5 acc 57.812 (53.991)	lr 0.00066
Warmup Train [38][220/3239]	Time 0.324 (0.575)	Data 0.001 (0.058)	Loss 3.9072 (4.0256)	Top-1 acc 30.078 (30.778)	Top-5 acc 57.422 (54.049)	lr 0.00066
Warmup Train [38][230/3239]	Time 0.633 (0.572)	Data 0.001 (0.056)	Loss 4.2256 (4.0278)	Top-1 acc 25.781 (30.726)	Top-5 acc 51.953 (53.984)	lr 0.00066
Warmup Train [38][240/3239]	Time 0.503 (0.570)	Data 0.001 (0.054)	Loss 4.0528 (4.0287)	Top-1 acc 31.250 (30.676)	Top-5 acc 53.906 (53.978)	lr 0.00066
Warmup Train [38][250/3239]	Time 0.452 (0.566)	Data 0.001 (0.051)	Loss 3.8868 (4.0240)	Top-1 acc 35.156 (30.744)	Top-5 acc 58.203 (54.121)	lr 0.00066
Warmup Train [38][260/3239]	Time 0.527 (0.564)	Data 0.002 (0.050)	Loss 4.0427 (4.0230)	Top-1 acc 28.906 (30.732)	Top-5 acc 51.562 (54.134)	lr 0.00065
Warmup Train [38][270/3239]	Time 0.567 (0.562)	Data 0.001 (0.048)	Loss 3.7289 (4.0230)	Top-1 acc 39.062 (30.714)	Top-5 acc 58.984 (54.154)	lr 0.00065
Warmup Train [38][280/3239]	Time 0.502 (0.561)	Data 0.001 (0.047)	Loss 4.0395 (4.0223)	Top-1 acc 33.203 (30.751)	Top-5 acc 57.812 (54.194)	lr 0.00065
Warmup Train [38][290/3239]	Time 0.582 (0.559)	Data 0.001 (0.045)	Loss 3.9007 (4.0202)	Top-1 acc 30.469 (30.744)	Top-5 acc 55.859 (54.223)	lr 0.00065
Warmup Train [38][300/3239]	Time 0.536 (0.558)	Data 0.001 (0.044)	Loss 3.8329 (4.0195)	Top-1 acc 33.984 (30.774)	Top-5 acc 55.469 (54.233)	lr 0.00065
Warmup Train [38][310/3239]	Time 0.636 (0.557)	Data 0.001 (0.043)	Loss 4.0127 (4.0196)	Top-1 acc 29.688 (30.759)	Top-5 acc 55.859 (54.248)	lr 0.00065
Warmup Train [38][320/3239]	Time 0.630 (0.556)	Data 0.001 (0.042)	Loss 4.0357 (4.0203)	Top-1 acc 31.250 (30.758)	Top-5 acc 54.297 (54.235)	lr 0.00065
Warmup Train [38][330/3239]	Time 0.485 (0.554)	Data 0.001 (0.040)	Loss 4.1610 (4.0216)	Top-1 acc 29.688 (30.743)	Top-5 acc 48.828 (54.195)	lr 0.00064
Warmup Train [38][340/3239]	Time 0.390 (0.552)	Data 0.001 (0.039)	Loss 3.8443 (4.0224)	Top-1 acc 37.891 (30.748)	Top-5 acc 60.156 (54.189)	lr 0.00064
Warmup Train [38][350/3239]	Time 0.424 (0.550)	Data 0.001 (0.039)	Loss 3.9528 (4.0204)	Top-1 acc 30.469 (30.763)	Top-5 acc 51.562 (54.229)	lr 0.00064
Warmup Train [38][360/3239]	Time 0.533 (0.549)	Data 0.001 (0.038)	Loss 3.9248 (4.0211)	Top-1 acc 33.984 (30.774)	Top-5 acc 58.203 (54.215)	lr 0.00064
Warmup Train [38][370/3239]	Time 0.506 (0.548)	Data 0.001 (0.037)	Loss 4.0417 (4.0215)	Top-1 acc 29.688 (30.778)	Top-5 acc 54.297 (54.216)	lr 0.00064
Warmup Train [38][380/3239]	Time 0.455 (0.546)	Data 0.001 (0.036)	Loss 4.0378 (4.0213)	Top-1 acc 32.812 (30.782)	Top-5 acc 53.906 (54.224)	lr 0.00064
Warmup Train [38][390/3239]	Time 0.335 (0.542)	Data 0.001 (0.035)	Loss 3.9529 (4.0195)	Top-1 acc 33.984 (30.812)	Top-5 acc 54.688 (54.260)	lr 0.00064
Warmup Train [38][400/3239]	Time 0.367 (0.539)	Data 0.001 (0.035)	Loss 4.0069 (4.0197)	Top-1 acc 32.812 (30.780)	Top-5 acc 55.469 (54.240)	lr 0.00064
Warmup Train [38][410/3239]	Time 0.506 (0.535)	Data 0.001 (0.034)	Loss 4.1210 (4.0194)	Top-1 acc 28.516 (30.813)	Top-5 acc 49.219 (54.223)	lr 0.00063
Warmup Train [38][420/3239]	Time 0.545 (0.533)	Data 0.001 (0.034)	Loss 3.8647 (4.0185)	Top-1 acc 33.203 (30.820)	Top-5 acc 60.938 (54.265)	lr 0.00063
Warmup Train [38][430/3239]	Time 0.563 (0.532)	Data 0.001 (0.033)	Loss 3.9250 (4.0188)	Top-1 acc 30.469 (30.807)	Top-5 acc 54.688 (54.244)	lr 0.00063
Warmup Train [38][440/3239]	Time 0.415 (0.531)	Data 0.001 (0.032)	Loss 3.9979 (4.0177)	Top-1 acc 28.906 (30.839)	Top-5 acc 55.859 (54.263)	lr 0.00063
Warmup Train [38][450/3239]	Time 0.456 (0.531)	Data 0.001 (0.032)	Loss 4.0711 (4.0169)	Top-1 acc 31.250 (30.855)	Top-5 acc 49.219 (54.260)	lr 0.00063
Warmup Train [38][460/3239]	Time 0.376 (0.531)	Data 0.001 (0.031)	Loss 4.0758 (4.0165)	Top-1 acc 26.953 (30.859)	Top-5 acc 51.953 (54.268)	lr 0.00063
Warmup Train [38][470/3239]	Time 0.482 (0.530)	Data 0.001 (0.031)	Loss 3.9510 (4.0155)	Top-1 acc 30.469 (30.859)	Top-5 acc 54.688 (54.292)	lr 0.00063
Warmup Train [38][480/3239]	Time 0.458 (0.530)	Data 0.001 (0.030)	Loss 4.0468 (4.0159)	Top-1 acc 29.297 (30.848)	Top-5 acc 55.469 (54.281)	lr 0.00062
Warmup Train [38][490/3239]	Time 0.428 (0.530)	Data 0.001 (0.030)	Loss 4.0474 (4.0142)	Top-1 acc 33.203 (30.898)	Top-5 acc 51.953 (54.321)	lr 0.00062
Warmup Train [38][500/3239]	Time 0.497 (0.529)	Data 0.001 (0.029)	Loss 3.8722 (4.0146)	Top-1 acc 32.422 (30.867)	Top-5 acc 57.031 (54.292)	lr 0.00062
Warmup Train [38][510/3239]	Time 0.496 (0.529)	Data 0.001 (0.029)	Loss 4.0481 (4.0157)	Top-1 acc 31.250 (30.859)	Top-5 acc 53.516 (54.273)	lr 0.00062
Warmup Train [38][520/3239]	Time 0.515 (0.528)	Data 0.001 (0.028)	Loss 3.9906 (4.0152)	Top-1 acc 28.516 (30.880)	Top-5 acc 55.469 (54.285)	lr 0.00062
Warmup Train [38][530/3239]	Time 0.467 (0.528)	Data 0.001 (0.028)	Loss 4.1436 (4.0146)	Top-1 acc 28.125 (30.884)	Top-5 acc 50.000 (54.298)	lr 0.00062
Warmup Train [38][540/3239]	Time 0.490 (0.528)	Data 0.001 (0.027)	Loss 4.0578 (4.0140)	Top-1 acc 34.766 (30.911)	Top-5 acc 53.516 (54.327)	lr 0.00062
Warmup Train [38][550/3239]	Time 0.504 (0.527)	Data 0.001 (0.027)	Loss 4.0688 (4.0138)	Top-1 acc 28.906 (30.920)	Top-5 acc 50.391 (54.325)	lr 0.00062
Warmup Train [38][560/3239]	Time 0.558 (0.528)	Data 0.001 (0.027)	Loss 4.1743 (4.0138)	Top-1 acc 26.953 (30.930)	Top-5 acc 50.391 (54.316)	lr 0.00061
Warmup Train [38][570/3239]	Time 0.468 (0.527)	Data 0.001 (0.026)	Loss 4.0863 (4.0138)	Top-1 acc 29.688 (30.911)	Top-5 acc 50.781 (54.301)	lr 0.00061
Warmup Train [38][580/3239]	Time 0.408 (0.527)	Data 0.001 (0.026)	Loss 3.8485 (4.0128)	Top-1 acc 36.328 (30.917)	Top-5 acc 61.719 (54.333)	lr 0.00061
Warmup Train [38][590/3239]	Time 0.633 (0.527)	Data 0.001 (0.025)	Loss 4.1132 (4.0127)	Top-1 acc 28.516 (30.912)	Top-5 acc 53.906 (54.348)	lr 0.00061
Warmup Train [38][600/3239]	Time 0.492 (0.526)	Data 0.001 (0.025)	Loss 4.0999 (4.0123)	Top-1 acc 28.906 (30.911)	Top-5 acc 51.953 (54.359)	lr 0.00061
Warmup Train [38][610/3239]	Time 0.516 (0.527)	Data 0.001 (0.025)	Loss 3.9830 (4.0114)	Top-1 acc 33.594 (30.939)	Top-5 acc 59.766 (54.385)	lr 0.00061
Warmup Train [38][620/3239]	Time 0.597 (0.526)	Data 0.001 (0.025)	Loss 3.9515 (4.0123)	Top-1 acc 27.734 (30.901)	Top-5 acc 55.078 (54.357)	lr 0.00061
Warmup Train [38][630/3239]	Time 0.547 (0.525)	Data 0.001 (0.024)	Loss 4.0658 (4.0130)	Top-1 acc 29.688 (30.890)	Top-5 acc 52.734 (54.354)	lr 0.00060
Warmup Train [38][640/3239]	Time 0.401 (0.525)	Data 0.001 (0.024)	Loss 4.0280 (4.0127)	Top-1 acc 28.906 (30.883)	Top-5 acc 50.781 (54.347)	lr 0.00060
Warmup Train [38][650/3239]	Time 0.462 (0.524)	Data 0.001 (0.024)	Loss 3.9621 (4.0122)	Top-1 acc 27.344 (30.889)	Top-5 acc 57.812 (54.368)	lr 0.00060
Warmup Train [38][660/3239]	Time 0.585 (0.524)	Data 0.001 (0.023)	Loss 4.0114 (4.0112)	Top-1 acc 30.469 (30.894)	Top-5 acc 54.688 (54.393)	lr 0.00060
Warmup Train [38][670/3239]	Time 0.460 (0.522)	Data 0.001 (0.023)	Loss 4.1471 (4.0110)	Top-1 acc 28.906 (30.899)	Top-5 acc 50.781 (54.388)	lr 0.00060
Warmup Train [38][680/3239]	Time 0.316 (0.522)	Data 0.001 (0.023)	Loss 4.0139 (4.0107)	Top-1 acc 33.984 (30.893)	Top-5 acc 53.906 (54.402)	lr 0.00060
Warmup Train [38][690/3239]	Time 0.447 (0.522)	Data 0.001 (0.023)	Loss 3.9096 (4.0101)	Top-1 acc 32.812 (30.894)	Top-5 acc 57.422 (54.412)	lr 0.00060
Warmup Train [38][700/3239]	Time 0.602 (0.522)	Data 0.001 (0.023)	Loss 4.0149 (4.0095)	Top-1 acc 30.859 (30.915)	Top-5 acc 54.297 (54.426)	lr 0.00060
Warmup Train [38][710/3239]	Time 0.687 (0.522)	Data 0.001 (0.022)	Loss 4.0408 (4.0096)	Top-1 acc 28.125 (30.896)	Top-5 acc 51.953 (54.421)	lr 0.00059
Warmup Train [38][720/3239]	Time 0.468 (0.522)	Data 0.001 (0.022)	Loss 3.8060 (4.0090)	Top-1 acc 36.719 (30.913)	Top-5 acc 58.203 (54.436)	lr 0.00059
Warmup Train [38][730/3239]	Time 0.525 (0.522)	Data 0.001 (0.022)	Loss 3.9051 (4.0087)	Top-1 acc 32.422 (30.930)	Top-5 acc 56.641 (54.448)	lr 0.00059
Warmup Train [38][740/3239]	Time 0.519 (0.522)	Data 0.001 (0.022)	Loss 4.1031 (4.0091)	Top-1 acc 30.469 (30.917)	Top-5 acc 53.125 (54.442)	lr 0.00059
Warmup Train [38][750/3239]	Time 0.478 (0.522)	Data 0.001 (0.021)	Loss 3.9175 (4.0092)	Top-1 acc 30.078 (30.907)	Top-5 acc 55.859 (54.437)	lr 0.00059
Warmup Train [38][760/3239]	Time 0.501 (0.522)	Data 0.001 (0.021)	Loss 4.0291 (4.0090)	Top-1 acc 30.078 (30.905)	Top-5 acc 53.516 (54.440)	lr 0.00059
Warmup Train [38][770/3239]	Time 0.399 (0.522)	Data 0.001 (0.021)	Loss 3.9599 (4.0090)	Top-1 acc 34.375 (30.915)	Top-5 acc 57.812 (54.430)	lr 0.00059
Warmup Train [38][780/3239]	Time 0.454 (0.522)	Data 0.001 (0.021)	Loss 3.8978 (4.0085)	Top-1 acc 33.594 (30.919)	Top-5 acc 57.812 (54.447)	lr 0.00058
Warmup Train [38][790/3239]	Time 0.573 (0.522)	Data 0.001 (0.021)	Loss 4.2026 (4.0095)	Top-1 acc 28.125 (30.900)	Top-5 acc 51.953 (54.424)	lr 0.00058
Warmup Train [38][800/3239]	Time 0.590 (0.522)	Data 0.001 (0.021)	Loss 3.7628 (4.0091)	Top-1 acc 32.422 (30.890)	Top-5 acc 60.156 (54.429)	lr 0.00058
Warmup Train [38][810/3239]	Time 0.469 (0.522)	Data 0.001 (0.020)	Loss 3.7854 (4.0082)	Top-1 acc 35.938 (30.908)	Top-5 acc 60.547 (54.460)	lr 0.00058
Warmup Train [38][820/3239]	Time 0.424 (0.522)	Data 0.001 (0.020)	Loss 4.0046 (4.0082)	Top-1 acc 28.906 (30.896)	Top-5 acc 54.297 (54.446)	lr 0.00058
Warmup Train [38][830/3239]	Time 0.589 (0.522)	Data 0.001 (0.020)	Loss 4.1015 (4.0082)	Top-1 acc 31.250 (30.904)	Top-5 acc 52.344 (54.439)	lr 0.00058
Warmup Train [38][840/3239]	Time 0.557 (0.522)	Data 0.001 (0.020)	Loss 4.1118 (4.0077)	Top-1 acc 28.906 (30.919)	Top-5 acc 50.000 (54.462)	lr 0.00058
Warmup Train [38][850/3239]	Time 0.518 (0.521)	Data 0.001 (0.020)	Loss 4.0651 (4.0076)	Top-1 acc 27.734 (30.923)	Top-5 acc 51.562 (54.468)	lr 0.00058
Warmup Train [38][860/3239]	Time 0.512 (0.521)	Data 0.001 (0.020)	Loss 3.9536 (4.0079)	Top-1 acc 28.906 (30.926)	Top-5 acc 54.688 (54.447)	lr 0.00057
Warmup Train [38][870/3239]	Time 0.439 (0.521)	Data 0.001 (0.019)	Loss 3.7351 (4.0068)	Top-1 acc 33.984 (30.942)	Top-5 acc 60.156 (54.471)	lr 0.00057
Warmup Train [38][880/3239]	Time 0.152 (0.521)	Data 0.001 (0.019)	Loss 3.9642 (4.0071)	Top-1 acc 29.297 (30.936)	Top-5 acc 56.250 (54.465)	lr 0.00057
Warmup Train [38][890/3239]	Time 0.412 (0.520)	Data 0.001 (0.019)	Loss 4.0019 (4.0068)	Top-1 acc 28.906 (30.936)	Top-5 acc 54.297 (54.459)	lr 0.00057
Warmup Train [38][900/3239]	Time 0.549 (0.520)	Data 0.001 (0.019)	Loss 3.8933 (4.0060)	Top-1 acc 31.250 (30.960)	Top-5 acc 54.297 (54.484)	lr 0.00057
Warmup Train [38][910/3239]	Time 0.574 (0.520)	Data 0.001 (0.019)	Loss 3.9748 (4.0060)	Top-1 acc 26.953 (30.959)	Top-5 acc 55.859 (54.481)	lr 0.00057
Warmup Train [38][920/3239]	Time 0.496 (0.519)	Data 0.001 (0.019)	Loss 4.0818 (4.0060)	Top-1 acc 30.859 (30.956)	Top-5 acc 53.906 (54.478)	lr 0.00057
Warmup Train [38][930/3239]	Time 0.550 (0.519)	Data 0.001 (0.019)	Loss 3.9159 (4.0068)	Top-1 acc 31.250 (30.941)	Top-5 acc 57.031 (54.458)	lr 0.00057
Warmup Train [38][940/3239]	Time 0.511 (0.519)	Data 0.001 (0.018)	Loss 3.9556 (4.0076)	Top-1 acc 32.422 (30.928)	Top-5 acc 54.297 (54.443)	lr 0.00056
Warmup Train [38][950/3239]	Time 0.475 (0.519)	Data 0.001 (0.018)	Loss 3.9071 (4.0074)	Top-1 acc 36.328 (30.948)	Top-5 acc 58.984 (54.450)	lr 0.00056
Warmup Train [38][960/3239]	Time 0.697 (0.519)	Data 0.001 (0.018)	Loss 3.9944 (4.0078)	Top-1 acc 33.203 (30.937)	Top-5 acc 57.812 (54.443)	lr 0.00056
Warmup Train [38][970/3239]	Time 0.613 (0.519)	Data 0.001 (0.018)	Loss 3.9215 (4.0077)	Top-1 acc 30.078 (30.950)	Top-5 acc 59.375 (54.455)	lr 0.00056
Warmup Train [38][980/3239]	Time 0.495 (0.519)	Data 0.001 (0.018)	Loss 4.0785 (4.0078)	Top-1 acc 31.641 (30.950)	Top-5 acc 52.344 (54.448)	lr 0.00056
Warmup Train [38][990/3239]	Time 0.525 (0.519)	Data 0.001 (0.018)	Loss 3.9017 (4.0079)	Top-1 acc 35.156 (30.949)	Top-5 acc 57.812 (54.452)	lr 0.00056
Warmup Train [38][1000/3239]	Time 0.528 (0.519)	Data 0.001 (0.018)	Loss 4.1158 (4.0073)	Top-1 acc 27.344 (30.967)	Top-5 acc 52.344 (54.456)	lr 0.00056
Warmup Train [38][1010/3239]	Time 0.629 (0.519)	Data 0.001 (0.017)	Loss 4.0406 (4.0076)	Top-1 acc 28.906 (30.965)	Top-5 acc 51.562 (54.459)	lr 0.00056
Warmup Train [38][1020/3239]	Time 0.450 (0.519)	Data 0.001 (0.017)	Loss 3.8828 (4.0071)	Top-1 acc 28.125 (30.970)	Top-5 acc 57.812 (54.466)	lr 0.00055
Warmup Train [38][1030/3239]	Time 0.515 (0.519)	Data 0.001 (0.017)	Loss 3.9601 (4.0073)	Top-1 acc 29.297 (30.967)	Top-5 acc 56.250 (54.462)	lr 0.00055
Warmup Train [38][1040/3239]	Time 0.537 (0.519)	Data 0.001 (0.017)	Loss 4.2797 (4.0078)	Top-1 acc 29.688 (30.965)	Top-5 acc 50.000 (54.457)	lr 0.00055
Warmup Train [38][1050/3239]	Time 0.487 (0.519)	Data 0.001 (0.017)	Loss 4.0344 (4.0083)	Top-1 acc 33.203 (30.950)	Top-5 acc 58.203 (54.451)	lr 0.00055
Warmup Train [38][1060/3239]	Time 0.349 (0.519)	Data 0.001 (0.017)	Loss 3.9987 (4.0087)	Top-1 acc 30.859 (30.941)	Top-5 acc 53.906 (54.445)	lr 0.00055
Warmup Train [38][1070/3239]	Time 0.495 (0.519)	Data 0.001 (0.017)	Loss 4.0338 (4.0085)	Top-1 acc 29.688 (30.953)	Top-5 acc 53.125 (54.449)	lr 0.00055
Warmup Train [38][1080/3239]	Time 0.519 (0.519)	Data 0.001 (0.017)	Loss 3.9107 (4.0082)	Top-1 acc 36.719 (30.964)	Top-5 acc 57.812 (54.462)	lr 0.00055
Warmup Train [38][1090/3239]	Time 0.336 (0.518)	Data 0.001 (0.017)	Loss 4.1390 (4.0082)	Top-1 acc 30.078 (30.968)	Top-5 acc 51.172 (54.456)	lr 0.00055
Warmup Train [38][1100/3239]	Time 0.411 (0.518)	Data 0.001 (0.017)	Loss 4.1649 (4.0079)	Top-1 acc 29.688 (30.974)	Top-5 acc 53.125 (54.467)	lr 0.00054
Warmup Train [38][1110/3239]	Time 0.594 (0.518)	Data 0.001 (0.017)	Loss 4.1812 (4.0082)	Top-1 acc 24.219 (30.961)	Top-5 acc 51.953 (54.453)	lr 0.00054
Warmup Train [38][1120/3239]	Time 0.466 (0.518)	Data 0.001 (0.016)	Loss 3.7828 (4.0082)	Top-1 acc 34.375 (30.964)	Top-5 acc 59.375 (54.457)	lr 0.00054
Warmup Train [38][1130/3239]	Time 0.366 (0.518)	Data 0.001 (0.016)	Loss 3.8250 (4.0080)	Top-1 acc 33.594 (30.964)	Top-5 acc 59.766 (54.467)	lr 0.00054
Warmup Train [38][1140/3239]	Time 0.657 (0.518)	Data 0.001 (0.016)	Loss 3.8197 (4.0081)	Top-1 acc 35.547 (30.961)	Top-5 acc 61.328 (54.466)	lr 0.00054
Warmup Train [38][1150/3239]	Time 0.480 (0.518)	Data 0.001 (0.016)	Loss 4.0106 (4.0088)	Top-1 acc 31.641 (30.948)	Top-5 acc 52.344 (54.454)	lr 0.00054
Warmup Train [38][1160/3239]	Time 0.254 (0.518)	Data 0.001 (0.016)	Loss 4.0800 (4.0086)	Top-1 acc 28.125 (30.948)	Top-5 acc 53.516 (54.456)	lr 0.00054
Warmup Train [38][1170/3239]	Time 0.316 (0.517)	Data 0.001 (0.016)	Loss 4.0370 (4.0084)	Top-1 acc 31.641 (30.957)	Top-5 acc 53.906 (54.458)	lr 0.00054
Warmup Train [38][1180/3239]	Time 0.489 (0.517)	Data 0.001 (0.016)	Loss 3.9422 (4.0080)	Top-1 acc 32.422 (30.963)	Top-5 acc 57.031 (54.467)	lr 0.00053
Warmup Train [38][1190/3239]	Time 0.588 (0.517)	Data 0.004 (0.016)	Loss 3.6043 (4.0073)	Top-1 acc 34.766 (30.973)	Top-5 acc 64.844 (54.476)	lr 0.00053
Warmup Train [38][1200/3239]	Time 0.426 (0.517)	Data 0.001 (0.016)	Loss 3.9538 (4.0074)	Top-1 acc 32.812 (30.970)	Top-5 acc 56.250 (54.474)	lr 0.00053
Warmup Train [38][1210/3239]	Time 0.584 (0.517)	Data 0.001 (0.016)	Loss 3.9346 (4.0072)	Top-1 acc 31.641 (30.979)	Top-5 acc 58.203 (54.484)	lr 0.00053
Warmup Train [38][1220/3239]	Time 0.511 (0.517)	Data 0.001 (0.016)	Loss 4.0561 (4.0073)	Top-1 acc 30.859 (30.974)	Top-5 acc 53.906 (54.478)	lr 0.00053
Warmup Train [38][1230/3239]	Time 0.579 (0.517)	Data 0.001 (0.016)	Loss 4.1193 (4.0073)	Top-1 acc 28.906 (30.972)	Top-5 acc 52.344 (54.483)	lr 0.00053
Warmup Train [38][1240/3239]	Time 0.380 (0.517)	Data 0.001 (0.016)	Loss 3.8906 (4.0074)	Top-1 acc 32.031 (30.965)	Top-5 acc 56.250 (54.477)	lr 0.00053
Warmup Train [38][1250/3239]	Time 0.617 (0.517)	Data 0.001 (0.015)	Loss 4.3447 (4.0072)	Top-1 acc 23.828 (30.978)	Top-5 acc 46.094 (54.486)	lr 0.00053
Warmup Train [38][1260/3239]	Time 0.505 (0.517)	Data 0.001 (0.015)	Loss 4.0043 (4.0071)	Top-1 acc 35.938 (30.980)	Top-5 acc 59.766 (54.495)	lr 0.00052
Warmup Train [38][1270/3239]	Time 0.652 (0.518)	Data 0.001 (0.015)	Loss 4.1428 (4.0069)	Top-1 acc 27.344 (30.984)	Top-5 acc 53.516 (54.508)	lr 0.00052
Warmup Train [38][1280/3239]	Time 0.519 (0.518)	Data 0.001 (0.015)	Loss 4.1166 (4.0066)	Top-1 acc 28.906 (30.985)	Top-5 acc 52.734 (54.512)	lr 0.00052
Warmup Train [38][1290/3239]	Time 0.667 (0.518)	Data 0.001 (0.015)	Loss 4.0596 (4.0071)	Top-1 acc 30.469 (30.986)	Top-5 acc 51.953 (54.500)	lr 0.00052
Warmup Train [38][1300/3239]	Time 0.495 (0.518)	Data 0.001 (0.015)	Loss 3.6684 (4.0069)	Top-1 acc 39.453 (30.989)	Top-5 acc 62.891 (54.501)	lr 0.00052
Warmup Train [38][1310/3239]	Time 0.510 (0.518)	Data 0.001 (0.015)	Loss 4.0314 (4.0070)	Top-1 acc 30.469 (30.985)	Top-5 acc 52.734 (54.497)	lr 0.00052
Warmup Train [38][1320/3239]	Time 0.402 (0.518)	Data 0.001 (0.015)	Loss 4.0203 (4.0070)	Top-1 acc 27.734 (30.985)	Top-5 acc 53.125 (54.500)	lr 0.00052
Warmup Train [38][1330/3239]	Time 0.513 (0.517)	Data 0.001 (0.015)	Loss 4.1957 (4.0070)	Top-1 acc 25.781 (30.989)	Top-5 acc 49.609 (54.493)	lr 0.00052
Warmup Train [38][1340/3239]	Time 0.613 (0.517)	Data 0.001 (0.015)	Loss 4.1427 (4.0072)	Top-1 acc 30.078 (30.986)	Top-5 acc 53.906 (54.490)	lr 0.00051
Warmup Train [38][1350/3239]	Time 0.602 (0.517)	Data 0.001 (0.015)	Loss 3.7533 (4.0071)	Top-1 acc 35.938 (30.988)	Top-5 acc 62.500 (54.492)	lr 0.00051
Warmup Train [38][1360/3239]	Time 0.498 (0.517)	Data 0.001 (0.015)	Loss 4.0821 (4.0069)	Top-1 acc 31.250 (30.989)	Top-5 acc 53.125 (54.495)	lr 0.00051
Warmup Train [38][1370/3239]	Time 0.490 (0.517)	Data 0.001 (0.014)	Loss 4.0871 (4.0071)	Top-1 acc 30.469 (30.988)	Top-5 acc 51.562 (54.494)	lr 0.00051
Warmup Train [38][1380/3239]	Time 0.587 (0.517)	Data 0.001 (0.014)	Loss 3.9459 (4.0076)	Top-1 acc 32.812 (30.975)	Top-5 acc 59.375 (54.485)	lr 0.00051
Warmup Train [38][1390/3239]	Time 0.559 (0.517)	Data 0.001 (0.014)	Loss 4.1150 (4.0074)	Top-1 acc 26.953 (30.974)	Top-5 acc 54.688 (54.487)	lr 0.00051
Warmup Train [38][1400/3239]	Time 0.679 (0.517)	Data 0.001 (0.014)	Loss 3.9866 (4.0077)	Top-1 acc 32.812 (30.971)	Top-5 acc 56.641 (54.494)	lr 0.00051
Warmup Train [38][1410/3239]	Time 0.563 (0.517)	Data 0.001 (0.014)	Loss 3.9984 (4.0078)	Top-1 acc 33.203 (30.970)	Top-5 acc 57.812 (54.495)	lr 0.00051
Warmup Train [38][1420/3239]	Time 0.475 (0.517)	Data 0.001 (0.014)	Loss 3.9596 (4.0078)	Top-1 acc 34.375 (30.969)	Top-5 acc 54.688 (54.499)	lr 0.00050
Warmup Train [38][1430/3239]	Time 0.478 (0.516)	Data 0.001 (0.014)	Loss 3.8904 (4.0074)	Top-1 acc 32.422 (30.975)	Top-5 acc 57.031 (54.506)	lr 0.00050
Warmup Train [38][1440/3239]	Time 0.534 (0.516)	Data 0.001 (0.014)	Loss 4.0427 (4.0075)	Top-1 acc 31.250 (30.974)	Top-5 acc 51.562 (54.501)	lr 0.00050
Warmup Train [38][1450/3239]	Time 0.488 (0.516)	Data 0.001 (0.014)	Loss 3.8956 (4.0071)	Top-1 acc 27.734 (30.974)	Top-5 acc 54.688 (54.511)	lr 0.00050
Warmup Train [38][1460/3239]	Time 0.539 (0.516)	Data 0.001 (0.014)	Loss 3.8789 (4.0073)	Top-1 acc 33.594 (30.968)	Top-5 acc 55.859 (54.502)	lr 0.00050
Warmup Train [38][1470/3239]	Time 0.403 (0.516)	Data 0.001 (0.014)	Loss 3.9673 (4.0072)	Top-1 acc 33.594 (30.976)	Top-5 acc 54.688 (54.506)	lr 0.00050
Warmup Train [38][1480/3239]	Time 0.397 (0.516)	Data 0.001 (0.014)	Loss 3.9938 (4.0073)	Top-1 acc 31.250 (30.981)	Top-5 acc 55.859 (54.511)	lr 0.00050
Warmup Train [38][1490/3239]	Time 0.586 (0.516)	Data 0.001 (0.014)	Loss 4.0730 (4.0071)	Top-1 acc 28.125 (30.987)	Top-5 acc 51.562 (54.519)	lr 0.00050
Warmup Train [38][1500/3239]	Time 0.446 (0.516)	Data 0.001 (0.014)	Loss 4.2222 (4.0065)	Top-1 acc 26.953 (30.994)	Top-5 acc 53.125 (54.537)	lr 0.00049
Warmup Train [38][1510/3239]	Time 0.743 (0.516)	Data 0.001 (0.014)	Loss 4.0650 (4.0070)	Top-1 acc 31.641 (30.992)	Top-5 acc 57.422 (54.528)	lr 0.00049
Warmup Train [38][1520/3239]	Time 0.553 (0.516)	Data 0.002 (0.014)	Loss 4.0658 (4.0070)	Top-1 acc 28.125 (30.985)	Top-5 acc 48.828 (54.520)	lr 0.00049
Warmup Train [38][1530/3239]	Time 0.538 (0.516)	Data 0.001 (0.014)	Loss 3.9278 (4.0068)	Top-1 acc 27.734 (30.985)	Top-5 acc 56.641 (54.525)	lr 0.00049
Warmup Train [38][1540/3239]	Time 0.501 (0.516)	Data 0.001 (0.013)	Loss 4.1949 (4.0071)	Top-1 acc 28.125 (30.981)	Top-5 acc 46.484 (54.520)	lr 0.00049
Warmup Train [38][1550/3239]	Time 0.567 (0.516)	Data 0.001 (0.013)	Loss 3.8278 (4.0077)	Top-1 acc 37.891 (30.976)	Top-5 acc 58.203 (54.512)	lr 0.00049
Warmup Train [38][1560/3239]	Time 0.419 (0.516)	Data 0.001 (0.013)	Loss 3.8769 (4.0076)	Top-1 acc 29.688 (30.975)	Top-5 acc 56.250 (54.515)	lr 0.00049
Warmup Train [38][1570/3239]	Time 0.336 (0.516)	Data 0.001 (0.013)	Loss 3.9170 (4.0076)	Top-1 acc 33.203 (30.980)	Top-5 acc 55.859 (54.518)	lr 0.00049
Warmup Train [38][1580/3239]	Time 0.425 (0.516)	Data 0.001 (0.013)	Loss 4.0430 (4.0074)	Top-1 acc 30.078 (30.987)	Top-5 acc 55.859 (54.518)	lr 0.00049
Warmup Train [38][1590/3239]	Time 0.647 (0.516)	Data 0.001 (0.013)	Loss 4.1696 (4.0075)	Top-1 acc 27.734 (30.991)	Top-5 acc 52.734 (54.517)	lr 0.00048
Warmup Train [38][1600/3239]	Time 0.438 (0.516)	Data 0.001 (0.013)	Loss 4.2466 (4.0069)	Top-1 acc 26.953 (31.006)	Top-5 acc 49.609 (54.531)	lr 0.00048
Warmup Train [38][1610/3239]	Time 0.437 (0.516)	Data 0.001 (0.013)	Loss 4.0394 (4.0070)	Top-1 acc 32.422 (31.002)	Top-5 acc 53.906 (54.530)	lr 0.00048
Warmup Train [38][1620/3239]	Time 0.655 (0.516)	Data 0.001 (0.013)	Loss 3.9699 (4.0071)	Top-1 acc 32.031 (31.005)	Top-5 acc 56.250 (54.531)	lr 0.00048
Warmup Train [38][1630/3239]	Time 0.318 (0.516)	Data 0.001 (0.013)	Loss 4.0521 (4.0069)	Top-1 acc 31.250 (31.004)	Top-5 acc 56.250 (54.536)	lr 0.00048
Warmup Train [38][1640/3239]	Time 0.553 (0.515)	Data 0.001 (0.013)	Loss 3.9047 (4.0067)	Top-1 acc 35.156 (31.010)	Top-5 acc 55.078 (54.541)	lr 0.00048
Warmup Train [38][1650/3239]	Time 0.481 (0.515)	Data 0.001 (0.013)	Loss 3.8976 (4.0066)	Top-1 acc 32.031 (31.016)	Top-5 acc 54.688 (54.546)	lr 0.00048
Warmup Train [38][1660/3239]	Time 0.363 (0.515)	Data 0.001 (0.013)	Loss 4.1563 (4.0063)	Top-1 acc 28.906 (31.017)	Top-5 acc 51.953 (54.550)	lr 0.00048
Warmup Train [38][1670/3239]	Time 0.572 (0.515)	Data 0.001 (0.013)	Loss 3.7841 (4.0065)	Top-1 acc 38.672 (31.016)	Top-5 acc 60.156 (54.544)	lr 0.00047
Warmup Train [38][1680/3239]	Time 0.568 (0.515)	Data 0.001 (0.013)	Loss 3.9919 (4.0065)	Top-1 acc 32.422 (31.011)	Top-5 acc 55.859 (54.539)	lr 0.00047
Warmup Train [38][1690/3239]	Time 0.535 (0.515)	Data 0.001 (0.013)	Loss 3.9129 (4.0059)	Top-1 acc 31.250 (31.016)	Top-5 acc 58.203 (54.552)	lr 0.00047
Warmup Train [38][1700/3239]	Time 0.559 (0.515)	Data 0.001 (0.013)	Loss 4.0760 (4.0058)	Top-1 acc 26.953 (31.015)	Top-5 acc 51.172 (54.548)	lr 0.00047
Warmup Train [38][1710/3239]	Time 0.788 (0.515)	Data 0.001 (0.013)	Loss 4.0757 (4.0060)	Top-1 acc 28.906 (31.014)	Top-5 acc 53.516 (54.540)	lr 0.00047
Warmup Train [38][1720/3239]	Time 0.391 (0.515)	Data 0.001 (0.013)	Loss 3.8029 (4.0059)	Top-1 acc 34.766 (31.011)	Top-5 acc 60.156 (54.550)	lr 0.00047
Warmup Train [38][1730/3239]	Time 0.351 (0.515)	Data 0.001 (0.013)	Loss 4.0679 (4.0060)	Top-1 acc 28.125 (31.007)	Top-5 acc 50.391 (54.548)	lr 0.00047
Warmup Train [38][1740/3239]	Time 0.649 (0.515)	Data 0.002 (0.013)	Loss 3.8847 (4.0058)	Top-1 acc 31.641 (31.010)	Top-5 acc 59.766 (54.554)	lr 0.00047
Warmup Train [38][1750/3239]	Time 0.581 (0.515)	Data 0.001 (0.013)	Loss 4.1458 (4.0058)	Top-1 acc 29.688 (31.012)	Top-5 acc 53.906 (54.555)	lr 0.00047
Warmup Train [38][1760/3239]	Time 0.485 (0.515)	Data 0.001 (0.013)	Loss 4.0417 (4.0057)	Top-1 acc 30.469 (31.009)	Top-5 acc 55.859 (54.556)	lr 0.00046
Warmup Train [38][1770/3239]	Time 0.471 (0.515)	Data 0.001 (0.013)	Loss 4.0309 (4.0057)	Top-1 acc 30.469 (31.016)	Top-5 acc 56.250 (54.553)	lr 0.00046
Warmup Train [38][1780/3239]	Time 0.337 (0.515)	Data 0.001 (0.013)	Loss 4.1793 (4.0062)	Top-1 acc 29.297 (31.011)	Top-5 acc 50.000 (54.544)	lr 0.00046
Warmup Train [38][1790/3239]	Time 0.352 (0.515)	Data 0.001 (0.013)	Loss 4.0723 (4.0060)	Top-1 acc 32.812 (31.018)	Top-5 acc 51.172 (54.548)	lr 0.00046
Warmup Train [38][1800/3239]	Time 0.551 (0.515)	Data 0.001 (0.013)	Loss 3.9073 (4.0058)	Top-1 acc 35.938 (31.027)	Top-5 acc 60.547 (54.558)	lr 0.00046
Warmup Train [38][1810/3239]	Time 0.532 (0.515)	Data 0.001 (0.013)	Loss 3.8125 (4.0058)	Top-1 acc 31.250 (31.029)	Top-5 acc 55.469 (54.552)	lr 0.00046
Warmup Train [38][1820/3239]	Time 0.493 (0.515)	Data 0.001 (0.013)	Loss 4.1779 (4.0059)	Top-1 acc 29.297 (31.031)	Top-5 acc 54.297 (54.553)	lr 0.00046
Warmup Train [38][1830/3239]	Time 0.498 (0.515)	Data 0.001 (0.013)	Loss 4.0060 (4.0061)	Top-1 acc 27.734 (31.021)	Top-5 acc 54.297 (54.554)	lr 0.00046
Warmup Train [38][1840/3239]	Time 0.414 (0.515)	Data 0.001 (0.013)	Loss 4.0329 (4.0062)	Top-1 acc 26.562 (31.013)	Top-5 acc 55.469 (54.553)	lr 0.00045
Warmup Train [38][1850/3239]	Time 0.544 (0.515)	Data 0.001 (0.013)	Loss 4.0253 (4.0058)	Top-1 acc 29.688 (31.012)	Top-5 acc 55.469 (54.563)	lr 0.00045
Warmup Train [38][1860/3239]	Time 0.538 (0.515)	Data 0.001 (0.012)	Loss 4.0868 (4.0059)	Top-1 acc 30.078 (31.014)	Top-5 acc 51.953 (54.559)	lr 0.00045
Warmup Train [38][1870/3239]	Time 0.501 (0.515)	Data 0.001 (0.012)	Loss 4.2285 (4.0060)	Top-1 acc 28.125 (31.019)	Top-5 acc 49.219 (54.558)	lr 0.00045
Warmup Train [38][1880/3239]	Time 0.408 (0.515)	Data 0.001 (0.012)	Loss 4.0563 (4.0061)	Top-1 acc 32.031 (31.018)	Top-5 acc 54.297 (54.558)	lr 0.00045
Warmup Train [38][1890/3239]	Time 0.473 (0.515)	Data 0.001 (0.012)	Loss 4.0659 (4.0060)	Top-1 acc 29.688 (31.012)	Top-5 acc 51.172 (54.560)	lr 0.00045
Warmup Train [38][1900/3239]	Time 0.475 (0.515)	Data 0.001 (0.012)	Loss 4.0906 (4.0065)	Top-1 acc 34.766 (31.010)	Top-5 acc 53.516 (54.549)	lr 0.00045
Warmup Train [38][1910/3239]	Time 0.502 (0.515)	Data 0.001 (0.012)	Loss 3.9111 (4.0063)	Top-1 acc 32.422 (31.019)	Top-5 acc 58.594 (54.555)	lr 0.00045
Warmup Train [38][1920/3239]	Time 0.609 (0.515)	Data 0.001 (0.012)	Loss 3.7621 (4.0064)	Top-1 acc 32.422 (31.016)	Top-5 acc 60.938 (54.553)	lr 0.00045
Warmup Train [38][1930/3239]	Time 0.476 (0.514)	Data 0.001 (0.012)	Loss 3.8710 (4.0063)	Top-1 acc 32.422 (31.013)	Top-5 acc 58.203 (54.553)	lr 0.00044
Warmup Train [38][1940/3239]	Time 0.439 (0.514)	Data 0.001 (0.012)	Loss 3.9884 (4.0064)	Top-1 acc 32.422 (31.011)	Top-5 acc 53.516 (54.551)	lr 0.00044
Warmup Train [38][1950/3239]	Time 0.482 (0.514)	Data 0.001 (0.012)	Loss 4.1163 (4.0065)	Top-1 acc 29.688 (31.012)	Top-5 acc 53.516 (54.550)	lr 0.00044
Warmup Train [38][1960/3239]	Time 0.568 (0.514)	Data 0.001 (0.012)	Loss 4.0589 (4.0064)	Top-1 acc 27.734 (31.009)	Top-5 acc 53.516 (54.549)	lr 0.00044
Warmup Train [38][1970/3239]	Time 0.396 (0.514)	Data 0.001 (0.012)	Loss 4.0751 (4.0063)	Top-1 acc 26.953 (31.012)	Top-5 acc 53.906 (54.554)	lr 0.00044
Warmup Train [38][1980/3239]	Time 0.507 (0.514)	Data 0.001 (0.012)	Loss 3.9824 (4.0065)	Top-1 acc 33.594 (31.006)	Top-5 acc 55.469 (54.552)	lr 0.00044
Warmup Train [38][1990/3239]	Time 0.653 (0.514)	Data 0.001 (0.012)	Loss 4.0298 (4.0063)	Top-1 acc 30.859 (31.006)	Top-5 acc 54.688 (54.557)	lr 0.00044
Warmup Train [38][2000/3239]	Time 0.536 (0.514)	Data 0.001 (0.012)	Loss 3.9537 (4.0061)	Top-1 acc 32.422 (31.003)	Top-5 acc 54.297 (54.559)	lr 0.00044
Warmup Train [38][2010/3239]	Time 0.478 (0.514)	Data 0.001 (0.012)	Loss 3.7428 (4.0061)	Top-1 acc 35.156 (31.003)	Top-5 acc 62.109 (54.559)	lr 0.00044
Warmup Train [38][2020/3239]	Time 0.471 (0.514)	Data 0.001 (0.012)	Loss 3.9316 (4.0061)	Top-1 acc 29.688 (31.001)	Top-5 acc 53.125 (54.555)	lr 0.00043
Warmup Train [38][2030/3239]	Time 0.638 (0.514)	Data 0.001 (0.012)	Loss 4.0056 (4.0055)	Top-1 acc 30.469 (31.014)	Top-5 acc 53.125 (54.567)	lr 0.00043
Warmup Train [38][2040/3239]	Time 0.632 (0.514)	Data 0.001 (0.012)	Loss 3.8472 (4.0054)	Top-1 acc 35.547 (31.017)	Top-5 acc 59.375 (54.572)	lr 0.00043
Warmup Train [38][2050/3239]	Time 0.617 (0.514)	Data 0.001 (0.012)	Loss 3.9031 (4.0052)	Top-1 acc 36.328 (31.026)	Top-5 acc 56.641 (54.577)	lr 0.00043
Warmup Train [38][2060/3239]	Time 0.400 (0.514)	Data 0.001 (0.012)	Loss 4.1601 (4.0054)	Top-1 acc 29.688 (31.030)	Top-5 acc 48.438 (54.572)	lr 0.00043
Warmup Train [38][2070/3239]	Time 0.358 (0.514)	Data 0.001 (0.012)	Loss 4.0070 (4.0055)	Top-1 acc 27.734 (31.029)	Top-5 acc 55.859 (54.572)	lr 0.00043
Warmup Train [38][2080/3239]	Time 0.570 (0.514)	Data 0.001 (0.012)	Loss 3.9422 (4.0053)	Top-1 acc 30.078 (31.029)	Top-5 acc 57.031 (54.577)	lr 0.00043
Warmup Train [38][2090/3239]	Time 0.496 (0.514)	Data 0.001 (0.012)	Loss 3.9449 (4.0057)	Top-1 acc 32.422 (31.018)	Top-5 acc 53.906 (54.571)	lr 0.00043
Warmup Train [38][2100/3239]	Time 0.386 (0.514)	Data 0.001 (0.012)	Loss 4.2092 (4.0056)	Top-1 acc 30.859 (31.021)	Top-5 acc 53.516 (54.574)	lr 0.00043
Warmup Train [38][2110/3239]	Time 0.407 (0.514)	Data 0.001 (0.012)	Loss 3.9503 (4.0056)	Top-1 acc 32.031 (31.023)	Top-5 acc 53.516 (54.569)	lr 0.00042
Warmup Train [38][2120/3239]	Time 0.618 (0.514)	Data 0.001 (0.012)	Loss 3.9879 (4.0055)	Top-1 acc 33.203 (31.025)	Top-5 acc 55.469 (54.568)	lr 0.00042
Warmup Train [38][2130/3239]	Time 0.540 (0.514)	Data 0.001 (0.012)	Loss 4.0255 (4.0057)	Top-1 acc 29.688 (31.025)	Top-5 acc 53.906 (54.567)	lr 0.00042
Warmup Train [38][2140/3239]	Time 0.500 (0.514)	Data 0.001 (0.012)	Loss 3.9518 (4.0059)	Top-1 acc 31.250 (31.017)	Top-5 acc 55.859 (54.559)	lr 0.00042
Warmup Train [38][2150/3239]	Time 0.627 (0.514)	Data 0.001 (0.012)	Loss 4.2056 (4.0056)	Top-1 acc 25.000 (31.023)	Top-5 acc 48.047 (54.563)	lr 0.00042
Warmup Train [38][2160/3239]	Time 0.525 (0.514)	Data 0.001 (0.012)	Loss 3.9879 (4.0055)	Top-1 acc 32.422 (31.033)	Top-5 acc 51.562 (54.566)	lr 0.00042
Warmup Train [38][2170/3239]	Time 0.330 (0.514)	Data 0.001 (0.012)	Loss 4.2308 (4.0055)	Top-1 acc 26.172 (31.035)	Top-5 acc 51.562 (54.571)	lr 0.00042
Warmup Train [38][2180/3239]	Time 0.529 (0.514)	Data 0.001 (0.012)	Loss 3.7490 (4.0053)	Top-1 acc 37.109 (31.036)	Top-5 acc 61.719 (54.577)	lr 0.00042
Warmup Train [38][2190/3239]	Time 0.470 (0.514)	Data 0.001 (0.012)	Loss 3.9380 (4.0053)	Top-1 acc 28.125 (31.032)	Top-5 acc 57.422 (54.575)	lr 0.00042
Warmup Train [38][2200/3239]	Time 0.441 (0.513)	Data 0.001 (0.012)	Loss 3.9339 (4.0056)	Top-1 acc 33.203 (31.027)	Top-5 acc 55.859 (54.569)	lr 0.00041
Warmup Train [38][2210/3239]	Time 0.481 (0.514)	Data 0.001 (0.012)	Loss 3.9774 (4.0056)	Top-1 acc 33.203 (31.027)	Top-5 acc 54.297 (54.570)	lr 0.00041
Warmup Train [38][2220/3239]	Time 0.540 (0.514)	Data 0.001 (0.012)	Loss 3.7995 (4.0053)	Top-1 acc 35.547 (31.034)	Top-5 acc 57.031 (54.574)	lr 0.00041
Warmup Train [38][2230/3239]	Time 0.522 (0.514)	Data 0.001 (0.011)	Loss 4.0435 (4.0051)	Top-1 acc 32.422 (31.038)	Top-5 acc 54.297 (54.575)	lr 0.00041
Warmup Train [38][2240/3239]	Time 0.658 (0.514)	Data 0.001 (0.011)	Loss 3.9932 (4.0051)	Top-1 acc 33.594 (31.036)	Top-5 acc 58.203 (54.578)	lr 0.00041
Warmup Train [38][2250/3239]	Time 0.464 (0.514)	Data 0.001 (0.011)	Loss 3.9101 (4.0048)	Top-1 acc 34.766 (31.041)	Top-5 acc 54.297 (54.585)	lr 0.00041
Warmup Train [38][2260/3239]	Time 0.589 (0.514)	Data 0.001 (0.011)	Loss 4.0574 (4.0047)	Top-1 acc 32.031 (31.045)	Top-5 acc 53.906 (54.585)	lr 0.00041
Warmup Train [38][2270/3239]	Time 0.566 (0.514)	Data 0.001 (0.011)	Loss 4.0533 (4.0048)	Top-1 acc 30.859 (31.042)	Top-5 acc 54.688 (54.583)	lr 0.00041
Warmup Train [38][2280/3239]	Time 0.519 (0.514)	Data 0.001 (0.011)	Loss 3.9136 (4.0046)	Top-1 acc 33.594 (31.044)	Top-5 acc 55.469 (54.588)	lr 0.00041
Warmup Train [38][2290/3239]	Time 0.498 (0.514)	Data 0.001 (0.011)	Loss 4.1237 (4.0047)	Top-1 acc 32.031 (31.042)	Top-5 acc 52.344 (54.585)	lr 0.00040
Warmup Train [38][2300/3239]	Time 0.550 (0.514)	Data 0.001 (0.011)	Loss 4.1376 (4.0049)	Top-1 acc 28.125 (31.041)	Top-5 acc 52.734 (54.579)	lr 0.00040
Warmup Train [38][2310/3239]	Time 0.500 (0.514)	Data 0.001 (0.011)	Loss 4.2541 (4.0050)	Top-1 acc 29.688 (31.041)	Top-5 acc 46.484 (54.572)	lr 0.00040
Warmup Train [38][2320/3239]	Time 0.551 (0.514)	Data 0.001 (0.011)	Loss 3.8872 (4.0053)	Top-1 acc 29.297 (31.035)	Top-5 acc 53.906 (54.563)	lr 0.00040
Warmup Train [38][2330/3239]	Time 0.540 (0.514)	Data 0.001 (0.011)	Loss 4.0828 (4.0052)	Top-1 acc 26.172 (31.036)	Top-5 acc 52.734 (54.561)	lr 0.00040
Warmup Train [38][2340/3239]	Time 0.468 (0.514)	Data 0.001 (0.011)	Loss 3.9438 (4.0051)	Top-1 acc 32.422 (31.035)	Top-5 acc 58.203 (54.563)	lr 0.00040
Warmup Train [38][2350/3239]	Time 0.655 (0.514)	Data 0.001 (0.011)	Loss 4.1930 (4.0055)	Top-1 acc 26.953 (31.033)	Top-5 acc 49.609 (54.558)	lr 0.00040
Warmup Train [38][2360/3239]	Time 0.597 (0.514)	Data 0.001 (0.011)	Loss 4.0733 (4.0059)	Top-1 acc 30.859 (31.033)	Top-5 acc 53.906 (54.550)	lr 0.00040
Warmup Train [38][2370/3239]	Time 0.644 (0.514)	Data 0.001 (0.011)	Loss 3.9236 (4.0060)	Top-1 acc 32.812 (31.031)	Top-5 acc 53.516 (54.550)	lr 0.00040
Warmup Train [38][2380/3239]	Time 0.552 (0.514)	Data 0.001 (0.011)	Loss 4.0992 (4.0063)	Top-1 acc 29.297 (31.028)	Top-5 acc 50.781 (54.544)	lr 0.00039
Warmup Train [38][2390/3239]	Time 0.417 (0.514)	Data 0.001 (0.011)	Loss 3.9487 (4.0059)	Top-1 acc 29.688 (31.034)	Top-5 acc 57.422 (54.553)	lr 0.00039
Warmup Train [38][2400/3239]	Time 0.545 (0.514)	Data 0.001 (0.011)	Loss 4.1632 (4.0058)	Top-1 acc 27.344 (31.039)	Top-5 acc 51.172 (54.556)	lr 0.00039
Warmup Train [38][2410/3239]	Time 0.352 (0.514)	Data 0.001 (0.011)	Loss 3.9280 (4.0058)	Top-1 acc 32.422 (31.034)	Top-5 acc 56.641 (54.554)	lr 0.00039
Warmup Train [38][2420/3239]	Time 0.546 (0.514)	Data 0.001 (0.011)	Loss 3.9618 (4.0054)	Top-1 acc 28.125 (31.038)	Top-5 acc 58.203 (54.564)	lr 0.00039
Warmup Train [38][2430/3239]	Time 0.597 (0.513)	Data 0.001 (0.011)	Loss 4.0839 (4.0055)	Top-1 acc 30.469 (31.038)	Top-5 acc 51.172 (54.563)	lr 0.00039
Warmup Train [38][2440/3239]	Time 0.537 (0.513)	Data 0.002 (0.011)	Loss 3.8808 (4.0053)	Top-1 acc 34.375 (31.039)	Top-5 acc 55.859 (54.565)	lr 0.00039
Warmup Train [38][2450/3239]	Time 0.510 (0.513)	Data 0.001 (0.011)	Loss 3.9872 (4.0053)	Top-1 acc 31.250 (31.040)	Top-5 acc 55.859 (54.565)	lr 0.00039
Warmup Train [38][2460/3239]	Time 0.642 (0.513)	Data 0.001 (0.011)	Loss 4.1130 (4.0052)	Top-1 acc 29.688 (31.043)	Top-5 acc 50.391 (54.568)	lr 0.00039
Warmup Train [38][2470/3239]	Time 0.562 (0.513)	Data 0.001 (0.011)	Loss 4.2102 (4.0054)	Top-1 acc 23.438 (31.040)	Top-5 acc 48.828 (54.565)	lr 0.00039
Warmup Train [38][2480/3239]	Time 0.473 (0.513)	Data 0.001 (0.011)	Loss 4.0675 (4.0053)	Top-1 acc 28.125 (31.048)	Top-5 acc 53.125 (54.568)	lr 0.00038
Warmup Train [38][2490/3239]	Time 0.383 (0.513)	Data 0.001 (0.011)	Loss 4.0542 (4.0054)	Top-1 acc 30.859 (31.049)	Top-5 acc 54.297 (54.564)	lr 0.00038
Warmup Train [38][2500/3239]	Time 0.693 (0.513)	Data 0.001 (0.011)	Loss 3.9923 (4.0056)	Top-1 acc 31.250 (31.046)	Top-5 acc 58.594 (54.560)	lr 0.00038
Warmup Train [38][2510/3239]	Time 0.373 (0.513)	Data 0.001 (0.011)	Loss 4.2559 (4.0058)	Top-1 acc 25.391 (31.040)	Top-5 acc 51.953 (54.557)	lr 0.00038
Warmup Train [38][2520/3239]	Time 0.432 (0.513)	Data 0.001 (0.011)	Loss 3.9194 (4.0059)	Top-1 acc 34.375 (31.039)	Top-5 acc 57.812 (54.555)	lr 0.00038
Warmup Train [38][2530/3239]	Time 0.579 (0.513)	Data 0.001 (0.011)	Loss 3.9048 (4.0059)	Top-1 acc 33.594 (31.040)	Top-5 acc 56.641 (54.554)	lr 0.00038
Warmup Train [38][2540/3239]	Time 0.530 (0.513)	Data 0.001 (0.011)	Loss 3.8802 (4.0058)	Top-1 acc 35.547 (31.040)	Top-5 acc 57.812 (54.558)	lr 0.00038
Warmup Train [38][2550/3239]	Time 0.487 (0.513)	Data 0.001 (0.011)	Loss 3.9746 (4.0058)	Top-1 acc 29.297 (31.040)	Top-5 acc 52.734 (54.556)	lr 0.00038
Warmup Train [38][2560/3239]	Time 0.524 (0.513)	Data 0.001 (0.011)	Loss 4.1346 (4.0059)	Top-1 acc 28.516 (31.034)	Top-5 acc 51.172 (54.554)	lr 0.00038
Warmup Train [38][2570/3239]	Time 0.679 (0.513)	Data 0.001 (0.011)	Loss 3.8864 (4.0058)	Top-1 acc 34.375 (31.037)	Top-5 acc 57.031 (54.559)	lr 0.00037
Warmup Train [38][2580/3239]	Time 0.499 (0.513)	Data 0.001 (0.011)	Loss 4.1917 (4.0061)	Top-1 acc 29.297 (31.031)	Top-5 acc 49.219 (54.545)	lr 0.00037
Warmup Train [38][2590/3239]	Time 0.393 (0.513)	Data 0.001 (0.011)	Loss 4.0663 (4.0061)	Top-1 acc 25.391 (31.032)	Top-5 acc 50.000 (54.544)	lr 0.00037
Warmup Train [38][2600/3239]	Time 0.468 (0.513)	Data 0.001 (0.011)	Loss 4.1829 (4.0060)	Top-1 acc 24.609 (31.036)	Top-5 acc 51.562 (54.543)	lr 0.00037
Warmup Train [38][2610/3239]	Time 0.552 (0.513)	Data 0.001 (0.011)	Loss 3.9957 (4.0062)	Top-1 acc 31.250 (31.030)	Top-5 acc 54.297 (54.537)	lr 0.00037
Warmup Train [38][2620/3239]	Time 0.512 (0.513)	Data 0.001 (0.011)	Loss 3.8735 (4.0060)	Top-1 acc 31.641 (31.030)	Top-5 acc 58.594 (54.538)	lr 0.00037
Warmup Train [38][2630/3239]	Time 0.522 (0.513)	Data 0.001 (0.011)	Loss 4.0291 (4.0062)	Top-1 acc 30.859 (31.029)	Top-5 acc 54.297 (54.535)	lr 0.00037
Warmup Train [38][2640/3239]	Time 0.516 (0.513)	Data 0.001 (0.011)	Loss 3.9165 (4.0064)	Top-1 acc 30.859 (31.024)	Top-5 acc 58.594 (54.528)	lr 0.00037
Warmup Train [38][2650/3239]	Time 0.586 (0.513)	Data 0.001 (0.011)	Loss 3.9904 (4.0068)	Top-1 acc 29.688 (31.021)	Top-5 acc 53.906 (54.522)	lr 0.00037
Warmup Train [38][2660/3239]	Time 0.460 (0.513)	Data 0.001 (0.011)	Loss 3.9230 (4.0066)	Top-1 acc 33.203 (31.025)	Top-5 acc 59.766 (54.528)	lr 0.00037
Warmup Train [38][2670/3239]	Time 0.575 (0.513)	Data 0.001 (0.011)	Loss 3.9927 (4.0066)	Top-1 acc 33.203 (31.027)	Top-5 acc 53.125 (54.525)	lr 0.00036
Warmup Train [38][2680/3239]	Time 0.487 (0.513)	Data 0.001 (0.011)	Loss 3.9497 (4.0066)	Top-1 acc 28.906 (31.024)	Top-5 acc 58.203 (54.526)	lr 0.00036
Warmup Train [38][2690/3239]	Time 0.644 (0.513)	Data 0.001 (0.011)	Loss 3.9343 (4.0069)	Top-1 acc 34.375 (31.019)	Top-5 acc 55.078 (54.520)	lr 0.00036
Warmup Train [38][2700/3239]	Time 0.380 (0.513)	Data 0.001 (0.010)	Loss 4.0390 (4.0067)	Top-1 acc 30.859 (31.020)	Top-5 acc 54.297 (54.521)	lr 0.00036
Warmup Train [38][2710/3239]	Time 0.482 (0.513)	Data 0.001 (0.010)	Loss 3.8562 (4.0066)	Top-1 acc 32.812 (31.020)	Top-5 acc 55.469 (54.523)	lr 0.00036
Warmup Train [38][2720/3239]	Time 0.647 (0.513)	Data 0.001 (0.011)	Loss 3.7864 (4.0065)	Top-1 acc 36.328 (31.024)	Top-5 acc 58.594 (54.523)	lr 0.00036
Warmup Train [38][2730/3239]	Time 0.578 (0.513)	Data 0.001 (0.010)	Loss 3.9969 (4.0066)	Top-1 acc 30.859 (31.024)	Top-5 acc 55.859 (54.526)	lr 0.00036
Warmup Train [38][2740/3239]	Time 0.449 (0.513)	Data 0.001 (0.010)	Loss 3.9683 (4.0064)	Top-1 acc 30.859 (31.024)	Top-5 acc 53.125 (54.526)	lr 0.00036
Warmup Train [38][2750/3239]	Time 0.357 (0.513)	Data 0.001 (0.010)	Loss 3.9381 (4.0063)	Top-1 acc 35.547 (31.027)	Top-5 acc 56.641 (54.532)	lr 0.00036
Warmup Train [38][2760/3239]	Time 0.373 (0.513)	Data 0.001 (0.010)	Loss 4.0373 (4.0064)	Top-1 acc 32.812 (31.024)	Top-5 acc 52.734 (54.533)	lr 0.00035
Warmup Train [38][2770/3239]	Time 0.619 (0.513)	Data 0.001 (0.010)	Loss 3.8752 (4.0064)	Top-1 acc 32.812 (31.023)	Top-5 acc 57.031 (54.534)	lr 0.00035
Warmup Train [38][2780/3239]	Time 0.326 (0.513)	Data 0.002 (0.010)	Loss 3.8759 (4.0064)	Top-1 acc 33.594 (31.021)	Top-5 acc 57.422 (54.534)	lr 0.00035
Warmup Train [38][2790/3239]	Time 0.524 (0.513)	Data 0.001 (0.010)	Loss 4.0855 (4.0061)	Top-1 acc 28.125 (31.029)	Top-5 acc 53.125 (54.540)	lr 0.00035
Warmup Train [38][2800/3239]	Time 0.512 (0.513)	Data 0.001 (0.010)	Loss 4.0734 (4.0060)	Top-1 acc 30.859 (31.030)	Top-5 acc 56.250 (54.543)	lr 0.00035
Warmup Train [38][2810/3239]	Time 0.702 (0.513)	Data 0.001 (0.010)	Loss 4.0719 (4.0060)	Top-1 acc 28.906 (31.032)	Top-5 acc 55.078 (54.546)	lr 0.00035
Warmup Train [38][2820/3239]	Time 0.670 (0.513)	Data 0.001 (0.010)	Loss 4.1537 (4.0059)	Top-1 acc 26.562 (31.034)	Top-5 acc 48.828 (54.547)	lr 0.00035
Warmup Train [38][2830/3239]	Time 0.458 (0.513)	Data 0.001 (0.010)	Loss 4.1601 (4.0058)	Top-1 acc 28.906 (31.036)	Top-5 acc 51.172 (54.545)	lr 0.00035
Warmup Train [38][2840/3239]	Time 0.549 (0.513)	Data 0.001 (0.010)	Loss 3.9250 (4.0058)	Top-1 acc 35.938 (31.040)	Top-5 acc 57.812 (54.543)	lr 0.00035
Warmup Train [38][2850/3239]	Time 0.640 (0.513)	Data 0.001 (0.010)	Loss 3.9750 (4.0059)	Top-1 acc 41.016 (31.044)	Top-5 acc 57.031 (54.542)	lr 0.00035
Warmup Train [38][2860/3239]	Time 0.422 (0.513)	Data 0.001 (0.010)	Loss 4.0417 (4.0059)	Top-1 acc 32.812 (31.043)	Top-5 acc 56.641 (54.545)	lr 0.00034
Warmup Train [38][2870/3239]	Time 0.704 (0.513)	Data 0.001 (0.010)	Loss 4.0968 (4.0059)	Top-1 acc 25.781 (31.039)	Top-5 acc 50.391 (54.543)	lr 0.00034
Warmup Train [38][2880/3239]	Time 0.647 (0.513)	Data 0.001 (0.010)	Loss 3.8698 (4.0059)	Top-1 acc 33.203 (31.042)	Top-5 acc 58.984 (54.541)	lr 0.00034
Warmup Train [38][2890/3239]	Time 0.556 (0.513)	Data 0.001 (0.010)	Loss 4.0485 (4.0059)	Top-1 acc 35.547 (31.043)	Top-5 acc 52.344 (54.544)	lr 0.00034
Warmup Train [38][2900/3239]	Time 0.425 (0.513)	Data 0.001 (0.010)	Loss 3.9591 (4.0058)	Top-1 acc 29.688 (31.040)	Top-5 acc 54.297 (54.542)	lr 0.00034
Warmup Train [38][2910/3239]	Time 0.451 (0.513)	Data 0.001 (0.010)	Loss 3.8387 (4.0056)	Top-1 acc 33.984 (31.043)	Top-5 acc 57.422 (54.547)	lr 0.00034
Warmup Train [38][2920/3239]	Time 0.546 (0.513)	Data 0.001 (0.010)	Loss 3.9948 (4.0055)	Top-1 acc 32.812 (31.044)	Top-5 acc 51.562 (54.548)	lr 0.00034
Warmup Train [38][2930/3239]	Time 0.485 (0.513)	Data 0.001 (0.010)	Loss 4.1844 (4.0056)	Top-1 acc 28.125 (31.043)	Top-5 acc 49.609 (54.544)	lr 0.00034
Warmup Train [38][2940/3239]	Time 0.419 (0.513)	Data 0.001 (0.010)	Loss 4.2748 (4.0058)	Top-1 acc 23.828 (31.044)	Top-5 acc 52.734 (54.545)	lr 0.00034
Warmup Train [38][2950/3239]	Time 0.534 (0.513)	Data 0.001 (0.010)	Loss 3.9279 (4.0057)	Top-1 acc 38.281 (31.049)	Top-5 acc 56.250 (54.549)	lr 0.00034
Warmup Train [38][2960/3239]	Time 0.352 (0.513)	Data 0.001 (0.010)	Loss 3.9306 (4.0057)	Top-1 acc 32.812 (31.055)	Top-5 acc 55.859 (54.548)	lr 0.00033
Warmup Train [38][2970/3239]	Time 0.669 (0.513)	Data 0.001 (0.010)	Loss 3.9254 (4.0055)	Top-1 acc 31.641 (31.058)	Top-5 acc 57.812 (54.552)	lr 0.00033
Warmup Train [38][2980/3239]	Time 0.518 (0.513)	Data 0.001 (0.010)	Loss 4.0155 (4.0057)	Top-1 acc 32.031 (31.053)	Top-5 acc 54.297 (54.553)	lr 0.00033
Warmup Train [38][2990/3239]	Time 0.539 (0.513)	Data 0.001 (0.010)	Loss 3.8744 (4.0056)	Top-1 acc 30.859 (31.054)	Top-5 acc 52.734 (54.550)	lr 0.00033
Warmup Train [38][3000/3239]	Time 0.704 (0.513)	Data 0.001 (0.010)	Loss 3.8675 (4.0056)	Top-1 acc 29.297 (31.051)	Top-5 acc 56.250 (54.553)	lr 0.00033
Warmup Train [38][3010/3239]	Time 0.476 (0.513)	Data 0.002 (0.010)	Loss 4.1992 (4.0056)	Top-1 acc 26.172 (31.051)	Top-5 acc 48.047 (54.555)	lr 0.00033
Warmup Train [38][3020/3239]	Time 0.481 (0.513)	Data 0.001 (0.010)	Loss 4.0135 (4.0055)	Top-1 acc 26.562 (31.053)	Top-5 acc 51.953 (54.558)	lr 0.00033
Warmup Train [38][3030/3239]	Time 0.507 (0.513)	Data 0.001 (0.010)	Loss 3.8001 (4.0055)	Top-1 acc 33.984 (31.049)	Top-5 acc 57.031 (54.554)	lr 0.00033
Warmup Train [38][3040/3239]	Time 0.469 (0.513)	Data 0.001 (0.010)	Loss 3.8600 (4.0053)	Top-1 acc 29.297 (31.054)	Top-5 acc 57.031 (54.557)	lr 0.00033
Warmup Train [38][3050/3239]	Time 0.622 (0.513)	Data 0.001 (0.010)	Loss 3.9414 (4.0054)	Top-1 acc 30.859 (31.056)	Top-5 acc 54.297 (54.557)	lr 0.00033
Warmup Train [38][3060/3239]	Time 0.510 (0.513)	Data 0.001 (0.010)	Loss 3.8083 (4.0053)	Top-1 acc 36.328 (31.059)	Top-5 acc 57.031 (54.559)	lr 0.00033
Warmup Train [38][3070/3239]	Time 0.338 (0.513)	Data 0.001 (0.010)	Loss 3.9991 (4.0052)	Top-1 acc 32.422 (31.067)	Top-5 acc 55.078 (54.561)	lr 0.00032
Warmup Train [38][3080/3239]	Time 0.456 (0.513)	Data 0.001 (0.010)	Loss 4.0159 (4.0052)	Top-1 acc 31.250 (31.067)	Top-5 acc 55.078 (54.557)	lr 0.00032
Warmup Train [38][3090/3239]	Time 0.452 (0.513)	Data 0.001 (0.010)	Loss 3.9921 (4.0052)	Top-1 acc 31.641 (31.063)	Top-5 acc 55.078 (54.560)	lr 0.00032
Warmup Train [38][3100/3239]	Time 0.662 (0.513)	Data 0.001 (0.010)	Loss 3.9317 (4.0053)	Top-1 acc 31.641 (31.062)	Top-5 acc 57.031 (54.558)	lr 0.00032
Warmup Train [38][3110/3239]	Time 0.606 (0.513)	Data 0.001 (0.010)	Loss 4.1751 (4.0053)	Top-1 acc 26.562 (31.063)	Top-5 acc 49.609 (54.557)	lr 0.00032
Warmup Train [38][3120/3239]	Time 0.510 (0.513)	Data 0.001 (0.010)	Loss 4.1599 (4.0054)	Top-1 acc 28.516 (31.059)	Top-5 acc 50.391 (54.557)	lr 0.00032
Warmup Train [38][3130/3239]	Time 0.435 (0.513)	Data 0.001 (0.010)	Loss 3.9422 (4.0055)	Top-1 acc 31.641 (31.055)	Top-5 acc 57.812 (54.554)	lr 0.00032
Warmup Train [38][3140/3239]	Time 0.532 (0.513)	Data 0.001 (0.010)	Loss 4.0777 (4.0055)	Top-1 acc 28.125 (31.055)	Top-5 acc 53.125 (54.554)	lr 0.00032
Warmup Train [38][3150/3239]	Time 0.548 (0.512)	Data 0.001 (0.010)	Loss 4.0809 (4.0054)	Top-1 acc 30.469 (31.055)	Top-5 acc 55.469 (54.558)	lr 0.00032
Warmup Train [38][3160/3239]	Time 0.556 (0.512)	Data 0.001 (0.010)	Loss 3.9800 (4.0053)	Top-1 acc 33.984 (31.055)	Top-5 acc 53.125 (54.557)	lr 0.00032
Warmup Train [38][3170/3239]	Time 0.349 (0.512)	Data 0.001 (0.010)	Loss 4.0107 (4.0053)	Top-1 acc 31.250 (31.053)	Top-5 acc 54.297 (54.558)	lr 0.00031
Warmup Train [38][3180/3239]	Time 0.183 (0.512)	Data 0.000 (0.010)	Loss 4.0057 (4.0055)	Top-1 acc 29.688 (31.050)	Top-5 acc 57.031 (54.558)	lr 0.00031
Warmup Train [38][3190/3239]	Time 0.399 (0.512)	Data 0.000 (0.010)	Loss 4.0089 (4.0055)	Top-1 acc 29.297 (31.051)	Top-5 acc 55.469 (54.560)	lr 0.00031
Warmup Train [38][3200/3239]	Time 0.591 (0.512)	Data 0.000 (0.010)	Loss 4.0463 (4.0056)	Top-1 acc 31.641 (31.049)	Top-5 acc 53.906 (54.561)	lr 0.00031
Warmup Train [38][3210/3239]	Time 0.560 (0.512)	Data 0.000 (0.010)	Loss 3.8762 (4.0055)	Top-1 acc 32.812 (31.048)	Top-5 acc 55.859 (54.562)	lr 0.00031
Warmup Train [38][3220/3239]	Time 0.425 (0.512)	Data 0.000 (0.010)	Loss 3.9805 (4.0055)	Top-1 acc 30.078 (31.050)	Top-5 acc 54.297 (54.564)	lr 0.00031
Warmup Train [38][3230/3239]	Time 0.496 (0.512)	Data 0.000 (0.010)	Loss 4.2883 (4.0055)	Top-1 acc 23.828 (31.052)	Top-5 acc 49.219 (54.563)	lr 0.00031
Warmup Train [38][3239/3239]	Time 0.322 (0.512)	Data 0.000 (0.010)	Loss 4.0117 (4.0054)	Top-1 acc 32.099 (31.055)	Top-5 acc 60.494 (54.564)	lr 0.00031
==========Warmup Valid [38/40]	loss 2.951	top-1 acc 38.451	top-5 acc 63.145	Train top-1 31.055	top-5 54.564	flops: 442.4M
Warmup Train [39][0/3239]	Time 17.609 (17.609)	Data 15.370 (15.370)	Loss 4.2088 (4.2088)	Top-1 acc 28.516 (28.516)	Top-5 acc 48.828 (48.828)	lr 0.00031
Warmup Train [39][10/3239]	Time 0.468 (2.093)	Data 0.001 (1.407)	Loss 3.8851 (4.0410)	Top-1 acc 30.859 (30.753)	Top-5 acc 58.984 (54.084)	lr 0.00031
Warmup Train [39][20/3239]	Time 0.646 (1.314)	Data 0.001 (0.738)	Loss 3.9959 (3.9943)	Top-1 acc 29.688 (31.659)	Top-5 acc 55.078 (55.171)	lr 0.00031
Warmup Train [39][30/3239]	Time 0.529 (1.050)	Data 0.001 (0.501)	Loss 3.9992 (3.9861)	Top-1 acc 30.859 (31.678)	Top-5 acc 51.562 (54.952)	lr 0.00030
Warmup Train [39][40/3239]	Time 0.563 (0.922)	Data 0.001 (0.381)	Loss 3.9747 (3.9791)	Top-1 acc 31.641 (31.536)	Top-5 acc 55.469 (54.954)	lr 0.00030
Warmup Train [39][50/3239]	Time 0.618 (0.845)	Data 0.001 (0.307)	Loss 4.0500 (3.9938)	Top-1 acc 28.125 (31.097)	Top-5 acc 54.297 (54.626)	lr 0.00030
Warmup Train [39][60/3239]	Time 0.574 (0.793)	Data 0.001 (0.257)	Loss 4.0800 (3.9960)	Top-1 acc 32.031 (31.084)	Top-5 acc 56.250 (54.572)	lr 0.00030
Warmup Train [39][70/3239]	Time 0.452 (0.753)	Data 0.001 (0.221)	Loss 3.9075 (3.9932)	Top-1 acc 29.297 (31.079)	Top-5 acc 53.125 (54.583)	lr 0.00030
Warmup Train [39][80/3239]	Time 0.332 (0.722)	Data 0.001 (0.196)	Loss 4.2932 (3.9932)	Top-1 acc 28.516 (31.033)	Top-5 acc 52.344 (54.678)	lr 0.00030
Warmup Train [39][90/3239]	Time 0.315 (0.698)	Data 0.001 (0.176)	Loss 4.0012 (3.9924)	Top-1 acc 28.125 (31.027)	Top-5 acc 58.203 (54.670)	lr 0.00030
Warmup Train [39][100/3239]	Time 0.383 (0.678)	Data 0.001 (0.160)	Loss 4.0774 (3.9953)	Top-1 acc 30.859 (31.103)	Top-5 acc 53.906 (54.568)	lr 0.00030
Warmup Train [39][110/3239]	Time 0.588 (0.666)	Data 0.001 (0.147)	Loss 3.9544 (3.9955)	Top-1 acc 28.906 (31.088)	Top-5 acc 55.859 (54.505)	lr 0.00030
Warmup Train [39][120/3239]	Time 0.518 (0.653)	Data 0.001 (0.136)	Loss 3.8490 (3.9937)	Top-1 acc 34.766 (31.156)	Top-5 acc 57.031 (54.568)	lr 0.00030
Warmup Train [39][130/3239]	Time 0.641 (0.643)	Data 0.001 (0.126)	Loss 4.0165 (3.9974)	Top-1 acc 27.734 (31.065)	Top-5 acc 51.953 (54.488)	lr 0.00030
Warmup Train [39][140/3239]	Time 0.586 (0.635)	Data 0.001 (0.117)	Loss 4.2288 (4.0004)	Top-1 acc 28.906 (31.034)	Top-5 acc 51.172 (54.433)	lr 0.00029
Warmup Train [39][150/3239]	Time 0.595 (0.625)	Data 0.001 (0.110)	Loss 4.0593 (3.9998)	Top-1 acc 34.766 (31.074)	Top-5 acc 55.859 (54.457)	lr 0.00029
Warmup Train [39][160/3239]	Time 0.469 (0.617)	Data 0.001 (0.103)	Loss 4.0995 (4.0051)	Top-1 acc 26.172 (30.932)	Top-5 acc 51.172 (54.353)	lr 0.00029
Warmup Train [39][170/3239]	Time 0.516 (0.611)	Data 0.001 (0.097)	Loss 4.1056 (4.0076)	Top-1 acc 25.781 (30.942)	Top-5 acc 51.172 (54.343)	lr 0.00029
Warmup Train [39][180/3239]	Time 0.428 (0.605)	Data 0.001 (0.092)	Loss 4.1592 (4.0081)	Top-1 acc 28.516 (30.920)	Top-5 acc 46.875 (54.347)	lr 0.00029
Warmup Train [39][190/3239]	Time 0.333 (0.599)	Data 0.001 (0.088)	Loss 4.0996 (4.0128)	Top-1 acc 32.422 (30.833)	Top-5 acc 50.391 (54.258)	lr 0.00029
Warmup Train [39][200/3239]	Time 0.576 (0.594)	Data 0.001 (0.084)	Loss 3.9559 (4.0123)	Top-1 acc 30.469 (30.889)	Top-5 acc 56.250 (54.287)	lr 0.00029
Warmup Train [39][210/3239]	Time 0.508 (0.591)	Data 0.001 (0.080)	Loss 3.8871 (4.0137)	Top-1 acc 32.422 (30.889)	Top-5 acc 57.031 (54.271)	lr 0.00029
Warmup Train [39][220/3239]	Time 0.464 (0.587)	Data 0.001 (0.077)	Loss 4.1750 (4.0131)	Top-1 acc 29.297 (30.916)	Top-5 acc 48.047 (54.313)	lr 0.00029
Warmup Train [39][230/3239]	Time 0.597 (0.583)	Data 0.002 (0.074)	Loss 3.8620 (4.0143)	Top-1 acc 33.203 (30.886)	Top-5 acc 55.469 (54.261)	lr 0.00029
Warmup Train [39][240/3239]	Time 0.619 (0.580)	Data 0.001 (0.071)	Loss 4.0176 (4.0142)	Top-1 acc 26.562 (30.942)	Top-5 acc 52.734 (54.297)	lr 0.00029
Warmup Train [39][250/3239]	Time 0.369 (0.574)	Data 0.001 (0.068)	Loss 3.8661 (4.0142)	Top-1 acc 31.641 (30.917)	Top-5 acc 58.203 (54.289)	lr 0.00028
Warmup Train [39][260/3239]	Time 0.546 (0.572)	Data 0.001 (0.066)	Loss 4.0384 (4.0134)	Top-1 acc 30.859 (30.937)	Top-5 acc 51.953 (54.301)	lr 0.00028
Warmup Train [39][270/3239]	Time 0.573 (0.567)	Data 0.001 (0.064)	Loss 4.0159 (4.0129)	Top-1 acc 32.422 (30.949)	Top-5 acc 54.688 (54.298)	lr 0.00028
Warmup Train [39][280/3239]	Time 0.448 (0.566)	Data 0.001 (0.061)	Loss 3.9624 (4.0104)	Top-1 acc 35.156 (30.998)	Top-5 acc 54.688 (54.362)	lr 0.00028
Warmup Train [39][290/3239]	Time 0.596 (0.564)	Data 0.001 (0.060)	Loss 4.0844 (4.0079)	Top-1 acc 29.688 (31.047)	Top-5 acc 53.125 (54.436)	lr 0.00028
Warmup Train [39][300/3239]	Time 0.594 (0.563)	Data 0.001 (0.058)	Loss 4.0803 (4.0082)	Top-1 acc 31.250 (31.051)	Top-5 acc 51.562 (54.405)	lr 0.00028
Warmup Train [39][310/3239]	Time 0.401 (0.561)	Data 0.001 (0.056)	Loss 4.0428 (4.0089)	Top-1 acc 28.906 (31.069)	Top-5 acc 52.734 (54.411)	lr 0.00028
Warmup Train [39][320/3239]	Time 0.607 (0.560)	Data 0.001 (0.054)	Loss 4.0502 (4.0098)	Top-1 acc 29.688 (31.046)	Top-5 acc 54.297 (54.378)	lr 0.00028
Warmup Train [39][330/3239]	Time 0.490 (0.559)	Data 0.001 (0.053)	Loss 3.8946 (4.0112)	Top-1 acc 34.766 (31.005)	Top-5 acc 55.078 (54.365)	lr 0.00028
Warmup Train [39][340/3239]	Time 0.593 (0.557)	Data 0.001 (0.051)	Loss 3.8816 (4.0105)	Top-1 acc 32.812 (31.020)	Top-5 acc 57.422 (54.356)	lr 0.00028
Warmup Train [39][350/3239]	Time 0.362 (0.556)	Data 0.001 (0.050)	Loss 4.0001 (4.0100)	Top-1 acc 31.250 (31.067)	Top-5 acc 54.688 (54.368)	lr 0.00028
Warmup Train [39][360/3239]	Time 0.575 (0.555)	Data 0.001 (0.049)	Loss 4.1259 (4.0101)	Top-1 acc 28.906 (31.056)	Top-5 acc 51.953 (54.355)	lr 0.00027
Warmup Train [39][370/3239]	Time 0.374 (0.554)	Data 0.001 (0.048)	Loss 3.9782 (4.0091)	Top-1 acc 30.859 (31.087)	Top-5 acc 53.125 (54.372)	lr 0.00027
Warmup Train [39][380/3239]	Time 0.369 (0.552)	Data 0.001 (0.047)	Loss 4.0694 (4.0105)	Top-1 acc 29.688 (31.023)	Top-5 acc 51.562 (54.325)	lr 0.00027
Warmup Train [39][390/3239]	Time 0.543 (0.551)	Data 0.001 (0.046)	Loss 3.8504 (4.0093)	Top-1 acc 34.375 (31.046)	Top-5 acc 56.250 (54.345)	lr 0.00027
Warmup Train [39][400/3239]	Time 0.483 (0.550)	Data 0.001 (0.045)	Loss 4.2150 (4.0102)	Top-1 acc 29.688 (31.010)	Top-5 acc 51.172 (54.333)	lr 0.00027
Warmup Train [39][410/3239]	Time 0.492 (0.549)	Data 0.001 (0.044)	Loss 4.0593 (4.0096)	Top-1 acc 29.297 (31.006)	Top-5 acc 54.688 (54.339)	lr 0.00027
Warmup Train [39][420/3239]	Time 0.497 (0.548)	Data 0.001 (0.043)	Loss 4.1313 (4.0096)	Top-1 acc 32.031 (31.041)	Top-5 acc 52.734 (54.383)	lr 0.00027
Warmup Train [39][430/3239]	Time 0.661 (0.548)	Data 0.001 (0.042)	Loss 3.7231 (4.0091)	Top-1 acc 35.938 (31.052)	Top-5 acc 60.938 (54.394)	lr 0.00027
Warmup Train [39][440/3239]	Time 0.543 (0.547)	Data 0.001 (0.041)	Loss 4.0311 (4.0092)	Top-1 acc 28.906 (31.031)	Top-5 acc 55.859 (54.403)	lr 0.00027
Warmup Train [39][450/3239]	Time 0.503 (0.546)	Data 0.001 (0.040)	Loss 3.6467 (4.0084)	Top-1 acc 34.766 (31.050)	Top-5 acc 62.500 (54.428)	lr 0.00027
Warmup Train [39][460/3239]	Time 0.567 (0.546)	Data 0.001 (0.039)	Loss 4.0734 (4.0076)	Top-1 acc 28.516 (31.052)	Top-5 acc 54.688 (54.449)	lr 0.00027
Warmup Train [39][470/3239]	Time 0.570 (0.545)	Data 0.002 (0.039)	Loss 3.9117 (4.0067)	Top-1 acc 30.469 (31.079)	Top-5 acc 55.859 (54.462)	lr 0.00026
Warmup Train [39][480/3239]	Time 0.323 (0.544)	Data 0.001 (0.038)	Loss 3.8605 (4.0065)	Top-1 acc 35.156 (31.093)	Top-5 acc 58.984 (54.471)	lr 0.00026
Warmup Train [39][490/3239]	Time 0.582 (0.543)	Data 0.001 (0.037)	Loss 4.0394 (4.0064)	Top-1 acc 32.812 (31.085)	Top-5 acc 53.516 (54.472)	lr 0.00026
Warmup Train [39][500/3239]	Time 0.403 (0.542)	Data 0.001 (0.037)	Loss 4.0086 (4.0058)	Top-1 acc 32.812 (31.136)	Top-5 acc 55.859 (54.470)	lr 0.00026
Warmup Train [39][510/3239]	Time 0.572 (0.541)	Data 0.001 (0.036)	Loss 3.7310 (4.0045)	Top-1 acc 38.281 (31.163)	Top-5 acc 60.156 (54.501)	lr 0.00026
Warmup Train [39][520/3239]	Time 0.389 (0.540)	Data 0.001 (0.035)	Loss 4.0601 (4.0047)	Top-1 acc 30.859 (31.175)	Top-5 acc 54.297 (54.529)	lr 0.00026
Warmup Train [39][530/3239]	Time 0.366 (0.539)	Data 0.001 (0.035)	Loss 4.0281 (4.0053)	Top-1 acc 28.906 (31.172)	Top-5 acc 53.906 (54.526)	lr 0.00026
Warmup Train [39][540/3239]	Time 0.384 (0.538)	Data 0.001 (0.034)	Loss 3.9686 (4.0047)	Top-1 acc 33.984 (31.189)	Top-5 acc 55.078 (54.560)	lr 0.00026
Warmup Train [39][550/3239]	Time 0.506 (0.539)	Data 0.001 (0.034)	Loss 3.7439 (4.0037)	Top-1 acc 35.156 (31.208)	Top-5 acc 60.547 (54.584)	lr 0.00026
Warmup Train [39][560/3239]	Time 0.520 (0.538)	Data 0.001 (0.034)	Loss 4.0861 (4.0034)	Top-1 acc 26.172 (31.213)	Top-5 acc 53.125 (54.593)	lr 0.00026
Warmup Train [39][570/3239]	Time 0.526 (0.538)	Data 0.001 (0.033)	Loss 4.0649 (4.0038)	Top-1 acc 31.250 (31.176)	Top-5 acc 53.906 (54.573)	lr 0.00026
Warmup Train [39][580/3239]	Time 0.483 (0.537)	Data 0.001 (0.033)	Loss 4.0155 (4.0035)	Top-1 acc 33.203 (31.200)	Top-5 acc 51.172 (54.582)	lr 0.00026
Warmup Train [39][590/3239]	Time 0.655 (0.537)	Data 0.001 (0.032)	Loss 4.0865 (4.0034)	Top-1 acc 27.344 (31.198)	Top-5 acc 54.688 (54.593)	lr 0.00025
Warmup Train [39][600/3239]	Time 0.494 (0.537)	Data 0.001 (0.032)	Loss 3.9363 (4.0040)	Top-1 acc 31.641 (31.177)	Top-5 acc 53.516 (54.581)	lr 0.00025
Warmup Train [39][610/3239]	Time 0.592 (0.536)	Data 0.002 (0.031)	Loss 3.8001 (4.0048)	Top-1 acc 36.719 (31.159)	Top-5 acc 58.594 (54.564)	lr 0.00025
Warmup Train [39][620/3239]	Time 0.623 (0.536)	Data 0.001 (0.031)	Loss 4.1457 (4.0040)	Top-1 acc 28.906 (31.178)	Top-5 acc 49.609 (54.585)	lr 0.00025
Warmup Train [39][630/3239]	Time 0.608 (0.535)	Data 0.001 (0.031)	Loss 3.9651 (4.0048)	Top-1 acc 33.594 (31.162)	Top-5 acc 57.812 (54.564)	lr 0.00025
Warmup Train [39][640/3239]	Time 0.596 (0.535)	Data 0.001 (0.030)	Loss 4.1468 (4.0053)	Top-1 acc 26.562 (31.143)	Top-5 acc 51.562 (54.546)	lr 0.00025
Warmup Train [39][650/3239]	Time 0.544 (0.535)	Data 0.001 (0.030)	Loss 3.9153 (4.0065)	Top-1 acc 33.984 (31.110)	Top-5 acc 57.031 (54.515)	lr 0.00025
Warmup Train [39][660/3239]	Time 0.366 (0.535)	Data 0.001 (0.029)	Loss 3.9974 (4.0064)	Top-1 acc 29.297 (31.120)	Top-5 acc 55.859 (54.524)	lr 0.00025
Warmup Train [39][670/3239]	Time 0.417 (0.534)	Data 0.001 (0.029)	Loss 3.8371 (4.0065)	Top-1 acc 32.422 (31.104)	Top-5 acc 61.328 (54.522)	lr 0.00025
Warmup Train [39][680/3239]	Time 0.579 (0.534)	Data 0.001 (0.029)	Loss 4.1349 (4.0074)	Top-1 acc 26.953 (31.093)	Top-5 acc 53.906 (54.514)	lr 0.00025
Warmup Train [39][690/3239]	Time 0.548 (0.534)	Data 0.002 (0.029)	Loss 3.9946 (4.0069)	Top-1 acc 30.078 (31.102)	Top-5 acc 52.734 (54.534)	lr 0.00025
Warmup Train [39][700/3239]	Time 0.620 (0.534)	Data 0.001 (0.028)	Loss 4.0165 (4.0070)	Top-1 acc 29.297 (31.096)	Top-5 acc 53.125 (54.523)	lr 0.00024
Warmup Train [39][710/3239]	Time 0.551 (0.534)	Data 0.001 (0.028)	Loss 4.0674 (4.0068)	Top-1 acc 30.078 (31.099)	Top-5 acc 51.953 (54.528)	lr 0.00024
Warmup Train [39][720/3239]	Time 0.767 (0.533)	Data 0.001 (0.027)	Loss 3.9502 (4.0068)	Top-1 acc 32.031 (31.102)	Top-5 acc 54.688 (54.527)	lr 0.00024
Warmup Train [39][730/3239]	Time 0.549 (0.533)	Data 0.001 (0.027)	Loss 4.0032 (4.0059)	Top-1 acc 34.375 (31.135)	Top-5 acc 55.078 (54.553)	lr 0.00024
Warmup Train [39][740/3239]	Time 0.766 (0.533)	Data 0.001 (0.027)	Loss 4.1517 (4.0062)	Top-1 acc 31.250 (31.131)	Top-5 acc 52.734 (54.532)	lr 0.00024
Warmup Train [39][750/3239]	Time 0.545 (0.532)	Data 0.001 (0.026)	Loss 3.9831 (4.0069)	Top-1 acc 31.641 (31.123)	Top-5 acc 55.469 (54.518)	lr 0.00024
Warmup Train [39][760/3239]	Time 0.526 (0.532)	Data 0.001 (0.026)	Loss 3.9548 (4.0069)	Top-1 acc 32.812 (31.116)	Top-5 acc 57.422 (54.520)	lr 0.00024
Warmup Train [39][770/3239]	Time 0.298 (0.531)	Data 0.001 (0.026)	Loss 3.9099 (4.0066)	Top-1 acc 35.156 (31.129)	Top-5 acc 58.984 (54.523)	lr 0.00024
Warmup Train [39][780/3239]	Time 0.322 (0.530)	Data 0.001 (0.026)	Loss 4.0084 (4.0066)	Top-1 acc 31.641 (31.137)	Top-5 acc 55.859 (54.517)	lr 0.00024
Warmup Train [39][790/3239]	Time 0.416 (0.530)	Data 0.001 (0.026)	Loss 3.9217 (4.0062)	Top-1 acc 30.469 (31.139)	Top-5 acc 54.297 (54.515)	lr 0.00024
Warmup Train [39][800/3239]	Time 0.537 (0.530)	Data 0.001 (0.025)	Loss 4.0868 (4.0060)	Top-1 acc 28.906 (31.133)	Top-5 acc 49.219 (54.516)	lr 0.00024
Warmup Train [39][810/3239]	Time 0.505 (0.530)	Data 0.001 (0.025)	Loss 4.1877 (4.0059)	Top-1 acc 29.688 (31.138)	Top-5 acc 53.906 (54.530)	lr 0.00024
Warmup Train [39][820/3239]	Time 0.611 (0.530)	Data 0.001 (0.025)	Loss 3.8157 (4.0057)	Top-1 acc 36.328 (31.142)	Top-5 acc 56.641 (54.537)	lr 0.00023
Warmup Train [39][830/3239]	Time 0.535 (0.530)	Data 0.001 (0.025)	Loss 3.9729 (4.0055)	Top-1 acc 34.766 (31.144)	Top-5 acc 56.641 (54.537)	lr 0.00023
Warmup Train [39][840/3239]	Time 0.640 (0.530)	Data 0.001 (0.024)	Loss 3.9721 (4.0057)	Top-1 acc 34.375 (31.148)	Top-5 acc 55.469 (54.532)	lr 0.00023
Warmup Train [39][850/3239]	Time 0.522 (0.530)	Data 0.001 (0.024)	Loss 3.8255 (4.0056)	Top-1 acc 33.594 (31.152)	Top-5 acc 62.500 (54.544)	lr 0.00023
Warmup Train [39][860/3239]	Time 0.294 (0.530)	Data 0.001 (0.024)	Loss 3.9799 (4.0047)	Top-1 acc 33.203 (31.167)	Top-5 acc 55.469 (54.563)	lr 0.00023
Warmup Train [39][870/3239]	Time 0.558 (0.529)	Data 0.001 (0.024)	Loss 4.0984 (4.0050)	Top-1 acc 29.688 (31.161)	Top-5 acc 51.953 (54.558)	lr 0.00023
Warmup Train [39][880/3239]	Time 0.586 (0.529)	Data 0.001 (0.024)	Loss 3.9018 (4.0050)	Top-1 acc 35.156 (31.141)	Top-5 acc 56.250 (54.560)	lr 0.00023
Warmup Train [39][890/3239]	Time 0.565 (0.529)	Data 0.001 (0.023)	Loss 3.9109 (4.0051)	Top-1 acc 30.469 (31.135)	Top-5 acc 57.812 (54.547)	lr 0.00023
Warmup Train [39][900/3239]	Time 0.492 (0.528)	Data 0.001 (0.023)	Loss 4.0754 (4.0047)	Top-1 acc 31.641 (31.140)	Top-5 acc 53.906 (54.554)	lr 0.00023
Warmup Train [39][910/3239]	Time 0.618 (0.528)	Data 0.001 (0.023)	Loss 4.0392 (4.0044)	Top-1 acc 33.594 (31.148)	Top-5 acc 54.688 (54.552)	lr 0.00023
Warmup Train [39][920/3239]	Time 0.433 (0.528)	Data 0.001 (0.023)	Loss 3.8889 (4.0046)	Top-1 acc 33.984 (31.151)	Top-5 acc 56.641 (54.553)	lr 0.00023
Warmup Train [39][930/3239]	Time 0.517 (0.528)	Data 0.001 (0.023)	Loss 3.9890 (4.0045)	Top-1 acc 34.766 (31.157)	Top-5 acc 54.297 (54.564)	lr 0.00023
Warmup Train [39][940/3239]	Time 0.473 (0.528)	Data 0.001 (0.022)	Loss 3.8925 (4.0043)	Top-1 acc 30.469 (31.144)	Top-5 acc 55.469 (54.567)	lr 0.00023
Warmup Train [39][950/3239]	Time 0.664 (0.528)	Data 0.001 (0.022)	Loss 4.1651 (4.0045)	Top-1 acc 25.391 (31.139)	Top-5 acc 51.953 (54.564)	lr 0.00022
Warmup Train [39][960/3239]	Time 0.543 (0.528)	Data 0.001 (0.022)	Loss 3.9342 (4.0042)	Top-1 acc 31.250 (31.146)	Top-5 acc 57.812 (54.567)	lr 0.00022
Warmup Train [39][970/3239]	Time 0.461 (0.527)	Data 0.001 (0.022)	Loss 3.9218 (4.0045)	Top-1 acc 34.375 (31.147)	Top-5 acc 56.250 (54.564)	lr 0.00022
Warmup Train [39][980/3239]	Time 0.480 (0.527)	Data 0.001 (0.022)	Loss 3.9162 (4.0047)	Top-1 acc 34.375 (31.140)	Top-5 acc 58.203 (54.555)	lr 0.00022
Warmup Train [39][990/3239]	Time 0.480 (0.527)	Data 0.001 (0.022)	Loss 4.1189 (4.0051)	Top-1 acc 28.906 (31.139)	Top-5 acc 51.172 (54.544)	lr 0.00022
Warmup Train [39][1000/3239]	Time 0.568 (0.527)	Data 0.001 (0.021)	Loss 4.0758 (4.0051)	Top-1 acc 30.078 (31.129)	Top-5 acc 53.906 (54.546)	lr 0.00022
Warmup Train [39][1010/3239]	Time 0.568 (0.526)	Data 0.001 (0.021)	Loss 4.0435 (4.0049)	Top-1 acc 32.031 (31.131)	Top-5 acc 57.812 (54.558)	lr 0.00022
Warmup Train [39][1020/3239]	Time 0.436 (0.526)	Data 0.001 (0.021)	Loss 4.0587 (4.0042)	Top-1 acc 30.078 (31.146)	Top-5 acc 52.734 (54.568)	lr 0.00022
Warmup Train [39][1030/3239]	Time 0.372 (0.526)	Data 0.001 (0.021)	Loss 3.9321 (4.0046)	Top-1 acc 32.812 (31.140)	Top-5 acc 56.641 (54.560)	lr 0.00022
Warmup Train [39][1040/3239]	Time 0.513 (0.526)	Data 0.001 (0.021)	Loss 4.1654 (4.0043)	Top-1 acc 28.906 (31.147)	Top-5 acc 51.953 (54.561)	lr 0.00022
Warmup Train [39][1050/3239]	Time 0.385 (0.525)	Data 0.001 (0.021)	Loss 4.0902 (4.0039)	Top-1 acc 25.000 (31.152)	Top-5 acc 51.562 (54.570)	lr 0.00022
Warmup Train [39][1060/3239]	Time 0.659 (0.525)	Data 0.001 (0.021)	Loss 4.0797 (4.0041)	Top-1 acc 28.516 (31.148)	Top-5 acc 53.125 (54.559)	lr 0.00022
Warmup Train [39][1070/3239]	Time 0.493 (0.525)	Data 0.001 (0.020)	Loss 3.8290 (4.0040)	Top-1 acc 33.594 (31.145)	Top-5 acc 57.422 (54.567)	lr 0.00021
Warmup Train [39][1080/3239]	Time 0.629 (0.525)	Data 0.001 (0.020)	Loss 3.8967 (4.0042)	Top-1 acc 38.281 (31.148)	Top-5 acc 55.859 (54.553)	lr 0.00021
Warmup Train [39][1090/3239]	Time 0.428 (0.525)	Data 0.001 (0.020)	Loss 4.2168 (4.0041)	Top-1 acc 25.781 (31.139)	Top-5 acc 53.125 (54.558)	lr 0.00021
Warmup Train [39][1100/3239]	Time 0.320 (0.525)	Data 0.001 (0.020)	Loss 3.9413 (4.0042)	Top-1 acc 34.766 (31.143)	Top-5 acc 53.125 (54.549)	lr 0.00021
Warmup Train [39][1110/3239]	Time 0.584 (0.525)	Data 0.001 (0.020)	Loss 3.9783 (4.0041)	Top-1 acc 32.812 (31.145)	Top-5 acc 56.641 (54.562)	lr 0.00021
Warmup Train [39][1120/3239]	Time 0.499 (0.524)	Data 0.001 (0.020)	Loss 4.1488 (4.0041)	Top-1 acc 26.953 (31.148)	Top-5 acc 53.516 (54.556)	lr 0.00021
Warmup Train [39][1130/3239]	Time 0.548 (0.524)	Data 0.001 (0.020)	Loss 3.9950 (4.0040)	Top-1 acc 33.984 (31.153)	Top-5 acc 53.906 (54.557)	lr 0.00021
Warmup Train [39][1140/3239]	Time 0.535 (0.524)	Data 0.001 (0.019)	Loss 3.9590 (4.0036)	Top-1 acc 32.031 (31.162)	Top-5 acc 57.812 (54.578)	lr 0.00021
Warmup Train [39][1150/3239]	Time 0.567 (0.524)	Data 0.001 (0.019)	Loss 3.9276 (4.0037)	Top-1 acc 28.906 (31.160)	Top-5 acc 57.812 (54.582)	lr 0.00021
Warmup Train [39][1160/3239]	Time 0.399 (0.524)	Data 0.001 (0.019)	Loss 4.0987 (4.0038)	Top-1 acc 33.203 (31.162)	Top-5 acc 53.125 (54.585)	lr 0.00021
Warmup Train [39][1170/3239]	Time 0.629 (0.524)	Data 0.001 (0.019)	Loss 3.9099 (4.0035)	Top-1 acc 34.375 (31.166)	Top-5 acc 57.812 (54.587)	lr 0.00021
Warmup Train [39][1180/3239]	Time 0.405 (0.524)	Data 0.001 (0.019)	Loss 4.2141 (4.0035)	Top-1 acc 26.562 (31.163)	Top-5 acc 47.656 (54.585)	lr 0.00021
Warmup Train [39][1190/3239]	Time 0.390 (0.524)	Data 0.001 (0.019)	Loss 3.9971 (4.0037)	Top-1 acc 28.906 (31.142)	Top-5 acc 58.203 (54.585)	lr 0.00021
Warmup Train [39][1200/3239]	Time 0.581 (0.523)	Data 0.001 (0.019)	Loss 4.0495 (4.0041)	Top-1 acc 28.906 (31.130)	Top-5 acc 52.344 (54.576)	lr 0.00020
Warmup Train [39][1210/3239]	Time 0.548 (0.523)	Data 0.001 (0.019)	Loss 4.0124 (4.0040)	Top-1 acc 31.250 (31.130)	Top-5 acc 56.641 (54.587)	lr 0.00020
Warmup Train [39][1220/3239]	Time 0.513 (0.524)	Data 0.001 (0.019)	Loss 4.1998 (4.0049)	Top-1 acc 26.953 (31.115)	Top-5 acc 50.781 (54.562)	lr 0.00020
Warmup Train [39][1230/3239]	Time 0.512 (0.524)	Data 0.001 (0.019)	Loss 4.0599 (4.0048)	Top-1 acc 28.906 (31.120)	Top-5 acc 51.562 (54.552)	lr 0.00020
Warmup Train [39][1240/3239]	Time 0.548 (0.523)	Data 0.001 (0.018)	Loss 4.1366 (4.0045)	Top-1 acc 31.250 (31.128)	Top-5 acc 51.562 (54.555)	lr 0.00020
Warmup Train [39][1250/3239]	Time 0.487 (0.523)	Data 0.001 (0.018)	Loss 4.0668 (4.0045)	Top-1 acc 28.906 (31.134)	Top-5 acc 51.172 (54.557)	lr 0.00020
Warmup Train [39][1260/3239]	Time 0.375 (0.523)	Data 0.001 (0.018)	Loss 3.9996 (4.0048)	Top-1 acc 33.984 (31.131)	Top-5 acc 52.734 (54.542)	lr 0.00020
Warmup Train [39][1270/3239]	Time 0.733 (0.523)	Data 0.001 (0.018)	Loss 4.0257 (4.0049)	Top-1 acc 33.594 (31.138)	Top-5 acc 56.641 (54.538)	lr 0.00020
Warmup Train [39][1280/3239]	Time 0.548 (0.522)	Data 0.001 (0.018)	Loss 3.8422 (4.0049)	Top-1 acc 31.641 (31.136)	Top-5 acc 58.594 (54.545)	lr 0.00020
Warmup Train [39][1290/3239]	Time 0.521 (0.522)	Data 0.001 (0.018)	Loss 4.1470 (4.0042)	Top-1 acc 28.516 (31.154)	Top-5 acc 51.953 (54.561)	lr 0.00020
Warmup Train [39][1300/3239]	Time 0.565 (0.522)	Data 0.001 (0.018)	Loss 3.7927 (4.0039)	Top-1 acc 37.500 (31.164)	Top-5 acc 62.109 (54.568)	lr 0.00020
Warmup Train [39][1310/3239]	Time 0.524 (0.522)	Data 0.001 (0.018)	Loss 3.9389 (4.0041)	Top-1 acc 28.516 (31.155)	Top-5 acc 54.688 (54.563)	lr 0.00020
Warmup Train [39][1320/3239]	Time 0.407 (0.522)	Data 0.001 (0.018)	Loss 4.0398 (4.0042)	Top-1 acc 31.641 (31.158)	Top-5 acc 53.125 (54.557)	lr 0.00020
Warmup Train [39][1330/3239]	Time 0.538 (0.522)	Data 0.001 (0.018)	Loss 4.1989 (4.0046)	Top-1 acc 26.172 (31.146)	Top-5 acc 50.000 (54.549)	lr 0.00019
Warmup Train [39][1340/3239]	Time 0.397 (0.522)	Data 0.001 (0.017)	Loss 4.0774 (4.0043)	Top-1 acc 30.078 (31.156)	Top-5 acc 52.734 (54.559)	lr 0.00019
Warmup Train [39][1350/3239]	Time 0.514 (0.522)	Data 0.001 (0.017)	Loss 4.0559 (4.0043)	Top-1 acc 26.953 (31.161)	Top-5 acc 51.172 (54.557)	lr 0.00019
Warmup Train [39][1360/3239]	Time 0.668 (0.522)	Data 0.001 (0.017)	Loss 3.9015 (4.0043)	Top-1 acc 33.203 (31.163)	Top-5 acc 57.422 (54.555)	lr 0.00019
Warmup Train [39][1370/3239]	Time 0.512 (0.522)	Data 0.001 (0.017)	Loss 4.1758 (4.0044)	Top-1 acc 26.953 (31.158)	Top-5 acc 50.391 (54.563)	lr 0.00019
Warmup Train [39][1380/3239]	Time 0.602 (0.522)	Data 0.001 (0.017)	Loss 4.1064 (4.0040)	Top-1 acc 27.344 (31.158)	Top-5 acc 46.484 (54.570)	lr 0.00019
Warmup Train [39][1390/3239]	Time 0.360 (0.522)	Data 0.001 (0.017)	Loss 4.0733 (4.0044)	Top-1 acc 28.516 (31.154)	Top-5 acc 53.906 (54.563)	lr 0.00019
Warmup Train [39][1400/3239]	Time 0.476 (0.522)	Data 0.001 (0.017)	Loss 3.7349 (4.0043)	Top-1 acc 36.328 (31.157)	Top-5 acc 56.250 (54.556)	lr 0.00019
Warmup Train [39][1410/3239]	Time 0.579 (0.522)	Data 0.001 (0.017)	Loss 3.9925 (4.0043)	Top-1 acc 31.250 (31.156)	Top-5 acc 55.469 (54.565)	lr 0.00019
Warmup Train [39][1420/3239]	Time 0.636 (0.522)	Data 0.001 (0.017)	Loss 3.9748 (4.0043)	Top-1 acc 30.078 (31.158)	Top-5 acc 56.641 (54.564)	lr 0.00019
Warmup Train [39][1430/3239]	Time 0.492 (0.522)	Data 0.001 (0.017)	Loss 4.0581 (4.0046)	Top-1 acc 28.516 (31.143)	Top-5 acc 52.344 (54.556)	lr 0.00019
Warmup Train [39][1440/3239]	Time 0.352 (0.521)	Data 0.001 (0.017)	Loss 4.2183 (4.0049)	Top-1 acc 26.953 (31.136)	Top-5 acc 48.828 (54.551)	lr 0.00019
Warmup Train [39][1450/3239]	Time 0.398 (0.522)	Data 0.001 (0.017)	Loss 4.3407 (4.0052)	Top-1 acc 28.516 (31.127)	Top-5 acc 46.094 (54.545)	lr 0.00019
Warmup Train [39][1460/3239]	Time 0.596 (0.522)	Data 0.001 (0.017)	Loss 3.9234 (4.0050)	Top-1 acc 34.375 (31.133)	Top-5 acc 57.031 (54.544)	lr 0.00018
Warmup Train [39][1470/3239]	Time 0.556 (0.522)	Data 0.001 (0.016)	Loss 3.8528 (4.0044)	Top-1 acc 31.641 (31.147)	Top-5 acc 58.203 (54.554)	lr 0.00018
Warmup Train [39][1480/3239]	Time 0.379 (0.521)	Data 0.001 (0.016)	Loss 3.9860 (4.0043)	Top-1 acc 33.203 (31.144)	Top-5 acc 57.031 (54.557)	lr 0.00018
Warmup Train [39][1490/3239]	Time 0.355 (0.521)	Data 0.001 (0.016)	Loss 4.1688 (4.0043)	Top-1 acc 27.734 (31.144)	Top-5 acc 51.953 (54.566)	lr 0.00018
Warmup Train [39][1500/3239]	Time 0.313 (0.521)	Data 0.001 (0.016)	Loss 4.0742 (4.0042)	Top-1 acc 31.641 (31.148)	Top-5 acc 53.516 (54.572)	lr 0.00018
Warmup Train [39][1510/3239]	Time 0.476 (0.521)	Data 0.001 (0.016)	Loss 3.8417 (4.0042)	Top-1 acc 34.766 (31.152)	Top-5 acc 58.203 (54.566)	lr 0.00018
Warmup Train [39][1520/3239]	Time 0.526 (0.521)	Data 0.001 (0.016)	Loss 3.9997 (4.0041)	Top-1 acc 32.031 (31.153)	Top-5 acc 53.906 (54.567)	lr 0.00018
Warmup Train [39][1530/3239]	Time 0.412 (0.520)	Data 0.002 (0.016)	Loss 3.9400 (4.0037)	Top-1 acc 31.250 (31.158)	Top-5 acc 55.078 (54.570)	lr 0.00018
Warmup Train [39][1540/3239]	Time 0.418 (0.520)	Data 0.001 (0.016)	Loss 4.0566 (4.0038)	Top-1 acc 31.250 (31.164)	Top-5 acc 51.562 (54.567)	lr 0.00018
Warmup Train [39][1550/3239]	Time 0.526 (0.520)	Data 0.001 (0.016)	Loss 4.1184 (4.0041)	Top-1 acc 25.781 (31.151)	Top-5 acc 51.953 (54.559)	lr 0.00018
Warmup Train [39][1560/3239]	Time 0.555 (0.520)	Data 0.002 (0.016)	Loss 3.9793 (4.0039)	Top-1 acc 31.641 (31.150)	Top-5 acc 57.422 (54.566)	lr 0.00018
Warmup Train [39][1570/3239]	Time 0.453 (0.520)	Data 0.001 (0.016)	Loss 4.2772 (4.0041)	Top-1 acc 25.781 (31.143)	Top-5 acc 51.172 (54.568)	lr 0.00018
Warmup Train [39][1580/3239]	Time 0.563 (0.520)	Data 0.001 (0.016)	Loss 4.1635 (4.0038)	Top-1 acc 28.125 (31.147)	Top-5 acc 51.562 (54.573)	lr 0.00018
Warmup Train [39][1590/3239]	Time 0.502 (0.520)	Data 0.001 (0.016)	Loss 4.0326 (4.0040)	Top-1 acc 30.078 (31.143)	Top-5 acc 51.562 (54.572)	lr 0.00018
Warmup Train [39][1600/3239]	Time 0.418 (0.520)	Data 0.001 (0.016)	Loss 3.9567 (4.0039)	Top-1 acc 33.594 (31.147)	Top-5 acc 57.422 (54.571)	lr 0.00017
Warmup Train [39][1610/3239]	Time 0.480 (0.520)	Data 0.001 (0.016)	Loss 3.8751 (4.0040)	Top-1 acc 31.250 (31.138)	Top-5 acc 55.859 (54.567)	lr 0.00017
Warmup Train [39][1620/3239]	Time 0.431 (0.520)	Data 0.001 (0.016)	Loss 4.0113 (4.0037)	Top-1 acc 32.422 (31.146)	Top-5 acc 51.562 (54.574)	lr 0.00017
Warmup Train [39][1630/3239]	Time 0.511 (0.520)	Data 0.001 (0.016)	Loss 3.9935 (4.0038)	Top-1 acc 32.031 (31.140)	Top-5 acc 58.984 (54.571)	lr 0.00017
Warmup Train [39][1640/3239]	Time 0.638 (0.520)	Data 0.001 (0.016)	Loss 3.9569 (4.0038)	Top-1 acc 34.766 (31.144)	Top-5 acc 54.688 (54.566)	lr 0.00017
Warmup Train [39][1650/3239]	Time 0.402 (0.520)	Data 0.001 (0.016)	Loss 4.0041 (4.0038)	Top-1 acc 28.516 (31.139)	Top-5 acc 56.250 (54.565)	lr 0.00017
Warmup Train [39][1660/3239]	Time 0.444 (0.520)	Data 0.001 (0.016)	Loss 4.0273 (4.0039)	Top-1 acc 30.859 (31.135)	Top-5 acc 53.906 (54.565)	lr 0.00017
Warmup Train [39][1670/3239]	Time 0.552 (0.520)	Data 0.001 (0.016)	Loss 3.9738 (4.0043)	Top-1 acc 33.594 (31.129)	Top-5 acc 51.953 (54.556)	lr 0.00017
Warmup Train [39][1680/3239]	Time 0.817 (0.520)	Data 0.001 (0.016)	Loss 3.8051 (4.0044)	Top-1 acc 28.906 (31.123)	Top-5 acc 56.250 (54.548)	lr 0.00017
Warmup Train [39][1690/3239]	Time 0.446 (0.520)	Data 0.001 (0.016)	Loss 4.0092 (4.0045)	Top-1 acc 29.688 (31.118)	Top-5 acc 56.250 (54.547)	lr 0.00017
Warmup Train [39][1700/3239]	Time 0.526 (0.520)	Data 0.001 (0.015)	Loss 3.9958 (4.0045)	Top-1 acc 32.031 (31.120)	Top-5 acc 55.469 (54.547)	lr 0.00017
Warmup Train [39][1710/3239]	Time 0.531 (0.520)	Data 0.001 (0.015)	Loss 4.0443 (4.0045)	Top-1 acc 30.078 (31.122)	Top-5 acc 52.344 (54.551)	lr 0.00017
Warmup Train [39][1720/3239]	Time 0.604 (0.520)	Data 0.001 (0.015)	Loss 3.9697 (4.0044)	Top-1 acc 32.812 (31.122)	Top-5 acc 56.641 (54.558)	lr 0.00017
Warmup Train [39][1730/3239]	Time 0.461 (0.519)	Data 0.001 (0.015)	Loss 3.9879 (4.0042)	Top-1 acc 33.594 (31.126)	Top-5 acc 53.125 (54.568)	lr 0.00017
Warmup Train [39][1740/3239]	Time 0.564 (0.519)	Data 0.001 (0.015)	Loss 3.9729 (4.0041)	Top-1 acc 31.250 (31.128)	Top-5 acc 57.031 (54.572)	lr 0.00016
Warmup Train [39][1750/3239]	Time 0.492 (0.519)	Data 0.001 (0.015)	Loss 4.0561 (4.0040)	Top-1 acc 28.906 (31.127)	Top-5 acc 53.516 (54.572)	lr 0.00016
Warmup Train [39][1760/3239]	Time 0.535 (0.519)	Data 0.001 (0.015)	Loss 3.9830 (4.0038)	Top-1 acc 30.859 (31.130)	Top-5 acc 54.688 (54.578)	lr 0.00016
Warmup Train [39][1770/3239]	Time 0.714 (0.519)	Data 0.001 (0.015)	Loss 4.0232 (4.0037)	Top-1 acc 26.562 (31.121)	Top-5 acc 53.125 (54.578)	lr 0.00016
Warmup Train [39][1780/3239]	Time 0.424 (0.518)	Data 0.002 (0.015)	Loss 3.8924 (4.0039)	Top-1 acc 32.031 (31.120)	Top-5 acc 52.344 (54.572)	lr 0.00016
Warmup Train [39][1790/3239]	Time 0.614 (0.518)	Data 0.001 (0.015)	Loss 3.9976 (4.0040)	Top-1 acc 32.812 (31.121)	Top-5 acc 52.734 (54.565)	lr 0.00016
Warmup Train [39][1800/3239]	Time 0.344 (0.518)	Data 0.001 (0.015)	Loss 4.1501 (4.0043)	Top-1 acc 27.344 (31.114)	Top-5 acc 50.391 (54.557)	lr 0.00016
Warmup Train [39][1810/3239]	Time 0.386 (0.518)	Data 0.001 (0.015)	Loss 3.9016 (4.0043)	Top-1 acc 32.812 (31.119)	Top-5 acc 55.078 (54.556)	lr 0.00016
Warmup Train [39][1820/3239]	Time 0.617 (0.518)	Data 0.001 (0.015)	Loss 4.2466 (4.0043)	Top-1 acc 25.781 (31.114)	Top-5 acc 50.391 (54.553)	lr 0.00016
Warmup Train [39][1830/3239]	Time 0.572 (0.518)	Data 0.001 (0.015)	Loss 4.0285 (4.0043)	Top-1 acc 27.734 (31.116)	Top-5 acc 57.031 (54.552)	lr 0.00016
Warmup Train [39][1840/3239]	Time 0.514 (0.518)	Data 0.001 (0.015)	Loss 4.0628 (4.0047)	Top-1 acc 27.344 (31.111)	Top-5 acc 51.953 (54.547)	lr 0.00016
Warmup Train [39][1850/3239]	Time 0.620 (0.518)	Data 0.001 (0.015)	Loss 3.9379 (4.0046)	Top-1 acc 35.156 (31.119)	Top-5 acc 58.594 (54.551)	lr 0.00016
Warmup Train [39][1860/3239]	Time 0.548 (0.518)	Data 0.001 (0.015)	Loss 3.9638 (4.0045)	Top-1 acc 28.516 (31.114)	Top-5 acc 57.422 (54.554)	lr 0.00016
Warmup Train [39][1870/3239]	Time 0.544 (0.518)	Data 0.001 (0.014)	Loss 4.0461 (4.0043)	Top-1 acc 30.078 (31.117)	Top-5 acc 52.734 (54.558)	lr 0.00016
Warmup Train [39][1880/3239]	Time 0.476 (0.518)	Data 0.001 (0.014)	Loss 4.0372 (4.0040)	Top-1 acc 28.125 (31.116)	Top-5 acc 53.516 (54.556)	lr 0.00016
Warmup Train [39][1890/3239]	Time 0.663 (0.518)	Data 0.001 (0.014)	Loss 3.8817 (4.0042)	Top-1 acc 37.109 (31.114)	Top-5 acc 57.031 (54.554)	lr 0.00015
Warmup Train [39][1900/3239]	Time 0.353 (0.518)	Data 0.001 (0.014)	Loss 4.0385 (4.0040)	Top-1 acc 28.906 (31.125)	Top-5 acc 52.344 (54.560)	lr 0.00015
Warmup Train [39][1910/3239]	Time 0.335 (0.518)	Data 0.001 (0.014)	Loss 4.1613 (4.0037)	Top-1 acc 27.344 (31.128)	Top-5 acc 50.391 (54.569)	lr 0.00015
Warmup Train [39][1920/3239]	Time 0.578 (0.518)	Data 0.001 (0.014)	Loss 3.9761 (4.0036)	Top-1 acc 25.781 (31.125)	Top-5 acc 54.688 (54.571)	lr 0.00015
Warmup Train [39][1930/3239]	Time 0.494 (0.518)	Data 0.001 (0.014)	Loss 4.1783 (4.0039)	Top-1 acc 28.516 (31.123)	Top-5 acc 52.344 (54.565)	lr 0.00015
Warmup Train [39][1940/3239]	Time 0.539 (0.518)	Data 0.001 (0.014)	Loss 4.0897 (4.0040)	Top-1 acc 29.688 (31.124)	Top-5 acc 53.516 (54.564)	lr 0.00015
Warmup Train [39][1950/3239]	Time 0.539 (0.518)	Data 0.001 (0.014)	Loss 4.1921 (4.0039)	Top-1 acc 26.172 (31.123)	Top-5 acc 51.562 (54.567)	lr 0.00015
Warmup Train [39][1960/3239]	Time 0.572 (0.518)	Data 0.001 (0.014)	Loss 3.9571 (4.0038)	Top-1 acc 30.078 (31.123)	Top-5 acc 55.859 (54.569)	lr 0.00015
Warmup Train [39][1970/3239]	Time 0.307 (0.518)	Data 0.001 (0.014)	Loss 3.9207 (4.0036)	Top-1 acc 32.422 (31.128)	Top-5 acc 57.812 (54.579)	lr 0.00015
Warmup Train [39][1980/3239]	Time 0.473 (0.518)	Data 0.001 (0.014)	Loss 3.9315 (4.0035)	Top-1 acc 32.422 (31.126)	Top-5 acc 58.984 (54.582)	lr 0.00015
Warmup Train [39][1990/3239]	Time 0.442 (0.518)	Data 0.001 (0.014)	Loss 4.0640 (4.0038)	Top-1 acc 30.859 (31.122)	Top-5 acc 53.516 (54.580)	lr 0.00015
Warmup Train [39][2000/3239]	Time 0.630 (0.518)	Data 0.001 (0.014)	Loss 4.0495 (4.0041)	Top-1 acc 33.203 (31.118)	Top-5 acc 53.906 (54.573)	lr 0.00015
Warmup Train [39][2010/3239]	Time 0.279 (0.517)	Data 0.001 (0.014)	Loss 4.1493 (4.0041)	Top-1 acc 29.297 (31.118)	Top-5 acc 51.953 (54.568)	lr 0.00015
Warmup Train [39][2020/3239]	Time 0.472 (0.517)	Data 0.001 (0.014)	Loss 3.8098 (4.0040)	Top-1 acc 34.766 (31.122)	Top-5 acc 59.766 (54.568)	lr 0.00015
Warmup Train [39][2030/3239]	Time 0.207 (0.517)	Data 0.001 (0.014)	Loss 3.9229 (4.0042)	Top-1 acc 32.422 (31.122)	Top-5 acc 57.812 (54.566)	lr 0.00015
Warmup Train [39][2040/3239]	Time 0.605 (0.517)	Data 0.001 (0.014)	Loss 4.1495 (4.0042)	Top-1 acc 26.562 (31.121)	Top-5 acc 46.875 (54.564)	lr 0.00014
Warmup Train [39][2050/3239]	Time 0.349 (0.517)	Data 0.002 (0.014)	Loss 3.9295 (4.0040)	Top-1 acc 30.469 (31.125)	Top-5 acc 55.469 (54.568)	lr 0.00014
Warmup Train [39][2060/3239]	Time 0.590 (0.517)	Data 0.001 (0.014)	Loss 3.9717 (4.0041)	Top-1 acc 31.641 (31.119)	Top-5 acc 57.422 (54.562)	lr 0.00014
Warmup Train [39][2070/3239]	Time 0.487 (0.517)	Data 0.001 (0.014)	Loss 3.9932 (4.0040)	Top-1 acc 32.422 (31.128)	Top-5 acc 56.250 (54.568)	lr 0.00014
Warmup Train [39][2080/3239]	Time 0.553 (0.517)	Data 0.001 (0.014)	Loss 4.0184 (4.0041)	Top-1 acc 33.984 (31.132)	Top-5 acc 56.641 (54.568)	lr 0.00014
Warmup Train [39][2090/3239]	Time 0.372 (0.517)	Data 0.001 (0.014)	Loss 3.9516 (4.0042)	Top-1 acc 30.469 (31.132)	Top-5 acc 57.422 (54.568)	lr 0.00014
Warmup Train [39][2100/3239]	Time 0.650 (0.517)	Data 0.001 (0.014)	Loss 3.8944 (4.0042)	Top-1 acc 33.203 (31.136)	Top-5 acc 55.469 (54.565)	lr 0.00014
Warmup Train [39][2110/3239]	Time 0.368 (0.517)	Data 0.031 (0.014)	Loss 4.0143 (4.0041)	Top-1 acc 30.859 (31.134)	Top-5 acc 51.953 (54.562)	lr 0.00014
Warmup Train [39][2120/3239]	Time 0.562 (0.517)	Data 0.001 (0.014)	Loss 3.9699 (4.0041)	Top-1 acc 27.734 (31.132)	Top-5 acc 55.078 (54.562)	lr 0.00014
Warmup Train [39][2130/3239]	Time 0.541 (0.517)	Data 0.001 (0.014)	Loss 4.0116 (4.0041)	Top-1 acc 29.297 (31.130)	Top-5 acc 53.516 (54.560)	lr 0.00014
Warmup Train [39][2140/3239]	Time 0.490 (0.517)	Data 0.001 (0.014)	Loss 3.9101 (4.0042)	Top-1 acc 34.375 (31.129)	Top-5 acc 54.297 (54.558)	lr 0.00014
Warmup Train [39][2150/3239]	Time 0.613 (0.517)	Data 0.002 (0.014)	Loss 4.0012 (4.0043)	Top-1 acc 30.859 (31.127)	Top-5 acc 55.859 (54.556)	lr 0.00014
Warmup Train [39][2160/3239]	Time 0.518 (0.517)	Data 0.001 (0.014)	Loss 4.0899 (4.0043)	Top-1 acc 30.859 (31.129)	Top-5 acc 52.344 (54.558)	lr 0.00014
Warmup Train [39][2170/3239]	Time 0.466 (0.517)	Data 0.001 (0.014)	Loss 4.0287 (4.0044)	Top-1 acc 30.859 (31.129)	Top-5 acc 53.125 (54.555)	lr 0.00014
Warmup Train [39][2180/3239]	Time 0.359 (0.517)	Data 0.001 (0.014)	Loss 3.8765 (4.0045)	Top-1 acc 32.422 (31.125)	Top-5 acc 56.641 (54.549)	lr 0.00014
Warmup Train [39][2190/3239]	Time 0.493 (0.517)	Data 0.001 (0.014)	Loss 4.0892 (4.0041)	Top-1 acc 30.469 (31.131)	Top-5 acc 53.516 (54.554)	lr 0.00014
Warmup Train [39][2200/3239]	Time 0.517 (0.517)	Data 0.001 (0.014)	Loss 4.0099 (4.0040)	Top-1 acc 28.906 (31.133)	Top-5 acc 53.906 (54.562)	lr 0.00013
Warmup Train [39][2210/3239]	Time 0.568 (0.517)	Data 0.001 (0.014)	Loss 4.0218 (4.0040)	Top-1 acc 31.641 (31.136)	Top-5 acc 55.859 (54.562)	lr 0.00013
Warmup Train [39][2220/3239]	Time 0.683 (0.517)	Data 0.001 (0.014)	Loss 4.1070 (4.0040)	Top-1 acc 31.641 (31.135)	Top-5 acc 52.344 (54.559)	lr 0.00013
Warmup Train [39][2230/3239]	Time 0.468 (0.517)	Data 0.001 (0.013)	Loss 3.9276 (4.0041)	Top-1 acc 30.469 (31.134)	Top-5 acc 57.422 (54.560)	lr 0.00013
Warmup Train [39][2240/3239]	Time 0.471 (0.517)	Data 0.001 (0.013)	Loss 3.9184 (4.0039)	Top-1 acc 33.594 (31.139)	Top-5 acc 58.984 (54.568)	lr 0.00013
Warmup Train [39][2250/3239]	Time 0.366 (0.517)	Data 0.001 (0.013)	Loss 4.1118 (4.0044)	Top-1 acc 33.203 (31.139)	Top-5 acc 53.125 (54.561)	lr 0.00013
Warmup Train [39][2260/3239]	Time 0.544 (0.517)	Data 0.002 (0.013)	Loss 3.7624 (4.0041)	Top-1 acc 33.203 (31.142)	Top-5 acc 59.766 (54.568)	lr 0.00013
Warmup Train [39][2270/3239]	Time 0.483 (0.517)	Data 0.001 (0.013)	Loss 3.9975 (4.0040)	Top-1 acc 30.469 (31.149)	Top-5 acc 52.344 (54.576)	lr 0.00013
Warmup Train [39][2280/3239]	Time 0.397 (0.516)	Data 0.001 (0.013)	Loss 3.9763 (4.0040)	Top-1 acc 33.594 (31.152)	Top-5 acc 56.250 (54.578)	lr 0.00013
Warmup Train [39][2290/3239]	Time 0.608 (0.516)	Data 0.001 (0.013)	Loss 4.0004 (4.0040)	Top-1 acc 36.719 (31.154)	Top-5 acc 57.031 (54.577)	lr 0.00013
Warmup Train [39][2300/3239]	Time 0.482 (0.516)	Data 0.001 (0.013)	Loss 4.0133 (4.0041)	Top-1 acc 30.859 (31.149)	Top-5 acc 55.469 (54.572)	lr 0.00013
Warmup Train [39][2310/3239]	Time 0.490 (0.516)	Data 0.001 (0.013)	Loss 4.1343 (4.0044)	Top-1 acc 30.469 (31.145)	Top-5 acc 51.953 (54.565)	lr 0.00013
Warmup Train [39][2320/3239]	Time 0.424 (0.516)	Data 0.001 (0.013)	Loss 3.9072 (4.0042)	Top-1 acc 30.859 (31.149)	Top-5 acc 56.250 (54.570)	lr 0.00013
Warmup Train [39][2330/3239]	Time 0.502 (0.516)	Data 0.001 (0.013)	Loss 3.9458 (4.0043)	Top-1 acc 33.203 (31.143)	Top-5 acc 56.250 (54.569)	lr 0.00013
Warmup Train [39][2340/3239]	Time 0.442 (0.516)	Data 0.001 (0.013)	Loss 3.8344 (4.0045)	Top-1 acc 36.328 (31.137)	Top-5 acc 60.938 (54.567)	lr 0.00013
Warmup Train [39][2350/3239]	Time 0.489 (0.516)	Data 0.001 (0.013)	Loss 4.1621 (4.0042)	Top-1 acc 28.906 (31.138)	Top-5 acc 50.000 (54.576)	lr 0.00013
Warmup Train [39][2360/3239]	Time 0.411 (0.516)	Data 0.001 (0.013)	Loss 4.0091 (4.0041)	Top-1 acc 29.688 (31.138)	Top-5 acc 55.078 (54.573)	lr 0.00012
Warmup Train [39][2370/3239]	Time 0.520 (0.516)	Data 0.001 (0.013)	Loss 3.9294 (4.0041)	Top-1 acc 32.812 (31.143)	Top-5 acc 56.641 (54.579)	lr 0.00012
Warmup Train [39][2380/3239]	Time 0.562 (0.516)	Data 0.001 (0.013)	Loss 4.0270 (4.0040)	Top-1 acc 30.078 (31.145)	Top-5 acc 54.688 (54.581)	lr 0.00012
Warmup Train [39][2390/3239]	Time 0.360 (0.516)	Data 0.026 (0.013)	Loss 4.0931 (4.0043)	Top-1 acc 29.297 (31.139)	Top-5 acc 51.953 (54.577)	lr 0.00012
Warmup Train [39][2400/3239]	Time 0.363 (0.516)	Data 0.001 (0.013)	Loss 4.1801 (4.0040)	Top-1 acc 25.781 (31.146)	Top-5 acc 50.781 (54.585)	lr 0.00012
Warmup Train [39][2410/3239]	Time 0.557 (0.516)	Data 0.001 (0.013)	Loss 4.1696 (4.0040)	Top-1 acc 26.562 (31.147)	Top-5 acc 51.953 (54.591)	lr 0.00012
Warmup Train [39][2420/3239]	Time 0.491 (0.516)	Data 0.001 (0.013)	Loss 4.1048 (4.0039)	Top-1 acc 26.562 (31.145)	Top-5 acc 52.344 (54.594)	lr 0.00012
Warmup Train [39][2430/3239]	Time 0.409 (0.516)	Data 0.001 (0.013)	Loss 3.8503 (4.0038)	Top-1 acc 30.859 (31.144)	Top-5 acc 56.641 (54.593)	lr 0.00012
Warmup Train [39][2440/3239]	Time 0.350 (0.516)	Data 0.001 (0.013)	Loss 4.1201 (4.0041)	Top-1 acc 28.125 (31.137)	Top-5 acc 50.391 (54.586)	lr 0.00012
Warmup Train [39][2450/3239]	Time 0.362 (0.516)	Data 0.001 (0.013)	Loss 4.1684 (4.0043)	Top-1 acc 26.953 (31.135)	Top-5 acc 50.781 (54.579)	lr 0.00012
Warmup Train [39][2460/3239]	Time 0.684 (0.516)	Data 0.001 (0.013)	Loss 3.9379 (4.0042)	Top-1 acc 32.031 (31.132)	Top-5 acc 53.906 (54.580)	lr 0.00012
Warmup Train [39][2470/3239]	Time 0.576 (0.516)	Data 0.001 (0.013)	Loss 3.9953 (4.0044)	Top-1 acc 28.516 (31.128)	Top-5 acc 57.422 (54.577)	lr 0.00012
Warmup Train [39][2480/3239]	Time 0.548 (0.516)	Data 0.001 (0.013)	Loss 4.1014 (4.0043)	Top-1 acc 27.344 (31.132)	Top-5 acc 52.734 (54.580)	lr 0.00012
Warmup Train [39][2490/3239]	Time 0.597 (0.516)	Data 0.001 (0.013)	Loss 3.9357 (4.0042)	Top-1 acc 32.031 (31.132)	Top-5 acc 55.859 (54.578)	lr 0.00012
Warmup Train [39][2500/3239]	Time 0.341 (0.516)	Data 0.001 (0.013)	Loss 3.9233 (4.0039)	Top-1 acc 31.641 (31.137)	Top-5 acc 54.297 (54.583)	lr 0.00012
Warmup Train [39][2510/3239]	Time 0.522 (0.516)	Data 0.001 (0.013)	Loss 4.0337 (4.0041)	Top-1 acc 30.859 (31.134)	Top-5 acc 52.344 (54.578)	lr 0.00012
Warmup Train [39][2520/3239]	Time 0.402 (0.516)	Data 0.001 (0.013)	Loss 3.7275 (4.0040)	Top-1 acc 34.375 (31.135)	Top-5 acc 59.375 (54.583)	lr 0.00012
Warmup Train [39][2530/3239]	Time 0.407 (0.516)	Data 0.001 (0.013)	Loss 3.9701 (4.0041)	Top-1 acc 30.469 (31.129)	Top-5 acc 56.641 (54.581)	lr 0.00011
Warmup Train [39][2540/3239]	Time 0.525 (0.515)	Data 0.002 (0.013)	Loss 3.9696 (4.0042)	Top-1 acc 32.422 (31.129)	Top-5 acc 54.688 (54.582)	lr 0.00011
Warmup Train [39][2550/3239]	Time 0.531 (0.515)	Data 0.001 (0.013)	Loss 3.8910 (4.0040)	Top-1 acc 30.859 (31.131)	Top-5 acc 54.297 (54.586)	lr 0.00011
Warmup Train [39][2560/3239]	Time 0.559 (0.515)	Data 0.001 (0.013)	Loss 4.0861 (4.0040)	Top-1 acc 30.469 (31.130)	Top-5 acc 51.953 (54.586)	lr 0.00011
Warmup Train [39][2570/3239]	Time 0.525 (0.515)	Data 0.001 (0.013)	Loss 3.9565 (4.0038)	Top-1 acc 33.203 (31.134)	Top-5 acc 56.250 (54.595)	lr 0.00011
Warmup Train [39][2580/3239]	Time 0.540 (0.515)	Data 0.001 (0.013)	Loss 3.9233 (4.0035)	Top-1 acc 32.422 (31.141)	Top-5 acc 53.516 (54.601)	lr 0.00011
Warmup Train [39][2590/3239]	Time 0.474 (0.516)	Data 0.001 (0.013)	Loss 4.1802 (4.0034)	Top-1 acc 28.125 (31.142)	Top-5 acc 52.734 (54.606)	lr 0.00011
Warmup Train [39][2600/3239]	Time 0.501 (0.515)	Data 0.001 (0.013)	Loss 4.0282 (4.0035)	Top-1 acc 31.250 (31.140)	Top-5 acc 51.562 (54.604)	lr 0.00011
Warmup Train [39][2610/3239]	Time 0.473 (0.516)	Data 0.001 (0.013)	Loss 3.7641 (4.0031)	Top-1 acc 34.375 (31.148)	Top-5 acc 60.547 (54.611)	lr 0.00011
Warmup Train [39][2620/3239]	Time 0.646 (0.515)	Data 0.001 (0.013)	Loss 3.9110 (4.0028)	Top-1 acc 30.859 (31.156)	Top-5 acc 58.203 (54.622)	lr 0.00011
Warmup Train [39][2630/3239]	Time 0.436 (0.515)	Data 0.001 (0.012)	Loss 4.0301 (4.0029)	Top-1 acc 27.734 (31.152)	Top-5 acc 53.125 (54.614)	lr 0.00011
Warmup Train [39][2640/3239]	Time 0.619 (0.516)	Data 0.001 (0.012)	Loss 4.1101 (4.0029)	Top-1 acc 30.078 (31.152)	Top-5 acc 53.125 (54.612)	lr 0.00011
Warmup Train [39][2650/3239]	Time 0.409 (0.516)	Data 0.001 (0.012)	Loss 4.0556 (4.0028)	Top-1 acc 26.172 (31.153)	Top-5 acc 52.734 (54.615)	lr 0.00011
Warmup Train [39][2660/3239]	Time 0.572 (0.516)	Data 0.001 (0.012)	Loss 4.1360 (4.0028)	Top-1 acc 29.688 (31.153)	Top-5 acc 49.219 (54.616)	lr 0.00011
Warmup Train [39][2670/3239]	Time 0.443 (0.516)	Data 0.001 (0.012)	Loss 4.0500 (4.0028)	Top-1 acc 27.734 (31.158)	Top-5 acc 54.297 (54.620)	lr 0.00011
Warmup Train [39][2680/3239]	Time 0.330 (0.516)	Data 0.001 (0.012)	Loss 4.0971 (4.0028)	Top-1 acc 28.906 (31.155)	Top-5 acc 53.906 (54.622)	lr 0.00011
Warmup Train [39][2690/3239]	Time 0.503 (0.516)	Data 0.001 (0.012)	Loss 3.9617 (4.0029)	Top-1 acc 33.984 (31.155)	Top-5 acc 56.641 (54.621)	lr 0.00011
Warmup Train [39][2700/3239]	Time 0.309 (0.516)	Data 0.001 (0.012)	Loss 4.0416 (4.0028)	Top-1 acc 27.734 (31.155)	Top-5 acc 52.344 (54.623)	lr 0.00010
Warmup Train [39][2710/3239]	Time 0.522 (0.516)	Data 0.001 (0.012)	Loss 3.8265 (4.0026)	Top-1 acc 38.281 (31.158)	Top-5 acc 58.594 (54.629)	lr 0.00010
Warmup Train [39][2720/3239]	Time 0.522 (0.516)	Data 0.001 (0.012)	Loss 4.0717 (4.0030)	Top-1 acc 28.516 (31.154)	Top-5 acc 51.953 (54.619)	lr 0.00010
Warmup Train [39][2730/3239]	Time 0.383 (0.516)	Data 0.001 (0.012)	Loss 3.9806 (4.0031)	Top-1 acc 28.516 (31.150)	Top-5 acc 57.812 (54.620)	lr 0.00010
Warmup Train [39][2740/3239]	Time 0.548 (0.516)	Data 0.001 (0.012)	Loss 3.9819 (4.0030)	Top-1 acc 32.031 (31.156)	Top-5 acc 55.859 (54.627)	lr 0.00010
Warmup Train [39][2750/3239]	Time 0.512 (0.516)	Data 0.001 (0.012)	Loss 3.9904 (4.0029)	Top-1 acc 33.594 (31.159)	Top-5 acc 55.469 (54.628)	lr 0.00010
Warmup Train [39][2760/3239]	Time 0.501 (0.516)	Data 0.001 (0.012)	Loss 4.1935 (4.0029)	Top-1 acc 27.344 (31.162)	Top-5 acc 48.438 (54.626)	lr 0.00010
Warmup Train [39][2770/3239]	Time 0.445 (0.516)	Data 0.001 (0.012)	Loss 3.8378 (4.0029)	Top-1 acc 32.422 (31.160)	Top-5 acc 58.594 (54.627)	lr 0.00010
Warmup Train [39][2780/3239]	Time 0.528 (0.515)	Data 0.001 (0.012)	Loss 3.9079 (4.0030)	Top-1 acc 32.031 (31.159)	Top-5 acc 54.688 (54.623)	lr 0.00010
Warmup Train [39][2790/3239]	Time 0.482 (0.515)	Data 0.001 (0.012)	Loss 3.8357 (4.0027)	Top-1 acc 35.156 (31.164)	Top-5 acc 57.812 (54.630)	lr 0.00010
Warmup Train [39][2800/3239]	Time 0.459 (0.515)	Data 0.001 (0.012)	Loss 3.9305 (4.0026)	Top-1 acc 28.906 (31.165)	Top-5 acc 53.516 (54.631)	lr 0.00010
Warmup Train [39][2810/3239]	Time 0.492 (0.515)	Data 0.001 (0.012)	Loss 3.9485 (4.0027)	Top-1 acc 31.250 (31.162)	Top-5 acc 53.516 (54.624)	lr 0.00010
Warmup Train [39][2820/3239]	Time 0.527 (0.515)	Data 0.001 (0.012)	Loss 4.2057 (4.0029)	Top-1 acc 29.297 (31.160)	Top-5 acc 49.219 (54.616)	lr 0.00010
Warmup Train [39][2830/3239]	Time 0.575 (0.515)	Data 0.001 (0.012)	Loss 4.2367 (4.0029)	Top-1 acc 28.516 (31.159)	Top-5 acc 50.000 (54.618)	lr 0.00010
Warmup Train [39][2840/3239]	Time 0.481 (0.515)	Data 0.001 (0.012)	Loss 3.9493 (4.0028)	Top-1 acc 29.688 (31.160)	Top-5 acc 56.641 (54.618)	lr 0.00010
Warmup Train [39][2850/3239]	Time 0.516 (0.515)	Data 0.001 (0.012)	Loss 4.0480 (4.0026)	Top-1 acc 27.734 (31.164)	Top-5 acc 51.953 (54.618)	lr 0.00010
Warmup Train [39][2860/3239]	Time 0.477 (0.515)	Data 0.001 (0.012)	Loss 4.1212 (4.0027)	Top-1 acc 30.469 (31.163)	Top-5 acc 55.078 (54.616)	lr 0.00010
Warmup Train [39][2870/3239]	Time 0.484 (0.515)	Data 0.001 (0.012)	Loss 3.9644 (4.0028)	Top-1 acc 30.078 (31.161)	Top-5 acc 55.469 (54.613)	lr 0.00010
Warmup Train [39][2880/3239]	Time 0.556 (0.515)	Data 0.001 (0.012)	Loss 4.0621 (4.0029)	Top-1 acc 32.031 (31.159)	Top-5 acc 56.641 (54.612)	lr 0.00010
Warmup Train [39][2890/3239]	Time 0.546 (0.515)	Data 0.001 (0.012)	Loss 4.0129 (4.0032)	Top-1 acc 29.688 (31.150)	Top-5 acc 51.562 (54.605)	lr 0.00009
Warmup Train [39][2900/3239]	Time 0.457 (0.515)	Data 0.001 (0.012)	Loss 3.9570 (4.0031)	Top-1 acc 31.641 (31.151)	Top-5 acc 54.688 (54.603)	lr 0.00009
Warmup Train [39][2910/3239]	Time 0.473 (0.515)	Data 0.001 (0.012)	Loss 3.9908 (4.0030)	Top-1 acc 29.688 (31.152)	Top-5 acc 57.422 (54.605)	lr 0.00009
Warmup Train [39][2920/3239]	Time 0.371 (0.515)	Data 0.001 (0.012)	Loss 3.8780 (4.0029)	Top-1 acc 30.859 (31.155)	Top-5 acc 58.984 (54.608)	lr 0.00009
Warmup Train [39][2930/3239]	Time 0.609 (0.515)	Data 0.001 (0.012)	Loss 3.9865 (4.0031)	Top-1 acc 30.469 (31.148)	Top-5 acc 57.031 (54.605)	lr 0.00009
Warmup Train [39][2940/3239]	Time 0.696 (0.515)	Data 0.001 (0.012)	Loss 3.8969 (4.0030)	Top-1 acc 31.641 (31.150)	Top-5 acc 57.031 (54.607)	lr 0.00009
Warmup Train [39][2950/3239]	Time 0.573 (0.515)	Data 0.001 (0.012)	Loss 3.7103 (4.0031)	Top-1 acc 40.234 (31.147)	Top-5 acc 64.453 (54.604)	lr 0.00009
Warmup Train [39][2960/3239]	Time 0.631 (0.515)	Data 0.001 (0.012)	Loss 3.7770 (4.0032)	Top-1 acc 32.812 (31.146)	Top-5 acc 60.547 (54.605)	lr 0.00009
Warmup Train [39][2970/3239]	Time 0.468 (0.515)	Data 0.001 (0.012)	Loss 3.9115 (4.0032)	Top-1 acc 31.250 (31.146)	Top-5 acc 56.641 (54.604)	lr 0.00009
Warmup Train [39][2980/3239]	Time 0.362 (0.515)	Data 0.001 (0.012)	Loss 4.1576 (4.0034)	Top-1 acc 28.125 (31.142)	Top-5 acc 52.344 (54.602)	lr 0.00009
Warmup Train [39][2990/3239]	Time 0.464 (0.515)	Data 0.001 (0.012)	Loss 3.7993 (4.0036)	Top-1 acc 33.984 (31.137)	Top-5 acc 61.328 (54.601)	lr 0.00009
Warmup Train [39][3000/3239]	Time 0.613 (0.515)	Data 0.001 (0.012)	Loss 3.9285 (4.0035)	Top-1 acc 34.766 (31.139)	Top-5 acc 57.422 (54.603)	lr 0.00009
Warmup Train [39][3010/3239]	Time 0.611 (0.515)	Data 0.001 (0.012)	Loss 4.1171 (4.0033)	Top-1 acc 30.859 (31.142)	Top-5 acc 53.125 (54.606)	lr 0.00009
Warmup Train [39][3020/3239]	Time 0.458 (0.515)	Data 0.001 (0.012)	Loss 4.0303 (4.0033)	Top-1 acc 33.594 (31.141)	Top-5 acc 52.734 (54.606)	lr 0.00009
Warmup Train [39][3030/3239]	Time 0.479 (0.515)	Data 0.003 (0.012)	Loss 3.9101 (4.0031)	Top-1 acc 33.203 (31.144)	Top-5 acc 58.203 (54.609)	lr 0.00009
Warmup Train [39][3040/3239]	Time 0.603 (0.515)	Data 0.001 (0.012)	Loss 3.9621 (4.0030)	Top-1 acc 32.031 (31.147)	Top-5 acc 55.859 (54.613)	lr 0.00009
Warmup Train [39][3050/3239]	Time 0.453 (0.515)	Data 0.001 (0.012)	Loss 4.1609 (4.0031)	Top-1 acc 30.078 (31.147)	Top-5 acc 48.828 (54.611)	lr 0.00009
Warmup Train [39][3060/3239]	Time 0.595 (0.515)	Data 0.001 (0.012)	Loss 4.1975 (4.0032)	Top-1 acc 26.562 (31.146)	Top-5 acc 51.953 (54.606)	lr 0.00009
Warmup Train [39][3070/3239]	Time 0.405 (0.515)	Data 0.001 (0.012)	Loss 4.0088 (4.0032)	Top-1 acc 35.547 (31.147)	Top-5 acc 55.469 (54.604)	lr 0.00009
Warmup Train [39][3080/3239]	Time 0.527 (0.515)	Data 0.001 (0.012)	Loss 3.9981 (4.0033)	Top-1 acc 26.562 (31.145)	Top-5 acc 54.297 (54.603)	lr 0.00008
Warmup Train [39][3090/3239]	Time 0.428 (0.515)	Data 0.001 (0.012)	Loss 3.9502 (4.0033)	Top-1 acc 31.641 (31.144)	Top-5 acc 56.250 (54.603)	lr 0.00008
Warmup Train [39][3100/3239]	Time 0.586 (0.515)	Data 0.001 (0.012)	Loss 3.9342 (4.0030)	Top-1 acc 32.031 (31.149)	Top-5 acc 55.859 (54.607)	lr 0.00008
Warmup Train [39][3110/3239]	Time 0.595 (0.515)	Data 0.001 (0.012)	Loss 3.9553 (4.0032)	Top-1 acc 30.859 (31.143)	Top-5 acc 60.156 (54.607)	lr 0.00008
Warmup Train [39][3120/3239]	Time 0.532 (0.515)	Data 0.001 (0.012)	Loss 4.0778 (4.0032)	Top-1 acc 28.516 (31.146)	Top-5 acc 53.516 (54.605)	lr 0.00008
Warmup Train [39][3130/3239]	Time 0.483 (0.515)	Data 0.001 (0.012)	Loss 4.0816 (4.0032)	Top-1 acc 27.344 (31.147)	Top-5 acc 49.609 (54.606)	lr 0.00008
Warmup Train [39][3140/3239]	Time 0.551 (0.515)	Data 0.001 (0.011)	Loss 4.0139 (4.0032)	Top-1 acc 31.250 (31.150)	Top-5 acc 53.906 (54.608)	lr 0.00008
Warmup Train [39][3150/3239]	Time 0.540 (0.515)	Data 0.001 (0.011)	Loss 3.8213 (4.0030)	Top-1 acc 35.547 (31.153)	Top-5 acc 56.641 (54.610)	lr 0.00008
Warmup Train [39][3160/3239]	Time 0.593 (0.515)	Data 0.001 (0.011)	Loss 4.1425 (4.0030)	Top-1 acc 28.516 (31.148)	Top-5 acc 50.000 (54.609)	lr 0.00008
Warmup Train [39][3170/3239]	Time 0.516 (0.515)	Data 0.001 (0.011)	Loss 4.0726 (4.0031)	Top-1 acc 30.078 (31.148)	Top-5 acc 55.078 (54.604)	lr 0.00008
Warmup Train [39][3180/3239]	Time 0.653 (0.515)	Data 0.000 (0.011)	Loss 3.8906 (4.0031)	Top-1 acc 36.719 (31.148)	Top-5 acc 57.422 (54.603)	lr 0.00008
Warmup Train [39][3190/3239]	Time 0.550 (0.515)	Data 0.000 (0.011)	Loss 3.8946 (4.0031)	Top-1 acc 33.984 (31.148)	Top-5 acc 57.812 (54.605)	lr 0.00008
Warmup Train [39][3200/3239]	Time 0.410 (0.515)	Data 0.000 (0.011)	Loss 3.8816 (4.0031)	Top-1 acc 29.688 (31.145)	Top-5 acc 57.031 (54.604)	lr 0.00008
Warmup Train [39][3210/3239]	Time 0.512 (0.515)	Data 0.000 (0.011)	Loss 4.0046 (4.0030)	Top-1 acc 32.031 (31.146)	Top-5 acc 56.250 (54.602)	lr 0.00008
Warmup Train [39][3220/3239]	Time 0.642 (0.515)	Data 0.000 (0.011)	Loss 3.8460 (4.0030)	Top-1 acc 33.984 (31.147)	Top-5 acc 53.516 (54.598)	lr 0.00008
Warmup Train [39][3230/3239]	Time 0.503 (0.514)	Data 0.000 (0.011)	Loss 4.0026 (4.0029)	Top-1 acc 27.734 (31.149)	Top-5 acc 56.250 (54.599)	lr 0.00008
Warmup Train [39][3239/3239]	Time 0.306 (0.514)	Data 0.000 (0.011)	Loss 4.3740 (4.0030)	Top-1 acc 23.457 (31.149)	Top-5 acc 50.617 (54.596)	lr 0.00008
==========Warmup Valid [39/40]	loss 2.951	top-1 acc 38.457	top-5 acc 63.332	Train top-1 31.149	top-5 54.596	flops: 442.4M
Warmup Train [40][0/3239]	Time 16.017 (16.017)	Data 12.680 (12.680)	Loss 4.0262 (4.0262)	Top-1 acc 28.125 (28.125)	Top-5 acc 52.344 (52.344)	lr 0.00008
Warmup Train [40][10/3239]	Time 0.526 (2.042)	Data 0.001 (1.228)	Loss 3.9775 (3.9862)	Top-1 acc 30.078 (30.895)	Top-5 acc 54.688 (54.652)	lr 0.00008
Warmup Train [40][20/3239]	Time 0.538 (1.312)	Data 0.001 (0.644)	Loss 4.1472 (3.9931)	Top-1 acc 27.734 (30.692)	Top-5 acc 51.172 (54.706)	lr 0.00008
Warmup Train [40][30/3239]	Time 0.391 (1.054)	Data 0.001 (0.437)	Loss 3.9922 (4.0010)	Top-1 acc 32.422 (30.759)	Top-5 acc 52.344 (54.662)	lr 0.00008
Warmup Train [40][40/3239]	Time 0.455 (0.920)	Data 0.001 (0.333)	Loss 4.0193 (3.9990)	Top-1 acc 32.031 (30.983)	Top-5 acc 55.859 (54.878)	lr 0.00008
Warmup Train [40][50/3239]	Time 0.527 (0.844)	Data 0.001 (0.268)	Loss 4.2035 (4.0104)	Top-1 acc 29.297 (30.882)	Top-5 acc 51.172 (54.779)	lr 0.00007
Warmup Train [40][60/3239]	Time 0.575 (0.789)	Data 0.001 (0.225)	Loss 4.0259 (4.0074)	Top-1 acc 30.469 (31.090)	Top-5 acc 53.125 (54.636)	lr 0.00007
Warmup Train [40][70/3239]	Time 0.581 (0.748)	Data 0.001 (0.193)	Loss 3.9247 (4.0011)	Top-1 acc 32.031 (31.322)	Top-5 acc 55.078 (54.616)	lr 0.00007
Warmup Train [40][80/3239]	Time 0.428 (0.718)	Data 0.001 (0.170)	Loss 4.0948 (4.0052)	Top-1 acc 32.422 (31.245)	Top-5 acc 51.172 (54.437)	lr 0.00007
Warmup Train [40][90/3239]	Time 0.354 (0.695)	Data 0.001 (0.152)	Loss 3.9887 (4.0076)	Top-1 acc 34.375 (31.254)	Top-5 acc 54.688 (54.426)	lr 0.00007
Warmup Train [40][100/3239]	Time 0.429 (0.678)	Data 0.001 (0.138)	Loss 3.8064 (4.0061)	Top-1 acc 30.469 (31.157)	Top-5 acc 58.984 (54.583)	lr 0.00007
Warmup Train [40][110/3239]	Time 0.596 (0.662)	Data 0.001 (0.127)	Loss 4.0121 (4.0069)	Top-1 acc 33.984 (31.201)	Top-5 acc 55.859 (54.582)	lr 0.00007
Warmup Train [40][120/3239]	Time 0.531 (0.648)	Data 0.001 (0.117)	Loss 4.0385 (4.0024)	Top-1 acc 31.641 (31.321)	Top-5 acc 54.297 (54.613)	lr 0.00007
Warmup Train [40][130/3239]	Time 0.363 (0.637)	Data 0.001 (0.108)	Loss 3.8331 (4.0007)	Top-1 acc 39.453 (31.345)	Top-5 acc 59.375 (54.607)	lr 0.00007
Warmup Train [40][140/3239]	Time 0.474 (0.628)	Data 0.001 (0.101)	Loss 4.1488 (4.0035)	Top-1 acc 30.859 (31.258)	Top-5 acc 54.297 (54.591)	lr 0.00007
Warmup Train [40][150/3239]	Time 0.381 (0.620)	Data 0.001 (0.095)	Loss 4.0711 (4.0009)	Top-1 acc 33.203 (31.359)	Top-5 acc 57.031 (54.672)	lr 0.00007
Warmup Train [40][160/3239]	Time 0.614 (0.615)	Data 0.001 (0.090)	Loss 3.9142 (3.9969)	Top-1 acc 34.766 (31.490)	Top-5 acc 56.250 (54.794)	lr 0.00007
Warmup Train [40][170/3239]	Time 0.629 (0.609)	Data 0.001 (0.085)	Loss 3.6935 (3.9960)	Top-1 acc 40.625 (31.506)	Top-5 acc 58.984 (54.795)	lr 0.00007
Warmup Train [40][180/3239]	Time 0.489 (0.603)	Data 0.001 (0.080)	Loss 3.7220 (3.9935)	Top-1 acc 32.031 (31.580)	Top-5 acc 57.422 (54.826)	lr 0.00007
Warmup Train [40][190/3239]	Time 0.447 (0.598)	Data 0.001 (0.076)	Loss 4.0929 (3.9955)	Top-1 acc 30.469 (31.589)	Top-5 acc 50.391 (54.790)	lr 0.00007
Warmup Train [40][200/3239]	Time 0.529 (0.594)	Data 0.001 (0.073)	Loss 3.9947 (3.9930)	Top-1 acc 33.203 (31.658)	Top-5 acc 53.516 (54.818)	lr 0.00007
Warmup Train [40][210/3239]	Time 0.521 (0.591)	Data 0.001 (0.070)	Loss 4.0981 (3.9926)	Top-1 acc 30.469 (31.694)	Top-5 acc 51.172 (54.800)	lr 0.00007
Warmup Train [40][220/3239]	Time 0.366 (0.588)	Data 0.001 (0.067)	Loss 4.0015 (3.9905)	Top-1 acc 32.031 (31.775)	Top-5 acc 51.953 (54.896)	lr 0.00007
Warmup Train [40][230/3239]	Time 0.574 (0.586)	Data 0.001 (0.065)	Loss 4.0663 (3.9906)	Top-1 acc 26.953 (31.725)	Top-5 acc 48.438 (54.852)	lr 0.00007
Warmup Train [40][240/3239]	Time 0.611 (0.583)	Data 0.001 (0.062)	Loss 3.8853 (3.9886)	Top-1 acc 34.375 (31.783)	Top-5 acc 57.422 (54.882)	lr 0.00007
Warmup Train [40][250/3239]	Time 0.568 (0.580)	Data 0.001 (0.060)	Loss 4.0195 (3.9915)	Top-1 acc 29.688 (31.680)	Top-5 acc 53.516 (54.818)	lr 0.00007
Warmup Train [40][260/3239]	Time 0.404 (0.578)	Data 0.001 (0.057)	Loss 3.9440 (3.9921)	Top-1 acc 31.641 (31.641)	Top-5 acc 51.562 (54.800)	lr 0.00007
Warmup Train [40][270/3239]	Time 0.752 (0.576)	Data 0.001 (0.056)	Loss 3.9936 (3.9917)	Top-1 acc 34.766 (31.649)	Top-5 acc 53.906 (54.839)	lr 0.00006
Warmup Train [40][280/3239]	Time 0.632 (0.574)	Data 0.001 (0.054)	Loss 4.0333 (3.9931)	Top-1 acc 32.422 (31.611)	Top-5 acc 51.562 (54.810)	lr 0.00006
Warmup Train [40][290/3239]	Time 0.552 (0.571)	Data 0.001 (0.052)	Loss 4.0771 (3.9928)	Top-1 acc 30.078 (31.595)	Top-5 acc 56.250 (54.814)	lr 0.00006
Warmup Train [40][300/3239]	Time 0.519 (0.570)	Data 0.001 (0.050)	Loss 4.0444 (3.9941)	Top-1 acc 35.156 (31.576)	Top-5 acc 55.078 (54.799)	lr 0.00006
Warmup Train [40][310/3239]	Time 0.461 (0.568)	Data 0.001 (0.049)	Loss 3.9416 (3.9919)	Top-1 acc 28.516 (31.603)	Top-5 acc 57.422 (54.843)	lr 0.00006
Warmup Train [40][320/3239]	Time 0.563 (0.567)	Data 0.001 (0.047)	Loss 3.9025 (3.9904)	Top-1 acc 30.078 (31.641)	Top-5 acc 57.031 (54.871)	lr 0.00006
Warmup Train [40][330/3239]	Time 0.635 (0.565)	Data 0.001 (0.046)	Loss 3.7668 (3.9908)	Top-1 acc 33.594 (31.595)	Top-5 acc 60.547 (54.841)	lr 0.00006
Warmup Train [40][340/3239]	Time 0.309 (0.563)	Data 0.001 (0.045)	Loss 3.9936 (3.9916)	Top-1 acc 33.594 (31.558)	Top-5 acc 53.125 (54.802)	lr 0.00006
Warmup Train [40][350/3239]	Time 0.458 (0.561)	Data 0.001 (0.044)	Loss 4.0180 (3.9915)	Top-1 acc 26.953 (31.539)	Top-5 acc 52.734 (54.822)	lr 0.00006
Warmup Train [40][360/3239]	Time 0.612 (0.559)	Data 0.001 (0.043)	Loss 3.9310 (3.9928)	Top-1 acc 31.250 (31.504)	Top-5 acc 53.125 (54.744)	lr 0.00006
Warmup Train [40][370/3239]	Time 0.549 (0.556)	Data 0.001 (0.042)	Loss 4.0778 (3.9936)	Top-1 acc 30.469 (31.470)	Top-5 acc 50.000 (54.694)	lr 0.00006
Warmup Train [40][380/3239]	Time 0.636 (0.555)	Data 0.001 (0.041)	Loss 4.1245 (3.9947)	Top-1 acc 30.078 (31.464)	Top-5 acc 51.953 (54.657)	lr 0.00006
Warmup Train [40][390/3239]	Time 0.451 (0.554)	Data 0.001 (0.040)	Loss 3.9597 (3.9955)	Top-1 acc 34.766 (31.454)	Top-5 acc 57.422 (54.645)	lr 0.00006
Warmup Train [40][400/3239]	Time 0.613 (0.553)	Data 0.001 (0.039)	Loss 3.9704 (3.9947)	Top-1 acc 30.469 (31.473)	Top-5 acc 53.125 (54.676)	lr 0.00006
Warmup Train [40][410/3239]	Time 0.396 (0.553)	Data 0.001 (0.038)	Loss 3.8617 (3.9951)	Top-1 acc 34.375 (31.438)	Top-5 acc 58.594 (54.688)	lr 0.00006
Warmup Train [40][420/3239]	Time 0.367 (0.552)	Data 0.001 (0.038)	Loss 3.9119 (3.9961)	Top-1 acc 32.422 (31.427)	Top-5 acc 53.125 (54.633)	lr 0.00006
Warmup Train [40][430/3239]	Time 0.458 (0.551)	Data 0.001 (0.037)	Loss 3.9898 (3.9968)	Top-1 acc 33.203 (31.423)	Top-5 acc 56.250 (54.638)	lr 0.00006
Warmup Train [40][440/3239]	Time 0.477 (0.550)	Data 0.001 (0.036)	Loss 4.0642 (3.9962)	Top-1 acc 29.297 (31.459)	Top-5 acc 53.906 (54.651)	lr 0.00006
Warmup Train [40][450/3239]	Time 0.396 (0.548)	Data 0.001 (0.035)	Loss 4.0247 (3.9965)	Top-1 acc 30.859 (31.429)	Top-5 acc 52.344 (54.655)	lr 0.00006
Warmup Train [40][460/3239]	Time 0.523 (0.548)	Data 0.001 (0.035)	Loss 3.8086 (3.9966)	Top-1 acc 32.031 (31.400)	Top-5 acc 57.031 (54.652)	lr 0.00006
Warmup Train [40][470/3239]	Time 0.497 (0.547)	Data 0.001 (0.034)	Loss 4.0095 (3.9971)	Top-1 acc 35.156 (31.396)	Top-5 acc 54.297 (54.641)	lr 0.00006
Warmup Train [40][480/3239]	Time 0.545 (0.547)	Data 0.001 (0.034)	Loss 4.1517 (3.9989)	Top-1 acc 28.906 (31.356)	Top-5 acc 52.344 (54.607)	lr 0.00006
Warmup Train [40][490/3239]	Time 0.489 (0.546)	Data 0.001 (0.033)	Loss 3.8961 (3.9981)	Top-1 acc 36.328 (31.369)	Top-5 acc 58.984 (54.613)	lr 0.00006
Warmup Train [40][500/3239]	Time 0.346 (0.545)	Data 0.001 (0.033)	Loss 3.9649 (3.9973)	Top-1 acc 30.078 (31.390)	Top-5 acc 53.516 (54.621)	lr 0.00006
Warmup Train [40][510/3239]	Time 0.515 (0.545)	Data 0.001 (0.033)	Loss 3.9279 (3.9988)	Top-1 acc 32.422 (31.346)	Top-5 acc 56.641 (54.591)	lr 0.00005
Warmup Train [40][520/3239]	Time 0.406 (0.544)	Data 0.001 (0.032)	Loss 4.1396 (3.9988)	Top-1 acc 28.125 (31.334)	Top-5 acc 55.078 (54.616)	lr 0.00005
Warmup Train [40][530/3239]	Time 0.589 (0.544)	Data 0.001 (0.032)	Loss 4.0054 (3.9990)	Top-1 acc 30.859 (31.327)	Top-5 acc 54.688 (54.586)	lr 0.00005
Warmup Train [40][540/3239]	Time 0.334 (0.544)	Data 0.001 (0.031)	Loss 3.8919 (3.9990)	Top-1 acc 32.422 (31.353)	Top-5 acc 54.688 (54.572)	lr 0.00005
Warmup Train [40][550/3239]	Time 0.441 (0.543)	Data 0.001 (0.031)	Loss 3.9878 (3.9990)	Top-1 acc 28.906 (31.346)	Top-5 acc 53.906 (54.561)	lr 0.00005
Warmup Train [40][560/3239]	Time 0.431 (0.543)	Data 0.001 (0.031)	Loss 4.0481 (4.0000)	Top-1 acc 29.688 (31.337)	Top-5 acc 53.516 (54.548)	lr 0.00005
Warmup Train [40][570/3239]	Time 0.480 (0.543)	Data 0.001 (0.030)	Loss 3.9930 (3.9990)	Top-1 acc 32.422 (31.346)	Top-5 acc 55.078 (54.566)	lr 0.00005
Warmup Train [40][580/3239]	Time 0.621 (0.542)	Data 0.001 (0.030)	Loss 3.9920 (3.9994)	Top-1 acc 31.250 (31.325)	Top-5 acc 51.562 (54.540)	lr 0.00005
Warmup Train [40][590/3239]	Time 0.495 (0.541)	Data 0.001 (0.029)	Loss 4.2104 (4.0002)	Top-1 acc 25.781 (31.306)	Top-5 acc 49.609 (54.528)	lr 0.00005
Warmup Train [40][600/3239]	Time 0.572 (0.540)	Data 0.001 (0.029)	Loss 3.8559 (3.9993)	Top-1 acc 33.594 (31.310)	Top-5 acc 57.812 (54.561)	lr 0.00005
Warmup Train [40][610/3239]	Time 0.549 (0.539)	Data 0.002 (0.028)	Loss 3.9463 (3.9989)	Top-1 acc 33.203 (31.310)	Top-5 acc 54.688 (54.578)	lr 0.00005
Warmup Train [40][620/3239]	Time 0.363 (0.537)	Data 0.002 (0.028)	Loss 3.8422 (3.9991)	Top-1 acc 31.641 (31.292)	Top-5 acc 59.766 (54.582)	lr 0.00005
Warmup Train [40][630/3239]	Time 0.442 (0.537)	Data 0.001 (0.028)	Loss 4.0090 (4.0004)	Top-1 acc 32.812 (31.271)	Top-5 acc 50.000 (54.545)	lr 0.00005
Warmup Train [40][640/3239]	Time 0.531 (0.537)	Data 0.001 (0.027)	Loss 3.9614 (4.0009)	Top-1 acc 32.031 (31.255)	Top-5 acc 54.297 (54.531)	lr 0.00005
Warmup Train [40][650/3239]	Time 0.491 (0.537)	Data 0.001 (0.027)	Loss 4.0233 (4.0010)	Top-1 acc 28.125 (31.253)	Top-5 acc 52.344 (54.533)	lr 0.00005
Warmup Train [40][660/3239]	Time 0.337 (0.536)	Data 0.001 (0.027)	Loss 3.9003 (4.0013)	Top-1 acc 33.984 (31.255)	Top-5 acc 58.203 (54.534)	lr 0.00005
Warmup Train [40][670/3239]	Time 0.577 (0.536)	Data 0.001 (0.027)	Loss 4.0365 (4.0017)	Top-1 acc 29.297 (31.250)	Top-5 acc 50.781 (54.525)	lr 0.00005
Warmup Train [40][680/3239]	Time 0.323 (0.535)	Data 0.001 (0.026)	Loss 3.8844 (4.0021)	Top-1 acc 33.984 (31.240)	Top-5 acc 60.547 (54.518)	lr 0.00005
Warmup Train [40][690/3239]	Time 0.345 (0.534)	Data 0.001 (0.026)	Loss 4.1820 (4.0014)	Top-1 acc 28.906 (31.248)	Top-5 acc 50.781 (54.516)	lr 0.00005
Warmup Train [40][700/3239]	Time 0.527 (0.534)	Data 0.001 (0.026)	Loss 3.9395 (4.0007)	Top-1 acc 32.031 (31.266)	Top-5 acc 57.422 (54.527)	lr 0.00005
Warmup Train [40][710/3239]	Time 0.542 (0.534)	Data 0.001 (0.026)	Loss 4.1569 (4.0010)	Top-1 acc 31.250 (31.260)	Top-5 acc 50.391 (54.528)	lr 0.00005
Warmup Train [40][720/3239]	Time 0.351 (0.534)	Data 0.001 (0.025)	Loss 3.8831 (4.0004)	Top-1 acc 35.156 (31.279)	Top-5 acc 58.594 (54.533)	lr 0.00005
Warmup Train [40][730/3239]	Time 0.552 (0.533)	Data 0.001 (0.025)	Loss 4.0677 (4.0013)	Top-1 acc 26.562 (31.253)	Top-5 acc 53.125 (54.518)	lr 0.00005
Warmup Train [40][740/3239]	Time 0.587 (0.533)	Data 0.001 (0.025)	Loss 3.9021 (4.0005)	Top-1 acc 35.547 (31.272)	Top-5 acc 58.203 (54.535)	lr 0.00005
Warmup Train [40][750/3239]	Time 0.502 (0.533)	Data 0.001 (0.025)	Loss 4.0381 (4.0011)	Top-1 acc 30.469 (31.258)	Top-5 acc 55.078 (54.525)	lr 0.00005
Warmup Train [40][760/3239]	Time 0.438 (0.533)	Data 0.001 (0.025)	Loss 3.8827 (4.0013)	Top-1 acc 34.766 (31.268)	Top-5 acc 55.859 (54.515)	lr 0.00005
Warmup Train [40][770/3239]	Time 0.388 (0.532)	Data 0.001 (0.024)	Loss 4.1916 (4.0004)	Top-1 acc 28.906 (31.292)	Top-5 acc 49.609 (54.534)	lr 0.00004
Warmup Train [40][780/3239]	Time 0.719 (0.532)	Data 0.001 (0.024)	Loss 3.8927 (4.0005)	Top-1 acc 31.250 (31.300)	Top-5 acc 55.469 (54.536)	lr 0.00004
Warmup Train [40][790/3239]	Time 0.499 (0.532)	Data 0.001 (0.024)	Loss 4.0222 (4.0002)	Top-1 acc 30.078 (31.296)	Top-5 acc 53.125 (54.553)	lr 0.00004
Warmup Train [40][800/3239]	Time 0.547 (0.532)	Data 0.001 (0.024)	Loss 3.9644 (4.0003)	Top-1 acc 32.422 (31.294)	Top-5 acc 55.859 (54.569)	lr 0.00004
Warmup Train [40][810/3239]	Time 0.551 (0.532)	Data 0.001 (0.023)	Loss 3.9135 (4.0000)	Top-1 acc 33.203 (31.299)	Top-5 acc 57.031 (54.585)	lr 0.00004
Warmup Train [40][820/3239]	Time 0.475 (0.531)	Data 0.002 (0.023)	Loss 4.0864 (3.9993)	Top-1 acc 30.078 (31.319)	Top-5 acc 51.172 (54.602)	lr 0.00004
Warmup Train [40][830/3239]	Time 0.299 (0.531)	Data 0.001 (0.023)	Loss 4.1126 (4.0006)	Top-1 acc 31.250 (31.292)	Top-5 acc 50.000 (54.575)	lr 0.00004
Warmup Train [40][840/3239]	Time 0.551 (0.530)	Data 0.001 (0.023)	Loss 3.8235 (4.0010)	Top-1 acc 41.016 (31.302)	Top-5 acc 60.547 (54.565)	lr 0.00004
Warmup Train [40][850/3239]	Time 0.281 (0.530)	Data 0.001 (0.023)	Loss 3.9602 (4.0012)	Top-1 acc 31.641 (31.300)	Top-5 acc 55.859 (54.569)	lr 0.00004
Warmup Train [40][860/3239]	Time 0.471 (0.529)	Data 0.001 (0.023)	Loss 4.0296 (4.0009)	Top-1 acc 27.344 (31.299)	Top-5 acc 55.078 (54.575)	lr 0.00004
Warmup Train [40][870/3239]	Time 0.376 (0.529)	Data 0.001 (0.023)	Loss 3.9510 (4.0010)	Top-1 acc 35.156 (31.304)	Top-5 acc 56.641 (54.575)	lr 0.00004
Warmup Train [40][880/3239]	Time 0.600 (0.528)	Data 0.001 (0.022)	Loss 4.0292 (4.0013)	Top-1 acc 29.297 (31.295)	Top-5 acc 57.422 (54.570)	lr 0.00004
Warmup Train [40][890/3239]	Time 0.733 (0.528)	Data 0.001 (0.022)	Loss 3.8896 (4.0006)	Top-1 acc 31.641 (31.306)	Top-5 acc 61.328 (54.582)	lr 0.00004
Warmup Train [40][900/3239]	Time 0.502 (0.528)	Data 0.001 (0.022)	Loss 4.1346 (4.0014)	Top-1 acc 30.469 (31.293)	Top-5 acc 48.828 (54.563)	lr 0.00004
Warmup Train [40][910/3239]	Time 0.376 (0.528)	Data 0.001 (0.022)	Loss 3.7285 (4.0013)	Top-1 acc 34.766 (31.296)	Top-5 acc 63.281 (54.570)	lr 0.00004
Warmup Train [40][920/3239]	Time 0.539 (0.528)	Data 0.001 (0.022)	Loss 4.0878 (4.0015)	Top-1 acc 32.031 (31.298)	Top-5 acc 54.297 (54.570)	lr 0.00004
Warmup Train [40][930/3239]	Time 0.408 (0.528)	Data 0.001 (0.022)	Loss 3.9168 (4.0015)	Top-1 acc 30.859 (31.305)	Top-5 acc 57.812 (54.584)	lr 0.00004
Warmup Train [40][940/3239]	Time 0.551 (0.527)	Data 0.001 (0.021)	Loss 3.9179 (4.0015)	Top-1 acc 33.594 (31.290)	Top-5 acc 55.078 (54.579)	lr 0.00004
Warmup Train [40][950/3239]	Time 0.448 (0.527)	Data 0.001 (0.021)	Loss 3.8405 (4.0013)	Top-1 acc 37.891 (31.288)	Top-5 acc 59.766 (54.588)	lr 0.00004
Warmup Train [40][960/3239]	Time 0.517 (0.527)	Data 0.001 (0.021)	Loss 4.3220 (4.0019)	Top-1 acc 26.562 (31.271)	Top-5 acc 46.094 (54.571)	lr 0.00004
Warmup Train [40][970/3239]	Time 0.697 (0.527)	Data 0.001 (0.021)	Loss 4.0018 (4.0022)	Top-1 acc 33.984 (31.272)	Top-5 acc 55.469 (54.562)	lr 0.00004
Warmup Train [40][980/3239]	Time 0.425 (0.527)	Data 0.001 (0.021)	Loss 3.8037 (4.0020)	Top-1 acc 33.594 (31.271)	Top-5 acc 60.938 (54.577)	lr 0.00004
Warmup Train [40][990/3239]	Time 0.481 (0.527)	Data 0.001 (0.021)	Loss 3.6727 (4.0019)	Top-1 acc 40.234 (31.258)	Top-5 acc 62.500 (54.576)	lr 0.00004
Warmup Train [40][1000/3239]	Time 0.609 (0.527)	Data 0.001 (0.021)	Loss 3.9172 (4.0016)	Top-1 acc 29.688 (31.260)	Top-5 acc 57.031 (54.581)	lr 0.00004
Warmup Train [40][1010/3239]	Time 0.550 (0.527)	Data 0.001 (0.020)	Loss 3.9956 (4.0016)	Top-1 acc 28.125 (31.258)	Top-5 acc 57.422 (54.582)	lr 0.00004
Warmup Train [40][1020/3239]	Time 0.360 (0.527)	Data 0.001 (0.020)	Loss 4.1124 (4.0016)	Top-1 acc 32.422 (31.253)	Top-5 acc 53.125 (54.587)	lr 0.00004
Warmup Train [40][1030/3239]	Time 0.597 (0.527)	Data 0.001 (0.020)	Loss 3.9338 (4.0012)	Top-1 acc 33.203 (31.252)	Top-5 acc 57.422 (54.592)	lr 0.00004
Warmup Train [40][1040/3239]	Time 0.580 (0.527)	Data 0.001 (0.020)	Loss 3.7914 (4.0004)	Top-1 acc 37.109 (31.263)	Top-5 acc 59.375 (54.608)	lr 0.00004
Warmup Train [40][1050/3239]	Time 0.621 (0.527)	Data 0.001 (0.020)	Loss 3.8949 (4.0003)	Top-1 acc 33.203 (31.266)	Top-5 acc 56.641 (54.617)	lr 0.00004
Warmup Train [40][1060/3239]	Time 0.592 (0.527)	Data 0.001 (0.020)	Loss 4.0490 (4.0006)	Top-1 acc 28.906 (31.259)	Top-5 acc 55.469 (54.612)	lr 0.00003
Warmup Train [40][1070/3239]	Time 0.613 (0.527)	Data 0.001 (0.020)	Loss 4.0296 (4.0006)	Top-1 acc 33.984 (31.263)	Top-5 acc 57.422 (54.609)	lr 0.00003
Warmup Train [40][1080/3239]	Time 0.499 (0.526)	Data 0.001 (0.019)	Loss 4.1258 (4.0008)	Top-1 acc 29.297 (31.257)	Top-5 acc 51.172 (54.600)	lr 0.00003
Warmup Train [40][1090/3239]	Time 0.497 (0.526)	Data 0.001 (0.019)	Loss 4.1123 (4.0009)	Top-1 acc 30.859 (31.253)	Top-5 acc 50.000 (54.598)	lr 0.00003
Warmup Train [40][1100/3239]	Time 0.221 (0.526)	Data 0.001 (0.019)	Loss 4.0665 (4.0005)	Top-1 acc 31.641 (31.258)	Top-5 acc 53.125 (54.607)	lr 0.00003
Warmup Train [40][1110/3239]	Time 0.559 (0.525)	Data 0.001 (0.019)	Loss 3.9645 (4.0005)	Top-1 acc 32.422 (31.256)	Top-5 acc 52.734 (54.600)	lr 0.00003
Warmup Train [40][1120/3239]	Time 0.390 (0.525)	Data 0.001 (0.019)	Loss 4.0450 (4.0012)	Top-1 acc 27.344 (31.237)	Top-5 acc 54.297 (54.592)	lr 0.00003
Warmup Train [40][1130/3239]	Time 0.250 (0.525)	Data 0.001 (0.019)	Loss 4.0794 (4.0010)	Top-1 acc 31.250 (31.255)	Top-5 acc 51.562 (54.594)	lr 0.00003
Warmup Train [40][1140/3239]	Time 0.505 (0.524)	Data 0.001 (0.019)	Loss 4.0008 (4.0007)	Top-1 acc 31.641 (31.264)	Top-5 acc 51.562 (54.602)	lr 0.00003
Warmup Train [40][1150/3239]	Time 0.494 (0.524)	Data 0.001 (0.019)	Loss 4.0746 (4.0011)	Top-1 acc 29.688 (31.253)	Top-5 acc 52.344 (54.588)	lr 0.00003
Warmup Train [40][1160/3239]	Time 0.669 (0.524)	Data 0.001 (0.019)	Loss 3.9037 (4.0007)	Top-1 acc 31.250 (31.261)	Top-5 acc 57.812 (54.597)	lr 0.00003
Warmup Train [40][1170/3239]	Time 0.348 (0.524)	Data 0.001 (0.018)	Loss 3.8222 (4.0003)	Top-1 acc 36.328 (31.273)	Top-5 acc 58.594 (54.612)	lr 0.00003
Warmup Train [40][1180/3239]	Time 0.510 (0.524)	Data 0.001 (0.018)	Loss 4.0422 (4.0003)	Top-1 acc 28.125 (31.271)	Top-5 acc 55.078 (54.612)	lr 0.00003
Warmup Train [40][1190/3239]	Time 0.550 (0.524)	Data 0.001 (0.018)	Loss 4.1392 (4.0009)	Top-1 acc 27.734 (31.266)	Top-5 acc 50.781 (54.592)	lr 0.00003
Warmup Train [40][1200/3239]	Time 0.464 (0.524)	Data 0.001 (0.018)	Loss 4.0304 (4.0001)	Top-1 acc 32.422 (31.273)	Top-5 acc 55.078 (54.608)	lr 0.00003
Warmup Train [40][1210/3239]	Time 0.635 (0.524)	Data 0.001 (0.018)	Loss 3.9539 (3.9998)	Top-1 acc 30.859 (31.276)	Top-5 acc 58.203 (54.621)	lr 0.00003
Warmup Train [40][1220/3239]	Time 0.433 (0.523)	Data 0.001 (0.018)	Loss 4.0157 (3.9998)	Top-1 acc 31.641 (31.280)	Top-5 acc 54.297 (54.620)	lr 0.00003
Warmup Train [40][1230/3239]	Time 0.673 (0.523)	Data 0.001 (0.018)	Loss 3.8000 (4.0004)	Top-1 acc 34.375 (31.272)	Top-5 acc 59.375 (54.611)	lr 0.00003
Warmup Train [40][1240/3239]	Time 0.382 (0.523)	Data 0.001 (0.018)	Loss 4.0718 (4.0003)	Top-1 acc 30.859 (31.274)	Top-5 acc 55.859 (54.614)	lr 0.00003
Warmup Train [40][1250/3239]	Time 0.528 (0.523)	Data 0.001 (0.018)	Loss 3.9012 (4.0004)	Top-1 acc 34.375 (31.262)	Top-5 acc 57.422 (54.619)	lr 0.00003
Warmup Train [40][1260/3239]	Time 0.590 (0.523)	Data 0.001 (0.018)	Loss 4.0128 (4.0005)	Top-1 acc 30.859 (31.261)	Top-5 acc 53.516 (54.614)	lr 0.00003
Warmup Train [40][1270/3239]	Time 0.537 (0.523)	Data 0.001 (0.018)	Loss 3.9305 (4.0007)	Top-1 acc 34.375 (31.254)	Top-5 acc 57.031 (54.608)	lr 0.00003
Warmup Train [40][1280/3239]	Time 0.485 (0.523)	Data 0.001 (0.017)	Loss 3.9538 (4.0006)	Top-1 acc 30.859 (31.256)	Top-5 acc 58.594 (54.613)	lr 0.00003
Warmup Train [40][1290/3239]	Time 0.467 (0.523)	Data 0.001 (0.017)	Loss 3.9629 (4.0004)	Top-1 acc 33.984 (31.261)	Top-5 acc 56.250 (54.622)	lr 0.00003
Warmup Train [40][1300/3239]	Time 0.599 (0.523)	Data 0.001 (0.017)	Loss 3.7917 (4.0007)	Top-1 acc 39.844 (31.259)	Top-5 acc 61.328 (54.614)	lr 0.00003
Warmup Train [40][1310/3239]	Time 0.663 (0.523)	Data 0.001 (0.017)	Loss 4.1416 (4.0006)	Top-1 acc 30.469 (31.258)	Top-5 acc 51.953 (54.620)	lr 0.00003
Warmup Train [40][1320/3239]	Time 0.565 (0.523)	Data 0.001 (0.017)	Loss 4.0798 (4.0012)	Top-1 acc 28.906 (31.248)	Top-5 acc 52.344 (54.610)	lr 0.00003
Warmup Train [40][1330/3239]	Time 0.658 (0.523)	Data 0.001 (0.017)	Loss 3.9327 (4.0011)	Top-1 acc 30.469 (31.259)	Top-5 acc 51.562 (54.611)	lr 0.00003
Warmup Train [40][1340/3239]	Time 0.761 (0.523)	Data 0.001 (0.017)	Loss 3.9016 (4.0009)	Top-1 acc 35.547 (31.262)	Top-5 acc 58.203 (54.619)	lr 0.00003
Warmup Train [40][1350/3239]	Time 0.521 (0.523)	Data 0.001 (0.017)	Loss 4.2533 (4.0013)	Top-1 acc 25.391 (31.256)	Top-5 acc 47.656 (54.607)	lr 0.00003
Warmup Train [40][1360/3239]	Time 0.364 (0.522)	Data 0.001 (0.017)	Loss 3.9453 (4.0012)	Top-1 acc 33.203 (31.261)	Top-5 acc 53.906 (54.604)	lr 0.00003
Warmup Train [40][1370/3239]	Time 0.430 (0.522)	Data 0.001 (0.017)	Loss 4.0298 (4.0013)	Top-1 acc 27.734 (31.253)	Top-5 acc 56.250 (54.603)	lr 0.00003
Warmup Train [40][1380/3239]	Time 0.538 (0.522)	Data 0.001 (0.016)	Loss 3.9896 (4.0008)	Top-1 acc 29.688 (31.260)	Top-5 acc 53.125 (54.614)	lr 0.00003
Warmup Train [40][1390/3239]	Time 0.379 (0.522)	Data 0.001 (0.016)	Loss 4.2587 (4.0013)	Top-1 acc 25.781 (31.244)	Top-5 acc 49.609 (54.602)	lr 0.00003
Warmup Train [40][1400/3239]	Time 0.498 (0.521)	Data 0.001 (0.016)	Loss 3.8945 (4.0012)	Top-1 acc 33.594 (31.242)	Top-5 acc 57.031 (54.607)	lr 0.00002
Warmup Train [40][1410/3239]	Time 0.564 (0.521)	Data 0.001 (0.016)	Loss 3.8526 (4.0008)	Top-1 acc 38.281 (31.255)	Top-5 acc 59.766 (54.617)	lr 0.00002
Warmup Train [40][1420/3239]	Time 0.602 (0.521)	Data 0.001 (0.016)	Loss 4.0318 (4.0014)	Top-1 acc 30.469 (31.250)	Top-5 acc 51.562 (54.613)	lr 0.00002
Warmup Train [40][1430/3239]	Time 0.560 (0.521)	Data 0.001 (0.016)	Loss 4.0338 (4.0014)	Top-1 acc 32.422 (31.246)	Top-5 acc 54.297 (54.609)	lr 0.00002
Warmup Train [40][1440/3239]	Time 0.454 (0.521)	Data 0.001 (0.016)	Loss 4.2219 (4.0017)	Top-1 acc 26.172 (31.239)	Top-5 acc 47.656 (54.604)	lr 0.00002
Warmup Train [40][1450/3239]	Time 0.609 (0.521)	Data 0.001 (0.016)	Loss 3.9647 (4.0022)	Top-1 acc 29.297 (31.226)	Top-5 acc 57.422 (54.601)	lr 0.00002
Warmup Train [40][1460/3239]	Time 0.522 (0.521)	Data 0.001 (0.016)	Loss 3.8421 (4.0024)	Top-1 acc 30.078 (31.210)	Top-5 acc 57.812 (54.593)	lr 0.00002
Warmup Train [40][1470/3239]	Time 0.614 (0.521)	Data 0.001 (0.016)	Loss 3.9284 (4.0025)	Top-1 acc 32.422 (31.209)	Top-5 acc 54.688 (54.585)	lr 0.00002
Warmup Train [40][1480/3239]	Time 0.516 (0.521)	Data 0.001 (0.016)	Loss 3.9390 (4.0026)	Top-1 acc 30.469 (31.206)	Top-5 acc 54.688 (54.585)	lr 0.00002
Warmup Train [40][1490/3239]	Time 0.560 (0.521)	Data 0.001 (0.016)	Loss 4.0377 (4.0030)	Top-1 acc 33.203 (31.202)	Top-5 acc 55.469 (54.577)	lr 0.00002
Warmup Train [40][1500/3239]	Time 0.480 (0.521)	Data 0.001 (0.015)	Loss 4.2115 (4.0031)	Top-1 acc 32.422 (31.204)	Top-5 acc 53.906 (54.577)	lr 0.00002
Warmup Train [40][1510/3239]	Time 0.521 (0.521)	Data 0.001 (0.015)	Loss 4.0768 (4.0031)	Top-1 acc 32.812 (31.208)	Top-5 acc 52.734 (54.572)	lr 0.00002
Warmup Train [40][1520/3239]	Time 0.385 (0.521)	Data 0.001 (0.015)	Loss 4.0377 (4.0032)	Top-1 acc 32.812 (31.210)	Top-5 acc 55.859 (54.575)	lr 0.00002
Warmup Train [40][1530/3239]	Time 0.755 (0.521)	Data 0.001 (0.015)	Loss 4.2204 (4.0028)	Top-1 acc 25.781 (31.211)	Top-5 acc 46.875 (54.580)	lr 0.00002
Warmup Train [40][1540/3239]	Time 0.477 (0.521)	Data 0.001 (0.015)	Loss 3.9122 (4.0026)	Top-1 acc 33.203 (31.219)	Top-5 acc 53.125 (54.580)	lr 0.00002
Warmup Train [40][1550/3239]	Time 0.699 (0.521)	Data 0.001 (0.015)	Loss 4.0304 (4.0025)	Top-1 acc 35.938 (31.225)	Top-5 acc 51.953 (54.573)	lr 0.00002
Warmup Train [40][1560/3239]	Time 0.516 (0.521)	Data 0.001 (0.015)	Loss 4.0907 (4.0023)	Top-1 acc 30.078 (31.230)	Top-5 acc 50.391 (54.579)	lr 0.00002
Warmup Train [40][1570/3239]	Time 0.636 (0.521)	Data 0.001 (0.015)	Loss 4.1339 (4.0024)	Top-1 acc 30.859 (31.228)	Top-5 acc 55.078 (54.582)	lr 0.00002
Warmup Train [40][1580/3239]	Time 0.398 (0.521)	Data 0.001 (0.015)	Loss 3.8776 (4.0021)	Top-1 acc 36.719 (31.231)	Top-5 acc 60.547 (54.587)	lr 0.00002
Warmup Train [40][1590/3239]	Time 0.546 (0.521)	Data 0.001 (0.015)	Loss 3.9377 (4.0021)	Top-1 acc 33.203 (31.233)	Top-5 acc 53.906 (54.587)	lr 0.00002
Warmup Train [40][1600/3239]	Time 0.533 (0.521)	Data 0.001 (0.015)	Loss 4.1898 (4.0021)	Top-1 acc 28.516 (31.242)	Top-5 acc 47.266 (54.586)	lr 0.00002
Warmup Train [40][1610/3239]	Time 0.571 (0.520)	Data 0.001 (0.015)	Loss 4.2705 (4.0024)	Top-1 acc 25.000 (31.239)	Top-5 acc 47.266 (54.577)	lr 0.00002
Warmup Train [40][1620/3239]	Time 0.549 (0.520)	Data 0.001 (0.015)	Loss 4.1353 (4.0021)	Top-1 acc 30.859 (31.249)	Top-5 acc 49.219 (54.583)	lr 0.00002
Warmup Train [40][1630/3239]	Time 0.694 (0.520)	Data 0.001 (0.015)	Loss 3.9073 (4.0019)	Top-1 acc 34.375 (31.257)	Top-5 acc 60.547 (54.596)	lr 0.00002
Warmup Train [40][1640/3239]	Time 0.479 (0.520)	Data 0.001 (0.015)	Loss 3.8510 (4.0019)	Top-1 acc 34.766 (31.262)	Top-5 acc 60.938 (54.603)	lr 0.00002
Warmup Train [40][1650/3239]	Time 0.383 (0.520)	Data 0.001 (0.015)	Loss 4.1624 (4.0020)	Top-1 acc 25.391 (31.258)	Top-5 acc 51.953 (54.603)	lr 0.00002
Warmup Train [40][1660/3239]	Time 0.513 (0.520)	Data 0.001 (0.014)	Loss 3.8562 (4.0017)	Top-1 acc 33.594 (31.265)	Top-5 acc 59.375 (54.609)	lr 0.00002
Warmup Train [40][1670/3239]	Time 0.565 (0.519)	Data 0.001 (0.014)	Loss 4.1468 (4.0018)	Top-1 acc 30.859 (31.263)	Top-5 acc 48.438 (54.606)	lr 0.00002
Warmup Train [40][1680/3239]	Time 0.501 (0.519)	Data 0.001 (0.014)	Loss 3.9886 (4.0019)	Top-1 acc 31.641 (31.259)	Top-5 acc 53.516 (54.601)	lr 0.00002
Warmup Train [40][1690/3239]	Time 0.534 (0.519)	Data 0.001 (0.014)	Loss 3.9997 (4.0017)	Top-1 acc 32.031 (31.263)	Top-5 acc 53.516 (54.611)	lr 0.00002
Warmup Train [40][1700/3239]	Time 0.482 (0.519)	Data 0.001 (0.014)	Loss 4.0932 (4.0015)	Top-1 acc 28.125 (31.263)	Top-5 acc 52.734 (54.610)	lr 0.00002
Warmup Train [40][1710/3239]	Time 0.416 (0.519)	Data 0.001 (0.014)	Loss 4.0692 (4.0017)	Top-1 acc 27.344 (31.263)	Top-5 acc 53.516 (54.608)	lr 0.00002
Warmup Train [40][1720/3239]	Time 0.605 (0.519)	Data 0.001 (0.014)	Loss 3.9594 (4.0017)	Top-1 acc 31.641 (31.264)	Top-5 acc 56.641 (54.602)	lr 0.00002
Warmup Train [40][1730/3239]	Time 0.318 (0.519)	Data 0.001 (0.014)	Loss 4.2066 (4.0018)	Top-1 acc 25.391 (31.260)	Top-5 acc 49.219 (54.601)	lr 0.00002
Warmup Train [40][1740/3239]	Time 0.375 (0.519)	Data 0.002 (0.014)	Loss 4.1390 (4.0017)	Top-1 acc 26.953 (31.261)	Top-5 acc 50.000 (54.603)	lr 0.00002
Warmup Train [40][1750/3239]	Time 0.653 (0.519)	Data 0.001 (0.014)	Loss 4.1651 (4.0017)	Top-1 acc 29.688 (31.257)	Top-5 acc 52.344 (54.600)	lr 0.00002
Warmup Train [40][1760/3239]	Time 0.419 (0.519)	Data 0.001 (0.014)	Loss 3.9302 (4.0017)	Top-1 acc 34.375 (31.253)	Top-5 acc 56.250 (54.601)	lr 0.00002
Warmup Train [40][1770/3239]	Time 0.652 (0.519)	Data 0.001 (0.014)	Loss 3.9901 (4.0015)	Top-1 acc 31.250 (31.250)	Top-5 acc 55.859 (54.608)	lr 0.00002
Warmup Train [40][1780/3239]	Time 0.658 (0.519)	Data 0.001 (0.014)	Loss 3.8223 (4.0013)	Top-1 acc 35.547 (31.250)	Top-5 acc 56.641 (54.612)	lr 0.00002
Warmup Train [40][1790/3239]	Time 0.483 (0.519)	Data 0.001 (0.014)	Loss 3.9916 (4.0012)	Top-1 acc 30.469 (31.249)	Top-5 acc 58.594 (54.616)	lr 0.00002
Warmup Train [40][1800/3239]	Time 0.598 (0.519)	Data 0.001 (0.014)	Loss 3.7803 (4.0010)	Top-1 acc 40.234 (31.253)	Top-5 acc 60.156 (54.620)	lr 0.00002
Warmup Train [40][1810/3239]	Time 0.399 (0.519)	Data 0.001 (0.014)	Loss 3.9330 (4.0008)	Top-1 acc 33.984 (31.256)	Top-5 acc 53.125 (54.621)	lr 0.00002
Warmup Train [40][1820/3239]	Time 0.595 (0.519)	Data 0.001 (0.014)	Loss 3.9013 (4.0007)	Top-1 acc 35.547 (31.261)	Top-5 acc 57.812 (54.631)	lr 0.00001
Warmup Train [40][1830/3239]	Time 0.413 (0.519)	Data 0.001 (0.014)	Loss 4.1550 (4.0009)	Top-1 acc 21.484 (31.251)	Top-5 acc 51.953 (54.628)	lr 0.00001
Warmup Train [40][1840/3239]	Time 0.324 (0.518)	Data 0.001 (0.014)	Loss 3.9486 (4.0007)	Top-1 acc 32.812 (31.257)	Top-5 acc 57.031 (54.634)	lr 0.00001
Warmup Train [40][1850/3239]	Time 0.664 (0.518)	Data 0.001 (0.014)	Loss 3.9450 (4.0005)	Top-1 acc 30.859 (31.261)	Top-5 acc 55.859 (54.644)	lr 0.00001
Warmup Train [40][1860/3239]	Time 0.445 (0.518)	Data 0.001 (0.014)	Loss 3.8845 (4.0005)	Top-1 acc 34.375 (31.262)	Top-5 acc 55.859 (54.644)	lr 0.00001
Warmup Train [40][1870/3239]	Time 0.525 (0.518)	Data 0.001 (0.014)	Loss 3.8837 (4.0006)	Top-1 acc 35.547 (31.258)	Top-5 acc 56.641 (54.641)	lr 0.00001
Warmup Train [40][1880/3239]	Time 0.610 (0.518)	Data 0.001 (0.014)	Loss 4.0622 (4.0005)	Top-1 acc 30.078 (31.259)	Top-5 acc 51.953 (54.641)	lr 0.00001
Warmup Train [40][1890/3239]	Time 0.328 (0.518)	Data 0.001 (0.014)	Loss 4.1042 (4.0003)	Top-1 acc 27.344 (31.258)	Top-5 acc 52.344 (54.644)	lr 0.00001
Warmup Train [40][1900/3239]	Time 0.543 (0.518)	Data 0.001 (0.014)	Loss 3.9363 (4.0005)	Top-1 acc 37.109 (31.254)	Top-5 acc 57.422 (54.643)	lr 0.00001
Warmup Train [40][1910/3239]	Time 0.549 (0.518)	Data 0.001 (0.014)	Loss 3.8724 (4.0001)	Top-1 acc 32.422 (31.262)	Top-5 acc 59.375 (54.649)	lr 0.00001
Warmup Train [40][1920/3239]	Time 0.427 (0.518)	Data 0.001 (0.013)	Loss 3.9866 (4.0002)	Top-1 acc 27.344 (31.256)	Top-5 acc 54.688 (54.647)	lr 0.00001
Warmup Train [40][1930/3239]	Time 0.721 (0.518)	Data 0.001 (0.013)	Loss 4.0275 (4.0002)	Top-1 acc 30.078 (31.256)	Top-5 acc 54.688 (54.648)	lr 0.00001
Warmup Train [40][1940/3239]	Time 0.535 (0.518)	Data 0.001 (0.013)	Loss 3.9104 (4.0004)	Top-1 acc 32.031 (31.253)	Top-5 acc 57.812 (54.645)	lr 0.00001
Warmup Train [40][1950/3239]	Time 0.653 (0.518)	Data 0.001 (0.013)	Loss 4.0055 (4.0005)	Top-1 acc 31.641 (31.252)	Top-5 acc 54.297 (54.644)	lr 0.00001
Warmup Train [40][1960/3239]	Time 0.557 (0.518)	Data 0.001 (0.013)	Loss 4.0182 (4.0006)	Top-1 acc 32.422 (31.247)	Top-5 acc 56.250 (54.646)	lr 0.00001
Warmup Train [40][1970/3239]	Time 0.571 (0.518)	Data 0.001 (0.013)	Loss 4.0922 (4.0006)	Top-1 acc 31.250 (31.245)	Top-5 acc 52.344 (54.644)	lr 0.00001
Warmup Train [40][1980/3239]	Time 0.655 (0.518)	Data 0.001 (0.013)	Loss 3.9159 (4.0005)	Top-1 acc 31.250 (31.253)	Top-5 acc 57.812 (54.651)	lr 0.00001
Warmup Train [40][1990/3239]	Time 0.556 (0.518)	Data 0.001 (0.013)	Loss 3.9622 (4.0003)	Top-1 acc 33.594 (31.258)	Top-5 acc 53.906 (54.652)	lr 0.00001
Warmup Train [40][2000/3239]	Time 0.712 (0.518)	Data 0.001 (0.013)	Loss 4.1074 (4.0001)	Top-1 acc 31.250 (31.265)	Top-5 acc 52.734 (54.661)	lr 0.00001
Warmup Train [40][2010/3239]	Time 0.520 (0.518)	Data 0.001 (0.013)	Loss 4.0573 (3.9998)	Top-1 acc 30.078 (31.274)	Top-5 acc 56.641 (54.670)	lr 0.00001
Warmup Train [40][2020/3239]	Time 0.386 (0.518)	Data 0.001 (0.013)	Loss 3.9444 (3.9998)	Top-1 acc 35.156 (31.274)	Top-5 acc 55.469 (54.665)	lr 0.00001
Warmup Train [40][2030/3239]	Time 0.509 (0.518)	Data 0.001 (0.013)	Loss 3.9537 (3.9998)	Top-1 acc 30.078 (31.272)	Top-5 acc 56.250 (54.662)	lr 0.00001
Warmup Train [40][2040/3239]	Time 0.379 (0.518)	Data 0.001 (0.013)	Loss 4.2716 (3.9997)	Top-1 acc 27.344 (31.278)	Top-5 acc 49.609 (54.663)	lr 0.00001
Warmup Train [40][2050/3239]	Time 0.572 (0.518)	Data 0.001 (0.013)	Loss 3.9453 (3.9996)	Top-1 acc 30.469 (31.278)	Top-5 acc 56.250 (54.671)	lr 0.00001
Warmup Train [40][2060/3239]	Time 0.509 (0.518)	Data 0.001 (0.013)	Loss 4.2459 (3.9998)	Top-1 acc 29.297 (31.280)	Top-5 acc 45.312 (54.663)	lr 0.00001
Warmup Train [40][2070/3239]	Time 0.588 (0.518)	Data 0.001 (0.013)	Loss 4.1290 (4.0000)	Top-1 acc 29.297 (31.283)	Top-5 acc 53.906 (54.655)	lr 0.00001
Warmup Train [40][2080/3239]	Time 0.486 (0.518)	Data 0.001 (0.013)	Loss 4.0162 (4.0002)	Top-1 acc 32.812 (31.277)	Top-5 acc 55.859 (54.650)	lr 0.00001
Warmup Train [40][2090/3239]	Time 0.557 (0.518)	Data 0.001 (0.013)	Loss 3.9642 (4.0002)	Top-1 acc 26.172 (31.274)	Top-5 acc 54.297 (54.649)	lr 0.00001
Warmup Train [40][2100/3239]	Time 0.493 (0.518)	Data 0.001 (0.013)	Loss 3.6304 (4.0003)	Top-1 acc 37.109 (31.272)	Top-5 acc 62.109 (54.648)	lr 0.00001
Warmup Train [40][2110/3239]	Time 0.526 (0.517)	Data 0.001 (0.013)	Loss 4.1925 (4.0003)	Top-1 acc 28.906 (31.267)	Top-5 acc 49.219 (54.643)	lr 0.00001
Warmup Train [40][2120/3239]	Time 0.565 (0.517)	Data 0.002 (0.013)	Loss 3.9057 (4.0004)	Top-1 acc 33.203 (31.262)	Top-5 acc 58.203 (54.644)	lr 0.00001
Warmup Train [40][2130/3239]	Time 0.494 (0.517)	Data 0.001 (0.013)	Loss 3.9303 (4.0004)	Top-1 acc 33.203 (31.267)	Top-5 acc 57.812 (54.639)	lr 0.00001
Warmup Train [40][2140/3239]	Time 0.519 (0.517)	Data 0.001 (0.013)	Loss 4.1282 (4.0005)	Top-1 acc 28.906 (31.266)	Top-5 acc 51.172 (54.640)	lr 0.00001
Warmup Train [40][2150/3239]	Time 0.545 (0.517)	Data 0.001 (0.013)	Loss 3.9547 (4.0006)	Top-1 acc 31.641 (31.263)	Top-5 acc 51.953 (54.631)	lr 0.00001
Warmup Train [40][2160/3239]	Time 0.591 (0.517)	Data 0.001 (0.013)	Loss 3.8724 (4.0005)	Top-1 acc 33.984 (31.269)	Top-5 acc 55.859 (54.632)	lr 0.00001
Warmup Train [40][2170/3239]	Time 0.388 (0.517)	Data 0.001 (0.012)	Loss 4.0904 (4.0005)	Top-1 acc 28.516 (31.266)	Top-5 acc 52.734 (54.631)	lr 0.00001
Warmup Train [40][2180/3239]	Time 0.625 (0.517)	Data 0.001 (0.012)	Loss 4.0266 (4.0007)	Top-1 acc 30.469 (31.256)	Top-5 acc 54.688 (54.623)	lr 0.00001
Warmup Train [40][2190/3239]	Time 0.628 (0.517)	Data 0.001 (0.012)	Loss 4.0504 (4.0010)	Top-1 acc 26.562 (31.250)	Top-5 acc 54.297 (54.616)	lr 0.00001
Warmup Train [40][2200/3239]	Time 0.518 (0.517)	Data 0.001 (0.012)	Loss 4.0394 (4.0011)	Top-1 acc 32.031 (31.251)	Top-5 acc 54.688 (54.618)	lr 0.00001
Warmup Train [40][2210/3239]	Time 0.548 (0.517)	Data 0.001 (0.012)	Loss 3.9901 (4.0009)	Top-1 acc 35.547 (31.258)	Top-5 acc 57.812 (54.625)	lr 0.00001
Warmup Train [40][2220/3239]	Time 0.475 (0.517)	Data 0.001 (0.012)	Loss 3.9689 (4.0008)	Top-1 acc 30.469 (31.263)	Top-5 acc 56.250 (54.626)	lr 0.00001
Warmup Train [40][2230/3239]	Time 0.451 (0.517)	Data 0.001 (0.012)	Loss 3.9363 (4.0010)	Top-1 acc 32.422 (31.260)	Top-5 acc 56.641 (54.623)	lr 0.00001
Warmup Train [40][2240/3239]	Time 0.434 (0.517)	Data 0.001 (0.012)	Loss 4.0263 (4.0008)	Top-1 acc 33.203 (31.268)	Top-5 acc 53.125 (54.626)	lr 0.00001
Warmup Train [40][2250/3239]	Time 0.526 (0.517)	Data 0.001 (0.012)	Loss 4.0289 (4.0007)	Top-1 acc 29.297 (31.268)	Top-5 acc 55.469 (54.630)	lr 0.00001
Warmup Train [40][2260/3239]	Time 0.527 (0.517)	Data 0.001 (0.012)	Loss 4.3222 (4.0008)	Top-1 acc 25.781 (31.260)	Top-5 acc 46.484 (54.626)	lr 0.00001
Warmup Train [40][2270/3239]	Time 0.513 (0.517)	Data 0.001 (0.012)	Loss 3.8815 (4.0008)	Top-1 acc 34.375 (31.265)	Top-5 acc 60.547 (54.626)	lr 0.00001
Warmup Train [40][2280/3239]	Time 0.499 (0.517)	Data 0.001 (0.012)	Loss 4.1326 (4.0007)	Top-1 acc 26.562 (31.264)	Top-5 acc 52.344 (54.626)	lr 0.00001
Warmup Train [40][2290/3239]	Time 0.463 (0.517)	Data 0.001 (0.012)	Loss 3.9930 (4.0008)	Top-1 acc 30.859 (31.266)	Top-5 acc 55.859 (54.627)	lr 0.00001
Warmup Train [40][2300/3239]	Time 0.631 (0.517)	Data 0.001 (0.012)	Loss 3.8223 (4.0007)	Top-1 acc 33.203 (31.268)	Top-5 acc 60.547 (54.629)	lr 0.00001
Warmup Train [40][2310/3239]	Time 0.514 (0.517)	Data 0.001 (0.012)	Loss 4.0178 (4.0008)	Top-1 acc 31.641 (31.269)	Top-5 acc 56.250 (54.630)	lr 0.00001
Warmup Train [40][2320/3239]	Time 0.491 (0.517)	Data 0.001 (0.012)	Loss 3.8265 (4.0004)	Top-1 acc 32.812 (31.276)	Top-5 acc 56.250 (54.639)	lr 0.00001
Warmup Train [40][2330/3239]	Time 0.451 (0.517)	Data 0.001 (0.012)	Loss 4.0515 (4.0004)	Top-1 acc 27.734 (31.277)	Top-5 acc 50.000 (54.638)	lr 0.00001
Warmup Train [40][2340/3239]	Time 0.507 (0.517)	Data 0.001 (0.012)	Loss 3.7427 (4.0001)	Top-1 acc 37.500 (31.281)	Top-5 acc 58.594 (54.640)	lr 0.00001
Warmup Train [40][2350/3239]	Time 0.412 (0.517)	Data 0.001 (0.012)	Loss 3.7127 (3.9999)	Top-1 acc 30.859 (31.281)	Top-5 acc 57.422 (54.643)	lr 0.00001
Warmup Train [40][2360/3239]	Time 0.646 (0.517)	Data 0.001 (0.012)	Loss 3.7737 (3.9996)	Top-1 acc 35.156 (31.280)	Top-5 acc 60.156 (54.651)	lr 0.00001
Warmup Train [40][2370/3239]	Time 0.491 (0.517)	Data 0.001 (0.012)	Loss 4.0517 (3.9995)	Top-1 acc 29.688 (31.272)	Top-5 acc 53.125 (54.654)	lr 0.00001
Warmup Train [40][2380/3239]	Time 0.514 (0.516)	Data 0.001 (0.012)	Loss 3.9559 (3.9994)	Top-1 acc 30.859 (31.276)	Top-5 acc 53.906 (54.660)	lr 0.00001
Warmup Train [40][2390/3239]	Time 0.349 (0.516)	Data 0.001 (0.012)	Loss 3.9128 (3.9995)	Top-1 acc 29.297 (31.271)	Top-5 acc 52.344 (54.655)	lr 0.00001
Warmup Train [40][2400/3239]	Time 0.515 (0.516)	Data 0.001 (0.012)	Loss 4.0179 (3.9999)	Top-1 acc 31.250 (31.266)	Top-5 acc 55.859 (54.646)	lr 0.00001
Warmup Train [40][2410/3239]	Time 0.444 (0.516)	Data 0.001 (0.012)	Loss 3.8578 (3.9998)	Top-1 acc 33.203 (31.265)	Top-5 acc 57.031 (54.646)	lr 0.00001
Warmup Train [40][2420/3239]	Time 0.503 (0.516)	Data 0.001 (0.012)	Loss 4.0728 (3.9999)	Top-1 acc 29.297 (31.264)	Top-5 acc 51.562 (54.639)	lr 0.00000
Warmup Train [40][2430/3239]	Time 0.519 (0.516)	Data 0.001 (0.012)	Loss 4.1659 (3.9998)	Top-1 acc 24.609 (31.264)	Top-5 acc 48.047 (54.638)	lr 0.00000
Warmup Train [40][2440/3239]	Time 0.610 (0.516)	Data 0.001 (0.012)	Loss 3.8499 (3.9999)	Top-1 acc 31.250 (31.264)	Top-5 acc 57.422 (54.640)	lr 0.00000
Warmup Train [40][2450/3239]	Time 0.578 (0.516)	Data 0.001 (0.012)	Loss 3.9208 (3.9999)	Top-1 acc 32.812 (31.263)	Top-5 acc 55.078 (54.638)	lr 0.00000
Warmup Train [40][2460/3239]	Time 0.352 (0.516)	Data 0.001 (0.012)	Loss 3.9175 (3.9998)	Top-1 acc 32.422 (31.269)	Top-5 acc 57.422 (54.646)	lr 0.00000
Warmup Train [40][2470/3239]	Time 0.634 (0.516)	Data 0.001 (0.012)	Loss 3.9693 (4.0000)	Top-1 acc 32.031 (31.261)	Top-5 acc 58.203 (54.645)	lr 0.00000
Warmup Train [40][2480/3239]	Time 0.418 (0.516)	Data 0.002 (0.012)	Loss 3.9911 (3.9999)	Top-1 acc 31.641 (31.262)	Top-5 acc 53.516 (54.645)	lr 0.00000
Warmup Train [40][2490/3239]	Time 0.533 (0.516)	Data 0.001 (0.012)	Loss 4.0621 (3.9999)	Top-1 acc 30.469 (31.261)	Top-5 acc 52.734 (54.644)	lr 0.00000
Warmup Train [40][2500/3239]	Time 0.641 (0.516)	Data 0.001 (0.012)	Loss 4.0340 (3.9997)	Top-1 acc 29.297 (31.262)	Top-5 acc 52.734 (54.646)	lr 0.00000
Warmup Train [40][2510/3239]	Time 0.490 (0.516)	Data 0.001 (0.012)	Loss 3.9995 (3.9999)	Top-1 acc 31.250 (31.256)	Top-5 acc 54.297 (54.644)	lr 0.00000
Warmup Train [40][2520/3239]	Time 0.449 (0.516)	Data 0.001 (0.012)	Loss 4.0759 (3.9998)	Top-1 acc 29.688 (31.260)	Top-5 acc 51.562 (54.646)	lr 0.00000
Warmup Train [40][2530/3239]	Time 0.687 (0.516)	Data 0.001 (0.012)	Loss 3.9765 (3.9993)	Top-1 acc 33.984 (31.271)	Top-5 acc 53.516 (54.655)	lr 0.00000
Warmup Train [40][2540/3239]	Time 0.312 (0.516)	Data 0.001 (0.012)	Loss 4.2474 (3.9997)	Top-1 acc 32.812 (31.267)	Top-5 acc 50.000 (54.644)	lr 0.00000
Warmup Train [40][2550/3239]	Time 0.368 (0.516)	Data 0.001 (0.012)	Loss 4.2840 (3.9998)	Top-1 acc 27.344 (31.265)	Top-5 acc 49.219 (54.642)	lr 0.00000
Warmup Train [40][2560/3239]	Time 0.575 (0.516)	Data 0.001 (0.012)	Loss 4.1015 (3.9997)	Top-1 acc 29.688 (31.269)	Top-5 acc 54.297 (54.645)	lr 0.00000
Warmup Train [40][2570/3239]	Time 0.658 (0.516)	Data 0.001 (0.012)	Loss 4.1187 (4.0000)	Top-1 acc 28.906 (31.263)	Top-5 acc 52.734 (54.634)	lr 0.00000
Warmup Train [40][2580/3239]	Time 0.503 (0.516)	Data 0.001 (0.012)	Loss 3.7884 (4.0000)	Top-1 acc 37.500 (31.263)	Top-5 acc 60.156 (54.637)	lr 0.00000
Warmup Train [40][2590/3239]	Time 0.270 (0.516)	Data 0.001 (0.011)	Loss 3.7612 (3.9999)	Top-1 acc 37.109 (31.270)	Top-5 acc 58.984 (54.637)	lr 0.00000
Warmup Train [40][2600/3239]	Time 0.538 (0.516)	Data 0.001 (0.011)	Loss 3.9153 (3.9999)	Top-1 acc 33.594 (31.268)	Top-5 acc 55.078 (54.636)	lr 0.00000
Warmup Train [40][2610/3239]	Time 0.465 (0.516)	Data 0.001 (0.011)	Loss 4.0892 (4.0000)	Top-1 acc 27.734 (31.263)	Top-5 acc 53.516 (54.633)	lr 0.00000
Warmup Train [40][2620/3239]	Time 0.574 (0.516)	Data 0.001 (0.011)	Loss 3.9795 (3.9998)	Top-1 acc 33.984 (31.267)	Top-5 acc 56.250 (54.640)	lr 0.00000
Warmup Train [40][2630/3239]	Time 0.278 (0.515)	Data 0.001 (0.011)	Loss 3.8665 (3.9999)	Top-1 acc 31.641 (31.259)	Top-5 acc 60.156 (54.637)	lr 0.00000
Warmup Train [40][2640/3239]	Time 0.513 (0.515)	Data 0.001 (0.011)	Loss 3.8291 (3.9997)	Top-1 acc 36.328 (31.262)	Top-5 acc 58.594 (54.642)	lr 0.00000
Warmup Train [40][2650/3239]	Time 0.502 (0.515)	Data 0.027 (0.011)	Loss 4.1679 (3.9998)	Top-1 acc 30.859 (31.265)	Top-5 acc 49.609 (54.642)	lr 0.00000
Warmup Train [40][2660/3239]	Time 0.379 (0.515)	Data 0.001 (0.011)	Loss 3.9901 (4.0000)	Top-1 acc 28.906 (31.258)	Top-5 acc 56.641 (54.640)	lr 0.00000
Warmup Train [40][2670/3239]	Time 0.639 (0.515)	Data 0.001 (0.011)	Loss 4.0111 (3.9998)	Top-1 acc 32.031 (31.260)	Top-5 acc 58.203 (54.646)	lr 0.00000
Warmup Train [40][2680/3239]	Time 0.375 (0.515)	Data 0.001 (0.011)	Loss 4.0645 (3.9997)	Top-1 acc 33.594 (31.258)	Top-5 acc 53.906 (54.650)	lr 0.00000
Warmup Train [40][2690/3239]	Time 0.535 (0.515)	Data 0.001 (0.011)	Loss 3.9237 (3.9998)	Top-1 acc 31.250 (31.257)	Top-5 acc 55.469 (54.652)	lr 0.00000
Warmup Train [40][2700/3239]	Time 0.474 (0.515)	Data 0.001 (0.011)	Loss 4.1627 (3.9998)	Top-1 acc 30.078 (31.256)	Top-5 acc 53.516 (54.652)	lr 0.00000
Warmup Train [40][2710/3239]	Time 0.491 (0.515)	Data 0.001 (0.011)	Loss 4.0453 (3.9996)	Top-1 acc 30.469 (31.259)	Top-5 acc 53.125 (54.654)	lr 0.00000
Warmup Train [40][2720/3239]	Time 0.507 (0.515)	Data 0.001 (0.011)	Loss 3.9896 (3.9997)	Top-1 acc 36.719 (31.258)	Top-5 acc 53.906 (54.650)	lr 0.00000
Warmup Train [40][2730/3239]	Time 0.411 (0.515)	Data 0.001 (0.011)	Loss 4.0782 (3.9997)	Top-1 acc 29.297 (31.262)	Top-5 acc 53.906 (54.650)	lr 0.00000
Warmup Train [40][2740/3239]	Time 0.594 (0.515)	Data 0.001 (0.011)	Loss 3.9582 (3.9996)	Top-1 acc 31.250 (31.267)	Top-5 acc 51.172 (54.652)	lr 0.00000
Warmup Train [40][2750/3239]	Time 0.419 (0.515)	Data 0.001 (0.011)	Loss 4.0805 (3.9996)	Top-1 acc 30.469 (31.266)	Top-5 acc 48.828 (54.651)	lr 0.00000
Warmup Train [40][2760/3239]	Time 0.493 (0.515)	Data 0.001 (0.011)	Loss 3.8468 (3.9995)	Top-1 acc 34.766 (31.263)	Top-5 acc 58.594 (54.654)	lr 0.00000
Warmup Train [40][2770/3239]	Time 0.317 (0.515)	Data 0.001 (0.011)	Loss 4.0527 (3.9995)	Top-1 acc 28.906 (31.262)	Top-5 acc 51.172 (54.650)	lr 0.00000
Warmup Train [40][2780/3239]	Time 0.563 (0.515)	Data 0.001 (0.011)	Loss 3.8881 (3.9994)	Top-1 acc 36.328 (31.267)	Top-5 acc 58.984 (54.653)	lr 0.00000
Warmup Train [40][2790/3239]	Time 0.476 (0.515)	Data 0.001 (0.011)	Loss 4.1529 (3.9994)	Top-1 acc 27.344 (31.265)	Top-5 acc 53.906 (54.656)	lr 0.00000
Warmup Train [40][2800/3239]	Time 0.515 (0.515)	Data 0.001 (0.011)	Loss 4.0094 (3.9995)	Top-1 acc 30.078 (31.263)	Top-5 acc 53.906 (54.655)	lr 0.00000
Warmup Train [40][2810/3239]	Time 0.505 (0.515)	Data 0.001 (0.011)	Loss 4.1166 (3.9996)	Top-1 acc 27.734 (31.263)	Top-5 acc 50.781 (54.652)	lr 0.00000
Warmup Train [40][2820/3239]	Time 0.371 (0.515)	Data 0.001 (0.011)	Loss 4.0903 (3.9996)	Top-1 acc 31.250 (31.264)	Top-5 acc 54.688 (54.653)	lr 0.00000
Warmup Train [40][2830/3239]	Time 0.614 (0.515)	Data 0.001 (0.011)	Loss 4.2198 (3.9997)	Top-1 acc 28.906 (31.260)	Top-5 acc 51.172 (54.652)	lr 0.00000
Warmup Train [40][2840/3239]	Time 0.643 (0.515)	Data 0.001 (0.011)	Loss 3.9517 (3.9998)	Top-1 acc 35.156 (31.260)	Top-5 acc 56.641 (54.647)	lr 0.00000
Warmup Train [40][2850/3239]	Time 0.446 (0.515)	Data 0.001 (0.011)	Loss 4.1579 (3.9997)	Top-1 acc 28.125 (31.263)	Top-5 acc 46.875 (54.649)	lr 0.00000
Warmup Train [40][2860/3239]	Time 0.553 (0.515)	Data 0.002 (0.011)	Loss 4.1241 (3.9997)	Top-1 acc 30.078 (31.263)	Top-5 acc 52.344 (54.649)	lr 0.00000
Warmup Train [40][2870/3239]	Time 0.467 (0.515)	Data 0.001 (0.011)	Loss 4.0826 (3.9996)	Top-1 acc 31.641 (31.264)	Top-5 acc 51.562 (54.650)	lr 0.00000
Warmup Train [40][2880/3239]	Time 0.385 (0.515)	Data 0.001 (0.011)	Loss 4.1694 (3.9998)	Top-1 acc 27.344 (31.256)	Top-5 acc 50.000 (54.647)	lr 0.00000
Warmup Train [40][2890/3239]	Time 0.539 (0.515)	Data 0.001 (0.011)	Loss 3.9704 (3.9997)	Top-1 acc 31.250 (31.260)	Top-5 acc 57.812 (54.653)	lr 0.00000
Warmup Train [40][2900/3239]	Time 0.499 (0.515)	Data 0.001 (0.011)	Loss 4.0308 (3.9997)	Top-1 acc 33.203 (31.256)	Top-5 acc 52.734 (54.653)	lr 0.00000
Warmup Train [40][2910/3239]	Time 0.488 (0.515)	Data 0.001 (0.011)	Loss 4.0991 (3.9998)	Top-1 acc 28.516 (31.252)	Top-5 acc 51.953 (54.648)	lr 0.00000
Warmup Train [40][2920/3239]	Time 0.547 (0.515)	Data 0.001 (0.011)	Loss 3.9063 (3.9998)	Top-1 acc 30.859 (31.255)	Top-5 acc 57.031 (54.647)	lr 0.00000
Warmup Train [40][2930/3239]	Time 0.492 (0.515)	Data 0.001 (0.011)	Loss 4.0736 (4.0001)	Top-1 acc 30.469 (31.250)	Top-5 acc 50.781 (54.640)	lr 0.00000
Warmup Train [40][2940/3239]	Time 0.410 (0.514)	Data 0.001 (0.011)	Loss 4.1165 (4.0003)	Top-1 acc 26.562 (31.245)	Top-5 acc 51.562 (54.633)	lr 0.00000
Warmup Train [40][2950/3239]	Time 0.501 (0.515)	Data 0.001 (0.011)	Loss 3.8308 (4.0001)	Top-1 acc 33.984 (31.247)	Top-5 acc 56.250 (54.634)	lr 0.00000
Warmup Train [40][2960/3239]	Time 0.642 (0.515)	Data 0.001 (0.011)	Loss 4.0682 (4.0003)	Top-1 acc 30.859 (31.245)	Top-5 acc 53.906 (54.633)	lr 0.00000
Warmup Train [40][2970/3239]	Time 0.405 (0.515)	Data 0.001 (0.011)	Loss 4.0507 (4.0004)	Top-1 acc 27.344 (31.243)	Top-5 acc 54.297 (54.632)	lr 0.00000
Warmup Train [40][2980/3239]	Time 0.502 (0.515)	Data 0.001 (0.011)	Loss 4.1798 (4.0003)	Top-1 acc 26.562 (31.244)	Top-5 acc 50.391 (54.634)	lr 0.00000
Warmup Train [40][2990/3239]	Time 0.523 (0.515)	Data 0.001 (0.011)	Loss 4.0940 (4.0002)	Top-1 acc 34.766 (31.248)	Top-5 acc 53.125 (54.637)	lr 0.00000
Warmup Train [40][3000/3239]	Time 0.375 (0.514)	Data 0.001 (0.011)	Loss 3.9500 (4.0002)	Top-1 acc 32.812 (31.251)	Top-5 acc 56.250 (54.639)	lr 0.00000
Warmup Train [40][3010/3239]	Time 0.404 (0.515)	Data 0.001 (0.011)	Loss 3.9564 (4.0004)	Top-1 acc 26.562 (31.247)	Top-5 acc 56.641 (54.634)	lr 0.00000
Warmup Train [40][3020/3239]	Time 0.513 (0.515)	Data 0.001 (0.011)	Loss 4.0562 (4.0006)	Top-1 acc 31.250 (31.248)	Top-5 acc 54.297 (54.632)	lr 0.00000
Warmup Train [40][3030/3239]	Time 0.449 (0.515)	Data 0.001 (0.011)	Loss 4.2121 (4.0006)	Top-1 acc 28.125 (31.246)	Top-5 acc 50.000 (54.632)	lr 0.00000
Warmup Train [40][3040/3239]	Time 0.582 (0.515)	Data 0.001 (0.011)	Loss 3.8523 (4.0008)	Top-1 acc 33.203 (31.244)	Top-5 acc 59.766 (54.632)	lr 0.00000
Warmup Train [40][3050/3239]	Time 0.614 (0.515)	Data 0.001 (0.011)	Loss 3.8488 (4.0008)	Top-1 acc 33.594 (31.242)	Top-5 acc 58.594 (54.630)	lr 0.00000
Warmup Train [40][3060/3239]	Time 0.354 (0.515)	Data 0.001 (0.011)	Loss 4.1111 (4.0008)	Top-1 acc 27.734 (31.242)	Top-5 acc 51.953 (54.627)	lr 0.00000
Warmup Train [40][3070/3239]	Time 0.683 (0.515)	Data 0.001 (0.011)	Loss 3.7654 (4.0009)	Top-1 acc 39.062 (31.241)	Top-5 acc 56.641 (54.621)	lr 0.00000
Warmup Train [40][3080/3239]	Time 0.519 (0.515)	Data 0.001 (0.011)	Loss 4.0518 (4.0009)	Top-1 acc 31.641 (31.239)	Top-5 acc 56.641 (54.622)	lr 0.00000
Warmup Train [40][3090/3239]	Time 0.554 (0.515)	Data 0.001 (0.011)	Loss 4.2167 (4.0009)	Top-1 acc 30.078 (31.239)	Top-5 acc 48.438 (54.621)	lr 0.00000
Warmup Train [40][3100/3239]	Time 0.501 (0.515)	Data 0.001 (0.011)	Loss 4.0073 (4.0008)	Top-1 acc 28.906 (31.239)	Top-5 acc 55.859 (54.619)	lr 0.00000
Warmup Train [40][3110/3239]	Time 0.666 (0.515)	Data 0.001 (0.011)	Loss 3.9446 (4.0009)	Top-1 acc 30.469 (31.235)	Top-5 acc 55.078 (54.618)	lr 0.00000
Warmup Train [40][3120/3239]	Time 0.482 (0.515)	Data 0.001 (0.011)	Loss 4.0111 (4.0009)	Top-1 acc 31.641 (31.232)	Top-5 acc 53.516 (54.614)	lr 0.00000
Warmup Train [40][3130/3239]	Time 0.383 (0.514)	Data 0.001 (0.011)	Loss 3.9977 (4.0012)	Top-1 acc 31.641 (31.227)	Top-5 acc 54.688 (54.611)	lr 0.00000
Warmup Train [40][3140/3239]	Time 0.585 (0.514)	Data 0.001 (0.011)	Loss 4.0144 (4.0013)	Top-1 acc 32.031 (31.226)	Top-5 acc 52.344 (54.610)	lr 0.00000
Warmup Train [40][3150/3239]	Time 0.461 (0.514)	Data 0.001 (0.011)	Loss 4.1585 (4.0014)	Top-1 acc 29.297 (31.225)	Top-5 acc 52.344 (54.606)	lr 0.00000
Warmup Train [40][3160/3239]	Time 0.573 (0.514)	Data 0.001 (0.011)	Loss 3.8734 (4.0016)	Top-1 acc 31.641 (31.223)	Top-5 acc 60.547 (54.603)	lr 0.00000
Warmup Train [40][3170/3239]	Time 0.685 (0.514)	Data 0.001 (0.011)	Loss 4.0703 (4.0015)	Top-1 acc 32.422 (31.225)	Top-5 acc 51.172 (54.600)	lr 0.00000
Warmup Train [40][3180/3239]	Time 0.620 (0.514)	Data 0.000 (0.011)	Loss 4.1218 (4.0016)	Top-1 acc 30.469 (31.223)	Top-5 acc 53.516 (54.598)	lr 0.00000
Warmup Train [40][3190/3239]	Time 0.521 (0.514)	Data 0.000 (0.011)	Loss 4.0151 (4.0015)	Top-1 acc 26.953 (31.225)	Top-5 acc 53.516 (54.599)	lr 0.00000
Warmup Train [40][3200/3239]	Time 0.422 (0.514)	Data 0.000 (0.011)	Loss 4.3748 (4.0016)	Top-1 acc 27.734 (31.224)	Top-5 acc 48.438 (54.599)	lr 0.00000
Warmup Train [40][3210/3239]	Time 0.520 (0.514)	Data 0.000 (0.011)	Loss 3.9428 (4.0016)	Top-1 acc 36.328 (31.225)	Top-5 acc 56.641 (54.597)	lr 0.00000
Warmup Train [40][3220/3239]	Time 0.473 (0.514)	Data 0.000 (0.011)	Loss 4.1828 (4.0018)	Top-1 acc 23.047 (31.220)	Top-5 acc 50.391 (54.593)	lr 0.00000
Warmup Train [40][3230/3239]	Time 0.481 (0.514)	Data 0.000 (0.011)	Loss 4.0080 (4.0017)	Top-1 acc 27.344 (31.219)	Top-5 acc 53.125 (54.597)	lr 0.00000
Warmup Train [40][3239/3239]	Time 0.267 (0.514)	Data 0.000 (0.010)	Loss 4.4808 (4.0018)	Top-1 acc 19.753 (31.215)	Top-5 acc 45.679 (54.597)	lr 0.00000
==========Warmup Valid [40/40]	loss 2.947	top-1 acc 38.558	top-5 acc 63.157	Train top-1 31.215	top-5 54.597	flops: 442.4M
Train [1][0/3239]	Time 16.645 (16.645)	Data Time 14.831 (14.831)	Loss 3.9422 (3.9422)	Entropy 1.90187 (1.90187)	Top-1 acc 32.031 (32.031)	Top-5 acc 53.906 (53.906)	lr 0.02500
Train [1][10/3239]	Time 0.557 (2.062)	Data Time 0.001 (1.398)	Loss 4.0672 (4.0792)	Entropy 1.90187 (1.90187)	Top-1 acc 32.422 (30.149)	Top-5 acc 55.078 (52.876)	lr 0.02500
Train [1][20/3239]	Time 0.658 (1.332)	Data Time 0.001 (0.733)	Loss 4.0655 (4.0868)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (29.688)	Top-5 acc 51.562 (51.990)	lr 0.02500
Train [1][30/3239]	Time 0.543 (1.067)	Data Time 0.001 (0.497)	Loss 3.9908 (4.0769)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (29.763)	Top-5 acc 50.781 (52.268)	lr 0.02500
Train [1][40/3239]	Time 0.473 (0.938)	Data Time 0.002 (0.377)	Loss 4.0878 (4.0659)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (29.745)	Top-5 acc 53.516 (52.925)	lr 0.02500
Train [1][50/3239]	Time 0.419 (0.854)	Data Time 0.001 (0.304)	Loss 4.0345 (4.0625)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (29.703)	Top-5 acc 52.734 (52.918)	lr 0.02500
Train [1][60/3239]	Time 0.471 (0.798)	Data Time 0.001 (0.255)	Loss 4.0851 (4.0574)	Entropy 1.90187 (1.90187)	Top-1 acc 32.031 (29.880)	Top-5 acc 52.734 (53.125)	lr 0.02500
Train [1][70/3239]	Time 0.595 (0.760)	Data Time 0.001 (0.221)	Loss 4.2210 (4.0620)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (29.946)	Top-5 acc 48.047 (53.108)	lr 0.02500
Train [1][80/3239]	Time 0.657 (0.731)	Data Time 0.001 (0.195)	Loss 4.2061 (4.0680)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (29.789)	Top-5 acc 51.562 (53.009)	lr 0.02500
Train [1][90/3239]	Time 0.636 (0.707)	Data Time 0.001 (0.174)	Loss 3.9487 (4.0706)	Entropy 1.90187 (1.90187)	Top-1 acc 33.984 (29.825)	Top-5 acc 55.078 (52.966)	lr 0.02500
Train [1][100/3239]	Time 0.573 (0.692)	Data Time 0.001 (0.157)	Loss 4.1625 (4.0703)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (29.715)	Top-5 acc 48.828 (53.086)	lr 0.02500
Train [1][110/3239]	Time 0.542 (0.676)	Data Time 0.001 (0.143)	Loss 4.0643 (4.0680)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (29.585)	Top-5 acc 53.516 (53.076)	lr 0.02500
Train [1][120/3239]	Time 0.520 (0.661)	Data Time 0.001 (0.131)	Loss 4.0313 (4.0657)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (29.568)	Top-5 acc 52.734 (53.109)	lr 0.02500
Train [1][130/3239]	Time 0.589 (0.651)	Data Time 0.001 (0.122)	Loss 4.1131 (4.0697)	Entropy 1.90187 (1.90187)	Top-1 acc 32.031 (29.467)	Top-5 acc 49.609 (52.955)	lr 0.02500
Train [1][140/3239]	Time 0.328 (0.640)	Data Time 0.001 (0.114)	Loss 4.2407 (4.0754)	Entropy 1.90187 (1.90187)	Top-1 acc 23.047 (29.338)	Top-5 acc 49.219 (52.812)	lr 0.02500
Train [1][150/3239]	Time 0.626 (0.634)	Data Time 0.001 (0.108)	Loss 4.0306 (4.0786)	Entropy 1.90187 (1.90187)	Top-1 acc 32.422 (29.323)	Top-5 acc 53.125 (52.773)	lr 0.02500
Train [1][160/3239]	Time 0.522 (0.627)	Data Time 0.001 (0.101)	Loss 4.1012 (4.0784)	Entropy 1.90187 (1.90187)	Top-1 acc 24.219 (29.307)	Top-5 acc 50.781 (52.759)	lr 0.02500
Train [1][170/3239]	Time 0.353 (0.620)	Data Time 0.001 (0.095)	Loss 3.9946 (4.0730)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (29.452)	Top-5 acc 54.688 (52.931)	lr 0.02500
Train [1][180/3239]	Time 0.510 (0.614)	Data Time 0.001 (0.091)	Loss 4.0985 (4.0737)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (29.431)	Top-5 acc 52.344 (52.868)	lr 0.02500
Train [1][190/3239]	Time 0.343 (0.606)	Data Time 0.001 (0.087)	Loss 4.0696 (4.0762)	Entropy 1.90187 (1.90187)	Top-1 acc 25.000 (29.342)	Top-5 acc 53.906 (52.798)	lr 0.02500
Train [1][200/3239]	Time 0.342 (0.601)	Data Time 0.001 (0.083)	Loss 4.3106 (4.0771)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (29.344)	Top-5 acc 47.656 (52.771)	lr 0.02500
Train [1][210/3239]	Time 0.347 (0.595)	Data Time 0.001 (0.080)	Loss 4.2043 (4.0771)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (29.343)	Top-5 acc 51.953 (52.807)	lr 0.02500
Train [1][220/3239]	Time 0.641 (0.591)	Data Time 0.001 (0.077)	Loss 4.1550 (4.0775)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (29.364)	Top-5 acc 52.734 (52.833)	lr 0.02500
Train [1][230/3239]	Time 0.508 (0.587)	Data Time 0.001 (0.074)	Loss 3.9020 (4.0756)	Entropy 1.90187 (1.90187)	Top-1 acc 35.156 (29.429)	Top-5 acc 53.906 (52.865)	lr 0.02500
Train [1][240/3239]	Time 0.504 (0.583)	Data Time 0.001 (0.071)	Loss 4.2250 (4.0771)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (29.412)	Top-5 acc 51.562 (52.838)	lr 0.02500
Train [1][250/3239]	Time 0.586 (0.580)	Data Time 0.001 (0.068)	Loss 3.9052 (4.0759)	Entropy 1.90187 (1.90187)	Top-1 acc 32.812 (29.442)	Top-5 acc 57.812 (52.854)	lr 0.02500
Train [1][260/3239]	Time 0.550 (0.578)	Data Time 0.001 (0.066)	Loss 4.1507 (4.0778)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (29.426)	Top-5 acc 51.562 (52.800)	lr 0.02500
Train [1][270/3239]	Time 0.520 (0.575)	Data Time 0.001 (0.063)	Loss 4.3293 (4.0802)	Entropy 1.90187 (1.90187)	Top-1 acc 24.609 (29.409)	Top-5 acc 46.875 (52.744)	lr 0.02500
Train [1][280/3239]	Time 0.618 (0.574)	Data Time 0.001 (0.061)	Loss 4.2348 (4.0810)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (29.394)	Top-5 acc 52.734 (52.745)	lr 0.02500
Train [1][290/3239]	Time 0.554 (0.573)	Data Time 0.001 (0.059)	Loss 3.9719 (4.0814)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (29.367)	Top-5 acc 51.953 (52.714)	lr 0.02500
Train [1][300/3239]	Time 0.477 (0.571)	Data Time 0.001 (0.057)	Loss 4.1622 (4.0820)	Entropy 1.90187 (1.90187)	Top-1 acc 23.438 (29.329)	Top-5 acc 53.125 (52.707)	lr 0.02500
Train [1][310/3239]	Time 0.580 (0.569)	Data Time 0.001 (0.055)	Loss 4.1306 (4.0834)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (29.337)	Top-5 acc 52.734 (52.677)	lr 0.02500
Train [1][320/3239]	Time 0.528 (0.567)	Data Time 0.001 (0.054)	Loss 4.0728 (4.0852)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (29.288)	Top-5 acc 54.297 (52.660)	lr 0.02500
Train [1][330/3239]	Time 0.574 (0.566)	Data Time 0.001 (0.052)	Loss 4.0777 (4.0861)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (29.219)	Top-5 acc 52.734 (52.634)	lr 0.02500
Train [1][340/3239]	Time 0.409 (0.564)	Data Time 0.002 (0.051)	Loss 4.1135 (4.0849)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (29.288)	Top-5 acc 54.688 (52.660)	lr 0.02500
Train [1][350/3239]	Time 0.434 (0.563)	Data Time 0.001 (0.050)	Loss 4.2705 (4.0850)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (29.307)	Top-5 acc 46.484 (52.652)	lr 0.02500
Train [1][360/3239]	Time 0.535 (0.562)	Data Time 0.001 (0.049)	Loss 4.0771 (4.0857)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (29.300)	Top-5 acc 51.953 (52.619)	lr 0.02500
Train [1][370/3239]	Time 0.489 (0.561)	Data Time 0.001 (0.047)	Loss 4.0184 (4.0857)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (29.298)	Top-5 acc 57.031 (52.609)	lr 0.02500
Train [1][380/3239]	Time 0.579 (0.560)	Data Time 0.001 (0.046)	Loss 4.0797 (4.0856)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (29.303)	Top-5 acc 51.953 (52.594)	lr 0.02500
Train [1][390/3239]	Time 0.483 (0.559)	Data Time 0.001 (0.046)	Loss 4.1927 (4.0876)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (29.285)	Top-5 acc 52.734 (52.557)	lr 0.02500
Train [1][400/3239]	Time 0.375 (0.557)	Data Time 0.001 (0.045)	Loss 4.0770 (4.0870)	Entropy 1.90187 (1.90187)	Top-1 acc 21.875 (29.254)	Top-5 acc 50.000 (52.560)	lr 0.02500
Train [1][410/3239]	Time 0.591 (0.556)	Data Time 0.001 (0.044)	Loss 4.2598 (4.0891)	Entropy 1.90187 (1.90187)	Top-1 acc 25.000 (29.210)	Top-5 acc 49.609 (52.512)	lr 0.02500
Train [1][420/3239]	Time 0.500 (0.555)	Data Time 0.001 (0.043)	Loss 4.3107 (4.0912)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (29.168)	Top-5 acc 46.875 (52.483)	lr 0.02500
Train [1][430/3239]	Time 0.498 (0.553)	Data Time 0.001 (0.042)	Loss 4.2435 (4.0938)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (29.106)	Top-5 acc 45.703 (52.418)	lr 0.02500
Train [1][440/3239]	Time 0.380 (0.552)	Data Time 0.001 (0.041)	Loss 4.1795 (4.0964)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (29.047)	Top-5 acc 53.516 (52.353)	lr 0.02500
Train [1][450/3239]	Time 0.498 (0.551)	Data Time 0.001 (0.040)	Loss 3.9830 (4.0971)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (29.013)	Top-5 acc 54.688 (52.323)	lr 0.02500
Train [1][460/3239]	Time 0.230 (0.549)	Data Time 0.034 (0.039)	Loss 4.1497 (4.0975)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (29.005)	Top-5 acc 50.391 (52.301)	lr 0.02500
Train [1][470/3239]	Time 0.539 (0.548)	Data Time 0.001 (0.039)	Loss 4.1201 (4.0982)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (29.011)	Top-5 acc 53.125 (52.296)	lr 0.02500
Train [1][480/3239]	Time 0.625 (0.548)	Data Time 0.001 (0.038)	Loss 4.1779 (4.0999)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.991)	Top-5 acc 52.344 (52.291)	lr 0.02500
Train [1][490/3239]	Time 0.521 (0.547)	Data Time 0.001 (0.037)	Loss 3.9949 (4.1006)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.987)	Top-5 acc 50.000 (52.284)	lr 0.02500
Train [1][500/3239]	Time 0.733 (0.547)	Data Time 0.001 (0.037)	Loss 4.2124 (4.1019)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.969)	Top-5 acc 50.000 (52.264)	lr 0.02500
Train [1][510/3239]	Time 0.596 (0.546)	Data Time 0.001 (0.036)	Loss 4.1922 (4.1032)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.925)	Top-5 acc 46.484 (52.231)	lr 0.02500
Train [1][520/3239]	Time 0.546 (0.546)	Data Time 0.001 (0.036)	Loss 4.0839 (4.1033)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.926)	Top-5 acc 54.688 (52.237)	lr 0.02500
Train [1][530/3239]	Time 0.482 (0.545)	Data Time 0.001 (0.035)	Loss 4.2574 (4.1041)	Entropy 1.90187 (1.90187)	Top-1 acc 25.000 (28.925)	Top-5 acc 42.578 (52.233)	lr 0.02500
Train [1][540/3239]	Time 0.471 (0.544)	Data Time 0.001 (0.034)	Loss 4.1779 (4.1047)	Entropy 1.90187 (1.90187)	Top-1 acc 23.047 (28.890)	Top-5 acc 49.609 (52.209)	lr 0.02500
Train [1][550/3239]	Time 0.483 (0.544)	Data Time 0.001 (0.034)	Loss 3.9440 (4.1044)	Entropy 1.90187 (1.90187)	Top-1 acc 32.812 (28.890)	Top-5 acc 60.938 (52.227)	lr 0.02500
Train [1][560/3239]	Time 0.503 (0.544)	Data Time 0.001 (0.033)	Loss 4.1572 (4.1053)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.871)	Top-5 acc 49.609 (52.211)	lr 0.02500
Train [1][570/3239]	Time 0.637 (0.543)	Data Time 0.001 (0.033)	Loss 4.2081 (4.1054)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.852)	Top-5 acc 46.484 (52.197)	lr 0.02500
Train [1][580/3239]	Time 0.551 (0.543)	Data Time 0.001 (0.032)	Loss 4.0978 (4.1054)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.867)	Top-5 acc 50.000 (52.207)	lr 0.02500
Train [1][590/3239]	Time 0.574 (0.543)	Data Time 0.001 (0.032)	Loss 4.0838 (4.1046)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.878)	Top-5 acc 51.562 (52.218)	lr 0.02500
Train [1][600/3239]	Time 0.657 (0.543)	Data Time 0.001 (0.031)	Loss 4.1478 (4.1055)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.857)	Top-5 acc 49.219 (52.185)	lr 0.02500
Train [1][610/3239]	Time 0.493 (0.543)	Data Time 0.001 (0.031)	Loss 4.1879 (4.1050)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.876)	Top-5 acc 51.562 (52.198)	lr 0.02500
Train [1][620/3239]	Time 0.345 (0.542)	Data Time 0.001 (0.030)	Loss 4.2562 (4.1056)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.866)	Top-5 acc 48.047 (52.183)	lr 0.02500
Train [1][630/3239]	Time 0.432 (0.542)	Data Time 0.001 (0.030)	Loss 4.0649 (4.1058)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.865)	Top-5 acc 54.297 (52.177)	lr 0.02500
Train [1][640/3239]	Time 0.472 (0.542)	Data Time 0.001 (0.030)	Loss 4.1666 (4.1058)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.868)	Top-5 acc 48.828 (52.185)	lr 0.02500
Train [1][650/3239]	Time 0.510 (0.541)	Data Time 0.002 (0.030)	Loss 4.1307 (4.1061)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.868)	Top-5 acc 51.953 (52.185)	lr 0.02500
Train [1][660/3239]	Time 0.572 (0.541)	Data Time 0.001 (0.029)	Loss 4.1296 (4.1064)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.844)	Top-5 acc 51.562 (52.162)	lr 0.02500
Train [1][670/3239]	Time 0.367 (0.540)	Data Time 0.001 (0.029)	Loss 4.2252 (4.1076)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.815)	Top-5 acc 51.172 (52.137)	lr 0.02500
Train [1][680/3239]	Time 0.370 (0.539)	Data Time 0.001 (0.028)	Loss 4.1265 (4.1074)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.837)	Top-5 acc 48.438 (52.144)	lr 0.02500
Train [1][690/3239]	Time 0.504 (0.539)	Data Time 0.001 (0.028)	Loss 4.2778 (4.1083)	Entropy 1.90187 (1.90187)	Top-1 acc 23.438 (28.816)	Top-5 acc 47.266 (52.129)	lr 0.02500
Train [1][700/3239]	Time 0.480 (0.538)	Data Time 0.001 (0.028)	Loss 4.2319 (4.1094)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.791)	Top-5 acc 47.656 (52.114)	lr 0.02500
Train [1][710/3239]	Time 0.522 (0.538)	Data Time 0.001 (0.028)	Loss 4.0308 (4.1097)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.772)	Top-5 acc 53.906 (52.099)	lr 0.02500
Train [1][720/3239]	Time 0.397 (0.537)	Data Time 0.001 (0.027)	Loss 4.1947 (4.1107)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.780)	Top-5 acc 53.906 (52.082)	lr 0.02500
Train [1][730/3239]	Time 0.510 (0.537)	Data Time 0.001 (0.027)	Loss 4.0916 (4.1105)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.782)	Top-5 acc 53.125 (52.089)	lr 0.02500
Train [1][740/3239]	Time 0.628 (0.537)	Data Time 0.001 (0.027)	Loss 4.2704 (4.1108)	Entropy 1.90187 (1.90187)	Top-1 acc 24.609 (28.775)	Top-5 acc 44.531 (52.073)	lr 0.02500
Train [1][750/3239]	Time 0.471 (0.537)	Data Time 0.001 (0.027)	Loss 4.1683 (4.1105)	Entropy 1.90187 (1.90187)	Top-1 acc 22.656 (28.774)	Top-5 acc 49.609 (52.078)	lr 0.02500
Train [1][760/3239]	Time 0.385 (0.536)	Data Time 0.001 (0.026)	Loss 3.9905 (4.1099)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.771)	Top-5 acc 51.172 (52.080)	lr 0.02500
Train [1][770/3239]	Time 0.401 (0.536)	Data Time 0.001 (0.026)	Loss 4.2875 (4.1103)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.757)	Top-5 acc 50.000 (52.077)	lr 0.02500
Train [1][780/3239]	Time 0.490 (0.536)	Data Time 0.001 (0.026)	Loss 4.0935 (4.1110)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.746)	Top-5 acc 52.344 (52.058)	lr 0.02500
Train [1][790/3239]	Time 0.391 (0.535)	Data Time 0.001 (0.026)	Loss 4.3409 (4.1117)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.748)	Top-5 acc 47.266 (52.054)	lr 0.02500
Train [1][800/3239]	Time 0.467 (0.535)	Data Time 0.001 (0.025)	Loss 4.1912 (4.1115)	Entropy 1.90187 (1.90187)	Top-1 acc 25.000 (28.759)	Top-5 acc 50.000 (52.059)	lr 0.02500
Train [1][810/3239]	Time 0.719 (0.535)	Data Time 0.001 (0.025)	Loss 3.9598 (4.1115)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.742)	Top-5 acc 57.422 (52.062)	lr 0.02500
Train [1][820/3239]	Time 0.529 (0.535)	Data Time 0.001 (0.025)	Loss 4.1495 (4.1119)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.742)	Top-5 acc 49.219 (52.045)	lr 0.02500
Train [1][830/3239]	Time 0.529 (0.535)	Data Time 0.001 (0.025)	Loss 4.2624 (4.1128)	Entropy 1.90187 (1.90187)	Top-1 acc 24.609 (28.719)	Top-5 acc 46.094 (52.011)	lr 0.02500
Train [1][840/3239]	Time 0.568 (0.535)	Data Time 0.001 (0.025)	Loss 4.2699 (4.1136)	Entropy 1.90187 (1.90187)	Top-1 acc 24.219 (28.720)	Top-5 acc 50.391 (52.009)	lr 0.02500
Train [1][850/3239]	Time 0.526 (0.534)	Data Time 0.001 (0.024)	Loss 4.1679 (4.1135)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.719)	Top-5 acc 52.344 (52.028)	lr 0.02500
Train [1][860/3239]	Time 0.685 (0.534)	Data Time 0.001 (0.024)	Loss 4.0581 (4.1140)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.702)	Top-5 acc 52.734 (52.009)	lr 0.02500
Train [1][870/3239]	Time 0.596 (0.534)	Data Time 0.031 (0.024)	Loss 4.1428 (4.1139)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.710)	Top-5 acc 50.781 (52.009)	lr 0.02500
Train [1][880/3239]	Time 0.413 (0.534)	Data Time 0.001 (0.024)	Loss 4.1324 (4.1139)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.698)	Top-5 acc 46.875 (51.999)	lr 0.02500
Train [1][890/3239]	Time 0.471 (0.534)	Data Time 0.001 (0.024)	Loss 4.3416 (4.1146)	Entropy 1.90187 (1.90187)	Top-1 acc 24.609 (28.687)	Top-5 acc 45.312 (51.984)	lr 0.02500
Train [1][900/3239]	Time 0.647 (0.534)	Data Time 0.001 (0.023)	Loss 4.3863 (4.1146)	Entropy 1.90187 (1.90187)	Top-1 acc 23.828 (28.689)	Top-5 acc 45.312 (51.983)	lr 0.02500
Train [1][910/3239]	Time 0.286 (0.534)	Data Time 0.001 (0.023)	Loss 4.2151 (4.1151)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.671)	Top-5 acc 50.000 (51.972)	lr 0.02500
Train [1][920/3239]	Time 0.609 (0.533)	Data Time 0.001 (0.023)	Loss 3.9975 (4.1152)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.671)	Top-5 acc 53.516 (51.978)	lr 0.02500
Train [1][930/3239]	Time 0.557 (0.533)	Data Time 0.001 (0.023)	Loss 4.0082 (4.1153)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.673)	Top-5 acc 55.078 (51.975)	lr 0.02500
Train [1][940/3239]	Time 0.594 (0.532)	Data Time 0.001 (0.023)	Loss 4.1629 (4.1153)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.665)	Top-5 acc 50.391 (51.977)	lr 0.02500
Train [1][950/3239]	Time 0.588 (0.532)	Data Time 0.001 (0.022)	Loss 4.1483 (4.1157)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.663)	Top-5 acc 49.609 (51.967)	lr 0.02500
Train [1][960/3239]	Time 0.493 (0.532)	Data Time 0.001 (0.022)	Loss 4.1185 (4.1164)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.655)	Top-5 acc 48.828 (51.950)	lr 0.02500
Train [1][970/3239]	Time 0.488 (0.531)	Data Time 0.001 (0.022)	Loss 4.3604 (4.1160)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.662)	Top-5 acc 48.828 (51.967)	lr 0.02500
Train [1][980/3239]	Time 0.626 (0.531)	Data Time 0.001 (0.022)	Loss 4.1948 (4.1162)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.649)	Top-5 acc 49.609 (51.959)	lr 0.02500
Train [1][990/3239]	Time 0.401 (0.531)	Data Time 0.002 (0.022)	Loss 4.0103 (4.1168)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.645)	Top-5 acc 52.734 (51.942)	lr 0.02500
Train [1][1000/3239]	Time 0.426 (0.531)	Data Time 0.001 (0.022)	Loss 4.1638 (4.1168)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.640)	Top-5 acc 49.609 (51.939)	lr 0.02500
Train [1][1010/3239]	Time 0.583 (0.531)	Data Time 0.001 (0.022)	Loss 4.2729 (4.1175)	Entropy 1.90187 (1.90187)	Top-1 acc 24.219 (28.632)	Top-5 acc 48.828 (51.933)	lr 0.02500
Train [1][1020/3239]	Time 0.662 (0.531)	Data Time 0.001 (0.021)	Loss 4.1273 (4.1177)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.633)	Top-5 acc 52.734 (51.925)	lr 0.02500
Train [1][1030/3239]	Time 0.415 (0.530)	Data Time 0.001 (0.021)	Loss 4.1828 (4.1174)	Entropy 1.90187 (1.90187)	Top-1 acc 24.609 (28.632)	Top-5 acc 50.391 (51.932)	lr 0.02500
Train [1][1040/3239]	Time 0.498 (0.531)	Data Time 0.001 (0.021)	Loss 3.9594 (4.1176)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.630)	Top-5 acc 54.688 (51.932)	lr 0.02500
Train [1][1050/3239]	Time 0.535 (0.530)	Data Time 0.001 (0.021)	Loss 4.1292 (4.1178)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.626)	Top-5 acc 52.344 (51.923)	lr 0.02500
Train [1][1060/3239]	Time 0.417 (0.530)	Data Time 0.001 (0.021)	Loss 4.0959 (4.1177)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.624)	Top-5 acc 50.000 (51.921)	lr 0.02500
Train [1][1070/3239]	Time 0.498 (0.530)	Data Time 0.001 (0.021)	Loss 4.3169 (4.1179)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.624)	Top-5 acc 47.656 (51.916)	lr 0.02500
Train [1][1080/3239]	Time 0.499 (0.530)	Data Time 0.001 (0.021)	Loss 4.3678 (4.1180)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.627)	Top-5 acc 42.969 (51.914)	lr 0.02500
Train [1][1090/3239]	Time 0.504 (0.530)	Data Time 0.001 (0.021)	Loss 4.1211 (4.1178)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.637)	Top-5 acc 50.391 (51.929)	lr 0.02500
Train [1][1100/3239]	Time 0.643 (0.529)	Data Time 0.001 (0.020)	Loss 4.0902 (4.1178)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.630)	Top-5 acc 50.781 (51.920)	lr 0.02500
Train [1][1110/3239]	Time 0.536 (0.529)	Data Time 0.001 (0.020)	Loss 3.9982 (4.1176)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.631)	Top-5 acc 51.953 (51.926)	lr 0.02500
Train [1][1120/3239]	Time 0.705 (0.530)	Data Time 0.001 (0.020)	Loss 4.2037 (4.1183)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (28.626)	Top-5 acc 50.391 (51.906)	lr 0.02500
Train [1][1130/3239]	Time 0.665 (0.529)	Data Time 0.001 (0.020)	Loss 4.0574 (4.1184)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.627)	Top-5 acc 52.344 (51.911)	lr 0.02500
Train [1][1140/3239]	Time 0.575 (0.529)	Data Time 0.001 (0.020)	Loss 4.0662 (4.1182)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.635)	Top-5 acc 54.297 (51.914)	lr 0.02500
Train [1][1150/3239]	Time 0.531 (0.529)	Data Time 0.001 (0.020)	Loss 4.1952 (4.1184)	Entropy 1.90187 (1.90187)	Top-1 acc 33.203 (28.639)	Top-5 acc 54.297 (51.920)	lr 0.02500
Train [1][1160/3239]	Time 0.457 (0.529)	Data Time 0.001 (0.019)	Loss 4.3533 (4.1194)	Entropy 1.90187 (1.90187)	Top-1 acc 22.656 (28.613)	Top-5 acc 42.578 (51.892)	lr 0.02500
Train [1][1170/3239]	Time 0.413 (0.529)	Data Time 0.001 (0.019)	Loss 4.1503 (4.1194)	Entropy 1.90187 (1.90187)	Top-1 acc 24.219 (28.606)	Top-5 acc 53.125 (51.897)	lr 0.02500
Train [1][1180/3239]	Time 0.492 (0.528)	Data Time 0.001 (0.019)	Loss 4.2420 (4.1196)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.607)	Top-5 acc 51.172 (51.903)	lr 0.02500
Train [1][1190/3239]	Time 0.650 (0.528)	Data Time 0.001 (0.019)	Loss 4.3642 (4.1197)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.607)	Top-5 acc 49.609 (51.906)	lr 0.02500
Train [1][1200/3239]	Time 0.521 (0.528)	Data Time 0.002 (0.019)	Loss 4.1980 (4.1201)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.598)	Top-5 acc 50.000 (51.904)	lr 0.02500
Train [1][1210/3239]	Time 0.459 (0.527)	Data Time 0.001 (0.019)	Loss 4.0055 (4.1202)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (28.600)	Top-5 acc 54.297 (51.898)	lr 0.02500
Train [1][1220/3239]	Time 0.431 (0.527)	Data Time 0.031 (0.019)	Loss 4.0949 (4.1207)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.595)	Top-5 acc 51.953 (51.883)	lr 0.02500
Train [1][1230/3239]	Time 0.644 (0.527)	Data Time 0.026 (0.019)	Loss 3.7808 (4.1205)	Entropy 1.90187 (1.90187)	Top-1 acc 35.938 (28.606)	Top-5 acc 61.328 (51.894)	lr 0.02500
Train [1][1240/3239]	Time 0.575 (0.527)	Data Time 0.001 (0.019)	Loss 4.0413 (4.1208)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.605)	Top-5 acc 52.344 (51.887)	lr 0.02500
Train [1][1250/3239]	Time 0.523 (0.527)	Data Time 0.001 (0.019)	Loss 4.1976 (4.1213)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.589)	Top-5 acc 51.953 (51.874)	lr 0.02500
Train [1][1260/3239]	Time 0.637 (0.527)	Data Time 0.001 (0.018)	Loss 4.0240 (4.1212)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.585)	Top-5 acc 56.641 (51.884)	lr 0.02500
Train [1][1270/3239]	Time 0.455 (0.527)	Data Time 0.001 (0.018)	Loss 3.9484 (4.1211)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (28.590)	Top-5 acc 58.203 (51.892)	lr 0.02500
Train [1][1280/3239]	Time 0.633 (0.527)	Data Time 0.001 (0.018)	Loss 4.0639 (4.1210)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.585)	Top-5 acc 52.734 (51.896)	lr 0.02500
Train [1][1290/3239]	Time 0.487 (0.527)	Data Time 0.001 (0.018)	Loss 4.1402 (4.1214)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.580)	Top-5 acc 50.000 (51.888)	lr 0.02500
Train [1][1300/3239]	Time 0.453 (0.527)	Data Time 0.001 (0.018)	Loss 4.2845 (4.1212)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.591)	Top-5 acc 48.438 (51.886)	lr 0.02500
Train [1][1310/3239]	Time 0.536 (0.527)	Data Time 0.002 (0.018)	Loss 4.2579 (4.1210)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.595)	Top-5 acc 46.484 (51.888)	lr 0.02500
Train [1][1320/3239]	Time 0.660 (0.527)	Data Time 0.001 (0.018)	Loss 4.0368 (4.1212)	Entropy 1.90187 (1.90187)	Top-1 acc 37.109 (28.597)	Top-5 acc 55.859 (51.883)	lr 0.02500
Train [1][1330/3239]	Time 0.587 (0.527)	Data Time 0.001 (0.018)	Loss 4.0639 (4.1214)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.591)	Top-5 acc 55.469 (51.875)	lr 0.02500
Train [1][1340/3239]	Time 0.597 (0.527)	Data Time 0.001 (0.018)	Loss 4.1228 (4.1212)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.584)	Top-5 acc 49.219 (51.881)	lr 0.02500
Train [1][1350/3239]	Time 0.385 (0.527)	Data Time 0.001 (0.018)	Loss 4.0728 (4.1217)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.579)	Top-5 acc 55.859 (51.872)	lr 0.02500
Train [1][1360/3239]	Time 0.464 (0.526)	Data Time 0.001 (0.018)	Loss 4.1929 (4.1216)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.575)	Top-5 acc 46.484 (51.871)	lr 0.02500
Train [1][1370/3239]	Time 0.553 (0.527)	Data Time 0.001 (0.018)	Loss 4.0810 (4.1220)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.572)	Top-5 acc 51.562 (51.859)	lr 0.02500
Train [1][1380/3239]	Time 0.511 (0.527)	Data Time 0.001 (0.017)	Loss 4.0667 (4.1216)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.578)	Top-5 acc 56.641 (51.861)	lr 0.02500
Train [1][1390/3239]	Time 0.482 (0.527)	Data Time 0.001 (0.017)	Loss 4.1244 (4.1211)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.579)	Top-5 acc 53.516 (51.864)	lr 0.02500
Train [1][1400/3239]	Time 0.290 (0.527)	Data Time 0.001 (0.017)	Loss 4.2662 (4.1211)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.582)	Top-5 acc 51.562 (51.868)	lr 0.02500
Train [1][1410/3239]	Time 0.594 (0.527)	Data Time 0.001 (0.017)	Loss 4.1393 (4.1214)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.588)	Top-5 acc 49.609 (51.864)	lr 0.02500
Train [1][1420/3239]	Time 0.616 (0.526)	Data Time 0.001 (0.017)	Loss 4.0762 (4.1213)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.595)	Top-5 acc 52.344 (51.864)	lr 0.02500
Train [1][1430/3239]	Time 0.536 (0.526)	Data Time 0.001 (0.017)	Loss 4.1654 (4.1212)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.601)	Top-5 acc 46.484 (51.872)	lr 0.02500
Train [1][1440/3239]	Time 0.415 (0.526)	Data Time 0.001 (0.017)	Loss 4.0950 (4.1217)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.584)	Top-5 acc 52.734 (51.854)	lr 0.02500
Train [1][1450/3239]	Time 0.699 (0.526)	Data Time 0.001 (0.017)	Loss 4.1594 (4.1217)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.584)	Top-5 acc 52.344 (51.859)	lr 0.02500
Train [1][1460/3239]	Time 0.510 (0.525)	Data Time 0.001 (0.017)	Loss 4.1127 (4.1215)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.585)	Top-5 acc 54.688 (51.868)	lr 0.02500
Train [1][1470/3239]	Time 0.618 (0.525)	Data Time 0.001 (0.017)	Loss 4.2111 (4.1215)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.587)	Top-5 acc 47.266 (51.862)	lr 0.02500
Train [1][1480/3239]	Time 0.421 (0.525)	Data Time 0.001 (0.017)	Loss 4.2354 (4.1221)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.578)	Top-5 acc 48.828 (51.849)	lr 0.02500
Train [1][1490/3239]	Time 0.567 (0.525)	Data Time 0.001 (0.017)	Loss 4.2566 (4.1223)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.577)	Top-5 acc 44.531 (51.844)	lr 0.02500
Train [1][1500/3239]	Time 0.418 (0.525)	Data Time 0.001 (0.017)	Loss 4.1241 (4.1225)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.569)	Top-5 acc 50.781 (51.830)	lr 0.02500
Train [1][1510/3239]	Time 0.469 (0.525)	Data Time 0.001 (0.017)	Loss 4.1493 (4.1230)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.564)	Top-5 acc 50.391 (51.821)	lr 0.02500
Train [1][1520/3239]	Time 0.666 (0.525)	Data Time 0.001 (0.016)	Loss 4.2708 (4.1232)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.562)	Top-5 acc 49.219 (51.817)	lr 0.02500
Train [1][1530/3239]	Time 0.662 (0.525)	Data Time 0.001 (0.016)	Loss 3.9853 (4.1232)	Entropy 1.90187 (1.90187)	Top-1 acc 35.156 (28.569)	Top-5 acc 55.469 (51.819)	lr 0.02500
Train [1][1540/3239]	Time 0.474 (0.525)	Data Time 0.001 (0.016)	Loss 4.1251 (4.1235)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.561)	Top-5 acc 52.734 (51.816)	lr 0.02500
Train [1][1550/3239]	Time 0.367 (0.525)	Data Time 0.001 (0.016)	Loss 4.1582 (4.1237)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.559)	Top-5 acc 52.734 (51.815)	lr 0.02500
Train [1][1560/3239]	Time 0.499 (0.525)	Data Time 0.001 (0.016)	Loss 4.2787 (4.1239)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.548)	Top-5 acc 50.781 (51.807)	lr 0.02500
Train [1][1570/3239]	Time 0.583 (0.525)	Data Time 0.001 (0.016)	Loss 4.1253 (4.1239)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.546)	Top-5 acc 48.828 (51.809)	lr 0.02500
Train [1][1580/3239]	Time 0.658 (0.525)	Data Time 0.001 (0.016)	Loss 3.9172 (4.1241)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.538)	Top-5 acc 58.203 (51.810)	lr 0.02500
Train [1][1590/3239]	Time 0.503 (0.525)	Data Time 0.001 (0.016)	Loss 4.1399 (4.1243)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.537)	Top-5 acc 53.125 (51.812)	lr 0.02500
Train [1][1600/3239]	Time 0.542 (0.525)	Data Time 0.001 (0.016)	Loss 4.1581 (4.1243)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.541)	Top-5 acc 49.609 (51.817)	lr 0.02500
Train [1][1610/3239]	Time 0.511 (0.525)	Data Time 0.001 (0.016)	Loss 4.2427 (4.1244)	Entropy 1.90187 (1.90187)	Top-1 acc 23.438 (28.536)	Top-5 acc 47.266 (51.815)	lr 0.02500
Train [1][1620/3239]	Time 0.488 (0.525)	Data Time 0.001 (0.016)	Loss 3.9603 (4.1246)	Entropy 1.90187 (1.90187)	Top-1 acc 32.422 (28.536)	Top-5 acc 55.078 (51.814)	lr 0.02500
Train [1][1630/3239]	Time 0.783 (0.525)	Data Time 0.001 (0.016)	Loss 4.0352 (4.1249)	Entropy 1.90187 (1.90187)	Top-1 acc 33.203 (28.519)	Top-5 acc 54.297 (51.813)	lr 0.02500
Train [1][1640/3239]	Time 0.322 (0.525)	Data Time 0.001 (0.016)	Loss 4.1918 (4.1249)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.515)	Top-5 acc 49.609 (51.811)	lr 0.02500
Train [1][1650/3239]	Time 0.491 (0.525)	Data Time 0.001 (0.016)	Loss 3.9897 (4.1248)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.518)	Top-5 acc 55.859 (51.816)	lr 0.02500
Train [1][1660/3239]	Time 0.313 (0.525)	Data Time 0.001 (0.016)	Loss 4.0682 (4.1251)	Entropy 1.90187 (1.90187)	Top-1 acc 33.203 (28.510)	Top-5 acc 53.516 (51.804)	lr 0.02500
Train [1][1670/3239]	Time 0.551 (0.525)	Data Time 0.001 (0.016)	Loss 4.0410 (4.1251)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.520)	Top-5 acc 53.125 (51.808)	lr 0.02500
Train [1][1680/3239]	Time 0.230 (0.524)	Data Time 0.001 (0.015)	Loss 4.0488 (4.1252)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.515)	Top-5 acc 54.297 (51.803)	lr 0.02500
Train [1][1690/3239]	Time 0.337 (0.524)	Data Time 0.001 (0.015)	Loss 4.2788 (4.1250)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.515)	Top-5 acc 50.391 (51.802)	lr 0.02500
Train [1][1700/3239]	Time 0.513 (0.524)	Data Time 0.001 (0.015)	Loss 4.2082 (4.1253)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.513)	Top-5 acc 50.781 (51.798)	lr 0.02500
Train [1][1710/3239]	Time 0.564 (0.524)	Data Time 0.001 (0.015)	Loss 3.9531 (4.1252)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.510)	Top-5 acc 55.469 (51.799)	lr 0.02500
Train [1][1720/3239]	Time 0.497 (0.524)	Data Time 0.001 (0.015)	Loss 3.9882 (4.1255)	Entropy 1.90187 (1.90187)	Top-1 acc 35.547 (28.504)	Top-5 acc 57.422 (51.800)	lr 0.02500
Train [1][1730/3239]	Time 0.377 (0.523)	Data Time 0.001 (0.015)	Loss 4.1941 (4.1252)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.509)	Top-5 acc 46.875 (51.804)	lr 0.02500
Train [1][1740/3239]	Time 0.487 (0.524)	Data Time 0.001 (0.015)	Loss 4.3618 (4.1254)	Entropy 1.90187 (1.90187)	Top-1 acc 19.922 (28.505)	Top-5 acc 47.656 (51.805)	lr 0.02500
Train [1][1750/3239]	Time 0.472 (0.524)	Data Time 0.001 (0.015)	Loss 4.0973 (4.1258)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.502)	Top-5 acc 52.734 (51.802)	lr 0.02500
Train [1][1760/3239]	Time 0.618 (0.524)	Data Time 0.001 (0.015)	Loss 4.2643 (4.1257)	Entropy 1.90187 (1.90187)	Top-1 acc 21.094 (28.497)	Top-5 acc 48.438 (51.802)	lr 0.02500
Train [1][1770/3239]	Time 0.410 (0.523)	Data Time 0.001 (0.015)	Loss 4.1395 (4.1260)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.491)	Top-5 acc 53.125 (51.799)	lr 0.02500
Train [1][1780/3239]	Time 0.559 (0.523)	Data Time 0.001 (0.015)	Loss 4.1420 (4.1263)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.482)	Top-5 acc 54.688 (51.787)	lr 0.02500
Train [1][1790/3239]	Time 0.562 (0.523)	Data Time 0.001 (0.015)	Loss 4.0674 (4.1266)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.475)	Top-5 acc 52.344 (51.773)	lr 0.02500
Train [1][1800/3239]	Time 0.360 (0.523)	Data Time 0.001 (0.015)	Loss 4.0849 (4.1266)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.474)	Top-5 acc 52.344 (51.777)	lr 0.02500
Train [1][1810/3239]	Time 0.656 (0.523)	Data Time 0.001 (0.015)	Loss 4.2350 (4.1267)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.474)	Top-5 acc 48.828 (51.776)	lr 0.02500
Train [1][1820/3239]	Time 0.492 (0.523)	Data Time 0.001 (0.015)	Loss 4.2760 (4.1266)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.474)	Top-5 acc 48.438 (51.775)	lr 0.02500
Train [1][1830/3239]	Time 0.562 (0.523)	Data Time 0.001 (0.015)	Loss 4.1648 (4.1266)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.470)	Top-5 acc 51.953 (51.772)	lr 0.02500
Train [1][1840/3239]	Time 0.584 (0.523)	Data Time 0.001 (0.015)	Loss 3.9905 (4.1266)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (28.473)	Top-5 acc 55.859 (51.773)	lr 0.02500
Train [1][1850/3239]	Time 0.468 (0.523)	Data Time 0.001 (0.015)	Loss 3.9408 (4.1266)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.476)	Top-5 acc 56.641 (51.778)	lr 0.02500
Train [1][1860/3239]	Time 0.364 (0.523)	Data Time 0.001 (0.015)	Loss 4.1705 (4.1267)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.475)	Top-5 acc 49.609 (51.774)	lr 0.02500
Train [1][1870/3239]	Time 0.668 (0.523)	Data Time 0.001 (0.015)	Loss 4.2036 (4.1272)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.465)	Top-5 acc 49.219 (51.759)	lr 0.02500
Train [1][1880/3239]	Time 0.513 (0.523)	Data Time 0.001 (0.015)	Loss 4.1242 (4.1274)	Entropy 1.90187 (1.90187)	Top-1 acc 33.594 (28.465)	Top-5 acc 55.078 (51.758)	lr 0.02500
Train [1][1890/3239]	Time 0.567 (0.523)	Data Time 0.001 (0.015)	Loss 4.0953 (4.1273)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.467)	Top-5 acc 53.906 (51.760)	lr 0.02500
Train [1][1900/3239]	Time 0.663 (0.523)	Data Time 0.001 (0.015)	Loss 4.1146 (4.1273)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.471)	Top-5 acc 49.219 (51.756)	lr 0.02500
Train [1][1910/3239]	Time 0.681 (0.523)	Data Time 0.001 (0.015)	Loss 4.1253 (4.1271)	Entropy 1.90187 (1.90187)	Top-1 acc 32.422 (28.478)	Top-5 acc 54.297 (51.755)	lr 0.02500
Train [1][1920/3239]	Time 0.481 (0.523)	Data Time 0.001 (0.015)	Loss 4.1145 (4.1273)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.480)	Top-5 acc 53.125 (51.749)	lr 0.02500
Train [1][1930/3239]	Time 0.578 (0.523)	Data Time 0.001 (0.015)	Loss 4.2728 (4.1278)	Entropy 1.90187 (1.90187)	Top-1 acc 24.609 (28.473)	Top-5 acc 46.094 (51.741)	lr 0.02500
Train [1][1940/3239]	Time 0.418 (0.522)	Data Time 0.001 (0.014)	Loss 3.9655 (4.1277)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.471)	Top-5 acc 54.297 (51.742)	lr 0.02500
Train [1][1950/3239]	Time 0.409 (0.522)	Data Time 0.001 (0.014)	Loss 4.1654 (4.1278)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.469)	Top-5 acc 52.344 (51.745)	lr 0.02500
Train [1][1960/3239]	Time 0.440 (0.522)	Data Time 0.001 (0.014)	Loss 4.1617 (4.1279)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.466)	Top-5 acc 50.000 (51.745)	lr 0.02500
Train [1][1970/3239]	Time 0.460 (0.522)	Data Time 0.001 (0.014)	Loss 4.2208 (4.1279)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.477)	Top-5 acc 50.391 (51.744)	lr 0.02500
Train [1][1980/3239]	Time 0.612 (0.522)	Data Time 0.001 (0.014)	Loss 4.1594 (4.1278)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.478)	Top-5 acc 50.781 (51.749)	lr 0.02500
Train [1][1990/3239]	Time 0.611 (0.522)	Data Time 0.002 (0.014)	Loss 4.1299 (4.1280)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.473)	Top-5 acc 56.641 (51.754)	lr 0.02500
Train [1][2000/3239]	Time 0.429 (0.522)	Data Time 0.001 (0.014)	Loss 4.1133 (4.1279)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.478)	Top-5 acc 51.953 (51.762)	lr 0.02500
Train [1][2010/3239]	Time 0.430 (0.522)	Data Time 0.001 (0.014)	Loss 4.2436 (4.1283)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.466)	Top-5 acc 49.219 (51.755)	lr 0.02500
Train [1][2020/3239]	Time 0.502 (0.522)	Data Time 0.001 (0.014)	Loss 4.2885 (4.1284)	Entropy 1.90187 (1.90187)	Top-1 acc 25.000 (28.464)	Top-5 acc 49.609 (51.750)	lr 0.02500
Train [1][2030/3239]	Time 0.611 (0.522)	Data Time 0.001 (0.014)	Loss 4.1663 (4.1287)	Entropy 1.90187 (1.90187)	Top-1 acc 23.438 (28.453)	Top-5 acc 50.391 (51.739)	lr 0.02500
Train [1][2040/3239]	Time 0.425 (0.521)	Data Time 0.001 (0.014)	Loss 4.0921 (4.1288)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.457)	Top-5 acc 50.391 (51.733)	lr 0.02500
Train [1][2050/3239]	Time 0.389 (0.521)	Data Time 0.001 (0.014)	Loss 4.2027 (4.1291)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.453)	Top-5 acc 48.047 (51.725)	lr 0.02500
Train [1][2060/3239]	Time 0.388 (0.521)	Data Time 0.001 (0.014)	Loss 4.2295 (4.1292)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.455)	Top-5 acc 48.047 (51.726)	lr 0.02500
Train [1][2070/3239]	Time 0.442 (0.521)	Data Time 0.001 (0.014)	Loss 3.9333 (4.1291)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.452)	Top-5 acc 55.859 (51.724)	lr 0.02500
Train [1][2080/3239]	Time 0.505 (0.521)	Data Time 0.001 (0.014)	Loss 4.1125 (4.1292)	Entropy 1.90187 (1.90187)	Top-1 acc 25.000 (28.447)	Top-5 acc 50.391 (51.723)	lr 0.02500
Train [1][2090/3239]	Time 0.648 (0.521)	Data Time 0.001 (0.014)	Loss 4.2935 (4.1292)	Entropy 1.90187 (1.90187)	Top-1 acc 24.219 (28.443)	Top-5 acc 47.656 (51.722)	lr 0.02500
Train [1][2100/3239]	Time 0.595 (0.521)	Data Time 0.001 (0.014)	Loss 4.2109 (4.1293)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.442)	Top-5 acc 51.562 (51.720)	lr 0.02500
Train [1][2110/3239]	Time 0.391 (0.521)	Data Time 0.001 (0.014)	Loss 4.0866 (4.1293)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.445)	Top-5 acc 53.125 (51.723)	lr 0.02500
Train [1][2120/3239]	Time 0.569 (0.521)	Data Time 0.001 (0.014)	Loss 3.9983 (4.1290)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.449)	Top-5 acc 57.422 (51.732)	lr 0.02500
Train [1][2130/3239]	Time 0.631 (0.521)	Data Time 0.001 (0.014)	Loss 4.1426 (4.1293)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.441)	Top-5 acc 51.562 (51.725)	lr 0.02500
Train [1][2140/3239]	Time 0.601 (0.521)	Data Time 0.001 (0.014)	Loss 4.1502 (4.1297)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.440)	Top-5 acc 51.953 (51.721)	lr 0.02500
Train [1][2150/3239]	Time 0.424 (0.521)	Data Time 0.001 (0.014)	Loss 4.3109 (4.1295)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.446)	Top-5 acc 46.875 (51.726)	lr 0.02500
Train [1][2160/3239]	Time 0.498 (0.521)	Data Time 0.001 (0.014)	Loss 4.0748 (4.1293)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.452)	Top-5 acc 53.125 (51.732)	lr 0.02500
Train [1][2170/3239]	Time 0.502 (0.521)	Data Time 0.001 (0.014)	Loss 4.2207 (4.1292)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.454)	Top-5 acc 47.266 (51.735)	lr 0.02500
Train [1][2180/3239]	Time 0.426 (0.521)	Data Time 0.001 (0.014)	Loss 3.9802 (4.1291)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.457)	Top-5 acc 53.516 (51.736)	lr 0.02500
Train [1][2190/3239]	Time 0.505 (0.521)	Data Time 0.001 (0.014)	Loss 4.0363 (4.1293)	Entropy 1.90187 (1.90187)	Top-1 acc 32.031 (28.458)	Top-5 acc 53.516 (51.732)	lr 0.02500
Train [1][2200/3239]	Time 0.506 (0.521)	Data Time 0.001 (0.014)	Loss 4.1421 (4.1294)	Entropy 1.90187 (1.90187)	Top-1 acc 25.000 (28.457)	Top-5 acc 50.000 (51.731)	lr 0.02500
Train [1][2210/3239]	Time 0.444 (0.521)	Data Time 0.001 (0.014)	Loss 4.1240 (4.1295)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.462)	Top-5 acc 55.078 (51.734)	lr 0.02500
Train [1][2220/3239]	Time 0.585 (0.521)	Data Time 0.001 (0.014)	Loss 4.2164 (4.1295)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.458)	Top-5 acc 48.438 (51.733)	lr 0.02500
Train [1][2230/3239]	Time 0.536 (0.521)	Data Time 0.001 (0.014)	Loss 4.2597 (4.1294)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.462)	Top-5 acc 48.047 (51.734)	lr 0.02500
Train [1][2240/3239]	Time 0.552 (0.521)	Data Time 0.001 (0.014)	Loss 3.9563 (4.1292)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.467)	Top-5 acc 57.031 (51.737)	lr 0.02500
Train [1][2250/3239]	Time 0.515 (0.521)	Data Time 0.001 (0.013)	Loss 4.2428 (4.1290)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.473)	Top-5 acc 49.609 (51.742)	lr 0.02500
Train [1][2260/3239]	Time 0.651 (0.521)	Data Time 0.001 (0.013)	Loss 3.7551 (4.1286)	Entropy 1.90187 (1.90187)	Top-1 acc 32.031 (28.477)	Top-5 acc 62.891 (51.749)	lr 0.02500
Train [1][2270/3239]	Time 0.597 (0.521)	Data Time 0.001 (0.013)	Loss 4.0729 (4.1287)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.475)	Top-5 acc 51.953 (51.747)	lr 0.02500
Train [1][2280/3239]	Time 0.460 (0.521)	Data Time 0.001 (0.013)	Loss 4.2972 (4.1288)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.474)	Top-5 acc 48.047 (51.748)	lr 0.02500
Train [1][2290/3239]	Time 0.485 (0.521)	Data Time 0.001 (0.013)	Loss 4.0258 (4.1286)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.480)	Top-5 acc 57.031 (51.754)	lr 0.02500
Train [1][2300/3239]	Time 0.512 (0.521)	Data Time 0.001 (0.013)	Loss 3.9355 (4.1285)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (28.484)	Top-5 acc 55.859 (51.753)	lr 0.02500
Train [1][2310/3239]	Time 0.528 (0.521)	Data Time 0.001 (0.013)	Loss 3.9710 (4.1284)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.485)	Top-5 acc 53.906 (51.752)	lr 0.02500
Train [1][2320/3239]	Time 0.544 (0.521)	Data Time 0.001 (0.013)	Loss 4.2331 (4.1281)	Entropy 1.90187 (1.90187)	Top-1 acc 25.781 (28.488)	Top-5 acc 46.875 (51.757)	lr 0.02500
Train [1][2330/3239]	Time 0.596 (0.521)	Data Time 0.001 (0.013)	Loss 4.1454 (4.1282)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.487)	Top-5 acc 50.391 (51.751)	lr 0.02500
Train [1][2340/3239]	Time 0.559 (0.521)	Data Time 0.001 (0.013)	Loss 4.2011 (4.1282)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.484)	Top-5 acc 51.172 (51.757)	lr 0.02500
Train [1][2350/3239]	Time 0.437 (0.521)	Data Time 0.001 (0.013)	Loss 4.4003 (4.1289)	Entropy 1.90187 (1.90187)	Top-1 acc 21.094 (28.473)	Top-5 acc 44.922 (51.743)	lr 0.02500
Train [1][2360/3239]	Time 0.553 (0.521)	Data Time 0.001 (0.013)	Loss 4.0466 (4.1288)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.477)	Top-5 acc 51.172 (51.741)	lr 0.02500
Train [1][2370/3239]	Time 0.502 (0.521)	Data Time 0.001 (0.013)	Loss 3.9788 (4.1287)	Entropy 1.90187 (1.90187)	Top-1 acc 32.031 (28.482)	Top-5 acc 56.641 (51.744)	lr 0.02500
Train [1][2380/3239]	Time 0.531 (0.521)	Data Time 0.001 (0.013)	Loss 4.0149 (4.1286)	Entropy 1.90187 (1.90187)	Top-1 acc 32.422 (28.484)	Top-5 acc 54.297 (51.744)	lr 0.02500
Train [1][2390/3239]	Time 0.407 (0.521)	Data Time 0.001 (0.013)	Loss 3.9666 (4.1287)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.479)	Top-5 acc 52.344 (51.743)	lr 0.02500
Train [1][2400/3239]	Time 0.516 (0.521)	Data Time 0.001 (0.013)	Loss 4.0369 (4.1289)	Entropy 1.90187 (1.90187)	Top-1 acc 32.031 (28.475)	Top-5 acc 53.906 (51.740)	lr 0.02500
Train [1][2410/3239]	Time 0.542 (0.521)	Data Time 0.001 (0.013)	Loss 4.1276 (4.1290)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (28.470)	Top-5 acc 51.172 (51.735)	lr 0.02500
Train [1][2420/3239]	Time 0.567 (0.521)	Data Time 0.001 (0.013)	Loss 4.0809 (4.1289)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.476)	Top-5 acc 55.078 (51.736)	lr 0.02500
Train [1][2430/3239]	Time 0.392 (0.521)	Data Time 0.001 (0.013)	Loss 4.1659 (4.1290)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.472)	Top-5 acc 50.781 (51.730)	lr 0.02500
Train [1][2440/3239]	Time 0.345 (0.521)	Data Time 0.001 (0.013)	Loss 4.2160 (4.1291)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.470)	Top-5 acc 51.172 (51.726)	lr 0.02500
Train [1][2450/3239]	Time 0.472 (0.520)	Data Time 0.001 (0.013)	Loss 4.0322 (4.1289)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.472)	Top-5 acc 51.562 (51.731)	lr 0.02500
Train [1][2460/3239]	Time 0.461 (0.520)	Data Time 0.001 (0.013)	Loss 4.1740 (4.1289)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.472)	Top-5 acc 50.391 (51.729)	lr 0.02500
Train [1][2470/3239]	Time 0.543 (0.520)	Data Time 0.001 (0.013)	Loss 4.1729 (4.1290)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.473)	Top-5 acc 49.609 (51.723)	lr 0.02500
Train [1][2480/3239]	Time 0.505 (0.520)	Data Time 0.001 (0.013)	Loss 4.2532 (4.1290)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.474)	Top-5 acc 50.391 (51.729)	lr 0.02500
Train [1][2490/3239]	Time 0.478 (0.520)	Data Time 0.002 (0.013)	Loss 4.0922 (4.1292)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.473)	Top-5 acc 52.734 (51.727)	lr 0.02500
Train [1][2500/3239]	Time 0.528 (0.520)	Data Time 0.001 (0.013)	Loss 3.9922 (4.1295)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.468)	Top-5 acc 60.547 (51.728)	lr 0.02500
Train [1][2510/3239]	Time 0.575 (0.520)	Data Time 0.001 (0.013)	Loss 4.3145 (4.1297)	Entropy 1.90187 (1.90187)	Top-1 acc 21.484 (28.458)	Top-5 acc 48.047 (51.723)	lr 0.02500
Train [1][2520/3239]	Time 0.531 (0.520)	Data Time 0.001 (0.013)	Loss 4.3070 (4.1297)	Entropy 1.90187 (1.90187)	Top-1 acc 24.219 (28.455)	Top-5 acc 44.922 (51.719)	lr 0.02500
Train [1][2530/3239]	Time 0.349 (0.520)	Data Time 0.001 (0.013)	Loss 4.0934 (4.1294)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.462)	Top-5 acc 52.734 (51.726)	lr 0.02500
Train [1][2540/3239]	Time 0.626 (0.520)	Data Time 0.001 (0.013)	Loss 4.0954 (4.1293)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.466)	Top-5 acc 54.297 (51.725)	lr 0.02500
Train [1][2550/3239]	Time 0.528 (0.520)	Data Time 0.001 (0.013)	Loss 4.0793 (4.1294)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.465)	Top-5 acc 50.781 (51.720)	lr 0.02500
Train [1][2560/3239]	Time 0.360 (0.520)	Data Time 0.001 (0.013)	Loss 4.0695 (4.1294)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.464)	Top-5 acc 51.172 (51.722)	lr 0.02500
Train [1][2570/3239]	Time 0.558 (0.520)	Data Time 0.001 (0.013)	Loss 4.0197 (4.1295)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.463)	Top-5 acc 53.516 (51.718)	lr 0.02500
Train [1][2580/3239]	Time 0.557 (0.520)	Data Time 0.001 (0.013)	Loss 4.1564 (4.1296)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.462)	Top-5 acc 52.344 (51.718)	lr 0.02500
Train [1][2590/3239]	Time 0.540 (0.521)	Data Time 0.001 (0.013)	Loss 4.1301 (4.1296)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (28.465)	Top-5 acc 51.562 (51.715)	lr 0.02500
Train [1][2600/3239]	Time 0.570 (0.521)	Data Time 0.001 (0.013)	Loss 4.2135 (4.1296)	Entropy 1.90187 (1.90187)	Top-1 acc 25.000 (28.466)	Top-5 acc 50.391 (51.714)	lr 0.02500
Train [1][2610/3239]	Time 0.507 (0.521)	Data Time 0.001 (0.013)	Loss 4.2763 (4.1298)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.463)	Top-5 acc 47.656 (51.711)	lr 0.02500
Train [1][2620/3239]	Time 0.511 (0.520)	Data Time 0.001 (0.013)	Loss 4.2174 (4.1301)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.459)	Top-5 acc 46.484 (51.703)	lr 0.02500
Train [1][2630/3239]	Time 0.419 (0.520)	Data Time 0.001 (0.013)	Loss 3.9867 (4.1300)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.461)	Top-5 acc 54.297 (51.704)	lr 0.02500
Train [1][2640/3239]	Time 0.365 (0.520)	Data Time 0.001 (0.013)	Loss 3.9676 (4.1299)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.462)	Top-5 acc 57.031 (51.710)	lr 0.02500
Train [1][2650/3239]	Time 0.567 (0.520)	Data Time 0.001 (0.013)	Loss 3.9970 (4.1299)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.463)	Top-5 acc 53.906 (51.709)	lr 0.02500
Train [1][2660/3239]	Time 0.402 (0.520)	Data Time 0.001 (0.013)	Loss 4.2694 (4.1300)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.458)	Top-5 acc 48.438 (51.705)	lr 0.02500
Train [1][2670/3239]	Time 0.561 (0.520)	Data Time 0.001 (0.013)	Loss 3.9688 (4.1297)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.462)	Top-5 acc 54.688 (51.713)	lr 0.02500
Train [1][2680/3239]	Time 0.264 (0.520)	Data Time 0.001 (0.013)	Loss 4.3111 (4.1298)	Entropy 1.90187 (1.90187)	Top-1 acc 23.438 (28.459)	Top-5 acc 51.953 (51.712)	lr 0.02500
Train [1][2690/3239]	Time 0.409 (0.520)	Data Time 0.001 (0.013)	Loss 4.4338 (4.1300)	Entropy 1.90187 (1.90187)	Top-1 acc 23.828 (28.455)	Top-5 acc 45.703 (51.707)	lr 0.02500
Train [1][2700/3239]	Time 0.444 (0.520)	Data Time 0.001 (0.013)	Loss 4.0475 (4.1301)	Entropy 1.90187 (1.90187)	Top-1 acc 32.422 (28.451)	Top-5 acc 54.688 (51.701)	lr 0.02500
Train [1][2710/3239]	Time 0.728 (0.520)	Data Time 0.001 (0.013)	Loss 4.2232 (4.1302)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.450)	Top-5 acc 50.000 (51.699)	lr 0.02500
Train [1][2720/3239]	Time 0.481 (0.520)	Data Time 0.001 (0.013)	Loss 4.2661 (4.1303)	Entropy 1.90187 (1.90187)	Top-1 acc 21.875 (28.444)	Top-5 acc 48.047 (51.694)	lr 0.02500
Train [1][2730/3239]	Time 0.515 (0.520)	Data Time 0.001 (0.012)	Loss 4.2220 (4.1304)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.441)	Top-5 acc 50.000 (51.690)	lr 0.02500
Train [1][2740/3239]	Time 0.751 (0.520)	Data Time 0.001 (0.012)	Loss 4.0622 (4.1303)	Entropy 1.90187 (1.90187)	Top-1 acc 31.250 (28.445)	Top-5 acc 55.469 (51.694)	lr 0.02500
Train [1][2750/3239]	Time 0.621 (0.520)	Data Time 0.001 (0.012)	Loss 4.1186 (4.1303)	Entropy 1.90187 (1.90187)	Top-1 acc 31.641 (28.450)	Top-5 acc 51.953 (51.697)	lr 0.02500
Train [1][2760/3239]	Time 0.516 (0.520)	Data Time 0.025 (0.012)	Loss 4.3690 (4.1305)	Entropy 1.90187 (1.90187)	Top-1 acc 24.219 (28.448)	Top-5 acc 46.484 (51.691)	lr 0.02500
Train [1][2770/3239]	Time 0.743 (0.520)	Data Time 0.001 (0.012)	Loss 4.1456 (4.1306)	Entropy 1.90187 (1.90187)	Top-1 acc 28.906 (28.446)	Top-5 acc 48.438 (51.686)	lr 0.02500
Train [1][2780/3239]	Time 0.639 (0.520)	Data Time 0.001 (0.012)	Loss 4.1165 (4.1307)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.449)	Top-5 acc 49.219 (51.681)	lr 0.02500
Train [1][2790/3239]	Time 0.556 (0.520)	Data Time 0.001 (0.012)	Loss 4.1332 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.444)	Top-5 acc 50.781 (51.674)	lr 0.02500
Train [1][2800/3239]	Time 0.475 (0.520)	Data Time 0.001 (0.012)	Loss 4.0031 (4.1311)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.439)	Top-5 acc 54.688 (51.671)	lr 0.02500
Train [1][2810/3239]	Time 0.572 (0.520)	Data Time 0.002 (0.012)	Loss 3.9786 (4.1310)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.440)	Top-5 acc 53.906 (51.670)	lr 0.02500
Train [1][2820/3239]	Time 0.574 (0.520)	Data Time 0.001 (0.012)	Loss 4.0231 (4.1308)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.442)	Top-5 acc 52.734 (51.671)	lr 0.02500
Train [1][2830/3239]	Time 0.663 (0.520)	Data Time 0.001 (0.012)	Loss 4.1877 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.442)	Top-5 acc 51.953 (51.668)	lr 0.02500
Train [1][2840/3239]	Time 0.448 (0.520)	Data Time 0.001 (0.012)	Loss 4.3182 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 22.656 (28.437)	Top-5 acc 45.703 (51.665)	lr 0.02500
Train [1][2850/3239]	Time 0.633 (0.520)	Data Time 0.001 (0.012)	Loss 4.0336 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 29.297 (28.435)	Top-5 acc 54.688 (51.669)	lr 0.02500
Train [1][2860/3239]	Time 0.577 (0.520)	Data Time 0.001 (0.012)	Loss 4.3108 (4.1311)	Entropy 1.90187 (1.90187)	Top-1 acc 24.219 (28.432)	Top-5 acc 44.922 (51.664)	lr 0.02500
Train [1][2870/3239]	Time 0.463 (0.520)	Data Time 0.001 (0.012)	Loss 4.0766 (4.1312)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.423)	Top-5 acc 51.172 (51.663)	lr 0.02500
Train [1][2880/3239]	Time 0.535 (0.520)	Data Time 0.001 (0.012)	Loss 3.8368 (4.1311)	Entropy 1.90187 (1.90187)	Top-1 acc 35.156 (28.426)	Top-5 acc 58.594 (51.663)	lr 0.02500
Train [1][2890/3239]	Time 0.618 (0.520)	Data Time 0.001 (0.012)	Loss 4.0831 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.426)	Top-5 acc 50.781 (51.665)	lr 0.02500
Train [1][2900/3239]	Time 0.577 (0.520)	Data Time 0.001 (0.012)	Loss 3.9800 (4.1308)	Entropy 1.90187 (1.90187)	Top-1 acc 33.984 (28.430)	Top-5 acc 52.734 (51.670)	lr 0.02500
Train [1][2910/3239]	Time 0.356 (0.520)	Data Time 0.002 (0.012)	Loss 4.1064 (4.1310)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.426)	Top-5 acc 53.516 (51.666)	lr 0.02500
Train [1][2920/3239]	Time 0.401 (0.520)	Data Time 0.001 (0.012)	Loss 4.2815 (4.1310)	Entropy 1.90187 (1.90187)	Top-1 acc 22.266 (28.421)	Top-5 acc 46.484 (51.663)	lr 0.02500
Train [1][2930/3239]	Time 0.583 (0.520)	Data Time 0.001 (0.012)	Loss 4.0377 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.426)	Top-5 acc 54.688 (51.663)	lr 0.02500
Train [1][2940/3239]	Time 0.511 (0.520)	Data Time 0.001 (0.012)	Loss 3.9015 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.426)	Top-5 acc 55.469 (51.661)	lr 0.02500
Train [1][2950/3239]	Time 0.380 (0.520)	Data Time 0.001 (0.012)	Loss 4.2055 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.427)	Top-5 acc 53.906 (51.663)	lr 0.02500
Train [1][2960/3239]	Time 0.423 (0.520)	Data Time 0.001 (0.012)	Loss 3.9954 (4.1306)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.431)	Top-5 acc 55.859 (51.668)	lr 0.02500
Train [1][2970/3239]	Time 0.346 (0.520)	Data Time 0.001 (0.012)	Loss 4.0046 (4.1307)	Entropy 1.90187 (1.90187)	Top-1 acc 32.422 (28.428)	Top-5 acc 53.906 (51.668)	lr 0.02500
Train [1][2980/3239]	Time 0.356 (0.520)	Data Time 0.001 (0.012)	Loss 4.2991 (4.1307)	Entropy 1.90187 (1.90187)	Top-1 acc 20.703 (28.425)	Top-5 acc 48.047 (51.672)	lr 0.02500
Train [1][2990/3239]	Time 0.535 (0.520)	Data Time 0.001 (0.012)	Loss 4.0315 (4.1308)	Entropy 1.90187 (1.90187)	Top-1 acc 33.594 (28.423)	Top-5 acc 53.125 (51.666)	lr 0.02500
Train [1][3000/3239]	Time 0.491 (0.520)	Data Time 0.001 (0.012)	Loss 4.1835 (4.1307)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.425)	Top-5 acc 50.781 (51.671)	lr 0.02500
Train [1][3010/3239]	Time 0.610 (0.520)	Data Time 0.001 (0.012)	Loss 4.2578 (4.1309)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.419)	Top-5 acc 48.047 (51.664)	lr 0.02500
Train [1][3020/3239]	Time 0.510 (0.520)	Data Time 0.001 (0.012)	Loss 4.1892 (4.1308)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.420)	Top-5 acc 52.344 (51.670)	lr 0.02500
Train [1][3030/3239]	Time 0.617 (0.520)	Data Time 0.001 (0.012)	Loss 4.0501 (4.1306)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.422)	Top-5 acc 52.344 (51.671)	lr 0.02500
Train [1][3040/3239]	Time 0.635 (0.520)	Data Time 0.049 (0.012)	Loss 4.0577 (4.1305)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.423)	Top-5 acc 56.250 (51.676)	lr 0.02500
Train [1][3050/3239]	Time 0.514 (0.520)	Data Time 0.001 (0.012)	Loss 3.9836 (4.1304)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.424)	Top-5 acc 55.469 (51.679)	lr 0.02500
Train [1][3060/3239]	Time 0.429 (0.520)	Data Time 0.001 (0.012)	Loss 4.0664 (4.1304)	Entropy 1.90187 (1.90187)	Top-1 acc 30.859 (28.425)	Top-5 acc 57.422 (51.681)	lr 0.02500
Train [1][3070/3239]	Time 0.523 (0.520)	Data Time 0.001 (0.012)	Loss 4.1275 (4.1306)	Entropy 1.90187 (1.90187)	Top-1 acc 28.516 (28.422)	Top-5 acc 50.781 (51.678)	lr 0.02500
Train [1][3080/3239]	Time 0.495 (0.520)	Data Time 0.001 (0.012)	Loss 4.2443 (4.1307)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.421)	Top-5 acc 50.781 (51.677)	lr 0.02500
Train [1][3090/3239]	Time 0.571 (0.520)	Data Time 0.001 (0.012)	Loss 4.0420 (4.1306)	Entropy 1.90187 (1.90187)	Top-1 acc 29.688 (28.422)	Top-5 acc 55.078 (51.677)	lr 0.02500
Train [1][3100/3239]	Time 0.532 (0.520)	Data Time 0.001 (0.012)	Loss 4.1340 (4.1305)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.424)	Top-5 acc 49.219 (51.675)	lr 0.02500
Train [1][3110/3239]	Time 0.604 (0.520)	Data Time 0.001 (0.012)	Loss 4.1919 (4.1307)	Entropy 1.90187 (1.90187)	Top-1 acc 24.609 (28.423)	Top-5 acc 48.047 (51.674)	lr 0.02500
Train [1][3120/3239]	Time 0.322 (0.520)	Data Time 0.001 (0.012)	Loss 4.1588 (4.1305)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.422)	Top-5 acc 50.391 (51.675)	lr 0.02500
Train [1][3130/3239]	Time 0.539 (0.520)	Data Time 0.001 (0.012)	Loss 4.1251 (4.1303)	Entropy 1.90187 (1.90187)	Top-1 acc 27.344 (28.428)	Top-5 acc 53.906 (51.680)	lr 0.02500
Train [1][3140/3239]	Time 0.753 (0.520)	Data Time 0.001 (0.012)	Loss 4.2943 (4.1302)	Entropy 1.90187 (1.90187)	Top-1 acc 21.875 (28.430)	Top-5 acc 46.875 (51.685)	lr 0.02500
Train [1][3150/3239]	Time 0.729 (0.520)	Data Time 0.001 (0.012)	Loss 4.0724 (4.1303)	Entropy 1.90187 (1.90187)	Top-1 acc 30.469 (28.427)	Top-5 acc 53.516 (51.680)	lr 0.02500
Train [1][3160/3239]	Time 0.453 (0.520)	Data Time 0.001 (0.012)	Loss 4.1105 (4.1305)	Entropy 1.90187 (1.90187)	Top-1 acc 30.078 (28.424)	Top-5 acc 50.781 (51.675)	lr 0.02500
Train [1][3170/3239]	Time 0.617 (0.520)	Data Time 0.001 (0.012)	Loss 4.1897 (4.1304)	Entropy 1.90187 (1.90187)	Top-1 acc 25.391 (28.423)	Top-5 acc 50.781 (51.678)	lr 0.02500
Train [1][3180/3239]	Time 0.328 (0.520)	Data Time 0.000 (0.012)	Loss 4.3028 (4.1304)	Entropy 1.90187 (1.90187)	Top-1 acc 32.031 (28.429)	Top-5 acc 45.312 (51.681)	lr 0.02500
Train [1][3190/3239]	Time 0.358 (0.520)	Data Time 0.000 (0.012)	Loss 4.3493 (4.1304)	Entropy 1.90187 (1.90187)	Top-1 acc 24.609 (28.428)	Top-5 acc 46.094 (51.681)	lr 0.02500
Train [1][3200/3239]	Time 0.576 (0.520)	Data Time 0.000 (0.012)	Loss 4.1258 (4.1303)	Entropy 1.90187 (1.90187)	Top-1 acc 26.953 (28.432)	Top-5 acc 51.953 (51.685)	lr 0.02500
Train [1][3210/3239]	Time 0.401 (0.520)	Data Time 0.000 (0.012)	Loss 4.1846 (4.1302)	Entropy 1.90187 (1.90187)	Top-1 acc 26.562 (28.432)	Top-5 acc 49.609 (51.685)	lr 0.02500
Train [1][3220/3239]	Time 0.332 (0.519)	Data Time 0.000 (0.012)	Loss 4.0387 (4.1303)	Entropy 1.90187 (1.90187)	Top-1 acc 27.734 (28.432)	Top-5 acc 52.344 (51.682)	lr 0.02500
Train [1][3230/3239]	Time 0.514 (0.519)	Data Time 0.000 (0.012)	Loss 4.2275 (4.1302)	Entropy 1.90187 (1.90187)	Top-1 acc 28.125 (28.434)	Top-5 acc 48.438 (51.682)	lr 0.02500
Train [1][3239/3239]	Time 0.363 (0.519)	Data Time 0.000 (0.012)	Loss 4.2932 (4.1301)	Entropy 1.90187 (1.90187)	Top-1 acc 22.222 (28.436)	Top-5 acc 48.148 (51.680)	lr 0.02500
==========Valid [1/120]	loss 3.076	top-1 acc 35.700 (35.700)	top-5 acc 61.077	Train top-1 28.436	top-5 51.680	Entropy 1.90187	Latency-None: 0.000ms	Flops: 442.44M
Train [2][0/3239]	Time 15.871 (15.871)	Data Time 14.223 (14.223)	Loss 3.9554 (3.9554)	Entropy 1.90187 (1.90187)	Top-1 acc 32.422 (32.422)	Top-5 acc 54.688 (54.688)	lr 0.02500
Train [2][10/3239]	Time 0.868 (3.689)	Data Time 0.004 (1.298)	Loss 4.0734 (4.1795)	Entropy 1.90187 (1.90187)	Top-1 acc 26.172 (28.303)	Top-5 acc 53.516 (50.000)	lr 0.02500
Train [2][20/3239]	Time 0.448 (2.280)	Data Time 0.002 (0.681)	Loss 4.0003 (4.1127)	Entropy 1.90186 (1.90187)	Top-1 acc 30.859 (29.055)	Top-5 acc 54.688 (51.860)	lr 0.02500
Train [2][30/3239]	Time 0.632 (1.793)	Data Time 0.002 (0.463)	Loss 4.0390 (4.1070)	Entropy 1.90186 (1.90187)	Top-1 acc 28.125 (29.360)	Top-5 acc 53.516 (51.978)	lr 0.02500
Train [2][40/3239]	Time 0.449 (1.534)	Data Time 0.001 (0.350)	Loss 4.0223 (4.1034)	Entropy 1.90186 (1.90186)	Top-1 acc 32.812 (29.354)	Top-5 acc 49.219 (52.048)	lr 0.02500
Train [2][50/3239]	Time 0.516 (1.381)	Data Time 0.001 (0.284)	Loss 3.9169 (4.0927)	Entropy 1.90186 (1.90186)	Top-1 acc 28.516 (29.182)	Top-5 acc 53.906 (52.405)	lr 0.02500
Train [2][60/3239]	Time 0.621 (1.280)	Data Time 0.003 (0.238)	Loss 4.1924 (4.0975)	Entropy 1.90186 (1.90186)	Top-1 acc 28.125 (28.970)	Top-5 acc 49.609 (52.363)	lr 0.02500
Train [2][70/3239]	Time 0.342 (1.202)	Data Time 0.001 (0.205)	Loss 4.3399 (4.1117)	Entropy 1.90185 (1.90186)	Top-1 acc 21.875 (28.664)	Top-5 acc 45.703 (52.019)	lr 0.02500
Train [2][80/3239]	Time 0.453 (1.145)	Data Time 0.001 (0.181)	Loss 4.1335 (4.1097)	Entropy 1.90185 (1.90186)	Top-1 acc 25.781 (28.684)	Top-5 acc 52.734 (52.011)	lr 0.02500
Train [2][90/3239]	Time 0.339 (1.098)	Data Time 0.002 (0.162)	Loss 4.0312 (4.1055)	Entropy 1.90185 (1.90186)	Top-1 acc 28.516 (28.687)	Top-5 acc 54.688 (52.168)	lr 0.02500
Train [2][100/3239]	Time 0.351 (1.062)	Data Time 0.001 (0.147)	Loss 3.9692 (4.1067)	Entropy 1.90184 (1.90186)	Top-1 acc 33.203 (28.717)	Top-5 acc 55.859 (52.208)	lr 0.02500
Train [2][110/3239]	Time 0.368 (1.034)	Data Time 0.001 (0.135)	Loss 4.1551 (4.1039)	Entropy 1.90184 (1.90186)	Top-1 acc 29.297 (28.899)	Top-5 acc 49.609 (52.238)	lr 0.02500
Train [2][120/3239]	Time 0.420 (1.009)	Data Time 0.001 (0.125)	Loss 4.1415 (4.1088)	Entropy 1.90183 (1.90185)	Top-1 acc 28.906 (28.787)	Top-5 acc 49.609 (52.105)	lr 0.02500
Train [2][130/3239]	Time 0.503 (0.987)	Data Time 0.001 (0.116)	Loss 3.9916 (4.1050)	Entropy 1.90183 (1.90185)	Top-1 acc 30.859 (28.867)	Top-5 acc 52.344 (52.147)	lr 0.02500
Train [2][140/3239]	Time 0.523 (0.969)	Data Time 0.001 (0.109)	Loss 4.0765 (4.1037)	Entropy 1.90182 (1.90185)	Top-1 acc 31.250 (28.912)	Top-5 acc 53.125 (52.247)	lr 0.02500
Train [2][150/3239]	Time 0.481 (0.952)	Data Time 0.001 (0.101)	Loss 4.0951 (4.1022)	Entropy 1.90181 (1.90185)	Top-1 acc 27.734 (28.906)	Top-5 acc 49.609 (52.279)	lr 0.02500
Train [2][160/3239]	Time 0.518 (0.936)	Data Time 0.001 (0.095)	Loss 4.0337 (4.1017)	Entropy 1.90181 (1.90185)	Top-1 acc 32.422 (28.882)	Top-5 acc 53.516 (52.295)	lr 0.02500
Train [2][170/3239]	Time 0.453 (0.925)	Data Time 0.001 (0.090)	Loss 4.1984 (4.1031)	Entropy 1.90180 (1.90184)	Top-1 acc 28.125 (28.865)	Top-5 acc 54.297 (52.307)	lr 0.02500
Train [2][180/3239]	Time 0.475 (0.914)	Data Time 0.002 (0.086)	Loss 4.2949 (4.1079)	Entropy 1.90180 (1.90184)	Top-1 acc 24.609 (28.751)	Top-5 acc 46.484 (52.152)	lr 0.02500
Train [2][190/3239]	Time 0.571 (0.906)	Data Time 0.001 (0.081)	Loss 4.1518 (4.1073)	Entropy 1.90179 (1.90184)	Top-1 acc 25.000 (28.773)	Top-5 acc 49.219 (52.096)	lr 0.02500
Train [2][200/3239]	Time 0.490 (0.897)	Data Time 0.001 (0.078)	Loss 3.9609 (4.1072)	Entropy 1.90179 (1.90184)	Top-1 acc 32.422 (28.759)	Top-5 acc 60.938 (52.093)	lr 0.02500
Train [2][210/3239]	Time 0.521 (0.890)	Data Time 0.001 (0.074)	Loss 4.1906 (4.1069)	Entropy 1.90178 (1.90183)	Top-1 acc 28.125 (28.782)	Top-5 acc 49.609 (52.123)	lr 0.02500
Train [2][220/3239]	Time 0.497 (0.883)	Data Time 0.001 (0.071)	Loss 3.9216 (4.1057)	Entropy 1.90177 (1.90183)	Top-1 acc 31.641 (28.827)	Top-5 acc 55.469 (52.165)	lr 0.02500
Train [2][230/3239]	Time 0.481 (0.876)	Data Time 0.001 (0.068)	Loss 4.3586 (4.1070)	Entropy 1.90176 (1.90183)	Top-1 acc 25.781 (28.818)	Top-5 acc 47.656 (52.127)	lr 0.02500
Train [2][240/3239]	Time 0.325 (0.868)	Data Time 0.001 (0.065)	Loss 4.1881 (4.1105)	Entropy 1.90176 (1.90183)	Top-1 acc 29.688 (28.752)	Top-5 acc 50.781 (52.058)	lr 0.02500
Train [2][250/3239]	Time 0.481 (0.864)	Data Time 0.001 (0.063)	Loss 4.1670 (4.1112)	Entropy 1.90175 (1.90182)	Top-1 acc 25.781 (28.710)	Top-5 acc 49.609 (52.029)	lr 0.02500
Train [2][260/3239]	Time 0.531 (0.860)	Data Time 0.001 (0.061)	Loss 3.9312 (4.1120)	Entropy 1.90175 (1.90182)	Top-1 acc 29.688 (28.710)	Top-5 acc 52.344 (51.992)	lr 0.02500
Train [2][270/3239]	Time 0.464 (0.855)	Data Time 0.001 (0.059)	Loss 4.2606 (4.1139)	Entropy 1.90173 (1.90182)	Top-1 acc 25.781 (28.687)	Top-5 acc 49.609 (51.939)	lr 0.02499
Train [2][280/3239]	Time 0.501 (0.850)	Data Time 0.001 (0.057)	Loss 3.9598 (4.1158)	Entropy 1.90173 (1.90181)	Top-1 acc 28.516 (28.652)	Top-5 acc 53.906 (51.909)	lr 0.02499
Train [2][290/3239]	Time 0.331 (0.846)	Data Time 0.001 (0.055)	Loss 4.4000 (4.1175)	Entropy 1.90172 (1.90181)	Top-1 acc 23.047 (28.649)	Top-5 acc 44.922 (51.842)	lr 0.02499
Train [2][300/3239]	Time 0.337 (0.841)	Data Time 0.001 (0.054)	Loss 4.2271 (4.1185)	Entropy 1.90170 (1.90181)	Top-1 acc 24.219 (28.617)	Top-5 acc 49.219 (51.838)	lr 0.02499
Train [2][310/3239]	Time 0.447 (0.837)	Data Time 0.001 (0.052)	Loss 4.1150 (4.1183)	Entropy 1.90169 (1.90180)	Top-1 acc 26.953 (28.642)	Top-5 acc 55.078 (51.861)	lr 0.02499
Train [2][320/3239]	Time 0.377 (0.832)	Data Time 0.001 (0.051)	Loss 4.0925 (4.1174)	Entropy 1.90168 (1.90180)	Top-1 acc 26.953 (28.656)	Top-5 acc 53.516 (51.903)	lr 0.02499
Train [2][330/3239]	Time 0.447 (0.828)	Data Time 0.001 (0.050)	Loss 4.1950 (4.1185)	Entropy 1.90167 (1.90180)	Top-1 acc 28.516 (28.647)	Top-5 acc 47.266 (51.840)	lr 0.02499
Train [2][340/3239]	Time 0.474 (0.826)	Data Time 0.001 (0.049)	Loss 4.2249 (4.1185)	Entropy 1.90166 (1.90179)	Top-1 acc 27.344 (28.678)	Top-5 acc 51.953 (51.840)	lr 0.02499
Train [2][350/3239]	Time 0.474 (0.824)	Data Time 0.001 (0.047)	Loss 4.1558 (4.1176)	Entropy 1.90165 (1.90179)	Top-1 acc 27.734 (28.649)	Top-5 acc 48.438 (51.832)	lr 0.02499
Train [2][360/3239]	Time 0.429 (0.821)	Data Time 0.001 (0.046)	Loss 4.3289 (4.1197)	Entropy 1.90164 (1.90178)	Top-1 acc 26.562 (28.645)	Top-5 acc 46.484 (51.770)	lr 0.02499
Train [2][370/3239]	Time 0.490 (0.819)	Data Time 0.001 (0.045)	Loss 4.1938 (4.1196)	Entropy 1.90162 (1.90178)	Top-1 acc 28.125 (28.631)	Top-5 acc 48.438 (51.765)	lr 0.02499
Train [2][380/3239]	Time 0.513 (0.817)	Data Time 0.001 (0.044)	Loss 4.0244 (4.1199)	Entropy 1.90161 (1.90178)	Top-1 acc 32.422 (28.668)	Top-5 acc 52.734 (51.764)	lr 0.02499
Train [2][390/3239]	Time 0.559 (0.815)	Data Time 0.001 (0.043)	Loss 4.2044 (4.1181)	Entropy 1.90159 (1.90177)	Top-1 acc 26.172 (28.672)	Top-5 acc 49.219 (51.787)	lr 0.02499
Train [2][400/3239]	Time 0.500 (0.813)	Data Time 0.001 (0.042)	Loss 4.0796 (4.1187)	Entropy 1.90157 (1.90177)	Top-1 acc 33.594 (28.689)	Top-5 acc 53.906 (51.808)	lr 0.02499
Train [2][410/3239]	Time 0.509 (0.811)	Data Time 0.001 (0.041)	Loss 4.0759 (4.1172)	Entropy 1.90156 (1.90176)	Top-1 acc 27.734 (28.707)	Top-5 acc 53.906 (51.856)	lr 0.02499
Train [2][420/3239]	Time 0.355 (0.809)	Data Time 0.001 (0.040)	Loss 4.1722 (4.1175)	Entropy 1.90156 (1.90176)	Top-1 acc 26.172 (28.687)	Top-5 acc 50.000 (51.858)	lr 0.02499
Train [2][430/3239]	Time 0.517 (0.807)	Data Time 0.001 (0.039)	Loss 4.0968 (4.1185)	Entropy 1.90154 (1.90175)	Top-1 acc 27.734 (28.672)	Top-5 acc 52.734 (51.873)	lr 0.02499
Train [2][440/3239]	Time 0.390 (0.806)	Data Time 0.001 (0.038)	Loss 4.1338 (4.1177)	Entropy 1.90153 (1.90175)	Top-1 acc 26.172 (28.670)	Top-5 acc 52.734 (51.888)	lr 0.02499
Train [2][450/3239]	Time 0.426 (0.804)	Data Time 0.001 (0.038)	Loss 4.1525 (4.1173)	Entropy 1.90151 (1.90174)	Top-1 acc 32.422 (28.684)	Top-5 acc 51.172 (51.865)	lr 0.02499
Train [2][460/3239]	Time 0.351 (0.802)	Data Time 0.001 (0.037)	Loss 4.0857 (4.1157)	Entropy 1.90149 (1.90174)	Top-1 acc 30.859 (28.726)	Top-5 acc 53.125 (51.890)	lr 0.02499
Train [2][470/3239]	Time 0.546 (0.801)	Data Time 0.002 (0.037)	Loss 3.7871 (4.1155)	Entropy 1.90147 (1.90173)	Top-1 acc 35.938 (28.740)	Top-5 acc 60.547 (51.904)	lr 0.02499
Train [2][480/3239]	Time 0.321 (0.799)	Data Time 0.001 (0.036)	Loss 4.1492 (4.1172)	Entropy 1.90146 (1.90173)	Top-1 acc 26.172 (28.711)	Top-5 acc 55.859 (51.887)	lr 0.02499
Train [2][490/3239]	Time 0.627 (0.798)	Data Time 0.002 (0.036)	Loss 4.0583 (4.1174)	Entropy 1.90145 (1.90172)	Top-1 acc 29.688 (28.710)	Top-5 acc 55.859 (51.889)	lr 0.02499
Train [2][500/3239]	Time 0.520 (0.796)	Data Time 0.001 (0.035)	Loss 4.1055 (4.1187)	Entropy 1.90142 (1.90172)	Top-1 acc 27.734 (28.683)	Top-5 acc 49.609 (51.848)	lr 0.02499
Train [2][510/3239]	Time 0.386 (0.794)	Data Time 0.001 (0.034)	Loss 4.2326 (4.1182)	Entropy 1.90140 (1.90171)	Top-1 acc 27.344 (28.685)	Top-5 acc 47.656 (51.869)	lr 0.02499
Train [2][520/3239]	Time 0.539 (0.793)	Data Time 0.001 (0.034)	Loss 4.0107 (4.1183)	Entropy 1.90138 (1.90170)	Top-1 acc 28.516 (28.666)	Top-5 acc 51.953 (51.850)	lr 0.02499
Train [2][530/3239]	Time 0.375 (0.792)	Data Time 0.001 (0.033)	Loss 4.0919 (4.1182)	Entropy 1.90136 (1.90170)	Top-1 acc 28.906 (28.676)	Top-5 acc 51.953 (51.872)	lr 0.02499
Train [2][540/3239]	Time 0.530 (0.791)	Data Time 0.001 (0.033)	Loss 4.0644 (4.1189)	Entropy 1.90133 (1.90169)	Top-1 acc 31.250 (28.669)	Top-5 acc 55.078 (51.862)	lr 0.02499
Train [2][550/3239]	Time 0.466 (0.790)	Data Time 0.001 (0.032)	Loss 4.1799 (4.1191)	Entropy 1.90131 (1.90168)	Top-1 acc 27.344 (28.649)	Top-5 acc 55.469 (51.883)	lr 0.02499
Train [2][560/3239]	Time 0.534 (0.789)	Data Time 0.002 (0.032)	Loss 4.2060 (4.1191)	Entropy 1.90130 (1.90168)	Top-1 acc 28.906 (28.628)	Top-5 acc 51.172 (51.884)	lr 0.02499
Train [2][570/3239]	Time 0.343 (0.787)	Data Time 0.001 (0.031)	Loss 4.1675 (4.1205)	Entropy 1.90128 (1.90167)	Top-1 acc 30.078 (28.600)	Top-5 acc 51.953 (51.857)	lr 0.02499
Train [2][580/3239]	Time 0.495 (0.787)	Data Time 0.001 (0.031)	Loss 4.0391 (4.1188)	Entropy 1.90126 (1.90166)	Top-1 acc 29.297 (28.623)	Top-5 acc 52.734 (51.893)	lr 0.02499
Train [2][590/3239]	Time 0.517 (0.787)	Data Time 0.001 (0.031)	Loss 4.1797 (4.1191)	Entropy 1.90124 (1.90166)	Top-1 acc 27.344 (28.607)	Top-5 acc 52.344 (51.896)	lr 0.02499
Train [2][600/3239]	Time 0.435 (0.786)	Data Time 0.001 (0.030)	Loss 4.0846 (4.1194)	Entropy 1.90122 (1.90165)	Top-1 acc 30.469 (28.627)	Top-5 acc 53.906 (51.890)	lr 0.02499
Train [2][610/3239]	Time 0.300 (0.784)	Data Time 0.001 (0.030)	Loss 4.2902 (4.1188)	Entropy 1.90120 (1.90164)	Top-1 acc 31.250 (28.638)	Top-5 acc 48.828 (51.910)	lr 0.02499
Train [2][620/3239]	Time 0.429 (0.784)	Data Time 0.001 (0.030)	Loss 3.9963 (4.1193)	Entropy 1.90119 (1.90164)	Top-1 acc 29.688 (28.635)	Top-5 acc 57.812 (51.897)	lr 0.02499
Train [2][630/3239]	Time 0.357 (0.782)	Data Time 0.001 (0.029)	Loss 4.0405 (4.1183)	Entropy 1.90117 (1.90163)	Top-1 acc 29.688 (28.647)	Top-5 acc 53.906 (51.905)	lr 0.02499
Train [2][640/3239]	Time 0.595 (0.782)	Data Time 0.001 (0.029)	Loss 4.0093 (4.1192)	Entropy 1.90116 (1.90162)	Top-1 acc 28.516 (28.621)	Top-5 acc 50.781 (51.887)	lr 0.02499
Train [2][650/3239]	Time 0.482 (0.781)	Data Time 0.001 (0.029)	Loss 3.9844 (4.1188)	Entropy 1.90114 (1.90161)	Top-1 acc 30.859 (28.634)	Top-5 acc 53.516 (51.902)	lr 0.02499
Train [2][660/3239]	Time 0.476 (0.804)	Data Time 0.004 (0.028)	Loss 4.1062 (4.1185)	Entropy 1.90112 (1.90161)	Top-1 acc 32.812 (28.656)	Top-5 acc 51.562 (51.911)	lr 0.02499
Train [2][670/3239]	Time 0.550 (0.803)	Data Time 0.002 (0.028)	Loss 4.0749 (4.1189)	Entropy 1.90109 (1.90160)	Top-1 acc 26.172 (28.648)	Top-5 acc 54.297 (51.900)	lr 0.02499
Train [2][680/3239]	Time 0.548 (0.802)	Data Time 0.002 (0.028)	Loss 4.1489 (4.1188)	Entropy 1.90104 (1.90159)	Top-1 acc 25.391 (28.632)	Top-5 acc 45.703 (51.888)	lr 0.02499
Train [2][690/3239]	Time 0.459 (0.801)	Data Time 0.001 (0.027)	Loss 4.2676 (4.1184)	Entropy 1.90103 (1.90158)	Top-1 acc 21.875 (28.632)	Top-5 acc 48.438 (51.910)	lr 0.02499
Train [2][700/3239]	Time 0.629 (0.800)	Data Time 0.001 (0.027)	Loss 4.1974 (4.1175)	Entropy 1.90100 (1.90158)	Top-1 acc 30.469 (28.661)	Top-5 acc 46.484 (51.934)	lr 0.02499
Train [2][710/3239]	Time 0.525 (0.799)	Data Time 0.001 (0.027)	Loss 4.1504 (4.1167)	Entropy 1.90097 (1.90157)	Top-1 acc 26.172 (28.669)	Top-5 acc 49.219 (51.945)	lr 0.02499
Train [2][720/3239]	Time 0.491 (0.798)	Data Time 0.001 (0.026)	Loss 4.2191 (4.1174)	Entropy 1.90094 (1.90156)	Top-1 acc 28.125 (28.661)	Top-5 acc 48.438 (51.923)	lr 0.02499
Train [2][730/3239]	Time 0.481 (0.797)	Data Time 0.001 (0.026)	Loss 4.0442 (4.1176)	Entropy 1.90091 (1.90155)	Top-1 acc 29.688 (28.665)	Top-5 acc 55.078 (51.931)	lr 0.02499
Train [2][740/3239]	Time 0.447 (0.797)	Data Time 0.001 (0.026)	Loss 4.1598 (4.1179)	Entropy 1.90090 (1.90154)	Top-1 acc 28.906 (28.661)	Top-5 acc 52.734 (51.920)	lr 0.02499
Train [2][750/3239]	Time 0.425 (0.796)	Data Time 0.001 (0.026)	Loss 4.1812 (4.1174)	Entropy 1.90088 (1.90153)	Top-1 acc 25.781 (28.660)	Top-5 acc 50.000 (51.935)	lr 0.02499
Train [2][760/3239]	Time 0.529 (0.795)	Data Time 0.001 (0.025)	Loss 4.1824 (4.1166)	Entropy 1.90085 (1.90152)	Top-1 acc 25.781 (28.662)	Top-5 acc 48.828 (51.950)	lr 0.02499
Train [2][770/3239]	Time 0.528 (0.795)	Data Time 0.001 (0.025)	Loss 4.0583 (4.1158)	Entropy 1.90084 (1.90152)	Top-1 acc 31.641 (28.684)	Top-5 acc 55.469 (51.977)	lr 0.02499
Train [2][780/3239]	Time 0.327 (0.794)	Data Time 0.001 (0.025)	Loss 4.0565 (4.1157)	Entropy 1.90081 (1.90151)	Top-1 acc 25.000 (28.687)	Top-5 acc 53.125 (51.970)	lr 0.02499
Train [2][790/3239]	Time 0.541 (0.793)	Data Time 0.001 (0.025)	Loss 4.1271 (4.1153)	Entropy 1.90078 (1.90150)	Top-1 acc 25.781 (28.695)	Top-5 acc 51.562 (51.991)	lr 0.02499
Train [2][800/3239]	Time 0.530 (0.792)	Data Time 0.001 (0.024)	Loss 4.1467 (4.1153)	Entropy 1.90075 (1.90149)	Top-1 acc 29.688 (28.705)	Top-5 acc 50.781 (51.992)	lr 0.02499
Train [2][810/3239]	Time 0.539 (0.791)	Data Time 0.001 (0.024)	Loss 4.1180 (4.1152)	Entropy 1.90073 (1.90148)	Top-1 acc 26.562 (28.701)	Top-5 acc 50.781 (51.994)	lr 0.02499
Train [2][820/3239]	Time 0.413 (0.790)	Data Time 0.001 (0.024)	Loss 4.0908 (4.1149)	Entropy 1.90068 (1.90147)	Top-1 acc 29.297 (28.690)	Top-5 acc 54.688 (51.997)	lr 0.02499
Train [2][830/3239]	Time 0.402 (0.790)	Data Time 0.001 (0.024)	Loss 4.1504 (4.1146)	Entropy 1.90067 (1.90146)	Top-1 acc 28.516 (28.693)	Top-5 acc 52.734 (52.004)	lr 0.02499
Train [2][840/3239]	Time 0.562 (0.789)	Data Time 0.001 (0.023)	Loss 3.8997 (4.1136)	Entropy 1.90065 (1.90145)	Top-1 acc 29.297 (28.725)	Top-5 acc 59.375 (52.032)	lr 0.02499
Train [2][850/3239]	Time 0.514 (0.789)	Data Time 0.001 (0.023)	Loss 4.2152 (4.1138)	Entropy 1.90063 (1.90144)	Top-1 acc 26.953 (28.728)	Top-5 acc 50.781 (52.021)	lr 0.02499
Train [2][860/3239]	Time 0.489 (0.788)	Data Time 0.001 (0.023)	Loss 3.9562 (4.1140)	Entropy 1.90060 (1.90143)	Top-1 acc 35.156 (28.719)	Top-5 acc 56.641 (52.014)	lr 0.02499
Train [2][870/3239]	Time 0.363 (0.787)	Data Time 0.001 (0.023)	Loss 4.1652 (4.1141)	Entropy 1.90056 (1.90142)	Top-1 acc 25.391 (28.702)	Top-5 acc 51.953 (52.023)	lr 0.02499
Train [2][880/3239]	Time 0.499 (0.787)	Data Time 0.001 (0.023)	Loss 4.0498 (4.1143)	Entropy 1.90054 (1.90141)	Top-1 acc 32.812 (28.701)	Top-5 acc 52.344 (52.012)	lr 0.02499
Train [2][890/3239]	Time 0.358 (0.786)	Data Time 0.001 (0.022)	Loss 3.9286 (4.1137)	Entropy 1.90050 (1.90140)	Top-1 acc 32.422 (28.713)	Top-5 acc 58.594 (52.017)	lr 0.02499
Train [2][900/3239]	Time 0.490 (0.786)	Data Time 0.001 (0.022)	Loss 4.0795 (4.1134)	Entropy 1.90048 (1.90139)	Top-1 acc 28.125 (28.712)	Top-5 acc 50.391 (52.017)	lr 0.02499
Train [2][910/3239]	Time 0.516 (0.786)	Data Time 0.001 (0.022)	Loss 3.9964 (4.1129)	Entropy 1.90045 (1.90138)	Top-1 acc 30.469 (28.714)	Top-5 acc 52.734 (52.025)	lr 0.02499
Train [2][920/3239]	Time 0.510 (0.785)	Data Time 0.001 (0.022)	Loss 4.1352 (4.1128)	Entropy 1.90043 (1.90137)	Top-1 acc 28.516 (28.723)	Top-5 acc 50.781 (52.023)	lr 0.02499
Train [2][930/3239]	Time 0.547 (0.785)	Data Time 0.001 (0.022)	Loss 3.9605 (4.1125)	Entropy 1.90041 (1.90136)	Top-1 acc 30.469 (28.735)	Top-5 acc 60.156 (52.035)	lr 0.02499
Train [2][940/3239]	Time 0.527 (0.785)	Data Time 0.001 (0.021)	Loss 3.9968 (4.1124)	Entropy 1.90039 (1.90135)	Top-1 acc 31.250 (28.736)	Top-5 acc 53.516 (52.042)	lr 0.02499
Train [2][950/3239]	Time 0.345 (0.784)	Data Time 0.001 (0.021)	Loss 4.1047 (4.1126)	Entropy 1.90037 (1.90134)	Top-1 acc 27.734 (28.726)	Top-5 acc 51.172 (52.039)	lr 0.02499
Train [2][960/3239]	Time 0.474 (0.784)	Data Time 0.001 (0.021)	Loss 4.1834 (4.1127)	Entropy 1.90034 (1.90133)	Top-1 acc 31.250 (28.728)	Top-5 acc 48.438 (52.026)	lr 0.02499
Train [2][970/3239]	Time 0.462 (0.783)	Data Time 0.001 (0.021)	Loss 4.2504 (4.1132)	Entropy 1.90030 (1.90132)	Top-1 acc 25.000 (28.707)	Top-5 acc 51.172 (52.012)	lr 0.02499
Train [2][980/3239]	Time 0.435 (0.782)	Data Time 0.001 (0.021)	Loss 4.2116 (4.1137)	Entropy 1.90029 (1.90131)	Top-1 acc 27.734 (28.686)	Top-5 acc 49.609 (52.001)	lr 0.02499
Train [2][990/3239]	Time 0.532 (0.782)	Data Time 0.001 (0.021)	Loss 4.2060 (4.1133)	Entropy 1.90026 (1.90130)	Top-1 acc 25.781 (28.694)	Top-5 acc 50.391 (52.018)	lr 0.02499
Train [2][1000/3239]	Time 0.518 (0.781)	Data Time 0.001 (0.021)	Loss 4.0246 (4.1135)	Entropy 1.90022 (1.90129)	Top-1 acc 27.734 (28.690)	Top-5 acc 55.469 (52.010)	lr 0.02499
Train [2][1010/3239]	Time 0.300 (0.780)	Data Time 0.001 (0.020)	Loss 4.3344 (4.1131)	Entropy 1.90021 (1.90128)	Top-1 acc 25.781 (28.696)	Top-5 acc 42.969 (52.013)	lr 0.02499
Train [2][1020/3239]	Time 0.513 (0.780)	Data Time 0.001 (0.020)	Loss 4.1574 (4.1135)	Entropy 1.90017 (1.90127)	Top-1 acc 25.000 (28.684)	Top-5 acc 48.828 (51.992)	lr 0.02499
Train [2][1030/3239]	Time 0.343 (0.779)	Data Time 0.001 (0.020)	Loss 4.1453 (4.1136)	Entropy 1.90015 (1.90126)	Top-1 acc 26.953 (28.680)	Top-5 acc 49.219 (51.990)	lr 0.02499
Train [2][1040/3239]	Time 0.567 (0.779)	Data Time 0.001 (0.020)	Loss 4.1576 (4.1138)	Entropy 1.90011 (1.90125)	Top-1 acc 30.859 (28.674)	Top-5 acc 52.734 (51.988)	lr 0.02499
Train [2][1050/3239]	Time 0.499 (0.779)	Data Time 0.002 (0.020)	Loss 4.1856 (4.1137)	Entropy 1.90008 (1.90124)	Top-1 acc 26.562 (28.677)	Top-5 acc 53.516 (51.998)	lr 0.02499
Train [2][1060/3239]	Time 0.572 (0.779)	Data Time 0.001 (0.020)	Loss 4.0860 (4.1135)	Entropy 1.90007 (1.90123)	Top-1 acc 33.203 (28.686)	Top-5 acc 52.344 (52.004)	lr 0.02499
Train [2][1070/3239]	Time 0.478 (0.778)	Data Time 0.001 (0.020)	Loss 4.1455 (4.1135)	Entropy 1.90003 (1.90121)	Top-1 acc 27.344 (28.692)	Top-5 acc 51.172 (52.002)	lr 0.02499
Train [2][1080/3239]	Time 0.557 (0.778)	Data Time 0.001 (0.020)	Loss 4.3353 (4.1137)	Entropy 1.90000 (1.90120)	Top-1 acc 25.000 (28.690)	Top-5 acc 46.875 (51.996)	lr 0.02499
Train [2][1090/3239]	Time 0.392 (0.778)	Data Time 0.001 (0.019)	Loss 4.2147 (4.1136)	Entropy 1.89997 (1.90119)	Top-1 acc 25.781 (28.693)	Top-5 acc 46.875 (52.003)	lr 0.02499
Train [2][1100/3239]	Time 0.406 (0.777)	Data Time 0.001 (0.019)	Loss 4.1218 (4.1138)	Entropy 1.89993 (1.90118)	Top-1 acc 28.516 (28.693)	Top-5 acc 50.000 (51.998)	lr 0.02499
Train [2][1110/3239]	Time 0.696 (0.777)	Data Time 0.001 (0.019)	Loss 4.0731 (4.1138)	Entropy 1.89989 (1.90117)	Top-1 acc 27.734 (28.698)	Top-5 acc 52.344 (51.996)	lr 0.02499
Train [2][1120/3239]	Time 0.458 (0.776)	Data Time 0.003 (0.019)	Loss 3.8357 (4.1137)	Entropy 1.89985 (1.90116)	Top-1 acc 35.938 (28.697)	Top-5 acc 59.375 (52.001)	lr 0.02499
Train [2][1130/3239]	Time 0.506 (0.776)	Data Time 0.001 (0.019)	Loss 4.1600 (4.1136)	Entropy 1.89981 (1.90115)	Top-1 acc 27.344 (28.694)	Top-5 acc 54.688 (52.011)	lr 0.02499
Train [2][1140/3239]	Time 0.552 (0.775)	Data Time 0.001 (0.019)	Loss 3.8735 (4.1137)	Entropy 1.89979 (1.90113)	Top-1 acc 30.078 (28.690)	Top-5 acc 58.203 (52.006)	lr 0.02499
Train [2][1150/3239]	Time 0.544 (0.775)	Data Time 0.001 (0.019)	Loss 4.0564 (4.1136)	Entropy 1.89975 (1.90112)	Top-1 acc 29.297 (28.696)	Top-5 acc 51.953 (52.010)	lr 0.02499
Train [2][1160/3239]	Time 0.442 (0.774)	Data Time 0.001 (0.019)	Loss 4.0934 (4.1140)	Entropy 1.89972 (1.90111)	Top-1 acc 28.516 (28.698)	Top-5 acc 50.781 (51.995)	lr 0.02499
Train [2][1170/3239]	Time 0.525 (0.774)	Data Time 0.001 (0.018)	Loss 4.0682 (4.1137)	Entropy 1.89968 (1.90110)	Top-1 acc 26.562 (28.704)	Top-5 acc 53.906 (51.995)	lr 0.02499
Train [2][1180/3239]	Time 0.487 (0.774)	Data Time 0.001 (0.018)	Loss 3.9856 (4.1136)	Entropy 1.89964 (1.90109)	Top-1 acc 32.422 (28.709)	Top-5 acc 56.250 (51.993)	lr 0.02499
Train [2][1190/3239]	Time 0.570 (0.773)	Data Time 0.001 (0.018)	Loss 3.9884 (4.1136)	Entropy 1.89959 (1.90107)	Top-1 acc 30.859 (28.707)	Top-5 acc 53.125 (51.992)	lr 0.02499
Train [2][1200/3239]	Time 0.494 (0.773)	Data Time 0.001 (0.018)	Loss 4.2591 (4.1136)	Entropy 1.89955 (1.90106)	Top-1 acc 20.312 (28.708)	Top-5 acc 48.047 (51.999)	lr 0.02499
Train [2][1210/3239]	Time 0.533 (0.773)	Data Time 0.001 (0.018)	Loss 4.0741 (4.1130)	Entropy 1.89952 (1.90105)	Top-1 acc 30.469 (28.722)	Top-5 acc 55.469 (52.022)	lr 0.02499
Train [2][1220/3239]	Time 0.319 (0.772)	Data Time 0.001 (0.018)	Loss 4.1662 (4.1124)	Entropy 1.89950 (1.90104)	Top-1 acc 29.297 (28.731)	Top-5 acc 49.219 (52.031)	lr 0.02499
Train [2][1230/3239]	Time 0.542 (0.772)	Data Time 0.001 (0.018)	Loss 3.8636 (4.1122)	Entropy 1.89948 (1.90102)	Top-1 acc 31.641 (28.737)	Top-5 acc 56.641 (52.039)	lr 0.02499
Train [2][1240/3239]	Time 0.507 (0.772)	Data Time 0.001 (0.018)	Loss 4.1776 (4.1119)	Entropy 1.89942 (1.90101)	Top-1 acc 25.000 (28.733)	Top-5 acc 51.172 (52.043)	lr 0.02499
Train [2][1250/3239]	Time 0.560 (0.772)	Data Time 0.001 (0.018)	Loss 4.0347 (4.1118)	Entropy 1.89937 (1.90100)	Top-1 acc 26.953 (28.728)	Top-5 acc 57.031 (52.051)	lr 0.02499
Train [2][1260/3239]	Time 0.464 (0.771)	Data Time 0.001 (0.017)	Loss 4.2301 (4.1117)	Entropy 1.89933 (1.90099)	Top-1 acc 28.516 (28.726)	Top-5 acc 53.125 (52.046)	lr 0.02499
Train [2][1270/3239]	Time 0.382 (0.771)	Data Time 0.001 (0.017)	Loss 4.0235 (4.1115)	Entropy 1.89931 (1.90097)	Top-1 acc 28.516 (28.730)	Top-5 acc 52.344 (52.048)	lr 0.02499
Train [2][1280/3239]	Time 0.376 (0.771)	Data Time 0.001 (0.017)	Loss 4.2826 (4.1121)	Entropy 1.89925 (1.90096)	Top-1 acc 24.609 (28.717)	Top-5 acc 45.703 (52.026)	lr 0.02499
Train [2][1290/3239]	Time 0.373 (0.771)	Data Time 0.001 (0.017)	Loss 4.0730 (4.1123)	Entropy 1.89922 (1.90095)	Top-1 acc 29.297 (28.710)	Top-5 acc 56.250 (52.028)	lr 0.02499
Train [2][1300/3239]	Time 0.541 (0.770)	Data Time 0.001 (0.017)	Loss 3.9298 (4.1117)	Entropy 1.89915 (1.90093)	Top-1 acc 27.734 (28.719)	Top-5 acc 56.250 (52.043)	lr 0.02499
Train [2][1310/3239]	Time 0.439 (0.770)	Data Time 0.001 (0.017)	Loss 3.9058 (4.1117)	Entropy 1.89910 (1.90092)	Top-1 acc 31.641 (28.711)	Top-5 acc 55.469 (52.040)	lr 0.02499
Train [2][1320/3239]	Time 0.319 (0.781)	Data Time 0.002 (0.017)	Loss 4.1081 (4.1118)	Entropy 1.89907 (1.90091)	Top-1 acc 28.516 (28.708)	Top-5 acc 55.078 (52.028)	lr 0.02499
Train [2][1330/3239]	Time 0.495 (0.780)	Data Time 0.001 (0.017)	Loss 4.1940 (4.1117)	Entropy 1.89903 (1.90089)	Top-1 acc 26.953 (28.697)	Top-5 acc 50.000 (52.021)	lr 0.02499
Train [2][1340/3239]	Time 0.470 (0.780)	Data Time 0.001 (0.017)	Loss 4.3298 (4.1119)	Entropy 1.89898 (1.90088)	Top-1 acc 25.391 (28.697)	Top-5 acc 42.188 (52.020)	lr 0.02499
Train [2][1350/3239]	Time 0.348 (0.780)	Data Time 0.001 (0.017)	Loss 4.2801 (4.1119)	Entropy 1.89896 (1.90086)	Top-1 acc 26.562 (28.700)	Top-5 acc 48.438 (52.025)	lr 0.02499
Train [2][1360/3239]	Time 0.515 (0.779)	Data Time 0.001 (0.017)	Loss 3.9589 (4.1118)	Entropy 1.89894 (1.90085)	Top-1 acc 30.078 (28.706)	Top-5 acc 50.391 (52.026)	lr 0.02499
Train [2][1370/3239]	Time 0.444 (0.779)	Data Time 0.001 (0.017)	Loss 4.1536 (4.1114)	Entropy 1.89888 (1.90083)	Top-1 acc 30.078 (28.715)	Top-5 acc 50.781 (52.032)	lr 0.02499
Train [2][1380/3239]	Time 0.476 (0.779)	Data Time 0.001 (0.017)	Loss 3.9605 (4.1111)	Entropy 1.89886 (1.90082)	Top-1 acc 34.766 (28.722)	Top-5 acc 51.953 (52.039)	lr 0.02499
Train [2][1390/3239]	Time 0.517 (0.779)	Data Time 0.001 (0.017)	Loss 4.1044 (4.1114)	Entropy 1.89883 (1.90081)	Top-1 acc 28.516 (28.715)	Top-5 acc 51.172 (52.032)	lr 0.02499
Train [2][1400/3239]	Time 0.553 (0.778)	Data Time 0.001 (0.016)	Loss 3.9283 (4.1112)	Entropy 1.89881 (1.90079)	Top-1 acc 36.328 (28.716)	Top-5 acc 52.734 (52.040)	lr 0.02499
Train [2][1410/3239]	Time 0.355 (0.778)	Data Time 0.001 (0.016)	Loss 4.2020 (4.1113)	Entropy 1.89876 (1.90078)	Top-1 acc 27.344 (28.724)	Top-5 acc 53.125 (52.039)	lr 0.02499
Train [2][1420/3239]	Time 0.573 (0.778)	Data Time 0.001 (0.016)	Loss 4.0290 (4.1113)	Entropy 1.89872 (1.90076)	Top-1 acc 31.250 (28.723)	Top-5 acc 55.859 (52.045)	lr 0.02499
Train [2][1430/3239]	Time 0.486 (0.778)	Data Time 0.001 (0.016)	Loss 4.1244 (4.1114)	Entropy 1.89867 (1.90075)	Top-1 acc 30.469 (28.719)	Top-5 acc 52.734 (52.042)	lr 0.02499
Train [2][1440/3239]	Time 0.495 (0.778)	Data Time 0.001 (0.016)	Loss 3.8990 (4.1111)	Entropy 1.89863 (1.90073)	Top-1 acc 35.156 (28.720)	Top-5 acc 58.594 (52.046)	lr 0.02499
Train [2][1450/3239]	Time 0.490 (0.777)	Data Time 0.001 (0.016)	Loss 4.0312 (4.1111)	Entropy 1.89861 (1.90072)	Top-1 acc 25.000 (28.714)	Top-5 acc 53.516 (52.041)	lr 0.02499
Train [2][1460/3239]	Time 0.409 (0.777)	Data Time 0.001 (0.016)	Loss 4.2577 (4.1107)	Entropy 1.89856 (1.90071)	Top-1 acc 23.438 (28.715)	Top-5 acc 47.656 (52.046)	lr 0.02499
Train [2][1470/3239]	Time 0.512 (0.777)	Data Time 0.001 (0.016)	Loss 3.9322 (4.1109)	Entropy 1.89851 (1.90069)	Top-1 acc 31.250 (28.715)	Top-5 acc 55.469 (52.040)	lr 0.02499
Train [2][1480/3239]	Time 0.393 (0.776)	Data Time 0.003 (0.016)	Loss 4.0017 (4.1112)	Entropy 1.89847 (1.90068)	Top-1 acc 30.078 (28.709)	Top-5 acc 57.812 (52.036)	lr 0.02499
Train [2][1490/3239]	Time 0.560 (0.776)	Data Time 0.002 (0.016)	Loss 4.0777 (4.1111)	Entropy 1.89843 (1.90066)	Top-1 acc 32.031 (28.712)	Top-5 acc 50.781 (52.040)	lr 0.02499
Train [2][1500/3239]	Time 0.523 (0.776)	Data Time 0.001 (0.016)	Loss 4.1754 (4.1109)	Entropy 1.89841 (1.90065)	Top-1 acc 27.734 (28.719)	Top-5 acc 52.344 (52.044)	lr 0.02499
Train [2][1510/3239]	Time 0.486 (0.776)	Data Time 0.001 (0.016)	Loss 3.9508 (4.1111)	Entropy 1.89836 (1.90063)	Top-1 acc 31.641 (28.713)	Top-5 acc 54.688 (52.042)	lr 0.02499
Train [2][1520/3239]	Time 0.483 (0.775)	Data Time 0.002 (0.016)	Loss 4.0663 (4.1112)	Entropy 1.89831 (1.90062)	Top-1 acc 32.422 (28.713)	Top-5 acc 55.078 (52.037)	lr 0.02499
Train [2][1530/3239]	Time 0.461 (0.775)	Data Time 0.001 (0.016)	Loss 4.1062 (4.1117)	Entropy 1.89827 (1.90060)	Top-1 acc 28.125 (28.705)	Top-5 acc 50.781 (52.028)	lr 0.02499
Train [2][1540/3239]	Time 0.385 (0.775)	Data Time 0.001 (0.015)	Loss 3.9283 (4.1114)	Entropy 1.89824 (1.90059)	Top-1 acc 36.719 (28.712)	Top-5 acc 58.984 (52.040)	lr 0.02499
Train [2][1550/3239]	Time 0.381 (0.775)	Data Time 0.001 (0.015)	Loss 4.0458 (4.1115)	Entropy 1.89818 (1.90057)	Top-1 acc 30.469 (28.713)	Top-5 acc 56.641 (52.043)	lr 0.02499
Train [2][1560/3239]	Time 0.486 (0.775)	Data Time 0.001 (0.015)	Loss 4.0151 (4.1120)	Entropy 1.89814 (1.90056)	Top-1 acc 30.859 (28.706)	Top-5 acc 51.562 (52.036)	lr 0.02499
Train [2][1570/3239]	Time 0.521 (0.775)	Data Time 0.001 (0.015)	Loss 3.8568 (4.1115)	Entropy 1.89810 (1.90054)	Top-1 acc 34.766 (28.718)	Top-5 acc 56.641 (52.047)	lr 0.02499
Train [2][1580/3239]	Time 0.530 (0.774)	Data Time 0.001 (0.015)	Loss 4.1257 (4.1114)	Entropy 1.89808 (1.90052)	Top-1 acc 30.859 (28.717)	Top-5 acc 51.953 (52.046)	lr 0.02499
Train [2][1590/3239]	Time 0.519 (0.774)	Data Time 0.001 (0.015)	Loss 4.0543 (4.1113)	Entropy 1.89803 (1.90051)	Top-1 acc 29.297 (28.718)	Top-5 acc 53.516 (52.048)	lr 0.02499
Train [2][1600/3239]	Time 0.500 (0.774)	Data Time 0.001 (0.015)	Loss 4.0250 (4.1112)	Entropy 1.89795 (1.90049)	Top-1 acc 30.859 (28.720)	Top-5 acc 55.859 (52.050)	lr 0.02499
Train [2][1610/3239]	Time 0.535 (0.773)	Data Time 0.001 (0.015)	Loss 4.0329 (4.1110)	Entropy 1.89791 (1.90048)	Top-1 acc 26.953 (28.725)	Top-5 acc 55.859 (52.064)	lr 0.02499
Train [2][1620/3239]	Time 0.381 (0.773)	Data Time 0.001 (0.015)	Loss 3.9497 (4.1107)	Entropy 1.89788 (1.90046)	Top-1 acc 30.078 (28.731)	Top-5 acc 54.688 (52.070)	lr 0.02499
Train [2][1630/3239]	Time 0.522 (0.773)	Data Time 0.001 (0.015)	Loss 4.1833 (4.1109)	Entropy 1.89782 (1.90045)	Top-1 acc 26.562 (28.727)	Top-5 acc 48.828 (52.061)	lr 0.02499
Train [2][1640/3239]	Time 0.472 (0.773)	Data Time 0.001 (0.015)	Loss 4.0707 (4.1106)	Entropy 1.89780 (1.90043)	Top-1 acc 28.125 (28.731)	Top-5 acc 51.953 (52.069)	lr 0.02499
Train [2][1650/3239]	Time 0.517 (0.772)	Data Time 0.001 (0.015)	Loss 4.1309 (4.1101)	Entropy 1.89775 (1.90041)	Top-1 acc 26.953 (28.739)	Top-5 acc 55.469 (52.079)	lr 0.02499
Train [2][1660/3239]	Time 0.344 (0.772)	Data Time 0.001 (0.015)	Loss 4.2880 (4.1100)	Entropy 1.89771 (1.90040)	Top-1 acc 25.000 (28.743)	Top-5 acc 50.000 (52.083)	lr 0.02499
Train [2][1670/3239]	Time 0.450 (0.772)	Data Time 0.001 (0.015)	Loss 4.1314 (4.1101)	Entropy 1.89767 (1.90038)	Top-1 acc 28.906 (28.743)	Top-5 acc 52.734 (52.081)	lr 0.02499
Train [2][1680/3239]	Time 0.455 (0.772)	Data Time 0.001 (0.015)	Loss 4.2394 (4.1102)	Entropy 1.89761 (1.90036)	Top-1 acc 21.875 (28.743)	Top-5 acc 52.734 (52.086)	lr 0.02499
Train [2][1690/3239]	Time 0.451 (0.772)	Data Time 0.001 (0.015)	Loss 4.0393 (4.1100)	Entropy 1.89757 (1.90035)	Top-1 acc 34.375 (28.741)	Top-5 acc 53.125 (52.094)	lr 0.02499
Train [2][1700/3239]	Time 0.541 (0.772)	Data Time 0.001 (0.015)	Loss 3.9761 (4.1100)	Entropy 1.89753 (1.90033)	Top-1 acc 32.031 (28.742)	Top-5 acc 53.125 (52.094)	lr 0.02499
Train [2][1710/3239]	Time 0.486 (0.772)	Data Time 0.001 (0.015)	Loss 3.9583 (4.1097)	Entropy 1.89745 (1.90032)	Top-1 acc 29.688 (28.746)	Top-5 acc 53.906 (52.099)	lr 0.02499
Train [2][1720/3239]	Time 0.354 (0.771)	Data Time 0.001 (0.015)	Loss 4.2897 (4.1098)	Entropy 1.89742 (1.90030)	Top-1 acc 25.000 (28.743)	Top-5 acc 45.703 (52.097)	lr 0.02499
Train [2][1730/3239]	Time 0.641 (0.771)	Data Time 0.001 (0.015)	Loss 4.3120 (4.1096)	Entropy 1.89740 (1.90028)	Top-1 acc 26.562 (28.744)	Top-5 acc 48.047 (52.100)	lr 0.02499
Train [2][1740/3239]	Time 0.550 (0.771)	Data Time 0.001 (0.014)	Loss 4.2307 (4.1097)	Entropy 1.89734 (1.90027)	Top-1 acc 27.734 (28.740)	Top-5 acc 46.484 (52.093)	lr 0.02499
Train [2][1750/3239]	Time 0.464 (0.771)	Data Time 0.001 (0.014)	Loss 4.2545 (4.1100)	Entropy 1.89730 (1.90025)	Top-1 acc 29.297 (28.735)	Top-5 acc 48.047 (52.087)	lr 0.02499
Train [2][1760/3239]	Time 0.636 (0.771)	Data Time 0.001 (0.014)	Loss 4.1264 (4.1097)	Entropy 1.89724 (1.90023)	Top-1 acc 28.125 (28.737)	Top-5 acc 52.344 (52.092)	lr 0.02499
Train [2][1770/3239]	Time 0.330 (0.771)	Data Time 0.001 (0.014)	Loss 4.1900 (4.1095)	Entropy 1.89719 (1.90021)	Top-1 acc 29.297 (28.748)	Top-5 acc 50.000 (52.093)	lr 0.02499
Train [2][1780/3239]	Time 0.487 (0.771)	Data Time 0.001 (0.014)	Loss 4.1339 (4.1098)	Entropy 1.89714 (1.90020)	Top-1 acc 29.297 (28.740)	Top-5 acc 50.000 (52.075)	lr 0.02499
Train [2][1790/3239]	Time 0.400 (0.770)	Data Time 0.001 (0.014)	Loss 4.1347 (4.1099)	Entropy 1.89712 (1.90018)	Top-1 acc 28.906 (28.739)	Top-5 acc 50.391 (52.070)	lr 0.02499
Train [2][1800/3239]	Time 0.373 (0.770)	Data Time 0.001 (0.014)	Loss 4.2183 (4.1101)	Entropy 1.89706 (1.90016)	Top-1 acc 28.125 (28.734)	Top-5 acc 53.125 (52.068)	lr 0.02499
Train [2][1810/3239]	Time 0.372 (0.770)	Data Time 0.001 (0.014)	Loss 4.1815 (4.1103)	Entropy 1.89702 (1.90015)	Top-1 acc 24.609 (28.724)	Top-5 acc 50.781 (52.061)	lr 0.02499
Train [2][1820/3239]	Time 0.500 (0.770)	Data Time 0.001 (0.014)	Loss 4.2100 (4.1106)	Entropy 1.89697 (1.90013)	Top-1 acc 29.688 (28.723)	Top-5 acc 49.219 (52.052)	lr 0.02499
Train [2][1830/3239]	Time 0.386 (0.769)	Data Time 0.001 (0.014)	Loss 4.1084 (4.1109)	Entropy 1.89693 (1.90011)	Top-1 acc 28.516 (28.715)	Top-5 acc 49.219 (52.043)	lr 0.02499
Train [2][1840/3239]	Time 0.561 (0.769)	Data Time 0.001 (0.014)	Loss 3.9558 (4.1110)	Entropy 1.89689 (1.90009)	Top-1 acc 32.812 (28.716)	Top-5 acc 55.078 (52.042)	lr 0.02499
Train [2][1850/3239]	Time 0.584 (0.769)	Data Time 0.001 (0.014)	Loss 4.1357 (4.1106)	Entropy 1.89685 (1.90008)	Top-1 acc 31.641 (28.727)	Top-5 acc 52.734 (52.054)	lr 0.02499
Train [2][1860/3239]	Time 0.481 (0.769)	Data Time 0.001 (0.014)	Loss 4.0681 (4.1106)	Entropy 1.89678 (1.90006)	Top-1 acc 26.562 (28.723)	Top-5 acc 51.953 (52.057)	lr 0.02499
Train [2][1870/3239]	Time 0.423 (0.769)	Data Time 0.001 (0.014)	Loss 4.0135 (4.1104)	Entropy 1.89675 (1.90004)	Top-1 acc 33.594 (28.727)	Top-5 acc 56.250 (52.066)	lr 0.02499
Train [2][1880/3239]	Time 0.525 (0.769)	Data Time 0.002 (0.014)	Loss 4.2451 (4.1104)	Entropy 1.89672 (1.90002)	Top-1 acc 28.906 (28.729)	Top-5 acc 48.047 (52.065)	lr 0.02499
Train [2][1890/3239]	Time 0.416 (0.769)	Data Time 0.001 (0.014)	Loss 4.2328 (4.1106)	Entropy 1.89670 (1.90001)	Top-1 acc 25.000 (28.726)	Top-5 acc 48.828 (52.063)	lr 0.02499
Train [2][1900/3239]	Time 0.529 (0.769)	Data Time 0.001 (0.014)	Loss 4.1145 (4.1108)	Entropy 1.89664 (1.89999)	Top-1 acc 21.484 (28.718)	Top-5 acc 49.609 (52.052)	lr 0.02499
Train [2][1910/3239]	Time 0.415 (0.769)	Data Time 0.001 (0.014)	Loss 4.1531 (4.1109)	Entropy 1.89658 (1.89997)	Top-1 acc 30.469 (28.724)	Top-5 acc 53.125 (52.055)	lr 0.02499
Train [2][1920/3239]	Time 0.473 (0.769)	Data Time 0.001 (0.014)	Loss 4.0308 (4.1107)	Entropy 1.89652 (1.89995)	Top-1 acc 27.344 (28.723)	Top-5 acc 51.172 (52.058)	lr 0.02499
Train [2][1930/3239]	Time 0.421 (0.768)	Data Time 0.001 (0.014)	Loss 4.1325 (4.1107)	Entropy 1.89645 (1.89994)	Top-1 acc 29.297 (28.725)	Top-5 acc 55.469 (52.060)	lr 0.02499
Train [2][1940/3239]	Time 0.517 (0.768)	Data Time 0.001 (0.014)	Loss 4.2954 (4.1109)	Entropy 1.89641 (1.89992)	Top-1 acc 24.219 (28.729)	Top-5 acc 47.266 (52.059)	lr 0.02499
Train [2][1950/3239]	Time 0.526 (0.768)	Data Time 0.001 (0.014)	Loss 4.0980 (4.1106)	Entropy 1.89634 (1.89990)	Top-1 acc 30.469 (28.738)	Top-5 acc 55.078 (52.072)	lr 0.02499
Train [2][1960/3239]	Time 0.449 (0.768)	Data Time 0.001 (0.014)	Loss 4.0177 (4.1106)	Entropy 1.89631 (1.89988)	Top-1 acc 32.812 (28.743)	Top-5 acc 58.203 (52.065)	lr 0.02499
Train [2][1970/3239]	Time 0.631 (0.776)	Data Time 0.005 (0.014)	Loss 4.0082 (4.1106)	Entropy 1.89623 (1.89986)	Top-1 acc 32.812 (28.747)	Top-5 acc 53.125 (52.065)	lr 0.02499
Train [2][1980/3239]	Time 0.558 (0.776)	Data Time 0.002 (0.013)	Loss 3.9749 (4.1102)	Entropy 1.89617 (1.89984)	Top-1 acc 32.422 (28.751)	Top-5 acc 56.641 (52.073)	lr 0.02499
Train [2][1990/3239]	Time 0.491 (0.775)	Data Time 0.001 (0.013)	Loss 4.2331 (4.1102)	Entropy 1.89612 (1.89983)	Top-1 acc 26.172 (28.747)	Top-5 acc 47.656 (52.074)	lr 0.02499
Train [2][2000/3239]	Time 0.554 (0.775)	Data Time 0.001 (0.013)	Loss 4.2554 (4.1101)	Entropy 1.89607 (1.89981)	Top-1 acc 24.219 (28.751)	Top-5 acc 52.344 (52.081)	lr 0.02499
Train [2][2010/3239]	Time 0.486 (0.775)	Data Time 0.001 (0.013)	Loss 4.0425 (4.1100)	Entropy 1.89602 (1.89979)	Top-1 acc 28.125 (28.748)	Top-5 acc 53.516 (52.082)	lr 0.02499
Train [2][2020/3239]	Time 0.695 (0.775)	Data Time 0.001 (0.013)	Loss 4.0708 (4.1099)	Entropy 1.89599 (1.89977)	Top-1 acc 29.688 (28.754)	Top-5 acc 53.516 (52.088)	lr 0.02499
Train [2][2030/3239]	Time 0.514 (0.775)	Data Time 0.001 (0.013)	Loss 4.2110 (4.1098)	Entropy 1.89591 (1.89975)	Top-1 acc 26.172 (28.751)	Top-5 acc 52.344 (52.086)	lr 0.02499
Train [2][2040/3239]	Time 0.499 (0.775)	Data Time 0.001 (0.013)	Loss 4.1967 (4.1098)	Entropy 1.89587 (1.89973)	Top-1 acc 24.609 (28.748)	Top-5 acc 50.781 (52.084)	lr 0.02499
Train [2][2050/3239]	Time 0.372 (0.775)	Data Time 0.003 (0.013)	Loss 4.0693 (4.1098)	Entropy 1.89585 (1.89971)	Top-1 acc 30.859 (28.751)	Top-5 acc 50.000 (52.082)	lr 0.02499
Train [2][2060/3239]	Time 0.575 (0.775)	Data Time 0.001 (0.013)	Loss 3.9924 (4.1096)	Entropy 1.89583 (1.89969)	Top-1 acc 29.297 (28.755)	Top-5 acc 54.297 (52.090)	lr 0.02499
Train [2][2070/3239]	Time 0.478 (0.774)	Data Time 0.001 (0.013)	Loss 3.9172 (4.1097)	Entropy 1.89581 (1.89968)	Top-1 acc 34.766 (28.753)	Top-5 acc 58.203 (52.089)	lr 0.02499
Train [2][2080/3239]	Time 0.510 (0.774)	Data Time 0.001 (0.013)	Loss 4.2447 (4.1095)	Entropy 1.89573 (1.89966)	Top-1 acc 26.172 (28.759)	Top-5 acc 48.047 (52.095)	lr 0.02499
Train [2][2090/3239]	Time 0.422 (0.774)	Data Time 0.001 (0.013)	Loss 4.2182 (4.1094)	Entropy 1.89566 (1.89964)	Top-1 acc 25.391 (28.761)	Top-5 acc 49.219 (52.095)	lr 0.02499
Train [2][2100/3239]	Time 0.461 (0.774)	Data Time 0.001 (0.013)	Loss 4.2014 (4.1092)	Entropy 1.89563 (1.89962)	Top-1 acc 22.656 (28.765)	Top-5 acc 53.906 (52.098)	lr 0.02499
Train [2][2110/3239]	Time 0.558 (0.774)	Data Time 0.001 (0.013)	Loss 4.0068 (4.1092)	Entropy 1.89558 (1.89960)	Top-1 acc 28.906 (28.766)	Top-5 acc 51.953 (52.099)	lr 0.02499
Train [2][2120/3239]	Time 0.495 (0.773)	Data Time 0.001 (0.013)	Loss 3.9611 (4.1091)	Entropy 1.89552 (1.89958)	Top-1 acc 30.078 (28.766)	Top-5 acc 58.203 (52.103)	lr 0.02499
Train [2][2130/3239]	Time 0.551 (0.773)	Data Time 0.002 (0.013)	Loss 4.0939 (4.1088)	Entropy 1.89546 (1.89956)	Top-1 acc 30.078 (28.773)	Top-5 acc 51.562 (52.110)	lr 0.02499
Train [2][2140/3239]	Time 0.532 (0.773)	Data Time 0.001 (0.013)	Loss 4.0417 (4.1088)	Entropy 1.89540 (1.89954)	Top-1 acc 28.516 (28.777)	Top-5 acc 53.906 (52.111)	lr 0.02499
Train [2][2150/3239]	Time 0.433 (0.773)	Data Time 0.001 (0.013)	Loss 4.1006 (4.1084)	Entropy 1.89534 (1.89952)	Top-1 acc 30.078 (28.783)	Top-5 acc 52.734 (52.119)	lr 0.02499
Train [2][2160/3239]	Time 0.429 (0.773)	Data Time 0.001 (0.013)	Loss 4.2149 (4.1084)	Entropy 1.89528 (1.89950)	Top-1 acc 23.828 (28.785)	Top-5 acc 49.219 (52.120)	lr 0.02499
Train [2][2170/3239]	Time 0.524 (0.773)	Data Time 0.001 (0.013)	Loss 4.1684 (4.1082)	Entropy 1.89518 (1.89948)	Top-1 acc 29.688 (28.789)	Top-5 acc 53.516 (52.127)	lr 0.02499
Train [2][2180/3239]	Time 0.416 (0.773)	Data Time 0.024 (0.013)	Loss 4.2312 (4.1085)	Entropy 1.89515 (1.89947)	Top-1 acc 30.078 (28.782)	Top-5 acc 50.000 (52.119)	lr 0.02499
Train [2][2190/3239]	Time 0.495 (0.773)	Data Time 0.001 (0.013)	Loss 3.9503 (4.1081)	Entropy 1.89504 (1.89945)	Top-1 acc 30.078 (28.794)	Top-5 acc 53.906 (52.126)	lr 0.02499
Train [2][2200/3239]	Time 0.474 (0.773)	Data Time 0.002 (0.013)	Loss 4.2341 (4.1081)	Entropy 1.89503 (1.89943)	Top-1 acc 25.000 (28.796)	Top-5 acc 46.094 (52.127)	lr 0.02499
Train [2][2210/3239]	Time 0.446 (0.773)	Data Time 0.001 (0.013)	Loss 4.0688 (4.1079)	Entropy 1.89499 (1.89941)	Top-1 acc 26.562 (28.797)	Top-5 acc 51.953 (52.123)	lr 0.02499
Train [2][2220/3239]	Time 0.434 (0.772)	Data Time 0.001 (0.013)	Loss 4.0229 (4.1081)	Entropy 1.89493 (1.89939)	Top-1 acc 30.469 (28.795)	Top-5 acc 54.688 (52.124)	lr 0.02499
Train [2][2230/3239]	Time 0.352 (0.772)	Data Time 0.001 (0.013)	Loss 4.1360 (4.1081)	Entropy 1.89486 (1.89937)	Top-1 acc 25.391 (28.796)	Top-5 acc 48.438 (52.123)	lr 0.02499
Train [2][2240/3239]	Time 0.527 (0.772)	Data Time 0.001 (0.013)	Loss 4.0369 (4.1079)	Entropy 1.89479 (1.89934)	Top-1 acc 28.516 (28.794)	Top-5 acc 52.734 (52.127)	lr 0.02499
Train [2][2250/3239]	Time 0.584 (0.772)	Data Time 0.001 (0.013)	Loss 4.1356 (4.1081)	Entropy 1.89471 (1.89932)	Top-1 acc 26.562 (28.788)	Top-5 acc 49.609 (52.123)	lr 0.02499
Train [2][2260/3239]	Time 0.344 (0.772)	Data Time 0.001 (0.013)	Loss 4.1659 (4.1079)	Entropy 1.89467 (1.89930)	Top-1 acc 29.688 (28.789)	Top-5 acc 51.562 (52.127)	lr 0.02499
Train [2][2270/3239]	Time 0.427 (0.772)	Data Time 0.001 (0.013)	Loss 4.0263 (4.1077)	Entropy 1.89464 (1.89928)	Top-1 acc 30.469 (28.793)	Top-5 acc 52.344 (52.134)	lr 0.02499
Train [2][2280/3239]	Time 0.569 (0.772)	Data Time 0.001 (0.013)	Loss 3.9919 (4.1076)	Entropy 1.89454 (1.89926)	Top-1 acc 30.078 (28.798)	Top-5 acc 55.859 (52.130)	lr 0.02499
Train [2][2290/3239]	Time 0.569 (0.772)	Data Time 0.001 (0.013)	Loss 3.9469 (4.1076)	Entropy 1.89446 (1.89924)	Top-1 acc 30.469 (28.796)	Top-5 acc 56.250 (52.131)	lr 0.02499
Train [2][2300/3239]	Time 0.525 (0.771)	Data Time 0.001 (0.012)	Loss 4.1693 (4.1074)	Entropy 1.89438 (1.89922)	Top-1 acc 27.344 (28.799)	Top-5 acc 51.562 (52.138)	lr 0.02499
Train [2][2310/3239]	Time 0.441 (0.771)	Data Time 0.001 (0.012)	Loss 4.1902 (4.1075)	Entropy 1.89433 (1.89920)	Top-1 acc 28.516 (28.802)	Top-5 acc 48.828 (52.135)	lr 0.02499
Train [2][2320/3239]	Time 0.398 (0.771)	Data Time 0.001 (0.012)	Loss 4.0248 (4.1075)	Entropy 1.89430 (1.89918)	Top-1 acc 30.078 (28.807)	Top-5 acc 50.391 (52.136)	lr 0.02499
Train [2][2330/3239]	Time 0.458 (0.771)	Data Time 0.001 (0.012)	Loss 3.8676 (4.1073)	Entropy 1.89424 (1.89916)	Top-1 acc 32.812 (28.813)	Top-5 acc 56.250 (52.142)	lr 0.02499
Train [2][2340/3239]	Time 0.398 (0.771)	Data Time 0.001 (0.012)	Loss 4.1855 (4.1074)	Entropy 1.89418 (1.89914)	Top-1 acc 25.781 (28.810)	Top-5 acc 51.953 (52.137)	lr 0.02499
Train [2][2350/3239]	Time 0.538 (0.771)	Data Time 0.002 (0.012)	Loss 4.0547 (4.1071)	Entropy 1.89414 (1.89912)	Top-1 acc 30.859 (28.819)	Top-5 acc 58.594 (52.143)	lr 0.02499
Train [2][2360/3239]	Time 0.454 (0.771)	Data Time 0.001 (0.012)	Loss 4.0196 (4.1072)	Entropy 1.89413 (1.89910)	Top-1 acc 28.125 (28.818)	Top-5 acc 55.078 (52.144)	lr 0.02499
Train [2][2370/3239]	Time 0.529 (0.771)	Data Time 0.002 (0.012)	Loss 4.1431 (4.1076)	Entropy 1.89402 (1.89907)	Top-1 acc 28.516 (28.814)	Top-5 acc 53.906 (52.141)	lr 0.02499
Train [2][2380/3239]	Time 0.530 (0.771)	Data Time 0.001 (0.012)	Loss 4.0069 (4.1075)	Entropy 1.89393 (1.89905)	Top-1 acc 35.547 (28.821)	Top-5 acc 53.125 (52.145)	lr 0.02499
Train [2][2390/3239]	Time 0.618 (0.771)	Data Time 0.001 (0.012)	Loss 4.2501 (4.1074)	Entropy 1.89388 (1.89903)	Top-1 acc 24.609 (28.828)	Top-5 acc 48.438 (52.148)	lr 0.02499
Train [2][2400/3239]	Time 0.404 (0.771)	Data Time 0.001 (0.012)	Loss 4.1073 (4.1070)	Entropy 1.89386 (1.89901)	Top-1 acc 30.078 (28.837)	Top-5 acc 53.516 (52.154)	lr 0.02499
Train [2][2410/3239]	Time 0.504 (0.771)	Data Time 0.001 (0.012)	Loss 4.1261 (4.1071)	Entropy 1.89379 (1.89899)	Top-1 acc 28.125 (28.836)	Top-5 acc 51.953 (52.153)	lr 0.02499
Train [2][2420/3239]	Time 0.468 (0.771)	Data Time 0.001 (0.012)	Loss 3.9551 (4.1067)	Entropy 1.89373 (1.89897)	Top-1 acc 32.422 (28.839)	Top-5 acc 57.422 (52.162)	lr 0.02499
Train [2][2430/3239]	Time 0.548 (0.771)	Data Time 0.001 (0.012)	Loss 3.9254 (4.1066)	Entropy 1.89365 (1.89894)	Top-1 acc 33.594 (28.844)	Top-5 acc 59.766 (52.166)	lr 0.02499
Train [2][2440/3239]	Time 0.465 (0.770)	Data Time 0.001 (0.012)	Loss 3.9483 (4.1064)	Entropy 1.89357 (1.89892)	Top-1 acc 30.078 (28.849)	Top-5 acc 57.812 (52.171)	lr 0.02499
Train [2][2450/3239]	Time 0.429 (0.770)	Data Time 0.001 (0.012)	Loss 4.0959 (4.1063)	Entropy 1.89350 (1.89890)	Top-1 acc 30.469 (28.855)	Top-5 acc 52.344 (52.173)	lr 0.02499
Train [2][2460/3239]	Time 0.514 (0.770)	Data Time 0.001 (0.012)	Loss 4.0863 (4.1061)	Entropy 1.89345 (1.89888)	Top-1 acc 31.250 (28.860)	Top-5 acc 52.344 (52.178)	lr 0.02499
Train [2][2470/3239]	Time 0.531 (0.770)	Data Time 0.002 (0.012)	Loss 4.2727 (4.1059)	Entropy 1.89339 (1.89886)	Top-1 acc 26.172 (28.866)	Top-5 acc 49.219 (52.186)	lr 0.02499
Train [2][2480/3239]	Time 0.478 (0.770)	Data Time 0.001 (0.012)	Loss 4.2750 (4.1057)	Entropy 1.89333 (1.89884)	Top-1 acc 29.297 (28.869)	Top-5 acc 49.219 (52.191)	lr 0.02499
Train [2][2490/3239]	Time 0.559 (0.770)	Data Time 0.001 (0.012)	Loss 3.9219 (4.1056)	Entropy 1.89332 (1.89881)	Top-1 acc 34.766 (28.878)	Top-5 acc 58.984 (52.190)	lr 0.02499
Train [2][2500/3239]	Time 0.614 (0.770)	Data Time 0.002 (0.012)	Loss 4.1110 (4.1055)	Entropy 1.89327 (1.89879)	Top-1 acc 29.297 (28.882)	Top-5 acc 51.172 (52.187)	lr 0.02499
Train [2][2510/3239]	Time 0.545 (0.770)	Data Time 0.001 (0.012)	Loss 3.9957 (4.1053)	Entropy 1.89321 (1.89877)	Top-1 acc 31.641 (28.883)	Top-5 acc 51.562 (52.188)	lr 0.02499
Train [2][2520/3239]	Time 0.547 (0.770)	Data Time 0.001 (0.012)	Loss 3.8948 (4.1053)	Entropy 1.89316 (1.89875)	Top-1 acc 33.594 (28.889)	Top-5 acc 57.812 (52.193)	lr 0.02499
Train [2][2530/3239]	Time 0.449 (0.770)	Data Time 0.001 (0.012)	Loss 4.1787 (4.1053)	Entropy 1.89310 (1.89872)	Top-1 acc 26.562 (28.890)	Top-5 acc 50.000 (52.193)	lr 0.02499
Train [2][2540/3239]	Time 0.552 (0.770)	Data Time 0.002 (0.012)	Loss 4.1677 (4.1054)	Entropy 1.89305 (1.89870)	Top-1 acc 30.078 (28.889)	Top-5 acc 51.562 (52.188)	lr 0.02499
Train [2][2550/3239]	Time 0.588 (0.769)	Data Time 0.001 (0.012)	Loss 4.1855 (4.1053)	Entropy 1.89297 (1.89868)	Top-1 acc 30.078 (28.893)	Top-5 acc 51.172 (52.192)	lr 0.02499
Train [2][2560/3239]	Time 0.652 (0.769)	Data Time 0.001 (0.012)	Loss 4.1429 (4.1053)	Entropy 1.89292 (1.89866)	Top-1 acc 30.469 (28.894)	Top-5 acc 55.078 (52.193)	lr 0.02499
Train [2][2570/3239]	Time 0.585 (0.769)	Data Time 0.001 (0.012)	Loss 3.7659 (4.1050)	Entropy 1.89288 (1.89864)	Top-1 acc 37.109 (28.904)	Top-5 acc 58.203 (52.201)	lr 0.02499
Train [2][2580/3239]	Time 0.404 (0.769)	Data Time 0.001 (0.012)	Loss 4.1634 (4.1052)	Entropy 1.89284 (1.89861)	Top-1 acc 29.297 (28.900)	Top-5 acc 48.828 (52.194)	lr 0.02499
Train [2][2590/3239]	Time 0.614 (0.769)	Data Time 0.001 (0.012)	Loss 4.1238 (4.1053)	Entropy 1.89282 (1.89859)	Top-1 acc 28.906 (28.901)	Top-5 acc 50.781 (52.194)	lr 0.02499
Train [2][2600/3239]	Time 0.523 (0.769)	Data Time 0.001 (0.012)	Loss 4.3138 (4.1056)	Entropy 1.89281 (1.89857)	Top-1 acc 27.734 (28.900)	Top-5 acc 48.047 (52.186)	lr 0.02499
Train [2][2610/3239]	Time 0.281 (0.769)	Data Time 0.001 (0.012)	Loss 4.0675 (4.1055)	Entropy 1.89276 (1.89855)	Top-1 acc 31.250 (28.902)	Top-5 acc 53.906 (52.189)	lr 0.02499
Train [2][2620/3239]	Time 0.538 (0.768)	Data Time 0.001 (0.012)	Loss 4.0102 (4.1054)	Entropy 1.89268 (1.89852)	Top-1 acc 30.469 (28.905)	Top-5 acc 53.906 (52.196)	lr 0.02499
Train [2][2630/3239]	Time 0.393 (0.774)	Data Time 0.002 (0.012)	Loss 4.0916 (4.1052)	Entropy 1.89258 (1.89850)	Top-1 acc 24.219 (28.904)	Top-5 acc 52.344 (52.198)	lr 0.02499
Train [2][2640/3239]	Time 0.539 (0.774)	Data Time 0.002 (0.012)	Loss 4.0240 (4.1050)	Entropy 1.89245 (1.89848)	Top-1 acc 30.469 (28.908)	Top-5 acc 54.297 (52.202)	lr 0.02499
Train [2][2650/3239]	Time 0.515 (0.774)	Data Time 0.001 (0.012)	Loss 3.9890 (4.1047)	Entropy 1.89237 (1.89846)	Top-1 acc 33.594 (28.909)	Top-5 acc 56.250 (52.209)	lr 0.02499
Train [2][2660/3239]	Time 0.352 (0.774)	Data Time 0.001 (0.012)	Loss 3.8773 (4.1044)	Entropy 1.89228 (1.89843)	Top-1 acc 32.422 (28.919)	Top-5 acc 55.859 (52.218)	lr 0.02499
Train [2][2670/3239]	Time 0.406 (0.774)	Data Time 0.001 (0.012)	Loss 3.8313 (4.1042)	Entropy 1.89223 (1.89841)	Top-1 acc 33.984 (28.924)	Top-5 acc 57.812 (52.225)	lr 0.02499
Train [2][2680/3239]	Time 0.392 (0.774)	Data Time 0.001 (0.012)	Loss 4.1392 (4.1045)	Entropy 1.89216 (1.89839)	Top-1 acc 28.516 (28.920)	Top-5 acc 53.125 (52.220)	lr 0.02499
Train [2][2690/3239]	Time 0.417 (0.774)	Data Time 0.001 (0.012)	Loss 4.0046 (4.1043)	Entropy 1.89210 (1.89836)	Top-1 acc 29.688 (28.923)	Top-5 acc 52.734 (52.223)	lr 0.02499
Train [2][2700/3239]	Time 0.611 (0.774)	Data Time 0.001 (0.012)	Loss 4.0233 (4.1040)	Entropy 1.89199 (1.89834)	Top-1 acc 31.250 (28.927)	Top-5 acc 56.250 (52.231)	lr 0.02499
Train [2][2710/3239]	Time 0.583 (0.774)	Data Time 0.001 (0.011)	Loss 3.8764 (4.1035)	Entropy 1.89188 (1.89832)	Top-1 acc 32.422 (28.935)	Top-5 acc 55.859 (52.243)	lr 0.02499
Train [2][2720/3239]	Time 0.481 (0.774)	Data Time 0.001 (0.011)	Loss 4.0074 (4.1034)	Entropy 1.89180 (1.89829)	Top-1 acc 29.297 (28.934)	Top-5 acc 57.812 (52.245)	lr 0.02499
Train [2][2730/3239]	Time 0.345 (0.774)	Data Time 0.002 (0.011)	Loss 3.9540 (4.1034)	Entropy 1.89174 (1.89827)	Top-1 acc 32.031 (28.935)	Top-5 acc 51.562 (52.244)	lr 0.02499
Train [2][2740/3239]	Time 0.502 (0.773)	Data Time 0.001 (0.011)	Loss 4.0425 (4.1036)	Entropy 1.89163 (1.89825)	Top-1 acc 30.078 (28.932)	Top-5 acc 54.297 (52.238)	lr 0.02499
Train [2][2750/3239]	Time 0.524 (0.773)	Data Time 0.001 (0.011)	Loss 4.1325 (4.1034)	Entropy 1.89155 (1.89822)	Top-1 acc 28.906 (28.937)	Top-5 acc 54.688 (52.247)	lr 0.02499
Train [2][2760/3239]	Time 0.356 (0.773)	Data Time 0.001 (0.011)	Loss 4.2419 (4.1035)	Entropy 1.89149 (1.89820)	Top-1 acc 25.781 (28.935)	Top-5 acc 46.875 (52.244)	lr 0.02499
Train [2][2770/3239]	Time 0.572 (0.773)	Data Time 0.001 (0.011)	Loss 3.9802 (4.1034)	Entropy 1.89146 (1.89817)	Top-1 acc 28.125 (28.939)	Top-5 acc 53.125 (52.244)	lr 0.02499
Train [2][2780/3239]	Time 0.504 (0.773)	Data Time 0.001 (0.011)	Loss 4.1797 (4.1033)	Entropy 1.89139 (1.89815)	Top-1 acc 26.562 (28.937)	Top-5 acc 51.562 (52.245)	lr 0.02499
Train [2][2790/3239]	Time 0.614 (0.773)	Data Time 0.001 (0.011)	Loss 4.1900 (4.1032)	Entropy 1.89130 (1.89812)	Top-1 acc 23.047 (28.940)	Top-5 acc 48.438 (52.245)	lr 0.02499
Train [2][2800/3239]	Time 0.494 (0.773)	Data Time 0.001 (0.011)	Loss 4.1073 (4.1033)	Entropy 1.89126 (1.89810)	Top-1 acc 31.250 (28.940)	Top-5 acc 51.562 (52.242)	lr 0.02499
Train [2][2810/3239]	Time 0.604 (0.773)	Data Time 0.001 (0.011)	Loss 4.0381 (4.1033)	Entropy 1.89119 (1.89808)	Top-1 acc 25.000 (28.939)	Top-5 acc 53.906 (52.243)	lr 0.02499
Train [2][2820/3239]	Time 0.553 (0.773)	Data Time 0.001 (0.011)	Loss 3.9848 (4.1031)	Entropy 1.89116 (1.89805)	Top-1 acc 28.516 (28.943)	Top-5 acc 56.641 (52.248)	lr 0.02499
Train [2][2830/3239]	Time 0.497 (0.773)	Data Time 0.003 (0.011)	Loss 4.1605 (4.1030)	Entropy 1.89107 (1.89803)	Top-1 acc 27.344 (28.946)	Top-5 acc 50.391 (52.254)	lr 0.02498
Train [2][2840/3239]	Time 0.525 (0.772)	Data Time 0.001 (0.011)	Loss 4.0441 (4.1028)	Entropy 1.89102 (1.89800)	Top-1 acc 30.078 (28.945)	Top-5 acc 55.078 (52.259)	lr 0.02498
Train [2][2850/3239]	Time 0.605 (0.772)	Data Time 0.003 (0.011)	Loss 4.0180 (4.1026)	Entropy 1.89095 (1.89798)	Top-1 acc 29.688 (28.948)	Top-5 acc 57.031 (52.265)	lr 0.02498
Train [2][2860/3239]	Time 0.562 (0.772)	Data Time 0.001 (0.011)	Loss 3.9602 (4.1024)	Entropy 1.89089 (1.89795)	Top-1 acc 33.203 (28.952)	Top-5 acc 56.250 (52.273)	lr 0.02498
Train [2][2870/3239]	Time 0.534 (0.772)	Data Time 0.003 (0.011)	Loss 4.3664 (4.1027)	Entropy 1.89080 (1.89793)	Top-1 acc 25.391 (28.947)	Top-5 acc 47.656 (52.269)	lr 0.02498
Train [2][2880/3239]	Time 0.501 (0.772)	Data Time 0.001 (0.011)	Loss 4.2071 (4.1026)	Entropy 1.89071 (1.89790)	Top-1 acc 27.734 (28.947)	Top-5 acc 50.391 (52.271)	lr 0.02498
Train [2][2890/3239]	Time 0.507 (0.772)	Data Time 0.001 (0.011)	Loss 4.0535 (4.1025)	Entropy 1.89064 (1.89788)	Top-1 acc 30.469 (28.950)	Top-5 acc 53.906 (52.272)	lr 0.02498
Train [2][2900/3239]	Time 0.380 (0.772)	Data Time 0.001 (0.011)	Loss 3.9176 (4.1023)	Entropy 1.89056 (1.89785)	Top-1 acc 31.641 (28.954)	Top-5 acc 55.078 (52.273)	lr 0.02498
Train [2][2910/3239]	Time 0.492 (0.772)	Data Time 0.001 (0.011)	Loss 4.1112 (4.1023)	Entropy 1.89047 (1.89783)	Top-1 acc 26.172 (28.952)	Top-5 acc 51.953 (52.271)	lr 0.02498
Train [2][2920/3239]	Time 0.404 (0.772)	Data Time 0.003 (0.011)	Loss 4.1489 (4.1021)	Entropy 1.89040 (1.89780)	Top-1 acc 25.781 (28.953)	Top-5 acc 51.562 (52.281)	lr 0.02498
Train [2][2930/3239]	Time 0.498 (0.772)	Data Time 0.001 (0.011)	Loss 4.0199 (4.1019)	Entropy 1.89029 (1.89778)	Top-1 acc 29.688 (28.956)	Top-5 acc 55.469 (52.285)	lr 0.02498
Train [2][2940/3239]	Time 0.520 (0.772)	Data Time 0.001 (0.011)	Loss 4.0671 (4.1020)	Entropy 1.89020 (1.89775)	Top-1 acc 28.906 (28.955)	Top-5 acc 51.953 (52.280)	lr 0.02498
Train [2][2950/3239]	Time 0.522 (0.771)	Data Time 0.001 (0.011)	Loss 4.3409 (4.1018)	Entropy 1.89013 (1.89773)	Top-1 acc 23.828 (28.959)	Top-5 acc 48.047 (52.286)	lr 0.02498
Train [2][2960/3239]	Time 0.485 (0.771)	Data Time 0.001 (0.011)	Loss 4.0665 (4.1017)	Entropy 1.89005 (1.89770)	Top-1 acc 27.734 (28.962)	Top-5 acc 53.125 (52.287)	lr 0.02498
Train [2][2970/3239]	Time 0.531 (0.771)	Data Time 0.001 (0.011)	Loss 3.9810 (4.1017)	Entropy 1.88999 (1.89767)	Top-1 acc 30.469 (28.961)	Top-5 acc 50.781 (52.287)	lr 0.02498
Train [2][2980/3239]	Time 0.524 (0.771)	Data Time 0.002 (0.011)	Loss 4.0666 (4.1016)	Entropy 1.88988 (1.89765)	Top-1 acc 28.906 (28.962)	Top-5 acc 53.906 (52.289)	lr 0.02498
Train [2][2990/3239]	Time 0.521 (0.771)	Data Time 0.001 (0.011)	Loss 4.0907 (4.1015)	Entropy 1.88981 (1.89762)	Top-1 acc 29.688 (28.968)	Top-5 acc 51.172 (52.288)	lr 0.02498
Train [2][3000/3239]	Time 0.584 (0.771)	Data Time 0.001 (0.011)	Loss 3.9201 (4.1013)	Entropy 1.88972 (1.89760)	Top-1 acc 30.469 (28.968)	Top-5 acc 55.469 (52.294)	lr 0.02498
Train [2][3010/3239]	Time 0.477 (0.771)	Data Time 0.001 (0.011)	Loss 4.1302 (4.1013)	Entropy 1.88959 (1.89757)	Top-1 acc 29.688 (28.969)	Top-5 acc 52.344 (52.295)	lr 0.02498
Train [2][3020/3239]	Time 0.485 (0.771)	Data Time 0.002 (0.011)	Loss 4.2966 (4.1010)	Entropy 1.88952 (1.89754)	Top-1 acc 26.953 (28.975)	Top-5 acc 49.609 (52.304)	lr 0.02498
Train [2][3030/3239]	Time 0.586 (0.771)	Data Time 0.001 (0.011)	Loss 3.9744 (4.1007)	Entropy 1.88942 (1.89752)	Top-1 acc 36.328 (28.982)	Top-5 acc 55.078 (52.309)	lr 0.02498
Train [2][3040/3239]	Time 0.515 (0.771)	Data Time 0.001 (0.011)	Loss 3.8892 (4.1006)	Entropy 1.88937 (1.89749)	Top-1 acc 33.203 (28.985)	Top-5 acc 54.688 (52.313)	lr 0.02498
Train [2][3050/3239]	Time 0.414 (0.771)	Data Time 0.001 (0.011)	Loss 3.9739 (4.1006)	Entropy 1.88930 (1.89746)	Top-1 acc 33.984 (28.985)	Top-5 acc 55.469 (52.313)	lr 0.02498
Train [2][3060/3239]	Time 0.489 (0.771)	Data Time 0.001 (0.011)	Loss 4.2871 (4.1005)	Entropy 1.88921 (1.89744)	Top-1 acc 25.391 (28.988)	Top-5 acc 47.656 (52.316)	lr 0.02498
Train [2][3070/3239]	Time 0.406 (0.771)	Data Time 0.002 (0.011)	Loss 4.1471 (4.1004)	Entropy 1.88914 (1.89741)	Top-1 acc 28.125 (28.991)	Top-5 acc 52.734 (52.319)	lr 0.02498
Train [2][3080/3239]	Time 0.514 (0.770)	Data Time 0.001 (0.011)	Loss 4.1905 (4.1001)	Entropy 1.88901 (1.89738)	Top-1 acc 24.219 (28.997)	Top-5 acc 52.344 (52.325)	lr 0.02498
Train [2][3090/3239]	Time 0.525 (0.770)	Data Time 0.001 (0.011)	Loss 4.1104 (4.1002)	Entropy 1.88894 (1.89736)	Top-1 acc 27.734 (28.993)	Top-5 acc 52.344 (52.323)	lr 0.02498
Train [2][3100/3239]	Time 0.386 (0.770)	Data Time 0.001 (0.011)	Loss 3.9774 (4.1000)	Entropy 1.88891 (1.89733)	Top-1 acc 32.031 (28.995)	Top-5 acc 54.297 (52.326)	lr 0.02498
Train [2][3110/3239]	Time 0.495 (0.770)	Data Time 0.018 (0.011)	Loss 4.0691 (4.0999)	Entropy 1.88880 (1.89730)	Top-1 acc 30.078 (28.997)	Top-5 acc 53.516 (52.330)	lr 0.02498
Train [2][3120/3239]	Time 0.565 (0.770)	Data Time 0.001 (0.011)	Loss 3.9007 (4.0998)	Entropy 1.88878 (1.89727)	Top-1 acc 33.984 (28.999)	Top-5 acc 59.375 (52.332)	lr 0.02498
Train [2][3130/3239]	Time 0.441 (0.770)	Data Time 0.001 (0.010)	Loss 4.2328 (4.0996)	Entropy 1.88874 (1.89725)	Top-1 acc 29.297 (29.002)	Top-5 acc 51.953 (52.334)	lr 0.02498
Train [2][3140/3239]	Time 0.537 (0.770)	Data Time 0.001 (0.010)	Loss 4.3495 (4.0998)	Entropy 1.88865 (1.89722)	Top-1 acc 25.781 (29.003)	Top-5 acc 47.266 (52.332)	lr 0.02498
Train [2][3150/3239]	Time 0.473 (0.770)	Data Time 0.001 (0.010)	Loss 4.0632 (4.0998)	Entropy 1.88857 (1.89719)	Top-1 acc 28.906 (29.006)	Top-5 acc 51.172 (52.333)	lr 0.02498
Train [2][3160/3239]	Time 0.591 (0.770)	Data Time 0.001 (0.010)	Loss 3.9215 (4.0997)	Entropy 1.88847 (1.89716)	Top-1 acc 31.641 (29.005)	Top-5 acc 57.812 (52.334)	lr 0.02498
Train [2][3170/3239]	Time 0.608 (0.770)	Data Time 0.001 (0.010)	Loss 4.0432 (4.0997)	Entropy 1.88839 (1.89714)	Top-1 acc 28.906 (29.009)	Top-5 acc 51.562 (52.330)	lr 0.02498
Train [2][3180/3239]	Time 0.476 (0.770)	Data Time 0.000 (0.010)	Loss 4.1670 (4.0997)	Entropy 1.88828 (1.89711)	Top-1 acc 27.344 (29.006)	Top-5 acc 50.391 (52.327)	lr 0.02498
Train [2][3190/3239]	Time 0.363 (0.770)	Data Time 0.000 (0.010)	Loss 4.2544 (4.0997)	Entropy 1.88820 (1.89708)	Top-1 acc 30.859 (29.007)	Top-5 acc 47.266 (52.326)	lr 0.02498
Train [2][3200/3239]	Time 0.344 (0.770)	Data Time 0.000 (0.010)	Loss 4.3531 (4.0996)	Entropy 1.88817 (1.89705)	Top-1 acc 23.828 (29.014)	Top-5 acc 46.875 (52.329)	lr 0.02498
Train [2][3210/3239]	Time 0.529 (0.770)	Data Time 0.000 (0.010)	Loss 3.9943 (4.0997)	Entropy 1.88811 (1.89703)	Top-1 acc 36.719 (29.014)	Top-5 acc 56.250 (52.328)	lr 0.02498
Train [2][3220/3239]	Time 0.351 (0.769)	Data Time 0.000 (0.010)	Loss 3.9340 (4.0996)	Entropy 1.88804 (1.89700)	Top-1 acc 34.766 (29.018)	Top-5 acc 54.688 (52.331)	lr 0.02498
Train [2][3230/3239]	Time 0.512 (0.769)	Data Time 0.000 (0.010)	Loss 4.0966 (4.0995)	Entropy 1.88800 (1.89697)	Top-1 acc 32.031 (29.020)	Top-5 acc 46.875 (52.331)	lr 0.02498
Train [2][3239/3239]	Time 1.482 (0.769)	Data Time 0.000 (0.010)	Loss 4.4928 (4.0994)	Entropy 1.88795 (1.89695)	Top-1 acc 22.222 (29.020)	Top-5 acc 44.444 (52.334)	lr 0.02498
==========Valid [2/120]	loss 3.009	top-1 acc 37.320 (37.320)	top-5 acc 62.223	Train top-1 29.020	top-5 52.334	Entropy 1.88795	Latency-None: 0.000ms	Flops: 508.30M
Train [3][0/3239]	Time 17.088 (17.088)	Data Time 15.486 (15.486)	Loss 4.2230 (4.2230)	Entropy 1.88792 (1.88792)	Top-1 acc 23.047 (23.047)	Top-5 acc 48.438 (48.438)	lr 0.02498
Train [3][10/3239]	Time 0.509 (2.276)	Data Time 0.001 (1.413)	Loss 4.0585 (4.0035)	Entropy 1.88785 (1.88790)	Top-1 acc 29.688 (30.966)	Top-5 acc 53.125 (54.652)	lr 0.02498
Train [3][20/3239]	Time 0.519 (1.559)	Data Time 0.001 (0.741)	Loss 4.2479 (4.0421)	Entropy 1.88776 (1.88787)	Top-1 acc 23.047 (29.985)	Top-5 acc 51.562 (53.850)	lr 0.02498
Train [3][30/3239]	Time 0.534 (1.304)	Data Time 0.001 (0.503)	Loss 4.3361 (4.0556)	Entropy 1.88771 (1.88783)	Top-1 acc 21.094 (29.448)	Top-5 acc 47.266 (53.125)	lr 0.02498
Train [3][40/3239]	Time 0.471 (1.547)	Data Time 0.029 (0.382)	Loss 3.9735 (4.0380)	Entropy 1.88763 (1.88779)	Top-1 acc 28.125 (29.592)	Top-5 acc 54.297 (53.554)	lr 0.02498
Train [3][50/3239]	Time 0.392 (1.399)	Data Time 0.002 (0.311)	Loss 4.2793 (4.0496)	Entropy 1.88760 (1.88776)	Top-1 acc 25.000 (29.511)	Top-5 acc 49.609 (53.301)	lr 0.02498
Train [3][60/3239]	Time 0.431 (1.295)	Data Time 0.001 (0.262)	Loss 4.1502 (4.0453)	Entropy 1.88753 (1.88773)	Top-1 acc 29.688 (29.764)	Top-5 acc 48.438 (53.298)	lr 0.02498
Train [3][70/3239]	Time 0.632 (1.218)	Data Time 0.001 (0.226)	Loss 4.0572 (4.0422)	Entropy 1.88747 (1.88770)	Top-1 acc 29.297 (29.710)	Top-5 acc 53.125 (53.472)	lr 0.02498
Train [3][80/3239]	Time 0.578 (1.159)	Data Time 0.001 (0.199)	Loss 4.0956 (4.0450)	Entropy 1.88740 (1.88767)	Top-1 acc 28.906 (29.827)	Top-5 acc 53.125 (53.496)	lr 0.02498
Train [3][90/3239]	Time 0.528 (1.114)	Data Time 0.002 (0.177)	Loss 4.0040 (4.0503)	Entropy 1.88737 (1.88764)	Top-1 acc 31.641 (29.782)	Top-5 acc 52.734 (53.365)	lr 0.02498
Train [3][100/3239]	Time 0.602 (1.078)	Data Time 0.001 (0.160)	Loss 3.8714 (4.0547)	Entropy 1.88731 (1.88761)	Top-1 acc 32.031 (29.792)	Top-5 acc 58.203 (53.202)	lr 0.02498
Train [3][110/3239]	Time 0.315 (1.048)	Data Time 0.001 (0.146)	Loss 4.2516 (4.0551)	Entropy 1.88722 (1.88758)	Top-1 acc 26.172 (29.793)	Top-5 acc 50.781 (53.220)	lr 0.02498
Train [3][120/3239]	Time 0.588 (1.027)	Data Time 0.002 (0.135)	Loss 4.1288 (4.0588)	Entropy 1.88716 (1.88755)	Top-1 acc 30.078 (29.765)	Top-5 acc 52.734 (53.128)	lr 0.02498
Train [3][130/3239]	Time 0.502 (1.008)	Data Time 0.001 (0.125)	Loss 4.0257 (4.0586)	Entropy 1.88709 (1.88752)	Top-1 acc 26.953 (29.685)	Top-5 acc 51.953 (53.140)	lr 0.02498
Train [3][140/3239]	Time 0.443 (0.989)	Data Time 0.001 (0.116)	Loss 3.9640 (4.0625)	Entropy 1.88700 (1.88749)	Top-1 acc 30.859 (29.701)	Top-5 acc 56.641 (53.078)	lr 0.02498
Train [3][150/3239]	Time 0.496 (0.975)	Data Time 0.001 (0.110)	Loss 3.9964 (4.0575)	Entropy 1.88687 (1.88745)	Top-1 acc 32.812 (29.809)	Top-5 acc 55.469 (53.221)	lr 0.02498
Train [3][160/3239]	Time 0.590 (0.962)	Data Time 0.001 (0.103)	Loss 4.0901 (4.0547)	Entropy 1.88678 (1.88741)	Top-1 acc 27.734 (29.804)	Top-5 acc 52.344 (53.278)	lr 0.02498
Train [3][170/3239]	Time 0.324 (0.946)	Data Time 0.001 (0.097)	Loss 4.0618 (4.0553)	Entropy 1.88669 (1.88738)	Top-1 acc 32.422 (29.868)	Top-5 acc 53.516 (53.257)	lr 0.02498
Train [3][180/3239]	Time 0.409 (0.936)	Data Time 0.001 (0.092)	Loss 4.2045 (4.0580)	Entropy 1.88668 (1.88734)	Top-1 acc 26.172 (29.826)	Top-5 acc 50.000 (53.162)	lr 0.02498
Train [3][190/3239]	Time 0.521 (0.926)	Data Time 0.001 (0.088)	Loss 4.1262 (4.0581)	Entropy 1.88664 (1.88730)	Top-1 acc 31.641 (29.812)	Top-5 acc 53.906 (53.186)	lr 0.02498
Train [3][200/3239]	Time 0.550 (0.915)	Data Time 0.001 (0.083)	Loss 3.9678 (4.0600)	Entropy 1.88659 (1.88727)	Top-1 acc 29.297 (29.839)	Top-5 acc 53.125 (53.144)	lr 0.02498
Train [3][210/3239]	Time 0.698 (0.908)	Data Time 0.001 (0.080)	Loss 4.0284 (4.0613)	Entropy 1.88647 (1.88724)	Top-1 acc 32.422 (29.854)	Top-5 acc 54.688 (53.131)	lr 0.02498
Train [3][220/3239]	Time 0.384 (0.900)	Data Time 0.001 (0.076)	Loss 4.0258 (4.0631)	Entropy 1.88641 (1.88720)	Top-1 acc 26.172 (29.776)	Top-5 acc 54.297 (53.129)	lr 0.02498
Train [3][230/3239]	Time 0.501 (0.893)	Data Time 0.003 (0.073)	Loss 4.0792 (4.0633)	Entropy 1.88640 (1.88716)	Top-1 acc 28.906 (29.738)	Top-5 acc 53.516 (53.179)	lr 0.02498
Train [3][240/3239]	Time 0.576 (0.888)	Data Time 0.001 (0.070)	Loss 3.9148 (4.0606)	Entropy 1.88636 (1.88713)	Top-1 acc 32.812 (29.770)	Top-5 acc 55.469 (53.213)	lr 0.02498
Train [3][250/3239]	Time 0.556 (0.883)	Data Time 0.001 (0.067)	Loss 4.0759 (4.0595)	Entropy 1.88635 (1.88710)	Top-1 acc 30.078 (29.765)	Top-5 acc 52.344 (53.220)	lr 0.02498
Train [3][260/3239]	Time 0.530 (0.878)	Data Time 0.001 (0.065)	Loss 4.1005 (4.0571)	Entropy 1.88634 (1.88707)	Top-1 acc 25.781 (29.777)	Top-5 acc 50.781 (53.255)	lr 0.02498
Train [3][270/3239]	Time 0.518 (0.874)	Data Time 0.001 (0.063)	Loss 4.1630 (4.0584)	Entropy 1.88622 (1.88704)	Top-1 acc 24.219 (29.765)	Top-5 acc 50.000 (53.255)	lr 0.02498
Train [3][280/3239]	Time 0.394 (0.870)	Data Time 0.001 (0.060)	Loss 4.2588 (4.0597)	Entropy 1.88608 (1.88701)	Top-1 acc 23.828 (29.761)	Top-5 acc 48.047 (53.183)	lr 0.02498
Train [3][290/3239]	Time 0.529 (0.866)	Data Time 0.001 (0.059)	Loss 4.1154 (4.0622)	Entropy 1.88602 (1.88698)	Top-1 acc 29.688 (29.717)	Top-5 acc 52.344 (53.121)	lr 0.02498
Train [3][300/3239]	Time 0.510 (0.863)	Data Time 0.002 (0.057)	Loss 3.9075 (4.0621)	Entropy 1.88596 (1.88695)	Top-1 acc 31.250 (29.698)	Top-5 acc 53.125 (53.131)	lr 0.02498
Train [3][310/3239]	Time 0.532 (0.860)	Data Time 0.001 (0.055)	Loss 3.8884 (4.0620)	Entropy 1.88584 (1.88692)	Top-1 acc 31.641 (29.721)	Top-5 acc 58.203 (53.151)	lr 0.02498
Train [3][320/3239]	Time 0.614 (0.858)	Data Time 0.001 (0.053)	Loss 4.1717 (4.0633)	Entropy 1.88577 (1.88688)	Top-1 acc 26.953 (29.708)	Top-5 acc 48.828 (53.093)	lr 0.02498
Train [3][330/3239]	Time 0.529 (0.855)	Data Time 0.001 (0.052)	Loss 4.0464 (4.0636)	Entropy 1.88576 (1.88685)	Top-1 acc 27.344 (29.683)	Top-5 acc 54.297 (53.091)	lr 0.02498
Train [3][340/3239]	Time 0.544 (0.851)	Data Time 0.001 (0.051)	Loss 4.1503 (4.0641)	Entropy 1.88572 (1.88682)	Top-1 acc 30.469 (29.701)	Top-5 acc 52.734 (53.080)	lr 0.02498
Train [3][350/3239]	Time 0.503 (0.847)	Data Time 0.002 (0.049)	Loss 3.9634 (4.0629)	Entropy 1.88559 (1.88678)	Top-1 acc 36.719 (29.760)	Top-5 acc 56.641 (53.136)	lr 0.02498
Train [3][360/3239]	Time 0.458 (0.844)	Data Time 0.001 (0.048)	Loss 4.0668 (4.0653)	Entropy 1.88550 (1.88675)	Top-1 acc 30.859 (29.707)	Top-5 acc 53.516 (53.073)	lr 0.02498
Train [3][370/3239]	Time 0.439 (0.840)	Data Time 0.001 (0.047)	Loss 4.0729 (4.0640)	Entropy 1.88540 (1.88671)	Top-1 acc 26.953 (29.706)	Top-5 acc 51.172 (53.080)	lr 0.02498
Train [3][380/3239]	Time 0.491 (0.839)	Data Time 0.001 (0.046)	Loss 4.2919 (4.0646)	Entropy 1.88531 (1.88668)	Top-1 acc 28.125 (29.715)	Top-5 acc 50.391 (53.079)	lr 0.02498
Train [3][390/3239]	Time 0.370 (0.836)	Data Time 0.001 (0.045)	Loss 4.0310 (4.0636)	Entropy 1.88522 (1.88664)	Top-1 acc 34.766 (29.724)	Top-5 acc 55.078 (53.105)	lr 0.02498
Train [3][400/3239]	Time 0.491 (0.834)	Data Time 0.001 (0.044)	Loss 4.1369 (4.0640)	Entropy 1.88515 (1.88661)	Top-1 acc 26.562 (29.725)	Top-5 acc 50.391 (53.096)	lr 0.02498
Train [3][410/3239]	Time 0.560 (0.832)	Data Time 0.001 (0.043)	Loss 4.0918 (4.0642)	Entropy 1.88501 (1.88657)	Top-1 acc 27.734 (29.703)	Top-5 acc 53.906 (53.074)	lr 0.02498
Train [3][420/3239]	Time 0.557 (0.830)	Data Time 0.001 (0.042)	Loss 4.0316 (4.0634)	Entropy 1.88486 (1.88653)	Top-1 acc 29.297 (29.681)	Top-5 acc 54.297 (53.065)	lr 0.02498
Train [3][430/3239]	Time 0.511 (0.828)	Data Time 0.001 (0.041)	Loss 4.1285 (4.0644)	Entropy 1.88476 (1.88649)	Top-1 acc 31.250 (29.684)	Top-5 acc 53.906 (53.059)	lr 0.02498
Train [3][440/3239]	Time 0.449 (0.827)	Data Time 0.001 (0.040)	Loss 3.9510 (4.0626)	Entropy 1.88469 (1.88645)	Top-1 acc 30.469 (29.716)	Top-5 acc 54.688 (53.085)	lr 0.02498
Train [3][450/3239]	Time 0.432 (0.826)	Data Time 0.001 (0.039)	Loss 4.0771 (4.0635)	Entropy 1.88465 (1.88641)	Top-1 acc 30.078 (29.694)	Top-5 acc 53.516 (53.072)	lr 0.02498
Train [3][460/3239]	Time 0.484 (0.824)	Data Time 0.002 (0.039)	Loss 4.0530 (4.0647)	Entropy 1.88454 (1.88637)	Top-1 acc 27.344 (29.671)	Top-5 acc 53.125 (53.045)	lr 0.02498
Train [3][470/3239]	Time 0.579 (0.823)	Data Time 0.001 (0.038)	Loss 3.9466 (4.0644)	Entropy 1.88444 (1.88633)	Top-1 acc 31.641 (29.706)	Top-5 acc 55.078 (53.054)	lr 0.02498
Train [3][480/3239]	Time 0.370 (0.821)	Data Time 0.001 (0.037)	Loss 4.0674 (4.0638)	Entropy 1.88436 (1.88629)	Top-1 acc 28.906 (29.721)	Top-5 acc 53.125 (53.082)	lr 0.02498
Train [3][490/3239]	Time 0.518 (0.820)	Data Time 0.001 (0.037)	Loss 4.0279 (4.0634)	Entropy 1.88423 (1.88625)	Top-1 acc 31.641 (29.725)	Top-5 acc 55.469 (53.061)	lr 0.02498
Train [3][500/3239]	Time 0.517 (0.819)	Data Time 0.003 (0.036)	Loss 3.9910 (4.0625)	Entropy 1.88412 (1.88621)	Top-1 acc 34.766 (29.741)	Top-5 acc 55.078 (53.075)	lr 0.02498
Train [3][510/3239]	Time 0.573 (0.817)	Data Time 0.001 (0.035)	Loss 4.1587 (4.0622)	Entropy 1.88408 (1.88617)	Top-1 acc 26.562 (29.754)	Top-5 acc 51.172 (53.082)	lr 0.02498
Train [3][520/3239]	Time 0.553 (0.816)	Data Time 0.001 (0.035)	Loss 4.0322 (4.0622)	Entropy 1.88403 (1.88613)	Top-1 acc 26.562 (29.750)	Top-5 acc 54.688 (53.093)	lr 0.02498
Train [3][530/3239]	Time 0.466 (0.814)	Data Time 0.001 (0.034)	Loss 4.0462 (4.0630)	Entropy 1.88398 (1.88609)	Top-1 acc 28.125 (29.752)	Top-5 acc 51.562 (53.070)	lr 0.02498
Train [3][540/3239]	Time 0.394 (0.812)	Data Time 0.001 (0.034)	Loss 4.0666 (4.0634)	Entropy 1.88394 (1.88605)	Top-1 acc 33.594 (29.747)	Top-5 acc 53.906 (53.058)	lr 0.02498
Train [3][550/3239]	Time 0.540 (0.811)	Data Time 0.001 (0.033)	Loss 4.0576 (4.0643)	Entropy 1.88387 (1.88601)	Top-1 acc 33.203 (29.744)	Top-5 acc 54.297 (53.050)	lr 0.02498
Train [3][560/3239]	Time 0.467 (0.811)	Data Time 0.001 (0.033)	Loss 4.1031 (4.0639)	Entropy 1.88383 (1.88597)	Top-1 acc 30.859 (29.753)	Top-5 acc 54.688 (53.057)	lr 0.02498
Train [3][570/3239]	Time 0.521 (0.810)	Data Time 0.002 (0.032)	Loss 4.0733 (4.0639)	Entropy 1.88380 (1.88594)	Top-1 acc 31.250 (29.759)	Top-5 acc 52.734 (53.056)	lr 0.02498
Train [3][580/3239]	Time 0.490 (0.809)	Data Time 0.001 (0.032)	Loss 3.8729 (4.0627)	Entropy 1.88371 (1.88590)	Top-1 acc 28.906 (29.783)	Top-5 acc 55.469 (53.075)	lr 0.02498
Train [3][590/3239]	Time 0.345 (0.808)	Data Time 0.001 (0.031)	Loss 4.1424 (4.0632)	Entropy 1.88369 (1.88586)	Top-1 acc 26.953 (29.787)	Top-5 acc 52.344 (53.073)	lr 0.02498
Train [3][600/3239]	Time 0.410 (0.807)	Data Time 0.002 (0.031)	Loss 4.0475 (4.0627)	Entropy 1.88356 (1.88583)	Top-1 acc 28.125 (29.814)	Top-5 acc 52.734 (53.090)	lr 0.02498
Train [3][610/3239]	Time 0.534 (0.806)	Data Time 0.001 (0.031)	Loss 3.9675 (4.0626)	Entropy 1.88346 (1.88579)	Top-1 acc 33.203 (29.826)	Top-5 acc 58.594 (53.096)	lr 0.02498
Train [3][620/3239]	Time 0.529 (0.805)	Data Time 0.001 (0.030)	Loss 3.8959 (4.0621)	Entropy 1.88333 (1.88575)	Top-1 acc 36.328 (29.839)	Top-5 acc 58.984 (53.108)	lr 0.02498
Train [3][630/3239]	Time 0.396 (0.805)	Data Time 0.001 (0.030)	Loss 4.0599 (4.0618)	Entropy 1.88325 (1.88571)	Top-1 acc 26.953 (29.848)	Top-5 acc 54.297 (53.110)	lr 0.02498
Train [3][640/3239]	Time 0.559 (0.804)	Data Time 0.001 (0.029)	Loss 3.8669 (4.0610)	Entropy 1.88316 (1.88567)	Top-1 acc 38.281 (29.890)	Top-5 acc 57.422 (53.121)	lr 0.02498
Train [3][650/3239]	Time 0.472 (0.803)	Data Time 0.001 (0.029)	Loss 4.0757 (4.0609)	Entropy 1.88311 (1.88563)	Top-1 acc 30.469 (29.872)	Top-5 acc 54.688 (53.135)	lr 0.02498
Train [3][660/3239]	Time 0.472 (0.802)	Data Time 0.001 (0.029)	Loss 4.1111 (4.0616)	Entropy 1.88306 (1.88560)	Top-1 acc 23.828 (29.849)	Top-5 acc 51.562 (53.126)	lr 0.02498
Train [3][670/3239]	Time 0.414 (0.801)	Data Time 0.001 (0.028)	Loss 4.0658 (4.0608)	Entropy 1.88296 (1.88556)	Top-1 acc 34.375 (29.862)	Top-5 acc 53.125 (53.148)	lr 0.02498
Train [3][680/3239]	Time 0.500 (0.800)	Data Time 0.001 (0.028)	Loss 4.0234 (4.0601)	Entropy 1.88294 (1.88552)	Top-1 acc 31.641 (29.867)	Top-5 acc 54.688 (53.163)	lr 0.02498
Train [3][690/3239]	Time 0.401 (0.800)	Data Time 0.001 (0.028)	Loss 4.0225 (4.0599)	Entropy 1.88290 (1.88548)	Top-1 acc 28.906 (29.875)	Top-5 acc 53.516 (53.169)	lr 0.02498
Train [3][700/3239]	Time 0.526 (0.824)	Data Time 0.002 (0.027)	Loss 4.0032 (4.0598)	Entropy 1.88286 (1.88544)	Top-1 acc 33.203 (29.879)	Top-5 acc 55.859 (53.170)	lr 0.02498
Train [3][710/3239]	Time 0.516 (0.823)	Data Time 0.001 (0.027)	Loss 4.0654 (4.0591)	Entropy 1.88281 (1.88541)	Top-1 acc 30.859 (29.897)	Top-5 acc 50.391 (53.190)	lr 0.02498
Train [3][720/3239]	Time 0.542 (0.823)	Data Time 0.001 (0.027)	Loss 3.8333 (4.0591)	Entropy 1.88268 (1.88537)	Top-1 acc 38.281 (29.909)	Top-5 acc 59.766 (53.200)	lr 0.02498
Train [3][730/3239]	Time 0.384 (0.822)	Data Time 0.001 (0.026)	Loss 4.2659 (4.0601)	Entropy 1.88264 (1.88533)	Top-1 acc 25.391 (29.889)	Top-5 acc 48.047 (53.170)	lr 0.02498
Train [3][740/3239]	Time 0.662 (0.821)	Data Time 0.001 (0.026)	Loss 4.0707 (4.0594)	Entropy 1.88249 (1.88530)	Top-1 acc 32.422 (29.908)	Top-5 acc 51.562 (53.186)	lr 0.02498
Train [3][750/3239]	Time 0.553 (0.820)	Data Time 0.001 (0.026)	Loss 4.0763 (4.0595)	Entropy 1.88236 (1.88526)	Top-1 acc 31.641 (29.907)	Top-5 acc 52.734 (53.174)	lr 0.02498
Train [3][760/3239]	Time 0.525 (0.819)	Data Time 0.001 (0.026)	Loss 3.8899 (4.0593)	Entropy 1.88223 (1.88522)	Top-1 acc 33.984 (29.907)	Top-5 acc 57.422 (53.170)	lr 0.02498
Train [3][770/3239]	Time 0.484 (0.819)	Data Time 0.001 (0.025)	Loss 4.0260 (4.0587)	Entropy 1.88214 (1.88518)	Top-1 acc 33.984 (29.933)	Top-5 acc 56.641 (53.197)	lr 0.02498
Train [3][780/3239]	Time 0.523 (0.818)	Data Time 0.001 (0.025)	Loss 4.1602 (4.0584)	Entropy 1.88207 (1.88514)	Top-1 acc 26.562 (29.938)	Top-5 acc 51.172 (53.205)	lr 0.02498
Train [3][790/3239]	Time 0.471 (0.817)	Data Time 0.001 (0.025)	Loss 4.1134 (4.0576)	Entropy 1.88199 (1.88510)	Top-1 acc 29.688 (29.934)	Top-5 acc 51.172 (53.219)	lr 0.02498
Train [3][800/3239]	Time 0.532 (0.816)	Data Time 0.001 (0.024)	Loss 3.9088 (4.0578)	Entropy 1.88192 (1.88506)	Top-1 acc 35.938 (29.928)	Top-5 acc 56.641 (53.212)	lr 0.02498
Train [3][810/3239]	Time 0.522 (0.815)	Data Time 0.001 (0.024)	Loss 4.1480 (4.0581)	Entropy 1.88180 (1.88502)	Top-1 acc 23.047 (29.922)	Top-5 acc 50.781 (53.213)	lr 0.02498
Train [3][820/3239]	Time 0.428 (0.814)	Data Time 0.001 (0.024)	Loss 4.1337 (4.0588)	Entropy 1.88165 (1.88498)	Top-1 acc 30.469 (29.911)	Top-5 acc 50.000 (53.198)	lr 0.02498
Train [3][830/3239]	Time 0.382 (0.813)	Data Time 0.001 (0.024)	Loss 4.0926 (4.0593)	Entropy 1.88155 (1.88494)	Top-1 acc 30.469 (29.909)	Top-5 acc 55.078 (53.204)	lr 0.02498
Train [3][840/3239]	Time 0.481 (0.811)	Data Time 0.001 (0.024)	Loss 3.9281 (4.0589)	Entropy 1.88147 (1.88490)	Top-1 acc 33.984 (29.909)	Top-5 acc 57.031 (53.213)	lr 0.02498
Train [3][850/3239]	Time 0.409 (0.811)	Data Time 0.001 (0.023)	Loss 3.9294 (4.0585)	Entropy 1.88139 (1.88486)	Top-1 acc 31.641 (29.905)	Top-5 acc 55.078 (53.215)	lr 0.02498
Train [3][860/3239]	Time 0.530 (0.810)	Data Time 0.001 (0.023)	Loss 4.0655 (4.0582)	Entropy 1.88128 (1.88482)	Top-1 acc 26.562 (29.901)	Top-5 acc 53.516 (53.225)	lr 0.02498
Train [3][870/3239]	Time 0.537 (0.810)	Data Time 0.001 (0.023)	Loss 4.0137 (4.0584)	Entropy 1.88126 (1.88478)	Top-1 acc 32.031 (29.893)	Top-5 acc 57.422 (53.232)	lr 0.02498
Train [3][880/3239]	Time 0.531 (0.809)	Data Time 0.001 (0.023)	Loss 4.3550 (4.0591)	Entropy 1.88116 (1.88474)	Top-1 acc 23.828 (29.879)	Top-5 acc 46.484 (53.224)	lr 0.02498
Train [3][890/3239]	Time 0.307 (0.809)	Data Time 0.001 (0.022)	Loss 4.0531 (4.0593)	Entropy 1.88101 (1.88470)	Top-1 acc 31.641 (29.875)	Top-5 acc 47.656 (53.208)	lr 0.02498
Train [3][900/3239]	Time 0.488 (0.808)	Data Time 0.001 (0.022)	Loss 3.9207 (4.0593)	Entropy 1.88092 (1.88466)	Top-1 acc 33.203 (29.880)	Top-5 acc 56.641 (53.215)	lr 0.02498
Train [3][910/3239]	Time 0.477 (0.807)	Data Time 0.001 (0.022)	Loss 4.2750 (4.0595)	Entropy 1.88078 (1.88462)	Top-1 acc 25.781 (29.883)	Top-5 acc 46.875 (53.216)	lr 0.02498
Train [3][920/3239]	Time 0.599 (0.807)	Data Time 0.001 (0.022)	Loss 3.9601 (4.0599)	Entropy 1.88071 (1.88457)	Top-1 acc 32.422 (29.889)	Top-5 acc 55.078 (53.217)	lr 0.02498
Train [3][930/3239]	Time 0.519 (0.806)	Data Time 0.001 (0.022)	Loss 4.2101 (4.0590)	Entropy 1.88062 (1.88453)	Top-1 acc 26.953 (29.902)	Top-5 acc 51.172 (53.248)	lr 0.02498
Train [3][940/3239]	Time 0.495 (0.806)	Data Time 0.002 (0.022)	Loss 4.0438 (4.0586)	Entropy 1.88046 (1.88449)	Top-1 acc 30.078 (29.915)	Top-5 acc 52.734 (53.263)	lr 0.02498
Train [3][950/3239]	Time 0.495 (0.805)	Data Time 0.001 (0.021)	Loss 4.0660 (4.0586)	Entropy 1.88034 (1.88445)	Top-1 acc 26.953 (29.918)	Top-5 acc 53.516 (53.258)	lr 0.02498
Train [3][960/3239]	Time 0.481 (0.805)	Data Time 0.001 (0.021)	Loss 4.0302 (4.0584)	Entropy 1.88029 (1.88440)	Top-1 acc 29.688 (29.914)	Top-5 acc 52.734 (53.258)	lr 0.02498
Train [3][970/3239]	Time 0.428 (0.804)	Data Time 0.002 (0.021)	Loss 3.9413 (4.0584)	Entropy 1.88017 (1.88436)	Top-1 acc 27.344 (29.906)	Top-5 acc 55.078 (53.251)	lr 0.02498
Train [3][980/3239]	Time 0.558 (0.804)	Data Time 0.001 (0.021)	Loss 3.9537 (4.0586)	Entropy 1.88005 (1.88432)	Top-1 acc 33.984 (29.908)	Top-5 acc 55.469 (53.238)	lr 0.02498
Train [3][990/3239]	Time 0.464 (0.803)	Data Time 0.001 (0.021)	Loss 3.9407 (4.0589)	Entropy 1.87991 (1.88428)	Top-1 acc 29.688 (29.895)	Top-5 acc 56.250 (53.233)	lr 0.02498
Train [3][1000/3239]	Time 0.354 (0.802)	Data Time 0.001 (0.021)	Loss 4.2404 (4.0590)	Entropy 1.87986 (1.88423)	Top-1 acc 25.781 (29.889)	Top-5 acc 50.000 (53.234)	lr 0.02498
Train [3][1010/3239]	Time 0.478 (0.801)	Data Time 0.001 (0.021)	Loss 4.1727 (4.0594)	Entropy 1.87979 (1.88419)	Top-1 acc 27.344 (29.892)	Top-5 acc 51.562 (53.225)	lr 0.02498
Train [3][1020/3239]	Time 0.518 (0.801)	Data Time 0.001 (0.020)	Loss 4.2693 (4.0593)	Entropy 1.87970 (1.88414)	Top-1 acc 26.172 (29.896)	Top-5 acc 48.047 (53.221)	lr 0.02498
Train [3][1030/3239]	Time 0.546 (0.801)	Data Time 0.001 (0.020)	Loss 3.9717 (4.0598)	Entropy 1.87961 (1.88410)	Top-1 acc 30.469 (29.890)	Top-5 acc 55.078 (53.205)	lr 0.02498
Train [3][1040/3239]	Time 0.539 (0.800)	Data Time 0.001 (0.020)	Loss 3.8960 (4.0598)	Entropy 1.87950 (1.88406)	Top-1 acc 30.859 (29.886)	Top-5 acc 53.516 (53.206)	lr 0.02498
Train [3][1050/3239]	Time 0.559 (0.800)	Data Time 0.001 (0.020)	Loss 3.8647 (4.0595)	Entropy 1.87938 (1.88401)	Top-1 acc 35.156 (29.893)	Top-5 acc 57.422 (53.206)	lr 0.02498
Train [3][1060/3239]	Time 0.437 (0.799)	Data Time 0.001 (0.020)	Loss 4.1862 (4.0599)	Entropy 1.87931 (1.88397)	Top-1 acc 25.000 (29.893)	Top-5 acc 48.047 (53.192)	lr 0.02498
Train [3][1070/3239]	Time 0.535 (0.799)	Data Time 0.001 (0.020)	Loss 3.9922 (4.0596)	Entropy 1.87913 (1.88393)	Top-1 acc 29.297 (29.892)	Top-5 acc 57.422 (53.199)	lr 0.02498
Train [3][1080/3239]	Time 0.512 (0.799)	Data Time 0.001 (0.020)	Loss 3.9605 (4.0599)	Entropy 1.87900 (1.88388)	Top-1 acc 32.812 (29.897)	Top-5 acc 54.297 (53.197)	lr 0.02498
Train [3][1090/3239]	Time 0.522 (0.798)	Data Time 0.001 (0.019)	Loss 4.0419 (4.0602)	Entropy 1.87890 (1.88384)	Top-1 acc 30.078 (29.892)	Top-5 acc 52.344 (53.185)	lr 0.02498
Train [3][1100/3239]	Time 0.532 (0.798)	Data Time 0.001 (0.019)	Loss 4.0239 (4.0600)	Entropy 1.87882 (1.88379)	Top-1 acc 29.297 (29.888)	Top-5 acc 57.422 (53.192)	lr 0.02498
Train [3][1110/3239]	Time 0.569 (0.798)	Data Time 0.001 (0.019)	Loss 3.8143 (4.0595)	Entropy 1.87875 (1.88375)	Top-1 acc 38.672 (29.901)	Top-5 acc 60.547 (53.217)	lr 0.02498
Train [3][1120/3239]	Time 0.644 (0.797)	Data Time 0.001 (0.019)	Loss 3.9206 (4.0594)	Entropy 1.87868 (1.88370)	Top-1 acc 32.422 (29.905)	Top-5 acc 55.078 (53.221)	lr 0.02498
Train [3][1130/3239]	Time 0.569 (0.797)	Data Time 0.001 (0.019)	Loss 4.1380 (4.0593)	Entropy 1.87861 (1.88366)	Top-1 acc 29.688 (29.905)	Top-5 acc 53.125 (53.219)	lr 0.02498
Train [3][1140/3239]	Time 0.499 (0.796)	Data Time 0.001 (0.019)	Loss 4.0001 (4.0591)	Entropy 1.87847 (1.88361)	Top-1 acc 31.250 (29.905)	Top-5 acc 55.078 (53.224)	lr 0.02498
Train [3][1150/3239]	Time 0.469 (0.796)	Data Time 0.001 (0.018)	Loss 3.9025 (4.0591)	Entropy 1.87839 (1.88357)	Top-1 acc 33.984 (29.902)	Top-5 acc 57.422 (53.226)	lr 0.02498
Train [3][1160/3239]	Time 0.335 (0.796)	Data Time 0.002 (0.018)	Loss 4.0054 (4.0590)	Entropy 1.87832 (1.88352)	Top-1 acc 30.078 (29.899)	Top-5 acc 54.297 (53.242)	lr 0.02498
Train [3][1170/3239]	Time 0.535 (0.795)	Data Time 0.001 (0.018)	Loss 4.0545 (4.0592)	Entropy 1.87825 (1.88348)	Top-1 acc 26.953 (29.894)	Top-5 acc 51.562 (53.231)	lr 0.02498
Train [3][1180/3239]	Time 0.608 (0.795)	Data Time 0.001 (0.018)	Loss 4.0302 (4.0591)	Entropy 1.87811 (1.88343)	Top-1 acc 30.859 (29.899)	Top-5 acc 52.734 (53.231)	lr 0.02498
Train [3][1190/3239]	Time 0.507 (0.794)	Data Time 0.001 (0.018)	Loss 4.0964 (4.0589)	Entropy 1.87807 (1.88339)	Top-1 acc 28.906 (29.904)	Top-5 acc 50.391 (53.230)	lr 0.02498
Train [3][1200/3239]	Time 0.419 (0.793)	Data Time 0.001 (0.018)	Loss 4.1193 (4.0591)	Entropy 1.87793 (1.88334)	Top-1 acc 28.906 (29.904)	Top-5 acc 52.344 (53.225)	lr 0.02498
Train [3][1210/3239]	Time 0.420 (0.793)	Data Time 0.001 (0.018)	Loss 4.1960 (4.0594)	Entropy 1.87781 (1.88330)	Top-1 acc 25.781 (29.896)	Top-5 acc 50.391 (53.218)	lr 0.02498
Train [3][1220/3239]	Time 0.477 (0.793)	Data Time 0.001 (0.018)	Loss 4.3321 (4.0596)	Entropy 1.87767 (1.88325)	Top-1 acc 25.781 (29.895)	Top-5 acc 48.438 (53.211)	lr 0.02498
Train [3][1230/3239]	Time 0.584 (0.793)	Data Time 0.001 (0.018)	Loss 4.0108 (4.0596)	Entropy 1.87755 (1.88321)	Top-1 acc 29.688 (29.904)	Top-5 acc 53.516 (53.211)	lr 0.02498
Train [3][1240/3239]	Time 0.569 (0.793)	Data Time 0.001 (0.018)	Loss 3.9756 (4.0595)	Entropy 1.87745 (1.88316)	Top-1 acc 30.859 (29.907)	Top-5 acc 53.125 (53.215)	lr 0.02498
Train [3][1250/3239]	Time 0.555 (0.792)	Data Time 0.001 (0.017)	Loss 4.0495 (4.0594)	Entropy 1.87738 (1.88312)	Top-1 acc 30.078 (29.907)	Top-5 acc 56.250 (53.216)	lr 0.02498
Train [3][1260/3239]	Time 0.549 (0.792)	Data Time 0.003 (0.017)	Loss 4.0855 (4.0594)	Entropy 1.87719 (1.88307)	Top-1 acc 28.516 (29.902)	Top-5 acc 52.734 (53.219)	lr 0.02498
Train [3][1270/3239]	Time 0.509 (0.792)	Data Time 0.001 (0.017)	Loss 4.1921 (4.0597)	Entropy 1.87713 (1.88302)	Top-1 acc 30.469 (29.902)	Top-5 acc 48.828 (53.217)	lr 0.02498
Train [3][1280/3239]	Time 0.513 (0.792)	Data Time 0.001 (0.017)	Loss 4.1319 (4.0596)	Entropy 1.87704 (1.88298)	Top-1 acc 28.125 (29.900)	Top-5 acc 51.953 (53.222)	lr 0.02498
Train [3][1290/3239]	Time 0.621 (0.792)	Data Time 0.001 (0.017)	Loss 4.1374 (4.0594)	Entropy 1.87697 (1.88293)	Top-1 acc 25.000 (29.904)	Top-5 acc 55.078 (53.236)	lr 0.02498
Train [3][1300/3239]	Time 0.510 (0.791)	Data Time 0.001 (0.017)	Loss 4.2245 (4.0598)	Entropy 1.87690 (1.88288)	Top-1 acc 27.344 (29.894)	Top-5 acc 52.734 (53.228)	lr 0.02498
Train [3][1310/3239]	Time 0.567 (0.791)	Data Time 0.001 (0.017)	Loss 3.9801 (4.0597)	Entropy 1.87682 (1.88284)	Top-1 acc 35.547 (29.894)	Top-5 acc 56.641 (53.232)	lr 0.02498
Train [3][1320/3239]	Time 0.409 (0.791)	Data Time 0.001 (0.017)	Loss 4.0196 (4.0596)	Entropy 1.87682 (1.88279)	Top-1 acc 30.469 (29.899)	Top-5 acc 51.953 (53.235)	lr 0.02498
Train [3][1330/3239]	Time 0.510 (0.790)	Data Time 0.001 (0.017)	Loss 4.2994 (4.0600)	Entropy 1.87666 (1.88275)	Top-1 acc 25.000 (29.884)	Top-5 acc 50.781 (53.225)	lr 0.02498
Train [3][1340/3239]	Time 0.688 (0.790)	Data Time 0.002 (0.016)	Loss 4.1204 (4.0602)	Entropy 1.87650 (1.88270)	Top-1 acc 29.297 (29.877)	Top-5 acc 50.391 (53.219)	lr 0.02498
Train [3][1350/3239]	Time 0.659 (0.802)	Data Time 0.005 (0.016)	Loss 4.1855 (4.0603)	Entropy 1.87638 (1.88266)	Top-1 acc 24.219 (29.877)	Top-5 acc 55.078 (53.221)	lr 0.02497
Train [3][1360/3239]	Time 0.563 (0.802)	Data Time 0.002 (0.016)	Loss 3.9547 (4.0606)	Entropy 1.87625 (1.88261)	Top-1 acc 28.516 (29.865)	Top-5 acc 53.516 (53.218)	lr 0.02497
Train [3][1370/3239]	Time 0.517 (0.802)	Data Time 0.001 (0.016)	Loss 3.9501 (4.0605)	Entropy 1.87613 (1.88256)	Top-1 acc 32.031 (29.864)	Top-5 acc 52.344 (53.216)	lr 0.02497
Train [3][1380/3239]	Time 0.552 (0.802)	Data Time 0.001 (0.016)	Loss 4.2083 (4.0607)	Entropy 1.87611 (1.88252)	Top-1 acc 27.734 (29.869)	Top-5 acc 50.391 (53.214)	lr 0.02497
Train [3][1390/3239]	Time 0.545 (0.802)	Data Time 0.001 (0.016)	Loss 4.0259 (4.0608)	Entropy 1.87595 (1.88247)	Top-1 acc 28.125 (29.867)	Top-5 acc 51.562 (53.216)	lr 0.02497
Train [3][1400/3239]	Time 0.558 (0.802)	Data Time 0.001 (0.016)	Loss 3.8763 (4.0609)	Entropy 1.87579 (1.88242)	Top-1 acc 35.156 (29.862)	Top-5 acc 57.031 (53.213)	lr 0.02497
Train [3][1410/3239]	Time 0.388 (0.801)	Data Time 0.001 (0.016)	Loss 3.9456 (4.0606)	Entropy 1.87575 (1.88238)	Top-1 acc 30.469 (29.866)	Top-5 acc 53.516 (53.215)	lr 0.02497
Train [3][1420/3239]	Time 0.459 (0.801)	Data Time 0.002 (0.016)	Loss 4.2234 (4.0610)	Entropy 1.87567 (1.88233)	Top-1 acc 26.562 (29.857)	Top-5 acc 50.000 (53.199)	lr 0.02497
Train [3][1430/3239]	Time 0.501 (0.801)	Data Time 0.001 (0.016)	Loss 3.9343 (4.0611)	Entropy 1.87569 (1.88228)	Top-1 acc 32.031 (29.849)	Top-5 acc 57.812 (53.196)	lr 0.02497
Train [3][1440/3239]	Time 0.524 (0.801)	Data Time 0.001 (0.016)	Loss 3.8136 (4.0610)	Entropy 1.87563 (1.88224)	Top-1 acc 32.422 (29.848)	Top-5 acc 59.375 (53.201)	lr 0.02497
Train [3][1450/3239]	Time 0.503 (0.801)	Data Time 0.001 (0.016)	Loss 4.0879 (4.0607)	Entropy 1.87556 (1.88219)	Top-1 acc 28.516 (29.852)	Top-5 acc 55.469 (53.207)	lr 0.02497
Train [3][1460/3239]	Time 0.371 (0.800)	Data Time 0.001 (0.015)	Loss 4.0526 (4.0607)	Entropy 1.87550 (1.88215)	Top-1 acc 30.859 (29.857)	Top-5 acc 54.688 (53.208)	lr 0.02497
Train [3][1470/3239]	Time 0.505 (0.800)	Data Time 0.002 (0.015)	Loss 4.2641 (4.0609)	Entropy 1.87546 (1.88210)	Top-1 acc 27.344 (29.856)	Top-5 acc 46.484 (53.200)	lr 0.02497
Train [3][1480/3239]	Time 0.496 (0.799)	Data Time 0.001 (0.015)	Loss 4.1912 (4.0606)	Entropy 1.87539 (1.88206)	Top-1 acc 23.438 (29.856)	Top-5 acc 45.312 (53.206)	lr 0.02497
Train [3][1490/3239]	Time 0.515 (0.799)	Data Time 0.001 (0.015)	Loss 4.0808 (4.0607)	Entropy 1.87529 (1.88201)	Top-1 acc 27.344 (29.852)	Top-5 acc 55.469 (53.210)	lr 0.02497
Train [3][1500/3239]	Time 0.541 (0.799)	Data Time 0.001 (0.015)	Loss 3.9277 (4.0606)	Entropy 1.87520 (1.88197)	Top-1 acc 28.516 (29.854)	Top-5 acc 56.641 (53.209)	lr 0.02497
Train [3][1510/3239]	Time 0.538 (0.799)	Data Time 0.001 (0.015)	Loss 4.0055 (4.0605)	Entropy 1.87509 (1.88192)	Top-1 acc 29.297 (29.856)	Top-5 acc 53.906 (53.211)	lr 0.02497
Train [3][1520/3239]	Time 0.482 (0.799)	Data Time 0.001 (0.015)	Loss 4.0154 (4.0607)	Entropy 1.87502 (1.88188)	Top-1 acc 32.031 (29.853)	Top-5 acc 53.906 (53.214)	lr 0.02497
Train [3][1530/3239]	Time 0.444 (0.798)	Data Time 0.001 (0.015)	Loss 4.1631 (4.0609)	Entropy 1.87482 (1.88183)	Top-1 acc 28.516 (29.854)	Top-5 acc 55.469 (53.204)	lr 0.02497
Train [3][1540/3239]	Time 0.516 (0.798)	Data Time 0.001 (0.015)	Loss 4.1468 (4.0608)	Entropy 1.87468 (1.88178)	Top-1 acc 27.344 (29.859)	Top-5 acc 49.609 (53.204)	lr 0.02497
Train [3][1550/3239]	Time 0.525 (0.798)	Data Time 0.001 (0.015)	Loss 4.0029 (4.0605)	Entropy 1.87458 (1.88174)	Top-1 acc 31.250 (29.863)	Top-5 acc 53.516 (53.211)	lr 0.02497
Train [3][1560/3239]	Time 0.509 (0.797)	Data Time 0.001 (0.015)	Loss 4.0842 (4.0600)	Entropy 1.87442 (1.88169)	Top-1 acc 29.297 (29.867)	Top-5 acc 54.688 (53.223)	lr 0.02497
Train [3][1570/3239]	Time 0.549 (0.797)	Data Time 0.001 (0.015)	Loss 4.0046 (4.0599)	Entropy 1.87435 (1.88165)	Top-1 acc 33.203 (29.876)	Top-5 acc 53.906 (53.229)	lr 0.02497
Train [3][1580/3239]	Time 0.567 (0.797)	Data Time 0.001 (0.015)	Loss 4.0058 (4.0601)	Entropy 1.87422 (1.88160)	Top-1 acc 35.547 (29.871)	Top-5 acc 56.641 (53.223)	lr 0.02497
Train [3][1590/3239]	Time 0.499 (0.797)	Data Time 0.023 (0.015)	Loss 3.9370 (4.0600)	Entropy 1.87417 (1.88155)	Top-1 acc 28.516 (29.865)	Top-5 acc 57.031 (53.227)	lr 0.02497
Train [3][1600/3239]	Time 0.412 (0.796)	Data Time 0.001 (0.015)	Loss 3.8621 (4.0595)	Entropy 1.87404 (1.88151)	Top-1 acc 34.375 (29.871)	Top-5 acc 60.156 (53.242)	lr 0.02497
Train [3][1610/3239]	Time 0.524 (0.796)	Data Time 0.001 (0.015)	Loss 3.9957 (4.0593)	Entropy 1.87392 (1.88146)	Top-1 acc 30.469 (29.873)	Top-5 acc 55.469 (53.249)	lr 0.02497
Train [3][1620/3239]	Time 0.548 (0.796)	Data Time 0.001 (0.015)	Loss 4.0524 (4.0597)	Entropy 1.87383 (1.88141)	Top-1 acc 29.297 (29.869)	Top-5 acc 52.344 (53.238)	lr 0.02497
Train [3][1630/3239]	Time 0.363 (0.795)	Data Time 0.001 (0.014)	Loss 3.9673 (4.0597)	Entropy 1.87380 (1.88137)	Top-1 acc 28.516 (29.864)	Top-5 acc 51.172 (53.231)	lr 0.02497
Train [3][1640/3239]	Time 0.641 (0.795)	Data Time 0.001 (0.014)	Loss 3.9875 (4.0596)	Entropy 1.87378 (1.88132)	Top-1 acc 31.250 (29.869)	Top-5 acc 53.906 (53.235)	lr 0.02497
Train [3][1650/3239]	Time 0.530 (0.795)	Data Time 0.001 (0.014)	Loss 3.9845 (4.0597)	Entropy 1.87366 (1.88127)	Top-1 acc 31.641 (29.866)	Top-5 acc 58.203 (53.227)	lr 0.02497
Train [3][1660/3239]	Time 0.548 (0.795)	Data Time 0.001 (0.014)	Loss 3.8535 (4.0595)	Entropy 1.87358 (1.88123)	Top-1 acc 33.984 (29.864)	Top-5 acc 57.812 (53.227)	lr 0.02497
Train [3][1670/3239]	Time 0.494 (0.795)	Data Time 0.001 (0.014)	Loss 4.1197 (4.0597)	Entropy 1.87347 (1.88118)	Top-1 acc 25.000 (29.856)	Top-5 acc 53.516 (53.219)	lr 0.02497
Train [3][1680/3239]	Time 0.472 (0.794)	Data Time 0.001 (0.014)	Loss 4.1295 (4.0599)	Entropy 1.87341 (1.88114)	Top-1 acc 31.250 (29.850)	Top-5 acc 50.391 (53.209)	lr 0.02497
Train [3][1690/3239]	Time 0.495 (0.794)	Data Time 0.001 (0.014)	Loss 3.9564 (4.0600)	Entropy 1.87329 (1.88109)	Top-1 acc 32.031 (29.850)	Top-5 acc 55.469 (53.210)	lr 0.02497
Train [3][1700/3239]	Time 0.475 (0.794)	Data Time 0.001 (0.014)	Loss 3.9798 (4.0598)	Entropy 1.87322 (1.88104)	Top-1 acc 34.766 (29.854)	Top-5 acc 55.078 (53.213)	lr 0.02497
Train [3][1710/3239]	Time 0.498 (0.794)	Data Time 0.001 (0.014)	Loss 4.3716 (4.0597)	Entropy 1.87314 (1.88100)	Top-1 acc 26.562 (29.858)	Top-5 acc 47.266 (53.217)	lr 0.02497
Train [3][1720/3239]	Time 0.591 (0.794)	Data Time 0.001 (0.014)	Loss 4.0237 (4.0597)	Entropy 1.87310 (1.88095)	Top-1 acc 30.859 (29.858)	Top-5 acc 54.688 (53.217)	lr 0.02497
Train [3][1730/3239]	Time 0.592 (0.794)	Data Time 0.002 (0.014)	Loss 4.1875 (4.0594)	Entropy 1.87300 (1.88091)	Top-1 acc 31.250 (29.866)	Top-5 acc 53.125 (53.218)	lr 0.02497
Train [3][1740/3239]	Time 0.506 (0.794)	Data Time 0.001 (0.014)	Loss 3.8394 (4.0594)	Entropy 1.87293 (1.88086)	Top-1 acc 32.812 (29.863)	Top-5 acc 55.078 (53.219)	lr 0.02497
Train [3][1750/3239]	Time 0.623 (0.793)	Data Time 0.001 (0.014)	Loss 4.1691 (4.0596)	Entropy 1.87286 (1.88082)	Top-1 acc 29.297 (29.858)	Top-5 acc 49.219 (53.212)	lr 0.02497
Train [3][1760/3239]	Time 0.575 (0.793)	Data Time 0.001 (0.014)	Loss 3.9340 (4.0596)	Entropy 1.87275 (1.88077)	Top-1 acc 35.938 (29.857)	Top-5 acc 56.250 (53.208)	lr 0.02497
Train [3][1770/3239]	Time 0.526 (0.793)	Data Time 0.001 (0.014)	Loss 4.0256 (4.0597)	Entropy 1.87274 (1.88073)	Top-1 acc 31.641 (29.854)	Top-5 acc 55.859 (53.204)	lr 0.02497
Train [3][1780/3239]	Time 0.287 (0.793)	Data Time 0.001 (0.014)	Loss 4.0475 (4.0595)	Entropy 1.87260 (1.88068)	Top-1 acc 29.688 (29.859)	Top-5 acc 51.172 (53.206)	lr 0.02497
Train [3][1790/3239]	Time 0.537 (0.792)	Data Time 0.001 (0.014)	Loss 4.1410 (4.0595)	Entropy 1.87251 (1.88064)	Top-1 acc 30.469 (29.859)	Top-5 acc 51.953 (53.207)	lr 0.02497
Train [3][1800/3239]	Time 0.500 (0.792)	Data Time 0.001 (0.013)	Loss 3.8994 (4.0595)	Entropy 1.87241 (1.88059)	Top-1 acc 31.641 (29.860)	Top-5 acc 57.812 (53.211)	lr 0.02497
Train [3][1810/3239]	Time 0.379 (0.791)	Data Time 0.001 (0.013)	Loss 3.9460 (4.0591)	Entropy 1.87227 (1.88054)	Top-1 acc 33.984 (29.870)	Top-5 acc 56.641 (53.222)	lr 0.02497
Train [3][1820/3239]	Time 0.471 (0.791)	Data Time 0.001 (0.013)	Loss 4.1185 (4.0587)	Entropy 1.87213 (1.88050)	Top-1 acc 28.125 (29.876)	Top-5 acc 51.953 (53.232)	lr 0.02497
Train [3][1830/3239]	Time 0.413 (0.791)	Data Time 0.001 (0.013)	Loss 4.2801 (4.0588)	Entropy 1.87209 (1.88045)	Top-1 acc 23.828 (29.869)	Top-5 acc 43.750 (53.228)	lr 0.02497
Train [3][1840/3239]	Time 0.348 (0.791)	Data Time 0.001 (0.013)	Loss 4.1545 (4.0590)	Entropy 1.87198 (1.88041)	Top-1 acc 28.906 (29.866)	Top-5 acc 50.391 (53.225)	lr 0.02497
Train [3][1850/3239]	Time 0.550 (0.791)	Data Time 0.001 (0.013)	Loss 4.1916 (4.0589)	Entropy 1.87194 (1.88036)	Top-1 acc 28.906 (29.866)	Top-5 acc 49.609 (53.229)	lr 0.02497
Train [3][1860/3239]	Time 0.640 (0.791)	Data Time 0.001 (0.013)	Loss 4.1254 (4.0586)	Entropy 1.87184 (1.88032)	Top-1 acc 24.609 (29.872)	Top-5 acc 50.781 (53.235)	lr 0.02497
Train [3][1870/3239]	Time 0.538 (0.790)	Data Time 0.001 (0.013)	Loss 4.0764 (4.0581)	Entropy 1.87174 (1.88027)	Top-1 acc 31.250 (29.878)	Top-5 acc 48.828 (53.242)	lr 0.02497
Train [3][1880/3239]	Time 0.562 (0.790)	Data Time 0.001 (0.013)	Loss 4.0902 (4.0579)	Entropy 1.87160 (1.88023)	Top-1 acc 30.469 (29.884)	Top-5 acc 52.344 (53.242)	lr 0.02497
Train [3][1890/3239]	Time 0.595 (0.790)	Data Time 0.002 (0.013)	Loss 3.9007 (4.0577)	Entropy 1.87156 (1.88018)	Top-1 acc 32.422 (29.883)	Top-5 acc 57.031 (53.240)	lr 0.02497
Train [3][1900/3239]	Time 0.506 (0.790)	Data Time 0.001 (0.013)	Loss 4.0186 (4.0576)	Entropy 1.87144 (1.88013)	Top-1 acc 29.297 (29.882)	Top-5 acc 54.297 (53.245)	lr 0.02497
Train [3][1910/3239]	Time 0.396 (0.790)	Data Time 0.001 (0.013)	Loss 4.0488 (4.0576)	Entropy 1.87126 (1.88009)	Top-1 acc 30.469 (29.885)	Top-5 acc 52.344 (53.244)	lr 0.02497
Train [3][1920/3239]	Time 0.483 (0.790)	Data Time 0.001 (0.013)	Loss 4.0614 (4.0577)	Entropy 1.87122 (1.88004)	Top-1 acc 28.125 (29.891)	Top-5 acc 54.688 (53.247)	lr 0.02497
Train [3][1930/3239]	Time 0.531 (0.789)	Data Time 0.001 (0.013)	Loss 4.3547 (4.0580)	Entropy 1.87111 (1.88000)	Top-1 acc 26.172 (29.890)	Top-5 acc 48.047 (53.245)	lr 0.02497
Train [3][1940/3239]	Time 0.576 (0.789)	Data Time 0.001 (0.013)	Loss 3.9311 (4.0577)	Entropy 1.87102 (1.87995)	Top-1 acc 30.078 (29.894)	Top-5 acc 53.906 (53.249)	lr 0.02497
Train [3][1950/3239]	Time 0.363 (0.789)	Data Time 0.001 (0.013)	Loss 4.2074 (4.0576)	Entropy 1.87088 (1.87990)	Top-1 acc 28.516 (29.896)	Top-5 acc 51.562 (53.250)	lr 0.02497
Train [3][1960/3239]	Time 0.577 (0.789)	Data Time 0.001 (0.013)	Loss 3.8113 (4.0571)	Entropy 1.87078 (1.87986)	Top-1 acc 33.594 (29.905)	Top-5 acc 57.031 (53.263)	lr 0.02497
Train [3][1970/3239]	Time 0.480 (0.789)	Data Time 0.001 (0.013)	Loss 4.0782 (4.0569)	Entropy 1.87080 (1.87981)	Top-1 acc 28.516 (29.904)	Top-5 acc 55.078 (53.262)	lr 0.02497
Train [3][1980/3239]	Time 0.250 (0.788)	Data Time 0.001 (0.013)	Loss 3.9875 (4.0571)	Entropy 1.87073 (1.87977)	Top-1 acc 29.688 (29.903)	Top-5 acc 52.344 (53.257)	lr 0.02497
Train [3][1990/3239]	Time 0.577 (0.788)	Data Time 0.002 (0.013)	Loss 3.8976 (4.0568)	Entropy 1.87066 (1.87972)	Top-1 acc 34.766 (29.905)	Top-5 acc 57.812 (53.269)	lr 0.02497
Train [3][2000/3239]	Time 0.522 (0.788)	Data Time 0.001 (0.013)	Loss 3.9797 (4.0569)	Entropy 1.87053 (1.87968)	Top-1 acc 30.469 (29.903)	Top-5 acc 57.031 (53.271)	lr 0.02497
Train [3][2010/3239]	Time 0.407 (0.795)	Data Time 0.002 (0.013)	Loss 4.0335 (4.0568)	Entropy 1.87047 (1.87963)	Top-1 acc 29.688 (29.909)	Top-5 acc 52.344 (53.270)	lr 0.02497
Train [3][2020/3239]	Time 0.693 (0.795)	Data Time 0.002 (0.013)	Loss 4.0578 (4.0567)	Entropy 1.87044 (1.87958)	Top-1 acc 28.125 (29.914)	Top-5 acc 52.344 (53.276)	lr 0.02497
Train [3][2030/3239]	Time 0.434 (0.795)	Data Time 0.001 (0.013)	Loss 4.0058 (4.0565)	Entropy 1.87039 (1.87954)	Top-1 acc 32.031 (29.915)	Top-5 acc 53.516 (53.280)	lr 0.02497
Train [3][2040/3239]	Time 0.406 (0.795)	Data Time 0.001 (0.013)	Loss 3.9095 (4.0565)	Entropy 1.87027 (1.87949)	Top-1 acc 33.984 (29.916)	Top-5 acc 58.203 (53.286)	lr 0.02497
Train [3][2050/3239]	Time 0.446 (0.795)	Data Time 0.023 (0.013)	Loss 4.1101 (4.0563)	Entropy 1.87014 (1.87945)	Top-1 acc 29.688 (29.918)	Top-5 acc 53.125 (53.293)	lr 0.02497
Train [3][2060/3239]	Time 0.543 (0.795)	Data Time 0.001 (0.013)	Loss 4.0867 (4.0562)	Entropy 1.87009 (1.87940)	Top-1 acc 29.297 (29.922)	Top-5 acc 54.297 (53.300)	lr 0.02497
Train [3][2070/3239]	Time 0.482 (0.795)	Data Time 0.002 (0.013)	Loss 4.0613 (4.0564)	Entropy 1.86999 (1.87936)	Top-1 acc 30.078 (29.918)	Top-5 acc 54.688 (53.299)	lr 0.02497
Train [3][2080/3239]	Time 0.529 (0.795)	Data Time 0.001 (0.013)	Loss 4.0566 (4.0563)	Entropy 1.86982 (1.87931)	Top-1 acc 27.344 (29.923)	Top-5 acc 49.609 (53.297)	lr 0.02497
Train [3][2090/3239]	Time 0.551 (0.794)	Data Time 0.001 (0.012)	Loss 4.1164 (4.0565)	Entropy 1.86962 (1.87927)	Top-1 acc 27.344 (29.921)	Top-5 acc 52.344 (53.291)	lr 0.02497
Train [3][2100/3239]	Time 0.511 (0.794)	Data Time 0.001 (0.012)	Loss 4.1622 (4.0564)	Entropy 1.86956 (1.87922)	Top-1 acc 29.688 (29.924)	Top-5 acc 51.172 (53.294)	lr 0.02497
Train [3][2110/3239]	Time 0.478 (0.794)	Data Time 0.001 (0.012)	Loss 4.2431 (4.0562)	Entropy 1.86944 (1.87918)	Top-1 acc 29.688 (29.927)	Top-5 acc 49.219 (53.295)	lr 0.02497
Train [3][2120/3239]	Time 0.503 (0.793)	Data Time 0.001 (0.012)	Loss 3.9931 (4.0564)	Entropy 1.86934 (1.87913)	Top-1 acc 27.734 (29.918)	Top-5 acc 57.812 (53.290)	lr 0.02497
Train [3][2130/3239]	Time 0.661 (0.793)	Data Time 0.001 (0.012)	Loss 3.7989 (4.0563)	Entropy 1.86924 (1.87908)	Top-1 acc 34.375 (29.922)	Top-5 acc 57.422 (53.293)	lr 0.02497
Train [3][2140/3239]	Time 0.527 (0.793)	Data Time 0.001 (0.012)	Loss 3.8813 (4.0563)	Entropy 1.86923 (1.87904)	Top-1 acc 31.641 (29.923)	Top-5 acc 56.250 (53.293)	lr 0.02497
Train [3][2150/3239]	Time 0.496 (0.793)	Data Time 0.001 (0.012)	Loss 3.9221 (4.0562)	Entropy 1.86921 (1.87899)	Top-1 acc 31.641 (29.926)	Top-5 acc 57.422 (53.289)	lr 0.02497
Train [3][2160/3239]	Time 0.504 (0.793)	Data Time 0.001 (0.012)	Loss 4.1647 (4.0561)	Entropy 1.86917 (1.87895)	Top-1 acc 26.562 (29.925)	Top-5 acc 50.000 (53.291)	lr 0.02497
Train [3][2170/3239]	Time 0.463 (0.793)	Data Time 0.001 (0.012)	Loss 3.9438 (4.0563)	Entropy 1.86901 (1.87890)	Top-1 acc 30.859 (29.924)	Top-5 acc 53.125 (53.290)	lr 0.02497
Train [3][2180/3239]	Time 0.533 (0.793)	Data Time 0.002 (0.012)	Loss 4.0096 (4.0563)	Entropy 1.86895 (1.87886)	Top-1 acc 31.250 (29.927)	Top-5 acc 58.594 (53.294)	lr 0.02497
Train [3][2190/3239]	Time 0.476 (0.793)	Data Time 0.002 (0.012)	Loss 3.9231 (4.0561)	Entropy 1.86890 (1.87881)	Top-1 acc 32.812 (29.928)	Top-5 acc 57.812 (53.299)	lr 0.02497
Train [3][2200/3239]	Time 0.568 (0.792)	Data Time 0.001 (0.012)	Loss 4.0110 (4.0560)	Entropy 1.86886 (1.87877)	Top-1 acc 31.250 (29.929)	Top-5 acc 52.344 (53.301)	lr 0.02497
Train [3][2210/3239]	Time 0.587 (0.792)	Data Time 0.001 (0.012)	Loss 4.0586 (4.0560)	Entropy 1.86871 (1.87872)	Top-1 acc 28.516 (29.926)	Top-5 acc 51.562 (53.300)	lr 0.02497
Train [3][2220/3239]	Time 0.487 (0.792)	Data Time 0.001 (0.012)	Loss 4.1059 (4.0561)	Entropy 1.86858 (1.87868)	Top-1 acc 32.031 (29.923)	Top-5 acc 53.906 (53.298)	lr 0.02497
Train [3][2230/3239]	Time 0.504 (0.792)	Data Time 0.001 (0.012)	Loss 3.9128 (4.0559)	Entropy 1.86851 (1.87863)	Top-1 acc 31.250 (29.927)	Top-5 acc 53.906 (53.302)	lr 0.02497
Train [3][2240/3239]	Time 0.521 (0.792)	Data Time 0.001 (0.012)	Loss 4.2095 (4.0556)	Entropy 1.86838 (1.87858)	Top-1 acc 26.562 (29.928)	Top-5 acc 52.734 (53.305)	lr 0.02497
Train [3][2250/3239]	Time 0.525 (0.792)	Data Time 0.001 (0.012)	Loss 4.1248 (4.0552)	Entropy 1.86828 (1.87854)	Top-1 acc 31.250 (29.938)	Top-5 acc 50.781 (53.312)	lr 0.02497
Train [3][2260/3239]	Time 0.574 (0.792)	Data Time 0.001 (0.012)	Loss 4.1230 (4.0554)	Entropy 1.86825 (1.87849)	Top-1 acc 28.906 (29.935)	Top-5 acc 52.344 (53.307)	lr 0.02497
Train [3][2270/3239]	Time 0.534 (0.791)	Data Time 0.002 (0.012)	Loss 4.2895 (4.0553)	Entropy 1.86813 (1.87845)	Top-1 acc 30.078 (29.942)	Top-5 acc 48.828 (53.314)	lr 0.02497
Train [3][2280/3239]	Time 0.407 (0.791)	Data Time 0.002 (0.012)	Loss 4.0621 (4.0553)	Entropy 1.86799 (1.87840)	Top-1 acc 31.250 (29.936)	Top-5 acc 53.516 (53.316)	lr 0.02497
Train [3][2290/3239]	Time 0.681 (0.791)	Data Time 0.001 (0.012)	Loss 4.0920 (4.0553)	Entropy 1.86778 (1.87836)	Top-1 acc 32.031 (29.937)	Top-5 acc 53.125 (53.313)	lr 0.02497
Train [3][2300/3239]	Time 0.485 (0.791)	Data Time 0.001 (0.012)	Loss 3.9594 (4.0553)	Entropy 1.86764 (1.87831)	Top-1 acc 30.078 (29.939)	Top-5 acc 53.516 (53.314)	lr 0.02497
Train [3][2310/3239]	Time 0.532 (0.790)	Data Time 0.001 (0.012)	Loss 4.0230 (4.0553)	Entropy 1.86745 (1.87826)	Top-1 acc 31.250 (29.939)	Top-5 acc 51.172 (53.317)	lr 0.02497
Train [3][2320/3239]	Time 0.384 (0.790)	Data Time 0.001 (0.011)	Loss 3.9693 (4.0552)	Entropy 1.86734 (1.87822)	Top-1 acc 32.031 (29.944)	Top-5 acc 56.250 (53.319)	lr 0.02497
Train [3][2330/3239]	Time 0.474 (0.790)	Data Time 0.001 (0.011)	Loss 4.0861 (4.0553)	Entropy 1.86720 (1.87817)	Top-1 acc 30.078 (29.945)	Top-5 acc 48.828 (53.320)	lr 0.02497
Train [3][2340/3239]	Time 0.442 (0.790)	Data Time 0.001 (0.011)	Loss 3.8229 (4.0550)	Entropy 1.86711 (1.87812)	Top-1 acc 35.547 (29.952)	Top-5 acc 55.859 (53.324)	lr 0.02497
Train [3][2350/3239]	Time 0.496 (0.790)	Data Time 0.001 (0.011)	Loss 4.1091 (4.0548)	Entropy 1.86708 (1.87808)	Top-1 acc 28.125 (29.957)	Top-5 acc 52.344 (53.328)	lr 0.02497
Train [3][2360/3239]	Time 0.613 (0.790)	Data Time 0.001 (0.011)	Loss 4.2392 (4.0550)	Entropy 1.86698 (1.87803)	Top-1 acc 26.562 (29.957)	Top-5 acc 50.781 (53.326)	lr 0.02497
Train [3][2370/3239]	Time 0.637 (0.790)	Data Time 0.001 (0.011)	Loss 4.1863 (4.0550)	Entropy 1.86690 (1.87798)	Top-1 acc 28.516 (29.954)	Top-5 acc 51.953 (53.325)	lr 0.02497
Train [3][2380/3239]	Time 0.537 (0.790)	Data Time 0.001 (0.011)	Loss 3.9880 (4.0550)	Entropy 1.86674 (1.87794)	Top-1 acc 30.859 (29.955)	Top-5 acc 55.078 (53.324)	lr 0.02497
Train [3][2390/3239]	Time 0.412 (0.790)	Data Time 0.001 (0.011)	Loss 3.8813 (4.0547)	Entropy 1.86664 (1.87789)	Top-1 acc 34.375 (29.960)	Top-5 acc 57.031 (53.326)	lr 0.02497
Train [3][2400/3239]	Time 0.536 (0.790)	Data Time 0.001 (0.011)	Loss 3.8276 (4.0547)	Entropy 1.86654 (1.87784)	Top-1 acc 33.984 (29.965)	Top-5 acc 60.156 (53.323)	lr 0.02497
Train [3][2410/3239]	Time 0.530 (0.790)	Data Time 0.001 (0.011)	Loss 4.2139 (4.0550)	Entropy 1.86649 (1.87780)	Top-1 acc 25.781 (29.963)	Top-5 acc 49.219 (53.318)	lr 0.02497
Train [3][2420/3239]	Time 0.549 (0.789)	Data Time 0.001 (0.011)	Loss 4.0859 (4.0547)	Entropy 1.86631 (1.87775)	Top-1 acc 31.250 (29.968)	Top-5 acc 50.391 (53.325)	lr 0.02497
Train [3][2430/3239]	Time 0.575 (0.789)	Data Time 0.001 (0.011)	Loss 4.2038 (4.0547)	Entropy 1.86624 (1.87770)	Top-1 acc 26.172 (29.967)	Top-5 acc 49.609 (53.325)	lr 0.02497
Train [3][2440/3239]	Time 0.547 (0.789)	Data Time 0.001 (0.011)	Loss 4.1586 (4.0547)	Entropy 1.86604 (1.87765)	Top-1 acc 26.562 (29.972)	Top-5 acc 48.828 (53.328)	lr 0.02497
Train [3][2450/3239]	Time 0.462 (0.789)	Data Time 0.001 (0.011)	Loss 4.0282 (4.0546)	Entropy 1.86595 (1.87761)	Top-1 acc 30.469 (29.970)	Top-5 acc 54.297 (53.332)	lr 0.02497
Train [3][2460/3239]	Time 0.553 (0.789)	Data Time 0.001 (0.011)	Loss 4.0154 (4.0546)	Entropy 1.86584 (1.87756)	Top-1 acc 34.766 (29.974)	Top-5 acc 55.469 (53.331)	lr 0.02497
Train [3][2470/3239]	Time 0.493 (0.788)	Data Time 0.001 (0.011)	Loss 3.9318 (4.0543)	Entropy 1.86568 (1.87751)	Top-1 acc 30.859 (29.979)	Top-5 acc 57.031 (53.339)	lr 0.02497
Train [3][2480/3239]	Time 0.539 (0.788)	Data Time 0.001 (0.011)	Loss 3.9309 (4.0544)	Entropy 1.86558 (1.87746)	Top-1 acc 28.125 (29.974)	Top-5 acc 53.906 (53.336)	lr 0.02497
Train [3][2490/3239]	Time 0.508 (0.788)	Data Time 0.001 (0.011)	Loss 4.0019 (4.0542)	Entropy 1.86551 (1.87742)	Top-1 acc 30.859 (29.980)	Top-5 acc 54.297 (53.340)	lr 0.02497
Train [3][2500/3239]	Time 0.461 (0.788)	Data Time 0.001 (0.011)	Loss 3.9999 (4.0541)	Entropy 1.86540 (1.87737)	Top-1 acc 32.422 (29.984)	Top-5 acc 54.297 (53.343)	lr 0.02497
Train [3][2510/3239]	Time 0.378 (0.788)	Data Time 0.001 (0.011)	Loss 4.1892 (4.0540)	Entropy 1.86526 (1.87732)	Top-1 acc 31.250 (29.985)	Top-5 acc 52.734 (53.344)	lr 0.02497
Train [3][2520/3239]	Time 0.549 (0.788)	Data Time 0.001 (0.011)	Loss 4.0112 (4.0542)	Entropy 1.86515 (1.87727)	Top-1 acc 27.344 (29.980)	Top-5 acc 53.906 (53.338)	lr 0.02497
Train [3][2530/3239]	Time 0.656 (0.788)	Data Time 0.001 (0.011)	Loss 4.2159 (4.0541)	Entropy 1.86506 (1.87722)	Top-1 acc 31.250 (29.990)	Top-5 acc 51.953 (53.344)	lr 0.02497
Train [3][2540/3239]	Time 0.506 (0.788)	Data Time 0.001 (0.011)	Loss 3.9439 (4.0540)	Entropy 1.86492 (1.87718)	Top-1 acc 33.594 (29.991)	Top-5 acc 57.422 (53.350)	lr 0.02497
Train [3][2550/3239]	Time 0.493 (0.788)	Data Time 0.001 (0.011)	Loss 3.9165 (4.0538)	Entropy 1.86482 (1.87713)	Top-1 acc 29.297 (29.994)	Top-5 acc 53.906 (53.351)	lr 0.02497
Train [3][2560/3239]	Time 0.500 (0.788)	Data Time 0.001 (0.011)	Loss 3.9380 (4.0536)	Entropy 1.86469 (1.87708)	Top-1 acc 28.516 (29.996)	Top-5 acc 55.469 (53.360)	lr 0.02497
Train [3][2570/3239]	Time 0.492 (0.788)	Data Time 0.001 (0.011)	Loss 4.1054 (4.0535)	Entropy 1.86455 (1.87703)	Top-1 acc 27.344 (30.000)	Top-5 acc 51.172 (53.364)	lr 0.02497
Train [3][2580/3239]	Time 0.543 (0.788)	Data Time 0.001 (0.011)	Loss 3.9779 (4.0533)	Entropy 1.86446 (1.87698)	Top-1 acc 31.250 (30.003)	Top-5 acc 52.734 (53.365)	lr 0.02497
Train [3][2590/3239]	Time 0.399 (0.788)	Data Time 0.002 (0.011)	Loss 4.2448 (4.0531)	Entropy 1.86434 (1.87693)	Top-1 acc 27.344 (30.004)	Top-5 acc 49.609 (53.365)	lr 0.02497
Train [3][2600/3239]	Time 0.533 (0.787)	Data Time 0.002 (0.011)	Loss 4.0662 (4.0531)	Entropy 1.86418 (1.87689)	Top-1 acc 29.297 (30.001)	Top-5 acc 52.344 (53.370)	lr 0.02497
Train [3][2610/3239]	Time 0.485 (0.787)	Data Time 0.001 (0.011)	Loss 4.1698 (4.0531)	Entropy 1.86409 (1.87684)	Top-1 acc 33.984 (30.008)	Top-5 acc 51.953 (53.369)	lr 0.02497
Train [3][2620/3239]	Time 0.550 (0.787)	Data Time 0.003 (0.011)	Loss 4.0448 (4.0528)	Entropy 1.86396 (1.87679)	Top-1 acc 28.125 (30.012)	Top-5 acc 55.469 (53.374)	lr 0.02497
Train [3][2630/3239]	Time 0.441 (0.787)	Data Time 0.001 (0.011)	Loss 4.2950 (4.0528)	Entropy 1.86384 (1.87674)	Top-1 acc 25.391 (30.012)	Top-5 acc 49.219 (53.375)	lr 0.02497
Train [3][2640/3239]	Time 0.607 (0.787)	Data Time 0.001 (0.011)	Loss 4.0033 (4.0530)	Entropy 1.86380 (1.87669)	Top-1 acc 29.297 (30.011)	Top-5 acc 53.125 (53.372)	lr 0.02497
Train [3][2650/3239]	Time 0.509 (0.787)	Data Time 0.001 (0.011)	Loss 4.1158 (4.0528)	Entropy 1.86364 (1.87664)	Top-1 acc 29.688 (30.014)	Top-5 acc 48.438 (53.377)	lr 0.02497
Train [3][2660/3239]	Time 0.676 (0.792)	Data Time 0.006 (0.011)	Loss 4.0124 (4.0530)	Entropy 1.86359 (1.87659)	Top-1 acc 30.469 (30.007)	Top-5 acc 57.031 (53.373)	lr 0.02497
Train [3][2670/3239]	Time 0.534 (0.792)	Data Time 0.002 (0.011)	Loss 4.1980 (4.0530)	Entropy 1.86348 (1.87654)	Top-1 acc 30.859 (30.010)	Top-5 acc 49.219 (53.377)	lr 0.02497
Train [3][2680/3239]	Time 0.422 (0.792)	Data Time 0.001 (0.010)	Loss 4.1559 (4.0528)	Entropy 1.86340 (1.87650)	Top-1 acc 30.078 (30.016)	Top-5 acc 52.734 (53.382)	lr 0.02497
Train [3][2690/3239]	Time 0.532 (0.792)	Data Time 0.001 (0.011)	Loss 4.1677 (4.0530)	Entropy 1.86331 (1.87645)	Top-1 acc 29.688 (30.018)	Top-5 acc 49.219 (53.378)	lr 0.02497
Train [3][2700/3239]	Time 0.540 (0.792)	Data Time 0.001 (0.010)	Loss 4.0934 (4.0529)	Entropy 1.86316 (1.87640)	Top-1 acc 29.297 (30.021)	Top-5 acc 51.172 (53.381)	lr 0.02497
Train [3][2710/3239]	Time 0.532 (0.792)	Data Time 0.001 (0.010)	Loss 3.9499 (4.0529)	Entropy 1.86297 (1.87635)	Top-1 acc 30.078 (30.020)	Top-5 acc 50.391 (53.379)	lr 0.02497
Train [3][2720/3239]	Time 0.610 (0.792)	Data Time 0.001 (0.010)	Loss 4.2187 (4.0532)	Entropy 1.86284 (1.87630)	Top-1 acc 26.562 (30.011)	Top-5 acc 48.828 (53.375)	lr 0.02497
Train [3][2730/3239]	Time 0.559 (0.792)	Data Time 0.002 (0.010)	Loss 4.2528 (4.0532)	Entropy 1.86280 (1.87625)	Top-1 acc 25.000 (30.007)	Top-5 acc 48.047 (53.374)	lr 0.02497
Train [3][2740/3239]	Time 0.264 (0.792)	Data Time 0.001 (0.010)	Loss 3.8700 (4.0531)	Entropy 1.86272 (1.87620)	Top-1 acc 35.156 (30.010)	Top-5 acc 55.078 (53.373)	lr 0.02497
Train [3][2750/3239]	Time 0.237 (0.791)	Data Time 0.001 (0.010)	Loss 4.0306 (4.0530)	Entropy 1.86259 (1.87615)	Top-1 acc 28.516 (30.011)	Top-5 acc 50.781 (53.379)	lr 0.02497
Train [3][2760/3239]	Time 0.535 (0.791)	Data Time 0.001 (0.010)	Loss 3.9755 (4.0528)	Entropy 1.86244 (1.87610)	Top-1 acc 32.422 (30.012)	Top-5 acc 51.953 (53.379)	lr 0.02497
Train [3][2770/3239]	Time 0.498 (0.791)	Data Time 0.003 (0.010)	Loss 3.9334 (4.0526)	Entropy 1.86237 (1.87605)	Top-1 acc 31.641 (30.015)	Top-5 acc 55.078 (53.382)	lr 0.02497
Train [3][2780/3239]	Time 0.495 (0.791)	Data Time 0.001 (0.010)	Loss 4.0432 (4.0525)	Entropy 1.86215 (1.87600)	Top-1 acc 32.812 (30.019)	Top-5 acc 53.516 (53.388)	lr 0.02497
Train [3][2790/3239]	Time 0.543 (0.791)	Data Time 0.001 (0.010)	Loss 3.9057 (4.0523)	Entropy 1.86203 (1.87595)	Top-1 acc 29.688 (30.022)	Top-5 acc 57.031 (53.389)	lr 0.02496
Train [3][2800/3239]	Time 0.548 (0.791)	Data Time 0.001 (0.010)	Loss 4.0308 (4.0522)	Entropy 1.86189 (1.87590)	Top-1 acc 32.031 (30.025)	Top-5 acc 56.250 (53.394)	lr 0.02496
Train [3][2810/3239]	Time 0.522 (0.791)	Data Time 0.001 (0.010)	Loss 4.2792 (4.0521)	Entropy 1.86180 (1.87585)	Top-1 acc 31.250 (30.027)	Top-5 acc 50.781 (53.398)	lr 0.02496
Train [3][2820/3239]	Time 0.494 (0.791)	Data Time 0.003 (0.010)	Loss 4.4105 (4.0521)	Entropy 1.86170 (1.87580)	Top-1 acc 23.047 (30.019)	Top-5 acc 47.656 (53.396)	lr 0.02496
Train [3][2830/3239]	Time 0.508 (0.791)	Data Time 0.001 (0.010)	Loss 3.9063 (4.0518)	Entropy 1.86163 (1.87575)	Top-1 acc 33.594 (30.025)	Top-5 acc 58.203 (53.402)	lr 0.02496
Train [3][2840/3239]	Time 0.578 (0.791)	Data Time 0.001 (0.010)	Loss 3.9328 (4.0517)	Entropy 1.86155 (1.87570)	Top-1 acc 30.078 (30.025)	Top-5 acc 52.344 (53.399)	lr 0.02496
Train [3][2850/3239]	Time 0.624 (0.791)	Data Time 0.001 (0.010)	Loss 3.9760 (4.0517)	Entropy 1.86151 (1.87565)	Top-1 acc 32.031 (30.029)	Top-5 acc 55.859 (53.401)	lr 0.02496
Train [3][2860/3239]	Time 0.538 (0.790)	Data Time 0.001 (0.010)	Loss 3.9517 (4.0516)	Entropy 1.86139 (1.87561)	Top-1 acc 31.250 (30.026)	Top-5 acc 53.125 (53.400)	lr 0.02496
Train [3][2870/3239]	Time 0.519 (0.790)	Data Time 0.001 (0.010)	Loss 4.0107 (4.0516)	Entropy 1.86129 (1.87556)	Top-1 acc 30.078 (30.023)	Top-5 acc 58.203 (53.398)	lr 0.02496
Train [3][2880/3239]	Time 0.485 (0.790)	Data Time 0.001 (0.010)	Loss 4.1568 (4.0518)	Entropy 1.86116 (1.87551)	Top-1 acc 26.562 (30.022)	Top-5 acc 51.953 (53.392)	lr 0.02496
Train [3][2890/3239]	Time 0.552 (0.790)	Data Time 0.001 (0.010)	Loss 4.0612 (4.0517)	Entropy 1.86105 (1.87546)	Top-1 acc 27.734 (30.025)	Top-5 acc 55.859 (53.395)	lr 0.02496
Train [3][2900/3239]	Time 0.530 (0.790)	Data Time 0.001 (0.010)	Loss 4.1233 (4.0518)	Entropy 1.86098 (1.87541)	Top-1 acc 27.734 (30.019)	Top-5 acc 48.828 (53.389)	lr 0.02496
Train [3][2910/3239]	Time 0.514 (0.790)	Data Time 0.001 (0.010)	Loss 4.1321 (4.0519)	Entropy 1.86080 (1.87536)	Top-1 acc 27.734 (30.017)	Top-5 acc 49.219 (53.390)	lr 0.02496
Train [3][2920/3239]	Time 0.476 (0.790)	Data Time 0.001 (0.010)	Loss 4.3359 (4.0520)	Entropy 1.86064 (1.87531)	Top-1 acc 25.391 (30.018)	Top-5 acc 49.219 (53.394)	lr 0.02496
Train [3][2930/3239]	Time 0.705 (0.790)	Data Time 0.001 (0.010)	Loss 3.9777 (4.0519)	Entropy 1.86062 (1.87526)	Top-1 acc 28.516 (30.017)	Top-5 acc 55.078 (53.398)	lr 0.02496
Train [3][2940/3239]	Time 0.505 (0.790)	Data Time 0.001 (0.010)	Loss 4.0469 (4.0518)	Entropy 1.86043 (1.87521)	Top-1 acc 30.078 (30.018)	Top-5 acc 53.906 (53.396)	lr 0.02496
Train [3][2950/3239]	Time 0.483 (0.789)	Data Time 0.001 (0.010)	Loss 3.7851 (4.0517)	Entropy 1.86026 (1.87516)	Top-1 acc 37.500 (30.022)	Top-5 acc 61.328 (53.400)	lr 0.02496
Train [3][2960/3239]	Time 0.426 (0.789)	Data Time 0.001 (0.010)	Loss 4.0729 (4.0518)	Entropy 1.86017 (1.87511)	Top-1 acc 32.031 (30.016)	Top-5 acc 53.516 (53.401)	lr 0.02496
Train [3][2970/3239]	Time 0.346 (0.789)	Data Time 0.001 (0.010)	Loss 4.1189 (4.0519)	Entropy 1.86011 (1.87506)	Top-1 acc 32.031 (30.012)	Top-5 acc 50.391 (53.399)	lr 0.02496
Train [3][2980/3239]	Time 0.378 (0.789)	Data Time 0.001 (0.010)	Loss 4.0159 (4.0517)	Entropy 1.86006 (1.87501)	Top-1 acc 31.641 (30.017)	Top-5 acc 57.031 (53.404)	lr 0.02496
Train [3][2990/3239]	Time 0.493 (0.789)	Data Time 0.001 (0.010)	Loss 4.1263 (4.0517)	Entropy 1.86001 (1.87496)	Top-1 acc 27.734 (30.018)	Top-5 acc 51.562 (53.410)	lr 0.02496
Train [3][3000/3239]	Time 0.603 (0.789)	Data Time 0.001 (0.010)	Loss 4.1241 (4.0517)	Entropy 1.85997 (1.87491)	Top-1 acc 27.734 (30.015)	Top-5 acc 50.781 (53.406)	lr 0.02496
Train [3][3010/3239]	Time 0.522 (0.789)	Data Time 0.001 (0.010)	Loss 4.1883 (4.0517)	Entropy 1.85981 (1.87486)	Top-1 acc 29.688 (30.017)	Top-5 acc 48.828 (53.406)	lr 0.02496
Train [3][3020/3239]	Time 0.581 (0.789)	Data Time 0.001 (0.010)	Loss 4.0040 (4.0517)	Entropy 1.85980 (1.87481)	Top-1 acc 30.078 (30.017)	Top-5 acc 56.641 (53.407)	lr 0.02496
Train [3][3030/3239]	Time 0.531 (0.789)	Data Time 0.002 (0.010)	Loss 4.2866 (4.0515)	Entropy 1.85964 (1.87476)	Top-1 acc 26.172 (30.019)	Top-5 acc 49.609 (53.410)	lr 0.02496
Train [3][3040/3239]	Time 0.513 (0.789)	Data Time 0.001 (0.010)	Loss 3.9272 (4.0514)	Entropy 1.85956 (1.87471)	Top-1 acc 35.938 (30.022)	Top-5 acc 57.812 (53.415)	lr 0.02496
Train [3][3050/3239]	Time 0.610 (0.789)	Data Time 0.001 (0.010)	Loss 4.0927 (4.0514)	Entropy 1.85943 (1.87466)	Top-1 acc 29.688 (30.021)	Top-5 acc 51.172 (53.412)	lr 0.02496
Train [3][3060/3239]	Time 0.338 (0.789)	Data Time 0.001 (0.010)	Loss 3.9488 (4.0513)	Entropy 1.85936 (1.87461)	Top-1 acc 31.641 (30.024)	Top-5 acc 55.859 (53.415)	lr 0.02496
Train [3][3070/3239]	Time 0.492 (0.789)	Data Time 0.001 (0.010)	Loss 4.0743 (4.0512)	Entropy 1.85925 (1.87456)	Top-1 acc 29.688 (30.028)	Top-5 acc 54.297 (53.415)	lr 0.02496
Train [3][3080/3239]	Time 0.398 (0.788)	Data Time 0.001 (0.010)	Loss 4.0999 (4.0510)	Entropy 1.85908 (1.87451)	Top-1 acc 30.859 (30.031)	Top-5 acc 54.297 (53.422)	lr 0.02496
Train [3][3090/3239]	Time 0.474 (0.788)	Data Time 0.001 (0.010)	Loss 3.9561 (4.0508)	Entropy 1.85898 (1.87446)	Top-1 acc 30.859 (30.033)	Top-5 acc 54.688 (53.425)	lr 0.02496
Train [3][3100/3239]	Time 0.510 (0.788)	Data Time 0.001 (0.010)	Loss 3.9420 (4.0509)	Entropy 1.85890 (1.87441)	Top-1 acc 29.297 (30.028)	Top-5 acc 54.297 (53.420)	lr 0.02496
Train [3][3110/3239]	Time 0.545 (0.788)	Data Time 0.001 (0.010)	Loss 3.9629 (4.0509)	Entropy 1.85866 (1.87436)	Top-1 acc 32.031 (30.028)	Top-5 acc 54.688 (53.420)	lr 0.02496
Train [3][3120/3239]	Time 0.549 (0.788)	Data Time 0.001 (0.010)	Loss 4.1992 (4.0510)	Entropy 1.85857 (1.87431)	Top-1 acc 27.344 (30.027)	Top-5 acc 51.562 (53.418)	lr 0.02496
Train [3][3130/3239]	Time 0.535 (0.788)	Data Time 0.001 (0.010)	Loss 4.0697 (4.0509)	Entropy 1.85847 (1.87426)	Top-1 acc 29.297 (30.026)	Top-5 acc 53.516 (53.418)	lr 0.02496
Train [3][3140/3239]	Time 0.547 (0.788)	Data Time 0.001 (0.010)	Loss 4.1225 (4.0509)	Entropy 1.85833 (1.87421)	Top-1 acc 30.078 (30.024)	Top-5 acc 52.344 (53.418)	lr 0.02496
Train [3][3150/3239]	Time 0.536 (0.788)	Data Time 0.001 (0.010)	Loss 3.7835 (4.0509)	Entropy 1.85823 (1.87416)	Top-1 acc 37.500 (30.024)	Top-5 acc 60.156 (53.422)	lr 0.02496
Train [3][3160/3239]	Time 0.550 (0.788)	Data Time 0.001 (0.010)	Loss 4.2780 (4.0510)	Entropy 1.85815 (1.87410)	Top-1 acc 26.953 (30.023)	Top-5 acc 49.219 (53.419)	lr 0.02496
Train [3][3170/3239]	Time 0.485 (0.787)	Data Time 0.001 (0.009)	Loss 4.0605 (4.0510)	Entropy 1.85807 (1.87405)	Top-1 acc 27.344 (30.021)	Top-5 acc 58.594 (53.420)	lr 0.02496
Train [3][3180/3239]	Time 0.525 (0.787)	Data Time 0.000 (0.009)	Loss 3.9759 (4.0507)	Entropy 1.85800 (1.87400)	Top-1 acc 31.641 (30.025)	Top-5 acc 53.516 (53.429)	lr 0.02496
Train [3][3190/3239]	Time 0.394 (0.787)	Data Time 0.000 (0.009)	Loss 3.9556 (4.0506)	Entropy 1.85788 (1.87395)	Top-1 acc 31.250 (30.026)	Top-5 acc 56.250 (53.434)	lr 0.02496
Train [3][3200/3239]	Time 0.600 (0.787)	Data Time 0.000 (0.009)	Loss 4.2761 (4.0508)	Entropy 1.85773 (1.87390)	Top-1 acc 26.172 (30.023)	Top-5 acc 49.609 (53.431)	lr 0.02496
Train [3][3210/3239]	Time 0.508 (0.787)	Data Time 0.000 (0.009)	Loss 4.1351 (4.0506)	Entropy 1.85765 (1.87385)	Top-1 acc 31.641 (30.026)	Top-5 acc 54.688 (53.436)	lr 0.02496
Train [3][3220/3239]	Time 0.531 (0.787)	Data Time 0.000 (0.009)	Loss 3.9974 (4.0504)	Entropy 1.85757 (1.87380)	Top-1 acc 27.734 (30.022)	Top-5 acc 57.031 (53.442)	lr 0.02496
Train [3][3230/3239]	Time 0.402 (0.787)	Data Time 0.000 (0.009)	Loss 4.1240 (4.0504)	Entropy 1.85740 (1.87375)	Top-1 acc 28.125 (30.022)	Top-5 acc 51.953 (53.442)	lr 0.02496
Train [3][3239/3239]	Time 1.430 (0.787)	Data Time 0.000 (0.009)	Loss 4.1628 (4.0504)	Entropy 1.85733 (1.87371)	Top-1 acc 33.333 (30.024)	Top-5 acc 51.852 (53.441)	lr 0.02496
==========Valid [3/120]	loss 2.921	top-1 acc 38.757 (38.757)	top-5 acc 63.573	Train top-1 30.024	top-5 53.441	Entropy 1.85733	Latency-None: 0.000ms	Flops: 535.54M
Train [4][0/3239]	Time 17.071 (17.071)	Data Time 15.230 (15.230)	Loss 3.8791 (3.8791)	Entropy 1.85732 (1.85732)	Top-1 acc 30.859 (30.859)	Top-5 acc 56.250 (56.250)	lr 0.02496
Train [4][10/3239]	Time 0.582 (2.361)	Data Time 0.002 (1.399)	Loss 4.0777 (4.0118)	Entropy 1.85720 (1.85727)	Top-1 acc 30.078 (30.362)	Top-5 acc 53.516 (53.942)	lr 0.02496
Train [4][20/3239]	Time 0.590 (1.610)	Data Time 0.001 (0.734)	Loss 3.8615 (3.9905)	Entropy 1.85706 (1.85722)	Top-1 acc 33.594 (30.804)	Top-5 acc 58.203 (54.185)	lr 0.02496
Train [4][30/3239]	Time 0.463 (1.325)	Data Time 0.001 (0.498)	Loss 3.9832 (3.9832)	Entropy 1.85692 (1.85715)	Top-1 acc 32.812 (31.023)	Top-5 acc 55.078 (54.524)	lr 0.02496
Train [4][40/3239]	Time 0.208 (1.183)	Data Time 0.002 (0.377)	Loss 3.9763 (3.9825)	Entropy 1.85680 (1.85709)	Top-1 acc 32.031 (31.279)	Top-5 acc 56.641 (54.859)	lr 0.02496
Train [4][50/3239]	Time 0.541 (1.099)	Data Time 0.001 (0.306)	Loss 3.8895 (3.9942)	Entropy 1.85675 (1.85703)	Top-1 acc 33.984 (31.158)	Top-5 acc 58.594 (54.680)	lr 0.02496
Train [4][60/3239]	Time 0.476 (1.039)	Data Time 0.001 (0.256)	Loss 4.0086 (3.9973)	Entropy 1.85665 (1.85697)	Top-1 acc 29.688 (31.077)	Top-5 acc 54.688 (54.816)	lr 0.02496
Train [4][70/3239]	Time 0.530 (1.001)	Data Time 0.001 (0.220)	Loss 4.0909 (4.0056)	Entropy 1.85659 (1.85692)	Top-1 acc 29.688 (30.969)	Top-5 acc 53.516 (54.572)	lr 0.02496
Train [4][80/3239]	Time 0.484 (1.181)	Data Time 0.002 (0.194)	Loss 3.9487 (4.0018)	Entropy 1.85637 (1.85687)	Top-1 acc 30.469 (30.908)	Top-5 acc 54.688 (54.625)	lr 0.02496
Train [4][90/3239]	Time 0.494 (1.138)	Data Time 0.002 (0.173)	Loss 4.0710 (3.9985)	Entropy 1.85632 (1.85681)	Top-1 acc 31.641 (30.992)	Top-5 acc 54.297 (54.752)	lr 0.02496
Train [4][100/3239]	Time 0.403 (1.103)	Data Time 0.001 (0.156)	Loss 4.0459 (3.9978)	Entropy 1.85620 (1.85677)	Top-1 acc 31.250 (31.045)	Top-5 acc 51.172 (54.668)	lr 0.02496
Train [4][110/3239]	Time 0.569 (1.074)	Data Time 0.001 (0.143)	Loss 3.9738 (4.0000)	Entropy 1.85613 (1.85671)	Top-1 acc 30.859 (31.078)	Top-5 acc 54.297 (54.561)	lr 0.02496
Train [4][120/3239]	Time 0.598 (1.048)	Data Time 0.001 (0.131)	Loss 3.8835 (4.0010)	Entropy 1.85610 (1.85666)	Top-1 acc 37.109 (31.150)	Top-5 acc 57.031 (54.536)	lr 0.02496
Train [4][130/3239]	Time 0.467 (1.028)	Data Time 0.001 (0.122)	Loss 4.1025 (4.0037)	Entropy 1.85606 (1.85662)	Top-1 acc 30.078 (31.029)	Top-5 acc 48.047 (54.398)	lr 0.02496
Train [4][140/3239]	Time 0.540 (1.011)	Data Time 0.001 (0.113)	Loss 4.1568 (4.0057)	Entropy 1.85588 (1.85658)	Top-1 acc 27.344 (30.942)	Top-5 acc 48.828 (54.380)	lr 0.02496
Train [4][150/3239]	Time 0.441 (0.996)	Data Time 0.001 (0.106)	Loss 4.0339 (4.0055)	Entropy 1.85578 (1.85653)	Top-1 acc 31.641 (30.919)	Top-5 acc 55.469 (54.359)	lr 0.02496
Train [4][160/3239]	Time 0.543 (0.980)	Data Time 0.001 (0.100)	Loss 4.0110 (4.0027)	Entropy 1.85559 (1.85648)	Top-1 acc 30.078 (30.922)	Top-5 acc 51.562 (54.433)	lr 0.02496
Train [4][170/3239]	Time 0.423 (0.967)	Data Time 0.001 (0.094)	Loss 4.1677 (4.0064)	Entropy 1.85561 (1.85643)	Top-1 acc 30.078 (30.848)	Top-5 acc 50.391 (54.388)	lr 0.02496
Train [4][180/3239]	Time 0.503 (0.955)	Data Time 0.001 (0.089)	Loss 4.1942 (4.0070)	Entropy 1.85550 (1.85638)	Top-1 acc 32.422 (30.855)	Top-5 acc 52.344 (54.353)	lr 0.02496
Train [4][190/3239]	Time 0.534 (0.942)	Data Time 0.001 (0.084)	Loss 3.9175 (4.0088)	Entropy 1.85543 (1.85633)	Top-1 acc 31.250 (30.790)	Top-5 acc 57.031 (54.297)	lr 0.02496
Train [4][200/3239]	Time 0.521 (0.933)	Data Time 0.001 (0.080)	Loss 3.9902 (4.0093)	Entropy 1.85529 (1.85628)	Top-1 acc 28.516 (30.826)	Top-5 acc 55.078 (54.310)	lr 0.02496
Train [4][210/3239]	Time 0.535 (0.927)	Data Time 0.001 (0.077)	Loss 4.0095 (4.0091)	Entropy 1.85508 (1.85623)	Top-1 acc 33.203 (30.870)	Top-5 acc 53.906 (54.295)	lr 0.02496
Train [4][220/3239]	Time 0.581 (0.921)	Data Time 0.001 (0.074)	Loss 4.1294 (4.0070)	Entropy 1.85499 (1.85618)	Top-1 acc 28.906 (30.888)	Top-5 acc 50.781 (54.338)	lr 0.02496
Train [4][230/3239]	Time 0.522 (0.915)	Data Time 0.001 (0.071)	Loss 3.8471 (4.0068)	Entropy 1.85488 (1.85613)	Top-1 acc 33.984 (30.895)	Top-5 acc 58.594 (54.329)	lr 0.02496
Train [4][240/3239]	Time 0.496 (0.909)	Data Time 0.001 (0.068)	Loss 4.0406 (4.0069)	Entropy 1.85464 (1.85607)	Top-1 acc 35.156 (30.913)	Top-5 acc 51.562 (54.282)	lr 0.02496
Train [4][250/3239]	Time 0.468 (0.903)	Data Time 0.001 (0.065)	Loss 4.1571 (4.0075)	Entropy 1.85447 (1.85601)	Top-1 acc 30.078 (30.920)	Top-5 acc 51.562 (54.264)	lr 0.02496
Train [4][260/3239]	Time 0.555 (0.898)	Data Time 0.001 (0.063)	Loss 3.9626 (4.0064)	Entropy 1.85438 (1.85595)	Top-1 acc 30.078 (30.894)	Top-5 acc 51.562 (54.265)	lr 0.02496
Train [4][270/3239]	Time 0.579 (0.893)	Data Time 0.001 (0.061)	Loss 3.9394 (4.0057)	Entropy 1.85420 (1.85589)	Top-1 acc 28.516 (30.872)	Top-5 acc 58.594 (54.293)	lr 0.02496
Train [4][280/3239]	Time 0.511 (0.889)	Data Time 0.001 (0.059)	Loss 4.0564 (4.0040)	Entropy 1.85408 (1.85583)	Top-1 acc 30.859 (30.914)	Top-5 acc 54.688 (54.321)	lr 0.02496
Train [4][290/3239]	Time 0.479 (0.885)	Data Time 0.001 (0.057)	Loss 4.1237 (4.0022)	Entropy 1.85404 (1.85577)	Top-1 acc 27.734 (30.937)	Top-5 acc 53.125 (54.348)	lr 0.02496
Train [4][300/3239]	Time 0.464 (0.880)	Data Time 0.001 (0.055)	Loss 3.9713 (4.0034)	Entropy 1.85388 (1.85571)	Top-1 acc 35.156 (30.980)	Top-5 acc 54.688 (54.318)	lr 0.02496
Train [4][310/3239]	Time 0.500 (0.877)	Data Time 0.001 (0.053)	Loss 3.9681 (4.0010)	Entropy 1.85381 (1.85565)	Top-1 acc 31.641 (30.993)	Top-5 acc 57.031 (54.399)	lr 0.02496
Train [4][320/3239]	Time 0.567 (0.874)	Data Time 0.002 (0.052)	Loss 3.8221 (4.0013)	Entropy 1.85369 (1.85559)	Top-1 acc 32.422 (31.004)	Top-5 acc 58.203 (54.398)	lr 0.02496
Train [4][330/3239]	Time 0.516 (0.870)	Data Time 0.001 (0.050)	Loss 4.1708 (4.0032)	Entropy 1.85357 (1.85553)	Top-1 acc 28.516 (30.979)	Top-5 acc 51.172 (54.356)	lr 0.02496
Train [4][340/3239]	Time 0.440 (0.866)	Data Time 0.001 (0.049)	Loss 4.0686 (4.0021)	Entropy 1.85340 (1.85547)	Top-1 acc 29.688 (30.973)	Top-5 acc 52.734 (54.374)	lr 0.02496
Train [4][350/3239]	Time 0.297 (0.863)	Data Time 0.001 (0.048)	Loss 3.7627 (4.0016)	Entropy 1.85322 (1.85541)	Top-1 acc 34.375 (30.967)	Top-5 acc 58.984 (54.369)	lr 0.02496
Train [4][360/3239]	Time 0.539 (0.861)	Data Time 0.001 (0.047)	Loss 3.9370 (4.0031)	Entropy 1.85317 (1.85535)	Top-1 acc 31.250 (30.929)	Top-5 acc 53.125 (54.352)	lr 0.02496
Train [4][370/3239]	Time 0.550 (0.858)	Data Time 0.001 (0.046)	Loss 4.0901 (4.0029)	Entropy 1.85314 (1.85529)	Top-1 acc 32.031 (30.950)	Top-5 acc 51.953 (54.366)	lr 0.02496
Train [4][380/3239]	Time 0.568 (0.857)	Data Time 0.001 (0.044)	Loss 3.8593 (4.0016)	Entropy 1.85310 (1.85523)	Top-1 acc 30.469 (30.952)	Top-5 acc 57.812 (54.393)	lr 0.02496
Train [4][390/3239]	Time 0.523 (0.854)	Data Time 0.001 (0.043)	Loss 4.2076 (4.0026)	Entropy 1.85294 (1.85518)	Top-1 acc 25.000 (30.931)	Top-5 acc 50.391 (54.375)	lr 0.02496
Train [4][400/3239]	Time 0.504 (0.852)	Data Time 0.001 (0.042)	Loss 3.9194 (4.0043)	Entropy 1.85281 (1.85512)	Top-1 acc 30.469 (30.901)	Top-5 acc 55.859 (54.349)	lr 0.02496
Train [4][410/3239]	Time 0.669 (0.851)	Data Time 0.001 (0.041)	Loss 3.7708 (4.0033)	Entropy 1.85279 (1.85506)	Top-1 acc 35.938 (30.911)	Top-5 acc 62.109 (54.393)	lr 0.02496
Train [4][420/3239]	Time 0.514 (0.848)	Data Time 0.001 (0.040)	Loss 4.0605 (4.0045)	Entropy 1.85269 (1.85501)	Top-1 acc 27.344 (30.851)	Top-5 acc 53.516 (54.352)	lr 0.02496
Train [4][430/3239]	Time 0.338 (0.846)	Data Time 0.001 (0.040)	Loss 4.2188 (4.0044)	Entropy 1.85262 (1.85496)	Top-1 acc 25.391 (30.842)	Top-5 acc 50.781 (54.341)	lr 0.02496
Train [4][440/3239]	Time 0.582 (0.845)	Data Time 0.001 (0.039)	Loss 3.8412 (4.0038)	Entropy 1.85247 (1.85490)	Top-1 acc 34.375 (30.859)	Top-5 acc 57.031 (54.342)	lr 0.02496
Train [4][450/3239]	Time 0.594 (0.843)	Data Time 0.001 (0.038)	Loss 4.0966 (4.0033)	Entropy 1.85234 (1.85485)	Top-1 acc 29.688 (30.873)	Top-5 acc 52.734 (54.367)	lr 0.02496
Train [4][460/3239]	Time 0.516 (0.841)	Data Time 0.001 (0.038)	Loss 3.8985 (4.0043)	Entropy 1.85213 (1.85479)	Top-1 acc 33.594 (30.848)	Top-5 acc 60.156 (54.371)	lr 0.02496
Train [4][470/3239]	Time 0.592 (0.840)	Data Time 0.003 (0.037)	Loss 4.0473 (4.0035)	Entropy 1.85190 (1.85473)	Top-1 acc 30.469 (30.840)	Top-5 acc 48.828 (54.370)	lr 0.02496
Train [4][480/3239]	Time 0.402 (0.838)	Data Time 0.002 (0.036)	Loss 3.9902 (4.0032)	Entropy 1.85169 (1.85467)	Top-1 acc 30.469 (30.832)	Top-5 acc 55.859 (54.376)	lr 0.02496
Train [4][490/3239]	Time 0.424 (0.837)	Data Time 0.001 (0.036)	Loss 3.9480 (4.0025)	Entropy 1.85154 (1.85461)	Top-1 acc 30.859 (30.849)	Top-5 acc 55.078 (54.404)	lr 0.02496
Train [4][500/3239]	Time 0.561 (0.835)	Data Time 0.001 (0.035)	Loss 3.9648 (4.0026)	Entropy 1.85144 (1.85455)	Top-1 acc 33.594 (30.854)	Top-5 acc 51.562 (54.408)	lr 0.02496
Train [4][510/3239]	Time 0.389 (0.833)	Data Time 0.002 (0.035)	Loss 3.9397 (4.0023)	Entropy 1.85134 (1.85449)	Top-1 acc 30.859 (30.857)	Top-5 acc 55.469 (54.418)	lr 0.02496
Train [4][520/3239]	Time 0.339 (0.831)	Data Time 0.001 (0.034)	Loss 4.0643 (4.0021)	Entropy 1.85125 (1.85443)	Top-1 acc 29.688 (30.859)	Top-5 acc 49.609 (54.415)	lr 0.02496
Train [4][530/3239]	Time 0.543 (0.830)	Data Time 0.001 (0.033)	Loss 3.9907 (4.0018)	Entropy 1.85113 (1.85437)	Top-1 acc 29.297 (30.859)	Top-5 acc 55.469 (54.409)	lr 0.02496
Train [4][540/3239]	Time 0.494 (0.829)	Data Time 0.001 (0.033)	Loss 4.1889 (4.0022)	Entropy 1.85108 (1.85431)	Top-1 acc 26.562 (30.833)	Top-5 acc 49.219 (54.399)	lr 0.02496
Train [4][550/3239]	Time 0.550 (0.828)	Data Time 0.001 (0.032)	Loss 4.1656 (4.0027)	Entropy 1.85092 (1.85425)	Top-1 acc 27.344 (30.837)	Top-5 acc 50.391 (54.392)	lr 0.02496
Train [4][560/3239]	Time 0.461 (0.827)	Data Time 0.001 (0.032)	Loss 4.1681 (4.0041)	Entropy 1.85073 (1.85419)	Top-1 acc 27.734 (30.827)	Top-5 acc 48.828 (54.366)	lr 0.02496
Train [4][570/3239]	Time 0.614 (0.826)	Data Time 0.001 (0.031)	Loss 3.9187 (4.0041)	Entropy 1.85047 (1.85412)	Top-1 acc 33.203 (30.846)	Top-5 acc 55.859 (54.351)	lr 0.02496
Train [4][580/3239]	Time 0.538 (0.825)	Data Time 0.001 (0.031)	Loss 4.0712 (4.0046)	Entropy 1.85032 (1.85406)	Top-1 acc 31.250 (30.843)	Top-5 acc 52.734 (54.331)	lr 0.02496
Train [4][590/3239]	Time 0.510 (0.824)	Data Time 0.001 (0.030)	Loss 3.7367 (4.0046)	Entropy 1.85012 (1.85400)	Top-1 acc 39.062 (30.871)	Top-5 acc 60.938 (54.342)	lr 0.02496
Train [4][600/3239]	Time 0.552 (0.824)	Data Time 0.002 (0.030)	Loss 4.2286 (4.0045)	Entropy 1.85007 (1.85393)	Top-1 acc 28.516 (30.857)	Top-5 acc 48.047 (54.340)	lr 0.02496
Train [4][610/3239]	Time 0.521 (0.823)	Data Time 0.001 (0.029)	Loss 4.0799 (4.0048)	Entropy 1.84999 (1.85387)	Top-1 acc 32.422 (30.857)	Top-5 acc 53.516 (54.341)	lr 0.02496
Train [4][620/3239]	Time 0.436 (0.822)	Data Time 0.001 (0.029)	Loss 3.9013 (4.0042)	Entropy 1.84986 (1.85381)	Top-1 acc 32.812 (30.861)	Top-5 acc 56.250 (54.353)	lr 0.02496
Train [4][630/3239]	Time 0.510 (0.821)	Data Time 0.001 (0.029)	Loss 4.0687 (4.0046)	Entropy 1.84968 (1.85374)	Top-1 acc 32.812 (30.855)	Top-5 acc 53.125 (54.337)	lr 0.02496
Train [4][640/3239]	Time 0.520 (0.820)	Data Time 0.001 (0.028)	Loss 4.2307 (4.0053)	Entropy 1.84947 (1.85368)	Top-1 acc 26.172 (30.841)	Top-5 acc 46.094 (54.318)	lr 0.02496
Train [4][650/3239]	Time 0.613 (0.820)	Data Time 0.001 (0.028)	Loss 4.0328 (4.0048)	Entropy 1.84939 (1.85361)	Top-1 acc 29.688 (30.856)	Top-5 acc 53.906 (54.339)	lr 0.02496
Train [4][660/3239]	Time 0.388 (0.819)	Data Time 0.001 (0.028)	Loss 4.1613 (4.0057)	Entropy 1.84913 (1.85355)	Top-1 acc 26.562 (30.835)	Top-5 acc 50.781 (54.315)	lr 0.02496
Train [4][670/3239]	Time 0.616 (0.818)	Data Time 0.001 (0.027)	Loss 3.9180 (4.0055)	Entropy 1.84887 (1.85348)	Top-1 acc 30.078 (30.824)	Top-5 acc 60.156 (54.314)	lr 0.02496
Train [4][680/3239]	Time 0.478 (0.816)	Data Time 0.001 (0.027)	Loss 3.9515 (4.0058)	Entropy 1.84883 (1.85341)	Top-1 acc 28.906 (30.803)	Top-5 acc 55.078 (54.289)	lr 0.02496
Train [4][690/3239]	Time 0.531 (0.815)	Data Time 0.001 (0.026)	Loss 4.1544 (4.0072)	Entropy 1.84872 (1.85335)	Top-1 acc 30.078 (30.777)	Top-5 acc 51.172 (54.251)	lr 0.02496
Train [4][700/3239]	Time 0.540 (0.814)	Data Time 0.002 (0.026)	Loss 4.0052 (4.0075)	Entropy 1.84864 (1.85328)	Top-1 acc 29.688 (30.784)	Top-5 acc 57.422 (54.277)	lr 0.02496
Train [4][710/3239]	Time 0.484 (0.813)	Data Time 0.001 (0.026)	Loss 4.1507 (4.0076)	Entropy 1.84861 (1.85321)	Top-1 acc 26.953 (30.794)	Top-5 acc 55.469 (54.281)	lr 0.02496
Train [4][720/3239]	Time 0.467 (0.813)	Data Time 0.002 (0.025)	Loss 4.0720 (4.0075)	Entropy 1.84844 (1.85315)	Top-1 acc 28.516 (30.803)	Top-5 acc 52.344 (54.283)	lr 0.02496
Train [4][730/3239]	Time 0.596 (0.835)	Data Time 0.006 (0.025)	Loss 4.1862 (4.0072)	Entropy 1.84828 (1.85308)	Top-1 acc 25.000 (30.788)	Top-5 acc 50.391 (54.281)	lr 0.02496
Train [4][740/3239]	Time 0.528 (0.835)	Data Time 0.002 (0.025)	Loss 4.0207 (4.0073)	Entropy 1.84806 (1.85302)	Top-1 acc 32.812 (30.792)	Top-5 acc 52.734 (54.285)	lr 0.02496
Train [4][750/3239]	Time 0.560 (0.834)	Data Time 0.001 (0.025)	Loss 3.9140 (4.0065)	Entropy 1.84788 (1.85295)	Top-1 acc 29.688 (30.791)	Top-5 acc 55.078 (54.301)	lr 0.02496
Train [4][760/3239]	Time 0.377 (0.833)	Data Time 0.001 (0.024)	Loss 3.9319 (4.0070)	Entropy 1.84784 (1.85288)	Top-1 acc 31.250 (30.779)	Top-5 acc 56.250 (54.293)	lr 0.02496
Train [4][770/3239]	Time 0.574 (0.833)	Data Time 0.001 (0.024)	Loss 3.9713 (4.0074)	Entropy 1.84769 (1.85282)	Top-1 acc 32.031 (30.769)	Top-5 acc 56.641 (54.293)	lr 0.02496
Train [4][780/3239]	Time 0.544 (0.832)	Data Time 0.001 (0.024)	Loss 4.0582 (4.0078)	Entropy 1.84748 (1.85275)	Top-1 acc 34.375 (30.767)	Top-5 acc 54.688 (54.290)	lr 0.02496
Train [4][790/3239]	Time 0.291 (0.832)	Data Time 0.001 (0.024)	Loss 4.0780 (4.0083)	Entropy 1.84733 (1.85268)	Top-1 acc 30.078 (30.742)	Top-5 acc 54.297 (54.271)	lr 0.02495
Train [4][800/3239]	Time 0.539 (0.831)	Data Time 0.001 (0.024)	Loss 4.0410 (4.0077)	Entropy 1.84729 (1.85262)	Top-1 acc 29.297 (30.767)	Top-5 acc 55.469 (54.290)	lr 0.02495
Train [4][810/3239]	Time 0.411 (0.829)	Data Time 0.001 (0.023)	Loss 4.0498 (4.0079)	Entropy 1.84708 (1.85255)	Top-1 acc 27.344 (30.753)	Top-5 acc 54.297 (54.286)	lr 0.02495
Train [4][820/3239]	Time 0.407 (0.828)	Data Time 0.001 (0.023)	Loss 4.0580 (4.0075)	Entropy 1.84701 (1.85248)	Top-1 acc 29.297 (30.759)	Top-5 acc 53.906 (54.290)	lr 0.02495
Train [4][830/3239]	Time 0.539 (0.828)	Data Time 0.001 (0.023)	Loss 3.8070 (4.0069)	Entropy 1.84690 (1.85242)	Top-1 acc 35.547 (30.786)	Top-5 acc 57.812 (54.311)	lr 0.02495
Train [4][840/3239]	Time 0.513 (0.827)	Data Time 0.001 (0.023)	Loss 4.0094 (4.0069)	Entropy 1.84677 (1.85235)	Top-1 acc 32.031 (30.779)	Top-5 acc 53.125 (54.309)	lr 0.02495
Train [4][850/3239]	Time 0.517 (0.826)	Data Time 0.001 (0.023)	Loss 4.0902 (4.0066)	Entropy 1.84659 (1.85229)	Top-1 acc 26.172 (30.780)	Top-5 acc 50.781 (54.303)	lr 0.02495
Train [4][860/3239]	Time 0.510 (0.825)	Data Time 0.001 (0.022)	Loss 4.2271 (4.0072)	Entropy 1.84636 (1.85222)	Top-1 acc 29.297 (30.778)	Top-5 acc 51.953 (54.298)	lr 0.02495
Train [4][870/3239]	Time 0.574 (0.825)	Data Time 0.001 (0.022)	Loss 4.0439 (4.0076)	Entropy 1.84616 (1.85215)	Top-1 acc 29.688 (30.768)	Top-5 acc 52.734 (54.275)	lr 0.02495
Train [4][880/3239]	Time 0.465 (0.824)	Data Time 0.001 (0.022)	Loss 4.1758 (4.0073)	Entropy 1.84610 (1.85208)	Top-1 acc 30.469 (30.786)	Top-5 acc 50.000 (54.277)	lr 0.02495
Train [4][890/3239]	Time 0.486 (0.824)	Data Time 0.001 (0.022)	Loss 3.9938 (4.0077)	Entropy 1.84604 (1.85202)	Top-1 acc 29.297 (30.774)	Top-5 acc 51.953 (54.271)	lr 0.02495
Train [4][900/3239]	Time 0.572 (0.823)	Data Time 0.001 (0.022)	Loss 3.8358 (4.0073)	Entropy 1.84591 (1.85195)	Top-1 acc 33.203 (30.792)	Top-5 acc 60.156 (54.287)	lr 0.02495
Train [4][910/3239]	Time 0.541 (0.823)	Data Time 0.001 (0.021)	Loss 4.0187 (4.0081)	Entropy 1.84583 (1.85188)	Top-1 acc 28.125 (30.777)	Top-5 acc 54.688 (54.272)	lr 0.02495
Train [4][920/3239]	Time 0.425 (0.823)	Data Time 0.001 (0.021)	Loss 4.3103 (4.0085)	Entropy 1.84577 (1.85182)	Top-1 acc 23.438 (30.775)	Top-5 acc 45.703 (54.265)	lr 0.02495
Train [4][930/3239]	Time 0.341 (0.822)	Data Time 0.001 (0.021)	Loss 4.1258 (4.0088)	Entropy 1.84568 (1.85175)	Top-1 acc 30.078 (30.777)	Top-5 acc 52.344 (54.261)	lr 0.02495
Train [4][940/3239]	Time 0.533 (0.822)	Data Time 0.001 (0.021)	Loss 4.0453 (4.0095)	Entropy 1.84558 (1.85169)	Top-1 acc 30.078 (30.774)	Top-5 acc 55.078 (54.253)	lr 0.02495
Train [4][950/3239]	Time 0.407 (0.821)	Data Time 0.001 (0.021)	Loss 3.7505 (4.0091)	Entropy 1.84542 (1.85162)	Top-1 acc 31.641 (30.776)	Top-5 acc 59.766 (54.265)	lr 0.02495
Train [4][960/3239]	Time 0.511 (0.820)	Data Time 0.001 (0.021)	Loss 4.1186 (4.0094)	Entropy 1.84525 (1.85156)	Top-1 acc 30.469 (30.777)	Top-5 acc 51.172 (54.258)	lr 0.02495
Train [4][970/3239]	Time 0.424 (0.820)	Data Time 0.001 (0.021)	Loss 4.0563 (4.0098)	Entropy 1.84515 (1.85149)	Top-1 acc 31.250 (30.766)	Top-5 acc 51.172 (54.239)	lr 0.02495
Train [4][980/3239]	Time 0.607 (0.819)	Data Time 0.001 (0.020)	Loss 3.6972 (4.0099)	Entropy 1.84513 (1.85143)	Top-1 acc 32.422 (30.766)	Top-5 acc 62.500 (54.236)	lr 0.02495
Train [4][990/3239]	Time 0.518 (0.818)	Data Time 0.001 (0.020)	Loss 3.8903 (4.0096)	Entropy 1.84485 (1.85136)	Top-1 acc 34.375 (30.768)	Top-5 acc 54.297 (54.257)	lr 0.02495
Train [4][1000/3239]	Time 0.520 (0.817)	Data Time 0.001 (0.020)	Loss 3.9524 (4.0101)	Entropy 1.84473 (1.85130)	Top-1 acc 31.250 (30.754)	Top-5 acc 54.297 (54.234)	lr 0.02495
Train [4][1010/3239]	Time 0.532 (0.817)	Data Time 0.001 (0.020)	Loss 3.9128 (4.0103)	Entropy 1.84459 (1.85123)	Top-1 acc 32.031 (30.757)	Top-5 acc 57.031 (54.225)	lr 0.02495
Train [4][1020/3239]	Time 0.572 (0.816)	Data Time 0.001 (0.020)	Loss 3.8731 (4.0105)	Entropy 1.84438 (1.85116)	Top-1 acc 33.594 (30.739)	Top-5 acc 59.766 (54.234)	lr 0.02495
Train [4][1030/3239]	Time 0.548 (0.816)	Data Time 0.001 (0.020)	Loss 3.9641 (4.0104)	Entropy 1.84414 (1.85110)	Top-1 acc 33.203 (30.735)	Top-5 acc 55.078 (54.236)	lr 0.02495
Train [4][1040/3239]	Time 0.525 (0.815)	Data Time 0.001 (0.019)	Loss 4.1078 (4.0104)	Entropy 1.84402 (1.85103)	Top-1 acc 26.562 (30.742)	Top-5 acc 52.734 (54.236)	lr 0.02495
Train [4][1050/3239]	Time 0.589 (0.815)	Data Time 0.001 (0.019)	Loss 3.9354 (4.0101)	Entropy 1.84394 (1.85096)	Top-1 acc 31.641 (30.749)	Top-5 acc 58.984 (54.245)	lr 0.02495
Train [4][1060/3239]	Time 0.631 (0.815)	Data Time 0.001 (0.019)	Loss 4.0442 (4.0100)	Entropy 1.84386 (1.85090)	Top-1 acc 30.469 (30.749)	Top-5 acc 53.906 (54.253)	lr 0.02495
Train [4][1070/3239]	Time 0.508 (0.815)	Data Time 0.001 (0.019)	Loss 4.0098 (4.0095)	Entropy 1.84370 (1.85083)	Top-1 acc 28.516 (30.761)	Top-5 acc 52.734 (54.261)	lr 0.02495
Train [4][1080/3239]	Time 0.559 (0.814)	Data Time 0.001 (0.019)	Loss 4.1098 (4.0089)	Entropy 1.84358 (1.85076)	Top-1 acc 28.516 (30.772)	Top-5 acc 50.781 (54.268)	lr 0.02495
Train [4][1090/3239]	Time 0.516 (0.814)	Data Time 0.001 (0.019)	Loss 4.2006 (4.0095)	Entropy 1.84343 (1.85070)	Top-1 acc 27.734 (30.762)	Top-5 acc 50.781 (54.256)	lr 0.02495
Train [4][1100/3239]	Time 0.496 (0.814)	Data Time 0.001 (0.018)	Loss 4.3049 (4.0101)	Entropy 1.84326 (1.85063)	Top-1 acc 26.953 (30.766)	Top-5 acc 49.219 (54.256)	lr 0.02495
Train [4][1110/3239]	Time 0.567 (0.813)	Data Time 0.001 (0.018)	Loss 4.0985 (4.0106)	Entropy 1.84315 (1.85056)	Top-1 acc 31.641 (30.759)	Top-5 acc 55.078 (54.247)	lr 0.02495
Train [4][1120/3239]	Time 0.532 (0.813)	Data Time 0.001 (0.018)	Loss 4.1451 (4.0107)	Entropy 1.84306 (1.85050)	Top-1 acc 25.781 (30.753)	Top-5 acc 52.344 (54.241)	lr 0.02495
Train [4][1130/3239]	Time 0.519 (0.812)	Data Time 0.001 (0.018)	Loss 3.9368 (4.0108)	Entropy 1.84289 (1.85043)	Top-1 acc 38.672 (30.762)	Top-5 acc 57.031 (54.240)	lr 0.02495
Train [4][1140/3239]	Time 0.618 (0.812)	Data Time 0.001 (0.018)	Loss 3.9695 (4.0102)	Entropy 1.84282 (1.85037)	Top-1 acc 35.938 (30.772)	Top-5 acc 53.906 (54.243)	lr 0.02495
Train [4][1150/3239]	Time 0.380 (0.811)	Data Time 0.001 (0.018)	Loss 4.0965 (4.0101)	Entropy 1.84263 (1.85030)	Top-1 acc 25.781 (30.769)	Top-5 acc 54.297 (54.240)	lr 0.02495
Train [4][1160/3239]	Time 0.563 (0.810)	Data Time 0.001 (0.018)	Loss 4.2562 (4.0103)	Entropy 1.84250 (1.85023)	Top-1 acc 25.781 (30.762)	Top-5 acc 50.000 (54.245)	lr 0.02495
Train [4][1170/3239]	Time 0.535 (0.810)	Data Time 0.001 (0.018)	Loss 4.0918 (4.0098)	Entropy 1.84243 (1.85017)	Top-1 acc 30.469 (30.768)	Top-5 acc 55.078 (54.262)	lr 0.02495
Train [4][1180/3239]	Time 0.500 (0.810)	Data Time 0.001 (0.017)	Loss 4.0254 (4.0099)	Entropy 1.84244 (1.85010)	Top-1 acc 31.641 (30.763)	Top-5 acc 50.781 (54.259)	lr 0.02495
Train [4][1190/3239]	Time 0.650 (0.810)	Data Time 0.001 (0.017)	Loss 3.9318 (4.0095)	Entropy 1.84233 (1.85004)	Top-1 acc 30.859 (30.775)	Top-5 acc 56.641 (54.269)	lr 0.02495
Train [4][1200/3239]	Time 0.530 (0.809)	Data Time 0.001 (0.017)	Loss 4.0155 (4.0095)	Entropy 1.84230 (1.84997)	Top-1 acc 35.938 (30.777)	Top-5 acc 52.734 (54.263)	lr 0.02495
Train [4][1210/3239]	Time 0.544 (0.809)	Data Time 0.002 (0.017)	Loss 3.9388 (4.0093)	Entropy 1.84229 (1.84991)	Top-1 acc 30.078 (30.776)	Top-5 acc 53.125 (54.262)	lr 0.02495
Train [4][1220/3239]	Time 0.544 (0.809)	Data Time 0.001 (0.017)	Loss 4.0486 (4.0094)	Entropy 1.84221 (1.84985)	Top-1 acc 28.906 (30.773)	Top-5 acc 51.172 (54.261)	lr 0.02495
Train [4][1230/3239]	Time 0.581 (0.809)	Data Time 0.001 (0.017)	Loss 3.9792 (4.0090)	Entropy 1.84208 (1.84978)	Top-1 acc 31.250 (30.778)	Top-5 acc 55.078 (54.270)	lr 0.02495
Train [4][1240/3239]	Time 0.454 (0.808)	Data Time 0.001 (0.017)	Loss 4.0619 (4.0088)	Entropy 1.84200 (1.84972)	Top-1 acc 32.422 (30.783)	Top-5 acc 53.906 (54.283)	lr 0.02495
Train [4][1250/3239]	Time 0.541 (0.808)	Data Time 0.001 (0.017)	Loss 4.0095 (4.0090)	Entropy 1.84187 (1.84966)	Top-1 acc 30.078 (30.778)	Top-5 acc 54.688 (54.278)	lr 0.02495
Train [4][1260/3239]	Time 0.562 (0.808)	Data Time 0.001 (0.016)	Loss 4.1603 (4.0094)	Entropy 1.84165 (1.84960)	Top-1 acc 27.734 (30.765)	Top-5 acc 48.047 (54.268)	lr 0.02495
Train [4][1270/3239]	Time 0.401 (0.807)	Data Time 0.001 (0.016)	Loss 3.9685 (4.0090)	Entropy 1.84153 (1.84953)	Top-1 acc 31.250 (30.766)	Top-5 acc 57.422 (54.279)	lr 0.02495
Train [4][1280/3239]	Time 0.479 (0.807)	Data Time 0.001 (0.016)	Loss 4.0739 (4.0091)	Entropy 1.84138 (1.84947)	Top-1 acc 30.859 (30.767)	Top-5 acc 50.781 (54.273)	lr 0.02495
Train [4][1290/3239]	Time 0.519 (0.807)	Data Time 0.003 (0.016)	Loss 4.1893 (4.0090)	Entropy 1.84126 (1.84941)	Top-1 acc 28.125 (30.767)	Top-5 acc 52.734 (54.276)	lr 0.02495
Train [4][1300/3239]	Time 0.557 (0.806)	Data Time 0.001 (0.016)	Loss 3.9977 (4.0090)	Entropy 1.84126 (1.84935)	Top-1 acc 35.156 (30.769)	Top-5 acc 53.906 (54.277)	lr 0.02495
Train [4][1310/3239]	Time 0.509 (0.806)	Data Time 0.001 (0.016)	Loss 3.9495 (4.0095)	Entropy 1.84104 (1.84928)	Top-1 acc 31.250 (30.767)	Top-5 acc 55.469 (54.268)	lr 0.02495
Train [4][1320/3239]	Time 0.236 (0.805)	Data Time 0.001 (0.016)	Loss 3.8555 (4.0093)	Entropy 1.84087 (1.84922)	Top-1 acc 33.984 (30.765)	Top-5 acc 58.203 (54.269)	lr 0.02495
Train [4][1330/3239]	Time 0.544 (0.805)	Data Time 0.001 (0.016)	Loss 3.9961 (4.0095)	Entropy 1.84069 (1.84916)	Top-1 acc 30.078 (30.755)	Top-5 acc 56.250 (54.265)	lr 0.02495
Train [4][1340/3239]	Time 0.525 (0.804)	Data Time 0.001 (0.016)	Loss 3.8639 (4.0097)	Entropy 1.84061 (1.84909)	Top-1 acc 35.547 (30.755)	Top-5 acc 56.250 (54.257)	lr 0.02495
Train [4][1350/3239]	Time 0.427 (0.804)	Data Time 0.001 (0.016)	Loss 4.1122 (4.0100)	Entropy 1.84053 (1.84903)	Top-1 acc 28.906 (30.750)	Top-5 acc 51.953 (54.254)	lr 0.02495
Train [4][1360/3239]	Time 0.516 (0.804)	Data Time 0.001 (0.016)	Loss 4.1922 (4.0097)	Entropy 1.84036 (1.84897)	Top-1 acc 25.000 (30.763)	Top-5 acc 51.562 (54.266)	lr 0.02495
Train [4][1370/3239]	Time 0.565 (0.804)	Data Time 0.001 (0.016)	Loss 3.8756 (4.0094)	Entropy 1.84018 (1.84891)	Top-1 acc 35.938 (30.772)	Top-5 acc 57.031 (54.281)	lr 0.02495
Train [4][1380/3239]	Time 0.587 (0.803)	Data Time 0.001 (0.015)	Loss 4.0037 (4.0091)	Entropy 1.84001 (1.84884)	Top-1 acc 32.031 (30.778)	Top-5 acc 52.734 (54.285)	lr 0.02495
Train [4][1390/3239]	Time 0.579 (0.815)	Data Time 0.002 (0.015)	Loss 3.9615 (4.0094)	Entropy 1.83995 (1.84878)	Top-1 acc 33.594 (30.775)	Top-5 acc 55.469 (54.279)	lr 0.02495
Train [4][1400/3239]	Time 0.495 (0.815)	Data Time 0.001 (0.015)	Loss 4.2455 (4.0095)	Entropy 1.83978 (1.84871)	Top-1 acc 23.828 (30.770)	Top-5 acc 48.438 (54.277)	lr 0.02495
Train [4][1410/3239]	Time 0.570 (0.814)	Data Time 0.003 (0.015)	Loss 3.9504 (4.0093)	Entropy 1.83957 (1.84865)	Top-1 acc 32.422 (30.788)	Top-5 acc 55.859 (54.285)	lr 0.02495
Train [4][1420/3239]	Time 0.534 (0.814)	Data Time 0.002 (0.015)	Loss 4.0284 (4.0092)	Entropy 1.83942 (1.84859)	Top-1 acc 29.688 (30.786)	Top-5 acc 50.391 (54.291)	lr 0.02495
Train [4][1430/3239]	Time 0.542 (0.814)	Data Time 0.002 (0.015)	Loss 3.7801 (4.0087)	Entropy 1.83917 (1.84852)	Top-1 acc 33.594 (30.801)	Top-5 acc 58.984 (54.300)	lr 0.02495
Train [4][1440/3239]	Time 0.566 (0.813)	Data Time 0.001 (0.015)	Loss 4.0046 (4.0087)	Entropy 1.83897 (1.84846)	Top-1 acc 28.906 (30.795)	Top-5 acc 54.688 (54.304)	lr 0.02495
Train [4][1450/3239]	Time 0.634 (0.813)	Data Time 0.001 (0.015)	Loss 3.8588 (4.0085)	Entropy 1.83875 (1.84839)	Top-1 acc 29.688 (30.791)	Top-5 acc 57.812 (54.306)	lr 0.02495
Train [4][1460/3239]	Time 0.544 (0.812)	Data Time 0.002 (0.015)	Loss 4.1521 (4.0087)	Entropy 1.83862 (1.84832)	Top-1 acc 26.953 (30.780)	Top-5 acc 48.438 (54.295)	lr 0.02495
Train [4][1470/3239]	Time 0.529 (0.812)	Data Time 0.001 (0.015)	Loss 3.8708 (4.0088)	Entropy 1.83851 (1.84826)	Top-1 acc 30.469 (30.778)	Top-5 acc 59.375 (54.297)	lr 0.02495
Train [4][1480/3239]	Time 0.512 (0.811)	Data Time 0.001 (0.015)	Loss 4.0744 (4.0088)	Entropy 1.83848 (1.84819)	Top-1 acc 28.516 (30.779)	Top-5 acc 54.297 (54.298)	lr 0.02495
Train [4][1490/3239]	Time 0.562 (0.811)	Data Time 0.001 (0.015)	Loss 4.0279 (4.0091)	Entropy 1.83830 (1.84813)	Top-1 acc 30.859 (30.777)	Top-5 acc 53.516 (54.288)	lr 0.02495
Train [4][1500/3239]	Time 0.658 (0.811)	Data Time 0.001 (0.014)	Loss 3.8930 (4.0092)	Entropy 1.83804 (1.84806)	Top-1 acc 30.469 (30.769)	Top-5 acc 55.078 (54.288)	lr 0.02495
Train [4][1510/3239]	Time 0.575 (0.811)	Data Time 0.002 (0.014)	Loss 3.9254 (4.0090)	Entropy 1.83793 (1.84799)	Top-1 acc 28.516 (30.775)	Top-5 acc 58.984 (54.300)	lr 0.02495
Train [4][1520/3239]	Time 0.540 (0.811)	Data Time 0.001 (0.014)	Loss 3.9563 (4.0088)	Entropy 1.83774 (1.84793)	Top-1 acc 33.203 (30.791)	Top-5 acc 56.641 (54.305)	lr 0.02495
Train [4][1530/3239]	Time 0.506 (0.811)	Data Time 0.001 (0.014)	Loss 3.8752 (4.0088)	Entropy 1.83757 (1.84786)	Top-1 acc 30.469 (30.791)	Top-5 acc 59.766 (54.306)	lr 0.02495
Train [4][1540/3239]	Time 0.411 (0.810)	Data Time 0.001 (0.014)	Loss 4.0688 (4.0085)	Entropy 1.83747 (1.84779)	Top-1 acc 28.516 (30.801)	Top-5 acc 53.516 (54.315)	lr 0.02495
Train [4][1550/3239]	Time 0.596 (0.810)	Data Time 0.001 (0.014)	Loss 3.9248 (4.0085)	Entropy 1.83735 (1.84773)	Top-1 acc 33.984 (30.799)	Top-5 acc 55.859 (54.321)	lr 0.02495
Train [4][1560/3239]	Time 0.401 (0.810)	Data Time 0.001 (0.014)	Loss 3.8977 (4.0080)	Entropy 1.83721 (1.84766)	Top-1 acc 33.594 (30.815)	Top-5 acc 58.203 (54.332)	lr 0.02495
Train [4][1570/3239]	Time 0.537 (0.810)	Data Time 0.001 (0.014)	Loss 3.9205 (4.0081)	Entropy 1.83703 (1.84759)	Top-1 acc 32.422 (30.817)	Top-5 acc 59.375 (54.340)	lr 0.02495
Train [4][1580/3239]	Time 0.603 (0.810)	Data Time 0.002 (0.014)	Loss 3.8839 (4.0079)	Entropy 1.83696 (1.84753)	Top-1 acc 28.516 (30.812)	Top-5 acc 56.641 (54.341)	lr 0.02495
Train [4][1590/3239]	Time 0.529 (0.810)	Data Time 0.001 (0.014)	Loss 4.1021 (4.0078)	Entropy 1.83683 (1.84746)	Top-1 acc 30.469 (30.814)	Top-5 acc 53.906 (54.343)	lr 0.02495
Train [4][1600/3239]	Time 0.545 (0.809)	Data Time 0.002 (0.014)	Loss 3.9550 (4.0081)	Entropy 1.83667 (1.84739)	Top-1 acc 31.641 (30.805)	Top-5 acc 57.812 (54.333)	lr 0.02495
Train [4][1610/3239]	Time 0.554 (0.809)	Data Time 0.001 (0.014)	Loss 4.1876 (4.0079)	Entropy 1.83664 (1.84733)	Top-1 acc 29.297 (30.805)	Top-5 acc 47.656 (54.335)	lr 0.02495
Train [4][1620/3239]	Time 0.480 (0.809)	Data Time 0.001 (0.014)	Loss 4.0702 (4.0073)	Entropy 1.83652 (1.84726)	Top-1 acc 30.078 (30.813)	Top-5 acc 51.953 (54.341)	lr 0.02495
Train [4][1630/3239]	Time 0.503 (0.808)	Data Time 0.001 (0.014)	Loss 4.0430 (4.0077)	Entropy 1.83636 (1.84719)	Top-1 acc 27.344 (30.803)	Top-5 acc 53.516 (54.331)	lr 0.02495
Train [4][1640/3239]	Time 0.583 (0.808)	Data Time 0.001 (0.014)	Loss 3.8781 (4.0074)	Entropy 1.83632 (1.84713)	Top-1 acc 35.156 (30.807)	Top-5 acc 56.250 (54.339)	lr 0.02495
Train [4][1650/3239]	Time 0.555 (0.808)	Data Time 0.001 (0.014)	Loss 3.9889 (4.0074)	Entropy 1.83614 (1.84706)	Top-1 acc 33.594 (30.809)	Top-5 acc 56.641 (54.342)	lr 0.02495
Train [4][1660/3239]	Time 0.618 (0.808)	Data Time 0.001 (0.013)	Loss 4.0712 (4.0075)	Entropy 1.83599 (1.84700)	Top-1 acc 26.562 (30.807)	Top-5 acc 55.859 (54.336)	lr 0.02495
Train [4][1670/3239]	Time 0.512 (0.808)	Data Time 0.001 (0.013)	Loss 4.1334 (4.0075)	Entropy 1.83592 (1.84693)	Top-1 acc 30.859 (30.812)	Top-5 acc 51.562 (54.345)	lr 0.02495
Train [4][1680/3239]	Time 0.524 (0.808)	Data Time 0.001 (0.013)	Loss 4.0786 (4.0077)	Entropy 1.83571 (1.84686)	Top-1 acc 29.688 (30.813)	Top-5 acc 49.219 (54.342)	lr 0.02495
Train [4][1690/3239]	Time 0.559 (0.807)	Data Time 0.001 (0.013)	Loss 4.0698 (4.0077)	Entropy 1.83563 (1.84680)	Top-1 acc 31.641 (30.815)	Top-5 acc 53.516 (54.341)	lr 0.02495
Train [4][1700/3239]	Time 0.538 (0.807)	Data Time 0.001 (0.013)	Loss 4.0529 (4.0077)	Entropy 1.83560 (1.84673)	Top-1 acc 30.859 (30.819)	Top-5 acc 53.125 (54.351)	lr 0.02495
Train [4][1710/3239]	Time 0.518 (0.807)	Data Time 0.001 (0.013)	Loss 4.1103 (4.0077)	Entropy 1.83545 (1.84667)	Top-1 acc 31.641 (30.817)	Top-5 acc 53.125 (54.352)	lr 0.02495
Train [4][1720/3239]	Time 0.564 (0.807)	Data Time 0.001 (0.013)	Loss 4.1674 (4.0079)	Entropy 1.83535 (1.84660)	Top-1 acc 28.125 (30.817)	Top-5 acc 51.562 (54.351)	lr 0.02495
Train [4][1730/3239]	Time 0.526 (0.807)	Data Time 0.003 (0.013)	Loss 4.1059 (4.0079)	Entropy 1.83511 (1.84654)	Top-1 acc 32.031 (30.814)	Top-5 acc 50.781 (54.351)	lr 0.02495
Train [4][1740/3239]	Time 0.546 (0.807)	Data Time 0.001 (0.013)	Loss 3.9997 (4.0078)	Entropy 1.83493 (1.84647)	Top-1 acc 31.641 (30.814)	Top-5 acc 54.297 (54.354)	lr 0.02495
Train [4][1750/3239]	Time 0.484 (0.806)	Data Time 0.001 (0.013)	Loss 4.0873 (4.0075)	Entropy 1.83469 (1.84640)	Top-1 acc 28.125 (30.820)	Top-5 acc 52.734 (54.360)	lr 0.02495
Train [4][1760/3239]	Time 0.553 (0.806)	Data Time 0.001 (0.013)	Loss 3.8797 (4.0077)	Entropy 1.83461 (1.84634)	Top-1 acc 32.812 (30.818)	Top-5 acc 55.469 (54.359)	lr 0.02495
Train [4][1770/3239]	Time 0.565 (0.806)	Data Time 0.001 (0.013)	Loss 3.9428 (4.0076)	Entropy 1.83460 (1.84627)	Top-1 acc 32.812 (30.824)	Top-5 acc 55.859 (54.362)	lr 0.02495
Train [4][1780/3239]	Time 0.527 (0.806)	Data Time 0.001 (0.013)	Loss 4.1358 (4.0075)	Entropy 1.83445 (1.84620)	Top-1 acc 30.078 (30.821)	Top-5 acc 50.781 (54.363)	lr 0.02495
Train [4][1790/3239]	Time 0.582 (0.805)	Data Time 0.001 (0.013)	Loss 4.0927 (4.0073)	Entropy 1.83433 (1.84614)	Top-1 acc 28.516 (30.825)	Top-5 acc 51.172 (54.368)	lr 0.02495
Train [4][1800/3239]	Time 0.543 (0.805)	Data Time 0.001 (0.013)	Loss 3.8872 (4.0072)	Entropy 1.83422 (1.84607)	Top-1 acc 32.422 (30.828)	Top-5 acc 57.422 (54.374)	lr 0.02495
Train [4][1810/3239]	Time 0.521 (0.805)	Data Time 0.001 (0.013)	Loss 4.0238 (4.0073)	Entropy 1.83392 (1.84601)	Top-1 acc 32.422 (30.824)	Top-5 acc 54.688 (54.371)	lr 0.02495
Train [4][1820/3239]	Time 0.502 (0.805)	Data Time 0.001 (0.013)	Loss 4.0795 (4.0073)	Entropy 1.83384 (1.84594)	Top-1 acc 27.344 (30.819)	Top-5 acc 52.344 (54.368)	lr 0.02495
Train [4][1830/3239]	Time 0.562 (0.805)	Data Time 0.001 (0.012)	Loss 3.9916 (4.0074)	Entropy 1.83367 (1.84587)	Top-1 acc 32.812 (30.817)	Top-5 acc 55.859 (54.365)	lr 0.02495
Train [4][1840/3239]	Time 0.451 (0.804)	Data Time 0.001 (0.012)	Loss 4.1264 (4.0075)	Entropy 1.83360 (1.84581)	Top-1 acc 27.344 (30.812)	Top-5 acc 53.906 (54.366)	lr 0.02495
Train [4][1850/3239]	Time 0.367 (0.804)	Data Time 0.001 (0.012)	Loss 4.0262 (4.0076)	Entropy 1.83352 (1.84574)	Top-1 acc 31.250 (30.809)	Top-5 acc 55.859 (54.365)	lr 0.02495
Train [4][1860/3239]	Time 0.698 (0.804)	Data Time 0.001 (0.012)	Loss 4.1348 (4.0076)	Entropy 1.83338 (1.84567)	Top-1 acc 30.078 (30.812)	Top-5 acc 53.516 (54.363)	lr 0.02495
Train [4][1870/3239]	Time 0.569 (0.804)	Data Time 0.002 (0.012)	Loss 3.8225 (4.0074)	Entropy 1.83345 (1.84561)	Top-1 acc 32.031 (30.809)	Top-5 acc 60.156 (54.368)	lr 0.02495
Train [4][1880/3239]	Time 0.517 (0.804)	Data Time 0.001 (0.012)	Loss 4.0457 (4.0070)	Entropy 1.83338 (1.84554)	Top-1 acc 29.688 (30.811)	Top-5 acc 49.609 (54.371)	lr 0.02495
Train [4][1890/3239]	Time 0.557 (0.804)	Data Time 0.001 (0.012)	Loss 4.0947 (4.0074)	Entropy 1.83321 (1.84548)	Top-1 acc 28.906 (30.810)	Top-5 acc 52.734 (54.362)	lr 0.02495
Train [4][1900/3239]	Time 0.550 (0.804)	Data Time 0.001 (0.012)	Loss 3.9280 (4.0072)	Entropy 1.83297 (1.84541)	Top-1 acc 32.422 (30.813)	Top-5 acc 58.594 (54.376)	lr 0.02494
Train [4][1910/3239]	Time 0.512 (0.804)	Data Time 0.001 (0.012)	Loss 4.0944 (4.0073)	Entropy 1.83282 (1.84535)	Top-1 acc 28.906 (30.809)	Top-5 acc 54.688 (54.375)	lr 0.02494
Train [4][1920/3239]	Time 0.538 (0.804)	Data Time 0.001 (0.012)	Loss 3.9592 (4.0075)	Entropy 1.83264 (1.84528)	Top-1 acc 34.766 (30.803)	Top-5 acc 56.250 (54.369)	lr 0.02494
Train [4][1930/3239]	Time 0.483 (0.803)	Data Time 0.001 (0.012)	Loss 4.0089 (4.0075)	Entropy 1.83248 (1.84522)	Top-1 acc 31.641 (30.805)	Top-5 acc 52.344 (54.367)	lr 0.02494
Train [4][1940/3239]	Time 0.548 (0.803)	Data Time 0.001 (0.012)	Loss 4.0186 (4.0076)	Entropy 1.83237 (1.84515)	Top-1 acc 30.859 (30.800)	Top-5 acc 55.469 (54.359)	lr 0.02494
Train [4][1950/3239]	Time 0.534 (0.802)	Data Time 0.001 (0.012)	Loss 3.8640 (4.0076)	Entropy 1.83232 (1.84509)	Top-1 acc 35.938 (30.805)	Top-5 acc 56.250 (54.358)	lr 0.02494
Train [4][1960/3239]	Time 0.580 (0.802)	Data Time 0.001 (0.012)	Loss 3.9032 (4.0076)	Entropy 1.83223 (1.84502)	Top-1 acc 32.422 (30.796)	Top-5 acc 55.078 (54.353)	lr 0.02494
Train [4][1970/3239]	Time 0.569 (0.802)	Data Time 0.002 (0.012)	Loss 3.9759 (4.0074)	Entropy 1.83214 (1.84496)	Top-1 acc 31.641 (30.804)	Top-5 acc 58.984 (54.363)	lr 0.02494
Train [4][1980/3239]	Time 0.483 (0.802)	Data Time 0.001 (0.012)	Loss 4.2258 (4.0074)	Entropy 1.83200 (1.84489)	Top-1 acc 30.078 (30.800)	Top-5 acc 50.391 (54.363)	lr 0.02494
Train [4][1990/3239]	Time 0.564 (0.802)	Data Time 0.001 (0.012)	Loss 4.0713 (4.0077)	Entropy 1.83180 (1.84483)	Top-1 acc 27.344 (30.795)	Top-5 acc 55.078 (54.361)	lr 0.02494
Train [4][2000/3239]	Time 0.506 (0.802)	Data Time 0.002 (0.012)	Loss 4.0994 (4.0078)	Entropy 1.83161 (1.84476)	Top-1 acc 25.000 (30.788)	Top-5 acc 54.688 (54.361)	lr 0.02494
Train [4][2010/3239]	Time 0.506 (0.802)	Data Time 0.001 (0.012)	Loss 4.2080 (4.0079)	Entropy 1.83147 (1.84469)	Top-1 acc 27.344 (30.788)	Top-5 acc 48.828 (54.357)	lr 0.02494
Train [4][2020/3239]	Time 0.510 (0.801)	Data Time 0.001 (0.012)	Loss 4.0816 (4.0080)	Entropy 1.83108 (1.84463)	Top-1 acc 27.734 (30.789)	Top-5 acc 50.781 (54.355)	lr 0.02494
Train [4][2030/3239]	Time 0.456 (0.801)	Data Time 0.001 (0.012)	Loss 4.1256 (4.0078)	Entropy 1.83096 (1.84456)	Top-1 acc 28.516 (30.797)	Top-5 acc 55.859 (54.363)	lr 0.02494
Train [4][2040/3239]	Time 0.650 (0.809)	Data Time 0.006 (0.012)	Loss 4.0666 (4.0082)	Entropy 1.83093 (1.84450)	Top-1 acc 31.250 (30.793)	Top-5 acc 53.906 (54.356)	lr 0.02494
Train [4][2050/3239]	Time 0.597 (0.809)	Data Time 0.002 (0.012)	Loss 3.9783 (4.0081)	Entropy 1.83079 (1.84443)	Top-1 acc 33.984 (30.792)	Top-5 acc 54.688 (54.359)	lr 0.02494
Train [4][2060/3239]	Time 0.529 (0.809)	Data Time 0.001 (0.011)	Loss 4.0115 (4.0081)	Entropy 1.83063 (1.84436)	Top-1 acc 27.344 (30.795)	Top-5 acc 57.422 (54.363)	lr 0.02494
Train [4][2070/3239]	Time 0.480 (0.809)	Data Time 0.003 (0.011)	Loss 3.8839 (4.0083)	Entropy 1.83038 (1.84430)	Top-1 acc 29.688 (30.791)	Top-5 acc 59.766 (54.359)	lr 0.02494
Train [4][2080/3239]	Time 0.398 (0.808)	Data Time 0.001 (0.011)	Loss 3.9420 (4.0081)	Entropy 1.83023 (1.84423)	Top-1 acc 35.938 (30.802)	Top-5 acc 51.562 (54.365)	lr 0.02494
Train [4][2090/3239]	Time 0.290 (0.807)	Data Time 0.001 (0.011)	Loss 4.1258 (4.0082)	Entropy 1.83025 (1.84416)	Top-1 acc 28.125 (30.794)	Top-5 acc 52.734 (54.360)	lr 0.02494
Train [4][2100/3239]	Time 0.506 (0.807)	Data Time 0.001 (0.011)	Loss 3.9585 (4.0080)	Entropy 1.83024 (1.84410)	Top-1 acc 29.688 (30.803)	Top-5 acc 55.859 (54.366)	lr 0.02494
Train [4][2110/3239]	Time 0.548 (0.807)	Data Time 0.002 (0.011)	Loss 3.9600 (4.0081)	Entropy 1.83022 (1.84403)	Top-1 acc 28.906 (30.798)	Top-5 acc 55.469 (54.367)	lr 0.02494
Train [4][2120/3239]	Time 0.398 (0.807)	Data Time 0.001 (0.011)	Loss 4.1567 (4.0083)	Entropy 1.83022 (1.84396)	Top-1 acc 27.734 (30.794)	Top-5 acc 52.734 (54.362)	lr 0.02494
Train [4][2130/3239]	Time 0.534 (0.806)	Data Time 0.001 (0.011)	Loss 3.8469 (4.0084)	Entropy 1.83009 (1.84390)	Top-1 acc 35.156 (30.792)	Top-5 acc 55.078 (54.357)	lr 0.02494
Train [4][2140/3239]	Time 0.555 (0.806)	Data Time 0.002 (0.011)	Loss 4.1763 (4.0083)	Entropy 1.82993 (1.84384)	Top-1 acc 30.078 (30.793)	Top-5 acc 48.047 (54.356)	lr 0.02494
Train [4][2150/3239]	Time 0.626 (0.806)	Data Time 0.001 (0.011)	Loss 3.8607 (4.0086)	Entropy 1.82966 (1.84377)	Top-1 acc 33.203 (30.787)	Top-5 acc 55.859 (54.350)	lr 0.02494
Train [4][2160/3239]	Time 0.432 (0.806)	Data Time 0.001 (0.011)	Loss 4.0709 (4.0086)	Entropy 1.82949 (1.84370)	Top-1 acc 28.125 (30.784)	Top-5 acc 53.516 (54.350)	lr 0.02494
Train [4][2170/3239]	Time 0.598 (0.806)	Data Time 0.001 (0.011)	Loss 4.1600 (4.0084)	Entropy 1.82932 (1.84364)	Top-1 acc 28.906 (30.786)	Top-5 acc 49.609 (54.351)	lr 0.02494
Train [4][2180/3239]	Time 0.461 (0.806)	Data Time 0.001 (0.011)	Loss 4.0196 (4.0084)	Entropy 1.82913 (1.84357)	Top-1 acc 31.641 (30.785)	Top-5 acc 56.641 (54.350)	lr 0.02494
Train [4][2190/3239]	Time 0.502 (0.806)	Data Time 0.001 (0.011)	Loss 4.0900 (4.0085)	Entropy 1.82900 (1.84351)	Top-1 acc 27.734 (30.780)	Top-5 acc 54.297 (54.344)	lr 0.02494
Train [4][2200/3239]	Time 0.565 (0.806)	Data Time 0.001 (0.011)	Loss 3.9722 (4.0082)	Entropy 1.82888 (1.84344)	Top-1 acc 31.641 (30.782)	Top-5 acc 57.031 (54.350)	lr 0.02494
Train [4][2210/3239]	Time 0.492 (0.806)	Data Time 0.001 (0.011)	Loss 3.9945 (4.0084)	Entropy 1.82875 (1.84337)	Top-1 acc 29.688 (30.773)	Top-5 acc 53.516 (54.344)	lr 0.02494
Train [4][2220/3239]	Time 0.658 (0.805)	Data Time 0.002 (0.011)	Loss 3.9485 (4.0082)	Entropy 1.82853 (1.84331)	Top-1 acc 31.250 (30.778)	Top-5 acc 55.859 (54.348)	lr 0.02494
Train [4][2230/3239]	Time 0.532 (0.805)	Data Time 0.001 (0.011)	Loss 3.9283 (4.0080)	Entropy 1.82846 (1.84324)	Top-1 acc 30.469 (30.782)	Top-5 acc 51.953 (54.349)	lr 0.02494
Train [4][2240/3239]	Time 0.535 (0.805)	Data Time 0.002 (0.011)	Loss 3.8755 (4.0082)	Entropy 1.82822 (1.84318)	Top-1 acc 31.641 (30.778)	Top-5 acc 54.688 (54.342)	lr 0.02494
Train [4][2250/3239]	Time 0.539 (0.805)	Data Time 0.001 (0.011)	Loss 3.9880 (4.0083)	Entropy 1.82805 (1.84311)	Top-1 acc 31.250 (30.771)	Top-5 acc 55.469 (54.340)	lr 0.02494
Train [4][2260/3239]	Time 0.540 (0.805)	Data Time 0.001 (0.011)	Loss 3.8641 (4.0081)	Entropy 1.82783 (1.84304)	Top-1 acc 34.375 (30.773)	Top-5 acc 60.938 (54.345)	lr 0.02494
Train [4][2270/3239]	Time 0.614 (0.804)	Data Time 0.001 (0.011)	Loss 4.0763 (4.0081)	Entropy 1.82772 (1.84297)	Top-1 acc 25.781 (30.770)	Top-5 acc 52.734 (54.345)	lr 0.02494
Train [4][2280/3239]	Time 0.531 (0.804)	Data Time 0.001 (0.011)	Loss 3.9767 (4.0081)	Entropy 1.82766 (1.84291)	Top-1 acc 33.594 (30.771)	Top-5 acc 55.859 (54.347)	lr 0.02494
Train [4][2290/3239]	Time 0.574 (0.804)	Data Time 0.001 (0.011)	Loss 3.8823 (4.0079)	Entropy 1.82748 (1.84284)	Top-1 acc 33.203 (30.775)	Top-5 acc 59.766 (54.353)	lr 0.02494
Train [4][2300/3239]	Time 0.524 (0.804)	Data Time 0.001 (0.011)	Loss 4.0173 (4.0075)	Entropy 1.82730 (1.84277)	Top-1 acc 27.734 (30.780)	Top-5 acc 50.391 (54.358)	lr 0.02494
Train [4][2310/3239]	Time 0.496 (0.804)	Data Time 0.001 (0.011)	Loss 4.1600 (4.0073)	Entropy 1.82723 (1.84271)	Top-1 acc 26.953 (30.785)	Top-5 acc 52.734 (54.368)	lr 0.02494
Train [4][2320/3239]	Time 0.572 (0.804)	Data Time 0.001 (0.011)	Loss 4.1310 (4.0076)	Entropy 1.82705 (1.84264)	Top-1 acc 30.469 (30.779)	Top-5 acc 52.734 (54.362)	lr 0.02494
Train [4][2330/3239]	Time 0.485 (0.804)	Data Time 0.001 (0.011)	Loss 3.9444 (4.0075)	Entropy 1.82702 (1.84257)	Top-1 acc 31.250 (30.782)	Top-5 acc 51.562 (54.365)	lr 0.02494
Train [4][2340/3239]	Time 0.501 (0.804)	Data Time 0.001 (0.011)	Loss 4.1529 (4.0072)	Entropy 1.82691 (1.84251)	Top-1 acc 23.828 (30.784)	Top-5 acc 48.047 (54.368)	lr 0.02494
Train [4][2350/3239]	Time 0.641 (0.804)	Data Time 0.001 (0.011)	Loss 4.1701 (4.0072)	Entropy 1.82682 (1.84244)	Top-1 acc 25.000 (30.782)	Top-5 acc 52.344 (54.367)	lr 0.02494
Train [4][2360/3239]	Time 0.546 (0.804)	Data Time 0.001 (0.011)	Loss 3.9516 (4.0071)	Entropy 1.82666 (1.84237)	Top-1 acc 33.594 (30.788)	Top-5 acc 57.031 (54.368)	lr 0.02494
Train [4][2370/3239]	Time 0.551 (0.804)	Data Time 0.001 (0.010)	Loss 4.0439 (4.0070)	Entropy 1.82651 (1.84231)	Top-1 acc 32.031 (30.788)	Top-5 acc 52.734 (54.370)	lr 0.02494
Train [4][2380/3239]	Time 0.505 (0.804)	Data Time 0.001 (0.010)	Loss 4.1402 (4.0071)	Entropy 1.82645 (1.84224)	Top-1 acc 27.734 (30.783)	Top-5 acc 51.562 (54.367)	lr 0.02494
Train [4][2390/3239]	Time 0.569 (0.804)	Data Time 0.001 (0.010)	Loss 3.9703 (4.0069)	Entropy 1.82630 (1.84217)	Top-1 acc 28.906 (30.785)	Top-5 acc 56.641 (54.373)	lr 0.02494
Train [4][2400/3239]	Time 0.683 (0.803)	Data Time 0.001 (0.010)	Loss 4.0940 (4.0071)	Entropy 1.82622 (1.84211)	Top-1 acc 30.469 (30.782)	Top-5 acc 51.953 (54.370)	lr 0.02494
Train [4][2410/3239]	Time 0.580 (0.803)	Data Time 0.001 (0.010)	Loss 3.9386 (4.0070)	Entropy 1.82618 (1.84204)	Top-1 acc 31.250 (30.781)	Top-5 acc 55.469 (54.376)	lr 0.02494
Train [4][2420/3239]	Time 0.537 (0.803)	Data Time 0.001 (0.010)	Loss 3.8636 (4.0070)	Entropy 1.82596 (1.84198)	Top-1 acc 32.031 (30.783)	Top-5 acc 62.891 (54.380)	lr 0.02494
Train [4][2430/3239]	Time 0.493 (0.803)	Data Time 0.001 (0.010)	Loss 4.1530 (4.0071)	Entropy 1.82586 (1.84191)	Top-1 acc 25.781 (30.779)	Top-5 acc 50.781 (54.374)	lr 0.02494
Train [4][2440/3239]	Time 0.526 (0.803)	Data Time 0.002 (0.010)	Loss 3.8744 (4.0070)	Entropy 1.82575 (1.84184)	Top-1 acc 32.812 (30.781)	Top-5 acc 60.547 (54.379)	lr 0.02494
Train [4][2450/3239]	Time 0.463 (0.802)	Data Time 0.001 (0.010)	Loss 4.0162 (4.0070)	Entropy 1.82566 (1.84178)	Top-1 acc 31.641 (30.781)	Top-5 acc 53.906 (54.378)	lr 0.02494
Train [4][2460/3239]	Time 0.514 (0.802)	Data Time 0.001 (0.010)	Loss 3.9595 (4.0065)	Entropy 1.82563 (1.84171)	Top-1 acc 30.859 (30.787)	Top-5 acc 55.469 (54.388)	lr 0.02494
Train [4][2470/3239]	Time 0.517 (0.802)	Data Time 0.001 (0.010)	Loss 4.0620 (4.0066)	Entropy 1.82553 (1.84165)	Top-1 acc 32.812 (30.785)	Top-5 acc 53.516 (54.387)	lr 0.02494
Train [4][2480/3239]	Time 0.679 (0.802)	Data Time 0.002 (0.010)	Loss 3.9254 (4.0065)	Entropy 1.82547 (1.84158)	Top-1 acc 28.125 (30.783)	Top-5 acc 56.641 (54.394)	lr 0.02494
Train [4][2490/3239]	Time 0.535 (0.802)	Data Time 0.001 (0.010)	Loss 3.9684 (4.0063)	Entropy 1.82545 (1.84152)	Top-1 acc 33.594 (30.784)	Top-5 acc 55.078 (54.399)	lr 0.02494
Train [4][2500/3239]	Time 0.626 (0.802)	Data Time 0.001 (0.010)	Loss 4.0342 (4.0063)	Entropy 1.82513 (1.84145)	Top-1 acc 28.516 (30.779)	Top-5 acc 55.078 (54.402)	lr 0.02494
Train [4][2510/3239]	Time 0.505 (0.802)	Data Time 0.001 (0.010)	Loss 3.9896 (4.0063)	Entropy 1.82506 (1.84139)	Top-1 acc 27.344 (30.776)	Top-5 acc 52.734 (54.403)	lr 0.02494
Train [4][2520/3239]	Time 0.554 (0.802)	Data Time 0.003 (0.010)	Loss 4.0080 (4.0065)	Entropy 1.82484 (1.84132)	Top-1 acc 30.859 (30.772)	Top-5 acc 55.859 (54.402)	lr 0.02494
Train [4][2530/3239]	Time 0.688 (0.802)	Data Time 0.001 (0.010)	Loss 3.9451 (4.0066)	Entropy 1.82461 (1.84126)	Top-1 acc 35.547 (30.770)	Top-5 acc 57.422 (54.400)	lr 0.02494
Train [4][2540/3239]	Time 0.582 (0.802)	Data Time 0.001 (0.010)	Loss 3.8976 (4.0065)	Entropy 1.82442 (1.84119)	Top-1 acc 31.641 (30.775)	Top-5 acc 53.125 (54.403)	lr 0.02494
Train [4][2550/3239]	Time 0.525 (0.801)	Data Time 0.001 (0.010)	Loss 4.1143 (4.0065)	Entropy 1.82431 (1.84113)	Top-1 acc 28.906 (30.778)	Top-5 acc 53.906 (54.405)	lr 0.02494
Train [4][2560/3239]	Time 0.553 (0.801)	Data Time 0.001 (0.010)	Loss 4.0199 (4.0065)	Entropy 1.82409 (1.84106)	Top-1 acc 28.125 (30.777)	Top-5 acc 53.906 (54.403)	lr 0.02494
Train [4][2570/3239]	Time 0.511 (0.801)	Data Time 0.001 (0.010)	Loss 4.0676 (4.0064)	Entropy 1.82398 (1.84099)	Top-1 acc 26.172 (30.776)	Top-5 acc 51.953 (54.405)	lr 0.02494
Train [4][2580/3239]	Time 0.424 (0.801)	Data Time 0.001 (0.010)	Loss 4.0553 (4.0065)	Entropy 1.82395 (1.84093)	Top-1 acc 30.469 (30.774)	Top-5 acc 55.469 (54.407)	lr 0.02494
Train [4][2590/3239]	Time 0.523 (0.801)	Data Time 0.001 (0.010)	Loss 3.7855 (4.0065)	Entropy 1.82386 (1.84086)	Top-1 acc 37.891 (30.776)	Top-5 acc 59.375 (54.410)	lr 0.02494
Train [4][2600/3239]	Time 0.529 (0.801)	Data Time 0.001 (0.010)	Loss 3.8865 (4.0064)	Entropy 1.82379 (1.84080)	Top-1 acc 32.812 (30.776)	Top-5 acc 57.031 (54.413)	lr 0.02494
Train [4][2610/3239]	Time 0.603 (0.801)	Data Time 0.001 (0.010)	Loss 3.9843 (4.0062)	Entropy 1.82356 (1.84073)	Top-1 acc 30.078 (30.779)	Top-5 acc 53.516 (54.416)	lr 0.02494
Train [4][2620/3239]	Time 0.549 (0.801)	Data Time 0.001 (0.010)	Loss 3.9331 (4.0061)	Entropy 1.82348 (1.84066)	Top-1 acc 31.641 (30.784)	Top-5 acc 54.688 (54.422)	lr 0.02494
Train [4][2630/3239]	Time 0.481 (0.800)	Data Time 0.001 (0.010)	Loss 4.0882 (4.0061)	Entropy 1.82341 (1.84060)	Top-1 acc 31.641 (30.785)	Top-5 acc 53.125 (54.423)	lr 0.02494
Train [4][2640/3239]	Time 0.516 (0.800)	Data Time 0.001 (0.010)	Loss 4.0699 (4.0062)	Entropy 1.82339 (1.84053)	Top-1 acc 32.031 (30.786)	Top-5 acc 51.172 (54.423)	lr 0.02494
Train [4][2650/3239]	Time 0.495 (0.800)	Data Time 0.001 (0.010)	Loss 3.8657 (4.0060)	Entropy 1.82317 (1.84047)	Top-1 acc 35.156 (30.790)	Top-5 acc 55.469 (54.423)	lr 0.02494
Train [4][2660/3239]	Time 0.386 (0.800)	Data Time 0.001 (0.010)	Loss 4.0212 (4.0061)	Entropy 1.82300 (1.84040)	Top-1 acc 30.469 (30.788)	Top-5 acc 51.953 (54.420)	lr 0.02494
Train [4][2670/3239]	Time 0.583 (0.800)	Data Time 0.001 (0.010)	Loss 4.0268 (4.0064)	Entropy 1.82295 (1.84034)	Top-1 acc 28.125 (30.783)	Top-5 acc 53.906 (54.410)	lr 0.02494
Train [4][2680/3239]	Time 0.584 (0.800)	Data Time 0.003 (0.010)	Loss 4.2783 (4.0067)	Entropy 1.82283 (1.84027)	Top-1 acc 26.172 (30.780)	Top-5 acc 46.484 (54.402)	lr 0.02494
Train [4][2690/3239]	Time 0.636 (0.800)	Data Time 0.001 (0.010)	Loss 3.9314 (4.0065)	Entropy 1.82268 (1.84021)	Top-1 acc 32.031 (30.784)	Top-5 acc 55.859 (54.408)	lr 0.02494
Train [4][2700/3239]	Time 0.516 (0.806)	Data Time 0.002 (0.010)	Loss 3.9958 (4.0064)	Entropy 1.82258 (1.84014)	Top-1 acc 32.812 (30.788)	Top-5 acc 55.078 (54.411)	lr 0.02494
Train [4][2710/3239]	Time 0.538 (0.806)	Data Time 0.001 (0.010)	Loss 3.9699 (4.0062)	Entropy 1.82248 (1.84008)	Top-1 acc 32.031 (30.790)	Top-5 acc 52.344 (54.413)	lr 0.02494
Train [4][2720/3239]	Time 0.561 (0.806)	Data Time 0.001 (0.010)	Loss 4.0706 (4.0062)	Entropy 1.82228 (1.84001)	Top-1 acc 29.688 (30.791)	Top-5 acc 52.734 (54.417)	lr 0.02494
Train [4][2730/3239]	Time 0.355 (0.806)	Data Time 0.001 (0.010)	Loss 3.9530 (4.0062)	Entropy 1.82227 (1.83995)	Top-1 acc 31.250 (30.787)	Top-5 acc 57.031 (54.415)	lr 0.02494
Train [4][2740/3239]	Time 0.634 (0.805)	Data Time 0.001 (0.010)	Loss 3.9342 (4.0063)	Entropy 1.82221 (1.83988)	Top-1 acc 33.203 (30.782)	Top-5 acc 57.422 (54.416)	lr 0.02494
Train [4][2750/3239]	Time 0.552 (0.805)	Data Time 0.002 (0.010)	Loss 3.8699 (4.0062)	Entropy 1.82220 (1.83982)	Top-1 acc 31.641 (30.786)	Top-5 acc 58.594 (54.417)	lr 0.02494
Train [4][2760/3239]	Time 0.528 (0.805)	Data Time 0.001 (0.009)	Loss 4.0056 (4.0060)	Entropy 1.82216 (1.83976)	Top-1 acc 31.250 (30.790)	Top-5 acc 55.469 (54.422)	lr 0.02494
Train [4][2770/3239]	Time 0.527 (0.805)	Data Time 0.001 (0.009)	Loss 4.0522 (4.0060)	Entropy 1.82211 (1.83969)	Top-1 acc 31.250 (30.789)	Top-5 acc 55.859 (54.421)	lr 0.02494
Train [4][2780/3239]	Time 0.572 (0.805)	Data Time 0.001 (0.009)	Loss 3.7875 (4.0058)	Entropy 1.82189 (1.83963)	Top-1 acc 36.328 (30.791)	Top-5 acc 57.422 (54.426)	lr 0.02494
Train [4][2790/3239]	Time 0.514 (0.805)	Data Time 0.001 (0.009)	Loss 4.0999 (4.0058)	Entropy 1.82182 (1.83957)	Top-1 acc 29.688 (30.792)	Top-5 acc 53.125 (54.428)	lr 0.02494
Train [4][2800/3239]	Time 0.513 (0.805)	Data Time 0.002 (0.009)	Loss 4.1089 (4.0058)	Entropy 1.82175 (1.83950)	Top-1 acc 26.562 (30.791)	Top-5 acc 50.000 (54.430)	lr 0.02494
Train [4][2810/3239]	Time 0.585 (0.805)	Data Time 0.002 (0.009)	Loss 3.7989 (4.0055)	Entropy 1.82151 (1.83944)	Top-1 acc 32.422 (30.794)	Top-5 acc 58.203 (54.435)	lr 0.02494
Train [4][2820/3239]	Time 0.469 (0.805)	Data Time 0.001 (0.009)	Loss 4.1296 (4.0057)	Entropy 1.82126 (1.83937)	Top-1 acc 31.250 (30.797)	Top-5 acc 51.172 (54.435)	lr 0.02494
Train [4][2830/3239]	Time 0.565 (0.804)	Data Time 0.001 (0.009)	Loss 4.0200 (4.0057)	Entropy 1.82106 (1.83931)	Top-1 acc 36.719 (30.793)	Top-5 acc 56.250 (54.435)	lr 0.02494
Train [4][2840/3239]	Time 0.520 (0.804)	Data Time 0.001 (0.009)	Loss 3.9506 (4.0055)	Entropy 1.82088 (1.83925)	Top-1 acc 30.078 (30.798)	Top-5 acc 52.344 (54.438)	lr 0.02494
Train [4][2850/3239]	Time 0.559 (0.804)	Data Time 0.001 (0.009)	Loss 3.9664 (4.0053)	Entropy 1.82084 (1.83918)	Top-1 acc 30.078 (30.802)	Top-5 acc 54.688 (54.446)	lr 0.02494
Train [4][2860/3239]	Time 0.462 (0.804)	Data Time 0.001 (0.009)	Loss 4.0549 (4.0053)	Entropy 1.82066 (1.83912)	Top-1 acc 27.734 (30.803)	Top-5 acc 54.688 (54.445)	lr 0.02494
Train [4][2870/3239]	Time 0.562 (0.804)	Data Time 0.001 (0.009)	Loss 3.8928 (4.0053)	Entropy 1.82036 (1.83905)	Top-1 acc 30.078 (30.802)	Top-5 acc 57.422 (54.446)	lr 0.02494
Train [4][2880/3239]	Time 0.518 (0.804)	Data Time 0.001 (0.009)	Loss 4.0929 (4.0053)	Entropy 1.82032 (1.83899)	Top-1 acc 26.953 (30.803)	Top-5 acc 54.297 (54.445)	lr 0.02494
Train [4][2890/3239]	Time 0.565 (0.804)	Data Time 0.002 (0.009)	Loss 4.0034 (4.0055)	Entropy 1.82010 (1.83892)	Top-1 acc 30.469 (30.799)	Top-5 acc 52.734 (54.443)	lr 0.02494
Train [4][2900/3239]	Time 0.547 (0.804)	Data Time 0.001 (0.009)	Loss 3.8528 (4.0055)	Entropy 1.81989 (1.83886)	Top-1 acc 34.375 (30.800)	Top-5 acc 60.547 (54.441)	lr 0.02494
Train [4][2910/3239]	Time 0.567 (0.804)	Data Time 0.002 (0.009)	Loss 3.8595 (4.0055)	Entropy 1.81970 (1.83879)	Top-1 acc 31.641 (30.802)	Top-5 acc 55.469 (54.439)	lr 0.02493
Train [4][2920/3239]	Time 0.566 (0.804)	Data Time 0.001 (0.009)	Loss 3.7906 (4.0053)	Entropy 1.81949 (1.83873)	Top-1 acc 33.203 (30.806)	Top-5 acc 57.422 (54.443)	lr 0.02493
Train [4][2930/3239]	Time 0.540 (0.804)	Data Time 0.001 (0.009)	Loss 4.0437 (4.0053)	Entropy 1.81925 (1.83866)	Top-1 acc 33.594 (30.807)	Top-5 acc 53.906 (54.442)	lr 0.02493
Train [4][2940/3239]	Time 0.499 (0.804)	Data Time 0.001 (0.009)	Loss 4.0735 (4.0054)	Entropy 1.81899 (1.83859)	Top-1 acc 30.859 (30.804)	Top-5 acc 54.688 (54.436)	lr 0.02493
Train [4][2950/3239]	Time 0.511 (0.804)	Data Time 0.001 (0.009)	Loss 4.0813 (4.0054)	Entropy 1.81883 (1.83853)	Top-1 acc 26.172 (30.803)	Top-5 acc 55.859 (54.438)	lr 0.02493
Train [4][2960/3239]	Time 0.529 (0.804)	Data Time 0.001 (0.009)	Loss 3.7708 (4.0056)	Entropy 1.81881 (1.83846)	Top-1 acc 37.891 (30.803)	Top-5 acc 58.203 (54.434)	lr 0.02493
Train [4][2970/3239]	Time 0.660 (0.803)	Data Time 0.001 (0.009)	Loss 4.0397 (4.0056)	Entropy 1.81861 (1.83839)	Top-1 acc 30.469 (30.802)	Top-5 acc 55.078 (54.435)	lr 0.02493
Train [4][2980/3239]	Time 0.527 (0.803)	Data Time 0.001 (0.009)	Loss 4.0816 (4.0055)	Entropy 1.81857 (1.83833)	Top-1 acc 27.734 (30.802)	Top-5 acc 51.562 (54.436)	lr 0.02493
Train [4][2990/3239]	Time 0.440 (0.803)	Data Time 0.001 (0.009)	Loss 3.9692 (4.0055)	Entropy 1.81841 (1.83826)	Top-1 acc 29.297 (30.801)	Top-5 acc 53.906 (54.436)	lr 0.02493
Train [4][3000/3239]	Time 0.565 (0.803)	Data Time 0.002 (0.009)	Loss 4.1374 (4.0053)	Entropy 1.81818 (1.83819)	Top-1 acc 33.984 (30.805)	Top-5 acc 51.172 (54.442)	lr 0.02493
Train [4][3010/3239]	Time 0.568 (0.803)	Data Time 0.001 (0.009)	Loss 3.8731 (4.0052)	Entropy 1.81804 (1.83813)	Top-1 acc 34.375 (30.808)	Top-5 acc 57.422 (54.442)	lr 0.02493
Train [4][3020/3239]	Time 0.567 (0.803)	Data Time 0.001 (0.009)	Loss 4.2843 (4.0054)	Entropy 1.81787 (1.83806)	Top-1 acc 29.297 (30.810)	Top-5 acc 47.266 (54.441)	lr 0.02493
Train [4][3030/3239]	Time 0.554 (0.803)	Data Time 0.001 (0.009)	Loss 3.8825 (4.0052)	Entropy 1.81776 (1.83799)	Top-1 acc 31.250 (30.811)	Top-5 acc 56.641 (54.442)	lr 0.02493
Train [4][3040/3239]	Time 0.492 (0.803)	Data Time 0.001 (0.009)	Loss 3.9317 (4.0052)	Entropy 1.81757 (1.83793)	Top-1 acc 33.203 (30.811)	Top-5 acc 55.859 (54.443)	lr 0.02493
Train [4][3050/3239]	Time 0.491 (0.803)	Data Time 0.001 (0.009)	Loss 4.0154 (4.0051)	Entropy 1.81737 (1.83786)	Top-1 acc 32.422 (30.813)	Top-5 acc 52.344 (54.446)	lr 0.02493
Train [4][3060/3239]	Time 0.546 (0.803)	Data Time 0.001 (0.009)	Loss 4.1689 (4.0049)	Entropy 1.81717 (1.83779)	Top-1 acc 28.125 (30.815)	Top-5 acc 49.219 (54.447)	lr 0.02493
Train [4][3070/3239]	Time 0.500 (0.803)	Data Time 0.001 (0.009)	Loss 3.9621 (4.0048)	Entropy 1.81713 (1.83773)	Top-1 acc 33.203 (30.816)	Top-5 acc 55.078 (54.450)	lr 0.02493
Train [4][3080/3239]	Time 0.514 (0.803)	Data Time 0.002 (0.009)	Loss 4.0593 (4.0048)	Entropy 1.81700 (1.83766)	Top-1 acc 29.297 (30.814)	Top-5 acc 52.344 (54.446)	lr 0.02493
Train [4][3090/3239]	Time 0.510 (0.802)	Data Time 0.001 (0.009)	Loss 4.0069 (4.0048)	Entropy 1.81694 (1.83759)	Top-1 acc 32.422 (30.812)	Top-5 acc 55.078 (54.449)	lr 0.02493
Train [4][3100/3239]	Time 0.595 (0.802)	Data Time 0.001 (0.009)	Loss 4.0947 (4.0049)	Entropy 1.81679 (1.83753)	Top-1 acc 27.344 (30.807)	Top-5 acc 53.125 (54.447)	lr 0.02493
Train [4][3110/3239]	Time 0.574 (0.802)	Data Time 0.001 (0.009)	Loss 4.0069 (4.0047)	Entropy 1.81683 (1.83746)	Top-1 acc 30.469 (30.811)	Top-5 acc 50.391 (54.451)	lr 0.02493
Train [4][3120/3239]	Time 0.481 (0.802)	Data Time 0.001 (0.009)	Loss 3.9264 (4.0047)	Entropy 1.81672 (1.83739)	Top-1 acc 32.031 (30.811)	Top-5 acc 57.812 (54.452)	lr 0.02493
Train [4][3130/3239]	Time 0.560 (0.802)	Data Time 0.002 (0.009)	Loss 4.0822 (4.0046)	Entropy 1.81657 (1.83733)	Top-1 acc 27.734 (30.812)	Top-5 acc 52.734 (54.452)	lr 0.02493
Train [4][3140/3239]	Time 0.469 (0.802)	Data Time 0.001 (0.009)	Loss 4.1303 (4.0046)	Entropy 1.81631 (1.83726)	Top-1 acc 30.469 (30.814)	Top-5 acc 51.562 (54.452)	lr 0.02493
Train [4][3150/3239]	Time 0.451 (0.802)	Data Time 0.001 (0.009)	Loss 4.0680 (4.0047)	Entropy 1.81621 (1.83719)	Top-1 acc 32.422 (30.814)	Top-5 acc 56.641 (54.454)	lr 0.02493
Train [4][3160/3239]	Time 0.472 (0.802)	Data Time 0.001 (0.009)	Loss 4.0666 (4.0049)	Entropy 1.81600 (1.83713)	Top-1 acc 31.250 (30.810)	Top-5 acc 52.344 (54.447)	lr 0.02493
Train [4][3170/3239]	Time 0.535 (0.801)	Data Time 0.001 (0.009)	Loss 3.9420 (4.0049)	Entropy 1.81592 (1.83706)	Top-1 acc 30.078 (30.809)	Top-5 acc 53.906 (54.443)	lr 0.02493
Train [4][3180/3239]	Time 0.509 (0.801)	Data Time 0.000 (0.009)	Loss 4.1684 (4.0049)	Entropy 1.81570 (1.83699)	Top-1 acc 26.562 (30.807)	Top-5 acc 52.734 (54.445)	lr 0.02493
Train [4][3190/3239]	Time 0.458 (0.801)	Data Time 0.000 (0.009)	Loss 3.9866 (4.0047)	Entropy 1.81546 (1.83693)	Top-1 acc 26.953 (30.811)	Top-5 acc 54.688 (54.448)	lr 0.02493
Train [4][3200/3239]	Time 0.551 (0.801)	Data Time 0.000 (0.009)	Loss 4.0103 (4.0047)	Entropy 1.81530 (1.83686)	Top-1 acc 32.422 (30.813)	Top-5 acc 55.078 (54.450)	lr 0.02493
Train [4][3210/3239]	Time 0.483 (0.801)	Data Time 0.000 (0.009)	Loss 3.9239 (4.0046)	Entropy 1.81519 (1.83679)	Top-1 acc 32.031 (30.815)	Top-5 acc 57.812 (54.451)	lr 0.02493
Train [4][3220/3239]	Time 0.550 (0.801)	Data Time 0.000 (0.009)	Loss 3.8858 (4.0043)	Entropy 1.81502 (1.83672)	Top-1 acc 30.078 (30.818)	Top-5 acc 56.250 (54.456)	lr 0.02493
Train [4][3230/3239]	Time 0.473 (0.801)	Data Time 0.000 (0.009)	Loss 3.6904 (4.0042)	Entropy 1.81500 (1.83666)	Top-1 acc 37.109 (30.823)	Top-5 acc 61.719 (54.460)	lr 0.02493
Train [4][3239/3239]	Time 1.392 (0.801)	Data Time 0.000 (0.009)	Loss 4.0367 (4.0043)	Entropy 1.81491 (1.83660)	Top-1 acc 35.802 (30.823)	Top-5 acc 54.321 (54.459)	lr 0.02493
==========Valid [4/120]	loss 2.872	top-1 acc 39.320 (39.320)	top-5 acc 64.463	Train top-1 30.823	top-5 54.459	Entropy 1.81491	Latency-None: 0.000ms	Flops: 539.76M
Train [5][0/3239]	Time 17.393 (17.393)	Data Time 15.187 (15.187)	Loss 3.8581 (3.8581)	Entropy 1.81471 (1.81471)	Top-1 acc 29.688 (29.688)	Top-5 acc 55.859 (55.859)	lr 0.02493
Train [5][10/3239]	Time 0.435 (2.332)	Data Time 0.001 (1.382)	Loss 3.9502 (3.9489)	Entropy 1.81465 (1.81469)	Top-1 acc 33.203 (31.747)	Top-5 acc 60.156 (55.717)	lr 0.02493
Train [5][20/3239]	Time 0.638 (1.590)	Data Time 0.001 (0.726)	Loss 3.8704 (3.9608)	Entropy 1.81452 (1.81463)	Top-1 acc 35.938 (31.864)	Top-5 acc 55.859 (55.264)	lr 0.02493
Train [5][30/3239]	Time 0.574 (1.325)	Data Time 0.001 (0.492)	Loss 3.9308 (3.9547)	Entropy 1.81433 (1.81457)	Top-1 acc 31.641 (31.666)	Top-5 acc 54.297 (55.129)	lr 0.02493
Train [5][40/3239]	Time 0.508 (1.190)	Data Time 0.001 (0.373)	Loss 3.9746 (3.9706)	Entropy 1.81411 (1.81449)	Top-1 acc 32.422 (31.421)	Top-5 acc 52.734 (54.869)	lr 0.02493
Train [5][50/3239]	Time 0.654 (1.115)	Data Time 0.001 (0.300)	Loss 3.9328 (3.9731)	Entropy 1.81407 (1.81441)	Top-1 acc 32.812 (31.533)	Top-5 acc 61.328 (55.063)	lr 0.02493
Train [5][60/3239]	Time 0.512 (1.062)	Data Time 0.001 (0.251)	Loss 4.0286 (3.9768)	Entropy 1.81407 (1.81435)	Top-1 acc 28.516 (31.513)	Top-5 acc 51.172 (55.020)	lr 0.02493
Train [5][70/3239]	Time 0.609 (1.025)	Data Time 0.001 (0.216)	Loss 3.9654 (3.9784)	Entropy 1.81398 (1.81430)	Top-1 acc 32.031 (31.481)	Top-5 acc 55.078 (54.996)	lr 0.02493
Train [5][80/3239]	Time 0.531 (0.993)	Data Time 0.001 (0.189)	Loss 3.9911 (3.9716)	Entropy 1.81387 (1.81425)	Top-1 acc 34.375 (31.641)	Top-5 acc 53.516 (55.179)	lr 0.02493
Train [5][90/3239]	Time 0.499 (0.970)	Data Time 0.002 (0.169)	Loss 3.9954 (3.9737)	Entropy 1.81384 (1.81421)	Top-1 acc 31.641 (31.636)	Top-5 acc 52.344 (55.134)	lr 0.02493
Train [5][100/3239]	Time 0.511 (0.951)	Data Time 0.001 (0.153)	Loss 4.0639 (3.9758)	Entropy 1.81369 (1.81417)	Top-1 acc 28.516 (31.606)	Top-5 acc 53.125 (55.051)	lr 0.02493
Train [5][110/3239]	Time 0.579 (1.080)	Data Time 0.026 (0.139)	Loss 4.0692 (3.9752)	Entropy 1.81362 (1.81412)	Top-1 acc 28.125 (31.609)	Top-5 acc 52.344 (55.068)	lr 0.02493
Train [5][120/3239]	Time 0.479 (1.059)	Data Time 0.003 (0.129)	Loss 3.9942 (3.9799)	Entropy 1.81335 (1.81407)	Top-1 acc 32.031 (31.541)	Top-5 acc 55.469 (55.010)	lr 0.02493
Train [5][130/3239]	Time 0.570 (1.039)	Data Time 0.001 (0.119)	Loss 3.9414 (3.9809)	Entropy 1.81304 (1.81400)	Top-1 acc 30.859 (31.465)	Top-5 acc 54.688 (54.962)	lr 0.02493
Train [5][140/3239]	Time 0.524 (1.020)	Data Time 0.001 (0.111)	Loss 4.0928 (3.9824)	Entropy 1.81290 (1.81393)	Top-1 acc 26.562 (31.427)	Top-5 acc 52.734 (54.923)	lr 0.02493
Train [5][150/3239]	Time 0.543 (1.004)	Data Time 0.001 (0.104)	Loss 4.0465 (3.9822)	Entropy 1.81279 (1.81386)	Top-1 acc 30.859 (31.359)	Top-5 acc 54.688 (54.905)	lr 0.02493
Train [5][160/3239]	Time 0.465 (0.990)	Data Time 0.001 (0.097)	Loss 3.8474 (3.9834)	Entropy 1.81271 (1.81379)	Top-1 acc 34.375 (31.318)	Top-5 acc 59.375 (54.930)	lr 0.02493
Train [5][170/3239]	Time 0.581 (0.979)	Data Time 0.001 (0.092)	Loss 4.0404 (3.9847)	Entropy 1.81261 (1.81373)	Top-1 acc 29.297 (31.287)	Top-5 acc 55.469 (54.921)	lr 0.02493
Train [5][180/3239]	Time 0.517 (0.969)	Data Time 0.001 (0.087)	Loss 3.9375 (3.9823)	Entropy 1.81253 (1.81366)	Top-1 acc 31.641 (31.317)	Top-5 acc 54.688 (55.000)	lr 0.02493
Train [5][190/3239]	Time 0.582 (0.960)	Data Time 0.002 (0.082)	Loss 3.9141 (3.9815)	Entropy 1.81243 (1.81360)	Top-1 acc 37.109 (31.379)	Top-5 acc 57.812 (55.039)	lr 0.02493
Train [5][200/3239]	Time 0.581 (0.952)	Data Time 0.001 (0.078)	Loss 3.8606 (3.9771)	Entropy 1.81238 (1.81354)	Top-1 acc 32.422 (31.431)	Top-5 acc 59.375 (55.156)	lr 0.02493
Train [5][210/3239]	Time 0.536 (0.943)	Data Time 0.001 (0.075)	Loss 4.0973 (3.9756)	Entropy 1.81236 (1.81349)	Top-1 acc 27.344 (31.483)	Top-5 acc 49.219 (55.163)	lr 0.02493
Train [5][220/3239]	Time 0.643 (0.936)	Data Time 0.001 (0.072)	Loss 4.0274 (3.9736)	Entropy 1.81224 (1.81344)	Top-1 acc 30.469 (31.478)	Top-5 acc 59.375 (55.205)	lr 0.02493
Train [5][230/3239]	Time 0.509 (0.929)	Data Time 0.001 (0.069)	Loss 3.9501 (3.9732)	Entropy 1.81203 (1.81338)	Top-1 acc 30.859 (31.485)	Top-5 acc 58.984 (55.205)	lr 0.02493
Train [5][240/3239]	Time 0.524 (0.923)	Data Time 0.001 (0.066)	Loss 4.0842 (3.9757)	Entropy 1.81197 (1.81332)	Top-1 acc 29.688 (31.425)	Top-5 acc 53.125 (55.128)	lr 0.02493
Train [5][250/3239]	Time 0.557 (0.918)	Data Time 0.001 (0.063)	Loss 4.1582 (3.9756)	Entropy 1.81184 (1.81327)	Top-1 acc 29.688 (31.409)	Top-5 acc 50.391 (55.134)	lr 0.02493
Train [5][260/3239]	Time 0.435 (0.912)	Data Time 0.001 (0.061)	Loss 3.8971 (3.9760)	Entropy 1.81165 (1.81321)	Top-1 acc 33.984 (31.410)	Top-5 acc 56.641 (55.139)	lr 0.02493
Train [5][270/3239]	Time 0.604 (0.907)	Data Time 0.002 (0.059)	Loss 4.0687 (3.9772)	Entropy 1.81149 (1.81315)	Top-1 acc 29.688 (31.394)	Top-5 acc 52.734 (55.107)	lr 0.02493
Train [5][280/3239]	Time 0.563 (0.901)	Data Time 0.001 (0.057)	Loss 4.0212 (3.9787)	Entropy 1.81148 (1.81309)	Top-1 acc 28.906 (31.326)	Top-5 acc 51.562 (55.071)	lr 0.02493
Train [5][290/3239]	Time 0.427 (0.894)	Data Time 0.001 (0.055)	Loss 3.8900 (3.9771)	Entropy 1.81123 (1.81303)	Top-1 acc 33.203 (31.371)	Top-5 acc 56.641 (55.082)	lr 0.02493
Train [5][300/3239]	Time 0.565 (0.891)	Data Time 0.001 (0.054)	Loss 3.9021 (3.9743)	Entropy 1.81108 (1.81297)	Top-1 acc 33.984 (31.425)	Top-5 acc 56.250 (55.162)	lr 0.02493
Train [5][310/3239]	Time 0.593 (0.888)	Data Time 0.001 (0.052)	Loss 3.9281 (3.9754)	Entropy 1.81089 (1.81291)	Top-1 acc 28.516 (31.392)	Top-5 acc 55.078 (55.135)	lr 0.02493
Train [5][320/3239]	Time 0.524 (0.885)	Data Time 0.001 (0.050)	Loss 3.9329 (3.9763)	Entropy 1.81091 (1.81285)	Top-1 acc 32.812 (31.389)	Top-5 acc 58.203 (55.122)	lr 0.02493
Train [5][330/3239]	Time 0.576 (0.882)	Data Time 0.001 (0.049)	Loss 3.8096 (3.9748)	Entropy 1.81060 (1.81278)	Top-1 acc 37.891 (31.392)	Top-5 acc 60.156 (55.157)	lr 0.02493
Train [5][340/3239]	Time 0.603 (0.879)	Data Time 0.001 (0.048)	Loss 4.0142 (3.9741)	Entropy 1.81052 (1.81272)	Top-1 acc 33.203 (31.387)	Top-5 acc 56.641 (55.147)	lr 0.02493
Train [5][350/3239]	Time 0.485 (0.876)	Data Time 0.001 (0.046)	Loss 3.8839 (3.9731)	Entropy 1.81035 (1.81266)	Top-1 acc 30.078 (31.406)	Top-5 acc 55.469 (55.152)	lr 0.02493
Train [5][360/3239]	Time 0.589 (0.873)	Data Time 0.001 (0.045)	Loss 4.0255 (3.9736)	Entropy 1.81020 (1.81259)	Top-1 acc 28.516 (31.419)	Top-5 acc 55.078 (55.140)	lr 0.02493
Train [5][370/3239]	Time 0.467 (0.870)	Data Time 0.001 (0.044)	Loss 4.0619 (3.9728)	Entropy 1.81010 (1.81253)	Top-1 acc 33.203 (31.413)	Top-5 acc 49.219 (55.143)	lr 0.02493
Train [5][380/3239]	Time 0.516 (0.869)	Data Time 0.001 (0.043)	Loss 3.8880 (3.9732)	Entropy 1.81004 (1.81246)	Top-1 acc 31.641 (31.407)	Top-5 acc 56.641 (55.151)	lr 0.02493
Train [5][390/3239]	Time 0.564 (0.867)	Data Time 0.001 (0.042)	Loss 3.8037 (3.9731)	Entropy 1.81005 (1.81240)	Top-1 acc 36.719 (31.423)	Top-5 acc 60.156 (55.141)	lr 0.02493
Train [5][400/3239]	Time 0.522 (0.865)	Data Time 0.001 (0.041)	Loss 4.0424 (3.9744)	Entropy 1.80993 (1.81234)	Top-1 acc 32.422 (31.386)	Top-5 acc 56.641 (55.137)	lr 0.02493
Train [5][410/3239]	Time 0.522 (0.863)	Data Time 0.001 (0.040)	Loss 3.9912 (3.9749)	Entropy 1.80976 (1.81228)	Top-1 acc 30.859 (31.398)	Top-5 acc 54.688 (55.132)	lr 0.02493
Train [5][420/3239]	Time 0.533 (0.861)	Data Time 0.001 (0.039)	Loss 3.8683 (3.9747)	Entropy 1.80970 (1.81222)	Top-1 acc 32.031 (31.391)	Top-5 acc 53.125 (55.116)	lr 0.02493
Train [5][430/3239]	Time 0.558 (0.860)	Data Time 0.001 (0.038)	Loss 3.8895 (3.9740)	Entropy 1.80966 (1.81216)	Top-1 acc 32.031 (31.392)	Top-5 acc 55.469 (55.116)	lr 0.02493
Train [5][440/3239]	Time 0.418 (0.858)	Data Time 0.001 (0.037)	Loss 4.0923 (3.9727)	Entropy 1.80948 (1.81210)	Top-1 acc 27.344 (31.418)	Top-5 acc 49.609 (55.129)	lr 0.02493
Train [5][450/3239]	Time 0.606 (0.856)	Data Time 0.001 (0.037)	Loss 3.8051 (3.9729)	Entropy 1.80910 (1.81204)	Top-1 acc 38.672 (31.421)	Top-5 acc 58.984 (55.095)	lr 0.02493
Train [5][460/3239]	Time 0.487 (0.853)	Data Time 0.001 (0.036)	Loss 4.1814 (3.9758)	Entropy 1.80900 (1.81198)	Top-1 acc 26.172 (31.374)	Top-5 acc 45.312 (55.041)	lr 0.02493
Train [5][470/3239]	Time 0.446 (0.851)	Data Time 0.001 (0.035)	Loss 4.0285 (3.9750)	Entropy 1.80883 (1.81191)	Top-1 acc 30.469 (31.405)	Top-5 acc 51.172 (55.079)	lr 0.02493
Train [5][480/3239]	Time 0.520 (0.849)	Data Time 0.001 (0.035)	Loss 3.9327 (3.9756)	Entropy 1.80876 (1.81185)	Top-1 acc 26.953 (31.389)	Top-5 acc 56.641 (55.061)	lr 0.02493
Train [5][490/3239]	Time 0.530 (0.848)	Data Time 0.001 (0.034)	Loss 3.8613 (3.9751)	Entropy 1.80875 (1.81179)	Top-1 acc 36.719 (31.392)	Top-5 acc 57.422 (55.056)	lr 0.02493
Train [5][500/3239]	Time 0.610 (0.847)	Data Time 0.001 (0.033)	Loss 3.8773 (3.9753)	Entropy 1.80853 (1.81172)	Top-1 acc 33.594 (31.390)	Top-5 acc 58.203 (55.048)	lr 0.02493
Train [5][510/3239]	Time 0.514 (0.846)	Data Time 0.001 (0.033)	Loss 4.1047 (3.9757)	Entropy 1.80831 (1.81166)	Top-1 acc 30.859 (31.383)	Top-5 acc 51.172 (55.032)	lr 0.02493
Train [5][520/3239]	Time 0.536 (0.844)	Data Time 0.001 (0.032)	Loss 3.9807 (3.9750)	Entropy 1.80808 (1.81159)	Top-1 acc 29.297 (31.409)	Top-5 acc 55.469 (55.044)	lr 0.02493
Train [5][530/3239]	Time 0.518 (0.843)	Data Time 0.001 (0.031)	Loss 3.9810 (3.9759)	Entropy 1.80799 (1.81153)	Top-1 acc 30.469 (31.396)	Top-5 acc 54.688 (55.012)	lr 0.02493
Train [5][540/3239]	Time 0.528 (0.842)	Data Time 0.001 (0.031)	Loss 4.1560 (3.9753)	Entropy 1.80777 (1.81146)	Top-1 acc 26.172 (31.399)	Top-5 acc 54.297 (55.034)	lr 0.02493
Train [5][550/3239]	Time 0.570 (0.841)	Data Time 0.002 (0.030)	Loss 3.9280 (3.9751)	Entropy 1.80757 (1.81139)	Top-1 acc 32.812 (31.422)	Top-5 acc 54.297 (55.037)	lr 0.02493
Train [5][560/3239]	Time 0.538 (0.840)	Data Time 0.001 (0.030)	Loss 4.1156 (3.9754)	Entropy 1.80740 (1.81132)	Top-1 acc 28.516 (31.416)	Top-5 acc 51.562 (55.036)	lr 0.02493
Train [5][570/3239]	Time 0.608 (0.839)	Data Time 0.001 (0.030)	Loss 3.8644 (3.9752)	Entropy 1.80724 (1.81125)	Top-1 acc 34.375 (31.431)	Top-5 acc 57.031 (55.033)	lr 0.02493
Train [5][580/3239]	Time 0.534 (0.838)	Data Time 0.001 (0.029)	Loss 3.9052 (3.9756)	Entropy 1.80720 (1.81119)	Top-1 acc 35.938 (31.436)	Top-5 acc 55.469 (55.012)	lr 0.02493
Train [5][590/3239]	Time 0.500 (0.837)	Data Time 0.001 (0.029)	Loss 4.0242 (3.9749)	Entropy 1.80709 (1.81112)	Top-1 acc 33.203 (31.458)	Top-5 acc 57.422 (55.017)	lr 0.02493
Train [5][600/3239]	Time 0.564 (0.837)	Data Time 0.001 (0.028)	Loss 3.7601 (3.9758)	Entropy 1.80683 (1.81105)	Top-1 acc 35.938 (31.451)	Top-5 acc 58.594 (55.004)	lr 0.02493
Train [5][610/3239]	Time 0.605 (0.837)	Data Time 0.001 (0.028)	Loss 4.0699 (3.9762)	Entropy 1.80673 (1.81098)	Top-1 acc 32.031 (31.453)	Top-5 acc 52.734 (54.991)	lr 0.02492
Train [5][620/3239]	Time 0.507 (0.835)	Data Time 0.001 (0.027)	Loss 3.9424 (3.9754)	Entropy 1.80657 (1.81091)	Top-1 acc 30.078 (31.453)	Top-5 acc 56.250 (55.034)	lr 0.02492
Train [5][630/3239]	Time 0.584 (0.834)	Data Time 0.002 (0.027)	Loss 4.1317 (3.9757)	Entropy 1.80649 (1.81084)	Top-1 acc 29.297 (31.442)	Top-5 acc 48.438 (55.021)	lr 0.02492
Train [5][640/3239]	Time 0.400 (0.833)	Data Time 0.002 (0.027)	Loss 4.0148 (3.9756)	Entropy 1.80631 (1.81077)	Top-1 acc 30.078 (31.456)	Top-5 acc 53.125 (55.032)	lr 0.02492
Train [5][650/3239]	Time 0.511 (0.832)	Data Time 0.001 (0.026)	Loss 4.1226 (3.9754)	Entropy 1.80627 (1.81070)	Top-1 acc 30.469 (31.452)	Top-5 acc 51.562 (55.028)	lr 0.02492
Train [5][660/3239]	Time 0.504 (0.830)	Data Time 0.001 (0.026)	Loss 3.9228 (3.9751)	Entropy 1.80597 (1.81063)	Top-1 acc 32.031 (31.447)	Top-5 acc 58.984 (55.054)	lr 0.02492
Train [5][670/3239]	Time 0.539 (0.829)	Data Time 0.001 (0.026)	Loss 4.1233 (3.9749)	Entropy 1.80589 (1.81056)	Top-1 acc 30.078 (31.446)	Top-5 acc 52.734 (55.072)	lr 0.02492
Train [5][680/3239]	Time 0.562 (0.829)	Data Time 0.001 (0.025)	Loss 3.9765 (3.9743)	Entropy 1.80580 (1.81049)	Top-1 acc 30.469 (31.466)	Top-5 acc 57.422 (55.099)	lr 0.02492
Train [5][690/3239]	Time 0.566 (0.828)	Data Time 0.001 (0.025)	Loss 4.0594 (3.9745)	Entropy 1.80552 (1.81042)	Top-1 acc 29.688 (31.446)	Top-5 acc 54.297 (55.080)	lr 0.02492
Train [5][700/3239]	Time 0.587 (0.827)	Data Time 0.001 (0.025)	Loss 4.1379 (3.9740)	Entropy 1.80538 (1.81035)	Top-1 acc 28.125 (31.438)	Top-5 acc 53.516 (55.102)	lr 0.02492
Train [5][710/3239]	Time 0.584 (0.827)	Data Time 0.002 (0.024)	Loss 3.8766 (3.9736)	Entropy 1.80520 (1.81028)	Top-1 acc 30.469 (31.437)	Top-5 acc 55.469 (55.103)	lr 0.02492
Train [5][720/3239]	Time 0.553 (0.826)	Data Time 0.001 (0.024)	Loss 3.9610 (3.9740)	Entropy 1.80509 (1.81021)	Top-1 acc 33.203 (31.435)	Top-5 acc 55.078 (55.090)	lr 0.02492
Train [5][730/3239]	Time 0.630 (0.825)	Data Time 0.002 (0.024)	Loss 4.2941 (3.9747)	Entropy 1.80495 (1.81014)	Top-1 acc 28.125 (31.417)	Top-5 acc 47.266 (55.077)	lr 0.02492
Train [5][740/3239]	Time 0.545 (0.825)	Data Time 0.001 (0.023)	Loss 3.9271 (3.9738)	Entropy 1.80475 (1.81007)	Top-1 acc 30.469 (31.425)	Top-5 acc 56.641 (55.100)	lr 0.02492
Train [5][750/3239]	Time 0.610 (0.824)	Data Time 0.001 (0.023)	Loss 3.9972 (3.9733)	Entropy 1.80442 (1.81000)	Top-1 acc 31.250 (31.435)	Top-5 acc 54.688 (55.116)	lr 0.02492
Train [5][760/3239]	Time 0.589 (0.824)	Data Time 0.001 (0.023)	Loss 4.1932 (3.9734)	Entropy 1.80423 (1.80992)	Top-1 acc 28.516 (31.426)	Top-5 acc 49.219 (55.114)	lr 0.02492
Train [5][770/3239]	Time 0.510 (0.845)	Data Time 0.002 (0.023)	Loss 3.9602 (3.9737)	Entropy 1.80413 (1.80985)	Top-1 acc 30.469 (31.420)	Top-5 acc 57.422 (55.113)	lr 0.02492
Train [5][780/3239]	Time 0.470 (0.844)	Data Time 0.001 (0.022)	Loss 4.1026 (3.9729)	Entropy 1.80408 (1.80978)	Top-1 acc 29.297 (31.439)	Top-5 acc 50.391 (55.127)	lr 0.02492
Train [5][790/3239]	Time 0.581 (0.843)	Data Time 0.001 (0.022)	Loss 3.9181 (3.9718)	Entropy 1.80371 (1.80970)	Top-1 acc 33.984 (31.460)	Top-5 acc 57.422 (55.163)	lr 0.02492
Train [5][800/3239]	Time 0.438 (0.841)	Data Time 0.002 (0.022)	Loss 4.1075 (3.9724)	Entropy 1.80368 (1.80963)	Top-1 acc 29.297 (31.440)	Top-5 acc 51.953 (55.140)	lr 0.02492
Train [5][810/3239]	Time 0.497 (0.840)	Data Time 0.001 (0.022)	Loss 3.8617 (3.9720)	Entropy 1.80365 (1.80955)	Top-1 acc 34.766 (31.451)	Top-5 acc 57.031 (55.153)	lr 0.02492
Train [5][820/3239]	Time 0.510 (0.840)	Data Time 0.001 (0.022)	Loss 4.0362 (3.9726)	Entropy 1.80354 (1.80948)	Top-1 acc 29.297 (31.443)	Top-5 acc 54.688 (55.144)	lr 0.02492
Train [5][830/3239]	Time 0.566 (0.839)	Data Time 0.001 (0.021)	Loss 3.7612 (3.9726)	Entropy 1.80343 (1.80941)	Top-1 acc 35.547 (31.451)	Top-5 acc 58.594 (55.147)	lr 0.02492
Train [5][840/3239]	Time 0.564 (0.839)	Data Time 0.001 (0.021)	Loss 4.0487 (3.9721)	Entropy 1.80329 (1.80934)	Top-1 acc 34.375 (31.457)	Top-5 acc 53.516 (55.178)	lr 0.02492
Train [5][850/3239]	Time 0.534 (0.838)	Data Time 0.001 (0.021)	Loss 4.1512 (3.9723)	Entropy 1.80329 (1.80927)	Top-1 acc 28.906 (31.455)	Top-5 acc 51.562 (55.187)	lr 0.02492
Train [5][860/3239]	Time 0.402 (0.838)	Data Time 0.001 (0.021)	Loss 4.0760 (3.9727)	Entropy 1.80322 (1.80920)	Top-1 acc 32.812 (31.448)	Top-5 acc 54.688 (55.182)	lr 0.02492
Train [5][870/3239]	Time 0.485 (0.837)	Data Time 0.001 (0.021)	Loss 3.8662 (3.9729)	Entropy 1.80297 (1.80913)	Top-1 acc 33.594 (31.441)	Top-5 acc 54.297 (55.170)	lr 0.02492
Train [5][880/3239]	Time 0.613 (0.837)	Data Time 0.001 (0.020)	Loss 3.6137 (3.9729)	Entropy 1.80274 (1.80906)	Top-1 acc 36.328 (31.441)	Top-5 acc 61.328 (55.165)	lr 0.02492
Train [5][890/3239]	Time 0.553 (0.836)	Data Time 0.001 (0.020)	Loss 4.0100 (3.9728)	Entropy 1.80262 (1.80898)	Top-1 acc 35.156 (31.451)	Top-5 acc 54.297 (55.167)	lr 0.02492
Train [5][900/3239]	Time 0.544 (0.835)	Data Time 0.001 (0.020)	Loss 3.7925 (3.9727)	Entropy 1.80252 (1.80891)	Top-1 acc 33.203 (31.453)	Top-5 acc 58.984 (55.163)	lr 0.02492
Train [5][910/3239]	Time 0.397 (0.835)	Data Time 0.001 (0.020)	Loss 3.8216 (3.9730)	Entropy 1.80227 (1.80884)	Top-1 acc 36.328 (31.446)	Top-5 acc 60.547 (55.157)	lr 0.02492
Train [5][920/3239]	Time 0.630 (0.834)	Data Time 0.001 (0.020)	Loss 4.0944 (3.9733)	Entropy 1.80213 (1.80877)	Top-1 acc 28.906 (31.432)	Top-5 acc 50.781 (55.145)	lr 0.02492
Train [5][930/3239]	Time 0.501 (0.834)	Data Time 0.001 (0.020)	Loss 3.7713 (3.9738)	Entropy 1.80212 (1.80870)	Top-1 acc 36.719 (31.420)	Top-5 acc 57.812 (55.135)	lr 0.02492
Train [5][940/3239]	Time 0.578 (0.833)	Data Time 0.001 (0.019)	Loss 4.0427 (3.9743)	Entropy 1.80180 (1.80863)	Top-1 acc 31.250 (31.418)	Top-5 acc 53.516 (55.118)	lr 0.02492
Train [5][950/3239]	Time 0.541 (0.833)	Data Time 0.001 (0.019)	Loss 4.3297 (3.9746)	Entropy 1.80175 (1.80856)	Top-1 acc 25.000 (31.411)	Top-5 acc 48.828 (55.114)	lr 0.02492
Train [5][960/3239]	Time 0.537 (0.832)	Data Time 0.001 (0.019)	Loss 4.0718 (3.9752)	Entropy 1.80167 (1.80848)	Top-1 acc 30.078 (31.402)	Top-5 acc 52.344 (55.091)	lr 0.02492
Train [5][970/3239]	Time 0.530 (0.832)	Data Time 0.001 (0.019)	Loss 4.0207 (3.9756)	Entropy 1.80156 (1.80841)	Top-1 acc 32.031 (31.394)	Top-5 acc 52.734 (55.085)	lr 0.02492
Train [5][980/3239]	Time 0.558 (0.831)	Data Time 0.001 (0.019)	Loss 3.7727 (3.9752)	Entropy 1.80143 (1.80834)	Top-1 acc 33.594 (31.398)	Top-5 acc 57.812 (55.102)	lr 0.02492
Train [5][990/3239]	Time 0.563 (0.830)	Data Time 0.002 (0.019)	Loss 3.9648 (3.9753)	Entropy 1.80127 (1.80827)	Top-1 acc 31.250 (31.400)	Top-5 acc 56.641 (55.096)	lr 0.02492
Train [5][1000/3239]	Time 0.542 (0.830)	Data Time 0.001 (0.018)	Loss 4.0689 (3.9752)	Entropy 1.80106 (1.80820)	Top-1 acc 31.641 (31.417)	Top-5 acc 54.297 (55.098)	lr 0.02492
Train [5][1010/3239]	Time 0.549 (0.829)	Data Time 0.001 (0.018)	Loss 3.9786 (3.9748)	Entropy 1.80103 (1.80813)	Top-1 acc 31.641 (31.422)	Top-5 acc 55.078 (55.111)	lr 0.02492
Train [5][1020/3239]	Time 0.546 (0.829)	Data Time 0.001 (0.018)	Loss 4.0375 (3.9742)	Entropy 1.80089 (1.80806)	Top-1 acc 30.859 (31.437)	Top-5 acc 56.250 (55.123)	lr 0.02492
Train [5][1030/3239]	Time 0.529 (0.828)	Data Time 0.001 (0.018)	Loss 3.9161 (3.9735)	Entropy 1.80070 (1.80799)	Top-1 acc 30.859 (31.444)	Top-5 acc 57.031 (55.131)	lr 0.02492
Train [5][1040/3239]	Time 0.405 (0.828)	Data Time 0.001 (0.018)	Loss 3.8847 (3.9730)	Entropy 1.80060 (1.80792)	Top-1 acc 32.422 (31.458)	Top-5 acc 55.078 (55.134)	lr 0.02492
Train [5][1050/3239]	Time 0.500 (0.828)	Data Time 0.001 (0.018)	Loss 4.0533 (3.9733)	Entropy 1.80048 (1.80785)	Top-1 acc 28.516 (31.444)	Top-5 acc 51.172 (55.123)	lr 0.02492
Train [5][1060/3239]	Time 0.611 (0.827)	Data Time 0.001 (0.018)	Loss 3.9731 (3.9734)	Entropy 1.80026 (1.80778)	Top-1 acc 25.000 (31.437)	Top-5 acc 55.469 (55.122)	lr 0.02492
Train [5][1070/3239]	Time 0.563 (0.827)	Data Time 0.001 (0.017)	Loss 4.0446 (3.9730)	Entropy 1.80019 (1.80771)	Top-1 acc 30.078 (31.448)	Top-5 acc 53.906 (55.123)	lr 0.02492
Train [5][1080/3239]	Time 0.529 (0.827)	Data Time 0.001 (0.017)	Loss 3.9688 (3.9727)	Entropy 1.79993 (1.80764)	Top-1 acc 31.641 (31.450)	Top-5 acc 55.078 (55.132)	lr 0.02492
Train [5][1090/3239]	Time 0.508 (0.826)	Data Time 0.001 (0.017)	Loss 3.8977 (3.9723)	Entropy 1.79973 (1.80757)	Top-1 acc 32.812 (31.459)	Top-5 acc 54.297 (55.143)	lr 0.02492
Train [5][1100/3239]	Time 0.516 (0.826)	Data Time 0.001 (0.017)	Loss 4.0620 (3.9718)	Entropy 1.79958 (1.80750)	Top-1 acc 33.984 (31.471)	Top-5 acc 53.906 (55.154)	lr 0.02492
Train [5][1110/3239]	Time 0.530 (0.826)	Data Time 0.001 (0.017)	Loss 3.8604 (3.9718)	Entropy 1.79951 (1.80743)	Top-1 acc 33.203 (31.464)	Top-5 acc 57.031 (55.147)	lr 0.02492
Train [5][1120/3239]	Time 0.573 (0.825)	Data Time 0.001 (0.017)	Loss 4.1261 (3.9721)	Entropy 1.79930 (1.80735)	Top-1 acc 31.641 (31.464)	Top-5 acc 51.562 (55.144)	lr 0.02492
Train [5][1130/3239]	Time 0.228 (0.825)	Data Time 0.001 (0.017)	Loss 3.9570 (3.9725)	Entropy 1.79906 (1.80728)	Top-1 acc 31.641 (31.459)	Top-5 acc 55.078 (55.132)	lr 0.02492
Train [5][1140/3239]	Time 0.539 (0.824)	Data Time 0.001 (0.017)	Loss 3.7893 (3.9728)	Entropy 1.79890 (1.80721)	Top-1 acc 33.203 (31.456)	Top-5 acc 59.766 (55.127)	lr 0.02492
Train [5][1150/3239]	Time 0.524 (0.824)	Data Time 0.001 (0.016)	Loss 3.8710 (3.9728)	Entropy 1.79877 (1.80714)	Top-1 acc 34.766 (31.455)	Top-5 acc 56.250 (55.133)	lr 0.02492
Train [5][1160/3239]	Time 0.467 (0.823)	Data Time 0.001 (0.016)	Loss 3.8416 (3.9728)	Entropy 1.79846 (1.80706)	Top-1 acc 35.938 (31.462)	Top-5 acc 58.203 (55.132)	lr 0.02492
Train [5][1170/3239]	Time 0.525 (0.822)	Data Time 0.001 (0.016)	Loss 4.2355 (3.9724)	Entropy 1.79830 (1.80699)	Top-1 acc 23.438 (31.468)	Top-5 acc 49.219 (55.138)	lr 0.02492
Train [5][1180/3239]	Time 0.534 (0.822)	Data Time 0.001 (0.016)	Loss 4.0312 (3.9719)	Entropy 1.79825 (1.80692)	Top-1 acc 28.906 (31.475)	Top-5 acc 54.688 (55.151)	lr 0.02492
Train [5][1190/3239]	Time 0.585 (0.822)	Data Time 0.001 (0.016)	Loss 3.9861 (3.9720)	Entropy 1.79804 (1.80684)	Top-1 acc 34.766 (31.477)	Top-5 acc 55.469 (55.152)	lr 0.02492
Train [5][1200/3239]	Time 0.549 (0.822)	Data Time 0.001 (0.016)	Loss 3.8879 (3.9718)	Entropy 1.79780 (1.80677)	Top-1 acc 30.859 (31.492)	Top-5 acc 55.859 (55.154)	lr 0.02492
Train [5][1210/3239]	Time 0.592 (0.822)	Data Time 0.001 (0.016)	Loss 3.8631 (3.9711)	Entropy 1.79763 (1.80669)	Top-1 acc 35.938 (31.505)	Top-5 acc 58.203 (55.164)	lr 0.02492
Train [5][1220/3239]	Time 0.535 (0.821)	Data Time 0.001 (0.016)	Loss 3.9454 (3.9708)	Entropy 1.79764 (1.80662)	Top-1 acc 30.469 (31.504)	Top-5 acc 57.422 (55.171)	lr 0.02492
Train [5][1230/3239]	Time 0.568 (0.821)	Data Time 0.001 (0.016)	Loss 3.9409 (3.9713)	Entropy 1.79736 (1.80655)	Top-1 acc 32.031 (31.497)	Top-5 acc 55.469 (55.157)	lr 0.02492
Train [5][1240/3239]	Time 0.479 (0.821)	Data Time 0.001 (0.015)	Loss 4.1222 (3.9714)	Entropy 1.79737 (1.80647)	Top-1 acc 29.297 (31.490)	Top-5 acc 57.812 (55.159)	lr 0.02492
Train [5][1250/3239]	Time 0.634 (0.821)	Data Time 0.001 (0.015)	Loss 4.0333 (3.9715)	Entropy 1.79722 (1.80640)	Top-1 acc 30.078 (31.483)	Top-5 acc 54.297 (55.157)	lr 0.02492
Train [5][1260/3239]	Time 0.528 (0.821)	Data Time 0.001 (0.015)	Loss 4.1530 (3.9714)	Entropy 1.79705 (1.80633)	Top-1 acc 28.516 (31.496)	Top-5 acc 51.172 (55.165)	lr 0.02492
Train [5][1270/3239]	Time 0.568 (0.820)	Data Time 0.001 (0.015)	Loss 4.0266 (3.9716)	Entropy 1.79694 (1.80625)	Top-1 acc 34.375 (31.496)	Top-5 acc 54.688 (55.162)	lr 0.02492
Train [5][1280/3239]	Time 0.549 (0.820)	Data Time 0.001 (0.015)	Loss 3.6962 (3.9712)	Entropy 1.79686 (1.80618)	Top-1 acc 37.109 (31.509)	Top-5 acc 61.719 (55.162)	lr 0.02492
Train [5][1290/3239]	Time 0.418 (0.820)	Data Time 0.001 (0.015)	Loss 4.1088 (3.9712)	Entropy 1.79675 (1.80611)	Top-1 acc 29.688 (31.494)	Top-5 acc 50.391 (55.153)	lr 0.02492
Train [5][1300/3239]	Time 0.628 (0.820)	Data Time 0.001 (0.015)	Loss 3.9377 (3.9709)	Entropy 1.79672 (1.80603)	Top-1 acc 31.641 (31.495)	Top-5 acc 53.516 (55.161)	lr 0.02492
Train [5][1310/3239]	Time 0.464 (0.820)	Data Time 0.001 (0.015)	Loss 4.1454 (3.9710)	Entropy 1.79653 (1.80596)	Top-1 acc 28.125 (31.501)	Top-5 acc 53.906 (55.161)	lr 0.02492
Train [5][1320/3239]	Time 0.531 (0.819)	Data Time 0.001 (0.015)	Loss 3.8984 (3.9712)	Entropy 1.79643 (1.80589)	Top-1 acc 33.984 (31.498)	Top-5 acc 54.688 (55.154)	lr 0.02492
Train [5][1330/3239]	Time 0.539 (0.819)	Data Time 0.001 (0.015)	Loss 3.8803 (3.9712)	Entropy 1.79638 (1.80582)	Top-1 acc 32.422 (31.499)	Top-5 acc 60.156 (55.153)	lr 0.02492
Train [5][1340/3239]	Time 0.437 (0.818)	Data Time 0.001 (0.015)	Loss 4.0436 (3.9714)	Entropy 1.79637 (1.80575)	Top-1 acc 32.422 (31.484)	Top-5 acc 54.297 (55.149)	lr 0.02492
Train [5][1350/3239]	Time 0.567 (0.818)	Data Time 0.001 (0.014)	Loss 4.0543 (3.9713)	Entropy 1.79620 (1.80568)	Top-1 acc 29.297 (31.483)	Top-5 acc 50.000 (55.142)	lr 0.02492
Train [5][1360/3239]	Time 0.635 (0.818)	Data Time 0.001 (0.014)	Loss 4.1894 (3.9713)	Entropy 1.79609 (1.80561)	Top-1 acc 25.391 (31.485)	Top-5 acc 50.000 (55.136)	lr 0.02492
Train [5][1370/3239]	Time 0.543 (0.817)	Data Time 0.002 (0.014)	Loss 3.8538 (3.9709)	Entropy 1.79589 (1.80554)	Top-1 acc 38.672 (31.485)	Top-5 acc 60.938 (55.148)	lr 0.02492
Train [5][1380/3239]	Time 0.461 (0.817)	Data Time 0.001 (0.014)	Loss 3.9850 (3.9714)	Entropy 1.79582 (1.80547)	Top-1 acc 32.422 (31.480)	Top-5 acc 56.250 (55.141)	lr 0.02492
Train [5][1390/3239]	Time 0.567 (0.817)	Data Time 0.001 (0.014)	Loss 3.8907 (3.9714)	Entropy 1.79539 (1.80540)	Top-1 acc 30.469 (31.474)	Top-5 acc 57.812 (55.145)	lr 0.02492
Train [5][1400/3239]	Time 0.556 (0.816)	Data Time 0.001 (0.014)	Loss 3.9524 (3.9716)	Entropy 1.79523 (1.80533)	Top-1 acc 28.516 (31.461)	Top-5 acc 55.078 (55.137)	lr 0.02492
Train [5][1410/3239]	Time 0.648 (0.816)	Data Time 0.001 (0.014)	Loss 4.3289 (3.9712)	Entropy 1.79498 (1.80526)	Top-1 acc 29.688 (31.470)	Top-5 acc 48.828 (55.153)	lr 0.02492
Train [5][1420/3239]	Time 0.697 (0.827)	Data Time 0.007 (0.014)	Loss 4.0189 (3.9712)	Entropy 1.79482 (1.80518)	Top-1 acc 27.344 (31.464)	Top-5 acc 51.172 (55.147)	lr 0.02492
Train [5][1430/3239]	Time 0.550 (0.827)	Data Time 0.002 (0.014)	Loss 4.0778 (3.9714)	Entropy 1.79463 (1.80511)	Top-1 acc 29.297 (31.469)	Top-5 acc 53.516 (55.150)	lr 0.02492
Train [5][1440/3239]	Time 0.551 (0.827)	Data Time 0.001 (0.014)	Loss 4.2414 (3.9717)	Entropy 1.79437 (1.80504)	Top-1 acc 26.562 (31.463)	Top-5 acc 49.219 (55.142)	lr 0.02492
Train [5][1450/3239]	Time 0.562 (0.827)	Data Time 0.002 (0.014)	Loss 3.9752 (3.9719)	Entropy 1.79437 (1.80496)	Top-1 acc 32.031 (31.463)	Top-5 acc 56.250 (55.142)	lr 0.02492
Train [5][1460/3239]	Time 0.545 (0.827)	Data Time 0.001 (0.014)	Loss 3.9624 (3.9718)	Entropy 1.79435 (1.80489)	Top-1 acc 32.422 (31.468)	Top-5 acc 55.859 (55.144)	lr 0.02492
Train [5][1470/3239]	Time 0.639 (0.826)	Data Time 0.001 (0.014)	Loss 3.8938 (3.9720)	Entropy 1.79410 (1.80482)	Top-1 acc 29.688 (31.464)	Top-5 acc 55.469 (55.138)	lr 0.02492
Train [5][1480/3239]	Time 0.483 (0.826)	Data Time 0.001 (0.013)	Loss 3.9706 (3.9719)	Entropy 1.79413 (1.80475)	Top-1 acc 30.859 (31.467)	Top-5 acc 54.688 (55.139)	lr 0.02492
Train [5][1490/3239]	Time 0.476 (0.825)	Data Time 0.001 (0.013)	Loss 3.8295 (3.9718)	Entropy 1.79422 (1.80468)	Top-1 acc 34.375 (31.475)	Top-5 acc 59.766 (55.148)	lr 0.02491
Train [5][1500/3239]	Time 0.538 (0.825)	Data Time 0.001 (0.013)	Loss 3.7867 (3.9719)	Entropy 1.79416 (1.80461)	Top-1 acc 33.203 (31.465)	Top-5 acc 56.250 (55.148)	lr 0.02491
Train [5][1510/3239]	Time 0.591 (0.825)	Data Time 0.001 (0.013)	Loss 4.1021 (3.9719)	Entropy 1.79410 (1.80454)	Top-1 acc 33.984 (31.473)	Top-5 acc 53.125 (55.148)	lr 0.02491
Train [5][1520/3239]	Time 0.510 (0.824)	Data Time 0.001 (0.013)	Loss 4.0185 (3.9720)	Entropy 1.79398 (1.80447)	Top-1 acc 28.516 (31.477)	Top-5 acc 52.344 (55.145)	lr 0.02491
Train [5][1530/3239]	Time 0.557 (0.824)	Data Time 0.001 (0.013)	Loss 4.0767 (3.9721)	Entropy 1.79388 (1.80440)	Top-1 acc 26.953 (31.474)	Top-5 acc 51.953 (55.142)	lr 0.02491
Train [5][1540/3239]	Time 0.532 (0.824)	Data Time 0.001 (0.013)	Loss 4.0538 (3.9722)	Entropy 1.79368 (1.80433)	Top-1 acc 28.516 (31.476)	Top-5 acc 54.688 (55.142)	lr 0.02491
Train [5][1550/3239]	Time 0.589 (0.824)	Data Time 0.001 (0.013)	Loss 3.9304 (3.9723)	Entropy 1.79357 (1.80426)	Top-1 acc 32.031 (31.475)	Top-5 acc 53.906 (55.143)	lr 0.02491
Train [5][1560/3239]	Time 0.668 (0.823)	Data Time 0.001 (0.013)	Loss 3.9742 (3.9720)	Entropy 1.79328 (1.80419)	Top-1 acc 30.859 (31.474)	Top-5 acc 55.469 (55.147)	lr 0.02491
Train [5][1570/3239]	Time 0.487 (0.823)	Data Time 0.001 (0.013)	Loss 3.8441 (3.9719)	Entropy 1.79327 (1.80412)	Top-1 acc 33.203 (31.482)	Top-5 acc 56.641 (55.147)	lr 0.02491
Train [5][1580/3239]	Time 0.541 (0.823)	Data Time 0.001 (0.013)	Loss 3.9848 (3.9717)	Entropy 1.79319 (1.80405)	Top-1 acc 28.125 (31.487)	Top-5 acc 52.344 (55.152)	lr 0.02491
Train [5][1590/3239]	Time 0.614 (0.823)	Data Time 0.001 (0.013)	Loss 3.8453 (3.9719)	Entropy 1.79290 (1.80398)	Top-1 acc 33.203 (31.488)	Top-5 acc 59.375 (55.151)	lr 0.02491
Train [5][1600/3239]	Time 0.512 (0.823)	Data Time 0.001 (0.013)	Loss 4.0130 (3.9720)	Entropy 1.79289 (1.80392)	Top-1 acc 29.688 (31.481)	Top-5 acc 54.297 (55.151)	lr 0.02491
Train [5][1610/3239]	Time 0.635 (0.823)	Data Time 0.001 (0.013)	Loss 3.8244 (3.9719)	Entropy 1.79282 (1.80385)	Top-1 acc 33.203 (31.486)	Top-5 acc 59.766 (55.151)	lr 0.02491
Train [5][1620/3239]	Time 0.428 (0.822)	Data Time 0.001 (0.013)	Loss 4.0037 (3.9722)	Entropy 1.79269 (1.80378)	Top-1 acc 32.422 (31.482)	Top-5 acc 55.469 (55.149)	lr 0.02491
Train [5][1630/3239]	Time 0.552 (0.822)	Data Time 0.001 (0.013)	Loss 3.7864 (3.9720)	Entropy 1.79249 (1.80371)	Top-1 acc 33.594 (31.487)	Top-5 acc 58.594 (55.151)	lr 0.02491
Train [5][1640/3239]	Time 0.509 (0.822)	Data Time 0.001 (0.012)	Loss 4.0943 (3.9721)	Entropy 1.79238 (1.80364)	Top-1 acc 29.688 (31.488)	Top-5 acc 51.562 (55.152)	lr 0.02491
Train [5][1650/3239]	Time 0.532 (0.821)	Data Time 0.001 (0.012)	Loss 3.9675 (3.9722)	Entropy 1.79230 (1.80357)	Top-1 acc 30.469 (31.487)	Top-5 acc 55.469 (55.150)	lr 0.02491
Train [5][1660/3239]	Time 0.457 (0.821)	Data Time 0.001 (0.012)	Loss 3.7805 (3.9719)	Entropy 1.79203 (1.80350)	Top-1 acc 34.375 (31.494)	Top-5 acc 58.203 (55.154)	lr 0.02491
Train [5][1670/3239]	Time 0.511 (0.820)	Data Time 0.001 (0.012)	Loss 4.0873 (3.9717)	Entropy 1.79174 (1.80344)	Top-1 acc 30.078 (31.493)	Top-5 acc 49.219 (55.159)	lr 0.02491
Train [5][1680/3239]	Time 0.565 (0.820)	Data Time 0.001 (0.012)	Loss 3.6507 (3.9718)	Entropy 1.79160 (1.80337)	Top-1 acc 36.328 (31.488)	Top-5 acc 62.891 (55.159)	lr 0.02491
Train [5][1690/3239]	Time 0.398 (0.820)	Data Time 0.001 (0.012)	Loss 4.1084 (3.9718)	Entropy 1.79154 (1.80330)	Top-1 acc 31.641 (31.484)	Top-5 acc 55.078 (55.167)	lr 0.02491
Train [5][1700/3239]	Time 0.521 (0.820)	Data Time 0.001 (0.012)	Loss 3.9666 (3.9716)	Entropy 1.79132 (1.80323)	Top-1 acc 30.078 (31.491)	Top-5 acc 57.812 (55.174)	lr 0.02491
Train [5][1710/3239]	Time 0.506 (0.820)	Data Time 0.001 (0.012)	Loss 4.1757 (3.9715)	Entropy 1.79109 (1.80316)	Top-1 acc 26.172 (31.494)	Top-5 acc 51.172 (55.180)	lr 0.02491
Train [5][1720/3239]	Time 0.538 (0.820)	Data Time 0.001 (0.012)	Loss 3.9047 (3.9709)	Entropy 1.79102 (1.80309)	Top-1 acc 31.250 (31.509)	Top-5 acc 57.422 (55.194)	lr 0.02491
Train [5][1730/3239]	Time 0.552 (0.820)	Data Time 0.001 (0.012)	Loss 4.1724 (3.9712)	Entropy 1.79089 (1.80302)	Top-1 acc 30.859 (31.510)	Top-5 acc 50.000 (55.186)	lr 0.02491
Train [5][1740/3239]	Time 0.534 (0.819)	Data Time 0.001 (0.012)	Loss 3.8894 (3.9711)	Entropy 1.79075 (1.80295)	Top-1 acc 33.594 (31.504)	Top-5 acc 59.375 (55.187)	lr 0.02491
Train [5][1750/3239]	Time 0.470 (0.819)	Data Time 0.001 (0.012)	Loss 4.0236 (3.9713)	Entropy 1.79053 (1.80288)	Top-1 acc 27.344 (31.496)	Top-5 acc 57.422 (55.186)	lr 0.02491
Train [5][1760/3239]	Time 0.539 (0.819)	Data Time 0.001 (0.012)	Loss 3.9475 (3.9711)	Entropy 1.79041 (1.80281)	Top-1 acc 26.172 (31.496)	Top-5 acc 54.297 (55.189)	lr 0.02491
Train [5][1770/3239]	Time 0.587 (0.819)	Data Time 0.001 (0.012)	Loss 3.8093 (3.9711)	Entropy 1.79034 (1.80273)	Top-1 acc 32.422 (31.498)	Top-5 acc 58.203 (55.191)	lr 0.02491
Train [5][1780/3239]	Time 0.545 (0.819)	Data Time 0.001 (0.012)	Loss 3.8465 (3.9710)	Entropy 1.79023 (1.80267)	Top-1 acc 32.812 (31.503)	Top-5 acc 58.203 (55.192)	lr 0.02491
Train [5][1790/3239]	Time 0.521 (0.818)	Data Time 0.001 (0.012)	Loss 3.8154 (3.9706)	Entropy 1.79009 (1.80260)	Top-1 acc 38.672 (31.516)	Top-5 acc 58.203 (55.197)	lr 0.02491
Train [5][1800/3239]	Time 0.487 (0.818)	Data Time 0.001 (0.012)	Loss 3.9051 (3.9705)	Entropy 1.79004 (1.80253)	Top-1 acc 32.031 (31.510)	Top-5 acc 57.812 (55.194)	lr 0.02491
Train [5][1810/3239]	Time 0.537 (0.818)	Data Time 0.001 (0.012)	Loss 3.7154 (3.9705)	Entropy 1.79001 (1.80246)	Top-1 acc 39.844 (31.508)	Top-5 acc 61.328 (55.194)	lr 0.02491
Train [5][1820/3239]	Time 0.529 (0.818)	Data Time 0.001 (0.012)	Loss 3.7970 (3.9707)	Entropy 1.78984 (1.80239)	Top-1 acc 33.594 (31.510)	Top-5 acc 57.422 (55.186)	lr 0.02491
Train [5][1830/3239]	Time 0.645 (0.818)	Data Time 0.001 (0.011)	Loss 3.8262 (3.9707)	Entropy 1.78976 (1.80232)	Top-1 acc 35.547 (31.505)	Top-5 acc 59.766 (55.189)	lr 0.02491
Train [5][1840/3239]	Time 0.527 (0.817)	Data Time 0.001 (0.011)	Loss 3.8372 (3.9704)	Entropy 1.78965 (1.80225)	Top-1 acc 32.812 (31.519)	Top-5 acc 60.547 (55.192)	lr 0.02491
Train [5][1850/3239]	Time 0.494 (0.817)	Data Time 0.001 (0.011)	Loss 3.9060 (3.9702)	Entropy 1.78952 (1.80218)	Top-1 acc 34.375 (31.524)	Top-5 acc 53.516 (55.192)	lr 0.02491
Train [5][1860/3239]	Time 0.490 (0.817)	Data Time 0.001 (0.011)	Loss 3.7774 (3.9699)	Entropy 1.78942 (1.80211)	Top-1 acc 37.500 (31.531)	Top-5 acc 61.328 (55.201)	lr 0.02491
Train [5][1870/3239]	Time 0.610 (0.816)	Data Time 0.002 (0.011)	Loss 3.9091 (3.9698)	Entropy 1.78919 (1.80205)	Top-1 acc 33.594 (31.536)	Top-5 acc 58.203 (55.204)	lr 0.02491
Train [5][1880/3239]	Time 0.657 (0.816)	Data Time 0.001 (0.011)	Loss 3.9071 (3.9696)	Entropy 1.78911 (1.80198)	Top-1 acc 32.812 (31.542)	Top-5 acc 53.516 (55.208)	lr 0.02491
Train [5][1890/3239]	Time 0.480 (0.816)	Data Time 0.001 (0.011)	Loss 3.7884 (3.9692)	Entropy 1.78882 (1.80191)	Top-1 acc 38.672 (31.552)	Top-5 acc 57.812 (55.212)	lr 0.02491
Train [5][1900/3239]	Time 0.607 (0.816)	Data Time 0.002 (0.011)	Loss 4.1351 (3.9692)	Entropy 1.78864 (1.80184)	Top-1 acc 28.125 (31.548)	Top-5 acc 48.828 (55.213)	lr 0.02491
Train [5][1910/3239]	Time 0.572 (0.816)	Data Time 0.001 (0.011)	Loss 3.9710 (3.9694)	Entropy 1.78864 (1.80177)	Top-1 acc 32.422 (31.546)	Top-5 acc 56.641 (55.211)	lr 0.02491
Train [5][1920/3239]	Time 0.516 (0.815)	Data Time 0.001 (0.011)	Loss 4.0814 (3.9698)	Entropy 1.78855 (1.80170)	Top-1 acc 31.250 (31.539)	Top-5 acc 52.344 (55.203)	lr 0.02491
Train [5][1930/3239]	Time 0.521 (0.815)	Data Time 0.001 (0.011)	Loss 3.8675 (3.9698)	Entropy 1.78835 (1.80163)	Top-1 acc 32.031 (31.539)	Top-5 acc 57.031 (55.201)	lr 0.02491
Train [5][1940/3239]	Time 0.478 (0.815)	Data Time 0.001 (0.011)	Loss 4.0908 (3.9700)	Entropy 1.78821 (1.80156)	Top-1 acc 30.469 (31.535)	Top-5 acc 54.688 (55.198)	lr 0.02491
Train [5][1950/3239]	Time 0.582 (0.815)	Data Time 0.001 (0.011)	Loss 3.9325 (3.9697)	Entropy 1.78819 (1.80150)	Top-1 acc 32.812 (31.540)	Top-5 acc 55.859 (55.206)	lr 0.02491
Train [5][1960/3239]	Time 0.537 (0.815)	Data Time 0.001 (0.011)	Loss 4.0339 (3.9692)	Entropy 1.78803 (1.80143)	Top-1 acc 32.812 (31.551)	Top-5 acc 53.516 (55.220)	lr 0.02491
Train [5][1970/3239]	Time 0.563 (0.815)	Data Time 0.001 (0.011)	Loss 4.0878 (3.9689)	Entropy 1.78802 (1.80136)	Top-1 acc 29.297 (31.556)	Top-5 acc 51.953 (55.220)	lr 0.02491
Train [5][1980/3239]	Time 0.545 (0.815)	Data Time 0.001 (0.011)	Loss 3.9331 (3.9685)	Entropy 1.78786 (1.80129)	Top-1 acc 32.422 (31.566)	Top-5 acc 55.859 (55.229)	lr 0.02491
Train [5][1990/3239]	Time 0.601 (0.815)	Data Time 0.003 (0.011)	Loss 3.9239 (3.9684)	Entropy 1.78771 (1.80122)	Top-1 acc 30.469 (31.565)	Top-5 acc 53.906 (55.232)	lr 0.02491
Train [5][2000/3239]	Time 0.339 (0.814)	Data Time 0.001 (0.011)	Loss 3.8397 (3.9681)	Entropy 1.78761 (1.80116)	Top-1 acc 32.812 (31.567)	Top-5 acc 59.375 (55.245)	lr 0.02491
Train [5][2010/3239]	Time 0.517 (0.814)	Data Time 0.001 (0.011)	Loss 3.9447 (3.9678)	Entropy 1.78733 (1.80109)	Top-1 acc 29.297 (31.571)	Top-5 acc 55.469 (55.247)	lr 0.02491
Train [5][2020/3239]	Time 0.577 (0.814)	Data Time 0.001 (0.011)	Loss 3.9740 (3.9676)	Entropy 1.78730 (1.80102)	Top-1 acc 31.641 (31.576)	Top-5 acc 56.641 (55.258)	lr 0.02491
Train [5][2030/3239]	Time 0.254 (0.814)	Data Time 0.001 (0.011)	Loss 3.8379 (3.9676)	Entropy 1.78700 (1.80095)	Top-1 acc 36.719 (31.582)	Top-5 acc 55.859 (55.258)	lr 0.02491
Train [5][2040/3239]	Time 0.542 (0.814)	Data Time 0.001 (0.011)	Loss 4.0525 (3.9675)	Entropy 1.78685 (1.80088)	Top-1 acc 32.812 (31.591)	Top-5 acc 54.688 (55.262)	lr 0.02491
Train [5][2050/3239]	Time 0.554 (0.813)	Data Time 0.001 (0.011)	Loss 3.8022 (3.9676)	Entropy 1.78666 (1.80082)	Top-1 acc 37.109 (31.586)	Top-5 acc 59.375 (55.258)	lr 0.02491
Train [5][2060/3239]	Time 0.506 (0.813)	Data Time 0.002 (0.011)	Loss 3.8803 (3.9675)	Entropy 1.78656 (1.80075)	Top-1 acc 34.766 (31.589)	Top-5 acc 56.250 (55.263)	lr 0.02491
Train [5][2070/3239]	Time 0.519 (0.813)	Data Time 0.001 (0.011)	Loss 4.0693 (3.9672)	Entropy 1.78643 (1.80068)	Top-1 acc 28.906 (31.597)	Top-5 acc 55.078 (55.271)	lr 0.02491
Train [5][2080/3239]	Time 0.496 (0.821)	Data Time 0.002 (0.011)	Loss 4.2407 (3.9678)	Entropy 1.78626 (1.80061)	Top-1 acc 32.031 (31.587)	Top-5 acc 49.609 (55.259)	lr 0.02491
Train [5][2090/3239]	Time 0.530 (0.821)	Data Time 0.002 (0.011)	Loss 3.8637 (3.9675)	Entropy 1.78615 (1.80054)	Top-1 acc 33.984 (31.594)	Top-5 acc 58.594 (55.265)	lr 0.02491
Train [5][2100/3239]	Time 0.528 (0.821)	Data Time 0.001 (0.010)	Loss 3.8587 (3.9673)	Entropy 1.78591 (1.80047)	Top-1 acc 33.203 (31.597)	Top-5 acc 55.859 (55.271)	lr 0.02491
Train [5][2110/3239]	Time 0.499 (0.820)	Data Time 0.001 (0.010)	Loss 4.0281 (3.9676)	Entropy 1.78577 (1.80040)	Top-1 acc 30.859 (31.593)	Top-5 acc 52.344 (55.267)	lr 0.02491
Train [5][2120/3239]	Time 0.535 (0.820)	Data Time 0.001 (0.010)	Loss 3.8407 (3.9675)	Entropy 1.78552 (1.80033)	Top-1 acc 32.812 (31.588)	Top-5 acc 59.766 (55.271)	lr 0.02491
Train [5][2130/3239]	Time 0.624 (0.820)	Data Time 0.002 (0.010)	Loss 4.1628 (3.9678)	Entropy 1.78542 (1.80026)	Top-1 acc 26.562 (31.581)	Top-5 acc 48.828 (55.265)	lr 0.02491
Train [5][2140/3239]	Time 0.475 (0.820)	Data Time 0.002 (0.010)	Loss 4.0818 (3.9677)	Entropy 1.78531 (1.80019)	Top-1 acc 30.078 (31.588)	Top-5 acc 55.469 (55.266)	lr 0.02491
Train [5][2150/3239]	Time 0.554 (0.820)	Data Time 0.002 (0.010)	Loss 3.8903 (3.9677)	Entropy 1.78504 (1.80012)	Top-1 acc 36.328 (31.588)	Top-5 acc 56.641 (55.265)	lr 0.02491
Train [5][2160/3239]	Time 0.445 (0.820)	Data Time 0.001 (0.010)	Loss 3.8829 (3.9673)	Entropy 1.78489 (1.80005)	Top-1 acc 34.375 (31.595)	Top-5 acc 57.031 (55.275)	lr 0.02491
Train [5][2170/3239]	Time 0.575 (0.819)	Data Time 0.023 (0.010)	Loss 4.0183 (3.9674)	Entropy 1.78472 (1.79998)	Top-1 acc 32.031 (31.594)	Top-5 acc 55.469 (55.274)	lr 0.02491
Train [5][2180/3239]	Time 0.657 (0.819)	Data Time 0.002 (0.010)	Loss 3.8635 (3.9673)	Entropy 1.78474 (1.79991)	Top-1 acc 34.375 (31.600)	Top-5 acc 58.984 (55.277)	lr 0.02491
Train [5][2190/3239]	Time 0.550 (0.819)	Data Time 0.001 (0.010)	Loss 3.9301 (3.9675)	Entropy 1.78456 (1.79984)	Top-1 acc 30.469 (31.592)	Top-5 acc 54.688 (55.275)	lr 0.02491
Train [5][2200/3239]	Time 0.590 (0.818)	Data Time 0.001 (0.010)	Loss 3.9694 (3.9677)	Entropy 1.78438 (1.79977)	Top-1 acc 32.031 (31.591)	Top-5 acc 58.203 (55.274)	lr 0.02491
Train [5][2210/3239]	Time 0.486 (0.818)	Data Time 0.001 (0.010)	Loss 3.8188 (3.9678)	Entropy 1.78428 (1.79971)	Top-1 acc 36.328 (31.587)	Top-5 acc 58.984 (55.273)	lr 0.02491
Train [5][2220/3239]	Time 0.543 (0.818)	Data Time 0.001 (0.010)	Loss 4.1108 (3.9676)	Entropy 1.78412 (1.79964)	Top-1 acc 27.344 (31.590)	Top-5 acc 52.734 (55.275)	lr 0.02491
Train [5][2230/3239]	Time 0.621 (0.818)	Data Time 0.001 (0.010)	Loss 4.1017 (3.9676)	Entropy 1.78398 (1.79957)	Top-1 acc 26.172 (31.592)	Top-5 acc 54.297 (55.279)	lr 0.02491
Train [5][2240/3239]	Time 0.567 (0.818)	Data Time 0.001 (0.010)	Loss 3.8839 (3.9672)	Entropy 1.78378 (1.79950)	Top-1 acc 33.594 (31.600)	Top-5 acc 59.766 (55.286)	lr 0.02491
Train [5][2250/3239]	Time 0.576 (0.818)	Data Time 0.001 (0.010)	Loss 3.9043 (3.9671)	Entropy 1.78361 (1.79943)	Top-1 acc 30.469 (31.605)	Top-5 acc 57.422 (55.284)	lr 0.02491
Train [5][2260/3239]	Time 0.460 (0.818)	Data Time 0.001 (0.010)	Loss 4.0478 (3.9672)	Entropy 1.78351 (1.79936)	Top-1 acc 30.078 (31.602)	Top-5 acc 51.953 (55.278)	lr 0.02491
Train [5][2270/3239]	Time 0.568 (0.818)	Data Time 0.001 (0.010)	Loss 4.1124 (3.9672)	Entropy 1.78342 (1.79929)	Top-1 acc 28.906 (31.602)	Top-5 acc 55.078 (55.279)	lr 0.02491
Train [5][2280/3239]	Time 0.547 (0.818)	Data Time 0.001 (0.010)	Loss 3.9046 (3.9670)	Entropy 1.78310 (1.79922)	Top-1 acc 30.859 (31.605)	Top-5 acc 54.688 (55.282)	lr 0.02491
Train [5][2290/3239]	Time 0.530 (0.817)	Data Time 0.001 (0.010)	Loss 3.9123 (3.9668)	Entropy 1.78276 (1.79914)	Top-1 acc 32.031 (31.610)	Top-5 acc 54.297 (55.288)	lr 0.02491
Train [5][2300/3239]	Time 0.551 (0.817)	Data Time 0.001 (0.010)	Loss 3.7744 (3.9667)	Entropy 1.78274 (1.79907)	Top-1 acc 35.938 (31.609)	Top-5 acc 60.156 (55.289)	lr 0.02491
Train [5][2310/3239]	Time 0.569 (0.817)	Data Time 0.001 (0.010)	Loss 3.9797 (3.9667)	Entropy 1.78266 (1.79900)	Top-1 acc 29.297 (31.606)	Top-5 acc 54.688 (55.293)	lr 0.02490
Train [5][2320/3239]	Time 0.518 (0.817)	Data Time 0.001 (0.010)	Loss 4.0246 (3.9671)	Entropy 1.78230 (1.79893)	Top-1 acc 32.031 (31.604)	Top-5 acc 55.078 (55.288)	lr 0.02490
Train [5][2330/3239]	Time 0.505 (0.817)	Data Time 0.001 (0.010)	Loss 3.9747 (3.9671)	Entropy 1.78221 (1.79886)	Top-1 acc 31.641 (31.606)	Top-5 acc 54.688 (55.288)	lr 0.02490
Train [5][2340/3239]	Time 0.499 (0.817)	Data Time 0.001 (0.010)	Loss 3.9376 (3.9670)	Entropy 1.78215 (1.79879)	Top-1 acc 33.203 (31.610)	Top-5 acc 58.594 (55.294)	lr 0.02490
Train [5][2350/3239]	Time 0.587 (0.817)	Data Time 0.001 (0.010)	Loss 4.0967 (3.9672)	Entropy 1.78200 (1.79872)	Top-1 acc 27.344 (31.605)	Top-5 acc 52.734 (55.295)	lr 0.02490
Train [5][2360/3239]	Time 0.421 (0.816)	Data Time 0.001 (0.010)	Loss 4.1907 (3.9673)	Entropy 1.78193 (1.79865)	Top-1 acc 28.516 (31.602)	Top-5 acc 51.562 (55.293)	lr 0.02490
Train [5][2370/3239]	Time 0.497 (0.816)	Data Time 0.001 (0.010)	Loss 4.0624 (3.9673)	Entropy 1.78174 (1.79858)	Top-1 acc 30.078 (31.605)	Top-5 acc 51.172 (55.297)	lr 0.02490
Train [5][2380/3239]	Time 0.528 (0.816)	Data Time 0.001 (0.010)	Loss 4.0181 (3.9672)	Entropy 1.78151 (1.79851)	Top-1 acc 29.297 (31.603)	Top-5 acc 53.125 (55.301)	lr 0.02490
Train [5][2390/3239]	Time 0.592 (0.816)	Data Time 0.001 (0.010)	Loss 4.0178 (3.9672)	Entropy 1.78147 (1.79843)	Top-1 acc 32.812 (31.598)	Top-5 acc 53.906 (55.298)	lr 0.02490
Train [5][2400/3239]	Time 0.640 (0.816)	Data Time 0.001 (0.010)	Loss 3.9884 (3.9669)	Entropy 1.78129 (1.79836)	Top-1 acc 32.812 (31.606)	Top-5 acc 57.812 (55.305)	lr 0.02490
Train [5][2410/3239]	Time 0.519 (0.816)	Data Time 0.001 (0.010)	Loss 3.9621 (3.9667)	Entropy 1.78116 (1.79829)	Top-1 acc 33.594 (31.612)	Top-5 acc 54.688 (55.311)	lr 0.02490
Train [5][2420/3239]	Time 0.548 (0.816)	Data Time 0.001 (0.009)	Loss 3.8998 (3.9665)	Entropy 1.78091 (1.79822)	Top-1 acc 29.688 (31.613)	Top-5 acc 59.375 (55.317)	lr 0.02490
Train [5][2430/3239]	Time 0.393 (0.816)	Data Time 0.001 (0.009)	Loss 3.8102 (3.9665)	Entropy 1.78070 (1.79815)	Top-1 acc 35.938 (31.611)	Top-5 acc 58.203 (55.313)	lr 0.02490
Train [5][2440/3239]	Time 0.538 (0.816)	Data Time 0.001 (0.009)	Loss 3.7531 (3.9663)	Entropy 1.78044 (1.79808)	Top-1 acc 33.984 (31.612)	Top-5 acc 59.766 (55.321)	lr 0.02490
Train [5][2450/3239]	Time 0.624 (0.816)	Data Time 0.001 (0.009)	Loss 3.9222 (3.9664)	Entropy 1.78031 (1.79801)	Top-1 acc 32.422 (31.610)	Top-5 acc 51.953 (55.318)	lr 0.02490
Train [5][2460/3239]	Time 0.542 (0.815)	Data Time 0.002 (0.009)	Loss 3.8263 (3.9664)	Entropy 1.78018 (1.79793)	Top-1 acc 31.641 (31.607)	Top-5 acc 55.859 (55.314)	lr 0.02490
Train [5][2470/3239]	Time 0.553 (0.815)	Data Time 0.001 (0.009)	Loss 3.9885 (3.9663)	Entropy 1.77988 (1.79786)	Top-1 acc 32.812 (31.613)	Top-5 acc 56.250 (55.318)	lr 0.02490
Train [5][2480/3239]	Time 0.530 (0.815)	Data Time 0.001 (0.009)	Loss 3.9905 (3.9661)	Entropy 1.77989 (1.79779)	Top-1 acc 31.641 (31.615)	Top-5 acc 54.688 (55.322)	lr 0.02490
Train [5][2490/3239]	Time 0.587 (0.815)	Data Time 0.002 (0.009)	Loss 4.1511 (3.9661)	Entropy 1.77979 (1.79772)	Top-1 acc 29.297 (31.615)	Top-5 acc 55.078 (55.317)	lr 0.02490
Train [5][2500/3239]	Time 0.528 (0.815)	Data Time 0.001 (0.009)	Loss 3.9180 (3.9657)	Entropy 1.77965 (1.79764)	Top-1 acc 28.906 (31.619)	Top-5 acc 54.688 (55.328)	lr 0.02490
Train [5][2510/3239]	Time 0.548 (0.815)	Data Time 0.001 (0.009)	Loss 3.8855 (3.9655)	Entropy 1.77955 (1.79757)	Top-1 acc 36.328 (31.621)	Top-5 acc 57.031 (55.331)	lr 0.02490
Train [5][2520/3239]	Time 0.468 (0.815)	Data Time 0.001 (0.009)	Loss 3.8016 (3.9655)	Entropy 1.77923 (1.79750)	Top-1 acc 38.281 (31.623)	Top-5 acc 57.812 (55.329)	lr 0.02490
Train [5][2530/3239]	Time 0.455 (0.814)	Data Time 0.001 (0.009)	Loss 4.0605 (3.9655)	Entropy 1.77901 (1.79743)	Top-1 acc 25.000 (31.619)	Top-5 acc 55.469 (55.329)	lr 0.02490
Train [5][2540/3239]	Time 0.620 (0.814)	Data Time 0.001 (0.009)	Loss 4.0692 (3.9657)	Entropy 1.77869 (1.79736)	Top-1 acc 28.906 (31.615)	Top-5 acc 51.172 (55.326)	lr 0.02490
Train [5][2550/3239]	Time 0.721 (0.814)	Data Time 0.001 (0.009)	Loss 3.8612 (3.9656)	Entropy 1.77853 (1.79728)	Top-1 acc 33.203 (31.617)	Top-5 acc 59.375 (55.330)	lr 0.02490
Train [5][2560/3239]	Time 0.537 (0.814)	Data Time 0.001 (0.009)	Loss 3.8014 (3.9655)	Entropy 1.77824 (1.79721)	Top-1 acc 39.453 (31.617)	Top-5 acc 55.469 (55.328)	lr 0.02490
Train [5][2570/3239]	Time 0.565 (0.814)	Data Time 0.002 (0.009)	Loss 4.0509 (3.9655)	Entropy 1.77818 (1.79713)	Top-1 acc 31.641 (31.616)	Top-5 acc 53.125 (55.330)	lr 0.02490
Train [5][2580/3239]	Time 0.560 (0.814)	Data Time 0.001 (0.009)	Loss 3.9822 (3.9657)	Entropy 1.77796 (1.79706)	Top-1 acc 29.688 (31.617)	Top-5 acc 55.469 (55.323)	lr 0.02490
Train [5][2590/3239]	Time 0.518 (0.814)	Data Time 0.001 (0.009)	Loss 3.8971 (3.9657)	Entropy 1.77800 (1.79699)	Top-1 acc 31.250 (31.617)	Top-5 acc 58.203 (55.326)	lr 0.02490
Train [5][2600/3239]	Time 0.556 (0.814)	Data Time 0.001 (0.009)	Loss 3.8796 (3.9655)	Entropy 1.77774 (1.79691)	Top-1 acc 33.984 (31.617)	Top-5 acc 55.469 (55.325)	lr 0.02490
Train [5][2610/3239]	Time 0.507 (0.814)	Data Time 0.001 (0.009)	Loss 4.0366 (3.9656)	Entropy 1.77752 (1.79684)	Top-1 acc 28.906 (31.617)	Top-5 acc 56.641 (55.323)	lr 0.02490
Train [5][2620/3239]	Time 0.573 (0.813)	Data Time 0.003 (0.009)	Loss 3.9394 (3.9654)	Entropy 1.77734 (1.79677)	Top-1 acc 37.891 (31.620)	Top-5 acc 58.203 (55.329)	lr 0.02490
Train [5][2630/3239]	Time 0.528 (0.813)	Data Time 0.001 (0.009)	Loss 3.9343 (3.9652)	Entropy 1.77727 (1.79669)	Top-1 acc 30.859 (31.623)	Top-5 acc 55.859 (55.334)	lr 0.02490
Train [5][2640/3239]	Time 0.549 (0.813)	Data Time 0.001 (0.009)	Loss 3.7735 (3.9649)	Entropy 1.77707 (1.79662)	Top-1 acc 30.859 (31.630)	Top-5 acc 58.984 (55.341)	lr 0.02490
Train [5][2650/3239]	Time 0.550 (0.813)	Data Time 0.001 (0.009)	Loss 3.9431 (3.9652)	Entropy 1.77706 (1.79654)	Top-1 acc 36.328 (31.629)	Top-5 acc 54.688 (55.332)	lr 0.02490
Train [5][2660/3239]	Time 0.537 (0.813)	Data Time 0.001 (0.009)	Loss 3.9597 (3.9651)	Entropy 1.77685 (1.79647)	Top-1 acc 32.031 (31.632)	Top-5 acc 55.078 (55.334)	lr 0.02490
Train [5][2670/3239]	Time 0.567 (0.813)	Data Time 0.001 (0.009)	Loss 3.9266 (3.9648)	Entropy 1.77665 (1.79640)	Top-1 acc 31.250 (31.637)	Top-5 acc 56.641 (55.344)	lr 0.02490
Train [5][2680/3239]	Time 0.582 (0.813)	Data Time 0.001 (0.009)	Loss 4.1086 (3.9646)	Entropy 1.77655 (1.79632)	Top-1 acc 28.125 (31.634)	Top-5 acc 51.562 (55.350)	lr 0.02490
Train [5][2690/3239]	Time 0.528 (0.813)	Data Time 0.001 (0.009)	Loss 3.9346 (3.9647)	Entropy 1.77636 (1.79625)	Top-1 acc 35.156 (31.632)	Top-5 acc 56.250 (55.346)	lr 0.02490
Train [5][2700/3239]	Time 0.482 (0.813)	Data Time 0.001 (0.009)	Loss 3.7581 (3.9646)	Entropy 1.77617 (1.79618)	Top-1 acc 36.719 (31.635)	Top-5 acc 60.156 (55.352)	lr 0.02490
Train [5][2710/3239]	Time 0.588 (0.813)	Data Time 0.003 (0.009)	Loss 3.7194 (3.9643)	Entropy 1.77603 (1.79610)	Top-1 acc 38.672 (31.643)	Top-5 acc 62.109 (55.356)	lr 0.02490
Train [5][2720/3239]	Time 0.633 (0.813)	Data Time 0.001 (0.009)	Loss 3.9047 (3.9642)	Entropy 1.77576 (1.79603)	Top-1 acc 36.328 (31.644)	Top-5 acc 58.984 (55.362)	lr 0.02490
Train [5][2730/3239]	Time 0.644 (0.819)	Data Time 0.006 (0.009)	Loss 3.9118 (3.9641)	Entropy 1.77550 (1.79595)	Top-1 acc 33.594 (31.646)	Top-5 acc 51.953 (55.363)	lr 0.02490
Train [5][2740/3239]	Time 0.602 (0.819)	Data Time 0.002 (0.009)	Loss 3.9908 (3.9642)	Entropy 1.77531 (1.79588)	Top-1 acc 28.906 (31.642)	Top-5 acc 60.156 (55.364)	lr 0.02490
Train [5][2750/3239]	Time 0.420 (0.819)	Data Time 0.001 (0.009)	Loss 3.9210 (3.9640)	Entropy 1.77514 (1.79580)	Top-1 acc 31.250 (31.646)	Top-5 acc 51.953 (55.367)	lr 0.02490
Train [5][2760/3239]	Time 0.544 (0.819)	Data Time 0.001 (0.009)	Loss 3.8965 (3.9639)	Entropy 1.77512 (1.79573)	Top-1 acc 33.984 (31.648)	Top-5 acc 55.859 (55.369)	lr 0.02490
Train [5][2770/3239]	Time 0.614 (0.818)	Data Time 0.001 (0.009)	Loss 3.9258 (3.9637)	Entropy 1.77502 (1.79565)	Top-1 acc 28.516 (31.650)	Top-5 acc 60.156 (55.375)	lr 0.02490
Train [5][2780/3239]	Time 0.534 (0.818)	Data Time 0.001 (0.009)	Loss 3.9009 (3.9636)	Entropy 1.77475 (1.79558)	Top-1 acc 36.719 (31.649)	Top-5 acc 57.422 (55.376)	lr 0.02490
Train [5][2790/3239]	Time 0.563 (0.818)	Data Time 0.001 (0.009)	Loss 3.8797 (3.9636)	Entropy 1.77446 (1.79550)	Top-1 acc 34.375 (31.655)	Top-5 acc 55.078 (55.376)	lr 0.02490
Train [5][2800/3239]	Time 0.534 (0.818)	Data Time 0.002 (0.009)	Loss 3.7665 (3.9634)	Entropy 1.77434 (1.79543)	Top-1 acc 33.594 (31.656)	Top-5 acc 60.547 (55.377)	lr 0.02490
Train [5][2810/3239]	Time 0.566 (0.818)	Data Time 0.002 (0.009)	Loss 3.9465 (3.9633)	Entropy 1.77412 (1.79535)	Top-1 acc 32.812 (31.656)	Top-5 acc 55.859 (55.381)	lr 0.02490
Train [5][2820/3239]	Time 0.590 (0.818)	Data Time 0.001 (0.009)	Loss 3.8538 (3.9634)	Entropy 1.77378 (1.79528)	Top-1 acc 33.984 (31.657)	Top-5 acc 58.203 (55.377)	lr 0.02490
Train [5][2830/3239]	Time 0.501 (0.818)	Data Time 0.001 (0.009)	Loss 4.0939 (3.9634)	Entropy 1.77353 (1.79520)	Top-1 acc 28.906 (31.655)	Top-5 acc 53.906 (55.377)	lr 0.02490
Train [5][2840/3239]	Time 0.542 (0.818)	Data Time 0.001 (0.009)	Loss 3.8156 (3.9634)	Entropy 1.77327 (1.79513)	Top-1 acc 36.719 (31.656)	Top-5 acc 60.547 (55.376)	lr 0.02490
Train [5][2850/3239]	Time 0.525 (0.817)	Data Time 0.001 (0.009)	Loss 4.2086 (3.9635)	Entropy 1.77308 (1.79505)	Top-1 acc 27.344 (31.654)	Top-5 acc 49.609 (55.374)	lr 0.02490
Train [5][2860/3239]	Time 0.510 (0.817)	Data Time 0.001 (0.009)	Loss 3.8737 (3.9635)	Entropy 1.77268 (1.79497)	Top-1 acc 33.594 (31.655)	Top-5 acc 59.375 (55.375)	lr 0.02490
Train [5][2870/3239]	Time 0.604 (0.817)	Data Time 0.001 (0.009)	Loss 3.8029 (3.9633)	Entropy 1.77246 (1.79489)	Top-1 acc 39.062 (31.655)	Top-5 acc 61.328 (55.379)	lr 0.02490
Train [5][2880/3239]	Time 0.569 (0.817)	Data Time 0.001 (0.008)	Loss 3.8644 (3.9634)	Entropy 1.77228 (1.79482)	Top-1 acc 32.422 (31.653)	Top-5 acc 57.031 (55.378)	lr 0.02490
Train [5][2890/3239]	Time 0.428 (0.817)	Data Time 0.001 (0.008)	Loss 3.9688 (3.9634)	Entropy 1.77195 (1.79474)	Top-1 acc 34.766 (31.653)	Top-5 acc 58.203 (55.377)	lr 0.02490
Train [5][2900/3239]	Time 0.512 (0.817)	Data Time 0.001 (0.008)	Loss 3.8150 (3.9631)	Entropy 1.77173 (1.79466)	Top-1 acc 33.984 (31.656)	Top-5 acc 57.422 (55.380)	lr 0.02490
Train [5][2910/3239]	Time 0.517 (0.817)	Data Time 0.001 (0.008)	Loss 3.8072 (3.9632)	Entropy 1.77165 (1.79458)	Top-1 acc 34.375 (31.655)	Top-5 acc 56.641 (55.375)	lr 0.02490
Train [5][2920/3239]	Time 0.522 (0.817)	Data Time 0.002 (0.008)	Loss 3.8063 (3.9630)	Entropy 1.77167 (1.79450)	Top-1 acc 32.422 (31.661)	Top-5 acc 60.156 (55.380)	lr 0.02490
Train [5][2930/3239]	Time 0.584 (0.817)	Data Time 0.001 (0.008)	Loss 3.9285 (3.9630)	Entropy 1.77142 (1.79442)	Top-1 acc 32.422 (31.660)	Top-5 acc 55.859 (55.379)	lr 0.02490
Train [5][2940/3239]	Time 0.515 (0.817)	Data Time 0.001 (0.008)	Loss 4.0577 (3.9631)	Entropy 1.77126 (1.79434)	Top-1 acc 26.562 (31.661)	Top-5 acc 53.516 (55.380)	lr 0.02490
Train [5][2950/3239]	Time 0.501 (0.816)	Data Time 0.001 (0.008)	Loss 3.8674 (3.9628)	Entropy 1.77108 (1.79427)	Top-1 acc 32.422 (31.666)	Top-5 acc 55.469 (55.386)	lr 0.02490
Train [5][2960/3239]	Time 0.588 (0.816)	Data Time 0.002 (0.008)	Loss 3.6832 (3.9627)	Entropy 1.77093 (1.79419)	Top-1 acc 38.672 (31.670)	Top-5 acc 59.375 (55.388)	lr 0.02490
Train [5][2970/3239]	Time 0.497 (0.816)	Data Time 0.001 (0.008)	Loss 4.0359 (3.9627)	Entropy 1.77089 (1.79411)	Top-1 acc 28.125 (31.669)	Top-5 acc 56.641 (55.389)	lr 0.02490
Train [5][2980/3239]	Time 0.607 (0.816)	Data Time 0.001 (0.008)	Loss 4.0946 (3.9628)	Entropy 1.77068 (1.79403)	Top-1 acc 28.125 (31.662)	Top-5 acc 53.906 (55.387)	lr 0.02490
Train [5][2990/3239]	Time 0.542 (0.816)	Data Time 0.001 (0.008)	Loss 3.7286 (3.9627)	Entropy 1.77042 (1.79395)	Top-1 acc 38.672 (31.668)	Top-5 acc 60.156 (55.389)	lr 0.02490
Train [5][3000/3239]	Time 0.603 (0.816)	Data Time 0.001 (0.008)	Loss 3.9840 (3.9626)	Entropy 1.77013 (1.79387)	Top-1 acc 25.781 (31.666)	Top-5 acc 54.688 (55.392)	lr 0.02490
Train [5][3010/3239]	Time 0.534 (0.816)	Data Time 0.001 (0.008)	Loss 4.0065 (3.9626)	Entropy 1.76997 (1.79379)	Top-1 acc 29.297 (31.669)	Top-5 acc 55.859 (55.389)	lr 0.02490
Train [5][3020/3239]	Time 0.555 (0.816)	Data Time 0.001 (0.008)	Loss 3.9843 (3.9626)	Entropy 1.76982 (1.79372)	Top-1 acc 32.422 (31.667)	Top-5 acc 54.297 (55.391)	lr 0.02490
Train [5][3030/3239]	Time 0.543 (0.816)	Data Time 0.001 (0.008)	Loss 4.0361 (3.9626)	Entropy 1.76971 (1.79364)	Top-1 acc 30.469 (31.666)	Top-5 acc 49.219 (55.391)	lr 0.02490
Train [5][3040/3239]	Time 0.538 (0.815)	Data Time 0.001 (0.008)	Loss 3.8796 (3.9626)	Entropy 1.76959 (1.79356)	Top-1 acc 35.938 (31.669)	Top-5 acc 57.031 (55.392)	lr 0.02490
Train [5][3050/3239]	Time 0.550 (0.815)	Data Time 0.001 (0.008)	Loss 4.0012 (3.9627)	Entropy 1.76947 (1.79348)	Top-1 acc 29.297 (31.664)	Top-5 acc 54.688 (55.391)	lr 0.02490
Train [5][3060/3239]	Time 0.525 (0.815)	Data Time 0.001 (0.008)	Loss 3.8412 (3.9626)	Entropy 1.76932 (1.79340)	Top-1 acc 33.594 (31.664)	Top-5 acc 58.984 (55.395)	lr 0.02490
Train [5][3070/3239]	Time 0.511 (0.815)	Data Time 0.001 (0.008)	Loss 3.9383 (3.9625)	Entropy 1.76924 (1.79332)	Top-1 acc 34.766 (31.665)	Top-5 acc 57.812 (55.396)	lr 0.02490
Train [5][3080/3239]	Time 0.544 (0.815)	Data Time 0.001 (0.008)	Loss 3.8404 (3.9624)	Entropy 1.76917 (1.79324)	Top-1 acc 31.641 (31.666)	Top-5 acc 58.594 (55.397)	lr 0.02490
Train [5][3090/3239]	Time 0.426 (0.815)	Data Time 0.001 (0.008)	Loss 4.0049 (3.9625)	Entropy 1.76891 (1.79317)	Top-1 acc 31.641 (31.665)	Top-5 acc 52.344 (55.395)	lr 0.02490
Train [5][3100/3239]	Time 0.590 (0.815)	Data Time 0.001 (0.008)	Loss 4.0638 (3.9627)	Entropy 1.76897 (1.79309)	Top-1 acc 27.344 (31.661)	Top-5 acc 54.297 (55.391)	lr 0.02489
Train [5][3110/3239]	Time 0.498 (0.815)	Data Time 0.001 (0.008)	Loss 4.1199 (3.9625)	Entropy 1.76877 (1.79301)	Top-1 acc 25.000 (31.662)	Top-5 acc 50.000 (55.396)	lr 0.02489
Train [5][3120/3239]	Time 0.656 (0.815)	Data Time 0.001 (0.008)	Loss 4.0246 (3.9626)	Entropy 1.76860 (1.79293)	Top-1 acc 29.688 (31.656)	Top-5 acc 52.344 (55.391)	lr 0.02489
Train [5][3130/3239]	Time 0.542 (0.815)	Data Time 0.001 (0.008)	Loss 3.9558 (3.9626)	Entropy 1.76842 (1.79285)	Top-1 acc 30.859 (31.656)	Top-5 acc 55.078 (55.394)	lr 0.02489
Train [5][3140/3239]	Time 0.596 (0.814)	Data Time 0.001 (0.008)	Loss 3.7884 (3.9625)	Entropy 1.76822 (1.79278)	Top-1 acc 36.328 (31.659)	Top-5 acc 60.547 (55.395)	lr 0.02489
Train [5][3150/3239]	Time 0.537 (0.814)	Data Time 0.001 (0.008)	Loss 4.0294 (3.9624)	Entropy 1.76824 (1.79270)	Top-1 acc 31.641 (31.665)	Top-5 acc 52.734 (55.397)	lr 0.02489
Train [5][3160/3239]	Time 0.580 (0.814)	Data Time 0.001 (0.008)	Loss 4.0605 (3.9625)	Entropy 1.76814 (1.79262)	Top-1 acc 30.078 (31.666)	Top-5 acc 54.688 (55.394)	lr 0.02489
Train [5][3170/3239]	Time 0.692 (0.814)	Data Time 0.001 (0.008)	Loss 3.8906 (3.9625)	Entropy 1.76799 (1.79254)	Top-1 acc 33.203 (31.669)	Top-5 acc 55.469 (55.395)	lr 0.02489
Train [5][3180/3239]	Time 0.516 (0.814)	Data Time 0.000 (0.008)	Loss 3.7681 (3.9624)	Entropy 1.76794 (1.79247)	Top-1 acc 32.812 (31.673)	Top-5 acc 59.766 (55.395)	lr 0.02489
Train [5][3190/3239]	Time 0.502 (0.814)	Data Time 0.000 (0.008)	Loss 3.8307 (3.9622)	Entropy 1.76778 (1.79239)	Top-1 acc 36.719 (31.676)	Top-5 acc 60.156 (55.402)	lr 0.02489
Train [5][3200/3239]	Time 0.490 (0.814)	Data Time 0.000 (0.008)	Loss 3.8575 (3.9620)	Entropy 1.76748 (1.79231)	Top-1 acc 36.328 (31.678)	Top-5 acc 61.328 (55.406)	lr 0.02489
Train [5][3210/3239]	Time 0.559 (0.814)	Data Time 0.000 (0.008)	Loss 3.7469 (3.9619)	Entropy 1.76726 (1.79223)	Top-1 acc 36.328 (31.679)	Top-5 acc 59.375 (55.405)	lr 0.02489
Train [5][3220/3239]	Time 0.685 (0.813)	Data Time 0.000 (0.008)	Loss 3.8551 (3.9619)	Entropy 1.76713 (1.79216)	Top-1 acc 33.203 (31.678)	Top-5 acc 55.859 (55.404)	lr 0.02489
Train [5][3230/3239]	Time 0.483 (0.813)	Data Time 0.000 (0.008)	Loss 3.7091 (3.9618)	Entropy 1.76713 (1.79208)	Top-1 acc 37.891 (31.678)	Top-5 acc 60.547 (55.405)	lr 0.02489
Train [5][3239/3239]	Time 1.576 (0.813)	Data Time 0.000 (0.008)	Loss 3.9949 (3.9617)	Entropy 1.76705 (1.79201)	Top-1 acc 27.160 (31.678)	Top-5 acc 56.790 (55.407)	lr 0.02489
==========Valid [5/120]	loss 2.815	top-1 acc 40.288 (40.288)	top-5 acc 65.178	Train top-1 31.678	top-5 55.407	Entropy 1.76705	Latency-None: 0.000ms	Flops: 539.76M
Train [6][0/3239]	Time 17.800 (17.800)	Data Time 14.912 (14.912)	Loss 3.9364 (3.9364)	Entropy 1.76698 (1.76698)	Top-1 acc 30.078 (30.078)	Top-5 acc 56.250 (56.250)	lr 0.02489
Train [6][10/3239]	Time 0.442 (2.394)	Data Time 0.001 (1.362)	Loss 3.8151 (3.8977)	Entropy 1.76687 (1.76693)	Top-1 acc 37.109 (32.457)	Top-5 acc 58.203 (56.712)	lr 0.02489
Train [6][20/3239]	Time 0.536 (1.628)	Data Time 0.001 (0.714)	Loss 3.9977 (3.9096)	Entropy 1.76678 (1.76689)	Top-1 acc 33.203 (33.054)	Top-5 acc 55.859 (56.622)	lr 0.02489
Train [6][30/3239]	Time 0.475 (1.353)	Data Time 0.001 (0.485)	Loss 3.8083 (3.9115)	Entropy 1.76663 (1.76684)	Top-1 acc 36.719 (33.102)	Top-5 acc 58.984 (56.741)	lr 0.02489
Train [6][40/3239]	Time 0.528 (1.222)	Data Time 0.002 (0.368)	Loss 4.0262 (3.9204)	Entropy 1.76651 (1.76677)	Top-1 acc 28.906 (32.908)	Top-5 acc 52.734 (56.641)	lr 0.02489
Train [6][50/3239]	Time 0.475 (1.141)	Data Time 0.001 (0.296)	Loss 4.0441 (3.9151)	Entropy 1.76615 (1.76669)	Top-1 acc 26.172 (33.081)	Top-5 acc 55.078 (56.671)	lr 0.02489
Train [6][60/3239]	Time 0.490 (1.085)	Data Time 0.001 (0.248)	Loss 4.0119 (3.9104)	Entropy 1.76618 (1.76660)	Top-1 acc 31.641 (33.190)	Top-5 acc 55.859 (56.782)	lr 0.02489
Train [6][70/3239]	Time 0.531 (1.045)	Data Time 0.001 (0.213)	Loss 3.9288 (3.9130)	Entropy 1.76601 (1.76654)	Top-1 acc 28.516 (33.077)	Top-5 acc 55.078 (56.696)	lr 0.02489
Train [6][80/3239]	Time 0.685 (1.016)	Data Time 0.001 (0.187)	Loss 4.2342 (3.9176)	Entropy 1.76606 (1.76647)	Top-1 acc 28.906 (32.851)	Top-5 acc 47.266 (56.592)	lr 0.02489
Train [6][90/3239]	Time 0.511 (0.989)	Data Time 0.001 (0.167)	Loss 3.9630 (3.9165)	Entropy 1.76592 (1.76642)	Top-1 acc 34.766 (32.868)	Top-5 acc 58.594 (56.623)	lr 0.02489
Train [6][100/3239]	Time 0.524 (0.970)	Data Time 0.001 (0.151)	Loss 3.8537 (3.9171)	Entropy 1.76594 (1.76638)	Top-1 acc 34.375 (32.898)	Top-5 acc 56.641 (56.598)	lr 0.02489
Train [6][110/3239]	Time 0.553 (0.952)	Data Time 0.001 (0.137)	Loss 3.9487 (3.9157)	Entropy 1.76575 (1.76633)	Top-1 acc 30.859 (32.883)	Top-5 acc 56.641 (56.648)	lr 0.02489
Train [6][120/3239]	Time 0.562 (0.939)	Data Time 0.001 (0.126)	Loss 3.9574 (3.9166)	Entropy 1.76551 (1.76627)	Top-1 acc 35.938 (32.880)	Top-5 acc 55.469 (56.618)	lr 0.02489
Train [6][130/3239]	Time 0.679 (0.929)	Data Time 0.001 (0.117)	Loss 4.0142 (3.9170)	Entropy 1.76537 (1.76621)	Top-1 acc 26.562 (32.818)	Top-5 acc 54.688 (56.545)	lr 0.02489
Train [6][140/3239]	Time 0.579 (0.920)	Data Time 0.001 (0.108)	Loss 3.9674 (3.9198)	Entropy 1.76534 (1.76615)	Top-1 acc 32.422 (32.812)	Top-5 acc 52.734 (56.458)	lr 0.02489
Train [6][150/3239]	Time 0.291 (1.031)	Data Time 0.002 (0.101)	Loss 3.9740 (3.9226)	Entropy 1.76522 (1.76610)	Top-1 acc 28.516 (32.725)	Top-5 acc 54.297 (56.346)	lr 0.02489
Train [6][160/3239]	Time 0.527 (1.017)	Data Time 0.002 (0.096)	Loss 3.7243 (3.9253)	Entropy 1.76511 (1.76604)	Top-1 acc 35.938 (32.626)	Top-5 acc 63.672 (56.318)	lr 0.02489
Train [6][170/3239]	Time 0.557 (1.002)	Data Time 0.001 (0.091)	Loss 3.8952 (3.9250)	Entropy 1.76504 (1.76598)	Top-1 acc 37.500 (32.698)	Top-5 acc 57.031 (56.346)	lr 0.02489
Train [6][180/3239]	Time 0.691 (0.990)	Data Time 0.001 (0.086)	Loss 3.6699 (3.9201)	Entropy 1.76480 (1.76592)	Top-1 acc 33.203 (32.748)	Top-5 acc 59.375 (56.408)	lr 0.02489
Train [6][190/3239]	Time 0.518 (0.980)	Data Time 0.001 (0.081)	Loss 3.9166 (3.9196)	Entropy 1.76474 (1.76586)	Top-1 acc 36.328 (32.759)	Top-5 acc 58.984 (56.432)	lr 0.02489
Train [6][200/3239]	Time 0.445 (0.970)	Data Time 0.001 (0.078)	Loss 4.0304 (3.9220)	Entropy 1.76449 (1.76580)	Top-1 acc 26.562 (32.659)	Top-5 acc 53.906 (56.365)	lr 0.02489
Train [6][210/3239]	Time 0.543 (0.963)	Data Time 0.001 (0.074)	Loss 3.9949 (3.9206)	Entropy 1.76437 (1.76574)	Top-1 acc 30.859 (32.648)	Top-5 acc 51.953 (56.363)	lr 0.02489
Train [6][220/3239]	Time 0.573 (0.956)	Data Time 0.001 (0.071)	Loss 3.9237 (3.9223)	Entropy 1.76423 (1.76567)	Top-1 acc 31.641 (32.655)	Top-5 acc 57.422 (56.331)	lr 0.02489
Train [6][230/3239]	Time 0.564 (0.949)	Data Time 0.001 (0.068)	Loss 4.0272 (3.9256)	Entropy 1.76405 (1.76561)	Top-1 acc 31.250 (32.589)	Top-5 acc 56.641 (56.274)	lr 0.02489
Train [6][240/3239]	Time 0.531 (0.942)	Data Time 0.001 (0.066)	Loss 3.6079 (3.9232)	Entropy 1.76396 (1.76554)	Top-1 acc 38.281 (32.613)	Top-5 acc 62.500 (56.307)	lr 0.02489
Train [6][250/3239]	Time 0.519 (0.936)	Data Time 0.001 (0.063)	Loss 4.1041 (3.9263)	Entropy 1.76400 (1.76548)	Top-1 acc 29.297 (32.556)	Top-5 acc 51.172 (56.242)	lr 0.02489
Train [6][260/3239]	Time 0.579 (0.932)	Data Time 0.002 (0.061)	Loss 3.7851 (3.9251)	Entropy 1.76405 (1.76542)	Top-1 acc 34.375 (32.569)	Top-5 acc 60.938 (56.301)	lr 0.02489
Train [6][270/3239]	Time 0.603 (0.927)	Data Time 0.001 (0.059)	Loss 3.9281 (3.9243)	Entropy 1.76368 (1.76536)	Top-1 acc 31.250 (32.569)	Top-5 acc 54.688 (56.316)	lr 0.02489
Train [6][280/3239]	Time 0.515 (0.922)	Data Time 0.001 (0.057)	Loss 3.9843 (3.9252)	Entropy 1.76340 (1.76530)	Top-1 acc 27.344 (32.497)	Top-5 acc 51.172 (56.265)	lr 0.02489
Train [6][290/3239]	Time 0.548 (0.917)	Data Time 0.001 (0.055)	Loss 3.9098 (3.9259)	Entropy 1.76318 (1.76523)	Top-1 acc 35.938 (32.474)	Top-5 acc 53.125 (56.231)	lr 0.02489
Train [6][300/3239]	Time 0.705 (0.914)	Data Time 0.001 (0.053)	Loss 3.8425 (3.9256)	Entropy 1.76294 (1.76516)	Top-1 acc 33.594 (32.472)	Top-5 acc 62.891 (56.247)	lr 0.02489
Train [6][310/3239]	Time 0.611 (0.911)	Data Time 0.001 (0.051)	Loss 3.8632 (3.9243)	Entropy 1.76282 (1.76509)	Top-1 acc 32.422 (32.480)	Top-5 acc 58.203 (56.278)	lr 0.02489
Train [6][320/3239]	Time 0.589 (0.907)	Data Time 0.001 (0.050)	Loss 3.9675 (3.9232)	Entropy 1.76271 (1.76501)	Top-1 acc 31.641 (32.508)	Top-5 acc 56.641 (56.291)	lr 0.02489
Train [6][330/3239]	Time 0.540 (0.903)	Data Time 0.002 (0.048)	Loss 3.8562 (3.9216)	Entropy 1.76241 (1.76494)	Top-1 acc 33.203 (32.509)	Top-5 acc 54.688 (56.335)	lr 0.02489
Train [6][340/3239]	Time 0.543 (0.900)	Data Time 0.001 (0.047)	Loss 3.7107 (3.9209)	Entropy 1.76220 (1.76486)	Top-1 acc 35.547 (32.481)	Top-5 acc 60.547 (56.352)	lr 0.02489
Train [6][350/3239]	Time 0.653 (0.896)	Data Time 0.001 (0.046)	Loss 3.8803 (3.9203)	Entropy 1.76189 (1.76479)	Top-1 acc 30.078 (32.489)	Top-5 acc 58.594 (56.351)	lr 0.02489
Train [6][360/3239]	Time 0.595 (0.893)	Data Time 0.001 (0.045)	Loss 3.7083 (3.9192)	Entropy 1.76173 (1.76470)	Top-1 acc 36.719 (32.540)	Top-5 acc 62.109 (56.383)	lr 0.02489
Train [6][370/3239]	Time 0.531 (0.891)	Data Time 0.001 (0.043)	Loss 3.6765 (3.9183)	Entropy 1.76172 (1.76462)	Top-1 acc 31.641 (32.545)	Top-5 acc 61.328 (56.404)	lr 0.02489
Train [6][380/3239]	Time 0.513 (0.888)	Data Time 0.001 (0.042)	Loss 3.9246 (3.9190)	Entropy 1.76160 (1.76455)	Top-1 acc 33.984 (32.530)	Top-5 acc 55.078 (56.391)	lr 0.02489
Train [6][390/3239]	Time 0.523 (0.886)	Data Time 0.001 (0.041)	Loss 4.1168 (3.9227)	Entropy 1.76160 (1.76447)	Top-1 acc 25.781 (32.449)	Top-5 acc 52.734 (56.301)	lr 0.02489
Train [6][400/3239]	Time 0.544 (0.884)	Data Time 0.001 (0.040)	Loss 3.9476 (3.9225)	Entropy 1.76142 (1.76440)	Top-1 acc 33.984 (32.465)	Top-5 acc 56.250 (56.303)	lr 0.02489
Train [6][410/3239]	Time 0.513 (0.881)	Data Time 0.001 (0.039)	Loss 3.9250 (3.9228)	Entropy 1.76123 (1.76432)	Top-1 acc 31.641 (32.453)	Top-5 acc 53.125 (56.323)	lr 0.02489
Train [6][420/3239]	Time 0.543 (0.879)	Data Time 0.001 (0.039)	Loss 4.1264 (3.9250)	Entropy 1.76125 (1.76425)	Top-1 acc 33.203 (32.412)	Top-5 acc 53.516 (56.275)	lr 0.02489
Train [6][430/3239]	Time 0.494 (0.878)	Data Time 0.001 (0.038)	Loss 3.8146 (3.9247)	Entropy 1.76124 (1.76418)	Top-1 acc 33.984 (32.398)	Top-5 acc 59.766 (56.266)	lr 0.02489
Train [6][440/3239]	Time 0.516 (0.876)	Data Time 0.002 (0.037)	Loss 3.7184 (3.9238)	Entropy 1.76117 (1.76411)	Top-1 acc 38.281 (32.414)	Top-5 acc 59.375 (56.271)	lr 0.02489
Train [6][450/3239]	Time 0.525 (0.874)	Data Time 0.001 (0.036)	Loss 4.0609 (3.9249)	Entropy 1.76105 (1.76404)	Top-1 acc 30.469 (32.407)	Top-5 acc 52.344 (56.233)	lr 0.02489
Train [6][460/3239]	Time 0.607 (0.873)	Data Time 0.001 (0.035)	Loss 3.9443 (3.9261)	Entropy 1.76094 (1.76398)	Top-1 acc 32.812 (32.407)	Top-5 acc 56.250 (56.211)	lr 0.02489
Train [6][470/3239]	Time 0.556 (0.871)	Data Time 0.001 (0.035)	Loss 3.8026 (3.9267)	Entropy 1.76077 (1.76391)	Top-1 acc 32.422 (32.420)	Top-5 acc 58.594 (56.180)	lr 0.02489
Train [6][480/3239]	Time 0.517 (0.870)	Data Time 0.001 (0.034)	Loss 3.7772 (3.9254)	Entropy 1.76073 (1.76385)	Top-1 acc 32.031 (32.435)	Top-5 acc 60.938 (56.206)	lr 0.02489
Train [6][490/3239]	Time 0.505 (0.867)	Data Time 0.001 (0.033)	Loss 4.0083 (3.9270)	Entropy 1.76060 (1.76378)	Top-1 acc 32.422 (32.396)	Top-5 acc 53.516 (56.170)	lr 0.02489
Train [6][500/3239]	Time 0.589 (0.866)	Data Time 0.001 (0.033)	Loss 4.0433 (3.9265)	Entropy 1.76057 (1.76372)	Top-1 acc 27.734 (32.384)	Top-5 acc 51.172 (56.171)	lr 0.02489
Train [6][510/3239]	Time 0.491 (0.864)	Data Time 0.001 (0.032)	Loss 4.0778 (3.9282)	Entropy 1.76048 (1.76366)	Top-1 acc 32.031 (32.339)	Top-5 acc 50.781 (56.163)	lr 0.02489
Train [6][520/3239]	Time 0.545 (0.861)	Data Time 0.001 (0.032)	Loss 3.8400 (3.9283)	Entropy 1.76030 (1.76359)	Top-1 acc 33.594 (32.330)	Top-5 acc 58.984 (56.159)	lr 0.02489
Train [6][530/3239]	Time 0.508 (0.860)	Data Time 0.001 (0.031)	Loss 3.8836 (3.9296)	Entropy 1.76014 (1.76353)	Top-1 acc 28.906 (32.292)	Top-5 acc 56.250 (56.116)	lr 0.02489
Train [6][540/3239]	Time 0.606 (0.859)	Data Time 0.001 (0.031)	Loss 3.9708 (3.9286)	Entropy 1.76005 (1.76347)	Top-1 acc 31.250 (32.306)	Top-5 acc 55.859 (56.144)	lr 0.02489
Train [6][550/3239]	Time 0.556 (0.858)	Data Time 0.001 (0.030)	Loss 3.9588 (3.9293)	Entropy 1.75989 (1.76341)	Top-1 acc 29.688 (32.284)	Top-5 acc 54.688 (56.144)	lr 0.02489
Train [6][560/3239]	Time 0.566 (0.856)	Data Time 0.001 (0.029)	Loss 3.7586 (3.9293)	Entropy 1.75976 (1.76334)	Top-1 acc 40.234 (32.296)	Top-5 acc 60.547 (56.141)	lr 0.02489
Train [6][570/3239]	Time 0.600 (0.855)	Data Time 0.001 (0.029)	Loss 3.8246 (3.9278)	Entropy 1.75954 (1.76328)	Top-1 acc 34.375 (32.324)	Top-5 acc 55.469 (56.178)	lr 0.02489
Train [6][580/3239]	Time 0.520 (0.855)	Data Time 0.001 (0.029)	Loss 4.1610 (3.9283)	Entropy 1.75933 (1.76321)	Top-1 acc 27.734 (32.308)	Top-5 acc 52.344 (56.153)	lr 0.02489
Train [6][590/3239]	Time 0.473 (0.853)	Data Time 0.001 (0.028)	Loss 4.0938 (3.9290)	Entropy 1.75911 (1.76315)	Top-1 acc 30.859 (32.293)	Top-5 acc 52.734 (56.146)	lr 0.02489
Train [6][600/3239]	Time 0.563 (0.852)	Data Time 0.001 (0.028)	Loss 3.8865 (3.9296)	Entropy 1.75894 (1.76308)	Top-1 acc 31.250 (32.267)	Top-5 acc 57.812 (56.121)	lr 0.02489
Train [6][610/3239]	Time 0.547 (0.851)	Data Time 0.001 (0.027)	Loss 3.9128 (3.9294)	Entropy 1.75873 (1.76301)	Top-1 acc 33.594 (32.261)	Top-5 acc 57.031 (56.124)	lr 0.02488
Train [6][620/3239]	Time 0.627 (0.850)	Data Time 0.001 (0.027)	Loss 3.9370 (3.9293)	Entropy 1.75840 (1.76294)	Top-1 acc 30.859 (32.267)	Top-5 acc 51.953 (56.116)	lr 0.02488
Train [6][630/3239]	Time 0.525 (0.849)	Data Time 0.001 (0.026)	Loss 4.0989 (3.9305)	Entropy 1.75824 (1.76287)	Top-1 acc 29.688 (32.249)	Top-5 acc 53.516 (56.092)	lr 0.02488
Train [6][640/3239]	Time 0.477 (0.848)	Data Time 0.002 (0.026)	Loss 3.8596 (3.9308)	Entropy 1.75800 (1.76279)	Top-1 acc 35.938 (32.243)	Top-5 acc 55.859 (56.090)	lr 0.02488
Train [6][650/3239]	Time 0.586 (0.847)	Data Time 0.001 (0.026)	Loss 3.8171 (3.9308)	Entropy 1.75777 (1.76272)	Top-1 acc 33.594 (32.236)	Top-5 acc 56.250 (56.077)	lr 0.02488
Train [6][660/3239]	Time 0.532 (0.846)	Data Time 0.001 (0.025)	Loss 4.0005 (3.9307)	Entropy 1.75761 (1.76264)	Top-1 acc 33.594 (32.227)	Top-5 acc 53.906 (56.093)	lr 0.02488
Train [6][670/3239]	Time 0.482 (0.845)	Data Time 0.001 (0.025)	Loss 4.0042 (3.9317)	Entropy 1.75739 (1.76257)	Top-1 acc 27.734 (32.222)	Top-5 acc 53.125 (56.063)	lr 0.02488
Train [6][680/3239]	Time 0.579 (0.844)	Data Time 0.001 (0.025)	Loss 3.9230 (3.9315)	Entropy 1.75718 (1.76249)	Top-1 acc 34.375 (32.231)	Top-5 acc 58.203 (56.075)	lr 0.02488
Train [6][690/3239]	Time 0.556 (0.843)	Data Time 0.001 (0.024)	Loss 3.9757 (3.9316)	Entropy 1.75699 (1.76241)	Top-1 acc 29.688 (32.217)	Top-5 acc 53.516 (56.072)	lr 0.02488
Train [6][700/3239]	Time 0.503 (0.841)	Data Time 0.001 (0.024)	Loss 3.7631 (3.9322)	Entropy 1.75685 (1.76233)	Top-1 acc 33.203 (32.195)	Top-5 acc 63.672 (56.054)	lr 0.02488
Train [6][710/3239]	Time 0.580 (0.841)	Data Time 0.001 (0.024)	Loss 3.9662 (3.9329)	Entropy 1.75679 (1.76226)	Top-1 acc 32.031 (32.180)	Top-5 acc 56.250 (56.033)	lr 0.02488
Train [6][720/3239]	Time 0.597 (0.841)	Data Time 0.001 (0.024)	Loss 4.0753 (3.9332)	Entropy 1.75679 (1.76218)	Top-1 acc 33.594 (32.179)	Top-5 acc 53.516 (56.021)	lr 0.02488
Train [6][730/3239]	Time 0.502 (0.840)	Data Time 0.001 (0.023)	Loss 4.0693 (3.9349)	Entropy 1.75648 (1.76210)	Top-1 acc 27.734 (32.154)	Top-5 acc 48.828 (55.991)	lr 0.02488
Train [6][740/3239]	Time 0.507 (0.839)	Data Time 0.001 (0.023)	Loss 3.8032 (3.9336)	Entropy 1.75637 (1.76203)	Top-1 acc 39.844 (32.173)	Top-5 acc 61.328 (56.022)	lr 0.02488
Train [6][750/3239]	Time 0.554 (0.839)	Data Time 0.001 (0.023)	Loss 3.7243 (3.9335)	Entropy 1.75614 (1.76195)	Top-1 acc 30.078 (32.150)	Top-5 acc 62.500 (56.023)	lr 0.02488
Train [6][760/3239]	Time 0.541 (0.838)	Data Time 0.001 (0.022)	Loss 3.8589 (3.9330)	Entropy 1.75610 (1.76188)	Top-1 acc 35.547 (32.159)	Top-5 acc 57.031 (56.039)	lr 0.02488
Train [6][770/3239]	Time 0.530 (0.838)	Data Time 0.001 (0.022)	Loss 3.8532 (3.9329)	Entropy 1.75596 (1.76180)	Top-1 acc 35.156 (32.166)	Top-5 acc 55.469 (56.054)	lr 0.02488
Train [6][780/3239]	Time 0.605 (0.837)	Data Time 0.001 (0.022)	Loss 3.8272 (3.9320)	Entropy 1.75551 (1.76172)	Top-1 acc 34.766 (32.173)	Top-5 acc 58.984 (56.072)	lr 0.02488
Train [6][790/3239]	Time 0.699 (0.837)	Data Time 0.001 (0.022)	Loss 3.9527 (3.9319)	Entropy 1.75526 (1.76164)	Top-1 acc 30.469 (32.166)	Top-5 acc 57.812 (56.078)	lr 0.02488
Train [6][800/3239]	Time 0.705 (0.856)	Data Time 0.007 (0.021)	Loss 4.0134 (3.9327)	Entropy 1.75497 (1.76156)	Top-1 acc 30.859 (32.140)	Top-5 acc 52.344 (56.053)	lr 0.02488
Train [6][810/3239]	Time 0.585 (0.857)	Data Time 0.002 (0.021)	Loss 3.7453 (3.9319)	Entropy 1.75469 (1.76148)	Top-1 acc 35.156 (32.164)	Top-5 acc 62.109 (56.071)	lr 0.02488
Train [6][820/3239]	Time 0.557 (0.856)	Data Time 0.002 (0.021)	Loss 4.1452 (3.9324)	Entropy 1.75447 (1.76140)	Top-1 acc 28.906 (32.149)	Top-5 acc 51.953 (56.050)	lr 0.02488
Train [6][830/3239]	Time 0.541 (0.855)	Data Time 0.001 (0.021)	Loss 4.0167 (3.9327)	Entropy 1.75422 (1.76131)	Top-1 acc 30.859 (32.152)	Top-5 acc 53.906 (56.045)	lr 0.02488
Train [6][840/3239]	Time 0.667 (0.854)	Data Time 0.001 (0.021)	Loss 3.7546 (3.9330)	Entropy 1.75410 (1.76123)	Top-1 acc 36.719 (32.140)	Top-5 acc 55.859 (56.042)	lr 0.02488
Train [6][850/3239]	Time 0.555 (0.853)	Data Time 0.001 (0.020)	Loss 3.9516 (3.9330)	Entropy 1.75417 (1.76114)	Top-1 acc 30.469 (32.138)	Top-5 acc 55.859 (56.048)	lr 0.02488
Train [6][860/3239]	Time 0.553 (0.853)	Data Time 0.001 (0.020)	Loss 4.0047 (3.9329)	Entropy 1.75412 (1.76106)	Top-1 acc 32.422 (32.146)	Top-5 acc 55.469 (56.058)	lr 0.02488
Train [6][870/3239]	Time 0.589 (0.853)	Data Time 0.001 (0.020)	Loss 4.0665 (3.9328)	Entropy 1.75369 (1.76098)	Top-1 acc 29.688 (32.157)	Top-5 acc 53.125 (56.062)	lr 0.02488
Train [6][880/3239]	Time 0.579 (0.852)	Data Time 0.002 (0.020)	Loss 3.6941 (3.9328)	Entropy 1.75348 (1.76090)	Top-1 acc 40.234 (32.163)	Top-5 acc 60.938 (56.066)	lr 0.02488
Train [6][890/3239]	Time 0.558 (0.851)	Data Time 0.001 (0.020)	Loss 3.8511 (3.9328)	Entropy 1.75322 (1.76081)	Top-1 acc 33.203 (32.174)	Top-5 acc 58.594 (56.064)	lr 0.02488
Train [6][900/3239]	Time 0.526 (0.850)	Data Time 0.001 (0.019)	Loss 3.9220 (3.9326)	Entropy 1.75322 (1.76073)	Top-1 acc 33.984 (32.170)	Top-5 acc 55.859 (56.062)	lr 0.02488
Train [6][910/3239]	Time 0.595 (0.850)	Data Time 0.001 (0.019)	Loss 4.0279 (3.9322)	Entropy 1.75310 (1.76065)	Top-1 acc 28.906 (32.175)	Top-5 acc 53.516 (56.063)	lr 0.02488
Train [6][920/3239]	Time 0.501 (0.849)	Data Time 0.001 (0.019)	Loss 3.9544 (3.9321)	Entropy 1.75290 (1.76056)	Top-1 acc 29.297 (32.170)	Top-5 acc 48.828 (56.064)	lr 0.02488
Train [6][930/3239]	Time 0.534 (0.849)	Data Time 0.001 (0.019)	Loss 3.7798 (3.9321)	Entropy 1.75275 (1.76048)	Top-1 acc 32.812 (32.175)	Top-5 acc 57.031 (56.057)	lr 0.02488
Train [6][940/3239]	Time 0.535 (0.848)	Data Time 0.001 (0.019)	Loss 4.1865 (3.9327)	Entropy 1.75258 (1.76040)	Top-1 acc 27.734 (32.160)	Top-5 acc 53.125 (56.047)	lr 0.02488
Train [6][950/3239]	Time 0.526 (0.848)	Data Time 0.001 (0.018)	Loss 4.0653 (3.9329)	Entropy 1.75235 (1.76032)	Top-1 acc 29.297 (32.152)	Top-5 acc 53.125 (56.038)	lr 0.02488
Train [6][960/3239]	Time 0.675 (0.847)	Data Time 0.001 (0.018)	Loss 3.6739 (3.9328)	Entropy 1.75227 (1.76023)	Top-1 acc 37.109 (32.151)	Top-5 acc 60.547 (56.047)	lr 0.02488
Train [6][970/3239]	Time 0.560 (0.847)	Data Time 0.001 (0.018)	Loss 4.0147 (3.9324)	Entropy 1.75207 (1.76015)	Top-1 acc 30.859 (32.147)	Top-5 acc 53.906 (56.061)	lr 0.02488
Train [6][980/3239]	Time 0.496 (0.846)	Data Time 0.001 (0.018)	Loss 3.9192 (3.9326)	Entropy 1.75214 (1.76007)	Top-1 acc 34.766 (32.144)	Top-5 acc 57.031 (56.052)	lr 0.02488
Train [6][990/3239]	Time 0.519 (0.845)	Data Time 0.002 (0.018)	Loss 3.8796 (3.9324)	Entropy 1.75191 (1.75999)	Top-1 acc 33.203 (32.155)	Top-5 acc 58.203 (56.072)	lr 0.02488
Train [6][1000/3239]	Time 0.495 (0.844)	Data Time 0.001 (0.018)	Loss 3.8604 (3.9324)	Entropy 1.75174 (1.75991)	Top-1 acc 32.031 (32.150)	Top-5 acc 55.078 (56.078)	lr 0.02488
Train [6][1010/3239]	Time 0.566 (0.844)	Data Time 0.001 (0.018)	Loss 4.0384 (3.9323)	Entropy 1.75156 (1.75982)	Top-1 acc 31.250 (32.148)	Top-5 acc 54.297 (56.078)	lr 0.02488
Train [6][1020/3239]	Time 0.604 (0.843)	Data Time 0.001 (0.017)	Loss 3.9294 (3.9322)	Entropy 1.75129 (1.75974)	Top-1 acc 33.984 (32.142)	Top-5 acc 54.688 (56.074)	lr 0.02488
Train [6][1030/3239]	Time 0.578 (0.842)	Data Time 0.001 (0.017)	Loss 3.8899 (3.9320)	Entropy 1.75116 (1.75966)	Top-1 acc 32.031 (32.136)	Top-5 acc 53.125 (56.078)	lr 0.02488
Train [6][1040/3239]	Time 0.551 (0.842)	Data Time 0.001 (0.017)	Loss 4.0683 (3.9324)	Entropy 1.75099 (1.75958)	Top-1 acc 30.469 (32.138)	Top-5 acc 51.172 (56.073)	lr 0.02488
Train [6][1050/3239]	Time 0.541 (0.842)	Data Time 0.001 (0.017)	Loss 3.8976 (3.9323)	Entropy 1.75087 (1.75949)	Top-1 acc 33.984 (32.150)	Top-5 acc 58.984 (56.076)	lr 0.02488
Train [6][1060/3239]	Time 0.543 (0.841)	Data Time 0.001 (0.017)	Loss 3.8879 (3.9321)	Entropy 1.75059 (1.75941)	Top-1 acc 30.469 (32.147)	Top-5 acc 56.641 (56.089)	lr 0.02488
Train [6][1070/3239]	Time 0.528 (0.841)	Data Time 0.002 (0.017)	Loss 4.1715 (3.9327)	Entropy 1.75049 (1.75933)	Top-1 acc 28.516 (32.125)	Top-5 acc 47.656 (56.071)	lr 0.02488
Train [6][1080/3239]	Time 0.530 (0.840)	Data Time 0.001 (0.017)	Loss 4.0879 (3.9327)	Entropy 1.75029 (1.75925)	Top-1 acc 33.203 (32.132)	Top-5 acc 52.344 (56.070)	lr 0.02488
Train [6][1090/3239]	Time 0.566 (0.840)	Data Time 0.001 (0.016)	Loss 3.8992 (3.9331)	Entropy 1.75015 (1.75917)	Top-1 acc 33.594 (32.125)	Top-5 acc 58.203 (56.049)	lr 0.02488
Train [6][1100/3239]	Time 0.558 (0.839)	Data Time 0.001 (0.016)	Loss 3.9209 (3.9337)	Entropy 1.74988 (1.75908)	Top-1 acc 33.203 (32.106)	Top-5 acc 59.375 (56.031)	lr 0.02488
Train [6][1110/3239]	Time 0.612 (0.839)	Data Time 0.001 (0.016)	Loss 3.8494 (3.9333)	Entropy 1.74982 (1.75900)	Top-1 acc 27.734 (32.103)	Top-5 acc 57.031 (56.038)	lr 0.02488
Train [6][1120/3239]	Time 0.539 (0.839)	Data Time 0.001 (0.016)	Loss 3.9484 (3.9333)	Entropy 1.74972 (1.75892)	Top-1 acc 34.375 (32.113)	Top-5 acc 53.906 (56.034)	lr 0.02488
Train [6][1130/3239]	Time 0.636 (0.838)	Data Time 0.001 (0.016)	Loss 3.9026 (3.9327)	Entropy 1.74955 (1.75884)	Top-1 acc 30.469 (32.123)	Top-5 acc 58.203 (56.043)	lr 0.02488
Train [6][1140/3239]	Time 0.502 (0.838)	Data Time 0.001 (0.016)	Loss 3.8875 (3.9326)	Entropy 1.74953 (1.75875)	Top-1 acc 30.078 (32.121)	Top-5 acc 55.078 (56.034)	lr 0.02488
Train [6][1150/3239]	Time 0.543 (0.838)	Data Time 0.001 (0.016)	Loss 3.8352 (3.9323)	Entropy 1.74946 (1.75867)	Top-1 acc 32.422 (32.117)	Top-5 acc 56.250 (56.044)	lr 0.02488
Train [6][1160/3239]	Time 0.614 (0.837)	Data Time 0.001 (0.016)	Loss 3.9489 (3.9319)	Entropy 1.74938 (1.75859)	Top-1 acc 30.078 (32.129)	Top-5 acc 59.375 (56.053)	lr 0.02488
Train [6][1170/3239]	Time 0.622 (0.837)	Data Time 0.001 (0.015)	Loss 3.9570 (3.9314)	Entropy 1.74919 (1.75851)	Top-1 acc 32.812 (32.145)	Top-5 acc 56.641 (56.063)	lr 0.02488
Train [6][1180/3239]	Time 0.566 (0.837)	Data Time 0.001 (0.015)	Loss 4.0068 (3.9318)	Entropy 1.74906 (1.75844)	Top-1 acc 27.734 (32.126)	Top-5 acc 56.250 (56.059)	lr 0.02488
Train [6][1190/3239]	Time 0.598 (0.836)	Data Time 0.001 (0.015)	Loss 3.9360 (3.9317)	Entropy 1.74901 (1.75836)	Top-1 acc 33.203 (32.127)	Top-5 acc 52.734 (56.058)	lr 0.02488
Train [6][1200/3239]	Time 0.502 (0.836)	Data Time 0.001 (0.015)	Loss 3.9785 (3.9315)	Entropy 1.74898 (1.75828)	Top-1 acc 34.766 (32.139)	Top-5 acc 56.250 (56.063)	lr 0.02488
Train [6][1210/3239]	Time 0.634 (0.835)	Data Time 0.001 (0.015)	Loss 3.9793 (3.9312)	Entropy 1.74898 (1.75820)	Top-1 acc 32.812 (32.148)	Top-5 acc 53.906 (56.069)	lr 0.02488
Train [6][1220/3239]	Time 0.592 (0.835)	Data Time 0.003 (0.015)	Loss 4.1193 (3.9311)	Entropy 1.74877 (1.75813)	Top-1 acc 31.250 (32.150)	Top-5 acc 53.516 (56.075)	lr 0.02488
Train [6][1230/3239]	Time 0.539 (0.835)	Data Time 0.001 (0.015)	Loss 3.9285 (3.9314)	Entropy 1.74874 (1.75805)	Top-1 acc 33.203 (32.139)	Top-5 acc 55.078 (56.072)	lr 0.02488
Train [6][1240/3239]	Time 0.572 (0.835)	Data Time 0.001 (0.015)	Loss 3.7399 (3.9313)	Entropy 1.74866 (1.75798)	Top-1 acc 35.547 (32.134)	Top-5 acc 59.375 (56.072)	lr 0.02488
Train [6][1250/3239]	Time 0.553 (0.834)	Data Time 0.001 (0.015)	Loss 3.8814 (3.9310)	Entropy 1.74870 (1.75790)	Top-1 acc 31.250 (32.135)	Top-5 acc 57.031 (56.075)	lr 0.02488
Train [6][1260/3239]	Time 0.558 (0.834)	Data Time 0.001 (0.014)	Loss 3.7666 (3.9309)	Entropy 1.74842 (1.75783)	Top-1 acc 37.500 (32.142)	Top-5 acc 60.156 (56.081)	lr 0.02488
Train [6][1270/3239]	Time 0.487 (0.834)	Data Time 0.001 (0.014)	Loss 3.6531 (3.9308)	Entropy 1.74823 (1.75775)	Top-1 acc 35.547 (32.141)	Top-5 acc 60.547 (56.083)	lr 0.02488
Train [6][1280/3239]	Time 0.550 (0.833)	Data Time 0.001 (0.014)	Loss 3.8971 (3.9306)	Entropy 1.74806 (1.75768)	Top-1 acc 31.250 (32.139)	Top-5 acc 55.078 (56.091)	lr 0.02488
Train [6][1290/3239]	Time 0.517 (0.833)	Data Time 0.001 (0.014)	Loss 4.0435 (3.9311)	Entropy 1.74793 (1.75760)	Top-1 acc 28.906 (32.135)	Top-5 acc 53.906 (56.079)	lr 0.02488
Train [6][1300/3239]	Time 0.589 (0.833)	Data Time 0.032 (0.014)	Loss 3.8236 (3.9311)	Entropy 1.74771 (1.75753)	Top-1 acc 32.422 (32.146)	Top-5 acc 58.594 (56.080)	lr 0.02488
Train [6][1310/3239]	Time 0.512 (0.832)	Data Time 0.001 (0.014)	Loss 3.8767 (3.9310)	Entropy 1.74753 (1.75745)	Top-1 acc 33.594 (32.146)	Top-5 acc 56.250 (56.085)	lr 0.02488
Train [6][1320/3239]	Time 0.525 (0.832)	Data Time 0.001 (0.014)	Loss 4.0388 (3.9311)	Entropy 1.74749 (1.75738)	Top-1 acc 28.125 (32.142)	Top-5 acc 51.172 (56.084)	lr 0.02487
Train [6][1330/3239]	Time 0.512 (0.832)	Data Time 0.001 (0.014)	Loss 3.9749 (3.9313)	Entropy 1.74738 (1.75730)	Top-1 acc 35.156 (32.139)	Top-5 acc 55.859 (56.082)	lr 0.02487
Train [6][1340/3239]	Time 0.544 (0.832)	Data Time 0.001 (0.014)	Loss 3.9140 (3.9315)	Entropy 1.74707 (1.75723)	Top-1 acc 31.250 (32.131)	Top-5 acc 54.297 (56.088)	lr 0.02487
Train [6][1350/3239]	Time 0.565 (0.832)	Data Time 0.001 (0.014)	Loss 4.0577 (3.9311)	Entropy 1.74714 (1.75715)	Top-1 acc 30.859 (32.142)	Top-5 acc 52.734 (56.102)	lr 0.02487
Train [6][1360/3239]	Time 0.515 (0.831)	Data Time 0.001 (0.014)	Loss 3.8540 (3.9310)	Entropy 1.74697 (1.75708)	Top-1 acc 36.719 (32.154)	Top-5 acc 61.328 (56.110)	lr 0.02487
Train [6][1370/3239]	Time 0.593 (0.831)	Data Time 0.001 (0.014)	Loss 3.8219 (3.9309)	Entropy 1.74678 (1.75700)	Top-1 acc 34.375 (32.155)	Top-5 acc 55.859 (56.113)	lr 0.02487
Train [6][1380/3239]	Time 0.584 (0.830)	Data Time 0.001 (0.013)	Loss 4.0957 (3.9312)	Entropy 1.74669 (1.75693)	Top-1 acc 29.297 (32.151)	Top-5 acc 51.953 (56.109)	lr 0.02487
Train [6][1390/3239]	Time 0.530 (0.830)	Data Time 0.001 (0.013)	Loss 3.9301 (3.9308)	Entropy 1.74662 (1.75686)	Top-1 acc 33.984 (32.155)	Top-5 acc 56.250 (56.117)	lr 0.02487
Train [6][1400/3239]	Time 0.545 (0.830)	Data Time 0.001 (0.013)	Loss 3.9467 (3.9306)	Entropy 1.74652 (1.75678)	Top-1 acc 33.203 (32.164)	Top-5 acc 55.859 (56.116)	lr 0.02487
Train [6][1410/3239]	Time 0.529 (0.830)	Data Time 0.001 (0.013)	Loss 3.7501 (3.9304)	Entropy 1.74626 (1.75671)	Top-1 acc 38.281 (32.172)	Top-5 acc 57.031 (56.118)	lr 0.02487
Train [6][1420/3239]	Time 0.561 (0.829)	Data Time 0.002 (0.013)	Loss 3.9564 (3.9300)	Entropy 1.74604 (1.75664)	Top-1 acc 30.469 (32.177)	Top-5 acc 53.906 (56.116)	lr 0.02487
Train [6][1430/3239]	Time 0.571 (0.829)	Data Time 0.001 (0.013)	Loss 3.9533 (3.9298)	Entropy 1.74584 (1.75656)	Top-1 acc 33.203 (32.179)	Top-5 acc 57.422 (56.118)	lr 0.02487
Train [6][1440/3239]	Time 0.525 (0.829)	Data Time 0.001 (0.013)	Loss 3.8794 (3.9294)	Entropy 1.74563 (1.75649)	Top-1 acc 33.203 (32.183)	Top-5 acc 55.469 (56.127)	lr 0.02487
Train [6][1450/3239]	Time 0.701 (0.829)	Data Time 0.001 (0.013)	Loss 4.1020 (3.9295)	Entropy 1.74538 (1.75641)	Top-1 acc 32.812 (32.192)	Top-5 acc 55.469 (56.132)	lr 0.02487
Train [6][1460/3239]	Time 0.544 (0.840)	Data Time 0.002 (0.013)	Loss 3.8885 (3.9298)	Entropy 1.74508 (1.75633)	Top-1 acc 36.719 (32.190)	Top-5 acc 58.594 (56.129)	lr 0.02487
Train [6][1470/3239]	Time 0.521 (0.840)	Data Time 0.002 (0.013)	Loss 3.8993 (3.9301)	Entropy 1.74477 (1.75626)	Top-1 acc 29.688 (32.182)	Top-5 acc 54.297 (56.127)	lr 0.02487
Train [6][1480/3239]	Time 0.514 (0.840)	Data Time 0.001 (0.013)	Loss 4.0632 (3.9304)	Entropy 1.74463 (1.75618)	Top-1 acc 32.422 (32.182)	Top-5 acc 51.562 (56.119)	lr 0.02487
Train [6][1490/3239]	Time 0.593 (0.840)	Data Time 0.001 (0.013)	Loss 3.7774 (3.9301)	Entropy 1.74457 (1.75610)	Top-1 acc 36.328 (32.180)	Top-5 acc 57.422 (56.125)	lr 0.02487
Train [6][1500/3239]	Time 0.588 (0.839)	Data Time 0.003 (0.013)	Loss 3.7295 (3.9298)	Entropy 1.74450 (1.75603)	Top-1 acc 35.938 (32.182)	Top-5 acc 61.328 (56.134)	lr 0.02487
Train [6][1510/3239]	Time 0.511 (0.839)	Data Time 0.001 (0.013)	Loss 3.8750 (3.9296)	Entropy 1.74421 (1.75595)	Top-1 acc 32.422 (32.180)	Top-5 acc 57.031 (56.135)	lr 0.02487
Train [6][1520/3239]	Time 0.550 (0.838)	Data Time 0.003 (0.012)	Loss 3.7324 (3.9293)	Entropy 1.74391 (1.75587)	Top-1 acc 34.766 (32.189)	Top-5 acc 58.594 (56.134)	lr 0.02487
Train [6][1530/3239]	Time 0.548 (0.838)	Data Time 0.001 (0.012)	Loss 4.0917 (3.9293)	Entropy 1.74374 (1.75579)	Top-1 acc 28.906 (32.190)	Top-5 acc 53.125 (56.133)	lr 0.02487
Train [6][1540/3239]	Time 0.556 (0.838)	Data Time 0.001 (0.012)	Loss 3.8445 (3.9290)	Entropy 1.74359 (1.75571)	Top-1 acc 32.422 (32.195)	Top-5 acc 56.250 (56.142)	lr 0.02487
Train [6][1550/3239]	Time 0.572 (0.838)	Data Time 0.001 (0.012)	Loss 4.0121 (3.9289)	Entropy 1.74345 (1.75564)	Top-1 acc 28.516 (32.198)	Top-5 acc 55.469 (56.139)	lr 0.02487
Train [6][1560/3239]	Time 0.569 (0.838)	Data Time 0.001 (0.012)	Loss 3.9449 (3.9286)	Entropy 1.74313 (1.75556)	Top-1 acc 34.375 (32.209)	Top-5 acc 57.031 (56.146)	lr 0.02487
Train [6][1570/3239]	Time 0.658 (0.837)	Data Time 0.001 (0.012)	Loss 3.9438 (3.9289)	Entropy 1.74262 (1.75548)	Top-1 acc 31.641 (32.202)	Top-5 acc 56.250 (56.136)	lr 0.02487
Train [6][1580/3239]	Time 0.605 (0.837)	Data Time 0.001 (0.012)	Loss 3.9173 (3.9289)	Entropy 1.74219 (1.75539)	Top-1 acc 32.031 (32.201)	Top-5 acc 57.031 (56.140)	lr 0.02487
Train [6][1590/3239]	Time 0.541 (0.837)	Data Time 0.002 (0.012)	Loss 3.7932 (3.9290)	Entropy 1.74220 (1.75531)	Top-1 acc 35.156 (32.200)	Top-5 acc 58.594 (56.142)	lr 0.02487
Train [6][1600/3239]	Time 0.518 (0.837)	Data Time 0.001 (0.012)	Loss 3.9527 (3.9286)	Entropy 1.74192 (1.75523)	Top-1 acc 31.641 (32.205)	Top-5 acc 51.172 (56.154)	lr 0.02487
Train [6][1610/3239]	Time 0.520 (0.837)	Data Time 0.001 (0.012)	Loss 3.8268 (3.9287)	Entropy 1.74204 (1.75515)	Top-1 acc 34.766 (32.199)	Top-5 acc 58.594 (56.145)	lr 0.02487
Train [6][1620/3239]	Time 0.541 (0.836)	Data Time 0.001 (0.012)	Loss 3.8367 (3.9285)	Entropy 1.74203 (1.75506)	Top-1 acc 35.156 (32.205)	Top-5 acc 59.766 (56.151)	lr 0.02487
Train [6][1630/3239]	Time 0.501 (0.836)	Data Time 0.001 (0.012)	Loss 3.6668 (3.9284)	Entropy 1.74180 (1.75498)	Top-1 acc 36.719 (32.214)	Top-5 acc 62.500 (56.157)	lr 0.02487
Train [6][1640/3239]	Time 0.555 (0.836)	Data Time 0.001 (0.012)	Loss 3.8527 (3.9287)	Entropy 1.74165 (1.75490)	Top-1 acc 35.547 (32.210)	Top-5 acc 57.812 (56.149)	lr 0.02487
Train [6][1650/3239]	Time 0.548 (0.836)	Data Time 0.001 (0.012)	Loss 3.9596 (3.9288)	Entropy 1.74180 (1.75482)	Top-1 acc 30.859 (32.203)	Top-5 acc 52.734 (56.145)	lr 0.02487
Train [6][1660/3239]	Time 0.399 (0.835)	Data Time 0.001 (0.012)	Loss 3.8611 (3.9290)	Entropy 1.74180 (1.75474)	Top-1 acc 33.203 (32.199)	Top-5 acc 58.594 (56.148)	lr 0.02487
Train [6][1670/3239]	Time 0.645 (0.835)	Data Time 0.001 (0.012)	Loss 3.7868 (3.9290)	Entropy 1.74158 (1.75467)	Top-1 acc 34.766 (32.196)	Top-5 acc 62.891 (56.152)	lr 0.02487
Train [6][1680/3239]	Time 0.572 (0.835)	Data Time 0.001 (0.012)	Loss 4.1386 (3.9288)	Entropy 1.74138 (1.75459)	Top-1 acc 28.516 (32.196)	Top-5 acc 54.297 (56.164)	lr 0.02487
Train [6][1690/3239]	Time 0.518 (0.834)	Data Time 0.001 (0.011)	Loss 3.9339 (3.9288)	Entropy 1.74119 (1.75451)	Top-1 acc 33.594 (32.200)	Top-5 acc 58.203 (56.163)	lr 0.02487
Train [6][1700/3239]	Time 0.484 (0.834)	Data Time 0.001 (0.011)	Loss 3.8944 (3.9284)	Entropy 1.74098 (1.75443)	Top-1 acc 31.641 (32.204)	Top-5 acc 55.859 (56.171)	lr 0.02487
Train [6][1710/3239]	Time 0.598 (0.834)	Data Time 0.001 (0.011)	Loss 3.9976 (3.9285)	Entropy 1.74085 (1.75435)	Top-1 acc 31.250 (32.202)	Top-5 acc 54.688 (56.169)	lr 0.02487
Train [6][1720/3239]	Time 0.533 (0.834)	Data Time 0.001 (0.011)	Loss 3.8778 (3.9285)	Entropy 1.74059 (1.75427)	Top-1 acc 33.203 (32.204)	Top-5 acc 57.812 (56.173)	lr 0.02487
Train [6][1730/3239]	Time 0.525 (0.833)	Data Time 0.001 (0.011)	Loss 3.9421 (3.9286)	Entropy 1.74038 (1.75419)	Top-1 acc 29.297 (32.202)	Top-5 acc 55.859 (56.162)	lr 0.02487
Train [6][1740/3239]	Time 0.527 (0.833)	Data Time 0.001 (0.011)	Loss 4.0332 (3.9285)	Entropy 1.74013 (1.75411)	Top-1 acc 27.734 (32.200)	Top-5 acc 53.125 (56.166)	lr 0.02487
Train [6][1750/3239]	Time 0.563 (0.833)	Data Time 0.001 (0.011)	Loss 4.0781 (3.9287)	Entropy 1.73982 (1.75403)	Top-1 acc 28.125 (32.195)	Top-5 acc 50.781 (56.168)	lr 0.02487
Train [6][1760/3239]	Time 0.552 (0.833)	Data Time 0.001 (0.011)	Loss 3.7886 (3.9284)	Entropy 1.73935 (1.75395)	Top-1 acc 32.812 (32.202)	Top-5 acc 58.594 (56.169)	lr 0.02487
Train [6][1770/3239]	Time 0.417 (0.832)	Data Time 0.001 (0.011)	Loss 3.9440 (3.9284)	Entropy 1.73915 (1.75387)	Top-1 acc 32.422 (32.201)	Top-5 acc 55.469 (56.168)	lr 0.02487
Train [6][1780/3239]	Time 0.516 (0.832)	Data Time 0.001 (0.011)	Loss 4.0280 (3.9283)	Entropy 1.73898 (1.75379)	Top-1 acc 31.641 (32.207)	Top-5 acc 51.953 (56.168)	lr 0.02487
Train [6][1790/3239]	Time 0.577 (0.832)	Data Time 0.001 (0.011)	Loss 4.0985 (3.9283)	Entropy 1.73879 (1.75370)	Top-1 acc 32.422 (32.214)	Top-5 acc 49.219 (56.164)	lr 0.02487
Train [6][1800/3239]	Time 0.515 (0.832)	Data Time 0.001 (0.011)	Loss 3.9134 (3.9282)	Entropy 1.73852 (1.75362)	Top-1 acc 35.156 (32.210)	Top-5 acc 57.422 (56.168)	lr 0.02487
Train [6][1810/3239]	Time 0.566 (0.832)	Data Time 0.001 (0.011)	Loss 3.8450 (3.9281)	Entropy 1.73819 (1.75354)	Top-1 acc 32.812 (32.217)	Top-5 acc 57.812 (56.167)	lr 0.02487
Train [6][1820/3239]	Time 0.588 (0.832)	Data Time 0.001 (0.011)	Loss 3.8188 (3.9279)	Entropy 1.73825 (1.75345)	Top-1 acc 38.281 (32.223)	Top-5 acc 57.422 (56.174)	lr 0.02487
Train [6][1830/3239]	Time 0.568 (0.831)	Data Time 0.001 (0.011)	Loss 4.0378 (3.9282)	Entropy 1.73793 (1.75337)	Top-1 acc 31.641 (32.220)	Top-5 acc 51.953 (56.171)	lr 0.02487
Train [6][1840/3239]	Time 0.617 (0.831)	Data Time 0.001 (0.011)	Loss 4.1001 (3.9281)	Entropy 1.73763 (1.75328)	Top-1 acc 30.078 (32.218)	Top-5 acc 53.516 (56.170)	lr 0.02487
Train [6][1850/3239]	Time 0.592 (0.831)	Data Time 0.001 (0.011)	Loss 3.9643 (3.9282)	Entropy 1.73759 (1.75320)	Top-1 acc 30.078 (32.218)	Top-5 acc 56.250 (56.163)	lr 0.02487
Train [6][1860/3239]	Time 0.527 (0.831)	Data Time 0.001 (0.011)	Loss 3.9449 (3.9282)	Entropy 1.73746 (1.75311)	Top-1 acc 29.297 (32.219)	Top-5 acc 57.812 (56.161)	lr 0.02487
Train [6][1870/3239]	Time 0.584 (0.830)	Data Time 0.001 (0.011)	Loss 3.7891 (3.9277)	Entropy 1.73729 (1.75303)	Top-1 acc 37.500 (32.233)	Top-5 acc 62.109 (56.172)	lr 0.02487
Train [6][1880/3239]	Time 0.557 (0.830)	Data Time 0.001 (0.011)	Loss 3.8112 (3.9277)	Entropy 1.73699 (1.75295)	Top-1 acc 35.156 (32.227)	Top-5 acc 58.203 (56.173)	lr 0.02487
Train [6][1890/3239]	Time 0.630 (0.830)	Data Time 0.001 (0.011)	Loss 4.0756 (3.9277)	Entropy 1.73704 (1.75286)	Top-1 acc 32.812 (32.232)	Top-5 acc 51.953 (56.171)	lr 0.02487
Train [6][1900/3239]	Time 0.545 (0.830)	Data Time 0.001 (0.011)	Loss 3.9829 (3.9275)	Entropy 1.73693 (1.75278)	Top-1 acc 30.859 (32.234)	Top-5 acc 55.078 (56.175)	lr 0.02487
Train [6][1910/3239]	Time 0.554 (0.829)	Data Time 0.001 (0.010)	Loss 4.2232 (3.9276)	Entropy 1.73692 (1.75270)	Top-1 acc 27.734 (32.231)	Top-5 acc 49.609 (56.169)	lr 0.02487
Train [6][1920/3239]	Time 0.588 (0.829)	Data Time 0.001 (0.010)	Loss 3.8925 (3.9277)	Entropy 1.73693 (1.75261)	Top-1 acc 32.812 (32.235)	Top-5 acc 55.469 (56.164)	lr 0.02487
Train [6][1930/3239]	Time 0.505 (0.829)	Data Time 0.001 (0.010)	Loss 3.8929 (3.9280)	Entropy 1.73673 (1.75253)	Top-1 acc 33.203 (32.236)	Top-5 acc 55.078 (56.155)	lr 0.02487
Train [6][1940/3239]	Time 0.580 (0.829)	Data Time 0.001 (0.010)	Loss 3.8127 (3.9277)	Entropy 1.73642 (1.75245)	Top-1 acc 37.891 (32.234)	Top-5 acc 58.984 (56.160)	lr 0.02487
Train [6][1950/3239]	Time 0.576 (0.829)	Data Time 0.001 (0.010)	Loss 3.9693 (3.9274)	Entropy 1.73629 (1.75237)	Top-1 acc 33.984 (32.244)	Top-5 acc 57.422 (56.168)	lr 0.02487
Train [6][1960/3239]	Time 0.498 (0.829)	Data Time 0.001 (0.010)	Loss 3.7787 (3.9275)	Entropy 1.73631 (1.75229)	Top-1 acc 33.594 (32.244)	Top-5 acc 56.250 (56.167)	lr 0.02487
Train [6][1970/3239]	Time 0.530 (0.829)	Data Time 0.001 (0.010)	Loss 3.8516 (3.9271)	Entropy 1.73624 (1.75220)	Top-1 acc 33.594 (32.245)	Top-5 acc 55.469 (56.168)	lr 0.02487
Train [6][1980/3239]	Time 0.585 (0.828)	Data Time 0.001 (0.010)	Loss 3.9099 (3.9271)	Entropy 1.73588 (1.75212)	Top-1 acc 30.859 (32.244)	Top-5 acc 55.859 (56.171)	lr 0.02487
Train [6][1990/3239]	Time 0.490 (0.828)	Data Time 0.001 (0.010)	Loss 3.8526 (3.9269)	Entropy 1.73574 (1.75204)	Top-1 acc 34.375 (32.251)	Top-5 acc 56.250 (56.176)	lr 0.02487
Train [6][2000/3239]	Time 0.600 (0.828)	Data Time 0.001 (0.010)	Loss 3.7936 (3.9269)	Entropy 1.73568 (1.75196)	Top-1 acc 30.859 (32.252)	Top-5 acc 57.031 (56.179)	lr 0.02487
Train [6][2010/3239]	Time 0.691 (0.828)	Data Time 0.001 (0.010)	Loss 3.8160 (3.9271)	Entropy 1.73524 (1.75188)	Top-1 acc 36.328 (32.248)	Top-5 acc 60.156 (56.174)	lr 0.02486
Train [6][2020/3239]	Time 0.572 (0.828)	Data Time 0.001 (0.010)	Loss 3.9268 (3.9270)	Entropy 1.73508 (1.75180)	Top-1 acc 30.469 (32.252)	Top-5 acc 57.422 (56.179)	lr 0.02486
Train [6][2030/3239]	Time 0.560 (0.828)	Data Time 0.001 (0.010)	Loss 4.0226 (3.9271)	Entropy 1.73500 (1.75171)	Top-1 acc 36.719 (32.253)	Top-5 acc 55.078 (56.175)	lr 0.02486
Train [6][2040/3239]	Time 0.486 (0.827)	Data Time 0.001 (0.010)	Loss 3.6636 (3.9270)	Entropy 1.73494 (1.75163)	Top-1 acc 41.406 (32.257)	Top-5 acc 63.672 (56.178)	lr 0.02486
Train [6][2050/3239]	Time 0.536 (0.827)	Data Time 0.002 (0.010)	Loss 4.0194 (3.9269)	Entropy 1.73484 (1.75155)	Top-1 acc 30.469 (32.265)	Top-5 acc 52.734 (56.177)	lr 0.02486
Train [6][2060/3239]	Time 0.518 (0.827)	Data Time 0.001 (0.010)	Loss 3.9189 (3.9270)	Entropy 1.73467 (1.75147)	Top-1 acc 33.203 (32.259)	Top-5 acc 54.688 (56.172)	lr 0.02486
Train [6][2070/3239]	Time 0.497 (0.827)	Data Time 0.001 (0.010)	Loss 3.9012 (3.9270)	Entropy 1.73448 (1.75139)	Top-1 acc 34.766 (32.259)	Top-5 acc 54.297 (56.173)	lr 0.02486
Train [6][2080/3239]	Time 0.567 (0.827)	Data Time 0.001 (0.010)	Loss 3.9555 (3.9270)	Entropy 1.73428 (1.75131)	Top-1 acc 28.906 (32.256)	Top-5 acc 53.906 (56.169)	lr 0.02486
Train [6][2090/3239]	Time 0.604 (0.827)	Data Time 0.001 (0.010)	Loss 3.7404 (3.9266)	Entropy 1.73402 (1.75122)	Top-1 acc 36.719 (32.265)	Top-5 acc 60.938 (56.180)	lr 0.02486
Train [6][2100/3239]	Time 0.581 (0.827)	Data Time 0.001 (0.010)	Loss 3.9050 (3.9265)	Entropy 1.73381 (1.75114)	Top-1 acc 31.250 (32.265)	Top-5 acc 55.078 (56.183)	lr 0.02486
Train [6][2110/3239]	Time 0.635 (0.835)	Data Time 0.004 (0.010)	Loss 4.0224 (3.9263)	Entropy 1.73365 (1.75106)	Top-1 acc 28.906 (32.270)	Top-5 acc 51.172 (56.182)	lr 0.02486
Train [6][2120/3239]	Time 0.501 (0.835)	Data Time 0.002 (0.010)	Loss 3.8204 (3.9265)	Entropy 1.73347 (1.75098)	Top-1 acc 32.031 (32.266)	Top-5 acc 59.766 (56.179)	lr 0.02486
Train [6][2130/3239]	Time 0.643 (0.835)	Data Time 0.002 (0.010)	Loss 3.9215 (3.9263)	Entropy 1.73346 (1.75089)	Top-1 acc 32.031 (32.275)	Top-5 acc 52.734 (56.183)	lr 0.02486
Train [6][2140/3239]	Time 0.599 (0.835)	Data Time 0.001 (0.010)	Loss 3.9070 (3.9263)	Entropy 1.73321 (1.75081)	Top-1 acc 30.078 (32.278)	Top-5 acc 55.859 (56.187)	lr 0.02486
Train [6][2150/3239]	Time 0.533 (0.835)	Data Time 0.001 (0.010)	Loss 3.9690 (3.9262)	Entropy 1.73291 (1.75073)	Top-1 acc 33.594 (32.273)	Top-5 acc 56.250 (56.186)	lr 0.02486
Train [6][2160/3239]	Time 0.564 (0.834)	Data Time 0.001 (0.010)	Loss 4.1778 (3.9265)	Entropy 1.73283 (1.75065)	Top-1 acc 26.172 (32.273)	Top-5 acc 50.391 (56.181)	lr 0.02486
Train [6][2170/3239]	Time 0.499 (0.834)	Data Time 0.001 (0.010)	Loss 3.7309 (3.9264)	Entropy 1.73272 (1.75057)	Top-1 acc 37.891 (32.278)	Top-5 acc 60.547 (56.180)	lr 0.02486
Train [6][2180/3239]	Time 0.597 (0.834)	Data Time 0.001 (0.010)	Loss 3.9241 (3.9262)	Entropy 1.73261 (1.75048)	Top-1 acc 32.812 (32.283)	Top-5 acc 56.250 (56.186)	lr 0.02486
Train [6][2190/3239]	Time 0.544 (0.833)	Data Time 0.001 (0.009)	Loss 3.7318 (3.9259)	Entropy 1.73228 (1.75040)	Top-1 acc 33.594 (32.288)	Top-5 acc 58.984 (56.190)	lr 0.02486
Train [6][2200/3239]	Time 0.440 (0.833)	Data Time 0.001 (0.009)	Loss 3.9085 (3.9259)	Entropy 1.73214 (1.75032)	Top-1 acc 34.766 (32.289)	Top-5 acc 57.812 (56.190)	lr 0.02486
Train [6][2210/3239]	Time 0.510 (0.833)	Data Time 0.001 (0.009)	Loss 3.9415 (3.9261)	Entropy 1.73194 (1.75024)	Top-1 acc 33.594 (32.286)	Top-5 acc 57.422 (56.185)	lr 0.02486
Train [6][2220/3239]	Time 0.589 (0.833)	Data Time 0.001 (0.009)	Loss 3.7514 (3.9260)	Entropy 1.73166 (1.75015)	Top-1 acc 37.500 (32.288)	Top-5 acc 57.812 (56.187)	lr 0.02486
Train [6][2230/3239]	Time 0.516 (0.833)	Data Time 0.001 (0.009)	Loss 3.9517 (3.9263)	Entropy 1.73162 (1.75007)	Top-1 acc 30.859 (32.282)	Top-5 acc 56.250 (56.183)	lr 0.02486
Train [6][2240/3239]	Time 0.530 (0.833)	Data Time 0.001 (0.009)	Loss 3.7800 (3.9261)	Entropy 1.73160 (1.74999)	Top-1 acc 33.594 (32.283)	Top-5 acc 58.594 (56.186)	lr 0.02486
Train [6][2250/3239]	Time 0.676 (0.833)	Data Time 0.001 (0.009)	Loss 3.8772 (3.9260)	Entropy 1.73141 (1.74991)	Top-1 acc 34.766 (32.283)	Top-5 acc 57.422 (56.184)	lr 0.02486
Train [6][2260/3239]	Time 0.550 (0.833)	Data Time 0.001 (0.009)	Loss 3.9825 (3.9259)	Entropy 1.73137 (1.74982)	Top-1 acc 34.766 (32.288)	Top-5 acc 59.766 (56.189)	lr 0.02486
Train [6][2270/3239]	Time 0.584 (0.833)	Data Time 0.001 (0.009)	Loss 3.8976 (3.9259)	Entropy 1.73118 (1.74974)	Top-1 acc 30.859 (32.289)	Top-5 acc 55.469 (56.188)	lr 0.02486
Train [6][2280/3239]	Time 0.510 (0.832)	Data Time 0.001 (0.009)	Loss 3.9173 (3.9259)	Entropy 1.73103 (1.74966)	Top-1 acc 33.984 (32.287)	Top-5 acc 55.078 (56.183)	lr 0.02486
Train [6][2290/3239]	Time 0.599 (0.832)	Data Time 0.001 (0.009)	Loss 3.8849 (3.9260)	Entropy 1.73080 (1.74958)	Top-1 acc 32.812 (32.283)	Top-5 acc 55.078 (56.178)	lr 0.02486
Train [6][2300/3239]	Time 0.622 (0.832)	Data Time 0.001 (0.009)	Loss 3.8965 (3.9259)	Entropy 1.73062 (1.74950)	Top-1 acc 30.859 (32.286)	Top-5 acc 55.078 (56.184)	lr 0.02486
Train [6][2310/3239]	Time 0.615 (0.832)	Data Time 0.001 (0.009)	Loss 3.7320 (3.9258)	Entropy 1.73031 (1.74941)	Top-1 acc 37.109 (32.290)	Top-5 acc 61.719 (56.183)	lr 0.02486
Train [6][2320/3239]	Time 0.552 (0.832)	Data Time 0.002 (0.009)	Loss 3.9231 (3.9258)	Entropy 1.73015 (1.74933)	Top-1 acc 32.812 (32.289)	Top-5 acc 56.250 (56.180)	lr 0.02486
Train [6][2330/3239]	Time 0.383 (0.832)	Data Time 0.002 (0.009)	Loss 4.0672 (3.9257)	Entropy 1.72994 (1.74925)	Top-1 acc 32.812 (32.292)	Top-5 acc 53.516 (56.182)	lr 0.02486
Train [6][2340/3239]	Time 0.539 (0.832)	Data Time 0.002 (0.009)	Loss 3.9560 (3.9257)	Entropy 1.72975 (1.74917)	Top-1 acc 31.250 (32.291)	Top-5 acc 54.688 (56.179)	lr 0.02486
Train [6][2350/3239]	Time 0.645 (0.831)	Data Time 0.001 (0.009)	Loss 3.9941 (3.9258)	Entropy 1.72942 (1.74908)	Top-1 acc 30.078 (32.287)	Top-5 acc 51.562 (56.178)	lr 0.02486
Train [6][2360/3239]	Time 0.532 (0.831)	Data Time 0.001 (0.009)	Loss 3.7829 (3.9254)	Entropy 1.72919 (1.74900)	Top-1 acc 31.641 (32.296)	Top-5 acc 57.812 (56.187)	lr 0.02486
Train [6][2370/3239]	Time 0.488 (0.831)	Data Time 0.002 (0.009)	Loss 3.8316 (3.9253)	Entropy 1.72900 (1.74892)	Top-1 acc 36.719 (32.300)	Top-5 acc 56.641 (56.188)	lr 0.02486
Train [6][2380/3239]	Time 0.553 (0.831)	Data Time 0.001 (0.009)	Loss 3.8606 (3.9252)	Entropy 1.72862 (1.74883)	Top-1 acc 31.641 (32.300)	Top-5 acc 56.250 (56.190)	lr 0.02486
Train [6][2390/3239]	Time 0.549 (0.831)	Data Time 0.001 (0.009)	Loss 3.6446 (3.9250)	Entropy 1.72866 (1.74875)	Top-1 acc 36.328 (32.308)	Top-5 acc 63.281 (56.196)	lr 0.02486
Train [6][2400/3239]	Time 0.648 (0.830)	Data Time 0.001 (0.009)	Loss 3.6900 (3.9250)	Entropy 1.72829 (1.74866)	Top-1 acc 39.062 (32.313)	Top-5 acc 60.547 (56.196)	lr 0.02486
Train [6][2410/3239]	Time 0.486 (0.830)	Data Time 0.001 (0.009)	Loss 3.7384 (3.9247)	Entropy 1.72809 (1.74858)	Top-1 acc 36.719 (32.320)	Top-5 acc 61.328 (56.207)	lr 0.02486
Train [6][2420/3239]	Time 0.428 (0.830)	Data Time 0.001 (0.009)	Loss 4.0260 (3.9248)	Entropy 1.72788 (1.74849)	Top-1 acc 27.734 (32.313)	Top-5 acc 53.906 (56.205)	lr 0.02486
Train [6][2430/3239]	Time 0.550 (0.830)	Data Time 0.001 (0.009)	Loss 4.1005 (3.9250)	Entropy 1.72800 (1.74841)	Top-1 acc 30.469 (32.306)	Top-5 acc 50.000 (56.198)	lr 0.02486
Train [6][2440/3239]	Time 0.544 (0.830)	Data Time 0.001 (0.009)	Loss 3.7132 (3.9249)	Entropy 1.72801 (1.74833)	Top-1 acc 39.453 (32.313)	Top-5 acc 61.719 (56.201)	lr 0.02486
Train [6][2450/3239]	Time 0.586 (0.830)	Data Time 0.001 (0.009)	Loss 4.0867 (3.9246)	Entropy 1.72797 (1.74824)	Top-1 acc 30.469 (32.318)	Top-5 acc 51.172 (56.206)	lr 0.02486
Train [6][2460/3239]	Time 0.551 (0.830)	Data Time 0.001 (0.009)	Loss 3.8695 (3.9245)	Entropy 1.72781 (1.74816)	Top-1 acc 35.547 (32.317)	Top-5 acc 58.984 (56.208)	lr 0.02486
Train [6][2470/3239]	Time 0.634 (0.830)	Data Time 0.001 (0.009)	Loss 3.9244 (3.9245)	Entropy 1.72747 (1.74808)	Top-1 acc 33.984 (32.318)	Top-5 acc 58.594 (56.207)	lr 0.02486
Train [6][2480/3239]	Time 0.539 (0.830)	Data Time 0.002 (0.009)	Loss 3.7706 (3.9244)	Entropy 1.72710 (1.74799)	Top-1 acc 37.500 (32.322)	Top-5 acc 62.500 (56.214)	lr 0.02486
Train [6][2490/3239]	Time 0.603 (0.829)	Data Time 0.001 (0.009)	Loss 3.9336 (3.9246)	Entropy 1.72699 (1.74791)	Top-1 acc 28.516 (32.315)	Top-5 acc 57.031 (56.213)	lr 0.02486
Train [6][2500/3239]	Time 0.526 (0.829)	Data Time 0.001 (0.009)	Loss 4.1078 (3.9247)	Entropy 1.72677 (1.74783)	Top-1 acc 28.516 (32.313)	Top-5 acc 51.953 (56.210)	lr 0.02486
Train [6][2510/3239]	Time 0.563 (0.829)	Data Time 0.001 (0.009)	Loss 3.7487 (3.9245)	Entropy 1.72657 (1.74774)	Top-1 acc 35.156 (32.318)	Top-5 acc 62.500 (56.212)	lr 0.02486
Train [6][2520/3239]	Time 0.623 (0.829)	Data Time 0.003 (0.009)	Loss 3.7391 (3.9243)	Entropy 1.72637 (1.74766)	Top-1 acc 37.109 (32.323)	Top-5 acc 62.109 (56.222)	lr 0.02486
Train [6][2530/3239]	Time 0.543 (0.829)	Data Time 0.002 (0.009)	Loss 3.8768 (3.9241)	Entropy 1.72610 (1.74757)	Top-1 acc 31.641 (32.323)	Top-5 acc 57.031 (56.229)	lr 0.02486
Train [6][2540/3239]	Time 0.574 (0.829)	Data Time 0.001 (0.009)	Loss 3.7732 (3.9241)	Entropy 1.72582 (1.74749)	Top-1 acc 35.547 (32.326)	Top-5 acc 58.594 (56.229)	lr 0.02486
Train [6][2550/3239]	Time 0.580 (0.828)	Data Time 0.001 (0.009)	Loss 3.9526 (3.9243)	Entropy 1.72550 (1.74740)	Top-1 acc 28.906 (32.321)	Top-5 acc 57.812 (56.227)	lr 0.02486
Train [6][2560/3239]	Time 0.582 (0.828)	Data Time 0.001 (0.009)	Loss 3.7804 (3.9241)	Entropy 1.72554 (1.74732)	Top-1 acc 35.547 (32.324)	Top-5 acc 60.547 (56.230)	lr 0.02486
Train [6][2570/3239]	Time 0.591 (0.828)	Data Time 0.001 (0.009)	Loss 3.7886 (3.9241)	Entropy 1.72551 (1.74723)	Top-1 acc 41.016 (32.331)	Top-5 acc 59.375 (56.230)	lr 0.02486
Train [6][2580/3239]	Time 0.549 (0.828)	Data Time 0.001 (0.008)	Loss 3.5828 (3.9239)	Entropy 1.72543 (1.74715)	Top-1 acc 43.750 (32.337)	Top-5 acc 67.578 (56.237)	lr 0.02486
Train [6][2590/3239]	Time 0.605 (0.828)	Data Time 0.001 (0.008)	Loss 3.7228 (3.9236)	Entropy 1.72506 (1.74706)	Top-1 acc 37.109 (32.338)	Top-5 acc 58.594 (56.241)	lr 0.02486
Train [6][2600/3239]	Time 0.488 (0.828)	Data Time 0.001 (0.008)	Loss 3.8515 (3.9234)	Entropy 1.72506 (1.74698)	Top-1 acc 32.812 (32.345)	Top-5 acc 55.859 (56.248)	lr 0.02486
Train [6][2610/3239]	Time 0.519 (0.828)	Data Time 0.001 (0.008)	Loss 3.7981 (3.9233)	Entropy 1.72494 (1.74689)	Top-1 acc 33.594 (32.345)	Top-5 acc 57.812 (56.246)	lr 0.02486
Train [6][2620/3239]	Time 0.643 (0.828)	Data Time 0.001 (0.008)	Loss 3.8852 (3.9235)	Entropy 1.72479 (1.74681)	Top-1 acc 31.641 (32.337)	Top-5 acc 58.203 (56.245)	lr 0.02486
Train [6][2630/3239]	Time 0.598 (0.828)	Data Time 0.001 (0.008)	Loss 4.0488 (3.9233)	Entropy 1.72469 (1.74673)	Top-1 acc 31.250 (32.346)	Top-5 acc 53.906 (56.250)	lr 0.02486
Train [6][2640/3239]	Time 0.543 (0.828)	Data Time 0.001 (0.008)	Loss 3.9631 (3.9233)	Entropy 1.72457 (1.74664)	Top-1 acc 33.203 (32.348)	Top-5 acc 57.031 (56.254)	lr 0.02486
Train [6][2650/3239]	Time 0.564 (0.828)	Data Time 0.001 (0.008)	Loss 3.8906 (3.9232)	Entropy 1.72429 (1.74656)	Top-1 acc 33.203 (32.350)	Top-5 acc 55.859 (56.256)	lr 0.02486
Train [6][2660/3239]	Time 0.531 (0.828)	Data Time 0.001 (0.008)	Loss 3.9179 (3.9231)	Entropy 1.72404 (1.74648)	Top-1 acc 31.641 (32.350)	Top-5 acc 56.250 (56.261)	lr 0.02486
Train [6][2670/3239]	Time 0.575 (0.828)	Data Time 0.001 (0.008)	Loss 3.9402 (3.9230)	Entropy 1.72382 (1.74639)	Top-1 acc 33.203 (32.348)	Top-5 acc 57.422 (56.264)	lr 0.02485
Train [6][2680/3239]	Time 0.564 (0.828)	Data Time 0.001 (0.008)	Loss 3.8412 (3.9229)	Entropy 1.72381 (1.74631)	Top-1 acc 33.203 (32.352)	Top-5 acc 57.031 (56.265)	lr 0.02485
Train [6][2690/3239]	Time 0.547 (0.827)	Data Time 0.001 (0.008)	Loss 3.9828 (3.9227)	Entropy 1.72377 (1.74622)	Top-1 acc 30.469 (32.355)	Top-5 acc 55.859 (56.268)	lr 0.02485
Train [6][2700/3239]	Time 0.520 (0.827)	Data Time 0.002 (0.008)	Loss 4.0084 (3.9227)	Entropy 1.72358 (1.74614)	Top-1 acc 31.641 (32.358)	Top-5 acc 57.031 (56.267)	lr 0.02485
Train [6][2710/3239]	Time 0.427 (0.827)	Data Time 0.001 (0.008)	Loss 4.1518 (3.9228)	Entropy 1.72307 (1.74606)	Top-1 acc 28.516 (32.360)	Top-5 acc 49.219 (56.267)	lr 0.02485
Train [6][2720/3239]	Time 0.544 (0.827)	Data Time 0.001 (0.008)	Loss 4.0206 (3.9227)	Entropy 1.72287 (1.74597)	Top-1 acc 32.422 (32.362)	Top-5 acc 52.344 (56.268)	lr 0.02485
Train [6][2730/3239]	Time 0.522 (0.827)	Data Time 0.001 (0.008)	Loss 3.8571 (3.9225)	Entropy 1.72279 (1.74589)	Top-1 acc 33.984 (32.367)	Top-5 acc 60.156 (56.274)	lr 0.02485
Train [6][2740/3239]	Time 0.554 (0.827)	Data Time 0.001 (0.008)	Loss 3.9815 (3.9225)	Entropy 1.72261 (1.74580)	Top-1 acc 30.859 (32.366)	Top-5 acc 58.203 (56.276)	lr 0.02485
Train [6][2750/3239]	Time 0.603 (0.827)	Data Time 0.003 (0.008)	Loss 3.8933 (3.9225)	Entropy 1.72256 (1.74572)	Top-1 acc 30.469 (32.366)	Top-5 acc 58.203 (56.275)	lr 0.02485
Train [6][2760/3239]	Time 0.658 (0.827)	Data Time 0.001 (0.008)	Loss 4.0967 (3.9227)	Entropy 1.72227 (1.74563)	Top-1 acc 25.781 (32.362)	Top-5 acc 51.562 (56.269)	lr 0.02485
Train [6][2770/3239]	Time 0.495 (0.833)	Data Time 0.002 (0.008)	Loss 3.8886 (3.9226)	Entropy 1.72208 (1.74555)	Top-1 acc 33.203 (32.364)	Top-5 acc 57.031 (56.269)	lr 0.02485
Train [6][2780/3239]	Time 0.550 (0.833)	Data Time 0.001 (0.008)	Loss 4.0852 (3.9229)	Entropy 1.72164 (1.74546)	Top-1 acc 30.859 (32.362)	Top-5 acc 53.125 (56.263)	lr 0.02485
Train [6][2790/3239]	Time 0.622 (0.833)	Data Time 0.001 (0.008)	Loss 3.8911 (3.9228)	Entropy 1.72131 (1.74538)	Top-1 acc 33.203 (32.367)	Top-5 acc 53.906 (56.265)	lr 0.02485
Train [6][2800/3239]	Time 0.541 (0.833)	Data Time 0.001 (0.008)	Loss 3.8876 (3.9226)	Entropy 1.72116 (1.74529)	Top-1 acc 28.516 (32.372)	Top-5 acc 55.469 (56.270)	lr 0.02485
Train [6][2810/3239]	Time 0.589 (0.832)	Data Time 0.001 (0.008)	Loss 3.8156 (3.9224)	Entropy 1.72092 (1.74521)	Top-1 acc 32.422 (32.374)	Top-5 acc 58.984 (56.275)	lr 0.02485
Train [6][2820/3239]	Time 0.557 (0.832)	Data Time 0.001 (0.008)	Loss 3.8450 (3.9224)	Entropy 1.72069 (1.74512)	Top-1 acc 33.594 (32.374)	Top-5 acc 56.641 (56.274)	lr 0.02485
Train [6][2830/3239]	Time 0.570 (0.832)	Data Time 0.001 (0.008)	Loss 4.0425 (3.9222)	Entropy 1.72046 (1.74503)	Top-1 acc 28.906 (32.378)	Top-5 acc 53.125 (56.279)	lr 0.02485
Train [6][2840/3239]	Time 0.578 (0.832)	Data Time 0.001 (0.008)	Loss 4.0394 (3.9221)	Entropy 1.72043 (1.74495)	Top-1 acc 29.297 (32.380)	Top-5 acc 54.297 (56.282)	lr 0.02485
Train [6][2850/3239]	Time 0.523 (0.832)	Data Time 0.001 (0.008)	Loss 4.0798 (3.9221)	Entropy 1.72024 (1.74486)	Top-1 acc 31.641 (32.384)	Top-5 acc 53.516 (56.279)	lr 0.02485
Train [6][2860/3239]	Time 0.602 (0.832)	Data Time 0.001 (0.008)	Loss 3.9984 (3.9222)	Entropy 1.72014 (1.74477)	Top-1 acc 28.906 (32.382)	Top-5 acc 53.125 (56.276)	lr 0.02485
Train [6][2870/3239]	Time 0.546 (0.831)	Data Time 0.001 (0.008)	Loss 3.7929 (3.9221)	Entropy 1.72012 (1.74469)	Top-1 acc 36.719 (32.386)	Top-5 acc 58.984 (56.275)	lr 0.02485
Train [6][2880/3239]	Time 0.561 (0.831)	Data Time 0.001 (0.008)	Loss 3.8807 (3.9220)	Entropy 1.72009 (1.74460)	Top-1 acc 32.031 (32.385)	Top-5 acc 55.469 (56.277)	lr 0.02485
Train [6][2890/3239]	Time 0.536 (0.831)	Data Time 0.001 (0.008)	Loss 3.7404 (3.9218)	Entropy 1.72018 (1.74452)	Top-1 acc 36.328 (32.387)	Top-5 acc 63.672 (56.280)	lr 0.02485
Train [6][2900/3239]	Time 0.655 (0.831)	Data Time 0.002 (0.008)	Loss 3.7502 (3.9218)	Entropy 1.72024 (1.74444)	Top-1 acc 33.984 (32.388)	Top-5 acc 62.109 (56.280)	lr 0.02485
Train [6][2910/3239]	Time 0.587 (0.831)	Data Time 0.001 (0.008)	Loss 3.7343 (3.9219)	Entropy 1.72013 (1.74435)	Top-1 acc 31.641 (32.386)	Top-5 acc 62.109 (56.279)	lr 0.02485
Train [6][2920/3239]	Time 0.505 (0.831)	Data Time 0.001 (0.008)	Loss 4.0428 (3.9219)	Entropy 1.71988 (1.74427)	Top-1 acc 33.594 (32.383)	Top-5 acc 51.562 (56.278)	lr 0.02485
Train [6][2930/3239]	Time 0.567 (0.831)	Data Time 0.001 (0.008)	Loss 3.9863 (3.9217)	Entropy 1.71978 (1.74419)	Top-1 acc 28.516 (32.385)	Top-5 acc 54.297 (56.282)	lr 0.02485
Train [6][2940/3239]	Time 0.519 (0.831)	Data Time 0.001 (0.008)	Loss 3.8042 (3.9217)	Entropy 1.71953 (1.74410)	Top-1 acc 36.328 (32.389)	Top-5 acc 56.250 (56.284)	lr 0.02485
Train [6][2950/3239]	Time 0.639 (0.831)	Data Time 0.001 (0.008)	Loss 3.9504 (3.9219)	Entropy 1.71915 (1.74402)	Top-1 acc 33.594 (32.388)	Top-5 acc 55.469 (56.280)	lr 0.02485
Train [6][2960/3239]	Time 0.602 (0.831)	Data Time 0.001 (0.008)	Loss 3.7860 (3.9217)	Entropy 1.71880 (1.74393)	Top-1 acc 35.156 (32.391)	Top-5 acc 62.891 (56.286)	lr 0.02485
Train [6][2970/3239]	Time 0.585 (0.831)	Data Time 0.003 (0.008)	Loss 4.0369 (3.9217)	Entropy 1.71868 (1.74385)	Top-1 acc 30.078 (32.391)	Top-5 acc 53.516 (56.283)	lr 0.02485
Train [6][2980/3239]	Time 0.582 (0.831)	Data Time 0.001 (0.008)	Loss 4.1360 (3.9216)	Entropy 1.71859 (1.74377)	Top-1 acc 30.078 (32.394)	Top-5 acc 53.125 (56.284)	lr 0.02485
Train [6][2990/3239]	Time 0.562 (0.831)	Data Time 0.001 (0.008)	Loss 3.8574 (3.9217)	Entropy 1.71845 (1.74368)	Top-1 acc 37.109 (32.395)	Top-5 acc 57.031 (56.282)	lr 0.02485
Train [6][3000/3239]	Time 0.604 (0.831)	Data Time 0.001 (0.008)	Loss 4.1145 (3.9218)	Entropy 1.71828 (1.74360)	Top-1 acc 30.469 (32.391)	Top-5 acc 49.219 (56.275)	lr 0.02485
Train [6][3010/3239]	Time 0.565 (0.831)	Data Time 0.001 (0.008)	Loss 3.9254 (3.9221)	Entropy 1.71802 (1.74351)	Top-1 acc 31.250 (32.390)	Top-5 acc 55.078 (56.271)	lr 0.02485
Train [6][3020/3239]	Time 0.528 (0.830)	Data Time 0.001 (0.008)	Loss 4.0390 (3.9222)	Entropy 1.71796 (1.74343)	Top-1 acc 30.859 (32.389)	Top-5 acc 50.781 (56.265)	lr 0.02485
Train [6][3030/3239]	Time 0.526 (0.830)	Data Time 0.001 (0.008)	Loss 3.7349 (3.9223)	Entropy 1.71780 (1.74334)	Top-1 acc 34.766 (32.389)	Top-5 acc 62.500 (56.267)	lr 0.02485
Train [6][3040/3239]	Time 0.455 (0.830)	Data Time 0.001 (0.008)	Loss 3.9504 (3.9220)	Entropy 1.71767 (1.74326)	Top-1 acc 29.688 (32.394)	Top-5 acc 52.734 (56.267)	lr 0.02485
Train [6][3050/3239]	Time 0.552 (0.830)	Data Time 0.001 (0.008)	Loss 3.9792 (3.9220)	Entropy 1.71752 (1.74317)	Top-1 acc 32.422 (32.398)	Top-5 acc 55.469 (56.267)	lr 0.02485
Train [6][3060/3239]	Time 0.563 (0.830)	Data Time 0.002 (0.008)	Loss 3.8392 (3.9217)	Entropy 1.71743 (1.74309)	Top-1 acc 32.812 (32.404)	Top-5 acc 53.906 (56.271)	lr 0.02485
Train [6][3070/3239]	Time 0.634 (0.830)	Data Time 0.001 (0.008)	Loss 3.6784 (3.9215)	Entropy 1.71731 (1.74301)	Top-1 acc 35.938 (32.408)	Top-5 acc 60.156 (56.270)	lr 0.02485
Train [6][3080/3239]	Time 0.472 (0.830)	Data Time 0.001 (0.008)	Loss 3.6950 (3.9212)	Entropy 1.71721 (1.74292)	Top-1 acc 37.891 (32.410)	Top-5 acc 59.766 (56.280)	lr 0.02485
Train [6][3090/3239]	Time 0.516 (0.830)	Data Time 0.001 (0.008)	Loss 3.9125 (3.9211)	Entropy 1.71707 (1.74284)	Top-1 acc 34.766 (32.413)	Top-5 acc 57.422 (56.287)	lr 0.02485
Train [6][3100/3239]	Time 0.509 (0.830)	Data Time 0.001 (0.007)	Loss 3.7803 (3.9208)	Entropy 1.71698 (1.74276)	Top-1 acc 35.156 (32.419)	Top-5 acc 58.984 (56.292)	lr 0.02485
Train [6][3110/3239]	Time 0.576 (0.829)	Data Time 0.001 (0.007)	Loss 4.1416 (3.9208)	Entropy 1.71674 (1.74267)	Top-1 acc 28.516 (32.419)	Top-5 acc 53.516 (56.293)	lr 0.02485
Train [6][3120/3239]	Time 0.550 (0.829)	Data Time 0.001 (0.007)	Loss 4.0431 (3.9208)	Entropy 1.71652 (1.74259)	Top-1 acc 32.422 (32.422)	Top-5 acc 54.688 (56.290)	lr 0.02485
Train [6][3130/3239]	Time 0.537 (0.829)	Data Time 0.001 (0.007)	Loss 3.9703 (3.9209)	Entropy 1.71646 (1.74251)	Top-1 acc 30.859 (32.421)	Top-5 acc 55.469 (56.289)	lr 0.02485
Train [6][3140/3239]	Time 0.606 (0.829)	Data Time 0.001 (0.007)	Loss 4.1820 (3.9208)	Entropy 1.71635 (1.74242)	Top-1 acc 28.516 (32.420)	Top-5 acc 52.734 (56.291)	lr 0.02485
Train [6][3150/3239]	Time 0.585 (0.829)	Data Time 0.001 (0.007)	Loss 4.0657 (3.9206)	Entropy 1.71621 (1.74234)	Top-1 acc 28.906 (32.420)	Top-5 acc 52.734 (56.294)	lr 0.02485
Train [6][3160/3239]	Time 0.569 (0.829)	Data Time 0.001 (0.007)	Loss 3.8329 (3.9207)	Entropy 1.71616 (1.74226)	Top-1 acc 35.156 (32.418)	Top-5 acc 60.156 (56.292)	lr 0.02485
Train [6][3170/3239]	Time 0.628 (0.829)	Data Time 0.001 (0.007)	Loss 4.1438 (3.9207)	Entropy 1.71594 (1.74218)	Top-1 acc 29.688 (32.417)	Top-5 acc 55.469 (56.295)	lr 0.02485
Train [6][3180/3239]	Time 0.556 (0.829)	Data Time 0.000 (0.007)	Loss 4.2453 (3.9207)	Entropy 1.71591 (1.74209)	Top-1 acc 25.781 (32.421)	Top-5 acc 50.781 (56.298)	lr 0.02485
Train [6][3190/3239]	Time 0.526 (0.829)	Data Time 0.000 (0.007)	Loss 4.0659 (3.9207)	Entropy 1.71583 (1.74201)	Top-1 acc 31.250 (32.421)	Top-5 acc 51.953 (56.297)	lr 0.02485
Train [6][3200/3239]	Time 0.556 (0.829)	Data Time 0.000 (0.007)	Loss 3.9289 (3.9205)	Entropy 1.71556 (1.74193)	Top-1 acc 33.594 (32.427)	Top-5 acc 58.203 (56.302)	lr 0.02485
Train [6][3210/3239]	Time 0.527 (0.828)	Data Time 0.000 (0.007)	Loss 3.9016 (3.9204)	Entropy 1.71547 (1.74185)	Top-1 acc 35.156 (32.432)	Top-5 acc 58.203 (56.309)	lr 0.02485
Train [6][3220/3239]	Time 0.516 (0.828)	Data Time 0.000 (0.007)	Loss 4.0090 (3.9205)	Entropy 1.71496 (1.74176)	Top-1 acc 32.812 (32.429)	Top-5 acc 54.688 (56.307)	lr 0.02485
Train [6][3230/3239]	Time 0.535 (0.828)	Data Time 0.000 (0.007)	Loss 4.0309 (3.9206)	Entropy 1.71471 (1.74168)	Top-1 acc 28.125 (32.426)	Top-5 acc 54.688 (56.307)	lr 0.02485
Train [6][3239/3239]	Time 1.529 (0.828)	Data Time 0.000 (0.007)	Loss 3.8432 (3.9205)	Entropy 1.71448 (1.74161)	Top-1 acc 35.802 (32.430)	Top-5 acc 56.790 (56.307)	lr 0.02485
==========Valid [6/120]	loss 2.752	top-1 acc 41.715 (41.715)	top-5 acc 66.635	Train top-1 32.430	top-5 56.307	Entropy 1.71448	Latency-None: 0.000ms	Flops: 539.76M
Train [7][0/3239]	Time 19.059 (19.059)	Data Time 16.802 (16.802)	Loss 3.9299 (3.9299)	Entropy 1.71448 (1.71448)	Top-1 acc 36.719 (36.719)	Top-5 acc 57.031 (57.031)	lr 0.02485
Train [7][10/3239]	Time 0.562 (2.485)	Data Time 0.001 (1.529)	Loss 3.8495 (3.8178)	Entropy 1.71434 (1.71447)	Top-1 acc 34.375 (34.872)	Top-5 acc 60.547 (59.482)	lr 0.02485
Train [7][20/3239]	Time 0.575 (1.680)	Data Time 0.001 (0.802)	Loss 3.6299 (3.8348)	Entropy 1.71408 (1.71436)	Top-1 acc 37.891 (34.580)	Top-5 acc 62.891 (58.724)	lr 0.02485
Train [7][30/3239]	Time 0.652 (1.399)	Data Time 0.001 (0.544)	Loss 4.0568 (3.8579)	Entropy 1.71404 (1.71426)	Top-1 acc 29.688 (34.438)	Top-5 acc 55.469 (58.342)	lr 0.02485
Train [7][40/3239]	Time 0.613 (1.251)	Data Time 0.002 (0.412)	Loss 4.0783 (3.8724)	Entropy 1.71396 (1.71421)	Top-1 acc 28.906 (33.861)	Top-5 acc 53.125 (57.965)	lr 0.02485
Train [7][50/3239]	Time 0.564 (1.162)	Data Time 0.001 (0.331)	Loss 3.8361 (3.8640)	Entropy 1.71370 (1.71414)	Top-1 acc 36.328 (33.854)	Top-5 acc 57.812 (58.119)	lr 0.02485
Train [7][60/3239]	Time 0.560 (1.103)	Data Time 0.001 (0.277)	Loss 3.7993 (3.8563)	Entropy 1.71373 (1.71408)	Top-1 acc 30.469 (33.901)	Top-5 acc 58.984 (58.248)	lr 0.02485
Train [7][70/3239]	Time 0.628 (1.060)	Data Time 0.001 (0.239)	Loss 3.8290 (3.8616)	Entropy 1.71352 (1.71402)	Top-1 acc 31.250 (33.709)	Top-5 acc 54.688 (57.862)	lr 0.02484
Train [7][80/3239]	Time 0.662 (1.030)	Data Time 0.001 (0.209)	Loss 3.9510 (3.8642)	Entropy 1.71339 (1.71396)	Top-1 acc 33.203 (33.589)	Top-5 acc 55.859 (57.745)	lr 0.02484
Train [7][90/3239]	Time 0.560 (1.005)	Data Time 0.001 (0.187)	Loss 4.0923 (3.8599)	Entropy 1.71317 (1.71388)	Top-1 acc 26.562 (33.637)	Top-5 acc 53.906 (57.825)	lr 0.02484
Train [7][100/3239]	Time 0.418 (0.985)	Data Time 0.001 (0.168)	Loss 4.0279 (3.8626)	Entropy 1.71287 (1.71381)	Top-1 acc 32.031 (33.648)	Top-5 acc 52.734 (57.646)	lr 0.02484
Train [7][110/3239]	Time 0.538 (0.971)	Data Time 0.001 (0.154)	Loss 3.8737 (3.8652)	Entropy 1.71277 (1.71372)	Top-1 acc 31.641 (33.629)	Top-5 acc 54.688 (57.517)	lr 0.02484
Train [7][120/3239]	Time 0.580 (0.957)	Data Time 0.002 (0.142)	Loss 3.9562 (3.8726)	Entropy 1.71247 (1.71364)	Top-1 acc 32.812 (33.481)	Top-5 acc 55.078 (57.315)	lr 0.02484
Train [7][130/3239]	Time 0.568 (0.944)	Data Time 0.001 (0.131)	Loss 3.7895 (3.8778)	Entropy 1.71228 (1.71354)	Top-1 acc 30.859 (33.299)	Top-5 acc 57.422 (57.189)	lr 0.02484
Train [7][140/3239]	Time 0.535 (0.937)	Data Time 0.001 (0.123)	Loss 4.0503 (3.8805)	Entropy 1.71197 (1.71344)	Top-1 acc 30.469 (33.200)	Top-5 acc 50.391 (57.106)	lr 0.02484
Train [7][150/3239]	Time 0.568 (0.927)	Data Time 0.001 (0.115)	Loss 3.9024 (3.8802)	Entropy 1.71170 (1.71334)	Top-1 acc 33.203 (33.219)	Top-5 acc 55.078 (57.155)	lr 0.02484
Train [7][160/3239]	Time 0.538 (0.919)	Data Time 0.001 (0.108)	Loss 3.8995 (3.8807)	Entropy 1.71141 (1.71323)	Top-1 acc 33.984 (33.203)	Top-5 acc 55.078 (57.123)	lr 0.02484
Train [7][170/3239]	Time 0.595 (0.913)	Data Time 0.001 (0.102)	Loss 3.7146 (3.8765)	Entropy 1.71141 (1.71313)	Top-1 acc 36.719 (33.310)	Top-5 acc 58.203 (57.168)	lr 0.02484
Train [7][180/3239]	Time 0.686 (1.007)	Data Time 0.005 (0.096)	Loss 3.8166 (3.8753)	Entropy 1.71133 (1.71303)	Top-1 acc 36.719 (33.337)	Top-5 acc 60.156 (57.174)	lr 0.02484
Train [7][190/3239]	Time 0.541 (0.997)	Data Time 0.002 (0.092)	Loss 3.8115 (3.8742)	Entropy 1.71133 (1.71294)	Top-1 acc 35.938 (33.377)	Top-5 acc 59.766 (57.176)	lr 0.02484
Train [7][200/3239]	Time 0.612 (0.988)	Data Time 0.001 (0.087)	Loss 3.7144 (3.8729)	Entropy 1.71109 (1.71286)	Top-1 acc 36.719 (33.355)	Top-5 acc 61.328 (57.224)	lr 0.02484
Train [7][210/3239]	Time 0.540 (0.979)	Data Time 0.001 (0.083)	Loss 3.9990 (3.8738)	Entropy 1.71085 (1.71277)	Top-1 acc 29.297 (33.314)	Top-5 acc 55.078 (57.244)	lr 0.02484
Train [7][220/3239]	Time 0.564 (0.970)	Data Time 0.001 (0.079)	Loss 4.0061 (3.8762)	Entropy 1.71047 (1.71268)	Top-1 acc 30.078 (33.276)	Top-5 acc 55.859 (57.224)	lr 0.02484
Train [7][230/3239]	Time 0.568 (0.964)	Data Time 0.001 (0.076)	Loss 3.8405 (3.8774)	Entropy 1.71029 (1.71258)	Top-1 acc 35.938 (33.259)	Top-5 acc 58.203 (57.216)	lr 0.02484
Train [7][240/3239]	Time 0.465 (0.956)	Data Time 0.001 (0.073)	Loss 3.8811 (3.8781)	Entropy 1.71004 (1.71248)	Top-1 acc 32.422 (33.276)	Top-5 acc 59.766 (57.216)	lr 0.02484
Train [7][250/3239]	Time 0.677 (0.951)	Data Time 0.001 (0.071)	Loss 3.9020 (3.8794)	Entropy 1.70982 (1.71239)	Top-1 acc 31.250 (33.197)	Top-5 acc 55.469 (57.185)	lr 0.02484
Train [7][260/3239]	Time 0.531 (0.946)	Data Time 0.001 (0.068)	Loss 3.8356 (3.8802)	Entropy 1.70976 (1.71229)	Top-1 acc 32.031 (33.169)	Top-5 acc 56.641 (57.127)	lr 0.02484
Train [7][270/3239]	Time 0.507 (0.941)	Data Time 0.001 (0.066)	Loss 4.0329 (3.8823)	Entropy 1.70963 (1.71219)	Top-1 acc 26.172 (33.108)	Top-5 acc 56.641 (57.118)	lr 0.02484
Train [7][280/3239]	Time 0.581 (0.937)	Data Time 0.001 (0.063)	Loss 3.9309 (3.8818)	Entropy 1.70949 (1.71210)	Top-1 acc 36.328 (33.110)	Top-5 acc 55.469 (57.134)	lr 0.02484
Train [7][290/3239]	Time 0.541 (0.932)	Data Time 0.001 (0.061)	Loss 3.9754 (3.8833)	Entropy 1.70943 (1.71201)	Top-1 acc 32.031 (33.121)	Top-5 acc 56.641 (57.092)	lr 0.02484
Train [7][300/3239]	Time 0.596 (0.927)	Data Time 0.001 (0.059)	Loss 4.0109 (3.8818)	Entropy 1.70943 (1.71192)	Top-1 acc 30.859 (33.121)	Top-5 acc 50.391 (57.108)	lr 0.02484
Train [7][310/3239]	Time 0.564 (0.923)	Data Time 0.001 (0.058)	Loss 4.0676 (3.8826)	Entropy 1.70937 (1.71184)	Top-1 acc 33.203 (33.109)	Top-5 acc 55.078 (57.092)	lr 0.02484
Train [7][320/3239]	Time 0.548 (0.919)	Data Time 0.001 (0.056)	Loss 3.8118 (3.8835)	Entropy 1.70925 (1.71176)	Top-1 acc 35.156 (33.090)	Top-5 acc 58.594 (57.082)	lr 0.02484
Train [7][330/3239]	Time 0.537 (0.914)	Data Time 0.001 (0.054)	Loss 3.9606 (3.8836)	Entropy 1.70888 (1.71168)	Top-1 acc 32.031 (33.079)	Top-5 acc 54.688 (57.089)	lr 0.02484
Train [7][340/3239]	Time 0.535 (0.911)	Data Time 0.001 (0.053)	Loss 3.8293 (3.8802)	Entropy 1.70894 (1.71160)	Top-1 acc 34.766 (33.148)	Top-5 acc 57.031 (57.149)	lr 0.02484
Train [7][350/3239]	Time 0.510 (0.908)	Data Time 0.001 (0.051)	Loss 3.9580 (3.8805)	Entropy 1.70858 (1.71152)	Top-1 acc 32.422 (33.134)	Top-5 acc 56.641 (57.153)	lr 0.02484
Train [7][360/3239]	Time 0.579 (0.905)	Data Time 0.001 (0.050)	Loss 3.8931 (3.8820)	Entropy 1.70840 (1.71144)	Top-1 acc 32.812 (33.136)	Top-5 acc 52.734 (57.109)	lr 0.02484
Train [7][370/3239]	Time 0.558 (0.902)	Data Time 0.001 (0.049)	Loss 3.6169 (3.8804)	Entropy 1.70827 (1.71135)	Top-1 acc 41.406 (33.165)	Top-5 acc 60.547 (57.133)	lr 0.02484
Train [7][380/3239]	Time 0.482 (0.899)	Data Time 0.001 (0.047)	Loss 3.7908 (3.8792)	Entropy 1.70788 (1.71127)	Top-1 acc 37.109 (33.209)	Top-5 acc 59.766 (57.164)	lr 0.02484
Train [7][390/3239]	Time 0.553 (0.897)	Data Time 0.001 (0.046)	Loss 3.7221 (3.8792)	Entropy 1.70768 (1.71118)	Top-1 acc 35.156 (33.220)	Top-5 acc 59.375 (57.158)	lr 0.02484
Train [7][400/3239]	Time 0.599 (0.895)	Data Time 0.001 (0.045)	Loss 3.9729 (3.8807)	Entropy 1.70733 (1.71109)	Top-1 acc 31.250 (33.212)	Top-5 acc 55.078 (57.129)	lr 0.02484
Train [7][410/3239]	Time 0.450 (0.893)	Data Time 0.001 (0.044)	Loss 4.1226 (3.8798)	Entropy 1.70738 (1.71100)	Top-1 acc 25.781 (33.228)	Top-5 acc 51.562 (57.143)	lr 0.02484
Train [7][420/3239]	Time 0.629 (0.891)	Data Time 0.001 (0.044)	Loss 3.7351 (3.8797)	Entropy 1.70689 (1.71091)	Top-1 acc 33.203 (33.235)	Top-5 acc 62.891 (57.143)	lr 0.02484
Train [7][430/3239]	Time 0.506 (0.889)	Data Time 0.001 (0.043)	Loss 4.1891 (3.8802)	Entropy 1.70656 (1.71081)	Top-1 acc 27.734 (33.229)	Top-5 acc 51.562 (57.106)	lr 0.02484
Train [7][440/3239]	Time 0.485 (0.886)	Data Time 0.001 (0.042)	Loss 3.8633 (3.8816)	Entropy 1.70636 (1.71072)	Top-1 acc 34.375 (33.201)	Top-5 acc 56.641 (57.054)	lr 0.02484
Train [7][450/3239]	Time 0.475 (0.885)	Data Time 0.001 (0.041)	Loss 3.9862 (3.8823)	Entropy 1.70622 (1.71062)	Top-1 acc 30.469 (33.181)	Top-5 acc 53.125 (57.036)	lr 0.02484
Train [7][460/3239]	Time 0.560 (0.883)	Data Time 0.001 (0.040)	Loss 3.8346 (3.8831)	Entropy 1.70605 (1.71052)	Top-1 acc 33.984 (33.178)	Top-5 acc 56.250 (57.005)	lr 0.02484
Train [7][470/3239]	Time 0.588 (0.882)	Data Time 0.001 (0.039)	Loss 3.7259 (3.8823)	Entropy 1.70576 (1.71043)	Top-1 acc 39.453 (33.207)	Top-5 acc 63.672 (57.019)	lr 0.02484
Train [7][480/3239]	Time 0.628 (0.879)	Data Time 0.001 (0.038)	Loss 3.8985 (3.8830)	Entropy 1.70545 (1.71033)	Top-1 acc 30.859 (33.174)	Top-5 acc 55.078 (57.009)	lr 0.02484
Train [7][490/3239]	Time 0.656 (0.877)	Data Time 0.002 (0.038)	Loss 3.9051 (3.8840)	Entropy 1.70514 (1.71023)	Top-1 acc 36.328 (33.171)	Top-5 acc 54.297 (56.995)	lr 0.02484
Train [7][500/3239]	Time 0.416 (0.875)	Data Time 0.001 (0.037)	Loss 3.8286 (3.8845)	Entropy 1.70484 (1.71012)	Top-1 acc 35.938 (33.168)	Top-5 acc 58.203 (56.985)	lr 0.02484
Train [7][510/3239]	Time 0.607 (0.873)	Data Time 0.002 (0.036)	Loss 3.7571 (3.8846)	Entropy 1.70451 (1.71002)	Top-1 acc 34.766 (33.154)	Top-5 acc 60.938 (56.992)	lr 0.02484
Train [7][520/3239]	Time 0.567 (0.872)	Data Time 0.001 (0.036)	Loss 3.9864 (3.8856)	Entropy 1.70416 (1.70991)	Top-1 acc 33.984 (33.147)	Top-5 acc 55.469 (56.974)	lr 0.02484
Train [7][530/3239]	Time 0.568 (0.870)	Data Time 0.001 (0.035)	Loss 4.0621 (3.8862)	Entropy 1.70410 (1.70980)	Top-1 acc 28.125 (33.110)	Top-5 acc 55.859 (56.987)	lr 0.02484
Train [7][540/3239]	Time 0.651 (0.869)	Data Time 0.001 (0.034)	Loss 3.6719 (3.8852)	Entropy 1.70373 (1.70969)	Top-1 acc 40.234 (33.129)	Top-5 acc 61.328 (57.023)	lr 0.02484
Train [7][550/3239]	Time 0.584 (0.868)	Data Time 0.001 (0.034)	Loss 3.8746 (3.8846)	Entropy 1.70349 (1.70958)	Top-1 acc 32.812 (33.149)	Top-5 acc 54.688 (57.024)	lr 0.02484
Train [7][560/3239]	Time 0.570 (0.866)	Data Time 0.001 (0.033)	Loss 3.8797 (3.8836)	Entropy 1.70330 (1.70947)	Top-1 acc 34.766 (33.181)	Top-5 acc 57.812 (57.072)	lr 0.02484
Train [7][570/3239]	Time 0.498 (0.865)	Data Time 0.001 (0.033)	Loss 3.9860 (3.8843)	Entropy 1.70343 (1.70937)	Top-1 acc 30.469 (33.168)	Top-5 acc 53.906 (57.052)	lr 0.02484
Train [7][580/3239]	Time 0.566 (0.864)	Data Time 0.001 (0.032)	Loss 3.6867 (3.8841)	Entropy 1.70343 (1.70926)	Top-1 acc 37.891 (33.185)	Top-5 acc 60.547 (57.064)	lr 0.02484
Train [7][590/3239]	Time 0.573 (0.863)	Data Time 0.001 (0.032)	Loss 3.7895 (3.8838)	Entropy 1.70355 (1.70917)	Top-1 acc 33.203 (33.209)	Top-5 acc 60.547 (57.079)	lr 0.02484
Train [7][600/3239]	Time 0.559 (0.862)	Data Time 0.002 (0.031)	Loss 3.8422 (3.8837)	Entropy 1.70331 (1.70907)	Top-1 acc 38.672 (33.224)	Top-5 acc 57.812 (57.092)	lr 0.02484
Train [7][610/3239]	Time 0.592 (0.861)	Data Time 0.001 (0.031)	Loss 3.7623 (3.8842)	Entropy 1.70310 (1.70898)	Top-1 acc 33.203 (33.202)	Top-5 acc 62.500 (57.084)	lr 0.02484
Train [7][620/3239]	Time 0.561 (0.860)	Data Time 0.001 (0.030)	Loss 3.8552 (3.8840)	Entropy 1.70297 (1.70888)	Top-1 acc 35.938 (33.209)	Top-5 acc 55.859 (57.080)	lr 0.02484
Train [7][630/3239]	Time 0.576 (0.859)	Data Time 0.001 (0.030)	Loss 3.7665 (3.8834)	Entropy 1.70282 (1.70879)	Top-1 acc 36.719 (33.227)	Top-5 acc 58.594 (57.091)	lr 0.02484
Train [7][640/3239]	Time 0.570 (0.859)	Data Time 0.001 (0.029)	Loss 3.8472 (3.8835)	Entropy 1.70273 (1.70869)	Top-1 acc 33.984 (33.224)	Top-5 acc 55.859 (57.100)	lr 0.02484
Train [7][650/3239]	Time 0.444 (0.858)	Data Time 0.001 (0.029)	Loss 3.8941 (3.8839)	Entropy 1.70249 (1.70860)	Top-1 acc 32.031 (33.216)	Top-5 acc 56.250 (57.093)	lr 0.02484
Train [7][660/3239]	Time 0.610 (0.857)	Data Time 0.001 (0.028)	Loss 3.7151 (3.8838)	Entropy 1.70230 (1.70851)	Top-1 acc 38.281 (33.234)	Top-5 acc 61.328 (57.105)	lr 0.02484
Train [7][670/3239]	Time 0.593 (0.856)	Data Time 0.001 (0.028)	Loss 3.9665 (3.8846)	Entropy 1.70211 (1.70841)	Top-1 acc 31.250 (33.225)	Top-5 acc 54.688 (57.078)	lr 0.02484
Train [7][680/3239]	Time 0.644 (0.855)	Data Time 0.002 (0.028)	Loss 3.9051 (3.8845)	Entropy 1.70201 (1.70832)	Top-1 acc 31.250 (33.234)	Top-5 acc 54.297 (57.056)	lr 0.02484
Train [7][690/3239]	Time 0.564 (0.854)	Data Time 0.001 (0.027)	Loss 3.9501 (3.8848)	Entropy 1.70187 (1.70823)	Top-1 acc 33.203 (33.232)	Top-5 acc 58.984 (57.043)	lr 0.02484
Train [7][700/3239]	Time 0.553 (0.853)	Data Time 0.001 (0.027)	Loss 3.7782 (3.8851)	Entropy 1.70191 (1.70814)	Top-1 acc 33.203 (33.224)	Top-5 acc 58.594 (57.052)	lr 0.02483
Train [7][710/3239]	Time 0.586 (0.853)	Data Time 0.001 (0.027)	Loss 3.8222 (3.8843)	Entropy 1.70168 (1.70805)	Top-1 acc 40.625 (33.262)	Top-5 acc 57.031 (57.068)	lr 0.02483
Train [7][720/3239]	Time 0.534 (0.852)	Data Time 0.001 (0.026)	Loss 3.9060 (3.8839)	Entropy 1.70162 (1.70796)	Top-1 acc 31.250 (33.252)	Top-5 acc 55.859 (57.069)	lr 0.02483
Train [7][730/3239]	Time 0.581 (0.851)	Data Time 0.002 (0.026)	Loss 3.8422 (3.8841)	Entropy 1.70163 (1.70787)	Top-1 acc 35.938 (33.239)	Top-5 acc 56.641 (57.060)	lr 0.02483
Train [7][740/3239]	Time 0.499 (0.851)	Data Time 0.001 (0.026)	Loss 3.8274 (3.8840)	Entropy 1.70145 (1.70779)	Top-1 acc 34.766 (33.243)	Top-5 acc 57.031 (57.057)	lr 0.02483
Train [7][750/3239]	Time 0.568 (0.850)	Data Time 0.002 (0.025)	Loss 3.7970 (3.8837)	Entropy 1.70139 (1.70770)	Top-1 acc 34.375 (33.238)	Top-5 acc 55.859 (57.061)	lr 0.02483
Train [7][760/3239]	Time 0.543 (0.850)	Data Time 0.001 (0.025)	Loss 3.8501 (3.8835)	Entropy 1.70118 (1.70762)	Top-1 acc 33.984 (33.250)	Top-5 acc 60.156 (57.070)	lr 0.02483
Train [7][770/3239]	Time 0.590 (0.849)	Data Time 0.001 (0.025)	Loss 3.8794 (3.8835)	Entropy 1.70117 (1.70753)	Top-1 acc 37.891 (33.273)	Top-5 acc 54.688 (57.068)	lr 0.02483
Train [7][780/3239]	Time 0.550 (0.849)	Data Time 0.001 (0.024)	Loss 3.9354 (3.8837)	Entropy 1.70083 (1.70745)	Top-1 acc 31.641 (33.259)	Top-5 acc 55.078 (57.074)	lr 0.02483
Train [7][790/3239]	Time 0.530 (0.848)	Data Time 0.001 (0.024)	Loss 3.9968 (3.8844)	Entropy 1.70053 (1.70736)	Top-1 acc 34.375 (33.256)	Top-5 acc 56.250 (57.071)	lr 0.02483
Train [7][800/3239]	Time 0.575 (0.847)	Data Time 0.001 (0.024)	Loss 3.9691 (3.8853)	Entropy 1.70017 (1.70728)	Top-1 acc 33.594 (33.236)	Top-5 acc 55.469 (57.049)	lr 0.02483
Train [7][810/3239]	Time 0.587 (0.847)	Data Time 0.001 (0.024)	Loss 4.0774 (3.8857)	Entropy 1.69984 (1.70719)	Top-1 acc 30.469 (33.231)	Top-5 acc 50.781 (57.044)	lr 0.02483
Train [7][820/3239]	Time 0.521 (0.846)	Data Time 0.001 (0.023)	Loss 3.7910 (3.8856)	Entropy 1.69971 (1.70710)	Top-1 acc 33.594 (33.231)	Top-5 acc 60.938 (57.043)	lr 0.02483
Train [7][830/3239]	Time 0.590 (0.846)	Data Time 0.001 (0.023)	Loss 3.9426 (3.8849)	Entropy 1.69944 (1.70701)	Top-1 acc 34.375 (33.243)	Top-5 acc 56.641 (57.061)	lr 0.02483
Train [7][840/3239]	Time 0.581 (0.868)	Data Time 0.002 (0.023)	Loss 3.7314 (3.8843)	Entropy 1.69869 (1.70691)	Top-1 acc 37.500 (33.259)	Top-5 acc 62.500 (57.075)	lr 0.02483
Train [7][850/3239]	Time 0.530 (0.868)	Data Time 0.002 (0.023)	Loss 4.0583 (3.8850)	Entropy 1.69859 (1.70682)	Top-1 acc 30.469 (33.249)	Top-5 acc 50.391 (57.055)	lr 0.02483
Train [7][860/3239]	Time 0.564 (0.867)	Data Time 0.001 (0.022)	Loss 3.9202 (3.8849)	Entropy 1.69858 (1.70672)	Top-1 acc 33.594 (33.248)	Top-5 acc 57.031 (57.054)	lr 0.02483
Train [7][870/3239]	Time 0.579 (0.867)	Data Time 0.002 (0.022)	Loss 3.9101 (3.8853)	Entropy 1.69819 (1.70663)	Top-1 acc 35.156 (33.245)	Top-5 acc 53.906 (57.041)	lr 0.02483
Train [7][880/3239]	Time 0.578 (0.866)	Data Time 0.001 (0.022)	Loss 3.8139 (3.8844)	Entropy 1.69795 (1.70653)	Top-1 acc 34.375 (33.245)	Top-5 acc 58.984 (57.061)	lr 0.02483
Train [7][890/3239]	Time 0.508 (0.865)	Data Time 0.001 (0.022)	Loss 4.1532 (3.8844)	Entropy 1.69786 (1.70643)	Top-1 acc 27.734 (33.243)	Top-5 acc 50.391 (57.054)	lr 0.02483
Train [7][900/3239]	Time 0.598 (0.865)	Data Time 0.001 (0.022)	Loss 3.9043 (3.8846)	Entropy 1.69774 (1.70634)	Top-1 acc 34.375 (33.235)	Top-5 acc 56.641 (57.037)	lr 0.02483
Train [7][910/3239]	Time 0.590 (0.864)	Data Time 0.001 (0.021)	Loss 3.9828 (3.8839)	Entropy 1.69731 (1.70624)	Top-1 acc 31.250 (33.241)	Top-5 acc 55.078 (57.053)	lr 0.02483
Train [7][920/3239]	Time 0.454 (0.864)	Data Time 0.001 (0.021)	Loss 3.8009 (3.8843)	Entropy 1.69735 (1.70614)	Top-1 acc 31.250 (33.235)	Top-5 acc 56.250 (57.037)	lr 0.02483
Train [7][930/3239]	Time 0.596 (0.863)	Data Time 0.001 (0.021)	Loss 3.7272 (3.8843)	Entropy 1.69714 (1.70605)	Top-1 acc 35.156 (33.239)	Top-5 acc 59.766 (57.041)	lr 0.02483
Train [7][940/3239]	Time 0.486 (0.863)	Data Time 0.001 (0.021)	Loss 3.9581 (3.8844)	Entropy 1.69720 (1.70596)	Top-1 acc 28.516 (33.236)	Top-5 acc 59.766 (57.039)	lr 0.02483
Train [7][950/3239]	Time 0.630 (0.862)	Data Time 0.001 (0.021)	Loss 3.8495 (3.8845)	Entropy 1.69709 (1.70586)	Top-1 acc 32.422 (33.231)	Top-5 acc 53.906 (57.021)	lr 0.02483
Train [7][960/3239]	Time 0.546 (0.862)	Data Time 0.001 (0.020)	Loss 3.9638 (3.8846)	Entropy 1.69704 (1.70577)	Top-1 acc 29.688 (33.212)	Top-5 acc 56.250 (57.023)	lr 0.02483
Train [7][970/3239]	Time 0.540 (0.861)	Data Time 0.001 (0.020)	Loss 3.9553 (3.8851)	Entropy 1.69703 (1.70568)	Top-1 acc 30.078 (33.202)	Top-5 acc 53.906 (57.015)	lr 0.02483
Train [7][980/3239]	Time 0.521 (0.860)	Data Time 0.001 (0.020)	Loss 3.8503 (3.8849)	Entropy 1.69677 (1.70559)	Top-1 acc 35.547 (33.207)	Top-5 acc 57.812 (57.020)	lr 0.02483
Train [7][990/3239]	Time 0.414 (0.859)	Data Time 0.001 (0.020)	Loss 3.6759 (3.8847)	Entropy 1.69669 (1.70550)	Top-1 acc 36.719 (33.205)	Top-5 acc 61.328 (57.024)	lr 0.02483
Train [7][1000/3239]	Time 0.552 (0.858)	Data Time 0.001 (0.020)	Loss 3.8300 (3.8846)	Entropy 1.69654 (1.70541)	Top-1 acc 35.547 (33.212)	Top-5 acc 56.250 (57.023)	lr 0.02483
Train [7][1010/3239]	Time 0.562 (0.858)	Data Time 0.001 (0.020)	Loss 3.9079 (3.8841)	Entropy 1.69640 (1.70533)	Top-1 acc 32.812 (33.227)	Top-5 acc 57.812 (57.027)	lr 0.02483
Train [7][1020/3239]	Time 0.719 (0.858)	Data Time 0.001 (0.019)	Loss 3.8749 (3.8844)	Entropy 1.69629 (1.70524)	Top-1 acc 34.375 (33.229)	Top-5 acc 57.031 (57.017)	lr 0.02483
Train [7][1030/3239]	Time 0.522 (0.857)	Data Time 0.001 (0.019)	Loss 3.7997 (3.8839)	Entropy 1.69612 (1.70515)	Top-1 acc 37.500 (33.255)	Top-5 acc 58.984 (57.031)	lr 0.02483
Train [7][1040/3239]	Time 0.497 (0.857)	Data Time 0.001 (0.019)	Loss 3.7930 (3.8843)	Entropy 1.69613 (1.70506)	Top-1 acc 38.281 (33.253)	Top-5 acc 62.109 (57.028)	lr 0.02483
Train [7][1050/3239]	Time 0.532 (0.857)	Data Time 0.001 (0.019)	Loss 3.6525 (3.8845)	Entropy 1.69599 (1.70498)	Top-1 acc 39.453 (33.247)	Top-5 acc 60.547 (57.016)	lr 0.02483
Train [7][1060/3239]	Time 0.479 (0.856)	Data Time 0.001 (0.019)	Loss 4.0002 (3.8843)	Entropy 1.69593 (1.70489)	Top-1 acc 28.906 (33.245)	Top-5 acc 51.953 (57.015)	lr 0.02483
Train [7][1070/3239]	Time 0.632 (0.856)	Data Time 0.001 (0.019)	Loss 3.7600 (3.8842)	Entropy 1.69565 (1.70481)	Top-1 acc 35.547 (33.252)	Top-5 acc 58.984 (57.017)	lr 0.02483
Train [7][1080/3239]	Time 0.577 (0.855)	Data Time 0.001 (0.019)	Loss 3.9806 (3.8836)	Entropy 1.69540 (1.70472)	Top-1 acc 32.812 (33.264)	Top-5 acc 55.078 (57.032)	lr 0.02483
Train [7][1090/3239]	Time 0.568 (0.855)	Data Time 0.001 (0.018)	Loss 3.9790 (3.8843)	Entropy 1.69501 (1.70464)	Top-1 acc 33.203 (33.249)	Top-5 acc 56.641 (57.018)	lr 0.02483
Train [7][1100/3239]	Time 0.536 (0.854)	Data Time 0.001 (0.018)	Loss 3.8279 (3.8838)	Entropy 1.69497 (1.70455)	Top-1 acc 33.203 (33.267)	Top-5 acc 58.594 (57.035)	lr 0.02483
Train [7][1110/3239]	Time 0.563 (0.854)	Data Time 0.001 (0.018)	Loss 3.9786 (3.8836)	Entropy 1.69479 (1.70446)	Top-1 acc 29.297 (33.272)	Top-5 acc 56.250 (57.043)	lr 0.02483
Train [7][1120/3239]	Time 0.694 (0.854)	Data Time 0.001 (0.018)	Loss 3.6779 (3.8835)	Entropy 1.69457 (1.70437)	Top-1 acc 35.938 (33.272)	Top-5 acc 61.328 (57.051)	lr 0.02483
Train [7][1130/3239]	Time 0.603 (0.853)	Data Time 0.003 (0.018)	Loss 4.0668 (3.8835)	Entropy 1.69442 (1.70429)	Top-1 acc 31.250 (33.268)	Top-5 acc 53.516 (57.044)	lr 0.02483
Train [7][1140/3239]	Time 0.576 (0.853)	Data Time 0.001 (0.018)	Loss 3.9300 (3.8834)	Entropy 1.69405 (1.70420)	Top-1 acc 34.375 (33.276)	Top-5 acc 53.125 (57.042)	lr 0.02483
Train [7][1150/3239]	Time 0.349 (0.852)	Data Time 0.001 (0.018)	Loss 3.6693 (3.8826)	Entropy 1.69407 (1.70411)	Top-1 acc 37.109 (33.287)	Top-5 acc 60.938 (57.062)	lr 0.02483
Train [7][1160/3239]	Time 0.598 (0.851)	Data Time 0.001 (0.017)	Loss 3.6774 (3.8828)	Entropy 1.69399 (1.70402)	Top-1 acc 38.672 (33.284)	Top-5 acc 62.109 (57.055)	lr 0.02483
Train [7][1170/3239]	Time 0.540 (0.851)	Data Time 0.002 (0.017)	Loss 3.8316 (3.8826)	Entropy 1.69376 (1.70394)	Top-1 acc 35.156 (33.293)	Top-5 acc 57.422 (57.052)	lr 0.02483
Train [7][1180/3239]	Time 0.554 (0.850)	Data Time 0.001 (0.017)	Loss 3.8885 (3.8828)	Entropy 1.69357 (1.70385)	Top-1 acc 35.547 (33.291)	Top-5 acc 60.938 (57.054)	lr 0.02483
Train [7][1190/3239]	Time 0.515 (0.850)	Data Time 0.002 (0.017)	Loss 4.2627 (3.8824)	Entropy 1.69339 (1.70376)	Top-1 acc 24.219 (33.303)	Top-5 acc 50.000 (57.070)	lr 0.02483
Train [7][1200/3239]	Time 0.583 (0.850)	Data Time 0.001 (0.017)	Loss 3.7970 (3.8825)	Entropy 1.69314 (1.70368)	Top-1 acc 36.719 (33.307)	Top-5 acc 59.766 (57.069)	lr 0.02483
Train [7][1210/3239]	Time 0.601 (0.849)	Data Time 0.001 (0.017)	Loss 3.7515 (3.8815)	Entropy 1.69325 (1.70359)	Top-1 acc 37.891 (33.325)	Top-5 acc 59.375 (57.099)	lr 0.02483
Train [7][1220/3239]	Time 0.557 (0.849)	Data Time 0.001 (0.017)	Loss 3.8548 (3.8813)	Entropy 1.69324 (1.70350)	Top-1 acc 32.812 (33.334)	Top-5 acc 55.859 (57.101)	lr 0.02483
Train [7][1230/3239]	Time 0.511 (0.849)	Data Time 0.001 (0.017)	Loss 3.7067 (3.8820)	Entropy 1.69315 (1.70342)	Top-1 acc 33.203 (33.320)	Top-5 acc 60.156 (57.087)	lr 0.02483
Train [7][1240/3239]	Time 0.646 (0.848)	Data Time 0.001 (0.016)	Loss 3.9289 (3.8816)	Entropy 1.69309 (1.70334)	Top-1 acc 34.766 (33.323)	Top-5 acc 55.078 (57.099)	lr 0.02483
Train [7][1250/3239]	Time 0.538 (0.848)	Data Time 0.001 (0.016)	Loss 4.1937 (3.8817)	Entropy 1.69309 (1.70326)	Top-1 acc 26.172 (33.312)	Top-5 acc 49.219 (57.091)	lr 0.02483
Train [7][1260/3239]	Time 0.606 (0.848)	Data Time 0.001 (0.016)	Loss 3.8417 (3.8823)	Entropy 1.69290 (1.70317)	Top-1 acc 30.078 (33.295)	Top-5 acc 58.984 (57.079)	lr 0.02483
Train [7][1270/3239]	Time 0.609 (0.847)	Data Time 0.003 (0.016)	Loss 3.9500 (3.8826)	Entropy 1.69278 (1.70309)	Top-1 acc 30.078 (33.285)	Top-5 acc 55.469 (57.075)	lr 0.02483
Train [7][1280/3239]	Time 0.537 (0.847)	Data Time 0.001 (0.016)	Loss 3.7837 (3.8829)	Entropy 1.69289 (1.70301)	Top-1 acc 31.641 (33.277)	Top-5 acc 57.812 (57.069)	lr 0.02483
Train [7][1290/3239]	Time 0.583 (0.847)	Data Time 0.001 (0.016)	Loss 3.8778 (3.8821)	Entropy 1.69292 (1.70293)	Top-1 acc 29.688 (33.291)	Top-5 acc 60.156 (57.098)	lr 0.02483
Train [7][1300/3239]	Time 0.559 (0.846)	Data Time 0.001 (0.016)	Loss 3.9662 (3.8819)	Entropy 1.69268 (1.70286)	Top-1 acc 32.812 (33.304)	Top-5 acc 56.641 (57.107)	lr 0.02482
Train [7][1310/3239]	Time 0.552 (0.846)	Data Time 0.001 (0.016)	Loss 4.2686 (3.8823)	Entropy 1.69245 (1.70278)	Top-1 acc 23.828 (33.298)	Top-5 acc 47.656 (57.089)	lr 0.02482
Train [7][1320/3239]	Time 0.583 (0.846)	Data Time 0.001 (0.016)	Loss 3.8096 (3.8824)	Entropy 1.69209 (1.70270)	Top-1 acc 35.156 (33.292)	Top-5 acc 58.594 (57.086)	lr 0.02482
Train [7][1330/3239]	Time 0.582 (0.845)	Data Time 0.002 (0.015)	Loss 4.2785 (3.8828)	Entropy 1.69183 (1.70262)	Top-1 acc 27.344 (33.285)	Top-5 acc 47.656 (57.078)	lr 0.02482
Train [7][1340/3239]	Time 0.517 (0.845)	Data Time 0.001 (0.015)	Loss 3.7805 (3.8823)	Entropy 1.69164 (1.70254)	Top-1 acc 34.766 (33.292)	Top-5 acc 59.375 (57.085)	lr 0.02482
Train [7][1350/3239]	Time 0.574 (0.844)	Data Time 0.001 (0.015)	Loss 3.8163 (3.8826)	Entropy 1.69145 (1.70246)	Top-1 acc 33.203 (33.278)	Top-5 acc 61.328 (57.081)	lr 0.02482
Train [7][1360/3239]	Time 0.662 (0.844)	Data Time 0.001 (0.015)	Loss 3.8571 (3.8828)	Entropy 1.69131 (1.70238)	Top-1 acc 32.031 (33.273)	Top-5 acc 52.344 (57.075)	lr 0.02482
Train [7][1370/3239]	Time 0.588 (0.844)	Data Time 0.001 (0.015)	Loss 3.8484 (3.8826)	Entropy 1.69100 (1.70229)	Top-1 acc 37.500 (33.282)	Top-5 acc 58.594 (57.085)	lr 0.02482
Train [7][1380/3239]	Time 0.586 (0.843)	Data Time 0.001 (0.015)	Loss 3.8259 (3.8825)	Entropy 1.69077 (1.70221)	Top-1 acc 34.766 (33.282)	Top-5 acc 57.422 (57.091)	lr 0.02482
Train [7][1390/3239]	Time 0.611 (0.843)	Data Time 0.001 (0.015)	Loss 4.0751 (3.8824)	Entropy 1.69072 (1.70213)	Top-1 acc 32.422 (33.295)	Top-5 acc 48.828 (57.093)	lr 0.02482
Train [7][1400/3239]	Time 0.545 (0.843)	Data Time 0.002 (0.015)	Loss 3.9573 (3.8825)	Entropy 1.69038 (1.70205)	Top-1 acc 27.734 (33.287)	Top-5 acc 57.422 (57.091)	lr 0.02482
Train [7][1410/3239]	Time 0.558 (0.843)	Data Time 0.001 (0.015)	Loss 3.9055 (3.8826)	Entropy 1.69008 (1.70196)	Top-1 acc 30.469 (33.283)	Top-5 acc 58.203 (57.089)	lr 0.02482
Train [7][1420/3239]	Time 0.585 (0.843)	Data Time 0.001 (0.015)	Loss 4.0746 (3.8829)	Entropy 1.68982 (1.70188)	Top-1 acc 31.250 (33.281)	Top-5 acc 52.734 (57.084)	lr 0.02482
Train [7][1430/3239]	Time 0.585 (0.842)	Data Time 0.001 (0.014)	Loss 3.9835 (3.8832)	Entropy 1.68952 (1.70179)	Top-1 acc 30.078 (33.274)	Top-5 acc 51.953 (57.070)	lr 0.02482
Train [7][1440/3239]	Time 0.571 (0.842)	Data Time 0.001 (0.014)	Loss 3.9246 (3.8833)	Entropy 1.68938 (1.70171)	Top-1 acc 29.688 (33.272)	Top-5 acc 56.250 (57.067)	lr 0.02482
Train [7][1450/3239]	Time 0.579 (0.842)	Data Time 0.001 (0.014)	Loss 3.7777 (3.8834)	Entropy 1.68893 (1.70162)	Top-1 acc 38.281 (33.274)	Top-5 acc 60.156 (57.070)	lr 0.02482
Train [7][1460/3239]	Time 0.627 (0.842)	Data Time 0.001 (0.014)	Loss 3.7615 (3.8838)	Entropy 1.68839 (1.70153)	Top-1 acc 36.719 (33.266)	Top-5 acc 57.812 (57.060)	lr 0.02482
Train [7][1470/3239]	Time 0.496 (0.841)	Data Time 0.001 (0.014)	Loss 4.0044 (3.8835)	Entropy 1.68840 (1.70145)	Top-1 acc 29.688 (33.266)	Top-5 acc 55.078 (57.068)	lr 0.02482
Train [7][1480/3239]	Time 0.520 (0.841)	Data Time 0.001 (0.014)	Loss 3.9525 (3.8836)	Entropy 1.68809 (1.70136)	Top-1 acc 31.250 (33.260)	Top-5 acc 54.688 (57.067)	lr 0.02482
Train [7][1490/3239]	Time 0.653 (0.854)	Data Time 0.005 (0.014)	Loss 3.8863 (3.8836)	Entropy 1.68784 (1.70127)	Top-1 acc 36.328 (33.265)	Top-5 acc 58.594 (57.064)	lr 0.02482
Train [7][1500/3239]	Time 0.524 (0.854)	Data Time 0.002 (0.014)	Loss 3.8096 (3.8835)	Entropy 1.68781 (1.70118)	Top-1 acc 31.641 (33.267)	Top-5 acc 58.594 (57.068)	lr 0.02482
Train [7][1510/3239]	Time 0.598 (0.853)	Data Time 0.003 (0.014)	Loss 3.8995 (3.8837)	Entropy 1.68779 (1.70109)	Top-1 acc 31.250 (33.260)	Top-5 acc 54.297 (57.060)	lr 0.02482
Train [7][1520/3239]	Time 0.632 (0.853)	Data Time 0.001 (0.014)	Loss 3.7614 (3.8837)	Entropy 1.68770 (1.70100)	Top-1 acc 37.891 (33.261)	Top-5 acc 62.891 (57.067)	lr 0.02482
Train [7][1530/3239]	Time 0.661 (0.853)	Data Time 0.002 (0.014)	Loss 3.7481 (3.8836)	Entropy 1.68762 (1.70091)	Top-1 acc 33.594 (33.263)	Top-5 acc 57.031 (57.066)	lr 0.02482
Train [7][1540/3239]	Time 0.551 (0.853)	Data Time 0.001 (0.014)	Loss 3.8572 (3.8835)	Entropy 1.68745 (1.70083)	Top-1 acc 33.984 (33.265)	Top-5 acc 58.594 (57.073)	lr 0.02482
Train [7][1550/3239]	Time 0.544 (0.853)	Data Time 0.001 (0.014)	Loss 3.6500 (3.8835)	Entropy 1.68741 (1.70074)	Top-1 acc 38.281 (33.268)	Top-5 acc 62.500 (57.077)	lr 0.02482
Train [7][1560/3239]	Time 0.565 (0.852)	Data Time 0.001 (0.013)	Loss 3.9136 (3.8837)	Entropy 1.68739 (1.70065)	Top-1 acc 30.859 (33.261)	Top-5 acc 56.250 (57.069)	lr 0.02482
Train [7][1570/3239]	Time 0.543 (0.852)	Data Time 0.002 (0.013)	Loss 4.0492 (3.8841)	Entropy 1.68733 (1.70057)	Top-1 acc 30.859 (33.257)	Top-5 acc 53.516 (57.061)	lr 0.02482
Train [7][1580/3239]	Time 0.620 (0.852)	Data Time 0.001 (0.013)	Loss 3.9775 (3.8841)	Entropy 1.68724 (1.70049)	Top-1 acc 32.422 (33.257)	Top-5 acc 54.297 (57.058)	lr 0.02482
Train [7][1590/3239]	Time 0.528 (0.852)	Data Time 0.001 (0.013)	Loss 3.6513 (3.8843)	Entropy 1.68707 (1.70040)	Top-1 acc 35.156 (33.250)	Top-5 acc 63.672 (57.047)	lr 0.02482
Train [7][1600/3239]	Time 0.553 (0.852)	Data Time 0.001 (0.013)	Loss 3.9972 (3.8846)	Entropy 1.68702 (1.70032)	Top-1 acc 31.250 (33.240)	Top-5 acc 57.422 (57.045)	lr 0.02482
Train [7][1610/3239]	Time 0.587 (0.852)	Data Time 0.001 (0.013)	Loss 3.8957 (3.8847)	Entropy 1.68698 (1.70024)	Top-1 acc 34.766 (33.239)	Top-5 acc 57.812 (57.043)	lr 0.02482
Train [7][1620/3239]	Time 0.527 (0.851)	Data Time 0.001 (0.013)	Loss 3.8955 (3.8846)	Entropy 1.68665 (1.70015)	Top-1 acc 34.375 (33.238)	Top-5 acc 58.984 (57.045)	lr 0.02482
Train [7][1630/3239]	Time 0.598 (0.851)	Data Time 0.001 (0.013)	Loss 3.9287 (3.8850)	Entropy 1.68661 (1.70007)	Top-1 acc 31.641 (33.235)	Top-5 acc 55.859 (57.032)	lr 0.02482
Train [7][1640/3239]	Time 0.528 (0.850)	Data Time 0.001 (0.013)	Loss 3.8405 (3.8851)	Entropy 1.68633 (1.69999)	Top-1 acc 34.766 (33.232)	Top-5 acc 56.641 (57.032)	lr 0.02482
Train [7][1650/3239]	Time 0.233 (0.850)	Data Time 0.001 (0.013)	Loss 3.7915 (3.8852)	Entropy 1.68614 (1.69990)	Top-1 acc 35.547 (33.237)	Top-5 acc 59.766 (57.036)	lr 0.02482
Train [7][1660/3239]	Time 0.564 (0.850)	Data Time 0.002 (0.013)	Loss 3.8573 (3.8851)	Entropy 1.68600 (1.69982)	Top-1 acc 33.594 (33.238)	Top-5 acc 57.031 (57.033)	lr 0.02482
Train [7][1670/3239]	Time 0.668 (0.850)	Data Time 0.001 (0.013)	Loss 3.8177 (3.8848)	Entropy 1.68579 (1.69974)	Top-1 acc 35.156 (33.244)	Top-5 acc 58.984 (57.037)	lr 0.02482
Train [7][1680/3239]	Time 0.552 (0.849)	Data Time 0.001 (0.013)	Loss 3.7235 (3.8845)	Entropy 1.68556 (1.69966)	Top-1 acc 35.938 (33.242)	Top-5 acc 60.938 (57.047)	lr 0.02482
Train [7][1690/3239]	Time 0.589 (0.849)	Data Time 0.001 (0.013)	Loss 3.8163 (3.8843)	Entropy 1.68554 (1.69957)	Top-1 acc 33.594 (33.250)	Top-5 acc 55.469 (57.046)	lr 0.02482
Train [7][1700/3239]	Time 0.573 (0.849)	Data Time 0.001 (0.013)	Loss 4.0480 (3.8846)	Entropy 1.68518 (1.69949)	Top-1 acc 33.984 (33.247)	Top-5 acc 52.344 (57.038)	lr 0.02482
Train [7][1710/3239]	Time 0.539 (0.849)	Data Time 0.001 (0.013)	Loss 4.0460 (3.8842)	Entropy 1.68510 (1.69941)	Top-1 acc 30.469 (33.261)	Top-5 acc 54.297 (57.046)	lr 0.02482
Train [7][1720/3239]	Time 0.607 (0.849)	Data Time 0.001 (0.013)	Loss 3.9576 (3.8839)	Entropy 1.68491 (1.69932)	Top-1 acc 30.469 (33.268)	Top-5 acc 55.078 (57.054)	lr 0.02482
Train [7][1730/3239]	Time 0.560 (0.849)	Data Time 0.001 (0.012)	Loss 3.9712 (3.8838)	Entropy 1.68475 (1.69924)	Top-1 acc 32.812 (33.274)	Top-5 acc 56.641 (57.050)	lr 0.02482
Train [7][1740/3239]	Time 0.692 (0.849)	Data Time 0.001 (0.012)	Loss 3.9503 (3.8841)	Entropy 1.68450 (1.69915)	Top-1 acc 30.859 (33.272)	Top-5 acc 58.594 (57.044)	lr 0.02482
Train [7][1750/3239]	Time 0.519 (0.848)	Data Time 0.001 (0.012)	Loss 3.8157 (3.8842)	Entropy 1.68425 (1.69907)	Top-1 acc 36.719 (33.273)	Top-5 acc 58.984 (57.044)	lr 0.02482
Train [7][1760/3239]	Time 0.568 (0.848)	Data Time 0.001 (0.012)	Loss 3.8530 (3.8841)	Entropy 1.68391 (1.69899)	Top-1 acc 30.469 (33.261)	Top-5 acc 57.422 (57.042)	lr 0.02482
Train [7][1770/3239]	Time 0.565 (0.848)	Data Time 0.001 (0.012)	Loss 3.8871 (3.8844)	Entropy 1.68388 (1.69890)	Top-1 acc 33.203 (33.252)	Top-5 acc 60.547 (57.038)	lr 0.02482
Train [7][1780/3239]	Time 0.557 (0.848)	Data Time 0.001 (0.012)	Loss 3.8700 (3.8848)	Entropy 1.68358 (1.69881)	Top-1 acc 36.328 (33.248)	Top-5 acc 58.594 (57.034)	lr 0.02482
Train [7][1790/3239]	Time 0.641 (0.848)	Data Time 0.002 (0.012)	Loss 3.9329 (3.8849)	Entropy 1.68346 (1.69873)	Top-1 acc 33.984 (33.244)	Top-5 acc 55.469 (57.035)	lr 0.02482
Train [7][1800/3239]	Time 0.595 (0.848)	Data Time 0.001 (0.012)	Loss 4.0438 (3.8848)	Entropy 1.68336 (1.69864)	Top-1 acc 32.422 (33.244)	Top-5 acc 53.125 (57.039)	lr 0.02482
Train [7][1810/3239]	Time 0.569 (0.847)	Data Time 0.001 (0.012)	Loss 3.9221 (3.8848)	Entropy 1.68328 (1.69856)	Top-1 acc 34.375 (33.240)	Top-5 acc 55.078 (57.033)	lr 0.02482
Train [7][1820/3239]	Time 0.495 (0.847)	Data Time 0.001 (0.012)	Loss 3.8750 (3.8849)	Entropy 1.68321 (1.69848)	Top-1 acc 32.422 (33.239)	Top-5 acc 56.641 (57.034)	lr 0.02482
Train [7][1830/3239]	Time 0.516 (0.846)	Data Time 0.001 (0.012)	Loss 3.8101 (3.8849)	Entropy 1.68302 (1.69839)	Top-1 acc 35.156 (33.235)	Top-5 acc 57.422 (57.035)	lr 0.02482
Train [7][1840/3239]	Time 0.541 (0.846)	Data Time 0.001 (0.012)	Loss 4.0862 (3.8851)	Entropy 1.68274 (1.69831)	Top-1 acc 31.641 (33.235)	Top-5 acc 53.125 (57.028)	lr 0.02482
Train [7][1850/3239]	Time 0.584 (0.846)	Data Time 0.001 (0.012)	Loss 3.7950 (3.8853)	Entropy 1.68240 (1.69822)	Top-1 acc 35.156 (33.230)	Top-5 acc 58.984 (57.021)	lr 0.02482
Train [7][1860/3239]	Time 0.695 (0.846)	Data Time 0.002 (0.012)	Loss 3.7488 (3.8850)	Entropy 1.68208 (1.69814)	Top-1 acc 35.938 (33.233)	Top-5 acc 61.328 (57.025)	lr 0.02482
Train [7][1870/3239]	Time 0.552 (0.846)	Data Time 0.001 (0.012)	Loss 3.9112 (3.8853)	Entropy 1.68202 (1.69805)	Top-1 acc 34.766 (33.233)	Top-5 acc 54.688 (57.018)	lr 0.02482
Train [7][1880/3239]	Time 0.485 (0.845)	Data Time 0.001 (0.012)	Loss 3.9335 (3.8855)	Entropy 1.68196 (1.69797)	Top-1 acc 28.125 (33.227)	Top-5 acc 56.250 (57.011)	lr 0.02481
Train [7][1890/3239]	Time 0.551 (0.845)	Data Time 0.001 (0.012)	Loss 4.1551 (3.8855)	Entropy 1.68189 (1.69788)	Top-1 acc 26.562 (33.226)	Top-5 acc 49.219 (57.012)	lr 0.02481
Train [7][1900/3239]	Time 0.582 (0.845)	Data Time 0.001 (0.012)	Loss 3.9136 (3.8855)	Entropy 1.68168 (1.69780)	Top-1 acc 34.766 (33.232)	Top-5 acc 56.250 (57.017)	lr 0.02481
Train [7][1910/3239]	Time 0.529 (0.845)	Data Time 0.001 (0.011)	Loss 3.9547 (3.8855)	Entropy 1.68151 (1.69771)	Top-1 acc 32.812 (33.236)	Top-5 acc 56.250 (57.018)	lr 0.02481
Train [7][1920/3239]	Time 0.513 (0.845)	Data Time 0.001 (0.011)	Loss 3.8501 (3.8856)	Entropy 1.68134 (1.69763)	Top-1 acc 32.031 (33.231)	Top-5 acc 57.031 (57.013)	lr 0.02481
Train [7][1930/3239]	Time 0.615 (0.845)	Data Time 0.001 (0.011)	Loss 3.8133 (3.8853)	Entropy 1.68145 (1.69755)	Top-1 acc 34.375 (33.240)	Top-5 acc 62.109 (57.020)	lr 0.02481
Train [7][1940/3239]	Time 0.549 (0.844)	Data Time 0.001 (0.011)	Loss 4.1573 (3.8854)	Entropy 1.68125 (1.69746)	Top-1 acc 26.562 (33.236)	Top-5 acc 50.781 (57.014)	lr 0.02481
Train [7][1950/3239]	Time 0.456 (0.844)	Data Time 0.001 (0.011)	Loss 3.7599 (3.8856)	Entropy 1.68103 (1.69738)	Top-1 acc 36.328 (33.228)	Top-5 acc 62.891 (57.012)	lr 0.02481
Train [7][1960/3239]	Time 0.533 (0.844)	Data Time 0.001 (0.011)	Loss 3.8587 (3.8856)	Entropy 1.68077 (1.69729)	Top-1 acc 33.984 (33.224)	Top-5 acc 57.812 (57.009)	lr 0.02481
Train [7][1970/3239]	Time 0.303 (0.844)	Data Time 0.001 (0.011)	Loss 3.8263 (3.8857)	Entropy 1.68067 (1.69721)	Top-1 acc 32.422 (33.223)	Top-5 acc 61.328 (57.008)	lr 0.02481
Train [7][1980/3239]	Time 0.646 (0.843)	Data Time 0.001 (0.011)	Loss 3.7878 (3.8859)	Entropy 1.68051 (1.69713)	Top-1 acc 30.859 (33.218)	Top-5 acc 57.422 (57.001)	lr 0.02481
Train [7][1990/3239]	Time 0.595 (0.843)	Data Time 0.001 (0.011)	Loss 3.6540 (3.8860)	Entropy 1.68039 (1.69704)	Top-1 acc 33.203 (33.208)	Top-5 acc 60.156 (57.000)	lr 0.02481
Train [7][2000/3239]	Time 0.555 (0.843)	Data Time 0.001 (0.011)	Loss 3.7816 (3.8856)	Entropy 1.68021 (1.69696)	Top-1 acc 32.422 (33.206)	Top-5 acc 57.031 (57.011)	lr 0.02481
Train [7][2010/3239]	Time 0.590 (0.843)	Data Time 0.001 (0.011)	Loss 3.8233 (3.8857)	Entropy 1.67997 (1.69688)	Top-1 acc 31.641 (33.198)	Top-5 acc 55.469 (57.003)	lr 0.02481
Train [7][2020/3239]	Time 0.597 (0.843)	Data Time 0.001 (0.011)	Loss 3.9010 (3.8859)	Entropy 1.67994 (1.69679)	Top-1 acc 31.250 (33.192)	Top-5 acc 56.250 (56.997)	lr 0.02481
Train [7][2030/3239]	Time 0.570 (0.842)	Data Time 0.001 (0.011)	Loss 3.8494 (3.8862)	Entropy 1.67967 (1.69671)	Top-1 acc 35.547 (33.187)	Top-5 acc 57.812 (56.992)	lr 0.02481
Train [7][2040/3239]	Time 0.618 (0.842)	Data Time 0.002 (0.011)	Loss 3.7260 (3.8860)	Entropy 1.67945 (1.69663)	Top-1 acc 37.891 (33.192)	Top-5 acc 61.328 (56.994)	lr 0.02481
Train [7][2050/3239]	Time 0.644 (0.842)	Data Time 0.001 (0.011)	Loss 3.7887 (3.8859)	Entropy 1.67934 (1.69654)	Top-1 acc 36.328 (33.197)	Top-5 acc 57.031 (56.999)	lr 0.02481
Train [7][2060/3239]	Time 0.580 (0.842)	Data Time 0.001 (0.011)	Loss 3.9682 (3.8860)	Entropy 1.67910 (1.69646)	Top-1 acc 32.031 (33.195)	Top-5 acc 51.953 (56.996)	lr 0.02481
Train [7][2070/3239]	Time 0.551 (0.842)	Data Time 0.001 (0.011)	Loss 3.8857 (3.8860)	Entropy 1.67900 (1.69637)	Top-1 acc 30.078 (33.196)	Top-5 acc 57.812 (57.002)	lr 0.02481
Train [7][2080/3239]	Time 0.612 (0.842)	Data Time 0.002 (0.011)	Loss 3.7909 (3.8860)	Entropy 1.67881 (1.69629)	Top-1 acc 39.453 (33.197)	Top-5 acc 58.594 (57.004)	lr 0.02481
Train [7][2090/3239]	Time 0.518 (0.842)	Data Time 0.001 (0.011)	Loss 3.8426 (3.8860)	Entropy 1.67856 (1.69621)	Top-1 acc 31.641 (33.196)	Top-5 acc 61.719 (57.006)	lr 0.02481
Train [7][2100/3239]	Time 0.570 (0.842)	Data Time 0.001 (0.011)	Loss 4.1519 (3.8861)	Entropy 1.67840 (1.69612)	Top-1 acc 30.859 (33.199)	Top-5 acc 48.828 (57.005)	lr 0.02481
Train [7][2110/3239]	Time 0.629 (0.842)	Data Time 0.001 (0.011)	Loss 3.9487 (3.8862)	Entropy 1.67805 (1.69604)	Top-1 acc 31.641 (33.199)	Top-5 acc 52.734 (57.002)	lr 0.02481
Train [7][2120/3239]	Time 0.586 (0.842)	Data Time 0.001 (0.011)	Loss 3.7337 (3.8858)	Entropy 1.67786 (1.69595)	Top-1 acc 37.500 (33.209)	Top-5 acc 62.500 (57.016)	lr 0.02481
Train [7][2130/3239]	Time 0.629 (0.841)	Data Time 0.001 (0.011)	Loss 3.9020 (3.8856)	Entropy 1.67773 (1.69587)	Top-1 acc 33.984 (33.212)	Top-5 acc 54.297 (57.019)	lr 0.02481
Train [7][2140/3239]	Time 0.584 (0.841)	Data Time 0.001 (0.011)	Loss 3.9908 (3.8854)	Entropy 1.67748 (1.69578)	Top-1 acc 32.812 (33.217)	Top-5 acc 53.516 (57.022)	lr 0.02481
Train [7][2150/3239]	Time 0.516 (0.850)	Data Time 0.002 (0.011)	Loss 3.7494 (3.8854)	Entropy 1.67738 (1.69570)	Top-1 acc 34.375 (33.220)	Top-5 acc 61.719 (57.019)	lr 0.02481
Train [7][2160/3239]	Time 0.642 (0.850)	Data Time 0.002 (0.011)	Loss 3.9976 (3.8855)	Entropy 1.67731 (1.69561)	Top-1 acc 35.547 (33.216)	Top-5 acc 57.812 (57.022)	lr 0.02481
Train [7][2170/3239]	Time 0.598 (0.850)	Data Time 0.002 (0.010)	Loss 3.7937 (3.8856)	Entropy 1.67729 (1.69553)	Top-1 acc 37.109 (33.211)	Top-5 acc 60.547 (57.020)	lr 0.02481
Train [7][2180/3239]	Time 0.601 (0.850)	Data Time 0.002 (0.010)	Loss 3.7405 (3.8853)	Entropy 1.67732 (1.69544)	Top-1 acc 34.766 (33.209)	Top-5 acc 62.891 (57.024)	lr 0.02481
Train [7][2190/3239]	Time 0.623 (0.850)	Data Time 0.002 (0.010)	Loss 3.7957 (3.8852)	Entropy 1.67680 (1.69536)	Top-1 acc 37.109 (33.219)	Top-5 acc 57.422 (57.023)	lr 0.02481
Train [7][2200/3239]	Time 0.536 (0.850)	Data Time 0.001 (0.010)	Loss 3.8911 (3.8850)	Entropy 1.67693 (1.69528)	Top-1 acc 33.594 (33.222)	Top-5 acc 56.641 (57.023)	lr 0.02481
Train [7][2210/3239]	Time 0.586 (0.850)	Data Time 0.001 (0.010)	Loss 4.0213 (3.8851)	Entropy 1.67668 (1.69519)	Top-1 acc 30.078 (33.224)	Top-5 acc 52.344 (57.019)	lr 0.02481
Train [7][2220/3239]	Time 0.571 (0.850)	Data Time 0.001 (0.010)	Loss 3.7819 (3.8849)	Entropy 1.67652 (1.69511)	Top-1 acc 33.984 (33.232)	Top-5 acc 56.641 (57.025)	lr 0.02481
Train [7][2230/3239]	Time 0.541 (0.850)	Data Time 0.001 (0.010)	Loss 3.8190 (3.8849)	Entropy 1.67628 (1.69503)	Top-1 acc 34.375 (33.232)	Top-5 acc 59.766 (57.029)	lr 0.02481
Train [7][2240/3239]	Time 0.677 (0.849)	Data Time 0.003 (0.010)	Loss 3.8389 (3.8846)	Entropy 1.67620 (1.69494)	Top-1 acc 32.422 (33.235)	Top-5 acc 60.938 (57.035)	lr 0.02481
Train [7][2250/3239]	Time 0.614 (0.849)	Data Time 0.001 (0.010)	Loss 3.8056 (3.8845)	Entropy 1.67603 (1.69486)	Top-1 acc 33.984 (33.233)	Top-5 acc 58.984 (57.034)	lr 0.02481
Train [7][2260/3239]	Time 0.571 (0.849)	Data Time 0.002 (0.010)	Loss 3.8022 (3.8846)	Entropy 1.67598 (1.69477)	Top-1 acc 35.547 (33.229)	Top-5 acc 58.984 (57.038)	lr 0.02481
Train [7][2270/3239]	Time 0.578 (0.849)	Data Time 0.001 (0.010)	Loss 3.8783 (3.8844)	Entropy 1.67573 (1.69469)	Top-1 acc 30.859 (33.230)	Top-5 acc 57.812 (57.041)	lr 0.02481
Train [7][2280/3239]	Time 0.510 (0.849)	Data Time 0.001 (0.010)	Loss 3.8612 (3.8843)	Entropy 1.67574 (1.69461)	Top-1 acc 35.547 (33.233)	Top-5 acc 58.594 (57.050)	lr 0.02481
Train [7][2290/3239]	Time 0.195 (0.849)	Data Time 0.001 (0.010)	Loss 3.8931 (3.8844)	Entropy 1.67567 (1.69453)	Top-1 acc 33.984 (33.229)	Top-5 acc 60.156 (57.046)	lr 0.02481
Train [7][2300/3239]	Time 0.604 (0.849)	Data Time 0.001 (0.010)	Loss 3.7411 (3.8846)	Entropy 1.67554 (1.69444)	Top-1 acc 33.984 (33.223)	Top-5 acc 60.547 (57.043)	lr 0.02481
Train [7][2310/3239]	Time 0.600 (0.848)	Data Time 0.003 (0.010)	Loss 3.9355 (3.8849)	Entropy 1.67541 (1.69436)	Top-1 acc 33.984 (33.216)	Top-5 acc 58.203 (57.035)	lr 0.02481
Train [7][2320/3239]	Time 0.535 (0.848)	Data Time 0.001 (0.010)	Loss 3.7457 (3.8849)	Entropy 1.67515 (1.69428)	Top-1 acc 35.156 (33.220)	Top-5 acc 60.938 (57.033)	lr 0.02481
Train [7][2330/3239]	Time 0.490 (0.848)	Data Time 0.001 (0.010)	Loss 3.8875 (3.8848)	Entropy 1.67487 (1.69420)	Top-1 acc 33.594 (33.224)	Top-5 acc 59.375 (57.036)	lr 0.02481
Train [7][2340/3239]	Time 0.569 (0.848)	Data Time 0.001 (0.010)	Loss 3.7781 (3.8849)	Entropy 1.67487 (1.69411)	Top-1 acc 35.156 (33.219)	Top-5 acc 60.156 (57.034)	lr 0.02481
Train [7][2350/3239]	Time 0.564 (0.848)	Data Time 0.001 (0.010)	Loss 3.9174 (3.8850)	Entropy 1.67495 (1.69403)	Top-1 acc 32.422 (33.216)	Top-5 acc 58.984 (57.033)	lr 0.02481
Train [7][2360/3239]	Time 0.563 (0.848)	Data Time 0.001 (0.010)	Loss 3.9273 (3.8848)	Entropy 1.67497 (1.69395)	Top-1 acc 34.766 (33.217)	Top-5 acc 55.469 (57.039)	lr 0.02481
Train [7][2370/3239]	Time 0.568 (0.848)	Data Time 0.001 (0.010)	Loss 3.8818 (3.8850)	Entropy 1.67484 (1.69387)	Top-1 acc 32.422 (33.216)	Top-5 acc 56.641 (57.032)	lr 0.02481
Train [7][2380/3239]	Time 0.530 (0.848)	Data Time 0.001 (0.010)	Loss 3.7439 (3.8849)	Entropy 1.67441 (1.69379)	Top-1 acc 32.812 (33.212)	Top-5 acc 62.109 (57.035)	lr 0.02481
Train [7][2390/3239]	Time 0.576 (0.848)	Data Time 0.001 (0.010)	Loss 3.8618 (3.8851)	Entropy 1.67437 (1.69371)	Top-1 acc 35.156 (33.206)	Top-5 acc 55.859 (57.034)	lr 0.02481
Train [7][2400/3239]	Time 0.605 (0.847)	Data Time 0.001 (0.010)	Loss 3.8416 (3.8851)	Entropy 1.67424 (1.69363)	Top-1 acc 30.078 (33.199)	Top-5 acc 55.469 (57.032)	lr 0.02481
Train [7][2410/3239]	Time 0.607 (0.847)	Data Time 0.001 (0.010)	Loss 3.8779 (3.8852)	Entropy 1.67424 (1.69355)	Top-1 acc 33.594 (33.197)	Top-5 acc 55.469 (57.027)	lr 0.02481
Train [7][2420/3239]	Time 0.407 (0.847)	Data Time 0.001 (0.010)	Loss 3.8791 (3.8852)	Entropy 1.67408 (1.69347)	Top-1 acc 32.031 (33.196)	Top-5 acc 58.203 (57.027)	lr 0.02481
Train [7][2430/3239]	Time 0.562 (0.847)	Data Time 0.001 (0.010)	Loss 3.9838 (3.8852)	Entropy 1.67368 (1.69339)	Top-1 acc 30.859 (33.193)	Top-5 acc 55.078 (57.032)	lr 0.02481
Train [7][2440/3239]	Time 0.543 (0.847)	Data Time 0.001 (0.010)	Loss 3.4926 (3.8849)	Entropy 1.67349 (1.69331)	Top-1 acc 42.188 (33.194)	Top-5 acc 67.969 (57.036)	lr 0.02481
Train [7][2450/3239]	Time 0.582 (0.847)	Data Time 0.001 (0.010)	Loss 4.0581 (3.8851)	Entropy 1.67331 (1.69323)	Top-1 acc 30.078 (33.190)	Top-5 acc 53.516 (57.032)	lr 0.02480
Train [7][2460/3239]	Time 0.621 (0.847)	Data Time 0.001 (0.010)	Loss 3.8457 (3.8850)	Entropy 1.67324 (1.69315)	Top-1 acc 35.547 (33.190)	Top-5 acc 57.812 (57.036)	lr 0.02480
Train [7][2470/3239]	Time 0.577 (0.847)	Data Time 0.001 (0.010)	Loss 3.8075 (3.8847)	Entropy 1.67291 (1.69307)	Top-1 acc 37.500 (33.199)	Top-5 acc 60.938 (57.044)	lr 0.02480
Train [7][2480/3239]	Time 0.619 (0.846)	Data Time 0.002 (0.010)	Loss 3.7448 (3.8845)	Entropy 1.67265 (1.69298)	Top-1 acc 38.281 (33.204)	Top-5 acc 59.766 (57.045)	lr 0.02480
Train [7][2490/3239]	Time 0.568 (0.846)	Data Time 0.003 (0.010)	Loss 3.6884 (3.8844)	Entropy 1.67249 (1.69290)	Top-1 acc 39.062 (33.207)	Top-5 acc 58.203 (57.047)	lr 0.02480
Train [7][2500/3239]	Time 0.598 (0.846)	Data Time 0.001 (0.010)	Loss 3.7875 (3.8842)	Entropy 1.67241 (1.69282)	Top-1 acc 34.766 (33.215)	Top-5 acc 60.938 (57.049)	lr 0.02480
Train [7][2510/3239]	Time 0.544 (0.846)	Data Time 0.001 (0.009)	Loss 3.8140 (3.8843)	Entropy 1.67237 (1.69274)	Top-1 acc 33.984 (33.214)	Top-5 acc 58.984 (57.047)	lr 0.02480
Train [7][2520/3239]	Time 0.582 (0.846)	Data Time 0.002 (0.009)	Loss 3.8621 (3.8841)	Entropy 1.67211 (1.69266)	Top-1 acc 30.078 (33.215)	Top-5 acc 55.469 (57.053)	lr 0.02480
Train [7][2530/3239]	Time 0.729 (0.846)	Data Time 0.001 (0.009)	Loss 3.9674 (3.8842)	Entropy 1.67188 (1.69258)	Top-1 acc 28.906 (33.213)	Top-5 acc 54.297 (57.049)	lr 0.02480
Train [7][2540/3239]	Time 0.421 (0.846)	Data Time 0.002 (0.009)	Loss 3.7690 (3.8838)	Entropy 1.67159 (1.69249)	Top-1 acc 34.766 (33.223)	Top-5 acc 56.250 (57.060)	lr 0.02480
Train [7][2550/3239]	Time 0.376 (0.846)	Data Time 0.001 (0.009)	Loss 4.0580 (3.8839)	Entropy 1.67141 (1.69241)	Top-1 acc 31.641 (33.217)	Top-5 acc 51.953 (57.053)	lr 0.02480
Train [7][2560/3239]	Time 0.571 (0.846)	Data Time 0.001 (0.009)	Loss 3.8092 (3.8838)	Entropy 1.67142 (1.69233)	Top-1 acc 32.422 (33.217)	Top-5 acc 59.375 (57.056)	lr 0.02480
Train [7][2570/3239]	Time 0.533 (0.846)	Data Time 0.001 (0.009)	Loss 3.7099 (3.8836)	Entropy 1.67135 (1.69225)	Top-1 acc 33.984 (33.223)	Top-5 acc 60.156 (57.061)	lr 0.02480
Train [7][2580/3239]	Time 0.572 (0.846)	Data Time 0.001 (0.009)	Loss 3.8143 (3.8836)	Entropy 1.67117 (1.69217)	Top-1 acc 32.031 (33.221)	Top-5 acc 57.422 (57.059)	lr 0.02480
Train [7][2590/3239]	Time 0.545 (0.845)	Data Time 0.002 (0.009)	Loss 3.9270 (3.8834)	Entropy 1.67123 (1.69209)	Top-1 acc 34.375 (33.228)	Top-5 acc 57.031 (57.065)	lr 0.02480
Train [7][2600/3239]	Time 0.586 (0.845)	Data Time 0.001 (0.009)	Loss 3.7820 (3.8833)	Entropy 1.67092 (1.69201)	Top-1 acc 36.719 (33.233)	Top-5 acc 62.109 (57.065)	lr 0.02480
Train [7][2610/3239]	Time 0.616 (0.845)	Data Time 0.002 (0.009)	Loss 3.7281 (3.8832)	Entropy 1.67082 (1.69193)	Top-1 acc 35.156 (33.236)	Top-5 acc 62.891 (57.070)	lr 0.02480
Train [7][2620/3239]	Time 0.502 (0.845)	Data Time 0.001 (0.009)	Loss 3.6378 (3.8830)	Entropy 1.67060 (1.69184)	Top-1 acc 39.062 (33.239)	Top-5 acc 62.500 (57.077)	lr 0.02480
Train [7][2630/3239]	Time 0.539 (0.845)	Data Time 0.001 (0.009)	Loss 4.0842 (3.8828)	Entropy 1.67035 (1.69176)	Top-1 acc 28.516 (33.239)	Top-5 acc 51.953 (57.084)	lr 0.02480
Train [7][2640/3239]	Time 0.466 (0.845)	Data Time 0.001 (0.009)	Loss 3.7456 (3.8826)	Entropy 1.67031 (1.69168)	Top-1 acc 32.031 (33.240)	Top-5 acc 61.328 (57.090)	lr 0.02480
Train [7][2650/3239]	Time 0.548 (0.844)	Data Time 0.001 (0.009)	Loss 4.0013 (3.8828)	Entropy 1.66999 (1.69160)	Top-1 acc 29.297 (33.238)	Top-5 acc 51.953 (57.086)	lr 0.02480
Train [7][2660/3239]	Time 0.578 (0.844)	Data Time 0.001 (0.009)	Loss 3.9310 (3.8827)	Entropy 1.66979 (1.69152)	Top-1 acc 28.906 (33.240)	Top-5 acc 53.906 (57.089)	lr 0.02480
Train [7][2670/3239]	Time 0.542 (0.844)	Data Time 0.001 (0.009)	Loss 3.8063 (3.8823)	Entropy 1.66956 (1.69144)	Top-1 acc 35.156 (33.249)	Top-5 acc 57.031 (57.097)	lr 0.02480
Train [7][2680/3239]	Time 0.546 (0.844)	Data Time 0.001 (0.009)	Loss 3.6573 (3.8821)	Entropy 1.66967 (1.69136)	Top-1 acc 37.500 (33.253)	Top-5 acc 62.109 (57.099)	lr 0.02480
Train [7][2690/3239]	Time 0.623 (0.844)	Data Time 0.001 (0.009)	Loss 3.8896 (3.8821)	Entropy 1.66958 (1.69128)	Top-1 acc 33.203 (33.250)	Top-5 acc 53.516 (57.096)	lr 0.02480
Train [7][2700/3239]	Time 0.612 (0.844)	Data Time 0.001 (0.009)	Loss 3.8889 (3.8822)	Entropy 1.66927 (1.69119)	Top-1 acc 32.031 (33.246)	Top-5 acc 57.812 (57.093)	lr 0.02480
Train [7][2710/3239]	Time 0.518 (0.844)	Data Time 0.001 (0.009)	Loss 3.8491 (3.8822)	Entropy 1.66914 (1.69111)	Top-1 acc 32.031 (33.246)	Top-5 acc 56.250 (57.092)	lr 0.02480
Train [7][2720/3239]	Time 0.577 (0.844)	Data Time 0.001 (0.009)	Loss 3.7640 (3.8823)	Entropy 1.66880 (1.69103)	Top-1 acc 36.719 (33.244)	Top-5 acc 59.766 (57.089)	lr 0.02480
Train [7][2730/3239]	Time 0.540 (0.844)	Data Time 0.001 (0.009)	Loss 3.9514 (3.8824)	Entropy 1.66880 (1.69095)	Top-1 acc 29.297 (33.241)	Top-5 acc 55.078 (57.087)	lr 0.02480
Train [7][2740/3239]	Time 0.587 (0.844)	Data Time 0.001 (0.009)	Loss 3.7655 (3.8822)	Entropy 1.66883 (1.69087)	Top-1 acc 35.547 (33.243)	Top-5 acc 60.547 (57.092)	lr 0.02480
Train [7][2750/3239]	Time 0.578 (0.844)	Data Time 0.001 (0.009)	Loss 3.7479 (3.8822)	Entropy 1.66873 (1.69079)	Top-1 acc 33.984 (33.242)	Top-5 acc 59.766 (57.092)	lr 0.02480
Train [7][2760/3239]	Time 0.542 (0.844)	Data Time 0.001 (0.009)	Loss 4.0801 (3.8824)	Entropy 1.66829 (1.69071)	Top-1 acc 33.203 (33.243)	Top-5 acc 54.297 (57.087)	lr 0.02480
Train [7][2770/3239]	Time 0.660 (0.844)	Data Time 0.001 (0.009)	Loss 3.8250 (3.8825)	Entropy 1.66813 (1.69063)	Top-1 acc 34.766 (33.241)	Top-5 acc 57.812 (57.084)	lr 0.02480
Train [7][2780/3239]	Time 0.573 (0.843)	Data Time 0.001 (0.009)	Loss 3.8175 (3.8824)	Entropy 1.66801 (1.69055)	Top-1 acc 32.812 (33.243)	Top-5 acc 56.641 (57.086)	lr 0.02480
Train [7][2790/3239]	Time 0.589 (0.843)	Data Time 0.001 (0.009)	Loss 4.1854 (3.8826)	Entropy 1.66793 (1.69047)	Top-1 acc 26.953 (33.240)	Top-5 acc 48.828 (57.081)	lr 0.02480
Train [7][2800/3239]	Time 0.696 (0.850)	Data Time 0.005 (0.009)	Loss 3.8515 (3.8824)	Entropy 1.66789 (1.69039)	Top-1 acc 32.812 (33.248)	Top-5 acc 56.250 (57.085)	lr 0.02480
Train [7][2810/3239]	Time 0.569 (0.850)	Data Time 0.002 (0.009)	Loss 3.8998 (3.8822)	Entropy 1.66788 (1.69031)	Top-1 acc 32.812 (33.249)	Top-5 acc 56.641 (57.090)	lr 0.02480
Train [7][2820/3239]	Time 0.530 (0.850)	Data Time 0.002 (0.009)	Loss 3.8683 (3.8823)	Entropy 1.66743 (1.69023)	Top-1 acc 35.938 (33.247)	Top-5 acc 56.250 (57.084)	lr 0.02480
Train [7][2830/3239]	Time 0.559 (0.850)	Data Time 0.002 (0.009)	Loss 3.9014 (3.8825)	Entropy 1.66726 (1.69015)	Top-1 acc 30.469 (33.242)	Top-5 acc 52.344 (57.081)	lr 0.02480
Train [7][2840/3239]	Time 0.639 (0.849)	Data Time 0.001 (0.009)	Loss 3.8881 (3.8822)	Entropy 1.66686 (1.69006)	Top-1 acc 33.984 (33.244)	Top-5 acc 55.078 (57.081)	lr 0.02480
Train [7][2850/3239]	Time 0.576 (0.849)	Data Time 0.001 (0.009)	Loss 3.9401 (3.8823)	Entropy 1.66655 (1.68998)	Top-1 acc 32.812 (33.248)	Top-5 acc 58.594 (57.084)	lr 0.02480
Train [7][2860/3239]	Time 0.597 (0.849)	Data Time 0.002 (0.009)	Loss 3.7909 (3.8823)	Entropy 1.66672 (1.68990)	Top-1 acc 34.375 (33.247)	Top-5 acc 56.641 (57.082)	lr 0.02480
Train [7][2870/3239]	Time 0.576 (0.849)	Data Time 0.001 (0.009)	Loss 3.6194 (3.8822)	Entropy 1.66663 (1.68982)	Top-1 acc 36.719 (33.251)	Top-5 acc 65.234 (57.087)	lr 0.02480
Train [7][2880/3239]	Time 0.551 (0.849)	Data Time 0.001 (0.009)	Loss 3.9802 (3.8822)	Entropy 1.66654 (1.68974)	Top-1 acc 34.766 (33.253)	Top-5 acc 53.906 (57.088)	lr 0.02480
Train [7][2890/3239]	Time 0.572 (0.849)	Data Time 0.001 (0.009)	Loss 3.8761 (3.8824)	Entropy 1.66642 (1.68966)	Top-1 acc 35.156 (33.252)	Top-5 acc 57.812 (57.084)	lr 0.02480
Train [7][2900/3239]	Time 0.577 (0.849)	Data Time 0.001 (0.009)	Loss 3.8489 (3.8823)	Entropy 1.66651 (1.68958)	Top-1 acc 35.547 (33.254)	Top-5 acc 59.375 (57.084)	lr 0.02480
Train [7][2910/3239]	Time 0.647 (0.849)	Data Time 0.001 (0.009)	Loss 3.7859 (3.8822)	Entropy 1.66647 (1.68950)	Top-1 acc 33.203 (33.253)	Top-5 acc 60.156 (57.088)	lr 0.02480
Train [7][2920/3239]	Time 0.560 (0.849)	Data Time 0.001 (0.009)	Loss 3.9253 (3.8825)	Entropy 1.66615 (1.68942)	Top-1 acc 31.250 (33.247)	Top-5 acc 58.203 (57.082)	lr 0.02480
Train [7][2930/3239]	Time 0.545 (0.849)	Data Time 0.001 (0.009)	Loss 3.8702 (3.8827)	Entropy 1.66607 (1.68934)	Top-1 acc 35.156 (33.243)	Top-5 acc 55.859 (57.074)	lr 0.02480
Train [7][2940/3239]	Time 0.521 (0.849)	Data Time 0.001 (0.009)	Loss 4.0017 (3.8826)	Entropy 1.66587 (1.68926)	Top-1 acc 29.688 (33.245)	Top-5 acc 51.562 (57.073)	lr 0.02480
Train [7][2950/3239]	Time 0.506 (0.848)	Data Time 0.001 (0.009)	Loss 3.7233 (3.8825)	Entropy 1.66562 (1.68918)	Top-1 acc 35.156 (33.249)	Top-5 acc 60.156 (57.076)	lr 0.02480
Train [7][2960/3239]	Time 0.679 (0.848)	Data Time 0.001 (0.009)	Loss 3.9158 (3.8824)	Entropy 1.66520 (1.68910)	Top-1 acc 35.547 (33.246)	Top-5 acc 57.031 (57.076)	lr 0.02480
Train [7][2970/3239]	Time 0.523 (0.848)	Data Time 0.001 (0.009)	Loss 3.9342 (3.8823)	Entropy 1.66517 (1.68902)	Top-1 acc 32.031 (33.244)	Top-5 acc 56.641 (57.081)	lr 0.02480
Train [7][2980/3239]	Time 0.531 (0.848)	Data Time 0.001 (0.008)	Loss 3.9161 (3.8824)	Entropy 1.66495 (1.68894)	Top-1 acc 36.719 (33.243)	Top-5 acc 58.203 (57.082)	lr 0.02480
Train [7][2990/3239]	Time 0.557 (0.848)	Data Time 0.001 (0.008)	Loss 3.8836 (3.8821)	Entropy 1.66481 (1.68886)	Top-1 acc 29.297 (33.248)	Top-5 acc 55.078 (57.092)	lr 0.02480
Train [7][3000/3239]	Time 0.573 (0.848)	Data Time 0.001 (0.008)	Loss 3.7391 (3.8819)	Entropy 1.66468 (1.68878)	Top-1 acc 33.203 (33.246)	Top-5 acc 59.375 (57.095)	lr 0.02480
Train [7][3010/3239]	Time 0.572 (0.848)	Data Time 0.001 (0.008)	Loss 3.9311 (3.8818)	Entropy 1.66441 (1.68870)	Top-1 acc 30.859 (33.245)	Top-5 acc 56.250 (57.098)	lr 0.02479
Train [7][3020/3239]	Time 0.563 (0.848)	Data Time 0.001 (0.008)	Loss 3.8065 (3.8818)	Entropy 1.66415 (1.68862)	Top-1 acc 35.156 (33.247)	Top-5 acc 60.156 (57.097)	lr 0.02479
Train [7][3030/3239]	Time 0.552 (0.848)	Data Time 0.001 (0.008)	Loss 3.7856 (3.8818)	Entropy 1.66379 (1.68854)	Top-1 acc 36.719 (33.249)	Top-5 acc 56.641 (57.100)	lr 0.02479
Train [7][3040/3239]	Time 0.548 (0.847)	Data Time 0.002 (0.008)	Loss 3.7880 (3.8816)	Entropy 1.66379 (1.68846)	Top-1 acc 36.328 (33.251)	Top-5 acc 57.422 (57.103)	lr 0.02479
Train [7][3050/3239]	Time 0.528 (0.847)	Data Time 0.001 (0.008)	Loss 4.0445 (3.8817)	Entropy 1.66349 (1.68838)	Top-1 acc 34.375 (33.250)	Top-5 acc 55.078 (57.102)	lr 0.02479
Train [7][3060/3239]	Time 0.635 (0.847)	Data Time 0.001 (0.008)	Loss 3.7718 (3.8819)	Entropy 1.66338 (1.68829)	Top-1 acc 32.031 (33.248)	Top-5 acc 60.938 (57.099)	lr 0.02479
Train [7][3070/3239]	Time 0.543 (0.847)	Data Time 0.001 (0.008)	Loss 3.8213 (3.8818)	Entropy 1.66326 (1.68821)	Top-1 acc 35.156 (33.252)	Top-5 acc 56.641 (57.099)	lr 0.02479
Train [7][3080/3239]	Time 0.617 (0.847)	Data Time 0.001 (0.008)	Loss 3.9318 (3.8818)	Entropy 1.66310 (1.68813)	Top-1 acc 34.375 (33.250)	Top-5 acc 54.688 (57.097)	lr 0.02479
Train [7][3090/3239]	Time 0.595 (0.847)	Data Time 0.001 (0.008)	Loss 3.7184 (3.8815)	Entropy 1.66259 (1.68805)	Top-1 acc 34.766 (33.257)	Top-5 acc 62.891 (57.106)	lr 0.02479
Train [7][3100/3239]	Time 0.453 (0.847)	Data Time 0.001 (0.008)	Loss 3.6838 (3.8815)	Entropy 1.66228 (1.68797)	Top-1 acc 34.375 (33.256)	Top-5 acc 60.938 (57.106)	lr 0.02479
Train [7][3110/3239]	Time 0.517 (0.847)	Data Time 0.001 (0.008)	Loss 3.7940 (3.8815)	Entropy 1.66205 (1.68789)	Top-1 acc 35.547 (33.256)	Top-5 acc 64.453 (57.107)	lr 0.02479
Train [7][3120/3239]	Time 0.575 (0.847)	Data Time 0.003 (0.008)	Loss 3.7313 (3.8815)	Entropy 1.66182 (1.68780)	Top-1 acc 35.156 (33.256)	Top-5 acc 60.938 (57.106)	lr 0.02479
Train [7][3130/3239]	Time 0.408 (0.846)	Data Time 0.001 (0.008)	Loss 3.7591 (3.8814)	Entropy 1.66168 (1.68772)	Top-1 acc 36.328 (33.261)	Top-5 acc 57.031 (57.108)	lr 0.02479
Train [7][3140/3239]	Time 0.563 (0.846)	Data Time 0.001 (0.008)	Loss 3.9993 (3.8815)	Entropy 1.66158 (1.68764)	Top-1 acc 34.375 (33.258)	Top-5 acc 54.688 (57.108)	lr 0.02479
Train [7][3150/3239]	Time 0.638 (0.846)	Data Time 0.001 (0.008)	Loss 3.6989 (3.8816)	Entropy 1.66145 (1.68755)	Top-1 acc 37.891 (33.257)	Top-5 acc 62.109 (57.107)	lr 0.02479
Train [7][3160/3239]	Time 0.569 (0.846)	Data Time 0.001 (0.008)	Loss 3.7432 (3.8814)	Entropy 1.66128 (1.68747)	Top-1 acc 35.938 (33.263)	Top-5 acc 58.594 (57.112)	lr 0.02479
Train [7][3170/3239]	Time 0.596 (0.846)	Data Time 0.001 (0.008)	Loss 3.8267 (3.8812)	Entropy 1.66117 (1.68739)	Top-1 acc 34.766 (33.263)	Top-5 acc 56.641 (57.114)	lr 0.02479
Train [7][3180/3239]	Time 0.580 (0.846)	Data Time 0.000 (0.008)	Loss 3.7196 (3.8811)	Entropy 1.66096 (1.68730)	Top-1 acc 32.031 (33.265)	Top-5 acc 61.328 (57.120)	lr 0.02479
Train [7][3190/3239]	Time 0.549 (0.846)	Data Time 0.000 (0.008)	Loss 3.6688 (3.8810)	Entropy 1.66092 (1.68722)	Top-1 acc 39.844 (33.268)	Top-5 acc 61.719 (57.120)	lr 0.02479
Train [7][3200/3239]	Time 0.642 (0.845)	Data Time 0.000 (0.008)	Loss 3.8831 (3.8810)	Entropy 1.66059 (1.68714)	Top-1 acc 32.812 (33.267)	Top-5 acc 55.859 (57.125)	lr 0.02479
Train [7][3210/3239]	Time 0.506 (0.845)	Data Time 0.000 (0.008)	Loss 3.8238 (3.8809)	Entropy 1.66049 (1.68706)	Top-1 acc 32.031 (33.268)	Top-5 acc 58.594 (57.128)	lr 0.02479
Train [7][3220/3239]	Time 0.621 (0.845)	Data Time 0.000 (0.008)	Loss 3.9059 (3.8808)	Entropy 1.66017 (1.68697)	Top-1 acc 28.906 (33.268)	Top-5 acc 57.422 (57.129)	lr 0.02479
Train [7][3230/3239]	Time 0.572 (0.845)	Data Time 0.000 (0.008)	Loss 3.5875 (3.8808)	Entropy 1.65986 (1.68689)	Top-1 acc 41.797 (33.272)	Top-5 acc 63.672 (57.129)	lr 0.02479
Train [7][3239/3239]	Time 1.547 (0.845)	Data Time 0.001 (0.008)	Loss 4.0219 (3.8809)	Entropy 1.66009 (1.68682)	Top-1 acc 25.926 (33.269)	Top-5 acc 55.556 (57.128)	lr 0.02479
==========Valid [7/120]	loss 2.724	top-1 acc 42.246 (42.246)	top-5 acc 67.077	Train top-1 33.269	top-5 57.128	Entropy 1.66009	Latency-None: 0.000ms	Flops: 542.77M
Train [8][0/3239]	Time 17.868 (17.868)	Data Time 16.929 (16.929)	Loss 3.9137 (3.9137)	Entropy 1.66007 (1.66007)	Top-1 acc 33.594 (33.594)	Top-5 acc 56.250 (56.250)	lr 0.02479
Train [8][10/3239]	Time 0.657 (2.462)	Data Time 0.001 (1.541)	Loss 3.9597 (3.8999)	Entropy 1.65964 (1.65996)	Top-1 acc 32.031 (33.239)	Top-5 acc 55.078 (56.747)	lr 0.02479
Train [8][20/3239]	Time 0.546 (1.666)	Data Time 0.001 (0.808)	Loss 3.7126 (3.8746)	Entropy 1.65978 (1.65984)	Top-1 acc 33.984 (33.278)	Top-5 acc 59.375 (57.385)	lr 0.02479
Train [8][30/3239]	Time 0.519 (1.392)	Data Time 0.001 (0.549)	Loss 3.7823 (3.8830)	Entropy 1.65981 (1.65980)	Top-1 acc 37.109 (33.090)	Top-5 acc 60.156 (57.447)	lr 0.02479
Train [8][40/3239]	Time 0.431 (1.255)	Data Time 0.001 (0.417)	Loss 3.7784 (3.8712)	Entropy 1.65949 (1.65978)	Top-1 acc 35.156 (33.317)	Top-5 acc 61.719 (57.622)	lr 0.02479
Train [8][50/3239]	Time 0.605 (1.168)	Data Time 0.002 (0.338)	Loss 3.9641 (3.8732)	Entropy 1.65938 (1.65972)	Top-1 acc 33.594 (33.594)	Top-5 acc 55.859 (57.567)	lr 0.02479
Train [8][60/3239]	Time 0.553 (1.110)	Data Time 0.001 (0.283)	Loss 3.6240 (3.8683)	Entropy 1.65912 (1.65965)	Top-1 acc 41.406 (33.703)	Top-5 acc 64.062 (57.665)	lr 0.02479
Train [8][70/3239]	Time 0.429 (1.068)	Data Time 0.001 (0.244)	Loss 4.0397 (3.8750)	Entropy 1.65884 (1.65957)	Top-1 acc 30.469 (33.539)	Top-5 acc 57.812 (57.581)	lr 0.02479
Train [8][80/3239]	Time 0.616 (1.034)	Data Time 0.002 (0.214)	Loss 3.7707 (3.8722)	Entropy 1.65868 (1.65947)	Top-1 acc 36.328 (33.536)	Top-5 acc 59.375 (57.547)	lr 0.02479
Train [8][90/3239]	Time 0.568 (1.009)	Data Time 0.001 (0.191)	Loss 3.9961 (3.8697)	Entropy 1.65866 (1.65938)	Top-1 acc 28.125 (33.508)	Top-5 acc 50.391 (57.533)	lr 0.02479
Train [8][100/3239]	Time 0.595 (0.983)	Data Time 0.002 (0.172)	Loss 4.0414 (3.8669)	Entropy 1.65867 (1.65930)	Top-1 acc 28.516 (33.524)	Top-5 acc 53.516 (57.615)	lr 0.02479
Train [8][110/3239]	Time 0.602 (0.969)	Data Time 0.002 (0.157)	Loss 3.8224 (3.8681)	Entropy 1.65828 (1.65923)	Top-1 acc 35.938 (33.544)	Top-5 acc 59.375 (57.584)	lr 0.02479
Train [8][120/3239]	Time 0.556 (0.956)	Data Time 0.001 (0.144)	Loss 3.7723 (3.8663)	Entropy 1.65794 (1.65915)	Top-1 acc 31.250 (33.455)	Top-5 acc 57.812 (57.593)	lr 0.02479
Train [8][130/3239]	Time 0.664 (0.947)	Data Time 0.001 (0.133)	Loss 3.9800 (3.8693)	Entropy 1.65778 (1.65905)	Top-1 acc 31.641 (33.385)	Top-5 acc 51.172 (57.467)	lr 0.02479
Train [8][140/3239]	Time 0.593 (0.938)	Data Time 0.002 (0.124)	Loss 3.8578 (3.8685)	Entropy 1.65770 (1.65896)	Top-1 acc 34.375 (33.436)	Top-5 acc 58.594 (57.461)	lr 0.02479
Train [8][150/3239]	Time 0.551 (0.930)	Data Time 0.002 (0.116)	Loss 3.8760 (3.8670)	Entropy 1.65774 (1.65888)	Top-1 acc 35.547 (33.428)	Top-5 acc 58.984 (57.492)	lr 0.02479
Train [8][160/3239]	Time 0.566 (0.924)	Data Time 0.001 (0.108)	Loss 3.7749 (3.8653)	Entropy 1.65773 (1.65881)	Top-1 acc 32.812 (33.463)	Top-5 acc 60.938 (57.529)	lr 0.02479
Train [8][170/3239]	Time 0.583 (0.918)	Data Time 0.001 (0.102)	Loss 3.7882 (3.8659)	Entropy 1.65771 (1.65875)	Top-1 acc 30.469 (33.381)	Top-5 acc 58.203 (57.500)	lr 0.02479
Train [8][180/3239]	Time 0.583 (0.912)	Data Time 0.001 (0.097)	Loss 3.8284 (3.8637)	Entropy 1.65774 (1.65869)	Top-1 acc 31.641 (33.343)	Top-5 acc 58.984 (57.549)	lr 0.02479
Train [8][190/3239]	Time 0.577 (0.907)	Data Time 0.001 (0.092)	Loss 3.6707 (3.8611)	Entropy 1.65757 (1.65864)	Top-1 acc 36.719 (33.379)	Top-5 acc 61.328 (57.602)	lr 0.02479
Train [8][200/3239]	Time 0.668 (0.903)	Data Time 0.002 (0.087)	Loss 3.8346 (3.8576)	Entropy 1.65739 (1.65858)	Top-1 acc 32.812 (33.464)	Top-5 acc 59.375 (57.706)	lr 0.02479
Train [8][210/3239]	Time 0.542 (0.899)	Data Time 0.001 (0.083)	Loss 3.6647 (3.8574)	Entropy 1.65715 (1.65852)	Top-1 acc 42.188 (33.503)	Top-5 acc 62.500 (57.644)	lr 0.02479
Train [8][220/3239]	Time 0.537 (0.983)	Data Time 0.002 (0.080)	Loss 3.8231 (3.8581)	Entropy 1.65715 (1.65846)	Top-1 acc 32.812 (33.507)	Top-5 acc 61.719 (57.659)	lr 0.02479
Train [8][230/3239]	Time 0.572 (0.976)	Data Time 0.002 (0.077)	Loss 4.0016 (3.8593)	Entropy 1.65694 (1.65840)	Top-1 acc 28.125 (33.453)	Top-5 acc 53.125 (57.596)	lr 0.02479
Train [8][240/3239]	Time 0.513 (0.967)	Data Time 0.002 (0.074)	Loss 3.8576 (3.8589)	Entropy 1.65685 (1.65834)	Top-1 acc 33.203 (33.406)	Top-5 acc 55.859 (57.599)	lr 0.02479
Train [8][250/3239]	Time 0.536 (0.961)	Data Time 0.001 (0.071)	Loss 4.0520 (3.8581)	Entropy 1.65658 (1.65828)	Top-1 acc 29.297 (33.452)	Top-5 acc 52.734 (57.615)	lr 0.02479
Train [8][260/3239]	Time 0.564 (0.956)	Data Time 0.002 (0.068)	Loss 3.8362 (3.8576)	Entropy 1.65636 (1.65821)	Top-1 acc 33.594 (33.458)	Top-5 acc 57.812 (57.621)	lr 0.02479
Train [8][270/3239]	Time 0.601 (0.951)	Data Time 0.003 (0.066)	Loss 3.8916 (3.8557)	Entropy 1.65632 (1.65814)	Top-1 acc 31.641 (33.490)	Top-5 acc 57.812 (57.676)	lr 0.02479
Train [8][280/3239]	Time 0.574 (0.947)	Data Time 0.001 (0.064)	Loss 3.8541 (3.8549)	Entropy 1.65609 (1.65807)	Top-1 acc 32.031 (33.521)	Top-5 acc 57.422 (57.692)	lr 0.02479
Train [8][290/3239]	Time 0.587 (0.943)	Data Time 0.001 (0.062)	Loss 3.8795 (3.8546)	Entropy 1.65581 (1.65800)	Top-1 acc 36.719 (33.535)	Top-5 acc 61.328 (57.709)	lr 0.02479
Train [8][300/3239]	Time 0.627 (0.939)	Data Time 0.001 (0.060)	Loss 3.8483 (3.8542)	Entropy 1.65554 (1.65793)	Top-1 acc 32.422 (33.538)	Top-5 acc 58.203 (57.735)	lr 0.02479
Train [8][310/3239]	Time 0.580 (0.935)	Data Time 0.001 (0.058)	Loss 3.9446 (3.8550)	Entropy 1.65530 (1.65785)	Top-1 acc 30.469 (33.541)	Top-5 acc 57.031 (57.688)	lr 0.02478
Train [8][320/3239]	Time 0.597 (0.932)	Data Time 0.001 (0.056)	Loss 3.8800 (3.8563)	Entropy 1.65502 (1.65776)	Top-1 acc 30.469 (33.524)	Top-5 acc 58.203 (57.637)	lr 0.02478
Train [8][330/3239]	Time 0.528 (0.929)	Data Time 0.001 (0.055)	Loss 3.8009 (3.8557)	Entropy 1.65470 (1.65768)	Top-1 acc 34.375 (33.537)	Top-5 acc 59.375 (57.620)	lr 0.02478
Train [8][340/3239]	Time 0.529 (0.924)	Data Time 0.001 (0.053)	Loss 3.6879 (3.8563)	Entropy 1.65445 (1.65759)	Top-1 acc 38.672 (33.542)	Top-5 acc 61.328 (57.620)	lr 0.02478
Train [8][350/3239]	Time 0.577 (0.922)	Data Time 0.001 (0.052)	Loss 3.8327 (3.8550)	Entropy 1.65445 (1.65750)	Top-1 acc 34.766 (33.571)	Top-5 acc 54.688 (57.616)	lr 0.02478
Train [8][360/3239]	Time 0.557 (0.919)	Data Time 0.001 (0.050)	Loss 3.9529 (3.8533)	Entropy 1.65408 (1.65741)	Top-1 acc 30.078 (33.593)	Top-5 acc 54.688 (57.655)	lr 0.02478
Train [8][370/3239]	Time 0.540 (0.916)	Data Time 0.001 (0.049)	Loss 3.8300 (3.8526)	Entropy 1.65379 (1.65732)	Top-1 acc 35.156 (33.641)	Top-5 acc 57.031 (57.680)	lr 0.02478
Train [8][380/3239]	Time 0.417 (0.913)	Data Time 0.001 (0.048)	Loss 3.8637 (3.8529)	Entropy 1.65382 (1.65723)	Top-1 acc 34.375 (33.626)	Top-5 acc 57.422 (57.644)	lr 0.02478
Train [8][390/3239]	Time 0.635 (0.910)	Data Time 0.001 (0.047)	Loss 3.9865 (3.8523)	Entropy 1.65381 (1.65714)	Top-1 acc 31.250 (33.627)	Top-5 acc 51.953 (57.683)	lr 0.02478
Train [8][400/3239]	Time 0.500 (0.907)	Data Time 0.001 (0.046)	Loss 3.8648 (3.8529)	Entropy 1.65371 (1.65705)	Top-1 acc 32.812 (33.623)	Top-5 acc 58.203 (57.704)	lr 0.02478
Train [8][410/3239]	Time 0.591 (0.904)	Data Time 0.001 (0.044)	Loss 3.8888 (3.8542)	Entropy 1.65330 (1.65697)	Top-1 acc 31.250 (33.578)	Top-5 acc 54.297 (57.691)	lr 0.02478
Train [8][420/3239]	Time 0.561 (0.902)	Data Time 0.002 (0.043)	Loss 3.7812 (3.8526)	Entropy 1.65325 (1.65688)	Top-1 acc 32.422 (33.620)	Top-5 acc 59.766 (57.729)	lr 0.02478
Train [8][430/3239]	Time 0.625 (0.900)	Data Time 0.001 (0.043)	Loss 3.7817 (3.8521)	Entropy 1.65300 (1.65679)	Top-1 acc 34.375 (33.638)	Top-5 acc 55.859 (57.745)	lr 0.02478
Train [8][440/3239]	Time 0.676 (0.898)	Data Time 0.001 (0.042)	Loss 4.0640 (3.8525)	Entropy 1.65296 (1.65671)	Top-1 acc 30.859 (33.642)	Top-5 acc 56.641 (57.750)	lr 0.02478
Train [8][450/3239]	Time 0.573 (0.896)	Data Time 0.001 (0.041)	Loss 3.9652 (3.8520)	Entropy 1.65277 (1.65662)	Top-1 acc 35.156 (33.673)	Top-5 acc 56.250 (57.778)	lr 0.02478
Train [8][460/3239]	Time 0.615 (0.894)	Data Time 0.001 (0.040)	Loss 3.9632 (3.8520)	Entropy 1.65266 (1.65654)	Top-1 acc 32.031 (33.665)	Top-5 acc 53.516 (57.776)	lr 0.02478
Train [8][470/3239]	Time 0.575 (0.893)	Data Time 0.001 (0.039)	Loss 3.7930 (3.8519)	Entropy 1.65237 (1.65645)	Top-1 acc 34.766 (33.670)	Top-5 acc 59.375 (57.783)	lr 0.02478
Train [8][480/3239]	Time 0.572 (0.891)	Data Time 0.001 (0.038)	Loss 3.8378 (3.8523)	Entropy 1.65223 (1.65637)	Top-1 acc 33.594 (33.672)	Top-5 acc 55.859 (57.782)	lr 0.02478
Train [8][490/3239]	Time 0.541 (0.889)	Data Time 0.001 (0.038)	Loss 3.7959 (3.8512)	Entropy 1.65218 (1.65628)	Top-1 acc 36.328 (33.700)	Top-5 acc 62.109 (57.822)	lr 0.02478
Train [8][500/3239]	Time 0.523 (0.888)	Data Time 0.001 (0.037)	Loss 3.8150 (3.8497)	Entropy 1.65210 (1.65620)	Top-1 acc 32.031 (33.746)	Top-5 acc 60.156 (57.852)	lr 0.02478
Train [8][510/3239]	Time 0.751 (0.887)	Data Time 0.001 (0.036)	Loss 3.7560 (3.8493)	Entropy 1.65195 (1.65612)	Top-1 acc 35.156 (33.760)	Top-5 acc 59.766 (57.868)	lr 0.02478
Train [8][520/3239]	Time 0.597 (0.886)	Data Time 0.001 (0.036)	Loss 3.8366 (3.8494)	Entropy 1.65182 (1.65604)	Top-1 acc 37.891 (33.762)	Top-5 acc 58.203 (57.859)	lr 0.02478
Train [8][530/3239]	Time 0.599 (0.884)	Data Time 0.001 (0.035)	Loss 4.0887 (3.8496)	Entropy 1.65161 (1.65596)	Top-1 acc 28.906 (33.761)	Top-5 acc 55.469 (57.865)	lr 0.02478
Train [8][540/3239]	Time 0.576 (0.884)	Data Time 0.001 (0.034)	Loss 3.7634 (3.8485)	Entropy 1.65146 (1.65587)	Top-1 acc 38.281 (33.768)	Top-5 acc 58.984 (57.906)	lr 0.02478
Train [8][550/3239]	Time 0.567 (0.882)	Data Time 0.001 (0.034)	Loss 3.7509 (3.8490)	Entropy 1.65124 (1.65579)	Top-1 acc 36.328 (33.772)	Top-5 acc 56.641 (57.895)	lr 0.02478
Train [8][560/3239]	Time 0.554 (0.881)	Data Time 0.001 (0.033)	Loss 3.6508 (3.8477)	Entropy 1.65109 (1.65571)	Top-1 acc 37.500 (33.813)	Top-5 acc 63.281 (57.904)	lr 0.02478
Train [8][570/3239]	Time 0.540 (0.879)	Data Time 0.001 (0.033)	Loss 3.7179 (3.8476)	Entropy 1.65112 (1.65563)	Top-1 acc 37.891 (33.813)	Top-5 acc 58.984 (57.907)	lr 0.02478
Train [8][580/3239]	Time 0.528 (0.877)	Data Time 0.001 (0.032)	Loss 3.7014 (3.8470)	Entropy 1.65104 (1.65555)	Top-1 acc 36.328 (33.830)	Top-5 acc 60.156 (57.902)	lr 0.02478
Train [8][590/3239]	Time 0.606 (0.876)	Data Time 0.001 (0.032)	Loss 3.6758 (3.8472)	Entropy 1.65095 (1.65548)	Top-1 acc 39.844 (33.828)	Top-5 acc 62.109 (57.907)	lr 0.02478
Train [8][600/3239]	Time 0.562 (0.874)	Data Time 0.001 (0.031)	Loss 3.9515 (3.8472)	Entropy 1.65089 (1.65540)	Top-1 acc 34.375 (33.843)	Top-5 acc 57.031 (57.911)	lr 0.02478
Train [8][610/3239]	Time 0.524 (0.873)	Data Time 0.001 (0.031)	Loss 3.9113 (3.8473)	Entropy 1.65094 (1.65533)	Top-1 acc 32.422 (33.841)	Top-5 acc 56.641 (57.919)	lr 0.02478
Train [8][620/3239]	Time 0.569 (0.872)	Data Time 0.001 (0.030)	Loss 4.0379 (3.8473)	Entropy 1.65074 (1.65526)	Top-1 acc 28.516 (33.849)	Top-5 acc 54.297 (57.918)	lr 0.02478
Train [8][630/3239]	Time 0.526 (0.871)	Data Time 0.001 (0.030)	Loss 3.5934 (3.8464)	Entropy 1.65018 (1.65518)	Top-1 acc 38.281 (33.874)	Top-5 acc 62.500 (57.943)	lr 0.02478
Train [8][640/3239]	Time 0.555 (0.870)	Data Time 0.001 (0.029)	Loss 3.9923 (3.8460)	Entropy 1.65011 (1.65510)	Top-1 acc 31.250 (33.892)	Top-5 acc 52.734 (57.949)	lr 0.02478
Train [8][650/3239]	Time 0.623 (0.869)	Data Time 0.001 (0.029)	Loss 3.8601 (3.8454)	Entropy 1.64992 (1.65502)	Top-1 acc 31.641 (33.900)	Top-5 acc 57.031 (57.963)	lr 0.02478
Train [8][660/3239]	Time 0.583 (0.869)	Data Time 0.001 (0.028)	Loss 4.0187 (3.8463)	Entropy 1.64982 (1.65495)	Top-1 acc 26.953 (33.888)	Top-5 acc 54.688 (57.931)	lr 0.02478
Train [8][670/3239]	Time 0.542 (0.868)	Data Time 0.001 (0.028)	Loss 4.0390 (3.8457)	Entropy 1.64944 (1.65487)	Top-1 acc 30.859 (33.897)	Top-5 acc 53.906 (57.952)	lr 0.02478
Train [8][680/3239]	Time 0.550 (0.867)	Data Time 0.001 (0.028)	Loss 3.7910 (3.8452)	Entropy 1.64927 (1.65479)	Top-1 acc 36.719 (33.910)	Top-5 acc 61.328 (57.954)	lr 0.02478
Train [8][690/3239]	Time 0.549 (0.866)	Data Time 0.002 (0.027)	Loss 3.8535 (3.8456)	Entropy 1.64924 (1.65471)	Top-1 acc 30.859 (33.900)	Top-5 acc 57.812 (57.957)	lr 0.02478
Train [8][700/3239]	Time 0.624 (0.866)	Data Time 0.001 (0.027)	Loss 3.8291 (3.8454)	Entropy 1.64902 (1.65463)	Top-1 acc 37.109 (33.915)	Top-5 acc 59.375 (57.957)	lr 0.02478
Train [8][710/3239]	Time 0.535 (0.865)	Data Time 0.001 (0.027)	Loss 3.9716 (3.8459)	Entropy 1.64882 (1.65455)	Top-1 acc 30.469 (33.903)	Top-5 acc 56.641 (57.939)	lr 0.02478
Train [8][720/3239]	Time 0.576 (0.864)	Data Time 0.002 (0.026)	Loss 3.9059 (3.8464)	Entropy 1.64858 (1.65447)	Top-1 acc 32.031 (33.887)	Top-5 acc 53.516 (57.917)	lr 0.02478
Train [8][730/3239]	Time 0.584 (0.863)	Data Time 0.001 (0.026)	Loss 3.7741 (3.8465)	Entropy 1.64831 (1.65439)	Top-1 acc 34.375 (33.892)	Top-5 acc 59.375 (57.907)	lr 0.02478
Train [8][740/3239]	Time 0.495 (0.862)	Data Time 0.001 (0.026)	Loss 3.6811 (3.8463)	Entropy 1.64802 (1.65430)	Top-1 acc 36.328 (33.905)	Top-5 acc 66.016 (57.916)	lr 0.02478
Train [8][750/3239]	Time 0.619 (0.861)	Data Time 0.003 (0.025)	Loss 3.9173 (3.8465)	Entropy 1.64785 (1.65422)	Top-1 acc 33.984 (33.913)	Top-5 acc 55.859 (57.922)	lr 0.02478
Train [8][760/3239]	Time 0.217 (0.860)	Data Time 0.002 (0.025)	Loss 3.7751 (3.8461)	Entropy 1.64769 (1.65414)	Top-1 acc 32.422 (33.919)	Top-5 acc 61.328 (57.930)	lr 0.02478
Train [8][770/3239]	Time 0.397 (0.858)	Data Time 0.001 (0.025)	Loss 3.9117 (3.8460)	Entropy 1.64729 (1.65405)	Top-1 acc 31.641 (33.931)	Top-5 acc 56.250 (57.933)	lr 0.02478
Train [8][780/3239]	Time 0.586 (0.858)	Data Time 0.001 (0.025)	Loss 3.8173 (3.8446)	Entropy 1.64711 (1.65396)	Top-1 acc 34.375 (33.963)	Top-5 acc 60.156 (57.966)	lr 0.02478
Train [8][790/3239]	Time 0.535 (0.857)	Data Time 0.001 (0.024)	Loss 3.8075 (3.8451)	Entropy 1.64697 (1.65388)	Top-1 acc 34.375 (33.960)	Top-5 acc 56.641 (57.951)	lr 0.02478
Train [8][800/3239]	Time 0.542 (0.856)	Data Time 0.001 (0.024)	Loss 4.0343 (3.8457)	Entropy 1.64690 (1.65379)	Top-1 acc 27.734 (33.946)	Top-5 acc 56.641 (57.936)	lr 0.02478
Train [8][810/3239]	Time 0.565 (0.856)	Data Time 0.001 (0.024)	Loss 3.8291 (3.8458)	Entropy 1.64687 (1.65370)	Top-1 acc 32.422 (33.942)	Top-5 acc 60.156 (57.947)	lr 0.02478
Train [8][820/3239]	Time 0.572 (0.855)	Data Time 0.001 (0.024)	Loss 3.8643 (3.8454)	Entropy 1.64644 (1.65362)	Top-1 acc 36.719 (33.945)	Top-5 acc 59.766 (57.960)	lr 0.02478
Train [8][830/3239]	Time 0.380 (0.854)	Data Time 0.001 (0.023)	Loss 3.6533 (3.8445)	Entropy 1.64628 (1.65353)	Top-1 acc 36.328 (33.969)	Top-5 acc 64.453 (57.980)	lr 0.02478
Train [8][840/3239]	Time 0.513 (0.854)	Data Time 0.001 (0.023)	Loss 3.7872 (3.8443)	Entropy 1.64596 (1.65345)	Top-1 acc 33.203 (33.980)	Top-5 acc 61.328 (57.998)	lr 0.02477
Train [8][850/3239]	Time 0.608 (0.854)	Data Time 0.001 (0.023)	Loss 4.0272 (3.8443)	Entropy 1.64573 (1.65336)	Top-1 acc 28.906 (33.982)	Top-5 acc 52.344 (57.992)	lr 0.02477
Train [8][860/3239]	Time 0.551 (0.853)	Data Time 0.001 (0.023)	Loss 3.5928 (3.8434)	Entropy 1.64532 (1.65327)	Top-1 acc 37.500 (34.004)	Top-5 acc 62.109 (58.012)	lr 0.02477
Train [8][870/3239]	Time 0.908 (0.873)	Data Time 0.005 (0.023)	Loss 3.7237 (3.8445)	Entropy 1.64542 (1.65318)	Top-1 acc 31.641 (33.983)	Top-5 acc 63.281 (57.989)	lr 0.02477
Train [8][880/3239]	Time 0.583 (0.872)	Data Time 0.002 (0.022)	Loss 3.8381 (3.8447)	Entropy 1.64528 (1.65309)	Top-1 acc 35.156 (33.981)	Top-5 acc 55.078 (57.987)	lr 0.02477
Train [8][890/3239]	Time 0.502 (0.871)	Data Time 0.001 (0.022)	Loss 3.9345 (3.8442)	Entropy 1.64534 (1.65300)	Top-1 acc 28.516 (33.975)	Top-5 acc 55.469 (57.990)	lr 0.02477
Train [8][900/3239]	Time 0.594 (0.871)	Data Time 0.001 (0.022)	Loss 3.9043 (3.8441)	Entropy 1.64547 (1.65292)	Top-1 acc 33.984 (33.980)	Top-5 acc 57.422 (57.983)	lr 0.02477
Train [8][910/3239]	Time 0.547 (0.869)	Data Time 0.002 (0.022)	Loss 3.9161 (3.8443)	Entropy 1.64543 (1.65283)	Top-1 acc 34.375 (33.974)	Top-5 acc 58.203 (57.981)	lr 0.02477
Train [8][920/3239]	Time 0.516 (0.869)	Data Time 0.001 (0.021)	Loss 3.8940 (3.8443)	Entropy 1.64527 (1.65275)	Top-1 acc 37.500 (33.981)	Top-5 acc 57.031 (57.979)	lr 0.02477
Train [8][930/3239]	Time 0.510 (0.868)	Data Time 0.001 (0.021)	Loss 3.8167 (3.8443)	Entropy 1.64508 (1.65267)	Top-1 acc 36.328 (33.969)	Top-5 acc 59.766 (57.969)	lr 0.02477
Train [8][940/3239]	Time 0.749 (0.868)	Data Time 0.002 (0.021)	Loss 3.6246 (3.8445)	Entropy 1.64484 (1.65259)	Top-1 acc 37.109 (33.958)	Top-5 acc 59.766 (57.970)	lr 0.02477
Train [8][950/3239]	Time 0.553 (0.867)	Data Time 0.001 (0.021)	Loss 3.8500 (3.8440)	Entropy 1.64475 (1.65251)	Top-1 acc 35.156 (33.964)	Top-5 acc 58.203 (57.977)	lr 0.02477
Train [8][960/3239]	Time 0.617 (0.867)	Data Time 0.001 (0.021)	Loss 3.9868 (3.8444)	Entropy 1.64455 (1.65243)	Top-1 acc 31.641 (33.973)	Top-5 acc 56.250 (57.964)	lr 0.02477
Train [8][970/3239]	Time 0.572 (0.866)	Data Time 0.001 (0.020)	Loss 3.6934 (3.8441)	Entropy 1.64452 (1.65235)	Top-1 acc 37.500 (33.984)	Top-5 acc 60.547 (57.972)	lr 0.02477
Train [8][980/3239]	Time 0.577 (0.865)	Data Time 0.001 (0.020)	Loss 3.7279 (3.8439)	Entropy 1.64457 (1.65227)	Top-1 acc 38.281 (34.000)	Top-5 acc 61.719 (57.976)	lr 0.02477
Train [8][990/3239]	Time 0.658 (0.865)	Data Time 0.001 (0.020)	Loss 3.7142 (3.8441)	Entropy 1.64447 (1.65219)	Top-1 acc 35.156 (34.003)	Top-5 acc 60.938 (57.965)	lr 0.02477
Train [8][1000/3239]	Time 0.573 (0.865)	Data Time 0.001 (0.020)	Loss 3.8190 (3.8442)	Entropy 1.64433 (1.65211)	Top-1 acc 35.547 (34.000)	Top-5 acc 58.984 (57.965)	lr 0.02477
Train [8][1010/3239]	Time 0.540 (0.864)	Data Time 0.001 (0.020)	Loss 3.8993 (3.8441)	Entropy 1.64385 (1.65203)	Top-1 acc 35.547 (34.000)	Top-5 acc 55.859 (57.962)	lr 0.02477
Train [8][1020/3239]	Time 0.603 (0.864)	Data Time 0.002 (0.020)	Loss 3.7175 (3.8436)	Entropy 1.64382 (1.65195)	Top-1 acc 35.547 (34.008)	Top-5 acc 59.766 (57.969)	lr 0.02477
Train [8][1030/3239]	Time 0.556 (0.864)	Data Time 0.001 (0.019)	Loss 3.8711 (3.8438)	Entropy 1.64355 (1.65187)	Top-1 acc 34.766 (34.008)	Top-5 acc 56.250 (57.967)	lr 0.02477
Train [8][1040/3239]	Time 0.555 (0.863)	Data Time 0.001 (0.019)	Loss 3.8893 (3.8432)	Entropy 1.64348 (1.65179)	Top-1 acc 31.641 (34.022)	Top-5 acc 56.250 (57.986)	lr 0.02477
Train [8][1050/3239]	Time 0.557 (0.863)	Data Time 0.001 (0.019)	Loss 3.9124 (3.8431)	Entropy 1.64352 (1.65171)	Top-1 acc 31.250 (34.026)	Top-5 acc 55.469 (57.984)	lr 0.02477
Train [8][1060/3239]	Time 0.487 (0.862)	Data Time 0.001 (0.019)	Loss 3.9434 (3.8433)	Entropy 1.64327 (1.65163)	Top-1 acc 33.203 (34.022)	Top-5 acc 55.859 (57.979)	lr 0.02477
Train [8][1070/3239]	Time 0.566 (0.861)	Data Time 0.001 (0.019)	Loss 3.8490 (3.8430)	Entropy 1.64310 (1.65156)	Top-1 acc 33.984 (34.027)	Top-5 acc 55.078 (57.984)	lr 0.02477
Train [8][1080/3239]	Time 0.605 (0.860)	Data Time 0.001 (0.019)	Loss 3.5869 (3.8422)	Entropy 1.64327 (1.65148)	Top-1 acc 38.672 (34.044)	Top-5 acc 62.891 (58.003)	lr 0.02477
Train [8][1090/3239]	Time 0.600 (0.860)	Data Time 0.001 (0.018)	Loss 3.7131 (3.8418)	Entropy 1.64324 (1.65140)	Top-1 acc 36.719 (34.057)	Top-5 acc 55.469 (58.006)	lr 0.02477
Train [8][1100/3239]	Time 0.549 (0.860)	Data Time 0.001 (0.018)	Loss 3.7992 (3.8420)	Entropy 1.64321 (1.65133)	Top-1 acc 34.766 (34.058)	Top-5 acc 58.984 (58.006)	lr 0.02477
Train [8][1110/3239]	Time 0.656 (0.859)	Data Time 0.001 (0.018)	Loss 3.7439 (3.8421)	Entropy 1.64309 (1.65126)	Top-1 acc 35.547 (34.048)	Top-5 acc 60.547 (57.998)	lr 0.02477
Train [8][1120/3239]	Time 0.552 (0.859)	Data Time 0.001 (0.018)	Loss 3.7778 (3.8422)	Entropy 1.64314 (1.65118)	Top-1 acc 34.766 (34.042)	Top-5 acc 60.156 (57.995)	lr 0.02477
Train [8][1130/3239]	Time 0.596 (0.859)	Data Time 0.001 (0.018)	Loss 3.8701 (3.8423)	Entropy 1.64293 (1.65111)	Top-1 acc 33.203 (34.043)	Top-5 acc 56.641 (57.992)	lr 0.02477
Train [8][1140/3239]	Time 0.530 (0.858)	Data Time 0.001 (0.018)	Loss 3.8730 (3.8421)	Entropy 1.64264 (1.65104)	Top-1 acc 35.938 (34.051)	Top-5 acc 56.250 (58.001)	lr 0.02477
Train [8][1150/3239]	Time 0.602 (0.858)	Data Time 0.003 (0.018)	Loss 3.9309 (3.8420)	Entropy 1.64234 (1.65096)	Top-1 acc 30.469 (34.059)	Top-5 acc 57.812 (57.999)	lr 0.02477
Train [8][1160/3239]	Time 0.586 (0.858)	Data Time 0.001 (0.017)	Loss 3.9200 (3.8418)	Entropy 1.64234 (1.65089)	Top-1 acc 32.812 (34.056)	Top-5 acc 54.688 (57.998)	lr 0.02477
Train [8][1170/3239]	Time 0.615 (0.857)	Data Time 0.001 (0.017)	Loss 4.0202 (3.8423)	Entropy 1.64214 (1.65082)	Top-1 acc 29.297 (34.049)	Top-5 acc 56.250 (57.986)	lr 0.02477
Train [8][1180/3239]	Time 0.665 (0.857)	Data Time 0.001 (0.017)	Loss 4.0653 (3.8426)	Entropy 1.64190 (1.65074)	Top-1 acc 29.297 (34.052)	Top-5 acc 53.516 (57.982)	lr 0.02477
Train [8][1190/3239]	Time 0.494 (0.857)	Data Time 0.001 (0.017)	Loss 3.9256 (3.8428)	Entropy 1.64183 (1.65067)	Top-1 acc 35.156 (34.052)	Top-5 acc 56.250 (57.979)	lr 0.02477
Train [8][1200/3239]	Time 0.564 (0.856)	Data Time 0.001 (0.017)	Loss 3.8452 (3.8426)	Entropy 1.64141 (1.65059)	Top-1 acc 35.938 (34.055)	Top-5 acc 55.469 (57.980)	lr 0.02477
Train [8][1210/3239]	Time 0.617 (0.856)	Data Time 0.002 (0.017)	Loss 3.8620 (3.8430)	Entropy 1.64146 (1.65052)	Top-1 acc 32.422 (34.058)	Top-5 acc 58.984 (57.969)	lr 0.02477
Train [8][1220/3239]	Time 0.583 (0.856)	Data Time 0.003 (0.017)	Loss 3.8950 (3.8428)	Entropy 1.64098 (1.65044)	Top-1 acc 34.375 (34.064)	Top-5 acc 55.469 (57.972)	lr 0.02477
Train [8][1230/3239]	Time 0.575 (0.855)	Data Time 0.001 (0.017)	Loss 3.9868 (3.8428)	Entropy 1.64079 (1.65036)	Top-1 acc 34.766 (34.059)	Top-5 acc 53.906 (57.979)	lr 0.02477
Train [8][1240/3239]	Time 0.487 (0.854)	Data Time 0.001 (0.016)	Loss 3.9613 (3.8424)	Entropy 1.64042 (1.65029)	Top-1 acc 32.422 (34.064)	Top-5 acc 57.422 (57.987)	lr 0.02477
Train [8][1250/3239]	Time 0.540 (0.854)	Data Time 0.001 (0.016)	Loss 3.5781 (3.8423)	Entropy 1.64026 (1.65021)	Top-1 acc 42.188 (34.060)	Top-5 acc 64.062 (57.990)	lr 0.02477
Train [8][1260/3239]	Time 0.584 (0.853)	Data Time 0.001 (0.016)	Loss 3.7552 (3.8426)	Entropy 1.64021 (1.65013)	Top-1 acc 33.594 (34.049)	Top-5 acc 58.594 (57.984)	lr 0.02477
Train [8][1270/3239]	Time 0.567 (0.853)	Data Time 0.001 (0.016)	Loss 3.7956 (3.8425)	Entropy 1.64004 (1.65005)	Top-1 acc 32.031 (34.050)	Top-5 acc 59.375 (57.988)	lr 0.02477
Train [8][1280/3239]	Time 0.555 (0.853)	Data Time 0.001 (0.016)	Loss 3.9134 (3.8421)	Entropy 1.63975 (1.64997)	Top-1 acc 35.547 (34.052)	Top-5 acc 58.203 (57.993)	lr 0.02477
Train [8][1290/3239]	Time 0.537 (0.852)	Data Time 0.001 (0.016)	Loss 3.9767 (3.8428)	Entropy 1.63956 (1.64989)	Top-1 acc 33.203 (34.031)	Top-5 acc 54.297 (57.975)	lr 0.02477
Train [8][1300/3239]	Time 0.600 (0.852)	Data Time 0.001 (0.016)	Loss 3.9183 (3.8433)	Entropy 1.63951 (1.64981)	Top-1 acc 34.375 (34.028)	Top-5 acc 56.250 (57.962)	lr 0.02477
Train [8][1310/3239]	Time 0.577 (0.852)	Data Time 0.001 (0.016)	Loss 3.7350 (3.8432)	Entropy 1.63955 (1.64973)	Top-1 acc 36.719 (34.034)	Top-5 acc 56.250 (57.968)	lr 0.02477
Train [8][1320/3239]	Time 0.563 (0.851)	Data Time 0.001 (0.016)	Loss 3.8491 (3.8433)	Entropy 1.63931 (1.64966)	Top-1 acc 32.422 (34.025)	Top-5 acc 55.469 (57.963)	lr 0.02477
Train [8][1330/3239]	Time 0.560 (0.851)	Data Time 0.002 (0.015)	Loss 3.9751 (3.8433)	Entropy 1.63937 (1.64958)	Top-1 acc 30.078 (34.020)	Top-5 acc 54.297 (57.959)	lr 0.02477
Train [8][1340/3239]	Time 0.541 (0.851)	Data Time 0.002 (0.015)	Loss 3.8473 (3.8434)	Entropy 1.63898 (1.64950)	Top-1 acc 35.156 (34.021)	Top-5 acc 58.203 (57.958)	lr 0.02477
Train [8][1350/3239]	Time 0.566 (0.851)	Data Time 0.001 (0.015)	Loss 4.0707 (3.8435)	Entropy 1.63875 (1.64942)	Top-1 acc 29.688 (34.023)	Top-5 acc 53.516 (57.959)	lr 0.02477
Train [8][1360/3239]	Time 0.610 (0.850)	Data Time 0.001 (0.015)	Loss 4.0857 (3.8435)	Entropy 1.63831 (1.64934)	Top-1 acc 29.297 (34.026)	Top-5 acc 56.250 (57.962)	lr 0.02476
Train [8][1370/3239]	Time 0.683 (0.850)	Data Time 0.001 (0.015)	Loss 3.8933 (3.8435)	Entropy 1.63830 (1.64926)	Top-1 acc 33.984 (34.020)	Top-5 acc 56.250 (57.961)	lr 0.02476
Train [8][1380/3239]	Time 0.558 (0.850)	Data Time 0.001 (0.015)	Loss 3.8981 (3.8437)	Entropy 1.63820 (1.64918)	Top-1 acc 32.422 (34.019)	Top-5 acc 59.766 (57.965)	lr 0.02476
Train [8][1390/3239]	Time 0.576 (0.850)	Data Time 0.001 (0.015)	Loss 4.0522 (3.8438)	Entropy 1.63813 (1.64910)	Top-1 acc 32.031 (34.023)	Top-5 acc 55.469 (57.958)	lr 0.02476
Train [8][1400/3239]	Time 0.486 (0.849)	Data Time 0.001 (0.015)	Loss 3.9562 (3.8441)	Entropy 1.63794 (1.64902)	Top-1 acc 32.031 (34.017)	Top-5 acc 56.250 (57.949)	lr 0.02476
Train [8][1410/3239]	Time 0.587 (0.849)	Data Time 0.001 (0.015)	Loss 3.9088 (3.8438)	Entropy 1.63792 (1.64895)	Top-1 acc 30.859 (34.021)	Top-5 acc 58.203 (57.953)	lr 0.02476
Train [8][1420/3239]	Time 0.574 (0.849)	Data Time 0.001 (0.015)	Loss 3.6750 (3.8439)	Entropy 1.63765 (1.64887)	Top-1 acc 42.578 (34.023)	Top-5 acc 62.109 (57.950)	lr 0.02476
Train [8][1430/3239]	Time 0.565 (0.848)	Data Time 0.001 (0.014)	Loss 3.7407 (3.8441)	Entropy 1.63759 (1.64879)	Top-1 acc 35.547 (34.023)	Top-5 acc 60.156 (57.943)	lr 0.02476
Train [8][1440/3239]	Time 0.618 (0.848)	Data Time 0.002 (0.014)	Loss 3.8159 (3.8445)	Entropy 1.63760 (1.64871)	Top-1 acc 33.203 (34.014)	Top-5 acc 58.594 (57.937)	lr 0.02476
Train [8][1450/3239]	Time 0.573 (0.848)	Data Time 0.001 (0.014)	Loss 3.9391 (3.8450)	Entropy 1.63719 (1.64863)	Top-1 acc 28.516 (34.005)	Top-5 acc 55.469 (57.927)	lr 0.02476
Train [8][1460/3239]	Time 0.578 (0.847)	Data Time 0.001 (0.014)	Loss 4.0400 (3.8455)	Entropy 1.63711 (1.64856)	Top-1 acc 30.859 (34.000)	Top-5 acc 54.688 (57.916)	lr 0.02476
Train [8][1470/3239]	Time 0.509 (0.847)	Data Time 0.001 (0.014)	Loss 3.7523 (3.8455)	Entropy 1.63719 (1.64848)	Top-1 acc 34.766 (33.994)	Top-5 acc 62.500 (57.920)	lr 0.02476
Train [8][1480/3239]	Time 0.532 (0.847)	Data Time 0.001 (0.014)	Loss 3.7634 (3.8453)	Entropy 1.63693 (1.64840)	Top-1 acc 34.766 (33.994)	Top-5 acc 62.891 (57.928)	lr 0.02476
Train [8][1490/3239]	Time 0.528 (0.847)	Data Time 0.001 (0.014)	Loss 3.8603 (3.8453)	Entropy 1.63648 (1.64832)	Top-1 acc 33.203 (33.990)	Top-5 acc 58.984 (57.933)	lr 0.02476
Train [8][1500/3239]	Time 0.536 (0.846)	Data Time 0.001 (0.014)	Loss 3.9671 (3.8450)	Entropy 1.63622 (1.64824)	Top-1 acc 30.078 (33.994)	Top-5 acc 52.734 (57.933)	lr 0.02476
Train [8][1510/3239]	Time 0.651 (0.846)	Data Time 0.001 (0.014)	Loss 3.8966 (3.8451)	Entropy 1.63597 (1.64816)	Top-1 acc 30.859 (33.994)	Top-5 acc 58.203 (57.931)	lr 0.02476
Train [8][1520/3239]	Time 0.579 (0.846)	Data Time 0.001 (0.014)	Loss 3.6878 (3.8449)	Entropy 1.63570 (1.64808)	Top-1 acc 40.625 (34.001)	Top-5 acc 63.281 (57.936)	lr 0.02476
Train [8][1530/3239]	Time 0.581 (0.858)	Data Time 0.002 (0.014)	Loss 3.8564 (3.8451)	Entropy 1.63539 (1.64800)	Top-1 acc 32.422 (33.993)	Top-5 acc 58.203 (57.925)	lr 0.02476
Train [8][1540/3239]	Time 0.578 (0.858)	Data Time 0.001 (0.014)	Loss 3.7123 (3.8446)	Entropy 1.63509 (1.64792)	Top-1 acc 36.719 (34.005)	Top-5 acc 57.812 (57.936)	lr 0.02476
Train [8][1550/3239]	Time 0.587 (0.857)	Data Time 0.002 (0.014)	Loss 3.8424 (3.8444)	Entropy 1.63473 (1.64783)	Top-1 acc 36.719 (34.005)	Top-5 acc 60.547 (57.943)	lr 0.02476
Train [8][1560/3239]	Time 0.540 (0.857)	Data Time 0.001 (0.013)	Loss 3.8269 (3.8445)	Entropy 1.63477 (1.64775)	Top-1 acc 32.812 (34.003)	Top-5 acc 57.031 (57.942)	lr 0.02476
Train [8][1570/3239]	Time 0.602 (0.856)	Data Time 0.002 (0.013)	Loss 3.7081 (3.8443)	Entropy 1.63448 (1.64767)	Top-1 acc 35.938 (34.003)	Top-5 acc 59.375 (57.951)	lr 0.02476
Train [8][1580/3239]	Time 0.686 (0.856)	Data Time 0.001 (0.013)	Loss 3.7178 (3.8443)	Entropy 1.63450 (1.64758)	Top-1 acc 33.203 (34.000)	Top-5 acc 62.500 (57.951)	lr 0.02476
Train [8][1590/3239]	Time 0.545 (0.856)	Data Time 0.001 (0.013)	Loss 3.8506 (3.8443)	Entropy 1.63425 (1.64750)	Top-1 acc 32.031 (33.991)	Top-5 acc 54.688 (57.948)	lr 0.02476
Train [8][1600/3239]	Time 0.566 (0.856)	Data Time 0.001 (0.013)	Loss 3.8948 (3.8442)	Entropy 1.63414 (1.64742)	Top-1 acc 31.641 (33.988)	Top-5 acc 57.031 (57.951)	lr 0.02476
Train [8][1610/3239]	Time 0.606 (0.855)	Data Time 0.001 (0.013)	Loss 3.9887 (3.8439)	Entropy 1.63395 (1.64734)	Top-1 acc 33.203 (33.989)	Top-5 acc 53.906 (57.963)	lr 0.02476
Train [8][1620/3239]	Time 0.622 (0.855)	Data Time 0.001 (0.013)	Loss 4.0322 (3.8442)	Entropy 1.63369 (1.64725)	Top-1 acc 27.734 (33.982)	Top-5 acc 56.641 (57.952)	lr 0.02476
Train [8][1630/3239]	Time 0.666 (0.855)	Data Time 0.001 (0.013)	Loss 3.8230 (3.8442)	Entropy 1.63359 (1.64717)	Top-1 acc 35.156 (33.989)	Top-5 acc 57.031 (57.954)	lr 0.02476
Train [8][1640/3239]	Time 0.590 (0.855)	Data Time 0.001 (0.013)	Loss 4.0940 (3.8445)	Entropy 1.63357 (1.64709)	Top-1 acc 28.906 (33.986)	Top-5 acc 50.000 (57.942)	lr 0.02476
Train [8][1650/3239]	Time 0.594 (0.854)	Data Time 0.001 (0.013)	Loss 3.7043 (3.8445)	Entropy 1.63326 (1.64700)	Top-1 acc 34.375 (33.983)	Top-5 acc 59.766 (57.942)	lr 0.02476
Train [8][1660/3239]	Time 0.609 (0.854)	Data Time 0.001 (0.013)	Loss 3.5987 (3.8448)	Entropy 1.63320 (1.64692)	Top-1 acc 39.453 (33.973)	Top-5 acc 64.844 (57.937)	lr 0.02476
Train [8][1670/3239]	Time 0.562 (0.854)	Data Time 0.001 (0.013)	Loss 3.9083 (3.8448)	Entropy 1.63310 (1.64684)	Top-1 acc 29.688 (33.970)	Top-5 acc 55.469 (57.934)	lr 0.02476
Train [8][1680/3239]	Time 0.556 (0.854)	Data Time 0.001 (0.013)	Loss 3.9542 (3.8447)	Entropy 1.63306 (1.64676)	Top-1 acc 30.078 (33.964)	Top-5 acc 53.125 (57.937)	lr 0.02476
Train [8][1690/3239]	Time 0.578 (0.854)	Data Time 0.001 (0.013)	Loss 3.7261 (3.8446)	Entropy 1.63289 (1.64667)	Top-1 acc 36.719 (33.961)	Top-5 acc 60.156 (57.936)	lr 0.02476
Train [8][1700/3239]	Time 0.690 (0.853)	Data Time 0.001 (0.013)	Loss 3.8574 (3.8444)	Entropy 1.63263 (1.64659)	Top-1 acc 33.203 (33.960)	Top-5 acc 57.812 (57.937)	lr 0.02476
Train [8][1710/3239]	Time 0.547 (0.853)	Data Time 0.001 (0.013)	Loss 3.8685 (3.8441)	Entropy 1.63224 (1.64651)	Top-1 acc 33.984 (33.967)	Top-5 acc 58.203 (57.945)	lr 0.02476
Train [8][1720/3239]	Time 0.521 (0.853)	Data Time 0.001 (0.012)	Loss 4.0149 (3.8436)	Entropy 1.63217 (1.64643)	Top-1 acc 31.641 (33.980)	Top-5 acc 52.734 (57.960)	lr 0.02476
Train [8][1730/3239]	Time 0.577 (0.852)	Data Time 0.001 (0.012)	Loss 3.9369 (3.8437)	Entropy 1.63186 (1.64634)	Top-1 acc 32.031 (33.978)	Top-5 acc 56.641 (57.959)	lr 0.02476
Train [8][1740/3239]	Time 0.452 (0.852)	Data Time 0.001 (0.012)	Loss 3.9274 (3.8440)	Entropy 1.63173 (1.64626)	Top-1 acc 34.766 (33.978)	Top-5 acc 53.516 (57.953)	lr 0.02476
Train [8][1750/3239]	Time 0.519 (0.852)	Data Time 0.001 (0.012)	Loss 3.8461 (3.8438)	Entropy 1.63162 (1.64618)	Top-1 acc 34.766 (33.981)	Top-5 acc 59.766 (57.960)	lr 0.02476
Train [8][1760/3239]	Time 0.531 (0.851)	Data Time 0.001 (0.012)	Loss 3.7988 (3.8437)	Entropy 1.63131 (1.64610)	Top-1 acc 35.938 (33.984)	Top-5 acc 59.375 (57.962)	lr 0.02476
Train [8][1770/3239]	Time 0.631 (0.851)	Data Time 0.001 (0.012)	Loss 3.9307 (3.8435)	Entropy 1.63101 (1.64601)	Top-1 acc 32.422 (33.994)	Top-5 acc 57.031 (57.965)	lr 0.02476
Train [8][1780/3239]	Time 0.591 (0.851)	Data Time 0.001 (0.012)	Loss 3.7008 (3.8436)	Entropy 1.63087 (1.64593)	Top-1 acc 37.109 (33.992)	Top-5 acc 60.938 (57.963)	lr 0.02476
Train [8][1790/3239]	Time 0.598 (0.851)	Data Time 0.001 (0.012)	Loss 3.7739 (3.8432)	Entropy 1.63090 (1.64584)	Top-1 acc 37.109 (33.993)	Top-5 acc 60.547 (57.974)	lr 0.02476
Train [8][1800/3239]	Time 0.570 (0.851)	Data Time 0.001 (0.012)	Loss 3.7441 (3.8432)	Entropy 1.63091 (1.64576)	Top-1 acc 36.719 (33.990)	Top-5 acc 62.109 (57.975)	lr 0.02476
Train [8][1810/3239]	Time 0.603 (0.850)	Data Time 0.001 (0.012)	Loss 3.7925 (3.8431)	Entropy 1.63045 (1.64568)	Top-1 acc 37.500 (33.995)	Top-5 acc 55.469 (57.978)	lr 0.02476
Train [8][1820/3239]	Time 0.559 (0.850)	Data Time 0.001 (0.012)	Loss 3.5818 (3.8430)	Entropy 1.63036 (1.64559)	Top-1 acc 42.188 (33.992)	Top-5 acc 63.281 (57.975)	lr 0.02476
Train [8][1830/3239]	Time 0.612 (0.850)	Data Time 0.001 (0.012)	Loss 3.7450 (3.8431)	Entropy 1.63012 (1.64551)	Top-1 acc 35.938 (33.987)	Top-5 acc 60.156 (57.968)	lr 0.02476
Train [8][1840/3239]	Time 0.631 (0.850)	Data Time 0.001 (0.012)	Loss 3.9625 (3.8432)	Entropy 1.62985 (1.64543)	Top-1 acc 34.766 (33.985)	Top-5 acc 53.516 (57.966)	lr 0.02476
Train [8][1850/3239]	Time 0.543 (0.850)	Data Time 0.001 (0.012)	Loss 3.6259 (3.8431)	Entropy 1.62991 (1.64534)	Top-1 acc 33.984 (33.984)	Top-5 acc 64.844 (57.965)	lr 0.02476
Train [8][1860/3239]	Time 0.506 (0.850)	Data Time 0.001 (0.012)	Loss 3.8403 (3.8429)	Entropy 1.62968 (1.64526)	Top-1 acc 36.719 (33.993)	Top-5 acc 59.375 (57.968)	lr 0.02476
Train [8][1870/3239]	Time 0.527 (0.849)	Data Time 0.001 (0.012)	Loss 3.6819 (3.8432)	Entropy 1.62950 (1.64517)	Top-1 acc 38.281 (33.989)	Top-5 acc 62.500 (57.963)	lr 0.02475
Train [8][1880/3239]	Time 0.580 (0.849)	Data Time 0.001 (0.012)	Loss 3.8111 (3.8428)	Entropy 1.62941 (1.64509)	Top-1 acc 35.156 (33.995)	Top-5 acc 58.984 (57.973)	lr 0.02475
Train [8][1890/3239]	Time 0.316 (0.849)	Data Time 0.001 (0.012)	Loss 3.7984 (3.8425)	Entropy 1.62932 (1.64501)	Top-1 acc 30.469 (33.999)	Top-5 acc 57.422 (57.980)	lr 0.02475
Train [8][1900/3239]	Time 0.543 (0.849)	Data Time 0.001 (0.012)	Loss 3.7255 (3.8424)	Entropy 1.62931 (1.64493)	Top-1 acc 33.984 (34.005)	Top-5 acc 62.500 (57.981)	lr 0.02475
Train [8][1910/3239]	Time 0.576 (0.848)	Data Time 0.001 (0.012)	Loss 3.8598 (3.8423)	Entropy 1.62888 (1.64484)	Top-1 acc 32.812 (34.004)	Top-5 acc 53.516 (57.976)	lr 0.02475
Train [8][1920/3239]	Time 0.617 (0.848)	Data Time 0.001 (0.011)	Loss 3.8896 (3.8422)	Entropy 1.62878 (1.64476)	Top-1 acc 36.328 (34.005)	Top-5 acc 55.469 (57.977)	lr 0.02475
Train [8][1930/3239]	Time 0.556 (0.848)	Data Time 0.001 (0.011)	Loss 3.8224 (3.8422)	Entropy 1.62873 (1.64468)	Top-1 acc 35.156 (34.004)	Top-5 acc 57.031 (57.976)	lr 0.02475
Train [8][1940/3239]	Time 0.701 (0.848)	Data Time 0.001 (0.011)	Loss 3.8092 (3.8424)	Entropy 1.62860 (1.64459)	Top-1 acc 35.938 (33.998)	Top-5 acc 60.547 (57.965)	lr 0.02475
Train [8][1950/3239]	Time 0.394 (0.847)	Data Time 0.001 (0.011)	Loss 3.9075 (3.8424)	Entropy 1.62812 (1.64451)	Top-1 acc 31.641 (33.998)	Top-5 acc 58.203 (57.964)	lr 0.02475
Train [8][1960/3239]	Time 0.524 (0.847)	Data Time 0.001 (0.011)	Loss 3.7637 (3.8423)	Entropy 1.62783 (1.64443)	Top-1 acc 38.281 (33.997)	Top-5 acc 60.938 (57.965)	lr 0.02475
Train [8][1970/3239]	Time 0.576 (0.847)	Data Time 0.001 (0.011)	Loss 3.6438 (3.8422)	Entropy 1.62790 (1.64434)	Top-1 acc 30.859 (33.997)	Top-5 acc 65.234 (57.962)	lr 0.02475
Train [8][1980/3239]	Time 0.502 (0.847)	Data Time 0.001 (0.011)	Loss 3.8286 (3.8424)	Entropy 1.62755 (1.64426)	Top-1 acc 30.469 (33.994)	Top-5 acc 60.547 (57.960)	lr 0.02475
Train [8][1990/3239]	Time 0.621 (0.847)	Data Time 0.001 (0.011)	Loss 3.7332 (3.8421)	Entropy 1.62722 (1.64418)	Top-1 acc 37.500 (33.998)	Top-5 acc 61.328 (57.965)	lr 0.02475
Train [8][2000/3239]	Time 0.527 (0.847)	Data Time 0.001 (0.011)	Loss 3.8468 (3.8421)	Entropy 1.62699 (1.64409)	Top-1 acc 33.594 (33.994)	Top-5 acc 55.859 (57.959)	lr 0.02475
Train [8][2010/3239]	Time 0.686 (0.846)	Data Time 0.001 (0.011)	Loss 3.9197 (3.8417)	Entropy 1.62670 (1.64400)	Top-1 acc 34.375 (34.000)	Top-5 acc 53.125 (57.966)	lr 0.02475
Train [8][2020/3239]	Time 0.560 (0.846)	Data Time 0.001 (0.011)	Loss 3.8375 (3.8421)	Entropy 1.62635 (1.64392)	Top-1 acc 35.547 (33.995)	Top-5 acc 58.984 (57.960)	lr 0.02475
Train [8][2030/3239]	Time 0.594 (0.846)	Data Time 0.001 (0.011)	Loss 3.7778 (3.8421)	Entropy 1.62581 (1.64383)	Top-1 acc 37.500 (33.993)	Top-5 acc 59.766 (57.963)	lr 0.02475
Train [8][2040/3239]	Time 0.561 (0.846)	Data Time 0.001 (0.011)	Loss 3.9074 (3.8423)	Entropy 1.62564 (1.64374)	Top-1 acc 33.203 (33.979)	Top-5 acc 55.469 (57.954)	lr 0.02475
Train [8][2050/3239]	Time 0.551 (0.846)	Data Time 0.001 (0.011)	Loss 3.7361 (3.8415)	Entropy 1.62542 (1.64365)	Top-1 acc 36.328 (33.997)	Top-5 acc 58.594 (57.972)	lr 0.02475
Train [8][2060/3239]	Time 0.577 (0.845)	Data Time 0.001 (0.011)	Loss 3.7283 (3.8412)	Entropy 1.62535 (1.64356)	Top-1 acc 40.234 (34.010)	Top-5 acc 61.328 (57.980)	lr 0.02475
Train [8][2070/3239]	Time 0.632 (0.845)	Data Time 0.001 (0.011)	Loss 3.7660 (3.8412)	Entropy 1.62513 (1.64348)	Top-1 acc 38.281 (34.011)	Top-5 acc 60.938 (57.979)	lr 0.02475
Train [8][2080/3239]	Time 0.591 (0.845)	Data Time 0.002 (0.011)	Loss 3.7559 (3.8414)	Entropy 1.62499 (1.64339)	Top-1 acc 37.500 (34.007)	Top-5 acc 60.938 (57.976)	lr 0.02475
Train [8][2090/3239]	Time 0.540 (0.845)	Data Time 0.001 (0.011)	Loss 3.9552 (3.8413)	Entropy 1.62473 (1.64330)	Top-1 acc 30.859 (34.011)	Top-5 acc 55.078 (57.978)	lr 0.02475
Train [8][2100/3239]	Time 0.548 (0.844)	Data Time 0.001 (0.011)	Loss 3.9825 (3.8414)	Entropy 1.62435 (1.64321)	Top-1 acc 31.250 (34.007)	Top-5 acc 56.641 (57.978)	lr 0.02475
Train [8][2110/3239]	Time 0.547 (0.844)	Data Time 0.001 (0.011)	Loss 3.6940 (3.8412)	Entropy 1.62471 (1.64312)	Top-1 acc 34.375 (34.007)	Top-5 acc 60.938 (57.980)	lr 0.02475
Train [8][2120/3239]	Time 0.561 (0.844)	Data Time 0.001 (0.011)	Loss 3.9020 (3.8411)	Entropy 1.62457 (1.64304)	Top-1 acc 33.203 (34.011)	Top-5 acc 58.984 (57.983)	lr 0.02475
Train [8][2130/3239]	Time 0.682 (0.844)	Data Time 0.001 (0.011)	Loss 4.0342 (3.8416)	Entropy 1.62441 (1.64295)	Top-1 acc 30.469 (34.002)	Top-5 acc 55.469 (57.968)	lr 0.02475
Train [8][2140/3239]	Time 0.547 (0.844)	Data Time 0.001 (0.011)	Loss 3.7068 (3.8415)	Entropy 1.62420 (1.64286)	Top-1 acc 33.984 (33.992)	Top-5 acc 58.203 (57.967)	lr 0.02475
Train [8][2150/3239]	Time 0.569 (0.844)	Data Time 0.001 (0.010)	Loss 3.8507 (3.8413)	Entropy 1.62386 (1.64277)	Top-1 acc 33.203 (34.000)	Top-5 acc 55.078 (57.968)	lr 0.02475
Train [8][2160/3239]	Time 0.575 (0.844)	Data Time 0.001 (0.010)	Loss 3.7761 (3.8411)	Entropy 1.62381 (1.64269)	Top-1 acc 37.500 (34.006)	Top-5 acc 61.719 (57.976)	lr 0.02475
Train [8][2170/3239]	Time 0.545 (0.843)	Data Time 0.001 (0.010)	Loss 3.8838 (3.8409)	Entropy 1.62381 (1.64260)	Top-1 acc 32.812 (34.006)	Top-5 acc 57.031 (57.977)	lr 0.02475
Train [8][2180/3239]	Time 0.661 (0.852)	Data Time 0.005 (0.010)	Loss 3.9206 (3.8410)	Entropy 1.62346 (1.64251)	Top-1 acc 32.422 (34.007)	Top-5 acc 54.688 (57.974)	lr 0.02475
Train [8][2190/3239]	Time 0.581 (0.852)	Data Time 0.002 (0.010)	Loss 3.8789 (3.8407)	Entropy 1.62316 (1.64243)	Top-1 acc 36.328 (34.015)	Top-5 acc 56.250 (57.981)	lr 0.02475
Train [8][2200/3239]	Time 0.655 (0.852)	Data Time 0.001 (0.010)	Loss 3.8154 (3.8407)	Entropy 1.62291 (1.64234)	Top-1 acc 35.547 (34.012)	Top-5 acc 60.938 (57.978)	lr 0.02475
Train [8][2210/3239]	Time 0.576 (0.852)	Data Time 0.002 (0.010)	Loss 3.5369 (3.8409)	Entropy 1.62299 (1.64225)	Top-1 acc 41.016 (34.009)	Top-5 acc 65.234 (57.971)	lr 0.02475
Train [8][2220/3239]	Time 0.585 (0.852)	Data Time 0.001 (0.010)	Loss 3.6313 (3.8406)	Entropy 1.62290 (1.64216)	Top-1 acc 36.328 (34.017)	Top-5 acc 62.109 (57.974)	lr 0.02475
Train [8][2230/3239]	Time 0.460 (0.851)	Data Time 0.001 (0.010)	Loss 3.8660 (3.8405)	Entropy 1.62267 (1.64208)	Top-1 acc 31.641 (34.020)	Top-5 acc 54.688 (57.976)	lr 0.02475
Train [8][2240/3239]	Time 0.648 (0.851)	Data Time 0.001 (0.010)	Loss 3.7443 (3.8405)	Entropy 1.62260 (1.64199)	Top-1 acc 35.156 (34.020)	Top-5 acc 60.938 (57.977)	lr 0.02475
Train [8][2250/3239]	Time 0.548 (0.851)	Data Time 0.003 (0.010)	Loss 3.8278 (3.8406)	Entropy 1.62246 (1.64190)	Top-1 acc 34.375 (34.024)	Top-5 acc 58.203 (57.979)	lr 0.02475
Train [8][2260/3239]	Time 0.568 (0.851)	Data Time 0.001 (0.010)	Loss 3.9374 (3.8408)	Entropy 1.62216 (1.64182)	Top-1 acc 29.688 (34.017)	Top-5 acc 53.516 (57.976)	lr 0.02475
Train [8][2270/3239]	Time 0.655 (0.851)	Data Time 0.001 (0.010)	Loss 3.9248 (3.8408)	Entropy 1.62220 (1.64173)	Top-1 acc 29.688 (34.018)	Top-5 acc 54.297 (57.973)	lr 0.02475
Train [8][2280/3239]	Time 0.568 (0.851)	Data Time 0.002 (0.010)	Loss 3.8711 (3.8410)	Entropy 1.62205 (1.64164)	Top-1 acc 32.812 (34.014)	Top-5 acc 57.812 (57.973)	lr 0.02475
Train [8][2290/3239]	Time 0.559 (0.851)	Data Time 0.001 (0.010)	Loss 3.9431 (3.8409)	Entropy 1.62166 (1.64156)	Top-1 acc 34.375 (34.018)	Top-5 acc 57.031 (57.977)	lr 0.02475
Train [8][2300/3239]	Time 0.557 (0.850)	Data Time 0.001 (0.010)	Loss 3.9501 (3.8409)	Entropy 1.62153 (1.64147)	Top-1 acc 34.766 (34.021)	Top-5 acc 53.906 (57.976)	lr 0.02475
Train [8][2310/3239]	Time 0.524 (0.850)	Data Time 0.001 (0.010)	Loss 3.8216 (3.8408)	Entropy 1.62158 (1.64139)	Top-1 acc 33.594 (34.023)	Top-5 acc 58.594 (57.978)	lr 0.02475
Train [8][2320/3239]	Time 0.547 (0.850)	Data Time 0.001 (0.010)	Loss 3.8018 (3.8406)	Entropy 1.62144 (1.64130)	Top-1 acc 32.422 (34.028)	Top-5 acc 58.984 (57.981)	lr 0.02475
Train [8][2330/3239]	Time 0.583 (0.850)	Data Time 0.001 (0.010)	Loss 3.8148 (3.8404)	Entropy 1.62140 (1.64121)	Top-1 acc 33.984 (34.030)	Top-5 acc 58.984 (57.986)	lr 0.02475
Train [8][2340/3239]	Time 0.632 (0.850)	Data Time 0.002 (0.010)	Loss 3.7609 (3.8403)	Entropy 1.62105 (1.64113)	Top-1 acc 35.156 (34.030)	Top-5 acc 59.766 (57.986)	lr 0.02475
Train [8][2350/3239]	Time 0.536 (0.850)	Data Time 0.001 (0.010)	Loss 3.9647 (3.8403)	Entropy 1.62086 (1.64104)	Top-1 acc 28.906 (34.030)	Top-5 acc 52.734 (57.986)	lr 0.02475
Train [8][2360/3239]	Time 0.546 (0.850)	Data Time 0.001 (0.010)	Loss 3.9533 (3.8404)	Entropy 1.62070 (1.64096)	Top-1 acc 33.203 (34.026)	Top-5 acc 56.641 (57.987)	lr 0.02475
Train [8][2370/3239]	Time 0.603 (0.849)	Data Time 0.002 (0.010)	Loss 3.8207 (3.8401)	Entropy 1.62058 (1.64087)	Top-1 acc 34.375 (34.033)	Top-5 acc 58.984 (57.994)	lr 0.02474
Train [8][2380/3239]	Time 0.563 (0.849)	Data Time 0.001 (0.010)	Loss 4.0760 (3.8402)	Entropy 1.62037 (1.64079)	Top-1 acc 32.812 (34.037)	Top-5 acc 53.125 (57.990)	lr 0.02474
Train [8][2390/3239]	Time 0.487 (0.849)	Data Time 0.001 (0.010)	Loss 3.8717 (3.8399)	Entropy 1.62023 (1.64070)	Top-1 acc 30.859 (34.037)	Top-5 acc 58.203 (57.996)	lr 0.02474
Train [8][2400/3239]	Time 0.511 (0.849)	Data Time 0.001 (0.010)	Loss 3.8404 (3.8400)	Entropy 1.61993 (1.64062)	Top-1 acc 33.594 (34.040)	Top-5 acc 56.641 (57.995)	lr 0.02474
Train [8][2410/3239]	Time 0.527 (0.848)	Data Time 0.001 (0.010)	Loss 3.8941 (3.8400)	Entropy 1.61966 (1.64053)	Top-1 acc 30.859 (34.037)	Top-5 acc 58.203 (57.991)	lr 0.02474
Train [8][2420/3239]	Time 0.614 (0.848)	Data Time 0.001 (0.010)	Loss 3.5615 (3.8399)	Entropy 1.61943 (1.64044)	Top-1 acc 34.375 (34.033)	Top-5 acc 64.453 (57.997)	lr 0.02474
Train [8][2430/3239]	Time 0.560 (0.848)	Data Time 0.001 (0.010)	Loss 3.8841 (3.8399)	Entropy 1.61904 (1.64036)	Top-1 acc 33.203 (34.033)	Top-5 acc 58.203 (58.000)	lr 0.02474
Train [8][2440/3239]	Time 0.633 (0.848)	Data Time 0.001 (0.010)	Loss 3.8480 (3.8399)	Entropy 1.61884 (1.64027)	Top-1 acc 32.812 (34.035)	Top-5 acc 56.641 (57.996)	lr 0.02474
Train [8][2450/3239]	Time 0.595 (0.848)	Data Time 0.001 (0.010)	Loss 4.0799 (3.8400)	Entropy 1.61863 (1.64018)	Top-1 acc 29.688 (34.035)	Top-5 acc 50.000 (57.995)	lr 0.02474
Train [8][2460/3239]	Time 0.584 (0.848)	Data Time 0.001 (0.010)	Loss 3.7669 (3.8398)	Entropy 1.61833 (1.64009)	Top-1 acc 33.203 (34.040)	Top-5 acc 55.469 (58.001)	lr 0.02474
Train [8][2470/3239]	Time 0.510 (0.848)	Data Time 0.001 (0.009)	Loss 3.7652 (3.8396)	Entropy 1.61813 (1.64001)	Top-1 acc 35.938 (34.039)	Top-5 acc 65.234 (58.007)	lr 0.02474
Train [8][2480/3239]	Time 0.595 (0.848)	Data Time 0.001 (0.009)	Loss 3.7829 (3.8396)	Entropy 1.61782 (1.63992)	Top-1 acc 35.547 (34.038)	Top-5 acc 60.156 (58.008)	lr 0.02474
Train [8][2490/3239]	Time 0.526 (0.847)	Data Time 0.001 (0.009)	Loss 3.7467 (3.8395)	Entropy 1.61752 (1.63983)	Top-1 acc 35.156 (34.043)	Top-5 acc 59.766 (58.009)	lr 0.02474
Train [8][2500/3239]	Time 0.571 (0.847)	Data Time 0.001 (0.009)	Loss 3.9900 (3.8394)	Entropy 1.61724 (1.63974)	Top-1 acc 30.859 (34.042)	Top-5 acc 54.297 (58.013)	lr 0.02474
Train [8][2510/3239]	Time 0.650 (0.847)	Data Time 0.002 (0.009)	Loss 3.6445 (3.8392)	Entropy 1.61691 (1.63965)	Top-1 acc 39.453 (34.048)	Top-5 acc 60.938 (58.018)	lr 0.02474
Train [8][2520/3239]	Time 0.631 (0.847)	Data Time 0.001 (0.009)	Loss 3.7117 (3.8391)	Entropy 1.61682 (1.63956)	Top-1 acc 33.203 (34.052)	Top-5 acc 63.281 (58.022)	lr 0.02474
Train [8][2530/3239]	Time 0.610 (0.847)	Data Time 0.001 (0.009)	Loss 3.6012 (3.8388)	Entropy 1.61683 (1.63947)	Top-1 acc 39.453 (34.053)	Top-5 acc 61.328 (58.027)	lr 0.02474
Train [8][2540/3239]	Time 0.544 (0.847)	Data Time 0.001 (0.009)	Loss 4.0668 (3.8388)	Entropy 1.61655 (1.63938)	Top-1 acc 31.250 (34.054)	Top-5 acc 51.172 (58.023)	lr 0.02474
Train [8][2550/3239]	Time 0.632 (0.847)	Data Time 0.001 (0.009)	Loss 3.7916 (3.8388)	Entropy 1.61655 (1.63929)	Top-1 acc 37.109 (34.053)	Top-5 acc 57.031 (58.023)	lr 0.02474
Train [8][2560/3239]	Time 0.633 (0.846)	Data Time 0.001 (0.009)	Loss 3.6067 (3.8386)	Entropy 1.61616 (1.63920)	Top-1 acc 41.406 (34.057)	Top-5 acc 63.672 (58.025)	lr 0.02474
Train [8][2570/3239]	Time 0.561 (0.846)	Data Time 0.001 (0.009)	Loss 3.8776 (3.8387)	Entropy 1.61605 (1.63911)	Top-1 acc 32.422 (34.058)	Top-5 acc 58.203 (58.024)	lr 0.02474
Train [8][2580/3239]	Time 0.467 (0.846)	Data Time 0.001 (0.009)	Loss 3.6714 (3.8387)	Entropy 1.61598 (1.63902)	Top-1 acc 36.719 (34.057)	Top-5 acc 61.719 (58.024)	lr 0.02474
Train [8][2590/3239]	Time 0.495 (0.846)	Data Time 0.001 (0.009)	Loss 4.0094 (3.8390)	Entropy 1.61578 (1.63893)	Top-1 acc 30.859 (34.050)	Top-5 acc 53.516 (58.018)	lr 0.02474
Train [8][2600/3239]	Time 0.570 (0.846)	Data Time 0.001 (0.009)	Loss 3.8715 (3.8388)	Entropy 1.61566 (1.63884)	Top-1 acc 29.297 (34.056)	Top-5 acc 58.594 (58.026)	lr 0.02474
Train [8][2610/3239]	Time 0.580 (0.846)	Data Time 0.001 (0.009)	Loss 3.9587 (3.8386)	Entropy 1.61545 (1.63875)	Top-1 acc 34.375 (34.061)	Top-5 acc 57.422 (58.032)	lr 0.02474
Train [8][2620/3239]	Time 0.526 (0.845)	Data Time 0.001 (0.009)	Loss 3.8042 (3.8383)	Entropy 1.61530 (1.63866)	Top-1 acc 35.547 (34.065)	Top-5 acc 58.984 (58.039)	lr 0.02474
Train [8][2630/3239]	Time 0.708 (0.845)	Data Time 0.001 (0.009)	Loss 3.7781 (3.8381)	Entropy 1.61478 (1.63857)	Top-1 acc 32.812 (34.069)	Top-5 acc 58.594 (58.043)	lr 0.02474
Train [8][2640/3239]	Time 0.532 (0.845)	Data Time 0.001 (0.009)	Loss 3.8837 (3.8380)	Entropy 1.61483 (1.63848)	Top-1 acc 30.469 (34.069)	Top-5 acc 55.859 (58.042)	lr 0.02474
Train [8][2650/3239]	Time 0.550 (0.845)	Data Time 0.001 (0.009)	Loss 3.8646 (3.8380)	Entropy 1.61472 (1.63839)	Top-1 acc 31.250 (34.064)	Top-5 acc 57.031 (58.043)	lr 0.02474
Train [8][2660/3239]	Time 0.530 (0.845)	Data Time 0.001 (0.009)	Loss 3.7017 (3.8379)	Entropy 1.61439 (1.63830)	Top-1 acc 35.156 (34.067)	Top-5 acc 61.328 (58.045)	lr 0.02474
Train [8][2670/3239]	Time 0.535 (0.845)	Data Time 0.001 (0.009)	Loss 4.0287 (3.8380)	Entropy 1.61461 (1.63822)	Top-1 acc 34.766 (34.064)	Top-5 acc 51.172 (58.041)	lr 0.02474
Train [8][2680/3239]	Time 0.516 (0.845)	Data Time 0.001 (0.009)	Loss 3.7448 (3.8378)	Entropy 1.61461 (1.63813)	Top-1 acc 34.766 (34.067)	Top-5 acc 58.984 (58.043)	lr 0.02474
Train [8][2690/3239]	Time 0.564 (0.845)	Data Time 0.001 (0.009)	Loss 3.8023 (3.8377)	Entropy 1.61429 (1.63804)	Top-1 acc 33.984 (34.068)	Top-5 acc 58.594 (58.048)	lr 0.02474
Train [8][2700/3239]	Time 0.640 (0.845)	Data Time 0.001 (0.009)	Loss 3.8350 (3.8377)	Entropy 1.61414 (1.63795)	Top-1 acc 34.766 (34.072)	Top-5 acc 55.859 (58.046)	lr 0.02474
Train [8][2710/3239]	Time 0.588 (0.844)	Data Time 0.002 (0.009)	Loss 3.8593 (3.8377)	Entropy 1.61410 (1.63786)	Top-1 acc 33.203 (34.071)	Top-5 acc 59.766 (58.043)	lr 0.02474
Train [8][2720/3239]	Time 0.604 (0.844)	Data Time 0.001 (0.009)	Loss 3.6649 (3.8377)	Entropy 1.61385 (1.63778)	Top-1 acc 35.547 (34.072)	Top-5 acc 63.281 (58.042)	lr 0.02474
Train [8][2730/3239]	Time 0.427 (0.844)	Data Time 0.001 (0.009)	Loss 3.7724 (3.8378)	Entropy 1.61389 (1.63769)	Top-1 acc 35.547 (34.069)	Top-5 acc 60.547 (58.039)	lr 0.02474
Train [8][2740/3239]	Time 0.556 (0.844)	Data Time 0.001 (0.009)	Loss 3.8072 (3.8377)	Entropy 1.61387 (1.63760)	Top-1 acc 39.062 (34.072)	Top-5 acc 58.594 (58.038)	lr 0.02474
Train [8][2750/3239]	Time 0.528 (0.844)	Data Time 0.001 (0.009)	Loss 3.8642 (3.8375)	Entropy 1.61363 (1.63751)	Top-1 acc 35.938 (34.074)	Top-5 acc 57.031 (58.041)	lr 0.02474
Train [8][2760/3239]	Time 0.621 (0.844)	Data Time 0.001 (0.009)	Loss 3.7911 (3.8376)	Entropy 1.61353 (1.63743)	Top-1 acc 32.031 (34.070)	Top-5 acc 57.031 (58.037)	lr 0.02474
Train [8][2770/3239]	Time 0.551 (0.844)	Data Time 0.001 (0.009)	Loss 3.5203 (3.8374)	Entropy 1.61326 (1.63734)	Top-1 acc 41.797 (34.076)	Top-5 acc 64.844 (58.045)	lr 0.02474
Train [8][2780/3239]	Time 0.587 (0.843)	Data Time 0.001 (0.009)	Loss 3.9527 (3.8372)	Entropy 1.61332 (1.63726)	Top-1 acc 31.641 (34.082)	Top-5 acc 50.000 (58.047)	lr 0.02474
Train [8][2790/3239]	Time 0.592 (0.843)	Data Time 0.001 (0.009)	Loss 3.7538 (3.8372)	Entropy 1.61307 (1.63717)	Top-1 acc 36.328 (34.081)	Top-5 acc 60.156 (58.045)	lr 0.02474
Train [8][2800/3239]	Time 0.508 (0.843)	Data Time 0.001 (0.009)	Loss 3.9148 (3.8370)	Entropy 1.61266 (1.63708)	Top-1 acc 32.031 (34.081)	Top-5 acc 55.859 (58.049)	lr 0.02474
Train [8][2810/3239]	Time 0.505 (0.843)	Data Time 0.001 (0.009)	Loss 4.0624 (3.8370)	Entropy 1.61250 (1.63700)	Top-1 acc 33.594 (34.085)	Top-5 acc 53.125 (58.048)	lr 0.02474
Train [8][2820/3239]	Time 0.494 (0.843)	Data Time 0.002 (0.009)	Loss 3.8058 (3.8368)	Entropy 1.61229 (1.63691)	Top-1 acc 37.500 (34.091)	Top-5 acc 62.891 (58.059)	lr 0.02474
Train [8][2830/3239]	Time 0.552 (0.843)	Data Time 0.001 (0.009)	Loss 3.9423 (3.8369)	Entropy 1.61183 (1.63682)	Top-1 acc 32.031 (34.085)	Top-5 acc 59.766 (58.056)	lr 0.02474
Train [8][2840/3239]	Time 0.715 (0.850)	Data Time 0.002 (0.009)	Loss 3.7956 (3.8370)	Entropy 1.61164 (1.63673)	Top-1 acc 32.812 (34.081)	Top-5 acc 59.766 (58.052)	lr 0.02474
Train [8][2850/3239]	Time 0.547 (0.850)	Data Time 0.002 (0.009)	Loss 3.9495 (3.8371)	Entropy 1.61129 (1.63664)	Top-1 acc 30.859 (34.078)	Top-5 acc 53.125 (58.049)	lr 0.02473
Train [8][2860/3239]	Time 0.614 (0.850)	Data Time 0.002 (0.009)	Loss 3.6843 (3.8371)	Entropy 1.61101 (1.63655)	Top-1 acc 40.234 (34.078)	Top-5 acc 59.375 (58.048)	lr 0.02473
Train [8][2870/3239]	Time 0.547 (0.850)	Data Time 0.001 (0.009)	Loss 3.8314 (3.8373)	Entropy 1.61108 (1.63647)	Top-1 acc 32.812 (34.072)	Top-5 acc 61.328 (58.042)	lr 0.02473
Train [8][2880/3239]	Time 0.539 (0.849)	Data Time 0.001 (0.009)	Loss 3.8777 (3.8373)	Entropy 1.61113 (1.63638)	Top-1 acc 33.984 (34.070)	Top-5 acc 55.078 (58.046)	lr 0.02473
Train [8][2890/3239]	Time 0.513 (0.849)	Data Time 0.003 (0.009)	Loss 3.9010 (3.8373)	Entropy 1.61087 (1.63629)	Top-1 acc 32.422 (34.074)	Top-5 acc 55.078 (58.048)	lr 0.02473
Train [8][2900/3239]	Time 0.579 (0.849)	Data Time 0.001 (0.009)	Loss 3.9682 (3.8371)	Entropy 1.61079 (1.63620)	Top-1 acc 30.078 (34.075)	Top-5 acc 54.688 (58.049)	lr 0.02473
Train [8][2910/3239]	Time 0.539 (0.849)	Data Time 0.001 (0.008)	Loss 3.9038 (3.8370)	Entropy 1.61046 (1.63611)	Top-1 acc 34.766 (34.076)	Top-5 acc 58.594 (58.052)	lr 0.02473
Train [8][2920/3239]	Time 0.621 (0.849)	Data Time 0.001 (0.008)	Loss 3.9245 (3.8369)	Entropy 1.61018 (1.63603)	Top-1 acc 36.328 (34.079)	Top-5 acc 55.469 (58.052)	lr 0.02473
Train [8][2930/3239]	Time 0.528 (0.849)	Data Time 0.001 (0.008)	Loss 3.9386 (3.8369)	Entropy 1.61004 (1.63594)	Top-1 acc 29.688 (34.078)	Top-5 acc 56.250 (58.051)	lr 0.02473
Train [8][2940/3239]	Time 0.593 (0.849)	Data Time 0.003 (0.008)	Loss 4.0696 (3.8371)	Entropy 1.60999 (1.63585)	Top-1 acc 30.078 (34.078)	Top-5 acc 55.469 (58.048)	lr 0.02473
Train [8][2950/3239]	Time 0.585 (0.849)	Data Time 0.001 (0.008)	Loss 3.5401 (3.8370)	Entropy 1.60974 (1.63576)	Top-1 acc 39.062 (34.080)	Top-5 acc 60.156 (58.049)	lr 0.02473
Train [8][2960/3239]	Time 0.566 (0.849)	Data Time 0.001 (0.008)	Loss 3.8628 (3.8370)	Entropy 1.60942 (1.63567)	Top-1 acc 34.766 (34.081)	Top-5 acc 54.688 (58.047)	lr 0.02473
Train [8][2970/3239]	Time 0.553 (0.849)	Data Time 0.001 (0.008)	Loss 3.6688 (3.8368)	Entropy 1.60936 (1.63559)	Top-1 acc 42.578 (34.089)	Top-5 acc 62.891 (58.053)	lr 0.02473
Train [8][2980/3239]	Time 0.606 (0.848)	Data Time 0.001 (0.008)	Loss 3.8340 (3.8368)	Entropy 1.60923 (1.63550)	Top-1 acc 32.422 (34.087)	Top-5 acc 59.766 (58.055)	lr 0.02473
Train [8][2990/3239]	Time 0.591 (0.848)	Data Time 0.001 (0.008)	Loss 3.8691 (3.8366)	Entropy 1.60921 (1.63541)	Top-1 acc 37.500 (34.090)	Top-5 acc 57.422 (58.057)	lr 0.02473
Train [8][3000/3239]	Time 0.570 (0.848)	Data Time 0.001 (0.008)	Loss 3.8093 (3.8366)	Entropy 1.60906 (1.63532)	Top-1 acc 36.328 (34.091)	Top-5 acc 57.422 (58.054)	lr 0.02473
Train [8][3010/3239]	Time 0.593 (0.848)	Data Time 0.001 (0.008)	Loss 3.7843 (3.8365)	Entropy 1.60914 (1.63524)	Top-1 acc 33.594 (34.095)	Top-5 acc 60.156 (58.059)	lr 0.02473
Train [8][3020/3239]	Time 0.535 (0.848)	Data Time 0.001 (0.008)	Loss 3.8467 (3.8367)	Entropy 1.60869 (1.63515)	Top-1 acc 32.812 (34.090)	Top-5 acc 57.812 (58.054)	lr 0.02473
Train [8][3030/3239]	Time 0.677 (0.848)	Data Time 0.001 (0.008)	Loss 3.6872 (3.8367)	Entropy 1.60868 (1.63506)	Top-1 acc 38.672 (34.092)	Top-5 acc 61.719 (58.053)	lr 0.02473
Train [8][3040/3239]	Time 0.563 (0.848)	Data Time 0.001 (0.008)	Loss 3.7526 (3.8367)	Entropy 1.60861 (1.63497)	Top-1 acc 41.406 (34.094)	Top-5 acc 61.719 (58.052)	lr 0.02473
Train [8][3050/3239]	Time 0.579 (0.848)	Data Time 0.001 (0.008)	Loss 3.6681 (3.8366)	Entropy 1.60859 (1.63489)	Top-1 acc 38.281 (34.097)	Top-5 acc 62.109 (58.058)	lr 0.02473
Train [8][3060/3239]	Time 0.571 (0.847)	Data Time 0.001 (0.008)	Loss 4.1381 (3.8368)	Entropy 1.60847 (1.63480)	Top-1 acc 28.125 (34.094)	Top-5 acc 50.391 (58.053)	lr 0.02473
Train [8][3070/3239]	Time 0.605 (0.847)	Data Time 0.001 (0.008)	Loss 3.7641 (3.8366)	Entropy 1.60836 (1.63472)	Top-1 acc 34.766 (34.097)	Top-5 acc 60.156 (58.059)	lr 0.02473
Train [8][3080/3239]	Time 0.601 (0.847)	Data Time 0.001 (0.008)	Loss 3.8320 (3.8365)	Entropy 1.60840 (1.63463)	Top-1 acc 34.375 (34.098)	Top-5 acc 60.156 (58.063)	lr 0.02473
Train [8][3090/3239]	Time 0.567 (0.847)	Data Time 0.001 (0.008)	Loss 3.7276 (3.8364)	Entropy 1.60827 (1.63455)	Top-1 acc 36.719 (34.104)	Top-5 acc 59.766 (58.066)	lr 0.02473
Train [8][3100/3239]	Time 0.687 (0.847)	Data Time 0.001 (0.008)	Loss 3.5963 (3.8362)	Entropy 1.60791 (1.63446)	Top-1 acc 35.547 (34.105)	Top-5 acc 64.062 (58.068)	lr 0.02473
Train [8][3110/3239]	Time 0.547 (0.847)	Data Time 0.001 (0.008)	Loss 3.5693 (3.8363)	Entropy 1.60784 (1.63438)	Top-1 acc 43.359 (34.107)	Top-5 acc 62.891 (58.068)	lr 0.02473
Train [8][3120/3239]	Time 0.590 (0.847)	Data Time 0.001 (0.008)	Loss 3.7658 (3.8363)	Entropy 1.60773 (1.63429)	Top-1 acc 31.250 (34.106)	Top-5 acc 57.422 (58.068)	lr 0.02473
Train [8][3130/3239]	Time 0.555 (0.847)	Data Time 0.001 (0.008)	Loss 3.8983 (3.8364)	Entropy 1.60772 (1.63421)	Top-1 acc 33.984 (34.103)	Top-5 acc 57.812 (58.069)	lr 0.02473
Train [8][3140/3239]	Time 0.518 (0.847)	Data Time 0.039 (0.008)	Loss 3.7779 (3.8364)	Entropy 1.60773 (1.63412)	Top-1 acc 34.375 (34.106)	Top-5 acc 59.766 (58.068)	lr 0.02473
Train [8][3150/3239]	Time 0.605 (0.847)	Data Time 0.001 (0.008)	Loss 3.8591 (3.8363)	Entropy 1.60765 (1.63404)	Top-1 acc 32.812 (34.112)	Top-5 acc 60.938 (58.073)	lr 0.02473
Train [8][3160/3239]	Time 0.605 (0.846)	Data Time 0.001 (0.008)	Loss 3.8058 (3.8363)	Entropy 1.60750 (1.63395)	Top-1 acc 34.766 (34.108)	Top-5 acc 60.938 (58.075)	lr 0.02473
Train [8][3170/3239]	Time 0.663 (0.846)	Data Time 0.001 (0.008)	Loss 3.7024 (3.8363)	Entropy 1.60731 (1.63387)	Top-1 acc 33.594 (34.107)	Top-5 acc 64.453 (58.074)	lr 0.02473
Train [8][3180/3239]	Time 0.576 (0.846)	Data Time 0.000 (0.008)	Loss 3.6035 (3.8361)	Entropy 1.60721 (1.63379)	Top-1 acc 38.672 (34.111)	Top-5 acc 61.719 (58.075)	lr 0.02473
Train [8][3190/3239]	Time 0.610 (0.846)	Data Time 0.000 (0.008)	Loss 3.7270 (3.8360)	Entropy 1.60704 (1.63370)	Top-1 acc 35.547 (34.111)	Top-5 acc 58.984 (58.080)	lr 0.02473
Train [8][3200/3239]	Time 0.587 (0.846)	Data Time 0.000 (0.008)	Loss 3.6205 (3.8357)	Entropy 1.60672 (1.63362)	Top-1 acc 37.109 (34.120)	Top-5 acc 62.891 (58.086)	lr 0.02473
Train [8][3210/3239]	Time 0.529 (0.846)	Data Time 0.000 (0.008)	Loss 3.8795 (3.8357)	Entropy 1.60648 (1.63354)	Top-1 acc 33.203 (34.119)	Top-5 acc 53.125 (58.082)	lr 0.02473
Train [8][3220/3239]	Time 0.575 (0.846)	Data Time 0.000 (0.008)	Loss 3.5269 (3.8354)	Entropy 1.60623 (1.63345)	Top-1 acc 39.453 (34.121)	Top-5 acc 63.281 (58.086)	lr 0.02473
Train [8][3230/3239]	Time 0.514 (0.845)	Data Time 0.000 (0.008)	Loss 3.8179 (3.8352)	Entropy 1.60604 (1.63337)	Top-1 acc 35.156 (34.125)	Top-5 acc 56.641 (58.088)	lr 0.02473
Train [8][3239/3239]	Time 1.491 (0.845)	Data Time 0.000 (0.008)	Loss 4.0979 (3.8351)	Entropy 1.60601 (1.63329)	Top-1 acc 30.864 (34.128)	Top-5 acc 50.617 (58.088)	lr 0.02473
==========Valid [8/120]	loss 2.644	top-1 acc 43.525 (43.525)	top-5 acc 68.264	Train top-1 34.128	top-5 58.088	Entropy 1.60601	Latency-None: 0.000ms	Flops: 542.77M
Train [9][0/3239]	Time 18.007 (18.007)	Data Time 16.564 (16.564)	Loss 3.7925 (3.7925)	Entropy 1.60595 (1.60595)	Top-1 acc 37.500 (37.500)	Top-5 acc 62.500 (62.500)	lr 0.02473
Train [9][10/3239]	Time 0.550 (2.449)	Data Time 0.001 (1.510)	Loss 3.7993 (3.8297)	Entropy 1.60559 (1.60588)	Top-1 acc 33.984 (33.629)	Top-5 acc 60.938 (58.913)	lr 0.02473
Train [9][20/3239]	Time 0.563 (1.651)	Data Time 0.001 (0.792)	Loss 3.7759 (3.8245)	Entropy 1.60497 (1.60566)	Top-1 acc 33.984 (33.929)	Top-5 acc 60.156 (58.891)	lr 0.02473
Train [9][30/3239]	Time 0.579 (1.371)	Data Time 0.001 (0.537)	Loss 3.5535 (3.8428)	Entropy 1.60473 (1.60540)	Top-1 acc 37.891 (33.430)	Top-5 acc 64.062 (58.317)	lr 0.02473
Train [9][40/3239]	Time 0.419 (1.226)	Data Time 0.001 (0.407)	Loss 3.8964 (3.8295)	Entropy 1.60439 (1.60520)	Top-1 acc 35.938 (33.965)	Top-5 acc 54.688 (58.641)	lr 0.02473
Train [9][50/3239]	Time 0.668 (1.139)	Data Time 0.001 (0.327)	Loss 3.8488 (3.8290)	Entropy 1.60421 (1.60503)	Top-1 acc 32.422 (34.015)	Top-5 acc 59.766 (58.601)	lr 0.02473
Train [9][60/3239]	Time 0.591 (1.084)	Data Time 0.001 (0.274)	Loss 3.9946 (3.8145)	Entropy 1.60421 (1.60490)	Top-1 acc 29.688 (34.253)	Top-5 acc 55.469 (58.920)	lr 0.02473
Train [9][70/3239]	Time 0.530 (1.045)	Data Time 0.001 (0.236)	Loss 3.6844 (3.8153)	Entropy 1.60410 (1.60480)	Top-1 acc 41.406 (34.237)	Top-5 acc 63.281 (58.918)	lr 0.02473
Train [9][80/3239]	Time 0.553 (1.016)	Data Time 0.001 (0.207)	Loss 3.8151 (3.8171)	Entropy 1.60427 (1.60472)	Top-1 acc 34.766 (34.211)	Top-5 acc 57.031 (58.873)	lr 0.02473
Train [9][90/3239]	Time 0.542 (0.992)	Data Time 0.001 (0.185)	Loss 3.7135 (3.8190)	Entropy 1.60393 (1.60465)	Top-1 acc 35.547 (34.190)	Top-5 acc 59.766 (58.813)	lr 0.02472
Train [9][100/3239]	Time 0.601 (0.974)	Data Time 0.001 (0.167)	Loss 3.7556 (3.8117)	Entropy 1.60370 (1.60458)	Top-1 acc 33.594 (34.491)	Top-5 acc 62.500 (58.880)	lr 0.02472
Train [9][110/3239]	Time 0.596 (0.961)	Data Time 0.001 (0.152)	Loss 3.8751 (3.8058)	Entropy 1.60375 (1.60450)	Top-1 acc 32.812 (34.646)	Top-5 acc 58.594 (58.963)	lr 0.02472
Train [9][120/3239]	Time 0.617 (0.949)	Data Time 0.001 (0.139)	Loss 3.9736 (3.8002)	Entropy 1.60337 (1.60442)	Top-1 acc 33.594 (34.762)	Top-5 acc 56.250 (59.136)	lr 0.02472
Train [9][130/3239]	Time 0.571 (0.939)	Data Time 0.001 (0.129)	Loss 3.7431 (3.8009)	Entropy 1.60301 (1.60434)	Top-1 acc 41.406 (34.742)	Top-5 acc 57.422 (59.104)	lr 0.02472
Train [9][140/3239]	Time 0.591 (0.932)	Data Time 0.001 (0.120)	Loss 3.8426 (3.8004)	Entropy 1.60288 (1.60424)	Top-1 acc 33.203 (34.630)	Top-5 acc 55.078 (59.018)	lr 0.02472
Train [9][150/3239]	Time 0.536 (0.925)	Data Time 0.001 (0.112)	Loss 3.7530 (3.7989)	Entropy 1.60282 (1.60415)	Top-1 acc 31.250 (34.660)	Top-5 acc 60.938 (59.018)	lr 0.02472
Train [9][160/3239]	Time 0.557 (0.916)	Data Time 0.002 (0.105)	Loss 3.6928 (3.8001)	Entropy 1.60258 (1.60406)	Top-1 acc 38.672 (34.603)	Top-5 acc 62.500 (58.997)	lr 0.02472
Train [9][170/3239]	Time 0.592 (0.910)	Data Time 0.001 (0.099)	Loss 3.7022 (3.7983)	Entropy 1.60241 (1.60397)	Top-1 acc 36.328 (34.677)	Top-5 acc 58.984 (58.959)	lr 0.02472
Train [9][180/3239]	Time 0.571 (0.906)	Data Time 0.001 (0.094)	Loss 3.8486 (3.7935)	Entropy 1.60234 (1.60388)	Top-1 acc 37.891 (34.845)	Top-5 acc 57.031 (59.075)	lr 0.02472
Train [9][190/3239]	Time 0.405 (0.901)	Data Time 0.001 (0.089)	Loss 3.9358 (3.7916)	Entropy 1.60242 (1.60380)	Top-1 acc 36.328 (34.929)	Top-5 acc 55.078 (59.103)	lr 0.02472
Train [9][200/3239]	Time 0.582 (0.895)	Data Time 0.001 (0.085)	Loss 3.7443 (3.7948)	Entropy 1.60236 (1.60373)	Top-1 acc 32.812 (34.880)	Top-5 acc 60.156 (59.070)	lr 0.02472
Train [9][210/3239]	Time 0.595 (0.891)	Data Time 0.001 (0.081)	Loss 3.7114 (3.7952)	Entropy 1.60205 (1.60366)	Top-1 acc 37.891 (34.880)	Top-5 acc 62.109 (59.071)	lr 0.02472
Train [9][220/3239]	Time 0.572 (0.886)	Data Time 0.001 (0.077)	Loss 3.7033 (3.7953)	Entropy 1.60180 (1.60358)	Top-1 acc 35.547 (34.865)	Top-5 acc 59.766 (59.067)	lr 0.02472
Train [9][230/3239]	Time 0.593 (0.883)	Data Time 0.002 (0.074)	Loss 3.8905 (3.7964)	Entropy 1.60168 (1.60350)	Top-1 acc 32.812 (34.860)	Top-5 acc 57.031 (59.000)	lr 0.02472
Train [9][240/3239]	Time 0.576 (0.881)	Data Time 0.001 (0.071)	Loss 3.9204 (3.7998)	Entropy 1.60138 (1.60342)	Top-1 acc 30.469 (34.800)	Top-5 acc 55.859 (58.941)	lr 0.02472
Train [9][250/3239]	Time 0.654 (0.955)	Data Time 0.004 (0.068)	Loss 3.7082 (3.7996)	Entropy 1.60105 (1.60333)	Top-1 acc 37.891 (34.847)	Top-5 acc 60.547 (58.930)	lr 0.02472
Train [9][260/3239]	Time 0.555 (0.950)	Data Time 0.002 (0.066)	Loss 3.7793 (3.8017)	Entropy 1.60084 (1.60324)	Top-1 acc 35.156 (34.822)	Top-5 acc 59.375 (58.911)	lr 0.02472
Train [9][270/3239]	Time 0.539 (0.945)	Data Time 0.001 (0.064)	Loss 3.6161 (3.8021)	Entropy 1.60094 (1.60315)	Top-1 acc 39.844 (34.838)	Top-5 acc 63.672 (58.911)	lr 0.02472
Train [9][280/3239]	Time 0.528 (0.940)	Data Time 0.001 (0.061)	Loss 3.8172 (3.8023)	Entropy 1.60090 (1.60307)	Top-1 acc 35.156 (34.864)	Top-5 acc 57.422 (58.898)	lr 0.02472
Train [9][290/3239]	Time 0.664 (0.936)	Data Time 0.001 (0.059)	Loss 3.5997 (3.8014)	Entropy 1.60044 (1.60299)	Top-1 acc 40.234 (34.868)	Top-5 acc 65.234 (58.907)	lr 0.02472
Train [9][300/3239]	Time 0.590 (0.932)	Data Time 0.001 (0.057)	Loss 3.8667 (3.8029)	Entropy 1.60035 (1.60291)	Top-1 acc 33.984 (34.863)	Top-5 acc 55.859 (58.869)	lr 0.02472
Train [9][310/3239]	Time 0.585 (0.929)	Data Time 0.001 (0.056)	Loss 3.7957 (3.8030)	Entropy 1.59995 (1.60282)	Top-1 acc 33.984 (34.860)	Top-5 acc 58.594 (58.859)	lr 0.02472
Train [9][320/3239]	Time 0.614 (0.925)	Data Time 0.001 (0.054)	Loss 3.9110 (3.8039)	Entropy 1.59953 (1.60273)	Top-1 acc 33.203 (34.813)	Top-5 acc 58.594 (58.861)	lr 0.02472
Train [9][330/3239]	Time 0.588 (0.921)	Data Time 0.001 (0.052)	Loss 3.8649 (3.8044)	Entropy 1.59904 (1.60263)	Top-1 acc 30.469 (34.781)	Top-5 acc 57.422 (58.857)	lr 0.02472
Train [9][340/3239]	Time 0.479 (0.917)	Data Time 0.001 (0.051)	Loss 3.6041 (3.8039)	Entropy 1.59879 (1.60252)	Top-1 acc 40.625 (34.787)	Top-5 acc 62.500 (58.881)	lr 0.02472
Train [9][350/3239]	Time 0.534 (0.914)	Data Time 0.003 (0.050)	Loss 3.9461 (3.8046)	Entropy 1.59852 (1.60241)	Top-1 acc 32.031 (34.786)	Top-5 acc 52.344 (58.836)	lr 0.02472
Train [9][360/3239]	Time 0.589 (0.910)	Data Time 0.001 (0.048)	Loss 3.8816 (3.8037)	Entropy 1.59819 (1.60230)	Top-1 acc 33.984 (34.797)	Top-5 acc 54.297 (58.838)	lr 0.02472
Train [9][370/3239]	Time 0.591 (0.908)	Data Time 0.001 (0.047)	Loss 3.5847 (3.8047)	Entropy 1.59810 (1.60219)	Top-1 acc 36.719 (34.770)	Top-5 acc 63.281 (58.797)	lr 0.02472
Train [9][380/3239]	Time 0.599 (0.905)	Data Time 0.002 (0.046)	Loss 3.9462 (3.8040)	Entropy 1.59795 (1.60208)	Top-1 acc 28.516 (34.789)	Top-5 acc 53.516 (58.805)	lr 0.02472
Train [9][390/3239]	Time 0.569 (0.903)	Data Time 0.001 (0.045)	Loss 3.8028 (3.8039)	Entropy 1.59766 (1.60198)	Top-1 acc 35.156 (34.776)	Top-5 acc 60.547 (58.812)	lr 0.02472
Train [9][400/3239]	Time 0.599 (0.901)	Data Time 0.001 (0.044)	Loss 3.7149 (3.8026)	Entropy 1.59740 (1.60187)	Top-1 acc 35.938 (34.811)	Top-5 acc 64.062 (58.839)	lr 0.02472
Train [9][410/3239]	Time 0.554 (0.899)	Data Time 0.001 (0.043)	Loss 3.6720 (3.8023)	Entropy 1.59712 (1.60175)	Top-1 acc 34.375 (34.811)	Top-5 acc 62.109 (58.864)	lr 0.02472
Train [9][420/3239]	Time 0.579 (0.897)	Data Time 0.001 (0.042)	Loss 3.8551 (3.8019)	Entropy 1.59696 (1.60164)	Top-1 acc 33.594 (34.803)	Top-5 acc 58.203 (58.859)	lr 0.02472
Train [9][430/3239]	Time 0.551 (0.896)	Data Time 0.001 (0.041)	Loss 3.9530 (3.8022)	Entropy 1.59697 (1.60153)	Top-1 acc 32.812 (34.806)	Top-5 acc 55.078 (58.859)	lr 0.02472
Train [9][440/3239]	Time 0.557 (0.894)	Data Time 0.002 (0.040)	Loss 3.6833 (3.8025)	Entropy 1.59676 (1.60143)	Top-1 acc 33.984 (34.803)	Top-5 acc 59.766 (58.845)	lr 0.02472
Train [9][450/3239]	Time 0.568 (0.893)	Data Time 0.001 (0.039)	Loss 3.8311 (3.8012)	Entropy 1.59650 (1.60132)	Top-1 acc 32.422 (34.825)	Top-5 acc 54.688 (58.855)	lr 0.02472
Train [9][460/3239]	Time 0.542 (0.891)	Data Time 0.001 (0.038)	Loss 3.7335 (3.8011)	Entropy 1.59651 (1.60122)	Top-1 acc 32.812 (34.805)	Top-5 acc 63.281 (58.869)	lr 0.02472
Train [9][470/3239]	Time 0.695 (0.890)	Data Time 0.001 (0.038)	Loss 3.8048 (3.8004)	Entropy 1.59601 (1.60112)	Top-1 acc 31.641 (34.827)	Top-5 acc 58.203 (58.859)	lr 0.02472
Train [9][480/3239]	Time 0.533 (0.888)	Data Time 0.001 (0.037)	Loss 3.9613 (3.8006)	Entropy 1.59565 (1.60100)	Top-1 acc 31.641 (34.820)	Top-5 acc 51.562 (58.851)	lr 0.02472
Train [9][490/3239]	Time 0.536 (0.886)	Data Time 0.001 (0.036)	Loss 3.7233 (3.8028)	Entropy 1.59538 (1.60089)	Top-1 acc 33.984 (34.778)	Top-5 acc 62.500 (58.817)	lr 0.02472
Train [9][500/3239]	Time 0.567 (0.885)	Data Time 0.001 (0.035)	Loss 3.7487 (3.8043)	Entropy 1.59509 (1.60078)	Top-1 acc 32.812 (34.740)	Top-5 acc 62.109 (58.811)	lr 0.02472
Train [9][510/3239]	Time 0.560 (0.883)	Data Time 0.001 (0.035)	Loss 3.9128 (3.8049)	Entropy 1.59456 (1.60066)	Top-1 acc 30.859 (34.737)	Top-5 acc 57.422 (58.796)	lr 0.02472
Train [9][520/3239]	Time 0.494 (0.881)	Data Time 0.001 (0.034)	Loss 3.6820 (3.8043)	Entropy 1.59454 (1.60055)	Top-1 acc 38.672 (34.755)	Top-5 acc 59.766 (58.811)	lr 0.02472
Train [9][530/3239]	Time 0.432 (0.879)	Data Time 0.001 (0.034)	Loss 3.7076 (3.8049)	Entropy 1.59446 (1.60043)	Top-1 acc 40.234 (34.766)	Top-5 acc 63.281 (58.796)	lr 0.02472
Train [9][540/3239]	Time 0.686 (0.878)	Data Time 0.001 (0.033)	Loss 3.6980 (3.8035)	Entropy 1.59425 (1.60032)	Top-1 acc 36.719 (34.786)	Top-5 acc 61.719 (58.811)	lr 0.02472
Train [9][550/3239]	Time 0.551 (0.877)	Data Time 0.001 (0.032)	Loss 3.7997 (3.8030)	Entropy 1.59381 (1.60021)	Top-1 acc 35.938 (34.805)	Top-5 acc 60.938 (58.828)	lr 0.02472
Train [9][560/3239]	Time 0.604 (0.876)	Data Time 0.001 (0.032)	Loss 3.6684 (3.8029)	Entropy 1.59388 (1.60009)	Top-1 acc 40.234 (34.797)	Top-5 acc 62.109 (58.837)	lr 0.02471
Train [9][570/3239]	Time 0.567 (0.875)	Data Time 0.001 (0.031)	Loss 3.6237 (3.8017)	Entropy 1.59369 (1.59998)	Top-1 acc 34.375 (34.829)	Top-5 acc 63.281 (58.867)	lr 0.02471
Train [9][580/3239]	Time 0.526 (0.874)	Data Time 0.001 (0.031)	Loss 3.8814 (3.8004)	Entropy 1.59364 (1.59988)	Top-1 acc 32.422 (34.844)	Top-5 acc 58.594 (58.890)	lr 0.02471
Train [9][590/3239]	Time 0.534 (0.873)	Data Time 0.001 (0.030)	Loss 3.6685 (3.7990)	Entropy 1.59361 (1.59977)	Top-1 acc 38.281 (34.895)	Top-5 acc 60.547 (58.930)	lr 0.02471
Train [9][600/3239]	Time 0.597 (0.872)	Data Time 0.001 (0.030)	Loss 3.7240 (3.7978)	Entropy 1.59339 (1.59967)	Top-1 acc 37.500 (34.916)	Top-5 acc 61.719 (58.949)	lr 0.02471
Train [9][610/3239]	Time 0.683 (0.872)	Data Time 0.001 (0.029)	Loss 3.6254 (3.7969)	Entropy 1.59318 (1.59956)	Top-1 acc 38.281 (34.954)	Top-5 acc 66.797 (58.968)	lr 0.02471
Train [9][620/3239]	Time 0.561 (0.871)	Data Time 0.001 (0.029)	Loss 3.8057 (3.7974)	Entropy 1.59325 (1.59946)	Top-1 acc 33.984 (34.940)	Top-5 acc 57.812 (58.946)	lr 0.02471
Train [9][630/3239]	Time 0.638 (0.870)	Data Time 0.001 (0.029)	Loss 3.5472 (3.7963)	Entropy 1.59290 (1.59936)	Top-1 acc 38.672 (34.966)	Top-5 acc 66.406 (58.969)	lr 0.02471
Train [9][640/3239]	Time 0.567 (0.869)	Data Time 0.001 (0.028)	Loss 3.9367 (3.7960)	Entropy 1.59280 (1.59926)	Top-1 acc 30.859 (34.970)	Top-5 acc 57.422 (58.959)	lr 0.02471
Train [9][650/3239]	Time 0.587 (0.869)	Data Time 0.001 (0.028)	Loss 4.0268 (3.7962)	Entropy 1.59275 (1.59916)	Top-1 acc 34.766 (34.969)	Top-5 acc 54.688 (58.947)	lr 0.02471
Train [9][660/3239]	Time 0.637 (0.868)	Data Time 0.001 (0.027)	Loss 3.7255 (3.7950)	Entropy 1.59276 (1.59906)	Top-1 acc 37.500 (34.988)	Top-5 acc 57.812 (58.962)	lr 0.02471
Train [9][670/3239]	Time 0.543 (0.867)	Data Time 0.001 (0.027)	Loss 3.9424 (3.7956)	Entropy 1.59290 (1.59897)	Top-1 acc 33.594 (34.985)	Top-5 acc 60.547 (58.952)	lr 0.02471
Train [9][680/3239]	Time 0.531 (0.866)	Data Time 0.001 (0.027)	Loss 3.7033 (3.7955)	Entropy 1.59271 (1.59888)	Top-1 acc 37.891 (34.996)	Top-5 acc 60.547 (58.961)	lr 0.02471
Train [9][690/3239]	Time 0.534 (0.865)	Data Time 0.004 (0.026)	Loss 3.7546 (3.7955)	Entropy 1.59241 (1.59879)	Top-1 acc 35.156 (35.009)	Top-5 acc 59.375 (58.961)	lr 0.02471
Train [9][700/3239]	Time 0.647 (0.863)	Data Time 0.001 (0.026)	Loss 3.6723 (3.7954)	Entropy 1.59221 (1.59870)	Top-1 acc 32.812 (34.998)	Top-5 acc 61.719 (58.948)	lr 0.02471
Train [9][710/3239]	Time 0.542 (0.862)	Data Time 0.001 (0.026)	Loss 3.9614 (3.7968)	Entropy 1.59227 (1.59861)	Top-1 acc 32.422 (34.979)	Top-5 acc 53.125 (58.924)	lr 0.02471
Train [9][720/3239]	Time 0.529 (0.861)	Data Time 0.001 (0.025)	Loss 3.7153 (3.7979)	Entropy 1.59178 (1.59852)	Top-1 acc 35.547 (34.957)	Top-5 acc 60.547 (58.894)	lr 0.02471
Train [9][730/3239]	Time 0.679 (0.861)	Data Time 0.001 (0.025)	Loss 3.7667 (3.7986)	Entropy 1.59154 (1.59842)	Top-1 acc 40.625 (34.955)	Top-5 acc 60.156 (58.871)	lr 0.02471
Train [9][740/3239]	Time 0.635 (0.860)	Data Time 0.001 (0.025)	Loss 3.8855 (3.7990)	Entropy 1.59121 (1.59833)	Top-1 acc 32.812 (34.936)	Top-5 acc 59.766 (58.864)	lr 0.02471
Train [9][750/3239]	Time 0.589 (0.859)	Data Time 0.001 (0.024)	Loss 3.7449 (3.7999)	Entropy 1.59098 (1.59823)	Top-1 acc 34.375 (34.905)	Top-5 acc 62.109 (58.856)	lr 0.02471
Train [9][760/3239]	Time 0.559 (0.859)	Data Time 0.020 (0.024)	Loss 3.8174 (3.7995)	Entropy 1.59101 (1.59814)	Top-1 acc 35.938 (34.916)	Top-5 acc 57.031 (58.860)	lr 0.02471
Train [9][770/3239]	Time 0.559 (0.858)	Data Time 0.001 (0.024)	Loss 3.7275 (3.7988)	Entropy 1.59069 (1.59804)	Top-1 acc 40.234 (34.948)	Top-5 acc 60.156 (58.873)	lr 0.02471
Train [9][780/3239]	Time 0.590 (0.858)	Data Time 0.001 (0.023)	Loss 3.7654 (3.7985)	Entropy 1.59060 (1.59795)	Top-1 acc 38.672 (34.963)	Top-5 acc 57.812 (58.886)	lr 0.02471
Train [9][790/3239]	Time 0.566 (0.857)	Data Time 0.003 (0.023)	Loss 3.8301 (3.7988)	Entropy 1.59031 (1.59786)	Top-1 acc 33.203 (34.965)	Top-5 acc 58.984 (58.887)	lr 0.02471
Train [9][800/3239]	Time 0.630 (0.857)	Data Time 0.001 (0.023)	Loss 3.9262 (3.7999)	Entropy 1.59030 (1.59776)	Top-1 acc 31.250 (34.931)	Top-5 acc 54.297 (58.853)	lr 0.02471
Train [9][810/3239]	Time 0.586 (0.856)	Data Time 0.001 (0.023)	Loss 3.8439 (3.8001)	Entropy 1.58980 (1.59767)	Top-1 acc 36.328 (34.917)	Top-5 acc 56.250 (58.850)	lr 0.02471
Train [9][820/3239]	Time 0.570 (0.856)	Data Time 0.001 (0.022)	Loss 3.8388 (3.7994)	Entropy 1.58967 (1.59757)	Top-1 acc 37.109 (34.942)	Top-5 acc 57.812 (58.869)	lr 0.02471
Train [9][830/3239]	Time 0.562 (0.855)	Data Time 0.001 (0.022)	Loss 3.7350 (3.7986)	Entropy 1.58967 (1.59748)	Top-1 acc 35.156 (34.956)	Top-5 acc 58.203 (58.878)	lr 0.02471
Train [9][840/3239]	Time 0.593 (0.855)	Data Time 0.001 (0.022)	Loss 3.8693 (3.7986)	Entropy 1.58947 (1.59738)	Top-1 acc 32.422 (34.942)	Top-5 acc 58.594 (58.879)	lr 0.02471
Train [9][850/3239]	Time 0.609 (0.855)	Data Time 0.001 (0.022)	Loss 3.9037 (3.7988)	Entropy 1.58910 (1.59729)	Top-1 acc 32.812 (34.926)	Top-5 acc 56.250 (58.870)	lr 0.02471
Train [9][860/3239]	Time 0.574 (0.854)	Data Time 0.001 (0.021)	Loss 3.4506 (3.7978)	Entropy 1.58902 (1.59719)	Top-1 acc 39.062 (34.935)	Top-5 acc 68.359 (58.898)	lr 0.02471
Train [9][870/3239]	Time 0.592 (0.854)	Data Time 0.001 (0.021)	Loss 3.8211 (3.7976)	Entropy 1.58846 (1.59710)	Top-1 acc 35.547 (34.940)	Top-5 acc 59.375 (58.906)	lr 0.02471
Train [9][880/3239]	Time 0.539 (0.853)	Data Time 0.001 (0.021)	Loss 3.9216 (3.7970)	Entropy 1.58805 (1.59700)	Top-1 acc 34.375 (34.955)	Top-5 acc 56.641 (58.923)	lr 0.02471
Train [9][890/3239]	Time 0.557 (0.852)	Data Time 0.001 (0.021)	Loss 3.8089 (3.7973)	Entropy 1.58775 (1.59690)	Top-1 acc 35.938 (34.943)	Top-5 acc 60.156 (58.920)	lr 0.02471
Train [9][900/3239]	Time 0.596 (0.852)	Data Time 0.002 (0.021)	Loss 3.6964 (3.7969)	Entropy 1.58723 (1.59679)	Top-1 acc 37.891 (34.946)	Top-5 acc 61.719 (58.937)	lr 0.02471
Train [9][910/3239]	Time 0.508 (0.873)	Data Time 0.002 (0.020)	Loss 3.7732 (3.7967)	Entropy 1.58709 (1.59669)	Top-1 acc 36.328 (34.965)	Top-5 acc 57.812 (58.931)	lr 0.02471
Train [9][920/3239]	Time 0.510 (0.872)	Data Time 0.002 (0.020)	Loss 3.5562 (3.7959)	Entropy 1.58695 (1.59658)	Top-1 acc 40.234 (34.985)	Top-5 acc 64.062 (58.950)	lr 0.02471
Train [9][930/3239]	Time 0.573 (0.871)	Data Time 0.001 (0.020)	Loss 3.8919 (3.7956)	Entropy 1.58672 (1.59648)	Top-1 acc 32.812 (35.008)	Top-5 acc 57.031 (58.952)	lr 0.02471
Train [9][940/3239]	Time 0.605 (0.871)	Data Time 0.001 (0.020)	Loss 3.7829 (3.7961)	Entropy 1.58653 (1.59637)	Top-1 acc 35.156 (34.997)	Top-5 acc 57.812 (58.942)	lr 0.02471
Train [9][950/3239]	Time 0.551 (0.870)	Data Time 0.001 (0.020)	Loss 3.7406 (3.7964)	Entropy 1.58647 (1.59627)	Top-1 acc 34.766 (34.989)	Top-5 acc 58.984 (58.938)	lr 0.02471
Train [9][960/3239]	Time 0.591 (0.870)	Data Time 0.001 (0.020)	Loss 3.7661 (3.7969)	Entropy 1.58648 (1.59617)	Top-1 acc 32.812 (34.982)	Top-5 acc 57.812 (58.921)	lr 0.02471
Train [9][970/3239]	Time 0.526 (0.870)	Data Time 0.001 (0.019)	Loss 3.9362 (3.7970)	Entropy 1.58651 (1.59607)	Top-1 acc 35.156 (34.980)	Top-5 acc 57.031 (58.923)	lr 0.02471
Train [9][980/3239]	Time 0.555 (0.869)	Data Time 0.001 (0.019)	Loss 3.8270 (3.7967)	Entropy 1.58621 (1.59597)	Top-1 acc 37.500 (34.985)	Top-5 acc 60.938 (58.937)	lr 0.02471
Train [9][990/3239]	Time 0.483 (0.869)	Data Time 0.001 (0.019)	Loss 3.7195 (3.7976)	Entropy 1.58614 (1.59587)	Top-1 acc 32.031 (34.952)	Top-5 acc 62.109 (58.913)	lr 0.02471
Train [9][1000/3239]	Time 0.522 (0.868)	Data Time 0.001 (0.019)	Loss 3.7294 (3.7973)	Entropy 1.58622 (1.59578)	Top-1 acc 37.109 (34.963)	Top-5 acc 61.719 (58.934)	lr 0.02471
Train [9][1010/3239]	Time 0.580 (0.867)	Data Time 0.001 (0.019)	Loss 3.8910 (3.7968)	Entropy 1.58582 (1.59568)	Top-1 acc 31.641 (34.968)	Top-5 acc 58.594 (58.941)	lr 0.02471
Train [9][1020/3239]	Time 0.500 (0.866)	Data Time 0.001 (0.019)	Loss 3.7244 (3.7968)	Entropy 1.58556 (1.59558)	Top-1 acc 38.672 (34.968)	Top-5 acc 60.547 (58.948)	lr 0.02471
Train [9][1030/3239]	Time 0.567 (0.866)	Data Time 0.001 (0.018)	Loss 3.8716 (3.7970)	Entropy 1.58534 (1.59548)	Top-1 acc 34.375 (34.966)	Top-5 acc 58.203 (58.951)	lr 0.02470
Train [9][1040/3239]	Time 0.529 (0.865)	Data Time 0.001 (0.018)	Loss 3.5992 (3.7971)	Entropy 1.58525 (1.59539)	Top-1 acc 40.625 (34.969)	Top-5 acc 64.453 (58.943)	lr 0.02470
Train [9][1050/3239]	Time 0.586 (0.865)	Data Time 0.001 (0.018)	Loss 3.6595 (3.7967)	Entropy 1.58492 (1.59529)	Top-1 acc 36.328 (34.980)	Top-5 acc 60.938 (58.945)	lr 0.02470
Train [9][1060/3239]	Time 0.578 (0.865)	Data Time 0.001 (0.018)	Loss 3.5149 (3.7969)	Entropy 1.58491 (1.59519)	Top-1 acc 40.625 (34.975)	Top-5 acc 61.719 (58.943)	lr 0.02470
Train [9][1070/3239]	Time 0.610 (0.864)	Data Time 0.001 (0.018)	Loss 3.8307 (3.7966)	Entropy 1.58437 (1.59509)	Top-1 acc 33.594 (34.978)	Top-5 acc 57.031 (58.946)	lr 0.02470
Train [9][1080/3239]	Time 0.701 (0.864)	Data Time 0.002 (0.018)	Loss 3.5977 (3.7959)	Entropy 1.58455 (1.59500)	Top-1 acc 39.062 (34.984)	Top-5 acc 65.234 (58.960)	lr 0.02470
Train [9][1090/3239]	Time 0.503 (0.863)	Data Time 0.001 (0.018)	Loss 3.8445 (3.7961)	Entropy 1.58420 (1.59490)	Top-1 acc 32.812 (34.980)	Top-5 acc 56.641 (58.964)	lr 0.02470
Train [9][1100/3239]	Time 0.606 (0.863)	Data Time 0.001 (0.017)	Loss 3.7478 (3.7962)	Entropy 1.58406 (1.59480)	Top-1 acc 36.328 (34.972)	Top-5 acc 62.109 (58.963)	lr 0.02470
Train [9][1110/3239]	Time 0.637 (0.863)	Data Time 0.004 (0.017)	Loss 3.5980 (3.7961)	Entropy 1.58403 (1.59471)	Top-1 acc 41.406 (34.973)	Top-5 acc 60.156 (58.964)	lr 0.02470
Train [9][1120/3239]	Time 0.591 (0.862)	Data Time 0.001 (0.017)	Loss 3.7359 (3.7962)	Entropy 1.58407 (1.59461)	Top-1 acc 36.328 (34.968)	Top-5 acc 60.938 (58.960)	lr 0.02470
Train [9][1130/3239]	Time 0.567 (0.862)	Data Time 0.001 (0.017)	Loss 3.7672 (3.7962)	Entropy 1.58401 (1.59452)	Top-1 acc 34.375 (34.961)	Top-5 acc 60.156 (58.969)	lr 0.02470
Train [9][1140/3239]	Time 0.533 (0.862)	Data Time 0.001 (0.017)	Loss 3.6424 (3.7959)	Entropy 1.58396 (1.59442)	Top-1 acc 34.766 (34.961)	Top-5 acc 64.844 (58.980)	lr 0.02470
Train [9][1150/3239]	Time 0.684 (0.861)	Data Time 0.001 (0.017)	Loss 3.9746 (3.7961)	Entropy 1.58379 (1.59433)	Top-1 acc 33.984 (34.959)	Top-5 acc 57.422 (58.972)	lr 0.02470
Train [9][1160/3239]	Time 0.569 (0.861)	Data Time 0.001 (0.017)	Loss 3.6221 (3.7960)	Entropy 1.58340 (1.59424)	Top-1 acc 38.281 (34.965)	Top-5 acc 66.016 (58.980)	lr 0.02470
Train [9][1170/3239]	Time 0.603 (0.860)	Data Time 0.001 (0.016)	Loss 3.8930 (3.7962)	Entropy 1.58322 (1.59415)	Top-1 acc 34.766 (34.963)	Top-5 acc 57.422 (58.974)	lr 0.02470
Train [9][1180/3239]	Time 0.517 (0.860)	Data Time 0.002 (0.016)	Loss 3.8143 (3.7972)	Entropy 1.58304 (1.59405)	Top-1 acc 32.422 (34.948)	Top-5 acc 58.203 (58.956)	lr 0.02470
Train [9][1190/3239]	Time 0.562 (0.859)	Data Time 0.001 (0.016)	Loss 3.8667 (3.7969)	Entropy 1.58299 (1.59396)	Top-1 acc 32.812 (34.951)	Top-5 acc 59.766 (58.969)	lr 0.02470
Train [9][1200/3239]	Time 0.570 (0.858)	Data Time 0.001 (0.016)	Loss 3.7009 (3.7968)	Entropy 1.58268 (1.59387)	Top-1 acc 32.031 (34.940)	Top-5 acc 64.453 (58.974)	lr 0.02470
Train [9][1210/3239]	Time 0.554 (0.858)	Data Time 0.001 (0.016)	Loss 3.8754 (3.7967)	Entropy 1.58261 (1.59378)	Top-1 acc 32.031 (34.941)	Top-5 acc 58.984 (58.978)	lr 0.02470
Train [9][1220/3239]	Time 0.689 (0.858)	Data Time 0.001 (0.016)	Loss 3.7949 (3.7969)	Entropy 1.58223 (1.59368)	Top-1 acc 34.766 (34.935)	Top-5 acc 60.938 (58.977)	lr 0.02470
Train [9][1230/3239]	Time 0.612 (0.857)	Data Time 0.001 (0.016)	Loss 3.8374 (3.7973)	Entropy 1.58208 (1.59359)	Top-1 acc 35.547 (34.938)	Top-5 acc 60.156 (58.977)	lr 0.02470
Train [9][1240/3239]	Time 0.553 (0.857)	Data Time 0.001 (0.016)	Loss 3.8373 (3.7971)	Entropy 1.58218 (1.59350)	Top-1 acc 32.422 (34.943)	Top-5 acc 55.859 (58.977)	lr 0.02470
Train [9][1250/3239]	Time 0.536 (0.857)	Data Time 0.001 (0.016)	Loss 3.7828 (3.7975)	Entropy 1.58197 (1.59341)	Top-1 acc 33.203 (34.935)	Top-5 acc 56.641 (58.971)	lr 0.02470
Train [9][1260/3239]	Time 0.521 (0.857)	Data Time 0.001 (0.016)	Loss 3.8406 (3.7974)	Entropy 1.58191 (1.59331)	Top-1 acc 35.547 (34.944)	Top-5 acc 56.641 (58.978)	lr 0.02470
Train [9][1270/3239]	Time 0.537 (0.856)	Data Time 0.001 (0.015)	Loss 3.8540 (3.7973)	Entropy 1.58174 (1.59322)	Top-1 acc 34.375 (34.938)	Top-5 acc 56.250 (58.975)	lr 0.02470
Train [9][1280/3239]	Time 0.531 (0.856)	Data Time 0.001 (0.015)	Loss 3.6778 (3.7975)	Entropy 1.58163 (1.59314)	Top-1 acc 38.672 (34.931)	Top-5 acc 65.234 (58.980)	lr 0.02470
Train [9][1290/3239]	Time 0.700 (0.856)	Data Time 0.001 (0.015)	Loss 3.7194 (3.7971)	Entropy 1.58120 (1.59304)	Top-1 acc 37.109 (34.935)	Top-5 acc 60.156 (58.986)	lr 0.02470
Train [9][1300/3239]	Time 0.572 (0.856)	Data Time 0.001 (0.015)	Loss 3.6874 (3.7974)	Entropy 1.58127 (1.59295)	Top-1 acc 32.812 (34.925)	Top-5 acc 63.672 (58.986)	lr 0.02470
Train [9][1310/3239]	Time 0.579 (0.855)	Data Time 0.001 (0.015)	Loss 3.7269 (3.7973)	Entropy 1.58094 (1.59286)	Top-1 acc 37.500 (34.925)	Top-5 acc 58.594 (58.982)	lr 0.02470
Train [9][1320/3239]	Time 0.601 (0.855)	Data Time 0.001 (0.015)	Loss 3.6538 (3.7969)	Entropy 1.58069 (1.59277)	Top-1 acc 40.234 (34.935)	Top-5 acc 60.547 (58.989)	lr 0.02470
Train [9][1330/3239]	Time 0.544 (0.855)	Data Time 0.001 (0.015)	Loss 3.7724 (3.7968)	Entropy 1.58036 (1.59268)	Top-1 acc 35.156 (34.934)	Top-5 acc 59.766 (58.994)	lr 0.02470
Train [9][1340/3239]	Time 0.545 (0.854)	Data Time 0.001 (0.015)	Loss 3.7151 (3.7966)	Entropy 1.58015 (1.59259)	Top-1 acc 37.891 (34.937)	Top-5 acc 55.859 (58.995)	lr 0.02470
Train [9][1350/3239]	Time 0.595 (0.854)	Data Time 0.001 (0.015)	Loss 3.8454 (3.7969)	Entropy 1.57966 (1.59250)	Top-1 acc 33.203 (34.928)	Top-5 acc 58.984 (58.993)	lr 0.02470
Train [9][1360/3239]	Time 0.670 (0.853)	Data Time 0.001 (0.015)	Loss 3.8151 (3.7967)	Entropy 1.57973 (1.59240)	Top-1 acc 37.109 (34.935)	Top-5 acc 58.203 (58.998)	lr 0.02470
Train [9][1370/3239]	Time 0.486 (0.853)	Data Time 0.001 (0.014)	Loss 3.8988 (3.7967)	Entropy 1.57933 (1.59231)	Top-1 acc 34.375 (34.948)	Top-5 acc 54.297 (58.993)	lr 0.02470
Train [9][1380/3239]	Time 0.613 (0.853)	Data Time 0.002 (0.014)	Loss 3.9644 (3.7968)	Entropy 1.57922 (1.59221)	Top-1 acc 31.250 (34.947)	Top-5 acc 55.469 (58.985)	lr 0.02470
Train [9][1390/3239]	Time 0.570 (0.852)	Data Time 0.001 (0.014)	Loss 3.7315 (3.7966)	Entropy 1.57871 (1.59212)	Top-1 acc 37.500 (34.957)	Top-5 acc 60.156 (58.987)	lr 0.02470
Train [9][1400/3239]	Time 0.579 (0.852)	Data Time 0.001 (0.014)	Loss 3.8789 (3.7967)	Entropy 1.57835 (1.59202)	Top-1 acc 33.984 (34.956)	Top-5 acc 55.469 (58.980)	lr 0.02470
Train [9][1410/3239]	Time 0.582 (0.852)	Data Time 0.002 (0.014)	Loss 3.6089 (3.7968)	Entropy 1.57821 (1.59193)	Top-1 acc 41.797 (34.960)	Top-5 acc 62.891 (58.975)	lr 0.02470
Train [9][1420/3239]	Time 0.571 (0.852)	Data Time 0.001 (0.014)	Loss 3.8064 (3.7973)	Entropy 1.57805 (1.59183)	Top-1 acc 34.766 (34.947)	Top-5 acc 56.641 (58.965)	lr 0.02470
Train [9][1430/3239]	Time 0.526 (0.852)	Data Time 0.002 (0.014)	Loss 3.7663 (3.7971)	Entropy 1.57756 (1.59173)	Top-1 acc 40.625 (34.947)	Top-5 acc 58.203 (58.970)	lr 0.02470
Train [9][1440/3239]	Time 0.569 (0.851)	Data Time 0.001 (0.014)	Loss 3.8039 (3.7973)	Entropy 1.57718 (1.59163)	Top-1 acc 33.594 (34.935)	Top-5 acc 58.984 (58.973)	lr 0.02470
Train [9][1450/3239]	Time 0.545 (0.851)	Data Time 0.001 (0.014)	Loss 3.6893 (3.7969)	Entropy 1.57717 (1.59153)	Top-1 acc 38.281 (34.949)	Top-5 acc 60.156 (58.983)	lr 0.02470
Train [9][1460/3239]	Time 0.564 (0.851)	Data Time 0.001 (0.014)	Loss 3.9870 (3.7974)	Entropy 1.57723 (1.59144)	Top-1 acc 29.297 (34.937)	Top-5 acc 56.250 (58.970)	lr 0.02470
Train [9][1470/3239]	Time 0.609 (0.851)	Data Time 0.001 (0.014)	Loss 3.7920 (3.7978)	Entropy 1.57696 (1.59134)	Top-1 acc 34.766 (34.924)	Top-5 acc 59.766 (58.955)	lr 0.02470
Train [9][1480/3239]	Time 0.675 (0.851)	Data Time 0.001 (0.014)	Loss 3.9259 (3.7978)	Entropy 1.57679 (1.59124)	Top-1 acc 33.203 (34.924)	Top-5 acc 57.812 (58.957)	lr 0.02469
Train [9][1490/3239]	Time 0.603 (0.851)	Data Time 0.001 (0.013)	Loss 3.9189 (3.7978)	Entropy 1.57652 (1.59114)	Top-1 acc 31.250 (34.918)	Top-5 acc 55.078 (58.957)	lr 0.02469
Train [9][1500/3239]	Time 0.502 (0.850)	Data Time 0.002 (0.013)	Loss 3.7799 (3.7985)	Entropy 1.57663 (1.59105)	Top-1 acc 36.719 (34.903)	Top-5 acc 62.109 (58.947)	lr 0.02469
Train [9][1510/3239]	Time 0.612 (0.850)	Data Time 0.001 (0.013)	Loss 3.7121 (3.7989)	Entropy 1.57627 (1.59095)	Top-1 acc 33.594 (34.892)	Top-5 acc 60.938 (58.946)	lr 0.02469
Train [9][1520/3239]	Time 0.590 (0.850)	Data Time 0.001 (0.013)	Loss 4.0189 (3.7988)	Entropy 1.57616 (1.59085)	Top-1 acc 28.516 (34.893)	Top-5 acc 53.125 (58.943)	lr 0.02469
Train [9][1530/3239]	Time 0.424 (0.850)	Data Time 0.001 (0.013)	Loss 3.8018 (3.7989)	Entropy 1.57590 (1.59076)	Top-1 acc 35.938 (34.891)	Top-5 acc 60.156 (58.948)	lr 0.02469
Train [9][1540/3239]	Time 0.583 (0.849)	Data Time 0.001 (0.013)	Loss 3.9646 (3.7986)	Entropy 1.57560 (1.59066)	Top-1 acc 28.906 (34.892)	Top-5 acc 57.812 (58.963)	lr 0.02469
Train [9][1550/3239]	Time 0.614 (0.849)	Data Time 0.001 (0.013)	Loss 3.9413 (3.7985)	Entropy 1.57553 (1.59056)	Top-1 acc 33.984 (34.893)	Top-5 acc 53.516 (58.962)	lr 0.02469
Train [9][1560/3239]	Time 0.804 (0.860)	Data Time 0.007 (0.013)	Loss 3.8945 (3.7985)	Entropy 1.57564 (1.59047)	Top-1 acc 34.375 (34.900)	Top-5 acc 57.031 (58.970)	lr 0.02469
Train [9][1570/3239]	Time 0.681 (0.860)	Data Time 0.002 (0.013)	Loss 3.7897 (3.7982)	Entropy 1.57543 (1.59037)	Top-1 acc 31.641 (34.902)	Top-5 acc 57.422 (58.972)	lr 0.02469
Train [9][1580/3239]	Time 0.610 (0.860)	Data Time 0.001 (0.013)	Loss 3.7653 (3.7982)	Entropy 1.57496 (1.59028)	Top-1 acc 33.594 (34.897)	Top-5 acc 59.375 (58.969)	lr 0.02469
Train [9][1590/3239]	Time 0.542 (0.860)	Data Time 0.001 (0.013)	Loss 3.8607 (3.7982)	Entropy 1.57463 (1.59018)	Top-1 acc 35.547 (34.894)	Top-5 acc 57.422 (58.964)	lr 0.02469
Train [9][1600/3239]	Time 0.564 (0.860)	Data Time 0.002 (0.013)	Loss 3.7170 (3.7984)	Entropy 1.57444 (1.59008)	Top-1 acc 38.672 (34.891)	Top-5 acc 59.766 (58.959)	lr 0.02469
Train [9][1610/3239]	Time 0.577 (0.859)	Data Time 0.001 (0.013)	Loss 3.9220 (3.7987)	Entropy 1.57416 (1.58998)	Top-1 acc 33.594 (34.882)	Top-5 acc 55.859 (58.962)	lr 0.02469
Train [9][1620/3239]	Time 0.586 (0.859)	Data Time 0.001 (0.013)	Loss 3.7846 (3.7983)	Entropy 1.57402 (1.58989)	Top-1 acc 34.375 (34.884)	Top-5 acc 65.234 (58.983)	lr 0.02469
Train [9][1630/3239]	Time 0.556 (0.859)	Data Time 0.002 (0.013)	Loss 3.6454 (3.7982)	Entropy 1.57376 (1.58979)	Top-1 acc 37.891 (34.881)	Top-5 acc 66.016 (58.983)	lr 0.02469
Train [9][1640/3239]	Time 0.558 (0.859)	Data Time 0.001 (0.012)	Loss 3.7820 (3.7983)	Entropy 1.57347 (1.58969)	Top-1 acc 36.328 (34.874)	Top-5 acc 57.812 (58.979)	lr 0.02469
Train [9][1650/3239]	Time 0.547 (0.859)	Data Time 0.001 (0.012)	Loss 3.7417 (3.7984)	Entropy 1.57318 (1.58959)	Top-1 acc 32.812 (34.871)	Top-5 acc 62.500 (58.978)	lr 0.02469
Train [9][1660/3239]	Time 0.529 (0.858)	Data Time 0.001 (0.012)	Loss 3.7306 (3.7983)	Entropy 1.57310 (1.58949)	Top-1 acc 36.719 (34.872)	Top-5 acc 58.594 (58.977)	lr 0.02469
Train [9][1670/3239]	Time 0.537 (0.858)	Data Time 0.001 (0.012)	Loss 3.9757 (3.7984)	Entropy 1.57328 (1.58939)	Top-1 acc 29.688 (34.873)	Top-5 acc 54.688 (58.976)	lr 0.02469
Train [9][1680/3239]	Time 0.418 (0.857)	Data Time 0.001 (0.012)	Loss 3.8504 (3.7987)	Entropy 1.57298 (1.58930)	Top-1 acc 35.938 (34.865)	Top-5 acc 58.203 (58.964)	lr 0.02469
Train [9][1690/3239]	Time 0.722 (0.857)	Data Time 0.001 (0.012)	Loss 3.7705 (3.7991)	Entropy 1.57279 (1.58920)	Top-1 acc 36.328 (34.859)	Top-5 acc 62.109 (58.959)	lr 0.02469
Train [9][1700/3239]	Time 0.523 (0.857)	Data Time 0.002 (0.012)	Loss 3.6971 (3.7988)	Entropy 1.57298 (1.58910)	Top-1 acc 31.250 (34.860)	Top-5 acc 61.719 (58.965)	lr 0.02469
Train [9][1710/3239]	Time 0.511 (0.857)	Data Time 0.001 (0.012)	Loss 3.8538 (3.7988)	Entropy 1.57318 (1.58901)	Top-1 acc 35.938 (34.860)	Top-5 acc 56.250 (58.967)	lr 0.02469
Train [9][1720/3239]	Time 0.554 (0.857)	Data Time 0.001 (0.012)	Loss 3.6145 (3.7991)	Entropy 1.57303 (1.58892)	Top-1 acc 43.359 (34.858)	Top-5 acc 64.844 (58.965)	lr 0.02469
Train [9][1730/3239]	Time 0.562 (0.856)	Data Time 0.001 (0.012)	Loss 3.8953 (3.7991)	Entropy 1.57282 (1.58883)	Top-1 acc 31.250 (34.855)	Top-5 acc 57.422 (58.967)	lr 0.02469
Train [9][1740/3239]	Time 0.608 (0.856)	Data Time 0.001 (0.012)	Loss 3.7338 (3.7992)	Entropy 1.57249 (1.58873)	Top-1 acc 38.281 (34.852)	Top-5 acc 60.156 (58.966)	lr 0.02469
Train [9][1750/3239]	Time 0.554 (0.856)	Data Time 0.002 (0.012)	Loss 3.8996 (3.7991)	Entropy 1.57248 (1.58864)	Top-1 acc 28.125 (34.844)	Top-5 acc 58.594 (58.967)	lr 0.02469
Train [9][1760/3239]	Time 0.688 (0.856)	Data Time 0.001 (0.012)	Loss 3.8392 (3.7986)	Entropy 1.57195 (1.58855)	Top-1 acc 35.938 (34.852)	Top-5 acc 57.031 (58.982)	lr 0.02469
Train [9][1770/3239]	Time 0.561 (0.856)	Data Time 0.001 (0.012)	Loss 3.9660 (3.7990)	Entropy 1.57207 (1.58845)	Top-1 acc 31.641 (34.848)	Top-5 acc 56.250 (58.973)	lr 0.02469
Train [9][1780/3239]	Time 0.606 (0.856)	Data Time 0.001 (0.012)	Loss 3.8703 (3.7990)	Entropy 1.57190 (1.58836)	Top-1 acc 28.125 (34.848)	Top-5 acc 51.562 (58.966)	lr 0.02469
Train [9][1790/3239]	Time 0.553 (0.855)	Data Time 0.001 (0.012)	Loss 3.6933 (3.7989)	Entropy 1.57151 (1.58827)	Top-1 acc 35.156 (34.853)	Top-5 acc 62.500 (58.970)	lr 0.02469
Train [9][1800/3239]	Time 0.568 (0.855)	Data Time 0.001 (0.012)	Loss 3.6692 (3.7989)	Entropy 1.57119 (1.58818)	Top-1 acc 39.062 (34.856)	Top-5 acc 62.500 (58.969)	lr 0.02469
Train [9][1810/3239]	Time 0.561 (0.855)	Data Time 0.001 (0.011)	Loss 3.6591 (3.7988)	Entropy 1.57083 (1.58808)	Top-1 acc 37.891 (34.853)	Top-5 acc 62.500 (58.973)	lr 0.02469
Train [9][1820/3239]	Time 0.446 (0.855)	Data Time 0.001 (0.011)	Loss 3.6490 (3.7985)	Entropy 1.57048 (1.58799)	Top-1 acc 39.062 (34.861)	Top-5 acc 60.547 (58.979)	lr 0.02469
Train [9][1830/3239]	Time 0.692 (0.855)	Data Time 0.001 (0.011)	Loss 4.0897 (3.7986)	Entropy 1.57055 (1.58789)	Top-1 acc 24.609 (34.852)	Top-5 acc 53.516 (58.976)	lr 0.02469
Train [9][1840/3239]	Time 0.601 (0.854)	Data Time 0.001 (0.011)	Loss 3.7887 (3.7986)	Entropy 1.57015 (1.58780)	Top-1 acc 34.766 (34.850)	Top-5 acc 61.328 (58.973)	lr 0.02469
Train [9][1850/3239]	Time 0.621 (0.854)	Data Time 0.001 (0.011)	Loss 3.8365 (3.7985)	Entropy 1.56989 (1.58770)	Top-1 acc 32.422 (34.855)	Top-5 acc 57.031 (58.977)	lr 0.02469
Train [9][1860/3239]	Time 0.583 (0.853)	Data Time 0.001 (0.011)	Loss 3.8827 (3.7986)	Entropy 1.56991 (1.58760)	Top-1 acc 33.203 (34.854)	Top-5 acc 58.984 (58.973)	lr 0.02469
Train [9][1870/3239]	Time 0.539 (0.853)	Data Time 0.001 (0.011)	Loss 3.9548 (3.7989)	Entropy 1.56961 (1.58751)	Top-1 acc 30.469 (34.845)	Top-5 acc 55.859 (58.967)	lr 0.02469
Train [9][1880/3239]	Time 0.564 (0.853)	Data Time 0.001 (0.011)	Loss 3.7029 (3.7990)	Entropy 1.56967 (1.58741)	Top-1 acc 38.672 (34.850)	Top-5 acc 61.328 (58.963)	lr 0.02469
Train [9][1890/3239]	Time 0.530 (0.853)	Data Time 0.001 (0.011)	Loss 3.6911 (3.7989)	Entropy 1.56960 (1.58732)	Top-1 acc 41.016 (34.852)	Top-5 acc 64.453 (58.972)	lr 0.02469
Train [9][1900/3239]	Time 0.576 (0.853)	Data Time 0.001 (0.011)	Loss 3.7670 (3.7987)	Entropy 1.56939 (1.58723)	Top-1 acc 38.281 (34.853)	Top-5 acc 60.547 (58.976)	lr 0.02469
Train [9][1910/3239]	Time 0.564 (0.853)	Data Time 0.001 (0.011)	Loss 3.8570 (3.7988)	Entropy 1.56931 (1.58713)	Top-1 acc 35.156 (34.856)	Top-5 acc 55.859 (58.972)	lr 0.02469
Train [9][1920/3239]	Time 0.606 (0.852)	Data Time 0.001 (0.011)	Loss 3.7270 (3.7987)	Entropy 1.56910 (1.58704)	Top-1 acc 37.891 (34.858)	Top-5 acc 60.156 (58.969)	lr 0.02469
Train [9][1930/3239]	Time 0.564 (0.852)	Data Time 0.001 (0.011)	Loss 3.8500 (3.7987)	Entropy 1.56863 (1.58695)	Top-1 acc 37.109 (34.857)	Top-5 acc 57.422 (58.972)	lr 0.02468
Train [9][1940/3239]	Time 0.598 (0.852)	Data Time 0.001 (0.011)	Loss 3.5454 (3.7979)	Entropy 1.56834 (1.58685)	Top-1 acc 41.016 (34.872)	Top-5 acc 65.234 (58.988)	lr 0.02468
Train [9][1950/3239]	Time 0.514 (0.852)	Data Time 0.001 (0.011)	Loss 3.6901 (3.7975)	Entropy 1.56818 (1.58676)	Top-1 acc 40.234 (34.878)	Top-5 acc 60.156 (58.993)	lr 0.02468
Train [9][1960/3239]	Time 0.569 (0.852)	Data Time 0.001 (0.011)	Loss 3.7293 (3.7973)	Entropy 1.56792 (1.58666)	Top-1 acc 37.109 (34.879)	Top-5 acc 57.812 (59.001)	lr 0.02468
Train [9][1970/3239]	Time 0.606 (0.852)	Data Time 0.001 (0.011)	Loss 3.9564 (3.7973)	Entropy 1.56768 (1.58657)	Top-1 acc 33.984 (34.882)	Top-5 acc 56.250 (59.002)	lr 0.02468
Train [9][1980/3239]	Time 0.576 (0.852)	Data Time 0.001 (0.011)	Loss 3.5119 (3.7971)	Entropy 1.56755 (1.58647)	Top-1 acc 40.234 (34.883)	Top-5 acc 65.625 (59.004)	lr 0.02468
Train [9][1990/3239]	Time 0.558 (0.851)	Data Time 0.001 (0.011)	Loss 3.6680 (3.7971)	Entropy 1.56732 (1.58638)	Top-1 acc 38.281 (34.886)	Top-5 acc 60.547 (59.003)	lr 0.02468
Train [9][2000/3239]	Time 0.585 (0.851)	Data Time 0.001 (0.011)	Loss 3.7207 (3.7970)	Entropy 1.56717 (1.58628)	Top-1 acc 39.844 (34.893)	Top-5 acc 58.984 (59.005)	lr 0.02468
Train [9][2010/3239]	Time 0.556 (0.851)	Data Time 0.001 (0.011)	Loss 3.7221 (3.7969)	Entropy 1.56712 (1.58619)	Top-1 acc 35.156 (34.895)	Top-5 acc 60.547 (59.009)	lr 0.02468
Train [9][2020/3239]	Time 0.538 (0.851)	Data Time 0.001 (0.011)	Loss 3.8731 (3.7973)	Entropy 1.56732 (1.58609)	Top-1 acc 33.594 (34.887)	Top-5 acc 56.250 (59.003)	lr 0.02468
Train [9][2030/3239]	Time 0.432 (0.851)	Data Time 0.001 (0.011)	Loss 3.8145 (3.7972)	Entropy 1.56722 (1.58600)	Top-1 acc 33.203 (34.888)	Top-5 acc 58.203 (59.005)	lr 0.02468
Train [9][2040/3239]	Time 0.598 (0.850)	Data Time 0.001 (0.010)	Loss 3.7314 (3.7971)	Entropy 1.56705 (1.58591)	Top-1 acc 37.891 (34.887)	Top-5 acc 62.500 (59.009)	lr 0.02468
Train [9][2050/3239]	Time 0.573 (0.850)	Data Time 0.001 (0.010)	Loss 3.6084 (3.7973)	Entropy 1.56697 (1.58581)	Top-1 acc 37.500 (34.885)	Top-5 acc 63.672 (59.005)	lr 0.02468
Train [9][2060/3239]	Time 0.672 (0.850)	Data Time 0.001 (0.010)	Loss 3.6568 (3.7972)	Entropy 1.56647 (1.58572)	Top-1 acc 32.812 (34.884)	Top-5 acc 62.500 (59.003)	lr 0.02468
Train [9][2070/3239]	Time 0.658 (0.850)	Data Time 0.001 (0.010)	Loss 3.6248 (3.7968)	Entropy 1.56613 (1.58563)	Top-1 acc 37.109 (34.891)	Top-5 acc 63.281 (59.015)	lr 0.02468
Train [9][2080/3239]	Time 0.584 (0.850)	Data Time 0.001 (0.010)	Loss 3.7933 (3.7969)	Entropy 1.56612 (1.58554)	Top-1 acc 35.547 (34.891)	Top-5 acc 60.938 (59.015)	lr 0.02468
Train [9][2090/3239]	Time 0.548 (0.850)	Data Time 0.001 (0.010)	Loss 3.5555 (3.7968)	Entropy 1.56589 (1.58544)	Top-1 acc 40.625 (34.888)	Top-5 acc 64.062 (59.016)	lr 0.02468
Train [9][2100/3239]	Time 0.557 (0.850)	Data Time 0.001 (0.010)	Loss 3.7540 (3.7967)	Entropy 1.56535 (1.58535)	Top-1 acc 37.500 (34.893)	Top-5 acc 61.719 (59.020)	lr 0.02468
Train [9][2110/3239]	Time 0.641 (0.850)	Data Time 0.001 (0.010)	Loss 3.9974 (3.7968)	Entropy 1.56537 (1.58525)	Top-1 acc 31.250 (34.893)	Top-5 acc 54.688 (59.021)	lr 0.02468
Train [9][2120/3239]	Time 0.602 (0.849)	Data Time 0.001 (0.010)	Loss 3.9333 (3.7969)	Entropy 1.56513 (1.58516)	Top-1 acc 28.516 (34.888)	Top-5 acc 54.297 (59.017)	lr 0.02468
Train [9][2130/3239]	Time 0.538 (0.849)	Data Time 0.001 (0.010)	Loss 3.7147 (3.7968)	Entropy 1.56472 (1.58506)	Top-1 acc 38.672 (34.892)	Top-5 acc 57.422 (59.015)	lr 0.02468
Train [9][2140/3239]	Time 0.623 (0.849)	Data Time 0.002 (0.010)	Loss 3.7689 (3.7969)	Entropy 1.56441 (1.58497)	Top-1 acc 37.109 (34.890)	Top-5 acc 60.547 (59.018)	lr 0.02468
Train [9][2150/3239]	Time 0.546 (0.849)	Data Time 0.001 (0.010)	Loss 3.7709 (3.7972)	Entropy 1.56405 (1.58487)	Top-1 acc 30.859 (34.883)	Top-5 acc 58.984 (59.015)	lr 0.02468
Train [9][2160/3239]	Time 0.456 (0.849)	Data Time 0.001 (0.010)	Loss 3.7669 (3.7973)	Entropy 1.56364 (1.58478)	Top-1 acc 38.672 (34.883)	Top-5 acc 55.469 (59.010)	lr 0.02468
Train [9][2170/3239]	Time 0.622 (0.849)	Data Time 0.001 (0.010)	Loss 3.7981 (3.7971)	Entropy 1.56374 (1.58468)	Top-1 acc 33.984 (34.888)	Top-5 acc 59.766 (59.011)	lr 0.02468
Train [9][2180/3239]	Time 0.614 (0.849)	Data Time 0.001 (0.010)	Loss 3.8658 (3.7970)	Entropy 1.56366 (1.58458)	Top-1 acc 32.812 (34.896)	Top-5 acc 55.859 (59.009)	lr 0.02468
Train [9][2190/3239]	Time 0.606 (0.848)	Data Time 0.001 (0.010)	Loss 3.6733 (3.7972)	Entropy 1.56336 (1.58449)	Top-1 acc 40.625 (34.900)	Top-5 acc 61.328 (59.002)	lr 0.02468
Train [9][2200/3239]	Time 0.615 (0.848)	Data Time 0.001 (0.010)	Loss 3.8003 (3.7976)	Entropy 1.56323 (1.58439)	Top-1 acc 32.812 (34.892)	Top-5 acc 57.422 (58.990)	lr 0.02468
Train [9][2210/3239]	Time 0.551 (0.848)	Data Time 0.001 (0.010)	Loss 3.7038 (3.7975)	Entropy 1.56318 (1.58429)	Top-1 acc 36.328 (34.895)	Top-5 acc 63.281 (58.997)	lr 0.02468
Train [9][2220/3239]	Time 0.567 (0.857)	Data Time 0.002 (0.010)	Loss 3.7513 (3.7972)	Entropy 1.56313 (1.58420)	Top-1 acc 41.406 (34.898)	Top-5 acc 59.766 (59.001)	lr 0.02468
Train [9][2230/3239]	Time 0.639 (0.857)	Data Time 0.002 (0.010)	Loss 3.8369 (3.7970)	Entropy 1.56272 (1.58410)	Top-1 acc 35.156 (34.903)	Top-5 acc 58.594 (59.005)	lr 0.02468
Train [9][2240/3239]	Time 0.573 (0.856)	Data Time 0.001 (0.010)	Loss 3.9504 (3.7972)	Entropy 1.56246 (1.58401)	Top-1 acc 34.375 (34.903)	Top-5 acc 56.641 (59.001)	lr 0.02468
Train [9][2250/3239]	Time 0.644 (0.856)	Data Time 0.001 (0.010)	Loss 4.0546 (3.7970)	Entropy 1.56228 (1.58391)	Top-1 acc 27.344 (34.907)	Top-5 acc 55.078 (59.002)	lr 0.02468
Train [9][2260/3239]	Time 0.595 (0.856)	Data Time 0.002 (0.010)	Loss 3.6225 (3.7971)	Entropy 1.56190 (1.58382)	Top-1 acc 38.672 (34.908)	Top-5 acc 62.109 (59.006)	lr 0.02468
Train [9][2270/3239]	Time 0.577 (0.856)	Data Time 0.001 (0.010)	Loss 3.9424 (3.7973)	Entropy 1.56168 (1.58372)	Top-1 acc 30.078 (34.908)	Top-5 acc 58.203 (59.001)	lr 0.02468
Train [9][2280/3239]	Time 0.579 (0.856)	Data Time 0.001 (0.010)	Loss 3.9343 (3.7973)	Entropy 1.56129 (1.58362)	Top-1 acc 33.594 (34.911)	Top-5 acc 53.516 (58.998)	lr 0.02468
Train [9][2290/3239]	Time 0.493 (0.856)	Data Time 0.002 (0.010)	Loss 4.1972 (3.7976)	Entropy 1.56105 (1.58352)	Top-1 acc 27.734 (34.909)	Top-5 acc 49.219 (58.989)	lr 0.02468
Train [9][2300/3239]	Time 0.565 (0.856)	Data Time 0.001 (0.010)	Loss 3.8552 (3.7977)	Entropy 1.56104 (1.58343)	Top-1 acc 32.812 (34.909)	Top-5 acc 58.594 (58.992)	lr 0.02468
Train [9][2310/3239]	Time 0.556 (0.856)	Data Time 0.001 (0.010)	Loss 3.8767 (3.7981)	Entropy 1.56072 (1.58333)	Top-1 acc 34.766 (34.904)	Top-5 acc 58.203 (58.981)	lr 0.02468
Train [9][2320/3239]	Time 0.600 (0.855)	Data Time 0.001 (0.010)	Loss 3.9420 (3.7982)	Entropy 1.56045 (1.58323)	Top-1 acc 30.859 (34.902)	Top-5 acc 54.297 (58.977)	lr 0.02468
Train [9][2330/3239]	Time 0.544 (0.855)	Data Time 0.001 (0.010)	Loss 3.7173 (3.7979)	Entropy 1.56026 (1.58313)	Top-1 acc 36.719 (34.910)	Top-5 acc 61.719 (58.987)	lr 0.02468
Train [9][2340/3239]	Time 0.445 (0.855)	Data Time 0.002 (0.009)	Loss 4.0339 (3.7980)	Entropy 1.55995 (1.58304)	Top-1 acc 32.422 (34.905)	Top-5 acc 54.297 (58.986)	lr 0.02468
Train [9][2350/3239]	Time 0.618 (0.855)	Data Time 0.001 (0.009)	Loss 3.7424 (3.7979)	Entropy 1.55977 (1.58294)	Top-1 acc 37.500 (34.905)	Top-5 acc 62.500 (58.987)	lr 0.02468
Train [9][2360/3239]	Time 0.592 (0.854)	Data Time 0.001 (0.009)	Loss 3.6506 (3.7981)	Entropy 1.55936 (1.58284)	Top-1 acc 37.500 (34.903)	Top-5 acc 63.281 (58.988)	lr 0.02468
Train [9][2370/3239]	Time 0.668 (0.854)	Data Time 0.001 (0.009)	Loss 3.6851 (3.7982)	Entropy 1.55904 (1.58274)	Top-1 acc 39.062 (34.899)	Top-5 acc 60.547 (58.980)	lr 0.02467
Train [9][2380/3239]	Time 0.539 (0.854)	Data Time 0.001 (0.009)	Loss 3.8000 (3.7983)	Entropy 1.55925 (1.58264)	Top-1 acc 32.031 (34.895)	Top-5 acc 59.766 (58.980)	lr 0.02467
Train [9][2390/3239]	Time 0.598 (0.854)	Data Time 0.001 (0.009)	Loss 3.7547 (3.7982)	Entropy 1.55913 (1.58254)	Top-1 acc 34.375 (34.892)	Top-5 acc 60.156 (58.983)	lr 0.02467
Train [9][2400/3239]	Time 0.570 (0.854)	Data Time 0.001 (0.009)	Loss 3.7351 (3.7984)	Entropy 1.55878 (1.58244)	Top-1 acc 37.109 (34.891)	Top-5 acc 60.547 (58.979)	lr 0.02467
Train [9][2410/3239]	Time 0.597 (0.854)	Data Time 0.001 (0.009)	Loss 3.7904 (3.7980)	Entropy 1.55830 (1.58235)	Top-1 acc 32.812 (34.902)	Top-5 acc 61.328 (58.987)	lr 0.02467
Train [9][2420/3239]	Time 0.577 (0.854)	Data Time 0.001 (0.009)	Loss 3.7981 (3.7978)	Entropy 1.55810 (1.58225)	Top-1 acc 37.109 (34.907)	Top-5 acc 58.594 (58.988)	lr 0.02467
Train [9][2430/3239]	Time 0.586 (0.854)	Data Time 0.002 (0.009)	Loss 3.8845 (3.7977)	Entropy 1.55809 (1.58215)	Top-1 acc 35.156 (34.912)	Top-5 acc 53.906 (58.989)	lr 0.02467
Train [9][2440/3239]	Time 0.619 (0.854)	Data Time 0.001 (0.009)	Loss 3.9380 (3.7980)	Entropy 1.55817 (1.58205)	Top-1 acc 31.641 (34.911)	Top-5 acc 58.594 (58.985)	lr 0.02467
Train [9][2450/3239]	Time 0.601 (0.854)	Data Time 0.001 (0.009)	Loss 3.8433 (3.7979)	Entropy 1.55829 (1.58195)	Top-1 acc 35.156 (34.911)	Top-5 acc 58.984 (58.990)	lr 0.02467
Train [9][2460/3239]	Time 0.615 (0.854)	Data Time 0.001 (0.009)	Loss 3.8005 (3.7976)	Entropy 1.55842 (1.58185)	Top-1 acc 35.156 (34.911)	Top-5 acc 57.031 (58.998)	lr 0.02467
Train [9][2470/3239]	Time 0.593 (0.853)	Data Time 0.002 (0.009)	Loss 3.9788 (3.7977)	Entropy 1.55831 (1.58176)	Top-1 acc 31.641 (34.905)	Top-5 acc 55.469 (58.995)	lr 0.02467
Train [9][2480/3239]	Time 0.628 (0.853)	Data Time 0.001 (0.009)	Loss 3.7299 (3.7977)	Entropy 1.55804 (1.58166)	Top-1 acc 33.203 (34.904)	Top-5 acc 58.984 (58.994)	lr 0.02467
Train [9][2490/3239]	Time 0.546 (0.853)	Data Time 0.001 (0.009)	Loss 3.9183 (3.7978)	Entropy 1.55794 (1.58157)	Top-1 acc 30.469 (34.903)	Top-5 acc 57.031 (58.997)	lr 0.02467
Train [9][2500/3239]	Time 0.502 (0.853)	Data Time 0.001 (0.009)	Loss 3.8867 (3.7978)	Entropy 1.55761 (1.58147)	Top-1 acc 32.031 (34.904)	Top-5 acc 57.422 (58.995)	lr 0.02467
Train [9][2510/3239]	Time 0.568 (0.853)	Data Time 0.001 (0.009)	Loss 3.8196 (3.7981)	Entropy 1.55782 (1.58138)	Top-1 acc 33.203 (34.900)	Top-5 acc 58.984 (58.988)	lr 0.02467
Train [9][2520/3239]	Time 0.582 (0.853)	Data Time 0.001 (0.009)	Loss 3.7872 (3.7981)	Entropy 1.55762 (1.58129)	Top-1 acc 32.031 (34.900)	Top-5 acc 62.500 (58.988)	lr 0.02467
Train [9][2530/3239]	Time 0.616 (0.852)	Data Time 0.001 (0.009)	Loss 3.7556 (3.7982)	Entropy 1.55740 (1.58119)	Top-1 acc 35.938 (34.897)	Top-5 acc 60.156 (58.989)	lr 0.02467
Train [9][2540/3239]	Time 0.586 (0.852)	Data Time 0.001 (0.009)	Loss 3.6634 (3.7981)	Entropy 1.55749 (1.58110)	Top-1 acc 35.938 (34.899)	Top-5 acc 59.766 (58.993)	lr 0.02467
Train [9][2550/3239]	Time 0.578 (0.852)	Data Time 0.001 (0.009)	Loss 3.7310 (3.7979)	Entropy 1.55759 (1.58101)	Top-1 acc 38.672 (34.903)	Top-5 acc 61.328 (58.995)	lr 0.02467
Train [9][2560/3239]	Time 0.533 (0.852)	Data Time 0.001 (0.009)	Loss 3.8559 (3.7977)	Entropy 1.55735 (1.58091)	Top-1 acc 33.203 (34.909)	Top-5 acc 57.422 (59.002)	lr 0.02467
Train [9][2570/3239]	Time 0.597 (0.852)	Data Time 0.001 (0.009)	Loss 3.6250 (3.7975)	Entropy 1.55733 (1.58082)	Top-1 acc 36.719 (34.912)	Top-5 acc 61.328 (59.005)	lr 0.02467
Train [9][2580/3239]	Time 0.572 (0.852)	Data Time 0.001 (0.009)	Loss 3.7404 (3.7973)	Entropy 1.55698 (1.58073)	Top-1 acc 35.938 (34.915)	Top-5 acc 64.453 (59.009)	lr 0.02467
Train [9][2590/3239]	Time 0.566 (0.852)	Data Time 0.002 (0.009)	Loss 3.7237 (3.7973)	Entropy 1.55693 (1.58064)	Top-1 acc 34.766 (34.911)	Top-5 acc 58.203 (59.008)	lr 0.02467
Train [9][2600/3239]	Time 0.584 (0.852)	Data Time 0.001 (0.009)	Loss 3.7542 (3.7973)	Entropy 1.55668 (1.58055)	Top-1 acc 35.156 (34.916)	Top-5 acc 59.375 (59.009)	lr 0.02467
Train [9][2610/3239]	Time 0.507 (0.852)	Data Time 0.002 (0.009)	Loss 3.9769 (3.7972)	Entropy 1.55629 (1.58046)	Top-1 acc 32.031 (34.918)	Top-5 acc 52.734 (59.013)	lr 0.02467
Train [9][2620/3239]	Time 0.578 (0.852)	Data Time 0.002 (0.009)	Loss 3.7990 (3.7971)	Entropy 1.55621 (1.58036)	Top-1 acc 35.156 (34.921)	Top-5 acc 56.250 (59.013)	lr 0.02467
Train [9][2630/3239]	Time 0.706 (0.852)	Data Time 0.001 (0.009)	Loss 3.8193 (3.7971)	Entropy 1.55572 (1.58027)	Top-1 acc 35.156 (34.917)	Top-5 acc 58.594 (59.012)	lr 0.02467
Train [9][2640/3239]	Time 0.532 (0.851)	Data Time 0.001 (0.009)	Loss 3.7540 (3.7971)	Entropy 1.55531 (1.58018)	Top-1 acc 37.891 (34.924)	Top-5 acc 58.203 (59.012)	lr 0.02467
Train [9][2650/3239]	Time 0.586 (0.851)	Data Time 0.001 (0.009)	Loss 3.8106 (3.7970)	Entropy 1.55486 (1.58008)	Top-1 acc 33.594 (34.922)	Top-5 acc 58.203 (59.013)	lr 0.02467
Train [9][2660/3239]	Time 0.576 (0.851)	Data Time 0.001 (0.009)	Loss 3.7927 (3.7970)	Entropy 1.55475 (1.57999)	Top-1 acc 35.156 (34.921)	Top-5 acc 58.203 (59.012)	lr 0.02467
Train [9][2670/3239]	Time 0.590 (0.851)	Data Time 0.001 (0.009)	Loss 3.8531 (3.7971)	Entropy 1.55504 (1.57989)	Top-1 acc 33.984 (34.923)	Top-5 acc 55.469 (59.012)	lr 0.02467
Train [9][2680/3239]	Time 0.551 (0.851)	Data Time 0.001 (0.009)	Loss 3.8286 (3.7973)	Entropy 1.55500 (1.57980)	Top-1 acc 31.641 (34.923)	Top-5 acc 57.812 (59.008)	lr 0.02467
Train [9][2690/3239]	Time 0.588 (0.851)	Data Time 0.001 (0.009)	Loss 3.7317 (3.7972)	Entropy 1.55493 (1.57971)	Top-1 acc 33.984 (34.926)	Top-5 acc 62.891 (59.013)	lr 0.02467
Train [9][2700/3239]	Time 0.645 (0.851)	Data Time 0.002 (0.008)	Loss 3.6675 (3.7970)	Entropy 1.55467 (1.57962)	Top-1 acc 35.938 (34.929)	Top-5 acc 60.547 (59.018)	lr 0.02467
Train [9][2710/3239]	Time 0.585 (0.850)	Data Time 0.001 (0.008)	Loss 3.8715 (3.7969)	Entropy 1.55460 (1.57952)	Top-1 acc 33.594 (34.932)	Top-5 acc 58.594 (59.014)	lr 0.02467
Train [9][2720/3239]	Time 0.562 (0.850)	Data Time 0.001 (0.008)	Loss 3.7785 (3.7968)	Entropy 1.55448 (1.57943)	Top-1 acc 37.891 (34.936)	Top-5 acc 59.375 (59.015)	lr 0.02467
Train [9][2730/3239]	Time 0.580 (0.850)	Data Time 0.001 (0.008)	Loss 3.9191 (3.7967)	Entropy 1.55443 (1.57934)	Top-1 acc 30.469 (34.940)	Top-5 acc 55.859 (59.017)	lr 0.02467
Train [9][2740/3239]	Time 0.603 (0.850)	Data Time 0.001 (0.008)	Loss 3.7672 (3.7966)	Entropy 1.55443 (1.57925)	Top-1 acc 35.938 (34.944)	Top-5 acc 56.250 (59.019)	lr 0.02467
Train [9][2750/3239]	Time 0.679 (0.850)	Data Time 0.001 (0.008)	Loss 3.9379 (3.7966)	Entropy 1.55447 (1.57916)	Top-1 acc 31.641 (34.941)	Top-5 acc 55.859 (59.016)	lr 0.02467
Train [9][2760/3239]	Time 0.554 (0.850)	Data Time 0.001 (0.008)	Loss 3.8228 (3.7966)	Entropy 1.55420 (1.57907)	Top-1 acc 32.422 (34.937)	Top-5 acc 58.203 (59.009)	lr 0.02467
Train [9][2770/3239]	Time 0.635 (0.850)	Data Time 0.002 (0.008)	Loss 3.8531 (3.7969)	Entropy 1.55386 (1.57898)	Top-1 acc 37.500 (34.940)	Top-5 acc 57.812 (59.007)	lr 0.02467
Train [9][2780/3239]	Time 0.615 (0.850)	Data Time 0.001 (0.008)	Loss 3.7324 (3.7968)	Entropy 1.55392 (1.57889)	Top-1 acc 34.375 (34.947)	Top-5 acc 61.328 (59.009)	lr 0.02467
Train [9][2790/3239]	Time 0.551 (0.850)	Data Time 0.001 (0.008)	Loss 3.7636 (3.7969)	Entropy 1.55402 (1.57880)	Top-1 acc 39.062 (34.945)	Top-5 acc 64.062 (59.007)	lr 0.02467
Train [9][2800/3239]	Time 0.562 (0.850)	Data Time 0.001 (0.008)	Loss 3.7174 (3.7970)	Entropy 1.55402 (1.57871)	Top-1 acc 37.500 (34.946)	Top-5 acc 58.203 (59.004)	lr 0.02466
Train [9][2810/3239]	Time 0.586 (0.850)	Data Time 0.001 (0.008)	Loss 3.6262 (3.7970)	Entropy 1.55381 (1.57862)	Top-1 acc 37.109 (34.944)	Top-5 acc 62.109 (59.000)	lr 0.02466
Train [9][2820/3239]	Time 0.545 (0.850)	Data Time 0.001 (0.008)	Loss 3.8432 (3.7969)	Entropy 1.55337 (1.57854)	Top-1 acc 34.375 (34.947)	Top-5 acc 57.422 (58.999)	lr 0.02466
Train [9][2830/3239]	Time 0.557 (0.849)	Data Time 0.001 (0.008)	Loss 3.8476 (3.7969)	Entropy 1.55303 (1.57845)	Top-1 acc 32.422 (34.948)	Top-5 acc 57.812 (58.999)	lr 0.02466
Train [9][2840/3239]	Time 0.583 (0.849)	Data Time 0.001 (0.008)	Loss 3.7583 (3.7969)	Entropy 1.55301 (1.57836)	Top-1 acc 38.672 (34.948)	Top-5 acc 59.375 (58.999)	lr 0.02466
Train [9][2850/3239]	Time 0.563 (0.849)	Data Time 0.001 (0.008)	Loss 4.0063 (3.7968)	Entropy 1.55295 (1.57827)	Top-1 acc 31.250 (34.950)	Top-5 acc 55.859 (59.003)	lr 0.02466
Train [9][2860/3239]	Time 0.437 (0.849)	Data Time 0.001 (0.008)	Loss 3.9119 (3.7968)	Entropy 1.55269 (1.57818)	Top-1 acc 33.984 (34.953)	Top-5 acc 57.812 (59.001)	lr 0.02466
Train [9][2870/3239]	Time 0.756 (0.855)	Data Time 0.052 (0.008)	Loss 3.6259 (3.7966)	Entropy 1.55241 (1.57809)	Top-1 acc 36.719 (34.956)	Top-5 acc 61.719 (59.003)	lr 0.02466
Train [9][2880/3239]	Time 0.594 (0.855)	Data Time 0.002 (0.008)	Loss 3.8976 (3.7966)	Entropy 1.55214 (1.57800)	Top-1 acc 31.250 (34.959)	Top-5 acc 53.125 (59.003)	lr 0.02466
Train [9][2890/3239]	Time 0.529 (0.855)	Data Time 0.002 (0.008)	Loss 3.7166 (3.7966)	Entropy 1.55206 (1.57791)	Top-1 acc 35.156 (34.962)	Top-5 acc 60.547 (59.005)	lr 0.02466
Train [9][2900/3239]	Time 0.516 (0.855)	Data Time 0.001 (0.008)	Loss 3.7991 (3.7965)	Entropy 1.55178 (1.57782)	Top-1 acc 35.938 (34.959)	Top-5 acc 61.328 (59.007)	lr 0.02466
Train [9][2910/3239]	Time 0.542 (0.855)	Data Time 0.001 (0.008)	Loss 3.8358 (3.7966)	Entropy 1.55155 (1.57773)	Top-1 acc 32.031 (34.957)	Top-5 acc 58.594 (59.007)	lr 0.02466
Train [9][2920/3239]	Time 0.597 (0.855)	Data Time 0.001 (0.008)	Loss 3.7472 (3.7964)	Entropy 1.55100 (1.57764)	Top-1 acc 33.203 (34.960)	Top-5 acc 61.719 (59.010)	lr 0.02466
Train [9][2930/3239]	Time 0.534 (0.855)	Data Time 0.001 (0.008)	Loss 3.8389 (3.7963)	Entropy 1.55081 (1.57755)	Top-1 acc 32.031 (34.965)	Top-5 acc 60.547 (59.012)	lr 0.02466
Train [9][2940/3239]	Time 0.527 (0.855)	Data Time 0.001 (0.008)	Loss 3.8640 (3.7964)	Entropy 1.55063 (1.57746)	Top-1 acc 33.203 (34.965)	Top-5 acc 58.594 (59.012)	lr 0.02466
Train [9][2950/3239]	Time 0.549 (0.854)	Data Time 0.001 (0.008)	Loss 3.7308 (3.7965)	Entropy 1.55035 (1.57737)	Top-1 acc 34.766 (34.964)	Top-5 acc 60.156 (59.008)	lr 0.02466
Train [9][2960/3239]	Time 0.599 (0.854)	Data Time 0.001 (0.008)	Loss 3.8166 (3.7964)	Entropy 1.55020 (1.57728)	Top-1 acc 31.641 (34.963)	Top-5 acc 57.031 (59.013)	lr 0.02466
Train [9][2970/3239]	Time 0.535 (0.854)	Data Time 0.001 (0.008)	Loss 3.7690 (3.7964)	Entropy 1.55010 (1.57719)	Top-1 acc 35.156 (34.966)	Top-5 acc 61.719 (59.016)	lr 0.02466
Train [9][2980/3239]	Time 0.659 (0.854)	Data Time 0.001 (0.008)	Loss 3.8028 (3.7963)	Entropy 1.54993 (1.57710)	Top-1 acc 33.984 (34.965)	Top-5 acc 56.641 (59.017)	lr 0.02466
Train [9][2990/3239]	Time 0.531 (0.854)	Data Time 0.001 (0.008)	Loss 3.7109 (3.7962)	Entropy 1.54966 (1.57700)	Top-1 acc 36.328 (34.971)	Top-5 acc 59.766 (59.021)	lr 0.02466
Train [9][3000/3239]	Time 0.583 (0.854)	Data Time 0.001 (0.008)	Loss 3.6520 (3.7961)	Entropy 1.54963 (1.57691)	Top-1 acc 37.891 (34.972)	Top-5 acc 60.938 (59.022)	lr 0.02466
Train [9][3010/3239]	Time 0.567 (0.853)	Data Time 0.001 (0.008)	Loss 3.8025 (3.7958)	Entropy 1.54927 (1.57682)	Top-1 acc 36.719 (34.978)	Top-5 acc 57.031 (59.026)	lr 0.02466
Train [9][3020/3239]	Time 0.619 (0.853)	Data Time 0.001 (0.008)	Loss 3.7926 (3.7958)	Entropy 1.54925 (1.57673)	Top-1 acc 33.203 (34.979)	Top-5 acc 59.766 (59.027)	lr 0.02466
Train [9][3030/3239]	Time 0.641 (0.853)	Data Time 0.001 (0.008)	Loss 3.8021 (3.7955)	Entropy 1.54911 (1.57664)	Top-1 acc 36.719 (34.989)	Top-5 acc 58.203 (59.028)	lr 0.02466
Train [9][3040/3239]	Time 0.557 (0.853)	Data Time 0.001 (0.008)	Loss 3.7579 (3.7954)	Entropy 1.54900 (1.57655)	Top-1 acc 36.719 (34.991)	Top-5 acc 63.281 (59.031)	lr 0.02466
Train [9][3050/3239]	Time 0.585 (0.853)	Data Time 0.001 (0.008)	Loss 3.5481 (3.7953)	Entropy 1.54897 (1.57646)	Top-1 acc 41.016 (34.994)	Top-5 acc 67.578 (59.034)	lr 0.02466
Train [9][3060/3239]	Time 0.606 (0.853)	Data Time 0.001 (0.008)	Loss 3.6236 (3.7954)	Entropy 1.54887 (1.57637)	Top-1 acc 41.016 (34.993)	Top-5 acc 62.891 (59.032)	lr 0.02466
Train [9][3070/3239]	Time 0.492 (0.853)	Data Time 0.001 (0.008)	Loss 3.7262 (3.7953)	Entropy 1.54883 (1.57628)	Top-1 acc 37.109 (34.994)	Top-5 acc 58.984 (59.034)	lr 0.02466
Train [9][3080/3239]	Time 0.595 (0.853)	Data Time 0.001 (0.008)	Loss 3.7222 (3.7953)	Entropy 1.54877 (1.57619)	Top-1 acc 42.188 (34.996)	Top-5 acc 61.328 (59.035)	lr 0.02466
Train [9][3090/3239]	Time 0.575 (0.853)	Data Time 0.001 (0.008)	Loss 3.8239 (3.7952)	Entropy 1.54863 (1.57610)	Top-1 acc 30.078 (34.995)	Top-5 acc 60.547 (59.037)	lr 0.02466
Train [9][3100/3239]	Time 0.537 (0.853)	Data Time 0.001 (0.008)	Loss 3.7928 (3.7953)	Entropy 1.54853 (1.57601)	Top-1 acc 35.547 (34.994)	Top-5 acc 60.156 (59.036)	lr 0.02466
Train [9][3110/3239]	Time 0.606 (0.853)	Data Time 0.001 (0.008)	Loss 3.7202 (3.7951)	Entropy 1.54846 (1.57592)	Top-1 acc 37.109 (34.999)	Top-5 acc 59.375 (59.041)	lr 0.02466
Train [9][3120/3239]	Time 0.681 (0.852)	Data Time 0.001 (0.008)	Loss 3.6275 (3.7952)	Entropy 1.54839 (1.57584)	Top-1 acc 35.547 (34.998)	Top-5 acc 62.891 (59.036)	lr 0.02466
Train [9][3130/3239]	Time 0.590 (0.852)	Data Time 0.001 (0.008)	Loss 3.9712 (3.7953)	Entropy 1.54834 (1.57575)	Top-1 acc 31.641 (34.993)	Top-5 acc 51.953 (59.034)	lr 0.02466
Train [9][3140/3239]	Time 0.599 (0.852)	Data Time 0.001 (0.008)	Loss 3.9590 (3.7952)	Entropy 1.54805 (1.57566)	Top-1 acc 31.641 (34.994)	Top-5 acc 54.297 (59.033)	lr 0.02466
Train [9][3150/3239]	Time 0.518 (0.852)	Data Time 0.001 (0.008)	Loss 3.6340 (3.7950)	Entropy 1.54759 (1.57557)	Top-1 acc 39.844 (35.001)	Top-5 acc 59.375 (59.035)	lr 0.02466
Train [9][3160/3239]	Time 0.551 (0.852)	Data Time 0.001 (0.008)	Loss 3.7410 (3.7951)	Entropy 1.54747 (1.57548)	Top-1 acc 35.156 (34.998)	Top-5 acc 59.375 (59.034)	lr 0.02466
Train [9][3170/3239]	Time 0.460 (0.852)	Data Time 0.001 (0.008)	Loss 3.9574 (3.7951)	Entropy 1.54729 (1.57540)	Top-1 acc 33.594 (34.999)	Top-5 acc 59.375 (59.033)	lr 0.02466
Train [9][3180/3239]	Time 0.531 (0.852)	Data Time 0.000 (0.008)	Loss 3.6359 (3.7951)	Entropy 1.54743 (1.57531)	Top-1 acc 37.891 (34.999)	Top-5 acc 61.719 (59.033)	lr 0.02466
Train [9][3190/3239]	Time 0.568 (0.851)	Data Time 0.000 (0.008)	Loss 3.9279 (3.7950)	Entropy 1.54712 (1.57522)	Top-1 acc 32.422 (35.001)	Top-5 acc 57.031 (59.038)	lr 0.02466
Train [9][3200/3239]	Time 0.508 (0.851)	Data Time 0.000 (0.008)	Loss 3.9950 (3.7951)	Entropy 1.54683 (1.57513)	Top-1 acc 32.031 (34.999)	Top-5 acc 52.734 (59.035)	lr 0.02466
Train [9][3210/3239]	Time 0.541 (0.851)	Data Time 0.000 (0.007)	Loss 3.8122 (3.7951)	Entropy 1.54675 (1.57504)	Top-1 acc 37.109 (35.000)	Top-5 acc 57.812 (59.035)	lr 0.02466
Train [9][3220/3239]	Time 0.614 (0.851)	Data Time 0.000 (0.007)	Loss 3.8828 (3.7950)	Entropy 1.54653 (1.57496)	Top-1 acc 30.078 (35.000)	Top-5 acc 55.859 (59.038)	lr 0.02466
Train [9][3230/3239]	Time 0.581 (0.851)	Data Time 0.000 (0.007)	Loss 3.7767 (3.7948)	Entropy 1.54621 (1.57487)	Top-1 acc 33.203 (35.005)	Top-5 acc 58.984 (59.039)	lr 0.02465
Train [9][3239/3239]	Time 1.435 (0.851)	Data Time 0.000 (0.007)	Loss 4.5052 (3.7947)	Entropy 1.54602 (1.57479)	Top-1 acc 23.457 (35.008)	Top-5 acc 40.741 (59.042)	lr 0.02465
==========Valid [9/120]	loss 2.594	top-1 acc 44.442 (44.442)	top-5 acc 69.125	Train top-1 35.008	top-5 59.042	Entropy 1.54602	Latency-None: 0.000ms	Flops: 542.77M
Train [10][0/3239]	Time 20.445 (20.445)	Data Time 18.104 (18.104)	Loss 3.5064 (3.5064)	Entropy 1.54585 (1.54585)	Top-1 acc 39.062 (39.062)	Top-5 acc 64.062 (64.062)	lr 0.02465
Train [10][10/3239]	Time 0.582 (2.668)	Data Time 0.001 (1.650)	Loss 3.7914 (3.6792)	Entropy 1.54547 (1.54575)	Top-1 acc 33.984 (36.683)	Top-5 acc 60.938 (61.435)	lr 0.02465
Train [10][20/3239]	Time 0.558 (1.783)	Data Time 0.001 (0.865)	Loss 3.9174 (3.7215)	Entropy 1.54548 (1.54564)	Top-1 acc 34.766 (35.677)	Top-5 acc 55.078 (60.640)	lr 0.02465
Train [10][30/3239]	Time 0.585 (1.477)	Data Time 0.001 (0.587)	Loss 3.9860 (3.7339)	Entropy 1.54510 (1.54553)	Top-1 acc 32.812 (35.673)	Top-5 acc 54.688 (60.471)	lr 0.02465
Train [10][40/3239]	Time 0.589 (1.318)	Data Time 0.001 (0.445)	Loss 3.6753 (3.7470)	Entropy 1.54502 (1.54541)	Top-1 acc 35.156 (35.575)	Top-5 acc 63.281 (60.280)	lr 0.02465
Train [10][50/3239]	Time 0.572 (1.224)	Data Time 0.001 (0.358)	Loss 3.8253 (3.7525)	Entropy 1.54466 (1.54531)	Top-1 acc 37.891 (35.524)	Top-5 acc 59.375 (60.302)	lr 0.02465
Train [10][60/3239]	Time 0.560 (1.160)	Data Time 0.001 (0.299)	Loss 3.6037 (3.7440)	Entropy 1.54458 (1.54520)	Top-1 acc 34.375 (35.713)	Top-5 acc 61.719 (60.368)	lr 0.02465
Train [10][70/3239]	Time 0.538 (1.114)	Data Time 0.002 (0.258)	Loss 3.7497 (3.7434)	Entropy 1.54471 (1.54512)	Top-1 acc 33.203 (35.613)	Top-5 acc 62.891 (60.321)	lr 0.02465
Train [10][80/3239]	Time 0.545 (1.079)	Data Time 0.001 (0.226)	Loss 3.7744 (3.7385)	Entropy 1.54466 (1.54507)	Top-1 acc 32.812 (35.812)	Top-5 acc 58.594 (60.450)	lr 0.02465
Train [10][90/3239]	Time 0.610 (1.051)	Data Time 0.001 (0.201)	Loss 3.7403 (3.7372)	Entropy 1.54445 (1.54502)	Top-1 acc 36.719 (35.955)	Top-5 acc 58.203 (60.405)	lr 0.02465
Train [10][100/3239]	Time 0.559 (1.030)	Data Time 0.001 (0.182)	Loss 3.9418 (3.7380)	Entropy 1.54455 (1.54497)	Top-1 acc 32.812 (35.814)	Top-5 acc 55.469 (60.299)	lr 0.02465
Train [10][110/3239]	Time 0.532 (1.012)	Data Time 0.001 (0.166)	Loss 3.7112 (3.7411)	Entropy 1.54474 (1.54494)	Top-1 acc 37.891 (35.814)	Top-5 acc 60.156 (60.167)	lr 0.02465
Train [10][120/3239]	Time 0.609 (0.998)	Data Time 0.001 (0.152)	Loss 3.9078 (3.7427)	Entropy 1.54426 (1.54491)	Top-1 acc 35.547 (35.763)	Top-5 acc 56.641 (60.121)	lr 0.02465
Train [10][130/3239]	Time 0.457 (0.983)	Data Time 0.002 (0.141)	Loss 3.7100 (3.7456)	Entropy 1.54412 (1.54486)	Top-1 acc 37.891 (35.660)	Top-5 acc 58.203 (60.031)	lr 0.02465
Train [10][140/3239]	Time 0.645 (0.974)	Data Time 0.001 (0.131)	Loss 3.9652 (3.7436)	Entropy 1.54386 (1.54480)	Top-1 acc 31.250 (35.677)	Top-5 acc 54.297 (60.070)	lr 0.02465
Train [10][150/3239]	Time 0.527 (0.961)	Data Time 0.001 (0.122)	Loss 3.7791 (3.7423)	Entropy 1.54359 (1.54473)	Top-1 acc 33.984 (35.694)	Top-5 acc 59.766 (60.130)	lr 0.02465
Train [10][160/3239]	Time 0.583 (0.949)	Data Time 0.001 (0.115)	Loss 3.7741 (3.7429)	Entropy 1.54342 (1.54466)	Top-1 acc 32.812 (35.656)	Top-5 acc 61.719 (60.120)	lr 0.02465
Train [10][170/3239]	Time 0.552 (0.942)	Data Time 0.001 (0.108)	Loss 3.8309 (3.7446)	Entropy 1.54327 (1.54458)	Top-1 acc 33.203 (35.588)	Top-5 acc 55.469 (60.021)	lr 0.02465
Train [10][180/3239]	Time 0.589 (0.935)	Data Time 0.001 (0.103)	Loss 3.8537 (3.7440)	Entropy 1.54340 (1.54451)	Top-1 acc 30.859 (35.620)	Top-5 acc 58.594 (60.018)	lr 0.02465
Train [10][190/3239]	Time 0.577 (0.930)	Data Time 0.001 (0.097)	Loss 3.8741 (3.7426)	Entropy 1.54318 (1.54445)	Top-1 acc 33.984 (35.668)	Top-5 acc 53.516 (60.054)	lr 0.02465
Train [10][200/3239]	Time 0.613 (0.924)	Data Time 0.001 (0.093)	Loss 3.8090 (3.7409)	Entropy 1.54301 (1.54439)	Top-1 acc 32.812 (35.765)	Top-5 acc 60.547 (60.131)	lr 0.02465
Train [10][210/3239]	Time 0.640 (0.918)	Data Time 0.001 (0.088)	Loss 3.5561 (3.7446)	Entropy 1.54269 (1.54432)	Top-1 acc 41.016 (35.747)	Top-5 acc 61.328 (60.062)	lr 0.02465
Train [10][220/3239]	Time 0.538 (0.915)	Data Time 0.001 (0.084)	Loss 3.7338 (3.7476)	Entropy 1.54256 (1.54424)	Top-1 acc 32.031 (35.727)	Top-5 acc 60.938 (59.990)	lr 0.02465
Train [10][230/3239]	Time 0.588 (0.911)	Data Time 0.001 (0.081)	Loss 3.6304 (3.7491)	Entropy 1.54250 (1.54417)	Top-1 acc 35.938 (35.719)	Top-5 acc 62.109 (59.943)	lr 0.02465
Train [10][240/3239]	Time 0.496 (0.908)	Data Time 0.001 (0.078)	Loss 3.7458 (3.7485)	Entropy 1.54239 (1.54410)	Top-1 acc 34.375 (35.737)	Top-5 acc 60.156 (59.978)	lr 0.02465
Train [10][250/3239]	Time 0.607 (0.904)	Data Time 0.001 (0.075)	Loss 3.6294 (3.7462)	Entropy 1.54205 (1.54403)	Top-1 acc 38.281 (35.787)	Top-5 acc 65.625 (60.066)	lr 0.02465
Train [10][260/3239]	Time 0.570 (0.902)	Data Time 0.001 (0.072)	Loss 3.9067 (3.7478)	Entropy 1.54209 (1.54395)	Top-1 acc 30.469 (35.789)	Top-5 acc 56.250 (60.028)	lr 0.02465
Train [10][270/3239]	Time 0.575 (0.899)	Data Time 0.002 (0.069)	Loss 3.6535 (3.7459)	Entropy 1.54174 (1.54388)	Top-1 acc 41.016 (35.809)	Top-5 acc 62.109 (60.050)	lr 0.02465
Train [10][280/3239]	Time 0.605 (0.895)	Data Time 0.001 (0.067)	Loss 3.6845 (3.7456)	Entropy 1.54154 (1.54380)	Top-1 acc 37.891 (35.821)	Top-5 acc 61.328 (60.044)	lr 0.02465
Train [10][290/3239]	Time 0.579 (0.957)	Data Time 0.002 (0.065)	Loss 3.6543 (3.7460)	Entropy 1.54150 (1.54372)	Top-1 acc 35.938 (35.783)	Top-5 acc 62.891 (60.050)	lr 0.02465
Train [10][300/3239]	Time 0.607 (0.951)	Data Time 0.002 (0.063)	Loss 3.9991 (3.7489)	Entropy 1.54131 (1.54364)	Top-1 acc 30.859 (35.778)	Top-5 acc 56.250 (59.976)	lr 0.02465
Train [10][310/3239]	Time 0.598 (0.948)	Data Time 0.001 (0.061)	Loss 3.6897 (3.7495)	Entropy 1.54122 (1.54357)	Top-1 acc 34.766 (35.729)	Top-5 acc 64.062 (59.958)	lr 0.02465
Train [10][320/3239]	Time 0.588 (0.944)	Data Time 0.001 (0.059)	Loss 3.7149 (3.7494)	Entropy 1.54081 (1.54349)	Top-1 acc 41.797 (35.749)	Top-5 acc 62.500 (59.965)	lr 0.02465
Train [10][330/3239]	Time 0.407 (0.940)	Data Time 0.001 (0.057)	Loss 3.7522 (3.7509)	Entropy 1.54038 (1.54340)	Top-1 acc 34.766 (35.705)	Top-5 acc 60.547 (59.938)	lr 0.02465
Train [10][340/3239]	Time 0.568 (0.937)	Data Time 0.001 (0.056)	Loss 3.7924 (3.7522)	Entropy 1.54023 (1.54331)	Top-1 acc 31.641 (35.660)	Top-5 acc 61.719 (59.899)	lr 0.02465
Train [10][350/3239]	Time 0.553 (0.934)	Data Time 0.001 (0.054)	Loss 3.6064 (3.7525)	Entropy 1.54010 (1.54322)	Top-1 acc 39.844 (35.682)	Top-5 acc 61.719 (59.872)	lr 0.02465
Train [10][360/3239]	Time 0.577 (0.931)	Data Time 0.001 (0.053)	Loss 3.5683 (3.7516)	Entropy 1.54022 (1.54314)	Top-1 acc 37.500 (35.680)	Top-5 acc 64.062 (59.898)	lr 0.02465
Train [10][370/3239]	Time 0.606 (0.928)	Data Time 0.002 (0.052)	Loss 3.6136 (3.7520)	Entropy 1.53992 (1.54306)	Top-1 acc 41.406 (35.671)	Top-5 acc 65.625 (59.909)	lr 0.02465
Train [10][380/3239]	Time 0.603 (0.925)	Data Time 0.001 (0.050)	Loss 3.7708 (3.7524)	Entropy 1.53964 (1.54298)	Top-1 acc 35.547 (35.662)	Top-5 acc 59.766 (59.895)	lr 0.02465
Train [10][390/3239]	Time 0.535 (0.923)	Data Time 0.001 (0.049)	Loss 3.9077 (3.7531)	Entropy 1.53944 (1.54289)	Top-1 acc 31.641 (35.655)	Top-5 acc 54.297 (59.884)	lr 0.02465
Train [10][400/3239]	Time 0.641 (0.920)	Data Time 0.001 (0.048)	Loss 3.9632 (3.7522)	Entropy 1.53909 (1.54280)	Top-1 acc 32.422 (35.655)	Top-5 acc 55.469 (59.892)	lr 0.02465
Train [10][410/3239]	Time 0.554 (0.918)	Data Time 0.001 (0.047)	Loss 3.7923 (3.7532)	Entropy 1.53929 (1.54271)	Top-1 acc 32.812 (35.624)	Top-5 acc 60.938 (59.881)	lr 0.02464
Train [10][420/3239]	Time 0.607 (0.915)	Data Time 0.001 (0.046)	Loss 3.6204 (3.7527)	Entropy 1.53900 (1.54262)	Top-1 acc 33.594 (35.618)	Top-5 acc 62.109 (59.905)	lr 0.02464
Train [10][430/3239]	Time 0.543 (0.913)	Data Time 0.001 (0.045)	Loss 3.7667 (3.7540)	Entropy 1.53882 (1.54254)	Top-1 acc 34.375 (35.587)	Top-5 acc 61.328 (59.869)	lr 0.02464
Train [10][440/3239]	Time 0.566 (0.911)	Data Time 0.001 (0.044)	Loss 3.8001 (3.7535)	Entropy 1.53857 (1.54245)	Top-1 acc 32.422 (35.599)	Top-5 acc 59.375 (59.878)	lr 0.02464
Train [10][450/3239]	Time 0.565 (0.909)	Data Time 0.001 (0.043)	Loss 3.7900 (3.7533)	Entropy 1.53829 (1.54237)	Top-1 acc 33.594 (35.592)	Top-5 acc 60.156 (59.895)	lr 0.02464
Train [10][460/3239]	Time 0.595 (0.906)	Data Time 0.001 (0.042)	Loss 3.8211 (3.7526)	Entropy 1.53803 (1.54227)	Top-1 acc 34.766 (35.628)	Top-5 acc 61.328 (59.935)	lr 0.02464
Train [10][470/3239]	Time 0.555 (0.904)	Data Time 0.003 (0.041)	Loss 3.6819 (3.7528)	Entropy 1.53803 (1.54219)	Top-1 acc 38.672 (35.635)	Top-5 acc 64.844 (59.951)	lr 0.02464
Train [10][480/3239]	Time 0.572 (0.902)	Data Time 0.001 (0.040)	Loss 3.8494 (3.7527)	Entropy 1.53786 (1.54210)	Top-1 acc 35.938 (35.644)	Top-5 acc 60.156 (59.934)	lr 0.02464
Train [10][490/3239]	Time 0.572 (0.901)	Data Time 0.001 (0.040)	Loss 3.5238 (3.7538)	Entropy 1.53756 (1.54201)	Top-1 acc 41.797 (35.623)	Top-5 acc 64.453 (59.908)	lr 0.02464
Train [10][500/3239]	Time 0.622 (0.899)	Data Time 0.001 (0.039)	Loss 3.8922 (3.7540)	Entropy 1.53757 (1.54192)	Top-1 acc 33.984 (35.634)	Top-5 acc 56.250 (59.916)	lr 0.02464
Train [10][510/3239]	Time 0.582 (0.897)	Data Time 0.001 (0.038)	Loss 3.7267 (3.7540)	Entropy 1.53752 (1.54184)	Top-1 acc 36.719 (35.640)	Top-5 acc 59.375 (59.911)	lr 0.02464
Train [10][520/3239]	Time 0.583 (0.896)	Data Time 0.001 (0.038)	Loss 3.7547 (3.7542)	Entropy 1.53748 (1.54175)	Top-1 acc 35.938 (35.646)	Top-5 acc 61.719 (59.898)	lr 0.02464
Train [10][530/3239]	Time 0.581 (0.895)	Data Time 0.002 (0.037)	Loss 3.6160 (3.7542)	Entropy 1.53728 (1.54167)	Top-1 acc 38.281 (35.645)	Top-5 acc 64.453 (59.893)	lr 0.02464
Train [10][540/3239]	Time 0.541 (0.893)	Data Time 0.001 (0.036)	Loss 3.6902 (3.7532)	Entropy 1.53743 (1.54159)	Top-1 acc 33.984 (35.686)	Top-5 acc 61.328 (59.914)	lr 0.02464
Train [10][550/3239]	Time 0.604 (0.892)	Data Time 0.001 (0.036)	Loss 3.6488 (3.7534)	Entropy 1.53733 (1.54152)	Top-1 acc 37.500 (35.691)	Top-5 acc 61.328 (59.897)	lr 0.02464
Train [10][560/3239]	Time 0.574 (0.891)	Data Time 0.001 (0.035)	Loss 3.6576 (3.7535)	Entropy 1.53687 (1.54144)	Top-1 acc 40.234 (35.692)	Top-5 acc 64.062 (59.914)	lr 0.02464
Train [10][570/3239]	Time 0.597 (0.890)	Data Time 0.001 (0.034)	Loss 3.8020 (3.7540)	Entropy 1.53695 (1.54136)	Top-1 acc 34.375 (35.683)	Top-5 acc 59.375 (59.904)	lr 0.02464
Train [10][580/3239]	Time 0.526 (0.888)	Data Time 0.001 (0.034)	Loss 3.8565 (3.7535)	Entropy 1.53709 (1.54128)	Top-1 acc 33.203 (35.685)	Top-5 acc 56.250 (59.920)	lr 0.02464
Train [10][590/3239]	Time 0.526 (0.887)	Data Time 0.001 (0.033)	Loss 3.8768 (3.7535)	Entropy 1.53668 (1.54121)	Top-1 acc 33.203 (35.691)	Top-5 acc 59.375 (59.920)	lr 0.02464
Train [10][600/3239]	Time 0.581 (0.886)	Data Time 0.001 (0.033)	Loss 4.0114 (3.7549)	Entropy 1.53618 (1.54113)	Top-1 acc 32.422 (35.665)	Top-5 acc 53.516 (59.902)	lr 0.02464
Train [10][610/3239]	Time 0.634 (0.885)	Data Time 0.001 (0.032)	Loss 3.8341 (3.7555)	Entropy 1.53598 (1.54105)	Top-1 acc 34.375 (35.656)	Top-5 acc 56.641 (59.886)	lr 0.02464
Train [10][620/3239]	Time 0.573 (0.884)	Data Time 0.020 (0.032)	Loss 3.7023 (3.7552)	Entropy 1.53598 (1.54097)	Top-1 acc 34.766 (35.671)	Top-5 acc 60.156 (59.898)	lr 0.02464
Train [10][630/3239]	Time 0.626 (0.883)	Data Time 0.001 (0.031)	Loss 3.8379 (3.7549)	Entropy 1.53619 (1.54089)	Top-1 acc 31.641 (35.662)	Top-5 acc 55.469 (59.902)	lr 0.02464
Train [10][640/3239]	Time 0.569 (0.881)	Data Time 0.001 (0.031)	Loss 3.7110 (3.7548)	Entropy 1.53607 (1.54082)	Top-1 acc 39.453 (35.681)	Top-5 acc 58.594 (59.900)	lr 0.02464
Train [10][650/3239]	Time 0.547 (0.880)	Data Time 0.001 (0.030)	Loss 3.8174 (3.7551)	Entropy 1.53581 (1.54074)	Top-1 acc 34.766 (35.663)	Top-5 acc 57.812 (59.896)	lr 0.02464
Train [10][660/3239]	Time 0.544 (0.879)	Data Time 0.001 (0.030)	Loss 3.6236 (3.7549)	Entropy 1.53555 (1.54067)	Top-1 acc 37.891 (35.664)	Top-5 acc 62.109 (59.913)	lr 0.02464
Train [10][670/3239]	Time 0.583 (0.878)	Data Time 0.001 (0.030)	Loss 3.5188 (3.7546)	Entropy 1.53538 (1.54059)	Top-1 acc 37.891 (35.676)	Top-5 acc 66.406 (59.925)	lr 0.02464
Train [10][680/3239]	Time 0.614 (0.878)	Data Time 0.001 (0.029)	Loss 3.8314 (3.7553)	Entropy 1.53495 (1.54051)	Top-1 acc 34.766 (35.682)	Top-5 acc 57.812 (59.904)	lr 0.02464
Train [10][690/3239]	Time 0.572 (0.876)	Data Time 0.001 (0.029)	Loss 3.5285 (3.7557)	Entropy 1.53448 (1.54043)	Top-1 acc 42.578 (35.685)	Top-5 acc 65.234 (59.887)	lr 0.02464
Train [10][700/3239]	Time 0.594 (0.876)	Data Time 0.001 (0.028)	Loss 3.6458 (3.7552)	Entropy 1.53409 (1.54035)	Top-1 acc 37.891 (35.697)	Top-5 acc 62.500 (59.890)	lr 0.02464
Train [10][710/3239]	Time 0.529 (0.875)	Data Time 0.001 (0.028)	Loss 3.8294 (3.7557)	Entropy 1.53398 (1.54026)	Top-1 acc 35.156 (35.691)	Top-5 acc 58.594 (59.876)	lr 0.02464
Train [10][720/3239]	Time 0.554 (0.874)	Data Time 0.001 (0.028)	Loss 3.8534 (3.7556)	Entropy 1.53391 (1.54017)	Top-1 acc 34.766 (35.695)	Top-5 acc 62.109 (59.884)	lr 0.02464
Train [10][730/3239]	Time 0.499 (0.873)	Data Time 0.001 (0.027)	Loss 3.8136 (3.7553)	Entropy 1.53368 (1.54008)	Top-1 acc 34.766 (35.701)	Top-5 acc 56.641 (59.880)	lr 0.02464
Train [10][740/3239]	Time 0.553 (0.873)	Data Time 0.002 (0.027)	Loss 3.7544 (3.7551)	Entropy 1.53341 (1.53999)	Top-1 acc 37.109 (35.708)	Top-5 acc 62.109 (59.883)	lr 0.02464
Train [10][750/3239]	Time 0.658 (0.872)	Data Time 0.001 (0.027)	Loss 3.7050 (3.7551)	Entropy 1.53308 (1.53991)	Top-1 acc 38.672 (35.719)	Top-5 acc 60.547 (59.893)	lr 0.02464
Train [10][760/3239]	Time 0.560 (0.872)	Data Time 0.002 (0.026)	Loss 3.9566 (3.7559)	Entropy 1.53276 (1.53981)	Top-1 acc 33.203 (35.700)	Top-5 acc 53.516 (59.865)	lr 0.02464
Train [10][770/3239]	Time 0.549 (0.871)	Data Time 0.001 (0.026)	Loss 3.6829 (3.7564)	Entropy 1.53270 (1.53972)	Top-1 acc 37.891 (35.702)	Top-5 acc 60.547 (59.861)	lr 0.02464
Train [10][780/3239]	Time 0.589 (0.871)	Data Time 0.001 (0.026)	Loss 3.7853 (3.7564)	Entropy 1.53222 (1.53963)	Top-1 acc 35.547 (35.686)	Top-5 acc 58.203 (59.850)	lr 0.02464
Train [10][790/3239]	Time 0.621 (0.870)	Data Time 0.001 (0.025)	Loss 3.7400 (3.7554)	Entropy 1.53211 (1.53953)	Top-1 acc 38.281 (35.706)	Top-5 acc 58.594 (59.873)	lr 0.02464
Train [10][800/3239]	Time 0.519 (0.869)	Data Time 0.001 (0.025)	Loss 3.9634 (3.7558)	Entropy 1.53174 (1.53944)	Top-1 acc 32.031 (35.702)	Top-5 acc 56.250 (59.871)	lr 0.02464
Train [10][810/3239]	Time 0.550 (0.868)	Data Time 0.001 (0.025)	Loss 3.9644 (3.7562)	Entropy 1.53165 (1.53935)	Top-1 acc 33.203 (35.693)	Top-5 acc 53.906 (59.860)	lr 0.02464
Train [10][820/3239]	Time 0.451 (0.868)	Data Time 0.001 (0.025)	Loss 3.6481 (3.7560)	Entropy 1.53154 (1.53925)	Top-1 acc 39.453 (35.689)	Top-5 acc 59.375 (59.856)	lr 0.02464
Train [10][830/3239]	Time 0.603 (0.867)	Data Time 0.001 (0.024)	Loss 3.7804 (3.7562)	Entropy 1.53164 (1.53916)	Top-1 acc 34.375 (35.682)	Top-5 acc 60.938 (59.855)	lr 0.02463
Train [10][840/3239]	Time 0.519 (0.866)	Data Time 0.001 (0.024)	Loss 3.9009 (3.7566)	Entropy 1.53130 (1.53907)	Top-1 acc 30.859 (35.668)	Top-5 acc 53.516 (59.835)	lr 0.02463
Train [10][850/3239]	Time 0.559 (0.866)	Data Time 0.001 (0.024)	Loss 3.7961 (3.7566)	Entropy 1.53100 (1.53898)	Top-1 acc 36.328 (35.672)	Top-5 acc 58.984 (59.832)	lr 0.02463
Train [10][860/3239]	Time 0.612 (0.865)	Data Time 0.001 (0.024)	Loss 3.8417 (3.7566)	Entropy 1.53088 (1.53888)	Top-1 acc 36.328 (35.674)	Top-5 acc 57.031 (59.838)	lr 0.02463
Train [10][870/3239]	Time 0.697 (0.865)	Data Time 0.002 (0.023)	Loss 3.9422 (3.7566)	Entropy 1.53081 (1.53879)	Top-1 acc 36.328 (35.691)	Top-5 acc 58.203 (59.852)	lr 0.02463
Train [10][880/3239]	Time 0.586 (0.864)	Data Time 0.001 (0.023)	Loss 3.7805 (3.7556)	Entropy 1.53061 (1.53870)	Top-1 acc 34.375 (35.722)	Top-5 acc 58.594 (59.877)	lr 0.02463
Train [10][890/3239]	Time 0.578 (0.864)	Data Time 0.001 (0.023)	Loss 4.0093 (3.7562)	Entropy 1.53055 (1.53861)	Top-1 acc 27.344 (35.723)	Top-5 acc 56.250 (59.868)	lr 0.02463
Train [10][900/3239]	Time 0.586 (0.863)	Data Time 0.001 (0.023)	Loss 3.6568 (3.7556)	Entropy 1.53048 (1.53852)	Top-1 acc 34.766 (35.723)	Top-5 acc 60.547 (59.885)	lr 0.02463
Train [10][910/3239]	Time 0.581 (0.863)	Data Time 0.002 (0.022)	Loss 3.5563 (3.7553)	Entropy 1.53049 (1.53843)	Top-1 acc 44.531 (35.739)	Top-5 acc 64.844 (59.891)	lr 0.02463
Train [10][920/3239]	Time 0.583 (0.863)	Data Time 0.002 (0.022)	Loss 3.8005 (3.7554)	Entropy 1.53025 (1.53834)	Top-1 acc 33.984 (35.737)	Top-5 acc 58.984 (59.879)	lr 0.02463
Train [10][930/3239]	Time 0.570 (0.862)	Data Time 0.001 (0.022)	Loss 3.5868 (3.7551)	Entropy 1.52997 (1.53826)	Top-1 acc 41.016 (35.748)	Top-5 acc 63.672 (59.887)	lr 0.02463
Train [10][940/3239]	Time 0.504 (0.884)	Data Time 0.006 (0.022)	Loss 3.7629 (3.7553)	Entropy 1.52967 (1.53817)	Top-1 acc 36.328 (35.742)	Top-5 acc 60.156 (59.880)	lr 0.02463
Train [10][950/3239]	Time 0.594 (0.883)	Data Time 0.002 (0.022)	Loss 3.5578 (3.7548)	Entropy 1.52930 (1.53808)	Top-1 acc 41.016 (35.760)	Top-5 acc 60.547 (59.892)	lr 0.02463
Train [10][960/3239]	Time 0.567 (0.882)	Data Time 0.001 (0.021)	Loss 3.7563 (3.7553)	Entropy 1.52906 (1.53798)	Top-1 acc 35.547 (35.757)	Top-5 acc 57.812 (59.882)	lr 0.02463
Train [10][970/3239]	Time 0.486 (0.882)	Data Time 0.001 (0.021)	Loss 3.6000 (3.7553)	Entropy 1.52879 (1.53789)	Top-1 acc 38.672 (35.753)	Top-5 acc 60.938 (59.878)	lr 0.02463
Train [10][980/3239]	Time 0.550 (0.881)	Data Time 0.001 (0.021)	Loss 3.8309 (3.7556)	Entropy 1.52888 (1.53780)	Top-1 acc 34.766 (35.750)	Top-5 acc 60.156 (59.878)	lr 0.02463
Train [10][990/3239]	Time 0.556 (0.881)	Data Time 0.001 (0.021)	Loss 3.9016 (3.7559)	Entropy 1.52860 (1.53771)	Top-1 acc 32.422 (35.757)	Top-5 acc 58.984 (59.880)	lr 0.02463
Train [10][1000/3239]	Time 0.534 (0.880)	Data Time 0.001 (0.021)	Loss 3.8559 (3.7564)	Entropy 1.52813 (1.53761)	Top-1 acc 32.812 (35.744)	Top-5 acc 57.031 (59.862)	lr 0.02463
Train [10][1010/3239]	Time 0.670 (0.880)	Data Time 0.002 (0.020)	Loss 4.0213 (3.7566)	Entropy 1.52783 (1.53752)	Top-1 acc 32.812 (35.744)	Top-5 acc 53.125 (59.859)	lr 0.02463
Train [10][1020/3239]	Time 0.565 (0.879)	Data Time 0.001 (0.020)	Loss 3.7419 (3.7565)	Entropy 1.52742 (1.53742)	Top-1 acc 35.938 (35.744)	Top-5 acc 58.594 (59.856)	lr 0.02463
Train [10][1030/3239]	Time 0.625 (0.879)	Data Time 0.001 (0.020)	Loss 3.7786 (3.7567)	Entropy 1.52750 (1.53732)	Top-1 acc 34.766 (35.733)	Top-5 acc 57.812 (59.852)	lr 0.02463
Train [10][1040/3239]	Time 0.572 (0.878)	Data Time 0.001 (0.020)	Loss 3.7371 (3.7568)	Entropy 1.52741 (1.53723)	Top-1 acc 37.500 (35.743)	Top-5 acc 58.594 (59.843)	lr 0.02463
Train [10][1050/3239]	Time 0.618 (0.878)	Data Time 0.001 (0.020)	Loss 3.6886 (3.7563)	Entropy 1.52739 (1.53714)	Top-1 acc 34.766 (35.741)	Top-5 acc 60.547 (59.844)	lr 0.02463
Train [10][1060/3239]	Time 0.503 (0.877)	Data Time 0.001 (0.020)	Loss 3.9041 (3.7559)	Entropy 1.52717 (1.53704)	Top-1 acc 33.203 (35.747)	Top-5 acc 58.984 (59.856)	lr 0.02463
Train [10][1070/3239]	Time 0.551 (0.877)	Data Time 0.001 (0.019)	Loss 3.9580 (3.7558)	Entropy 1.52708 (1.53695)	Top-1 acc 31.641 (35.746)	Top-5 acc 55.469 (59.862)	lr 0.02463
Train [10][1080/3239]	Time 0.679 (0.877)	Data Time 0.001 (0.019)	Loss 3.7882 (3.7556)	Entropy 1.52715 (1.53686)	Top-1 acc 37.109 (35.751)	Top-5 acc 58.203 (59.860)	lr 0.02463
Train [10][1090/3239]	Time 0.583 (0.876)	Data Time 0.001 (0.019)	Loss 3.5050 (3.7550)	Entropy 1.52636 (1.53677)	Top-1 acc 41.016 (35.761)	Top-5 acc 62.891 (59.875)	lr 0.02463
Train [10][1100/3239]	Time 0.458 (0.875)	Data Time 0.001 (0.019)	Loss 3.6744 (3.7550)	Entropy 1.52638 (1.53667)	Top-1 acc 35.547 (35.766)	Top-5 acc 62.891 (59.882)	lr 0.02463
Train [10][1110/3239]	Time 0.582 (0.875)	Data Time 0.001 (0.019)	Loss 3.7800 (3.7549)	Entropy 1.52570 (1.53658)	Top-1 acc 37.109 (35.769)	Top-5 acc 55.078 (59.873)	lr 0.02463
Train [10][1120/3239]	Time 0.583 (0.874)	Data Time 0.001 (0.019)	Loss 3.7402 (3.7545)	Entropy 1.52550 (1.53648)	Top-1 acc 37.500 (35.779)	Top-5 acc 59.375 (59.878)	lr 0.02463
Train [10][1130/3239]	Time 0.615 (0.874)	Data Time 0.001 (0.019)	Loss 3.5414 (3.7547)	Entropy 1.52536 (1.53638)	Top-1 acc 40.625 (35.782)	Top-5 acc 62.500 (59.876)	lr 0.02463
Train [10][1140/3239]	Time 0.529 (0.873)	Data Time 0.001 (0.018)	Loss 3.8231 (3.7541)	Entropy 1.52561 (1.53629)	Top-1 acc 33.984 (35.794)	Top-5 acc 56.250 (59.893)	lr 0.02463
Train [10][1150/3239]	Time 0.594 (0.873)	Data Time 0.001 (0.018)	Loss 3.7581 (3.7538)	Entropy 1.52559 (1.53620)	Top-1 acc 35.547 (35.794)	Top-5 acc 58.203 (59.892)	lr 0.02463
Train [10][1160/3239]	Time 0.583 (0.872)	Data Time 0.001 (0.018)	Loss 3.6790 (3.7535)	Entropy 1.52535 (1.53610)	Top-1 acc 36.328 (35.803)	Top-5 acc 58.984 (59.887)	lr 0.02463
Train [10][1170/3239]	Time 0.567 (0.872)	Data Time 0.001 (0.018)	Loss 3.6706 (3.7536)	Entropy 1.52489 (1.53601)	Top-1 acc 35.547 (35.799)	Top-5 acc 64.062 (59.888)	lr 0.02463
Train [10][1180/3239]	Time 0.591 (0.872)	Data Time 0.029 (0.018)	Loss 3.6246 (3.7535)	Entropy 1.52451 (1.53591)	Top-1 acc 34.375 (35.805)	Top-5 acc 64.062 (59.894)	lr 0.02463
Train [10][1190/3239]	Time 0.656 (0.871)	Data Time 0.003 (0.018)	Loss 3.7119 (3.7532)	Entropy 1.52454 (1.53582)	Top-1 acc 34.766 (35.818)	Top-5 acc 61.328 (59.909)	lr 0.02463
Train [10][1200/3239]	Time 0.560 (0.871)	Data Time 0.001 (0.018)	Loss 3.7429 (3.7531)	Entropy 1.52453 (1.53572)	Top-1 acc 37.109 (35.820)	Top-5 acc 57.812 (59.913)	lr 0.02463
Train [10][1210/3239]	Time 0.587 (0.871)	Data Time 0.001 (0.018)	Loss 3.5904 (3.7526)	Entropy 1.52457 (1.53563)	Top-1 acc 37.891 (35.834)	Top-5 acc 64.453 (59.926)	lr 0.02463
Train [10][1220/3239]	Time 0.617 (0.871)	Data Time 0.001 (0.017)	Loss 3.9104 (3.7522)	Entropy 1.52454 (1.53554)	Top-1 acc 30.469 (35.842)	Top-5 acc 59.766 (59.936)	lr 0.02463
Train [10][1230/3239]	Time 0.552 (0.870)	Data Time 0.002 (0.017)	Loss 3.8262 (3.7526)	Entropy 1.52408 (1.53545)	Top-1 acc 35.547 (35.841)	Top-5 acc 55.078 (59.929)	lr 0.02463
Train [10][1240/3239]	Time 0.691 (0.870)	Data Time 0.001 (0.017)	Loss 3.4730 (3.7519)	Entropy 1.52397 (1.53536)	Top-1 acc 42.578 (35.851)	Top-5 acc 62.500 (59.939)	lr 0.02462
Train [10][1250/3239]	Time 0.553 (0.870)	Data Time 0.001 (0.017)	Loss 3.5829 (3.7516)	Entropy 1.52397 (1.53527)	Top-1 acc 41.797 (35.863)	Top-5 acc 62.109 (59.942)	lr 0.02462
Train [10][1260/3239]	Time 0.554 (0.869)	Data Time 0.001 (0.017)	Loss 3.8791 (3.7517)	Entropy 1.52409 (1.53518)	Top-1 acc 32.031 (35.857)	Top-5 acc 59.375 (59.946)	lr 0.02462
Train [10][1270/3239]	Time 0.547 (0.869)	Data Time 0.001 (0.017)	Loss 3.9864 (3.7519)	Entropy 1.52393 (1.53509)	Top-1 acc 29.297 (35.850)	Top-5 acc 57.031 (59.947)	lr 0.02462
Train [10][1280/3239]	Time 0.608 (0.868)	Data Time 0.001 (0.017)	Loss 3.6735 (3.7513)	Entropy 1.52357 (1.53500)	Top-1 acc 34.375 (35.859)	Top-5 acc 61.328 (59.962)	lr 0.02462
Train [10][1290/3239]	Time 0.607 (0.868)	Data Time 0.002 (0.017)	Loss 3.7373 (3.7515)	Entropy 1.52302 (1.53491)	Top-1 acc 35.547 (35.857)	Top-5 acc 60.547 (59.957)	lr 0.02462
Train [10][1300/3239]	Time 0.271 (0.867)	Data Time 0.001 (0.016)	Loss 3.8616 (3.7514)	Entropy 1.52266 (1.53482)	Top-1 acc 32.812 (35.856)	Top-5 acc 57.031 (59.962)	lr 0.02462
Train [10][1310/3239]	Time 0.553 (0.867)	Data Time 0.002 (0.016)	Loss 3.6626 (3.7512)	Entropy 1.52256 (1.53473)	Top-1 acc 40.234 (35.861)	Top-5 acc 59.375 (59.952)	lr 0.02462
Train [10][1320/3239]	Time 0.556 (0.866)	Data Time 0.001 (0.016)	Loss 3.9482 (3.7518)	Entropy 1.52237 (1.53463)	Top-1 acc 31.250 (35.847)	Top-5 acc 55.859 (59.945)	lr 0.02462
Train [10][1330/3239]	Time 0.523 (0.866)	Data Time 0.001 (0.016)	Loss 3.7241 (3.7515)	Entropy 1.52263 (1.53454)	Top-1 acc 37.891 (35.855)	Top-5 acc 58.203 (59.946)	lr 0.02462
Train [10][1340/3239]	Time 0.593 (0.866)	Data Time 0.001 (0.016)	Loss 3.9360 (3.7515)	Entropy 1.52261 (1.53445)	Top-1 acc 34.375 (35.860)	Top-5 acc 55.859 (59.948)	lr 0.02462
Train [10][1350/3239]	Time 0.585 (0.865)	Data Time 0.001 (0.016)	Loss 3.7156 (3.7515)	Entropy 1.52239 (1.53437)	Top-1 acc 37.891 (35.864)	Top-5 acc 62.891 (59.947)	lr 0.02462
Train [10][1360/3239]	Time 0.657 (0.865)	Data Time 0.002 (0.016)	Loss 3.9129 (3.7516)	Entropy 1.52223 (1.53428)	Top-1 acc 29.297 (35.863)	Top-5 acc 58.594 (59.945)	lr 0.02462
Train [10][1370/3239]	Time 0.533 (0.865)	Data Time 0.001 (0.016)	Loss 3.5759 (3.7514)	Entropy 1.52204 (1.53419)	Top-1 acc 39.844 (35.868)	Top-5 acc 64.062 (59.947)	lr 0.02462
Train [10][1380/3239]	Time 0.586 (0.865)	Data Time 0.001 (0.016)	Loss 3.6627 (3.7512)	Entropy 1.52157 (1.53410)	Top-1 acc 34.766 (35.873)	Top-5 acc 59.375 (59.946)	lr 0.02462
Train [10][1390/3239]	Time 0.608 (0.864)	Data Time 0.001 (0.016)	Loss 3.8066 (3.7514)	Entropy 1.52145 (1.53401)	Top-1 acc 33.594 (35.867)	Top-5 acc 56.250 (59.934)	lr 0.02462
Train [10][1400/3239]	Time 0.620 (0.864)	Data Time 0.001 (0.016)	Loss 3.6530 (3.7517)	Entropy 1.52151 (1.53392)	Top-1 acc 40.234 (35.863)	Top-5 acc 63.672 (59.931)	lr 0.02462
Train [10][1410/3239]	Time 0.598 (0.864)	Data Time 0.001 (0.015)	Loss 3.8218 (3.7520)	Entropy 1.52142 (1.53383)	Top-1 acc 32.422 (35.854)	Top-5 acc 54.688 (59.917)	lr 0.02462
Train [10][1420/3239]	Time 0.531 (0.864)	Data Time 0.002 (0.015)	Loss 3.5715 (3.7516)	Entropy 1.52127 (1.53374)	Top-1 acc 39.453 (35.850)	Top-5 acc 65.234 (59.930)	lr 0.02462
Train [10][1430/3239]	Time 0.729 (0.864)	Data Time 0.001 (0.015)	Loss 3.6225 (3.7518)	Entropy 1.52134 (1.53366)	Top-1 acc 42.188 (35.847)	Top-5 acc 62.109 (59.937)	lr 0.02462
Train [10][1440/3239]	Time 0.536 (0.863)	Data Time 0.001 (0.015)	Loss 3.8405 (3.7521)	Entropy 1.52121 (1.53357)	Top-1 acc 35.156 (35.843)	Top-5 acc 57.812 (59.925)	lr 0.02462
Train [10][1450/3239]	Time 0.579 (0.863)	Data Time 0.001 (0.015)	Loss 3.8306 (3.7522)	Entropy 1.52092 (1.53349)	Top-1 acc 33.594 (35.844)	Top-5 acc 57.031 (59.922)	lr 0.02462
Train [10][1460/3239]	Time 0.428 (0.863)	Data Time 0.001 (0.015)	Loss 3.8546 (3.7523)	Entropy 1.52096 (1.53340)	Top-1 acc 31.250 (35.842)	Top-5 acc 57.812 (59.915)	lr 0.02462
Train [10][1470/3239]	Time 0.551 (0.862)	Data Time 0.001 (0.015)	Loss 3.9381 (3.7523)	Entropy 1.52095 (1.53332)	Top-1 acc 33.203 (35.837)	Top-5 acc 55.469 (59.909)	lr 0.02462
Train [10][1480/3239]	Time 0.581 (0.862)	Data Time 0.002 (0.015)	Loss 3.7861 (3.7525)	Entropy 1.52061 (1.53323)	Top-1 acc 31.641 (35.836)	Top-5 acc 60.156 (59.906)	lr 0.02462
Train [10][1490/3239]	Time 0.653 (0.862)	Data Time 0.001 (0.015)	Loss 3.7684 (3.7525)	Entropy 1.52053 (1.53315)	Top-1 acc 33.594 (35.825)	Top-5 acc 57.812 (59.904)	lr 0.02462
Train [10][1500/3239]	Time 0.644 (0.861)	Data Time 0.002 (0.015)	Loss 3.9983 (3.7526)	Entropy 1.52047 (1.53306)	Top-1 acc 30.078 (35.827)	Top-5 acc 56.641 (59.907)	lr 0.02462
Train [10][1510/3239]	Time 0.611 (0.861)	Data Time 0.001 (0.015)	Loss 3.7537 (3.7527)	Entropy 1.52028 (1.53298)	Top-1 acc 37.891 (35.834)	Top-5 acc 61.328 (59.904)	lr 0.02462
Train [10][1520/3239]	Time 0.618 (0.861)	Data Time 0.001 (0.014)	Loss 3.7115 (3.7524)	Entropy 1.52018 (1.53289)	Top-1 acc 34.766 (35.832)	Top-5 acc 60.938 (59.907)	lr 0.02462
Train [10][1530/3239]	Time 0.551 (0.861)	Data Time 0.001 (0.014)	Loss 3.7905 (3.7523)	Entropy 1.51989 (1.53281)	Top-1 acc 35.547 (35.832)	Top-5 acc 55.469 (59.907)	lr 0.02462
Train [10][1540/3239]	Time 0.566 (0.860)	Data Time 0.001 (0.014)	Loss 3.5361 (3.7521)	Entropy 1.51944 (1.53273)	Top-1 acc 40.234 (35.838)	Top-5 acc 66.406 (59.910)	lr 0.02462
Train [10][1550/3239]	Time 0.587 (0.860)	Data Time 0.001 (0.014)	Loss 3.6571 (3.7519)	Entropy 1.51924 (1.53264)	Top-1 acc 39.062 (35.840)	Top-5 acc 60.547 (59.914)	lr 0.02462
Train [10][1560/3239]	Time 0.607 (0.860)	Data Time 0.001 (0.014)	Loss 3.6453 (3.7516)	Entropy 1.51905 (1.53256)	Top-1 acc 40.234 (35.847)	Top-5 acc 62.109 (59.924)	lr 0.02462
Train [10][1570/3239]	Time 0.712 (0.860)	Data Time 0.001 (0.014)	Loss 3.6633 (3.7515)	Entropy 1.51878 (1.53247)	Top-1 acc 36.719 (35.847)	Top-5 acc 61.719 (59.926)	lr 0.02462
Train [10][1580/3239]	Time 0.588 (0.860)	Data Time 0.001 (0.014)	Loss 3.7447 (3.7516)	Entropy 1.51872 (1.53238)	Top-1 acc 36.719 (35.840)	Top-5 acc 58.203 (59.925)	lr 0.02462
Train [10][1590/3239]	Time 0.645 (0.859)	Data Time 0.001 (0.014)	Loss 3.6621 (3.7519)	Entropy 1.51875 (1.53230)	Top-1 acc 39.453 (35.839)	Top-5 acc 64.062 (59.919)	lr 0.02462
Train [10][1600/3239]	Time 0.488 (0.871)	Data Time 0.002 (0.014)	Loss 3.6885 (3.7519)	Entropy 1.51857 (1.53221)	Top-1 acc 37.891 (35.840)	Top-5 acc 65.234 (59.919)	lr 0.02462
Train [10][1610/3239]	Time 0.455 (0.870)	Data Time 0.002 (0.014)	Loss 3.5518 (3.7521)	Entropy 1.51850 (1.53213)	Top-1 acc 41.016 (35.833)	Top-5 acc 64.453 (59.917)	lr 0.02462
Train [10][1620/3239]	Time 0.573 (0.870)	Data Time 0.001 (0.014)	Loss 3.8070 (3.7521)	Entropy 1.51849 (1.53204)	Top-1 acc 39.062 (35.836)	Top-5 acc 55.469 (59.916)	lr 0.02462
Train [10][1630/3239]	Time 0.561 (0.870)	Data Time 0.001 (0.014)	Loss 3.8620 (3.7523)	Entropy 1.51815 (1.53196)	Top-1 acc 34.766 (35.835)	Top-5 acc 58.203 (59.913)	lr 0.02462
Train [10][1640/3239]	Time 0.656 (0.870)	Data Time 0.001 (0.014)	Loss 3.5431 (3.7524)	Entropy 1.51840 (1.53188)	Top-1 acc 39.453 (35.830)	Top-5 acc 65.625 (59.911)	lr 0.02461
Train [10][1650/3239]	Time 0.545 (0.869)	Data Time 0.001 (0.014)	Loss 3.7662 (3.7525)	Entropy 1.51809 (1.53179)	Top-1 acc 36.328 (35.837)	Top-5 acc 58.594 (59.910)	lr 0.02461
Train [10][1660/3239]	Time 0.577 (0.869)	Data Time 0.001 (0.013)	Loss 3.8065 (3.7523)	Entropy 1.51807 (1.53171)	Top-1 acc 38.672 (35.838)	Top-5 acc 61.328 (59.917)	lr 0.02461
Train [10][1670/3239]	Time 0.580 (0.869)	Data Time 0.001 (0.013)	Loss 3.7202 (3.7518)	Entropy 1.51808 (1.53163)	Top-1 acc 33.203 (35.843)	Top-5 acc 61.328 (59.928)	lr 0.02461
Train [10][1680/3239]	Time 0.526 (0.869)	Data Time 0.001 (0.013)	Loss 3.7118 (3.7515)	Entropy 1.51800 (1.53155)	Top-1 acc 37.500 (35.853)	Top-5 acc 55.078 (59.938)	lr 0.02461
Train [10][1690/3239]	Time 0.588 (0.868)	Data Time 0.001 (0.013)	Loss 3.6971 (3.7515)	Entropy 1.51770 (1.53147)	Top-1 acc 37.891 (35.851)	Top-5 acc 62.109 (59.944)	lr 0.02461
Train [10][1700/3239]	Time 0.535 (0.868)	Data Time 0.001 (0.013)	Loss 3.6695 (3.7515)	Entropy 1.51754 (1.53139)	Top-1 acc 38.281 (35.852)	Top-5 acc 61.719 (59.944)	lr 0.02461
Train [10][1710/3239]	Time 0.725 (0.868)	Data Time 0.001 (0.013)	Loss 3.7089 (3.7514)	Entropy 1.51753 (1.53130)	Top-1 acc 37.109 (35.858)	Top-5 acc 60.938 (59.947)	lr 0.02461
Train [10][1720/3239]	Time 0.563 (0.867)	Data Time 0.002 (0.013)	Loss 3.7475 (3.7512)	Entropy 1.51745 (1.53122)	Top-1 acc 35.938 (35.860)	Top-5 acc 60.547 (59.956)	lr 0.02461
Train [10][1730/3239]	Time 0.640 (0.867)	Data Time 0.001 (0.013)	Loss 3.7636 (3.7513)	Entropy 1.51733 (1.53114)	Top-1 acc 34.766 (35.852)	Top-5 acc 60.547 (59.953)	lr 0.02461
Train [10][1740/3239]	Time 0.525 (0.867)	Data Time 0.001 (0.013)	Loss 3.6679 (3.7518)	Entropy 1.51729 (1.53107)	Top-1 acc 39.062 (35.842)	Top-5 acc 64.062 (59.948)	lr 0.02461
Train [10][1750/3239]	Time 0.593 (0.867)	Data Time 0.001 (0.013)	Loss 3.4922 (3.7518)	Entropy 1.51747 (1.53099)	Top-1 acc 41.797 (35.845)	Top-5 acc 62.109 (59.944)	lr 0.02461
Train [10][1760/3239]	Time 0.536 (0.866)	Data Time 0.001 (0.013)	Loss 3.6641 (3.7517)	Entropy 1.51713 (1.53091)	Top-1 acc 32.812 (35.847)	Top-5 acc 61.328 (59.948)	lr 0.02461
Train [10][1770/3239]	Time 0.576 (0.866)	Data Time 0.001 (0.013)	Loss 3.9635 (3.7516)	Entropy 1.51681 (1.53083)	Top-1 acc 32.422 (35.853)	Top-5 acc 57.031 (59.943)	lr 0.02461
Train [10][1780/3239]	Time 0.710 (0.866)	Data Time 0.001 (0.013)	Loss 3.6332 (3.7516)	Entropy 1.51639 (1.53075)	Top-1 acc 37.500 (35.854)	Top-5 acc 58.984 (59.940)	lr 0.02461
Train [10][1790/3239]	Time 0.521 (0.865)	Data Time 0.001 (0.013)	Loss 3.8452 (3.7519)	Entropy 1.51610 (1.53067)	Top-1 acc 32.812 (35.846)	Top-5 acc 59.766 (59.936)	lr 0.02461
Train [10][1800/3239]	Time 0.567 (0.865)	Data Time 0.002 (0.013)	Loss 3.7155 (3.7519)	Entropy 1.51592 (1.53059)	Top-1 acc 37.500 (35.854)	Top-5 acc 60.938 (59.936)	lr 0.02461
Train [10][1810/3239]	Time 0.600 (0.865)	Data Time 0.002 (0.013)	Loss 3.9262 (3.7521)	Entropy 1.51578 (1.53051)	Top-1 acc 32.812 (35.855)	Top-5 acc 57.031 (59.932)	lr 0.02461
Train [10][1820/3239]	Time 0.624 (0.865)	Data Time 0.002 (0.012)	Loss 3.6984 (3.7526)	Entropy 1.51548 (1.53043)	Top-1 acc 36.328 (35.848)	Top-5 acc 59.375 (59.917)	lr 0.02461
Train [10][1830/3239]	Time 0.595 (0.864)	Data Time 0.001 (0.012)	Loss 3.6738 (3.7527)	Entropy 1.51546 (1.53034)	Top-1 acc 41.016 (35.844)	Top-5 acc 58.594 (59.910)	lr 0.02461
Train [10][1840/3239]	Time 0.565 (0.864)	Data Time 0.001 (0.012)	Loss 4.0178 (3.7530)	Entropy 1.51506 (1.53026)	Top-1 acc 30.859 (35.839)	Top-5 acc 54.688 (59.904)	lr 0.02461
Train [10][1850/3239]	Time 0.574 (0.864)	Data Time 0.001 (0.012)	Loss 3.8024 (3.7530)	Entropy 1.51469 (1.53018)	Top-1 acc 35.547 (35.836)	Top-5 acc 55.859 (59.905)	lr 0.02461
Train [10][1860/3239]	Time 0.549 (0.864)	Data Time 0.001 (0.012)	Loss 3.9282 (3.7530)	Entropy 1.51472 (1.53010)	Top-1 acc 29.688 (35.837)	Top-5 acc 53.516 (59.906)	lr 0.02461
Train [10][1870/3239]	Time 0.558 (0.863)	Data Time 0.001 (0.012)	Loss 3.6628 (3.7533)	Entropy 1.51429 (1.53001)	Top-1 acc 39.453 (35.834)	Top-5 acc 62.891 (59.897)	lr 0.02461
Train [10][1880/3239]	Time 0.578 (0.863)	Data Time 0.002 (0.012)	Loss 3.7924 (3.7532)	Entropy 1.51416 (1.52993)	Top-1 acc 34.766 (35.837)	Top-5 acc 58.594 (59.901)	lr 0.02461
Train [10][1890/3239]	Time 0.518 (0.863)	Data Time 0.001 (0.012)	Loss 3.7273 (3.7534)	Entropy 1.51398 (1.52985)	Top-1 acc 32.812 (35.839)	Top-5 acc 59.375 (59.896)	lr 0.02461
Train [10][1900/3239]	Time 0.570 (0.863)	Data Time 0.001 (0.012)	Loss 3.6463 (3.7534)	Entropy 1.51333 (1.52976)	Top-1 acc 40.234 (35.843)	Top-5 acc 61.719 (59.894)	lr 0.02461
Train [10][1910/3239]	Time 0.610 (0.863)	Data Time 0.001 (0.012)	Loss 3.6367 (3.7535)	Entropy 1.51285 (1.52967)	Top-1 acc 41.016 (35.840)	Top-5 acc 63.281 (59.889)	lr 0.02461
Train [10][1920/3239]	Time 0.641 (0.862)	Data Time 0.001 (0.012)	Loss 3.7136 (3.7535)	Entropy 1.51299 (1.52959)	Top-1 acc 40.625 (35.848)	Top-5 acc 58.203 (59.891)	lr 0.02461
Train [10][1930/3239]	Time 0.604 (0.862)	Data Time 0.002 (0.012)	Loss 3.5703 (3.7534)	Entropy 1.51249 (1.52950)	Top-1 acc 39.844 (35.845)	Top-5 acc 66.406 (59.900)	lr 0.02461
Train [10][1940/3239]	Time 0.634 (0.862)	Data Time 0.001 (0.012)	Loss 3.6214 (3.7531)	Entropy 1.51222 (1.52941)	Top-1 acc 37.500 (35.851)	Top-5 acc 62.500 (59.904)	lr 0.02461
Train [10][1950/3239]	Time 0.587 (0.862)	Data Time 0.001 (0.012)	Loss 3.7886 (3.7531)	Entropy 1.51209 (1.52932)	Top-1 acc 34.375 (35.851)	Top-5 acc 56.250 (59.907)	lr 0.02461
Train [10][1960/3239]	Time 0.310 (0.861)	Data Time 0.001 (0.012)	Loss 3.9059 (3.7528)	Entropy 1.51188 (1.52924)	Top-1 acc 35.547 (35.860)	Top-5 acc 55.469 (59.915)	lr 0.02461
Train [10][1970/3239]	Time 0.569 (0.861)	Data Time 0.001 (0.012)	Loss 3.6900 (3.7529)	Entropy 1.51163 (1.52915)	Top-1 acc 37.500 (35.863)	Top-5 acc 62.891 (59.916)	lr 0.02461
Train [10][1980/3239]	Time 0.581 (0.861)	Data Time 0.001 (0.012)	Loss 4.0084 (3.7530)	Entropy 1.51156 (1.52906)	Top-1 acc 29.297 (35.862)	Top-5 acc 53.906 (59.914)	lr 0.02461
Train [10][1990/3239]	Time 0.625 (0.861)	Data Time 0.001 (0.012)	Loss 3.7107 (3.7530)	Entropy 1.51100 (1.52897)	Top-1 acc 39.453 (35.865)	Top-5 acc 62.109 (59.915)	lr 0.02461
Train [10][2000/3239]	Time 0.558 (0.861)	Data Time 0.001 (0.012)	Loss 3.8121 (3.7530)	Entropy 1.51083 (1.52888)	Top-1 acc 35.938 (35.866)	Top-5 acc 57.812 (59.919)	lr 0.02461
Train [10][2010/3239]	Time 0.627 (0.860)	Data Time 0.001 (0.012)	Loss 3.8266 (3.7530)	Entropy 1.51043 (1.52879)	Top-1 acc 37.891 (35.863)	Top-5 acc 58.594 (59.919)	lr 0.02461
Train [10][2020/3239]	Time 0.603 (0.860)	Data Time 0.001 (0.012)	Loss 3.9394 (3.7532)	Entropy 1.50987 (1.52870)	Top-1 acc 31.250 (35.858)	Top-5 acc 56.641 (59.918)	lr 0.02461
Train [10][2030/3239]	Time 0.544 (0.860)	Data Time 0.001 (0.011)	Loss 3.7976 (3.7533)	Entropy 1.50975 (1.52860)	Top-1 acc 34.375 (35.857)	Top-5 acc 59.766 (59.917)	lr 0.02461
Train [10][2040/3239]	Time 0.572 (0.860)	Data Time 0.001 (0.011)	Loss 3.7213 (3.7532)	Entropy 1.50970 (1.52851)	Top-1 acc 36.328 (35.855)	Top-5 acc 61.719 (59.922)	lr 0.02460
Train [10][2050/3239]	Time 0.581 (0.860)	Data Time 0.001 (0.011)	Loss 3.6528 (3.7533)	Entropy 1.50985 (1.52842)	Top-1 acc 37.891 (35.852)	Top-5 acc 61.328 (59.919)	lr 0.02460
Train [10][2060/3239]	Time 0.638 (0.860)	Data Time 0.001 (0.011)	Loss 3.6796 (3.7535)	Entropy 1.50960 (1.52833)	Top-1 acc 33.594 (35.846)	Top-5 acc 62.500 (59.918)	lr 0.02460
Train [10][2070/3239]	Time 0.609 (0.859)	Data Time 0.001 (0.011)	Loss 3.8540 (3.7536)	Entropy 1.50933 (1.52824)	Top-1 acc 32.812 (35.846)	Top-5 acc 55.078 (59.913)	lr 0.02460
Train [10][2080/3239]	Time 0.583 (0.859)	Data Time 0.001 (0.011)	Loss 3.3555 (3.7533)	Entropy 1.50916 (1.52815)	Top-1 acc 43.750 (35.853)	Top-5 acc 70.703 (59.922)	lr 0.02460
Train [10][2090/3239]	Time 0.600 (0.859)	Data Time 0.001 (0.011)	Loss 3.8617 (3.7531)	Entropy 1.50897 (1.52806)	Top-1 acc 35.938 (35.856)	Top-5 acc 58.594 (59.929)	lr 0.02460
Train [10][2100/3239]	Time 0.563 (0.859)	Data Time 0.002 (0.011)	Loss 3.9199 (3.7531)	Entropy 1.50882 (1.52797)	Top-1 acc 35.156 (35.859)	Top-5 acc 56.250 (59.933)	lr 0.02460
Train [10][2110/3239]	Time 0.572 (0.859)	Data Time 0.001 (0.011)	Loss 3.6539 (3.7531)	Entropy 1.50850 (1.52788)	Top-1 acc 32.422 (35.853)	Top-5 acc 60.547 (59.932)	lr 0.02460
Train [10][2120/3239]	Time 0.495 (0.858)	Data Time 0.001 (0.011)	Loss 3.7907 (3.7530)	Entropy 1.50815 (1.52778)	Top-1 acc 35.156 (35.848)	Top-5 acc 57.812 (59.928)	lr 0.02460
Train [10][2130/3239]	Time 0.621 (0.858)	Data Time 0.001 (0.011)	Loss 3.7028 (3.7533)	Entropy 1.50803 (1.52769)	Top-1 acc 37.109 (35.846)	Top-5 acc 59.766 (59.922)	lr 0.02460
Train [10][2140/3239]	Time 0.481 (0.858)	Data Time 0.001 (0.011)	Loss 3.7957 (3.7532)	Entropy 1.50792 (1.52760)	Top-1 acc 35.938 (35.852)	Top-5 acc 59.766 (59.923)	lr 0.02460
Train [10][2150/3239]	Time 0.522 (0.858)	Data Time 0.001 (0.011)	Loss 3.9559 (3.7532)	Entropy 1.50764 (1.52751)	Top-1 acc 35.156 (35.854)	Top-5 acc 54.688 (59.920)	lr 0.02460
Train [10][2160/3239]	Time 0.529 (0.858)	Data Time 0.001 (0.011)	Loss 3.9596 (3.7534)	Entropy 1.50725 (1.52741)	Top-1 acc 32.031 (35.853)	Top-5 acc 53.516 (59.911)	lr 0.02460
Train [10][2170/3239]	Time 0.615 (0.857)	Data Time 0.002 (0.011)	Loss 3.8084 (3.7535)	Entropy 1.50679 (1.52732)	Top-1 acc 35.938 (35.853)	Top-5 acc 57.812 (59.911)	lr 0.02460
Train [10][2180/3239]	Time 0.554 (0.857)	Data Time 0.001 (0.011)	Loss 3.6232 (3.7531)	Entropy 1.50648 (1.52723)	Top-1 acc 38.672 (35.861)	Top-5 acc 65.234 (59.917)	lr 0.02460
Train [10][2190/3239]	Time 0.520 (0.857)	Data Time 0.001 (0.011)	Loss 3.7735 (3.7531)	Entropy 1.50640 (1.52713)	Top-1 acc 33.594 (35.859)	Top-5 acc 57.031 (59.919)	lr 0.02460
Train [10][2200/3239]	Time 0.584 (0.857)	Data Time 0.001 (0.011)	Loss 3.8298 (3.7532)	Entropy 1.50615 (1.52704)	Top-1 acc 35.547 (35.857)	Top-5 acc 58.203 (59.921)	lr 0.02460
Train [10][2210/3239]	Time 0.581 (0.857)	Data Time 0.003 (0.011)	Loss 3.7070 (3.7530)	Entropy 1.50607 (1.52694)	Top-1 acc 39.844 (35.866)	Top-5 acc 62.500 (59.930)	lr 0.02460
Train [10][2220/3239]	Time 0.598 (0.857)	Data Time 0.001 (0.011)	Loss 3.6739 (3.7527)	Entropy 1.50575 (1.52685)	Top-1 acc 38.281 (35.866)	Top-5 acc 61.719 (59.937)	lr 0.02460
Train [10][2230/3239]	Time 0.608 (0.856)	Data Time 0.001 (0.011)	Loss 3.6318 (3.7527)	Entropy 1.50577 (1.52675)	Top-1 acc 34.375 (35.864)	Top-5 acc 60.938 (59.933)	lr 0.02460
Train [10][2240/3239]	Time 0.622 (0.856)	Data Time 0.001 (0.011)	Loss 3.6619 (3.7527)	Entropy 1.50545 (1.52666)	Top-1 acc 42.188 (35.861)	Top-5 acc 62.500 (59.932)	lr 0.02460
Train [10][2250/3239]	Time 0.759 (0.865)	Data Time 0.005 (0.011)	Loss 3.6683 (3.7527)	Entropy 1.50558 (1.52656)	Top-1 acc 39.453 (35.863)	Top-5 acc 64.453 (59.935)	lr 0.02460
Train [10][2260/3239]	Time 0.530 (0.865)	Data Time 0.003 (0.011)	Loss 3.5952 (3.7527)	Entropy 1.50532 (1.52647)	Top-1 acc 41.406 (35.861)	Top-5 acc 65.625 (59.935)	lr 0.02460
Train [10][2270/3239]	Time 0.521 (0.864)	Data Time 0.001 (0.010)	Loss 3.8119 (3.7528)	Entropy 1.50474 (1.52638)	Top-1 acc 35.547 (35.863)	Top-5 acc 58.594 (59.931)	lr 0.02460
Train [10][2280/3239]	Time 0.576 (0.864)	Data Time 0.001 (0.010)	Loss 3.8259 (3.7528)	Entropy 1.50421 (1.52628)	Top-1 acc 33.984 (35.855)	Top-5 acc 57.422 (59.930)	lr 0.02460
Train [10][2290/3239]	Time 0.628 (0.864)	Data Time 0.028 (0.010)	Loss 3.7177 (3.7529)	Entropy 1.50424 (1.52618)	Top-1 acc 39.062 (35.851)	Top-5 acc 60.938 (59.932)	lr 0.02460
Train [10][2300/3239]	Time 0.610 (0.864)	Data Time 0.001 (0.010)	Loss 3.6277 (3.7529)	Entropy 1.50395 (1.52609)	Top-1 acc 37.891 (35.853)	Top-5 acc 63.672 (59.931)	lr 0.02460
Train [10][2310/3239]	Time 0.597 (0.864)	Data Time 0.001 (0.010)	Loss 3.5795 (3.7526)	Entropy 1.50376 (1.52599)	Top-1 acc 39.062 (35.860)	Top-5 acc 63.672 (59.936)	lr 0.02460
Train [10][2320/3239]	Time 0.523 (0.864)	Data Time 0.001 (0.010)	Loss 3.6495 (3.7523)	Entropy 1.50349 (1.52590)	Top-1 acc 39.062 (35.867)	Top-5 acc 61.719 (59.944)	lr 0.02460
Train [10][2330/3239]	Time 0.557 (0.863)	Data Time 0.001 (0.010)	Loss 3.8061 (3.7526)	Entropy 1.50278 (1.52580)	Top-1 acc 33.984 (35.859)	Top-5 acc 59.766 (59.939)	lr 0.02460
Train [10][2340/3239]	Time 0.677 (0.863)	Data Time 0.001 (0.010)	Loss 3.8624 (3.7529)	Entropy 1.50263 (1.52570)	Top-1 acc 34.375 (35.852)	Top-5 acc 57.422 (59.930)	lr 0.02460
Train [10][2350/3239]	Time 0.562 (0.863)	Data Time 0.001 (0.010)	Loss 3.8426 (3.7528)	Entropy 1.50232 (1.52560)	Top-1 acc 35.938 (35.856)	Top-5 acc 54.688 (59.932)	lr 0.02460
Train [10][2360/3239]	Time 0.568 (0.863)	Data Time 0.001 (0.010)	Loss 4.0206 (3.7529)	Entropy 1.50214 (1.52550)	Top-1 acc 30.859 (35.857)	Top-5 acc 53.516 (59.927)	lr 0.02460
Train [10][2370/3239]	Time 0.600 (0.863)	Data Time 0.001 (0.010)	Loss 3.6405 (3.7531)	Entropy 1.50200 (1.52541)	Top-1 acc 36.719 (35.850)	Top-5 acc 58.984 (59.919)	lr 0.02460
Train [10][2380/3239]	Time 0.557 (0.862)	Data Time 0.001 (0.010)	Loss 3.6701 (3.7532)	Entropy 1.50168 (1.52531)	Top-1 acc 39.844 (35.845)	Top-5 acc 60.938 (59.913)	lr 0.02460
Train [10][2390/3239]	Time 0.573 (0.862)	Data Time 0.001 (0.010)	Loss 3.7414 (3.7531)	Entropy 1.50143 (1.52521)	Top-1 acc 35.938 (35.845)	Top-5 acc 60.547 (59.917)	lr 0.02460
Train [10][2400/3239]	Time 0.570 (0.862)	Data Time 0.001 (0.010)	Loss 3.7810 (3.7533)	Entropy 1.50124 (1.52511)	Top-1 acc 36.328 (35.842)	Top-5 acc 61.328 (59.912)	lr 0.02460
Train [10][2410/3239]	Time 0.710 (0.862)	Data Time 0.001 (0.010)	Loss 3.6601 (3.7532)	Entropy 1.50082 (1.52501)	Top-1 acc 38.281 (35.841)	Top-5 acc 62.891 (59.910)	lr 0.02460
Train [10][2420/3239]	Time 0.524 (0.862)	Data Time 0.001 (0.010)	Loss 3.7045 (3.7532)	Entropy 1.50067 (1.52491)	Top-1 acc 38.672 (35.842)	Top-5 acc 61.328 (59.911)	lr 0.02460
Train [10][2430/3239]	Time 0.574 (0.862)	Data Time 0.001 (0.010)	Loss 3.6156 (3.7532)	Entropy 1.50049 (1.52481)	Top-1 acc 38.672 (35.844)	Top-5 acc 60.547 (59.909)	lr 0.02459
Train [10][2440/3239]	Time 0.583 (0.861)	Data Time 0.001 (0.010)	Loss 3.7092 (3.7533)	Entropy 1.50023 (1.52471)	Top-1 acc 38.672 (35.838)	Top-5 acc 58.203 (59.905)	lr 0.02459
Train [10][2450/3239]	Time 0.617 (0.861)	Data Time 0.001 (0.010)	Loss 3.6854 (3.7533)	Entropy 1.50010 (1.52461)	Top-1 acc 36.328 (35.839)	Top-5 acc 60.547 (59.909)	lr 0.02459
Train [10][2460/3239]	Time 0.589 (0.861)	Data Time 0.001 (0.010)	Loss 3.6441 (3.7532)	Entropy 1.50005 (1.52451)	Top-1 acc 37.109 (35.838)	Top-5 acc 63.672 (59.912)	lr 0.02459
Train [10][2470/3239]	Time 0.549 (0.861)	Data Time 0.001 (0.010)	Loss 3.6380 (3.7531)	Entropy 1.49988 (1.52441)	Top-1 acc 37.891 (35.843)	Top-5 acc 61.328 (59.916)	lr 0.02459
Train [10][2480/3239]	Time 0.664 (0.861)	Data Time 0.002 (0.010)	Loss 3.8424 (3.7531)	Entropy 1.49974 (1.52431)	Top-1 acc 32.812 (35.842)	Top-5 acc 58.984 (59.916)	lr 0.02459
Train [10][2490/3239]	Time 0.610 (0.861)	Data Time 0.001 (0.010)	Loss 3.6847 (3.7530)	Entropy 1.49961 (1.52421)	Top-1 acc 37.500 (35.844)	Top-5 acc 61.328 (59.917)	lr 0.02459
Train [10][2500/3239]	Time 0.483 (0.860)	Data Time 0.001 (0.010)	Loss 4.0808 (3.7529)	Entropy 1.49916 (1.52411)	Top-1 acc 28.906 (35.843)	Top-5 acc 54.297 (59.920)	lr 0.02459
Train [10][2510/3239]	Time 0.564 (0.860)	Data Time 0.001 (0.010)	Loss 3.5780 (3.7527)	Entropy 1.49928 (1.52401)	Top-1 acc 41.797 (35.843)	Top-5 acc 66.406 (59.928)	lr 0.02459
Train [10][2520/3239]	Time 0.588 (0.860)	Data Time 0.001 (0.010)	Loss 4.0888 (3.7531)	Entropy 1.49915 (1.52391)	Top-1 acc 32.422 (35.838)	Top-5 acc 51.953 (59.918)	lr 0.02459
Train [10][2530/3239]	Time 0.611 (0.860)	Data Time 0.001 (0.010)	Loss 3.7263 (3.7532)	Entropy 1.49920 (1.52382)	Top-1 acc 35.156 (35.837)	Top-5 acc 61.719 (59.917)	lr 0.02459
Train [10][2540/3239]	Time 0.550 (0.860)	Data Time 0.001 (0.010)	Loss 3.7569 (3.7533)	Entropy 1.49901 (1.52372)	Top-1 acc 34.766 (35.834)	Top-5 acc 61.719 (59.916)	lr 0.02459
Train [10][2550/3239]	Time 0.677 (0.860)	Data Time 0.001 (0.010)	Loss 3.7191 (3.7533)	Entropy 1.49841 (1.52362)	Top-1 acc 36.328 (35.833)	Top-5 acc 59.375 (59.912)	lr 0.02459
Train [10][2560/3239]	Time 0.533 (0.860)	Data Time 0.001 (0.010)	Loss 3.9321 (3.7535)	Entropy 1.49805 (1.52352)	Top-1 acc 31.641 (35.833)	Top-5 acc 55.859 (59.908)	lr 0.02459
Train [10][2570/3239]	Time 0.593 (0.860)	Data Time 0.001 (0.010)	Loss 3.8093 (3.7536)	Entropy 1.49804 (1.52342)	Top-1 acc 31.641 (35.827)	Top-5 acc 60.156 (59.904)	lr 0.02459
Train [10][2580/3239]	Time 0.576 (0.859)	Data Time 0.001 (0.010)	Loss 3.6725 (3.7536)	Entropy 1.49779 (1.52333)	Top-1 acc 38.672 (35.824)	Top-5 acc 60.156 (59.900)	lr 0.02459
Train [10][2590/3239]	Time 0.601 (0.859)	Data Time 0.001 (0.010)	Loss 3.4704 (3.7535)	Entropy 1.49739 (1.52323)	Top-1 acc 37.891 (35.824)	Top-5 acc 65.625 (59.901)	lr 0.02459
Train [10][2600/3239]	Time 0.587 (0.859)	Data Time 0.001 (0.009)	Loss 3.6979 (3.7531)	Entropy 1.49759 (1.52313)	Top-1 acc 37.891 (35.833)	Top-5 acc 59.766 (59.905)	lr 0.02459
Train [10][2610/3239]	Time 0.582 (0.859)	Data Time 0.001 (0.009)	Loss 3.8137 (3.7528)	Entropy 1.49731 (1.52303)	Top-1 acc 35.547 (35.841)	Top-5 acc 58.594 (59.913)	lr 0.02459
Train [10][2620/3239]	Time 0.674 (0.859)	Data Time 0.001 (0.009)	Loss 3.5474 (3.7525)	Entropy 1.49697 (1.52293)	Top-1 acc 41.016 (35.845)	Top-5 acc 62.891 (59.919)	lr 0.02459
Train [10][2630/3239]	Time 0.585 (0.859)	Data Time 0.001 (0.009)	Loss 3.7078 (3.7524)	Entropy 1.49673 (1.52283)	Top-1 acc 37.109 (35.847)	Top-5 acc 58.984 (59.920)	lr 0.02459
Train [10][2640/3239]	Time 0.571 (0.858)	Data Time 0.002 (0.009)	Loss 3.7862 (3.7522)	Entropy 1.49677 (1.52273)	Top-1 acc 33.203 (35.850)	Top-5 acc 62.891 (59.929)	lr 0.02459
Train [10][2650/3239]	Time 0.568 (0.858)	Data Time 0.001 (0.009)	Loss 3.8838 (3.7523)	Entropy 1.49676 (1.52264)	Top-1 acc 34.375 (35.849)	Top-5 acc 54.688 (59.927)	lr 0.02459
Train [10][2660/3239]	Time 0.569 (0.858)	Data Time 0.001 (0.009)	Loss 3.7500 (3.7521)	Entropy 1.49636 (1.52254)	Top-1 acc 33.984 (35.852)	Top-5 acc 60.547 (59.927)	lr 0.02459
Train [10][2670/3239]	Time 0.539 (0.858)	Data Time 0.001 (0.009)	Loss 3.3408 (3.7521)	Entropy 1.49627 (1.52244)	Top-1 acc 44.141 (35.853)	Top-5 acc 68.750 (59.926)	lr 0.02459
Train [10][2680/3239]	Time 0.557 (0.858)	Data Time 0.001 (0.009)	Loss 3.6351 (3.7520)	Entropy 1.49602 (1.52234)	Top-1 acc 39.844 (35.856)	Top-5 acc 60.938 (59.925)	lr 0.02459
Train [10][2690/3239]	Time 0.683 (0.858)	Data Time 0.001 (0.009)	Loss 3.6072 (3.7518)	Entropy 1.49605 (1.52224)	Top-1 acc 43.359 (35.860)	Top-5 acc 63.672 (59.927)	lr 0.02459
Train [10][2700/3239]	Time 0.639 (0.858)	Data Time 0.001 (0.009)	Loss 3.7810 (3.7519)	Entropy 1.49609 (1.52215)	Top-1 acc 35.547 (35.862)	Top-5 acc 60.547 (59.926)	lr 0.02459
Train [10][2710/3239]	Time 0.548 (0.858)	Data Time 0.001 (0.009)	Loss 3.9010 (3.7520)	Entropy 1.49547 (1.52205)	Top-1 acc 36.719 (35.859)	Top-5 acc 57.031 (59.925)	lr 0.02459
Train [10][2720/3239]	Time 0.593 (0.858)	Data Time 0.001 (0.009)	Loss 3.8139 (3.7520)	Entropy 1.49523 (1.52195)	Top-1 acc 33.594 (35.857)	Top-5 acc 58.594 (59.925)	lr 0.02459
Train [10][2730/3239]	Time 0.622 (0.858)	Data Time 0.001 (0.009)	Loss 3.6552 (3.7520)	Entropy 1.49539 (1.52185)	Top-1 acc 36.719 (35.858)	Top-5 acc 60.156 (59.924)	lr 0.02459
Train [10][2740/3239]	Time 0.609 (0.858)	Data Time 0.001 (0.009)	Loss 4.1036 (3.7521)	Entropy 1.49531 (1.52176)	Top-1 acc 30.859 (35.861)	Top-5 acc 49.609 (59.922)	lr 0.02459
Train [10][2750/3239]	Time 0.566 (0.857)	Data Time 0.001 (0.009)	Loss 3.8661 (3.7520)	Entropy 1.49538 (1.52166)	Top-1 acc 31.250 (35.861)	Top-5 acc 59.375 (59.925)	lr 0.02459
Train [10][2760/3239]	Time 0.695 (0.857)	Data Time 0.001 (0.009)	Loss 3.6247 (3.7519)	Entropy 1.49507 (1.52157)	Top-1 acc 41.797 (35.863)	Top-5 acc 59.766 (59.926)	lr 0.02459
Train [10][2770/3239]	Time 0.556 (0.857)	Data Time 0.001 (0.009)	Loss 3.7210 (3.7518)	Entropy 1.49458 (1.52147)	Top-1 acc 33.594 (35.865)	Top-5 acc 60.156 (59.929)	lr 0.02459
Train [10][2780/3239]	Time 0.556 (0.857)	Data Time 0.001 (0.009)	Loss 3.8056 (3.7516)	Entropy 1.49442 (1.52137)	Top-1 acc 36.719 (35.871)	Top-5 acc 58.594 (59.931)	lr 0.02459
Train [10][2790/3239]	Time 0.523 (0.857)	Data Time 0.001 (0.009)	Loss 3.6608 (3.7514)	Entropy 1.49442 (1.52128)	Top-1 acc 34.766 (35.876)	Top-5 acc 59.766 (59.935)	lr 0.02459
Train [10][2800/3239]	Time 0.517 (0.856)	Data Time 0.001 (0.009)	Loss 3.8016 (3.7513)	Entropy 1.49431 (1.52118)	Top-1 acc 35.156 (35.878)	Top-5 acc 57.422 (59.937)	lr 0.02459
Train [10][2810/3239]	Time 0.618 (0.856)	Data Time 0.001 (0.009)	Loss 3.5551 (3.7512)	Entropy 1.49400 (1.52108)	Top-1 acc 36.328 (35.880)	Top-5 acc 64.453 (59.938)	lr 0.02459
Train [10][2820/3239]	Time 0.593 (0.856)	Data Time 0.001 (0.009)	Loss 3.8524 (3.7513)	Entropy 1.49342 (1.52099)	Top-1 acc 35.547 (35.881)	Top-5 acc 60.156 (59.938)	lr 0.02458
Train [10][2830/3239]	Time 0.659 (0.856)	Data Time 0.002 (0.009)	Loss 3.8433 (3.7512)	Entropy 1.49260 (1.52089)	Top-1 acc 32.812 (35.879)	Top-5 acc 57.422 (59.942)	lr 0.02458
Train [10][2840/3239]	Time 0.583 (0.856)	Data Time 0.001 (0.009)	Loss 3.9027 (3.7513)	Entropy 1.49223 (1.52079)	Top-1 acc 28.906 (35.875)	Top-5 acc 58.203 (59.941)	lr 0.02458
Train [10][2850/3239]	Time 0.601 (0.856)	Data Time 0.002 (0.009)	Loss 3.7449 (3.7514)	Entropy 1.49227 (1.52069)	Top-1 acc 32.422 (35.874)	Top-5 acc 60.156 (59.941)	lr 0.02458
Train [10][2860/3239]	Time 0.538 (0.856)	Data Time 0.001 (0.009)	Loss 3.7979 (3.7514)	Entropy 1.49232 (1.52059)	Top-1 acc 34.375 (35.873)	Top-5 acc 58.203 (59.943)	lr 0.02458
Train [10][2870/3239]	Time 0.607 (0.856)	Data Time 0.002 (0.009)	Loss 3.7731 (3.7512)	Entropy 1.49204 (1.52049)	Top-1 acc 33.203 (35.877)	Top-5 acc 59.375 (59.949)	lr 0.02458
Train [10][2880/3239]	Time 0.590 (0.856)	Data Time 0.002 (0.009)	Loss 3.5866 (3.7512)	Entropy 1.49183 (1.52039)	Top-1 acc 39.062 (35.879)	Top-5 acc 61.719 (59.943)	lr 0.02458
Train [10][2890/3239]	Time 0.575 (0.856)	Data Time 0.001 (0.009)	Loss 3.8273 (3.7510)	Entropy 1.49173 (1.52029)	Top-1 acc 34.766 (35.882)	Top-5 acc 56.641 (59.947)	lr 0.02458
Train [10][2900/3239]	Time 0.582 (0.856)	Data Time 0.001 (0.009)	Loss 3.7364 (3.7511)	Entropy 1.49130 (1.52019)	Top-1 acc 36.328 (35.878)	Top-5 acc 62.891 (59.947)	lr 0.02458
Train [10][2910/3239]	Time 0.605 (0.862)	Data Time 0.002 (0.009)	Loss 3.8348 (3.7513)	Entropy 1.49119 (1.52009)	Top-1 acc 34.375 (35.871)	Top-5 acc 59.766 (59.946)	lr 0.02458
Train [10][2920/3239]	Time 0.629 (0.862)	Data Time 0.001 (0.009)	Loss 3.5850 (3.7512)	Entropy 1.49125 (1.52000)	Top-1 acc 37.109 (35.870)	Top-5 acc 60.938 (59.946)	lr 0.02458
Train [10][2930/3239]	Time 0.582 (0.862)	Data Time 0.001 (0.009)	Loss 4.0109 (3.7512)	Entropy 1.49094 (1.51990)	Top-1 acc 28.906 (35.867)	Top-5 acc 49.609 (59.944)	lr 0.02458
Train [10][2940/3239]	Time 0.552 (0.862)	Data Time 0.001 (0.009)	Loss 3.6983 (3.7511)	Entropy 1.49089 (1.51980)	Top-1 acc 38.281 (35.869)	Top-5 acc 61.719 (59.943)	lr 0.02458
Train [10][2950/3239]	Time 0.584 (0.862)	Data Time 0.001 (0.009)	Loss 3.7893 (3.7511)	Entropy 1.49078 (1.51970)	Top-1 acc 35.547 (35.874)	Top-5 acc 63.281 (59.942)	lr 0.02458
Train [10][2960/3239]	Time 0.584 (0.862)	Data Time 0.001 (0.009)	Loss 3.9499 (3.7513)	Entropy 1.49053 (1.51960)	Top-1 acc 32.422 (35.867)	Top-5 acc 55.859 (59.932)	lr 0.02458
Train [10][2970/3239]	Time 0.583 (0.862)	Data Time 0.001 (0.009)	Loss 3.6659 (3.7513)	Entropy 1.49031 (1.51950)	Top-1 acc 38.672 (35.870)	Top-5 acc 58.203 (59.930)	lr 0.02458
Train [10][2980/3239]	Time 0.538 (0.861)	Data Time 0.001 (0.009)	Loss 3.7308 (3.7511)	Entropy 1.49047 (1.51941)	Top-1 acc 32.031 (35.873)	Top-5 acc 62.891 (59.935)	lr 0.02458
Train [10][2990/3239]	Time 0.686 (0.861)	Data Time 0.001 (0.009)	Loss 3.6495 (3.7512)	Entropy 1.49040 (1.51931)	Top-1 acc 37.500 (35.871)	Top-5 acc 62.891 (59.932)	lr 0.02458
Train [10][3000/3239]	Time 0.546 (0.861)	Data Time 0.001 (0.009)	Loss 3.5498 (3.7510)	Entropy 1.49038 (1.51921)	Top-1 acc 39.062 (35.880)	Top-5 acc 66.797 (59.938)	lr 0.02458
Train [10][3010/3239]	Time 0.614 (0.861)	Data Time 0.001 (0.008)	Loss 4.0013 (3.7513)	Entropy 1.49016 (1.51912)	Top-1 acc 29.297 (35.874)	Top-5 acc 56.250 (59.932)	lr 0.02458
Train [10][3020/3239]	Time 0.535 (0.861)	Data Time 0.001 (0.008)	Loss 3.7361 (3.7515)	Entropy 1.49001 (1.51902)	Top-1 acc 35.547 (35.868)	Top-5 acc 62.500 (59.931)	lr 0.02458
Train [10][3030/3239]	Time 0.520 (0.861)	Data Time 0.001 (0.008)	Loss 3.7453 (3.7514)	Entropy 1.48965 (1.51893)	Top-1 acc 34.766 (35.870)	Top-5 acc 62.891 (59.932)	lr 0.02458
Train [10][3040/3239]	Time 0.597 (0.861)	Data Time 0.001 (0.008)	Loss 3.6390 (3.7515)	Entropy 1.48962 (1.51883)	Top-1 acc 36.328 (35.870)	Top-5 acc 62.891 (59.928)	lr 0.02458
Train [10][3050/3239]	Time 0.619 (0.861)	Data Time 0.001 (0.008)	Loss 3.6700 (3.7515)	Entropy 1.48944 (1.51873)	Top-1 acc 39.062 (35.866)	Top-5 acc 60.547 (59.926)	lr 0.02458
Train [10][3060/3239]	Time 0.664 (0.861)	Data Time 0.001 (0.008)	Loss 3.7801 (3.7515)	Entropy 1.48938 (1.51864)	Top-1 acc 35.547 (35.862)	Top-5 acc 55.469 (59.926)	lr 0.02458
Train [10][3070/3239]	Time 0.575 (0.861)	Data Time 0.002 (0.008)	Loss 3.6267 (3.7514)	Entropy 1.48917 (1.51854)	Top-1 acc 34.766 (35.864)	Top-5 acc 61.719 (59.927)	lr 0.02458
Train [10][3080/3239]	Time 0.603 (0.860)	Data Time 0.001 (0.008)	Loss 3.5349 (3.7513)	Entropy 1.48926 (1.51845)	Top-1 acc 41.016 (35.865)	Top-5 acc 66.797 (59.927)	lr 0.02458
Train [10][3090/3239]	Time 0.520 (0.860)	Data Time 0.001 (0.008)	Loss 3.5776 (3.7513)	Entropy 1.48875 (1.51835)	Top-1 acc 38.672 (35.866)	Top-5 acc 62.891 (59.928)	lr 0.02458
Train [10][3100/3239]	Time 0.460 (0.860)	Data Time 0.001 (0.008)	Loss 3.7241 (3.7512)	Entropy 1.48835 (1.51826)	Top-1 acc 35.547 (35.866)	Top-5 acc 62.109 (59.927)	lr 0.02458
Train [10][3110/3239]	Time 0.560 (0.860)	Data Time 0.001 (0.008)	Loss 3.8318 (3.7511)	Entropy 1.48809 (1.51816)	Top-1 acc 33.984 (35.869)	Top-5 acc 57.031 (59.927)	lr 0.02458
Train [10][3120/3239]	Time 0.577 (0.860)	Data Time 0.001 (0.008)	Loss 3.6689 (3.7511)	Entropy 1.48796 (1.51806)	Top-1 acc 37.891 (35.867)	Top-5 acc 60.938 (59.929)	lr 0.02458
Train [10][3130/3239]	Time 0.653 (0.860)	Data Time 0.001 (0.008)	Loss 3.6275 (3.7510)	Entropy 1.48753 (1.51797)	Top-1 acc 35.938 (35.870)	Top-5 acc 60.938 (59.934)	lr 0.02458
Train [10][3140/3239]	Time 0.544 (0.860)	Data Time 0.001 (0.008)	Loss 3.8134 (3.7508)	Entropy 1.48690 (1.51787)	Top-1 acc 35.156 (35.871)	Top-5 acc 55.469 (59.936)	lr 0.02458
Train [10][3150/3239]	Time 0.569 (0.860)	Data Time 0.001 (0.008)	Loss 3.8133 (3.7508)	Entropy 1.48649 (1.51777)	Top-1 acc 40.234 (35.877)	Top-5 acc 58.984 (59.936)	lr 0.02458
Train [10][3160/3239]	Time 0.583 (0.860)	Data Time 0.001 (0.008)	Loss 3.7395 (3.7506)	Entropy 1.48638 (1.51767)	Top-1 acc 37.891 (35.879)	Top-5 acc 58.984 (59.937)	lr 0.02458
Train [10][3170/3239]	Time 0.622 (0.860)	Data Time 0.001 (0.008)	Loss 3.6052 (3.7505)	Entropy 1.48627 (1.51757)	Top-1 acc 37.891 (35.883)	Top-5 acc 61.719 (59.941)	lr 0.02458
Train [10][3180/3239]	Time 0.601 (0.860)	Data Time 0.000 (0.008)	Loss 3.7256 (3.7504)	Entropy 1.48585 (1.51747)	Top-1 acc 35.938 (35.886)	Top-5 acc 57.812 (59.944)	lr 0.02458
Train [10][3190/3239]	Time 0.597 (0.859)	Data Time 0.000 (0.008)	Loss 3.6573 (3.7503)	Entropy 1.48587 (1.51737)	Top-1 acc 36.719 (35.888)	Top-5 acc 65.625 (59.947)	lr 0.02458
Train [10][3200/3239]	Time 0.667 (0.859)	Data Time 0.000 (0.008)	Loss 3.6680 (3.7501)	Entropy 1.48562 (1.51728)	Top-1 acc 37.500 (35.893)	Top-5 acc 59.375 (59.951)	lr 0.02458
Train [10][3210/3239]	Time 0.573 (0.859)	Data Time 0.000 (0.008)	Loss 3.5435 (3.7501)	Entropy 1.48527 (1.51718)	Top-1 acc 35.938 (35.892)	Top-5 acc 66.016 (59.952)	lr 0.02457
Train [10][3220/3239]	Time 0.596 (0.859)	Data Time 0.000 (0.008)	Loss 3.6574 (3.7500)	Entropy 1.48497 (1.51708)	Top-1 acc 37.891 (35.894)	Top-5 acc 62.109 (59.952)	lr 0.02457
Train [10][3230/3239]	Time 0.615 (0.859)	Data Time 0.000 (0.008)	Loss 3.8045 (3.7500)	Entropy 1.48487 (1.51698)	Top-1 acc 33.984 (35.894)	Top-5 acc 59.766 (59.955)	lr 0.02457
Train [10][3239/3239]	Time 1.562 (0.859)	Data Time 0.000 (0.008)	Loss 3.8250 (3.7499)	Entropy 1.48509 (1.51689)	Top-1 acc 33.333 (35.899)	Top-5 acc 58.025 (59.960)	lr 0.02457
==========Valid [10/120]	loss 2.537	top-1 acc 45.837 (45.837)	top-5 acc 70.047	Train top-1 35.899	top-5 59.960	Entropy 1.48509	Latency-None: 0.000ms	Flops: 542.77M
Train [11][0/3239]	Time 20.439 (20.439)	Data Time 18.479 (18.479)	Loss 3.9206 (3.9206)	Entropy 1.48481 (1.48481)	Top-1 acc 28.906 (28.906)	Top-5 acc 55.859 (55.859)	lr 0.02457
Train [11][10/3239]	Time 0.578 (2.689)	Data Time 0.002 (1.682)	Loss 3.8563 (3.6646)	Entropy 1.48445 (1.48466)	Top-1 acc 32.422 (38.175)	Top-5 acc 59.375 (62.074)	lr 0.02457
Train [11][20/3239]	Time 0.574 (1.797)	Data Time 0.001 (0.882)	Loss 3.6424 (3.6688)	Entropy 1.48460 (1.48462)	Top-1 acc 35.547 (37.649)	Top-5 acc 60.938 (61.830)	lr 0.02457
Train [11][30/3239]	Time 0.600 (1.481)	Data Time 0.001 (0.598)	Loss 3.8584 (3.6850)	Entropy 1.48444 (1.48460)	Top-1 acc 34.375 (37.286)	Top-5 acc 58.594 (61.542)	lr 0.02457
Train [11][40/3239]	Time 0.540 (1.323)	Data Time 0.003 (0.453)	Loss 3.7601 (3.7186)	Entropy 1.48469 (1.48458)	Top-1 acc 38.672 (36.795)	Top-5 acc 61.719 (60.699)	lr 0.02457
Train [11][50/3239]	Time 0.546 (1.220)	Data Time 0.001 (0.365)	Loss 3.7587 (3.7141)	Entropy 1.48453 (1.48459)	Top-1 acc 35.938 (36.910)	Top-5 acc 61.328 (60.715)	lr 0.02457
Train [11][60/3239]	Time 0.545 (1.155)	Data Time 0.001 (0.305)	Loss 3.8372 (3.7071)	Entropy 1.48453 (1.48458)	Top-1 acc 31.641 (36.930)	Top-5 acc 57.031 (60.918)	lr 0.02457
Train [11][70/3239]	Time 0.544 (1.110)	Data Time 0.001 (0.263)	Loss 3.6178 (3.7059)	Entropy 1.48444 (1.48456)	Top-1 acc 39.453 (36.752)	Top-5 acc 65.234 (60.998)	lr 0.02457
Train [11][80/3239]	Time 0.583 (1.075)	Data Time 0.001 (0.230)	Loss 3.6513 (3.7044)	Entropy 1.48425 (1.48454)	Top-1 acc 35.547 (36.651)	Top-5 acc 62.109 (61.058)	lr 0.02457
Train [11][90/3239]	Time 0.560 (1.049)	Data Time 0.001 (0.205)	Loss 3.8126 (3.7081)	Entropy 1.48377 (1.48449)	Top-1 acc 36.328 (36.775)	Top-5 acc 55.078 (61.002)	lr 0.02457
Train [11][100/3239]	Time 0.538 (1.027)	Data Time 0.001 (0.185)	Loss 3.9691 (3.7138)	Entropy 1.48376 (1.48442)	Top-1 acc 35.547 (36.703)	Top-5 acc 57.031 (60.837)	lr 0.02457
Train [11][110/3239]	Time 0.577 (1.009)	Data Time 0.001 (0.169)	Loss 3.6207 (3.7126)	Entropy 1.48381 (1.48436)	Top-1 acc 41.016 (36.860)	Top-5 acc 63.281 (60.916)	lr 0.02457
Train [11][120/3239]	Time 0.552 (0.991)	Data Time 0.001 (0.155)	Loss 3.7499 (3.7088)	Entropy 1.48380 (1.48431)	Top-1 acc 38.672 (36.993)	Top-5 acc 62.891 (60.999)	lr 0.02457
Train [11][130/3239]	Time 0.540 (0.979)	Data Time 0.001 (0.143)	Loss 3.6835 (3.7114)	Entropy 1.48368 (1.48427)	Top-1 acc 36.719 (36.942)	Top-5 acc 60.938 (60.938)	lr 0.02457
Train [11][140/3239]	Time 0.589 (0.969)	Data Time 0.001 (0.133)	Loss 3.5799 (3.7115)	Entropy 1.48359 (1.48422)	Top-1 acc 39.062 (36.810)	Top-5 acc 62.109 (60.879)	lr 0.02457
Train [11][150/3239]	Time 0.569 (0.961)	Data Time 0.001 (0.125)	Loss 3.8016 (3.7124)	Entropy 1.48359 (1.48418)	Top-1 acc 33.594 (36.721)	Top-5 acc 57.422 (60.891)	lr 0.02457
Train [11][160/3239]	Time 0.552 (0.952)	Data Time 0.001 (0.117)	Loss 3.6557 (3.7135)	Entropy 1.48327 (1.48414)	Top-1 acc 38.672 (36.726)	Top-5 acc 64.062 (60.843)	lr 0.02457
Train [11][170/3239]	Time 0.661 (0.946)	Data Time 0.001 (0.110)	Loss 3.5858 (3.7139)	Entropy 1.48333 (1.48409)	Top-1 acc 39.844 (36.744)	Top-5 acc 63.281 (60.821)	lr 0.02457
Train [11][180/3239]	Time 0.595 (0.941)	Data Time 0.001 (0.104)	Loss 3.8221 (3.7175)	Entropy 1.48283 (1.48404)	Top-1 acc 34.375 (36.699)	Top-5 acc 56.641 (60.704)	lr 0.02457
Train [11][190/3239]	Time 0.561 (0.935)	Data Time 0.001 (0.099)	Loss 3.7633 (3.7176)	Entropy 1.48299 (1.48397)	Top-1 acc 35.547 (36.694)	Top-5 acc 58.203 (60.692)	lr 0.02457
Train [11][200/3239]	Time 0.554 (0.930)	Data Time 0.001 (0.094)	Loss 3.8751 (3.7176)	Entropy 1.48281 (1.48392)	Top-1 acc 31.641 (36.697)	Top-5 acc 53.906 (60.714)	lr 0.02457
Train [11][210/3239]	Time 0.568 (0.926)	Data Time 0.001 (0.090)	Loss 3.9074 (3.7187)	Entropy 1.48286 (1.48387)	Top-1 acc 32.812 (36.709)	Top-5 acc 57.031 (60.680)	lr 0.02457
Train [11][220/3239]	Time 0.642 (0.920)	Data Time 0.002 (0.086)	Loss 3.4873 (3.7174)	Entropy 1.48248 (1.48382)	Top-1 acc 41.406 (36.721)	Top-5 acc 62.891 (60.671)	lr 0.02457
Train [11][230/3239]	Time 0.462 (0.915)	Data Time 0.001 (0.082)	Loss 3.7755 (3.7174)	Entropy 1.48215 (1.48376)	Top-1 acc 33.984 (36.707)	Top-5 acc 57.812 (60.697)	lr 0.02457
Train [11][240/3239]	Time 0.456 (0.909)	Data Time 0.001 (0.079)	Loss 3.8182 (3.7197)	Entropy 1.48225 (1.48369)	Top-1 acc 35.938 (36.657)	Top-5 acc 59.375 (60.696)	lr 0.02457
Train [11][250/3239]	Time 0.578 (0.905)	Data Time 0.001 (0.077)	Loss 3.8441 (3.7226)	Entropy 1.48226 (1.48363)	Top-1 acc 35.547 (36.586)	Top-5 acc 58.984 (60.632)	lr 0.02457
Train [11][260/3239]	Time 0.510 (0.901)	Data Time 0.001 (0.074)	Loss 3.7779 (3.7249)	Entropy 1.48189 (1.48358)	Top-1 acc 39.844 (36.580)	Top-5 acc 61.328 (60.560)	lr 0.02457
Train [11][270/3239]	Time 0.605 (0.899)	Data Time 0.001 (0.071)	Loss 3.6774 (3.7247)	Entropy 1.48185 (1.48351)	Top-1 acc 32.812 (36.566)	Top-5 acc 58.984 (60.570)	lr 0.02457
Train [11][280/3239]	Time 0.589 (0.897)	Data Time 0.001 (0.069)	Loss 3.7436 (3.7227)	Entropy 1.48181 (1.48345)	Top-1 acc 38.672 (36.578)	Top-5 acc 62.109 (60.628)	lr 0.02457
Train [11][290/3239]	Time 0.613 (0.894)	Data Time 0.001 (0.066)	Loss 3.7109 (3.7242)	Entropy 1.48166 (1.48340)	Top-1 acc 35.547 (36.555)	Top-5 acc 59.766 (60.556)	lr 0.02457
Train [11][300/3239]	Time 0.577 (0.892)	Data Time 0.002 (0.064)	Loss 3.7677 (3.7250)	Entropy 1.48188 (1.48334)	Top-1 acc 37.500 (36.521)	Top-5 acc 59.375 (60.533)	lr 0.02457
Train [11][310/3239]	Time 0.629 (0.890)	Data Time 0.001 (0.062)	Loss 3.5698 (3.7246)	Entropy 1.48195 (1.48330)	Top-1 acc 40.234 (36.534)	Top-5 acc 64.453 (60.552)	lr 0.02457
Train [11][320/3239]	Time 0.780 (0.946)	Data Time 0.006 (0.060)	Loss 3.6393 (3.7238)	Entropy 1.48183 (1.48325)	Top-1 acc 40.625 (36.540)	Top-5 acc 60.938 (60.574)	lr 0.02457
Train [11][330/3239]	Time 0.628 (0.944)	Data Time 0.002 (0.059)	Loss 3.3949 (3.7229)	Entropy 1.48139 (1.48320)	Top-1 acc 44.531 (36.590)	Top-5 acc 66.016 (60.592)	lr 0.02457
Train [11][340/3239]	Time 0.570 (0.941)	Data Time 0.001 (0.057)	Loss 3.6568 (3.7222)	Entropy 1.48092 (1.48315)	Top-1 acc 36.719 (36.612)	Top-5 acc 62.109 (60.606)	lr 0.02457
Train [11][350/3239]	Time 0.598 (0.937)	Data Time 0.001 (0.055)	Loss 3.6059 (3.7218)	Entropy 1.48096 (1.48309)	Top-1 acc 37.109 (36.603)	Top-5 acc 63.281 (60.588)	lr 0.02456
Train [11][360/3239]	Time 0.564 (0.934)	Data Time 0.002 (0.054)	Loss 3.7640 (3.7228)	Entropy 1.48061 (1.48302)	Top-1 acc 32.422 (36.565)	Top-5 acc 59.766 (60.539)	lr 0.02456
Train [11][370/3239]	Time 0.589 (0.930)	Data Time 0.003 (0.053)	Loss 3.6994 (3.7217)	Entropy 1.48030 (1.48296)	Top-1 acc 39.453 (36.563)	Top-5 acc 58.203 (60.567)	lr 0.02456
Train [11][380/3239]	Time 0.681 (0.926)	Data Time 0.003 (0.051)	Loss 3.8735 (3.7227)	Entropy 1.48048 (1.48289)	Top-1 acc 35.547 (36.555)	Top-5 acc 56.641 (60.534)	lr 0.02456
Train [11][390/3239]	Time 0.593 (0.924)	Data Time 0.001 (0.050)	Loss 3.8115 (3.7221)	Entropy 1.48073 (1.48283)	Top-1 acc 34.766 (36.563)	Top-5 acc 58.203 (60.534)	lr 0.02456
Train [11][400/3239]	Time 0.540 (0.922)	Data Time 0.001 (0.049)	Loss 3.7700 (3.7213)	Entropy 1.48067 (1.48278)	Top-1 acc 35.156 (36.613)	Top-5 acc 63.672 (60.551)	lr 0.02456
Train [11][410/3239]	Time 0.544 (0.919)	Data Time 0.003 (0.048)	Loss 3.7079 (3.7210)	Entropy 1.48038 (1.48272)	Top-1 acc 32.812 (36.600)	Top-5 acc 61.719 (60.567)	lr 0.02456
Train [11][420/3239]	Time 0.591 (0.917)	Data Time 0.001 (0.047)	Loss 3.5579 (3.7199)	Entropy 1.48034 (1.48267)	Top-1 acc 39.062 (36.638)	Top-5 acc 62.500 (60.582)	lr 0.02456
Train [11][430/3239]	Time 0.574 (0.915)	Data Time 0.001 (0.046)	Loss 3.7238 (3.7200)	Entropy 1.48017 (1.48261)	Top-1 acc 39.453 (36.621)	Top-5 acc 61.719 (60.573)	lr 0.02456
Train [11][440/3239]	Time 0.573 (0.913)	Data Time 0.001 (0.045)	Loss 3.9033 (3.7191)	Entropy 1.48026 (1.48256)	Top-1 acc 35.938 (36.636)	Top-5 acc 60.938 (60.636)	lr 0.02456
Train [11][450/3239]	Time 0.652 (0.911)	Data Time 0.001 (0.044)	Loss 3.5555 (3.7178)	Entropy 1.48034 (1.48251)	Top-1 acc 37.109 (36.670)	Top-5 acc 64.453 (60.652)	lr 0.02456
Train [11][460/3239]	Time 0.559 (0.909)	Data Time 0.003 (0.043)	Loss 3.8937 (3.7170)	Entropy 1.48025 (1.48246)	Top-1 acc 33.984 (36.710)	Top-5 acc 53.906 (60.666)	lr 0.02456
Train [11][470/3239]	Time 0.575 (0.907)	Data Time 0.002 (0.042)	Loss 3.8071 (3.7177)	Entropy 1.48009 (1.48241)	Top-1 acc 35.156 (36.710)	Top-5 acc 58.594 (60.630)	lr 0.02456
Train [11][480/3239]	Time 0.554 (0.906)	Data Time 0.001 (0.041)	Loss 3.7239 (3.7181)	Entropy 1.47970 (1.48236)	Top-1 acc 37.109 (36.706)	Top-5 acc 58.594 (60.628)	lr 0.02456
Train [11][490/3239]	Time 0.523 (0.904)	Data Time 0.001 (0.040)	Loss 3.7583 (3.7189)	Entropy 1.47943 (1.48231)	Top-1 acc 35.156 (36.679)	Top-5 acc 62.500 (60.604)	lr 0.02456
Train [11][500/3239]	Time 0.561 (0.902)	Data Time 0.001 (0.040)	Loss 3.9279 (3.7194)	Entropy 1.47918 (1.48225)	Top-1 acc 33.594 (36.655)	Top-5 acc 54.688 (60.578)	lr 0.02456
Train [11][510/3239]	Time 0.581 (0.901)	Data Time 0.001 (0.039)	Loss 4.0798 (3.7214)	Entropy 1.47912 (1.48219)	Top-1 acc 30.469 (36.581)	Top-5 acc 53.125 (60.537)	lr 0.02456
Train [11][520/3239]	Time 0.667 (0.899)	Data Time 0.003 (0.038)	Loss 3.4909 (3.7215)	Entropy 1.47897 (1.48212)	Top-1 acc 40.234 (36.597)	Top-5 acc 65.234 (60.526)	lr 0.02456
Train [11][530/3239]	Time 0.585 (0.898)	Data Time 0.003 (0.038)	Loss 3.5251 (3.7212)	Entropy 1.47930 (1.48207)	Top-1 acc 40.625 (36.579)	Top-5 acc 65.625 (60.537)	lr 0.02456
Train [11][540/3239]	Time 0.566 (0.896)	Data Time 0.002 (0.037)	Loss 3.6768 (3.7217)	Entropy 1.47914 (1.48201)	Top-1 acc 34.766 (36.554)	Top-5 acc 59.375 (60.543)	lr 0.02456
Train [11][550/3239]	Time 0.490 (0.894)	Data Time 0.001 (0.036)	Loss 3.4724 (3.7218)	Entropy 1.47909 (1.48196)	Top-1 acc 41.797 (36.542)	Top-5 acc 65.234 (60.526)	lr 0.02456
Train [11][560/3239]	Time 0.609 (0.893)	Data Time 0.001 (0.036)	Loss 3.6524 (3.7220)	Entropy 1.47870 (1.48191)	Top-1 acc 41.406 (36.546)	Top-5 acc 65.234 (60.519)	lr 0.02456
Train [11][570/3239]	Time 0.587 (0.891)	Data Time 0.003 (0.035)	Loss 3.8496 (3.7218)	Entropy 1.47889 (1.48186)	Top-1 acc 33.984 (36.540)	Top-5 acc 58.594 (60.531)	lr 0.02456
Train [11][580/3239]	Time 0.606 (0.890)	Data Time 0.001 (0.034)	Loss 3.7504 (3.7216)	Entropy 1.47872 (1.48180)	Top-1 acc 37.500 (36.525)	Top-5 acc 60.156 (60.537)	lr 0.02456
Train [11][590/3239]	Time 0.685 (0.889)	Data Time 0.001 (0.034)	Loss 3.7955 (3.7209)	Entropy 1.47862 (1.48175)	Top-1 acc 32.812 (36.536)	Top-5 acc 55.859 (60.553)	lr 0.02456
Train [11][600/3239]	Time 0.608 (0.888)	Data Time 0.001 (0.033)	Loss 3.6152 (3.7202)	Entropy 1.47846 (1.48170)	Top-1 acc 38.672 (36.551)	Top-5 acc 63.281 (60.567)	lr 0.02456
Train [11][610/3239]	Time 0.562 (0.887)	Data Time 0.001 (0.033)	Loss 3.8184 (3.7208)	Entropy 1.47820 (1.48165)	Top-1 acc 36.328 (36.537)	Top-5 acc 58.594 (60.551)	lr 0.02456
Train [11][620/3239]	Time 0.572 (0.886)	Data Time 0.002 (0.032)	Loss 3.5987 (3.7198)	Entropy 1.47775 (1.48159)	Top-1 acc 42.578 (36.556)	Top-5 acc 64.062 (60.571)	lr 0.02456
Train [11][630/3239]	Time 0.552 (0.885)	Data Time 0.001 (0.032)	Loss 3.9118 (3.7207)	Entropy 1.47745 (1.48153)	Top-1 acc 30.469 (36.534)	Top-5 acc 53.906 (60.527)	lr 0.02456
Train [11][640/3239]	Time 0.611 (0.884)	Data Time 0.001 (0.031)	Loss 3.7316 (3.7204)	Entropy 1.47706 (1.48146)	Top-1 acc 35.938 (36.539)	Top-5 acc 60.156 (60.533)	lr 0.02456
Train [11][650/3239]	Time 0.591 (0.883)	Data Time 0.001 (0.031)	Loss 3.8081 (3.7201)	Entropy 1.47696 (1.48139)	Top-1 acc 37.500 (36.545)	Top-5 acc 58.203 (60.544)	lr 0.02456
Train [11][660/3239]	Time 0.683 (0.883)	Data Time 0.001 (0.031)	Loss 3.9331 (3.7213)	Entropy 1.47679 (1.48133)	Top-1 acc 33.203 (36.533)	Top-5 acc 58.594 (60.517)	lr 0.02456
Train [11][670/3239]	Time 0.549 (0.882)	Data Time 0.001 (0.030)	Loss 3.5591 (3.7211)	Entropy 1.47694 (1.48126)	Top-1 acc 38.672 (36.540)	Top-5 acc 64.844 (60.520)	lr 0.02456
Train [11][680/3239]	Time 0.562 (0.881)	Data Time 0.001 (0.030)	Loss 3.9667 (3.7214)	Entropy 1.47672 (1.48119)	Top-1 acc 31.641 (36.531)	Top-5 acc 56.641 (60.504)	lr 0.02456
Train [11][690/3239]	Time 0.585 (0.880)	Data Time 0.001 (0.029)	Loss 3.9155 (3.7216)	Entropy 1.47637 (1.48113)	Top-1 acc 36.328 (36.520)	Top-5 acc 58.594 (60.500)	lr 0.02456
Train [11][700/3239]	Time 0.605 (0.879)	Data Time 0.001 (0.029)	Loss 3.6430 (3.7211)	Entropy 1.47638 (1.48106)	Top-1 acc 34.766 (36.516)	Top-5 acc 62.109 (60.515)	lr 0.02456
Train [11][710/3239]	Time 0.600 (0.878)	Data Time 0.001 (0.029)	Loss 3.6193 (3.7198)	Entropy 1.47605 (1.48099)	Top-1 acc 33.203 (36.541)	Top-5 acc 64.062 (60.550)	lr 0.02456
Train [11][720/3239]	Time 0.567 (0.877)	Data Time 0.003 (0.028)	Loss 3.6367 (3.7200)	Entropy 1.47592 (1.48092)	Top-1 acc 42.969 (36.520)	Top-5 acc 60.547 (60.544)	lr 0.02456
Train [11][730/3239]	Time 0.616 (0.876)	Data Time 0.002 (0.028)	Loss 3.7616 (3.7205)	Entropy 1.47577 (1.48086)	Top-1 acc 37.891 (36.531)	Top-5 acc 58.203 (60.536)	lr 0.02455
Train [11][740/3239]	Time 0.569 (0.875)	Data Time 0.001 (0.027)	Loss 3.6693 (3.7201)	Entropy 1.47538 (1.48078)	Top-1 acc 38.281 (36.552)	Top-5 acc 64.844 (60.544)	lr 0.02455
Train [11][750/3239]	Time 0.646 (0.875)	Data Time 0.001 (0.027)	Loss 3.7061 (3.7206)	Entropy 1.47531 (1.48071)	Top-1 acc 33.594 (36.540)	Top-5 acc 64.453 (60.550)	lr 0.02455
Train [11][760/3239]	Time 0.541 (0.874)	Data Time 0.001 (0.027)	Loss 3.7587 (3.7207)	Entropy 1.47502 (1.48064)	Top-1 acc 41.797 (36.548)	Top-5 acc 58.203 (60.543)	lr 0.02455
Train [11][770/3239]	Time 0.598 (0.873)	Data Time 0.001 (0.026)	Loss 3.7057 (3.7212)	Entropy 1.47481 (1.48057)	Top-1 acc 34.375 (36.536)	Top-5 acc 60.938 (60.523)	lr 0.02455
Train [11][780/3239]	Time 0.571 (0.872)	Data Time 0.001 (0.026)	Loss 3.4722 (3.7200)	Entropy 1.47429 (1.48049)	Top-1 acc 40.234 (36.541)	Top-5 acc 65.234 (60.554)	lr 0.02455
Train [11][790/3239]	Time 0.570 (0.872)	Data Time 0.002 (0.026)	Loss 3.7659 (3.7204)	Entropy 1.47402 (1.48041)	Top-1 acc 34.766 (36.547)	Top-5 acc 55.078 (60.545)	lr 0.02455
Train [11][800/3239]	Time 0.556 (0.871)	Data Time 0.001 (0.026)	Loss 3.7820 (3.7206)	Entropy 1.47384 (1.48033)	Top-1 acc 35.547 (36.538)	Top-5 acc 57.031 (60.530)	lr 0.02455
Train [11][810/3239]	Time 0.566 (0.871)	Data Time 0.001 (0.025)	Loss 3.7275 (3.7214)	Entropy 1.47368 (1.48025)	Top-1 acc 34.375 (36.520)	Top-5 acc 60.156 (60.520)	lr 0.02455
Train [11][820/3239]	Time 0.682 (0.870)	Data Time 0.001 (0.025)	Loss 3.7335 (3.7211)	Entropy 1.47333 (1.48017)	Top-1 acc 35.547 (36.518)	Top-5 acc 59.766 (60.519)	lr 0.02455
Train [11][830/3239]	Time 0.576 (0.870)	Data Time 0.001 (0.025)	Loss 3.6758 (3.7209)	Entropy 1.47315 (1.48008)	Top-1 acc 37.109 (36.520)	Top-5 acc 59.375 (60.532)	lr 0.02455
Train [11][840/3239]	Time 0.610 (0.869)	Data Time 0.001 (0.024)	Loss 3.6447 (3.7209)	Entropy 1.47292 (1.48000)	Top-1 acc 38.281 (36.530)	Top-5 acc 64.844 (60.530)	lr 0.02455
Train [11][850/3239]	Time 0.562 (0.869)	Data Time 0.001 (0.024)	Loss 3.6840 (3.7207)	Entropy 1.47268 (1.47992)	Top-1 acc 37.500 (36.545)	Top-5 acc 62.891 (60.536)	lr 0.02455
Train [11][860/3239]	Time 0.574 (0.868)	Data Time 0.001 (0.024)	Loss 3.5157 (3.7198)	Entropy 1.47259 (1.47983)	Top-1 acc 40.625 (36.559)	Top-5 acc 66.406 (60.571)	lr 0.02455
Train [11][870/3239]	Time 0.559 (0.868)	Data Time 0.001 (0.024)	Loss 3.5266 (3.7194)	Entropy 1.47203 (1.47975)	Top-1 acc 37.109 (36.573)	Top-5 acc 65.625 (60.568)	lr 0.02455
Train [11][880/3239]	Time 0.407 (0.867)	Data Time 0.001 (0.023)	Loss 3.7325 (3.7193)	Entropy 1.47192 (1.47966)	Top-1 acc 38.672 (36.570)	Top-5 acc 60.547 (60.571)	lr 0.02455
Train [11][890/3239]	Time 0.698 (0.867)	Data Time 0.001 (0.023)	Loss 3.4528 (3.7186)	Entropy 1.47200 (1.47957)	Top-1 acc 43.359 (36.580)	Top-5 acc 64.453 (60.581)	lr 0.02455
Train [11][900/3239]	Time 0.438 (0.866)	Data Time 0.001 (0.023)	Loss 3.6425 (3.7180)	Entropy 1.47229 (1.47949)	Top-1 acc 37.500 (36.588)	Top-5 acc 63.281 (60.598)	lr 0.02455
Train [11][910/3239]	Time 0.598 (0.866)	Data Time 0.001 (0.023)	Loss 3.6522 (3.7172)	Entropy 1.47192 (1.47941)	Top-1 acc 37.109 (36.600)	Top-5 acc 62.891 (60.623)	lr 0.02455
Train [11][920/3239]	Time 0.602 (0.865)	Data Time 0.002 (0.023)	Loss 3.9129 (3.7172)	Entropy 1.47183 (1.47933)	Top-1 acc 35.547 (36.600)	Top-5 acc 57.812 (60.621)	lr 0.02455
Train [11][930/3239]	Time 0.585 (0.865)	Data Time 0.001 (0.022)	Loss 3.7437 (3.7170)	Entropy 1.47143 (1.47925)	Top-1 acc 35.938 (36.605)	Top-5 acc 61.328 (60.621)	lr 0.02455
Train [11][940/3239]	Time 0.557 (0.865)	Data Time 0.001 (0.022)	Loss 3.7093 (3.7168)	Entropy 1.47112 (1.47916)	Top-1 acc 36.328 (36.611)	Top-5 acc 58.984 (60.633)	lr 0.02455
Train [11][950/3239]	Time 0.573 (0.864)	Data Time 0.001 (0.022)	Loss 3.6682 (3.7167)	Entropy 1.47054 (1.47908)	Top-1 acc 37.891 (36.606)	Top-5 acc 62.891 (60.641)	lr 0.02455
Train [11][960/3239]	Time 0.724 (0.864)	Data Time 0.001 (0.022)	Loss 3.7798 (3.7167)	Entropy 1.47000 (1.47899)	Top-1 acc 35.156 (36.608)	Top-5 acc 57.031 (60.645)	lr 0.02455
Train [11][970/3239]	Time 0.605 (0.863)	Data Time 0.002 (0.022)	Loss 3.5980 (3.7167)	Entropy 1.46979 (1.47889)	Top-1 acc 39.062 (36.600)	Top-5 acc 65.234 (60.644)	lr 0.02455
Train [11][980/3239]	Time 0.594 (0.882)	Data Time 0.002 (0.021)	Loss 3.6018 (3.7170)	Entropy 1.46944 (1.47880)	Top-1 acc 37.891 (36.589)	Top-5 acc 64.844 (60.643)	lr 0.02455
Train [11][990/3239]	Time 0.574 (0.882)	Data Time 0.002 (0.021)	Loss 3.7439 (3.7167)	Entropy 1.46919 (1.47870)	Top-1 acc 37.500 (36.597)	Top-5 acc 57.812 (60.657)	lr 0.02455
Train [11][1000/3239]	Time 0.598 (0.881)	Data Time 0.001 (0.021)	Loss 3.8137 (3.7165)	Entropy 1.46911 (1.47861)	Top-1 acc 35.547 (36.604)	Top-5 acc 58.203 (60.651)	lr 0.02455
Train [11][1010/3239]	Time 0.619 (0.880)	Data Time 0.002 (0.021)	Loss 3.6304 (3.7164)	Entropy 1.46906 (1.47852)	Top-1 acc 37.109 (36.605)	Top-5 acc 62.891 (60.662)	lr 0.02455
Train [11][1020/3239]	Time 0.552 (0.880)	Data Time 0.001 (0.021)	Loss 3.8221 (3.7167)	Entropy 1.46867 (1.47842)	Top-1 acc 33.984 (36.602)	Top-5 acc 57.812 (60.661)	lr 0.02455
Train [11][1030/3239]	Time 0.662 (0.879)	Data Time 0.001 (0.020)	Loss 3.9308 (3.7165)	Entropy 1.46878 (1.47833)	Top-1 acc 37.500 (36.615)	Top-5 acc 55.078 (60.666)	lr 0.02455
Train [11][1040/3239]	Time 0.572 (0.878)	Data Time 0.003 (0.020)	Loss 3.7980 (3.7167)	Entropy 1.46853 (1.47823)	Top-1 acc 36.719 (36.614)	Top-5 acc 60.938 (60.671)	lr 0.02455
Train [11][1050/3239]	Time 0.518 (0.878)	Data Time 0.001 (0.020)	Loss 3.7616 (3.7172)	Entropy 1.46830 (1.47814)	Top-1 acc 36.719 (36.596)	Top-5 acc 60.547 (60.654)	lr 0.02455
Train [11][1060/3239]	Time 0.578 (0.877)	Data Time 0.001 (0.020)	Loss 3.6152 (3.7171)	Entropy 1.46840 (1.47805)	Top-1 acc 39.453 (36.601)	Top-5 acc 64.062 (60.663)	lr 0.02455
Train [11][1070/3239]	Time 0.607 (0.877)	Data Time 0.001 (0.020)	Loss 3.7326 (3.7174)	Entropy 1.46821 (1.47796)	Top-1 acc 39.453 (36.611)	Top-5 acc 63.281 (60.664)	lr 0.02455
Train [11][1080/3239]	Time 0.539 (0.876)	Data Time 0.001 (0.020)	Loss 3.7753 (3.7176)	Entropy 1.46827 (1.47787)	Top-1 acc 37.891 (36.611)	Top-5 acc 60.547 (60.664)	lr 0.02455
Train [11][1090/3239]	Time 0.580 (0.876)	Data Time 0.001 (0.019)	Loss 3.7329 (3.7179)	Entropy 1.46836 (1.47778)	Top-1 acc 35.156 (36.593)	Top-5 acc 60.156 (60.652)	lr 0.02455
Train [11][1100/3239]	Time 0.666 (0.876)	Data Time 0.001 (0.019)	Loss 3.7022 (3.7178)	Entropy 1.46803 (1.47769)	Top-1 acc 38.672 (36.591)	Top-5 acc 58.984 (60.655)	lr 0.02454
Train [11][1110/3239]	Time 0.516 (0.875)	Data Time 0.002 (0.019)	Loss 4.0591 (3.7184)	Entropy 1.46793 (1.47761)	Top-1 acc 32.422 (36.581)	Top-5 acc 51.953 (60.642)	lr 0.02454
Train [11][1120/3239]	Time 0.616 (0.875)	Data Time 0.001 (0.019)	Loss 3.5526 (3.7179)	Entropy 1.46778 (1.47752)	Top-1 acc 37.500 (36.593)	Top-5 acc 63.672 (60.651)	lr 0.02454
Train [11][1130/3239]	Time 0.575 (0.874)	Data Time 0.001 (0.019)	Loss 3.6237 (3.7179)	Entropy 1.46762 (1.47743)	Top-1 acc 39.844 (36.586)	Top-5 acc 62.109 (60.645)	lr 0.02454
Train [11][1140/3239]	Time 0.524 (0.874)	Data Time 0.001 (0.019)	Loss 3.8898 (3.7184)	Entropy 1.46737 (1.47735)	Top-1 acc 34.766 (36.577)	Top-5 acc 59.375 (60.644)	lr 0.02454
Train [11][1150/3239]	Time 0.590 (0.874)	Data Time 0.001 (0.019)	Loss 3.7774 (3.7175)	Entropy 1.46697 (1.47726)	Top-1 acc 32.422 (36.594)	Top-5 acc 58.203 (60.659)	lr 0.02454
Train [11][1160/3239]	Time 0.572 (0.873)	Data Time 0.001 (0.018)	Loss 3.4620 (3.7170)	Entropy 1.46694 (1.47717)	Top-1 acc 40.625 (36.602)	Top-5 acc 67.578 (60.674)	lr 0.02454
Train [11][1170/3239]	Time 0.698 (0.873)	Data Time 0.001 (0.018)	Loss 3.6546 (3.7167)	Entropy 1.46679 (1.47708)	Top-1 acc 36.719 (36.611)	Top-5 acc 60.547 (60.678)	lr 0.02454
Train [11][1180/3239]	Time 0.561 (0.873)	Data Time 0.002 (0.018)	Loss 3.6302 (3.7163)	Entropy 1.46679 (1.47700)	Top-1 acc 35.156 (36.612)	Top-5 acc 62.500 (60.685)	lr 0.02454
Train [11][1190/3239]	Time 0.582 (0.872)	Data Time 0.001 (0.018)	Loss 3.7994 (3.7157)	Entropy 1.46641 (1.47691)	Top-1 acc 37.500 (36.627)	Top-5 acc 61.719 (60.695)	lr 0.02454
Train [11][1200/3239]	Time 0.568 (0.872)	Data Time 0.001 (0.018)	Loss 3.6596 (3.7157)	Entropy 1.46587 (1.47682)	Top-1 acc 37.891 (36.633)	Top-5 acc 59.766 (60.698)	lr 0.02454
Train [11][1210/3239]	Time 0.602 (0.871)	Data Time 0.001 (0.018)	Loss 3.6427 (3.7154)	Entropy 1.46553 (1.47673)	Top-1 acc 37.891 (36.647)	Top-5 acc 63.281 (60.706)	lr 0.02454
Train [11][1220/3239]	Time 0.605 (0.871)	Data Time 0.001 (0.018)	Loss 3.7513 (3.7155)	Entropy 1.46540 (1.47664)	Top-1 acc 33.594 (36.632)	Top-5 acc 58.594 (60.701)	lr 0.02454
Train [11][1230/3239]	Time 0.572 (0.871)	Data Time 0.001 (0.017)	Loss 3.6471 (3.7154)	Entropy 1.46508 (1.47655)	Top-1 acc 41.016 (36.635)	Top-5 acc 62.500 (60.701)	lr 0.02454
Train [11][1240/3239]	Time 0.612 (0.870)	Data Time 0.001 (0.017)	Loss 3.7944 (3.7154)	Entropy 1.46489 (1.47645)	Top-1 acc 34.375 (36.633)	Top-5 acc 59.375 (60.695)	lr 0.02454
Train [11][1250/3239]	Time 0.624 (0.870)	Data Time 0.001 (0.017)	Loss 3.7075 (3.7153)	Entropy 1.46462 (1.47636)	Top-1 acc 36.328 (36.631)	Top-5 acc 61.719 (60.703)	lr 0.02454
Train [11][1260/3239]	Time 0.661 (0.870)	Data Time 0.002 (0.017)	Loss 3.6719 (3.7152)	Entropy 1.46438 (1.47626)	Top-1 acc 33.594 (36.627)	Top-5 acc 60.547 (60.709)	lr 0.02454
Train [11][1270/3239]	Time 0.585 (0.870)	Data Time 0.001 (0.017)	Loss 3.5893 (3.7151)	Entropy 1.46434 (1.47617)	Top-1 acc 44.141 (36.632)	Top-5 acc 63.672 (60.708)	lr 0.02454
Train [11][1280/3239]	Time 0.579 (0.869)	Data Time 0.001 (0.017)	Loss 3.5859 (3.7155)	Entropy 1.46406 (1.47608)	Top-1 acc 37.500 (36.626)	Top-5 acc 62.891 (60.698)	lr 0.02454
Train [11][1290/3239]	Time 0.563 (0.869)	Data Time 0.001 (0.017)	Loss 3.9020 (3.7157)	Entropy 1.46402 (1.47598)	Top-1 acc 33.203 (36.608)	Top-5 acc 57.031 (60.705)	lr 0.02454
Train [11][1300/3239]	Time 0.578 (0.869)	Data Time 0.001 (0.017)	Loss 3.6931 (3.7154)	Entropy 1.46404 (1.47589)	Top-1 acc 39.453 (36.614)	Top-5 acc 62.109 (60.716)	lr 0.02454
Train [11][1310/3239]	Time 0.623 (0.869)	Data Time 0.001 (0.017)	Loss 3.7096 (3.7157)	Entropy 1.46391 (1.47580)	Top-1 acc 33.594 (36.609)	Top-5 acc 59.375 (60.705)	lr 0.02454
Train [11][1320/3239]	Time 0.582 (0.868)	Data Time 0.001 (0.017)	Loss 3.7618 (3.7157)	Entropy 1.46361 (1.47571)	Top-1 acc 37.891 (36.612)	Top-5 acc 59.375 (60.709)	lr 0.02454
Train [11][1330/3239]	Time 0.683 (0.868)	Data Time 0.002 (0.016)	Loss 3.7738 (3.7158)	Entropy 1.46362 (1.47562)	Top-1 acc 35.938 (36.614)	Top-5 acc 60.547 (60.709)	lr 0.02454
Train [11][1340/3239]	Time 0.581 (0.868)	Data Time 0.001 (0.016)	Loss 3.7103 (3.7161)	Entropy 1.46343 (1.47553)	Top-1 acc 35.938 (36.607)	Top-5 acc 63.281 (60.706)	lr 0.02454
Train [11][1350/3239]	Time 0.582 (0.867)	Data Time 0.001 (0.016)	Loss 3.8088 (3.7161)	Entropy 1.46343 (1.47544)	Top-1 acc 35.156 (36.604)	Top-5 acc 58.203 (60.703)	lr 0.02454
Train [11][1360/3239]	Time 0.619 (0.867)	Data Time 0.001 (0.016)	Loss 3.6407 (3.7159)	Entropy 1.46315 (1.47535)	Top-1 acc 37.109 (36.613)	Top-5 acc 61.328 (60.705)	lr 0.02454
Train [11][1370/3239]	Time 0.578 (0.867)	Data Time 0.001 (0.016)	Loss 3.5284 (3.7158)	Entropy 1.46305 (1.47526)	Top-1 acc 42.578 (36.614)	Top-5 acc 66.016 (60.709)	lr 0.02454
Train [11][1380/3239]	Time 0.586 (0.866)	Data Time 0.001 (0.016)	Loss 3.5420 (3.7157)	Entropy 1.46261 (1.47517)	Top-1 acc 38.672 (36.614)	Top-5 acc 63.281 (60.710)	lr 0.02454
Train [11][1390/3239]	Time 0.564 (0.866)	Data Time 0.001 (0.016)	Loss 3.6512 (3.7162)	Entropy 1.46232 (1.47508)	Top-1 acc 37.891 (36.609)	Top-5 acc 60.156 (60.705)	lr 0.02454
Train [11][1400/3239]	Time 0.720 (0.865)	Data Time 0.001 (0.016)	Loss 3.6038 (3.7160)	Entropy 1.46197 (1.47499)	Top-1 acc 38.281 (36.607)	Top-5 acc 62.109 (60.705)	lr 0.02454
Train [11][1410/3239]	Time 0.591 (0.865)	Data Time 0.001 (0.016)	Loss 3.5381 (3.7159)	Entropy 1.46169 (1.47490)	Top-1 acc 40.234 (36.610)	Top-5 acc 63.672 (60.703)	lr 0.02454
Train [11][1420/3239]	Time 0.596 (0.865)	Data Time 0.001 (0.015)	Loss 3.7859 (3.7161)	Entropy 1.46171 (1.47481)	Top-1 acc 33.203 (36.611)	Top-5 acc 62.109 (60.697)	lr 0.02454
Train [11][1430/3239]	Time 0.566 (0.865)	Data Time 0.001 (0.015)	Loss 3.7943 (3.7162)	Entropy 1.46144 (1.47471)	Top-1 acc 36.328 (36.610)	Top-5 acc 58.594 (60.690)	lr 0.02454
Train [11][1440/3239]	Time 0.549 (0.864)	Data Time 0.002 (0.015)	Loss 3.6641 (3.7163)	Entropy 1.46115 (1.47462)	Top-1 acc 39.844 (36.608)	Top-5 acc 62.109 (60.695)	lr 0.02454
Train [11][1450/3239]	Time 0.561 (0.864)	Data Time 0.001 (0.015)	Loss 3.8526 (3.7166)	Entropy 1.46098 (1.47453)	Top-1 acc 30.859 (36.599)	Top-5 acc 57.422 (60.693)	lr 0.02454
Train [11][1460/3239]	Time 0.593 (0.863)	Data Time 0.001 (0.015)	Loss 3.7259 (3.7165)	Entropy 1.46060 (1.47443)	Top-1 acc 35.938 (36.604)	Top-5 acc 59.766 (60.701)	lr 0.02454
Train [11][1470/3239]	Time 0.693 (0.863)	Data Time 0.001 (0.015)	Loss 3.8617 (3.7162)	Entropy 1.46049 (1.47434)	Top-1 acc 33.203 (36.601)	Top-5 acc 57.812 (60.706)	lr 0.02453
Train [11][1480/3239]	Time 0.598 (0.863)	Data Time 0.001 (0.015)	Loss 3.6107 (3.7162)	Entropy 1.46021 (1.47425)	Top-1 acc 36.328 (36.602)	Top-5 acc 60.156 (60.705)	lr 0.02453
Train [11][1490/3239]	Time 0.608 (0.863)	Data Time 0.001 (0.015)	Loss 3.4818 (3.7158)	Entropy 1.45990 (1.47415)	Top-1 acc 41.797 (36.612)	Top-5 acc 66.016 (60.713)	lr 0.02453
Train [11][1500/3239]	Time 0.618 (0.863)	Data Time 0.001 (0.015)	Loss 3.7529 (3.7157)	Entropy 1.45987 (1.47405)	Top-1 acc 36.328 (36.614)	Top-5 acc 60.938 (60.720)	lr 0.02453
Train [11][1510/3239]	Time 0.601 (0.863)	Data Time 0.001 (0.015)	Loss 3.7901 (3.7159)	Entropy 1.45966 (1.47396)	Top-1 acc 37.500 (36.609)	Top-5 acc 58.594 (60.711)	lr 0.02453
Train [11][1520/3239]	Time 0.565 (0.862)	Data Time 0.001 (0.015)	Loss 3.9247 (3.7161)	Entropy 1.45930 (1.47387)	Top-1 acc 35.938 (36.610)	Top-5 acc 54.297 (60.709)	lr 0.02453
Train [11][1530/3239]	Time 0.526 (0.862)	Data Time 0.001 (0.014)	Loss 3.5114 (3.7157)	Entropy 1.45900 (1.47377)	Top-1 acc 39.844 (36.611)	Top-5 acc 65.625 (60.717)	lr 0.02453
Train [11][1540/3239]	Time 0.651 (0.862)	Data Time 0.001 (0.014)	Loss 3.7247 (3.7159)	Entropy 1.45891 (1.47367)	Top-1 acc 36.719 (36.611)	Top-5 acc 59.375 (60.713)	lr 0.02453
Train [11][1550/3239]	Time 0.601 (0.861)	Data Time 0.001 (0.014)	Loss 3.8037 (3.7161)	Entropy 1.45879 (1.47358)	Top-1 acc 31.641 (36.606)	Top-5 acc 58.594 (60.706)	lr 0.02453
Train [11][1560/3239]	Time 0.558 (0.861)	Data Time 0.001 (0.014)	Loss 3.5410 (3.7157)	Entropy 1.45834 (1.47348)	Top-1 acc 39.062 (36.607)	Top-5 acc 65.234 (60.715)	lr 0.02453
Train [11][1570/3239]	Time 0.569 (0.861)	Data Time 0.001 (0.014)	Loss 3.6470 (3.7155)	Entropy 1.45799 (1.47339)	Top-1 acc 41.406 (36.612)	Top-5 acc 62.500 (60.713)	lr 0.02453
Train [11][1580/3239]	Time 0.598 (0.861)	Data Time 0.001 (0.014)	Loss 3.8894 (3.7156)	Entropy 1.45740 (1.47329)	Top-1 acc 30.078 (36.607)	Top-5 acc 55.859 (60.710)	lr 0.02453
Train [11][1590/3239]	Time 0.601 (0.860)	Data Time 0.001 (0.014)	Loss 3.8045 (3.7159)	Entropy 1.45743 (1.47319)	Top-1 acc 29.688 (36.601)	Top-5 acc 60.938 (60.710)	lr 0.02453
Train [11][1600/3239]	Time 0.576 (0.860)	Data Time 0.001 (0.014)	Loss 3.7695 (3.7159)	Entropy 1.45767 (1.47309)	Top-1 acc 36.719 (36.610)	Top-5 acc 60.156 (60.707)	lr 0.02453
Train [11][1610/3239]	Time 0.678 (0.860)	Data Time 0.002 (0.014)	Loss 3.7969 (3.7161)	Entropy 1.45720 (1.47299)	Top-1 acc 36.328 (36.610)	Top-5 acc 60.547 (60.701)	lr 0.02453
Train [11][1620/3239]	Time 0.551 (0.860)	Data Time 0.001 (0.014)	Loss 3.6475 (3.7161)	Entropy 1.45721 (1.47290)	Top-1 acc 38.281 (36.608)	Top-5 acc 61.719 (60.701)	lr 0.02453
Train [11][1630/3239]	Time 0.851 (0.871)	Data Time 0.005 (0.014)	Loss 3.5962 (3.7159)	Entropy 1.45685 (1.47280)	Top-1 acc 41.406 (36.615)	Top-5 acc 62.500 (60.701)	lr 0.02453
Train [11][1640/3239]	Time 0.548 (0.871)	Data Time 0.002 (0.014)	Loss 3.7130 (3.7155)	Entropy 1.45645 (1.47270)	Top-1 acc 38.281 (36.621)	Top-5 acc 59.375 (60.704)	lr 0.02453
Train [11][1650/3239]	Time 0.591 (0.871)	Data Time 0.002 (0.014)	Loss 3.8523 (3.7157)	Entropy 1.45628 (1.47260)	Top-1 acc 32.422 (36.619)	Top-5 acc 58.984 (60.700)	lr 0.02453
Train [11][1660/3239]	Time 0.629 (0.871)	Data Time 0.001 (0.014)	Loss 3.6441 (3.7155)	Entropy 1.45625 (1.47250)	Top-1 acc 35.938 (36.623)	Top-5 acc 63.672 (60.709)	lr 0.02453
Train [11][1670/3239]	Time 0.610 (0.870)	Data Time 0.001 (0.013)	Loss 3.8139 (3.7157)	Entropy 1.45609 (1.47241)	Top-1 acc 33.203 (36.617)	Top-5 acc 57.812 (60.707)	lr 0.02453
Train [11][1680/3239]	Time 0.595 (0.870)	Data Time 0.001 (0.013)	Loss 3.5096 (3.7158)	Entropy 1.45539 (1.47231)	Top-1 acc 43.359 (36.617)	Top-5 acc 65.234 (60.710)	lr 0.02453
Train [11][1690/3239]	Time 0.556 (0.870)	Data Time 0.001 (0.013)	Loss 3.7105 (3.7157)	Entropy 1.45535 (1.47221)	Top-1 acc 37.891 (36.614)	Top-5 acc 59.375 (60.710)	lr 0.02453
Train [11][1700/3239]	Time 0.711 (0.869)	Data Time 0.001 (0.013)	Loss 3.6755 (3.7158)	Entropy 1.45545 (1.47211)	Top-1 acc 38.672 (36.614)	Top-5 acc 62.109 (60.709)	lr 0.02453
Train [11][1710/3239]	Time 0.617 (0.869)	Data Time 0.001 (0.013)	Loss 3.4813 (3.7157)	Entropy 1.45554 (1.47201)	Top-1 acc 44.922 (36.620)	Top-5 acc 69.531 (60.721)	lr 0.02453
Train [11][1720/3239]	Time 0.572 (0.869)	Data Time 0.001 (0.013)	Loss 3.8150 (3.7157)	Entropy 1.45556 (1.47192)	Top-1 acc 32.031 (36.623)	Top-5 acc 57.812 (60.721)	lr 0.02453
Train [11][1730/3239]	Time 0.573 (0.869)	Data Time 0.001 (0.013)	Loss 3.7872 (3.7158)	Entropy 1.45539 (1.47182)	Top-1 acc 33.203 (36.619)	Top-5 acc 57.422 (60.712)	lr 0.02453
Train [11][1740/3239]	Time 0.552 (0.868)	Data Time 0.001 (0.013)	Loss 3.6579 (3.7155)	Entropy 1.45516 (1.47173)	Top-1 acc 38.281 (36.620)	Top-5 acc 64.453 (60.721)	lr 0.02453
Train [11][1750/3239]	Time 0.573 (0.868)	Data Time 0.001 (0.013)	Loss 3.6482 (3.7156)	Entropy 1.45498 (1.47163)	Top-1 acc 39.062 (36.614)	Top-5 acc 62.891 (60.721)	lr 0.02453
Train [11][1760/3239]	Time 0.591 (0.868)	Data Time 0.001 (0.013)	Loss 3.6116 (3.7160)	Entropy 1.45483 (1.47154)	Top-1 acc 41.016 (36.606)	Top-5 acc 63.672 (60.715)	lr 0.02453
Train [11][1770/3239]	Time 0.628 (0.868)	Data Time 0.001 (0.013)	Loss 3.7484 (3.7161)	Entropy 1.45456 (1.47144)	Top-1 acc 32.031 (36.606)	Top-5 acc 59.375 (60.712)	lr 0.02453
Train [11][1780/3239]	Time 0.601 (0.867)	Data Time 0.001 (0.013)	Loss 3.6594 (3.7162)	Entropy 1.45435 (1.47135)	Top-1 acc 38.281 (36.606)	Top-5 acc 64.453 (60.709)	lr 0.02453
Train [11][1790/3239]	Time 0.524 (0.867)	Data Time 0.001 (0.013)	Loss 3.7752 (3.7160)	Entropy 1.45420 (1.47125)	Top-1 acc 34.766 (36.602)	Top-5 acc 59.766 (60.709)	lr 0.02453
Train [11][1800/3239]	Time 0.584 (0.867)	Data Time 0.002 (0.013)	Loss 3.5422 (3.7160)	Entropy 1.45386 (1.47116)	Top-1 acc 38.281 (36.601)	Top-5 acc 65.625 (60.710)	lr 0.02453
Train [11][1810/3239]	Time 0.599 (0.867)	Data Time 0.001 (0.013)	Loss 3.9642 (3.7161)	Entropy 1.45350 (1.47106)	Top-1 acc 34.375 (36.601)	Top-5 acc 53.906 (60.711)	lr 0.02453
Train [11][1820/3239]	Time 0.635 (0.867)	Data Time 0.001 (0.013)	Loss 3.7725 (3.7158)	Entropy 1.45359 (1.47096)	Top-1 acc 36.719 (36.612)	Top-5 acc 60.156 (60.718)	lr 0.02453
Train [11][1830/3239]	Time 0.608 (0.866)	Data Time 0.001 (0.012)	Loss 3.8972 (3.7157)	Entropy 1.45367 (1.47087)	Top-1 acc 35.547 (36.615)	Top-5 acc 57.422 (60.721)	lr 0.02452
Train [11][1840/3239]	Time 0.613 (0.866)	Data Time 0.001 (0.012)	Loss 3.7150 (3.7159)	Entropy 1.45357 (1.47077)	Top-1 acc 33.203 (36.613)	Top-5 acc 60.156 (60.720)	lr 0.02452
Train [11][1850/3239]	Time 0.556 (0.866)	Data Time 0.002 (0.012)	Loss 3.6717 (3.7156)	Entropy 1.45357 (1.47068)	Top-1 acc 33.594 (36.618)	Top-5 acc 62.109 (60.726)	lr 0.02452
Train [11][1860/3239]	Time 0.528 (0.866)	Data Time 0.001 (0.012)	Loss 3.6542 (3.7154)	Entropy 1.45354 (1.47059)	Top-1 acc 34.375 (36.618)	Top-5 acc 64.453 (60.734)	lr 0.02452
Train [11][1870/3239]	Time 0.594 (0.865)	Data Time 0.001 (0.012)	Loss 3.8733 (3.7156)	Entropy 1.45323 (1.47050)	Top-1 acc 33.984 (36.610)	Top-5 acc 55.078 (60.730)	lr 0.02452
Train [11][1880/3239]	Time 0.568 (0.865)	Data Time 0.001 (0.012)	Loss 3.6046 (3.7153)	Entropy 1.45317 (1.47041)	Top-1 acc 40.234 (36.613)	Top-5 acc 63.672 (60.736)	lr 0.02452
Train [11][1890/3239]	Time 0.592 (0.865)	Data Time 0.001 (0.012)	Loss 3.6286 (3.7152)	Entropy 1.45273 (1.47031)	Top-1 acc 37.891 (36.612)	Top-5 acc 64.844 (60.741)	lr 0.02452
Train [11][1900/3239]	Time 0.586 (0.865)	Data Time 0.002 (0.012)	Loss 3.7702 (3.7152)	Entropy 1.45246 (1.47022)	Top-1 acc 38.281 (36.609)	Top-5 acc 57.031 (60.735)	lr 0.02452
Train [11][1910/3239]	Time 0.557 (0.864)	Data Time 0.001 (0.012)	Loss 3.7358 (3.7151)	Entropy 1.45240 (1.47013)	Top-1 acc 37.109 (36.613)	Top-5 acc 59.766 (60.736)	lr 0.02452
Train [11][1920/3239]	Time 0.600 (0.864)	Data Time 0.001 (0.012)	Loss 3.7402 (3.7150)	Entropy 1.45238 (1.47004)	Top-1 acc 32.812 (36.615)	Top-5 acc 58.594 (60.737)	lr 0.02452
Train [11][1930/3239]	Time 0.636 (0.864)	Data Time 0.001 (0.012)	Loss 3.7800 (3.7150)	Entropy 1.45218 (1.46994)	Top-1 acc 33.203 (36.611)	Top-5 acc 58.203 (60.740)	lr 0.02452
Train [11][1940/3239]	Time 0.608 (0.864)	Data Time 0.001 (0.012)	Loss 3.4506 (3.7147)	Entropy 1.45208 (1.46985)	Top-1 acc 39.062 (36.611)	Top-5 acc 67.188 (60.746)	lr 0.02452
Train [11][1950/3239]	Time 0.599 (0.864)	Data Time 0.001 (0.012)	Loss 3.6669 (3.7152)	Entropy 1.45193 (1.46976)	Top-1 acc 34.375 (36.602)	Top-5 acc 62.109 (60.736)	lr 0.02452
Train [11][1960/3239]	Time 0.665 (0.864)	Data Time 0.001 (0.012)	Loss 3.5809 (3.7151)	Entropy 1.45186 (1.46967)	Top-1 acc 41.016 (36.606)	Top-5 acc 66.016 (60.736)	lr 0.02452
Train [11][1970/3239]	Time 0.626 (0.863)	Data Time 0.001 (0.012)	Loss 3.8062 (3.7147)	Entropy 1.45120 (1.46958)	Top-1 acc 38.672 (36.617)	Top-5 acc 58.594 (60.743)	lr 0.02452
Train [11][1980/3239]	Time 0.551 (0.863)	Data Time 0.001 (0.012)	Loss 3.7075 (3.7148)	Entropy 1.45067 (1.46948)	Top-1 acc 40.234 (36.618)	Top-5 acc 60.547 (60.742)	lr 0.02452
Train [11][1990/3239]	Time 0.627 (0.863)	Data Time 0.001 (0.012)	Loss 3.4981 (3.7145)	Entropy 1.45050 (1.46939)	Top-1 acc 44.141 (36.629)	Top-5 acc 66.797 (60.749)	lr 0.02452
Train [11][2000/3239]	Time 0.586 (0.863)	Data Time 0.001 (0.012)	Loss 3.3355 (3.7141)	Entropy 1.45000 (1.46929)	Top-1 acc 40.234 (36.631)	Top-5 acc 66.797 (60.756)	lr 0.02452
Train [11][2010/3239]	Time 0.547 (0.863)	Data Time 0.001 (0.012)	Loss 3.7767 (3.7142)	Entropy 1.44997 (1.46920)	Top-1 acc 33.203 (36.626)	Top-5 acc 57.422 (60.752)	lr 0.02452
Train [11][2020/3239]	Time 0.609 (0.862)	Data Time 0.001 (0.012)	Loss 3.6134 (3.7145)	Entropy 1.44998 (1.46910)	Top-1 acc 32.812 (36.617)	Top-5 acc 64.453 (60.753)	lr 0.02452
Train [11][2030/3239]	Time 0.652 (0.862)	Data Time 0.001 (0.011)	Loss 3.6239 (3.7143)	Entropy 1.44977 (1.46901)	Top-1 acc 39.062 (36.621)	Top-5 acc 64.453 (60.760)	lr 0.02452
Train [11][2040/3239]	Time 0.414 (0.862)	Data Time 0.001 (0.011)	Loss 3.6937 (3.7139)	Entropy 1.44971 (1.46891)	Top-1 acc 36.328 (36.628)	Top-5 acc 60.938 (60.770)	lr 0.02452
Train [11][2050/3239]	Time 0.560 (0.861)	Data Time 0.001 (0.011)	Loss 3.5248 (3.7139)	Entropy 1.44952 (1.46882)	Top-1 acc 42.188 (36.631)	Top-5 acc 67.969 (60.770)	lr 0.02452
Train [11][2060/3239]	Time 0.544 (0.861)	Data Time 0.001 (0.011)	Loss 3.5092 (3.7137)	Entropy 1.44919 (1.46872)	Top-1 acc 40.234 (36.633)	Top-5 acc 65.234 (60.772)	lr 0.02452
Train [11][2070/3239]	Time 0.589 (0.861)	Data Time 0.001 (0.011)	Loss 3.7474 (3.7135)	Entropy 1.44915 (1.46863)	Top-1 acc 34.375 (36.637)	Top-5 acc 60.547 (60.777)	lr 0.02452
Train [11][2080/3239]	Time 0.550 (0.861)	Data Time 0.001 (0.011)	Loss 3.8491 (3.7137)	Entropy 1.44883 (1.46854)	Top-1 acc 35.938 (36.632)	Top-5 acc 56.641 (60.772)	lr 0.02452
Train [11][2090/3239]	Time 0.527 (0.861)	Data Time 0.001 (0.011)	Loss 3.8401 (3.7138)	Entropy 1.44842 (1.46844)	Top-1 acc 31.641 (36.630)	Top-5 acc 55.859 (60.769)	lr 0.02452
Train [11][2100/3239]	Time 0.501 (0.861)	Data Time 0.001 (0.011)	Loss 4.0293 (3.7142)	Entropy 1.44825 (1.46834)	Top-1 acc 33.594 (36.625)	Top-5 acc 53.516 (60.759)	lr 0.02452
Train [11][2110/3239]	Time 0.557 (0.860)	Data Time 0.001 (0.011)	Loss 3.6285 (3.7142)	Entropy 1.44779 (1.46825)	Top-1 acc 41.406 (36.625)	Top-5 acc 62.109 (60.758)	lr 0.02452
Train [11][2120/3239]	Time 0.573 (0.860)	Data Time 0.001 (0.011)	Loss 3.7174 (3.7145)	Entropy 1.44771 (1.46815)	Top-1 acc 33.594 (36.619)	Top-5 acc 61.719 (60.756)	lr 0.02452
Train [11][2130/3239]	Time 0.593 (0.860)	Data Time 0.001 (0.011)	Loss 3.8304 (3.7144)	Entropy 1.44770 (1.46806)	Top-1 acc 34.766 (36.625)	Top-5 acc 58.984 (60.759)	lr 0.02452
Train [11][2140/3239]	Time 0.566 (0.860)	Data Time 0.001 (0.011)	Loss 3.8912 (3.7147)	Entropy 1.44723 (1.46796)	Top-1 acc 32.422 (36.622)	Top-5 acc 57.812 (60.755)	lr 0.02452
Train [11][2150/3239]	Time 0.594 (0.860)	Data Time 0.001 (0.011)	Loss 3.6203 (3.7146)	Entropy 1.44678 (1.46786)	Top-1 acc 39.062 (36.624)	Top-5 acc 60.938 (60.754)	lr 0.02452
Train [11][2160/3239]	Time 0.559 (0.860)	Data Time 0.001 (0.011)	Loss 3.8186 (3.7144)	Entropy 1.44688 (1.46777)	Top-1 acc 37.109 (36.625)	Top-5 acc 58.203 (60.757)	lr 0.02452
Train [11][2170/3239]	Time 0.673 (0.859)	Data Time 0.001 (0.011)	Loss 3.7452 (3.7141)	Entropy 1.44649 (1.46767)	Top-1 acc 37.109 (36.631)	Top-5 acc 59.766 (60.759)	lr 0.02452
Train [11][2180/3239]	Time 0.596 (0.859)	Data Time 0.001 (0.011)	Loss 3.6401 (3.7146)	Entropy 1.44634 (1.46757)	Top-1 acc 39.844 (36.620)	Top-5 acc 64.062 (60.750)	lr 0.02452
Train [11][2190/3239]	Time 0.523 (0.859)	Data Time 0.002 (0.011)	Loss 3.6905 (3.7144)	Entropy 1.44623 (1.46747)	Top-1 acc 39.844 (36.626)	Top-5 acc 63.672 (60.757)	lr 0.02451
Train [11][2200/3239]	Time 0.630 (0.859)	Data Time 0.001 (0.011)	Loss 3.6542 (3.7140)	Entropy 1.44613 (1.46738)	Top-1 acc 39.453 (36.628)	Top-5 acc 60.547 (60.765)	lr 0.02451
Train [11][2210/3239]	Time 0.610 (0.859)	Data Time 0.001 (0.011)	Loss 3.6721 (3.7143)	Entropy 1.44625 (1.46728)	Top-1 acc 33.203 (36.622)	Top-5 acc 66.406 (60.760)	lr 0.02451
Train [11][2220/3239]	Time 0.568 (0.858)	Data Time 0.001 (0.011)	Loss 3.7849 (3.7144)	Entropy 1.44620 (1.46719)	Top-1 acc 36.719 (36.620)	Top-5 acc 62.891 (60.758)	lr 0.02451
Train [11][2230/3239]	Time 0.572 (0.858)	Data Time 0.001 (0.011)	Loss 3.8536 (3.7144)	Entropy 1.44599 (1.46709)	Top-1 acc 32.422 (36.617)	Top-5 acc 56.250 (60.752)	lr 0.02451
Train [11][2240/3239]	Time 0.610 (0.858)	Data Time 0.001 (0.011)	Loss 3.5835 (3.7143)	Entropy 1.44584 (1.46700)	Top-1 acc 39.844 (36.620)	Top-5 acc 66.797 (60.756)	lr 0.02451
Train [11][2250/3239]	Time 0.595 (0.858)	Data Time 0.001 (0.011)	Loss 3.7872 (3.7145)	Entropy 1.44532 (1.46690)	Top-1 acc 33.984 (36.611)	Top-5 acc 59.375 (60.753)	lr 0.02451
Train [11][2260/3239]	Time 0.611 (0.858)	Data Time 0.001 (0.010)	Loss 3.6961 (3.7147)	Entropy 1.44479 (1.46681)	Top-1 acc 38.281 (36.611)	Top-5 acc 62.891 (60.748)	lr 0.02451
Train [11][2270/3239]	Time 0.542 (0.858)	Data Time 0.001 (0.010)	Loss 3.5106 (3.7144)	Entropy 1.44422 (1.46671)	Top-1 acc 40.234 (36.614)	Top-5 acc 67.188 (60.751)	lr 0.02451
Train [11][2280/3239]	Time 0.604 (0.858)	Data Time 0.001 (0.010)	Loss 3.3517 (3.7141)	Entropy 1.44364 (1.46661)	Top-1 acc 44.922 (36.621)	Top-5 acc 67.578 (60.755)	lr 0.02451
Train [11][2290/3239]	Time 0.506 (0.866)	Data Time 0.002 (0.010)	Loss 3.7472 (3.7140)	Entropy 1.44315 (1.46651)	Top-1 acc 35.547 (36.620)	Top-5 acc 60.156 (60.759)	lr 0.02451
Train [11][2300/3239]	Time 0.632 (0.866)	Data Time 0.001 (0.010)	Loss 3.6153 (3.7137)	Entropy 1.44309 (1.46641)	Top-1 acc 40.234 (36.628)	Top-5 acc 62.500 (60.765)	lr 0.02451
Train [11][2310/3239]	Time 0.576 (0.866)	Data Time 0.001 (0.010)	Loss 3.5726 (3.7137)	Entropy 1.44276 (1.46631)	Top-1 acc 42.188 (36.628)	Top-5 acc 62.500 (60.763)	lr 0.02451
Train [11][2320/3239]	Time 0.612 (0.865)	Data Time 0.001 (0.010)	Loss 3.5591 (3.7138)	Entropy 1.44236 (1.46620)	Top-1 acc 39.062 (36.628)	Top-5 acc 62.891 (60.758)	lr 0.02451
Train [11][2330/3239]	Time 0.705 (0.865)	Data Time 0.001 (0.010)	Loss 3.6246 (3.7135)	Entropy 1.44233 (1.46610)	Top-1 acc 38.672 (36.631)	Top-5 acc 64.062 (60.763)	lr 0.02451
Train [11][2340/3239]	Time 0.558 (0.865)	Data Time 0.002 (0.010)	Loss 3.9367 (3.7137)	Entropy 1.44216 (1.46600)	Top-1 acc 33.203 (36.625)	Top-5 acc 57.422 (60.761)	lr 0.02451
Train [11][2350/3239]	Time 0.449 (0.865)	Data Time 0.001 (0.010)	Loss 3.7319 (3.7133)	Entropy 1.44187 (1.46590)	Top-1 acc 36.328 (36.632)	Top-5 acc 61.719 (60.768)	lr 0.02451
Train [11][2360/3239]	Time 0.593 (0.865)	Data Time 0.001 (0.010)	Loss 3.6155 (3.7134)	Entropy 1.44138 (1.46580)	Top-1 acc 38.672 (36.627)	Top-5 acc 60.938 (60.767)	lr 0.02451
Train [11][2370/3239]	Time 0.580 (0.865)	Data Time 0.001 (0.010)	Loss 3.5964 (3.7134)	Entropy 1.44129 (1.46569)	Top-1 acc 38.672 (36.629)	Top-5 acc 65.234 (60.766)	lr 0.02451
Train [11][2380/3239]	Time 0.598 (0.865)	Data Time 0.001 (0.010)	Loss 3.4169 (3.7131)	Entropy 1.44099 (1.46559)	Top-1 acc 44.141 (36.634)	Top-5 acc 67.578 (60.773)	lr 0.02451
Train [11][2390/3239]	Time 0.594 (0.864)	Data Time 0.001 (0.010)	Loss 3.4941 (3.7130)	Entropy 1.44074 (1.46549)	Top-1 acc 39.844 (36.637)	Top-5 acc 67.969 (60.776)	lr 0.02451
Train [11][2400/3239]	Time 0.548 (0.864)	Data Time 0.001 (0.010)	Loss 3.6040 (3.7128)	Entropy 1.44085 (1.46538)	Top-1 acc 36.328 (36.643)	Top-5 acc 62.500 (60.782)	lr 0.02451
Train [11][2410/3239]	Time 0.534 (0.864)	Data Time 0.001 (0.010)	Loss 3.6281 (3.7126)	Entropy 1.44057 (1.46528)	Top-1 acc 35.547 (36.645)	Top-5 acc 64.062 (60.791)	lr 0.02451
Train [11][2420/3239]	Time 0.567 (0.864)	Data Time 0.001 (0.010)	Loss 3.8388 (3.7129)	Entropy 1.44010 (1.46518)	Top-1 acc 32.812 (36.638)	Top-5 acc 55.078 (60.780)	lr 0.02451
Train [11][2430/3239]	Time 0.528 (0.864)	Data Time 0.001 (0.010)	Loss 3.7388 (3.7130)	Entropy 1.44014 (1.46508)	Top-1 acc 38.281 (36.639)	Top-5 acc 62.891 (60.776)	lr 0.02451
Train [11][2440/3239]	Time 0.591 (0.864)	Data Time 0.001 (0.010)	Loss 3.6476 (3.7131)	Entropy 1.43998 (1.46497)	Top-1 acc 37.891 (36.637)	Top-5 acc 59.375 (60.769)	lr 0.02451
Train [11][2450/3239]	Time 0.576 (0.864)	Data Time 0.001 (0.010)	Loss 3.6872 (3.7128)	Entropy 1.43959 (1.46487)	Top-1 acc 33.203 (36.639)	Top-5 acc 62.500 (60.774)	lr 0.02451
Train [11][2460/3239]	Time 0.507 (0.863)	Data Time 0.001 (0.010)	Loss 3.6334 (3.7126)	Entropy 1.43946 (1.46477)	Top-1 acc 37.109 (36.642)	Top-5 acc 59.766 (60.773)	lr 0.02451
Train [11][2470/3239]	Time 0.546 (0.863)	Data Time 0.001 (0.010)	Loss 3.5668 (3.7124)	Entropy 1.43960 (1.46467)	Top-1 acc 38.281 (36.646)	Top-5 acc 63.672 (60.779)	lr 0.02451
Train [11][2480/3239]	Time 0.623 (0.863)	Data Time 0.001 (0.010)	Loss 3.5687 (3.7122)	Entropy 1.43954 (1.46456)	Top-1 acc 36.719 (36.649)	Top-5 acc 65.234 (60.781)	lr 0.02451
Train [11][2490/3239]	Time 0.577 (0.863)	Data Time 0.001 (0.010)	Loss 3.6658 (3.7122)	Entropy 1.43957 (1.46446)	Top-1 acc 34.766 (36.648)	Top-5 acc 61.328 (60.777)	lr 0.02451
Train [11][2500/3239]	Time 0.569 (0.863)	Data Time 0.001 (0.010)	Loss 3.7090 (3.7122)	Entropy 1.43944 (1.46436)	Top-1 acc 32.812 (36.652)	Top-5 acc 57.422 (60.777)	lr 0.02451
Train [11][2510/3239]	Time 0.538 (0.863)	Data Time 0.001 (0.010)	Loss 3.5866 (3.7118)	Entropy 1.43958 (1.46427)	Top-1 acc 42.188 (36.662)	Top-5 acc 65.234 (60.785)	lr 0.02451
Train [11][2520/3239]	Time 0.582 (0.862)	Data Time 0.001 (0.010)	Loss 3.7771 (3.7118)	Entropy 1.43924 (1.46417)	Top-1 acc 37.109 (36.663)	Top-5 acc 57.422 (60.786)	lr 0.02451
Train [11][2530/3239]	Time 0.596 (0.862)	Data Time 0.001 (0.010)	Loss 3.6591 (3.7119)	Entropy 1.43877 (1.46407)	Top-1 acc 39.453 (36.659)	Top-5 acc 61.719 (60.785)	lr 0.02451
Train [11][2540/3239]	Time 0.527 (0.862)	Data Time 0.001 (0.010)	Loss 3.6425 (3.7116)	Entropy 1.43837 (1.46397)	Top-1 acc 35.938 (36.663)	Top-5 acc 64.844 (60.793)	lr 0.02451
Train [11][2550/3239]	Time 0.559 (0.862)	Data Time 0.001 (0.010)	Loss 3.4696 (3.7117)	Entropy 1.43800 (1.46387)	Top-1 acc 38.281 (36.658)	Top-5 acc 67.969 (60.795)	lr 0.02450
Train [11][2560/3239]	Time 0.547 (0.862)	Data Time 0.001 (0.010)	Loss 3.7566 (3.7116)	Entropy 1.43822 (1.46377)	Top-1 acc 34.766 (36.658)	Top-5 acc 61.719 (60.796)	lr 0.02450
Train [11][2570/3239]	Time 0.551 (0.862)	Data Time 0.001 (0.010)	Loss 3.8489 (3.7116)	Entropy 1.43784 (1.46367)	Top-1 acc 37.500 (36.658)	Top-5 acc 60.156 (60.798)	lr 0.02450
Train [11][2580/3239]	Time 0.610 (0.862)	Data Time 0.001 (0.009)	Loss 3.6105 (3.7116)	Entropy 1.43797 (1.46357)	Top-1 acc 36.719 (36.653)	Top-5 acc 61.719 (60.799)	lr 0.02450
Train [11][2590/3239]	Time 0.645 (0.862)	Data Time 0.001 (0.009)	Loss 3.5942 (3.7115)	Entropy 1.43787 (1.46347)	Top-1 acc 37.500 (36.651)	Top-5 acc 63.672 (60.803)	lr 0.02450
Train [11][2600/3239]	Time 0.594 (0.861)	Data Time 0.001 (0.009)	Loss 3.3724 (3.7113)	Entropy 1.43748 (1.46337)	Top-1 acc 46.484 (36.656)	Top-5 acc 68.359 (60.810)	lr 0.02450
Train [11][2610/3239]	Time 0.746 (0.861)	Data Time 0.001 (0.009)	Loss 3.4664 (3.7109)	Entropy 1.43728 (1.46327)	Top-1 acc 42.969 (36.664)	Top-5 acc 66.406 (60.815)	lr 0.02450
Train [11][2620/3239]	Time 0.571 (0.861)	Data Time 0.001 (0.009)	Loss 3.4671 (3.7110)	Entropy 1.43717 (1.46317)	Top-1 acc 43.750 (36.662)	Top-5 acc 68.359 (60.813)	lr 0.02450
Train [11][2630/3239]	Time 0.601 (0.861)	Data Time 0.001 (0.009)	Loss 3.8257 (3.7110)	Entropy 1.43729 (1.46307)	Top-1 acc 32.812 (36.664)	Top-5 acc 55.859 (60.812)	lr 0.02450
Train [11][2640/3239]	Time 0.576 (0.861)	Data Time 0.001 (0.009)	Loss 3.5863 (3.7110)	Entropy 1.43701 (1.46297)	Top-1 acc 35.547 (36.666)	Top-5 acc 63.281 (60.815)	lr 0.02450
Train [11][2650/3239]	Time 0.596 (0.861)	Data Time 0.001 (0.009)	Loss 3.6257 (3.7111)	Entropy 1.43709 (1.46287)	Top-1 acc 37.500 (36.665)	Top-5 acc 61.719 (60.815)	lr 0.02450
Train [11][2660/3239]	Time 0.592 (0.861)	Data Time 0.001 (0.009)	Loss 3.4533 (3.7109)	Entropy 1.43702 (1.46278)	Top-1 acc 44.922 (36.667)	Top-5 acc 64.453 (60.817)	lr 0.02450
Train [11][2670/3239]	Time 0.571 (0.861)	Data Time 0.001 (0.009)	Loss 3.8324 (3.7108)	Entropy 1.43696 (1.46268)	Top-1 acc 39.844 (36.671)	Top-5 acc 56.250 (60.819)	lr 0.02450
Train [11][2680/3239]	Time 0.688 (0.861)	Data Time 0.001 (0.009)	Loss 3.7101 (3.7106)	Entropy 1.43685 (1.46258)	Top-1 acc 37.891 (36.675)	Top-5 acc 59.766 (60.823)	lr 0.02450
Train [11][2690/3239]	Time 0.591 (0.860)	Data Time 0.001 (0.009)	Loss 3.7804 (3.7104)	Entropy 1.43652 (1.46249)	Top-1 acc 37.500 (36.681)	Top-5 acc 59.766 (60.826)	lr 0.02450
Train [11][2700/3239]	Time 0.568 (0.860)	Data Time 0.001 (0.009)	Loss 3.4789 (3.7102)	Entropy 1.43647 (1.46239)	Top-1 acc 41.406 (36.687)	Top-5 acc 68.359 (60.831)	lr 0.02450
Train [11][2710/3239]	Time 0.642 (0.860)	Data Time 0.001 (0.009)	Loss 3.7596 (3.7100)	Entropy 1.43651 (1.46230)	Top-1 acc 35.938 (36.694)	Top-5 acc 58.594 (60.835)	lr 0.02450
Train [11][2720/3239]	Time 0.588 (0.860)	Data Time 0.002 (0.009)	Loss 3.7131 (3.7102)	Entropy 1.43641 (1.46220)	Top-1 acc 39.453 (36.693)	Top-5 acc 61.719 (60.830)	lr 0.02450
Train [11][2730/3239]	Time 0.591 (0.860)	Data Time 0.001 (0.009)	Loss 3.5060 (3.7103)	Entropy 1.43609 (1.46211)	Top-1 acc 43.359 (36.688)	Top-5 acc 64.844 (60.827)	lr 0.02450
Train [11][2740/3239]	Time 0.604 (0.860)	Data Time 0.001 (0.009)	Loss 3.6253 (3.7102)	Entropy 1.43611 (1.46201)	Top-1 acc 42.188 (36.690)	Top-5 acc 62.109 (60.829)	lr 0.02450
Train [11][2750/3239]	Time 0.640 (0.860)	Data Time 0.001 (0.009)	Loss 3.7786 (3.7104)	Entropy 1.43621 (1.46192)	Top-1 acc 32.812 (36.689)	Top-5 acc 61.719 (60.825)	lr 0.02450
Train [11][2760/3239]	Time 0.599 (0.860)	Data Time 0.001 (0.009)	Loss 3.4946 (3.7104)	Entropy 1.43588 (1.46183)	Top-1 acc 39.062 (36.688)	Top-5 acc 64.453 (60.824)	lr 0.02450
Train [11][2770/3239]	Time 0.545 (0.859)	Data Time 0.001 (0.009)	Loss 3.6771 (3.7105)	Entropy 1.43587 (1.46173)	Top-1 acc 35.156 (36.684)	Top-5 acc 60.938 (60.821)	lr 0.02450
Train [11][2780/3239]	Time 0.633 (0.859)	Data Time 0.002 (0.009)	Loss 3.6048 (3.7106)	Entropy 1.43564 (1.46164)	Top-1 acc 40.234 (36.682)	Top-5 acc 64.844 (60.818)	lr 0.02450
Train [11][2790/3239]	Time 0.625 (0.859)	Data Time 0.001 (0.009)	Loss 3.6600 (3.7108)	Entropy 1.43579 (1.46155)	Top-1 acc 37.891 (36.678)	Top-5 acc 63.672 (60.814)	lr 0.02450
Train [11][2800/3239]	Time 0.573 (0.859)	Data Time 0.001 (0.009)	Loss 3.7859 (3.7109)	Entropy 1.43544 (1.46145)	Top-1 acc 35.156 (36.680)	Top-5 acc 60.156 (60.818)	lr 0.02450
Train [11][2810/3239]	Time 0.564 (0.859)	Data Time 0.001 (0.009)	Loss 3.7460 (3.7109)	Entropy 1.43519 (1.46136)	Top-1 acc 32.031 (36.676)	Top-5 acc 61.719 (60.818)	lr 0.02450
Train [11][2820/3239]	Time 0.693 (0.859)	Data Time 0.001 (0.009)	Loss 3.8888 (3.7109)	Entropy 1.43527 (1.46127)	Top-1 acc 32.812 (36.674)	Top-5 acc 54.688 (60.815)	lr 0.02450
Train [11][2830/3239]	Time 0.617 (0.859)	Data Time 0.001 (0.009)	Loss 3.6222 (3.7105)	Entropy 1.43511 (1.46118)	Top-1 acc 39.062 (36.679)	Top-5 acc 59.766 (60.821)	lr 0.02450
Train [11][2840/3239]	Time 0.623 (0.859)	Data Time 0.001 (0.009)	Loss 3.6305 (3.7103)	Entropy 1.43478 (1.46108)	Top-1 acc 34.375 (36.681)	Top-5 acc 62.500 (60.824)	lr 0.02450
Train [11][2850/3239]	Time 0.574 (0.859)	Data Time 0.001 (0.009)	Loss 3.6511 (3.7103)	Entropy 1.43446 (1.46099)	Top-1 acc 35.938 (36.680)	Top-5 acc 63.672 (60.824)	lr 0.02450
Train [11][2860/3239]	Time 0.536 (0.858)	Data Time 0.001 (0.009)	Loss 3.6035 (3.7103)	Entropy 1.43459 (1.46090)	Top-1 acc 39.062 (36.683)	Top-5 acc 66.016 (60.824)	lr 0.02450
Train [11][2870/3239]	Time 0.253 (0.858)	Data Time 0.001 (0.009)	Loss 3.7464 (3.7102)	Entropy 1.43440 (1.46081)	Top-1 acc 32.812 (36.685)	Top-5 acc 58.594 (60.824)	lr 0.02450
Train [11][2880/3239]	Time 0.569 (0.858)	Data Time 0.001 (0.009)	Loss 3.7299 (3.7102)	Entropy 1.43362 (1.46071)	Top-1 acc 35.156 (36.684)	Top-5 acc 59.766 (60.825)	lr 0.02450
Train [11][2890/3239]	Time 0.691 (0.858)	Data Time 0.001 (0.009)	Loss 3.7941 (3.7102)	Entropy 1.43310 (1.46062)	Top-1 acc 38.281 (36.683)	Top-5 acc 58.594 (60.825)	lr 0.02450
Train [11][2900/3239]	Time 0.581 (0.858)	Data Time 0.001 (0.009)	Loss 3.6979 (3.7101)	Entropy 1.43311 (1.46052)	Top-1 acc 37.500 (36.686)	Top-5 acc 62.109 (60.829)	lr 0.02449
Train [11][2910/3239]	Time 0.553 (0.858)	Data Time 0.001 (0.009)	Loss 3.3477 (3.7098)	Entropy 1.43305 (1.46043)	Top-1 acc 46.094 (36.696)	Top-5 acc 67.969 (60.835)	lr 0.02449
Train [11][2920/3239]	Time 0.625 (0.857)	Data Time 0.001 (0.009)	Loss 3.7080 (3.7099)	Entropy 1.43304 (1.46034)	Top-1 acc 42.188 (36.693)	Top-5 acc 62.891 (60.836)	lr 0.02449
Train [11][2930/3239]	Time 0.569 (0.857)	Data Time 0.001 (0.009)	Loss 3.6214 (3.7098)	Entropy 1.43307 (1.46024)	Top-1 acc 33.203 (36.690)	Top-5 acc 62.109 (60.835)	lr 0.02449
Train [11][2940/3239]	Time 0.754 (0.864)	Data Time 0.006 (0.009)	Loss 3.5855 (3.7098)	Entropy 1.43247 (1.46015)	Top-1 acc 43.750 (36.693)	Top-5 acc 60.547 (60.835)	lr 0.02449
Train [11][2950/3239]	Time 0.552 (0.864)	Data Time 0.002 (0.009)	Loss 3.8263 (3.7096)	Entropy 1.43242 (1.46006)	Top-1 acc 33.594 (36.700)	Top-5 acc 58.984 (60.839)	lr 0.02449
Train [11][2960/3239]	Time 0.676 (0.864)	Data Time 0.001 (0.009)	Loss 3.7607 (3.7097)	Entropy 1.43210 (1.45996)	Top-1 acc 38.281 (36.699)	Top-5 acc 60.547 (60.836)	lr 0.02449
Train [11][2970/3239]	Time 0.592 (0.864)	Data Time 0.001 (0.009)	Loss 3.8459 (3.7097)	Entropy 1.43162 (1.45987)	Top-1 acc 33.203 (36.703)	Top-5 acc 58.984 (60.838)	lr 0.02449
Train [11][2980/3239]	Time 0.602 (0.863)	Data Time 0.001 (0.009)	Loss 3.6121 (3.7095)	Entropy 1.43150 (1.45977)	Top-1 acc 41.406 (36.707)	Top-5 acc 64.844 (60.842)	lr 0.02449
Train [11][2990/3239]	Time 0.574 (0.863)	Data Time 0.001 (0.009)	Loss 3.5599 (3.7095)	Entropy 1.43151 (1.45968)	Top-1 acc 37.109 (36.703)	Top-5 acc 64.844 (60.846)	lr 0.02449
Train [11][3000/3239]	Time 0.608 (0.863)	Data Time 0.001 (0.008)	Loss 3.7770 (3.7092)	Entropy 1.43159 (1.45959)	Top-1 acc 34.375 (36.705)	Top-5 acc 60.547 (60.854)	lr 0.02449
Train [11][3010/3239]	Time 0.587 (0.863)	Data Time 0.001 (0.008)	Loss 3.7206 (3.7093)	Entropy 1.43163 (1.45949)	Top-1 acc 37.109 (36.703)	Top-5 acc 60.156 (60.852)	lr 0.02449
Train [11][3020/3239]	Time 0.582 (0.863)	Data Time 0.002 (0.008)	Loss 3.7518 (3.7092)	Entropy 1.43158 (1.45940)	Top-1 acc 39.062 (36.703)	Top-5 acc 61.328 (60.852)	lr 0.02449
Train [11][3030/3239]	Time 0.670 (0.863)	Data Time 0.001 (0.008)	Loss 3.5971 (3.7092)	Entropy 1.43098 (1.45931)	Top-1 acc 39.844 (36.701)	Top-5 acc 62.500 (60.851)	lr 0.02449
Train [11][3040/3239]	Time 0.570 (0.863)	Data Time 0.001 (0.008)	Loss 3.6780 (3.7093)	Entropy 1.43077 (1.45921)	Top-1 acc 37.109 (36.701)	Top-5 acc 59.375 (60.848)	lr 0.02449
Train [11][3050/3239]	Time 0.604 (0.863)	Data Time 0.001 (0.008)	Loss 3.6860 (3.7093)	Entropy 1.43089 (1.45912)	Top-1 acc 35.156 (36.699)	Top-5 acc 60.938 (60.848)	lr 0.02449
Train [11][3060/3239]	Time 0.577 (0.863)	Data Time 0.001 (0.008)	Loss 3.7671 (3.7091)	Entropy 1.43105 (1.45903)	Top-1 acc 37.109 (36.704)	Top-5 acc 59.375 (60.849)	lr 0.02449
Train [11][3070/3239]	Time 0.576 (0.863)	Data Time 0.001 (0.008)	Loss 3.4997 (3.7091)	Entropy 1.43111 (1.45894)	Top-1 acc 40.625 (36.706)	Top-5 acc 65.625 (60.849)	lr 0.02449
Train [11][3080/3239]	Time 0.529 (0.862)	Data Time 0.001 (0.008)	Loss 3.7218 (3.7090)	Entropy 1.43079 (1.45885)	Top-1 acc 35.547 (36.706)	Top-5 acc 61.328 (60.852)	lr 0.02449
Train [11][3090/3239]	Time 0.561 (0.862)	Data Time 0.001 (0.008)	Loss 3.6631 (3.7092)	Entropy 1.43058 (1.45876)	Top-1 acc 39.062 (36.705)	Top-5 acc 64.453 (60.851)	lr 0.02449
Train [11][3100/3239]	Time 0.660 (0.862)	Data Time 0.001 (0.008)	Loss 3.5447 (3.7087)	Entropy 1.43054 (1.45867)	Top-1 acc 38.281 (36.713)	Top-5 acc 65.234 (60.858)	lr 0.02449
Train [11][3110/3239]	Time 0.587 (0.862)	Data Time 0.001 (0.008)	Loss 3.7551 (3.7088)	Entropy 1.43012 (1.45857)	Top-1 acc 35.938 (36.708)	Top-5 acc 55.859 (60.852)	lr 0.02449
Train [11][3120/3239]	Time 0.565 (0.862)	Data Time 0.001 (0.008)	Loss 3.8783 (3.7089)	Entropy 1.42991 (1.45848)	Top-1 acc 32.812 (36.707)	Top-5 acc 55.078 (60.851)	lr 0.02449
Train [11][3130/3239]	Time 0.548 (0.862)	Data Time 0.001 (0.008)	Loss 3.5511 (3.7090)	Entropy 1.42987 (1.45839)	Top-1 acc 36.719 (36.706)	Top-5 acc 64.844 (60.852)	lr 0.02449
Train [11][3140/3239]	Time 0.555 (0.862)	Data Time 0.001 (0.008)	Loss 3.8346 (3.7091)	Entropy 1.43019 (1.45830)	Top-1 acc 37.500 (36.705)	Top-5 acc 58.594 (60.850)	lr 0.02449
Train [11][3150/3239]	Time 0.452 (0.862)	Data Time 0.001 (0.008)	Loss 3.6986 (3.7090)	Entropy 1.42980 (1.45821)	Top-1 acc 37.500 (36.705)	Top-5 acc 58.984 (60.849)	lr 0.02449
Train [11][3160/3239]	Time 0.547 (0.862)	Data Time 0.001 (0.008)	Loss 3.7889 (3.7091)	Entropy 1.42977 (1.45812)	Top-1 acc 34.375 (36.704)	Top-5 acc 58.594 (60.846)	lr 0.02449
Train [11][3170/3239]	Time 0.653 (0.861)	Data Time 0.001 (0.008)	Loss 3.8925 (3.7090)	Entropy 1.43002 (1.45803)	Top-1 acc 34.375 (36.705)	Top-5 acc 57.031 (60.848)	lr 0.02449
Train [11][3180/3239]	Time 0.528 (0.861)	Data Time 0.000 (0.008)	Loss 3.6057 (3.7090)	Entropy 1.42993 (1.45794)	Top-1 acc 39.844 (36.707)	Top-5 acc 62.891 (60.850)	lr 0.02449
Train [11][3190/3239]	Time 0.571 (0.861)	Data Time 0.000 (0.008)	Loss 3.7337 (3.7089)	Entropy 1.42966 (1.45786)	Top-1 acc 34.766 (36.711)	Top-5 acc 57.031 (60.849)	lr 0.02449
Train [11][3200/3239]	Time 0.604 (0.861)	Data Time 0.000 (0.008)	Loss 3.6087 (3.7087)	Entropy 1.42941 (1.45777)	Top-1 acc 39.062 (36.711)	Top-5 acc 64.453 (60.854)	lr 0.02449
Train [11][3210/3239]	Time 0.571 (0.861)	Data Time 0.000 (0.008)	Loss 3.7604 (3.7088)	Entropy 1.42962 (1.45768)	Top-1 acc 39.062 (36.709)	Top-5 acc 60.156 (60.852)	lr 0.02449
Train [11][3220/3239]	Time 0.576 (0.861)	Data Time 0.000 (0.008)	Loss 3.9032 (3.7089)	Entropy 1.42956 (1.45759)	Top-1 acc 32.812 (36.709)	Top-5 acc 53.906 (60.848)	lr 0.02449
Train [11][3230/3239]	Time 0.597 (0.860)	Data Time 0.000 (0.008)	Loss 3.6042 (3.7088)	Entropy 1.42949 (1.45751)	Top-1 acc 42.969 (36.715)	Top-5 acc 66.016 (60.848)	lr 0.02449
Train [11][3239/3239]	Time 1.436 (0.860)	Data Time 0.000 (0.008)	Loss 3.7159 (3.7087)	Entropy 1.42945 (1.45743)	Top-1 acc 37.037 (36.718)	Top-5 acc 60.494 (60.851)	lr 0.02449
==========Valid [11/120]	loss 2.489	top-1 acc 46.338 (46.338)	top-5 acc 70.754	Train top-1 36.718	top-5 60.851	Entropy 1.42945	Latency-None: 0.000ms	Flops: 542.77M
Train [12][0/3239]	Time 20.328 (20.328)	Data Time 19.392 (19.392)	Loss 3.7052 (3.7052)	Entropy 1.42919 (1.42919)	Top-1 acc 33.203 (33.203)	Top-5 acc 57.812 (57.812)	lr 0.02449
Train [12][10/3239]	Time 0.565 (2.681)	Data Time 0.001 (1.793)	Loss 3.6559 (3.7164)	Entropy 1.42892 (1.42905)	Top-1 acc 35.547 (36.151)	Top-5 acc 63.281 (60.192)	lr 0.02448
Train [12][20/3239]	Time 0.557 (1.827)	Data Time 0.001 (0.940)	Loss 3.9244 (3.7017)	Entropy 1.42888 (1.42897)	Top-1 acc 34.375 (37.054)	Top-5 acc 53.906 (60.993)	lr 0.02448
Train [12][30/3239]	Time 0.602 (1.527)	Data Time 0.029 (0.638)	Loss 3.8208 (3.6971)	Entropy 1.42870 (1.42890)	Top-1 acc 35.547 (37.185)	Top-5 acc 59.766 (61.177)	lr 0.02448
Train [12][40/3239]	Time 0.587 (1.353)	Data Time 0.001 (0.483)	Loss 3.5798 (3.6856)	Entropy 1.42841 (1.42883)	Top-1 acc 39.844 (37.557)	Top-5 acc 61.328 (61.385)	lr 0.02448
Train [12][50/3239]	Time 0.634 (1.253)	Data Time 0.001 (0.389)	Loss 3.4752 (3.6838)	Entropy 1.42822 (1.42873)	Top-1 acc 39.844 (37.469)	Top-5 acc 64.453 (61.351)	lr 0.02448
Train [12][60/3239]	Time 0.579 (1.182)	Data Time 0.001 (0.325)	Loss 3.6050 (3.6865)	Entropy 1.42790 (1.42862)	Top-1 acc 37.500 (37.276)	Top-5 acc 59.766 (60.989)	lr 0.02448
Train [12][70/3239]	Time 0.689 (1.132)	Data Time 0.001 (0.280)	Loss 3.7048 (3.6838)	Entropy 1.42735 (1.42850)	Top-1 acc 38.672 (37.506)	Top-5 acc 60.938 (60.943)	lr 0.02448
Train [12][80/3239]	Time 0.564 (1.096)	Data Time 0.001 (0.245)	Loss 3.7351 (3.6864)	Entropy 1.42687 (1.42834)	Top-1 acc 37.109 (37.404)	Top-5 acc 60.938 (60.870)	lr 0.02448
Train [12][90/3239]	Time 0.611 (1.069)	Data Time 0.001 (0.219)	Loss 3.8506 (3.6861)	Entropy 1.42700 (1.42818)	Top-1 acc 31.641 (37.393)	Top-5 acc 61.328 (60.907)	lr 0.02448
Train [12][100/3239]	Time 0.628 (1.046)	Data Time 0.001 (0.197)	Loss 3.7375 (3.6855)	Entropy 1.42724 (1.42808)	Top-1 acc 36.328 (37.399)	Top-5 acc 58.984 (60.868)	lr 0.02448
Train [12][110/3239]	Time 0.607 (1.028)	Data Time 0.001 (0.180)	Loss 3.5755 (3.6812)	Entropy 1.42708 (1.42799)	Top-1 acc 39.062 (37.542)	Top-5 acc 62.500 (61.040)	lr 0.02448
Train [12][120/3239]	Time 0.551 (1.009)	Data Time 0.001 (0.165)	Loss 3.7147 (3.6833)	Entropy 1.42673 (1.42791)	Top-1 acc 39.062 (37.490)	Top-5 acc 62.500 (60.931)	lr 0.02448
Train [12][130/3239]	Time 0.449 (0.993)	Data Time 0.001 (0.153)	Loss 3.5722 (3.6779)	Entropy 1.42646 (1.42781)	Top-1 acc 38.281 (37.575)	Top-5 acc 64.844 (61.075)	lr 0.02448
Train [12][140/3239]	Time 0.558 (0.981)	Data Time 0.001 (0.142)	Loss 3.6411 (3.6785)	Entropy 1.42638 (1.42771)	Top-1 acc 33.203 (37.530)	Top-5 acc 64.453 (61.170)	lr 0.02448
Train [12][150/3239]	Time 0.538 (0.966)	Data Time 0.001 (0.133)	Loss 3.5831 (3.6800)	Entropy 1.42616 (1.42762)	Top-1 acc 39.844 (37.510)	Top-5 acc 60.938 (61.142)	lr 0.02448
Train [12][160/3239]	Time 0.630 (0.958)	Data Time 0.001 (0.124)	Loss 3.6318 (3.6842)	Entropy 1.42585 (1.42752)	Top-1 acc 38.672 (37.471)	Top-5 acc 60.938 (61.071)	lr 0.02448
Train [12][170/3239]	Time 0.605 (0.951)	Data Time 0.001 (0.117)	Loss 3.8770 (3.6907)	Entropy 1.42534 (1.42741)	Top-1 acc 35.547 (37.326)	Top-5 acc 58.203 (60.922)	lr 0.02448
Train [12][180/3239]	Time 0.548 (0.943)	Data Time 0.001 (0.111)	Loss 3.5334 (3.6876)	Entropy 1.42523 (1.42730)	Top-1 acc 44.531 (37.403)	Top-5 acc 65.234 (61.002)	lr 0.02448
Train [12][190/3239]	Time 0.608 (0.938)	Data Time 0.001 (0.105)	Loss 3.6113 (3.6882)	Entropy 1.42520 (1.42718)	Top-1 acc 41.406 (37.445)	Top-5 acc 62.500 (61.009)	lr 0.02448
Train [12][200/3239]	Time 0.570 (0.933)	Data Time 0.001 (0.100)	Loss 3.4885 (3.6914)	Entropy 1.42535 (1.42709)	Top-1 acc 41.797 (37.352)	Top-5 acc 66.797 (61.029)	lr 0.02448
Train [12][210/3239]	Time 0.718 (0.929)	Data Time 0.003 (0.096)	Loss 3.5593 (3.6896)	Entropy 1.42520 (1.42701)	Top-1 acc 40.625 (37.382)	Top-5 acc 63.281 (61.062)	lr 0.02448
Train [12][220/3239]	Time 0.602 (0.925)	Data Time 0.001 (0.091)	Loss 3.6850 (3.6895)	Entropy 1.42507 (1.42693)	Top-1 acc 38.281 (37.394)	Top-5 acc 62.500 (61.075)	lr 0.02448
Train [12][230/3239]	Time 0.552 (0.921)	Data Time 0.001 (0.088)	Loss 3.6201 (3.6891)	Entropy 1.42522 (1.42685)	Top-1 acc 37.109 (37.383)	Top-5 acc 60.547 (61.091)	lr 0.02448
Train [12][240/3239]	Time 0.555 (0.918)	Data Time 0.001 (0.084)	Loss 3.7945 (3.6891)	Entropy 1.42506 (1.42678)	Top-1 acc 33.594 (37.400)	Top-5 acc 58.203 (61.113)	lr 0.02448
Train [12][250/3239]	Time 0.579 (0.915)	Data Time 0.001 (0.081)	Loss 3.5652 (3.6887)	Entropy 1.42481 (1.42671)	Top-1 acc 37.109 (37.386)	Top-5 acc 64.844 (61.070)	lr 0.02448
Train [12][260/3239]	Time 0.547 (0.911)	Data Time 0.001 (0.078)	Loss 3.5008 (3.6874)	Entropy 1.42453 (1.42663)	Top-1 acc 42.188 (37.403)	Top-5 acc 67.969 (61.092)	lr 0.02448
Train [12][270/3239]	Time 0.565 (0.908)	Data Time 0.001 (0.075)	Loss 3.7691 (3.6872)	Entropy 1.42402 (1.42655)	Top-1 acc 35.547 (37.367)	Top-5 acc 58.984 (61.112)	lr 0.02448
Train [12][280/3239]	Time 0.686 (0.906)	Data Time 0.001 (0.072)	Loss 3.7586 (3.6865)	Entropy 1.42374 (1.42646)	Top-1 acc 36.719 (37.378)	Top-5 acc 57.812 (61.115)	lr 0.02448
Train [12][290/3239]	Time 0.473 (0.903)	Data Time 0.001 (0.070)	Loss 3.9232 (3.6876)	Entropy 1.42344 (1.42636)	Top-1 acc 29.688 (37.363)	Top-5 acc 53.906 (61.091)	lr 0.02448
Train [12][300/3239]	Time 0.566 (0.900)	Data Time 0.001 (0.068)	Loss 3.5821 (3.6864)	Entropy 1.42338 (1.42626)	Top-1 acc 37.500 (37.372)	Top-5 acc 63.281 (61.104)	lr 0.02448
Train [12][310/3239]	Time 0.567 (0.897)	Data Time 0.001 (0.066)	Loss 3.6955 (3.6858)	Entropy 1.42359 (1.42617)	Top-1 acc 36.719 (37.387)	Top-5 acc 63.281 (61.145)	lr 0.02448
Train [12][320/3239]	Time 0.584 (0.894)	Data Time 0.001 (0.064)	Loss 3.7713 (3.6839)	Entropy 1.42360 (1.42609)	Top-1 acc 39.453 (37.422)	Top-5 acc 58.594 (61.203)	lr 0.02448
Train [12][330/3239]	Time 0.586 (0.892)	Data Time 0.001 (0.062)	Loss 3.7798 (3.6832)	Entropy 1.42332 (1.42601)	Top-1 acc 37.891 (37.449)	Top-5 acc 58.594 (61.211)	lr 0.02448
Train [12][340/3239]	Time 0.600 (0.890)	Data Time 0.001 (0.060)	Loss 3.3399 (3.6828)	Entropy 1.42312 (1.42593)	Top-1 acc 44.141 (37.423)	Top-5 acc 69.531 (61.199)	lr 0.02448
Train [12][350/3239]	Time 0.636 (0.888)	Data Time 0.001 (0.058)	Loss 3.6802 (3.6842)	Entropy 1.42295 (1.42585)	Top-1 acc 37.891 (37.423)	Top-5 acc 61.719 (61.181)	lr 0.02448
Train [12][360/3239]	Time 0.596 (0.941)	Data Time 0.003 (0.057)	Loss 3.3727 (3.6846)	Entropy 1.42287 (1.42577)	Top-1 acc 43.359 (37.430)	Top-5 acc 70.703 (61.161)	lr 0.02447
Train [12][370/3239]	Time 0.658 (0.939)	Data Time 0.002 (0.055)	Loss 3.7654 (3.6835)	Entropy 1.42302 (1.42569)	Top-1 acc 35.547 (37.429)	Top-5 acc 57.031 (61.201)	lr 0.02447
Train [12][380/3239]	Time 0.559 (0.936)	Data Time 0.001 (0.054)	Loss 3.3517 (3.6835)	Entropy 1.42247 (1.42561)	Top-1 acc 46.875 (37.432)	Top-5 acc 69.922 (61.183)	lr 0.02447
Train [12][390/3239]	Time 0.572 (0.934)	Data Time 0.001 (0.053)	Loss 3.7473 (3.6820)	Entropy 1.42230 (1.42553)	Top-1 acc 37.109 (37.445)	Top-5 acc 58.984 (61.220)	lr 0.02447
Train [12][400/3239]	Time 0.593 (0.932)	Data Time 0.001 (0.051)	Loss 3.6939 (3.6810)	Entropy 1.42248 (1.42545)	Top-1 acc 37.109 (37.472)	Top-5 acc 60.938 (61.233)	lr 0.02447
Train [12][410/3239]	Time 0.585 (0.929)	Data Time 0.001 (0.050)	Loss 3.5955 (3.6819)	Entropy 1.42230 (1.42538)	Top-1 acc 38.672 (37.451)	Top-5 acc 62.109 (61.213)	lr 0.02447
Train [12][420/3239]	Time 0.560 (0.927)	Data Time 0.001 (0.049)	Loss 3.8608 (3.6819)	Entropy 1.42194 (1.42530)	Top-1 acc 32.422 (37.418)	Top-5 acc 58.594 (61.221)	lr 0.02447
Train [12][430/3239]	Time 0.591 (0.924)	Data Time 0.001 (0.048)	Loss 3.7718 (3.6806)	Entropy 1.42210 (1.42522)	Top-1 acc 34.375 (37.445)	Top-5 acc 63.672 (61.267)	lr 0.02447
Train [12][440/3239]	Time 0.677 (0.921)	Data Time 0.001 (0.047)	Loss 3.6745 (3.6813)	Entropy 1.42187 (1.42515)	Top-1 acc 40.234 (37.441)	Top-5 acc 62.109 (61.252)	lr 0.02447
Train [12][450/3239]	Time 0.548 (0.918)	Data Time 0.001 (0.046)	Loss 3.7808 (3.6832)	Entropy 1.42202 (1.42508)	Top-1 acc 35.938 (37.419)	Top-5 acc 58.594 (61.216)	lr 0.02447
Train [12][460/3239]	Time 0.579 (0.915)	Data Time 0.001 (0.045)	Loss 3.7023 (3.6831)	Entropy 1.42177 (1.42501)	Top-1 acc 35.547 (37.419)	Top-5 acc 59.766 (61.232)	lr 0.02447
Train [12][470/3239]	Time 0.566 (0.914)	Data Time 0.002 (0.044)	Loss 3.5275 (3.6812)	Entropy 1.42169 (1.42495)	Top-1 acc 39.844 (37.437)	Top-5 acc 64.844 (61.270)	lr 0.02447
Train [12][480/3239]	Time 0.573 (0.912)	Data Time 0.001 (0.043)	Loss 3.7761 (3.6819)	Entropy 1.42165 (1.42488)	Top-1 acc 33.594 (37.412)	Top-5 acc 60.156 (61.268)	lr 0.02447
Train [12][490/3239]	Time 0.571 (0.910)	Data Time 0.001 (0.042)	Loss 3.4593 (3.6796)	Entropy 1.42096 (1.42481)	Top-1 acc 39.453 (37.451)	Top-5 acc 66.797 (61.320)	lr 0.02447
Train [12][500/3239]	Time 0.518 (0.909)	Data Time 0.001 (0.042)	Loss 3.8348 (3.6800)	Entropy 1.42093 (1.42473)	Top-1 acc 29.688 (37.403)	Top-5 acc 57.031 (61.312)	lr 0.02447
Train [12][510/3239]	Time 0.683 (0.907)	Data Time 0.001 (0.041)	Loss 3.6966 (3.6800)	Entropy 1.42090 (1.42465)	Top-1 acc 37.500 (37.406)	Top-5 acc 61.328 (61.336)	lr 0.02447
Train [12][520/3239]	Time 0.562 (0.906)	Data Time 0.001 (0.040)	Loss 3.8022 (3.6801)	Entropy 1.42077 (1.42458)	Top-1 acc 36.719 (37.414)	Top-5 acc 61.328 (61.336)	lr 0.02447
Train [12][530/3239]	Time 0.605 (0.905)	Data Time 0.001 (0.039)	Loss 3.6355 (3.6795)	Entropy 1.42087 (1.42451)	Top-1 acc 40.625 (37.422)	Top-5 acc 60.938 (61.357)	lr 0.02447
Train [12][540/3239]	Time 0.578 (0.904)	Data Time 0.001 (0.039)	Loss 3.5967 (3.6805)	Entropy 1.42102 (1.42444)	Top-1 acc 37.891 (37.403)	Top-5 acc 65.234 (61.342)	lr 0.02447
Train [12][550/3239]	Time 0.549 (0.902)	Data Time 0.001 (0.038)	Loss 3.6905 (3.6803)	Entropy 1.42063 (1.42438)	Top-1 acc 36.719 (37.383)	Top-5 acc 61.328 (61.339)	lr 0.02447
Train [12][560/3239]	Time 0.570 (0.901)	Data Time 0.001 (0.037)	Loss 3.6353 (3.6809)	Entropy 1.42067 (1.42431)	Top-1 acc 37.891 (37.377)	Top-5 acc 58.984 (61.314)	lr 0.02447
Train [12][570/3239]	Time 0.578 (0.900)	Data Time 0.001 (0.037)	Loss 3.8220 (3.6811)	Entropy 1.42071 (1.42425)	Top-1 acc 33.984 (37.382)	Top-5 acc 59.375 (61.325)	lr 0.02447
Train [12][580/3239]	Time 0.699 (0.899)	Data Time 0.001 (0.036)	Loss 3.7917 (3.6806)	Entropy 1.42026 (1.42418)	Top-1 acc 34.375 (37.390)	Top-5 acc 57.422 (61.326)	lr 0.02447
Train [12][590/3239]	Time 0.538 (0.898)	Data Time 0.001 (0.036)	Loss 3.6029 (3.6795)	Entropy 1.42015 (1.42412)	Top-1 acc 37.109 (37.399)	Top-5 acc 64.844 (61.353)	lr 0.02447
Train [12][600/3239]	Time 0.598 (0.896)	Data Time 0.001 (0.035)	Loss 3.7436 (3.6802)	Entropy 1.42004 (1.42405)	Top-1 acc 35.938 (37.388)	Top-5 acc 59.375 (61.327)	lr 0.02447
Train [12][610/3239]	Time 0.611 (0.895)	Data Time 0.001 (0.035)	Loss 3.6716 (3.6797)	Entropy 1.41971 (1.42398)	Top-1 acc 35.547 (37.393)	Top-5 acc 64.453 (61.343)	lr 0.02447
Train [12][620/3239]	Time 0.643 (0.893)	Data Time 0.001 (0.034)	Loss 3.5749 (3.6789)	Entropy 1.41960 (1.42391)	Top-1 acc 41.406 (37.413)	Top-5 acc 62.109 (61.365)	lr 0.02447
Train [12][630/3239]	Time 0.625 (0.892)	Data Time 0.001 (0.033)	Loss 3.6400 (3.6780)	Entropy 1.41984 (1.42385)	Top-1 acc 38.672 (37.423)	Top-5 acc 63.672 (61.377)	lr 0.02447
Train [12][640/3239]	Time 0.544 (0.891)	Data Time 0.001 (0.033)	Loss 3.6496 (3.6783)	Entropy 1.41960 (1.42378)	Top-1 acc 35.938 (37.410)	Top-5 acc 60.156 (61.378)	lr 0.02447
Train [12][650/3239]	Time 0.584 (0.890)	Data Time 0.001 (0.032)	Loss 3.8461 (3.6796)	Entropy 1.41977 (1.42372)	Top-1 acc 39.844 (37.385)	Top-5 acc 59.766 (61.356)	lr 0.02447
Train [12][660/3239]	Time 0.565 (0.889)	Data Time 0.001 (0.032)	Loss 3.6555 (3.6797)	Entropy 1.41883 (1.42365)	Top-1 acc 36.328 (37.376)	Top-5 acc 60.938 (61.356)	lr 0.02447
Train [12][670/3239]	Time 0.590 (0.888)	Data Time 0.001 (0.032)	Loss 3.7908 (3.6797)	Entropy 1.41881 (1.42358)	Top-1 acc 33.984 (37.361)	Top-5 acc 60.156 (61.354)	lr 0.02447
Train [12][680/3239]	Time 0.571 (0.887)	Data Time 0.001 (0.031)	Loss 3.6062 (3.6786)	Entropy 1.41872 (1.42351)	Top-1 acc 38.672 (37.393)	Top-5 acc 64.062 (61.385)	lr 0.02447
Train [12][690/3239]	Time 0.551 (0.887)	Data Time 0.001 (0.031)	Loss 3.9428 (3.6792)	Entropy 1.41860 (1.42344)	Top-1 acc 33.594 (37.380)	Top-5 acc 57.422 (61.369)	lr 0.02447
Train [12][700/3239]	Time 0.585 (0.886)	Data Time 0.001 (0.030)	Loss 3.5916 (3.6785)	Entropy 1.41851 (1.42337)	Top-1 acc 39.844 (37.397)	Top-5 acc 62.891 (61.378)	lr 0.02446
Train [12][710/3239]	Time 0.634 (0.885)	Data Time 0.001 (0.030)	Loss 3.5649 (3.6786)	Entropy 1.41818 (1.42330)	Top-1 acc 39.453 (37.393)	Top-5 acc 64.453 (61.375)	lr 0.02446
Train [12][720/3239]	Time 0.575 (0.885)	Data Time 0.001 (0.030)	Loss 3.8517 (3.6784)	Entropy 1.41791 (1.42323)	Top-1 acc 35.156 (37.401)	Top-5 acc 55.078 (61.390)	lr 0.02446
Train [12][730/3239]	Time 0.675 (0.884)	Data Time 0.037 (0.029)	Loss 3.6681 (3.6784)	Entropy 1.41791 (1.42316)	Top-1 acc 32.031 (37.389)	Top-5 acc 61.719 (61.387)	lr 0.02446
Train [12][740/3239]	Time 0.651 (0.883)	Data Time 0.001 (0.029)	Loss 3.8094 (3.6790)	Entropy 1.41774 (1.42308)	Top-1 acc 39.844 (37.396)	Top-5 acc 61.719 (61.370)	lr 0.02446
Train [12][750/3239]	Time 0.553 (0.882)	Data Time 0.001 (0.028)	Loss 3.7217 (3.6788)	Entropy 1.41749 (1.42301)	Top-1 acc 38.672 (37.401)	Top-5 acc 58.594 (61.372)	lr 0.02446
Train [12][760/3239]	Time 0.561 (0.882)	Data Time 0.001 (0.028)	Loss 3.7388 (3.6788)	Entropy 1.41743 (1.42294)	Top-1 acc 34.766 (37.393)	Top-5 acc 62.500 (61.370)	lr 0.02446
Train [12][770/3239]	Time 0.518 (0.881)	Data Time 0.001 (0.028)	Loss 3.7274 (3.6790)	Entropy 1.41740 (1.42287)	Top-1 acc 38.672 (37.380)	Top-5 acc 61.328 (61.366)	lr 0.02446
Train [12][780/3239]	Time 0.540 (0.880)	Data Time 0.001 (0.027)	Loss 3.8206 (3.6793)	Entropy 1.41754 (1.42280)	Top-1 acc 33.203 (37.380)	Top-5 acc 58.984 (61.370)	lr 0.02446
Train [12][790/3239]	Time 0.580 (0.879)	Data Time 0.001 (0.027)	Loss 3.7502 (3.6787)	Entropy 1.41737 (1.42273)	Top-1 acc 32.812 (37.380)	Top-5 acc 57.422 (61.377)	lr 0.02446
Train [12][800/3239]	Time 0.417 (0.878)	Data Time 0.002 (0.027)	Loss 3.4537 (3.6786)	Entropy 1.41730 (1.42266)	Top-1 acc 42.188 (37.378)	Top-5 acc 66.016 (61.386)	lr 0.02446
Train [12][810/3239]	Time 0.727 (0.877)	Data Time 0.001 (0.026)	Loss 3.6068 (3.6780)	Entropy 1.41695 (1.42260)	Top-1 acc 41.797 (37.394)	Top-5 acc 59.375 (61.389)	lr 0.02446
Train [12][820/3239]	Time 0.572 (0.877)	Data Time 0.001 (0.026)	Loss 3.7487 (3.6781)	Entropy 1.41678 (1.42253)	Top-1 acc 35.547 (37.402)	Top-5 acc 58.594 (61.386)	lr 0.02446
Train [12][830/3239]	Time 0.593 (0.876)	Data Time 0.001 (0.026)	Loss 3.4576 (3.6786)	Entropy 1.41617 (1.42246)	Top-1 acc 43.359 (37.388)	Top-5 acc 65.625 (61.379)	lr 0.02446
Train [12][840/3239]	Time 0.594 (0.876)	Data Time 0.001 (0.026)	Loss 3.6930 (3.6789)	Entropy 1.41605 (1.42238)	Top-1 acc 36.328 (37.376)	Top-5 acc 62.891 (61.373)	lr 0.02446
Train [12][850/3239]	Time 0.622 (0.875)	Data Time 0.001 (0.025)	Loss 3.7176 (3.6790)	Entropy 1.41599 (1.42231)	Top-1 acc 36.328 (37.373)	Top-5 acc 61.719 (61.364)	lr 0.02446
Train [12][860/3239]	Time 0.568 (0.874)	Data Time 0.001 (0.025)	Loss 3.8299 (3.6791)	Entropy 1.41568 (1.42223)	Top-1 acc 33.203 (37.369)	Top-5 acc 58.203 (61.360)	lr 0.02446
Train [12][870/3239]	Time 0.570 (0.874)	Data Time 0.001 (0.025)	Loss 3.8402 (3.6804)	Entropy 1.41539 (1.42216)	Top-1 acc 29.688 (37.348)	Top-5 acc 55.469 (61.334)	lr 0.02446
Train [12][880/3239]	Time 0.672 (0.874)	Data Time 0.001 (0.025)	Loss 3.7553 (3.6806)	Entropy 1.41505 (1.42208)	Top-1 acc 38.281 (37.334)	Top-5 acc 57.812 (61.326)	lr 0.02446
Train [12][890/3239]	Time 0.622 (0.873)	Data Time 0.001 (0.024)	Loss 3.6193 (3.6805)	Entropy 1.41497 (1.42200)	Top-1 acc 38.672 (37.341)	Top-5 acc 61.328 (61.329)	lr 0.02446
Train [12][900/3239]	Time 0.642 (0.873)	Data Time 0.001 (0.024)	Loss 3.6539 (3.6810)	Entropy 1.41457 (1.42192)	Top-1 acc 37.109 (37.333)	Top-5 acc 62.500 (61.309)	lr 0.02446
Train [12][910/3239]	Time 0.585 (0.872)	Data Time 0.001 (0.024)	Loss 3.7571 (3.6815)	Entropy 1.41448 (1.42184)	Top-1 acc 35.156 (37.325)	Top-5 acc 59.375 (61.300)	lr 0.02446
Train [12][920/3239]	Time 0.623 (0.872)	Data Time 0.001 (0.024)	Loss 3.4706 (3.6807)	Entropy 1.41421 (1.42176)	Top-1 acc 42.188 (37.334)	Top-5 acc 65.234 (61.321)	lr 0.02446
Train [12][930/3239]	Time 0.551 (0.871)	Data Time 0.001 (0.023)	Loss 3.6807 (3.6804)	Entropy 1.41409 (1.42168)	Top-1 acc 39.062 (37.336)	Top-5 acc 62.109 (61.327)	lr 0.02446
Train [12][940/3239]	Time 0.582 (0.871)	Data Time 0.001 (0.023)	Loss 3.8397 (3.6803)	Entropy 1.41384 (1.42160)	Top-1 acc 35.547 (37.335)	Top-5 acc 57.031 (61.347)	lr 0.02446
Train [12][950/3239]	Time 0.688 (0.870)	Data Time 0.002 (0.023)	Loss 3.5382 (3.6806)	Entropy 1.41338 (1.42151)	Top-1 acc 41.406 (37.339)	Top-5 acc 63.672 (61.343)	lr 0.02446
Train [12][960/3239]	Time 0.573 (0.870)	Data Time 0.002 (0.023)	Loss 3.8000 (3.6806)	Entropy 1.41326 (1.42143)	Top-1 acc 36.719 (37.344)	Top-5 acc 58.984 (61.340)	lr 0.02446
Train [12][970/3239]	Time 0.558 (0.869)	Data Time 0.001 (0.022)	Loss 3.7675 (3.6807)	Entropy 1.41315 (1.42134)	Top-1 acc 36.328 (37.349)	Top-5 acc 60.547 (61.339)	lr 0.02446
Train [12][980/3239]	Time 0.617 (0.869)	Data Time 0.001 (0.022)	Loss 3.5174 (3.6803)	Entropy 1.41327 (1.42126)	Top-1 acc 36.719 (37.359)	Top-5 acc 66.797 (61.354)	lr 0.02446
Train [12][990/3239]	Time 0.581 (0.868)	Data Time 0.001 (0.022)	Loss 3.7164 (3.6801)	Entropy 1.41308 (1.42118)	Top-1 acc 36.719 (37.372)	Top-5 acc 58.203 (61.360)	lr 0.02446
Train [12][1000/3239]	Time 0.562 (0.868)	Data Time 0.001 (0.022)	Loss 3.7168 (3.6810)	Entropy 1.41262 (1.42110)	Top-1 acc 36.719 (37.347)	Top-5 acc 59.766 (61.341)	lr 0.02446
Train [12][1010/3239]	Time 0.819 (0.886)	Data Time 0.006 (0.022)	Loss 3.4833 (3.6809)	Entropy 1.41229 (1.42101)	Top-1 acc 41.016 (37.341)	Top-5 acc 63.672 (61.340)	lr 0.02446
Train [12][1020/3239]	Time 0.583 (0.887)	Data Time 0.001 (0.021)	Loss 3.6121 (3.6813)	Entropy 1.41232 (1.42093)	Top-1 acc 38.281 (37.334)	Top-5 acc 62.109 (61.329)	lr 0.02446
Train [12][1030/3239]	Time 0.632 (0.886)	Data Time 0.001 (0.021)	Loss 3.4690 (3.6810)	Entropy 1.41217 (1.42084)	Top-1 acc 38.281 (37.336)	Top-5 acc 64.453 (61.333)	lr 0.02446
Train [12][1040/3239]	Time 0.676 (0.886)	Data Time 0.001 (0.021)	Loss 3.7420 (3.6818)	Entropy 1.41207 (1.42076)	Top-1 acc 38.281 (37.324)	Top-5 acc 60.547 (61.321)	lr 0.02445
Train [12][1050/3239]	Time 0.609 (0.885)	Data Time 0.001 (0.021)	Loss 3.9477 (3.6823)	Entropy 1.41176 (1.42068)	Top-1 acc 35.156 (37.321)	Top-5 acc 55.859 (61.315)	lr 0.02445
Train [12][1060/3239]	Time 0.588 (0.885)	Data Time 0.002 (0.021)	Loss 3.7836 (3.6827)	Entropy 1.41202 (1.42059)	Top-1 acc 35.156 (37.314)	Top-5 acc 60.547 (61.316)	lr 0.02445
Train [12][1070/3239]	Time 0.589 (0.884)	Data Time 0.001 (0.021)	Loss 3.6223 (3.6826)	Entropy 1.41190 (1.42051)	Top-1 acc 38.281 (37.310)	Top-5 acc 61.719 (61.309)	lr 0.02445
Train [12][1080/3239]	Time 0.579 (0.884)	Data Time 0.001 (0.020)	Loss 3.5570 (3.6828)	Entropy 1.41125 (1.42043)	Top-1 acc 39.062 (37.307)	Top-5 acc 66.016 (61.312)	lr 0.02445
Train [12][1090/3239]	Time 0.610 (0.883)	Data Time 0.001 (0.020)	Loss 3.8172 (3.6826)	Entropy 1.41106 (1.42034)	Top-1 acc 36.328 (37.306)	Top-5 acc 57.812 (61.314)	lr 0.02445
Train [12][1100/3239]	Time 0.595 (0.882)	Data Time 0.002 (0.020)	Loss 3.5307 (3.6820)	Entropy 1.41113 (1.42026)	Top-1 acc 40.625 (37.317)	Top-5 acc 61.719 (61.327)	lr 0.02445
Train [12][1110/3239]	Time 0.553 (0.881)	Data Time 0.001 (0.020)	Loss 3.8228 (3.6822)	Entropy 1.41095 (1.42018)	Top-1 acc 36.328 (37.311)	Top-5 acc 58.984 (61.328)	lr 0.02445
Train [12][1120/3239]	Time 0.539 (0.881)	Data Time 0.001 (0.020)	Loss 3.8560 (3.6825)	Entropy 1.41049 (1.42009)	Top-1 acc 30.469 (37.309)	Top-5 acc 59.375 (61.324)	lr 0.02445
Train [12][1130/3239]	Time 0.571 (0.881)	Data Time 0.001 (0.020)	Loss 3.5857 (3.6823)	Entropy 1.41049 (1.42001)	Top-1 acc 39.844 (37.330)	Top-5 acc 66.016 (61.328)	lr 0.02445
Train [12][1140/3239]	Time 0.584 (0.880)	Data Time 0.001 (0.019)	Loss 3.7192 (3.6821)	Entropy 1.41025 (1.41993)	Top-1 acc 35.938 (37.327)	Top-5 acc 58.594 (61.324)	lr 0.02445
Train [12][1150/3239]	Time 0.565 (0.880)	Data Time 0.001 (0.019)	Loss 3.6323 (3.6822)	Entropy 1.41004 (1.41984)	Top-1 acc 43.359 (37.333)	Top-5 acc 63.672 (61.319)	lr 0.02445
Train [12][1160/3239]	Time 0.543 (0.880)	Data Time 0.001 (0.019)	Loss 3.6456 (3.6826)	Entropy 1.40995 (1.41976)	Top-1 acc 39.453 (37.325)	Top-5 acc 62.500 (61.311)	lr 0.02445
Train [12][1170/3239]	Time 0.548 (0.879)	Data Time 0.001 (0.019)	Loss 3.6092 (3.6819)	Entropy 1.40982 (1.41967)	Top-1 acc 40.234 (37.336)	Top-5 acc 63.672 (61.325)	lr 0.02445
Train [12][1180/3239]	Time 0.630 (0.879)	Data Time 0.001 (0.019)	Loss 3.7772 (3.6822)	Entropy 1.40978 (1.41959)	Top-1 acc 31.250 (37.335)	Top-5 acc 62.109 (61.325)	lr 0.02445
Train [12][1190/3239]	Time 0.598 (0.878)	Data Time 0.001 (0.019)	Loss 3.6795 (3.6827)	Entropy 1.40944 (1.41950)	Top-1 acc 37.109 (37.331)	Top-5 acc 60.547 (61.310)	lr 0.02445
Train [12][1200/3239]	Time 0.614 (0.878)	Data Time 0.001 (0.019)	Loss 3.6767 (3.6829)	Entropy 1.40919 (1.41942)	Top-1 acc 37.891 (37.333)	Top-5 acc 65.234 (61.303)	lr 0.02445
Train [12][1210/3239]	Time 0.642 (0.878)	Data Time 0.002 (0.018)	Loss 3.5975 (3.6826)	Entropy 1.40919 (1.41933)	Top-1 acc 37.891 (37.340)	Top-5 acc 61.328 (61.314)	lr 0.02445
Train [12][1220/3239]	Time 0.588 (0.877)	Data Time 0.001 (0.018)	Loss 3.6696 (3.6817)	Entropy 1.40926 (1.41925)	Top-1 acc 35.547 (37.363)	Top-5 acc 60.938 (61.330)	lr 0.02445
Train [12][1230/3239]	Time 0.565 (0.877)	Data Time 0.001 (0.018)	Loss 3.7245 (3.6814)	Entropy 1.40902 (1.41917)	Top-1 acc 37.500 (37.371)	Top-5 acc 57.031 (61.334)	lr 0.02445
Train [12][1240/3239]	Time 0.570 (0.876)	Data Time 0.001 (0.018)	Loss 3.7303 (3.6812)	Entropy 1.40894 (1.41909)	Top-1 acc 36.719 (37.379)	Top-5 acc 61.719 (61.348)	lr 0.02445
Train [12][1250/3239]	Time 0.697 (0.876)	Data Time 0.001 (0.018)	Loss 3.4640 (3.6809)	Entropy 1.40874 (1.41901)	Top-1 acc 39.453 (37.376)	Top-5 acc 64.062 (61.356)	lr 0.02445
Train [12][1260/3239]	Time 0.548 (0.875)	Data Time 0.001 (0.018)	Loss 3.8060 (3.6805)	Entropy 1.40866 (1.41893)	Top-1 acc 32.422 (37.390)	Top-5 acc 58.203 (61.371)	lr 0.02445
Train [12][1270/3239]	Time 0.599 (0.875)	Data Time 0.001 (0.018)	Loss 3.6231 (3.6803)	Entropy 1.40855 (1.41884)	Top-1 acc 38.672 (37.395)	Top-5 acc 61.328 (61.373)	lr 0.02445
Train [12][1280/3239]	Time 0.565 (0.875)	Data Time 0.001 (0.018)	Loss 3.5961 (3.6799)	Entropy 1.40811 (1.41876)	Top-1 acc 36.328 (37.406)	Top-5 acc 63.672 (61.384)	lr 0.02445
Train [12][1290/3239]	Time 0.571 (0.874)	Data Time 0.001 (0.017)	Loss 3.6939 (3.6796)	Entropy 1.40804 (1.41868)	Top-1 acc 39.844 (37.413)	Top-5 acc 62.109 (61.390)	lr 0.02445
Train [12][1300/3239]	Time 0.583 (0.874)	Data Time 0.001 (0.017)	Loss 3.6057 (3.6795)	Entropy 1.40783 (1.41860)	Top-1 acc 37.109 (37.415)	Top-5 acc 61.328 (61.392)	lr 0.02445
Train [12][1310/3239]	Time 0.631 (0.873)	Data Time 0.002 (0.017)	Loss 3.5683 (3.6798)	Entropy 1.40733 (1.41851)	Top-1 acc 40.234 (37.412)	Top-5 acc 64.453 (61.385)	lr 0.02445
Train [12][1320/3239]	Time 0.671 (0.873)	Data Time 0.001 (0.017)	Loss 3.7141 (3.6801)	Entropy 1.40699 (1.41843)	Top-1 acc 34.766 (37.397)	Top-5 acc 62.500 (61.381)	lr 0.02445
Train [12][1330/3239]	Time 0.603 (0.873)	Data Time 0.002 (0.017)	Loss 3.4064 (3.6799)	Entropy 1.40704 (1.41834)	Top-1 acc 43.750 (37.402)	Top-5 acc 68.750 (61.389)	lr 0.02445
Train [12][1340/3239]	Time 0.472 (0.872)	Data Time 0.001 (0.017)	Loss 3.7363 (3.6801)	Entropy 1.40674 (1.41826)	Top-1 acc 30.859 (37.393)	Top-5 acc 63.281 (61.389)	lr 0.02445
Train [12][1350/3239]	Time 0.580 (0.872)	Data Time 0.001 (0.017)	Loss 3.5645 (3.6801)	Entropy 1.40636 (1.41817)	Top-1 acc 37.500 (37.391)	Top-5 acc 60.938 (61.385)	lr 0.02445
Train [12][1360/3239]	Time 0.597 (0.872)	Data Time 0.001 (0.017)	Loss 3.4492 (3.6805)	Entropy 1.40637 (1.41808)	Top-1 acc 41.797 (37.385)	Top-5 acc 67.578 (61.386)	lr 0.02445
Train [12][1370/3239]	Time 0.561 (0.871)	Data Time 0.001 (0.017)	Loss 3.6392 (3.6806)	Entropy 1.40601 (1.41800)	Top-1 acc 37.891 (37.378)	Top-5 acc 64.453 (61.387)	lr 0.02445
Train [12][1380/3239]	Time 0.589 (0.871)	Data Time 0.001 (0.017)	Loss 3.5796 (3.6804)	Entropy 1.40613 (1.41791)	Top-1 acc 41.797 (37.383)	Top-5 acc 62.500 (61.394)	lr 0.02444
Train [12][1390/3239]	Time 0.571 (0.871)	Data Time 0.001 (0.016)	Loss 3.6072 (3.6802)	Entropy 1.40590 (1.41783)	Top-1 acc 39.453 (37.389)	Top-5 acc 64.844 (61.402)	lr 0.02444
Train [12][1400/3239]	Time 0.588 (0.870)	Data Time 0.001 (0.016)	Loss 3.7209 (3.6800)	Entropy 1.40555 (1.41774)	Top-1 acc 36.328 (37.392)	Top-5 acc 60.156 (61.410)	lr 0.02444
Train [12][1410/3239]	Time 0.587 (0.870)	Data Time 0.001 (0.016)	Loss 3.7384 (3.6797)	Entropy 1.40519 (1.41765)	Top-1 acc 33.594 (37.402)	Top-5 acc 60.547 (61.414)	lr 0.02444
Train [12][1420/3239]	Time 0.568 (0.870)	Data Time 0.001 (0.016)	Loss 3.9007 (3.6793)	Entropy 1.40503 (1.41756)	Top-1 acc 33.594 (37.416)	Top-5 acc 57.812 (61.430)	lr 0.02444
Train [12][1430/3239]	Time 0.593 (0.869)	Data Time 0.001 (0.016)	Loss 3.6186 (3.6792)	Entropy 1.40461 (1.41748)	Top-1 acc 38.281 (37.418)	Top-5 acc 64.062 (61.432)	lr 0.02444
Train [12][1440/3239]	Time 0.632 (0.869)	Data Time 0.002 (0.016)	Loss 3.5587 (3.6797)	Entropy 1.40430 (1.41739)	Top-1 acc 42.578 (37.409)	Top-5 acc 60.547 (61.415)	lr 0.02444
Train [12][1450/3239]	Time 0.575 (0.868)	Data Time 0.001 (0.016)	Loss 3.5522 (3.6796)	Entropy 1.40436 (1.41730)	Top-1 acc 42.578 (37.408)	Top-5 acc 63.672 (61.413)	lr 0.02444
Train [12][1460/3239]	Time 0.492 (0.868)	Data Time 0.001 (0.016)	Loss 3.7763 (3.6797)	Entropy 1.40430 (1.41721)	Top-1 acc 35.156 (37.401)	Top-5 acc 59.375 (61.413)	lr 0.02444
Train [12][1470/3239]	Time 0.524 (0.867)	Data Time 0.001 (0.016)	Loss 3.6963 (3.6801)	Entropy 1.40449 (1.41712)	Top-1 acc 39.453 (37.393)	Top-5 acc 62.109 (61.409)	lr 0.02444
Train [12][1480/3239]	Time 0.738 (0.867)	Data Time 0.001 (0.016)	Loss 3.6408 (3.6804)	Entropy 1.40425 (1.41703)	Top-1 acc 35.156 (37.385)	Top-5 acc 61.719 (61.405)	lr 0.02444
Train [12][1490/3239]	Time 0.580 (0.867)	Data Time 0.001 (0.015)	Loss 3.7588 (3.6803)	Entropy 1.40395 (1.41695)	Top-1 acc 37.500 (37.394)	Top-5 acc 59.766 (61.405)	lr 0.02444
Train [12][1500/3239]	Time 0.596 (0.867)	Data Time 0.001 (0.015)	Loss 3.6160 (3.6799)	Entropy 1.40368 (1.41686)	Top-1 acc 39.453 (37.394)	Top-5 acc 65.625 (61.413)	lr 0.02444
Train [12][1510/3239]	Time 0.577 (0.867)	Data Time 0.001 (0.015)	Loss 3.6517 (3.6794)	Entropy 1.40361 (1.41677)	Top-1 acc 36.719 (37.399)	Top-5 acc 63.281 (61.426)	lr 0.02444
Train [12][1520/3239]	Time 0.615 (0.867)	Data Time 0.001 (0.015)	Loss 3.6503 (3.6798)	Entropy 1.40364 (1.41669)	Top-1 acc 33.203 (37.381)	Top-5 acc 62.500 (61.418)	lr 0.02444
Train [12][1530/3239]	Time 0.562 (0.866)	Data Time 0.001 (0.015)	Loss 3.6535 (3.6793)	Entropy 1.40360 (1.41660)	Top-1 acc 42.188 (37.395)	Top-5 acc 61.328 (61.426)	lr 0.02444
Train [12][1540/3239]	Time 0.592 (0.866)	Data Time 0.001 (0.015)	Loss 3.7351 (3.6788)	Entropy 1.40349 (1.41652)	Top-1 acc 33.594 (37.401)	Top-5 acc 57.422 (61.435)	lr 0.02444
Train [12][1550/3239]	Time 0.634 (0.866)	Data Time 0.001 (0.015)	Loss 3.6998 (3.6789)	Entropy 1.40355 (1.41643)	Top-1 acc 38.281 (37.401)	Top-5 acc 62.109 (61.433)	lr 0.02444
Train [12][1560/3239]	Time 0.598 (0.866)	Data Time 0.001 (0.015)	Loss 3.6329 (3.6788)	Entropy 1.40351 (1.41635)	Top-1 acc 34.766 (37.400)	Top-5 acc 62.109 (61.434)	lr 0.02444
Train [12][1570/3239]	Time 0.542 (0.865)	Data Time 0.001 (0.015)	Loss 3.6150 (3.6789)	Entropy 1.40297 (1.41627)	Top-1 acc 36.719 (37.394)	Top-5 acc 62.500 (61.433)	lr 0.02444
Train [12][1580/3239]	Time 0.607 (0.865)	Data Time 0.001 (0.015)	Loss 3.6720 (3.6789)	Entropy 1.40276 (1.41618)	Top-1 acc 37.500 (37.393)	Top-5 acc 62.500 (61.436)	lr 0.02444
Train [12][1590/3239]	Time 0.611 (0.865)	Data Time 0.003 (0.015)	Loss 3.6752 (3.6785)	Entropy 1.40262 (1.41610)	Top-1 acc 39.062 (37.396)	Top-5 acc 60.938 (61.445)	lr 0.02444
Train [12][1600/3239]	Time 0.596 (0.865)	Data Time 0.001 (0.014)	Loss 3.8082 (3.6783)	Entropy 1.40248 (1.41601)	Top-1 acc 36.328 (37.399)	Top-5 acc 60.547 (61.455)	lr 0.02444
Train [12][1610/3239]	Time 0.633 (0.864)	Data Time 0.002 (0.014)	Loss 3.4748 (3.6778)	Entropy 1.40215 (1.41593)	Top-1 acc 39.062 (37.410)	Top-5 acc 64.453 (61.466)	lr 0.02444
Train [12][1620/3239]	Time 0.510 (0.864)	Data Time 0.001 (0.014)	Loss 3.5601 (3.6777)	Entropy 1.40174 (1.41584)	Top-1 acc 34.766 (37.407)	Top-5 acc 62.109 (61.469)	lr 0.02444
Train [12][1630/3239]	Time 0.589 (0.864)	Data Time 0.001 (0.014)	Loss 3.6585 (3.6773)	Entropy 1.40153 (1.41576)	Top-1 acc 37.500 (37.415)	Top-5 acc 59.766 (61.479)	lr 0.02444
Train [12][1640/3239]	Time 0.587 (0.863)	Data Time 0.001 (0.014)	Loss 3.8118 (3.6770)	Entropy 1.40154 (1.41567)	Top-1 acc 36.328 (37.419)	Top-5 acc 61.719 (61.485)	lr 0.02444
Train [12][1650/3239]	Time 0.578 (0.863)	Data Time 0.001 (0.014)	Loss 3.6253 (3.6770)	Entropy 1.40119 (1.41558)	Top-1 acc 34.766 (37.415)	Top-5 acc 62.109 (61.486)	lr 0.02444
Train [12][1660/3239]	Time 0.573 (0.863)	Data Time 0.001 (0.014)	Loss 3.7410 (3.6772)	Entropy 1.40144 (1.41550)	Top-1 acc 38.672 (37.417)	Top-5 acc 62.109 (61.486)	lr 0.02444
Train [12][1670/3239]	Time 0.563 (0.874)	Data Time 0.002 (0.014)	Loss 3.8247 (3.6772)	Entropy 1.40159 (1.41541)	Top-1 acc 33.594 (37.417)	Top-5 acc 58.984 (61.489)	lr 0.02444
Train [12][1680/3239]	Time 0.608 (0.874)	Data Time 0.002 (0.014)	Loss 3.3559 (3.6770)	Entropy 1.40140 (1.41533)	Top-1 acc 48.047 (37.423)	Top-5 acc 69.922 (61.492)	lr 0.02444
Train [12][1690/3239]	Time 0.692 (0.874)	Data Time 0.001 (0.014)	Loss 3.7462 (3.6775)	Entropy 1.40099 (1.41525)	Top-1 acc 33.594 (37.408)	Top-5 acc 58.203 (61.480)	lr 0.02444
Train [12][1700/3239]	Time 0.591 (0.874)	Data Time 0.001 (0.014)	Loss 3.7793 (3.6771)	Entropy 1.40066 (1.41516)	Top-1 acc 33.594 (37.413)	Top-5 acc 56.641 (61.489)	lr 0.02444
Train [12][1710/3239]	Time 0.633 (0.873)	Data Time 0.001 (0.014)	Loss 3.4736 (3.6767)	Entropy 1.40042 (1.41508)	Top-1 acc 41.016 (37.415)	Top-5 acc 65.625 (61.498)	lr 0.02444
Train [12][1720/3239]	Time 0.624 (0.873)	Data Time 0.001 (0.014)	Loss 3.6516 (3.6768)	Entropy 1.39997 (1.41499)	Top-1 acc 41.797 (37.420)	Top-5 acc 62.891 (61.493)	lr 0.02443
Train [12][1730/3239]	Time 0.601 (0.873)	Data Time 0.002 (0.014)	Loss 3.5056 (3.6764)	Entropy 1.39985 (1.41490)	Top-1 acc 39.062 (37.432)	Top-5 acc 66.016 (61.509)	lr 0.02443
Train [12][1740/3239]	Time 0.598 (0.873)	Data Time 0.001 (0.014)	Loss 3.7735 (3.6766)	Entropy 1.39956 (1.41482)	Top-1 acc 36.328 (37.429)	Top-5 acc 58.594 (61.502)	lr 0.02443
Train [12][1750/3239]	Time 0.580 (0.872)	Data Time 0.001 (0.013)	Loss 3.5074 (3.6760)	Entropy 1.39962 (1.41473)	Top-1 acc 42.188 (37.442)	Top-5 acc 64.453 (61.514)	lr 0.02443
Train [12][1760/3239]	Time 0.659 (0.872)	Data Time 0.001 (0.013)	Loss 3.8431 (3.6761)	Entropy 1.39953 (1.41464)	Top-1 acc 33.203 (37.441)	Top-5 acc 56.641 (61.512)	lr 0.02443
Train [12][1770/3239]	Time 0.614 (0.872)	Data Time 0.001 (0.013)	Loss 3.5301 (3.6761)	Entropy 1.39942 (1.41456)	Top-1 acc 39.844 (37.434)	Top-5 acc 64.453 (61.509)	lr 0.02443
Train [12][1780/3239]	Time 0.546 (0.871)	Data Time 0.001 (0.013)	Loss 3.7571 (3.6760)	Entropy 1.39943 (1.41447)	Top-1 acc 34.766 (37.437)	Top-5 acc 57.812 (61.511)	lr 0.02443
Train [12][1790/3239]	Time 0.571 (0.871)	Data Time 0.001 (0.013)	Loss 3.6919 (3.6761)	Entropy 1.39904 (1.41439)	Top-1 acc 37.891 (37.439)	Top-5 acc 62.109 (61.506)	lr 0.02443
Train [12][1800/3239]	Time 0.604 (0.871)	Data Time 0.001 (0.013)	Loss 3.2892 (3.6759)	Entropy 1.39903 (1.41430)	Top-1 acc 42.188 (37.444)	Top-5 acc 69.531 (61.509)	lr 0.02443
Train [12][1810/3239]	Time 0.624 (0.871)	Data Time 0.001 (0.013)	Loss 3.7132 (3.6758)	Entropy 1.39862 (1.41422)	Top-1 acc 39.453 (37.448)	Top-5 acc 58.984 (61.508)	lr 0.02443
Train [12][1820/3239]	Time 0.635 (0.871)	Data Time 0.001 (0.013)	Loss 3.5963 (3.6756)	Entropy 1.39830 (1.41413)	Top-1 acc 40.625 (37.453)	Top-5 acc 61.719 (61.515)	lr 0.02443
Train [12][1830/3239]	Time 0.635 (0.871)	Data Time 0.001 (0.013)	Loss 3.6847 (3.6755)	Entropy 1.39805 (1.41405)	Top-1 acc 39.062 (37.453)	Top-5 acc 64.062 (61.520)	lr 0.02443
Train [12][1840/3239]	Time 0.564 (0.870)	Data Time 0.001 (0.013)	Loss 3.6910 (3.6759)	Entropy 1.39794 (1.41396)	Top-1 acc 41.016 (37.448)	Top-5 acc 61.328 (61.511)	lr 0.02443
Train [12][1850/3239]	Time 0.577 (0.870)	Data Time 0.002 (0.013)	Loss 3.7902 (3.6760)	Entropy 1.39742 (1.41387)	Top-1 acc 33.203 (37.446)	Top-5 acc 61.328 (61.509)	lr 0.02443
Train [12][1860/3239]	Time 0.600 (0.870)	Data Time 0.001 (0.013)	Loss 3.7345 (3.6759)	Entropy 1.39689 (1.41378)	Top-1 acc 38.281 (37.452)	Top-5 acc 62.109 (61.513)	lr 0.02443
Train [12][1870/3239]	Time 0.581 (0.870)	Data Time 0.001 (0.013)	Loss 3.7629 (3.6756)	Entropy 1.39668 (1.41369)	Top-1 acc 34.766 (37.452)	Top-5 acc 59.375 (61.520)	lr 0.02443
Train [12][1880/3239]	Time 0.609 (0.870)	Data Time 0.001 (0.013)	Loss 3.5876 (3.6752)	Entropy 1.39615 (1.41360)	Top-1 acc 41.797 (37.465)	Top-5 acc 60.938 (61.528)	lr 0.02443
Train [12][1890/3239]	Time 0.565 (0.870)	Data Time 0.001 (0.013)	Loss 3.5852 (3.6751)	Entropy 1.39587 (1.41351)	Top-1 acc 37.109 (37.464)	Top-5 acc 64.453 (61.531)	lr 0.02443
Train [12][1900/3239]	Time 0.621 (0.869)	Data Time 0.001 (0.013)	Loss 3.7609 (3.6751)	Entropy 1.39545 (1.41341)	Top-1 acc 35.547 (37.462)	Top-5 acc 57.031 (61.529)	lr 0.02443
Train [12][1910/3239]	Time 0.541 (0.869)	Data Time 0.001 (0.012)	Loss 3.5862 (3.6750)	Entropy 1.39570 (1.41332)	Top-1 acc 37.891 (37.463)	Top-5 acc 61.328 (61.526)	lr 0.02443
Train [12][1920/3239]	Time 0.608 (0.869)	Data Time 0.001 (0.012)	Loss 3.6094 (3.6746)	Entropy 1.39545 (1.41323)	Top-1 acc 37.891 (37.473)	Top-5 acc 61.328 (61.538)	lr 0.02443
Train [12][1930/3239]	Time 0.552 (0.869)	Data Time 0.001 (0.012)	Loss 3.4338 (3.6749)	Entropy 1.39526 (1.41313)	Top-1 acc 45.703 (37.470)	Top-5 acc 64.453 (61.530)	lr 0.02443
Train [12][1940/3239]	Time 0.626 (0.868)	Data Time 0.001 (0.012)	Loss 3.7377 (3.6750)	Entropy 1.39505 (1.41304)	Top-1 acc 35.938 (37.467)	Top-5 acc 62.109 (61.537)	lr 0.02443
Train [12][1950/3239]	Time 0.537 (0.868)	Data Time 0.001 (0.012)	Loss 3.7242 (3.6752)	Entropy 1.39535 (1.41295)	Top-1 acc 38.281 (37.468)	Top-5 acc 64.453 (61.532)	lr 0.02443
Train [12][1960/3239]	Time 0.589 (0.867)	Data Time 0.001 (0.012)	Loss 3.6190 (3.6751)	Entropy 1.39522 (1.41286)	Top-1 acc 39.844 (37.470)	Top-5 acc 60.547 (61.534)	lr 0.02443
Train [12][1970/3239]	Time 0.599 (0.867)	Data Time 0.001 (0.012)	Loss 3.6211 (3.6751)	Entropy 1.39496 (1.41277)	Top-1 acc 39.062 (37.466)	Top-5 acc 63.672 (61.534)	lr 0.02443
Train [12][1980/3239]	Time 0.510 (0.867)	Data Time 0.001 (0.012)	Loss 3.7188 (3.6752)	Entropy 1.39461 (1.41268)	Top-1 acc 37.891 (37.465)	Top-5 acc 61.719 (61.530)	lr 0.02443
Train [12][1990/3239]	Time 0.579 (0.867)	Data Time 0.001 (0.012)	Loss 3.5754 (3.6747)	Entropy 1.39458 (1.41259)	Top-1 acc 36.328 (37.473)	Top-5 acc 67.578 (61.541)	lr 0.02443
Train [12][2000/3239]	Time 0.570 (0.867)	Data Time 0.001 (0.012)	Loss 3.5066 (3.6744)	Entropy 1.39456 (1.41250)	Top-1 acc 37.891 (37.475)	Top-5 acc 65.625 (61.547)	lr 0.02443
Train [12][2010/3239]	Time 0.547 (0.867)	Data Time 0.001 (0.012)	Loss 3.6525 (3.6742)	Entropy 1.39438 (1.41241)	Top-1 acc 38.281 (37.475)	Top-5 acc 62.891 (61.551)	lr 0.02443
Train [12][2020/3239]	Time 0.624 (0.866)	Data Time 0.001 (0.012)	Loss 3.7191 (3.6740)	Entropy 1.39412 (1.41232)	Top-1 acc 35.938 (37.480)	Top-5 acc 60.547 (61.557)	lr 0.02443
Train [12][2030/3239]	Time 0.634 (0.866)	Data Time 0.001 (0.012)	Loss 3.7583 (3.6739)	Entropy 1.39416 (1.41223)	Top-1 acc 32.812 (37.480)	Top-5 acc 61.719 (61.556)	lr 0.02443
Train [12][2040/3239]	Time 0.616 (0.866)	Data Time 0.001 (0.012)	Loss 3.6182 (3.6739)	Entropy 1.39411 (1.41214)	Top-1 acc 38.672 (37.483)	Top-5 acc 63.281 (61.553)	lr 0.02443
Train [12][2050/3239]	Time 0.604 (0.866)	Data Time 0.001 (0.012)	Loss 3.5485 (3.6738)	Entropy 1.39425 (1.41205)	Top-1 acc 41.016 (37.484)	Top-5 acc 64.062 (61.554)	lr 0.02442
Train [12][2060/3239]	Time 0.654 (0.866)	Data Time 0.001 (0.012)	Loss 3.5628 (3.6740)	Entropy 1.39421 (1.41197)	Top-1 acc 43.359 (37.485)	Top-5 acc 64.453 (61.551)	lr 0.02442
Train [12][2070/3239]	Time 0.619 (0.866)	Data Time 0.001 (0.012)	Loss 3.5085 (3.6735)	Entropy 1.39411 (1.41188)	Top-1 acc 41.016 (37.489)	Top-5 acc 64.062 (61.566)	lr 0.02442
Train [12][2080/3239]	Time 0.578 (0.865)	Data Time 0.001 (0.012)	Loss 3.7708 (3.6737)	Entropy 1.39385 (1.41180)	Top-1 acc 34.375 (37.489)	Top-5 acc 59.375 (61.558)	lr 0.02442
Train [12][2090/3239]	Time 0.480 (0.865)	Data Time 0.001 (0.012)	Loss 3.4726 (3.6738)	Entropy 1.39371 (1.41171)	Top-1 acc 39.453 (37.482)	Top-5 acc 62.109 (61.556)	lr 0.02442
Train [12][2100/3239]	Time 0.586 (0.865)	Data Time 0.001 (0.012)	Loss 3.5883 (3.6738)	Entropy 1.39360 (1.41162)	Top-1 acc 37.891 (37.479)	Top-5 acc 62.891 (61.557)	lr 0.02442
Train [12][2110/3239]	Time 0.555 (0.865)	Data Time 0.001 (0.012)	Loss 3.6325 (3.6738)	Entropy 1.39346 (1.41154)	Top-1 acc 35.547 (37.477)	Top-5 acc 60.938 (61.559)	lr 0.02442
Train [12][2120/3239]	Time 0.559 (0.864)	Data Time 0.001 (0.011)	Loss 3.8664 (3.6737)	Entropy 1.39344 (1.41145)	Top-1 acc 34.766 (37.481)	Top-5 acc 58.594 (61.558)	lr 0.02442
Train [12][2130/3239]	Time 0.750 (0.864)	Data Time 0.001 (0.011)	Loss 3.8390 (3.6736)	Entropy 1.39324 (1.41137)	Top-1 acc 30.859 (37.479)	Top-5 acc 58.594 (61.559)	lr 0.02442
Train [12][2140/3239]	Time 0.587 (0.864)	Data Time 0.001 (0.011)	Loss 3.4572 (3.6734)	Entropy 1.39291 (1.41128)	Top-1 acc 42.578 (37.478)	Top-5 acc 67.969 (61.567)	lr 0.02442
Train [12][2150/3239]	Time 0.572 (0.864)	Data Time 0.001 (0.011)	Loss 3.6649 (3.6737)	Entropy 1.39298 (1.41120)	Top-1 acc 37.891 (37.468)	Top-5 acc 64.453 (61.560)	lr 0.02442
Train [12][2160/3239]	Time 0.557 (0.863)	Data Time 0.001 (0.011)	Loss 3.7532 (3.6738)	Entropy 1.39282 (1.41111)	Top-1 acc 34.766 (37.463)	Top-5 acc 58.984 (61.561)	lr 0.02442
Train [12][2170/3239]	Time 0.562 (0.863)	Data Time 0.001 (0.011)	Loss 3.7472 (3.6737)	Entropy 1.39261 (1.41103)	Top-1 acc 36.719 (37.467)	Top-5 acc 61.719 (61.565)	lr 0.02442
Train [12][2180/3239]	Time 0.603 (0.863)	Data Time 0.001 (0.011)	Loss 3.9934 (3.6736)	Entropy 1.39264 (1.41094)	Top-1 acc 31.250 (37.467)	Top-5 acc 52.734 (61.568)	lr 0.02442
Train [12][2190/3239]	Time 0.547 (0.863)	Data Time 0.001 (0.011)	Loss 3.5501 (3.6736)	Entropy 1.39243 (1.41086)	Top-1 acc 39.453 (37.464)	Top-5 acc 66.406 (61.569)	lr 0.02442
Train [12][2200/3239]	Time 0.696 (0.863)	Data Time 0.001 (0.011)	Loss 3.5513 (3.6734)	Entropy 1.39279 (1.41078)	Top-1 acc 40.625 (37.474)	Top-5 acc 65.234 (61.575)	lr 0.02442
Train [12][2210/3239]	Time 0.550 (0.863)	Data Time 0.001 (0.011)	Loss 3.7880 (3.6736)	Entropy 1.39270 (1.41070)	Top-1 acc 37.891 (37.470)	Top-5 acc 62.109 (61.572)	lr 0.02442
Train [12][2220/3239]	Time 0.579 (0.863)	Data Time 0.001 (0.011)	Loss 3.5992 (3.6737)	Entropy 1.39239 (1.41061)	Top-1 acc 35.938 (37.467)	Top-5 acc 62.891 (61.567)	lr 0.02442
Train [12][2230/3239]	Time 0.522 (0.863)	Data Time 0.001 (0.011)	Loss 3.7066 (3.6735)	Entropy 1.39215 (1.41053)	Top-1 acc 34.766 (37.466)	Top-5 acc 59.766 (61.569)	lr 0.02442
Train [12][2240/3239]	Time 0.595 (0.862)	Data Time 0.001 (0.011)	Loss 3.5139 (3.6738)	Entropy 1.39193 (1.41045)	Top-1 acc 40.234 (37.460)	Top-5 acc 63.281 (61.562)	lr 0.02442
Train [12][2250/3239]	Time 0.622 (0.862)	Data Time 0.001 (0.011)	Loss 3.7667 (3.6739)	Entropy 1.39158 (1.41037)	Top-1 acc 37.109 (37.460)	Top-5 acc 61.719 (61.561)	lr 0.02442
Train [12][2260/3239]	Time 0.618 (0.862)	Data Time 0.001 (0.011)	Loss 3.5671 (3.6738)	Entropy 1.39141 (1.41028)	Top-1 acc 40.234 (37.465)	Top-5 acc 61.328 (61.563)	lr 0.02442
Train [12][2270/3239]	Time 0.675 (0.862)	Data Time 0.002 (0.011)	Loss 3.7977 (3.6741)	Entropy 1.39120 (1.41020)	Top-1 acc 35.547 (37.459)	Top-5 acc 54.688 (61.558)	lr 0.02442
Train [12][2280/3239]	Time 0.572 (0.862)	Data Time 0.002 (0.011)	Loss 3.6459 (3.6741)	Entropy 1.39114 (1.41012)	Top-1 acc 38.672 (37.458)	Top-5 acc 62.500 (61.558)	lr 0.02442
Train [12][2290/3239]	Time 0.464 (0.862)	Data Time 0.001 (0.011)	Loss 3.7244 (3.6739)	Entropy 1.39114 (1.41003)	Top-1 acc 38.672 (37.462)	Top-5 acc 61.719 (61.560)	lr 0.02442
Train [12][2300/3239]	Time 0.577 (0.861)	Data Time 0.001 (0.011)	Loss 3.6258 (3.6739)	Entropy 1.39084 (1.40995)	Top-1 acc 36.719 (37.461)	Top-5 acc 61.719 (61.560)	lr 0.02442
Train [12][2310/3239]	Time 0.557 (0.861)	Data Time 0.001 (0.011)	Loss 3.8031 (3.6736)	Entropy 1.39123 (1.40987)	Top-1 acc 36.328 (37.464)	Top-5 acc 54.297 (61.562)	lr 0.02442
Train [12][2320/3239]	Time 0.762 (0.870)	Data Time 0.005 (0.011)	Loss 3.9205 (3.6739)	Entropy 1.39106 (1.40979)	Top-1 acc 33.984 (37.459)	Top-5 acc 54.688 (61.558)	lr 0.02442
Train [12][2330/3239]	Time 0.549 (0.870)	Data Time 0.002 (0.011)	Loss 3.8792 (3.6739)	Entropy 1.39111 (1.40971)	Top-1 acc 33.203 (37.459)	Top-5 acc 55.078 (61.552)	lr 0.02442
Train [12][2340/3239]	Time 0.615 (0.870)	Data Time 0.002 (0.011)	Loss 3.5282 (3.6739)	Entropy 1.39120 (1.40963)	Top-1 acc 39.844 (37.459)	Top-5 acc 63.672 (61.550)	lr 0.02442
Train [12][2350/3239]	Time 0.591 (0.869)	Data Time 0.001 (0.011)	Loss 3.5995 (3.6739)	Entropy 1.39118 (1.40955)	Top-1 acc 39.844 (37.459)	Top-5 acc 62.500 (61.552)	lr 0.02442
Train [12][2360/3239]	Time 0.553 (0.869)	Data Time 0.001 (0.011)	Loss 3.5957 (3.6739)	Entropy 1.39078 (1.40947)	Top-1 acc 40.625 (37.464)	Top-5 acc 60.938 (61.548)	lr 0.02442
Train [12][2370/3239]	Time 0.594 (0.869)	Data Time 0.002 (0.010)	Loss 3.4909 (3.6737)	Entropy 1.39074 (1.40939)	Top-1 acc 42.969 (37.467)	Top-5 acc 62.500 (61.552)	lr 0.02442
Train [12][2380/3239]	Time 0.609 (0.869)	Data Time 0.001 (0.010)	Loss 3.6369 (3.6739)	Entropy 1.39114 (1.40932)	Top-1 acc 40.625 (37.466)	Top-5 acc 62.109 (61.548)	lr 0.02441
Train [12][2390/3239]	Time 0.612 (0.869)	Data Time 0.001 (0.010)	Loss 3.7270 (3.6736)	Entropy 1.39104 (1.40924)	Top-1 acc 34.766 (37.472)	Top-5 acc 59.766 (61.551)	lr 0.02441
Train [12][2400/3239]	Time 0.564 (0.869)	Data Time 0.001 (0.010)	Loss 3.8089 (3.6734)	Entropy 1.39095 (1.40916)	Top-1 acc 34.375 (37.479)	Top-5 acc 59.766 (61.556)	lr 0.02441
Train [12][2410/3239]	Time 0.599 (0.868)	Data Time 0.001 (0.010)	Loss 3.6345 (3.6733)	Entropy 1.39094 (1.40909)	Top-1 acc 38.672 (37.479)	Top-5 acc 60.547 (61.562)	lr 0.02441
Train [12][2420/3239]	Time 0.573 (0.868)	Data Time 0.001 (0.010)	Loss 3.7858 (3.6733)	Entropy 1.39072 (1.40901)	Top-1 acc 36.328 (37.476)	Top-5 acc 60.547 (61.562)	lr 0.02441
Train [12][2430/3239]	Time 0.687 (0.868)	Data Time 0.001 (0.010)	Loss 3.4679 (3.6736)	Entropy 1.39070 (1.40894)	Top-1 acc 43.359 (37.472)	Top-5 acc 63.672 (61.556)	lr 0.02441
Train [12][2440/3239]	Time 0.565 (0.868)	Data Time 0.001 (0.010)	Loss 3.6385 (3.6737)	Entropy 1.39064 (1.40886)	Top-1 acc 36.719 (37.468)	Top-5 acc 62.891 (61.548)	lr 0.02441
Train [12][2450/3239]	Time 0.597 (0.868)	Data Time 0.001 (0.010)	Loss 3.7730 (3.6735)	Entropy 1.39088 (1.40879)	Top-1 acc 36.328 (37.477)	Top-5 acc 60.547 (61.551)	lr 0.02441
Train [12][2460/3239]	Time 0.563 (0.868)	Data Time 0.001 (0.010)	Loss 3.6436 (3.6735)	Entropy 1.39064 (1.40871)	Top-1 acc 40.234 (37.474)	Top-5 acc 62.891 (61.554)	lr 0.02441
Train [12][2470/3239]	Time 0.613 (0.867)	Data Time 0.004 (0.010)	Loss 3.6984 (3.6735)	Entropy 1.39064 (1.40864)	Top-1 acc 36.328 (37.475)	Top-5 acc 62.891 (61.554)	lr 0.02441
Train [12][2480/3239]	Time 0.562 (0.867)	Data Time 0.001 (0.010)	Loss 3.7548 (3.6735)	Entropy 1.39015 (1.40857)	Top-1 acc 34.375 (37.477)	Top-5 acc 62.109 (61.555)	lr 0.02441
Train [12][2490/3239]	Time 0.554 (0.867)	Data Time 0.001 (0.010)	Loss 3.6929 (3.6735)	Entropy 1.38961 (1.40849)	Top-1 acc 36.719 (37.479)	Top-5 acc 57.812 (61.553)	lr 0.02441
Train [12][2500/3239]	Time 0.666 (0.867)	Data Time 0.002 (0.010)	Loss 3.7072 (3.6732)	Entropy 1.38907 (1.40842)	Top-1 acc 35.938 (37.486)	Top-5 acc 57.031 (61.557)	lr 0.02441
Train [12][2510/3239]	Time 0.564 (0.867)	Data Time 0.001 (0.010)	Loss 3.4745 (3.6732)	Entropy 1.38892 (1.40834)	Top-1 acc 41.797 (37.485)	Top-5 acc 67.969 (61.560)	lr 0.02441
Train [12][2520/3239]	Time 0.563 (0.867)	Data Time 0.001 (0.010)	Loss 3.7114 (3.6730)	Entropy 1.38894 (1.40826)	Top-1 acc 37.500 (37.491)	Top-5 acc 62.109 (61.563)	lr 0.02441
Train [12][2530/3239]	Time 0.598 (0.867)	Data Time 0.003 (0.010)	Loss 3.5299 (3.6728)	Entropy 1.38884 (1.40819)	Top-1 acc 40.234 (37.497)	Top-5 acc 62.891 (61.566)	lr 0.02441
Train [12][2540/3239]	Time 0.570 (0.867)	Data Time 0.001 (0.010)	Loss 3.5775 (3.6724)	Entropy 1.38892 (1.40811)	Top-1 acc 35.547 (37.501)	Top-5 acc 63.281 (61.571)	lr 0.02441
Train [12][2550/3239]	Time 0.573 (0.867)	Data Time 0.001 (0.010)	Loss 3.5844 (3.6721)	Entropy 1.38873 (1.40804)	Top-1 acc 38.672 (37.504)	Top-5 acc 64.453 (61.576)	lr 0.02441
Train [12][2560/3239]	Time 0.600 (0.867)	Data Time 0.001 (0.010)	Loss 3.6202 (3.6723)	Entropy 1.38867 (1.40796)	Top-1 acc 38.672 (37.498)	Top-5 acc 61.719 (61.570)	lr 0.02441
Train [12][2570/3239]	Time 0.525 (0.866)	Data Time 0.001 (0.010)	Loss 3.6365 (3.6724)	Entropy 1.38849 (1.40788)	Top-1 acc 37.500 (37.496)	Top-5 acc 60.156 (61.566)	lr 0.02441
Train [12][2580/3239]	Time 0.528 (0.866)	Data Time 0.001 (0.010)	Loss 3.7730 (3.6724)	Entropy 1.38803 (1.40781)	Top-1 acc 36.328 (37.494)	Top-5 acc 58.984 (61.566)	lr 0.02441
Train [12][2590/3239]	Time 0.573 (0.866)	Data Time 0.001 (0.010)	Loss 3.5996 (3.6723)	Entropy 1.38772 (1.40773)	Top-1 acc 38.672 (37.494)	Top-5 acc 63.281 (61.571)	lr 0.02441
Train [12][2600/3239]	Time 0.620 (0.866)	Data Time 0.001 (0.010)	Loss 3.6058 (3.6721)	Entropy 1.38767 (1.40765)	Top-1 acc 41.406 (37.499)	Top-5 acc 65.625 (61.576)	lr 0.02441
Train [12][2610/3239]	Time 0.580 (0.866)	Data Time 0.001 (0.010)	Loss 3.5664 (3.6720)	Entropy 1.38768 (1.40758)	Top-1 acc 41.016 (37.502)	Top-5 acc 63.281 (61.580)	lr 0.02441
Train [12][2620/3239]	Time 0.557 (0.866)	Data Time 0.001 (0.010)	Loss 3.7190 (3.6718)	Entropy 1.38774 (1.40750)	Top-1 acc 38.281 (37.506)	Top-5 acc 60.156 (61.587)	lr 0.02441
Train [12][2630/3239]	Time 0.562 (0.865)	Data Time 0.001 (0.010)	Loss 3.6787 (3.6719)	Entropy 1.38755 (1.40743)	Top-1 acc 38.672 (37.504)	Top-5 acc 62.500 (61.583)	lr 0.02441
Train [12][2640/3239]	Time 0.682 (0.865)	Data Time 0.001 (0.010)	Loss 3.7436 (3.6719)	Entropy 1.38689 (1.40735)	Top-1 acc 37.109 (37.503)	Top-5 acc 58.594 (61.582)	lr 0.02441
Train [12][2650/3239]	Time 0.523 (0.865)	Data Time 0.001 (0.010)	Loss 3.5430 (3.6717)	Entropy 1.38638 (1.40727)	Top-1 acc 38.672 (37.506)	Top-5 acc 64.453 (61.591)	lr 0.02441
Train [12][2660/3239]	Time 0.617 (0.865)	Data Time 0.001 (0.010)	Loss 3.5878 (3.6721)	Entropy 1.38626 (1.40719)	Top-1 acc 41.406 (37.495)	Top-5 acc 61.328 (61.582)	lr 0.02441
Train [12][2670/3239]	Time 0.559 (0.865)	Data Time 0.001 (0.010)	Loss 3.7961 (3.6721)	Entropy 1.38591 (1.40711)	Top-1 acc 36.328 (37.496)	Top-5 acc 60.547 (61.581)	lr 0.02441
Train [12][2680/3239]	Time 0.621 (0.865)	Data Time 0.001 (0.010)	Loss 3.6526 (3.6720)	Entropy 1.38578 (1.40704)	Top-1 acc 38.672 (37.501)	Top-5 acc 58.984 (61.581)	lr 0.02441
Train [12][2690/3239]	Time 0.574 (0.865)	Data Time 0.001 (0.009)	Loss 3.6765 (3.6719)	Entropy 1.38554 (1.40696)	Top-1 acc 38.281 (37.502)	Top-5 acc 61.719 (61.585)	lr 0.02441
Train [12][2700/3239]	Time 0.582 (0.865)	Data Time 0.001 (0.009)	Loss 3.7061 (3.6716)	Entropy 1.38528 (1.40688)	Top-1 acc 36.328 (37.508)	Top-5 acc 62.109 (61.590)	lr 0.02440
Train [12][2710/3239]	Time 0.687 (0.865)	Data Time 0.001 (0.009)	Loss 3.7198 (3.6717)	Entropy 1.38481 (1.40680)	Top-1 acc 36.328 (37.504)	Top-5 acc 62.109 (61.592)	lr 0.02440
Train [12][2720/3239]	Time 0.577 (0.864)	Data Time 0.001 (0.009)	Loss 3.7283 (3.6718)	Entropy 1.38438 (1.40672)	Top-1 acc 38.281 (37.503)	Top-5 acc 63.672 (61.593)	lr 0.02440
Train [12][2730/3239]	Time 0.594 (0.864)	Data Time 0.001 (0.009)	Loss 3.5677 (3.6716)	Entropy 1.38421 (1.40663)	Top-1 acc 41.797 (37.506)	Top-5 acc 60.938 (61.595)	lr 0.02440
Train [12][2740/3239]	Time 0.620 (0.864)	Data Time 0.001 (0.009)	Loss 3.6581 (3.6717)	Entropy 1.38424 (1.40655)	Top-1 acc 39.453 (37.507)	Top-5 acc 61.328 (61.593)	lr 0.02440
Train [12][2750/3239]	Time 0.624 (0.864)	Data Time 0.001 (0.009)	Loss 3.2534 (3.6715)	Entropy 1.38429 (1.40647)	Top-1 acc 42.578 (37.512)	Top-5 acc 71.484 (61.599)	lr 0.02440
Train [12][2760/3239]	Time 0.466 (0.864)	Data Time 0.001 (0.009)	Loss 3.3775 (3.6715)	Entropy 1.38443 (1.40639)	Top-1 acc 39.062 (37.511)	Top-5 acc 68.359 (61.600)	lr 0.02440
Train [12][2770/3239]	Time 0.514 (0.864)	Data Time 0.001 (0.009)	Loss 3.8594 (3.6715)	Entropy 1.38448 (1.40631)	Top-1 acc 35.938 (37.511)	Top-5 acc 57.422 (61.600)	lr 0.02440
Train [12][2780/3239]	Time 0.613 (0.864)	Data Time 0.001 (0.009)	Loss 3.6989 (3.6715)	Entropy 1.38460 (1.40623)	Top-1 acc 34.766 (37.512)	Top-5 acc 62.500 (61.603)	lr 0.02440
Train [12][2790/3239]	Time 0.618 (0.864)	Data Time 0.002 (0.009)	Loss 3.7339 (3.6713)	Entropy 1.38477 (1.40616)	Top-1 acc 35.547 (37.511)	Top-5 acc 59.766 (61.606)	lr 0.02440
Train [12][2800/3239]	Time 0.563 (0.863)	Data Time 0.001 (0.009)	Loss 3.8108 (3.6714)	Entropy 1.38444 (1.40608)	Top-1 acc 35.938 (37.511)	Top-5 acc 58.203 (61.604)	lr 0.02440
Train [12][2810/3239]	Time 0.444 (0.863)	Data Time 0.001 (0.009)	Loss 3.6745 (3.6712)	Entropy 1.38420 (1.40600)	Top-1 acc 36.719 (37.516)	Top-5 acc 59.766 (61.608)	lr 0.02440
Train [12][2820/3239]	Time 0.576 (0.863)	Data Time 0.001 (0.009)	Loss 3.5400 (3.6713)	Entropy 1.38364 (1.40592)	Top-1 acc 38.281 (37.516)	Top-5 acc 66.016 (61.607)	lr 0.02440
Train [12][2830/3239]	Time 0.551 (0.863)	Data Time 0.002 (0.009)	Loss 3.7139 (3.6713)	Entropy 1.38326 (1.40584)	Top-1 acc 35.938 (37.513)	Top-5 acc 59.375 (61.607)	lr 0.02440
Train [12][2840/3239]	Time 0.570 (0.863)	Data Time 0.001 (0.009)	Loss 3.7057 (3.6714)	Entropy 1.38291 (1.40576)	Top-1 acc 39.844 (37.512)	Top-5 acc 62.109 (61.604)	lr 0.02440
Train [12][2850/3239]	Time 0.582 (0.863)	Data Time 0.001 (0.009)	Loss 3.6190 (3.6714)	Entropy 1.38291 (1.40568)	Top-1 acc 40.234 (37.513)	Top-5 acc 61.719 (61.604)	lr 0.02440
Train [12][2860/3239]	Time 0.602 (0.863)	Data Time 0.001 (0.009)	Loss 3.6904 (3.6712)	Entropy 1.38263 (1.40560)	Top-1 acc 37.500 (37.520)	Top-5 acc 57.422 (61.606)	lr 0.02440
Train [12][2870/3239]	Time 0.616 (0.863)	Data Time 0.001 (0.009)	Loss 3.8191 (3.6711)	Entropy 1.38263 (1.40552)	Top-1 acc 35.156 (37.523)	Top-5 acc 58.984 (61.609)	lr 0.02440
Train [12][2880/3239]	Time 0.596 (0.863)	Data Time 0.001 (0.009)	Loss 3.4975 (3.6708)	Entropy 1.38234 (1.40544)	Top-1 acc 35.938 (37.531)	Top-5 acc 66.406 (61.616)	lr 0.02440
Train [12][2890/3239]	Time 0.633 (0.863)	Data Time 0.001 (0.009)	Loss 3.7588 (3.6707)	Entropy 1.38221 (1.40536)	Top-1 acc 31.641 (37.534)	Top-5 acc 60.156 (61.619)	lr 0.02440
Train [12][2900/3239]	Time 0.564 (0.863)	Data Time 0.001 (0.009)	Loss 3.6893 (3.6708)	Entropy 1.38216 (1.40528)	Top-1 acc 37.891 (37.533)	Top-5 acc 61.328 (61.618)	lr 0.02440
Train [12][2910/3239]	Time 0.559 (0.862)	Data Time 0.001 (0.009)	Loss 3.4492 (3.6706)	Entropy 1.38171 (1.40520)	Top-1 acc 38.672 (37.537)	Top-5 acc 65.234 (61.625)	lr 0.02440
Train [12][2920/3239]	Time 0.576 (0.862)	Data Time 0.001 (0.009)	Loss 3.7845 (3.6708)	Entropy 1.38128 (1.40512)	Top-1 acc 36.719 (37.531)	Top-5 acc 56.250 (61.619)	lr 0.02440
Train [12][2930/3239]	Time 0.635 (0.862)	Data Time 0.002 (0.009)	Loss 3.4616 (3.6707)	Entropy 1.38116 (1.40504)	Top-1 acc 39.844 (37.531)	Top-5 acc 64.844 (61.617)	lr 0.02440
Train [12][2940/3239]	Time 0.709 (0.862)	Data Time 0.001 (0.009)	Loss 3.7014 (3.6707)	Entropy 1.38124 (1.40496)	Top-1 acc 37.109 (37.528)	Top-5 acc 62.109 (61.617)	lr 0.02440
Train [12][2950/3239]	Time 0.524 (0.862)	Data Time 0.001 (0.009)	Loss 3.7883 (3.6708)	Entropy 1.38111 (1.40488)	Top-1 acc 31.641 (37.527)	Top-5 acc 60.547 (61.614)	lr 0.02440
Train [12][2960/3239]	Time 0.579 (0.862)	Data Time 0.001 (0.009)	Loss 3.7598 (3.6709)	Entropy 1.38097 (1.40480)	Top-1 acc 33.984 (37.530)	Top-5 acc 62.109 (61.614)	lr 0.02440
Train [12][2970/3239]	Time 0.629 (0.862)	Data Time 0.001 (0.009)	Loss 3.5581 (3.6706)	Entropy 1.38140 (1.40472)	Top-1 acc 36.328 (37.536)	Top-5 acc 62.891 (61.614)	lr 0.02440
Train [12][2980/3239]	Time 0.554 (0.868)	Data Time 0.002 (0.009)	Loss 3.5938 (3.6706)	Entropy 1.38107 (1.40464)	Top-1 acc 38.281 (37.537)	Top-5 acc 64.062 (61.616)	lr 0.02440
Train [12][2990/3239]	Time 0.591 (0.868)	Data Time 0.002 (0.009)	Loss 3.5507 (3.6703)	Entropy 1.38105 (1.40456)	Top-1 acc 41.016 (37.538)	Top-5 acc 61.328 (61.619)	lr 0.02440
Train [12][3000/3239]	Time 0.575 (0.868)	Data Time 0.001 (0.009)	Loss 3.4627 (3.6702)	Entropy 1.38066 (1.40448)	Top-1 acc 42.969 (37.544)	Top-5 acc 67.188 (61.622)	lr 0.02440
Train [12][3010/3239]	Time 0.658 (0.868)	Data Time 0.001 (0.009)	Loss 3.5423 (3.6702)	Entropy 1.38040 (1.40440)	Top-1 acc 37.891 (37.546)	Top-5 acc 62.500 (61.619)	lr 0.02440
Train [12][3020/3239]	Time 0.582 (0.868)	Data Time 0.001 (0.009)	Loss 3.6469 (3.6702)	Entropy 1.38007 (1.40432)	Top-1 acc 34.766 (37.545)	Top-5 acc 61.328 (61.620)	lr 0.02440
Train [12][3030/3239]	Time 0.549 (0.867)	Data Time 0.001 (0.009)	Loss 3.8111 (3.6703)	Entropy 1.38020 (1.40424)	Top-1 acc 34.375 (37.543)	Top-5 acc 56.641 (61.619)	lr 0.02439
Train [12][3040/3239]	Time 0.604 (0.867)	Data Time 0.001 (0.009)	Loss 3.5625 (3.6703)	Entropy 1.38006 (1.40416)	Top-1 acc 38.672 (37.543)	Top-5 acc 64.062 (61.619)	lr 0.02439
Train [12][3050/3239]	Time 0.581 (0.867)	Data Time 0.001 (0.009)	Loss 3.7236 (3.6703)	Entropy 1.37972 (1.40408)	Top-1 acc 38.672 (37.546)	Top-5 acc 57.812 (61.620)	lr 0.02439
Train [12][3060/3239]	Time 0.604 (0.867)	Data Time 0.001 (0.009)	Loss 3.7809 (3.6705)	Entropy 1.37951 (1.40401)	Top-1 acc 38.281 (37.542)	Top-5 acc 62.109 (61.617)	lr 0.02439
Train [12][3070/3239]	Time 0.511 (0.867)	Data Time 0.001 (0.009)	Loss 3.7980 (3.6704)	Entropy 1.37938 (1.40392)	Top-1 acc 35.156 (37.545)	Top-5 acc 60.938 (61.618)	lr 0.02439
Train [12][3080/3239]	Time 0.513 (0.867)	Data Time 0.001 (0.009)	Loss 3.4425 (3.6704)	Entropy 1.37956 (1.40385)	Top-1 acc 39.844 (37.545)	Top-5 acc 65.625 (61.618)	lr 0.02439
Train [12][3090/3239]	Time 0.594 (0.866)	Data Time 0.001 (0.009)	Loss 3.6632 (3.6701)	Entropy 1.37960 (1.40377)	Top-1 acc 39.062 (37.548)	Top-5 acc 61.328 (61.623)	lr 0.02439
Train [12][3100/3239]	Time 0.584 (0.866)	Data Time 0.001 (0.009)	Loss 3.9691 (3.6703)	Entropy 1.37921 (1.40369)	Top-1 acc 35.938 (37.549)	Top-5 acc 55.859 (61.624)	lr 0.02439
Train [12][3110/3239]	Time 0.648 (0.866)	Data Time 0.022 (0.009)	Loss 3.5083 (3.6700)	Entropy 1.37904 (1.40361)	Top-1 acc 43.359 (37.553)	Top-5 acc 66.016 (61.630)	lr 0.02439
Train [12][3120/3239]	Time 0.594 (0.866)	Data Time 0.001 (0.009)	Loss 3.5689 (3.6701)	Entropy 1.37883 (1.40353)	Top-1 acc 42.578 (37.556)	Top-5 acc 65.234 (61.628)	lr 0.02439
Train [12][3130/3239]	Time 0.584 (0.866)	Data Time 0.001 (0.008)	Loss 3.5710 (3.6701)	Entropy 1.37842 (1.40345)	Top-1 acc 36.328 (37.555)	Top-5 acc 64.844 (61.629)	lr 0.02439
Train [12][3140/3239]	Time 0.574 (0.866)	Data Time 0.001 (0.008)	Loss 3.6416 (3.6698)	Entropy 1.37800 (1.40337)	Top-1 acc 33.594 (37.561)	Top-5 acc 61.719 (61.636)	lr 0.02439
Train [12][3150/3239]	Time 0.676 (0.866)	Data Time 0.001 (0.008)	Loss 3.5996 (3.6697)	Entropy 1.37786 (1.40329)	Top-1 acc 37.109 (37.561)	Top-5 acc 64.453 (61.641)	lr 0.02439
Train [12][3160/3239]	Time 0.645 (0.866)	Data Time 0.001 (0.008)	Loss 3.5992 (3.6696)	Entropy 1.37773 (1.40321)	Top-1 acc 37.500 (37.563)	Top-5 acc 65.625 (61.643)	lr 0.02439
Train [12][3170/3239]	Time 0.572 (0.866)	Data Time 0.001 (0.008)	Loss 3.5134 (3.6695)	Entropy 1.37749 (1.40313)	Top-1 acc 41.016 (37.565)	Top-5 acc 67.188 (61.647)	lr 0.02439
Train [12][3180/3239]	Time 0.562 (0.866)	Data Time 0.000 (0.008)	Loss 3.6042 (3.6696)	Entropy 1.37771 (1.40305)	Top-1 acc 37.500 (37.564)	Top-5 acc 61.328 (61.648)	lr 0.02439
Train [12][3190/3239]	Time 0.580 (0.865)	Data Time 0.000 (0.008)	Loss 3.7747 (3.6696)	Entropy 1.37736 (1.40297)	Top-1 acc 32.812 (37.563)	Top-5 acc 58.203 (61.645)	lr 0.02439
Train [12][3200/3239]	Time 0.581 (0.865)	Data Time 0.000 (0.008)	Loss 3.8797 (3.6696)	Entropy 1.37739 (1.40289)	Top-1 acc 34.375 (37.562)	Top-5 acc 56.641 (61.648)	lr 0.02439
Train [12][3210/3239]	Time 0.575 (0.865)	Data Time 0.000 (0.008)	Loss 3.7439 (3.6697)	Entropy 1.37773 (1.40281)	Top-1 acc 33.594 (37.564)	Top-5 acc 58.203 (61.646)	lr 0.02439
Train [12][3220/3239]	Time 0.648 (0.865)	Data Time 0.000 (0.008)	Loss 3.8459 (3.6695)	Entropy 1.37765 (1.40273)	Top-1 acc 35.547 (37.569)	Top-5 acc 61.719 (61.650)	lr 0.02439
Train [12][3230/3239]	Time 0.595 (0.865)	Data Time 0.000 (0.008)	Loss 3.8200 (3.6698)	Entropy 1.37750 (1.40265)	Top-1 acc 35.156 (37.565)	Top-5 acc 60.547 (61.644)	lr 0.02439
Train [12][3239/3239]	Time 1.462 (0.865)	Data Time 0.000 (0.008)	Loss 3.2487 (3.6697)	Entropy 1.37767 (1.40258)	Top-1 acc 50.617 (37.568)	Top-5 acc 69.136 (61.645)	lr 0.02439
==========Valid [12/120]	loss 2.440	top-1 acc 47.466 (47.466)	top-5 acc 71.558	Train top-1 37.568	top-5 61.645	Entropy 1.37767	Latency-None: 0.000ms	Flops: 542.77M
Train [13][0/3239]	Time 19.012 (19.012)	Data Time 17.937 (17.937)	Loss 3.6580 (3.6580)	Entropy 1.37770 (1.37770)	Top-1 acc 38.672 (38.672)	Top-5 acc 64.453 (64.453)	lr 0.02439
Train [13][10/3239]	Time 0.636 (2.642)	Data Time 0.002 (1.677)	Loss 3.6433 (3.6197)	Entropy 1.37763 (1.37768)	Top-1 acc 37.109 (38.956)	Top-5 acc 62.891 (62.571)	lr 0.02439
Train [13][20/3239]	Time 0.538 (1.787)	Data Time 0.001 (0.879)	Loss 3.4719 (3.6134)	Entropy 1.37732 (1.37765)	Top-1 acc 39.453 (38.914)	Top-5 acc 69.531 (63.132)	lr 0.02439
Train [13][30/3239]	Time 0.553 (1.481)	Data Time 0.001 (0.596)	Loss 3.7266 (3.6209)	Entropy 1.37742 (1.37755)	Top-1 acc 33.594 (38.180)	Top-5 acc 61.328 (63.042)	lr 0.02439
Train [13][40/3239]	Time 0.556 (1.319)	Data Time 0.001 (0.451)	Loss 3.8163 (3.6324)	Entropy 1.37722 (1.37750)	Top-1 acc 38.281 (38.138)	Top-5 acc 58.594 (62.881)	lr 0.02439
Train [13][50/3239]	Time 0.588 (1.228)	Data Time 0.001 (0.363)	Loss 3.8405 (3.6372)	Entropy 1.37715 (1.37744)	Top-1 acc 35.156 (37.960)	Top-5 acc 57.031 (62.661)	lr 0.02439
Train [13][60/3239]	Time 0.589 (1.164)	Data Time 0.001 (0.304)	Loss 3.7282 (3.6415)	Entropy 1.37725 (1.37739)	Top-1 acc 37.109 (38.249)	Top-5 acc 59.766 (62.577)	lr 0.02439
Train [13][70/3239]	Time 0.576 (1.116)	Data Time 0.001 (0.261)	Loss 3.4173 (3.6313)	Entropy 1.37717 (1.37737)	Top-1 acc 39.844 (38.391)	Top-5 acc 65.625 (62.792)	lr 0.02439
Train [13][80/3239]	Time 0.526 (1.083)	Data Time 0.001 (0.229)	Loss 3.7292 (3.6277)	Entropy 1.37684 (1.37731)	Top-1 acc 34.375 (38.527)	Top-5 acc 59.375 (62.910)	lr 0.02439
Train [13][90/3239]	Time 0.543 (1.055)	Data Time 0.001 (0.204)	Loss 3.8275 (3.6309)	Entropy 1.37652 (1.37725)	Top-1 acc 34.375 (38.479)	Top-5 acc 56.250 (62.800)	lr 0.02439
Train [13][100/3239]	Time 0.598 (1.034)	Data Time 0.001 (0.184)	Loss 3.4767 (3.6261)	Entropy 1.37593 (1.37717)	Top-1 acc 40.625 (38.548)	Top-5 acc 67.188 (62.898)	lr 0.02439
Train [13][110/3239]	Time 0.600 (1.018)	Data Time 0.001 (0.168)	Loss 3.3407 (3.6252)	Entropy 1.37561 (1.37704)	Top-1 acc 42.578 (38.538)	Top-5 acc 67.578 (62.929)	lr 0.02438
Train [13][120/3239]	Time 0.704 (1.003)	Data Time 0.001 (0.154)	Loss 3.8266 (3.6314)	Entropy 1.37517 (1.37692)	Top-1 acc 34.375 (38.427)	Top-5 acc 56.641 (62.707)	lr 0.02438
Train [13][130/3239]	Time 0.492 (0.988)	Data Time 0.001 (0.143)	Loss 3.8933 (3.6290)	Entropy 1.37464 (1.37677)	Top-1 acc 32.031 (38.412)	Top-5 acc 59.375 (62.753)	lr 0.02438
Train [13][140/3239]	Time 0.565 (0.976)	Data Time 0.002 (0.133)	Loss 3.6113 (3.6322)	Entropy 1.37460 (1.37662)	Top-1 acc 39.062 (38.359)	Top-5 acc 63.672 (62.641)	lr 0.02438
Train [13][150/3239]	Time 0.565 (0.967)	Data Time 0.001 (0.124)	Loss 3.4862 (3.6321)	Entropy 1.37463 (1.37649)	Top-1 acc 38.672 (38.271)	Top-5 acc 64.453 (62.593)	lr 0.02438
Train [13][160/3239]	Time 0.563 (0.959)	Data Time 0.001 (0.116)	Loss 3.8747 (3.6369)	Entropy 1.37488 (1.37638)	Top-1 acc 34.375 (38.116)	Top-5 acc 57.031 (62.500)	lr 0.02438
Train [13][170/3239]	Time 0.552 (0.953)	Data Time 0.001 (0.110)	Loss 3.7595 (3.6354)	Entropy 1.37464 (1.37628)	Top-1 acc 34.766 (38.169)	Top-5 acc 60.547 (62.511)	lr 0.02438
Train [13][180/3239]	Time 0.623 (0.948)	Data Time 0.001 (0.104)	Loss 3.5552 (3.6351)	Entropy 1.37438 (1.37618)	Top-1 acc 37.891 (38.180)	Top-5 acc 64.844 (62.500)	lr 0.02438
Train [13][190/3239]	Time 0.577 (0.943)	Data Time 0.001 (0.098)	Loss 3.6201 (3.6339)	Entropy 1.37450 (1.37609)	Top-1 acc 38.672 (38.224)	Top-5 acc 61.328 (62.500)	lr 0.02438
Train [13][200/3239]	Time 0.607 (0.937)	Data Time 0.001 (0.094)	Loss 3.5758 (3.6349)	Entropy 1.37446 (1.37602)	Top-1 acc 37.500 (38.188)	Top-5 acc 64.844 (62.463)	lr 0.02438
Train [13][210/3239]	Time 0.607 (0.930)	Data Time 0.001 (0.089)	Loss 3.6700 (3.6375)	Entropy 1.37437 (1.37594)	Top-1 acc 34.766 (38.159)	Top-5 acc 60.156 (62.380)	lr 0.02438
Train [13][220/3239]	Time 0.580 (0.926)	Data Time 0.001 (0.085)	Loss 3.4997 (3.6384)	Entropy 1.37420 (1.37587)	Top-1 acc 35.938 (38.124)	Top-5 acc 64.453 (62.346)	lr 0.02438
Train [13][230/3239]	Time 0.568 (0.919)	Data Time 0.001 (0.082)	Loss 3.4772 (3.6374)	Entropy 1.37366 (1.37579)	Top-1 acc 37.109 (38.116)	Top-5 acc 65.625 (62.382)	lr 0.02438
Train [13][240/3239]	Time 0.583 (0.916)	Data Time 0.002 (0.078)	Loss 3.5890 (3.6378)	Entropy 1.37336 (1.37570)	Top-1 acc 38.281 (38.145)	Top-5 acc 62.109 (62.361)	lr 0.02438
Train [13][250/3239]	Time 0.591 (0.913)	Data Time 0.002 (0.075)	Loss 3.4946 (3.6343)	Entropy 1.37287 (1.37560)	Top-1 acc 41.016 (38.242)	Top-5 acc 66.016 (62.411)	lr 0.02438
Train [13][260/3239]	Time 0.603 (0.910)	Data Time 0.001 (0.072)	Loss 3.6050 (3.6347)	Entropy 1.37298 (1.37550)	Top-1 acc 38.672 (38.250)	Top-5 acc 63.672 (62.395)	lr 0.02438
Train [13][270/3239]	Time 0.530 (0.906)	Data Time 0.001 (0.070)	Loss 3.6883 (3.6356)	Entropy 1.37268 (1.37541)	Top-1 acc 35.938 (38.235)	Top-5 acc 64.453 (62.375)	lr 0.02438
Train [13][280/3239]	Time 0.694 (0.904)	Data Time 0.001 (0.067)	Loss 3.5217 (3.6357)	Entropy 1.37243 (1.37531)	Top-1 acc 38.281 (38.228)	Top-5 acc 66.797 (62.328)	lr 0.02438
Train [13][290/3239]	Time 0.566 (0.902)	Data Time 0.001 (0.065)	Loss 3.5531 (3.6363)	Entropy 1.37231 (1.37521)	Top-1 acc 39.453 (38.211)	Top-5 acc 62.500 (62.327)	lr 0.02438
Train [13][300/3239]	Time 0.566 (0.899)	Data Time 0.001 (0.063)	Loss 3.6056 (3.6369)	Entropy 1.37234 (1.37511)	Top-1 acc 41.797 (38.235)	Top-5 acc 63.281 (62.285)	lr 0.02438
Train [13][310/3239]	Time 0.587 (0.897)	Data Time 0.001 (0.061)	Loss 3.5402 (3.6349)	Entropy 1.37246 (1.37503)	Top-1 acc 42.969 (38.260)	Top-5 acc 66.797 (62.319)	lr 0.02438
Train [13][320/3239]	Time 0.618 (0.895)	Data Time 0.001 (0.059)	Loss 3.6005 (3.6314)	Entropy 1.37207 (1.37494)	Top-1 acc 37.500 (38.314)	Top-5 acc 62.109 (62.362)	lr 0.02438
Train [13][330/3239]	Time 0.577 (0.893)	Data Time 0.001 (0.058)	Loss 3.6330 (3.6321)	Entropy 1.37174 (1.37485)	Top-1 acc 40.234 (38.312)	Top-5 acc 64.062 (62.358)	lr 0.02438
Train [13][340/3239]	Time 0.613 (0.891)	Data Time 0.001 (0.056)	Loss 3.4174 (3.6306)	Entropy 1.37185 (1.37476)	Top-1 acc 41.016 (38.324)	Top-5 acc 66.797 (62.376)	lr 0.02438
Train [13][350/3239]	Time 0.681 (0.890)	Data Time 0.001 (0.054)	Loss 3.5345 (3.6304)	Entropy 1.37208 (1.37468)	Top-1 acc 39.844 (38.344)	Top-5 acc 63.672 (62.375)	lr 0.02438
Train [13][360/3239]	Time 0.616 (0.889)	Data Time 0.001 (0.053)	Loss 3.5278 (3.6303)	Entropy 1.37165 (1.37460)	Top-1 acc 39.062 (38.349)	Top-5 acc 62.500 (62.387)	lr 0.02438
Train [13][370/3239]	Time 0.419 (0.887)	Data Time 0.001 (0.052)	Loss 3.6094 (3.6318)	Entropy 1.37161 (1.37452)	Top-1 acc 37.500 (38.316)	Top-5 acc 62.891 (62.338)	lr 0.02438
Train [13][380/3239]	Time 0.599 (0.886)	Data Time 0.001 (0.050)	Loss 3.6688 (3.6322)	Entropy 1.37141 (1.37444)	Top-1 acc 37.109 (38.283)	Top-5 acc 60.547 (62.330)	lr 0.02438
Train [13][390/3239]	Time 0.727 (0.932)	Data Time 0.005 (0.049)	Loss 3.7600 (3.6339)	Entropy 1.37122 (1.37436)	Top-1 acc 38.672 (38.240)	Top-5 acc 61.719 (62.321)	lr 0.02438
Train [13][400/3239]	Time 0.635 (0.931)	Data Time 0.002 (0.048)	Loss 3.6046 (3.6331)	Entropy 1.37148 (1.37429)	Top-1 acc 41.406 (38.278)	Top-5 acc 64.453 (62.338)	lr 0.02438
Train [13][410/3239]	Time 0.665 (0.928)	Data Time 0.001 (0.047)	Loss 3.5862 (3.6335)	Entropy 1.37149 (1.37422)	Top-1 acc 41.406 (38.272)	Top-5 acc 63.672 (62.345)	lr 0.02438
Train [13][420/3239]	Time 0.620 (0.927)	Data Time 0.001 (0.046)	Loss 3.6419 (3.6316)	Entropy 1.37162 (1.37416)	Top-1 acc 35.156 (38.321)	Top-5 acc 59.766 (62.384)	lr 0.02438
Train [13][430/3239]	Time 0.603 (0.924)	Data Time 0.001 (0.045)	Loss 3.4745 (3.6307)	Entropy 1.37132 (1.37409)	Top-1 acc 41.016 (38.347)	Top-5 acc 67.188 (62.394)	lr 0.02437
Train [13][440/3239]	Time 0.543 (0.922)	Data Time 0.001 (0.044)	Loss 3.5219 (3.6326)	Entropy 1.37130 (1.37403)	Top-1 acc 44.922 (38.310)	Top-5 acc 65.625 (62.359)	lr 0.02437
Train [13][450/3239]	Time 0.555 (0.921)	Data Time 0.001 (0.043)	Loss 3.8113 (3.6325)	Entropy 1.37103 (1.37397)	Top-1 acc 36.719 (38.336)	Top-5 acc 55.859 (62.348)	lr 0.02437
Train [13][460/3239]	Time 0.551 (0.919)	Data Time 0.001 (0.042)	Loss 3.6839 (3.6322)	Entropy 1.37093 (1.37390)	Top-1 acc 37.109 (38.353)	Top-5 acc 58.203 (62.354)	lr 0.02437
Train [13][470/3239]	Time 0.604 (0.918)	Data Time 0.001 (0.041)	Loss 3.8007 (3.6313)	Entropy 1.37072 (1.37384)	Top-1 acc 34.375 (38.358)	Top-5 acc 59.766 (62.375)	lr 0.02437
Train [13][480/3239]	Time 0.577 (0.916)	Data Time 0.001 (0.040)	Loss 3.6628 (3.6315)	Entropy 1.37007 (1.37377)	Top-1 acc 42.188 (38.378)	Top-5 acc 61.328 (62.372)	lr 0.02437
Train [13][490/3239]	Time 0.549 (0.915)	Data Time 0.001 (0.040)	Loss 3.5442 (3.6321)	Entropy 1.36991 (1.37369)	Top-1 acc 38.672 (38.366)	Top-5 acc 65.234 (62.346)	lr 0.02437
Train [13][500/3239]	Time 0.586 (0.913)	Data Time 0.001 (0.039)	Loss 3.4783 (3.6318)	Entropy 1.36931 (1.37362)	Top-1 acc 42.188 (38.377)	Top-5 acc 63.672 (62.335)	lr 0.02437
Train [13][510/3239]	Time 0.674 (0.912)	Data Time 0.001 (0.038)	Loss 3.5022 (3.6309)	Entropy 1.36922 (1.37353)	Top-1 acc 44.531 (38.405)	Top-5 acc 63.672 (62.342)	lr 0.02437
Train [13][520/3239]	Time 0.587 (0.910)	Data Time 0.001 (0.037)	Loss 3.6342 (3.6310)	Entropy 1.36885 (1.37345)	Top-1 acc 37.891 (38.419)	Top-5 acc 65.625 (62.382)	lr 0.02437
Train [13][530/3239]	Time 0.437 (0.907)	Data Time 0.001 (0.037)	Loss 3.7755 (3.6317)	Entropy 1.36878 (1.37336)	Top-1 acc 32.812 (38.424)	Top-5 acc 57.422 (62.349)	lr 0.02437
Train [13][540/3239]	Time 0.564 (0.906)	Data Time 0.001 (0.036)	Loss 3.6885 (3.6328)	Entropy 1.36890 (1.37327)	Top-1 acc 37.109 (38.411)	Top-5 acc 60.547 (62.346)	lr 0.02437
Train [13][550/3239]	Time 0.606 (0.904)	Data Time 0.001 (0.035)	Loss 3.5874 (3.6324)	Entropy 1.36881 (1.37319)	Top-1 acc 38.281 (38.418)	Top-5 acc 59.375 (62.355)	lr 0.02437
Train [13][560/3239]	Time 0.599 (0.903)	Data Time 0.001 (0.035)	Loss 3.4702 (3.6328)	Entropy 1.36864 (1.37311)	Top-1 acc 42.188 (38.401)	Top-5 acc 62.109 (62.341)	lr 0.02437
Train [13][570/3239]	Time 0.586 (0.903)	Data Time 0.001 (0.034)	Loss 3.4230 (3.6330)	Entropy 1.36841 (1.37303)	Top-1 acc 39.453 (38.408)	Top-5 acc 69.922 (62.334)	lr 0.02437
Train [13][580/3239]	Time 0.663 (0.902)	Data Time 0.001 (0.034)	Loss 3.5179 (3.6338)	Entropy 1.36815 (1.37295)	Top-1 acc 39.844 (38.391)	Top-5 acc 66.406 (62.320)	lr 0.02437
Train [13][590/3239]	Time 0.580 (0.901)	Data Time 0.001 (0.033)	Loss 3.6234 (3.6344)	Entropy 1.36757 (1.37287)	Top-1 acc 44.141 (38.384)	Top-5 acc 62.500 (62.308)	lr 0.02437
Train [13][600/3239]	Time 0.580 (0.900)	Data Time 0.001 (0.033)	Loss 3.6328 (3.6346)	Entropy 1.36749 (1.37278)	Top-1 acc 38.672 (38.382)	Top-5 acc 61.328 (62.317)	lr 0.02437
Train [13][610/3239]	Time 0.550 (0.899)	Data Time 0.001 (0.032)	Loss 3.6028 (3.6345)	Entropy 1.36760 (1.37269)	Top-1 acc 42.188 (38.387)	Top-5 acc 64.062 (62.320)	lr 0.02437
Train [13][620/3239]	Time 0.579 (0.898)	Data Time 0.001 (0.032)	Loss 3.6149 (3.6342)	Entropy 1.36758 (1.37261)	Top-1 acc 40.234 (38.392)	Top-5 acc 60.938 (62.326)	lr 0.02437
Train [13][630/3239]	Time 0.612 (0.897)	Data Time 0.001 (0.031)	Loss 3.7997 (3.6341)	Entropy 1.36733 (1.37253)	Top-1 acc 31.250 (38.404)	Top-5 acc 57.422 (62.313)	lr 0.02437
Train [13][640/3239]	Time 0.555 (0.896)	Data Time 0.001 (0.031)	Loss 3.7064 (3.6354)	Entropy 1.36720 (1.37245)	Top-1 acc 33.203 (38.368)	Top-5 acc 57.031 (62.269)	lr 0.02437
Train [13][650/3239]	Time 0.669 (0.895)	Data Time 0.001 (0.030)	Loss 3.5714 (3.6351)	Entropy 1.36713 (1.37237)	Top-1 acc 39.062 (38.366)	Top-5 acc 62.891 (62.279)	lr 0.02437
Train [13][660/3239]	Time 0.569 (0.894)	Data Time 0.001 (0.030)	Loss 3.6457 (3.6351)	Entropy 1.36715 (1.37229)	Top-1 acc 41.016 (38.361)	Top-5 acc 63.281 (62.278)	lr 0.02437
Train [13][670/3239]	Time 0.549 (0.893)	Data Time 0.001 (0.029)	Loss 3.5175 (3.6349)	Entropy 1.36697 (1.37221)	Top-1 acc 43.750 (38.376)	Top-5 acc 66.016 (62.275)	lr 0.02437
Train [13][680/3239]	Time 0.542 (0.892)	Data Time 0.001 (0.029)	Loss 3.6015 (3.6348)	Entropy 1.36662 (1.37213)	Top-1 acc 41.406 (38.373)	Top-5 acc 64.062 (62.273)	lr 0.02437
Train [13][690/3239]	Time 0.540 (0.891)	Data Time 0.001 (0.029)	Loss 3.6746 (3.6342)	Entropy 1.36652 (1.37205)	Top-1 acc 37.500 (38.370)	Top-5 acc 63.281 (62.283)	lr 0.02437
Train [13][700/3239]	Time 0.605 (0.890)	Data Time 0.001 (0.028)	Loss 3.6164 (3.6338)	Entropy 1.36631 (1.37197)	Top-1 acc 39.062 (38.374)	Top-5 acc 59.766 (62.294)	lr 0.02437
Train [13][710/3239]	Time 0.619 (0.889)	Data Time 0.002 (0.028)	Loss 3.6731 (3.6334)	Entropy 1.36612 (1.37189)	Top-1 acc 36.719 (38.380)	Top-5 acc 60.938 (62.299)	lr 0.02437
Train [13][720/3239]	Time 0.665 (0.888)	Data Time 0.001 (0.028)	Loss 3.6920 (3.6334)	Entropy 1.36571 (1.37181)	Top-1 acc 37.109 (38.376)	Top-5 acc 60.547 (62.292)	lr 0.02437
Train [13][730/3239]	Time 0.574 (0.888)	Data Time 0.001 (0.027)	Loss 3.4908 (3.6340)	Entropy 1.36555 (1.37172)	Top-1 acc 42.578 (38.375)	Top-5 acc 64.062 (62.280)	lr 0.02437
Train [13][740/3239]	Time 0.581 (0.887)	Data Time 0.001 (0.027)	Loss 3.7465 (3.6335)	Entropy 1.36546 (1.37164)	Top-1 acc 34.766 (38.388)	Top-5 acc 62.109 (62.299)	lr 0.02436
Train [13][750/3239]	Time 0.560 (0.886)	Data Time 0.001 (0.027)	Loss 3.6002 (3.6330)	Entropy 1.36537 (1.37156)	Top-1 acc 37.891 (38.407)	Top-5 acc 62.109 (62.313)	lr 0.02436
Train [13][760/3239]	Time 0.590 (0.886)	Data Time 0.001 (0.026)	Loss 3.6383 (3.6331)	Entropy 1.36542 (1.37148)	Top-1 acc 36.328 (38.411)	Top-5 acc 64.062 (62.317)	lr 0.02436
Train [13][770/3239]	Time 0.634 (0.886)	Data Time 0.001 (0.026)	Loss 3.5315 (3.6331)	Entropy 1.36514 (1.37140)	Top-1 acc 42.188 (38.416)	Top-5 acc 62.500 (62.311)	lr 0.02436
Train [13][780/3239]	Time 0.618 (0.885)	Data Time 0.001 (0.026)	Loss 3.8040 (3.6341)	Entropy 1.36501 (1.37132)	Top-1 acc 35.547 (38.397)	Top-5 acc 57.422 (62.297)	lr 0.02436
Train [13][790/3239]	Time 0.686 (0.885)	Data Time 0.001 (0.025)	Loss 3.5977 (3.6343)	Entropy 1.36487 (1.37124)	Top-1 acc 38.281 (38.389)	Top-5 acc 61.719 (62.295)	lr 0.02436
Train [13][800/3239]	Time 0.554 (0.884)	Data Time 0.001 (0.025)	Loss 3.6154 (3.6337)	Entropy 1.36477 (1.37116)	Top-1 acc 35.156 (38.400)	Top-5 acc 60.547 (62.292)	lr 0.02436
Train [13][810/3239]	Time 0.622 (0.883)	Data Time 0.001 (0.025)	Loss 3.4682 (3.6341)	Entropy 1.36459 (1.37108)	Top-1 acc 46.875 (38.399)	Top-5 acc 64.062 (62.272)	lr 0.02436
Train [13][820/3239]	Time 0.603 (0.883)	Data Time 0.001 (0.025)	Loss 3.5988 (3.6338)	Entropy 1.36418 (1.37100)	Top-1 acc 40.234 (38.418)	Top-5 acc 63.672 (62.280)	lr 0.02436
Train [13][830/3239]	Time 0.587 (0.882)	Data Time 0.001 (0.024)	Loss 3.5561 (3.6339)	Entropy 1.36384 (1.37092)	Top-1 acc 39.453 (38.407)	Top-5 acc 64.453 (62.279)	lr 0.02436
Train [13][840/3239]	Time 0.592 (0.882)	Data Time 0.001 (0.024)	Loss 3.7086 (3.6346)	Entropy 1.36362 (1.37083)	Top-1 acc 36.328 (38.395)	Top-5 acc 58.984 (62.259)	lr 0.02436
Train [13][850/3239]	Time 0.553 (0.881)	Data Time 0.001 (0.024)	Loss 3.5444 (3.6348)	Entropy 1.36365 (1.37075)	Top-1 acc 38.281 (38.396)	Top-5 acc 62.891 (62.247)	lr 0.02436
Train [13][860/3239]	Time 0.590 (0.880)	Data Time 0.001 (0.023)	Loss 3.6115 (3.6357)	Entropy 1.36366 (1.37067)	Top-1 acc 40.625 (38.385)	Top-5 acc 65.234 (62.240)	lr 0.02436
Train [13][870/3239]	Time 0.564 (0.879)	Data Time 0.001 (0.023)	Loss 3.8198 (3.6357)	Entropy 1.36350 (1.37058)	Top-1 acc 38.281 (38.385)	Top-5 acc 56.641 (62.244)	lr 0.02436
Train [13][880/3239]	Time 0.601 (0.878)	Data Time 0.001 (0.023)	Loss 3.4001 (3.6352)	Entropy 1.36327 (1.37050)	Top-1 acc 42.578 (38.389)	Top-5 acc 68.359 (62.251)	lr 0.02436
Train [13][890/3239]	Time 0.607 (0.878)	Data Time 0.001 (0.023)	Loss 3.4297 (3.6352)	Entropy 1.36307 (1.37042)	Top-1 acc 39.844 (38.387)	Top-5 acc 68.750 (62.261)	lr 0.02436
Train [13][900/3239]	Time 0.573 (0.877)	Data Time 0.001 (0.022)	Loss 3.4242 (3.6356)	Entropy 1.36283 (1.37034)	Top-1 acc 44.922 (38.395)	Top-5 acc 64.062 (62.257)	lr 0.02436
Train [13][910/3239]	Time 0.643 (0.877)	Data Time 0.001 (0.022)	Loss 3.5488 (3.6349)	Entropy 1.36244 (1.37026)	Top-1 acc 36.719 (38.391)	Top-5 acc 62.500 (62.265)	lr 0.02436
Train [13][920/3239]	Time 0.588 (0.876)	Data Time 0.001 (0.022)	Loss 3.7587 (3.6348)	Entropy 1.36223 (1.37017)	Top-1 acc 37.891 (38.401)	Top-5 acc 62.891 (62.271)	lr 0.02436
Train [13][930/3239]	Time 0.553 (0.876)	Data Time 0.001 (0.022)	Loss 3.7805 (3.6347)	Entropy 1.36215 (1.37009)	Top-1 acc 30.078 (38.394)	Top-5 acc 61.719 (62.273)	lr 0.02436
Train [13][940/3239]	Time 0.613 (0.876)	Data Time 0.001 (0.022)	Loss 3.7035 (3.6351)	Entropy 1.36216 (1.37000)	Top-1 acc 37.891 (38.378)	Top-5 acc 60.156 (62.263)	lr 0.02436
Train [13][950/3239]	Time 0.564 (0.875)	Data Time 0.001 (0.021)	Loss 3.7272 (3.6362)	Entropy 1.36241 (1.36992)	Top-1 acc 41.016 (38.377)	Top-5 acc 62.109 (62.245)	lr 0.02436
Train [13][960/3239]	Time 0.583 (0.875)	Data Time 0.001 (0.021)	Loss 3.6544 (3.6367)	Entropy 1.36185 (1.36984)	Top-1 acc 36.719 (38.371)	Top-5 acc 62.891 (62.237)	lr 0.02436
Train [13][970/3239]	Time 0.592 (0.875)	Data Time 0.001 (0.021)	Loss 3.5941 (3.6359)	Entropy 1.36150 (1.36975)	Top-1 acc 37.891 (38.390)	Top-5 acc 60.938 (62.263)	lr 0.02436
Train [13][980/3239]	Time 0.542 (0.874)	Data Time 0.001 (0.021)	Loss 3.8033 (3.6354)	Entropy 1.36089 (1.36967)	Top-1 acc 33.203 (38.385)	Top-5 acc 63.281 (62.285)	lr 0.02436
Train [13][990/3239]	Time 0.638 (0.874)	Data Time 0.035 (0.021)	Loss 3.5252 (3.6348)	Entropy 1.36066 (1.36958)	Top-1 acc 44.141 (38.400)	Top-5 acc 66.797 (62.312)	lr 0.02436
Train [13][1000/3239]	Time 0.558 (0.874)	Data Time 0.001 (0.020)	Loss 3.5939 (3.6350)	Entropy 1.36002 (1.36949)	Top-1 acc 37.891 (38.386)	Top-5 acc 66.016 (62.319)	lr 0.02436
Train [13][1010/3239]	Time 0.607 (0.873)	Data Time 0.001 (0.020)	Loss 3.6307 (3.6355)	Entropy 1.36011 (1.36939)	Top-1 acc 35.547 (38.384)	Top-5 acc 64.844 (62.318)	lr 0.02436
Train [13][1020/3239]	Time 0.594 (0.873)	Data Time 0.001 (0.020)	Loss 3.6594 (3.6357)	Entropy 1.35966 (1.36930)	Top-1 acc 39.844 (38.385)	Top-5 acc 63.281 (62.318)	lr 0.02436
Train [13][1030/3239]	Time 0.529 (0.872)	Data Time 0.001 (0.020)	Loss 3.4078 (3.6365)	Entropy 1.35927 (1.36921)	Top-1 acc 42.969 (38.371)	Top-5 acc 66.797 (62.306)	lr 0.02436
Train [13][1040/3239]	Time 0.592 (0.871)	Data Time 0.001 (0.020)	Loss 3.5621 (3.6361)	Entropy 1.35940 (1.36911)	Top-1 acc 40.625 (38.377)	Top-5 acc 67.578 (62.322)	lr 0.02436
Train [13][1050/3239]	Time 0.590 (0.890)	Data Time 0.002 (0.020)	Loss 3.7188 (3.6362)	Entropy 1.35922 (1.36902)	Top-1 acc 38.281 (38.375)	Top-5 acc 58.984 (62.321)	lr 0.02436
Train [13][1060/3239]	Time 0.568 (0.889)	Data Time 0.002 (0.019)	Loss 3.7772 (3.6354)	Entropy 1.35916 (1.36893)	Top-1 acc 37.891 (38.380)	Top-5 acc 56.250 (62.340)	lr 0.02435
Train [13][1070/3239]	Time 0.559 (0.889)	Data Time 0.002 (0.019)	Loss 3.7336 (3.6352)	Entropy 1.35925 (1.36883)	Top-1 acc 33.594 (38.375)	Top-5 acc 60.156 (62.349)	lr 0.02435
Train [13][1080/3239]	Time 0.582 (0.888)	Data Time 0.001 (0.019)	Loss 3.6423 (3.6360)	Entropy 1.35865 (1.36874)	Top-1 acc 37.500 (38.355)	Top-5 acc 60.156 (62.332)	lr 0.02435
Train [13][1090/3239]	Time 0.655 (0.888)	Data Time 0.001 (0.019)	Loss 3.4305 (3.6354)	Entropy 1.35840 (1.36865)	Top-1 acc 40.234 (38.366)	Top-5 acc 67.969 (62.346)	lr 0.02435
Train [13][1100/3239]	Time 0.595 (0.888)	Data Time 0.002 (0.019)	Loss 3.4609 (3.6351)	Entropy 1.35842 (1.36856)	Top-1 acc 40.234 (38.358)	Top-5 acc 66.016 (62.345)	lr 0.02435
Train [13][1110/3239]	Time 0.540 (0.887)	Data Time 0.001 (0.019)	Loss 3.6566 (3.6348)	Entropy 1.35861 (1.36847)	Top-1 acc 41.797 (38.371)	Top-5 acc 64.062 (62.345)	lr 0.02435
Train [13][1120/3239]	Time 0.604 (0.887)	Data Time 0.001 (0.019)	Loss 3.5220 (3.6347)	Entropy 1.35875 (1.36838)	Top-1 acc 41.016 (38.367)	Top-5 acc 67.188 (62.354)	lr 0.02435
Train [13][1130/3239]	Time 0.578 (0.887)	Data Time 0.002 (0.018)	Loss 3.7338 (3.6347)	Entropy 1.35867 (1.36830)	Top-1 acc 33.984 (38.373)	Top-5 acc 58.984 (62.351)	lr 0.02435
Train [13][1140/3239]	Time 0.558 (0.886)	Data Time 0.001 (0.018)	Loss 3.7944 (3.6357)	Entropy 1.35845 (1.36821)	Top-1 acc 35.156 (38.351)	Top-5 acc 59.375 (62.330)	lr 0.02435
Train [13][1150/3239]	Time 0.602 (0.886)	Data Time 0.001 (0.018)	Loss 3.5971 (3.6360)	Entropy 1.35826 (1.36813)	Top-1 acc 37.891 (38.335)	Top-5 acc 63.672 (62.323)	lr 0.02435
Train [13][1160/3239]	Time 0.665 (0.885)	Data Time 0.001 (0.018)	Loss 3.4419 (3.6360)	Entropy 1.35814 (1.36804)	Top-1 acc 46.484 (38.337)	Top-5 acc 64.453 (62.323)	lr 0.02435
Train [13][1170/3239]	Time 0.544 (0.885)	Data Time 0.001 (0.018)	Loss 3.6421 (3.6363)	Entropy 1.35802 (1.36795)	Top-1 acc 41.406 (38.334)	Top-5 acc 62.891 (62.316)	lr 0.02435
Train [13][1180/3239]	Time 0.540 (0.884)	Data Time 0.001 (0.018)	Loss 3.7077 (3.6365)	Entropy 1.35785 (1.36787)	Top-1 acc 39.844 (38.329)	Top-5 acc 58.984 (62.305)	lr 0.02435
Train [13][1190/3239]	Time 0.537 (0.883)	Data Time 0.001 (0.018)	Loss 3.6203 (3.6363)	Entropy 1.35771 (1.36778)	Top-1 acc 37.891 (38.331)	Top-5 acc 63.281 (62.308)	lr 0.02435
Train [13][1200/3239]	Time 0.607 (0.883)	Data Time 0.001 (0.017)	Loss 3.8307 (3.6369)	Entropy 1.35773 (1.36770)	Top-1 acc 39.062 (38.335)	Top-5 acc 60.156 (62.298)	lr 0.02435
Train [13][1210/3239]	Time 0.553 (0.882)	Data Time 0.001 (0.017)	Loss 3.7940 (3.6373)	Entropy 1.35767 (1.36762)	Top-1 acc 35.547 (38.324)	Top-5 acc 61.719 (62.294)	lr 0.02435
Train [13][1220/3239]	Time 0.558 (0.882)	Data Time 0.002 (0.017)	Loss 3.8363 (3.6380)	Entropy 1.35771 (1.36754)	Top-1 acc 33.203 (38.308)	Top-5 acc 59.766 (62.280)	lr 0.02435
Train [13][1230/3239]	Time 0.670 (0.882)	Data Time 0.001 (0.017)	Loss 3.6015 (3.6379)	Entropy 1.35754 (1.36746)	Top-1 acc 40.625 (38.309)	Top-5 acc 65.234 (62.293)	lr 0.02435
Train [13][1240/3239]	Time 0.525 (0.881)	Data Time 0.001 (0.017)	Loss 3.7082 (3.6378)	Entropy 1.35736 (1.36738)	Top-1 acc 33.984 (38.309)	Top-5 acc 59.766 (62.292)	lr 0.02435
Train [13][1250/3239]	Time 0.588 (0.881)	Data Time 0.001 (0.017)	Loss 3.6915 (3.6373)	Entropy 1.35715 (1.36730)	Top-1 acc 35.938 (38.314)	Top-5 acc 62.891 (62.303)	lr 0.02435
Train [13][1260/3239]	Time 0.568 (0.881)	Data Time 0.001 (0.017)	Loss 3.3911 (3.6370)	Entropy 1.35726 (1.36722)	Top-1 acc 44.141 (38.321)	Top-5 acc 66.406 (62.314)	lr 0.02435
Train [13][1270/3239]	Time 0.578 (0.880)	Data Time 0.001 (0.017)	Loss 3.4705 (3.6371)	Entropy 1.35680 (1.36714)	Top-1 acc 37.891 (38.314)	Top-5 acc 66.016 (62.312)	lr 0.02435
Train [13][1280/3239]	Time 0.627 (0.880)	Data Time 0.001 (0.016)	Loss 3.5101 (3.6369)	Entropy 1.35639 (1.36705)	Top-1 acc 42.578 (38.317)	Top-5 acc 65.625 (62.323)	lr 0.02435
Train [13][1290/3239]	Time 0.615 (0.880)	Data Time 0.001 (0.016)	Loss 3.6958 (3.6368)	Entropy 1.35630 (1.36697)	Top-1 acc 37.500 (38.315)	Top-5 acc 60.156 (62.321)	lr 0.02435
Train [13][1300/3239]	Time 0.614 (0.879)	Data Time 0.002 (0.016)	Loss 3.5562 (3.6364)	Entropy 1.35629 (1.36689)	Top-1 acc 39.844 (38.327)	Top-5 acc 65.625 (62.333)	lr 0.02435
Train [13][1310/3239]	Time 0.589 (0.879)	Data Time 0.001 (0.016)	Loss 3.4265 (3.6359)	Entropy 1.35624 (1.36681)	Top-1 acc 42.188 (38.340)	Top-5 acc 68.750 (62.346)	lr 0.02435
Train [13][1320/3239]	Time 0.718 (0.879)	Data Time 0.001 (0.016)	Loss 3.5381 (3.6359)	Entropy 1.35599 (1.36673)	Top-1 acc 36.719 (38.338)	Top-5 acc 64.453 (62.345)	lr 0.02435
Train [13][1330/3239]	Time 0.560 (0.879)	Data Time 0.001 (0.016)	Loss 3.6431 (3.6359)	Entropy 1.35577 (1.36664)	Top-1 acc 40.234 (38.335)	Top-5 acc 60.547 (62.342)	lr 0.02435
Train [13][1340/3239]	Time 0.622 (0.878)	Data Time 0.001 (0.016)	Loss 3.4825 (3.6358)	Entropy 1.35589 (1.36656)	Top-1 acc 37.891 (38.337)	Top-5 acc 61.328 (62.340)	lr 0.02435
Train [13][1350/3239]	Time 0.633 (0.878)	Data Time 0.001 (0.016)	Loss 3.6250 (3.6363)	Entropy 1.35542 (1.36648)	Top-1 acc 37.109 (38.328)	Top-5 acc 62.891 (62.330)	lr 0.02435
Train [13][1360/3239]	Time 0.613 (0.877)	Data Time 0.001 (0.016)	Loss 3.5226 (3.6363)	Entropy 1.35467 (1.36640)	Top-1 acc 40.234 (38.323)	Top-5 acc 62.109 (62.335)	lr 0.02435
Train [13][1370/3239]	Time 0.572 (0.877)	Data Time 0.001 (0.016)	Loss 3.4906 (3.6360)	Entropy 1.35487 (1.36632)	Top-1 acc 41.797 (38.327)	Top-5 acc 65.625 (62.342)	lr 0.02434
Train [13][1380/3239]	Time 0.621 (0.877)	Data Time 0.001 (0.015)	Loss 3.5840 (3.6359)	Entropy 1.35465 (1.36623)	Top-1 acc 35.938 (38.322)	Top-5 acc 62.891 (62.344)	lr 0.02434
Train [13][1390/3239]	Time 0.645 (0.877)	Data Time 0.001 (0.015)	Loss 3.6274 (3.6359)	Entropy 1.35454 (1.36615)	Top-1 acc 37.109 (38.324)	Top-5 acc 62.109 (62.346)	lr 0.02434
Train [13][1400/3239]	Time 0.569 (0.876)	Data Time 0.001 (0.015)	Loss 3.5299 (3.6356)	Entropy 1.35451 (1.36607)	Top-1 acc 36.719 (38.332)	Top-5 acc 64.062 (62.355)	lr 0.02434
Train [13][1410/3239]	Time 0.560 (0.876)	Data Time 0.001 (0.015)	Loss 3.4930 (3.6358)	Entropy 1.35417 (1.36598)	Top-1 acc 42.969 (38.330)	Top-5 acc 65.625 (62.351)	lr 0.02434
Train [13][1420/3239]	Time 0.554 (0.876)	Data Time 0.001 (0.015)	Loss 3.8476 (3.6360)	Entropy 1.35411 (1.36590)	Top-1 acc 35.938 (38.328)	Top-5 acc 57.031 (62.339)	lr 0.02434
Train [13][1430/3239]	Time 0.586 (0.875)	Data Time 0.001 (0.015)	Loss 3.6159 (3.6364)	Entropy 1.35391 (1.36582)	Top-1 acc 37.891 (38.316)	Top-5 acc 63.281 (62.331)	lr 0.02434
Train [13][1440/3239]	Time 0.569 (0.875)	Data Time 0.001 (0.015)	Loss 3.6592 (3.6367)	Entropy 1.35396 (1.36573)	Top-1 acc 37.891 (38.309)	Top-5 acc 61.719 (62.320)	lr 0.02434
Train [13][1450/3239]	Time 0.578 (0.875)	Data Time 0.001 (0.015)	Loss 3.6377 (3.6367)	Entropy 1.35386 (1.36565)	Top-1 acc 37.891 (38.306)	Top-5 acc 62.891 (62.313)	lr 0.02434
Train [13][1460/3239]	Time 0.587 (0.875)	Data Time 0.001 (0.015)	Loss 3.6117 (3.6372)	Entropy 1.35421 (1.36557)	Top-1 acc 37.891 (38.306)	Top-5 acc 64.062 (62.305)	lr 0.02434
Train [13][1470/3239]	Time 0.609 (0.874)	Data Time 0.001 (0.015)	Loss 3.4526 (3.6369)	Entropy 1.35396 (1.36550)	Top-1 acc 45.312 (38.306)	Top-5 acc 65.234 (62.310)	lr 0.02434
Train [13][1480/3239]	Time 0.544 (0.874)	Data Time 0.001 (0.015)	Loss 3.6225 (3.6375)	Entropy 1.35392 (1.36542)	Top-1 acc 42.969 (38.297)	Top-5 acc 64.844 (62.300)	lr 0.02434
Train [13][1490/3239]	Time 0.576 (0.874)	Data Time 0.001 (0.014)	Loss 3.7869 (3.6379)	Entropy 1.35411 (1.36534)	Top-1 acc 34.766 (38.288)	Top-5 acc 57.422 (62.296)	lr 0.02434
Train [13][1500/3239]	Time 0.588 (0.873)	Data Time 0.001 (0.014)	Loss 3.5631 (3.6381)	Entropy 1.35423 (1.36527)	Top-1 acc 38.672 (38.282)	Top-5 acc 64.453 (62.285)	lr 0.02434
Train [13][1510/3239]	Time 0.594 (0.873)	Data Time 0.001 (0.014)	Loss 3.6945 (3.6376)	Entropy 1.35431 (1.36519)	Top-1 acc 35.547 (38.288)	Top-5 acc 59.766 (62.292)	lr 0.02434
Train [13][1520/3239]	Time 0.470 (0.872)	Data Time 0.001 (0.014)	Loss 3.7213 (3.6381)	Entropy 1.35417 (1.36512)	Top-1 acc 34.766 (38.277)	Top-5 acc 57.031 (62.282)	lr 0.02434
Train [13][1530/3239]	Time 0.474 (0.872)	Data Time 0.002 (0.014)	Loss 3.3327 (3.6378)	Entropy 1.35422 (1.36505)	Top-1 acc 42.188 (38.284)	Top-5 acc 69.531 (62.291)	lr 0.02434
Train [13][1540/3239]	Time 0.599 (0.872)	Data Time 0.001 (0.014)	Loss 3.5603 (3.6381)	Entropy 1.35401 (1.36498)	Top-1 acc 40.234 (38.284)	Top-5 acc 64.453 (62.290)	lr 0.02434
Train [13][1550/3239]	Time 0.724 (0.872)	Data Time 0.001 (0.014)	Loss 3.6208 (3.6384)	Entropy 1.35377 (1.36491)	Top-1 acc 38.281 (38.277)	Top-5 acc 60.547 (62.280)	lr 0.02434
Train [13][1560/3239]	Time 0.567 (0.871)	Data Time 0.001 (0.014)	Loss 3.6451 (3.6387)	Entropy 1.35383 (1.36484)	Top-1 acc 37.500 (38.265)	Top-5 acc 60.938 (62.273)	lr 0.02434
Train [13][1570/3239]	Time 0.590 (0.871)	Data Time 0.001 (0.014)	Loss 3.7402 (3.6391)	Entropy 1.35360 (1.36477)	Top-1 acc 32.031 (38.260)	Top-5 acc 60.547 (62.267)	lr 0.02434
Train [13][1580/3239]	Time 0.605 (0.871)	Data Time 0.001 (0.014)	Loss 3.7817 (3.6392)	Entropy 1.35342 (1.36470)	Top-1 acc 35.547 (38.257)	Top-5 acc 55.859 (62.262)	lr 0.02434
Train [13][1590/3239]	Time 0.551 (0.870)	Data Time 0.001 (0.014)	Loss 3.4590 (3.6395)	Entropy 1.35329 (1.36462)	Top-1 acc 42.578 (38.259)	Top-5 acc 64.844 (62.254)	lr 0.02434
Train [13][1600/3239]	Time 0.588 (0.870)	Data Time 0.001 (0.014)	Loss 3.5971 (3.6391)	Entropy 1.35337 (1.36455)	Top-1 acc 39.453 (38.267)	Top-5 acc 64.062 (62.267)	lr 0.02434
Train [13][1610/3239]	Time 0.525 (0.870)	Data Time 0.001 (0.014)	Loss 3.6575 (3.6389)	Entropy 1.35304 (1.36448)	Top-1 acc 38.672 (38.275)	Top-5 acc 60.547 (62.270)	lr 0.02434
Train [13][1620/3239]	Time 0.731 (0.870)	Data Time 0.001 (0.013)	Loss 3.5386 (3.6386)	Entropy 1.35273 (1.36441)	Top-1 acc 41.797 (38.283)	Top-5 acc 64.453 (62.280)	lr 0.02434
Train [13][1630/3239]	Time 0.577 (0.870)	Data Time 0.001 (0.013)	Loss 3.5852 (3.6388)	Entropy 1.35266 (1.36434)	Top-1 acc 42.188 (38.280)	Top-5 acc 59.766 (62.270)	lr 0.02434
Train [13][1640/3239]	Time 0.579 (0.869)	Data Time 0.002 (0.013)	Loss 3.8194 (3.6389)	Entropy 1.35256 (1.36427)	Top-1 acc 34.375 (38.274)	Top-5 acc 56.641 (62.270)	lr 0.02434
Train [13][1650/3239]	Time 0.585 (0.869)	Data Time 0.001 (0.013)	Loss 3.7566 (3.6389)	Entropy 1.35260 (1.36420)	Top-1 acc 34.375 (38.271)	Top-5 acc 61.328 (62.275)	lr 0.02434
Train [13][1660/3239]	Time 0.561 (0.869)	Data Time 0.001 (0.013)	Loss 3.6796 (3.6388)	Entropy 1.35287 (1.36413)	Top-1 acc 38.672 (38.276)	Top-5 acc 64.062 (62.275)	lr 0.02434
Train [13][1670/3239]	Time 0.619 (0.869)	Data Time 0.001 (0.013)	Loss 3.8939 (3.6386)	Entropy 1.35278 (1.36406)	Top-1 acc 29.297 (38.282)	Top-5 acc 55.859 (62.277)	lr 0.02434
Train [13][1680/3239]	Time 0.575 (0.869)	Data Time 0.001 (0.013)	Loss 3.3198 (3.6382)	Entropy 1.35222 (1.36399)	Top-1 acc 44.141 (38.285)	Top-5 acc 70.703 (62.282)	lr 0.02433
Train [13][1690/3239]	Time 0.691 (0.869)	Data Time 0.001 (0.013)	Loss 3.7156 (3.6380)	Entropy 1.35234 (1.36392)	Top-1 acc 33.203 (38.290)	Top-5 acc 62.109 (62.282)	lr 0.02433
Train [13][1700/3239]	Time 0.697 (0.880)	Data Time 0.005 (0.013)	Loss 3.8484 (3.6381)	Entropy 1.35241 (1.36386)	Top-1 acc 32.812 (38.288)	Top-5 acc 57.031 (62.281)	lr 0.02433
Train [13][1710/3239]	Time 0.643 (0.880)	Data Time 0.002 (0.013)	Loss 3.6068 (3.6380)	Entropy 1.35224 (1.36379)	Top-1 acc 41.797 (38.290)	Top-5 acc 61.719 (62.279)	lr 0.02433
Train [13][1720/3239]	Time 0.573 (0.880)	Data Time 0.002 (0.013)	Loss 3.7682 (3.6379)	Entropy 1.35216 (1.36372)	Top-1 acc 35.547 (38.289)	Top-5 acc 59.766 (62.280)	lr 0.02433
Train [13][1730/3239]	Time 0.530 (0.879)	Data Time 0.001 (0.013)	Loss 3.8153 (3.6379)	Entropy 1.35156 (1.36365)	Top-1 acc 33.984 (38.290)	Top-5 acc 60.547 (62.275)	lr 0.02433
Train [13][1740/3239]	Time 0.563 (0.879)	Data Time 0.001 (0.013)	Loss 3.6371 (3.6373)	Entropy 1.35097 (1.36358)	Top-1 acc 37.891 (38.302)	Top-5 acc 60.938 (62.292)	lr 0.02433
Train [13][1750/3239]	Time 0.543 (0.879)	Data Time 0.001 (0.013)	Loss 3.6285 (3.6376)	Entropy 1.35119 (1.36351)	Top-1 acc 37.891 (38.295)	Top-5 acc 65.625 (62.289)	lr 0.02433
Train [13][1760/3239]	Time 0.589 (0.879)	Data Time 0.003 (0.013)	Loss 3.6332 (3.6374)	Entropy 1.35096 (1.36344)	Top-1 acc 39.453 (38.300)	Top-5 acc 62.500 (62.295)	lr 0.02433
Train [13][1770/3239]	Time 0.459 (0.878)	Data Time 0.001 (0.012)	Loss 3.8076 (3.6375)	Entropy 1.35043 (1.36337)	Top-1 acc 33.203 (38.295)	Top-5 acc 58.984 (62.294)	lr 0.02433
Train [13][1780/3239]	Time 0.615 (0.878)	Data Time 0.001 (0.013)	Loss 3.7453 (3.6374)	Entropy 1.35014 (1.36330)	Top-1 acc 35.938 (38.297)	Top-5 acc 59.375 (62.294)	lr 0.02433
Train [13][1790/3239]	Time 0.579 (0.878)	Data Time 0.001 (0.012)	Loss 3.6218 (3.6373)	Entropy 1.34959 (1.36322)	Top-1 acc 38.672 (38.294)	Top-5 acc 60.156 (62.296)	lr 0.02433
Train [13][1800/3239]	Time 0.625 (0.878)	Data Time 0.001 (0.012)	Loss 3.6530 (3.6370)	Entropy 1.34938 (1.36315)	Top-1 acc 35.547 (38.299)	Top-5 acc 62.500 (62.306)	lr 0.02433
Train [13][1810/3239]	Time 0.498 (0.878)	Data Time 0.001 (0.012)	Loss 3.5539 (3.6368)	Entropy 1.34902 (1.36307)	Top-1 acc 35.547 (38.304)	Top-5 acc 62.500 (62.308)	lr 0.02433
Train [13][1820/3239]	Time 0.591 (0.877)	Data Time 0.001 (0.012)	Loss 4.0030 (3.6370)	Entropy 1.34842 (1.36299)	Top-1 acc 26.953 (38.299)	Top-5 acc 53.125 (62.304)	lr 0.02433
Train [13][1830/3239]	Time 0.596 (0.877)	Data Time 0.001 (0.012)	Loss 3.6347 (3.6367)	Entropy 1.34883 (1.36291)	Top-1 acc 37.891 (38.304)	Top-5 acc 64.062 (62.312)	lr 0.02433
Train [13][1840/3239]	Time 0.534 (0.877)	Data Time 0.001 (0.012)	Loss 3.6892 (3.6364)	Entropy 1.34866 (1.36284)	Top-1 acc 35.547 (38.305)	Top-5 acc 59.766 (62.314)	lr 0.02433
Train [13][1850/3239]	Time 0.570 (0.877)	Data Time 0.001 (0.012)	Loss 3.5620 (3.6363)	Entropy 1.34850 (1.36276)	Top-1 acc 36.328 (38.303)	Top-5 acc 65.625 (62.314)	lr 0.02433
Train [13][1860/3239]	Time 0.563 (0.876)	Data Time 0.001 (0.012)	Loss 3.7567 (3.6361)	Entropy 1.34824 (1.36268)	Top-1 acc 33.984 (38.308)	Top-5 acc 58.984 (62.317)	lr 0.02433
Train [13][1870/3239]	Time 0.566 (0.876)	Data Time 0.001 (0.012)	Loss 3.4794 (3.6363)	Entropy 1.34802 (1.36261)	Top-1 acc 42.969 (38.303)	Top-5 acc 67.969 (62.312)	lr 0.02433
Train [13][1880/3239]	Time 0.551 (0.876)	Data Time 0.002 (0.012)	Loss 3.7460 (3.6363)	Entropy 1.34750 (1.36253)	Top-1 acc 35.156 (38.300)	Top-5 acc 62.500 (62.315)	lr 0.02433
Train [13][1890/3239]	Time 0.586 (0.876)	Data Time 0.001 (0.012)	Loss 3.6686 (3.6362)	Entropy 1.34739 (1.36245)	Top-1 acc 36.328 (38.301)	Top-5 acc 61.719 (62.317)	lr 0.02433
Train [13][1900/3239]	Time 0.590 (0.876)	Data Time 0.001 (0.012)	Loss 3.5526 (3.6365)	Entropy 1.34724 (1.36237)	Top-1 acc 39.062 (38.291)	Top-5 acc 61.328 (62.307)	lr 0.02433
Train [13][1910/3239]	Time 0.596 (0.876)	Data Time 0.001 (0.012)	Loss 3.9428 (3.6367)	Entropy 1.34679 (1.36229)	Top-1 acc 32.422 (38.288)	Top-5 acc 54.297 (62.297)	lr 0.02433
Train [13][1920/3239]	Time 0.720 (0.875)	Data Time 0.001 (0.012)	Loss 3.6949 (3.6365)	Entropy 1.34685 (1.36221)	Top-1 acc 38.281 (38.292)	Top-5 acc 59.766 (62.302)	lr 0.02433
Train [13][1930/3239]	Time 0.604 (0.875)	Data Time 0.001 (0.012)	Loss 3.6606 (3.6367)	Entropy 1.34649 (1.36213)	Top-1 acc 39.844 (38.292)	Top-5 acc 62.891 (62.304)	lr 0.02433
Train [13][1940/3239]	Time 0.554 (0.875)	Data Time 0.001 (0.012)	Loss 3.6199 (3.6364)	Entropy 1.34590 (1.36204)	Top-1 acc 40.234 (38.290)	Top-5 acc 63.672 (62.307)	lr 0.02433
Train [13][1950/3239]	Time 0.578 (0.875)	Data Time 0.002 (0.012)	Loss 3.6268 (3.6364)	Entropy 1.34555 (1.36196)	Top-1 acc 38.672 (38.293)	Top-5 acc 63.281 (62.312)	lr 0.02433
Train [13][1960/3239]	Time 0.549 (0.875)	Data Time 0.001 (0.012)	Loss 3.5759 (3.6363)	Entropy 1.34567 (1.36188)	Top-1 acc 40.625 (38.296)	Top-5 acc 62.891 (62.319)	lr 0.02433
Train [13][1970/3239]	Time 0.624 (0.875)	Data Time 0.001 (0.012)	Loss 3.5164 (3.6361)	Entropy 1.34532 (1.36179)	Top-1 acc 39.844 (38.299)	Top-5 acc 66.797 (62.323)	lr 0.02433
Train [13][1980/3239]	Time 0.622 (0.874)	Data Time 0.002 (0.011)	Loss 3.5247 (3.6362)	Entropy 1.34507 (1.36171)	Top-1 acc 37.891 (38.298)	Top-5 acc 65.625 (62.324)	lr 0.02432
Train [13][1990/3239]	Time 0.689 (0.874)	Data Time 0.001 (0.011)	Loss 3.4644 (3.6360)	Entropy 1.34543 (1.36163)	Top-1 acc 40.234 (38.304)	Top-5 acc 65.625 (62.329)	lr 0.02432
Train [13][2000/3239]	Time 0.575 (0.874)	Data Time 0.001 (0.011)	Loss 3.6996 (3.6359)	Entropy 1.34527 (1.36155)	Top-1 acc 36.328 (38.308)	Top-5 acc 60.547 (62.328)	lr 0.02432
Train [13][2010/3239]	Time 0.577 (0.873)	Data Time 0.001 (0.011)	Loss 3.5905 (3.6358)	Entropy 1.34486 (1.36147)	Top-1 acc 37.891 (38.313)	Top-5 acc 61.719 (62.330)	lr 0.02432
Train [13][2020/3239]	Time 0.580 (0.873)	Data Time 0.001 (0.011)	Loss 3.6644 (3.6359)	Entropy 1.34516 (1.36138)	Top-1 acc 39.844 (38.317)	Top-5 acc 60.156 (62.321)	lr 0.02432
Train [13][2030/3239]	Time 0.556 (0.873)	Data Time 0.001 (0.011)	Loss 3.5221 (3.6358)	Entropy 1.34480 (1.36130)	Top-1 acc 42.969 (38.320)	Top-5 acc 63.281 (62.326)	lr 0.02432
Train [13][2040/3239]	Time 0.561 (0.873)	Data Time 0.001 (0.011)	Loss 3.8071 (3.6358)	Entropy 1.34449 (1.36122)	Top-1 acc 32.812 (38.315)	Top-5 acc 56.641 (62.324)	lr 0.02432
Train [13][2050/3239]	Time 0.556 (0.873)	Data Time 0.001 (0.011)	Loss 3.6628 (3.6358)	Entropy 1.34439 (1.36114)	Top-1 acc 39.062 (38.316)	Top-5 acc 60.938 (62.324)	lr 0.02432
Train [13][2060/3239]	Time 0.680 (0.873)	Data Time 0.001 (0.011)	Loss 3.5266 (3.6358)	Entropy 1.34431 (1.36106)	Top-1 acc 39.062 (38.313)	Top-5 acc 64.844 (62.320)	lr 0.02432
Train [13][2070/3239]	Time 0.577 (0.873)	Data Time 0.001 (0.011)	Loss 3.8579 (3.6361)	Entropy 1.34405 (1.36098)	Top-1 acc 32.812 (38.310)	Top-5 acc 55.078 (62.313)	lr 0.02432
Train [13][2080/3239]	Time 0.600 (0.872)	Data Time 0.001 (0.011)	Loss 3.6968 (3.6360)	Entropy 1.34376 (1.36090)	Top-1 acc 37.109 (38.315)	Top-5 acc 62.109 (62.316)	lr 0.02432
Train [13][2090/3239]	Time 0.609 (0.872)	Data Time 0.001 (0.011)	Loss 3.4933 (3.6358)	Entropy 1.34331 (1.36081)	Top-1 acc 40.625 (38.318)	Top-5 acc 65.234 (62.323)	lr 0.02432
Train [13][2100/3239]	Time 0.567 (0.872)	Data Time 0.001 (0.011)	Loss 3.6691 (3.6355)	Entropy 1.34310 (1.36073)	Top-1 acc 37.891 (38.320)	Top-5 acc 60.156 (62.326)	lr 0.02432
Train [13][2110/3239]	Time 0.650 (0.872)	Data Time 0.001 (0.011)	Loss 3.6286 (3.6353)	Entropy 1.34315 (1.36065)	Top-1 acc 38.281 (38.321)	Top-5 acc 62.109 (62.330)	lr 0.02432
Train [13][2120/3239]	Time 0.594 (0.872)	Data Time 0.001 (0.011)	Loss 3.7430 (3.6354)	Entropy 1.34321 (1.36056)	Top-1 acc 33.594 (38.320)	Top-5 acc 61.328 (62.332)	lr 0.02432
Train [13][2130/3239]	Time 0.678 (0.872)	Data Time 0.001 (0.011)	Loss 3.6529 (3.6352)	Entropy 1.34300 (1.36048)	Top-1 acc 33.984 (38.323)	Top-5 acc 60.938 (62.339)	lr 0.02432
Train [13][2140/3239]	Time 0.589 (0.872)	Data Time 0.001 (0.011)	Loss 3.6787 (3.6348)	Entropy 1.34256 (1.36040)	Top-1 acc 42.188 (38.329)	Top-5 acc 60.156 (62.346)	lr 0.02432
Train [13][2150/3239]	Time 0.542 (0.871)	Data Time 0.001 (0.011)	Loss 3.4622 (3.6349)	Entropy 1.34262 (1.36032)	Top-1 acc 38.672 (38.324)	Top-5 acc 68.359 (62.343)	lr 0.02432
Train [13][2160/3239]	Time 0.538 (0.871)	Data Time 0.001 (0.011)	Loss 3.7199 (3.6348)	Entropy 1.34241 (1.36024)	Top-1 acc 38.672 (38.330)	Top-5 acc 60.547 (62.346)	lr 0.02432
Train [13][2170/3239]	Time 0.459 (0.871)	Data Time 0.001 (0.011)	Loss 3.5027 (3.6348)	Entropy 1.34241 (1.36015)	Top-1 acc 42.969 (38.330)	Top-5 acc 65.234 (62.345)	lr 0.02432
Train [13][2180/3239]	Time 0.460 (0.871)	Data Time 0.001 (0.011)	Loss 3.6126 (3.6350)	Entropy 1.34255 (1.36007)	Top-1 acc 39.844 (38.323)	Top-5 acc 64.062 (62.341)	lr 0.02432
Train [13][2190/3239]	Time 0.599 (0.870)	Data Time 0.001 (0.011)	Loss 3.5208 (3.6348)	Entropy 1.34265 (1.35999)	Top-1 acc 40.234 (38.323)	Top-5 acc 62.500 (62.344)	lr 0.02432
Train [13][2200/3239]	Time 0.585 (0.870)	Data Time 0.001 (0.011)	Loss 3.6841 (3.6349)	Entropy 1.34275 (1.35991)	Top-1 acc 37.500 (38.323)	Top-5 acc 61.719 (62.339)	lr 0.02432
Train [13][2210/3239]	Time 0.605 (0.870)	Data Time 0.001 (0.010)	Loss 3.6479 (3.6349)	Entropy 1.34250 (1.35984)	Top-1 acc 34.766 (38.321)	Top-5 acc 63.281 (62.340)	lr 0.02432
Train [13][2220/3239]	Time 0.550 (0.870)	Data Time 0.001 (0.010)	Loss 3.7007 (3.6349)	Entropy 1.34240 (1.35976)	Top-1 acc 38.672 (38.329)	Top-5 acc 59.766 (62.338)	lr 0.02432
Train [13][2230/3239]	Time 0.578 (0.870)	Data Time 0.001 (0.010)	Loss 3.4449 (3.6348)	Entropy 1.34215 (1.35968)	Top-1 acc 43.750 (38.330)	Top-5 acc 67.969 (62.341)	lr 0.02432
Train [13][2240/3239]	Time 0.563 (0.870)	Data Time 0.001 (0.010)	Loss 3.6266 (3.6347)	Entropy 1.34207 (1.35960)	Top-1 acc 40.625 (38.330)	Top-5 acc 60.547 (62.343)	lr 0.02432
Train [13][2250/3239]	Time 0.612 (0.869)	Data Time 0.001 (0.010)	Loss 3.6182 (3.6346)	Entropy 1.34219 (1.35952)	Top-1 acc 39.453 (38.329)	Top-5 acc 65.234 (62.344)	lr 0.02432
Train [13][2260/3239]	Time 0.598 (0.869)	Data Time 0.002 (0.010)	Loss 3.9712 (3.6346)	Entropy 1.34209 (1.35945)	Top-1 acc 31.641 (38.328)	Top-5 acc 55.469 (62.346)	lr 0.02432
Train [13][2270/3239]	Time 0.597 (0.869)	Data Time 0.001 (0.010)	Loss 3.6930 (3.6347)	Entropy 1.34161 (1.35937)	Top-1 acc 40.625 (38.329)	Top-5 acc 59.766 (62.344)	lr 0.02432
Train [13][2280/3239]	Time 0.544 (0.869)	Data Time 0.001 (0.010)	Loss 3.8701 (3.6346)	Entropy 1.34159 (1.35929)	Top-1 acc 30.859 (38.319)	Top-5 acc 57.031 (62.348)	lr 0.02432
Train [13][2290/3239]	Time 0.693 (0.869)	Data Time 0.001 (0.010)	Loss 3.7820 (3.6347)	Entropy 1.34136 (1.35921)	Top-1 acc 36.328 (38.322)	Top-5 acc 58.984 (62.350)	lr 0.02431
Train [13][2300/3239]	Time 0.585 (0.869)	Data Time 0.001 (0.010)	Loss 3.7806 (3.6348)	Entropy 1.34154 (1.35914)	Top-1 acc 34.766 (38.324)	Top-5 acc 59.766 (62.348)	lr 0.02431
Train [13][2310/3239]	Time 0.605 (0.869)	Data Time 0.001 (0.010)	Loss 3.5449 (3.6350)	Entropy 1.34161 (1.35906)	Top-1 acc 41.016 (38.320)	Top-5 acc 64.453 (62.346)	lr 0.02431
Train [13][2320/3239]	Time 0.596 (0.868)	Data Time 0.001 (0.010)	Loss 3.7059 (3.6350)	Entropy 1.34140 (1.35898)	Top-1 acc 38.672 (38.320)	Top-5 acc 60.156 (62.344)	lr 0.02431
Train [13][2330/3239]	Time 0.666 (0.868)	Data Time 0.001 (0.010)	Loss 3.7817 (3.6352)	Entropy 1.34139 (1.35891)	Top-1 acc 34.766 (38.314)	Top-5 acc 60.938 (62.340)	lr 0.02431
Train [13][2340/3239]	Time 0.570 (0.868)	Data Time 0.001 (0.010)	Loss 3.6654 (3.6348)	Entropy 1.34124 (1.35883)	Top-1 acc 35.547 (38.325)	Top-5 acc 63.672 (62.349)	lr 0.02431
Train [13][2350/3239]	Time 0.591 (0.868)	Data Time 0.001 (0.010)	Loss 3.6446 (3.6349)	Entropy 1.34108 (1.35876)	Top-1 acc 38.672 (38.326)	Top-5 acc 60.547 (62.349)	lr 0.02431
Train [13][2360/3239]	Time 0.667 (0.876)	Data Time 0.002 (0.010)	Loss 3.6528 (3.6351)	Entropy 1.34098 (1.35868)	Top-1 acc 38.281 (38.321)	Top-5 acc 62.500 (62.342)	lr 0.02431
Train [13][2370/3239]	Time 0.564 (0.876)	Data Time 0.003 (0.010)	Loss 3.7482 (3.6353)	Entropy 1.34113 (1.35861)	Top-1 acc 33.594 (38.317)	Top-5 acc 59.766 (62.338)	lr 0.02431
Train [13][2380/3239]	Time 0.608 (0.876)	Data Time 0.001 (0.010)	Loss 3.7447 (3.6355)	Entropy 1.34039 (1.35854)	Top-1 acc 33.594 (38.311)	Top-5 acc 58.594 (62.333)	lr 0.02431
Train [13][2390/3239]	Time 0.555 (0.876)	Data Time 0.001 (0.010)	Loss 3.4392 (3.6354)	Entropy 1.34006 (1.35846)	Top-1 acc 42.969 (38.312)	Top-5 acc 66.016 (62.337)	lr 0.02431
Train [13][2400/3239]	Time 0.514 (0.876)	Data Time 0.001 (0.010)	Loss 3.6591 (3.6355)	Entropy 1.33998 (1.35838)	Top-1 acc 36.719 (38.311)	Top-5 acc 59.766 (62.332)	lr 0.02431
Train [13][2410/3239]	Time 0.602 (0.876)	Data Time 0.001 (0.010)	Loss 3.6217 (3.6356)	Entropy 1.33971 (1.35831)	Top-1 acc 41.016 (38.308)	Top-5 acc 64.062 (62.333)	lr 0.02431
Train [13][2420/3239]	Time 0.553 (0.876)	Data Time 0.001 (0.010)	Loss 3.4423 (3.6355)	Entropy 1.33988 (1.35823)	Top-1 acc 40.234 (38.311)	Top-5 acc 66.797 (62.337)	lr 0.02431
Train [13][2430/3239]	Time 0.596 (0.876)	Data Time 0.001 (0.010)	Loss 3.7586 (3.6352)	Entropy 1.33964 (1.35815)	Top-1 acc 37.109 (38.315)	Top-5 acc 60.156 (62.343)	lr 0.02431
Train [13][2440/3239]	Time 0.582 (0.875)	Data Time 0.001 (0.010)	Loss 3.4995 (3.6352)	Entropy 1.33983 (1.35808)	Top-1 acc 40.625 (38.312)	Top-5 acc 66.406 (62.345)	lr 0.02431
Train [13][2450/3239]	Time 0.580 (0.875)	Data Time 0.001 (0.010)	Loss 3.7458 (3.6349)	Entropy 1.33990 (1.35800)	Top-1 acc 36.328 (38.316)	Top-5 acc 62.500 (62.349)	lr 0.02431
Train [13][2460/3239]	Time 0.533 (0.875)	Data Time 0.001 (0.010)	Loss 3.7028 (3.6349)	Entropy 1.33956 (1.35793)	Top-1 acc 37.500 (38.313)	Top-5 acc 62.109 (62.345)	lr 0.02431
Train [13][2470/3239]	Time 0.630 (0.875)	Data Time 0.002 (0.010)	Loss 3.6802 (3.6350)	Entropy 1.33938 (1.35786)	Top-1 acc 37.500 (38.311)	Top-5 acc 62.500 (62.346)	lr 0.02431
Train [13][2480/3239]	Time 0.537 (0.875)	Data Time 0.001 (0.010)	Loss 3.6013 (3.6348)	Entropy 1.33885 (1.35778)	Top-1 acc 40.625 (38.314)	Top-5 acc 62.891 (62.348)	lr 0.02431
Train [13][2490/3239]	Time 0.652 (0.874)	Data Time 0.001 (0.010)	Loss 3.4467 (3.6348)	Entropy 1.33881 (1.35770)	Top-1 acc 42.969 (38.316)	Top-5 acc 63.672 (62.347)	lr 0.02431
Train [13][2500/3239]	Time 0.626 (0.874)	Data Time 0.001 (0.010)	Loss 3.7798 (3.6347)	Entropy 1.33877 (1.35763)	Top-1 acc 36.328 (38.317)	Top-5 acc 56.250 (62.347)	lr 0.02431
Train [13][2510/3239]	Time 0.585 (0.874)	Data Time 0.001 (0.009)	Loss 3.6822 (3.6349)	Entropy 1.33874 (1.35755)	Top-1 acc 39.844 (38.314)	Top-5 acc 62.109 (62.340)	lr 0.02431
Train [13][2520/3239]	Time 0.666 (0.874)	Data Time 0.001 (0.009)	Loss 3.6705 (3.6352)	Entropy 1.33888 (1.35748)	Top-1 acc 37.891 (38.312)	Top-5 acc 62.109 (62.332)	lr 0.02431
Train [13][2530/3239]	Time 0.635 (0.874)	Data Time 0.001 (0.009)	Loss 3.6077 (3.6353)	Entropy 1.33856 (1.35741)	Top-1 acc 40.625 (38.312)	Top-5 acc 59.375 (62.328)	lr 0.02431
Train [13][2540/3239]	Time 0.565 (0.874)	Data Time 0.001 (0.009)	Loss 3.7490 (3.6353)	Entropy 1.33836 (1.35733)	Top-1 acc 36.719 (38.317)	Top-5 acc 59.375 (62.326)	lr 0.02431
Train [13][2550/3239]	Time 0.543 (0.873)	Data Time 0.001 (0.009)	Loss 3.7553 (3.6354)	Entropy 1.33827 (1.35726)	Top-1 acc 35.156 (38.316)	Top-5 acc 60.938 (62.325)	lr 0.02431
Train [13][2560/3239]	Time 0.504 (0.873)	Data Time 0.002 (0.009)	Loss 3.6978 (3.6359)	Entropy 1.33795 (1.35718)	Top-1 acc 37.109 (38.311)	Top-5 acc 59.766 (62.311)	lr 0.02431
Train [13][2570/3239]	Time 0.595 (0.873)	Data Time 0.002 (0.009)	Loss 3.5137 (3.6356)	Entropy 1.33793 (1.35711)	Top-1 acc 39.062 (38.314)	Top-5 acc 66.406 (62.316)	lr 0.02431
Train [13][2580/3239]	Time 0.581 (0.873)	Data Time 0.001 (0.009)	Loss 3.6707 (3.6354)	Entropy 1.33766 (1.35703)	Top-1 acc 37.891 (38.320)	Top-5 acc 60.156 (62.320)	lr 0.02431
Train [13][2590/3239]	Time 0.709 (0.873)	Data Time 0.001 (0.009)	Loss 3.6363 (3.6352)	Entropy 1.33746 (1.35696)	Top-1 acc 40.234 (38.321)	Top-5 acc 62.891 (62.322)	lr 0.02430
Train [13][2600/3239]	Time 0.604 (0.873)	Data Time 0.001 (0.009)	Loss 3.6475 (3.6352)	Entropy 1.33713 (1.35688)	Top-1 acc 35.547 (38.320)	Top-5 acc 59.375 (62.320)	lr 0.02430
Train [13][2610/3239]	Time 0.642 (0.873)	Data Time 0.003 (0.009)	Loss 3.3383 (3.6351)	Entropy 1.33683 (1.35681)	Top-1 acc 46.875 (38.323)	Top-5 acc 67.578 (62.318)	lr 0.02430
Train [13][2620/3239]	Time 0.608 (0.873)	Data Time 0.001 (0.009)	Loss 3.6530 (3.6352)	Entropy 1.33679 (1.35673)	Top-1 acc 37.109 (38.320)	Top-5 acc 62.891 (62.318)	lr 0.02430
Train [13][2630/3239]	Time 0.594 (0.873)	Data Time 0.001 (0.009)	Loss 3.8795 (3.6353)	Entropy 1.33652 (1.35665)	Top-1 acc 33.984 (38.321)	Top-5 acc 56.250 (62.317)	lr 0.02430
Train [13][2640/3239]	Time 0.614 (0.872)	Data Time 0.001 (0.009)	Loss 3.5455 (3.6352)	Entropy 1.33665 (1.35658)	Top-1 acc 38.672 (38.323)	Top-5 acc 62.891 (62.319)	lr 0.02430
Train [13][2650/3239]	Time 0.549 (0.872)	Data Time 0.001 (0.009)	Loss 3.7764 (3.6350)	Entropy 1.33646 (1.35650)	Top-1 acc 35.938 (38.321)	Top-5 acc 60.938 (62.323)	lr 0.02430
Train [13][2660/3239]	Time 0.545 (0.872)	Data Time 0.001 (0.009)	Loss 3.6122 (3.6348)	Entropy 1.33598 (1.35643)	Top-1 acc 32.031 (38.321)	Top-5 acc 65.234 (62.332)	lr 0.02430
Train [13][2670/3239]	Time 0.587 (0.872)	Data Time 0.001 (0.009)	Loss 3.5483 (3.6349)	Entropy 1.33601 (1.35635)	Top-1 acc 38.281 (38.318)	Top-5 acc 63.672 (62.328)	lr 0.02430
Train [13][2680/3239]	Time 0.574 (0.872)	Data Time 0.001 (0.009)	Loss 3.4379 (3.6348)	Entropy 1.33563 (1.35627)	Top-1 acc 42.969 (38.321)	Top-5 acc 66.016 (62.329)	lr 0.02430
Train [13][2690/3239]	Time 0.571 (0.872)	Data Time 0.001 (0.009)	Loss 3.7738 (3.6348)	Entropy 1.33499 (1.35620)	Top-1 acc 34.375 (38.321)	Top-5 acc 60.547 (62.332)	lr 0.02430
Train [13][2700/3239]	Time 0.593 (0.871)	Data Time 0.001 (0.009)	Loss 3.7180 (3.6351)	Entropy 1.33507 (1.35612)	Top-1 acc 37.500 (38.320)	Top-5 acc 63.281 (62.329)	lr 0.02430
Train [13][2710/3239]	Time 0.635 (0.871)	Data Time 0.001 (0.009)	Loss 3.5677 (3.6349)	Entropy 1.33478 (1.35604)	Top-1 acc 40.625 (38.322)	Top-5 acc 63.281 (62.330)	lr 0.02430
Train [13][2720/3239]	Time 0.595 (0.871)	Data Time 0.001 (0.009)	Loss 3.4461 (3.6347)	Entropy 1.33437 (1.35596)	Top-1 acc 41.406 (38.319)	Top-5 acc 66.797 (62.333)	lr 0.02430
Train [13][2730/3239]	Time 0.625 (0.871)	Data Time 0.002 (0.009)	Loss 3.6551 (3.6346)	Entropy 1.33411 (1.35588)	Top-1 acc 36.719 (38.324)	Top-5 acc 60.938 (62.336)	lr 0.02430
Train [13][2740/3239]	Time 0.591 (0.871)	Data Time 0.001 (0.009)	Loss 3.6754 (3.6345)	Entropy 1.33379 (1.35580)	Top-1 acc 30.859 (38.323)	Top-5 acc 64.062 (62.338)	lr 0.02430
Train [13][2750/3239]	Time 0.738 (0.871)	Data Time 0.001 (0.009)	Loss 3.4884 (3.6347)	Entropy 1.33296 (1.35572)	Top-1 acc 39.062 (38.318)	Top-5 acc 66.406 (62.335)	lr 0.02430
Train [13][2760/3239]	Time 0.594 (0.871)	Data Time 0.001 (0.009)	Loss 3.5739 (3.6347)	Entropy 1.33246 (1.35564)	Top-1 acc 33.984 (38.315)	Top-5 acc 66.016 (62.335)	lr 0.02430
Train [13][2770/3239]	Time 0.611 (0.871)	Data Time 0.001 (0.009)	Loss 3.3912 (3.6343)	Entropy 1.33198 (1.35555)	Top-1 acc 46.875 (38.324)	Top-5 acc 67.578 (62.341)	lr 0.02430
Train [13][2780/3239]	Time 0.560 (0.871)	Data Time 0.001 (0.009)	Loss 3.5611 (3.6341)	Entropy 1.33211 (1.35547)	Top-1 acc 37.891 (38.328)	Top-5 acc 66.016 (62.345)	lr 0.02430
Train [13][2790/3239]	Time 0.589 (0.871)	Data Time 0.001 (0.009)	Loss 3.5991 (3.6340)	Entropy 1.33216 (1.35539)	Top-1 acc 39.844 (38.331)	Top-5 acc 66.797 (62.349)	lr 0.02430
Train [13][2800/3239]	Time 0.660 (0.871)	Data Time 0.001 (0.009)	Loss 3.5541 (3.6339)	Entropy 1.33202 (1.35530)	Top-1 acc 37.500 (38.332)	Top-5 acc 62.891 (62.352)	lr 0.02430
Train [13][2810/3239]	Time 0.600 (0.870)	Data Time 0.001 (0.009)	Loss 3.5571 (3.6339)	Entropy 1.33219 (1.35522)	Top-1 acc 41.016 (38.331)	Top-5 acc 64.453 (62.348)	lr 0.02430
Train [13][2820/3239]	Time 0.684 (0.870)	Data Time 0.001 (0.009)	Loss 3.5019 (3.6338)	Entropy 1.33178 (1.35514)	Top-1 acc 39.844 (38.337)	Top-5 acc 62.891 (62.351)	lr 0.02430
Train [13][2830/3239]	Time 0.459 (0.870)	Data Time 0.001 (0.009)	Loss 3.8586 (3.6336)	Entropy 1.33139 (1.35505)	Top-1 acc 32.031 (38.342)	Top-5 acc 55.469 (62.355)	lr 0.02430
Train [13][2840/3239]	Time 0.586 (0.870)	Data Time 0.001 (0.009)	Loss 3.5489 (3.6336)	Entropy 1.33114 (1.35497)	Top-1 acc 41.406 (38.344)	Top-5 acc 64.062 (62.356)	lr 0.02430
Train [13][2850/3239]	Time 0.583 (0.870)	Data Time 0.001 (0.009)	Loss 3.4412 (3.6333)	Entropy 1.33091 (1.35489)	Top-1 acc 42.188 (38.348)	Top-5 acc 67.188 (62.362)	lr 0.02430
Train [13][2860/3239]	Time 0.630 (0.870)	Data Time 0.001 (0.009)	Loss 3.5796 (3.6334)	Entropy 1.33111 (1.35480)	Top-1 acc 40.234 (38.346)	Top-5 acc 64.062 (62.362)	lr 0.02430
Train [13][2870/3239]	Time 0.619 (0.870)	Data Time 0.001 (0.009)	Loss 3.8524 (3.6333)	Entropy 1.33103 (1.35472)	Top-1 acc 37.109 (38.350)	Top-5 acc 59.375 (62.365)	lr 0.02430
Train [13][2880/3239]	Time 0.582 (0.869)	Data Time 0.001 (0.009)	Loss 3.6519 (3.6333)	Entropy 1.33055 (1.35464)	Top-1 acc 39.453 (38.351)	Top-5 acc 61.328 (62.362)	lr 0.02430
Train [13][2890/3239]	Time 0.709 (0.869)	Data Time 0.002 (0.009)	Loss 3.4654 (3.6329)	Entropy 1.33034 (1.35455)	Top-1 acc 41.016 (38.359)	Top-5 acc 65.625 (62.370)	lr 0.02429
Train [13][2900/3239]	Time 0.530 (0.869)	Data Time 0.001 (0.008)	Loss 3.5883 (3.6330)	Entropy 1.33027 (1.35447)	Top-1 acc 38.281 (38.357)	Top-5 acc 62.891 (62.368)	lr 0.02429
Train [13][2910/3239]	Time 0.580 (0.869)	Data Time 0.001 (0.008)	Loss 3.5441 (3.6329)	Entropy 1.33022 (1.35439)	Top-1 acc 36.328 (38.357)	Top-5 acc 64.844 (62.371)	lr 0.02429
Train [13][2920/3239]	Time 0.650 (0.869)	Data Time 0.001 (0.008)	Loss 3.6341 (3.6329)	Entropy 1.33063 (1.35431)	Top-1 acc 36.328 (38.352)	Top-5 acc 60.547 (62.373)	lr 0.02429
Train [13][2930/3239]	Time 0.546 (0.869)	Data Time 0.001 (0.008)	Loss 3.6144 (3.6326)	Entropy 1.33034 (1.35422)	Top-1 acc 39.844 (38.359)	Top-5 acc 61.719 (62.380)	lr 0.02429
Train [13][2940/3239]	Time 0.619 (0.869)	Data Time 0.001 (0.008)	Loss 3.7553 (3.6327)	Entropy 1.33015 (1.35414)	Top-1 acc 35.938 (38.357)	Top-5 acc 59.766 (62.376)	lr 0.02429
Train [13][2950/3239]	Time 0.531 (0.869)	Data Time 0.001 (0.008)	Loss 3.6349 (3.6329)	Entropy 1.32985 (1.35406)	Top-1 acc 37.109 (38.350)	Top-5 acc 64.844 (62.375)	lr 0.02429
Train [13][2960/3239]	Time 0.715 (0.869)	Data Time 0.001 (0.008)	Loss 3.5755 (3.6326)	Entropy 1.33026 (1.35398)	Top-1 acc 37.500 (38.359)	Top-5 acc 61.719 (62.384)	lr 0.02429
Train [13][2970/3239]	Time 0.558 (0.869)	Data Time 0.001 (0.008)	Loss 3.5927 (3.6325)	Entropy 1.33025 (1.35390)	Top-1 acc 36.719 (38.357)	Top-5 acc 61.719 (62.385)	lr 0.02429
Train [13][2980/3239]	Time 0.618 (0.868)	Data Time 0.001 (0.008)	Loss 3.5285 (3.6324)	Entropy 1.33002 (1.35382)	Top-1 acc 43.359 (38.362)	Top-5 acc 66.016 (62.386)	lr 0.02429
Train [13][2990/3239]	Time 0.548 (0.868)	Data Time 0.001 (0.008)	Loss 3.6965 (3.6322)	Entropy 1.32980 (1.35374)	Top-1 acc 41.016 (38.366)	Top-5 acc 61.328 (62.391)	lr 0.02429
Train [13][3000/3239]	Time 0.538 (0.868)	Data Time 0.001 (0.008)	Loss 3.7548 (3.6323)	Entropy 1.32972 (1.35366)	Top-1 acc 37.500 (38.364)	Top-5 acc 59.766 (62.386)	lr 0.02429
Train [13][3010/3239]	Time 0.793 (0.874)	Data Time 0.008 (0.008)	Loss 3.6550 (3.6323)	Entropy 1.32956 (1.35358)	Top-1 acc 34.375 (38.362)	Top-5 acc 59.766 (62.387)	lr 0.02429
Train [13][3020/3239]	Time 0.584 (0.874)	Data Time 0.002 (0.008)	Loss 3.7386 (3.6322)	Entropy 1.32929 (1.35350)	Top-1 acc 37.891 (38.364)	Top-5 acc 58.594 (62.388)	lr 0.02429
Train [13][3030/3239]	Time 0.548 (0.874)	Data Time 0.001 (0.008)	Loss 3.5552 (3.6320)	Entropy 1.32914 (1.35342)	Top-1 acc 40.234 (38.370)	Top-5 acc 64.062 (62.391)	lr 0.02429
Train [13][3040/3239]	Time 0.570 (0.874)	Data Time 0.001 (0.008)	Loss 3.8001 (3.6319)	Entropy 1.32914 (1.35334)	Top-1 acc 34.375 (38.368)	Top-5 acc 58.594 (62.390)	lr 0.02429
Train [13][3050/3239]	Time 0.561 (0.874)	Data Time 0.001 (0.008)	Loss 3.4008 (3.6316)	Entropy 1.32935 (1.35326)	Top-1 acc 42.578 (38.373)	Top-5 acc 66.406 (62.395)	lr 0.02429
Train [13][3060/3239]	Time 0.555 (0.874)	Data Time 0.001 (0.008)	Loss 3.5054 (3.6317)	Entropy 1.32913 (1.35318)	Top-1 acc 41.406 (38.371)	Top-5 acc 63.281 (62.394)	lr 0.02429
Train [13][3070/3239]	Time 0.594 (0.874)	Data Time 0.001 (0.008)	Loss 3.7180 (3.6317)	Entropy 1.32940 (1.35311)	Top-1 acc 37.891 (38.371)	Top-5 acc 60.938 (62.394)	lr 0.02429
Train [13][3080/3239]	Time 0.590 (0.874)	Data Time 0.001 (0.008)	Loss 3.7325 (3.6318)	Entropy 1.32934 (1.35303)	Top-1 acc 33.984 (38.367)	Top-5 acc 59.766 (62.391)	lr 0.02429
Train [13][3090/3239]	Time 0.640 (0.874)	Data Time 0.002 (0.008)	Loss 3.7209 (3.6318)	Entropy 1.32925 (1.35295)	Top-1 acc 35.156 (38.363)	Top-5 acc 57.812 (62.390)	lr 0.02429
Train [13][3100/3239]	Time 0.542 (0.874)	Data Time 0.001 (0.008)	Loss 3.8145 (3.6318)	Entropy 1.32934 (1.35288)	Top-1 acc 34.375 (38.363)	Top-5 acc 59.766 (62.388)	lr 0.02429
Train [13][3110/3239]	Time 0.596 (0.873)	Data Time 0.001 (0.008)	Loss 3.6370 (3.6320)	Entropy 1.32953 (1.35280)	Top-1 acc 39.844 (38.357)	Top-5 acc 65.234 (62.387)	lr 0.02429
Train [13][3120/3239]	Time 0.686 (0.873)	Data Time 0.001 (0.008)	Loss 3.7172 (3.6323)	Entropy 1.32926 (1.35273)	Top-1 acc 37.891 (38.354)	Top-5 acc 62.500 (62.382)	lr 0.02429
Train [13][3130/3239]	Time 0.598 (0.873)	Data Time 0.002 (0.008)	Loss 3.4823 (3.6322)	Entropy 1.32904 (1.35265)	Top-1 acc 43.750 (38.352)	Top-5 acc 65.234 (62.384)	lr 0.02429
Train [13][3140/3239]	Time 0.578 (0.873)	Data Time 0.001 (0.008)	Loss 3.6246 (3.6320)	Entropy 1.32909 (1.35257)	Top-1 acc 36.328 (38.355)	Top-5 acc 61.719 (62.389)	lr 0.02429
Train [13][3150/3239]	Time 0.641 (0.873)	Data Time 0.003 (0.008)	Loss 3.5020 (3.6320)	Entropy 1.32878 (1.35250)	Top-1 acc 39.062 (38.353)	Top-5 acc 67.578 (62.390)	lr 0.02429
Train [13][3160/3239]	Time 0.573 (0.873)	Data Time 0.001 (0.008)	Loss 3.7625 (3.6320)	Entropy 1.32843 (1.35242)	Top-1 acc 38.281 (38.353)	Top-5 acc 59.766 (62.390)	lr 0.02429
Train [13][3170/3239]	Time 0.608 (0.873)	Data Time 0.001 (0.008)	Loss 3.5222 (3.6319)	Entropy 1.32844 (1.35235)	Top-1 acc 41.406 (38.352)	Top-5 acc 65.625 (62.388)	lr 0.02429
Train [13][3180/3239]	Time 0.633 (0.873)	Data Time 0.000 (0.008)	Loss 3.6440 (3.6318)	Entropy 1.32847 (1.35227)	Top-1 acc 38.281 (38.358)	Top-5 acc 62.109 (62.390)	lr 0.02429
Train [13][3190/3239]	Time 0.686 (0.872)	Data Time 0.000 (0.008)	Loss 3.6706 (3.6318)	Entropy 1.32855 (1.35220)	Top-1 acc 39.062 (38.357)	Top-5 acc 61.719 (62.389)	lr 0.02428
Train [13][3200/3239]	Time 0.567 (0.872)	Data Time 0.000 (0.008)	Loss 3.6252 (3.6317)	Entropy 1.32818 (1.35213)	Top-1 acc 40.234 (38.357)	Top-5 acc 62.500 (62.393)	lr 0.02428
Train [13][3210/3239]	Time 0.568 (0.872)	Data Time 0.000 (0.008)	Loss 3.4930 (3.6315)	Entropy 1.32800 (1.35205)	Top-1 acc 40.234 (38.364)	Top-5 acc 63.281 (62.394)	lr 0.02428
Train [13][3220/3239]	Time 0.581 (0.872)	Data Time 0.000 (0.008)	Loss 3.7609 (3.6314)	Entropy 1.32754 (1.35198)	Top-1 acc 36.328 (38.367)	Top-5 acc 58.203 (62.396)	lr 0.02428
Train [13][3230/3239]	Time 0.627 (0.872)	Data Time 0.000 (0.008)	Loss 3.7223 (3.6316)	Entropy 1.32756 (1.35190)	Top-1 acc 35.938 (38.366)	Top-5 acc 61.328 (62.393)	lr 0.02428
Train [13][3239/3239]	Time 1.575 (0.872)	Data Time 0.000 (0.008)	Loss 3.4829 (3.6316)	Entropy 1.32753 (1.35183)	Top-1 acc 46.914 (38.364)	Top-5 acc 62.963 (62.391)	lr 0.02428
==========Valid [13/120]	loss 2.394	top-1 acc 48.273 (48.273)	top-5 acc 72.320	Train top-1 38.364	top-5 62.391	Entropy 1.32753	Latency-None: 0.000ms	Flops: 542.77M
Train [14][0/3239]	Time 22.130 (22.130)	Data Time 19.395 (19.395)	Loss 3.7653 (3.7653)	Entropy 1.32767 (1.32767)	Top-1 acc 34.766 (34.766)	Top-5 acc 59.766 (59.766)	lr 0.02428
Train [14][10/3239]	Time 0.603 (2.811)	Data Time 0.001 (1.765)	Loss 3.4515 (3.5999)	Entropy 1.32744 (1.32759)	Top-1 acc 43.359 (39.098)	Top-5 acc 66.406 (63.459)	lr 0.02428
Train [14][20/3239]	Time 0.689 (1.878)	Data Time 0.001 (0.925)	Loss 3.6534 (3.6134)	Entropy 1.32719 (1.32753)	Top-1 acc 36.719 (38.616)	Top-5 acc 64.844 (63.635)	lr 0.02428
Train [14][30/3239]	Time 0.587 (1.546)	Data Time 0.001 (0.627)	Loss 3.6829 (3.6235)	Entropy 1.32705 (1.32745)	Top-1 acc 37.500 (38.760)	Top-5 acc 57.812 (63.193)	lr 0.02428
Train [14][40/3239]	Time 0.592 (1.374)	Data Time 0.002 (0.475)	Loss 3.9949 (3.6307)	Entropy 1.32670 (1.32733)	Top-1 acc 30.469 (38.510)	Top-5 acc 51.562 (62.681)	lr 0.02428
Train [14][50/3239]	Time 0.613 (1.269)	Data Time 0.001 (0.382)	Loss 3.6791 (3.6260)	Entropy 1.32634 (1.32717)	Top-1 acc 40.234 (38.672)	Top-5 acc 58.203 (62.623)	lr 0.02428
Train [14][60/3239]	Time 0.589 (1.200)	Data Time 0.001 (0.320)	Loss 3.6187 (3.6258)	Entropy 1.32621 (1.32703)	Top-1 acc 37.500 (38.717)	Top-5 acc 62.891 (62.724)	lr 0.02428
Train [14][70/3239]	Time 0.349 (1.146)	Data Time 0.001 (0.275)	Loss 3.5862 (3.6280)	Entropy 1.32629 (1.32692)	Top-1 acc 38.672 (38.639)	Top-5 acc 63.672 (62.616)	lr 0.02428
Train [14][80/3239]	Time 0.583 (1.114)	Data Time 0.001 (0.243)	Loss 3.6468 (3.6231)	Entropy 1.32627 (1.32682)	Top-1 acc 37.891 (38.768)	Top-5 acc 61.719 (62.727)	lr 0.02428
Train [14][90/3239]	Time 0.566 (1.091)	Data Time 0.001 (0.216)	Loss 3.6889 (3.6200)	Entropy 1.32647 (1.32677)	Top-1 acc 37.891 (38.814)	Top-5 acc 60.547 (62.736)	lr 0.02428
Train [14][100/3239]	Time 0.581 (1.062)	Data Time 0.001 (0.195)	Loss 3.6369 (3.6170)	Entropy 1.32566 (1.32671)	Top-1 acc 37.500 (38.846)	Top-5 acc 59.375 (62.798)	lr 0.02428
Train [14][110/3239]	Time 0.586 (1.043)	Data Time 0.001 (0.177)	Loss 3.6925 (3.6213)	Entropy 1.32549 (1.32662)	Top-1 acc 35.938 (38.739)	Top-5 acc 64.062 (62.746)	lr 0.02428
Train [14][120/3239]	Time 0.567 (1.026)	Data Time 0.001 (0.163)	Loss 3.6532 (3.6212)	Entropy 1.32525 (1.32652)	Top-1 acc 37.109 (38.743)	Top-5 acc 64.062 (62.774)	lr 0.02428
Train [14][130/3239]	Time 0.572 (1.012)	Data Time 0.001 (0.151)	Loss 3.6463 (3.6235)	Entropy 1.32510 (1.32642)	Top-1 acc 37.500 (38.627)	Top-5 acc 59.766 (62.691)	lr 0.02428
Train [14][140/3239]	Time 0.607 (0.999)	Data Time 0.001 (0.140)	Loss 3.6275 (3.6193)	Entropy 1.32521 (1.32633)	Top-1 acc 39.844 (38.774)	Top-5 acc 62.109 (62.747)	lr 0.02428
Train [14][150/3239]	Time 0.538 (0.989)	Data Time 0.001 (0.131)	Loss 3.6513 (3.6176)	Entropy 1.32519 (1.32627)	Top-1 acc 37.891 (38.837)	Top-5 acc 62.109 (62.787)	lr 0.02428
Train [14][160/3239]	Time 0.711 (0.980)	Data Time 0.001 (0.123)	Loss 3.6362 (3.6202)	Entropy 1.32454 (1.32619)	Top-1 acc 37.891 (38.791)	Top-5 acc 62.891 (62.706)	lr 0.02428
Train [14][170/3239]	Time 0.662 (0.972)	Data Time 0.001 (0.116)	Loss 3.5941 (3.6185)	Entropy 1.32442 (1.32609)	Top-1 acc 35.547 (38.793)	Top-5 acc 64.062 (62.747)	lr 0.02428
Train [14][180/3239]	Time 0.580 (0.965)	Data Time 0.001 (0.110)	Loss 3.5845 (3.6177)	Entropy 1.32380 (1.32599)	Top-1 acc 40.234 (38.797)	Top-5 acc 62.891 (62.796)	lr 0.02428
Train [14][190/3239]	Time 0.548 (0.958)	Data Time 0.001 (0.104)	Loss 3.9531 (3.6173)	Entropy 1.32352 (1.32587)	Top-1 acc 30.078 (38.756)	Top-5 acc 57.812 (62.866)	lr 0.02428
Train [14][200/3239]	Time 0.616 (0.952)	Data Time 0.001 (0.099)	Loss 3.5067 (3.6175)	Entropy 1.32352 (1.32576)	Top-1 acc 39.844 (38.755)	Top-5 acc 63.672 (62.825)	lr 0.02428
Train [14][210/3239]	Time 0.596 (0.947)	Data Time 0.001 (0.094)	Loss 3.6503 (3.6171)	Entropy 1.32381 (1.32565)	Top-1 acc 40.234 (38.753)	Top-5 acc 61.719 (62.867)	lr 0.02428
Train [14][220/3239]	Time 0.587 (0.942)	Data Time 0.001 (0.090)	Loss 3.7966 (3.6184)	Entropy 1.32364 (1.32557)	Top-1 acc 34.375 (38.755)	Top-5 acc 61.328 (62.848)	lr 0.02428
Train [14][230/3239]	Time 0.574 (0.938)	Data Time 0.001 (0.086)	Loss 3.5940 (3.6170)	Entropy 1.32333 (1.32548)	Top-1 acc 39.062 (38.763)	Top-5 acc 65.625 (62.858)	lr 0.02428
Train [14][240/3239]	Time 0.580 (0.934)	Data Time 0.001 (0.083)	Loss 3.7326 (3.6139)	Entropy 1.32317 (1.32539)	Top-1 acc 35.156 (38.802)	Top-5 acc 62.891 (62.930)	lr 0.02427
Train [14][250/3239]	Time 0.599 (0.929)	Data Time 0.001 (0.080)	Loss 3.5822 (3.6139)	Entropy 1.32301 (1.32530)	Top-1 acc 35.938 (38.842)	Top-5 acc 62.500 (62.919)	lr 0.02427
Train [14][260/3239]	Time 0.570 (0.925)	Data Time 0.001 (0.077)	Loss 3.6047 (3.6099)	Entropy 1.32263 (1.32520)	Top-1 acc 38.281 (38.901)	Top-5 acc 61.328 (62.991)	lr 0.02427
Train [14][270/3239]	Time 0.597 (0.920)	Data Time 0.001 (0.074)	Loss 3.5288 (3.6087)	Entropy 1.32219 (1.32511)	Top-1 acc 45.312 (38.904)	Top-5 acc 65.234 (63.012)	lr 0.02427
Train [14][280/3239]	Time 0.596 (0.916)	Data Time 0.001 (0.071)	Loss 3.4648 (3.6089)	Entropy 1.32194 (1.32501)	Top-1 acc 40.625 (38.903)	Top-5 acc 64.844 (62.982)	lr 0.02427
Train [14][290/3239]	Time 0.591 (0.913)	Data Time 0.003 (0.069)	Loss 3.8046 (3.6103)	Entropy 1.32173 (1.32490)	Top-1 acc 36.328 (38.857)	Top-5 acc 58.594 (62.990)	lr 0.02427
Train [14][300/3239]	Time 0.622 (0.911)	Data Time 0.001 (0.067)	Loss 3.7257 (3.6103)	Entropy 1.32136 (1.32479)	Top-1 acc 37.109 (38.867)	Top-5 acc 59.375 (62.983)	lr 0.02427
Train [14][310/3239]	Time 0.554 (0.909)	Data Time 0.001 (0.065)	Loss 3.4457 (3.6084)	Entropy 1.32086 (1.32467)	Top-1 acc 45.703 (38.904)	Top-5 acc 67.578 (63.044)	lr 0.02427
Train [14][320/3239]	Time 0.694 (0.906)	Data Time 0.001 (0.063)	Loss 3.5425 (3.6071)	Entropy 1.32074 (1.32455)	Top-1 acc 35.547 (38.897)	Top-5 acc 66.016 (63.080)	lr 0.02427
Train [14][330/3239]	Time 0.628 (0.904)	Data Time 0.001 (0.061)	Loss 3.5817 (3.6065)	Entropy 1.32011 (1.32443)	Top-1 acc 38.281 (38.890)	Top-5 acc 64.453 (63.111)	lr 0.02427
Train [14][340/3239]	Time 0.612 (0.902)	Data Time 0.002 (0.059)	Loss 3.4858 (3.6052)	Entropy 1.32034 (1.32430)	Top-1 acc 38.672 (38.911)	Top-5 acc 65.234 (63.132)	lr 0.02427
Train [14][350/3239]	Time 0.553 (0.900)	Data Time 0.001 (0.057)	Loss 3.7656 (3.6070)	Entropy 1.32003 (1.32419)	Top-1 acc 35.938 (38.877)	Top-5 acc 60.938 (63.093)	lr 0.02427
Train [14][360/3239]	Time 0.633 (0.899)	Data Time 0.001 (0.056)	Loss 3.7976 (3.6071)	Entropy 1.31982 (1.32407)	Top-1 acc 32.031 (38.824)	Top-5 acc 58.594 (63.079)	lr 0.02427
Train [14][370/3239]	Time 0.547 (0.897)	Data Time 0.002 (0.055)	Loss 3.3326 (3.6067)	Entropy 1.31970 (1.32395)	Top-1 acc 41.797 (38.842)	Top-5 acc 67.578 (63.099)	lr 0.02427
Train [14][380/3239]	Time 0.607 (0.896)	Data Time 0.001 (0.053)	Loss 3.4580 (3.6045)	Entropy 1.31968 (1.32384)	Top-1 acc 39.844 (38.872)	Top-5 acc 64.844 (63.143)	lr 0.02427
Train [14][390/3239]	Time 0.619 (0.894)	Data Time 0.001 (0.052)	Loss 3.7036 (3.6053)	Entropy 1.31950 (1.32373)	Top-1 acc 39.062 (38.899)	Top-5 acc 63.672 (63.129)	lr 0.02427
Train [14][400/3239]	Time 0.585 (0.893)	Data Time 0.001 (0.051)	Loss 3.6560 (3.6046)	Entropy 1.31907 (1.32362)	Top-1 acc 38.672 (38.953)	Top-5 acc 62.109 (63.125)	lr 0.02427
Train [14][410/3239]	Time 0.624 (0.892)	Data Time 0.001 (0.050)	Loss 3.8763 (3.6054)	Entropy 1.31831 (1.32350)	Top-1 acc 33.984 (38.927)	Top-5 acc 55.859 (63.077)	lr 0.02427
Train [14][420/3239]	Time 0.644 (0.890)	Data Time 0.001 (0.048)	Loss 3.5446 (3.6038)	Entropy 1.31808 (1.32338)	Top-1 acc 42.578 (38.983)	Top-5 acc 65.234 (63.114)	lr 0.02427
Train [14][430/3239]	Time 0.576 (0.934)	Data Time 0.002 (0.047)	Loss 3.7436 (3.6041)	Entropy 1.31779 (1.32325)	Top-1 acc 35.156 (38.964)	Top-5 acc 60.156 (63.102)	lr 0.02427
Train [14][440/3239]	Time 0.574 (0.932)	Data Time 0.001 (0.046)	Loss 3.4429 (3.6039)	Entropy 1.31749 (1.32313)	Top-1 acc 41.016 (38.937)	Top-5 acc 66.406 (63.105)	lr 0.02427
Train [14][450/3239]	Time 0.613 (0.930)	Data Time 0.001 (0.045)	Loss 3.5285 (3.6017)	Entropy 1.31728 (1.32300)	Top-1 acc 38.672 (38.988)	Top-5 acc 64.062 (63.163)	lr 0.02427
Train [14][460/3239]	Time 0.622 (0.928)	Data Time 0.003 (0.045)	Loss 3.6196 (3.6017)	Entropy 1.31685 (1.32287)	Top-1 acc 36.719 (38.978)	Top-5 acc 60.938 (63.165)	lr 0.02427
Train [14][470/3239]	Time 0.551 (0.926)	Data Time 0.001 (0.044)	Loss 3.6902 (3.6022)	Entropy 1.31637 (1.32274)	Top-1 acc 37.891 (38.983)	Top-5 acc 60.547 (63.149)	lr 0.02427
Train [14][480/3239]	Time 0.594 (0.924)	Data Time 0.001 (0.043)	Loss 3.6043 (3.6024)	Entropy 1.31613 (1.32260)	Top-1 acc 39.844 (38.999)	Top-5 acc 64.844 (63.129)	lr 0.02427
Train [14][490/3239]	Time 0.580 (0.923)	Data Time 0.001 (0.042)	Loss 3.6208 (3.6039)	Entropy 1.31558 (1.32247)	Top-1 acc 35.547 (38.946)	Top-5 acc 60.156 (63.087)	lr 0.02427
Train [14][500/3239]	Time 0.576 (0.921)	Data Time 0.002 (0.041)	Loss 3.7398 (3.6057)	Entropy 1.31549 (1.32233)	Top-1 acc 37.891 (38.911)	Top-5 acc 58.594 (63.063)	lr 0.02427
Train [14][510/3239]	Time 0.571 (0.920)	Data Time 0.001 (0.040)	Loss 3.5612 (3.6050)	Entropy 1.31530 (1.32219)	Top-1 acc 39.453 (38.931)	Top-5 acc 66.406 (63.096)	lr 0.02427
Train [14][520/3239]	Time 0.612 (0.918)	Data Time 0.003 (0.040)	Loss 3.4816 (3.6050)	Entropy 1.31545 (1.32206)	Top-1 acc 41.797 (38.926)	Top-5 acc 65.625 (63.087)	lr 0.02427
Train [14][530/3239]	Time 0.580 (0.917)	Data Time 0.001 (0.039)	Loss 3.7682 (3.6053)	Entropy 1.31536 (1.32194)	Top-1 acc 33.203 (38.919)	Top-5 acc 60.938 (63.080)	lr 0.02427
Train [14][540/3239]	Time 0.637 (0.916)	Data Time 0.001 (0.038)	Loss 3.4603 (3.6039)	Entropy 1.31536 (1.32181)	Top-1 acc 41.016 (38.925)	Top-5 acc 65.234 (63.100)	lr 0.02426
Train [14][550/3239]	Time 0.674 (0.914)	Data Time 0.001 (0.038)	Loss 3.4869 (3.6037)	Entropy 1.31542 (1.32170)	Top-1 acc 42.578 (38.941)	Top-5 acc 66.406 (63.098)	lr 0.02426
Train [14][560/3239]	Time 0.485 (0.913)	Data Time 0.001 (0.037)	Loss 3.5239 (3.6038)	Entropy 1.31517 (1.32159)	Top-1 acc 41.016 (38.945)	Top-5 acc 67.188 (63.115)	lr 0.02426
Train [14][570/3239]	Time 0.619 (0.911)	Data Time 0.001 (0.036)	Loss 3.7574 (3.6052)	Entropy 1.31495 (1.32147)	Top-1 acc 32.031 (38.904)	Top-5 acc 57.422 (63.066)	lr 0.02426
Train [14][580/3239]	Time 0.624 (0.909)	Data Time 0.001 (0.036)	Loss 3.6636 (3.6045)	Entropy 1.31455 (1.32136)	Top-1 acc 39.062 (38.913)	Top-5 acc 64.453 (63.102)	lr 0.02426
Train [14][590/3239]	Time 0.585 (0.908)	Data Time 0.001 (0.035)	Loss 3.6616 (3.6048)	Entropy 1.31444 (1.32124)	Top-1 acc 37.891 (38.930)	Top-5 acc 60.547 (63.092)	lr 0.02426
Train [14][600/3239]	Time 0.569 (0.907)	Data Time 0.001 (0.035)	Loss 3.6588 (3.6045)	Entropy 1.31456 (1.32113)	Top-1 acc 35.938 (38.923)	Top-5 acc 64.844 (63.106)	lr 0.02426
Train [14][610/3239]	Time 0.596 (0.906)	Data Time 0.001 (0.034)	Loss 3.4283 (3.6044)	Entropy 1.31493 (1.32103)	Top-1 acc 45.703 (38.937)	Top-5 acc 67.188 (63.103)	lr 0.02426
Train [14][620/3239]	Time 0.700 (0.905)	Data Time 0.001 (0.034)	Loss 3.5221 (3.6039)	Entropy 1.31477 (1.32093)	Top-1 acc 38.281 (38.947)	Top-5 acc 64.062 (63.116)	lr 0.02426
Train [14][630/3239]	Time 0.594 (0.904)	Data Time 0.001 (0.033)	Loss 3.7000 (3.6040)	Entropy 1.31435 (1.32083)	Top-1 acc 34.766 (38.957)	Top-5 acc 61.719 (63.102)	lr 0.02426
Train [14][640/3239]	Time 0.615 (0.903)	Data Time 0.002 (0.033)	Loss 3.5490 (3.6051)	Entropy 1.31384 (1.32072)	Top-1 acc 41.406 (38.952)	Top-5 acc 63.281 (63.086)	lr 0.02426
Train [14][650/3239]	Time 0.620 (0.902)	Data Time 0.001 (0.032)	Loss 3.5979 (3.6054)	Entropy 1.31377 (1.32062)	Top-1 acc 41.016 (38.951)	Top-5 acc 61.719 (63.071)	lr 0.02426
Train [14][660/3239]	Time 0.549 (0.902)	Data Time 0.001 (0.032)	Loss 3.4699 (3.6053)	Entropy 1.31355 (1.32051)	Top-1 acc 44.531 (38.953)	Top-5 acc 64.453 (63.079)	lr 0.02426
Train [14][670/3239]	Time 0.581 (0.900)	Data Time 0.001 (0.031)	Loss 3.9451 (3.6058)	Entropy 1.31304 (1.32041)	Top-1 acc 36.328 (38.942)	Top-5 acc 55.078 (63.052)	lr 0.02426
Train [14][680/3239]	Time 0.569 (0.899)	Data Time 0.001 (0.031)	Loss 3.6935 (3.6058)	Entropy 1.31270 (1.32030)	Top-1 acc 35.938 (38.937)	Top-5 acc 62.109 (63.045)	lr 0.02426
Train [14][690/3239]	Time 0.691 (0.899)	Data Time 0.002 (0.030)	Loss 3.6927 (3.6068)	Entropy 1.31234 (1.32018)	Top-1 acc 35.156 (38.920)	Top-5 acc 64.453 (63.033)	lr 0.02426
Train [14][700/3239]	Time 0.549 (0.898)	Data Time 0.001 (0.030)	Loss 3.6102 (3.6076)	Entropy 1.31219 (1.32007)	Top-1 acc 37.109 (38.905)	Top-5 acc 63.672 (63.013)	lr 0.02426
Train [14][710/3239]	Time 0.631 (0.897)	Data Time 0.001 (0.030)	Loss 3.5732 (3.6076)	Entropy 1.31229 (1.31996)	Top-1 acc 39.844 (38.896)	Top-5 acc 63.672 (63.009)	lr 0.02426
Train [14][720/3239]	Time 0.421 (0.896)	Data Time 0.002 (0.029)	Loss 3.6660 (3.6072)	Entropy 1.31240 (1.31985)	Top-1 acc 37.500 (38.888)	Top-5 acc 62.109 (63.024)	lr 0.02426
Train [14][730/3239]	Time 0.585 (0.895)	Data Time 0.001 (0.029)	Loss 3.7761 (3.6068)	Entropy 1.31212 (1.31975)	Top-1 acc 39.062 (38.905)	Top-5 acc 60.156 (63.038)	lr 0.02426
Train [14][740/3239]	Time 0.564 (0.894)	Data Time 0.001 (0.029)	Loss 3.6404 (3.6076)	Entropy 1.31186 (1.31965)	Top-1 acc 35.938 (38.875)	Top-5 acc 60.547 (63.019)	lr 0.02426
Train [14][750/3239]	Time 0.597 (0.893)	Data Time 0.001 (0.028)	Loss 3.7544 (3.6085)	Entropy 1.31187 (1.31954)	Top-1 acc 35.547 (38.856)	Top-5 acc 57.031 (62.996)	lr 0.02426
Train [14][760/3239]	Time 0.715 (0.892)	Data Time 0.001 (0.028)	Loss 3.5394 (3.6084)	Entropy 1.31202 (1.31944)	Top-1 acc 42.578 (38.869)	Top-5 acc 64.453 (62.998)	lr 0.02426
Train [14][770/3239]	Time 0.605 (0.892)	Data Time 0.001 (0.027)	Loss 3.5518 (3.6080)	Entropy 1.31186 (1.31935)	Top-1 acc 37.500 (38.867)	Top-5 acc 65.234 (63.008)	lr 0.02426
Train [14][780/3239]	Time 0.599 (0.891)	Data Time 0.001 (0.027)	Loss 3.7777 (3.6076)	Entropy 1.31171 (1.31925)	Top-1 acc 33.984 (38.887)	Top-5 acc 57.422 (63.023)	lr 0.02426
Train [14][790/3239]	Time 0.588 (0.890)	Data Time 0.001 (0.027)	Loss 3.7196 (3.6074)	Entropy 1.31143 (1.31915)	Top-1 acc 35.547 (38.886)	Top-5 acc 58.984 (63.021)	lr 0.02426
Train [14][800/3239]	Time 0.588 (0.890)	Data Time 0.001 (0.027)	Loss 3.3910 (3.6065)	Entropy 1.31121 (1.31906)	Top-1 acc 43.359 (38.911)	Top-5 acc 66.797 (63.036)	lr 0.02426
Train [14][810/3239]	Time 0.609 (0.889)	Data Time 0.001 (0.026)	Loss 3.4069 (3.6063)	Entropy 1.31105 (1.31896)	Top-1 acc 45.703 (38.919)	Top-5 acc 67.188 (63.038)	lr 0.02426
Train [14][820/3239]	Time 0.611 (0.888)	Data Time 0.001 (0.026)	Loss 3.6869 (3.6067)	Entropy 1.31083 (1.31886)	Top-1 acc 38.281 (38.915)	Top-5 acc 64.453 (63.027)	lr 0.02426
Train [14][830/3239]	Time 0.603 (0.888)	Data Time 0.001 (0.026)	Loss 3.6184 (3.6070)	Entropy 1.31045 (1.31876)	Top-1 acc 37.500 (38.919)	Top-5 acc 60.938 (63.010)	lr 0.02425
Train [14][840/3239]	Time 0.554 (0.888)	Data Time 0.001 (0.025)	Loss 3.4495 (3.6069)	Entropy 1.31019 (1.31866)	Top-1 acc 41.016 (38.913)	Top-5 acc 66.406 (63.012)	lr 0.02425
Train [14][850/3239]	Time 0.735 (0.887)	Data Time 0.001 (0.025)	Loss 3.4294 (3.6067)	Entropy 1.31004 (1.31857)	Top-1 acc 45.312 (38.922)	Top-5 acc 64.453 (63.014)	lr 0.02425
Train [14][860/3239]	Time 0.588 (0.887)	Data Time 0.001 (0.025)	Loss 3.5622 (3.6058)	Entropy 1.30993 (1.31847)	Top-1 acc 41.016 (38.930)	Top-5 acc 65.625 (63.043)	lr 0.02425
Train [14][870/3239]	Time 0.620 (0.886)	Data Time 0.001 (0.025)	Loss 3.4628 (3.6053)	Entropy 1.30925 (1.31837)	Top-1 acc 43.359 (38.949)	Top-5 acc 67.969 (63.055)	lr 0.02425
Train [14][880/3239]	Time 0.581 (0.886)	Data Time 0.001 (0.024)	Loss 3.4082 (3.6047)	Entropy 1.30905 (1.31826)	Top-1 acc 43.359 (38.947)	Top-5 acc 66.406 (63.068)	lr 0.02425
Train [14][890/3239]	Time 0.595 (0.885)	Data Time 0.002 (0.024)	Loss 3.7340 (3.6049)	Entropy 1.30890 (1.31816)	Top-1 acc 33.984 (38.942)	Top-5 acc 61.719 (63.066)	lr 0.02425
Train [14][900/3239]	Time 0.555 (0.885)	Data Time 0.001 (0.024)	Loss 3.7764 (3.6052)	Entropy 1.30877 (1.31805)	Top-1 acc 31.641 (38.934)	Top-5 acc 58.594 (63.049)	lr 0.02425
Train [14][910/3239]	Time 0.540 (0.884)	Data Time 0.001 (0.024)	Loss 3.5368 (3.6051)	Entropy 1.30885 (1.31795)	Top-1 acc 41.797 (38.937)	Top-5 acc 64.844 (63.044)	lr 0.02425
Train [14][920/3239]	Time 0.710 (0.883)	Data Time 0.001 (0.023)	Loss 3.8163 (3.6046)	Entropy 1.30820 (1.31785)	Top-1 acc 33.984 (38.944)	Top-5 acc 58.984 (63.053)	lr 0.02425
Train [14][930/3239]	Time 0.559 (0.883)	Data Time 0.001 (0.023)	Loss 3.4587 (3.6038)	Entropy 1.30824 (1.31775)	Top-1 acc 42.578 (38.964)	Top-5 acc 66.797 (63.074)	lr 0.02425
Train [14][940/3239]	Time 0.602 (0.882)	Data Time 0.001 (0.023)	Loss 3.5157 (3.6041)	Entropy 1.30772 (1.31764)	Top-1 acc 38.672 (38.955)	Top-5 acc 60.547 (63.062)	lr 0.02425
Train [14][950/3239]	Time 0.558 (0.882)	Data Time 0.001 (0.023)	Loss 3.5962 (3.6036)	Entropy 1.30755 (1.31754)	Top-1 acc 42.969 (38.966)	Top-5 acc 60.938 (63.070)	lr 0.02425
Train [14][960/3239]	Time 0.629 (0.882)	Data Time 0.001 (0.022)	Loss 3.5613 (3.6042)	Entropy 1.30760 (1.31744)	Top-1 acc 34.375 (38.956)	Top-5 acc 63.672 (63.058)	lr 0.02425
Train [14][970/3239]	Time 0.558 (0.881)	Data Time 0.001 (0.022)	Loss 3.5349 (3.6047)	Entropy 1.30757 (1.31733)	Top-1 acc 40.234 (38.941)	Top-5 acc 60.547 (63.042)	lr 0.02425
Train [14][980/3239]	Time 0.537 (0.881)	Data Time 0.001 (0.022)	Loss 3.8174 (3.6050)	Entropy 1.30746 (1.31724)	Top-1 acc 33.203 (38.933)	Top-5 acc 60.156 (63.028)	lr 0.02425
Train [14][990/3239]	Time 0.729 (0.880)	Data Time 0.001 (0.022)	Loss 3.5740 (3.6054)	Entropy 1.30708 (1.31714)	Top-1 acc 39.062 (38.927)	Top-5 acc 65.234 (63.018)	lr 0.02425
Train [14][1000/3239]	Time 0.579 (0.880)	Data Time 0.001 (0.022)	Loss 3.6439 (3.6052)	Entropy 1.30721 (1.31704)	Top-1 acc 38.672 (38.936)	Top-5 acc 62.891 (63.023)	lr 0.02425
Train [14][1010/3239]	Time 0.592 (0.880)	Data Time 0.001 (0.021)	Loss 3.3766 (3.6048)	Entropy 1.30700 (1.31694)	Top-1 acc 44.531 (38.939)	Top-5 acc 67.578 (63.033)	lr 0.02425
Train [14][1020/3239]	Time 0.646 (0.880)	Data Time 0.001 (0.021)	Loss 3.6363 (3.6049)	Entropy 1.30696 (1.31684)	Top-1 acc 38.672 (38.934)	Top-5 acc 63.281 (63.034)	lr 0.02425
Train [14][1030/3239]	Time 0.582 (0.879)	Data Time 0.001 (0.021)	Loss 3.5944 (3.6053)	Entropy 1.30681 (1.31674)	Top-1 acc 39.453 (38.924)	Top-5 acc 64.062 (63.022)	lr 0.02425
Train [14][1040/3239]	Time 0.601 (0.879)	Data Time 0.001 (0.021)	Loss 3.6231 (3.6056)	Entropy 1.30691 (1.31665)	Top-1 acc 37.109 (38.923)	Top-5 acc 61.719 (63.013)	lr 0.02425
Train [14][1050/3239]	Time 0.576 (0.879)	Data Time 0.001 (0.021)	Loss 3.4949 (3.6049)	Entropy 1.30683 (1.31655)	Top-1 acc 41.016 (38.936)	Top-5 acc 68.359 (63.027)	lr 0.02425
Train [14][1060/3239]	Time 0.676 (0.878)	Data Time 0.001 (0.021)	Loss 3.7042 (3.6048)	Entropy 1.30659 (1.31646)	Top-1 acc 33.594 (38.931)	Top-5 acc 60.156 (63.027)	lr 0.02425
Train [14][1070/3239]	Time 0.574 (0.878)	Data Time 0.001 (0.020)	Loss 3.5551 (3.6046)	Entropy 1.30629 (1.31637)	Top-1 acc 41.406 (38.934)	Top-5 acc 66.406 (63.029)	lr 0.02425
Train [14][1080/3239]	Time 0.751 (0.895)	Data Time 0.006 (0.020)	Loss 3.5200 (3.6042)	Entropy 1.30640 (1.31628)	Top-1 acc 39.453 (38.944)	Top-5 acc 64.844 (63.043)	lr 0.02425
Train [14][1090/3239]	Time 0.596 (0.896)	Data Time 0.002 (0.020)	Loss 3.5250 (3.6043)	Entropy 1.30650 (1.31619)	Top-1 acc 39.844 (38.940)	Top-5 acc 63.672 (63.044)	lr 0.02425
Train [14][1100/3239]	Time 0.616 (0.895)	Data Time 0.004 (0.020)	Loss 3.7117 (3.6043)	Entropy 1.30602 (1.31610)	Top-1 acc 36.719 (38.940)	Top-5 acc 62.109 (63.041)	lr 0.02425
Train [14][1110/3239]	Time 0.598 (0.895)	Data Time 0.001 (0.020)	Loss 3.5734 (3.6040)	Entropy 1.30575 (1.31600)	Top-1 acc 39.453 (38.952)	Top-5 acc 64.453 (63.048)	lr 0.02425
Train [14][1120/3239]	Time 0.653 (0.894)	Data Time 0.003 (0.020)	Loss 3.3520 (3.6035)	Entropy 1.30553 (1.31591)	Top-1 acc 41.406 (38.957)	Top-5 acc 71.484 (63.065)	lr 0.02424
Train [14][1130/3239]	Time 0.671 (0.894)	Data Time 0.001 (0.019)	Loss 3.6058 (3.6032)	Entropy 1.30531 (1.31582)	Top-1 acc 39.453 (38.975)	Top-5 acc 62.500 (63.066)	lr 0.02424
Train [14][1140/3239]	Time 0.583 (0.893)	Data Time 0.001 (0.019)	Loss 3.5386 (3.6032)	Entropy 1.30499 (1.31573)	Top-1 acc 40.234 (38.967)	Top-5 acc 63.672 (63.069)	lr 0.02424
Train [14][1150/3239]	Time 0.546 (0.893)	Data Time 0.002 (0.019)	Loss 3.4812 (3.6031)	Entropy 1.30467 (1.31563)	Top-1 acc 43.750 (38.963)	Top-5 acc 62.500 (63.080)	lr 0.02424
Train [14][1160/3239]	Time 0.574 (0.892)	Data Time 0.001 (0.019)	Loss 3.6913 (3.6033)	Entropy 1.30434 (1.31554)	Top-1 acc 38.281 (38.970)	Top-5 acc 64.453 (63.073)	lr 0.02424
Train [14][1170/3239]	Time 0.613 (0.892)	Data Time 0.001 (0.019)	Loss 3.8860 (3.6034)	Entropy 1.30425 (1.31544)	Top-1 acc 32.031 (38.964)	Top-5 acc 53.516 (63.067)	lr 0.02424
Train [14][1180/3239]	Time 0.540 (0.891)	Data Time 0.001 (0.019)	Loss 3.6280 (3.6032)	Entropy 1.30411 (1.31535)	Top-1 acc 38.281 (38.976)	Top-5 acc 64.844 (63.068)	lr 0.02424
Train [14][1190/3239]	Time 0.630 (0.891)	Data Time 0.001 (0.019)	Loss 3.6391 (3.6032)	Entropy 1.30403 (1.31525)	Top-1 acc 39.453 (38.975)	Top-5 acc 60.938 (63.066)	lr 0.02424
Train [14][1200/3239]	Time 0.593 (0.891)	Data Time 0.001 (0.018)	Loss 3.6297 (3.6031)	Entropy 1.30383 (1.31516)	Top-1 acc 37.891 (38.989)	Top-5 acc 64.844 (63.065)	lr 0.02424
Train [14][1210/3239]	Time 0.534 (0.890)	Data Time 0.001 (0.018)	Loss 3.6846 (3.6029)	Entropy 1.30377 (1.31506)	Top-1 acc 41.016 (39.000)	Top-5 acc 62.500 (63.066)	lr 0.02424
Train [14][1220/3239]	Time 0.485 (0.889)	Data Time 0.001 (0.018)	Loss 3.4554 (3.6027)	Entropy 1.30370 (1.31497)	Top-1 acc 44.922 (38.998)	Top-5 acc 67.969 (63.065)	lr 0.02424
Train [14][1230/3239]	Time 0.599 (0.889)	Data Time 0.001 (0.018)	Loss 3.4815 (3.6030)	Entropy 1.30351 (1.31488)	Top-1 acc 41.797 (38.997)	Top-5 acc 65.234 (63.059)	lr 0.02424
Train [14][1240/3239]	Time 0.563 (0.889)	Data Time 0.001 (0.018)	Loss 3.4525 (3.6028)	Entropy 1.30347 (1.31479)	Top-1 acc 41.797 (38.998)	Top-5 acc 66.797 (63.068)	lr 0.02424
Train [14][1250/3239]	Time 0.528 (0.888)	Data Time 0.001 (0.018)	Loss 3.4909 (3.6022)	Entropy 1.30333 (1.31470)	Top-1 acc 42.578 (39.016)	Top-5 acc 67.188 (63.080)	lr 0.02424
Train [14][1260/3239]	Time 0.636 (0.888)	Data Time 0.001 (0.018)	Loss 3.6143 (3.6018)	Entropy 1.30294 (1.31460)	Top-1 acc 38.281 (39.021)	Top-5 acc 61.719 (63.083)	lr 0.02424
Train [14][1270/3239]	Time 0.604 (0.888)	Data Time 0.001 (0.018)	Loss 3.6031 (3.6022)	Entropy 1.30281 (1.31451)	Top-1 acc 39.844 (39.013)	Top-5 acc 62.500 (63.072)	lr 0.02424
Train [14][1280/3239]	Time 0.609 (0.887)	Data Time 0.001 (0.017)	Loss 3.8219 (3.6021)	Entropy 1.30257 (1.31442)	Top-1 acc 34.766 (39.007)	Top-5 acc 58.203 (63.073)	lr 0.02424
Train [14][1290/3239]	Time 0.713 (0.887)	Data Time 0.001 (0.017)	Loss 3.4038 (3.6019)	Entropy 1.30226 (1.31433)	Top-1 acc 42.188 (39.008)	Top-5 acc 67.578 (63.075)	lr 0.02424
Train [14][1300/3239]	Time 0.666 (0.887)	Data Time 0.002 (0.017)	Loss 3.3859 (3.6014)	Entropy 1.30188 (1.31423)	Top-1 acc 47.266 (39.021)	Top-5 acc 68.359 (63.089)	lr 0.02424
Train [14][1310/3239]	Time 0.568 (0.886)	Data Time 0.001 (0.017)	Loss 3.6466 (3.6015)	Entropy 1.30171 (1.31414)	Top-1 acc 36.719 (39.023)	Top-5 acc 61.719 (63.080)	lr 0.02424
Train [14][1320/3239]	Time 0.599 (0.886)	Data Time 0.001 (0.017)	Loss 3.6902 (3.6007)	Entropy 1.30146 (1.31404)	Top-1 acc 36.328 (39.044)	Top-5 acc 59.375 (63.099)	lr 0.02424
Train [14][1330/3239]	Time 0.560 (0.886)	Data Time 0.001 (0.017)	Loss 3.6560 (3.6010)	Entropy 1.30181 (1.31395)	Top-1 acc 37.500 (39.039)	Top-5 acc 60.156 (63.090)	lr 0.02424
Train [14][1340/3239]	Time 0.590 (0.885)	Data Time 0.001 (0.017)	Loss 3.2819 (3.6007)	Entropy 1.30175 (1.31386)	Top-1 acc 44.531 (39.046)	Top-5 acc 71.484 (63.092)	lr 0.02424
Train [14][1350/3239]	Time 0.575 (0.885)	Data Time 0.001 (0.017)	Loss 3.6891 (3.6006)	Entropy 1.30172 (1.31377)	Top-1 acc 37.891 (39.047)	Top-5 acc 62.891 (63.097)	lr 0.02424
Train [14][1360/3239]	Time 0.686 (0.885)	Data Time 0.002 (0.017)	Loss 3.5127 (3.6009)	Entropy 1.30149 (1.31368)	Top-1 acc 39.844 (39.038)	Top-5 acc 63.672 (63.084)	lr 0.02424
Train [14][1370/3239]	Time 0.573 (0.884)	Data Time 0.001 (0.016)	Loss 3.7580 (3.6014)	Entropy 1.30134 (1.31359)	Top-1 acc 33.984 (39.027)	Top-5 acc 56.250 (63.077)	lr 0.02424
Train [14][1380/3239]	Time 0.449 (0.884)	Data Time 0.002 (0.016)	Loss 3.7383 (3.6016)	Entropy 1.30088 (1.31350)	Top-1 acc 31.641 (39.010)	Top-5 acc 60.547 (63.075)	lr 0.02424
Train [14][1390/3239]	Time 0.558 (0.883)	Data Time 0.001 (0.016)	Loss 3.3811 (3.6010)	Entropy 1.30110 (1.31341)	Top-1 acc 48.047 (39.028)	Top-5 acc 66.406 (63.091)	lr 0.02424
Train [14][1400/3239]	Time 0.585 (0.883)	Data Time 0.001 (0.016)	Loss 3.4917 (3.6006)	Entropy 1.30092 (1.31332)	Top-1 acc 39.844 (39.027)	Top-5 acc 66.797 (63.101)	lr 0.02424
Train [14][1410/3239]	Time 0.600 (0.882)	Data Time 0.001 (0.016)	Loss 3.6131 (3.6007)	Entropy 1.30058 (1.31323)	Top-1 acc 37.500 (39.024)	Top-5 acc 62.891 (63.102)	lr 0.02423
Train [14][1420/3239]	Time 0.639 (0.882)	Data Time 0.002 (0.016)	Loss 3.4253 (3.6003)	Entropy 1.30023 (1.31314)	Top-1 acc 43.359 (39.035)	Top-5 acc 64.844 (63.115)	lr 0.02423
Train [14][1430/3239]	Time 0.569 (0.882)	Data Time 0.001 (0.016)	Loss 3.7105 (3.6004)	Entropy 1.29968 (1.31305)	Top-1 acc 35.156 (39.032)	Top-5 acc 61.719 (63.121)	lr 0.02423
Train [14][1440/3239]	Time 0.598 (0.881)	Data Time 0.001 (0.016)	Loss 3.5087 (3.6004)	Entropy 1.29946 (1.31296)	Top-1 acc 41.797 (39.029)	Top-5 acc 66.016 (63.116)	lr 0.02423
Train [14][1450/3239]	Time 0.612 (0.881)	Data Time 0.001 (0.016)	Loss 3.6052 (3.6001)	Entropy 1.29904 (1.31286)	Top-1 acc 41.406 (39.030)	Top-5 acc 62.109 (63.119)	lr 0.02423
Train [14][1460/3239]	Time 0.584 (0.881)	Data Time 0.001 (0.016)	Loss 3.7055 (3.6000)	Entropy 1.29878 (1.31277)	Top-1 acc 35.156 (39.032)	Top-5 acc 59.766 (63.119)	lr 0.02423
Train [14][1470/3239]	Time 0.574 (0.881)	Data Time 0.001 (0.015)	Loss 3.5650 (3.5997)	Entropy 1.29896 (1.31267)	Top-1 acc 39.062 (39.033)	Top-5 acc 63.672 (63.125)	lr 0.02423
Train [14][1480/3239]	Time 0.607 (0.880)	Data Time 0.001 (0.015)	Loss 3.4367 (3.5989)	Entropy 1.29873 (1.31258)	Top-1 acc 39.844 (39.048)	Top-5 acc 67.578 (63.140)	lr 0.02423
Train [14][1490/3239]	Time 0.598 (0.880)	Data Time 0.001 (0.015)	Loss 3.4450 (3.5988)	Entropy 1.29885 (1.31249)	Top-1 acc 40.234 (39.048)	Top-5 acc 66.016 (63.143)	lr 0.02423
Train [14][1500/3239]	Time 0.612 (0.880)	Data Time 0.001 (0.015)	Loss 3.6177 (3.5989)	Entropy 1.29902 (1.31240)	Top-1 acc 41.797 (39.049)	Top-5 acc 63.281 (63.143)	lr 0.02423
Train [14][1510/3239]	Time 0.602 (0.880)	Data Time 0.001 (0.015)	Loss 3.4983 (3.5987)	Entropy 1.29891 (1.31231)	Top-1 acc 42.969 (39.055)	Top-5 acc 66.406 (63.147)	lr 0.02423
Train [14][1520/3239]	Time 0.634 (0.879)	Data Time 0.001 (0.015)	Loss 3.8807 (3.5992)	Entropy 1.29896 (1.31222)	Top-1 acc 36.719 (39.050)	Top-5 acc 55.859 (63.138)	lr 0.02423
Train [14][1530/3239]	Time 0.645 (0.879)	Data Time 0.001 (0.015)	Loss 3.5552 (3.5992)	Entropy 1.29851 (1.31213)	Top-1 acc 42.188 (39.052)	Top-5 acc 65.234 (63.146)	lr 0.02423
Train [14][1540/3239]	Time 0.583 (0.879)	Data Time 0.001 (0.015)	Loss 3.5566 (3.5993)	Entropy 1.29803 (1.31204)	Top-1 acc 46.484 (39.056)	Top-5 acc 64.844 (63.141)	lr 0.02423
Train [14][1550/3239]	Time 0.585 (0.878)	Data Time 0.001 (0.015)	Loss 3.6619 (3.5995)	Entropy 1.29777 (1.31195)	Top-1 acc 37.109 (39.052)	Top-5 acc 58.984 (63.133)	lr 0.02423
Train [14][1560/3239]	Time 0.612 (0.878)	Data Time 0.001 (0.015)	Loss 3.5858 (3.5994)	Entropy 1.29804 (1.31186)	Top-1 acc 36.719 (39.051)	Top-5 acc 63.672 (63.130)	lr 0.02423
Train [14][1570/3239]	Time 0.602 (0.877)	Data Time 0.001 (0.015)	Loss 3.5505 (3.5991)	Entropy 1.29815 (1.31177)	Top-1 acc 41.406 (39.054)	Top-5 acc 62.500 (63.134)	lr 0.02423
Train [14][1580/3239]	Time 0.553 (0.877)	Data Time 0.001 (0.015)	Loss 3.7723 (3.5994)	Entropy 1.29818 (1.31169)	Top-1 acc 35.156 (39.047)	Top-5 acc 59.375 (63.127)	lr 0.02423
Train [14][1590/3239]	Time 0.718 (0.877)	Data Time 0.001 (0.014)	Loss 3.5854 (3.5994)	Entropy 1.29789 (1.31160)	Top-1 acc 44.531 (39.051)	Top-5 acc 64.844 (63.129)	lr 0.02423
Train [14][1600/3239]	Time 0.562 (0.876)	Data Time 0.001 (0.014)	Loss 3.5873 (3.5993)	Entropy 1.29757 (1.31151)	Top-1 acc 42.578 (39.057)	Top-5 acc 65.234 (63.130)	lr 0.02423
Train [14][1610/3239]	Time 0.592 (0.876)	Data Time 0.001 (0.014)	Loss 3.5969 (3.5993)	Entropy 1.29723 (1.31143)	Top-1 acc 37.500 (39.059)	Top-5 acc 62.891 (63.134)	lr 0.02423
Train [14][1620/3239]	Time 0.607 (0.876)	Data Time 0.003 (0.014)	Loss 3.5454 (3.5992)	Entropy 1.29668 (1.31134)	Top-1 acc 40.234 (39.056)	Top-5 acc 59.766 (63.133)	lr 0.02423
Train [14][1630/3239]	Time 0.644 (0.876)	Data Time 0.001 (0.014)	Loss 3.5860 (3.5994)	Entropy 1.29664 (1.31125)	Top-1 acc 41.797 (39.057)	Top-5 acc 63.672 (63.131)	lr 0.02423
Train [14][1640/3239]	Time 0.585 (0.875)	Data Time 0.002 (0.014)	Loss 3.4999 (3.5993)	Entropy 1.29611 (1.31116)	Top-1 acc 42.969 (39.054)	Top-5 acc 66.016 (63.131)	lr 0.02423
Train [14][1650/3239]	Time 0.555 (0.875)	Data Time 0.001 (0.014)	Loss 3.7961 (3.5990)	Entropy 1.29585 (1.31107)	Top-1 acc 40.625 (39.058)	Top-5 acc 61.328 (63.140)	lr 0.02423
Train [14][1660/3239]	Time 0.729 (0.875)	Data Time 0.001 (0.014)	Loss 3.3783 (3.5984)	Entropy 1.29610 (1.31097)	Top-1 acc 43.750 (39.067)	Top-5 acc 68.359 (63.148)	lr 0.02423
Train [14][1670/3239]	Time 0.543 (0.875)	Data Time 0.001 (0.014)	Loss 3.7006 (3.5982)	Entropy 1.29617 (1.31089)	Top-1 acc 34.375 (39.074)	Top-5 acc 60.938 (63.157)	lr 0.02423
Train [14][1680/3239]	Time 0.561 (0.875)	Data Time 0.002 (0.014)	Loss 3.4063 (3.5977)	Entropy 1.29577 (1.31080)	Top-1 acc 40.625 (39.082)	Top-5 acc 68.359 (63.161)	lr 0.02423
Train [14][1690/3239]	Time 0.551 (0.875)	Data Time 0.001 (0.014)	Loss 3.5199 (3.5977)	Entropy 1.29580 (1.31071)	Top-1 acc 43.359 (39.082)	Top-5 acc 67.578 (63.165)	lr 0.02422
Train [14][1700/3239]	Time 0.574 (0.874)	Data Time 0.001 (0.014)	Loss 3.5603 (3.5976)	Entropy 1.29587 (1.31062)	Top-1 acc 37.500 (39.077)	Top-5 acc 62.891 (63.165)	lr 0.02422
Train [14][1710/3239]	Time 0.597 (0.874)	Data Time 0.001 (0.014)	Loss 3.5245 (3.5972)	Entropy 1.29520 (1.31053)	Top-1 acc 41.406 (39.084)	Top-5 acc 64.062 (63.168)	lr 0.02422
Train [14][1720/3239]	Time 0.598 (0.874)	Data Time 0.001 (0.014)	Loss 3.4602 (3.5970)	Entropy 1.29494 (1.31044)	Top-1 acc 42.969 (39.091)	Top-5 acc 62.500 (63.174)	lr 0.02422
Train [14][1730/3239]	Time 0.670 (0.873)	Data Time 0.001 (0.013)	Loss 3.5986 (3.5971)	Entropy 1.29433 (1.31035)	Top-1 acc 35.938 (39.082)	Top-5 acc 63.672 (63.175)	lr 0.02422
Train [14][1740/3239]	Time 0.573 (0.885)	Data Time 0.002 (0.013)	Loss 3.4697 (3.5972)	Entropy 1.29413 (1.31026)	Top-1 acc 41.797 (39.084)	Top-5 acc 64.453 (63.172)	lr 0.02422
Train [14][1750/3239]	Time 0.621 (0.885)	Data Time 0.001 (0.013)	Loss 3.6164 (3.5968)	Entropy 1.29410 (1.31017)	Top-1 acc 37.109 (39.091)	Top-5 acc 62.109 (63.182)	lr 0.02422
Train [14][1760/3239]	Time 0.586 (0.885)	Data Time 0.001 (0.013)	Loss 3.5733 (3.5967)	Entropy 1.29401 (1.31008)	Top-1 acc 36.719 (39.095)	Top-5 acc 62.891 (63.183)	lr 0.02422
Train [14][1770/3239]	Time 0.588 (0.884)	Data Time 0.001 (0.013)	Loss 3.6399 (3.5970)	Entropy 1.29378 (1.30998)	Top-1 acc 41.797 (39.087)	Top-5 acc 63.672 (63.182)	lr 0.02422
Train [14][1780/3239]	Time 0.606 (0.884)	Data Time 0.001 (0.013)	Loss 3.6762 (3.5968)	Entropy 1.29394 (1.30989)	Top-1 acc 35.156 (39.089)	Top-5 acc 63.672 (63.189)	lr 0.02422
Train [14][1790/3239]	Time 0.593 (0.884)	Data Time 0.001 (0.013)	Loss 3.7009 (3.5968)	Entropy 1.29362 (1.30980)	Top-1 acc 34.766 (39.091)	Top-5 acc 62.109 (63.188)	lr 0.02422
Train [14][1800/3239]	Time 0.542 (0.884)	Data Time 0.001 (0.013)	Loss 3.7117 (3.5970)	Entropy 1.29348 (1.30971)	Top-1 acc 33.203 (39.087)	Top-5 acc 59.766 (63.182)	lr 0.02422
Train [14][1810/3239]	Time 0.605 (0.883)	Data Time 0.001 (0.013)	Loss 3.8627 (3.5973)	Entropy 1.29350 (1.30962)	Top-1 acc 34.375 (39.080)	Top-5 acc 58.203 (63.177)	lr 0.02422
Train [14][1820/3239]	Time 0.601 (0.883)	Data Time 0.001 (0.013)	Loss 3.4840 (3.5972)	Entropy 1.29276 (1.30953)	Top-1 acc 42.969 (39.080)	Top-5 acc 62.109 (63.172)	lr 0.02422
Train [14][1830/3239]	Time 0.596 (0.883)	Data Time 0.001 (0.013)	Loss 3.3676 (3.5970)	Entropy 1.29257 (1.30944)	Top-1 acc 43.359 (39.083)	Top-5 acc 68.750 (63.171)	lr 0.02422
Train [14][1840/3239]	Time 0.638 (0.883)	Data Time 0.001 (0.013)	Loss 3.5449 (3.5969)	Entropy 1.29214 (1.30935)	Top-1 acc 41.016 (39.088)	Top-5 acc 67.578 (63.174)	lr 0.02422
Train [14][1850/3239]	Time 0.597 (0.882)	Data Time 0.001 (0.013)	Loss 3.6092 (3.5970)	Entropy 1.29214 (1.30926)	Top-1 acc 39.062 (39.088)	Top-5 acc 59.766 (63.170)	lr 0.02422
Train [14][1860/3239]	Time 0.565 (0.882)	Data Time 0.001 (0.013)	Loss 3.4688 (3.5975)	Entropy 1.29193 (1.30916)	Top-1 acc 42.188 (39.077)	Top-5 acc 69.531 (63.158)	lr 0.02422
Train [14][1870/3239]	Time 0.574 (0.882)	Data Time 0.001 (0.013)	Loss 3.6048 (3.5973)	Entropy 1.29158 (1.30907)	Top-1 acc 38.281 (39.084)	Top-5 acc 65.625 (63.168)	lr 0.02422
Train [14][1880/3239]	Time 0.576 (0.881)	Data Time 0.001 (0.013)	Loss 3.8095 (3.5973)	Entropy 1.29155 (1.30898)	Top-1 acc 36.328 (39.082)	Top-5 acc 60.938 (63.173)	lr 0.02422
Train [14][1890/3239]	Time 0.738 (0.881)	Data Time 0.003 (0.013)	Loss 3.8039 (3.5974)	Entropy 1.29087 (1.30888)	Top-1 acc 38.672 (39.077)	Top-5 acc 56.250 (63.171)	lr 0.02422
Train [14][1900/3239]	Time 0.597 (0.881)	Data Time 0.001 (0.012)	Loss 3.5438 (3.5972)	Entropy 1.29094 (1.30879)	Top-1 acc 42.188 (39.082)	Top-5 acc 61.719 (63.177)	lr 0.02422
Train [14][1910/3239]	Time 0.573 (0.880)	Data Time 0.001 (0.012)	Loss 3.6118 (3.5971)	Entropy 1.29090 (1.30870)	Top-1 acc 35.938 (39.081)	Top-5 acc 62.891 (63.180)	lr 0.02422
Train [14][1920/3239]	Time 0.635 (0.880)	Data Time 0.001 (0.012)	Loss 3.7093 (3.5971)	Entropy 1.29069 (1.30860)	Top-1 acc 38.672 (39.081)	Top-5 acc 60.156 (63.178)	lr 0.02422
Train [14][1930/3239]	Time 0.554 (0.880)	Data Time 0.001 (0.012)	Loss 3.6002 (3.5969)	Entropy 1.29065 (1.30851)	Top-1 acc 41.797 (39.086)	Top-5 acc 64.453 (63.185)	lr 0.02422
Train [14][1940/3239]	Time 0.651 (0.880)	Data Time 0.001 (0.012)	Loss 3.6046 (3.5970)	Entropy 1.29060 (1.30842)	Top-1 acc 40.625 (39.079)	Top-5 acc 62.891 (63.183)	lr 0.02422
Train [14][1950/3239]	Time 0.594 (0.880)	Data Time 0.001 (0.012)	Loss 3.5001 (3.5970)	Entropy 1.29050 (1.30833)	Top-1 acc 41.406 (39.080)	Top-5 acc 63.672 (63.183)	lr 0.02422
Train [14][1960/3239]	Time 0.669 (0.880)	Data Time 0.001 (0.012)	Loss 3.6288 (3.5972)	Entropy 1.29044 (1.30824)	Top-1 acc 36.719 (39.079)	Top-5 acc 64.844 (63.180)	lr 0.02422
Train [14][1970/3239]	Time 0.586 (0.880)	Data Time 0.001 (0.012)	Loss 3.7364 (3.5974)	Entropy 1.29004 (1.30815)	Top-1 acc 37.891 (39.075)	Top-5 acc 62.109 (63.180)	lr 0.02422
Train [14][1980/3239]	Time 0.590 (0.879)	Data Time 0.003 (0.012)	Loss 3.4174 (3.5971)	Entropy 1.28984 (1.30805)	Top-1 acc 41.797 (39.075)	Top-5 acc 65.625 (63.182)	lr 0.02421
Train [14][1990/3239]	Time 0.604 (0.879)	Data Time 0.001 (0.012)	Loss 3.6688 (3.5973)	Entropy 1.29006 (1.30796)	Top-1 acc 40.625 (39.067)	Top-5 acc 63.281 (63.181)	lr 0.02421
Train [14][2000/3239]	Time 0.573 (0.879)	Data Time 0.001 (0.012)	Loss 3.8012 (3.5977)	Entropy 1.29017 (1.30787)	Top-1 acc 37.109 (39.056)	Top-5 acc 58.594 (63.172)	lr 0.02421
Train [14][2010/3239]	Time 0.558 (0.879)	Data Time 0.001 (0.012)	Loss 3.5876 (3.5978)	Entropy 1.29045 (1.30778)	Top-1 acc 39.844 (39.057)	Top-5 acc 66.016 (63.170)	lr 0.02421
Train [14][2020/3239]	Time 0.616 (0.878)	Data Time 0.002 (0.012)	Loss 3.4793 (3.5980)	Entropy 1.29026 (1.30770)	Top-1 acc 43.359 (39.056)	Top-5 acc 67.188 (63.167)	lr 0.02421
Train [14][2030/3239]	Time 0.668 (0.878)	Data Time 0.001 (0.012)	Loss 3.5357 (3.5981)	Entropy 1.29030 (1.30761)	Top-1 acc 41.016 (39.049)	Top-5 acc 67.578 (63.171)	lr 0.02421
Train [14][2040/3239]	Time 0.607 (0.878)	Data Time 0.001 (0.012)	Loss 3.5996 (3.5980)	Entropy 1.29012 (1.30753)	Top-1 acc 40.625 (39.051)	Top-5 acc 62.891 (63.174)	lr 0.02421
Train [14][2050/3239]	Time 0.621 (0.878)	Data Time 0.003 (0.012)	Loss 3.6063 (3.5979)	Entropy 1.29008 (1.30744)	Top-1 acc 41.406 (39.055)	Top-5 acc 61.328 (63.179)	lr 0.02421
Train [14][2060/3239]	Time 0.602 (0.878)	Data Time 0.001 (0.012)	Loss 3.6173 (3.5979)	Entropy 1.28987 (1.30736)	Top-1 acc 42.969 (39.055)	Top-5 acc 65.625 (63.184)	lr 0.02421
Train [14][2070/3239]	Time 0.518 (0.877)	Data Time 0.001 (0.012)	Loss 3.7304 (3.5981)	Entropy 1.28984 (1.30727)	Top-1 acc 40.234 (39.052)	Top-5 acc 60.547 (63.178)	lr 0.02421
Train [14][2080/3239]	Time 0.601 (0.877)	Data Time 0.001 (0.012)	Loss 3.6379 (3.5984)	Entropy 1.28931 (1.30719)	Top-1 acc 37.891 (39.045)	Top-5 acc 60.938 (63.171)	lr 0.02421
Train [14][2090/3239]	Time 0.619 (0.877)	Data Time 0.001 (0.012)	Loss 3.3708 (3.5982)	Entropy 1.28926 (1.30710)	Top-1 acc 44.141 (39.052)	Top-5 acc 71.875 (63.178)	lr 0.02421
Train [14][2100/3239]	Time 0.584 (0.877)	Data Time 0.001 (0.011)	Loss 3.8060 (3.5983)	Entropy 1.28903 (1.30702)	Top-1 acc 32.422 (39.050)	Top-5 acc 59.766 (63.173)	lr 0.02421
Train [14][2110/3239]	Time 0.540 (0.877)	Data Time 0.001 (0.011)	Loss 3.4502 (3.5982)	Entropy 1.28870 (1.30693)	Top-1 acc 43.359 (39.051)	Top-5 acc 66.406 (63.174)	lr 0.02421
Train [14][2120/3239]	Time 0.660 (0.877)	Data Time 0.001 (0.011)	Loss 3.7297 (3.5983)	Entropy 1.28861 (1.30685)	Top-1 acc 34.375 (39.052)	Top-5 acc 59.375 (63.174)	lr 0.02421
Train [14][2130/3239]	Time 0.614 (0.876)	Data Time 0.001 (0.011)	Loss 3.6356 (3.5983)	Entropy 1.28830 (1.30676)	Top-1 acc 32.422 (39.048)	Top-5 acc 62.500 (63.173)	lr 0.02421
Train [14][2140/3239]	Time 0.564 (0.876)	Data Time 0.001 (0.011)	Loss 3.6657 (3.5982)	Entropy 1.28840 (1.30667)	Top-1 acc 37.109 (39.049)	Top-5 acc 61.719 (63.175)	lr 0.02421
Train [14][2150/3239]	Time 0.638 (0.876)	Data Time 0.001 (0.011)	Loss 3.4642 (3.5980)	Entropy 1.28818 (1.30659)	Top-1 acc 41.797 (39.056)	Top-5 acc 62.109 (63.176)	lr 0.02421
Train [14][2160/3239]	Time 0.584 (0.876)	Data Time 0.001 (0.011)	Loss 3.5501 (3.5980)	Entropy 1.28819 (1.30650)	Top-1 acc 41.406 (39.051)	Top-5 acc 65.625 (63.178)	lr 0.02421
Train [14][2170/3239]	Time 0.623 (0.876)	Data Time 0.001 (0.011)	Loss 3.5927 (3.5980)	Entropy 1.28786 (1.30642)	Top-1 acc 40.234 (39.050)	Top-5 acc 64.844 (63.181)	lr 0.02421
Train [14][2180/3239]	Time 0.578 (0.876)	Data Time 0.001 (0.011)	Loss 3.7758 (3.5980)	Entropy 1.28767 (1.30633)	Top-1 acc 36.328 (39.051)	Top-5 acc 55.469 (63.183)	lr 0.02421
Train [14][2190/3239]	Time 0.705 (0.876)	Data Time 0.001 (0.011)	Loss 3.5819 (3.5980)	Entropy 1.28738 (1.30625)	Top-1 acc 39.062 (39.051)	Top-5 acc 62.891 (63.179)	lr 0.02421
Train [14][2200/3239]	Time 0.567 (0.875)	Data Time 0.001 (0.011)	Loss 3.4423 (3.5979)	Entropy 1.28721 (1.30616)	Top-1 acc 42.578 (39.050)	Top-5 acc 65.625 (63.181)	lr 0.02421
Train [14][2210/3239]	Time 0.602 (0.875)	Data Time 0.001 (0.011)	Loss 3.7473 (3.5980)	Entropy 1.28701 (1.30608)	Top-1 acc 33.984 (39.045)	Top-5 acc 62.109 (63.181)	lr 0.02421
Train [14][2220/3239]	Time 0.602 (0.875)	Data Time 0.001 (0.011)	Loss 3.5058 (3.5979)	Entropy 1.28721 (1.30599)	Top-1 acc 42.188 (39.048)	Top-5 acc 65.625 (63.179)	lr 0.02421
Train [14][2230/3239]	Time 0.610 (0.874)	Data Time 0.001 (0.011)	Loss 3.3915 (3.5975)	Entropy 1.28699 (1.30591)	Top-1 acc 42.188 (39.056)	Top-5 acc 65.625 (63.186)	lr 0.02421
Train [14][2240/3239]	Time 0.596 (0.874)	Data Time 0.001 (0.011)	Loss 3.5545 (3.5971)	Entropy 1.28649 (1.30582)	Top-1 acc 38.672 (39.064)	Top-5 acc 60.547 (63.195)	lr 0.02421
Train [14][2250/3239]	Time 0.533 (0.874)	Data Time 0.001 (0.011)	Loss 3.6572 (3.5971)	Entropy 1.28599 (1.30573)	Top-1 acc 36.719 (39.061)	Top-5 acc 58.984 (63.194)	lr 0.02421
Train [14][2260/3239]	Time 0.629 (0.874)	Data Time 0.001 (0.011)	Loss 3.3485 (3.5971)	Entropy 1.28603 (1.30565)	Top-1 acc 44.141 (39.063)	Top-5 acc 66.797 (63.194)	lr 0.02420
Train [14][2270/3239]	Time 0.628 (0.874)	Data Time 0.001 (0.011)	Loss 3.5363 (3.5969)	Entropy 1.28619 (1.30556)	Top-1 acc 44.531 (39.069)	Top-5 acc 66.797 (63.202)	lr 0.02420
Train [14][2280/3239]	Time 0.593 (0.874)	Data Time 0.001 (0.011)	Loss 3.5634 (3.5969)	Entropy 1.28573 (1.30548)	Top-1 acc 40.625 (39.072)	Top-5 acc 66.406 (63.202)	lr 0.02420
Train [14][2290/3239]	Time 0.597 (0.874)	Data Time 0.001 (0.011)	Loss 3.3745 (3.5967)	Entropy 1.28606 (1.30539)	Top-1 acc 45.312 (39.077)	Top-5 acc 68.359 (63.203)	lr 0.02420
Train [14][2300/3239]	Time 0.632 (0.873)	Data Time 0.001 (0.011)	Loss 3.3135 (3.5966)	Entropy 1.28594 (1.30531)	Top-1 acc 44.141 (39.077)	Top-5 acc 71.094 (63.209)	lr 0.02420
Train [14][2310/3239]	Time 0.608 (0.873)	Data Time 0.001 (0.011)	Loss 3.4131 (3.5963)	Entropy 1.28593 (1.30522)	Top-1 acc 42.188 (39.086)	Top-5 acc 64.844 (63.216)	lr 0.02420
Train [14][2320/3239]	Time 0.613 (0.873)	Data Time 0.001 (0.011)	Loss 3.4454 (3.5965)	Entropy 1.28572 (1.30514)	Top-1 acc 41.406 (39.081)	Top-5 acc 67.188 (63.215)	lr 0.02420
Train [14][2330/3239]	Time 0.654 (0.873)	Data Time 0.001 (0.011)	Loss 3.6289 (3.5966)	Entropy 1.28581 (1.30506)	Top-1 acc 39.844 (39.079)	Top-5 acc 61.719 (63.215)	lr 0.02420
Train [14][2340/3239]	Time 0.598 (0.873)	Data Time 0.001 (0.010)	Loss 3.6078 (3.5966)	Entropy 1.28570 (1.30497)	Top-1 acc 37.891 (39.076)	Top-5 acc 64.453 (63.215)	lr 0.02420
Train [14][2350/3239]	Time 0.582 (0.873)	Data Time 0.001 (0.010)	Loss 3.6253 (3.5964)	Entropy 1.28532 (1.30489)	Top-1 acc 41.016 (39.083)	Top-5 acc 62.109 (63.222)	lr 0.02420
Train [14][2360/3239]	Time 0.614 (0.873)	Data Time 0.001 (0.010)	Loss 3.4984 (3.5962)	Entropy 1.28516 (1.30481)	Top-1 acc 41.016 (39.087)	Top-5 acc 64.062 (63.224)	lr 0.02420
Train [14][2370/3239]	Time 0.566 (0.872)	Data Time 0.001 (0.010)	Loss 3.5147 (3.5960)	Entropy 1.28548 (1.30473)	Top-1 acc 41.797 (39.094)	Top-5 acc 65.625 (63.230)	lr 0.02420
Train [14][2380/3239]	Time 0.572 (0.872)	Data Time 0.001 (0.010)	Loss 3.6237 (3.5960)	Entropy 1.28547 (1.30465)	Top-1 acc 38.672 (39.097)	Top-5 acc 61.328 (63.228)	lr 0.02420
Train [14][2390/3239]	Time 0.652 (0.880)	Data Time 0.005 (0.010)	Loss 3.5442 (3.5960)	Entropy 1.28539 (1.30456)	Top-1 acc 41.797 (39.097)	Top-5 acc 66.797 (63.229)	lr 0.02420
Train [14][2400/3239]	Time 0.693 (0.880)	Data Time 0.002 (0.010)	Loss 3.4858 (3.5959)	Entropy 1.28521 (1.30448)	Top-1 acc 44.531 (39.100)	Top-5 acc 66.406 (63.232)	lr 0.02420
Train [14][2410/3239]	Time 0.634 (0.880)	Data Time 0.001 (0.010)	Loss 3.4467 (3.5959)	Entropy 1.28508 (1.30440)	Top-1 acc 41.016 (39.102)	Top-5 acc 64.844 (63.230)	lr 0.02420
Train [14][2420/3239]	Time 0.579 (0.880)	Data Time 0.001 (0.010)	Loss 3.5903 (3.5960)	Entropy 1.28463 (1.30432)	Top-1 acc 39.453 (39.101)	Top-5 acc 60.938 (63.225)	lr 0.02420
Train [14][2430/3239]	Time 0.639 (0.880)	Data Time 0.001 (0.010)	Loss 3.6419 (3.5960)	Entropy 1.28427 (1.30424)	Top-1 acc 39.844 (39.100)	Top-5 acc 63.281 (63.225)	lr 0.02420
Train [14][2440/3239]	Time 0.617 (0.879)	Data Time 0.001 (0.010)	Loss 3.3884 (3.5959)	Entropy 1.28409 (1.30416)	Top-1 acc 44.922 (39.103)	Top-5 acc 65.625 (63.227)	lr 0.02420
Train [14][2450/3239]	Time 0.575 (0.879)	Data Time 0.002 (0.010)	Loss 3.7612 (3.5960)	Entropy 1.28389 (1.30408)	Top-1 acc 36.328 (39.097)	Top-5 acc 62.109 (63.224)	lr 0.02420
Train [14][2460/3239]	Time 0.630 (0.879)	Data Time 0.001 (0.010)	Loss 3.4808 (3.5960)	Entropy 1.28383 (1.30400)	Top-1 acc 44.141 (39.102)	Top-5 acc 67.188 (63.226)	lr 0.02420
Train [14][2470/3239]	Time 0.506 (0.879)	Data Time 0.002 (0.010)	Loss 3.5526 (3.5961)	Entropy 1.28362 (1.30392)	Top-1 acc 40.625 (39.103)	Top-5 acc 63.281 (63.227)	lr 0.02420
Train [14][2480/3239]	Time 0.561 (0.879)	Data Time 0.001 (0.010)	Loss 3.6134 (3.5964)	Entropy 1.28308 (1.30383)	Top-1 acc 35.938 (39.095)	Top-5 acc 61.328 (63.219)	lr 0.02420
Train [14][2490/3239]	Time 0.623 (0.879)	Data Time 0.001 (0.010)	Loss 3.7966 (3.5962)	Entropy 1.28297 (1.30375)	Top-1 acc 33.594 (39.100)	Top-5 acc 58.594 (63.222)	lr 0.02420
Train [14][2500/3239]	Time 0.537 (0.879)	Data Time 0.001 (0.010)	Loss 3.6850 (3.5963)	Entropy 1.28257 (1.30367)	Top-1 acc 36.719 (39.092)	Top-5 acc 59.375 (63.221)	lr 0.02420
Train [14][2510/3239]	Time 0.594 (0.878)	Data Time 0.001 (0.010)	Loss 3.5844 (3.5961)	Entropy 1.28233 (1.30358)	Top-1 acc 42.969 (39.096)	Top-5 acc 62.109 (63.224)	lr 0.02420
Train [14][2520/3239]	Time 0.588 (0.878)	Data Time 0.001 (0.010)	Loss 3.5426 (3.5961)	Entropy 1.28222 (1.30350)	Top-1 acc 42.188 (39.099)	Top-5 acc 62.500 (63.221)	lr 0.02420
Train [14][2530/3239]	Time 0.600 (0.878)	Data Time 0.001 (0.010)	Loss 3.6993 (3.5961)	Entropy 1.28223 (1.30341)	Top-1 acc 39.062 (39.100)	Top-5 acc 61.328 (63.218)	lr 0.02420
Train [14][2540/3239]	Time 0.629 (0.878)	Data Time 0.001 (0.010)	Loss 3.5611 (3.5959)	Entropy 1.28150 (1.30333)	Top-1 acc 40.625 (39.104)	Top-5 acc 62.500 (63.221)	lr 0.02419
Train [14][2550/3239]	Time 0.590 (0.878)	Data Time 0.001 (0.010)	Loss 3.5327 (3.5958)	Entropy 1.28148 (1.30324)	Top-1 acc 42.969 (39.103)	Top-5 acc 67.188 (63.224)	lr 0.02419
Train [14][2560/3239]	Time 0.689 (0.878)	Data Time 0.001 (0.010)	Loss 3.5714 (3.5957)	Entropy 1.28124 (1.30316)	Top-1 acc 40.234 (39.103)	Top-5 acc 66.016 (63.228)	lr 0.02419
Train [14][2570/3239]	Time 0.571 (0.877)	Data Time 0.001 (0.010)	Loss 3.4114 (3.5954)	Entropy 1.28015 (1.30307)	Top-1 acc 45.312 (39.112)	Top-5 acc 71.094 (63.236)	lr 0.02419
Train [14][2580/3239]	Time 0.573 (0.877)	Data Time 0.001 (0.010)	Loss 3.7165 (3.5956)	Entropy 1.28019 (1.30298)	Top-1 acc 39.062 (39.107)	Top-5 acc 62.891 (63.233)	lr 0.02419
Train [14][2590/3239]	Time 0.620 (0.877)	Data Time 0.001 (0.010)	Loss 3.6139 (3.5953)	Entropy 1.28012 (1.30289)	Top-1 acc 37.891 (39.117)	Top-5 acc 62.891 (63.242)	lr 0.02419
Train [14][2600/3239]	Time 0.582 (0.877)	Data Time 0.001 (0.010)	Loss 3.4767 (3.5953)	Entropy 1.27930 (1.30280)	Top-1 acc 39.062 (39.112)	Top-5 acc 69.922 (63.241)	lr 0.02419
Train [14][2610/3239]	Time 0.581 (0.877)	Data Time 0.001 (0.010)	Loss 3.6907 (3.5956)	Entropy 1.27906 (1.30271)	Top-1 acc 38.281 (39.106)	Top-5 acc 62.500 (63.238)	lr 0.02419
Train [14][2620/3239]	Time 0.593 (0.877)	Data Time 0.001 (0.010)	Loss 3.5996 (3.5954)	Entropy 1.27884 (1.30262)	Top-1 acc 38.672 (39.109)	Top-5 acc 64.844 (63.245)	lr 0.02419
Train [14][2630/3239]	Time 0.671 (0.877)	Data Time 0.001 (0.010)	Loss 3.7258 (3.5953)	Entropy 1.27870 (1.30253)	Top-1 acc 33.203 (39.109)	Top-5 acc 60.156 (63.247)	lr 0.02419
Train [14][2640/3239]	Time 0.623 (0.877)	Data Time 0.001 (0.010)	Loss 3.6014 (3.5951)	Entropy 1.27879 (1.30244)	Top-1 acc 41.406 (39.110)	Top-5 acc 60.938 (63.250)	lr 0.02419
Train [14][2650/3239]	Time 0.613 (0.876)	Data Time 0.001 (0.010)	Loss 3.6065 (3.5951)	Entropy 1.27883 (1.30235)	Top-1 acc 39.062 (39.109)	Top-5 acc 60.938 (63.252)	lr 0.02419
Train [14][2660/3239]	Time 0.566 (0.876)	Data Time 0.001 (0.009)	Loss 3.5781 (3.5950)	Entropy 1.27878 (1.30227)	Top-1 acc 40.234 (39.111)	Top-5 acc 62.891 (63.252)	lr 0.02419
Train [14][2670/3239]	Time 0.453 (0.876)	Data Time 0.001 (0.009)	Loss 3.7053 (3.5952)	Entropy 1.27843 (1.30218)	Top-1 acc 35.547 (39.105)	Top-5 acc 58.984 (63.246)	lr 0.02419
Train [14][2680/3239]	Time 0.609 (0.876)	Data Time 0.001 (0.009)	Loss 3.4428 (3.5953)	Entropy 1.27811 (1.30209)	Top-1 acc 40.234 (39.103)	Top-5 acc 65.625 (63.244)	lr 0.02419
Train [14][2690/3239]	Time 0.566 (0.876)	Data Time 0.001 (0.009)	Loss 3.3960 (3.5955)	Entropy 1.27781 (1.30200)	Top-1 acc 44.141 (39.097)	Top-5 acc 65.234 (63.241)	lr 0.02419
Train [14][2700/3239]	Time 0.671 (0.875)	Data Time 0.001 (0.009)	Loss 3.6030 (3.5958)	Entropy 1.27712 (1.30191)	Top-1 acc 35.547 (39.084)	Top-5 acc 64.453 (63.231)	lr 0.02419
Train [14][2710/3239]	Time 0.586 (0.875)	Data Time 0.001 (0.009)	Loss 3.4556 (3.5958)	Entropy 1.27713 (1.30182)	Top-1 acc 41.797 (39.084)	Top-5 acc 67.188 (63.234)	lr 0.02419
Train [14][2720/3239]	Time 0.584 (0.875)	Data Time 0.001 (0.009)	Loss 3.6164 (3.5959)	Entropy 1.27686 (1.30173)	Top-1 acc 40.234 (39.084)	Top-5 acc 63.672 (63.230)	lr 0.02419
Train [14][2730/3239]	Time 0.606 (0.875)	Data Time 0.001 (0.009)	Loss 3.5975 (3.5958)	Entropy 1.27668 (1.30163)	Top-1 acc 39.062 (39.092)	Top-5 acc 64.844 (63.233)	lr 0.02419
Train [14][2740/3239]	Time 0.565 (0.875)	Data Time 0.001 (0.009)	Loss 3.6266 (3.5959)	Entropy 1.27661 (1.30154)	Top-1 acc 38.281 (39.089)	Top-5 acc 64.453 (63.230)	lr 0.02419
Train [14][2750/3239]	Time 0.576 (0.875)	Data Time 0.001 (0.009)	Loss 3.7436 (3.5958)	Entropy 1.27611 (1.30145)	Top-1 acc 33.984 (39.090)	Top-5 acc 62.500 (63.235)	lr 0.02419
Train [14][2760/3239]	Time 0.596 (0.875)	Data Time 0.001 (0.009)	Loss 3.3337 (3.5956)	Entropy 1.27640 (1.30136)	Top-1 acc 42.188 (39.092)	Top-5 acc 64.062 (63.237)	lr 0.02419
Train [14][2770/3239]	Time 0.593 (0.874)	Data Time 0.001 (0.009)	Loss 3.4856 (3.5957)	Entropy 1.27638 (1.30127)	Top-1 acc 39.844 (39.090)	Top-5 acc 60.156 (63.235)	lr 0.02419
Train [14][2780/3239]	Time 0.556 (0.874)	Data Time 0.001 (0.009)	Loss 3.7129 (3.5956)	Entropy 1.27637 (1.30118)	Top-1 acc 34.766 (39.093)	Top-5 acc 60.156 (63.238)	lr 0.02419
Train [14][2790/3239]	Time 0.701 (0.874)	Data Time 0.001 (0.009)	Loss 3.3867 (3.5955)	Entropy 1.27621 (1.30109)	Top-1 acc 43.750 (39.097)	Top-5 acc 68.359 (63.243)	lr 0.02419
Train [14][2800/3239]	Time 0.586 (0.874)	Data Time 0.002 (0.009)	Loss 3.5488 (3.5957)	Entropy 1.27654 (1.30100)	Top-1 acc 38.281 (39.089)	Top-5 acc 62.109 (63.236)	lr 0.02419
Train [14][2810/3239]	Time 0.565 (0.874)	Data Time 0.001 (0.009)	Loss 3.6392 (3.5958)	Entropy 1.27672 (1.30092)	Top-1 acc 40.625 (39.085)	Top-5 acc 63.281 (63.234)	lr 0.02419
Train [14][2820/3239]	Time 0.598 (0.874)	Data Time 0.001 (0.009)	Loss 3.3413 (3.5957)	Entropy 1.27651 (1.30083)	Top-1 acc 44.922 (39.086)	Top-5 acc 66.406 (63.234)	lr 0.02418
Train [14][2830/3239]	Time 0.572 (0.874)	Data Time 0.002 (0.009)	Loss 3.6904 (3.5959)	Entropy 1.27612 (1.30074)	Top-1 acc 37.500 (39.082)	Top-5 acc 60.938 (63.230)	lr 0.02418
Train [14][2840/3239]	Time 0.591 (0.874)	Data Time 0.001 (0.009)	Loss 3.6563 (3.5958)	Entropy 1.27588 (1.30066)	Top-1 acc 36.328 (39.085)	Top-5 acc 62.109 (63.231)	lr 0.02418
Train [14][2850/3239]	Time 0.591 (0.874)	Data Time 0.001 (0.009)	Loss 3.5551 (3.5960)	Entropy 1.27561 (1.30057)	Top-1 acc 38.281 (39.079)	Top-5 acc 65.234 (63.229)	lr 0.02418
Train [14][2860/3239]	Time 0.675 (0.873)	Data Time 0.002 (0.009)	Loss 3.6381 (3.5958)	Entropy 1.27569 (1.30048)	Top-1 acc 39.844 (39.084)	Top-5 acc 60.547 (63.231)	lr 0.02418
Train [14][2870/3239]	Time 0.462 (0.873)	Data Time 0.001 (0.009)	Loss 3.4488 (3.5958)	Entropy 1.27553 (1.30040)	Top-1 acc 41.016 (39.082)	Top-5 acc 66.406 (63.227)	lr 0.02418
Train [14][2880/3239]	Time 0.596 (0.873)	Data Time 0.001 (0.009)	Loss 3.5978 (3.5960)	Entropy 1.27480 (1.30031)	Top-1 acc 41.016 (39.085)	Top-5 acc 64.062 (63.223)	lr 0.02418
Train [14][2890/3239]	Time 0.559 (0.873)	Data Time 0.001 (0.009)	Loss 3.4347 (3.5958)	Entropy 1.27488 (1.30022)	Top-1 acc 43.359 (39.090)	Top-5 acc 65.234 (63.225)	lr 0.02418
Train [14][2900/3239]	Time 0.551 (0.873)	Data Time 0.001 (0.009)	Loss 3.6305 (3.5960)	Entropy 1.27467 (1.30013)	Top-1 acc 39.453 (39.088)	Top-5 acc 60.938 (63.220)	lr 0.02418
Train [14][2910/3239]	Time 0.586 (0.873)	Data Time 0.001 (0.009)	Loss 3.6374 (3.5962)	Entropy 1.27476 (1.30005)	Top-1 acc 39.844 (39.087)	Top-5 acc 60.156 (63.216)	lr 0.02418
Train [14][2920/3239]	Time 0.588 (0.873)	Data Time 0.001 (0.009)	Loss 3.3522 (3.5962)	Entropy 1.27454 (1.29996)	Top-1 acc 44.531 (39.087)	Top-5 acc 67.188 (63.213)	lr 0.02418
Train [14][2930/3239]	Time 0.614 (0.873)	Data Time 0.002 (0.009)	Loss 3.4442 (3.5961)	Entropy 1.27427 (1.29987)	Top-1 acc 43.359 (39.094)	Top-5 acc 66.406 (63.213)	lr 0.02418
Train [14][2940/3239]	Time 0.612 (0.872)	Data Time 0.001 (0.009)	Loss 3.4045 (3.5961)	Entropy 1.27432 (1.29978)	Top-1 acc 42.578 (39.091)	Top-5 acc 65.625 (63.212)	lr 0.02418
Train [14][2950/3239]	Time 0.577 (0.872)	Data Time 0.001 (0.009)	Loss 3.4513 (3.5959)	Entropy 1.27362 (1.29970)	Top-1 acc 38.281 (39.093)	Top-5 acc 62.891 (63.214)	lr 0.02418
Train [14][2960/3239]	Time 0.630 (0.872)	Data Time 0.001 (0.009)	Loss 3.3308 (3.5957)	Entropy 1.27369 (1.29961)	Top-1 acc 46.484 (39.095)	Top-5 acc 67.578 (63.217)	lr 0.02418
Train [14][2970/3239]	Time 0.593 (0.872)	Data Time 0.002 (0.009)	Loss 3.5903 (3.5956)	Entropy 1.27328 (1.29952)	Top-1 acc 36.328 (39.096)	Top-5 acc 59.766 (63.220)	lr 0.02418
Train [14][2980/3239]	Time 0.582 (0.872)	Data Time 0.001 (0.009)	Loss 3.6782 (3.5957)	Entropy 1.27275 (1.29943)	Top-1 acc 37.109 (39.092)	Top-5 acc 63.672 (63.219)	lr 0.02418
Train [14][2990/3239]	Time 0.617 (0.872)	Data Time 0.001 (0.009)	Loss 3.5483 (3.5956)	Entropy 1.27206 (1.29934)	Top-1 acc 39.844 (39.095)	Top-5 acc 63.281 (63.223)	lr 0.02418
Train [14][3000/3239]	Time 0.598 (0.872)	Data Time 0.001 (0.009)	Loss 3.4933 (3.5956)	Entropy 1.27177 (1.29925)	Top-1 acc 41.406 (39.096)	Top-5 acc 61.328 (63.221)	lr 0.02418
Train [14][3010/3239]	Time 0.604 (0.872)	Data Time 0.001 (0.009)	Loss 3.5243 (3.5955)	Entropy 1.27197 (1.29916)	Top-1 acc 43.359 (39.099)	Top-5 acc 62.109 (63.225)	lr 0.02418
Train [14][3020/3239]	Time 0.566 (0.872)	Data Time 0.001 (0.009)	Loss 3.4871 (3.5954)	Entropy 1.27184 (1.29907)	Top-1 acc 42.578 (39.102)	Top-5 acc 67.188 (63.230)	lr 0.02418
Train [14][3030/3239]	Time 0.582 (0.871)	Data Time 0.001 (0.009)	Loss 3.6748 (3.5953)	Entropy 1.27135 (1.29898)	Top-1 acc 39.453 (39.104)	Top-5 acc 64.844 (63.231)	lr 0.02418
Train [14][3040/3239]	Time 0.592 (0.871)	Data Time 0.001 (0.009)	Loss 3.6597 (3.5954)	Entropy 1.27076 (1.29889)	Top-1 acc 38.281 (39.107)	Top-5 acc 62.500 (63.231)	lr 0.02418
Train [14][3050/3239]	Time 0.570 (0.878)	Data Time 0.002 (0.009)	Loss 3.4871 (3.5953)	Entropy 1.27040 (1.29880)	Top-1 acc 37.891 (39.107)	Top-5 acc 65.625 (63.231)	lr 0.02418
Train [14][3060/3239]	Time 0.594 (0.878)	Data Time 0.003 (0.009)	Loss 3.5161 (3.5950)	Entropy 1.27017 (1.29870)	Top-1 acc 39.453 (39.116)	Top-5 acc 66.797 (63.238)	lr 0.02418
Train [14][3070/3239]	Time 0.555 (0.878)	Data Time 0.001 (0.008)	Loss 3.7582 (3.5952)	Entropy 1.27002 (1.29861)	Top-1 acc 35.547 (39.114)	Top-5 acc 60.547 (63.237)	lr 0.02418
Train [14][3080/3239]	Time 0.582 (0.878)	Data Time 0.002 (0.008)	Loss 3.5592 (3.5951)	Entropy 1.26987 (1.29852)	Top-1 acc 39.453 (39.119)	Top-5 acc 64.844 (63.238)	lr 0.02418
Train [14][3090/3239]	Time 0.669 (0.878)	Data Time 0.002 (0.008)	Loss 3.6824 (3.5952)	Entropy 1.26992 (1.29842)	Top-1 acc 34.375 (39.117)	Top-5 acc 64.453 (63.235)	lr 0.02418
Train [14][3100/3239]	Time 0.577 (0.877)	Data Time 0.001 (0.008)	Loss 3.5928 (3.5953)	Entropy 1.26961 (1.29833)	Top-1 acc 42.969 (39.116)	Top-5 acc 67.578 (63.237)	lr 0.02417
Train [14][3110/3239]	Time 0.553 (0.877)	Data Time 0.002 (0.008)	Loss 3.5518 (3.5953)	Entropy 1.26951 (1.29824)	Top-1 acc 40.234 (39.121)	Top-5 acc 62.109 (63.238)	lr 0.02417
Train [14][3120/3239]	Time 0.603 (0.877)	Data Time 0.001 (0.008)	Loss 3.7613 (3.5954)	Entropy 1.26942 (1.29815)	Top-1 acc 35.547 (39.118)	Top-5 acc 61.328 (63.231)	lr 0.02417
Train [14][3130/3239]	Time 0.558 (0.877)	Data Time 0.001 (0.008)	Loss 3.6069 (3.5957)	Entropy 1.26924 (1.29806)	Top-1 acc 37.109 (39.111)	Top-5 acc 62.500 (63.226)	lr 0.02417
Train [14][3140/3239]	Time 0.578 (0.877)	Data Time 0.001 (0.008)	Loss 3.5884 (3.5958)	Entropy 1.26888 (1.29796)	Top-1 acc 38.281 (39.111)	Top-5 acc 64.453 (63.225)	lr 0.02417
Train [14][3150/3239]	Time 0.612 (0.877)	Data Time 0.001 (0.008)	Loss 3.5587 (3.5956)	Entropy 1.26852 (1.29787)	Top-1 acc 39.062 (39.113)	Top-5 acc 63.672 (63.225)	lr 0.02417
Train [14][3160/3239]	Time 0.701 (0.877)	Data Time 0.002 (0.008)	Loss 3.4406 (3.5954)	Entropy 1.26841 (1.29778)	Top-1 acc 42.969 (39.120)	Top-5 acc 66.406 (63.231)	lr 0.02417
Train [14][3170/3239]	Time 0.471 (0.877)	Data Time 0.001 (0.008)	Loss 3.5291 (3.5953)	Entropy 1.26812 (1.29768)	Top-1 acc 41.797 (39.122)	Top-5 acc 61.719 (63.229)	lr 0.02417
Train [14][3180/3239]	Time 0.564 (0.877)	Data Time 0.000 (0.008)	Loss 3.5195 (3.5951)	Entropy 1.26779 (1.29759)	Top-1 acc 39.844 (39.124)	Top-5 acc 68.359 (63.237)	lr 0.02417
Train [14][3190/3239]	Time 0.533 (0.876)	Data Time 0.000 (0.008)	Loss 3.6993 (3.5953)	Entropy 1.26750 (1.29750)	Top-1 acc 36.328 (39.124)	Top-5 acc 58.594 (63.233)	lr 0.02417
Train [14][3200/3239]	Time 0.581 (0.876)	Data Time 0.000 (0.008)	Loss 3.5269 (3.5951)	Entropy 1.26725 (1.29740)	Top-1 acc 43.359 (39.128)	Top-5 acc 63.672 (63.239)	lr 0.02417
Train [14][3210/3239]	Time 0.545 (0.876)	Data Time 0.000 (0.008)	Loss 3.4992 (3.5951)	Entropy 1.26747 (1.29731)	Top-1 acc 39.453 (39.129)	Top-5 acc 63.281 (63.235)	lr 0.02417
Train [14][3220/3239]	Time 0.600 (0.876)	Data Time 0.000 (0.008)	Loss 3.5876 (3.5951)	Entropy 1.26767 (1.29722)	Top-1 acc 38.672 (39.128)	Top-5 acc 59.766 (63.235)	lr 0.02417
Train [14][3230/3239]	Time 0.537 (0.876)	Data Time 0.000 (0.008)	Loss 3.7004 (3.5950)	Entropy 1.26704 (1.29713)	Top-1 acc 37.891 (39.130)	Top-5 acc 60.547 (63.239)	lr 0.02417
Train [14][3239/3239]	Time 1.542 (0.876)	Data Time 0.000 (0.008)	Loss 3.6414 (3.5948)	Entropy 1.26723 (1.29704)	Top-1 acc 46.914 (39.133)	Top-5 acc 64.198 (63.241)	lr 0.02417
==========Valid [14/120]	loss 2.343	top-1 acc 49.122 (49.122)	top-5 acc 73.151	Train top-1 39.133	top-5 63.241	Entropy 1.26723	Latency-None: 0.000ms	Flops: 542.77M
Train [15][0/3239]	Time 21.486 (21.486)	Data Time 18.244 (18.244)	Loss 3.5031 (3.5031)	Entropy 1.26714 (1.26714)	Top-1 acc 39.844 (39.844)	Top-5 acc 63.281 (63.281)	lr 0.02417
Train [15][10/3239]	Time 0.648 (2.747)	Data Time 0.001 (1.660)	Loss 3.3368 (3.5397)	Entropy 1.26673 (1.26696)	Top-1 acc 46.094 (40.412)	Top-5 acc 64.844 (63.707)	lr 0.02417
Train [15][20/3239]	Time 0.624 (1.849)	Data Time 0.001 (0.870)	Loss 3.5195 (3.5325)	Entropy 1.26665 (1.26687)	Top-1 acc 41.016 (41.276)	Top-5 acc 62.891 (64.137)	lr 0.02417
Train [15][30/3239]	Time 0.598 (1.520)	Data Time 0.001 (0.590)	Loss 3.6600 (3.5277)	Entropy 1.26653 (1.26678)	Top-1 acc 38.281 (41.142)	Top-5 acc 64.062 (64.403)	lr 0.02417
Train [15][40/3239]	Time 0.561 (1.357)	Data Time 0.001 (0.447)	Loss 3.7669 (3.5338)	Entropy 1.26621 (1.26669)	Top-1 acc 35.938 (40.454)	Top-5 acc 55.469 (64.282)	lr 0.02417
Train [15][50/3239]	Time 0.595 (1.253)	Data Time 0.002 (0.359)	Loss 3.5616 (3.5342)	Entropy 1.26553 (1.26655)	Top-1 acc 42.188 (40.441)	Top-5 acc 64.062 (64.246)	lr 0.02417
Train [15][60/3239]	Time 0.595 (1.187)	Data Time 0.001 (0.301)	Loss 3.4058 (3.5280)	Entropy 1.26571 (1.26639)	Top-1 acc 41.406 (40.516)	Top-5 acc 68.750 (64.485)	lr 0.02417
Train [15][70/3239]	Time 0.618 (1.141)	Data Time 0.003 (0.259)	Loss 3.4409 (3.5313)	Entropy 1.26589 (1.26630)	Top-1 acc 41.406 (40.542)	Top-5 acc 66.797 (64.459)	lr 0.02417
Train [15][80/3239]	Time 0.617 (1.105)	Data Time 0.001 (0.227)	Loss 3.5357 (3.5285)	Entropy 1.26560 (1.26624)	Top-1 acc 44.922 (40.741)	Top-5 acc 65.234 (64.530)	lr 0.02417
Train [15][90/3239]	Time 0.534 (1.076)	Data Time 0.001 (0.202)	Loss 3.6128 (3.5278)	Entropy 1.26534 (1.26616)	Top-1 acc 39.844 (40.762)	Top-5 acc 65.234 (64.513)	lr 0.02417
Train [15][100/3239]	Time 0.660 (1.056)	Data Time 0.002 (0.182)	Loss 3.7957 (3.5341)	Entropy 1.26567 (1.26610)	Top-1 acc 37.109 (40.668)	Top-5 acc 57.422 (64.337)	lr 0.02417
Train [15][110/3239]	Time 0.577 (1.037)	Data Time 0.002 (0.166)	Loss 3.4968 (3.5366)	Entropy 1.26527 (1.26605)	Top-1 acc 41.016 (40.597)	Top-5 acc 64.062 (64.267)	lr 0.02417
Train [15][120/3239]	Time 0.598 (1.026)	Data Time 0.001 (0.152)	Loss 3.5237 (3.5426)	Entropy 1.26526 (1.26598)	Top-1 acc 41.797 (40.486)	Top-5 acc 66.406 (64.214)	lr 0.02417
Train [15][130/3239]	Time 0.564 (1.008)	Data Time 0.003 (0.141)	Loss 3.5316 (3.5483)	Entropy 1.26543 (1.26593)	Top-1 acc 43.359 (40.386)	Top-5 acc 63.281 (64.045)	lr 0.02417
Train [15][140/3239]	Time 0.620 (0.999)	Data Time 0.001 (0.131)	Loss 3.5902 (3.5442)	Entropy 1.26503 (1.26588)	Top-1 acc 37.109 (40.423)	Top-5 acc 62.500 (64.231)	lr 0.02416
Train [15][150/3239]	Time 0.696 (0.989)	Data Time 0.001 (0.123)	Loss 3.7291 (3.5461)	Entropy 1.26455 (1.26581)	Top-1 acc 36.719 (40.289)	Top-5 acc 59.766 (64.158)	lr 0.02416
Train [15][160/3239]	Time 0.585 (0.978)	Data Time 0.001 (0.115)	Loss 3.6334 (3.5502)	Entropy 1.26425 (1.26572)	Top-1 acc 41.016 (40.210)	Top-5 acc 62.109 (64.058)	lr 0.02416
Train [15][170/3239]	Time 0.613 (0.970)	Data Time 0.001 (0.108)	Loss 3.5944 (3.5522)	Entropy 1.26418 (1.26563)	Top-1 acc 39.062 (40.205)	Top-5 acc 62.500 (64.019)	lr 0.02416
Train [15][180/3239]	Time 0.651 (0.964)	Data Time 0.001 (0.103)	Loss 3.5993 (3.5543)	Entropy 1.26395 (1.26556)	Top-1 acc 40.234 (40.144)	Top-5 acc 62.500 (64.009)	lr 0.02416
Train [15][190/3239]	Time 0.563 (0.958)	Data Time 0.001 (0.097)	Loss 3.5104 (3.5553)	Entropy 1.26389 (1.26547)	Top-1 acc 39.453 (40.106)	Top-5 acc 65.234 (64.003)	lr 0.02416
Train [15][200/3239]	Time 0.586 (0.952)	Data Time 0.001 (0.093)	Loss 3.6241 (3.5545)	Entropy 1.26321 (1.26538)	Top-1 acc 41.016 (40.186)	Top-5 acc 61.328 (64.002)	lr 0.02416
Train [15][210/3239]	Time 0.571 (0.946)	Data Time 0.001 (0.088)	Loss 3.4178 (3.5547)	Entropy 1.26314 (1.26528)	Top-1 acc 44.141 (40.205)	Top-5 acc 64.062 (63.992)	lr 0.02416
Train [15][220/3239]	Time 0.694 (0.942)	Data Time 0.003 (0.084)	Loss 3.5399 (3.5530)	Entropy 1.26266 (1.26517)	Top-1 acc 36.328 (40.218)	Top-5 acc 60.156 (63.990)	lr 0.02416
Train [15][230/3239]	Time 0.591 (0.938)	Data Time 0.001 (0.081)	Loss 3.6863 (3.5544)	Entropy 1.26223 (1.26505)	Top-1 acc 41.016 (40.182)	Top-5 acc 60.547 (63.956)	lr 0.02416
Train [15][240/3239]	Time 0.587 (0.934)	Data Time 0.001 (0.077)	Loss 3.6462 (3.5549)	Entropy 1.26224 (1.26493)	Top-1 acc 37.500 (40.178)	Top-5 acc 61.719 (63.925)	lr 0.02416
Train [15][250/3239]	Time 0.567 (0.930)	Data Time 0.001 (0.074)	Loss 3.5991 (3.5541)	Entropy 1.26208 (1.26483)	Top-1 acc 35.938 (40.200)	Top-5 acc 64.062 (63.933)	lr 0.02416
Train [15][260/3239]	Time 0.573 (0.927)	Data Time 0.001 (0.072)	Loss 3.4312 (3.5549)	Entropy 1.26200 (1.26472)	Top-1 acc 43.750 (40.145)	Top-5 acc 65.625 (63.887)	lr 0.02416
Train [15][270/3239]	Time 0.612 (0.925)	Data Time 0.001 (0.069)	Loss 3.5879 (3.5548)	Entropy 1.26205 (1.26462)	Top-1 acc 42.578 (40.138)	Top-5 acc 63.281 (63.907)	lr 0.02416
Train [15][280/3239]	Time 0.595 (0.921)	Data Time 0.002 (0.067)	Loss 3.7109 (3.5572)	Entropy 1.26210 (1.26453)	Top-1 acc 39.453 (40.094)	Top-5 acc 61.328 (63.887)	lr 0.02416
Train [15][290/3239]	Time 0.675 (0.918)	Data Time 0.001 (0.065)	Loss 3.5472 (3.5588)	Entropy 1.26211 (1.26445)	Top-1 acc 41.797 (40.008)	Top-5 acc 66.406 (63.846)	lr 0.02416
Train [15][300/3239]	Time 0.604 (0.914)	Data Time 0.002 (0.062)	Loss 3.6197 (3.5574)	Entropy 1.26210 (1.26437)	Top-1 acc 37.500 (40.011)	Top-5 acc 64.062 (63.886)	lr 0.02416
Train [15][310/3239]	Time 0.604 (0.912)	Data Time 0.001 (0.061)	Loss 3.3768 (3.5577)	Entropy 1.26204 (1.26430)	Top-1 acc 42.969 (40.011)	Top-5 acc 66.016 (63.909)	lr 0.02416
Train [15][320/3239]	Time 0.613 (0.910)	Data Time 0.001 (0.059)	Loss 3.4219 (3.5563)	Entropy 1.26205 (1.26423)	Top-1 acc 42.578 (40.055)	Top-5 acc 67.969 (63.938)	lr 0.02416
Train [15][330/3239]	Time 0.598 (0.908)	Data Time 0.001 (0.057)	Loss 3.3351 (3.5557)	Entropy 1.26171 (1.26416)	Top-1 acc 45.312 (40.094)	Top-5 acc 67.188 (63.973)	lr 0.02416
Train [15][340/3239]	Time 0.556 (0.907)	Data Time 0.001 (0.055)	Loss 3.3302 (3.5543)	Entropy 1.26183 (1.26408)	Top-1 acc 46.094 (40.112)	Top-5 acc 65.625 (63.985)	lr 0.02416
Train [15][350/3239]	Time 0.632 (0.905)	Data Time 0.001 (0.054)	Loss 3.3248 (3.5539)	Entropy 1.26183 (1.26402)	Top-1 acc 44.531 (40.102)	Top-5 acc 67.969 (63.986)	lr 0.02416
Train [15][360/3239]	Time 0.609 (0.904)	Data Time 0.001 (0.052)	Loss 3.6552 (3.5536)	Entropy 1.26209 (1.26396)	Top-1 acc 36.719 (40.113)	Top-5 acc 62.109 (64.002)	lr 0.02416
Train [15][370/3239]	Time 0.562 (0.902)	Data Time 0.001 (0.051)	Loss 3.5583 (3.5539)	Entropy 1.26172 (1.26391)	Top-1 acc 41.016 (40.115)	Top-5 acc 64.453 (64.006)	lr 0.02416
Train [15][380/3239]	Time 0.694 (0.901)	Data Time 0.001 (0.050)	Loss 3.3985 (3.5545)	Entropy 1.26179 (1.26385)	Top-1 acc 41.016 (40.093)	Top-5 acc 67.578 (63.993)	lr 0.02416
Train [15][390/3239]	Time 0.635 (0.900)	Data Time 0.001 (0.049)	Loss 3.4753 (3.5536)	Entropy 1.26195 (1.26380)	Top-1 acc 42.188 (40.105)	Top-5 acc 63.672 (64.025)	lr 0.02416
Train [15][400/3239]	Time 0.610 (0.898)	Data Time 0.001 (0.047)	Loss 3.6191 (3.5548)	Entropy 1.26153 (1.26375)	Top-1 acc 37.109 (40.132)	Top-5 acc 64.453 (63.997)	lr 0.02416
Train [15][410/3239]	Time 0.586 (0.897)	Data Time 0.001 (0.046)	Loss 3.4979 (3.5549)	Entropy 1.26128 (1.26369)	Top-1 acc 41.406 (40.135)	Top-5 acc 62.500 (63.995)	lr 0.02415
Train [15][420/3239]	Time 0.560 (0.896)	Data Time 0.001 (0.045)	Loss 3.6047 (3.5531)	Entropy 1.26112 (1.26363)	Top-1 acc 42.188 (40.145)	Top-5 acc 66.016 (64.042)	lr 0.02415
Train [15][430/3239]	Time 0.656 (0.895)	Data Time 0.001 (0.044)	Loss 3.3594 (3.5516)	Entropy 1.26097 (1.26357)	Top-1 acc 42.969 (40.162)	Top-5 acc 71.094 (64.062)	lr 0.02415
Train [15][440/3239]	Time 0.667 (0.893)	Data Time 0.002 (0.043)	Loss 3.3994 (3.5518)	Entropy 1.26088 (1.26351)	Top-1 acc 44.141 (40.167)	Top-5 acc 68.750 (64.070)	lr 0.02415
Train [15][450/3239]	Time 0.667 (0.892)	Data Time 0.001 (0.042)	Loss 3.7189 (3.5525)	Entropy 1.26063 (1.26346)	Top-1 acc 36.328 (40.154)	Top-5 acc 60.547 (64.036)	lr 0.02415
Train [15][460/3239]	Time 0.742 (0.931)	Data Time 0.005 (0.042)	Loss 3.6447 (3.5542)	Entropy 1.26053 (1.26339)	Top-1 acc 41.406 (40.117)	Top-5 acc 61.328 (64.011)	lr 0.02415
Train [15][470/3239]	Time 0.587 (0.931)	Data Time 0.002 (0.041)	Loss 3.4789 (3.5544)	Entropy 1.26015 (1.26333)	Top-1 acc 42.969 (40.103)	Top-5 acc 61.328 (63.998)	lr 0.02415
Train [15][480/3239]	Time 0.609 (0.929)	Data Time 0.002 (0.040)	Loss 3.4262 (3.5551)	Entropy 1.25970 (1.26326)	Top-1 acc 41.016 (40.079)	Top-5 acc 65.234 (63.998)	lr 0.02415
Train [15][490/3239]	Time 0.554 (0.927)	Data Time 0.001 (0.039)	Loss 3.5524 (3.5548)	Entropy 1.25972 (1.26319)	Top-1 acc 41.406 (40.078)	Top-5 acc 65.234 (64.029)	lr 0.02415
Train [15][500/3239]	Time 0.535 (0.926)	Data Time 0.001 (0.038)	Loss 3.6262 (3.5555)	Entropy 1.25994 (1.26312)	Top-1 acc 41.797 (40.073)	Top-5 acc 63.281 (64.016)	lr 0.02415
Train [15][510/3239]	Time 0.599 (0.924)	Data Time 0.001 (0.038)	Loss 3.3776 (3.5571)	Entropy 1.26008 (1.26306)	Top-1 acc 40.234 (40.016)	Top-5 acc 63.281 (63.980)	lr 0.02415
Train [15][520/3239]	Time 0.585 (0.923)	Data Time 0.001 (0.037)	Loss 3.7254 (3.5557)	Entropy 1.25946 (1.26300)	Top-1 acc 35.547 (40.063)	Top-5 acc 59.766 (64.003)	lr 0.02415
Train [15][530/3239]	Time 0.583 (0.921)	Data Time 0.001 (0.036)	Loss 3.5224 (3.5554)	Entropy 1.25954 (1.26293)	Top-1 acc 39.453 (40.058)	Top-5 acc 61.719 (63.998)	lr 0.02415
Train [15][540/3239]	Time 0.596 (0.920)	Data Time 0.001 (0.036)	Loss 3.3731 (3.5547)	Entropy 1.25956 (1.26287)	Top-1 acc 46.484 (40.079)	Top-5 acc 64.844 (64.008)	lr 0.02415
Train [15][550/3239]	Time 0.559 (0.918)	Data Time 0.001 (0.035)	Loss 3.4489 (3.5546)	Entropy 1.25927 (1.26281)	Top-1 acc 43.750 (40.095)	Top-5 acc 67.188 (64.017)	lr 0.02415
Train [15][560/3239]	Time 0.535 (0.917)	Data Time 0.001 (0.035)	Loss 3.6675 (3.5548)	Entropy 1.25894 (1.26274)	Top-1 acc 37.109 (40.079)	Top-5 acc 62.109 (64.024)	lr 0.02415
Train [15][570/3239]	Time 0.616 (0.916)	Data Time 0.001 (0.034)	Loss 3.5669 (3.5549)	Entropy 1.25912 (1.26267)	Top-1 acc 35.938 (40.063)	Top-5 acc 61.328 (64.005)	lr 0.02415
Train [15][580/3239]	Time 0.631 (0.914)	Data Time 0.001 (0.033)	Loss 3.4022 (3.5536)	Entropy 1.25875 (1.26261)	Top-1 acc 42.969 (40.082)	Top-5 acc 67.188 (64.028)	lr 0.02415
Train [15][590/3239]	Time 0.595 (0.913)	Data Time 0.001 (0.033)	Loss 3.6846 (3.5542)	Entropy 1.25884 (1.26254)	Top-1 acc 33.984 (40.051)	Top-5 acc 58.984 (64.004)	lr 0.02415
Train [15][600/3239]	Time 0.550 (0.911)	Data Time 0.001 (0.032)	Loss 3.7416 (3.5544)	Entropy 1.25833 (1.26248)	Top-1 acc 33.203 (40.037)	Top-5 acc 56.641 (63.999)	lr 0.02415
Train [15][610/3239]	Time 0.703 (0.910)	Data Time 0.001 (0.032)	Loss 3.4886 (3.5558)	Entropy 1.25857 (1.26241)	Top-1 acc 42.188 (40.002)	Top-5 acc 67.969 (63.984)	lr 0.02415
Train [15][620/3239]	Time 0.627 (0.909)	Data Time 0.002 (0.031)	Loss 3.8213 (3.5557)	Entropy 1.25849 (1.26235)	Top-1 acc 37.500 (40.019)	Top-5 acc 61.328 (63.995)	lr 0.02415
Train [15][630/3239]	Time 0.621 (0.907)	Data Time 0.001 (0.031)	Loss 3.5564 (3.5560)	Entropy 1.25823 (1.26229)	Top-1 acc 40.234 (40.002)	Top-5 acc 65.234 (63.999)	lr 0.02415
Train [15][640/3239]	Time 0.618 (0.906)	Data Time 0.001 (0.031)	Loss 3.3582 (3.5560)	Entropy 1.25832 (1.26223)	Top-1 acc 44.922 (40.003)	Top-5 acc 71.484 (64.005)	lr 0.02415
Train [15][650/3239]	Time 0.570 (0.905)	Data Time 0.001 (0.030)	Loss 3.4818 (3.5555)	Entropy 1.25787 (1.26217)	Top-1 acc 41.406 (40.024)	Top-5 acc 65.625 (64.022)	lr 0.02415
Train [15][660/3239]	Time 0.628 (0.904)	Data Time 0.001 (0.030)	Loss 3.7175 (3.5561)	Entropy 1.25759 (1.26210)	Top-1 acc 37.891 (40.019)	Top-5 acc 62.109 (64.023)	lr 0.02415
Train [15][670/3239]	Time 0.611 (0.904)	Data Time 0.001 (0.029)	Loss 3.5323 (3.5559)	Entropy 1.25725 (1.26203)	Top-1 acc 39.844 (40.022)	Top-5 acc 64.844 (64.032)	lr 0.02415
Train [15][680/3239]	Time 0.699 (0.903)	Data Time 0.001 (0.029)	Loss 3.5676 (3.5557)	Entropy 1.25714 (1.26196)	Top-1 acc 39.453 (40.028)	Top-5 acc 64.453 (64.045)	lr 0.02414
Train [15][690/3239]	Time 0.590 (0.902)	Data Time 0.001 (0.028)	Loss 3.6116 (3.5562)	Entropy 1.25696 (1.26189)	Top-1 acc 41.016 (40.024)	Top-5 acc 63.672 (64.039)	lr 0.02414
Train [15][700/3239]	Time 0.617 (0.901)	Data Time 0.001 (0.028)	Loss 3.6542 (3.5583)	Entropy 1.25694 (1.26182)	Top-1 acc 37.109 (39.984)	Top-5 acc 64.844 (64.005)	lr 0.02414
Train [15][710/3239]	Time 0.597 (0.901)	Data Time 0.001 (0.028)	Loss 3.6271 (3.5587)	Entropy 1.25664 (1.26175)	Top-1 acc 40.625 (39.966)	Top-5 acc 61.719 (64.010)	lr 0.02414
Train [15][720/3239]	Time 0.546 (0.900)	Data Time 0.001 (0.027)	Loss 3.5333 (3.5594)	Entropy 1.25624 (1.26168)	Top-1 acc 41.016 (39.959)	Top-5 acc 63.672 (64.002)	lr 0.02414
Train [15][730/3239]	Time 0.604 (0.900)	Data Time 0.001 (0.027)	Loss 3.6856 (3.5594)	Entropy 1.25612 (1.26160)	Top-1 acc 36.719 (39.948)	Top-5 acc 61.719 (64.000)	lr 0.02414
Train [15][740/3239]	Time 0.624 (0.899)	Data Time 0.001 (0.027)	Loss 3.4105 (3.5592)	Entropy 1.25576 (1.26153)	Top-1 acc 44.922 (39.951)	Top-5 acc 65.625 (63.998)	lr 0.02414
Train [15][750/3239]	Time 0.706 (0.898)	Data Time 0.002 (0.026)	Loss 3.6488 (3.5600)	Entropy 1.25514 (1.26145)	Top-1 acc 37.891 (39.936)	Top-5 acc 59.375 (63.975)	lr 0.02414
Train [15][760/3239]	Time 0.442 (0.897)	Data Time 0.001 (0.026)	Loss 3.5261 (3.5607)	Entropy 1.25508 (1.26136)	Top-1 acc 40.625 (39.937)	Top-5 acc 64.062 (63.960)	lr 0.02414
Train [15][770/3239]	Time 0.571 (0.896)	Data Time 0.001 (0.026)	Loss 3.5791 (3.5605)	Entropy 1.25488 (1.26128)	Top-1 acc 40.625 (39.943)	Top-5 acc 64.844 (63.966)	lr 0.02414
Train [15][780/3239]	Time 0.535 (0.894)	Data Time 0.001 (0.025)	Loss 3.5921 (3.5605)	Entropy 1.25476 (1.26120)	Top-1 acc 38.281 (39.944)	Top-5 acc 64.062 (63.966)	lr 0.02414
Train [15][790/3239]	Time 0.518 (0.892)	Data Time 0.002 (0.025)	Loss 3.6441 (3.5608)	Entropy 1.25420 (1.26112)	Top-1 acc 41.797 (39.943)	Top-5 acc 60.938 (63.957)	lr 0.02414
Train [15][800/3239]	Time 0.603 (0.891)	Data Time 0.001 (0.025)	Loss 3.5428 (3.5602)	Entropy 1.25449 (1.26103)	Top-1 acc 38.672 (39.942)	Top-5 acc 61.328 (63.965)	lr 0.02414
Train [15][810/3239]	Time 0.578 (0.891)	Data Time 0.001 (0.025)	Loss 3.4736 (3.5606)	Entropy 1.25426 (1.26095)	Top-1 acc 41.016 (39.920)	Top-5 acc 68.359 (63.949)	lr 0.02414
Train [15][820/3239]	Time 0.689 (0.890)	Data Time 0.001 (0.024)	Loss 3.5806 (3.5605)	Entropy 1.25456 (1.26087)	Top-1 acc 38.281 (39.931)	Top-5 acc 64.453 (63.962)	lr 0.02414
Train [15][830/3239]	Time 0.613 (0.890)	Data Time 0.001 (0.024)	Loss 3.4650 (3.5603)	Entropy 1.25424 (1.26079)	Top-1 acc 40.625 (39.940)	Top-5 acc 66.406 (63.968)	lr 0.02414
Train [15][840/3239]	Time 0.583 (0.889)	Data Time 0.001 (0.024)	Loss 3.3839 (3.5602)	Entropy 1.25421 (1.26072)	Top-1 acc 46.484 (39.946)	Top-5 acc 69.141 (63.967)	lr 0.02414
Train [15][850/3239]	Time 0.619 (0.889)	Data Time 0.001 (0.023)	Loss 3.6354 (3.5602)	Entropy 1.25427 (1.26064)	Top-1 acc 40.625 (39.950)	Top-5 acc 64.453 (63.969)	lr 0.02414
Train [15][860/3239]	Time 0.586 (0.888)	Data Time 0.001 (0.023)	Loss 3.5947 (3.5605)	Entropy 1.25401 (1.26056)	Top-1 acc 39.844 (39.962)	Top-5 acc 65.625 (63.961)	lr 0.02414
Train [15][870/3239]	Time 0.613 (0.888)	Data Time 0.001 (0.023)	Loss 3.3896 (3.5608)	Entropy 1.25368 (1.26049)	Top-1 acc 41.797 (39.950)	Top-5 acc 67.578 (63.958)	lr 0.02414
Train [15][880/3239]	Time 0.585 (0.887)	Data Time 0.001 (0.023)	Loss 3.5337 (3.5608)	Entropy 1.25383 (1.26041)	Top-1 acc 41.406 (39.954)	Top-5 acc 63.281 (63.946)	lr 0.02414
Train [15][890/3239]	Time 0.606 (0.887)	Data Time 0.001 (0.023)	Loss 3.5097 (3.5605)	Entropy 1.25378 (1.26034)	Top-1 acc 46.484 (39.967)	Top-5 acc 65.234 (63.958)	lr 0.02414
Train [15][900/3239]	Time 0.612 (0.887)	Data Time 0.001 (0.022)	Loss 3.5899 (3.5597)	Entropy 1.25369 (1.26026)	Top-1 acc 37.500 (39.987)	Top-5 acc 64.062 (63.975)	lr 0.02414
Train [15][910/3239]	Time 0.518 (0.886)	Data Time 0.001 (0.022)	Loss 3.5632 (3.5595)	Entropy 1.25363 (1.26019)	Top-1 acc 44.141 (39.990)	Top-5 acc 60.547 (63.980)	lr 0.02414
Train [15][920/3239]	Time 0.602 (0.886)	Data Time 0.001 (0.022)	Loss 3.4795 (3.5588)	Entropy 1.25361 (1.26012)	Top-1 acc 41.797 (39.998)	Top-5 acc 65.625 (63.991)	lr 0.02414
Train [15][930/3239]	Time 0.624 (0.885)	Data Time 0.001 (0.022)	Loss 3.6149 (3.5584)	Entropy 1.25349 (1.26005)	Top-1 acc 39.062 (40.014)	Top-5 acc 63.281 (63.997)	lr 0.02414
Train [15][940/3239]	Time 0.603 (0.885)	Data Time 0.001 (0.021)	Loss 3.7253 (3.5581)	Entropy 1.25329 (1.25998)	Top-1 acc 33.203 (40.015)	Top-5 acc 62.109 (64.011)	lr 0.02414
Train [15][950/3239]	Time 0.580 (0.884)	Data Time 0.001 (0.021)	Loss 3.3771 (3.5579)	Entropy 1.25354 (1.25991)	Top-1 acc 39.453 (40.008)	Top-5 acc 66.797 (64.016)	lr 0.02414
Train [15][960/3239]	Time 0.610 (0.883)	Data Time 0.003 (0.021)	Loss 3.4774 (3.5580)	Entropy 1.25329 (1.25984)	Top-1 acc 42.188 (40.010)	Top-5 acc 65.234 (64.022)	lr 0.02413
Train [15][970/3239]	Time 0.620 (0.883)	Data Time 0.001 (0.021)	Loss 3.4510 (3.5583)	Entropy 1.25339 (1.25977)	Top-1 acc 42.578 (39.999)	Top-5 acc 63.672 (64.007)	lr 0.02413
Train [15][980/3239]	Time 0.665 (0.882)	Data Time 0.001 (0.021)	Loss 3.6340 (3.5584)	Entropy 1.25305 (1.25971)	Top-1 acc 40.234 (39.988)	Top-5 acc 61.328 (64.004)	lr 0.02413
Train [15][990/3239]	Time 0.635 (0.882)	Data Time 0.001 (0.020)	Loss 3.3816 (3.5582)	Entropy 1.25296 (1.25964)	Top-1 acc 41.406 (39.989)	Top-5 acc 66.797 (64.013)	lr 0.02413
Train [15][1000/3239]	Time 0.574 (0.881)	Data Time 0.001 (0.020)	Loss 3.6201 (3.5581)	Entropy 1.25281 (1.25957)	Top-1 acc 38.281 (39.987)	Top-5 acc 62.109 (64.011)	lr 0.02413
Train [15][1010/3239]	Time 0.602 (0.881)	Data Time 0.001 (0.020)	Loss 3.5918 (3.5579)	Entropy 1.25294 (1.25951)	Top-1 acc 38.672 (39.985)	Top-5 acc 62.500 (64.015)	lr 0.02413
Train [15][1020/3239]	Time 0.569 (0.881)	Data Time 0.001 (0.020)	Loss 3.4484 (3.5581)	Entropy 1.25281 (1.25944)	Top-1 acc 42.188 (39.987)	Top-5 acc 66.797 (64.008)	lr 0.02413
Train [15][1030/3239]	Time 0.600 (0.880)	Data Time 0.001 (0.020)	Loss 3.5358 (3.5582)	Entropy 1.25273 (1.25938)	Top-1 acc 41.797 (39.980)	Top-5 acc 62.500 (64.006)	lr 0.02413
Train [15][1040/3239]	Time 0.601 (0.880)	Data Time 0.001 (0.020)	Loss 3.4336 (3.5579)	Entropy 1.25299 (1.25931)	Top-1 acc 42.969 (39.989)	Top-5 acc 67.578 (64.011)	lr 0.02413
Train [15][1050/3239]	Time 0.652 (0.879)	Data Time 0.001 (0.019)	Loss 3.5831 (3.5579)	Entropy 1.25297 (1.25925)	Top-1 acc 39.453 (39.985)	Top-5 acc 65.234 (64.013)	lr 0.02413
Train [15][1060/3239]	Time 0.604 (0.879)	Data Time 0.001 (0.019)	Loss 3.5062 (3.5576)	Entropy 1.25311 (1.25919)	Top-1 acc 39.062 (39.973)	Top-5 acc 64.844 (64.019)	lr 0.02413
Train [15][1070/3239]	Time 0.571 (0.879)	Data Time 0.001 (0.019)	Loss 3.6986 (3.5576)	Entropy 1.25297 (1.25914)	Top-1 acc 36.328 (39.971)	Top-5 acc 62.891 (64.027)	lr 0.02413
Train [15][1080/3239]	Time 0.570 (0.879)	Data Time 0.001 (0.019)	Loss 3.7976 (3.5582)	Entropy 1.25278 (1.25908)	Top-1 acc 35.547 (39.963)	Top-5 acc 58.984 (64.019)	lr 0.02413
Train [15][1090/3239]	Time 0.588 (0.878)	Data Time 0.001 (0.019)	Loss 3.5246 (3.5585)	Entropy 1.25258 (1.25902)	Top-1 acc 41.797 (39.962)	Top-5 acc 63.672 (64.016)	lr 0.02413
Train [15][1100/3239]	Time 0.597 (0.878)	Data Time 0.001 (0.019)	Loss 3.6320 (3.5589)	Entropy 1.25218 (1.25896)	Top-1 acc 35.938 (39.948)	Top-5 acc 64.062 (64.015)	lr 0.02413
Train [15][1110/3239]	Time 0.592 (0.878)	Data Time 0.001 (0.018)	Loss 3.3571 (3.5589)	Entropy 1.25199 (1.25890)	Top-1 acc 42.969 (39.950)	Top-5 acc 69.922 (64.009)	lr 0.02413
Train [15][1120/3239]	Time 0.581 (0.895)	Data Time 0.002 (0.018)	Loss 3.5571 (3.5587)	Entropy 1.25181 (1.25884)	Top-1 acc 40.234 (39.945)	Top-5 acc 60.938 (64.005)	lr 0.02413
Train [15][1130/3239]	Time 0.597 (0.895)	Data Time 0.001 (0.018)	Loss 3.4459 (3.5587)	Entropy 1.25137 (1.25878)	Top-1 acc 44.531 (39.956)	Top-5 acc 66.797 (63.998)	lr 0.02413
Train [15][1140/3239]	Time 0.601 (0.895)	Data Time 0.002 (0.018)	Loss 3.6336 (3.5589)	Entropy 1.25136 (1.25871)	Top-1 acc 38.672 (39.959)	Top-5 acc 64.453 (63.991)	lr 0.02413
Train [15][1150/3239]	Time 0.545 (0.894)	Data Time 0.001 (0.018)	Loss 3.8171 (3.5589)	Entropy 1.25133 (1.25865)	Top-1 acc 35.547 (39.957)	Top-5 acc 60.156 (63.995)	lr 0.02413
Train [15][1160/3239]	Time 0.635 (0.894)	Data Time 0.001 (0.018)	Loss 3.7197 (3.5591)	Entropy 1.25092 (1.25858)	Top-1 acc 41.406 (39.953)	Top-5 acc 59.375 (63.985)	lr 0.02413
Train [15][1170/3239]	Time 0.568 (0.893)	Data Time 0.001 (0.018)	Loss 3.6157 (3.5592)	Entropy 1.25100 (1.25852)	Top-1 acc 36.328 (39.947)	Top-5 acc 61.719 (63.981)	lr 0.02413
Train [15][1180/3239]	Time 0.588 (0.893)	Data Time 0.001 (0.018)	Loss 3.8181 (3.5592)	Entropy 1.25083 (1.25845)	Top-1 acc 33.594 (39.941)	Top-5 acc 58.594 (63.976)	lr 0.02413
Train [15][1190/3239]	Time 0.547 (0.892)	Data Time 0.001 (0.017)	Loss 3.3906 (3.5592)	Entropy 1.25056 (1.25839)	Top-1 acc 45.703 (39.942)	Top-5 acc 67.188 (63.977)	lr 0.02413
Train [15][1200/3239]	Time 0.615 (0.892)	Data Time 0.001 (0.017)	Loss 3.5538 (3.5587)	Entropy 1.25031 (1.25832)	Top-1 acc 38.672 (39.945)	Top-5 acc 61.719 (63.976)	lr 0.02413
Train [15][1210/3239]	Time 0.584 (0.892)	Data Time 0.001 (0.017)	Loss 3.6692 (3.5590)	Entropy 1.25024 (1.25826)	Top-1 acc 37.891 (39.938)	Top-5 acc 60.156 (63.972)	lr 0.02413
Train [15][1220/3239]	Time 0.541 (0.891)	Data Time 0.001 (0.017)	Loss 3.6610 (3.5592)	Entropy 1.25022 (1.25819)	Top-1 acc 36.328 (39.933)	Top-5 acc 61.328 (63.965)	lr 0.02413
Train [15][1230/3239]	Time 0.612 (0.891)	Data Time 0.001 (0.017)	Loss 3.5830 (3.5594)	Entropy 1.25050 (1.25813)	Top-1 acc 41.406 (39.937)	Top-5 acc 63.672 (63.960)	lr 0.02412
Train [15][1240/3239]	Time 0.576 (0.890)	Data Time 0.001 (0.017)	Loss 3.3987 (3.5597)	Entropy 1.25042 (1.25807)	Top-1 acc 42.969 (39.925)	Top-5 acc 67.578 (63.952)	lr 0.02412
Train [15][1250/3239]	Time 0.476 (0.890)	Data Time 0.002 (0.017)	Loss 3.3595 (3.5593)	Entropy 1.25009 (1.25800)	Top-1 acc 42.578 (39.929)	Top-5 acc 68.359 (63.955)	lr 0.02412
Train [15][1260/3239]	Time 0.639 (0.889)	Data Time 0.001 (0.017)	Loss 3.4070 (3.5595)	Entropy 1.24993 (1.25794)	Top-1 acc 41.016 (39.918)	Top-5 acc 68.750 (63.950)	lr 0.02412
Train [15][1270/3239]	Time 0.547 (0.889)	Data Time 0.001 (0.016)	Loss 3.5068 (3.5589)	Entropy 1.25007 (1.25788)	Top-1 acc 42.188 (39.933)	Top-5 acc 66.016 (63.962)	lr 0.02412
Train [15][1280/3239]	Time 0.725 (0.888)	Data Time 0.001 (0.016)	Loss 3.3854 (3.5588)	Entropy 1.24996 (1.25781)	Top-1 acc 40.625 (39.936)	Top-5 acc 63.672 (63.958)	lr 0.02412
Train [15][1290/3239]	Time 0.580 (0.888)	Data Time 0.001 (0.016)	Loss 3.7511 (3.5587)	Entropy 1.24984 (1.25775)	Top-1 acc 35.547 (39.936)	Top-5 acc 58.984 (63.956)	lr 0.02412
Train [15][1300/3239]	Time 0.581 (0.888)	Data Time 0.001 (0.016)	Loss 3.5061 (3.5588)	Entropy 1.24974 (1.25769)	Top-1 acc 39.062 (39.935)	Top-5 acc 64.453 (63.953)	lr 0.02412
Train [15][1310/3239]	Time 0.612 (0.887)	Data Time 0.001 (0.016)	Loss 3.6716 (3.5588)	Entropy 1.25009 (1.25763)	Top-1 acc 42.969 (39.943)	Top-5 acc 60.547 (63.952)	lr 0.02412
Train [15][1320/3239]	Time 0.623 (0.887)	Data Time 0.001 (0.016)	Loss 3.5298 (3.5590)	Entropy 1.24978 (1.25757)	Top-1 acc 39.062 (39.937)	Top-5 acc 63.281 (63.948)	lr 0.02412
Train [15][1330/3239]	Time 0.545 (0.887)	Data Time 0.001 (0.016)	Loss 3.5994 (3.5596)	Entropy 1.24997 (1.25752)	Top-1 acc 39.844 (39.922)	Top-5 acc 63.281 (63.933)	lr 0.02412
Train [15][1340/3239]	Time 0.618 (0.886)	Data Time 0.001 (0.016)	Loss 3.5276 (3.5595)	Entropy 1.24944 (1.25746)	Top-1 acc 39.453 (39.927)	Top-5 acc 67.969 (63.935)	lr 0.02412
Train [15][1350/3239]	Time 0.764 (0.886)	Data Time 0.001 (0.016)	Loss 3.6344 (3.5597)	Entropy 1.24905 (1.25740)	Top-1 acc 40.234 (39.919)	Top-5 acc 60.938 (63.932)	lr 0.02412
Train [15][1360/3239]	Time 0.604 (0.886)	Data Time 0.001 (0.015)	Loss 3.3452 (3.5593)	Entropy 1.24882 (1.25734)	Top-1 acc 42.578 (39.923)	Top-5 acc 70.312 (63.949)	lr 0.02412
Train [15][1370/3239]	Time 0.580 (0.885)	Data Time 0.001 (0.015)	Loss 3.6752 (3.5594)	Entropy 1.24849 (1.25727)	Top-1 acc 36.719 (39.913)	Top-5 acc 62.500 (63.947)	lr 0.02412
Train [15][1380/3239]	Time 0.588 (0.885)	Data Time 0.001 (0.015)	Loss 3.6672 (3.5597)	Entropy 1.24805 (1.25721)	Top-1 acc 36.328 (39.901)	Top-5 acc 59.375 (63.943)	lr 0.02412
Train [15][1390/3239]	Time 0.570 (0.885)	Data Time 0.002 (0.015)	Loss 3.5214 (3.5597)	Entropy 1.24781 (1.25714)	Top-1 acc 39.453 (39.900)	Top-5 acc 66.406 (63.955)	lr 0.02412
Train [15][1400/3239]	Time 0.613 (0.885)	Data Time 0.001 (0.015)	Loss 3.3422 (3.5594)	Entropy 1.24788 (1.25707)	Top-1 acc 44.531 (39.912)	Top-5 acc 67.578 (63.962)	lr 0.02412
Train [15][1410/3239]	Time 0.569 (0.885)	Data Time 0.001 (0.015)	Loss 3.5556 (3.5592)	Entropy 1.24751 (1.25701)	Top-1 acc 39.453 (39.909)	Top-5 acc 64.062 (63.961)	lr 0.02412
Train [15][1420/3239]	Time 0.588 (0.884)	Data Time 0.001 (0.015)	Loss 3.5116 (3.5587)	Entropy 1.24734 (1.25694)	Top-1 acc 43.750 (39.930)	Top-5 acc 65.234 (63.966)	lr 0.02412
Train [15][1430/3239]	Time 0.650 (0.884)	Data Time 0.001 (0.015)	Loss 3.6255 (3.5586)	Entropy 1.24770 (1.25687)	Top-1 acc 39.453 (39.931)	Top-5 acc 64.062 (63.966)	lr 0.02412
Train [15][1440/3239]	Time 0.663 (0.883)	Data Time 0.001 (0.015)	Loss 3.5847 (3.5589)	Entropy 1.24731 (1.25681)	Top-1 acc 41.016 (39.932)	Top-5 acc 60.938 (63.965)	lr 0.02412
Train [15][1450/3239]	Time 0.554 (0.883)	Data Time 0.001 (0.015)	Loss 3.6634 (3.5592)	Entropy 1.24754 (1.25674)	Top-1 acc 35.938 (39.920)	Top-5 acc 64.453 (63.963)	lr 0.02412
Train [15][1460/3239]	Time 0.656 (0.882)	Data Time 0.001 (0.015)	Loss 3.5547 (3.5588)	Entropy 1.24754 (1.25668)	Top-1 acc 40.234 (39.925)	Top-5 acc 63.281 (63.969)	lr 0.02412
Train [15][1470/3239]	Time 0.598 (0.882)	Data Time 0.001 (0.014)	Loss 3.4095 (3.5589)	Entropy 1.24770 (1.25662)	Top-1 acc 41.016 (39.912)	Top-5 acc 70.703 (63.972)	lr 0.02412
Train [15][1480/3239]	Time 0.564 (0.882)	Data Time 0.001 (0.014)	Loss 3.5934 (3.5589)	Entropy 1.24786 (1.25656)	Top-1 acc 41.797 (39.914)	Top-5 acc 64.062 (63.972)	lr 0.02412
Train [15][1490/3239]	Time 0.652 (0.882)	Data Time 0.003 (0.014)	Loss 3.3289 (3.5584)	Entropy 1.24706 (1.25650)	Top-1 acc 43.750 (39.923)	Top-5 acc 70.703 (63.981)	lr 0.02411
Train [15][1500/3239]	Time 0.653 (0.881)	Data Time 0.001 (0.014)	Loss 3.4552 (3.5581)	Entropy 1.24674 (1.25644)	Top-1 acc 42.969 (39.922)	Top-5 acc 67.969 (63.998)	lr 0.02411
Train [15][1510/3239]	Time 0.716 (0.881)	Data Time 0.002 (0.014)	Loss 3.7596 (3.5582)	Entropy 1.24683 (1.25637)	Top-1 acc 33.594 (39.925)	Top-5 acc 58.594 (63.994)	lr 0.02411
Train [15][1520/3239]	Time 0.604 (0.881)	Data Time 0.001 (0.014)	Loss 3.2897 (3.5582)	Entropy 1.24654 (1.25631)	Top-1 acc 42.188 (39.927)	Top-5 acc 67.969 (63.992)	lr 0.02411
Train [15][1530/3239]	Time 0.587 (0.881)	Data Time 0.001 (0.014)	Loss 3.6256 (3.5584)	Entropy 1.24623 (1.25624)	Top-1 acc 38.281 (39.917)	Top-5 acc 62.500 (63.986)	lr 0.02411
Train [15][1540/3239]	Time 0.581 (0.880)	Data Time 0.001 (0.014)	Loss 3.5078 (3.5577)	Entropy 1.24573 (1.25618)	Top-1 acc 40.625 (39.926)	Top-5 acc 64.062 (64.003)	lr 0.02411
Train [15][1550/3239]	Time 0.661 (0.880)	Data Time 0.003 (0.014)	Loss 3.6554 (3.5578)	Entropy 1.24587 (1.25611)	Top-1 acc 36.719 (39.923)	Top-5 acc 61.328 (64.005)	lr 0.02411
Train [15][1560/3239]	Time 0.559 (0.880)	Data Time 0.001 (0.014)	Loss 3.5799 (3.5581)	Entropy 1.24584 (1.25605)	Top-1 acc 44.922 (39.921)	Top-5 acc 64.844 (64.001)	lr 0.02411
Train [15][1570/3239]	Time 0.643 (0.880)	Data Time 0.001 (0.014)	Loss 3.6073 (3.5582)	Entropy 1.24573 (1.25598)	Top-1 acc 38.672 (39.921)	Top-5 acc 64.844 (63.999)	lr 0.02411
Train [15][1580/3239]	Time 0.670 (0.880)	Data Time 0.001 (0.014)	Loss 3.6694 (3.5582)	Entropy 1.24543 (1.25592)	Top-1 acc 35.938 (39.919)	Top-5 acc 64.453 (64.001)	lr 0.02411
Train [15][1590/3239]	Time 0.598 (0.879)	Data Time 0.001 (0.013)	Loss 3.3468 (3.5578)	Entropy 1.24497 (1.25585)	Top-1 acc 45.312 (39.932)	Top-5 acc 69.922 (64.007)	lr 0.02411
Train [15][1600/3239]	Time 0.559 (0.879)	Data Time 0.001 (0.013)	Loss 3.5337 (3.5582)	Entropy 1.24463 (1.25578)	Top-1 acc 40.234 (39.922)	Top-5 acc 63.281 (63.996)	lr 0.02411
Train [15][1610/3239]	Time 0.539 (0.879)	Data Time 0.001 (0.013)	Loss 3.4800 (3.5581)	Entropy 1.24461 (1.25571)	Top-1 acc 41.406 (39.925)	Top-5 acc 62.500 (63.997)	lr 0.02411
Train [15][1620/3239]	Time 0.597 (0.878)	Data Time 0.001 (0.013)	Loss 3.5166 (3.5579)	Entropy 1.24419 (1.25564)	Top-1 acc 42.188 (39.927)	Top-5 acc 64.844 (64.002)	lr 0.02411
Train [15][1630/3239]	Time 0.605 (0.878)	Data Time 0.001 (0.013)	Loss 3.5150 (3.5575)	Entropy 1.24395 (1.25557)	Top-1 acc 40.625 (39.937)	Top-5 acc 63.672 (64.015)	lr 0.02411
Train [15][1640/3239]	Time 0.612 (0.878)	Data Time 0.001 (0.013)	Loss 3.7720 (3.5577)	Entropy 1.24368 (1.25550)	Top-1 acc 33.594 (39.931)	Top-5 acc 60.547 (64.014)	lr 0.02411
Train [15][1650/3239]	Time 0.601 (0.878)	Data Time 0.001 (0.013)	Loss 3.8242 (3.5576)	Entropy 1.24310 (1.25543)	Top-1 acc 33.984 (39.938)	Top-5 acc 57.422 (64.017)	lr 0.02411
Train [15][1660/3239]	Time 0.602 (0.877)	Data Time 0.001 (0.013)	Loss 3.4120 (3.5575)	Entropy 1.24298 (1.25535)	Top-1 acc 44.531 (39.939)	Top-5 acc 68.750 (64.022)	lr 0.02411
Train [15][1670/3239]	Time 0.587 (0.877)	Data Time 0.001 (0.013)	Loss 3.6799 (3.5575)	Entropy 1.24303 (1.25528)	Top-1 acc 39.844 (39.939)	Top-5 acc 64.062 (64.022)	lr 0.02411
Train [15][1680/3239]	Time 0.618 (0.877)	Data Time 0.001 (0.013)	Loss 3.7623 (3.5577)	Entropy 1.24267 (1.25520)	Top-1 acc 35.938 (39.935)	Top-5 acc 59.766 (64.015)	lr 0.02411
Train [15][1690/3239]	Time 0.602 (0.877)	Data Time 0.001 (0.013)	Loss 3.7487 (3.5575)	Entropy 1.24260 (1.25513)	Top-1 acc 38.672 (39.945)	Top-5 acc 58.984 (64.019)	lr 0.02411
Train [15][1700/3239]	Time 0.586 (0.877)	Data Time 0.001 (0.013)	Loss 3.5717 (3.5573)	Entropy 1.24233 (1.25506)	Top-1 acc 37.891 (39.954)	Top-5 acc 63.672 (64.021)	lr 0.02411
Train [15][1710/3239]	Time 0.579 (0.876)	Data Time 0.001 (0.013)	Loss 3.4303 (3.5571)	Entropy 1.24158 (1.25498)	Top-1 acc 42.969 (39.951)	Top-5 acc 66.406 (64.024)	lr 0.02411
Train [15][1720/3239]	Time 0.567 (0.876)	Data Time 0.001 (0.013)	Loss 3.6111 (3.5569)	Entropy 1.24149 (1.25490)	Top-1 acc 40.625 (39.958)	Top-5 acc 62.500 (64.026)	lr 0.02411
Train [15][1730/3239]	Time 0.585 (0.876)	Data Time 0.001 (0.013)	Loss 3.5611 (3.5568)	Entropy 1.24114 (1.25482)	Top-1 acc 40.625 (39.960)	Top-5 acc 66.797 (64.024)	lr 0.02411
Train [15][1740/3239]	Time 0.593 (0.876)	Data Time 0.001 (0.012)	Loss 3.4409 (3.5565)	Entropy 1.24070 (1.25474)	Top-1 acc 44.531 (39.971)	Top-5 acc 65.625 (64.033)	lr 0.02411
Train [15][1750/3239]	Time 0.599 (0.876)	Data Time 0.001 (0.012)	Loss 3.4807 (3.5569)	Entropy 1.24068 (1.25466)	Top-1 acc 42.578 (39.968)	Top-5 acc 62.109 (64.026)	lr 0.02411
Train [15][1760/3239]	Time 0.610 (0.876)	Data Time 0.001 (0.012)	Loss 3.5094 (3.5567)	Entropy 1.24057 (1.25458)	Top-1 acc 43.359 (39.972)	Top-5 acc 64.062 (64.028)	lr 0.02410
Train [15][1770/3239]	Time 0.722 (0.887)	Data Time 0.037 (0.012)	Loss 3.4551 (3.5564)	Entropy 1.24100 (1.25451)	Top-1 acc 41.016 (39.973)	Top-5 acc 66.016 (64.040)	lr 0.02410
Train [15][1780/3239]	Time 0.619 (0.887)	Data Time 0.002 (0.012)	Loss 3.6120 (3.5565)	Entropy 1.24077 (1.25443)	Top-1 acc 41.406 (39.967)	Top-5 acc 64.062 (64.035)	lr 0.02410
Train [15][1790/3239]	Time 0.580 (0.887)	Data Time 0.001 (0.012)	Loss 3.5814 (3.5563)	Entropy 1.24032 (1.25435)	Top-1 acc 39.453 (39.972)	Top-5 acc 60.547 (64.038)	lr 0.02410
Train [15][1800/3239]	Time 0.611 (0.886)	Data Time 0.001 (0.012)	Loss 3.5087 (3.5564)	Entropy 1.23973 (1.25427)	Top-1 acc 42.188 (39.968)	Top-5 acc 65.234 (64.038)	lr 0.02410
Train [15][1810/3239]	Time 0.667 (0.886)	Data Time 0.001 (0.012)	Loss 3.5630 (3.5563)	Entropy 1.23960 (1.25419)	Top-1 acc 40.625 (39.966)	Top-5 acc 61.719 (64.038)	lr 0.02410
Train [15][1820/3239]	Time 0.587 (0.886)	Data Time 0.001 (0.012)	Loss 3.5020 (3.5562)	Entropy 1.23951 (1.25411)	Top-1 acc 42.969 (39.972)	Top-5 acc 65.625 (64.038)	lr 0.02410
Train [15][1830/3239]	Time 0.607 (0.885)	Data Time 0.001 (0.012)	Loss 3.5751 (3.5566)	Entropy 1.24000 (1.25403)	Top-1 acc 36.719 (39.962)	Top-5 acc 62.891 (64.032)	lr 0.02410
Train [15][1840/3239]	Time 0.594 (0.885)	Data Time 0.001 (0.012)	Loss 3.4103 (3.5567)	Entropy 1.24019 (1.25396)	Top-1 acc 43.359 (39.959)	Top-5 acc 66.406 (64.029)	lr 0.02410
Train [15][1850/3239]	Time 0.619 (0.885)	Data Time 0.002 (0.012)	Loss 3.4764 (3.5564)	Entropy 1.23990 (1.25388)	Top-1 acc 42.578 (39.971)	Top-5 acc 65.234 (64.033)	lr 0.02410
Train [15][1860/3239]	Time 0.568 (0.885)	Data Time 0.001 (0.012)	Loss 3.5030 (3.5563)	Entropy 1.23966 (1.25381)	Top-1 acc 41.016 (39.973)	Top-5 acc 64.062 (64.034)	lr 0.02410
Train [15][1870/3239]	Time 0.599 (0.885)	Data Time 0.001 (0.012)	Loss 3.5125 (3.5562)	Entropy 1.23897 (1.25373)	Top-1 acc 44.531 (39.982)	Top-5 acc 65.625 (64.039)	lr 0.02410
Train [15][1880/3239]	Time 0.599 (0.885)	Data Time 0.001 (0.012)	Loss 3.7140 (3.5558)	Entropy 1.23909 (1.25365)	Top-1 acc 36.328 (39.986)	Top-5 acc 59.766 (64.049)	lr 0.02410
Train [15][1890/3239]	Time 0.611 (0.884)	Data Time 0.002 (0.012)	Loss 3.2737 (3.5558)	Entropy 1.23919 (1.25358)	Top-1 acc 43.359 (39.986)	Top-5 acc 67.969 (64.049)	lr 0.02410
Train [15][1900/3239]	Time 0.585 (0.884)	Data Time 0.001 (0.012)	Loss 3.7073 (3.5557)	Entropy 1.23896 (1.25350)	Top-1 acc 38.672 (39.987)	Top-5 acc 62.891 (64.048)	lr 0.02410
Train [15][1910/3239]	Time 0.638 (0.884)	Data Time 0.001 (0.012)	Loss 3.5567 (3.5558)	Entropy 1.23835 (1.25342)	Top-1 acc 36.328 (39.981)	Top-5 acc 61.328 (64.044)	lr 0.02410
Train [15][1920/3239]	Time 0.596 (0.884)	Data Time 0.001 (0.012)	Loss 3.5398 (3.5556)	Entropy 1.23834 (1.25334)	Top-1 acc 37.891 (39.980)	Top-5 acc 61.719 (64.046)	lr 0.02410
Train [15][1930/3239]	Time 0.584 (0.883)	Data Time 0.001 (0.011)	Loss 3.3936 (3.5554)	Entropy 1.23795 (1.25327)	Top-1 acc 44.141 (39.986)	Top-5 acc 65.625 (64.050)	lr 0.02410
Train [15][1940/3239]	Time 0.599 (0.883)	Data Time 0.001 (0.011)	Loss 3.3183 (3.5549)	Entropy 1.23753 (1.25319)	Top-1 acc 45.312 (39.998)	Top-5 acc 68.750 (64.058)	lr 0.02410
Train [15][1950/3239]	Time 0.612 (0.883)	Data Time 0.001 (0.011)	Loss 3.5062 (3.5552)	Entropy 1.23759 (1.25311)	Top-1 acc 39.844 (39.991)	Top-5 acc 65.625 (64.056)	lr 0.02410
Train [15][1960/3239]	Time 0.594 (0.883)	Data Time 0.001 (0.011)	Loss 3.6121 (3.5554)	Entropy 1.23757 (1.25303)	Top-1 acc 41.016 (39.983)	Top-5 acc 62.891 (64.045)	lr 0.02410
Train [15][1970/3239]	Time 0.694 (0.882)	Data Time 0.001 (0.011)	Loss 3.6215 (3.5556)	Entropy 1.23776 (1.25295)	Top-1 acc 39.844 (39.979)	Top-5 acc 64.062 (64.045)	lr 0.02410
Train [15][1980/3239]	Time 0.562 (0.882)	Data Time 0.001 (0.011)	Loss 3.6564 (3.5558)	Entropy 1.23742 (1.25287)	Top-1 acc 40.234 (39.979)	Top-5 acc 60.156 (64.038)	lr 0.02410
Train [15][1990/3239]	Time 0.612 (0.882)	Data Time 0.001 (0.011)	Loss 3.7652 (3.5559)	Entropy 1.23734 (1.25279)	Top-1 acc 37.109 (39.971)	Top-5 acc 61.328 (64.040)	lr 0.02410
Train [15][2000/3239]	Time 0.573 (0.882)	Data Time 0.001 (0.011)	Loss 3.4633 (3.5561)	Entropy 1.23705 (1.25272)	Top-1 acc 41.797 (39.966)	Top-5 acc 64.062 (64.038)	lr 0.02410
Train [15][2010/3239]	Time 0.552 (0.882)	Data Time 0.001 (0.011)	Loss 3.6387 (3.5557)	Entropy 1.23696 (1.25264)	Top-1 acc 39.453 (39.973)	Top-5 acc 61.328 (64.044)	lr 0.02410
Train [15][2020/3239]	Time 0.608 (0.881)	Data Time 0.001 (0.011)	Loss 3.7942 (3.5561)	Entropy 1.23664 (1.25256)	Top-1 acc 36.719 (39.967)	Top-5 acc 58.203 (64.034)	lr 0.02410
Train [15][2030/3239]	Time 0.603 (0.881)	Data Time 0.002 (0.011)	Loss 3.3676 (3.5559)	Entropy 1.23646 (1.25248)	Top-1 acc 44.531 (39.970)	Top-5 acc 67.578 (64.036)	lr 0.02409
Train [15][2040/3239]	Time 0.667 (0.881)	Data Time 0.001 (0.011)	Loss 3.6137 (3.5559)	Entropy 1.23625 (1.25240)	Top-1 acc 40.234 (39.972)	Top-5 acc 61.719 (64.033)	lr 0.02409
Train [15][2050/3239]	Time 0.595 (0.881)	Data Time 0.001 (0.011)	Loss 3.8238 (3.5563)	Entropy 1.23630 (1.25232)	Top-1 acc 34.766 (39.964)	Top-5 acc 60.547 (64.028)	lr 0.02409
Train [15][2060/3239]	Time 0.556 (0.881)	Data Time 0.001 (0.011)	Loss 3.3815 (3.5564)	Entropy 1.23632 (1.25225)	Top-1 acc 46.875 (39.960)	Top-5 acc 66.406 (64.023)	lr 0.02409
Train [15][2070/3239]	Time 0.628 (0.881)	Data Time 0.001 (0.011)	Loss 3.6813 (3.5568)	Entropy 1.23642 (1.25217)	Top-1 acc 39.062 (39.952)	Top-5 acc 64.062 (64.015)	lr 0.02409
Train [15][2080/3239]	Time 0.534 (0.880)	Data Time 0.001 (0.011)	Loss 3.8146 (3.5569)	Entropy 1.23606 (1.25209)	Top-1 acc 37.891 (39.951)	Top-5 acc 58.594 (64.017)	lr 0.02409
Train [15][2090/3239]	Time 0.596 (0.880)	Data Time 0.001 (0.011)	Loss 3.3053 (3.5570)	Entropy 1.23591 (1.25202)	Top-1 acc 46.484 (39.952)	Top-5 acc 72.266 (64.019)	lr 0.02409
Train [15][2100/3239]	Time 0.549 (0.880)	Data Time 0.001 (0.011)	Loss 3.4625 (3.5572)	Entropy 1.23525 (1.25194)	Top-1 acc 45.703 (39.953)	Top-5 acc 65.625 (64.015)	lr 0.02409
Train [15][2110/3239]	Time 0.564 (0.880)	Data Time 0.001 (0.011)	Loss 3.7407 (3.5571)	Entropy 1.23534 (1.25186)	Top-1 acc 35.938 (39.954)	Top-5 acc 60.547 (64.011)	lr 0.02409
Train [15][2120/3239]	Time 0.565 (0.879)	Data Time 0.001 (0.011)	Loss 3.6130 (3.5573)	Entropy 1.23536 (1.25178)	Top-1 acc 37.500 (39.947)	Top-5 acc 62.891 (64.010)	lr 0.02409
Train [15][2130/3239]	Time 0.603 (0.879)	Data Time 0.003 (0.011)	Loss 3.7167 (3.5574)	Entropy 1.23528 (1.25170)	Top-1 acc 38.672 (39.943)	Top-5 acc 63.672 (64.012)	lr 0.02409
Train [15][2140/3239]	Time 0.547 (0.879)	Data Time 0.001 (0.011)	Loss 3.5704 (3.5575)	Entropy 1.23501 (1.25163)	Top-1 acc 38.281 (39.937)	Top-5 acc 64.453 (64.009)	lr 0.02409
Train [15][2150/3239]	Time 0.577 (0.879)	Data Time 0.001 (0.011)	Loss 3.7570 (3.5578)	Entropy 1.23500 (1.25155)	Top-1 acc 35.938 (39.932)	Top-5 acc 56.641 (63.997)	lr 0.02409
Train [15][2160/3239]	Time 0.613 (0.879)	Data Time 0.001 (0.010)	Loss 3.7672 (3.5575)	Entropy 1.23518 (1.25147)	Top-1 acc 37.500 (39.933)	Top-5 acc 62.891 (64.001)	lr 0.02409
Train [15][2170/3239]	Time 0.606 (0.879)	Data Time 0.001 (0.010)	Loss 3.5549 (3.5573)	Entropy 1.23555 (1.25140)	Top-1 acc 36.719 (39.932)	Top-5 acc 64.453 (64.002)	lr 0.02409
Train [15][2180/3239]	Time 0.636 (0.878)	Data Time 0.001 (0.010)	Loss 3.4057 (3.5570)	Entropy 1.23542 (1.25133)	Top-1 acc 43.359 (39.935)	Top-5 acc 67.578 (64.008)	lr 0.02409
Train [15][2190/3239]	Time 0.540 (0.878)	Data Time 0.001 (0.010)	Loss 3.5977 (3.5568)	Entropy 1.23540 (1.25125)	Top-1 acc 42.578 (39.939)	Top-5 acc 63.672 (64.016)	lr 0.02409
Train [15][2200/3239]	Time 0.653 (0.878)	Data Time 0.001 (0.010)	Loss 3.5809 (3.5567)	Entropy 1.23511 (1.25118)	Top-1 acc 41.016 (39.938)	Top-5 acc 62.500 (64.023)	lr 0.02409
Train [15][2210/3239]	Time 0.610 (0.878)	Data Time 0.001 (0.010)	Loss 3.4820 (3.5563)	Entropy 1.23490 (1.25111)	Top-1 acc 40.625 (39.948)	Top-5 acc 63.672 (64.023)	lr 0.02409
Train [15][2220/3239]	Time 0.631 (0.878)	Data Time 0.001 (0.010)	Loss 3.4292 (3.5562)	Entropy 1.23504 (1.25103)	Top-1 acc 44.141 (39.950)	Top-5 acc 67.578 (64.026)	lr 0.02409
Train [15][2230/3239]	Time 0.595 (0.878)	Data Time 0.001 (0.010)	Loss 3.6480 (3.5561)	Entropy 1.23491 (1.25096)	Top-1 acc 38.672 (39.954)	Top-5 acc 63.672 (64.032)	lr 0.02409
Train [15][2240/3239]	Time 0.576 (0.878)	Data Time 0.001 (0.010)	Loss 3.4426 (3.5560)	Entropy 1.23467 (1.25089)	Top-1 acc 42.578 (39.955)	Top-5 acc 64.453 (64.032)	lr 0.02409
Train [15][2250/3239]	Time 0.599 (0.877)	Data Time 0.001 (0.010)	Loss 3.5116 (3.5560)	Entropy 1.23425 (1.25082)	Top-1 acc 37.500 (39.954)	Top-5 acc 64.844 (64.031)	lr 0.02409
Train [15][2260/3239]	Time 0.554 (0.877)	Data Time 0.001 (0.010)	Loss 3.4547 (3.5559)	Entropy 1.23450 (1.25075)	Top-1 acc 41.016 (39.956)	Top-5 acc 64.062 (64.033)	lr 0.02409
Train [15][2270/3239]	Time 0.697 (0.877)	Data Time 0.001 (0.010)	Loss 3.5750 (3.5560)	Entropy 1.23433 (1.25067)	Top-1 acc 37.891 (39.954)	Top-5 acc 63.672 (64.033)	lr 0.02409
Train [15][2280/3239]	Time 0.587 (0.877)	Data Time 0.001 (0.010)	Loss 3.3799 (3.5553)	Entropy 1.23459 (1.25060)	Top-1 acc 41.406 (39.966)	Top-5 acc 65.234 (64.045)	lr 0.02409
Train [15][2290/3239]	Time 0.618 (0.877)	Data Time 0.001 (0.010)	Loss 3.4946 (3.5553)	Entropy 1.23463 (1.25053)	Top-1 acc 41.797 (39.970)	Top-5 acc 67.578 (64.047)	lr 0.02408
Train [15][2300/3239]	Time 0.585 (0.876)	Data Time 0.001 (0.010)	Loss 3.4345 (3.5553)	Entropy 1.23395 (1.25046)	Top-1 acc 41.406 (39.972)	Top-5 acc 67.578 (64.046)	lr 0.02408
Train [15][2310/3239]	Time 0.593 (0.876)	Data Time 0.001 (0.010)	Loss 3.3727 (3.5552)	Entropy 1.23384 (1.25039)	Top-1 acc 46.094 (39.971)	Top-5 acc 67.188 (64.046)	lr 0.02408
Train [15][2320/3239]	Time 0.581 (0.876)	Data Time 0.001 (0.010)	Loss 3.6362 (3.5554)	Entropy 1.23393 (1.25032)	Top-1 acc 34.375 (39.968)	Top-5 acc 61.719 (64.047)	lr 0.02408
Train [15][2330/3239]	Time 0.561 (0.876)	Data Time 0.001 (0.010)	Loss 3.5658 (3.5554)	Entropy 1.23350 (1.25025)	Top-1 acc 42.188 (39.971)	Top-5 acc 63.672 (64.048)	lr 0.02408
Train [15][2340/3239]	Time 0.645 (0.876)	Data Time 0.001 (0.010)	Loss 3.4032 (3.5557)	Entropy 1.23327 (1.25018)	Top-1 acc 40.234 (39.964)	Top-5 acc 67.188 (64.039)	lr 0.02408
Train [15][2350/3239]	Time 0.600 (0.876)	Data Time 0.001 (0.010)	Loss 3.7543 (3.5559)	Entropy 1.23289 (1.25010)	Top-1 acc 38.281 (39.967)	Top-5 acc 58.984 (64.039)	lr 0.02408
Train [15][2360/3239]	Time 0.622 (0.876)	Data Time 0.001 (0.010)	Loss 3.4186 (3.5557)	Entropy 1.23297 (1.25003)	Top-1 acc 42.188 (39.968)	Top-5 acc 65.234 (64.041)	lr 0.02408
Train [15][2370/3239]	Time 0.547 (0.875)	Data Time 0.001 (0.010)	Loss 3.5580 (3.5559)	Entropy 1.23281 (1.24996)	Top-1 acc 37.891 (39.963)	Top-5 acc 64.062 (64.033)	lr 0.02408
Train [15][2380/3239]	Time 0.555 (0.875)	Data Time 0.001 (0.010)	Loss 3.8742 (3.5559)	Entropy 1.23256 (1.24989)	Top-1 acc 32.422 (39.960)	Top-5 acc 58.594 (64.034)	lr 0.02408
Train [15][2390/3239]	Time 0.613 (0.875)	Data Time 0.001 (0.010)	Loss 3.5972 (3.5557)	Entropy 1.23276 (1.24981)	Top-1 acc 35.156 (39.963)	Top-5 acc 62.891 (64.038)	lr 0.02408
Train [15][2400/3239]	Time 0.594 (0.875)	Data Time 0.002 (0.010)	Loss 3.4276 (3.5555)	Entropy 1.23247 (1.24974)	Top-1 acc 47.266 (39.965)	Top-5 acc 68.750 (64.045)	lr 0.02408
Train [15][2410/3239]	Time 0.626 (0.875)	Data Time 0.002 (0.010)	Loss 3.6238 (3.5558)	Entropy 1.23198 (1.24967)	Top-1 acc 38.672 (39.961)	Top-5 acc 62.109 (64.040)	lr 0.02408
Train [15][2420/3239]	Time 0.573 (0.875)	Data Time 0.001 (0.010)	Loss 3.4145 (3.5559)	Entropy 1.23211 (1.24960)	Top-1 acc 42.969 (39.959)	Top-5 acc 65.234 (64.040)	lr 0.02408
Train [15][2430/3239]	Time 0.695 (0.883)	Data Time 0.002 (0.010)	Loss 3.6514 (3.5560)	Entropy 1.23170 (1.24952)	Top-1 acc 34.766 (39.951)	Top-5 acc 60.156 (64.036)	lr 0.02408
Train [15][2440/3239]	Time 0.623 (0.882)	Data Time 0.002 (0.010)	Loss 3.5257 (3.5560)	Entropy 1.23176 (1.24945)	Top-1 acc 40.625 (39.950)	Top-5 acc 62.500 (64.037)	lr 0.02408
Train [15][2450/3239]	Time 0.599 (0.882)	Data Time 0.001 (0.009)	Loss 3.4786 (3.5560)	Entropy 1.23159 (1.24938)	Top-1 acc 38.672 (39.947)	Top-5 acc 68.359 (64.037)	lr 0.02408
Train [15][2460/3239]	Time 0.611 (0.882)	Data Time 0.003 (0.009)	Loss 3.4892 (3.5561)	Entropy 1.23113 (1.24931)	Top-1 acc 34.766 (39.941)	Top-5 acc 67.969 (64.034)	lr 0.02408
Train [15][2470/3239]	Time 0.599 (0.882)	Data Time 0.001 (0.009)	Loss 3.5549 (3.5564)	Entropy 1.23056 (1.24923)	Top-1 acc 40.625 (39.934)	Top-5 acc 61.328 (64.027)	lr 0.02408
Train [15][2480/3239]	Time 0.581 (0.882)	Data Time 0.001 (0.009)	Loss 3.5051 (3.5564)	Entropy 1.23032 (1.24916)	Top-1 acc 41.406 (39.935)	Top-5 acc 66.016 (64.027)	lr 0.02408
Train [15][2490/3239]	Time 0.584 (0.882)	Data Time 0.001 (0.009)	Loss 3.6218 (3.5564)	Entropy 1.23032 (1.24908)	Top-1 acc 39.062 (39.928)	Top-5 acc 61.328 (64.028)	lr 0.02408
Train [15][2500/3239]	Time 0.682 (0.882)	Data Time 0.001 (0.009)	Loss 3.8111 (3.5562)	Entropy 1.23008 (1.24901)	Top-1 acc 34.375 (39.932)	Top-5 acc 57.422 (64.031)	lr 0.02408
Train [15][2510/3239]	Time 0.563 (0.881)	Data Time 0.001 (0.009)	Loss 3.5909 (3.5563)	Entropy 1.23010 (1.24893)	Top-1 acc 37.500 (39.930)	Top-5 acc 66.016 (64.028)	lr 0.02408
Train [15][2520/3239]	Time 0.590 (0.881)	Data Time 0.001 (0.009)	Loss 3.7452 (3.5567)	Entropy 1.22959 (1.24886)	Top-1 acc 38.672 (39.920)	Top-5 acc 60.547 (64.021)	lr 0.02408
Train [15][2530/3239]	Time 0.543 (0.881)	Data Time 0.001 (0.009)	Loss 3.6847 (3.5568)	Entropy 1.22960 (1.24878)	Top-1 acc 34.766 (39.918)	Top-5 acc 61.328 (64.019)	lr 0.02408
Train [15][2540/3239]	Time 0.586 (0.881)	Data Time 0.001 (0.009)	Loss 3.3729 (3.5565)	Entropy 1.22985 (1.24870)	Top-1 acc 45.312 (39.926)	Top-5 acc 69.141 (64.029)	lr 0.02408
Train [15][2550/3239]	Time 0.624 (0.881)	Data Time 0.001 (0.009)	Loss 3.5564 (3.5566)	Entropy 1.22972 (1.24863)	Top-1 acc 41.406 (39.925)	Top-5 acc 62.500 (64.029)	lr 0.02407
Train [15][2560/3239]	Time 0.598 (0.881)	Data Time 0.001 (0.009)	Loss 3.5843 (3.5565)	Entropy 1.22918 (1.24856)	Top-1 acc 35.547 (39.922)	Top-5 acc 66.406 (64.031)	lr 0.02407
Train [15][2570/3239]	Time 0.667 (0.881)	Data Time 0.001 (0.009)	Loss 3.4277 (3.5565)	Entropy 1.22902 (1.24848)	Top-1 acc 44.141 (39.923)	Top-5 acc 69.141 (64.033)	lr 0.02407
Train [15][2580/3239]	Time 0.625 (0.880)	Data Time 0.001 (0.009)	Loss 3.4070 (3.5565)	Entropy 1.22902 (1.24840)	Top-1 acc 43.359 (39.923)	Top-5 acc 66.797 (64.034)	lr 0.02407
Train [15][2590/3239]	Time 0.539 (0.880)	Data Time 0.001 (0.009)	Loss 3.7620 (3.5565)	Entropy 1.22930 (1.24833)	Top-1 acc 38.281 (39.923)	Top-5 acc 60.156 (64.036)	lr 0.02407
Train [15][2600/3239]	Time 0.485 (0.880)	Data Time 0.001 (0.009)	Loss 3.5288 (3.5564)	Entropy 1.22938 (1.24826)	Top-1 acc 38.281 (39.926)	Top-5 acc 65.234 (64.037)	lr 0.02407
Train [15][2610/3239]	Time 0.590 (0.880)	Data Time 0.001 (0.009)	Loss 3.4979 (3.5563)	Entropy 1.22943 (1.24818)	Top-1 acc 39.844 (39.929)	Top-5 acc 64.844 (64.037)	lr 0.02407
Train [15][2620/3239]	Time 0.618 (0.879)	Data Time 0.001 (0.009)	Loss 3.5105 (3.5563)	Entropy 1.22938 (1.24811)	Top-1 acc 39.062 (39.929)	Top-5 acc 62.500 (64.032)	lr 0.02407
Train [15][2630/3239]	Time 0.589 (0.879)	Data Time 0.001 (0.009)	Loss 3.4217 (3.5560)	Entropy 1.22895 (1.24804)	Top-1 acc 39.844 (39.933)	Top-5 acc 66.797 (64.038)	lr 0.02407
Train [15][2640/3239]	Time 0.637 (0.879)	Data Time 0.001 (0.009)	Loss 3.5277 (3.5563)	Entropy 1.22880 (1.24797)	Top-1 acc 37.891 (39.928)	Top-5 acc 65.625 (64.030)	lr 0.02407
Train [15][2650/3239]	Time 0.592 (0.879)	Data Time 0.001 (0.009)	Loss 3.5629 (3.5563)	Entropy 1.22866 (1.24790)	Top-1 acc 41.797 (39.931)	Top-5 acc 66.406 (64.030)	lr 0.02407
Train [15][2660/3239]	Time 0.612 (0.879)	Data Time 0.002 (0.009)	Loss 3.4485 (3.5563)	Entropy 1.22844 (1.24782)	Top-1 acc 40.234 (39.931)	Top-5 acc 67.969 (64.030)	lr 0.02407
Train [15][2670/3239]	Time 0.605 (0.879)	Data Time 0.001 (0.009)	Loss 3.4833 (3.5561)	Entropy 1.22803 (1.24775)	Top-1 acc 43.359 (39.933)	Top-5 acc 64.844 (64.034)	lr 0.02407
Train [15][2680/3239]	Time 0.590 (0.879)	Data Time 0.001 (0.009)	Loss 3.5359 (3.5562)	Entropy 1.22765 (1.24768)	Top-1 acc 41.797 (39.933)	Top-5 acc 64.062 (64.032)	lr 0.02407
Train [15][2690/3239]	Time 0.636 (0.879)	Data Time 0.003 (0.009)	Loss 3.3928 (3.5562)	Entropy 1.22723 (1.24760)	Top-1 acc 39.453 (39.933)	Top-5 acc 66.406 (64.029)	lr 0.02407
Train [15][2700/3239]	Time 0.602 (0.879)	Data Time 0.001 (0.009)	Loss 3.6610 (3.5564)	Entropy 1.22682 (1.24752)	Top-1 acc 36.328 (39.926)	Top-5 acc 60.938 (64.026)	lr 0.02407
Train [15][2710/3239]	Time 0.600 (0.879)	Data Time 0.001 (0.009)	Loss 3.6915 (3.5563)	Entropy 1.22681 (1.24745)	Top-1 acc 36.328 (39.928)	Top-5 acc 58.203 (64.027)	lr 0.02407
Train [15][2720/3239]	Time 0.624 (0.878)	Data Time 0.001 (0.009)	Loss 3.4946 (3.5562)	Entropy 1.22712 (1.24737)	Top-1 acc 42.969 (39.928)	Top-5 acc 67.188 (64.032)	lr 0.02407
Train [15][2730/3239]	Time 0.775 (0.878)	Data Time 0.001 (0.009)	Loss 3.6498 (3.5563)	Entropy 1.22717 (1.24730)	Top-1 acc 34.375 (39.924)	Top-5 acc 61.328 (64.029)	lr 0.02407
Train [15][2740/3239]	Time 0.588 (0.878)	Data Time 0.001 (0.009)	Loss 3.6857 (3.5563)	Entropy 1.22723 (1.24723)	Top-1 acc 35.938 (39.921)	Top-5 acc 59.766 (64.028)	lr 0.02407
Train [15][2750/3239]	Time 0.610 (0.878)	Data Time 0.001 (0.009)	Loss 3.5613 (3.5563)	Entropy 1.22631 (1.24715)	Top-1 acc 37.109 (39.917)	Top-5 acc 67.578 (64.030)	lr 0.02407
Train [15][2760/3239]	Time 0.578 (0.878)	Data Time 0.001 (0.009)	Loss 3.4409 (3.5562)	Entropy 1.22644 (1.24708)	Top-1 acc 42.188 (39.921)	Top-5 acc 68.750 (64.030)	lr 0.02407
Train [15][2770/3239]	Time 0.579 (0.878)	Data Time 0.001 (0.009)	Loss 3.7420 (3.5563)	Entropy 1.22618 (1.24700)	Top-1 acc 37.891 (39.917)	Top-5 acc 57.812 (64.026)	lr 0.02407
Train [15][2780/3239]	Time 0.568 (0.877)	Data Time 0.001 (0.009)	Loss 3.7065 (3.5565)	Entropy 1.22618 (1.24693)	Top-1 acc 36.328 (39.915)	Top-5 acc 57.422 (64.020)	lr 0.02407
Train [15][2790/3239]	Time 0.606 (0.877)	Data Time 0.001 (0.009)	Loss 3.5316 (3.5566)	Entropy 1.22602 (1.24685)	Top-1 acc 38.672 (39.910)	Top-5 acc 66.016 (64.019)	lr 0.02407
Train [15][2800/3239]	Time 0.671 (0.877)	Data Time 0.001 (0.009)	Loss 3.5641 (3.5567)	Entropy 1.22605 (1.24678)	Top-1 acc 41.406 (39.907)	Top-5 acc 60.938 (64.014)	lr 0.02407
Train [15][2810/3239]	Time 0.663 (0.877)	Data Time 0.001 (0.009)	Loss 3.7987 (3.5569)	Entropy 1.22588 (1.24670)	Top-1 acc 35.156 (39.906)	Top-5 acc 60.938 (64.016)	lr 0.02407
Train [15][2820/3239]	Time 0.612 (0.877)	Data Time 0.001 (0.008)	Loss 3.4095 (3.5568)	Entropy 1.22596 (1.24663)	Top-1 acc 41.797 (39.906)	Top-5 acc 66.016 (64.016)	lr 0.02406
Train [15][2830/3239]	Time 0.637 (0.877)	Data Time 0.001 (0.008)	Loss 3.5998 (3.5569)	Entropy 1.22577 (1.24656)	Top-1 acc 42.578 (39.905)	Top-5 acc 62.891 (64.013)	lr 0.02406
Train [15][2840/3239]	Time 0.595 (0.877)	Data Time 0.001 (0.008)	Loss 3.3870 (3.5567)	Entropy 1.22576 (1.24648)	Top-1 acc 42.578 (39.910)	Top-5 acc 69.141 (64.017)	lr 0.02406
Train [15][2850/3239]	Time 0.612 (0.877)	Data Time 0.001 (0.008)	Loss 3.2695 (3.5566)	Entropy 1.22541 (1.24641)	Top-1 acc 48.047 (39.912)	Top-5 acc 69.531 (64.016)	lr 0.02406
Train [15][2860/3239]	Time 0.570 (0.876)	Data Time 0.001 (0.008)	Loss 3.6626 (3.5568)	Entropy 1.22520 (1.24634)	Top-1 acc 37.891 (39.906)	Top-5 acc 62.500 (64.012)	lr 0.02406
Train [15][2870/3239]	Time 0.585 (0.876)	Data Time 0.001 (0.008)	Loss 3.6294 (3.5565)	Entropy 1.22516 (1.24626)	Top-1 acc 41.797 (39.909)	Top-5 acc 63.672 (64.018)	lr 0.02406
Train [15][2880/3239]	Time 0.618 (0.876)	Data Time 0.001 (0.008)	Loss 3.2950 (3.5566)	Entropy 1.22511 (1.24619)	Top-1 acc 43.750 (39.910)	Top-5 acc 67.578 (64.018)	lr 0.02406
Train [15][2890/3239]	Time 0.573 (0.876)	Data Time 0.001 (0.008)	Loss 3.6819 (3.5571)	Entropy 1.22486 (1.24612)	Top-1 acc 39.453 (39.897)	Top-5 acc 60.938 (64.005)	lr 0.02406
Train [15][2900/3239]	Time 0.576 (0.876)	Data Time 0.001 (0.008)	Loss 3.6677 (3.5570)	Entropy 1.22486 (1.24604)	Top-1 acc 41.016 (39.901)	Top-5 acc 62.891 (64.009)	lr 0.02406
Train [15][2910/3239]	Time 0.612 (0.876)	Data Time 0.001 (0.008)	Loss 3.7645 (3.5569)	Entropy 1.22511 (1.24597)	Top-1 acc 39.453 (39.901)	Top-5 acc 60.156 (64.008)	lr 0.02406
Train [15][2920/3239]	Time 0.632 (0.876)	Data Time 0.001 (0.008)	Loss 3.6095 (3.5568)	Entropy 1.22496 (1.24590)	Top-1 acc 40.234 (39.902)	Top-5 acc 64.062 (64.011)	lr 0.02406
Train [15][2930/3239]	Time 0.598 (0.876)	Data Time 0.001 (0.008)	Loss 3.3553 (3.5566)	Entropy 1.22498 (1.24583)	Top-1 acc 47.656 (39.908)	Top-5 acc 68.750 (64.016)	lr 0.02406
Train [15][2940/3239]	Time 0.564 (0.876)	Data Time 0.002 (0.008)	Loss 3.7474 (3.5568)	Entropy 1.22498 (1.24576)	Top-1 acc 38.281 (39.906)	Top-5 acc 57.031 (64.013)	lr 0.02406
Train [15][2950/3239]	Time 0.555 (0.875)	Data Time 0.001 (0.008)	Loss 3.5602 (3.5568)	Entropy 1.22476 (1.24569)	Top-1 acc 37.891 (39.908)	Top-5 acc 65.234 (64.011)	lr 0.02406
Train [15][2960/3239]	Time 0.718 (0.875)	Data Time 0.001 (0.008)	Loss 3.6577 (3.5568)	Entropy 1.22434 (1.24561)	Top-1 acc 35.938 (39.908)	Top-5 acc 62.891 (64.012)	lr 0.02406
Train [15][2970/3239]	Time 0.556 (0.875)	Data Time 0.001 (0.008)	Loss 3.7235 (3.5570)	Entropy 1.22446 (1.24554)	Top-1 acc 34.375 (39.905)	Top-5 acc 61.719 (64.010)	lr 0.02406
Train [15][2980/3239]	Time 0.625 (0.875)	Data Time 0.001 (0.008)	Loss 3.6847 (3.5569)	Entropy 1.22414 (1.24547)	Top-1 acc 37.891 (39.905)	Top-5 acc 62.109 (64.013)	lr 0.02406
Train [15][2990/3239]	Time 0.603 (0.875)	Data Time 0.001 (0.008)	Loss 3.7203 (3.5568)	Entropy 1.22431 (1.24540)	Top-1 acc 41.016 (39.909)	Top-5 acc 58.984 (64.014)	lr 0.02406
Train [15][3000/3239]	Time 0.614 (0.875)	Data Time 0.001 (0.008)	Loss 3.3969 (3.5568)	Entropy 1.22411 (1.24533)	Top-1 acc 41.797 (39.904)	Top-5 acc 68.359 (64.014)	lr 0.02406
Train [15][3010/3239]	Time 0.625 (0.875)	Data Time 0.001 (0.008)	Loss 3.3698 (3.5565)	Entropy 1.22397 (1.24526)	Top-1 acc 43.750 (39.912)	Top-5 acc 71.484 (64.023)	lr 0.02406
Train [15][3020/3239]	Time 0.589 (0.874)	Data Time 0.001 (0.008)	Loss 3.4658 (3.5562)	Entropy 1.22394 (1.24519)	Top-1 acc 42.188 (39.920)	Top-5 acc 66.797 (64.031)	lr 0.02406
Train [15][3030/3239]	Time 0.706 (0.874)	Data Time 0.001 (0.008)	Loss 3.3958 (3.5561)	Entropy 1.22403 (1.24512)	Top-1 acc 45.703 (39.922)	Top-5 acc 65.234 (64.032)	lr 0.02406
Train [15][3040/3239]	Time 0.592 (0.874)	Data Time 0.001 (0.008)	Loss 3.5189 (3.5561)	Entropy 1.22388 (1.24505)	Top-1 acc 39.844 (39.918)	Top-5 acc 65.234 (64.033)	lr 0.02406
Train [15][3050/3239]	Time 0.633 (0.874)	Data Time 0.001 (0.008)	Loss 3.4184 (3.5560)	Entropy 1.22362 (1.24498)	Top-1 acc 40.625 (39.921)	Top-5 acc 65.234 (64.034)	lr 0.02406
Train [15][3060/3239]	Time 0.590 (0.874)	Data Time 0.001 (0.008)	Loss 3.4854 (3.5559)	Entropy 1.22350 (1.24491)	Top-1 acc 42.969 (39.918)	Top-5 acc 62.500 (64.034)	lr 0.02406
Train [15][3070/3239]	Time 0.583 (0.874)	Data Time 0.001 (0.008)	Loss 3.6554 (3.5561)	Entropy 1.22358 (1.24484)	Top-1 acc 39.844 (39.913)	Top-5 acc 59.766 (64.028)	lr 0.02406
Train [15][3080/3239]	Time 0.680 (0.881)	Data Time 0.006 (0.008)	Loss 3.4164 (3.5561)	Entropy 1.22306 (1.24477)	Top-1 acc 42.188 (39.915)	Top-5 acc 65.234 (64.028)	lr 0.02405
Train [15][3090/3239]	Time 0.634 (0.880)	Data Time 0.002 (0.008)	Loss 3.5986 (3.5559)	Entropy 1.22228 (1.24470)	Top-1 acc 40.625 (39.920)	Top-5 acc 62.891 (64.031)	lr 0.02405
Train [15][3100/3239]	Time 0.602 (0.880)	Data Time 0.001 (0.008)	Loss 3.5997 (3.5558)	Entropy 1.22210 (1.24463)	Top-1 acc 35.938 (39.919)	Top-5 acc 63.281 (64.035)	lr 0.02405
Train [15][3110/3239]	Time 0.602 (0.880)	Data Time 0.001 (0.008)	Loss 3.5646 (3.5560)	Entropy 1.22225 (1.24456)	Top-1 acc 42.188 (39.919)	Top-5 acc 62.891 (64.030)	lr 0.02405
Train [15][3120/3239]	Time 0.624 (0.880)	Data Time 0.001 (0.008)	Loss 3.7257 (3.5559)	Entropy 1.22152 (1.24448)	Top-1 acc 33.203 (39.919)	Top-5 acc 61.328 (64.032)	lr 0.02405
Train [15][3130/3239]	Time 0.597 (0.880)	Data Time 0.001 (0.008)	Loss 3.4621 (3.5558)	Entropy 1.22172 (1.24441)	Top-1 acc 45.703 (39.923)	Top-5 acc 65.625 (64.035)	lr 0.02405
Train [15][3140/3239]	Time 0.584 (0.880)	Data Time 0.002 (0.008)	Loss 3.3023 (3.5557)	Entropy 1.22210 (1.24434)	Top-1 acc 45.312 (39.923)	Top-5 acc 69.531 (64.035)	lr 0.02405
Train [15][3150/3239]	Time 0.564 (0.880)	Data Time 0.001 (0.008)	Loss 3.6553 (3.5558)	Entropy 1.22189 (1.24427)	Top-1 acc 33.984 (39.921)	Top-5 acc 63.281 (64.034)	lr 0.02405
Train [15][3160/3239]	Time 0.593 (0.880)	Data Time 0.001 (0.008)	Loss 3.5165 (3.5558)	Entropy 1.22164 (1.24420)	Top-1 acc 44.141 (39.919)	Top-5 acc 66.016 (64.034)	lr 0.02405
Train [15][3170/3239]	Time 0.581 (0.880)	Data Time 0.001 (0.008)	Loss 3.4853 (3.5558)	Entropy 1.22151 (1.24412)	Top-1 acc 39.844 (39.918)	Top-5 acc 62.500 (64.034)	lr 0.02405
Train [15][3180/3239]	Time 0.610 (0.879)	Data Time 0.000 (0.008)	Loss 3.3774 (3.5558)	Entropy 1.22144 (1.24405)	Top-1 acc 40.625 (39.918)	Top-5 acc 68.359 (64.032)	lr 0.02405
Train [15][3190/3239]	Time 0.687 (0.879)	Data Time 0.000 (0.008)	Loss 3.5548 (3.5556)	Entropy 1.22097 (1.24398)	Top-1 acc 41.016 (39.924)	Top-5 acc 63.281 (64.036)	lr 0.02405
Train [15][3200/3239]	Time 0.565 (0.879)	Data Time 0.000 (0.008)	Loss 3.3812 (3.5556)	Entropy 1.22076 (1.24391)	Top-1 acc 40.625 (39.925)	Top-5 acc 66.406 (64.038)	lr 0.02405
Train [15][3210/3239]	Time 0.573 (0.879)	Data Time 0.000 (0.008)	Loss 3.4081 (3.5554)	Entropy 1.22075 (1.24384)	Top-1 acc 39.844 (39.926)	Top-5 acc 66.406 (64.042)	lr 0.02405
Train [15][3220/3239]	Time 0.573 (0.879)	Data Time 0.000 (0.008)	Loss 3.6178 (3.5554)	Entropy 1.22047 (1.24376)	Top-1 acc 39.844 (39.925)	Top-5 acc 60.938 (64.040)	lr 0.02405
Train [15][3230/3239]	Time 0.585 (0.879)	Data Time 0.000 (0.008)	Loss 3.5530 (3.5553)	Entropy 1.22046 (1.24369)	Top-1 acc 39.062 (39.927)	Top-5 acc 63.281 (64.041)	lr 0.02405
Train [15][3239/3239]	Time 1.553 (0.879)	Data Time 0.000 (0.008)	Loss 3.6640 (3.5555)	Entropy 1.22016 (1.24363)	Top-1 acc 43.210 (39.925)	Top-5 acc 62.963 (64.038)	lr 0.02405
==========Valid [15/120]	loss 2.305	top-1 acc 50.021 (50.021)	top-5 acc 73.641	Train top-1 39.925	top-5 64.038	Entropy 1.22016	Latency-None: 0.000ms	Flops: 542.77M
Train [16][0/3239]	Time 21.728 (21.728)	Data Time 20.223 (20.223)	Loss 3.7184 (3.7184)	Entropy 1.21987 (1.21987)	Top-1 acc 35.938 (35.938)	Top-5 acc 60.938 (60.938)	lr 0.02405
Train [16][10/3239]	Time 0.566 (2.811)	Data Time 0.001 (1.840)	Loss 3.6042 (3.5860)	Entropy 1.21972 (1.21990)	Top-1 acc 42.578 (39.524)	Top-5 acc 62.500 (62.962)	lr 0.02405
Train [16][20/3239]	Time 0.644 (1.875)	Data Time 0.001 (0.965)	Loss 3.5010 (3.5464)	Entropy 1.21946 (1.21974)	Top-1 acc 41.016 (40.067)	Top-5 acc 63.281 (63.542)	lr 0.02405
Train [16][30/3239]	Time 0.574 (1.542)	Data Time 0.001 (0.654)	Loss 3.4234 (3.5470)	Entropy 1.21918 (1.21963)	Top-1 acc 44.922 (40.121)	Top-5 acc 67.188 (63.773)	lr 0.02405
Train [16][40/3239]	Time 0.552 (1.364)	Data Time 0.001 (0.495)	Loss 3.6613 (3.5611)	Entropy 1.21923 (1.21954)	Top-1 acc 37.500 (39.825)	Top-5 acc 61.328 (63.643)	lr 0.02405
Train [16][50/3239]	Time 0.469 (1.258)	Data Time 0.001 (0.399)	Loss 3.6826 (3.5572)	Entropy 1.21973 (1.21951)	Top-1 acc 35.938 (39.836)	Top-5 acc 60.156 (63.657)	lr 0.02405
Train [16][60/3239]	Time 0.599 (1.190)	Data Time 0.001 (0.334)	Loss 3.6710 (3.5616)	Entropy 1.21932 (1.21951)	Top-1 acc 40.234 (39.760)	Top-5 acc 61.719 (63.422)	lr 0.02405
Train [16][70/3239]	Time 0.612 (1.141)	Data Time 0.001 (0.287)	Loss 3.4213 (3.5513)	Entropy 1.21930 (1.21949)	Top-1 acc 42.578 (40.003)	Top-5 acc 63.672 (63.672)	lr 0.02405
Train [16][80/3239]	Time 0.663 (1.106)	Data Time 0.001 (0.252)	Loss 3.2343 (3.5415)	Entropy 1.21945 (1.21948)	Top-1 acc 46.875 (40.099)	Top-5 acc 70.703 (63.855)	lr 0.02405
Train [16][90/3239]	Time 0.695 (1.078)	Data Time 0.001 (0.224)	Loss 3.3440 (3.5317)	Entropy 1.21945 (1.21947)	Top-1 acc 42.578 (40.174)	Top-5 acc 68.750 (64.196)	lr 0.02405
Train [16][100/3239]	Time 0.631 (1.054)	Data Time 0.001 (0.202)	Loss 3.5161 (3.5295)	Entropy 1.21935 (1.21946)	Top-1 acc 38.672 (40.339)	Top-5 acc 66.406 (64.283)	lr 0.02404
Train [16][110/3239]	Time 0.591 (1.036)	Data Time 0.001 (0.184)	Loss 3.4424 (3.5304)	Entropy 1.21932 (1.21945)	Top-1 acc 41.016 (40.248)	Top-5 acc 66.406 (64.337)	lr 0.02404
Train [16][120/3239]	Time 0.609 (1.022)	Data Time 0.001 (0.169)	Loss 3.6789 (3.5352)	Entropy 1.21926 (1.21944)	Top-1 acc 36.719 (40.147)	Top-5 acc 64.062 (64.240)	lr 0.02404
Train [16][130/3239]	Time 0.573 (1.007)	Data Time 0.001 (0.156)	Loss 3.4702 (3.5363)	Entropy 1.21890 (1.21942)	Top-1 acc 41.406 (40.091)	Top-5 acc 66.016 (64.235)	lr 0.02404
Train [16][140/3239]	Time 0.636 (0.995)	Data Time 0.001 (0.145)	Loss 3.4161 (3.5351)	Entropy 1.21920 (1.21938)	Top-1 acc 45.703 (40.071)	Top-5 acc 67.969 (64.290)	lr 0.02404
Train [16][150/3239]	Time 0.648 (0.985)	Data Time 0.001 (0.136)	Loss 3.4808 (3.5358)	Entropy 1.21887 (1.21937)	Top-1 acc 41.797 (40.090)	Top-5 acc 64.062 (64.280)	lr 0.02404
Train [16][160/3239]	Time 0.676 (0.976)	Data Time 0.001 (0.127)	Loss 3.5065 (3.5361)	Entropy 1.21893 (1.21934)	Top-1 acc 41.797 (40.128)	Top-5 acc 66.797 (64.281)	lr 0.02404
Train [16][170/3239]	Time 0.580 (0.968)	Data Time 0.001 (0.120)	Loss 3.6394 (3.5328)	Entropy 1.21918 (1.21932)	Top-1 acc 41.406 (40.205)	Top-5 acc 63.281 (64.348)	lr 0.02404
Train [16][180/3239]	Time 0.578 (0.961)	Data Time 0.001 (0.114)	Loss 3.3403 (3.5341)	Entropy 1.21890 (1.21930)	Top-1 acc 41.406 (40.187)	Top-5 acc 68.750 (64.293)	lr 0.02404
Train [16][190/3239]	Time 0.573 (0.955)	Data Time 0.001 (0.108)	Loss 3.5678 (3.5357)	Entropy 1.21911 (1.21928)	Top-1 acc 41.406 (40.202)	Top-5 acc 65.234 (64.290)	lr 0.02404
Train [16][200/3239]	Time 0.613 (0.947)	Data Time 0.001 (0.102)	Loss 3.4282 (3.5333)	Entropy 1.21882 (1.21927)	Top-1 acc 44.141 (40.242)	Top-5 acc 67.188 (64.358)	lr 0.02404
Train [16][210/3239]	Time 0.561 (0.943)	Data Time 0.001 (0.098)	Loss 3.7634 (3.5334)	Entropy 1.21877 (1.21925)	Top-1 acc 39.062 (40.245)	Top-5 acc 61.719 (64.359)	lr 0.02404
Train [16][220/3239]	Time 0.600 (0.937)	Data Time 0.001 (0.093)	Loss 3.5406 (3.5351)	Entropy 1.21846 (1.21923)	Top-1 acc 42.969 (40.208)	Top-5 acc 66.797 (64.358)	lr 0.02404
Train [16][230/3239]	Time 0.591 (0.931)	Data Time 0.002 (0.089)	Loss 3.5764 (3.5358)	Entropy 1.21848 (1.21919)	Top-1 acc 39.844 (40.182)	Top-5 acc 64.062 (64.350)	lr 0.02404
Train [16][240/3239]	Time 0.572 (0.928)	Data Time 0.001 (0.086)	Loss 3.6424 (3.5343)	Entropy 1.21830 (1.21916)	Top-1 acc 38.281 (40.192)	Top-5 acc 62.109 (64.406)	lr 0.02404
Train [16][250/3239]	Time 0.571 (0.924)	Data Time 0.001 (0.082)	Loss 3.2867 (3.5297)	Entropy 1.21845 (1.21913)	Top-1 acc 44.922 (40.292)	Top-5 acc 73.828 (64.548)	lr 0.02404
Train [16][260/3239]	Time 0.638 (0.921)	Data Time 0.001 (0.079)	Loss 3.5616 (3.5287)	Entropy 1.21821 (1.21910)	Top-1 acc 39.062 (40.329)	Top-5 acc 63.672 (64.574)	lr 0.02404
Train [16][270/3239]	Time 0.590 (0.918)	Data Time 0.001 (0.076)	Loss 3.7289 (3.5306)	Entropy 1.21801 (1.21906)	Top-1 acc 37.500 (40.296)	Top-5 acc 60.938 (64.499)	lr 0.02404
Train [16][280/3239]	Time 0.584 (0.915)	Data Time 0.001 (0.074)	Loss 3.3381 (3.5322)	Entropy 1.21774 (1.21902)	Top-1 acc 46.094 (40.293)	Top-5 acc 67.969 (64.457)	lr 0.02404
Train [16][290/3239]	Time 0.571 (0.912)	Data Time 0.001 (0.071)	Loss 3.7491 (3.5352)	Entropy 1.21772 (1.21897)	Top-1 acc 37.109 (40.253)	Top-5 acc 60.547 (64.389)	lr 0.02404
Train [16][300/3239]	Time 0.648 (0.911)	Data Time 0.001 (0.069)	Loss 3.4137 (3.5338)	Entropy 1.21745 (1.21893)	Top-1 acc 42.969 (40.263)	Top-5 acc 65.625 (64.386)	lr 0.02404
Train [16][310/3239]	Time 0.622 (0.909)	Data Time 0.001 (0.067)	Loss 3.6727 (3.5351)	Entropy 1.21715 (1.21887)	Top-1 acc 41.016 (40.272)	Top-5 acc 61.328 (64.373)	lr 0.02404
Train [16][320/3239]	Time 0.652 (0.907)	Data Time 0.001 (0.065)	Loss 3.6129 (3.5367)	Entropy 1.21673 (1.21881)	Top-1 acc 36.328 (40.234)	Top-5 acc 62.500 (64.346)	lr 0.02404
Train [16][330/3239]	Time 0.571 (0.905)	Data Time 0.001 (0.063)	Loss 3.6343 (3.5382)	Entropy 1.21635 (1.21874)	Top-1 acc 42.188 (40.206)	Top-5 acc 60.547 (64.310)	lr 0.02404
Train [16][340/3239]	Time 0.533 (0.903)	Data Time 0.001 (0.061)	Loss 3.6927 (3.5391)	Entropy 1.21641 (1.21868)	Top-1 acc 35.156 (40.176)	Top-5 acc 60.938 (64.297)	lr 0.02404
Train [16][350/3239]	Time 0.555 (0.901)	Data Time 0.001 (0.059)	Loss 3.5187 (3.5384)	Entropy 1.21618 (1.21861)	Top-1 acc 42.188 (40.183)	Top-5 acc 62.891 (64.300)	lr 0.02403
Train [16][360/3239]	Time 0.556 (0.899)	Data Time 0.001 (0.058)	Loss 3.7691 (3.5408)	Entropy 1.21554 (1.21853)	Top-1 acc 33.984 (40.140)	Top-5 acc 57.812 (64.241)	lr 0.02403
Train [16][370/3239]	Time 0.593 (0.898)	Data Time 0.001 (0.056)	Loss 3.5965 (3.5417)	Entropy 1.21573 (1.21845)	Top-1 acc 37.891 (40.141)	Top-5 acc 62.891 (64.212)	lr 0.02403
Train [16][380/3239]	Time 0.578 (0.896)	Data Time 0.001 (0.055)	Loss 3.4686 (3.5405)	Entropy 1.21576 (1.21838)	Top-1 acc 40.234 (40.149)	Top-5 acc 67.969 (64.245)	lr 0.02403
Train [16][390/3239]	Time 0.672 (0.894)	Data Time 0.001 (0.054)	Loss 3.5081 (3.5412)	Entropy 1.21546 (1.21831)	Top-1 acc 39.453 (40.143)	Top-5 acc 63.672 (64.233)	lr 0.02403
Train [16][400/3239]	Time 0.546 (0.892)	Data Time 0.001 (0.052)	Loss 3.5486 (3.5404)	Entropy 1.21568 (1.21824)	Top-1 acc 41.406 (40.178)	Top-5 acc 62.891 (64.235)	lr 0.02403
Train [16][410/3239]	Time 0.615 (0.889)	Data Time 0.001 (0.051)	Loss 3.3905 (3.5407)	Entropy 1.21533 (1.21817)	Top-1 acc 44.531 (40.174)	Top-5 acc 70.703 (64.235)	lr 0.02403
Train [16][420/3239]	Time 0.628 (0.888)	Data Time 0.001 (0.050)	Loss 3.5538 (3.5396)	Entropy 1.21536 (1.21811)	Top-1 acc 41.406 (40.209)	Top-5 acc 64.844 (64.251)	lr 0.02403
Train [16][430/3239]	Time 0.616 (0.887)	Data Time 0.001 (0.049)	Loss 3.5601 (3.5397)	Entropy 1.21546 (1.21804)	Top-1 acc 37.500 (40.208)	Top-5 acc 61.719 (64.238)	lr 0.02403
Train [16][440/3239]	Time 0.579 (0.886)	Data Time 0.001 (0.048)	Loss 3.2816 (3.5385)	Entropy 1.21538 (1.21798)	Top-1 acc 44.141 (40.238)	Top-5 acc 69.922 (64.264)	lr 0.02403
Train [16][450/3239]	Time 0.612 (0.885)	Data Time 0.001 (0.047)	Loss 3.6439 (3.5380)	Entropy 1.21492 (1.21792)	Top-1 acc 33.984 (40.227)	Top-5 acc 60.938 (64.280)	lr 0.02403
Train [16][460/3239]	Time 0.649 (0.884)	Data Time 0.001 (0.046)	Loss 3.5769 (3.5375)	Entropy 1.21514 (1.21786)	Top-1 acc 40.234 (40.212)	Top-5 acc 62.500 (64.284)	lr 0.02403
Train [16][470/3239]	Time 0.622 (0.884)	Data Time 0.001 (0.045)	Loss 3.2868 (3.5369)	Entropy 1.21531 (1.21780)	Top-1 acc 45.703 (40.227)	Top-5 acc 69.922 (64.285)	lr 0.02403
Train [16][480/3239]	Time 0.575 (0.883)	Data Time 0.001 (0.044)	Loss 3.6214 (3.5358)	Entropy 1.21503 (1.21775)	Top-1 acc 37.891 (40.257)	Top-5 acc 63.672 (64.327)	lr 0.02403
Train [16][490/3239]	Time 0.632 (0.882)	Data Time 0.001 (0.043)	Loss 3.4775 (3.5358)	Entropy 1.21479 (1.21769)	Top-1 acc 41.797 (40.253)	Top-5 acc 69.141 (64.344)	lr 0.02403
Train [16][500/3239]	Time 0.558 (0.922)	Data Time 0.002 (0.042)	Loss 3.6135 (3.5354)	Entropy 1.21489 (1.21763)	Top-1 acc 42.969 (40.261)	Top-5 acc 62.500 (64.359)	lr 0.02403
Train [16][510/3239]	Time 0.611 (0.920)	Data Time 0.001 (0.041)	Loss 3.4839 (3.5348)	Entropy 1.21456 (1.21758)	Top-1 acc 38.672 (40.261)	Top-5 acc 63.672 (64.390)	lr 0.02403
Train [16][520/3239]	Time 0.597 (0.919)	Data Time 0.001 (0.041)	Loss 3.5142 (3.5346)	Entropy 1.21480 (1.21752)	Top-1 acc 41.016 (40.294)	Top-5 acc 64.844 (64.378)	lr 0.02403
Train [16][530/3239]	Time 0.632 (0.917)	Data Time 0.001 (0.040)	Loss 3.7533 (3.5346)	Entropy 1.21503 (1.21747)	Top-1 acc 38.672 (40.306)	Top-5 acc 57.422 (64.372)	lr 0.02403
Train [16][540/3239]	Time 0.557 (0.915)	Data Time 0.001 (0.039)	Loss 3.6427 (3.5342)	Entropy 1.21487 (1.21743)	Top-1 acc 35.156 (40.283)	Top-5 acc 64.062 (64.382)	lr 0.02403
Train [16][550/3239]	Time 0.690 (0.914)	Data Time 0.001 (0.039)	Loss 3.6957 (3.5352)	Entropy 1.21426 (1.21737)	Top-1 acc 36.328 (40.256)	Top-5 acc 57.812 (64.368)	lr 0.02403
Train [16][560/3239]	Time 0.639 (0.912)	Data Time 0.001 (0.038)	Loss 3.4042 (3.5347)	Entropy 1.21417 (1.21732)	Top-1 acc 42.188 (40.264)	Top-5 acc 66.016 (64.369)	lr 0.02403
Train [16][570/3239]	Time 0.606 (0.911)	Data Time 0.001 (0.037)	Loss 3.4827 (3.5348)	Entropy 1.21440 (1.21726)	Top-1 acc 41.016 (40.252)	Top-5 acc 65.625 (64.369)	lr 0.02403
Train [16][580/3239]	Time 0.620 (0.910)	Data Time 0.001 (0.037)	Loss 3.6378 (3.5361)	Entropy 1.21465 (1.21722)	Top-1 acc 37.891 (40.203)	Top-5 acc 66.406 (64.360)	lr 0.02403
Train [16][590/3239]	Time 0.564 (0.909)	Data Time 0.001 (0.036)	Loss 3.4278 (3.5355)	Entropy 1.21436 (1.21717)	Top-1 acc 43.359 (40.229)	Top-5 acc 66.016 (64.372)	lr 0.02403
Train [16][600/3239]	Time 0.627 (0.908)	Data Time 0.002 (0.036)	Loss 3.4086 (3.5367)	Entropy 1.21430 (1.21713)	Top-1 acc 42.969 (40.186)	Top-5 acc 65.234 (64.350)	lr 0.02403
Train [16][610/3239]	Time 0.612 (0.907)	Data Time 0.001 (0.035)	Loss 3.3507 (3.5367)	Entropy 1.21441 (1.21708)	Top-1 acc 42.969 (40.191)	Top-5 acc 66.797 (64.345)	lr 0.02402
Train [16][620/3239]	Time 0.721 (0.906)	Data Time 0.001 (0.034)	Loss 3.6821 (3.5365)	Entropy 1.21453 (1.21704)	Top-1 acc 34.375 (40.204)	Top-5 acc 63.281 (64.357)	lr 0.02402
Train [16][630/3239]	Time 0.614 (0.905)	Data Time 0.002 (0.034)	Loss 3.7053 (3.5365)	Entropy 1.21428 (1.21699)	Top-1 acc 39.062 (40.202)	Top-5 acc 61.328 (64.349)	lr 0.02402
Train [16][640/3239]	Time 0.602 (0.904)	Data Time 0.001 (0.033)	Loss 3.5168 (3.5357)	Entropy 1.21367 (1.21695)	Top-1 acc 40.625 (40.212)	Top-5 acc 65.625 (64.365)	lr 0.02402
Train [16][650/3239]	Time 0.596 (0.903)	Data Time 0.001 (0.033)	Loss 3.5170 (3.5359)	Entropy 1.21296 (1.21689)	Top-1 acc 36.719 (40.212)	Top-5 acc 69.922 (64.371)	lr 0.02402
Train [16][660/3239]	Time 0.593 (0.902)	Data Time 0.001 (0.033)	Loss 3.3560 (3.5364)	Entropy 1.21304 (1.21683)	Top-1 acc 47.266 (40.206)	Top-5 acc 67.969 (64.362)	lr 0.02402
Train [16][670/3239]	Time 0.588 (0.901)	Data Time 0.001 (0.032)	Loss 3.6084 (3.5368)	Entropy 1.21247 (1.21677)	Top-1 acc 38.281 (40.191)	Top-5 acc 62.109 (64.357)	lr 0.02402
Train [16][680/3239]	Time 0.584 (0.901)	Data Time 0.001 (0.032)	Loss 3.2800 (3.5363)	Entropy 1.21240 (1.21671)	Top-1 acc 48.047 (40.211)	Top-5 acc 70.703 (64.374)	lr 0.02402
Train [16][690/3239]	Time 0.552 (0.900)	Data Time 0.001 (0.031)	Loss 3.5010 (3.5359)	Entropy 1.21234 (1.21665)	Top-1 acc 41.016 (40.221)	Top-5 acc 67.578 (64.390)	lr 0.02402
Train [16][700/3239]	Time 0.605 (0.899)	Data Time 0.003 (0.031)	Loss 3.5264 (3.5355)	Entropy 1.21217 (1.21659)	Top-1 acc 42.188 (40.242)	Top-5 acc 63.672 (64.400)	lr 0.02402
Train [16][710/3239]	Time 0.500 (0.897)	Data Time 0.001 (0.030)	Loss 3.6796 (3.5353)	Entropy 1.21197 (1.21652)	Top-1 acc 35.938 (40.255)	Top-5 acc 58.594 (64.393)	lr 0.02402
Train [16][720/3239]	Time 0.553 (0.897)	Data Time 0.001 (0.030)	Loss 3.8595 (3.5354)	Entropy 1.21213 (1.21646)	Top-1 acc 32.812 (40.257)	Top-5 acc 57.812 (64.391)	lr 0.02402
Train [16][730/3239]	Time 0.508 (0.896)	Data Time 0.001 (0.030)	Loss 3.3912 (3.5349)	Entropy 1.21189 (1.21640)	Top-1 acc 44.141 (40.258)	Top-5 acc 69.141 (64.409)	lr 0.02402
Train [16][740/3239]	Time 0.629 (0.895)	Data Time 0.001 (0.029)	Loss 3.6296 (3.5344)	Entropy 1.21142 (1.21634)	Top-1 acc 36.328 (40.262)	Top-5 acc 64.844 (64.422)	lr 0.02402
Train [16][750/3239]	Time 0.606 (0.895)	Data Time 0.001 (0.029)	Loss 3.4143 (3.5343)	Entropy 1.21173 (1.21627)	Top-1 acc 42.969 (40.270)	Top-5 acc 66.016 (64.429)	lr 0.02402
Train [16][760/3239]	Time 0.539 (0.894)	Data Time 0.001 (0.029)	Loss 3.6760 (3.5347)	Entropy 1.21175 (1.21621)	Top-1 acc 39.062 (40.273)	Top-5 acc 60.156 (64.410)	lr 0.02402
Train [16][770/3239]	Time 0.629 (0.893)	Data Time 0.001 (0.028)	Loss 3.5680 (3.5345)	Entropy 1.21188 (1.21616)	Top-1 acc 37.109 (40.269)	Top-5 acc 66.797 (64.410)	lr 0.02402
Train [16][780/3239]	Time 0.662 (0.893)	Data Time 0.001 (0.028)	Loss 3.3805 (3.5340)	Entropy 1.21187 (1.21610)	Top-1 acc 40.625 (40.281)	Top-5 acc 66.797 (64.419)	lr 0.02402
Train [16][790/3239]	Time 0.636 (0.892)	Data Time 0.001 (0.028)	Loss 3.7763 (3.5343)	Entropy 1.21171 (1.21605)	Top-1 acc 37.109 (40.268)	Top-5 acc 59.375 (64.409)	lr 0.02402
Train [16][800/3239]	Time 0.602 (0.892)	Data Time 0.001 (0.027)	Loss 3.3953 (3.5345)	Entropy 1.21157 (1.21599)	Top-1 acc 37.109 (40.249)	Top-5 acc 67.578 (64.408)	lr 0.02402
Train [16][810/3239]	Time 0.614 (0.891)	Data Time 0.001 (0.027)	Loss 3.5365 (3.5349)	Entropy 1.21170 (1.21594)	Top-1 acc 41.797 (40.247)	Top-5 acc 65.625 (64.395)	lr 0.02402
Train [16][820/3239]	Time 0.590 (0.891)	Data Time 0.001 (0.027)	Loss 3.4747 (3.5345)	Entropy 1.21189 (1.21589)	Top-1 acc 40.234 (40.253)	Top-5 acc 67.578 (64.401)	lr 0.02402
Train [16][830/3239]	Time 0.606 (0.890)	Data Time 0.001 (0.026)	Loss 3.3404 (3.5348)	Entropy 1.21195 (1.21584)	Top-1 acc 44.531 (40.253)	Top-5 acc 67.969 (64.387)	lr 0.02402
Train [16][840/3239]	Time 0.567 (0.890)	Data Time 0.001 (0.026)	Loss 3.4844 (3.5342)	Entropy 1.21147 (1.21579)	Top-1 acc 42.969 (40.267)	Top-5 acc 67.578 (64.397)	lr 0.02402
Train [16][850/3239]	Time 0.602 (0.889)	Data Time 0.001 (0.026)	Loss 3.3658 (3.5342)	Entropy 1.21118 (1.21574)	Top-1 acc 43.750 (40.283)	Top-5 acc 68.359 (64.394)	lr 0.02402
Train [16][860/3239]	Time 0.647 (0.889)	Data Time 0.001 (0.025)	Loss 3.6436 (3.5337)	Entropy 1.21118 (1.21569)	Top-1 acc 42.188 (40.293)	Top-5 acc 62.500 (64.401)	lr 0.02401
Train [16][870/3239]	Time 0.582 (0.888)	Data Time 0.001 (0.025)	Loss 3.5383 (3.5338)	Entropy 1.21134 (1.21564)	Top-1 acc 43.359 (40.315)	Top-5 acc 61.719 (64.404)	lr 0.02401
Train [16][880/3239]	Time 0.577 (0.887)	Data Time 0.003 (0.025)	Loss 3.3611 (3.5335)	Entropy 1.21121 (1.21559)	Top-1 acc 44.922 (40.326)	Top-5 acc 69.141 (64.415)	lr 0.02401
Train [16][890/3239]	Time 0.636 (0.886)	Data Time 0.001 (0.025)	Loss 3.5425 (3.5338)	Entropy 1.21122 (1.21554)	Top-1 acc 43.359 (40.331)	Top-5 acc 64.062 (64.409)	lr 0.02401
Train [16][900/3239]	Time 0.624 (0.886)	Data Time 0.001 (0.024)	Loss 3.5387 (3.5334)	Entropy 1.21125 (1.21549)	Top-1 acc 36.719 (40.333)	Top-5 acc 62.891 (64.415)	lr 0.02401
Train [16][910/3239]	Time 0.610 (0.886)	Data Time 0.001 (0.024)	Loss 3.8080 (3.5335)	Entropy 1.21122 (1.21545)	Top-1 acc 36.719 (40.340)	Top-5 acc 60.156 (64.421)	lr 0.02401
Train [16][920/3239]	Time 0.578 (0.885)	Data Time 0.001 (0.024)	Loss 3.6520 (3.5338)	Entropy 1.21125 (1.21540)	Top-1 acc 36.719 (40.345)	Top-5 acc 60.156 (64.419)	lr 0.02401
Train [16][930/3239]	Time 0.577 (0.885)	Data Time 0.002 (0.024)	Loss 3.5986 (3.5344)	Entropy 1.21101 (1.21535)	Top-1 acc 37.109 (40.336)	Top-5 acc 64.453 (64.401)	lr 0.02401
Train [16][940/3239]	Time 0.688 (0.884)	Data Time 0.001 (0.023)	Loss 3.5469 (3.5348)	Entropy 1.21061 (1.21530)	Top-1 acc 39.062 (40.335)	Top-5 acc 64.062 (64.397)	lr 0.02401
Train [16][950/3239]	Time 0.591 (0.884)	Data Time 0.001 (0.023)	Loss 3.4802 (3.5339)	Entropy 1.21061 (1.21525)	Top-1 acc 41.016 (40.353)	Top-5 acc 63.281 (64.413)	lr 0.02401
Train [16][960/3239]	Time 0.593 (0.884)	Data Time 0.001 (0.023)	Loss 3.5174 (3.5342)	Entropy 1.21055 (1.21521)	Top-1 acc 39.453 (40.340)	Top-5 acc 64.453 (64.407)	lr 0.02401
Train [16][970/3239]	Time 0.606 (0.883)	Data Time 0.002 (0.023)	Loss 3.5217 (3.5334)	Entropy 1.21017 (1.21516)	Top-1 acc 39.453 (40.343)	Top-5 acc 64.844 (64.426)	lr 0.02401
Train [16][980/3239]	Time 0.605 (0.883)	Data Time 0.003 (0.023)	Loss 3.3655 (3.5327)	Entropy 1.20992 (1.21510)	Top-1 acc 42.969 (40.356)	Top-5 acc 66.406 (64.441)	lr 0.02401
Train [16][990/3239]	Time 0.559 (0.882)	Data Time 0.001 (0.022)	Loss 3.4753 (3.5324)	Entropy 1.21006 (1.21505)	Top-1 acc 39.062 (40.356)	Top-5 acc 62.891 (64.452)	lr 0.02401
Train [16][1000/3239]	Time 0.580 (0.882)	Data Time 0.001 (0.022)	Loss 3.5563 (3.5320)	Entropy 1.20975 (1.21500)	Top-1 acc 40.625 (40.365)	Top-5 acc 62.891 (64.463)	lr 0.02401
Train [16][1010/3239]	Time 0.661 (0.882)	Data Time 0.001 (0.022)	Loss 3.5249 (3.5316)	Entropy 1.20919 (1.21495)	Top-1 acc 37.109 (40.370)	Top-5 acc 65.625 (64.473)	lr 0.02401
Train [16][1020/3239]	Time 0.611 (0.881)	Data Time 0.001 (0.022)	Loss 3.4970 (3.5316)	Entropy 1.20880 (1.21489)	Top-1 acc 41.016 (40.366)	Top-5 acc 64.453 (64.480)	lr 0.02401
Train [16][1030/3239]	Time 0.563 (0.881)	Data Time 0.001 (0.022)	Loss 3.4649 (3.5313)	Entropy 1.20852 (1.21483)	Top-1 acc 42.969 (40.375)	Top-5 acc 66.406 (64.493)	lr 0.02401
Train [16][1040/3239]	Time 0.648 (0.880)	Data Time 0.001 (0.021)	Loss 3.4438 (3.5315)	Entropy 1.20802 (1.21477)	Top-1 acc 42.969 (40.372)	Top-5 acc 67.188 (64.495)	lr 0.02401
Train [16][1050/3239]	Time 0.613 (0.880)	Data Time 0.001 (0.021)	Loss 3.5054 (3.5316)	Entropy 1.20823 (1.21471)	Top-1 acc 39.062 (40.377)	Top-5 acc 67.969 (64.501)	lr 0.02401
Train [16][1060/3239]	Time 0.449 (0.879)	Data Time 0.001 (0.021)	Loss 3.4883 (3.5318)	Entropy 1.20807 (1.21464)	Top-1 acc 39.844 (40.375)	Top-5 acc 65.234 (64.491)	lr 0.02401
Train [16][1070/3239]	Time 0.630 (0.879)	Data Time 0.001 (0.021)	Loss 3.7209 (3.5324)	Entropy 1.20812 (1.21458)	Top-1 acc 35.547 (40.370)	Top-5 acc 59.375 (64.478)	lr 0.02401
Train [16][1080/3239]	Time 0.597 (0.879)	Data Time 0.001 (0.021)	Loss 3.5352 (3.5325)	Entropy 1.20807 (1.21452)	Top-1 acc 37.891 (40.366)	Top-5 acc 66.016 (64.476)	lr 0.02401
Train [16][1090/3239]	Time 0.521 (0.879)	Data Time 0.001 (0.021)	Loss 3.5604 (3.5321)	Entropy 1.20769 (1.21446)	Top-1 acc 38.672 (40.377)	Top-5 acc 65.234 (64.487)	lr 0.02401
Train [16][1100/3239]	Time 0.612 (0.878)	Data Time 0.001 (0.020)	Loss 3.6229 (3.5319)	Entropy 1.20789 (1.21440)	Top-1 acc 37.500 (40.392)	Top-5 acc 61.719 (64.492)	lr 0.02401
Train [16][1110/3239]	Time 0.599 (0.878)	Data Time 0.001 (0.020)	Loss 3.6341 (3.5315)	Entropy 1.20806 (1.21434)	Top-1 acc 39.062 (40.404)	Top-5 acc 61.719 (64.500)	lr 0.02401
Train [16][1120/3239]	Time 0.587 (0.878)	Data Time 0.001 (0.020)	Loss 3.8430 (3.5316)	Entropy 1.20816 (1.21429)	Top-1 acc 34.766 (40.403)	Top-5 acc 56.641 (64.502)	lr 0.02400
Train [16][1130/3239]	Time 0.546 (0.877)	Data Time 0.001 (0.020)	Loss 3.4941 (3.5316)	Entropy 1.20792 (1.21423)	Top-1 acc 45.312 (40.404)	Top-5 acc 64.453 (64.505)	lr 0.02400
Train [16][1140/3239]	Time 0.537 (0.877)	Data Time 0.001 (0.020)	Loss 3.3634 (3.5318)	Entropy 1.20765 (1.21418)	Top-1 acc 44.531 (40.402)	Top-5 acc 70.703 (64.506)	lr 0.02400
Train [16][1150/3239]	Time 0.698 (0.895)	Data Time 0.006 (0.020)	Loss 3.4487 (3.5322)	Entropy 1.20765 (1.21412)	Top-1 acc 41.016 (40.395)	Top-5 acc 67.969 (64.498)	lr 0.02400
Train [16][1160/3239]	Time 0.610 (0.895)	Data Time 0.002 (0.019)	Loss 3.4380 (3.5321)	Entropy 1.20769 (1.21407)	Top-1 acc 41.016 (40.399)	Top-5 acc 63.672 (64.496)	lr 0.02400
Train [16][1170/3239]	Time 0.686 (0.894)	Data Time 0.002 (0.019)	Loss 3.6712 (3.5320)	Entropy 1.20758 (1.21401)	Top-1 acc 37.500 (40.403)	Top-5 acc 61.328 (64.497)	lr 0.02400
Train [16][1180/3239]	Time 0.571 (0.894)	Data Time 0.001 (0.019)	Loss 3.3156 (3.5311)	Entropy 1.20709 (1.21396)	Top-1 acc 44.531 (40.435)	Top-5 acc 71.875 (64.521)	lr 0.02400
Train [16][1190/3239]	Time 0.591 (0.893)	Data Time 0.001 (0.019)	Loss 3.5730 (3.5306)	Entropy 1.20687 (1.21390)	Top-1 acc 40.625 (40.450)	Top-5 acc 65.625 (64.539)	lr 0.02400
Train [16][1200/3239]	Time 0.563 (0.893)	Data Time 0.001 (0.019)	Loss 3.6006 (3.5308)	Entropy 1.20674 (1.21384)	Top-1 acc 36.328 (40.453)	Top-5 acc 64.453 (64.541)	lr 0.02400
Train [16][1210/3239]	Time 0.597 (0.892)	Data Time 0.001 (0.019)	Loss 3.4939 (3.5306)	Entropy 1.20625 (1.21378)	Top-1 acc 38.281 (40.456)	Top-5 acc 65.625 (64.546)	lr 0.02400
Train [16][1220/3239]	Time 0.568 (0.892)	Data Time 0.001 (0.019)	Loss 3.5597 (3.5299)	Entropy 1.20556 (1.21372)	Top-1 acc 39.844 (40.478)	Top-5 acc 67.578 (64.558)	lr 0.02400
Train [16][1230/3239]	Time 0.628 (0.892)	Data Time 0.003 (0.018)	Loss 3.4638 (3.5299)	Entropy 1.20546 (1.21365)	Top-1 acc 39.453 (40.466)	Top-5 acc 65.234 (64.559)	lr 0.02400
Train [16][1240/3239]	Time 0.618 (0.892)	Data Time 0.002 (0.018)	Loss 3.5286 (3.5290)	Entropy 1.20536 (1.21358)	Top-1 acc 39.453 (40.492)	Top-5 acc 63.672 (64.583)	lr 0.02400
Train [16][1250/3239]	Time 0.581 (0.891)	Data Time 0.003 (0.018)	Loss 3.5518 (3.5286)	Entropy 1.20486 (1.21352)	Top-1 acc 35.938 (40.493)	Top-5 acc 64.453 (64.590)	lr 0.02400
Train [16][1260/3239]	Time 0.572 (0.891)	Data Time 0.002 (0.018)	Loss 3.4924 (3.5285)	Entropy 1.20461 (1.21345)	Top-1 acc 44.141 (40.513)	Top-5 acc 64.062 (64.584)	lr 0.02400
Train [16][1270/3239]	Time 0.556 (0.891)	Data Time 0.001 (0.018)	Loss 3.5233 (3.5285)	Entropy 1.20390 (1.21337)	Top-1 acc 39.844 (40.505)	Top-5 acc 66.406 (64.585)	lr 0.02400
Train [16][1280/3239]	Time 0.639 (0.890)	Data Time 0.001 (0.018)	Loss 3.6686 (3.5282)	Entropy 1.20385 (1.21330)	Top-1 acc 36.719 (40.515)	Top-5 acc 62.500 (64.589)	lr 0.02400
Train [16][1290/3239]	Time 0.601 (0.890)	Data Time 0.001 (0.018)	Loss 3.4473 (3.5279)	Entropy 1.20379 (1.21323)	Top-1 acc 41.406 (40.526)	Top-5 acc 66.406 (64.592)	lr 0.02400
Train [16][1300/3239]	Time 0.603 (0.890)	Data Time 0.001 (0.018)	Loss 3.3884 (3.5276)	Entropy 1.20332 (1.21315)	Top-1 acc 42.188 (40.531)	Top-5 acc 67.969 (64.604)	lr 0.02400
Train [16][1310/3239]	Time 0.561 (0.889)	Data Time 0.001 (0.017)	Loss 3.5317 (3.5280)	Entropy 1.20299 (1.21308)	Top-1 acc 41.406 (40.521)	Top-5 acc 67.188 (64.593)	lr 0.02400
Train [16][1320/3239]	Time 0.601 (0.889)	Data Time 0.001 (0.017)	Loss 3.6306 (3.5280)	Entropy 1.20298 (1.21300)	Top-1 acc 41.016 (40.521)	Top-5 acc 64.844 (64.594)	lr 0.02400
Train [16][1330/3239]	Time 0.566 (0.889)	Data Time 0.001 (0.017)	Loss 3.4857 (3.5279)	Entropy 1.20323 (1.21292)	Top-1 acc 40.625 (40.522)	Top-5 acc 61.719 (64.589)	lr 0.02400
Train [16][1340/3239]	Time 0.631 (0.888)	Data Time 0.002 (0.017)	Loss 3.3938 (3.5281)	Entropy 1.20307 (1.21285)	Top-1 acc 46.875 (40.517)	Top-5 acc 67.969 (64.595)	lr 0.02400
Train [16][1350/3239]	Time 0.450 (0.888)	Data Time 0.001 (0.017)	Loss 3.4179 (3.5283)	Entropy 1.20263 (1.21278)	Top-1 acc 40.234 (40.513)	Top-5 acc 65.234 (64.587)	lr 0.02400
Train [16][1360/3239]	Time 0.569 (0.887)	Data Time 0.001 (0.017)	Loss 3.5482 (3.5287)	Entropy 1.20241 (1.21270)	Top-1 acc 41.406 (40.507)	Top-5 acc 62.891 (64.577)	lr 0.02400
Train [16][1370/3239]	Time 0.589 (0.887)	Data Time 0.001 (0.017)	Loss 3.5925 (3.5286)	Entropy 1.20240 (1.21263)	Top-1 acc 39.453 (40.503)	Top-5 acc 67.188 (64.576)	lr 0.02399
Train [16][1380/3239]	Time 0.596 (0.887)	Data Time 0.001 (0.017)	Loss 3.5524 (3.5286)	Entropy 1.20263 (1.21256)	Top-1 acc 40.625 (40.508)	Top-5 acc 64.453 (64.579)	lr 0.02399
Train [16][1390/3239]	Time 0.642 (0.886)	Data Time 0.001 (0.017)	Loss 3.7380 (3.5285)	Entropy 1.20241 (1.21248)	Top-1 acc 36.328 (40.513)	Top-5 acc 61.328 (64.586)	lr 0.02399
Train [16][1400/3239]	Time 0.677 (0.886)	Data Time 0.001 (0.016)	Loss 3.4296 (3.5285)	Entropy 1.20218 (1.21241)	Top-1 acc 43.359 (40.512)	Top-5 acc 67.578 (64.589)	lr 0.02399
Train [16][1410/3239]	Time 0.562 (0.886)	Data Time 0.001 (0.016)	Loss 3.6735 (3.5286)	Entropy 1.20201 (1.21234)	Top-1 acc 38.672 (40.517)	Top-5 acc 62.109 (64.595)	lr 0.02399
Train [16][1420/3239]	Time 0.586 (0.886)	Data Time 0.001 (0.016)	Loss 3.4117 (3.5284)	Entropy 1.20202 (1.21226)	Top-1 acc 46.094 (40.518)	Top-5 acc 67.578 (64.601)	lr 0.02399
Train [16][1430/3239]	Time 0.638 (0.886)	Data Time 0.001 (0.016)	Loss 3.5843 (3.5287)	Entropy 1.20180 (1.21219)	Top-1 acc 38.672 (40.518)	Top-5 acc 62.500 (64.595)	lr 0.02399
Train [16][1440/3239]	Time 0.601 (0.885)	Data Time 0.001 (0.016)	Loss 3.3999 (3.5289)	Entropy 1.20178 (1.21212)	Top-1 acc 43.359 (40.513)	Top-5 acc 66.406 (64.593)	lr 0.02399
Train [16][1450/3239]	Time 0.555 (0.885)	Data Time 0.002 (0.016)	Loss 3.6049 (3.5289)	Entropy 1.20176 (1.21205)	Top-1 acc 32.812 (40.518)	Top-5 acc 64.062 (64.594)	lr 0.02399
Train [16][1460/3239]	Time 0.610 (0.885)	Data Time 0.001 (0.016)	Loss 3.5039 (3.5287)	Entropy 1.20197 (1.21198)	Top-1 acc 39.844 (40.520)	Top-5 acc 67.969 (64.598)	lr 0.02399
Train [16][1470/3239]	Time 0.690 (0.884)	Data Time 0.001 (0.016)	Loss 3.6637 (3.5285)	Entropy 1.20184 (1.21191)	Top-1 acc 37.891 (40.523)	Top-5 acc 60.938 (64.603)	lr 0.02399
Train [16][1480/3239]	Time 0.575 (0.884)	Data Time 0.001 (0.016)	Loss 3.5862 (3.5280)	Entropy 1.20149 (1.21184)	Top-1 acc 39.844 (40.537)	Top-5 acc 62.891 (64.619)	lr 0.02399
Train [16][1490/3239]	Time 0.621 (0.884)	Data Time 0.002 (0.016)	Loss 3.4719 (3.5281)	Entropy 1.20165 (1.21177)	Top-1 acc 41.797 (40.529)	Top-5 acc 69.141 (64.619)	lr 0.02399
Train [16][1500/3239]	Time 0.635 (0.884)	Data Time 0.001 (0.016)	Loss 3.5923 (3.5285)	Entropy 1.20130 (1.21171)	Top-1 acc 38.672 (40.525)	Top-5 acc 60.547 (64.605)	lr 0.02399
Train [16][1510/3239]	Time 0.617 (0.883)	Data Time 0.001 (0.015)	Loss 3.4331 (3.5287)	Entropy 1.20111 (1.21163)	Top-1 acc 44.531 (40.523)	Top-5 acc 67.578 (64.600)	lr 0.02399
Train [16][1520/3239]	Time 0.588 (0.883)	Data Time 0.001 (0.015)	Loss 3.2848 (3.5284)	Entropy 1.20111 (1.21157)	Top-1 acc 48.828 (40.535)	Top-5 acc 68.750 (64.605)	lr 0.02399
Train [16][1530/3239]	Time 0.632 (0.883)	Data Time 0.005 (0.015)	Loss 3.3609 (3.5278)	Entropy 1.20157 (1.21150)	Top-1 acc 44.531 (40.549)	Top-5 acc 68.359 (64.619)	lr 0.02399
Train [16][1540/3239]	Time 0.587 (0.882)	Data Time 0.001 (0.015)	Loss 3.5950 (3.5274)	Entropy 1.20161 (1.21143)	Top-1 acc 41.016 (40.553)	Top-5 acc 62.109 (64.623)	lr 0.02399
Train [16][1550/3239]	Time 0.609 (0.882)	Data Time 0.001 (0.015)	Loss 3.4510 (3.5278)	Entropy 1.20126 (1.21137)	Top-1 acc 40.234 (40.544)	Top-5 acc 65.625 (64.617)	lr 0.02399
Train [16][1560/3239]	Time 0.622 (0.882)	Data Time 0.001 (0.015)	Loss 3.3564 (3.5278)	Entropy 1.20079 (1.21130)	Top-1 acc 40.625 (40.543)	Top-5 acc 69.141 (64.622)	lr 0.02399
Train [16][1570/3239]	Time 0.578 (0.882)	Data Time 0.001 (0.015)	Loss 3.6840 (3.5277)	Entropy 1.20067 (1.21124)	Top-1 acc 36.719 (40.544)	Top-5 acc 63.672 (64.626)	lr 0.02399
Train [16][1580/3239]	Time 0.608 (0.882)	Data Time 0.001 (0.015)	Loss 3.4329 (3.5278)	Entropy 1.20078 (1.21117)	Top-1 acc 46.094 (40.546)	Top-5 acc 66.797 (64.623)	lr 0.02399
Train [16][1590/3239]	Time 0.581 (0.881)	Data Time 0.001 (0.015)	Loss 3.6497 (3.5280)	Entropy 1.20025 (1.21110)	Top-1 acc 37.500 (40.535)	Top-5 acc 62.500 (64.617)	lr 0.02399
Train [16][1600/3239]	Time 0.576 (0.881)	Data Time 0.002 (0.015)	Loss 3.2959 (3.5280)	Entropy 1.20040 (1.21104)	Top-1 acc 43.750 (40.537)	Top-5 acc 67.578 (64.620)	lr 0.02399
Train [16][1610/3239]	Time 0.582 (0.881)	Data Time 0.002 (0.015)	Loss 3.6292 (3.5275)	Entropy 1.20021 (1.21097)	Top-1 acc 39.844 (40.551)	Top-5 acc 61.719 (64.625)	lr 0.02399
Train [16][1620/3239]	Time 0.601 (0.881)	Data Time 0.001 (0.015)	Loss 3.7398 (3.5278)	Entropy 1.19956 (1.21090)	Top-1 acc 35.547 (40.548)	Top-5 acc 60.547 (64.614)	lr 0.02398
Train [16][1630/3239]	Time 0.656 (0.881)	Data Time 0.001 (0.014)	Loss 3.5031 (3.5277)	Entropy 1.19965 (1.21083)	Top-1 acc 41.016 (40.549)	Top-5 acc 68.359 (64.619)	lr 0.02398
Train [16][1640/3239]	Time 0.612 (0.880)	Data Time 0.001 (0.014)	Loss 3.5405 (3.5282)	Entropy 1.19950 (1.21077)	Top-1 acc 40.234 (40.538)	Top-5 acc 67.578 (64.614)	lr 0.02398
Train [16][1650/3239]	Time 0.620 (0.880)	Data Time 0.001 (0.014)	Loss 3.5040 (3.5283)	Entropy 1.19927 (1.21070)	Top-1 acc 42.969 (40.536)	Top-5 acc 67.188 (64.612)	lr 0.02398
Train [16][1660/3239]	Time 0.587 (0.880)	Data Time 0.001 (0.014)	Loss 3.6376 (3.5284)	Entropy 1.19945 (1.21063)	Top-1 acc 37.500 (40.526)	Top-5 acc 62.109 (64.609)	lr 0.02398
Train [16][1670/3239]	Time 0.585 (0.880)	Data Time 0.001 (0.014)	Loss 3.4120 (3.5285)	Entropy 1.19956 (1.21056)	Top-1 acc 41.406 (40.528)	Top-5 acc 69.531 (64.610)	lr 0.02398
Train [16][1680/3239]	Time 0.631 (0.880)	Data Time 0.002 (0.014)	Loss 3.5849 (3.5287)	Entropy 1.19961 (1.21050)	Top-1 acc 38.672 (40.521)	Top-5 acc 63.281 (64.602)	lr 0.02398
Train [16][1690/3239]	Time 0.538 (0.879)	Data Time 0.001 (0.014)	Loss 3.4095 (3.5285)	Entropy 1.19948 (1.21043)	Top-1 acc 42.188 (40.532)	Top-5 acc 67.969 (64.604)	lr 0.02398
Train [16][1700/3239]	Time 0.656 (0.879)	Data Time 0.001 (0.014)	Loss 3.5070 (3.5286)	Entropy 1.19950 (1.21037)	Top-1 acc 42.578 (40.532)	Top-5 acc 62.500 (64.603)	lr 0.02398
Train [16][1710/3239]	Time 0.543 (0.879)	Data Time 0.001 (0.014)	Loss 3.6084 (3.5288)	Entropy 1.19958 (1.21031)	Top-1 acc 36.328 (40.526)	Top-5 acc 62.500 (64.595)	lr 0.02398
Train [16][1720/3239]	Time 0.581 (0.878)	Data Time 0.001 (0.014)	Loss 3.7626 (3.5286)	Entropy 1.19890 (1.21024)	Top-1 acc 35.156 (40.531)	Top-5 acc 57.422 (64.594)	lr 0.02398
Train [16][1730/3239]	Time 0.599 (0.878)	Data Time 0.001 (0.014)	Loss 3.5817 (3.5283)	Entropy 1.19852 (1.21018)	Top-1 acc 39.062 (40.537)	Top-5 acc 63.281 (64.598)	lr 0.02398
Train [16][1740/3239]	Time 0.563 (0.878)	Data Time 0.001 (0.014)	Loss 3.6214 (3.5280)	Entropy 1.19802 (1.21011)	Top-1 acc 39.844 (40.550)	Top-5 acc 64.062 (64.605)	lr 0.02398
Train [16][1750/3239]	Time 0.607 (0.878)	Data Time 0.003 (0.014)	Loss 3.6273 (3.5283)	Entropy 1.19804 (1.21004)	Top-1 acc 40.625 (40.551)	Top-5 acc 61.328 (64.600)	lr 0.02398
Train [16][1760/3239]	Time 0.584 (0.878)	Data Time 0.001 (0.014)	Loss 3.3440 (3.5282)	Entropy 1.19838 (1.20997)	Top-1 acc 44.531 (40.560)	Top-5 acc 68.359 (64.602)	lr 0.02398
Train [16][1770/3239]	Time 0.656 (0.878)	Data Time 0.001 (0.013)	Loss 3.3902 (3.5278)	Entropy 1.19810 (1.20991)	Top-1 acc 43.359 (40.567)	Top-5 acc 68.750 (64.610)	lr 0.02398
Train [16][1780/3239]	Time 0.632 (0.877)	Data Time 0.001 (0.013)	Loss 3.6950 (3.5279)	Entropy 1.19819 (1.20984)	Top-1 acc 35.938 (40.562)	Top-5 acc 60.547 (64.607)	lr 0.02398
Train [16][1790/3239]	Time 0.634 (0.877)	Data Time 0.001 (0.013)	Loss 3.8175 (3.5281)	Entropy 1.19791 (1.20977)	Top-1 acc 36.719 (40.558)	Top-5 acc 58.594 (64.603)	lr 0.02398
Train [16][1800/3239]	Time 0.599 (0.877)	Data Time 0.001 (0.013)	Loss 3.6065 (3.5283)	Entropy 1.19763 (1.20971)	Top-1 acc 38.672 (40.556)	Top-5 acc 62.109 (64.600)	lr 0.02398
Train [16][1810/3239]	Time 0.618 (0.888)	Data Time 0.002 (0.013)	Loss 3.5579 (3.5281)	Entropy 1.19756 (1.20964)	Top-1 acc 40.625 (40.559)	Top-5 acc 65.234 (64.608)	lr 0.02398
Train [16][1820/3239]	Time 0.554 (0.888)	Data Time 0.001 (0.013)	Loss 3.4675 (3.5281)	Entropy 1.19720 (1.20957)	Top-1 acc 42.188 (40.562)	Top-5 acc 63.672 (64.604)	lr 0.02398
Train [16][1830/3239]	Time 0.633 (0.887)	Data Time 0.001 (0.013)	Loss 3.3723 (3.5281)	Entropy 1.19702 (1.20951)	Top-1 acc 44.922 (40.562)	Top-5 acc 66.016 (64.604)	lr 0.02398
Train [16][1840/3239]	Time 0.567 (0.887)	Data Time 0.001 (0.013)	Loss 3.3882 (3.5280)	Entropy 1.19718 (1.20944)	Top-1 acc 44.141 (40.568)	Top-5 acc 70.703 (64.611)	lr 0.02398
Train [16][1850/3239]	Time 0.631 (0.887)	Data Time 0.001 (0.013)	Loss 3.6427 (3.5282)	Entropy 1.19726 (1.20937)	Top-1 acc 38.281 (40.566)	Top-5 acc 63.672 (64.610)	lr 0.02398
Train [16][1860/3239]	Time 0.719 (0.886)	Data Time 0.001 (0.013)	Loss 3.5811 (3.5284)	Entropy 1.19708 (1.20931)	Top-1 acc 40.234 (40.563)	Top-5 acc 62.891 (64.609)	lr 0.02398
Train [16][1870/3239]	Time 0.609 (0.886)	Data Time 0.002 (0.013)	Loss 3.6324 (3.5287)	Entropy 1.19662 (1.20924)	Top-1 acc 36.719 (40.553)	Top-5 acc 63.281 (64.598)	lr 0.02397
Train [16][1880/3239]	Time 0.577 (0.886)	Data Time 0.001 (0.013)	Loss 3.5198 (3.5285)	Entropy 1.19668 (1.20917)	Top-1 acc 41.016 (40.555)	Top-5 acc 64.453 (64.604)	lr 0.02397
Train [16][1890/3239]	Time 0.650 (0.886)	Data Time 0.001 (0.013)	Loss 3.4865 (3.5283)	Entropy 1.19691 (1.20911)	Top-1 acc 41.016 (40.561)	Top-5 acc 62.109 (64.609)	lr 0.02397
Train [16][1900/3239]	Time 0.549 (0.886)	Data Time 0.001 (0.013)	Loss 3.5154 (3.5279)	Entropy 1.19644 (1.20904)	Top-1 acc 43.750 (40.571)	Top-5 acc 65.625 (64.616)	lr 0.02397
Train [16][1910/3239]	Time 0.616 (0.886)	Data Time 0.001 (0.013)	Loss 3.4700 (3.5279)	Entropy 1.19613 (1.20898)	Top-1 acc 40.625 (40.567)	Top-5 acc 62.500 (64.611)	lr 0.02397
Train [16][1920/3239]	Time 0.626 (0.885)	Data Time 0.001 (0.013)	Loss 3.5711 (3.5280)	Entropy 1.19612 (1.20891)	Top-1 acc 39.844 (40.565)	Top-5 acc 61.328 (64.610)	lr 0.02397
Train [16][1930/3239]	Time 0.662 (0.885)	Data Time 0.001 (0.013)	Loss 3.4699 (3.5280)	Entropy 1.19584 (1.20884)	Top-1 acc 41.016 (40.567)	Top-5 acc 66.016 (64.607)	lr 0.02397
Train [16][1940/3239]	Time 0.582 (0.885)	Data Time 0.001 (0.012)	Loss 3.5130 (3.5278)	Entropy 1.19608 (1.20878)	Top-1 acc 43.359 (40.568)	Top-5 acc 64.844 (64.612)	lr 0.02397
Train [16][1950/3239]	Time 0.629 (0.885)	Data Time 0.001 (0.012)	Loss 3.6385 (3.5278)	Entropy 1.19583 (1.20871)	Top-1 acc 41.406 (40.574)	Top-5 acc 60.938 (64.616)	lr 0.02397
Train [16][1960/3239]	Time 0.576 (0.885)	Data Time 0.001 (0.012)	Loss 3.5679 (3.5279)	Entropy 1.19589 (1.20865)	Top-1 acc 43.750 (40.572)	Top-5 acc 62.891 (64.614)	lr 0.02397
Train [16][1970/3239]	Time 0.581 (0.884)	Data Time 0.001 (0.012)	Loss 3.4428 (3.5274)	Entropy 1.19540 (1.20858)	Top-1 acc 38.281 (40.578)	Top-5 acc 64.062 (64.623)	lr 0.02397
Train [16][1980/3239]	Time 0.565 (0.884)	Data Time 0.001 (0.012)	Loss 3.6730 (3.5274)	Entropy 1.19534 (1.20851)	Top-1 acc 38.281 (40.575)	Top-5 acc 64.062 (64.626)	lr 0.02397
Train [16][1990/3239]	Time 0.620 (0.884)	Data Time 0.001 (0.012)	Loss 3.3585 (3.5272)	Entropy 1.19553 (1.20845)	Top-1 acc 42.578 (40.582)	Top-5 acc 65.625 (64.631)	lr 0.02397
Train [16][2000/3239]	Time 0.564 (0.884)	Data Time 0.003 (0.012)	Loss 3.6755 (3.5272)	Entropy 1.19489 (1.20838)	Top-1 acc 35.938 (40.574)	Top-5 acc 60.547 (64.632)	lr 0.02397
Train [16][2010/3239]	Time 0.610 (0.884)	Data Time 0.001 (0.012)	Loss 3.8148 (3.5274)	Entropy 1.19490 (1.20831)	Top-1 acc 34.375 (40.574)	Top-5 acc 53.125 (64.629)	lr 0.02397
Train [16][2020/3239]	Time 0.626 (0.883)	Data Time 0.001 (0.012)	Loss 3.2863 (3.5271)	Entropy 1.19464 (1.20825)	Top-1 acc 43.359 (40.582)	Top-5 acc 69.922 (64.628)	lr 0.02397
Train [16][2030/3239]	Time 0.608 (0.883)	Data Time 0.001 (0.012)	Loss 3.6362 (3.5275)	Entropy 1.19449 (1.20818)	Top-1 acc 38.672 (40.574)	Top-5 acc 60.156 (64.619)	lr 0.02397
Train [16][2040/3239]	Time 0.569 (0.883)	Data Time 0.001 (0.012)	Loss 3.3619 (3.5272)	Entropy 1.19457 (1.20811)	Top-1 acc 42.969 (40.578)	Top-5 acc 69.141 (64.623)	lr 0.02397
Train [16][2050/3239]	Time 0.621 (0.883)	Data Time 0.001 (0.012)	Loss 3.5730 (3.5270)	Entropy 1.19436 (1.20805)	Top-1 acc 42.578 (40.583)	Top-5 acc 62.109 (64.621)	lr 0.02397
Train [16][2060/3239]	Time 0.583 (0.882)	Data Time 0.001 (0.012)	Loss 3.3270 (3.5271)	Entropy 1.19409 (1.20798)	Top-1 acc 46.484 (40.582)	Top-5 acc 71.094 (64.620)	lr 0.02397
Train [16][2070/3239]	Time 0.629 (0.882)	Data Time 0.001 (0.012)	Loss 3.6891 (3.5270)	Entropy 1.19351 (1.20791)	Top-1 acc 39.453 (40.586)	Top-5 acc 62.891 (64.620)	lr 0.02397
Train [16][2080/3239]	Time 0.601 (0.882)	Data Time 0.001 (0.012)	Loss 3.6133 (3.5272)	Entropy 1.19305 (1.20784)	Top-1 acc 39.062 (40.579)	Top-5 acc 60.938 (64.618)	lr 0.02397
Train [16][2090/3239]	Time 0.685 (0.882)	Data Time 0.001 (0.012)	Loss 3.4461 (3.5271)	Entropy 1.19326 (1.20777)	Top-1 acc 44.141 (40.582)	Top-5 acc 66.797 (64.619)	lr 0.02397
Train [16][2100/3239]	Time 0.617 (0.882)	Data Time 0.001 (0.012)	Loss 3.7848 (3.5271)	Entropy 1.19318 (1.20770)	Top-1 acc 35.156 (40.583)	Top-5 acc 59.766 (64.620)	lr 0.02397
Train [16][2110/3239]	Time 0.619 (0.882)	Data Time 0.001 (0.012)	Loss 3.4665 (3.5269)	Entropy 1.19281 (1.20763)	Top-1 acc 44.141 (40.590)	Top-5 acc 65.234 (64.625)	lr 0.02397
Train [16][2120/3239]	Time 0.587 (0.882)	Data Time 0.001 (0.012)	Loss 3.4612 (3.5270)	Entropy 1.19256 (1.20756)	Top-1 acc 38.672 (40.588)	Top-5 acc 68.750 (64.624)	lr 0.02396
Train [16][2130/3239]	Time 0.588 (0.881)	Data Time 0.001 (0.012)	Loss 3.6849 (3.5271)	Entropy 1.19241 (1.20749)	Top-1 acc 40.625 (40.582)	Top-5 acc 62.891 (64.620)	lr 0.02396
Train [16][2140/3239]	Time 0.593 (0.881)	Data Time 0.001 (0.011)	Loss 3.6455 (3.5270)	Entropy 1.19253 (1.20742)	Top-1 acc 35.938 (40.584)	Top-5 acc 61.328 (64.616)	lr 0.02396
Train [16][2150/3239]	Time 0.575 (0.881)	Data Time 0.001 (0.011)	Loss 3.3986 (3.5268)	Entropy 1.19250 (1.20735)	Top-1 acc 42.578 (40.586)	Top-5 acc 67.578 (64.618)	lr 0.02396
Train [16][2160/3239]	Time 0.652 (0.881)	Data Time 0.001 (0.011)	Loss 3.7066 (3.5270)	Entropy 1.19224 (1.20728)	Top-1 acc 35.547 (40.585)	Top-5 acc 58.203 (64.612)	lr 0.02396
Train [16][2170/3239]	Time 0.620 (0.881)	Data Time 0.001 (0.011)	Loss 3.3610 (3.5272)	Entropy 1.19207 (1.20721)	Top-1 acc 42.969 (40.584)	Top-5 acc 68.750 (64.610)	lr 0.02396
Train [16][2180/3239]	Time 0.589 (0.880)	Data Time 0.001 (0.011)	Loss 3.7139 (3.5274)	Entropy 1.19169 (1.20714)	Top-1 acc 33.594 (40.578)	Top-5 acc 59.766 (64.603)	lr 0.02396
Train [16][2190/3239]	Time 0.593 (0.880)	Data Time 0.001 (0.011)	Loss 3.3421 (3.5276)	Entropy 1.19148 (1.20707)	Top-1 acc 42.188 (40.572)	Top-5 acc 68.359 (64.595)	lr 0.02396
Train [16][2200/3239]	Time 0.575 (0.880)	Data Time 0.001 (0.011)	Loss 3.6247 (3.5278)	Entropy 1.19160 (1.20700)	Top-1 acc 39.453 (40.567)	Top-5 acc 61.719 (64.591)	lr 0.02396
Train [16][2210/3239]	Time 0.596 (0.880)	Data Time 0.001 (0.011)	Loss 3.5785 (3.5278)	Entropy 1.19123 (1.20693)	Top-1 acc 41.016 (40.564)	Top-5 acc 62.500 (64.592)	lr 0.02396
Train [16][2220/3239]	Time 0.589 (0.880)	Data Time 0.001 (0.011)	Loss 3.4848 (3.5276)	Entropy 1.19091 (1.20686)	Top-1 acc 44.922 (40.573)	Top-5 acc 64.844 (64.596)	lr 0.02396
Train [16][2230/3239]	Time 0.708 (0.880)	Data Time 0.001 (0.011)	Loss 3.6216 (3.5273)	Entropy 1.19055 (1.20679)	Top-1 acc 41.016 (40.586)	Top-5 acc 63.281 (64.601)	lr 0.02396
Train [16][2240/3239]	Time 0.582 (0.879)	Data Time 0.001 (0.011)	Loss 3.4314 (3.5274)	Entropy 1.19050 (1.20671)	Top-1 acc 42.969 (40.584)	Top-5 acc 67.188 (64.601)	lr 0.02396
Train [16][2250/3239]	Time 0.592 (0.879)	Data Time 0.001 (0.011)	Loss 3.2902 (3.5273)	Entropy 1.19032 (1.20664)	Top-1 acc 41.797 (40.584)	Top-5 acc 67.969 (64.601)	lr 0.02396
Train [16][2260/3239]	Time 0.614 (0.879)	Data Time 0.001 (0.011)	Loss 3.6037 (3.5273)	Entropy 1.19043 (1.20657)	Top-1 acc 36.328 (40.584)	Top-5 acc 60.156 (64.601)	lr 0.02396
Train [16][2270/3239]	Time 0.577 (0.879)	Data Time 0.001 (0.011)	Loss 3.3367 (3.5273)	Entropy 1.19046 (1.20650)	Top-1 acc 45.703 (40.585)	Top-5 acc 69.531 (64.603)	lr 0.02396
Train [16][2280/3239]	Time 0.578 (0.879)	Data Time 0.001 (0.011)	Loss 3.3015 (3.5272)	Entropy 1.19045 (1.20643)	Top-1 acc 49.219 (40.587)	Top-5 acc 70.312 (64.609)	lr 0.02396
Train [16][2290/3239]	Time 0.618 (0.879)	Data Time 0.001 (0.011)	Loss 3.5129 (3.5271)	Entropy 1.19014 (1.20636)	Top-1 acc 41.797 (40.586)	Top-5 acc 64.062 (64.608)	lr 0.02396
Train [16][2300/3239]	Time 0.572 (0.879)	Data Time 0.001 (0.011)	Loss 3.5382 (3.5273)	Entropy 1.19016 (1.20629)	Top-1 acc 38.281 (40.583)	Top-5 acc 65.234 (64.609)	lr 0.02396
Train [16][2310/3239]	Time 0.640 (0.878)	Data Time 0.001 (0.011)	Loss 3.6029 (3.5273)	Entropy 1.18950 (1.20621)	Top-1 acc 42.969 (40.586)	Top-5 acc 61.328 (64.616)	lr 0.02396
Train [16][2320/3239]	Time 0.741 (0.878)	Data Time 0.001 (0.011)	Loss 3.4752 (3.5272)	Entropy 1.18961 (1.20614)	Top-1 acc 42.188 (40.586)	Top-5 acc 66.016 (64.619)	lr 0.02396
Train [16][2330/3239]	Time 0.593 (0.878)	Data Time 0.001 (0.011)	Loss 3.4519 (3.5274)	Entropy 1.18928 (1.20607)	Top-1 acc 43.750 (40.579)	Top-5 acc 66.016 (64.613)	lr 0.02396
Train [16][2340/3239]	Time 0.582 (0.878)	Data Time 0.001 (0.011)	Loss 3.6393 (3.5274)	Entropy 1.18864 (1.20600)	Top-1 acc 40.625 (40.580)	Top-5 acc 62.500 (64.615)	lr 0.02396
Train [16][2350/3239]	Time 0.562 (0.878)	Data Time 0.001 (0.011)	Loss 3.4636 (3.5271)	Entropy 1.18827 (1.20593)	Top-1 acc 42.969 (40.583)	Top-5 acc 64.844 (64.624)	lr 0.02396
Train [16][2360/3239]	Time 0.605 (0.878)	Data Time 0.001 (0.011)	Loss 3.5502 (3.5270)	Entropy 1.18789 (1.20585)	Top-1 acc 39.062 (40.580)	Top-5 acc 60.547 (64.622)	lr 0.02396
Train [16][2370/3239]	Time 0.614 (0.877)	Data Time 0.001 (0.011)	Loss 3.6810 (3.5272)	Entropy 1.18795 (1.20577)	Top-1 acc 40.234 (40.576)	Top-5 acc 60.938 (64.617)	lr 0.02395
Train [16][2380/3239]	Time 0.555 (0.877)	Data Time 0.001 (0.011)	Loss 3.4408 (3.5272)	Entropy 1.18761 (1.20570)	Top-1 acc 41.797 (40.578)	Top-5 acc 69.141 (64.620)	lr 0.02395
Train [16][2390/3239]	Time 0.659 (0.877)	Data Time 0.001 (0.010)	Loss 3.5105 (3.5273)	Entropy 1.18774 (1.20562)	Top-1 acc 42.578 (40.575)	Top-5 acc 64.062 (64.618)	lr 0.02395
Train [16][2400/3239]	Time 0.585 (0.877)	Data Time 0.001 (0.010)	Loss 3.4528 (3.5274)	Entropy 1.18752 (1.20555)	Top-1 acc 40.234 (40.572)	Top-5 acc 66.797 (64.616)	lr 0.02395
Train [16][2410/3239]	Time 0.554 (0.877)	Data Time 0.001 (0.010)	Loss 3.3615 (3.5271)	Entropy 1.18740 (1.20547)	Top-1 acc 46.875 (40.578)	Top-5 acc 68.750 (64.622)	lr 0.02395
Train [16][2420/3239]	Time 0.613 (0.877)	Data Time 0.001 (0.010)	Loss 3.5125 (3.5272)	Entropy 1.18743 (1.20540)	Top-1 acc 41.016 (40.577)	Top-5 acc 62.109 (64.618)	lr 0.02395
Train [16][2430/3239]	Time 0.588 (0.877)	Data Time 0.001 (0.010)	Loss 3.4073 (3.5270)	Entropy 1.18724 (1.20533)	Top-1 acc 42.969 (40.580)	Top-5 acc 67.578 (64.625)	lr 0.02395
Train [16][2440/3239]	Time 0.556 (0.877)	Data Time 0.001 (0.010)	Loss 3.5973 (3.5271)	Entropy 1.18686 (1.20525)	Top-1 acc 38.672 (40.573)	Top-5 acc 62.891 (64.621)	lr 0.02395
Train [16][2450/3239]	Time 0.565 (0.876)	Data Time 0.001 (0.010)	Loss 3.5347 (3.5271)	Entropy 1.18639 (1.20517)	Top-1 acc 40.234 (40.573)	Top-5 acc 65.234 (64.620)	lr 0.02395
Train [16][2460/3239]	Time 0.905 (0.885)	Data Time 0.005 (0.010)	Loss 3.5147 (3.5271)	Entropy 1.18634 (1.20510)	Top-1 acc 41.016 (40.572)	Top-5 acc 64.453 (64.621)	lr 0.02395
Train [16][2470/3239]	Time 0.621 (0.885)	Data Time 0.002 (0.010)	Loss 3.4194 (3.5270)	Entropy 1.18639 (1.20502)	Top-1 acc 42.188 (40.574)	Top-5 acc 66.797 (64.620)	lr 0.02395
Train [16][2480/3239]	Time 0.586 (0.885)	Data Time 0.003 (0.010)	Loss 3.4167 (3.5269)	Entropy 1.18617 (1.20495)	Top-1 acc 41.016 (40.576)	Top-5 acc 64.844 (64.620)	lr 0.02395
Train [16][2490/3239]	Time 0.632 (0.884)	Data Time 0.002 (0.010)	Loss 3.3851 (3.5270)	Entropy 1.18610 (1.20487)	Top-1 acc 43.359 (40.576)	Top-5 acc 68.359 (64.623)	lr 0.02395
Train [16][2500/3239]	Time 0.602 (0.884)	Data Time 0.001 (0.010)	Loss 3.6514 (3.5270)	Entropy 1.18601 (1.20480)	Top-1 acc 39.844 (40.578)	Top-5 acc 61.719 (64.625)	lr 0.02395
Train [16][2510/3239]	Time 0.576 (0.884)	Data Time 0.001 (0.010)	Loss 3.5464 (3.5268)	Entropy 1.18628 (1.20472)	Top-1 acc 38.281 (40.583)	Top-5 acc 63.672 (64.623)	lr 0.02395
Train [16][2520/3239]	Time 0.639 (0.884)	Data Time 0.002 (0.010)	Loss 3.3388 (3.5268)	Entropy 1.18651 (1.20465)	Top-1 acc 46.875 (40.583)	Top-5 acc 72.266 (64.621)	lr 0.02395
Train [16][2530/3239]	Time 0.651 (0.884)	Data Time 0.001 (0.010)	Loss 3.3900 (3.5268)	Entropy 1.18697 (1.20458)	Top-1 acc 41.406 (40.584)	Top-5 acc 69.141 (64.621)	lr 0.02395
Train [16][2540/3239]	Time 0.596 (0.884)	Data Time 0.002 (0.010)	Loss 3.7780 (3.5265)	Entropy 1.18695 (1.20451)	Top-1 acc 34.375 (40.593)	Top-5 acc 60.156 (64.629)	lr 0.02395
Train [16][2550/3239]	Time 0.766 (0.884)	Data Time 0.002 (0.010)	Loss 3.3963 (3.5265)	Entropy 1.18652 (1.20444)	Top-1 acc 40.625 (40.594)	Top-5 acc 68.750 (64.629)	lr 0.02395
Train [16][2560/3239]	Time 0.614 (0.884)	Data Time 0.001 (0.010)	Loss 3.5472 (3.5266)	Entropy 1.18642 (1.20437)	Top-1 acc 39.453 (40.587)	Top-5 acc 66.797 (64.630)	lr 0.02395
Train [16][2570/3239]	Time 0.587 (0.884)	Data Time 0.001 (0.010)	Loss 3.6097 (3.5268)	Entropy 1.18593 (1.20430)	Top-1 acc 39.844 (40.585)	Top-5 acc 63.281 (64.621)	lr 0.02395
Train [16][2580/3239]	Time 0.618 (0.884)	Data Time 0.001 (0.010)	Loss 3.4776 (3.5269)	Entropy 1.18589 (1.20423)	Top-1 acc 41.406 (40.587)	Top-5 acc 64.844 (64.619)	lr 0.02395
Train [16][2590/3239]	Time 0.611 (0.883)	Data Time 0.001 (0.010)	Loss 3.3532 (3.5270)	Entropy 1.18609 (1.20416)	Top-1 acc 45.703 (40.585)	Top-5 acc 66.797 (64.615)	lr 0.02395
Train [16][2600/3239]	Time 0.587 (0.883)	Data Time 0.001 (0.010)	Loss 3.4463 (3.5271)	Entropy 1.18576 (1.20409)	Top-1 acc 41.406 (40.582)	Top-5 acc 64.844 (64.617)	lr 0.02395
Train [16][2610/3239]	Time 0.589 (0.883)	Data Time 0.001 (0.010)	Loss 3.4190 (3.5270)	Entropy 1.18522 (1.20402)	Top-1 acc 39.844 (40.584)	Top-5 acc 66.016 (64.619)	lr 0.02395
Train [16][2620/3239]	Time 0.690 (0.883)	Data Time 0.001 (0.010)	Loss 3.5171 (3.5268)	Entropy 1.18541 (1.20395)	Top-1 acc 40.625 (40.585)	Top-5 acc 62.891 (64.621)	lr 0.02394
Train [16][2630/3239]	Time 0.570 (0.883)	Data Time 0.001 (0.010)	Loss 3.5680 (3.5268)	Entropy 1.18534 (1.20387)	Top-1 acc 38.281 (40.586)	Top-5 acc 61.719 (64.616)	lr 0.02394
Train [16][2640/3239]	Time 0.612 (0.883)	Data Time 0.001 (0.010)	Loss 3.4366 (3.5270)	Entropy 1.18547 (1.20380)	Top-1 acc 42.969 (40.580)	Top-5 acc 67.969 (64.612)	lr 0.02394
Train [16][2650/3239]	Time 0.569 (0.883)	Data Time 0.001 (0.010)	Loss 3.6159 (3.5271)	Entropy 1.18503 (1.20374)	Top-1 acc 39.453 (40.575)	Top-5 acc 62.891 (64.607)	lr 0.02394
Train [16][2660/3239]	Time 0.565 (0.883)	Data Time 0.001 (0.010)	Loss 3.5038 (3.5271)	Entropy 1.18521 (1.20367)	Top-1 acc 40.625 (40.576)	Top-5 acc 65.625 (64.606)	lr 0.02394
Train [16][2670/3239]	Time 0.638 (0.882)	Data Time 0.001 (0.010)	Loss 3.3876 (3.5272)	Entropy 1.18543 (1.20360)	Top-1 acc 41.797 (40.569)	Top-5 acc 66.016 (64.601)	lr 0.02394
Train [16][2680/3239]	Time 0.621 (0.882)	Data Time 0.002 (0.010)	Loss 3.3779 (3.5270)	Entropy 1.18511 (1.20353)	Top-1 acc 43.359 (40.574)	Top-5 acc 69.922 (64.608)	lr 0.02394
Train [16][2690/3239]	Time 0.705 (0.882)	Data Time 0.001 (0.010)	Loss 3.5504 (3.5269)	Entropy 1.18514 (1.20346)	Top-1 acc 39.062 (40.577)	Top-5 acc 61.719 (64.613)	lr 0.02394
Train [16][2700/3239]	Time 0.606 (0.882)	Data Time 0.001 (0.010)	Loss 3.3537 (3.5268)	Entropy 1.18491 (1.20339)	Top-1 acc 44.531 (40.578)	Top-5 acc 67.578 (64.613)	lr 0.02394
Train [16][2710/3239]	Time 0.587 (0.882)	Data Time 0.001 (0.009)	Loss 3.5310 (3.5268)	Entropy 1.18442 (1.20332)	Top-1 acc 41.797 (40.579)	Top-5 acc 63.281 (64.612)	lr 0.02394
Train [16][2720/3239]	Time 0.625 (0.882)	Data Time 0.001 (0.009)	Loss 3.3598 (3.5268)	Entropy 1.18419 (1.20325)	Top-1 acc 46.484 (40.579)	Top-5 acc 72.656 (64.614)	lr 0.02394
Train [16][2730/3239]	Time 0.567 (0.882)	Data Time 0.001 (0.009)	Loss 3.4634 (3.5267)	Entropy 1.18360 (1.20318)	Top-1 acc 43.750 (40.585)	Top-5 acc 64.062 (64.615)	lr 0.02394
Train [16][2740/3239]	Time 0.576 (0.882)	Data Time 0.001 (0.009)	Loss 3.3663 (3.5269)	Entropy 1.18324 (1.20311)	Top-1 acc 41.406 (40.578)	Top-5 acc 68.359 (64.613)	lr 0.02394
Train [16][2750/3239]	Time 0.551 (0.882)	Data Time 0.001 (0.009)	Loss 3.6438 (3.5268)	Entropy 1.18275 (1.20304)	Top-1 acc 35.938 (40.581)	Top-5 acc 61.719 (64.616)	lr 0.02394
Train [16][2760/3239]	Time 0.591 (0.882)	Data Time 0.001 (0.009)	Loss 3.4085 (3.5271)	Entropy 1.18279 (1.20296)	Top-1 acc 43.359 (40.577)	Top-5 acc 66.016 (64.606)	lr 0.02394
Train [16][2770/3239]	Time 0.570 (0.882)	Data Time 0.001 (0.009)	Loss 3.3878 (3.5270)	Entropy 1.18239 (1.20289)	Top-1 acc 44.531 (40.580)	Top-5 acc 69.531 (64.608)	lr 0.02394
Train [16][2780/3239]	Time 0.721 (0.882)	Data Time 0.001 (0.009)	Loss 3.6071 (3.5268)	Entropy 1.18197 (1.20282)	Top-1 acc 39.062 (40.582)	Top-5 acc 63.672 (64.613)	lr 0.02394
Train [16][2790/3239]	Time 0.573 (0.882)	Data Time 0.001 (0.009)	Loss 3.5014 (3.5270)	Entropy 1.18195 (1.20274)	Top-1 acc 41.797 (40.578)	Top-5 acc 65.625 (64.613)	lr 0.02394
Train [16][2800/3239]	Time 0.600 (0.882)	Data Time 0.001 (0.009)	Loss 3.5435 (3.5269)	Entropy 1.18183 (1.20267)	Top-1 acc 42.578 (40.578)	Top-5 acc 63.281 (64.613)	lr 0.02394
Train [16][2810/3239]	Time 0.664 (0.882)	Data Time 0.001 (0.009)	Loss 3.5007 (3.5269)	Entropy 1.18169 (1.20259)	Top-1 acc 42.578 (40.577)	Top-5 acc 66.797 (64.611)	lr 0.02394
Train [16][2820/3239]	Time 0.578 (0.881)	Data Time 0.001 (0.009)	Loss 3.5055 (3.5266)	Entropy 1.18128 (1.20252)	Top-1 acc 38.281 (40.582)	Top-5 acc 63.672 (64.617)	lr 0.02394
Train [16][2830/3239]	Time 0.601 (0.881)	Data Time 0.001 (0.009)	Loss 3.4091 (3.5264)	Entropy 1.18126 (1.20244)	Top-1 acc 43.750 (40.587)	Top-5 acc 67.188 (64.623)	lr 0.02394
Train [16][2840/3239]	Time 0.600 (0.881)	Data Time 0.001 (0.009)	Loss 3.4522 (3.5262)	Entropy 1.18092 (1.20237)	Top-1 acc 42.969 (40.589)	Top-5 acc 67.188 (64.627)	lr 0.02394
Train [16][2850/3239]	Time 0.696 (0.881)	Data Time 0.001 (0.009)	Loss 3.4069 (3.5262)	Entropy 1.18116 (1.20229)	Top-1 acc 42.188 (40.586)	Top-5 acc 67.188 (64.628)	lr 0.02394
Train [16][2860/3239]	Time 0.624 (0.881)	Data Time 0.001 (0.009)	Loss 3.4105 (3.5262)	Entropy 1.18141 (1.20222)	Top-1 acc 43.359 (40.588)	Top-5 acc 66.406 (64.628)	lr 0.02393
Train [16][2870/3239]	Time 0.588 (0.881)	Data Time 0.001 (0.009)	Loss 3.5884 (3.5262)	Entropy 1.18107 (1.20215)	Top-1 acc 40.625 (40.588)	Top-5 acc 63.281 (64.627)	lr 0.02393
Train [16][2880/3239]	Time 0.610 (0.881)	Data Time 0.001 (0.009)	Loss 3.5298 (3.5260)	Entropy 1.18098 (1.20207)	Top-1 acc 41.797 (40.589)	Top-5 acc 64.844 (64.629)	lr 0.02393
Train [16][2890/3239]	Time 0.578 (0.880)	Data Time 0.001 (0.009)	Loss 3.6578 (3.5259)	Entropy 1.18066 (1.20200)	Top-1 acc 39.062 (40.590)	Top-5 acc 61.328 (64.628)	lr 0.02393
Train [16][2900/3239]	Time 0.607 (0.880)	Data Time 0.001 (0.009)	Loss 3.4184 (3.5259)	Entropy 1.18005 (1.20193)	Top-1 acc 41.797 (40.589)	Top-5 acc 69.922 (64.631)	lr 0.02393
Train [16][2910/3239]	Time 0.585 (0.880)	Data Time 0.001 (0.009)	Loss 3.5886 (3.5260)	Entropy 1.17997 (1.20185)	Top-1 acc 37.109 (40.591)	Top-5 acc 64.844 (64.633)	lr 0.02393
Train [16][2920/3239]	Time 0.618 (0.880)	Data Time 0.002 (0.009)	Loss 3.4385 (3.5259)	Entropy 1.17939 (1.20178)	Top-1 acc 42.969 (40.592)	Top-5 acc 68.359 (64.633)	lr 0.02393
Train [16][2930/3239]	Time 0.605 (0.880)	Data Time 0.001 (0.009)	Loss 3.4779 (3.5258)	Entropy 1.17929 (1.20170)	Top-1 acc 38.672 (40.589)	Top-5 acc 63.281 (64.636)	lr 0.02393
Train [16][2940/3239]	Time 0.586 (0.880)	Data Time 0.001 (0.009)	Loss 3.3642 (3.5258)	Entropy 1.17881 (1.20162)	Top-1 acc 43.359 (40.590)	Top-5 acc 68.359 (64.638)	lr 0.02393
Train [16][2950/3239]	Time 0.596 (0.880)	Data Time 0.001 (0.009)	Loss 3.3556 (3.5256)	Entropy 1.17854 (1.20154)	Top-1 acc 44.922 (40.595)	Top-5 acc 68.359 (64.644)	lr 0.02393
Train [16][2960/3239]	Time 0.587 (0.880)	Data Time 0.001 (0.009)	Loss 3.6990 (3.5256)	Entropy 1.17809 (1.20147)	Top-1 acc 38.281 (40.596)	Top-5 acc 57.422 (64.642)	lr 0.02393
Train [16][2970/3239]	Time 0.630 (0.880)	Data Time 0.001 (0.009)	Loss 3.5265 (3.5255)	Entropy 1.17773 (1.20139)	Top-1 acc 39.844 (40.594)	Top-5 acc 66.016 (64.644)	lr 0.02393
Train [16][2980/3239]	Time 0.611 (0.879)	Data Time 0.001 (0.009)	Loss 3.9282 (3.5258)	Entropy 1.17715 (1.20131)	Top-1 acc 29.688 (40.586)	Top-5 acc 60.938 (64.636)	lr 0.02393
Train [16][2990/3239]	Time 0.639 (0.879)	Data Time 0.001 (0.009)	Loss 3.4403 (3.5258)	Entropy 1.17707 (1.20123)	Top-1 acc 42.578 (40.587)	Top-5 acc 66.016 (64.636)	lr 0.02393
Train [16][3000/3239]	Time 0.591 (0.879)	Data Time 0.002 (0.009)	Loss 3.4280 (3.5258)	Entropy 1.17691 (1.20115)	Top-1 acc 45.703 (40.585)	Top-5 acc 68.359 (64.635)	lr 0.02393
Train [16][3010/3239]	Time 0.627 (0.879)	Data Time 0.003 (0.009)	Loss 3.5680 (3.5257)	Entropy 1.17620 (1.20106)	Top-1 acc 37.891 (40.586)	Top-5 acc 61.719 (64.640)	lr 0.02393
Train [16][3020/3239]	Time 0.600 (0.879)	Data Time 0.001 (0.009)	Loss 3.5959 (3.5256)	Entropy 1.17591 (1.20098)	Top-1 acc 37.109 (40.589)	Top-5 acc 61.328 (64.641)	lr 0.02393
Train [16][3030/3239]	Time 0.607 (0.879)	Data Time 0.002 (0.009)	Loss 3.6672 (3.5255)	Entropy 1.17581 (1.20090)	Top-1 acc 39.062 (40.589)	Top-5 acc 60.547 (64.641)	lr 0.02393
Train [16][3040/3239]	Time 0.606 (0.879)	Data Time 0.001 (0.009)	Loss 3.4979 (3.5255)	Entropy 1.17547 (1.20082)	Top-1 acc 39.844 (40.587)	Top-5 acc 64.062 (64.640)	lr 0.02393
Train [16][3050/3239]	Time 0.644 (0.878)	Data Time 0.001 (0.009)	Loss 3.5669 (3.5254)	Entropy 1.17502 (1.20073)	Top-1 acc 42.969 (40.589)	Top-5 acc 62.500 (64.643)	lr 0.02393
Train [16][3060/3239]	Time 0.545 (0.878)	Data Time 0.001 (0.009)	Loss 3.6332 (3.5252)	Entropy 1.17528 (1.20065)	Top-1 acc 33.594 (40.592)	Top-5 acc 62.500 (64.644)	lr 0.02393
Train [16][3070/3239]	Time 0.587 (0.878)	Data Time 0.001 (0.009)	Loss 3.2946 (3.5252)	Entropy 1.17549 (1.20057)	Top-1 acc 43.750 (40.592)	Top-5 acc 70.703 (64.644)	lr 0.02393
Train [16][3080/3239]	Time 0.674 (0.878)	Data Time 0.001 (0.009)	Loss 3.5690 (3.5254)	Entropy 1.17544 (1.20049)	Top-1 acc 37.500 (40.589)	Top-5 acc 62.109 (64.639)	lr 0.02393
Train [16][3090/3239]	Time 0.610 (0.878)	Data Time 0.001 (0.009)	Loss 3.3685 (3.5252)	Entropy 1.17543 (1.20040)	Top-1 acc 46.484 (40.593)	Top-5 acc 68.359 (64.645)	lr 0.02393
Train [16][3100/3239]	Time 0.610 (0.878)	Data Time 0.003 (0.009)	Loss 3.5701 (3.5252)	Entropy 1.17490 (1.20032)	Top-1 acc 39.062 (40.589)	Top-5 acc 64.062 (64.647)	lr 0.02393
Train [16][3110/3239]	Time 0.612 (0.878)	Data Time 0.001 (0.009)	Loss 3.4216 (3.5250)	Entropy 1.17480 (1.20024)	Top-1 acc 40.625 (40.590)	Top-5 acc 67.578 (64.650)	lr 0.02392
Train [16][3120/3239]	Time 0.590 (0.884)	Data Time 0.002 (0.009)	Loss 3.5059 (3.5250)	Entropy 1.17417 (1.20016)	Top-1 acc 39.453 (40.592)	Top-5 acc 66.406 (64.652)	lr 0.02392
Train [16][3130/3239]	Time 0.577 (0.884)	Data Time 0.001 (0.009)	Loss 3.6053 (3.5252)	Entropy 1.17365 (1.20008)	Top-1 acc 39.062 (40.590)	Top-5 acc 64.062 (64.649)	lr 0.02392
Train [16][3140/3239]	Time 0.595 (0.884)	Data Time 0.001 (0.008)	Loss 3.8271 (3.5253)	Entropy 1.17341 (1.19999)	Top-1 acc 31.250 (40.585)	Top-5 acc 57.031 (64.645)	lr 0.02392
Train [16][3150/3239]	Time 0.598 (0.884)	Data Time 0.001 (0.008)	Loss 3.5136 (3.5253)	Entropy 1.17384 (1.19991)	Top-1 acc 35.547 (40.583)	Top-5 acc 64.844 (64.642)	lr 0.02392
Train [16][3160/3239]	Time 0.594 (0.884)	Data Time 0.002 (0.008)	Loss 3.3949 (3.5251)	Entropy 1.17430 (1.19983)	Top-1 acc 41.406 (40.583)	Top-5 acc 66.406 (64.647)	lr 0.02392
Train [16][3170/3239]	Time 0.703 (0.884)	Data Time 0.002 (0.008)	Loss 3.5411 (3.5251)	Entropy 1.17419 (1.19974)	Top-1 acc 40.234 (40.583)	Top-5 acc 63.281 (64.650)	lr 0.02392
Train [16][3180/3239]	Time 0.581 (0.884)	Data Time 0.000 (0.008)	Loss 3.6476 (3.5250)	Entropy 1.17453 (1.19966)	Top-1 acc 37.500 (40.587)	Top-5 acc 65.625 (64.654)	lr 0.02392
Train [16][3190/3239]	Time 0.557 (0.884)	Data Time 0.002 (0.008)	Loss 3.3924 (3.5249)	Entropy 1.17453 (1.19959)	Top-1 acc 42.188 (40.593)	Top-5 acc 69.531 (64.656)	lr 0.02392
Train [16][3200/3239]	Time 0.535 (0.883)	Data Time 0.002 (0.008)	Loss 3.3391 (3.5248)	Entropy 1.17476 (1.19951)	Top-1 acc 43.750 (40.595)	Top-5 acc 69.531 (64.657)	lr 0.02392
Train [16][3210/3239]	Time 0.575 (0.883)	Data Time 0.000 (0.008)	Loss 3.8259 (3.5248)	Entropy 1.17462 (1.19943)	Top-1 acc 33.984 (40.593)	Top-5 acc 60.547 (64.657)	lr 0.02392
Train [16][3220/3239]	Time 0.596 (0.883)	Data Time 0.000 (0.008)	Loss 3.4961 (3.5248)	Entropy 1.17467 (1.19935)	Top-1 acc 40.625 (40.593)	Top-5 acc 65.234 (64.656)	lr 0.02392
Train [16][3230/3239]	Time 0.590 (0.883)	Data Time 0.000 (0.008)	Loss 3.2013 (3.5248)	Entropy 1.17436 (1.19928)	Top-1 acc 48.047 (40.593)	Top-5 acc 69.141 (64.652)	lr 0.02392
Train [16][3239/3239]	Time 1.485 (0.883)	Data Time 0.000 (0.008)	Loss 3.7501 (3.5247)	Entropy 1.17400 (1.19921)	Top-1 acc 29.630 (40.597)	Top-5 acc 55.556 (64.653)	lr 0.02392
==========Valid [16/120]	loss 2.265	top-1 acc 50.623 (50.623)	top-5 acc 74.481	Train top-1 40.597	top-5 64.653	Entropy 1.17400	Latency-None: 0.000ms	Flops: 539.76M
Train [17][0/3239]	Time 19.274 (19.274)	Data Time 17.778 (17.778)	Loss 3.6001 (3.6001)	Entropy 1.17349 (1.17349)	Top-1 acc 40.234 (40.234)	Top-5 acc 65.234 (65.234)	lr 0.02392
Train [17][10/3239]	Time 0.602 (2.613)	Data Time 0.001 (1.622)	Loss 3.4798 (3.5162)	Entropy 1.17340 (1.17348)	Top-1 acc 43.750 (40.945)	Top-5 acc 65.625 (66.193)	lr 0.02392
Train [17][20/3239]	Time 0.620 (1.787)	Data Time 0.001 (0.851)	Loss 3.3022 (3.4605)	Entropy 1.17391 (1.17358)	Top-1 acc 48.828 (42.634)	Top-5 acc 69.141 (66.518)	lr 0.02392
Train [17][30/3239]	Time 0.612 (1.532)	Data Time 0.002 (0.577)	Loss 3.4283 (3.4517)	Entropy 1.17384 (1.17367)	Top-1 acc 43.359 (42.792)	Top-5 acc 67.969 (66.721)	lr 0.02392
Train [17][40/3239]	Time 0.613 (1.378)	Data Time 0.001 (0.437)	Loss 3.5631 (3.4561)	Entropy 1.17385 (1.17374)	Top-1 acc 41.406 (42.540)	Top-5 acc 63.672 (66.444)	lr 0.02392
Train [17][50/3239]	Time 0.641 (1.281)	Data Time 0.002 (0.352)	Loss 3.4720 (3.4593)	Entropy 1.17343 (1.17373)	Top-1 acc 41.016 (42.279)	Top-5 acc 67.188 (66.452)	lr 0.02392
Train [17][60/3239]	Time 0.585 (1.210)	Data Time 0.001 (0.294)	Loss 3.2883 (3.4597)	Entropy 1.17315 (1.17366)	Top-1 acc 48.047 (42.194)	Top-5 acc 71.875 (66.432)	lr 0.02392
Train [17][70/3239]	Time 0.716 (1.160)	Data Time 0.001 (0.253)	Loss 3.3579 (3.4577)	Entropy 1.17310 (1.17358)	Top-1 acc 41.016 (42.243)	Top-5 acc 68.750 (66.489)	lr 0.02392
Train [17][80/3239]	Time 0.610 (1.119)	Data Time 0.001 (0.222)	Loss 3.6978 (3.4679)	Entropy 1.17302 (1.17353)	Top-1 acc 36.719 (42.101)	Top-5 acc 64.062 (66.315)	lr 0.02392
Train [17][90/3239]	Time 0.639 (1.090)	Data Time 0.001 (0.198)	Loss 3.4690 (3.4677)	Entropy 1.17298 (1.17346)	Top-1 acc 38.672 (42.037)	Top-5 acc 64.453 (66.166)	lr 0.02392
Train [17][100/3239]	Time 0.611 (1.064)	Data Time 0.001 (0.179)	Loss 3.4240 (3.4637)	Entropy 1.17255 (1.17340)	Top-1 acc 47.266 (42.160)	Top-5 acc 67.188 (66.252)	lr 0.02392
Train [17][110/3239]	Time 0.553 (1.042)	Data Time 0.001 (0.163)	Loss 3.3414 (3.4601)	Entropy 1.17218 (1.17331)	Top-1 acc 44.141 (42.188)	Top-5 acc 67.969 (66.297)	lr 0.02391
Train [17][120/3239]	Time 0.599 (1.028)	Data Time 0.001 (0.149)	Loss 3.4203 (3.4665)	Entropy 1.17191 (1.17320)	Top-1 acc 46.875 (42.081)	Top-5 acc 66.797 (66.142)	lr 0.02391
Train [17][130/3239]	Time 0.657 (1.015)	Data Time 0.001 (0.138)	Loss 3.5823 (3.4653)	Entropy 1.17188 (1.17309)	Top-1 acc 44.141 (42.146)	Top-5 acc 59.766 (66.120)	lr 0.02391
Train [17][140/3239]	Time 0.643 (1.004)	Data Time 0.001 (0.129)	Loss 3.4927 (3.4651)	Entropy 1.17153 (1.17299)	Top-1 acc 42.578 (42.165)	Top-5 acc 66.016 (66.079)	lr 0.02391
Train [17][150/3239]	Time 0.577 (0.994)	Data Time 0.001 (0.120)	Loss 3.8101 (3.4675)	Entropy 1.17113 (1.17289)	Top-1 acc 35.938 (42.076)	Top-5 acc 57.422 (65.990)	lr 0.02391
Train [17][160/3239]	Time 0.593 (0.985)	Data Time 0.001 (0.113)	Loss 3.5892 (3.4684)	Entropy 1.17083 (1.17277)	Top-1 acc 39.062 (42.032)	Top-5 acc 64.062 (65.950)	lr 0.02391
Train [17][170/3239]	Time 0.624 (0.978)	Data Time 0.001 (0.106)	Loss 3.3640 (3.4699)	Entropy 1.17081 (1.17266)	Top-1 acc 42.969 (42.041)	Top-5 acc 71.484 (65.938)	lr 0.02391
Train [17][180/3239]	Time 0.585 (0.971)	Data Time 0.002 (0.101)	Loss 3.3734 (3.4684)	Entropy 1.17079 (1.17255)	Top-1 acc 42.578 (42.041)	Top-5 acc 69.922 (65.927)	lr 0.02391
Train [17][190/3239]	Time 0.586 (0.966)	Data Time 0.001 (0.095)	Loss 3.4597 (3.4698)	Entropy 1.17097 (1.17247)	Top-1 acc 42.188 (42.026)	Top-5 acc 64.844 (65.879)	lr 0.02391
Train [17][200/3239]	Time 0.562 (0.960)	Data Time 0.001 (0.091)	Loss 3.5834 (3.4711)	Entropy 1.17094 (1.17239)	Top-1 acc 37.109 (41.972)	Top-5 acc 64.844 (65.829)	lr 0.02391
Train [17][210/3239]	Time 0.591 (0.956)	Data Time 0.001 (0.087)	Loss 3.5284 (3.4698)	Entropy 1.17077 (1.17233)	Top-1 acc 40.625 (41.936)	Top-5 acc 66.016 (65.879)	lr 0.02391
Train [17][220/3239]	Time 0.612 (0.950)	Data Time 0.001 (0.083)	Loss 3.5091 (3.4686)	Entropy 1.17023 (1.17225)	Top-1 acc 41.016 (41.975)	Top-5 acc 64.453 (65.871)	lr 0.02391
Train [17][230/3239]	Time 0.661 (0.946)	Data Time 0.001 (0.079)	Loss 3.5587 (3.4730)	Entropy 1.17006 (1.17216)	Top-1 acc 40.234 (41.834)	Top-5 acc 62.891 (65.754)	lr 0.02391
Train [17][240/3239]	Time 0.583 (0.942)	Data Time 0.001 (0.076)	Loss 3.2127 (3.4728)	Entropy 1.16969 (1.17207)	Top-1 acc 45.703 (41.842)	Top-5 acc 70.312 (65.734)	lr 0.02391
Train [17][250/3239]	Time 0.624 (0.938)	Data Time 0.001 (0.073)	Loss 3.4399 (3.4739)	Entropy 1.16966 (1.17197)	Top-1 acc 42.188 (41.848)	Top-5 acc 69.141 (65.695)	lr 0.02391
Train [17][260/3239]	Time 0.580 (0.933)	Data Time 0.002 (0.070)	Loss 3.4846 (3.4748)	Entropy 1.16968 (1.17188)	Top-1 acc 37.891 (41.843)	Top-5 acc 64.453 (65.665)	lr 0.02391
Train [17][270/3239]	Time 0.637 (0.930)	Data Time 0.022 (0.068)	Loss 3.5306 (3.4761)	Entropy 1.16957 (1.17180)	Top-1 acc 39.453 (41.808)	Top-5 acc 64.453 (65.661)	lr 0.02391
Train [17][280/3239]	Time 0.621 (0.925)	Data Time 0.001 (0.066)	Loss 3.6191 (3.4793)	Entropy 1.16929 (1.17172)	Top-1 acc 37.500 (41.740)	Top-5 acc 64.062 (65.617)	lr 0.02391
Train [17][290/3239]	Time 0.556 (0.923)	Data Time 0.002 (0.064)	Loss 3.6719 (3.4786)	Entropy 1.16887 (1.17163)	Top-1 acc 38.672 (41.714)	Top-5 acc 62.500 (65.614)	lr 0.02391
Train [17][300/3239]	Time 0.664 (0.921)	Data Time 0.001 (0.061)	Loss 3.2867 (3.4780)	Entropy 1.16851 (1.17153)	Top-1 acc 44.922 (41.723)	Top-5 acc 69.531 (65.613)	lr 0.02391
Train [17][310/3239]	Time 0.583 (0.919)	Data Time 0.001 (0.060)	Loss 3.4927 (3.4785)	Entropy 1.16846 (1.17143)	Top-1 acc 41.797 (41.720)	Top-5 acc 66.797 (65.602)	lr 0.02391
Train [17][320/3239]	Time 0.599 (0.917)	Data Time 0.001 (0.058)	Loss 3.4689 (3.4768)	Entropy 1.16828 (1.17134)	Top-1 acc 39.844 (41.718)	Top-5 acc 65.625 (65.640)	lr 0.02391
Train [17][330/3239]	Time 0.582 (0.915)	Data Time 0.001 (0.056)	Loss 3.3444 (3.4770)	Entropy 1.16820 (1.17124)	Top-1 acc 48.047 (41.697)	Top-5 acc 68.750 (65.614)	lr 0.02391
Train [17][340/3239]	Time 0.592 (0.913)	Data Time 0.001 (0.054)	Loss 3.7888 (3.4768)	Entropy 1.16767 (1.17115)	Top-1 acc 34.766 (41.680)	Top-5 acc 61.719 (65.620)	lr 0.02391
Train [17][350/3239]	Time 0.597 (0.912)	Data Time 0.001 (0.053)	Loss 3.3251 (3.4783)	Entropy 1.16763 (1.17105)	Top-1 acc 41.016 (41.643)	Top-5 acc 70.703 (65.616)	lr 0.02390
Train [17][360/3239]	Time 0.620 (0.910)	Data Time 0.001 (0.052)	Loss 3.3367 (3.4768)	Entropy 1.16755 (1.17096)	Top-1 acc 40.234 (41.664)	Top-5 acc 71.484 (65.657)	lr 0.02390
Train [17][370/3239]	Time 0.730 (0.909)	Data Time 0.001 (0.050)	Loss 3.5289 (3.4766)	Entropy 1.16767 (1.17087)	Top-1 acc 38.672 (41.663)	Top-5 acc 65.625 (65.663)	lr 0.02390
Train [17][380/3239]	Time 0.631 (0.907)	Data Time 0.002 (0.049)	Loss 3.6281 (3.4774)	Entropy 1.16718 (1.17078)	Top-1 acc 37.500 (41.634)	Top-5 acc 61.719 (65.628)	lr 0.02390
Train [17][390/3239]	Time 0.623 (0.906)	Data Time 0.001 (0.048)	Loss 3.2834 (3.4792)	Entropy 1.16707 (1.17069)	Top-1 acc 44.922 (41.598)	Top-5 acc 68.750 (65.576)	lr 0.02390
Train [17][400/3239]	Time 0.595 (0.904)	Data Time 0.001 (0.047)	Loss 3.5981 (3.4804)	Entropy 1.16706 (1.17060)	Top-1 acc 41.406 (41.564)	Top-5 acc 61.719 (65.544)	lr 0.02390
Train [17][410/3239]	Time 0.628 (0.903)	Data Time 0.001 (0.046)	Loss 3.3915 (3.4797)	Entropy 1.16635 (1.17050)	Top-1 acc 43.750 (41.600)	Top-5 acc 67.578 (65.577)	lr 0.02390
Train [17][420/3239]	Time 0.618 (0.901)	Data Time 0.001 (0.044)	Loss 3.5930 (3.4804)	Entropy 1.16630 (1.17040)	Top-1 acc 39.844 (41.578)	Top-5 acc 64.062 (65.568)	lr 0.02390
Train [17][430/3239]	Time 0.578 (0.900)	Data Time 0.001 (0.044)	Loss 3.4926 (3.4802)	Entropy 1.16628 (1.17031)	Top-1 acc 39.062 (41.594)	Top-5 acc 67.188 (65.587)	lr 0.02390
Train [17][440/3239]	Time 0.567 (0.899)	Data Time 0.001 (0.043)	Loss 3.6416 (3.4820)	Entropy 1.16618 (1.17022)	Top-1 acc 38.672 (41.535)	Top-5 acc 62.109 (65.559)	lr 0.02390
Train [17][450/3239]	Time 0.621 (0.897)	Data Time 0.002 (0.042)	Loss 3.4592 (3.4824)	Entropy 1.16639 (1.17013)	Top-1 acc 41.406 (41.512)	Top-5 acc 64.453 (65.538)	lr 0.02390
Train [17][460/3239]	Time 0.626 (0.895)	Data Time 0.001 (0.041)	Loss 3.4825 (3.4813)	Entropy 1.16630 (1.17005)	Top-1 acc 40.625 (41.528)	Top-5 acc 66.016 (65.563)	lr 0.02390
Train [17][470/3239]	Time 0.626 (0.894)	Data Time 0.001 (0.040)	Loss 3.3376 (3.4813)	Entropy 1.16625 (1.16997)	Top-1 acc 42.969 (41.504)	Top-5 acc 67.969 (65.570)	lr 0.02390
Train [17][480/3239]	Time 0.584 (0.893)	Data Time 0.001 (0.039)	Loss 3.4691 (3.4804)	Entropy 1.16623 (1.16989)	Top-1 acc 42.578 (41.526)	Top-5 acc 65.625 (65.588)	lr 0.02390
Train [17][490/3239]	Time 0.599 (0.892)	Data Time 0.001 (0.038)	Loss 3.3557 (3.4804)	Entropy 1.16646 (1.16982)	Top-1 acc 44.922 (41.510)	Top-5 acc 71.875 (65.613)	lr 0.02390
Train [17][500/3239]	Time 0.548 (0.891)	Data Time 0.001 (0.038)	Loss 3.5140 (3.4793)	Entropy 1.16659 (1.16976)	Top-1 acc 44.531 (41.547)	Top-5 acc 63.672 (65.633)	lr 0.02390
Train [17][510/3239]	Time 0.580 (0.890)	Data Time 0.001 (0.037)	Loss 3.5960 (3.4796)	Entropy 1.16672 (1.16969)	Top-1 acc 42.188 (41.542)	Top-5 acc 62.891 (65.629)	lr 0.02390
Train [17][520/3239]	Time 0.607 (0.890)	Data Time 0.001 (0.036)	Loss 3.4649 (3.4799)	Entropy 1.16686 (1.16964)	Top-1 acc 44.531 (41.540)	Top-5 acc 65.234 (65.638)	lr 0.02390
Train [17][530/3239]	Time 0.869 (0.930)	Data Time 0.005 (0.036)	Loss 3.4199 (3.4799)	Entropy 1.16652 (1.16958)	Top-1 acc 41.797 (41.524)	Top-5 acc 67.578 (65.630)	lr 0.02390
Train [17][540/3239]	Time 0.597 (0.929)	Data Time 0.002 (0.035)	Loss 3.6114 (3.4809)	Entropy 1.16660 (1.16953)	Top-1 acc 41.406 (41.515)	Top-5 acc 64.453 (65.626)	lr 0.02390
Train [17][550/3239]	Time 0.515 (0.927)	Data Time 0.001 (0.034)	Loss 3.6693 (3.4809)	Entropy 1.16646 (1.16947)	Top-1 acc 37.891 (41.509)	Top-5 acc 60.547 (65.618)	lr 0.02390
Train [17][560/3239]	Time 0.586 (0.926)	Data Time 0.001 (0.034)	Loss 3.4952 (3.4806)	Entropy 1.16630 (1.16942)	Top-1 acc 43.359 (41.511)	Top-5 acc 65.234 (65.613)	lr 0.02390
Train [17][570/3239]	Time 0.538 (0.924)	Data Time 0.003 (0.033)	Loss 3.3752 (3.4799)	Entropy 1.16650 (1.16937)	Top-1 acc 44.141 (41.531)	Top-5 acc 67.969 (65.626)	lr 0.02390
Train [17][580/3239]	Time 0.573 (0.922)	Data Time 0.001 (0.033)	Loss 3.6087 (3.4811)	Entropy 1.16627 (1.16932)	Top-1 acc 39.844 (41.504)	Top-5 acc 61.328 (65.597)	lr 0.02390
Train [17][590/3239]	Time 0.564 (0.921)	Data Time 0.001 (0.032)	Loss 3.5505 (3.4811)	Entropy 1.16615 (1.16926)	Top-1 acc 37.109 (41.500)	Top-5 acc 66.016 (65.596)	lr 0.02389
Train [17][600/3239]	Time 0.567 (0.920)	Data Time 0.001 (0.032)	Loss 3.5213 (3.4810)	Entropy 1.16616 (1.16921)	Top-1 acc 38.672 (41.500)	Top-5 acc 65.234 (65.609)	lr 0.02389
Train [17][610/3239]	Time 0.594 (0.919)	Data Time 0.001 (0.031)	Loss 3.5816 (3.4813)	Entropy 1.16592 (1.16916)	Top-1 acc 39.453 (41.508)	Top-5 acc 63.281 (65.602)	lr 0.02389
Train [17][620/3239]	Time 0.577 (0.917)	Data Time 0.001 (0.031)	Loss 3.5068 (3.4820)	Entropy 1.16589 (1.16911)	Top-1 acc 45.312 (41.503)	Top-5 acc 64.062 (65.568)	lr 0.02389
Train [17][630/3239]	Time 0.657 (0.916)	Data Time 0.001 (0.030)	Loss 3.4629 (3.4830)	Entropy 1.16521 (1.16905)	Top-1 acc 40.234 (41.481)	Top-5 acc 66.016 (65.528)	lr 0.02389
Train [17][640/3239]	Time 0.602 (0.916)	Data Time 0.001 (0.030)	Loss 3.4003 (3.4831)	Entropy 1.16534 (1.16899)	Top-1 acc 40.625 (41.473)	Top-5 acc 67.188 (65.524)	lr 0.02389
Train [17][650/3239]	Time 0.587 (0.915)	Data Time 0.001 (0.029)	Loss 3.4410 (3.4821)	Entropy 1.16528 (1.16894)	Top-1 acc 40.234 (41.492)	Top-5 acc 64.453 (65.537)	lr 0.02389
Train [17][660/3239]	Time 0.591 (0.914)	Data Time 0.001 (0.029)	Loss 3.5528 (3.4826)	Entropy 1.16548 (1.16888)	Top-1 acc 42.578 (41.488)	Top-5 acc 66.797 (65.544)	lr 0.02389
Train [17][670/3239]	Time 0.575 (0.913)	Data Time 0.001 (0.029)	Loss 3.7622 (3.4834)	Entropy 1.16567 (1.16883)	Top-1 acc 35.547 (41.470)	Top-5 acc 58.984 (65.518)	lr 0.02389
Train [17][680/3239]	Time 0.595 (0.912)	Data Time 0.001 (0.028)	Loss 3.3661 (3.4835)	Entropy 1.16529 (1.16879)	Top-1 acc 41.797 (41.460)	Top-5 acc 66.016 (65.509)	lr 0.02389
Train [17][690/3239]	Time 0.694 (0.911)	Data Time 0.001 (0.028)	Loss 3.5374 (3.4848)	Entropy 1.16489 (1.16873)	Top-1 acc 39.062 (41.424)	Top-5 acc 64.844 (65.476)	lr 0.02389
Train [17][700/3239]	Time 0.592 (0.910)	Data Time 0.001 (0.028)	Loss 3.5462 (3.4857)	Entropy 1.16460 (1.16868)	Top-1 acc 37.891 (41.387)	Top-5 acc 63.672 (65.458)	lr 0.02389
Train [17][710/3239]	Time 0.602 (0.909)	Data Time 0.001 (0.027)	Loss 3.5416 (3.4846)	Entropy 1.16449 (1.16862)	Top-1 acc 41.797 (41.414)	Top-5 acc 64.844 (65.482)	lr 0.02389
Train [17][720/3239]	Time 0.584 (0.909)	Data Time 0.001 (0.027)	Loss 3.5172 (3.4842)	Entropy 1.16420 (1.16856)	Top-1 acc 39.062 (41.410)	Top-5 acc 60.156 (65.478)	lr 0.02389
Train [17][730/3239]	Time 0.568 (0.908)	Data Time 0.001 (0.026)	Loss 3.6360 (3.4837)	Entropy 1.16444 (1.16850)	Top-1 acc 37.891 (41.420)	Top-5 acc 61.328 (65.493)	lr 0.02389
Train [17][740/3239]	Time 0.666 (0.907)	Data Time 0.001 (0.026)	Loss 3.3754 (3.4834)	Entropy 1.16430 (1.16845)	Top-1 acc 42.578 (41.423)	Top-5 acc 67.578 (65.507)	lr 0.02389
Train [17][750/3239]	Time 0.578 (0.906)	Data Time 0.001 (0.026)	Loss 3.5736 (3.4827)	Entropy 1.16385 (1.16839)	Top-1 acc 41.016 (41.435)	Top-5 acc 63.672 (65.517)	lr 0.02389
Train [17][760/3239]	Time 0.725 (0.905)	Data Time 0.001 (0.026)	Loss 3.3601 (3.4820)	Entropy 1.16318 (1.16833)	Top-1 acc 44.922 (41.443)	Top-5 acc 66.406 (65.528)	lr 0.02389
Train [17][770/3239]	Time 0.569 (0.904)	Data Time 0.001 (0.025)	Loss 3.5322 (3.4828)	Entropy 1.16300 (1.16826)	Top-1 acc 39.844 (41.435)	Top-5 acc 68.359 (65.522)	lr 0.02389
Train [17][780/3239]	Time 0.579 (0.903)	Data Time 0.001 (0.025)	Loss 3.4526 (3.4831)	Entropy 1.16259 (1.16819)	Top-1 acc 39.844 (41.422)	Top-5 acc 65.234 (65.524)	lr 0.02389
Train [17][790/3239]	Time 0.594 (0.902)	Data Time 0.001 (0.025)	Loss 3.4343 (3.4844)	Entropy 1.16265 (1.16812)	Top-1 acc 43.359 (41.386)	Top-5 acc 65.625 (65.505)	lr 0.02389
Train [17][800/3239]	Time 0.602 (0.902)	Data Time 0.001 (0.024)	Loss 3.5394 (3.4835)	Entropy 1.16263 (1.16805)	Top-1 acc 39.062 (41.387)	Top-5 acc 62.109 (65.526)	lr 0.02389
Train [17][810/3239]	Time 0.566 (0.901)	Data Time 0.001 (0.024)	Loss 3.5066 (3.4832)	Entropy 1.16268 (1.16799)	Top-1 acc 38.281 (41.393)	Top-5 acc 66.797 (65.533)	lr 0.02389
Train [17][820/3239]	Time 0.613 (0.901)	Data Time 0.001 (0.024)	Loss 3.4284 (3.4829)	Entropy 1.16251 (1.16792)	Top-1 acc 42.578 (41.388)	Top-5 acc 67.969 (65.538)	lr 0.02389
Train [17][830/3239]	Time 0.602 (0.900)	Data Time 0.001 (0.024)	Loss 3.3994 (3.4823)	Entropy 1.16240 (1.16786)	Top-1 acc 46.484 (41.407)	Top-5 acc 68.750 (65.547)	lr 0.02388
Train [17][840/3239]	Time 0.579 (0.900)	Data Time 0.001 (0.023)	Loss 3.6225 (3.4826)	Entropy 1.16125 (1.16779)	Top-1 acc 36.719 (41.391)	Top-5 acc 62.500 (65.541)	lr 0.02388
Train [17][850/3239]	Time 0.680 (0.899)	Data Time 0.001 (0.023)	Loss 3.4479 (3.4828)	Entropy 1.16086 (1.16771)	Top-1 acc 41.016 (41.387)	Top-5 acc 69.531 (65.535)	lr 0.02388
Train [17][860/3239]	Time 0.591 (0.899)	Data Time 0.001 (0.023)	Loss 3.4176 (3.4833)	Entropy 1.16079 (1.16763)	Top-1 acc 44.141 (41.389)	Top-5 acc 65.234 (65.524)	lr 0.02388
Train [17][870/3239]	Time 0.590 (0.898)	Data Time 0.001 (0.023)	Loss 3.4876 (3.4832)	Entropy 1.16012 (1.16755)	Top-1 acc 41.406 (41.398)	Top-5 acc 66.406 (65.529)	lr 0.02388
Train [17][880/3239]	Time 0.619 (0.898)	Data Time 0.001 (0.022)	Loss 3.7096 (3.4836)	Entropy 1.15994 (1.16746)	Top-1 acc 39.062 (41.393)	Top-5 acc 59.375 (65.523)	lr 0.02388
Train [17][890/3239]	Time 0.582 (0.897)	Data Time 0.001 (0.022)	Loss 3.5301 (3.4833)	Entropy 1.15995 (1.16737)	Top-1 acc 38.672 (41.398)	Top-5 acc 62.500 (65.537)	lr 0.02388
Train [17][900/3239]	Time 0.583 (0.897)	Data Time 0.001 (0.022)	Loss 3.6820 (3.4836)	Entropy 1.15992 (1.16729)	Top-1 acc 36.328 (41.391)	Top-5 acc 62.891 (65.539)	lr 0.02388
Train [17][910/3239]	Time 0.620 (0.896)	Data Time 0.001 (0.022)	Loss 3.5943 (3.4842)	Entropy 1.15966 (1.16721)	Top-1 acc 36.328 (41.377)	Top-5 acc 63.281 (65.516)	lr 0.02388
Train [17][920/3239]	Time 0.662 (0.895)	Data Time 0.001 (0.021)	Loss 3.4315 (3.4840)	Entropy 1.15964 (1.16713)	Top-1 acc 41.797 (41.368)	Top-5 acc 66.016 (65.517)	lr 0.02388
Train [17][930/3239]	Time 0.620 (0.894)	Data Time 0.001 (0.021)	Loss 3.5432 (3.4845)	Entropy 1.15933 (1.16705)	Top-1 acc 37.891 (41.356)	Top-5 acc 64.453 (65.503)	lr 0.02388
Train [17][940/3239]	Time 0.604 (0.894)	Data Time 0.001 (0.021)	Loss 3.5469 (3.4848)	Entropy 1.15914 (1.16696)	Top-1 acc 40.625 (41.344)	Top-5 acc 65.625 (65.495)	lr 0.02388
Train [17][950/3239]	Time 0.605 (0.894)	Data Time 0.001 (0.021)	Loss 3.4731 (3.4845)	Entropy 1.15892 (1.16688)	Top-1 acc 44.531 (41.352)	Top-5 acc 62.500 (65.496)	lr 0.02388
Train [17][960/3239]	Time 0.561 (0.893)	Data Time 0.001 (0.021)	Loss 3.3781 (3.4840)	Entropy 1.15864 (1.16680)	Top-1 acc 42.969 (41.361)	Top-5 acc 66.016 (65.505)	lr 0.02388
Train [17][970/3239]	Time 0.623 (0.893)	Data Time 0.001 (0.020)	Loss 3.3730 (3.4835)	Entropy 1.15803 (1.16671)	Top-1 acc 44.141 (41.376)	Top-5 acc 70.703 (65.526)	lr 0.02388
Train [17][980/3239]	Time 0.637 (0.892)	Data Time 0.001 (0.020)	Loss 3.8284 (3.4847)	Entropy 1.15827 (1.16662)	Top-1 acc 36.328 (41.350)	Top-5 acc 58.594 (65.494)	lr 0.02388
Train [17][990/3239]	Time 0.693 (0.892)	Data Time 0.001 (0.020)	Loss 3.5517 (3.4853)	Entropy 1.15812 (1.16654)	Top-1 acc 41.797 (41.340)	Top-5 acc 64.453 (65.483)	lr 0.02388
Train [17][1000/3239]	Time 0.600 (0.892)	Data Time 0.001 (0.020)	Loss 3.5008 (3.4855)	Entropy 1.15770 (1.16645)	Top-1 acc 40.625 (41.326)	Top-5 acc 63.672 (65.480)	lr 0.02388
Train [17][1010/3239]	Time 0.619 (0.891)	Data Time 0.001 (0.020)	Loss 3.4708 (3.4860)	Entropy 1.15760 (1.16636)	Top-1 acc 39.844 (41.314)	Top-5 acc 65.625 (65.462)	lr 0.02388
Train [17][1020/3239]	Time 0.581 (0.891)	Data Time 0.001 (0.019)	Loss 3.2507 (3.4849)	Entropy 1.15764 (1.16628)	Top-1 acc 46.094 (41.332)	Top-5 acc 69.141 (65.481)	lr 0.02388
Train [17][1030/3239]	Time 0.601 (0.890)	Data Time 0.001 (0.019)	Loss 3.3886 (3.4843)	Entropy 1.15721 (1.16619)	Top-1 acc 45.703 (41.349)	Top-5 acc 70.312 (65.496)	lr 0.02388
Train [17][1040/3239]	Time 0.587 (0.890)	Data Time 0.001 (0.019)	Loss 3.3173 (3.4842)	Entropy 1.15697 (1.16611)	Top-1 acc 40.234 (41.345)	Top-5 acc 69.141 (65.494)	lr 0.02388
Train [17][1050/3239]	Time 0.593 (0.889)	Data Time 0.001 (0.019)	Loss 3.5793 (3.4848)	Entropy 1.15697 (1.16602)	Top-1 acc 40.625 (41.333)	Top-5 acc 64.062 (65.483)	lr 0.02388
Train [17][1060/3239]	Time 0.552 (0.889)	Data Time 0.001 (0.019)	Loss 3.3544 (3.4855)	Entropy 1.15672 (1.16593)	Top-1 acc 42.969 (41.312)	Top-5 acc 69.531 (65.474)	lr 0.02388
Train [17][1070/3239]	Time 0.582 (0.888)	Data Time 0.001 (0.019)	Loss 3.5764 (3.4859)	Entropy 1.15667 (1.16585)	Top-1 acc 38.281 (41.307)	Top-5 acc 62.891 (65.467)	lr 0.02387
Train [17][1080/3239]	Time 0.690 (0.888)	Data Time 0.001 (0.019)	Loss 3.5867 (3.4857)	Entropy 1.15635 (1.16576)	Top-1 acc 40.234 (41.307)	Top-5 acc 62.500 (65.466)	lr 0.02387
Train [17][1090/3239]	Time 0.441 (0.887)	Data Time 0.001 (0.018)	Loss 3.5469 (3.4855)	Entropy 1.15612 (1.16567)	Top-1 acc 39.453 (41.321)	Top-5 acc 62.109 (65.463)	lr 0.02387
Train [17][1100/3239]	Time 0.559 (0.886)	Data Time 0.001 (0.018)	Loss 3.7617 (3.4860)	Entropy 1.15565 (1.16559)	Top-1 acc 38.281 (41.306)	Top-5 acc 61.328 (65.446)	lr 0.02387
Train [17][1110/3239]	Time 0.574 (0.886)	Data Time 0.001 (0.018)	Loss 3.4334 (3.4854)	Entropy 1.15562 (1.16550)	Top-1 acc 42.188 (41.310)	Top-5 acc 67.188 (65.456)	lr 0.02387
Train [17][1120/3239]	Time 0.591 (0.886)	Data Time 0.001 (0.018)	Loss 3.3852 (3.4857)	Entropy 1.15580 (1.16541)	Top-1 acc 42.188 (41.304)	Top-5 acc 66.797 (65.446)	lr 0.02387
Train [17][1130/3239]	Time 0.570 (0.885)	Data Time 0.001 (0.018)	Loss 3.3216 (3.4857)	Entropy 1.15566 (1.16532)	Top-1 acc 49.609 (41.315)	Top-5 acc 69.531 (65.445)	lr 0.02387
Train [17][1140/3239]	Time 0.554 (0.885)	Data Time 0.001 (0.018)	Loss 3.5978 (3.4858)	Entropy 1.15570 (1.16524)	Top-1 acc 35.938 (41.315)	Top-5 acc 62.109 (65.446)	lr 0.02387
Train [17][1150/3239]	Time 0.717 (0.885)	Data Time 0.001 (0.018)	Loss 3.1658 (3.4855)	Entropy 1.15583 (1.16516)	Top-1 acc 48.438 (41.323)	Top-5 acc 72.656 (65.457)	lr 0.02387
Train [17][1160/3239]	Time 0.561 (0.885)	Data Time 0.001 (0.017)	Loss 3.6536 (3.4857)	Entropy 1.15521 (1.16507)	Top-1 acc 37.109 (41.314)	Top-5 acc 61.328 (65.458)	lr 0.02387
Train [17][1170/3239]	Time 0.618 (0.884)	Data Time 0.001 (0.017)	Loss 3.4625 (3.4854)	Entropy 1.15500 (1.16499)	Top-1 acc 42.188 (41.321)	Top-5 acc 66.406 (65.459)	lr 0.02387
Train [17][1180/3239]	Time 0.593 (0.884)	Data Time 0.001 (0.017)	Loss 3.7075 (3.4858)	Entropy 1.15527 (1.16491)	Top-1 acc 39.453 (41.310)	Top-5 acc 60.156 (65.455)	lr 0.02387
Train [17][1190/3239]	Time 0.590 (0.901)	Data Time 0.002 (0.017)	Loss 3.7169 (3.4854)	Entropy 1.15474 (1.16482)	Top-1 acc 34.375 (41.317)	Top-5 acc 62.109 (65.457)	lr 0.02387
Train [17][1200/3239]	Time 0.570 (0.901)	Data Time 0.002 (0.017)	Loss 3.5523 (3.4855)	Entropy 1.15476 (1.16474)	Top-1 acc 39.844 (41.313)	Top-5 acc 61.719 (65.459)	lr 0.02387
Train [17][1210/3239]	Time 0.572 (0.900)	Data Time 0.001 (0.017)	Loss 3.5890 (3.4855)	Entropy 1.15460 (1.16466)	Top-1 acc 38.672 (41.316)	Top-5 acc 65.234 (65.466)	lr 0.02387
Train [17][1220/3239]	Time 0.621 (0.900)	Data Time 0.001 (0.017)	Loss 3.5536 (3.4859)	Entropy 1.15448 (1.16458)	Top-1 acc 37.109 (41.306)	Top-5 acc 64.062 (65.466)	lr 0.02387
Train [17][1230/3239]	Time 0.590 (0.899)	Data Time 0.001 (0.017)	Loss 3.4187 (3.4857)	Entropy 1.15450 (1.16449)	Top-1 acc 42.188 (41.312)	Top-5 acc 68.750 (65.476)	lr 0.02387
Train [17][1240/3239]	Time 0.665 (0.899)	Data Time 0.001 (0.016)	Loss 3.5365 (3.4856)	Entropy 1.15442 (1.16441)	Top-1 acc 38.672 (41.317)	Top-5 acc 66.406 (65.476)	lr 0.02387
Train [17][1250/3239]	Time 0.551 (0.898)	Data Time 0.001 (0.016)	Loss 3.2858 (3.4852)	Entropy 1.15392 (1.16433)	Top-1 acc 47.656 (41.327)	Top-5 acc 71.094 (65.483)	lr 0.02387
Train [17][1260/3239]	Time 0.643 (0.898)	Data Time 0.001 (0.016)	Loss 3.4641 (3.4847)	Entropy 1.15368 (1.16425)	Top-1 acc 42.969 (41.343)	Top-5 acc 67.188 (65.492)	lr 0.02387
Train [17][1270/3239]	Time 0.520 (0.898)	Data Time 0.001 (0.016)	Loss 3.7486 (3.4849)	Entropy 1.15339 (1.16416)	Top-1 acc 39.062 (41.342)	Top-5 acc 60.547 (65.491)	lr 0.02387
Train [17][1280/3239]	Time 0.610 (0.897)	Data Time 0.001 (0.016)	Loss 3.6844 (3.4853)	Entropy 1.15364 (1.16408)	Top-1 acc 37.109 (41.327)	Top-5 acc 60.938 (65.480)	lr 0.02387
Train [17][1290/3239]	Time 0.594 (0.897)	Data Time 0.001 (0.016)	Loss 3.3211 (3.4850)	Entropy 1.15338 (1.16400)	Top-1 acc 44.922 (41.333)	Top-5 acc 68.750 (65.490)	lr 0.02387
Train [17][1300/3239]	Time 0.581 (0.897)	Data Time 0.001 (0.016)	Loss 3.3473 (3.4849)	Entropy 1.15335 (1.16392)	Top-1 acc 44.141 (41.338)	Top-5 acc 72.266 (65.506)	lr 0.02387
Train [17][1310/3239]	Time 0.716 (0.896)	Data Time 0.001 (0.016)	Loss 3.6519 (3.4847)	Entropy 1.15357 (1.16384)	Top-1 acc 38.281 (41.342)	Top-5 acc 63.281 (65.513)	lr 0.02386
Train [17][1320/3239]	Time 0.580 (0.896)	Data Time 0.001 (0.016)	Loss 3.5301 (3.4852)	Entropy 1.15283 (1.16376)	Top-1 acc 38.281 (41.330)	Top-5 acc 64.062 (65.501)	lr 0.02386
Train [17][1330/3239]	Time 0.588 (0.896)	Data Time 0.001 (0.015)	Loss 3.5171 (3.4847)	Entropy 1.15290 (1.16367)	Top-1 acc 39.844 (41.340)	Top-5 acc 64.453 (65.510)	lr 0.02386
Train [17][1340/3239]	Time 0.613 (0.895)	Data Time 0.001 (0.015)	Loss 3.6926 (3.4849)	Entropy 1.15256 (1.16359)	Top-1 acc 35.156 (41.332)	Top-5 acc 63.281 (65.504)	lr 0.02386
Train [17][1350/3239]	Time 0.592 (0.895)	Data Time 0.001 (0.015)	Loss 3.6042 (3.4854)	Entropy 1.15203 (1.16351)	Top-1 acc 38.672 (41.326)	Top-5 acc 62.500 (65.485)	lr 0.02386
Train [17][1360/3239]	Time 0.620 (0.895)	Data Time 0.001 (0.015)	Loss 3.3461 (3.4850)	Entropy 1.15182 (1.16342)	Top-1 acc 44.141 (41.338)	Top-5 acc 68.359 (65.487)	lr 0.02386
Train [17][1370/3239]	Time 0.598 (0.894)	Data Time 0.002 (0.015)	Loss 3.6730 (3.4848)	Entropy 1.15178 (1.16334)	Top-1 acc 38.672 (41.344)	Top-5 acc 60.547 (65.490)	lr 0.02386
Train [17][1380/3239]	Time 0.628 (0.894)	Data Time 0.001 (0.015)	Loss 3.6295 (3.4852)	Entropy 1.15164 (1.16325)	Top-1 acc 43.359 (41.336)	Top-5 acc 66.016 (65.484)	lr 0.02386
Train [17][1390/3239]	Time 0.613 (0.894)	Data Time 0.003 (0.015)	Loss 3.4568 (3.4854)	Entropy 1.15150 (1.16317)	Top-1 acc 40.234 (41.331)	Top-5 acc 64.844 (65.484)	lr 0.02386
Train [17][1400/3239]	Time 0.581 (0.893)	Data Time 0.004 (0.015)	Loss 3.7640 (3.4856)	Entropy 1.15115 (1.16309)	Top-1 acc 36.719 (41.330)	Top-5 acc 58.984 (65.478)	lr 0.02386
Train [17][1410/3239]	Time 0.438 (0.892)	Data Time 0.001 (0.015)	Loss 3.6592 (3.4857)	Entropy 1.15078 (1.16300)	Top-1 acc 38.672 (41.333)	Top-5 acc 61.719 (65.474)	lr 0.02386
Train [17][1420/3239]	Time 0.592 (0.892)	Data Time 0.001 (0.015)	Loss 3.3337 (3.4857)	Entropy 1.15042 (1.16291)	Top-1 acc 46.484 (41.331)	Top-5 acc 69.531 (65.475)	lr 0.02386
Train [17][1430/3239]	Time 0.616 (0.892)	Data Time 0.002 (0.015)	Loss 3.4924 (3.4858)	Entropy 1.15061 (1.16283)	Top-1 acc 38.672 (41.325)	Top-5 acc 64.844 (65.474)	lr 0.02386
Train [17][1440/3239]	Time 0.593 (0.892)	Data Time 0.001 (0.014)	Loss 3.4307 (3.4853)	Entropy 1.15052 (1.16274)	Top-1 acc 42.578 (41.333)	Top-5 acc 65.625 (65.479)	lr 0.02386
Train [17][1450/3239]	Time 0.628 (0.891)	Data Time 0.001 (0.014)	Loss 3.7080 (3.4856)	Entropy 1.15057 (1.16266)	Top-1 acc 36.328 (41.326)	Top-5 acc 58.203 (65.474)	lr 0.02386
Train [17][1460/3239]	Time 0.612 (0.891)	Data Time 0.001 (0.014)	Loss 3.4993 (3.4856)	Entropy 1.15029 (1.16257)	Top-1 acc 41.016 (41.325)	Top-5 acc 65.625 (65.476)	lr 0.02386
Train [17][1470/3239]	Time 0.702 (0.891)	Data Time 0.001 (0.014)	Loss 3.3532 (3.4852)	Entropy 1.15030 (1.16249)	Top-1 acc 43.750 (41.327)	Top-5 acc 70.703 (65.485)	lr 0.02386
Train [17][1480/3239]	Time 0.604 (0.891)	Data Time 0.001 (0.014)	Loss 3.4208 (3.4849)	Entropy 1.14994 (1.16241)	Top-1 acc 46.484 (41.344)	Top-5 acc 64.844 (65.492)	lr 0.02386
Train [17][1490/3239]	Time 0.593 (0.891)	Data Time 0.001 (0.014)	Loss 3.4675 (3.4846)	Entropy 1.15032 (1.16233)	Top-1 acc 38.281 (41.345)	Top-5 acc 60.938 (65.495)	lr 0.02386
Train [17][1500/3239]	Time 0.589 (0.890)	Data Time 0.001 (0.014)	Loss 3.5810 (3.4843)	Entropy 1.14974 (1.16224)	Top-1 acc 39.844 (41.352)	Top-5 acc 60.547 (65.502)	lr 0.02386
Train [17][1510/3239]	Time 0.581 (0.890)	Data Time 0.001 (0.014)	Loss 3.4727 (3.4842)	Entropy 1.15002 (1.16216)	Top-1 acc 40.625 (41.357)	Top-5 acc 65.234 (65.506)	lr 0.02386
Train [17][1520/3239]	Time 0.599 (0.890)	Data Time 0.001 (0.014)	Loss 3.5396 (3.4844)	Entropy 1.14954 (1.16208)	Top-1 acc 38.672 (41.346)	Top-5 acc 65.234 (65.505)	lr 0.02386
Train [17][1530/3239]	Time 0.632 (0.890)	Data Time 0.001 (0.014)	Loss 3.3612 (3.4848)	Entropy 1.14928 (1.16200)	Top-1 acc 41.797 (41.334)	Top-5 acc 66.797 (65.501)	lr 0.02386
Train [17][1540/3239]	Time 0.677 (0.889)	Data Time 0.001 (0.014)	Loss 3.3561 (3.4848)	Entropy 1.14883 (1.16192)	Top-1 acc 39.844 (41.330)	Top-5 acc 71.875 (65.506)	lr 0.02386
Train [17][1550/3239]	Time 0.581 (0.889)	Data Time 0.001 (0.014)	Loss 3.5428 (3.4847)	Entropy 1.14857 (1.16183)	Top-1 acc 39.453 (41.328)	Top-5 acc 62.500 (65.502)	lr 0.02385
Train [17][1560/3239]	Time 0.574 (0.889)	Data Time 0.001 (0.013)	Loss 3.8781 (3.4846)	Entropy 1.14872 (1.16175)	Top-1 acc 32.031 (41.327)	Top-5 acc 61.328 (65.508)	lr 0.02385
Train [17][1570/3239]	Time 0.571 (0.888)	Data Time 0.001 (0.013)	Loss 3.1343 (3.4843)	Entropy 1.14848 (1.16166)	Top-1 acc 48.047 (41.333)	Top-5 acc 72.656 (65.512)	lr 0.02385
Train [17][1580/3239]	Time 0.570 (0.888)	Data Time 0.001 (0.013)	Loss 3.4613 (3.4841)	Entropy 1.14771 (1.16158)	Top-1 acc 41.797 (41.339)	Top-5 acc 66.016 (65.516)	lr 0.02385
Train [17][1590/3239]	Time 0.601 (0.888)	Data Time 0.001 (0.013)	Loss 3.3911 (3.4838)	Entropy 1.14826 (1.16149)	Top-1 acc 44.531 (41.347)	Top-5 acc 69.141 (65.515)	lr 0.02385
Train [17][1600/3239]	Time 0.552 (0.887)	Data Time 0.001 (0.013)	Loss 3.5172 (3.4838)	Entropy 1.14800 (1.16141)	Top-1 acc 46.875 (41.351)	Top-5 acc 65.625 (65.515)	lr 0.02385
Train [17][1610/3239]	Time 0.600 (0.887)	Data Time 0.001 (0.013)	Loss 3.5354 (3.4836)	Entropy 1.14783 (1.16133)	Top-1 acc 40.625 (41.358)	Top-5 acc 67.188 (65.521)	lr 0.02385
Train [17][1620/3239]	Time 0.609 (0.887)	Data Time 0.001 (0.013)	Loss 3.3338 (3.4837)	Entropy 1.14789 (1.16124)	Top-1 acc 44.922 (41.359)	Top-5 acc 70.703 (65.520)	lr 0.02385
Train [17][1630/3239]	Time 0.610 (0.887)	Data Time 0.001 (0.013)	Loss 3.5655 (3.4838)	Entropy 1.14749 (1.16116)	Top-1 acc 36.719 (41.356)	Top-5 acc 64.062 (65.520)	lr 0.02385
Train [17][1640/3239]	Time 0.583 (0.886)	Data Time 0.001 (0.013)	Loss 3.7239 (3.4843)	Entropy 1.14722 (1.16108)	Top-1 acc 37.891 (41.343)	Top-5 acc 59.766 (65.515)	lr 0.02385
Train [17][1650/3239]	Time 0.618 (0.886)	Data Time 0.001 (0.013)	Loss 3.4200 (3.4841)	Entropy 1.14712 (1.16099)	Top-1 acc 42.188 (41.346)	Top-5 acc 69.141 (65.522)	lr 0.02385
Train [17][1660/3239]	Time 0.584 (0.886)	Data Time 0.001 (0.013)	Loss 3.5041 (3.4843)	Entropy 1.14689 (1.16091)	Top-1 acc 37.109 (41.342)	Top-5 acc 64.062 (65.517)	lr 0.02385
Train [17][1670/3239]	Time 0.588 (0.886)	Data Time 0.001 (0.013)	Loss 3.7764 (3.4847)	Entropy 1.14640 (1.16082)	Top-1 acc 37.109 (41.339)	Top-5 acc 62.109 (65.508)	lr 0.02385
Train [17][1680/3239]	Time 0.604 (0.886)	Data Time 0.001 (0.013)	Loss 3.5308 (3.4848)	Entropy 1.14609 (1.16074)	Top-1 acc 39.844 (41.333)	Top-5 acc 62.500 (65.503)	lr 0.02385
Train [17][1690/3239]	Time 0.564 (0.885)	Data Time 0.001 (0.013)	Loss 3.3978 (3.4852)	Entropy 1.14594 (1.16065)	Top-1 acc 41.406 (41.322)	Top-5 acc 66.406 (65.494)	lr 0.02385
Train [17][1700/3239]	Time 0.680 (0.885)	Data Time 0.001 (0.013)	Loss 3.6300 (3.4859)	Entropy 1.14611 (1.16056)	Top-1 acc 39.453 (41.310)	Top-5 acc 60.938 (65.472)	lr 0.02385
Train [17][1710/3239]	Time 0.597 (0.885)	Data Time 0.001 (0.012)	Loss 3.7200 (3.4861)	Entropy 1.14608 (1.16048)	Top-1 acc 38.281 (41.306)	Top-5 acc 63.281 (65.475)	lr 0.02385
Train [17][1720/3239]	Time 0.612 (0.885)	Data Time 0.001 (0.012)	Loss 3.4806 (3.4859)	Entropy 1.14606 (1.16040)	Top-1 acc 42.578 (41.309)	Top-5 acc 62.891 (65.477)	lr 0.02385
Train [17][1730/3239]	Time 0.491 (0.884)	Data Time 0.001 (0.012)	Loss 3.7142 (3.4864)	Entropy 1.14588 (1.16031)	Top-1 acc 33.594 (41.305)	Top-5 acc 61.719 (65.469)	lr 0.02385
Train [17][1740/3239]	Time 0.578 (0.884)	Data Time 0.001 (0.012)	Loss 3.5589 (3.4864)	Entropy 1.14565 (1.16023)	Top-1 acc 40.234 (41.306)	Top-5 acc 61.328 (65.461)	lr 0.02385
Train [17][1750/3239]	Time 0.579 (0.884)	Data Time 0.001 (0.012)	Loss 3.5907 (3.4861)	Entropy 1.14544 (1.16014)	Top-1 acc 39.453 (41.316)	Top-5 acc 62.109 (65.467)	lr 0.02385
Train [17][1760/3239]	Time 0.563 (0.883)	Data Time 0.001 (0.012)	Loss 3.5474 (3.4860)	Entropy 1.14516 (1.16006)	Top-1 acc 39.844 (41.321)	Top-5 acc 63.672 (65.466)	lr 0.02385
Train [17][1770/3239]	Time 0.701 (0.883)	Data Time 0.001 (0.012)	Loss 3.6077 (3.4859)	Entropy 1.14454 (1.15998)	Top-1 acc 40.234 (41.329)	Top-5 acc 65.625 (65.477)	lr 0.02385
Train [17][1780/3239]	Time 0.626 (0.883)	Data Time 0.001 (0.012)	Loss 3.5213 (3.4859)	Entropy 1.14459 (1.15989)	Top-1 acc 42.578 (41.330)	Top-5 acc 65.625 (65.474)	lr 0.02385
Train [17][1790/3239]	Time 0.613 (0.883)	Data Time 0.001 (0.012)	Loss 3.4124 (3.4862)	Entropy 1.14445 (1.15980)	Top-1 acc 40.234 (41.327)	Top-5 acc 67.969 (65.464)	lr 0.02384
Train [17][1800/3239]	Time 0.562 (0.883)	Data Time 0.001 (0.012)	Loss 3.5041 (3.4861)	Entropy 1.14427 (1.15972)	Top-1 acc 41.797 (41.322)	Top-5 acc 65.625 (65.462)	lr 0.02384
Train [17][1810/3239]	Time 0.581 (0.883)	Data Time 0.001 (0.012)	Loss 3.7007 (3.4863)	Entropy 1.14359 (1.15963)	Top-1 acc 34.375 (41.317)	Top-5 acc 61.328 (65.458)	lr 0.02384
Train [17][1820/3239]	Time 0.598 (0.882)	Data Time 0.001 (0.012)	Loss 3.4977 (3.4866)	Entropy 1.14378 (1.15954)	Top-1 acc 43.359 (41.313)	Top-5 acc 65.625 (65.451)	lr 0.02384
Train [17][1830/3239]	Time 0.633 (0.882)	Data Time 0.001 (0.012)	Loss 3.5167 (3.4865)	Entropy 1.14354 (1.15946)	Top-1 acc 41.406 (41.316)	Top-5 acc 64.062 (65.450)	lr 0.02384
Train [17][1840/3239]	Time 0.675 (0.893)	Data Time 0.003 (0.012)	Loss 3.3308 (3.4863)	Entropy 1.14322 (1.15937)	Top-1 acc 43.750 (41.312)	Top-5 acc 70.312 (65.458)	lr 0.02384
Train [17][1850/3239]	Time 0.618 (0.893)	Data Time 0.002 (0.012)	Loss 3.3841 (3.4858)	Entropy 1.14283 (1.15928)	Top-1 acc 44.531 (41.316)	Top-5 acc 68.359 (65.469)	lr 0.02384
Train [17][1860/3239]	Time 0.587 (0.893)	Data Time 0.001 (0.012)	Loss 3.2052 (3.4853)	Entropy 1.14237 (1.15919)	Top-1 acc 44.141 (41.324)	Top-5 acc 70.703 (65.482)	lr 0.02384
Train [17][1870/3239]	Time 0.606 (0.893)	Data Time 0.001 (0.012)	Loss 3.5436 (3.4848)	Entropy 1.14237 (1.15910)	Top-1 acc 37.500 (41.331)	Top-5 acc 64.062 (65.491)	lr 0.02384
Train [17][1880/3239]	Time 0.599 (0.893)	Data Time 0.001 (0.012)	Loss 3.5654 (3.4848)	Entropy 1.14218 (1.15901)	Top-1 acc 39.453 (41.333)	Top-5 acc 64.062 (65.489)	lr 0.02384
Train [17][1890/3239]	Time 0.591 (0.892)	Data Time 0.001 (0.011)	Loss 3.5484 (3.4849)	Entropy 1.14239 (1.15893)	Top-1 acc 41.797 (41.332)	Top-5 acc 64.844 (65.487)	lr 0.02384
Train [17][1900/3239]	Time 0.635 (0.892)	Data Time 0.001 (0.011)	Loss 3.4465 (3.4847)	Entropy 1.14186 (1.15884)	Top-1 acc 44.141 (41.333)	Top-5 acc 64.453 (65.488)	lr 0.02384
Train [17][1910/3239]	Time 0.612 (0.892)	Data Time 0.001 (0.011)	Loss 3.4703 (3.4846)	Entropy 1.14176 (1.15875)	Top-1 acc 43.750 (41.332)	Top-5 acc 64.062 (65.489)	lr 0.02384
Train [17][1920/3239]	Time 0.562 (0.892)	Data Time 0.001 (0.011)	Loss 3.5433 (3.4848)	Entropy 1.14139 (1.15866)	Top-1 acc 38.672 (41.326)	Top-5 acc 64.062 (65.486)	lr 0.02384
Train [17][1930/3239]	Time 0.712 (0.891)	Data Time 0.002 (0.011)	Loss 3.6749 (3.4849)	Entropy 1.14124 (1.15857)	Top-1 acc 40.625 (41.322)	Top-5 acc 63.672 (65.485)	lr 0.02384
Train [17][1940/3239]	Time 0.634 (0.891)	Data Time 0.001 (0.011)	Loss 3.4705 (3.4850)	Entropy 1.14130 (1.15848)	Top-1 acc 41.016 (41.320)	Top-5 acc 64.062 (65.478)	lr 0.02384
Train [17][1950/3239]	Time 0.599 (0.891)	Data Time 0.002 (0.011)	Loss 3.5070 (3.4846)	Entropy 1.14139 (1.15839)	Top-1 acc 38.281 (41.329)	Top-5 acc 64.453 (65.485)	lr 0.02384
Train [17][1960/3239]	Time 0.584 (0.891)	Data Time 0.001 (0.011)	Loss 3.3043 (3.4846)	Entropy 1.14131 (1.15831)	Top-1 acc 50.000 (41.335)	Top-5 acc 73.047 (65.488)	lr 0.02384
Train [17][1970/3239]	Time 0.602 (0.891)	Data Time 0.001 (0.011)	Loss 3.6163 (3.4842)	Entropy 1.14102 (1.15822)	Top-1 acc 38.281 (41.344)	Top-5 acc 65.625 (65.497)	lr 0.02384
Train [17][1980/3239]	Time 0.565 (0.891)	Data Time 0.001 (0.011)	Loss 3.5513 (3.4840)	Entropy 1.14072 (1.15813)	Top-1 acc 41.797 (41.347)	Top-5 acc 59.766 (65.502)	lr 0.02384
Train [17][1990/3239]	Time 0.586 (0.890)	Data Time 0.001 (0.011)	Loss 3.4309 (3.4842)	Entropy 1.14055 (1.15804)	Top-1 acc 39.062 (41.345)	Top-5 acc 67.188 (65.497)	lr 0.02384
Train [17][2000/3239]	Time 0.667 (0.890)	Data Time 0.001 (0.011)	Loss 3.5461 (3.4841)	Entropy 1.14026 (1.15796)	Top-1 acc 41.016 (41.345)	Top-5 acc 63.672 (65.501)	lr 0.02384
Train [17][2010/3239]	Time 0.622 (0.890)	Data Time 0.001 (0.011)	Loss 3.3634 (3.4841)	Entropy 1.13997 (1.15787)	Top-1 acc 40.234 (41.346)	Top-5 acc 66.797 (65.503)	lr 0.02384
Train [17][2020/3239]	Time 0.574 (0.890)	Data Time 0.001 (0.011)	Loss 3.5381 (3.4837)	Entropy 1.13987 (1.15778)	Top-1 acc 38.281 (41.353)	Top-5 acc 67.188 (65.515)	lr 0.02383
Train [17][2030/3239]	Time 0.590 (0.890)	Data Time 0.001 (0.011)	Loss 3.4096 (3.4835)	Entropy 1.13962 (1.15769)	Top-1 acc 40.625 (41.356)	Top-5 acc 64.062 (65.519)	lr 0.02383
Train [17][2040/3239]	Time 0.612 (0.889)	Data Time 0.002 (0.011)	Loss 3.3868 (3.4833)	Entropy 1.13960 (1.15760)	Top-1 acc 48.047 (41.363)	Top-5 acc 66.797 (65.524)	lr 0.02383
Train [17][2050/3239]	Time 0.536 (0.889)	Data Time 0.001 (0.011)	Loss 3.5377 (3.4837)	Entropy 1.13962 (1.15752)	Top-1 acc 41.406 (41.357)	Top-5 acc 62.500 (65.513)	lr 0.02383
Train [17][2060/3239]	Time 0.414 (0.889)	Data Time 0.001 (0.011)	Loss 3.4983 (3.4838)	Entropy 1.13971 (1.15743)	Top-1 acc 41.016 (41.356)	Top-5 acc 65.234 (65.512)	lr 0.02383
Train [17][2070/3239]	Time 0.548 (0.889)	Data Time 0.001 (0.011)	Loss 3.5615 (3.4835)	Entropy 1.13922 (1.15734)	Top-1 acc 39.844 (41.364)	Top-5 acc 65.625 (65.519)	lr 0.02383
Train [17][2080/3239]	Time 0.618 (0.888)	Data Time 0.001 (0.011)	Loss 3.4796 (3.4836)	Entropy 1.13908 (1.15726)	Top-1 acc 43.750 (41.364)	Top-5 acc 66.016 (65.518)	lr 0.02383
Train [17][2090/3239]	Time 0.748 (0.888)	Data Time 0.001 (0.011)	Loss 3.7252 (3.4840)	Entropy 1.13903 (1.15717)	Top-1 acc 34.375 (41.357)	Top-5 acc 59.766 (65.511)	lr 0.02383
Train [17][2100/3239]	Time 0.582 (0.888)	Data Time 0.001 (0.011)	Loss 3.6460 (3.4841)	Entropy 1.13850 (1.15708)	Top-1 acc 39.062 (41.356)	Top-5 acc 60.547 (65.509)	lr 0.02383
Train [17][2110/3239]	Time 0.626 (0.888)	Data Time 0.001 (0.010)	Loss 3.3490 (3.4839)	Entropy 1.13868 (1.15699)	Top-1 acc 42.188 (41.355)	Top-5 acc 69.141 (65.515)	lr 0.02383
Train [17][2120/3239]	Time 0.589 (0.888)	Data Time 0.001 (0.010)	Loss 3.4318 (3.4840)	Entropy 1.13858 (1.15691)	Top-1 acc 36.328 (41.350)	Top-5 acc 66.797 (65.517)	lr 0.02383
Train [17][2130/3239]	Time 0.586 (0.888)	Data Time 0.001 (0.010)	Loss 3.5763 (3.4841)	Entropy 1.13884 (1.15682)	Top-1 acc 39.453 (41.344)	Top-5 acc 62.891 (65.515)	lr 0.02383
Train [17][2140/3239]	Time 0.600 (0.888)	Data Time 0.002 (0.010)	Loss 3.5372 (3.4843)	Entropy 1.13835 (1.15674)	Top-1 acc 41.406 (41.344)	Top-5 acc 62.500 (65.509)	lr 0.02383
Train [17][2150/3239]	Time 0.624 (0.888)	Data Time 0.001 (0.010)	Loss 3.4286 (3.4847)	Entropy 1.13852 (1.15665)	Top-1 acc 41.406 (41.335)	Top-5 acc 65.234 (65.498)	lr 0.02383
Train [17][2160/3239]	Time 0.692 (0.888)	Data Time 0.001 (0.010)	Loss 3.4097 (3.4845)	Entropy 1.13836 (1.15657)	Top-1 acc 41.406 (41.337)	Top-5 acc 65.625 (65.501)	lr 0.02383
Train [17][2170/3239]	Time 0.610 (0.887)	Data Time 0.001 (0.010)	Loss 3.3895 (3.4842)	Entropy 1.13816 (1.15648)	Top-1 acc 44.141 (41.347)	Top-5 acc 70.312 (65.507)	lr 0.02383
Train [17][2180/3239]	Time 0.606 (0.887)	Data Time 0.001 (0.010)	Loss 3.5951 (3.4845)	Entropy 1.13770 (1.15640)	Top-1 acc 42.578 (41.341)	Top-5 acc 61.328 (65.499)	lr 0.02383
Train [17][2190/3239]	Time 0.622 (0.887)	Data Time 0.001 (0.010)	Loss 3.4797 (3.4845)	Entropy 1.13728 (1.15631)	Top-1 acc 43.359 (41.347)	Top-5 acc 64.453 (65.499)	lr 0.02383
Train [17][2200/3239]	Time 0.612 (0.887)	Data Time 0.001 (0.010)	Loss 3.4826 (3.4844)	Entropy 1.13731 (1.15623)	Top-1 acc 39.453 (41.347)	Top-5 acc 64.453 (65.502)	lr 0.02383
Train [17][2210/3239]	Time 0.625 (0.887)	Data Time 0.001 (0.010)	Loss 3.5990 (3.4845)	Entropy 1.13676 (1.15614)	Top-1 acc 37.109 (41.342)	Top-5 acc 63.281 (65.492)	lr 0.02383
Train [17][2220/3239]	Time 0.657 (0.887)	Data Time 0.001 (0.010)	Loss 3.3866 (3.4844)	Entropy 1.13652 (1.15605)	Top-1 acc 42.188 (41.345)	Top-5 acc 67.578 (65.492)	lr 0.02383
Train [17][2230/3239]	Time 0.585 (0.886)	Data Time 0.001 (0.010)	Loss 3.6373 (3.4844)	Entropy 1.13634 (1.15596)	Top-1 acc 35.938 (41.346)	Top-5 acc 61.719 (65.492)	lr 0.02383
Train [17][2240/3239]	Time 0.586 (0.886)	Data Time 0.001 (0.010)	Loss 3.5240 (3.4846)	Entropy 1.13658 (1.15588)	Top-1 acc 38.281 (41.336)	Top-5 acc 64.844 (65.486)	lr 0.02383
Train [17][2250/3239]	Time 0.746 (0.886)	Data Time 0.001 (0.010)	Loss 3.2489 (3.4848)	Entropy 1.13670 (1.15579)	Top-1 acc 45.703 (41.328)	Top-5 acc 71.094 (65.481)	lr 0.02383
Train [17][2260/3239]	Time 0.637 (0.886)	Data Time 0.003 (0.010)	Loss 3.4796 (3.4848)	Entropy 1.13620 (1.15571)	Top-1 acc 43.750 (41.329)	Top-5 acc 65.625 (65.482)	lr 0.02382
Train [17][2270/3239]	Time 0.593 (0.886)	Data Time 0.001 (0.010)	Loss 3.5767 (3.4846)	Entropy 1.13574 (1.15562)	Top-1 acc 41.406 (41.337)	Top-5 acc 64.844 (65.485)	lr 0.02382
Train [17][2280/3239]	Time 0.611 (0.886)	Data Time 0.002 (0.010)	Loss 3.3492 (3.4845)	Entropy 1.13503 (1.15553)	Top-1 acc 44.922 (41.347)	Top-5 acc 70.312 (65.486)	lr 0.02382
Train [17][2290/3239]	Time 0.645 (0.886)	Data Time 0.002 (0.010)	Loss 3.2798 (3.4845)	Entropy 1.13503 (1.15544)	Top-1 acc 47.656 (41.347)	Top-5 acc 71.094 (65.484)	lr 0.02382
Train [17][2300/3239]	Time 0.599 (0.885)	Data Time 0.001 (0.010)	Loss 3.4342 (3.4844)	Entropy 1.13489 (1.15535)	Top-1 acc 41.016 (41.351)	Top-5 acc 67.188 (65.486)	lr 0.02382
Train [17][2310/3239]	Time 0.632 (0.885)	Data Time 0.002 (0.010)	Loss 3.3389 (3.4845)	Entropy 1.13527 (1.15527)	Top-1 acc 41.797 (41.349)	Top-5 acc 71.484 (65.482)	lr 0.02382
Train [17][2320/3239]	Time 0.656 (0.885)	Data Time 0.001 (0.010)	Loss 3.3639 (3.4843)	Entropy 1.13536 (1.15518)	Top-1 acc 44.531 (41.354)	Top-5 acc 69.531 (65.483)	lr 0.02382
Train [17][2330/3239]	Time 0.612 (0.885)	Data Time 0.001 (0.010)	Loss 3.5246 (3.4840)	Entropy 1.13515 (1.15509)	Top-1 acc 39.062 (41.361)	Top-5 acc 64.844 (65.486)	lr 0.02382
Train [17][2340/3239]	Time 0.593 (0.885)	Data Time 0.001 (0.010)	Loss 3.6654 (3.4844)	Entropy 1.13495 (1.15501)	Top-1 acc 40.234 (41.359)	Top-5 acc 63.281 (65.478)	lr 0.02382
Train [17][2350/3239]	Time 0.542 (0.885)	Data Time 0.002 (0.010)	Loss 3.6228 (3.4843)	Entropy 1.13469 (1.15492)	Top-1 acc 39.844 (41.361)	Top-5 acc 61.719 (65.481)	lr 0.02382
Train [17][2360/3239]	Time 0.592 (0.885)	Data Time 0.001 (0.010)	Loss 3.4295 (3.4845)	Entropy 1.13473 (1.15484)	Top-1 acc 45.703 (41.358)	Top-5 acc 68.750 (65.478)	lr 0.02382
Train [17][2370/3239]	Time 0.593 (0.884)	Data Time 0.001 (0.010)	Loss 3.4952 (3.4848)	Entropy 1.13501 (1.15475)	Top-1 acc 41.016 (41.356)	Top-5 acc 62.500 (65.476)	lr 0.02382
Train [17][2380/3239]	Time 0.585 (0.884)	Data Time 0.001 (0.010)	Loss 3.4673 (3.4848)	Entropy 1.13481 (1.15467)	Top-1 acc 41.016 (41.354)	Top-5 acc 66.406 (65.477)	lr 0.02382
Train [17][2390/3239]	Time 0.455 (0.884)	Data Time 0.001 (0.009)	Loss 3.4635 (3.4849)	Entropy 1.13441 (1.15459)	Top-1 acc 42.188 (41.356)	Top-5 acc 63.281 (65.473)	lr 0.02382
Train [17][2400/3239]	Time 0.571 (0.884)	Data Time 0.001 (0.009)	Loss 3.6470 (3.4847)	Entropy 1.13435 (1.15450)	Top-1 acc 40.234 (41.362)	Top-5 acc 58.203 (65.478)	lr 0.02382
Train [17][2410/3239]	Time 0.610 (0.884)	Data Time 0.001 (0.009)	Loss 3.5684 (3.4847)	Entropy 1.13424 (1.15442)	Top-1 acc 39.844 (41.360)	Top-5 acc 62.109 (65.479)	lr 0.02382
Train [17][2420/3239]	Time 0.592 (0.883)	Data Time 0.002 (0.009)	Loss 3.6495 (3.4847)	Entropy 1.13458 (1.15434)	Top-1 acc 39.453 (41.358)	Top-5 acc 61.328 (65.477)	lr 0.02382
Train [17][2430/3239]	Time 0.633 (0.883)	Data Time 0.001 (0.009)	Loss 3.5423 (3.4847)	Entropy 1.13490 (1.15425)	Top-1 acc 42.188 (41.355)	Top-5 acc 64.453 (65.476)	lr 0.02382
Train [17][2440/3239]	Time 0.601 (0.883)	Data Time 0.001 (0.009)	Loss 3.4908 (3.4845)	Entropy 1.13432 (1.15418)	Top-1 acc 39.844 (41.361)	Top-5 acc 63.672 (65.478)	lr 0.02382
Train [17][2450/3239]	Time 0.672 (0.883)	Data Time 0.001 (0.009)	Loss 3.4064 (3.4847)	Entropy 1.13408 (1.15409)	Top-1 acc 44.531 (41.360)	Top-5 acc 67.969 (65.474)	lr 0.02382
Train [17][2460/3239]	Time 0.546 (0.883)	Data Time 0.001 (0.009)	Loss 3.6715 (3.4850)	Entropy 1.13382 (1.15401)	Top-1 acc 34.766 (41.352)	Top-5 acc 63.672 (65.468)	lr 0.02382
Train [17][2470/3239]	Time 0.554 (0.883)	Data Time 0.001 (0.009)	Loss 3.5540 (3.4850)	Entropy 1.13343 (1.15393)	Top-1 acc 42.969 (41.353)	Top-5 acc 65.625 (65.467)	lr 0.02382
Train [17][2480/3239]	Time 0.743 (0.883)	Data Time 0.002 (0.009)	Loss 3.4891 (3.4850)	Entropy 1.13290 (1.15385)	Top-1 acc 42.578 (41.351)	Top-5 acc 62.500 (65.468)	lr 0.02382
Train [17][2490/3239]	Time 0.620 (0.883)	Data Time 0.001 (0.009)	Loss 3.5917 (3.4848)	Entropy 1.13273 (1.15376)	Top-1 acc 39.844 (41.349)	Top-5 acc 61.328 (65.468)	lr 0.02381
Train [17][2500/3239]	Time 0.611 (0.891)	Data Time 0.002 (0.009)	Loss 3.7296 (3.4849)	Entropy 1.13280 (1.15368)	Top-1 acc 36.328 (41.354)	Top-5 acc 58.984 (65.472)	lr 0.02381
Train [17][2510/3239]	Time 0.622 (0.891)	Data Time 0.002 (0.009)	Loss 3.3332 (3.4846)	Entropy 1.13302 (1.15360)	Top-1 acc 41.797 (41.358)	Top-5 acc 68.750 (65.471)	lr 0.02381
Train [17][2520/3239]	Time 0.472 (0.891)	Data Time 0.001 (0.009)	Loss 3.4089 (3.4847)	Entropy 1.13306 (1.15352)	Top-1 acc 43.359 (41.357)	Top-5 acc 69.922 (65.469)	lr 0.02381
Train [17][2530/3239]	Time 0.625 (0.891)	Data Time 0.001 (0.009)	Loss 3.3865 (3.4848)	Entropy 1.13293 (1.15343)	Top-1 acc 44.141 (41.356)	Top-5 acc 65.234 (65.468)	lr 0.02381
Train [17][2540/3239]	Time 0.593 (0.890)	Data Time 0.001 (0.009)	Loss 3.6004 (3.4851)	Entropy 1.13322 (1.15335)	Top-1 acc 42.578 (41.351)	Top-5 acc 58.594 (65.459)	lr 0.02381
Train [17][2550/3239]	Time 0.577 (0.890)	Data Time 0.001 (0.009)	Loss 3.3762 (3.4851)	Entropy 1.13295 (1.15327)	Top-1 acc 40.234 (41.351)	Top-5 acc 67.969 (65.458)	lr 0.02381
Train [17][2560/3239]	Time 0.618 (0.890)	Data Time 0.001 (0.009)	Loss 3.4611 (3.4850)	Entropy 1.13314 (1.15320)	Top-1 acc 39.062 (41.351)	Top-5 acc 64.453 (65.458)	lr 0.02381
Train [17][2570/3239]	Time 0.624 (0.890)	Data Time 0.002 (0.009)	Loss 3.4393 (3.4851)	Entropy 1.13307 (1.15312)	Top-1 acc 42.188 (41.349)	Top-5 acc 62.500 (65.454)	lr 0.02381
Train [17][2580/3239]	Time 0.580 (0.890)	Data Time 0.001 (0.009)	Loss 3.5712 (3.4851)	Entropy 1.13302 (1.15304)	Top-1 acc 38.281 (41.345)	Top-5 acc 59.766 (65.450)	lr 0.02381
Train [17][2590/3239]	Time 0.602 (0.890)	Data Time 0.001 (0.009)	Loss 3.4691 (3.4850)	Entropy 1.13246 (1.15296)	Top-1 acc 41.016 (41.342)	Top-5 acc 63.281 (65.453)	lr 0.02381
Train [17][2600/3239]	Time 0.598 (0.890)	Data Time 0.001 (0.009)	Loss 3.5790 (3.4851)	Entropy 1.13270 (1.15288)	Top-1 acc 37.109 (41.337)	Top-5 acc 65.625 (65.449)	lr 0.02381
Train [17][2610/3239]	Time 0.612 (0.890)	Data Time 0.001 (0.009)	Loss 3.3804 (3.4850)	Entropy 1.13253 (1.15281)	Top-1 acc 42.188 (41.344)	Top-5 acc 67.969 (65.450)	lr 0.02381
Train [17][2620/3239]	Time 0.567 (0.890)	Data Time 0.001 (0.009)	Loss 3.5194 (3.4849)	Entropy 1.13218 (1.15273)	Top-1 acc 41.406 (41.345)	Top-5 acc 64.844 (65.456)	lr 0.02381
Train [17][2630/3239]	Time 0.587 (0.890)	Data Time 0.001 (0.009)	Loss 3.4533 (3.4847)	Entropy 1.13165 (1.15265)	Top-1 acc 44.922 (41.355)	Top-5 acc 67.969 (65.461)	lr 0.02381
Train [17][2640/3239]	Time 0.658 (0.889)	Data Time 0.002 (0.009)	Loss 3.7404 (3.4850)	Entropy 1.13147 (1.15257)	Top-1 acc 36.719 (41.348)	Top-5 acc 61.328 (65.452)	lr 0.02381
Train [17][2650/3239]	Time 0.588 (0.889)	Data Time 0.001 (0.009)	Loss 3.7673 (3.4852)	Entropy 1.13163 (1.15249)	Top-1 acc 32.812 (41.341)	Top-5 acc 60.156 (65.449)	lr 0.02381
Train [17][2660/3239]	Time 0.615 (0.889)	Data Time 0.001 (0.009)	Loss 3.4153 (3.4852)	Entropy 1.13105 (1.15241)	Top-1 acc 41.797 (41.340)	Top-5 acc 67.969 (65.448)	lr 0.02381
Train [17][2670/3239]	Time 0.614 (0.889)	Data Time 0.001 (0.009)	Loss 3.5250 (3.4851)	Entropy 1.13052 (1.15233)	Top-1 acc 38.281 (41.340)	Top-5 acc 65.625 (65.448)	lr 0.02381
Train [17][2680/3239]	Time 0.643 (0.889)	Data Time 0.001 (0.009)	Loss 3.3339 (3.4848)	Entropy 1.13022 (1.15225)	Top-1 acc 43.750 (41.346)	Top-5 acc 67.188 (65.454)	lr 0.02381
Train [17][2690/3239]	Time 0.566 (0.889)	Data Time 0.001 (0.009)	Loss 3.5682 (3.4848)	Entropy 1.13023 (1.15217)	Top-1 acc 37.500 (41.349)	Top-5 acc 62.109 (65.454)	lr 0.02381
Train [17][2700/3239]	Time 0.569 (0.888)	Data Time 0.001 (0.009)	Loss 3.3676 (3.4848)	Entropy 1.13061 (1.15209)	Top-1 acc 42.969 (41.347)	Top-5 acc 66.797 (65.452)	lr 0.02381
Train [17][2710/3239]	Time 0.730 (0.888)	Data Time 0.003 (0.009)	Loss 3.5723 (3.4851)	Entropy 1.13064 (1.15201)	Top-1 acc 35.547 (41.340)	Top-5 acc 64.453 (65.445)	lr 0.02381
Train [17][2720/3239]	Time 0.600 (0.888)	Data Time 0.001 (0.009)	Loss 3.4877 (3.4849)	Entropy 1.13016 (1.15193)	Top-1 acc 42.969 (41.347)	Top-5 acc 63.672 (65.446)	lr 0.02380
Train [17][2730/3239]	Time 0.618 (0.888)	Data Time 0.001 (0.009)	Loss 3.5001 (3.4850)	Entropy 1.12993 (1.15185)	Top-1 acc 39.062 (41.344)	Top-5 acc 60.547 (65.442)	lr 0.02380
Train [17][2740/3239]	Time 0.566 (0.888)	Data Time 0.001 (0.009)	Loss 3.6250 (3.4850)	Entropy 1.12989 (1.15177)	Top-1 acc 36.719 (41.348)	Top-5 acc 63.281 (65.441)	lr 0.02380
Train [17][2750/3239]	Time 0.610 (0.888)	Data Time 0.002 (0.009)	Loss 3.6343 (3.4850)	Entropy 1.12988 (1.15169)	Top-1 acc 36.719 (41.349)	Top-5 acc 62.109 (65.443)	lr 0.02380
Train [17][2760/3239]	Time 0.609 (0.888)	Data Time 0.001 (0.009)	Loss 3.2721 (3.4851)	Entropy 1.12979 (1.15161)	Top-1 acc 44.922 (41.345)	Top-5 acc 71.875 (65.444)	lr 0.02380
Train [17][2770/3239]	Time 0.600 (0.888)	Data Time 0.001 (0.008)	Loss 3.3344 (3.4852)	Entropy 1.13006 (1.15153)	Top-1 acc 44.531 (41.344)	Top-5 acc 70.312 (65.443)	lr 0.02380
Train [17][2780/3239]	Time 0.630 (0.888)	Data Time 0.002 (0.008)	Loss 3.5420 (3.4853)	Entropy 1.13010 (1.15145)	Top-1 acc 39.062 (41.344)	Top-5 acc 64.844 (65.441)	lr 0.02380
Train [17][2790/3239]	Time 0.553 (0.887)	Data Time 0.001 (0.008)	Loss 3.2597 (3.4852)	Entropy 1.13006 (1.15138)	Top-1 acc 45.312 (41.346)	Top-5 acc 72.266 (65.443)	lr 0.02380
Train [17][2800/3239]	Time 0.558 (0.887)	Data Time 0.002 (0.008)	Loss 3.7449 (3.4853)	Entropy 1.12973 (1.15130)	Top-1 acc 35.938 (41.342)	Top-5 acc 62.500 (65.439)	lr 0.02380
Train [17][2810/3239]	Time 0.597 (0.887)	Data Time 0.001 (0.008)	Loss 3.5244 (3.4855)	Entropy 1.12939 (1.15122)	Top-1 acc 39.844 (41.336)	Top-5 acc 63.672 (65.434)	lr 0.02380
Train [17][2820/3239]	Time 0.610 (0.887)	Data Time 0.001 (0.008)	Loss 3.3550 (3.4854)	Entropy 1.12910 (1.15114)	Top-1 acc 44.922 (41.340)	Top-5 acc 65.234 (65.433)	lr 0.02380
Train [17][2830/3239]	Time 0.565 (0.887)	Data Time 0.001 (0.008)	Loss 3.4994 (3.4855)	Entropy 1.12887 (1.15107)	Top-1 acc 43.359 (41.341)	Top-5 acc 67.188 (65.433)	lr 0.02380
Train [17][2840/3239]	Time 0.636 (0.887)	Data Time 0.001 (0.008)	Loss 3.4028 (3.4855)	Entropy 1.12896 (1.15099)	Top-1 acc 47.656 (41.348)	Top-5 acc 68.750 (65.433)	lr 0.02380
Train [17][2850/3239]	Time 0.439 (0.887)	Data Time 0.001 (0.008)	Loss 3.3548 (3.4854)	Entropy 1.12890 (1.15091)	Top-1 acc 44.922 (41.351)	Top-5 acc 68.750 (65.432)	lr 0.02380
Train [17][2860/3239]	Time 0.646 (0.887)	Data Time 0.001 (0.008)	Loss 3.5145 (3.4856)	Entropy 1.12905 (1.15083)	Top-1 acc 41.406 (41.347)	Top-5 acc 67.578 (65.428)	lr 0.02380
Train [17][2870/3239]	Time 0.736 (0.886)	Data Time 0.001 (0.008)	Loss 3.3258 (3.4854)	Entropy 1.12864 (1.15076)	Top-1 acc 44.531 (41.350)	Top-5 acc 67.969 (65.434)	lr 0.02380
Train [17][2880/3239]	Time 0.608 (0.886)	Data Time 0.001 (0.008)	Loss 3.6157 (3.4852)	Entropy 1.12866 (1.15068)	Top-1 acc 39.062 (41.358)	Top-5 acc 64.062 (65.435)	lr 0.02380
Train [17][2890/3239]	Time 0.594 (0.886)	Data Time 0.001 (0.008)	Loss 3.8317 (3.4854)	Entropy 1.12835 (1.15061)	Top-1 acc 38.281 (41.356)	Top-5 acc 59.766 (65.433)	lr 0.02380
Train [17][2900/3239]	Time 0.634 (0.886)	Data Time 0.002 (0.008)	Loss 3.5104 (3.4856)	Entropy 1.12852 (1.15053)	Top-1 acc 41.797 (41.351)	Top-5 acc 65.625 (65.430)	lr 0.02380
Train [17][2910/3239]	Time 0.603 (0.886)	Data Time 0.001 (0.008)	Loss 3.6997 (3.4858)	Entropy 1.12836 (1.15045)	Top-1 acc 38.281 (41.348)	Top-5 acc 58.594 (65.423)	lr 0.02380
Train [17][2920/3239]	Time 0.568 (0.886)	Data Time 0.002 (0.008)	Loss 3.3403 (3.4857)	Entropy 1.12795 (1.15038)	Top-1 acc 45.703 (41.351)	Top-5 acc 69.922 (65.428)	lr 0.02380
Train [17][2930/3239]	Time 0.603 (0.886)	Data Time 0.001 (0.008)	Loss 3.5161 (3.4858)	Entropy 1.12761 (1.15030)	Top-1 acc 35.938 (41.347)	Top-5 acc 64.844 (65.426)	lr 0.02380
Train [17][2940/3239]	Time 0.722 (0.886)	Data Time 0.001 (0.008)	Loss 3.2796 (3.4857)	Entropy 1.12784 (1.15022)	Top-1 acc 49.219 (41.354)	Top-5 acc 69.141 (65.429)	lr 0.02380
Train [17][2950/3239]	Time 0.611 (0.886)	Data Time 0.001 (0.008)	Loss 3.4348 (3.4857)	Entropy 1.12772 (1.15015)	Top-1 acc 40.625 (41.352)	Top-5 acc 69.922 (65.431)	lr 0.02379
Train [17][2960/3239]	Time 0.610 (0.885)	Data Time 0.001 (0.008)	Loss 3.3630 (3.4858)	Entropy 1.12770 (1.15007)	Top-1 acc 45.703 (41.353)	Top-5 acc 67.578 (65.429)	lr 0.02379
Train [17][2970/3239]	Time 0.592 (0.885)	Data Time 0.001 (0.008)	Loss 3.2820 (3.4858)	Entropy 1.12780 (1.15000)	Top-1 acc 47.266 (41.352)	Top-5 acc 68.359 (65.432)	lr 0.02379
Train [17][2980/3239]	Time 0.633 (0.885)	Data Time 0.001 (0.008)	Loss 3.6128 (3.4859)	Entropy 1.12775 (1.14992)	Top-1 acc 37.891 (41.350)	Top-5 acc 62.109 (65.429)	lr 0.02379
Train [17][2990/3239]	Time 0.585 (0.885)	Data Time 0.001 (0.008)	Loss 3.4454 (3.4859)	Entropy 1.12755 (1.14985)	Top-1 acc 42.969 (41.346)	Top-5 acc 66.797 (65.427)	lr 0.02379
Train [17][3000/3239]	Time 0.647 (0.885)	Data Time 0.001 (0.008)	Loss 3.2289 (3.4861)	Entropy 1.12770 (1.14977)	Top-1 acc 46.094 (41.343)	Top-5 acc 70.703 (65.424)	lr 0.02379
Train [17][3010/3239]	Time 0.652 (0.885)	Data Time 0.001 (0.008)	Loss 3.4212 (3.4860)	Entropy 1.12775 (1.14970)	Top-1 acc 42.578 (41.348)	Top-5 acc 66.406 (65.426)	lr 0.02379
Train [17][3020/3239]	Time 0.557 (0.885)	Data Time 0.001 (0.008)	Loss 3.4169 (3.4858)	Entropy 1.12777 (1.14963)	Top-1 acc 44.531 (41.344)	Top-5 acc 67.188 (65.427)	lr 0.02379
Train [17][3030/3239]	Time 0.659 (0.885)	Data Time 0.001 (0.008)	Loss 3.4476 (3.4856)	Entropy 1.12747 (1.14955)	Top-1 acc 42.188 (41.347)	Top-5 acc 65.234 (65.432)	lr 0.02379
Train [17][3040/3239]	Time 0.562 (0.885)	Data Time 0.001 (0.008)	Loss 3.4534 (3.4854)	Entropy 1.12747 (1.14948)	Top-1 acc 42.969 (41.352)	Top-5 acc 67.578 (65.434)	lr 0.02379
Train [17][3050/3239]	Time 0.571 (0.884)	Data Time 0.001 (0.008)	Loss 3.3854 (3.4855)	Entropy 1.12728 (1.14941)	Top-1 acc 43.750 (41.349)	Top-5 acc 67.188 (65.433)	lr 0.02379
Train [17][3060/3239]	Time 0.618 (0.884)	Data Time 0.001 (0.008)	Loss 3.4347 (3.4856)	Entropy 1.12745 (1.14934)	Top-1 acc 40.625 (41.348)	Top-5 acc 66.797 (65.433)	lr 0.02379
Train [17][3070/3239]	Time 0.575 (0.884)	Data Time 0.001 (0.008)	Loss 3.5436 (3.4855)	Entropy 1.12731 (1.14927)	Top-1 acc 38.281 (41.350)	Top-5 acc 65.234 (65.433)	lr 0.02379
Train [17][3080/3239]	Time 0.641 (0.884)	Data Time 0.001 (0.008)	Loss 3.3857 (3.4854)	Entropy 1.12707 (1.14919)	Top-1 acc 44.531 (41.352)	Top-5 acc 67.188 (65.435)	lr 0.02379
Train [17][3090/3239]	Time 0.615 (0.884)	Data Time 0.001 (0.008)	Loss 3.4575 (3.4854)	Entropy 1.12670 (1.14912)	Top-1 acc 40.234 (41.354)	Top-5 acc 66.797 (65.435)	lr 0.02379
Train [17][3100/3239]	Time 0.681 (0.884)	Data Time 0.001 (0.008)	Loss 3.5635 (3.4856)	Entropy 1.12692 (1.14905)	Top-1 acc 38.672 (41.352)	Top-5 acc 64.062 (65.431)	lr 0.02379
Train [17][3110/3239]	Time 0.598 (0.884)	Data Time 0.001 (0.008)	Loss 3.5672 (3.4856)	Entropy 1.12663 (1.14898)	Top-1 acc 33.203 (41.347)	Top-5 acc 67.969 (65.432)	lr 0.02379
Train [17][3120/3239]	Time 0.615 (0.884)	Data Time 0.001 (0.008)	Loss 3.2706 (3.4854)	Entropy 1.12691 (1.14891)	Top-1 acc 44.922 (41.355)	Top-5 acc 69.922 (65.437)	lr 0.02379
Train [17][3130/3239]	Time 0.644 (0.884)	Data Time 0.001 (0.008)	Loss 3.7086 (3.4854)	Entropy 1.12691 (1.14884)	Top-1 acc 41.406 (41.359)	Top-5 acc 58.203 (65.438)	lr 0.02379
Train [17][3140/3239]	Time 0.593 (0.884)	Data Time 0.002 (0.008)	Loss 3.4249 (3.4852)	Entropy 1.12710 (1.14877)	Top-1 acc 44.141 (41.363)	Top-5 acc 66.797 (65.442)	lr 0.02379
Train [17][3150/3239]	Time 0.758 (0.891)	Data Time 0.005 (0.008)	Loss 3.4697 (3.4853)	Entropy 1.12693 (1.14870)	Top-1 acc 41.016 (41.362)	Top-5 acc 63.672 (65.440)	lr 0.02379
Train [17][3160/3239]	Time 0.632 (0.890)	Data Time 0.002 (0.008)	Loss 3.6611 (3.4852)	Entropy 1.12670 (1.14863)	Top-1 acc 38.281 (41.363)	Top-5 acc 59.766 (65.442)	lr 0.02379
Train [17][3170/3239]	Time 0.621 (0.890)	Data Time 0.002 (0.008)	Loss 3.4687 (3.4851)	Entropy 1.12654 (1.14856)	Top-1 acc 42.969 (41.364)	Top-5 acc 65.234 (65.447)	lr 0.02379
Train [17][3180/3239]	Time 0.569 (0.890)	Data Time 0.000 (0.008)	Loss 3.5953 (3.4851)	Entropy 1.12647 (1.14849)	Top-1 acc 37.891 (41.362)	Top-5 acc 62.891 (65.446)	lr 0.02378
Train [17][3190/3239]	Time 0.680 (0.890)	Data Time 0.000 (0.008)	Loss 3.5957 (3.4850)	Entropy 1.12622 (1.14842)	Top-1 acc 39.453 (41.367)	Top-5 acc 63.672 (65.447)	lr 0.02378
Train [17][3200/3239]	Time 0.638 (0.890)	Data Time 0.000 (0.008)	Loss 3.2171 (3.4848)	Entropy 1.12639 (1.14835)	Top-1 acc 48.438 (41.372)	Top-5 acc 68.750 (65.451)	lr 0.02378
Train [17][3210/3239]	Time 0.623 (0.889)	Data Time 0.000 (0.008)	Loss 3.4807 (3.4847)	Entropy 1.12613 (1.14828)	Top-1 acc 39.844 (41.375)	Top-5 acc 63.672 (65.453)	lr 0.02378
Train [17][3220/3239]	Time 0.518 (0.889)	Data Time 0.000 (0.008)	Loss 3.6925 (3.4847)	Entropy 1.12614 (1.14822)	Top-1 acc 34.766 (41.375)	Top-5 acc 60.938 (65.454)	lr 0.02378
Train [17][3230/3239]	Time 0.585 (0.889)	Data Time 0.000 (0.008)	Loss 3.5760 (3.4847)	Entropy 1.12592 (1.14815)	Top-1 acc 38.281 (41.374)	Top-5 acc 64.844 (65.450)	lr 0.02378
Train [17][3239/3239]	Time 1.568 (0.889)	Data Time 0.000 (0.008)	Loss 3.6918 (3.4848)	Entropy 1.12576 (1.14809)	Top-1 acc 38.272 (41.375)	Top-5 acc 66.667 (65.449)	lr 0.02378
==========Valid [17/120]	loss 2.232	top-1 acc 51.199 (51.199)	top-5 acc 75.136	Train top-1 41.375	top-5 65.449	Entropy 1.12576	Latency-None: 0.000ms	Flops: 539.76M
Train [18][0/3239]	Time 22.201 (22.201)	Data Time 21.201 (21.201)	Loss 3.4388 (3.4388)	Entropy 1.12590 (1.12590)	Top-1 acc 42.969 (42.969)	Top-5 acc 64.844 (64.844)	lr 0.02378
Train [18][10/3239]	Time 0.656 (2.884)	Data Time 0.001 (1.929)	Loss 3.5584 (3.5131)	Entropy 1.12616 (1.12596)	Top-1 acc 37.500 (40.057)	Top-5 acc 65.234 (64.560)	lr 0.02378
Train [18][20/3239]	Time 0.677 (1.922)	Data Time 0.001 (1.011)	Loss 3.3315 (3.4648)	Entropy 1.12616 (1.12611)	Top-1 acc 44.922 (41.685)	Top-5 acc 66.797 (65.439)	lr 0.02378
Train [18][30/3239]	Time 0.541 (1.577)	Data Time 0.001 (0.686)	Loss 3.5318 (3.4798)	Entropy 1.12606 (1.12613)	Top-1 acc 40.234 (41.381)	Top-5 acc 64.844 (65.285)	lr 0.02378
Train [18][40/3239]	Time 0.596 (1.406)	Data Time 0.001 (0.519)	Loss 3.4375 (3.4672)	Entropy 1.12610 (1.12610)	Top-1 acc 39.062 (41.673)	Top-5 acc 64.453 (65.701)	lr 0.02378
Train [18][50/3239]	Time 0.576 (1.300)	Data Time 0.001 (0.418)	Loss 3.3652 (3.4580)	Entropy 1.12632 (1.12612)	Top-1 acc 44.922 (42.004)	Top-5 acc 66.016 (65.755)	lr 0.02378
Train [18][60/3239]	Time 0.579 (1.228)	Data Time 0.001 (0.350)	Loss 3.5441 (3.4639)	Entropy 1.12580 (1.12614)	Top-1 acc 37.891 (41.925)	Top-5 acc 65.234 (65.747)	lr 0.02378
Train [18][70/3239]	Time 0.617 (1.184)	Data Time 0.002 (0.301)	Loss 3.5214 (3.4580)	Entropy 1.12563 (1.12608)	Top-1 acc 39.453 (42.050)	Top-5 acc 64.844 (65.977)	lr 0.02378
Train [18][80/3239]	Time 0.567 (1.145)	Data Time 0.001 (0.264)	Loss 3.4268 (3.4558)	Entropy 1.12568 (1.12603)	Top-1 acc 41.016 (42.077)	Top-5 acc 67.969 (66.016)	lr 0.02378
Train [18][90/3239]	Time 0.651 (1.113)	Data Time 0.002 (0.235)	Loss 3.4016 (3.4522)	Entropy 1.12598 (1.12600)	Top-1 acc 42.188 (42.145)	Top-5 acc 65.234 (66.037)	lr 0.02378
Train [18][100/3239]	Time 0.605 (1.086)	Data Time 0.001 (0.212)	Loss 3.5064 (3.4511)	Entropy 1.12589 (1.12600)	Top-1 acc 44.531 (42.199)	Top-5 acc 64.844 (66.108)	lr 0.02378
Train [18][110/3239]	Time 0.549 (1.064)	Data Time 0.001 (0.193)	Loss 3.4529 (3.4560)	Entropy 1.12604 (1.12599)	Top-1 acc 44.141 (42.068)	Top-5 acc 67.188 (66.167)	lr 0.02378
Train [18][120/3239]	Time 0.600 (1.047)	Data Time 0.001 (0.177)	Loss 3.3729 (3.4490)	Entropy 1.12597 (1.12599)	Top-1 acc 45.312 (42.300)	Top-5 acc 70.312 (66.329)	lr 0.02378
Train [18][130/3239]	Time 0.600 (1.030)	Data Time 0.001 (0.164)	Loss 3.3234 (3.4506)	Entropy 1.12568 (1.12598)	Top-1 acc 43.750 (42.331)	Top-5 acc 68.359 (66.350)	lr 0.02378
Train [18][140/3239]	Time 0.480 (1.015)	Data Time 0.001 (0.152)	Loss 3.4359 (3.4572)	Entropy 1.12515 (1.12594)	Top-1 acc 45.312 (42.221)	Top-5 acc 66.016 (66.187)	lr 0.02378
Train [18][150/3239]	Time 0.555 (1.003)	Data Time 0.001 (0.142)	Loss 3.2290 (3.4527)	Entropy 1.12513 (1.12589)	Top-1 acc 46.484 (42.219)	Top-5 acc 72.656 (66.321)	lr 0.02378
Train [18][160/3239]	Time 0.606 (0.995)	Data Time 0.001 (0.134)	Loss 3.3346 (3.4533)	Entropy 1.12473 (1.12584)	Top-1 acc 40.234 (42.190)	Top-5 acc 66.797 (66.283)	lr 0.02378
Train [18][170/3239]	Time 0.569 (0.986)	Data Time 0.001 (0.126)	Loss 3.4106 (3.4545)	Entropy 1.12451 (1.12577)	Top-1 acc 40.625 (42.160)	Top-5 acc 65.234 (66.260)	lr 0.02377
Train [18][180/3239]	Time 0.598 (0.979)	Data Time 0.001 (0.119)	Loss 3.6659 (3.4557)	Entropy 1.12459 (1.12570)	Top-1 acc 37.500 (42.110)	Top-5 acc 60.547 (66.229)	lr 0.02377
Train [18][190/3239]	Time 0.568 (0.972)	Data Time 0.001 (0.113)	Loss 3.7355 (3.4566)	Entropy 1.12469 (1.12564)	Top-1 acc 34.766 (42.018)	Top-5 acc 60.547 (66.194)	lr 0.02377
Train [18][200/3239]	Time 0.630 (0.967)	Data Time 0.001 (0.108)	Loss 3.3480 (3.4556)	Entropy 1.12471 (1.12559)	Top-1 acc 42.969 (42.005)	Top-5 acc 68.359 (66.179)	lr 0.02377
Train [18][210/3239]	Time 0.629 (0.962)	Data Time 0.002 (0.103)	Loss 3.5051 (3.4573)	Entropy 1.12431 (1.12554)	Top-1 acc 40.625 (41.945)	Top-5 acc 60.938 (66.093)	lr 0.02377
Train [18][220/3239]	Time 0.602 (0.957)	Data Time 0.001 (0.098)	Loss 3.3882 (3.4563)	Entropy 1.12409 (1.12549)	Top-1 acc 42.578 (41.956)	Top-5 acc 69.531 (66.136)	lr 0.02377
Train [18][230/3239]	Time 0.618 (0.953)	Data Time 0.001 (0.094)	Loss 3.4615 (3.4565)	Entropy 1.12400 (1.12542)	Top-1 acc 45.312 (41.963)	Top-5 acc 66.406 (66.114)	lr 0.02377
Train [18][240/3239]	Time 0.608 (0.949)	Data Time 0.001 (0.090)	Loss 3.3848 (3.4570)	Entropy 1.12367 (1.12536)	Top-1 acc 41.797 (41.949)	Top-5 acc 68.750 (66.111)	lr 0.02377
Train [18][250/3239]	Time 0.720 (0.945)	Data Time 0.001 (0.087)	Loss 3.3745 (3.4565)	Entropy 1.12308 (1.12528)	Top-1 acc 43.750 (41.988)	Top-5 acc 67.188 (66.103)	lr 0.02377
Train [18][260/3239]	Time 0.636 (0.942)	Data Time 0.002 (0.083)	Loss 3.2389 (3.4547)	Entropy 1.12288 (1.12519)	Top-1 acc 45.703 (42.020)	Top-5 acc 70.703 (66.104)	lr 0.02377
Train [18][270/3239]	Time 0.656 (0.938)	Data Time 0.001 (0.080)	Loss 3.5256 (3.4537)	Entropy 1.12218 (1.12510)	Top-1 acc 43.359 (42.046)	Top-5 acc 67.969 (66.148)	lr 0.02377
Train [18][280/3239]	Time 0.616 (0.936)	Data Time 0.001 (0.077)	Loss 3.4463 (3.4529)	Entropy 1.12166 (1.12498)	Top-1 acc 34.766 (41.990)	Top-5 acc 68.750 (66.194)	lr 0.02377
Train [18][290/3239]	Time 0.607 (0.932)	Data Time 0.001 (0.075)	Loss 3.6100 (3.4525)	Entropy 1.12155 (1.12486)	Top-1 acc 42.578 (42.018)	Top-5 acc 60.938 (66.186)	lr 0.02377
Train [18][300/3239]	Time 0.475 (0.929)	Data Time 0.001 (0.072)	Loss 3.3476 (3.4518)	Entropy 1.12163 (1.12476)	Top-1 acc 42.969 (42.021)	Top-5 acc 69.141 (66.188)	lr 0.02377
Train [18][310/3239]	Time 0.597 (0.925)	Data Time 0.002 (0.070)	Loss 3.6129 (3.4524)	Entropy 1.12146 (1.12465)	Top-1 acc 42.578 (42.028)	Top-5 acc 62.500 (66.193)	lr 0.02377
Train [18][320/3239]	Time 0.703 (0.922)	Data Time 0.001 (0.068)	Loss 3.2454 (3.4500)	Entropy 1.12127 (1.12455)	Top-1 acc 47.656 (42.044)	Top-5 acc 71.875 (66.231)	lr 0.02377
Train [18][330/3239]	Time 0.594 (0.919)	Data Time 0.001 (0.066)	Loss 3.3426 (3.4488)	Entropy 1.12094 (1.12445)	Top-1 acc 42.188 (42.035)	Top-5 acc 67.969 (66.235)	lr 0.02377
Train [18][340/3239]	Time 0.562 (0.917)	Data Time 0.001 (0.064)	Loss 3.6011 (3.4494)	Entropy 1.12040 (1.12434)	Top-1 acc 39.062 (42.010)	Top-5 acc 62.891 (66.237)	lr 0.02377
Train [18][350/3239]	Time 0.600 (0.916)	Data Time 0.001 (0.062)	Loss 3.5881 (3.4490)	Entropy 1.12031 (1.12423)	Top-1 acc 39.844 (42.034)	Top-5 acc 61.719 (66.257)	lr 0.02377
Train [18][360/3239]	Time 0.648 (0.913)	Data Time 0.024 (0.061)	Loss 3.4559 (3.4504)	Entropy 1.12027 (1.12412)	Top-1 acc 39.453 (41.999)	Top-5 acc 66.406 (66.230)	lr 0.02377
Train [18][370/3239]	Time 0.661 (0.912)	Data Time 0.001 (0.059)	Loss 3.7329 (3.4503)	Entropy 1.12024 (1.12402)	Top-1 acc 36.719 (42.015)	Top-5 acc 58.594 (66.219)	lr 0.02377
Train [18][380/3239]	Time 0.577 (0.910)	Data Time 0.001 (0.058)	Loss 3.5881 (3.4503)	Entropy 1.11992 (1.12391)	Top-1 acc 39.844 (42.039)	Top-5 acc 60.547 (66.205)	lr 0.02377
Train [18][390/3239]	Time 0.598 (0.909)	Data Time 0.001 (0.056)	Loss 3.1846 (3.4486)	Entropy 1.11984 (1.12381)	Top-1 acc 49.219 (42.092)	Top-5 acc 71.484 (66.234)	lr 0.02377
Train [18][400/3239]	Time 0.599 (0.908)	Data Time 0.001 (0.055)	Loss 3.4619 (3.4492)	Entropy 1.11960 (1.12371)	Top-1 acc 39.453 (42.097)	Top-5 acc 64.844 (66.216)	lr 0.02376
Train [18][410/3239]	Time 0.685 (0.906)	Data Time 0.001 (0.054)	Loss 3.4759 (3.4486)	Entropy 1.11903 (1.12360)	Top-1 acc 39.844 (42.101)	Top-5 acc 67.188 (66.253)	lr 0.02376
Train [18][420/3239]	Time 0.655 (0.905)	Data Time 0.001 (0.052)	Loss 3.0818 (3.4473)	Entropy 1.11882 (1.12349)	Top-1 acc 46.094 (42.115)	Top-5 acc 73.047 (66.261)	lr 0.02376
Train [18][430/3239]	Time 0.600 (0.903)	Data Time 0.001 (0.051)	Loss 3.1010 (3.4467)	Entropy 1.11832 (1.12338)	Top-1 acc 51.562 (42.139)	Top-5 acc 71.094 (66.271)	lr 0.02376
Train [18][440/3239]	Time 0.588 (0.902)	Data Time 0.001 (0.050)	Loss 3.5606 (3.4487)	Entropy 1.11806 (1.12326)	Top-1 acc 38.672 (42.088)	Top-5 acc 65.625 (66.215)	lr 0.02376
Train [18][450/3239]	Time 0.609 (0.901)	Data Time 0.001 (0.049)	Loss 3.5970 (3.4490)	Entropy 1.11808 (1.12315)	Top-1 acc 37.109 (42.075)	Top-5 acc 62.500 (66.209)	lr 0.02376
Train [18][460/3239]	Time 0.523 (0.899)	Data Time 0.001 (0.048)	Loss 3.5531 (3.4495)	Entropy 1.11775 (1.12304)	Top-1 acc 41.406 (42.061)	Top-5 acc 64.062 (66.189)	lr 0.02376
Train [18][470/3239]	Time 0.537 (0.898)	Data Time 0.001 (0.047)	Loss 3.3154 (3.4491)	Entropy 1.11789 (1.12293)	Top-1 acc 45.312 (42.055)	Top-5 acc 67.188 (66.192)	lr 0.02376
Train [18][480/3239]	Time 0.664 (0.896)	Data Time 0.001 (0.046)	Loss 3.6011 (3.4512)	Entropy 1.11771 (1.12282)	Top-1 acc 38.672 (42.036)	Top-5 acc 62.109 (66.159)	lr 0.02376
Train [18][490/3239]	Time 0.616 (0.894)	Data Time 0.001 (0.045)	Loss 3.3642 (3.4512)	Entropy 1.11751 (1.12271)	Top-1 acc 44.141 (42.022)	Top-5 acc 69.531 (66.164)	lr 0.02376
Train [18][500/3239]	Time 0.594 (0.893)	Data Time 0.001 (0.044)	Loss 3.3944 (3.4513)	Entropy 1.11720 (1.12261)	Top-1 acc 41.016 (42.018)	Top-5 acc 64.844 (66.156)	lr 0.02376
Train [18][510/3239]	Time 0.582 (0.893)	Data Time 0.001 (0.043)	Loss 3.6786 (3.4513)	Entropy 1.11720 (1.12250)	Top-1 acc 38.281 (42.003)	Top-5 acc 61.719 (66.147)	lr 0.02376
Train [18][520/3239]	Time 0.623 (0.892)	Data Time 0.001 (0.043)	Loss 3.1920 (3.4499)	Entropy 1.11688 (1.12240)	Top-1 acc 48.438 (42.042)	Top-5 acc 73.047 (66.189)	lr 0.02376
Train [18][530/3239]	Time 0.578 (0.891)	Data Time 0.001 (0.042)	Loss 3.7118 (3.4501)	Entropy 1.11658 (1.12229)	Top-1 acc 36.719 (42.050)	Top-5 acc 62.500 (66.184)	lr 0.02376
Train [18][540/3239]	Time 0.568 (0.890)	Data Time 0.001 (0.041)	Loss 3.3278 (3.4510)	Entropy 1.11653 (1.12218)	Top-1 acc 44.141 (42.032)	Top-5 acc 68.359 (66.167)	lr 0.02376
Train [18][550/3239]	Time 0.696 (0.890)	Data Time 0.001 (0.040)	Loss 3.3999 (3.4506)	Entropy 1.11633 (1.12208)	Top-1 acc 42.969 (42.038)	Top-5 acc 67.188 (66.187)	lr 0.02376
Train [18][560/3239]	Time 0.621 (0.889)	Data Time 0.001 (0.040)	Loss 3.6278 (3.4511)	Entropy 1.11635 (1.12197)	Top-1 acc 38.281 (42.025)	Top-5 acc 64.062 (66.167)	lr 0.02376
Train [18][570/3239]	Time 0.592 (0.925)	Data Time 0.002 (0.039)	Loss 3.4344 (3.4516)	Entropy 1.11579 (1.12187)	Top-1 acc 39.062 (42.013)	Top-5 acc 66.016 (66.163)	lr 0.02376
Train [18][580/3239]	Time 0.648 (0.924)	Data Time 0.001 (0.038)	Loss 3.3404 (3.4512)	Entropy 1.11569 (1.12177)	Top-1 acc 44.141 (42.042)	Top-5 acc 68.359 (66.185)	lr 0.02376
Train [18][590/3239]	Time 0.677 (0.922)	Data Time 0.002 (0.038)	Loss 3.3922 (3.4508)	Entropy 1.11553 (1.12166)	Top-1 acc 44.922 (42.061)	Top-5 acc 69.141 (66.189)	lr 0.02376
Train [18][600/3239]	Time 0.585 (0.921)	Data Time 0.001 (0.037)	Loss 3.6149 (3.4512)	Entropy 1.11563 (1.12156)	Top-1 acc 40.234 (42.072)	Top-5 acc 61.328 (66.177)	lr 0.02376
Train [18][610/3239]	Time 0.543 (0.919)	Data Time 0.001 (0.037)	Loss 3.5906 (3.4519)	Entropy 1.11565 (1.12146)	Top-1 acc 41.797 (42.076)	Top-5 acc 63.672 (66.144)	lr 0.02376
Train [18][620/3239]	Time 0.604 (0.918)	Data Time 0.001 (0.036)	Loss 3.5252 (3.4510)	Entropy 1.11576 (1.12137)	Top-1 acc 44.922 (42.100)	Top-5 acc 64.453 (66.156)	lr 0.02376
Train [18][630/3239]	Time 0.578 (0.917)	Data Time 0.001 (0.036)	Loss 3.5087 (3.4495)	Entropy 1.11560 (1.12128)	Top-1 acc 39.844 (42.123)	Top-5 acc 65.625 (66.182)	lr 0.02375
Train [18][640/3239]	Time 0.662 (0.916)	Data Time 0.001 (0.035)	Loss 3.5501 (3.4505)	Entropy 1.11522 (1.12119)	Top-1 acc 39.453 (42.106)	Top-5 acc 63.672 (66.155)	lr 0.02375
Train [18][650/3239]	Time 0.608 (0.916)	Data Time 0.002 (0.035)	Loss 3.5164 (3.4511)	Entropy 1.11505 (1.12110)	Top-1 acc 39.062 (42.090)	Top-5 acc 64.844 (66.140)	lr 0.02375
Train [18][660/3239]	Time 0.612 (0.915)	Data Time 0.001 (0.034)	Loss 3.4617 (3.4516)	Entropy 1.11492 (1.12100)	Top-1 acc 37.891 (42.074)	Top-5 acc 63.672 (66.116)	lr 0.02375
Train [18][670/3239]	Time 0.585 (0.914)	Data Time 0.001 (0.034)	Loss 3.3534 (3.4522)	Entropy 1.11444 (1.12091)	Top-1 acc 45.703 (42.066)	Top-5 acc 68.750 (66.105)	lr 0.02375
Train [18][680/3239]	Time 0.557 (0.913)	Data Time 0.001 (0.033)	Loss 3.3129 (3.4525)	Entropy 1.11429 (1.12082)	Top-1 acc 43.750 (42.053)	Top-5 acc 68.750 (66.094)	lr 0.02375
Train [18][690/3239]	Time 0.569 (0.912)	Data Time 0.001 (0.033)	Loss 3.4811 (3.4521)	Entropy 1.11395 (1.12072)	Top-1 acc 43.359 (42.076)	Top-5 acc 60.938 (66.103)	lr 0.02375
Train [18][700/3239]	Time 0.645 (0.911)	Data Time 0.001 (0.032)	Loss 3.6297 (3.4515)	Entropy 1.11411 (1.12062)	Top-1 acc 41.406 (42.103)	Top-5 acc 63.672 (66.119)	lr 0.02375
Train [18][710/3239]	Time 0.668 (0.911)	Data Time 0.001 (0.032)	Loss 3.3558 (3.4506)	Entropy 1.11399 (1.12053)	Top-1 acc 41.797 (42.116)	Top-5 acc 68.359 (66.141)	lr 0.02375
Train [18][720/3239]	Time 0.601 (0.910)	Data Time 0.001 (0.031)	Loss 3.2246 (3.4512)	Entropy 1.11415 (1.12044)	Top-1 acc 48.828 (42.112)	Top-5 acc 69.922 (66.135)	lr 0.02375
Train [18][730/3239]	Time 0.590 (0.909)	Data Time 0.001 (0.031)	Loss 3.4190 (3.4515)	Entropy 1.11380 (1.12036)	Top-1 acc 44.141 (42.108)	Top-5 acc 66.016 (66.135)	lr 0.02375
Train [18][740/3239]	Time 0.604 (0.908)	Data Time 0.001 (0.031)	Loss 3.4213 (3.4514)	Entropy 1.11364 (1.12027)	Top-1 acc 40.625 (42.111)	Top-5 acc 67.578 (66.136)	lr 0.02375
Train [18][750/3239]	Time 0.604 (0.908)	Data Time 0.001 (0.030)	Loss 3.4523 (3.4513)	Entropy 1.11281 (1.12018)	Top-1 acc 41.406 (42.109)	Top-5 acc 66.016 (66.136)	lr 0.02375
Train [18][760/3239]	Time 0.589 (0.907)	Data Time 0.001 (0.030)	Loss 3.5652 (3.4514)	Entropy 1.11257 (1.12008)	Top-1 acc 38.672 (42.103)	Top-5 acc 62.891 (66.135)	lr 0.02375
Train [18][770/3239]	Time 0.628 (0.906)	Data Time 0.001 (0.030)	Loss 3.6343 (3.4516)	Entropy 1.11246 (1.11998)	Top-1 acc 35.156 (42.088)	Top-5 acc 65.234 (66.141)	lr 0.02375
Train [18][780/3239]	Time 0.620 (0.905)	Data Time 0.001 (0.029)	Loss 3.3374 (3.4521)	Entropy 1.11255 (1.11988)	Top-1 acc 46.484 (42.074)	Top-5 acc 65.234 (66.124)	lr 0.02375
Train [18][790/3239]	Time 0.581 (0.904)	Data Time 0.001 (0.029)	Loss 3.5670 (3.4532)	Entropy 1.11275 (1.11979)	Top-1 acc 40.625 (42.059)	Top-5 acc 63.281 (66.097)	lr 0.02375
Train [18][800/3239]	Time 0.647 (0.903)	Data Time 0.001 (0.029)	Loss 3.5850 (3.4540)	Entropy 1.11266 (1.11970)	Top-1 acc 39.453 (42.032)	Top-5 acc 62.500 (66.073)	lr 0.02375
Train [18][810/3239]	Time 0.564 (0.902)	Data Time 0.001 (0.028)	Loss 3.5679 (3.4546)	Entropy 1.11252 (1.11962)	Top-1 acc 42.188 (42.022)	Top-5 acc 60.547 (66.050)	lr 0.02375
Train [18][820/3239]	Time 0.609 (0.902)	Data Time 0.001 (0.028)	Loss 3.3369 (3.4553)	Entropy 1.11252 (1.11953)	Top-1 acc 44.922 (42.005)	Top-5 acc 66.406 (66.040)	lr 0.02375
Train [18][830/3239]	Time 0.597 (0.901)	Data Time 0.001 (0.028)	Loss 3.5064 (3.4549)	Entropy 1.11275 (1.11945)	Top-1 acc 38.672 (42.025)	Top-5 acc 66.016 (66.046)	lr 0.02375
Train [18][840/3239]	Time 0.620 (0.900)	Data Time 0.001 (0.027)	Loss 3.3788 (3.4548)	Entropy 1.11275 (1.11937)	Top-1 acc 42.578 (42.017)	Top-5 acc 69.141 (66.059)	lr 0.02375
Train [18][850/3239]	Time 0.601 (0.900)	Data Time 0.001 (0.027)	Loss 3.4758 (3.4551)	Entropy 1.11309 (1.11929)	Top-1 acc 44.531 (42.016)	Top-5 acc 66.016 (66.051)	lr 0.02375
Train [18][860/3239]	Time 0.627 (0.900)	Data Time 0.001 (0.027)	Loss 3.4539 (3.4556)	Entropy 1.11271 (1.11922)	Top-1 acc 46.484 (42.013)	Top-5 acc 69.141 (66.036)	lr 0.02374
Train [18][870/3239]	Time 0.694 (0.899)	Data Time 0.002 (0.026)	Loss 3.3078 (3.4554)	Entropy 1.11283 (1.11914)	Top-1 acc 46.094 (42.022)	Top-5 acc 66.406 (66.037)	lr 0.02374
Train [18][880/3239]	Time 0.642 (0.899)	Data Time 0.001 (0.026)	Loss 3.4149 (3.4562)	Entropy 1.11312 (1.11907)	Top-1 acc 40.625 (42.003)	Top-5 acc 68.359 (66.032)	lr 0.02374
Train [18][890/3239]	Time 0.621 (0.898)	Data Time 0.001 (0.026)	Loss 3.5592 (3.4561)	Entropy 1.11273 (1.11900)	Top-1 acc 40.234 (42.012)	Top-5 acc 63.672 (66.023)	lr 0.02374
Train [18][900/3239]	Time 0.604 (0.898)	Data Time 0.001 (0.026)	Loss 3.2519 (3.4554)	Entropy 1.11238 (1.11893)	Top-1 acc 46.875 (42.031)	Top-5 acc 70.312 (66.042)	lr 0.02374
Train [18][910/3239]	Time 0.588 (0.898)	Data Time 0.001 (0.025)	Loss 3.7331 (3.4562)	Entropy 1.11181 (1.11886)	Top-1 acc 36.719 (42.017)	Top-5 acc 58.203 (66.022)	lr 0.02374
Train [18][920/3239]	Time 0.617 (0.897)	Data Time 0.001 (0.025)	Loss 3.3721 (3.4561)	Entropy 1.11152 (1.11878)	Top-1 acc 44.531 (42.020)	Top-5 acc 67.188 (66.029)	lr 0.02374
Train [18][930/3239]	Time 0.605 (0.897)	Data Time 0.001 (0.025)	Loss 3.5079 (3.4564)	Entropy 1.11143 (1.11870)	Top-1 acc 41.797 (42.013)	Top-5 acc 64.453 (66.016)	lr 0.02374
Train [18][940/3239]	Time 0.696 (0.896)	Data Time 0.001 (0.025)	Loss 3.5062 (3.4564)	Entropy 1.11160 (1.11863)	Top-1 acc 37.109 (42.014)	Top-5 acc 66.016 (66.020)	lr 0.02374
Train [18][950/3239]	Time 0.591 (0.896)	Data Time 0.001 (0.024)	Loss 3.4710 (3.4565)	Entropy 1.11115 (1.11855)	Top-1 acc 41.797 (42.018)	Top-5 acc 65.625 (66.028)	lr 0.02374
Train [18][960/3239]	Time 0.655 (0.895)	Data Time 0.001 (0.024)	Loss 3.3888 (3.4563)	Entropy 1.11096 (1.11848)	Top-1 acc 42.969 (42.028)	Top-5 acc 67.578 (66.031)	lr 0.02374
Train [18][970/3239]	Time 0.555 (0.894)	Data Time 0.001 (0.024)	Loss 3.5252 (3.4570)	Entropy 1.11138 (1.11840)	Top-1 acc 40.625 (42.023)	Top-5 acc 62.109 (66.008)	lr 0.02374
Train [18][980/3239]	Time 0.626 (0.894)	Data Time 0.002 (0.024)	Loss 3.5426 (3.4571)	Entropy 1.11121 (1.11833)	Top-1 acc 37.109 (42.025)	Top-5 acc 64.062 (66.008)	lr 0.02374
Train [18][990/3239]	Time 0.583 (0.893)	Data Time 0.001 (0.023)	Loss 3.6360 (3.4571)	Entropy 1.11087 (1.11825)	Top-1 acc 35.547 (42.025)	Top-5 acc 62.891 (66.008)	lr 0.02374
Train [18][1000/3239]	Time 0.594 (0.893)	Data Time 0.001 (0.023)	Loss 3.2364 (3.4569)	Entropy 1.11094 (1.11818)	Top-1 acc 44.141 (42.023)	Top-5 acc 72.656 (66.019)	lr 0.02374
Train [18][1010/3239]	Time 0.593 (0.893)	Data Time 0.001 (0.023)	Loss 3.5216 (3.4572)	Entropy 1.11101 (1.11811)	Top-1 acc 41.016 (42.007)	Top-5 acc 67.578 (66.016)	lr 0.02374
Train [18][1020/3239]	Time 0.587 (0.892)	Data Time 0.001 (0.023)	Loss 3.5298 (3.4577)	Entropy 1.11056 (1.11804)	Top-1 acc 40.625 (42.002)	Top-5 acc 64.062 (66.001)	lr 0.02374
Train [18][1030/3239]	Time 0.703 (0.892)	Data Time 0.001 (0.023)	Loss 3.3736 (3.4580)	Entropy 1.11055 (1.11797)	Top-1 acc 43.359 (41.986)	Top-5 acc 65.234 (65.999)	lr 0.02374
Train [18][1040/3239]	Time 0.582 (0.892)	Data Time 0.001 (0.022)	Loss 3.5205 (3.4574)	Entropy 1.11025 (1.11789)	Top-1 acc 39.453 (42.000)	Top-5 acc 64.062 (65.999)	lr 0.02374
Train [18][1050/3239]	Time 0.620 (0.891)	Data Time 0.001 (0.022)	Loss 3.3225 (3.4568)	Entropy 1.11021 (1.11782)	Top-1 acc 46.094 (42.013)	Top-5 acc 68.359 (66.013)	lr 0.02374
Train [18][1060/3239]	Time 0.621 (0.891)	Data Time 0.001 (0.022)	Loss 3.5082 (3.4565)	Entropy 1.10968 (1.11775)	Top-1 acc 44.531 (42.015)	Top-5 acc 61.328 (66.013)	lr 0.02374
Train [18][1070/3239]	Time 0.569 (0.891)	Data Time 0.001 (0.022)	Loss 3.3080 (3.4561)	Entropy 1.10974 (1.11767)	Top-1 acc 43.359 (42.019)	Top-5 acc 69.531 (66.026)	lr 0.02374
Train [18][1080/3239]	Time 0.612 (0.890)	Data Time 0.001 (0.022)	Loss 3.4389 (3.4566)	Entropy 1.10969 (1.11760)	Top-1 acc 42.578 (42.007)	Top-5 acc 69.922 (66.015)	lr 0.02373
Train [18][1090/3239]	Time 0.540 (0.890)	Data Time 0.001 (0.021)	Loss 3.3728 (3.4560)	Entropy 1.10948 (1.11752)	Top-1 acc 44.922 (42.024)	Top-5 acc 69.141 (66.029)	lr 0.02373
Train [18][1100/3239]	Time 0.681 (0.889)	Data Time 0.001 (0.021)	Loss 3.4194 (3.4561)	Entropy 1.10910 (1.11745)	Top-1 acc 41.016 (42.024)	Top-5 acc 65.234 (66.018)	lr 0.02373
Train [18][1110/3239]	Time 0.573 (0.889)	Data Time 0.001 (0.021)	Loss 3.4625 (3.4556)	Entropy 1.10906 (1.11738)	Top-1 acc 42.188 (42.038)	Top-5 acc 64.062 (66.030)	lr 0.02373
Train [18][1120/3239]	Time 0.580 (0.888)	Data Time 0.001 (0.021)	Loss 3.3061 (3.4557)	Entropy 1.10874 (1.11730)	Top-1 acc 46.094 (42.041)	Top-5 acc 68.359 (66.027)	lr 0.02373
Train [18][1130/3239]	Time 0.575 (0.888)	Data Time 0.001 (0.021)	Loss 3.3858 (3.4553)	Entropy 1.10887 (1.11723)	Top-1 acc 46.484 (42.042)	Top-5 acc 66.016 (66.026)	lr 0.02373
Train [18][1140/3239]	Time 0.576 (0.887)	Data Time 0.001 (0.021)	Loss 3.4638 (3.4554)	Entropy 1.10817 (1.11715)	Top-1 acc 43.750 (42.036)	Top-5 acc 63.672 (66.022)	lr 0.02373
Train [18][1150/3239]	Time 0.560 (0.887)	Data Time 0.002 (0.020)	Loss 3.4743 (3.4553)	Entropy 1.10817 (1.11707)	Top-1 acc 43.750 (42.039)	Top-5 acc 66.797 (66.023)	lr 0.02373
Train [18][1160/3239]	Time 0.656 (0.887)	Data Time 0.001 (0.020)	Loss 3.5776 (3.4557)	Entropy 1.10839 (1.11700)	Top-1 acc 42.188 (42.039)	Top-5 acc 66.016 (66.017)	lr 0.02373
Train [18][1170/3239]	Time 0.652 (0.887)	Data Time 0.001 (0.020)	Loss 3.4011 (3.4561)	Entropy 1.10803 (1.11692)	Top-1 acc 43.359 (42.026)	Top-5 acc 67.969 (66.014)	lr 0.02373
Train [18][1180/3239]	Time 0.595 (0.887)	Data Time 0.001 (0.020)	Loss 3.3910 (3.4557)	Entropy 1.10786 (1.11685)	Top-1 acc 44.141 (42.039)	Top-5 acc 64.844 (66.016)	lr 0.02373
Train [18][1190/3239]	Time 0.708 (0.886)	Data Time 0.001 (0.020)	Loss 3.5735 (3.4559)	Entropy 1.10765 (1.11677)	Top-1 acc 41.016 (42.036)	Top-5 acc 62.891 (66.019)	lr 0.02373
Train [18][1200/3239]	Time 0.611 (0.886)	Data Time 0.001 (0.020)	Loss 3.6266 (3.4560)	Entropy 1.10785 (1.11670)	Top-1 acc 38.281 (42.037)	Top-5 acc 62.109 (66.011)	lr 0.02373
Train [18][1210/3239]	Time 0.648 (0.886)	Data Time 0.001 (0.020)	Loss 3.4246 (3.4553)	Entropy 1.10751 (1.11662)	Top-1 acc 44.531 (42.051)	Top-5 acc 67.578 (66.028)	lr 0.02373
Train [18][1220/3239]	Time 0.709 (0.903)	Data Time 0.004 (0.019)	Loss 3.3472 (3.4551)	Entropy 1.10758 (1.11655)	Top-1 acc 45.312 (42.057)	Top-5 acc 69.922 (66.036)	lr 0.02373
Train [18][1230/3239]	Time 0.589 (0.903)	Data Time 0.002 (0.019)	Loss 3.3454 (3.4553)	Entropy 1.10755 (1.11648)	Top-1 acc 44.141 (42.047)	Top-5 acc 68.750 (66.032)	lr 0.02373
Train [18][1240/3239]	Time 0.519 (0.902)	Data Time 0.001 (0.019)	Loss 3.4975 (3.4549)	Entropy 1.10736 (1.11640)	Top-1 acc 43.359 (42.056)	Top-5 acc 64.062 (66.028)	lr 0.02373
Train [18][1250/3239]	Time 0.620 (0.902)	Data Time 0.001 (0.019)	Loss 3.3078 (3.4547)	Entropy 1.10784 (1.11633)	Top-1 acc 41.797 (42.062)	Top-5 acc 68.750 (66.034)	lr 0.02373
Train [18][1260/3239]	Time 0.688 (0.902)	Data Time 0.001 (0.019)	Loss 3.2806 (3.4545)	Entropy 1.10763 (1.11627)	Top-1 acc 48.047 (42.067)	Top-5 acc 69.922 (66.033)	lr 0.02373
Train [18][1270/3239]	Time 0.602 (0.901)	Data Time 0.001 (0.019)	Loss 3.5766 (3.4547)	Entropy 1.10765 (1.11620)	Top-1 acc 40.625 (42.065)	Top-5 acc 64.062 (66.027)	lr 0.02373
Train [18][1280/3239]	Time 0.649 (0.901)	Data Time 0.001 (0.019)	Loss 3.3757 (3.4546)	Entropy 1.10752 (1.11613)	Top-1 acc 45.703 (42.069)	Top-5 acc 65.625 (66.031)	lr 0.02373
Train [18][1290/3239]	Time 0.631 (0.900)	Data Time 0.001 (0.018)	Loss 3.5383 (3.4549)	Entropy 1.10732 (1.11606)	Top-1 acc 40.625 (42.075)	Top-5 acc 66.016 (66.025)	lr 0.02373
Train [18][1300/3239]	Time 0.585 (0.900)	Data Time 0.001 (0.018)	Loss 3.4093 (3.4545)	Entropy 1.10750 (1.11600)	Top-1 acc 44.531 (42.097)	Top-5 acc 67.188 (66.035)	lr 0.02373
Train [18][1310/3239]	Time 0.596 (0.900)	Data Time 0.001 (0.018)	Loss 3.4199 (3.4544)	Entropy 1.10717 (1.11593)	Top-1 acc 44.141 (42.099)	Top-5 acc 65.625 (66.033)	lr 0.02372
Train [18][1320/3239]	Time 0.585 (0.899)	Data Time 0.001 (0.018)	Loss 3.5487 (3.4542)	Entropy 1.10715 (1.11586)	Top-1 acc 40.625 (42.107)	Top-5 acc 65.234 (66.040)	lr 0.02372
Train [18][1330/3239]	Time 0.575 (0.899)	Data Time 0.001 (0.018)	Loss 3.6256 (3.4546)	Entropy 1.10730 (1.11580)	Top-1 acc 37.500 (42.102)	Top-5 acc 63.281 (66.036)	lr 0.02372
Train [18][1340/3239]	Time 0.618 (0.899)	Data Time 0.001 (0.018)	Loss 3.3835 (3.4548)	Entropy 1.10735 (1.11573)	Top-1 acc 43.750 (42.101)	Top-5 acc 68.359 (66.030)	lr 0.02372
Train [18][1350/3239]	Time 0.688 (0.898)	Data Time 0.002 (0.018)	Loss 3.3450 (3.4544)	Entropy 1.10729 (1.11567)	Top-1 acc 45.703 (42.108)	Top-5 acc 66.406 (66.041)	lr 0.02372
Train [18][1360/3239]	Time 0.591 (0.898)	Data Time 0.001 (0.018)	Loss 3.0640 (3.4538)	Entropy 1.10690 (1.11561)	Top-1 acc 53.516 (42.134)	Top-5 acc 69.922 (66.050)	lr 0.02372
Train [18][1370/3239]	Time 0.602 (0.898)	Data Time 0.001 (0.018)	Loss 3.3919 (3.4540)	Entropy 1.10672 (1.11555)	Top-1 acc 41.797 (42.127)	Top-5 acc 67.188 (66.043)	lr 0.02372
Train [18][1380/3239]	Time 0.603 (0.897)	Data Time 0.001 (0.017)	Loss 3.3424 (3.4540)	Entropy 1.10629 (1.11548)	Top-1 acc 44.922 (42.122)	Top-5 acc 67.578 (66.043)	lr 0.02372
Train [18][1390/3239]	Time 0.647 (0.897)	Data Time 0.001 (0.017)	Loss 3.5440 (3.4541)	Entropy 1.10617 (1.11541)	Top-1 acc 36.719 (42.121)	Top-5 acc 62.891 (66.044)	lr 0.02372
Train [18][1400/3239]	Time 0.581 (0.897)	Data Time 0.001 (0.017)	Loss 3.4075 (3.4540)	Entropy 1.10617 (1.11535)	Top-1 acc 42.578 (42.118)	Top-5 acc 68.750 (66.050)	lr 0.02372
Train [18][1410/3239]	Time 0.599 (0.896)	Data Time 0.001 (0.017)	Loss 3.5808 (3.4541)	Entropy 1.10611 (1.11528)	Top-1 acc 38.672 (42.113)	Top-5 acc 63.672 (66.049)	lr 0.02372
Train [18][1420/3239]	Time 0.720 (0.896)	Data Time 0.001 (0.017)	Loss 3.4724 (3.4534)	Entropy 1.10565 (1.11522)	Top-1 acc 38.281 (42.130)	Top-5 acc 62.109 (66.062)	lr 0.02372
Train [18][1430/3239]	Time 0.586 (0.896)	Data Time 0.001 (0.017)	Loss 3.6132 (3.4540)	Entropy 1.10552 (1.11515)	Top-1 acc 40.625 (42.116)	Top-5 acc 60.547 (66.047)	lr 0.02372
Train [18][1440/3239]	Time 0.468 (0.895)	Data Time 0.001 (0.017)	Loss 3.1574 (3.4535)	Entropy 1.10545 (1.11508)	Top-1 acc 49.609 (42.123)	Top-5 acc 73.438 (66.057)	lr 0.02372
Train [18][1450/3239]	Time 0.674 (0.895)	Data Time 0.002 (0.017)	Loss 3.3151 (3.4537)	Entropy 1.10542 (1.11502)	Top-1 acc 43.359 (42.116)	Top-5 acc 72.266 (66.057)	lr 0.02372
Train [18][1460/3239]	Time 0.577 (0.895)	Data Time 0.001 (0.017)	Loss 3.5995 (3.4539)	Entropy 1.10582 (1.11495)	Top-1 acc 39.062 (42.107)	Top-5 acc 60.156 (66.050)	lr 0.02372
Train [18][1470/3239]	Time 0.575 (0.894)	Data Time 0.001 (0.016)	Loss 3.5164 (3.4539)	Entropy 1.10529 (1.11489)	Top-1 acc 41.797 (42.105)	Top-5 acc 64.844 (66.049)	lr 0.02372
Train [18][1480/3239]	Time 0.598 (0.894)	Data Time 0.001 (0.016)	Loss 3.4265 (3.4537)	Entropy 1.10539 (1.11482)	Top-1 acc 42.188 (42.111)	Top-5 acc 66.406 (66.057)	lr 0.02372
Train [18][1490/3239]	Time 0.715 (0.894)	Data Time 0.001 (0.016)	Loss 3.6129 (3.4535)	Entropy 1.10477 (1.11476)	Top-1 acc 41.797 (42.119)	Top-5 acc 64.453 (66.058)	lr 0.02372
Train [18][1500/3239]	Time 0.568 (0.893)	Data Time 0.002 (0.016)	Loss 3.6342 (3.4536)	Entropy 1.10480 (1.11469)	Top-1 acc 35.547 (42.111)	Top-5 acc 63.281 (66.055)	lr 0.02372
Train [18][1510/3239]	Time 0.597 (0.893)	Data Time 0.001 (0.016)	Loss 3.2488 (3.4538)	Entropy 1.10478 (1.11463)	Top-1 acc 46.094 (42.109)	Top-5 acc 70.703 (66.051)	lr 0.02372
Train [18][1520/3239]	Time 0.589 (0.893)	Data Time 0.002 (0.016)	Loss 3.6742 (3.4537)	Entropy 1.10453 (1.11456)	Top-1 acc 35.547 (42.101)	Top-5 acc 61.328 (66.046)	lr 0.02372
Train [18][1530/3239]	Time 0.584 (0.893)	Data Time 0.001 (0.016)	Loss 3.4761 (3.4537)	Entropy 1.10438 (1.11450)	Top-1 acc 42.969 (42.103)	Top-5 acc 67.188 (66.051)	lr 0.02371
Train [18][1540/3239]	Time 0.592 (0.892)	Data Time 0.001 (0.016)	Loss 3.3788 (3.4536)	Entropy 1.10456 (1.11443)	Top-1 acc 45.312 (42.103)	Top-5 acc 68.359 (66.052)	lr 0.02371
Train [18][1550/3239]	Time 0.576 (0.892)	Data Time 0.001 (0.016)	Loss 3.4862 (3.4538)	Entropy 1.10430 (1.11437)	Top-1 acc 40.625 (42.106)	Top-5 acc 64.844 (66.041)	lr 0.02371
Train [18][1560/3239]	Time 0.568 (0.892)	Data Time 0.001 (0.016)	Loss 3.6672 (3.4535)	Entropy 1.10404 (1.11430)	Top-1 acc 39.844 (42.113)	Top-5 acc 60.547 (66.046)	lr 0.02371
Train [18][1570/3239]	Time 0.593 (0.892)	Data Time 0.001 (0.016)	Loss 3.5431 (3.4532)	Entropy 1.10401 (1.11424)	Top-1 acc 42.578 (42.116)	Top-5 acc 63.281 (66.049)	lr 0.02371
Train [18][1580/3239]	Time 0.661 (0.891)	Data Time 0.001 (0.015)	Loss 3.5258 (3.4529)	Entropy 1.10407 (1.11417)	Top-1 acc 41.016 (42.115)	Top-5 acc 65.625 (66.058)	lr 0.02371
Train [18][1590/3239]	Time 0.573 (0.891)	Data Time 0.001 (0.015)	Loss 3.4420 (3.4529)	Entropy 1.10371 (1.11411)	Top-1 acc 43.750 (42.118)	Top-5 acc 69.531 (66.065)	lr 0.02371
Train [18][1600/3239]	Time 0.547 (0.891)	Data Time 0.001 (0.015)	Loss 3.4179 (3.4528)	Entropy 1.10400 (1.11404)	Top-1 acc 44.531 (42.125)	Top-5 acc 65.625 (66.067)	lr 0.02371
Train [18][1610/3239]	Time 0.624 (0.890)	Data Time 0.001 (0.015)	Loss 3.2831 (3.4527)	Entropy 1.10365 (1.11398)	Top-1 acc 46.875 (42.124)	Top-5 acc 66.797 (66.061)	lr 0.02371
Train [18][1620/3239]	Time 0.593 (0.890)	Data Time 0.001 (0.015)	Loss 3.5829 (3.4528)	Entropy 1.10355 (1.11392)	Top-1 acc 41.016 (42.118)	Top-5 acc 66.406 (66.066)	lr 0.02371
Train [18][1630/3239]	Time 0.623 (0.890)	Data Time 0.001 (0.015)	Loss 3.3442 (3.4527)	Entropy 1.10359 (1.11385)	Top-1 acc 48.828 (42.125)	Top-5 acc 67.969 (66.069)	lr 0.02371
Train [18][1640/3239]	Time 0.568 (0.889)	Data Time 0.001 (0.015)	Loss 3.3363 (3.4524)	Entropy 1.10380 (1.11379)	Top-1 acc 43.359 (42.133)	Top-5 acc 69.531 (66.076)	lr 0.02371
Train [18][1650/3239]	Time 0.694 (0.889)	Data Time 0.001 (0.015)	Loss 3.6249 (3.4527)	Entropy 1.10361 (1.11373)	Top-1 acc 39.844 (42.125)	Top-5 acc 62.500 (66.070)	lr 0.02371
Train [18][1660/3239]	Time 0.600 (0.889)	Data Time 0.001 (0.015)	Loss 3.2676 (3.4523)	Entropy 1.10296 (1.11367)	Top-1 acc 46.484 (42.132)	Top-5 acc 69.922 (66.079)	lr 0.02371
Train [18][1670/3239]	Time 0.616 (0.889)	Data Time 0.002 (0.015)	Loss 3.5535 (3.4522)	Entropy 1.10292 (1.11360)	Top-1 acc 38.281 (42.138)	Top-5 acc 63.281 (66.074)	lr 0.02371
Train [18][1680/3239]	Time 0.596 (0.889)	Data Time 0.001 (0.015)	Loss 3.5175 (3.4523)	Entropy 1.10334 (1.11354)	Top-1 acc 41.797 (42.138)	Top-5 acc 63.281 (66.076)	lr 0.02371
Train [18][1690/3239]	Time 0.605 (0.888)	Data Time 0.001 (0.015)	Loss 3.3908 (3.4522)	Entropy 1.10290 (1.11348)	Top-1 acc 44.141 (42.136)	Top-5 acc 70.703 (66.081)	lr 0.02371
Train [18][1700/3239]	Time 0.613 (0.888)	Data Time 0.001 (0.014)	Loss 3.5827 (3.4521)	Entropy 1.10272 (1.11342)	Top-1 acc 35.938 (42.131)	Top-5 acc 62.500 (66.079)	lr 0.02371
Train [18][1710/3239]	Time 0.599 (0.888)	Data Time 0.001 (0.014)	Loss 3.3290 (3.4520)	Entropy 1.10262 (1.11335)	Top-1 acc 44.922 (42.128)	Top-5 acc 69.922 (66.083)	lr 0.02371
Train [18][1720/3239]	Time 0.596 (0.888)	Data Time 0.001 (0.014)	Loss 3.5866 (3.4519)	Entropy 1.10280 (1.11329)	Top-1 acc 37.109 (42.129)	Top-5 acc 62.109 (66.084)	lr 0.02371
Train [18][1730/3239]	Time 0.616 (0.888)	Data Time 0.001 (0.014)	Loss 3.5016 (3.4518)	Entropy 1.10271 (1.11323)	Top-1 acc 39.062 (42.127)	Top-5 acc 66.406 (66.086)	lr 0.02371
Train [18][1740/3239]	Time 0.625 (0.887)	Data Time 0.001 (0.014)	Loss 3.4420 (3.4522)	Entropy 1.10252 (1.11317)	Top-1 acc 40.625 (42.122)	Top-5 acc 63.672 (66.080)	lr 0.02371
Train [18][1750/3239]	Time 0.584 (0.887)	Data Time 0.001 (0.014)	Loss 3.3786 (3.4519)	Entropy 1.10222 (1.11311)	Top-1 acc 41.406 (42.129)	Top-5 acc 71.094 (66.090)	lr 0.02371
Train [18][1760/3239]	Time 0.496 (0.887)	Data Time 0.001 (0.014)	Loss 3.6052 (3.4521)	Entropy 1.10218 (1.11305)	Top-1 acc 37.109 (42.119)	Top-5 acc 64.062 (66.083)	lr 0.02370
Train [18][1770/3239]	Time 0.545 (0.887)	Data Time 0.001 (0.014)	Loss 3.4571 (3.4521)	Entropy 1.10198 (1.11299)	Top-1 acc 43.750 (42.116)	Top-5 acc 62.891 (66.082)	lr 0.02370
Train [18][1780/3239]	Time 0.583 (0.886)	Data Time 0.001 (0.014)	Loss 3.4491 (3.4518)	Entropy 1.10214 (1.11292)	Top-1 acc 40.625 (42.125)	Top-5 acc 67.969 (66.092)	lr 0.02370
Train [18][1790/3239]	Time 0.614 (0.886)	Data Time 0.001 (0.014)	Loss 3.5468 (3.4518)	Entropy 1.10202 (1.11286)	Top-1 acc 40.234 (42.123)	Top-5 acc 62.109 (66.093)	lr 0.02370
Train [18][1800/3239]	Time 0.599 (0.886)	Data Time 0.001 (0.014)	Loss 3.4171 (3.4515)	Entropy 1.10162 (1.11280)	Top-1 acc 40.625 (42.127)	Top-5 acc 67.188 (66.103)	lr 0.02370
Train [18][1810/3239]	Time 0.696 (0.886)	Data Time 0.001 (0.014)	Loss 3.4938 (3.4517)	Entropy 1.10136 (1.11274)	Top-1 acc 39.062 (42.125)	Top-5 acc 66.406 (66.100)	lr 0.02370
Train [18][1820/3239]	Time 0.612 (0.885)	Data Time 0.001 (0.014)	Loss 3.2934 (3.4517)	Entropy 1.10123 (1.11268)	Top-1 acc 45.703 (42.125)	Top-5 acc 69.141 (66.101)	lr 0.02370
Train [18][1830/3239]	Time 0.622 (0.885)	Data Time 0.001 (0.014)	Loss 3.4237 (3.4517)	Entropy 1.10135 (1.11261)	Top-1 acc 42.969 (42.124)	Top-5 acc 67.188 (66.105)	lr 0.02370
Train [18][1840/3239]	Time 0.591 (0.885)	Data Time 0.001 (0.014)	Loss 3.2370 (3.4517)	Entropy 1.10127 (1.11255)	Top-1 acc 44.141 (42.122)	Top-5 acc 69.141 (66.101)	lr 0.02370
Train [18][1850/3239]	Time 0.576 (0.885)	Data Time 0.001 (0.013)	Loss 3.3329 (3.4514)	Entropy 1.10095 (1.11249)	Top-1 acc 41.016 (42.127)	Top-5 acc 66.406 (66.109)	lr 0.02370
Train [18][1860/3239]	Time 0.601 (0.885)	Data Time 0.001 (0.013)	Loss 3.6351 (3.4510)	Entropy 1.10089 (1.11243)	Top-1 acc 39.062 (42.134)	Top-5 acc 63.672 (66.123)	lr 0.02370
Train [18][1870/3239]	Time 0.634 (0.885)	Data Time 0.002 (0.013)	Loss 3.4272 (3.4507)	Entropy 1.10073 (1.11237)	Top-1 acc 42.578 (42.143)	Top-5 acc 65.625 (66.129)	lr 0.02370
Train [18][1880/3239]	Time 0.708 (0.895)	Data Time 0.002 (0.013)	Loss 3.2730 (3.4506)	Entropy 1.10049 (1.11231)	Top-1 acc 45.312 (42.145)	Top-5 acc 69.141 (66.134)	lr 0.02370
Train [18][1890/3239]	Time 0.622 (0.895)	Data Time 0.001 (0.013)	Loss 3.2030 (3.4504)	Entropy 1.10030 (1.11224)	Top-1 acc 47.266 (42.151)	Top-5 acc 71.484 (66.143)	lr 0.02370
Train [18][1900/3239]	Time 0.622 (0.895)	Data Time 0.002 (0.013)	Loss 3.5529 (3.4501)	Entropy 1.09987 (1.11218)	Top-1 acc 40.234 (42.153)	Top-5 acc 65.625 (66.149)	lr 0.02370
Train [18][1910/3239]	Time 0.553 (0.894)	Data Time 0.001 (0.013)	Loss 3.4337 (3.4503)	Entropy 1.10002 (1.11212)	Top-1 acc 44.531 (42.154)	Top-5 acc 64.844 (66.142)	lr 0.02370
Train [18][1920/3239]	Time 0.503 (0.894)	Data Time 0.002 (0.013)	Loss 3.4828 (3.4505)	Entropy 1.10000 (1.11205)	Top-1 acc 41.797 (42.150)	Top-5 acc 65.234 (66.134)	lr 0.02370
Train [18][1930/3239]	Time 0.570 (0.894)	Data Time 0.001 (0.013)	Loss 3.4847 (3.4505)	Entropy 1.09977 (1.11199)	Top-1 acc 42.188 (42.153)	Top-5 acc 64.062 (66.136)	lr 0.02370
Train [18][1940/3239]	Time 0.607 (0.894)	Data Time 0.001 (0.013)	Loss 3.2423 (3.4505)	Entropy 1.09997 (1.11193)	Top-1 acc 46.094 (42.154)	Top-5 acc 70.312 (66.133)	lr 0.02370
Train [18][1950/3239]	Time 0.573 (0.893)	Data Time 0.001 (0.013)	Loss 3.3816 (3.4506)	Entropy 1.09974 (1.11186)	Top-1 acc 42.578 (42.157)	Top-5 acc 66.797 (66.131)	lr 0.02370
Train [18][1960/3239]	Time 0.640 (0.893)	Data Time 0.001 (0.013)	Loss 3.3021 (3.4502)	Entropy 1.09928 (1.11180)	Top-1 acc 44.531 (42.160)	Top-5 acc 69.922 (66.139)	lr 0.02370
Train [18][1970/3239]	Time 0.677 (0.893)	Data Time 0.001 (0.013)	Loss 3.7706 (3.4504)	Entropy 1.09916 (1.11174)	Top-1 acc 37.500 (42.158)	Top-5 acc 59.766 (66.136)	lr 0.02370
Train [18][1980/3239]	Time 0.584 (0.893)	Data Time 0.001 (0.013)	Loss 3.6152 (3.4504)	Entropy 1.09897 (1.11167)	Top-1 acc 42.188 (42.153)	Top-5 acc 64.062 (66.140)	lr 0.02369
Train [18][1990/3239]	Time 0.579 (0.893)	Data Time 0.001 (0.013)	Loss 3.4255 (3.4504)	Entropy 1.09871 (1.11161)	Top-1 acc 38.281 (42.148)	Top-5 acc 67.578 (66.142)	lr 0.02369
Train [18][2000/3239]	Time 0.598 (0.892)	Data Time 0.001 (0.013)	Loss 3.2888 (3.4505)	Entropy 1.09836 (1.11155)	Top-1 acc 43.750 (42.142)	Top-5 acc 67.188 (66.141)	lr 0.02369
Train [18][2010/3239]	Time 0.570 (0.892)	Data Time 0.001 (0.013)	Loss 3.4381 (3.4506)	Entropy 1.09785 (1.11148)	Top-1 acc 44.922 (42.148)	Top-5 acc 66.406 (66.139)	lr 0.02369
Train [18][2020/3239]	Time 0.565 (0.892)	Data Time 0.001 (0.013)	Loss 3.5040 (3.4506)	Entropy 1.09795 (1.11141)	Top-1 acc 39.062 (42.146)	Top-5 acc 64.844 (66.135)	lr 0.02369
Train [18][2030/3239]	Time 0.627 (0.892)	Data Time 0.001 (0.012)	Loss 3.3599 (3.4504)	Entropy 1.09792 (1.11135)	Top-1 acc 43.750 (42.149)	Top-5 acc 67.578 (66.140)	lr 0.02369
Train [18][2040/3239]	Time 0.711 (0.892)	Data Time 0.001 (0.012)	Loss 3.6890 (3.4504)	Entropy 1.09728 (1.11128)	Top-1 acc 35.156 (42.145)	Top-5 acc 58.984 (66.138)	lr 0.02369
Train [18][2050/3239]	Time 0.604 (0.891)	Data Time 0.001 (0.012)	Loss 3.3827 (3.4504)	Entropy 1.09694 (1.11121)	Top-1 acc 43.750 (42.143)	Top-5 acc 66.016 (66.138)	lr 0.02369
Train [18][2060/3239]	Time 0.596 (0.891)	Data Time 0.001 (0.012)	Loss 3.3426 (3.4502)	Entropy 1.09694 (1.11114)	Top-1 acc 44.141 (42.140)	Top-5 acc 68.359 (66.144)	lr 0.02369
Train [18][2070/3239]	Time 0.576 (0.891)	Data Time 0.001 (0.012)	Loss 3.2544 (3.4503)	Entropy 1.09710 (1.11107)	Top-1 acc 44.531 (42.134)	Top-5 acc 71.875 (66.140)	lr 0.02369
Train [18][2080/3239]	Time 0.585 (0.891)	Data Time 0.001 (0.012)	Loss 3.5157 (3.4506)	Entropy 1.09727 (1.11101)	Top-1 acc 37.891 (42.126)	Top-5 acc 68.359 (66.140)	lr 0.02369
Train [18][2090/3239]	Time 0.580 (0.891)	Data Time 0.001 (0.012)	Loss 3.6043 (3.4506)	Entropy 1.09760 (1.11094)	Top-1 acc 38.281 (42.124)	Top-5 acc 65.625 (66.144)	lr 0.02369
Train [18][2100/3239]	Time 0.562 (0.890)	Data Time 0.001 (0.012)	Loss 3.6335 (3.4508)	Entropy 1.09766 (1.11088)	Top-1 acc 41.016 (42.117)	Top-5 acc 64.062 (66.143)	lr 0.02369
Train [18][2110/3239]	Time 0.618 (0.890)	Data Time 0.001 (0.012)	Loss 3.3613 (3.4507)	Entropy 1.09748 (1.11081)	Top-1 acc 46.094 (42.119)	Top-5 acc 67.188 (66.144)	lr 0.02369
Train [18][2120/3239]	Time 0.658 (0.890)	Data Time 0.001 (0.012)	Loss 3.2094 (3.4507)	Entropy 1.09753 (1.11075)	Top-1 acc 49.609 (42.119)	Top-5 acc 72.266 (66.143)	lr 0.02369
Train [18][2130/3239]	Time 0.614 (0.890)	Data Time 0.001 (0.012)	Loss 3.4186 (3.4508)	Entropy 1.09734 (1.11069)	Top-1 acc 42.188 (42.118)	Top-5 acc 64.062 (66.140)	lr 0.02369
Train [18][2140/3239]	Time 0.564 (0.889)	Data Time 0.001 (0.012)	Loss 3.4975 (3.4510)	Entropy 1.09748 (1.11063)	Top-1 acc 38.672 (42.111)	Top-5 acc 66.797 (66.135)	lr 0.02369
Train [18][2150/3239]	Time 0.588 (0.889)	Data Time 0.001 (0.012)	Loss 3.6392 (3.4513)	Entropy 1.09726 (1.11057)	Top-1 acc 32.031 (42.103)	Top-5 acc 62.891 (66.134)	lr 0.02369
Train [18][2160/3239]	Time 0.586 (0.889)	Data Time 0.001 (0.012)	Loss 3.5530 (3.4516)	Entropy 1.09738 (1.11050)	Top-1 acc 42.578 (42.102)	Top-5 acc 68.359 (66.132)	lr 0.02369
Train [18][2170/3239]	Time 0.580 (0.889)	Data Time 0.001 (0.012)	Loss 3.3754 (3.4516)	Entropy 1.09712 (1.11044)	Top-1 acc 42.578 (42.105)	Top-5 acc 70.703 (66.135)	lr 0.02369
Train [18][2180/3239]	Time 0.597 (0.889)	Data Time 0.001 (0.012)	Loss 3.4471 (3.4518)	Entropy 1.09696 (1.11038)	Top-1 acc 42.578 (42.097)	Top-5 acc 64.062 (66.133)	lr 0.02369
Train [18][2190/3239]	Time 0.586 (0.889)	Data Time 0.001 (0.012)	Loss 3.2166 (3.4519)	Entropy 1.09671 (1.11032)	Top-1 acc 45.312 (42.097)	Top-5 acc 72.266 (66.133)	lr 0.02369
Train [18][2200/3239]	Time 0.690 (0.889)	Data Time 0.001 (0.012)	Loss 3.5497 (3.4518)	Entropy 1.09669 (1.11026)	Top-1 acc 41.406 (42.102)	Top-5 acc 63.281 (66.132)	lr 0.02368
Train [18][2210/3239]	Time 0.565 (0.888)	Data Time 0.001 (0.012)	Loss 3.4041 (3.4516)	Entropy 1.09613 (1.11020)	Top-1 acc 41.016 (42.107)	Top-5 acc 65.625 (66.137)	lr 0.02368
Train [18][2220/3239]	Time 0.607 (0.888)	Data Time 0.002 (0.012)	Loss 3.4543 (3.4518)	Entropy 1.09577 (1.11013)	Top-1 acc 44.922 (42.110)	Top-5 acc 65.234 (66.128)	lr 0.02368
Train [18][2230/3239]	Time 0.596 (0.888)	Data Time 0.001 (0.011)	Loss 3.3735 (3.4519)	Entropy 1.09556 (1.11007)	Top-1 acc 38.281 (42.108)	Top-5 acc 68.359 (66.125)	lr 0.02368
Train [18][2240/3239]	Time 0.499 (0.888)	Data Time 0.001 (0.011)	Loss 3.2666 (3.4519)	Entropy 1.09542 (1.11000)	Top-1 acc 44.922 (42.111)	Top-5 acc 71.094 (66.121)	lr 0.02368
Train [18][2250/3239]	Time 0.578 (0.888)	Data Time 0.001 (0.011)	Loss 3.3901 (3.4516)	Entropy 1.09535 (1.10994)	Top-1 acc 41.406 (42.116)	Top-5 acc 66.016 (66.126)	lr 0.02368
Train [18][2260/3239]	Time 0.661 (0.887)	Data Time 0.001 (0.011)	Loss 3.2365 (3.4514)	Entropy 1.09499 (1.10987)	Top-1 acc 45.703 (42.120)	Top-5 acc 70.312 (66.131)	lr 0.02368
Train [18][2270/3239]	Time 0.671 (0.887)	Data Time 0.001 (0.011)	Loss 3.4892 (3.4516)	Entropy 1.09439 (1.10981)	Top-1 acc 42.188 (42.120)	Top-5 acc 63.281 (66.127)	lr 0.02368
Train [18][2280/3239]	Time 0.602 (0.887)	Data Time 0.001 (0.011)	Loss 3.5766 (3.4515)	Entropy 1.09407 (1.10974)	Top-1 acc 41.406 (42.127)	Top-5 acc 64.062 (66.133)	lr 0.02368
Train [18][2290/3239]	Time 0.559 (0.887)	Data Time 0.001 (0.011)	Loss 3.5110 (3.4515)	Entropy 1.09431 (1.10967)	Top-1 acc 44.141 (42.127)	Top-5 acc 64.453 (66.136)	lr 0.02368
Train [18][2300/3239]	Time 0.610 (0.887)	Data Time 0.001 (0.011)	Loss 3.5168 (3.4514)	Entropy 1.09365 (1.10960)	Top-1 acc 41.406 (42.130)	Top-5 acc 66.797 (66.137)	lr 0.02368
Train [18][2310/3239]	Time 0.602 (0.886)	Data Time 0.001 (0.011)	Loss 3.5010 (3.4514)	Entropy 1.09298 (1.10953)	Top-1 acc 40.234 (42.127)	Top-5 acc 62.500 (66.133)	lr 0.02368
Train [18][2320/3239]	Time 0.626 (0.886)	Data Time 0.001 (0.011)	Loss 3.3893 (3.4514)	Entropy 1.09292 (1.10946)	Top-1 acc 46.094 (42.126)	Top-5 acc 64.062 (66.135)	lr 0.02368
Train [18][2330/3239]	Time 0.596 (0.886)	Data Time 0.001 (0.011)	Loss 3.5036 (3.4514)	Entropy 1.09261 (1.10939)	Top-1 acc 40.625 (42.125)	Top-5 acc 62.500 (66.138)	lr 0.02368
Train [18][2340/3239]	Time 0.578 (0.886)	Data Time 0.001 (0.011)	Loss 3.6924 (3.4512)	Entropy 1.09244 (1.10932)	Top-1 acc 29.688 (42.129)	Top-5 acc 58.203 (66.139)	lr 0.02368
Train [18][2350/3239]	Time 0.625 (0.886)	Data Time 0.003 (0.011)	Loss 3.3848 (3.4513)	Entropy 1.09201 (1.10924)	Top-1 acc 46.094 (42.130)	Top-5 acc 67.578 (66.141)	lr 0.02368
Train [18][2360/3239]	Time 0.697 (0.886)	Data Time 0.001 (0.011)	Loss 3.5431 (3.4513)	Entropy 1.09149 (1.10917)	Top-1 acc 42.578 (42.132)	Top-5 acc 66.797 (66.143)	lr 0.02368
Train [18][2370/3239]	Time 0.597 (0.886)	Data Time 0.001 (0.011)	Loss 3.4574 (3.4512)	Entropy 1.09109 (1.10909)	Top-1 acc 39.844 (42.128)	Top-5 acc 68.359 (66.146)	lr 0.02368
Train [18][2380/3239]	Time 0.553 (0.886)	Data Time 0.001 (0.011)	Loss 3.2826 (3.4511)	Entropy 1.09068 (1.10902)	Top-1 acc 42.188 (42.131)	Top-5 acc 70.312 (66.150)	lr 0.02368
Train [18][2390/3239]	Time 0.576 (0.885)	Data Time 0.001 (0.011)	Loss 3.3740 (3.4509)	Entropy 1.09033 (1.10894)	Top-1 acc 40.625 (42.133)	Top-5 acc 69.922 (66.155)	lr 0.02368
Train [18][2400/3239]	Time 0.555 (0.885)	Data Time 0.001 (0.011)	Loss 3.3521 (3.4506)	Entropy 1.09021 (1.10886)	Top-1 acc 44.141 (42.136)	Top-5 acc 65.625 (66.160)	lr 0.02368
Train [18][2410/3239]	Time 0.624 (0.885)	Data Time 0.001 (0.011)	Loss 3.4065 (3.4508)	Entropy 1.08989 (1.10879)	Top-1 acc 41.016 (42.131)	Top-5 acc 65.625 (66.156)	lr 0.02368
Train [18][2420/3239]	Time 0.607 (0.885)	Data Time 0.001 (0.011)	Loss 3.4258 (3.4507)	Entropy 1.08990 (1.10871)	Top-1 acc 45.703 (42.137)	Top-5 acc 67.188 (66.156)	lr 0.02367
Train [18][2430/3239]	Time 0.653 (0.885)	Data Time 0.001 (0.011)	Loss 3.2595 (3.4507)	Entropy 1.08979 (1.10863)	Top-1 acc 42.188 (42.137)	Top-5 acc 69.922 (66.158)	lr 0.02367
Train [18][2440/3239]	Time 0.538 (0.885)	Data Time 0.001 (0.011)	Loss 3.4474 (3.4507)	Entropy 1.08939 (1.10855)	Top-1 acc 43.750 (42.139)	Top-5 acc 66.406 (66.159)	lr 0.02367
Train [18][2450/3239]	Time 0.580 (0.884)	Data Time 0.001 (0.011)	Loss 3.3387 (3.4506)	Entropy 1.08901 (1.10847)	Top-1 acc 42.969 (42.140)	Top-5 acc 68.359 (66.161)	lr 0.02367
Train [18][2460/3239]	Time 0.607 (0.884)	Data Time 0.001 (0.011)	Loss 3.3111 (3.4505)	Entropy 1.08859 (1.10839)	Top-1 acc 44.141 (42.144)	Top-5 acc 65.625 (66.163)	lr 0.02367
Train [18][2470/3239]	Time 0.587 (0.884)	Data Time 0.001 (0.011)	Loss 3.5968 (3.4507)	Entropy 1.08834 (1.10831)	Top-1 acc 38.281 (42.140)	Top-5 acc 64.453 (66.159)	lr 0.02367
Train [18][2480/3239]	Time 0.602 (0.884)	Data Time 0.001 (0.011)	Loss 3.5748 (3.4509)	Entropy 1.08852 (1.10823)	Top-1 acc 39.062 (42.135)	Top-5 acc 62.109 (66.153)	lr 0.02367
Train [18][2490/3239]	Time 0.609 (0.884)	Data Time 0.001 (0.010)	Loss 3.4225 (3.4510)	Entropy 1.08878 (1.10815)	Top-1 acc 43.750 (42.136)	Top-5 acc 67.188 (66.151)	lr 0.02367
Train [18][2500/3239]	Time 0.580 (0.884)	Data Time 0.001 (0.010)	Loss 3.5696 (3.4511)	Entropy 1.08877 (1.10808)	Top-1 acc 40.234 (42.133)	Top-5 acc 64.844 (66.150)	lr 0.02367
Train [18][2510/3239]	Time 0.609 (0.884)	Data Time 0.001 (0.010)	Loss 3.6190 (3.4511)	Entropy 1.08825 (1.10800)	Top-1 acc 38.281 (42.130)	Top-5 acc 62.500 (66.148)	lr 0.02367
Train [18][2520/3239]	Time 0.602 (0.884)	Data Time 0.001 (0.010)	Loss 3.6123 (3.4512)	Entropy 1.08773 (1.10792)	Top-1 acc 40.625 (42.135)	Top-5 acc 61.328 (66.145)	lr 0.02367
Train [18][2530/3239]	Time 0.729 (0.891)	Data Time 0.006 (0.010)	Loss 3.4103 (3.4514)	Entropy 1.08806 (1.10784)	Top-1 acc 43.359 (42.133)	Top-5 acc 65.625 (66.139)	lr 0.02367
Train [18][2540/3239]	Time 0.572 (0.891)	Data Time 0.002 (0.010)	Loss 3.6089 (3.4514)	Entropy 1.08767 (1.10776)	Top-1 acc 38.672 (42.133)	Top-5 acc 60.938 (66.140)	lr 0.02367
Train [18][2550/3239]	Time 0.598 (0.891)	Data Time 0.001 (0.010)	Loss 3.3631 (3.4513)	Entropy 1.08780 (1.10768)	Top-1 acc 42.188 (42.137)	Top-5 acc 67.188 (66.140)	lr 0.02367
Train [18][2560/3239]	Time 0.615 (0.891)	Data Time 0.002 (0.010)	Loss 3.4806 (3.4514)	Entropy 1.08770 (1.10761)	Top-1 acc 40.234 (42.137)	Top-5 acc 68.359 (66.133)	lr 0.02367
Train [18][2570/3239]	Time 0.591 (0.891)	Data Time 0.001 (0.010)	Loss 3.4308 (3.4514)	Entropy 1.08753 (1.10753)	Top-1 acc 43.750 (42.139)	Top-5 acc 66.016 (66.135)	lr 0.02367
Train [18][2580/3239]	Time 0.602 (0.891)	Data Time 0.001 (0.010)	Loss 3.3379 (3.4515)	Entropy 1.08744 (1.10745)	Top-1 acc 42.969 (42.132)	Top-5 acc 69.922 (66.136)	lr 0.02367
Train [18][2590/3239]	Time 0.678 (0.890)	Data Time 0.001 (0.010)	Loss 3.5101 (3.4514)	Entropy 1.08722 (1.10737)	Top-1 acc 38.281 (42.131)	Top-5 acc 68.359 (66.137)	lr 0.02367
Train [18][2600/3239]	Time 0.609 (0.890)	Data Time 0.001 (0.010)	Loss 3.3418 (3.4512)	Entropy 1.08706 (1.10729)	Top-1 acc 43.359 (42.129)	Top-5 acc 67.188 (66.141)	lr 0.02367
Train [18][2610/3239]	Time 0.610 (0.890)	Data Time 0.001 (0.010)	Loss 3.3895 (3.4511)	Entropy 1.08675 (1.10722)	Top-1 acc 42.188 (42.133)	Top-5 acc 67.578 (66.144)	lr 0.02367
Train [18][2620/3239]	Time 0.579 (0.890)	Data Time 0.001 (0.010)	Loss 3.5383 (3.4511)	Entropy 1.08658 (1.10714)	Top-1 acc 40.234 (42.135)	Top-5 acc 64.844 (66.143)	lr 0.02367
Train [18][2630/3239]	Time 0.593 (0.890)	Data Time 0.001 (0.010)	Loss 3.4129 (3.4508)	Entropy 1.08635 (1.10706)	Top-1 acc 40.625 (42.141)	Top-5 acc 66.406 (66.150)	lr 0.02367
Train [18][2640/3239]	Time 0.592 (0.890)	Data Time 0.001 (0.010)	Loss 3.3900 (3.4508)	Entropy 1.08635 (1.10698)	Top-1 acc 42.188 (42.140)	Top-5 acc 67.578 (66.150)	lr 0.02366
Train [18][2650/3239]	Time 0.613 (0.890)	Data Time 0.001 (0.010)	Loss 3.2824 (3.4508)	Entropy 1.08661 (1.10690)	Top-1 acc 47.266 (42.140)	Top-5 acc 69.141 (66.152)	lr 0.02366
Train [18][2660/3239]	Time 0.607 (0.890)	Data Time 0.001 (0.010)	Loss 3.3656 (3.4506)	Entropy 1.08659 (1.10683)	Top-1 acc 43.750 (42.141)	Top-5 acc 67.578 (66.152)	lr 0.02366
Train [18][2670/3239]	Time 0.579 (0.889)	Data Time 0.001 (0.010)	Loss 3.4022 (3.4507)	Entropy 1.08652 (1.10675)	Top-1 acc 43.359 (42.136)	Top-5 acc 66.406 (66.148)	lr 0.02366
Train [18][2680/3239]	Time 0.608 (0.889)	Data Time 0.001 (0.010)	Loss 3.4235 (3.4507)	Entropy 1.08668 (1.10668)	Top-1 acc 39.844 (42.136)	Top-5 acc 63.281 (66.151)	lr 0.02366
Train [18][2690/3239]	Time 0.633 (0.889)	Data Time 0.001 (0.010)	Loss 3.4638 (3.4506)	Entropy 1.08661 (1.10660)	Top-1 acc 43.359 (42.135)	Top-5 acc 65.234 (66.152)	lr 0.02366
Train [18][2700/3239]	Time 0.605 (0.889)	Data Time 0.001 (0.010)	Loss 3.6403 (3.4505)	Entropy 1.08684 (1.10653)	Top-1 acc 38.672 (42.138)	Top-5 acc 64.453 (66.154)	lr 0.02366
Train [18][2710/3239]	Time 0.595 (0.889)	Data Time 0.001 (0.010)	Loss 3.3532 (3.4506)	Entropy 1.08666 (1.10646)	Top-1 acc 42.578 (42.136)	Top-5 acc 66.797 (66.152)	lr 0.02366
Train [18][2720/3239]	Time 0.648 (0.889)	Data Time 0.002 (0.010)	Loss 3.3581 (3.4505)	Entropy 1.08587 (1.10638)	Top-1 acc 44.531 (42.137)	Top-5 acc 69.141 (66.155)	lr 0.02366
Train [18][2730/3239]	Time 0.616 (0.889)	Data Time 0.001 (0.010)	Loss 3.4239 (3.4507)	Entropy 1.08592 (1.10631)	Top-1 acc 41.406 (42.131)	Top-5 acc 67.188 (66.155)	lr 0.02366
Train [18][2740/3239]	Time 0.625 (0.888)	Data Time 0.001 (0.010)	Loss 3.3243 (3.4506)	Entropy 1.08534 (1.10623)	Top-1 acc 47.266 (42.132)	Top-5 acc 72.656 (66.155)	lr 0.02366
Train [18][2750/3239]	Time 0.657 (0.888)	Data Time 0.001 (0.010)	Loss 3.3678 (3.4506)	Entropy 1.08516 (1.10616)	Top-1 acc 42.188 (42.135)	Top-5 acc 65.625 (66.155)	lr 0.02366
Train [18][2760/3239]	Time 0.582 (0.888)	Data Time 0.001 (0.010)	Loss 3.5448 (3.4509)	Entropy 1.08521 (1.10608)	Top-1 acc 40.625 (42.129)	Top-5 acc 61.328 (66.147)	lr 0.02366
Train [18][2770/3239]	Time 0.593 (0.888)	Data Time 0.001 (0.010)	Loss 3.3776 (3.4507)	Entropy 1.08523 (1.10600)	Top-1 acc 39.062 (42.133)	Top-5 acc 67.188 (66.148)	lr 0.02366
Train [18][2780/3239]	Time 0.632 (0.888)	Data Time 0.001 (0.010)	Loss 3.3879 (3.4507)	Entropy 1.08488 (1.10593)	Top-1 acc 43.750 (42.132)	Top-5 acc 70.703 (66.150)	lr 0.02366
Train [18][2790/3239]	Time 0.604 (0.888)	Data Time 0.001 (0.010)	Loss 3.5134 (3.4507)	Entropy 1.08481 (1.10585)	Top-1 acc 39.453 (42.130)	Top-5 acc 64.844 (66.150)	lr 0.02366
Train [18][2800/3239]	Time 0.600 (0.888)	Data Time 0.001 (0.010)	Loss 3.5733 (3.4504)	Entropy 1.08483 (1.10578)	Top-1 acc 40.625 (42.136)	Top-5 acc 64.062 (66.156)	lr 0.02366
Train [18][2810/3239]	Time 0.620 (0.887)	Data Time 0.001 (0.010)	Loss 3.3453 (3.4503)	Entropy 1.08469 (1.10570)	Top-1 acc 42.969 (42.139)	Top-5 acc 66.016 (66.156)	lr 0.02366
Train [18][2820/3239]	Time 0.649 (0.887)	Data Time 0.001 (0.010)	Loss 3.3972 (3.4503)	Entropy 1.08503 (1.10563)	Top-1 acc 46.094 (42.141)	Top-5 acc 66.016 (66.159)	lr 0.02366
Train [18][2830/3239]	Time 0.601 (0.887)	Data Time 0.001 (0.010)	Loss 3.4304 (3.4501)	Entropy 1.08491 (1.10556)	Top-1 acc 44.141 (42.143)	Top-5 acc 69.141 (66.161)	lr 0.02366
Train [18][2840/3239]	Time 0.636 (0.887)	Data Time 0.001 (0.009)	Loss 3.2999 (3.4501)	Entropy 1.08480 (1.10548)	Top-1 acc 46.094 (42.141)	Top-5 acc 66.797 (66.160)	lr 0.02366
Train [18][2850/3239]	Time 0.587 (0.887)	Data Time 0.001 (0.009)	Loss 3.1057 (3.4498)	Entropy 1.08488 (1.10541)	Top-1 acc 47.656 (42.143)	Top-5 acc 71.875 (66.163)	lr 0.02366
Train [18][2860/3239]	Time 0.598 (0.887)	Data Time 0.001 (0.009)	Loss 3.3763 (3.4498)	Entropy 1.08483 (1.10534)	Top-1 acc 46.484 (42.141)	Top-5 acc 68.359 (66.163)	lr 0.02365
Train [18][2870/3239]	Time 0.580 (0.887)	Data Time 0.001 (0.009)	Loss 3.3528 (3.4501)	Entropy 1.08463 (1.10527)	Top-1 acc 48.828 (42.138)	Top-5 acc 68.359 (66.161)	lr 0.02365
Train [18][2880/3239]	Time 0.588 (0.887)	Data Time 0.001 (0.009)	Loss 3.4726 (3.4502)	Entropy 1.08480 (1.10520)	Top-1 acc 41.406 (42.134)	Top-5 acc 65.234 (66.158)	lr 0.02365
Train [18][2890/3239]	Time 0.614 (0.887)	Data Time 0.001 (0.009)	Loss 3.4641 (3.4503)	Entropy 1.08454 (1.10512)	Top-1 acc 42.578 (42.129)	Top-5 acc 67.969 (66.157)	lr 0.02365
Train [18][2900/3239]	Time 0.553 (0.886)	Data Time 0.001 (0.009)	Loss 3.4759 (3.4504)	Entropy 1.08430 (1.10505)	Top-1 acc 37.891 (42.131)	Top-5 acc 66.406 (66.155)	lr 0.02365
Train [18][2910/3239]	Time 0.463 (0.886)	Data Time 0.001 (0.009)	Loss 3.6189 (3.4504)	Entropy 1.08395 (1.10498)	Top-1 acc 37.500 (42.130)	Top-5 acc 60.938 (66.155)	lr 0.02365
Train [18][2920/3239]	Time 0.475 (0.886)	Data Time 0.001 (0.009)	Loss 3.5417 (3.4505)	Entropy 1.08406 (1.10491)	Top-1 acc 41.016 (42.125)	Top-5 acc 64.844 (66.151)	lr 0.02365
Train [18][2930/3239]	Time 0.591 (0.886)	Data Time 0.001 (0.009)	Loss 3.3081 (3.4506)	Entropy 1.08410 (1.10484)	Top-1 acc 46.484 (42.123)	Top-5 acc 68.359 (66.152)	lr 0.02365
Train [18][2940/3239]	Time 0.623 (0.886)	Data Time 0.001 (0.009)	Loss 3.4989 (3.4506)	Entropy 1.08355 (1.10477)	Top-1 acc 39.062 (42.120)	Top-5 acc 63.672 (66.149)	lr 0.02365
Train [18][2950/3239]	Time 0.600 (0.886)	Data Time 0.001 (0.009)	Loss 3.5025 (3.4506)	Entropy 1.08324 (1.10470)	Top-1 acc 43.359 (42.123)	Top-5 acc 63.281 (66.149)	lr 0.02365
Train [18][2960/3239]	Time 0.614 (0.886)	Data Time 0.001 (0.009)	Loss 3.4471 (3.4505)	Entropy 1.08306 (1.10462)	Top-1 acc 42.969 (42.124)	Top-5 acc 65.234 (66.149)	lr 0.02365
Train [18][2970/3239]	Time 0.577 (0.885)	Data Time 0.001 (0.009)	Loss 3.4939 (3.4506)	Entropy 1.08296 (1.10455)	Top-1 acc 42.969 (42.125)	Top-5 acc 63.281 (66.147)	lr 0.02365
Train [18][2980/3239]	Time 0.672 (0.885)	Data Time 0.001 (0.009)	Loss 3.3420 (3.4506)	Entropy 1.08242 (1.10448)	Top-1 acc 42.188 (42.121)	Top-5 acc 68.750 (66.145)	lr 0.02365
Train [18][2990/3239]	Time 0.633 (0.885)	Data Time 0.001 (0.009)	Loss 3.4544 (3.4506)	Entropy 1.08153 (1.10440)	Top-1 acc 39.062 (42.117)	Top-5 acc 67.188 (66.146)	lr 0.02365
Train [18][3000/3239]	Time 0.606 (0.885)	Data Time 0.001 (0.009)	Loss 3.5513 (3.4507)	Entropy 1.08156 (1.10433)	Top-1 acc 39.844 (42.117)	Top-5 acc 62.500 (66.143)	lr 0.02365
Train [18][3010/3239]	Time 0.599 (0.885)	Data Time 0.001 (0.009)	Loss 3.5771 (3.4509)	Entropy 1.08121 (1.10425)	Top-1 acc 41.406 (42.110)	Top-5 acc 66.016 (66.138)	lr 0.02365
Train [18][3020/3239]	Time 0.624 (0.885)	Data Time 0.001 (0.009)	Loss 3.4340 (3.4510)	Entropy 1.08121 (1.10417)	Top-1 acc 43.359 (42.113)	Top-5 acc 65.625 (66.136)	lr 0.02365
Train [18][3030/3239]	Time 0.602 (0.885)	Data Time 0.001 (0.009)	Loss 3.4566 (3.4508)	Entropy 1.08136 (1.10410)	Top-1 acc 44.531 (42.120)	Top-5 acc 63.281 (66.142)	lr 0.02365
Train [18][3040/3239]	Time 0.619 (0.885)	Data Time 0.001 (0.009)	Loss 3.3368 (3.4506)	Entropy 1.08129 (1.10402)	Top-1 acc 45.703 (42.124)	Top-5 acc 67.969 (66.145)	lr 0.02365
Train [18][3050/3239]	Time 0.716 (0.885)	Data Time 0.001 (0.009)	Loss 3.4014 (3.4505)	Entropy 1.08112 (1.10395)	Top-1 acc 44.531 (42.125)	Top-5 acc 66.406 (66.149)	lr 0.02365
Train [18][3060/3239]	Time 0.644 (0.884)	Data Time 0.001 (0.009)	Loss 3.3562 (3.4504)	Entropy 1.08081 (1.10387)	Top-1 acc 42.969 (42.124)	Top-5 acc 68.750 (66.150)	lr 0.02365
Train [18][3070/3239]	Time 0.589 (0.884)	Data Time 0.002 (0.009)	Loss 3.4397 (3.4501)	Entropy 1.08056 (1.10380)	Top-1 acc 46.094 (42.128)	Top-5 acc 68.750 (66.155)	lr 0.02365
Train [18][3080/3239]	Time 0.473 (0.884)	Data Time 0.001 (0.009)	Loss 3.3495 (3.4501)	Entropy 1.08051 (1.10372)	Top-1 acc 40.625 (42.130)	Top-5 acc 68.750 (66.156)	lr 0.02364
Train [18][3090/3239]	Time 0.602 (0.884)	Data Time 0.001 (0.009)	Loss 3.3393 (3.4500)	Entropy 1.08027 (1.10365)	Top-1 acc 44.141 (42.132)	Top-5 acc 71.094 (66.162)	lr 0.02364
Train [18][3100/3239]	Time 0.612 (0.884)	Data Time 0.001 (0.009)	Loss 3.3118 (3.4499)	Entropy 1.07999 (1.10357)	Top-1 acc 42.578 (42.130)	Top-5 acc 69.922 (66.162)	lr 0.02364
Train [18][3110/3239]	Time 0.595 (0.884)	Data Time 0.001 (0.009)	Loss 3.4843 (3.4498)	Entropy 1.07967 (1.10350)	Top-1 acc 42.578 (42.136)	Top-5 acc 65.234 (66.161)	lr 0.02364
Train [18][3120/3239]	Time 0.614 (0.884)	Data Time 0.001 (0.009)	Loss 3.3844 (3.4499)	Entropy 1.07961 (1.10342)	Top-1 acc 41.797 (42.131)	Top-5 acc 70.703 (66.160)	lr 0.02364
Train [18][3130/3239]	Time 0.604 (0.884)	Data Time 0.001 (0.009)	Loss 3.3761 (3.4500)	Entropy 1.07906 (1.10334)	Top-1 acc 46.094 (42.129)	Top-5 acc 67.188 (66.155)	lr 0.02364
Train [18][3140/3239]	Time 0.707 (0.884)	Data Time 0.001 (0.009)	Loss 3.4115 (3.4500)	Entropy 1.07904 (1.10326)	Top-1 acc 41.797 (42.129)	Top-5 acc 64.844 (66.155)	lr 0.02364
Train [18][3150/3239]	Time 0.625 (0.884)	Data Time 0.001 (0.009)	Loss 3.3535 (3.4500)	Entropy 1.07909 (1.10319)	Top-1 acc 41.797 (42.125)	Top-5 acc 67.188 (66.155)	lr 0.02364
Train [18][3160/3239]	Time 0.585 (0.883)	Data Time 0.001 (0.009)	Loss 3.4078 (3.4501)	Entropy 1.07924 (1.10311)	Top-1 acc 44.531 (42.129)	Top-5 acc 65.625 (66.153)	lr 0.02364
Train [18][3170/3239]	Time 0.607 (0.883)	Data Time 0.001 (0.009)	Loss 3.4687 (3.4497)	Entropy 1.07918 (1.10304)	Top-1 acc 42.969 (42.135)	Top-5 acc 66.016 (66.161)	lr 0.02364
Train [18][3180/3239]	Time 0.575 (0.883)	Data Time 0.000 (0.009)	Loss 3.6020 (3.4500)	Entropy 1.07968 (1.10296)	Top-1 acc 38.672 (42.132)	Top-5 acc 62.891 (66.156)	lr 0.02364
Train [18][3190/3239]	Time 0.623 (0.890)	Data Time 0.000 (0.009)	Loss 3.3001 (3.4500)	Entropy 1.07961 (1.10289)	Top-1 acc 46.875 (42.132)	Top-5 acc 69.141 (66.156)	lr 0.02364
Train [18][3200/3239]	Time 0.621 (0.889)	Data Time 0.000 (0.009)	Loss 3.2617 (3.4498)	Entropy 1.07893 (1.10281)	Top-1 acc 43.359 (42.136)	Top-5 acc 71.875 (66.161)	lr 0.02364
Train [18][3210/3239]	Time 0.697 (0.889)	Data Time 0.000 (0.009)	Loss 3.5636 (3.4498)	Entropy 1.07841 (1.10274)	Top-1 acc 38.672 (42.135)	Top-5 acc 66.016 (66.162)	lr 0.02364
Train [18][3220/3239]	Time 0.599 (0.889)	Data Time 0.000 (0.009)	Loss 3.5470 (3.4496)	Entropy 1.07895 (1.10267)	Top-1 acc 41.406 (42.139)	Top-5 acc 65.234 (66.167)	lr 0.02364
Train [18][3230/3239]	Time 0.652 (0.889)	Data Time 0.000 (0.009)	Loss 3.3157 (3.4497)	Entropy 1.07829 (1.10259)	Top-1 acc 45.703 (42.138)	Top-5 acc 70.312 (66.165)	lr 0.02364
Train [18][3239/3239]	Time 1.559 (0.889)	Data Time 0.000 (0.009)	Loss 3.4335 (3.4497)	Entropy 1.07840 (1.10252)	Top-1 acc 44.444 (42.137)	Top-5 acc 64.198 (66.165)	lr 0.02364
==========Valid [18/120]	loss 2.184	top-1 acc 51.994 (51.994)	top-5 acc 75.703	Train top-1 42.137	top-5 66.165	Entropy 1.07840	Latency-None: 0.000ms	Flops: 539.76M
Train [19][0/3239]	Time 20.934 (20.934)	Data Time 17.990 (17.990)	Loss 3.6203 (3.6203)	Entropy 1.07850 (1.07850)	Top-1 acc 41.016 (41.016)	Top-5 acc 62.109 (62.109)	lr 0.02364
Train [19][10/3239]	Time 0.564 (2.807)	Data Time 0.001 (1.690)	Loss 3.4007 (3.4121)	Entropy 1.07855 (1.07859)	Top-1 acc 45.703 (43.643)	Top-5 acc 68.359 (67.010)	lr 0.02364
Train [19][20/3239]	Time 0.630 (1.866)	Data Time 0.001 (0.886)	Loss 3.2993 (3.4184)	Entropy 1.07805 (1.07848)	Top-1 acc 43.359 (42.597)	Top-5 acc 68.750 (66.574)	lr 0.02364
Train [19][30/3239]	Time 0.562 (1.538)	Data Time 0.001 (0.601)	Loss 3.5218 (3.4048)	Entropy 1.07819 (1.07834)	Top-1 acc 37.891 (42.944)	Top-5 acc 64.453 (67.314)	lr 0.02364
Train [19][40/3239]	Time 0.685 (1.367)	Data Time 0.001 (0.455)	Loss 3.5736 (3.4126)	Entropy 1.07835 (1.07833)	Top-1 acc 44.141 (43.121)	Top-5 acc 62.891 (67.045)	lr 0.02364
Train [19][50/3239]	Time 0.620 (1.266)	Data Time 0.001 (0.367)	Loss 3.3971 (3.4235)	Entropy 1.07816 (1.07832)	Top-1 acc 43.359 (43.045)	Top-5 acc 67.969 (66.927)	lr 0.02364
Train [19][60/3239]	Time 0.573 (1.197)	Data Time 0.001 (0.307)	Loss 3.5232 (3.4176)	Entropy 1.07786 (1.07828)	Top-1 acc 35.547 (43.052)	Top-5 acc 64.453 (67.168)	lr 0.02363
Train [19][70/3239]	Time 0.592 (1.150)	Data Time 0.001 (0.264)	Loss 3.6156 (3.4343)	Entropy 1.07802 (1.07823)	Top-1 acc 39.062 (42.732)	Top-5 acc 64.844 (66.951)	lr 0.02363
Train [19][80/3239]	Time 0.595 (1.113)	Data Time 0.001 (0.231)	Loss 3.3475 (3.4293)	Entropy 1.07781 (1.07819)	Top-1 acc 44.531 (42.790)	Top-5 acc 69.531 (66.951)	lr 0.02363
Train [19][90/3239]	Time 0.570 (1.083)	Data Time 0.001 (0.206)	Loss 3.4379 (3.4337)	Entropy 1.07782 (1.07815)	Top-1 acc 45.703 (42.694)	Top-5 acc 64.844 (66.728)	lr 0.02363
Train [19][100/3239]	Time 0.624 (1.061)	Data Time 0.001 (0.186)	Loss 3.3734 (3.4296)	Entropy 1.07764 (1.07812)	Top-1 acc 41.406 (42.644)	Top-5 acc 68.750 (66.890)	lr 0.02363
Train [19][110/3239]	Time 0.613 (1.044)	Data Time 0.001 (0.169)	Loss 3.3083 (3.4274)	Entropy 1.07773 (1.07807)	Top-1 acc 43.750 (42.684)	Top-5 acc 71.094 (66.895)	lr 0.02363
Train [19][120/3239]	Time 0.565 (1.033)	Data Time 0.001 (0.156)	Loss 3.2396 (3.4277)	Entropy 1.07801 (1.07805)	Top-1 acc 42.969 (42.623)	Top-5 acc 69.531 (66.903)	lr 0.02363
Train [19][130/3239]	Time 0.560 (1.018)	Data Time 0.001 (0.144)	Loss 3.4214 (3.4262)	Entropy 1.07825 (1.07805)	Top-1 acc 42.188 (42.644)	Top-5 acc 68.750 (66.955)	lr 0.02363
Train [19][140/3239]	Time 0.637 (1.006)	Data Time 0.001 (0.134)	Loss 3.2808 (3.4222)	Entropy 1.07811 (1.07806)	Top-1 acc 46.094 (42.681)	Top-5 acc 71.094 (67.021)	lr 0.02363
Train [19][150/3239]	Time 0.611 (0.997)	Data Time 0.001 (0.125)	Loss 3.7155 (3.4258)	Entropy 1.07836 (1.07807)	Top-1 acc 37.891 (42.617)	Top-5 acc 62.891 (66.918)	lr 0.02363
Train [19][160/3239]	Time 0.608 (0.988)	Data Time 0.001 (0.117)	Loss 3.3329 (3.4242)	Entropy 1.07838 (1.07809)	Top-1 acc 44.531 (42.712)	Top-5 acc 69.141 (66.913)	lr 0.02363
Train [19][170/3239]	Time 0.622 (0.980)	Data Time 0.002 (0.111)	Loss 3.3225 (3.4220)	Entropy 1.07800 (1.07810)	Top-1 acc 46.484 (42.699)	Top-5 acc 68.359 (66.927)	lr 0.02363
Train [19][180/3239]	Time 0.492 (0.971)	Data Time 0.001 (0.105)	Loss 3.1766 (3.4183)	Entropy 1.07773 (1.07809)	Top-1 acc 46.484 (42.783)	Top-5 acc 74.219 (66.989)	lr 0.02363
Train [19][190/3239]	Time 0.611 (0.962)	Data Time 0.001 (0.099)	Loss 3.3760 (3.4188)	Entropy 1.07764 (1.07808)	Top-1 acc 44.141 (42.703)	Top-5 acc 67.969 (66.948)	lr 0.02363
Train [19][200/3239]	Time 0.684 (0.956)	Data Time 0.001 (0.094)	Loss 3.2523 (3.4174)	Entropy 1.07741 (1.07806)	Top-1 acc 42.969 (42.706)	Top-5 acc 69.141 (66.981)	lr 0.02363
Train [19][210/3239]	Time 0.607 (0.951)	Data Time 0.001 (0.090)	Loss 3.5023 (3.4200)	Entropy 1.07708 (1.07802)	Top-1 acc 44.141 (42.647)	Top-5 acc 66.797 (66.910)	lr 0.02363
Train [19][220/3239]	Time 0.599 (0.945)	Data Time 0.001 (0.086)	Loss 3.5819 (3.4227)	Entropy 1.07706 (1.07798)	Top-1 acc 39.844 (42.559)	Top-5 acc 64.844 (66.883)	lr 0.02363
Train [19][230/3239]	Time 0.625 (0.941)	Data Time 0.001 (0.082)	Loss 3.3069 (3.4230)	Entropy 1.07699 (1.07795)	Top-1 acc 41.797 (42.551)	Top-5 acc 66.406 (66.863)	lr 0.02363
Train [19][240/3239]	Time 0.605 (0.938)	Data Time 0.001 (0.079)	Loss 3.5617 (3.4227)	Entropy 1.07646 (1.07790)	Top-1 acc 41.016 (42.557)	Top-5 acc 64.062 (66.867)	lr 0.02363
Train [19][250/3239]	Time 0.628 (0.935)	Data Time 0.001 (0.076)	Loss 3.5370 (3.4237)	Entropy 1.07595 (1.07784)	Top-1 acc 39.453 (42.536)	Top-5 acc 64.453 (66.814)	lr 0.02363
Train [19][260/3239]	Time 0.572 (0.932)	Data Time 0.001 (0.073)	Loss 3.5609 (3.4269)	Entropy 1.07597 (1.07777)	Top-1 acc 37.891 (42.430)	Top-5 acc 60.547 (66.753)	lr 0.02363
Train [19][270/3239]	Time 0.741 (0.929)	Data Time 0.001 (0.070)	Loss 3.3279 (3.4244)	Entropy 1.07608 (1.07770)	Top-1 acc 46.875 (42.463)	Top-5 acc 68.359 (66.834)	lr 0.02363
Train [19][280/3239]	Time 0.626 (0.927)	Data Time 0.001 (0.068)	Loss 3.4613 (3.4218)	Entropy 1.07594 (1.07764)	Top-1 acc 37.891 (42.464)	Top-5 acc 67.578 (66.884)	lr 0.02362
Train [19][290/3239]	Time 0.568 (0.924)	Data Time 0.001 (0.066)	Loss 3.4285 (3.4233)	Entropy 1.07570 (1.07758)	Top-1 acc 44.141 (42.465)	Top-5 acc 69.141 (66.877)	lr 0.02362
Train [19][300/3239]	Time 0.620 (0.922)	Data Time 0.002 (0.064)	Loss 3.3611 (3.4247)	Entropy 1.07541 (1.07751)	Top-1 acc 47.656 (42.478)	Top-5 acc 67.188 (66.850)	lr 0.02362
Train [19][310/3239]	Time 0.568 (0.920)	Data Time 0.001 (0.062)	Loss 3.4654 (3.4246)	Entropy 1.07550 (1.07745)	Top-1 acc 45.312 (42.505)	Top-5 acc 68.750 (66.856)	lr 0.02362
Train [19][320/3239]	Time 0.563 (0.918)	Data Time 0.001 (0.060)	Loss 3.4353 (3.4250)	Entropy 1.07538 (1.07738)	Top-1 acc 40.625 (42.501)	Top-5 acc 67.188 (66.846)	lr 0.02362
Train [19][330/3239]	Time 0.609 (0.916)	Data Time 0.001 (0.058)	Loss 3.5804 (3.4261)	Entropy 1.07538 (1.07733)	Top-1 acc 38.672 (42.462)	Top-5 acc 64.062 (66.824)	lr 0.02362
Train [19][340/3239]	Time 0.580 (0.914)	Data Time 0.001 (0.056)	Loss 3.1986 (3.4248)	Entropy 1.07506 (1.07727)	Top-1 acc 44.531 (42.503)	Top-5 acc 72.656 (66.820)	lr 0.02362
Train [19][350/3239]	Time 0.559 (0.911)	Data Time 0.001 (0.055)	Loss 3.2839 (3.4266)	Entropy 1.07534 (1.07721)	Top-1 acc 44.922 (42.482)	Top-5 acc 69.922 (66.791)	lr 0.02362
Train [19][360/3239]	Time 0.657 (0.909)	Data Time 0.001 (0.053)	Loss 3.3034 (3.4251)	Entropy 1.07516 (1.07715)	Top-1 acc 46.484 (42.525)	Top-5 acc 70.312 (66.810)	lr 0.02362
Train [19][370/3239]	Time 0.612 (0.907)	Data Time 0.001 (0.052)	Loss 3.3092 (3.4257)	Entropy 1.07501 (1.07710)	Top-1 acc 44.531 (42.528)	Top-5 acc 68.359 (66.791)	lr 0.02362
Train [19][380/3239]	Time 0.618 (0.905)	Data Time 0.001 (0.051)	Loss 3.3170 (3.4248)	Entropy 1.07539 (1.07705)	Top-1 acc 46.875 (42.523)	Top-5 acc 73.828 (66.803)	lr 0.02362
Train [19][390/3239]	Time 0.607 (0.904)	Data Time 0.001 (0.049)	Loss 3.4467 (3.4254)	Entropy 1.07561 (1.07701)	Top-1 acc 40.625 (42.511)	Top-5 acc 65.234 (66.783)	lr 0.02362
Train [19][400/3239]	Time 0.619 (0.903)	Data Time 0.001 (0.048)	Loss 3.4244 (3.4255)	Entropy 1.07571 (1.07697)	Top-1 acc 38.672 (42.518)	Top-5 acc 72.656 (66.779)	lr 0.02362
Train [19][410/3239]	Time 0.626 (0.902)	Data Time 0.001 (0.047)	Loss 3.5534 (3.4250)	Entropy 1.07542 (1.07694)	Top-1 acc 39.844 (42.543)	Top-5 acc 63.281 (66.790)	lr 0.02362
Train [19][420/3239]	Time 0.603 (0.901)	Data Time 0.001 (0.046)	Loss 3.5141 (3.4259)	Entropy 1.07547 (1.07690)	Top-1 acc 39.844 (42.523)	Top-5 acc 66.797 (66.778)	lr 0.02362
Train [19][430/3239]	Time 0.676 (0.899)	Data Time 0.001 (0.045)	Loss 3.4818 (3.4250)	Entropy 1.07507 (1.07687)	Top-1 acc 42.188 (42.571)	Top-5 acc 66.016 (66.805)	lr 0.02362
Train [19][440/3239]	Time 0.580 (0.898)	Data Time 0.001 (0.044)	Loss 3.4335 (3.4226)	Entropy 1.07496 (1.07682)	Top-1 acc 40.625 (42.618)	Top-5 acc 70.703 (66.862)	lr 0.02362
Train [19][450/3239]	Time 0.587 (0.897)	Data Time 0.001 (0.043)	Loss 3.4455 (3.4221)	Entropy 1.07476 (1.07678)	Top-1 acc 41.016 (42.584)	Top-5 acc 65.234 (66.879)	lr 0.02362
Train [19][460/3239]	Time 0.593 (0.896)	Data Time 0.001 (0.042)	Loss 3.3499 (3.4219)	Entropy 1.07436 (1.07674)	Top-1 acc 42.188 (42.573)	Top-5 acc 66.797 (66.877)	lr 0.02362
Train [19][470/3239]	Time 0.607 (0.895)	Data Time 0.001 (0.041)	Loss 3.1473 (3.4205)	Entropy 1.07421 (1.07668)	Top-1 acc 48.828 (42.602)	Top-5 acc 71.875 (66.910)	lr 0.02362
Train [19][480/3239]	Time 0.574 (0.895)	Data Time 0.001 (0.040)	Loss 3.5787 (3.4220)	Entropy 1.07423 (1.07663)	Top-1 acc 38.672 (42.567)	Top-5 acc 65.625 (66.880)	lr 0.02362
Train [19][490/3239]	Time 0.612 (0.894)	Data Time 0.001 (0.040)	Loss 3.3995 (3.4223)	Entropy 1.07417 (1.07658)	Top-1 acc 40.234 (42.573)	Top-5 acc 66.016 (66.869)	lr 0.02362
Train [19][500/3239]	Time 0.599 (0.893)	Data Time 0.001 (0.039)	Loss 3.4344 (3.4226)	Entropy 1.07399 (1.07653)	Top-1 acc 44.531 (42.561)	Top-5 acc 64.453 (66.863)	lr 0.02361
Train [19][510/3239]	Time 0.603 (0.892)	Data Time 0.001 (0.038)	Loss 3.3917 (3.4232)	Entropy 1.07417 (1.07649)	Top-1 acc 44.531 (42.555)	Top-5 acc 69.141 (66.860)	lr 0.02361
Train [19][520/3239]	Time 0.583 (0.891)	Data Time 0.001 (0.037)	Loss 3.2782 (3.4240)	Entropy 1.07396 (1.07644)	Top-1 acc 44.531 (42.559)	Top-5 acc 70.703 (66.838)	lr 0.02361
Train [19][530/3239]	Time 0.568 (0.890)	Data Time 0.001 (0.037)	Loss 3.4566 (3.4241)	Entropy 1.07443 (1.07640)	Top-1 acc 41.797 (42.552)	Top-5 acc 60.938 (66.821)	lr 0.02361
Train [19][540/3239]	Time 0.625 (0.888)	Data Time 0.001 (0.036)	Loss 3.5114 (3.4243)	Entropy 1.07441 (1.07636)	Top-1 acc 42.969 (42.542)	Top-5 acc 65.625 (66.813)	lr 0.02361
Train [19][550/3239]	Time 0.613 (0.888)	Data Time 0.001 (0.036)	Loss 3.3965 (3.4249)	Entropy 1.07480 (1.07633)	Top-1 acc 44.922 (42.514)	Top-5 acc 67.578 (66.806)	lr 0.02361
Train [19][560/3239]	Time 0.658 (0.887)	Data Time 0.002 (0.035)	Loss 3.4224 (3.4244)	Entropy 1.07441 (1.07630)	Top-1 acc 46.875 (42.549)	Top-5 acc 66.406 (66.816)	lr 0.02361
Train [19][570/3239]	Time 0.617 (0.887)	Data Time 0.001 (0.034)	Loss 3.2864 (3.4228)	Entropy 1.07380 (1.07627)	Top-1 acc 42.578 (42.601)	Top-5 acc 70.703 (66.832)	lr 0.02361
Train [19][580/3239]	Time 0.569 (0.886)	Data Time 0.002 (0.034)	Loss 3.4418 (3.4238)	Entropy 1.07370 (1.07622)	Top-1 acc 42.188 (42.566)	Top-5 acc 64.453 (66.806)	lr 0.02361
Train [19][590/3239]	Time 0.697 (0.885)	Data Time 0.002 (0.033)	Loss 3.5734 (3.4231)	Entropy 1.07292 (1.07618)	Top-1 acc 40.234 (42.575)	Top-5 acc 64.453 (66.840)	lr 0.02361
Train [19][600/3239]	Time 0.746 (0.919)	Data Time 0.005 (0.033)	Loss 3.4669 (3.4237)	Entropy 1.07297 (1.07612)	Top-1 acc 38.281 (42.570)	Top-5 acc 64.453 (66.824)	lr 0.02361
Train [19][610/3239]	Time 0.629 (0.919)	Data Time 0.002 (0.032)	Loss 3.2171 (3.4245)	Entropy 1.07247 (1.07607)	Top-1 acc 48.828 (42.554)	Top-5 acc 71.094 (66.807)	lr 0.02361
Train [19][620/3239]	Time 0.590 (0.918)	Data Time 0.001 (0.032)	Loss 3.6030 (3.4246)	Entropy 1.07205 (1.07601)	Top-1 acc 41.016 (42.537)	Top-5 acc 64.844 (66.796)	lr 0.02361
Train [19][630/3239]	Time 0.595 (0.917)	Data Time 0.001 (0.031)	Loss 3.4168 (3.4249)	Entropy 1.07171 (1.07594)	Top-1 acc 43.359 (42.527)	Top-5 acc 70.703 (66.804)	lr 0.02361
Train [19][640/3239]	Time 0.579 (0.916)	Data Time 0.001 (0.031)	Loss 3.3726 (3.4251)	Entropy 1.07177 (1.07588)	Top-1 acc 42.578 (42.534)	Top-5 acc 71.484 (66.805)	lr 0.02361
Train [19][650/3239]	Time 0.606 (0.915)	Data Time 0.001 (0.031)	Loss 3.6811 (3.4256)	Entropy 1.07182 (1.07582)	Top-1 acc 37.109 (42.530)	Top-5 acc 61.328 (66.800)	lr 0.02361
Train [19][660/3239]	Time 0.593 (0.914)	Data Time 0.001 (0.030)	Loss 3.3483 (3.4259)	Entropy 1.07141 (1.07575)	Top-1 acc 44.531 (42.543)	Top-5 acc 68.359 (66.807)	lr 0.02361
Train [19][670/3239]	Time 0.613 (0.912)	Data Time 0.001 (0.030)	Loss 3.3500 (3.4256)	Entropy 1.07126 (1.07569)	Top-1 acc 46.484 (42.559)	Top-5 acc 67.578 (66.799)	lr 0.02361
Train [19][680/3239]	Time 0.624 (0.911)	Data Time 0.002 (0.029)	Loss 3.3194 (3.4249)	Entropy 1.07130 (1.07562)	Top-1 acc 43.750 (42.572)	Top-5 acc 67.578 (66.798)	lr 0.02361
Train [19][690/3239]	Time 0.595 (0.910)	Data Time 0.001 (0.029)	Loss 3.4638 (3.4250)	Entropy 1.07112 (1.07556)	Top-1 acc 37.500 (42.572)	Top-5 acc 63.281 (66.793)	lr 0.02361
Train [19][700/3239]	Time 0.600 (0.909)	Data Time 0.001 (0.028)	Loss 3.1590 (3.4248)	Entropy 1.07070 (1.07549)	Top-1 acc 48.438 (42.581)	Top-5 acc 70.312 (66.809)	lr 0.02361
Train [19][710/3239]	Time 0.596 (0.909)	Data Time 0.001 (0.028)	Loss 3.3616 (3.4247)	Entropy 1.07039 (1.07542)	Top-1 acc 42.969 (42.575)	Top-5 acc 67.969 (66.806)	lr 0.02360
Train [19][720/3239]	Time 0.606 (0.908)	Data Time 0.001 (0.028)	Loss 3.5750 (3.4250)	Entropy 1.07038 (1.07536)	Top-1 acc 37.891 (42.564)	Top-5 acc 64.062 (66.813)	lr 0.02360
Train [19][730/3239]	Time 0.611 (0.907)	Data Time 0.001 (0.027)	Loss 3.3309 (3.4246)	Entropy 1.07020 (1.07529)	Top-1 acc 42.969 (42.564)	Top-5 acc 67.969 (66.827)	lr 0.02360
Train [19][740/3239]	Time 0.640 (0.906)	Data Time 0.001 (0.027)	Loss 3.5437 (3.4247)	Entropy 1.06997 (1.07522)	Top-1 acc 40.625 (42.563)	Top-5 acc 64.062 (66.823)	lr 0.02360
Train [19][750/3239]	Time 0.708 (0.906)	Data Time 0.001 (0.027)	Loss 3.4905 (3.4238)	Entropy 1.06966 (1.07514)	Top-1 acc 38.281 (42.582)	Top-5 acc 64.062 (66.832)	lr 0.02360
Train [19][760/3239]	Time 0.604 (0.905)	Data Time 0.001 (0.026)	Loss 3.2009 (3.4239)	Entropy 1.06959 (1.07507)	Top-1 acc 46.875 (42.578)	Top-5 acc 73.047 (66.839)	lr 0.02360
Train [19][770/3239]	Time 0.629 (0.905)	Data Time 0.001 (0.026)	Loss 3.4898 (3.4240)	Entropy 1.06960 (1.07500)	Top-1 acc 39.844 (42.572)	Top-5 acc 62.109 (66.836)	lr 0.02360
Train [19][780/3239]	Time 0.612 (0.904)	Data Time 0.001 (0.026)	Loss 3.5401 (3.4236)	Entropy 1.06941 (1.07493)	Top-1 acc 41.016 (42.569)	Top-5 acc 64.844 (66.842)	lr 0.02360
Train [19][790/3239]	Time 0.578 (0.903)	Data Time 0.001 (0.025)	Loss 3.4808 (3.4243)	Entropy 1.06938 (1.07486)	Top-1 acc 39.453 (42.568)	Top-5 acc 63.672 (66.826)	lr 0.02360
Train [19][800/3239]	Time 0.609 (0.903)	Data Time 0.001 (0.025)	Loss 3.4877 (3.4254)	Entropy 1.06923 (1.07479)	Top-1 acc 35.547 (42.538)	Top-5 acc 66.406 (66.803)	lr 0.02360
Train [19][810/3239]	Time 0.589 (0.903)	Data Time 0.002 (0.025)	Loss 3.4172 (3.4247)	Entropy 1.06932 (1.07472)	Top-1 acc 44.531 (42.555)	Top-5 acc 65.625 (66.820)	lr 0.02360
Train [19][820/3239]	Time 0.715 (0.902)	Data Time 0.002 (0.025)	Loss 3.4401 (3.4241)	Entropy 1.06943 (1.07466)	Top-1 acc 44.141 (42.563)	Top-5 acc 67.188 (66.838)	lr 0.02360
Train [19][830/3239]	Time 0.513 (0.901)	Data Time 0.001 (0.024)	Loss 3.6927 (3.4246)	Entropy 1.06948 (1.07460)	Top-1 acc 37.109 (42.550)	Top-5 acc 60.938 (66.837)	lr 0.02360
Train [19][840/3239]	Time 0.567 (0.900)	Data Time 0.001 (0.024)	Loss 3.4553 (3.4239)	Entropy 1.06939 (1.07454)	Top-1 acc 45.312 (42.578)	Top-5 acc 67.188 (66.839)	lr 0.02360
Train [19][850/3239]	Time 0.618 (0.899)	Data Time 0.001 (0.024)	Loss 3.5057 (3.4239)	Entropy 1.06907 (1.07447)	Top-1 acc 40.625 (42.562)	Top-5 acc 65.234 (66.841)	lr 0.02360
Train [19][860/3239]	Time 0.612 (0.898)	Data Time 0.001 (0.024)	Loss 3.2534 (3.4234)	Entropy 1.06857 (1.07441)	Top-1 acc 44.922 (42.577)	Top-5 acc 68.750 (66.849)	lr 0.02360
Train [19][870/3239]	Time 0.577 (0.898)	Data Time 0.001 (0.023)	Loss 3.4935 (3.4235)	Entropy 1.06841 (1.07434)	Top-1 acc 40.625 (42.577)	Top-5 acc 63.672 (66.840)	lr 0.02360
Train [19][880/3239]	Time 0.584 (0.898)	Data Time 0.001 (0.023)	Loss 3.4355 (3.4235)	Entropy 1.06794 (1.07427)	Top-1 acc 46.094 (42.587)	Top-5 acc 64.453 (66.837)	lr 0.02360
Train [19][890/3239]	Time 0.609 (0.897)	Data Time 0.001 (0.023)	Loss 3.2019 (3.4226)	Entropy 1.06740 (1.07420)	Top-1 acc 46.484 (42.597)	Top-5 acc 73.047 (66.856)	lr 0.02360
Train [19][900/3239]	Time 0.564 (0.897)	Data Time 0.001 (0.023)	Loss 3.3222 (3.4228)	Entropy 1.06713 (1.07412)	Top-1 acc 39.844 (42.586)	Top-5 acc 69.922 (66.858)	lr 0.02360
Train [19][910/3239]	Time 0.661 (0.896)	Data Time 0.001 (0.022)	Loss 3.4006 (3.4227)	Entropy 1.06745 (1.07405)	Top-1 acc 42.188 (42.587)	Top-5 acc 66.016 (66.865)	lr 0.02360
Train [19][920/3239]	Time 0.549 (0.896)	Data Time 0.001 (0.022)	Loss 3.5244 (3.4229)	Entropy 1.06710 (1.07397)	Top-1 acc 39.453 (42.582)	Top-5 acc 63.672 (66.858)	lr 0.02360
Train [19][930/3239]	Time 0.590 (0.895)	Data Time 0.001 (0.022)	Loss 3.3694 (3.4229)	Entropy 1.06695 (1.07390)	Top-1 acc 44.531 (42.579)	Top-5 acc 64.844 (66.846)	lr 0.02359
Train [19][940/3239]	Time 0.595 (0.895)	Data Time 0.001 (0.022)	Loss 3.4916 (3.4231)	Entropy 1.06683 (1.07382)	Top-1 acc 40.234 (42.577)	Top-5 acc 64.062 (66.839)	lr 0.02359
Train [19][950/3239]	Time 0.606 (0.895)	Data Time 0.001 (0.021)	Loss 3.6078 (3.4227)	Entropy 1.06643 (1.07375)	Top-1 acc 37.891 (42.583)	Top-5 acc 64.844 (66.842)	lr 0.02359
Train [19][960/3239]	Time 0.596 (0.894)	Data Time 0.001 (0.021)	Loss 3.5629 (3.4219)	Entropy 1.06620 (1.07367)	Top-1 acc 38.281 (42.611)	Top-5 acc 64.844 (66.858)	lr 0.02359
Train [19][970/3239]	Time 0.574 (0.894)	Data Time 0.001 (0.021)	Loss 3.6757 (3.4217)	Entropy 1.06623 (1.07360)	Top-1 acc 40.234 (42.614)	Top-5 acc 63.672 (66.863)	lr 0.02359
Train [19][980/3239]	Time 0.647 (0.893)	Data Time 0.001 (0.021)	Loss 3.1545 (3.4204)	Entropy 1.06576 (1.07352)	Top-1 acc 45.312 (42.642)	Top-5 acc 71.875 (66.895)	lr 0.02359
Train [19][990/3239]	Time 0.599 (0.893)	Data Time 0.001 (0.021)	Loss 3.5438 (3.4205)	Entropy 1.06593 (1.07344)	Top-1 acc 44.922 (42.645)	Top-5 acc 65.234 (66.896)	lr 0.02359
Train [19][1000/3239]	Time 0.555 (0.892)	Data Time 0.001 (0.020)	Loss 3.4660 (3.4210)	Entropy 1.06576 (1.07337)	Top-1 acc 40.625 (42.639)	Top-5 acc 65.625 (66.885)	lr 0.02359
Train [19][1010/3239]	Time 0.574 (0.891)	Data Time 0.001 (0.020)	Loss 3.3758 (3.4209)	Entropy 1.06578 (1.07329)	Top-1 acc 39.844 (42.630)	Top-5 acc 70.312 (66.891)	lr 0.02359
Train [19][1020/3239]	Time 0.629 (0.891)	Data Time 0.001 (0.020)	Loss 3.3295 (3.4211)	Entropy 1.06621 (1.07322)	Top-1 acc 44.141 (42.630)	Top-5 acc 67.969 (66.894)	lr 0.02359
Train [19][1030/3239]	Time 0.576 (0.890)	Data Time 0.001 (0.020)	Loss 3.4392 (3.4211)	Entropy 1.06603 (1.07315)	Top-1 acc 42.969 (42.631)	Top-5 acc 67.969 (66.898)	lr 0.02359
Train [19][1040/3239]	Time 0.604 (0.890)	Data Time 0.001 (0.020)	Loss 3.5986 (3.4209)	Entropy 1.06544 (1.07308)	Top-1 acc 40.234 (42.630)	Top-5 acc 60.938 (66.897)	lr 0.02359
Train [19][1050/3239]	Time 0.609 (0.890)	Data Time 0.001 (0.020)	Loss 3.3806 (3.4204)	Entropy 1.06583 (1.07301)	Top-1 acc 44.922 (42.636)	Top-5 acc 67.188 (66.906)	lr 0.02359
Train [19][1060/3239]	Time 0.564 (0.889)	Data Time 0.001 (0.019)	Loss 3.4435 (3.4197)	Entropy 1.06593 (1.07294)	Top-1 acc 35.547 (42.643)	Top-5 acc 67.188 (66.915)	lr 0.02359
Train [19][1070/3239]	Time 0.604 (0.889)	Data Time 0.001 (0.019)	Loss 3.3720 (3.4197)	Entropy 1.06576 (1.07287)	Top-1 acc 42.578 (42.654)	Top-5 acc 68.359 (66.917)	lr 0.02359
Train [19][1080/3239]	Time 0.607 (0.889)	Data Time 0.001 (0.019)	Loss 3.2239 (3.4200)	Entropy 1.06547 (1.07281)	Top-1 acc 43.750 (42.654)	Top-5 acc 71.875 (66.910)	lr 0.02359
Train [19][1090/3239]	Time 0.589 (0.888)	Data Time 0.001 (0.019)	Loss 3.3799 (3.4200)	Entropy 1.06524 (1.07274)	Top-1 acc 44.141 (42.661)	Top-5 acc 67.969 (66.913)	lr 0.02359
Train [19][1100/3239]	Time 0.580 (0.888)	Data Time 0.001 (0.019)	Loss 3.5466 (3.4205)	Entropy 1.06525 (1.07267)	Top-1 acc 39.062 (42.655)	Top-5 acc 63.281 (66.893)	lr 0.02359
Train [19][1110/3239]	Time 0.577 (0.888)	Data Time 0.001 (0.019)	Loss 3.3729 (3.4213)	Entropy 1.06531 (1.07260)	Top-1 acc 42.188 (42.639)	Top-5 acc 69.531 (66.875)	lr 0.02359
Train [19][1120/3239]	Time 0.577 (0.888)	Data Time 0.001 (0.018)	Loss 3.3929 (3.4215)	Entropy 1.06554 (1.07254)	Top-1 acc 42.969 (42.632)	Top-5 acc 63.672 (66.870)	lr 0.02359
Train [19][1130/3239]	Time 0.572 (0.887)	Data Time 0.001 (0.018)	Loss 3.3081 (3.4220)	Entropy 1.06542 (1.07248)	Top-1 acc 43.750 (42.623)	Top-5 acc 69.531 (66.864)	lr 0.02359
Train [19][1140/3239]	Time 0.662 (0.887)	Data Time 0.001 (0.018)	Loss 3.5245 (3.4224)	Entropy 1.06521 (1.07241)	Top-1 acc 41.016 (42.617)	Top-5 acc 62.500 (66.855)	lr 0.02358
Train [19][1150/3239]	Time 0.666 (0.887)	Data Time 0.002 (0.018)	Loss 3.4764 (3.4223)	Entropy 1.06491 (1.07235)	Top-1 acc 42.188 (42.621)	Top-5 acc 69.141 (66.851)	lr 0.02358
Train [19][1160/3239]	Time 0.572 (0.886)	Data Time 0.001 (0.018)	Loss 3.5822 (3.4222)	Entropy 1.06467 (1.07229)	Top-1 acc 42.188 (42.628)	Top-5 acc 65.234 (66.845)	lr 0.02358
Train [19][1170/3239]	Time 0.635 (0.886)	Data Time 0.002 (0.018)	Loss 3.4122 (3.4224)	Entropy 1.06399 (1.07222)	Top-1 acc 46.094 (42.629)	Top-5 acc 64.844 (66.846)	lr 0.02358
Train [19][1180/3239]	Time 0.561 (0.886)	Data Time 0.001 (0.018)	Loss 3.5349 (3.4225)	Entropy 1.06375 (1.07215)	Top-1 acc 44.531 (42.630)	Top-5 acc 64.844 (66.844)	lr 0.02358
Train [19][1190/3239]	Time 0.619 (0.885)	Data Time 0.001 (0.018)	Loss 3.5114 (3.4228)	Entropy 1.06317 (1.07208)	Top-1 acc 39.453 (42.629)	Top-5 acc 67.969 (66.843)	lr 0.02358
Train [19][1200/3239]	Time 0.587 (0.885)	Data Time 0.001 (0.017)	Loss 3.4439 (3.4229)	Entropy 1.06317 (1.07200)	Top-1 acc 41.406 (42.625)	Top-5 acc 66.406 (66.839)	lr 0.02358
Train [19][1210/3239]	Time 0.671 (0.885)	Data Time 0.001 (0.017)	Loss 3.2379 (3.4226)	Entropy 1.06292 (1.07193)	Top-1 acc 46.484 (42.627)	Top-5 acc 69.531 (66.842)	lr 0.02358
Train [19][1220/3239]	Time 0.575 (0.884)	Data Time 0.001 (0.017)	Loss 3.4188 (3.4228)	Entropy 1.06214 (1.07185)	Top-1 acc 46.875 (42.633)	Top-5 acc 65.625 (66.838)	lr 0.02358
Train [19][1230/3239]	Time 0.619 (0.884)	Data Time 0.001 (0.017)	Loss 3.4978 (3.4227)	Entropy 1.06212 (1.07177)	Top-1 acc 41.016 (42.640)	Top-5 acc 63.281 (66.839)	lr 0.02358
Train [19][1240/3239]	Time 0.603 (0.884)	Data Time 0.001 (0.017)	Loss 3.4219 (3.4225)	Entropy 1.06172 (1.07170)	Top-1 acc 41.016 (42.642)	Top-5 acc 67.578 (66.853)	lr 0.02358
Train [19][1250/3239]	Time 0.556 (0.884)	Data Time 0.001 (0.017)	Loss 3.4921 (3.4229)	Entropy 1.06185 (1.07162)	Top-1 acc 43.750 (42.633)	Top-5 acc 64.844 (66.846)	lr 0.02358
Train [19][1260/3239]	Time 0.640 (0.900)	Data Time 0.002 (0.017)	Loss 3.5857 (3.4230)	Entropy 1.06186 (1.07154)	Top-1 acc 37.500 (42.631)	Top-5 acc 64.453 (66.844)	lr 0.02358
Train [19][1270/3239]	Time 0.618 (0.900)	Data Time 0.002 (0.017)	Loss 3.4692 (3.4226)	Entropy 1.06200 (1.07146)	Top-1 acc 42.578 (42.638)	Top-5 acc 64.453 (66.850)	lr 0.02358
Train [19][1280/3239]	Time 0.590 (0.899)	Data Time 0.001 (0.016)	Loss 3.5406 (3.4232)	Entropy 1.06120 (1.07139)	Top-1 acc 39.844 (42.630)	Top-5 acc 68.359 (66.844)	lr 0.02358
Train [19][1290/3239]	Time 0.563 (0.899)	Data Time 0.001 (0.016)	Loss 3.5092 (3.4229)	Entropy 1.06098 (1.07131)	Top-1 acc 41.016 (42.635)	Top-5 acc 64.453 (66.848)	lr 0.02358
Train [19][1300/3239]	Time 0.716 (0.899)	Data Time 0.001 (0.016)	Loss 3.4390 (3.4226)	Entropy 1.06087 (1.07123)	Top-1 acc 42.578 (42.643)	Top-5 acc 66.797 (66.853)	lr 0.02358
Train [19][1310/3239]	Time 0.598 (0.898)	Data Time 0.003 (0.016)	Loss 3.2810 (3.4218)	Entropy 1.06091 (1.07115)	Top-1 acc 45.703 (42.661)	Top-5 acc 68.359 (66.867)	lr 0.02358
Train [19][1320/3239]	Time 0.473 (0.898)	Data Time 0.001 (0.016)	Loss 3.6397 (3.4221)	Entropy 1.06114 (1.07107)	Top-1 acc 39.062 (42.656)	Top-5 acc 60.156 (66.864)	lr 0.02358
Train [19][1330/3239]	Time 0.573 (0.897)	Data Time 0.001 (0.016)	Loss 3.5578 (3.4218)	Entropy 1.06105 (1.07100)	Top-1 acc 39.453 (42.661)	Top-5 acc 67.188 (66.876)	lr 0.02358
Train [19][1340/3239]	Time 0.588 (0.897)	Data Time 0.001 (0.016)	Loss 3.4937 (3.4221)	Entropy 1.06109 (1.07092)	Top-1 acc 41.016 (42.668)	Top-5 acc 66.797 (66.867)	lr 0.02358
Train [19][1350/3239]	Time 0.635 (0.897)	Data Time 0.001 (0.016)	Loss 3.2443 (3.4221)	Entropy 1.06045 (1.07085)	Top-1 acc 49.609 (42.676)	Top-5 acc 71.094 (66.866)	lr 0.02358
Train [19][1360/3239]	Time 0.602 (0.896)	Data Time 0.001 (0.016)	Loss 3.3046 (3.4220)	Entropy 1.06028 (1.07077)	Top-1 acc 43.359 (42.675)	Top-5 acc 69.141 (66.871)	lr 0.02357
Train [19][1370/3239]	Time 0.696 (0.896)	Data Time 0.001 (0.016)	Loss 3.5750 (3.4217)	Entropy 1.06066 (1.07069)	Top-1 acc 38.281 (42.683)	Top-5 acc 64.844 (66.870)	lr 0.02357
Train [19][1380/3239]	Time 0.600 (0.896)	Data Time 0.001 (0.015)	Loss 3.5113 (3.4222)	Entropy 1.06025 (1.07062)	Top-1 acc 41.797 (42.670)	Top-5 acc 63.672 (66.859)	lr 0.02357
Train [19][1390/3239]	Time 0.603 (0.896)	Data Time 0.001 (0.015)	Loss 3.3093 (3.4226)	Entropy 1.05984 (1.07055)	Top-1 acc 47.266 (42.664)	Top-5 acc 72.266 (66.855)	lr 0.02357
Train [19][1400/3239]	Time 0.608 (0.895)	Data Time 0.001 (0.015)	Loss 3.2558 (3.4225)	Entropy 1.05973 (1.07047)	Top-1 acc 45.703 (42.675)	Top-5 acc 71.094 (66.861)	lr 0.02357
Train [19][1410/3239]	Time 0.612 (0.895)	Data Time 0.001 (0.015)	Loss 3.6391 (3.4227)	Entropy 1.05963 (1.07039)	Top-1 acc 39.453 (42.671)	Top-5 acc 60.938 (66.857)	lr 0.02357
Train [19][1420/3239]	Time 0.593 (0.895)	Data Time 0.001 (0.015)	Loss 3.4962 (3.4226)	Entropy 1.05946 (1.07032)	Top-1 acc 42.188 (42.681)	Top-5 acc 64.453 (66.859)	lr 0.02357
Train [19][1430/3239]	Time 0.596 (0.895)	Data Time 0.001 (0.015)	Loss 3.6384 (3.4228)	Entropy 1.05934 (1.07024)	Top-1 acc 37.500 (42.674)	Top-5 acc 61.328 (66.851)	lr 0.02357
Train [19][1440/3239]	Time 0.603 (0.894)	Data Time 0.001 (0.015)	Loss 3.2121 (3.4231)	Entropy 1.05898 (1.07016)	Top-1 acc 50.391 (42.671)	Top-5 acc 70.703 (66.846)	lr 0.02357
Train [19][1450/3239]	Time 0.604 (0.894)	Data Time 0.001 (0.015)	Loss 3.2161 (3.4234)	Entropy 1.05900 (1.07009)	Top-1 acc 46.484 (42.663)	Top-5 acc 71.094 (66.841)	lr 0.02357
Train [19][1460/3239]	Time 0.607 (0.894)	Data Time 0.001 (0.015)	Loss 3.3193 (3.4231)	Entropy 1.05906 (1.07001)	Top-1 acc 46.484 (42.666)	Top-5 acc 66.406 (66.847)	lr 0.02357
Train [19][1470/3239]	Time 0.606 (0.893)	Data Time 0.001 (0.015)	Loss 3.3968 (3.4230)	Entropy 1.05919 (1.06994)	Top-1 acc 41.406 (42.659)	Top-5 acc 67.969 (66.847)	lr 0.02357
Train [19][1480/3239]	Time 0.604 (0.893)	Data Time 0.001 (0.014)	Loss 3.3696 (3.4230)	Entropy 1.05880 (1.06986)	Top-1 acc 42.188 (42.658)	Top-5 acc 70.703 (66.848)	lr 0.02357
Train [19][1490/3239]	Time 0.513 (0.893)	Data Time 0.001 (0.014)	Loss 3.6891 (3.4233)	Entropy 1.05894 (1.06979)	Top-1 acc 35.938 (42.655)	Top-5 acc 60.547 (66.839)	lr 0.02357
Train [19][1500/3239]	Time 0.614 (0.892)	Data Time 0.001 (0.014)	Loss 3.4136 (3.4229)	Entropy 1.05876 (1.06972)	Top-1 acc 42.969 (42.665)	Top-5 acc 66.406 (66.847)	lr 0.02357
Train [19][1510/3239]	Time 0.612 (0.892)	Data Time 0.001 (0.014)	Loss 3.4330 (3.4231)	Entropy 1.05835 (1.06964)	Top-1 acc 44.141 (42.661)	Top-5 acc 66.016 (66.841)	lr 0.02357
Train [19][1520/3239]	Time 0.577 (0.891)	Data Time 0.001 (0.014)	Loss 3.4061 (3.4229)	Entropy 1.05805 (1.06957)	Top-1 acc 41.406 (42.668)	Top-5 acc 66.016 (66.850)	lr 0.02357
Train [19][1530/3239]	Time 0.698 (0.891)	Data Time 0.001 (0.014)	Loss 3.4656 (3.4229)	Entropy 1.05811 (1.06949)	Top-1 acc 42.969 (42.663)	Top-5 acc 65.625 (66.851)	lr 0.02357
Train [19][1540/3239]	Time 0.590 (0.891)	Data Time 0.001 (0.014)	Loss 3.3925 (3.4229)	Entropy 1.05845 (1.06942)	Top-1 acc 46.875 (42.662)	Top-5 acc 67.188 (66.848)	lr 0.02357
Train [19][1550/3239]	Time 0.593 (0.891)	Data Time 0.002 (0.014)	Loss 3.5918 (3.4229)	Entropy 1.05811 (1.06935)	Top-1 acc 38.672 (42.665)	Top-5 acc 62.891 (66.845)	lr 0.02357
Train [19][1560/3239]	Time 0.599 (0.891)	Data Time 0.001 (0.014)	Loss 3.7176 (3.4231)	Entropy 1.05810 (1.06928)	Top-1 acc 37.891 (42.670)	Top-5 acc 59.766 (66.838)	lr 0.02357
Train [19][1570/3239]	Time 0.636 (0.890)	Data Time 0.001 (0.014)	Loss 3.1900 (3.4230)	Entropy 1.05789 (1.06920)	Top-1 acc 51.172 (42.676)	Top-5 acc 70.312 (66.835)	lr 0.02356
Train [19][1580/3239]	Time 0.591 (0.890)	Data Time 0.001 (0.014)	Loss 3.3928 (3.4231)	Entropy 1.05779 (1.06913)	Top-1 acc 41.016 (42.673)	Top-5 acc 65.625 (66.831)	lr 0.02356
Train [19][1590/3239]	Time 0.598 (0.890)	Data Time 0.003 (0.014)	Loss 3.5663 (3.4229)	Entropy 1.05807 (1.06906)	Top-1 acc 40.625 (42.672)	Top-5 acc 64.062 (66.833)	lr 0.02356
Train [19][1600/3239]	Time 0.714 (0.890)	Data Time 0.001 (0.014)	Loss 3.4775 (3.4227)	Entropy 1.05770 (1.06899)	Top-1 acc 39.062 (42.670)	Top-5 acc 61.719 (66.833)	lr 0.02356
Train [19][1610/3239]	Time 0.596 (0.890)	Data Time 0.001 (0.013)	Loss 3.4025 (3.4225)	Entropy 1.05775 (1.06892)	Top-1 acc 41.406 (42.677)	Top-5 acc 67.188 (66.831)	lr 0.02356
Train [19][1620/3239]	Time 0.545 (0.889)	Data Time 0.001 (0.013)	Loss 3.3038 (3.4225)	Entropy 1.05785 (1.06885)	Top-1 acc 43.750 (42.673)	Top-5 acc 72.266 (66.834)	lr 0.02356
Train [19][1630/3239]	Time 0.552 (0.889)	Data Time 0.001 (0.013)	Loss 3.4871 (3.4226)	Entropy 1.05770 (1.06879)	Top-1 acc 36.328 (42.662)	Top-5 acc 63.672 (66.828)	lr 0.02356
Train [19][1640/3239]	Time 0.457 (0.889)	Data Time 0.001 (0.013)	Loss 3.2590 (3.4225)	Entropy 1.05774 (1.06872)	Top-1 acc 48.828 (42.663)	Top-5 acc 72.656 (66.829)	lr 0.02356
Train [19][1650/3239]	Time 0.576 (0.888)	Data Time 0.001 (0.013)	Loss 3.5739 (3.4227)	Entropy 1.05817 (1.06865)	Top-1 acc 40.234 (42.660)	Top-5 acc 62.109 (66.817)	lr 0.02356
Train [19][1660/3239]	Time 0.572 (0.888)	Data Time 0.001 (0.013)	Loss 3.4811 (3.4226)	Entropy 1.05816 (1.06859)	Top-1 acc 44.922 (42.665)	Top-5 acc 64.453 (66.822)	lr 0.02356
Train [19][1670/3239]	Time 0.586 (0.888)	Data Time 0.001 (0.013)	Loss 3.3673 (3.4226)	Entropy 1.05830 (1.06853)	Top-1 acc 40.625 (42.670)	Top-5 acc 66.016 (66.822)	lr 0.02356
Train [19][1680/3239]	Time 0.597 (0.888)	Data Time 0.001 (0.013)	Loss 3.6282 (3.4228)	Entropy 1.05801 (1.06847)	Top-1 acc 38.672 (42.664)	Top-5 acc 63.672 (66.815)	lr 0.02356
Train [19][1690/3239]	Time 0.693 (0.887)	Data Time 0.001 (0.013)	Loss 3.4676 (3.4230)	Entropy 1.05766 (1.06840)	Top-1 acc 44.141 (42.664)	Top-5 acc 65.625 (66.812)	lr 0.02356
Train [19][1700/3239]	Time 0.586 (0.887)	Data Time 0.001 (0.013)	Loss 3.4275 (3.4230)	Entropy 1.05774 (1.06834)	Top-1 acc 41.797 (42.666)	Top-5 acc 64.062 (66.803)	lr 0.02356
Train [19][1710/3239]	Time 0.629 (0.887)	Data Time 0.001 (0.013)	Loss 3.4152 (3.4231)	Entropy 1.05789 (1.06828)	Top-1 acc 41.797 (42.666)	Top-5 acc 67.188 (66.803)	lr 0.02356
Train [19][1720/3239]	Time 0.613 (0.887)	Data Time 0.001 (0.013)	Loss 3.2583 (3.4232)	Entropy 1.05753 (1.06822)	Top-1 acc 43.750 (42.665)	Top-5 acc 69.531 (66.802)	lr 0.02356
Train [19][1730/3239]	Time 0.600 (0.887)	Data Time 0.001 (0.013)	Loss 3.3137 (3.4232)	Entropy 1.05722 (1.06816)	Top-1 acc 44.141 (42.661)	Top-5 acc 68.359 (66.798)	lr 0.02356
Train [19][1740/3239]	Time 0.626 (0.887)	Data Time 0.001 (0.013)	Loss 3.3940 (3.4232)	Entropy 1.05705 (1.06809)	Top-1 acc 40.234 (42.667)	Top-5 acc 66.797 (66.797)	lr 0.02356
Train [19][1750/3239]	Time 0.569 (0.886)	Data Time 0.001 (0.013)	Loss 3.2749 (3.4237)	Entropy 1.05661 (1.06803)	Top-1 acc 44.922 (42.656)	Top-5 acc 69.141 (66.786)	lr 0.02356
Train [19][1760/3239]	Time 0.720 (0.886)	Data Time 0.001 (0.012)	Loss 3.3475 (3.4240)	Entropy 1.05674 (1.06796)	Top-1 acc 44.922 (42.651)	Top-5 acc 66.016 (66.774)	lr 0.02356
Train [19][1770/3239]	Time 0.617 (0.886)	Data Time 0.001 (0.012)	Loss 3.2272 (3.4240)	Entropy 1.05617 (1.06790)	Top-1 acc 46.094 (42.660)	Top-5 acc 70.312 (66.776)	lr 0.02356
Train [19][1780/3239]	Time 0.577 (0.886)	Data Time 0.001 (0.012)	Loss 3.5110 (3.4240)	Entropy 1.05542 (1.06783)	Top-1 acc 40.625 (42.663)	Top-5 acc 63.672 (66.772)	lr 0.02355
Train [19][1790/3239]	Time 0.594 (0.886)	Data Time 0.001 (0.012)	Loss 3.2096 (3.4238)	Entropy 1.05493 (1.06776)	Top-1 acc 48.438 (42.668)	Top-5 acc 72.266 (66.777)	lr 0.02355
Train [19][1800/3239]	Time 0.622 (0.886)	Data Time 0.001 (0.012)	Loss 3.5329 (3.4237)	Entropy 1.05493 (1.06769)	Top-1 acc 40.625 (42.667)	Top-5 acc 64.062 (66.774)	lr 0.02355
Train [19][1810/3239]	Time 0.607 (0.885)	Data Time 0.001 (0.012)	Loss 3.3221 (3.4239)	Entropy 1.05454 (1.06762)	Top-1 acc 45.703 (42.664)	Top-5 acc 71.875 (66.771)	lr 0.02355
Train [19][1820/3239]	Time 0.604 (0.885)	Data Time 0.001 (0.012)	Loss 3.3728 (3.4235)	Entropy 1.05380 (1.06755)	Top-1 acc 43.359 (42.668)	Top-5 acc 70.703 (66.781)	lr 0.02355
Train [19][1830/3239]	Time 0.501 (0.885)	Data Time 0.001 (0.012)	Loss 3.2858 (3.4234)	Entropy 1.05404 (1.06747)	Top-1 acc 45.703 (42.671)	Top-5 acc 69.141 (66.783)	lr 0.02355
Train [19][1840/3239]	Time 0.560 (0.885)	Data Time 0.001 (0.012)	Loss 3.5898 (3.4233)	Entropy 1.05380 (1.06740)	Top-1 acc 41.016 (42.672)	Top-5 acc 63.672 (66.786)	lr 0.02355
Train [19][1850/3239]	Time 0.598 (0.884)	Data Time 0.001 (0.012)	Loss 3.3781 (3.4231)	Entropy 1.05377 (1.06732)	Top-1 acc 42.578 (42.676)	Top-5 acc 68.359 (66.795)	lr 0.02355
Train [19][1860/3239]	Time 0.610 (0.884)	Data Time 0.001 (0.012)	Loss 3.2729 (3.4230)	Entropy 1.05386 (1.06725)	Top-1 acc 44.922 (42.679)	Top-5 acc 72.266 (66.797)	lr 0.02355
Train [19][1870/3239]	Time 0.621 (0.884)	Data Time 0.002 (0.012)	Loss 3.5243 (3.4234)	Entropy 1.05422 (1.06718)	Top-1 acc 39.844 (42.664)	Top-5 acc 66.406 (66.785)	lr 0.02355
Train [19][1880/3239]	Time 0.581 (0.884)	Data Time 0.001 (0.012)	Loss 3.6012 (3.4237)	Entropy 1.05394 (1.06711)	Top-1 acc 35.938 (42.654)	Top-5 acc 64.453 (66.780)	lr 0.02355
Train [19][1890/3239]	Time 0.584 (0.883)	Data Time 0.001 (0.012)	Loss 3.5458 (3.4235)	Entropy 1.05367 (1.06704)	Top-1 acc 40.625 (42.661)	Top-5 acc 63.672 (66.783)	lr 0.02355
Train [19][1900/3239]	Time 0.623 (0.883)	Data Time 0.001 (0.012)	Loss 3.2082 (3.4233)	Entropy 1.05342 (1.06697)	Top-1 acc 48.438 (42.665)	Top-5 acc 66.406 (66.787)	lr 0.02355
Train [19][1910/3239]	Time 0.825 (0.894)	Data Time 0.042 (0.012)	Loss 3.4682 (3.4231)	Entropy 1.05299 (1.06690)	Top-1 acc 38.672 (42.667)	Top-5 acc 66.016 (66.788)	lr 0.02355
Train [19][1920/3239]	Time 0.648 (0.894)	Data Time 0.002 (0.012)	Loss 3.4040 (3.4234)	Entropy 1.05286 (1.06683)	Top-1 acc 43.750 (42.661)	Top-5 acc 69.531 (66.785)	lr 0.02355
Train [19][1930/3239]	Time 0.602 (0.893)	Data Time 0.001 (0.012)	Loss 3.4766 (3.4233)	Entropy 1.05265 (1.06675)	Top-1 acc 41.797 (42.660)	Top-5 acc 68.359 (66.787)	lr 0.02355
Train [19][1940/3239]	Time 0.593 (0.893)	Data Time 0.001 (0.012)	Loss 3.3837 (3.4233)	Entropy 1.05197 (1.06668)	Top-1 acc 42.578 (42.655)	Top-5 acc 66.797 (66.788)	lr 0.02355
Train [19][1950/3239]	Time 0.616 (0.893)	Data Time 0.001 (0.011)	Loss 3.3993 (3.4231)	Entropy 1.05207 (1.06660)	Top-1 acc 39.844 (42.653)	Top-5 acc 70.312 (66.790)	lr 0.02355
Train [19][1960/3239]	Time 0.513 (0.893)	Data Time 0.001 (0.011)	Loss 3.3596 (3.4227)	Entropy 1.05202 (1.06653)	Top-1 acc 45.703 (42.667)	Top-5 acc 69.531 (66.800)	lr 0.02355
Train [19][1970/3239]	Time 0.568 (0.892)	Data Time 0.001 (0.011)	Loss 3.4385 (3.4227)	Entropy 1.05163 (1.06646)	Top-1 acc 40.625 (42.669)	Top-5 acc 67.188 (66.805)	lr 0.02355
Train [19][1980/3239]	Time 0.600 (0.892)	Data Time 0.001 (0.011)	Loss 3.4588 (3.4229)	Entropy 1.05138 (1.06638)	Top-1 acc 41.406 (42.659)	Top-5 acc 69.141 (66.805)	lr 0.02355
Train [19][1990/3239]	Time 0.672 (0.892)	Data Time 0.001 (0.011)	Loss 3.4997 (3.4233)	Entropy 1.05152 (1.06631)	Top-1 acc 44.141 (42.654)	Top-5 acc 64.453 (66.798)	lr 0.02354
Train [19][2000/3239]	Time 0.620 (0.892)	Data Time 0.001 (0.011)	Loss 3.3064 (3.4230)	Entropy 1.05190 (1.06623)	Top-1 acc 45.703 (42.662)	Top-5 acc 70.312 (66.809)	lr 0.02354
Train [19][2010/3239]	Time 0.627 (0.891)	Data Time 0.002 (0.011)	Loss 3.4477 (3.4228)	Entropy 1.05171 (1.06616)	Top-1 acc 42.969 (42.669)	Top-5 acc 71.484 (66.818)	lr 0.02354
Train [19][2020/3239]	Time 0.578 (0.891)	Data Time 0.001 (0.011)	Loss 3.3139 (3.4229)	Entropy 1.05168 (1.06609)	Top-1 acc 46.484 (42.666)	Top-5 acc 65.625 (66.808)	lr 0.02354
Train [19][2030/3239]	Time 0.573 (0.891)	Data Time 0.001 (0.011)	Loss 3.5098 (3.4228)	Entropy 1.05177 (1.06602)	Top-1 acc 37.109 (42.669)	Top-5 acc 61.328 (66.809)	lr 0.02354
Train [19][2040/3239]	Time 0.567 (0.891)	Data Time 0.001 (0.011)	Loss 3.3373 (3.4228)	Entropy 1.05173 (1.06595)	Top-1 acc 46.094 (42.670)	Top-5 acc 67.969 (66.810)	lr 0.02354
Train [19][2050/3239]	Time 0.593 (0.891)	Data Time 0.001 (0.011)	Loss 3.2427 (3.4228)	Entropy 1.05139 (1.06588)	Top-1 acc 46.875 (42.674)	Top-5 acc 71.484 (66.814)	lr 0.02354
Train [19][2060/3239]	Time 0.578 (0.891)	Data Time 0.001 (0.011)	Loss 3.3711 (3.4228)	Entropy 1.05098 (1.06581)	Top-1 acc 42.578 (42.675)	Top-5 acc 67.969 (66.811)	lr 0.02354
Train [19][2070/3239]	Time 0.628 (0.891)	Data Time 0.001 (0.011)	Loss 3.3228 (3.4226)	Entropy 1.05093 (1.06574)	Top-1 acc 42.969 (42.677)	Top-5 acc 67.578 (66.815)	lr 0.02354
Train [19][2080/3239]	Time 0.712 (0.890)	Data Time 0.001 (0.011)	Loss 3.5198 (3.4224)	Entropy 1.05118 (1.06566)	Top-1 acc 43.359 (42.677)	Top-5 acc 66.406 (66.820)	lr 0.02354
Train [19][2090/3239]	Time 0.546 (0.890)	Data Time 0.001 (0.011)	Loss 3.2700 (3.4220)	Entropy 1.05095 (1.06559)	Top-1 acc 48.047 (42.687)	Top-5 acc 69.922 (66.828)	lr 0.02354
Train [19][2100/3239]	Time 0.602 (0.890)	Data Time 0.001 (0.011)	Loss 3.5750 (3.4222)	Entropy 1.05061 (1.06552)	Top-1 acc 39.844 (42.682)	Top-5 acc 64.062 (66.824)	lr 0.02354
Train [19][2110/3239]	Time 0.577 (0.890)	Data Time 0.001 (0.011)	Loss 3.5340 (3.4222)	Entropy 1.05051 (1.06545)	Top-1 acc 42.188 (42.685)	Top-5 acc 66.016 (66.824)	lr 0.02354
Train [19][2120/3239]	Time 0.562 (0.890)	Data Time 0.001 (0.011)	Loss 3.4508 (3.4223)	Entropy 1.05042 (1.06538)	Top-1 acc 41.016 (42.680)	Top-5 acc 67.188 (66.824)	lr 0.02354
Train [19][2130/3239]	Time 0.597 (0.890)	Data Time 0.001 (0.011)	Loss 3.4332 (3.4223)	Entropy 1.05029 (1.06531)	Top-1 acc 42.969 (42.681)	Top-5 acc 67.578 (66.824)	lr 0.02354
Train [19][2140/3239]	Time 0.579 (0.889)	Data Time 0.001 (0.011)	Loss 3.4894 (3.4222)	Entropy 1.04984 (1.06524)	Top-1 acc 43.750 (42.681)	Top-5 acc 63.672 (66.826)	lr 0.02354
Train [19][2150/3239]	Time 0.715 (0.889)	Data Time 0.001 (0.011)	Loss 3.3539 (3.4224)	Entropy 1.04977 (1.06517)	Top-1 acc 43.750 (42.677)	Top-5 acc 68.359 (66.822)	lr 0.02354
Train [19][2160/3239]	Time 0.635 (0.889)	Data Time 0.001 (0.011)	Loss 3.3631 (3.4225)	Entropy 1.04968 (1.06510)	Top-1 acc 43.359 (42.674)	Top-5 acc 64.844 (66.818)	lr 0.02354
Train [19][2170/3239]	Time 0.608 (0.889)	Data Time 0.001 (0.011)	Loss 3.3439 (3.4221)	Entropy 1.04927 (1.06503)	Top-1 acc 43.750 (42.683)	Top-5 acc 71.094 (66.827)	lr 0.02354
Train [19][2180/3239]	Time 0.571 (0.888)	Data Time 0.001 (0.010)	Loss 3.2420 (3.4224)	Entropy 1.04922 (1.06495)	Top-1 acc 46.875 (42.681)	Top-5 acc 71.875 (66.821)	lr 0.02354
Train [19][2190/3239]	Time 0.642 (0.888)	Data Time 0.001 (0.010)	Loss 3.4827 (3.4223)	Entropy 1.04969 (1.06488)	Top-1 acc 39.453 (42.680)	Top-5 acc 64.453 (66.821)	lr 0.02354
Train [19][2200/3239]	Time 0.611 (0.888)	Data Time 0.001 (0.010)	Loss 3.3494 (3.4224)	Entropy 1.04967 (1.06481)	Top-1 acc 46.094 (42.679)	Top-5 acc 70.312 (66.822)	lr 0.02353
Train [19][2210/3239]	Time 0.616 (0.888)	Data Time 0.001 (0.010)	Loss 3.6275 (3.4224)	Entropy 1.04984 (1.06474)	Top-1 acc 36.328 (42.678)	Top-5 acc 62.500 (66.820)	lr 0.02353
Train [19][2220/3239]	Time 0.627 (0.888)	Data Time 0.003 (0.010)	Loss 3.3780 (3.4225)	Entropy 1.04991 (1.06468)	Top-1 acc 44.141 (42.681)	Top-5 acc 67.188 (66.818)	lr 0.02353
Train [19][2230/3239]	Time 0.650 (0.888)	Data Time 0.001 (0.010)	Loss 3.2953 (3.4224)	Entropy 1.04956 (1.06461)	Top-1 acc 44.922 (42.682)	Top-5 acc 69.141 (66.820)	lr 0.02353
Train [19][2240/3239]	Time 0.673 (0.888)	Data Time 0.001 (0.010)	Loss 3.5011 (3.4222)	Entropy 1.04993 (1.06454)	Top-1 acc 40.234 (42.687)	Top-5 acc 64.844 (66.827)	lr 0.02353
Train [19][2250/3239]	Time 0.615 (0.888)	Data Time 0.001 (0.010)	Loss 3.4756 (3.4217)	Entropy 1.04996 (1.06448)	Top-1 acc 41.797 (42.695)	Top-5 acc 66.016 (66.834)	lr 0.02353
Train [19][2260/3239]	Time 0.632 (0.888)	Data Time 0.001 (0.010)	Loss 3.3419 (3.4214)	Entropy 1.04987 (1.06442)	Top-1 acc 44.922 (42.702)	Top-5 acc 70.312 (66.837)	lr 0.02353
Train [19][2270/3239]	Time 0.602 (0.887)	Data Time 0.001 (0.010)	Loss 3.6847 (3.4215)	Entropy 1.05003 (1.06435)	Top-1 acc 37.109 (42.700)	Top-5 acc 62.891 (66.835)	lr 0.02353
Train [19][2280/3239]	Time 0.584 (0.887)	Data Time 0.001 (0.010)	Loss 3.2582 (3.4216)	Entropy 1.04981 (1.06429)	Top-1 acc 46.484 (42.698)	Top-5 acc 72.656 (66.833)	lr 0.02353
Train [19][2290/3239]	Time 0.629 (0.887)	Data Time 0.001 (0.010)	Loss 3.4209 (3.4220)	Entropy 1.04986 (1.06423)	Top-1 acc 43.359 (42.687)	Top-5 acc 68.359 (66.826)	lr 0.02353
Train [19][2300/3239]	Time 0.605 (0.887)	Data Time 0.001 (0.010)	Loss 3.3599 (3.4222)	Entropy 1.04966 (1.06416)	Top-1 acc 44.922 (42.683)	Top-5 acc 70.312 (66.823)	lr 0.02353
Train [19][2310/3239]	Time 0.695 (0.887)	Data Time 0.001 (0.010)	Loss 3.3099 (3.4225)	Entropy 1.04941 (1.06410)	Top-1 acc 48.047 (42.680)	Top-5 acc 68.750 (66.816)	lr 0.02353
Train [19][2320/3239]	Time 0.552 (0.886)	Data Time 0.001 (0.010)	Loss 3.4351 (3.4223)	Entropy 1.04925 (1.06404)	Top-1 acc 45.703 (42.682)	Top-5 acc 66.797 (66.817)	lr 0.02353
Train [19][2330/3239]	Time 0.573 (0.886)	Data Time 0.001 (0.010)	Loss 3.5370 (3.4224)	Entropy 1.04919 (1.06397)	Top-1 acc 42.188 (42.678)	Top-5 acc 63.281 (66.817)	lr 0.02353
Train [19][2340/3239]	Time 0.602 (0.886)	Data Time 0.001 (0.010)	Loss 3.1848 (3.4223)	Entropy 1.04894 (1.06391)	Top-1 acc 50.000 (42.679)	Top-5 acc 69.531 (66.816)	lr 0.02353
Train [19][2350/3239]	Time 0.591 (0.886)	Data Time 0.001 (0.010)	Loss 3.2394 (3.4221)	Entropy 1.04776 (1.06384)	Top-1 acc 44.141 (42.680)	Top-5 acc 71.875 (66.818)	lr 0.02353
Train [19][2360/3239]	Time 0.647 (0.886)	Data Time 0.001 (0.010)	Loss 3.3309 (3.4220)	Entropy 1.04788 (1.06378)	Top-1 acc 42.188 (42.679)	Top-5 acc 70.312 (66.822)	lr 0.02353
Train [19][2370/3239]	Time 0.574 (0.886)	Data Time 0.001 (0.010)	Loss 3.5524 (3.4221)	Entropy 1.04787 (1.06371)	Top-1 acc 36.719 (42.673)	Top-5 acc 60.156 (66.818)	lr 0.02353
Train [19][2380/3239]	Time 0.582 (0.885)	Data Time 0.001 (0.010)	Loss 3.3724 (3.4221)	Entropy 1.04792 (1.06364)	Top-1 acc 46.484 (42.676)	Top-5 acc 67.969 (66.814)	lr 0.02353
Train [19][2390/3239]	Time 0.635 (0.885)	Data Time 0.001 (0.010)	Loss 3.5559 (3.4219)	Entropy 1.04754 (1.06358)	Top-1 acc 42.578 (42.684)	Top-5 acc 62.891 (66.817)	lr 0.02353
Train [19][2400/3239]	Time 0.577 (0.885)	Data Time 0.001 (0.010)	Loss 3.4796 (3.4215)	Entropy 1.04760 (1.06351)	Top-1 acc 43.750 (42.692)	Top-5 acc 65.234 (66.825)	lr 0.02353
Train [19][2410/3239]	Time 0.546 (0.885)	Data Time 0.001 (0.010)	Loss 3.4101 (3.4211)	Entropy 1.04762 (1.06344)	Top-1 acc 43.359 (42.704)	Top-5 acc 69.531 (66.836)	lr 0.02352
Train [19][2420/3239]	Time 0.617 (0.885)	Data Time 0.001 (0.010)	Loss 3.4650 (3.4212)	Entropy 1.04774 (1.06338)	Top-1 acc 41.797 (42.699)	Top-5 acc 65.234 (66.837)	lr 0.02352
Train [19][2430/3239]	Time 0.585 (0.885)	Data Time 0.001 (0.010)	Loss 3.3264 (3.4211)	Entropy 1.04790 (1.06332)	Top-1 acc 42.969 (42.701)	Top-5 acc 69.531 (66.840)	lr 0.02352
Train [19][2440/3239]	Time 0.634 (0.885)	Data Time 0.001 (0.010)	Loss 3.4314 (3.4210)	Entropy 1.04781 (1.06325)	Top-1 acc 42.578 (42.705)	Top-5 acc 67.188 (66.843)	lr 0.02352
Train [19][2450/3239]	Time 0.595 (0.885)	Data Time 0.002 (0.010)	Loss 3.3890 (3.4212)	Entropy 1.04798 (1.06319)	Top-1 acc 41.016 (42.693)	Top-5 acc 66.406 (66.838)	lr 0.02352
Train [19][2460/3239]	Time 0.644 (0.884)	Data Time 0.001 (0.009)	Loss 3.4074 (3.4213)	Entropy 1.04822 (1.06313)	Top-1 acc 41.406 (42.693)	Top-5 acc 69.531 (66.840)	lr 0.02352
Train [19][2470/3239]	Time 0.716 (0.884)	Data Time 0.001 (0.009)	Loss 3.4287 (3.4213)	Entropy 1.04797 (1.06307)	Top-1 acc 39.844 (42.694)	Top-5 acc 63.672 (66.837)	lr 0.02352
Train [19][2480/3239]	Time 0.568 (0.884)	Data Time 0.002 (0.009)	Loss 3.1625 (3.4211)	Entropy 1.04806 (1.06301)	Top-1 acc 46.484 (42.698)	Top-5 acc 73.047 (66.844)	lr 0.02352
Train [19][2490/3239]	Time 0.551 (0.884)	Data Time 0.001 (0.009)	Loss 3.3294 (3.4210)	Entropy 1.04823 (1.06295)	Top-1 acc 42.188 (42.699)	Top-5 acc 65.234 (66.844)	lr 0.02352
Train [19][2500/3239]	Time 0.552 (0.884)	Data Time 0.001 (0.009)	Loss 3.5219 (3.4210)	Entropy 1.04840 (1.06289)	Top-1 acc 42.188 (42.699)	Top-5 acc 62.891 (66.847)	lr 0.02352
Train [19][2510/3239]	Time 0.627 (0.884)	Data Time 0.001 (0.009)	Loss 3.1178 (3.4209)	Entropy 1.04847 (1.06283)	Top-1 acc 51.562 (42.700)	Top-5 acc 75.000 (66.848)	lr 0.02352
Train [19][2520/3239]	Time 0.599 (0.883)	Data Time 0.001 (0.009)	Loss 3.3573 (3.4210)	Entropy 1.04794 (1.06277)	Top-1 acc 46.875 (42.699)	Top-5 acc 66.016 (66.847)	lr 0.02352
Train [19][2530/3239]	Time 0.618 (0.883)	Data Time 0.001 (0.009)	Loss 3.3707 (3.4208)	Entropy 1.04768 (1.06271)	Top-1 acc 44.141 (42.705)	Top-5 acc 67.578 (66.851)	lr 0.02352
Train [19][2540/3239]	Time 0.689 (0.883)	Data Time 0.001 (0.009)	Loss 3.7216 (3.4209)	Entropy 1.04713 (1.06265)	Top-1 acc 32.812 (42.702)	Top-5 acc 61.719 (66.848)	lr 0.02352
Train [19][2550/3239]	Time 0.600 (0.883)	Data Time 0.001 (0.009)	Loss 3.4089 (3.4210)	Entropy 1.04720 (1.06259)	Top-1 acc 44.531 (42.700)	Top-5 acc 64.453 (66.847)	lr 0.02352
Train [19][2560/3239]	Time 0.577 (0.883)	Data Time 0.001 (0.009)	Loss 3.6753 (3.4210)	Entropy 1.04715 (1.06253)	Top-1 acc 40.234 (42.703)	Top-5 acc 60.156 (66.849)	lr 0.02352
Train [19][2570/3239]	Time 0.615 (0.892)	Data Time 0.002 (0.009)	Loss 3.2812 (3.4213)	Entropy 1.04710 (1.06247)	Top-1 acc 46.094 (42.697)	Top-5 acc 71.484 (66.847)	lr 0.02352
Train [19][2580/3239]	Time 0.617 (0.891)	Data Time 0.002 (0.009)	Loss 3.2866 (3.4214)	Entropy 1.04651 (1.06241)	Top-1 acc 46.484 (42.696)	Top-5 acc 71.094 (66.845)	lr 0.02352
Train [19][2590/3239]	Time 0.571 (0.891)	Data Time 0.001 (0.009)	Loss 3.4731 (3.4213)	Entropy 1.04630 (1.06235)	Top-1 acc 39.062 (42.695)	Top-5 acc 67.188 (66.851)	lr 0.02352
Train [19][2600/3239]	Time 0.584 (0.891)	Data Time 0.001 (0.009)	Loss 3.3962 (3.4212)	Entropy 1.04599 (1.06229)	Top-1 acc 46.094 (42.698)	Top-5 acc 65.234 (66.851)	lr 0.02352
Train [19][2610/3239]	Time 0.563 (0.891)	Data Time 0.002 (0.009)	Loss 3.3553 (3.4212)	Entropy 1.04557 (1.06223)	Top-1 acc 44.531 (42.692)	Top-5 acc 64.453 (66.849)	lr 0.02352
Train [19][2620/3239]	Time 0.566 (0.891)	Data Time 0.001 (0.009)	Loss 3.1495 (3.4211)	Entropy 1.04547 (1.06216)	Top-1 acc 49.609 (42.699)	Top-5 acc 72.656 (66.853)	lr 0.02351
Train [19][2630/3239]	Time 0.699 (0.890)	Data Time 0.001 (0.009)	Loss 3.4936 (3.4212)	Entropy 1.04571 (1.06210)	Top-1 acc 42.188 (42.701)	Top-5 acc 67.969 (66.855)	lr 0.02351
Train [19][2640/3239]	Time 0.607 (0.890)	Data Time 0.001 (0.009)	Loss 3.4132 (3.4211)	Entropy 1.04544 (1.06204)	Top-1 acc 42.969 (42.704)	Top-5 acc 68.750 (66.858)	lr 0.02351
Train [19][2650/3239]	Time 0.630 (0.890)	Data Time 0.001 (0.009)	Loss 3.1832 (3.4211)	Entropy 1.04542 (1.06197)	Top-1 acc 44.531 (42.702)	Top-5 acc 70.312 (66.857)	lr 0.02351
Train [19][2660/3239]	Time 0.592 (0.890)	Data Time 0.001 (0.009)	Loss 3.5206 (3.4211)	Entropy 1.04518 (1.06191)	Top-1 acc 41.406 (42.702)	Top-5 acc 67.969 (66.853)	lr 0.02351
Train [19][2670/3239]	Time 0.599 (0.890)	Data Time 0.001 (0.009)	Loss 3.2817 (3.4210)	Entropy 1.04507 (1.06185)	Top-1 acc 45.312 (42.704)	Top-5 acc 67.969 (66.853)	lr 0.02351
Train [19][2680/3239]	Time 0.576 (0.890)	Data Time 0.001 (0.009)	Loss 3.3965 (3.4211)	Entropy 1.04467 (1.06179)	Top-1 acc 39.453 (42.703)	Top-5 acc 68.359 (66.855)	lr 0.02351
Train [19][2690/3239]	Time 0.603 (0.890)	Data Time 0.001 (0.009)	Loss 3.3810 (3.4211)	Entropy 1.04434 (1.06172)	Top-1 acc 44.531 (42.703)	Top-5 acc 69.922 (66.851)	lr 0.02351
Train [19][2700/3239]	Time 0.701 (0.890)	Data Time 0.002 (0.009)	Loss 3.5423 (3.4211)	Entropy 1.04408 (1.06166)	Top-1 acc 40.625 (42.699)	Top-5 acc 62.500 (66.849)	lr 0.02351
Train [19][2710/3239]	Time 0.595 (0.890)	Data Time 0.001 (0.009)	Loss 3.2018 (3.4210)	Entropy 1.04421 (1.06159)	Top-1 acc 47.266 (42.701)	Top-5 acc 69.141 (66.851)	lr 0.02351
Train [19][2720/3239]	Time 0.615 (0.889)	Data Time 0.002 (0.009)	Loss 3.4398 (3.4211)	Entropy 1.04426 (1.06153)	Top-1 acc 42.969 (42.697)	Top-5 acc 69.531 (66.850)	lr 0.02351
Train [19][2730/3239]	Time 0.618 (0.889)	Data Time 0.001 (0.009)	Loss 3.3951 (3.4212)	Entropy 1.04400 (1.06146)	Top-1 acc 41.797 (42.696)	Top-5 acc 67.578 (66.851)	lr 0.02351
Train [19][2740/3239]	Time 0.600 (0.889)	Data Time 0.001 (0.009)	Loss 3.3001 (3.4210)	Entropy 1.04364 (1.06140)	Top-1 acc 42.578 (42.700)	Top-5 acc 69.141 (66.855)	lr 0.02351
Train [19][2750/3239]	Time 0.595 (0.889)	Data Time 0.001 (0.009)	Loss 3.4196 (3.4210)	Entropy 1.04365 (1.06134)	Top-1 acc 44.141 (42.698)	Top-5 acc 66.016 (66.855)	lr 0.02351
Train [19][2760/3239]	Time 0.603 (0.889)	Data Time 0.001 (0.009)	Loss 3.2993 (3.4209)	Entropy 1.04382 (1.06127)	Top-1 acc 46.094 (42.703)	Top-5 acc 69.531 (66.858)	lr 0.02351
Train [19][2770/3239]	Time 0.693 (0.889)	Data Time 0.001 (0.009)	Loss 3.3808 (3.4209)	Entropy 1.04365 (1.06121)	Top-1 acc 41.797 (42.704)	Top-5 acc 67.188 (66.858)	lr 0.02351
Train [19][2780/3239]	Time 0.589 (0.889)	Data Time 0.001 (0.009)	Loss 3.2777 (3.4211)	Entropy 1.04367 (1.06114)	Top-1 acc 46.875 (42.701)	Top-5 acc 71.094 (66.860)	lr 0.02351
Train [19][2790/3239]	Time 0.570 (0.889)	Data Time 0.001 (0.009)	Loss 3.2312 (3.4210)	Entropy 1.04405 (1.06108)	Top-1 acc 45.312 (42.701)	Top-5 acc 68.750 (66.861)	lr 0.02351
Train [19][2800/3239]	Time 0.597 (0.888)	Data Time 0.001 (0.009)	Loss 3.4800 (3.4212)	Entropy 1.04465 (1.06102)	Top-1 acc 43.750 (42.696)	Top-5 acc 62.891 (66.853)	lr 0.02351
Train [19][2810/3239]	Time 0.592 (0.888)	Data Time 0.001 (0.009)	Loss 3.6260 (3.4212)	Entropy 1.04446 (1.06096)	Top-1 acc 41.016 (42.695)	Top-5 acc 66.797 (66.856)	lr 0.02351
Train [19][2820/3239]	Time 0.625 (0.888)	Data Time 0.001 (0.009)	Loss 3.3605 (3.4211)	Entropy 1.04459 (1.06091)	Top-1 acc 41.406 (42.696)	Top-5 acc 69.531 (66.861)	lr 0.02351
Train [19][2830/3239]	Time 0.570 (0.888)	Data Time 0.001 (0.009)	Loss 3.6102 (3.4209)	Entropy 1.04469 (1.06085)	Top-1 acc 41.016 (42.704)	Top-5 acc 66.797 (66.866)	lr 0.02350
Train [19][2840/3239]	Time 0.561 (0.888)	Data Time 0.001 (0.008)	Loss 3.3513 (3.4208)	Entropy 1.04450 (1.06079)	Top-1 acc 44.922 (42.705)	Top-5 acc 69.141 (66.866)	lr 0.02350
Train [19][2850/3239]	Time 0.621 (0.888)	Data Time 0.001 (0.008)	Loss 3.4794 (3.4207)	Entropy 1.04459 (1.06074)	Top-1 acc 38.672 (42.708)	Top-5 acc 67.969 (66.866)	lr 0.02350
Train [19][2860/3239]	Time 0.709 (0.888)	Data Time 0.001 (0.008)	Loss 3.2902 (3.4206)	Entropy 1.04489 (1.06068)	Top-1 acc 46.875 (42.715)	Top-5 acc 69.922 (66.868)	lr 0.02350
Train [19][2870/3239]	Time 0.629 (0.887)	Data Time 0.001 (0.008)	Loss 3.3221 (3.4205)	Entropy 1.04480 (1.06062)	Top-1 acc 46.094 (42.719)	Top-5 acc 66.016 (66.869)	lr 0.02350
Train [19][2880/3239]	Time 0.584 (0.887)	Data Time 0.001 (0.008)	Loss 3.5218 (3.4207)	Entropy 1.04491 (1.06057)	Top-1 acc 38.281 (42.721)	Top-5 acc 65.625 (66.864)	lr 0.02350
Train [19][2890/3239]	Time 0.571 (0.887)	Data Time 0.001 (0.008)	Loss 3.4902 (3.4205)	Entropy 1.04502 (1.06052)	Top-1 acc 41.406 (42.722)	Top-5 acc 62.891 (66.864)	lr 0.02350
Train [19][2900/3239]	Time 0.584 (0.887)	Data Time 0.001 (0.008)	Loss 3.2096 (3.4204)	Entropy 1.04506 (1.06046)	Top-1 acc 43.750 (42.722)	Top-5 acc 71.875 (66.869)	lr 0.02350
Train [19][2910/3239]	Time 0.611 (0.887)	Data Time 0.001 (0.008)	Loss 3.5578 (3.4205)	Entropy 1.04493 (1.06041)	Top-1 acc 41.016 (42.722)	Top-5 acc 66.406 (66.866)	lr 0.02350
Train [19][2920/3239]	Time 0.617 (0.887)	Data Time 0.001 (0.008)	Loss 3.2643 (3.4205)	Entropy 1.04514 (1.06036)	Top-1 acc 44.922 (42.722)	Top-5 acc 72.266 (66.868)	lr 0.02350
Train [19][2930/3239]	Time 0.653 (0.887)	Data Time 0.001 (0.008)	Loss 3.6665 (3.4203)	Entropy 1.04471 (1.06030)	Top-1 acc 38.281 (42.725)	Top-5 acc 62.109 (66.871)	lr 0.02350
Train [19][2940/3239]	Time 0.570 (0.887)	Data Time 0.001 (0.008)	Loss 3.5436 (3.4203)	Entropy 1.04456 (1.06025)	Top-1 acc 37.891 (42.720)	Top-5 acc 64.844 (66.869)	lr 0.02350
Train [19][2950/3239]	Time 0.629 (0.887)	Data Time 0.001 (0.008)	Loss 3.4205 (3.4204)	Entropy 1.04468 (1.06020)	Top-1 acc 43.750 (42.718)	Top-5 acc 65.625 (66.865)	lr 0.02350
Train [19][2960/3239]	Time 0.562 (0.886)	Data Time 0.001 (0.008)	Loss 3.4276 (3.4205)	Entropy 1.04496 (1.06015)	Top-1 acc 42.188 (42.717)	Top-5 acc 66.016 (66.864)	lr 0.02350
Train [19][2970/3239]	Time 0.480 (0.886)	Data Time 0.001 (0.008)	Loss 3.5444 (3.4205)	Entropy 1.04517 (1.06009)	Top-1 acc 40.625 (42.720)	Top-5 acc 62.891 (66.865)	lr 0.02350
Train [19][2980/3239]	Time 0.601 (0.886)	Data Time 0.001 (0.008)	Loss 3.3785 (3.4205)	Entropy 1.04502 (1.06004)	Top-1 acc 40.625 (42.718)	Top-5 acc 68.750 (66.867)	lr 0.02350
Train [19][2990/3239]	Time 0.599 (0.886)	Data Time 0.001 (0.008)	Loss 3.3902 (3.4205)	Entropy 1.04516 (1.05999)	Top-1 acc 41.016 (42.715)	Top-5 acc 64.844 (66.865)	lr 0.02350
Train [19][3000/3239]	Time 0.607 (0.886)	Data Time 0.001 (0.008)	Loss 3.4672 (3.4206)	Entropy 1.04530 (1.05994)	Top-1 acc 42.578 (42.711)	Top-5 acc 66.797 (66.859)	lr 0.02350
Train [19][3010/3239]	Time 0.589 (0.886)	Data Time 0.001 (0.008)	Loss 3.3987 (3.4205)	Entropy 1.04489 (1.05990)	Top-1 acc 44.141 (42.712)	Top-5 acc 64.844 (66.863)	lr 0.02350
Train [19][3020/3239]	Time 0.600 (0.886)	Data Time 0.001 (0.008)	Loss 3.3956 (3.4205)	Entropy 1.04457 (1.05985)	Top-1 acc 44.531 (42.718)	Top-5 acc 67.188 (66.860)	lr 0.02350
Train [19][3030/3239]	Time 0.583 (0.885)	Data Time 0.001 (0.008)	Loss 3.6325 (3.4206)	Entropy 1.04445 (1.05980)	Top-1 acc 42.188 (42.714)	Top-5 acc 62.891 (66.855)	lr 0.02350
Train [19][3040/3239]	Time 0.615 (0.885)	Data Time 0.001 (0.008)	Loss 3.4624 (3.4205)	Entropy 1.04350 (1.05974)	Top-1 acc 43.750 (42.717)	Top-5 acc 67.188 (66.857)	lr 0.02349
Train [19][3050/3239]	Time 0.613 (0.885)	Data Time 0.001 (0.008)	Loss 3.5225 (3.4208)	Entropy 1.04285 (1.05969)	Top-1 acc 42.188 (42.710)	Top-5 acc 62.891 (66.849)	lr 0.02349
Train [19][3060/3239]	Time 0.612 (0.885)	Data Time 0.002 (0.008)	Loss 3.5081 (3.4209)	Entropy 1.04264 (1.05963)	Top-1 acc 41.797 (42.710)	Top-5 acc 63.672 (66.848)	lr 0.02349
Train [19][3070/3239]	Time 0.600 (0.885)	Data Time 0.001 (0.008)	Loss 3.3748 (3.4206)	Entropy 1.04298 (1.05958)	Top-1 acc 43.359 (42.718)	Top-5 acc 66.016 (66.853)	lr 0.02349
Train [19][3080/3239]	Time 0.610 (0.885)	Data Time 0.001 (0.008)	Loss 3.4984 (3.4205)	Entropy 1.04332 (1.05953)	Top-1 acc 42.578 (42.720)	Top-5 acc 62.500 (66.854)	lr 0.02349
Train [19][3090/3239]	Time 0.677 (0.885)	Data Time 0.002 (0.008)	Loss 3.5141 (3.4207)	Entropy 1.04314 (1.05947)	Top-1 acc 40.625 (42.716)	Top-5 acc 65.234 (66.851)	lr 0.02349
Train [19][3100/3239]	Time 0.621 (0.885)	Data Time 0.001 (0.008)	Loss 3.4985 (3.4209)	Entropy 1.04295 (1.05942)	Top-1 acc 44.922 (42.713)	Top-5 acc 61.328 (66.844)	lr 0.02349
Train [19][3110/3239]	Time 0.597 (0.885)	Data Time 0.001 (0.008)	Loss 3.2591 (3.4209)	Entropy 1.04275 (1.05937)	Top-1 acc 46.094 (42.714)	Top-5 acc 67.188 (66.841)	lr 0.02349
Train [19][3120/3239]	Time 0.626 (0.884)	Data Time 0.001 (0.008)	Loss 3.4233 (3.4209)	Entropy 1.04259 (1.05931)	Top-1 acc 39.062 (42.716)	Top-5 acc 69.531 (66.842)	lr 0.02349
Train [19][3130/3239]	Time 0.498 (0.884)	Data Time 0.001 (0.008)	Loss 3.2431 (3.4208)	Entropy 1.04198 (1.05926)	Top-1 acc 47.656 (42.718)	Top-5 acc 66.797 (66.841)	lr 0.02349
Train [19][3140/3239]	Time 0.606 (0.884)	Data Time 0.001 (0.008)	Loss 3.1429 (3.4205)	Entropy 1.04221 (1.05920)	Top-1 acc 49.219 (42.725)	Top-5 acc 70.703 (66.846)	lr 0.02349
Train [19][3150/3239]	Time 0.589 (0.884)	Data Time 0.001 (0.008)	Loss 3.4661 (3.4205)	Entropy 1.04232 (1.05915)	Top-1 acc 43.359 (42.722)	Top-5 acc 66.016 (66.847)	lr 0.02349
Train [19][3160/3239]	Time 0.680 (0.884)	Data Time 0.001 (0.008)	Loss 3.2595 (3.4206)	Entropy 1.04194 (1.05910)	Top-1 acc 46.875 (42.721)	Top-5 acc 72.266 (66.845)	lr 0.02349
Train [19][3170/3239]	Time 0.585 (0.884)	Data Time 0.001 (0.008)	Loss 3.3678 (3.4205)	Entropy 1.04191 (1.05904)	Top-1 acc 45.703 (42.727)	Top-5 acc 68.359 (66.847)	lr 0.02349
Train [19][3180/3239]	Time 0.579 (0.884)	Data Time 0.000 (0.008)	Loss 3.5208 (3.4206)	Entropy 1.04164 (1.05899)	Top-1 acc 39.844 (42.721)	Top-5 acc 64.062 (66.843)	lr 0.02349
Train [19][3190/3239]	Time 0.587 (0.883)	Data Time 0.000 (0.008)	Loss 3.4837 (3.4207)	Entropy 1.04133 (1.05894)	Top-1 acc 39.453 (42.723)	Top-5 acc 66.797 (66.842)	lr 0.02349
Train [19][3200/3239]	Time 0.619 (0.883)	Data Time 0.000 (0.008)	Loss 3.4522 (3.4206)	Entropy 1.04094 (1.05888)	Top-1 acc 41.406 (42.724)	Top-5 acc 66.016 (66.843)	lr 0.02349
Train [19][3210/3239]	Time 0.606 (0.883)	Data Time 0.000 (0.008)	Loss 3.3493 (3.4205)	Entropy 1.04053 (1.05882)	Top-1 acc 43.750 (42.728)	Top-5 acc 70.703 (66.848)	lr 0.02349
Train [19][3220/3239]	Time 0.758 (0.889)	Data Time 0.000 (0.008)	Loss 3.2927 (3.4205)	Entropy 1.04035 (1.05877)	Top-1 acc 46.875 (42.729)	Top-5 acc 68.359 (66.845)	lr 0.02349
Train [19][3230/3239]	Time 0.599 (0.889)	Data Time 0.000 (0.008)	Loss 3.4904 (3.4204)	Entropy 1.04015 (1.05871)	Top-1 acc 45.312 (42.737)	Top-5 acc 65.234 (66.844)	lr 0.02349
Train [19][3239/3239]	Time 1.577 (0.889)	Data Time 0.000 (0.008)	Loss 3.3604 (3.4204)	Entropy 1.04035 (1.05866)	Top-1 acc 41.975 (42.737)	Top-5 acc 71.605 (66.841)	lr 0.02349
==========Valid [19/120]	loss 2.145	top-1 acc 52.914 (52.914)	top-5 acc 76.481	Train top-1 42.737	top-5 66.841	Entropy 1.04035	Latency-None: 0.000ms	Flops: 539.76M
Train [20][0/3239]	Time 22.131 (22.131)	Data Time 20.580 (20.580)	Loss 3.3203 (3.3203)	Entropy 1.04026 (1.04026)	Top-1 acc 44.141 (44.141)	Top-5 acc 66.406 (66.406)	lr 0.02349
Train [20][10/3239]	Time 0.595 (2.883)	Data Time 0.001 (1.875)	Loss 3.5402 (3.4083)	Entropy 1.04028 (1.04035)	Top-1 acc 37.500 (42.294)	Top-5 acc 65.234 (67.259)	lr 0.02348
Train [20][20/3239]	Time 0.584 (1.924)	Data Time 0.001 (0.983)	Loss 3.4337 (3.4147)	Entropy 1.04009 (1.04022)	Top-1 acc 41.406 (42.690)	Top-5 acc 66.406 (66.946)	lr 0.02348
Train [20][30/3239]	Time 0.642 (1.593)	Data Time 0.001 (0.667)	Loss 3.5364 (3.3947)	Entropy 1.04031 (1.04021)	Top-1 acc 45.312 (43.246)	Top-5 acc 66.016 (67.414)	lr 0.02348
Train [20][40/3239]	Time 0.634 (1.417)	Data Time 0.001 (0.505)	Loss 3.4263 (3.3969)	Entropy 1.04030 (1.04025)	Top-1 acc 43.750 (43.436)	Top-5 acc 65.625 (67.216)	lr 0.02348
Train [20][50/3239]	Time 0.636 (1.307)	Data Time 0.001 (0.406)	Loss 3.4298 (3.4065)	Entropy 1.04022 (1.04025)	Top-1 acc 42.188 (43.145)	Top-5 acc 67.969 (67.019)	lr 0.02348
Train [20][60/3239]	Time 0.548 (1.230)	Data Time 0.001 (0.340)	Loss 3.3881 (3.4068)	Entropy 1.04016 (1.04025)	Top-1 acc 39.844 (42.828)	Top-5 acc 69.531 (67.021)	lr 0.02348
Train [20][70/3239]	Time 0.650 (1.172)	Data Time 0.001 (0.292)	Loss 3.3517 (3.3971)	Entropy 1.03969 (1.04024)	Top-1 acc 41.797 (42.963)	Top-5 acc 69.922 (67.226)	lr 0.02348
Train [20][80/3239]	Time 0.701 (1.130)	Data Time 0.001 (0.256)	Loss 3.4076 (3.4094)	Entropy 1.03937 (1.04016)	Top-1 acc 42.188 (42.757)	Top-5 acc 65.625 (66.884)	lr 0.02348
Train [20][90/3239]	Time 0.581 (1.098)	Data Time 0.001 (0.228)	Loss 3.3664 (3.4150)	Entropy 1.03940 (1.04007)	Top-1 acc 43.359 (42.746)	Top-5 acc 68.359 (66.745)	lr 0.02348
Train [20][100/3239]	Time 0.610 (1.073)	Data Time 0.001 (0.206)	Loss 3.4306 (3.4149)	Entropy 1.03938 (1.04000)	Top-1 acc 43.750 (42.837)	Top-5 acc 66.016 (66.704)	lr 0.02348
Train [20][110/3239]	Time 0.595 (1.054)	Data Time 0.001 (0.188)	Loss 3.5761 (3.4143)	Entropy 1.03953 (1.03996)	Top-1 acc 33.203 (42.884)	Top-5 acc 63.281 (66.723)	lr 0.02348
Train [20][120/3239]	Time 0.634 (1.037)	Data Time 0.001 (0.172)	Loss 3.5947 (3.4119)	Entropy 1.03934 (1.03992)	Top-1 acc 38.672 (42.856)	Top-5 acc 63.672 (66.723)	lr 0.02348
Train [20][130/3239]	Time 0.594 (1.023)	Data Time 0.001 (0.159)	Loss 3.4749 (3.4118)	Entropy 1.03927 (1.03987)	Top-1 acc 43.750 (42.921)	Top-5 acc 66.406 (66.713)	lr 0.02348
Train [20][140/3239]	Time 0.551 (1.011)	Data Time 0.001 (0.148)	Loss 3.5813 (3.4131)	Entropy 1.03902 (1.03982)	Top-1 acc 42.188 (42.911)	Top-5 acc 62.109 (66.758)	lr 0.02348
Train [20][150/3239]	Time 0.611 (1.001)	Data Time 0.001 (0.138)	Loss 3.6035 (3.4101)	Entropy 1.03920 (1.03977)	Top-1 acc 40.625 (43.039)	Top-5 acc 64.062 (66.789)	lr 0.02348
Train [20][160/3239]	Time 0.541 (0.992)	Data Time 0.001 (0.130)	Loss 3.4154 (3.4127)	Entropy 1.03939 (1.03974)	Top-1 acc 41.406 (42.940)	Top-5 acc 63.281 (66.751)	lr 0.02348
Train [20][170/3239]	Time 0.601 (0.983)	Data Time 0.001 (0.122)	Loss 3.6080 (3.4102)	Entropy 1.03901 (1.03972)	Top-1 acc 37.891 (43.019)	Top-5 acc 64.453 (66.817)	lr 0.02348
Train [20][180/3239]	Time 0.560 (0.977)	Data Time 0.001 (0.116)	Loss 3.4898 (3.4061)	Entropy 1.03883 (1.03968)	Top-1 acc 42.969 (43.122)	Top-5 acc 67.578 (66.903)	lr 0.02348
Train [20][190/3239]	Time 0.594 (0.970)	Data Time 0.001 (0.110)	Loss 3.3079 (3.4058)	Entropy 1.03880 (1.03963)	Top-1 acc 48.828 (43.089)	Top-5 acc 73.438 (66.956)	lr 0.02348
Train [20][200/3239]	Time 0.601 (0.964)	Data Time 0.001 (0.105)	Loss 3.5987 (3.4036)	Entropy 1.03881 (1.03959)	Top-1 acc 34.766 (43.064)	Top-5 acc 61.328 (67.016)	lr 0.02348
Train [20][210/3239]	Time 0.603 (0.959)	Data Time 0.001 (0.100)	Loss 3.5640 (3.4044)	Entropy 1.03842 (1.03954)	Top-1 acc 38.281 (43.021)	Top-5 acc 64.453 (66.967)	lr 0.02348
Train [20][220/3239]	Time 0.590 (0.954)	Data Time 0.001 (0.095)	Loss 3.3036 (3.4047)	Entropy 1.03816 (1.03949)	Top-1 acc 42.969 (43.029)	Top-5 acc 69.531 (66.965)	lr 0.02347
Train [20][230/3239]	Time 0.617 (0.950)	Data Time 0.001 (0.091)	Loss 3.2949 (3.4037)	Entropy 1.03817 (1.03943)	Top-1 acc 45.703 (43.057)	Top-5 acc 70.312 (66.976)	lr 0.02347
Train [20][240/3239]	Time 0.581 (0.943)	Data Time 0.001 (0.088)	Loss 3.4425 (3.4031)	Entropy 1.03834 (1.03938)	Top-1 acc 40.625 (43.082)	Top-5 acc 67.578 (66.977)	lr 0.02347
Train [20][250/3239]	Time 0.605 (0.938)	Data Time 0.001 (0.084)	Loss 3.4192 (3.4033)	Entropy 1.03836 (1.03934)	Top-1 acc 42.188 (43.085)	Top-5 acc 67.188 (66.988)	lr 0.02347
Train [20][260/3239]	Time 0.666 (0.934)	Data Time 0.001 (0.081)	Loss 3.2010 (3.4022)	Entropy 1.03827 (1.03930)	Top-1 acc 45.312 (43.106)	Top-5 acc 71.875 (67.027)	lr 0.02347
Train [20][270/3239]	Time 0.576 (0.931)	Data Time 0.001 (0.078)	Loss 3.6110 (3.4042)	Entropy 1.03808 (1.03926)	Top-1 acc 43.359 (43.086)	Top-5 acc 61.328 (67.013)	lr 0.02347
Train [20][280/3239]	Time 0.619 (0.928)	Data Time 0.001 (0.075)	Loss 3.3099 (3.4023)	Entropy 1.03784 (1.03922)	Top-1 acc 44.531 (43.149)	Top-5 acc 69.141 (67.062)	lr 0.02347
Train [20][290/3239]	Time 0.596 (0.926)	Data Time 0.001 (0.073)	Loss 3.3663 (3.4022)	Entropy 1.03736 (1.03916)	Top-1 acc 39.844 (43.166)	Top-5 acc 67.188 (67.063)	lr 0.02347
Train [20][300/3239]	Time 0.596 (0.924)	Data Time 0.001 (0.071)	Loss 3.4630 (3.4005)	Entropy 1.03716 (1.03910)	Top-1 acc 39.453 (43.189)	Top-5 acc 65.234 (67.120)	lr 0.02347
Train [20][310/3239]	Time 0.665 (0.922)	Data Time 0.001 (0.068)	Loss 3.3897 (3.4000)	Entropy 1.03734 (1.03904)	Top-1 acc 48.047 (43.210)	Top-5 acc 67.188 (67.150)	lr 0.02347
Train [20][320/3239]	Time 0.596 (0.919)	Data Time 0.001 (0.066)	Loss 3.2803 (3.3975)	Entropy 1.03729 (1.03899)	Top-1 acc 46.484 (43.260)	Top-5 acc 69.531 (67.212)	lr 0.02347
Train [20][330/3239]	Time 0.572 (0.918)	Data Time 0.001 (0.064)	Loss 3.3157 (3.3963)	Entropy 1.03702 (1.03893)	Top-1 acc 42.188 (43.293)	Top-5 acc 69.531 (67.247)	lr 0.02347
Train [20][340/3239]	Time 0.590 (0.916)	Data Time 0.001 (0.062)	Loss 3.4185 (3.3959)	Entropy 1.03718 (1.03888)	Top-1 acc 42.969 (43.319)	Top-5 acc 64.844 (67.232)	lr 0.02347
Train [20][350/3239]	Time 0.608 (0.914)	Data Time 0.001 (0.061)	Loss 3.3852 (3.3952)	Entropy 1.03706 (1.03883)	Top-1 acc 43.750 (43.327)	Top-5 acc 67.188 (67.230)	lr 0.02347
Train [20][360/3239]	Time 0.614 (0.913)	Data Time 0.001 (0.059)	Loss 3.4448 (3.3957)	Entropy 1.03724 (1.03878)	Top-1 acc 40.234 (43.320)	Top-5 acc 67.188 (67.218)	lr 0.02347
Train [20][370/3239]	Time 0.592 (0.911)	Data Time 0.001 (0.058)	Loss 3.3139 (3.3956)	Entropy 1.03701 (1.03874)	Top-1 acc 43.750 (43.326)	Top-5 acc 68.750 (67.229)	lr 0.02347
Train [20][380/3239]	Time 0.693 (0.909)	Data Time 0.001 (0.056)	Loss 3.4170 (3.3944)	Entropy 1.03721 (1.03869)	Top-1 acc 44.141 (43.359)	Top-5 acc 65.625 (67.234)	lr 0.02347
Train [20][390/3239]	Time 0.582 (0.908)	Data Time 0.001 (0.055)	Loss 3.3207 (3.3942)	Entropy 1.03715 (1.03865)	Top-1 acc 44.141 (43.362)	Top-5 acc 68.750 (67.251)	lr 0.02347
Train [20][400/3239]	Time 0.610 (0.906)	Data Time 0.001 (0.053)	Loss 3.5667 (3.3954)	Entropy 1.03713 (1.03862)	Top-1 acc 41.016 (43.335)	Top-5 acc 66.797 (67.228)	lr 0.02347
Train [20][410/3239]	Time 0.560 (0.904)	Data Time 0.001 (0.052)	Loss 3.4285 (3.3957)	Entropy 1.03715 (1.03858)	Top-1 acc 41.797 (43.350)	Top-5 acc 65.234 (67.234)	lr 0.02347
Train [20][420/3239]	Time 0.627 (0.903)	Data Time 0.001 (0.051)	Loss 3.5321 (3.3969)	Entropy 1.03757 (1.03855)	Top-1 acc 39.844 (43.303)	Top-5 acc 64.062 (67.186)	lr 0.02346
Train [20][430/3239]	Time 0.563 (0.901)	Data Time 0.002 (0.050)	Loss 3.7144 (3.3964)	Entropy 1.03770 (1.03853)	Top-1 acc 34.375 (43.316)	Top-5 acc 62.109 (67.198)	lr 0.02346
Train [20][440/3239]	Time 0.608 (0.900)	Data Time 0.001 (0.049)	Loss 3.3556 (3.3966)	Entropy 1.03750 (1.03851)	Top-1 acc 45.312 (43.308)	Top-5 acc 69.531 (67.198)	lr 0.02346
Train [20][450/3239]	Time 0.550 (0.899)	Data Time 0.001 (0.048)	Loss 3.3677 (3.3948)	Entropy 1.03785 (1.03849)	Top-1 acc 47.656 (43.366)	Top-5 acc 65.625 (67.234)	lr 0.02346
Train [20][460/3239]	Time 0.583 (0.898)	Data Time 0.001 (0.047)	Loss 3.1838 (3.3937)	Entropy 1.03806 (1.03847)	Top-1 acc 49.609 (43.392)	Top-5 acc 71.484 (67.261)	lr 0.02346
Train [20][470/3239]	Time 0.711 (0.896)	Data Time 0.001 (0.046)	Loss 3.1969 (3.3943)	Entropy 1.03757 (1.03846)	Top-1 acc 46.484 (43.378)	Top-5 acc 74.609 (67.263)	lr 0.02346
Train [20][480/3239]	Time 0.618 (0.896)	Data Time 0.001 (0.045)	Loss 3.1886 (3.3935)	Entropy 1.03739 (1.03844)	Top-1 acc 45.703 (43.388)	Top-5 acc 68.750 (67.258)	lr 0.02346
Train [20][490/3239]	Time 0.628 (0.894)	Data Time 0.002 (0.044)	Loss 3.1829 (3.3943)	Entropy 1.03762 (1.03842)	Top-1 acc 47.266 (43.356)	Top-5 acc 73.047 (67.251)	lr 0.02346
Train [20][500/3239]	Time 0.604 (0.894)	Data Time 0.001 (0.043)	Loss 3.3930 (3.3951)	Entropy 1.03729 (1.03840)	Top-1 acc 43.750 (43.357)	Top-5 acc 67.188 (67.241)	lr 0.02346
Train [20][510/3239]	Time 0.614 (0.893)	Data Time 0.001 (0.042)	Loss 3.3696 (3.3957)	Entropy 1.03699 (1.03838)	Top-1 acc 42.969 (43.348)	Top-5 acc 67.188 (67.210)	lr 0.02346
Train [20][520/3239]	Time 0.606 (0.892)	Data Time 0.001 (0.042)	Loss 3.1821 (3.3946)	Entropy 1.03734 (1.03835)	Top-1 acc 50.781 (43.362)	Top-5 acc 71.875 (67.232)	lr 0.02346
Train [20][530/3239]	Time 0.578 (0.892)	Data Time 0.001 (0.041)	Loss 3.3655 (3.3950)	Entropy 1.03721 (1.03833)	Top-1 acc 42.188 (43.326)	Top-5 acc 70.312 (67.232)	lr 0.02346
Train [20][540/3239]	Time 0.709 (0.891)	Data Time 0.001 (0.040)	Loss 3.2596 (3.3945)	Entropy 1.03726 (1.03831)	Top-1 acc 43.750 (43.327)	Top-5 acc 67.578 (67.241)	lr 0.02346
Train [20][550/3239]	Time 0.598 (0.890)	Data Time 0.001 (0.039)	Loss 3.5273 (3.3947)	Entropy 1.03692 (1.03829)	Top-1 acc 42.188 (43.310)	Top-5 acc 65.625 (67.244)	lr 0.02346
Train [20][560/3239]	Time 0.640 (0.889)	Data Time 0.001 (0.039)	Loss 3.5620 (3.3951)	Entropy 1.03652 (1.03827)	Top-1 acc 34.375 (43.280)	Top-5 acc 62.891 (67.247)	lr 0.02346
Train [20][570/3239]	Time 0.568 (0.889)	Data Time 0.001 (0.038)	Loss 3.3194 (3.3949)	Entropy 1.03640 (1.03823)	Top-1 acc 43.359 (43.296)	Top-5 acc 68.750 (67.239)	lr 0.02346
Train [20][580/3239]	Time 0.601 (0.888)	Data Time 0.001 (0.037)	Loss 3.3738 (3.3947)	Entropy 1.03627 (1.03820)	Top-1 acc 45.312 (43.308)	Top-5 acc 68.359 (67.250)	lr 0.02346
Train [20][590/3239]	Time 0.575 (0.887)	Data Time 0.001 (0.037)	Loss 3.2503 (3.3946)	Entropy 1.03599 (1.03816)	Top-1 acc 43.750 (43.291)	Top-5 acc 69.531 (67.252)	lr 0.02346
Train [20][600/3239]	Time 0.597 (0.885)	Data Time 0.001 (0.036)	Loss 3.3923 (3.3937)	Entropy 1.03604 (1.03813)	Top-1 acc 45.312 (43.336)	Top-5 acc 68.359 (67.262)	lr 0.02346
Train [20][610/3239]	Time 0.614 (0.885)	Data Time 0.001 (0.036)	Loss 3.3796 (3.3942)	Entropy 1.03603 (1.03809)	Top-1 acc 40.625 (43.326)	Top-5 acc 67.578 (67.273)	lr 0.02346
Train [20][620/3239]	Time 0.641 (0.884)	Data Time 0.001 (0.035)	Loss 3.7569 (3.3942)	Entropy 1.03590 (1.03806)	Top-1 acc 38.281 (43.337)	Top-5 acc 63.281 (67.290)	lr 0.02346
Train [20][630/3239]	Time 0.631 (0.884)	Data Time 0.001 (0.035)	Loss 3.3217 (3.3936)	Entropy 1.03632 (1.03803)	Top-1 acc 46.484 (43.359)	Top-5 acc 67.969 (67.291)	lr 0.02345
Train [20][640/3239]	Time 0.578 (0.916)	Data Time 0.003 (0.034)	Loss 3.3683 (3.3933)	Entropy 1.03604 (1.03800)	Top-1 acc 45.312 (43.373)	Top-5 acc 67.969 (67.298)	lr 0.02345
Train [20][650/3239]	Time 0.594 (0.915)	Data Time 0.002 (0.034)	Loss 3.6071 (3.3930)	Entropy 1.03620 (1.03797)	Top-1 acc 38.672 (43.371)	Top-5 acc 62.891 (67.294)	lr 0.02345
Train [20][660/3239]	Time 0.569 (0.914)	Data Time 0.002 (0.033)	Loss 3.4353 (3.3934)	Entropy 1.03566 (1.03794)	Top-1 acc 43.750 (43.374)	Top-5 acc 67.188 (67.288)	lr 0.02345
Train [20][670/3239]	Time 0.597 (0.913)	Data Time 0.001 (0.033)	Loss 3.6686 (3.3936)	Entropy 1.03582 (1.03791)	Top-1 acc 36.328 (43.362)	Top-5 acc 60.547 (67.279)	lr 0.02345
Train [20][680/3239]	Time 0.599 (0.912)	Data Time 0.001 (0.032)	Loss 3.2431 (3.3929)	Entropy 1.03552 (1.03788)	Top-1 acc 46.875 (43.368)	Top-5 acc 72.266 (67.294)	lr 0.02345
Train [20][690/3239]	Time 0.594 (0.911)	Data Time 0.001 (0.032)	Loss 3.4927 (3.3920)	Entropy 1.03547 (1.03784)	Top-1 acc 41.797 (43.385)	Top-5 acc 63.672 (67.316)	lr 0.02345
Train [20][700/3239]	Time 0.716 (0.911)	Data Time 0.001 (0.031)	Loss 3.2677 (3.3919)	Entropy 1.03504 (1.03781)	Top-1 acc 43.359 (43.381)	Top-5 acc 69.531 (67.306)	lr 0.02345
Train [20][710/3239]	Time 0.590 (0.910)	Data Time 0.001 (0.031)	Loss 3.3986 (3.3914)	Entropy 1.03505 (1.03777)	Top-1 acc 43.359 (43.391)	Top-5 acc 67.578 (67.319)	lr 0.02345
Train [20][720/3239]	Time 0.561 (0.908)	Data Time 0.001 (0.031)	Loss 3.5695 (3.3911)	Entropy 1.03509 (1.03773)	Top-1 acc 36.719 (43.391)	Top-5 acc 66.016 (67.334)	lr 0.02345
Train [20][730/3239]	Time 0.423 (0.907)	Data Time 0.001 (0.030)	Loss 3.2868 (3.3906)	Entropy 1.03479 (1.03769)	Top-1 acc 46.875 (43.399)	Top-5 acc 66.406 (67.356)	lr 0.02345
Train [20][740/3239]	Time 0.553 (0.906)	Data Time 0.001 (0.030)	Loss 3.5682 (3.3907)	Entropy 1.03466 (1.03765)	Top-1 acc 38.672 (43.391)	Top-5 acc 60.156 (67.350)	lr 0.02345
Train [20][750/3239]	Time 0.603 (0.906)	Data Time 0.001 (0.029)	Loss 3.4139 (3.3910)	Entropy 1.03477 (1.03761)	Top-1 acc 39.844 (43.371)	Top-5 acc 68.359 (67.341)	lr 0.02345
Train [20][760/3239]	Time 0.640 (0.905)	Data Time 0.002 (0.029)	Loss 3.2990 (3.3908)	Entropy 1.03430 (1.03758)	Top-1 acc 41.797 (43.376)	Top-5 acc 68.750 (67.347)	lr 0.02345
Train [20][770/3239]	Time 0.602 (0.905)	Data Time 0.001 (0.029)	Loss 3.3694 (3.3909)	Entropy 1.03434 (1.03753)	Top-1 acc 41.797 (43.362)	Top-5 acc 69.922 (67.357)	lr 0.02345
Train [20][780/3239]	Time 0.607 (0.904)	Data Time 0.001 (0.028)	Loss 3.3670 (3.3905)	Entropy 1.03401 (1.03749)	Top-1 acc 45.312 (43.375)	Top-5 acc 67.188 (67.378)	lr 0.02345
Train [20][790/3239]	Time 0.653 (0.903)	Data Time 0.001 (0.028)	Loss 3.4024 (3.3904)	Entropy 1.03382 (1.03745)	Top-1 acc 42.969 (43.362)	Top-5 acc 66.406 (67.383)	lr 0.02345
Train [20][800/3239]	Time 0.600 (0.903)	Data Time 0.001 (0.028)	Loss 3.5775 (3.3918)	Entropy 1.03362 (1.03740)	Top-1 acc 41.016 (43.351)	Top-5 acc 61.719 (67.345)	lr 0.02345
Train [20][810/3239]	Time 0.591 (0.902)	Data Time 0.001 (0.027)	Loss 3.5041 (3.3921)	Entropy 1.03348 (1.03735)	Top-1 acc 41.406 (43.353)	Top-5 acc 64.844 (67.348)	lr 0.02345
Train [20][820/3239]	Time 0.583 (0.902)	Data Time 0.001 (0.027)	Loss 3.3348 (3.3920)	Entropy 1.03300 (1.03730)	Top-1 acc 49.609 (43.362)	Top-5 acc 69.531 (67.351)	lr 0.02345
Train [20][830/3239]	Time 0.587 (0.901)	Data Time 0.001 (0.027)	Loss 3.2976 (3.3916)	Entropy 1.03241 (1.03725)	Top-1 acc 45.703 (43.376)	Top-5 acc 69.531 (67.352)	lr 0.02344
Train [20][840/3239]	Time 0.586 (0.901)	Data Time 0.001 (0.027)	Loss 3.3621 (3.3919)	Entropy 1.03208 (1.03719)	Top-1 acc 41.016 (43.356)	Top-5 acc 70.703 (67.343)	lr 0.02344
Train [20][850/3239]	Time 0.575 (0.900)	Data Time 0.001 (0.026)	Loss 3.4378 (3.3919)	Entropy 1.03184 (1.03713)	Top-1 acc 43.359 (43.350)	Top-5 acc 69.922 (67.344)	lr 0.02344
Train [20][860/3239]	Time 0.712 (0.900)	Data Time 0.002 (0.026)	Loss 3.4255 (3.3916)	Entropy 1.03209 (1.03707)	Top-1 acc 44.141 (43.355)	Top-5 acc 67.188 (67.344)	lr 0.02344
Train [20][870/3239]	Time 0.621 (0.899)	Data Time 0.001 (0.026)	Loss 3.4078 (3.3915)	Entropy 1.03217 (1.03701)	Top-1 acc 44.531 (43.352)	Top-5 acc 66.797 (67.346)	lr 0.02344
Train [20][880/3239]	Time 0.601 (0.899)	Data Time 0.001 (0.025)	Loss 3.3371 (3.3909)	Entropy 1.03207 (1.03695)	Top-1 acc 42.578 (43.360)	Top-5 acc 66.406 (67.359)	lr 0.02344
Train [20][890/3239]	Time 0.430 (0.898)	Data Time 0.001 (0.025)	Loss 3.5591 (3.3918)	Entropy 1.03211 (1.03690)	Top-1 acc 37.891 (43.342)	Top-5 acc 64.453 (67.342)	lr 0.02344
Train [20][900/3239]	Time 0.614 (0.897)	Data Time 0.001 (0.025)	Loss 3.3442 (3.3912)	Entropy 1.03173 (1.03684)	Top-1 acc 42.969 (43.358)	Top-5 acc 67.969 (67.361)	lr 0.02344
Train [20][910/3239]	Time 0.630 (0.896)	Data Time 0.001 (0.025)	Loss 3.5770 (3.3912)	Entropy 1.03132 (1.03679)	Top-1 acc 38.281 (43.352)	Top-5 acc 62.500 (67.363)	lr 0.02344
Train [20][920/3239]	Time 0.645 (0.896)	Data Time 0.002 (0.024)	Loss 3.4492 (3.3915)	Entropy 1.03131 (1.03673)	Top-1 acc 44.141 (43.342)	Top-5 acc 66.797 (67.365)	lr 0.02344
Train [20][930/3239]	Time 0.649 (0.895)	Data Time 0.001 (0.024)	Loss 3.2402 (3.3914)	Entropy 1.03087 (1.03667)	Top-1 acc 49.609 (43.354)	Top-5 acc 69.922 (67.358)	lr 0.02344
Train [20][940/3239]	Time 0.607 (0.895)	Data Time 0.001 (0.024)	Loss 3.3444 (3.3923)	Entropy 1.03023 (1.03660)	Top-1 acc 42.578 (43.340)	Top-5 acc 69.922 (67.342)	lr 0.02344
Train [20][950/3239]	Time 0.599 (0.894)	Data Time 0.001 (0.024)	Loss 3.2483 (3.3928)	Entropy 1.02999 (1.03653)	Top-1 acc 46.875 (43.321)	Top-5 acc 70.703 (67.336)	lr 0.02344
Train [20][960/3239]	Time 0.641 (0.894)	Data Time 0.001 (0.023)	Loss 3.2072 (3.3931)	Entropy 1.02991 (1.03646)	Top-1 acc 46.094 (43.323)	Top-5 acc 69.922 (67.332)	lr 0.02344
Train [20][970/3239]	Time 0.593 (0.894)	Data Time 0.001 (0.023)	Loss 3.3212 (3.3926)	Entropy 1.02918 (1.03639)	Top-1 acc 46.094 (43.331)	Top-5 acc 70.312 (67.350)	lr 0.02344
Train [20][980/3239]	Time 0.611 (0.893)	Data Time 0.002 (0.023)	Loss 3.2144 (3.3920)	Entropy 1.02921 (1.03632)	Top-1 acc 50.391 (43.351)	Top-5 acc 75.391 (67.369)	lr 0.02344
Train [20][990/3239]	Time 0.583 (0.893)	Data Time 0.001 (0.023)	Loss 3.5458 (3.3916)	Entropy 1.02905 (1.03625)	Top-1 acc 39.844 (43.357)	Top-5 acc 64.844 (67.371)	lr 0.02344
Train [20][1000/3239]	Time 0.618 (0.893)	Data Time 0.001 (0.023)	Loss 3.4391 (3.3909)	Entropy 1.02895 (1.03618)	Top-1 acc 35.156 (43.368)	Top-5 acc 69.531 (67.386)	lr 0.02344
Train [20][1010/3239]	Time 0.639 (0.892)	Data Time 0.001 (0.022)	Loss 3.1585 (3.3906)	Entropy 1.02915 (1.03610)	Top-1 acc 50.781 (43.371)	Top-5 acc 71.875 (67.389)	lr 0.02344
Train [20][1020/3239]	Time 0.685 (0.892)	Data Time 0.002 (0.022)	Loss 3.5494 (3.3916)	Entropy 1.02866 (1.03604)	Top-1 acc 40.234 (43.345)	Top-5 acc 62.109 (67.360)	lr 0.02344
Train [20][1030/3239]	Time 0.588 (0.892)	Data Time 0.001 (0.022)	Loss 3.2446 (3.3913)	Entropy 1.02855 (1.03596)	Top-1 acc 52.344 (43.369)	Top-5 acc 71.484 (67.373)	lr 0.02344
Train [20][1040/3239]	Time 0.582 (0.891)	Data Time 0.001 (0.022)	Loss 3.4203 (3.3914)	Entropy 1.02843 (1.03589)	Top-1 acc 41.797 (43.356)	Top-5 acc 66.797 (67.381)	lr 0.02343
Train [20][1050/3239]	Time 0.568 (0.891)	Data Time 0.001 (0.022)	Loss 3.2773 (3.3908)	Entropy 1.02851 (1.03582)	Top-1 acc 48.438 (43.372)	Top-5 acc 67.578 (67.388)	lr 0.02343
Train [20][1060/3239]	Time 0.569 (0.890)	Data Time 0.001 (0.021)	Loss 3.3796 (3.3911)	Entropy 1.02849 (1.03575)	Top-1 acc 45.312 (43.379)	Top-5 acc 64.844 (67.377)	lr 0.02343
Train [20][1070/3239]	Time 0.578 (0.890)	Data Time 0.001 (0.021)	Loss 3.4553 (3.3913)	Entropy 1.02858 (1.03568)	Top-1 acc 42.969 (43.375)	Top-5 acc 66.406 (67.380)	lr 0.02343
Train [20][1080/3239]	Time 0.574 (0.889)	Data Time 0.001 (0.021)	Loss 3.3641 (3.3917)	Entropy 1.02871 (1.03562)	Top-1 acc 42.969 (43.367)	Top-5 acc 67.969 (67.376)	lr 0.02343
Train [20][1090/3239]	Time 0.696 (0.889)	Data Time 0.001 (0.021)	Loss 3.6004 (3.3912)	Entropy 1.02852 (1.03556)	Top-1 acc 38.672 (43.383)	Top-5 acc 61.719 (67.382)	lr 0.02343
Train [20][1100/3239]	Time 0.578 (0.889)	Data Time 0.001 (0.021)	Loss 3.3238 (3.3909)	Entropy 1.02812 (1.03549)	Top-1 acc 49.219 (43.391)	Top-5 acc 68.750 (67.391)	lr 0.02343
Train [20][1110/3239]	Time 0.597 (0.888)	Data Time 0.001 (0.021)	Loss 3.5217 (3.3916)	Entropy 1.02772 (1.03542)	Top-1 acc 42.578 (43.383)	Top-5 acc 64.062 (67.371)	lr 0.02343
Train [20][1120/3239]	Time 0.606 (0.888)	Data Time 0.001 (0.020)	Loss 3.5623 (3.3913)	Entropy 1.02770 (1.03535)	Top-1 acc 38.672 (43.394)	Top-5 acc 63.672 (67.368)	lr 0.02343
Train [20][1130/3239]	Time 0.537 (0.888)	Data Time 0.001 (0.020)	Loss 3.4144 (3.3915)	Entropy 1.02728 (1.03528)	Top-1 acc 46.875 (43.395)	Top-5 acc 66.016 (67.363)	lr 0.02343
Train [20][1140/3239]	Time 0.621 (0.887)	Data Time 0.001 (0.020)	Loss 3.3522 (3.3914)	Entropy 1.02676 (1.03521)	Top-1 acc 42.969 (43.397)	Top-5 acc 66.797 (67.373)	lr 0.02343
Train [20][1150/3239]	Time 0.581 (0.887)	Data Time 0.001 (0.020)	Loss 3.3307 (3.3913)	Entropy 1.02697 (1.03514)	Top-1 acc 41.797 (43.394)	Top-5 acc 69.531 (67.373)	lr 0.02343
Train [20][1160/3239]	Time 0.625 (0.887)	Data Time 0.001 (0.020)	Loss 3.1810 (3.3911)	Entropy 1.02642 (1.03507)	Top-1 acc 46.484 (43.393)	Top-5 acc 71.094 (67.375)	lr 0.02343
Train [20][1170/3239]	Time 0.614 (0.886)	Data Time 0.001 (0.020)	Loss 3.2713 (3.3910)	Entropy 1.02649 (1.03499)	Top-1 acc 42.188 (43.397)	Top-5 acc 71.484 (67.374)	lr 0.02343
Train [20][1180/3239]	Time 0.605 (0.886)	Data Time 0.001 (0.019)	Loss 3.3724 (3.3918)	Entropy 1.02677 (1.03492)	Top-1 acc 43.750 (43.382)	Top-5 acc 70.703 (67.360)	lr 0.02343
Train [20][1190/3239]	Time 0.594 (0.886)	Data Time 0.001 (0.019)	Loss 3.4284 (3.3913)	Entropy 1.02669 (1.03485)	Top-1 acc 43.359 (43.393)	Top-5 acc 66.016 (67.376)	lr 0.02343
Train [20][1200/3239]	Time 0.613 (0.885)	Data Time 0.001 (0.019)	Loss 3.2196 (3.3910)	Entropy 1.02604 (1.03478)	Top-1 acc 46.484 (43.396)	Top-5 acc 71.094 (67.383)	lr 0.02343
Train [20][1210/3239]	Time 0.610 (0.885)	Data Time 0.001 (0.019)	Loss 3.3288 (3.3908)	Entropy 1.02595 (1.03471)	Top-1 acc 42.188 (43.396)	Top-5 acc 68.750 (67.395)	lr 0.02343
Train [20][1220/3239]	Time 0.640 (0.885)	Data Time 0.002 (0.019)	Loss 3.3890 (3.3905)	Entropy 1.02587 (1.03464)	Top-1 acc 46.094 (43.413)	Top-5 acc 61.719 (67.402)	lr 0.02343
Train [20][1230/3239]	Time 0.567 (0.884)	Data Time 0.001 (0.019)	Loss 3.4763 (3.3905)	Entropy 1.02617 (1.03457)	Top-1 acc 42.578 (43.416)	Top-5 acc 62.500 (67.401)	lr 0.02343
Train [20][1240/3239]	Time 0.485 (0.884)	Data Time 0.001 (0.019)	Loss 3.2331 (3.3905)	Entropy 1.02620 (1.03450)	Top-1 acc 45.703 (43.411)	Top-5 acc 69.922 (67.401)	lr 0.02342
Train [20][1250/3239]	Time 0.731 (0.884)	Data Time 0.001 (0.018)	Loss 3.0733 (3.3902)	Entropy 1.02616 (1.03444)	Top-1 acc 50.000 (43.416)	Top-5 acc 70.312 (67.401)	lr 0.02342
Train [20][1260/3239]	Time 0.609 (0.883)	Data Time 0.001 (0.018)	Loss 3.2651 (3.3896)	Entropy 1.02614 (1.03437)	Top-1 acc 43.750 (43.424)	Top-5 acc 67.969 (67.412)	lr 0.02342
Train [20][1270/3239]	Time 0.627 (0.883)	Data Time 0.001 (0.018)	Loss 3.3163 (3.3895)	Entropy 1.02579 (1.03430)	Top-1 acc 42.969 (43.421)	Top-5 acc 68.359 (67.416)	lr 0.02342
Train [20][1280/3239]	Time 0.632 (0.883)	Data Time 0.001 (0.018)	Loss 3.2197 (3.3896)	Entropy 1.02543 (1.03424)	Top-1 acc 44.922 (43.417)	Top-5 acc 73.047 (67.420)	lr 0.02342
Train [20][1290/3239]	Time 0.776 (0.899)	Data Time 0.006 (0.018)	Loss 3.2514 (3.3903)	Entropy 1.02528 (1.03417)	Top-1 acc 48.047 (43.400)	Top-5 acc 70.703 (67.405)	lr 0.02342
Train [20][1300/3239]	Time 0.628 (0.899)	Data Time 0.002 (0.018)	Loss 3.4608 (3.3904)	Entropy 1.02499 (1.03410)	Top-1 acc 39.844 (43.391)	Top-5 acc 63.281 (67.401)	lr 0.02342
Train [20][1310/3239]	Time 0.600 (0.899)	Data Time 0.002 (0.018)	Loss 3.5446 (3.3905)	Entropy 1.02459 (1.03403)	Top-1 acc 35.156 (43.384)	Top-5 acc 64.844 (67.399)	lr 0.02342
Train [20][1320/3239]	Time 0.617 (0.898)	Data Time 0.001 (0.018)	Loss 3.4039 (3.3908)	Entropy 1.02413 (1.03396)	Top-1 acc 42.969 (43.377)	Top-5 acc 66.406 (67.394)	lr 0.02342
Train [20][1330/3239]	Time 0.595 (0.898)	Data Time 0.001 (0.017)	Loss 3.2170 (3.3906)	Entropy 1.02414 (1.03388)	Top-1 acc 43.359 (43.373)	Top-5 acc 72.656 (67.402)	lr 0.02342
Train [20][1340/3239]	Time 0.621 (0.898)	Data Time 0.001 (0.017)	Loss 3.3490 (3.3909)	Entropy 1.02402 (1.03381)	Top-1 acc 44.922 (43.367)	Top-5 acc 64.844 (67.402)	lr 0.02342
Train [20][1350/3239]	Time 0.640 (0.898)	Data Time 0.002 (0.017)	Loss 3.4114 (3.3912)	Entropy 1.02406 (1.03374)	Top-1 acc 39.062 (43.359)	Top-5 acc 67.969 (67.399)	lr 0.02342
Train [20][1360/3239]	Time 0.592 (0.897)	Data Time 0.001 (0.017)	Loss 3.2624 (3.3913)	Entropy 1.02356 (1.03367)	Top-1 acc 47.656 (43.358)	Top-5 acc 72.656 (67.407)	lr 0.02342
Train [20][1370/3239]	Time 0.469 (0.897)	Data Time 0.001 (0.017)	Loss 3.2425 (3.3919)	Entropy 1.02366 (1.03359)	Top-1 acc 46.094 (43.355)	Top-5 acc 71.484 (67.398)	lr 0.02342
Train [20][1380/3239]	Time 0.535 (0.896)	Data Time 0.001 (0.017)	Loss 3.4573 (3.3915)	Entropy 1.02374 (1.03352)	Top-1 acc 46.875 (43.372)	Top-5 acc 67.578 (67.405)	lr 0.02342
Train [20][1390/3239]	Time 0.536 (0.896)	Data Time 0.001 (0.017)	Loss 3.8216 (3.3914)	Entropy 1.02343 (1.03345)	Top-1 acc 31.641 (43.377)	Top-5 acc 62.500 (67.404)	lr 0.02342
Train [20][1400/3239]	Time 0.583 (0.896)	Data Time 0.001 (0.017)	Loss 3.5610 (3.3915)	Entropy 1.02371 (1.03338)	Top-1 acc 41.016 (43.378)	Top-5 acc 61.719 (67.403)	lr 0.02342
Train [20][1410/3239]	Time 0.778 (0.896)	Data Time 0.003 (0.017)	Loss 3.4955 (3.3917)	Entropy 1.02375 (1.03331)	Top-1 acc 40.625 (43.370)	Top-5 acc 67.188 (67.399)	lr 0.02342
Train [20][1420/3239]	Time 0.587 (0.895)	Data Time 0.001 (0.017)	Loss 3.2911 (3.3920)	Entropy 1.02346 (1.03324)	Top-1 acc 43.359 (43.362)	Top-5 acc 73.047 (67.391)	lr 0.02342
Train [20][1430/3239]	Time 0.596 (0.895)	Data Time 0.001 (0.016)	Loss 3.5330 (3.3918)	Entropy 1.02327 (1.03317)	Top-1 acc 39.062 (43.366)	Top-5 acc 63.672 (67.390)	lr 0.02342
Train [20][1440/3239]	Time 0.630 (0.895)	Data Time 0.001 (0.016)	Loss 3.2355 (3.3919)	Entropy 1.02270 (1.03310)	Top-1 acc 47.266 (43.363)	Top-5 acc 73.438 (67.394)	lr 0.02342
Train [20][1450/3239]	Time 0.625 (0.895)	Data Time 0.001 (0.016)	Loss 3.3159 (3.3919)	Entropy 1.02210 (1.03303)	Top-1 acc 44.531 (43.364)	Top-5 acc 69.922 (67.391)	lr 0.02341
Train [20][1460/3239]	Time 0.564 (0.895)	Data Time 0.001 (0.016)	Loss 3.4277 (3.3918)	Entropy 1.02211 (1.03296)	Top-1 acc 41.016 (43.367)	Top-5 acc 68.359 (67.390)	lr 0.02341
Train [20][1470/3239]	Time 0.635 (0.895)	Data Time 0.001 (0.016)	Loss 3.2238 (3.3916)	Entropy 1.02149 (1.03288)	Top-1 acc 47.266 (43.373)	Top-5 acc 68.359 (67.392)	lr 0.02341
Train [20][1480/3239]	Time 0.718 (0.895)	Data Time 0.001 (0.016)	Loss 3.2649 (3.3915)	Entropy 1.02140 (1.03280)	Top-1 acc 48.047 (43.369)	Top-5 acc 69.531 (67.390)	lr 0.02341
Train [20][1490/3239]	Time 0.619 (0.894)	Data Time 0.001 (0.016)	Loss 3.4340 (3.3914)	Entropy 1.02115 (1.03273)	Top-1 acc 38.672 (43.370)	Top-5 acc 65.625 (67.392)	lr 0.02341
Train [20][1500/3239]	Time 0.571 (0.894)	Data Time 0.002 (0.016)	Loss 3.4439 (3.3911)	Entropy 1.02109 (1.03265)	Top-1 acc 42.188 (43.381)	Top-5 acc 68.750 (67.400)	lr 0.02341
Train [20][1510/3239]	Time 0.602 (0.894)	Data Time 0.001 (0.016)	Loss 3.0741 (3.3907)	Entropy 1.02125 (1.03257)	Top-1 acc 49.219 (43.387)	Top-5 acc 71.094 (67.403)	lr 0.02341
Train [20][1520/3239]	Time 0.616 (0.894)	Data Time 0.001 (0.016)	Loss 3.3117 (3.3906)	Entropy 1.02120 (1.03250)	Top-1 acc 44.141 (43.387)	Top-5 acc 67.578 (67.403)	lr 0.02341
Train [20][1530/3239]	Time 0.575 (0.893)	Data Time 0.001 (0.016)	Loss 3.2668 (3.3904)	Entropy 1.02131 (1.03243)	Top-1 acc 46.875 (43.393)	Top-5 acc 71.875 (67.404)	lr 0.02341
Train [20][1540/3239]	Time 0.492 (0.893)	Data Time 0.001 (0.015)	Loss 3.2719 (3.3901)	Entropy 1.02097 (1.03235)	Top-1 acc 46.484 (43.394)	Top-5 acc 68.359 (67.410)	lr 0.02341
Train [20][1550/3239]	Time 0.602 (0.893)	Data Time 0.001 (0.015)	Loss 3.3642 (3.3898)	Entropy 1.02104 (1.03228)	Top-1 acc 40.234 (43.395)	Top-5 acc 68.359 (67.417)	lr 0.02341
Train [20][1560/3239]	Time 0.461 (0.892)	Data Time 0.001 (0.015)	Loss 3.5512 (3.3898)	Entropy 1.02110 (1.03221)	Top-1 acc 39.844 (43.400)	Top-5 acc 62.109 (67.417)	lr 0.02341
Train [20][1570/3239]	Time 0.573 (0.891)	Data Time 0.001 (0.015)	Loss 3.4199 (3.3901)	Entropy 1.02070 (1.03214)	Top-1 acc 40.625 (43.393)	Top-5 acc 67.578 (67.409)	lr 0.02341
Train [20][1580/3239]	Time 0.587 (0.891)	Data Time 0.001 (0.015)	Loss 3.5526 (3.3900)	Entropy 1.02064 (1.03207)	Top-1 acc 38.672 (43.400)	Top-5 acc 64.844 (67.410)	lr 0.02341
Train [20][1590/3239]	Time 0.537 (0.890)	Data Time 0.001 (0.015)	Loss 3.7148 (3.3901)	Entropy 1.02039 (1.03199)	Top-1 acc 35.547 (43.393)	Top-5 acc 57.812 (67.406)	lr 0.02341
Train [20][1600/3239]	Time 0.601 (0.890)	Data Time 0.001 (0.015)	Loss 3.2539 (3.3895)	Entropy 1.02054 (1.03192)	Top-1 acc 44.531 (43.404)	Top-5 acc 67.969 (67.420)	lr 0.02341
Train [20][1610/3239]	Time 0.585 (0.890)	Data Time 0.001 (0.015)	Loss 3.3881 (3.3890)	Entropy 1.02004 (1.03185)	Top-1 acc 45.703 (43.421)	Top-5 acc 66.797 (67.428)	lr 0.02341
Train [20][1620/3239]	Time 0.617 (0.890)	Data Time 0.001 (0.015)	Loss 3.1626 (3.3886)	Entropy 1.02012 (1.03178)	Top-1 acc 49.609 (43.426)	Top-5 acc 69.531 (67.436)	lr 0.02341
Train [20][1630/3239]	Time 0.556 (0.890)	Data Time 0.001 (0.015)	Loss 3.4639 (3.3889)	Entropy 1.02036 (1.03171)	Top-1 acc 41.406 (43.414)	Top-5 acc 64.844 (67.427)	lr 0.02341
Train [20][1640/3239]	Time 0.699 (0.890)	Data Time 0.001 (0.015)	Loss 3.3595 (3.3888)	Entropy 1.02045 (1.03164)	Top-1 acc 44.531 (43.417)	Top-5 acc 71.094 (67.435)	lr 0.02341
Train [20][1650/3239]	Time 0.586 (0.889)	Data Time 0.001 (0.015)	Loss 3.4269 (3.3889)	Entropy 1.02040 (1.03157)	Top-1 acc 39.844 (43.419)	Top-5 acc 67.969 (67.430)	lr 0.02340
Train [20][1660/3239]	Time 0.619 (0.889)	Data Time 0.001 (0.014)	Loss 3.0592 (3.3885)	Entropy 1.02089 (1.03150)	Top-1 acc 47.266 (43.430)	Top-5 acc 73.828 (67.441)	lr 0.02340
Train [20][1670/3239]	Time 0.557 (0.889)	Data Time 0.001 (0.014)	Loss 3.3784 (3.3882)	Entropy 1.02018 (1.03144)	Top-1 acc 44.141 (43.440)	Top-5 acc 69.922 (67.451)	lr 0.02340
Train [20][1680/3239]	Time 0.550 (0.889)	Data Time 0.001 (0.014)	Loss 3.3263 (3.3884)	Entropy 1.02036 (1.03137)	Top-1 acc 46.484 (43.434)	Top-5 acc 69.922 (67.448)	lr 0.02340
Train [20][1690/3239]	Time 0.597 (0.889)	Data Time 0.001 (0.014)	Loss 3.3049 (3.3886)	Entropy 1.02001 (1.03131)	Top-1 acc 46.875 (43.426)	Top-5 acc 68.750 (67.450)	lr 0.02340
Train [20][1700/3239]	Time 0.575 (0.889)	Data Time 0.001 (0.014)	Loss 3.4540 (3.3888)	Entropy 1.02008 (1.03124)	Top-1 acc 42.969 (43.425)	Top-5 acc 65.234 (67.442)	lr 0.02340
Train [20][1710/3239]	Time 0.615 (0.888)	Data Time 0.001 (0.014)	Loss 3.4644 (3.3889)	Entropy 1.01968 (1.03117)	Top-1 acc 45.703 (43.421)	Top-5 acc 64.453 (67.445)	lr 0.02340
Train [20][1720/3239]	Time 0.635 (0.888)	Data Time 0.001 (0.014)	Loss 3.4300 (3.3891)	Entropy 1.01927 (1.03111)	Top-1 acc 42.578 (43.417)	Top-5 acc 68.359 (67.443)	lr 0.02340
Train [20][1730/3239]	Time 0.605 (0.888)	Data Time 0.001 (0.014)	Loss 3.3814 (3.3895)	Entropy 1.01939 (1.03104)	Top-1 acc 44.141 (43.403)	Top-5 acc 67.188 (67.436)	lr 0.02340
Train [20][1740/3239]	Time 0.556 (0.887)	Data Time 0.001 (0.014)	Loss 3.4994 (3.3896)	Entropy 1.01921 (1.03097)	Top-1 acc 42.188 (43.401)	Top-5 acc 66.797 (67.435)	lr 0.02340
Train [20][1750/3239]	Time 0.584 (0.887)	Data Time 0.001 (0.014)	Loss 3.4024 (3.3897)	Entropy 1.01882 (1.03090)	Top-1 acc 42.578 (43.399)	Top-5 acc 69.531 (67.429)	lr 0.02340
Train [20][1760/3239]	Time 0.606 (0.887)	Data Time 0.001 (0.014)	Loss 3.3022 (3.3898)	Entropy 1.01836 (1.03083)	Top-1 acc 45.312 (43.392)	Top-5 acc 71.484 (67.430)	lr 0.02340
Train [20][1770/3239]	Time 0.612 (0.887)	Data Time 0.002 (0.014)	Loss 3.1787 (3.3893)	Entropy 1.01848 (1.03076)	Top-1 acc 45.703 (43.397)	Top-5 acc 72.266 (67.441)	lr 0.02340
Train [20][1780/3239]	Time 0.597 (0.886)	Data Time 0.001 (0.014)	Loss 3.4508 (3.3889)	Entropy 1.01795 (1.03069)	Top-1 acc 40.625 (43.407)	Top-5 acc 59.766 (67.448)	lr 0.02340
Train [20][1790/3239]	Time 0.584 (0.886)	Data Time 0.001 (0.014)	Loss 3.5870 (3.3894)	Entropy 1.01795 (1.03062)	Top-1 acc 41.406 (43.393)	Top-5 acc 65.234 (67.441)	lr 0.02340
Train [20][1800/3239]	Time 0.681 (0.886)	Data Time 0.001 (0.013)	Loss 3.5230 (3.3894)	Entropy 1.01723 (1.03055)	Top-1 acc 39.062 (43.388)	Top-5 acc 64.453 (67.440)	lr 0.02340
Train [20][1810/3239]	Time 0.606 (0.886)	Data Time 0.001 (0.013)	Loss 3.2277 (3.3895)	Entropy 1.01708 (1.03048)	Top-1 acc 45.703 (43.385)	Top-5 acc 71.094 (67.439)	lr 0.02340
Train [20][1820/3239]	Time 0.618 (0.886)	Data Time 0.001 (0.013)	Loss 3.4308 (3.3893)	Entropy 1.01681 (1.03040)	Top-1 acc 40.625 (43.392)	Top-5 acc 66.016 (67.441)	lr 0.02340
Train [20][1830/3239]	Time 0.638 (0.886)	Data Time 0.001 (0.013)	Loss 3.4846 (3.3893)	Entropy 1.01644 (1.03033)	Top-1 acc 41.797 (43.393)	Top-5 acc 66.406 (67.441)	lr 0.02340
Train [20][1840/3239]	Time 0.554 (0.886)	Data Time 0.001 (0.013)	Loss 3.6042 (3.3894)	Entropy 1.01629 (1.03025)	Top-1 acc 38.281 (43.391)	Top-5 acc 64.062 (67.439)	lr 0.02340
Train [20][1850/3239]	Time 0.588 (0.885)	Data Time 0.001 (0.013)	Loss 3.4131 (3.3892)	Entropy 1.01623 (1.03018)	Top-1 acc 40.625 (43.390)	Top-5 acc 65.625 (67.443)	lr 0.02339
Train [20][1860/3239]	Time 0.606 (0.885)	Data Time 0.001 (0.013)	Loss 3.3038 (3.3890)	Entropy 1.01579 (1.03010)	Top-1 acc 47.266 (43.400)	Top-5 acc 66.797 (67.445)	lr 0.02339
Train [20][1870/3239]	Time 0.690 (0.885)	Data Time 0.001 (0.013)	Loss 3.5995 (3.3892)	Entropy 1.01515 (1.03002)	Top-1 acc 38.281 (43.397)	Top-5 acc 63.672 (67.445)	lr 0.02339
Train [20][1880/3239]	Time 0.607 (0.885)	Data Time 0.001 (0.013)	Loss 3.6500 (3.3888)	Entropy 1.01471 (1.02994)	Top-1 acc 39.062 (43.407)	Top-5 acc 63.281 (67.455)	lr 0.02339
Train [20][1890/3239]	Time 0.577 (0.885)	Data Time 0.001 (0.013)	Loss 3.3450 (3.3887)	Entropy 1.01467 (1.02986)	Top-1 acc 46.094 (43.409)	Top-5 acc 69.141 (67.450)	lr 0.02339
Train [20][1900/3239]	Time 0.599 (0.885)	Data Time 0.001 (0.013)	Loss 3.2314 (3.3883)	Entropy 1.01473 (1.02978)	Top-1 acc 47.656 (43.423)	Top-5 acc 69.922 (67.460)	lr 0.02339
Train [20][1910/3239]	Time 0.583 (0.884)	Data Time 0.001 (0.013)	Loss 3.4287 (3.3880)	Entropy 1.01472 (1.02970)	Top-1 acc 41.797 (43.435)	Top-5 acc 67.578 (67.466)	lr 0.02339
Train [20][1920/3239]	Time 0.585 (0.884)	Data Time 0.001 (0.013)	Loss 3.6018 (3.3880)	Entropy 1.01465 (1.02962)	Top-1 acc 39.062 (43.437)	Top-5 acc 64.844 (67.471)	lr 0.02339
Train [20][1930/3239]	Time 0.611 (0.884)	Data Time 0.001 (0.013)	Loss 3.2331 (3.3877)	Entropy 1.01470 (1.02955)	Top-1 acc 46.484 (43.441)	Top-5 acc 68.750 (67.475)	lr 0.02339
Train [20][1940/3239]	Time 0.599 (0.884)	Data Time 0.001 (0.013)	Loss 3.5320 (3.3880)	Entropy 1.01521 (1.02947)	Top-1 acc 41.797 (43.428)	Top-5 acc 67.188 (67.471)	lr 0.02339
Train [20][1950/3239]	Time 0.590 (0.895)	Data Time 0.002 (0.013)	Loss 3.2907 (3.3879)	Entropy 1.01545 (1.02940)	Top-1 acc 45.312 (43.432)	Top-5 acc 67.969 (67.476)	lr 0.02339
Train [20][1960/3239]	Time 0.744 (0.895)	Data Time 0.002 (0.013)	Loss 3.6271 (3.3880)	Entropy 1.01488 (1.02933)	Top-1 acc 37.500 (43.426)	Top-5 acc 64.453 (67.471)	lr 0.02339
Train [20][1970/3239]	Time 0.645 (0.894)	Data Time 0.003 (0.012)	Loss 3.4540 (3.3882)	Entropy 1.01467 (1.02925)	Top-1 acc 43.750 (43.420)	Top-5 acc 65.625 (67.468)	lr 0.02339
Train [20][1980/3239]	Time 0.628 (0.894)	Data Time 0.001 (0.012)	Loss 3.3361 (3.3881)	Entropy 1.01478 (1.02918)	Top-1 acc 42.969 (43.425)	Top-5 acc 69.141 (67.468)	lr 0.02339
Train [20][1990/3239]	Time 0.683 (0.894)	Data Time 0.001 (0.012)	Loss 3.2509 (3.3879)	Entropy 1.01506 (1.02911)	Top-1 acc 42.578 (43.423)	Top-5 acc 69.922 (67.466)	lr 0.02339
Train [20][2000/3239]	Time 0.584 (0.894)	Data Time 0.001 (0.012)	Loss 3.4271 (3.3880)	Entropy 1.01507 (1.02904)	Top-1 acc 42.578 (43.418)	Top-5 acc 66.406 (67.463)	lr 0.02339
Train [20][2010/3239]	Time 0.608 (0.894)	Data Time 0.001 (0.012)	Loss 3.3094 (3.3878)	Entropy 1.01512 (1.02897)	Top-1 acc 48.828 (43.420)	Top-5 acc 70.312 (67.465)	lr 0.02339
Train [20][2020/3239]	Time 0.631 (0.894)	Data Time 0.001 (0.012)	Loss 3.3958 (3.3883)	Entropy 1.01489 (1.02890)	Top-1 acc 41.406 (43.406)	Top-5 acc 67.188 (67.462)	lr 0.02339
Train [20][2030/3239]	Time 0.710 (0.894)	Data Time 0.001 (0.012)	Loss 3.5553 (3.3882)	Entropy 1.01469 (1.02883)	Top-1 acc 43.359 (43.408)	Top-5 acc 64.844 (67.466)	lr 0.02339
Train [20][2040/3239]	Time 0.647 (0.894)	Data Time 0.001 (0.012)	Loss 3.1863 (3.3882)	Entropy 1.01507 (1.02876)	Top-1 acc 46.875 (43.411)	Top-5 acc 73.438 (67.465)	lr 0.02339
Train [20][2050/3239]	Time 0.557 (0.893)	Data Time 0.001 (0.012)	Loss 3.3503 (3.3885)	Entropy 1.01517 (1.02870)	Top-1 acc 43.750 (43.404)	Top-5 acc 69.141 (67.457)	lr 0.02338
Train [20][2060/3239]	Time 0.631 (0.893)	Data Time 0.001 (0.012)	Loss 3.4182 (3.3884)	Entropy 1.01486 (1.02863)	Top-1 acc 46.875 (43.402)	Top-5 acc 67.188 (67.459)	lr 0.02338
Train [20][2070/3239]	Time 0.617 (0.893)	Data Time 0.001 (0.012)	Loss 3.5141 (3.3882)	Entropy 1.01450 (1.02856)	Top-1 acc 43.359 (43.405)	Top-5 acc 63.281 (67.464)	lr 0.02338
Train [20][2080/3239]	Time 0.621 (0.893)	Data Time 0.001 (0.012)	Loss 3.4592 (3.3882)	Entropy 1.01439 (1.02849)	Top-1 acc 42.969 (43.406)	Top-5 acc 63.281 (67.467)	lr 0.02338
Train [20][2090/3239]	Time 0.601 (0.893)	Data Time 0.001 (0.012)	Loss 3.5346 (3.3880)	Entropy 1.01419 (1.02843)	Top-1 acc 41.406 (43.409)	Top-5 acc 64.844 (67.475)	lr 0.02338
Train [20][2100/3239]	Time 0.602 (0.893)	Data Time 0.001 (0.012)	Loss 3.3858 (3.3879)	Entropy 1.01375 (1.02836)	Top-1 acc 41.016 (43.414)	Top-5 acc 67.578 (67.478)	lr 0.02338
Train [20][2110/3239]	Time 0.575 (0.893)	Data Time 0.001 (0.012)	Loss 3.3855 (3.3880)	Entropy 1.01352 (1.02829)	Top-1 acc 46.094 (43.412)	Top-5 acc 63.672 (67.474)	lr 0.02338
Train [20][2120/3239]	Time 0.583 (0.893)	Data Time 0.002 (0.012)	Loss 3.3339 (3.3882)	Entropy 1.01333 (1.02822)	Top-1 acc 42.578 (43.411)	Top-5 acc 66.016 (67.472)	lr 0.02338
Train [20][2130/3239]	Time 0.618 (0.893)	Data Time 0.001 (0.012)	Loss 3.5411 (3.3882)	Entropy 1.01330 (1.02815)	Top-1 acc 40.234 (43.411)	Top-5 acc 62.109 (67.467)	lr 0.02338
Train [20][2140/3239]	Time 0.542 (0.892)	Data Time 0.001 (0.012)	Loss 3.3447 (3.3881)	Entropy 1.01346 (1.02808)	Top-1 acc 40.234 (43.402)	Top-5 acc 68.359 (67.471)	lr 0.02338
Train [20][2150/3239]	Time 0.626 (0.892)	Data Time 0.001 (0.012)	Loss 3.3339 (3.3880)	Entropy 1.01366 (1.02801)	Top-1 acc 44.141 (43.406)	Top-5 acc 68.750 (67.480)	lr 0.02338
Train [20][2160/3239]	Time 0.647 (0.892)	Data Time 0.001 (0.012)	Loss 3.3745 (3.3878)	Entropy 1.01379 (1.02795)	Top-1 acc 44.141 (43.411)	Top-5 acc 68.750 (67.482)	lr 0.02338
Train [20][2170/3239]	Time 0.603 (0.892)	Data Time 0.001 (0.012)	Loss 3.2320 (3.3879)	Entropy 1.01365 (1.02788)	Top-1 acc 46.875 (43.408)	Top-5 acc 69.922 (67.481)	lr 0.02338
Train [20][2180/3239]	Time 0.599 (0.892)	Data Time 0.001 (0.012)	Loss 3.7207 (3.3883)	Entropy 1.01359 (1.02782)	Top-1 acc 35.547 (43.397)	Top-5 acc 57.812 (67.470)	lr 0.02338
Train [20][2190/3239]	Time 0.703 (0.892)	Data Time 0.001 (0.011)	Loss 3.4419 (3.3882)	Entropy 1.01354 (1.02775)	Top-1 acc 42.578 (43.404)	Top-5 acc 65.625 (67.472)	lr 0.02338
Train [20][2200/3239]	Time 0.588 (0.892)	Data Time 0.001 (0.011)	Loss 3.1600 (3.3881)	Entropy 1.01339 (1.02769)	Top-1 acc 45.703 (43.405)	Top-5 acc 73.047 (67.472)	lr 0.02338
Train [20][2210/3239]	Time 0.472 (0.891)	Data Time 0.001 (0.011)	Loss 3.4941 (3.3881)	Entropy 1.01337 (1.02762)	Top-1 acc 44.531 (43.405)	Top-5 acc 64.062 (67.468)	lr 0.02338
Train [20][2220/3239]	Time 0.600 (0.891)	Data Time 0.002 (0.011)	Loss 3.4115 (3.3883)	Entropy 1.01354 (1.02756)	Top-1 acc 44.531 (43.406)	Top-5 acc 65.234 (67.466)	lr 0.02338
Train [20][2230/3239]	Time 0.610 (0.891)	Data Time 0.001 (0.011)	Loss 3.2925 (3.3883)	Entropy 1.01379 (1.02750)	Top-1 acc 45.312 (43.408)	Top-5 acc 67.969 (67.466)	lr 0.02338
Train [20][2240/3239]	Time 0.601 (0.891)	Data Time 0.001 (0.011)	Loss 3.3329 (3.3884)	Entropy 1.01378 (1.02743)	Top-1 acc 50.781 (43.410)	Top-5 acc 71.875 (67.466)	lr 0.02338
Train [20][2250/3239]	Time 0.572 (0.891)	Data Time 0.001 (0.011)	Loss 3.3615 (3.3882)	Entropy 1.01359 (1.02737)	Top-1 acc 44.141 (43.414)	Top-5 acc 69.531 (67.469)	lr 0.02337
Train [20][2260/3239]	Time 0.632 (0.891)	Data Time 0.001 (0.011)	Loss 3.5574 (3.3880)	Entropy 1.01347 (1.02731)	Top-1 acc 38.672 (43.416)	Top-5 acc 63.672 (67.474)	lr 0.02337
Train [20][2270/3239]	Time 0.606 (0.891)	Data Time 0.001 (0.011)	Loss 3.3096 (3.3878)	Entropy 1.01328 (1.02725)	Top-1 acc 44.141 (43.422)	Top-5 acc 68.359 (67.473)	lr 0.02337
Train [20][2280/3239]	Time 0.640 (0.890)	Data Time 0.001 (0.011)	Loss 3.4329 (3.3882)	Entropy 1.01320 (1.02719)	Top-1 acc 40.625 (43.416)	Top-5 acc 66.016 (67.466)	lr 0.02337
Train [20][2290/3239]	Time 0.607 (0.890)	Data Time 0.001 (0.011)	Loss 3.4931 (3.3883)	Entropy 1.01262 (1.02713)	Top-1 acc 41.016 (43.418)	Top-5 acc 67.188 (67.465)	lr 0.02337
Train [20][2300/3239]	Time 0.592 (0.890)	Data Time 0.001 (0.011)	Loss 3.5522 (3.3885)	Entropy 1.01242 (1.02706)	Top-1 acc 38.281 (43.413)	Top-5 acc 68.750 (67.465)	lr 0.02337
Train [20][2310/3239]	Time 0.609 (0.890)	Data Time 0.002 (0.011)	Loss 3.3893 (3.3884)	Entropy 1.01255 (1.02700)	Top-1 acc 42.188 (43.415)	Top-5 acc 68.359 (67.469)	lr 0.02337
Train [20][2320/3239]	Time 0.563 (0.890)	Data Time 0.001 (0.011)	Loss 3.3190 (3.3883)	Entropy 1.01200 (1.02694)	Top-1 acc 43.359 (43.415)	Top-5 acc 70.703 (67.469)	lr 0.02337
Train [20][2330/3239]	Time 0.576 (0.890)	Data Time 0.001 (0.011)	Loss 3.4363 (3.3885)	Entropy 1.01179 (1.02687)	Top-1 acc 40.234 (43.412)	Top-5 acc 64.844 (67.464)	lr 0.02337
Train [20][2340/3239]	Time 0.604 (0.890)	Data Time 0.001 (0.011)	Loss 3.3555 (3.3885)	Entropy 1.01186 (1.02681)	Top-1 acc 43.750 (43.415)	Top-5 acc 69.141 (67.464)	lr 0.02337
Train [20][2350/3239]	Time 0.677 (0.890)	Data Time 0.001 (0.011)	Loss 3.6067 (3.3887)	Entropy 1.01163 (1.02675)	Top-1 acc 37.500 (43.412)	Top-5 acc 62.109 (67.463)	lr 0.02337
Train [20][2360/3239]	Time 0.607 (0.890)	Data Time 0.001 (0.011)	Loss 3.4291 (3.3885)	Entropy 1.01126 (1.02668)	Top-1 acc 46.094 (43.421)	Top-5 acc 67.969 (67.464)	lr 0.02337
Train [20][2370/3239]	Time 0.486 (0.889)	Data Time 0.001 (0.011)	Loss 3.5278 (3.3885)	Entropy 1.01087 (1.02662)	Top-1 acc 40.234 (43.428)	Top-5 acc 68.359 (67.464)	lr 0.02337
Train [20][2380/3239]	Time 0.566 (0.889)	Data Time 0.001 (0.011)	Loss 3.5478 (3.3887)	Entropy 1.01078 (1.02655)	Top-1 acc 44.141 (43.426)	Top-5 acc 65.234 (67.462)	lr 0.02337
Train [20][2390/3239]	Time 0.592 (0.889)	Data Time 0.001 (0.011)	Loss 3.4975 (3.3887)	Entropy 1.01008 (1.02648)	Top-1 acc 39.844 (43.423)	Top-5 acc 68.359 (67.465)	lr 0.02337
Train [20][2400/3239]	Time 0.549 (0.889)	Data Time 0.001 (0.011)	Loss 3.5246 (3.3885)	Entropy 1.01019 (1.02641)	Top-1 acc 43.359 (43.428)	Top-5 acc 62.891 (67.468)	lr 0.02337
Train [20][2410/3239]	Time 0.616 (0.889)	Data Time 0.002 (0.011)	Loss 3.4102 (3.3883)	Entropy 1.01041 (1.02635)	Top-1 acc 41.016 (43.427)	Top-5 acc 67.578 (67.472)	lr 0.02337
Train [20][2420/3239]	Time 0.658 (0.888)	Data Time 0.001 (0.011)	Loss 3.4688 (3.3883)	Entropy 1.01003 (1.02628)	Top-1 acc 41.797 (43.426)	Top-5 acc 67.578 (67.468)	lr 0.02337
Train [20][2430/3239]	Time 0.570 (0.888)	Data Time 0.001 (0.011)	Loss 3.6947 (3.3883)	Entropy 1.01011 (1.02621)	Top-1 acc 36.719 (43.426)	Top-5 acc 61.328 (67.467)	lr 0.02337
Train [20][2440/3239]	Time 0.617 (0.888)	Data Time 0.002 (0.011)	Loss 3.2810 (3.3882)	Entropy 1.01022 (1.02615)	Top-1 acc 44.531 (43.428)	Top-5 acc 73.828 (67.471)	lr 0.02337
Train [20][2450/3239]	Time 0.588 (0.888)	Data Time 0.001 (0.010)	Loss 3.5491 (3.3881)	Entropy 1.00929 (1.02608)	Top-1 acc 39.453 (43.429)	Top-5 acc 64.844 (67.472)	lr 0.02336
Train [20][2460/3239]	Time 0.638 (0.888)	Data Time 0.001 (0.010)	Loss 3.4640 (3.3880)	Entropy 1.00921 (1.02601)	Top-1 acc 41.797 (43.432)	Top-5 acc 68.359 (67.475)	lr 0.02336
Train [20][2470/3239]	Time 0.628 (0.888)	Data Time 0.001 (0.010)	Loss 3.2233 (3.3878)	Entropy 1.00898 (1.02594)	Top-1 acc 50.000 (43.437)	Top-5 acc 70.703 (67.482)	lr 0.02336
Train [20][2480/3239]	Time 0.619 (0.888)	Data Time 0.001 (0.010)	Loss 3.3248 (3.3876)	Entropy 1.00847 (1.02587)	Top-1 acc 46.875 (43.441)	Top-5 acc 67.969 (67.484)	lr 0.02336
Train [20][2490/3239]	Time 0.625 (0.888)	Data Time 0.001 (0.010)	Loss 3.3824 (3.3876)	Entropy 1.00807 (1.02580)	Top-1 acc 44.531 (43.440)	Top-5 acc 66.797 (67.486)	lr 0.02336
Train [20][2500/3239]	Time 0.643 (0.888)	Data Time 0.001 (0.010)	Loss 3.2819 (3.3874)	Entropy 1.00768 (1.02573)	Top-1 acc 47.656 (43.442)	Top-5 acc 72.266 (67.485)	lr 0.02336
Train [20][2510/3239]	Time 0.721 (0.888)	Data Time 0.002 (0.010)	Loss 3.4213 (3.3872)	Entropy 1.00728 (1.02566)	Top-1 acc 44.141 (43.443)	Top-5 acc 66.016 (67.487)	lr 0.02336
Train [20][2520/3239]	Time 0.593 (0.888)	Data Time 0.001 (0.010)	Loss 3.5519 (3.3871)	Entropy 1.00765 (1.02559)	Top-1 acc 39.453 (43.447)	Top-5 acc 64.453 (67.491)	lr 0.02336
Train [20][2530/3239]	Time 0.591 (0.887)	Data Time 0.001 (0.010)	Loss 3.0921 (3.3870)	Entropy 1.00748 (1.02552)	Top-1 acc 47.266 (43.448)	Top-5 acc 77.344 (67.495)	lr 0.02336
Train [20][2540/3239]	Time 0.629 (0.887)	Data Time 0.001 (0.010)	Loss 3.4906 (3.3871)	Entropy 1.00727 (1.02544)	Top-1 acc 42.969 (43.446)	Top-5 acc 67.578 (67.494)	lr 0.02336
Train [20][2550/3239]	Time 0.612 (0.887)	Data Time 0.001 (0.010)	Loss 3.5399 (3.3870)	Entropy 1.00759 (1.02537)	Top-1 acc 39.844 (43.448)	Top-5 acc 65.234 (67.497)	lr 0.02336
Train [20][2560/3239]	Time 0.618 (0.887)	Data Time 0.001 (0.010)	Loss 3.4267 (3.3869)	Entropy 1.00759 (1.02530)	Top-1 acc 42.578 (43.450)	Top-5 acc 65.625 (67.498)	lr 0.02336
Train [20][2570/3239]	Time 0.486 (0.887)	Data Time 0.001 (0.010)	Loss 3.5767 (3.3868)	Entropy 1.00688 (1.02523)	Top-1 acc 37.891 (43.452)	Top-5 acc 62.109 (67.498)	lr 0.02336
Train [20][2580/3239]	Time 0.676 (0.887)	Data Time 0.001 (0.010)	Loss 3.1268 (3.3866)	Entropy 1.00681 (1.02516)	Top-1 acc 47.266 (43.454)	Top-5 acc 69.531 (67.502)	lr 0.02336
Train [20][2590/3239]	Time 0.616 (0.887)	Data Time 0.001 (0.010)	Loss 3.4207 (3.3867)	Entropy 1.00676 (1.02509)	Top-1 acc 39.844 (43.454)	Top-5 acc 67.188 (67.498)	lr 0.02336
Train [20][2600/3239]	Time 0.732 (0.895)	Data Time 0.005 (0.010)	Loss 3.6616 (3.3869)	Entropy 1.00676 (1.02502)	Top-1 acc 38.281 (43.450)	Top-5 acc 63.281 (67.494)	lr 0.02336
Train [20][2610/3239]	Time 0.612 (0.895)	Data Time 0.002 (0.010)	Loss 3.3284 (3.3871)	Entropy 1.00676 (1.02495)	Top-1 acc 45.312 (43.448)	Top-5 acc 67.969 (67.488)	lr 0.02336
Train [20][2620/3239]	Time 0.619 (0.895)	Data Time 0.002 (0.010)	Loss 3.4693 (3.3870)	Entropy 1.00646 (1.02488)	Top-1 acc 44.922 (43.453)	Top-5 acc 63.672 (67.489)	lr 0.02336
Train [20][2630/3239]	Time 0.621 (0.895)	Data Time 0.002 (0.010)	Loss 3.2738 (3.3866)	Entropy 1.00616 (1.02481)	Top-1 acc 47.656 (43.456)	Top-5 acc 68.750 (67.495)	lr 0.02336
Train [20][2640/3239]	Time 0.634 (0.895)	Data Time 0.001 (0.010)	Loss 3.4755 (3.3865)	Entropy 1.00587 (1.02474)	Top-1 acc 41.797 (43.460)	Top-5 acc 67.188 (67.495)	lr 0.02336
Train [20][2650/3239]	Time 0.647 (0.895)	Data Time 0.002 (0.010)	Loss 3.2393 (3.3865)	Entropy 1.00532 (1.02467)	Top-1 acc 46.484 (43.457)	Top-5 acc 71.094 (67.499)	lr 0.02335
Train [20][2660/3239]	Time 0.693 (0.895)	Data Time 0.002 (0.010)	Loss 3.5377 (3.3868)	Entropy 1.00519 (1.02460)	Top-1 acc 41.016 (43.448)	Top-5 acc 64.844 (67.492)	lr 0.02335
Train [20][2670/3239]	Time 0.717 (0.895)	Data Time 0.002 (0.010)	Loss 3.3432 (3.3866)	Entropy 1.00520 (1.02452)	Top-1 acc 41.406 (43.454)	Top-5 acc 68.750 (67.497)	lr 0.02335
Train [20][2680/3239]	Time 0.612 (0.895)	Data Time 0.001 (0.010)	Loss 3.3707 (3.3864)	Entropy 1.00544 (1.02445)	Top-1 acc 43.750 (43.460)	Top-5 acc 66.406 (67.496)	lr 0.02335
Train [20][2690/3239]	Time 0.559 (0.895)	Data Time 0.001 (0.010)	Loss 3.5852 (3.3865)	Entropy 1.00572 (1.02438)	Top-1 acc 40.234 (43.456)	Top-5 acc 60.938 (67.494)	lr 0.02335
Train [20][2700/3239]	Time 0.605 (0.895)	Data Time 0.001 (0.010)	Loss 3.5793 (3.3867)	Entropy 1.00614 (1.02431)	Top-1 acc 39.844 (43.455)	Top-5 acc 62.891 (67.489)	lr 0.02335
Train [20][2710/3239]	Time 0.598 (0.894)	Data Time 0.001 (0.010)	Loss 3.2895 (3.3867)	Entropy 1.00559 (1.02425)	Top-1 acc 46.094 (43.457)	Top-5 acc 68.359 (67.486)	lr 0.02335
Train [20][2720/3239]	Time 0.662 (0.894)	Data Time 0.008 (0.010)	Loss 3.2687 (3.3866)	Entropy 1.00584 (1.02418)	Top-1 acc 44.922 (43.461)	Top-5 acc 67.969 (67.489)	lr 0.02335
Train [20][2730/3239]	Time 0.619 (0.894)	Data Time 0.001 (0.010)	Loss 3.4728 (3.3865)	Entropy 1.00547 (1.02411)	Top-1 acc 38.672 (43.460)	Top-5 acc 65.625 (67.492)	lr 0.02335
Train [20][2740/3239]	Time 0.743 (0.894)	Data Time 0.001 (0.010)	Loss 3.4075 (3.3864)	Entropy 1.00514 (1.02404)	Top-1 acc 42.188 (43.464)	Top-5 acc 63.281 (67.493)	lr 0.02335
Train [20][2750/3239]	Time 0.623 (0.894)	Data Time 0.001 (0.010)	Loss 3.5357 (3.3865)	Entropy 1.00487 (1.02397)	Top-1 acc 40.625 (43.465)	Top-5 acc 67.188 (67.494)	lr 0.02335
Train [20][2760/3239]	Time 0.634 (0.894)	Data Time 0.001 (0.010)	Loss 3.4571 (3.3865)	Entropy 1.00513 (1.02390)	Top-1 acc 44.141 (43.467)	Top-5 acc 63.672 (67.499)	lr 0.02335
Train [20][2770/3239]	Time 0.631 (0.894)	Data Time 0.001 (0.010)	Loss 3.4193 (3.3865)	Entropy 1.00440 (1.02383)	Top-1 acc 43.359 (43.470)	Top-5 acc 68.359 (67.497)	lr 0.02335
Train [20][2780/3239]	Time 0.600 (0.894)	Data Time 0.001 (0.009)	Loss 3.4104 (3.3865)	Entropy 1.00420 (1.02376)	Top-1 acc 45.312 (43.471)	Top-5 acc 62.891 (67.495)	lr 0.02335
Train [20][2790/3239]	Time 0.597 (0.894)	Data Time 0.003 (0.009)	Loss 3.5901 (3.3868)	Entropy 1.00438 (1.02369)	Top-1 acc 35.156 (43.464)	Top-5 acc 62.109 (67.491)	lr 0.02335
Train [20][2800/3239]	Time 0.619 (0.894)	Data Time 0.001 (0.009)	Loss 3.6477 (3.3868)	Entropy 1.00455 (1.02363)	Top-1 acc 37.109 (43.467)	Top-5 acc 60.547 (67.489)	lr 0.02335
Train [20][2810/3239]	Time 0.699 (0.894)	Data Time 0.001 (0.009)	Loss 3.3781 (3.3866)	Entropy 1.00467 (1.02356)	Top-1 acc 41.797 (43.471)	Top-5 acc 65.625 (67.491)	lr 0.02335
Train [20][2820/3239]	Time 0.641 (0.894)	Data Time 0.001 (0.009)	Loss 3.1371 (3.3865)	Entropy 1.00412 (1.02349)	Top-1 acc 47.656 (43.474)	Top-5 acc 73.828 (67.496)	lr 0.02335
Train [20][2830/3239]	Time 0.599 (0.893)	Data Time 0.001 (0.009)	Loss 3.4794 (3.3865)	Entropy 1.00406 (1.02342)	Top-1 acc 42.578 (43.475)	Top-5 acc 65.234 (67.498)	lr 0.02335
Train [20][2840/3239]	Time 0.620 (0.894)	Data Time 0.001 (0.009)	Loss 3.2927 (3.3865)	Entropy 1.00432 (1.02335)	Top-1 acc 43.359 (43.473)	Top-5 acc 65.625 (67.495)	lr 0.02335
Train [20][2850/3239]	Time 0.605 (0.893)	Data Time 0.001 (0.009)	Loss 3.3588 (3.3863)	Entropy 1.00426 (1.02329)	Top-1 acc 41.406 (43.476)	Top-5 acc 68.750 (67.500)	lr 0.02334
Train [20][2860/3239]	Time 0.533 (0.893)	Data Time 0.001 (0.009)	Loss 3.4736 (3.3863)	Entropy 1.00388 (1.02322)	Top-1 acc 43.750 (43.470)	Top-5 acc 66.016 (67.496)	lr 0.02334
Train [20][2870/3239]	Time 0.539 (0.893)	Data Time 0.001 (0.009)	Loss 3.5382 (3.3865)	Entropy 1.00373 (1.02315)	Top-1 acc 37.109 (43.463)	Top-5 acc 63.672 (67.494)	lr 0.02334
Train [20][2880/3239]	Time 0.595 (0.893)	Data Time 0.001 (0.009)	Loss 3.2335 (3.3864)	Entropy 1.00369 (1.02309)	Top-1 acc 46.875 (43.463)	Top-5 acc 73.047 (67.494)	lr 0.02334
Train [20][2890/3239]	Time 0.566 (0.893)	Data Time 0.001 (0.009)	Loss 3.4355 (3.3865)	Entropy 1.00362 (1.02302)	Top-1 acc 44.141 (43.460)	Top-5 acc 65.234 (67.489)	lr 0.02334
Train [20][2900/3239]	Time 0.628 (0.893)	Data Time 0.001 (0.009)	Loss 3.5035 (3.3865)	Entropy 1.00312 (1.02295)	Top-1 acc 39.453 (43.463)	Top-5 acc 66.016 (67.489)	lr 0.02334
Train [20][2910/3239]	Time 0.609 (0.892)	Data Time 0.001 (0.009)	Loss 3.4792 (3.3864)	Entropy 1.00339 (1.02288)	Top-1 acc 42.188 (43.466)	Top-5 acc 67.188 (67.494)	lr 0.02334
Train [20][2920/3239]	Time 0.620 (0.892)	Data Time 0.001 (0.009)	Loss 3.3833 (3.3863)	Entropy 1.00347 (1.02282)	Top-1 acc 44.922 (43.469)	Top-5 acc 68.750 (67.495)	lr 0.02334
Train [20][2930/3239]	Time 0.636 (0.892)	Data Time 0.001 (0.009)	Loss 3.3941 (3.3864)	Entropy 1.00299 (1.02275)	Top-1 acc 46.484 (43.468)	Top-5 acc 65.234 (67.496)	lr 0.02334
Train [20][2940/3239]	Time 0.642 (0.892)	Data Time 0.001 (0.009)	Loss 3.2218 (3.3862)	Entropy 1.00297 (1.02268)	Top-1 acc 44.922 (43.471)	Top-5 acc 69.531 (67.501)	lr 0.02334
Train [20][2950/3239]	Time 0.554 (0.892)	Data Time 0.001 (0.009)	Loss 3.3191 (3.3863)	Entropy 1.00310 (1.02262)	Top-1 acc 40.625 (43.467)	Top-5 acc 69.531 (67.500)	lr 0.02334
Train [20][2960/3239]	Time 0.611 (0.892)	Data Time 0.001 (0.009)	Loss 3.5040 (3.3864)	Entropy 1.00257 (1.02255)	Top-1 acc 40.234 (43.466)	Top-5 acc 67.969 (67.499)	lr 0.02334
Train [20][2970/3239]	Time 0.707 (0.892)	Data Time 0.002 (0.009)	Loss 3.4939 (3.3863)	Entropy 1.00262 (1.02248)	Top-1 acc 41.406 (43.470)	Top-5 acc 66.797 (67.502)	lr 0.02334
Train [20][2980/3239]	Time 0.637 (0.892)	Data Time 0.001 (0.009)	Loss 3.2736 (3.3862)	Entropy 1.00220 (1.02241)	Top-1 acc 43.359 (43.470)	Top-5 acc 69.141 (67.504)	lr 0.02334
Train [20][2990/3239]	Time 0.625 (0.892)	Data Time 0.002 (0.009)	Loss 3.4193 (3.3862)	Entropy 1.00247 (1.02235)	Top-1 acc 44.141 (43.469)	Top-5 acc 66.016 (67.504)	lr 0.02334
Train [20][3000/3239]	Time 0.615 (0.892)	Data Time 0.001 (0.009)	Loss 3.0885 (3.3863)	Entropy 1.00215 (1.02228)	Top-1 acc 53.906 (43.467)	Top-5 acc 73.438 (67.504)	lr 0.02334
Train [20][3010/3239]	Time 0.603 (0.891)	Data Time 0.001 (0.009)	Loss 3.4560 (3.3864)	Entropy 1.00219 (1.02221)	Top-1 acc 41.797 (43.464)	Top-5 acc 69.922 (67.505)	lr 0.02334
Train [20][3020/3239]	Time 0.581 (0.891)	Data Time 0.001 (0.009)	Loss 3.2902 (3.3863)	Entropy 1.00210 (1.02215)	Top-1 acc 45.312 (43.461)	Top-5 acc 70.703 (67.506)	lr 0.02334
Train [20][3030/3239]	Time 0.569 (0.891)	Data Time 0.001 (0.009)	Loss 3.3536 (3.3863)	Entropy 1.00179 (1.02208)	Top-1 acc 41.406 (43.460)	Top-5 acc 66.797 (67.505)	lr 0.02334
Train [20][3040/3239]	Time 0.459 (0.891)	Data Time 0.001 (0.009)	Loss 3.5472 (3.3863)	Entropy 1.00186 (1.02201)	Top-1 acc 41.016 (43.460)	Top-5 acc 59.766 (67.502)	lr 0.02334
Train [20][3050/3239]	Time 0.616 (0.891)	Data Time 0.002 (0.009)	Loss 3.2188 (3.3862)	Entropy 1.00162 (1.02195)	Top-1 acc 48.047 (43.462)	Top-5 acc 72.656 (67.505)	lr 0.02333
Train [20][3060/3239]	Time 0.662 (0.891)	Data Time 0.001 (0.009)	Loss 3.3560 (3.3863)	Entropy 1.00137 (1.02188)	Top-1 acc 46.484 (43.462)	Top-5 acc 70.312 (67.504)	lr 0.02333
Train [20][3070/3239]	Time 0.568 (0.891)	Data Time 0.001 (0.009)	Loss 3.2743 (3.3861)	Entropy 1.00110 (1.02181)	Top-1 acc 48.047 (43.466)	Top-5 acc 69.141 (67.510)	lr 0.02333
Train [20][3080/3239]	Time 0.631 (0.890)	Data Time 0.001 (0.009)	Loss 3.1479 (3.3859)	Entropy 1.00098 (1.02175)	Top-1 acc 46.094 (43.471)	Top-5 acc 73.438 (67.513)	lr 0.02333
Train [20][3090/3239]	Time 0.596 (0.890)	Data Time 0.001 (0.009)	Loss 3.6526 (3.3860)	Entropy 1.00060 (1.02168)	Top-1 acc 37.891 (43.469)	Top-5 acc 59.766 (67.513)	lr 0.02333
Train [20][3100/3239]	Time 0.590 (0.890)	Data Time 0.001 (0.009)	Loss 3.5788 (3.3860)	Entropy 1.00032 (1.02161)	Top-1 acc 38.672 (43.469)	Top-5 acc 63.672 (67.511)	lr 0.02333
Train [20][3110/3239]	Time 0.598 (0.890)	Data Time 0.001 (0.009)	Loss 3.5653 (3.3860)	Entropy 1.00004 (1.02154)	Top-1 acc 40.625 (43.468)	Top-5 acc 65.625 (67.512)	lr 0.02333
Train [20][3120/3239]	Time 0.634 (0.890)	Data Time 0.001 (0.009)	Loss 3.3698 (3.3859)	Entropy 0.99948 (1.02147)	Top-1 acc 41.406 (43.466)	Top-5 acc 69.531 (67.517)	lr 0.02333
Train [20][3130/3239]	Time 0.723 (0.890)	Data Time 0.001 (0.009)	Loss 3.4465 (3.3859)	Entropy 0.99934 (1.02140)	Top-1 acc 39.844 (43.461)	Top-5 acc 67.969 (67.519)	lr 0.02333
Train [20][3140/3239]	Time 0.596 (0.890)	Data Time 0.001 (0.009)	Loss 3.5999 (3.3859)	Entropy 0.99949 (1.02133)	Top-1 acc 39.062 (43.462)	Top-5 acc 63.281 (67.518)	lr 0.02333
Train [20][3150/3239]	Time 0.590 (0.890)	Data Time 0.001 (0.009)	Loss 3.3700 (3.3859)	Entropy 0.99962 (1.02126)	Top-1 acc 45.312 (43.458)	Top-5 acc 66.797 (67.516)	lr 0.02333
Train [20][3160/3239]	Time 0.593 (0.890)	Data Time 0.001 (0.009)	Loss 3.0999 (3.3858)	Entropy 0.99919 (1.02119)	Top-1 acc 53.125 (43.462)	Top-5 acc 75.000 (67.518)	lr 0.02333
Train [20][3170/3239]	Time 0.596 (0.890)	Data Time 0.001 (0.009)	Loss 3.2807 (3.3859)	Entropy 0.99913 (1.02112)	Top-1 acc 44.922 (43.464)	Top-5 acc 69.922 (67.517)	lr 0.02333
Train [20][3180/3239]	Time 0.591 (0.890)	Data Time 0.000 (0.009)	Loss 3.4681 (3.3858)	Entropy 0.99905 (1.02106)	Top-1 acc 43.750 (43.465)	Top-5 acc 64.453 (67.518)	lr 0.02333
Train [20][3190/3239]	Time 0.603 (0.889)	Data Time 0.000 (0.009)	Loss 3.5155 (3.3860)	Entropy 0.99970 (1.02099)	Top-1 acc 39.062 (43.458)	Top-5 acc 64.062 (67.516)	lr 0.02333
Train [20][3200/3239]	Time 0.614 (0.889)	Data Time 0.000 (0.009)	Loss 3.3705 (3.3861)	Entropy 0.99948 (1.02092)	Top-1 acc 46.484 (43.460)	Top-5 acc 67.578 (67.514)	lr 0.02333
Train [20][3210/3239]	Time 0.570 (0.889)	Data Time 0.000 (0.008)	Loss 3.4513 (3.3861)	Entropy 0.99954 (1.02085)	Top-1 acc 44.922 (43.461)	Top-5 acc 66.797 (67.515)	lr 0.02333
Train [20][3220/3239]	Time 0.601 (0.889)	Data Time 0.000 (0.008)	Loss 3.1857 (3.3858)	Entropy 0.99940 (1.02079)	Top-1 acc 49.219 (43.466)	Top-5 acc 71.484 (67.521)	lr 0.02333
Train [20][3230/3239]	Time 0.615 (0.889)	Data Time 0.000 (0.008)	Loss 3.2088 (3.3858)	Entropy 0.99890 (1.02072)	Top-1 acc 45.312 (43.465)	Top-5 acc 68.750 (67.522)	lr 0.02333
Train [20][3239/3239]	Time 1.497 (0.888)	Data Time 0.000 (0.008)	Loss 3.7127 (3.3859)	Entropy 0.99860 (1.02066)	Top-1 acc 37.037 (43.462)	Top-5 acc 53.086 (67.518)	lr 0.02333
==========Valid [20/120]	loss 2.119	top-1 acc 53.326 (53.326)	top-5 acc 76.792	Train top-1 43.462	top-5 67.518	Entropy 0.99860	Latency-None: 0.000ms	Flops: 539.76M
Train [21][0/3239]	Time 21.906 (21.906)	Data Time 20.492 (20.492)	Loss 3.2462 (3.2462)	Entropy 0.99858 (0.99858)	Top-1 acc 43.359 (43.359)	Top-5 acc 68.359 (68.359)	lr 0.02333
Train [21][10/3239]	Time 0.650 (2.849)	Data Time 0.001 (1.868)	Loss 3.4159 (3.3083)	Entropy 0.99858 (0.99855)	Top-1 acc 43.359 (45.384)	Top-5 acc 68.750 (68.928)	lr 0.02332
Train [21][20/3239]	Time 0.559 (3.074)	Data Time 0.002 (0.980)	Loss 3.2582 (3.3239)	Entropy 0.99877 (0.99859)	Top-1 acc 46.094 (44.922)	Top-5 acc 71.484 (68.341)	lr 0.02332
Train [21][30/3239]	Time 0.717 (2.356)	Data Time 0.001 (0.665)	Loss 3.2653 (3.3185)	Entropy 0.99900 (0.99869)	Top-1 acc 47.266 (45.086)	Top-5 acc 68.359 (68.435)	lr 0.02332
Train [21][40/3239]	Time 0.625 (1.989)	Data Time 0.001 (0.503)	Loss 3.3071 (3.3246)	Entropy 0.99886 (0.99876)	Top-1 acc 44.922 (44.769)	Top-5 acc 68.359 (68.388)	lr 0.02332
Train [21][50/3239]	Time 0.560 (1.766)	Data Time 0.001 (0.405)	Loss 3.3229 (3.3330)	Entropy 0.99889 (0.99877)	Top-1 acc 41.797 (44.646)	Top-5 acc 70.703 (68.329)	lr 0.02332
Train [21][60/3239]	Time 0.660 (1.621)	Data Time 0.001 (0.339)	Loss 3.1438 (3.3377)	Entropy 0.99883 (0.99879)	Top-1 acc 49.609 (44.672)	Top-5 acc 71.484 (68.154)	lr 0.02332
Train [21][70/3239]	Time 0.596 (1.511)	Data Time 0.001 (0.292)	Loss 3.4163 (3.3365)	Entropy 0.99849 (0.99877)	Top-1 acc 43.750 (44.663)	Top-5 acc 66.797 (68.266)	lr 0.02332
Train [21][80/3239]	Time 0.621 (1.431)	Data Time 0.003 (0.256)	Loss 3.2637 (3.3447)	Entropy 0.99861 (0.99875)	Top-1 acc 43.359 (44.334)	Top-5 acc 68.359 (68.138)	lr 0.02332
Train [21][90/3239]	Time 0.617 (1.368)	Data Time 0.002 (0.228)	Loss 3.3455 (3.3439)	Entropy 0.99877 (0.99873)	Top-1 acc 43.750 (44.325)	Top-5 acc 69.141 (68.213)	lr 0.02332
Train [21][100/3239]	Time 0.628 (1.319)	Data Time 0.001 (0.206)	Loss 3.2615 (3.3463)	Entropy 0.99861 (0.99873)	Top-1 acc 50.000 (44.261)	Top-5 acc 68.359 (68.139)	lr 0.02332
Train [21][110/3239]	Time 0.598 (1.275)	Data Time 0.001 (0.187)	Loss 3.2849 (3.3512)	Entropy 0.99855 (0.99872)	Top-1 acc 45.703 (44.084)	Top-5 acc 68.750 (68.074)	lr 0.02332
Train [21][120/3239]	Time 0.722 (1.241)	Data Time 0.001 (0.172)	Loss 3.2673 (3.3455)	Entropy 0.99788 (0.99868)	Top-1 acc 46.094 (44.257)	Top-5 acc 71.875 (68.159)	lr 0.02332
Train [21][130/3239]	Time 0.603 (1.209)	Data Time 0.003 (0.159)	Loss 3.3569 (3.3446)	Entropy 0.99773 (0.99862)	Top-1 acc 43.359 (44.346)	Top-5 acc 67.969 (68.174)	lr 0.02332
Train [21][140/3239]	Time 0.605 (1.184)	Data Time 0.001 (0.148)	Loss 3.2193 (3.3436)	Entropy 0.99800 (0.99856)	Top-1 acc 42.578 (44.323)	Top-5 acc 69.141 (68.182)	lr 0.02332
Train [21][150/3239]	Time 0.632 (1.163)	Data Time 0.001 (0.138)	Loss 3.4672 (3.3482)	Entropy 0.99754 (0.99851)	Top-1 acc 41.016 (44.254)	Top-5 acc 64.844 (68.108)	lr 0.02332
Train [21][160/3239]	Time 0.577 (1.144)	Data Time 0.001 (0.130)	Loss 3.2112 (3.3462)	Entropy 0.99795 (0.99846)	Top-1 acc 46.484 (44.306)	Top-5 acc 67.969 (68.153)	lr 0.02332
Train [21][170/3239]	Time 0.577 (1.128)	Data Time 0.001 (0.122)	Loss 3.4707 (3.3462)	Entropy 0.99777 (0.99843)	Top-1 acc 40.625 (44.282)	Top-5 acc 64.844 (68.147)	lr 0.02332
Train [21][180/3239]	Time 0.662 (1.114)	Data Time 0.001 (0.116)	Loss 3.5247 (3.3481)	Entropy 0.99731 (0.99839)	Top-1 acc 42.969 (44.298)	Top-5 acc 64.062 (68.128)	lr 0.02332
Train [21][190/3239]	Time 0.687 (1.101)	Data Time 0.001 (0.110)	Loss 3.4576 (3.3475)	Entropy 0.99707 (0.99832)	Top-1 acc 42.969 (44.282)	Top-5 acc 65.234 (68.155)	lr 0.02332
Train [21][200/3239]	Time 0.583 (1.088)	Data Time 0.001 (0.104)	Loss 3.3482 (3.3428)	Entropy 0.99701 (0.99826)	Top-1 acc 46.875 (44.407)	Top-5 acc 65.234 (68.252)	lr 0.02332
Train [21][210/3239]	Time 0.582 (1.077)	Data Time 0.001 (0.099)	Loss 3.3652 (3.3419)	Entropy 0.99696 (0.99820)	Top-1 acc 44.531 (44.405)	Top-5 acc 67.578 (68.276)	lr 0.02331
Train [21][220/3239]	Time 0.615 (1.068)	Data Time 0.001 (0.095)	Loss 3.5329 (3.3403)	Entropy 0.99664 (0.99814)	Top-1 acc 39.062 (44.445)	Top-5 acc 60.156 (68.301)	lr 0.02331
Train [21][230/3239]	Time 0.586 (1.059)	Data Time 0.001 (0.091)	Loss 3.2797 (3.3440)	Entropy 0.99663 (0.99808)	Top-1 acc 44.531 (44.360)	Top-5 acc 71.875 (68.217)	lr 0.02331
Train [21][240/3239]	Time 0.586 (1.051)	Data Time 0.001 (0.087)	Loss 3.3841 (3.3414)	Entropy 0.99620 (0.99801)	Top-1 acc 42.188 (44.429)	Top-5 acc 67.969 (68.261)	lr 0.02331
Train [21][250/3239]	Time 0.557 (1.044)	Data Time 0.001 (0.084)	Loss 3.3699 (3.3397)	Entropy 0.99599 (0.99793)	Top-1 acc 44.922 (44.463)	Top-5 acc 67.188 (68.336)	lr 0.02331
Train [21][260/3239]	Time 0.534 (1.037)	Data Time 0.001 (0.081)	Loss 3.6418 (3.3419)	Entropy 0.99627 (0.99786)	Top-1 acc 38.672 (44.435)	Top-5 acc 62.109 (68.301)	lr 0.02331
Train [21][270/3239]	Time 0.568 (1.030)	Data Time 0.001 (0.078)	Loss 3.4286 (3.3461)	Entropy 0.99594 (0.99780)	Top-1 acc 41.797 (44.331)	Top-5 acc 64.453 (68.208)	lr 0.02331
Train [21][280/3239]	Time 0.683 (1.023)	Data Time 0.001 (0.075)	Loss 3.2576 (3.3438)	Entropy 0.99561 (0.99773)	Top-1 acc 45.312 (44.410)	Top-5 acc 71.875 (68.284)	lr 0.02331
Train [21][290/3239]	Time 0.597 (1.017)	Data Time 0.002 (0.073)	Loss 3.2956 (3.3439)	Entropy 0.99563 (0.99766)	Top-1 acc 44.922 (44.413)	Top-5 acc 67.188 (68.282)	lr 0.02331
Train [21][300/3239]	Time 0.606 (1.011)	Data Time 0.001 (0.070)	Loss 3.3979 (3.3471)	Entropy 0.99533 (0.99759)	Top-1 acc 45.312 (44.351)	Top-5 acc 65.234 (68.210)	lr 0.02331
Train [21][310/3239]	Time 0.611 (1.005)	Data Time 0.001 (0.068)	Loss 3.3703 (3.3478)	Entropy 0.99537 (0.99752)	Top-1 acc 39.453 (44.318)	Top-5 acc 67.188 (68.210)	lr 0.02331
Train [21][320/3239]	Time 0.606 (1.001)	Data Time 0.001 (0.066)	Loss 3.5279 (3.3493)	Entropy 0.99525 (0.99745)	Top-1 acc 41.016 (44.278)	Top-5 acc 66.797 (68.191)	lr 0.02331
Train [21][330/3239]	Time 0.617 (0.997)	Data Time 0.002 (0.064)	Loss 3.4589 (3.3500)	Entropy 0.99465 (0.99738)	Top-1 acc 41.406 (44.276)	Top-5 acc 65.234 (68.166)	lr 0.02331
Train [21][340/3239]	Time 0.631 (0.993)	Data Time 0.001 (0.062)	Loss 3.3523 (3.3496)	Entropy 0.99465 (0.99730)	Top-1 acc 44.531 (44.319)	Top-5 acc 67.969 (68.149)	lr 0.02331
Train [21][350/3239]	Time 0.685 (0.989)	Data Time 0.001 (0.061)	Loss 3.3363 (3.3500)	Entropy 0.99422 (0.99722)	Top-1 acc 44.141 (44.306)	Top-5 acc 67.188 (68.131)	lr 0.02331
Train [21][360/3239]	Time 0.616 (0.985)	Data Time 0.001 (0.059)	Loss 3.4210 (3.3515)	Entropy 0.99379 (0.99713)	Top-1 acc 43.359 (44.319)	Top-5 acc 68.750 (68.142)	lr 0.02331
Train [21][370/3239]	Time 0.596 (0.982)	Data Time 0.001 (0.057)	Loss 3.2981 (3.3526)	Entropy 0.99355 (0.99704)	Top-1 acc 48.047 (44.278)	Top-5 acc 71.094 (68.134)	lr 0.02331
Train [21][380/3239]	Time 0.607 (0.979)	Data Time 0.001 (0.056)	Loss 3.3570 (3.3533)	Entropy 0.99384 (0.99695)	Top-1 acc 45.312 (44.261)	Top-5 acc 68.750 (68.161)	lr 0.02331
Train [21][390/3239]	Time 0.597 (0.975)	Data Time 0.001 (0.055)	Loss 3.4061 (3.3518)	Entropy 0.99341 (0.99687)	Top-1 acc 44.922 (44.283)	Top-5 acc 68.359 (68.206)	lr 0.02331
Train [21][400/3239]	Time 0.603 (0.973)	Data Time 0.001 (0.053)	Loss 3.4334 (3.3522)	Entropy 0.99317 (0.99678)	Top-1 acc 40.234 (44.262)	Top-5 acc 68.750 (68.187)	lr 0.02331
Train [21][410/3239]	Time 0.603 (0.970)	Data Time 0.001 (0.052)	Loss 3.2130 (3.3504)	Entropy 0.99309 (0.99669)	Top-1 acc 46.094 (44.281)	Top-5 acc 70.312 (68.232)	lr 0.02330
Train [21][420/3239]	Time 0.598 (0.968)	Data Time 0.001 (0.051)	Loss 3.2806 (3.3511)	Entropy 0.99321 (0.99660)	Top-1 acc 48.047 (44.273)	Top-5 acc 70.703 (68.219)	lr 0.02330
Train [21][430/3239]	Time 0.564 (0.965)	Data Time 0.001 (0.050)	Loss 3.4765 (3.3520)	Entropy 0.99348 (0.99652)	Top-1 acc 41.406 (44.229)	Top-5 acc 63.672 (68.223)	lr 0.02330
Train [21][440/3239]	Time 0.628 (0.963)	Data Time 0.002 (0.049)	Loss 3.2793 (3.3509)	Entropy 0.99332 (0.99645)	Top-1 acc 44.922 (44.236)	Top-5 acc 68.359 (68.229)	lr 0.02330
Train [21][450/3239]	Time 0.469 (0.961)	Data Time 0.001 (0.048)	Loss 3.5719 (3.3512)	Entropy 0.99365 (0.99638)	Top-1 acc 37.109 (44.255)	Top-5 acc 64.062 (68.223)	lr 0.02330
Train [21][460/3239]	Time 0.614 (0.958)	Data Time 0.001 (0.047)	Loss 3.4011 (3.3518)	Entropy 0.99356 (0.99633)	Top-1 acc 42.578 (44.220)	Top-5 acc 68.750 (68.214)	lr 0.02330
Train [21][470/3239]	Time 0.623 (0.956)	Data Time 0.002 (0.046)	Loss 3.7433 (3.3512)	Entropy 0.99289 (0.99626)	Top-1 acc 36.719 (44.238)	Top-5 acc 60.547 (68.218)	lr 0.02330
Train [21][480/3239]	Time 0.616 (0.953)	Data Time 0.001 (0.045)	Loss 3.4818 (3.3508)	Entropy 0.99286 (0.99619)	Top-1 acc 42.969 (44.262)	Top-5 acc 65.625 (68.222)	lr 0.02330
Train [21][490/3239]	Time 0.584 (0.950)	Data Time 0.001 (0.044)	Loss 3.4858 (3.3511)	Entropy 0.99275 (0.99612)	Top-1 acc 39.844 (44.258)	Top-5 acc 66.797 (68.229)	lr 0.02330
Train [21][500/3239]	Time 0.637 (0.949)	Data Time 0.001 (0.043)	Loss 3.2598 (3.3514)	Entropy 0.99232 (0.99605)	Top-1 acc 45.703 (44.247)	Top-5 acc 72.266 (68.224)	lr 0.02330
Train [21][510/3239]	Time 0.721 (0.947)	Data Time 0.001 (0.042)	Loss 3.1601 (3.3514)	Entropy 0.99228 (0.99598)	Top-1 acc 45.312 (44.233)	Top-5 acc 73.438 (68.216)	lr 0.02330
Train [21][520/3239]	Time 0.552 (0.945)	Data Time 0.001 (0.042)	Loss 3.3681 (3.3521)	Entropy 0.99251 (0.99591)	Top-1 acc 44.531 (44.227)	Top-5 acc 66.797 (68.209)	lr 0.02330
Train [21][530/3239]	Time 0.625 (0.944)	Data Time 0.001 (0.041)	Loss 3.5725 (3.3527)	Entropy 0.99294 (0.99585)	Top-1 acc 36.328 (44.206)	Top-5 acc 66.797 (68.191)	lr 0.02330
Train [21][540/3239]	Time 0.623 (0.943)	Data Time 0.003 (0.040)	Loss 3.2557 (3.3524)	Entropy 0.99270 (0.99579)	Top-1 acc 47.266 (44.216)	Top-5 acc 69.922 (68.174)	lr 0.02330
Train [21][550/3239]	Time 0.584 (0.941)	Data Time 0.001 (0.039)	Loss 3.4033 (3.3525)	Entropy 0.99245 (0.99574)	Top-1 acc 44.922 (44.204)	Top-5 acc 69.141 (68.184)	lr 0.02330
Train [21][560/3239]	Time 0.618 (0.940)	Data Time 0.002 (0.039)	Loss 3.3498 (3.3527)	Entropy 0.99271 (0.99568)	Top-1 acc 43.750 (44.191)	Top-5 acc 70.312 (68.176)	lr 0.02330
Train [21][570/3239]	Time 0.588 (0.938)	Data Time 0.001 (0.038)	Loss 3.3925 (3.3522)	Entropy 0.99233 (0.99563)	Top-1 acc 41.016 (44.195)	Top-5 acc 67.578 (68.184)	lr 0.02330
Train [21][580/3239]	Time 0.690 (0.937)	Data Time 0.001 (0.038)	Loss 3.2341 (3.3527)	Entropy 0.99202 (0.99557)	Top-1 acc 46.875 (44.194)	Top-5 acc 71.875 (68.183)	lr 0.02330
Train [21][590/3239]	Time 0.593 (0.935)	Data Time 0.001 (0.037)	Loss 3.3639 (3.3529)	Entropy 0.99234 (0.99551)	Top-1 acc 45.312 (44.178)	Top-5 acc 67.578 (68.177)	lr 0.02330
Train [21][600/3239]	Time 0.657 (0.934)	Data Time 0.001 (0.036)	Loss 3.2887 (3.3528)	Entropy 0.99184 (0.99545)	Top-1 acc 51.172 (44.197)	Top-5 acc 71.094 (68.179)	lr 0.02329
Train [21][610/3239]	Time 0.613 (0.933)	Data Time 0.001 (0.036)	Loss 3.3686 (3.3533)	Entropy 0.99129 (0.99539)	Top-1 acc 45.703 (44.180)	Top-5 acc 68.750 (68.168)	lr 0.02329
Train [21][620/3239]	Time 0.592 (0.932)	Data Time 0.001 (0.035)	Loss 3.3449 (3.3535)	Entropy 0.99147 (0.99533)	Top-1 acc 44.922 (44.171)	Top-5 acc 69.141 (68.167)	lr 0.02329
Train [21][630/3239]	Time 0.600 (0.931)	Data Time 0.002 (0.035)	Loss 3.4336 (3.3527)	Entropy 0.99096 (0.99526)	Top-1 acc 39.453 (44.173)	Top-5 acc 67.969 (68.179)	lr 0.02329
Train [21][640/3239]	Time 0.640 (0.929)	Data Time 0.001 (0.034)	Loss 3.3606 (3.3525)	Entropy 0.99085 (0.99520)	Top-1 acc 39.844 (44.188)	Top-5 acc 69.922 (68.189)	lr 0.02329
Train [21][650/3239]	Time 0.579 (0.928)	Data Time 0.001 (0.034)	Loss 3.2433 (3.3527)	Entropy 0.99057 (0.99513)	Top-1 acc 45.703 (44.174)	Top-5 acc 70.312 (68.183)	lr 0.02329
Train [21][660/3239]	Time 0.594 (0.926)	Data Time 0.001 (0.033)	Loss 3.2459 (3.3527)	Entropy 0.99055 (0.99506)	Top-1 acc 43.359 (44.179)	Top-5 acc 69.531 (68.177)	lr 0.02329
Train [21][670/3239]	Time 0.865 (0.957)	Data Time 0.005 (0.033)	Loss 3.4000 (3.3535)	Entropy 0.99048 (0.99499)	Top-1 acc 42.578 (44.141)	Top-5 acc 69.531 (68.163)	lr 0.02329
Train [21][680/3239]	Time 0.618 (0.956)	Data Time 0.002 (0.032)	Loss 3.3158 (3.3528)	Entropy 0.99046 (0.99492)	Top-1 acc 47.656 (44.170)	Top-5 acc 68.750 (68.188)	lr 0.02329
Train [21][690/3239]	Time 0.607 (0.955)	Data Time 0.001 (0.032)	Loss 3.6020 (3.3530)	Entropy 0.99062 (0.99486)	Top-1 acc 41.016 (44.152)	Top-5 acc 59.766 (68.176)	lr 0.02329
Train [21][700/3239]	Time 0.628 (0.954)	Data Time 0.002 (0.031)	Loss 3.2404 (3.3540)	Entropy 0.99003 (0.99479)	Top-1 acc 44.531 (44.119)	Top-5 acc 68.750 (68.150)	lr 0.02329
Train [21][710/3239]	Time 0.596 (0.953)	Data Time 0.002 (0.031)	Loss 3.4065 (3.3554)	Entropy 0.99010 (0.99473)	Top-1 acc 44.141 (44.082)	Top-5 acc 67.969 (68.133)	lr 0.02329
Train [21][720/3239]	Time 0.595 (0.951)	Data Time 0.005 (0.031)	Loss 3.4426 (3.3553)	Entropy 0.99024 (0.99466)	Top-1 acc 43.359 (44.085)	Top-5 acc 66.016 (68.136)	lr 0.02329
Train [21][730/3239]	Time 0.612 (0.950)	Data Time 0.001 (0.030)	Loss 3.2762 (3.3550)	Entropy 0.99009 (0.99460)	Top-1 acc 45.312 (44.081)	Top-5 acc 69.531 (68.138)	lr 0.02329
Train [21][740/3239]	Time 0.672 (0.949)	Data Time 0.001 (0.030)	Loss 3.3756 (3.3549)	Entropy 0.98963 (0.99454)	Top-1 acc 42.969 (44.084)	Top-5 acc 66.016 (68.136)	lr 0.02329
Train [21][750/3239]	Time 0.586 (0.948)	Data Time 0.001 (0.030)	Loss 3.5455 (3.3551)	Entropy 0.98920 (0.99447)	Top-1 acc 40.234 (44.096)	Top-5 acc 62.109 (68.129)	lr 0.02329
Train [21][760/3239]	Time 0.618 (0.947)	Data Time 0.001 (0.029)	Loss 3.4454 (3.3548)	Entropy 0.98897 (0.99440)	Top-1 acc 41.016 (44.107)	Top-5 acc 67.188 (68.144)	lr 0.02329
Train [21][770/3239]	Time 0.613 (0.946)	Data Time 0.001 (0.029)	Loss 3.3330 (3.3550)	Entropy 0.98901 (0.99433)	Top-1 acc 41.016 (44.096)	Top-5 acc 65.625 (68.136)	lr 0.02329
Train [21][780/3239]	Time 0.613 (0.944)	Data Time 0.001 (0.029)	Loss 3.3237 (3.3549)	Entropy 0.98865 (0.99426)	Top-1 acc 43.750 (44.105)	Top-5 acc 67.578 (68.124)	lr 0.02329
Train [21][790/3239]	Time 0.566 (0.943)	Data Time 0.001 (0.028)	Loss 3.4673 (3.3552)	Entropy 0.98812 (0.99419)	Top-1 acc 43.750 (44.104)	Top-5 acc 67.969 (68.129)	lr 0.02329
Train [21][800/3239]	Time 0.554 (0.942)	Data Time 0.001 (0.028)	Loss 3.3708 (3.3566)	Entropy 0.98785 (0.99411)	Top-1 acc 43.750 (44.070)	Top-5 acc 64.453 (68.087)	lr 0.02328
Train [21][810/3239]	Time 0.593 (0.941)	Data Time 0.001 (0.028)	Loss 3.5286 (3.3572)	Entropy 0.98736 (0.99403)	Top-1 acc 40.234 (44.050)	Top-5 acc 64.453 (68.074)	lr 0.02328
Train [21][820/3239]	Time 0.559 (0.940)	Data Time 0.002 (0.027)	Loss 3.4545 (3.3572)	Entropy 0.98694 (0.99395)	Top-1 acc 40.625 (44.045)	Top-5 acc 65.625 (68.068)	lr 0.02328
Train [21][830/3239]	Time 0.605 (0.939)	Data Time 0.002 (0.027)	Loss 3.3013 (3.3567)	Entropy 0.98703 (0.99387)	Top-1 acc 46.484 (44.064)	Top-5 acc 68.359 (68.079)	lr 0.02328
Train [21][840/3239]	Time 0.600 (0.938)	Data Time 0.001 (0.027)	Loss 3.4867 (3.3568)	Entropy 0.98680 (0.99378)	Top-1 acc 41.406 (44.056)	Top-5 acc 63.281 (68.076)	lr 0.02328
Train [21][850/3239]	Time 0.645 (0.937)	Data Time 0.002 (0.026)	Loss 3.3091 (3.3566)	Entropy 0.98666 (0.99370)	Top-1 acc 42.969 (44.065)	Top-5 acc 68.359 (68.077)	lr 0.02328
Train [21][860/3239]	Time 0.575 (0.936)	Data Time 0.001 (0.026)	Loss 3.2057 (3.3560)	Entropy 0.98679 (0.99362)	Top-1 acc 47.656 (44.074)	Top-5 acc 71.094 (68.090)	lr 0.02328
Train [21][870/3239]	Time 0.546 (0.935)	Data Time 0.001 (0.026)	Loss 3.4343 (3.3560)	Entropy 0.98686 (0.99354)	Top-1 acc 46.094 (44.078)	Top-5 acc 64.453 (68.084)	lr 0.02328
Train [21][880/3239]	Time 0.575 (0.935)	Data Time 0.001 (0.026)	Loss 3.3115 (3.3562)	Entropy 0.98696 (0.99347)	Top-1 acc 44.141 (44.073)	Top-5 acc 70.703 (68.085)	lr 0.02328
Train [21][890/3239]	Time 0.609 (0.934)	Data Time 0.001 (0.025)	Loss 3.4191 (3.3558)	Entropy 0.98674 (0.99339)	Top-1 acc 43.750 (44.071)	Top-5 acc 66.406 (68.082)	lr 0.02328
Train [21][900/3239]	Time 0.711 (0.933)	Data Time 0.001 (0.025)	Loss 3.3454 (3.3559)	Entropy 0.98681 (0.99332)	Top-1 acc 46.094 (44.065)	Top-5 acc 70.312 (68.087)	lr 0.02328
Train [21][910/3239]	Time 0.599 (0.932)	Data Time 0.001 (0.025)	Loss 3.2310 (3.3559)	Entropy 0.98652 (0.99324)	Top-1 acc 48.828 (44.072)	Top-5 acc 71.484 (68.082)	lr 0.02328
Train [21][920/3239]	Time 0.596 (0.932)	Data Time 0.001 (0.024)	Loss 3.3323 (3.3569)	Entropy 0.98646 (0.99317)	Top-1 acc 45.703 (44.048)	Top-5 acc 65.625 (68.060)	lr 0.02328
Train [21][930/3239]	Time 0.551 (0.931)	Data Time 0.002 (0.024)	Loss 3.2675 (3.3565)	Entropy 0.98556 (0.99310)	Top-1 acc 46.484 (44.062)	Top-5 acc 68.359 (68.066)	lr 0.02328
Train [21][940/3239]	Time 0.621 (0.930)	Data Time 0.001 (0.024)	Loss 3.1176 (3.3558)	Entropy 0.98572 (0.99302)	Top-1 acc 50.781 (44.083)	Top-5 acc 72.266 (68.074)	lr 0.02328
Train [21][950/3239]	Time 0.636 (0.929)	Data Time 0.001 (0.024)	Loss 3.2060 (3.3565)	Entropy 0.98499 (0.99294)	Top-1 acc 47.656 (44.072)	Top-5 acc 70.703 (68.063)	lr 0.02328
Train [21][960/3239]	Time 0.620 (0.928)	Data Time 0.002 (0.024)	Loss 3.3642 (3.3569)	Entropy 0.98449 (0.99285)	Top-1 acc 42.188 (44.068)	Top-5 acc 70.703 (68.055)	lr 0.02328
Train [21][970/3239]	Time 0.699 (0.927)	Data Time 0.002 (0.023)	Loss 3.3377 (3.3573)	Entropy 0.98442 (0.99277)	Top-1 acc 43.359 (44.060)	Top-5 acc 68.359 (68.058)	lr 0.02328
Train [21][980/3239]	Time 0.622 (0.927)	Data Time 0.001 (0.023)	Loss 3.1598 (3.3570)	Entropy 0.98426 (0.99268)	Top-1 acc 51.172 (44.058)	Top-5 acc 71.484 (68.067)	lr 0.02328
Train [21][990/3239]	Time 0.611 (0.926)	Data Time 0.001 (0.023)	Loss 3.2529 (3.3565)	Entropy 0.98369 (0.99259)	Top-1 acc 47.266 (44.073)	Top-5 acc 71.484 (68.074)	lr 0.02327
Train [21][1000/3239]	Time 0.615 (0.926)	Data Time 0.001 (0.023)	Loss 3.3798 (3.3563)	Entropy 0.98344 (0.99250)	Top-1 acc 43.750 (44.079)	Top-5 acc 66.797 (68.074)	lr 0.02327
Train [21][1010/3239]	Time 0.585 (0.925)	Data Time 0.001 (0.023)	Loss 3.5664 (3.3556)	Entropy 0.98409 (0.99242)	Top-1 acc 42.578 (44.095)	Top-5 acc 64.453 (68.089)	lr 0.02327
Train [21][1020/3239]	Time 0.601 (0.925)	Data Time 0.001 (0.022)	Loss 3.0427 (3.3551)	Entropy 0.98410 (0.99233)	Top-1 acc 50.000 (44.103)	Top-5 acc 74.609 (68.106)	lr 0.02327
Train [21][1030/3239]	Time 0.628 (0.924)	Data Time 0.001 (0.022)	Loss 3.3784 (3.3552)	Entropy 0.98382 (0.99225)	Top-1 acc 46.094 (44.106)	Top-5 acc 67.188 (68.106)	lr 0.02327
Train [21][1040/3239]	Time 0.632 (0.923)	Data Time 0.001 (0.022)	Loss 3.2114 (3.3550)	Entropy 0.98359 (0.99217)	Top-1 acc 48.047 (44.115)	Top-5 acc 69.141 (68.103)	lr 0.02327
Train [21][1050/3239]	Time 0.578 (0.923)	Data Time 0.001 (0.022)	Loss 3.5725 (3.3550)	Entropy 0.98357 (0.99209)	Top-1 acc 40.234 (44.111)	Top-5 acc 62.891 (68.101)	lr 0.02327
Train [21][1060/3239]	Time 0.698 (0.922)	Data Time 0.001 (0.022)	Loss 3.2484 (3.3551)	Entropy 0.98340 (0.99201)	Top-1 acc 46.875 (44.105)	Top-5 acc 73.438 (68.102)	lr 0.02327
Train [21][1070/3239]	Time 0.632 (0.922)	Data Time 0.001 (0.021)	Loss 3.3721 (3.3557)	Entropy 0.98369 (0.99193)	Top-1 acc 42.188 (44.089)	Top-5 acc 65.234 (68.089)	lr 0.02327
Train [21][1080/3239]	Time 0.606 (0.921)	Data Time 0.002 (0.021)	Loss 3.3619 (3.3556)	Entropy 0.98334 (0.99185)	Top-1 acc 41.406 (44.091)	Top-5 acc 67.969 (68.095)	lr 0.02327
Train [21][1090/3239]	Time 0.605 (0.921)	Data Time 0.001 (0.021)	Loss 3.2046 (3.3554)	Entropy 0.98322 (0.99177)	Top-1 acc 48.828 (44.101)	Top-5 acc 71.484 (68.099)	lr 0.02327
Train [21][1100/3239]	Time 0.614 (0.920)	Data Time 0.002 (0.021)	Loss 3.3846 (3.3556)	Entropy 0.98350 (0.99170)	Top-1 acc 45.312 (44.099)	Top-5 acc 70.703 (68.095)	lr 0.02327
Train [21][1110/3239]	Time 0.602 (0.919)	Data Time 0.001 (0.021)	Loss 3.3412 (3.3555)	Entropy 0.98349 (0.99162)	Top-1 acc 43.750 (44.099)	Top-5 acc 67.578 (68.093)	lr 0.02327
Train [21][1120/3239]	Time 0.552 (0.918)	Data Time 0.001 (0.021)	Loss 3.3766 (3.3548)	Entropy 0.98383 (0.99155)	Top-1 acc 42.578 (44.104)	Top-5 acc 67.578 (68.106)	lr 0.02327
Train [21][1130/3239]	Time 0.756 (0.918)	Data Time 0.001 (0.020)	Loss 3.2793 (3.3549)	Entropy 0.98372 (0.99148)	Top-1 acc 48.047 (44.105)	Top-5 acc 66.797 (68.107)	lr 0.02327
Train [21][1140/3239]	Time 0.564 (0.917)	Data Time 0.001 (0.020)	Loss 3.2664 (3.3550)	Entropy 0.98357 (0.99141)	Top-1 acc 44.141 (44.109)	Top-5 acc 68.359 (68.102)	lr 0.02327
Train [21][1150/3239]	Time 0.589 (0.916)	Data Time 0.001 (0.020)	Loss 3.6825 (3.3550)	Entropy 0.98337 (0.99135)	Top-1 acc 39.062 (44.105)	Top-5 acc 61.719 (68.107)	lr 0.02327
Train [21][1160/3239]	Time 0.597 (0.916)	Data Time 0.001 (0.020)	Loss 3.3212 (3.3547)	Entropy 0.98308 (0.99128)	Top-1 acc 47.656 (44.105)	Top-5 acc 69.922 (68.107)	lr 0.02327
Train [21][1170/3239]	Time 0.603 (0.916)	Data Time 0.001 (0.020)	Loss 3.2397 (3.3551)	Entropy 0.98296 (0.99121)	Top-1 acc 48.047 (44.096)	Top-5 acc 72.656 (68.111)	lr 0.02327
Train [21][1180/3239]	Time 0.602 (0.915)	Data Time 0.003 (0.020)	Loss 3.4420 (3.3552)	Entropy 0.98331 (0.99114)	Top-1 acc 42.969 (44.096)	Top-5 acc 65.234 (68.109)	lr 0.02327
Train [21][1190/3239]	Time 0.596 (0.915)	Data Time 0.001 (0.019)	Loss 3.3668 (3.3553)	Entropy 0.98310 (0.99107)	Top-1 acc 46.094 (44.086)	Top-5 acc 68.750 (68.102)	lr 0.02326
Train [21][1200/3239]	Time 0.639 (0.914)	Data Time 0.001 (0.019)	Loss 3.4570 (3.3548)	Entropy 0.98317 (0.99100)	Top-1 acc 41.016 (44.091)	Top-5 acc 64.062 (68.116)	lr 0.02326
Train [21][1210/3239]	Time 0.610 (0.914)	Data Time 0.001 (0.019)	Loss 3.2986 (3.3548)	Entropy 0.98314 (0.99094)	Top-1 acc 45.312 (44.089)	Top-5 acc 68.359 (68.116)	lr 0.02326
Train [21][1220/3239]	Time 0.580 (0.913)	Data Time 0.001 (0.019)	Loss 3.2958 (3.3552)	Entropy 0.98308 (0.99087)	Top-1 acc 48.047 (44.081)	Top-5 acc 66.797 (68.104)	lr 0.02326
Train [21][1230/3239]	Time 0.634 (0.913)	Data Time 0.001 (0.019)	Loss 3.2222 (3.3554)	Entropy 0.98316 (0.99081)	Top-1 acc 48.047 (44.084)	Top-5 acc 71.875 (68.098)	lr 0.02326
Train [21][1240/3239]	Time 0.661 (0.912)	Data Time 0.001 (0.019)	Loss 3.1597 (3.3547)	Entropy 0.98320 (0.99075)	Top-1 acc 45.312 (44.100)	Top-5 acc 72.266 (68.110)	lr 0.02326
Train [21][1250/3239]	Time 0.592 (0.912)	Data Time 0.001 (0.019)	Loss 3.2334 (3.3547)	Entropy 0.98302 (0.99069)	Top-1 acc 44.531 (44.107)	Top-5 acc 71.484 (68.115)	lr 0.02326
Train [21][1260/3239]	Time 0.577 (0.911)	Data Time 0.001 (0.018)	Loss 3.2656 (3.3551)	Entropy 0.98269 (0.99063)	Top-1 acc 46.094 (44.093)	Top-5 acc 70.703 (68.104)	lr 0.02326
Train [21][1270/3239]	Time 0.615 (0.911)	Data Time 0.001 (0.018)	Loss 3.1490 (3.3551)	Entropy 0.98273 (0.99056)	Top-1 acc 46.094 (44.088)	Top-5 acc 71.484 (68.104)	lr 0.02326
Train [21][1280/3239]	Time 0.488 (0.910)	Data Time 0.001 (0.018)	Loss 3.2223 (3.3551)	Entropy 0.98263 (0.99050)	Top-1 acc 47.656 (44.090)	Top-5 acc 68.750 (68.098)	lr 0.02326
Train [21][1290/3239]	Time 0.699 (0.910)	Data Time 0.001 (0.018)	Loss 3.6042 (3.3552)	Entropy 0.98208 (0.99044)	Top-1 acc 39.453 (44.082)	Top-5 acc 59.766 (68.099)	lr 0.02326
Train [21][1300/3239]	Time 0.546 (0.909)	Data Time 0.001 (0.018)	Loss 3.7944 (3.3561)	Entropy 0.98186 (0.99037)	Top-1 acc 35.547 (44.060)	Top-5 acc 58.203 (68.088)	lr 0.02326
Train [21][1310/3239]	Time 0.589 (0.909)	Data Time 0.001 (0.018)	Loss 3.5077 (3.3564)	Entropy 0.98186 (0.99031)	Top-1 acc 40.625 (44.052)	Top-5 acc 67.188 (68.089)	lr 0.02326
Train [21][1320/3239]	Time 0.583 (0.908)	Data Time 0.001 (0.018)	Loss 3.4569 (3.3560)	Entropy 0.98171 (0.99024)	Top-1 acc 41.406 (44.050)	Top-5 acc 69.531 (68.093)	lr 0.02326
Train [21][1330/3239]	Time 0.608 (0.925)	Data Time 0.002 (0.018)	Loss 3.1559 (3.3554)	Entropy 0.98143 (0.99018)	Top-1 acc 49.609 (44.070)	Top-5 acc 72.656 (68.108)	lr 0.02326
Train [21][1340/3239]	Time 0.601 (0.924)	Data Time 0.002 (0.017)	Loss 3.4766 (3.3555)	Entropy 0.98178 (0.99011)	Top-1 acc 42.969 (44.061)	Top-5 acc 66.016 (68.107)	lr 0.02326
Train [21][1350/3239]	Time 0.623 (0.924)	Data Time 0.003 (0.017)	Loss 3.5409 (3.3559)	Entropy 0.98168 (0.99005)	Top-1 acc 42.578 (44.055)	Top-5 acc 65.234 (68.099)	lr 0.02326
Train [21][1360/3239]	Time 0.606 (0.923)	Data Time 0.001 (0.017)	Loss 3.2878 (3.3563)	Entropy 0.98140 (0.98999)	Top-1 acc 42.578 (44.047)	Top-5 acc 70.703 (68.090)	lr 0.02326
Train [21][1370/3239]	Time 0.610 (0.923)	Data Time 0.001 (0.017)	Loss 3.5254 (3.3561)	Entropy 0.98177 (0.98993)	Top-1 acc 39.062 (44.041)	Top-5 acc 66.406 (68.097)	lr 0.02326
Train [21][1380/3239]	Time 0.578 (0.922)	Data Time 0.001 (0.017)	Loss 3.6350 (3.3562)	Entropy 0.98147 (0.98987)	Top-1 acc 36.328 (44.038)	Top-5 acc 62.500 (68.095)	lr 0.02325
Train [21][1390/3239]	Time 0.613 (0.922)	Data Time 0.001 (0.017)	Loss 3.2631 (3.3565)	Entropy 0.98177 (0.98981)	Top-1 acc 46.875 (44.026)	Top-5 acc 71.094 (68.089)	lr 0.02325
Train [21][1400/3239]	Time 0.641 (0.922)	Data Time 0.001 (0.017)	Loss 3.2316 (3.3568)	Entropy 0.98192 (0.98975)	Top-1 acc 45.312 (44.015)	Top-5 acc 72.656 (68.089)	lr 0.02325
Train [21][1410/3239]	Time 0.459 (0.921)	Data Time 0.001 (0.017)	Loss 3.2289 (3.3564)	Entropy 0.98170 (0.98970)	Top-1 acc 47.266 (44.022)	Top-5 acc 67.188 (68.095)	lr 0.02325
Train [21][1420/3239]	Time 0.589 (0.921)	Data Time 0.001 (0.017)	Loss 3.4607 (3.3565)	Entropy 0.98172 (0.98964)	Top-1 acc 44.531 (44.024)	Top-5 acc 66.797 (68.090)	lr 0.02325
Train [21][1430/3239]	Time 0.639 (0.920)	Data Time 0.001 (0.016)	Loss 3.3944 (3.3565)	Entropy 0.98150 (0.98958)	Top-1 acc 39.844 (44.025)	Top-5 acc 64.844 (68.086)	lr 0.02325
Train [21][1440/3239]	Time 0.620 (0.919)	Data Time 0.001 (0.016)	Loss 3.4994 (3.3567)	Entropy 0.98129 (0.98953)	Top-1 acc 41.016 (44.024)	Top-5 acc 62.891 (68.081)	lr 0.02325
Train [21][1450/3239]	Time 0.688 (0.919)	Data Time 0.001 (0.016)	Loss 3.4892 (3.3565)	Entropy 0.98111 (0.98947)	Top-1 acc 40.625 (44.031)	Top-5 acc 65.234 (68.083)	lr 0.02325
Train [21][1460/3239]	Time 0.616 (0.919)	Data Time 0.001 (0.016)	Loss 3.2959 (3.3562)	Entropy 0.98080 (0.98941)	Top-1 acc 44.922 (44.040)	Top-5 acc 69.922 (68.092)	lr 0.02325
Train [21][1470/3239]	Time 0.605 (0.918)	Data Time 0.001 (0.016)	Loss 3.5010 (3.3562)	Entropy 0.98087 (0.98935)	Top-1 acc 39.062 (44.041)	Top-5 acc 67.188 (68.092)	lr 0.02325
Train [21][1480/3239]	Time 0.622 (0.918)	Data Time 0.001 (0.016)	Loss 3.5584 (3.3560)	Entropy 0.98082 (0.98930)	Top-1 acc 37.500 (44.043)	Top-5 acc 66.406 (68.097)	lr 0.02325
Train [21][1490/3239]	Time 0.588 (0.917)	Data Time 0.001 (0.016)	Loss 3.3072 (3.3559)	Entropy 0.98057 (0.98924)	Top-1 acc 48.438 (44.050)	Top-5 acc 70.312 (68.100)	lr 0.02325
Train [21][1500/3239]	Time 0.625 (0.917)	Data Time 0.001 (0.016)	Loss 3.1099 (3.3559)	Entropy 0.98072 (0.98918)	Top-1 acc 52.344 (44.051)	Top-5 acc 75.391 (68.104)	lr 0.02325
Train [21][1510/3239]	Time 0.632 (0.917)	Data Time 0.001 (0.016)	Loss 3.2395 (3.3559)	Entropy 0.98056 (0.98912)	Top-1 acc 46.094 (44.048)	Top-5 acc 70.703 (68.105)	lr 0.02325
Train [21][1520/3239]	Time 0.695 (0.916)	Data Time 0.001 (0.016)	Loss 3.3377 (3.3561)	Entropy 0.98035 (0.98907)	Top-1 acc 45.703 (44.053)	Top-5 acc 68.359 (68.096)	lr 0.02325
Train [21][1530/3239]	Time 0.663 (0.916)	Data Time 0.001 (0.016)	Loss 3.3478 (3.3562)	Entropy 0.98010 (0.98901)	Top-1 acc 42.188 (44.061)	Top-5 acc 65.625 (68.094)	lr 0.02325
Train [21][1540/3239]	Time 0.618 (0.916)	Data Time 0.001 (0.015)	Loss 3.3006 (3.3561)	Entropy 0.97993 (0.98895)	Top-1 acc 44.922 (44.064)	Top-5 acc 72.266 (68.099)	lr 0.02325
Train [21][1550/3239]	Time 0.578 (0.915)	Data Time 0.001 (0.015)	Loss 3.5372 (3.3561)	Entropy 0.97972 (0.98889)	Top-1 acc 38.672 (44.066)	Top-5 acc 63.281 (68.094)	lr 0.02325
Train [21][1560/3239]	Time 0.620 (0.915)	Data Time 0.001 (0.015)	Loss 3.6129 (3.3564)	Entropy 0.97982 (0.98883)	Top-1 acc 37.891 (44.060)	Top-5 acc 63.281 (68.085)	lr 0.02325
Train [21][1570/3239]	Time 0.555 (0.915)	Data Time 0.001 (0.015)	Loss 3.3622 (3.3564)	Entropy 0.97953 (0.98878)	Top-1 acc 44.141 (44.057)	Top-5 acc 67.969 (68.087)	lr 0.02325
Train [21][1580/3239]	Time 0.622 (0.914)	Data Time 0.001 (0.015)	Loss 3.3996 (3.3564)	Entropy 0.97951 (0.98872)	Top-1 acc 44.141 (44.058)	Top-5 acc 69.922 (68.090)	lr 0.02324
Train [21][1590/3239]	Time 0.596 (0.914)	Data Time 0.001 (0.015)	Loss 3.2803 (3.3562)	Entropy 0.97929 (0.98866)	Top-1 acc 46.094 (44.067)	Top-5 acc 73.047 (68.096)	lr 0.02324
Train [21][1600/3239]	Time 0.624 (0.913)	Data Time 0.001 (0.015)	Loss 3.4607 (3.3563)	Entropy 0.97956 (0.98860)	Top-1 acc 41.797 (44.069)	Top-5 acc 64.844 (68.093)	lr 0.02324
Train [21][1610/3239]	Time 0.443 (0.913)	Data Time 0.001 (0.015)	Loss 3.3866 (3.3563)	Entropy 0.97935 (0.98854)	Top-1 acc 42.188 (44.064)	Top-5 acc 69.531 (68.094)	lr 0.02324
Train [21][1620/3239]	Time 0.609 (0.913)	Data Time 0.001 (0.015)	Loss 3.2132 (3.3561)	Entropy 0.97962 (0.98849)	Top-1 acc 48.828 (44.068)	Top-5 acc 71.484 (68.102)	lr 0.02324
Train [21][1630/3239]	Time 0.590 (0.912)	Data Time 0.001 (0.015)	Loss 3.3450 (3.3560)	Entropy 0.97954 (0.98843)	Top-1 acc 42.969 (44.070)	Top-5 acc 68.359 (68.100)	lr 0.02324
Train [21][1640/3239]	Time 0.613 (0.912)	Data Time 0.001 (0.015)	Loss 3.2845 (3.3563)	Entropy 0.97961 (0.98838)	Top-1 acc 47.656 (44.067)	Top-5 acc 69.141 (68.090)	lr 0.02324
Train [21][1650/3239]	Time 0.606 (0.912)	Data Time 0.001 (0.015)	Loss 3.2509 (3.3560)	Entropy 0.97945 (0.98833)	Top-1 acc 51.172 (44.073)	Top-5 acc 68.750 (68.094)	lr 0.02324
Train [21][1660/3239]	Time 0.604 (0.911)	Data Time 0.001 (0.014)	Loss 3.3370 (3.3559)	Entropy 0.97925 (0.98827)	Top-1 acc 44.922 (44.076)	Top-5 acc 67.188 (68.092)	lr 0.02324
Train [21][1670/3239]	Time 0.565 (0.911)	Data Time 0.001 (0.014)	Loss 3.3842 (3.3560)	Entropy 0.97936 (0.98822)	Top-1 acc 44.141 (44.081)	Top-5 acc 69.922 (68.089)	lr 0.02324
Train [21][1680/3239]	Time 0.675 (0.911)	Data Time 0.001 (0.014)	Loss 3.3252 (3.3560)	Entropy 0.97930 (0.98817)	Top-1 acc 46.094 (44.083)	Top-5 acc 67.578 (68.082)	lr 0.02324
Train [21][1690/3239]	Time 0.586 (0.910)	Data Time 0.001 (0.014)	Loss 3.3956 (3.3559)	Entropy 0.97910 (0.98811)	Top-1 acc 43.750 (44.084)	Top-5 acc 70.312 (68.086)	lr 0.02324
Train [21][1700/3239]	Time 0.614 (0.910)	Data Time 0.001 (0.014)	Loss 3.2380 (3.3557)	Entropy 0.97860 (0.98806)	Top-1 acc 47.266 (44.083)	Top-5 acc 71.484 (68.088)	lr 0.02324
Train [21][1710/3239]	Time 0.564 (0.910)	Data Time 0.001 (0.014)	Loss 3.2403 (3.3556)	Entropy 0.97833 (0.98800)	Top-1 acc 46.094 (44.084)	Top-5 acc 72.656 (68.094)	lr 0.02324
Train [21][1720/3239]	Time 0.621 (0.909)	Data Time 0.001 (0.014)	Loss 3.4113 (3.3555)	Entropy 0.97826 (0.98795)	Top-1 acc 41.016 (44.086)	Top-5 acc 71.484 (68.097)	lr 0.02324
Train [21][1730/3239]	Time 0.591 (0.909)	Data Time 0.001 (0.014)	Loss 3.4477 (3.3553)	Entropy 0.97803 (0.98789)	Top-1 acc 44.531 (44.090)	Top-5 acc 65.625 (68.100)	lr 0.02324
Train [21][1740/3239]	Time 0.574 (0.909)	Data Time 0.001 (0.014)	Loss 3.5523 (3.3551)	Entropy 0.97776 (0.98783)	Top-1 acc 38.281 (44.094)	Top-5 acc 63.281 (68.102)	lr 0.02324
Train [21][1750/3239]	Time 0.702 (0.909)	Data Time 0.001 (0.014)	Loss 3.0595 (3.3549)	Entropy 0.97779 (0.98778)	Top-1 acc 53.125 (44.104)	Top-5 acc 75.391 (68.112)	lr 0.02324
Train [21][1760/3239]	Time 0.628 (0.908)	Data Time 0.001 (0.014)	Loss 3.3335 (3.3546)	Entropy 0.97790 (0.98772)	Top-1 acc 44.531 (44.114)	Top-5 acc 66.016 (68.115)	lr 0.02324
Train [21][1770/3239]	Time 0.604 (0.908)	Data Time 0.002 (0.014)	Loss 3.1749 (3.3542)	Entropy 0.97782 (0.98766)	Top-1 acc 48.828 (44.122)	Top-5 acc 69.531 (68.121)	lr 0.02323
Train [21][1780/3239]	Time 0.623 (0.908)	Data Time 0.001 (0.014)	Loss 3.2786 (3.3541)	Entropy 0.97718 (0.98761)	Top-1 acc 46.094 (44.125)	Top-5 acc 73.047 (68.129)	lr 0.02323
Train [21][1790/3239]	Time 0.587 (0.907)	Data Time 0.001 (0.014)	Loss 3.6101 (3.3542)	Entropy 0.97732 (0.98755)	Top-1 acc 40.234 (44.119)	Top-5 acc 61.719 (68.132)	lr 0.02323
Train [21][1800/3239]	Time 0.575 (0.907)	Data Time 0.001 (0.014)	Loss 3.5195 (3.3542)	Entropy 0.97728 (0.98749)	Top-1 acc 42.578 (44.118)	Top-5 acc 65.234 (68.132)	lr 0.02323
Train [21][1810/3239]	Time 0.589 (0.907)	Data Time 0.001 (0.013)	Loss 3.5448 (3.3542)	Entropy 0.97724 (0.98744)	Top-1 acc 35.938 (44.120)	Top-5 acc 65.234 (68.131)	lr 0.02323
Train [21][1820/3239]	Time 0.635 (0.906)	Data Time 0.001 (0.013)	Loss 3.5288 (3.3544)	Entropy 0.97702 (0.98738)	Top-1 acc 41.016 (44.119)	Top-5 acc 63.281 (68.128)	lr 0.02323
Train [21][1830/3239]	Time 0.551 (0.906)	Data Time 0.001 (0.013)	Loss 3.3260 (3.3545)	Entropy 0.97690 (0.98732)	Top-1 acc 43.359 (44.123)	Top-5 acc 67.969 (68.128)	lr 0.02323
Train [21][1840/3239]	Time 0.586 (0.906)	Data Time 0.001 (0.013)	Loss 3.3481 (3.3544)	Entropy 0.97677 (0.98727)	Top-1 acc 43.750 (44.120)	Top-5 acc 69.141 (68.131)	lr 0.02323
Train [21][1850/3239]	Time 0.613 (0.906)	Data Time 0.001 (0.013)	Loss 3.4468 (3.3550)	Entropy 0.97670 (0.98721)	Top-1 acc 41.016 (44.109)	Top-5 acc 67.188 (68.119)	lr 0.02323
Train [21][1860/3239]	Time 0.565 (0.905)	Data Time 0.001 (0.013)	Loss 3.4580 (3.3551)	Entropy 0.97655 (0.98715)	Top-1 acc 39.844 (44.110)	Top-5 acc 66.406 (68.119)	lr 0.02323
Train [21][1870/3239]	Time 0.572 (0.905)	Data Time 0.001 (0.013)	Loss 3.1981 (3.3552)	Entropy 0.97670 (0.98709)	Top-1 acc 46.094 (44.110)	Top-5 acc 74.609 (68.122)	lr 0.02323
Train [21][1880/3239]	Time 0.612 (0.905)	Data Time 0.001 (0.013)	Loss 3.4572 (3.3553)	Entropy 0.97690 (0.98704)	Top-1 acc 47.656 (44.112)	Top-5 acc 65.234 (68.120)	lr 0.02323
Train [21][1890/3239]	Time 0.598 (0.904)	Data Time 0.001 (0.013)	Loss 3.4106 (3.3554)	Entropy 0.97697 (0.98699)	Top-1 acc 42.969 (44.111)	Top-5 acc 64.844 (68.117)	lr 0.02323
Train [21][1900/3239]	Time 0.597 (0.904)	Data Time 0.001 (0.013)	Loss 3.3992 (3.3553)	Entropy 0.97684 (0.98693)	Top-1 acc 42.969 (44.110)	Top-5 acc 68.750 (68.121)	lr 0.02323
Train [21][1910/3239]	Time 0.758 (0.904)	Data Time 0.001 (0.013)	Loss 3.3863 (3.3555)	Entropy 0.97678 (0.98688)	Top-1 acc 42.969 (44.108)	Top-5 acc 67.969 (68.118)	lr 0.02323
Train [21][1920/3239]	Time 0.562 (0.904)	Data Time 0.001 (0.013)	Loss 3.5990 (3.3553)	Entropy 0.97647 (0.98683)	Top-1 acc 40.625 (44.111)	Top-5 acc 63.672 (68.124)	lr 0.02323
Train [21][1930/3239]	Time 0.610 (0.903)	Data Time 0.001 (0.013)	Loss 3.3594 (3.3558)	Entropy 0.97656 (0.98677)	Top-1 acc 45.703 (44.102)	Top-5 acc 65.234 (68.112)	lr 0.02323
Train [21][1940/3239]	Time 0.574 (0.903)	Data Time 0.001 (0.013)	Loss 3.4831 (3.3558)	Entropy 0.97652 (0.98672)	Top-1 acc 39.844 (44.102)	Top-5 acc 66.406 (68.112)	lr 0.02323
Train [21][1950/3239]	Time 0.621 (0.903)	Data Time 0.001 (0.013)	Loss 3.4793 (3.3556)	Entropy 0.97649 (0.98667)	Top-1 acc 43.359 (44.104)	Top-5 acc 65.234 (68.115)	lr 0.02323
Train [21][1960/3239]	Time 0.535 (0.902)	Data Time 0.002 (0.013)	Loss 3.5125 (3.3557)	Entropy 0.97631 (0.98662)	Top-1 acc 41.016 (44.105)	Top-5 acc 64.844 (68.110)	lr 0.02322
Train [21][1970/3239]	Time 0.587 (0.902)	Data Time 0.001 (0.013)	Loss 3.2706 (3.3560)	Entropy 0.97662 (0.98656)	Top-1 acc 41.016 (44.100)	Top-5 acc 69.141 (68.104)	lr 0.02322
Train [21][1980/3239]	Time 0.726 (0.913)	Data Time 0.005 (0.012)	Loss 3.3378 (3.3558)	Entropy 0.97652 (0.98651)	Top-1 acc 44.141 (44.107)	Top-5 acc 69.531 (68.109)	lr 0.02322
Train [21][1990/3239]	Time 0.577 (0.913)	Data Time 0.002 (0.012)	Loss 3.2187 (3.3554)	Entropy 0.97630 (0.98646)	Top-1 acc 47.656 (44.117)	Top-5 acc 69.141 (68.114)	lr 0.02322
Train [21][2000/3239]	Time 0.586 (0.913)	Data Time 0.001 (0.012)	Loss 3.3992 (3.3557)	Entropy 0.97598 (0.98641)	Top-1 acc 47.656 (44.120)	Top-5 acc 63.672 (68.106)	lr 0.02322
Train [21][2010/3239]	Time 0.619 (0.912)	Data Time 0.002 (0.012)	Loss 3.4396 (3.3555)	Entropy 0.97582 (0.98636)	Top-1 acc 38.281 (44.121)	Top-5 acc 65.625 (68.108)	lr 0.02322
Train [21][2020/3239]	Time 0.571 (0.912)	Data Time 0.001 (0.012)	Loss 3.4940 (3.3554)	Entropy 0.97580 (0.98631)	Top-1 acc 40.625 (44.123)	Top-5 acc 64.062 (68.111)	lr 0.02322
Train [21][2030/3239]	Time 0.601 (0.912)	Data Time 0.001 (0.012)	Loss 3.4214 (3.3551)	Entropy 0.97578 (0.98626)	Top-1 acc 39.844 (44.128)	Top-5 acc 67.578 (68.113)	lr 0.02322
Train [21][2040/3239]	Time 0.583 (0.912)	Data Time 0.001 (0.012)	Loss 3.4049 (3.3554)	Entropy 0.97531 (0.98620)	Top-1 acc 41.797 (44.125)	Top-5 acc 67.188 (68.111)	lr 0.02322
Train [21][2050/3239]	Time 0.590 (0.911)	Data Time 0.001 (0.012)	Loss 3.3914 (3.3549)	Entropy 0.97518 (0.98615)	Top-1 acc 40.625 (44.128)	Top-5 acc 66.406 (68.125)	lr 0.02322
Train [21][2060/3239]	Time 0.608 (0.911)	Data Time 0.001 (0.012)	Loss 3.3909 (3.3550)	Entropy 0.97477 (0.98610)	Top-1 acc 40.234 (44.120)	Top-5 acc 66.406 (68.125)	lr 0.02322
Train [21][2070/3239]	Time 0.684 (0.911)	Data Time 0.002 (0.012)	Loss 3.1965 (3.3550)	Entropy 0.97469 (0.98604)	Top-1 acc 48.047 (44.123)	Top-5 acc 70.703 (68.121)	lr 0.02322
Train [21][2080/3239]	Time 0.614 (0.910)	Data Time 0.001 (0.012)	Loss 3.2330 (3.3550)	Entropy 0.97418 (0.98599)	Top-1 acc 49.219 (44.126)	Top-5 acc 69.531 (68.122)	lr 0.02322
Train [21][2090/3239]	Time 0.617 (0.910)	Data Time 0.001 (0.012)	Loss 3.3170 (3.3551)	Entropy 0.97402 (0.98593)	Top-1 acc 43.359 (44.122)	Top-5 acc 70.703 (68.120)	lr 0.02322
Train [21][2100/3239]	Time 0.588 (0.910)	Data Time 0.001 (0.012)	Loss 3.4617 (3.3553)	Entropy 0.97393 (0.98587)	Top-1 acc 45.312 (44.116)	Top-5 acc 65.625 (68.110)	lr 0.02322
Train [21][2110/3239]	Time 0.618 (0.909)	Data Time 0.001 (0.012)	Loss 3.4376 (3.3552)	Entropy 0.97348 (0.98582)	Top-1 acc 42.188 (44.119)	Top-5 acc 65.625 (68.114)	lr 0.02322
Train [21][2120/3239]	Time 0.572 (0.909)	Data Time 0.001 (0.012)	Loss 3.3766 (3.3552)	Entropy 0.97331 (0.98576)	Top-1 acc 41.797 (44.115)	Top-5 acc 67.188 (68.115)	lr 0.02322
Train [21][2130/3239]	Time 0.574 (0.909)	Data Time 0.001 (0.012)	Loss 3.3752 (3.3551)	Entropy 0.97299 (0.98570)	Top-1 acc 42.578 (44.118)	Top-5 acc 67.969 (68.114)	lr 0.02322
Train [21][2140/3239]	Time 0.715 (0.909)	Data Time 0.001 (0.012)	Loss 3.4461 (3.3552)	Entropy 0.97291 (0.98564)	Top-1 acc 41.797 (44.118)	Top-5 acc 67.188 (68.110)	lr 0.02322
Train [21][2150/3239]	Time 0.620 (0.908)	Data Time 0.001 (0.012)	Loss 3.2505 (3.3552)	Entropy 0.97279 (0.98558)	Top-1 acc 46.094 (44.113)	Top-5 acc 70.703 (68.106)	lr 0.02322
Train [21][2160/3239]	Time 0.603 (0.908)	Data Time 0.001 (0.012)	Loss 3.1767 (3.3551)	Entropy 0.97242 (0.98552)	Top-1 acc 50.781 (44.117)	Top-5 acc 69.141 (68.108)	lr 0.02321
Train [21][2170/3239]	Time 0.609 (0.908)	Data Time 0.001 (0.012)	Loss 3.4025 (3.3552)	Entropy 0.97260 (0.98546)	Top-1 acc 41.797 (44.114)	Top-5 acc 66.797 (68.102)	lr 0.02321
Train [21][2180/3239]	Time 0.595 (0.908)	Data Time 0.001 (0.012)	Loss 3.2605 (3.3548)	Entropy 0.97259 (0.98540)	Top-1 acc 50.781 (44.121)	Top-5 acc 71.094 (68.109)	lr 0.02321
Train [21][2190/3239]	Time 0.625 (0.908)	Data Time 0.001 (0.011)	Loss 3.1956 (3.3547)	Entropy 0.97220 (0.98534)	Top-1 acc 49.609 (44.121)	Top-5 acc 71.094 (68.110)	lr 0.02321
Train [21][2200/3239]	Time 0.593 (0.907)	Data Time 0.001 (0.011)	Loss 3.2835 (3.3544)	Entropy 0.97257 (0.98528)	Top-1 acc 44.141 (44.126)	Top-5 acc 69.531 (68.115)	lr 0.02321
Train [21][2210/3239]	Time 0.595 (0.907)	Data Time 0.001 (0.011)	Loss 3.3747 (3.3543)	Entropy 0.97241 (0.98523)	Top-1 acc 41.797 (44.134)	Top-5 acc 67.188 (68.121)	lr 0.02321
Train [21][2220/3239]	Time 0.594 (0.907)	Data Time 0.001 (0.011)	Loss 3.1023 (3.3543)	Entropy 0.97266 (0.98517)	Top-1 acc 49.609 (44.133)	Top-5 acc 73.828 (68.123)	lr 0.02321
Train [21][2230/3239]	Time 0.670 (0.907)	Data Time 0.001 (0.011)	Loss 3.3017 (3.3542)	Entropy 0.97296 (0.98511)	Top-1 acc 41.797 (44.132)	Top-5 acc 71.484 (68.126)	lr 0.02321
Train [21][2240/3239]	Time 0.597 (0.907)	Data Time 0.001 (0.011)	Loss 3.1924 (3.3542)	Entropy 0.97269 (0.98506)	Top-1 acc 48.047 (44.132)	Top-5 acc 73.047 (68.126)	lr 0.02321
Train [21][2250/3239]	Time 0.608 (0.906)	Data Time 0.001 (0.011)	Loss 3.3156 (3.3543)	Entropy 0.97247 (0.98500)	Top-1 acc 47.656 (44.134)	Top-5 acc 67.188 (68.119)	lr 0.02321
Train [21][2260/3239]	Time 0.554 (0.906)	Data Time 0.001 (0.011)	Loss 3.3806 (3.3543)	Entropy 0.97222 (0.98495)	Top-1 acc 43.359 (44.137)	Top-5 acc 69.531 (68.118)	lr 0.02321
Train [21][2270/3239]	Time 0.613 (0.906)	Data Time 0.001 (0.011)	Loss 3.5248 (3.3545)	Entropy 0.97240 (0.98489)	Top-1 acc 40.234 (44.134)	Top-5 acc 64.062 (68.111)	lr 0.02321
Train [21][2280/3239]	Time 0.607 (0.906)	Data Time 0.001 (0.011)	Loss 3.4463 (3.3542)	Entropy 0.97291 (0.98484)	Top-1 acc 44.922 (44.145)	Top-5 acc 65.234 (68.114)	lr 0.02321
Train [21][2290/3239]	Time 0.639 (0.905)	Data Time 0.001 (0.011)	Loss 3.4229 (3.3542)	Entropy 0.97306 (0.98479)	Top-1 acc 46.875 (44.144)	Top-5 acc 67.188 (68.117)	lr 0.02321
Train [21][2300/3239]	Time 0.719 (0.905)	Data Time 0.001 (0.011)	Loss 3.2539 (3.3542)	Entropy 0.97305 (0.98473)	Top-1 acc 44.141 (44.149)	Top-5 acc 70.312 (68.120)	lr 0.02321
Train [21][2310/3239]	Time 0.530 (0.905)	Data Time 0.001 (0.011)	Loss 3.5828 (3.3541)	Entropy 0.97294 (0.98468)	Top-1 acc 34.375 (44.142)	Top-5 acc 62.109 (68.123)	lr 0.02321
Train [21][2320/3239]	Time 0.594 (0.905)	Data Time 0.001 (0.011)	Loss 3.3867 (3.3540)	Entropy 0.97240 (0.98463)	Top-1 acc 39.453 (44.144)	Top-5 acc 67.188 (68.125)	lr 0.02321
Train [21][2330/3239]	Time 0.615 (0.904)	Data Time 0.001 (0.011)	Loss 3.1130 (3.3539)	Entropy 0.97235 (0.98458)	Top-1 acc 49.219 (44.146)	Top-5 acc 72.656 (68.127)	lr 0.02321
Train [21][2340/3239]	Time 0.600 (0.904)	Data Time 0.001 (0.011)	Loss 3.2843 (3.3537)	Entropy 0.97198 (0.98453)	Top-1 acc 45.703 (44.149)	Top-5 acc 71.094 (68.131)	lr 0.02321
Train [21][2350/3239]	Time 0.634 (0.904)	Data Time 0.001 (0.011)	Loss 3.3188 (3.3534)	Entropy 0.97149 (0.98447)	Top-1 acc 44.922 (44.159)	Top-5 acc 67.969 (68.134)	lr 0.02320
Train [21][2360/3239]	Time 0.606 (0.904)	Data Time 0.002 (0.011)	Loss 3.2149 (3.3534)	Entropy 0.97138 (0.98442)	Top-1 acc 46.094 (44.162)	Top-5 acc 72.656 (68.131)	lr 0.02320
Train [21][2370/3239]	Time 0.689 (0.904)	Data Time 0.001 (0.011)	Loss 3.4127 (3.3533)	Entropy 0.97157 (0.98436)	Top-1 acc 44.531 (44.161)	Top-5 acc 65.625 (68.129)	lr 0.02320
Train [21][2380/3239]	Time 0.557 (0.903)	Data Time 0.001 (0.011)	Loss 3.2468 (3.3531)	Entropy 0.97181 (0.98431)	Top-1 acc 46.875 (44.165)	Top-5 acc 70.312 (68.136)	lr 0.02320
Train [21][2390/3239]	Time 0.604 (0.903)	Data Time 0.002 (0.011)	Loss 3.2041 (3.3530)	Entropy 0.97131 (0.98425)	Top-1 acc 47.266 (44.165)	Top-5 acc 70.312 (68.140)	lr 0.02320
Train [21][2400/3239]	Time 0.598 (0.903)	Data Time 0.001 (0.011)	Loss 3.5031 (3.3529)	Entropy 0.97103 (0.98420)	Top-1 acc 41.797 (44.166)	Top-5 acc 62.109 (68.139)	lr 0.02320
Train [21][2410/3239]	Time 0.677 (0.903)	Data Time 0.001 (0.011)	Loss 3.3127 (3.3530)	Entropy 0.97102 (0.98415)	Top-1 acc 47.266 (44.163)	Top-5 acc 70.312 (68.136)	lr 0.02320
Train [21][2420/3239]	Time 0.619 (0.903)	Data Time 0.001 (0.011)	Loss 3.5258 (3.3532)	Entropy 0.97089 (0.98409)	Top-1 acc 41.016 (44.157)	Top-5 acc 64.844 (68.131)	lr 0.02320
Train [21][2430/3239]	Time 0.546 (0.902)	Data Time 0.001 (0.011)	Loss 3.4908 (3.3531)	Entropy 0.97066 (0.98404)	Top-1 acc 41.406 (44.155)	Top-5 acc 63.281 (68.134)	lr 0.02320
Train [21][2440/3239]	Time 0.592 (0.902)	Data Time 0.001 (0.010)	Loss 3.3748 (3.3530)	Entropy 0.97059 (0.98398)	Top-1 acc 44.922 (44.159)	Top-5 acc 69.141 (68.133)	lr 0.02320
Train [21][2450/3239]	Time 0.571 (0.902)	Data Time 0.001 (0.010)	Loss 3.3154 (3.3531)	Entropy 0.97069 (0.98393)	Top-1 acc 41.797 (44.163)	Top-5 acc 71.094 (68.134)	lr 0.02320
Train [21][2460/3239]	Time 0.662 (0.902)	Data Time 0.001 (0.010)	Loss 3.5675 (3.3531)	Entropy 0.97039 (0.98387)	Top-1 acc 38.672 (44.163)	Top-5 acc 62.500 (68.132)	lr 0.02320
Train [21][2470/3239]	Time 0.648 (0.901)	Data Time 0.001 (0.010)	Loss 3.3315 (3.3532)	Entropy 0.97032 (0.98382)	Top-1 acc 46.875 (44.164)	Top-5 acc 65.625 (68.133)	lr 0.02320
Train [21][2480/3239]	Time 0.567 (0.901)	Data Time 0.001 (0.010)	Loss 3.3811 (3.3532)	Entropy 0.97012 (0.98376)	Top-1 acc 45.703 (44.166)	Top-5 acc 67.188 (68.135)	lr 0.02320
Train [21][2490/3239]	Time 0.627 (0.901)	Data Time 0.001 (0.010)	Loss 3.4716 (3.3531)	Entropy 0.97042 (0.98371)	Top-1 acc 40.625 (44.172)	Top-5 acc 66.797 (68.139)	lr 0.02320
Train [21][2500/3239]	Time 0.615 (0.901)	Data Time 0.001 (0.010)	Loss 3.3881 (3.3532)	Entropy 0.97031 (0.98366)	Top-1 acc 43.359 (44.169)	Top-5 acc 67.969 (68.140)	lr 0.02320
Train [21][2510/3239]	Time 0.586 (0.901)	Data Time 0.001 (0.010)	Loss 3.3041 (3.3530)	Entropy 0.97001 (0.98360)	Top-1 acc 43.750 (44.176)	Top-5 acc 69.141 (68.143)	lr 0.02320
Train [21][2520/3239]	Time 0.626 (0.901)	Data Time 0.001 (0.010)	Loss 3.3131 (3.3530)	Entropy 0.96992 (0.98355)	Top-1 acc 45.703 (44.182)	Top-5 acc 69.141 (68.143)	lr 0.02320
Train [21][2530/3239]	Time 0.662 (0.901)	Data Time 0.001 (0.010)	Loss 3.5721 (3.3531)	Entropy 0.96993 (0.98349)	Top-1 acc 40.234 (44.182)	Top-5 acc 59.375 (68.135)	lr 0.02320
Train [21][2540/3239]	Time 0.597 (0.900)	Data Time 0.001 (0.010)	Loss 3.1275 (3.3527)	Entropy 0.96979 (0.98344)	Top-1 acc 50.000 (44.193)	Top-5 acc 71.875 (68.142)	lr 0.02319
Train [21][2550/3239]	Time 0.601 (0.900)	Data Time 0.001 (0.010)	Loss 3.3143 (3.3525)	Entropy 0.97015 (0.98339)	Top-1 acc 46.484 (44.195)	Top-5 acc 69.922 (68.146)	lr 0.02319
Train [21][2560/3239]	Time 0.619 (0.900)	Data Time 0.001 (0.010)	Loss 3.3469 (3.3526)	Entropy 0.97001 (0.98334)	Top-1 acc 45.312 (44.194)	Top-5 acc 71.094 (68.147)	lr 0.02319
Train [21][2570/3239]	Time 0.604 (0.900)	Data Time 0.001 (0.010)	Loss 3.3099 (3.3525)	Entropy 0.96993 (0.98329)	Top-1 acc 44.141 (44.198)	Top-5 acc 69.922 (68.150)	lr 0.02319
Train [21][2580/3239]	Time 0.624 (0.900)	Data Time 0.001 (0.010)	Loss 3.5329 (3.3529)	Entropy 0.96947 (0.98323)	Top-1 acc 44.922 (44.190)	Top-5 acc 63.281 (68.140)	lr 0.02319
Train [21][2590/3239]	Time 0.608 (0.900)	Data Time 0.001 (0.010)	Loss 3.1085 (3.3528)	Entropy 0.96956 (0.98318)	Top-1 acc 50.391 (44.191)	Top-5 acc 73.828 (68.142)	lr 0.02319
Train [21][2600/3239]	Time 0.564 (0.899)	Data Time 0.001 (0.010)	Loss 3.5517 (3.3529)	Entropy 0.96944 (0.98313)	Top-1 acc 41.797 (44.191)	Top-5 acc 63.672 (68.144)	lr 0.02319
Train [21][2610/3239]	Time 0.558 (0.899)	Data Time 0.001 (0.010)	Loss 3.3890 (3.3529)	Entropy 0.96906 (0.98308)	Top-1 acc 44.531 (44.190)	Top-5 acc 66.406 (68.145)	lr 0.02319
Train [21][2620/3239]	Time 0.595 (0.899)	Data Time 0.001 (0.010)	Loss 3.1704 (3.3532)	Entropy 0.96896 (0.98302)	Top-1 acc 49.609 (44.185)	Top-5 acc 69.922 (68.143)	lr 0.02319
Train [21][2630/3239]	Time 0.596 (0.898)	Data Time 0.001 (0.010)	Loss 3.4964 (3.3532)	Entropy 0.96901 (0.98297)	Top-1 acc 39.453 (44.180)	Top-5 acc 66.797 (68.143)	lr 0.02319
Train [21][2640/3239]	Time 0.601 (0.907)	Data Time 0.002 (0.010)	Loss 3.4184 (3.3533)	Entropy 0.96883 (0.98291)	Top-1 acc 40.234 (44.177)	Top-5 acc 66.016 (68.140)	lr 0.02319
Train [21][2650/3239]	Time 0.580 (0.907)	Data Time 0.002 (0.010)	Loss 3.5650 (3.3535)	Entropy 0.96865 (0.98286)	Top-1 acc 41.797 (44.177)	Top-5 acc 66.406 (68.134)	lr 0.02319
Train [21][2660/3239]	Time 0.610 (0.907)	Data Time 0.002 (0.010)	Loss 3.3027 (3.3534)	Entropy 0.96897 (0.98281)	Top-1 acc 45.703 (44.181)	Top-5 acc 69.531 (68.136)	lr 0.02319
Train [21][2670/3239]	Time 0.644 (0.906)	Data Time 0.003 (0.010)	Loss 3.4068 (3.3534)	Entropy 0.96919 (0.98276)	Top-1 acc 40.625 (44.178)	Top-5 acc 66.016 (68.136)	lr 0.02319
Train [21][2680/3239]	Time 0.596 (0.906)	Data Time 0.001 (0.010)	Loss 3.2021 (3.3535)	Entropy 0.96896 (0.98271)	Top-1 acc 48.438 (44.174)	Top-5 acc 70.703 (68.136)	lr 0.02319
Train [21][2690/3239]	Time 0.716 (0.906)	Data Time 0.001 (0.010)	Loss 3.3841 (3.3535)	Entropy 0.96951 (0.98265)	Top-1 acc 43.750 (44.175)	Top-5 acc 66.016 (68.136)	lr 0.02319
Train [21][2700/3239]	Time 0.654 (0.906)	Data Time 0.001 (0.010)	Loss 3.4127 (3.3538)	Entropy 0.96962 (0.98261)	Top-1 acc 44.922 (44.168)	Top-5 acc 67.578 (68.129)	lr 0.02319
Train [21][2710/3239]	Time 0.637 (0.906)	Data Time 0.001 (0.010)	Loss 3.3069 (3.3538)	Entropy 0.96971 (0.98256)	Top-1 acc 43.359 (44.165)	Top-5 acc 71.875 (68.128)	lr 0.02319
Train [21][2720/3239]	Time 0.616 (0.906)	Data Time 0.001 (0.010)	Loss 3.4830 (3.3537)	Entropy 0.96974 (0.98251)	Top-1 acc 43.359 (44.166)	Top-5 acc 66.406 (68.130)	lr 0.02319
Train [21][2730/3239]	Time 0.602 (0.905)	Data Time 0.001 (0.010)	Loss 3.4325 (3.3539)	Entropy 0.96932 (0.98246)	Top-1 acc 42.188 (44.158)	Top-5 acc 69.141 (68.129)	lr 0.02318
Train [21][2740/3239]	Time 0.652 (0.905)	Data Time 0.001 (0.010)	Loss 3.4073 (3.3538)	Entropy 0.96881 (0.98242)	Top-1 acc 44.141 (44.160)	Top-5 acc 64.453 (68.128)	lr 0.02318
Train [21][2750/3239]	Time 0.590 (0.905)	Data Time 0.004 (0.010)	Loss 3.3337 (3.3536)	Entropy 0.96860 (0.98237)	Top-1 acc 44.922 (44.165)	Top-5 acc 68.359 (68.132)	lr 0.02318
Train [21][2760/3239]	Time 0.611 (0.905)	Data Time 0.001 (0.010)	Loss 3.5327 (3.3537)	Entropy 0.96864 (0.98232)	Top-1 acc 42.188 (44.159)	Top-5 acc 63.281 (68.131)	lr 0.02318
Train [21][2770/3239]	Time 0.597 (0.904)	Data Time 0.001 (0.009)	Loss 3.3104 (3.3538)	Entropy 0.96894 (0.98227)	Top-1 acc 40.625 (44.153)	Top-5 acc 68.750 (68.129)	lr 0.02318
Train [21][2780/3239]	Time 0.633 (0.904)	Data Time 0.034 (0.009)	Loss 3.3952 (3.3538)	Entropy 0.96860 (0.98222)	Top-1 acc 45.312 (44.156)	Top-5 acc 67.578 (68.128)	lr 0.02318
Train [21][2790/3239]	Time 0.615 (0.904)	Data Time 0.001 (0.009)	Loss 3.3177 (3.3539)	Entropy 0.96800 (0.98217)	Top-1 acc 43.750 (44.148)	Top-5 acc 68.750 (68.126)	lr 0.02318
Train [21][2800/3239]	Time 0.630 (0.904)	Data Time 0.001 (0.009)	Loss 3.2973 (3.3539)	Entropy 0.96758 (0.98212)	Top-1 acc 46.875 (44.151)	Top-5 acc 71.484 (68.129)	lr 0.02318
Train [21][2810/3239]	Time 0.631 (0.904)	Data Time 0.001 (0.009)	Loss 3.1818 (3.3538)	Entropy 0.96786 (0.98207)	Top-1 acc 51.172 (44.156)	Top-5 acc 71.484 (68.130)	lr 0.02318
Train [21][2820/3239]	Time 0.614 (0.904)	Data Time 0.001 (0.009)	Loss 3.2055 (3.3535)	Entropy 0.96807 (0.98202)	Top-1 acc 48.047 (44.163)	Top-5 acc 74.609 (68.136)	lr 0.02318
Train [21][2830/3239]	Time 0.593 (0.903)	Data Time 0.001 (0.009)	Loss 3.3544 (3.3534)	Entropy 0.96807 (0.98197)	Top-1 acc 42.188 (44.169)	Top-5 acc 67.969 (68.138)	lr 0.02318
Train [21][2840/3239]	Time 0.633 (0.903)	Data Time 0.001 (0.009)	Loss 3.1840 (3.3533)	Entropy 0.96796 (0.98192)	Top-1 acc 50.391 (44.175)	Top-5 acc 69.922 (68.137)	lr 0.02318
Train [21][2850/3239]	Time 0.727 (0.903)	Data Time 0.001 (0.009)	Loss 3.3549 (3.3532)	Entropy 0.96807 (0.98187)	Top-1 acc 46.094 (44.175)	Top-5 acc 69.141 (68.139)	lr 0.02318
Train [21][2860/3239]	Time 0.604 (0.903)	Data Time 0.001 (0.009)	Loss 3.3869 (3.3530)	Entropy 0.96819 (0.98182)	Top-1 acc 43.359 (44.177)	Top-5 acc 69.141 (68.144)	lr 0.02318
Train [21][2870/3239]	Time 0.536 (0.903)	Data Time 0.001 (0.009)	Loss 3.2276 (3.3529)	Entropy 0.96780 (0.98177)	Top-1 acc 49.219 (44.181)	Top-5 acc 71.875 (68.146)	lr 0.02318
Train [21][2880/3239]	Time 0.605 (0.903)	Data Time 0.001 (0.009)	Loss 3.3509 (3.3529)	Entropy 0.96751 (0.98172)	Top-1 acc 46.094 (44.179)	Top-5 acc 65.625 (68.147)	lr 0.02318
Train [21][2890/3239]	Time 0.660 (0.903)	Data Time 0.001 (0.009)	Loss 3.4076 (3.3529)	Entropy 0.96735 (0.98167)	Top-1 acc 39.844 (44.178)	Top-5 acc 69.141 (68.148)	lr 0.02318
Train [21][2900/3239]	Time 0.605 (0.902)	Data Time 0.002 (0.009)	Loss 3.6027 (3.3532)	Entropy 0.96720 (0.98162)	Top-1 acc 39.062 (44.173)	Top-5 acc 63.281 (68.140)	lr 0.02318
Train [21][2910/3239]	Time 0.626 (0.902)	Data Time 0.001 (0.009)	Loss 3.3950 (3.3532)	Entropy 0.96719 (0.98157)	Top-1 acc 47.266 (44.177)	Top-5 acc 67.578 (68.139)	lr 0.02318
Train [21][2920/3239]	Time 0.701 (0.902)	Data Time 0.001 (0.009)	Loss 3.3211 (3.3532)	Entropy 0.96703 (0.98153)	Top-1 acc 44.922 (44.176)	Top-5 acc 68.359 (68.140)	lr 0.02317
Train [21][2930/3239]	Time 0.604 (0.902)	Data Time 0.001 (0.009)	Loss 3.2476 (3.3532)	Entropy 0.96696 (0.98148)	Top-1 acc 50.391 (44.174)	Top-5 acc 71.094 (68.135)	lr 0.02317
Train [21][2940/3239]	Time 0.590 (0.902)	Data Time 0.001 (0.009)	Loss 3.2906 (3.3529)	Entropy 0.96672 (0.98143)	Top-1 acc 46.094 (44.181)	Top-5 acc 68.359 (68.142)	lr 0.02317
Train [21][2950/3239]	Time 0.605 (0.901)	Data Time 0.001 (0.009)	Loss 3.0324 (3.3530)	Entropy 0.96603 (0.98137)	Top-1 acc 52.734 (44.178)	Top-5 acc 72.656 (68.141)	lr 0.02317
Train [21][2960/3239]	Time 0.600 (0.901)	Data Time 0.001 (0.009)	Loss 3.1738 (3.3532)	Entropy 0.96585 (0.98132)	Top-1 acc 44.922 (44.172)	Top-5 acc 72.266 (68.137)	lr 0.02317
Train [21][2970/3239]	Time 0.603 (0.901)	Data Time 0.001 (0.009)	Loss 3.4743 (3.3533)	Entropy 0.96569 (0.98127)	Top-1 acc 43.359 (44.171)	Top-5 acc 66.016 (68.133)	lr 0.02317
Train [21][2980/3239]	Time 0.621 (0.901)	Data Time 0.001 (0.009)	Loss 3.2747 (3.3535)	Entropy 0.96545 (0.98122)	Top-1 acc 46.484 (44.165)	Top-5 acc 70.703 (68.127)	lr 0.02317
Train [21][2990/3239]	Time 0.591 (0.901)	Data Time 0.001 (0.009)	Loss 3.4860 (3.3534)	Entropy 0.96522 (0.98116)	Top-1 acc 43.359 (44.167)	Top-5 acc 62.109 (68.131)	lr 0.02317
Train [21][3000/3239]	Time 0.576 (0.901)	Data Time 0.001 (0.009)	Loss 3.2608 (3.3532)	Entropy 0.96495 (0.98111)	Top-1 acc 46.094 (44.171)	Top-5 acc 70.312 (68.134)	lr 0.02317
Train [21][3010/3239]	Time 0.647 (0.901)	Data Time 0.001 (0.009)	Loss 3.2546 (3.3531)	Entropy 0.96516 (0.98106)	Top-1 acc 47.266 (44.171)	Top-5 acc 69.141 (68.140)	lr 0.02317
Train [21][3020/3239]	Time 0.640 (0.901)	Data Time 0.002 (0.009)	Loss 3.4226 (3.3533)	Entropy 0.96488 (0.98100)	Top-1 acc 45.312 (44.168)	Top-5 acc 67.969 (68.137)	lr 0.02317
Train [21][3030/3239]	Time 0.620 (0.900)	Data Time 0.001 (0.009)	Loss 3.4624 (3.3532)	Entropy 0.96492 (0.98095)	Top-1 acc 39.062 (44.170)	Top-5 acc 66.797 (68.138)	lr 0.02317
Train [21][3040/3239]	Time 0.630 (0.900)	Data Time 0.001 (0.009)	Loss 3.2564 (3.3530)	Entropy 0.96482 (0.98090)	Top-1 acc 50.391 (44.174)	Top-5 acc 72.656 (68.139)	lr 0.02317
Train [21][3050/3239]	Time 0.595 (0.900)	Data Time 0.001 (0.009)	Loss 3.2623 (3.3531)	Entropy 0.96435 (0.98085)	Top-1 acc 47.266 (44.175)	Top-5 acc 71.094 (68.137)	lr 0.02317
Train [21][3060/3239]	Time 0.618 (0.900)	Data Time 0.001 (0.009)	Loss 3.4521 (3.3529)	Entropy 0.96434 (0.98079)	Top-1 acc 41.016 (44.180)	Top-5 acc 67.969 (68.140)	lr 0.02317
Train [21][3070/3239]	Time 0.565 (0.900)	Data Time 0.001 (0.009)	Loss 3.3574 (3.3532)	Entropy 0.96424 (0.98074)	Top-1 acc 41.797 (44.171)	Top-5 acc 67.188 (68.136)	lr 0.02317
Train [21][3080/3239]	Time 0.700 (0.900)	Data Time 0.001 (0.009)	Loss 3.4990 (3.3534)	Entropy 0.96381 (0.98068)	Top-1 acc 43.359 (44.168)	Top-5 acc 62.109 (68.132)	lr 0.02317
Train [21][3090/3239]	Time 0.578 (0.899)	Data Time 0.001 (0.009)	Loss 3.5718 (3.3534)	Entropy 0.96326 (0.98063)	Top-1 acc 39.844 (44.168)	Top-5 acc 61.328 (68.130)	lr 0.02317
Train [21][3100/3239]	Time 0.570 (0.899)	Data Time 0.001 (0.009)	Loss 3.3291 (3.3534)	Entropy 0.96306 (0.98057)	Top-1 acc 48.438 (44.170)	Top-5 acc 66.797 (68.129)	lr 0.02317
Train [21][3110/3239]	Time 0.584 (0.899)	Data Time 0.001 (0.009)	Loss 3.4160 (3.3533)	Entropy 0.96336 (0.98052)	Top-1 acc 42.969 (44.172)	Top-5 acc 66.406 (68.128)	lr 0.02316
Train [21][3120/3239]	Time 0.611 (0.899)	Data Time 0.001 (0.009)	Loss 3.4054 (3.3530)	Entropy 0.96316 (0.98046)	Top-1 acc 42.969 (44.178)	Top-5 acc 65.234 (68.131)	lr 0.02316
Train [21][3130/3239]	Time 0.571 (0.899)	Data Time 0.001 (0.009)	Loss 3.2913 (3.3530)	Entropy 0.96334 (0.98041)	Top-1 acc 44.922 (44.179)	Top-5 acc 71.484 (68.134)	lr 0.02316
Train [21][3140/3239]	Time 0.616 (0.899)	Data Time 0.001 (0.009)	Loss 3.2016 (3.3530)	Entropy 0.96341 (0.98035)	Top-1 acc 50.391 (44.182)	Top-5 acc 73.828 (68.138)	lr 0.02316
Train [21][3150/3239]	Time 0.630 (0.898)	Data Time 0.001 (0.009)	Loss 3.2479 (3.3529)	Entropy 0.96340 (0.98030)	Top-1 acc 44.531 (44.181)	Top-5 acc 67.969 (68.142)	lr 0.02316
Train [21][3160/3239]	Time 0.566 (0.898)	Data Time 0.001 (0.009)	Loss 3.4193 (3.3528)	Entropy 0.96381 (0.98025)	Top-1 acc 44.531 (44.186)	Top-5 acc 64.453 (68.143)	lr 0.02316
Train [21][3170/3239]	Time 0.692 (0.898)	Data Time 0.001 (0.009)	Loss 3.2584 (3.3528)	Entropy 0.96383 (0.98019)	Top-1 acc 45.312 (44.183)	Top-5 acc 72.656 (68.145)	lr 0.02316
Train [21][3180/3239]	Time 0.587 (0.898)	Data Time 0.000 (0.009)	Loss 3.1960 (3.3527)	Entropy 0.96390 (0.98014)	Top-1 acc 50.000 (44.186)	Top-5 acc 72.656 (68.146)	lr 0.02316
Train [21][3190/3239]	Time 0.595 (0.898)	Data Time 0.000 (0.009)	Loss 3.3786 (3.3527)	Entropy 0.96366 (0.98009)	Top-1 acc 43.750 (44.187)	Top-5 acc 66.016 (68.147)	lr 0.02316
Train [21][3200/3239]	Time 0.562 (0.898)	Data Time 0.000 (0.008)	Loss 3.4289 (3.3526)	Entropy 0.96359 (0.98004)	Top-1 acc 45.703 (44.189)	Top-5 acc 66.016 (68.149)	lr 0.02316
Train [21][3210/3239]	Time 0.617 (0.898)	Data Time 0.000 (0.008)	Loss 3.2947 (3.3526)	Entropy 0.96357 (0.97999)	Top-1 acc 47.266 (44.191)	Top-5 acc 69.141 (68.148)	lr 0.02316
Train [21][3220/3239]	Time 0.605 (0.897)	Data Time 0.000 (0.008)	Loss 3.4739 (3.3527)	Entropy 0.96363 (0.97994)	Top-1 acc 42.578 (44.193)	Top-5 acc 66.406 (68.146)	lr 0.02316
Train [21][3230/3239]	Time 0.576 (0.897)	Data Time 0.000 (0.008)	Loss 3.2774 (3.3526)	Entropy 0.96367 (0.97989)	Top-1 acc 44.531 (44.195)	Top-5 acc 69.922 (68.147)	lr 0.02316
Train [21][3239/3239]	Time 1.451 (0.897)	Data Time 0.000 (0.008)	Loss 3.4139 (3.3525)	Entropy 0.96342 (0.97984)	Top-1 acc 39.506 (44.198)	Top-5 acc 67.901 (68.149)	lr 0.02316
==========Valid [21/120]	loss 2.085	top-1 acc 54.030 (54.030)	top-5 acc 77.326	Train top-1 44.198	top-5 68.149	Entropy 0.96342	Latency-None: 0.000ms	Flops: 539.76M
Train [22][0/3239]	Time 22.841 (22.841)	Data Time 21.423 (21.423)	Loss 3.0984 (3.0984)	Entropy 0.96328 (0.96328)	Top-1 acc 47.656 (47.656)	Top-5 acc 72.266 (72.266)	lr 0.02316
Train [22][10/3239]	Time 0.593 (2.890)	Data Time 0.001 (1.949)	Loss 3.1529 (3.2500)	Entropy 0.96320 (0.96329)	Top-1 acc 47.266 (46.058)	Top-5 acc 69.141 (69.673)	lr 0.02316
Train [22][20/3239]	Time 0.586 (1.918)	Data Time 0.001 (1.022)	Loss 3.1661 (3.2940)	Entropy 0.96328 (0.96326)	Top-1 acc 47.656 (44.996)	Top-5 acc 69.531 (69.029)	lr 0.02316
Train [22][30/3239]	Time 0.561 (1.578)	Data Time 0.001 (0.693)	Loss 3.4860 (3.2869)	Entropy 0.96351 (0.96327)	Top-1 acc 37.891 (45.325)	Top-5 acc 67.188 (69.279)	lr 0.02316
Train [22][40/3239]	Time 0.663 (1.396)	Data Time 0.001 (0.524)	Loss 3.1275 (3.2840)	Entropy 0.96362 (0.96335)	Top-1 acc 50.000 (45.179)	Top-5 acc 73.047 (69.303)	lr 0.02316
Train [22][50/3239]	Time 0.713 (1.731)	Data Time 0.006 (0.422)	Loss 3.3364 (3.2922)	Entropy 0.96331 (0.96341)	Top-1 acc 45.703 (45.190)	Top-5 acc 66.797 (69.240)	lr 0.02316
Train [22][60/3239]	Time 0.638 (1.591)	Data Time 0.002 (0.353)	Loss 3.3566 (3.3093)	Entropy 0.96287 (0.96337)	Top-1 acc 44.922 (44.730)	Top-5 acc 70.312 (68.820)	lr 0.02315
Train [22][70/3239]	Time 0.725 (1.489)	Data Time 0.002 (0.304)	Loss 3.1239 (3.3071)	Entropy 0.96318 (0.96332)	Top-1 acc 49.219 (44.955)	Top-5 acc 74.609 (68.827)	lr 0.02315
Train [22][80/3239]	Time 0.559 (1.409)	Data Time 0.001 (0.267)	Loss 3.3398 (3.3121)	Entropy 0.96277 (0.96327)	Top-1 acc 44.531 (45.038)	Top-5 acc 69.141 (68.789)	lr 0.02315
Train [22][90/3239]	Time 0.603 (1.349)	Data Time 0.003 (0.238)	Loss 3.3050 (3.3131)	Entropy 0.96289 (0.96321)	Top-1 acc 45.703 (44.943)	Top-5 acc 67.969 (68.776)	lr 0.02315
Train [22][100/3239]	Time 0.623 (1.303)	Data Time 0.001 (0.214)	Loss 3.3064 (3.3111)	Entropy 0.96262 (0.96318)	Top-1 acc 44.141 (45.092)	Top-5 acc 66.797 (68.765)	lr 0.02315
Train [22][110/3239]	Time 0.611 (1.262)	Data Time 0.001 (0.195)	Loss 3.3492 (3.3132)	Entropy 0.96251 (0.96313)	Top-1 acc 45.312 (45.003)	Top-5 acc 69.922 (68.782)	lr 0.02315
Train [22][120/3239]	Time 0.567 (1.230)	Data Time 0.001 (0.179)	Loss 3.4643 (3.3147)	Entropy 0.96235 (0.96308)	Top-1 acc 42.188 (45.041)	Top-5 acc 64.844 (68.711)	lr 0.02315
Train [22][130/3239]	Time 0.634 (1.202)	Data Time 0.001 (0.166)	Loss 3.4275 (3.3192)	Entropy 0.96195 (0.96301)	Top-1 acc 39.453 (44.943)	Top-5 acc 67.188 (68.702)	lr 0.02315
Train [22][140/3239]	Time 0.684 (1.177)	Data Time 0.001 (0.154)	Loss 3.4583 (3.3207)	Entropy 0.96198 (0.96293)	Top-1 acc 39.844 (44.936)	Top-5 acc 67.969 (68.689)	lr 0.02315
Train [22][150/3239]	Time 0.625 (1.156)	Data Time 0.001 (0.144)	Loss 3.2564 (3.3213)	Entropy 0.96233 (0.96287)	Top-1 acc 46.484 (45.002)	Top-5 acc 67.969 (68.685)	lr 0.02315
Train [22][160/3239]	Time 0.613 (1.137)	Data Time 0.002 (0.135)	Loss 3.2723 (3.3212)	Entropy 0.96228 (0.96284)	Top-1 acc 48.047 (44.966)	Top-5 acc 69.922 (68.660)	lr 0.02315
Train [22][170/3239]	Time 0.600 (1.120)	Data Time 0.001 (0.127)	Loss 3.2618 (3.3170)	Entropy 0.96238 (0.96280)	Top-1 acc 48.047 (45.059)	Top-5 acc 71.484 (68.752)	lr 0.02315
Train [22][180/3239]	Time 0.575 (1.104)	Data Time 0.001 (0.120)	Loss 3.0354 (3.3172)	Entropy 0.96241 (0.96277)	Top-1 acc 51.953 (45.051)	Top-5 acc 73.828 (68.705)	lr 0.02315
Train [22][190/3239]	Time 0.586 (1.090)	Data Time 0.002 (0.114)	Loss 3.2964 (3.3250)	Entropy 0.96260 (0.96276)	Top-1 acc 46.875 (44.895)	Top-5 acc 67.969 (68.533)	lr 0.02315
Train [22][200/3239]	Time 0.583 (1.076)	Data Time 0.001 (0.109)	Loss 3.2388 (3.3239)	Entropy 0.96231 (0.96274)	Top-1 acc 45.312 (44.922)	Top-5 acc 69.922 (68.546)	lr 0.02315
Train [22][210/3239]	Time 0.655 (1.066)	Data Time 0.001 (0.104)	Loss 3.2801 (3.3219)	Entropy 0.96240 (0.96272)	Top-1 acc 47.656 (44.939)	Top-5 acc 70.703 (68.632)	lr 0.02315
Train [22][220/3239]	Time 0.611 (1.056)	Data Time 0.001 (0.099)	Loss 3.2007 (3.3229)	Entropy 0.96268 (0.96271)	Top-1 acc 47.266 (44.904)	Top-5 acc 71.484 (68.607)	lr 0.02315
Train [22][230/3239]	Time 0.688 (1.047)	Data Time 0.002 (0.095)	Loss 3.3223 (3.3215)	Entropy 0.96251 (0.96271)	Top-1 acc 42.969 (44.961)	Top-5 acc 66.797 (68.642)	lr 0.02315
Train [22][240/3239]	Time 0.606 (1.039)	Data Time 0.001 (0.091)	Loss 3.2456 (3.3212)	Entropy 0.96210 (0.96269)	Top-1 acc 43.750 (44.906)	Top-5 acc 68.750 (68.638)	lr 0.02315
Train [22][250/3239]	Time 0.640 (1.032)	Data Time 0.001 (0.087)	Loss 3.4085 (3.3224)	Entropy 0.96225 (0.96267)	Top-1 acc 42.188 (44.874)	Top-5 acc 63.672 (68.638)	lr 0.02314
Train [22][260/3239]	Time 0.587 (1.025)	Data Time 0.001 (0.084)	Loss 3.4340 (3.3239)	Entropy 0.96181 (0.96265)	Top-1 acc 39.062 (44.807)	Top-5 acc 69.141 (68.623)	lr 0.02314
Train [22][270/3239]	Time 0.631 (1.019)	Data Time 0.001 (0.081)	Loss 3.3018 (3.3255)	Entropy 0.96161 (0.96262)	Top-1 acc 46.875 (44.791)	Top-5 acc 69.922 (68.617)	lr 0.02314
Train [22][280/3239]	Time 0.614 (1.013)	Data Time 0.001 (0.078)	Loss 3.0723 (3.3271)	Entropy 0.96161 (0.96258)	Top-1 acc 50.000 (44.743)	Top-5 acc 75.391 (68.572)	lr 0.02314
Train [22][290/3239]	Time 0.637 (1.008)	Data Time 0.001 (0.076)	Loss 3.2438 (3.3265)	Entropy 0.96143 (0.96255)	Top-1 acc 49.609 (44.777)	Top-5 acc 71.094 (68.617)	lr 0.02314
Train [22][300/3239]	Time 0.671 (1.003)	Data Time 0.001 (0.073)	Loss 3.3116 (3.3257)	Entropy 0.96143 (0.96251)	Top-1 acc 44.531 (44.817)	Top-5 acc 70.703 (68.634)	lr 0.02314
Train [22][310/3239]	Time 0.572 (0.998)	Data Time 0.001 (0.071)	Loss 3.1832 (3.3226)	Entropy 0.96159 (0.96247)	Top-1 acc 49.219 (44.907)	Top-5 acc 72.656 (68.696)	lr 0.02314
Train [22][320/3239]	Time 0.590 (0.994)	Data Time 0.001 (0.069)	Loss 3.4209 (3.3223)	Entropy 0.96160 (0.96245)	Top-1 acc 42.969 (44.905)	Top-5 acc 68.750 (68.695)	lr 0.02314
Train [22][330/3239]	Time 0.606 (0.990)	Data Time 0.001 (0.067)	Loss 3.2829 (3.3229)	Entropy 0.96112 (0.96241)	Top-1 acc 46.484 (44.888)	Top-5 acc 68.750 (68.691)	lr 0.02314
Train [22][340/3239]	Time 0.577 (0.986)	Data Time 0.001 (0.065)	Loss 3.2953 (3.3252)	Entropy 0.96066 (0.96237)	Top-1 acc 44.922 (44.816)	Top-5 acc 69.141 (68.638)	lr 0.02314
Train [22][350/3239]	Time 0.601 (0.982)	Data Time 0.001 (0.063)	Loss 3.3076 (3.3254)	Entropy 0.96092 (0.96232)	Top-1 acc 45.703 (44.836)	Top-5 acc 69.922 (68.625)	lr 0.02314
Train [22][360/3239]	Time 0.554 (0.978)	Data Time 0.001 (0.061)	Loss 3.3042 (3.3244)	Entropy 0.96115 (0.96229)	Top-1 acc 44.531 (44.869)	Top-5 acc 68.359 (68.645)	lr 0.02314
Train [22][370/3239]	Time 0.594 (0.975)	Data Time 0.001 (0.060)	Loss 3.4826 (3.3251)	Entropy 0.96119 (0.96225)	Top-1 acc 39.844 (44.852)	Top-5 acc 65.234 (68.623)	lr 0.02314
Train [22][380/3239]	Time 0.610 (0.971)	Data Time 0.001 (0.058)	Loss 3.1417 (3.3239)	Entropy 0.96145 (0.96223)	Top-1 acc 48.828 (44.861)	Top-5 acc 72.656 (68.664)	lr 0.02314
Train [22][390/3239]	Time 0.692 (0.968)	Data Time 0.001 (0.057)	Loss 3.2538 (3.3226)	Entropy 0.96158 (0.96221)	Top-1 acc 44.141 (44.885)	Top-5 acc 69.141 (68.685)	lr 0.02314
Train [22][400/3239]	Time 0.601 (0.965)	Data Time 0.001 (0.055)	Loss 3.0231 (3.3233)	Entropy 0.96155 (0.96220)	Top-1 acc 49.219 (44.894)	Top-5 acc 76.172 (68.684)	lr 0.02314
Train [22][410/3239]	Time 0.636 (0.963)	Data Time 0.002 (0.054)	Loss 3.4886 (3.3213)	Entropy 0.96180 (0.96218)	Top-1 acc 43.750 (44.954)	Top-5 acc 65.625 (68.720)	lr 0.02314
Train [22][420/3239]	Time 0.610 (0.961)	Data Time 0.001 (0.053)	Loss 3.2475 (3.3203)	Entropy 0.96165 (0.96217)	Top-1 acc 48.828 (44.981)	Top-5 acc 69.141 (68.739)	lr 0.02314
Train [22][430/3239]	Time 0.607 (0.958)	Data Time 0.001 (0.052)	Loss 3.2321 (3.3213)	Entropy 0.96152 (0.96216)	Top-1 acc 44.531 (44.979)	Top-5 acc 68.750 (68.723)	lr 0.02314
Train [22][440/3239]	Time 0.616 (0.957)	Data Time 0.001 (0.051)	Loss 3.1258 (3.3201)	Entropy 0.96140 (0.96214)	Top-1 acc 50.000 (45.007)	Top-5 acc 71.875 (68.744)	lr 0.02313
Train [22][450/3239]	Time 0.631 (0.954)	Data Time 0.001 (0.049)	Loss 3.2853 (3.3199)	Entropy 0.96144 (0.96213)	Top-1 acc 41.797 (45.015)	Top-5 acc 68.359 (68.736)	lr 0.02313
Train [22][460/3239]	Time 0.711 (0.952)	Data Time 0.001 (0.048)	Loss 3.5107 (3.3207)	Entropy 0.96131 (0.96211)	Top-1 acc 37.500 (44.980)	Top-5 acc 62.500 (68.697)	lr 0.02313
Train [22][470/3239]	Time 0.612 (0.951)	Data Time 0.001 (0.047)	Loss 3.1918 (3.3194)	Entropy 0.96153 (0.96209)	Top-1 acc 50.391 (45.016)	Top-5 acc 71.484 (68.722)	lr 0.02313
Train [22][480/3239]	Time 0.609 (0.949)	Data Time 0.001 (0.046)	Loss 3.5117 (3.3201)	Entropy 0.96172 (0.96208)	Top-1 acc 43.359 (45.014)	Top-5 acc 60.547 (68.703)	lr 0.02313
Train [22][490/3239]	Time 0.591 (0.947)	Data Time 0.001 (0.046)	Loss 3.2383 (3.3196)	Entropy 0.96169 (0.96208)	Top-1 acc 46.094 (45.013)	Top-5 acc 70.312 (68.704)	lr 0.02313
Train [22][500/3239]	Time 0.604 (0.946)	Data Time 0.001 (0.045)	Loss 3.2560 (3.3193)	Entropy 0.96163 (0.96207)	Top-1 acc 44.531 (45.013)	Top-5 acc 71.094 (68.713)	lr 0.02313
Train [22][510/3239]	Time 0.623 (0.944)	Data Time 0.001 (0.044)	Loss 3.3133 (3.3204)	Entropy 0.96128 (0.96206)	Top-1 acc 46.094 (44.992)	Top-5 acc 72.656 (68.696)	lr 0.02313
Train [22][520/3239]	Time 0.581 (0.942)	Data Time 0.001 (0.043)	Loss 3.4367 (3.3204)	Entropy 0.96106 (0.96204)	Top-1 acc 39.844 (45.003)	Top-5 acc 66.797 (68.695)	lr 0.02313
Train [22][530/3239]	Time 0.676 (0.940)	Data Time 0.001 (0.042)	Loss 3.3488 (3.3203)	Entropy 0.96105 (0.96202)	Top-1 acc 42.969 (44.992)	Top-5 acc 70.312 (68.696)	lr 0.02313
Train [22][540/3239]	Time 0.622 (0.938)	Data Time 0.001 (0.042)	Loss 3.2500 (3.3195)	Entropy 0.96038 (0.96200)	Top-1 acc 45.703 (44.996)	Top-5 acc 71.484 (68.706)	lr 0.02313
Train [22][550/3239]	Time 0.642 (0.936)	Data Time 0.001 (0.041)	Loss 3.4822 (3.3206)	Entropy 0.96045 (0.96197)	Top-1 acc 41.016 (44.976)	Top-5 acc 65.625 (68.697)	lr 0.02313
Train [22][560/3239]	Time 0.578 (0.935)	Data Time 0.001 (0.040)	Loss 3.3135 (3.3213)	Entropy 0.96042 (0.96194)	Top-1 acc 44.531 (44.969)	Top-5 acc 71.094 (68.680)	lr 0.02313
Train [22][570/3239]	Time 0.624 (0.934)	Data Time 0.001 (0.039)	Loss 3.4018 (3.3211)	Entropy 0.96004 (0.96192)	Top-1 acc 45.703 (44.983)	Top-5 acc 69.141 (68.672)	lr 0.02313
Train [22][580/3239]	Time 0.639 (0.933)	Data Time 0.002 (0.039)	Loss 3.3825 (3.3216)	Entropy 0.95999 (0.96188)	Top-1 acc 43.750 (44.965)	Top-5 acc 67.969 (68.654)	lr 0.02313
Train [22][590/3239]	Time 0.619 (0.932)	Data Time 0.001 (0.038)	Loss 3.2527 (3.3202)	Entropy 0.96040 (0.96186)	Top-1 acc 46.094 (44.995)	Top-5 acc 71.094 (68.698)	lr 0.02313
Train [22][600/3239]	Time 0.617 (0.931)	Data Time 0.001 (0.038)	Loss 3.3112 (3.3215)	Entropy 0.96084 (0.96183)	Top-1 acc 43.359 (44.969)	Top-5 acc 71.484 (68.673)	lr 0.02313
Train [22][610/3239]	Time 0.593 (0.930)	Data Time 0.001 (0.037)	Loss 3.5179 (3.3234)	Entropy 0.96044 (0.96181)	Top-1 acc 41.016 (44.921)	Top-5 acc 64.844 (68.637)	lr 0.02313
Train [22][620/3239]	Time 0.689 (0.929)	Data Time 0.002 (0.036)	Loss 3.1721 (3.3228)	Entropy 0.96081 (0.96179)	Top-1 acc 44.141 (44.925)	Top-5 acc 71.094 (68.652)	lr 0.02313
Train [22][630/3239]	Time 0.627 (0.928)	Data Time 0.001 (0.036)	Loss 3.3431 (3.3235)	Entropy 0.96033 (0.96177)	Top-1 acc 44.141 (44.909)	Top-5 acc 68.750 (68.647)	lr 0.02312
Train [22][640/3239]	Time 0.643 (0.927)	Data Time 0.001 (0.035)	Loss 3.2775 (3.3226)	Entropy 0.96085 (0.96175)	Top-1 acc 47.656 (44.946)	Top-5 acc 67.969 (68.676)	lr 0.02312
Train [22][650/3239]	Time 0.611 (0.926)	Data Time 0.001 (0.035)	Loss 3.1943 (3.3216)	Entropy 0.96059 (0.96174)	Top-1 acc 43.359 (44.965)	Top-5 acc 71.484 (68.701)	lr 0.02312
Train [22][660/3239]	Time 0.568 (0.926)	Data Time 0.002 (0.034)	Loss 3.4806 (3.3216)	Entropy 0.96067 (0.96172)	Top-1 acc 42.969 (44.977)	Top-5 acc 67.188 (68.704)	lr 0.02312
Train [22][670/3239]	Time 0.586 (0.924)	Data Time 0.001 (0.034)	Loss 3.5799 (3.3212)	Entropy 0.96091 (0.96171)	Top-1 acc 36.719 (44.997)	Top-5 acc 65.625 (68.717)	lr 0.02312
Train [22][680/3239]	Time 0.632 (0.923)	Data Time 0.001 (0.033)	Loss 3.3462 (3.3214)	Entropy 0.96037 (0.96169)	Top-1 acc 44.922 (44.983)	Top-5 acc 67.188 (68.712)	lr 0.02312
Train [22][690/3239]	Time 0.707 (0.923)	Data Time 0.001 (0.033)	Loss 3.2155 (3.3217)	Entropy 0.95995 (0.96167)	Top-1 acc 48.438 (44.972)	Top-5 acc 71.484 (68.706)	lr 0.02312
Train [22][700/3239]	Time 0.623 (0.921)	Data Time 0.002 (0.032)	Loss 3.3107 (3.3224)	Entropy 0.96003 (0.96165)	Top-1 acc 47.266 (44.970)	Top-5 acc 67.578 (68.691)	lr 0.02312
Train [22][710/3239]	Time 0.574 (0.953)	Data Time 0.002 (0.032)	Loss 3.3121 (3.3217)	Entropy 0.95957 (0.96162)	Top-1 acc 44.141 (44.988)	Top-5 acc 70.312 (68.703)	lr 0.02312
Train [22][720/3239]	Time 0.610 (0.952)	Data Time 0.002 (0.032)	Loss 3.1712 (3.3214)	Entropy 0.95943 (0.96159)	Top-1 acc 50.391 (45.005)	Top-5 acc 73.828 (68.709)	lr 0.02312
Train [22][730/3239]	Time 0.614 (0.950)	Data Time 0.001 (0.031)	Loss 3.4141 (3.3214)	Entropy 0.95897 (0.96156)	Top-1 acc 40.625 (44.990)	Top-5 acc 68.359 (68.708)	lr 0.02312
Train [22][740/3239]	Time 0.617 (0.949)	Data Time 0.003 (0.031)	Loss 3.5420 (3.3227)	Entropy 0.95912 (0.96153)	Top-1 acc 41.406 (44.974)	Top-5 acc 65.234 (68.689)	lr 0.02312
Train [22][750/3239]	Time 0.591 (0.948)	Data Time 0.002 (0.031)	Loss 3.1184 (3.3226)	Entropy 0.95866 (0.96149)	Top-1 acc 46.094 (44.976)	Top-5 acc 72.656 (68.681)	lr 0.02312
Train [22][760/3239]	Time 0.590 (0.947)	Data Time 0.001 (0.030)	Loss 3.2178 (3.3227)	Entropy 0.95852 (0.96146)	Top-1 acc 50.391 (44.978)	Top-5 acc 68.359 (68.674)	lr 0.02312
Train [22][770/3239]	Time 0.588 (0.946)	Data Time 0.001 (0.030)	Loss 3.2718 (3.3219)	Entropy 0.95818 (0.96142)	Top-1 acc 47.656 (44.998)	Top-5 acc 70.703 (68.705)	lr 0.02312
Train [22][780/3239]	Time 0.716 (0.945)	Data Time 0.001 (0.029)	Loss 3.1522 (3.3215)	Entropy 0.95837 (0.96137)	Top-1 acc 46.875 (45.008)	Top-5 acc 75.391 (68.725)	lr 0.02312
Train [22][790/3239]	Time 0.568 (0.944)	Data Time 0.001 (0.029)	Loss 3.4800 (3.3213)	Entropy 0.95783 (0.96133)	Top-1 acc 41.406 (45.000)	Top-5 acc 65.625 (68.726)	lr 0.02312
Train [22][800/3239]	Time 0.583 (0.943)	Data Time 0.001 (0.029)	Loss 3.5141 (3.3220)	Entropy 0.95822 (0.96129)	Top-1 acc 37.891 (44.980)	Top-5 acc 66.797 (68.715)	lr 0.02312
Train [22][810/3239]	Time 0.620 (0.943)	Data Time 0.001 (0.028)	Loss 3.3004 (3.3231)	Entropy 0.95836 (0.96125)	Top-1 acc 43.359 (44.950)	Top-5 acc 69.531 (68.696)	lr 0.02312
Train [22][820/3239]	Time 0.518 (0.942)	Data Time 0.001 (0.028)	Loss 3.2517 (3.3227)	Entropy 0.95832 (0.96122)	Top-1 acc 48.438 (44.974)	Top-5 acc 70.312 (68.699)	lr 0.02311
Train [22][830/3239]	Time 0.639 (0.940)	Data Time 0.001 (0.028)	Loss 3.4449 (3.3228)	Entropy 0.95796 (0.96118)	Top-1 acc 43.750 (44.992)	Top-5 acc 64.844 (68.694)	lr 0.02311
Train [22][840/3239]	Time 0.629 (0.939)	Data Time 0.001 (0.028)	Loss 3.3580 (3.3228)	Entropy 0.95776 (0.96115)	Top-1 acc 45.703 (44.992)	Top-5 acc 67.969 (68.696)	lr 0.02311
Train [22][850/3239]	Time 0.761 (0.938)	Data Time 0.001 (0.027)	Loss 3.1825 (3.3228)	Entropy 0.95758 (0.96111)	Top-1 acc 50.000 (45.004)	Top-5 acc 70.312 (68.700)	lr 0.02311
Train [22][860/3239]	Time 0.592 (0.937)	Data Time 0.001 (0.027)	Loss 3.4570 (3.3226)	Entropy 0.95755 (0.96106)	Top-1 acc 41.016 (45.011)	Top-5 acc 66.016 (68.708)	lr 0.02311
Train [22][870/3239]	Time 0.610 (0.936)	Data Time 0.001 (0.027)	Loss 3.3345 (3.3220)	Entropy 0.95762 (0.96102)	Top-1 acc 46.094 (45.017)	Top-5 acc 70.703 (68.728)	lr 0.02311
Train [22][880/3239]	Time 0.633 (0.936)	Data Time 0.001 (0.026)	Loss 3.2980 (3.3224)	Entropy 0.95805 (0.96099)	Top-1 acc 48.828 (45.013)	Top-5 acc 68.359 (68.727)	lr 0.02311
Train [22][890/3239]	Time 0.608 (0.935)	Data Time 0.001 (0.026)	Loss 3.2862 (3.3219)	Entropy 0.95813 (0.96095)	Top-1 acc 45.312 (45.033)	Top-5 acc 67.188 (68.736)	lr 0.02311
Train [22][900/3239]	Time 0.584 (0.934)	Data Time 0.001 (0.026)	Loss 3.5078 (3.3220)	Entropy 0.95784 (0.96092)	Top-1 acc 42.969 (45.041)	Top-5 acc 63.672 (68.740)	lr 0.02311
Train [22][910/3239]	Time 0.597 (0.934)	Data Time 0.001 (0.026)	Loss 3.3204 (3.3219)	Entropy 0.95793 (0.96089)	Top-1 acc 43.750 (45.041)	Top-5 acc 68.359 (68.745)	lr 0.02311
Train [22][920/3239]	Time 0.634 (0.933)	Data Time 0.001 (0.025)	Loss 3.1725 (3.3213)	Entropy 0.95809 (0.96086)	Top-1 acc 48.047 (45.052)	Top-5 acc 73.828 (68.764)	lr 0.02311
Train [22][930/3239]	Time 0.597 (0.932)	Data Time 0.001 (0.025)	Loss 3.3110 (3.3213)	Entropy 0.95801 (0.96082)	Top-1 acc 42.969 (45.044)	Top-5 acc 69.531 (68.773)	lr 0.02311
Train [22][940/3239]	Time 0.661 (0.932)	Data Time 0.001 (0.025)	Loss 3.1897 (3.3210)	Entropy 0.95764 (0.96079)	Top-1 acc 47.656 (45.042)	Top-5 acc 71.875 (68.783)	lr 0.02311
Train [22][950/3239]	Time 0.649 (0.931)	Data Time 0.001 (0.025)	Loss 3.2589 (3.3210)	Entropy 0.95795 (0.96076)	Top-1 acc 46.875 (45.029)	Top-5 acc 69.922 (68.789)	lr 0.02311
Train [22][960/3239]	Time 0.619 (0.930)	Data Time 0.002 (0.024)	Loss 3.2773 (3.3211)	Entropy 0.95760 (0.96073)	Top-1 acc 45.312 (45.041)	Top-5 acc 70.703 (68.788)	lr 0.02311
Train [22][970/3239]	Time 0.592 (0.930)	Data Time 0.001 (0.024)	Loss 3.5293 (3.3220)	Entropy 0.95766 (0.96070)	Top-1 acc 39.844 (45.021)	Top-5 acc 62.891 (68.757)	lr 0.02311
Train [22][980/3239]	Time 0.538 (0.929)	Data Time 0.001 (0.024)	Loss 3.4011 (3.3222)	Entropy 0.95764 (0.96067)	Top-1 acc 42.578 (45.013)	Top-5 acc 68.750 (68.755)	lr 0.02311
Train [22][990/3239]	Time 0.599 (0.928)	Data Time 0.001 (0.024)	Loss 3.2767 (3.3229)	Entropy 0.95727 (0.96064)	Top-1 acc 44.922 (45.009)	Top-5 acc 69.922 (68.744)	lr 0.02311
Train [22][1000/3239]	Time 0.622 (0.927)	Data Time 0.001 (0.023)	Loss 3.5232 (3.3230)	Entropy 0.95698 (0.96060)	Top-1 acc 35.547 (44.997)	Top-5 acc 66.016 (68.749)	lr 0.02310
Train [22][1010/3239]	Time 0.716 (0.927)	Data Time 0.001 (0.023)	Loss 3.1423 (3.3231)	Entropy 0.95676 (0.96056)	Top-1 acc 49.219 (44.985)	Top-5 acc 71.875 (68.753)	lr 0.02310
Train [22][1020/3239]	Time 0.437 (0.926)	Data Time 0.001 (0.023)	Loss 3.3685 (3.3235)	Entropy 0.95649 (0.96053)	Top-1 acc 39.844 (44.968)	Top-5 acc 66.016 (68.747)	lr 0.02310
Train [22][1030/3239]	Time 0.619 (0.925)	Data Time 0.001 (0.023)	Loss 3.2247 (3.3230)	Entropy 0.95638 (0.96049)	Top-1 acc 46.094 (44.975)	Top-5 acc 71.484 (68.765)	lr 0.02310
Train [22][1040/3239]	Time 0.610 (0.925)	Data Time 0.001 (0.023)	Loss 3.4616 (3.3232)	Entropy 0.95611 (0.96045)	Top-1 acc 42.188 (44.972)	Top-5 acc 64.844 (68.755)	lr 0.02310
Train [22][1050/3239]	Time 0.617 (0.924)	Data Time 0.001 (0.022)	Loss 3.4314 (3.3227)	Entropy 0.95597 (0.96041)	Top-1 acc 42.188 (44.988)	Top-5 acc 64.844 (68.763)	lr 0.02310
Train [22][1060/3239]	Time 0.620 (0.924)	Data Time 0.001 (0.022)	Loss 3.2647 (3.3227)	Entropy 0.95572 (0.96037)	Top-1 acc 43.750 (44.984)	Top-5 acc 69.141 (68.759)	lr 0.02310
Train [22][1070/3239]	Time 0.586 (0.923)	Data Time 0.001 (0.022)	Loss 3.3007 (3.3225)	Entropy 0.95617 (0.96032)	Top-1 acc 44.141 (44.986)	Top-5 acc 66.797 (68.757)	lr 0.02310
Train [22][1080/3239]	Time 0.606 (0.923)	Data Time 0.001 (0.022)	Loss 3.3614 (3.3226)	Entropy 0.95602 (0.96028)	Top-1 acc 47.266 (44.987)	Top-5 acc 69.922 (68.759)	lr 0.02310
Train [22][1090/3239]	Time 0.592 (0.922)	Data Time 0.001 (0.022)	Loss 3.3354 (3.3234)	Entropy 0.95602 (0.96025)	Top-1 acc 47.656 (44.968)	Top-5 acc 67.188 (68.745)	lr 0.02310
Train [22][1100/3239]	Time 0.607 (0.922)	Data Time 0.001 (0.021)	Loss 3.3045 (3.3233)	Entropy 0.95558 (0.96021)	Top-1 acc 44.141 (44.971)	Top-5 acc 71.094 (68.742)	lr 0.02310
Train [22][1110/3239]	Time 0.621 (0.921)	Data Time 0.001 (0.021)	Loss 3.4988 (3.3237)	Entropy 0.95530 (0.96017)	Top-1 acc 42.578 (44.964)	Top-5 acc 63.281 (68.727)	lr 0.02310
Train [22][1120/3239]	Time 0.618 (0.920)	Data Time 0.001 (0.021)	Loss 3.2470 (3.3240)	Entropy 0.95481 (0.96012)	Top-1 acc 46.094 (44.945)	Top-5 acc 73.438 (68.732)	lr 0.02310
Train [22][1130/3239]	Time 0.631 (0.920)	Data Time 0.001 (0.021)	Loss 3.2244 (3.3241)	Entropy 0.95443 (0.96007)	Top-1 acc 44.922 (44.932)	Top-5 acc 71.875 (68.729)	lr 0.02310
Train [22][1140/3239]	Time 0.547 (0.919)	Data Time 0.001 (0.021)	Loss 3.4656 (3.3239)	Entropy 0.95450 (0.96002)	Top-1 acc 43.359 (44.926)	Top-5 acc 65.625 (68.742)	lr 0.02310
Train [22][1150/3239]	Time 0.611 (0.919)	Data Time 0.001 (0.021)	Loss 3.4646 (3.3247)	Entropy 0.95461 (0.95998)	Top-1 acc 41.016 (44.911)	Top-5 acc 64.844 (68.730)	lr 0.02310
Train [22][1160/3239]	Time 0.624 (0.918)	Data Time 0.001 (0.020)	Loss 3.3380 (3.3243)	Entropy 0.95495 (0.95993)	Top-1 acc 44.141 (44.915)	Top-5 acc 67.969 (68.747)	lr 0.02310
Train [22][1170/3239]	Time 0.704 (0.918)	Data Time 0.001 (0.020)	Loss 3.2888 (3.3240)	Entropy 0.95421 (0.95989)	Top-1 acc 43.750 (44.924)	Top-5 acc 69.141 (68.753)	lr 0.02310
Train [22][1180/3239]	Time 0.490 (0.917)	Data Time 0.001 (0.020)	Loss 3.3683 (3.3242)	Entropy 0.95385 (0.95984)	Top-1 acc 43.750 (44.910)	Top-5 acc 65.625 (68.744)	lr 0.02310
Train [22][1190/3239]	Time 0.571 (0.917)	Data Time 0.002 (0.020)	Loss 3.4812 (3.3247)	Entropy 0.95331 (0.95979)	Top-1 acc 44.141 (44.898)	Top-5 acc 64.844 (68.731)	lr 0.02309
Train [22][1200/3239]	Time 0.616 (0.916)	Data Time 0.002 (0.020)	Loss 3.3504 (3.3244)	Entropy 0.95325 (0.95973)	Top-1 acc 43.750 (44.905)	Top-5 acc 65.625 (68.729)	lr 0.02309
Train [22][1210/3239]	Time 0.586 (0.916)	Data Time 0.001 (0.020)	Loss 3.2217 (3.3243)	Entropy 0.95320 (0.95968)	Top-1 acc 44.141 (44.904)	Top-5 acc 70.703 (68.738)	lr 0.02309
Train [22][1220/3239]	Time 0.641 (0.916)	Data Time 0.001 (0.020)	Loss 3.2489 (3.3243)	Entropy 0.95271 (0.95962)	Top-1 acc 44.922 (44.904)	Top-5 acc 71.484 (68.738)	lr 0.02309
Train [22][1230/3239]	Time 0.594 (0.915)	Data Time 0.001 (0.019)	Loss 3.4754 (3.3250)	Entropy 0.95299 (0.95957)	Top-1 acc 39.844 (44.885)	Top-5 acc 67.578 (68.726)	lr 0.02309
Train [22][1240/3239]	Time 0.683 (0.915)	Data Time 0.001 (0.019)	Loss 3.2521 (3.3252)	Entropy 0.95256 (0.95951)	Top-1 acc 42.969 (44.880)	Top-5 acc 69.922 (68.723)	lr 0.02309
Train [22][1250/3239]	Time 0.595 (0.914)	Data Time 0.001 (0.019)	Loss 3.2355 (3.3252)	Entropy 0.95274 (0.95946)	Top-1 acc 49.219 (44.876)	Top-5 acc 71.484 (68.730)	lr 0.02309
Train [22][1260/3239]	Time 0.623 (0.914)	Data Time 0.001 (0.019)	Loss 3.2830 (3.3252)	Entropy 0.95232 (0.95940)	Top-1 acc 48.438 (44.881)	Top-5 acc 66.406 (68.728)	lr 0.02309
Train [22][1270/3239]	Time 0.640 (0.914)	Data Time 0.002 (0.019)	Loss 3.1431 (3.3245)	Entropy 0.95227 (0.95935)	Top-1 acc 48.438 (44.895)	Top-5 acc 68.750 (68.731)	lr 0.02309
Train [22][1280/3239]	Time 0.644 (0.913)	Data Time 0.001 (0.019)	Loss 3.1938 (3.3246)	Entropy 0.95189 (0.95929)	Top-1 acc 50.781 (44.899)	Top-5 acc 69.922 (68.726)	lr 0.02309
Train [22][1290/3239]	Time 0.645 (0.913)	Data Time 0.001 (0.019)	Loss 3.1358 (3.3241)	Entropy 0.95155 (0.95923)	Top-1 acc 49.219 (44.908)	Top-5 acc 70.312 (68.738)	lr 0.02309
Train [22][1300/3239]	Time 0.585 (0.913)	Data Time 0.001 (0.018)	Loss 3.3859 (3.3237)	Entropy 0.95162 (0.95918)	Top-1 acc 41.016 (44.920)	Top-5 acc 66.406 (68.743)	lr 0.02309
Train [22][1310/3239]	Time 0.618 (0.912)	Data Time 0.001 (0.018)	Loss 3.0716 (3.3242)	Entropy 0.95151 (0.95912)	Top-1 acc 49.609 (44.903)	Top-5 acc 75.000 (68.734)	lr 0.02309
Train [22][1320/3239]	Time 0.592 (0.912)	Data Time 0.001 (0.018)	Loss 3.3593 (3.3243)	Entropy 0.95138 (0.95906)	Top-1 acc 44.141 (44.889)	Top-5 acc 67.969 (68.731)	lr 0.02309
Train [22][1330/3239]	Time 0.710 (0.912)	Data Time 0.002 (0.018)	Loss 3.3009 (3.3240)	Entropy 0.95137 (0.95900)	Top-1 acc 47.656 (44.891)	Top-5 acc 70.312 (68.740)	lr 0.02309
Train [22][1340/3239]	Time 0.448 (0.911)	Data Time 0.001 (0.018)	Loss 3.2805 (3.3240)	Entropy 0.95173 (0.95895)	Top-1 acc 45.312 (44.897)	Top-5 acc 68.750 (68.745)	lr 0.02309
Train [22][1350/3239]	Time 0.577 (0.911)	Data Time 0.001 (0.018)	Loss 3.4515 (3.3238)	Entropy 0.95138 (0.95889)	Top-1 acc 40.234 (44.902)	Top-5 acc 66.797 (68.752)	lr 0.02309
Train [22][1360/3239]	Time 0.738 (0.928)	Data Time 0.004 (0.018)	Loss 3.3778 (3.3239)	Entropy 0.95085 (0.95884)	Top-1 acc 41.797 (44.898)	Top-5 acc 70.312 (68.752)	lr 0.02309
Train [22][1370/3239]	Time 0.601 (0.928)	Data Time 0.002 (0.018)	Loss 3.2482 (3.3242)	Entropy 0.95101 (0.95878)	Top-1 acc 49.219 (44.891)	Top-5 acc 70.312 (68.743)	lr 0.02309
Train [22][1380/3239]	Time 0.603 (0.927)	Data Time 0.001 (0.018)	Loss 3.2091 (3.3243)	Entropy 0.95096 (0.95872)	Top-1 acc 50.000 (44.892)	Top-5 acc 70.703 (68.734)	lr 0.02308
Train [22][1390/3239]	Time 0.618 (0.927)	Data Time 0.001 (0.017)	Loss 3.7096 (3.3247)	Entropy 0.95118 (0.95867)	Top-1 acc 36.719 (44.882)	Top-5 acc 62.891 (68.730)	lr 0.02308
Train [22][1400/3239]	Time 0.663 (0.926)	Data Time 0.001 (0.017)	Loss 3.3738 (3.3250)	Entropy 0.95140 (0.95861)	Top-1 acc 42.578 (44.874)	Top-5 acc 69.531 (68.724)	lr 0.02308
Train [22][1410/3239]	Time 0.588 (0.926)	Data Time 0.001 (0.017)	Loss 3.2940 (3.3248)	Entropy 0.95081 (0.95856)	Top-1 acc 44.922 (44.881)	Top-5 acc 69.531 (68.728)	lr 0.02308
Train [22][1420/3239]	Time 0.634 (0.925)	Data Time 0.001 (0.017)	Loss 3.4282 (3.3250)	Entropy 0.95060 (0.95851)	Top-1 acc 42.969 (44.876)	Top-5 acc 65.625 (68.720)	lr 0.02308
Train [22][1430/3239]	Time 0.609 (0.925)	Data Time 0.001 (0.017)	Loss 3.4423 (3.3256)	Entropy 0.95103 (0.95845)	Top-1 acc 44.922 (44.872)	Top-5 acc 66.016 (68.712)	lr 0.02308
Train [22][1440/3239]	Time 0.603 (0.925)	Data Time 0.001 (0.017)	Loss 3.2985 (3.3253)	Entropy 0.95128 (0.95840)	Top-1 acc 44.531 (44.877)	Top-5 acc 66.797 (68.708)	lr 0.02308
Train [22][1450/3239]	Time 0.602 (0.924)	Data Time 0.001 (0.017)	Loss 3.2772 (3.3249)	Entropy 0.95119 (0.95835)	Top-1 acc 43.750 (44.880)	Top-5 acc 69.531 (68.717)	lr 0.02308
Train [22][1460/3239]	Time 0.604 (0.924)	Data Time 0.001 (0.017)	Loss 3.3780 (3.3251)	Entropy 0.95133 (0.95830)	Top-1 acc 49.609 (44.882)	Top-5 acc 71.484 (68.718)	lr 0.02308
Train [22][1470/3239]	Time 0.613 (0.923)	Data Time 0.001 (0.017)	Loss 2.9619 (3.3245)	Entropy 0.95113 (0.95826)	Top-1 acc 52.734 (44.902)	Top-5 acc 75.000 (68.724)	lr 0.02308
Train [22][1480/3239]	Time 0.582 (0.923)	Data Time 0.001 (0.017)	Loss 3.3027 (3.3245)	Entropy 0.95105 (0.95821)	Top-1 acc 47.656 (44.896)	Top-5 acc 68.750 (68.727)	lr 0.02308
Train [22][1490/3239]	Time 0.714 (0.922)	Data Time 0.001 (0.016)	Loss 3.3433 (3.3245)	Entropy 0.95118 (0.95816)	Top-1 acc 48.047 (44.896)	Top-5 acc 71.484 (68.729)	lr 0.02308
Train [22][1500/3239]	Time 0.606 (0.922)	Data Time 0.001 (0.016)	Loss 3.3114 (3.3246)	Entropy 0.95121 (0.95811)	Top-1 acc 43.750 (44.897)	Top-5 acc 68.750 (68.724)	lr 0.02308
Train [22][1510/3239]	Time 0.564 (0.921)	Data Time 0.001 (0.016)	Loss 3.3934 (3.3248)	Entropy 0.95132 (0.95807)	Top-1 acc 41.406 (44.887)	Top-5 acc 66.016 (68.718)	lr 0.02308
Train [22][1520/3239]	Time 0.632 (0.921)	Data Time 0.001 (0.016)	Loss 3.1417 (3.3244)	Entropy 0.95211 (0.95803)	Top-1 acc 51.172 (44.892)	Top-5 acc 69.922 (68.729)	lr 0.02308
Train [22][1530/3239]	Time 0.638 (0.921)	Data Time 0.002 (0.016)	Loss 3.3121 (3.3246)	Entropy 0.95122 (0.95798)	Top-1 acc 42.578 (44.890)	Top-5 acc 69.922 (68.734)	lr 0.02308
Train [22][1540/3239]	Time 0.657 (0.920)	Data Time 0.001 (0.016)	Loss 3.4363 (3.3244)	Entropy 0.95094 (0.95794)	Top-1 acc 42.578 (44.882)	Top-5 acc 69.141 (68.741)	lr 0.02308
Train [22][1550/3239]	Time 0.621 (0.920)	Data Time 0.002 (0.016)	Loss 3.2685 (3.3248)	Entropy 0.95097 (0.95789)	Top-1 acc 45.703 (44.875)	Top-5 acc 71.094 (68.732)	lr 0.02308
Train [22][1560/3239]	Time 0.711 (0.920)	Data Time 0.001 (0.016)	Loss 3.4537 (3.3251)	Entropy 0.95076 (0.95785)	Top-1 acc 40.625 (44.869)	Top-5 acc 68.359 (68.724)	lr 0.02307
Train [22][1570/3239]	Time 0.576 (0.919)	Data Time 0.001 (0.016)	Loss 3.4644 (3.3252)	Entropy 0.95081 (0.95780)	Top-1 acc 41.406 (44.862)	Top-5 acc 66.016 (68.717)	lr 0.02307
Train [22][1580/3239]	Time 0.600 (0.919)	Data Time 0.001 (0.016)	Loss 3.3152 (3.3257)	Entropy 0.95076 (0.95776)	Top-1 acc 43.750 (44.852)	Top-5 acc 68.750 (68.709)	lr 0.02307
Train [22][1590/3239]	Time 0.651 (0.919)	Data Time 0.001 (0.016)	Loss 3.3420 (3.3258)	Entropy 0.95058 (0.95772)	Top-1 acc 47.266 (44.855)	Top-5 acc 68.359 (68.709)	lr 0.02307
Train [22][1600/3239]	Time 0.618 (0.918)	Data Time 0.001 (0.015)	Loss 3.2881 (3.3253)	Entropy 0.95069 (0.95767)	Top-1 acc 46.094 (44.868)	Top-5 acc 66.797 (68.716)	lr 0.02307
Train [22][1610/3239]	Time 0.617 (0.918)	Data Time 0.001 (0.015)	Loss 3.3731 (3.3251)	Entropy 0.95039 (0.95763)	Top-1 acc 41.016 (44.865)	Top-5 acc 68.750 (68.725)	lr 0.02307
Train [22][1620/3239]	Time 0.608 (0.918)	Data Time 0.001 (0.015)	Loss 3.3045 (3.3250)	Entropy 0.95046 (0.95758)	Top-1 acc 48.438 (44.865)	Top-5 acc 67.969 (68.728)	lr 0.02307
Train [22][1630/3239]	Time 0.655 (0.917)	Data Time 0.001 (0.015)	Loss 3.3437 (3.3249)	Entropy 0.95025 (0.95754)	Top-1 acc 44.141 (44.864)	Top-5 acc 69.922 (68.729)	lr 0.02307
Train [22][1640/3239]	Time 0.606 (0.917)	Data Time 0.001 (0.015)	Loss 3.3156 (3.3252)	Entropy 0.95022 (0.95749)	Top-1 acc 46.484 (44.858)	Top-5 acc 68.750 (68.720)	lr 0.02307
Train [22][1650/3239]	Time 0.605 (0.917)	Data Time 0.003 (0.015)	Loss 3.6135 (3.3252)	Entropy 0.94992 (0.95745)	Top-1 acc 41.016 (44.858)	Top-5 acc 64.062 (68.712)	lr 0.02307
Train [22][1660/3239]	Time 0.575 (0.916)	Data Time 0.001 (0.015)	Loss 3.0859 (3.3249)	Entropy 0.94955 (0.95740)	Top-1 acc 50.000 (44.864)	Top-5 acc 69.531 (68.713)	lr 0.02307
Train [22][1670/3239]	Time 0.603 (0.916)	Data Time 0.003 (0.015)	Loss 3.4448 (3.3248)	Entropy 0.94949 (0.95736)	Top-1 acc 42.969 (44.865)	Top-5 acc 68.359 (68.718)	lr 0.02307
Train [22][1680/3239]	Time 0.597 (0.915)	Data Time 0.001 (0.015)	Loss 3.0492 (3.3245)	Entropy 0.94929 (0.95731)	Top-1 acc 50.781 (44.868)	Top-5 acc 73.047 (68.725)	lr 0.02307
Train [22][1690/3239]	Time 0.544 (0.915)	Data Time 0.001 (0.015)	Loss 3.6070 (3.3244)	Entropy 0.94892 (0.95726)	Top-1 acc 37.500 (44.869)	Top-5 acc 64.844 (68.730)	lr 0.02307
Train [22][1700/3239]	Time 0.616 (0.915)	Data Time 0.001 (0.015)	Loss 3.1388 (3.3245)	Entropy 0.94885 (0.95721)	Top-1 acc 46.875 (44.860)	Top-5 acc 70.703 (68.726)	lr 0.02307
Train [22][1710/3239]	Time 0.610 (0.914)	Data Time 0.001 (0.015)	Loss 3.2811 (3.3243)	Entropy 0.94896 (0.95716)	Top-1 acc 45.703 (44.867)	Top-5 acc 70.312 (68.732)	lr 0.02307
Train [22][1720/3239]	Time 0.659 (0.914)	Data Time 0.002 (0.015)	Loss 3.5762 (3.3245)	Entropy 0.94863 (0.95711)	Top-1 acc 39.844 (44.859)	Top-5 acc 66.406 (68.725)	lr 0.02307
Train [22][1730/3239]	Time 0.594 (0.914)	Data Time 0.001 (0.014)	Loss 3.4901 (3.3242)	Entropy 0.94851 (0.95706)	Top-1 acc 41.016 (44.866)	Top-5 acc 62.500 (68.729)	lr 0.02307
Train [22][1740/3239]	Time 0.579 (0.913)	Data Time 0.002 (0.014)	Loss 3.4538 (3.3240)	Entropy 0.94743 (0.95701)	Top-1 acc 39.062 (44.864)	Top-5 acc 65.625 (68.731)	lr 0.02307
Train [22][1750/3239]	Time 0.619 (0.913)	Data Time 0.001 (0.014)	Loss 3.2535 (3.3239)	Entropy 0.94762 (0.95696)	Top-1 acc 47.266 (44.862)	Top-5 acc 69.922 (68.732)	lr 0.02306
Train [22][1760/3239]	Time 0.581 (0.913)	Data Time 0.001 (0.014)	Loss 3.4889 (3.3243)	Entropy 0.94736 (0.95690)	Top-1 acc 39.453 (44.854)	Top-5 acc 67.188 (68.726)	lr 0.02306
Train [22][1770/3239]	Time 0.590 (0.913)	Data Time 0.001 (0.014)	Loss 3.2521 (3.3242)	Entropy 0.94715 (0.95685)	Top-1 acc 46.875 (44.857)	Top-5 acc 72.266 (68.732)	lr 0.02306
Train [22][1780/3239]	Time 0.621 (0.912)	Data Time 0.001 (0.014)	Loss 3.3732 (3.3239)	Entropy 0.94720 (0.95679)	Top-1 acc 42.969 (44.861)	Top-5 acc 67.188 (68.740)	lr 0.02306
Train [22][1790/3239]	Time 0.707 (0.912)	Data Time 0.001 (0.014)	Loss 3.0798 (3.3238)	Entropy 0.94660 (0.95674)	Top-1 acc 47.266 (44.868)	Top-5 acc 73.047 (68.739)	lr 0.02306
Train [22][1800/3239]	Time 0.584 (0.912)	Data Time 0.001 (0.014)	Loss 3.2473 (3.3237)	Entropy 0.94699 (0.95668)	Top-1 acc 44.531 (44.869)	Top-5 acc 70.703 (68.743)	lr 0.02306
Train [22][1810/3239]	Time 0.568 (0.911)	Data Time 0.001 (0.014)	Loss 3.1894 (3.3240)	Entropy 0.94718 (0.95663)	Top-1 acc 48.828 (44.860)	Top-5 acc 71.875 (68.739)	lr 0.02306
Train [22][1820/3239]	Time 0.589 (0.911)	Data Time 0.001 (0.014)	Loss 3.1993 (3.3240)	Entropy 0.94772 (0.95658)	Top-1 acc 48.047 (44.860)	Top-5 acc 69.531 (68.742)	lr 0.02306
Train [22][1830/3239]	Time 0.629 (0.911)	Data Time 0.001 (0.014)	Loss 3.4765 (3.3240)	Entropy 0.94762 (0.95653)	Top-1 acc 41.016 (44.860)	Top-5 acc 67.188 (68.743)	lr 0.02306
Train [22][1840/3239]	Time 0.574 (0.910)	Data Time 0.001 (0.014)	Loss 3.2679 (3.3241)	Entropy 0.94773 (0.95648)	Top-1 acc 46.094 (44.859)	Top-5 acc 69.922 (68.744)	lr 0.02306
Train [22][1850/3239]	Time 0.583 (0.910)	Data Time 0.001 (0.014)	Loss 3.2237 (3.3241)	Entropy 0.94739 (0.95644)	Top-1 acc 47.266 (44.862)	Top-5 acc 69.922 (68.745)	lr 0.02306
Train [22][1860/3239]	Time 0.609 (0.910)	Data Time 0.001 (0.014)	Loss 3.4348 (3.3240)	Entropy 0.94742 (0.95639)	Top-1 acc 43.359 (44.864)	Top-5 acc 66.797 (68.745)	lr 0.02306
Train [22][1870/3239]	Time 0.664 (0.909)	Data Time 0.001 (0.014)	Loss 3.6208 (3.3240)	Entropy 0.94703 (0.95634)	Top-1 acc 39.844 (44.864)	Top-5 acc 64.453 (68.747)	lr 0.02306
Train [22][1880/3239]	Time 0.595 (0.909)	Data Time 0.001 (0.013)	Loss 3.3921 (3.3241)	Entropy 0.94741 (0.95629)	Top-1 acc 42.578 (44.865)	Top-5 acc 64.062 (68.740)	lr 0.02306
Train [22][1890/3239]	Time 0.622 (0.909)	Data Time 0.001 (0.013)	Loss 3.4613 (3.3239)	Entropy 0.94719 (0.95624)	Top-1 acc 42.969 (44.869)	Top-5 acc 64.453 (68.741)	lr 0.02306
Train [22][1900/3239]	Time 0.631 (0.909)	Data Time 0.001 (0.013)	Loss 3.2307 (3.3239)	Entropy 0.94730 (0.95620)	Top-1 acc 48.438 (44.874)	Top-5 acc 71.484 (68.743)	lr 0.02306
Train [22][1910/3239]	Time 0.592 (0.908)	Data Time 0.001 (0.013)	Loss 3.3048 (3.3241)	Entropy 0.94724 (0.95615)	Top-1 acc 41.016 (44.867)	Top-5 acc 70.703 (68.738)	lr 0.02306
Train [22][1920/3239]	Time 0.576 (0.908)	Data Time 0.001 (0.013)	Loss 3.1620 (3.3238)	Entropy 0.94647 (0.95610)	Top-1 acc 48.438 (44.871)	Top-5 acc 74.609 (68.743)	lr 0.02306
Train [22][1930/3239]	Time 0.618 (0.908)	Data Time 0.001 (0.013)	Loss 3.1433 (3.3237)	Entropy 0.94653 (0.95605)	Top-1 acc 50.391 (44.873)	Top-5 acc 72.656 (68.740)	lr 0.02305
Train [22][1940/3239]	Time 0.616 (0.908)	Data Time 0.001 (0.013)	Loss 3.2755 (3.3236)	Entropy 0.94629 (0.95600)	Top-1 acc 46.484 (44.874)	Top-5 acc 71.875 (68.743)	lr 0.02305
Train [22][1950/3239]	Time 0.728 (0.907)	Data Time 0.001 (0.013)	Loss 3.2873 (3.3234)	Entropy 0.94588 (0.95595)	Top-1 acc 44.922 (44.877)	Top-5 acc 69.531 (68.745)	lr 0.02305
Train [22][1960/3239]	Time 0.603 (0.907)	Data Time 0.001 (0.013)	Loss 3.1234 (3.3231)	Entropy 0.94600 (0.95590)	Top-1 acc 48.047 (44.884)	Top-5 acc 72.266 (68.750)	lr 0.02305
Train [22][1970/3239]	Time 0.630 (0.907)	Data Time 0.001 (0.013)	Loss 3.3454 (3.3229)	Entropy 0.94577 (0.95585)	Top-1 acc 44.141 (44.884)	Top-5 acc 66.797 (68.756)	lr 0.02305
Train [22][1980/3239]	Time 0.548 (0.907)	Data Time 0.001 (0.013)	Loss 3.5567 (3.3227)	Entropy 0.94556 (0.95580)	Top-1 acc 40.234 (44.890)	Top-5 acc 64.062 (68.761)	lr 0.02305
Train [22][1990/3239]	Time 0.599 (0.907)	Data Time 0.001 (0.013)	Loss 3.2656 (3.3223)	Entropy 0.94582 (0.95575)	Top-1 acc 43.750 (44.899)	Top-5 acc 71.484 (68.773)	lr 0.02305
Train [22][2000/3239]	Time 0.607 (0.906)	Data Time 0.001 (0.013)	Loss 3.2149 (3.3222)	Entropy 0.94516 (0.95570)	Top-1 acc 46.875 (44.898)	Top-5 acc 69.531 (68.771)	lr 0.02305
Train [22][2010/3239]	Time 0.625 (0.906)	Data Time 0.002 (0.013)	Loss 3.5334 (3.3222)	Entropy 0.94585 (0.95565)	Top-1 acc 41.016 (44.895)	Top-5 acc 62.500 (68.768)	lr 0.02305
Train [22][2020/3239]	Time 0.581 (0.919)	Data Time 0.003 (0.013)	Loss 3.1882 (3.3220)	Entropy 0.94587 (0.95560)	Top-1 acc 46.484 (44.898)	Top-5 acc 72.266 (68.774)	lr 0.02305
Train [22][2030/3239]	Time 0.624 (0.919)	Data Time 0.002 (0.013)	Loss 3.3472 (3.3223)	Entropy 0.94556 (0.95555)	Top-1 acc 42.188 (44.891)	Top-5 acc 67.969 (68.770)	lr 0.02305
Train [22][2040/3239]	Time 0.596 (0.919)	Data Time 0.001 (0.013)	Loss 3.3458 (3.3224)	Entropy 0.94536 (0.95550)	Top-1 acc 42.578 (44.889)	Top-5 acc 66.016 (68.766)	lr 0.02305
Train [22][2050/3239]	Time 0.580 (0.919)	Data Time 0.001 (0.013)	Loss 3.4533 (3.3224)	Entropy 0.94501 (0.95545)	Top-1 acc 44.141 (44.885)	Top-5 acc 66.797 (68.772)	lr 0.02305
Train [22][2060/3239]	Time 0.608 (0.918)	Data Time 0.001 (0.012)	Loss 3.4368 (3.3223)	Entropy 0.94490 (0.95540)	Top-1 acc 41.406 (44.884)	Top-5 acc 66.016 (68.770)	lr 0.02305
Train [22][2070/3239]	Time 0.602 (0.918)	Data Time 0.001 (0.012)	Loss 3.2622 (3.3222)	Entropy 0.94461 (0.95535)	Top-1 acc 42.188 (44.880)	Top-5 acc 67.188 (68.767)	lr 0.02305
Train [22][2080/3239]	Time 0.691 (0.918)	Data Time 0.001 (0.012)	Loss 3.1342 (3.3221)	Entropy 0.94436 (0.95530)	Top-1 acc 47.266 (44.879)	Top-5 acc 71.094 (68.768)	lr 0.02305
Train [22][2090/3239]	Time 0.596 (0.918)	Data Time 0.001 (0.012)	Loss 3.2410 (3.3225)	Entropy 0.94418 (0.95524)	Top-1 acc 45.312 (44.872)	Top-5 acc 69.922 (68.762)	lr 0.02305
Train [22][2100/3239]	Time 0.622 (0.918)	Data Time 0.001 (0.012)	Loss 3.2587 (3.3226)	Entropy 0.94459 (0.95519)	Top-1 acc 47.656 (44.874)	Top-5 acc 71.484 (68.758)	lr 0.02305
Train [22][2110/3239]	Time 0.733 (0.917)	Data Time 0.001 (0.012)	Loss 3.2719 (3.3225)	Entropy 0.94415 (0.95514)	Top-1 acc 47.656 (44.878)	Top-5 acc 68.750 (68.761)	lr 0.02305
Train [22][2120/3239]	Time 0.510 (0.917)	Data Time 0.001 (0.012)	Loss 3.1236 (3.3224)	Entropy 0.94409 (0.95509)	Top-1 acc 47.266 (44.882)	Top-5 acc 73.047 (68.762)	lr 0.02304
Train [22][2130/3239]	Time 0.646 (0.917)	Data Time 0.001 (0.012)	Loss 3.0596 (3.3221)	Entropy 0.94371 (0.95504)	Top-1 acc 50.000 (44.884)	Top-5 acc 73.047 (68.767)	lr 0.02304
Train [22][2140/3239]	Time 0.658 (0.917)	Data Time 0.001 (0.012)	Loss 3.2792 (3.3215)	Entropy 0.94363 (0.95498)	Top-1 acc 46.875 (44.898)	Top-5 acc 67.969 (68.778)	lr 0.02304
Train [22][2150/3239]	Time 0.642 (0.916)	Data Time 0.001 (0.012)	Loss 3.4650 (3.3215)	Entropy 0.94348 (0.95493)	Top-1 acc 37.109 (44.900)	Top-5 acc 63.281 (68.777)	lr 0.02304
Train [22][2160/3239]	Time 0.582 (0.916)	Data Time 0.001 (0.012)	Loss 3.3193 (3.3216)	Entropy 0.94334 (0.95488)	Top-1 acc 42.578 (44.895)	Top-5 acc 68.750 (68.775)	lr 0.02304
Train [22][2170/3239]	Time 0.639 (0.916)	Data Time 0.001 (0.012)	Loss 3.2476 (3.3217)	Entropy 0.94313 (0.95482)	Top-1 acc 46.875 (44.893)	Top-5 acc 71.094 (68.776)	lr 0.02304
Train [22][2180/3239]	Time 0.667 (0.916)	Data Time 0.001 (0.012)	Loss 3.4467 (3.3216)	Entropy 0.94279 (0.95477)	Top-1 acc 39.844 (44.895)	Top-5 acc 67.578 (68.778)	lr 0.02304
Train [22][2190/3239]	Time 0.616 (0.915)	Data Time 0.002 (0.012)	Loss 3.4289 (3.3215)	Entropy 0.94267 (0.95471)	Top-1 acc 41.016 (44.895)	Top-5 acc 66.797 (68.786)	lr 0.02304
Train [22][2200/3239]	Time 0.630 (0.915)	Data Time 0.001 (0.012)	Loss 3.4055 (3.3217)	Entropy 0.94275 (0.95466)	Top-1 acc 41.406 (44.887)	Top-5 acc 67.188 (68.780)	lr 0.02304
Train [22][2210/3239]	Time 0.598 (0.915)	Data Time 0.001 (0.012)	Loss 3.3289 (3.3217)	Entropy 0.94239 (0.95461)	Top-1 acc 44.141 (44.888)	Top-5 acc 67.969 (68.780)	lr 0.02304
Train [22][2220/3239]	Time 0.642 (0.915)	Data Time 0.002 (0.012)	Loss 3.1661 (3.3215)	Entropy 0.94251 (0.95455)	Top-1 acc 47.656 (44.887)	Top-5 acc 70.703 (68.782)	lr 0.02304
Train [22][2230/3239]	Time 0.571 (0.915)	Data Time 0.001 (0.012)	Loss 3.3899 (3.3213)	Entropy 0.94269 (0.95450)	Top-1 acc 42.969 (44.887)	Top-5 acc 69.531 (68.786)	lr 0.02304
Train [22][2240/3239]	Time 0.638 (0.915)	Data Time 0.001 (0.012)	Loss 3.3881 (3.3215)	Entropy 0.94233 (0.95444)	Top-1 acc 46.875 (44.881)	Top-5 acc 67.578 (68.782)	lr 0.02304
Train [22][2250/3239]	Time 0.589 (0.914)	Data Time 0.001 (0.012)	Loss 3.1343 (3.3214)	Entropy 0.94191 (0.95439)	Top-1 acc 46.875 (44.883)	Top-5 acc 73.828 (68.779)	lr 0.02304
Train [22][2260/3239]	Time 0.615 (0.914)	Data Time 0.001 (0.012)	Loss 3.0856 (3.3217)	Entropy 0.94181 (0.95433)	Top-1 acc 52.344 (44.883)	Top-5 acc 72.266 (68.776)	lr 0.02304
Train [22][2270/3239]	Time 0.669 (0.914)	Data Time 0.001 (0.011)	Loss 3.2775 (3.3218)	Entropy 0.94173 (0.95428)	Top-1 acc 44.922 (44.879)	Top-5 acc 69.922 (68.773)	lr 0.02304
Train [22][2280/3239]	Time 0.608 (0.914)	Data Time 0.001 (0.011)	Loss 3.3984 (3.3219)	Entropy 0.94170 (0.95422)	Top-1 acc 43.750 (44.876)	Top-5 acc 66.406 (68.767)	lr 0.02304
Train [22][2290/3239]	Time 0.564 (0.913)	Data Time 0.002 (0.011)	Loss 3.2599 (3.3219)	Entropy 0.94133 (0.95417)	Top-1 acc 44.531 (44.880)	Top-5 acc 69.922 (68.769)	lr 0.02304
Train [22][2300/3239]	Time 0.631 (0.913)	Data Time 0.002 (0.011)	Loss 3.3421 (3.3220)	Entropy 0.94123 (0.95411)	Top-1 acc 44.922 (44.876)	Top-5 acc 66.406 (68.764)	lr 0.02303
Train [22][2310/3239]	Time 0.590 (0.913)	Data Time 0.001 (0.011)	Loss 3.2401 (3.3220)	Entropy 0.94020 (0.95406)	Top-1 acc 46.875 (44.875)	Top-5 acc 69.141 (68.763)	lr 0.02303
Train [22][2320/3239]	Time 0.617 (0.913)	Data Time 0.001 (0.011)	Loss 3.1514 (3.3219)	Entropy 0.93996 (0.95400)	Top-1 acc 51.562 (44.880)	Top-5 acc 71.484 (68.762)	lr 0.02303
Train [22][2330/3239]	Time 0.598 (0.912)	Data Time 0.001 (0.011)	Loss 3.3690 (3.3217)	Entropy 0.93969 (0.95394)	Top-1 acc 44.531 (44.881)	Top-5 acc 69.141 (68.771)	lr 0.02303
Train [22][2340/3239]	Time 0.647 (0.912)	Data Time 0.001 (0.011)	Loss 3.5420 (3.3215)	Entropy 0.93985 (0.95387)	Top-1 acc 39.453 (44.889)	Top-5 acc 64.062 (68.775)	lr 0.02303
Train [22][2350/3239]	Time 0.650 (0.912)	Data Time 0.001 (0.011)	Loss 3.2061 (3.3216)	Entropy 0.93992 (0.95381)	Top-1 acc 51.953 (44.890)	Top-5 acc 71.094 (68.774)	lr 0.02303
Train [22][2360/3239]	Time 0.589 (0.912)	Data Time 0.001 (0.011)	Loss 3.0417 (3.3215)	Entropy 0.94017 (0.95376)	Top-1 acc 52.344 (44.894)	Top-5 acc 74.609 (68.776)	lr 0.02303
Train [22][2370/3239]	Time 0.586 (0.912)	Data Time 0.001 (0.011)	Loss 3.2651 (3.3214)	Entropy 0.93994 (0.95370)	Top-1 acc 48.047 (44.894)	Top-5 acc 71.094 (68.781)	lr 0.02303
Train [22][2380/3239]	Time 0.612 (0.911)	Data Time 0.001 (0.011)	Loss 3.2191 (3.3217)	Entropy 0.94004 (0.95364)	Top-1 acc 44.531 (44.883)	Top-5 acc 66.797 (68.771)	lr 0.02303
Train [22][2390/3239]	Time 0.647 (0.911)	Data Time 0.001 (0.011)	Loss 3.3624 (3.3216)	Entropy 0.93960 (0.95358)	Top-1 acc 41.016 (44.885)	Top-5 acc 70.703 (68.773)	lr 0.02303
Train [22][2400/3239]	Time 0.571 (0.911)	Data Time 0.001 (0.011)	Loss 3.1680 (3.3219)	Entropy 0.93938 (0.95352)	Top-1 acc 48.047 (44.878)	Top-5 acc 71.094 (68.762)	lr 0.02303
Train [22][2410/3239]	Time 0.617 (0.911)	Data Time 0.001 (0.011)	Loss 3.3811 (3.3218)	Entropy 0.93952 (0.95347)	Top-1 acc 43.359 (44.879)	Top-5 acc 67.578 (68.760)	lr 0.02303
Train [22][2420/3239]	Time 0.585 (0.911)	Data Time 0.001 (0.011)	Loss 3.0856 (3.3217)	Entropy 0.93879 (0.95341)	Top-1 acc 51.953 (44.881)	Top-5 acc 74.609 (68.760)	lr 0.02303
Train [22][2430/3239]	Time 0.594 (0.910)	Data Time 0.001 (0.011)	Loss 3.2538 (3.3221)	Entropy 0.93892 (0.95335)	Top-1 acc 45.703 (44.873)	Top-5 acc 71.484 (68.755)	lr 0.02303
Train [22][2440/3239]	Time 0.571 (0.910)	Data Time 0.001 (0.011)	Loss 3.4072 (3.3223)	Entropy 0.93858 (0.95329)	Top-1 acc 44.922 (44.869)	Top-5 acc 67.188 (68.752)	lr 0.02303
Train [22][2450/3239]	Time 0.626 (0.910)	Data Time 0.001 (0.011)	Loss 3.4193 (3.3222)	Entropy 0.93832 (0.95323)	Top-1 acc 45.312 (44.873)	Top-5 acc 70.312 (68.762)	lr 0.02303
Train [22][2460/3239]	Time 0.602 (0.910)	Data Time 0.002 (0.011)	Loss 3.4364 (3.3220)	Entropy 0.93842 (0.95317)	Top-1 acc 42.578 (44.879)	Top-5 acc 64.062 (68.766)	lr 0.02303
Train [22][2470/3239]	Time 0.598 (0.909)	Data Time 0.001 (0.011)	Loss 3.3901 (3.3219)	Entropy 0.93761 (0.95311)	Top-1 acc 47.656 (44.877)	Top-5 acc 66.406 (68.762)	lr 0.02303
Train [22][2480/3239]	Time 0.531 (0.909)	Data Time 0.001 (0.011)	Loss 3.0992 (3.3217)	Entropy 0.93717 (0.95304)	Top-1 acc 48.828 (44.880)	Top-5 acc 74.219 (68.764)	lr 0.02302
Train [22][2490/3239]	Time 0.593 (0.909)	Data Time 0.001 (0.011)	Loss 3.3257 (3.3218)	Entropy 0.93693 (0.95298)	Top-1 acc 45.703 (44.878)	Top-5 acc 68.750 (68.763)	lr 0.02302
Train [22][2500/3239]	Time 0.725 (0.909)	Data Time 0.002 (0.011)	Loss 3.0831 (3.3217)	Entropy 0.93661 (0.95291)	Top-1 acc 49.219 (44.880)	Top-5 acc 71.875 (68.765)	lr 0.02302
Train [22][2510/3239]	Time 0.624 (0.909)	Data Time 0.001 (0.011)	Loss 3.2255 (3.3219)	Entropy 0.93692 (0.95285)	Top-1 acc 51.172 (44.874)	Top-5 acc 71.484 (68.761)	lr 0.02302
Train [22][2520/3239]	Time 0.560 (0.908)	Data Time 0.001 (0.011)	Loss 3.2584 (3.3217)	Entropy 0.93662 (0.95279)	Top-1 acc 43.359 (44.877)	Top-5 acc 69.141 (68.768)	lr 0.02302
Train [22][2530/3239]	Time 0.603 (0.908)	Data Time 0.002 (0.011)	Loss 3.4039 (3.3217)	Entropy 0.93675 (0.95272)	Top-1 acc 46.094 (44.875)	Top-5 acc 67.969 (68.767)	lr 0.02302
Train [22][2540/3239]	Time 0.582 (0.908)	Data Time 0.001 (0.010)	Loss 3.2234 (3.3217)	Entropy 0.93684 (0.95266)	Top-1 acc 46.875 (44.878)	Top-5 acc 70.703 (68.768)	lr 0.02302
Train [22][2550/3239]	Time 0.632 (0.908)	Data Time 0.001 (0.010)	Loss 3.4282 (3.3218)	Entropy 0.93684 (0.95260)	Top-1 acc 43.359 (44.879)	Top-5 acc 67.969 (68.761)	lr 0.02302
Train [22][2560/3239]	Time 0.588 (0.908)	Data Time 0.001 (0.010)	Loss 3.2452 (3.3219)	Entropy 0.93661 (0.95254)	Top-1 acc 46.094 (44.876)	Top-5 acc 70.312 (68.762)	lr 0.02302
Train [22][2570/3239]	Time 0.683 (0.908)	Data Time 0.001 (0.010)	Loss 3.3722 (3.3220)	Entropy 0.93645 (0.95247)	Top-1 acc 41.406 (44.879)	Top-5 acc 71.094 (68.765)	lr 0.02302
Train [22][2580/3239]	Time 0.608 (0.907)	Data Time 0.001 (0.010)	Loss 3.5121 (3.3222)	Entropy 0.93639 (0.95241)	Top-1 acc 40.234 (44.869)	Top-5 acc 65.625 (68.761)	lr 0.02302
Train [22][2590/3239]	Time 0.632 (0.907)	Data Time 0.001 (0.010)	Loss 3.5198 (3.3222)	Entropy 0.93623 (0.95235)	Top-1 acc 43.750 (44.869)	Top-5 acc 66.797 (68.761)	lr 0.02302
Train [22][2600/3239]	Time 0.589 (0.907)	Data Time 0.001 (0.010)	Loss 3.0698 (3.3221)	Entropy 0.93593 (0.95229)	Top-1 acc 48.438 (44.867)	Top-5 acc 76.172 (68.761)	lr 0.02302
Train [22][2610/3239]	Time 0.624 (0.907)	Data Time 0.001 (0.010)	Loss 3.3878 (3.3221)	Entropy 0.93602 (0.95222)	Top-1 acc 44.141 (44.874)	Top-5 acc 69.141 (68.760)	lr 0.02302
Train [22][2620/3239]	Time 0.599 (0.907)	Data Time 0.001 (0.010)	Loss 3.4291 (3.3222)	Entropy 0.93614 (0.95216)	Top-1 acc 42.188 (44.870)	Top-5 acc 64.844 (68.759)	lr 0.02302
Train [22][2630/3239]	Time 0.614 (0.907)	Data Time 0.001 (0.010)	Loss 3.2373 (3.3222)	Entropy 0.93604 (0.95210)	Top-1 acc 52.344 (44.872)	Top-5 acc 69.141 (68.761)	lr 0.02302
Train [22][2640/3239]	Time 0.556 (0.906)	Data Time 0.001 (0.010)	Loss 3.3815 (3.3222)	Entropy 0.93623 (0.95204)	Top-1 acc 39.844 (44.871)	Top-5 acc 65.625 (68.758)	lr 0.02302
Train [22][2650/3239]	Time 0.633 (0.906)	Data Time 0.001 (0.010)	Loss 3.3004 (3.3221)	Entropy 0.93643 (0.95198)	Top-1 acc 45.703 (44.876)	Top-5 acc 71.875 (68.761)	lr 0.02302
Train [22][2660/3239]	Time 0.726 (0.906)	Data Time 0.001 (0.010)	Loss 3.2290 (3.3220)	Entropy 0.93620 (0.95192)	Top-1 acc 48.047 (44.879)	Top-5 acc 69.531 (68.762)	lr 0.02302
Train [22][2670/3239]	Time 0.721 (0.915)	Data Time 0.005 (0.010)	Loss 3.3768 (3.3219)	Entropy 0.93606 (0.95186)	Top-1 acc 44.531 (44.878)	Top-5 acc 66.797 (68.763)	lr 0.02301
Train [22][2680/3239]	Time 0.616 (0.915)	Data Time 0.002 (0.010)	Loss 3.3383 (3.3220)	Entropy 0.93580 (0.95180)	Top-1 acc 42.578 (44.875)	Top-5 acc 68.359 (68.759)	lr 0.02301
Train [22][2690/3239]	Time 0.586 (0.915)	Data Time 0.002 (0.010)	Loss 3.4681 (3.3220)	Entropy 0.93563 (0.95174)	Top-1 acc 45.312 (44.872)	Top-5 acc 67.578 (68.761)	lr 0.02301
Train [22][2700/3239]	Time 0.598 (0.914)	Data Time 0.001 (0.010)	Loss 3.0999 (3.3218)	Entropy 0.93560 (0.95168)	Top-1 acc 53.125 (44.877)	Top-5 acc 73.828 (68.767)	lr 0.02301
Train [22][2710/3239]	Time 0.585 (0.914)	Data Time 0.001 (0.010)	Loss 3.3368 (3.3216)	Entropy 0.93527 (0.95162)	Top-1 acc 47.656 (44.881)	Top-5 acc 70.312 (68.769)	lr 0.02301
Train [22][2720/3239]	Time 0.612 (0.914)	Data Time 0.001 (0.010)	Loss 3.2149 (3.3218)	Entropy 0.93517 (0.95156)	Top-1 acc 51.953 (44.876)	Top-5 acc 71.094 (68.768)	lr 0.02301
Train [22][2730/3239]	Time 0.686 (0.914)	Data Time 0.001 (0.010)	Loss 3.1023 (3.3218)	Entropy 0.93505 (0.95150)	Top-1 acc 44.922 (44.871)	Top-5 acc 72.266 (68.766)	lr 0.02301
Train [22][2740/3239]	Time 0.556 (0.914)	Data Time 0.001 (0.010)	Loss 3.1518 (3.3218)	Entropy 0.93521 (0.95144)	Top-1 acc 49.609 (44.873)	Top-5 acc 73.828 (68.766)	lr 0.02301
Train [22][2750/3239]	Time 0.633 (0.914)	Data Time 0.001 (0.010)	Loss 3.6155 (3.3219)	Entropy 0.93473 (0.95138)	Top-1 acc 39.453 (44.865)	Top-5 acc 60.156 (68.762)	lr 0.02301
Train [22][2760/3239]	Time 0.576 (0.913)	Data Time 0.001 (0.010)	Loss 3.3265 (3.3218)	Entropy 0.93484 (0.95132)	Top-1 acc 41.797 (44.863)	Top-5 acc 66.797 (68.763)	lr 0.02301
Train [22][2770/3239]	Time 0.580 (0.913)	Data Time 0.001 (0.010)	Loss 3.3776 (3.3219)	Entropy 0.93450 (0.95126)	Top-1 acc 42.969 (44.861)	Top-5 acc 67.578 (68.761)	lr 0.02301
Train [22][2780/3239]	Time 0.606 (0.913)	Data Time 0.001 (0.010)	Loss 3.4257 (3.3216)	Entropy 0.93423 (0.95120)	Top-1 acc 42.188 (44.869)	Top-5 acc 68.750 (68.770)	lr 0.02301
Train [22][2790/3239]	Time 0.592 (0.913)	Data Time 0.001 (0.010)	Loss 3.0826 (3.3213)	Entropy 0.93384 (0.95114)	Top-1 acc 53.906 (44.876)	Top-5 acc 75.781 (68.776)	lr 0.02301
Train [22][2800/3239]	Time 0.621 (0.912)	Data Time 0.001 (0.010)	Loss 3.1639 (3.3212)	Entropy 0.93328 (0.95108)	Top-1 acc 50.781 (44.879)	Top-5 acc 71.094 (68.780)	lr 0.02301
Train [22][2810/3239]	Time 0.605 (0.912)	Data Time 0.001 (0.010)	Loss 3.5584 (3.3216)	Entropy 0.93291 (0.95102)	Top-1 acc 41.016 (44.872)	Top-5 acc 61.328 (68.773)	lr 0.02301
Train [22][2820/3239]	Time 0.702 (0.912)	Data Time 0.001 (0.010)	Loss 3.3833 (3.3217)	Entropy 0.93262 (0.95095)	Top-1 acc 42.188 (44.872)	Top-5 acc 66.406 (68.770)	lr 0.02301
Train [22][2830/3239]	Time 0.623 (0.912)	Data Time 0.001 (0.010)	Loss 3.3604 (3.3219)	Entropy 0.93226 (0.95089)	Top-1 acc 44.531 (44.869)	Top-5 acc 67.188 (68.769)	lr 0.02301
Train [22][2840/3239]	Time 0.635 (0.912)	Data Time 0.002 (0.010)	Loss 3.2250 (3.3217)	Entropy 0.93180 (0.95082)	Top-1 acc 48.047 (44.877)	Top-5 acc 71.875 (68.773)	lr 0.02301
Train [22][2850/3239]	Time 0.595 (0.912)	Data Time 0.001 (0.010)	Loss 3.5564 (3.3218)	Entropy 0.93138 (0.95075)	Top-1 acc 39.844 (44.875)	Top-5 acc 65.625 (68.771)	lr 0.02300
Train [22][2860/3239]	Time 0.573 (0.911)	Data Time 0.001 (0.010)	Loss 3.2964 (3.3219)	Entropy 0.93131 (0.95068)	Top-1 acc 41.797 (44.872)	Top-5 acc 69.141 (68.768)	lr 0.02300
Train [22][2870/3239]	Time 0.618 (0.911)	Data Time 0.001 (0.010)	Loss 3.1648 (3.3218)	Entropy 0.93148 (0.95062)	Top-1 acc 47.266 (44.872)	Top-5 acc 71.094 (68.771)	lr 0.02300
Train [22][2880/3239]	Time 0.617 (0.911)	Data Time 0.001 (0.010)	Loss 3.5582 (3.3221)	Entropy 0.93128 (0.95055)	Top-1 acc 42.969 (44.868)	Top-5 acc 62.891 (68.765)	lr 0.02300
Train [22][2890/3239]	Time 0.687 (0.911)	Data Time 0.001 (0.009)	Loss 3.3210 (3.3221)	Entropy 0.93098 (0.95048)	Top-1 acc 42.188 (44.868)	Top-5 acc 69.141 (68.762)	lr 0.02300
Train [22][2900/3239]	Time 0.588 (0.911)	Data Time 0.001 (0.009)	Loss 3.2000 (3.3217)	Entropy 0.93102 (0.95042)	Top-1 acc 47.266 (44.877)	Top-5 acc 68.359 (68.766)	lr 0.02300
Train [22][2910/3239]	Time 0.634 (0.911)	Data Time 0.001 (0.009)	Loss 3.4756 (3.3218)	Entropy 0.93092 (0.95035)	Top-1 acc 45.312 (44.876)	Top-5 acc 66.406 (68.765)	lr 0.02300
Train [22][2920/3239]	Time 0.588 (0.911)	Data Time 0.001 (0.009)	Loss 3.3483 (3.3216)	Entropy 0.93099 (0.95028)	Top-1 acc 46.484 (44.879)	Top-5 acc 68.750 (68.765)	lr 0.02300
Train [22][2930/3239]	Time 0.602 (0.910)	Data Time 0.002 (0.009)	Loss 3.4041 (3.3216)	Entropy 0.93094 (0.95022)	Top-1 acc 44.531 (44.880)	Top-5 acc 66.797 (68.761)	lr 0.02300
Train [22][2940/3239]	Time 0.610 (0.910)	Data Time 0.001 (0.009)	Loss 3.2636 (3.3214)	Entropy 0.93070 (0.95015)	Top-1 acc 45.703 (44.884)	Top-5 acc 66.797 (68.762)	lr 0.02300
Train [22][2950/3239]	Time 0.486 (0.910)	Data Time 0.001 (0.009)	Loss 3.1934 (3.3214)	Entropy 0.93027 (0.95009)	Top-1 acc 49.219 (44.884)	Top-5 acc 70.312 (68.765)	lr 0.02300
Train [22][2960/3239]	Time 0.624 (0.910)	Data Time 0.001 (0.009)	Loss 3.2676 (3.3213)	Entropy 0.93019 (0.95002)	Top-1 acc 46.094 (44.886)	Top-5 acc 68.750 (68.767)	lr 0.02300
Train [22][2970/3239]	Time 0.622 (0.910)	Data Time 0.001 (0.009)	Loss 3.3778 (3.3211)	Entropy 0.93014 (0.94995)	Top-1 acc 41.406 (44.891)	Top-5 acc 68.359 (68.771)	lr 0.02300
Train [22][2980/3239]	Time 0.643 (0.910)	Data Time 0.001 (0.009)	Loss 3.4617 (3.3209)	Entropy 0.92966 (0.94988)	Top-1 acc 39.453 (44.898)	Top-5 acc 64.453 (68.775)	lr 0.02300
Train [22][2990/3239]	Time 0.613 (0.909)	Data Time 0.002 (0.009)	Loss 3.1226 (3.3207)	Entropy 0.92927 (0.94982)	Top-1 acc 47.266 (44.905)	Top-5 acc 69.922 (68.780)	lr 0.02300
Train [22][3000/3239]	Time 0.565 (0.909)	Data Time 0.001 (0.009)	Loss 3.4530 (3.3209)	Entropy 0.92909 (0.94975)	Top-1 acc 41.016 (44.899)	Top-5 acc 65.234 (68.779)	lr 0.02300
Train [22][3010/3239]	Time 0.616 (0.909)	Data Time 0.001 (0.009)	Loss 3.3591 (3.3209)	Entropy 0.92919 (0.94968)	Top-1 acc 42.578 (44.897)	Top-5 acc 67.578 (68.777)	lr 0.02300
Train [22][3020/3239]	Time 0.624 (0.909)	Data Time 0.001 (0.009)	Loss 3.3378 (3.3207)	Entropy 0.92914 (0.94961)	Top-1 acc 41.797 (44.901)	Top-5 acc 65.625 (68.781)	lr 0.02300
Train [22][3030/3239]	Time 0.621 (0.909)	Data Time 0.001 (0.009)	Loss 3.5668 (3.3207)	Entropy 0.92919 (0.94954)	Top-1 acc 39.062 (44.900)	Top-5 acc 64.062 (68.782)	lr 0.02299
Train [22][3040/3239]	Time 0.568 (0.909)	Data Time 0.001 (0.009)	Loss 3.4639 (3.3208)	Entropy 0.92901 (0.94948)	Top-1 acc 39.844 (44.895)	Top-5 acc 63.281 (68.779)	lr 0.02299
Train [22][3050/3239]	Time 0.722 (0.909)	Data Time 0.002 (0.009)	Loss 3.3764 (3.3206)	Entropy 0.92886 (0.94941)	Top-1 acc 44.531 (44.897)	Top-5 acc 64.844 (68.784)	lr 0.02299
Train [22][3060/3239]	Time 0.612 (0.908)	Data Time 0.001 (0.009)	Loss 3.5450 (3.3206)	Entropy 0.92879 (0.94934)	Top-1 acc 37.109 (44.896)	Top-5 acc 61.719 (68.781)	lr 0.02299
Train [22][3070/3239]	Time 0.618 (0.908)	Data Time 0.002 (0.009)	Loss 3.2826 (3.3205)	Entropy 0.92886 (0.94928)	Top-1 acc 44.531 (44.901)	Top-5 acc 69.141 (68.785)	lr 0.02299
Train [22][3080/3239]	Time 0.614 (0.908)	Data Time 0.002 (0.009)	Loss 3.1979 (3.3204)	Entropy 0.92839 (0.94921)	Top-1 acc 45.703 (44.900)	Top-5 acc 72.656 (68.787)	lr 0.02299
Train [22][3090/3239]	Time 0.622 (0.908)	Data Time 0.001 (0.009)	Loss 3.2982 (3.3203)	Entropy 0.92801 (0.94914)	Top-1 acc 43.359 (44.899)	Top-5 acc 68.359 (68.789)	lr 0.02299
Train [22][3100/3239]	Time 0.595 (0.908)	Data Time 0.002 (0.009)	Loss 3.3350 (3.3203)	Entropy 0.92745 (0.94907)	Top-1 acc 41.016 (44.897)	Top-5 acc 69.141 (68.790)	lr 0.02299
Train [22][3110/3239]	Time 0.578 (0.908)	Data Time 0.001 (0.009)	Loss 3.4407 (3.3202)	Entropy 0.92747 (0.94900)	Top-1 acc 39.062 (44.895)	Top-5 acc 66.797 (68.791)	lr 0.02299
Train [22][3120/3239]	Time 0.652 (0.907)	Data Time 0.001 (0.009)	Loss 3.7526 (3.3204)	Entropy 0.92748 (0.94893)	Top-1 acc 33.984 (44.889)	Top-5 acc 60.156 (68.788)	lr 0.02299
Train [22][3130/3239]	Time 0.582 (0.907)	Data Time 0.001 (0.009)	Loss 3.1121 (3.3203)	Entropy 0.92753 (0.94886)	Top-1 acc 50.781 (44.889)	Top-5 acc 74.609 (68.789)	lr 0.02299
Train [22][3140/3239]	Time 0.621 (0.907)	Data Time 0.001 (0.009)	Loss 3.3181 (3.3205)	Entropy 0.92757 (0.94880)	Top-1 acc 45.703 (44.888)	Top-5 acc 66.797 (68.784)	lr 0.02299
Train [22][3150/3239]	Time 0.640 (0.907)	Data Time 0.001 (0.009)	Loss 3.1991 (3.3205)	Entropy 0.92777 (0.94873)	Top-1 acc 46.875 (44.888)	Top-5 acc 72.266 (68.787)	lr 0.02299
Train [22][3160/3239]	Time 0.577 (0.907)	Data Time 0.001 (0.009)	Loss 3.3336 (3.3205)	Entropy 0.92761 (0.94866)	Top-1 acc 44.922 (44.890)	Top-5 acc 68.359 (68.788)	lr 0.02299
Train [22][3170/3239]	Time 0.551 (0.907)	Data Time 0.001 (0.009)	Loss 3.3224 (3.3205)	Entropy 0.92713 (0.94860)	Top-1 acc 41.797 (44.890)	Top-5 acc 67.969 (68.787)	lr 0.02299
Train [22][3180/3239]	Time 0.621 (0.907)	Data Time 0.000 (0.009)	Loss 3.2782 (3.3206)	Entropy 0.92726 (0.94853)	Top-1 acc 48.047 (44.890)	Top-5 acc 70.312 (68.784)	lr 0.02299
Train [22][3190/3239]	Time 0.586 (0.906)	Data Time 0.000 (0.009)	Loss 3.2128 (3.3205)	Entropy 0.92747 (0.94846)	Top-1 acc 51.172 (44.896)	Top-5 acc 72.656 (68.783)	lr 0.02299
Train [22][3200/3239]	Time 0.592 (0.906)	Data Time 0.000 (0.009)	Loss 3.4691 (3.3205)	Entropy 0.92704 (0.94840)	Top-1 acc 40.234 (44.893)	Top-5 acc 65.234 (68.781)	lr 0.02299
Train [22][3210/3239]	Time 0.738 (0.906)	Data Time 0.000 (0.009)	Loss 3.5377 (3.3204)	Entropy 0.92655 (0.94833)	Top-1 acc 44.141 (44.898)	Top-5 acc 66.406 (68.784)	lr 0.02299
Train [22][3220/3239]	Time 0.596 (0.906)	Data Time 0.000 (0.009)	Loss 3.1039 (3.3204)	Entropy 0.92609 (0.94826)	Top-1 acc 53.516 (44.898)	Top-5 acc 73.047 (68.784)	lr 0.02298
Train [22][3230/3239]	Time 0.564 (0.906)	Data Time 0.000 (0.009)	Loss 3.2576 (3.3204)	Entropy 0.92630 (0.94819)	Top-1 acc 44.531 (44.900)	Top-5 acc 70.703 (68.785)	lr 0.02298
Train [22][3239/3239]	Time 1.602 (0.906)	Data Time 0.000 (0.009)	Loss 3.4580 (3.3205)	Entropy 0.92622 (0.94813)	Top-1 acc 40.741 (44.898)	Top-5 acc 64.198 (68.781)	lr 0.02298
==========Valid [22/120]	loss 2.048	top-1 acc 54.487 (54.487)	top-5 acc 78.142	Train top-1 44.898	top-5 68.781	Entropy 0.92622	Latency-None: 0.000ms	Flops: 539.76M
Train [23][0/3239]	Time 28.743 (28.743)	Data Time 25.064 (25.064)	Loss 3.3885 (3.3885)	Entropy 0.92622 (0.92622)	Top-1 acc 44.531 (44.531)	Top-5 acc 68.359 (68.359)	lr 0.02298
Train [23][10/3239]	Time 0.583 (3.498)	Data Time 0.001 (2.348)	Loss 3.3386 (3.3030)	Entropy 0.92564 (0.92604)	Top-1 acc 45.312 (46.307)	Top-5 acc 67.188 (69.070)	lr 0.02298
Train [23][20/3239]	Time 0.616 (2.251)	Data Time 0.001 (1.231)	Loss 3.4975 (3.2897)	Entropy 0.92557 (0.92588)	Top-1 acc 39.062 (46.298)	Top-5 acc 66.016 (69.196)	lr 0.02298
Train [23][30/3239]	Time 0.597 (1.804)	Data Time 0.001 (0.835)	Loss 3.1701 (3.3035)	Entropy 0.92550 (0.92575)	Top-1 acc 51.172 (45.640)	Top-5 acc 72.656 (68.939)	lr 0.02298
Train [23][40/3239]	Time 0.616 (1.572)	Data Time 0.001 (0.631)	Loss 3.3111 (3.3144)	Entropy 0.92554 (0.92569)	Top-1 acc 45.703 (45.417)	Top-5 acc 68.359 (68.788)	lr 0.02298
Train [23][50/3239]	Time 0.584 (1.434)	Data Time 0.001 (0.508)	Loss 3.3152 (3.3095)	Entropy 0.92577 (0.92569)	Top-1 acc 46.094 (45.404)	Top-5 acc 68.750 (68.827)	lr 0.02298
Train [23][60/3239]	Time 0.669 (1.336)	Data Time 0.001 (0.425)	Loss 3.3527 (3.3091)	Entropy 0.92558 (0.92568)	Top-1 acc 42.969 (45.274)	Top-5 acc 66.016 (68.929)	lr 0.02298
Train [23][70/3239]	Time 0.578 (1.274)	Data Time 0.001 (0.365)	Loss 3.1883 (3.3003)	Entropy 0.92581 (0.92568)	Top-1 acc 50.391 (45.648)	Top-5 acc 69.922 (69.086)	lr 0.02298
Train [23][80/3239]	Time 0.593 (1.223)	Data Time 0.001 (0.321)	Loss 3.4395 (3.3027)	Entropy 0.92631 (0.92571)	Top-1 acc 45.312 (45.496)	Top-5 acc 66.016 (69.141)	lr 0.02298
Train [23][90/3239]	Time 0.572 (1.501)	Data Time 0.002 (0.286)	Loss 3.3451 (3.2948)	Entropy 0.92565 (0.92575)	Top-1 acc 44.141 (45.622)	Top-5 acc 67.188 (69.222)	lr 0.02298
Train [23][100/3239]	Time 0.607 (1.439)	Data Time 0.002 (0.258)	Loss 3.1763 (3.2962)	Entropy 0.92537 (0.92571)	Top-1 acc 48.438 (45.599)	Top-5 acc 71.484 (69.137)	lr 0.02298
Train [23][110/3239]	Time 0.680 (1.388)	Data Time 0.001 (0.235)	Loss 3.3638 (3.2983)	Entropy 0.92531 (0.92568)	Top-1 acc 47.656 (45.605)	Top-5 acc 65.234 (69.014)	lr 0.02298
Train [23][120/3239]	Time 0.602 (1.345)	Data Time 0.001 (0.215)	Loss 3.2144 (3.2965)	Entropy 0.92506 (0.92564)	Top-1 acc 44.922 (45.574)	Top-5 acc 71.484 (69.021)	lr 0.02298
Train [23][130/3239]	Time 0.605 (1.307)	Data Time 0.001 (0.199)	Loss 3.4182 (3.2948)	Entropy 0.92533 (0.92559)	Top-1 acc 42.969 (45.599)	Top-5 acc 69.531 (69.099)	lr 0.02298
Train [23][140/3239]	Time 0.595 (1.277)	Data Time 0.001 (0.185)	Loss 3.3031 (3.2938)	Entropy 0.92512 (0.92557)	Top-1 acc 44.141 (45.518)	Top-5 acc 68.750 (69.188)	lr 0.02298
Train [23][150/3239]	Time 0.661 (1.250)	Data Time 0.001 (0.173)	Loss 3.3832 (3.2945)	Entropy 0.92501 (0.92554)	Top-1 acc 42.188 (45.470)	Top-5 acc 67.578 (69.200)	lr 0.02298
Train [23][160/3239]	Time 0.589 (1.226)	Data Time 0.002 (0.162)	Loss 3.2293 (3.2931)	Entropy 0.92520 (0.92551)	Top-1 acc 48.438 (45.490)	Top-5 acc 72.656 (69.267)	lr 0.02297
Train [23][170/3239]	Time 0.470 (1.203)	Data Time 0.001 (0.153)	Loss 3.4461 (3.2924)	Entropy 0.92506 (0.92548)	Top-1 acc 44.531 (45.514)	Top-5 acc 67.188 (69.301)	lr 0.02297
Train [23][180/3239]	Time 0.601 (1.184)	Data Time 0.001 (0.145)	Loss 3.1408 (3.2907)	Entropy 0.92480 (0.92545)	Top-1 acc 51.562 (45.608)	Top-5 acc 72.656 (69.341)	lr 0.02297
Train [23][190/3239]	Time 0.592 (1.167)	Data Time 0.001 (0.137)	Loss 3.2800 (3.2911)	Entropy 0.92429 (0.92540)	Top-1 acc 47.266 (45.672)	Top-5 acc 69.141 (69.343)	lr 0.02297
Train [23][200/3239]	Time 0.615 (1.152)	Data Time 0.003 (0.131)	Loss 3.4592 (3.2923)	Entropy 0.92414 (0.92534)	Top-1 acc 40.625 (45.610)	Top-5 acc 67.188 (69.327)	lr 0.02297
Train [23][210/3239]	Time 0.614 (1.138)	Data Time 0.002 (0.125)	Loss 3.2827 (3.2920)	Entropy 0.92412 (0.92529)	Top-1 acc 45.703 (45.586)	Top-5 acc 70.312 (69.346)	lr 0.02297
Train [23][220/3239]	Time 0.602 (1.125)	Data Time 0.001 (0.119)	Loss 3.4498 (3.2910)	Entropy 0.92383 (0.92522)	Top-1 acc 43.750 (45.590)	Top-5 acc 67.188 (69.381)	lr 0.02297
Train [23][230/3239]	Time 0.612 (1.114)	Data Time 0.001 (0.114)	Loss 3.2049 (3.2898)	Entropy 0.92336 (0.92516)	Top-1 acc 47.656 (45.649)	Top-5 acc 71.094 (69.416)	lr 0.02297
Train [23][240/3239]	Time 0.643 (1.104)	Data Time 0.001 (0.109)	Loss 3.4284 (3.2908)	Entropy 0.92342 (0.92509)	Top-1 acc 41.797 (45.629)	Top-5 acc 65.625 (69.405)	lr 0.02297
Train [23][250/3239]	Time 0.608 (1.095)	Data Time 0.001 (0.105)	Loss 3.2982 (3.2898)	Entropy 0.92324 (0.92502)	Top-1 acc 43.359 (45.656)	Top-5 acc 71.875 (69.441)	lr 0.02297
Train [23][260/3239]	Time 0.604 (1.087)	Data Time 0.001 (0.101)	Loss 3.2299 (3.2904)	Entropy 0.92334 (0.92495)	Top-1 acc 46.094 (45.639)	Top-5 acc 68.359 (69.415)	lr 0.02297
Train [23][270/3239]	Time 0.728 (1.079)	Data Time 0.001 (0.097)	Loss 3.4123 (3.2905)	Entropy 0.92300 (0.92489)	Top-1 acc 44.922 (45.658)	Top-5 acc 66.016 (69.406)	lr 0.02297
Train [23][280/3239]	Time 0.615 (1.071)	Data Time 0.001 (0.094)	Loss 3.3272 (3.2897)	Entropy 0.92292 (0.92482)	Top-1 acc 44.531 (45.681)	Top-5 acc 72.266 (69.437)	lr 0.02297
Train [23][290/3239]	Time 0.598 (1.065)	Data Time 0.002 (0.091)	Loss 3.4115 (3.2907)	Entropy 0.92292 (0.92475)	Top-1 acc 44.141 (45.627)	Top-5 acc 68.750 (69.455)	lr 0.02297
Train [23][300/3239]	Time 0.620 (1.059)	Data Time 0.001 (0.088)	Loss 3.5088 (3.2919)	Entropy 0.92274 (0.92469)	Top-1 acc 39.844 (45.581)	Top-5 acc 64.844 (69.407)	lr 0.02297
Train [23][310/3239]	Time 0.653 (1.053)	Data Time 0.001 (0.085)	Loss 3.2810 (3.2914)	Entropy 0.92298 (0.92463)	Top-1 acc 46.875 (45.603)	Top-5 acc 71.094 (69.399)	lr 0.02297
Train [23][320/3239]	Time 0.624 (1.047)	Data Time 0.001 (0.083)	Loss 3.1945 (3.2931)	Entropy 0.92302 (0.92458)	Top-1 acc 47.656 (45.570)	Top-5 acc 72.266 (69.393)	lr 0.02297
Train [23][330/3239]	Time 0.601 (1.041)	Data Time 0.001 (0.080)	Loss 3.2658 (3.2939)	Entropy 0.92308 (0.92453)	Top-1 acc 43.359 (45.547)	Top-5 acc 69.922 (69.370)	lr 0.02297
Train [23][340/3239]	Time 0.722 (1.036)	Data Time 0.002 (0.078)	Loss 3.3410 (3.2937)	Entropy 0.92332 (0.92449)	Top-1 acc 43.750 (45.527)	Top-5 acc 66.406 (69.345)	lr 0.02296
Train [23][350/3239]	Time 0.608 (1.030)	Data Time 0.001 (0.076)	Loss 3.1253 (3.2933)	Entropy 0.92309 (0.92445)	Top-1 acc 51.562 (45.540)	Top-5 acc 73.828 (69.365)	lr 0.02296
Train [23][360/3239]	Time 0.619 (1.026)	Data Time 0.002 (0.074)	Loss 3.1815 (3.2912)	Entropy 0.92278 (0.92441)	Top-1 acc 44.922 (45.578)	Top-5 acc 72.266 (69.398)	lr 0.02296
Train [23][370/3239]	Time 0.614 (1.021)	Data Time 0.001 (0.072)	Loss 3.2531 (3.2918)	Entropy 0.92278 (0.92437)	Top-1 acc 44.141 (45.576)	Top-5 acc 68.359 (69.381)	lr 0.02296
Train [23][380/3239]	Time 0.607 (1.017)	Data Time 0.001 (0.070)	Loss 3.3676 (3.2917)	Entropy 0.92277 (0.92432)	Top-1 acc 41.797 (45.593)	Top-5 acc 67.578 (69.382)	lr 0.02296
Train [23][390/3239]	Time 0.628 (1.013)	Data Time 0.001 (0.068)	Loss 3.3072 (3.2924)	Entropy 0.92278 (0.92428)	Top-1 acc 46.875 (45.587)	Top-5 acc 68.750 (69.372)	lr 0.02296
Train [23][400/3239]	Time 0.514 (1.009)	Data Time 0.001 (0.067)	Loss 3.3289 (3.2921)	Entropy 0.92249 (0.92424)	Top-1 acc 41.797 (45.573)	Top-5 acc 66.797 (69.386)	lr 0.02296
Train [23][410/3239]	Time 0.579 (1.006)	Data Time 0.001 (0.065)	Loss 3.3016 (3.2911)	Entropy 0.92229 (0.92420)	Top-1 acc 48.828 (45.606)	Top-5 acc 69.141 (69.392)	lr 0.02296
Train [23][420/3239]	Time 0.632 (1.002)	Data Time 0.001 (0.063)	Loss 3.1158 (3.2919)	Entropy 0.92181 (0.92416)	Top-1 acc 48.047 (45.584)	Top-5 acc 75.781 (69.391)	lr 0.02296
Train [23][430/3239]	Time 0.695 (0.999)	Data Time 0.002 (0.062)	Loss 3.1528 (3.2903)	Entropy 0.92162 (0.92410)	Top-1 acc 53.906 (45.622)	Top-5 acc 71.875 (69.432)	lr 0.02296
Train [23][440/3239]	Time 0.606 (0.996)	Data Time 0.001 (0.061)	Loss 3.1356 (3.2896)	Entropy 0.92138 (0.92404)	Top-1 acc 51.172 (45.630)	Top-5 acc 71.094 (69.452)	lr 0.02296
Train [23][450/3239]	Time 0.652 (0.994)	Data Time 0.001 (0.059)	Loss 3.2729 (3.2901)	Entropy 0.92161 (0.92398)	Top-1 acc 47.656 (45.593)	Top-5 acc 71.484 (69.431)	lr 0.02296
Train [23][460/3239]	Time 0.598 (0.991)	Data Time 0.001 (0.058)	Loss 3.1171 (3.2898)	Entropy 0.92168 (0.92393)	Top-1 acc 53.906 (45.623)	Top-5 acc 73.047 (69.448)	lr 0.02296
Train [23][470/3239]	Time 0.597 (0.988)	Data Time 0.002 (0.057)	Loss 3.1924 (3.2875)	Entropy 0.92150 (0.92388)	Top-1 acc 47.266 (45.663)	Top-5 acc 73.438 (69.496)	lr 0.02296
Train [23][480/3239]	Time 0.626 (0.986)	Data Time 0.001 (0.056)	Loss 3.2203 (3.2871)	Entropy 0.92125 (0.92383)	Top-1 acc 47.266 (45.661)	Top-5 acc 69.922 (69.483)	lr 0.02296
Train [23][490/3239]	Time 0.619 (0.983)	Data Time 0.001 (0.055)	Loss 3.2589 (3.2875)	Entropy 0.92079 (0.92377)	Top-1 acc 45.703 (45.651)	Top-5 acc 68.750 (69.498)	lr 0.02296
Train [23][500/3239]	Time 0.689 (0.981)	Data Time 0.001 (0.054)	Loss 3.2475 (3.2877)	Entropy 0.92086 (0.92371)	Top-1 acc 44.531 (45.654)	Top-5 acc 70.703 (69.496)	lr 0.02296
Train [23][510/3239]	Time 0.624 (0.977)	Data Time 0.001 (0.053)	Loss 3.2476 (3.2881)	Entropy 0.92078 (0.92365)	Top-1 acc 46.875 (45.638)	Top-5 acc 69.531 (69.484)	lr 0.02296
Train [23][520/3239]	Time 0.635 (0.975)	Data Time 0.001 (0.052)	Loss 3.2704 (3.2876)	Entropy 0.92056 (0.92360)	Top-1 acc 49.609 (45.663)	Top-5 acc 68.750 (69.489)	lr 0.02295
Train [23][530/3239]	Time 0.628 (0.973)	Data Time 0.002 (0.051)	Loss 3.1492 (3.2894)	Entropy 0.92010 (0.92354)	Top-1 acc 48.047 (45.633)	Top-5 acc 72.656 (69.453)	lr 0.02295
Train [23][540/3239]	Time 0.615 (0.971)	Data Time 0.002 (0.050)	Loss 3.5477 (3.2903)	Entropy 0.91997 (0.92347)	Top-1 acc 38.281 (45.603)	Top-5 acc 66.406 (69.443)	lr 0.02295
Train [23][550/3239]	Time 0.611 (0.969)	Data Time 0.001 (0.049)	Loss 3.2572 (3.2899)	Entropy 0.91960 (0.92341)	Top-1 acc 48.828 (45.619)	Top-5 acc 71.484 (69.438)	lr 0.02295
Train [23][560/3239]	Time 0.593 (0.967)	Data Time 0.001 (0.048)	Loss 3.2713 (3.2892)	Entropy 0.91908 (0.92333)	Top-1 acc 45.703 (45.638)	Top-5 acc 68.750 (69.443)	lr 0.02295
Train [23][570/3239]	Time 0.565 (0.965)	Data Time 0.001 (0.047)	Loss 3.6737 (3.2909)	Entropy 0.91906 (0.92326)	Top-1 acc 38.281 (45.592)	Top-5 acc 63.672 (69.415)	lr 0.02295
Train [23][580/3239]	Time 0.617 (0.964)	Data Time 0.001 (0.047)	Loss 3.4395 (3.2919)	Entropy 0.91887 (0.92319)	Top-1 acc 39.062 (45.574)	Top-5 acc 67.969 (69.389)	lr 0.02295
Train [23][590/3239]	Time 0.720 (0.962)	Data Time 0.001 (0.046)	Loss 3.2862 (3.2925)	Entropy 0.91868 (0.92311)	Top-1 acc 47.656 (45.572)	Top-5 acc 69.141 (69.368)	lr 0.02295
Train [23][600/3239]	Time 0.607 (0.961)	Data Time 0.001 (0.045)	Loss 3.2506 (3.2924)	Entropy 0.91868 (0.92304)	Top-1 acc 46.484 (45.576)	Top-5 acc 69.922 (69.364)	lr 0.02295
Train [23][610/3239]	Time 0.606 (0.959)	Data Time 0.001 (0.044)	Loss 3.4548 (3.2921)	Entropy 0.91919 (0.92297)	Top-1 acc 42.578 (45.589)	Top-5 acc 66.797 (69.369)	lr 0.02295
Train [23][620/3239]	Time 0.556 (0.957)	Data Time 0.001 (0.044)	Loss 3.2129 (3.2930)	Entropy 0.91895 (0.92290)	Top-1 acc 51.172 (45.571)	Top-5 acc 68.750 (69.340)	lr 0.02295
Train [23][630/3239]	Time 0.601 (0.955)	Data Time 0.001 (0.043)	Loss 3.2248 (3.2930)	Entropy 0.91875 (0.92284)	Top-1 acc 46.484 (45.563)	Top-5 acc 71.875 (69.339)	lr 0.02295
Train [23][640/3239]	Time 0.616 (0.954)	Data Time 0.001 (0.042)	Loss 3.3278 (3.2935)	Entropy 0.91889 (0.92278)	Top-1 acc 44.531 (45.529)	Top-5 acc 65.625 (69.320)	lr 0.02295
Train [23][650/3239]	Time 0.598 (0.952)	Data Time 0.001 (0.042)	Loss 3.4190 (3.2943)	Entropy 0.91884 (0.92272)	Top-1 acc 40.625 (45.493)	Top-5 acc 67.188 (69.301)	lr 0.02295
Train [23][660/3239]	Time 0.731 (0.951)	Data Time 0.001 (0.041)	Loss 3.2632 (3.2940)	Entropy 0.91907 (0.92266)	Top-1 acc 46.484 (45.486)	Top-5 acc 69.922 (69.294)	lr 0.02295
Train [23][670/3239]	Time 0.625 (0.950)	Data Time 0.001 (0.041)	Loss 3.2790 (3.2933)	Entropy 0.91921 (0.92261)	Top-1 acc 46.875 (45.514)	Top-5 acc 67.188 (69.307)	lr 0.02295
Train [23][680/3239]	Time 0.592 (0.948)	Data Time 0.001 (0.040)	Loss 3.1868 (3.2922)	Entropy 0.91894 (0.92256)	Top-1 acc 48.438 (45.534)	Top-5 acc 71.094 (69.323)	lr 0.02295
Train [23][690/3239]	Time 0.550 (0.947)	Data Time 0.001 (0.039)	Loss 3.1405 (3.2923)	Entropy 0.91894 (0.92251)	Top-1 acc 49.219 (45.525)	Top-5 acc 71.484 (69.318)	lr 0.02295
Train [23][700/3239]	Time 0.611 (0.945)	Data Time 0.002 (0.039)	Loss 3.2859 (3.2917)	Entropy 0.91935 (0.92246)	Top-1 acc 44.531 (45.542)	Top-5 acc 68.359 (69.328)	lr 0.02294
Train [23][710/3239]	Time 0.594 (0.944)	Data Time 0.001 (0.038)	Loss 3.2244 (3.2912)	Entropy 0.91940 (0.92242)	Top-1 acc 46.094 (45.537)	Top-5 acc 68.750 (69.328)	lr 0.02294
Train [23][720/3239]	Time 0.620 (0.943)	Data Time 0.001 (0.038)	Loss 3.4236 (3.2907)	Entropy 0.91952 (0.92237)	Top-1 acc 41.016 (45.532)	Top-5 acc 66.797 (69.348)	lr 0.02294
Train [23][730/3239]	Time 0.593 (0.942)	Data Time 0.001 (0.037)	Loss 3.0067 (3.2905)	Entropy 0.91944 (0.92233)	Top-1 acc 55.469 (45.565)	Top-5 acc 74.609 (69.362)	lr 0.02294
Train [23][740/3239]	Time 0.783 (0.977)	Data Time 0.005 (0.037)	Loss 3.4836 (3.2910)	Entropy 0.91912 (0.92229)	Top-1 acc 41.016 (45.563)	Top-5 acc 68.359 (69.360)	lr 0.02294
Train [23][750/3239]	Time 0.690 (0.976)	Data Time 0.002 (0.036)	Loss 3.2031 (3.2914)	Entropy 0.91908 (0.92225)	Top-1 acc 48.828 (45.555)	Top-5 acc 69.531 (69.363)	lr 0.02294
Train [23][760/3239]	Time 0.623 (0.975)	Data Time 0.002 (0.036)	Loss 3.2131 (3.2922)	Entropy 0.91886 (0.92221)	Top-1 acc 48.047 (45.534)	Top-5 acc 71.094 (69.343)	lr 0.02294
Train [23][770/3239]	Time 0.624 (0.973)	Data Time 0.002 (0.036)	Loss 3.3857 (3.2922)	Entropy 0.91933 (0.92217)	Top-1 acc 44.141 (45.537)	Top-5 acc 67.188 (69.342)	lr 0.02294
Train [23][780/3239]	Time 0.579 (0.972)	Data Time 0.001 (0.035)	Loss 3.2475 (3.2925)	Entropy 0.91887 (0.92213)	Top-1 acc 44.141 (45.534)	Top-5 acc 70.703 (69.341)	lr 0.02294
Train [23][790/3239]	Time 0.592 (0.970)	Data Time 0.001 (0.035)	Loss 3.2460 (3.2928)	Entropy 0.91886 (0.92209)	Top-1 acc 46.875 (45.523)	Top-5 acc 70.703 (69.329)	lr 0.02294
Train [23][800/3239]	Time 0.611 (0.969)	Data Time 0.001 (0.034)	Loss 3.2205 (3.2929)	Entropy 0.91812 (0.92205)	Top-1 acc 46.094 (45.509)	Top-5 acc 71.094 (69.332)	lr 0.02294
Train [23][810/3239]	Time 0.590 (0.967)	Data Time 0.001 (0.034)	Loss 3.2622 (3.2920)	Entropy 0.91784 (0.92200)	Top-1 acc 45.312 (45.512)	Top-5 acc 71.875 (69.358)	lr 0.02294
Train [23][820/3239]	Time 0.702 (0.965)	Data Time 0.006 (0.034)	Loss 3.6332 (3.2922)	Entropy 0.91780 (0.92195)	Top-1 acc 37.109 (45.508)	Top-5 acc 60.547 (69.352)	lr 0.02294
Train [23][830/3239]	Time 0.590 (0.964)	Data Time 0.001 (0.033)	Loss 3.2287 (3.2919)	Entropy 0.91766 (0.92189)	Top-1 acc 48.438 (45.510)	Top-5 acc 71.094 (69.362)	lr 0.02294
Train [23][840/3239]	Time 0.574 (0.963)	Data Time 0.001 (0.033)	Loss 3.4649 (3.2918)	Entropy 0.91811 (0.92185)	Top-1 acc 41.406 (45.511)	Top-5 acc 64.844 (69.366)	lr 0.02294
Train [23][850/3239]	Time 0.627 (0.962)	Data Time 0.001 (0.032)	Loss 3.5096 (3.2920)	Entropy 0.91817 (0.92180)	Top-1 acc 43.359 (45.513)	Top-5 acc 65.234 (69.358)	lr 0.02294
Train [23][860/3239]	Time 0.573 (0.961)	Data Time 0.001 (0.032)	Loss 3.3513 (3.2923)	Entropy 0.91830 (0.92176)	Top-1 acc 41.016 (45.513)	Top-5 acc 68.359 (69.335)	lr 0.02294
Train [23][870/3239]	Time 0.596 (0.960)	Data Time 0.001 (0.032)	Loss 3.2612 (3.2924)	Entropy 0.91822 (0.92172)	Top-1 acc 44.922 (45.511)	Top-5 acc 69.922 (69.334)	lr 0.02294
Train [23][880/3239]	Time 0.601 (0.959)	Data Time 0.002 (0.031)	Loss 3.0930 (3.2922)	Entropy 0.91828 (0.92168)	Top-1 acc 48.438 (45.505)	Top-5 acc 72.266 (69.341)	lr 0.02293
Train [23][890/3239]	Time 0.594 (0.958)	Data Time 0.001 (0.031)	Loss 3.3806 (3.2928)	Entropy 0.91803 (0.92164)	Top-1 acc 44.922 (45.502)	Top-5 acc 67.188 (69.316)	lr 0.02293
Train [23][900/3239]	Time 0.626 (0.957)	Data Time 0.001 (0.031)	Loss 3.0537 (3.2924)	Entropy 0.91829 (0.92160)	Top-1 acc 50.000 (45.521)	Top-5 acc 72.656 (69.329)	lr 0.02293
Train [23][910/3239]	Time 0.589 (0.956)	Data Time 0.001 (0.030)	Loss 3.5110 (3.2934)	Entropy 0.91821 (0.92157)	Top-1 acc 40.625 (45.494)	Top-5 acc 64.844 (69.307)	lr 0.02293
Train [23][920/3239]	Time 0.596 (0.955)	Data Time 0.001 (0.030)	Loss 3.2192 (3.2934)	Entropy 0.91793 (0.92153)	Top-1 acc 48.828 (45.505)	Top-5 acc 69.531 (69.296)	lr 0.02293
Train [23][930/3239]	Time 0.597 (0.954)	Data Time 0.002 (0.030)	Loss 3.3423 (3.2935)	Entropy 0.91776 (0.92149)	Top-1 acc 46.094 (45.515)	Top-5 acc 66.406 (69.290)	lr 0.02293
Train [23][940/3239]	Time 0.588 (0.953)	Data Time 0.001 (0.030)	Loss 3.3486 (3.2934)	Entropy 0.91751 (0.92145)	Top-1 acc 45.312 (45.516)	Top-5 acc 64.453 (69.289)	lr 0.02293
Train [23][950/3239]	Time 0.625 (0.952)	Data Time 0.001 (0.029)	Loss 2.9710 (3.2924)	Entropy 0.91787 (0.92141)	Top-1 acc 52.344 (45.541)	Top-5 acc 77.734 (69.311)	lr 0.02293
Train [23][960/3239]	Time 0.607 (0.951)	Data Time 0.001 (0.029)	Loss 3.3621 (3.2922)	Entropy 0.91779 (0.92137)	Top-1 acc 45.312 (45.535)	Top-5 acc 67.578 (69.313)	lr 0.02293
Train [23][970/3239]	Time 0.632 (0.950)	Data Time 0.001 (0.029)	Loss 3.0928 (3.2920)	Entropy 0.91769 (0.92134)	Top-1 acc 46.875 (45.528)	Top-5 acc 74.609 (69.318)	lr 0.02293
Train [23][980/3239]	Time 0.615 (0.949)	Data Time 0.001 (0.028)	Loss 3.4575 (3.2920)	Entropy 0.91751 (0.92130)	Top-1 acc 41.406 (45.526)	Top-5 acc 65.234 (69.322)	lr 0.02293
Train [23][990/3239]	Time 0.596 (0.948)	Data Time 0.001 (0.028)	Loss 3.4258 (3.2918)	Entropy 0.91720 (0.92126)	Top-1 acc 39.062 (45.520)	Top-5 acc 64.062 (69.325)	lr 0.02293
Train [23][1000/3239]	Time 0.598 (0.947)	Data Time 0.002 (0.028)	Loss 3.3396 (3.2922)	Entropy 0.91733 (0.92122)	Top-1 acc 45.703 (45.513)	Top-5 acc 66.406 (69.320)	lr 0.02293
Train [23][1010/3239]	Time 0.562 (0.946)	Data Time 0.001 (0.028)	Loss 3.4692 (3.2923)	Entropy 0.91680 (0.92118)	Top-1 acc 43.359 (45.511)	Top-5 acc 64.062 (69.311)	lr 0.02293
Train [23][1020/3239]	Time 0.598 (0.945)	Data Time 0.001 (0.027)	Loss 3.1716 (3.2925)	Entropy 0.91665 (0.92114)	Top-1 acc 46.484 (45.513)	Top-5 acc 72.656 (69.305)	lr 0.02293
Train [23][1030/3239]	Time 0.645 (0.944)	Data Time 0.001 (0.027)	Loss 3.1925 (3.2925)	Entropy 0.91633 (0.92109)	Top-1 acc 45.703 (45.507)	Top-5 acc 71.875 (69.301)	lr 0.02293
Train [23][1040/3239]	Time 0.626 (0.944)	Data Time 0.001 (0.027)	Loss 3.3448 (3.2928)	Entropy 0.91655 (0.92105)	Top-1 acc 44.141 (45.492)	Top-5 acc 65.625 (69.283)	lr 0.02293
Train [23][1050/3239]	Time 0.719 (0.943)	Data Time 0.001 (0.027)	Loss 3.3616 (3.2920)	Entropy 0.91634 (0.92100)	Top-1 acc 44.531 (45.504)	Top-5 acc 69.922 (69.302)	lr 0.02293
Train [23][1060/3239]	Time 0.611 (0.942)	Data Time 0.001 (0.026)	Loss 3.2899 (3.2917)	Entropy 0.91657 (0.92096)	Top-1 acc 43.750 (45.512)	Top-5 acc 71.094 (69.317)	lr 0.02292
Train [23][1070/3239]	Time 0.632 (0.942)	Data Time 0.001 (0.026)	Loss 3.1292 (3.2909)	Entropy 0.91612 (0.92092)	Top-1 acc 45.703 (45.529)	Top-5 acc 73.828 (69.335)	lr 0.02292
Train [23][1080/3239]	Time 0.608 (0.941)	Data Time 0.001 (0.026)	Loss 3.3623 (3.2907)	Entropy 0.91653 (0.92087)	Top-1 acc 43.750 (45.542)	Top-5 acc 67.578 (69.332)	lr 0.02292
Train [23][1090/3239]	Time 0.613 (0.940)	Data Time 0.001 (0.026)	Loss 3.2868 (3.2907)	Entropy 0.91599 (0.92083)	Top-1 acc 42.188 (45.539)	Top-5 acc 68.359 (69.334)	lr 0.02292
Train [23][1100/3239]	Time 0.597 (0.940)	Data Time 0.001 (0.026)	Loss 3.2333 (3.2903)	Entropy 0.91573 (0.92079)	Top-1 acc 46.875 (45.554)	Top-5 acc 71.875 (69.343)	lr 0.02292
Train [23][1110/3239]	Time 0.609 (0.939)	Data Time 0.001 (0.025)	Loss 3.2420 (3.2903)	Entropy 0.91582 (0.92074)	Top-1 acc 48.828 (45.564)	Top-5 acc 71.484 (69.344)	lr 0.02292
Train [23][1120/3239]	Time 0.617 (0.938)	Data Time 0.002 (0.025)	Loss 3.4272 (3.2906)	Entropy 0.91575 (0.92070)	Top-1 acc 44.922 (45.558)	Top-5 acc 67.578 (69.337)	lr 0.02292
Train [23][1130/3239]	Time 0.598 (0.938)	Data Time 0.001 (0.025)	Loss 3.2408 (3.2904)	Entropy 0.91560 (0.92065)	Top-1 acc 47.656 (45.564)	Top-5 acc 67.578 (69.338)	lr 0.02292
Train [23][1140/3239]	Time 0.683 (0.937)	Data Time 0.001 (0.025)	Loss 3.1583 (3.2898)	Entropy 0.91575 (0.92061)	Top-1 acc 50.391 (45.577)	Top-5 acc 71.094 (69.345)	lr 0.02292
Train [23][1150/3239]	Time 0.620 (0.936)	Data Time 0.002 (0.025)	Loss 3.3163 (3.2902)	Entropy 0.91555 (0.92057)	Top-1 acc 46.484 (45.573)	Top-5 acc 66.797 (69.335)	lr 0.02292
Train [23][1160/3239]	Time 0.452 (0.935)	Data Time 0.001 (0.024)	Loss 3.4952 (3.2909)	Entropy 0.91591 (0.92052)	Top-1 acc 43.750 (45.566)	Top-5 acc 66.406 (69.326)	lr 0.02292
Train [23][1170/3239]	Time 0.637 (0.934)	Data Time 0.001 (0.024)	Loss 3.3915 (3.2910)	Entropy 0.91565 (0.92048)	Top-1 acc 44.922 (45.552)	Top-5 acc 69.141 (69.328)	lr 0.02292
Train [23][1180/3239]	Time 0.595 (0.934)	Data Time 0.001 (0.024)	Loss 3.2312 (3.2909)	Entropy 0.91519 (0.92044)	Top-1 acc 46.484 (45.560)	Top-5 acc 71.094 (69.327)	lr 0.02292
Train [23][1190/3239]	Time 0.577 (0.933)	Data Time 0.002 (0.024)	Loss 3.2384 (3.2909)	Entropy 0.91509 (0.92040)	Top-1 acc 48.047 (45.572)	Top-5 acc 73.047 (69.331)	lr 0.02292
Train [23][1200/3239]	Time 0.594 (0.933)	Data Time 0.001 (0.024)	Loss 3.2564 (3.2903)	Entropy 0.91506 (0.92035)	Top-1 acc 42.969 (45.588)	Top-5 acc 71.484 (69.342)	lr 0.02292
Train [23][1210/3239]	Time 0.699 (0.932)	Data Time 0.001 (0.023)	Loss 3.2557 (3.2907)	Entropy 0.91482 (0.92031)	Top-1 acc 48.438 (45.572)	Top-5 acc 68.750 (69.337)	lr 0.02292
Train [23][1220/3239]	Time 0.659 (0.932)	Data Time 0.001 (0.023)	Loss 3.2686 (3.2910)	Entropy 0.91453 (0.92026)	Top-1 acc 47.266 (45.569)	Top-5 acc 70.703 (69.330)	lr 0.02292
Train [23][1230/3239]	Time 0.601 (0.931)	Data Time 0.002 (0.023)	Loss 3.3365 (3.2906)	Entropy 0.91468 (0.92022)	Top-1 acc 44.922 (45.577)	Top-5 acc 67.969 (69.330)	lr 0.02292
Train [23][1240/3239]	Time 0.596 (0.931)	Data Time 0.002 (0.023)	Loss 3.2955 (3.2910)	Entropy 0.91505 (0.92017)	Top-1 acc 45.703 (45.561)	Top-5 acc 70.703 (69.322)	lr 0.02291
Train [23][1250/3239]	Time 0.605 (0.930)	Data Time 0.001 (0.023)	Loss 3.3177 (3.2913)	Entropy 0.91495 (0.92013)	Top-1 acc 41.016 (45.553)	Top-5 acc 66.406 (69.308)	lr 0.02291
Train [23][1260/3239]	Time 0.625 (0.930)	Data Time 0.001 (0.023)	Loss 3.3881 (3.2914)	Entropy 0.91477 (0.92009)	Top-1 acc 47.656 (45.556)	Top-5 acc 66.406 (69.299)	lr 0.02291
Train [23][1270/3239]	Time 0.605 (0.929)	Data Time 0.001 (0.022)	Loss 3.2666 (3.2911)	Entropy 0.91484 (0.92005)	Top-1 acc 46.875 (45.563)	Top-5 acc 69.531 (69.305)	lr 0.02291
Train [23][1280/3239]	Time 0.624 (0.929)	Data Time 0.001 (0.022)	Loss 3.2598 (3.2910)	Entropy 0.91527 (0.92001)	Top-1 acc 50.000 (45.562)	Top-5 acc 67.969 (69.301)	lr 0.02291
Train [23][1290/3239]	Time 0.584 (0.928)	Data Time 0.001 (0.022)	Loss 3.3019 (3.2910)	Entropy 0.91493 (0.91997)	Top-1 acc 44.531 (45.555)	Top-5 acc 69.531 (69.299)	lr 0.02291
Train [23][1300/3239]	Time 0.598 (0.928)	Data Time 0.002 (0.022)	Loss 3.3977 (3.2910)	Entropy 0.91529 (0.91993)	Top-1 acc 42.578 (45.553)	Top-5 acc 68.750 (69.297)	lr 0.02291
Train [23][1310/3239]	Time 0.644 (0.927)	Data Time 0.001 (0.022)	Loss 3.1331 (3.2909)	Entropy 0.91503 (0.91990)	Top-1 acc 49.609 (45.554)	Top-5 acc 69.922 (69.301)	lr 0.02291
Train [23][1320/3239]	Time 0.625 (0.927)	Data Time 0.001 (0.022)	Loss 3.0644 (3.2907)	Entropy 0.91491 (0.91986)	Top-1 acc 50.000 (45.557)	Top-5 acc 76.953 (69.300)	lr 0.02291
Train [23][1330/3239]	Time 0.606 (0.926)	Data Time 0.002 (0.022)	Loss 3.2119 (3.2908)	Entropy 0.91471 (0.91982)	Top-1 acc 46.094 (45.552)	Top-5 acc 69.531 (69.295)	lr 0.02291
Train [23][1340/3239]	Time 0.577 (0.925)	Data Time 0.003 (0.021)	Loss 3.5142 (3.2913)	Entropy 0.91490 (0.91979)	Top-1 acc 40.625 (45.544)	Top-5 acc 63.672 (69.288)	lr 0.02291
Train [23][1350/3239]	Time 0.603 (0.925)	Data Time 0.001 (0.021)	Loss 3.5740 (3.2913)	Entropy 0.91418 (0.91975)	Top-1 acc 39.453 (45.538)	Top-5 acc 63.672 (69.288)	lr 0.02291
Train [23][1360/3239]	Time 0.577 (0.924)	Data Time 0.001 (0.021)	Loss 3.2960 (3.2912)	Entropy 0.91464 (0.91971)	Top-1 acc 44.922 (45.545)	Top-5 acc 71.094 (69.294)	lr 0.02291
Train [23][1370/3239]	Time 0.716 (0.924)	Data Time 0.001 (0.021)	Loss 3.3713 (3.2908)	Entropy 0.91445 (0.91967)	Top-1 acc 43.359 (45.553)	Top-5 acc 66.406 (69.304)	lr 0.02291
Train [23][1380/3239]	Time 0.656 (0.924)	Data Time 0.002 (0.021)	Loss 3.2781 (3.2909)	Entropy 0.91435 (0.91963)	Top-1 acc 47.656 (45.547)	Top-5 acc 69.922 (69.304)	lr 0.02291
Train [23][1390/3239]	Time 0.632 (0.923)	Data Time 0.001 (0.021)	Loss 3.2545 (3.2909)	Entropy 0.91396 (0.91959)	Top-1 acc 49.609 (45.554)	Top-5 acc 68.359 (69.304)	lr 0.02291
Train [23][1400/3239]	Time 0.606 (0.942)	Data Time 0.002 (0.021)	Loss 3.1840 (3.2906)	Entropy 0.91413 (0.91955)	Top-1 acc 46.484 (45.556)	Top-5 acc 71.484 (69.308)	lr 0.02291
Train [23][1410/3239]	Time 0.619 (0.941)	Data Time 0.002 (0.020)	Loss 3.3774 (3.2909)	Entropy 0.91452 (0.91952)	Top-1 acc 46.875 (45.554)	Top-5 acc 67.578 (69.304)	lr 0.02291
Train [23][1420/3239]	Time 0.594 (0.941)	Data Time 0.002 (0.020)	Loss 3.3665 (3.2911)	Entropy 0.91475 (0.91948)	Top-1 acc 45.312 (45.555)	Top-5 acc 65.234 (69.297)	lr 0.02290
Train [23][1430/3239]	Time 0.586 (0.940)	Data Time 0.002 (0.020)	Loss 3.2805 (3.2913)	Entropy 0.91470 (0.91945)	Top-1 acc 47.266 (45.548)	Top-5 acc 70.703 (69.293)	lr 0.02290
Train [23][1440/3239]	Time 0.580 (0.940)	Data Time 0.002 (0.020)	Loss 3.1398 (3.2910)	Entropy 0.91494 (0.91942)	Top-1 acc 48.438 (45.552)	Top-5 acc 74.219 (69.304)	lr 0.02290
Train [23][1450/3239]	Time 0.562 (0.939)	Data Time 0.001 (0.020)	Loss 3.4251 (3.2912)	Entropy 0.91510 (0.91939)	Top-1 acc 44.531 (45.552)	Top-5 acc 66.797 (69.295)	lr 0.02290
Train [23][1460/3239]	Time 0.578 (0.938)	Data Time 0.003 (0.020)	Loss 3.3499 (3.2915)	Entropy 0.91540 (0.91936)	Top-1 acc 42.188 (45.541)	Top-5 acc 67.578 (69.287)	lr 0.02290
Train [23][1470/3239]	Time 0.607 (0.938)	Data Time 0.001 (0.020)	Loss 3.1930 (3.2911)	Entropy 0.91568 (0.91933)	Top-1 acc 48.047 (45.554)	Top-5 acc 74.219 (69.298)	lr 0.02290
Train [23][1480/3239]	Time 0.639 (0.937)	Data Time 0.001 (0.020)	Loss 3.3041 (3.2908)	Entropy 0.91523 (0.91931)	Top-1 acc 42.969 (45.551)	Top-5 acc 69.531 (69.300)	lr 0.02290
Train [23][1490/3239]	Time 0.624 (0.937)	Data Time 0.001 (0.019)	Loss 3.3999 (3.2911)	Entropy 0.91521 (0.91928)	Top-1 acc 45.703 (45.547)	Top-5 acc 65.625 (69.290)	lr 0.02290
Train [23][1500/3239]	Time 0.597 (0.937)	Data Time 0.001 (0.019)	Loss 3.5577 (3.2909)	Entropy 0.91496 (0.91925)	Top-1 acc 39.844 (45.548)	Top-5 acc 64.453 (69.297)	lr 0.02290
Train [23][1510/3239]	Time 0.625 (0.936)	Data Time 0.001 (0.019)	Loss 3.2468 (3.2907)	Entropy 0.91505 (0.91922)	Top-1 acc 46.094 (45.547)	Top-5 acc 69.141 (69.304)	lr 0.02290
Train [23][1520/3239]	Time 0.620 (0.936)	Data Time 0.001 (0.019)	Loss 3.2330 (3.2906)	Entropy 0.91512 (0.91919)	Top-1 acc 45.312 (45.545)	Top-5 acc 69.531 (69.302)	lr 0.02290
Train [23][1530/3239]	Time 0.701 (0.935)	Data Time 0.001 (0.019)	Loss 3.4555 (3.2905)	Entropy 0.91478 (0.91917)	Top-1 acc 40.625 (45.550)	Top-5 acc 65.625 (69.302)	lr 0.02290
Train [23][1540/3239]	Time 0.600 (0.935)	Data Time 0.001 (0.019)	Loss 3.2451 (3.2904)	Entropy 0.91520 (0.91914)	Top-1 acc 46.484 (45.552)	Top-5 acc 70.312 (69.302)	lr 0.02290
Train [23][1550/3239]	Time 0.575 (0.934)	Data Time 0.001 (0.019)	Loss 3.2421 (3.2903)	Entropy 0.91478 (0.91911)	Top-1 acc 46.875 (45.558)	Top-5 acc 70.703 (69.302)	lr 0.02290
Train [23][1560/3239]	Time 0.584 (0.934)	Data Time 0.001 (0.019)	Loss 3.2844 (3.2902)	Entropy 0.91457 (0.91908)	Top-1 acc 47.656 (45.563)	Top-5 acc 68.750 (69.304)	lr 0.02290
Train [23][1570/3239]	Time 0.637 (0.934)	Data Time 0.001 (0.019)	Loss 3.2328 (3.2901)	Entropy 0.91463 (0.91906)	Top-1 acc 45.312 (45.568)	Top-5 acc 71.094 (69.302)	lr 0.02290
Train [23][1580/3239]	Time 0.647 (0.934)	Data Time 0.001 (0.018)	Loss 3.1617 (3.2899)	Entropy 0.91457 (0.91903)	Top-1 acc 48.828 (45.572)	Top-5 acc 72.656 (69.306)	lr 0.02290
Train [23][1590/3239]	Time 0.602 (0.933)	Data Time 0.001 (0.018)	Loss 3.3199 (3.2899)	Entropy 0.91484 (0.91900)	Top-1 acc 42.578 (45.569)	Top-5 acc 68.359 (69.308)	lr 0.02290
Train [23][1600/3239]	Time 0.686 (0.933)	Data Time 0.001 (0.018)	Loss 3.3282 (3.2894)	Entropy 0.91473 (0.91898)	Top-1 acc 48.047 (45.582)	Top-5 acc 67.969 (69.318)	lr 0.02289
Train [23][1610/3239]	Time 0.585 (0.932)	Data Time 0.001 (0.018)	Loss 3.1185 (3.2889)	Entropy 0.91466 (0.91895)	Top-1 acc 48.828 (45.594)	Top-5 acc 73.828 (69.332)	lr 0.02289
Train [23][1620/3239]	Time 0.589 (0.932)	Data Time 0.001 (0.018)	Loss 3.4343 (3.2892)	Entropy 0.91461 (0.91892)	Top-1 acc 42.188 (45.588)	Top-5 acc 67.969 (69.329)	lr 0.02289
Train [23][1630/3239]	Time 0.587 (0.931)	Data Time 0.002 (0.018)	Loss 3.5228 (3.2897)	Entropy 0.91491 (0.91890)	Top-1 acc 42.578 (45.580)	Top-5 acc 63.672 (69.322)	lr 0.02289
Train [23][1640/3239]	Time 0.611 (0.930)	Data Time 0.002 (0.018)	Loss 3.4083 (3.2897)	Entropy 0.91499 (0.91887)	Top-1 acc 39.844 (45.576)	Top-5 acc 67.578 (69.322)	lr 0.02289
Train [23][1650/3239]	Time 0.573 (0.930)	Data Time 0.001 (0.018)	Loss 3.3921 (3.2897)	Entropy 0.91446 (0.91885)	Top-1 acc 41.016 (45.578)	Top-5 acc 68.359 (69.326)	lr 0.02289
Train [23][1660/3239]	Time 0.594 (0.930)	Data Time 0.002 (0.018)	Loss 3.3303 (3.2896)	Entropy 0.91425 (0.91882)	Top-1 acc 44.531 (45.575)	Top-5 acc 69.141 (69.326)	lr 0.02289
Train [23][1670/3239]	Time 0.620 (0.929)	Data Time 0.001 (0.018)	Loss 3.3284 (3.2895)	Entropy 0.91405 (0.91879)	Top-1 acc 41.797 (45.573)	Top-5 acc 67.969 (69.325)	lr 0.02289
Train [23][1680/3239]	Time 0.603 (0.929)	Data Time 0.001 (0.018)	Loss 3.0743 (3.2895)	Entropy 0.91432 (0.91877)	Top-1 acc 44.922 (45.575)	Top-5 acc 73.438 (69.330)	lr 0.02289
Train [23][1690/3239]	Time 0.730 (0.929)	Data Time 0.001 (0.017)	Loss 3.4426 (3.2899)	Entropy 0.91426 (0.91874)	Top-1 acc 41.016 (45.562)	Top-5 acc 67.969 (69.330)	lr 0.02289
Train [23][1700/3239]	Time 0.613 (0.929)	Data Time 0.001 (0.017)	Loss 3.1838 (3.2900)	Entropy 0.91426 (0.91871)	Top-1 acc 45.312 (45.550)	Top-5 acc 70.703 (69.329)	lr 0.02289
Train [23][1710/3239]	Time 0.606 (0.928)	Data Time 0.001 (0.017)	Loss 3.3393 (3.2902)	Entropy 0.91450 (0.91869)	Top-1 acc 44.531 (45.549)	Top-5 acc 66.797 (69.327)	lr 0.02289
Train [23][1720/3239]	Time 0.588 (0.928)	Data Time 0.001 (0.017)	Loss 3.4619 (3.2903)	Entropy 0.91441 (0.91866)	Top-1 acc 40.625 (45.540)	Top-5 acc 67.969 (69.327)	lr 0.02289
Train [23][1730/3239]	Time 0.585 (0.928)	Data Time 0.001 (0.017)	Loss 3.2716 (3.2907)	Entropy 0.91395 (0.91864)	Top-1 acc 47.266 (45.529)	Top-5 acc 69.922 (69.317)	lr 0.02289
Train [23][1740/3239]	Time 0.638 (0.927)	Data Time 0.001 (0.017)	Loss 3.1388 (3.2906)	Entropy 0.91406 (0.91861)	Top-1 acc 48.438 (45.531)	Top-5 acc 72.266 (69.309)	lr 0.02289
Train [23][1750/3239]	Time 0.607 (0.927)	Data Time 0.001 (0.017)	Loss 3.2377 (3.2909)	Entropy 0.91414 (0.91859)	Top-1 acc 48.828 (45.531)	Top-5 acc 69.922 (69.302)	lr 0.02289
Train [23][1760/3239]	Time 0.740 (0.926)	Data Time 0.001 (0.017)	Loss 3.2748 (3.2910)	Entropy 0.91395 (0.91856)	Top-1 acc 42.969 (45.522)	Top-5 acc 67.578 (69.298)	lr 0.02289
Train [23][1770/3239]	Time 0.621 (0.926)	Data Time 0.001 (0.017)	Loss 3.1367 (3.2910)	Entropy 0.91432 (0.91854)	Top-1 acc 45.312 (45.521)	Top-5 acc 69.922 (69.293)	lr 0.02288
Train [23][1780/3239]	Time 0.605 (0.926)	Data Time 0.001 (0.017)	Loss 3.2250 (3.2906)	Entropy 0.91410 (0.91851)	Top-1 acc 46.875 (45.531)	Top-5 acc 70.703 (69.304)	lr 0.02288
Train [23][1790/3239]	Time 0.680 (0.925)	Data Time 0.003 (0.017)	Loss 3.1569 (3.2910)	Entropy 0.91415 (0.91849)	Top-1 acc 46.094 (45.524)	Top-5 acc 69.141 (69.294)	lr 0.02288
Train [23][1800/3239]	Time 0.448 (0.925)	Data Time 0.001 (0.016)	Loss 3.5064 (3.2909)	Entropy 0.91387 (0.91846)	Top-1 acc 41.797 (45.532)	Top-5 acc 64.844 (69.294)	lr 0.02288
Train [23][1810/3239]	Time 0.596 (0.924)	Data Time 0.001 (0.016)	Loss 3.2446 (3.2908)	Entropy 0.91343 (0.91844)	Top-1 acc 44.531 (45.527)	Top-5 acc 72.656 (69.299)	lr 0.02288
Train [23][1820/3239]	Time 0.637 (0.924)	Data Time 0.001 (0.016)	Loss 3.1027 (3.2905)	Entropy 0.91328 (0.91841)	Top-1 acc 46.875 (45.530)	Top-5 acc 72.266 (69.302)	lr 0.02288
Train [23][1830/3239]	Time 0.609 (0.924)	Data Time 0.001 (0.016)	Loss 3.0621 (3.2902)	Entropy 0.91288 (0.91838)	Top-1 acc 54.688 (45.544)	Top-5 acc 73.438 (69.309)	lr 0.02288
Train [23][1840/3239]	Time 0.659 (0.923)	Data Time 0.001 (0.016)	Loss 3.4126 (3.2905)	Entropy 0.91307 (0.91835)	Top-1 acc 40.234 (45.534)	Top-5 acc 66.797 (69.306)	lr 0.02288
Train [23][1850/3239]	Time 0.584 (0.923)	Data Time 0.001 (0.016)	Loss 3.2766 (3.2904)	Entropy 0.91273 (0.91832)	Top-1 acc 46.875 (45.533)	Top-5 acc 69.922 (69.305)	lr 0.02288
Train [23][1860/3239]	Time 0.607 (0.923)	Data Time 0.001 (0.016)	Loss 3.3461 (3.2905)	Entropy 0.91264 (0.91829)	Top-1 acc 45.703 (45.538)	Top-5 acc 69.531 (69.305)	lr 0.02288
Train [23][1870/3239]	Time 0.587 (0.923)	Data Time 0.001 (0.016)	Loss 3.3215 (3.2904)	Entropy 0.91249 (0.91826)	Top-1 acc 46.875 (45.545)	Top-5 acc 67.969 (69.307)	lr 0.02288
Train [23][1880/3239]	Time 0.567 (0.922)	Data Time 0.001 (0.016)	Loss 3.3981 (3.2902)	Entropy 0.91205 (0.91823)	Top-1 acc 39.844 (45.550)	Top-5 acc 65.625 (69.308)	lr 0.02288
Train [23][1890/3239]	Time 0.603 (0.922)	Data Time 0.001 (0.016)	Loss 3.1360 (3.2902)	Entropy 0.91195 (0.91820)	Top-1 acc 50.000 (45.553)	Top-5 acc 71.484 (69.307)	lr 0.02288
Train [23][1900/3239]	Time 0.592 (0.922)	Data Time 0.001 (0.016)	Loss 3.3385 (3.2899)	Entropy 0.91236 (0.91816)	Top-1 acc 42.188 (45.559)	Top-5 acc 67.578 (69.314)	lr 0.02288
Train [23][1910/3239]	Time 0.623 (0.921)	Data Time 0.001 (0.016)	Loss 3.3178 (3.2897)	Entropy 0.91217 (0.91813)	Top-1 acc 44.531 (45.563)	Top-5 acc 66.797 (69.312)	lr 0.02288
Train [23][1920/3239]	Time 0.719 (0.921)	Data Time 0.001 (0.016)	Loss 3.2374 (3.2894)	Entropy 0.91219 (0.91810)	Top-1 acc 50.000 (45.571)	Top-5 acc 69.531 (69.317)	lr 0.02288
Train [23][1930/3239]	Time 0.558 (0.921)	Data Time 0.001 (0.016)	Loss 3.4041 (3.2895)	Entropy 0.91241 (0.91807)	Top-1 acc 41.016 (45.568)	Top-5 acc 64.453 (69.315)	lr 0.02288
Train [23][1940/3239]	Time 0.542 (0.920)	Data Time 0.001 (0.015)	Loss 3.3852 (3.2893)	Entropy 0.91246 (0.91804)	Top-1 acc 42.578 (45.572)	Top-5 acc 66.016 (69.323)	lr 0.02288
Train [23][1950/3239]	Time 0.605 (0.920)	Data Time 0.001 (0.015)	Loss 3.3394 (3.2893)	Entropy 0.91244 (0.91801)	Top-1 acc 48.438 (45.575)	Top-5 acc 69.531 (69.319)	lr 0.02287
Train [23][1960/3239]	Time 0.605 (0.920)	Data Time 0.001 (0.015)	Loss 3.4837 (3.2893)	Entropy 0.91209 (0.91798)	Top-1 acc 44.141 (45.574)	Top-5 acc 63.281 (69.317)	lr 0.02287
Train [23][1970/3239]	Time 0.617 (0.919)	Data Time 0.001 (0.015)	Loss 3.0350 (3.2893)	Entropy 0.91207 (0.91795)	Top-1 acc 50.391 (45.570)	Top-5 acc 74.219 (69.317)	lr 0.02287
Train [23][1980/3239]	Time 0.597 (0.919)	Data Time 0.001 (0.015)	Loss 3.3431 (3.2894)	Entropy 0.91186 (0.91792)	Top-1 acc 44.531 (45.569)	Top-5 acc 69.922 (69.319)	lr 0.02287
Train [23][1990/3239]	Time 0.703 (0.919)	Data Time 0.001 (0.015)	Loss 3.5638 (3.2895)	Entropy 0.91179 (0.91789)	Top-1 acc 37.891 (45.561)	Top-5 acc 61.719 (69.320)	lr 0.02287
Train [23][2000/3239]	Time 0.597 (0.918)	Data Time 0.001 (0.015)	Loss 3.3222 (3.2896)	Entropy 0.91178 (0.91786)	Top-1 acc 44.531 (45.558)	Top-5 acc 67.969 (69.317)	lr 0.02287
Train [23][2010/3239]	Time 0.567 (0.918)	Data Time 0.001 (0.015)	Loss 3.5285 (3.2897)	Entropy 0.91128 (0.91783)	Top-1 acc 39.062 (45.555)	Top-5 acc 64.062 (69.314)	lr 0.02287
Train [23][2020/3239]	Time 0.571 (0.918)	Data Time 0.001 (0.015)	Loss 3.4922 (3.2899)	Entropy 0.91168 (0.91780)	Top-1 acc 39.062 (45.551)	Top-5 acc 64.844 (69.309)	lr 0.02287
Train [23][2030/3239]	Time 0.583 (0.918)	Data Time 0.001 (0.015)	Loss 3.2252 (3.2896)	Entropy 0.91155 (0.91777)	Top-1 acc 48.047 (45.560)	Top-5 acc 69.922 (69.316)	lr 0.02287
Train [23][2040/3239]	Time 0.599 (0.917)	Data Time 0.001 (0.015)	Loss 3.1219 (3.2891)	Entropy 0.91143 (0.91774)	Top-1 acc 44.922 (45.575)	Top-5 acc 74.609 (69.325)	lr 0.02287
Train [23][2050/3239]	Time 0.781 (0.930)	Data Time 0.007 (0.015)	Loss 3.4520 (3.2891)	Entropy 0.91177 (0.91771)	Top-1 acc 42.188 (45.578)	Top-5 acc 63.672 (69.321)	lr 0.02287
Train [23][2060/3239]	Time 0.635 (0.930)	Data Time 0.002 (0.015)	Loss 3.3532 (3.2893)	Entropy 0.91160 (0.91768)	Top-1 acc 47.656 (45.572)	Top-5 acc 66.797 (69.317)	lr 0.02287
Train [23][2070/3239]	Time 0.598 (0.930)	Data Time 0.002 (0.015)	Loss 3.3046 (3.2895)	Entropy 0.91122 (0.91765)	Top-1 acc 45.703 (45.571)	Top-5 acc 69.531 (69.313)	lr 0.02287
Train [23][2080/3239]	Time 0.712 (0.930)	Data Time 0.002 (0.015)	Loss 3.2851 (3.2893)	Entropy 0.91133 (0.91762)	Top-1 acc 45.312 (45.579)	Top-5 acc 70.312 (69.322)	lr 0.02287
Train [23][2090/3239]	Time 0.447 (0.929)	Data Time 0.001 (0.015)	Loss 3.2334 (3.2892)	Entropy 0.91160 (0.91759)	Top-1 acc 45.312 (45.578)	Top-5 acc 69.922 (69.325)	lr 0.02287
Train [23][2100/3239]	Time 0.577 (0.929)	Data Time 0.001 (0.014)	Loss 3.2351 (3.2892)	Entropy 0.91151 (0.91756)	Top-1 acc 44.922 (45.577)	Top-5 acc 69.922 (69.322)	lr 0.02287
Train [23][2110/3239]	Time 0.615 (0.929)	Data Time 0.002 (0.014)	Loss 3.2604 (3.2890)	Entropy 0.91108 (0.91753)	Top-1 acc 47.656 (45.583)	Top-5 acc 70.703 (69.323)	lr 0.02287
Train [23][2120/3239]	Time 0.638 (0.928)	Data Time 0.001 (0.014)	Loss 3.3610 (3.2890)	Entropy 0.91083 (0.91750)	Top-1 acc 44.922 (45.582)	Top-5 acc 68.750 (69.322)	lr 0.02287
Train [23][2130/3239]	Time 0.625 (0.928)	Data Time 0.001 (0.014)	Loss 3.3442 (3.2889)	Entropy 0.91083 (0.91747)	Top-1 acc 41.016 (45.585)	Top-5 acc 71.094 (69.323)	lr 0.02286
Train [23][2140/3239]	Time 0.597 (0.928)	Data Time 0.002 (0.014)	Loss 3.2927 (3.2886)	Entropy 0.91089 (0.91744)	Top-1 acc 45.703 (45.592)	Top-5 acc 68.359 (69.325)	lr 0.02286
Train [23][2150/3239]	Time 0.704 (0.927)	Data Time 0.001 (0.014)	Loss 3.3602 (3.2883)	Entropy 0.91049 (0.91741)	Top-1 acc 39.844 (45.599)	Top-5 acc 67.578 (69.331)	lr 0.02286
Train [23][2160/3239]	Time 0.612 (0.927)	Data Time 0.001 (0.014)	Loss 3.3050 (3.2880)	Entropy 0.91034 (0.91737)	Top-1 acc 41.016 (45.600)	Top-5 acc 67.578 (69.335)	lr 0.02286
Train [23][2170/3239]	Time 0.635 (0.927)	Data Time 0.001 (0.014)	Loss 3.4561 (3.2883)	Entropy 0.91056 (0.91734)	Top-1 acc 41.797 (45.592)	Top-5 acc 67.188 (69.329)	lr 0.02286
Train [23][2180/3239]	Time 0.614 (0.927)	Data Time 0.002 (0.014)	Loss 3.2892 (3.2882)	Entropy 0.91072 (0.91731)	Top-1 acc 46.484 (45.593)	Top-5 acc 67.578 (69.333)	lr 0.02286
Train [23][2190/3239]	Time 0.616 (0.926)	Data Time 0.001 (0.014)	Loss 3.1565 (3.2882)	Entropy 0.91049 (0.91728)	Top-1 acc 46.484 (45.592)	Top-5 acc 71.484 (69.337)	lr 0.02286
Train [23][2200/3239]	Time 0.649 (0.926)	Data Time 0.001 (0.014)	Loss 3.3627 (3.2885)	Entropy 0.91017 (0.91725)	Top-1 acc 42.578 (45.583)	Top-5 acc 70.312 (69.334)	lr 0.02286
Train [23][2210/3239]	Time 0.591 (0.926)	Data Time 0.002 (0.014)	Loss 3.1163 (3.2887)	Entropy 0.90961 (0.91722)	Top-1 acc 51.172 (45.577)	Top-5 acc 72.656 (69.331)	lr 0.02286
Train [23][2220/3239]	Time 0.611 (0.926)	Data Time 0.001 (0.014)	Loss 3.3436 (3.2888)	Entropy 0.90942 (0.91718)	Top-1 acc 46.875 (45.573)	Top-5 acc 66.406 (69.327)	lr 0.02286
Train [23][2230/3239]	Time 0.576 (0.925)	Data Time 0.001 (0.014)	Loss 3.2393 (3.2890)	Entropy 0.90951 (0.91715)	Top-1 acc 50.000 (45.570)	Top-5 acc 68.750 (69.320)	lr 0.02286
Train [23][2240/3239]	Time 0.689 (0.925)	Data Time 0.001 (0.014)	Loss 3.3501 (3.2892)	Entropy 0.90927 (0.91711)	Top-1 acc 43.359 (45.563)	Top-5 acc 66.797 (69.312)	lr 0.02286
Train [23][2250/3239]	Time 0.588 (0.925)	Data Time 0.001 (0.014)	Loss 3.1603 (3.2891)	Entropy 0.90885 (0.91708)	Top-1 acc 49.609 (45.568)	Top-5 acc 69.922 (69.312)	lr 0.02286
Train [23][2260/3239]	Time 0.582 (0.925)	Data Time 0.001 (0.014)	Loss 3.3112 (3.2890)	Entropy 0.90898 (0.91704)	Top-1 acc 45.312 (45.575)	Top-5 acc 66.016 (69.313)	lr 0.02286
Train [23][2270/3239]	Time 0.580 (0.924)	Data Time 0.001 (0.014)	Loss 3.3391 (3.2888)	Entropy 0.90880 (0.91700)	Top-1 acc 44.922 (45.577)	Top-5 acc 67.969 (69.319)	lr 0.02286
Train [23][2280/3239]	Time 0.628 (0.924)	Data Time 0.001 (0.013)	Loss 3.3186 (3.2887)	Entropy 0.90897 (0.91697)	Top-1 acc 40.625 (45.584)	Top-5 acc 68.750 (69.322)	lr 0.02286
Train [23][2290/3239]	Time 0.574 (0.924)	Data Time 0.001 (0.013)	Loss 3.2118 (3.2886)	Entropy 0.90903 (0.91693)	Top-1 acc 46.875 (45.588)	Top-5 acc 70.703 (69.325)	lr 0.02286
Train [23][2300/3239]	Time 0.602 (0.924)	Data Time 0.002 (0.013)	Loss 3.6264 (3.2890)	Entropy 0.90879 (0.91690)	Top-1 acc 39.062 (45.580)	Top-5 acc 62.109 (69.315)	lr 0.02286
Train [23][2310/3239]	Time 0.719 (0.923)	Data Time 0.001 (0.013)	Loss 3.4003 (3.2891)	Entropy 0.90886 (0.91687)	Top-1 acc 43.359 (45.579)	Top-5 acc 66.016 (69.308)	lr 0.02285
Train [23][2320/3239]	Time 0.568 (0.923)	Data Time 0.001 (0.013)	Loss 3.4424 (3.2891)	Entropy 0.90865 (0.91683)	Top-1 acc 44.531 (45.580)	Top-5 acc 66.406 (69.309)	lr 0.02285
Train [23][2330/3239]	Time 0.620 (0.923)	Data Time 0.001 (0.013)	Loss 3.3038 (3.2893)	Entropy 0.90838 (0.91679)	Top-1 acc 44.922 (45.573)	Top-5 acc 73.438 (69.309)	lr 0.02285
Train [23][2340/3239]	Time 0.595 (0.923)	Data Time 0.001 (0.013)	Loss 3.4149 (3.2894)	Entropy 0.90843 (0.91676)	Top-1 acc 40.234 (45.575)	Top-5 acc 65.625 (69.306)	lr 0.02285
Train [23][2350/3239]	Time 0.609 (0.922)	Data Time 0.001 (0.013)	Loss 3.2116 (3.2895)	Entropy 0.90834 (0.91672)	Top-1 acc 50.000 (45.570)	Top-5 acc 73.438 (69.307)	lr 0.02285
Train [23][2360/3239]	Time 0.623 (0.922)	Data Time 0.002 (0.013)	Loss 3.3784 (3.2895)	Entropy 0.90847 (0.91669)	Top-1 acc 42.969 (45.572)	Top-5 acc 64.844 (69.302)	lr 0.02285
Train [23][2370/3239]	Time 0.641 (0.922)	Data Time 0.001 (0.013)	Loss 3.3827 (3.2894)	Entropy 0.90805 (0.91665)	Top-1 acc 44.922 (45.577)	Top-5 acc 66.406 (69.301)	lr 0.02285
Train [23][2380/3239]	Time 0.695 (0.922)	Data Time 0.001 (0.013)	Loss 3.3729 (3.2895)	Entropy 0.90808 (0.91662)	Top-1 acc 47.656 (45.578)	Top-5 acc 67.188 (69.295)	lr 0.02285
Train [23][2390/3239]	Time 0.607 (0.921)	Data Time 0.001 (0.013)	Loss 3.1152 (3.2897)	Entropy 0.90759 (0.91658)	Top-1 acc 48.828 (45.570)	Top-5 acc 71.875 (69.293)	lr 0.02285
Train [23][2400/3239]	Time 0.624 (0.921)	Data Time 0.001 (0.013)	Loss 3.3651 (3.2896)	Entropy 0.90731 (0.91654)	Top-1 acc 41.797 (45.572)	Top-5 acc 67.578 (69.298)	lr 0.02285
Train [23][2410/3239]	Time 0.579 (0.921)	Data Time 0.001 (0.013)	Loss 3.4222 (3.2897)	Entropy 0.90742 (0.91650)	Top-1 acc 45.312 (45.573)	Top-5 acc 66.406 (69.299)	lr 0.02285
Train [23][2420/3239]	Time 0.614 (0.921)	Data Time 0.001 (0.013)	Loss 3.2105 (3.2897)	Entropy 0.90735 (0.91647)	Top-1 acc 48.047 (45.570)	Top-5 acc 71.094 (69.298)	lr 0.02285
Train [23][2430/3239]	Time 0.571 (0.920)	Data Time 0.002 (0.013)	Loss 3.1260 (3.2897)	Entropy 0.90734 (0.91643)	Top-1 acc 48.047 (45.569)	Top-5 acc 73.438 (69.297)	lr 0.02285
Train [23][2440/3239]	Time 0.588 (0.920)	Data Time 0.001 (0.013)	Loss 3.5752 (3.2898)	Entropy 0.90715 (0.91639)	Top-1 acc 37.109 (45.569)	Top-5 acc 64.062 (69.299)	lr 0.02285
Train [23][2450/3239]	Time 0.633 (0.920)	Data Time 0.001 (0.013)	Loss 3.2663 (3.2898)	Entropy 0.90703 (0.91635)	Top-1 acc 43.750 (45.568)	Top-5 acc 69.531 (69.299)	lr 0.02285
Train [23][2460/3239]	Time 0.606 (0.919)	Data Time 0.001 (0.013)	Loss 3.2735 (3.2899)	Entropy 0.90677 (0.91632)	Top-1 acc 45.312 (45.567)	Top-5 acc 66.406 (69.297)	lr 0.02285
Train [23][2470/3239]	Time 0.738 (0.919)	Data Time 0.001 (0.013)	Loss 3.3763 (3.2899)	Entropy 0.90656 (0.91628)	Top-1 acc 44.141 (45.562)	Top-5 acc 66.016 (69.296)	lr 0.02285
Train [23][2480/3239]	Time 0.605 (0.919)	Data Time 0.003 (0.013)	Loss 3.4939 (3.2900)	Entropy 0.90596 (0.91624)	Top-1 acc 42.578 (45.556)	Top-5 acc 64.453 (69.293)	lr 0.02284
Train [23][2490/3239]	Time 0.572 (0.919)	Data Time 0.001 (0.013)	Loss 3.3926 (3.2900)	Entropy 0.90584 (0.91620)	Top-1 acc 42.578 (45.554)	Top-5 acc 67.969 (69.293)	lr 0.02284
Train [23][2500/3239]	Time 0.636 (0.919)	Data Time 0.002 (0.012)	Loss 3.1012 (3.2902)	Entropy 0.90609 (0.91615)	Top-1 acc 50.000 (45.553)	Top-5 acc 71.094 (69.292)	lr 0.02284
Train [23][2510/3239]	Time 0.609 (0.918)	Data Time 0.001 (0.012)	Loss 3.0050 (3.2897)	Entropy 0.90612 (0.91611)	Top-1 acc 51.172 (45.562)	Top-5 acc 77.344 (69.303)	lr 0.02284
Train [23][2520/3239]	Time 0.588 (0.918)	Data Time 0.001 (0.012)	Loss 3.4230 (3.2897)	Entropy 0.90641 (0.91608)	Top-1 acc 40.234 (45.563)	Top-5 acc 67.578 (69.305)	lr 0.02284
Train [23][2530/3239]	Time 0.608 (0.918)	Data Time 0.001 (0.012)	Loss 3.3007 (3.2896)	Entropy 0.90612 (0.91604)	Top-1 acc 42.578 (45.561)	Top-5 acc 73.047 (69.303)	lr 0.02284
Train [23][2540/3239]	Time 0.683 (0.918)	Data Time 0.001 (0.012)	Loss 3.0417 (3.2896)	Entropy 0.90606 (0.91600)	Top-1 acc 51.562 (45.556)	Top-5 acc 73.438 (69.301)	lr 0.02284
Train [23][2550/3239]	Time 0.626 (0.918)	Data Time 0.001 (0.012)	Loss 3.2518 (3.2899)	Entropy 0.90609 (0.91596)	Top-1 acc 41.406 (45.550)	Top-5 acc 73.047 (69.298)	lr 0.02284
Train [23][2560/3239]	Time 0.607 (0.917)	Data Time 0.001 (0.012)	Loss 3.2982 (3.2901)	Entropy 0.90598 (0.91592)	Top-1 acc 43.750 (45.542)	Top-5 acc 69.141 (69.296)	lr 0.02284
Train [23][2570/3239]	Time 0.580 (0.917)	Data Time 0.002 (0.012)	Loss 3.1988 (3.2903)	Entropy 0.90579 (0.91588)	Top-1 acc 49.219 (45.542)	Top-5 acc 70.312 (69.292)	lr 0.02284
Train [23][2580/3239]	Time 0.651 (0.917)	Data Time 0.001 (0.012)	Loss 3.2593 (3.2902)	Entropy 0.90571 (0.91584)	Top-1 acc 50.000 (45.543)	Top-5 acc 67.578 (69.294)	lr 0.02284
Train [23][2590/3239]	Time 0.578 (0.917)	Data Time 0.001 (0.012)	Loss 3.2820 (3.2901)	Entropy 0.90559 (0.91580)	Top-1 acc 46.875 (45.545)	Top-5 acc 70.312 (69.298)	lr 0.02284
Train [23][2600/3239]	Time 0.615 (0.916)	Data Time 0.002 (0.012)	Loss 3.4918 (3.2898)	Entropy 0.90548 (0.91576)	Top-1 acc 39.453 (45.549)	Top-5 acc 65.625 (69.306)	lr 0.02284
Train [23][2610/3239]	Time 0.450 (0.916)	Data Time 0.001 (0.012)	Loss 3.2459 (3.2894)	Entropy 0.90540 (0.91572)	Top-1 acc 48.438 (45.560)	Top-5 acc 69.922 (69.317)	lr 0.02284
Train [23][2620/3239]	Time 0.594 (0.916)	Data Time 0.001 (0.012)	Loss 3.2061 (3.2893)	Entropy 0.90501 (0.91568)	Top-1 acc 49.219 (45.561)	Top-5 acc 69.922 (69.318)	lr 0.02284
Train [23][2630/3239]	Time 0.699 (0.916)	Data Time 0.001 (0.012)	Loss 3.4554 (3.2894)	Entropy 0.90468 (0.91564)	Top-1 acc 46.094 (45.557)	Top-5 acc 66.406 (69.316)	lr 0.02284
Train [23][2640/3239]	Time 0.617 (0.915)	Data Time 0.001 (0.012)	Loss 3.3316 (3.2894)	Entropy 0.90485 (0.91560)	Top-1 acc 44.922 (45.556)	Top-5 acc 67.969 (69.315)	lr 0.02284
Train [23][2650/3239]	Time 0.622 (0.915)	Data Time 0.001 (0.012)	Loss 3.3905 (3.2893)	Entropy 0.90479 (0.91556)	Top-1 acc 41.406 (45.557)	Top-5 acc 67.969 (69.317)	lr 0.02284
Train [23][2660/3239]	Time 0.577 (0.915)	Data Time 0.001 (0.012)	Loss 3.3275 (3.2896)	Entropy 0.90471 (0.91552)	Top-1 acc 43.750 (45.550)	Top-5 acc 69.922 (69.314)	lr 0.02283
Train [23][2670/3239]	Time 0.594 (0.915)	Data Time 0.002 (0.012)	Loss 3.2270 (3.2897)	Entropy 0.90497 (0.91548)	Top-1 acc 49.609 (45.551)	Top-5 acc 71.484 (69.315)	lr 0.02283
Train [23][2680/3239]	Time 0.630 (0.915)	Data Time 0.001 (0.012)	Loss 3.3654 (3.2897)	Entropy 0.90546 (0.91544)	Top-1 acc 40.625 (45.550)	Top-5 acc 66.406 (69.315)	lr 0.02283
Train [23][2690/3239]	Time 0.613 (0.915)	Data Time 0.001 (0.012)	Loss 3.2912 (3.2898)	Entropy 0.90513 (0.91540)	Top-1 acc 42.969 (45.546)	Top-5 acc 69.531 (69.313)	lr 0.02283
Train [23][2700/3239]	Time 0.721 (0.915)	Data Time 0.002 (0.012)	Loss 3.1999 (3.2898)	Entropy 0.90527 (0.91537)	Top-1 acc 46.875 (45.547)	Top-5 acc 70.703 (69.311)	lr 0.02283
Train [23][2710/3239]	Time 0.613 (0.925)	Data Time 0.002 (0.012)	Loss 3.2457 (3.2901)	Entropy 0.90550 (0.91533)	Top-1 acc 50.781 (45.539)	Top-5 acc 68.359 (69.303)	lr 0.02283
Train [23][2720/3239]	Time 0.568 (0.924)	Data Time 0.002 (0.012)	Loss 3.4785 (3.2902)	Entropy 0.90536 (0.91529)	Top-1 acc 41.016 (45.540)	Top-5 acc 67.578 (69.302)	lr 0.02283
Train [23][2730/3239]	Time 0.592 (0.924)	Data Time 0.001 (0.012)	Loss 3.4087 (3.2904)	Entropy 0.90527 (0.91526)	Top-1 acc 44.922 (45.534)	Top-5 acc 67.969 (69.302)	lr 0.02283
Train [23][2740/3239]	Time 0.648 (0.924)	Data Time 0.002 (0.012)	Loss 3.3843 (3.2904)	Entropy 0.90552 (0.91522)	Top-1 acc 45.312 (45.537)	Top-5 acc 65.625 (69.300)	lr 0.02283
Train [23][2750/3239]	Time 0.570 (0.924)	Data Time 0.001 (0.012)	Loss 3.1156 (3.2904)	Entropy 0.90548 (0.91519)	Top-1 acc 49.609 (45.536)	Top-5 acc 73.828 (69.303)	lr 0.02283
Train [23][2760/3239]	Time 0.585 (0.923)	Data Time 0.001 (0.012)	Loss 3.1093 (3.2904)	Entropy 0.90572 (0.91515)	Top-1 acc 50.000 (45.539)	Top-5 acc 71.875 (69.301)	lr 0.02283
Train [23][2770/3239]	Time 0.602 (0.923)	Data Time 0.001 (0.011)	Loss 3.2907 (3.2905)	Entropy 0.90592 (0.91512)	Top-1 acc 44.141 (45.538)	Top-5 acc 70.703 (69.300)	lr 0.02283
Train [23][2780/3239]	Time 0.589 (0.923)	Data Time 0.001 (0.011)	Loss 3.3489 (3.2904)	Entropy 0.90630 (0.91508)	Top-1 acc 44.531 (45.540)	Top-5 acc 67.188 (69.300)	lr 0.02283
Train [23][2790/3239]	Time 0.542 (0.923)	Data Time 0.001 (0.011)	Loss 3.0804 (3.2904)	Entropy 0.90633 (0.91505)	Top-1 acc 51.953 (45.541)	Top-5 acc 71.484 (69.299)	lr 0.02283
Train [23][2800/3239]	Time 0.588 (0.923)	Data Time 0.001 (0.011)	Loss 3.2471 (3.2900)	Entropy 0.90634 (0.91502)	Top-1 acc 46.875 (45.551)	Top-5 acc 69.531 (69.304)	lr 0.02283
Train [23][2810/3239]	Time 0.617 (0.922)	Data Time 0.001 (0.011)	Loss 3.3564 (3.2900)	Entropy 0.90621 (0.91499)	Top-1 acc 44.531 (45.552)	Top-5 acc 69.531 (69.305)	lr 0.02283
Train [23][2820/3239]	Time 0.630 (0.922)	Data Time 0.001 (0.011)	Loss 3.1656 (3.2900)	Entropy 0.90629 (0.91496)	Top-1 acc 46.484 (45.551)	Top-5 acc 75.000 (69.309)	lr 0.02283
Train [23][2830/3239]	Time 0.610 (0.922)	Data Time 0.001 (0.011)	Loss 3.4928 (3.2902)	Entropy 0.90624 (0.91493)	Top-1 acc 41.016 (45.551)	Top-5 acc 65.625 (69.306)	lr 0.02282
Train [23][2840/3239]	Time 0.648 (0.922)	Data Time 0.002 (0.011)	Loss 2.9715 (3.2899)	Entropy 0.90630 (0.91490)	Top-1 acc 52.734 (45.552)	Top-5 acc 78.125 (69.312)	lr 0.02282
Train [23][2850/3239]	Time 0.596 (0.922)	Data Time 0.001 (0.011)	Loss 3.5036 (3.2900)	Entropy 0.90592 (0.91487)	Top-1 acc 41.797 (45.550)	Top-5 acc 65.234 (69.308)	lr 0.02282
Train [23][2860/3239]	Time 0.745 (0.922)	Data Time 0.001 (0.011)	Loss 3.5222 (3.2900)	Entropy 0.90598 (0.91484)	Top-1 acc 41.016 (45.552)	Top-5 acc 63.672 (69.306)	lr 0.02282
Train [23][2870/3239]	Time 0.565 (0.921)	Data Time 0.001 (0.011)	Loss 3.4064 (3.2901)	Entropy 0.90593 (0.91481)	Top-1 acc 44.922 (45.552)	Top-5 acc 69.922 (69.307)	lr 0.02282
Train [23][2880/3239]	Time 0.607 (0.921)	Data Time 0.001 (0.011)	Loss 3.2113 (3.2901)	Entropy 0.90557 (0.91478)	Top-1 acc 47.656 (45.554)	Top-5 acc 70.703 (69.307)	lr 0.02282
Train [23][2890/3239]	Time 0.629 (0.921)	Data Time 0.001 (0.011)	Loss 3.2871 (3.2899)	Entropy 0.90533 (0.91474)	Top-1 acc 44.922 (45.555)	Top-5 acc 70.312 (69.311)	lr 0.02282
Train [23][2900/3239]	Time 0.493 (0.921)	Data Time 0.001 (0.011)	Loss 3.2756 (3.2901)	Entropy 0.90493 (0.91471)	Top-1 acc 47.266 (45.554)	Top-5 acc 69.922 (69.307)	lr 0.02282
Train [23][2910/3239]	Time 0.576 (0.920)	Data Time 0.001 (0.011)	Loss 3.4973 (3.2899)	Entropy 0.90454 (0.91468)	Top-1 acc 39.062 (45.557)	Top-5 acc 67.188 (69.313)	lr 0.02282
Train [23][2920/3239]	Time 0.584 (0.920)	Data Time 0.001 (0.011)	Loss 3.3362 (3.2898)	Entropy 0.90457 (0.91464)	Top-1 acc 45.312 (45.558)	Top-5 acc 66.797 (69.314)	lr 0.02282
Train [23][2930/3239]	Time 0.694 (0.920)	Data Time 0.001 (0.011)	Loss 3.4087 (3.2900)	Entropy 0.90445 (0.91461)	Top-1 acc 41.016 (45.553)	Top-5 acc 64.453 (69.311)	lr 0.02282
Train [23][2940/3239]	Time 0.615 (0.920)	Data Time 0.001 (0.011)	Loss 3.2504 (3.2899)	Entropy 0.90437 (0.91457)	Top-1 acc 44.531 (45.555)	Top-5 acc 71.484 (69.317)	lr 0.02282
Train [23][2950/3239]	Time 0.604 (0.920)	Data Time 0.001 (0.011)	Loss 3.2369 (3.2896)	Entropy 0.90415 (0.91454)	Top-1 acc 48.828 (45.559)	Top-5 acc 68.359 (69.323)	lr 0.02282
Train [23][2960/3239]	Time 0.615 (0.920)	Data Time 0.001 (0.011)	Loss 3.2056 (3.2894)	Entropy 0.90446 (0.91450)	Top-1 acc 50.000 (45.565)	Top-5 acc 69.141 (69.328)	lr 0.02282
Train [23][2970/3239]	Time 0.597 (0.919)	Data Time 0.001 (0.011)	Loss 3.2677 (3.2895)	Entropy 0.90435 (0.91447)	Top-1 acc 43.359 (45.561)	Top-5 acc 67.188 (69.323)	lr 0.02282
Train [23][2980/3239]	Time 0.575 (0.919)	Data Time 0.001 (0.011)	Loss 3.2752 (3.2896)	Entropy 0.90392 (0.91443)	Top-1 acc 48.438 (45.559)	Top-5 acc 67.969 (69.324)	lr 0.02282
Train [23][2990/3239]	Time 0.624 (0.919)	Data Time 0.001 (0.011)	Loss 3.1766 (3.2897)	Entropy 0.90367 (0.91440)	Top-1 acc 51.172 (45.560)	Top-5 acc 72.266 (69.320)	lr 0.02282
Train [23][3000/3239]	Time 0.622 (0.919)	Data Time 0.001 (0.011)	Loss 3.2897 (3.2898)	Entropy 0.90367 (0.91436)	Top-1 acc 47.266 (45.558)	Top-5 acc 73.828 (69.321)	lr 0.02282
Train [23][3010/3239]	Time 0.604 (0.919)	Data Time 0.001 (0.011)	Loss 3.0800 (3.2897)	Entropy 0.90334 (0.91433)	Top-1 acc 48.047 (45.557)	Top-5 acc 72.656 (69.321)	lr 0.02281
Train [23][3020/3239]	Time 0.722 (0.919)	Data Time 0.001 (0.011)	Loss 3.1116 (3.2897)	Entropy 0.90361 (0.91429)	Top-1 acc 45.703 (45.554)	Top-5 acc 76.172 (69.326)	lr 0.02281
Train [23][3030/3239]	Time 0.615 (0.918)	Data Time 0.001 (0.011)	Loss 3.2875 (3.2895)	Entropy 0.90383 (0.91426)	Top-1 acc 47.266 (45.557)	Top-5 acc 69.922 (69.331)	lr 0.02281
Train [23][3040/3239]	Time 0.576 (0.918)	Data Time 0.001 (0.011)	Loss 3.5167 (3.2896)	Entropy 0.90380 (0.91422)	Top-1 acc 46.094 (45.557)	Top-5 acc 66.797 (69.330)	lr 0.02281
Train [23][3050/3239]	Time 0.626 (0.918)	Data Time 0.001 (0.011)	Loss 3.3316 (3.2895)	Entropy 0.90372 (0.91419)	Top-1 acc 47.266 (45.558)	Top-5 acc 70.312 (69.332)	lr 0.02281
Train [23][3060/3239]	Time 0.579 (0.918)	Data Time 0.001 (0.011)	Loss 3.2386 (3.2895)	Entropy 0.90328 (0.91415)	Top-1 acc 46.094 (45.559)	Top-5 acc 71.484 (69.333)	lr 0.02281
Train [23][3070/3239]	Time 0.614 (0.918)	Data Time 0.001 (0.011)	Loss 3.4439 (3.2895)	Entropy 0.90280 (0.91412)	Top-1 acc 41.797 (45.555)	Top-5 acc 65.234 (69.332)	lr 0.02281
Train [23][3080/3239]	Time 0.596 (0.917)	Data Time 0.001 (0.011)	Loss 3.1495 (3.2895)	Entropy 0.90265 (0.91408)	Top-1 acc 45.703 (45.557)	Top-5 acc 72.266 (69.331)	lr 0.02281
Train [23][3090/3239]	Time 0.731 (0.917)	Data Time 0.001 (0.011)	Loss 3.2362 (3.2893)	Entropy 0.90261 (0.91404)	Top-1 acc 41.406 (45.560)	Top-5 acc 73.047 (69.334)	lr 0.02281
Train [23][3100/3239]	Time 0.632 (0.917)	Data Time 0.001 (0.010)	Loss 3.5642 (3.2895)	Entropy 0.90271 (0.91401)	Top-1 acc 39.062 (45.552)	Top-5 acc 64.453 (69.332)	lr 0.02281
Train [23][3110/3239]	Time 0.611 (0.917)	Data Time 0.002 (0.010)	Loss 3.3992 (3.2894)	Entropy 0.90286 (0.91397)	Top-1 acc 40.625 (45.557)	Top-5 acc 68.750 (69.337)	lr 0.02281
Train [23][3120/3239]	Time 0.582 (0.917)	Data Time 0.001 (0.010)	Loss 3.0618 (3.2891)	Entropy 0.90257 (0.91393)	Top-1 acc 50.000 (45.562)	Top-5 acc 74.609 (69.339)	lr 0.02281
Train [23][3130/3239]	Time 0.604 (0.916)	Data Time 0.001 (0.010)	Loss 3.3396 (3.2892)	Entropy 0.90249 (0.91390)	Top-1 acc 42.188 (45.558)	Top-5 acc 68.359 (69.337)	lr 0.02281
Train [23][3140/3239]	Time 0.659 (0.916)	Data Time 0.001 (0.010)	Loss 3.0717 (3.2892)	Entropy 0.90222 (0.91386)	Top-1 acc 49.219 (45.558)	Top-5 acc 70.703 (69.337)	lr 0.02281
Train [23][3150/3239]	Time 0.571 (0.916)	Data Time 0.001 (0.010)	Loss 3.3558 (3.2893)	Entropy 0.90226 (0.91382)	Top-1 acc 44.141 (45.556)	Top-5 acc 66.406 (69.333)	lr 0.02281
Train [23][3160/3239]	Time 0.555 (0.916)	Data Time 0.001 (0.010)	Loss 3.4246 (3.2894)	Entropy 0.90257 (0.91379)	Top-1 acc 42.969 (45.557)	Top-5 acc 66.406 (69.330)	lr 0.02281
Train [23][3170/3239]	Time 0.609 (0.916)	Data Time 0.001 (0.010)	Loss 3.1802 (3.2893)	Entropy 0.90214 (0.91375)	Top-1 acc 45.312 (45.562)	Top-5 acc 74.609 (69.332)	lr 0.02281
Train [23][3180/3239]	Time 0.693 (0.916)	Data Time 0.000 (0.010)	Loss 3.1051 (3.2893)	Entropy 0.90177 (0.91371)	Top-1 acc 50.781 (45.561)	Top-5 acc 76.562 (69.331)	lr 0.02281
Train [23][3190/3239]	Time 0.578 (0.916)	Data Time 0.000 (0.010)	Loss 3.2752 (3.2892)	Entropy 0.90167 (0.91368)	Top-1 acc 44.141 (45.563)	Top-5 acc 68.750 (69.332)	lr 0.02280
Train [23][3200/3239]	Time 0.610 (0.915)	Data Time 0.000 (0.010)	Loss 3.3033 (3.2892)	Entropy 0.90184 (0.91364)	Top-1 acc 46.484 (45.565)	Top-5 acc 70.703 (69.330)	lr 0.02280
Train [23][3210/3239]	Time 0.622 (0.915)	Data Time 0.000 (0.010)	Loss 3.3111 (3.2891)	Entropy 0.90152 (0.91360)	Top-1 acc 45.703 (45.562)	Top-5 acc 68.359 (69.331)	lr 0.02280
Train [23][3220/3239]	Time 0.536 (0.915)	Data Time 0.000 (0.010)	Loss 3.0075 (3.2889)	Entropy 0.90141 (0.91356)	Top-1 acc 51.562 (45.567)	Top-5 acc 72.656 (69.338)	lr 0.02280
Train [23][3230/3239]	Time 0.573 (0.915)	Data Time 0.000 (0.010)	Loss 3.3107 (3.2891)	Entropy 0.90150 (0.91353)	Top-1 acc 44.922 (45.563)	Top-5 acc 74.609 (69.339)	lr 0.02280
Train [23][3239/3239]	Time 1.526 (0.914)	Data Time 0.000 (0.010)	Loss 3.7620 (3.2892)	Entropy 0.90156 (0.91349)	Top-1 acc 38.272 (45.561)	Top-5 acc 62.963 (69.338)	lr 0.02280
==========Valid [23/120]	loss 2.017	top-1 acc 55.154 (55.154)	top-5 acc 78.347	Train top-1 45.561	top-5 69.338	Entropy 0.90156	Latency-None: 0.000ms	Flops: 539.76M
Train [24][0/3239]	Time 27.908 (27.908)	Data Time 26.246 (26.246)	Loss 3.1114 (3.1114)	Entropy 0.90123 (0.90123)	Top-1 acc 51.172 (51.172)	Top-5 acc 71.484 (71.484)	lr 0.02280
Train [24][10/3239]	Time 0.569 (3.381)	Data Time 0.001 (2.390)	Loss 3.3977 (3.2884)	Entropy 0.90091 (0.90106)	Top-1 acc 45.703 (46.058)	Top-5 acc 67.969 (68.288)	lr 0.02280
Train [24][20/3239]	Time 0.558 (2.173)	Data Time 0.001 (1.253)	Loss 3.2522 (3.2843)	Entropy 0.90064 (0.90098)	Top-1 acc 47.266 (46.019)	Top-5 acc 70.703 (69.029)	lr 0.02280
Train [24][30/3239]	Time 0.577 (1.749)	Data Time 0.001 (0.850)	Loss 3.2936 (3.2746)	Entropy 0.90062 (0.90089)	Top-1 acc 46.094 (46.106)	Top-5 acc 71.484 (69.582)	lr 0.02280
Train [24][40/3239]	Time 0.624 (1.540)	Data Time 0.001 (0.643)	Loss 3.6833 (3.2611)	Entropy 0.90055 (0.90083)	Top-1 acc 34.766 (46.208)	Top-5 acc 60.938 (69.846)	lr 0.02280
Train [24][50/3239]	Time 0.601 (1.409)	Data Time 0.001 (0.517)	Loss 3.3372 (3.2616)	Entropy 0.90052 (0.90078)	Top-1 acc 44.141 (46.362)	Top-5 acc 70.312 (69.677)	lr 0.02280
Train [24][60/3239]	Time 0.630 (1.320)	Data Time 0.001 (0.433)	Loss 3.3612 (3.2620)	Entropy 0.90038 (0.90073)	Top-1 acc 45.703 (46.337)	Top-5 acc 66.016 (69.608)	lr 0.02280
Train [24][70/3239]	Time 0.614 (1.257)	Data Time 0.001 (0.372)	Loss 3.2983 (3.2619)	Entropy 0.90045 (0.90068)	Top-1 acc 44.922 (46.319)	Top-5 acc 68.359 (69.768)	lr 0.02280
Train [24][80/3239]	Time 0.687 (1.208)	Data Time 0.002 (0.326)	Loss 3.2686 (3.2587)	Entropy 0.90055 (0.90065)	Top-1 acc 46.484 (46.359)	Top-5 acc 66.406 (69.768)	lr 0.02280
Train [24][90/3239]	Time 0.627 (1.170)	Data Time 0.002 (0.291)	Loss 3.0328 (3.2569)	Entropy 0.90050 (0.90064)	Top-1 acc 52.734 (46.403)	Top-5 acc 74.219 (69.780)	lr 0.02280
Train [24][100/3239]	Time 0.592 (1.138)	Data Time 0.001 (0.262)	Loss 3.3478 (3.2593)	Entropy 0.90059 (0.90063)	Top-1 acc 42.969 (46.260)	Top-5 acc 66.016 (69.732)	lr 0.02280
Train [24][110/3239]	Time 0.570 (1.115)	Data Time 0.001 (0.239)	Loss 3.2192 (3.2575)	Entropy 0.90048 (0.90061)	Top-1 acc 45.703 (46.414)	Top-5 acc 71.875 (69.844)	lr 0.02280
Train [24][120/3239]	Time 0.735 (1.322)	Data Time 0.006 (0.219)	Loss 3.3034 (3.2612)	Entropy 0.90046 (0.90060)	Top-1 acc 47.266 (46.320)	Top-5 acc 67.188 (69.790)	lr 0.02279
Train [24][130/3239]	Time 0.473 (1.289)	Data Time 0.002 (0.203)	Loss 3.1946 (3.2556)	Entropy 0.90069 (0.90060)	Top-1 acc 51.172 (46.386)	Top-5 acc 72.656 (69.976)	lr 0.02279
Train [24][140/3239]	Time 0.619 (1.258)	Data Time 0.002 (0.189)	Loss 3.2399 (3.2579)	Entropy 0.90102 (0.90061)	Top-1 acc 46.094 (46.338)	Top-5 acc 68.359 (69.930)	lr 0.02279
Train [24][150/3239]	Time 0.708 (1.233)	Data Time 0.001 (0.176)	Loss 3.5307 (3.2605)	Entropy 0.90107 (0.90064)	Top-1 acc 39.453 (46.210)	Top-5 acc 64.844 (69.943)	lr 0.02279
Train [24][160/3239]	Time 0.610 (1.211)	Data Time 0.001 (0.166)	Loss 3.2955 (3.2656)	Entropy 0.90102 (0.90067)	Top-1 acc 45.312 (46.079)	Top-5 acc 70.312 (69.900)	lr 0.02279
Train [24][170/3239]	Time 0.581 (1.190)	Data Time 0.001 (0.156)	Loss 3.1837 (3.2672)	Entropy 0.90119 (0.90069)	Top-1 acc 49.219 (46.048)	Top-5 acc 69.922 (69.842)	lr 0.02279
Train [24][180/3239]	Time 0.641 (1.173)	Data Time 0.003 (0.148)	Loss 3.4350 (3.2677)	Entropy 0.90089 (0.90071)	Top-1 acc 44.531 (46.102)	Top-5 acc 61.328 (69.805)	lr 0.02279
Train [24][190/3239]	Time 0.606 (1.157)	Data Time 0.003 (0.140)	Loss 3.1552 (3.2641)	Entropy 0.90092 (0.90073)	Top-1 acc 47.266 (46.198)	Top-5 acc 71.094 (69.914)	lr 0.02279
Train [24][200/3239]	Time 0.586 (1.143)	Data Time 0.001 (0.133)	Loss 3.2405 (3.2613)	Entropy 0.90042 (0.90073)	Top-1 acc 46.875 (46.315)	Top-5 acc 72.266 (69.982)	lr 0.02279
Train [24][210/3239]	Time 0.611 (1.130)	Data Time 0.001 (0.127)	Loss 3.6551 (3.2643)	Entropy 0.90017 (0.90071)	Top-1 acc 38.672 (46.290)	Top-5 acc 60.156 (69.926)	lr 0.02279
Train [24][220/3239]	Time 0.673 (1.119)	Data Time 0.001 (0.121)	Loss 3.0418 (3.2633)	Entropy 0.90063 (0.90069)	Top-1 acc 48.047 (46.286)	Top-5 acc 76.172 (69.940)	lr 0.02279
Train [24][230/3239]	Time 0.597 (1.108)	Data Time 0.001 (0.116)	Loss 3.2891 (3.2629)	Entropy 0.90042 (0.90069)	Top-1 acc 47.656 (46.305)	Top-5 acc 69.531 (69.934)	lr 0.02279
Train [24][240/3239]	Time 0.698 (1.099)	Data Time 0.002 (0.111)	Loss 3.2964 (3.2615)	Entropy 0.89997 (0.90067)	Top-1 acc 48.828 (46.340)	Top-5 acc 69.141 (69.948)	lr 0.02279
Train [24][250/3239]	Time 0.619 (1.090)	Data Time 0.001 (0.107)	Loss 3.1514 (3.2622)	Entropy 0.90017 (0.90064)	Top-1 acc 48.438 (46.309)	Top-5 acc 71.875 (69.979)	lr 0.02279
Train [24][260/3239]	Time 0.618 (1.081)	Data Time 0.001 (0.103)	Loss 3.1335 (3.2596)	Entropy 0.89973 (0.90062)	Top-1 acc 53.125 (46.324)	Top-5 acc 70.703 (70.046)	lr 0.02279
Train [24][270/3239]	Time 0.604 (1.074)	Data Time 0.001 (0.099)	Loss 3.1366 (3.2605)	Entropy 0.89954 (0.90058)	Top-1 acc 51.172 (46.296)	Top-5 acc 75.391 (70.046)	lr 0.02279
Train [24][280/3239]	Time 0.564 (1.066)	Data Time 0.001 (0.096)	Loss 3.4481 (3.2612)	Entropy 0.89911 (0.90054)	Top-1 acc 43.359 (46.299)	Top-5 acc 65.625 (70.032)	lr 0.02279
Train [24][290/3239]	Time 0.607 (1.058)	Data Time 0.001 (0.093)	Loss 3.2976 (3.2596)	Entropy 0.89894 (0.90049)	Top-1 acc 42.188 (46.294)	Top-5 acc 66.016 (70.059)	lr 0.02278
Train [24][300/3239]	Time 0.570 (1.050)	Data Time 0.001 (0.090)	Loss 3.1394 (3.2591)	Entropy 0.89853 (0.90044)	Top-1 acc 48.047 (46.281)	Top-5 acc 69.922 (70.069)	lr 0.02278
Train [24][310/3239]	Time 0.669 (1.043)	Data Time 0.001 (0.087)	Loss 3.2777 (3.2604)	Entropy 0.89854 (0.90038)	Top-1 acc 46.484 (46.260)	Top-5 acc 68.750 (70.056)	lr 0.02278
Train [24][320/3239]	Time 0.625 (1.038)	Data Time 0.001 (0.084)	Loss 3.2263 (3.2601)	Entropy 0.89838 (0.90032)	Top-1 acc 46.094 (46.273)	Top-5 acc 72.656 (70.090)	lr 0.02278
Train [24][330/3239]	Time 0.610 (1.032)	Data Time 0.001 (0.082)	Loss 3.2502 (3.2613)	Entropy 0.89819 (0.90026)	Top-1 acc 45.703 (46.231)	Top-5 acc 68.359 (70.078)	lr 0.02278
Train [24][340/3239]	Time 0.614 (1.027)	Data Time 0.002 (0.079)	Loss 3.2225 (3.2607)	Entropy 0.89795 (0.90019)	Top-1 acc 47.656 (46.247)	Top-5 acc 70.312 (70.082)	lr 0.02278
Train [24][350/3239]	Time 0.646 (1.022)	Data Time 0.001 (0.077)	Loss 3.1881 (3.2628)	Entropy 0.89792 (0.90013)	Top-1 acc 45.312 (46.173)	Top-5 acc 73.047 (70.024)	lr 0.02278
Train [24][360/3239]	Time 0.628 (1.018)	Data Time 0.001 (0.075)	Loss 3.3851 (3.2638)	Entropy 0.89786 (0.90006)	Top-1 acc 42.578 (46.137)	Top-5 acc 66.406 (70.027)	lr 0.02278
Train [24][370/3239]	Time 0.635 (1.014)	Data Time 0.001 (0.073)	Loss 3.3759 (3.2637)	Entropy 0.89776 (0.90000)	Top-1 acc 43.750 (46.138)	Top-5 acc 65.625 (70.044)	lr 0.02278
Train [24][380/3239]	Time 0.587 (1.010)	Data Time 0.001 (0.071)	Loss 3.3252 (3.2623)	Entropy 0.89792 (0.89995)	Top-1 acc 42.188 (46.173)	Top-5 acc 67.188 (70.071)	lr 0.02278
Train [24][390/3239]	Time 0.582 (1.006)	Data Time 0.001 (0.069)	Loss 3.2014 (3.2627)	Entropy 0.89819 (0.89990)	Top-1 acc 50.391 (46.162)	Top-5 acc 69.531 (70.048)	lr 0.02278
Train [24][400/3239]	Time 0.723 (1.003)	Data Time 0.001 (0.068)	Loss 3.1587 (3.2625)	Entropy 0.89832 (0.89986)	Top-1 acc 49.609 (46.155)	Top-5 acc 69.531 (70.050)	lr 0.02278
Train [24][410/3239]	Time 0.652 (1.000)	Data Time 0.001 (0.066)	Loss 3.2553 (3.2618)	Entropy 0.89838 (0.89982)	Top-1 acc 48.828 (46.196)	Top-5 acc 71.484 (70.043)	lr 0.02278
Train [24][420/3239]	Time 0.612 (0.996)	Data Time 0.001 (0.065)	Loss 3.2045 (3.2623)	Entropy 0.89859 (0.89979)	Top-1 acc 49.609 (46.178)	Top-5 acc 68.750 (70.031)	lr 0.02278
Train [24][430/3239]	Time 0.605 (0.993)	Data Time 0.001 (0.063)	Loss 3.2942 (3.2627)	Entropy 0.89885 (0.89976)	Top-1 acc 41.406 (46.168)	Top-5 acc 69.141 (70.035)	lr 0.02278
Train [24][440/3239]	Time 0.603 (0.990)	Data Time 0.001 (0.062)	Loss 3.4260 (3.2615)	Entropy 0.89884 (0.89974)	Top-1 acc 41.797 (46.188)	Top-5 acc 68.750 (70.057)	lr 0.02278
Train [24][450/3239]	Time 0.568 (0.987)	Data Time 0.001 (0.060)	Loss 3.5341 (3.2611)	Entropy 0.89894 (0.89973)	Top-1 acc 40.625 (46.197)	Top-5 acc 66.797 (70.067)	lr 0.02278
Train [24][460/3239]	Time 0.584 (0.984)	Data Time 0.001 (0.059)	Loss 3.5315 (3.2604)	Entropy 0.89876 (0.89971)	Top-1 acc 40.625 (46.228)	Top-5 acc 64.062 (70.079)	lr 0.02278
Train [24][470/3239]	Time 0.701 (0.980)	Data Time 0.001 (0.058)	Loss 3.2454 (3.2614)	Entropy 0.89927 (0.89969)	Top-1 acc 48.047 (46.204)	Top-5 acc 69.531 (70.053)	lr 0.02277
Train [24][480/3239]	Time 0.546 (0.977)	Data Time 0.001 (0.057)	Loss 3.0974 (3.2626)	Entropy 0.89924 (0.89968)	Top-1 acc 50.000 (46.194)	Top-5 acc 70.312 (70.031)	lr 0.02277
Train [24][490/3239]	Time 0.577 (0.975)	Data Time 0.001 (0.056)	Loss 3.3465 (3.2634)	Entropy 0.89960 (0.89968)	Top-1 acc 44.141 (46.196)	Top-5 acc 69.141 (70.001)	lr 0.02277
Train [24][500/3239]	Time 0.597 (0.972)	Data Time 0.001 (0.055)	Loss 3.3992 (3.2629)	Entropy 0.89893 (0.89967)	Top-1 acc 41.406 (46.216)	Top-5 acc 67.969 (70.012)	lr 0.02277
Train [24][510/3239]	Time 0.618 (0.970)	Data Time 0.001 (0.054)	Loss 3.0176 (3.2607)	Entropy 0.89914 (0.89966)	Top-1 acc 50.781 (46.283)	Top-5 acc 75.391 (70.056)	lr 0.02277
Train [24][520/3239]	Time 0.604 (0.968)	Data Time 0.001 (0.053)	Loss 3.2025 (3.2605)	Entropy 0.89922 (0.89965)	Top-1 acc 50.391 (46.290)	Top-5 acc 69.141 (70.052)	lr 0.02277
Train [24][530/3239]	Time 0.629 (0.966)	Data Time 0.001 (0.052)	Loss 3.2089 (3.2601)	Entropy 0.89911 (0.89964)	Top-1 acc 43.359 (46.307)	Top-5 acc 72.266 (70.052)	lr 0.02277
Train [24][540/3239]	Time 0.610 (0.964)	Data Time 0.001 (0.051)	Loss 3.0859 (3.2596)	Entropy 0.89927 (0.89963)	Top-1 acc 50.781 (46.300)	Top-5 acc 72.656 (70.045)	lr 0.02277
Train [24][550/3239]	Time 0.670 (0.963)	Data Time 0.001 (0.050)	Loss 3.3147 (3.2600)	Entropy 0.89903 (0.89962)	Top-1 acc 46.094 (46.285)	Top-5 acc 73.438 (70.041)	lr 0.02277
Train [24][560/3239]	Time 0.590 (0.961)	Data Time 0.001 (0.049)	Loss 3.2365 (3.2606)	Entropy 0.89918 (0.89961)	Top-1 acc 48.047 (46.285)	Top-5 acc 69.141 (70.007)	lr 0.02277
Train [24][570/3239]	Time 0.623 (0.959)	Data Time 0.002 (0.048)	Loss 3.2132 (3.2606)	Entropy 0.89921 (0.89961)	Top-1 acc 45.312 (46.297)	Top-5 acc 69.531 (69.998)	lr 0.02277
Train [24][580/3239]	Time 0.621 (0.957)	Data Time 0.001 (0.047)	Loss 3.2475 (3.2602)	Entropy 0.89935 (0.89960)	Top-1 acc 48.438 (46.316)	Top-5 acc 73.828 (70.009)	lr 0.02277
Train [24][590/3239]	Time 0.594 (0.955)	Data Time 0.026 (0.047)	Loss 3.3341 (3.2603)	Entropy 0.89935 (0.89960)	Top-1 acc 47.266 (46.315)	Top-5 acc 67.969 (70.003)	lr 0.02277
Train [24][600/3239]	Time 0.584 (0.953)	Data Time 0.001 (0.046)	Loss 3.1762 (3.2604)	Entropy 0.89924 (0.89959)	Top-1 acc 49.219 (46.306)	Top-5 acc 68.359 (69.988)	lr 0.02277
Train [24][610/3239]	Time 0.597 (0.952)	Data Time 0.001 (0.045)	Loss 3.2219 (3.2600)	Entropy 0.89879 (0.89959)	Top-1 acc 47.656 (46.320)	Top-5 acc 72.266 (69.998)	lr 0.02277
Train [24][620/3239]	Time 0.575 (0.950)	Data Time 0.001 (0.044)	Loss 3.3863 (3.2587)	Entropy 0.89809 (0.89957)	Top-1 acc 46.094 (46.352)	Top-5 acc 67.969 (70.030)	lr 0.02277
Train [24][630/3239]	Time 0.717 (0.949)	Data Time 0.002 (0.044)	Loss 3.3983 (3.2591)	Entropy 0.89824 (0.89955)	Top-1 acc 44.141 (46.335)	Top-5 acc 66.406 (70.005)	lr 0.02277
Train [24][640/3239]	Time 0.603 (0.947)	Data Time 0.001 (0.043)	Loss 3.3899 (3.2592)	Entropy 0.89824 (0.89953)	Top-1 acc 41.797 (46.325)	Top-5 acc 67.969 (70.004)	lr 0.02276
Train [24][650/3239]	Time 0.603 (0.945)	Data Time 0.001 (0.042)	Loss 3.1963 (3.2585)	Entropy 0.89823 (0.89951)	Top-1 acc 47.266 (46.330)	Top-5 acc 70.312 (70.002)	lr 0.02276
Train [24][660/3239]	Time 0.619 (0.943)	Data Time 0.001 (0.042)	Loss 3.1491 (3.2590)	Entropy 0.89806 (0.89949)	Top-1 acc 48.438 (46.301)	Top-5 acc 73.047 (69.977)	lr 0.02276
Train [24][670/3239]	Time 0.616 (0.942)	Data Time 0.001 (0.041)	Loss 3.2280 (3.2593)	Entropy 0.89806 (0.89947)	Top-1 acc 49.219 (46.302)	Top-5 acc 68.359 (69.961)	lr 0.02276
Train [24][680/3239]	Time 0.628 (0.941)	Data Time 0.001 (0.041)	Loss 3.0486 (3.2589)	Entropy 0.89798 (0.89944)	Top-1 acc 52.734 (46.323)	Top-5 acc 72.266 (69.958)	lr 0.02276
Train [24][690/3239]	Time 0.670 (0.939)	Data Time 0.001 (0.040)	Loss 3.0886 (3.2591)	Entropy 0.89782 (0.89942)	Top-1 acc 50.391 (46.330)	Top-5 acc 70.703 (69.958)	lr 0.02276
Train [24][700/3239]	Time 0.698 (0.938)	Data Time 0.001 (0.040)	Loss 3.2125 (3.2591)	Entropy 0.89809 (0.89940)	Top-1 acc 45.312 (46.326)	Top-5 acc 72.266 (69.952)	lr 0.02276
Train [24][710/3239]	Time 0.613 (0.937)	Data Time 0.001 (0.039)	Loss 3.2308 (3.2592)	Entropy 0.89817 (0.89938)	Top-1 acc 46.484 (46.314)	Top-5 acc 70.312 (69.938)	lr 0.02276
Train [24][720/3239]	Time 0.565 (0.936)	Data Time 0.001 (0.039)	Loss 3.3383 (3.2589)	Entropy 0.89741 (0.89936)	Top-1 acc 41.016 (46.319)	Top-5 acc 66.016 (69.940)	lr 0.02276
Train [24][730/3239]	Time 0.596 (0.935)	Data Time 0.001 (0.038)	Loss 3.3576 (3.2591)	Entropy 0.89709 (0.89933)	Top-1 acc 46.094 (46.304)	Top-5 acc 66.797 (69.940)	lr 0.02276
Train [24][740/3239]	Time 0.572 (0.934)	Data Time 0.002 (0.038)	Loss 3.2268 (3.2596)	Entropy 0.89702 (0.89930)	Top-1 acc 43.750 (46.290)	Top-5 acc 71.094 (69.924)	lr 0.02276
Train [24][750/3239]	Time 0.603 (0.933)	Data Time 0.001 (0.037)	Loss 2.9168 (3.2592)	Entropy 0.89718 (0.89927)	Top-1 acc 53.125 (46.297)	Top-5 acc 75.781 (69.937)	lr 0.02276
Train [24][760/3239]	Time 0.605 (0.932)	Data Time 0.001 (0.037)	Loss 3.3590 (3.2598)	Entropy 0.89720 (0.89924)	Top-1 acc 45.312 (46.289)	Top-5 acc 67.188 (69.921)	lr 0.02276
Train [24][770/3239]	Time 0.662 (0.931)	Data Time 0.001 (0.036)	Loss 3.1561 (3.2592)	Entropy 0.89741 (0.89922)	Top-1 acc 47.266 (46.296)	Top-5 acc 72.266 (69.923)	lr 0.02276
Train [24][780/3239]	Time 0.563 (0.960)	Data Time 0.002 (0.036)	Loss 3.5477 (3.2599)	Entropy 0.89742 (0.89919)	Top-1 acc 41.797 (46.283)	Top-5 acc 62.109 (69.900)	lr 0.02276
Train [24][790/3239]	Time 0.715 (0.958)	Data Time 0.001 (0.035)	Loss 3.3804 (3.2593)	Entropy 0.89711 (0.89917)	Top-1 acc 44.141 (46.285)	Top-5 acc 66.016 (69.920)	lr 0.02276
Train [24][800/3239]	Time 0.599 (0.957)	Data Time 0.001 (0.035)	Loss 3.3068 (3.2593)	Entropy 0.89668 (0.89914)	Top-1 acc 46.094 (46.278)	Top-5 acc 70.312 (69.927)	lr 0.02276
Train [24][810/3239]	Time 0.613 (0.956)	Data Time 0.001 (0.035)	Loss 3.2725 (3.2597)	Entropy 0.89618 (0.89911)	Top-1 acc 44.922 (46.264)	Top-5 acc 67.969 (69.919)	lr 0.02276
Train [24][820/3239]	Time 0.587 (0.955)	Data Time 0.002 (0.034)	Loss 3.4547 (3.2599)	Entropy 0.89655 (0.89907)	Top-1 acc 38.672 (46.266)	Top-5 acc 65.234 (69.921)	lr 0.02275
Train [24][830/3239]	Time 0.636 (0.954)	Data Time 0.001 (0.034)	Loss 2.9824 (3.2598)	Entropy 0.89614 (0.89904)	Top-1 acc 51.953 (46.273)	Top-5 acc 75.391 (69.934)	lr 0.02275
Train [24][840/3239]	Time 0.643 (0.953)	Data Time 0.001 (0.033)	Loss 3.4801 (3.2602)	Entropy 0.89585 (0.89900)	Top-1 acc 43.359 (46.282)	Top-5 acc 64.062 (69.923)	lr 0.02275
Train [24][850/3239]	Time 0.602 (0.951)	Data Time 0.001 (0.033)	Loss 3.4258 (3.2605)	Entropy 0.89570 (0.89897)	Top-1 acc 45.703 (46.274)	Top-5 acc 68.359 (69.919)	lr 0.02275
Train [24][860/3239]	Time 0.730 (0.951)	Data Time 0.001 (0.033)	Loss 3.2133 (3.2600)	Entropy 0.89553 (0.89893)	Top-1 acc 46.094 (46.279)	Top-5 acc 70.703 (69.932)	lr 0.02275
Train [24][870/3239]	Time 0.616 (0.950)	Data Time 0.001 (0.032)	Loss 3.4356 (3.2600)	Entropy 0.89557 (0.89889)	Top-1 acc 42.578 (46.289)	Top-5 acc 66.406 (69.937)	lr 0.02275
Train [24][880/3239]	Time 0.598 (0.948)	Data Time 0.002 (0.032)	Loss 3.2220 (3.2596)	Entropy 0.89544 (0.89885)	Top-1 acc 47.266 (46.293)	Top-5 acc 72.266 (69.937)	lr 0.02275
Train [24][890/3239]	Time 0.658 (0.948)	Data Time 0.001 (0.032)	Loss 3.2715 (3.2596)	Entropy 0.89532 (0.89881)	Top-1 acc 47.266 (46.288)	Top-5 acc 70.312 (69.940)	lr 0.02275
Train [24][900/3239]	Time 0.601 (0.946)	Data Time 0.001 (0.031)	Loss 3.4714 (3.2593)	Entropy 0.89543 (0.89878)	Top-1 acc 42.969 (46.283)	Top-5 acc 64.062 (69.931)	lr 0.02275
Train [24][910/3239]	Time 0.615 (0.946)	Data Time 0.005 (0.031)	Loss 3.2876 (3.2588)	Entropy 0.89537 (0.89874)	Top-1 acc 43.750 (46.303)	Top-5 acc 68.359 (69.941)	lr 0.02275
Train [24][920/3239]	Time 0.617 (0.945)	Data Time 0.001 (0.031)	Loss 3.1579 (3.2587)	Entropy 0.89550 (0.89870)	Top-1 acc 46.875 (46.311)	Top-5 acc 73.438 (69.941)	lr 0.02275
Train [24][930/3239]	Time 0.654 (0.944)	Data Time 0.001 (0.030)	Loss 3.4948 (3.2581)	Entropy 0.89539 (0.89867)	Top-1 acc 40.234 (46.327)	Top-5 acc 64.062 (69.952)	lr 0.02275
Train [24][940/3239]	Time 0.645 (0.943)	Data Time 0.001 (0.030)	Loss 3.2136 (3.2581)	Entropy 0.89527 (0.89863)	Top-1 acc 50.391 (46.321)	Top-5 acc 70.703 (69.951)	lr 0.02275
Train [24][950/3239]	Time 0.638 (0.942)	Data Time 0.001 (0.030)	Loss 3.0577 (3.2581)	Entropy 0.89510 (0.89860)	Top-1 acc 52.344 (46.323)	Top-5 acc 75.000 (69.946)	lr 0.02275
Train [24][960/3239]	Time 0.571 (0.941)	Data Time 0.001 (0.029)	Loss 3.3837 (3.2584)	Entropy 0.89525 (0.89856)	Top-1 acc 45.703 (46.321)	Top-5 acc 65.625 (69.941)	lr 0.02275
Train [24][970/3239]	Time 0.601 (0.939)	Data Time 0.001 (0.029)	Loss 3.3051 (3.2594)	Entropy 0.89505 (0.89853)	Top-1 acc 43.750 (46.298)	Top-5 acc 69.141 (69.931)	lr 0.02275
Train [24][980/3239]	Time 0.597 (0.938)	Data Time 0.001 (0.029)	Loss 3.2847 (3.2595)	Entropy 0.89494 (0.89849)	Top-1 acc 47.656 (46.304)	Top-5 acc 67.188 (69.925)	lr 0.02275
Train [24][990/3239]	Time 0.598 (0.938)	Data Time 0.001 (0.029)	Loss 3.2815 (3.2595)	Entropy 0.89495 (0.89845)	Top-1 acc 48.047 (46.307)	Top-5 acc 68.750 (69.935)	lr 0.02274
Train [24][1000/3239]	Time 0.592 (0.937)	Data Time 0.001 (0.028)	Loss 3.0646 (3.2597)	Entropy 0.89407 (0.89841)	Top-1 acc 51.172 (46.301)	Top-5 acc 73.047 (69.935)	lr 0.02274
Train [24][1010/3239]	Time 0.617 (0.936)	Data Time 0.001 (0.028)	Loss 3.1242 (3.2595)	Entropy 0.89374 (0.89837)	Top-1 acc 46.875 (46.296)	Top-5 acc 73.438 (69.930)	lr 0.02274
Train [24][1020/3239]	Time 0.637 (0.935)	Data Time 0.001 (0.028)	Loss 3.1838 (3.2589)	Entropy 0.89337 (0.89832)	Top-1 acc 46.094 (46.296)	Top-5 acc 73.438 (69.948)	lr 0.02274
Train [24][1030/3239]	Time 0.618 (0.935)	Data Time 0.002 (0.028)	Loss 3.1749 (3.2587)	Entropy 0.89347 (0.89828)	Top-1 acc 47.656 (46.292)	Top-5 acc 71.094 (69.952)	lr 0.02274
Train [24][1040/3239]	Time 0.580 (0.934)	Data Time 0.001 (0.027)	Loss 3.4403 (3.2590)	Entropy 0.89399 (0.89823)	Top-1 acc 41.797 (46.292)	Top-5 acc 64.062 (69.945)	lr 0.02274
Train [24][1050/3239]	Time 0.618 (0.933)	Data Time 0.002 (0.027)	Loss 3.2177 (3.2597)	Entropy 0.89382 (0.89819)	Top-1 acc 48.047 (46.283)	Top-5 acc 69.922 (69.939)	lr 0.02274
Train [24][1060/3239]	Time 0.619 (0.933)	Data Time 0.001 (0.027)	Loss 3.2669 (3.2599)	Entropy 0.89414 (0.89815)	Top-1 acc 51.562 (46.287)	Top-5 acc 69.531 (69.934)	lr 0.02274
Train [24][1070/3239]	Time 0.551 (0.932)	Data Time 0.001 (0.027)	Loss 3.2627 (3.2595)	Entropy 0.89464 (0.89812)	Top-1 acc 46.484 (46.291)	Top-5 acc 69.531 (69.946)	lr 0.02274
Train [24][1080/3239]	Time 0.669 (0.932)	Data Time 0.002 (0.026)	Loss 3.0770 (3.2598)	Entropy 0.89449 (0.89808)	Top-1 acc 46.094 (46.274)	Top-5 acc 74.609 (69.938)	lr 0.02274
Train [24][1090/3239]	Time 0.689 (0.931)	Data Time 0.001 (0.026)	Loss 3.4191 (3.2598)	Entropy 0.89452 (0.89805)	Top-1 acc 40.234 (46.281)	Top-5 acc 64.453 (69.943)	lr 0.02274
Train [24][1100/3239]	Time 0.644 (0.931)	Data Time 0.001 (0.026)	Loss 3.1431 (3.2603)	Entropy 0.89481 (0.89802)	Top-1 acc 48.828 (46.263)	Top-5 acc 70.703 (69.925)	lr 0.02274
Train [24][1110/3239]	Time 0.547 (0.930)	Data Time 0.001 (0.026)	Loss 3.1073 (3.2602)	Entropy 0.89494 (0.89799)	Top-1 acc 50.781 (46.266)	Top-5 acc 73.047 (69.928)	lr 0.02274
Train [24][1120/3239]	Time 0.609 (0.929)	Data Time 0.001 (0.026)	Loss 3.1796 (3.2599)	Entropy 0.89478 (0.89796)	Top-1 acc 48.828 (46.267)	Top-5 acc 71.484 (69.940)	lr 0.02274
Train [24][1130/3239]	Time 0.612 (0.928)	Data Time 0.001 (0.025)	Loss 3.1578 (3.2599)	Entropy 0.89483 (0.89794)	Top-1 acc 49.609 (46.270)	Top-5 acc 70.703 (69.934)	lr 0.02274
Train [24][1140/3239]	Time 0.606 (0.927)	Data Time 0.001 (0.025)	Loss 3.3477 (3.2603)	Entropy 0.89479 (0.89791)	Top-1 acc 40.234 (46.265)	Top-5 acc 67.578 (69.927)	lr 0.02274
Train [24][1150/3239]	Time 0.586 (0.927)	Data Time 0.001 (0.025)	Loss 3.1735 (3.2599)	Entropy 0.89504 (0.89788)	Top-1 acc 46.875 (46.274)	Top-5 acc 73.047 (69.935)	lr 0.02274
Train [24][1160/3239]	Time 0.645 (0.926)	Data Time 0.002 (0.025)	Loss 3.2908 (3.2603)	Entropy 0.89523 (0.89786)	Top-1 acc 43.359 (46.270)	Top-5 acc 68.750 (69.923)	lr 0.02273
Train [24][1170/3239]	Time 0.546 (0.926)	Data Time 0.001 (0.025)	Loss 3.2881 (3.2606)	Entropy 0.89496 (0.89784)	Top-1 acc 47.266 (46.263)	Top-5 acc 67.578 (69.921)	lr 0.02273
Train [24][1180/3239]	Time 0.681 (0.925)	Data Time 0.001 (0.024)	Loss 3.2002 (3.2605)	Entropy 0.89484 (0.89781)	Top-1 acc 46.875 (46.260)	Top-5 acc 73.047 (69.924)	lr 0.02273
Train [24][1190/3239]	Time 0.600 (0.925)	Data Time 0.001 (0.024)	Loss 3.1900 (3.2603)	Entropy 0.89498 (0.89779)	Top-1 acc 50.000 (46.261)	Top-5 acc 71.875 (69.932)	lr 0.02273
Train [24][1200/3239]	Time 0.541 (0.924)	Data Time 0.001 (0.024)	Loss 3.4465 (3.2607)	Entropy 0.89443 (0.89776)	Top-1 acc 40.625 (46.250)	Top-5 acc 65.234 (69.921)	lr 0.02273
Train [24][1210/3239]	Time 0.595 (0.924)	Data Time 0.001 (0.024)	Loss 3.2624 (3.2605)	Entropy 0.89465 (0.89773)	Top-1 acc 48.438 (46.260)	Top-5 acc 69.922 (69.925)	lr 0.02273
Train [24][1220/3239]	Time 0.611 (0.923)	Data Time 0.002 (0.024)	Loss 3.4175 (3.2605)	Entropy 0.89454 (0.89771)	Top-1 acc 44.141 (46.259)	Top-5 acc 67.578 (69.933)	lr 0.02273
Train [24][1230/3239]	Time 0.568 (0.923)	Data Time 0.001 (0.023)	Loss 3.3809 (3.2606)	Entropy 0.89437 (0.89768)	Top-1 acc 43.750 (46.251)	Top-5 acc 68.750 (69.934)	lr 0.02273
Train [24][1240/3239]	Time 0.595 (0.922)	Data Time 0.001 (0.023)	Loss 3.3591 (3.2612)	Entropy 0.89421 (0.89765)	Top-1 acc 45.312 (46.242)	Top-5 acc 69.141 (69.922)	lr 0.02273
Train [24][1250/3239]	Time 0.686 (0.922)	Data Time 0.001 (0.023)	Loss 3.1615 (3.2612)	Entropy 0.89406 (0.89763)	Top-1 acc 47.266 (46.242)	Top-5 acc 71.484 (69.923)	lr 0.02273
Train [24][1260/3239]	Time 0.604 (0.921)	Data Time 0.001 (0.023)	Loss 3.2788 (3.2609)	Entropy 0.89392 (0.89760)	Top-1 acc 44.531 (46.239)	Top-5 acc 70.312 (69.934)	lr 0.02273
Train [24][1270/3239]	Time 0.617 (0.921)	Data Time 0.001 (0.023)	Loss 3.3922 (3.2613)	Entropy 0.89369 (0.89757)	Top-1 acc 41.406 (46.224)	Top-5 acc 66.406 (69.925)	lr 0.02273
Train [24][1280/3239]	Time 0.617 (0.920)	Data Time 0.001 (0.023)	Loss 3.1923 (3.2612)	Entropy 0.89419 (0.89754)	Top-1 acc 50.000 (46.231)	Top-5 acc 70.312 (69.929)	lr 0.02273
Train [24][1290/3239]	Time 0.608 (0.919)	Data Time 0.001 (0.022)	Loss 3.3932 (3.2614)	Entropy 0.89436 (0.89751)	Top-1 acc 40.234 (46.230)	Top-5 acc 66.016 (69.930)	lr 0.02273
Train [24][1300/3239]	Time 0.597 (0.919)	Data Time 0.001 (0.022)	Loss 3.1385 (3.2617)	Entropy 0.89396 (0.89749)	Top-1 acc 51.172 (46.227)	Top-5 acc 73.828 (69.927)	lr 0.02273
Train [24][1310/3239]	Time 0.573 (0.918)	Data Time 0.001 (0.022)	Loss 3.2418 (3.2619)	Entropy 0.89352 (0.89746)	Top-1 acc 48.047 (46.225)	Top-5 acc 69.922 (69.922)	lr 0.02273
Train [24][1320/3239]	Time 0.600 (0.918)	Data Time 0.001 (0.022)	Loss 3.1926 (3.2615)	Entropy 0.89387 (0.89743)	Top-1 acc 49.219 (46.227)	Top-5 acc 70.312 (69.926)	lr 0.02273
Train [24][1330/3239]	Time 0.600 (0.917)	Data Time 0.001 (0.022)	Loss 3.1857 (3.2612)	Entropy 0.89319 (0.89740)	Top-1 acc 49.609 (46.236)	Top-5 acc 74.609 (69.934)	lr 0.02272
Train [24][1340/3239]	Time 0.694 (0.917)	Data Time 0.001 (0.022)	Loss 3.1831 (3.2610)	Entropy 0.89305 (0.89737)	Top-1 acc 49.219 (46.240)	Top-5 acc 70.703 (69.934)	lr 0.02272
Train [24][1350/3239]	Time 0.557 (0.916)	Data Time 0.001 (0.022)	Loss 3.2954 (3.2614)	Entropy 0.89317 (0.89734)	Top-1 acc 46.484 (46.228)	Top-5 acc 69.141 (69.931)	lr 0.02272
Train [24][1360/3239]	Time 0.605 (0.916)	Data Time 0.001 (0.021)	Loss 3.1501 (3.2616)	Entropy 0.89299 (0.89731)	Top-1 acc 47.266 (46.227)	Top-5 acc 71.094 (69.924)	lr 0.02272
Train [24][1370/3239]	Time 0.601 (0.915)	Data Time 0.001 (0.021)	Loss 3.1733 (3.2620)	Entropy 0.89276 (0.89728)	Top-1 acc 48.047 (46.220)	Top-5 acc 73.828 (69.918)	lr 0.02272
Train [24][1380/3239]	Time 0.591 (0.915)	Data Time 0.001 (0.021)	Loss 3.2949 (3.2619)	Entropy 0.89281 (0.89724)	Top-1 acc 41.406 (46.222)	Top-5 acc 65.625 (69.911)	lr 0.02272
Train [24][1390/3239]	Time 0.620 (0.915)	Data Time 0.001 (0.021)	Loss 3.3757 (3.2620)	Entropy 0.89267 (0.89721)	Top-1 acc 44.531 (46.222)	Top-5 acc 70.312 (69.911)	lr 0.02272
Train [24][1400/3239]	Time 0.588 (0.914)	Data Time 0.001 (0.021)	Loss 3.4064 (3.2620)	Entropy 0.89254 (0.89718)	Top-1 acc 44.141 (46.216)	Top-5 acc 69.531 (69.907)	lr 0.02272
Train [24][1410/3239]	Time 0.689 (0.914)	Data Time 0.001 (0.021)	Loss 3.2712 (3.2620)	Entropy 0.89269 (0.89715)	Top-1 acc 46.094 (46.224)	Top-5 acc 70.703 (69.909)	lr 0.02272
Train [24][1420/3239]	Time 0.540 (0.914)	Data Time 0.001 (0.021)	Loss 3.2229 (3.2619)	Entropy 0.89211 (0.89711)	Top-1 acc 44.922 (46.232)	Top-5 acc 70.703 (69.911)	lr 0.02272
Train [24][1430/3239]	Time 0.703 (0.932)	Data Time 0.004 (0.020)	Loss 3.4149 (3.2620)	Entropy 0.89207 (0.89708)	Top-1 acc 41.797 (46.226)	Top-5 acc 68.359 (69.910)	lr 0.02272
Train [24][1440/3239]	Time 0.611 (0.932)	Data Time 0.002 (0.020)	Loss 3.0291 (3.2615)	Entropy 0.89191 (0.89704)	Top-1 acc 50.781 (46.242)	Top-5 acc 72.656 (69.922)	lr 0.02272
Train [24][1450/3239]	Time 0.614 (0.931)	Data Time 0.002 (0.020)	Loss 3.1296 (3.2613)	Entropy 0.89223 (0.89701)	Top-1 acc 49.609 (46.243)	Top-5 acc 70.703 (69.927)	lr 0.02272
Train [24][1460/3239]	Time 0.638 (0.931)	Data Time 0.001 (0.020)	Loss 3.4633 (3.2612)	Entropy 0.89215 (0.89698)	Top-1 acc 39.062 (46.240)	Top-5 acc 65.234 (69.928)	lr 0.02272
Train [24][1470/3239]	Time 0.579 (0.931)	Data Time 0.001 (0.020)	Loss 3.3359 (3.2616)	Entropy 0.89242 (0.89694)	Top-1 acc 45.703 (46.236)	Top-5 acc 66.797 (69.920)	lr 0.02272
Train [24][1480/3239]	Time 0.581 (0.930)	Data Time 0.001 (0.020)	Loss 3.1060 (3.2614)	Entropy 0.89226 (0.89691)	Top-1 acc 49.219 (46.242)	Top-5 acc 75.000 (69.925)	lr 0.02272
Train [24][1490/3239]	Time 0.573 (0.930)	Data Time 0.002 (0.020)	Loss 3.6452 (3.2616)	Entropy 0.89251 (0.89688)	Top-1 acc 36.719 (46.238)	Top-5 acc 62.109 (69.914)	lr 0.02272
Train [24][1500/3239]	Time 0.596 (0.929)	Data Time 0.001 (0.020)	Loss 3.2093 (3.2617)	Entropy 0.89227 (0.89685)	Top-1 acc 43.359 (46.231)	Top-5 acc 69.922 (69.914)	lr 0.02272
Train [24][1510/3239]	Time 0.598 (0.929)	Data Time 0.001 (0.019)	Loss 3.2002 (3.2617)	Entropy 0.89231 (0.89682)	Top-1 acc 46.094 (46.227)	Top-5 acc 71.875 (69.915)	lr 0.02271
Train [24][1520/3239]	Time 0.588 (0.928)	Data Time 0.001 (0.019)	Loss 2.9425 (3.2612)	Entropy 0.89249 (0.89679)	Top-1 acc 52.734 (46.231)	Top-5 acc 79.297 (69.924)	lr 0.02271
Train [24][1530/3239]	Time 0.614 (0.928)	Data Time 0.001 (0.019)	Loss 3.1953 (3.2609)	Entropy 0.89252 (0.89676)	Top-1 acc 49.219 (46.233)	Top-5 acc 70.312 (69.935)	lr 0.02271
Train [24][1540/3239]	Time 0.556 (0.927)	Data Time 0.001 (0.019)	Loss 3.3217 (3.2610)	Entropy 0.89284 (0.89674)	Top-1 acc 42.969 (46.231)	Top-5 acc 67.969 (69.931)	lr 0.02271
Train [24][1550/3239]	Time 0.603 (0.927)	Data Time 0.001 (0.019)	Loss 3.1496 (3.2611)	Entropy 0.89274 (0.89671)	Top-1 acc 51.562 (46.232)	Top-5 acc 70.312 (69.926)	lr 0.02271
Train [24][1560/3239]	Time 0.613 (0.926)	Data Time 0.001 (0.019)	Loss 3.4171 (3.2610)	Entropy 0.89286 (0.89669)	Top-1 acc 40.234 (46.233)	Top-5 acc 69.922 (69.926)	lr 0.02271
Train [24][1570/3239]	Time 0.732 (0.926)	Data Time 0.001 (0.019)	Loss 3.3217 (3.2611)	Entropy 0.89280 (0.89666)	Top-1 acc 48.047 (46.231)	Top-5 acc 65.234 (69.924)	lr 0.02271
Train [24][1580/3239]	Time 0.652 (0.926)	Data Time 0.002 (0.019)	Loss 3.4408 (3.2615)	Entropy 0.89245 (0.89663)	Top-1 acc 45.312 (46.226)	Top-5 acc 64.453 (69.913)	lr 0.02271
Train [24][1590/3239]	Time 0.642 (0.925)	Data Time 0.001 (0.019)	Loss 3.0242 (3.2615)	Entropy 0.89235 (0.89661)	Top-1 acc 53.125 (46.225)	Top-5 acc 73.047 (69.914)	lr 0.02271
Train [24][1600/3239]	Time 0.600 (0.925)	Data Time 0.001 (0.018)	Loss 3.4035 (3.2619)	Entropy 0.89194 (0.89658)	Top-1 acc 41.797 (46.217)	Top-5 acc 64.844 (69.902)	lr 0.02271
Train [24][1610/3239]	Time 0.452 (0.924)	Data Time 0.001 (0.018)	Loss 3.4299 (3.2619)	Entropy 0.89191 (0.89655)	Top-1 acc 44.922 (46.220)	Top-5 acc 66.406 (69.903)	lr 0.02271
Train [24][1620/3239]	Time 0.658 (0.923)	Data Time 0.001 (0.018)	Loss 3.0773 (3.2619)	Entropy 0.89182 (0.89652)	Top-1 acc 48.438 (46.215)	Top-5 acc 74.609 (69.902)	lr 0.02271
Train [24][1630/3239]	Time 0.599 (0.923)	Data Time 0.001 (0.018)	Loss 3.2126 (3.2618)	Entropy 0.89144 (0.89649)	Top-1 acc 43.750 (46.213)	Top-5 acc 73.438 (69.901)	lr 0.02271
Train [24][1640/3239]	Time 0.570 (0.923)	Data Time 0.002 (0.018)	Loss 3.4826 (3.2620)	Entropy 0.89109 (0.89646)	Top-1 acc 41.016 (46.204)	Top-5 acc 63.672 (69.900)	lr 0.02271
Train [24][1650/3239]	Time 0.614 (0.922)	Data Time 0.001 (0.018)	Loss 3.3105 (3.2623)	Entropy 0.89118 (0.89643)	Top-1 acc 50.000 (46.198)	Top-5 acc 71.094 (69.902)	lr 0.02271
Train [24][1660/3239]	Time 0.594 (0.922)	Data Time 0.001 (0.018)	Loss 3.3353 (3.2622)	Entropy 0.89146 (0.89640)	Top-1 acc 42.578 (46.195)	Top-5 acc 66.797 (69.903)	lr 0.02271
Train [24][1670/3239]	Time 0.591 (0.922)	Data Time 0.001 (0.018)	Loss 3.2412 (3.2627)	Entropy 0.89152 (0.89637)	Top-1 acc 42.969 (46.178)	Top-5 acc 71.094 (69.888)	lr 0.02271
Train [24][1680/3239]	Time 0.605 (0.921)	Data Time 0.001 (0.018)	Loss 3.3706 (3.2633)	Entropy 0.89180 (0.89634)	Top-1 acc 44.531 (46.175)	Top-5 acc 66.016 (69.877)	lr 0.02270
Train [24][1690/3239]	Time 0.611 (0.921)	Data Time 0.001 (0.018)	Loss 3.3240 (3.2636)	Entropy 0.89165 (0.89631)	Top-1 acc 44.141 (46.165)	Top-5 acc 67.969 (69.873)	lr 0.02270
Train [24][1700/3239]	Time 0.581 (0.920)	Data Time 0.001 (0.018)	Loss 3.1530 (3.2635)	Entropy 0.89200 (0.89629)	Top-1 acc 50.781 (46.168)	Top-5 acc 73.828 (69.872)	lr 0.02270
Train [24][1710/3239]	Time 0.615 (0.920)	Data Time 0.001 (0.017)	Loss 3.1553 (3.2635)	Entropy 0.89127 (0.89626)	Top-1 acc 44.922 (46.161)	Top-5 acc 73.047 (69.870)	lr 0.02270
Train [24][1720/3239]	Time 0.581 (0.920)	Data Time 0.001 (0.017)	Loss 3.4611 (3.2641)	Entropy 0.89090 (0.89623)	Top-1 acc 42.188 (46.148)	Top-5 acc 64.062 (69.855)	lr 0.02270
Train [24][1730/3239]	Time 0.728 (0.920)	Data Time 0.001 (0.017)	Loss 3.3860 (3.2638)	Entropy 0.89112 (0.89620)	Top-1 acc 43.750 (46.155)	Top-5 acc 65.625 (69.862)	lr 0.02270
Train [24][1740/3239]	Time 0.624 (0.919)	Data Time 0.001 (0.017)	Loss 3.0979 (3.2638)	Entropy 0.89106 (0.89617)	Top-1 acc 48.828 (46.155)	Top-5 acc 75.391 (69.863)	lr 0.02270
Train [24][1750/3239]	Time 0.633 (0.919)	Data Time 0.001 (0.017)	Loss 3.3972 (3.2639)	Entropy 0.89115 (0.89614)	Top-1 acc 38.281 (46.154)	Top-5 acc 69.141 (69.860)	lr 0.02270
Train [24][1760/3239]	Time 0.618 (0.919)	Data Time 0.001 (0.017)	Loss 3.4332 (3.2641)	Entropy 0.89102 (0.89611)	Top-1 acc 40.234 (46.146)	Top-5 acc 66.016 (69.858)	lr 0.02270
Train [24][1770/3239]	Time 0.582 (0.918)	Data Time 0.001 (0.017)	Loss 3.1171 (3.2638)	Entropy 0.89058 (0.89608)	Top-1 acc 50.000 (46.151)	Top-5 acc 73.438 (69.864)	lr 0.02270
Train [24][1780/3239]	Time 0.596 (0.918)	Data Time 0.001 (0.017)	Loss 3.3687 (3.2638)	Entropy 0.89091 (0.89605)	Top-1 acc 44.141 (46.151)	Top-5 acc 71.094 (69.867)	lr 0.02270
Train [24][1790/3239]	Time 0.635 (0.917)	Data Time 0.001 (0.017)	Loss 3.3935 (3.2641)	Entropy 0.89149 (0.89603)	Top-1 acc 42.578 (46.151)	Top-5 acc 66.797 (69.860)	lr 0.02270
Train [24][1800/3239]	Time 0.690 (0.917)	Data Time 0.001 (0.017)	Loss 3.2637 (3.2642)	Entropy 0.89126 (0.89600)	Top-1 acc 46.875 (46.147)	Top-5 acc 72.266 (69.856)	lr 0.02270
Train [24][1810/3239]	Time 0.609 (0.916)	Data Time 0.001 (0.017)	Loss 3.2596 (3.2643)	Entropy 0.89146 (0.89597)	Top-1 acc 49.219 (46.149)	Top-5 acc 70.703 (69.851)	lr 0.02270
Train [24][1820/3239]	Time 0.603 (0.916)	Data Time 0.001 (0.016)	Loss 3.5356 (3.2645)	Entropy 0.89140 (0.89595)	Top-1 acc 42.969 (46.143)	Top-5 acc 63.672 (69.843)	lr 0.02270
Train [24][1830/3239]	Time 0.599 (0.916)	Data Time 0.001 (0.016)	Loss 3.1163 (3.2643)	Entropy 0.89136 (0.89592)	Top-1 acc 49.609 (46.144)	Top-5 acc 74.219 (69.848)	lr 0.02270
Train [24][1840/3239]	Time 0.603 (0.915)	Data Time 0.001 (0.016)	Loss 3.3316 (3.2641)	Entropy 0.89113 (0.89590)	Top-1 acc 45.703 (46.150)	Top-5 acc 71.094 (69.859)	lr 0.02270
Train [24][1850/3239]	Time 0.582 (0.915)	Data Time 0.001 (0.016)	Loss 3.2510 (3.2641)	Entropy 0.89181 (0.89587)	Top-1 acc 46.094 (46.152)	Top-5 acc 73.047 (69.863)	lr 0.02269
Train [24][1860/3239]	Time 0.578 (0.915)	Data Time 0.001 (0.016)	Loss 3.2382 (3.2639)	Entropy 0.89192 (0.89585)	Top-1 acc 48.828 (46.152)	Top-5 acc 69.531 (69.866)	lr 0.02269
Train [24][1870/3239]	Time 0.572 (0.915)	Data Time 0.001 (0.016)	Loss 3.3410 (3.2637)	Entropy 0.89217 (0.89583)	Top-1 acc 41.016 (46.157)	Top-5 acc 69.141 (69.872)	lr 0.02269
Train [24][1880/3239]	Time 0.597 (0.914)	Data Time 0.001 (0.016)	Loss 3.1780 (3.2638)	Entropy 0.89172 (0.89581)	Top-1 acc 48.828 (46.151)	Top-5 acc 71.094 (69.876)	lr 0.02269
Train [24][1890/3239]	Time 0.727 (0.914)	Data Time 0.001 (0.016)	Loss 3.2964 (3.2638)	Entropy 0.89196 (0.89579)	Top-1 acc 47.266 (46.155)	Top-5 acc 70.312 (69.878)	lr 0.02269
Train [24][1900/3239]	Time 0.603 (0.914)	Data Time 0.001 (0.016)	Loss 3.4007 (3.2636)	Entropy 0.89193 (0.89577)	Top-1 acc 42.578 (46.158)	Top-5 acc 68.750 (69.883)	lr 0.02269
Train [24][1910/3239]	Time 0.642 (0.913)	Data Time 0.001 (0.016)	Loss 3.0192 (3.2634)	Entropy 0.89192 (0.89575)	Top-1 acc 52.734 (46.165)	Top-5 acc 73.047 (69.887)	lr 0.02269
Train [24][1920/3239]	Time 0.602 (0.913)	Data Time 0.001 (0.016)	Loss 3.0947 (3.2633)	Entropy 0.89142 (0.89573)	Top-1 acc 50.000 (46.168)	Top-5 acc 73.047 (69.889)	lr 0.02269
Train [24][1930/3239]	Time 0.617 (0.913)	Data Time 0.001 (0.016)	Loss 3.3423 (3.2634)	Entropy 0.89107 (0.89570)	Top-1 acc 44.922 (46.167)	Top-5 acc 68.359 (69.888)	lr 0.02269
Train [24][1940/3239]	Time 0.608 (0.913)	Data Time 0.001 (0.016)	Loss 3.2089 (3.2634)	Entropy 0.89086 (0.89568)	Top-1 acc 45.312 (46.170)	Top-5 acc 70.703 (69.888)	lr 0.02269
Train [24][1950/3239]	Time 0.614 (0.912)	Data Time 0.001 (0.016)	Loss 3.1030 (3.2631)	Entropy 0.89091 (0.89566)	Top-1 acc 54.297 (46.181)	Top-5 acc 73.047 (69.896)	lr 0.02269
Train [24][1960/3239]	Time 0.663 (0.912)	Data Time 0.001 (0.015)	Loss 3.5512 (3.2632)	Entropy 0.89097 (0.89563)	Top-1 acc 45.312 (46.179)	Top-5 acc 64.453 (69.895)	lr 0.02269
Train [24][1970/3239]	Time 0.609 (0.911)	Data Time 0.001 (0.015)	Loss 3.3347 (3.2631)	Entropy 0.89082 (0.89561)	Top-1 acc 47.656 (46.177)	Top-5 acc 66.797 (69.893)	lr 0.02269
Train [24][1980/3239]	Time 0.573 (0.911)	Data Time 0.001 (0.015)	Loss 3.3694 (3.2632)	Entropy 0.89014 (0.89558)	Top-1 acc 44.922 (46.176)	Top-5 acc 66.797 (69.889)	lr 0.02269
Train [24][1990/3239]	Time 0.586 (0.911)	Data Time 0.001 (0.015)	Loss 3.3052 (3.2630)	Entropy 0.89029 (0.89556)	Top-1 acc 41.406 (46.178)	Top-5 acc 69.141 (69.894)	lr 0.02269
Train [24][2000/3239]	Time 0.611 (0.910)	Data Time 0.001 (0.015)	Loss 3.4843 (3.2629)	Entropy 0.89030 (0.89553)	Top-1 acc 38.672 (46.177)	Top-5 acc 61.328 (69.897)	lr 0.02269
Train [24][2010/3239]	Time 0.574 (0.910)	Data Time 0.001 (0.015)	Loss 3.2387 (3.2629)	Entropy 0.89036 (0.89550)	Top-1 acc 45.312 (46.182)	Top-5 acc 75.781 (69.899)	lr 0.02269
Train [24][2020/3239]	Time 0.583 (0.910)	Data Time 0.001 (0.015)	Loss 3.0885 (3.2629)	Entropy 0.89034 (0.89548)	Top-1 acc 47.266 (46.181)	Top-5 acc 76.172 (69.895)	lr 0.02268
Train [24][2030/3239]	Time 0.713 (0.910)	Data Time 0.001 (0.015)	Loss 3.4371 (3.2627)	Entropy 0.89038 (0.89545)	Top-1 acc 42.578 (46.186)	Top-5 acc 67.969 (69.898)	lr 0.02268
Train [24][2040/3239]	Time 0.584 (0.910)	Data Time 0.001 (0.015)	Loss 3.3122 (3.2630)	Entropy 0.89066 (0.89543)	Top-1 acc 44.922 (46.182)	Top-5 acc 68.750 (69.889)	lr 0.02268
Train [24][2050/3239]	Time 0.600 (0.909)	Data Time 0.002 (0.015)	Loss 3.5112 (3.2633)	Entropy 0.89048 (0.89541)	Top-1 acc 41.406 (46.173)	Top-5 acc 65.625 (69.882)	lr 0.02268
Train [24][2060/3239]	Time 0.652 (0.909)	Data Time 0.002 (0.015)	Loss 3.1431 (3.2633)	Entropy 0.89036 (0.89538)	Top-1 acc 51.953 (46.173)	Top-5 acc 70.312 (69.877)	lr 0.02268
Train [24][2070/3239]	Time 0.570 (0.909)	Data Time 0.001 (0.015)	Loss 3.0453 (3.2630)	Entropy 0.89005 (0.89536)	Top-1 acc 50.781 (46.176)	Top-5 acc 72.266 (69.881)	lr 0.02268
Train [24][2080/3239]	Time 0.605 (0.909)	Data Time 0.001 (0.015)	Loss 3.3359 (3.2630)	Entropy 0.89002 (0.89533)	Top-1 acc 46.484 (46.174)	Top-5 acc 71.875 (69.883)	lr 0.02268
Train [24][2090/3239]	Time 0.627 (0.921)	Data Time 0.002 (0.015)	Loss 3.3363 (3.2628)	Entropy 0.89004 (0.89530)	Top-1 acc 43.750 (46.179)	Top-5 acc 69.531 (69.889)	lr 0.02268
Train [24][2100/3239]	Time 0.594 (0.921)	Data Time 0.001 (0.015)	Loss 3.2680 (3.2627)	Entropy 0.89024 (0.89528)	Top-1 acc 44.531 (46.173)	Top-5 acc 72.656 (69.892)	lr 0.02268
Train [24][2110/3239]	Time 0.610 (0.920)	Data Time 0.001 (0.014)	Loss 3.4737 (3.2629)	Entropy 0.89044 (0.89526)	Top-1 acc 39.062 (46.166)	Top-5 acc 64.844 (69.888)	lr 0.02268
Train [24][2120/3239]	Time 0.687 (0.920)	Data Time 0.001 (0.014)	Loss 3.3478 (3.2629)	Entropy 0.89038 (0.89523)	Top-1 acc 46.875 (46.170)	Top-5 acc 67.969 (69.890)	lr 0.02268
Train [24][2130/3239]	Time 0.563 (0.920)	Data Time 0.001 (0.014)	Loss 3.3288 (3.2632)	Entropy 0.89004 (0.89521)	Top-1 acc 42.578 (46.163)	Top-5 acc 70.312 (69.889)	lr 0.02268
Train [24][2140/3239]	Time 0.602 (0.919)	Data Time 0.002 (0.014)	Loss 3.4224 (3.2629)	Entropy 0.89023 (0.89519)	Top-1 acc 43.750 (46.172)	Top-5 acc 69.531 (69.896)	lr 0.02268
Train [24][2150/3239]	Time 0.571 (0.919)	Data Time 0.001 (0.014)	Loss 3.1340 (3.2627)	Entropy 0.89004 (0.89516)	Top-1 acc 50.391 (46.175)	Top-5 acc 74.609 (69.904)	lr 0.02268
Train [24][2160/3239]	Time 0.604 (0.919)	Data Time 0.001 (0.014)	Loss 3.2490 (3.2626)	Entropy 0.88999 (0.89514)	Top-1 acc 44.531 (46.172)	Top-5 acc 67.188 (69.903)	lr 0.02268
Train [24][2170/3239]	Time 0.620 (0.919)	Data Time 0.001 (0.014)	Loss 3.1533 (3.2624)	Entropy 0.89016 (0.89512)	Top-1 acc 48.047 (46.177)	Top-5 acc 71.094 (69.906)	lr 0.02268
Train [24][2180/3239]	Time 0.635 (0.919)	Data Time 0.001 (0.014)	Loss 3.3260 (3.2626)	Entropy 0.89021 (0.89509)	Top-1 acc 46.094 (46.176)	Top-5 acc 68.750 (69.901)	lr 0.02268
Train [24][2190/3239]	Time 0.708 (0.918)	Data Time 0.001 (0.014)	Loss 3.4787 (3.2625)	Entropy 0.89035 (0.89507)	Top-1 acc 38.672 (46.174)	Top-5 acc 66.797 (69.909)	lr 0.02267
Train [24][2200/3239]	Time 0.554 (0.918)	Data Time 0.001 (0.014)	Loss 3.1301 (3.2622)	Entropy 0.89067 (0.89505)	Top-1 acc 52.344 (46.181)	Top-5 acc 71.875 (69.914)	lr 0.02267
Train [24][2210/3239]	Time 0.601 (0.918)	Data Time 0.001 (0.014)	Loss 3.4667 (3.2623)	Entropy 0.89058 (0.89503)	Top-1 acc 42.188 (46.177)	Top-5 acc 64.062 (69.914)	lr 0.02267
Train [24][2220/3239]	Time 0.621 (0.918)	Data Time 0.001 (0.014)	Loss 3.2510 (3.2624)	Entropy 0.89043 (0.89501)	Top-1 acc 46.094 (46.177)	Top-5 acc 67.969 (69.908)	lr 0.02267
Train [24][2230/3239]	Time 0.594 (0.918)	Data Time 0.001 (0.014)	Loss 3.2525 (3.2627)	Entropy 0.89078 (0.89499)	Top-1 acc 46.484 (46.170)	Top-5 acc 70.312 (69.905)	lr 0.02267
Train [24][2240/3239]	Time 0.613 (0.917)	Data Time 0.001 (0.014)	Loss 3.1614 (3.2627)	Entropy 0.89098 (0.89497)	Top-1 acc 46.875 (46.167)	Top-5 acc 69.141 (69.905)	lr 0.02267
Train [24][2250/3239]	Time 0.588 (0.917)	Data Time 0.001 (0.014)	Loss 3.1657 (3.2626)	Entropy 0.89096 (0.89495)	Top-1 acc 47.656 (46.167)	Top-5 acc 72.656 (69.904)	lr 0.02267
Train [24][2260/3239]	Time 0.474 (0.916)	Data Time 0.001 (0.014)	Loss 3.2842 (3.2627)	Entropy 0.89090 (0.89494)	Top-1 acc 45.703 (46.168)	Top-5 acc 69.531 (69.907)	lr 0.02267
Train [24][2270/3239]	Time 0.637 (0.916)	Data Time 0.001 (0.014)	Loss 3.4474 (3.2627)	Entropy 0.89077 (0.89492)	Top-1 acc 38.672 (46.165)	Top-5 acc 63.281 (69.905)	lr 0.02267
Train [24][2280/3239]	Time 0.666 (0.916)	Data Time 0.001 (0.014)	Loss 3.3249 (3.2627)	Entropy 0.89087 (0.89490)	Top-1 acc 42.188 (46.167)	Top-5 acc 68.750 (69.907)	lr 0.02267
Train [24][2290/3239]	Time 0.599 (0.916)	Data Time 0.001 (0.014)	Loss 3.4394 (3.2629)	Entropy 0.89050 (0.89488)	Top-1 acc 39.453 (46.161)	Top-5 acc 65.234 (69.901)	lr 0.02267
Train [24][2300/3239]	Time 0.583 (0.915)	Data Time 0.001 (0.013)	Loss 3.2320 (3.2630)	Entropy 0.89060 (0.89486)	Top-1 acc 46.875 (46.157)	Top-5 acc 68.750 (69.899)	lr 0.02267
Train [24][2310/3239]	Time 0.564 (0.915)	Data Time 0.001 (0.013)	Loss 3.1662 (3.2629)	Entropy 0.89096 (0.89484)	Top-1 acc 49.609 (46.161)	Top-5 acc 71.484 (69.902)	lr 0.02267
Train [24][2320/3239]	Time 0.649 (0.915)	Data Time 0.001 (0.013)	Loss 3.1757 (3.2629)	Entropy 0.89100 (0.89483)	Top-1 acc 49.219 (46.160)	Top-5 acc 73.828 (69.902)	lr 0.02267
Train [24][2330/3239]	Time 0.626 (0.915)	Data Time 0.001 (0.013)	Loss 3.2848 (3.2628)	Entropy 0.89093 (0.89481)	Top-1 acc 47.266 (46.162)	Top-5 acc 70.703 (69.905)	lr 0.02267
Train [24][2340/3239]	Time 0.610 (0.915)	Data Time 0.001 (0.013)	Loss 3.2338 (3.2627)	Entropy 0.89127 (0.89479)	Top-1 acc 44.141 (46.160)	Top-5 acc 70.312 (69.907)	lr 0.02267
Train [24][2350/3239]	Time 0.697 (0.914)	Data Time 0.001 (0.013)	Loss 3.4883 (3.2626)	Entropy 0.89146 (0.89478)	Top-1 acc 42.578 (46.169)	Top-5 acc 63.281 (69.906)	lr 0.02267
Train [24][2360/3239]	Time 0.612 (0.914)	Data Time 0.001 (0.013)	Loss 3.1345 (3.2627)	Entropy 0.89158 (0.89477)	Top-1 acc 51.562 (46.165)	Top-5 acc 74.219 (69.904)	lr 0.02266
Train [24][2370/3239]	Time 0.587 (0.914)	Data Time 0.001 (0.013)	Loss 3.1705 (3.2625)	Entropy 0.89162 (0.89475)	Top-1 acc 49.609 (46.168)	Top-5 acc 72.266 (69.908)	lr 0.02266
Train [24][2380/3239]	Time 0.593 (0.914)	Data Time 0.001 (0.013)	Loss 3.3120 (3.2626)	Entropy 0.89153 (0.89474)	Top-1 acc 42.969 (46.166)	Top-5 acc 68.359 (69.908)	lr 0.02266
Train [24][2390/3239]	Time 0.617 (0.913)	Data Time 0.001 (0.013)	Loss 3.4556 (3.2626)	Entropy 0.89155 (0.89473)	Top-1 acc 41.406 (46.166)	Top-5 acc 64.844 (69.904)	lr 0.02266
Train [24][2400/3239]	Time 0.610 (0.913)	Data Time 0.001 (0.013)	Loss 3.3184 (3.2626)	Entropy 0.89171 (0.89471)	Top-1 acc 43.750 (46.165)	Top-5 acc 68.359 (69.904)	lr 0.02266
Train [24][2410/3239]	Time 0.642 (0.913)	Data Time 0.001 (0.013)	Loss 3.3173 (3.2623)	Entropy 0.89172 (0.89470)	Top-1 acc 42.578 (46.173)	Top-5 acc 69.141 (69.910)	lr 0.02266
Train [24][2420/3239]	Time 0.625 (0.913)	Data Time 0.001 (0.013)	Loss 3.2868 (3.2622)	Entropy 0.89124 (0.89469)	Top-1 acc 42.188 (46.174)	Top-5 acc 68.359 (69.912)	lr 0.02266
Train [24][2430/3239]	Time 0.571 (0.912)	Data Time 0.001 (0.013)	Loss 3.3624 (3.2618)	Entropy 0.89133 (0.89467)	Top-1 acc 45.312 (46.183)	Top-5 acc 66.797 (69.920)	lr 0.02266
Train [24][2440/3239]	Time 0.677 (0.912)	Data Time 0.001 (0.013)	Loss 3.1976 (3.2616)	Entropy 0.89126 (0.89466)	Top-1 acc 50.391 (46.191)	Top-5 acc 72.266 (69.924)	lr 0.02266
Train [24][2450/3239]	Time 0.663 (0.912)	Data Time 0.001 (0.013)	Loss 3.0216 (3.2614)	Entropy 0.89108 (0.89465)	Top-1 acc 51.172 (46.196)	Top-5 acc 75.000 (69.928)	lr 0.02266
Train [24][2460/3239]	Time 0.653 (0.911)	Data Time 0.001 (0.013)	Loss 3.2626 (3.2616)	Entropy 0.89147 (0.89463)	Top-1 acc 48.047 (46.190)	Top-5 acc 68.750 (69.924)	lr 0.02266
Train [24][2470/3239]	Time 0.592 (0.911)	Data Time 0.001 (0.013)	Loss 3.4170 (3.2619)	Entropy 0.89125 (0.89462)	Top-1 acc 42.969 (46.182)	Top-5 acc 66.797 (69.917)	lr 0.02266
Train [24][2480/3239]	Time 0.655 (0.911)	Data Time 0.001 (0.013)	Loss 3.3370 (3.2622)	Entropy 0.89152 (0.89461)	Top-1 acc 46.094 (46.176)	Top-5 acc 71.094 (69.912)	lr 0.02266
Train [24][2490/3239]	Time 0.569 (0.911)	Data Time 0.001 (0.013)	Loss 3.2151 (3.2620)	Entropy 0.89192 (0.89459)	Top-1 acc 45.312 (46.173)	Top-5 acc 72.266 (69.914)	lr 0.02266
Train [24][2500/3239]	Time 0.623 (0.910)	Data Time 0.001 (0.013)	Loss 3.2139 (3.2619)	Entropy 0.89150 (0.89458)	Top-1 acc 46.875 (46.174)	Top-5 acc 71.875 (69.917)	lr 0.02266
Train [24][2510/3239]	Time 0.711 (0.910)	Data Time 0.001 (0.013)	Loss 2.8967 (3.2620)	Entropy 0.89151 (0.89457)	Top-1 acc 54.297 (46.170)	Top-5 acc 76.953 (69.916)	lr 0.02266
Train [24][2520/3239]	Time 0.587 (0.910)	Data Time 0.001 (0.012)	Loss 3.1550 (3.2618)	Entropy 0.89175 (0.89456)	Top-1 acc 46.875 (46.173)	Top-5 acc 73.438 (69.918)	lr 0.02266
Train [24][2530/3239]	Time 0.577 (0.910)	Data Time 0.001 (0.012)	Loss 3.2443 (3.2616)	Entropy 0.89117 (0.89455)	Top-1 acc 42.969 (46.172)	Top-5 acc 70.703 (69.924)	lr 0.02265
Train [24][2540/3239]	Time 0.587 (0.910)	Data Time 0.001 (0.012)	Loss 3.1580 (3.2613)	Entropy 0.89132 (0.89453)	Top-1 acc 51.172 (46.178)	Top-5 acc 72.266 (69.928)	lr 0.02265
Train [24][2550/3239]	Time 0.585 (0.910)	Data Time 0.001 (0.012)	Loss 3.2219 (3.2612)	Entropy 0.89131 (0.89452)	Top-1 acc 44.922 (46.178)	Top-5 acc 68.750 (69.929)	lr 0.02265
Train [24][2560/3239]	Time 0.582 (0.909)	Data Time 0.001 (0.012)	Loss 3.4877 (3.2613)	Entropy 0.89153 (0.89451)	Top-1 acc 44.922 (46.178)	Top-5 acc 66.406 (69.924)	lr 0.02265
Train [24][2570/3239]	Time 0.595 (0.909)	Data Time 0.001 (0.012)	Loss 3.0857 (3.2615)	Entropy 0.89177 (0.89450)	Top-1 acc 51.172 (46.180)	Top-5 acc 72.266 (69.923)	lr 0.02265
Train [24][2580/3239]	Time 0.585 (0.909)	Data Time 0.001 (0.012)	Loss 3.4270 (3.2614)	Entropy 0.89178 (0.89449)	Top-1 acc 42.969 (46.184)	Top-5 acc 66.797 (69.921)	lr 0.02265
Train [24][2590/3239]	Time 0.571 (0.909)	Data Time 0.001 (0.012)	Loss 3.3318 (3.2614)	Entropy 0.89169 (0.89448)	Top-1 acc 42.969 (46.187)	Top-5 acc 67.578 (69.922)	lr 0.02265
Train [24][2600/3239]	Time 0.556 (0.909)	Data Time 0.001 (0.012)	Loss 3.0357 (3.2610)	Entropy 0.89182 (0.89447)	Top-1 acc 51.562 (46.197)	Top-5 acc 73.828 (69.930)	lr 0.02265
Train [24][2610/3239]	Time 0.602 (0.908)	Data Time 0.001 (0.012)	Loss 3.3620 (3.2611)	Entropy 0.89182 (0.89446)	Top-1 acc 46.875 (46.199)	Top-5 acc 65.625 (69.930)	lr 0.02265
Train [24][2620/3239]	Time 0.613 (0.908)	Data Time 0.001 (0.012)	Loss 3.2787 (3.2609)	Entropy 0.89183 (0.89445)	Top-1 acc 43.750 (46.204)	Top-5 acc 70.312 (69.936)	lr 0.02265
Train [24][2630/3239]	Time 0.590 (0.908)	Data Time 0.001 (0.012)	Loss 3.1034 (3.2606)	Entropy 0.89183 (0.89444)	Top-1 acc 52.344 (46.206)	Top-5 acc 72.656 (69.942)	lr 0.02265
Train [24][2640/3239]	Time 0.631 (0.908)	Data Time 0.001 (0.012)	Loss 3.4035 (3.2606)	Entropy 0.89150 (0.89443)	Top-1 acc 44.531 (46.208)	Top-5 acc 71.484 (69.948)	lr 0.02265
Train [24][2650/3239]	Time 0.605 (0.907)	Data Time 0.001 (0.012)	Loss 3.2794 (3.2609)	Entropy 0.89125 (0.89442)	Top-1 acc 44.141 (46.200)	Top-5 acc 69.922 (69.942)	lr 0.02265
Train [24][2660/3239]	Time 0.583 (0.907)	Data Time 0.001 (0.012)	Loss 3.1743 (3.2610)	Entropy 0.89110 (0.89440)	Top-1 acc 48.438 (46.194)	Top-5 acc 72.656 (69.936)	lr 0.02265
Train [24][2670/3239]	Time 0.713 (0.907)	Data Time 0.001 (0.012)	Loss 3.2679 (3.2611)	Entropy 0.89088 (0.89439)	Top-1 acc 50.781 (46.192)	Top-5 acc 67.969 (69.939)	lr 0.02265
Train [24][2680/3239]	Time 0.568 (0.907)	Data Time 0.001 (0.012)	Loss 3.2658 (3.2610)	Entropy 0.89087 (0.89438)	Top-1 acc 46.875 (46.193)	Top-5 acc 67.188 (69.941)	lr 0.02265
Train [24][2690/3239]	Time 0.613 (0.907)	Data Time 0.001 (0.012)	Loss 3.4084 (3.2610)	Entropy 0.89122 (0.89437)	Top-1 acc 44.531 (46.193)	Top-5 acc 68.359 (69.939)	lr 0.02265
Train [24][2700/3239]	Time 0.584 (0.907)	Data Time 0.001 (0.012)	Loss 3.3617 (3.2610)	Entropy 0.89122 (0.89435)	Top-1 acc 44.141 (46.193)	Top-5 acc 67.188 (69.938)	lr 0.02264
Train [24][2710/3239]	Time 0.646 (0.906)	Data Time 0.001 (0.012)	Loss 3.1077 (3.2609)	Entropy 0.89114 (0.89434)	Top-1 acc 48.047 (46.196)	Top-5 acc 71.094 (69.939)	lr 0.02264
Train [24][2720/3239]	Time 0.602 (0.906)	Data Time 0.001 (0.012)	Loss 3.4541 (3.2609)	Entropy 0.89084 (0.89433)	Top-1 acc 44.141 (46.195)	Top-5 acc 63.672 (69.936)	lr 0.02264
Train [24][2730/3239]	Time 0.591 (0.906)	Data Time 0.001 (0.012)	Loss 3.2834 (3.2610)	Entropy 0.89112 (0.89432)	Top-1 acc 47.656 (46.196)	Top-5 acc 71.484 (69.937)	lr 0.02264
Train [24][2740/3239]	Time 0.798 (0.916)	Data Time 0.005 (0.012)	Loss 3.1838 (3.2610)	Entropy 0.89084 (0.89430)	Top-1 acc 47.266 (46.194)	Top-5 acc 67.578 (69.937)	lr 0.02264
Train [24][2750/3239]	Time 0.611 (0.916)	Data Time 0.002 (0.012)	Loss 3.3127 (3.2610)	Entropy 0.89064 (0.89429)	Top-1 acc 45.703 (46.197)	Top-5 acc 67.188 (69.936)	lr 0.02264
Train [24][2760/3239]	Time 0.606 (0.916)	Data Time 0.001 (0.012)	Loss 3.1830 (3.2609)	Entropy 0.89101 (0.89428)	Top-1 acc 44.141 (46.197)	Top-5 acc 71.875 (69.939)	lr 0.02264
Train [24][2770/3239]	Time 0.670 (0.915)	Data Time 0.001 (0.012)	Loss 3.3408 (3.2609)	Entropy 0.89081 (0.89427)	Top-1 acc 44.922 (46.196)	Top-5 acc 73.047 (69.942)	lr 0.02264
Train [24][2780/3239]	Time 0.575 (0.915)	Data Time 0.001 (0.011)	Loss 3.3012 (3.2609)	Entropy 0.89082 (0.89425)	Top-1 acc 45.312 (46.198)	Top-5 acc 70.703 (69.947)	lr 0.02264
Train [24][2790/3239]	Time 0.620 (0.915)	Data Time 0.001 (0.011)	Loss 3.0929 (3.2609)	Entropy 0.89024 (0.89424)	Top-1 acc 46.875 (46.197)	Top-5 acc 75.781 (69.949)	lr 0.02264
Train [24][2800/3239]	Time 0.603 (0.915)	Data Time 0.001 (0.011)	Loss 3.1610 (3.2608)	Entropy 0.89009 (0.89423)	Top-1 acc 50.781 (46.202)	Top-5 acc 73.047 (69.952)	lr 0.02264
Train [24][2810/3239]	Time 0.638 (0.915)	Data Time 0.001 (0.011)	Loss 3.2106 (3.2607)	Entropy 0.88985 (0.89421)	Top-1 acc 46.484 (46.205)	Top-5 acc 74.609 (69.955)	lr 0.02264
Train [24][2820/3239]	Time 0.605 (0.914)	Data Time 0.001 (0.011)	Loss 3.3714 (3.2605)	Entropy 0.88923 (0.89420)	Top-1 acc 44.531 (46.206)	Top-5 acc 67.188 (69.955)	lr 0.02264
Train [24][2830/3239]	Time 0.698 (0.914)	Data Time 0.001 (0.011)	Loss 3.1085 (3.2604)	Entropy 0.88908 (0.89418)	Top-1 acc 48.828 (46.206)	Top-5 acc 71.484 (69.958)	lr 0.02264
Train [24][2840/3239]	Time 0.608 (0.914)	Data Time 0.001 (0.011)	Loss 3.4661 (3.2605)	Entropy 0.88889 (0.89416)	Top-1 acc 39.062 (46.203)	Top-5 acc 66.406 (69.957)	lr 0.02264
Train [24][2850/3239]	Time 0.601 (0.914)	Data Time 0.001 (0.011)	Loss 3.2664 (3.2605)	Entropy 0.88909 (0.89414)	Top-1 acc 47.656 (46.203)	Top-5 acc 70.703 (69.957)	lr 0.02264
Train [24][2860/3239]	Time 0.637 (0.914)	Data Time 0.001 (0.011)	Loss 3.3604 (3.2605)	Entropy 0.88897 (0.89413)	Top-1 acc 41.016 (46.205)	Top-5 acc 67.969 (69.955)	lr 0.02264
Train [24][2870/3239]	Time 0.626 (0.914)	Data Time 0.001 (0.011)	Loss 3.1658 (3.2603)	Entropy 0.88857 (0.89411)	Top-1 acc 45.312 (46.207)	Top-5 acc 71.875 (69.959)	lr 0.02263
Train [24][2880/3239]	Time 0.589 (0.913)	Data Time 0.001 (0.011)	Loss 3.3438 (3.2604)	Entropy 0.88852 (0.89409)	Top-1 acc 47.266 (46.206)	Top-5 acc 69.922 (69.957)	lr 0.02263
Train [24][2890/3239]	Time 0.628 (0.913)	Data Time 0.001 (0.011)	Loss 3.2392 (3.2605)	Entropy 0.88849 (0.89407)	Top-1 acc 46.484 (46.207)	Top-5 acc 69.531 (69.953)	lr 0.02263
Train [24][2900/3239]	Time 0.645 (0.913)	Data Time 0.001 (0.011)	Loss 3.2317 (3.2605)	Entropy 0.88844 (0.89405)	Top-1 acc 41.797 (46.203)	Top-5 acc 69.922 (69.954)	lr 0.02263
Train [24][2910/3239]	Time 0.579 (0.912)	Data Time 0.001 (0.011)	Loss 3.3742 (3.2605)	Entropy 0.88858 (0.89403)	Top-1 acc 44.922 (46.203)	Top-5 acc 64.844 (69.953)	lr 0.02263
Train [24][2920/3239]	Time 0.649 (0.912)	Data Time 0.001 (0.011)	Loss 3.1333 (3.2605)	Entropy 0.88856 (0.89401)	Top-1 acc 46.875 (46.203)	Top-5 acc 71.875 (69.954)	lr 0.02263
Train [24][2930/3239]	Time 0.590 (0.912)	Data Time 0.001 (0.011)	Loss 3.4011 (3.2605)	Entropy 0.88868 (0.89399)	Top-1 acc 41.016 (46.203)	Top-5 acc 67.578 (69.956)	lr 0.02263
Train [24][2940/3239]	Time 0.609 (0.912)	Data Time 0.001 (0.011)	Loss 3.1763 (3.2605)	Entropy 0.88871 (0.89398)	Top-1 acc 47.266 (46.200)	Top-5 acc 71.094 (69.958)	lr 0.02263
Train [24][2950/3239]	Time 0.589 (0.912)	Data Time 0.001 (0.011)	Loss 3.2157 (3.2604)	Entropy 0.88843 (0.89396)	Top-1 acc 46.484 (46.203)	Top-5 acc 70.312 (69.958)	lr 0.02263
Train [24][2960/3239]	Time 0.656 (0.912)	Data Time 0.001 (0.011)	Loss 3.3986 (3.2607)	Entropy 0.88835 (0.89394)	Top-1 acc 45.312 (46.196)	Top-5 acc 67.578 (69.951)	lr 0.02263
Train [24][2970/3239]	Time 0.608 (0.912)	Data Time 0.001 (0.011)	Loss 3.2255 (3.2606)	Entropy 0.88841 (0.89392)	Top-1 acc 46.484 (46.201)	Top-5 acc 71.875 (69.955)	lr 0.02263
Train [24][2980/3239]	Time 0.628 (0.911)	Data Time 0.001 (0.011)	Loss 3.0698 (3.2607)	Entropy 0.88853 (0.89390)	Top-1 acc 50.000 (46.199)	Top-5 acc 76.172 (69.957)	lr 0.02263
Train [24][2990/3239]	Time 0.664 (0.911)	Data Time 0.001 (0.011)	Loss 3.1454 (3.2605)	Entropy 0.88869 (0.89388)	Top-1 acc 47.656 (46.204)	Top-5 acc 72.656 (69.959)	lr 0.02263
Train [24][3000/3239]	Time 0.591 (0.911)	Data Time 0.001 (0.011)	Loss 3.4120 (3.2606)	Entropy 0.88865 (0.89387)	Top-1 acc 44.141 (46.204)	Top-5 acc 69.141 (69.957)	lr 0.02263
Train [24][3010/3239]	Time 0.589 (0.911)	Data Time 0.001 (0.011)	Loss 3.1870 (3.2605)	Entropy 0.88832 (0.89385)	Top-1 acc 50.781 (46.209)	Top-5 acc 71.484 (69.962)	lr 0.02263
Train [24][3020/3239]	Time 0.600 (0.911)	Data Time 0.001 (0.011)	Loss 3.1569 (3.2607)	Entropy 0.88831 (0.89383)	Top-1 acc 44.922 (46.205)	Top-5 acc 71.484 (69.956)	lr 0.02263
Train [24][3030/3239]	Time 0.583 (0.911)	Data Time 0.001 (0.011)	Loss 3.4647 (3.2604)	Entropy 0.88774 (0.89381)	Top-1 acc 43.359 (46.212)	Top-5 acc 67.188 (69.963)	lr 0.02263
Train [24][3040/3239]	Time 0.621 (0.910)	Data Time 0.001 (0.011)	Loss 3.3262 (3.2604)	Entropy 0.88793 (0.89379)	Top-1 acc 45.703 (46.213)	Top-5 acc 69.531 (69.964)	lr 0.02262
Train [24][3050/3239]	Time 0.548 (0.910)	Data Time 0.001 (0.011)	Loss 2.9867 (3.2602)	Entropy 0.88774 (0.89377)	Top-1 acc 55.859 (46.221)	Top-5 acc 70.703 (69.967)	lr 0.02262
Train [24][3060/3239]	Time 0.725 (0.910)	Data Time 0.001 (0.011)	Loss 3.1257 (3.2601)	Entropy 0.88793 (0.89375)	Top-1 acc 48.828 (46.221)	Top-5 acc 71.484 (69.968)	lr 0.02262
Train [24][3070/3239]	Time 0.592 (0.910)	Data Time 0.001 (0.011)	Loss 3.3170 (3.2601)	Entropy 0.88780 (0.89373)	Top-1 acc 44.922 (46.221)	Top-5 acc 67.578 (69.967)	lr 0.02262
Train [24][3080/3239]	Time 0.591 (0.910)	Data Time 0.001 (0.011)	Loss 3.3107 (3.2601)	Entropy 0.88775 (0.89371)	Top-1 acc 43.750 (46.223)	Top-5 acc 70.312 (69.965)	lr 0.02262
Train [24][3090/3239]	Time 0.584 (0.909)	Data Time 0.001 (0.011)	Loss 3.4413 (3.2604)	Entropy 0.88769 (0.89369)	Top-1 acc 42.578 (46.217)	Top-5 acc 63.672 (69.957)	lr 0.02262
Train [24][3100/3239]	Time 0.620 (0.909)	Data Time 0.001 (0.010)	Loss 3.1218 (3.2601)	Entropy 0.88728 (0.89367)	Top-1 acc 47.266 (46.220)	Top-5 acc 73.828 (69.962)	lr 0.02262
Train [24][3110/3239]	Time 0.624 (0.909)	Data Time 0.001 (0.010)	Loss 3.1009 (3.2601)	Entropy 0.88695 (0.89365)	Top-1 acc 52.734 (46.219)	Top-5 acc 72.656 (69.965)	lr 0.02262
Train [24][3120/3239]	Time 0.567 (0.909)	Data Time 0.001 (0.010)	Loss 3.3559 (3.2602)	Entropy 0.88702 (0.89363)	Top-1 acc 40.625 (46.214)	Top-5 acc 65.234 (69.962)	lr 0.02262
Train [24][3130/3239]	Time 0.681 (0.909)	Data Time 0.001 (0.010)	Loss 3.3401 (3.2603)	Entropy 0.88661 (0.89361)	Top-1 acc 42.969 (46.210)	Top-5 acc 64.062 (69.957)	lr 0.02262
Train [24][3140/3239]	Time 0.618 (0.908)	Data Time 0.001 (0.010)	Loss 3.1571 (3.2601)	Entropy 0.88669 (0.89359)	Top-1 acc 44.531 (46.213)	Top-5 acc 71.484 (69.961)	lr 0.02262
Train [24][3150/3239]	Time 0.621 (0.908)	Data Time 0.001 (0.010)	Loss 3.2768 (3.2600)	Entropy 0.88644 (0.89357)	Top-1 acc 44.922 (46.216)	Top-5 acc 69.922 (69.964)	lr 0.02262
Train [24][3160/3239]	Time 0.622 (0.908)	Data Time 0.001 (0.010)	Loss 3.2607 (3.2598)	Entropy 0.88682 (0.89354)	Top-1 acc 45.703 (46.221)	Top-5 acc 71.875 (69.967)	lr 0.02262
Train [24][3170/3239]	Time 0.609 (0.908)	Data Time 0.001 (0.010)	Loss 3.2925 (3.2597)	Entropy 0.88716 (0.89352)	Top-1 acc 42.969 (46.219)	Top-5 acc 68.750 (69.965)	lr 0.02262
Train [24][3180/3239]	Time 0.584 (0.908)	Data Time 0.000 (0.010)	Loss 3.4177 (3.2597)	Entropy 0.88737 (0.89350)	Top-1 acc 43.359 (46.216)	Top-5 acc 66.797 (69.968)	lr 0.02262
Train [24][3190/3239]	Time 0.585 (0.908)	Data Time 0.000 (0.010)	Loss 3.0010 (3.2598)	Entropy 0.88691 (0.89348)	Top-1 acc 46.094 (46.212)	Top-5 acc 77.344 (69.967)	lr 0.02262
Train [24][3200/3239]	Time 0.549 (0.907)	Data Time 0.000 (0.010)	Loss 3.1964 (3.2599)	Entropy 0.88761 (0.89346)	Top-1 acc 46.094 (46.208)	Top-5 acc 73.438 (69.964)	lr 0.02262
Train [24][3210/3239]	Time 0.591 (0.907)	Data Time 0.000 (0.010)	Loss 3.2399 (3.2598)	Entropy 0.88786 (0.89344)	Top-1 acc 47.656 (46.210)	Top-5 acc 71.875 (69.968)	lr 0.02261
Train [24][3220/3239]	Time 0.696 (0.907)	Data Time 0.000 (0.010)	Loss 3.1579 (3.2596)	Entropy 0.88801 (0.89343)	Top-1 acc 50.000 (46.215)	Top-5 acc 71.484 (69.970)	lr 0.02261
Train [24][3230/3239]	Time 0.605 (0.907)	Data Time 0.000 (0.010)	Loss 3.3164 (3.2597)	Entropy 0.88816 (0.89341)	Top-1 acc 44.922 (46.212)	Top-5 acc 68.750 (69.969)	lr 0.02261
Train [24][3239/3239]	Time 1.476 (0.907)	Data Time 0.000 (0.010)	Loss 3.6461 (3.2597)	Entropy 0.88847 (0.89340)	Top-1 acc 39.506 (46.213)	Top-5 acc 58.025 (69.971)	lr 0.02261
==========Valid [24/120]	loss 1.979	top-1 acc 55.834 (55.834)	top-5 acc 78.798	Train top-1 46.213	top-5 69.971	Entropy 0.88847	Latency-None: 0.000ms	Flops: 539.76M
Train [25][0/3239]	Time 23.049 (23.049)	Data Time 21.531 (21.531)	Loss 3.0294 (3.0294)	Entropy 0.88860 (0.88860)	Top-1 acc 50.000 (50.000)	Top-5 acc 75.000 (75.000)	lr 0.02261
Train [25][10/3239]	Time 0.589 (3.011)	Data Time 0.001 (2.036)	Loss 3.2550 (3.1690)	Entropy 0.88885 (0.88868)	Top-1 acc 50.391 (48.082)	Top-5 acc 71.875 (72.017)	lr 0.02261
Train [25][20/3239]	Time 0.607 (1.980)	Data Time 0.001 (1.067)	Loss 3.0956 (3.1741)	Entropy 0.88862 (0.88873)	Top-1 acc 49.609 (48.084)	Top-5 acc 73.438 (72.154)	lr 0.02261
Train [25][30/3239]	Time 0.453 (1.615)	Data Time 0.001 (0.724)	Loss 2.8598 (3.1854)	Entropy 0.88849 (0.88870)	Top-1 acc 56.250 (47.933)	Top-5 acc 78.906 (71.963)	lr 0.02261
Train [25][40/3239]	Time 0.599 (1.425)	Data Time 0.001 (0.548)	Loss 3.2794 (3.1986)	Entropy 0.88865 (0.88865)	Top-1 acc 42.578 (47.590)	Top-5 acc 69.141 (71.580)	lr 0.02261
Train [25][50/3239]	Time 0.590 (1.311)	Data Time 0.001 (0.441)	Loss 3.2241 (3.1986)	Entropy 0.88856 (0.88866)	Top-1 acc 44.531 (47.580)	Top-5 acc 73.047 (71.576)	lr 0.02261
Train [25][60/3239]	Time 0.619 (1.237)	Data Time 0.001 (0.369)	Loss 3.1084 (3.1959)	Entropy 0.88829 (0.88864)	Top-1 acc 49.609 (47.586)	Top-5 acc 73.438 (71.523)	lr 0.02261
Train [25][70/3239]	Time 0.617 (1.183)	Data Time 0.001 (0.317)	Loss 3.1545 (3.2002)	Entropy 0.88801 (0.88856)	Top-1 acc 51.953 (47.453)	Top-5 acc 70.312 (71.314)	lr 0.02261
Train [25][80/3239]	Time 0.573 (1.142)	Data Time 0.001 (0.278)	Loss 3.2835 (3.2037)	Entropy 0.88793 (0.88850)	Top-1 acc 45.703 (47.425)	Top-5 acc 69.922 (71.166)	lr 0.02261
Train [25][90/3239]	Time 0.582 (1.111)	Data Time 0.002 (0.248)	Loss 3.2280 (3.2087)	Entropy 0.88797 (0.88844)	Top-1 acc 44.531 (47.236)	Top-5 acc 72.656 (71.188)	lr 0.02261
Train [25][100/3239]	Time 0.590 (1.086)	Data Time 0.001 (0.223)	Loss 3.3835 (3.2171)	Entropy 0.88801 (0.88840)	Top-1 acc 48.438 (47.196)	Top-5 acc 67.188 (70.962)	lr 0.02261
Train [25][110/3239]	Time 0.597 (1.066)	Data Time 0.001 (0.203)	Loss 3.1180 (3.2219)	Entropy 0.88776 (0.88837)	Top-1 acc 51.172 (47.174)	Top-5 acc 71.875 (70.872)	lr 0.02261
Train [25][120/3239]	Time 0.658 (1.052)	Data Time 0.001 (0.187)	Loss 3.2927 (3.2227)	Entropy 0.88795 (0.88832)	Top-1 acc 45.703 (47.120)	Top-5 acc 69.531 (70.897)	lr 0.02261
Train [25][130/3239]	Time 0.609 (1.036)	Data Time 0.001 (0.173)	Loss 3.5520 (3.2268)	Entropy 0.88751 (0.88828)	Top-1 acc 41.406 (47.042)	Top-5 acc 63.281 (70.730)	lr 0.02260
Train [25][140/3239]	Time 0.617 (1.024)	Data Time 0.001 (0.161)	Loss 3.3606 (3.2293)	Entropy 0.88742 (0.88822)	Top-1 acc 43.359 (47.027)	Top-5 acc 67.969 (70.695)	lr 0.02260
Train [25][150/3239]	Time 0.614 (1.014)	Data Time 0.001 (0.150)	Loss 3.0854 (3.2266)	Entropy 0.88694 (0.88817)	Top-1 acc 51.172 (47.074)	Top-5 acc 73.828 (70.765)	lr 0.02260
Train [25][160/3239]	Time 0.646 (1.156)	Data Time 0.002 (0.141)	Loss 3.4257 (3.2296)	Entropy 0.88703 (0.88809)	Top-1 acc 44.141 (47.030)	Top-5 acc 67.969 (70.757)	lr 0.02260
Train [25][170/3239]	Time 0.481 (1.137)	Data Time 0.001 (0.133)	Loss 3.0800 (3.2275)	Entropy 0.88742 (0.88803)	Top-1 acc 49.219 (47.062)	Top-5 acc 73.047 (70.776)	lr 0.02260
Train [25][180/3239]	Time 0.630 (1.120)	Data Time 0.001 (0.126)	Loss 3.1491 (3.2296)	Entropy 0.88693 (0.88800)	Top-1 acc 49.609 (46.957)	Top-5 acc 71.875 (70.690)	lr 0.02260
Train [25][190/3239]	Time 0.599 (1.106)	Data Time 0.001 (0.119)	Loss 3.1906 (3.2266)	Entropy 0.88656 (0.88794)	Top-1 acc 49.609 (47.022)	Top-5 acc 71.484 (70.752)	lr 0.02260
Train [25][200/3239]	Time 0.574 (1.093)	Data Time 0.002 (0.113)	Loss 3.3023 (3.2284)	Entropy 0.88641 (0.88787)	Top-1 acc 44.531 (46.982)	Top-5 acc 70.703 (70.738)	lr 0.02260
Train [25][210/3239]	Time 0.588 (1.081)	Data Time 0.001 (0.108)	Loss 2.9539 (3.2279)	Entropy 0.88665 (0.88780)	Top-1 acc 53.125 (47.006)	Top-5 acc 75.391 (70.753)	lr 0.02260
Train [25][220/3239]	Time 0.603 (1.071)	Data Time 0.001 (0.103)	Loss 3.1329 (3.2252)	Entropy 0.88641 (0.88775)	Top-1 acc 50.781 (47.066)	Top-5 acc 72.266 (70.823)	lr 0.02260
Train [25][230/3239]	Time 0.607 (1.062)	Data Time 0.001 (0.099)	Loss 3.0763 (3.2267)	Entropy 0.88616 (0.88769)	Top-1 acc 50.781 (46.990)	Top-5 acc 75.000 (70.791)	lr 0.02260
Train [25][240/3239]	Time 0.608 (1.053)	Data Time 0.001 (0.095)	Loss 3.3947 (3.2284)	Entropy 0.88591 (0.88762)	Top-1 acc 46.094 (46.940)	Top-5 acc 65.234 (70.774)	lr 0.02260
Train [25][250/3239]	Time 0.631 (1.045)	Data Time 0.001 (0.091)	Loss 3.2465 (3.2272)	Entropy 0.88617 (0.88756)	Top-1 acc 46.094 (46.953)	Top-5 acc 70.703 (70.776)	lr 0.02260
Train [25][260/3239]	Time 0.602 (1.038)	Data Time 0.001 (0.088)	Loss 3.1862 (3.2270)	Entropy 0.88604 (0.88750)	Top-1 acc 47.656 (46.935)	Top-5 acc 72.266 (70.769)	lr 0.02260
Train [25][270/3239]	Time 0.621 (1.031)	Data Time 0.001 (0.085)	Loss 3.3557 (3.2281)	Entropy 0.88581 (0.88744)	Top-1 acc 45.703 (46.891)	Top-5 acc 67.578 (70.726)	lr 0.02260
Train [25][280/3239]	Time 0.722 (1.026)	Data Time 0.001 (0.082)	Loss 3.2166 (3.2285)	Entropy 0.88548 (0.88738)	Top-1 acc 48.047 (46.917)	Top-5 acc 70.703 (70.725)	lr 0.02260
Train [25][290/3239]	Time 0.632 (1.020)	Data Time 0.001 (0.079)	Loss 3.2451 (3.2282)	Entropy 0.88499 (0.88731)	Top-1 acc 45.703 (46.917)	Top-5 acc 69.141 (70.725)	lr 0.02260
Train [25][300/3239]	Time 0.610 (1.015)	Data Time 0.001 (0.076)	Loss 3.3757 (3.2279)	Entropy 0.88533 (0.88724)	Top-1 acc 41.016 (46.920)	Top-5 acc 66.016 (70.733)	lr 0.02259
Train [25][310/3239]	Time 0.619 (1.010)	Data Time 0.002 (0.074)	Loss 3.3822 (3.2281)	Entropy 0.88533 (0.88718)	Top-1 acc 46.094 (46.934)	Top-5 acc 67.188 (70.733)	lr 0.02259
Train [25][320/3239]	Time 0.466 (1.005)	Data Time 0.001 (0.072)	Loss 3.3025 (3.2294)	Entropy 0.88522 (0.88712)	Top-1 acc 44.141 (46.921)	Top-5 acc 66.797 (70.686)	lr 0.02259
Train [25][330/3239]	Time 0.594 (1.000)	Data Time 0.001 (0.070)	Loss 3.2277 (3.2284)	Entropy 0.88508 (0.88706)	Top-1 acc 46.094 (46.934)	Top-5 acc 73.047 (70.682)	lr 0.02259
Train [25][340/3239]	Time 0.563 (0.996)	Data Time 0.002 (0.068)	Loss 3.3899 (3.2289)	Entropy 0.88519 (0.88701)	Top-1 acc 41.406 (46.902)	Top-5 acc 66.016 (70.694)	lr 0.02259
Train [25][350/3239]	Time 0.661 (0.990)	Data Time 0.001 (0.066)	Loss 3.3928 (3.2298)	Entropy 0.88530 (0.88696)	Top-1 acc 42.578 (46.869)	Top-5 acc 69.531 (70.670)	lr 0.02259
Train [25][360/3239]	Time 0.610 (0.987)	Data Time 0.001 (0.064)	Loss 3.3474 (3.2321)	Entropy 0.88556 (0.88692)	Top-1 acc 44.141 (46.805)	Top-5 acc 68.750 (70.635)	lr 0.02259
Train [25][370/3239]	Time 0.586 (0.983)	Data Time 0.001 (0.062)	Loss 3.3399 (3.2326)	Entropy 0.88500 (0.88687)	Top-1 acc 46.484 (46.808)	Top-5 acc 69.141 (70.645)	lr 0.02259
Train [25][380/3239]	Time 0.613 (0.980)	Data Time 0.001 (0.061)	Loss 3.3606 (3.2335)	Entropy 0.88539 (0.88683)	Top-1 acc 42.188 (46.791)	Top-5 acc 67.969 (70.623)	lr 0.02259
Train [25][390/3239]	Time 0.582 (0.976)	Data Time 0.001 (0.059)	Loss 3.2606 (3.2325)	Entropy 0.88474 (0.88678)	Top-1 acc 48.047 (46.794)	Top-5 acc 70.312 (70.624)	lr 0.02259
Train [25][400/3239]	Time 0.585 (0.974)	Data Time 0.001 (0.058)	Loss 3.0667 (3.2317)	Entropy 0.88457 (0.88673)	Top-1 acc 50.781 (46.804)	Top-5 acc 75.000 (70.633)	lr 0.02259
Train [25][410/3239]	Time 0.603 (0.971)	Data Time 0.001 (0.056)	Loss 2.8600 (3.2317)	Entropy 0.88391 (0.88667)	Top-1 acc 52.734 (46.793)	Top-5 acc 77.344 (70.624)	lr 0.02259
Train [25][420/3239]	Time 0.609 (0.969)	Data Time 0.001 (0.055)	Loss 3.3288 (3.2322)	Entropy 0.88404 (0.88661)	Top-1 acc 48.828 (46.796)	Top-5 acc 69.141 (70.617)	lr 0.02259
Train [25][430/3239]	Time 0.591 (0.966)	Data Time 0.001 (0.054)	Loss 3.1601 (3.2312)	Entropy 0.88413 (0.88655)	Top-1 acc 47.266 (46.828)	Top-5 acc 72.656 (70.631)	lr 0.02259
Train [25][440/3239]	Time 0.751 (0.964)	Data Time 0.001 (0.053)	Loss 3.2761 (3.2309)	Entropy 0.88392 (0.88649)	Top-1 acc 42.578 (46.832)	Top-5 acc 71.875 (70.631)	lr 0.02259
Train [25][450/3239]	Time 0.623 (0.962)	Data Time 0.001 (0.052)	Loss 3.1029 (3.2300)	Entropy 0.88343 (0.88643)	Top-1 acc 53.125 (46.846)	Top-5 acc 72.656 (70.655)	lr 0.02259
Train [25][460/3239]	Time 0.605 (0.960)	Data Time 0.001 (0.050)	Loss 3.1341 (3.2311)	Entropy 0.88319 (0.88637)	Top-1 acc 49.609 (46.820)	Top-5 acc 71.484 (70.622)	lr 0.02259
Train [25][470/3239]	Time 0.579 (0.958)	Data Time 0.001 (0.049)	Loss 3.3338 (3.2313)	Entropy 0.88301 (0.88630)	Top-1 acc 44.531 (46.818)	Top-5 acc 69.141 (70.618)	lr 0.02258
Train [25][480/3239]	Time 0.633 (0.956)	Data Time 0.001 (0.048)	Loss 3.4616 (3.2309)	Entropy 0.88313 (0.88623)	Top-1 acc 44.141 (46.829)	Top-5 acc 64.453 (70.619)	lr 0.02258
Train [25][490/3239]	Time 0.609 (0.954)	Data Time 0.001 (0.047)	Loss 3.0576 (3.2296)	Entropy 0.88273 (0.88617)	Top-1 acc 47.266 (46.871)	Top-5 acc 75.000 (70.647)	lr 0.02258
Train [25][500/3239]	Time 0.587 (0.952)	Data Time 0.001 (0.047)	Loss 3.3129 (3.2290)	Entropy 0.88295 (0.88610)	Top-1 acc 43.359 (46.883)	Top-5 acc 70.312 (70.671)	lr 0.02258
Train [25][510/3239]	Time 0.655 (0.950)	Data Time 0.001 (0.046)	Loss 3.2246 (3.2292)	Entropy 0.88300 (0.88604)	Top-1 acc 46.484 (46.867)	Top-5 acc 68.750 (70.674)	lr 0.02258
Train [25][520/3239]	Time 0.569 (0.948)	Data Time 0.001 (0.045)	Loss 3.2887 (3.2278)	Entropy 0.88269 (0.88598)	Top-1 acc 44.531 (46.883)	Top-5 acc 69.141 (70.703)	lr 0.02258
Train [25][530/3239]	Time 0.613 (0.946)	Data Time 0.001 (0.044)	Loss 3.3494 (3.2269)	Entropy 0.88259 (0.88592)	Top-1 acc 47.266 (46.911)	Top-5 acc 68.359 (70.725)	lr 0.02258
Train [25][540/3239]	Time 0.634 (0.944)	Data Time 0.001 (0.043)	Loss 3.2159 (3.2279)	Entropy 0.88279 (0.88586)	Top-1 acc 47.266 (46.879)	Top-5 acc 72.656 (70.705)	lr 0.02258
Train [25][550/3239]	Time 0.589 (0.942)	Data Time 0.001 (0.043)	Loss 3.3358 (3.2286)	Entropy 0.88286 (0.88580)	Top-1 acc 44.531 (46.879)	Top-5 acc 67.188 (70.681)	lr 0.02258
Train [25][560/3239]	Time 0.605 (0.941)	Data Time 0.002 (0.042)	Loss 3.1071 (3.2284)	Entropy 0.88309 (0.88575)	Top-1 acc 50.391 (46.872)	Top-5 acc 74.219 (70.693)	lr 0.02258
Train [25][570/3239]	Time 0.590 (0.940)	Data Time 0.001 (0.041)	Loss 3.1855 (3.2290)	Entropy 0.88301 (0.88570)	Top-1 acc 51.172 (46.867)	Top-5 acc 68.359 (70.670)	lr 0.02258
Train [25][580/3239]	Time 0.612 (0.939)	Data Time 0.001 (0.041)	Loss 3.1279 (3.2292)	Entropy 0.88257 (0.88566)	Top-1 acc 46.875 (46.858)	Top-5 acc 72.656 (70.657)	lr 0.02258
Train [25][590/3239]	Time 0.615 (0.937)	Data Time 0.002 (0.040)	Loss 3.0433 (3.2289)	Entropy 0.88252 (0.88560)	Top-1 acc 50.391 (46.856)	Top-5 acc 73.438 (70.661)	lr 0.02258
Train [25][600/3239]	Time 0.599 (0.936)	Data Time 0.001 (0.039)	Loss 3.2086 (3.2286)	Entropy 0.88235 (0.88555)	Top-1 acc 45.703 (46.867)	Top-5 acc 67.188 (70.657)	lr 0.02258
Train [25][610/3239]	Time 0.607 (0.935)	Data Time 0.001 (0.039)	Loss 3.2093 (3.2281)	Entropy 0.88194 (0.88549)	Top-1 acc 47.656 (46.878)	Top-5 acc 72.266 (70.667)	lr 0.02258
Train [25][620/3239]	Time 0.618 (0.934)	Data Time 0.001 (0.038)	Loss 2.9633 (3.2276)	Entropy 0.88175 (0.88543)	Top-1 acc 51.953 (46.881)	Top-5 acc 76.562 (70.682)	lr 0.02258
Train [25][630/3239]	Time 0.609 (0.933)	Data Time 0.001 (0.037)	Loss 3.4102 (3.2273)	Entropy 0.88179 (0.88538)	Top-1 acc 45.312 (46.887)	Top-5 acc 66.406 (70.692)	lr 0.02258
Train [25][640/3239]	Time 0.601 (0.931)	Data Time 0.002 (0.037)	Loss 3.1236 (3.2277)	Entropy 0.88161 (0.88532)	Top-1 acc 51.562 (46.888)	Top-5 acc 71.875 (70.682)	lr 0.02257
Train [25][650/3239]	Time 0.599 (0.930)	Data Time 0.001 (0.036)	Loss 3.3454 (3.2278)	Entropy 0.88168 (0.88526)	Top-1 acc 48.047 (46.892)	Top-5 acc 66.406 (70.671)	lr 0.02257
Train [25][660/3239]	Time 0.589 (0.929)	Data Time 0.001 (0.036)	Loss 3.2052 (3.2279)	Entropy 0.88159 (0.88521)	Top-1 acc 51.953 (46.901)	Top-5 acc 69.531 (70.674)	lr 0.02257
Train [25][670/3239]	Time 0.756 (0.929)	Data Time 0.002 (0.035)	Loss 3.1745 (3.2269)	Entropy 0.88124 (0.88515)	Top-1 acc 46.875 (46.912)	Top-5 acc 74.219 (70.697)	lr 0.02257
Train [25][680/3239]	Time 0.611 (0.927)	Data Time 0.001 (0.035)	Loss 3.1842 (3.2280)	Entropy 0.88115 (0.88509)	Top-1 acc 50.000 (46.892)	Top-5 acc 70.703 (70.682)	lr 0.02257
Train [25][690/3239]	Time 0.624 (0.926)	Data Time 0.001 (0.034)	Loss 3.1259 (3.2278)	Entropy 0.88106 (0.88503)	Top-1 acc 46.094 (46.890)	Top-5 acc 73.438 (70.688)	lr 0.02257
Train [25][700/3239]	Time 0.442 (0.924)	Data Time 0.001 (0.034)	Loss 3.3859 (3.2274)	Entropy 0.88146 (0.88498)	Top-1 acc 44.141 (46.907)	Top-5 acc 67.969 (70.691)	lr 0.02257
Train [25][710/3239]	Time 0.567 (0.923)	Data Time 0.001 (0.033)	Loss 3.2976 (3.2281)	Entropy 0.88109 (0.88493)	Top-1 acc 46.094 (46.907)	Top-5 acc 69.531 (70.669)	lr 0.02257
Train [25][720/3239]	Time 0.609 (0.922)	Data Time 0.001 (0.033)	Loss 3.1364 (3.2272)	Entropy 0.88035 (0.88487)	Top-1 acc 51.953 (46.933)	Top-5 acc 70.703 (70.684)	lr 0.02257
Train [25][730/3239]	Time 0.643 (0.922)	Data Time 0.001 (0.033)	Loss 3.2740 (3.2276)	Entropy 0.88064 (0.88481)	Top-1 acc 44.922 (46.950)	Top-5 acc 66.797 (70.671)	lr 0.02257
Train [25][740/3239]	Time 0.700 (0.921)	Data Time 0.001 (0.032)	Loss 3.3025 (3.2279)	Entropy 0.87994 (0.88475)	Top-1 acc 48.047 (46.948)	Top-5 acc 69.531 (70.666)	lr 0.02257
Train [25][750/3239]	Time 0.600 (0.920)	Data Time 0.002 (0.032)	Loss 3.2555 (3.2276)	Entropy 0.87988 (0.88469)	Top-1 acc 49.609 (46.958)	Top-5 acc 73.828 (70.677)	lr 0.02257
Train [25][760/3239]	Time 0.598 (0.919)	Data Time 0.001 (0.031)	Loss 3.5387 (3.2276)	Entropy 0.88021 (0.88463)	Top-1 acc 41.016 (46.958)	Top-5 acc 64.844 (70.669)	lr 0.02257
Train [25][770/3239]	Time 0.614 (0.918)	Data Time 0.001 (0.031)	Loss 3.4619 (3.2276)	Entropy 0.87984 (0.88457)	Top-1 acc 41.797 (46.954)	Top-5 acc 69.922 (70.686)	lr 0.02257
Train [25][780/3239]	Time 0.649 (0.918)	Data Time 0.001 (0.031)	Loss 3.2970 (3.2286)	Entropy 0.87973 (0.88451)	Top-1 acc 42.969 (46.927)	Top-5 acc 71.094 (70.660)	lr 0.02257
Train [25][790/3239]	Time 0.613 (0.917)	Data Time 0.001 (0.030)	Loss 3.2476 (3.2294)	Entropy 0.88000 (0.88445)	Top-1 acc 43.750 (46.915)	Top-5 acc 68.750 (70.640)	lr 0.02257
Train [25][800/3239]	Time 0.569 (0.916)	Data Time 0.002 (0.030)	Loss 3.1069 (3.2285)	Entropy 0.88002 (0.88439)	Top-1 acc 50.781 (46.939)	Top-5 acc 73.438 (70.660)	lr 0.02257
Train [25][810/3239]	Time 0.771 (0.945)	Data Time 0.046 (0.030)	Loss 3.2156 (3.2285)	Entropy 0.88057 (0.88434)	Top-1 acc 47.656 (46.922)	Top-5 acc 68.359 (70.653)	lr 0.02256
Train [25][820/3239]	Time 0.626 (0.944)	Data Time 0.002 (0.029)	Loss 3.1300 (3.2280)	Entropy 0.88010 (0.88429)	Top-1 acc 48.438 (46.921)	Top-5 acc 75.000 (70.669)	lr 0.02256
Train [25][830/3239]	Time 0.725 (0.942)	Data Time 0.001 (0.029)	Loss 3.1050 (3.2281)	Entropy 0.88010 (0.88424)	Top-1 acc 50.000 (46.916)	Top-5 acc 75.000 (70.670)	lr 0.02256
Train [25][840/3239]	Time 0.612 (0.942)	Data Time 0.001 (0.029)	Loss 3.0488 (3.2288)	Entropy 0.87993 (0.88419)	Top-1 acc 51.172 (46.904)	Top-5 acc 76.172 (70.662)	lr 0.02256
Train [25][850/3239]	Time 0.589 (0.940)	Data Time 0.001 (0.028)	Loss 3.5316 (3.2294)	Entropy 0.87984 (0.88414)	Top-1 acc 40.625 (46.893)	Top-5 acc 63.672 (70.652)	lr 0.02256
Train [25][860/3239]	Time 0.601 (0.940)	Data Time 0.001 (0.028)	Loss 3.1972 (3.2301)	Entropy 0.87963 (0.88409)	Top-1 acc 50.781 (46.888)	Top-5 acc 68.359 (70.638)	lr 0.02256
Train [25][870/3239]	Time 0.590 (0.939)	Data Time 0.001 (0.028)	Loss 3.2678 (3.2300)	Entropy 0.87918 (0.88403)	Top-1 acc 46.094 (46.890)	Top-5 acc 71.094 (70.633)	lr 0.02256
Train [25][880/3239]	Time 0.600 (0.938)	Data Time 0.001 (0.027)	Loss 3.2303 (3.2297)	Entropy 0.87897 (0.88398)	Top-1 acc 49.609 (46.887)	Top-5 acc 71.484 (70.638)	lr 0.02256
Train [25][890/3239]	Time 0.655 (0.937)	Data Time 0.001 (0.027)	Loss 3.1490 (3.2296)	Entropy 0.87786 (0.88392)	Top-1 acc 48.438 (46.899)	Top-5 acc 72.656 (70.650)	lr 0.02256
Train [25][900/3239]	Time 0.686 (0.936)	Data Time 0.001 (0.027)	Loss 3.1152 (3.2296)	Entropy 0.87732 (0.88385)	Top-1 acc 46.094 (46.888)	Top-5 acc 75.391 (70.649)	lr 0.02256
Train [25][910/3239]	Time 0.626 (0.935)	Data Time 0.001 (0.027)	Loss 3.1226 (3.2299)	Entropy 0.87735 (0.88378)	Top-1 acc 51.562 (46.879)	Top-5 acc 71.094 (70.638)	lr 0.02256
Train [25][920/3239]	Time 0.622 (0.934)	Data Time 0.001 (0.026)	Loss 3.3145 (3.2303)	Entropy 0.87702 (0.88371)	Top-1 acc 47.266 (46.871)	Top-5 acc 69.141 (70.632)	lr 0.02256
Train [25][930/3239]	Time 0.599 (0.934)	Data Time 0.002 (0.026)	Loss 3.0087 (3.2294)	Entropy 0.87682 (0.88363)	Top-1 acc 49.219 (46.888)	Top-5 acc 70.703 (70.641)	lr 0.02256
Train [25][940/3239]	Time 0.608 (0.933)	Data Time 0.001 (0.026)	Loss 3.2108 (3.2295)	Entropy 0.87694 (0.88356)	Top-1 acc 48.828 (46.882)	Top-5 acc 74.219 (70.637)	lr 0.02256
Train [25][950/3239]	Time 0.609 (0.932)	Data Time 0.001 (0.026)	Loss 3.3160 (3.2303)	Entropy 0.87692 (0.88349)	Top-1 acc 42.578 (46.863)	Top-5 acc 68.750 (70.612)	lr 0.02256
Train [25][960/3239]	Time 0.613 (0.932)	Data Time 0.001 (0.025)	Loss 3.0502 (3.2309)	Entropy 0.87664 (0.88342)	Top-1 acc 51.953 (46.863)	Top-5 acc 75.781 (70.597)	lr 0.02256
Train [25][970/3239]	Time 0.575 (0.931)	Data Time 0.001 (0.025)	Loss 3.1061 (3.2301)	Entropy 0.87611 (0.88335)	Top-1 acc 45.703 (46.877)	Top-5 acc 69.922 (70.616)	lr 0.02255
Train [25][980/3239]	Time 0.610 (0.930)	Data Time 0.001 (0.025)	Loss 3.2846 (3.2303)	Entropy 0.87636 (0.88328)	Top-1 acc 44.531 (46.864)	Top-5 acc 68.359 (70.615)	lr 0.02255
Train [25][990/3239]	Time 0.676 (0.929)	Data Time 0.002 (0.025)	Loss 3.3978 (3.2306)	Entropy 0.87633 (0.88321)	Top-1 acc 42.188 (46.860)	Top-5 acc 69.922 (70.613)	lr 0.02255
Train [25][1000/3239]	Time 0.625 (0.929)	Data Time 0.001 (0.024)	Loss 3.2480 (3.2308)	Entropy 0.87639 (0.88314)	Top-1 acc 42.578 (46.842)	Top-5 acc 69.531 (70.612)	lr 0.02255
Train [25][1010/3239]	Time 0.639 (0.927)	Data Time 0.001 (0.024)	Loss 3.3887 (3.2317)	Entropy 0.87602 (0.88307)	Top-1 acc 42.969 (46.820)	Top-5 acc 70.312 (70.597)	lr 0.02255
Train [25][1020/3239]	Time 0.571 (0.927)	Data Time 0.001 (0.024)	Loss 3.3213 (3.2321)	Entropy 0.87560 (0.88300)	Top-1 acc 46.484 (46.811)	Top-5 acc 68.750 (70.583)	lr 0.02255
Train [25][1030/3239]	Time 0.585 (0.926)	Data Time 0.002 (0.024)	Loss 3.1603 (3.2317)	Entropy 0.87559 (0.88293)	Top-1 acc 51.172 (46.823)	Top-5 acc 71.094 (70.588)	lr 0.02255
Train [25][1040/3239]	Time 0.583 (0.926)	Data Time 0.001 (0.024)	Loss 3.0403 (3.2313)	Entropy 0.87532 (0.88285)	Top-1 acc 51.953 (46.842)	Top-5 acc 74.219 (70.597)	lr 0.02255
Train [25][1050/3239]	Time 0.605 (0.925)	Data Time 0.001 (0.023)	Loss 3.0088 (3.2309)	Entropy 0.87519 (0.88278)	Top-1 acc 52.344 (46.854)	Top-5 acc 74.609 (70.607)	lr 0.02255
Train [25][1060/3239]	Time 0.720 (0.924)	Data Time 0.001 (0.023)	Loss 3.1354 (3.2309)	Entropy 0.87499 (0.88271)	Top-1 acc 43.359 (46.849)	Top-5 acc 72.656 (70.610)	lr 0.02255
Train [25][1070/3239]	Time 0.622 (0.924)	Data Time 0.002 (0.023)	Loss 3.2736 (3.2310)	Entropy 0.87482 (0.88264)	Top-1 acc 42.969 (46.843)	Top-5 acc 69.531 (70.607)	lr 0.02255
Train [25][1080/3239]	Time 0.592 (0.923)	Data Time 0.001 (0.023)	Loss 3.3152 (3.2315)	Entropy 0.87490 (0.88257)	Top-1 acc 47.266 (46.833)	Top-5 acc 69.141 (70.603)	lr 0.02255
Train [25][1090/3239]	Time 0.596 (0.923)	Data Time 0.001 (0.023)	Loss 3.5931 (3.2319)	Entropy 0.87478 (0.88250)	Top-1 acc 40.234 (46.821)	Top-5 acc 64.062 (70.588)	lr 0.02255
Train [25][1100/3239]	Time 0.620 (0.922)	Data Time 0.001 (0.022)	Loss 3.2627 (3.2320)	Entropy 0.87466 (0.88243)	Top-1 acc 46.875 (46.816)	Top-5 acc 70.312 (70.587)	lr 0.02255
Train [25][1110/3239]	Time 0.603 (0.922)	Data Time 0.001 (0.022)	Loss 3.4203 (3.2326)	Entropy 0.87420 (0.88235)	Top-1 acc 43.750 (46.802)	Top-5 acc 64.453 (70.567)	lr 0.02255
Train [25][1120/3239]	Time 0.601 (0.921)	Data Time 0.001 (0.022)	Loss 3.2701 (3.2325)	Entropy 0.87375 (0.88228)	Top-1 acc 47.656 (46.809)	Top-5 acc 69.531 (70.574)	lr 0.02255
Train [25][1130/3239]	Time 0.709 (0.920)	Data Time 0.001 (0.022)	Loss 3.2463 (3.2330)	Entropy 0.87396 (0.88221)	Top-1 acc 47.656 (46.800)	Top-5 acc 71.094 (70.559)	lr 0.02255
Train [25][1140/3239]	Time 0.578 (0.920)	Data Time 0.001 (0.022)	Loss 3.1863 (3.2327)	Entropy 0.87369 (0.88213)	Top-1 acc 48.828 (46.806)	Top-5 acc 71.875 (70.565)	lr 0.02254
Train [25][1150/3239]	Time 0.586 (0.919)	Data Time 0.001 (0.021)	Loss 3.2480 (3.2333)	Entropy 0.87341 (0.88206)	Top-1 acc 46.875 (46.789)	Top-5 acc 69.922 (70.549)	lr 0.02254
Train [25][1160/3239]	Time 0.596 (0.919)	Data Time 0.001 (0.021)	Loss 3.3268 (3.2332)	Entropy 0.87363 (0.88199)	Top-1 acc 43.359 (46.794)	Top-5 acc 69.141 (70.547)	lr 0.02254
Train [25][1170/3239]	Time 0.585 (0.918)	Data Time 0.001 (0.021)	Loss 3.2547 (3.2335)	Entropy 0.87389 (0.88191)	Top-1 acc 43.750 (46.789)	Top-5 acc 67.578 (70.542)	lr 0.02254
Train [25][1180/3239]	Time 0.487 (0.917)	Data Time 0.002 (0.021)	Loss 3.2239 (3.2332)	Entropy 0.87371 (0.88185)	Top-1 acc 48.438 (46.792)	Top-5 acc 69.141 (70.543)	lr 0.02254
Train [25][1190/3239]	Time 0.535 (0.917)	Data Time 0.003 (0.021)	Loss 3.3581 (3.2335)	Entropy 0.87390 (0.88178)	Top-1 acc 44.531 (46.783)	Top-5 acc 69.531 (70.529)	lr 0.02254
Train [25][1200/3239]	Time 0.590 (0.916)	Data Time 0.003 (0.021)	Loss 3.1788 (3.2335)	Entropy 0.87361 (0.88171)	Top-1 acc 45.312 (46.788)	Top-5 acc 69.531 (70.536)	lr 0.02254
Train [25][1210/3239]	Time 0.606 (0.916)	Data Time 0.001 (0.020)	Loss 3.1655 (3.2337)	Entropy 0.87325 (0.88164)	Top-1 acc 45.703 (46.780)	Top-5 acc 70.703 (70.532)	lr 0.02254
Train [25][1220/3239]	Time 0.654 (0.915)	Data Time 0.001 (0.020)	Loss 3.1749 (3.2336)	Entropy 0.87334 (0.88158)	Top-1 acc 46.875 (46.775)	Top-5 acc 71.094 (70.530)	lr 0.02254
Train [25][1230/3239]	Time 0.622 (0.915)	Data Time 0.001 (0.020)	Loss 3.2075 (3.2333)	Entropy 0.87376 (0.88151)	Top-1 acc 46.875 (46.779)	Top-5 acc 70.312 (70.531)	lr 0.02254
Train [25][1240/3239]	Time 0.655 (0.914)	Data Time 0.027 (0.020)	Loss 3.1645 (3.2330)	Entropy 0.87382 (0.88145)	Top-1 acc 50.391 (46.776)	Top-5 acc 71.094 (70.541)	lr 0.02254
Train [25][1250/3239]	Time 0.663 (0.914)	Data Time 0.001 (0.020)	Loss 3.3841 (3.2335)	Entropy 0.87387 (0.88139)	Top-1 acc 42.969 (46.769)	Top-5 acc 70.312 (70.530)	lr 0.02254
Train [25][1260/3239]	Time 0.559 (0.914)	Data Time 0.001 (0.020)	Loss 3.6148 (3.2341)	Entropy 0.87344 (0.88133)	Top-1 acc 40.234 (46.761)	Top-5 acc 62.500 (70.520)	lr 0.02254
Train [25][1270/3239]	Time 0.606 (0.913)	Data Time 0.001 (0.020)	Loss 3.2225 (3.2339)	Entropy 0.87288 (0.88126)	Top-1 acc 51.562 (46.763)	Top-5 acc 72.266 (70.529)	lr 0.02254
Train [25][1280/3239]	Time 0.591 (0.913)	Data Time 0.001 (0.019)	Loss 3.1825 (3.2342)	Entropy 0.87312 (0.88120)	Top-1 acc 48.047 (46.761)	Top-5 acc 71.875 (70.524)	lr 0.02254
Train [25][1290/3239]	Time 0.685 (0.912)	Data Time 0.001 (0.019)	Loss 3.4522 (3.2345)	Entropy 0.87303 (0.88113)	Top-1 acc 42.578 (46.749)	Top-5 acc 67.188 (70.514)	lr 0.02254
Train [25][1300/3239]	Time 0.646 (0.912)	Data Time 0.001 (0.019)	Loss 3.0195 (3.2342)	Entropy 0.87304 (0.88107)	Top-1 acc 50.391 (46.749)	Top-5 acc 75.000 (70.521)	lr 0.02253
Train [25][1310/3239]	Time 0.602 (0.911)	Data Time 0.001 (0.019)	Loss 3.3248 (3.2344)	Entropy 0.87264 (0.88101)	Top-1 acc 42.969 (46.735)	Top-5 acc 67.188 (70.518)	lr 0.02253
Train [25][1320/3239]	Time 0.600 (0.911)	Data Time 0.001 (0.019)	Loss 3.2509 (3.2343)	Entropy 0.87266 (0.88095)	Top-1 acc 44.922 (46.732)	Top-5 acc 72.656 (70.522)	lr 0.02253
Train [25][1330/3239]	Time 0.631 (0.910)	Data Time 0.001 (0.019)	Loss 3.3090 (3.2340)	Entropy 0.87251 (0.88089)	Top-1 acc 46.484 (46.736)	Top-5 acc 69.922 (70.528)	lr 0.02253
Train [25][1340/3239]	Time 0.593 (0.910)	Data Time 0.001 (0.019)	Loss 3.0931 (3.2337)	Entropy 0.87221 (0.88082)	Top-1 acc 53.906 (46.738)	Top-5 acc 74.219 (70.533)	lr 0.02253
Train [25][1350/3239]	Time 0.634 (0.910)	Data Time 0.001 (0.019)	Loss 3.1602 (3.2343)	Entropy 0.87180 (0.88076)	Top-1 acc 49.219 (46.723)	Top-5 acc 71.484 (70.516)	lr 0.02253
Train [25][1360/3239]	Time 0.601 (0.909)	Data Time 0.001 (0.018)	Loss 3.0825 (3.2347)	Entropy 0.87180 (0.88069)	Top-1 acc 48.828 (46.713)	Top-5 acc 74.219 (70.506)	lr 0.02253
Train [25][1370/3239]	Time 0.632 (0.908)	Data Time 0.001 (0.018)	Loss 3.4258 (3.2351)	Entropy 0.87130 (0.88063)	Top-1 acc 42.188 (46.705)	Top-5 acc 67.578 (70.493)	lr 0.02253
Train [25][1380/3239]	Time 0.606 (0.908)	Data Time 0.001 (0.018)	Loss 3.0583 (3.2348)	Entropy 0.87087 (0.88056)	Top-1 acc 51.953 (46.712)	Top-5 acc 75.391 (70.500)	lr 0.02253
Train [25][1390/3239]	Time 0.651 (0.908)	Data Time 0.002 (0.018)	Loss 2.9335 (3.2345)	Entropy 0.87066 (0.88049)	Top-1 acc 53.906 (46.722)	Top-5 acc 76.953 (70.508)	lr 0.02253
Train [25][1400/3239]	Time 0.588 (0.907)	Data Time 0.001 (0.018)	Loss 3.1300 (3.2346)	Entropy 0.87081 (0.88042)	Top-1 acc 49.219 (46.718)	Top-5 acc 73.438 (70.497)	lr 0.02253
Train [25][1410/3239]	Time 0.591 (0.907)	Data Time 0.002 (0.018)	Loss 3.2944 (3.2340)	Entropy 0.87040 (0.88035)	Top-1 acc 44.922 (46.728)	Top-5 acc 71.094 (70.508)	lr 0.02253
Train [25][1420/3239]	Time 0.652 (0.907)	Data Time 0.001 (0.018)	Loss 3.1176 (3.2343)	Entropy 0.87027 (0.88028)	Top-1 acc 45.703 (46.720)	Top-5 acc 71.875 (70.506)	lr 0.02253
Train [25][1430/3239]	Time 0.599 (0.906)	Data Time 0.001 (0.018)	Loss 3.1163 (3.2341)	Entropy 0.87012 (0.88021)	Top-1 acc 49.219 (46.720)	Top-5 acc 73.828 (70.512)	lr 0.02253
Train [25][1440/3239]	Time 0.614 (0.906)	Data Time 0.001 (0.018)	Loss 3.2162 (3.2341)	Entropy 0.87010 (0.88014)	Top-1 acc 46.484 (46.716)	Top-5 acc 67.578 (70.507)	lr 0.02253
Train [25][1450/3239]	Time 0.745 (0.906)	Data Time 0.001 (0.017)	Loss 3.1765 (3.2338)	Entropy 0.86988 (0.88007)	Top-1 acc 50.391 (46.726)	Top-5 acc 70.703 (70.513)	lr 0.02253
Train [25][1460/3239]	Time 0.639 (0.906)	Data Time 0.001 (0.017)	Loss 3.0826 (3.2336)	Entropy 0.86966 (0.88000)	Top-1 acc 48.438 (46.730)	Top-5 acc 73.828 (70.513)	lr 0.02253
Train [25][1470/3239]	Time 0.610 (0.921)	Data Time 0.002 (0.017)	Loss 3.1429 (3.2334)	Entropy 0.86923 (0.87993)	Top-1 acc 48.438 (46.733)	Top-5 acc 73.438 (70.518)	lr 0.02252
Train [25][1480/3239]	Time 0.632 (0.921)	Data Time 0.001 (0.017)	Loss 3.0612 (3.2333)	Entropy 0.86902 (0.87985)	Top-1 acc 53.125 (46.735)	Top-5 acc 75.781 (70.523)	lr 0.02252
Train [25][1490/3239]	Time 0.641 (0.920)	Data Time 0.003 (0.017)	Loss 3.3071 (3.2327)	Entropy 0.86940 (0.87978)	Top-1 acc 45.312 (46.745)	Top-5 acc 68.359 (70.535)	lr 0.02252
Train [25][1500/3239]	Time 0.627 (0.920)	Data Time 0.001 (0.017)	Loss 3.2630 (3.2329)	Entropy 0.86934 (0.87971)	Top-1 acc 47.266 (46.737)	Top-5 acc 71.484 (70.538)	lr 0.02252
Train [25][1510/3239]	Time 0.642 (0.919)	Data Time 0.001 (0.017)	Loss 3.2399 (3.2331)	Entropy 0.86940 (0.87964)	Top-1 acc 45.703 (46.736)	Top-5 acc 71.094 (70.529)	lr 0.02252
Train [25][1520/3239]	Time 0.605 (0.919)	Data Time 0.001 (0.017)	Loss 3.0815 (3.2329)	Entropy 0.86907 (0.87957)	Top-1 acc 51.953 (46.745)	Top-5 acc 75.000 (70.533)	lr 0.02252
Train [25][1530/3239]	Time 0.572 (0.918)	Data Time 0.001 (0.017)	Loss 3.1405 (3.2323)	Entropy 0.86904 (0.87950)	Top-1 acc 46.484 (46.757)	Top-5 acc 73.438 (70.546)	lr 0.02252
Train [25][1540/3239]	Time 0.602 (0.918)	Data Time 0.020 (0.017)	Loss 3.3034 (3.2318)	Entropy 0.86883 (0.87944)	Top-1 acc 45.312 (46.765)	Top-5 acc 68.750 (70.553)	lr 0.02252
Train [25][1550/3239]	Time 0.620 (0.918)	Data Time 0.001 (0.016)	Loss 3.2335 (3.2321)	Entropy 0.86826 (0.87937)	Top-1 acc 46.094 (46.756)	Top-5 acc 68.750 (70.548)	lr 0.02252
Train [25][1560/3239]	Time 0.660 (0.917)	Data Time 0.001 (0.016)	Loss 3.1101 (3.2321)	Entropy 0.86795 (0.87929)	Top-1 acc 46.484 (46.757)	Top-5 acc 72.266 (70.544)	lr 0.02252
Train [25][1570/3239]	Time 0.636 (0.917)	Data Time 0.001 (0.016)	Loss 3.1057 (3.2322)	Entropy 0.86812 (0.87922)	Top-1 acc 51.172 (46.758)	Top-5 acc 72.656 (70.544)	lr 0.02252
Train [25][1580/3239]	Time 0.643 (0.916)	Data Time 0.001 (0.016)	Loss 3.4485 (3.2323)	Entropy 0.86779 (0.87915)	Top-1 acc 42.188 (46.756)	Top-5 acc 66.406 (70.539)	lr 0.02252
Train [25][1590/3239]	Time 0.611 (0.916)	Data Time 0.001 (0.016)	Loss 3.0334 (3.2320)	Entropy 0.86779 (0.87908)	Top-1 acc 50.000 (46.767)	Top-5 acc 75.781 (70.543)	lr 0.02252
Train [25][1600/3239]	Time 0.634 (0.916)	Data Time 0.001 (0.016)	Loss 3.2425 (3.2318)	Entropy 0.86802 (0.87901)	Top-1 acc 51.562 (46.771)	Top-5 acc 70.703 (70.546)	lr 0.02252
Train [25][1610/3239]	Time 0.732 (0.916)	Data Time 0.002 (0.016)	Loss 2.9709 (3.2314)	Entropy 0.86791 (0.87894)	Top-1 acc 56.641 (46.782)	Top-5 acc 73.047 (70.558)	lr 0.02252
Train [25][1620/3239]	Time 0.641 (0.915)	Data Time 0.001 (0.016)	Loss 3.2680 (3.2314)	Entropy 0.86740 (0.87887)	Top-1 acc 44.141 (46.784)	Top-5 acc 67.969 (70.552)	lr 0.02252
Train [25][1630/3239]	Time 0.595 (0.915)	Data Time 0.001 (0.016)	Loss 3.1461 (3.2315)	Entropy 0.86698 (0.87880)	Top-1 acc 48.438 (46.788)	Top-5 acc 71.484 (70.549)	lr 0.02252
Train [25][1640/3239]	Time 0.622 (0.915)	Data Time 0.001 (0.016)	Loss 3.2053 (3.2314)	Entropy 0.86662 (0.87873)	Top-1 acc 45.312 (46.789)	Top-5 acc 71.094 (70.551)	lr 0.02251
Train [25][1650/3239]	Time 0.559 (0.914)	Data Time 0.001 (0.016)	Loss 3.2715 (3.2318)	Entropy 0.86662 (0.87866)	Top-1 acc 46.875 (46.785)	Top-5 acc 69.141 (70.542)	lr 0.02251
Train [25][1660/3239]	Time 0.593 (0.914)	Data Time 0.001 (0.015)	Loss 3.4198 (3.2317)	Entropy 0.86664 (0.87858)	Top-1 acc 40.625 (46.786)	Top-5 acc 65.234 (70.542)	lr 0.02251
Train [25][1670/3239]	Time 0.604 (0.913)	Data Time 0.001 (0.015)	Loss 3.3638 (3.2319)	Entropy 0.86663 (0.87851)	Top-1 acc 44.922 (46.788)	Top-5 acc 66.406 (70.535)	lr 0.02251
Train [25][1680/3239]	Time 0.715 (0.913)	Data Time 0.002 (0.015)	Loss 3.2690 (3.2325)	Entropy 0.86654 (0.87844)	Top-1 acc 47.266 (46.773)	Top-5 acc 68.359 (70.526)	lr 0.02251
Train [25][1690/3239]	Time 0.611 (0.912)	Data Time 0.001 (0.015)	Loss 3.0602 (3.2323)	Entropy 0.86631 (0.87837)	Top-1 acc 52.344 (46.775)	Top-5 acc 73.438 (70.526)	lr 0.02251
Train [25][1700/3239]	Time 0.621 (0.912)	Data Time 0.001 (0.015)	Loss 3.2852 (3.2323)	Entropy 0.86609 (0.87830)	Top-1 acc 43.750 (46.772)	Top-5 acc 69.141 (70.525)	lr 0.02251
Train [25][1710/3239]	Time 0.651 (0.912)	Data Time 0.001 (0.015)	Loss 2.9352 (3.2320)	Entropy 0.86562 (0.87823)	Top-1 acc 48.828 (46.779)	Top-5 acc 75.391 (70.527)	lr 0.02251
Train [25][1720/3239]	Time 0.610 (0.911)	Data Time 0.001 (0.015)	Loss 3.1616 (3.2323)	Entropy 0.86576 (0.87815)	Top-1 acc 46.094 (46.767)	Top-5 acc 71.875 (70.524)	lr 0.02251
Train [25][1730/3239]	Time 0.648 (0.911)	Data Time 0.001 (0.015)	Loss 3.1816 (3.2323)	Entropy 0.86608 (0.87808)	Top-1 acc 48.047 (46.769)	Top-5 acc 73.828 (70.525)	lr 0.02251
Train [25][1740/3239]	Time 0.640 (0.911)	Data Time 0.001 (0.015)	Loss 3.0414 (3.2324)	Entropy 0.86626 (0.87801)	Top-1 acc 52.734 (46.770)	Top-5 acc 73.438 (70.521)	lr 0.02251
Train [25][1750/3239]	Time 0.594 (0.910)	Data Time 0.001 (0.015)	Loss 3.1615 (3.2322)	Entropy 0.86618 (0.87795)	Top-1 acc 48.047 (46.771)	Top-5 acc 73.047 (70.526)	lr 0.02251
Train [25][1760/3239]	Time 0.587 (0.910)	Data Time 0.001 (0.015)	Loss 3.1043 (3.2320)	Entropy 0.86645 (0.87788)	Top-1 acc 49.609 (46.779)	Top-5 acc 73.828 (70.531)	lr 0.02251
Train [25][1770/3239]	Time 0.734 (0.910)	Data Time 0.001 (0.015)	Loss 3.2875 (3.2320)	Entropy 0.86629 (0.87782)	Top-1 acc 44.141 (46.776)	Top-5 acc 70.703 (70.528)	lr 0.02251
Train [25][1780/3239]	Time 0.591 (0.910)	Data Time 0.001 (0.015)	Loss 3.3326 (3.2322)	Entropy 0.86622 (0.87775)	Top-1 acc 48.438 (46.773)	Top-5 acc 67.578 (70.524)	lr 0.02251
Train [25][1790/3239]	Time 0.611 (0.910)	Data Time 0.001 (0.014)	Loss 3.1169 (3.2322)	Entropy 0.86600 (0.87769)	Top-1 acc 50.000 (46.777)	Top-5 acc 71.875 (70.518)	lr 0.02251
Train [25][1800/3239]	Time 0.589 (0.909)	Data Time 0.001 (0.014)	Loss 3.2659 (3.2326)	Entropy 0.86618 (0.87762)	Top-1 acc 44.531 (46.767)	Top-5 acc 71.094 (70.511)	lr 0.02250
Train [25][1810/3239]	Time 0.592 (0.909)	Data Time 0.001 (0.014)	Loss 3.3511 (3.2327)	Entropy 0.86594 (0.87756)	Top-1 acc 42.578 (46.765)	Top-5 acc 69.141 (70.511)	lr 0.02250
Train [25][1820/3239]	Time 0.606 (0.909)	Data Time 0.001 (0.014)	Loss 3.3683 (3.2328)	Entropy 0.86578 (0.87750)	Top-1 acc 42.969 (46.761)	Top-5 acc 67.969 (70.514)	lr 0.02250
Train [25][1830/3239]	Time 0.584 (0.908)	Data Time 0.001 (0.014)	Loss 3.2318 (3.2331)	Entropy 0.86558 (0.87743)	Top-1 acc 46.484 (46.754)	Top-5 acc 70.312 (70.508)	lr 0.02250
Train [25][1840/3239]	Time 0.600 (0.908)	Data Time 0.001 (0.014)	Loss 3.3702 (3.2333)	Entropy 0.86531 (0.87737)	Top-1 acc 39.453 (46.750)	Top-5 acc 68.359 (70.508)	lr 0.02250
Train [25][1850/3239]	Time 0.584 (0.908)	Data Time 0.001 (0.014)	Loss 3.2737 (3.2337)	Entropy 0.86529 (0.87730)	Top-1 acc 43.750 (46.736)	Top-5 acc 73.047 (70.501)	lr 0.02250
Train [25][1860/3239]	Time 0.609 (0.907)	Data Time 0.001 (0.014)	Loss 3.2738 (3.2337)	Entropy 0.86501 (0.87724)	Top-1 acc 46.484 (46.735)	Top-5 acc 69.531 (70.504)	lr 0.02250
Train [25][1870/3239]	Time 0.627 (0.907)	Data Time 0.001 (0.014)	Loss 3.0584 (3.2338)	Entropy 0.86477 (0.87717)	Top-1 acc 53.906 (46.737)	Top-5 acc 76.562 (70.505)	lr 0.02250
Train [25][1880/3239]	Time 0.623 (0.907)	Data Time 0.001 (0.014)	Loss 3.2036 (3.2336)	Entropy 0.86452 (0.87710)	Top-1 acc 46.484 (46.742)	Top-5 acc 69.141 (70.507)	lr 0.02250
Train [25][1890/3239]	Time 0.609 (0.907)	Data Time 0.002 (0.014)	Loss 3.4173 (3.2338)	Entropy 0.86430 (0.87704)	Top-1 acc 40.234 (46.740)	Top-5 acc 68.359 (70.505)	lr 0.02250
Train [25][1900/3239]	Time 0.614 (0.906)	Data Time 0.001 (0.014)	Loss 3.1516 (3.2342)	Entropy 0.86385 (0.87697)	Top-1 acc 47.656 (46.730)	Top-5 acc 69.922 (70.495)	lr 0.02250
Train [25][1910/3239]	Time 0.604 (0.906)	Data Time 0.002 (0.014)	Loss 3.2534 (3.2346)	Entropy 0.86381 (0.87690)	Top-1 acc 44.141 (46.720)	Top-5 acc 70.312 (70.493)	lr 0.02250
Train [25][1920/3239]	Time 0.624 (0.906)	Data Time 0.001 (0.014)	Loss 3.1262 (3.2347)	Entropy 0.86354 (0.87683)	Top-1 acc 47.656 (46.718)	Top-5 acc 73.828 (70.483)	lr 0.02250
Train [25][1930/3239]	Time 0.735 (0.906)	Data Time 0.001 (0.014)	Loss 3.2380 (3.2350)	Entropy 0.86305 (0.87676)	Top-1 acc 47.266 (46.716)	Top-5 acc 71.484 (70.481)	lr 0.02250
Train [25][1940/3239]	Time 0.610 (0.905)	Data Time 0.002 (0.014)	Loss 3.3891 (3.2349)	Entropy 0.86291 (0.87669)	Top-1 acc 44.922 (46.722)	Top-5 acc 68.359 (70.483)	lr 0.02250
Train [25][1950/3239]	Time 0.621 (0.905)	Data Time 0.002 (0.013)	Loss 3.1905 (3.2352)	Entropy 0.86311 (0.87662)	Top-1 acc 47.656 (46.715)	Top-5 acc 65.625 (70.474)	lr 0.02250
Train [25][1960/3239]	Time 0.635 (0.905)	Data Time 0.001 (0.013)	Loss 3.2792 (3.2351)	Entropy 0.86300 (0.87655)	Top-1 acc 43.750 (46.712)	Top-5 acc 70.703 (70.480)	lr 0.02250
Train [25][1970/3239]	Time 0.586 (0.905)	Data Time 0.001 (0.013)	Loss 3.4391 (3.2350)	Entropy 0.86272 (0.87648)	Top-1 acc 42.578 (46.713)	Top-5 acc 64.453 (70.479)	lr 0.02249
Train [25][1980/3239]	Time 0.597 (0.905)	Data Time 0.001 (0.013)	Loss 3.1826 (3.2351)	Entropy 0.86299 (0.87641)	Top-1 acc 46.094 (46.709)	Top-5 acc 72.266 (70.474)	lr 0.02249
Train [25][1990/3239]	Time 0.611 (0.904)	Data Time 0.001 (0.013)	Loss 3.0810 (3.2350)	Entropy 0.86307 (0.87635)	Top-1 acc 50.391 (46.713)	Top-5 acc 72.266 (70.474)	lr 0.02249
Train [25][2000/3239]	Time 0.722 (0.904)	Data Time 0.002 (0.013)	Loss 3.0860 (3.2350)	Entropy 0.86307 (0.87628)	Top-1 acc 50.781 (46.710)	Top-5 acc 72.656 (70.471)	lr 0.02249
Train [25][2010/3239]	Time 0.536 (0.904)	Data Time 0.001 (0.013)	Loss 3.2021 (3.2352)	Entropy 0.86294 (0.87621)	Top-1 acc 46.875 (46.709)	Top-5 acc 69.531 (70.463)	lr 0.02249
Train [25][2020/3239]	Time 0.602 (0.903)	Data Time 0.001 (0.013)	Loss 3.3298 (3.2356)	Entropy 0.86323 (0.87615)	Top-1 acc 41.797 (46.703)	Top-5 acc 67.188 (70.461)	lr 0.02249
Train [25][2030/3239]	Time 0.595 (0.903)	Data Time 0.001 (0.013)	Loss 3.0979 (3.2357)	Entropy 0.86312 (0.87609)	Top-1 acc 50.391 (46.702)	Top-5 acc 69.141 (70.461)	lr 0.02249
Train [25][2040/3239]	Time 0.625 (0.903)	Data Time 0.001 (0.013)	Loss 3.0659 (3.2356)	Entropy 0.86327 (0.87602)	Top-1 acc 46.484 (46.697)	Top-5 acc 76.172 (70.460)	lr 0.02249
Train [25][2050/3239]	Time 0.582 (0.903)	Data Time 0.001 (0.013)	Loss 3.2387 (3.2351)	Entropy 0.86321 (0.87596)	Top-1 acc 50.000 (46.709)	Top-5 acc 71.094 (70.468)	lr 0.02249
Train [25][2060/3239]	Time 0.628 (0.902)	Data Time 0.001 (0.013)	Loss 3.1583 (3.2352)	Entropy 0.86290 (0.87590)	Top-1 acc 48.047 (46.707)	Top-5 acc 72.266 (70.467)	lr 0.02249
Train [25][2070/3239]	Time 0.596 (0.902)	Data Time 0.001 (0.013)	Loss 3.2500 (3.2351)	Entropy 0.86287 (0.87584)	Top-1 acc 48.047 (46.712)	Top-5 acc 70.312 (70.470)	lr 0.02249
Train [25][2080/3239]	Time 0.632 (0.902)	Data Time 0.001 (0.013)	Loss 3.4291 (3.2350)	Entropy 0.86269 (0.87577)	Top-1 acc 39.062 (46.711)	Top-5 acc 67.969 (70.471)	lr 0.02249
Train [25][2090/3239]	Time 0.620 (0.902)	Data Time 0.001 (0.013)	Loss 3.0031 (3.2350)	Entropy 0.86262 (0.87571)	Top-1 acc 50.391 (46.712)	Top-5 acc 75.391 (70.472)	lr 0.02249
Train [25][2100/3239]	Time 0.609 (0.902)	Data Time 0.001 (0.013)	Loss 3.3015 (3.2354)	Entropy 0.86277 (0.87565)	Top-1 acc 47.266 (46.705)	Top-5 acc 71.094 (70.465)	lr 0.02249
Train [25][2110/3239]	Time 0.641 (0.902)	Data Time 0.001 (0.013)	Loss 3.4275 (3.2354)	Entropy 0.86308 (0.87559)	Top-1 acc 42.969 (46.701)	Top-5 acc 66.406 (70.465)	lr 0.02249
Train [25][2120/3239]	Time 0.747 (0.912)	Data Time 0.004 (0.013)	Loss 3.0943 (3.2352)	Entropy 0.86283 (0.87553)	Top-1 acc 51.953 (46.711)	Top-5 acc 74.609 (70.468)	lr 0.02249
Train [25][2130/3239]	Time 0.646 (0.912)	Data Time 0.002 (0.012)	Loss 2.9604 (3.2346)	Entropy 0.86295 (0.87547)	Top-1 acc 51.953 (46.730)	Top-5 acc 76.172 (70.482)	lr 0.02248
Train [25][2140/3239]	Time 0.604 (0.912)	Data Time 0.002 (0.012)	Loss 3.3956 (3.2346)	Entropy 0.86277 (0.87541)	Top-1 acc 41.797 (46.724)	Top-5 acc 67.578 (70.481)	lr 0.02248
Train [25][2150/3239]	Time 0.463 (0.911)	Data Time 0.001 (0.012)	Loss 3.2908 (3.2348)	Entropy 0.86228 (0.87535)	Top-1 acc 50.000 (46.726)	Top-5 acc 67.188 (70.478)	lr 0.02248
Train [25][2160/3239]	Time 0.568 (0.910)	Data Time 0.001 (0.012)	Loss 3.3755 (3.2350)	Entropy 0.86289 (0.87529)	Top-1 acc 43.359 (46.719)	Top-5 acc 71.875 (70.473)	lr 0.02248
Train [25][2170/3239]	Time 0.607 (0.910)	Data Time 0.001 (0.012)	Loss 3.3391 (3.2352)	Entropy 0.86292 (0.87523)	Top-1 acc 44.922 (46.709)	Top-5 acc 67.188 (70.468)	lr 0.02248
Train [25][2180/3239]	Time 0.581 (0.909)	Data Time 0.001 (0.012)	Loss 3.3986 (3.2356)	Entropy 0.86299 (0.87518)	Top-1 acc 42.188 (46.701)	Top-5 acc 66.797 (70.461)	lr 0.02248
Train [25][2190/3239]	Time 0.629 (0.909)	Data Time 0.001 (0.012)	Loss 3.1002 (3.2356)	Entropy 0.86337 (0.87512)	Top-1 acc 48.047 (46.700)	Top-5 acc 70.703 (70.460)	lr 0.02248
Train [25][2200/3239]	Time 0.631 (0.909)	Data Time 0.001 (0.012)	Loss 3.2285 (3.2358)	Entropy 0.86345 (0.87507)	Top-1 acc 47.656 (46.696)	Top-5 acc 70.312 (70.453)	lr 0.02248
Train [25][2210/3239]	Time 0.593 (0.909)	Data Time 0.001 (0.012)	Loss 3.3450 (3.2361)	Entropy 0.86344 (0.87502)	Top-1 acc 42.188 (46.691)	Top-5 acc 68.359 (70.446)	lr 0.02248
Train [25][2220/3239]	Time 0.592 (0.909)	Data Time 0.001 (0.012)	Loss 3.1300 (3.2360)	Entropy 0.86335 (0.87496)	Top-1 acc 47.266 (46.691)	Top-5 acc 72.266 (70.451)	lr 0.02248
Train [25][2230/3239]	Time 0.585 (0.908)	Data Time 0.001 (0.012)	Loss 3.4204 (3.2360)	Entropy 0.86366 (0.87491)	Top-1 acc 42.969 (46.688)	Top-5 acc 68.750 (70.450)	lr 0.02248
Train [25][2240/3239]	Time 0.575 (0.908)	Data Time 0.001 (0.012)	Loss 3.3806 (3.2359)	Entropy 0.86376 (0.87486)	Top-1 acc 44.141 (46.697)	Top-5 acc 69.141 (70.451)	lr 0.02248
Train [25][2250/3239]	Time 0.602 (0.908)	Data Time 0.001 (0.012)	Loss 3.2117 (3.2358)	Entropy 0.86387 (0.87481)	Top-1 acc 48.047 (46.704)	Top-5 acc 70.312 (70.453)	lr 0.02248
Train [25][2260/3239]	Time 0.604 (0.908)	Data Time 0.001 (0.012)	Loss 3.3103 (3.2359)	Entropy 0.86385 (0.87476)	Top-1 acc 44.141 (46.699)	Top-5 acc 69.922 (70.453)	lr 0.02248
Train [25][2270/3239]	Time 0.635 (0.908)	Data Time 0.001 (0.012)	Loss 2.9071 (3.2360)	Entropy 0.86404 (0.87472)	Top-1 acc 55.469 (46.701)	Top-5 acc 77.344 (70.451)	lr 0.02248
Train [25][2280/3239]	Time 0.581 (0.907)	Data Time 0.001 (0.012)	Loss 3.2214 (3.2359)	Entropy 0.86395 (0.87467)	Top-1 acc 51.172 (46.702)	Top-5 acc 69.141 (70.453)	lr 0.02248
Train [25][2290/3239]	Time 0.600 (0.907)	Data Time 0.001 (0.012)	Loss 3.1235 (3.2361)	Entropy 0.86402 (0.87462)	Top-1 acc 49.219 (46.694)	Top-5 acc 72.656 (70.446)	lr 0.02248
Train [25][2300/3239]	Time 0.605 (0.907)	Data Time 0.001 (0.012)	Loss 3.0220 (3.2361)	Entropy 0.86344 (0.87458)	Top-1 acc 48.438 (46.690)	Top-5 acc 73.047 (70.445)	lr 0.02247
Train [25][2310/3239]	Time 0.638 (0.907)	Data Time 0.001 (0.012)	Loss 3.1506 (3.2360)	Entropy 0.86335 (0.87453)	Top-1 acc 42.969 (46.689)	Top-5 acc 74.219 (70.448)	lr 0.02247
Train [25][2320/3239]	Time 0.675 (0.906)	Data Time 0.001 (0.012)	Loss 3.2064 (3.2361)	Entropy 0.86340 (0.87448)	Top-1 acc 48.438 (46.687)	Top-5 acc 71.484 (70.443)	lr 0.02247
Train [25][2330/3239]	Time 0.630 (0.906)	Data Time 0.001 (0.012)	Loss 3.3220 (3.2363)	Entropy 0.86362 (0.87443)	Top-1 acc 44.922 (46.681)	Top-5 acc 67.578 (70.438)	lr 0.02247
Train [25][2340/3239]	Time 0.591 (0.906)	Data Time 0.001 (0.012)	Loss 3.1248 (3.2360)	Entropy 0.86363 (0.87439)	Top-1 acc 49.609 (46.687)	Top-5 acc 73.047 (70.442)	lr 0.02247
Train [25][2350/3239]	Time 0.584 (0.906)	Data Time 0.001 (0.011)	Loss 3.1251 (3.2358)	Entropy 0.86389 (0.87434)	Top-1 acc 48.438 (46.689)	Top-5 acc 72.656 (70.445)	lr 0.02247
Train [25][2360/3239]	Time 0.609 (0.905)	Data Time 0.001 (0.011)	Loss 3.0672 (3.2358)	Entropy 0.86385 (0.87430)	Top-1 acc 48.828 (46.687)	Top-5 acc 72.266 (70.446)	lr 0.02247
Train [25][2370/3239]	Time 0.609 (0.905)	Data Time 0.001 (0.011)	Loss 3.2444 (3.2356)	Entropy 0.86370 (0.87425)	Top-1 acc 46.484 (46.691)	Top-5 acc 70.312 (70.448)	lr 0.02247
Train [25][2380/3239]	Time 0.639 (0.905)	Data Time 0.001 (0.011)	Loss 3.1286 (3.2356)	Entropy 0.86352 (0.87421)	Top-1 acc 49.609 (46.693)	Top-5 acc 69.922 (70.445)	lr 0.02247
Train [25][2390/3239]	Time 0.699 (0.905)	Data Time 0.002 (0.011)	Loss 3.4352 (3.2355)	Entropy 0.86358 (0.87416)	Top-1 acc 42.188 (46.697)	Top-5 acc 64.453 (70.446)	lr 0.02247
Train [25][2400/3239]	Time 0.628 (0.905)	Data Time 0.001 (0.011)	Loss 3.2740 (3.2355)	Entropy 0.86358 (0.87412)	Top-1 acc 42.969 (46.703)	Top-5 acc 68.750 (70.448)	lr 0.02247
Train [25][2410/3239]	Time 0.563 (0.905)	Data Time 0.001 (0.011)	Loss 3.3161 (3.2351)	Entropy 0.86360 (0.87408)	Top-1 acc 47.266 (46.712)	Top-5 acc 66.016 (70.456)	lr 0.02247
Train [25][2420/3239]	Time 0.601 (0.904)	Data Time 0.001 (0.011)	Loss 3.1033 (3.2353)	Entropy 0.86362 (0.87403)	Top-1 acc 47.656 (46.708)	Top-5 acc 75.391 (70.456)	lr 0.02247
Train [25][2430/3239]	Time 0.597 (0.904)	Data Time 0.001 (0.011)	Loss 3.1780 (3.2352)	Entropy 0.86336 (0.87399)	Top-1 acc 48.047 (46.710)	Top-5 acc 73.047 (70.458)	lr 0.02247
Train [25][2440/3239]	Time 0.621 (0.904)	Data Time 0.001 (0.011)	Loss 3.2159 (3.2349)	Entropy 0.86297 (0.87394)	Top-1 acc 46.484 (46.718)	Top-5 acc 73.047 (70.465)	lr 0.02247
Train [25][2450/3239]	Time 0.623 (0.904)	Data Time 0.001 (0.011)	Loss 2.9828 (3.2348)	Entropy 0.86286 (0.87390)	Top-1 acc 50.391 (46.719)	Top-5 acc 73.828 (70.468)	lr 0.02247
Train [25][2460/3239]	Time 0.626 (0.904)	Data Time 0.001 (0.011)	Loss 3.2591 (3.2347)	Entropy 0.86252 (0.87385)	Top-1 acc 47.266 (46.720)	Top-5 acc 70.703 (70.471)	lr 0.02246
Train [25][2470/3239]	Time 0.582 (0.904)	Data Time 0.001 (0.011)	Loss 3.0520 (3.2347)	Entropy 0.86278 (0.87381)	Top-1 acc 50.391 (46.721)	Top-5 acc 73.438 (70.470)	lr 0.02246
Train [25][2480/3239]	Time 0.566 (0.903)	Data Time 0.001 (0.011)	Loss 3.4358 (3.2347)	Entropy 0.86239 (0.87376)	Top-1 acc 45.703 (46.724)	Top-5 acc 66.406 (70.473)	lr 0.02246
Train [25][2490/3239]	Time 0.637 (0.903)	Data Time 0.002 (0.011)	Loss 3.1889 (3.2344)	Entropy 0.86224 (0.87372)	Top-1 acc 45.703 (46.725)	Top-5 acc 73.828 (70.478)	lr 0.02246
Train [25][2500/3239]	Time 0.617 (0.903)	Data Time 0.001 (0.011)	Loss 3.4637 (3.2343)	Entropy 0.86228 (0.87367)	Top-1 acc 41.797 (46.725)	Top-5 acc 64.844 (70.479)	lr 0.02246
Train [25][2510/3239]	Time 0.618 (0.903)	Data Time 0.001 (0.011)	Loss 3.2500 (3.2345)	Entropy 0.86218 (0.87363)	Top-1 acc 42.578 (46.723)	Top-5 acc 67.969 (70.472)	lr 0.02246
Train [25][2520/3239]	Time 0.620 (0.902)	Data Time 0.001 (0.011)	Loss 3.4517 (3.2345)	Entropy 0.86204 (0.87358)	Top-1 acc 47.266 (46.724)	Top-5 acc 65.625 (70.471)	lr 0.02246
Train [25][2530/3239]	Time 0.625 (0.902)	Data Time 0.001 (0.011)	Loss 3.0891 (3.2345)	Entropy 0.86184 (0.87354)	Top-1 acc 48.047 (46.724)	Top-5 acc 73.047 (70.476)	lr 0.02246
Train [25][2540/3239]	Time 0.623 (0.902)	Data Time 0.001 (0.011)	Loss 3.1742 (3.2345)	Entropy 0.86215 (0.87349)	Top-1 acc 44.922 (46.722)	Top-5 acc 73.047 (70.472)	lr 0.02246
Train [25][2550/3239]	Time 0.687 (0.902)	Data Time 0.001 (0.011)	Loss 3.3035 (3.2342)	Entropy 0.86232 (0.87345)	Top-1 acc 42.188 (46.725)	Top-5 acc 72.656 (70.478)	lr 0.02246
Train [25][2560/3239]	Time 0.624 (0.902)	Data Time 0.001 (0.011)	Loss 3.2771 (3.2345)	Entropy 0.86237 (0.87340)	Top-1 acc 45.312 (46.719)	Top-5 acc 69.141 (70.471)	lr 0.02246
Train [25][2570/3239]	Time 0.610 (0.902)	Data Time 0.001 (0.011)	Loss 3.2661 (3.2346)	Entropy 0.86213 (0.87336)	Top-1 acc 43.750 (46.715)	Top-5 acc 69.531 (70.466)	lr 0.02246
Train [25][2580/3239]	Time 0.578 (0.902)	Data Time 0.001 (0.011)	Loss 3.1305 (3.2346)	Entropy 0.86183 (0.87332)	Top-1 acc 50.391 (46.718)	Top-5 acc 71.484 (70.465)	lr 0.02246
Train [25][2590/3239]	Time 0.653 (0.901)	Data Time 0.001 (0.011)	Loss 3.2038 (3.2345)	Entropy 0.86205 (0.87327)	Top-1 acc 50.000 (46.718)	Top-5 acc 71.094 (70.464)	lr 0.02246
Train [25][2600/3239]	Time 0.623 (0.901)	Data Time 0.001 (0.011)	Loss 3.2041 (3.2345)	Entropy 0.86225 (0.87323)	Top-1 acc 45.312 (46.716)	Top-5 acc 71.875 (70.469)	lr 0.02246
Train [25][2610/3239]	Time 0.610 (0.901)	Data Time 0.001 (0.011)	Loss 3.0957 (3.2343)	Entropy 0.86227 (0.87319)	Top-1 acc 50.000 (46.724)	Top-5 acc 73.438 (70.474)	lr 0.02246
Train [25][2620/3239]	Time 0.611 (0.901)	Data Time 0.001 (0.010)	Loss 3.0922 (3.2346)	Entropy 0.86206 (0.87315)	Top-1 acc 50.000 (46.719)	Top-5 acc 73.047 (70.468)	lr 0.02245
Train [25][2630/3239]	Time 0.618 (0.901)	Data Time 0.001 (0.010)	Loss 3.1048 (3.2344)	Entropy 0.86244 (0.87310)	Top-1 acc 51.172 (46.724)	Top-5 acc 73.828 (70.472)	lr 0.02245
Train [25][2640/3239]	Time 0.573 (0.901)	Data Time 0.001 (0.010)	Loss 3.2372 (3.2345)	Entropy 0.86211 (0.87306)	Top-1 acc 51.172 (46.722)	Top-5 acc 69.141 (70.467)	lr 0.02245
Train [25][2650/3239]	Time 0.589 (0.901)	Data Time 0.001 (0.010)	Loss 3.4158 (3.2344)	Entropy 0.86228 (0.87302)	Top-1 acc 42.969 (46.724)	Top-5 acc 66.406 (70.468)	lr 0.02245
Train [25][2660/3239]	Time 0.578 (0.900)	Data Time 0.001 (0.010)	Loss 3.4334 (3.2346)	Entropy 0.86210 (0.87298)	Top-1 acc 45.703 (46.722)	Top-5 acc 66.406 (70.464)	lr 0.02245
Train [25][2670/3239]	Time 0.594 (0.900)	Data Time 0.001 (0.010)	Loss 3.2616 (3.2347)	Entropy 0.86204 (0.87294)	Top-1 acc 43.750 (46.717)	Top-5 acc 68.750 (70.461)	lr 0.02245
Train [25][2680/3239]	Time 0.506 (0.900)	Data Time 0.002 (0.010)	Loss 3.0496 (3.2346)	Entropy 0.86214 (0.87290)	Top-1 acc 50.781 (46.716)	Top-5 acc 72.656 (70.463)	lr 0.02245
Train [25][2690/3239]	Time 0.625 (0.900)	Data Time 0.001 (0.010)	Loss 3.3653 (3.2345)	Entropy 0.86193 (0.87286)	Top-1 acc 46.094 (46.717)	Top-5 acc 66.406 (70.463)	lr 0.02245
Train [25][2700/3239]	Time 0.614 (0.900)	Data Time 0.001 (0.010)	Loss 3.1794 (3.2346)	Entropy 0.86198 (0.87282)	Top-1 acc 46.875 (46.715)	Top-5 acc 69.531 (70.460)	lr 0.02245
Train [25][2710/3239]	Time 0.687 (0.899)	Data Time 0.001 (0.010)	Loss 3.1726 (3.2345)	Entropy 0.86193 (0.87278)	Top-1 acc 48.828 (46.713)	Top-5 acc 71.875 (70.462)	lr 0.02245
Train [25][2720/3239]	Time 0.604 (0.899)	Data Time 0.001 (0.010)	Loss 3.2383 (3.2344)	Entropy 0.86191 (0.87274)	Top-1 acc 48.438 (46.716)	Top-5 acc 69.141 (70.464)	lr 0.02245
Train [25][2730/3239]	Time 0.605 (0.899)	Data Time 0.002 (0.010)	Loss 3.0587 (3.2346)	Entropy 0.86202 (0.87270)	Top-1 acc 50.000 (46.713)	Top-5 acc 75.391 (70.460)	lr 0.02245
Train [25][2740/3239]	Time 0.572 (0.899)	Data Time 0.001 (0.010)	Loss 3.1959 (3.2347)	Entropy 0.86193 (0.87266)	Top-1 acc 48.047 (46.712)	Top-5 acc 71.094 (70.458)	lr 0.02245
Train [25][2750/3239]	Time 0.613 (0.899)	Data Time 0.001 (0.010)	Loss 3.1814 (3.2342)	Entropy 0.86169 (0.87262)	Top-1 acc 44.141 (46.717)	Top-5 acc 70.703 (70.467)	lr 0.02245
Train [25][2760/3239]	Time 0.621 (0.899)	Data Time 0.001 (0.010)	Loss 3.3723 (3.2344)	Entropy 0.86136 (0.87258)	Top-1 acc 45.703 (46.716)	Top-5 acc 69.922 (70.464)	lr 0.02245
Train [25][2770/3239]	Time 0.602 (0.899)	Data Time 0.001 (0.010)	Loss 3.3320 (3.2347)	Entropy 0.86145 (0.87254)	Top-1 acc 47.656 (46.712)	Top-5 acc 67.969 (70.460)	lr 0.02245
Train [25][2780/3239]	Time 0.577 (0.907)	Data Time 0.005 (0.010)	Loss 3.3975 (3.2347)	Entropy 0.86165 (0.87250)	Top-1 acc 44.531 (46.710)	Top-5 acc 66.797 (70.457)	lr 0.02245
Train [25][2790/3239]	Time 0.644 (0.907)	Data Time 0.003 (0.010)	Loss 3.1233 (3.2349)	Entropy 0.86191 (0.87246)	Top-1 acc 50.000 (46.708)	Top-5 acc 71.484 (70.456)	lr 0.02244
Train [25][2800/3239]	Time 0.685 (0.907)	Data Time 0.001 (0.010)	Loss 3.4883 (3.2349)	Entropy 0.86228 (0.87243)	Top-1 acc 41.406 (46.708)	Top-5 acc 62.891 (70.456)	lr 0.02244
Train [25][2810/3239]	Time 0.615 (0.907)	Data Time 0.001 (0.010)	Loss 3.3862 (3.2351)	Entropy 0.86224 (0.87239)	Top-1 acc 40.625 (46.701)	Top-5 acc 68.750 (70.455)	lr 0.02244
Train [25][2820/3239]	Time 0.601 (0.906)	Data Time 0.002 (0.010)	Loss 3.0915 (3.2351)	Entropy 0.86232 (0.87235)	Top-1 acc 52.344 (46.705)	Top-5 acc 71.094 (70.454)	lr 0.02244
Train [25][2830/3239]	Time 0.617 (0.906)	Data Time 0.003 (0.010)	Loss 3.4031 (3.2351)	Entropy 0.86214 (0.87232)	Top-1 acc 43.750 (46.706)	Top-5 acc 67.188 (70.454)	lr 0.02244
Train [25][2840/3239]	Time 0.593 (0.906)	Data Time 0.001 (0.010)	Loss 3.1090 (3.2352)	Entropy 0.86216 (0.87228)	Top-1 acc 47.266 (46.704)	Top-5 acc 73.438 (70.451)	lr 0.02244
Train [25][2850/3239]	Time 0.592 (0.906)	Data Time 0.001 (0.010)	Loss 3.2625 (3.2351)	Entropy 0.86211 (0.87225)	Top-1 acc 45.703 (46.705)	Top-5 acc 69.531 (70.451)	lr 0.02244
Train [25][2860/3239]	Time 0.645 (0.906)	Data Time 0.001 (0.010)	Loss 3.2437 (3.2350)	Entropy 0.86244 (0.87221)	Top-1 acc 47.656 (46.706)	Top-5 acc 69.922 (70.455)	lr 0.02244
Train [25][2870/3239]	Time 0.709 (0.906)	Data Time 0.001 (0.010)	Loss 3.1753 (3.2350)	Entropy 0.86223 (0.87218)	Top-1 acc 48.438 (46.709)	Top-5 acc 70.312 (70.453)	lr 0.02244
Train [25][2880/3239]	Time 0.605 (0.906)	Data Time 0.001 (0.010)	Loss 3.0861 (3.2350)	Entropy 0.86230 (0.87214)	Top-1 acc 52.734 (46.708)	Top-5 acc 73.438 (70.455)	lr 0.02244
Train [25][2890/3239]	Time 0.624 (0.905)	Data Time 0.002 (0.010)	Loss 3.2782 (3.2350)	Entropy 0.86210 (0.87211)	Top-1 acc 46.484 (46.712)	Top-5 acc 68.750 (70.458)	lr 0.02244
Train [25][2900/3239]	Time 0.584 (0.905)	Data Time 0.001 (0.010)	Loss 3.2177 (3.2349)	Entropy 0.86202 (0.87207)	Top-1 acc 46.875 (46.713)	Top-5 acc 73.047 (70.459)	lr 0.02244
Train [25][2910/3239]	Time 0.600 (0.905)	Data Time 0.001 (0.010)	Loss 3.3504 (3.2349)	Entropy 0.86203 (0.87204)	Top-1 acc 43.359 (46.716)	Top-5 acc 67.969 (70.458)	lr 0.02244
Train [25][2920/3239]	Time 0.554 (0.905)	Data Time 0.001 (0.010)	Loss 3.2508 (3.2350)	Entropy 0.86200 (0.87201)	Top-1 acc 43.359 (46.713)	Top-5 acc 69.141 (70.457)	lr 0.02244
Train [25][2930/3239]	Time 0.620 (0.905)	Data Time 0.001 (0.010)	Loss 3.3968 (3.2350)	Entropy 0.86210 (0.87197)	Top-1 acc 42.578 (46.711)	Top-5 acc 69.922 (70.462)	lr 0.02244
Train [25][2940/3239]	Time 0.600 (0.905)	Data Time 0.001 (0.010)	Loss 3.3707 (3.2349)	Entropy 0.86173 (0.87194)	Top-1 acc 46.094 (46.714)	Top-5 acc 66.797 (70.465)	lr 0.02244
Train [25][2950/3239]	Time 0.631 (0.905)	Data Time 0.001 (0.010)	Loss 3.1333 (3.2349)	Entropy 0.86161 (0.87190)	Top-1 acc 47.266 (46.711)	Top-5 acc 74.219 (70.464)	lr 0.02243
Train [25][2960/3239]	Time 0.443 (0.904)	Data Time 0.001 (0.010)	Loss 3.4137 (3.2351)	Entropy 0.86182 (0.87187)	Top-1 acc 43.359 (46.707)	Top-5 acc 64.844 (70.459)	lr 0.02243
Train [25][2970/3239]	Time 0.583 (0.904)	Data Time 0.001 (0.009)	Loss 3.3897 (3.2350)	Entropy 0.86157 (0.87183)	Top-1 acc 47.266 (46.710)	Top-5 acc 68.359 (70.464)	lr 0.02243
Train [25][2980/3239]	Time 0.595 (0.904)	Data Time 0.001 (0.009)	Loss 3.1007 (3.2349)	Entropy 0.86171 (0.87180)	Top-1 acc 48.438 (46.711)	Top-5 acc 75.000 (70.469)	lr 0.02243
Train [25][2990/3239]	Time 0.633 (0.904)	Data Time 0.001 (0.009)	Loss 3.0653 (3.2346)	Entropy 0.86205 (0.87177)	Top-1 acc 51.562 (46.719)	Top-5 acc 74.219 (70.476)	lr 0.02243
Train [25][3000/3239]	Time 0.616 (0.904)	Data Time 0.001 (0.009)	Loss 3.1472 (3.2345)	Entropy 0.86189 (0.87173)	Top-1 acc 50.781 (46.718)	Top-5 acc 70.703 (70.471)	lr 0.02243
Train [25][3010/3239]	Time 0.599 (0.904)	Data Time 0.001 (0.009)	Loss 3.1875 (3.2344)	Entropy 0.86189 (0.87170)	Top-1 acc 41.797 (46.720)	Top-5 acc 71.875 (70.475)	lr 0.02243
Train [25][3020/3239]	Time 0.641 (0.903)	Data Time 0.001 (0.009)	Loss 3.0649 (3.2341)	Entropy 0.86201 (0.87167)	Top-1 acc 51.172 (46.721)	Top-5 acc 75.781 (70.483)	lr 0.02243
Train [25][3030/3239]	Time 0.714 (0.903)	Data Time 0.001 (0.009)	Loss 3.4045 (3.2339)	Entropy 0.86155 (0.87164)	Top-1 acc 45.312 (46.730)	Top-5 acc 68.359 (70.488)	lr 0.02243
Train [25][3040/3239]	Time 0.621 (0.903)	Data Time 0.001 (0.009)	Loss 3.3390 (3.2341)	Entropy 0.86130 (0.87160)	Top-1 acc 45.703 (46.724)	Top-5 acc 71.094 (70.487)	lr 0.02243
Train [25][3050/3239]	Time 0.606 (0.903)	Data Time 0.001 (0.009)	Loss 3.0722 (3.2340)	Entropy 0.86115 (0.87157)	Top-1 acc 46.875 (46.723)	Top-5 acc 71.875 (70.488)	lr 0.02243
Train [25][3060/3239]	Time 0.608 (0.903)	Data Time 0.001 (0.009)	Loss 3.3457 (3.2341)	Entropy 0.86089 (0.87154)	Top-1 acc 40.234 (46.717)	Top-5 acc 67.188 (70.485)	lr 0.02243
Train [25][3070/3239]	Time 0.611 (0.903)	Data Time 0.001 (0.009)	Loss 3.0908 (3.2337)	Entropy 0.86096 (0.87150)	Top-1 acc 50.781 (46.728)	Top-5 acc 72.266 (70.492)	lr 0.02243
Train [25][3080/3239]	Time 0.587 (0.903)	Data Time 0.001 (0.009)	Loss 3.0956 (3.2337)	Entropy 0.86072 (0.87147)	Top-1 acc 48.047 (46.728)	Top-5 acc 72.266 (70.490)	lr 0.02243
Train [25][3090/3239]	Time 0.612 (0.903)	Data Time 0.001 (0.009)	Loss 3.3136 (3.2334)	Entropy 0.86073 (0.87143)	Top-1 acc 46.094 (46.738)	Top-5 acc 69.922 (70.497)	lr 0.02243
Train [25][3100/3239]	Time 0.718 (0.903)	Data Time 0.001 (0.009)	Loss 3.2606 (3.2333)	Entropy 0.86054 (0.87140)	Top-1 acc 50.000 (46.742)	Top-5 acc 70.703 (70.497)	lr 0.02243
Train [25][3110/3239]	Time 0.626 (0.903)	Data Time 0.001 (0.009)	Loss 3.1581 (3.2334)	Entropy 0.86057 (0.87136)	Top-1 acc 46.484 (46.738)	Top-5 acc 71.484 (70.497)	lr 0.02242
Train [25][3120/3239]	Time 0.611 (0.902)	Data Time 0.001 (0.009)	Loss 3.0898 (3.2336)	Entropy 0.86064 (0.87133)	Top-1 acc 51.562 (46.737)	Top-5 acc 74.219 (70.493)	lr 0.02242
Train [25][3130/3239]	Time 0.496 (0.902)	Data Time 0.001 (0.009)	Loss 3.3167 (3.2337)	Entropy 0.86063 (0.87129)	Top-1 acc 49.219 (46.738)	Top-5 acc 71.484 (70.492)	lr 0.02242
Train [25][3140/3239]	Time 0.633 (0.902)	Data Time 0.001 (0.009)	Loss 3.1125 (3.2334)	Entropy 0.86041 (0.87126)	Top-1 acc 49.219 (46.742)	Top-5 acc 71.484 (70.498)	lr 0.02242
Train [25][3150/3239]	Time 0.598 (0.902)	Data Time 0.001 (0.009)	Loss 3.3709 (3.2332)	Entropy 0.86035 (0.87122)	Top-1 acc 39.844 (46.746)	Top-5 acc 68.359 (70.505)	lr 0.02242
Train [25][3160/3239]	Time 0.610 (0.902)	Data Time 0.001 (0.009)	Loss 3.1158 (3.2331)	Entropy 0.85997 (0.87119)	Top-1 acc 47.656 (46.749)	Top-5 acc 75.781 (70.507)	lr 0.02242
Train [25][3170/3239]	Time 0.612 (0.902)	Data Time 0.001 (0.009)	Loss 3.2929 (3.2330)	Entropy 0.85994 (0.87115)	Top-1 acc 46.875 (46.753)	Top-5 acc 66.797 (70.511)	lr 0.02242
Train [25][3180/3239]	Time 0.613 (0.902)	Data Time 0.000 (0.009)	Loss 3.2540 (3.2331)	Entropy 0.85964 (0.87112)	Top-1 acc 51.953 (46.755)	Top-5 acc 71.875 (70.508)	lr 0.02242
Train [25][3190/3239]	Time 0.707 (0.901)	Data Time 0.000 (0.009)	Loss 3.1425 (3.2330)	Entropy 0.85954 (0.87108)	Top-1 acc 47.656 (46.759)	Top-5 acc 72.266 (70.510)	lr 0.02242
Train [25][3200/3239]	Time 0.596 (0.901)	Data Time 0.000 (0.009)	Loss 3.1728 (3.2329)	Entropy 0.85948 (0.87105)	Top-1 acc 48.047 (46.759)	Top-5 acc 73.438 (70.509)	lr 0.02242
Train [25][3210/3239]	Time 0.602 (0.901)	Data Time 0.000 (0.009)	Loss 3.2219 (3.2330)	Entropy 0.85943 (0.87101)	Top-1 acc 48.828 (46.758)	Top-5 acc 70.703 (70.507)	lr 0.02242
Train [25][3220/3239]	Time 0.605 (0.901)	Data Time 0.000 (0.009)	Loss 3.3184 (3.2329)	Entropy 0.85935 (0.87097)	Top-1 acc 45.312 (46.761)	Top-5 acc 67.969 (70.508)	lr 0.02242
Train [25][3230/3239]	Time 0.623 (0.901)	Data Time 0.000 (0.009)	Loss 3.0846 (3.2326)	Entropy 0.85921 (0.87094)	Top-1 acc 48.047 (46.768)	Top-5 acc 74.609 (70.510)	lr 0.02242
Train [25][3239/3239]	Time 1.578 (0.901)	Data Time 0.000 (0.009)	Loss 3.5813 (3.2326)	Entropy 0.85937 (0.87091)	Top-1 acc 38.272 (46.770)	Top-5 acc 65.432 (70.510)	lr 0.02242
==========Valid [25/120]	loss 1.945	top-1 acc 56.680 (56.680)	top-5 acc 79.605	Train top-1 46.770	top-5 70.510	Entropy 0.85937	Latency-None: 0.000ms	Flops: 539.76M
Train [26][0/3239]	Time 25.425 (25.425)	Data Time 24.492 (24.492)	Loss 3.1826 (3.1826)	Entropy 0.85925 (0.85925)	Top-1 acc 47.266 (47.266)	Top-5 acc 72.656 (72.656)	lr 0.02242
Train [26][10/3239]	Time 0.585 (3.129)	Data Time 0.001 (2.231)	Loss 3.4935 (3.2332)	Entropy 0.85926 (0.85918)	Top-1 acc 44.922 (45.739)	Top-5 acc 64.062 (71.165)	lr 0.02242
Train [26][20/3239]	Time 0.609 (2.050)	Data Time 0.001 (1.169)	Loss 3.3209 (3.2213)	Entropy 0.85911 (0.85916)	Top-1 acc 44.531 (46.726)	Top-5 acc 68.359 (71.243)	lr 0.02242
Train [26][30/3239]	Time 0.627 (1.667)	Data Time 0.001 (0.793)	Loss 3.1130 (3.2240)	Entropy 0.85860 (0.85909)	Top-1 acc 51.953 (46.825)	Top-5 acc 72.266 (71.132)	lr 0.02242
Train [26][40/3239]	Time 0.578 (1.472)	Data Time 0.001 (0.600)	Loss 3.1100 (3.2210)	Entropy 0.85860 (0.85898)	Top-1 acc 48.438 (46.713)	Top-5 acc 72.656 (71.018)	lr 0.02241
Train [26][50/3239]	Time 0.619 (1.353)	Data Time 0.001 (0.483)	Loss 3.1318 (3.2338)	Entropy 0.85852 (0.85890)	Top-1 acc 48.828 (46.438)	Top-5 acc 74.609 (70.818)	lr 0.02241
Train [26][60/3239]	Time 0.660 (1.272)	Data Time 0.035 (0.404)	Loss 3.1782 (3.2424)	Entropy 0.85820 (0.85879)	Top-1 acc 49.609 (46.311)	Top-5 acc 70.312 (70.569)	lr 0.02241
Train [26][70/3239]	Time 0.492 (1.215)	Data Time 0.001 (0.348)	Loss 3.3171 (3.2337)	Entropy 0.85830 (0.85871)	Top-1 acc 46.484 (46.644)	Top-5 acc 69.922 (70.764)	lr 0.02241
Train [26][80/3239]	Time 0.570 (1.170)	Data Time 0.001 (0.305)	Loss 3.3501 (3.2310)	Entropy 0.85832 (0.85866)	Top-1 acc 46.094 (46.706)	Top-5 acc 67.969 (70.761)	lr 0.02241
Train [26][90/3239]	Time 0.659 (1.134)	Data Time 0.001 (0.272)	Loss 3.1969 (3.2273)	Entropy 0.85840 (0.85863)	Top-1 acc 50.391 (46.781)	Top-5 acc 73.047 (70.845)	lr 0.02241
Train [26][100/3239]	Time 0.626 (1.103)	Data Time 0.001 (0.245)	Loss 3.3671 (3.2241)	Entropy 0.85846 (0.85862)	Top-1 acc 42.578 (46.805)	Top-5 acc 66.016 (70.831)	lr 0.02241
Train [26][110/3239]	Time 0.611 (1.081)	Data Time 0.001 (0.223)	Loss 3.1481 (3.2233)	Entropy 0.85824 (0.85860)	Top-1 acc 47.266 (46.773)	Top-5 acc 72.656 (70.854)	lr 0.02241
Train [26][120/3239]	Time 0.577 (1.063)	Data Time 0.001 (0.205)	Loss 2.8392 (3.2195)	Entropy 0.85825 (0.85857)	Top-1 acc 54.688 (46.810)	Top-5 acc 80.469 (70.910)	lr 0.02241
Train [26][130/3239]	Time 0.618 (1.048)	Data Time 0.001 (0.189)	Loss 3.1672 (3.2198)	Entropy 0.85821 (0.85855)	Top-1 acc 50.781 (46.869)	Top-5 acc 72.656 (70.900)	lr 0.02241
Train [26][140/3239]	Time 0.583 (1.036)	Data Time 0.001 (0.176)	Loss 3.2563 (3.2227)	Entropy 0.85838 (0.85853)	Top-1 acc 49.609 (46.858)	Top-5 acc 69.531 (70.750)	lr 0.02241
Train [26][150/3239]	Time 0.616 (1.025)	Data Time 0.001 (0.164)	Loss 2.8469 (3.2184)	Entropy 0.85799 (0.85851)	Top-1 acc 52.734 (46.929)	Top-5 acc 75.391 (70.830)	lr 0.02241
Train [26][160/3239]	Time 0.643 (1.014)	Data Time 0.001 (0.154)	Loss 3.1619 (3.2183)	Entropy 0.85761 (0.85846)	Top-1 acc 44.922 (46.911)	Top-5 acc 71.875 (70.810)	lr 0.02241
Train [26][170/3239]	Time 0.646 (1.006)	Data Time 0.001 (0.145)	Loss 3.3085 (3.2176)	Entropy 0.85772 (0.85841)	Top-1 acc 44.531 (46.898)	Top-5 acc 71.484 (70.849)	lr 0.02241
Train [26][180/3239]	Time 0.567 (0.997)	Data Time 0.001 (0.137)	Loss 3.2741 (3.2170)	Entropy 0.85800 (0.85838)	Top-1 acc 45.312 (46.897)	Top-5 acc 68.750 (70.876)	lr 0.02241
Train [26][190/3239]	Time 0.705 (1.118)	Data Time 0.005 (0.130)	Loss 3.2387 (3.2162)	Entropy 0.85797 (0.85835)	Top-1 acc 44.922 (46.826)	Top-5 acc 69.531 (70.904)	lr 0.02241
Train [26][200/3239]	Time 0.610 (1.106)	Data Time 0.002 (0.124)	Loss 3.6166 (3.2185)	Entropy 0.85748 (0.85832)	Top-1 acc 40.234 (46.823)	Top-5 acc 62.109 (70.833)	lr 0.02240
Train [26][210/3239]	Time 0.560 (1.093)	Data Time 0.002 (0.118)	Loss 3.0292 (3.2174)	Entropy 0.85754 (0.85828)	Top-1 acc 49.219 (46.829)	Top-5 acc 73.047 (70.822)	lr 0.02240
Train [26][220/3239]	Time 0.494 (1.081)	Data Time 0.001 (0.113)	Loss 3.0331 (3.2187)	Entropy 0.85755 (0.85825)	Top-1 acc 53.125 (46.857)	Top-5 acc 76.562 (70.779)	lr 0.02240
Train [26][230/3239]	Time 0.590 (1.072)	Data Time 0.002 (0.108)	Loss 3.2958 (3.2170)	Entropy 0.85709 (0.85822)	Top-1 acc 43.359 (46.887)	Top-5 acc 70.703 (70.835)	lr 0.02240
Train [26][240/3239]	Time 0.617 (1.063)	Data Time 0.001 (0.104)	Loss 3.3156 (3.2177)	Entropy 0.85674 (0.85816)	Top-1 acc 46.875 (46.893)	Top-5 acc 69.922 (70.818)	lr 0.02240
Train [26][250/3239]	Time 0.673 (1.055)	Data Time 0.001 (0.100)	Loss 3.0035 (3.2178)	Entropy 0.85702 (0.85811)	Top-1 acc 53.125 (46.869)	Top-5 acc 74.609 (70.809)	lr 0.02240
Train [26][260/3239]	Time 0.605 (1.048)	Data Time 0.001 (0.096)	Loss 3.1180 (3.2165)	Entropy 0.85734 (0.85807)	Top-1 acc 49.219 (46.897)	Top-5 acc 69.531 (70.812)	lr 0.02240
Train [26][270/3239]	Time 0.598 (1.041)	Data Time 0.001 (0.093)	Loss 3.1508 (3.2151)	Entropy 0.85714 (0.85804)	Top-1 acc 46.484 (46.914)	Top-5 acc 75.781 (70.859)	lr 0.02240
Train [26][280/3239]	Time 0.613 (1.035)	Data Time 0.001 (0.089)	Loss 3.3245 (3.2145)	Entropy 0.85756 (0.85801)	Top-1 acc 44.922 (46.942)	Top-5 acc 66.016 (70.844)	lr 0.02240
Train [26][290/3239]	Time 0.608 (1.029)	Data Time 0.001 (0.086)	Loss 3.1443 (3.2134)	Entropy 0.85769 (0.85800)	Top-1 acc 53.125 (46.968)	Top-5 acc 73.047 (70.862)	lr 0.02240
Train [26][300/3239]	Time 0.583 (1.024)	Data Time 0.001 (0.084)	Loss 3.1576 (3.2111)	Entropy 0.85746 (0.85799)	Top-1 acc 45.703 (47.042)	Top-5 acc 72.656 (70.919)	lr 0.02240
Train [26][310/3239]	Time 0.615 (1.018)	Data Time 0.001 (0.081)	Loss 3.2073 (3.2111)	Entropy 0.85752 (0.85797)	Top-1 acc 46.484 (46.991)	Top-5 acc 70.312 (70.908)	lr 0.02240
Train [26][320/3239]	Time 0.708 (1.013)	Data Time 0.001 (0.078)	Loss 3.0219 (3.2087)	Entropy 0.85719 (0.85795)	Top-1 acc 54.297 (47.050)	Top-5 acc 75.000 (70.962)	lr 0.02240
Train [26][330/3239]	Time 0.622 (1.009)	Data Time 0.001 (0.076)	Loss 3.2689 (3.2094)	Entropy 0.85703 (0.85793)	Top-1 acc 47.266 (47.039)	Top-5 acc 70.703 (70.943)	lr 0.02240
Train [26][340/3239]	Time 0.585 (1.004)	Data Time 0.001 (0.074)	Loss 3.2975 (3.2109)	Entropy 0.85698 (0.85790)	Top-1 acc 46.875 (47.004)	Top-5 acc 68.750 (70.915)	lr 0.02240
Train [26][350/3239]	Time 0.559 (1.000)	Data Time 0.001 (0.072)	Loss 3.2719 (3.2107)	Entropy 0.85687 (0.85787)	Top-1 acc 43.750 (47.000)	Top-5 acc 67.578 (70.911)	lr 0.02240
Train [26][360/3239]	Time 0.614 (0.996)	Data Time 0.002 (0.070)	Loss 3.1343 (3.2091)	Entropy 0.85692 (0.85784)	Top-1 acc 46.875 (47.018)	Top-5 acc 74.609 (70.970)	lr 0.02239
Train [26][370/3239]	Time 0.619 (0.993)	Data Time 0.001 (0.068)	Loss 3.2679 (3.2095)	Entropy 0.85668 (0.85782)	Top-1 acc 44.531 (46.992)	Top-5 acc 69.531 (70.938)	lr 0.02239
Train [26][380/3239]	Time 0.615 (0.990)	Data Time 0.001 (0.066)	Loss 2.8930 (3.2077)	Entropy 0.85654 (0.85778)	Top-1 acc 54.297 (47.052)	Top-5 acc 77.734 (70.990)	lr 0.02239
Train [26][390/3239]	Time 0.609 (0.986)	Data Time 0.001 (0.065)	Loss 3.4153 (3.2074)	Entropy 0.85667 (0.85775)	Top-1 acc 42.578 (47.080)	Top-5 acc 68.750 (71.011)	lr 0.02239
Train [26][400/3239]	Time 0.616 (0.983)	Data Time 0.001 (0.063)	Loss 3.1812 (3.2061)	Entropy 0.85607 (0.85772)	Top-1 acc 49.609 (47.119)	Top-5 acc 71.875 (71.043)	lr 0.02239
Train [26][410/3239]	Time 0.676 (0.980)	Data Time 0.001 (0.062)	Loss 3.1645 (3.2063)	Entropy 0.85610 (0.85768)	Top-1 acc 48.438 (47.133)	Top-5 acc 69.922 (71.051)	lr 0.02239
Train [26][420/3239]	Time 0.582 (0.977)	Data Time 0.001 (0.060)	Loss 3.2308 (3.2067)	Entropy 0.85597 (0.85764)	Top-1 acc 51.172 (47.113)	Top-5 acc 71.484 (71.049)	lr 0.02239
Train [26][430/3239]	Time 0.566 (0.974)	Data Time 0.001 (0.059)	Loss 3.3736 (3.2076)	Entropy 0.85588 (0.85760)	Top-1 acc 47.266 (47.105)	Top-5 acc 71.094 (71.054)	lr 0.02239
Train [26][440/3239]	Time 0.589 (0.972)	Data Time 0.001 (0.058)	Loss 3.2033 (3.2084)	Entropy 0.85571 (0.85755)	Top-1 acc 47.656 (47.091)	Top-5 acc 73.047 (71.041)	lr 0.02239
Train [26][450/3239]	Time 0.617 (0.970)	Data Time 0.001 (0.056)	Loss 3.1673 (3.2080)	Entropy 0.85538 (0.85751)	Top-1 acc 51.172 (47.133)	Top-5 acc 73.047 (71.070)	lr 0.02239
Train [26][460/3239]	Time 0.595 (0.967)	Data Time 0.001 (0.055)	Loss 3.3728 (3.2079)	Entropy 0.85575 (0.85747)	Top-1 acc 43.750 (47.157)	Top-5 acc 67.188 (71.066)	lr 0.02239
Train [26][470/3239]	Time 0.609 (0.965)	Data Time 0.001 (0.054)	Loss 3.3164 (3.2089)	Entropy 0.85585 (0.85743)	Top-1 acc 43.750 (47.147)	Top-5 acc 69.922 (71.047)	lr 0.02239
Train [26][480/3239]	Time 0.701 (0.963)	Data Time 0.001 (0.053)	Loss 3.2018 (3.2086)	Entropy 0.85612 (0.85740)	Top-1 acc 48.047 (47.162)	Top-5 acc 68.750 (71.063)	lr 0.02239
Train [26][490/3239]	Time 0.604 (0.961)	Data Time 0.001 (0.052)	Loss 3.1528 (3.2080)	Entropy 0.85597 (0.85738)	Top-1 acc 47.266 (47.161)	Top-5 acc 74.219 (71.085)	lr 0.02239
Train [26][500/3239]	Time 0.639 (0.959)	Data Time 0.001 (0.051)	Loss 2.9528 (3.2072)	Entropy 0.85531 (0.85735)	Top-1 acc 53.516 (47.186)	Top-5 acc 73.438 (71.118)	lr 0.02239
Train [26][510/3239]	Time 0.601 (0.957)	Data Time 0.001 (0.050)	Loss 3.1609 (3.2077)	Entropy 0.85540 (0.85731)	Top-1 acc 49.609 (47.195)	Top-5 acc 71.094 (71.112)	lr 0.02239
Train [26][520/3239]	Time 0.608 (0.956)	Data Time 0.001 (0.049)	Loss 3.2115 (3.2076)	Entropy 0.85552 (0.85727)	Top-1 acc 43.750 (47.191)	Top-5 acc 72.656 (71.120)	lr 0.02238
Train [26][530/3239]	Time 0.590 (0.954)	Data Time 0.001 (0.048)	Loss 3.0791 (3.2075)	Entropy 0.85562 (0.85724)	Top-1 acc 51.562 (47.209)	Top-5 acc 75.391 (71.122)	lr 0.02238
Train [26][540/3239]	Time 0.629 (0.952)	Data Time 0.001 (0.047)	Loss 3.1988 (3.2072)	Entropy 0.85579 (0.85721)	Top-1 acc 50.781 (47.222)	Top-5 acc 67.969 (71.109)	lr 0.02238
Train [26][550/3239]	Time 0.506 (0.950)	Data Time 0.001 (0.047)	Loss 2.9294 (3.2068)	Entropy 0.85578 (0.85718)	Top-1 acc 53.516 (47.232)	Top-5 acc 77.734 (71.131)	lr 0.02238
Train [26][560/3239]	Time 0.580 (0.948)	Data Time 0.002 (0.046)	Loss 3.0429 (3.2068)	Entropy 0.85573 (0.85716)	Top-1 acc 51.172 (47.221)	Top-5 acc 72.656 (71.136)	lr 0.02238
Train [26][570/3239]	Time 0.543 (0.946)	Data Time 0.001 (0.045)	Loss 3.3340 (3.2062)	Entropy 0.85553 (0.85713)	Top-1 acc 46.875 (47.244)	Top-5 acc 67.188 (71.144)	lr 0.02238
Train [26][580/3239]	Time 0.594 (0.944)	Data Time 0.001 (0.044)	Loss 3.2226 (3.2066)	Entropy 0.85601 (0.85710)	Top-1 acc 47.656 (47.237)	Top-5 acc 69.922 (71.166)	lr 0.02238
Train [26][590/3239]	Time 0.595 (0.943)	Data Time 0.001 (0.044)	Loss 3.2837 (3.2055)	Entropy 0.85552 (0.85708)	Top-1 acc 46.094 (47.260)	Top-5 acc 71.875 (71.194)	lr 0.02238
Train [26][600/3239]	Time 0.596 (0.941)	Data Time 0.001 (0.043)	Loss 3.1944 (3.2064)	Entropy 0.85568 (0.85705)	Top-1 acc 46.484 (47.247)	Top-5 acc 71.484 (71.180)	lr 0.02238
Train [26][610/3239]	Time 0.612 (0.940)	Data Time 0.001 (0.042)	Loss 2.8943 (3.2051)	Entropy 0.85610 (0.85703)	Top-1 acc 55.859 (47.287)	Top-5 acc 75.781 (71.202)	lr 0.02238
Train [26][620/3239]	Time 0.603 (0.939)	Data Time 0.001 (0.041)	Loss 3.4846 (3.2052)	Entropy 0.85631 (0.85702)	Top-1 acc 43.750 (47.278)	Top-5 acc 67.578 (71.204)	lr 0.02238
Train [26][630/3239]	Time 0.584 (0.938)	Data Time 0.001 (0.041)	Loss 3.3393 (3.2056)	Entropy 0.85632 (0.85701)	Top-1 acc 44.922 (47.277)	Top-5 acc 69.141 (71.196)	lr 0.02238
Train [26][640/3239]	Time 0.684 (0.936)	Data Time 0.001 (0.040)	Loss 2.8782 (3.2052)	Entropy 0.85626 (0.85700)	Top-1 acc 54.688 (47.280)	Top-5 acc 77.734 (71.204)	lr 0.02238
Train [26][650/3239]	Time 0.625 (0.935)	Data Time 0.001 (0.040)	Loss 3.3541 (3.2055)	Entropy 0.85639 (0.85699)	Top-1 acc 43.359 (47.282)	Top-5 acc 66.406 (71.192)	lr 0.02238
Train [26][660/3239]	Time 0.573 (0.934)	Data Time 0.001 (0.039)	Loss 3.3451 (3.2054)	Entropy 0.85652 (0.85698)	Top-1 acc 43.359 (47.290)	Top-5 acc 69.531 (71.198)	lr 0.02238
Train [26][670/3239]	Time 0.640 (0.933)	Data Time 0.001 (0.039)	Loss 3.0733 (3.2051)	Entropy 0.85668 (0.85697)	Top-1 acc 49.609 (47.283)	Top-5 acc 71.094 (71.196)	lr 0.02238
Train [26][680/3239]	Time 0.587 (0.932)	Data Time 0.001 (0.038)	Loss 3.1167 (3.2055)	Entropy 0.85676 (0.85697)	Top-1 acc 50.391 (47.271)	Top-5 acc 73.438 (71.187)	lr 0.02237
Train [26][690/3239]	Time 0.617 (0.931)	Data Time 0.001 (0.037)	Loss 3.3037 (3.2059)	Entropy 0.85662 (0.85697)	Top-1 acc 46.875 (47.263)	Top-5 acc 69.922 (71.175)	lr 0.02237
Train [26][700/3239]	Time 0.623 (0.930)	Data Time 0.001 (0.037)	Loss 3.0825 (3.2066)	Entropy 0.85655 (0.85696)	Top-1 acc 50.391 (47.250)	Top-5 acc 72.656 (71.163)	lr 0.02237
Train [26][710/3239]	Time 0.728 (0.929)	Data Time 0.001 (0.036)	Loss 3.2143 (3.2069)	Entropy 0.85661 (0.85696)	Top-1 acc 48.047 (47.243)	Top-5 acc 69.141 (71.153)	lr 0.02237
Train [26][720/3239]	Time 0.622 (0.928)	Data Time 0.001 (0.036)	Loss 3.1731 (3.2075)	Entropy 0.85658 (0.85695)	Top-1 acc 50.391 (47.221)	Top-5 acc 69.531 (71.145)	lr 0.02237
Train [26][730/3239]	Time 0.582 (0.926)	Data Time 0.001 (0.036)	Loss 3.2348 (3.2073)	Entropy 0.85616 (0.85694)	Top-1 acc 48.047 (47.226)	Top-5 acc 69.531 (71.151)	lr 0.02237
Train [26][740/3239]	Time 0.560 (0.925)	Data Time 0.001 (0.035)	Loss 3.2701 (3.2069)	Entropy 0.85622 (0.85693)	Top-1 acc 46.094 (47.233)	Top-5 acc 70.703 (71.161)	lr 0.02237
Train [26][750/3239]	Time 0.597 (0.924)	Data Time 0.001 (0.035)	Loss 2.8925 (3.2070)	Entropy 0.85647 (0.85693)	Top-1 acc 51.953 (47.230)	Top-5 acc 78.516 (71.170)	lr 0.02237
Train [26][760/3239]	Time 0.617 (0.924)	Data Time 0.002 (0.034)	Loss 3.1385 (3.2073)	Entropy 0.85663 (0.85692)	Top-1 acc 51.172 (47.229)	Top-5 acc 73.047 (71.158)	lr 0.02237
Train [26][770/3239]	Time 0.639 (0.923)	Data Time 0.001 (0.034)	Loss 3.3054 (3.2080)	Entropy 0.85631 (0.85692)	Top-1 acc 45.312 (47.226)	Top-5 acc 70.312 (71.143)	lr 0.02237
Train [26][780/3239]	Time 0.602 (0.922)	Data Time 0.001 (0.033)	Loss 3.3958 (3.2077)	Entropy 0.85578 (0.85691)	Top-1 acc 38.672 (47.227)	Top-5 acc 70.703 (71.163)	lr 0.02237
Train [26][790/3239]	Time 0.637 (0.921)	Data Time 0.001 (0.033)	Loss 3.0501 (3.2077)	Entropy 0.85594 (0.85689)	Top-1 acc 49.219 (47.221)	Top-5 acc 75.000 (71.161)	lr 0.02237
Train [26][800/3239]	Time 0.701 (0.921)	Data Time 0.001 (0.033)	Loss 3.1821 (3.2072)	Entropy 0.85549 (0.85688)	Top-1 acc 46.094 (47.221)	Top-5 acc 71.875 (71.169)	lr 0.02237
Train [26][810/3239]	Time 0.588 (0.920)	Data Time 0.002 (0.032)	Loss 3.3494 (3.2082)	Entropy 0.85557 (0.85686)	Top-1 acc 43.359 (47.200)	Top-5 acc 68.359 (71.139)	lr 0.02237
Train [26][820/3239]	Time 0.608 (0.919)	Data Time 0.001 (0.032)	Loss 3.2496 (3.2081)	Entropy 0.85547 (0.85685)	Top-1 acc 44.531 (47.195)	Top-5 acc 69.922 (71.130)	lr 0.02237
Train [26][830/3239]	Time 0.608 (0.919)	Data Time 0.001 (0.031)	Loss 3.2332 (3.2079)	Entropy 0.85536 (0.85683)	Top-1 acc 48.047 (47.196)	Top-5 acc 68.750 (71.121)	lr 0.02237
Train [26][840/3239]	Time 0.575 (0.918)	Data Time 0.001 (0.031)	Loss 3.2968 (3.2088)	Entropy 0.85549 (0.85681)	Top-1 acc 44.922 (47.189)	Top-5 acc 70.312 (71.111)	lr 0.02237
Train [26][850/3239]	Time 0.562 (0.946)	Data Time 0.002 (0.031)	Loss 3.3079 (3.2089)	Entropy 0.85563 (0.85680)	Top-1 acc 44.531 (47.194)	Top-5 acc 67.969 (71.106)	lr 0.02236
Train [26][860/3239]	Time 0.503 (0.945)	Data Time 0.002 (0.030)	Loss 3.1414 (3.2083)	Entropy 0.85523 (0.85678)	Top-1 acc 49.609 (47.194)	Top-5 acc 73.828 (71.118)	lr 0.02236
Train [26][870/3239]	Time 0.603 (0.944)	Data Time 0.001 (0.030)	Loss 3.5712 (3.2084)	Entropy 0.85526 (0.85676)	Top-1 acc 41.406 (47.199)	Top-5 acc 65.625 (71.115)	lr 0.02236
Train [26][880/3239]	Time 0.596 (0.943)	Data Time 0.001 (0.030)	Loss 3.0792 (3.2084)	Entropy 0.85516 (0.85675)	Top-1 acc 48.828 (47.196)	Top-5 acc 73.047 (71.115)	lr 0.02236
Train [26][890/3239]	Time 0.613 (0.942)	Data Time 0.001 (0.030)	Loss 3.1630 (3.2090)	Entropy 0.85499 (0.85673)	Top-1 acc 48.438 (47.175)	Top-5 acc 69.531 (71.099)	lr 0.02236
Train [26][900/3239]	Time 0.611 (0.941)	Data Time 0.001 (0.029)	Loss 3.2586 (3.2084)	Entropy 0.85478 (0.85671)	Top-1 acc 47.266 (47.191)	Top-5 acc 73.438 (71.118)	lr 0.02236
Train [26][910/3239]	Time 0.588 (0.940)	Data Time 0.001 (0.029)	Loss 3.2120 (3.2086)	Entropy 0.85458 (0.85669)	Top-1 acc 48.047 (47.189)	Top-5 acc 71.094 (71.107)	lr 0.02236
Train [26][920/3239]	Time 0.601 (0.939)	Data Time 0.001 (0.029)	Loss 3.2780 (3.2086)	Entropy 0.85456 (0.85666)	Top-1 acc 42.969 (47.180)	Top-5 acc 71.094 (71.104)	lr 0.02236
Train [26][930/3239]	Time 0.567 (0.938)	Data Time 0.001 (0.028)	Loss 3.0201 (3.2090)	Entropy 0.85469 (0.85664)	Top-1 acc 50.781 (47.182)	Top-5 acc 75.781 (71.100)	lr 0.02236
Train [26][940/3239]	Time 0.577 (0.937)	Data Time 0.002 (0.028)	Loss 3.3159 (3.2093)	Entropy 0.85505 (0.85662)	Top-1 acc 47.656 (47.183)	Top-5 acc 67.578 (71.096)	lr 0.02236
Train [26][950/3239]	Time 0.584 (0.936)	Data Time 0.001 (0.028)	Loss 3.2760 (3.2093)	Entropy 0.85505 (0.85660)	Top-1 acc 47.656 (47.197)	Top-5 acc 69.922 (71.090)	lr 0.02236
Train [26][960/3239]	Time 0.662 (0.936)	Data Time 0.001 (0.028)	Loss 3.3657 (3.2096)	Entropy 0.85531 (0.85659)	Top-1 acc 44.922 (47.189)	Top-5 acc 68.359 (71.084)	lr 0.02236
Train [26][970/3239]	Time 0.673 (0.935)	Data Time 0.003 (0.027)	Loss 3.1515 (3.2088)	Entropy 0.85520 (0.85658)	Top-1 acc 47.656 (47.190)	Top-5 acc 73.047 (71.101)	lr 0.02236
Train [26][980/3239]	Time 0.610 (0.934)	Data Time 0.001 (0.027)	Loss 3.1738 (3.2088)	Entropy 0.85524 (0.85656)	Top-1 acc 44.531 (47.185)	Top-5 acc 72.266 (71.103)	lr 0.02236
Train [26][990/3239]	Time 0.609 (0.934)	Data Time 0.001 (0.027)	Loss 3.1788 (3.2086)	Entropy 0.85517 (0.85655)	Top-1 acc 48.047 (47.195)	Top-5 acc 68.750 (71.103)	lr 0.02236
Train [26][1000/3239]	Time 0.582 (0.933)	Data Time 0.001 (0.027)	Loss 3.2815 (3.2077)	Entropy 0.85464 (0.85653)	Top-1 acc 49.219 (47.225)	Top-5 acc 66.797 (71.122)	lr 0.02236
Train [26][1010/3239]	Time 0.635 (0.932)	Data Time 0.001 (0.026)	Loss 3.2769 (3.2077)	Entropy 0.85468 (0.85651)	Top-1 acc 46.875 (47.222)	Top-5 acc 69.531 (71.118)	lr 0.02235
Train [26][1020/3239]	Time 0.578 (0.931)	Data Time 0.002 (0.026)	Loss 2.9224 (3.2077)	Entropy 0.85488 (0.85649)	Top-1 acc 55.078 (47.227)	Top-5 acc 75.391 (71.115)	lr 0.02235
Train [26][1030/3239]	Time 0.627 (0.930)	Data Time 0.001 (0.026)	Loss 3.2057 (3.2076)	Entropy 0.85521 (0.85648)	Top-1 acc 46.875 (47.219)	Top-5 acc 70.703 (71.114)	lr 0.02235
Train [26][1040/3239]	Time 0.606 (0.929)	Data Time 0.001 (0.026)	Loss 3.1049 (3.2065)	Entropy 0.85484 (0.85647)	Top-1 acc 50.391 (47.245)	Top-5 acc 75.391 (71.142)	lr 0.02235
Train [26][1050/3239]	Time 0.573 (0.929)	Data Time 0.001 (0.025)	Loss 2.9825 (3.2061)	Entropy 0.85512 (0.85645)	Top-1 acc 51.562 (47.247)	Top-5 acc 76.953 (71.154)	lr 0.02235
Train [26][1060/3239]	Time 0.617 (0.928)	Data Time 0.001 (0.025)	Loss 3.2042 (3.2063)	Entropy 0.85482 (0.85644)	Top-1 acc 47.266 (47.242)	Top-5 acc 71.875 (71.147)	lr 0.02235
Train [26][1070/3239]	Time 0.616 (0.927)	Data Time 0.001 (0.025)	Loss 3.1710 (3.2064)	Entropy 0.85534 (0.85643)	Top-1 acc 46.484 (47.239)	Top-5 acc 73.438 (71.146)	lr 0.02235
Train [26][1080/3239]	Time 0.605 (0.927)	Data Time 0.001 (0.025)	Loss 3.3323 (3.2070)	Entropy 0.85527 (0.85642)	Top-1 acc 45.703 (47.223)	Top-5 acc 67.969 (71.127)	lr 0.02235
Train [26][1090/3239]	Time 0.609 (0.926)	Data Time 0.001 (0.024)	Loss 3.1491 (3.2075)	Entropy 0.85532 (0.85641)	Top-1 acc 46.484 (47.212)	Top-5 acc 71.484 (71.115)	lr 0.02235
Train [26][1100/3239]	Time 0.567 (0.926)	Data Time 0.001 (0.024)	Loss 3.3360 (3.2074)	Entropy 0.85511 (0.85640)	Top-1 acc 47.656 (47.203)	Top-5 acc 66.797 (71.126)	lr 0.02235
Train [26][1110/3239]	Time 0.592 (0.925)	Data Time 0.001 (0.024)	Loss 3.2701 (3.2075)	Entropy 0.85496 (0.85638)	Top-1 acc 45.312 (47.197)	Top-5 acc 69.922 (71.120)	lr 0.02235
Train [26][1120/3239]	Time 0.723 (0.925)	Data Time 0.002 (0.024)	Loss 3.1845 (3.2074)	Entropy 0.85492 (0.85637)	Top-1 acc 46.094 (47.199)	Top-5 acc 74.219 (71.128)	lr 0.02235
Train [26][1130/3239]	Time 0.629 (0.924)	Data Time 0.001 (0.024)	Loss 3.0816 (3.2078)	Entropy 0.85418 (0.85636)	Top-1 acc 51.172 (47.202)	Top-5 acc 75.000 (71.121)	lr 0.02235
Train [26][1140/3239]	Time 0.607 (0.924)	Data Time 0.002 (0.024)	Loss 3.1871 (3.2077)	Entropy 0.85389 (0.85634)	Top-1 acc 46.875 (47.205)	Top-5 acc 73.438 (71.127)	lr 0.02235
Train [26][1150/3239]	Time 0.616 (0.923)	Data Time 0.001 (0.023)	Loss 3.1671 (3.2080)	Entropy 0.85370 (0.85631)	Top-1 acc 44.531 (47.205)	Top-5 acc 72.656 (71.121)	lr 0.02235
Train [26][1160/3239]	Time 0.583 (0.922)	Data Time 0.001 (0.023)	Loss 3.1961 (3.2078)	Entropy 0.85307 (0.85629)	Top-1 acc 48.828 (47.214)	Top-5 acc 69.141 (71.132)	lr 0.02235
Train [26][1170/3239]	Time 0.611 (0.922)	Data Time 0.001 (0.023)	Loss 3.2110 (3.2076)	Entropy 0.85271 (0.85626)	Top-1 acc 46.875 (47.221)	Top-5 acc 71.875 (71.142)	lr 0.02234
Train [26][1180/3239]	Time 0.631 (0.921)	Data Time 0.001 (0.023)	Loss 3.0181 (3.2079)	Entropy 0.85279 (0.85623)	Top-1 acc 51.172 (47.215)	Top-5 acc 74.609 (71.134)	lr 0.02234
Train [26][1190/3239]	Time 0.685 (0.921)	Data Time 0.001 (0.023)	Loss 3.3278 (3.2078)	Entropy 0.85269 (0.85620)	Top-1 acc 47.266 (47.231)	Top-5 acc 66.797 (71.134)	lr 0.02234
Train [26][1200/3239]	Time 0.598 (0.920)	Data Time 0.001 (0.022)	Loss 3.3601 (3.2083)	Entropy 0.85249 (0.85617)	Top-1 acc 41.797 (47.210)	Top-5 acc 68.359 (71.124)	lr 0.02234
Train [26][1210/3239]	Time 0.599 (0.919)	Data Time 0.001 (0.022)	Loss 3.4053 (3.2091)	Entropy 0.85207 (0.85614)	Top-1 acc 40.625 (47.189)	Top-5 acc 63.672 (71.106)	lr 0.02234
Train [26][1220/3239]	Time 0.591 (0.919)	Data Time 0.001 (0.022)	Loss 3.1218 (3.2088)	Entropy 0.85188 (0.85611)	Top-1 acc 49.609 (47.184)	Top-5 acc 73.828 (71.117)	lr 0.02234
Train [26][1230/3239]	Time 0.624 (0.919)	Data Time 0.001 (0.022)	Loss 3.1986 (3.2086)	Entropy 0.85150 (0.85607)	Top-1 acc 48.828 (47.197)	Top-5 acc 73.828 (71.123)	lr 0.02234
Train [26][1240/3239]	Time 0.565 (0.918)	Data Time 0.001 (0.022)	Loss 3.2342 (3.2084)	Entropy 0.85112 (0.85603)	Top-1 acc 52.344 (47.214)	Top-5 acc 71.484 (71.126)	lr 0.02234
Train [26][1250/3239]	Time 0.602 (0.918)	Data Time 0.001 (0.022)	Loss 3.4434 (3.2084)	Entropy 0.85143 (0.85600)	Top-1 acc 43.359 (47.213)	Top-5 acc 67.578 (71.123)	lr 0.02234
Train [26][1260/3239]	Time 0.634 (0.917)	Data Time 0.001 (0.021)	Loss 3.1660 (3.2087)	Entropy 0.85160 (0.85596)	Top-1 acc 44.141 (47.201)	Top-5 acc 71.094 (71.116)	lr 0.02234
Train [26][1270/3239]	Time 0.573 (0.917)	Data Time 0.001 (0.021)	Loss 3.0856 (3.2085)	Entropy 0.85146 (0.85592)	Top-1 acc 50.391 (47.208)	Top-5 acc 72.266 (71.119)	lr 0.02234
Train [26][1280/3239]	Time 0.611 (0.917)	Data Time 0.001 (0.021)	Loss 3.0422 (3.2084)	Entropy 0.85190 (0.85589)	Top-1 acc 50.000 (47.204)	Top-5 acc 73.438 (71.116)	lr 0.02234
Train [26][1290/3239]	Time 0.595 (0.916)	Data Time 0.001 (0.021)	Loss 3.2628 (3.2082)	Entropy 0.85176 (0.85586)	Top-1 acc 44.531 (47.199)	Top-5 acc 68.750 (71.116)	lr 0.02234
Train [26][1300/3239]	Time 0.604 (0.916)	Data Time 0.001 (0.021)	Loss 3.1865 (3.2080)	Entropy 0.85162 (0.85583)	Top-1 acc 46.094 (47.208)	Top-5 acc 70.703 (71.124)	lr 0.02234
Train [26][1310/3239]	Time 0.603 (0.915)	Data Time 0.001 (0.021)	Loss 3.2793 (3.2078)	Entropy 0.85177 (0.85579)	Top-1 acc 42.969 (47.212)	Top-5 acc 68.359 (71.124)	lr 0.02234
Train [26][1320/3239]	Time 0.622 (0.915)	Data Time 0.001 (0.021)	Loss 3.1388 (3.2079)	Entropy 0.85172 (0.85576)	Top-1 acc 49.609 (47.211)	Top-5 acc 71.094 (71.113)	lr 0.02234
Train [26][1330/3239]	Time 0.548 (0.914)	Data Time 0.001 (0.020)	Loss 3.3344 (3.2085)	Entropy 0.85150 (0.85573)	Top-1 acc 41.406 (47.200)	Top-5 acc 69.922 (71.099)	lr 0.02233
Train [26][1340/3239]	Time 0.631 (0.914)	Data Time 0.001 (0.020)	Loss 3.3905 (3.2092)	Entropy 0.85122 (0.85570)	Top-1 acc 44.141 (47.179)	Top-5 acc 67.578 (71.084)	lr 0.02233
Train [26][1350/3239]	Time 0.781 (0.913)	Data Time 0.001 (0.020)	Loss 3.0053 (3.2096)	Entropy 0.85081 (0.85567)	Top-1 acc 51.172 (47.175)	Top-5 acc 77.734 (71.077)	lr 0.02233
Train [26][1360/3239]	Time 0.620 (0.913)	Data Time 0.001 (0.020)	Loss 3.1800 (3.2092)	Entropy 0.85075 (0.85563)	Top-1 acc 45.703 (47.176)	Top-5 acc 70.312 (71.087)	lr 0.02233
Train [26][1370/3239]	Time 0.565 (0.912)	Data Time 0.001 (0.020)	Loss 3.3386 (3.2090)	Entropy 0.85052 (0.85559)	Top-1 acc 46.875 (47.178)	Top-5 acc 66.797 (71.091)	lr 0.02233
Train [26][1380/3239]	Time 0.606 (0.912)	Data Time 0.001 (0.020)	Loss 3.2513 (3.2088)	Entropy 0.84995 (0.85556)	Top-1 acc 50.391 (47.190)	Top-5 acc 71.484 (71.093)	lr 0.02233
Train [26][1390/3239]	Time 0.603 (0.911)	Data Time 0.002 (0.020)	Loss 3.2093 (3.2084)	Entropy 0.84995 (0.85552)	Top-1 acc 48.047 (47.192)	Top-5 acc 71.484 (71.097)	lr 0.02233
Train [26][1400/3239]	Time 0.611 (0.911)	Data Time 0.001 (0.019)	Loss 3.3265 (3.2087)	Entropy 0.84999 (0.85548)	Top-1 acc 47.656 (47.194)	Top-5 acc 68.359 (71.089)	lr 0.02233
Train [26][1410/3239]	Time 0.587 (0.910)	Data Time 0.001 (0.019)	Loss 3.2038 (3.2086)	Entropy 0.84995 (0.85544)	Top-1 acc 46.094 (47.204)	Top-5 acc 69.531 (71.093)	lr 0.02233
Train [26][1420/3239]	Time 0.711 (0.910)	Data Time 0.001 (0.019)	Loss 3.1552 (3.2082)	Entropy 0.84975 (0.85540)	Top-1 acc 49.219 (47.207)	Top-5 acc 71.875 (71.099)	lr 0.02233
Train [26][1430/3239]	Time 0.639 (0.910)	Data Time 0.001 (0.019)	Loss 3.1442 (3.2082)	Entropy 0.84960 (0.85536)	Top-1 acc 48.438 (47.206)	Top-5 acc 73.828 (71.099)	lr 0.02233
Train [26][1440/3239]	Time 0.613 (0.909)	Data Time 0.001 (0.019)	Loss 2.9167 (3.2076)	Entropy 0.84969 (0.85532)	Top-1 acc 54.297 (47.221)	Top-5 acc 76.172 (71.115)	lr 0.02233
Train [26][1450/3239]	Time 0.585 (0.909)	Data Time 0.001 (0.019)	Loss 3.1655 (3.2077)	Entropy 0.84967 (0.85528)	Top-1 acc 45.703 (47.213)	Top-5 acc 72.656 (71.111)	lr 0.02233
Train [26][1460/3239]	Time 0.647 (0.909)	Data Time 0.001 (0.019)	Loss 3.2247 (3.2076)	Entropy 0.84956 (0.85524)	Top-1 acc 46.094 (47.215)	Top-5 acc 73.438 (71.109)	lr 0.02233
Train [26][1470/3239]	Time 0.602 (0.908)	Data Time 0.001 (0.019)	Loss 3.0713 (3.2074)	Entropy 0.84920 (0.85520)	Top-1 acc 50.391 (47.223)	Top-5 acc 75.391 (71.116)	lr 0.02233
Train [26][1480/3239]	Time 0.579 (0.908)	Data Time 0.001 (0.019)	Loss 3.2785 (3.2073)	Entropy 0.84868 (0.85516)	Top-1 acc 44.922 (47.227)	Top-5 acc 67.969 (71.113)	lr 0.02233
Train [26][1490/3239]	Time 0.625 (0.908)	Data Time 0.002 (0.018)	Loss 3.2934 (3.2075)	Entropy 0.84852 (0.85511)	Top-1 acc 47.266 (47.222)	Top-5 acc 69.531 (71.114)	lr 0.02232
Train [26][1500/3239]	Time 0.721 (0.923)	Data Time 0.006 (0.018)	Loss 3.2820 (3.2076)	Entropy 0.84818 (0.85507)	Top-1 acc 45.312 (47.223)	Top-5 acc 68.750 (71.113)	lr 0.02232
Train [26][1510/3239]	Time 0.714 (0.922)	Data Time 0.002 (0.018)	Loss 3.3372 (3.2076)	Entropy 0.84823 (0.85502)	Top-1 acc 46.484 (47.226)	Top-5 acc 72.656 (71.111)	lr 0.02232
Train [26][1520/3239]	Time 0.626 (0.922)	Data Time 0.004 (0.018)	Loss 3.1779 (3.2078)	Entropy 0.84820 (0.85498)	Top-1 acc 46.094 (47.213)	Top-5 acc 73.828 (71.110)	lr 0.02232
Train [26][1530/3239]	Time 0.614 (0.922)	Data Time 0.001 (0.018)	Loss 3.0681 (3.2077)	Entropy 0.84847 (0.85494)	Top-1 acc 49.609 (47.215)	Top-5 acc 73.828 (71.112)	lr 0.02232
Train [26][1540/3239]	Time 0.597 (0.922)	Data Time 0.001 (0.018)	Loss 3.0210 (3.2077)	Entropy 0.84833 (0.85489)	Top-1 acc 50.391 (47.214)	Top-5 acc 76.172 (71.116)	lr 0.02232
Train [26][1550/3239]	Time 0.614 (0.921)	Data Time 0.001 (0.018)	Loss 3.1387 (3.2076)	Entropy 0.84820 (0.85485)	Top-1 acc 49.219 (47.214)	Top-5 acc 69.922 (71.112)	lr 0.02232
Train [26][1560/3239]	Time 0.607 (0.921)	Data Time 0.001 (0.018)	Loss 3.2626 (3.2077)	Entropy 0.84806 (0.85481)	Top-1 acc 48.438 (47.214)	Top-5 acc 69.141 (71.109)	lr 0.02232
Train [26][1570/3239]	Time 0.595 (0.920)	Data Time 0.001 (0.018)	Loss 3.2363 (3.2078)	Entropy 0.84765 (0.85476)	Top-1 acc 48.047 (47.211)	Top-5 acc 68.750 (71.105)	lr 0.02232
Train [26][1580/3239]	Time 0.741 (0.920)	Data Time 0.001 (0.018)	Loss 3.3527 (3.2077)	Entropy 0.84802 (0.85472)	Top-1 acc 43.750 (47.218)	Top-5 acc 69.531 (71.112)	lr 0.02232
Train [26][1590/3239]	Time 0.613 (0.920)	Data Time 0.001 (0.017)	Loss 3.1297 (3.2074)	Entropy 0.84817 (0.85468)	Top-1 acc 50.781 (47.225)	Top-5 acc 71.875 (71.115)	lr 0.02232
Train [26][1600/3239]	Time 0.590 (0.919)	Data Time 0.001 (0.017)	Loss 3.1175 (3.2072)	Entropy 0.84788 (0.85464)	Top-1 acc 47.266 (47.224)	Top-5 acc 72.656 (71.121)	lr 0.02232
Train [26][1610/3239]	Time 0.600 (0.919)	Data Time 0.001 (0.017)	Loss 3.1694 (3.2070)	Entropy 0.84808 (0.85459)	Top-1 acc 49.219 (47.223)	Top-5 acc 69.531 (71.122)	lr 0.02232
Train [26][1620/3239]	Time 0.569 (0.919)	Data Time 0.001 (0.017)	Loss 3.1746 (3.2066)	Entropy 0.84843 (0.85456)	Top-1 acc 48.438 (47.241)	Top-5 acc 71.875 (71.128)	lr 0.02232
Train [26][1630/3239]	Time 0.610 (0.918)	Data Time 0.001 (0.017)	Loss 3.2843 (3.2072)	Entropy 0.84849 (0.85452)	Top-1 acc 42.969 (47.225)	Top-5 acc 69.531 (71.112)	lr 0.02232
Train [26][1640/3239]	Time 0.591 (0.918)	Data Time 0.001 (0.017)	Loss 3.0691 (3.2072)	Entropy 0.84828 (0.85448)	Top-1 acc 51.172 (47.224)	Top-5 acc 75.781 (71.109)	lr 0.02232
Train [26][1650/3239]	Time 0.625 (0.918)	Data Time 0.001 (0.017)	Loss 3.0957 (3.2069)	Entropy 0.84793 (0.85444)	Top-1 acc 48.438 (47.227)	Top-5 acc 74.609 (71.115)	lr 0.02231
Train [26][1660/3239]	Time 0.569 (0.917)	Data Time 0.001 (0.017)	Loss 3.5224 (3.2073)	Entropy 0.84795 (0.85440)	Top-1 acc 38.672 (47.217)	Top-5 acc 65.625 (71.106)	lr 0.02231
Train [26][1670/3239]	Time 0.635 (0.917)	Data Time 0.001 (0.017)	Loss 3.2172 (3.2072)	Entropy 0.84762 (0.85436)	Top-1 acc 48.047 (47.222)	Top-5 acc 70.312 (71.108)	lr 0.02231
Train [26][1680/3239]	Time 0.580 (0.916)	Data Time 0.001 (0.017)	Loss 3.3951 (3.2072)	Entropy 0.84824 (0.85432)	Top-1 acc 43.750 (47.231)	Top-5 acc 68.750 (71.107)	lr 0.02231
Train [26][1690/3239]	Time 0.604 (0.916)	Data Time 0.001 (0.017)	Loss 3.1822 (3.2074)	Entropy 0.84809 (0.85429)	Top-1 acc 48.438 (47.227)	Top-5 acc 72.266 (71.101)	lr 0.02231
Train [26][1700/3239]	Time 0.606 (0.916)	Data Time 0.001 (0.016)	Loss 3.4108 (3.2077)	Entropy 0.84819 (0.85425)	Top-1 acc 46.875 (47.230)	Top-5 acc 67.969 (71.093)	lr 0.02231
Train [26][1710/3239]	Time 0.632 (0.915)	Data Time 0.002 (0.016)	Loss 3.2239 (3.2079)	Entropy 0.84831 (0.85421)	Top-1 acc 50.000 (47.232)	Top-5 acc 68.750 (71.089)	lr 0.02231
Train [26][1720/3239]	Time 0.635 (0.915)	Data Time 0.001 (0.016)	Loss 3.2568 (3.2080)	Entropy 0.84843 (0.85418)	Top-1 acc 45.703 (47.227)	Top-5 acc 69.922 (71.086)	lr 0.02231
Train [26][1730/3239]	Time 0.610 (0.915)	Data Time 0.002 (0.016)	Loss 3.2768 (3.2081)	Entropy 0.84835 (0.85415)	Top-1 acc 48.047 (47.224)	Top-5 acc 71.484 (71.085)	lr 0.02231
Train [26][1740/3239]	Time 0.720 (0.915)	Data Time 0.001 (0.016)	Loss 3.1747 (3.2078)	Entropy 0.84841 (0.85411)	Top-1 acc 46.484 (47.227)	Top-5 acc 70.703 (71.095)	lr 0.02231
Train [26][1750/3239]	Time 0.642 (0.914)	Data Time 0.001 (0.016)	Loss 3.2189 (3.2076)	Entropy 0.84840 (0.85408)	Top-1 acc 46.484 (47.233)	Top-5 acc 70.703 (71.095)	lr 0.02231
Train [26][1760/3239]	Time 0.611 (0.914)	Data Time 0.001 (0.016)	Loss 3.1063 (3.2076)	Entropy 0.84821 (0.85405)	Top-1 acc 47.656 (47.231)	Top-5 acc 75.000 (71.097)	lr 0.02231
Train [26][1770/3239]	Time 0.600 (0.914)	Data Time 0.001 (0.016)	Loss 3.2430 (3.2074)	Entropy 0.84791 (0.85402)	Top-1 acc 48.828 (47.241)	Top-5 acc 68.359 (71.104)	lr 0.02231
Train [26][1780/3239]	Time 0.630 (0.913)	Data Time 0.001 (0.016)	Loss 3.3025 (3.2071)	Entropy 0.84805 (0.85398)	Top-1 acc 47.656 (47.254)	Top-5 acc 65.234 (71.107)	lr 0.02231
Train [26][1790/3239]	Time 0.631 (0.913)	Data Time 0.001 (0.016)	Loss 3.0141 (3.2068)	Entropy 0.84838 (0.85395)	Top-1 acc 49.609 (47.256)	Top-5 acc 76.562 (71.117)	lr 0.02231
Train [26][1800/3239]	Time 0.602 (0.913)	Data Time 0.001 (0.016)	Loss 3.2475 (3.2069)	Entropy 0.84816 (0.85392)	Top-1 acc 48.047 (47.263)	Top-5 acc 66.406 (71.110)	lr 0.02231
Train [26][1810/3239]	Time 0.698 (0.912)	Data Time 0.001 (0.016)	Loss 3.5093 (3.2072)	Entropy 0.84822 (0.85389)	Top-1 acc 41.016 (47.255)	Top-5 acc 62.109 (71.101)	lr 0.02230
Train [26][1820/3239]	Time 0.605 (0.912)	Data Time 0.001 (0.015)	Loss 3.2300 (3.2072)	Entropy 0.84801 (0.85385)	Top-1 acc 50.000 (47.262)	Top-5 acc 74.609 (71.103)	lr 0.02230
Train [26][1830/3239]	Time 0.578 (0.912)	Data Time 0.001 (0.015)	Loss 3.2574 (3.2073)	Entropy 0.84790 (0.85382)	Top-1 acc 50.781 (47.264)	Top-5 acc 74.609 (71.100)	lr 0.02230
Train [26][1840/3239]	Time 0.598 (0.911)	Data Time 0.001 (0.015)	Loss 3.0938 (3.2071)	Entropy 0.84812 (0.85379)	Top-1 acc 49.609 (47.267)	Top-5 acc 72.656 (71.101)	lr 0.02230
Train [26][1850/3239]	Time 0.602 (0.911)	Data Time 0.003 (0.015)	Loss 3.4632 (3.2074)	Entropy 0.84807 (0.85376)	Top-1 acc 39.453 (47.258)	Top-5 acc 66.016 (71.088)	lr 0.02230
Train [26][1860/3239]	Time 0.597 (0.911)	Data Time 0.002 (0.015)	Loss 3.2556 (3.2076)	Entropy 0.84830 (0.85373)	Top-1 acc 43.750 (47.256)	Top-5 acc 70.703 (71.086)	lr 0.02230
Train [26][1870/3239]	Time 0.589 (0.910)	Data Time 0.001 (0.015)	Loss 3.3920 (3.2076)	Entropy 0.84807 (0.85370)	Top-1 acc 40.625 (47.252)	Top-5 acc 69.922 (71.084)	lr 0.02230
Train [26][1880/3239]	Time 0.606 (0.910)	Data Time 0.001 (0.015)	Loss 3.3139 (3.2078)	Entropy 0.84759 (0.85367)	Top-1 acc 48.438 (47.245)	Top-5 acc 66.797 (71.079)	lr 0.02230
Train [26][1890/3239]	Time 0.587 (0.910)	Data Time 0.001 (0.015)	Loss 3.5607 (3.2082)	Entropy 0.84787 (0.85364)	Top-1 acc 41.797 (47.236)	Top-5 acc 62.891 (71.069)	lr 0.02230
Train [26][1900/3239]	Time 0.718 (0.910)	Data Time 0.001 (0.015)	Loss 3.2785 (3.2082)	Entropy 0.84806 (0.85361)	Top-1 acc 46.875 (47.232)	Top-5 acc 69.531 (71.068)	lr 0.02230
Train [26][1910/3239]	Time 0.588 (0.909)	Data Time 0.001 (0.015)	Loss 3.5412 (3.2086)	Entropy 0.84810 (0.85358)	Top-1 acc 39.062 (47.221)	Top-5 acc 66.016 (71.063)	lr 0.02230
Train [26][1920/3239]	Time 0.629 (0.909)	Data Time 0.001 (0.015)	Loss 3.0183 (3.2083)	Entropy 0.84810 (0.85355)	Top-1 acc 50.391 (47.225)	Top-5 acc 76.953 (71.071)	lr 0.02230
Train [26][1930/3239]	Time 0.602 (0.909)	Data Time 0.002 (0.015)	Loss 3.2470 (3.2083)	Entropy 0.84788 (0.85352)	Top-1 acc 46.484 (47.226)	Top-5 acc 69.141 (71.071)	lr 0.02230
Train [26][1940/3239]	Time 0.607 (0.909)	Data Time 0.001 (0.015)	Loss 3.3950 (3.2083)	Entropy 0.84760 (0.85349)	Top-1 acc 44.141 (47.227)	Top-5 acc 65.625 (71.067)	lr 0.02230
Train [26][1950/3239]	Time 0.653 (0.908)	Data Time 0.001 (0.015)	Loss 3.2885 (3.2081)	Entropy 0.84782 (0.85346)	Top-1 acc 46.875 (47.230)	Top-5 acc 69.531 (71.073)	lr 0.02230
Train [26][1960/3239]	Time 0.609 (0.908)	Data Time 0.001 (0.014)	Loss 3.2490 (3.2081)	Entropy 0.84788 (0.85343)	Top-1 acc 45.312 (47.236)	Top-5 acc 69.531 (71.070)	lr 0.02230
Train [26][1970/3239]	Time 0.737 (0.908)	Data Time 0.002 (0.014)	Loss 3.1473 (3.2080)	Entropy 0.84768 (0.85341)	Top-1 acc 46.484 (47.235)	Top-5 acc 72.656 (71.074)	lr 0.02229
Train [26][1980/3239]	Time 0.592 (0.908)	Data Time 0.001 (0.014)	Loss 3.3564 (3.2078)	Entropy 0.84788 (0.85338)	Top-1 acc 44.531 (47.244)	Top-5 acc 66.016 (71.073)	lr 0.02229
Train [26][1990/3239]	Time 0.609 (0.908)	Data Time 0.001 (0.014)	Loss 3.2202 (3.2081)	Entropy 0.84785 (0.85335)	Top-1 acc 47.266 (47.234)	Top-5 acc 71.094 (71.066)	lr 0.02229
Train [26][2000/3239]	Time 0.561 (0.907)	Data Time 0.001 (0.014)	Loss 3.5221 (3.2082)	Entropy 0.84814 (0.85332)	Top-1 acc 39.062 (47.232)	Top-5 acc 64.453 (71.060)	lr 0.02229
Train [26][2010/3239]	Time 0.590 (0.907)	Data Time 0.002 (0.014)	Loss 2.9812 (3.2080)	Entropy 0.84839 (0.85330)	Top-1 acc 55.859 (47.240)	Top-5 acc 73.047 (71.063)	lr 0.02229
Train [26][2020/3239]	Time 0.495 (0.907)	Data Time 0.001 (0.014)	Loss 3.0184 (3.2076)	Entropy 0.84835 (0.85327)	Top-1 acc 53.516 (47.254)	Top-5 acc 73.438 (71.069)	lr 0.02229
Train [26][2030/3239]	Time 0.604 (0.906)	Data Time 0.001 (0.014)	Loss 3.0756 (3.2076)	Entropy 0.84808 (0.85325)	Top-1 acc 50.781 (47.261)	Top-5 acc 76.562 (71.074)	lr 0.02229
Train [26][2040/3239]	Time 0.605 (0.906)	Data Time 0.001 (0.014)	Loss 3.2336 (3.2076)	Entropy 0.84817 (0.85322)	Top-1 acc 47.266 (47.258)	Top-5 acc 69.922 (71.075)	lr 0.02229
Train [26][2050/3239]	Time 0.611 (0.906)	Data Time 0.001 (0.014)	Loss 3.0095 (3.2075)	Entropy 0.84834 (0.85320)	Top-1 acc 53.125 (47.258)	Top-5 acc 74.219 (71.074)	lr 0.02229
Train [26][2060/3239]	Time 0.637 (0.906)	Data Time 0.001 (0.014)	Loss 2.9768 (3.2070)	Entropy 0.84808 (0.85318)	Top-1 acc 53.906 (47.273)	Top-5 acc 76.172 (71.088)	lr 0.02229
Train [26][2070/3239]	Time 0.584 (0.906)	Data Time 0.001 (0.014)	Loss 3.1690 (3.2069)	Entropy 0.84817 (0.85315)	Top-1 acc 51.172 (47.277)	Top-5 acc 71.484 (71.089)	lr 0.02229
Train [26][2080/3239]	Time 0.610 (0.905)	Data Time 0.001 (0.014)	Loss 3.2023 (3.2069)	Entropy 0.84829 (0.85313)	Top-1 acc 46.875 (47.274)	Top-5 acc 68.750 (71.084)	lr 0.02229
Train [26][2090/3239]	Time 0.618 (0.905)	Data Time 0.001 (0.014)	Loss 3.4380 (3.2071)	Entropy 0.84860 (0.85311)	Top-1 acc 43.359 (47.273)	Top-5 acc 66.016 (71.079)	lr 0.02229
Train [26][2100/3239]	Time 0.619 (0.905)	Data Time 0.001 (0.014)	Loss 3.3186 (3.2072)	Entropy 0.84877 (0.85308)	Top-1 acc 42.188 (47.268)	Top-5 acc 67.578 (71.076)	lr 0.02229
Train [26][2110/3239]	Time 0.618 (0.905)	Data Time 0.001 (0.014)	Loss 3.2219 (3.2070)	Entropy 0.84849 (0.85306)	Top-1 acc 46.484 (47.269)	Top-5 acc 71.484 (71.080)	lr 0.02229
Train [26][2120/3239]	Time 0.609 (0.905)	Data Time 0.001 (0.014)	Loss 3.5123 (3.2065)	Entropy 0.84846 (0.85304)	Top-1 acc 42.578 (47.286)	Top-5 acc 68.359 (71.091)	lr 0.02229
Train [26][2130/3239]	Time 0.665 (0.904)	Data Time 0.001 (0.013)	Loss 3.2753 (3.2063)	Entropy 0.84827 (0.85302)	Top-1 acc 44.531 (47.289)	Top-5 acc 71.094 (71.093)	lr 0.02228
Train [26][2140/3239]	Time 0.561 (0.904)	Data Time 0.001 (0.013)	Loss 3.3432 (3.2068)	Entropy 0.84796 (0.85300)	Top-1 acc 45.312 (47.282)	Top-5 acc 65.625 (71.083)	lr 0.02228
Train [26][2150/3239]	Time 0.540 (0.904)	Data Time 0.001 (0.013)	Loss 3.3477 (3.2068)	Entropy 0.84796 (0.85297)	Top-1 acc 44.922 (47.285)	Top-5 acc 68.359 (71.075)	lr 0.02228
Train [26][2160/3239]	Time 0.592 (0.915)	Data Time 0.002 (0.013)	Loss 3.0826 (3.2070)	Entropy 0.84794 (0.85295)	Top-1 acc 53.125 (47.281)	Top-5 acc 75.391 (71.066)	lr 0.02228
Train [26][2170/3239]	Time 0.602 (0.915)	Data Time 0.002 (0.013)	Loss 3.1389 (3.2068)	Entropy 0.84795 (0.85293)	Top-1 acc 47.266 (47.281)	Top-5 acc 72.656 (71.068)	lr 0.02228
Train [26][2180/3239]	Time 0.658 (0.915)	Data Time 0.003 (0.013)	Loss 3.2200 (3.2068)	Entropy 0.84778 (0.85290)	Top-1 acc 42.188 (47.286)	Top-5 acc 73.047 (71.069)	lr 0.02228
Train [26][2190/3239]	Time 0.620 (0.915)	Data Time 0.001 (0.013)	Loss 3.2527 (3.2068)	Entropy 0.84764 (0.85288)	Top-1 acc 50.000 (47.290)	Top-5 acc 71.875 (71.067)	lr 0.02228
Train [26][2200/3239]	Time 0.660 (0.915)	Data Time 0.001 (0.013)	Loss 3.3002 (3.2068)	Entropy 0.84742 (0.85286)	Top-1 acc 45.703 (47.293)	Top-5 acc 67.969 (71.063)	lr 0.02228
Train [26][2210/3239]	Time 0.600 (0.914)	Data Time 0.001 (0.013)	Loss 3.1317 (3.2070)	Entropy 0.84747 (0.85283)	Top-1 acc 49.609 (47.287)	Top-5 acc 71.484 (71.055)	lr 0.02228
Train [26][2220/3239]	Time 0.726 (0.914)	Data Time 0.001 (0.013)	Loss 3.2537 (3.2070)	Entropy 0.84723 (0.85281)	Top-1 acc 45.312 (47.280)	Top-5 acc 71.094 (71.055)	lr 0.02228
Train [26][2230/3239]	Time 0.621 (0.914)	Data Time 0.001 (0.013)	Loss 3.4589 (3.2069)	Entropy 0.84679 (0.85278)	Top-1 acc 40.234 (47.281)	Top-5 acc 66.406 (71.057)	lr 0.02228
Train [26][2240/3239]	Time 0.648 (0.914)	Data Time 0.001 (0.013)	Loss 3.3120 (3.2073)	Entropy 0.84699 (0.85276)	Top-1 acc 49.609 (47.277)	Top-5 acc 67.969 (71.046)	lr 0.02228
Train [26][2250/3239]	Time 0.663 (0.914)	Data Time 0.001 (0.013)	Loss 3.2705 (3.2072)	Entropy 0.84659 (0.85273)	Top-1 acc 45.312 (47.280)	Top-5 acc 68.750 (71.048)	lr 0.02228
Train [26][2260/3239]	Time 0.605 (0.913)	Data Time 0.001 (0.013)	Loss 3.0236 (3.2071)	Entropy 0.84658 (0.85270)	Top-1 acc 50.391 (47.288)	Top-5 acc 75.391 (71.052)	lr 0.02228
Train [26][2270/3239]	Time 0.646 (0.913)	Data Time 0.001 (0.013)	Loss 3.4056 (3.2071)	Entropy 0.84652 (0.85268)	Top-1 acc 45.703 (47.289)	Top-5 acc 65.625 (71.051)	lr 0.02228
Train [26][2280/3239]	Time 0.602 (0.913)	Data Time 0.001 (0.013)	Loss 3.2167 (3.2072)	Entropy 0.84668 (0.85265)	Top-1 acc 46.094 (47.290)	Top-5 acc 67.969 (71.049)	lr 0.02228
Train [26][2290/3239]	Time 0.705 (0.913)	Data Time 0.001 (0.013)	Loss 3.2086 (3.2073)	Entropy 0.84678 (0.85262)	Top-1 acc 51.953 (47.292)	Top-5 acc 70.312 (71.047)	lr 0.02227
Train [26][2300/3239]	Time 0.561 (0.912)	Data Time 0.001 (0.013)	Loss 3.0530 (3.2074)	Entropy 0.84665 (0.85260)	Top-1 acc 48.047 (47.297)	Top-5 acc 72.656 (71.045)	lr 0.02227
Train [26][2310/3239]	Time 0.592 (0.912)	Data Time 0.001 (0.013)	Loss 3.2902 (3.2073)	Entropy 0.84671 (0.85257)	Top-1 acc 44.922 (47.293)	Top-5 acc 70.703 (71.048)	lr 0.02227
Train [26][2320/3239]	Time 0.654 (0.912)	Data Time 0.001 (0.013)	Loss 3.1037 (3.2071)	Entropy 0.84701 (0.85255)	Top-1 acc 53.516 (47.298)	Top-5 acc 72.266 (71.052)	lr 0.02227
Train [26][2330/3239]	Time 0.588 (0.912)	Data Time 0.001 (0.012)	Loss 3.1644 (3.2073)	Entropy 0.84730 (0.85252)	Top-1 acc 51.172 (47.292)	Top-5 acc 72.656 (71.048)	lr 0.02227
Train [26][2340/3239]	Time 0.623 (0.912)	Data Time 0.001 (0.012)	Loss 3.1355 (3.2073)	Entropy 0.84732 (0.85250)	Top-1 acc 47.656 (47.287)	Top-5 acc 73.047 (71.050)	lr 0.02227
Train [26][2350/3239]	Time 0.564 (0.911)	Data Time 0.001 (0.012)	Loss 3.1931 (3.2075)	Entropy 0.84683 (0.85248)	Top-1 acc 46.484 (47.284)	Top-5 acc 70.703 (71.046)	lr 0.02227
Train [26][2360/3239]	Time 0.579 (0.911)	Data Time 0.001 (0.012)	Loss 3.3439 (3.2076)	Entropy 0.84694 (0.85245)	Top-1 acc 44.531 (47.282)	Top-5 acc 64.844 (71.036)	lr 0.02227
Train [26][2370/3239]	Time 0.557 (0.911)	Data Time 0.001 (0.012)	Loss 3.2614 (3.2077)	Entropy 0.84682 (0.85243)	Top-1 acc 46.875 (47.283)	Top-5 acc 70.312 (71.037)	lr 0.02227
Train [26][2380/3239]	Time 0.619 (0.911)	Data Time 0.001 (0.012)	Loss 3.3455 (3.2077)	Entropy 0.84676 (0.85241)	Top-1 acc 42.578 (47.279)	Top-5 acc 69.922 (71.036)	lr 0.02227
Train [26][2390/3239]	Time 0.598 (0.910)	Data Time 0.001 (0.012)	Loss 3.2422 (3.2078)	Entropy 0.84639 (0.85238)	Top-1 acc 48.828 (47.280)	Top-5 acc 72.656 (71.036)	lr 0.02227
Train [26][2400/3239]	Time 0.597 (0.910)	Data Time 0.001 (0.012)	Loss 3.0669 (3.2079)	Entropy 0.84631 (0.85236)	Top-1 acc 50.391 (47.270)	Top-5 acc 71.094 (71.031)	lr 0.02227
Train [26][2410/3239]	Time 0.608 (0.910)	Data Time 0.001 (0.012)	Loss 3.0508 (3.2074)	Entropy 0.84603 (0.85233)	Top-1 acc 53.516 (47.282)	Top-5 acc 75.781 (71.040)	lr 0.02227
Train [26][2420/3239]	Time 0.611 (0.910)	Data Time 0.001 (0.012)	Loss 3.2430 (3.2077)	Entropy 0.84625 (0.85231)	Top-1 acc 42.188 (47.274)	Top-5 acc 69.531 (71.041)	lr 0.02227
Train [26][2430/3239]	Time 0.628 (0.910)	Data Time 0.001 (0.012)	Loss 3.1641 (3.2077)	Entropy 0.84617 (0.85228)	Top-1 acc 44.922 (47.272)	Top-5 acc 75.781 (71.038)	lr 0.02227
Train [26][2440/3239]	Time 0.605 (0.910)	Data Time 0.001 (0.012)	Loss 3.1048 (3.2078)	Entropy 0.84613 (0.85226)	Top-1 acc 51.172 (47.273)	Top-5 acc 74.609 (71.040)	lr 0.02226
Train [26][2450/3239]	Time 0.700 (0.909)	Data Time 0.002 (0.012)	Loss 3.3057 (3.2079)	Entropy 0.84599 (0.85223)	Top-1 acc 44.141 (47.272)	Top-5 acc 67.969 (71.037)	lr 0.02226
Train [26][2460/3239]	Time 0.456 (0.909)	Data Time 0.001 (0.012)	Loss 3.1262 (3.2077)	Entropy 0.84596 (0.85221)	Top-1 acc 52.344 (47.275)	Top-5 acc 72.266 (71.042)	lr 0.02226
Train [26][2470/3239]	Time 0.638 (0.909)	Data Time 0.001 (0.012)	Loss 3.0600 (3.2077)	Entropy 0.84590 (0.85218)	Top-1 acc 51.172 (47.275)	Top-5 acc 75.391 (71.044)	lr 0.02226
Train [26][2480/3239]	Time 0.565 (0.909)	Data Time 0.001 (0.012)	Loss 3.2074 (3.2079)	Entropy 0.84598 (0.85216)	Top-1 acc 47.656 (47.275)	Top-5 acc 71.094 (71.036)	lr 0.02226
Train [26][2490/3239]	Time 0.633 (0.908)	Data Time 0.001 (0.012)	Loss 3.2935 (3.2079)	Entropy 0.84560 (0.85213)	Top-1 acc 49.609 (47.276)	Top-5 acc 70.703 (71.034)	lr 0.02226
Train [26][2500/3239]	Time 0.567 (0.908)	Data Time 0.001 (0.012)	Loss 3.2973 (3.2079)	Entropy 0.84520 (0.85210)	Top-1 acc 46.094 (47.277)	Top-5 acc 69.531 (71.034)	lr 0.02226
Train [26][2510/3239]	Time 0.659 (0.908)	Data Time 0.001 (0.012)	Loss 2.9448 (3.2076)	Entropy 0.84555 (0.85208)	Top-1 acc 50.391 (47.284)	Top-5 acc 77.344 (71.039)	lr 0.02226
Train [26][2520/3239]	Time 0.734 (0.908)	Data Time 0.001 (0.012)	Loss 3.0786 (3.2078)	Entropy 0.84564 (0.85205)	Top-1 acc 48.828 (47.278)	Top-5 acc 73.828 (71.035)	lr 0.02226
Train [26][2530/3239]	Time 0.631 (0.908)	Data Time 0.001 (0.012)	Loss 3.1778 (3.2078)	Entropy 0.84567 (0.85203)	Top-1 acc 44.922 (47.276)	Top-5 acc 72.266 (71.034)	lr 0.02226
Train [26][2540/3239]	Time 0.584 (0.907)	Data Time 0.001 (0.012)	Loss 3.1647 (3.2078)	Entropy 0.84569 (0.85200)	Top-1 acc 46.094 (47.278)	Top-5 acc 71.875 (71.032)	lr 0.02226
Train [26][2550/3239]	Time 0.584 (0.907)	Data Time 0.001 (0.012)	Loss 3.4439 (3.2080)	Entropy 0.84579 (0.85198)	Top-1 acc 44.141 (47.275)	Top-5 acc 63.281 (71.027)	lr 0.02226
Train [26][2560/3239]	Time 0.583 (0.907)	Data Time 0.001 (0.012)	Loss 3.3389 (3.2077)	Entropy 0.84554 (0.85195)	Top-1 acc 44.531 (47.283)	Top-5 acc 69.531 (71.035)	lr 0.02226
Train [26][2570/3239]	Time 0.558 (0.907)	Data Time 0.001 (0.011)	Loss 3.0790 (3.2074)	Entropy 0.84518 (0.85193)	Top-1 acc 52.734 (47.289)	Top-5 acc 72.656 (71.043)	lr 0.02226
Train [26][2580/3239]	Time 0.574 (0.907)	Data Time 0.001 (0.011)	Loss 3.3071 (3.2075)	Entropy 0.84515 (0.85190)	Top-1 acc 47.656 (47.286)	Top-5 acc 69.922 (71.041)	lr 0.02226
Train [26][2590/3239]	Time 0.569 (0.906)	Data Time 0.001 (0.011)	Loss 2.9833 (3.2073)	Entropy 0.84531 (0.85187)	Top-1 acc 50.391 (47.292)	Top-5 acc 76.562 (71.044)	lr 0.02226
Train [26][2600/3239]	Time 0.608 (0.906)	Data Time 0.001 (0.011)	Loss 3.1139 (3.2073)	Entropy 0.84543 (0.85185)	Top-1 acc 51.172 (47.296)	Top-5 acc 71.875 (71.045)	lr 0.02225
Train [26][2610/3239]	Time 0.685 (0.906)	Data Time 0.001 (0.011)	Loss 3.0564 (3.2070)	Entropy 0.84535 (0.85183)	Top-1 acc 50.000 (47.304)	Top-5 acc 76.953 (71.052)	lr 0.02225
Train [26][2620/3239]	Time 0.605 (0.906)	Data Time 0.001 (0.011)	Loss 3.3417 (3.2073)	Entropy 0.84517 (0.85180)	Top-1 acc 50.000 (47.306)	Top-5 acc 67.969 (71.047)	lr 0.02225
Train [26][2630/3239]	Time 0.643 (0.906)	Data Time 0.001 (0.011)	Loss 3.2806 (3.2074)	Entropy 0.84505 (0.85177)	Top-1 acc 50.000 (47.305)	Top-5 acc 66.797 (71.043)	lr 0.02225
Train [26][2640/3239]	Time 0.629 (0.906)	Data Time 0.003 (0.011)	Loss 2.9644 (3.2070)	Entropy 0.84481 (0.85175)	Top-1 acc 52.344 (47.309)	Top-5 acc 76.562 (71.051)	lr 0.02225
Train [26][2650/3239]	Time 0.603 (0.905)	Data Time 0.001 (0.011)	Loss 3.3554 (3.2069)	Entropy 0.84472 (0.85172)	Top-1 acc 45.312 (47.312)	Top-5 acc 68.359 (71.051)	lr 0.02225
Train [26][2660/3239]	Time 0.477 (0.905)	Data Time 0.001 (0.011)	Loss 3.0804 (3.2068)	Entropy 0.84443 (0.85170)	Top-1 acc 53.516 (47.316)	Top-5 acc 71.875 (71.050)	lr 0.02225
Train [26][2670/3239]	Time 0.602 (0.905)	Data Time 0.001 (0.011)	Loss 3.2367 (3.2068)	Entropy 0.84476 (0.85167)	Top-1 acc 48.828 (47.320)	Top-5 acc 71.875 (71.049)	lr 0.02225
Train [26][2680/3239]	Time 0.708 (0.905)	Data Time 0.001 (0.011)	Loss 2.9023 (3.2069)	Entropy 0.84500 (0.85164)	Top-1 acc 53.516 (47.316)	Top-5 acc 78.906 (71.050)	lr 0.02225
Train [26][2690/3239]	Time 0.616 (0.905)	Data Time 0.001 (0.011)	Loss 2.9590 (3.2071)	Entropy 0.84513 (0.85162)	Top-1 acc 55.469 (47.310)	Top-5 acc 74.219 (71.042)	lr 0.02225
Train [26][2700/3239]	Time 0.589 (0.904)	Data Time 0.002 (0.011)	Loss 3.1506 (3.2070)	Entropy 0.84499 (0.85159)	Top-1 acc 49.609 (47.310)	Top-5 acc 71.875 (71.041)	lr 0.02225
Train [26][2710/3239]	Time 0.629 (0.904)	Data Time 0.001 (0.011)	Loss 3.1703 (3.2071)	Entropy 0.84496 (0.85157)	Top-1 acc 49.219 (47.311)	Top-5 acc 71.094 (71.038)	lr 0.02225
Train [26][2720/3239]	Time 0.603 (0.904)	Data Time 0.001 (0.011)	Loss 3.4291 (3.2071)	Entropy 0.84546 (0.85155)	Top-1 acc 42.578 (47.311)	Top-5 acc 69.922 (71.042)	lr 0.02225
Train [26][2730/3239]	Time 0.631 (0.904)	Data Time 0.001 (0.011)	Loss 3.0851 (3.2071)	Entropy 0.84564 (0.85152)	Top-1 acc 52.734 (47.314)	Top-5 acc 71.484 (71.043)	lr 0.02225
Train [26][2740/3239]	Time 0.584 (0.904)	Data Time 0.001 (0.011)	Loss 3.0780 (3.2070)	Entropy 0.84588 (0.85150)	Top-1 acc 46.094 (47.317)	Top-5 acc 74.219 (71.048)	lr 0.02225
Train [26][2750/3239]	Time 0.591 (0.904)	Data Time 0.001 (0.011)	Loss 3.4047 (3.2070)	Entropy 0.84604 (0.85148)	Top-1 acc 43.359 (47.316)	Top-5 acc 67.969 (71.046)	lr 0.02225
Train [26][2760/3239]	Time 0.593 (0.904)	Data Time 0.001 (0.011)	Loss 3.3498 (3.2071)	Entropy 0.84584 (0.85146)	Top-1 acc 47.266 (47.316)	Top-5 acc 69.922 (71.047)	lr 0.02224
Train [26][2770/3239]	Time 0.607 (0.903)	Data Time 0.001 (0.011)	Loss 3.0816 (3.2068)	Entropy 0.84594 (0.85144)	Top-1 acc 49.609 (47.321)	Top-5 acc 71.484 (71.052)	lr 0.02224
Train [26][2780/3239]	Time 0.639 (0.903)	Data Time 0.001 (0.011)	Loss 3.3447 (3.2067)	Entropy 0.84562 (0.85142)	Top-1 acc 43.359 (47.324)	Top-5 acc 67.578 (71.053)	lr 0.02224
Train [26][2790/3239]	Time 0.676 (0.903)	Data Time 0.002 (0.011)	Loss 3.1594 (3.2067)	Entropy 0.84527 (0.85140)	Top-1 acc 46.875 (47.323)	Top-5 acc 69.531 (71.054)	lr 0.02224
Train [26][2800/3239]	Time 0.633 (0.903)	Data Time 0.002 (0.011)	Loss 3.0591 (3.2069)	Entropy 0.84511 (0.85138)	Top-1 acc 53.906 (47.321)	Top-5 acc 77.734 (71.053)	lr 0.02224
Train [26][2810/3239]	Time 0.776 (0.911)	Data Time 0.005 (0.011)	Loss 3.2712 (3.2068)	Entropy 0.84486 (0.85136)	Top-1 acc 47.266 (47.321)	Top-5 acc 66.797 (71.054)	lr 0.02224
Train [26][2820/3239]	Time 0.565 (0.911)	Data Time 0.002 (0.011)	Loss 3.2328 (3.2067)	Entropy 0.84471 (0.85133)	Top-1 acc 47.266 (47.323)	Top-5 acc 71.094 (71.054)	lr 0.02224
Train [26][2830/3239]	Time 0.599 (0.911)	Data Time 0.001 (0.011)	Loss 3.1263 (3.2067)	Entropy 0.84474 (0.85131)	Top-1 acc 48.047 (47.325)	Top-5 acc 68.359 (71.054)	lr 0.02224
Train [26][2840/3239]	Time 0.681 (0.911)	Data Time 0.001 (0.011)	Loss 3.2395 (3.2065)	Entropy 0.84466 (0.85129)	Top-1 acc 48.047 (47.329)	Top-5 acc 70.312 (71.057)	lr 0.02224
Train [26][2850/3239]	Time 0.590 (0.911)	Data Time 0.002 (0.011)	Loss 3.4303 (3.2066)	Entropy 0.84453 (0.85126)	Top-1 acc 42.188 (47.327)	Top-5 acc 65.625 (71.055)	lr 0.02224
Train [26][2860/3239]	Time 0.627 (0.910)	Data Time 0.002 (0.011)	Loss 3.0909 (3.2065)	Entropy 0.84464 (0.85124)	Top-1 acc 50.781 (47.332)	Top-5 acc 71.875 (71.058)	lr 0.02224
Train [26][2870/3239]	Time 0.613 (0.910)	Data Time 0.002 (0.010)	Loss 3.0217 (3.2065)	Entropy 0.84464 (0.85122)	Top-1 acc 48.828 (47.328)	Top-5 acc 74.609 (71.060)	lr 0.02224
Train [26][2880/3239]	Time 0.607 (0.910)	Data Time 0.001 (0.010)	Loss 3.1050 (3.2064)	Entropy 0.84460 (0.85119)	Top-1 acc 49.609 (47.333)	Top-5 acc 71.484 (71.061)	lr 0.02224
Train [26][2890/3239]	Time 0.577 (0.910)	Data Time 0.001 (0.010)	Loss 3.0944 (3.2064)	Entropy 0.84423 (0.85117)	Top-1 acc 46.484 (47.332)	Top-5 acc 70.703 (71.062)	lr 0.02224
Train [26][2900/3239]	Time 0.592 (0.910)	Data Time 0.001 (0.010)	Loss 3.1648 (3.2062)	Entropy 0.84419 (0.85115)	Top-1 acc 48.438 (47.338)	Top-5 acc 71.484 (71.062)	lr 0.02224
Train [26][2910/3239]	Time 0.614 (0.910)	Data Time 0.001 (0.010)	Loss 3.2725 (3.2063)	Entropy 0.84388 (0.85112)	Top-1 acc 44.922 (47.337)	Top-5 acc 68.359 (71.058)	lr 0.02224
Train [26][2920/3239]	Time 0.653 (0.910)	Data Time 0.001 (0.010)	Loss 3.0718 (3.2062)	Entropy 0.84351 (0.85110)	Top-1 acc 51.172 (47.341)	Top-5 acc 72.266 (71.061)	lr 0.02223
Train [26][2930/3239]	Time 0.480 (0.909)	Data Time 0.001 (0.010)	Loss 3.2676 (3.2062)	Entropy 0.84361 (0.85107)	Top-1 acc 46.875 (47.337)	Top-5 acc 71.094 (71.063)	lr 0.02223
Train [26][2940/3239]	Time 0.628 (0.909)	Data Time 0.001 (0.010)	Loss 3.1187 (3.2063)	Entropy 0.84351 (0.85105)	Top-1 acc 51.172 (47.334)	Top-5 acc 74.219 (71.061)	lr 0.02223
Train [26][2950/3239]	Time 0.573 (0.909)	Data Time 0.001 (0.010)	Loss 3.1162 (3.2062)	Entropy 0.84396 (0.85102)	Top-1 acc 47.656 (47.337)	Top-5 acc 72.656 (71.062)	lr 0.02223
Train [26][2960/3239]	Time 0.618 (0.909)	Data Time 0.001 (0.010)	Loss 3.3036 (3.2062)	Entropy 0.84370 (0.85100)	Top-1 acc 44.531 (47.340)	Top-5 acc 65.234 (71.063)	lr 0.02223
Train [26][2970/3239]	Time 0.654 (0.908)	Data Time 0.001 (0.010)	Loss 3.2419 (3.2063)	Entropy 0.84362 (0.85097)	Top-1 acc 47.266 (47.336)	Top-5 acc 69.922 (71.062)	lr 0.02223
Train [26][2980/3239]	Time 0.609 (0.908)	Data Time 0.001 (0.010)	Loss 3.1420 (3.2062)	Entropy 0.84376 (0.85095)	Top-1 acc 49.609 (47.338)	Top-5 acc 72.266 (71.061)	lr 0.02223
Train [26][2990/3239]	Time 0.588 (0.908)	Data Time 0.001 (0.010)	Loss 3.4816 (3.2065)	Entropy 0.84361 (0.85092)	Top-1 acc 43.359 (47.336)	Top-5 acc 64.844 (71.056)	lr 0.02223
Train [26][3000/3239]	Time 0.699 (0.908)	Data Time 0.001 (0.010)	Loss 3.2135 (3.2068)	Entropy 0.84331 (0.85090)	Top-1 acc 44.141 (47.326)	Top-5 acc 71.094 (71.049)	lr 0.02223
Train [26][3010/3239]	Time 0.658 (0.908)	Data Time 0.002 (0.010)	Loss 3.0912 (3.2067)	Entropy 0.84326 (0.85088)	Top-1 acc 49.219 (47.328)	Top-5 acc 75.000 (71.053)	lr 0.02223
Train [26][3020/3239]	Time 0.568 (0.908)	Data Time 0.001 (0.010)	Loss 3.0569 (3.2066)	Entropy 0.84284 (0.85085)	Top-1 acc 52.344 (47.328)	Top-5 acc 74.219 (71.053)	lr 0.02223
Train [26][3030/3239]	Time 0.615 (0.908)	Data Time 0.001 (0.010)	Loss 3.2989 (3.2066)	Entropy 0.84243 (0.85082)	Top-1 acc 42.969 (47.326)	Top-5 acc 67.969 (71.050)	lr 0.02223
Train [26][3040/3239]	Time 0.594 (0.907)	Data Time 0.001 (0.010)	Loss 3.0797 (3.2065)	Entropy 0.84272 (0.85080)	Top-1 acc 51.172 (47.332)	Top-5 acc 75.000 (71.052)	lr 0.02223
Train [26][3050/3239]	Time 0.619 (0.907)	Data Time 0.001 (0.010)	Loss 3.1674 (3.2064)	Entropy 0.84302 (0.85077)	Top-1 acc 49.219 (47.333)	Top-5 acc 71.094 (71.054)	lr 0.02223
Train [26][3060/3239]	Time 0.608 (0.907)	Data Time 0.002 (0.010)	Loss 3.3762 (3.2062)	Entropy 0.84343 (0.85074)	Top-1 acc 42.578 (47.335)	Top-5 acc 69.531 (71.060)	lr 0.02223
Train [26][3070/3239]	Time 0.681 (0.907)	Data Time 0.001 (0.010)	Loss 3.1396 (3.2060)	Entropy 0.84346 (0.85072)	Top-1 acc 48.047 (47.337)	Top-5 acc 72.266 (71.068)	lr 0.02223
Train [26][3080/3239]	Time 0.578 (0.907)	Data Time 0.001 (0.010)	Loss 3.2669 (3.2059)	Entropy 0.84320 (0.85070)	Top-1 acc 42.578 (47.339)	Top-5 acc 69.922 (71.070)	lr 0.02222
Train [26][3090/3239]	Time 0.608 (0.907)	Data Time 0.001 (0.010)	Loss 3.3430 (3.2059)	Entropy 0.84339 (0.85067)	Top-1 acc 43.750 (47.342)	Top-5 acc 67.578 (71.067)	lr 0.02222
Train [26][3100/3239]	Time 0.569 (0.907)	Data Time 0.001 (0.010)	Loss 3.1964 (3.2058)	Entropy 0.84310 (0.85065)	Top-1 acc 44.531 (47.346)	Top-5 acc 71.484 (71.070)	lr 0.02222
Train [26][3110/3239]	Time 0.587 (0.906)	Data Time 0.001 (0.010)	Loss 3.2413 (3.2057)	Entropy 0.84269 (0.85062)	Top-1 acc 47.266 (47.351)	Top-5 acc 69.141 (71.074)	lr 0.02222
Train [26][3120/3239]	Time 0.639 (0.906)	Data Time 0.003 (0.010)	Loss 3.3652 (3.2057)	Entropy 0.84309 (0.85060)	Top-1 acc 44.922 (47.349)	Top-5 acc 68.359 (71.071)	lr 0.02222
Train [26][3130/3239]	Time 0.660 (0.906)	Data Time 0.002 (0.010)	Loss 3.1033 (3.2057)	Entropy 0.84360 (0.85058)	Top-1 acc 50.781 (47.350)	Top-5 acc 70.703 (71.072)	lr 0.02222
Train [26][3140/3239]	Time 0.575 (0.906)	Data Time 0.001 (0.010)	Loss 3.2477 (3.2056)	Entropy 0.84278 (0.85055)	Top-1 acc 44.531 (47.348)	Top-5 acc 73.047 (71.074)	lr 0.02222
Train [26][3150/3239]	Time 0.622 (0.906)	Data Time 0.001 (0.010)	Loss 3.3525 (3.2056)	Entropy 0.84294 (0.85053)	Top-1 acc 46.094 (47.346)	Top-5 acc 66.797 (71.071)	lr 0.02222
Train [26][3160/3239]	Time 0.701 (0.906)	Data Time 0.001 (0.010)	Loss 3.1993 (3.2058)	Entropy 0.84290 (0.85050)	Top-1 acc 43.750 (47.345)	Top-5 acc 72.266 (71.068)	lr 0.02222
Train [26][3170/3239]	Time 0.596 (0.905)	Data Time 0.001 (0.010)	Loss 2.9131 (3.2060)	Entropy 0.84295 (0.85048)	Top-1 acc 50.781 (47.337)	Top-5 acc 77.734 (71.064)	lr 0.02222
Train [26][3180/3239]	Time 0.601 (0.905)	Data Time 0.000 (0.010)	Loss 2.9431 (3.2058)	Entropy 0.84315 (0.85046)	Top-1 acc 55.078 (47.340)	Top-5 acc 76.953 (71.070)	lr 0.02222
Train [26][3190/3239]	Time 0.609 (0.905)	Data Time 0.000 (0.010)	Loss 3.4003 (3.2059)	Entropy 0.84289 (0.85043)	Top-1 acc 42.969 (47.337)	Top-5 acc 67.578 (71.066)	lr 0.02222
Train [26][3200/3239]	Time 0.624 (0.905)	Data Time 0.000 (0.010)	Loss 3.3418 (3.2059)	Entropy 0.84278 (0.85041)	Top-1 acc 43.750 (47.338)	Top-5 acc 69.922 (71.070)	lr 0.02222
Train [26][3210/3239]	Time 0.578 (0.905)	Data Time 0.000 (0.010)	Loss 3.2911 (3.2060)	Entropy 0.84284 (0.85039)	Top-1 acc 46.094 (47.335)	Top-5 acc 73.438 (71.069)	lr 0.02222
Train [26][3220/3239]	Time 0.630 (0.905)	Data Time 0.000 (0.010)	Loss 3.3221 (3.2059)	Entropy 0.84321 (0.85036)	Top-1 acc 45.312 (47.336)	Top-5 acc 70.312 (71.072)	lr 0.02222
Train [26][3230/3239]	Time 0.703 (0.904)	Data Time 0.000 (0.010)	Loss 3.1605 (3.2059)	Entropy 0.84307 (0.85034)	Top-1 acc 47.656 (47.336)	Top-5 acc 73.047 (71.071)	lr 0.02221
Train [26][3239/3239]	Time 1.592 (0.904)	Data Time 0.000 (0.010)	Loss 3.0677 (3.2059)	Entropy 0.84315 (0.85032)	Top-1 acc 49.383 (47.336)	Top-5 acc 71.605 (71.073)	lr 0.02221
==========Valid [26/120]	loss 1.915	top-1 acc 57.160 (57.160)	top-5 acc 80.000	Train top-1 47.336	top-5 71.073	Entropy 0.84315	Latency-None: 0.000ms	Flops: 539.76M
Train [27][0/3239]	Time 23.028 (23.028)	Data Time 21.121 (21.121)	Loss 2.9878 (2.9878)	Entropy 0.84292 (0.84292)	Top-1 acc 50.000 (50.000)	Top-5 acc 75.000 (75.000)	lr 0.02221
Train [27][10/3239]	Time 0.621 (2.971)	Data Time 0.001 (1.923)	Loss 3.1613 (3.1449)	Entropy 0.84259 (0.84262)	Top-1 acc 49.219 (48.722)	Top-5 acc 69.531 (71.839)	lr 0.02221
Train [27][20/3239]	Time 0.600 (1.969)	Data Time 0.001 (1.008)	Loss 3.3005 (3.1672)	Entropy 0.84278 (0.84262)	Top-1 acc 43.750 (48.196)	Top-5 acc 69.531 (71.968)	lr 0.02221
Train [27][30/3239]	Time 0.598 (1.607)	Data Time 0.001 (0.683)	Loss 3.1032 (3.1838)	Entropy 0.84307 (0.84270)	Top-1 acc 51.172 (48.248)	Top-5 acc 71.484 (71.497)	lr 0.02221
Train [27][40/3239]	Time 0.630 (1.428)	Data Time 0.001 (0.517)	Loss 3.2041 (3.1880)	Entropy 0.84313 (0.84279)	Top-1 acc 50.391 (48.009)	Top-5 acc 70.312 (71.322)	lr 0.02221
Train [27][50/3239]	Time 0.586 (1.316)	Data Time 0.001 (0.416)	Loss 3.0221 (3.1998)	Entropy 0.84271 (0.84284)	Top-1 acc 50.391 (47.679)	Top-5 acc 75.781 (71.147)	lr 0.02221
Train [27][60/3239]	Time 0.702 (1.241)	Data Time 0.001 (0.348)	Loss 3.0386 (3.1892)	Entropy 0.84233 (0.84279)	Top-1 acc 48.047 (47.772)	Top-5 acc 76.172 (71.420)	lr 0.02221
Train [27][70/3239]	Time 0.616 (1.185)	Data Time 0.001 (0.299)	Loss 3.1168 (3.1911)	Entropy 0.84210 (0.84271)	Top-1 acc 50.781 (47.695)	Top-5 acc 71.875 (71.380)	lr 0.02221
Train [27][80/3239]	Time 0.570 (1.141)	Data Time 0.001 (0.263)	Loss 3.2228 (3.1897)	Entropy 0.84236 (0.84265)	Top-1 acc 47.266 (47.815)	Top-5 acc 68.359 (71.388)	lr 0.02221
Train [27][90/3239]	Time 0.598 (1.109)	Data Time 0.001 (0.234)	Loss 3.3606 (3.1877)	Entropy 0.84206 (0.84261)	Top-1 acc 48.828 (47.991)	Top-5 acc 70.312 (71.441)	lr 0.02221
Train [27][100/3239]	Time 0.620 (1.084)	Data Time 0.001 (0.211)	Loss 3.1226 (3.1836)	Entropy 0.84152 (0.84253)	Top-1 acc 50.391 (48.028)	Top-5 acc 71.875 (71.539)	lr 0.02221
Train [27][110/3239]	Time 0.603 (1.064)	Data Time 0.001 (0.192)	Loss 3.0275 (3.1797)	Entropy 0.84164 (0.84244)	Top-1 acc 49.609 (48.128)	Top-5 acc 75.391 (71.650)	lr 0.02221
Train [27][120/3239]	Time 0.617 (1.047)	Data Time 0.001 (0.177)	Loss 2.9554 (3.1759)	Entropy 0.84131 (0.84237)	Top-1 acc 51.953 (48.170)	Top-5 acc 76.172 (71.710)	lr 0.02221
Train [27][130/3239]	Time 0.711 (1.032)	Data Time 0.001 (0.163)	Loss 3.0743 (3.1753)	Entropy 0.84161 (0.84229)	Top-1 acc 53.125 (48.169)	Top-5 acc 70.703 (71.672)	lr 0.02221
Train [27][140/3239]	Time 0.658 (1.021)	Data Time 0.001 (0.152)	Loss 3.1324 (3.1723)	Entropy 0.84137 (0.84224)	Top-1 acc 52.734 (48.246)	Top-5 acc 71.875 (71.698)	lr 0.02221
Train [27][150/3239]	Time 0.623 (1.009)	Data Time 0.001 (0.142)	Loss 3.3805 (3.1762)	Entropy 0.84101 (0.84218)	Top-1 acc 45.703 (48.223)	Top-5 acc 67.188 (71.621)	lr 0.02220
Train [27][160/3239]	Time 0.609 (1.001)	Data Time 0.001 (0.133)	Loss 3.4654 (3.1736)	Entropy 0.84119 (0.84211)	Top-1 acc 44.531 (48.321)	Top-5 acc 65.234 (71.693)	lr 0.02220
Train [27][170/3239]	Time 0.584 (0.992)	Data Time 0.001 (0.125)	Loss 2.9879 (3.1728)	Entropy 0.84155 (0.84206)	Top-1 acc 54.688 (48.364)	Top-5 acc 76.953 (71.745)	lr 0.02220
Train [27][180/3239]	Time 0.615 (0.986)	Data Time 0.001 (0.119)	Loss 3.1544 (3.1747)	Entropy 0.84133 (0.84202)	Top-1 acc 50.781 (48.362)	Top-5 acc 70.312 (71.702)	lr 0.02220
Train [27][190/3239]	Time 0.620 (0.979)	Data Time 0.001 (0.113)	Loss 3.4207 (3.1789)	Entropy 0.84141 (0.84199)	Top-1 acc 46.875 (48.237)	Top-5 acc 64.453 (71.580)	lr 0.02220
Train [27][200/3239]	Time 0.595 (0.974)	Data Time 0.001 (0.107)	Loss 3.2222 (3.1795)	Entropy 0.84153 (0.84197)	Top-1 acc 43.750 (48.224)	Top-5 acc 71.875 (71.560)	lr 0.02220
Train [27][210/3239]	Time 0.609 (0.968)	Data Time 0.001 (0.102)	Loss 3.2655 (3.1799)	Entropy 0.84178 (0.84195)	Top-1 acc 47.266 (48.195)	Top-5 acc 71.094 (71.573)	lr 0.02220
Train [27][220/3239]	Time 0.719 (0.964)	Data Time 0.001 (0.098)	Loss 3.0759 (3.1767)	Entropy 0.84184 (0.84195)	Top-1 acc 50.000 (48.194)	Top-5 acc 74.219 (71.643)	lr 0.02220
Train [27][230/3239]	Time 0.569 (1.072)	Data Time 0.002 (0.093)	Loss 2.9580 (3.1762)	Entropy 0.84196 (0.84194)	Top-1 acc 50.000 (48.191)	Top-5 acc 75.000 (71.648)	lr 0.02220
Train [27][240/3239]	Time 0.607 (1.063)	Data Time 0.002 (0.090)	Loss 3.3856 (3.1777)	Entropy 0.84208 (0.84194)	Top-1 acc 45.312 (48.157)	Top-5 acc 69.922 (71.664)	lr 0.02220
Train [27][250/3239]	Time 0.591 (1.055)	Data Time 0.002 (0.086)	Loss 3.3381 (3.1789)	Entropy 0.84234 (0.84195)	Top-1 acc 41.797 (48.159)	Top-5 acc 69.922 (71.635)	lr 0.02220
Train [27][260/3239]	Time 0.584 (1.048)	Data Time 0.001 (0.083)	Loss 3.0425 (3.1776)	Entropy 0.84213 (0.84196)	Top-1 acc 51.172 (48.170)	Top-5 acc 74.219 (71.703)	lr 0.02220
Train [27][270/3239]	Time 0.574 (1.041)	Data Time 0.001 (0.080)	Loss 3.0318 (3.1776)	Entropy 0.84162 (0.84196)	Top-1 acc 50.391 (48.175)	Top-5 acc 75.391 (71.685)	lr 0.02220
Train [27][280/3239]	Time 0.603 (1.035)	Data Time 0.001 (0.077)	Loss 3.2033 (3.1790)	Entropy 0.84143 (0.84195)	Top-1 acc 46.875 (48.144)	Top-5 acc 70.312 (71.629)	lr 0.02220
Train [27][290/3239]	Time 0.704 (1.030)	Data Time 0.001 (0.075)	Loss 3.2083 (3.1799)	Entropy 0.84140 (0.84193)	Top-1 acc 47.266 (48.144)	Top-5 acc 72.266 (71.607)	lr 0.02220
Train [27][300/3239]	Time 0.592 (1.024)	Data Time 0.001 (0.072)	Loss 3.0050 (3.1773)	Entropy 0.84135 (0.84192)	Top-1 acc 49.609 (48.195)	Top-5 acc 75.391 (71.634)	lr 0.02220
Train [27][310/3239]	Time 0.625 (1.018)	Data Time 0.001 (0.070)	Loss 3.2092 (3.1771)	Entropy 0.84127 (0.84190)	Top-1 acc 48.438 (48.219)	Top-5 acc 70.703 (71.634)	lr 0.02219
Train [27][320/3239]	Time 0.608 (1.014)	Data Time 0.001 (0.068)	Loss 3.0638 (3.1786)	Entropy 0.84166 (0.84188)	Top-1 acc 49.609 (48.182)	Top-5 acc 74.219 (71.598)	lr 0.02219
Train [27][330/3239]	Time 0.603 (1.009)	Data Time 0.001 (0.066)	Loss 3.2085 (3.1775)	Entropy 0.84160 (0.84187)	Top-1 acc 50.391 (48.220)	Top-5 acc 71.094 (71.620)	lr 0.02219
Train [27][340/3239]	Time 0.547 (1.005)	Data Time 0.001 (0.064)	Loss 3.1116 (3.1744)	Entropy 0.84195 (0.84187)	Top-1 acc 48.047 (48.239)	Top-5 acc 73.438 (71.691)	lr 0.02219
Train [27][350/3239]	Time 0.610 (1.001)	Data Time 0.001 (0.062)	Loss 3.1225 (3.1735)	Entropy 0.84209 (0.84187)	Top-1 acc 48.047 (48.265)	Top-5 acc 71.094 (71.697)	lr 0.02219
Train [27][360/3239]	Time 0.619 (0.997)	Data Time 0.001 (0.060)	Loss 3.4198 (3.1761)	Entropy 0.84179 (0.84187)	Top-1 acc 41.797 (48.194)	Top-5 acc 63.672 (71.656)	lr 0.02219
Train [27][370/3239]	Time 0.592 (0.992)	Data Time 0.001 (0.059)	Loss 3.1142 (3.1784)	Entropy 0.84175 (0.84187)	Top-1 acc 49.219 (48.129)	Top-5 acc 74.609 (71.629)	lr 0.02219
Train [27][380/3239]	Time 0.704 (0.988)	Data Time 0.001 (0.057)	Loss 3.1055 (3.1799)	Entropy 0.84181 (0.84187)	Top-1 acc 47.656 (48.064)	Top-5 acc 71.484 (71.594)	lr 0.02219
Train [27][390/3239]	Time 0.580 (0.985)	Data Time 0.001 (0.056)	Loss 3.2925 (3.1805)	Entropy 0.84181 (0.84186)	Top-1 acc 46.094 (48.046)	Top-5 acc 67.969 (71.579)	lr 0.02219
Train [27][400/3239]	Time 0.575 (0.982)	Data Time 0.001 (0.055)	Loss 3.0775 (3.1822)	Entropy 0.84118 (0.84185)	Top-1 acc 52.344 (48.003)	Top-5 acc 72.656 (71.524)	lr 0.02219
Train [27][410/3239]	Time 0.614 (0.980)	Data Time 0.001 (0.053)	Loss 3.1138 (3.1823)	Entropy 0.84142 (0.84184)	Top-1 acc 47.266 (47.977)	Top-5 acc 72.656 (71.526)	lr 0.02219
Train [27][420/3239]	Time 0.603 (0.977)	Data Time 0.001 (0.052)	Loss 3.2386 (3.1838)	Entropy 0.84133 (0.84183)	Top-1 acc 45.312 (47.940)	Top-5 acc 72.656 (71.506)	lr 0.02219
Train [27][430/3239]	Time 0.583 (0.974)	Data Time 0.001 (0.051)	Loss 3.1312 (3.1857)	Entropy 0.84120 (0.84182)	Top-1 acc 48.828 (47.876)	Top-5 acc 72.266 (71.456)	lr 0.02219
Train [27][440/3239]	Time 0.614 (0.972)	Data Time 0.001 (0.050)	Loss 3.2157 (3.1854)	Entropy 0.84145 (0.84180)	Top-1 acc 46.094 (47.885)	Top-5 acc 70.703 (71.451)	lr 0.02219
Train [27][450/3239]	Time 0.706 (0.969)	Data Time 0.001 (0.049)	Loss 2.8147 (3.1856)	Entropy 0.84103 (0.84179)	Top-1 acc 58.203 (47.876)	Top-5 acc 76.172 (71.454)	lr 0.02219
Train [27][460/3239]	Time 0.614 (0.967)	Data Time 0.001 (0.048)	Loss 3.2303 (3.1855)	Entropy 0.84102 (0.84178)	Top-1 acc 48.047 (47.884)	Top-5 acc 69.531 (71.472)	lr 0.02219
Train [27][470/3239]	Time 0.579 (0.965)	Data Time 0.001 (0.047)	Loss 3.1946 (3.1852)	Entropy 0.84087 (0.84176)	Top-1 acc 46.094 (47.887)	Top-5 acc 69.141 (71.472)	lr 0.02218
Train [27][480/3239]	Time 0.618 (0.963)	Data Time 0.001 (0.046)	Loss 3.1923 (3.1826)	Entropy 0.84049 (0.84174)	Top-1 acc 48.438 (47.940)	Top-5 acc 71.094 (71.529)	lr 0.02218
Train [27][490/3239]	Time 0.602 (0.961)	Data Time 0.001 (0.045)	Loss 3.4286 (3.1830)	Entropy 0.84008 (0.84171)	Top-1 acc 41.406 (47.929)	Top-5 acc 66.406 (71.503)	lr 0.02218
Train [27][500/3239]	Time 0.616 (0.959)	Data Time 0.001 (0.044)	Loss 2.9859 (3.1824)	Entropy 0.84018 (0.84168)	Top-1 acc 54.688 (47.956)	Top-5 acc 73.438 (71.508)	lr 0.02218
Train [27][510/3239]	Time 0.618 (0.957)	Data Time 0.001 (0.043)	Loss 3.2436 (3.1828)	Entropy 0.83999 (0.84164)	Top-1 acc 47.266 (47.949)	Top-5 acc 70.703 (71.500)	lr 0.02218
Train [27][520/3239]	Time 0.601 (0.955)	Data Time 0.001 (0.043)	Loss 3.1602 (3.1823)	Entropy 0.84023 (0.84161)	Top-1 acc 47.266 (47.946)	Top-5 acc 73.828 (71.495)	lr 0.02218
Train [27][530/3239]	Time 0.611 (0.953)	Data Time 0.001 (0.042)	Loss 3.2510 (3.1822)	Entropy 0.84026 (0.84159)	Top-1 acc 46.484 (47.955)	Top-5 acc 71.094 (71.513)	lr 0.02218
Train [27][540/3239]	Time 0.645 (0.951)	Data Time 0.001 (0.041)	Loss 3.1863 (3.1819)	Entropy 0.84033 (0.84157)	Top-1 acc 46.094 (47.965)	Top-5 acc 71.484 (71.536)	lr 0.02218
Train [27][550/3239]	Time 0.454 (0.949)	Data Time 0.001 (0.040)	Loss 3.0761 (3.1823)	Entropy 0.84016 (0.84154)	Top-1 acc 47.266 (47.941)	Top-5 acc 76.953 (71.529)	lr 0.02218
Train [27][560/3239]	Time 0.641 (0.947)	Data Time 0.001 (0.040)	Loss 2.9704 (3.1811)	Entropy 0.83948 (0.84152)	Top-1 acc 51.172 (47.951)	Top-5 acc 77.344 (71.541)	lr 0.02218
Train [27][570/3239]	Time 0.592 (0.946)	Data Time 0.001 (0.039)	Loss 3.2815 (3.1798)	Entropy 0.83905 (0.84147)	Top-1 acc 50.000 (48.006)	Top-5 acc 71.484 (71.560)	lr 0.02218
Train [27][580/3239]	Time 0.618 (0.944)	Data Time 0.001 (0.038)	Loss 3.0278 (3.1795)	Entropy 0.83945 (0.84143)	Top-1 acc 48.828 (48.003)	Top-5 acc 77.344 (71.563)	lr 0.02218
Train [27][590/3239]	Time 0.616 (0.943)	Data Time 0.001 (0.038)	Loss 3.3402 (3.1794)	Entropy 0.83954 (0.84140)	Top-1 acc 44.141 (48.028)	Top-5 acc 66.797 (71.550)	lr 0.02218
Train [27][600/3239]	Time 0.643 (0.942)	Data Time 0.001 (0.037)	Loss 3.0402 (3.1786)	Entropy 0.83963 (0.84137)	Top-1 acc 48.828 (48.042)	Top-5 acc 74.219 (71.570)	lr 0.02218
Train [27][610/3239]	Time 0.683 (0.940)	Data Time 0.001 (0.037)	Loss 3.2476 (3.1787)	Entropy 0.83968 (0.84134)	Top-1 acc 49.609 (48.051)	Top-5 acc 72.656 (71.573)	lr 0.02218
Train [27][620/3239]	Time 0.639 (0.939)	Data Time 0.001 (0.036)	Loss 3.1158 (3.1787)	Entropy 0.83966 (0.84132)	Top-1 acc 50.781 (48.064)	Top-5 acc 72.266 (71.567)	lr 0.02217
Train [27][630/3239]	Time 0.595 (0.937)	Data Time 0.001 (0.035)	Loss 3.1858 (3.1791)	Entropy 0.83979 (0.84129)	Top-1 acc 48.047 (48.056)	Top-5 acc 71.484 (71.565)	lr 0.02217
Train [27][640/3239]	Time 0.630 (0.936)	Data Time 0.001 (0.035)	Loss 3.1868 (3.1793)	Entropy 0.83979 (0.84127)	Top-1 acc 48.438 (48.051)	Top-5 acc 71.094 (71.551)	lr 0.02217
Train [27][650/3239]	Time 0.623 (0.935)	Data Time 0.001 (0.034)	Loss 3.0182 (3.1793)	Entropy 0.83935 (0.84124)	Top-1 acc 54.688 (48.061)	Top-5 acc 75.391 (71.548)	lr 0.02217
Train [27][660/3239]	Time 0.617 (0.934)	Data Time 0.001 (0.034)	Loss 3.0358 (3.1797)	Entropy 0.83944 (0.84122)	Top-1 acc 48.438 (48.056)	Top-5 acc 71.875 (71.538)	lr 0.02217
Train [27][670/3239]	Time 0.665 (0.933)	Data Time 0.001 (0.033)	Loss 3.3823 (3.1799)	Entropy 0.83925 (0.84119)	Top-1 acc 42.188 (48.048)	Top-5 acc 67.969 (71.535)	lr 0.02217
Train [27][680/3239]	Time 0.620 (0.932)	Data Time 0.001 (0.033)	Loss 3.1251 (3.1803)	Entropy 0.83927 (0.84116)	Top-1 acc 49.219 (48.041)	Top-5 acc 71.094 (71.514)	lr 0.02217
Train [27][690/3239]	Time 0.614 (0.931)	Data Time 0.001 (0.033)	Loss 3.2389 (3.1811)	Entropy 0.83906 (0.84113)	Top-1 acc 47.656 (48.014)	Top-5 acc 71.094 (71.491)	lr 0.02217
Train [27][700/3239]	Time 0.619 (0.930)	Data Time 0.001 (0.032)	Loss 3.1414 (3.1817)	Entropy 0.83910 (0.84110)	Top-1 acc 50.781 (47.986)	Top-5 acc 73.438 (71.487)	lr 0.02217
Train [27][710/3239]	Time 0.588 (0.929)	Data Time 0.001 (0.032)	Loss 3.2275 (3.1816)	Entropy 0.83906 (0.84107)	Top-1 acc 48.047 (47.989)	Top-5 acc 69.141 (71.477)	lr 0.02217
Train [27][720/3239]	Time 0.594 (0.927)	Data Time 0.001 (0.031)	Loss 3.2058 (3.1816)	Entropy 0.83884 (0.84104)	Top-1 acc 48.047 (47.989)	Top-5 acc 70.312 (71.473)	lr 0.02217
Train [27][730/3239]	Time 0.594 (0.926)	Data Time 0.001 (0.031)	Loss 3.2087 (3.1820)	Entropy 0.83867 (0.84101)	Top-1 acc 48.828 (47.985)	Top-5 acc 72.656 (71.462)	lr 0.02217
Train [27][740/3239]	Time 0.644 (0.925)	Data Time 0.001 (0.030)	Loss 3.2646 (3.1822)	Entropy 0.83870 (0.84098)	Top-1 acc 47.266 (47.987)	Top-5 acc 68.359 (71.466)	lr 0.02217
Train [27][750/3239]	Time 0.631 (0.924)	Data Time 0.001 (0.030)	Loss 3.1161 (3.1820)	Entropy 0.83855 (0.84095)	Top-1 acc 51.172 (47.994)	Top-5 acc 73.438 (71.480)	lr 0.02217
Train [27][760/3239]	Time 0.598 (0.924)	Data Time 0.001 (0.030)	Loss 3.2735 (3.1829)	Entropy 0.83836 (0.84092)	Top-1 acc 46.484 (47.986)	Top-5 acc 67.969 (71.452)	lr 0.02217
Train [27][770/3239]	Time 0.695 (0.923)	Data Time 0.001 (0.029)	Loss 3.0579 (3.1820)	Entropy 0.83831 (0.84089)	Top-1 acc 50.000 (48.004)	Top-5 acc 73.828 (71.474)	lr 0.02217
Train [27][780/3239]	Time 0.598 (0.922)	Data Time 0.001 (0.029)	Loss 3.2114 (3.1821)	Entropy 0.83812 (0.84085)	Top-1 acc 45.703 (48.001)	Top-5 acc 74.219 (71.482)	lr 0.02216
Train [27][790/3239]	Time 0.595 (0.921)	Data Time 0.001 (0.029)	Loss 2.9990 (3.1818)	Entropy 0.83815 (0.84082)	Top-1 acc 51.953 (48.010)	Top-5 acc 76.562 (71.490)	lr 0.02216
Train [27][800/3239]	Time 0.565 (0.921)	Data Time 0.002 (0.028)	Loss 3.2784 (3.1827)	Entropy 0.83758 (0.84078)	Top-1 acc 45.703 (47.995)	Top-5 acc 69.922 (71.467)	lr 0.02216
Train [27][810/3239]	Time 0.624 (0.920)	Data Time 0.002 (0.028)	Loss 3.1574 (3.1825)	Entropy 0.83806 (0.84075)	Top-1 acc 46.094 (47.988)	Top-5 acc 71.875 (71.473)	lr 0.02216
Train [27][820/3239]	Time 0.607 (0.919)	Data Time 0.001 (0.028)	Loss 3.2335 (3.1833)	Entropy 0.83836 (0.84071)	Top-1 acc 46.484 (47.975)	Top-5 acc 71.875 (71.460)	lr 0.02216
Train [27][830/3239]	Time 0.595 (0.918)	Data Time 0.001 (0.027)	Loss 3.2523 (3.1827)	Entropy 0.83832 (0.84069)	Top-1 acc 48.438 (47.996)	Top-5 acc 69.141 (71.470)	lr 0.02216
Train [27][840/3239]	Time 0.686 (0.918)	Data Time 0.001 (0.027)	Loss 3.2073 (3.1825)	Entropy 0.83808 (0.84065)	Top-1 acc 44.141 (48.000)	Top-5 acc 72.656 (71.476)	lr 0.02216
Train [27][850/3239]	Time 0.642 (0.917)	Data Time 0.001 (0.027)	Loss 2.9893 (3.1826)	Entropy 0.83836 (0.84063)	Top-1 acc 50.781 (48.000)	Top-5 acc 76.953 (71.472)	lr 0.02216
Train [27][860/3239]	Time 0.591 (0.916)	Data Time 0.001 (0.026)	Loss 3.2305 (3.1826)	Entropy 0.83828 (0.84060)	Top-1 acc 47.266 (47.986)	Top-5 acc 73.047 (71.486)	lr 0.02216
Train [27][870/3239]	Time 0.641 (0.915)	Data Time 0.001 (0.026)	Loss 3.0025 (3.1817)	Entropy 0.83771 (0.84057)	Top-1 acc 51.953 (47.992)	Top-5 acc 76.172 (71.510)	lr 0.02216
Train [27][880/3239]	Time 0.777 (0.941)	Data Time 0.006 (0.026)	Loss 3.1741 (3.1824)	Entropy 0.83744 (0.84054)	Top-1 acc 51.172 (47.978)	Top-5 acc 71.875 (71.494)	lr 0.02216
Train [27][890/3239]	Time 0.614 (0.941)	Data Time 0.002 (0.026)	Loss 3.3914 (3.1826)	Entropy 0.83695 (0.84050)	Top-1 acc 42.578 (47.963)	Top-5 acc 67.969 (71.489)	lr 0.02216
Train [27][900/3239]	Time 0.610 (0.940)	Data Time 0.001 (0.025)	Loss 3.1593 (3.1823)	Entropy 0.83682 (0.84046)	Top-1 acc 48.438 (47.968)	Top-5 acc 72.656 (71.497)	lr 0.02216
Train [27][910/3239]	Time 0.602 (0.939)	Data Time 0.002 (0.025)	Loss 3.2868 (3.1829)	Entropy 0.83674 (0.84042)	Top-1 acc 46.094 (47.957)	Top-5 acc 66.797 (71.471)	lr 0.02216
Train [27][920/3239]	Time 0.638 (0.938)	Data Time 0.001 (0.025)	Loss 3.1838 (3.1826)	Entropy 0.83619 (0.84038)	Top-1 acc 46.484 (47.955)	Top-5 acc 68.750 (71.476)	lr 0.02216
Train [27][930/3239]	Time 0.696 (0.937)	Data Time 0.001 (0.025)	Loss 3.2151 (3.1822)	Entropy 0.83630 (0.84034)	Top-1 acc 48.047 (47.950)	Top-5 acc 70.312 (71.494)	lr 0.02215
Train [27][940/3239]	Time 0.618 (0.937)	Data Time 0.001 (0.024)	Loss 3.0596 (3.1828)	Entropy 0.83646 (0.84029)	Top-1 acc 53.125 (47.931)	Top-5 acc 73.047 (71.477)	lr 0.02215
Train [27][950/3239]	Time 0.583 (0.936)	Data Time 0.001 (0.024)	Loss 3.2805 (3.1826)	Entropy 0.83613 (0.84025)	Top-1 acc 45.312 (47.935)	Top-5 acc 68.750 (71.485)	lr 0.02215
Train [27][960/3239]	Time 0.644 (0.935)	Data Time 0.001 (0.024)	Loss 3.2615 (3.1828)	Entropy 0.83642 (0.84021)	Top-1 acc 46.875 (47.926)	Top-5 acc 67.578 (71.487)	lr 0.02215
Train [27][970/3239]	Time 0.604 (0.934)	Data Time 0.001 (0.024)	Loss 3.2431 (3.1828)	Entropy 0.83605 (0.84017)	Top-1 acc 46.484 (47.924)	Top-5 acc 71.094 (71.484)	lr 0.02215
Train [27][980/3239]	Time 0.623 (0.934)	Data Time 0.001 (0.023)	Loss 3.0110 (3.1831)	Entropy 0.83600 (0.84013)	Top-1 acc 55.859 (47.910)	Top-5 acc 78.125 (71.487)	lr 0.02215
Train [27][990/3239]	Time 0.638 (0.933)	Data Time 0.001 (0.023)	Loss 3.2422 (3.1829)	Entropy 0.83533 (0.84008)	Top-1 acc 48.828 (47.907)	Top-5 acc 70.703 (71.499)	lr 0.02215
Train [27][1000/3239]	Time 0.657 (0.932)	Data Time 0.001 (0.023)	Loss 3.1967 (3.1830)	Entropy 0.83544 (0.84004)	Top-1 acc 44.141 (47.890)	Top-5 acc 71.875 (71.507)	lr 0.02215
Train [27][1010/3239]	Time 0.603 (0.931)	Data Time 0.002 (0.023)	Loss 3.3116 (3.1828)	Entropy 0.83541 (0.83999)	Top-1 acc 43.750 (47.901)	Top-5 acc 68.750 (71.508)	lr 0.02215
Train [27][1020/3239]	Time 0.624 (0.931)	Data Time 0.001 (0.023)	Loss 3.2945 (3.1824)	Entropy 0.83501 (0.83994)	Top-1 acc 43.359 (47.910)	Top-5 acc 69.531 (71.517)	lr 0.02215
Train [27][1030/3239]	Time 0.630 (0.930)	Data Time 0.001 (0.022)	Loss 3.2513 (3.1827)	Entropy 0.83470 (0.83990)	Top-1 acc 44.141 (47.897)	Top-5 acc 71.484 (71.509)	lr 0.02215
Train [27][1040/3239]	Time 0.591 (0.929)	Data Time 0.002 (0.022)	Loss 3.2377 (3.1826)	Entropy 0.83490 (0.83985)	Top-1 acc 51.953 (47.901)	Top-5 acc 71.484 (71.512)	lr 0.02215
Train [27][1050/3239]	Time 0.566 (0.929)	Data Time 0.001 (0.022)	Loss 3.5183 (3.1827)	Entropy 0.83467 (0.83980)	Top-1 acc 42.188 (47.902)	Top-5 acc 69.141 (71.516)	lr 0.02215
Train [27][1060/3239]	Time 0.614 (0.928)	Data Time 0.001 (0.022)	Loss 3.2569 (3.1831)	Entropy 0.83478 (0.83975)	Top-1 acc 44.922 (47.892)	Top-5 acc 71.484 (71.503)	lr 0.02215
Train [27][1070/3239]	Time 0.583 (0.927)	Data Time 0.001 (0.022)	Loss 3.1562 (3.1829)	Entropy 0.83483 (0.83970)	Top-1 acc 48.828 (47.901)	Top-5 acc 73.828 (71.517)	lr 0.02215
Train [27][1080/3239]	Time 0.627 (0.927)	Data Time 0.001 (0.021)	Loss 3.4246 (3.1838)	Entropy 0.83478 (0.83966)	Top-1 acc 42.969 (47.871)	Top-5 acc 67.969 (71.506)	lr 0.02215
Train [27][1090/3239]	Time 0.667 (0.926)	Data Time 0.001 (0.021)	Loss 3.2899 (3.1848)	Entropy 0.83422 (0.83961)	Top-1 acc 45.703 (47.844)	Top-5 acc 68.359 (71.490)	lr 0.02214
Train [27][1100/3239]	Time 0.623 (0.925)	Data Time 0.001 (0.021)	Loss 3.3968 (3.1857)	Entropy 0.83386 (0.83956)	Top-1 acc 46.094 (47.816)	Top-5 acc 66.406 (71.471)	lr 0.02214
Train [27][1110/3239]	Time 0.622 (0.925)	Data Time 0.001 (0.021)	Loss 3.2840 (3.1849)	Entropy 0.83366 (0.83951)	Top-1 acc 50.000 (47.837)	Top-5 acc 68.750 (71.476)	lr 0.02214
Train [27][1120/3239]	Time 0.586 (0.925)	Data Time 0.001 (0.021)	Loss 3.1666 (3.1848)	Entropy 0.83353 (0.83946)	Top-1 acc 48.828 (47.837)	Top-5 acc 73.828 (71.479)	lr 0.02214
Train [27][1130/3239]	Time 0.594 (0.924)	Data Time 0.001 (0.021)	Loss 3.2247 (3.1848)	Entropy 0.83364 (0.83941)	Top-1 acc 44.922 (47.840)	Top-5 acc 71.875 (71.477)	lr 0.02214
Train [27][1140/3239]	Time 0.642 (0.923)	Data Time 0.001 (0.020)	Loss 3.0987 (3.1843)	Entropy 0.83352 (0.83936)	Top-1 acc 48.047 (47.847)	Top-5 acc 72.266 (71.485)	lr 0.02214
Train [27][1150/3239]	Time 0.570 (0.923)	Data Time 0.001 (0.020)	Loss 3.2825 (3.1842)	Entropy 0.83373 (0.83931)	Top-1 acc 50.000 (47.848)	Top-5 acc 69.531 (71.488)	lr 0.02214
Train [27][1160/3239]	Time 0.677 (0.922)	Data Time 0.001 (0.020)	Loss 3.3488 (3.1837)	Entropy 0.83362 (0.83926)	Top-1 acc 47.656 (47.864)	Top-5 acc 68.359 (71.493)	lr 0.02214
Train [27][1170/3239]	Time 0.616 (0.922)	Data Time 0.001 (0.020)	Loss 3.2829 (3.1833)	Entropy 0.83385 (0.83921)	Top-1 acc 44.922 (47.869)	Top-5 acc 67.578 (71.508)	lr 0.02214
Train [27][1180/3239]	Time 0.490 (0.921)	Data Time 0.001 (0.020)	Loss 3.0496 (3.1835)	Entropy 0.83397 (0.83916)	Top-1 acc 51.562 (47.860)	Top-5 acc 71.875 (71.501)	lr 0.02214
Train [27][1190/3239]	Time 0.584 (0.920)	Data Time 0.001 (0.020)	Loss 3.0485 (3.1831)	Entropy 0.83388 (0.83912)	Top-1 acc 49.219 (47.866)	Top-5 acc 72.266 (71.507)	lr 0.02214
Train [27][1200/3239]	Time 0.579 (0.920)	Data Time 0.001 (0.020)	Loss 3.0483 (3.1833)	Entropy 0.83370 (0.83908)	Top-1 acc 51.562 (47.855)	Top-5 acc 73.828 (71.504)	lr 0.02214
Train [27][1210/3239]	Time 0.612 (0.919)	Data Time 0.001 (0.019)	Loss 3.1802 (3.1828)	Entropy 0.83359 (0.83903)	Top-1 acc 47.266 (47.859)	Top-5 acc 71.094 (71.508)	lr 0.02214
Train [27][1220/3239]	Time 0.629 (0.919)	Data Time 0.001 (0.019)	Loss 3.1159 (3.1832)	Entropy 0.83333 (0.83899)	Top-1 acc 50.391 (47.855)	Top-5 acc 73.047 (71.499)	lr 0.02214
Train [27][1230/3239]	Time 0.610 (0.918)	Data Time 0.001 (0.019)	Loss 3.1979 (3.1833)	Entropy 0.83364 (0.83894)	Top-1 acc 49.219 (47.850)	Top-5 acc 70.312 (71.488)	lr 0.02214
Train [27][1240/3239]	Time 0.611 (0.918)	Data Time 0.001 (0.019)	Loss 3.2767 (3.1832)	Entropy 0.83330 (0.83890)	Top-1 acc 49.219 (47.861)	Top-5 acc 67.578 (71.490)	lr 0.02214
Train [27][1250/3239]	Time 0.594 (0.917)	Data Time 0.001 (0.019)	Loss 3.1231 (3.1829)	Entropy 0.83320 (0.83885)	Top-1 acc 48.047 (47.870)	Top-5 acc 74.609 (71.505)	lr 0.02213
Train [27][1260/3239]	Time 0.609 (0.917)	Data Time 0.001 (0.019)	Loss 3.2336 (3.1835)	Entropy 0.83318 (0.83881)	Top-1 acc 52.344 (47.863)	Top-5 acc 72.656 (71.495)	lr 0.02213
Train [27][1270/3239]	Time 0.552 (0.916)	Data Time 0.001 (0.019)	Loss 3.2967 (3.1833)	Entropy 0.83270 (0.83876)	Top-1 acc 42.969 (47.866)	Top-5 acc 69.141 (71.496)	lr 0.02213
Train [27][1280/3239]	Time 0.630 (0.916)	Data Time 0.001 (0.018)	Loss 3.1433 (3.1840)	Entropy 0.83305 (0.83872)	Top-1 acc 50.000 (47.851)	Top-5 acc 75.391 (71.488)	lr 0.02213
Train [27][1290/3239]	Time 0.637 (0.915)	Data Time 0.001 (0.018)	Loss 3.0107 (3.1836)	Entropy 0.83228 (0.83867)	Top-1 acc 50.391 (47.860)	Top-5 acc 74.609 (71.493)	lr 0.02213
Train [27][1300/3239]	Time 0.595 (0.915)	Data Time 0.001 (0.018)	Loss 3.1542 (3.1833)	Entropy 0.83209 (0.83862)	Top-1 acc 47.266 (47.869)	Top-5 acc 73.828 (71.507)	lr 0.02213
Train [27][1310/3239]	Time 0.599 (0.915)	Data Time 0.001 (0.018)	Loss 3.1952 (3.1829)	Entropy 0.83200 (0.83857)	Top-1 acc 44.141 (47.880)	Top-5 acc 71.875 (71.513)	lr 0.02213
Train [27][1320/3239]	Time 0.686 (0.914)	Data Time 0.001 (0.018)	Loss 3.1033 (3.1832)	Entropy 0.83206 (0.83852)	Top-1 acc 50.000 (47.875)	Top-5 acc 73.047 (71.505)	lr 0.02213
Train [27][1330/3239]	Time 0.622 (0.914)	Data Time 0.001 (0.018)	Loss 3.0675 (3.1831)	Entropy 0.83186 (0.83847)	Top-1 acc 51.953 (47.880)	Top-5 acc 73.047 (71.503)	lr 0.02213
Train [27][1340/3239]	Time 0.601 (0.913)	Data Time 0.002 (0.018)	Loss 3.1899 (3.1831)	Entropy 0.83193 (0.83842)	Top-1 acc 50.000 (47.887)	Top-5 acc 72.266 (71.504)	lr 0.02213
Train [27][1350/3239]	Time 0.597 (0.913)	Data Time 0.001 (0.018)	Loss 3.1981 (3.1831)	Entropy 0.83177 (0.83837)	Top-1 acc 48.438 (47.881)	Top-5 acc 68.359 (71.502)	lr 0.02213
Train [27][1360/3239]	Time 0.593 (0.912)	Data Time 0.001 (0.017)	Loss 3.3695 (3.1834)	Entropy 0.83159 (0.83832)	Top-1 acc 44.922 (47.878)	Top-5 acc 67.578 (71.496)	lr 0.02213
Train [27][1370/3239]	Time 0.630 (0.912)	Data Time 0.001 (0.017)	Loss 3.0532 (3.1830)	Entropy 0.83162 (0.83828)	Top-1 acc 50.000 (47.884)	Top-5 acc 75.000 (71.500)	lr 0.02213
Train [27][1380/3239]	Time 0.637 (0.911)	Data Time 0.001 (0.017)	Loss 3.3007 (3.1830)	Entropy 0.83165 (0.83823)	Top-1 acc 48.047 (47.878)	Top-5 acc 69.922 (71.500)	lr 0.02213
Train [27][1390/3239]	Time 0.708 (0.911)	Data Time 0.001 (0.017)	Loss 3.1812 (3.1835)	Entropy 0.83155 (0.83818)	Top-1 acc 50.000 (47.875)	Top-5 acc 74.219 (71.498)	lr 0.02213
Train [27][1400/3239]	Time 0.605 (0.910)	Data Time 0.001 (0.017)	Loss 3.1411 (3.1840)	Entropy 0.83105 (0.83813)	Top-1 acc 47.656 (47.862)	Top-5 acc 73.047 (71.482)	lr 0.02212
Train [27][1410/3239]	Time 0.580 (0.910)	Data Time 0.001 (0.017)	Loss 3.3312 (3.1842)	Entropy 0.83100 (0.83808)	Top-1 acc 45.703 (47.853)	Top-5 acc 70.703 (71.474)	lr 0.02212
Train [27][1420/3239]	Time 0.641 (0.910)	Data Time 0.001 (0.017)	Loss 3.1494 (3.1844)	Entropy 0.83140 (0.83803)	Top-1 acc 49.609 (47.853)	Top-5 acc 69.531 (71.472)	lr 0.02212
Train [27][1430/3239]	Time 0.617 (0.909)	Data Time 0.001 (0.017)	Loss 3.0435 (3.1842)	Entropy 0.83110 (0.83798)	Top-1 acc 52.344 (47.856)	Top-5 acc 74.609 (71.469)	lr 0.02212
Train [27][1440/3239]	Time 0.617 (0.909)	Data Time 0.001 (0.017)	Loss 3.0149 (3.1842)	Entropy 0.83062 (0.83794)	Top-1 acc 52.344 (47.851)	Top-5 acc 74.219 (71.471)	lr 0.02212
Train [27][1450/3239]	Time 0.604 (0.909)	Data Time 0.001 (0.016)	Loss 3.2316 (3.1844)	Entropy 0.83040 (0.83789)	Top-1 acc 44.531 (47.846)	Top-5 acc 67.188 (71.464)	lr 0.02212
Train [27][1460/3239]	Time 0.618 (0.908)	Data Time 0.001 (0.016)	Loss 2.8497 (3.1845)	Entropy 0.83014 (0.83783)	Top-1 acc 56.250 (47.853)	Top-5 acc 75.781 (71.460)	lr 0.02212
Train [27][1470/3239]	Time 0.627 (0.908)	Data Time 0.001 (0.016)	Loss 3.3738 (3.1845)	Entropy 0.82977 (0.83778)	Top-1 acc 42.578 (47.850)	Top-5 acc 66.797 (71.454)	lr 0.02212
Train [27][1480/3239]	Time 0.714 (0.908)	Data Time 0.001 (0.016)	Loss 3.2287 (3.1840)	Entropy 0.82984 (0.83773)	Top-1 acc 46.875 (47.861)	Top-5 acc 70.312 (71.465)	lr 0.02212
Train [27][1490/3239]	Time 0.596 (0.908)	Data Time 0.001 (0.016)	Loss 3.1730 (3.1848)	Entropy 0.82961 (0.83767)	Top-1 acc 49.219 (47.845)	Top-5 acc 70.703 (71.446)	lr 0.02212
Train [27][1500/3239]	Time 0.585 (0.907)	Data Time 0.001 (0.016)	Loss 3.0454 (3.1847)	Entropy 0.82934 (0.83762)	Top-1 acc 51.172 (47.845)	Top-5 acc 75.000 (71.451)	lr 0.02212
Train [27][1510/3239]	Time 0.567 (0.907)	Data Time 0.001 (0.016)	Loss 3.0675 (3.1849)	Entropy 0.82951 (0.83757)	Top-1 acc 53.906 (47.841)	Top-5 acc 75.000 (71.452)	lr 0.02212
Train [27][1520/3239]	Time 0.588 (0.907)	Data Time 0.001 (0.016)	Loss 3.0062 (3.1847)	Entropy 0.82962 (0.83751)	Top-1 acc 51.562 (47.847)	Top-5 acc 74.219 (71.458)	lr 0.02212
Train [27][1530/3239]	Time 0.643 (0.906)	Data Time 0.001 (0.016)	Loss 3.1803 (3.1847)	Entropy 0.82945 (0.83746)	Top-1 acc 50.781 (47.853)	Top-5 acc 73.828 (71.456)	lr 0.02212
Train [27][1540/3239]	Time 0.619 (0.921)	Data Time 0.002 (0.016)	Loss 3.3075 (3.1850)	Entropy 0.82940 (0.83741)	Top-1 acc 45.703 (47.850)	Top-5 acc 69.922 (71.448)	lr 0.02212
Train [27][1550/3239]	Time 0.731 (0.921)	Data Time 0.002 (0.016)	Loss 3.1972 (3.1853)	Entropy 0.82948 (0.83736)	Top-1 acc 49.219 (47.849)	Top-5 acc 70.312 (71.435)	lr 0.02212
Train [27][1560/3239]	Time 0.571 (0.920)	Data Time 0.001 (0.015)	Loss 3.1645 (3.1855)	Entropy 0.82937 (0.83731)	Top-1 acc 50.781 (47.842)	Top-5 acc 70.703 (71.435)	lr 0.02211
Train [27][1570/3239]	Time 0.657 (0.920)	Data Time 0.001 (0.015)	Loss 3.1554 (3.1853)	Entropy 0.82922 (0.83726)	Top-1 acc 51.172 (47.843)	Top-5 acc 70.312 (71.435)	lr 0.02211
Train [27][1580/3239]	Time 0.613 (0.919)	Data Time 0.001 (0.015)	Loss 2.9561 (3.1853)	Entropy 0.82895 (0.83720)	Top-1 acc 50.000 (47.839)	Top-5 acc 77.344 (71.435)	lr 0.02211
Train [27][1590/3239]	Time 0.585 (0.919)	Data Time 0.001 (0.015)	Loss 3.2072 (3.1848)	Entropy 0.82885 (0.83715)	Top-1 acc 51.172 (47.852)	Top-5 acc 71.875 (71.443)	lr 0.02211
Train [27][1600/3239]	Time 0.615 (0.919)	Data Time 0.002 (0.015)	Loss 3.1981 (3.1848)	Entropy 0.82924 (0.83710)	Top-1 acc 49.219 (47.853)	Top-5 acc 72.266 (71.440)	lr 0.02211
Train [27][1610/3239]	Time 0.592 (0.918)	Data Time 0.001 (0.015)	Loss 3.1235 (3.1848)	Entropy 0.82910 (0.83705)	Top-1 acc 48.047 (47.852)	Top-5 acc 72.656 (71.441)	lr 0.02211
Train [27][1620/3239]	Time 0.607 (0.918)	Data Time 0.001 (0.015)	Loss 3.2252 (3.1848)	Entropy 0.82921 (0.83700)	Top-1 acc 46.875 (47.845)	Top-5 acc 72.266 (71.449)	lr 0.02211
Train [27][1630/3239]	Time 0.624 (0.918)	Data Time 0.001 (0.015)	Loss 3.1320 (3.1848)	Entropy 0.82878 (0.83695)	Top-1 acc 50.000 (47.839)	Top-5 acc 71.094 (71.442)	lr 0.02211
Train [27][1640/3239]	Time 0.614 (0.918)	Data Time 0.002 (0.015)	Loss 3.1761 (3.1847)	Entropy 0.82873 (0.83690)	Top-1 acc 50.000 (47.843)	Top-5 acc 71.484 (71.442)	lr 0.02211
Train [27][1650/3239]	Time 0.644 (0.917)	Data Time 0.001 (0.015)	Loss 3.1394 (3.1846)	Entropy 0.82830 (0.83685)	Top-1 acc 48.438 (47.835)	Top-5 acc 71.484 (71.447)	lr 0.02211
Train [27][1660/3239]	Time 0.585 (0.917)	Data Time 0.001 (0.015)	Loss 3.1502 (3.1844)	Entropy 0.82800 (0.83680)	Top-1 acc 49.219 (47.838)	Top-5 acc 75.000 (71.449)	lr 0.02211
Train [27][1670/3239]	Time 0.663 (0.916)	Data Time 0.001 (0.015)	Loss 3.2202 (3.1845)	Entropy 0.82813 (0.83675)	Top-1 acc 47.266 (47.841)	Top-5 acc 69.922 (71.453)	lr 0.02211
Train [27][1680/3239]	Time 0.605 (0.916)	Data Time 0.001 (0.014)	Loss 3.0310 (3.1842)	Entropy 0.82789 (0.83670)	Top-1 acc 47.266 (47.843)	Top-5 acc 72.266 (71.454)	lr 0.02211
Train [27][1690/3239]	Time 0.612 (0.915)	Data Time 0.001 (0.014)	Loss 3.0372 (3.1844)	Entropy 0.82795 (0.83664)	Top-1 acc 47.656 (47.839)	Top-5 acc 71.875 (71.449)	lr 0.02211
Train [27][1700/3239]	Time 0.571 (0.915)	Data Time 0.001 (0.014)	Loss 3.3788 (3.1844)	Entropy 0.82771 (0.83659)	Top-1 acc 41.797 (47.840)	Top-5 acc 68.750 (71.452)	lr 0.02211
Train [27][1710/3239]	Time 0.694 (0.915)	Data Time 0.001 (0.014)	Loss 3.4036 (3.1847)	Entropy 0.82794 (0.83654)	Top-1 acc 44.141 (47.835)	Top-5 acc 65.625 (71.443)	lr 0.02210
Train [27][1720/3239]	Time 0.616 (0.915)	Data Time 0.001 (0.014)	Loss 3.1839 (3.1845)	Entropy 0.82791 (0.83649)	Top-1 acc 48.047 (47.839)	Top-5 acc 71.094 (71.442)	lr 0.02210
Train [27][1730/3239]	Time 0.573 (0.914)	Data Time 0.001 (0.014)	Loss 3.2591 (3.1843)	Entropy 0.82800 (0.83644)	Top-1 acc 47.266 (47.841)	Top-5 acc 69.922 (71.447)	lr 0.02210
Train [27][1740/3239]	Time 0.634 (0.914)	Data Time 0.001 (0.014)	Loss 3.0184 (3.1839)	Entropy 0.82790 (0.83639)	Top-1 acc 52.734 (47.848)	Top-5 acc 76.562 (71.456)	lr 0.02210
Train [27][1750/3239]	Time 0.616 (0.914)	Data Time 0.001 (0.014)	Loss 3.2128 (3.1836)	Entropy 0.82810 (0.83635)	Top-1 acc 47.656 (47.856)	Top-5 acc 71.094 (71.459)	lr 0.02210
Train [27][1760/3239]	Time 0.614 (0.913)	Data Time 0.001 (0.014)	Loss 3.0563 (3.1838)	Entropy 0.82815 (0.83630)	Top-1 acc 51.172 (47.851)	Top-5 acc 69.922 (71.453)	lr 0.02210
Train [27][1770/3239]	Time 0.608 (0.913)	Data Time 0.001 (0.014)	Loss 3.3099 (3.1835)	Entropy 0.82819 (0.83625)	Top-1 acc 42.969 (47.851)	Top-5 acc 69.922 (71.457)	lr 0.02210
Train [27][1780/3239]	Time 0.606 (0.913)	Data Time 0.001 (0.014)	Loss 3.1451 (3.1835)	Entropy 0.82815 (0.83621)	Top-1 acc 44.922 (47.855)	Top-5 acc 71.875 (71.457)	lr 0.02210
Train [27][1790/3239]	Time 0.598 (0.913)	Data Time 0.001 (0.014)	Loss 3.1624 (3.1835)	Entropy 0.82836 (0.83616)	Top-1 acc 47.266 (47.853)	Top-5 acc 72.266 (71.453)	lr 0.02210
Train [27][1800/3239]	Time 0.618 (0.913)	Data Time 0.001 (0.014)	Loss 3.0534 (3.1833)	Entropy 0.82817 (0.83612)	Top-1 acc 50.000 (47.859)	Top-5 acc 72.266 (71.456)	lr 0.02210
Train [27][1810/3239]	Time 0.642 (0.912)	Data Time 0.001 (0.014)	Loss 3.2030 (3.1832)	Entropy 0.82779 (0.83608)	Top-1 acc 48.047 (47.864)	Top-5 acc 71.094 (71.455)	lr 0.02210
Train [27][1820/3239]	Time 0.588 (0.912)	Data Time 0.001 (0.014)	Loss 3.0124 (3.1829)	Entropy 0.82791 (0.83603)	Top-1 acc 50.000 (47.870)	Top-5 acc 74.219 (71.464)	lr 0.02210
Train [27][1830/3239]	Time 0.607 (0.912)	Data Time 0.001 (0.013)	Loss 3.0077 (3.1829)	Entropy 0.82791 (0.83599)	Top-1 acc 48.438 (47.873)	Top-5 acc 77.344 (71.460)	lr 0.02210
Train [27][1840/3239]	Time 0.624 (0.911)	Data Time 0.001 (0.013)	Loss 3.2547 (3.1828)	Entropy 0.82771 (0.83594)	Top-1 acc 47.656 (47.879)	Top-5 acc 68.359 (71.465)	lr 0.02210
Train [27][1850/3239]	Time 0.586 (0.911)	Data Time 0.001 (0.013)	Loss 3.4026 (3.1823)	Entropy 0.82735 (0.83590)	Top-1 acc 44.922 (47.891)	Top-5 acc 67.578 (71.471)	lr 0.02210
Train [27][1860/3239]	Time 0.634 (0.911)	Data Time 0.001 (0.013)	Loss 3.4078 (3.1823)	Entropy 0.82698 (0.83585)	Top-1 acc 41.406 (47.891)	Top-5 acc 67.188 (71.467)	lr 0.02210
Train [27][1870/3239]	Time 0.734 (0.911)	Data Time 0.001 (0.013)	Loss 3.1360 (3.1824)	Entropy 0.82661 (0.83580)	Top-1 acc 47.656 (47.892)	Top-5 acc 72.266 (71.469)	lr 0.02209
Train [27][1880/3239]	Time 0.612 (0.910)	Data Time 0.001 (0.013)	Loss 3.0427 (3.1825)	Entropy 0.82682 (0.83575)	Top-1 acc 52.344 (47.892)	Top-5 acc 74.609 (71.464)	lr 0.02209
Train [27][1890/3239]	Time 0.561 (0.910)	Data Time 0.001 (0.013)	Loss 3.4925 (3.1826)	Entropy 0.82647 (0.83570)	Top-1 acc 43.750 (47.893)	Top-5 acc 65.234 (71.463)	lr 0.02209
Train [27][1900/3239]	Time 0.604 (0.910)	Data Time 0.001 (0.013)	Loss 3.3273 (3.1826)	Entropy 0.82631 (0.83566)	Top-1 acc 41.797 (47.890)	Top-5 acc 65.625 (71.462)	lr 0.02209
Train [27][1910/3239]	Time 0.596 (0.910)	Data Time 0.001 (0.013)	Loss 3.0876 (3.1823)	Entropy 0.82579 (0.83561)	Top-1 acc 49.219 (47.897)	Top-5 acc 75.000 (71.470)	lr 0.02209
Train [27][1920/3239]	Time 0.631 (0.909)	Data Time 0.002 (0.013)	Loss 3.0853 (3.1826)	Entropy 0.82547 (0.83556)	Top-1 acc 50.000 (47.894)	Top-5 acc 71.875 (71.464)	lr 0.02209
Train [27][1930/3239]	Time 0.558 (0.909)	Data Time 0.001 (0.013)	Loss 3.2715 (3.1825)	Entropy 0.82535 (0.83550)	Top-1 acc 46.875 (47.894)	Top-5 acc 68.359 (71.464)	lr 0.02209
Train [27][1940/3239]	Time 0.681 (0.909)	Data Time 0.001 (0.013)	Loss 3.0047 (3.1825)	Entropy 0.82520 (0.83545)	Top-1 acc 52.344 (47.897)	Top-5 acc 71.484 (71.464)	lr 0.02209
Train [27][1950/3239]	Time 0.597 (0.909)	Data Time 0.001 (0.013)	Loss 3.1634 (3.1827)	Entropy 0.82491 (0.83540)	Top-1 acc 48.828 (47.887)	Top-5 acc 73.047 (71.460)	lr 0.02209
Train [27][1960/3239]	Time 0.600 (0.908)	Data Time 0.001 (0.013)	Loss 3.1267 (3.1825)	Entropy 0.82479 (0.83534)	Top-1 acc 48.828 (47.894)	Top-5 acc 72.266 (71.463)	lr 0.02209
Train [27][1970/3239]	Time 0.613 (0.908)	Data Time 0.001 (0.013)	Loss 3.0894 (3.1823)	Entropy 0.82457 (0.83529)	Top-1 acc 50.391 (47.903)	Top-5 acc 75.000 (71.466)	lr 0.02209
Train [27][1980/3239]	Time 0.607 (0.908)	Data Time 0.001 (0.013)	Loss 3.1943 (3.1822)	Entropy 0.82511 (0.83524)	Top-1 acc 52.344 (47.906)	Top-5 acc 71.094 (71.473)	lr 0.02209
Train [27][1990/3239]	Time 0.602 (0.908)	Data Time 0.001 (0.013)	Loss 3.0049 (3.1819)	Entropy 0.82541 (0.83519)	Top-1 acc 53.125 (47.912)	Top-5 acc 73.828 (71.475)	lr 0.02209
Train [27][2000/3239]	Time 0.610 (0.907)	Data Time 0.001 (0.012)	Loss 3.2060 (3.1822)	Entropy 0.82564 (0.83514)	Top-1 acc 46.484 (47.914)	Top-5 acc 66.406 (71.465)	lr 0.02209
Train [27][2010/3239]	Time 0.459 (0.907)	Data Time 0.001 (0.012)	Loss 3.4431 (3.1823)	Entropy 0.82589 (0.83509)	Top-1 acc 42.188 (47.915)	Top-5 acc 66.406 (71.465)	lr 0.02209
Train [27][2020/3239]	Time 0.602 (0.907)	Data Time 0.001 (0.012)	Loss 3.2718 (3.1826)	Entropy 0.82565 (0.83505)	Top-1 acc 48.047 (47.911)	Top-5 acc 71.094 (71.461)	lr 0.02208
Train [27][2030/3239]	Time 0.694 (0.907)	Data Time 0.001 (0.012)	Loss 3.1316 (3.1824)	Entropy 0.82590 (0.83500)	Top-1 acc 52.734 (47.913)	Top-5 acc 70.703 (71.464)	lr 0.02208
Train [27][2040/3239]	Time 0.648 (0.906)	Data Time 0.001 (0.012)	Loss 3.1270 (3.1826)	Entropy 0.82583 (0.83495)	Top-1 acc 51.953 (47.911)	Top-5 acc 71.484 (71.462)	lr 0.02208
Train [27][2050/3239]	Time 0.572 (0.906)	Data Time 0.001 (0.012)	Loss 3.2572 (3.1825)	Entropy 0.82592 (0.83491)	Top-1 acc 46.094 (47.910)	Top-5 acc 67.578 (71.464)	lr 0.02208
Train [27][2060/3239]	Time 0.629 (0.906)	Data Time 0.001 (0.012)	Loss 3.2613 (3.1825)	Entropy 0.82600 (0.83487)	Top-1 acc 46.094 (47.912)	Top-5 acc 73.047 (71.465)	lr 0.02208
Train [27][2070/3239]	Time 0.596 (0.906)	Data Time 0.001 (0.012)	Loss 3.1414 (3.1824)	Entropy 0.82598 (0.83482)	Top-1 acc 48.438 (47.915)	Top-5 acc 71.875 (71.469)	lr 0.02208
Train [27][2080/3239]	Time 0.601 (0.905)	Data Time 0.001 (0.012)	Loss 3.0041 (3.1821)	Entropy 0.82601 (0.83478)	Top-1 acc 52.344 (47.922)	Top-5 acc 74.609 (71.477)	lr 0.02208
Train [27][2090/3239]	Time 0.614 (0.905)	Data Time 0.001 (0.012)	Loss 3.3142 (3.1818)	Entropy 0.82590 (0.83474)	Top-1 acc 48.047 (47.931)	Top-5 acc 71.875 (71.483)	lr 0.02208
Train [27][2100/3239]	Time 0.709 (0.905)	Data Time 0.001 (0.012)	Loss 3.1742 (3.1817)	Entropy 0.82562 (0.83470)	Top-1 acc 45.703 (47.933)	Top-5 acc 70.703 (71.484)	lr 0.02208
Train [27][2110/3239]	Time 0.619 (0.905)	Data Time 0.002 (0.012)	Loss 3.1434 (3.1818)	Entropy 0.82563 (0.83465)	Top-1 acc 51.562 (47.936)	Top-5 acc 74.609 (71.486)	lr 0.02208
Train [27][2120/3239]	Time 0.644 (0.905)	Data Time 0.001 (0.012)	Loss 3.0937 (3.1818)	Entropy 0.82561 (0.83461)	Top-1 acc 50.781 (47.939)	Top-5 acc 75.391 (71.487)	lr 0.02208
Train [27][2130/3239]	Time 0.642 (0.905)	Data Time 0.023 (0.012)	Loss 2.9133 (3.1816)	Entropy 0.82552 (0.83457)	Top-1 acc 53.516 (47.940)	Top-5 acc 76.953 (71.492)	lr 0.02208
Train [27][2140/3239]	Time 0.629 (0.904)	Data Time 0.002 (0.012)	Loss 3.0107 (3.1817)	Entropy 0.82549 (0.83453)	Top-1 acc 50.000 (47.943)	Top-5 acc 76.562 (71.492)	lr 0.02208
Train [27][2150/3239]	Time 0.598 (0.904)	Data Time 0.001 (0.012)	Loss 3.1484 (3.1816)	Entropy 0.82550 (0.83448)	Top-1 acc 45.703 (47.941)	Top-5 acc 71.875 (71.498)	lr 0.02208
Train [27][2160/3239]	Time 0.610 (0.904)	Data Time 0.001 (0.012)	Loss 3.0173 (3.1814)	Entropy 0.82559 (0.83444)	Top-1 acc 52.344 (47.941)	Top-5 acc 73.047 (71.500)	lr 0.02208
Train [27][2170/3239]	Time 0.612 (0.904)	Data Time 0.001 (0.012)	Loss 3.0369 (3.1812)	Entropy 0.82546 (0.83440)	Top-1 acc 50.391 (47.944)	Top-5 acc 75.000 (71.502)	lr 0.02207
Train [27][2180/3239]	Time 0.550 (0.903)	Data Time 0.001 (0.012)	Loss 3.1533 (3.1811)	Entropy 0.82506 (0.83436)	Top-1 acc 49.609 (47.952)	Top-5 acc 71.875 (71.504)	lr 0.02207
Train [27][2190/3239]	Time 0.949 (0.913)	Data Time 0.005 (0.012)	Loss 2.9452 (3.1808)	Entropy 0.82515 (0.83432)	Top-1 acc 51.562 (47.958)	Top-5 acc 76.562 (71.511)	lr 0.02207
Train [27][2200/3239]	Time 0.609 (0.914)	Data Time 0.002 (0.012)	Loss 3.1604 (3.1808)	Entropy 0.82413 (0.83428)	Top-1 acc 48.828 (47.957)	Top-5 acc 72.266 (71.513)	lr 0.02207
Train [27][2210/3239]	Time 0.638 (0.913)	Data Time 0.002 (0.011)	Loss 3.0881 (3.1807)	Entropy 0.82383 (0.83423)	Top-1 acc 48.438 (47.960)	Top-5 acc 71.484 (71.515)	lr 0.02207
Train [27][2220/3239]	Time 0.592 (0.913)	Data Time 0.001 (0.011)	Loss 3.0230 (3.1806)	Entropy 0.82354 (0.83418)	Top-1 acc 51.953 (47.967)	Top-5 acc 75.391 (71.514)	lr 0.02207
Train [27][2230/3239]	Time 0.613 (0.913)	Data Time 0.001 (0.011)	Loss 3.0306 (3.1804)	Entropy 0.82350 (0.83413)	Top-1 acc 51.172 (47.968)	Top-5 acc 71.875 (71.516)	lr 0.02207
Train [27][2240/3239]	Time 0.590 (0.913)	Data Time 0.001 (0.011)	Loss 3.2872 (3.1808)	Entropy 0.82314 (0.83409)	Top-1 acc 41.406 (47.963)	Top-5 acc 71.484 (71.512)	lr 0.02207
Train [27][2250/3239]	Time 0.620 (0.912)	Data Time 0.001 (0.011)	Loss 3.3485 (3.1809)	Entropy 0.82335 (0.83404)	Top-1 acc 42.188 (47.962)	Top-5 acc 66.797 (71.513)	lr 0.02207
Train [27][2260/3239]	Time 0.686 (0.912)	Data Time 0.001 (0.011)	Loss 3.2869 (3.1808)	Entropy 0.82301 (0.83399)	Top-1 acc 45.703 (47.962)	Top-5 acc 67.969 (71.514)	lr 0.02207
Train [27][2270/3239]	Time 0.606 (0.912)	Data Time 0.001 (0.011)	Loss 3.1623 (3.1808)	Entropy 0.82311 (0.83394)	Top-1 acc 49.609 (47.963)	Top-5 acc 71.875 (71.516)	lr 0.02207
Train [27][2280/3239]	Time 0.626 (0.912)	Data Time 0.001 (0.011)	Loss 3.1719 (3.1807)	Entropy 0.82303 (0.83389)	Top-1 acc 48.828 (47.961)	Top-5 acc 71.875 (71.515)	lr 0.02207
Train [27][2290/3239]	Time 0.590 (0.912)	Data Time 0.001 (0.011)	Loss 3.3917 (3.1807)	Entropy 0.82298 (0.83385)	Top-1 acc 47.266 (47.967)	Top-5 acc 67.578 (71.515)	lr 0.02207
Train [27][2300/3239]	Time 0.583 (0.911)	Data Time 0.001 (0.011)	Loss 3.0821 (3.1806)	Entropy 0.82274 (0.83380)	Top-1 acc 51.562 (47.975)	Top-5 acc 74.609 (71.515)	lr 0.02207
Train [27][2310/3239]	Time 0.648 (0.911)	Data Time 0.001 (0.011)	Loss 3.1423 (3.1808)	Entropy 0.82271 (0.83375)	Top-1 acc 48.828 (47.968)	Top-5 acc 71.875 (71.509)	lr 0.02207
Train [27][2320/3239]	Time 0.594 (0.911)	Data Time 0.001 (0.011)	Loss 3.0969 (3.1810)	Entropy 0.82228 (0.83370)	Top-1 acc 50.000 (47.960)	Top-5 acc 72.656 (71.508)	lr 0.02207
Train [27][2330/3239]	Time 0.612 (0.911)	Data Time 0.001 (0.011)	Loss 3.0438 (3.1808)	Entropy 0.82212 (0.83365)	Top-1 acc 50.781 (47.962)	Top-5 acc 72.266 (71.507)	lr 0.02206
Train [27][2340/3239]	Time 0.631 (0.910)	Data Time 0.001 (0.011)	Loss 3.1287 (3.1806)	Entropy 0.82183 (0.83360)	Top-1 acc 48.828 (47.966)	Top-5 acc 71.094 (71.505)	lr 0.02206
Train [27][2350/3239]	Time 0.674 (0.910)	Data Time 0.001 (0.011)	Loss 3.4934 (3.1808)	Entropy 0.82190 (0.83355)	Top-1 acc 41.406 (47.962)	Top-5 acc 66.797 (71.504)	lr 0.02206
Train [27][2360/3239]	Time 0.617 (0.910)	Data Time 0.001 (0.011)	Loss 3.2555 (3.1807)	Entropy 0.82180 (0.83350)	Top-1 acc 48.438 (47.968)	Top-5 acc 70.312 (71.507)	lr 0.02206
Train [27][2370/3239]	Time 0.613 (0.910)	Data Time 0.001 (0.011)	Loss 2.9543 (3.1806)	Entropy 0.82169 (0.83345)	Top-1 acc 55.469 (47.971)	Top-5 acc 76.953 (71.511)	lr 0.02206
Train [27][2380/3239]	Time 0.611 (0.910)	Data Time 0.001 (0.011)	Loss 3.1614 (3.1802)	Entropy 0.82126 (0.83340)	Top-1 acc 53.125 (47.977)	Top-5 acc 71.094 (71.517)	lr 0.02206
Train [27][2390/3239]	Time 0.629 (0.910)	Data Time 0.001 (0.011)	Loss 2.9152 (3.1799)	Entropy 0.82103 (0.83335)	Top-1 acc 51.953 (47.980)	Top-5 acc 78.516 (71.527)	lr 0.02206
Train [27][2400/3239]	Time 0.614 (0.909)	Data Time 0.001 (0.011)	Loss 3.2122 (3.1797)	Entropy 0.82080 (0.83330)	Top-1 acc 48.047 (47.985)	Top-5 acc 69.922 (71.530)	lr 0.02206
Train [27][2410/3239]	Time 0.638 (0.909)	Data Time 0.001 (0.011)	Loss 3.0233 (3.1799)	Entropy 0.82069 (0.83325)	Top-1 acc 53.125 (47.983)	Top-5 acc 75.781 (71.527)	lr 0.02206
Train [27][2420/3239]	Time 0.714 (0.909)	Data Time 0.001 (0.011)	Loss 3.3355 (3.1799)	Entropy 0.82082 (0.83320)	Top-1 acc 47.266 (47.978)	Top-5 acc 66.797 (71.523)	lr 0.02206
Train [27][2430/3239]	Time 0.610 (0.909)	Data Time 0.001 (0.011)	Loss 2.9941 (3.1798)	Entropy 0.82038 (0.83315)	Top-1 acc 51.953 (47.983)	Top-5 acc 75.781 (71.525)	lr 0.02206
Train [27][2440/3239]	Time 0.622 (0.909)	Data Time 0.001 (0.011)	Loss 3.2489 (3.1797)	Entropy 0.82022 (0.83309)	Top-1 acc 50.391 (47.983)	Top-5 acc 69.922 (71.527)	lr 0.02206
Train [27][2450/3239]	Time 0.612 (0.909)	Data Time 0.001 (0.011)	Loss 3.1380 (3.1797)	Entropy 0.81987 (0.83304)	Top-1 acc 51.953 (47.988)	Top-5 acc 71.484 (71.526)	lr 0.02206
Train [27][2460/3239]	Time 0.602 (0.908)	Data Time 0.001 (0.011)	Loss 3.2479 (3.1796)	Entropy 0.82014 (0.83299)	Top-1 acc 45.703 (47.990)	Top-5 acc 71.875 (71.530)	lr 0.02206
Train [27][2470/3239]	Time 0.627 (0.908)	Data Time 0.001 (0.010)	Loss 2.9953 (3.1792)	Entropy 0.82024 (0.83293)	Top-1 acc 52.734 (47.995)	Top-5 acc 75.391 (71.539)	lr 0.02206
Train [27][2480/3239]	Time 0.502 (0.908)	Data Time 0.001 (0.010)	Loss 3.0300 (3.1789)	Entropy 0.82013 (0.83288)	Top-1 acc 48.438 (47.997)	Top-5 acc 72.266 (71.541)	lr 0.02205
Train [27][2490/3239]	Time 0.616 (0.908)	Data Time 0.001 (0.010)	Loss 3.2081 (3.1786)	Entropy 0.82012 (0.83283)	Top-1 acc 50.000 (48.005)	Top-5 acc 70.703 (71.545)	lr 0.02205
Train [27][2500/3239]	Time 0.602 (0.908)	Data Time 0.001 (0.010)	Loss 3.1536 (3.1788)	Entropy 0.81984 (0.83278)	Top-1 acc 46.094 (48.003)	Top-5 acc 71.484 (71.542)	lr 0.02205
Train [27][2510/3239]	Time 0.619 (0.907)	Data Time 0.001 (0.010)	Loss 3.0606 (3.1787)	Entropy 0.81985 (0.83273)	Top-1 acc 52.344 (48.009)	Top-5 acc 74.219 (71.544)	lr 0.02205
Train [27][2520/3239]	Time 0.596 (0.907)	Data Time 0.001 (0.010)	Loss 3.1335 (3.1787)	Entropy 0.81988 (0.83268)	Top-1 acc 50.781 (48.010)	Top-5 acc 71.094 (71.544)	lr 0.02205
Train [27][2530/3239]	Time 0.640 (0.907)	Data Time 0.001 (0.010)	Loss 3.2119 (3.1787)	Entropy 0.82022 (0.83263)	Top-1 acc 50.391 (48.012)	Top-5 acc 71.094 (71.543)	lr 0.02205
Train [27][2540/3239]	Time 0.620 (0.907)	Data Time 0.001 (0.010)	Loss 2.9177 (3.1785)	Entropy 0.82059 (0.83258)	Top-1 acc 50.781 (48.016)	Top-5 acc 76.172 (71.544)	lr 0.02205
Train [27][2550/3239]	Time 0.612 (0.907)	Data Time 0.001 (0.010)	Loss 3.3034 (3.1783)	Entropy 0.82018 (0.83253)	Top-1 acc 43.359 (48.024)	Top-5 acc 68.359 (71.549)	lr 0.02205
Train [27][2560/3239]	Time 0.611 (0.906)	Data Time 0.001 (0.010)	Loss 3.1719 (3.1784)	Entropy 0.82012 (0.83248)	Top-1 acc 47.266 (48.020)	Top-5 acc 72.656 (71.548)	lr 0.02205
Train [27][2570/3239]	Time 0.628 (0.906)	Data Time 0.001 (0.010)	Loss 2.9458 (3.1784)	Entropy 0.82014 (0.83243)	Top-1 acc 51.953 (48.021)	Top-5 acc 76.562 (71.553)	lr 0.02205
Train [27][2580/3239]	Time 0.669 (0.906)	Data Time 0.001 (0.010)	Loss 3.0771 (3.1782)	Entropy 0.81999 (0.83239)	Top-1 acc 50.391 (48.020)	Top-5 acc 72.656 (71.556)	lr 0.02205
Train [27][2590/3239]	Time 0.571 (0.906)	Data Time 0.001 (0.010)	Loss 3.1731 (3.1781)	Entropy 0.81995 (0.83234)	Top-1 acc 48.438 (48.020)	Top-5 acc 72.266 (71.561)	lr 0.02205
Train [27][2600/3239]	Time 0.586 (0.906)	Data Time 0.001 (0.010)	Loss 3.3909 (3.1782)	Entropy 0.81963 (0.83229)	Top-1 acc 42.188 (48.019)	Top-5 acc 67.188 (71.560)	lr 0.02205
Train [27][2610/3239]	Time 0.603 (0.906)	Data Time 0.002 (0.010)	Loss 3.1061 (3.1784)	Entropy 0.81943 (0.83224)	Top-1 acc 50.391 (48.015)	Top-5 acc 74.219 (71.557)	lr 0.02205
Train [27][2620/3239]	Time 0.628 (0.905)	Data Time 0.001 (0.010)	Loss 2.8472 (3.1779)	Entropy 0.81884 (0.83219)	Top-1 acc 57.031 (48.026)	Top-5 acc 77.734 (71.568)	lr 0.02205
Train [27][2630/3239]	Time 0.640 (0.905)	Data Time 0.001 (0.010)	Loss 3.0279 (3.1778)	Entropy 0.81914 (0.83214)	Top-1 acc 49.219 (48.023)	Top-5 acc 76.562 (71.572)	lr 0.02204
Train [27][2640/3239]	Time 0.611 (0.905)	Data Time 0.001 (0.010)	Loss 3.1348 (3.1775)	Entropy 0.81907 (0.83209)	Top-1 acc 48.047 (48.024)	Top-5 acc 72.266 (71.582)	lr 0.02204
Train [27][2650/3239]	Time 0.670 (0.905)	Data Time 0.001 (0.010)	Loss 3.2614 (3.1776)	Entropy 0.81934 (0.83204)	Top-1 acc 43.359 (48.022)	Top-5 acc 68.750 (71.580)	lr 0.02204
Train [27][2660/3239]	Time 0.607 (0.905)	Data Time 0.001 (0.010)	Loss 3.1698 (3.1776)	Entropy 0.81966 (0.83200)	Top-1 acc 49.219 (48.022)	Top-5 acc 71.094 (71.584)	lr 0.02204
Train [27][2670/3239]	Time 0.633 (0.904)	Data Time 0.001 (0.010)	Loss 3.2802 (3.1774)	Entropy 0.81959 (0.83195)	Top-1 acc 48.047 (48.026)	Top-5 acc 67.969 (71.586)	lr 0.02204
Train [27][2680/3239]	Time 0.631 (0.904)	Data Time 0.001 (0.010)	Loss 3.2263 (3.1773)	Entropy 0.81943 (0.83190)	Top-1 acc 46.484 (48.031)	Top-5 acc 71.484 (71.587)	lr 0.02204
Train [27][2690/3239]	Time 0.585 (0.904)	Data Time 0.001 (0.010)	Loss 3.1951 (3.1773)	Entropy 0.81920 (0.83186)	Top-1 acc 46.484 (48.033)	Top-5 acc 72.266 (71.590)	lr 0.02204
Train [27][2700/3239]	Time 0.594 (0.904)	Data Time 0.001 (0.010)	Loss 3.2471 (3.1772)	Entropy 0.81938 (0.83181)	Top-1 acc 42.188 (48.030)	Top-5 acc 67.969 (71.591)	lr 0.02204
Train [27][2710/3239]	Time 0.604 (0.904)	Data Time 0.001 (0.010)	Loss 2.9463 (3.1773)	Entropy 0.81946 (0.83176)	Top-1 acc 53.516 (48.033)	Top-5 acc 78.516 (71.592)	lr 0.02204
Train [27][2720/3239]	Time 0.644 (0.904)	Data Time 0.001 (0.010)	Loss 3.2111 (3.1770)	Entropy 0.81945 (0.83172)	Top-1 acc 47.656 (48.036)	Top-5 acc 68.750 (71.594)	lr 0.02204
Train [27][2730/3239]	Time 0.660 (0.904)	Data Time 0.001 (0.010)	Loss 3.5765 (3.1769)	Entropy 0.81937 (0.83167)	Top-1 acc 41.406 (48.038)	Top-5 acc 61.328 (71.597)	lr 0.02204
Train [27][2740/3239]	Time 0.727 (0.903)	Data Time 0.001 (0.010)	Loss 3.1834 (3.1769)	Entropy 0.81957 (0.83163)	Top-1 acc 46.875 (48.039)	Top-5 acc 72.266 (71.600)	lr 0.02204
Train [27][2750/3239]	Time 0.619 (0.903)	Data Time 0.001 (0.010)	Loss 3.2562 (3.1768)	Entropy 0.81933 (0.83159)	Top-1 acc 43.750 (48.040)	Top-5 acc 70.703 (71.598)	lr 0.02204
Train [27][2760/3239]	Time 0.582 (0.903)	Data Time 0.002 (0.010)	Loss 3.0491 (3.1769)	Entropy 0.81881 (0.83154)	Top-1 acc 51.562 (48.037)	Top-5 acc 74.219 (71.597)	lr 0.02204
Train [27][2770/3239]	Time 0.631 (0.903)	Data Time 0.001 (0.010)	Loss 3.0451 (3.1770)	Entropy 0.81826 (0.83149)	Top-1 acc 52.344 (48.040)	Top-5 acc 75.000 (71.596)	lr 0.02204
Train [27][2780/3239]	Time 0.579 (0.903)	Data Time 0.001 (0.010)	Loss 3.2409 (3.1768)	Entropy 0.81836 (0.83145)	Top-1 acc 46.875 (48.042)	Top-5 acc 72.656 (71.601)	lr 0.02204
Train [27][2790/3239]	Time 0.593 (0.903)	Data Time 0.001 (0.009)	Loss 3.0942 (3.1768)	Entropy 0.81794 (0.83140)	Top-1 acc 48.828 (48.038)	Top-5 acc 72.656 (71.601)	lr 0.02203
Train [27][2800/3239]	Time 0.600 (0.902)	Data Time 0.001 (0.009)	Loss 3.3182 (3.1770)	Entropy 0.81796 (0.83135)	Top-1 acc 45.312 (48.032)	Top-5 acc 69.531 (71.601)	lr 0.02203
Train [27][2810/3239]	Time 0.540 (0.902)	Data Time 0.001 (0.009)	Loss 3.2663 (3.1772)	Entropy 0.81790 (0.83130)	Top-1 acc 45.703 (48.026)	Top-5 acc 70.312 (71.599)	lr 0.02203
Train [27][2820/3239]	Time 0.596 (0.902)	Data Time 0.020 (0.009)	Loss 3.2664 (3.1773)	Entropy 0.81793 (0.83126)	Top-1 acc 46.094 (48.023)	Top-5 acc 71.094 (71.599)	lr 0.02203
Train [27][2830/3239]	Time 0.588 (0.902)	Data Time 0.001 (0.009)	Loss 3.0885 (3.1772)	Entropy 0.81787 (0.83121)	Top-1 acc 50.781 (48.027)	Top-5 acc 72.656 (71.601)	lr 0.02203
Train [27][2840/3239]	Time 0.607 (0.902)	Data Time 0.002 (0.009)	Loss 3.2339 (3.1773)	Entropy 0.81791 (0.83116)	Top-1 acc 45.703 (48.023)	Top-5 acc 73.047 (71.599)	lr 0.02203
Train [27][2850/3239]	Time 0.646 (0.910)	Data Time 0.002 (0.009)	Loss 3.0453 (3.1769)	Entropy 0.81793 (0.83112)	Top-1 acc 50.781 (48.035)	Top-5 acc 73.828 (71.609)	lr 0.02203
Train [27][2860/3239]	Time 0.612 (0.910)	Data Time 0.002 (0.009)	Loss 3.1305 (3.1770)	Entropy 0.81728 (0.83107)	Top-1 acc 47.656 (48.030)	Top-5 acc 71.875 (71.607)	lr 0.02203
Train [27][2870/3239]	Time 0.601 (0.910)	Data Time 0.001 (0.009)	Loss 3.2303 (3.1772)	Entropy 0.81687 (0.83102)	Top-1 acc 51.172 (48.030)	Top-5 acc 70.703 (71.601)	lr 0.02203
Train [27][2880/3239]	Time 0.610 (0.909)	Data Time 0.001 (0.009)	Loss 3.2088 (3.1770)	Entropy 0.81690 (0.83097)	Top-1 acc 49.609 (48.037)	Top-5 acc 72.266 (71.605)	lr 0.02203
Train [27][2890/3239]	Time 0.644 (0.909)	Data Time 0.001 (0.009)	Loss 3.2519 (3.1772)	Entropy 0.81675 (0.83092)	Top-1 acc 46.094 (48.037)	Top-5 acc 67.969 (71.601)	lr 0.02203
Train [27][2900/3239]	Time 0.679 (0.909)	Data Time 0.001 (0.009)	Loss 3.1664 (3.1774)	Entropy 0.81674 (0.83087)	Top-1 acc 48.438 (48.030)	Top-5 acc 72.266 (71.590)	lr 0.02203
Train [27][2910/3239]	Time 0.624 (0.909)	Data Time 0.001 (0.009)	Loss 3.2155 (3.1775)	Entropy 0.81618 (0.83082)	Top-1 acc 44.531 (48.028)	Top-5 acc 71.875 (71.589)	lr 0.02203
Train [27][2920/3239]	Time 0.650 (0.909)	Data Time 0.001 (0.009)	Loss 3.1603 (3.1776)	Entropy 0.81616 (0.83077)	Top-1 acc 42.969 (48.026)	Top-5 acc 74.609 (71.590)	lr 0.02203
Train [27][2930/3239]	Time 0.594 (0.909)	Data Time 0.001 (0.009)	Loss 3.2940 (3.1777)	Entropy 0.81599 (0.83072)	Top-1 acc 45.703 (48.021)	Top-5 acc 70.312 (71.588)	lr 0.02203
Train [27][2940/3239]	Time 0.578 (0.908)	Data Time 0.001 (0.009)	Loss 3.1240 (3.1776)	Entropy 0.81618 (0.83067)	Top-1 acc 49.219 (48.024)	Top-5 acc 72.656 (71.591)	lr 0.02202
Train [27][2950/3239]	Time 0.642 (0.908)	Data Time 0.001 (0.009)	Loss 3.2178 (3.1776)	Entropy 0.81631 (0.83062)	Top-1 acc 46.875 (48.024)	Top-5 acc 72.656 (71.591)	lr 0.02202
Train [27][2960/3239]	Time 0.612 (0.908)	Data Time 0.001 (0.009)	Loss 3.2732 (3.1779)	Entropy 0.81631 (0.83058)	Top-1 acc 45.312 (48.022)	Top-5 acc 67.188 (71.585)	lr 0.02202
Train [27][2970/3239]	Time 0.738 (0.908)	Data Time 0.001 (0.009)	Loss 2.9946 (3.1775)	Entropy 0.81601 (0.83053)	Top-1 acc 51.953 (48.034)	Top-5 acc 75.391 (71.594)	lr 0.02202
Train [27][2980/3239]	Time 0.592 (0.908)	Data Time 0.001 (0.009)	Loss 2.9030 (3.1773)	Entropy 0.81574 (0.83048)	Top-1 acc 54.688 (48.040)	Top-5 acc 75.391 (71.600)	lr 0.02202
Train [27][2990/3239]	Time 0.618 (0.908)	Data Time 0.001 (0.009)	Loss 3.2039 (3.1774)	Entropy 0.81555 (0.83043)	Top-1 acc 51.562 (48.038)	Top-5 acc 71.094 (71.599)	lr 0.02202
Train [27][3000/3239]	Time 0.615 (0.908)	Data Time 0.001 (0.009)	Loss 3.0824 (3.1774)	Entropy 0.81538 (0.83038)	Top-1 acc 48.828 (48.035)	Top-5 acc 73.828 (71.600)	lr 0.02202
Train [27][3010/3239]	Time 0.628 (0.907)	Data Time 0.001 (0.009)	Loss 3.0345 (3.1777)	Entropy 0.81547 (0.83033)	Top-1 acc 49.219 (48.029)	Top-5 acc 71.484 (71.594)	lr 0.02202
Train [27][3020/3239]	Time 0.580 (0.907)	Data Time 0.001 (0.009)	Loss 3.0113 (3.1778)	Entropy 0.81547 (0.83028)	Top-1 acc 52.344 (48.029)	Top-5 acc 75.391 (71.593)	lr 0.02202
Train [27][3030/3239]	Time 0.602 (0.907)	Data Time 0.001 (0.009)	Loss 3.2178 (3.1781)	Entropy 0.81537 (0.83023)	Top-1 acc 45.703 (48.021)	Top-5 acc 71.875 (71.588)	lr 0.02202
Train [27][3040/3239]	Time 0.593 (0.907)	Data Time 0.001 (0.009)	Loss 3.3737 (3.1781)	Entropy 0.81501 (0.83018)	Top-1 acc 43.359 (48.018)	Top-5 acc 68.750 (71.587)	lr 0.02202
Train [27][3050/3239]	Time 0.597 (0.907)	Data Time 0.001 (0.009)	Loss 3.3152 (3.1782)	Entropy 0.81484 (0.83013)	Top-1 acc 42.969 (48.013)	Top-5 acc 67.578 (71.585)	lr 0.02202
Train [27][3060/3239]	Time 0.584 (0.907)	Data Time 0.001 (0.009)	Loss 3.0939 (3.1780)	Entropy 0.81521 (0.83008)	Top-1 acc 44.141 (48.013)	Top-5 acc 76.953 (71.592)	lr 0.02202
Train [27][3070/3239]	Time 0.609 (0.907)	Data Time 0.001 (0.009)	Loss 3.3314 (3.1780)	Entropy 0.81560 (0.83004)	Top-1 acc 43.750 (48.015)	Top-5 acc 69.141 (71.593)	lr 0.02202
Train [27][3080/3239]	Time 0.630 (0.907)	Data Time 0.001 (0.009)	Loss 3.0702 (3.1779)	Entropy 0.81521 (0.82999)	Top-1 acc 47.656 (48.018)	Top-5 acc 72.266 (71.596)	lr 0.02202
Train [27][3090/3239]	Time 0.585 (0.907)	Data Time 0.001 (0.009)	Loss 3.1187 (3.1777)	Entropy 0.81535 (0.82994)	Top-1 acc 45.312 (48.023)	Top-5 acc 73.047 (71.599)	lr 0.02201
Train [27][3100/3239]	Time 0.655 (0.906)	Data Time 0.001 (0.009)	Loss 3.0748 (3.1775)	Entropy 0.81556 (0.82989)	Top-1 acc 49.219 (48.026)	Top-5 acc 72.266 (71.602)	lr 0.02201
Train [27][3110/3239]	Time 0.610 (0.906)	Data Time 0.001 (0.009)	Loss 3.1841 (3.1774)	Entropy 0.81554 (0.82985)	Top-1 acc 48.438 (48.027)	Top-5 acc 73.438 (71.604)	lr 0.02201
Train [27][3120/3239]	Time 0.673 (0.906)	Data Time 0.001 (0.009)	Loss 2.9554 (3.1772)	Entropy 0.81523 (0.82980)	Top-1 acc 53.516 (48.032)	Top-5 acc 75.391 (71.609)	lr 0.02201
Train [27][3130/3239]	Time 0.744 (0.906)	Data Time 0.001 (0.009)	Loss 3.2309 (3.1772)	Entropy 0.81487 (0.82975)	Top-1 acc 49.609 (48.029)	Top-5 acc 70.312 (71.606)	lr 0.02201
Train [27][3140/3239]	Time 0.618 (0.906)	Data Time 0.002 (0.009)	Loss 3.2687 (3.1772)	Entropy 0.81498 (0.82971)	Top-1 acc 47.266 (48.028)	Top-5 acc 70.703 (71.607)	lr 0.02201
Train [27][3150/3239]	Time 0.593 (0.906)	Data Time 0.001 (0.009)	Loss 3.1772 (3.1773)	Entropy 0.81487 (0.82966)	Top-1 acc 51.172 (48.026)	Top-5 acc 75.000 (71.608)	lr 0.02201
Train [27][3160/3239]	Time 0.593 (0.905)	Data Time 0.001 (0.009)	Loss 3.1158 (3.1772)	Entropy 0.81475 (0.82961)	Top-1 acc 50.781 (48.027)	Top-5 acc 73.828 (71.607)	lr 0.02201
Train [27][3170/3239]	Time 0.639 (0.905)	Data Time 0.001 (0.009)	Loss 3.2299 (3.1772)	Entropy 0.81432 (0.82957)	Top-1 acc 40.625 (48.026)	Top-5 acc 71.484 (71.607)	lr 0.02201
Train [27][3180/3239]	Time 0.609 (0.905)	Data Time 0.000 (0.009)	Loss 3.1461 (3.1769)	Entropy 0.81444 (0.82952)	Top-1 acc 48.828 (48.029)	Top-5 acc 74.609 (71.611)	lr 0.02201
Train [27][3190/3239]	Time 0.633 (0.905)	Data Time 0.000 (0.009)	Loss 3.2155 (3.1769)	Entropy 0.81436 (0.82947)	Top-1 acc 48.438 (48.031)	Top-5 acc 71.875 (71.612)	lr 0.02201
Train [27][3200/3239]	Time 0.696 (0.905)	Data Time 0.000 (0.009)	Loss 3.2314 (3.1768)	Entropy 0.81441 (0.82942)	Top-1 acc 46.094 (48.033)	Top-5 acc 70.312 (71.614)	lr 0.02201
Train [27][3210/3239]	Time 0.567 (0.905)	Data Time 0.000 (0.009)	Loss 3.1417 (3.1769)	Entropy 0.81454 (0.82938)	Top-1 acc 48.047 (48.032)	Top-5 acc 74.219 (71.615)	lr 0.02201
Train [27][3220/3239]	Time 0.631 (0.904)	Data Time 0.000 (0.008)	Loss 3.2962 (3.1770)	Entropy 0.81451 (0.82933)	Top-1 acc 46.094 (48.026)	Top-5 acc 70.312 (71.611)	lr 0.02201
Train [27][3230/3239]	Time 0.584 (0.904)	Data Time 0.000 (0.008)	Loss 3.1168 (3.1770)	Entropy 0.81456 (0.82929)	Top-1 acc 48.438 (48.029)	Top-5 acc 72.266 (71.613)	lr 0.02201
Train [27][3239/3239]	Time 1.558 (0.904)	Data Time 0.000 (0.008)	Loss 3.1729 (3.1772)	Entropy 0.81437 (0.82924)	Top-1 acc 48.148 (48.026)	Top-5 acc 80.247 (71.609)	lr 0.02201
==========Valid [27/120]	loss 1.895	top-1 acc 57.706 (57.706)	top-5 acc 80.187	Train top-1 48.026	top-5 71.609	Entropy 0.81437	Latency-None: 0.000ms	Flops: 539.76M
Train [28][0/3239]	Time 25.835 (25.835)	Data Time 24.552 (24.552)	Loss 3.4707 (3.4707)	Entropy 0.81440 (0.81440)	Top-1 acc 40.234 (40.234)	Top-5 acc 64.453 (64.453)	lr 0.02201
Train [28][10/3239]	Time 0.594 (3.209)	Data Time 0.001 (2.234)	Loss 2.8980 (3.1576)	Entropy 0.81435 (0.81439)	Top-1 acc 47.656 (47.124)	Top-5 acc 74.609 (71.555)	lr 0.02200
Train [28][20/3239]	Time 0.638 (2.084)	Data Time 0.002 (1.171)	Loss 3.1543 (3.1782)	Entropy 0.81457 (0.81445)	Top-1 acc 46.875 (46.968)	Top-5 acc 70.703 (71.038)	lr 0.02200
Train [28][30/3239]	Time 0.703 (1.694)	Data Time 0.001 (0.794)	Loss 3.0944 (3.1499)	Entropy 0.81477 (0.81453)	Top-1 acc 48.828 (47.959)	Top-5 acc 71.094 (71.623)	lr 0.02200
Train [28][40/3239]	Time 0.642 (1.493)	Data Time 0.001 (0.601)	Loss 2.9264 (3.1457)	Entropy 0.81454 (0.81455)	Top-1 acc 56.250 (48.447)	Top-5 acc 73.438 (71.885)	lr 0.02200
Train [28][50/3239]	Time 0.560 (1.364)	Data Time 0.001 (0.483)	Loss 3.2513 (3.1412)	Entropy 0.81484 (0.81458)	Top-1 acc 46.875 (48.729)	Top-5 acc 67.188 (72.044)	lr 0.02200
Train [28][60/3239]	Time 0.585 (1.277)	Data Time 0.001 (0.404)	Loss 3.3252 (3.1461)	Entropy 0.81491 (0.81463)	Top-1 acc 42.969 (48.546)	Top-5 acc 70.703 (71.933)	lr 0.02200
Train [28][70/3239]	Time 0.467 (1.210)	Data Time 0.001 (0.348)	Loss 3.1544 (3.1481)	Entropy 0.81475 (0.81466)	Top-1 acc 52.734 (48.449)	Top-5 acc 69.922 (72.013)	lr 0.02200
Train [28][80/3239]	Time 0.611 (1.168)	Data Time 0.003 (0.305)	Loss 3.3968 (3.1424)	Entropy 0.81456 (0.81467)	Top-1 acc 42.188 (48.717)	Top-5 acc 67.188 (72.184)	lr 0.02200
Train [28][90/3239]	Time 0.629 (1.135)	Data Time 0.001 (0.272)	Loss 3.2459 (3.1392)	Entropy 0.81450 (0.81464)	Top-1 acc 42.188 (48.725)	Top-5 acc 70.312 (72.257)	lr 0.02200
Train [28][100/3239]	Time 0.596 (1.108)	Data Time 0.001 (0.245)	Loss 3.3737 (3.1413)	Entropy 0.81436 (0.81463)	Top-1 acc 43.359 (48.793)	Top-5 acc 67.188 (72.235)	lr 0.02200
Train [28][110/3239]	Time 0.644 (1.085)	Data Time 0.001 (0.223)	Loss 3.0968 (3.1422)	Entropy 0.81454 (0.81461)	Top-1 acc 48.438 (48.705)	Top-5 acc 72.656 (72.245)	lr 0.02200
Train [28][120/3239]	Time 0.598 (1.066)	Data Time 0.001 (0.205)	Loss 3.0904 (3.1493)	Entropy 0.81486 (0.81461)	Top-1 acc 48.828 (48.638)	Top-5 acc 75.781 (72.156)	lr 0.02200
Train [28][130/3239]	Time 0.599 (1.049)	Data Time 0.001 (0.189)	Loss 3.0269 (3.1430)	Entropy 0.81466 (0.81462)	Top-1 acc 53.516 (48.783)	Top-5 acc 71.484 (72.212)	lr 0.02200
Train [28][140/3239]	Time 0.630 (1.035)	Data Time 0.001 (0.176)	Loss 3.1501 (3.1395)	Entropy 0.81483 (0.81463)	Top-1 acc 49.609 (48.956)	Top-5 acc 71.094 (72.260)	lr 0.02200
Train [28][150/3239]	Time 0.628 (1.024)	Data Time 0.001 (0.164)	Loss 3.1266 (3.1388)	Entropy 0.81489 (0.81464)	Top-1 acc 47.266 (48.999)	Top-5 acc 71.875 (72.284)	lr 0.02200
Train [28][160/3239]	Time 0.593 (1.013)	Data Time 0.001 (0.154)	Loss 3.1477 (3.1415)	Entropy 0.81471 (0.81466)	Top-1 acc 48.047 (48.935)	Top-5 acc 70.703 (72.188)	lr 0.02199
Train [28][170/3239]	Time 0.570 (1.005)	Data Time 0.001 (0.145)	Loss 3.0679 (3.1374)	Entropy 0.81466 (0.81466)	Top-1 acc 51.172 (49.045)	Top-5 acc 73.828 (72.307)	lr 0.02199
Train [28][180/3239]	Time 0.648 (0.997)	Data Time 0.001 (0.137)	Loss 3.1189 (3.1383)	Entropy 0.81451 (0.81465)	Top-1 acc 49.609 (49.029)	Top-5 acc 71.484 (72.298)	lr 0.02199
Train [28][190/3239]	Time 0.737 (0.991)	Data Time 0.001 (0.130)	Loss 3.1388 (3.1409)	Entropy 0.81469 (0.81465)	Top-1 acc 50.000 (48.977)	Top-5 acc 73.047 (72.274)	lr 0.02199
Train [28][200/3239]	Time 0.611 (0.984)	Data Time 0.001 (0.124)	Loss 3.1646 (3.1413)	Entropy 0.81457 (0.81465)	Top-1 acc 49.219 (48.974)	Top-5 acc 72.266 (72.266)	lr 0.02199
Train [28][210/3239]	Time 0.594 (0.978)	Data Time 0.001 (0.118)	Loss 2.9129 (3.1406)	Entropy 0.81446 (0.81464)	Top-1 acc 52.344 (48.906)	Top-5 acc 77.344 (72.330)	lr 0.02199
Train [28][220/3239]	Time 0.603 (0.973)	Data Time 0.001 (0.113)	Loss 3.1623 (3.1399)	Entropy 0.81450 (0.81464)	Top-1 acc 51.172 (48.994)	Top-5 acc 70.312 (72.285)	lr 0.02199
Train [28][230/3239]	Time 0.609 (0.967)	Data Time 0.001 (0.108)	Loss 3.1146 (3.1413)	Entropy 0.81454 (0.81463)	Top-1 acc 48.828 (48.977)	Top-5 acc 71.875 (72.215)	lr 0.02199
Train [28][240/3239]	Time 0.551 (0.961)	Data Time 0.001 (0.104)	Loss 3.2409 (3.1406)	Entropy 0.81485 (0.81463)	Top-1 acc 48.438 (48.977)	Top-5 acc 70.312 (72.214)	lr 0.02199
Train [28][250/3239]	Time 0.619 (0.956)	Data Time 0.001 (0.100)	Loss 3.1982 (3.1420)	Entropy 0.81462 (0.81464)	Top-1 acc 49.609 (48.939)	Top-5 acc 71.484 (72.194)	lr 0.02199
Train [28][260/3239]	Time 0.723 (1.044)	Data Time 0.005 (0.096)	Loss 3.1442 (3.1421)	Entropy 0.81473 (0.81464)	Top-1 acc 50.781 (48.954)	Top-5 acc 72.266 (72.192)	lr 0.02199
Train [28][270/3239]	Time 0.587 (1.039)	Data Time 0.002 (0.092)	Loss 3.1481 (3.1439)	Entropy 0.81446 (0.81464)	Top-1 acc 50.000 (48.928)	Top-5 acc 74.219 (72.168)	lr 0.02199
Train [28][280/3239]	Time 0.630 (1.032)	Data Time 0.001 (0.089)	Loss 3.1121 (3.1429)	Entropy 0.81487 (0.81464)	Top-1 acc 48.828 (48.956)	Top-5 acc 73.047 (72.192)	lr 0.02199
Train [28][290/3239]	Time 0.612 (1.026)	Data Time 0.001 (0.086)	Loss 3.1633 (3.1419)	Entropy 0.81456 (0.81465)	Top-1 acc 46.484 (48.945)	Top-5 acc 74.219 (72.201)	lr 0.02199
Train [28][300/3239]	Time 0.586 (1.021)	Data Time 0.001 (0.083)	Loss 3.2443 (3.1422)	Entropy 0.81459 (0.81464)	Top-1 acc 48.047 (48.958)	Top-5 acc 69.531 (72.196)	lr 0.02199
Train [28][310/3239]	Time 0.619 (1.016)	Data Time 0.001 (0.081)	Loss 3.1921 (3.1417)	Entropy 0.81461 (0.81464)	Top-1 acc 50.000 (48.998)	Top-5 acc 69.531 (72.217)	lr 0.02198
Train [28][320/3239]	Time 0.593 (1.010)	Data Time 0.001 (0.078)	Loss 3.1916 (3.1415)	Entropy 0.81450 (0.81464)	Top-1 acc 48.828 (49.017)	Top-5 acc 73.047 (72.223)	lr 0.02198
Train [28][330/3239]	Time 0.619 (1.006)	Data Time 0.001 (0.076)	Loss 3.1085 (3.1425)	Entropy 0.81460 (0.81464)	Top-1 acc 51.562 (48.977)	Top-5 acc 71.875 (72.189)	lr 0.02198
Train [28][340/3239]	Time 0.510 (1.002)	Data Time 0.001 (0.074)	Loss 3.0824 (3.1414)	Entropy 0.81448 (0.81463)	Top-1 acc 52.734 (49.007)	Top-5 acc 74.219 (72.234)	lr 0.02198
Train [28][350/3239]	Time 0.693 (0.998)	Data Time 0.002 (0.072)	Loss 3.0107 (3.1406)	Entropy 0.81491 (0.81463)	Top-1 acc 50.000 (49.022)	Top-5 acc 74.219 (72.242)	lr 0.02198
Train [28][360/3239]	Time 0.610 (0.993)	Data Time 0.001 (0.070)	Loss 3.0171 (3.1397)	Entropy 0.81478 (0.81464)	Top-1 acc 54.688 (49.048)	Top-5 acc 75.000 (72.262)	lr 0.02198
Train [28][370/3239]	Time 0.595 (0.989)	Data Time 0.001 (0.068)	Loss 2.8643 (3.1388)	Entropy 0.81453 (0.81464)	Top-1 acc 54.297 (49.072)	Top-5 acc 78.906 (72.277)	lr 0.02198
Train [28][380/3239]	Time 0.610 (0.986)	Data Time 0.001 (0.066)	Loss 3.1368 (3.1393)	Entropy 0.81455 (0.81464)	Top-1 acc 50.391 (49.052)	Top-5 acc 71.484 (72.272)	lr 0.02198
Train [28][390/3239]	Time 0.633 (0.983)	Data Time 0.001 (0.065)	Loss 3.2589 (3.1407)	Entropy 0.81457 (0.81464)	Top-1 acc 48.047 (49.012)	Top-5 acc 70.703 (72.273)	lr 0.02198
Train [28][400/3239]	Time 0.575 (0.980)	Data Time 0.001 (0.063)	Loss 3.3192 (3.1413)	Entropy 0.81455 (0.81464)	Top-1 acc 43.750 (48.993)	Top-5 acc 70.312 (72.266)	lr 0.02198
Train [28][410/3239]	Time 0.568 (0.977)	Data Time 0.001 (0.062)	Loss 3.2224 (3.1415)	Entropy 0.81475 (0.81464)	Top-1 acc 50.781 (48.988)	Top-5 acc 73.828 (72.266)	lr 0.02198
Train [28][420/3239]	Time 0.675 (0.974)	Data Time 0.001 (0.060)	Loss 3.0358 (3.1391)	Entropy 0.81459 (0.81464)	Top-1 acc 52.734 (49.035)	Top-5 acc 74.609 (72.317)	lr 0.02198
Train [28][430/3239]	Time 0.610 (0.971)	Data Time 0.001 (0.059)	Loss 3.3225 (3.1386)	Entropy 0.81470 (0.81464)	Top-1 acc 47.656 (49.061)	Top-5 acc 65.625 (72.333)	lr 0.02198
Train [28][440/3239]	Time 0.651 (0.969)	Data Time 0.001 (0.058)	Loss 3.0794 (3.1403)	Entropy 0.81468 (0.81464)	Top-1 acc 51.172 (49.016)	Top-5 acc 73.438 (72.289)	lr 0.02198
Train [28][450/3239]	Time 0.603 (0.967)	Data Time 0.001 (0.056)	Loss 3.1321 (3.1396)	Entropy 0.81471 (0.81464)	Top-1 acc 54.688 (49.019)	Top-5 acc 73.047 (72.307)	lr 0.02198
Train [28][460/3239]	Time 0.591 (0.965)	Data Time 0.001 (0.055)	Loss 3.3228 (3.1401)	Entropy 0.81478 (0.81464)	Top-1 acc 42.969 (48.986)	Top-5 acc 66.406 (72.292)	lr 0.02197
Train [28][470/3239]	Time 0.617 (0.963)	Data Time 0.001 (0.054)	Loss 2.9784 (3.1394)	Entropy 0.81490 (0.81465)	Top-1 acc 55.078 (48.988)	Top-5 acc 77.734 (72.318)	lr 0.02197
Train [28][480/3239]	Time 0.630 (0.960)	Data Time 0.001 (0.053)	Loss 3.0581 (3.1381)	Entropy 0.81474 (0.81465)	Top-1 acc 50.781 (49.025)	Top-5 acc 75.000 (72.332)	lr 0.02197
Train [28][490/3239]	Time 0.595 (0.959)	Data Time 0.001 (0.052)	Loss 3.2459 (3.1388)	Entropy 0.81448 (0.81465)	Top-1 acc 48.047 (49.016)	Top-5 acc 70.312 (72.308)	lr 0.02197
Train [28][500/3239]	Time 0.583 (0.956)	Data Time 0.001 (0.051)	Loss 3.3398 (3.1395)	Entropy 0.81415 (0.81465)	Top-1 acc 45.703 (48.993)	Top-5 acc 66.797 (72.307)	lr 0.02197
Train [28][510/3239]	Time 0.679 (0.955)	Data Time 0.001 (0.050)	Loss 3.3978 (3.1402)	Entropy 0.81391 (0.81464)	Top-1 acc 42.188 (48.975)	Top-5 acc 69.141 (72.286)	lr 0.02197
Train [28][520/3239]	Time 0.604 (0.953)	Data Time 0.001 (0.049)	Loss 2.9903 (3.1386)	Entropy 0.81361 (0.81462)	Top-1 acc 51.953 (48.976)	Top-5 acc 73.438 (72.304)	lr 0.02197
Train [28][530/3239]	Time 0.609 (0.951)	Data Time 0.001 (0.048)	Loss 3.1654 (3.1396)	Entropy 0.81387 (0.81460)	Top-1 acc 49.219 (48.936)	Top-5 acc 69.531 (72.274)	lr 0.02197
Train [28][540/3239]	Time 0.629 (0.949)	Data Time 0.002 (0.047)	Loss 3.2434 (3.1402)	Entropy 0.81390 (0.81459)	Top-1 acc 45.312 (48.922)	Top-5 acc 71.484 (72.273)	lr 0.02197
Train [28][550/3239]	Time 0.594 (0.947)	Data Time 0.001 (0.046)	Loss 3.2105 (3.1395)	Entropy 0.81370 (0.81457)	Top-1 acc 49.219 (48.945)	Top-5 acc 71.094 (72.288)	lr 0.02197
Train [28][560/3239]	Time 0.607 (0.946)	Data Time 0.001 (0.046)	Loss 3.0513 (3.1402)	Entropy 0.81391 (0.81456)	Top-1 acc 52.344 (48.941)	Top-5 acc 74.219 (72.271)	lr 0.02197
Train [28][570/3239]	Time 0.618 (0.944)	Data Time 0.001 (0.045)	Loss 3.4760 (3.1410)	Entropy 0.81348 (0.81455)	Top-1 acc 44.141 (48.922)	Top-5 acc 67.188 (72.262)	lr 0.02197
Train [28][580/3239]	Time 0.689 (0.943)	Data Time 0.001 (0.044)	Loss 3.1713 (3.1418)	Entropy 0.81317 (0.81453)	Top-1 acc 48.047 (48.914)	Top-5 acc 73.047 (72.250)	lr 0.02197
Train [28][590/3239]	Time 0.603 (0.942)	Data Time 0.001 (0.043)	Loss 3.2643 (3.1431)	Entropy 0.81319 (0.81450)	Top-1 acc 44.141 (48.879)	Top-5 acc 67.578 (72.207)	lr 0.02197
Train [28][600/3239]	Time 0.632 (0.940)	Data Time 0.003 (0.043)	Loss 3.0299 (3.1434)	Entropy 0.81367 (0.81448)	Top-1 acc 49.609 (48.868)	Top-5 acc 73.047 (72.186)	lr 0.02197
Train [28][610/3239]	Time 0.636 (0.939)	Data Time 0.001 (0.042)	Loss 3.2132 (3.1432)	Entropy 0.81343 (0.81447)	Top-1 acc 46.484 (48.857)	Top-5 acc 70.312 (72.191)	lr 0.02196
Train [28][620/3239]	Time 0.579 (0.938)	Data Time 0.001 (0.041)	Loss 3.2309 (3.1428)	Entropy 0.81295 (0.81445)	Top-1 acc 45.703 (48.856)	Top-5 acc 67.578 (72.191)	lr 0.02196
Train [28][630/3239]	Time 0.615 (0.937)	Data Time 0.001 (0.041)	Loss 3.0789 (3.1425)	Entropy 0.81276 (0.81442)	Top-1 acc 48.047 (48.866)	Top-5 acc 75.000 (72.203)	lr 0.02196
Train [28][640/3239]	Time 0.597 (0.935)	Data Time 0.001 (0.040)	Loss 3.2366 (3.1438)	Entropy 0.81246 (0.81440)	Top-1 acc 44.531 (48.843)	Top-5 acc 73.047 (72.168)	lr 0.02196
Train [28][650/3239]	Time 0.621 (0.934)	Data Time 0.001 (0.040)	Loss 3.0428 (3.1445)	Entropy 0.81209 (0.81436)	Top-1 acc 53.906 (48.813)	Top-5 acc 76.562 (72.149)	lr 0.02196
Train [28][660/3239]	Time 0.604 (0.933)	Data Time 0.001 (0.039)	Loss 3.1547 (3.1448)	Entropy 0.81202 (0.81433)	Top-1 acc 46.094 (48.793)	Top-5 acc 73.047 (72.143)	lr 0.02196
Train [28][670/3239]	Time 0.584 (0.932)	Data Time 0.001 (0.038)	Loss 3.3905 (3.1454)	Entropy 0.81159 (0.81429)	Top-1 acc 42.188 (48.775)	Top-5 acc 66.016 (72.139)	lr 0.02196
Train [28][680/3239]	Time 0.596 (0.931)	Data Time 0.001 (0.038)	Loss 3.1560 (3.1453)	Entropy 0.81181 (0.81425)	Top-1 acc 45.312 (48.793)	Top-5 acc 75.000 (72.145)	lr 0.02196
Train [28][690/3239]	Time 0.591 (0.930)	Data Time 0.001 (0.037)	Loss 3.2440 (3.1457)	Entropy 0.81144 (0.81422)	Top-1 acc 46.484 (48.794)	Top-5 acc 70.312 (72.141)	lr 0.02196
Train [28][700/3239]	Time 0.588 (0.929)	Data Time 0.001 (0.037)	Loss 3.0691 (3.1461)	Entropy 0.81137 (0.81418)	Top-1 acc 51.172 (48.788)	Top-5 acc 74.609 (72.137)	lr 0.02196
Train [28][710/3239]	Time 0.641 (0.927)	Data Time 0.001 (0.036)	Loss 2.9447 (3.1461)	Entropy 0.81110 (0.81414)	Top-1 acc 53.516 (48.764)	Top-5 acc 75.391 (72.143)	lr 0.02196
Train [28][720/3239]	Time 0.630 (0.926)	Data Time 0.001 (0.036)	Loss 3.3102 (3.1467)	Entropy 0.81129 (0.81409)	Top-1 acc 42.969 (48.751)	Top-5 acc 69.922 (72.127)	lr 0.02196
Train [28][730/3239]	Time 0.652 (0.925)	Data Time 0.001 (0.035)	Loss 3.2714 (3.1470)	Entropy 0.81128 (0.81406)	Top-1 acc 47.656 (48.766)	Top-5 acc 66.797 (72.110)	lr 0.02196
Train [28][740/3239]	Time 0.697 (0.924)	Data Time 0.001 (0.035)	Loss 3.2516 (3.1470)	Entropy 0.81122 (0.81402)	Top-1 acc 48.047 (48.774)	Top-5 acc 69.922 (72.113)	lr 0.02196
Train [28][750/3239]	Time 0.610 (0.923)	Data Time 0.001 (0.035)	Loss 2.8750 (3.1483)	Entropy 0.81093 (0.81398)	Top-1 acc 54.297 (48.745)	Top-5 acc 77.734 (72.090)	lr 0.02196
Train [28][760/3239]	Time 0.591 (0.923)	Data Time 0.001 (0.034)	Loss 3.0478 (3.1481)	Entropy 0.81056 (0.81394)	Top-1 acc 51.953 (48.749)	Top-5 acc 74.219 (72.092)	lr 0.02196
Train [28][770/3239]	Time 0.603 (0.922)	Data Time 0.001 (0.034)	Loss 3.3860 (3.1490)	Entropy 0.81051 (0.81390)	Top-1 acc 46.094 (48.718)	Top-5 acc 69.531 (72.069)	lr 0.02195
Train [28][780/3239]	Time 0.624 (0.921)	Data Time 0.002 (0.033)	Loss 3.0363 (3.1494)	Entropy 0.80962 (0.81385)	Top-1 acc 50.000 (48.713)	Top-5 acc 75.000 (72.053)	lr 0.02195
Train [28][790/3239]	Time 0.614 (0.920)	Data Time 0.001 (0.033)	Loss 2.8099 (3.1497)	Entropy 0.80902 (0.81379)	Top-1 acc 58.594 (48.707)	Top-5 acc 77.344 (72.046)	lr 0.02195
Train [28][800/3239]	Time 0.595 (0.920)	Data Time 0.001 (0.033)	Loss 3.2125 (3.1500)	Entropy 0.80879 (0.81373)	Top-1 acc 46.094 (48.686)	Top-5 acc 71.094 (72.046)	lr 0.02195
Train [28][810/3239]	Time 0.695 (0.919)	Data Time 0.001 (0.032)	Loss 3.2404 (3.1503)	Entropy 0.80878 (0.81367)	Top-1 acc 46.094 (48.670)	Top-5 acc 69.531 (72.044)	lr 0.02195
Train [28][820/3239]	Time 0.602 (0.918)	Data Time 0.001 (0.032)	Loss 3.0701 (3.1500)	Entropy 0.80903 (0.81361)	Top-1 acc 53.125 (48.693)	Top-5 acc 73.047 (72.036)	lr 0.02195
Train [28][830/3239]	Time 0.622 (0.917)	Data Time 0.001 (0.031)	Loss 2.8348 (3.1490)	Entropy 0.80939 (0.81356)	Top-1 acc 57.422 (48.713)	Top-5 acc 80.078 (72.061)	lr 0.02195
Train [28][840/3239]	Time 0.623 (0.917)	Data Time 0.001 (0.031)	Loss 3.0369 (3.1486)	Entropy 0.80955 (0.81351)	Top-1 acc 51.953 (48.727)	Top-5 acc 73.047 (72.071)	lr 0.02195
Train [28][850/3239]	Time 0.572 (0.916)	Data Time 0.001 (0.031)	Loss 3.2613 (3.1480)	Entropy 0.80954 (0.81346)	Top-1 acc 47.656 (48.729)	Top-5 acc 69.922 (72.086)	lr 0.02195
Train [28][860/3239]	Time 0.654 (0.916)	Data Time 0.001 (0.030)	Loss 3.0493 (3.1483)	Entropy 0.80950 (0.81342)	Top-1 acc 46.094 (48.722)	Top-5 acc 75.781 (72.084)	lr 0.02195
Train [28][870/3239]	Time 0.606 (0.915)	Data Time 0.001 (0.030)	Loss 2.9115 (3.1484)	Entropy 0.80964 (0.81337)	Top-1 acc 55.859 (48.720)	Top-5 acc 75.781 (72.086)	lr 0.02195
Train [28][880/3239]	Time 0.558 (0.914)	Data Time 0.001 (0.030)	Loss 3.0961 (3.1480)	Entropy 0.80968 (0.81333)	Top-1 acc 49.609 (48.733)	Top-5 acc 73.828 (72.090)	lr 0.02195
Train [28][890/3239]	Time 0.595 (0.913)	Data Time 0.001 (0.029)	Loss 3.1847 (3.1481)	Entropy 0.80970 (0.81329)	Top-1 acc 48.828 (48.722)	Top-5 acc 70.312 (72.087)	lr 0.02195
Train [28][900/3239]	Time 0.683 (0.913)	Data Time 0.001 (0.029)	Loss 3.1925 (3.1482)	Entropy 0.80982 (0.81325)	Top-1 acc 44.141 (48.718)	Top-5 acc 67.578 (72.084)	lr 0.02195
Train [28][910/3239]	Time 0.614 (0.912)	Data Time 0.001 (0.029)	Loss 3.1634 (3.1478)	Entropy 0.80998 (0.81322)	Top-1 acc 48.438 (48.727)	Top-5 acc 75.781 (72.096)	lr 0.02195
Train [28][920/3239]	Time 0.593 (0.937)	Data Time 0.002 (0.029)	Loss 2.9873 (3.1478)	Entropy 0.80981 (0.81318)	Top-1 acc 50.781 (48.724)	Top-5 acc 75.391 (72.099)	lr 0.02194
Train [28][930/3239]	Time 0.605 (0.937)	Data Time 0.002 (0.028)	Loss 3.1466 (3.1464)	Entropy 0.80955 (0.81314)	Top-1 acc 51.562 (48.740)	Top-5 acc 71.875 (72.129)	lr 0.02194
Train [28][940/3239]	Time 0.594 (0.936)	Data Time 0.001 (0.028)	Loss 3.2838 (3.1462)	Entropy 0.80990 (0.81310)	Top-1 acc 44.141 (48.749)	Top-5 acc 70.703 (72.130)	lr 0.02194
Train [28][950/3239]	Time 0.588 (0.935)	Data Time 0.001 (0.028)	Loss 3.3135 (3.1470)	Entropy 0.80974 (0.81307)	Top-1 acc 45.703 (48.731)	Top-5 acc 69.922 (72.116)	lr 0.02194
Train [28][960/3239]	Time 0.603 (0.935)	Data Time 0.001 (0.028)	Loss 3.0663 (3.1470)	Entropy 0.80962 (0.81304)	Top-1 acc 55.469 (48.743)	Top-5 acc 71.484 (72.107)	lr 0.02194
Train [28][970/3239]	Time 0.696 (0.934)	Data Time 0.001 (0.027)	Loss 2.8641 (3.1471)	Entropy 0.80942 (0.81300)	Top-1 acc 54.688 (48.745)	Top-5 acc 80.078 (72.107)	lr 0.02194
Train [28][980/3239]	Time 0.602 (0.933)	Data Time 0.001 (0.027)	Loss 3.2174 (3.1473)	Entropy 0.80920 (0.81296)	Top-1 acc 43.359 (48.749)	Top-5 acc 66.797 (72.090)	lr 0.02194
Train [28][990/3239]	Time 0.610 (0.932)	Data Time 0.001 (0.027)	Loss 3.1183 (3.1470)	Entropy 0.80893 (0.81293)	Top-1 acc 51.953 (48.758)	Top-5 acc 76.562 (72.108)	lr 0.02194
Train [28][1000/3239]	Time 0.615 (0.932)	Data Time 0.002 (0.027)	Loss 3.1785 (3.1468)	Entropy 0.80901 (0.81289)	Top-1 acc 46.875 (48.748)	Top-5 acc 73.828 (72.115)	lr 0.02194
Train [28][1010/3239]	Time 0.470 (0.931)	Data Time 0.001 (0.026)	Loss 3.1677 (3.1468)	Entropy 0.80896 (0.81285)	Top-1 acc 49.219 (48.752)	Top-5 acc 73.438 (72.117)	lr 0.02194
Train [28][1020/3239]	Time 0.597 (0.930)	Data Time 0.001 (0.026)	Loss 3.1921 (3.1471)	Entropy 0.80890 (0.81281)	Top-1 acc 48.438 (48.738)	Top-5 acc 69.922 (72.106)	lr 0.02194
Train [28][1030/3239]	Time 0.638 (0.929)	Data Time 0.001 (0.026)	Loss 3.0673 (3.1472)	Entropy 0.80884 (0.81277)	Top-1 acc 46.094 (48.729)	Top-5 acc 78.125 (72.106)	lr 0.02194
Train [28][1040/3239]	Time 0.613 (0.929)	Data Time 0.001 (0.026)	Loss 2.9197 (3.1466)	Entropy 0.80837 (0.81273)	Top-1 acc 56.641 (48.746)	Top-5 acc 77.344 (72.121)	lr 0.02194
Train [28][1050/3239]	Time 0.634 (0.928)	Data Time 0.001 (0.025)	Loss 3.2200 (3.1472)	Entropy 0.80857 (0.81269)	Top-1 acc 46.094 (48.732)	Top-5 acc 71.875 (72.107)	lr 0.02194
Train [28][1060/3239]	Time 0.695 (0.927)	Data Time 0.001 (0.025)	Loss 3.4459 (3.1485)	Entropy 0.80864 (0.81265)	Top-1 acc 44.141 (48.697)	Top-5 acc 65.625 (72.073)	lr 0.02194
Train [28][1070/3239]	Time 0.606 (0.927)	Data Time 0.001 (0.025)	Loss 3.3252 (3.1490)	Entropy 0.80846 (0.81262)	Top-1 acc 44.141 (48.688)	Top-5 acc 67.578 (72.069)	lr 0.02193
Train [28][1080/3239]	Time 0.649 (0.926)	Data Time 0.001 (0.025)	Loss 3.0722 (3.1497)	Entropy 0.80839 (0.81258)	Top-1 acc 47.266 (48.676)	Top-5 acc 70.312 (72.054)	lr 0.02193
Train [28][1090/3239]	Time 0.564 (0.926)	Data Time 0.001 (0.024)	Loss 3.2516 (3.1496)	Entropy 0.80807 (0.81254)	Top-1 acc 46.094 (48.683)	Top-5 acc 73.047 (72.058)	lr 0.02193
Train [28][1100/3239]	Time 0.639 (0.925)	Data Time 0.001 (0.024)	Loss 3.4210 (3.1499)	Entropy 0.80801 (0.81250)	Top-1 acc 44.922 (48.678)	Top-5 acc 69.141 (72.056)	lr 0.02193
Train [28][1110/3239]	Time 0.609 (0.924)	Data Time 0.001 (0.024)	Loss 3.0568 (3.1499)	Entropy 0.80785 (0.81246)	Top-1 acc 50.391 (48.675)	Top-5 acc 74.609 (72.055)	lr 0.02193
Train [28][1120/3239]	Time 0.617 (0.924)	Data Time 0.001 (0.024)	Loss 2.9996 (3.1490)	Entropy 0.80813 (0.81242)	Top-1 acc 50.391 (48.694)	Top-5 acc 76.953 (72.078)	lr 0.02193
Train [28][1130/3239]	Time 0.711 (0.923)	Data Time 0.002 (0.024)	Loss 2.8980 (3.1485)	Entropy 0.80794 (0.81238)	Top-1 acc 53.516 (48.705)	Top-5 acc 78.125 (72.090)	lr 0.02193
Train [28][1140/3239]	Time 0.607 (0.923)	Data Time 0.001 (0.023)	Loss 3.2811 (3.1493)	Entropy 0.80787 (0.81234)	Top-1 acc 46.484 (48.689)	Top-5 acc 66.406 (72.072)	lr 0.02193
Train [28][1150/3239]	Time 0.608 (0.922)	Data Time 0.002 (0.023)	Loss 3.1513 (3.1494)	Entropy 0.80758 (0.81230)	Top-1 acc 47.266 (48.687)	Top-5 acc 70.703 (72.063)	lr 0.02193
Train [28][1160/3239]	Time 0.591 (0.922)	Data Time 0.001 (0.023)	Loss 3.2029 (3.1502)	Entropy 0.80726 (0.81226)	Top-1 acc 48.828 (48.673)	Top-5 acc 68.359 (72.047)	lr 0.02193
Train [28][1170/3239]	Time 0.624 (0.921)	Data Time 0.001 (0.023)	Loss 3.1242 (3.1502)	Entropy 0.80732 (0.81221)	Top-1 acc 50.000 (48.683)	Top-5 acc 71.484 (72.043)	lr 0.02193
Train [28][1180/3239]	Time 0.573 (0.920)	Data Time 0.001 (0.023)	Loss 3.1129 (3.1506)	Entropy 0.80709 (0.81217)	Top-1 acc 50.391 (48.673)	Top-5 acc 70.703 (72.037)	lr 0.02193
Train [28][1190/3239]	Time 0.598 (0.919)	Data Time 0.001 (0.023)	Loss 3.0675 (3.1509)	Entropy 0.80755 (0.81213)	Top-1 acc 50.000 (48.664)	Top-5 acc 73.828 (72.035)	lr 0.02193
Train [28][1200/3239]	Time 0.623 (0.919)	Data Time 0.001 (0.022)	Loss 3.3390 (3.1517)	Entropy 0.80768 (0.81209)	Top-1 acc 43.750 (48.644)	Top-5 acc 67.578 (72.016)	lr 0.02193
Train [28][1210/3239]	Time 0.641 (0.919)	Data Time 0.002 (0.022)	Loss 3.1439 (3.1520)	Entropy 0.80780 (0.81206)	Top-1 acc 48.047 (48.641)	Top-5 acc 75.000 (72.012)	lr 0.02193
Train [28][1220/3239]	Time 0.594 (0.918)	Data Time 0.001 (0.022)	Loss 2.7806 (3.1517)	Entropy 0.80801 (0.81202)	Top-1 acc 57.422 (48.653)	Top-5 acc 78.906 (72.019)	lr 0.02192
Train [28][1230/3239]	Time 0.632 (0.918)	Data Time 0.001 (0.022)	Loss 3.5025 (3.1519)	Entropy 0.80763 (0.81199)	Top-1 acc 42.188 (48.652)	Top-5 acc 64.844 (72.018)	lr 0.02192
Train [28][1240/3239]	Time 0.571 (0.917)	Data Time 0.002 (0.022)	Loss 3.0425 (3.1522)	Entropy 0.80743 (0.81195)	Top-1 acc 50.781 (48.643)	Top-5 acc 76.172 (72.009)	lr 0.02192
Train [28][1250/3239]	Time 0.559 (0.917)	Data Time 0.001 (0.022)	Loss 3.0292 (3.1516)	Entropy 0.80748 (0.81192)	Top-1 acc 50.781 (48.650)	Top-5 acc 74.609 (72.019)	lr 0.02192
Train [28][1260/3239]	Time 0.611 (0.916)	Data Time 0.001 (0.021)	Loss 3.2128 (3.1523)	Entropy 0.80736 (0.81188)	Top-1 acc 47.656 (48.627)	Top-5 acc 73.438 (72.013)	lr 0.02192
Train [28][1270/3239]	Time 0.622 (0.916)	Data Time 0.001 (0.021)	Loss 3.1714 (3.1525)	Entropy 0.80738 (0.81184)	Top-1 acc 50.781 (48.617)	Top-5 acc 71.875 (72.006)	lr 0.02192
Train [28][1280/3239]	Time 0.616 (0.915)	Data Time 0.001 (0.021)	Loss 3.3485 (3.1531)	Entropy 0.80726 (0.81181)	Top-1 acc 41.797 (48.593)	Top-5 acc 67.578 (71.990)	lr 0.02192
Train [28][1290/3239]	Time 0.749 (0.915)	Data Time 0.001 (0.021)	Loss 2.9684 (3.1526)	Entropy 0.80710 (0.81177)	Top-1 acc 52.344 (48.602)	Top-5 acc 75.391 (72.001)	lr 0.02192
Train [28][1300/3239]	Time 0.616 (0.914)	Data Time 0.002 (0.021)	Loss 3.1691 (3.1534)	Entropy 0.80714 (0.81174)	Top-1 acc 49.219 (48.585)	Top-5 acc 72.656 (71.990)	lr 0.02192
Train [28][1310/3239]	Time 0.620 (0.914)	Data Time 0.001 (0.021)	Loss 3.0793 (3.1532)	Entropy 0.80685 (0.81170)	Top-1 acc 50.000 (48.582)	Top-5 acc 73.828 (71.995)	lr 0.02192
Train [28][1320/3239]	Time 0.625 (0.914)	Data Time 0.001 (0.021)	Loss 2.9854 (3.1529)	Entropy 0.80630 (0.81166)	Top-1 acc 51.953 (48.592)	Top-5 acc 73.438 (72.003)	lr 0.02192
Train [28][1330/3239]	Time 0.587 (0.913)	Data Time 0.001 (0.020)	Loss 3.2363 (3.1531)	Entropy 0.80586 (0.81162)	Top-1 acc 45.703 (48.590)	Top-5 acc 69.141 (71.992)	lr 0.02192
Train [28][1340/3239]	Time 0.598 (0.913)	Data Time 0.001 (0.020)	Loss 3.1064 (3.1533)	Entropy 0.80610 (0.81158)	Top-1 acc 51.562 (48.593)	Top-5 acc 73.047 (71.990)	lr 0.02192
Train [28][1350/3239]	Time 0.525 (0.912)	Data Time 0.001 (0.020)	Loss 3.0792 (3.1534)	Entropy 0.80595 (0.81154)	Top-1 acc 51.562 (48.596)	Top-5 acc 73.438 (71.989)	lr 0.02192
Train [28][1360/3239]	Time 0.720 (0.911)	Data Time 0.001 (0.020)	Loss 3.0233 (3.1530)	Entropy 0.80592 (0.81150)	Top-1 acc 51.172 (48.607)	Top-5 acc 73.828 (72.002)	lr 0.02192
Train [28][1370/3239]	Time 0.626 (0.911)	Data Time 0.001 (0.020)	Loss 2.9973 (3.1525)	Entropy 0.80588 (0.81146)	Top-1 acc 54.297 (48.616)	Top-5 acc 76.562 (72.021)	lr 0.02191
Train [28][1380/3239]	Time 0.640 (0.911)	Data Time 0.001 (0.020)	Loss 3.1145 (3.1529)	Entropy 0.80610 (0.81142)	Top-1 acc 48.828 (48.605)	Top-5 acc 71.484 (72.011)	lr 0.02191
Train [28][1390/3239]	Time 0.634 (0.910)	Data Time 0.001 (0.020)	Loss 3.0721 (3.1529)	Entropy 0.80594 (0.81138)	Top-1 acc 46.484 (48.594)	Top-5 acc 74.609 (72.009)	lr 0.02191
Train [28][1400/3239]	Time 0.648 (0.910)	Data Time 0.001 (0.019)	Loss 3.1521 (3.1524)	Entropy 0.80582 (0.81134)	Top-1 acc 48.828 (48.609)	Top-5 acc 71.875 (72.028)	lr 0.02191
Train [28][1410/3239]	Time 0.616 (0.910)	Data Time 0.002 (0.019)	Loss 3.1924 (3.1521)	Entropy 0.80557 (0.81130)	Top-1 acc 45.703 (48.609)	Top-5 acc 73.047 (72.030)	lr 0.02191
Train [28][1420/3239]	Time 0.602 (0.909)	Data Time 0.001 (0.019)	Loss 3.0390 (3.1519)	Entropy 0.80561 (0.81126)	Top-1 acc 50.391 (48.612)	Top-5 acc 76.172 (72.038)	lr 0.02191
Train [28][1430/3239]	Time 0.584 (0.909)	Data Time 0.001 (0.019)	Loss 3.2519 (3.1520)	Entropy 0.80554 (0.81122)	Top-1 acc 46.484 (48.615)	Top-5 acc 70.703 (72.046)	lr 0.02191
Train [28][1440/3239]	Time 0.602 (0.909)	Data Time 0.001 (0.019)	Loss 3.1335 (3.1520)	Entropy 0.80541 (0.81118)	Top-1 acc 45.312 (48.614)	Top-5 acc 71.094 (72.043)	lr 0.02191
Train [28][1450/3239]	Time 0.708 (0.908)	Data Time 0.001 (0.019)	Loss 2.9543 (3.1520)	Entropy 0.80557 (0.81114)	Top-1 acc 52.344 (48.622)	Top-5 acc 76.953 (72.043)	lr 0.02191
Train [28][1460/3239]	Time 0.607 (0.908)	Data Time 0.001 (0.019)	Loss 3.2999 (3.1516)	Entropy 0.80552 (0.81110)	Top-1 acc 45.312 (48.632)	Top-5 acc 68.750 (72.053)	lr 0.02191
Train [28][1470/3239]	Time 0.603 (0.908)	Data Time 0.001 (0.019)	Loss 3.5239 (3.1518)	Entropy 0.80515 (0.81106)	Top-1 acc 43.359 (48.622)	Top-5 acc 65.234 (72.049)	lr 0.02191
Train [28][1480/3239]	Time 0.603 (0.908)	Data Time 0.001 (0.019)	Loss 3.2338 (3.1516)	Entropy 0.80565 (0.81103)	Top-1 acc 44.922 (48.627)	Top-5 acc 71.094 (72.052)	lr 0.02191
Train [28][1490/3239]	Time 0.616 (0.907)	Data Time 0.001 (0.018)	Loss 3.1392 (3.1516)	Entropy 0.80563 (0.81099)	Top-1 acc 51.172 (48.628)	Top-5 acc 71.484 (72.046)	lr 0.02191
Train [28][1500/3239]	Time 0.617 (0.907)	Data Time 0.001 (0.018)	Loss 2.9902 (3.1518)	Entropy 0.80568 (0.81095)	Top-1 acc 51.172 (48.633)	Top-5 acc 76.172 (72.038)	lr 0.02191
Train [28][1510/3239]	Time 0.635 (0.907)	Data Time 0.001 (0.018)	Loss 3.1251 (3.1520)	Entropy 0.80555 (0.81092)	Top-1 acc 49.609 (48.627)	Top-5 acc 74.219 (72.044)	lr 0.02191
Train [28][1520/3239]	Time 0.738 (0.906)	Data Time 0.001 (0.018)	Loss 3.1418 (3.1515)	Entropy 0.80546 (0.81088)	Top-1 acc 47.656 (48.637)	Top-5 acc 71.094 (72.055)	lr 0.02190
Train [28][1530/3239]	Time 0.617 (0.906)	Data Time 0.001 (0.018)	Loss 3.2124 (3.1518)	Entropy 0.80489 (0.81085)	Top-1 acc 47.656 (48.630)	Top-5 acc 73.047 (72.055)	lr 0.02190
Train [28][1540/3239]	Time 0.632 (0.905)	Data Time 0.001 (0.018)	Loss 3.0374 (3.1516)	Entropy 0.80495 (0.81081)	Top-1 acc 49.219 (48.627)	Top-5 acc 72.656 (72.057)	lr 0.02190
Train [28][1550/3239]	Time 0.616 (0.905)	Data Time 0.001 (0.018)	Loss 3.0305 (3.1513)	Entropy 0.80480 (0.81077)	Top-1 acc 52.734 (48.630)	Top-5 acc 73.438 (72.064)	lr 0.02190
Train [28][1560/3239]	Time 0.587 (0.905)	Data Time 0.001 (0.018)	Loss 3.2886 (3.1515)	Entropy 0.80452 (0.81073)	Top-1 acc 44.531 (48.625)	Top-5 acc 69.141 (72.065)	lr 0.02190
Train [28][1570/3239]	Time 0.808 (0.920)	Data Time 0.006 (0.018)	Loss 2.9232 (3.1514)	Entropy 0.80473 (0.81069)	Top-1 acc 50.000 (48.623)	Top-5 acc 76.953 (72.068)	lr 0.02190
Train [28][1580/3239]	Time 0.608 (0.920)	Data Time 0.003 (0.018)	Loss 2.9031 (3.1508)	Entropy 0.80453 (0.81065)	Top-1 acc 56.250 (48.640)	Top-5 acc 75.781 (72.085)	lr 0.02190
Train [28][1590/3239]	Time 0.595 (0.919)	Data Time 0.002 (0.017)	Loss 3.1932 (3.1509)	Entropy 0.80465 (0.81062)	Top-1 acc 45.703 (48.632)	Top-5 acc 69.922 (72.079)	lr 0.02190
Train [28][1600/3239]	Time 0.595 (0.919)	Data Time 0.001 (0.017)	Loss 2.9967 (3.1511)	Entropy 0.80480 (0.81058)	Top-1 acc 54.688 (48.631)	Top-5 acc 77.734 (72.079)	lr 0.02190
Train [28][1610/3239]	Time 0.689 (0.919)	Data Time 0.001 (0.017)	Loss 3.2024 (3.1510)	Entropy 0.80465 (0.81054)	Top-1 acc 44.141 (48.630)	Top-5 acc 71.875 (72.082)	lr 0.02190
Train [28][1620/3239]	Time 0.593 (0.918)	Data Time 0.001 (0.017)	Loss 2.8924 (3.1513)	Entropy 0.80431 (0.81050)	Top-1 acc 54.688 (48.624)	Top-5 acc 75.391 (72.071)	lr 0.02190
Train [28][1630/3239]	Time 0.582 (0.918)	Data Time 0.001 (0.017)	Loss 3.3804 (3.1512)	Entropy 0.80450 (0.81047)	Top-1 acc 42.188 (48.621)	Top-5 acc 72.266 (72.078)	lr 0.02190
Train [28][1640/3239]	Time 0.588 (0.918)	Data Time 0.001 (0.017)	Loss 3.2325 (3.1510)	Entropy 0.80404 (0.81043)	Top-1 acc 50.781 (48.622)	Top-5 acc 71.094 (72.080)	lr 0.02190
Train [28][1650/3239]	Time 0.534 (0.917)	Data Time 0.001 (0.017)	Loss 2.9795 (3.1513)	Entropy 0.80401 (0.81039)	Top-1 acc 55.078 (48.618)	Top-5 acc 76.953 (72.073)	lr 0.02190
Train [28][1660/3239]	Time 0.655 (0.917)	Data Time 0.001 (0.017)	Loss 3.1472 (3.1514)	Entropy 0.80394 (0.81035)	Top-1 acc 50.781 (48.617)	Top-5 acc 71.484 (72.071)	lr 0.02190
Train [28][1670/3239]	Time 0.612 (0.916)	Data Time 0.001 (0.017)	Loss 3.0750 (3.1512)	Entropy 0.80383 (0.81032)	Top-1 acc 50.000 (48.618)	Top-5 acc 73.047 (72.077)	lr 0.02189
Train [28][1680/3239]	Time 0.700 (0.916)	Data Time 0.001 (0.017)	Loss 3.2552 (3.1509)	Entropy 0.80362 (0.81027)	Top-1 acc 48.438 (48.626)	Top-5 acc 70.703 (72.085)	lr 0.02189
Train [28][1690/3239]	Time 0.623 (0.916)	Data Time 0.001 (0.017)	Loss 2.9910 (3.1507)	Entropy 0.80374 (0.81024)	Top-1 acc 53.906 (48.632)	Top-5 acc 75.000 (72.088)	lr 0.02189
Train [28][1700/3239]	Time 0.588 (0.916)	Data Time 0.001 (0.016)	Loss 3.0314 (3.1507)	Entropy 0.80300 (0.81020)	Top-1 acc 51.172 (48.634)	Top-5 acc 71.875 (72.084)	lr 0.02189
Train [28][1710/3239]	Time 0.632 (0.915)	Data Time 0.001 (0.016)	Loss 3.3157 (3.1506)	Entropy 0.80308 (0.81016)	Top-1 acc 42.578 (48.636)	Top-5 acc 68.359 (72.086)	lr 0.02189
Train [28][1720/3239]	Time 0.604 (0.915)	Data Time 0.001 (0.016)	Loss 3.1494 (3.1505)	Entropy 0.80324 (0.81011)	Top-1 acc 46.094 (48.630)	Top-5 acc 74.219 (72.091)	lr 0.02189
Train [28][1730/3239]	Time 0.616 (0.915)	Data Time 0.001 (0.016)	Loss 3.2272 (3.1507)	Entropy 0.80286 (0.81007)	Top-1 acc 48.828 (48.630)	Top-5 acc 70.703 (72.084)	lr 0.02189
Train [28][1740/3239]	Time 0.598 (0.915)	Data Time 0.001 (0.016)	Loss 3.1092 (3.1510)	Entropy 0.80264 (0.81003)	Top-1 acc 50.391 (48.622)	Top-5 acc 72.266 (72.081)	lr 0.02189
Train [28][1750/3239]	Time 0.634 (0.914)	Data Time 0.001 (0.016)	Loss 3.0871 (3.1506)	Entropy 0.80250 (0.80999)	Top-1 acc 51.953 (48.635)	Top-5 acc 72.656 (72.087)	lr 0.02189
Train [28][1760/3239]	Time 0.573 (0.914)	Data Time 0.001 (0.016)	Loss 3.1834 (3.1510)	Entropy 0.80296 (0.80995)	Top-1 acc 47.656 (48.628)	Top-5 acc 72.266 (72.080)	lr 0.02189
Train [28][1770/3239]	Time 0.727 (0.914)	Data Time 0.001 (0.016)	Loss 3.0666 (3.1508)	Entropy 0.80323 (0.80991)	Top-1 acc 53.516 (48.633)	Top-5 acc 70.312 (72.084)	lr 0.02189
Train [28][1780/3239]	Time 0.601 (0.914)	Data Time 0.001 (0.016)	Loss 3.2568 (3.1504)	Entropy 0.80295 (0.80987)	Top-1 acc 45.703 (48.643)	Top-5 acc 70.312 (72.089)	lr 0.02189
Train [28][1790/3239]	Time 0.601 (0.913)	Data Time 0.001 (0.016)	Loss 3.3563 (3.1504)	Entropy 0.80294 (0.80983)	Top-1 acc 46.484 (48.636)	Top-5 acc 67.578 (72.088)	lr 0.02189
Train [28][1800/3239]	Time 0.625 (0.913)	Data Time 0.001 (0.016)	Loss 3.0733 (3.1503)	Entropy 0.80274 (0.80979)	Top-1 acc 51.562 (48.638)	Top-5 acc 75.000 (72.094)	lr 0.02189
Train [28][1810/3239]	Time 0.630 (0.913)	Data Time 0.003 (0.016)	Loss 3.2551 (3.1502)	Entropy 0.80280 (0.80975)	Top-1 acc 48.438 (48.643)	Top-5 acc 69.531 (72.097)	lr 0.02189
Train [28][1820/3239]	Time 0.611 (0.912)	Data Time 0.001 (0.015)	Loss 3.2770 (3.1506)	Entropy 0.80274 (0.80972)	Top-1 acc 44.922 (48.629)	Top-5 acc 67.969 (72.092)	lr 0.02188
Train [28][1830/3239]	Time 0.596 (0.912)	Data Time 0.001 (0.015)	Loss 3.1144 (3.1505)	Entropy 0.80279 (0.80968)	Top-1 acc 47.266 (48.631)	Top-5 acc 73.828 (72.096)	lr 0.02188
Train [28][1840/3239]	Time 0.729 (0.911)	Data Time 0.001 (0.015)	Loss 3.1859 (3.1508)	Entropy 0.80270 (0.80964)	Top-1 acc 49.609 (48.628)	Top-5 acc 71.094 (72.092)	lr 0.02188
Train [28][1850/3239]	Time 0.617 (0.911)	Data Time 0.001 (0.015)	Loss 3.1940 (3.1508)	Entropy 0.80250 (0.80960)	Top-1 acc 51.172 (48.632)	Top-5 acc 71.484 (72.090)	lr 0.02188
Train [28][1860/3239]	Time 0.616 (0.911)	Data Time 0.001 (0.015)	Loss 3.2198 (3.1509)	Entropy 0.80196 (0.80956)	Top-1 acc 48.047 (48.629)	Top-5 acc 67.578 (72.086)	lr 0.02188
Train [28][1870/3239]	Time 0.615 (0.911)	Data Time 0.001 (0.015)	Loss 3.1538 (3.1510)	Entropy 0.80184 (0.80952)	Top-1 acc 47.266 (48.625)	Top-5 acc 71.094 (72.084)	lr 0.02188
Train [28][1880/3239]	Time 0.601 (0.911)	Data Time 0.001 (0.015)	Loss 3.1917 (3.1508)	Entropy 0.80203 (0.80948)	Top-1 acc 46.484 (48.627)	Top-5 acc 71.875 (72.090)	lr 0.02188
Train [28][1890/3239]	Time 0.596 (0.910)	Data Time 0.001 (0.015)	Loss 3.1270 (3.1512)	Entropy 0.80202 (0.80944)	Top-1 acc 49.609 (48.620)	Top-5 acc 69.531 (72.081)	lr 0.02188
Train [28][1900/3239]	Time 0.611 (0.910)	Data Time 0.001 (0.015)	Loss 3.3338 (3.1515)	Entropy 0.80182 (0.80940)	Top-1 acc 44.531 (48.611)	Top-5 acc 68.750 (72.072)	lr 0.02188
Train [28][1910/3239]	Time 0.635 (0.910)	Data Time 0.001 (0.015)	Loss 3.0279 (3.1516)	Entropy 0.80152 (0.80936)	Top-1 acc 50.391 (48.608)	Top-5 acc 72.266 (72.072)	lr 0.02188
Train [28][1920/3239]	Time 0.620 (0.910)	Data Time 0.002 (0.015)	Loss 3.1897 (3.1516)	Entropy 0.80131 (0.80932)	Top-1 acc 44.531 (48.604)	Top-5 acc 72.266 (72.074)	lr 0.02188
Train [28][1930/3239]	Time 0.625 (0.909)	Data Time 0.001 (0.015)	Loss 3.1829 (3.1519)	Entropy 0.80078 (0.80928)	Top-1 acc 48.047 (48.597)	Top-5 acc 70.703 (72.071)	lr 0.02188
Train [28][1940/3239]	Time 0.562 (0.909)	Data Time 0.001 (0.015)	Loss 3.2486 (3.1515)	Entropy 0.80084 (0.80924)	Top-1 acc 43.750 (48.609)	Top-5 acc 68.750 (72.077)	lr 0.02188
Train [28][1950/3239]	Time 0.651 (0.909)	Data Time 0.001 (0.015)	Loss 3.2664 (3.1515)	Entropy 0.80091 (0.80919)	Top-1 acc 43.359 (48.610)	Top-5 acc 68.750 (72.074)	lr 0.02188
Train [28][1960/3239]	Time 0.621 (0.909)	Data Time 0.002 (0.015)	Loss 3.1680 (3.1516)	Entropy 0.80067 (0.80915)	Top-1 acc 47.656 (48.608)	Top-5 acc 72.656 (72.072)	lr 0.02188
Train [28][1970/3239]	Time 0.605 (0.908)	Data Time 0.001 (0.014)	Loss 3.2361 (3.1516)	Entropy 0.80038 (0.80911)	Top-1 acc 48.047 (48.610)	Top-5 acc 71.875 (72.072)	lr 0.02187
Train [28][1980/3239]	Time 0.632 (0.908)	Data Time 0.001 (0.014)	Loss 3.2269 (3.1516)	Entropy 0.80046 (0.80906)	Top-1 acc 44.922 (48.608)	Top-5 acc 72.656 (72.076)	lr 0.02187
Train [28][1990/3239]	Time 0.581 (0.908)	Data Time 0.001 (0.014)	Loss 2.9875 (3.1517)	Entropy 0.80049 (0.80902)	Top-1 acc 49.609 (48.610)	Top-5 acc 77.344 (72.077)	lr 0.02187
Train [28][2000/3239]	Time 0.665 (0.907)	Data Time 0.001 (0.014)	Loss 3.2706 (3.1516)	Entropy 0.80050 (0.80898)	Top-1 acc 44.922 (48.608)	Top-5 acc 69.141 (72.079)	lr 0.02187
Train [28][2010/3239]	Time 0.609 (0.907)	Data Time 0.001 (0.014)	Loss 3.3122 (3.1516)	Entropy 0.80055 (0.80894)	Top-1 acc 43.750 (48.608)	Top-5 acc 71.094 (72.080)	lr 0.02187
Train [28][2020/3239]	Time 0.623 (0.907)	Data Time 0.001 (0.014)	Loss 3.1536 (3.1514)	Entropy 0.80044 (0.80889)	Top-1 acc 50.781 (48.609)	Top-5 acc 71.875 (72.082)	lr 0.02187
Train [28][2030/3239]	Time 0.620 (0.907)	Data Time 0.001 (0.014)	Loss 3.0885 (3.1515)	Entropy 0.80068 (0.80885)	Top-1 acc 48.438 (48.603)	Top-5 acc 72.266 (72.077)	lr 0.02187
Train [28][2040/3239]	Time 0.575 (0.907)	Data Time 0.001 (0.014)	Loss 3.3432 (3.1515)	Entropy 0.80059 (0.80881)	Top-1 acc 41.406 (48.608)	Top-5 acc 69.141 (72.076)	lr 0.02187
Train [28][2050/3239]	Time 0.598 (0.906)	Data Time 0.001 (0.014)	Loss 3.1577 (3.1515)	Entropy 0.80018 (0.80877)	Top-1 acc 49.219 (48.615)	Top-5 acc 71.094 (72.073)	lr 0.02187
Train [28][2060/3239]	Time 0.621 (0.906)	Data Time 0.001 (0.014)	Loss 3.0214 (3.1514)	Entropy 0.80002 (0.80873)	Top-1 acc 50.391 (48.611)	Top-5 acc 73.828 (72.075)	lr 0.02187
Train [28][2070/3239]	Time 0.694 (0.906)	Data Time 0.001 (0.014)	Loss 3.1307 (3.1514)	Entropy 0.79963 (0.80869)	Top-1 acc 45.312 (48.612)	Top-5 acc 74.219 (72.076)	lr 0.02187
Train [28][2080/3239]	Time 0.625 (0.906)	Data Time 0.001 (0.014)	Loss 3.0420 (3.1514)	Entropy 0.79925 (0.80864)	Top-1 acc 51.172 (48.613)	Top-5 acc 74.609 (72.080)	lr 0.02187
Train [28][2090/3239]	Time 0.607 (0.906)	Data Time 0.001 (0.014)	Loss 3.2034 (3.1514)	Entropy 0.79954 (0.80860)	Top-1 acc 48.828 (48.610)	Top-5 acc 73.438 (72.079)	lr 0.02187
Train [28][2100/3239]	Time 0.602 (0.905)	Data Time 0.001 (0.014)	Loss 3.1901 (3.1519)	Entropy 0.79960 (0.80856)	Top-1 acc 44.922 (48.602)	Top-5 acc 72.266 (72.072)	lr 0.02187
Train [28][2110/3239]	Time 0.595 (0.905)	Data Time 0.001 (0.014)	Loss 3.1625 (3.1519)	Entropy 0.79948 (0.80851)	Top-1 acc 47.656 (48.602)	Top-5 acc 70.703 (72.071)	lr 0.02187
Train [28][2120/3239]	Time 0.616 (0.905)	Data Time 0.001 (0.014)	Loss 3.1532 (3.1520)	Entropy 0.79985 (0.80847)	Top-1 acc 46.875 (48.604)	Top-5 acc 71.875 (72.074)	lr 0.02186
Train [28][2130/3239]	Time 0.635 (0.905)	Data Time 0.001 (0.014)	Loss 3.0695 (3.1517)	Entropy 0.79972 (0.80843)	Top-1 acc 51.562 (48.606)	Top-5 acc 75.391 (72.083)	lr 0.02186
Train [28][2140/3239]	Time 0.527 (0.905)	Data Time 0.001 (0.013)	Loss 3.1155 (3.1518)	Entropy 0.80000 (0.80839)	Top-1 acc 48.047 (48.602)	Top-5 acc 71.094 (72.082)	lr 0.02186
Train [28][2150/3239]	Time 0.591 (0.904)	Data Time 0.001 (0.013)	Loss 3.1034 (3.1516)	Entropy 0.79972 (0.80835)	Top-1 acc 50.000 (48.607)	Top-5 acc 74.219 (72.087)	lr 0.02186
Train [28][2160/3239]	Time 0.662 (0.904)	Data Time 0.001 (0.013)	Loss 3.2098 (3.1517)	Entropy 0.79972 (0.80831)	Top-1 acc 46.094 (48.601)	Top-5 acc 72.656 (72.090)	lr 0.02186
Train [28][2170/3239]	Time 0.589 (0.904)	Data Time 0.001 (0.013)	Loss 3.2501 (3.1516)	Entropy 0.79998 (0.80827)	Top-1 acc 48.828 (48.604)	Top-5 acc 66.406 (72.093)	lr 0.02186
Train [28][2180/3239]	Time 0.609 (0.904)	Data Time 0.001 (0.013)	Loss 2.9962 (3.1517)	Entropy 0.80012 (0.80824)	Top-1 acc 51.562 (48.598)	Top-5 acc 74.609 (72.087)	lr 0.02186
Train [28][2190/3239]	Time 0.620 (0.903)	Data Time 0.001 (0.013)	Loss 3.2605 (3.1517)	Entropy 0.80002 (0.80820)	Top-1 acc 48.438 (48.596)	Top-5 acc 71.094 (72.094)	lr 0.02186
Train [28][2200/3239]	Time 0.596 (0.903)	Data Time 0.001 (0.013)	Loss 3.1696 (3.1520)	Entropy 0.80048 (0.80816)	Top-1 acc 46.484 (48.592)	Top-5 acc 73.047 (72.086)	lr 0.02186
Train [28][2210/3239]	Time 0.587 (0.903)	Data Time 0.001 (0.013)	Loss 3.0938 (3.1521)	Entropy 0.80046 (0.80813)	Top-1 acc 52.734 (48.591)	Top-5 acc 72.266 (72.082)	lr 0.02186
Train [28][2220/3239]	Time 0.619 (0.903)	Data Time 0.001 (0.013)	Loss 3.0620 (3.1522)	Entropy 0.80016 (0.80809)	Top-1 acc 50.000 (48.592)	Top-5 acc 72.266 (72.080)	lr 0.02186
Train [28][2230/3239]	Time 0.707 (0.914)	Data Time 0.002 (0.013)	Loss 3.1688 (3.1522)	Entropy 0.79950 (0.80806)	Top-1 acc 46.484 (48.588)	Top-5 acc 69.922 (72.079)	lr 0.02186
Train [28][2240/3239]	Time 0.594 (0.914)	Data Time 0.001 (0.013)	Loss 3.1870 (3.1523)	Entropy 0.79923 (0.80802)	Top-1 acc 44.922 (48.586)	Top-5 acc 69.141 (72.076)	lr 0.02186
Train [28][2250/3239]	Time 0.628 (0.913)	Data Time 0.001 (0.013)	Loss 3.1661 (3.1524)	Entropy 0.79904 (0.80798)	Top-1 acc 50.000 (48.588)	Top-5 acc 74.609 (72.079)	lr 0.02186
Train [28][2260/3239]	Time 0.642 (0.913)	Data Time 0.003 (0.013)	Loss 3.0532 (3.1523)	Entropy 0.79901 (0.80794)	Top-1 acc 48.047 (48.588)	Top-5 acc 71.875 (72.078)	lr 0.02186
Train [28][2270/3239]	Time 0.627 (0.913)	Data Time 0.003 (0.013)	Loss 3.3691 (3.1527)	Entropy 0.79860 (0.80790)	Top-1 acc 41.797 (48.577)	Top-5 acc 67.969 (72.071)	lr 0.02185
Train [28][2280/3239]	Time 0.584 (0.913)	Data Time 0.001 (0.013)	Loss 3.1896 (3.1526)	Entropy 0.79881 (0.80786)	Top-1 acc 48.047 (48.584)	Top-5 acc 70.312 (72.071)	lr 0.02185
Train [28][2290/3239]	Time 0.460 (0.912)	Data Time 0.001 (0.013)	Loss 3.1090 (3.1525)	Entropy 0.79907 (0.80782)	Top-1 acc 52.734 (48.588)	Top-5 acc 70.312 (72.071)	lr 0.02185
Train [28][2300/3239]	Time 0.612 (0.912)	Data Time 0.001 (0.013)	Loss 3.2035 (3.1525)	Entropy 0.79878 (0.80778)	Top-1 acc 48.047 (48.582)	Top-5 acc 71.094 (72.075)	lr 0.02185
Train [28][2310/3239]	Time 0.588 (0.912)	Data Time 0.001 (0.013)	Loss 3.0634 (3.1524)	Entropy 0.79931 (0.80774)	Top-1 acc 49.609 (48.587)	Top-5 acc 72.656 (72.077)	lr 0.02185
Train [28][2320/3239]	Time 0.712 (0.912)	Data Time 0.001 (0.013)	Loss 3.0209 (3.1519)	Entropy 0.79940 (0.80771)	Top-1 acc 51.172 (48.598)	Top-5 acc 75.391 (72.088)	lr 0.02185
Train [28][2330/3239]	Time 0.607 (0.911)	Data Time 0.001 (0.013)	Loss 3.1441 (3.1519)	Entropy 0.79938 (0.80767)	Top-1 acc 47.266 (48.596)	Top-5 acc 73.438 (72.092)	lr 0.02185
Train [28][2340/3239]	Time 0.608 (0.911)	Data Time 0.001 (0.012)	Loss 3.1196 (3.1521)	Entropy 0.79955 (0.80764)	Top-1 acc 50.391 (48.599)	Top-5 acc 70.703 (72.088)	lr 0.02185
Train [28][2350/3239]	Time 0.617 (0.911)	Data Time 0.001 (0.012)	Loss 3.2378 (3.1520)	Entropy 0.79971 (0.80760)	Top-1 acc 49.219 (48.600)	Top-5 acc 69.531 (72.089)	lr 0.02185
Train [28][2360/3239]	Time 0.599 (0.911)	Data Time 0.001 (0.012)	Loss 3.3907 (3.1519)	Entropy 0.80024 (0.80757)	Top-1 acc 47.266 (48.605)	Top-5 acc 68.359 (72.090)	lr 0.02185
Train [28][2370/3239]	Time 0.629 (0.911)	Data Time 0.001 (0.012)	Loss 3.1427 (3.1517)	Entropy 0.80050 (0.80754)	Top-1 acc 51.562 (48.611)	Top-5 acc 70.312 (72.093)	lr 0.02185
Train [28][2380/3239]	Time 0.595 (0.910)	Data Time 0.001 (0.012)	Loss 3.2297 (3.1518)	Entropy 0.80033 (0.80751)	Top-1 acc 47.656 (48.607)	Top-5 acc 69.531 (72.089)	lr 0.02185
Train [28][2390/3239]	Time 0.692 (0.910)	Data Time 0.001 (0.012)	Loss 3.0684 (3.1516)	Entropy 0.80051 (0.80748)	Top-1 acc 50.000 (48.614)	Top-5 acc 75.781 (72.097)	lr 0.02185
Train [28][2400/3239]	Time 0.569 (0.910)	Data Time 0.001 (0.012)	Loss 2.8590 (3.1516)	Entropy 0.80045 (0.80745)	Top-1 acc 57.422 (48.619)	Top-5 acc 76.172 (72.093)	lr 0.02185
Train [28][2410/3239]	Time 0.603 (0.910)	Data Time 0.001 (0.012)	Loss 2.9968 (3.1516)	Entropy 0.80019 (0.80742)	Top-1 acc 53.125 (48.619)	Top-5 acc 73.438 (72.090)	lr 0.02185
Train [28][2420/3239]	Time 0.614 (0.910)	Data Time 0.001 (0.012)	Loss 3.0802 (3.1516)	Entropy 0.80055 (0.80739)	Top-1 acc 49.219 (48.618)	Top-5 acc 73.828 (72.089)	lr 0.02184
Train [28][2430/3239]	Time 0.610 (0.910)	Data Time 0.001 (0.012)	Loss 3.1811 (3.1516)	Entropy 0.80018 (0.80736)	Top-1 acc 47.656 (48.620)	Top-5 acc 69.141 (72.086)	lr 0.02184
Train [28][2440/3239]	Time 0.615 (0.909)	Data Time 0.001 (0.012)	Loss 3.2398 (3.1513)	Entropy 0.80004 (0.80733)	Top-1 acc 47.656 (48.624)	Top-5 acc 70.703 (72.096)	lr 0.02184
Train [28][2450/3239]	Time 0.615 (0.909)	Data Time 0.001 (0.012)	Loss 3.0647 (3.1511)	Entropy 0.79991 (0.80730)	Top-1 acc 49.609 (48.629)	Top-5 acc 75.000 (72.100)	lr 0.02184
Train [28][2460/3239]	Time 0.574 (0.909)	Data Time 0.001 (0.012)	Loss 2.9851 (3.1510)	Entropy 0.79999 (0.80727)	Top-1 acc 51.562 (48.634)	Top-5 acc 75.781 (72.100)	lr 0.02184
Train [28][2470/3239]	Time 0.613 (0.908)	Data Time 0.001 (0.012)	Loss 3.4035 (3.1512)	Entropy 0.80024 (0.80724)	Top-1 acc 42.578 (48.631)	Top-5 acc 67.188 (72.097)	lr 0.02184
Train [28][2480/3239]	Time 0.747 (0.908)	Data Time 0.001 (0.012)	Loss 3.0810 (3.1514)	Entropy 0.80020 (0.80722)	Top-1 acc 52.344 (48.629)	Top-5 acc 73.047 (72.093)	lr 0.02184
Train [28][2490/3239]	Time 0.579 (0.908)	Data Time 0.001 (0.012)	Loss 3.3414 (3.1518)	Entropy 0.80009 (0.80719)	Top-1 acc 45.703 (48.618)	Top-5 acc 71.484 (72.085)	lr 0.02184
Train [28][2500/3239]	Time 0.620 (0.908)	Data Time 0.001 (0.012)	Loss 3.0496 (3.1519)	Entropy 0.80014 (0.80716)	Top-1 acc 55.078 (48.622)	Top-5 acc 75.000 (72.077)	lr 0.02184
Train [28][2510/3239]	Time 0.623 (0.908)	Data Time 0.001 (0.012)	Loss 3.1631 (3.1519)	Entropy 0.80008 (0.80713)	Top-1 acc 46.094 (48.619)	Top-5 acc 69.531 (72.078)	lr 0.02184
Train [28][2520/3239]	Time 0.634 (0.908)	Data Time 0.001 (0.012)	Loss 3.1448 (3.1520)	Entropy 0.80029 (0.80710)	Top-1 acc 46.875 (48.618)	Top-5 acc 73.047 (72.076)	lr 0.02184
Train [28][2530/3239]	Time 0.597 (0.907)	Data Time 0.001 (0.012)	Loss 3.1995 (3.1517)	Entropy 0.80038 (0.80708)	Top-1 acc 50.000 (48.622)	Top-5 acc 71.484 (72.083)	lr 0.02184
Train [28][2540/3239]	Time 0.575 (0.907)	Data Time 0.001 (0.012)	Loss 3.1793 (3.1520)	Entropy 0.80025 (0.80705)	Top-1 acc 47.266 (48.613)	Top-5 acc 70.703 (72.079)	lr 0.02184
Train [28][2550/3239]	Time 0.717 (0.907)	Data Time 0.001 (0.012)	Loss 3.0635 (3.1518)	Entropy 0.80026 (0.80702)	Top-1 acc 49.609 (48.618)	Top-5 acc 75.000 (72.084)	lr 0.02184
Train [28][2560/3239]	Time 0.617 (0.907)	Data Time 0.001 (0.012)	Loss 3.4465 (3.1521)	Entropy 0.80015 (0.80700)	Top-1 acc 44.141 (48.614)	Top-5 acc 66.797 (72.082)	lr 0.02184
Train [28][2570/3239]	Time 0.635 (0.907)	Data Time 0.002 (0.012)	Loss 3.1567 (3.1517)	Entropy 0.80033 (0.80697)	Top-1 acc 50.391 (48.624)	Top-5 acc 69.531 (72.091)	lr 0.02183
Train [28][2580/3239]	Time 0.564 (0.907)	Data Time 0.001 (0.011)	Loss 3.2837 (3.1519)	Entropy 0.80043 (0.80695)	Top-1 acc 44.531 (48.622)	Top-5 acc 70.312 (72.086)	lr 0.02183
Train [28][2590/3239]	Time 0.617 (0.906)	Data Time 0.001 (0.011)	Loss 2.9585 (3.1514)	Entropy 0.80076 (0.80692)	Top-1 acc 55.469 (48.632)	Top-5 acc 75.781 (72.093)	lr 0.02183
Train [28][2600/3239]	Time 0.601 (0.906)	Data Time 0.001 (0.011)	Loss 3.0508 (3.1515)	Entropy 0.80042 (0.80690)	Top-1 acc 52.344 (48.630)	Top-5 acc 71.094 (72.091)	lr 0.02183
Train [28][2610/3239]	Time 0.609 (0.906)	Data Time 0.001 (0.011)	Loss 3.1243 (3.1515)	Entropy 0.80029 (0.80687)	Top-1 acc 51.953 (48.634)	Top-5 acc 74.609 (72.096)	lr 0.02183
Train [28][2620/3239]	Time 0.466 (0.906)	Data Time 0.001 (0.011)	Loss 3.1269 (3.1514)	Entropy 0.79993 (0.80685)	Top-1 acc 51.172 (48.637)	Top-5 acc 70.312 (72.096)	lr 0.02183
Train [28][2630/3239]	Time 0.597 (0.906)	Data Time 0.001 (0.011)	Loss 3.1382 (3.1516)	Entropy 0.79963 (0.80682)	Top-1 acc 51.172 (48.635)	Top-5 acc 69.531 (72.091)	lr 0.02183
Train [28][2640/3239]	Time 0.575 (0.905)	Data Time 0.001 (0.011)	Loss 3.4017 (3.1515)	Entropy 0.79965 (0.80679)	Top-1 acc 45.312 (48.634)	Top-5 acc 68.359 (72.096)	lr 0.02183
Train [28][2650/3239]	Time 0.615 (0.905)	Data Time 0.001 (0.011)	Loss 3.2184 (3.1517)	Entropy 0.79990 (0.80677)	Top-1 acc 46.484 (48.629)	Top-5 acc 70.312 (72.091)	lr 0.02183
Train [28][2660/3239]	Time 0.634 (0.905)	Data Time 0.003 (0.011)	Loss 3.2014 (3.1516)	Entropy 0.79953 (0.80674)	Top-1 acc 46.875 (48.632)	Top-5 acc 74.219 (72.094)	lr 0.02183
Train [28][2670/3239]	Time 0.571 (0.905)	Data Time 0.001 (0.011)	Loss 3.1245 (3.1516)	Entropy 0.79935 (0.80671)	Top-1 acc 46.875 (48.633)	Top-5 acc 75.000 (72.094)	lr 0.02183
Train [28][2680/3239]	Time 0.599 (0.905)	Data Time 0.001 (0.011)	Loss 3.1922 (3.1517)	Entropy 0.79995 (0.80668)	Top-1 acc 48.438 (48.628)	Top-5 acc 75.000 (72.093)	lr 0.02183
Train [28][2690/3239]	Time 0.581 (0.904)	Data Time 0.001 (0.011)	Loss 3.2069 (3.1519)	Entropy 0.79972 (0.80666)	Top-1 acc 47.266 (48.621)	Top-5 acc 73.828 (72.088)	lr 0.02183
Train [28][2700/3239]	Time 0.603 (0.904)	Data Time 0.001 (0.011)	Loss 3.1799 (3.1521)	Entropy 0.79966 (0.80663)	Top-1 acc 45.703 (48.624)	Top-5 acc 71.875 (72.085)	lr 0.02183
Train [28][2710/3239]	Time 0.706 (0.904)	Data Time 0.001 (0.011)	Loss 3.4383 (3.1523)	Entropy 0.79966 (0.80661)	Top-1 acc 45.703 (48.619)	Top-5 acc 67.578 (72.080)	lr 0.02183
Train [28][2720/3239]	Time 0.607 (0.904)	Data Time 0.001 (0.011)	Loss 3.1699 (3.1523)	Entropy 0.79923 (0.80658)	Top-1 acc 48.438 (48.623)	Top-5 acc 76.172 (72.084)	lr 0.02182
Train [28][2730/3239]	Time 0.589 (0.904)	Data Time 0.001 (0.011)	Loss 3.3377 (3.1525)	Entropy 0.79970 (0.80656)	Top-1 acc 43.359 (48.618)	Top-5 acc 70.703 (72.084)	lr 0.02182
Train [28][2740/3239]	Time 0.616 (0.904)	Data Time 0.001 (0.011)	Loss 3.0305 (3.1524)	Entropy 0.79952 (0.80653)	Top-1 acc 51.562 (48.620)	Top-5 acc 72.266 (72.086)	lr 0.02182
Train [28][2750/3239]	Time 0.593 (0.904)	Data Time 0.001 (0.011)	Loss 3.0695 (3.1524)	Entropy 0.79963 (0.80650)	Top-1 acc 51.953 (48.622)	Top-5 acc 73.438 (72.087)	lr 0.02182
Train [28][2760/3239]	Time 0.623 (0.903)	Data Time 0.001 (0.011)	Loss 3.0766 (3.1523)	Entropy 0.79967 (0.80648)	Top-1 acc 48.047 (48.622)	Top-5 acc 70.703 (72.086)	lr 0.02182
Train [28][2770/3239]	Time 0.631 (0.903)	Data Time 0.001 (0.011)	Loss 3.0505 (3.1522)	Entropy 0.79953 (0.80646)	Top-1 acc 52.344 (48.623)	Top-5 acc 73.828 (72.085)	lr 0.02182
Train [28][2780/3239]	Time 0.552 (0.903)	Data Time 0.001 (0.011)	Loss 3.1542 (3.1522)	Entropy 0.79942 (0.80643)	Top-1 acc 50.391 (48.624)	Top-5 acc 70.312 (72.082)	lr 0.02182
Train [28][2790/3239]	Time 0.585 (0.903)	Data Time 0.001 (0.011)	Loss 3.2676 (3.1523)	Entropy 0.79953 (0.80640)	Top-1 acc 42.188 (48.621)	Top-5 acc 68.359 (72.081)	lr 0.02182
Train [28][2800/3239]	Time 0.592 (0.903)	Data Time 0.001 (0.011)	Loss 3.1011 (3.1523)	Entropy 0.79906 (0.80638)	Top-1 acc 53.125 (48.623)	Top-5 acc 74.219 (72.081)	lr 0.02182
Train [28][2810/3239]	Time 0.590 (0.902)	Data Time 0.002 (0.011)	Loss 3.4552 (3.1523)	Entropy 0.79889 (0.80635)	Top-1 acc 42.578 (48.620)	Top-5 acc 66.406 (72.084)	lr 0.02182
Train [28][2820/3239]	Time 0.616 (0.902)	Data Time 0.001 (0.011)	Loss 3.1787 (3.1524)	Entropy 0.79872 (0.80633)	Top-1 acc 49.219 (48.617)	Top-5 acc 68.750 (72.078)	lr 0.02182
Train [28][2830/3239]	Time 0.589 (0.902)	Data Time 0.001 (0.011)	Loss 3.0489 (3.1524)	Entropy 0.79828 (0.80630)	Top-1 acc 52.344 (48.617)	Top-5 acc 73.438 (72.079)	lr 0.02182
Train [28][2840/3239]	Time 0.582 (0.902)	Data Time 0.001 (0.011)	Loss 3.3469 (3.1524)	Entropy 0.79830 (0.80627)	Top-1 acc 44.141 (48.616)	Top-5 acc 71.094 (72.078)	lr 0.02182
Train [28][2850/3239]	Time 0.618 (0.902)	Data Time 0.002 (0.011)	Loss 3.1237 (3.1528)	Entropy 0.79831 (0.80624)	Top-1 acc 47.266 (48.611)	Top-5 acc 72.266 (72.071)	lr 0.02182
Train [28][2860/3239]	Time 0.587 (0.902)	Data Time 0.001 (0.011)	Loss 3.2041 (3.1528)	Entropy 0.79856 (0.80621)	Top-1 acc 47.656 (48.609)	Top-5 acc 72.656 (72.073)	lr 0.02181
Train [28][2870/3239]	Time 0.696 (0.902)	Data Time 0.001 (0.011)	Loss 3.1833 (3.1529)	Entropy 0.79835 (0.80619)	Top-1 acc 49.219 (48.609)	Top-5 acc 71.875 (72.071)	lr 0.02181
Train [28][2880/3239]	Time 0.742 (0.909)	Data Time 0.006 (0.010)	Loss 3.0562 (3.1527)	Entropy 0.79832 (0.80616)	Top-1 acc 52.344 (48.611)	Top-5 acc 72.656 (72.075)	lr 0.02181
Train [28][2890/3239]	Time 0.602 (0.909)	Data Time 0.002 (0.010)	Loss 3.1961 (3.1525)	Entropy 0.79815 (0.80613)	Top-1 acc 46.875 (48.615)	Top-5 acc 71.484 (72.076)	lr 0.02181
Train [28][2900/3239]	Time 0.615 (0.909)	Data Time 0.002 (0.010)	Loss 3.0100 (3.1524)	Entropy 0.79819 (0.80611)	Top-1 acc 54.688 (48.619)	Top-5 acc 73.828 (72.078)	lr 0.02181
Train [28][2910/3239]	Time 0.617 (0.909)	Data Time 0.001 (0.010)	Loss 3.1483 (3.1527)	Entropy 0.79836 (0.80608)	Top-1 acc 49.219 (48.613)	Top-5 acc 71.094 (72.070)	lr 0.02181
Train [28][2920/3239]	Time 0.593 (0.909)	Data Time 0.001 (0.010)	Loss 3.2359 (3.1528)	Entropy 0.79847 (0.80605)	Top-1 acc 46.875 (48.611)	Top-5 acc 69.922 (72.064)	lr 0.02181
Train [28][2930/3239]	Time 0.576 (0.909)	Data Time 0.001 (0.010)	Loss 3.1712 (3.1526)	Entropy 0.79854 (0.80603)	Top-1 acc 48.047 (48.614)	Top-5 acc 73.438 (72.070)	lr 0.02181
Train [28][2940/3239]	Time 0.724 (0.908)	Data Time 0.002 (0.010)	Loss 2.9649 (3.1524)	Entropy 0.79837 (0.80600)	Top-1 acc 51.172 (48.617)	Top-5 acc 75.781 (72.072)	lr 0.02181
Train [28][2950/3239]	Time 0.607 (0.908)	Data Time 0.001 (0.010)	Loss 3.3177 (3.1526)	Entropy 0.79820 (0.80597)	Top-1 acc 43.359 (48.611)	Top-5 acc 67.578 (72.070)	lr 0.02181
Train [28][2960/3239]	Time 0.577 (0.908)	Data Time 0.002 (0.010)	Loss 3.1743 (3.1525)	Entropy 0.79856 (0.80595)	Top-1 acc 50.781 (48.612)	Top-5 acc 70.312 (72.070)	lr 0.02181
Train [28][2970/3239]	Time 0.604 (0.908)	Data Time 0.001 (0.010)	Loss 3.0396 (3.1523)	Entropy 0.79857 (0.80592)	Top-1 acc 51.562 (48.616)	Top-5 acc 72.266 (72.073)	lr 0.02181
Train [28][2980/3239]	Time 0.603 (0.908)	Data Time 0.002 (0.010)	Loss 2.8465 (3.1526)	Entropy 0.79863 (0.80590)	Top-1 acc 54.688 (48.612)	Top-5 acc 80.078 (72.066)	lr 0.02181
Train [28][2990/3239]	Time 0.605 (0.908)	Data Time 0.001 (0.010)	Loss 2.9423 (3.1526)	Entropy 0.79844 (0.80587)	Top-1 acc 54.688 (48.612)	Top-5 acc 77.344 (72.066)	lr 0.02181
Train [28][3000/3239]	Time 0.589 (0.908)	Data Time 0.001 (0.010)	Loss 3.1214 (3.1526)	Entropy 0.79804 (0.80585)	Top-1 acc 48.438 (48.612)	Top-5 acc 76.172 (72.069)	lr 0.02181
Train [28][3010/3239]	Time 0.628 (0.907)	Data Time 0.001 (0.010)	Loss 3.1819 (3.1525)	Entropy 0.79806 (0.80582)	Top-1 acc 44.922 (48.614)	Top-5 acc 70.312 (72.070)	lr 0.02180
Train [28][3020/3239]	Time 0.617 (0.907)	Data Time 0.001 (0.010)	Loss 3.0191 (3.1525)	Entropy 0.79836 (0.80580)	Top-1 acc 55.469 (48.615)	Top-5 acc 76.562 (72.069)	lr 0.02180
Train [28][3030/3239]	Time 0.762 (0.907)	Data Time 0.001 (0.010)	Loss 3.1946 (3.1522)	Entropy 0.79870 (0.80577)	Top-1 acc 50.391 (48.622)	Top-5 acc 69.141 (72.073)	lr 0.02180
Train [28][3040/3239]	Time 0.620 (0.907)	Data Time 0.001 (0.010)	Loss 3.0318 (3.1521)	Entropy 0.79886 (0.80575)	Top-1 acc 50.781 (48.624)	Top-5 acc 74.609 (72.074)	lr 0.02180
Train [28][3050/3239]	Time 0.659 (0.907)	Data Time 0.001 (0.010)	Loss 3.1413 (3.1521)	Entropy 0.79829 (0.80573)	Top-1 acc 45.312 (48.620)	Top-5 acc 70.312 (72.073)	lr 0.02180
Train [28][3060/3239]	Time 0.570 (0.907)	Data Time 0.001 (0.010)	Loss 3.3327 (3.1523)	Entropy 0.79864 (0.80570)	Top-1 acc 42.578 (48.616)	Top-5 acc 70.703 (72.072)	lr 0.02180
Train [28][3070/3239]	Time 0.613 (0.907)	Data Time 0.001 (0.010)	Loss 3.1054 (3.1522)	Entropy 0.79851 (0.80568)	Top-1 acc 50.391 (48.622)	Top-5 acc 72.656 (72.074)	lr 0.02180
Train [28][3080/3239]	Time 0.608 (0.907)	Data Time 0.001 (0.010)	Loss 2.9503 (3.1521)	Entropy 0.79869 (0.80566)	Top-1 acc 51.953 (48.628)	Top-5 acc 76.172 (72.076)	lr 0.02180
Train [28][3090/3239]	Time 0.668 (0.906)	Data Time 0.001 (0.010)	Loss 3.0191 (3.1521)	Entropy 0.79880 (0.80563)	Top-1 acc 50.391 (48.629)	Top-5 acc 75.781 (72.075)	lr 0.02180
Train [28][3100/3239]	Time 0.661 (0.906)	Data Time 0.001 (0.010)	Loss 3.1836 (3.1519)	Entropy 0.79876 (0.80561)	Top-1 acc 47.266 (48.631)	Top-5 acc 70.703 (72.078)	lr 0.02180
Train [28][3110/3239]	Time 0.614 (0.906)	Data Time 0.001 (0.010)	Loss 3.0305 (3.1518)	Entropy 0.79889 (0.80559)	Top-1 acc 48.828 (48.634)	Top-5 acc 73.438 (72.079)	lr 0.02180
Train [28][3120/3239]	Time 0.657 (0.906)	Data Time 0.001 (0.010)	Loss 2.9625 (3.1518)	Entropy 0.79845 (0.80557)	Top-1 acc 52.734 (48.631)	Top-5 acc 78.906 (72.078)	lr 0.02180
Train [28][3130/3239]	Time 0.603 (0.906)	Data Time 0.001 (0.010)	Loss 3.3730 (3.1519)	Entropy 0.79874 (0.80555)	Top-1 acc 41.797 (48.633)	Top-5 acc 67.969 (72.077)	lr 0.02180
Train [28][3140/3239]	Time 0.605 (0.906)	Data Time 0.001 (0.010)	Loss 3.1747 (3.1518)	Entropy 0.79875 (0.80552)	Top-1 acc 50.391 (48.635)	Top-5 acc 72.266 (72.079)	lr 0.02180
Train [28][3150/3239]	Time 0.628 (0.906)	Data Time 0.001 (0.010)	Loss 2.8282 (3.1518)	Entropy 0.79850 (0.80550)	Top-1 acc 54.297 (48.634)	Top-5 acc 77.344 (72.080)	lr 0.02180
Train [28][3160/3239]	Time 0.583 (0.906)	Data Time 0.001 (0.010)	Loss 3.1527 (3.1516)	Entropy 0.79849 (0.80548)	Top-1 acc 49.219 (48.638)	Top-5 acc 73.047 (72.084)	lr 0.02179
Train [28][3170/3239]	Time 0.614 (0.905)	Data Time 0.001 (0.010)	Loss 3.1936 (3.1515)	Entropy 0.79830 (0.80546)	Top-1 acc 47.266 (48.640)	Top-5 acc 69.922 (72.087)	lr 0.02179
Train [28][3180/3239]	Time 0.626 (0.905)	Data Time 0.000 (0.010)	Loss 2.9642 (3.1514)	Entropy 0.79858 (0.80544)	Top-1 acc 51.172 (48.639)	Top-5 acc 74.609 (72.086)	lr 0.02179
Train [28][3190/3239]	Time 0.602 (0.905)	Data Time 0.000 (0.010)	Loss 3.0738 (3.1512)	Entropy 0.79825 (0.80541)	Top-1 acc 49.219 (48.646)	Top-5 acc 73.828 (72.091)	lr 0.02179
Train [28][3200/3239]	Time 0.591 (0.905)	Data Time 0.000 (0.010)	Loss 3.1133 (3.1513)	Entropy 0.79840 (0.80539)	Top-1 acc 50.391 (48.643)	Top-5 acc 75.781 (72.089)	lr 0.02179
Train [28][3210/3239]	Time 0.583 (0.905)	Data Time 0.000 (0.010)	Loss 3.1741 (3.1515)	Entropy 0.79818 (0.80537)	Top-1 acc 44.141 (48.639)	Top-5 acc 73.047 (72.085)	lr 0.02179
Train [28][3220/3239]	Time 0.612 (0.905)	Data Time 0.000 (0.010)	Loss 3.1315 (3.1516)	Entropy 0.79819 (0.80535)	Top-1 acc 50.781 (48.636)	Top-5 acc 69.922 (72.084)	lr 0.02179
Train [28][3230/3239]	Time 0.606 (0.904)	Data Time 0.000 (0.010)	Loss 3.2694 (3.1515)	Entropy 0.79858 (0.80533)	Top-1 acc 44.922 (48.637)	Top-5 acc 68.359 (72.085)	lr 0.02179
Train [28][3239/3239]	Time 1.606 (0.904)	Data Time 0.000 (0.010)	Loss 3.0590 (3.1517)	Entropy 0.79861 (0.80531)	Top-1 acc 53.086 (48.631)	Top-5 acc 72.840 (72.080)	lr 0.02179
==========Valid [28/120]	loss 1.873	top-1 acc 58.045 (58.045)	top-5 acc 80.881	Train top-1 48.631	top-5 72.080	Entropy 0.79861	Latency-None: 0.000ms	Flops: 539.76M
Train [29][0/3239]	Time 25.421 (25.421)	Data Time 24.451 (24.451)	Loss 3.1389 (3.1389)	Entropy 0.79854 (0.79854)	Top-1 acc 48.438 (48.438)	Top-5 acc 71.484 (71.484)	lr 0.02179
Train [29][10/3239]	Time 0.612 (3.155)	Data Time 0.001 (2.225)	Loss 3.1401 (3.1129)	Entropy 0.79838 (0.79849)	Top-1 acc 48.047 (49.077)	Top-5 acc 72.266 (73.082)	lr 0.02179
Train [29][20/3239]	Time 0.646 (2.058)	Data Time 0.001 (1.166)	Loss 3.0922 (3.1281)	Entropy 0.79853 (0.79846)	Top-1 acc 51.953 (49.014)	Top-5 acc 75.391 (72.563)	lr 0.02179
Train [29][30/3239]	Time 0.609 (1.675)	Data Time 0.001 (0.791)	Loss 3.3898 (3.1210)	Entropy 0.79864 (0.79850)	Top-1 acc 44.922 (49.156)	Top-5 acc 63.672 (72.631)	lr 0.02179
Train [29][40/3239]	Time 0.625 (1.467)	Data Time 0.001 (0.598)	Loss 3.2066 (3.1181)	Entropy 0.79853 (0.79850)	Top-1 acc 48.438 (49.143)	Top-5 acc 68.750 (72.685)	lr 0.02179
Train [29][50/3239]	Time 0.623 (1.343)	Data Time 0.002 (0.481)	Loss 3.0757 (3.1153)	Entropy 0.79894 (0.79855)	Top-1 acc 53.906 (49.288)	Top-5 acc 73.047 (72.786)	lr 0.02179
Train [29][60/3239]	Time 0.617 (1.266)	Data Time 0.002 (0.403)	Loss 3.1386 (3.1180)	Entropy 0.79906 (0.79862)	Top-1 acc 50.000 (49.071)	Top-5 acc 75.391 (72.887)	lr 0.02179
Train [29][70/3239]	Time 0.605 (1.211)	Data Time 0.001 (0.346)	Loss 3.1653 (3.1102)	Entropy 0.79897 (0.79867)	Top-1 acc 49.609 (49.301)	Top-5 acc 69.922 (73.047)	lr 0.02178
Train [29][80/3239]	Time 0.591 (1.167)	Data Time 0.001 (0.304)	Loss 3.1548 (3.1111)	Entropy 0.79928 (0.79872)	Top-1 acc 51.953 (49.359)	Top-5 acc 71.094 (73.028)	lr 0.02178
Train [29][90/3239]	Time 0.692 (1.134)	Data Time 0.001 (0.271)	Loss 3.3420 (3.1147)	Entropy 0.79955 (0.79881)	Top-1 acc 45.703 (49.223)	Top-5 acc 66.797 (72.952)	lr 0.02178
Train [29][100/3239]	Time 0.600 (1.108)	Data Time 0.001 (0.244)	Loss 3.1597 (3.1138)	Entropy 0.79987 (0.79889)	Top-1 acc 52.344 (49.354)	Top-5 acc 71.875 (73.043)	lr 0.02178
Train [29][110/3239]	Time 0.611 (1.087)	Data Time 0.001 (0.222)	Loss 2.9491 (3.1214)	Entropy 0.79977 (0.79898)	Top-1 acc 53.516 (49.177)	Top-5 acc 76.953 (72.910)	lr 0.02178
Train [29][120/3239]	Time 0.632 (1.070)	Data Time 0.001 (0.204)	Loss 3.1735 (3.1165)	Entropy 0.79966 (0.79905)	Top-1 acc 51.172 (49.329)	Top-5 acc 72.656 (72.963)	lr 0.02178
Train [29][130/3239]	Time 0.599 (1.054)	Data Time 0.001 (0.189)	Loss 3.0571 (3.1157)	Entropy 0.79994 (0.79911)	Top-1 acc 49.609 (49.371)	Top-5 acc 72.656 (72.889)	lr 0.02178
Train [29][140/3239]	Time 0.603 (1.040)	Data Time 0.001 (0.175)	Loss 3.1617 (3.1168)	Entropy 0.80004 (0.79917)	Top-1 acc 48.047 (49.354)	Top-5 acc 71.875 (72.911)	lr 0.02178
Train [29][150/3239]	Time 0.611 (1.028)	Data Time 0.001 (0.164)	Loss 3.2144 (3.1162)	Entropy 0.80013 (0.79923)	Top-1 acc 50.000 (49.379)	Top-5 acc 69.922 (72.881)	lr 0.02178
Train [29][160/3239]	Time 0.667 (1.018)	Data Time 0.001 (0.154)	Loss 3.0026 (3.1179)	Entropy 0.80004 (0.79929)	Top-1 acc 51.562 (49.326)	Top-5 acc 76.172 (72.901)	lr 0.02178
Train [29][170/3239]	Time 0.593 (1.010)	Data Time 0.001 (0.145)	Loss 2.9979 (3.1157)	Entropy 0.79980 (0.79933)	Top-1 acc 52.344 (49.392)	Top-5 acc 73.047 (72.953)	lr 0.02178
Train [29][180/3239]	Time 0.592 (1.001)	Data Time 0.001 (0.137)	Loss 3.4358 (3.1167)	Entropy 0.79971 (0.79936)	Top-1 acc 42.578 (49.381)	Top-5 acc 68.750 (72.891)	lr 0.02178
Train [29][190/3239]	Time 0.604 (0.994)	Data Time 0.001 (0.130)	Loss 3.1585 (3.1176)	Entropy 0.79981 (0.79938)	Top-1 acc 47.656 (49.401)	Top-5 acc 70.312 (72.828)	lr 0.02178
Train [29][200/3239]	Time 0.659 (0.986)	Data Time 0.002 (0.124)	Loss 2.9997 (3.1139)	Entropy 0.80006 (0.79941)	Top-1 acc 50.781 (49.462)	Top-5 acc 74.219 (72.901)	lr 0.02178
Train [29][210/3239]	Time 0.610 (0.980)	Data Time 0.001 (0.118)	Loss 3.0989 (3.1153)	Entropy 0.79946 (0.79942)	Top-1 acc 52.734 (49.437)	Top-5 acc 71.484 (72.862)	lr 0.02178
Train [29][220/3239]	Time 0.639 (0.972)	Data Time 0.001 (0.113)	Loss 3.1496 (3.1157)	Entropy 0.79959 (0.79943)	Top-1 acc 47.266 (49.429)	Top-5 acc 71.094 (72.805)	lr 0.02177
Train [29][230/3239]	Time 0.589 (0.968)	Data Time 0.001 (0.108)	Loss 3.1837 (3.1167)	Entropy 0.79922 (0.79943)	Top-1 acc 47.656 (49.430)	Top-5 acc 71.875 (72.834)	lr 0.02177
Train [29][240/3239]	Time 0.605 (0.963)	Data Time 0.001 (0.103)	Loss 3.3521 (3.1220)	Entropy 0.79879 (0.79942)	Top-1 acc 44.141 (49.303)	Top-5 acc 71.094 (72.737)	lr 0.02177
Train [29][250/3239]	Time 0.690 (0.959)	Data Time 0.001 (0.099)	Loss 3.0592 (3.1224)	Entropy 0.79849 (0.79939)	Top-1 acc 50.391 (49.275)	Top-5 acc 74.219 (72.771)	lr 0.02177
Train [29][260/3239]	Time 0.579 (0.956)	Data Time 0.001 (0.096)	Loss 3.0684 (3.1213)	Entropy 0.79830 (0.79935)	Top-1 acc 52.734 (49.330)	Top-5 acc 74.609 (72.785)	lr 0.02177
Train [29][270/3239]	Time 0.591 (0.952)	Data Time 0.001 (0.092)	Loss 2.9223 (3.1204)	Entropy 0.79862 (0.79931)	Top-1 acc 54.688 (49.328)	Top-5 acc 75.781 (72.810)	lr 0.02177
Train [29][280/3239]	Time 0.613 (0.949)	Data Time 0.001 (0.089)	Loss 3.0989 (3.1210)	Entropy 0.79899 (0.79929)	Top-1 acc 50.000 (49.320)	Top-5 acc 72.266 (72.802)	lr 0.02177
Train [29][290/3239]	Time 0.587 (0.945)	Data Time 0.001 (0.086)	Loss 3.1395 (3.1206)	Entropy 0.79886 (0.79928)	Top-1 acc 48.047 (49.306)	Top-5 acc 73.828 (72.840)	lr 0.02177
Train [29][300/3239]	Time 0.605 (1.024)	Data Time 0.002 (0.083)	Loss 3.2374 (3.1209)	Entropy 0.79862 (0.79926)	Top-1 acc 47.266 (49.302)	Top-5 acc 69.141 (72.833)	lr 0.02177
Train [29][310/3239]	Time 0.578 (1.019)	Data Time 0.002 (0.081)	Loss 2.9415 (3.1217)	Entropy 0.79869 (0.79924)	Top-1 acc 55.859 (49.314)	Top-5 acc 74.609 (72.789)	lr 0.02177
Train [29][320/3239]	Time 0.722 (1.014)	Data Time 0.001 (0.078)	Loss 2.7778 (3.1235)	Entropy 0.79872 (0.79923)	Top-1 acc 58.203 (49.271)	Top-5 acc 79.688 (72.769)	lr 0.02177
Train [29][330/3239]	Time 0.510 (1.009)	Data Time 0.001 (0.076)	Loss 3.1354 (3.1233)	Entropy 0.79836 (0.79921)	Top-1 acc 53.516 (49.300)	Top-5 acc 72.656 (72.773)	lr 0.02177
Train [29][340/3239]	Time 0.592 (1.004)	Data Time 0.002 (0.074)	Loss 2.9805 (3.1248)	Entropy 0.79830 (0.79919)	Top-1 acc 50.000 (49.257)	Top-5 acc 79.297 (72.743)	lr 0.02177
Train [29][350/3239]	Time 0.597 (0.999)	Data Time 0.001 (0.072)	Loss 3.1678 (3.1245)	Entropy 0.79839 (0.79916)	Top-1 acc 50.000 (49.289)	Top-5 acc 75.391 (72.779)	lr 0.02177
Train [29][360/3239]	Time 0.591 (0.995)	Data Time 0.001 (0.070)	Loss 2.9488 (3.1237)	Entropy 0.79856 (0.79914)	Top-1 acc 55.078 (49.315)	Top-5 acc 74.609 (72.767)	lr 0.02176
Train [29][370/3239]	Time 0.616 (0.992)	Data Time 0.001 (0.068)	Loss 3.1579 (3.1259)	Entropy 0.79832 (0.79912)	Top-1 acc 50.391 (49.275)	Top-5 acc 70.703 (72.696)	lr 0.02176
Train [29][380/3239]	Time 0.548 (0.988)	Data Time 0.001 (0.066)	Loss 3.2590 (3.1276)	Entropy 0.79841 (0.79910)	Top-1 acc 45.312 (49.225)	Top-5 acc 69.531 (72.657)	lr 0.02176
Train [29][390/3239]	Time 0.605 (0.985)	Data Time 0.001 (0.065)	Loss 3.0046 (3.1294)	Entropy 0.79885 (0.79909)	Top-1 acc 50.781 (49.179)	Top-5 acc 75.391 (72.636)	lr 0.02176
Train [29][400/3239]	Time 0.622 (0.982)	Data Time 0.001 (0.063)	Loss 3.0630 (3.1302)	Entropy 0.79932 (0.79909)	Top-1 acc 50.391 (49.168)	Top-5 acc 74.219 (72.624)	lr 0.02176
Train [29][410/3239]	Time 0.674 (0.979)	Data Time 0.001 (0.061)	Loss 3.1007 (3.1310)	Entropy 0.79915 (0.79909)	Top-1 acc 50.000 (49.158)	Top-5 acc 73.438 (72.602)	lr 0.02176
Train [29][420/3239]	Time 0.625 (0.977)	Data Time 0.001 (0.060)	Loss 3.3069 (3.1321)	Entropy 0.79891 (0.79909)	Top-1 acc 43.750 (49.135)	Top-5 acc 70.312 (72.585)	lr 0.02176
Train [29][430/3239]	Time 0.616 (0.974)	Data Time 0.001 (0.059)	Loss 3.0679 (3.1332)	Entropy 0.79882 (0.79908)	Top-1 acc 48.828 (49.072)	Top-5 acc 74.219 (72.562)	lr 0.02176
Train [29][440/3239]	Time 0.610 (0.972)	Data Time 0.001 (0.057)	Loss 3.2852 (3.1331)	Entropy 0.79894 (0.79908)	Top-1 acc 47.266 (49.090)	Top-5 acc 70.703 (72.577)	lr 0.02176
Train [29][450/3239]	Time 0.579 (0.969)	Data Time 0.001 (0.056)	Loss 3.0675 (3.1325)	Entropy 0.79884 (0.79907)	Top-1 acc 46.875 (49.097)	Top-5 acc 76.172 (72.597)	lr 0.02176
Train [29][460/3239]	Time 0.586 (0.967)	Data Time 0.001 (0.055)	Loss 3.1160 (3.1332)	Entropy 0.79865 (0.79906)	Top-1 acc 51.172 (49.078)	Top-5 acc 73.047 (72.593)	lr 0.02176
Train [29][470/3239]	Time 0.633 (0.965)	Data Time 0.001 (0.054)	Loss 3.1053 (3.1334)	Entropy 0.79864 (0.79905)	Top-1 acc 47.656 (49.065)	Top-5 acc 72.266 (72.580)	lr 0.02176
Train [29][480/3239]	Time 0.734 (0.963)	Data Time 0.002 (0.053)	Loss 3.3943 (3.1342)	Entropy 0.79857 (0.79904)	Top-1 acc 45.703 (49.058)	Top-5 acc 65.234 (72.546)	lr 0.02176
Train [29][490/3239]	Time 0.609 (0.960)	Data Time 0.001 (0.052)	Loss 3.1437 (3.1333)	Entropy 0.79843 (0.79903)	Top-1 acc 47.656 (49.061)	Top-5 acc 69.531 (72.563)	lr 0.02176
Train [29][500/3239]	Time 0.491 (0.958)	Data Time 0.001 (0.051)	Loss 3.1682 (3.1333)	Entropy 0.79854 (0.79902)	Top-1 acc 52.734 (49.073)	Top-5 acc 73.438 (72.568)	lr 0.02176
Train [29][510/3239]	Time 0.582 (0.956)	Data Time 0.001 (0.050)	Loss 3.5558 (3.1345)	Entropy 0.79868 (0.79901)	Top-1 acc 41.406 (49.049)	Top-5 acc 62.500 (72.532)	lr 0.02175
Train [29][520/3239]	Time 0.603 (0.953)	Data Time 0.001 (0.049)	Loss 3.1283 (3.1338)	Entropy 0.79846 (0.79901)	Top-1 acc 49.609 (49.078)	Top-5 acc 73.047 (72.545)	lr 0.02175
Train [29][530/3239]	Time 0.628 (0.952)	Data Time 0.001 (0.048)	Loss 3.0697 (3.1342)	Entropy 0.79892 (0.79900)	Top-1 acc 48.828 (49.051)	Top-5 acc 72.266 (72.533)	lr 0.02175
Train [29][540/3239]	Time 0.598 (0.950)	Data Time 0.001 (0.047)	Loss 3.1320 (3.1336)	Entropy 0.79882 (0.79900)	Top-1 acc 48.047 (49.062)	Top-5 acc 74.609 (72.563)	lr 0.02175
Train [29][550/3239]	Time 0.619 (0.949)	Data Time 0.001 (0.046)	Loss 3.0480 (3.1338)	Entropy 0.79858 (0.79900)	Top-1 acc 49.609 (49.042)	Top-5 acc 71.094 (72.551)	lr 0.02175
Train [29][560/3239]	Time 0.608 (0.947)	Data Time 0.001 (0.046)	Loss 3.2874 (3.1351)	Entropy 0.79859 (0.79899)	Top-1 acc 48.438 (49.041)	Top-5 acc 69.531 (72.526)	lr 0.02175
Train [29][570/3239]	Time 0.628 (0.946)	Data Time 0.001 (0.045)	Loss 3.2183 (3.1345)	Entropy 0.79852 (0.79898)	Top-1 acc 47.656 (49.037)	Top-5 acc 71.094 (72.530)	lr 0.02175
Train [29][580/3239]	Time 0.604 (0.944)	Data Time 0.001 (0.044)	Loss 3.1361 (3.1336)	Entropy 0.79870 (0.79897)	Top-1 acc 48.438 (49.056)	Top-5 acc 70.312 (72.535)	lr 0.02175
Train [29][590/3239]	Time 0.628 (0.943)	Data Time 0.001 (0.043)	Loss 3.1212 (3.1338)	Entropy 0.79811 (0.79897)	Top-1 acc 50.781 (49.061)	Top-5 acc 70.703 (72.519)	lr 0.02175
Train [29][600/3239]	Time 0.594 (0.941)	Data Time 0.001 (0.043)	Loss 2.8834 (3.1328)	Entropy 0.79798 (0.79895)	Top-1 acc 51.953 (49.076)	Top-5 acc 77.734 (72.538)	lr 0.02175
Train [29][610/3239]	Time 0.595 (0.940)	Data Time 0.001 (0.042)	Loss 3.2360 (3.1319)	Entropy 0.79742 (0.79894)	Top-1 acc 48.828 (49.107)	Top-5 acc 71.484 (72.557)	lr 0.02175
Train [29][620/3239]	Time 0.578 (0.939)	Data Time 0.001 (0.041)	Loss 2.9386 (3.1316)	Entropy 0.79716 (0.79891)	Top-1 acc 50.391 (49.113)	Top-5 acc 76.172 (72.552)	lr 0.02175
Train [29][630/3239]	Time 0.621 (0.938)	Data Time 0.001 (0.041)	Loss 3.1877 (3.1317)	Entropy 0.79729 (0.79888)	Top-1 acc 49.219 (49.113)	Top-5 acc 71.094 (72.546)	lr 0.02175
Train [29][640/3239]	Time 0.701 (0.937)	Data Time 0.001 (0.040)	Loss 3.1617 (3.1322)	Entropy 0.79703 (0.79886)	Top-1 acc 48.047 (49.116)	Top-5 acc 74.609 (72.529)	lr 0.02175
Train [29][650/3239]	Time 0.612 (0.935)	Data Time 0.001 (0.040)	Loss 3.0469 (3.1330)	Entropy 0.79715 (0.79883)	Top-1 acc 48.438 (49.098)	Top-5 acc 74.219 (72.525)	lr 0.02175
Train [29][660/3239]	Time 0.634 (0.934)	Data Time 0.001 (0.039)	Loss 3.0099 (3.1326)	Entropy 0.79702 (0.79881)	Top-1 acc 53.125 (49.102)	Top-5 acc 75.391 (72.529)	lr 0.02174
Train [29][670/3239]	Time 0.610 (0.933)	Data Time 0.001 (0.038)	Loss 3.0892 (3.1328)	Entropy 0.79731 (0.79878)	Top-1 acc 50.781 (49.106)	Top-5 acc 73.438 (72.515)	lr 0.02174
Train [29][680/3239]	Time 0.574 (0.931)	Data Time 0.001 (0.038)	Loss 3.0664 (3.1333)	Entropy 0.79719 (0.79876)	Top-1 acc 50.000 (49.114)	Top-5 acc 76.562 (72.508)	lr 0.02174
Train [29][690/3239]	Time 0.620 (0.930)	Data Time 0.002 (0.037)	Loss 3.2457 (3.1328)	Entropy 0.79697 (0.79874)	Top-1 acc 45.703 (49.120)	Top-5 acc 71.484 (72.511)	lr 0.02174
Train [29][700/3239]	Time 0.591 (0.929)	Data Time 0.001 (0.037)	Loss 2.9232 (3.1328)	Entropy 0.79684 (0.79871)	Top-1 acc 55.859 (49.116)	Top-5 acc 76.953 (72.507)	lr 0.02174
Train [29][710/3239]	Time 0.723 (0.928)	Data Time 0.001 (0.036)	Loss 3.2611 (3.1342)	Entropy 0.79657 (0.79868)	Top-1 acc 44.141 (49.084)	Top-5 acc 69.922 (72.473)	lr 0.02174
Train [29][720/3239]	Time 0.633 (0.927)	Data Time 0.002 (0.036)	Loss 3.1167 (3.1344)	Entropy 0.79650 (0.79865)	Top-1 acc 48.828 (49.077)	Top-5 acc 71.484 (72.463)	lr 0.02174
Train [29][730/3239]	Time 0.616 (0.926)	Data Time 0.002 (0.035)	Loss 3.1574 (3.1347)	Entropy 0.79608 (0.79862)	Top-1 acc 50.781 (49.064)	Top-5 acc 69.531 (72.438)	lr 0.02174
Train [29][740/3239]	Time 0.585 (0.925)	Data Time 0.001 (0.035)	Loss 3.1096 (3.1348)	Entropy 0.79591 (0.79859)	Top-1 acc 48.438 (49.073)	Top-5 acc 74.609 (72.441)	lr 0.02174
Train [29][750/3239]	Time 0.608 (0.924)	Data Time 0.001 (0.035)	Loss 3.1082 (3.1351)	Entropy 0.79580 (0.79855)	Top-1 acc 47.266 (49.058)	Top-5 acc 72.656 (72.438)	lr 0.02174
Train [29][760/3239]	Time 0.637 (0.923)	Data Time 0.001 (0.034)	Loss 3.3019 (3.1359)	Entropy 0.79580 (0.79851)	Top-1 acc 42.578 (49.047)	Top-5 acc 68.750 (72.421)	lr 0.02174
Train [29][770/3239]	Time 0.610 (0.923)	Data Time 0.001 (0.034)	Loss 2.9092 (3.1361)	Entropy 0.79593 (0.79848)	Top-1 acc 55.859 (49.041)	Top-5 acc 75.391 (72.415)	lr 0.02174
Train [29][780/3239]	Time 0.624 (0.922)	Data Time 0.001 (0.033)	Loss 3.2772 (3.1370)	Entropy 0.79599 (0.79845)	Top-1 acc 45.312 (49.024)	Top-5 acc 64.844 (72.391)	lr 0.02174
Train [29][790/3239]	Time 0.615 (0.921)	Data Time 0.001 (0.033)	Loss 3.4306 (3.1375)	Entropy 0.79623 (0.79842)	Top-1 acc 41.406 (49.010)	Top-5 acc 63.281 (72.378)	lr 0.02174
Train [29][800/3239]	Time 0.593 (0.920)	Data Time 0.001 (0.032)	Loss 2.9461 (3.1370)	Entropy 0.79621 (0.79839)	Top-1 acc 57.031 (49.020)	Top-5 acc 76.953 (72.395)	lr 0.02174
Train [29][810/3239]	Time 0.644 (0.920)	Data Time 0.001 (0.032)	Loss 3.1384 (3.1370)	Entropy 0.79619 (0.79836)	Top-1 acc 48.047 (49.010)	Top-5 acc 71.094 (72.390)	lr 0.02173
Train [29][820/3239]	Time 0.593 (0.919)	Data Time 0.001 (0.032)	Loss 3.2996 (3.1375)	Entropy 0.79624 (0.79834)	Top-1 acc 44.531 (48.997)	Top-5 acc 73.438 (72.396)	lr 0.02173
Train [29][830/3239]	Time 0.617 (0.918)	Data Time 0.001 (0.031)	Loss 3.1362 (3.1373)	Entropy 0.79580 (0.79831)	Top-1 acc 48.828 (48.990)	Top-5 acc 75.781 (72.400)	lr 0.02173
Train [29][840/3239]	Time 0.616 (0.917)	Data Time 0.001 (0.031)	Loss 3.1657 (3.1374)	Entropy 0.79550 (0.79828)	Top-1 acc 47.266 (48.970)	Top-5 acc 72.266 (72.392)	lr 0.02173
Train [29][850/3239]	Time 0.592 (0.916)	Data Time 0.002 (0.031)	Loss 3.0851 (3.1380)	Entropy 0.79565 (0.79825)	Top-1 acc 48.438 (48.952)	Top-5 acc 70.703 (72.379)	lr 0.02173
Train [29][860/3239]	Time 0.511 (0.916)	Data Time 0.001 (0.030)	Loss 3.1451 (3.1375)	Entropy 0.79591 (0.79822)	Top-1 acc 50.391 (48.963)	Top-5 acc 71.875 (72.388)	lr 0.02173
Train [29][870/3239]	Time 0.676 (0.915)	Data Time 0.002 (0.030)	Loss 3.2680 (3.1379)	Entropy 0.79598 (0.79819)	Top-1 acc 44.531 (48.947)	Top-5 acc 70.703 (72.374)	lr 0.02173
Train [29][880/3239]	Time 0.629 (0.914)	Data Time 0.001 (0.030)	Loss 3.2683 (3.1383)	Entropy 0.79577 (0.79817)	Top-1 acc 45.312 (48.948)	Top-5 acc 69.922 (72.365)	lr 0.02173
Train [29][890/3239]	Time 0.595 (0.914)	Data Time 0.001 (0.029)	Loss 3.0011 (3.1382)	Entropy 0.79560 (0.79814)	Top-1 acc 51.172 (48.953)	Top-5 acc 73.828 (72.367)	lr 0.02173
Train [29][900/3239]	Time 0.626 (0.914)	Data Time 0.001 (0.029)	Loss 3.2474 (3.1385)	Entropy 0.79555 (0.79811)	Top-1 acc 48.438 (48.941)	Top-5 acc 68.359 (72.363)	lr 0.02173
Train [29][910/3239]	Time 0.626 (0.913)	Data Time 0.001 (0.029)	Loss 2.9913 (3.1380)	Entropy 0.79566 (0.79808)	Top-1 acc 53.516 (48.946)	Top-5 acc 72.656 (72.375)	lr 0.02173
Train [29][920/3239]	Time 0.599 (0.913)	Data Time 0.001 (0.029)	Loss 3.2430 (3.1368)	Entropy 0.79579 (0.79806)	Top-1 acc 47.656 (48.968)	Top-5 acc 70.703 (72.402)	lr 0.02173
Train [29][930/3239]	Time 0.588 (0.912)	Data Time 0.001 (0.028)	Loss 3.1496 (3.1366)	Entropy 0.79574 (0.79803)	Top-1 acc 44.922 (48.967)	Top-5 acc 71.484 (72.402)	lr 0.02173
Train [29][940/3239]	Time 0.707 (0.912)	Data Time 0.002 (0.028)	Loss 3.0393 (3.1364)	Entropy 0.79561 (0.79801)	Top-1 acc 51.953 (48.976)	Top-5 acc 76.172 (72.402)	lr 0.02173
Train [29][950/3239]	Time 0.696 (0.938)	Data Time 0.005 (0.028)	Loss 3.0425 (3.1360)	Entropy 0.79549 (0.79798)	Top-1 acc 52.734 (48.991)	Top-5 acc 74.219 (72.408)	lr 0.02172
Train [29][960/3239]	Time 0.680 (0.938)	Data Time 0.002 (0.027)	Loss 3.3233 (3.1360)	Entropy 0.79534 (0.79795)	Top-1 acc 43.359 (48.984)	Top-5 acc 71.094 (72.403)	lr 0.02172
Train [29][970/3239]	Time 0.586 (0.937)	Data Time 0.001 (0.027)	Loss 3.2140 (3.1360)	Entropy 0.79561 (0.79793)	Top-1 acc 47.656 (48.984)	Top-5 acc 69.531 (72.397)	lr 0.02172
Train [29][980/3239]	Time 0.645 (0.935)	Data Time 0.001 (0.027)	Loss 3.0901 (3.1364)	Entropy 0.79562 (0.79790)	Top-1 acc 52.734 (48.974)	Top-5 acc 72.656 (72.385)	lr 0.02172
Train [29][990/3239]	Time 0.601 (0.935)	Data Time 0.001 (0.027)	Loss 3.0573 (3.1363)	Entropy 0.79570 (0.79788)	Top-1 acc 50.781 (48.975)	Top-5 acc 75.391 (72.389)	lr 0.02172
Train [29][1000/3239]	Time 0.581 (0.934)	Data Time 0.001 (0.026)	Loss 3.1315 (3.1367)	Entropy 0.79545 (0.79786)	Top-1 acc 50.391 (48.973)	Top-5 acc 71.484 (72.374)	lr 0.02172
Train [29][1010/3239]	Time 0.592 (0.933)	Data Time 0.001 (0.026)	Loss 3.0756 (3.1369)	Entropy 0.79547 (0.79783)	Top-1 acc 51.172 (48.969)	Top-5 acc 73.438 (72.358)	lr 0.02172
Train [29][1020/3239]	Time 0.587 (0.933)	Data Time 0.001 (0.026)	Loss 3.0823 (3.1364)	Entropy 0.79521 (0.79781)	Top-1 acc 47.656 (48.978)	Top-5 acc 75.391 (72.367)	lr 0.02172
Train [29][1030/3239]	Time 0.709 (0.932)	Data Time 0.002 (0.026)	Loss 3.1199 (3.1362)	Entropy 0.79531 (0.79779)	Top-1 acc 47.656 (48.984)	Top-5 acc 72.656 (72.371)	lr 0.02172
Train [29][1040/3239]	Time 0.603 (0.932)	Data Time 0.001 (0.025)	Loss 3.0636 (3.1360)	Entropy 0.79509 (0.79776)	Top-1 acc 49.609 (48.985)	Top-5 acc 75.391 (72.379)	lr 0.02172
Train [29][1050/3239]	Time 0.551 (0.931)	Data Time 0.001 (0.025)	Loss 2.9789 (3.1361)	Entropy 0.79467 (0.79773)	Top-1 acc 55.469 (48.986)	Top-5 acc 74.609 (72.371)	lr 0.02172
Train [29][1060/3239]	Time 0.593 (0.931)	Data Time 0.002 (0.025)	Loss 3.0734 (3.1360)	Entropy 0.79498 (0.79771)	Top-1 acc 52.734 (48.985)	Top-5 acc 73.047 (72.373)	lr 0.02172
Train [29][1070/3239]	Time 0.626 (0.930)	Data Time 0.001 (0.025)	Loss 3.0828 (3.1362)	Entropy 0.79487 (0.79768)	Top-1 acc 50.781 (48.980)	Top-5 acc 71.875 (72.364)	lr 0.02172
Train [29][1080/3239]	Time 0.620 (0.930)	Data Time 0.002 (0.025)	Loss 3.1394 (3.1365)	Entropy 0.79530 (0.79765)	Top-1 acc 48.047 (48.977)	Top-5 acc 71.484 (72.355)	lr 0.02172
Train [29][1090/3239]	Time 0.610 (0.929)	Data Time 0.001 (0.024)	Loss 3.1146 (3.1363)	Entropy 0.79526 (0.79763)	Top-1 acc 48.438 (48.980)	Top-5 acc 73.047 (72.354)	lr 0.02172
Train [29][1100/3239]	Time 0.629 (0.929)	Data Time 0.001 (0.024)	Loss 3.1308 (3.1363)	Entropy 0.79480 (0.79761)	Top-1 acc 47.656 (48.986)	Top-5 acc 72.656 (72.356)	lr 0.02171
Train [29][1110/3239]	Time 0.621 (0.928)	Data Time 0.001 (0.024)	Loss 2.9928 (3.1358)	Entropy 0.79493 (0.79759)	Top-1 acc 50.000 (48.994)	Top-5 acc 75.000 (72.360)	lr 0.02171
Train [29][1120/3239]	Time 0.624 (0.928)	Data Time 0.002 (0.024)	Loss 3.1531 (3.1360)	Entropy 0.79491 (0.79756)	Top-1 acc 49.219 (48.992)	Top-5 acc 73.438 (72.360)	lr 0.02171
Train [29][1130/3239]	Time 0.618 (0.927)	Data Time 0.001 (0.024)	Loss 3.1891 (3.1359)	Entropy 0.79478 (0.79754)	Top-1 acc 45.703 (48.991)	Top-5 acc 72.266 (72.361)	lr 0.02171
Train [29][1140/3239]	Time 0.602 (0.926)	Data Time 0.001 (0.023)	Loss 3.0734 (3.1366)	Entropy 0.79402 (0.79751)	Top-1 acc 48.047 (48.976)	Top-5 acc 71.484 (72.344)	lr 0.02171
Train [29][1150/3239]	Time 0.499 (0.925)	Data Time 0.001 (0.023)	Loss 3.0648 (3.1360)	Entropy 0.79452 (0.79748)	Top-1 acc 51.172 (48.997)	Top-5 acc 77.734 (72.358)	lr 0.02171
Train [29][1160/3239]	Time 0.608 (0.925)	Data Time 0.001 (0.023)	Loss 3.1562 (3.1355)	Entropy 0.79473 (0.79746)	Top-1 acc 49.609 (49.011)	Top-5 acc 72.656 (72.374)	lr 0.02171
Train [29][1170/3239]	Time 0.606 (0.924)	Data Time 0.001 (0.023)	Loss 3.2126 (3.1352)	Entropy 0.79467 (0.79743)	Top-1 acc 46.094 (49.014)	Top-5 acc 68.359 (72.379)	lr 0.02171
Train [29][1180/3239]	Time 0.612 (0.924)	Data Time 0.002 (0.023)	Loss 3.1518 (3.1354)	Entropy 0.79459 (0.79741)	Top-1 acc 50.000 (49.013)	Top-5 acc 71.875 (72.380)	lr 0.02171
Train [29][1190/3239]	Time 0.730 (0.924)	Data Time 0.001 (0.023)	Loss 2.8395 (3.1349)	Entropy 0.79439 (0.79738)	Top-1 acc 53.125 (49.021)	Top-5 acc 77.734 (72.382)	lr 0.02171
Train [29][1200/3239]	Time 0.627 (0.923)	Data Time 0.001 (0.022)	Loss 2.9962 (3.1348)	Entropy 0.79425 (0.79736)	Top-1 acc 54.297 (49.018)	Top-5 acc 74.609 (72.388)	lr 0.02171
Train [29][1210/3239]	Time 0.627 (0.923)	Data Time 0.001 (0.022)	Loss 3.1090 (3.1349)	Entropy 0.79424 (0.79733)	Top-1 acc 49.609 (49.015)	Top-5 acc 76.172 (72.392)	lr 0.02171
Train [29][1220/3239]	Time 0.610 (0.922)	Data Time 0.001 (0.022)	Loss 3.0894 (3.1350)	Entropy 0.79444 (0.79731)	Top-1 acc 45.703 (49.011)	Top-5 acc 71.875 (72.393)	lr 0.02171
Train [29][1230/3239]	Time 0.622 (0.922)	Data Time 0.001 (0.022)	Loss 3.2163 (3.1349)	Entropy 0.79396 (0.79728)	Top-1 acc 47.656 (49.009)	Top-5 acc 72.266 (72.391)	lr 0.02171
Train [29][1240/3239]	Time 0.627 (0.921)	Data Time 0.002 (0.022)	Loss 3.2109 (3.1349)	Entropy 0.79383 (0.79726)	Top-1 acc 50.391 (49.010)	Top-5 acc 71.875 (72.387)	lr 0.02171
Train [29][1250/3239]	Time 0.597 (0.921)	Data Time 0.001 (0.022)	Loss 3.1748 (3.1349)	Entropy 0.79383 (0.79723)	Top-1 acc 47.656 (49.006)	Top-5 acc 68.750 (72.380)	lr 0.02170
Train [29][1260/3239]	Time 0.717 (0.921)	Data Time 0.001 (0.021)	Loss 3.1403 (3.1342)	Entropy 0.79395 (0.79720)	Top-1 acc 50.391 (49.024)	Top-5 acc 70.703 (72.389)	lr 0.02170
Train [29][1270/3239]	Time 0.591 (0.920)	Data Time 0.001 (0.021)	Loss 3.0507 (3.1343)	Entropy 0.79375 (0.79718)	Top-1 acc 50.781 (49.027)	Top-5 acc 73.438 (72.392)	lr 0.02170
Train [29][1280/3239]	Time 0.600 (0.920)	Data Time 0.001 (0.021)	Loss 3.1385 (3.1351)	Entropy 0.79359 (0.79715)	Top-1 acc 47.656 (49.008)	Top-5 acc 72.266 (72.376)	lr 0.02170
Train [29][1290/3239]	Time 0.579 (0.919)	Data Time 0.001 (0.021)	Loss 3.0899 (3.1348)	Entropy 0.79380 (0.79712)	Top-1 acc 50.781 (49.023)	Top-5 acc 76.562 (72.384)	lr 0.02170
Train [29][1300/3239]	Time 0.640 (0.919)	Data Time 0.001 (0.021)	Loss 2.9846 (3.1348)	Entropy 0.79360 (0.79710)	Top-1 acc 53.516 (49.028)	Top-5 acc 76.953 (72.382)	lr 0.02170
Train [29][1310/3239]	Time 0.601 (0.918)	Data Time 0.001 (0.021)	Loss 3.3089 (3.1349)	Entropy 0.79325 (0.79707)	Top-1 acc 41.797 (49.030)	Top-5 acc 67.969 (72.381)	lr 0.02170
Train [29][1320/3239]	Time 0.476 (0.918)	Data Time 0.001 (0.021)	Loss 3.2104 (3.1347)	Entropy 0.79312 (0.79704)	Top-1 acc 48.047 (49.037)	Top-5 acc 71.484 (72.383)	lr 0.02170
Train [29][1330/3239]	Time 0.596 (0.917)	Data Time 0.001 (0.020)	Loss 3.0047 (3.1344)	Entropy 0.79300 (0.79701)	Top-1 acc 53.125 (49.043)	Top-5 acc 74.609 (72.387)	lr 0.02170
Train [29][1340/3239]	Time 0.610 (0.917)	Data Time 0.001 (0.020)	Loss 3.1321 (3.1341)	Entropy 0.79312 (0.79698)	Top-1 acc 48.438 (49.045)	Top-5 acc 74.219 (72.402)	lr 0.02170
Train [29][1350/3239]	Time 0.725 (0.916)	Data Time 0.001 (0.020)	Loss 3.1230 (3.1339)	Entropy 0.79330 (0.79695)	Top-1 acc 45.703 (49.048)	Top-5 acc 75.391 (72.407)	lr 0.02170
Train [29][1360/3239]	Time 0.603 (0.916)	Data Time 0.001 (0.020)	Loss 3.1893 (3.1339)	Entropy 0.79375 (0.79693)	Top-1 acc 47.656 (49.046)	Top-5 acc 71.094 (72.408)	lr 0.02170
Train [29][1370/3239]	Time 0.571 (0.916)	Data Time 0.001 (0.020)	Loss 2.9676 (3.1337)	Entropy 0.79406 (0.79691)	Top-1 acc 52.344 (49.047)	Top-5 acc 74.219 (72.412)	lr 0.02170
Train [29][1380/3239]	Time 0.636 (0.915)	Data Time 0.001 (0.020)	Loss 2.9735 (3.1332)	Entropy 0.79368 (0.79688)	Top-1 acc 55.469 (49.061)	Top-5 acc 75.781 (72.421)	lr 0.02170
Train [29][1390/3239]	Time 0.597 (0.915)	Data Time 0.001 (0.020)	Loss 3.2154 (3.1332)	Entropy 0.79390 (0.79686)	Top-1 acc 46.094 (49.061)	Top-5 acc 68.750 (72.425)	lr 0.02169
Train [29][1400/3239]	Time 0.612 (0.915)	Data Time 0.001 (0.019)	Loss 3.0866 (3.1331)	Entropy 0.79385 (0.79684)	Top-1 acc 48.438 (49.065)	Top-5 acc 70.703 (72.426)	lr 0.02169
Train [29][1410/3239]	Time 0.586 (0.914)	Data Time 0.001 (0.019)	Loss 3.1984 (3.1329)	Entropy 0.79351 (0.79682)	Top-1 acc 47.656 (49.071)	Top-5 acc 71.094 (72.440)	lr 0.02169
Train [29][1420/3239]	Time 0.726 (0.914)	Data Time 0.001 (0.019)	Loss 3.0904 (3.1330)	Entropy 0.79349 (0.79680)	Top-1 acc 50.391 (49.073)	Top-5 acc 73.828 (72.438)	lr 0.02169
Train [29][1430/3239]	Time 0.643 (0.914)	Data Time 0.001 (0.019)	Loss 3.0615 (3.1330)	Entropy 0.79311 (0.79677)	Top-1 acc 52.344 (49.075)	Top-5 acc 70.312 (72.437)	lr 0.02169
Train [29][1440/3239]	Time 0.598 (0.913)	Data Time 0.001 (0.019)	Loss 3.0994 (3.1329)	Entropy 0.79274 (0.79674)	Top-1 acc 49.609 (49.083)	Top-5 acc 73.047 (72.435)	lr 0.02169
Train [29][1450/3239]	Time 0.609 (0.913)	Data Time 0.001 (0.019)	Loss 2.9254 (3.1332)	Entropy 0.79279 (0.79672)	Top-1 acc 55.469 (49.077)	Top-5 acc 76.562 (72.428)	lr 0.02169
Train [29][1460/3239]	Time 0.618 (0.913)	Data Time 0.001 (0.019)	Loss 3.2320 (3.1331)	Entropy 0.79269 (0.79669)	Top-1 acc 47.266 (49.076)	Top-5 acc 71.484 (72.432)	lr 0.02169
Train [29][1470/3239]	Time 0.614 (0.912)	Data Time 0.002 (0.019)	Loss 2.9871 (3.1327)	Entropy 0.79230 (0.79666)	Top-1 acc 52.344 (49.083)	Top-5 acc 74.609 (72.437)	lr 0.02169
Train [29][1480/3239]	Time 0.592 (0.912)	Data Time 0.001 (0.019)	Loss 3.1871 (3.1323)	Entropy 0.79263 (0.79663)	Top-1 acc 45.312 (49.092)	Top-5 acc 72.266 (72.445)	lr 0.02169
Train [29][1490/3239]	Time 0.582 (0.911)	Data Time 0.001 (0.018)	Loss 3.2600 (3.1323)	Entropy 0.79226 (0.79661)	Top-1 acc 47.266 (49.092)	Top-5 acc 72.266 (72.445)	lr 0.02169
Train [29][1500/3239]	Time 0.650 (0.911)	Data Time 0.001 (0.018)	Loss 3.1329 (3.1324)	Entropy 0.79235 (0.79658)	Top-1 acc 49.609 (49.093)	Top-5 acc 71.875 (72.444)	lr 0.02169
Train [29][1510/3239]	Time 0.647 (0.910)	Data Time 0.001 (0.018)	Loss 3.0569 (3.1320)	Entropy 0.79232 (0.79655)	Top-1 acc 52.734 (49.102)	Top-5 acc 77.734 (72.454)	lr 0.02169
Train [29][1520/3239]	Time 0.575 (0.910)	Data Time 0.001 (0.018)	Loss 3.1780 (3.1317)	Entropy 0.79195 (0.79652)	Top-1 acc 45.312 (49.103)	Top-5 acc 72.656 (72.465)	lr 0.02169
Train [29][1530/3239]	Time 0.613 (0.910)	Data Time 0.001 (0.018)	Loss 3.3086 (3.1317)	Entropy 0.79185 (0.79649)	Top-1 acc 47.266 (49.107)	Top-5 acc 67.188 (72.463)	lr 0.02169
Train [29][1540/3239]	Time 0.599 (0.910)	Data Time 0.001 (0.018)	Loss 3.1864 (3.1318)	Entropy 0.79177 (0.79646)	Top-1 acc 46.484 (49.106)	Top-5 acc 73.047 (72.462)	lr 0.02168
Train [29][1550/3239]	Time 0.602 (0.909)	Data Time 0.001 (0.018)	Loss 3.1908 (3.1321)	Entropy 0.79193 (0.79643)	Top-1 acc 51.172 (49.098)	Top-5 acc 70.703 (72.458)	lr 0.02168
Train [29][1560/3239]	Time 0.639 (0.909)	Data Time 0.001 (0.018)	Loss 2.9389 (3.1316)	Entropy 0.79181 (0.79640)	Top-1 acc 54.297 (49.113)	Top-5 acc 76.562 (72.473)	lr 0.02168
Train [29][1570/3239]	Time 0.613 (0.909)	Data Time 0.001 (0.018)	Loss 2.9848 (3.1314)	Entropy 0.79194 (0.79637)	Top-1 acc 50.781 (49.118)	Top-5 acc 76.953 (72.482)	lr 0.02168
Train [29][1580/3239]	Time 0.690 (0.909)	Data Time 0.001 (0.017)	Loss 3.2150 (3.1313)	Entropy 0.79205 (0.79634)	Top-1 acc 48.047 (49.122)	Top-5 acc 73.438 (72.486)	lr 0.02168
Train [29][1590/3239]	Time 0.545 (0.908)	Data Time 0.001 (0.017)	Loss 3.1473 (3.1311)	Entropy 0.79199 (0.79632)	Top-1 acc 51.172 (49.128)	Top-5 acc 73.047 (72.489)	lr 0.02168
Train [29][1600/3239]	Time 0.616 (0.908)	Data Time 0.001 (0.017)	Loss 3.2496 (3.1314)	Entropy 0.79192 (0.79629)	Top-1 acc 45.703 (49.117)	Top-5 acc 69.922 (72.483)	lr 0.02168
Train [29][1610/3239]	Time 0.575 (0.924)	Data Time 0.002 (0.017)	Loss 3.4118 (3.1316)	Entropy 0.79205 (0.79626)	Top-1 acc 44.922 (49.116)	Top-5 acc 67.188 (72.479)	lr 0.02168
Train [29][1620/3239]	Time 0.585 (0.923)	Data Time 0.002 (0.017)	Loss 3.1398 (3.1312)	Entropy 0.79204 (0.79624)	Top-1 acc 48.828 (49.124)	Top-5 acc 71.094 (72.489)	lr 0.02168
Train [29][1630/3239]	Time 0.620 (0.923)	Data Time 0.001 (0.017)	Loss 3.0746 (3.1311)	Entropy 0.79132 (0.79621)	Top-1 acc 50.391 (49.128)	Top-5 acc 73.828 (72.493)	lr 0.02168
Train [29][1640/3239]	Time 0.601 (0.923)	Data Time 0.001 (0.017)	Loss 2.9496 (3.1311)	Entropy 0.79105 (0.79618)	Top-1 acc 53.125 (49.136)	Top-5 acc 77.344 (72.493)	lr 0.02168
Train [29][1650/3239]	Time 0.598 (0.922)	Data Time 0.001 (0.017)	Loss 3.2101 (3.1308)	Entropy 0.79108 (0.79615)	Top-1 acc 48.828 (49.142)	Top-5 acc 69.531 (72.499)	lr 0.02168
Train [29][1660/3239]	Time 0.578 (0.922)	Data Time 0.001 (0.017)	Loss 3.1024 (3.1307)	Entropy 0.79113 (0.79612)	Top-1 acc 51.172 (49.151)	Top-5 acc 71.875 (72.503)	lr 0.02168
Train [29][1670/3239]	Time 0.701 (0.922)	Data Time 0.001 (0.017)	Loss 2.9895 (3.1303)	Entropy 0.79124 (0.79609)	Top-1 acc 49.609 (49.154)	Top-5 acc 77.344 (72.515)	lr 0.02168
Train [29][1680/3239]	Time 0.629 (0.921)	Data Time 0.001 (0.017)	Loss 3.4257 (3.1310)	Entropy 0.79131 (0.79606)	Top-1 acc 42.188 (49.137)	Top-5 acc 66.016 (72.498)	lr 0.02167
Train [29][1690/3239]	Time 0.618 (0.921)	Data Time 0.001 (0.016)	Loss 3.1637 (3.1309)	Entropy 0.79095 (0.79603)	Top-1 acc 50.781 (49.143)	Top-5 acc 74.219 (72.503)	lr 0.02167
Train [29][1700/3239]	Time 0.595 (0.921)	Data Time 0.001 (0.016)	Loss 3.1412 (3.1305)	Entropy 0.79073 (0.79600)	Top-1 acc 49.609 (49.148)	Top-5 acc 73.047 (72.511)	lr 0.02167
Train [29][1710/3239]	Time 0.607 (0.920)	Data Time 0.001 (0.016)	Loss 3.1830 (3.1303)	Entropy 0.79021 (0.79597)	Top-1 acc 49.219 (49.155)	Top-5 acc 72.656 (72.520)	lr 0.02167
Train [29][1720/3239]	Time 0.610 (0.920)	Data Time 0.001 (0.016)	Loss 3.0914 (3.1305)	Entropy 0.79034 (0.79594)	Top-1 acc 48.828 (49.154)	Top-5 acc 71.484 (72.515)	lr 0.02167
Train [29][1730/3239]	Time 0.542 (0.920)	Data Time 0.001 (0.016)	Loss 3.1069 (3.1306)	Entropy 0.79037 (0.79590)	Top-1 acc 48.438 (49.157)	Top-5 acc 72.266 (72.508)	lr 0.02167
Train [29][1740/3239]	Time 0.682 (0.919)	Data Time 0.001 (0.016)	Loss 2.9549 (3.1304)	Entropy 0.79056 (0.79587)	Top-1 acc 54.688 (49.164)	Top-5 acc 72.656 (72.507)	lr 0.02167
Train [29][1750/3239]	Time 0.604 (0.919)	Data Time 0.001 (0.016)	Loss 2.7971 (3.1301)	Entropy 0.79055 (0.79584)	Top-1 acc 57.031 (49.170)	Top-5 acc 78.125 (72.512)	lr 0.02167
Train [29][1760/3239]	Time 0.626 (0.919)	Data Time 0.001 (0.016)	Loss 3.2862 (3.1300)	Entropy 0.79070 (0.79581)	Top-1 acc 45.703 (49.166)	Top-5 acc 70.312 (72.513)	lr 0.02167
Train [29][1770/3239]	Time 0.626 (0.918)	Data Time 0.001 (0.016)	Loss 3.1431 (3.1302)	Entropy 0.79057 (0.79578)	Top-1 acc 48.047 (49.160)	Top-5 acc 72.266 (72.511)	lr 0.02167
Train [29][1780/3239]	Time 0.598 (0.918)	Data Time 0.001 (0.016)	Loss 2.9928 (3.1303)	Entropy 0.79041 (0.79575)	Top-1 acc 52.734 (49.158)	Top-5 acc 75.000 (72.512)	lr 0.02167
Train [29][1790/3239]	Time 0.626 (0.917)	Data Time 0.001 (0.016)	Loss 3.1094 (3.1301)	Entropy 0.79005 (0.79572)	Top-1 acc 49.219 (49.162)	Top-5 acc 76.172 (72.517)	lr 0.02167
Train [29][1800/3239]	Time 0.632 (0.917)	Data Time 0.002 (0.016)	Loss 3.0871 (3.1299)	Entropy 0.78998 (0.79569)	Top-1 acc 48.438 (49.164)	Top-5 acc 69.922 (72.520)	lr 0.02167
Train [29][1810/3239]	Time 0.572 (0.917)	Data Time 0.001 (0.015)	Loss 3.2628 (3.1303)	Entropy 0.79007 (0.79566)	Top-1 acc 46.094 (49.157)	Top-5 acc 69.922 (72.507)	lr 0.02167
Train [29][1820/3239]	Time 0.634 (0.917)	Data Time 0.001 (0.015)	Loss 3.2650 (3.1305)	Entropy 0.78996 (0.79563)	Top-1 acc 45.703 (49.151)	Top-5 acc 69.531 (72.502)	lr 0.02167
Train [29][1830/3239]	Time 0.623 (0.916)	Data Time 0.001 (0.015)	Loss 2.9701 (3.1302)	Entropy 0.79025 (0.79560)	Top-1 acc 53.906 (49.158)	Top-5 acc 73.047 (72.503)	lr 0.02166
Train [29][1840/3239]	Time 0.601 (0.916)	Data Time 0.001 (0.015)	Loss 3.1163 (3.1300)	Entropy 0.78975 (0.79557)	Top-1 acc 47.656 (49.161)	Top-5 acc 71.875 (72.504)	lr 0.02166
Train [29][1850/3239]	Time 0.589 (0.916)	Data Time 0.001 (0.015)	Loss 3.1022 (3.1296)	Entropy 0.78988 (0.79554)	Top-1 acc 49.609 (49.168)	Top-5 acc 73.438 (72.514)	lr 0.02166
Train [29][1860/3239]	Time 0.593 (0.915)	Data Time 0.001 (0.015)	Loss 3.4393 (3.1296)	Entropy 0.78968 (0.79551)	Top-1 acc 43.359 (49.170)	Top-5 acc 65.234 (72.517)	lr 0.02166
Train [29][1870/3239]	Time 0.640 (0.915)	Data Time 0.001 (0.015)	Loss 3.0679 (3.1298)	Entropy 0.78940 (0.79547)	Top-1 acc 48.047 (49.161)	Top-5 acc 72.656 (72.512)	lr 0.02166
Train [29][1880/3239]	Time 0.638 (0.915)	Data Time 0.003 (0.015)	Loss 3.0298 (3.1298)	Entropy 0.78939 (0.79544)	Top-1 acc 53.906 (49.160)	Top-5 acc 75.391 (72.514)	lr 0.02166
Train [29][1890/3239]	Time 0.617 (0.915)	Data Time 0.001 (0.015)	Loss 3.0325 (3.1297)	Entropy 0.78914 (0.79541)	Top-1 acc 51.172 (49.167)	Top-5 acc 76.953 (72.511)	lr 0.02166
Train [29][1900/3239]	Time 0.672 (0.914)	Data Time 0.001 (0.015)	Loss 2.9461 (3.1297)	Entropy 0.78887 (0.79538)	Top-1 acc 53.516 (49.165)	Top-5 acc 77.734 (72.511)	lr 0.02166
Train [29][1910/3239]	Time 0.607 (0.914)	Data Time 0.001 (0.015)	Loss 3.1081 (3.1297)	Entropy 0.78863 (0.79534)	Top-1 acc 49.609 (49.166)	Top-5 acc 77.344 (72.509)	lr 0.02166
Train [29][1920/3239]	Time 0.574 (0.914)	Data Time 0.001 (0.015)	Loss 3.3383 (3.1298)	Entropy 0.78874 (0.79531)	Top-1 acc 44.141 (49.165)	Top-5 acc 69.141 (72.508)	lr 0.02166
Train [29][1930/3239]	Time 0.652 (0.914)	Data Time 0.001 (0.015)	Loss 3.0845 (3.1299)	Entropy 0.78814 (0.79527)	Top-1 acc 51.172 (49.163)	Top-5 acc 72.656 (72.508)	lr 0.02166
Train [29][1940/3239]	Time 0.629 (0.913)	Data Time 0.001 (0.015)	Loss 3.0558 (3.1296)	Entropy 0.78833 (0.79524)	Top-1 acc 51.172 (49.168)	Top-5 acc 72.656 (72.511)	lr 0.02166
Train [29][1950/3239]	Time 0.591 (0.913)	Data Time 0.001 (0.015)	Loss 3.1968 (3.1296)	Entropy 0.78850 (0.79520)	Top-1 acc 46.094 (49.168)	Top-5 acc 72.656 (72.514)	lr 0.02166
Train [29][1960/3239]	Time 0.631 (0.912)	Data Time 0.001 (0.014)	Loss 3.3470 (3.1298)	Entropy 0.78876 (0.79517)	Top-1 acc 44.141 (49.159)	Top-5 acc 69.922 (72.510)	lr 0.02166
Train [29][1970/3239]	Time 0.713 (0.912)	Data Time 0.001 (0.014)	Loss 3.1348 (3.1298)	Entropy 0.78799 (0.79513)	Top-1 acc 48.828 (49.153)	Top-5 acc 74.609 (72.509)	lr 0.02165
Train [29][1980/3239]	Time 0.613 (0.912)	Data Time 0.002 (0.014)	Loss 3.2637 (3.1298)	Entropy 0.78823 (0.79510)	Top-1 acc 46.094 (49.151)	Top-5 acc 64.062 (72.509)	lr 0.02165
Train [29][1990/3239]	Time 0.577 (0.912)	Data Time 0.001 (0.014)	Loss 3.1056 (3.1297)	Entropy 0.78812 (0.79506)	Top-1 acc 49.609 (49.152)	Top-5 acc 73.438 (72.511)	lr 0.02165
Train [29][2000/3239]	Time 0.564 (0.911)	Data Time 0.002 (0.014)	Loss 3.0226 (3.1298)	Entropy 0.78845 (0.79503)	Top-1 acc 50.781 (49.150)	Top-5 acc 73.047 (72.507)	lr 0.02165
Train [29][2010/3239]	Time 0.580 (0.911)	Data Time 0.002 (0.014)	Loss 3.0976 (3.1300)	Entropy 0.78843 (0.79499)	Top-1 acc 49.609 (49.146)	Top-5 acc 76.172 (72.504)	lr 0.02165
Train [29][2020/3239]	Time 0.581 (0.911)	Data Time 0.001 (0.014)	Loss 3.1019 (3.1297)	Entropy 0.78823 (0.79496)	Top-1 acc 53.516 (49.151)	Top-5 acc 71.484 (72.506)	lr 0.02165
Train [29][2030/3239]	Time 0.590 (0.911)	Data Time 0.001 (0.014)	Loss 3.2120 (3.1299)	Entropy 0.78777 (0.79493)	Top-1 acc 43.750 (49.142)	Top-5 acc 68.359 (72.504)	lr 0.02165
Train [29][2040/3239]	Time 0.621 (0.910)	Data Time 0.001 (0.014)	Loss 3.1180 (3.1297)	Entropy 0.78779 (0.79489)	Top-1 acc 50.781 (49.149)	Top-5 acc 72.266 (72.509)	lr 0.02165
Train [29][2050/3239]	Time 0.605 (0.910)	Data Time 0.001 (0.014)	Loss 3.0842 (3.1298)	Entropy 0.78780 (0.79486)	Top-1 acc 50.781 (49.148)	Top-5 acc 72.266 (72.506)	lr 0.02165
Train [29][2060/3239]	Time 0.698 (0.910)	Data Time 0.001 (0.014)	Loss 3.1546 (3.1295)	Entropy 0.78786 (0.79482)	Top-1 acc 50.781 (49.156)	Top-5 acc 71.875 (72.510)	lr 0.02165
Train [29][2070/3239]	Time 0.624 (0.910)	Data Time 0.001 (0.014)	Loss 3.0442 (3.1293)	Entropy 0.78728 (0.79479)	Top-1 acc 48.828 (49.163)	Top-5 acc 73.438 (72.516)	lr 0.02165
Train [29][2080/3239]	Time 0.583 (0.910)	Data Time 0.001 (0.014)	Loss 3.2207 (3.1290)	Entropy 0.78683 (0.79475)	Top-1 acc 47.656 (49.165)	Top-5 acc 69.141 (72.522)	lr 0.02165
Train [29][2090/3239]	Time 0.574 (0.909)	Data Time 0.001 (0.014)	Loss 3.2073 (3.1291)	Entropy 0.78710 (0.79471)	Top-1 acc 42.969 (49.163)	Top-5 acc 69.922 (72.522)	lr 0.02165
Train [29][2100/3239]	Time 0.622 (0.909)	Data Time 0.001 (0.014)	Loss 3.1609 (3.1292)	Entropy 0.78675 (0.79468)	Top-1 acc 49.609 (49.159)	Top-5 acc 73.828 (72.518)	lr 0.02165
Train [29][2110/3239]	Time 0.618 (0.909)	Data Time 0.001 (0.014)	Loss 2.9651 (3.1289)	Entropy 0.78702 (0.79464)	Top-1 acc 53.125 (49.162)	Top-5 acc 75.391 (72.524)	lr 0.02165
Train [29][2120/3239]	Time 0.578 (0.908)	Data Time 0.001 (0.014)	Loss 3.1928 (3.1285)	Entropy 0.78691 (0.79460)	Top-1 acc 48.047 (49.173)	Top-5 acc 71.875 (72.534)	lr 0.02164
Train [29][2130/3239]	Time 0.598 (0.908)	Data Time 0.001 (0.013)	Loss 3.2077 (3.1283)	Entropy 0.78701 (0.79457)	Top-1 acc 48.438 (49.177)	Top-5 acc 69.531 (72.537)	lr 0.02164
Train [29][2140/3239]	Time 0.634 (0.908)	Data Time 0.001 (0.013)	Loss 3.0296 (3.1285)	Entropy 0.78666 (0.79453)	Top-1 acc 51.172 (49.170)	Top-5 acc 75.781 (72.530)	lr 0.02164
Train [29][2150/3239]	Time 0.567 (0.908)	Data Time 0.001 (0.013)	Loss 3.0645 (3.1284)	Entropy 0.78664 (0.79450)	Top-1 acc 50.781 (49.174)	Top-5 acc 74.609 (72.531)	lr 0.02164
Train [29][2160/3239]	Time 0.571 (0.908)	Data Time 0.001 (0.013)	Loss 3.2778 (3.1282)	Entropy 0.78667 (0.79446)	Top-1 acc 46.484 (49.178)	Top-5 acc 66.016 (72.533)	lr 0.02164
Train [29][2170/3239]	Time 0.610 (0.907)	Data Time 0.001 (0.013)	Loss 3.0228 (3.1282)	Entropy 0.78640 (0.79442)	Top-1 acc 50.000 (49.178)	Top-5 acc 73.047 (72.532)	lr 0.02164
Train [29][2180/3239]	Time 0.603 (0.907)	Data Time 0.001 (0.013)	Loss 3.2905 (3.1282)	Entropy 0.78627 (0.79439)	Top-1 acc 45.703 (49.181)	Top-5 acc 69.922 (72.531)	lr 0.02164
Train [29][2190/3239]	Time 0.619 (0.907)	Data Time 0.001 (0.013)	Loss 3.1961 (3.1285)	Entropy 0.78643 (0.79435)	Top-1 acc 45.312 (49.173)	Top-5 acc 69.531 (72.528)	lr 0.02164
Train [29][2200/3239]	Time 0.651 (0.907)	Data Time 0.001 (0.013)	Loss 3.1571 (3.1286)	Entropy 0.78633 (0.79431)	Top-1 acc 46.875 (49.166)	Top-5 acc 73.047 (72.526)	lr 0.02164
Train [29][2210/3239]	Time 0.631 (0.907)	Data Time 0.001 (0.013)	Loss 3.0127 (3.1285)	Entropy 0.78596 (0.79428)	Top-1 acc 51.562 (49.171)	Top-5 acc 74.219 (72.530)	lr 0.02164
Train [29][2220/3239]	Time 0.592 (0.906)	Data Time 0.001 (0.013)	Loss 3.3358 (3.1283)	Entropy 0.78621 (0.79424)	Top-1 acc 46.094 (49.173)	Top-5 acc 68.750 (72.530)	lr 0.02164
Train [29][2230/3239]	Time 0.605 (0.906)	Data Time 0.001 (0.013)	Loss 3.2556 (3.1283)	Entropy 0.78626 (0.79420)	Top-1 acc 45.312 (49.172)	Top-5 acc 69.922 (72.528)	lr 0.02164
Train [29][2240/3239]	Time 0.653 (0.906)	Data Time 0.001 (0.013)	Loss 3.0562 (3.1283)	Entropy 0.78588 (0.79417)	Top-1 acc 50.000 (49.174)	Top-5 acc 71.875 (72.527)	lr 0.02164
Train [29][2250/3239]	Time 0.630 (0.906)	Data Time 0.001 (0.013)	Loss 3.0210 (3.1281)	Entropy 0.78535 (0.79413)	Top-1 acc 51.562 (49.179)	Top-5 acc 75.000 (72.530)	lr 0.02164
Train [29][2260/3239]	Time 0.793 (0.917)	Data Time 0.006 (0.013)	Loss 3.1063 (3.1285)	Entropy 0.78557 (0.79409)	Top-1 acc 50.391 (49.166)	Top-5 acc 74.219 (72.523)	lr 0.02164
Train [29][2270/3239]	Time 0.588 (0.916)	Data Time 0.002 (0.013)	Loss 3.0121 (3.1284)	Entropy 0.78542 (0.79405)	Top-1 acc 52.734 (49.167)	Top-5 acc 74.219 (72.523)	lr 0.02163
Train [29][2280/3239]	Time 0.624 (0.916)	Data Time 0.001 (0.013)	Loss 3.2661 (3.1288)	Entropy 0.78535 (0.79402)	Top-1 acc 46.484 (49.156)	Top-5 acc 70.312 (72.514)	lr 0.02163
Train [29][2290/3239]	Time 0.723 (0.916)	Data Time 0.001 (0.013)	Loss 3.2269 (3.1286)	Entropy 0.78532 (0.79398)	Top-1 acc 49.219 (49.158)	Top-5 acc 70.703 (72.518)	lr 0.02163
Train [29][2300/3239]	Time 0.627 (0.916)	Data Time 0.001 (0.013)	Loss 3.3955 (3.1287)	Entropy 0.78508 (0.79394)	Top-1 acc 42.969 (49.154)	Top-5 acc 66.016 (72.515)	lr 0.02163
Train [29][2310/3239]	Time 0.601 (0.916)	Data Time 0.001 (0.013)	Loss 3.2110 (3.1289)	Entropy 0.78536 (0.79390)	Top-1 acc 48.828 (49.151)	Top-5 acc 71.875 (72.508)	lr 0.02163
Train [29][2320/3239]	Time 0.589 (0.916)	Data Time 0.001 (0.013)	Loss 3.1857 (3.1288)	Entropy 0.78556 (0.79387)	Top-1 acc 49.609 (49.153)	Top-5 acc 69.922 (72.506)	lr 0.02163
Train [29][2330/3239]	Time 0.612 (0.915)	Data Time 0.001 (0.012)	Loss 3.0397 (3.1286)	Entropy 0.78564 (0.79383)	Top-1 acc 53.516 (49.158)	Top-5 acc 72.266 (72.509)	lr 0.02163
Train [29][2340/3239]	Time 0.636 (0.915)	Data Time 0.001 (0.012)	Loss 2.9781 (3.1289)	Entropy 0.78557 (0.79380)	Top-1 acc 51.953 (49.145)	Top-5 acc 77.344 (72.507)	lr 0.02163
Train [29][2350/3239]	Time 0.615 (0.915)	Data Time 0.001 (0.012)	Loss 3.0129 (3.1291)	Entropy 0.78561 (0.79376)	Top-1 acc 53.906 (49.136)	Top-5 acc 74.609 (72.504)	lr 0.02163
Train [29][2360/3239]	Time 0.609 (0.915)	Data Time 0.001 (0.012)	Loss 3.5390 (3.1294)	Entropy 0.78508 (0.79373)	Top-1 acc 39.844 (49.130)	Top-5 acc 64.844 (72.503)	lr 0.02163
Train [29][2370/3239]	Time 0.605 (0.915)	Data Time 0.001 (0.012)	Loss 3.1310 (3.1293)	Entropy 0.78525 (0.79369)	Top-1 acc 50.000 (49.132)	Top-5 acc 71.094 (72.502)	lr 0.02163
Train [29][2380/3239]	Time 0.603 (0.914)	Data Time 0.001 (0.012)	Loss 3.2712 (3.1294)	Entropy 0.78466 (0.79365)	Top-1 acc 44.922 (49.127)	Top-5 acc 69.922 (72.503)	lr 0.02163
Train [29][2390/3239]	Time 0.618 (0.914)	Data Time 0.001 (0.012)	Loss 3.1935 (3.1293)	Entropy 0.78481 (0.79362)	Top-1 acc 46.094 (49.127)	Top-5 acc 69.531 (72.504)	lr 0.02163
Train [29][2400/3239]	Time 0.646 (0.914)	Data Time 0.001 (0.012)	Loss 3.2058 (3.1298)	Entropy 0.78495 (0.79358)	Top-1 acc 47.266 (49.119)	Top-5 acc 71.094 (72.492)	lr 0.02163
Train [29][2410/3239]	Time 0.612 (0.914)	Data Time 0.001 (0.012)	Loss 2.9962 (3.1296)	Entropy 0.78504 (0.79354)	Top-1 acc 53.516 (49.124)	Top-5 acc 73.047 (72.492)	lr 0.02162
Train [29][2420/3239]	Time 0.611 (0.913)	Data Time 0.001 (0.012)	Loss 3.1298 (3.1298)	Entropy 0.78520 (0.79351)	Top-1 acc 49.219 (49.121)	Top-5 acc 74.219 (72.490)	lr 0.02162
Train [29][2430/3239]	Time 0.600 (0.913)	Data Time 0.001 (0.012)	Loss 3.1511 (3.1298)	Entropy 0.78558 (0.79348)	Top-1 acc 48.828 (49.122)	Top-5 acc 73.828 (72.489)	lr 0.02162
Train [29][2440/3239]	Time 0.620 (0.913)	Data Time 0.001 (0.012)	Loss 3.2490 (3.1297)	Entropy 0.78485 (0.79344)	Top-1 acc 46.094 (49.126)	Top-5 acc 69.922 (72.493)	lr 0.02162
Train [29][2450/3239]	Time 0.680 (0.913)	Data Time 0.001 (0.012)	Loss 3.1010 (3.1297)	Entropy 0.78459 (0.79341)	Top-1 acc 51.172 (49.128)	Top-5 acc 73.438 (72.495)	lr 0.02162
Train [29][2460/3239]	Time 0.613 (0.912)	Data Time 0.001 (0.012)	Loss 3.0933 (3.1295)	Entropy 0.78496 (0.79337)	Top-1 acc 51.562 (49.131)	Top-5 acc 71.875 (72.497)	lr 0.02162
Train [29][2470/3239]	Time 0.597 (0.912)	Data Time 0.001 (0.012)	Loss 3.0392 (3.1299)	Entropy 0.78495 (0.79334)	Top-1 acc 47.656 (49.123)	Top-5 acc 73.438 (72.490)	lr 0.02162
Train [29][2480/3239]	Time 0.648 (0.912)	Data Time 0.001 (0.012)	Loss 3.0382 (3.1296)	Entropy 0.78518 (0.79330)	Top-1 acc 54.297 (49.128)	Top-5 acc 72.656 (72.493)	lr 0.02162
Train [29][2490/3239]	Time 0.624 (0.912)	Data Time 0.002 (0.012)	Loss 3.1166 (3.1296)	Entropy 0.78480 (0.79327)	Top-1 acc 48.047 (49.127)	Top-5 acc 73.438 (72.497)	lr 0.02162
Train [29][2500/3239]	Time 0.580 (0.912)	Data Time 0.001 (0.012)	Loss 3.3670 (3.1297)	Entropy 0.78507 (0.79324)	Top-1 acc 43.359 (49.123)	Top-5 acc 67.969 (72.494)	lr 0.02162
Train [29][2510/3239]	Time 0.575 (0.911)	Data Time 0.001 (0.012)	Loss 3.1340 (3.1299)	Entropy 0.78501 (0.79321)	Top-1 acc 51.172 (49.124)	Top-5 acc 69.531 (72.490)	lr 0.02162
Train [29][2520/3239]	Time 0.715 (0.911)	Data Time 0.004 (0.012)	Loss 3.1060 (3.1297)	Entropy 0.78461 (0.79317)	Top-1 acc 50.391 (49.122)	Top-5 acc 73.047 (72.496)	lr 0.02162
Train [29][2530/3239]	Time 0.609 (0.911)	Data Time 0.001 (0.012)	Loss 2.8795 (3.1293)	Entropy 0.78457 (0.79314)	Top-1 acc 56.641 (49.131)	Top-5 acc 77.734 (72.506)	lr 0.02162
Train [29][2540/3239]	Time 0.589 (0.911)	Data Time 0.001 (0.012)	Loss 3.2137 (3.1294)	Entropy 0.78390 (0.79310)	Top-1 acc 44.922 (49.128)	Top-5 acc 69.922 (72.505)	lr 0.02162
Train [29][2550/3239]	Time 0.599 (0.911)	Data Time 0.001 (0.012)	Loss 2.9886 (3.1293)	Entropy 0.78367 (0.79307)	Top-1 acc 54.688 (49.129)	Top-5 acc 73.828 (72.503)	lr 0.02162
Train [29][2560/3239]	Time 0.581 (0.911)	Data Time 0.001 (0.012)	Loss 3.2689 (3.1293)	Entropy 0.78329 (0.79303)	Top-1 acc 43.750 (49.127)	Top-5 acc 69.922 (72.506)	lr 0.02161
Train [29][2570/3239]	Time 0.507 (0.910)	Data Time 0.001 (0.011)	Loss 3.3973 (3.1295)	Entropy 0.78272 (0.79299)	Top-1 acc 40.234 (49.125)	Top-5 acc 68.750 (72.504)	lr 0.02161
Train [29][2580/3239]	Time 0.603 (0.910)	Data Time 0.001 (0.011)	Loss 3.0255 (3.1294)	Entropy 0.78287 (0.79295)	Top-1 acc 54.297 (49.122)	Top-5 acc 74.609 (72.505)	lr 0.02161
Train [29][2590/3239]	Time 0.573 (0.910)	Data Time 0.001 (0.011)	Loss 3.1286 (3.1293)	Entropy 0.78279 (0.79291)	Top-1 acc 51.172 (49.126)	Top-5 acc 74.219 (72.507)	lr 0.02161
Train [29][2600/3239]	Time 0.620 (0.910)	Data Time 0.001 (0.011)	Loss 3.2433 (3.1291)	Entropy 0.78309 (0.79288)	Top-1 acc 50.000 (49.137)	Top-5 acc 71.875 (72.511)	lr 0.02161
Train [29][2610/3239]	Time 0.721 (0.910)	Data Time 0.001 (0.011)	Loss 3.2718 (3.1291)	Entropy 0.78311 (0.79284)	Top-1 acc 45.312 (49.132)	Top-5 acc 70.703 (72.515)	lr 0.02161
Train [29][2620/3239]	Time 0.634 (0.909)	Data Time 0.001 (0.011)	Loss 3.0626 (3.1291)	Entropy 0.78301 (0.79280)	Top-1 acc 50.391 (49.128)	Top-5 acc 73.438 (72.518)	lr 0.02161
Train [29][2630/3239]	Time 0.610 (0.909)	Data Time 0.002 (0.011)	Loss 3.1209 (3.1291)	Entropy 0.78332 (0.79277)	Top-1 acc 50.000 (49.133)	Top-5 acc 75.391 (72.520)	lr 0.02161
Train [29][2640/3239]	Time 0.622 (0.909)	Data Time 0.001 (0.011)	Loss 3.2457 (3.1293)	Entropy 0.78331 (0.79273)	Top-1 acc 48.828 (49.131)	Top-5 acc 69.922 (72.514)	lr 0.02161
Train [29][2650/3239]	Time 0.607 (0.909)	Data Time 0.001 (0.011)	Loss 3.1456 (3.1291)	Entropy 0.78367 (0.79269)	Top-1 acc 46.875 (49.133)	Top-5 acc 72.656 (72.522)	lr 0.02161
Train [29][2660/3239]	Time 0.612 (0.909)	Data Time 0.001 (0.011)	Loss 3.0541 (3.1291)	Entropy 0.78346 (0.79266)	Top-1 acc 48.828 (49.131)	Top-5 acc 73.828 (72.522)	lr 0.02161
Train [29][2670/3239]	Time 0.627 (0.909)	Data Time 0.002 (0.011)	Loss 3.2458 (3.1293)	Entropy 0.78327 (0.79263)	Top-1 acc 48.047 (49.132)	Top-5 acc 70.703 (72.515)	lr 0.02161
Train [29][2680/3239]	Time 0.716 (0.908)	Data Time 0.001 (0.011)	Loss 2.9560 (3.1293)	Entropy 0.78322 (0.79259)	Top-1 acc 54.688 (49.131)	Top-5 acc 78.125 (72.518)	lr 0.02161
Train [29][2690/3239]	Time 0.572 (0.908)	Data Time 0.001 (0.011)	Loss 2.9971 (3.1291)	Entropy 0.78302 (0.79256)	Top-1 acc 49.609 (49.130)	Top-5 acc 75.000 (72.521)	lr 0.02161
Train [29][2700/3239]	Time 0.619 (0.908)	Data Time 0.001 (0.011)	Loss 3.1654 (3.1291)	Entropy 0.78328 (0.79252)	Top-1 acc 45.703 (49.128)	Top-5 acc 71.875 (72.525)	lr 0.02160
Train [29][2710/3239]	Time 0.612 (0.908)	Data Time 0.001 (0.011)	Loss 3.0602 (3.1290)	Entropy 0.78314 (0.79249)	Top-1 acc 52.344 (49.135)	Top-5 acc 75.781 (72.525)	lr 0.02160
Train [29][2720/3239]	Time 0.629 (0.908)	Data Time 0.001 (0.011)	Loss 3.2387 (3.1287)	Entropy 0.78304 (0.79245)	Top-1 acc 44.922 (49.141)	Top-5 acc 69.141 (72.529)	lr 0.02160
Train [29][2730/3239]	Time 0.633 (0.908)	Data Time 0.001 (0.011)	Loss 3.3334 (3.1288)	Entropy 0.78292 (0.79242)	Top-1 acc 41.797 (49.137)	Top-5 acc 67.578 (72.526)	lr 0.02160
Train [29][2740/3239]	Time 0.584 (0.907)	Data Time 0.001 (0.011)	Loss 3.2366 (3.1289)	Entropy 0.78286 (0.79238)	Top-1 acc 50.000 (49.134)	Top-5 acc 71.094 (72.522)	lr 0.02160
Train [29][2750/3239]	Time 0.609 (0.907)	Data Time 0.001 (0.011)	Loss 2.9512 (3.1287)	Entropy 0.78252 (0.79235)	Top-1 acc 52.344 (49.140)	Top-5 acc 78.516 (72.526)	lr 0.02160
Train [29][2760/3239]	Time 0.572 (0.907)	Data Time 0.001 (0.011)	Loss 2.9213 (3.1286)	Entropy 0.78256 (0.79231)	Top-1 acc 51.953 (49.142)	Top-5 acc 76.562 (72.530)	lr 0.02160
Train [29][2770/3239]	Time 0.470 (0.907)	Data Time 0.001 (0.011)	Loss 2.9954 (3.1287)	Entropy 0.78273 (0.79228)	Top-1 acc 51.562 (49.141)	Top-5 acc 74.609 (72.527)	lr 0.02160
Train [29][2780/3239]	Time 0.661 (0.907)	Data Time 0.001 (0.011)	Loss 3.2991 (3.1289)	Entropy 0.78294 (0.79224)	Top-1 acc 48.047 (49.138)	Top-5 acc 69.141 (72.518)	lr 0.02160
Train [29][2790/3239]	Time 0.626 (0.906)	Data Time 0.001 (0.011)	Loss 2.9476 (3.1291)	Entropy 0.78260 (0.79221)	Top-1 acc 54.297 (49.138)	Top-5 acc 74.609 (72.513)	lr 0.02160
Train [29][2800/3239]	Time 0.592 (0.906)	Data Time 0.001 (0.011)	Loss 2.7916 (3.1290)	Entropy 0.78250 (0.79218)	Top-1 acc 55.469 (49.140)	Top-5 acc 81.250 (72.513)	lr 0.02160
Train [29][2810/3239]	Time 0.612 (0.906)	Data Time 0.001 (0.011)	Loss 3.2051 (3.1290)	Entropy 0.78260 (0.79214)	Top-1 acc 43.750 (49.137)	Top-5 acc 69.922 (72.510)	lr 0.02160
Train [29][2820/3239]	Time 0.604 (0.906)	Data Time 0.001 (0.011)	Loss 2.8317 (3.1289)	Entropy 0.78269 (0.79211)	Top-1 acc 57.422 (49.139)	Top-5 acc 80.078 (72.512)	lr 0.02160
Train [29][2830/3239]	Time 0.623 (0.906)	Data Time 0.001 (0.011)	Loss 2.9601 (3.1288)	Entropy 0.78237 (0.79207)	Top-1 acc 54.297 (49.140)	Top-5 acc 77.344 (72.519)	lr 0.02160
Train [29][2840/3239]	Time 0.648 (0.906)	Data Time 0.001 (0.011)	Loss 3.1804 (3.1288)	Entropy 0.78239 (0.79204)	Top-1 acc 48.438 (49.141)	Top-5 acc 73.438 (72.517)	lr 0.02159
Train [29][2850/3239]	Time 0.594 (0.905)	Data Time 0.001 (0.011)	Loss 3.3923 (3.1290)	Entropy 0.78235 (0.79201)	Top-1 acc 41.797 (49.135)	Top-5 acc 65.234 (72.511)	lr 0.02159
Train [29][2860/3239]	Time 0.582 (0.905)	Data Time 0.001 (0.011)	Loss 3.1209 (3.1293)	Entropy 0.78205 (0.79197)	Top-1 acc 49.219 (49.128)	Top-5 acc 72.656 (72.506)	lr 0.02159
Train [29][2870/3239]	Time 0.621 (0.905)	Data Time 0.001 (0.010)	Loss 2.9311 (3.1290)	Entropy 0.78166 (0.79194)	Top-1 acc 52.734 (49.135)	Top-5 acc 76.953 (72.509)	lr 0.02159
Train [29][2880/3239]	Time 0.611 (0.905)	Data Time 0.001 (0.010)	Loss 3.1544 (3.1290)	Entropy 0.78145 (0.79190)	Top-1 acc 48.828 (49.135)	Top-5 acc 70.703 (72.512)	lr 0.02159
Train [29][2890/3239]	Time 0.601 (0.905)	Data Time 0.001 (0.010)	Loss 3.0108 (3.1288)	Entropy 0.78128 (0.79187)	Top-1 acc 48.047 (49.139)	Top-5 acc 76.953 (72.517)	lr 0.02159
Train [29][2900/3239]	Time 0.612 (0.905)	Data Time 0.002 (0.010)	Loss 3.4299 (3.1289)	Entropy 0.78146 (0.79183)	Top-1 acc 44.922 (49.140)	Top-5 acc 66.797 (72.516)	lr 0.02159
Train [29][2910/3239]	Time 0.690 (0.905)	Data Time 0.001 (0.010)	Loss 2.9988 (3.1287)	Entropy 0.78163 (0.79179)	Top-1 acc 53.516 (49.142)	Top-5 acc 74.219 (72.517)	lr 0.02159
Train [29][2920/3239]	Time 0.596 (0.913)	Data Time 0.002 (0.010)	Loss 3.1276 (3.1288)	Entropy 0.78137 (0.79176)	Top-1 acc 48.438 (49.140)	Top-5 acc 73.047 (72.516)	lr 0.02159
Train [29][2930/3239]	Time 0.610 (0.913)	Data Time 0.002 (0.010)	Loss 3.1337 (3.1287)	Entropy 0.78139 (0.79172)	Top-1 acc 48.047 (49.137)	Top-5 acc 73.438 (72.518)	lr 0.02159
Train [29][2940/3239]	Time 0.635 (0.912)	Data Time 0.001 (0.010)	Loss 3.1038 (3.1287)	Entropy 0.78185 (0.79169)	Top-1 acc 48.047 (49.139)	Top-5 acc 72.266 (72.517)	lr 0.02159
Train [29][2950/3239]	Time 0.606 (0.912)	Data Time 0.001 (0.010)	Loss 2.9504 (3.1286)	Entropy 0.78166 (0.79165)	Top-1 acc 57.031 (49.142)	Top-5 acc 75.781 (72.520)	lr 0.02159
Train [29][2960/3239]	Time 0.633 (0.912)	Data Time 0.001 (0.010)	Loss 3.0286 (3.1285)	Entropy 0.78170 (0.79162)	Top-1 acc 53.125 (49.144)	Top-5 acc 74.609 (72.521)	lr 0.02159
Train [29][2970/3239]	Time 0.629 (0.912)	Data Time 0.003 (0.010)	Loss 2.8104 (3.1283)	Entropy 0.78175 (0.79159)	Top-1 acc 54.688 (49.147)	Top-5 acc 77.734 (72.528)	lr 0.02159
Train [29][2980/3239]	Time 0.591 (0.912)	Data Time 0.001 (0.010)	Loss 3.1763 (3.1284)	Entropy 0.78180 (0.79156)	Top-1 acc 48.047 (49.146)	Top-5 acc 71.094 (72.527)	lr 0.02159
Train [29][2990/3239]	Time 0.669 (0.912)	Data Time 0.001 (0.010)	Loss 3.0715 (3.1282)	Entropy 0.78213 (0.79152)	Top-1 acc 48.438 (49.150)	Top-5 acc 76.172 (72.533)	lr 0.02158
Train [29][3000/3239]	Time 0.701 (0.912)	Data Time 0.001 (0.010)	Loss 3.1015 (3.1283)	Entropy 0.78183 (0.79149)	Top-1 acc 48.047 (49.148)	Top-5 acc 73.047 (72.529)	lr 0.02158
Train [29][3010/3239]	Time 0.601 (0.911)	Data Time 0.001 (0.010)	Loss 3.0677 (3.1283)	Entropy 0.78149 (0.79146)	Top-1 acc 48.438 (49.146)	Top-5 acc 76.562 (72.533)	lr 0.02158
Train [29][3020/3239]	Time 0.608 (0.911)	Data Time 0.001 (0.010)	Loss 3.2128 (3.1283)	Entropy 0.78108 (0.79143)	Top-1 acc 48.047 (49.148)	Top-5 acc 71.094 (72.533)	lr 0.02158
Train [29][3030/3239]	Time 0.601 (0.911)	Data Time 0.001 (0.010)	Loss 3.2596 (3.1285)	Entropy 0.78083 (0.79139)	Top-1 acc 46.875 (49.146)	Top-5 acc 71.484 (72.533)	lr 0.02158
Train [29][3040/3239]	Time 0.444 (0.911)	Data Time 0.001 (0.010)	Loss 2.9964 (3.1285)	Entropy 0.78077 (0.79136)	Top-1 acc 53.516 (49.145)	Top-5 acc 76.172 (72.530)	lr 0.02158
Train [29][3050/3239]	Time 0.598 (0.911)	Data Time 0.001 (0.010)	Loss 2.9669 (3.1285)	Entropy 0.78082 (0.79132)	Top-1 acc 51.562 (49.146)	Top-5 acc 75.000 (72.532)	lr 0.02158
Train [29][3060/3239]	Time 0.591 (0.911)	Data Time 0.001 (0.010)	Loss 3.1944 (3.1285)	Entropy 0.78080 (0.79129)	Top-1 acc 49.609 (49.145)	Top-5 acc 69.922 (72.532)	lr 0.02158
Train [29][3070/3239]	Time 0.699 (0.910)	Data Time 0.001 (0.010)	Loss 3.0672 (3.1287)	Entropy 0.78086 (0.79125)	Top-1 acc 48.828 (49.144)	Top-5 acc 73.438 (72.527)	lr 0.02158
Train [29][3080/3239]	Time 0.624 (0.910)	Data Time 0.001 (0.010)	Loss 3.1143 (3.1287)	Entropy 0.78044 (0.79122)	Top-1 acc 48.438 (49.143)	Top-5 acc 70.703 (72.529)	lr 0.02158
Train [29][3090/3239]	Time 0.624 (0.910)	Data Time 0.001 (0.010)	Loss 3.3634 (3.1290)	Entropy 0.78011 (0.79118)	Top-1 acc 44.922 (49.139)	Top-5 acc 68.750 (72.523)	lr 0.02158
Train [29][3100/3239]	Time 0.621 (0.910)	Data Time 0.001 (0.010)	Loss 3.0492 (3.1289)	Entropy 0.78035 (0.79115)	Top-1 acc 49.609 (49.139)	Top-5 acc 74.219 (72.524)	lr 0.02158
Train [29][3110/3239]	Time 0.606 (0.910)	Data Time 0.001 (0.010)	Loss 3.0617 (3.1289)	Entropy 0.78035 (0.79111)	Top-1 acc 53.125 (49.139)	Top-5 acc 75.391 (72.525)	lr 0.02158
Train [29][3120/3239]	Time 0.626 (0.910)	Data Time 0.003 (0.010)	Loss 3.1516 (3.1290)	Entropy 0.78085 (0.79108)	Top-1 acc 46.875 (49.139)	Top-5 acc 73.047 (72.527)	lr 0.02158
Train [29][3130/3239]	Time 0.575 (0.909)	Data Time 0.001 (0.010)	Loss 3.1241 (3.1290)	Entropy 0.78078 (0.79105)	Top-1 acc 50.000 (49.141)	Top-5 acc 73.828 (72.526)	lr 0.02157
Train [29][3140/3239]	Time 0.635 (0.909)	Data Time 0.001 (0.010)	Loss 3.2905 (3.1291)	Entropy 0.78076 (0.79101)	Top-1 acc 47.266 (49.138)	Top-5 acc 72.266 (72.526)	lr 0.02157
Train [29][3150/3239]	Time 0.621 (0.909)	Data Time 0.001 (0.010)	Loss 2.8968 (3.1290)	Entropy 0.78064 (0.79098)	Top-1 acc 53.906 (49.137)	Top-5 acc 77.344 (72.529)	lr 0.02157
Train [29][3160/3239]	Time 0.725 (0.909)	Data Time 0.001 (0.010)	Loss 3.2031 (3.1291)	Entropy 0.78080 (0.79095)	Top-1 acc 44.141 (49.136)	Top-5 acc 72.266 (72.528)	lr 0.02157
Train [29][3170/3239]	Time 0.621 (0.909)	Data Time 0.002 (0.010)	Loss 3.0422 (3.1291)	Entropy 0.78042 (0.79092)	Top-1 acc 49.219 (49.135)	Top-5 acc 74.609 (72.526)	lr 0.02157
Train [29][3180/3239]	Time 0.589 (0.909)	Data Time 0.000 (0.010)	Loss 2.8504 (3.1290)	Entropy 0.78048 (0.79088)	Top-1 acc 52.344 (49.132)	Top-5 acc 78.125 (72.526)	lr 0.02157
Train [29][3190/3239]	Time 0.622 (0.909)	Data Time 0.000 (0.010)	Loss 3.0099 (3.1289)	Entropy 0.78065 (0.79085)	Top-1 acc 50.391 (49.135)	Top-5 acc 76.172 (72.531)	lr 0.02157
Train [29][3200/3239]	Time 0.627 (0.908)	Data Time 0.000 (0.010)	Loss 3.1680 (3.1290)	Entropy 0.78082 (0.79082)	Top-1 acc 49.219 (49.132)	Top-5 acc 72.656 (72.526)	lr 0.02157
Train [29][3210/3239]	Time 0.587 (0.908)	Data Time 0.000 (0.010)	Loss 3.0910 (3.1290)	Entropy 0.78050 (0.79079)	Top-1 acc 51.953 (49.133)	Top-5 acc 71.094 (72.523)	lr 0.02157
Train [29][3220/3239]	Time 0.586 (0.908)	Data Time 0.000 (0.010)	Loss 2.9584 (3.1291)	Entropy 0.78093 (0.79076)	Top-1 acc 52.344 (49.131)	Top-5 acc 76.172 (72.522)	lr 0.02157
Train [29][3230/3239]	Time 0.699 (0.908)	Data Time 0.000 (0.010)	Loss 3.0444 (3.1291)	Entropy 0.78089 (0.79073)	Top-1 acc 54.688 (49.134)	Top-5 acc 74.609 (72.522)	lr 0.02157
Train [29][3239/3239]	Time 1.398 (0.908)	Data Time 0.000 (0.010)	Loss 3.5225 (3.1290)	Entropy 0.78106 (0.79070)	Top-1 acc 46.914 (49.140)	Top-5 acc 65.432 (72.522)	lr 0.02157
==========Valid [29/120]	loss 1.840	top-1 acc 58.739 (58.739)	top-5 acc 81.163	Train top-1 49.140	top-5 72.522	Entropy 0.78106	Latency-None: 0.000ms	Flops: 539.76M
Train [30][0/3239]	Time 24.148 (24.148)	Data Time 23.220 (23.220)	Loss 3.2759 (3.2759)	Entropy 0.78106 (0.78106)	Top-1 acc 44.531 (44.531)	Top-5 acc 69.531 (69.531)	lr 0.02157
Train [30][10/3239]	Time 0.604 (3.011)	Data Time 0.001 (2.113)	Loss 3.0155 (3.1069)	Entropy 0.78112 (0.78115)	Top-1 acc 50.781 (50.213)	Top-5 acc 75.000 (73.438)	lr 0.02157
Train [30][20/3239]	Time 0.638 (1.973)	Data Time 0.003 (1.107)	Loss 2.8515 (3.0853)	Entropy 0.78100 (0.78109)	Top-1 acc 57.812 (50.688)	Top-5 acc 79.688 (73.828)	lr 0.02157
Train [30][30/3239]	Time 0.616 (1.609)	Data Time 0.001 (0.751)	Loss 2.8429 (3.0781)	Entropy 0.78084 (0.78105)	Top-1 acc 53.125 (50.731)	Top-5 acc 77.734 (73.853)	lr 0.02157
Train [30][40/3239]	Time 0.651 (1.435)	Data Time 0.001 (0.568)	Loss 3.0155 (3.0934)	Entropy 0.78136 (0.78103)	Top-1 acc 52.344 (50.276)	Top-5 acc 75.391 (73.371)	lr 0.02156
Train [30][50/3239]	Time 0.622 (1.323)	Data Time 0.001 (0.457)	Loss 3.1519 (3.0929)	Entropy 0.78143 (0.78109)	Top-1 acc 48.828 (50.214)	Top-5 acc 73.828 (73.323)	lr 0.02156
Train [30][60/3239]	Time 0.686 (1.248)	Data Time 0.001 (0.382)	Loss 3.0707 (3.0838)	Entropy 0.78123 (0.78113)	Top-1 acc 51.562 (50.435)	Top-5 acc 73.047 (73.540)	lr 0.02156
Train [30][70/3239]	Time 0.620 (1.193)	Data Time 0.001 (0.329)	Loss 3.2476 (3.0809)	Entropy 0.78145 (0.78116)	Top-1 acc 49.609 (50.479)	Top-5 acc 69.922 (73.570)	lr 0.02156
Train [30][80/3239]	Time 0.608 (1.153)	Data Time 0.001 (0.288)	Loss 3.0989 (3.0947)	Entropy 0.78134 (0.78119)	Top-1 acc 46.875 (50.231)	Top-5 acc 74.219 (73.259)	lr 0.02156
Train [30][90/3239]	Time 0.598 (1.122)	Data Time 0.001 (0.257)	Loss 2.8974 (3.0933)	Entropy 0.78139 (0.78122)	Top-1 acc 52.344 (50.189)	Top-5 acc 76.562 (73.262)	lr 0.02156
Train [30][100/3239]	Time 0.620 (1.097)	Data Time 0.001 (0.232)	Loss 3.0993 (3.0914)	Entropy 0.78092 (0.78122)	Top-1 acc 52.734 (50.213)	Top-5 acc 72.656 (73.329)	lr 0.02156
Train [30][110/3239]	Time 0.608 (1.077)	Data Time 0.001 (0.211)	Loss 3.0154 (3.0942)	Entropy 0.78122 (0.78120)	Top-1 acc 53.906 (50.208)	Top-5 acc 72.656 (73.177)	lr 0.02156
Train [30][120/3239]	Time 0.622 (1.058)	Data Time 0.002 (0.194)	Loss 2.9069 (3.0978)	Entropy 0.78103 (0.78120)	Top-1 acc 52.734 (50.142)	Top-5 acc 77.344 (73.111)	lr 0.02156
Train [30][130/3239]	Time 0.678 (1.042)	Data Time 0.002 (0.179)	Loss 3.1156 (3.0991)	Entropy 0.78100 (0.78118)	Top-1 acc 48.438 (50.092)	Top-5 acc 70.703 (73.035)	lr 0.02156
Train [30][140/3239]	Time 0.589 (1.029)	Data Time 0.001 (0.167)	Loss 3.0765 (3.0976)	Entropy 0.78102 (0.78117)	Top-1 acc 49.609 (50.044)	Top-5 acc 72.266 (72.991)	lr 0.02156
Train [30][150/3239]	Time 0.639 (1.017)	Data Time 0.001 (0.156)	Loss 3.0277 (3.0996)	Entropy 0.78082 (0.78115)	Top-1 acc 52.344 (49.938)	Top-5 acc 73.828 (72.974)	lr 0.02156
Train [30][160/3239]	Time 0.594 (1.009)	Data Time 0.001 (0.146)	Loss 3.0942 (3.0987)	Entropy 0.78070 (0.78113)	Top-1 acc 52.734 (49.978)	Top-5 acc 73.047 (72.998)	lr 0.02156
Train [30][170/3239]	Time 0.616 (1.000)	Data Time 0.001 (0.138)	Loss 3.1529 (3.1022)	Entropy 0.78069 (0.78110)	Top-1 acc 51.953 (49.968)	Top-5 acc 70.312 (72.969)	lr 0.02156
Train [30][180/3239]	Time 0.620 (0.990)	Data Time 0.001 (0.130)	Loss 3.0737 (3.1031)	Entropy 0.78082 (0.78108)	Top-1 acc 48.047 (49.883)	Top-5 acc 73.047 (72.917)	lr 0.02155
Train [30][190/3239]	Time 0.620 (0.981)	Data Time 0.001 (0.123)	Loss 3.1210 (3.1003)	Entropy 0.78092 (0.78107)	Top-1 acc 51.953 (49.928)	Top-5 acc 72.656 (72.973)	lr 0.02155
Train [30][200/3239]	Time 0.637 (0.976)	Data Time 0.001 (0.117)	Loss 3.1203 (3.1004)	Entropy 0.78080 (0.78106)	Top-1 acc 52.344 (49.876)	Top-5 acc 73.438 (73.006)	lr 0.02155
Train [30][210/3239]	Time 0.609 (0.970)	Data Time 0.001 (0.112)	Loss 3.0112 (3.0971)	Entropy 0.78042 (0.78104)	Top-1 acc 49.609 (49.898)	Top-5 acc 78.125 (73.080)	lr 0.02155
Train [30][220/3239]	Time 0.705 (0.966)	Data Time 0.001 (0.107)	Loss 3.1720 (3.0965)	Entropy 0.78066 (0.78101)	Top-1 acc 49.609 (49.926)	Top-5 acc 71.875 (73.073)	lr 0.02155
Train [30][230/3239]	Time 0.594 (0.962)	Data Time 0.001 (0.102)	Loss 3.0666 (3.0957)	Entropy 0.78064 (0.78100)	Top-1 acc 50.781 (49.909)	Top-5 acc 73.438 (73.084)	lr 0.02155
Train [30][240/3239]	Time 0.605 (0.958)	Data Time 0.001 (0.098)	Loss 3.1551 (3.0993)	Entropy 0.78100 (0.78099)	Top-1 acc 48.438 (49.844)	Top-5 acc 69.531 (72.976)	lr 0.02155
Train [30][250/3239]	Time 0.647 (0.954)	Data Time 0.001 (0.094)	Loss 2.9388 (3.0977)	Entropy 0.78095 (0.78099)	Top-1 acc 51.562 (49.868)	Top-5 acc 76.172 (73.038)	lr 0.02155
Train [30][260/3239]	Time 0.609 (0.951)	Data Time 0.001 (0.091)	Loss 3.1389 (3.0978)	Entropy 0.78097 (0.78099)	Top-1 acc 49.609 (49.855)	Top-5 acc 74.219 (73.048)	lr 0.02155
Train [30][270/3239]	Time 0.598 (0.948)	Data Time 0.001 (0.088)	Loss 3.1350 (3.0941)	Entropy 0.78140 (0.78100)	Top-1 acc 50.000 (49.945)	Top-5 acc 71.875 (73.115)	lr 0.02155
Train [30][280/3239]	Time 0.617 (0.945)	Data Time 0.001 (0.084)	Loss 2.9970 (3.0943)	Entropy 0.78153 (0.78102)	Top-1 acc 53.516 (49.942)	Top-5 acc 75.781 (73.114)	lr 0.02155
Train [30][290/3239]	Time 0.714 (0.942)	Data Time 0.001 (0.082)	Loss 3.1119 (3.0923)	Entropy 0.78123 (0.78103)	Top-1 acc 48.438 (49.984)	Top-5 acc 69.531 (73.154)	lr 0.02155
Train [30][300/3239]	Time 0.584 (0.939)	Data Time 0.001 (0.079)	Loss 3.1320 (3.0930)	Entropy 0.78090 (0.78104)	Top-1 acc 48.828 (49.978)	Top-5 acc 69.922 (73.175)	lr 0.02155
Train [30][310/3239]	Time 0.567 (0.936)	Data Time 0.001 (0.077)	Loss 3.4222 (3.0956)	Entropy 0.78083 (0.78103)	Top-1 acc 41.797 (49.931)	Top-5 acc 67.188 (73.134)	lr 0.02155
Train [30][320/3239]	Time 0.640 (0.934)	Data Time 0.002 (0.074)	Loss 3.1141 (3.0953)	Entropy 0.78077 (0.78102)	Top-1 acc 51.172 (49.926)	Top-5 acc 75.391 (73.170)	lr 0.02154
Train [30][330/3239]	Time 0.797 (1.006)	Data Time 0.045 (0.072)	Loss 3.1308 (3.0983)	Entropy 0.78078 (0.78102)	Top-1 acc 48.047 (49.841)	Top-5 acc 74.609 (73.158)	lr 0.02154
Train [30][340/3239]	Time 0.638 (1.004)	Data Time 0.002 (0.070)	Loss 3.0480 (3.0973)	Entropy 0.78060 (0.78101)	Top-1 acc 52.734 (49.842)	Top-5 acc 73.438 (73.152)	lr 0.02154
Train [30][350/3239]	Time 0.577 (1.000)	Data Time 0.002 (0.068)	Loss 3.4275 (3.0954)	Entropy 0.78066 (0.78099)	Top-1 acc 43.750 (49.905)	Top-5 acc 67.578 (73.183)	lr 0.02154
Train [30][360/3239]	Time 0.637 (0.997)	Data Time 0.002 (0.066)	Loss 3.0894 (3.0972)	Entropy 0.78039 (0.78098)	Top-1 acc 53.125 (49.880)	Top-5 acc 70.312 (73.140)	lr 0.02154
Train [30][370/3239]	Time 0.635 (0.994)	Data Time 0.001 (0.065)	Loss 2.9283 (3.0976)	Entropy 0.77962 (0.78096)	Top-1 acc 51.562 (49.879)	Top-5 acc 75.000 (73.133)	lr 0.02154
Train [30][380/3239]	Time 0.719 (0.990)	Data Time 0.001 (0.063)	Loss 3.1018 (3.0980)	Entropy 0.77944 (0.78092)	Top-1 acc 50.000 (49.876)	Top-5 acc 72.656 (73.105)	lr 0.02154
Train [30][390/3239]	Time 0.629 (0.987)	Data Time 0.001 (0.061)	Loss 3.0909 (3.0994)	Entropy 0.77968 (0.78088)	Top-1 acc 51.172 (49.874)	Top-5 acc 74.219 (73.070)	lr 0.02154
Train [30][400/3239]	Time 0.630 (0.984)	Data Time 0.001 (0.060)	Loss 2.9811 (3.0990)	Entropy 0.78010 (0.78086)	Top-1 acc 53.906 (49.893)	Top-5 acc 73.047 (73.097)	lr 0.02154
Train [30][410/3239]	Time 0.621 (0.982)	Data Time 0.001 (0.059)	Loss 2.9373 (3.1008)	Entropy 0.78006 (0.78084)	Top-1 acc 53.906 (49.832)	Top-5 acc 76.562 (73.055)	lr 0.02154
Train [30][420/3239]	Time 0.591 (0.979)	Data Time 0.001 (0.057)	Loss 3.0592 (3.1003)	Entropy 0.78000 (0.78082)	Top-1 acc 55.469 (49.836)	Top-5 acc 74.219 (73.093)	lr 0.02154
Train [30][430/3239]	Time 0.619 (0.977)	Data Time 0.001 (0.056)	Loss 3.1301 (3.0992)	Entropy 0.78006 (0.78080)	Top-1 acc 50.391 (49.850)	Top-5 acc 70.703 (73.106)	lr 0.02154
Train [30][440/3239]	Time 0.683 (0.974)	Data Time 0.001 (0.055)	Loss 3.0467 (3.1001)	Entropy 0.77992 (0.78079)	Top-1 acc 51.953 (49.809)	Top-5 acc 73.438 (73.115)	lr 0.02154
Train [30][450/3239]	Time 0.693 (0.972)	Data Time 0.001 (0.054)	Loss 3.1352 (3.1005)	Entropy 0.77958 (0.78076)	Top-1 acc 46.875 (49.797)	Top-5 acc 72.656 (73.094)	lr 0.02154
Train [30][460/3239]	Time 0.612 (0.969)	Data Time 0.002 (0.052)	Loss 2.8642 (3.1011)	Entropy 0.77951 (0.78073)	Top-1 acc 55.078 (49.809)	Top-5 acc 76.172 (73.076)	lr 0.02154
Train [30][470/3239]	Time 0.567 (0.966)	Data Time 0.001 (0.051)	Loss 3.1369 (3.1011)	Entropy 0.77956 (0.78071)	Top-1 acc 47.266 (49.796)	Top-5 acc 73.047 (73.073)	lr 0.02153
Train [30][480/3239]	Time 0.463 (0.964)	Data Time 0.001 (0.050)	Loss 3.4115 (3.1020)	Entropy 0.77935 (0.78068)	Top-1 acc 42.188 (49.739)	Top-5 acc 69.141 (73.074)	lr 0.02153
Train [30][490/3239]	Time 0.585 (0.962)	Data Time 0.001 (0.049)	Loss 3.0181 (3.1025)	Entropy 0.77907 (0.78065)	Top-1 acc 51.562 (49.728)	Top-5 acc 76.172 (73.060)	lr 0.02153
Train [30][500/3239]	Time 0.573 (0.960)	Data Time 0.001 (0.048)	Loss 2.9605 (3.1021)	Entropy 0.77903 (0.78062)	Top-1 acc 52.734 (49.721)	Top-5 acc 76.562 (73.076)	lr 0.02153
Train [30][510/3239]	Time 0.607 (0.959)	Data Time 0.001 (0.047)	Loss 3.0804 (3.1020)	Entropy 0.77888 (0.78059)	Top-1 acc 49.609 (49.713)	Top-5 acc 71.875 (73.087)	lr 0.02153
Train [30][520/3239]	Time 0.619 (0.957)	Data Time 0.001 (0.047)	Loss 3.0513 (3.1017)	Entropy 0.77911 (0.78056)	Top-1 acc 52.344 (49.714)	Top-5 acc 73.828 (73.095)	lr 0.02153
Train [30][530/3239]	Time 0.631 (0.955)	Data Time 0.001 (0.046)	Loss 3.0884 (3.1007)	Entropy 0.77887 (0.78053)	Top-1 acc 46.484 (49.737)	Top-5 acc 71.875 (73.124)	lr 0.02153
Train [30][540/3239]	Time 0.619 (0.954)	Data Time 0.001 (0.045)	Loss 3.3852 (3.1001)	Entropy 0.77844 (0.78049)	Top-1 acc 44.141 (49.742)	Top-5 acc 66.406 (73.120)	lr 0.02153
Train [30][550/3239]	Time 0.577 (0.952)	Data Time 0.001 (0.044)	Loss 3.2125 (3.1001)	Entropy 0.77815 (0.78046)	Top-1 acc 46.875 (49.755)	Top-5 acc 74.609 (73.135)	lr 0.02153
Train [30][560/3239]	Time 0.613 (0.951)	Data Time 0.001 (0.043)	Loss 3.2407 (3.1002)	Entropy 0.77817 (0.78041)	Top-1 acc 46.875 (49.749)	Top-5 acc 71.094 (73.135)	lr 0.02153
Train [30][570/3239]	Time 0.637 (0.949)	Data Time 0.001 (0.043)	Loss 2.9384 (3.0994)	Entropy 0.77813 (0.78037)	Top-1 acc 53.906 (49.761)	Top-5 acc 76.172 (73.153)	lr 0.02153
Train [30][580/3239]	Time 0.603 (0.948)	Data Time 0.001 (0.042)	Loss 2.9212 (3.0998)	Entropy 0.77848 (0.78034)	Top-1 acc 50.781 (49.744)	Top-5 acc 80.078 (73.148)	lr 0.02153
Train [30][590/3239]	Time 0.595 (0.947)	Data Time 0.001 (0.041)	Loss 3.1339 (3.1007)	Entropy 0.77823 (0.78030)	Top-1 acc 49.609 (49.728)	Top-5 acc 72.656 (73.129)	lr 0.02153
Train [30][600/3239]	Time 0.607 (0.946)	Data Time 0.001 (0.041)	Loss 2.9292 (3.1006)	Entropy 0.77848 (0.78027)	Top-1 acc 55.078 (49.721)	Top-5 acc 75.391 (73.131)	lr 0.02153
Train [30][610/3239]	Time 0.696 (0.944)	Data Time 0.001 (0.040)	Loss 2.9846 (3.1017)	Entropy 0.77858 (0.78024)	Top-1 acc 50.391 (49.702)	Top-5 acc 77.344 (73.118)	lr 0.02152
Train [30][620/3239]	Time 0.595 (0.943)	Data Time 0.001 (0.039)	Loss 3.3785 (3.1022)	Entropy 0.77823 (0.78021)	Top-1 acc 42.578 (49.699)	Top-5 acc 68.359 (73.101)	lr 0.02152
Train [30][630/3239]	Time 0.616 (0.942)	Data Time 0.001 (0.039)	Loss 3.1507 (3.1032)	Entropy 0.77829 (0.78018)	Top-1 acc 49.219 (49.675)	Top-5 acc 69.531 (73.085)	lr 0.02152
Train [30][640/3239]	Time 0.609 (0.941)	Data Time 0.001 (0.038)	Loss 3.0917 (3.1030)	Entropy 0.77828 (0.78015)	Top-1 acc 48.828 (49.681)	Top-5 acc 71.875 (73.075)	lr 0.02152
Train [30][650/3239]	Time 0.468 (0.939)	Data Time 0.001 (0.038)	Loss 3.2464 (3.1027)	Entropy 0.77816 (0.78013)	Top-1 acc 46.484 (49.691)	Top-5 acc 68.359 (73.083)	lr 0.02152
Train [30][660/3239]	Time 0.612 (0.938)	Data Time 0.002 (0.037)	Loss 3.0909 (3.1035)	Entropy 0.77795 (0.78009)	Top-1 acc 52.734 (49.685)	Top-5 acc 71.875 (73.072)	lr 0.02152
Train [30][670/3239]	Time 0.604 (0.937)	Data Time 0.001 (0.037)	Loss 3.1846 (3.1033)	Entropy 0.77847 (0.78006)	Top-1 acc 48.438 (49.693)	Top-5 acc 73.047 (73.086)	lr 0.02152
Train [30][680/3239]	Time 0.729 (0.936)	Data Time 0.001 (0.036)	Loss 3.1544 (3.1033)	Entropy 0.77839 (0.78004)	Top-1 acc 49.219 (49.705)	Top-5 acc 74.609 (73.093)	lr 0.02152
Train [30][690/3239]	Time 0.586 (0.935)	Data Time 0.002 (0.036)	Loss 3.4057 (3.1039)	Entropy 0.77761 (0.78001)	Top-1 acc 44.922 (49.692)	Top-5 acc 66.797 (73.075)	lr 0.02152
Train [30][700/3239]	Time 0.586 (0.934)	Data Time 0.001 (0.035)	Loss 2.9609 (3.1037)	Entropy 0.77747 (0.77998)	Top-1 acc 53.516 (49.676)	Top-5 acc 76.172 (73.067)	lr 0.02152
Train [30][710/3239]	Time 0.608 (0.933)	Data Time 0.001 (0.035)	Loss 2.9581 (3.1036)	Entropy 0.77744 (0.77995)	Top-1 acc 51.953 (49.683)	Top-5 acc 75.391 (73.072)	lr 0.02152
Train [30][720/3239]	Time 0.595 (0.932)	Data Time 0.001 (0.034)	Loss 2.9707 (3.1039)	Entropy 0.77756 (0.77991)	Top-1 acc 54.688 (49.671)	Top-5 acc 75.781 (73.063)	lr 0.02152
Train [30][730/3239]	Time 0.635 (0.931)	Data Time 0.001 (0.034)	Loss 2.9917 (3.1032)	Entropy 0.77751 (0.77988)	Top-1 acc 51.562 (49.685)	Top-5 acc 75.000 (73.072)	lr 0.02152
Train [30][740/3239]	Time 0.624 (0.930)	Data Time 0.001 (0.033)	Loss 3.0072 (3.1025)	Entropy 0.77727 (0.77985)	Top-1 acc 49.609 (49.700)	Top-5 acc 75.391 (73.087)	lr 0.02152
Train [30][750/3239]	Time 0.601 (0.929)	Data Time 0.001 (0.033)	Loss 3.1707 (3.1026)	Entropy 0.77705 (0.77981)	Top-1 acc 48.828 (49.711)	Top-5 acc 70.312 (73.075)	lr 0.02151
Train [30][760/3239]	Time 0.650 (0.929)	Data Time 0.002 (0.033)	Loss 3.1660 (3.1029)	Entropy 0.77701 (0.77978)	Top-1 acc 49.219 (49.700)	Top-5 acc 73.047 (73.068)	lr 0.02151
Train [30][770/3239]	Time 0.737 (0.928)	Data Time 0.001 (0.032)	Loss 3.0756 (3.1016)	Entropy 0.77680 (0.77974)	Top-1 acc 50.391 (49.727)	Top-5 acc 75.000 (73.082)	lr 0.02151
Train [30][780/3239]	Time 0.645 (0.927)	Data Time 0.001 (0.032)	Loss 3.0437 (3.1007)	Entropy 0.77659 (0.77970)	Top-1 acc 49.609 (49.740)	Top-5 acc 75.781 (73.108)	lr 0.02151
Train [30][790/3239]	Time 0.622 (0.927)	Data Time 0.001 (0.031)	Loss 2.8538 (3.1008)	Entropy 0.77667 (0.77966)	Top-1 acc 57.812 (49.738)	Top-5 acc 78.125 (73.097)	lr 0.02151
Train [30][800/3239]	Time 0.598 (0.926)	Data Time 0.001 (0.031)	Loss 3.0449 (3.1004)	Entropy 0.77659 (0.77962)	Top-1 acc 49.219 (49.736)	Top-5 acc 72.656 (73.103)	lr 0.02151
Train [30][810/3239]	Time 0.609 (0.925)	Data Time 0.001 (0.031)	Loss 3.1195 (3.1008)	Entropy 0.77631 (0.77959)	Top-1 acc 51.562 (49.728)	Top-5 acc 75.000 (73.098)	lr 0.02151
Train [30][820/3239]	Time 0.618 (0.923)	Data Time 0.001 (0.030)	Loss 2.9753 (3.1005)	Entropy 0.77667 (0.77955)	Top-1 acc 53.125 (49.731)	Top-5 acc 75.781 (73.098)	lr 0.02151
Train [30][830/3239]	Time 0.649 (0.922)	Data Time 0.001 (0.030)	Loss 3.1505 (3.1011)	Entropy 0.77667 (0.77951)	Top-1 acc 48.047 (49.700)	Top-5 acc 70.703 (73.086)	lr 0.02151
Train [30][840/3239]	Time 0.728 (0.922)	Data Time 0.001 (0.030)	Loss 3.0440 (3.1013)	Entropy 0.77687 (0.77948)	Top-1 acc 48.828 (49.691)	Top-5 acc 74.219 (73.081)	lr 0.02151
Train [30][850/3239]	Time 0.592 (0.921)	Data Time 0.001 (0.029)	Loss 3.0990 (3.1013)	Entropy 0.77691 (0.77945)	Top-1 acc 50.781 (49.701)	Top-5 acc 71.875 (73.080)	lr 0.02151
Train [30][860/3239]	Time 0.619 (0.920)	Data Time 0.001 (0.029)	Loss 3.3086 (3.1013)	Entropy 0.77673 (0.77942)	Top-1 acc 42.969 (49.707)	Top-5 acc 67.969 (73.080)	lr 0.02151
Train [30][870/3239]	Time 0.642 (0.920)	Data Time 0.001 (0.029)	Loss 3.3106 (3.1011)	Entropy 0.77667 (0.77939)	Top-1 acc 43.359 (49.707)	Top-5 acc 67.578 (73.081)	lr 0.02151
Train [30][880/3239]	Time 0.605 (0.919)	Data Time 0.001 (0.028)	Loss 3.3168 (3.1011)	Entropy 0.77684 (0.77936)	Top-1 acc 43.750 (49.710)	Top-5 acc 68.750 (73.094)	lr 0.02151
Train [30][890/3239]	Time 0.604 (0.919)	Data Time 0.001 (0.028)	Loss 3.0419 (3.1015)	Entropy 0.77699 (0.77933)	Top-1 acc 53.125 (49.714)	Top-5 acc 72.656 (73.094)	lr 0.02151
Train [30][900/3239]	Time 0.648 (0.918)	Data Time 0.001 (0.028)	Loss 3.1986 (3.1008)	Entropy 0.77726 (0.77930)	Top-1 acc 49.609 (49.726)	Top-5 acc 71.875 (73.104)	lr 0.02150
Train [30][910/3239]	Time 0.612 (0.918)	Data Time 0.001 (0.028)	Loss 3.1318 (3.1011)	Entropy 0.77746 (0.77928)	Top-1 acc 48.828 (49.723)	Top-5 acc 72.656 (73.100)	lr 0.02150
Train [30][920/3239]	Time 0.605 (0.917)	Data Time 0.001 (0.027)	Loss 2.8378 (3.1006)	Entropy 0.77728 (0.77926)	Top-1 acc 55.078 (49.736)	Top-5 acc 79.297 (73.115)	lr 0.02150
Train [30][930/3239]	Time 0.727 (0.916)	Data Time 0.001 (0.027)	Loss 3.3153 (3.1008)	Entropy 0.77685 (0.77924)	Top-1 acc 46.484 (49.730)	Top-5 acc 69.531 (73.117)	lr 0.02150
Train [30][940/3239]	Time 0.625 (0.916)	Data Time 0.001 (0.027)	Loss 3.0735 (3.1005)	Entropy 0.77718 (0.77921)	Top-1 acc 47.656 (49.732)	Top-5 acc 75.000 (73.122)	lr 0.02150
Train [30][950/3239]	Time 0.617 (0.915)	Data Time 0.001 (0.026)	Loss 3.3868 (3.1005)	Entropy 0.77710 (0.77919)	Top-1 acc 42.578 (49.719)	Top-5 acc 70.312 (73.128)	lr 0.02150
Train [30][960/3239]	Time 0.607 (0.915)	Data Time 0.001 (0.026)	Loss 3.0239 (3.1011)	Entropy 0.77703 (0.77917)	Top-1 acc 50.391 (49.718)	Top-5 acc 73.047 (73.112)	lr 0.02150
Train [30][970/3239]	Time 0.612 (0.914)	Data Time 0.001 (0.026)	Loss 3.4185 (3.1008)	Entropy 0.77663 (0.77915)	Top-1 acc 45.312 (49.712)	Top-5 acc 68.750 (73.115)	lr 0.02150
Train [30][980/3239]	Time 0.631 (0.914)	Data Time 0.001 (0.026)	Loss 3.0363 (3.1009)	Entropy 0.77674 (0.77912)	Top-1 acc 48.828 (49.714)	Top-5 acc 75.781 (73.115)	lr 0.02150
Train [30][990/3239]	Time 0.638 (0.938)	Data Time 0.002 (0.025)	Loss 3.1031 (3.1008)	Entropy 0.77613 (0.77910)	Top-1 acc 51.562 (49.719)	Top-5 acc 73.047 (73.122)	lr 0.02150
Train [30][1000/3239]	Time 0.707 (0.937)	Data Time 0.001 (0.025)	Loss 3.2314 (3.1010)	Entropy 0.77633 (0.77907)	Top-1 acc 43.750 (49.708)	Top-5 acc 68.750 (73.114)	lr 0.02150
Train [30][1010/3239]	Time 0.623 (0.937)	Data Time 0.001 (0.025)	Loss 3.1163 (3.1011)	Entropy 0.77593 (0.77904)	Top-1 acc 49.609 (49.704)	Top-5 acc 74.609 (73.114)	lr 0.02150
Train [30][1020/3239]	Time 0.607 (0.936)	Data Time 0.001 (0.025)	Loss 3.0206 (3.1012)	Entropy 0.77570 (0.77901)	Top-1 acc 57.031 (49.696)	Top-5 acc 77.344 (73.121)	lr 0.02150
Train [30][1030/3239]	Time 0.628 (0.935)	Data Time 0.001 (0.025)	Loss 2.8641 (3.1018)	Entropy 0.77577 (0.77898)	Top-1 acc 56.250 (49.698)	Top-5 acc 79.297 (73.113)	lr 0.02150
Train [30][1040/3239]	Time 0.622 (0.935)	Data Time 0.001 (0.024)	Loss 2.9968 (3.1018)	Entropy 0.77554 (0.77895)	Top-1 acc 52.734 (49.698)	Top-5 acc 75.391 (73.110)	lr 0.02149
Train [30][1050/3239]	Time 0.621 (0.934)	Data Time 0.001 (0.024)	Loss 3.1972 (3.1017)	Entropy 0.77535 (0.77891)	Top-1 acc 48.828 (49.705)	Top-5 acc 71.094 (73.111)	lr 0.02149
Train [30][1060/3239]	Time 0.598 (0.934)	Data Time 0.001 (0.024)	Loss 3.0798 (3.1017)	Entropy 0.77503 (0.77888)	Top-1 acc 49.219 (49.703)	Top-5 acc 73.828 (73.112)	lr 0.02149
Train [30][1070/3239]	Time 0.627 (0.933)	Data Time 0.001 (0.024)	Loss 3.0186 (3.1018)	Entropy 0.77495 (0.77884)	Top-1 acc 51.562 (49.689)	Top-5 acc 74.609 (73.114)	lr 0.02149
Train [30][1080/3239]	Time 0.610 (0.932)	Data Time 0.001 (0.024)	Loss 3.2065 (3.1021)	Entropy 0.77532 (0.77881)	Top-1 acc 47.266 (49.674)	Top-5 acc 70.703 (73.099)	lr 0.02149
Train [30][1090/3239]	Time 0.602 (0.932)	Data Time 0.001 (0.023)	Loss 3.0970 (3.1017)	Entropy 0.77544 (0.77877)	Top-1 acc 50.781 (49.684)	Top-5 acc 75.000 (73.108)	lr 0.02149
Train [30][1100/3239]	Time 0.618 (0.931)	Data Time 0.001 (0.023)	Loss 2.9817 (3.1014)	Entropy 0.77538 (0.77874)	Top-1 acc 52.344 (49.690)	Top-5 acc 75.000 (73.117)	lr 0.02149
Train [30][1110/3239]	Time 0.630 (0.930)	Data Time 0.002 (0.023)	Loss 3.0016 (3.1008)	Entropy 0.77539 (0.77871)	Top-1 acc 50.391 (49.704)	Top-5 acc 73.438 (73.126)	lr 0.02149
Train [30][1120/3239]	Time 0.649 (0.929)	Data Time 0.001 (0.023)	Loss 3.2531 (3.1009)	Entropy 0.77539 (0.77868)	Top-1 acc 44.141 (49.699)	Top-5 acc 68.359 (73.119)	lr 0.02149
Train [30][1130/3239]	Time 0.601 (0.929)	Data Time 0.001 (0.023)	Loss 3.3101 (3.1008)	Entropy 0.77490 (0.77865)	Top-1 acc 43.750 (49.701)	Top-5 acc 68.750 (73.123)	lr 0.02149
Train [30][1140/3239]	Time 0.661 (0.928)	Data Time 0.001 (0.022)	Loss 3.1003 (3.1009)	Entropy 0.77513 (0.77862)	Top-1 acc 50.391 (49.703)	Top-5 acc 73.438 (73.120)	lr 0.02149
Train [30][1150/3239]	Time 0.603 (0.928)	Data Time 0.001 (0.022)	Loss 2.8858 (3.1009)	Entropy 0.77507 (0.77859)	Top-1 acc 57.031 (49.703)	Top-5 acc 75.781 (73.117)	lr 0.02149
Train [30][1160/3239]	Time 0.702 (0.927)	Data Time 0.001 (0.022)	Loss 3.1708 (3.1007)	Entropy 0.77453 (0.77856)	Top-1 acc 43.750 (49.699)	Top-5 acc 72.656 (73.120)	lr 0.02149
Train [30][1170/3239]	Time 0.612 (0.927)	Data Time 0.001 (0.022)	Loss 3.0549 (3.1007)	Entropy 0.77458 (0.77852)	Top-1 acc 50.781 (49.694)	Top-5 acc 72.656 (73.116)	lr 0.02149
Train [30][1180/3239]	Time 0.622 (0.926)	Data Time 0.001 (0.022)	Loss 3.3228 (3.1007)	Entropy 0.77479 (0.77849)	Top-1 acc 46.094 (49.700)	Top-5 acc 67.188 (73.119)	lr 0.02148
Train [30][1190/3239]	Time 0.598 (0.926)	Data Time 0.001 (0.022)	Loss 3.0919 (3.1009)	Entropy 0.77492 (0.77846)	Top-1 acc 50.781 (49.699)	Top-5 acc 70.703 (73.115)	lr 0.02148
Train [30][1200/3239]	Time 0.638 (0.925)	Data Time 0.001 (0.021)	Loss 3.1753 (3.1008)	Entropy 0.77466 (0.77843)	Top-1 acc 48.438 (49.712)	Top-5 acc 71.875 (73.112)	lr 0.02148
Train [30][1210/3239]	Time 0.599 (0.925)	Data Time 0.001 (0.021)	Loss 3.0282 (3.1010)	Entropy 0.77432 (0.77840)	Top-1 acc 50.391 (49.706)	Top-5 acc 72.656 (73.106)	lr 0.02148
Train [30][1220/3239]	Time 0.655 (0.925)	Data Time 0.001 (0.021)	Loss 3.0843 (3.1011)	Entropy 0.77417 (0.77837)	Top-1 acc 47.656 (49.697)	Top-5 acc 71.094 (73.099)	lr 0.02148
Train [30][1230/3239]	Time 0.601 (0.924)	Data Time 0.001 (0.021)	Loss 3.0238 (3.1015)	Entropy 0.77405 (0.77833)	Top-1 acc 51.562 (49.698)	Top-5 acc 73.047 (73.092)	lr 0.02148
Train [30][1240/3239]	Time 0.622 (0.924)	Data Time 0.001 (0.021)	Loss 3.0059 (3.1019)	Entropy 0.77372 (0.77829)	Top-1 acc 52.344 (49.683)	Top-5 acc 74.609 (73.083)	lr 0.02148
Train [30][1250/3239]	Time 0.633 (0.923)	Data Time 0.001 (0.021)	Loss 2.7493 (3.1015)	Entropy 0.77383 (0.77826)	Top-1 acc 56.641 (49.678)	Top-5 acc 81.250 (73.093)	lr 0.02148
Train [30][1260/3239]	Time 0.456 (0.923)	Data Time 0.001 (0.020)	Loss 3.0371 (3.1011)	Entropy 0.77370 (0.77822)	Top-1 acc 50.000 (49.681)	Top-5 acc 75.781 (73.104)	lr 0.02148
Train [30][1270/3239]	Time 0.645 (0.922)	Data Time 0.001 (0.020)	Loss 3.0402 (3.1011)	Entropy 0.77359 (0.77819)	Top-1 acc 49.219 (49.681)	Top-5 acc 73.047 (73.101)	lr 0.02148
Train [30][1280/3239]	Time 0.625 (0.922)	Data Time 0.001 (0.020)	Loss 3.1208 (3.1016)	Entropy 0.77320 (0.77815)	Top-1 acc 48.828 (49.666)	Top-5 acc 71.875 (73.085)	lr 0.02148
Train [30][1290/3239]	Time 0.644 (0.921)	Data Time 0.001 (0.020)	Loss 3.0631 (3.1018)	Entropy 0.77305 (0.77811)	Top-1 acc 50.781 (49.669)	Top-5 acc 72.656 (73.081)	lr 0.02148
Train [30][1300/3239]	Time 0.631 (0.921)	Data Time 0.002 (0.020)	Loss 3.4903 (3.1018)	Entropy 0.77273 (0.77807)	Top-1 acc 42.188 (49.672)	Top-5 acc 65.234 (73.075)	lr 0.02148
Train [30][1310/3239]	Time 0.619 (0.920)	Data Time 0.001 (0.020)	Loss 3.2068 (3.1019)	Entropy 0.77305 (0.77803)	Top-1 acc 42.969 (49.670)	Top-5 acc 72.656 (73.069)	lr 0.02148
Train [30][1320/3239]	Time 0.685 (0.920)	Data Time 0.001 (0.020)	Loss 3.0890 (3.1020)	Entropy 0.77348 (0.77800)	Top-1 acc 52.734 (49.680)	Top-5 acc 75.000 (73.066)	lr 0.02147
Train [30][1330/3239]	Time 0.633 (0.920)	Data Time 0.001 (0.019)	Loss 3.0281 (3.1022)	Entropy 0.77332 (0.77796)	Top-1 acc 50.781 (49.682)	Top-5 acc 76.172 (73.070)	lr 0.02147
Train [30][1340/3239]	Time 0.602 (0.919)	Data Time 0.001 (0.019)	Loss 3.0914 (3.1023)	Entropy 0.77343 (0.77793)	Top-1 acc 48.438 (49.680)	Top-5 acc 72.266 (73.064)	lr 0.02147
Train [30][1350/3239]	Time 0.603 (0.919)	Data Time 0.001 (0.019)	Loss 2.8280 (3.1023)	Entropy 0.77309 (0.77789)	Top-1 acc 57.422 (49.684)	Top-5 acc 78.125 (73.062)	lr 0.02147
Train [30][1360/3239]	Time 0.611 (0.918)	Data Time 0.001 (0.019)	Loss 3.0322 (3.1026)	Entropy 0.77262 (0.77786)	Top-1 acc 52.734 (49.681)	Top-5 acc 74.609 (73.064)	lr 0.02147
Train [30][1370/3239]	Time 0.636 (0.918)	Data Time 0.001 (0.019)	Loss 3.2587 (3.1030)	Entropy 0.77277 (0.77782)	Top-1 acc 46.484 (49.674)	Top-5 acc 69.141 (73.054)	lr 0.02147
Train [30][1380/3239]	Time 0.623 (0.918)	Data Time 0.001 (0.019)	Loss 2.9554 (3.1033)	Entropy 0.77256 (0.77778)	Top-1 acc 53.516 (49.671)	Top-5 acc 75.781 (73.049)	lr 0.02147
Train [30][1390/3239]	Time 0.706 (0.917)	Data Time 0.001 (0.019)	Loss 3.2515 (3.1031)	Entropy 0.77220 (0.77774)	Top-1 acc 43.359 (49.669)	Top-5 acc 70.703 (73.054)	lr 0.02147
Train [30][1400/3239]	Time 0.616 (0.917)	Data Time 0.001 (0.019)	Loss 3.0769 (3.1032)	Entropy 0.77210 (0.77770)	Top-1 acc 51.172 (49.674)	Top-5 acc 73.828 (73.049)	lr 0.02147
Train [30][1410/3239]	Time 0.586 (0.917)	Data Time 0.001 (0.018)	Loss 3.0545 (3.1031)	Entropy 0.77187 (0.77767)	Top-1 acc 49.219 (49.671)	Top-5 acc 73.047 (73.048)	lr 0.02147
Train [30][1420/3239]	Time 0.624 (0.916)	Data Time 0.001 (0.018)	Loss 3.0625 (3.1030)	Entropy 0.77230 (0.77762)	Top-1 acc 48.047 (49.661)	Top-5 acc 73.438 (73.048)	lr 0.02147
Train [30][1430/3239]	Time 0.618 (0.916)	Data Time 0.001 (0.018)	Loss 3.1242 (3.1027)	Entropy 0.77260 (0.77759)	Top-1 acc 49.219 (49.665)	Top-5 acc 73.047 (73.058)	lr 0.02147
Train [30][1440/3239]	Time 0.582 (0.915)	Data Time 0.001 (0.018)	Loss 3.3160 (3.1033)	Entropy 0.77219 (0.77755)	Top-1 acc 46.484 (49.652)	Top-5 acc 70.312 (73.049)	lr 0.02147
Train [30][1450/3239]	Time 0.609 (0.915)	Data Time 0.001 (0.018)	Loss 3.2612 (3.1032)	Entropy 0.77201 (0.77752)	Top-1 acc 48.438 (49.663)	Top-5 acc 66.797 (73.047)	lr 0.02147
Train [30][1460/3239]	Time 0.595 (0.914)	Data Time 0.001 (0.018)	Loss 3.2103 (3.1036)	Entropy 0.77148 (0.77748)	Top-1 acc 48.828 (49.657)	Top-5 acc 72.656 (73.038)	lr 0.02147
Train [30][1470/3239]	Time 0.616 (0.914)	Data Time 0.001 (0.018)	Loss 3.1016 (3.1037)	Entropy 0.77157 (0.77744)	Top-1 acc 50.000 (49.653)	Top-5 acc 73.828 (73.033)	lr 0.02146
Train [30][1480/3239]	Time 0.684 (0.914)	Data Time 0.001 (0.018)	Loss 3.0759 (3.1035)	Entropy 0.77153 (0.77740)	Top-1 acc 50.000 (49.656)	Top-5 acc 75.391 (73.034)	lr 0.02146
Train [30][1490/3239]	Time 0.629 (0.914)	Data Time 0.001 (0.018)	Loss 2.9378 (3.1039)	Entropy 0.77177 (0.77736)	Top-1 acc 55.078 (49.650)	Top-5 acc 75.000 (73.029)	lr 0.02146
Train [30][1500/3239]	Time 0.635 (0.913)	Data Time 0.001 (0.017)	Loss 3.0748 (3.1041)	Entropy 0.77162 (0.77732)	Top-1 acc 52.734 (49.646)	Top-5 acc 74.219 (73.024)	lr 0.02146
Train [30][1510/3239]	Time 0.634 (0.913)	Data Time 0.001 (0.017)	Loss 3.0909 (3.1040)	Entropy 0.77148 (0.77728)	Top-1 acc 53.125 (49.642)	Top-5 acc 74.219 (73.025)	lr 0.02146
Train [30][1520/3239]	Time 0.609 (0.913)	Data Time 0.003 (0.017)	Loss 3.2313 (3.1035)	Entropy 0.77123 (0.77724)	Top-1 acc 48.438 (49.654)	Top-5 acc 71.094 (73.038)	lr 0.02146
Train [30][1530/3239]	Time 0.605 (0.912)	Data Time 0.001 (0.017)	Loss 3.0437 (3.1033)	Entropy 0.77121 (0.77720)	Top-1 acc 51.172 (49.658)	Top-5 acc 74.609 (73.042)	lr 0.02146
Train [30][1540/3239]	Time 0.627 (0.912)	Data Time 0.001 (0.017)	Loss 3.1077 (3.1033)	Entropy 0.77089 (0.77716)	Top-1 acc 50.000 (49.660)	Top-5 acc 73.438 (73.039)	lr 0.02146
Train [30][1550/3239]	Time 0.687 (0.912)	Data Time 0.001 (0.017)	Loss 3.0599 (3.1030)	Entropy 0.77094 (0.77712)	Top-1 acc 50.000 (49.669)	Top-5 acc 71.875 (73.045)	lr 0.02146
Train [30][1560/3239]	Time 0.603 (0.911)	Data Time 0.001 (0.017)	Loss 2.9472 (3.1030)	Entropy 0.77089 (0.77708)	Top-1 acc 53.125 (49.666)	Top-5 acc 77.344 (73.042)	lr 0.02146
Train [30][1570/3239]	Time 0.607 (0.911)	Data Time 0.001 (0.017)	Loss 3.2970 (3.1031)	Entropy 0.77111 (0.77704)	Top-1 acc 44.531 (49.663)	Top-5 acc 68.750 (73.044)	lr 0.02146
Train [30][1580/3239]	Time 0.614 (0.911)	Data Time 0.001 (0.017)	Loss 2.9809 (3.1033)	Entropy 0.77095 (0.77701)	Top-1 acc 52.734 (49.660)	Top-5 acc 75.000 (73.040)	lr 0.02146
Train [30][1590/3239]	Time 0.588 (0.910)	Data Time 0.001 (0.017)	Loss 3.1919 (3.1028)	Entropy 0.77074 (0.77697)	Top-1 acc 47.266 (49.664)	Top-5 acc 72.266 (73.054)	lr 0.02146
Train [30][1600/3239]	Time 0.616 (0.910)	Data Time 0.001 (0.017)	Loss 2.9689 (3.1031)	Entropy 0.77100 (0.77693)	Top-1 acc 53.125 (49.665)	Top-5 acc 75.391 (73.048)	lr 0.02146
Train [30][1610/3239]	Time 0.605 (0.910)	Data Time 0.001 (0.016)	Loss 2.9206 (3.1027)	Entropy 0.77105 (0.77689)	Top-1 acc 52.734 (49.667)	Top-5 acc 79.297 (73.057)	lr 0.02145
Train [30][1620/3239]	Time 0.556 (0.909)	Data Time 0.001 (0.016)	Loss 3.0254 (3.1027)	Entropy 0.77128 (0.77686)	Top-1 acc 51.172 (49.661)	Top-5 acc 75.781 (73.061)	lr 0.02145
Train [30][1630/3239]	Time 0.486 (0.909)	Data Time 0.001 (0.016)	Loss 3.2387 (3.1031)	Entropy 0.77116 (0.77682)	Top-1 acc 40.625 (49.653)	Top-5 acc 71.094 (73.059)	lr 0.02145
Train [30][1640/3239]	Time 0.868 (0.924)	Data Time 0.007 (0.016)	Loss 3.0987 (3.1029)	Entropy 0.77089 (0.77679)	Top-1 acc 53.125 (49.654)	Top-5 acc 71.875 (73.060)	lr 0.02145
Train [30][1650/3239]	Time 0.622 (0.924)	Data Time 0.002 (0.016)	Loss 3.0371 (3.1036)	Entropy 0.77099 (0.77675)	Top-1 acc 48.438 (49.642)	Top-5 acc 74.609 (73.041)	lr 0.02145
Train [30][1660/3239]	Time 0.606 (0.923)	Data Time 0.001 (0.016)	Loss 3.1296 (3.1035)	Entropy 0.77110 (0.77672)	Top-1 acc 44.922 (49.635)	Top-5 acc 72.656 (73.046)	lr 0.02145
Train [30][1670/3239]	Time 0.622 (0.923)	Data Time 0.001 (0.016)	Loss 3.2731 (3.1037)	Entropy 0.77083 (0.77668)	Top-1 acc 43.359 (49.630)	Top-5 acc 65.234 (73.036)	lr 0.02145
Train [30][1680/3239]	Time 0.606 (0.923)	Data Time 0.001 (0.016)	Loss 3.2223 (3.1034)	Entropy 0.77082 (0.77665)	Top-1 acc 48.828 (49.634)	Top-5 acc 70.312 (73.040)	lr 0.02145
Train [30][1690/3239]	Time 0.644 (0.922)	Data Time 0.003 (0.016)	Loss 3.2875 (3.1037)	Entropy 0.77081 (0.77661)	Top-1 acc 42.578 (49.627)	Top-5 acc 70.312 (73.036)	lr 0.02145
Train [30][1700/3239]	Time 0.613 (0.922)	Data Time 0.001 (0.016)	Loss 3.2628 (3.1037)	Entropy 0.77073 (0.77658)	Top-1 acc 48.828 (49.631)	Top-5 acc 70.703 (73.040)	lr 0.02145
Train [30][1710/3239]	Time 0.732 (0.922)	Data Time 0.001 (0.016)	Loss 3.1488 (3.1032)	Entropy 0.77039 (0.77654)	Top-1 acc 48.047 (49.639)	Top-5 acc 70.703 (73.048)	lr 0.02145
Train [30][1720/3239]	Time 0.579 (0.921)	Data Time 0.002 (0.016)	Loss 3.0868 (3.1033)	Entropy 0.77050 (0.77651)	Top-1 acc 51.172 (49.639)	Top-5 acc 74.609 (73.044)	lr 0.02145
Train [30][1730/3239]	Time 0.622 (0.921)	Data Time 0.001 (0.015)	Loss 3.2976 (3.1035)	Entropy 0.77088 (0.77647)	Top-1 acc 45.312 (49.633)	Top-5 acc 69.531 (73.040)	lr 0.02145
Train [30][1740/3239]	Time 0.583 (0.921)	Data Time 0.001 (0.015)	Loss 3.1496 (3.1039)	Entropy 0.77075 (0.77644)	Top-1 acc 47.656 (49.626)	Top-5 acc 71.094 (73.037)	lr 0.02145
Train [30][1750/3239]	Time 0.467 (0.920)	Data Time 0.001 (0.015)	Loss 3.1905 (3.1039)	Entropy 0.77091 (0.77641)	Top-1 acc 46.875 (49.627)	Top-5 acc 69.531 (73.033)	lr 0.02144
Train [30][1760/3239]	Time 0.570 (0.920)	Data Time 0.001 (0.015)	Loss 3.0817 (3.1039)	Entropy 0.77092 (0.77638)	Top-1 acc 48.438 (49.626)	Top-5 acc 75.391 (73.032)	lr 0.02144
Train [30][1770/3239]	Time 0.586 (0.919)	Data Time 0.001 (0.015)	Loss 3.1564 (3.1046)	Entropy 0.77084 (0.77635)	Top-1 acc 46.094 (49.607)	Top-5 acc 74.609 (73.021)	lr 0.02144
Train [30][1780/3239]	Time 0.609 (0.919)	Data Time 0.003 (0.015)	Loss 3.1510 (3.1048)	Entropy 0.77090 (0.77632)	Top-1 acc 45.703 (49.603)	Top-5 acc 73.828 (73.023)	lr 0.02144
Train [30][1790/3239]	Time 0.639 (0.919)	Data Time 0.001 (0.015)	Loss 2.9103 (3.1043)	Entropy 0.77064 (0.77629)	Top-1 acc 53.516 (49.614)	Top-5 acc 75.391 (73.032)	lr 0.02144
Train [30][1800/3239]	Time 0.582 (0.919)	Data Time 0.001 (0.015)	Loss 3.1350 (3.1046)	Entropy 0.77041 (0.77625)	Top-1 acc 51.562 (49.618)	Top-5 acc 71.875 (73.025)	lr 0.02144
Train [30][1810/3239]	Time 0.588 (0.918)	Data Time 0.001 (0.015)	Loss 3.1323 (3.1046)	Entropy 0.77056 (0.77622)	Top-1 acc 48.047 (49.618)	Top-5 acc 71.094 (73.024)	lr 0.02144
Train [30][1820/3239]	Time 0.607 (0.918)	Data Time 0.001 (0.015)	Loss 3.2643 (3.1048)	Entropy 0.77047 (0.77619)	Top-1 acc 45.703 (49.611)	Top-5 acc 69.531 (73.018)	lr 0.02144
Train [30][1830/3239]	Time 0.605 (0.918)	Data Time 0.001 (0.015)	Loss 2.9768 (3.1046)	Entropy 0.77032 (0.77616)	Top-1 acc 56.641 (49.613)	Top-5 acc 76.953 (73.026)	lr 0.02144
Train [30][1840/3239]	Time 0.608 (0.917)	Data Time 0.001 (0.015)	Loss 3.0585 (3.1048)	Entropy 0.77084 (0.77613)	Top-1 acc 49.609 (49.611)	Top-5 acc 75.781 (73.018)	lr 0.02144
Train [30][1850/3239]	Time 0.600 (0.917)	Data Time 0.001 (0.015)	Loss 2.9657 (3.1043)	Entropy 0.77037 (0.77610)	Top-1 acc 49.219 (49.616)	Top-5 acc 78.125 (73.030)	lr 0.02144
Train [30][1860/3239]	Time 0.588 (0.917)	Data Time 0.001 (0.014)	Loss 3.1342 (3.1045)	Entropy 0.77037 (0.77607)	Top-1 acc 47.656 (49.611)	Top-5 acc 73.047 (73.026)	lr 0.02144
Train [30][1870/3239]	Time 0.740 (0.917)	Data Time 0.001 (0.014)	Loss 2.9904 (3.1043)	Entropy 0.76985 (0.77603)	Top-1 acc 52.734 (49.619)	Top-5 acc 76.953 (73.027)	lr 0.02144
Train [30][1880/3239]	Time 0.662 (0.917)	Data Time 0.001 (0.014)	Loss 2.9679 (3.1042)	Entropy 0.76948 (0.77600)	Top-1 acc 52.734 (49.623)	Top-5 acc 77.344 (73.036)	lr 0.02144
Train [30][1890/3239]	Time 0.610 (0.916)	Data Time 0.001 (0.014)	Loss 3.0268 (3.1042)	Entropy 0.76891 (0.77597)	Top-1 acc 53.516 (49.629)	Top-5 acc 74.609 (73.038)	lr 0.02143
Train [30][1900/3239]	Time 0.629 (0.916)	Data Time 0.001 (0.014)	Loss 2.9780 (3.1039)	Entropy 0.76836 (0.77593)	Top-1 acc 53.125 (49.639)	Top-5 acc 77.344 (73.044)	lr 0.02143
Train [30][1910/3239]	Time 0.571 (0.916)	Data Time 0.001 (0.014)	Loss 3.0858 (3.1040)	Entropy 0.76807 (0.77589)	Top-1 acc 52.344 (49.638)	Top-5 acc 73.828 (73.038)	lr 0.02143
Train [30][1920/3239]	Time 0.452 (0.915)	Data Time 0.001 (0.014)	Loss 3.2886 (3.1042)	Entropy 0.76826 (0.77585)	Top-1 acc 44.922 (49.638)	Top-5 acc 73.047 (73.028)	lr 0.02143
Train [30][1930/3239]	Time 0.632 (0.915)	Data Time 0.001 (0.014)	Loss 3.0100 (3.1044)	Entropy 0.76811 (0.77581)	Top-1 acc 54.688 (49.634)	Top-5 acc 74.609 (73.027)	lr 0.02143
Train [30][1940/3239]	Time 0.761 (0.915)	Data Time 0.001 (0.014)	Loss 2.8930 (3.1042)	Entropy 0.76808 (0.77577)	Top-1 acc 55.859 (49.640)	Top-5 acc 75.391 (73.034)	lr 0.02143
Train [30][1950/3239]	Time 0.624 (0.914)	Data Time 0.001 (0.014)	Loss 2.9188 (3.1042)	Entropy 0.76836 (0.77573)	Top-1 acc 51.172 (49.642)	Top-5 acc 82.422 (73.038)	lr 0.02143
Train [30][1960/3239]	Time 0.586 (0.914)	Data Time 0.001 (0.014)	Loss 3.1026 (3.1044)	Entropy 0.76810 (0.77569)	Top-1 acc 50.391 (49.644)	Top-5 acc 71.094 (73.033)	lr 0.02143
Train [30][1970/3239]	Time 0.618 (0.914)	Data Time 0.001 (0.014)	Loss 3.0434 (3.1044)	Entropy 0.76820 (0.77565)	Top-1 acc 52.734 (49.646)	Top-5 acc 72.656 (73.029)	lr 0.02143
Train [30][1980/3239]	Time 0.615 (0.914)	Data Time 0.001 (0.014)	Loss 2.9674 (3.1043)	Entropy 0.76801 (0.77561)	Top-1 acc 52.344 (49.650)	Top-5 acc 75.391 (73.029)	lr 0.02143
Train [30][1990/3239]	Time 0.594 (0.913)	Data Time 0.001 (0.014)	Loss 3.1777 (3.1044)	Entropy 0.76775 (0.77558)	Top-1 acc 48.828 (49.652)	Top-5 acc 72.656 (73.032)	lr 0.02143
Train [30][2000/3239]	Time 0.610 (0.913)	Data Time 0.001 (0.014)	Loss 2.9929 (3.1042)	Entropy 0.76807 (0.77554)	Top-1 acc 51.953 (49.653)	Top-5 acc 75.391 (73.033)	lr 0.02143
Train [30][2010/3239]	Time 0.596 (0.913)	Data Time 0.001 (0.014)	Loss 3.2470 (3.1044)	Entropy 0.76805 (0.77550)	Top-1 acc 45.703 (49.646)	Top-5 acc 68.359 (73.026)	lr 0.02143
Train [30][2020/3239]	Time 0.608 (0.913)	Data Time 0.001 (0.013)	Loss 3.0450 (3.1043)	Entropy 0.76791 (0.77546)	Top-1 acc 50.391 (49.645)	Top-5 acc 72.656 (73.029)	lr 0.02143
Train [30][2030/3239]	Time 0.800 (0.912)	Data Time 0.001 (0.013)	Loss 2.9732 (3.1044)	Entropy 0.76812 (0.77543)	Top-1 acc 50.781 (49.642)	Top-5 acc 78.516 (73.033)	lr 0.02142
Train [30][2040/3239]	Time 0.604 (0.912)	Data Time 0.001 (0.013)	Loss 3.2276 (3.1044)	Entropy 0.76814 (0.77539)	Top-1 acc 42.969 (49.642)	Top-5 acc 73.828 (73.033)	lr 0.02142
Train [30][2050/3239]	Time 0.600 (0.912)	Data Time 0.002 (0.013)	Loss 2.8893 (3.1042)	Entropy 0.76833 (0.77535)	Top-1 acc 53.125 (49.643)	Top-5 acc 78.516 (73.037)	lr 0.02142
Train [30][2060/3239]	Time 0.599 (0.912)	Data Time 0.001 (0.013)	Loss 2.9081 (3.1040)	Entropy 0.76870 (0.77532)	Top-1 acc 54.297 (49.645)	Top-5 acc 79.297 (73.041)	lr 0.02142
Train [30][2070/3239]	Time 0.601 (0.912)	Data Time 0.001 (0.013)	Loss 3.0171 (3.1038)	Entropy 0.76846 (0.77529)	Top-1 acc 51.562 (49.653)	Top-5 acc 73.438 (73.045)	lr 0.02142
Train [30][2080/3239]	Time 0.581 (0.911)	Data Time 0.001 (0.013)	Loss 3.0717 (3.1035)	Entropy 0.76819 (0.77525)	Top-1 acc 51.953 (49.663)	Top-5 acc 75.391 (73.053)	lr 0.02142
Train [30][2090/3239]	Time 0.594 (0.911)	Data Time 0.002 (0.013)	Loss 3.0070 (3.1036)	Entropy 0.76763 (0.77522)	Top-1 acc 50.781 (49.659)	Top-5 acc 75.391 (73.053)	lr 0.02142
Train [30][2100/3239]	Time 0.691 (0.911)	Data Time 0.001 (0.013)	Loss 3.2120 (3.1035)	Entropy 0.76776 (0.77518)	Top-1 acc 47.656 (49.661)	Top-5 acc 73.438 (73.055)	lr 0.02142
Train [30][2110/3239]	Time 0.631 (0.910)	Data Time 0.002 (0.013)	Loss 3.3309 (3.1033)	Entropy 0.76743 (0.77515)	Top-1 acc 42.969 (49.662)	Top-5 acc 68.750 (73.060)	lr 0.02142
Train [30][2120/3239]	Time 0.565 (0.910)	Data Time 0.001 (0.013)	Loss 3.0225 (3.1033)	Entropy 0.76754 (0.77511)	Top-1 acc 51.953 (49.657)	Top-5 acc 76.953 (73.062)	lr 0.02142
Train [30][2130/3239]	Time 0.617 (0.910)	Data Time 0.001 (0.013)	Loss 3.0292 (3.1033)	Entropy 0.76723 (0.77508)	Top-1 acc 53.906 (49.654)	Top-5 acc 73.828 (73.060)	lr 0.02142
Train [30][2140/3239]	Time 0.597 (0.910)	Data Time 0.001 (0.013)	Loss 3.0383 (3.1032)	Entropy 0.76725 (0.77504)	Top-1 acc 47.656 (49.658)	Top-5 acc 74.609 (73.062)	lr 0.02142
Train [30][2150/3239]	Time 0.633 (0.910)	Data Time 0.001 (0.013)	Loss 2.9313 (3.1031)	Entropy 0.76698 (0.77500)	Top-1 acc 53.906 (49.660)	Top-5 acc 75.391 (73.068)	lr 0.02142
Train [30][2160/3239]	Time 0.579 (0.909)	Data Time 0.001 (0.013)	Loss 3.2641 (3.1033)	Entropy 0.76663 (0.77496)	Top-1 acc 48.438 (49.657)	Top-5 acc 66.797 (73.059)	lr 0.02142
Train [30][2170/3239]	Time 0.640 (0.909)	Data Time 0.001 (0.013)	Loss 3.1185 (3.1032)	Entropy 0.76678 (0.77493)	Top-1 acc 46.875 (49.658)	Top-5 acc 73.047 (73.065)	lr 0.02141
Train [30][2180/3239]	Time 0.610 (0.909)	Data Time 0.001 (0.013)	Loss 3.0389 (3.1034)	Entropy 0.76667 (0.77489)	Top-1 acc 51.172 (49.660)	Top-5 acc 75.000 (73.063)	lr 0.02141
Train [30][2190/3239]	Time 0.718 (0.909)	Data Time 0.001 (0.013)	Loss 3.2151 (3.1035)	Entropy 0.76647 (0.77485)	Top-1 acc 49.609 (49.658)	Top-5 acc 71.094 (73.059)	lr 0.02141
Train [30][2200/3239]	Time 0.570 (0.909)	Data Time 0.001 (0.013)	Loss 3.0953 (3.1038)	Entropy 0.76640 (0.77481)	Top-1 acc 51.172 (49.652)	Top-5 acc 71.484 (73.055)	lr 0.02141
Train [30][2210/3239]	Time 0.616 (0.908)	Data Time 0.001 (0.012)	Loss 2.9981 (3.1038)	Entropy 0.76630 (0.77477)	Top-1 acc 50.781 (49.648)	Top-5 acc 75.000 (73.056)	lr 0.02141
Train [30][2220/3239]	Time 0.658 (0.908)	Data Time 0.001 (0.012)	Loss 2.9681 (3.1038)	Entropy 0.76669 (0.77474)	Top-1 acc 52.344 (49.646)	Top-5 acc 76.562 (73.056)	lr 0.02141
Train [30][2230/3239]	Time 0.612 (0.908)	Data Time 0.001 (0.012)	Loss 3.1806 (3.1039)	Entropy 0.76630 (0.77470)	Top-1 acc 48.047 (49.645)	Top-5 acc 71.094 (73.052)	lr 0.02141
Train [30][2240/3239]	Time 0.631 (0.908)	Data Time 0.001 (0.012)	Loss 3.1794 (3.1039)	Entropy 0.76637 (0.77466)	Top-1 acc 49.609 (49.640)	Top-5 acc 70.312 (73.050)	lr 0.02141
Train [30][2250/3239]	Time 0.473 (0.908)	Data Time 0.001 (0.012)	Loss 3.0330 (3.1040)	Entropy 0.76653 (0.77463)	Top-1 acc 50.000 (49.644)	Top-5 acc 73.828 (73.045)	lr 0.02141
Train [30][2260/3239]	Time 0.703 (0.907)	Data Time 0.001 (0.012)	Loss 3.1000 (3.1040)	Entropy 0.76638 (0.77459)	Top-1 acc 51.172 (49.636)	Top-5 acc 72.266 (73.043)	lr 0.02141
Train [30][2270/3239]	Time 0.589 (0.907)	Data Time 0.001 (0.012)	Loss 3.1701 (3.1040)	Entropy 0.76645 (0.77455)	Top-1 acc 48.828 (49.640)	Top-5 acc 71.875 (73.044)	lr 0.02141
Train [30][2280/3239]	Time 0.624 (0.907)	Data Time 0.001 (0.012)	Loss 2.8833 (3.1038)	Entropy 0.76677 (0.77452)	Top-1 acc 52.344 (49.639)	Top-5 acc 78.906 (73.049)	lr 0.02141
Train [30][2290/3239]	Time 0.604 (0.907)	Data Time 0.001 (0.012)	Loss 2.9308 (3.1036)	Entropy 0.76606 (0.77448)	Top-1 acc 51.172 (49.642)	Top-5 acc 75.000 (73.054)	lr 0.02141
Train [30][2300/3239]	Time 0.594 (0.917)	Data Time 0.002 (0.012)	Loss 3.2738 (3.1038)	Entropy 0.76591 (0.77445)	Top-1 acc 45.703 (49.641)	Top-5 acc 70.703 (73.055)	lr 0.02141
Train [30][2310/3239]	Time 0.626 (0.917)	Data Time 0.001 (0.012)	Loss 3.0457 (3.1038)	Entropy 0.76557 (0.77441)	Top-1 acc 51.953 (49.639)	Top-5 acc 74.219 (73.052)	lr 0.02141
Train [30][2320/3239]	Time 0.602 (0.917)	Data Time 0.001 (0.012)	Loss 2.8316 (3.1037)	Entropy 0.76548 (0.77437)	Top-1 acc 53.516 (49.639)	Top-5 acc 80.859 (73.058)	lr 0.02140
Train [30][2330/3239]	Time 0.592 (0.917)	Data Time 0.002 (0.012)	Loss 3.0175 (3.1037)	Entropy 0.76557 (0.77433)	Top-1 acc 49.219 (49.641)	Top-5 acc 73.828 (73.059)	lr 0.02140
Train [30][2340/3239]	Time 0.626 (0.916)	Data Time 0.001 (0.012)	Loss 3.0796 (3.1034)	Entropy 0.76574 (0.77430)	Top-1 acc 49.219 (49.651)	Top-5 acc 73.438 (73.061)	lr 0.02140
Train [30][2350/3239]	Time 0.692 (0.916)	Data Time 0.001 (0.012)	Loss 2.8531 (3.1034)	Entropy 0.76602 (0.77426)	Top-1 acc 51.953 (49.650)	Top-5 acc 76.953 (73.058)	lr 0.02140
Train [30][2360/3239]	Time 0.591 (0.916)	Data Time 0.001 (0.012)	Loss 3.0502 (3.1034)	Entropy 0.76613 (0.77422)	Top-1 acc 53.125 (49.653)	Top-5 acc 73.828 (73.056)	lr 0.02140
Train [30][2370/3239]	Time 0.600 (0.916)	Data Time 0.001 (0.012)	Loss 3.1987 (3.1034)	Entropy 0.76581 (0.77419)	Top-1 acc 47.656 (49.651)	Top-5 acc 69.531 (73.059)	lr 0.02140
Train [30][2380/3239]	Time 0.630 (0.915)	Data Time 0.002 (0.012)	Loss 3.0333 (3.1032)	Entropy 0.76560 (0.77415)	Top-1 acc 51.172 (49.655)	Top-5 acc 76.562 (73.063)	lr 0.02140
Train [30][2390/3239]	Time 0.602 (0.915)	Data Time 0.001 (0.012)	Loss 3.0925 (3.1032)	Entropy 0.76579 (0.77412)	Top-1 acc 52.344 (49.653)	Top-5 acc 69.922 (73.058)	lr 0.02140
Train [30][2400/3239]	Time 0.599 (0.915)	Data Time 0.001 (0.012)	Loss 2.9623 (3.1032)	Entropy 0.76573 (0.77408)	Top-1 acc 53.516 (49.655)	Top-5 acc 74.219 (73.060)	lr 0.02140
Train [30][2410/3239]	Time 0.600 (0.915)	Data Time 0.001 (0.012)	Loss 2.9407 (3.1030)	Entropy 0.76554 (0.77405)	Top-1 acc 56.250 (49.660)	Top-5 acc 78.516 (73.064)	lr 0.02140
Train [30][2420/3239]	Time 0.677 (0.914)	Data Time 0.001 (0.012)	Loss 3.3005 (3.1032)	Entropy 0.76555 (0.77401)	Top-1 acc 44.922 (49.658)	Top-5 acc 70.312 (73.060)	lr 0.02140
Train [30][2430/3239]	Time 0.618 (0.914)	Data Time 0.001 (0.012)	Loss 3.1299 (3.1032)	Entropy 0.76586 (0.77398)	Top-1 acc 46.484 (49.659)	Top-5 acc 71.094 (73.061)	lr 0.02140
Train [30][2440/3239]	Time 0.605 (0.914)	Data Time 0.001 (0.011)	Loss 3.2259 (3.1028)	Entropy 0.76594 (0.77394)	Top-1 acc 46.875 (49.669)	Top-5 acc 68.359 (73.070)	lr 0.02140
Train [30][2450/3239]	Time 0.608 (0.914)	Data Time 0.001 (0.011)	Loss 3.1048 (3.1025)	Entropy 0.76600 (0.77391)	Top-1 acc 48.828 (49.672)	Top-5 acc 73.828 (73.076)	lr 0.02140
Train [30][2460/3239]	Time 0.628 (0.914)	Data Time 0.002 (0.011)	Loss 3.1488 (3.1026)	Entropy 0.76558 (0.77388)	Top-1 acc 47.656 (49.671)	Top-5 acc 70.312 (73.074)	lr 0.02139
Train [30][2470/3239]	Time 0.610 (0.914)	Data Time 0.001 (0.011)	Loss 3.0375 (3.1028)	Entropy 0.76586 (0.77385)	Top-1 acc 51.172 (49.669)	Top-5 acc 75.391 (73.071)	lr 0.02139
Train [30][2480/3239]	Time 0.630 (0.913)	Data Time 0.001 (0.011)	Loss 3.0811 (3.1028)	Entropy 0.76584 (0.77381)	Top-1 acc 47.266 (49.670)	Top-5 acc 73.828 (73.074)	lr 0.02139
Train [30][2490/3239]	Time 0.593 (0.913)	Data Time 0.001 (0.011)	Loss 3.2342 (3.1026)	Entropy 0.76623 (0.77378)	Top-1 acc 45.312 (49.671)	Top-5 acc 71.094 (73.079)	lr 0.02139
Train [30][2500/3239]	Time 0.595 (0.913)	Data Time 0.001 (0.011)	Loss 3.1633 (3.1024)	Entropy 0.76589 (0.77375)	Top-1 acc 46.875 (49.676)	Top-5 acc 70.312 (73.082)	lr 0.02139
Train [30][2510/3239]	Time 0.590 (0.913)	Data Time 0.002 (0.011)	Loss 3.1534 (3.1026)	Entropy 0.76579 (0.77372)	Top-1 acc 47.656 (49.672)	Top-5 acc 74.219 (73.082)	lr 0.02139
Train [30][2520/3239]	Time 0.592 (0.913)	Data Time 0.001 (0.011)	Loss 3.2900 (3.1024)	Entropy 0.76543 (0.77369)	Top-1 acc 48.047 (49.679)	Top-5 acc 69.922 (73.085)	lr 0.02139
Train [30][2530/3239]	Time 0.481 (0.912)	Data Time 0.001 (0.011)	Loss 3.0589 (3.1023)	Entropy 0.76492 (0.77366)	Top-1 acc 51.953 (49.682)	Top-5 acc 71.875 (73.087)	lr 0.02139
Train [30][2540/3239]	Time 0.595 (0.912)	Data Time 0.001 (0.011)	Loss 3.1496 (3.1022)	Entropy 0.76483 (0.77362)	Top-1 acc 51.953 (49.687)	Top-5 acc 70.312 (73.091)	lr 0.02139
Train [30][2550/3239]	Time 0.583 (0.912)	Data Time 0.001 (0.011)	Loss 3.3759 (3.1021)	Entropy 0.76514 (0.77359)	Top-1 acc 41.797 (49.689)	Top-5 acc 66.016 (73.091)	lr 0.02139
Train [30][2560/3239]	Time 0.486 (0.911)	Data Time 0.001 (0.011)	Loss 3.1496 (3.1021)	Entropy 0.76480 (0.77356)	Top-1 acc 49.609 (49.694)	Top-5 acc 72.266 (73.090)	lr 0.02139
Train [30][2570/3239]	Time 0.453 (0.911)	Data Time 0.001 (0.011)	Loss 3.2730 (3.1021)	Entropy 0.76460 (0.77352)	Top-1 acc 47.266 (49.696)	Top-5 acc 66.016 (73.088)	lr 0.02139
Train [30][2580/3239]	Time 0.694 (0.910)	Data Time 0.002 (0.011)	Loss 3.2480 (3.1019)	Entropy 0.76446 (0.77349)	Top-1 acc 47.656 (49.701)	Top-5 acc 68.750 (73.093)	lr 0.02139
Train [30][2590/3239]	Time 0.621 (0.910)	Data Time 0.001 (0.011)	Loss 3.0778 (3.1018)	Entropy 0.76458 (0.77345)	Top-1 acc 50.781 (49.703)	Top-5 acc 74.609 (73.093)	lr 0.02139
Train [30][2600/3239]	Time 0.588 (0.910)	Data Time 0.001 (0.011)	Loss 3.0131 (3.1017)	Entropy 0.76429 (0.77342)	Top-1 acc 52.734 (49.707)	Top-5 acc 74.219 (73.092)	lr 0.02138
Train [30][2610/3239]	Time 0.612 (0.910)	Data Time 0.003 (0.011)	Loss 3.0650 (3.1019)	Entropy 0.76416 (0.77338)	Top-1 acc 46.875 (49.701)	Top-5 acc 76.172 (73.089)	lr 0.02138
Train [30][2620/3239]	Time 0.578 (0.909)	Data Time 0.001 (0.011)	Loss 3.2805 (3.1023)	Entropy 0.76405 (0.77335)	Top-1 acc 47.656 (49.693)	Top-5 acc 68.359 (73.079)	lr 0.02138
Train [30][2630/3239]	Time 0.609 (0.909)	Data Time 0.001 (0.011)	Loss 2.8847 (3.1020)	Entropy 0.76418 (0.77331)	Top-1 acc 53.516 (49.700)	Top-5 acc 80.078 (73.083)	lr 0.02138
Train [30][2640/3239]	Time 0.611 (0.909)	Data Time 0.001 (0.011)	Loss 3.2766 (3.1022)	Entropy 0.76423 (0.77328)	Top-1 acc 48.047 (49.696)	Top-5 acc 69.141 (73.083)	lr 0.02138
Train [30][2650/3239]	Time 0.687 (0.909)	Data Time 0.001 (0.011)	Loss 3.1211 (3.1023)	Entropy 0.76389 (0.77324)	Top-1 acc 49.609 (49.697)	Top-5 acc 73.047 (73.081)	lr 0.02138
Train [30][2660/3239]	Time 0.622 (0.909)	Data Time 0.001 (0.011)	Loss 3.3004 (3.1025)	Entropy 0.76411 (0.77321)	Top-1 acc 44.141 (49.692)	Top-5 acc 69.922 (73.076)	lr 0.02138
Train [30][2670/3239]	Time 0.613 (0.909)	Data Time 0.001 (0.011)	Loss 3.0420 (3.1025)	Entropy 0.76407 (0.77317)	Top-1 acc 50.781 (49.694)	Top-5 acc 71.484 (73.075)	lr 0.02138
Train [30][2680/3239]	Time 0.592 (0.909)	Data Time 0.001 (0.011)	Loss 3.0874 (3.1025)	Entropy 0.76369 (0.77314)	Top-1 acc 46.094 (49.694)	Top-5 acc 74.609 (73.076)	lr 0.02138
Train [30][2690/3239]	Time 0.602 (0.908)	Data Time 0.001 (0.011)	Loss 2.9752 (3.1024)	Entropy 0.76311 (0.77310)	Top-1 acc 53.125 (49.694)	Top-5 acc 77.734 (73.076)	lr 0.02138
Train [30][2700/3239]	Time 0.616 (0.908)	Data Time 0.001 (0.011)	Loss 3.0214 (3.1025)	Entropy 0.76317 (0.77306)	Top-1 acc 50.000 (49.690)	Top-5 acc 71.094 (73.074)	lr 0.02138
Train [30][2710/3239]	Time 0.591 (0.908)	Data Time 0.001 (0.011)	Loss 3.2252 (3.1026)	Entropy 0.76327 (0.77303)	Top-1 acc 46.094 (49.688)	Top-5 acc 73.828 (73.074)	lr 0.02138
Train [30][2720/3239]	Time 0.594 (0.908)	Data Time 0.001 (0.010)	Loss 3.1396 (3.1027)	Entropy 0.76302 (0.77299)	Top-1 acc 47.656 (49.688)	Top-5 acc 74.609 (73.073)	lr 0.02138
Train [30][2730/3239]	Time 0.614 (0.908)	Data Time 0.001 (0.010)	Loss 3.3788 (3.1028)	Entropy 0.76303 (0.77295)	Top-1 acc 46.484 (49.691)	Top-5 acc 66.406 (73.071)	lr 0.02138
Train [30][2740/3239]	Time 0.632 (0.907)	Data Time 0.001 (0.010)	Loss 3.1811 (3.1027)	Entropy 0.76316 (0.77292)	Top-1 acc 45.703 (49.690)	Top-5 acc 67.969 (73.072)	lr 0.02137
Train [30][2750/3239]	Time 0.608 (0.907)	Data Time 0.001 (0.010)	Loss 3.4108 (3.1029)	Entropy 0.76309 (0.77288)	Top-1 acc 43.359 (49.686)	Top-5 acc 66.406 (73.069)	lr 0.02137
Train [30][2760/3239]	Time 0.567 (0.907)	Data Time 0.001 (0.010)	Loss 3.3695 (3.1031)	Entropy 0.76324 (0.77285)	Top-1 acc 43.750 (49.687)	Top-5 acc 66.797 (73.065)	lr 0.02137
Train [30][2770/3239]	Time 0.587 (0.907)	Data Time 0.001 (0.010)	Loss 3.1511 (3.1030)	Entropy 0.76362 (0.77281)	Top-1 acc 52.344 (49.686)	Top-5 acc 71.094 (73.065)	lr 0.02137
Train [30][2780/3239]	Time 0.589 (0.907)	Data Time 0.001 (0.010)	Loss 3.2510 (3.1033)	Entropy 0.76366 (0.77278)	Top-1 acc 47.266 (49.679)	Top-5 acc 71.484 (73.060)	lr 0.02137
Train [30][2790/3239]	Time 0.589 (0.907)	Data Time 0.001 (0.010)	Loss 3.0399 (3.1034)	Entropy 0.76346 (0.77275)	Top-1 acc 53.516 (49.671)	Top-5 acc 71.875 (73.055)	lr 0.02137
Train [30][2800/3239]	Time 0.598 (0.906)	Data Time 0.001 (0.010)	Loss 3.0074 (3.1033)	Entropy 0.76347 (0.77271)	Top-1 acc 50.000 (49.673)	Top-5 acc 71.484 (73.057)	lr 0.02137
Train [30][2810/3239]	Time 0.700 (0.906)	Data Time 0.001 (0.010)	Loss 3.0305 (3.1030)	Entropy 0.76353 (0.77268)	Top-1 acc 49.219 (49.681)	Top-5 acc 73.828 (73.063)	lr 0.02137
Train [30][2820/3239]	Time 0.601 (0.906)	Data Time 0.001 (0.010)	Loss 3.0918 (3.1031)	Entropy 0.76375 (0.77265)	Top-1 acc 50.781 (49.680)	Top-5 acc 73.047 (73.063)	lr 0.02137
Train [30][2830/3239]	Time 0.608 (0.906)	Data Time 0.001 (0.010)	Loss 3.1581 (3.1030)	Entropy 0.76395 (0.77262)	Top-1 acc 50.000 (49.688)	Top-5 acc 70.312 (73.065)	lr 0.02137
Train [30][2840/3239]	Time 0.592 (0.906)	Data Time 0.001 (0.010)	Loss 2.7788 (3.1027)	Entropy 0.76362 (0.77259)	Top-1 acc 56.641 (49.694)	Top-5 acc 82.812 (73.071)	lr 0.02137
Train [30][2850/3239]	Time 0.646 (0.906)	Data Time 0.001 (0.010)	Loss 3.1421 (3.1028)	Entropy 0.76362 (0.77256)	Top-1 acc 46.484 (49.689)	Top-5 acc 71.484 (73.069)	lr 0.02137
Train [30][2860/3239]	Time 0.605 (0.906)	Data Time 0.001 (0.010)	Loss 3.0067 (3.1027)	Entropy 0.76384 (0.77252)	Top-1 acc 53.516 (49.690)	Top-5 acc 74.609 (73.073)	lr 0.02137
Train [30][2870/3239]	Time 0.594 (0.905)	Data Time 0.001 (0.010)	Loss 3.2616 (3.1030)	Entropy 0.76373 (0.77249)	Top-1 acc 45.312 (49.684)	Top-5 acc 67.188 (73.067)	lr 0.02137
Train [30][2880/3239]	Time 0.692 (0.905)	Data Time 0.001 (0.010)	Loss 3.1192 (3.1030)	Entropy 0.76339 (0.77246)	Top-1 acc 50.000 (49.684)	Top-5 acc 72.266 (73.065)	lr 0.02136
Train [30][2890/3239]	Time 0.528 (0.905)	Data Time 0.001 (0.010)	Loss 3.2858 (3.1032)	Entropy 0.76327 (0.77243)	Top-1 acc 44.922 (49.678)	Top-5 acc 69.922 (73.062)	lr 0.02136
Train [30][2900/3239]	Time 0.642 (0.905)	Data Time 0.001 (0.010)	Loss 3.0736 (3.1034)	Entropy 0.76328 (0.77240)	Top-1 acc 51.172 (49.673)	Top-5 acc 72.656 (73.060)	lr 0.02136
Train [30][2910/3239]	Time 0.613 (0.905)	Data Time 0.001 (0.010)	Loss 3.0251 (3.1031)	Entropy 0.76319 (0.77237)	Top-1 acc 53.125 (49.680)	Top-5 acc 74.609 (73.066)	lr 0.02136
Train [30][2920/3239]	Time 0.587 (0.904)	Data Time 0.001 (0.010)	Loss 3.2367 (3.1033)	Entropy 0.76326 (0.77234)	Top-1 acc 48.438 (49.676)	Top-5 acc 69.922 (73.062)	lr 0.02136
Train [30][2930/3239]	Time 0.584 (0.904)	Data Time 0.001 (0.010)	Loss 3.0630 (3.1035)	Entropy 0.76283 (0.77231)	Top-1 acc 50.391 (49.675)	Top-5 acc 76.953 (73.059)	lr 0.02136
Train [30][2940/3239]	Time 0.625 (0.904)	Data Time 0.001 (0.010)	Loss 2.9581 (3.1033)	Entropy 0.76264 (0.77227)	Top-1 acc 57.031 (49.683)	Top-5 acc 75.781 (73.063)	lr 0.02136
Train [30][2950/3239]	Time 0.695 (0.913)	Data Time 0.005 (0.010)	Loss 2.8613 (3.1033)	Entropy 0.76274 (0.77224)	Top-1 acc 52.734 (49.683)	Top-5 acc 77.344 (73.064)	lr 0.02136
Train [30][2960/3239]	Time 0.570 (0.913)	Data Time 0.002 (0.010)	Loss 2.9872 (3.1034)	Entropy 0.76242 (0.77221)	Top-1 acc 51.953 (49.681)	Top-5 acc 74.609 (73.062)	lr 0.02136
Train [30][2970/3239]	Time 0.739 (0.913)	Data Time 0.002 (0.010)	Loss 3.0047 (3.1034)	Entropy 0.76192 (0.77217)	Top-1 acc 53.125 (49.684)	Top-5 acc 76.172 (73.062)	lr 0.02136
Train [30][2980/3239]	Time 0.599 (0.912)	Data Time 0.001 (0.010)	Loss 3.1237 (3.1034)	Entropy 0.76188 (0.77214)	Top-1 acc 47.656 (49.685)	Top-5 acc 71.875 (73.064)	lr 0.02136
Train [30][2990/3239]	Time 0.589 (0.912)	Data Time 0.001 (0.010)	Loss 3.2061 (3.1035)	Entropy 0.76183 (0.77211)	Top-1 acc 46.094 (49.681)	Top-5 acc 68.750 (73.062)	lr 0.02136
Train [30][3000/3239]	Time 0.628 (0.912)	Data Time 0.001 (0.010)	Loss 3.0460 (3.1036)	Entropy 0.76187 (0.77207)	Top-1 acc 50.781 (49.679)	Top-5 acc 70.703 (73.059)	lr 0.02136
Train [30][3010/3239]	Time 0.575 (0.912)	Data Time 0.001 (0.010)	Loss 2.8002 (3.1034)	Entropy 0.76175 (0.77204)	Top-1 acc 55.859 (49.679)	Top-5 acc 79.688 (73.062)	lr 0.02136
Train [30][3020/3239]	Time 0.615 (0.912)	Data Time 0.001 (0.010)	Loss 2.9600 (3.1035)	Entropy 0.76137 (0.77200)	Top-1 acc 51.953 (49.676)	Top-5 acc 75.000 (73.060)	lr 0.02135
Train [30][3030/3239]	Time 0.607 (0.911)	Data Time 0.001 (0.010)	Loss 2.9622 (3.1034)	Entropy 0.76158 (0.77197)	Top-1 acc 55.078 (49.683)	Top-5 acc 77.344 (73.063)	lr 0.02135
Train [30][3040/3239]	Time 0.704 (0.911)	Data Time 0.001 (0.010)	Loss 2.9972 (3.1033)	Entropy 0.76144 (0.77193)	Top-1 acc 55.469 (49.682)	Top-5 acc 71.094 (73.060)	lr 0.02135
Train [30][3050/3239]	Time 0.593 (0.911)	Data Time 0.001 (0.010)	Loss 3.2965 (3.1033)	Entropy 0.76191 (0.77190)	Top-1 acc 46.875 (49.681)	Top-5 acc 66.016 (73.058)	lr 0.02135
Train [30][3060/3239]	Time 0.606 (0.911)	Data Time 0.002 (0.010)	Loss 3.1687 (3.1032)	Entropy 0.76190 (0.77187)	Top-1 acc 50.391 (49.683)	Top-5 acc 74.219 (73.059)	lr 0.02135
Train [30][3070/3239]	Time 0.613 (0.911)	Data Time 0.002 (0.010)	Loss 3.1360 (3.1033)	Entropy 0.76187 (0.77183)	Top-1 acc 47.656 (49.682)	Top-5 acc 70.312 (73.058)	lr 0.02135
Train [30][3080/3239]	Time 0.578 (0.911)	Data Time 0.001 (0.010)	Loss 3.2767 (3.1034)	Entropy 0.76210 (0.77180)	Top-1 acc 44.531 (49.677)	Top-5 acc 68.359 (73.058)	lr 0.02135
Train [30][3090/3239]	Time 0.600 (0.911)	Data Time 0.001 (0.009)	Loss 3.1210 (3.1035)	Entropy 0.76188 (0.77177)	Top-1 acc 49.609 (49.675)	Top-5 acc 73.828 (73.054)	lr 0.02135
Train [30][3100/3239]	Time 0.607 (0.910)	Data Time 0.001 (0.009)	Loss 3.1107 (3.1036)	Entropy 0.76175 (0.77174)	Top-1 acc 50.000 (49.677)	Top-5 acc 72.266 (73.052)	lr 0.02135
Train [30][3110/3239]	Time 0.595 (0.910)	Data Time 0.001 (0.009)	Loss 3.1893 (3.1036)	Entropy 0.76214 (0.77171)	Top-1 acc 49.609 (49.675)	Top-5 acc 74.219 (73.054)	lr 0.02135
Train [30][3120/3239]	Time 0.618 (0.910)	Data Time 0.001 (0.009)	Loss 3.0269 (3.1035)	Entropy 0.76174 (0.77168)	Top-1 acc 53.906 (49.677)	Top-5 acc 73.828 (73.054)	lr 0.02135
Train [30][3130/3239]	Time 0.691 (0.910)	Data Time 0.001 (0.009)	Loss 2.9837 (3.1036)	Entropy 0.76203 (0.77164)	Top-1 acc 52.734 (49.674)	Top-5 acc 74.609 (73.052)	lr 0.02135
Train [30][3140/3239]	Time 0.628 (0.910)	Data Time 0.001 (0.009)	Loss 3.2646 (3.1038)	Entropy 0.76225 (0.77161)	Top-1 acc 44.531 (49.669)	Top-5 acc 69.531 (73.050)	lr 0.02135
Train [30][3150/3239]	Time 0.564 (0.910)	Data Time 0.001 (0.009)	Loss 2.9455 (3.1037)	Entropy 0.76231 (0.77158)	Top-1 acc 51.172 (49.670)	Top-5 acc 76.172 (73.052)	lr 0.02135
Train [30][3160/3239]	Time 0.614 (0.910)	Data Time 0.001 (0.009)	Loss 3.2297 (3.1039)	Entropy 0.76231 (0.77156)	Top-1 acc 43.359 (49.668)	Top-5 acc 74.609 (73.046)	lr 0.02134
Train [30][3170/3239]	Time 0.591 (0.909)	Data Time 0.001 (0.009)	Loss 2.9150 (3.1038)	Entropy 0.76238 (0.77153)	Top-1 acc 51.953 (49.672)	Top-5 acc 76.172 (73.045)	lr 0.02134
Train [30][3180/3239]	Time 0.566 (0.909)	Data Time 0.000 (0.009)	Loss 3.0560 (3.1038)	Entropy 0.76270 (0.77150)	Top-1 acc 48.438 (49.672)	Top-5 acc 77.344 (73.048)	lr 0.02134
Train [30][3190/3239]	Time 0.558 (0.909)	Data Time 0.000 (0.009)	Loss 3.2146 (3.1039)	Entropy 0.76295 (0.77147)	Top-1 acc 47.266 (49.672)	Top-5 acc 71.875 (73.046)	lr 0.02134
Train [30][3200/3239]	Time 0.672 (0.909)	Data Time 0.000 (0.009)	Loss 3.0259 (3.1040)	Entropy 0.76311 (0.77144)	Top-1 acc 50.000 (49.668)	Top-5 acc 75.391 (73.042)	lr 0.02134
Train [30][3210/3239]	Time 0.592 (0.909)	Data Time 0.000 (0.009)	Loss 3.0835 (3.1041)	Entropy 0.76307 (0.77142)	Top-1 acc 46.484 (49.667)	Top-5 acc 73.828 (73.043)	lr 0.02134
Train [30][3220/3239]	Time 0.600 (0.908)	Data Time 0.000 (0.009)	Loss 3.0058 (3.1041)	Entropy 0.76310 (0.77139)	Top-1 acc 48.438 (49.665)	Top-5 acc 76.562 (73.041)	lr 0.02134
Train [30][3230/3239]	Time 0.618 (0.908)	Data Time 0.000 (0.009)	Loss 3.0544 (3.1040)	Entropy 0.76336 (0.77137)	Top-1 acc 48.828 (49.663)	Top-5 acc 71.875 (73.042)	lr 0.02134
Train [30][3239/3239]	Time 1.579 (0.908)	Data Time 0.000 (0.009)	Loss 3.3979 (3.1042)	Entropy 0.76327 (0.77134)	Top-1 acc 46.914 (49.657)	Top-5 acc 67.901 (73.038)	lr 0.02134
==========Valid [30/120]	loss 1.820	top-1 acc 59.217 (59.217)	top-5 acc 81.297	Train top-1 49.657	top-5 73.038	Entropy 0.76327	Latency-None: 0.000ms	Flops: 539.76M
Train [31][0/3239]	Time 28.784 (28.784)	Data Time 27.029 (27.029)	Loss 3.0437 (3.0437)	Entropy 0.76319 (0.76319)	Top-1 acc 51.172 (51.172)	Top-5 acc 74.219 (74.219)	lr 0.02134
Train [31][10/3239]	Time 0.627 (3.437)	Data Time 0.002 (2.459)	Loss 3.3107 (3.1462)	Entropy 0.76319 (0.76312)	Top-1 acc 43.359 (48.686)	Top-5 acc 69.141 (71.982)	lr 0.02134
Train [31][20/3239]	Time 0.607 (2.217)	Data Time 0.001 (1.289)	Loss 2.9742 (3.0871)	Entropy 0.76311 (0.76314)	Top-1 acc 48.047 (49.851)	Top-5 acc 75.000 (73.400)	lr 0.02134
Train [31][30/3239]	Time 0.774 (1.823)	Data Time 0.001 (0.874)	Loss 3.1029 (3.0884)	Entropy 0.76304 (0.76310)	Top-1 acc 48.438 (49.546)	Top-5 acc 73.438 (73.349)	lr 0.02134
Train [31][40/3239]	Time 0.591 (1.590)	Data Time 0.001 (0.661)	Loss 3.1841 (3.1134)	Entropy 0.76302 (0.76308)	Top-1 acc 51.562 (49.162)	Top-5 acc 69.141 (72.961)	lr 0.02134
Train [31][50/3239]	Time 0.628 (1.450)	Data Time 0.001 (0.532)	Loss 3.1394 (3.0971)	Entropy 0.76314 (0.76308)	Top-1 acc 46.875 (49.494)	Top-5 acc 71.484 (73.353)	lr 0.02134
Train [31][60/3239]	Time 0.595 (1.357)	Data Time 0.001 (0.445)	Loss 3.1391 (3.0928)	Entropy 0.76295 (0.76307)	Top-1 acc 46.094 (49.456)	Top-5 acc 71.484 (73.297)	lr 0.02133
Train [31][70/3239]	Time 0.618 (1.287)	Data Time 0.001 (0.383)	Loss 2.9942 (3.0869)	Entropy 0.76237 (0.76301)	Top-1 acc 51.953 (49.499)	Top-5 acc 74.609 (73.393)	lr 0.02133
Train [31][80/3239]	Time 0.615 (1.233)	Data Time 0.001 (0.336)	Loss 3.1198 (3.0848)	Entropy 0.76223 (0.76293)	Top-1 acc 48.828 (49.658)	Top-5 acc 73.828 (73.481)	lr 0.02133
Train [31][90/3239]	Time 0.615 (1.190)	Data Time 0.001 (0.299)	Loss 3.0358 (3.0839)	Entropy 0.76257 (0.76287)	Top-1 acc 52.344 (49.803)	Top-5 acc 75.391 (73.489)	lr 0.02133
Train [31][100/3239]	Time 0.632 (1.156)	Data Time 0.001 (0.270)	Loss 3.1517 (3.0831)	Entropy 0.76238 (0.76283)	Top-1 acc 48.828 (49.988)	Top-5 acc 71.094 (73.445)	lr 0.02133
Train [31][110/3239]	Time 0.594 (1.130)	Data Time 0.001 (0.245)	Loss 2.9601 (3.0816)	Entropy 0.76227 (0.76279)	Top-1 acc 55.078 (50.081)	Top-5 acc 78.125 (73.466)	lr 0.02133
Train [31][120/3239]	Time 0.608 (1.108)	Data Time 0.001 (0.226)	Loss 2.9392 (3.0797)	Entropy 0.76257 (0.76276)	Top-1 acc 55.078 (50.139)	Top-5 acc 76.562 (73.376)	lr 0.02133
Train [31][130/3239]	Time 0.647 (1.089)	Data Time 0.001 (0.208)	Loss 3.1527 (3.0764)	Entropy 0.76276 (0.76275)	Top-1 acc 51.562 (50.304)	Top-5 acc 70.703 (73.423)	lr 0.02133
Train [31][140/3239]	Time 0.623 (1.072)	Data Time 0.002 (0.194)	Loss 3.0691 (3.0706)	Entropy 0.76221 (0.76275)	Top-1 acc 46.875 (50.443)	Top-5 acc 76.562 (73.537)	lr 0.02133
Train [31][150/3239]	Time 0.603 (1.059)	Data Time 0.001 (0.181)	Loss 3.0913 (3.0660)	Entropy 0.76223 (0.76271)	Top-1 acc 49.609 (50.471)	Top-5 acc 73.047 (73.668)	lr 0.02133
Train [31][160/3239]	Time 0.605 (1.046)	Data Time 0.001 (0.170)	Loss 3.0514 (3.0655)	Entropy 0.76192 (0.76267)	Top-1 acc 50.781 (50.454)	Top-5 acc 73.047 (73.646)	lr 0.02133
Train [31][170/3239]	Time 0.614 (1.036)	Data Time 0.001 (0.160)	Loss 3.1185 (3.0621)	Entropy 0.76181 (0.76263)	Top-1 acc 51.953 (50.583)	Top-5 acc 72.266 (73.689)	lr 0.02133
Train [31][180/3239]	Time 0.625 (1.026)	Data Time 0.001 (0.151)	Loss 3.1646 (3.0620)	Entropy 0.76228 (0.76259)	Top-1 acc 49.219 (50.622)	Top-5 acc 71.875 (73.748)	lr 0.02133
Train [31][190/3239]	Time 0.691 (1.018)	Data Time 0.001 (0.143)	Loss 3.1286 (3.0617)	Entropy 0.76236 (0.76257)	Top-1 acc 49.609 (50.554)	Top-5 acc 73.047 (73.750)	lr 0.02133
Train [31][200/3239]	Time 0.597 (1.011)	Data Time 0.001 (0.136)	Loss 3.1439 (3.0601)	Entropy 0.76167 (0.76255)	Top-1 acc 50.000 (50.577)	Top-5 acc 70.312 (73.783)	lr 0.02132
Train [31][210/3239]	Time 0.611 (1.004)	Data Time 0.001 (0.130)	Loss 3.0674 (3.0587)	Entropy 0.76151 (0.76250)	Top-1 acc 50.781 (50.607)	Top-5 acc 73.047 (73.808)	lr 0.02132
Train [31][220/3239]	Time 0.618 (0.998)	Data Time 0.001 (0.124)	Loss 2.8267 (3.0612)	Entropy 0.76177 (0.76246)	Top-1 acc 53.516 (50.544)	Top-5 acc 76.953 (73.763)	lr 0.02132
Train [31][230/3239]	Time 0.620 (0.991)	Data Time 0.001 (0.119)	Loss 3.1815 (3.0622)	Entropy 0.76174 (0.76243)	Top-1 acc 45.703 (50.516)	Top-5 acc 72.266 (73.764)	lr 0.02132
Train [31][240/3239]	Time 0.584 (0.985)	Data Time 0.001 (0.114)	Loss 3.0798 (3.0613)	Entropy 0.76195 (0.76240)	Top-1 acc 51.172 (50.556)	Top-5 acc 73.438 (73.792)	lr 0.02132
Train [31][250/3239]	Time 0.575 (0.980)	Data Time 0.001 (0.110)	Loss 3.1630 (3.0624)	Entropy 0.76184 (0.76239)	Top-1 acc 47.266 (50.526)	Top-5 acc 71.484 (73.769)	lr 0.02132
Train [31][260/3239]	Time 0.671 (0.975)	Data Time 0.001 (0.105)	Loss 2.9576 (3.0595)	Entropy 0.76183 (0.76237)	Top-1 acc 52.734 (50.557)	Top-5 acc 71.875 (73.812)	lr 0.02132
Train [31][270/3239]	Time 0.594 (0.969)	Data Time 0.001 (0.102)	Loss 3.2230 (3.0627)	Entropy 0.76160 (0.76234)	Top-1 acc 47.266 (50.493)	Top-5 acc 73.047 (73.757)	lr 0.02132
Train [31][280/3239]	Time 0.627 (0.966)	Data Time 0.001 (0.098)	Loss 3.1022 (3.0672)	Entropy 0.76135 (0.76231)	Top-1 acc 49.609 (50.441)	Top-5 acc 73.828 (73.659)	lr 0.02132
Train [31][290/3239]	Time 0.606 (0.962)	Data Time 0.001 (0.095)	Loss 3.0362 (3.0682)	Entropy 0.76136 (0.76227)	Top-1 acc 54.297 (50.396)	Top-5 acc 73.047 (73.638)	lr 0.02132
Train [31][300/3239]	Time 0.596 (0.958)	Data Time 0.001 (0.092)	Loss 3.0308 (3.0706)	Entropy 0.76156 (0.76224)	Top-1 acc 51.953 (50.382)	Top-5 acc 73.828 (73.611)	lr 0.02132
Train [31][310/3239]	Time 0.657 (0.955)	Data Time 0.003 (0.089)	Loss 2.9644 (3.0694)	Entropy 0.76162 (0.76222)	Top-1 acc 50.781 (50.394)	Top-5 acc 75.781 (73.650)	lr 0.02132
Train [31][320/3239]	Time 0.633 (0.953)	Data Time 0.001 (0.086)	Loss 3.2847 (3.0723)	Entropy 0.76168 (0.76220)	Top-1 acc 47.656 (50.366)	Top-5 acc 71.094 (73.590)	lr 0.02132
Train [31][330/3239]	Time 0.589 (0.950)	Data Time 0.001 (0.084)	Loss 3.0579 (3.0709)	Entropy 0.76152 (0.76219)	Top-1 acc 49.609 (50.378)	Top-5 acc 71.875 (73.629)	lr 0.02132
Train [31][340/3239]	Time 0.624 (0.948)	Data Time 0.001 (0.081)	Loss 3.0109 (3.0697)	Entropy 0.76161 (0.76217)	Top-1 acc 48.438 (50.387)	Top-5 acc 76.172 (73.633)	lr 0.02131
Train [31][350/3239]	Time 0.687 (0.946)	Data Time 0.001 (0.079)	Loss 3.0377 (3.0701)	Entropy 0.76133 (0.76215)	Top-1 acc 52.734 (50.361)	Top-5 acc 73.828 (73.611)	lr 0.02131
Train [31][360/3239]	Time 0.596 (0.943)	Data Time 0.001 (0.077)	Loss 3.0668 (3.0725)	Entropy 0.76102 (0.76212)	Top-1 acc 53.906 (50.322)	Top-5 acc 71.094 (73.561)	lr 0.02131
Train [31][370/3239]	Time 0.605 (1.009)	Data Time 0.002 (0.075)	Loss 3.2661 (3.0738)	Entropy 0.76066 (0.76209)	Top-1 acc 45.312 (50.284)	Top-5 acc 70.312 (73.543)	lr 0.02131
Train [31][380/3239]	Time 0.576 (1.005)	Data Time 0.001 (0.073)	Loss 3.3317 (3.0752)	Entropy 0.76065 (0.76205)	Top-1 acc 46.875 (50.251)	Top-5 acc 67.578 (73.500)	lr 0.02131
Train [31][390/3239]	Time 0.620 (1.001)	Data Time 0.001 (0.071)	Loss 2.8970 (3.0756)	Entropy 0.76067 (0.76201)	Top-1 acc 55.469 (50.204)	Top-5 acc 75.781 (73.500)	lr 0.02131
Train [31][400/3239]	Time 0.600 (0.998)	Data Time 0.001 (0.069)	Loss 2.8891 (3.0741)	Entropy 0.76069 (0.76198)	Top-1 acc 54.297 (50.228)	Top-5 acc 75.391 (73.544)	lr 0.02131
Train [31][410/3239]	Time 0.608 (0.995)	Data Time 0.001 (0.068)	Loss 2.9757 (3.0738)	Entropy 0.76115 (0.76195)	Top-1 acc 50.781 (50.230)	Top-5 acc 76.172 (73.539)	lr 0.02131
Train [31][420/3239]	Time 0.693 (0.991)	Data Time 0.001 (0.066)	Loss 3.1122 (3.0744)	Entropy 0.76032 (0.76192)	Top-1 acc 44.531 (50.220)	Top-5 acc 72.266 (73.526)	lr 0.02131
Train [31][430/3239]	Time 0.587 (0.988)	Data Time 0.001 (0.065)	Loss 2.9483 (3.0758)	Entropy 0.75999 (0.76188)	Top-1 acc 54.297 (50.187)	Top-5 acc 76.172 (73.505)	lr 0.02131
Train [31][440/3239]	Time 0.619 (0.986)	Data Time 0.001 (0.063)	Loss 3.2392 (3.0771)	Entropy 0.75978 (0.76184)	Top-1 acc 44.922 (50.163)	Top-5 acc 65.625 (73.461)	lr 0.02131
Train [31][450/3239]	Time 0.573 (0.983)	Data Time 0.001 (0.062)	Loss 3.3549 (3.0772)	Entropy 0.75945 (0.76179)	Top-1 acc 45.703 (50.160)	Top-5 acc 68.359 (73.469)	lr 0.02131
Train [31][460/3239]	Time 0.584 (0.980)	Data Time 0.001 (0.061)	Loss 3.1095 (3.0777)	Entropy 0.75953 (0.76174)	Top-1 acc 50.391 (50.152)	Top-5 acc 69.922 (73.459)	lr 0.02131
Train [31][470/3239]	Time 0.640 (0.978)	Data Time 0.001 (0.059)	Loss 3.2814 (3.0784)	Entropy 0.75950 (0.76169)	Top-1 acc 46.484 (50.123)	Top-5 acc 69.531 (73.456)	lr 0.02131
Train [31][480/3239]	Time 0.644 (0.975)	Data Time 0.001 (0.058)	Loss 3.2619 (3.0793)	Entropy 0.75989 (0.76165)	Top-1 acc 46.484 (50.097)	Top-5 acc 68.750 (73.452)	lr 0.02130
Train [31][490/3239]	Time 0.583 (0.973)	Data Time 0.001 (0.057)	Loss 2.9890 (3.0795)	Entropy 0.75949 (0.76161)	Top-1 acc 49.219 (50.106)	Top-5 acc 76.953 (73.474)	lr 0.02130
Train [31][500/3239]	Time 0.593 (0.971)	Data Time 0.001 (0.056)	Loss 2.8474 (3.0789)	Entropy 0.75936 (0.76156)	Top-1 acc 58.594 (50.133)	Top-5 acc 79.688 (73.491)	lr 0.02130
Train [31][510/3239]	Time 0.707 (0.970)	Data Time 0.001 (0.055)	Loss 3.0603 (3.0779)	Entropy 0.75938 (0.76152)	Top-1 acc 52.734 (50.166)	Top-5 acc 75.781 (73.502)	lr 0.02130
Train [31][520/3239]	Time 0.606 (0.968)	Data Time 0.001 (0.054)	Loss 3.0318 (3.0783)	Entropy 0.75956 (0.76148)	Top-1 acc 52.344 (50.150)	Top-5 acc 73.047 (73.496)	lr 0.02130
Train [31][530/3239]	Time 0.633 (0.965)	Data Time 0.002 (0.053)	Loss 2.9878 (3.0767)	Entropy 0.75929 (0.76144)	Top-1 acc 52.344 (50.209)	Top-5 acc 74.219 (73.521)	lr 0.02130
Train [31][540/3239]	Time 0.470 (0.963)	Data Time 0.001 (0.052)	Loss 3.1527 (3.0775)	Entropy 0.75915 (0.76140)	Top-1 acc 49.609 (50.173)	Top-5 acc 71.094 (73.502)	lr 0.02130
Train [31][550/3239]	Time 0.610 (0.961)	Data Time 0.001 (0.051)	Loss 3.0294 (3.0770)	Entropy 0.75936 (0.76136)	Top-1 acc 53.906 (50.192)	Top-5 acc 71.875 (73.510)	lr 0.02130
Train [31][560/3239]	Time 0.607 (0.959)	Data Time 0.001 (0.050)	Loss 3.0151 (3.0766)	Entropy 0.75869 (0.76132)	Top-1 acc 53.516 (50.205)	Top-5 acc 76.172 (73.523)	lr 0.02130
Train [31][570/3239]	Time 0.645 (0.957)	Data Time 0.001 (0.049)	Loss 3.1534 (3.0752)	Entropy 0.75845 (0.76127)	Top-1 acc 48.828 (50.233)	Top-5 acc 72.656 (73.556)	lr 0.02130
Train [31][580/3239]	Time 0.717 (0.956)	Data Time 0.001 (0.049)	Loss 2.9892 (3.0752)	Entropy 0.75854 (0.76122)	Top-1 acc 50.781 (50.235)	Top-5 acc 72.656 (73.560)	lr 0.02130
Train [31][590/3239]	Time 0.593 (0.954)	Data Time 0.001 (0.048)	Loss 2.9315 (3.0755)	Entropy 0.75850 (0.76118)	Top-1 acc 51.172 (50.221)	Top-5 acc 75.000 (73.551)	lr 0.02130
Train [31][600/3239]	Time 0.636 (0.953)	Data Time 0.001 (0.047)	Loss 2.9493 (3.0764)	Entropy 0.75815 (0.76113)	Top-1 acc 49.219 (50.207)	Top-5 acc 79.688 (73.551)	lr 0.02130
Train [31][610/3239]	Time 0.592 (0.952)	Data Time 0.001 (0.046)	Loss 2.8754 (3.0762)	Entropy 0.75813 (0.76108)	Top-1 acc 52.734 (50.218)	Top-5 acc 76.953 (73.562)	lr 0.02130
Train [31][620/3239]	Time 0.614 (0.950)	Data Time 0.002 (0.046)	Loss 3.2928 (3.0771)	Entropy 0.75818 (0.76104)	Top-1 acc 44.141 (50.192)	Top-5 acc 69.922 (73.551)	lr 0.02129
Train [31][630/3239]	Time 0.627 (0.949)	Data Time 0.001 (0.045)	Loss 3.0450 (3.0768)	Entropy 0.75785 (0.76099)	Top-1 acc 48.828 (50.188)	Top-5 acc 72.656 (73.551)	lr 0.02129
Train [31][640/3239]	Time 0.616 (0.948)	Data Time 0.001 (0.044)	Loss 2.9723 (3.0771)	Entropy 0.75786 (0.76094)	Top-1 acc 53.906 (50.182)	Top-5 acc 75.781 (73.547)	lr 0.02129
Train [31][650/3239]	Time 0.620 (0.947)	Data Time 0.001 (0.043)	Loss 2.9433 (3.0767)	Entropy 0.75779 (0.76089)	Top-1 acc 53.906 (50.183)	Top-5 acc 76.172 (73.540)	lr 0.02129
Train [31][660/3239]	Time 0.619 (0.945)	Data Time 0.001 (0.043)	Loss 3.2465 (3.0766)	Entropy 0.75782 (0.76085)	Top-1 acc 46.875 (50.189)	Top-5 acc 71.094 (73.539)	lr 0.02129
Train [31][670/3239]	Time 0.642 (0.944)	Data Time 0.001 (0.042)	Loss 2.7903 (3.0765)	Entropy 0.75719 (0.76080)	Top-1 acc 58.984 (50.214)	Top-5 acc 78.125 (73.543)	lr 0.02129
Train [31][680/3239]	Time 0.590 (0.943)	Data Time 0.001 (0.042)	Loss 2.9576 (3.0774)	Entropy 0.75689 (0.76074)	Top-1 acc 51.953 (50.189)	Top-5 acc 76.172 (73.529)	lr 0.02129
Train [31][690/3239]	Time 0.609 (0.942)	Data Time 0.001 (0.041)	Loss 2.9513 (3.0767)	Entropy 0.75710 (0.76069)	Top-1 acc 50.781 (50.202)	Top-5 acc 75.781 (73.534)	lr 0.02129
Train [31][700/3239]	Time 0.594 (0.940)	Data Time 0.001 (0.041)	Loss 3.3806 (3.0772)	Entropy 0.75712 (0.76064)	Top-1 acc 43.359 (50.203)	Top-5 acc 68.750 (73.533)	lr 0.02129
Train [31][710/3239]	Time 0.603 (0.939)	Data Time 0.001 (0.040)	Loss 3.3855 (3.0783)	Entropy 0.75738 (0.76059)	Top-1 acc 44.531 (50.179)	Top-5 acc 66.016 (73.508)	lr 0.02129
Train [31][720/3239]	Time 0.579 (0.938)	Data Time 0.001 (0.039)	Loss 3.0462 (3.0787)	Entropy 0.75743 (0.76054)	Top-1 acc 51.562 (50.180)	Top-5 acc 74.609 (73.511)	lr 0.02129
Train [31][730/3239]	Time 0.590 (0.937)	Data Time 0.001 (0.039)	Loss 2.9826 (3.0785)	Entropy 0.75749 (0.76050)	Top-1 acc 49.609 (50.185)	Top-5 acc 77.344 (73.528)	lr 0.02129
Train [31][740/3239]	Time 0.708 (0.936)	Data Time 0.001 (0.038)	Loss 3.0863 (3.0795)	Entropy 0.75726 (0.76046)	Top-1 acc 48.438 (50.164)	Top-5 acc 71.484 (73.504)	lr 0.02129
Train [31][750/3239]	Time 0.589 (0.935)	Data Time 0.001 (0.038)	Loss 3.1628 (3.0801)	Entropy 0.75747 (0.76042)	Top-1 acc 47.656 (50.164)	Top-5 acc 69.922 (73.479)	lr 0.02129
Train [31][760/3239]	Time 0.619 (0.934)	Data Time 0.001 (0.037)	Loss 2.9936 (3.0797)	Entropy 0.75727 (0.76038)	Top-1 acc 53.516 (50.183)	Top-5 acc 75.391 (73.474)	lr 0.02128
Train [31][770/3239]	Time 0.621 (0.933)	Data Time 0.001 (0.037)	Loss 3.0389 (3.0802)	Entropy 0.75696 (0.76034)	Top-1 acc 50.391 (50.189)	Top-5 acc 74.609 (73.464)	lr 0.02128
Train [31][780/3239]	Time 0.627 (0.932)	Data Time 0.001 (0.037)	Loss 2.9855 (3.0806)	Entropy 0.75739 (0.76029)	Top-1 acc 51.562 (50.186)	Top-5 acc 76.953 (73.455)	lr 0.02128
Train [31][790/3239]	Time 0.576 (0.932)	Data Time 0.001 (0.036)	Loss 3.2289 (3.0812)	Entropy 0.75744 (0.76026)	Top-1 acc 48.047 (50.179)	Top-5 acc 72.266 (73.439)	lr 0.02128
Train [31][800/3239]	Time 0.643 (0.931)	Data Time 0.001 (0.036)	Loss 3.0286 (3.0809)	Entropy 0.75657 (0.76022)	Top-1 acc 50.781 (50.187)	Top-5 acc 74.609 (73.449)	lr 0.02128
Train [31][810/3239]	Time 0.681 (0.930)	Data Time 0.001 (0.035)	Loss 3.1418 (3.0812)	Entropy 0.75641 (0.76017)	Top-1 acc 46.094 (50.181)	Top-5 acc 74.219 (73.445)	lr 0.02128
Train [31][820/3239]	Time 0.597 (0.929)	Data Time 0.001 (0.035)	Loss 2.9974 (3.0800)	Entropy 0.75662 (0.76013)	Top-1 acc 50.781 (50.213)	Top-5 acc 74.219 (73.466)	lr 0.02128
Train [31][830/3239]	Time 0.616 (0.928)	Data Time 0.002 (0.034)	Loss 2.9521 (3.0795)	Entropy 0.75676 (0.76009)	Top-1 acc 54.297 (50.222)	Top-5 acc 76.562 (73.480)	lr 0.02128
Train [31][840/3239]	Time 0.609 (0.928)	Data Time 0.001 (0.034)	Loss 3.2278 (3.0795)	Entropy 0.75656 (0.76005)	Top-1 acc 44.141 (50.209)	Top-5 acc 69.922 (73.475)	lr 0.02128
Train [31][850/3239]	Time 0.595 (0.927)	Data Time 0.001 (0.034)	Loss 3.0253 (3.0799)	Entropy 0.75644 (0.76000)	Top-1 acc 48.828 (50.201)	Top-5 acc 76.172 (73.476)	lr 0.02128
Train [31][860/3239]	Time 0.584 (0.926)	Data Time 0.001 (0.033)	Loss 3.0153 (3.0796)	Entropy 0.75603 (0.75996)	Top-1 acc 49.609 (50.201)	Top-5 acc 73.828 (73.489)	lr 0.02128
Train [31][870/3239]	Time 0.655 (0.925)	Data Time 0.001 (0.033)	Loss 2.8908 (3.0788)	Entropy 0.75595 (0.75992)	Top-1 acc 57.031 (50.222)	Top-5 acc 74.609 (73.496)	lr 0.02128
Train [31][880/3239]	Time 0.652 (0.924)	Data Time 0.001 (0.033)	Loss 3.1094 (3.0784)	Entropy 0.75614 (0.75987)	Top-1 acc 46.094 (50.235)	Top-5 acc 70.703 (73.503)	lr 0.02128
Train [31][890/3239]	Time 0.639 (0.923)	Data Time 0.001 (0.032)	Loss 3.0759 (3.0783)	Entropy 0.75586 (0.75983)	Top-1 acc 50.781 (50.237)	Top-5 acc 72.656 (73.507)	lr 0.02128
Train [31][900/3239]	Time 0.711 (0.923)	Data Time 0.001 (0.032)	Loss 3.1401 (3.0787)	Entropy 0.75631 (0.75979)	Top-1 acc 48.438 (50.227)	Top-5 acc 74.219 (73.504)	lr 0.02127
Train [31][910/3239]	Time 0.585 (0.922)	Data Time 0.001 (0.032)	Loss 3.1500 (3.0791)	Entropy 0.75646 (0.75975)	Top-1 acc 47.266 (50.219)	Top-5 acc 73.438 (73.504)	lr 0.02127
Train [31][920/3239]	Time 0.630 (0.922)	Data Time 0.001 (0.031)	Loss 3.1012 (3.0799)	Entropy 0.75613 (0.75971)	Top-1 acc 44.922 (50.187)	Top-5 acc 73.438 (73.483)	lr 0.02127
Train [31][930/3239]	Time 0.619 (0.921)	Data Time 0.001 (0.031)	Loss 2.9709 (3.0799)	Entropy 0.75603 (0.75967)	Top-1 acc 51.172 (50.181)	Top-5 acc 77.344 (73.485)	lr 0.02127
Train [31][940/3239]	Time 0.594 (0.921)	Data Time 0.001 (0.031)	Loss 3.0799 (3.0798)	Entropy 0.75621 (0.75963)	Top-1 acc 50.391 (50.190)	Top-5 acc 71.484 (73.488)	lr 0.02127
Train [31][950/3239]	Time 0.603 (0.920)	Data Time 0.001 (0.030)	Loss 2.9514 (3.0795)	Entropy 0.75665 (0.75960)	Top-1 acc 51.953 (50.209)	Top-5 acc 78.906 (73.500)	lr 0.02127
Train [31][960/3239]	Time 0.597 (0.919)	Data Time 0.001 (0.030)	Loss 3.2263 (3.0799)	Entropy 0.75651 (0.75957)	Top-1 acc 48.047 (50.200)	Top-5 acc 68.359 (73.489)	lr 0.02127
Train [31][970/3239]	Time 0.683 (0.919)	Data Time 0.001 (0.030)	Loss 2.9763 (3.0808)	Entropy 0.75668 (0.75954)	Top-1 acc 54.297 (50.190)	Top-5 acc 76.562 (73.470)	lr 0.02127
Train [31][980/3239]	Time 0.610 (0.918)	Data Time 0.001 (0.029)	Loss 2.9050 (3.0805)	Entropy 0.75628 (0.75951)	Top-1 acc 54.688 (50.199)	Top-5 acc 74.609 (73.480)	lr 0.02127
Train [31][990/3239]	Time 0.623 (0.918)	Data Time 0.001 (0.029)	Loss 2.9654 (3.0801)	Entropy 0.75633 (0.75947)	Top-1 acc 54.297 (50.195)	Top-5 acc 78.125 (73.490)	lr 0.02127
Train [31][1000/3239]	Time 0.638 (0.917)	Data Time 0.001 (0.029)	Loss 3.0558 (3.0803)	Entropy 0.75584 (0.75944)	Top-1 acc 50.781 (50.197)	Top-5 acc 74.219 (73.484)	lr 0.02127
Train [31][1010/3239]	Time 0.616 (0.917)	Data Time 0.001 (0.029)	Loss 2.9514 (3.0798)	Entropy 0.75562 (0.75940)	Top-1 acc 54.688 (50.214)	Top-5 acc 75.391 (73.496)	lr 0.02127
Train [31][1020/3239]	Time 0.682 (0.941)	Data Time 0.006 (0.028)	Loss 3.0503 (3.0802)	Entropy 0.75540 (0.75937)	Top-1 acc 54.297 (50.215)	Top-5 acc 73.438 (73.485)	lr 0.02127
Train [31][1030/3239]	Time 0.624 (0.941)	Data Time 0.002 (0.028)	Loss 3.0094 (3.0798)	Entropy 0.75528 (0.75933)	Top-1 acc 53.125 (50.224)	Top-5 acc 74.219 (73.497)	lr 0.02126
Train [31][1040/3239]	Time 0.670 (0.940)	Data Time 0.002 (0.028)	Loss 3.1608 (3.0796)	Entropy 0.75535 (0.75929)	Top-1 acc 53.125 (50.230)	Top-5 acc 72.266 (73.503)	lr 0.02126
Train [31][1050/3239]	Time 0.615 (0.939)	Data Time 0.001 (0.028)	Loss 3.2113 (3.0806)	Entropy 0.75527 (0.75925)	Top-1 acc 48.438 (50.209)	Top-5 acc 69.531 (73.487)	lr 0.02126
Train [31][1060/3239]	Time 0.720 (0.939)	Data Time 0.001 (0.027)	Loss 3.2127 (3.0800)	Entropy 0.75528 (0.75921)	Top-1 acc 48.438 (50.222)	Top-5 acc 70.703 (73.485)	lr 0.02126
Train [31][1070/3239]	Time 0.615 (0.938)	Data Time 0.001 (0.027)	Loss 3.1057 (3.0799)	Entropy 0.75479 (0.75917)	Top-1 acc 47.266 (50.218)	Top-5 acc 72.656 (73.485)	lr 0.02126
Train [31][1080/3239]	Time 0.606 (0.938)	Data Time 0.001 (0.027)	Loss 3.0142 (3.0800)	Entropy 0.75519 (0.75913)	Top-1 acc 51.953 (50.222)	Top-5 acc 75.781 (73.477)	lr 0.02126
Train [31][1090/3239]	Time 0.624 (0.937)	Data Time 0.001 (0.027)	Loss 2.9895 (3.0803)	Entropy 0.75501 (0.75910)	Top-1 acc 47.266 (50.222)	Top-5 acc 76.562 (73.464)	lr 0.02126
Train [31][1100/3239]	Time 0.566 (0.937)	Data Time 0.001 (0.026)	Loss 3.2985 (3.0797)	Entropy 0.75500 (0.75906)	Top-1 acc 46.875 (50.239)	Top-5 acc 70.703 (73.476)	lr 0.02126
Train [31][1110/3239]	Time 0.571 (0.936)	Data Time 0.001 (0.026)	Loss 3.2017 (3.0802)	Entropy 0.75472 (0.75902)	Top-1 acc 48.828 (50.231)	Top-5 acc 72.266 (73.463)	lr 0.02126
Train [31][1120/3239]	Time 0.639 (0.935)	Data Time 0.002 (0.026)	Loss 2.9664 (3.0800)	Entropy 0.75492 (0.75899)	Top-1 acc 53.516 (50.238)	Top-5 acc 77.344 (73.469)	lr 0.02126
Train [31][1130/3239]	Time 0.727 (0.935)	Data Time 0.001 (0.026)	Loss 3.1109 (3.0801)	Entropy 0.75505 (0.75895)	Top-1 acc 49.609 (50.231)	Top-5 acc 70.703 (73.462)	lr 0.02126
Train [31][1140/3239]	Time 0.580 (0.934)	Data Time 0.002 (0.026)	Loss 3.0240 (3.0801)	Entropy 0.75493 (0.75891)	Top-1 acc 48.438 (50.225)	Top-5 acc 72.266 (73.459)	lr 0.02126
Train [31][1150/3239]	Time 0.594 (0.933)	Data Time 0.001 (0.025)	Loss 3.0024 (3.0803)	Entropy 0.75514 (0.75888)	Top-1 acc 50.781 (50.213)	Top-5 acc 77.344 (73.455)	lr 0.02126
Train [31][1160/3239]	Time 0.626 (0.933)	Data Time 0.001 (0.025)	Loss 3.1613 (3.0802)	Entropy 0.75504 (0.75885)	Top-1 acc 41.406 (50.210)	Top-5 acc 73.828 (73.456)	lr 0.02126
Train [31][1170/3239]	Time 0.636 (0.932)	Data Time 0.001 (0.025)	Loss 2.8776 (3.0796)	Entropy 0.75504 (0.75882)	Top-1 acc 51.562 (50.222)	Top-5 acc 77.734 (73.469)	lr 0.02125
Train [31][1180/3239]	Time 0.570 (0.932)	Data Time 0.001 (0.025)	Loss 3.1741 (3.0795)	Entropy 0.75480 (0.75878)	Top-1 acc 45.703 (50.226)	Top-5 acc 70.703 (73.465)	lr 0.02125
Train [31][1190/3239]	Time 0.598 (0.931)	Data Time 0.001 (0.025)	Loss 3.0624 (3.0790)	Entropy 0.75481 (0.75875)	Top-1 acc 50.391 (50.237)	Top-5 acc 74.219 (73.475)	lr 0.02125
Train [31][1200/3239]	Time 0.644 (0.931)	Data Time 0.001 (0.024)	Loss 2.8436 (3.0792)	Entropy 0.75436 (0.75872)	Top-1 acc 58.594 (50.233)	Top-5 acc 77.344 (73.469)	lr 0.02125
Train [31][1210/3239]	Time 0.577 (0.931)	Data Time 0.001 (0.024)	Loss 3.0695 (3.0790)	Entropy 0.75408 (0.75868)	Top-1 acc 50.391 (50.238)	Top-5 acc 72.266 (73.471)	lr 0.02125
Train [31][1220/3239]	Time 0.724 (0.930)	Data Time 0.001 (0.024)	Loss 3.0261 (3.0795)	Entropy 0.75394 (0.75864)	Top-1 acc 49.219 (50.236)	Top-5 acc 76.562 (73.469)	lr 0.02125
Train [31][1230/3239]	Time 0.603 (0.930)	Data Time 0.001 (0.024)	Loss 3.0934 (3.0797)	Entropy 0.75411 (0.75860)	Top-1 acc 52.344 (50.228)	Top-5 acc 70.312 (73.466)	lr 0.02125
Train [31][1240/3239]	Time 0.605 (0.929)	Data Time 0.001 (0.024)	Loss 3.1616 (3.0789)	Entropy 0.75406 (0.75857)	Top-1 acc 46.094 (50.240)	Top-5 acc 71.484 (73.482)	lr 0.02125
Train [31][1250/3239]	Time 0.604 (0.929)	Data Time 0.001 (0.024)	Loss 2.9807 (3.0786)	Entropy 0.75420 (0.75853)	Top-1 acc 52.344 (50.242)	Top-5 acc 74.609 (73.488)	lr 0.02125
Train [31][1260/3239]	Time 0.615 (0.928)	Data Time 0.001 (0.023)	Loss 3.0896 (3.0781)	Entropy 0.75467 (0.75850)	Top-1 acc 50.000 (50.258)	Top-5 acc 69.922 (73.490)	lr 0.02125
Train [31][1270/3239]	Time 0.609 (0.928)	Data Time 0.001 (0.023)	Loss 2.9910 (3.0779)	Entropy 0.75449 (0.75847)	Top-1 acc 52.734 (50.269)	Top-5 acc 75.391 (73.493)	lr 0.02125
Train [31][1280/3239]	Time 0.634 (0.927)	Data Time 0.001 (0.023)	Loss 3.0787 (3.0780)	Entropy 0.75431 (0.75844)	Top-1 acc 47.266 (50.254)	Top-5 acc 73.047 (73.492)	lr 0.02125
Train [31][1290/3239]	Time 0.711 (0.927)	Data Time 0.001 (0.023)	Loss 3.0699 (3.0778)	Entropy 0.75445 (0.75840)	Top-1 acc 51.172 (50.255)	Top-5 acc 71.094 (73.489)	lr 0.02125
Train [31][1300/3239]	Time 0.563 (0.926)	Data Time 0.001 (0.023)	Loss 3.2613 (3.0784)	Entropy 0.75459 (0.75837)	Top-1 acc 49.219 (50.247)	Top-5 acc 71.094 (73.486)	lr 0.02125
Train [31][1310/3239]	Time 0.604 (0.925)	Data Time 0.001 (0.023)	Loss 3.0784 (3.0782)	Entropy 0.75470 (0.75835)	Top-1 acc 48.828 (50.249)	Top-5 acc 73.047 (73.491)	lr 0.02124
Train [31][1320/3239]	Time 0.595 (0.925)	Data Time 0.001 (0.022)	Loss 2.8386 (3.0779)	Entropy 0.75449 (0.75832)	Top-1 acc 58.984 (50.263)	Top-5 acc 77.344 (73.503)	lr 0.02124
Train [31][1330/3239]	Time 0.616 (0.925)	Data Time 0.002 (0.022)	Loss 3.0378 (3.0780)	Entropy 0.75442 (0.75829)	Top-1 acc 53.906 (50.265)	Top-5 acc 72.266 (73.501)	lr 0.02124
Train [31][1340/3239]	Time 0.601 (0.924)	Data Time 0.001 (0.022)	Loss 3.0676 (3.0774)	Entropy 0.75427 (0.75826)	Top-1 acc 50.781 (50.280)	Top-5 acc 74.609 (73.512)	lr 0.02124
Train [31][1350/3239]	Time 0.632 (0.924)	Data Time 0.001 (0.022)	Loss 3.3326 (3.0775)	Entropy 0.75399 (0.75823)	Top-1 acc 44.531 (50.278)	Top-5 acc 67.969 (73.515)	lr 0.02124
Train [31][1360/3239]	Time 0.610 (0.923)	Data Time 0.001 (0.022)	Loss 2.9268 (3.0777)	Entropy 0.75383 (0.75820)	Top-1 acc 57.422 (50.273)	Top-5 acc 77.344 (73.512)	lr 0.02124
Train [31][1370/3239]	Time 0.627 (0.923)	Data Time 0.001 (0.022)	Loss 3.1585 (3.0778)	Entropy 0.75349 (0.75817)	Top-1 acc 48.828 (50.268)	Top-5 acc 68.750 (73.506)	lr 0.02124
Train [31][1380/3239]	Time 0.637 (0.923)	Data Time 0.002 (0.022)	Loss 3.0225 (3.0777)	Entropy 0.75361 (0.75813)	Top-1 acc 52.734 (50.268)	Top-5 acc 74.609 (73.508)	lr 0.02124
Train [31][1390/3239]	Time 0.603 (0.922)	Data Time 0.001 (0.021)	Loss 3.2680 (3.0777)	Entropy 0.75359 (0.75810)	Top-1 acc 41.016 (50.265)	Top-5 acc 67.578 (73.505)	lr 0.02124
Train [31][1400/3239]	Time 0.634 (0.922)	Data Time 0.001 (0.021)	Loss 3.0474 (3.0776)	Entropy 0.75361 (0.75807)	Top-1 acc 50.781 (50.265)	Top-5 acc 74.609 (73.513)	lr 0.02124
Train [31][1410/3239]	Time 0.616 (0.922)	Data Time 0.001 (0.021)	Loss 3.1282 (3.0775)	Entropy 0.75390 (0.75804)	Top-1 acc 48.828 (50.264)	Top-5 acc 71.484 (73.513)	lr 0.02124
Train [31][1420/3239]	Time 0.618 (0.921)	Data Time 0.001 (0.021)	Loss 3.1256 (3.0778)	Entropy 0.75406 (0.75801)	Top-1 acc 49.609 (50.254)	Top-5 acc 73.438 (73.506)	lr 0.02124
Train [31][1430/3239]	Time 0.632 (0.921)	Data Time 0.001 (0.021)	Loss 3.2737 (3.0779)	Entropy 0.75413 (0.75798)	Top-1 acc 48.438 (50.254)	Top-5 acc 69.531 (73.502)	lr 0.02124
Train [31][1440/3239]	Time 0.650 (0.921)	Data Time 0.001 (0.021)	Loss 3.1169 (3.0777)	Entropy 0.75411 (0.75795)	Top-1 acc 51.562 (50.260)	Top-5 acc 73.828 (73.506)	lr 0.02124
Train [31][1450/3239]	Time 0.730 (0.920)	Data Time 0.001 (0.021)	Loss 2.9786 (3.0778)	Entropy 0.75374 (0.75793)	Top-1 acc 55.078 (50.258)	Top-5 acc 72.656 (73.505)	lr 0.02123
Train [31][1460/3239]	Time 0.605 (0.919)	Data Time 0.001 (0.020)	Loss 2.8775 (3.0777)	Entropy 0.75366 (0.75790)	Top-1 acc 56.641 (50.271)	Top-5 acc 78.516 (73.505)	lr 0.02123
Train [31][1470/3239]	Time 0.457 (0.919)	Data Time 0.002 (0.020)	Loss 3.2143 (3.0781)	Entropy 0.75293 (0.75787)	Top-1 acc 48.828 (50.261)	Top-5 acc 71.484 (73.494)	lr 0.02123
Train [31][1480/3239]	Time 0.582 (0.919)	Data Time 0.003 (0.020)	Loss 3.1659 (3.0788)	Entropy 0.75318 (0.75783)	Top-1 acc 48.047 (50.245)	Top-5 acc 73.828 (73.488)	lr 0.02123
Train [31][1490/3239]	Time 0.631 (0.918)	Data Time 0.001 (0.020)	Loss 2.9698 (3.0788)	Entropy 0.75339 (0.75780)	Top-1 acc 55.078 (50.251)	Top-5 acc 76.562 (73.484)	lr 0.02123
Train [31][1500/3239]	Time 0.599 (0.918)	Data Time 0.001 (0.020)	Loss 3.3439 (3.0788)	Entropy 0.75356 (0.75777)	Top-1 acc 40.625 (50.238)	Top-5 acc 66.016 (73.481)	lr 0.02123
Train [31][1510/3239]	Time 0.581 (0.918)	Data Time 0.001 (0.020)	Loss 3.0628 (3.0791)	Entropy 0.75368 (0.75775)	Top-1 acc 53.906 (50.235)	Top-5 acc 75.781 (73.480)	lr 0.02123
Train [31][1520/3239]	Time 0.693 (0.917)	Data Time 0.001 (0.020)	Loss 2.9557 (3.0792)	Entropy 0.75387 (0.75772)	Top-1 acc 50.781 (50.234)	Top-5 acc 76.953 (73.481)	lr 0.02123
Train [31][1530/3239]	Time 0.612 (0.917)	Data Time 0.001 (0.020)	Loss 3.2991 (3.0794)	Entropy 0.75420 (0.75770)	Top-1 acc 44.922 (50.231)	Top-5 acc 71.484 (73.477)	lr 0.02123
Train [31][1540/3239]	Time 0.611 (0.917)	Data Time 0.001 (0.019)	Loss 2.9450 (3.0793)	Entropy 0.75409 (0.75767)	Top-1 acc 50.000 (50.222)	Top-5 acc 76.172 (73.479)	lr 0.02123
Train [31][1550/3239]	Time 0.606 (0.916)	Data Time 0.001 (0.019)	Loss 3.0525 (3.0791)	Entropy 0.75359 (0.75765)	Top-1 acc 51.953 (50.224)	Top-5 acc 75.000 (73.484)	lr 0.02123
Train [31][1560/3239]	Time 0.561 (0.916)	Data Time 0.001 (0.019)	Loss 3.4383 (3.0792)	Entropy 0.75343 (0.75762)	Top-1 acc 41.797 (50.219)	Top-5 acc 65.625 (73.485)	lr 0.02123
Train [31][1570/3239]	Time 0.607 (0.916)	Data Time 0.001 (0.019)	Loss 2.9629 (3.0792)	Entropy 0.75361 (0.75760)	Top-1 acc 51.172 (50.221)	Top-5 acc 76.172 (73.489)	lr 0.02123
Train [31][1580/3239]	Time 0.618 (0.915)	Data Time 0.001 (0.019)	Loss 3.3670 (3.0792)	Entropy 0.75385 (0.75757)	Top-1 acc 46.875 (50.222)	Top-5 acc 68.359 (73.489)	lr 0.02123
Train [31][1590/3239]	Time 0.628 (0.915)	Data Time 0.001 (0.019)	Loss 3.0626 (3.0793)	Entropy 0.75417 (0.75755)	Top-1 acc 50.781 (50.215)	Top-5 acc 71.875 (73.489)	lr 0.02122
Train [31][1600/3239]	Time 0.631 (0.915)	Data Time 0.001 (0.019)	Loss 3.0938 (3.0801)	Entropy 0.75374 (0.75753)	Top-1 acc 46.484 (50.195)	Top-5 acc 74.609 (73.473)	lr 0.02122
Train [31][1610/3239]	Time 0.599 (0.914)	Data Time 0.001 (0.019)	Loss 3.1665 (3.0803)	Entropy 0.75372 (0.75751)	Top-1 acc 46.484 (50.187)	Top-5 acc 74.219 (73.474)	lr 0.02122
Train [31][1620/3239]	Time 0.469 (0.914)	Data Time 0.001 (0.019)	Loss 3.2422 (3.0805)	Entropy 0.75346 (0.75748)	Top-1 acc 48.047 (50.185)	Top-5 acc 70.703 (73.468)	lr 0.02122
Train [31][1630/3239]	Time 0.591 (0.913)	Data Time 0.001 (0.018)	Loss 3.0529 (3.0805)	Entropy 0.75285 (0.75746)	Top-1 acc 49.609 (50.190)	Top-5 acc 72.656 (73.464)	lr 0.02122
Train [31][1640/3239]	Time 0.595 (0.913)	Data Time 0.001 (0.018)	Loss 3.1658 (3.0807)	Entropy 0.75292 (0.75743)	Top-1 acc 44.531 (50.181)	Top-5 acc 72.266 (73.458)	lr 0.02122
Train [31][1650/3239]	Time 0.632 (0.913)	Data Time 0.001 (0.018)	Loss 3.1964 (3.0809)	Entropy 0.75284 (0.75740)	Top-1 acc 48.047 (50.178)	Top-5 acc 70.312 (73.455)	lr 0.02122
Train [31][1660/3239]	Time 0.622 (0.912)	Data Time 0.001 (0.018)	Loss 3.0184 (3.0808)	Entropy 0.75284 (0.75737)	Top-1 acc 53.906 (50.181)	Top-5 acc 73.438 (73.463)	lr 0.02122
Train [31][1670/3239]	Time 0.614 (0.912)	Data Time 0.001 (0.018)	Loss 3.0270 (3.0808)	Entropy 0.75285 (0.75735)	Top-1 acc 51.562 (50.179)	Top-5 acc 75.000 (73.457)	lr 0.02122
Train [31][1680/3239]	Time 0.716 (0.927)	Data Time 0.002 (0.018)	Loss 3.1502 (3.0803)	Entropy 0.75306 (0.75732)	Top-1 acc 46.094 (50.186)	Top-5 acc 72.656 (73.466)	lr 0.02122
Train [31][1690/3239]	Time 0.606 (0.926)	Data Time 0.002 (0.018)	Loss 3.1225 (3.0806)	Entropy 0.75282 (0.75729)	Top-1 acc 48.828 (50.179)	Top-5 acc 71.094 (73.459)	lr 0.02122
Train [31][1700/3239]	Time 0.643 (0.926)	Data Time 0.001 (0.018)	Loss 2.9612 (3.0807)	Entropy 0.75262 (0.75727)	Top-1 acc 52.734 (50.178)	Top-5 acc 77.344 (73.460)	lr 0.02122
Train [31][1710/3239]	Time 0.643 (0.926)	Data Time 0.001 (0.018)	Loss 3.1922 (3.0810)	Entropy 0.75252 (0.75724)	Top-1 acc 43.750 (50.174)	Top-5 acc 71.875 (73.453)	lr 0.02122
Train [31][1720/3239]	Time 0.619 (0.926)	Data Time 0.001 (0.018)	Loss 3.0759 (3.0812)	Entropy 0.75267 (0.75721)	Top-1 acc 51.953 (50.176)	Top-5 acc 72.266 (73.444)	lr 0.02122
Train [31][1730/3239]	Time 0.628 (0.925)	Data Time 0.001 (0.018)	Loss 3.0903 (3.0810)	Entropy 0.75268 (0.75719)	Top-1 acc 53.516 (50.176)	Top-5 acc 73.047 (73.447)	lr 0.02121
Train [31][1740/3239]	Time 0.616 (0.925)	Data Time 0.001 (0.017)	Loss 2.9923 (3.0812)	Entropy 0.75269 (0.75716)	Top-1 acc 53.125 (50.166)	Top-5 acc 75.391 (73.443)	lr 0.02121
Train [31][1750/3239]	Time 0.622 (0.924)	Data Time 0.001 (0.017)	Loss 2.9602 (3.0811)	Entropy 0.75250 (0.75714)	Top-1 acc 55.859 (50.168)	Top-5 acc 71.875 (73.443)	lr 0.02121
Train [31][1760/3239]	Time 0.652 (0.924)	Data Time 0.001 (0.017)	Loss 3.0623 (3.0809)	Entropy 0.75273 (0.75711)	Top-1 acc 51.562 (50.169)	Top-5 acc 75.391 (73.448)	lr 0.02121
Train [31][1770/3239]	Time 0.610 (0.924)	Data Time 0.001 (0.017)	Loss 3.0922 (3.0810)	Entropy 0.75275 (0.75709)	Top-1 acc 50.000 (50.169)	Top-5 acc 73.047 (73.447)	lr 0.02121
Train [31][1780/3239]	Time 0.624 (0.923)	Data Time 0.001 (0.017)	Loss 3.2116 (3.0810)	Entropy 0.75290 (0.75706)	Top-1 acc 49.219 (50.164)	Top-5 acc 69.141 (73.446)	lr 0.02121
Train [31][1790/3239]	Time 0.586 (0.923)	Data Time 0.001 (0.017)	Loss 3.1828 (3.0812)	Entropy 0.75276 (0.75704)	Top-1 acc 46.484 (50.161)	Top-5 acc 71.484 (73.440)	lr 0.02121
Train [31][1800/3239]	Time 0.637 (0.923)	Data Time 0.001 (0.017)	Loss 3.2777 (3.0815)	Entropy 0.75284 (0.75701)	Top-1 acc 47.266 (50.151)	Top-5 acc 71.484 (73.437)	lr 0.02121
Train [31][1810/3239]	Time 0.616 (0.922)	Data Time 0.001 (0.017)	Loss 3.0635 (3.0815)	Entropy 0.75224 (0.75699)	Top-1 acc 50.781 (50.152)	Top-5 acc 71.875 (73.436)	lr 0.02121
Train [31][1820/3239]	Time 0.612 (0.922)	Data Time 0.001 (0.017)	Loss 2.8614 (3.0813)	Entropy 0.75229 (0.75696)	Top-1 acc 57.031 (50.156)	Top-5 acc 78.906 (73.439)	lr 0.02121
Train [31][1830/3239]	Time 0.679 (0.922)	Data Time 0.001 (0.017)	Loss 3.0595 (3.0815)	Entropy 0.75257 (0.75694)	Top-1 acc 53.516 (50.156)	Top-5 acc 73.438 (73.438)	lr 0.02121
Train [31][1840/3239]	Time 0.741 (0.921)	Data Time 0.001 (0.017)	Loss 3.1854 (3.0819)	Entropy 0.75266 (0.75691)	Top-1 acc 49.219 (50.148)	Top-5 acc 73.047 (73.429)	lr 0.02121
Train [31][1850/3239]	Time 0.624 (0.921)	Data Time 0.001 (0.017)	Loss 3.0786 (3.0817)	Entropy 0.75267 (0.75689)	Top-1 acc 47.266 (50.149)	Top-5 acc 72.266 (73.434)	lr 0.02121
Train [31][1860/3239]	Time 0.622 (0.921)	Data Time 0.001 (0.016)	Loss 2.8145 (3.0816)	Entropy 0.75283 (0.75687)	Top-1 acc 57.422 (50.154)	Top-5 acc 79.297 (73.439)	lr 0.02121
Train [31][1870/3239]	Time 0.636 (0.921)	Data Time 0.001 (0.016)	Loss 2.8666 (3.0818)	Entropy 0.75295 (0.75685)	Top-1 acc 55.469 (50.152)	Top-5 acc 76.953 (73.436)	lr 0.02120
Train [31][1880/3239]	Time 0.592 (0.920)	Data Time 0.001 (0.016)	Loss 2.9381 (3.0817)	Entropy 0.75281 (0.75683)	Top-1 acc 53.516 (50.151)	Top-5 acc 76.562 (73.435)	lr 0.02120
Train [31][1890/3239]	Time 0.621 (0.920)	Data Time 0.001 (0.016)	Loss 3.2450 (3.0822)	Entropy 0.75263 (0.75681)	Top-1 acc 46.094 (50.140)	Top-5 acc 71.094 (73.427)	lr 0.02120
Train [31][1900/3239]	Time 0.667 (0.920)	Data Time 0.001 (0.016)	Loss 3.0429 (3.0821)	Entropy 0.75245 (0.75678)	Top-1 acc 46.484 (50.134)	Top-5 acc 76.562 (73.432)	lr 0.02120
Train [31][1910/3239]	Time 0.727 (0.919)	Data Time 0.001 (0.016)	Loss 3.2253 (3.0824)	Entropy 0.75223 (0.75676)	Top-1 acc 49.219 (50.128)	Top-5 acc 68.359 (73.421)	lr 0.02120
Train [31][1920/3239]	Time 0.618 (0.919)	Data Time 0.001 (0.016)	Loss 3.1980 (3.0826)	Entropy 0.75212 (0.75674)	Top-1 acc 48.828 (50.125)	Top-5 acc 67.578 (73.418)	lr 0.02120
Train [31][1930/3239]	Time 0.581 (0.919)	Data Time 0.001 (0.016)	Loss 3.2124 (3.0825)	Entropy 0.75243 (0.75671)	Top-1 acc 46.484 (50.127)	Top-5 acc 69.922 (73.420)	lr 0.02120
Train [31][1940/3239]	Time 0.574 (0.918)	Data Time 0.001 (0.016)	Loss 3.0880 (3.0823)	Entropy 0.75245 (0.75669)	Top-1 acc 49.219 (50.129)	Top-5 acc 70.703 (73.424)	lr 0.02120
Train [31][1950/3239]	Time 0.625 (0.918)	Data Time 0.001 (0.016)	Loss 3.0520 (3.0822)	Entropy 0.75265 (0.75667)	Top-1 acc 46.484 (50.135)	Top-5 acc 73.438 (73.425)	lr 0.02120
Train [31][1960/3239]	Time 0.627 (0.918)	Data Time 0.002 (0.016)	Loss 2.9761 (3.0824)	Entropy 0.75250 (0.75665)	Top-1 acc 50.391 (50.132)	Top-5 acc 75.781 (73.426)	lr 0.02120
Train [31][1970/3239]	Time 0.605 (0.917)	Data Time 0.001 (0.016)	Loss 3.1826 (3.0826)	Entropy 0.75252 (0.75663)	Top-1 acc 49.219 (50.132)	Top-5 acc 72.266 (73.422)	lr 0.02120
Train [31][1980/3239]	Time 0.618 (0.917)	Data Time 0.001 (0.016)	Loss 2.9478 (3.0825)	Entropy 0.75245 (0.75661)	Top-1 acc 53.516 (50.136)	Top-5 acc 73.828 (73.420)	lr 0.02120
Train [31][1990/3239]	Time 0.625 (0.917)	Data Time 0.001 (0.016)	Loss 3.1065 (3.0826)	Entropy 0.75254 (0.75659)	Top-1 acc 50.781 (50.137)	Top-5 acc 74.219 (73.423)	lr 0.02120
Train [31][2000/3239]	Time 0.687 (0.917)	Data Time 0.001 (0.015)	Loss 3.1090 (3.0823)	Entropy 0.75253 (0.75657)	Top-1 acc 46.875 (50.142)	Top-5 acc 73.828 (73.429)	lr 0.02119
Train [31][2010/3239]	Time 0.555 (0.916)	Data Time 0.001 (0.015)	Loss 3.2296 (3.0823)	Entropy 0.75251 (0.75655)	Top-1 acc 48.047 (50.143)	Top-5 acc 72.266 (73.431)	lr 0.02119
Train [31][2020/3239]	Time 0.577 (0.916)	Data Time 0.001 (0.015)	Loss 3.1278 (3.0824)	Entropy 0.75275 (0.75653)	Top-1 acc 47.266 (50.138)	Top-5 acc 74.609 (73.429)	lr 0.02119
Train [31][2030/3239]	Time 0.599 (0.916)	Data Time 0.001 (0.015)	Loss 3.1435 (3.0823)	Entropy 0.75262 (0.75651)	Top-1 acc 48.047 (50.142)	Top-5 acc 72.266 (73.430)	lr 0.02119
Train [31][2040/3239]	Time 0.596 (0.916)	Data Time 0.001 (0.015)	Loss 3.1781 (3.0824)	Entropy 0.75222 (0.75649)	Top-1 acc 49.219 (50.140)	Top-5 acc 71.875 (73.430)	lr 0.02119
Train [31][2050/3239]	Time 0.636 (0.915)	Data Time 0.001 (0.015)	Loss 3.1055 (3.0826)	Entropy 0.75206 (0.75647)	Top-1 acc 51.172 (50.137)	Top-5 acc 75.000 (73.429)	lr 0.02119
Train [31][2060/3239]	Time 0.470 (0.915)	Data Time 0.001 (0.015)	Loss 3.0804 (3.0825)	Entropy 0.75174 (0.75645)	Top-1 acc 50.391 (50.138)	Top-5 acc 70.703 (73.429)	lr 0.02119
Train [31][2070/3239]	Time 0.682 (0.915)	Data Time 0.001 (0.015)	Loss 3.2790 (3.0827)	Entropy 0.75174 (0.75642)	Top-1 acc 46.094 (50.137)	Top-5 acc 67.969 (73.424)	lr 0.02119
Train [31][2080/3239]	Time 0.605 (0.914)	Data Time 0.001 (0.015)	Loss 3.0868 (3.0827)	Entropy 0.75171 (0.75640)	Top-1 acc 50.781 (50.138)	Top-5 acc 72.656 (73.421)	lr 0.02119
Train [31][2090/3239]	Time 0.596 (0.914)	Data Time 0.001 (0.015)	Loss 3.0376 (3.0829)	Entropy 0.75182 (0.75638)	Top-1 acc 52.344 (50.134)	Top-5 acc 75.391 (73.416)	lr 0.02119
Train [31][2100/3239]	Time 0.598 (0.914)	Data Time 0.001 (0.015)	Loss 2.9900 (3.0830)	Entropy 0.75199 (0.75636)	Top-1 acc 56.641 (50.135)	Top-5 acc 74.219 (73.412)	lr 0.02119
Train [31][2110/3239]	Time 0.609 (0.914)	Data Time 0.001 (0.015)	Loss 3.1426 (3.0827)	Entropy 0.75189 (0.75634)	Top-1 acc 48.047 (50.140)	Top-5 acc 71.875 (73.417)	lr 0.02119
Train [31][2120/3239]	Time 0.626 (0.913)	Data Time 0.001 (0.015)	Loss 2.9704 (3.0823)	Entropy 0.75232 (0.75632)	Top-1 acc 54.297 (50.149)	Top-5 acc 74.219 (73.426)	lr 0.02119
Train [31][2130/3239]	Time 0.614 (0.913)	Data Time 0.001 (0.015)	Loss 3.3277 (3.0826)	Entropy 0.75244 (0.75630)	Top-1 acc 45.312 (50.148)	Top-5 acc 67.969 (73.424)	lr 0.02119
Train [31][2140/3239]	Time 0.625 (0.913)	Data Time 0.001 (0.015)	Loss 2.7082 (3.0826)	Entropy 0.75256 (0.75628)	Top-1 acc 62.109 (50.149)	Top-5 acc 78.906 (73.421)	lr 0.02118
Train [31][2150/3239]	Time 0.583 (0.913)	Data Time 0.001 (0.014)	Loss 3.1467 (3.0824)	Entropy 0.75270 (0.75626)	Top-1 acc 47.656 (50.149)	Top-5 acc 73.438 (73.423)	lr 0.02118
Train [31][2160/3239]	Time 0.715 (0.913)	Data Time 0.001 (0.014)	Loss 2.9895 (3.0824)	Entropy 0.75235 (0.75625)	Top-1 acc 53.125 (50.155)	Top-5 acc 73.828 (73.421)	lr 0.02118
Train [31][2170/3239]	Time 0.598 (0.912)	Data Time 0.001 (0.014)	Loss 2.8793 (3.0824)	Entropy 0.75267 (0.75623)	Top-1 acc 55.859 (50.152)	Top-5 acc 78.516 (73.421)	lr 0.02118
Train [31][2180/3239]	Time 0.616 (0.912)	Data Time 0.001 (0.014)	Loss 3.2864 (3.0828)	Entropy 0.75236 (0.75621)	Top-1 acc 42.969 (50.145)	Top-5 acc 68.750 (73.411)	lr 0.02118
Train [31][2190/3239]	Time 0.624 (0.912)	Data Time 0.001 (0.014)	Loss 2.9567 (3.0827)	Entropy 0.75269 (0.75619)	Top-1 acc 54.297 (50.144)	Top-5 acc 76.562 (73.411)	lr 0.02118
Train [31][2200/3239]	Time 0.661 (0.912)	Data Time 0.001 (0.014)	Loss 3.0545 (3.0826)	Entropy 0.75296 (0.75618)	Top-1 acc 53.906 (50.151)	Top-5 acc 73.828 (73.413)	lr 0.02118
Train [31][2210/3239]	Time 0.582 (0.911)	Data Time 0.001 (0.014)	Loss 3.0679 (3.0825)	Entropy 0.75253 (0.75616)	Top-1 acc 51.172 (50.153)	Top-5 acc 71.094 (73.413)	lr 0.02118
Train [31][2220/3239]	Time 0.607 (0.911)	Data Time 0.001 (0.014)	Loss 2.9800 (3.0820)	Entropy 0.75274 (0.75615)	Top-1 acc 51.172 (50.162)	Top-5 acc 73.047 (73.421)	lr 0.02118
Train [31][2230/3239]	Time 0.627 (0.911)	Data Time 0.001 (0.014)	Loss 3.0922 (3.0822)	Entropy 0.75214 (0.75613)	Top-1 acc 48.438 (50.156)	Top-5 acc 70.312 (73.415)	lr 0.02118
Train [31][2240/3239]	Time 0.607 (0.910)	Data Time 0.001 (0.014)	Loss 3.0141 (3.0820)	Entropy 0.75204 (0.75611)	Top-1 acc 53.516 (50.165)	Top-5 acc 75.781 (73.421)	lr 0.02118
Train [31][2250/3239]	Time 0.591 (0.910)	Data Time 0.001 (0.014)	Loss 2.9287 (3.0822)	Entropy 0.75215 (0.75610)	Top-1 acc 55.469 (50.164)	Top-5 acc 75.000 (73.415)	lr 0.02118
Train [31][2260/3239]	Time 0.580 (0.910)	Data Time 0.001 (0.014)	Loss 3.2533 (3.0825)	Entropy 0.75244 (0.75608)	Top-1 acc 46.484 (50.155)	Top-5 acc 70.312 (73.413)	lr 0.02118
Train [31][2270/3239]	Time 0.628 (0.910)	Data Time 0.001 (0.014)	Loss 2.8470 (3.0824)	Entropy 0.75246 (0.75606)	Top-1 acc 52.344 (50.159)	Top-5 acc 79.688 (73.416)	lr 0.02118
Train [31][2280/3239]	Time 0.607 (0.909)	Data Time 0.001 (0.014)	Loss 3.2022 (3.0826)	Entropy 0.75250 (0.75605)	Top-1 acc 48.438 (50.153)	Top-5 acc 69.531 (73.411)	lr 0.02117
Train [31][2290/3239]	Time 0.623 (0.909)	Data Time 0.001 (0.014)	Loss 3.0562 (3.0823)	Entropy 0.75236 (0.75603)	Top-1 acc 53.906 (50.164)	Top-5 acc 74.219 (73.418)	lr 0.02117
Train [31][2300/3239]	Time 0.618 (0.909)	Data Time 0.001 (0.014)	Loss 3.0872 (3.0824)	Entropy 0.75214 (0.75601)	Top-1 acc 54.297 (50.162)	Top-5 acc 73.047 (73.413)	lr 0.02117
Train [31][2310/3239]	Time 0.612 (0.909)	Data Time 0.001 (0.014)	Loss 3.2309 (3.0823)	Entropy 0.75216 (0.75600)	Top-1 acc 44.922 (50.158)	Top-5 acc 71.875 (73.414)	lr 0.02117
Train [31][2320/3239]	Time 0.664 (0.909)	Data Time 0.001 (0.014)	Loss 3.1109 (3.0825)	Entropy 0.75222 (0.75598)	Top-1 acc 51.172 (50.158)	Top-5 acc 73.828 (73.410)	lr 0.02117
Train [31][2330/3239]	Time 0.747 (0.920)	Data Time 0.004 (0.014)	Loss 2.8937 (3.0819)	Entropy 0.75157 (0.75596)	Top-1 acc 58.984 (50.169)	Top-5 acc 75.391 (73.418)	lr 0.02117
Train [31][2340/3239]	Time 0.626 (0.920)	Data Time 0.002 (0.013)	Loss 2.8817 (3.0821)	Entropy 0.75158 (0.75594)	Top-1 acc 53.125 (50.161)	Top-5 acc 78.125 (73.417)	lr 0.02117
Train [31][2350/3239]	Time 0.515 (0.919)	Data Time 0.001 (0.013)	Loss 3.0071 (3.0820)	Entropy 0.75134 (0.75593)	Top-1 acc 55.469 (50.163)	Top-5 acc 71.484 (73.420)	lr 0.02117
Train [31][2360/3239]	Time 0.648 (0.919)	Data Time 0.001 (0.013)	Loss 3.0893 (3.0822)	Entropy 0.75125 (0.75591)	Top-1 acc 46.875 (50.156)	Top-5 acc 76.172 (73.419)	lr 0.02117
Train [31][2370/3239]	Time 0.618 (0.919)	Data Time 0.001 (0.013)	Loss 2.9511 (3.0822)	Entropy 0.75121 (0.75589)	Top-1 acc 51.953 (50.152)	Top-5 acc 75.781 (73.418)	lr 0.02117
Train [31][2380/3239]	Time 0.601 (0.918)	Data Time 0.001 (0.013)	Loss 2.7986 (3.0822)	Entropy 0.75162 (0.75587)	Top-1 acc 53.516 (50.152)	Top-5 acc 79.688 (73.421)	lr 0.02117
Train [31][2390/3239]	Time 0.715 (0.918)	Data Time 0.001 (0.013)	Loss 3.1073 (3.0819)	Entropy 0.75186 (0.75585)	Top-1 acc 50.781 (50.158)	Top-5 acc 71.484 (73.425)	lr 0.02117
Train [31][2400/3239]	Time 0.621 (0.918)	Data Time 0.003 (0.013)	Loss 3.2166 (3.0821)	Entropy 0.75185 (0.75583)	Top-1 acc 45.312 (50.153)	Top-5 acc 72.656 (73.422)	lr 0.02117
Train [31][2410/3239]	Time 0.582 (0.918)	Data Time 0.001 (0.013)	Loss 3.0151 (3.0819)	Entropy 0.75153 (0.75582)	Top-1 acc 50.781 (50.160)	Top-5 acc 76.562 (73.425)	lr 0.02117
Train [31][2420/3239]	Time 0.625 (0.918)	Data Time 0.001 (0.013)	Loss 2.8900 (3.0816)	Entropy 0.75152 (0.75580)	Top-1 acc 55.859 (50.167)	Top-5 acc 76.172 (73.430)	lr 0.02116
Train [31][2430/3239]	Time 0.573 (0.917)	Data Time 0.001 (0.013)	Loss 3.0295 (3.0814)	Entropy 0.75158 (0.75578)	Top-1 acc 50.391 (50.169)	Top-5 acc 76.562 (73.437)	lr 0.02116
Train [31][2440/3239]	Time 0.597 (0.917)	Data Time 0.001 (0.013)	Loss 3.1369 (3.0813)	Entropy 0.75184 (0.75576)	Top-1 acc 51.172 (50.168)	Top-5 acc 72.656 (73.438)	lr 0.02116
Train [31][2450/3239]	Time 0.612 (0.917)	Data Time 0.001 (0.013)	Loss 3.0864 (3.0813)	Entropy 0.75165 (0.75575)	Top-1 acc 49.609 (50.170)	Top-5 acc 73.047 (73.437)	lr 0.02116
Train [31][2460/3239]	Time 0.636 (0.917)	Data Time 0.001 (0.013)	Loss 3.0720 (3.0812)	Entropy 0.75170 (0.75573)	Top-1 acc 51.172 (50.172)	Top-5 acc 75.000 (73.438)	lr 0.02116
Train [31][2470/3239]	Time 0.635 (0.917)	Data Time 0.001 (0.013)	Loss 3.0164 (3.0812)	Entropy 0.75160 (0.75571)	Top-1 acc 49.609 (50.167)	Top-5 acc 75.000 (73.436)	lr 0.02116
Train [31][2480/3239]	Time 0.595 (0.916)	Data Time 0.001 (0.013)	Loss 3.0242 (3.0812)	Entropy 0.75123 (0.75570)	Top-1 acc 51.172 (50.171)	Top-5 acc 76.562 (73.439)	lr 0.02116
Train [31][2490/3239]	Time 0.623 (0.916)	Data Time 0.001 (0.013)	Loss 2.8758 (3.0811)	Entropy 0.75140 (0.75568)	Top-1 acc 54.297 (50.172)	Top-5 acc 76.953 (73.440)	lr 0.02116
Train [31][2500/3239]	Time 0.565 (0.916)	Data Time 0.002 (0.013)	Loss 3.2311 (3.0812)	Entropy 0.75133 (0.75566)	Top-1 acc 48.828 (50.171)	Top-5 acc 71.094 (73.439)	lr 0.02116
Train [31][2510/3239]	Time 0.616 (0.916)	Data Time 0.001 (0.013)	Loss 3.1543 (3.0811)	Entropy 0.75150 (0.75565)	Top-1 acc 49.219 (50.177)	Top-5 acc 71.875 (73.443)	lr 0.02116
Train [31][2520/3239]	Time 0.646 (0.915)	Data Time 0.001 (0.013)	Loss 2.7857 (3.0807)	Entropy 0.75143 (0.75563)	Top-1 acc 59.375 (50.191)	Top-5 acc 76.172 (73.447)	lr 0.02116
Train [31][2530/3239]	Time 0.613 (0.915)	Data Time 0.001 (0.013)	Loss 2.9290 (3.0805)	Entropy 0.75144 (0.75561)	Top-1 acc 51.953 (50.199)	Top-5 acc 75.000 (73.450)	lr 0.02116
Train [31][2540/3239]	Time 0.598 (0.915)	Data Time 0.001 (0.013)	Loss 3.3056 (3.0805)	Entropy 0.75113 (0.75560)	Top-1 acc 44.531 (50.199)	Top-5 acc 68.750 (73.452)	lr 0.02116
Train [31][2550/3239]	Time 0.712 (0.915)	Data Time 0.001 (0.013)	Loss 2.6699 (3.0804)	Entropy 0.75145 (0.75558)	Top-1 acc 59.766 (50.201)	Top-5 acc 82.812 (73.454)	lr 0.02115
Train [31][2560/3239]	Time 0.594 (0.915)	Data Time 0.001 (0.012)	Loss 3.1141 (3.0806)	Entropy 0.75136 (0.75556)	Top-1 acc 49.219 (50.197)	Top-5 acc 73.438 (73.450)	lr 0.02115
Train [31][2570/3239]	Time 0.599 (0.914)	Data Time 0.001 (0.012)	Loss 3.2072 (3.0806)	Entropy 0.75140 (0.75555)	Top-1 acc 49.609 (50.202)	Top-5 acc 71.094 (73.448)	lr 0.02115
Train [31][2580/3239]	Time 0.617 (0.914)	Data Time 0.001 (0.012)	Loss 3.1604 (3.0806)	Entropy 0.75124 (0.75553)	Top-1 acc 47.656 (50.198)	Top-5 acc 71.094 (73.452)	lr 0.02115
Train [31][2590/3239]	Time 0.611 (0.914)	Data Time 0.001 (0.012)	Loss 3.0857 (3.0805)	Entropy 0.75097 (0.75551)	Top-1 acc 53.516 (50.202)	Top-5 acc 70.703 (73.452)	lr 0.02115
Train [31][2600/3239]	Time 0.606 (0.914)	Data Time 0.001 (0.012)	Loss 2.9533 (3.0804)	Entropy 0.75076 (0.75549)	Top-1 acc 55.469 (50.207)	Top-5 acc 73.047 (73.454)	lr 0.02115
Train [31][2610/3239]	Time 0.642 (0.914)	Data Time 0.001 (0.012)	Loss 3.1161 (3.0805)	Entropy 0.75109 (0.75548)	Top-1 acc 50.781 (50.206)	Top-5 acc 73.828 (73.448)	lr 0.02115
Train [31][2620/3239]	Time 0.712 (0.914)	Data Time 0.001 (0.012)	Loss 3.0114 (3.0804)	Entropy 0.75076 (0.75546)	Top-1 acc 51.172 (50.206)	Top-5 acc 74.609 (73.450)	lr 0.02115
Train [31][2630/3239]	Time 0.633 (0.914)	Data Time 0.001 (0.012)	Loss 3.1916 (3.0805)	Entropy 0.75050 (0.75544)	Top-1 acc 45.703 (50.204)	Top-5 acc 73.047 (73.451)	lr 0.02115
Train [31][2640/3239]	Time 0.634 (0.913)	Data Time 0.001 (0.012)	Loss 3.0655 (3.0801)	Entropy 0.75005 (0.75542)	Top-1 acc 49.609 (50.210)	Top-5 acc 73.047 (73.458)	lr 0.02115
Train [31][2650/3239]	Time 0.575 (0.913)	Data Time 0.001 (0.012)	Loss 3.0855 (3.0802)	Entropy 0.74995 (0.75540)	Top-1 acc 45.312 (50.209)	Top-5 acc 73.047 (73.455)	lr 0.02115
Train [31][2660/3239]	Time 0.581 (0.913)	Data Time 0.001 (0.012)	Loss 3.0208 (3.0800)	Entropy 0.75004 (0.75538)	Top-1 acc 51.562 (50.213)	Top-5 acc 74.219 (73.458)	lr 0.02115
Train [31][2670/3239]	Time 0.627 (0.913)	Data Time 0.001 (0.012)	Loss 3.0962 (3.0801)	Entropy 0.75009 (0.75536)	Top-1 acc 50.391 (50.208)	Top-5 acc 73.438 (73.455)	lr 0.02115
Train [31][2680/3239]	Time 0.591 (0.912)	Data Time 0.001 (0.012)	Loss 3.0892 (3.0799)	Entropy 0.74998 (0.75534)	Top-1 acc 51.562 (50.211)	Top-5 acc 72.656 (73.459)	lr 0.02115
Train [31][2690/3239]	Time 0.593 (0.912)	Data Time 0.001 (0.012)	Loss 3.1153 (3.0800)	Entropy 0.75013 (0.75532)	Top-1 acc 52.344 (50.210)	Top-5 acc 74.219 (73.460)	lr 0.02114
Train [31][2700/3239]	Time 0.658 (0.912)	Data Time 0.001 (0.012)	Loss 2.9399 (3.0798)	Entropy 0.75004 (0.75530)	Top-1 acc 50.000 (50.214)	Top-5 acc 76.172 (73.463)	lr 0.02114
Train [31][2710/3239]	Time 0.714 (0.912)	Data Time 0.001 (0.012)	Loss 2.9774 (3.0798)	Entropy 0.75008 (0.75528)	Top-1 acc 52.344 (50.212)	Top-5 acc 77.734 (73.463)	lr 0.02114
Train [31][2720/3239]	Time 0.600 (0.912)	Data Time 0.001 (0.012)	Loss 3.0797 (3.0797)	Entropy 0.74985 (0.75526)	Top-1 acc 51.172 (50.211)	Top-5 acc 73.438 (73.461)	lr 0.02114
Train [31][2730/3239]	Time 0.583 (0.912)	Data Time 0.001 (0.012)	Loss 3.2573 (3.0801)	Entropy 0.75031 (0.75524)	Top-1 acc 43.359 (50.202)	Top-5 acc 70.312 (73.448)	lr 0.02114
Train [31][2740/3239]	Time 0.609 (0.911)	Data Time 0.001 (0.012)	Loss 3.0598 (3.0806)	Entropy 0.75092 (0.75523)	Top-1 acc 53.906 (50.194)	Top-5 acc 73.438 (73.440)	lr 0.02114
Train [31][2750/3239]	Time 0.588 (0.911)	Data Time 0.001 (0.012)	Loss 3.0784 (3.0806)	Entropy 0.75059 (0.75521)	Top-1 acc 50.000 (50.195)	Top-5 acc 73.828 (73.437)	lr 0.02114
Train [31][2760/3239]	Time 0.597 (0.911)	Data Time 0.001 (0.012)	Loss 2.9712 (3.0805)	Entropy 0.75078 (0.75519)	Top-1 acc 52.344 (50.200)	Top-5 acc 76.562 (73.441)	lr 0.02114
Train [31][2770/3239]	Time 0.617 (0.911)	Data Time 0.001 (0.012)	Loss 2.9436 (3.0807)	Entropy 0.75091 (0.75518)	Top-1 acc 55.469 (50.196)	Top-5 acc 76.562 (73.436)	lr 0.02114
Train [31][2780/3239]	Time 0.708 (0.911)	Data Time 0.001 (0.012)	Loss 2.9231 (3.0808)	Entropy 0.75096 (0.75516)	Top-1 acc 52.344 (50.196)	Top-5 acc 77.344 (73.436)	lr 0.02114
Train [31][2790/3239]	Time 0.602 (0.911)	Data Time 0.001 (0.012)	Loss 3.1992 (3.0806)	Entropy 0.75099 (0.75515)	Top-1 acc 49.609 (50.198)	Top-5 acc 70.312 (73.437)	lr 0.02114
Train [31][2800/3239]	Time 0.606 (0.910)	Data Time 0.001 (0.012)	Loss 2.8468 (3.0804)	Entropy 0.75092 (0.75513)	Top-1 acc 57.031 (50.202)	Top-5 acc 76.562 (73.440)	lr 0.02114
Train [31][2810/3239]	Time 0.588 (0.910)	Data Time 0.001 (0.012)	Loss 3.3694 (3.0804)	Entropy 0.75101 (0.75512)	Top-1 acc 41.406 (50.199)	Top-5 acc 69.141 (73.441)	lr 0.02114
Train [31][2820/3239]	Time 0.604 (0.910)	Data Time 0.001 (0.011)	Loss 3.2107 (3.0804)	Entropy 0.75079 (0.75510)	Top-1 acc 47.266 (50.199)	Top-5 acc 70.312 (73.445)	lr 0.02114
Train [31][2830/3239]	Time 0.481 (0.910)	Data Time 0.001 (0.011)	Loss 3.1942 (3.0805)	Entropy 0.75037 (0.75509)	Top-1 acc 48.828 (50.198)	Top-5 acc 71.094 (73.440)	lr 0.02113
Train [31][2840/3239]	Time 0.579 (0.909)	Data Time 0.001 (0.011)	Loss 3.0430 (3.0804)	Entropy 0.75023 (0.75507)	Top-1 acc 52.344 (50.204)	Top-5 acc 75.781 (73.441)	lr 0.02113
Train [31][2850/3239]	Time 0.613 (0.909)	Data Time 0.001 (0.011)	Loss 3.0539 (3.0802)	Entropy 0.75008 (0.75505)	Top-1 acc 51.953 (50.205)	Top-5 acc 74.219 (73.442)	lr 0.02113
Train [31][2860/3239]	Time 0.626 (0.909)	Data Time 0.001 (0.011)	Loss 3.1623 (3.0801)	Entropy 0.74986 (0.75504)	Top-1 acc 49.609 (50.209)	Top-5 acc 72.266 (73.448)	lr 0.02113
Train [31][2870/3239]	Time 0.628 (0.909)	Data Time 0.001 (0.011)	Loss 2.8671 (3.0800)	Entropy 0.74973 (0.75502)	Top-1 acc 51.172 (50.207)	Top-5 acc 77.734 (73.449)	lr 0.02113
Train [31][2880/3239]	Time 0.588 (0.909)	Data Time 0.002 (0.011)	Loss 3.3295 (3.0800)	Entropy 0.74994 (0.75500)	Top-1 acc 46.094 (50.206)	Top-5 acc 67.578 (73.450)	lr 0.02113
Train [31][2890/3239]	Time 0.620 (0.909)	Data Time 0.001 (0.011)	Loss 2.8334 (3.0800)	Entropy 0.75012 (0.75498)	Top-1 acc 55.078 (50.203)	Top-5 acc 78.125 (73.449)	lr 0.02113
Train [31][2900/3239]	Time 0.617 (0.908)	Data Time 0.001 (0.011)	Loss 2.9250 (3.0800)	Entropy 0.74967 (0.75496)	Top-1 acc 53.125 (50.202)	Top-5 acc 75.391 (73.449)	lr 0.02113
Train [31][2910/3239]	Time 0.603 (0.908)	Data Time 0.001 (0.011)	Loss 3.3043 (3.0803)	Entropy 0.74984 (0.75495)	Top-1 acc 47.656 (50.198)	Top-5 acc 69.531 (73.442)	lr 0.02113
Train [31][2920/3239]	Time 0.584 (0.908)	Data Time 0.001 (0.011)	Loss 3.0626 (3.0803)	Entropy 0.74971 (0.75493)	Top-1 acc 50.781 (50.197)	Top-5 acc 72.266 (73.445)	lr 0.02113
Train [31][2930/3239]	Time 0.596 (0.908)	Data Time 0.001 (0.011)	Loss 2.9586 (3.0804)	Entropy 0.74969 (0.75491)	Top-1 acc 48.828 (50.192)	Top-5 acc 77.344 (73.444)	lr 0.02113
Train [31][2940/3239]	Time 0.673 (0.908)	Data Time 0.001 (0.011)	Loss 2.9722 (3.0805)	Entropy 0.74993 (0.75489)	Top-1 acc 53.906 (50.187)	Top-5 acc 75.391 (73.441)	lr 0.02113
Train [31][2950/3239]	Time 0.582 (0.908)	Data Time 0.001 (0.011)	Loss 3.1258 (3.0806)	Entropy 0.74971 (0.75488)	Top-1 acc 46.484 (50.182)	Top-5 acc 73.047 (73.439)	lr 0.02113
Train [31][2960/3239]	Time 0.597 (0.908)	Data Time 0.001 (0.011)	Loss 3.1796 (3.0806)	Entropy 0.74975 (0.75486)	Top-1 acc 49.219 (50.182)	Top-5 acc 70.703 (73.437)	lr 0.02112
Train [31][2970/3239]	Time 0.611 (0.907)	Data Time 0.001 (0.011)	Loss 3.0338 (3.0805)	Entropy 0.74976 (0.75484)	Top-1 acc 55.078 (50.186)	Top-5 acc 71.875 (73.439)	lr 0.02112
Train [31][2980/3239]	Time 0.579 (0.907)	Data Time 0.001 (0.011)	Loss 3.1103 (3.0806)	Entropy 0.74970 (0.75482)	Top-1 acc 51.562 (50.187)	Top-5 acc 70.703 (73.438)	lr 0.02112
Train [31][2990/3239]	Time 0.603 (0.916)	Data Time 0.002 (0.011)	Loss 3.0135 (3.0804)	Entropy 0.74969 (0.75481)	Top-1 acc 53.125 (50.194)	Top-5 acc 73.047 (73.439)	lr 0.02112
Train [31][3000/3239]	Time 0.615 (0.916)	Data Time 0.001 (0.011)	Loss 2.9144 (3.0801)	Entropy 0.74983 (0.75479)	Top-1 acc 51.172 (50.199)	Top-5 acc 73.828 (73.444)	lr 0.02112
Train [31][3010/3239]	Time 0.603 (0.916)	Data Time 0.001 (0.011)	Loss 3.0073 (3.0802)	Entropy 0.74985 (0.75477)	Top-1 acc 51.953 (50.197)	Top-5 acc 75.391 (73.442)	lr 0.02112
Train [31][3020/3239]	Time 0.611 (0.915)	Data Time 0.001 (0.011)	Loss 3.1772 (3.0801)	Entropy 0.74967 (0.75476)	Top-1 acc 47.266 (50.200)	Top-5 acc 72.656 (73.444)	lr 0.02112
Train [31][3030/3239]	Time 0.704 (0.915)	Data Time 0.001 (0.011)	Loss 3.1734 (3.0801)	Entropy 0.74955 (0.75474)	Top-1 acc 52.734 (50.201)	Top-5 acc 71.875 (73.445)	lr 0.02112
Train [31][3040/3239]	Time 0.594 (0.915)	Data Time 0.001 (0.011)	Loss 2.9729 (3.0801)	Entropy 0.75007 (0.75472)	Top-1 acc 51.172 (50.199)	Top-5 acc 76.172 (73.445)	lr 0.02112
Train [31][3050/3239]	Time 0.619 (0.915)	Data Time 0.001 (0.011)	Loss 3.1943 (3.0800)	Entropy 0.75003 (0.75471)	Top-1 acc 51.562 (50.202)	Top-5 acc 72.656 (73.450)	lr 0.02112
Train [31][3060/3239]	Time 0.625 (0.915)	Data Time 0.001 (0.011)	Loss 2.9823 (3.0800)	Entropy 0.74974 (0.75469)	Top-1 acc 49.609 (50.203)	Top-5 acc 75.781 (73.451)	lr 0.02112
Train [31][3070/3239]	Time 0.634 (0.915)	Data Time 0.001 (0.011)	Loss 3.2213 (3.0801)	Entropy 0.74949 (0.75468)	Top-1 acc 45.703 (50.204)	Top-5 acc 72.266 (73.452)	lr 0.02112
Train [31][3080/3239]	Time 0.598 (0.914)	Data Time 0.001 (0.011)	Loss 3.0547 (3.0802)	Entropy 0.74966 (0.75466)	Top-1 acc 52.344 (50.203)	Top-5 acc 73.438 (73.452)	lr 0.02112
Train [31][3090/3239]	Time 0.596 (0.914)	Data Time 0.001 (0.011)	Loss 3.0402 (3.0802)	Entropy 0.74994 (0.75464)	Top-1 acc 49.219 (50.202)	Top-5 acc 73.828 (73.450)	lr 0.02112
Train [31][3100/3239]	Time 0.716 (0.914)	Data Time 0.001 (0.011)	Loss 2.9280 (3.0801)	Entropy 0.75027 (0.75463)	Top-1 acc 55.859 (50.204)	Top-5 acc 76.953 (73.452)	lr 0.02111
Train [31][3110/3239]	Time 0.582 (0.914)	Data Time 0.001 (0.011)	Loss 3.1634 (3.0801)	Entropy 0.75024 (0.75461)	Top-1 acc 47.266 (50.204)	Top-5 acc 69.922 (73.450)	lr 0.02111
Train [31][3120/3239]	Time 0.619 (0.914)	Data Time 0.001 (0.011)	Loss 3.1271 (3.0801)	Entropy 0.75047 (0.75460)	Top-1 acc 50.391 (50.205)	Top-5 acc 72.266 (73.450)	lr 0.02111
Train [31][3130/3239]	Time 0.582 (0.914)	Data Time 0.001 (0.011)	Loss 2.9986 (3.0801)	Entropy 0.75001 (0.75459)	Top-1 acc 51.562 (50.200)	Top-5 acc 74.219 (73.452)	lr 0.02111
Train [31][3140/3239]	Time 0.637 (0.913)	Data Time 0.001 (0.011)	Loss 2.9510 (3.0800)	Entropy 0.75033 (0.75457)	Top-1 acc 53.125 (50.204)	Top-5 acc 77.734 (73.455)	lr 0.02111
Train [31][3150/3239]	Time 0.605 (0.913)	Data Time 0.001 (0.011)	Loss 3.3680 (3.0801)	Entropy 0.75027 (0.75456)	Top-1 acc 42.969 (50.202)	Top-5 acc 72.266 (73.453)	lr 0.02111
Train [31][3160/3239]	Time 0.638 (0.913)	Data Time 0.001 (0.010)	Loss 3.3341 (3.0800)	Entropy 0.75037 (0.75455)	Top-1 acc 40.625 (50.201)	Top-5 acc 69.531 (73.457)	lr 0.02111
Train [31][3170/3239]	Time 0.607 (0.913)	Data Time 0.001 (0.010)	Loss 2.9970 (3.0800)	Entropy 0.74999 (0.75453)	Top-1 acc 51.172 (50.200)	Top-5 acc 76.172 (73.459)	lr 0.02111
Train [31][3180/3239]	Time 0.620 (0.913)	Data Time 0.000 (0.010)	Loss 3.1135 (3.0800)	Entropy 0.74989 (0.75452)	Top-1 acc 50.000 (50.197)	Top-5 acc 72.656 (73.456)	lr 0.02111
Train [31][3190/3239]	Time 0.588 (0.913)	Data Time 0.000 (0.010)	Loss 3.1348 (3.0801)	Entropy 0.74984 (0.75450)	Top-1 acc 47.656 (50.192)	Top-5 acc 73.438 (73.455)	lr 0.02111
Train [31][3200/3239]	Time 0.569 (0.913)	Data Time 0.000 (0.010)	Loss 3.2735 (3.0802)	Entropy 0.74969 (0.75449)	Top-1 acc 44.141 (50.185)	Top-5 acc 69.141 (73.452)	lr 0.02111
Train [31][3210/3239]	Time 0.584 (0.912)	Data Time 0.000 (0.010)	Loss 3.1553 (3.0803)	Entropy 0.74998 (0.75447)	Top-1 acc 53.516 (50.184)	Top-5 acc 73.438 (73.451)	lr 0.02111
Train [31][3220/3239]	Time 0.624 (0.912)	Data Time 0.000 (0.010)	Loss 2.9834 (3.0803)	Entropy 0.74997 (0.75446)	Top-1 acc 55.078 (50.186)	Top-5 acc 75.000 (73.451)	lr 0.02111
Train [31][3230/3239]	Time 0.623 (0.912)	Data Time 0.000 (0.010)	Loss 3.0775 (3.0805)	Entropy 0.75000 (0.75445)	Top-1 acc 47.656 (50.179)	Top-5 acc 73.828 (73.447)	lr 0.02111
Train [31][3239/3239]	Time 1.570 (0.912)	Data Time 0.000 (0.010)	Loss 3.0600 (3.0807)	Entropy 0.74983 (0.75443)	Top-1 acc 49.383 (50.176)	Top-5 acc 74.074 (73.443)	lr 0.02110
==========Valid [31/120]	loss 1.798	top-1 acc 59.353 (59.353)	top-5 acc 81.647	Train top-1 50.176	top-5 73.443	Entropy 0.74983	Latency-None: 0.000ms	Flops: 539.76M
Train [32][0/3239]	Time 25.769 (25.769)	Data Time 24.428 (24.428)	Loss 2.9274 (2.9274)	Entropy 0.74959 (0.74959)	Top-1 acc 55.859 (55.859)	Top-5 acc 74.609 (74.609)	lr 0.02110
Train [32][10/3239]	Time 0.588 (3.200)	Data Time 0.001 (2.223)	Loss 3.0785 (3.0355)	Entropy 0.74935 (0.74953)	Top-1 acc 51.953 (51.491)	Top-5 acc 70.703 (73.899)	lr 0.02110
Train [32][20/3239]	Time 0.635 (2.089)	Data Time 0.030 (1.168)	Loss 3.2724 (3.0628)	Entropy 0.74940 (0.74948)	Top-1 acc 47.656 (51.042)	Top-5 acc 67.188 (73.698)	lr 0.02110
Train [32][30/3239]	Time 0.661 (1.697)	Data Time 0.001 (0.792)	Loss 2.9436 (3.0663)	Entropy 0.74956 (0.74946)	Top-1 acc 51.953 (50.844)	Top-5 acc 75.391 (73.841)	lr 0.02110
Train [32][40/3239]	Time 0.583 (1.486)	Data Time 0.001 (0.599)	Loss 3.0889 (3.0692)	Entropy 0.74946 (0.74948)	Top-1 acc 43.359 (50.457)	Top-5 acc 73.828 (73.981)	lr 0.02110
Train [32][50/3239]	Time 0.611 (1.359)	Data Time 0.001 (0.482)	Loss 2.9508 (3.0708)	Entropy 0.74937 (0.74948)	Top-1 acc 54.688 (50.437)	Top-5 acc 76.172 (73.889)	lr 0.02110
Train [32][60/3239]	Time 0.608 (1.294)	Data Time 0.001 (0.403)	Loss 2.9933 (3.0658)	Entropy 0.74934 (0.74948)	Top-1 acc 51.172 (50.429)	Top-5 acc 75.781 (74.084)	lr 0.02110
Train [32][70/3239]	Time 0.593 (1.234)	Data Time 0.001 (0.347)	Loss 3.0516 (3.0553)	Entropy 0.74924 (0.74945)	Top-1 acc 48.828 (50.671)	Top-5 acc 72.656 (74.164)	lr 0.02110
Train [32][80/3239]	Time 0.601 (1.189)	Data Time 0.001 (0.304)	Loss 3.1164 (3.0495)	Entropy 0.74946 (0.74943)	Top-1 acc 48.828 (50.733)	Top-5 acc 75.391 (74.262)	lr 0.02110
Train [32][90/3239]	Time 0.656 (1.154)	Data Time 0.001 (0.271)	Loss 3.2771 (3.0487)	Entropy 0.74934 (0.74942)	Top-1 acc 44.531 (50.786)	Top-5 acc 69.141 (74.232)	lr 0.02110
Train [32][100/3239]	Time 0.637 (1.124)	Data Time 0.001 (0.244)	Loss 3.1482 (3.0518)	Entropy 0.74922 (0.74942)	Top-1 acc 52.734 (50.808)	Top-5 acc 72.266 (74.107)	lr 0.02110
Train [32][110/3239]	Time 0.609 (1.100)	Data Time 0.003 (0.222)	Loss 2.8748 (3.0498)	Entropy 0.74922 (0.74941)	Top-1 acc 55.078 (50.845)	Top-5 acc 81.641 (74.201)	lr 0.02110
Train [32][120/3239]	Time 0.617 (1.081)	Data Time 0.001 (0.204)	Loss 3.1500 (3.0504)	Entropy 0.74903 (0.74938)	Top-1 acc 49.609 (50.936)	Top-5 acc 71.875 (74.151)	lr 0.02110
Train [32][130/3239]	Time 0.600 (1.064)	Data Time 0.001 (0.189)	Loss 3.1890 (3.0501)	Entropy 0.74918 (0.74936)	Top-1 acc 50.391 (50.990)	Top-5 acc 70.703 (74.126)	lr 0.02109
Train [32][140/3239]	Time 0.634 (1.050)	Data Time 0.001 (0.176)	Loss 3.0847 (3.0560)	Entropy 0.74948 (0.74936)	Top-1 acc 52.344 (50.790)	Top-5 acc 74.609 (74.011)	lr 0.02109
Train [32][150/3239]	Time 0.635 (1.038)	Data Time 0.001 (0.164)	Loss 3.0091 (3.0555)	Entropy 0.74950 (0.74937)	Top-1 acc 50.000 (50.797)	Top-5 acc 75.000 (74.025)	lr 0.02109
Train [32][160/3239]	Time 0.737 (1.028)	Data Time 0.001 (0.154)	Loss 2.9704 (3.0502)	Entropy 0.74956 (0.74937)	Top-1 acc 53.906 (50.912)	Top-5 acc 74.219 (74.117)	lr 0.02109
Train [32][170/3239]	Time 0.595 (1.018)	Data Time 0.001 (0.145)	Loss 2.9803 (3.0461)	Entropy 0.74955 (0.74939)	Top-1 acc 54.297 (51.021)	Top-5 acc 75.391 (74.205)	lr 0.02109
Train [32][180/3239]	Time 0.627 (1.010)	Data Time 0.001 (0.137)	Loss 2.8913 (3.0462)	Entropy 0.74971 (0.74940)	Top-1 acc 54.297 (51.027)	Top-5 acc 77.344 (74.171)	lr 0.02109
Train [32][190/3239]	Time 0.613 (1.002)	Data Time 0.001 (0.130)	Loss 2.8920 (3.0482)	Entropy 0.74993 (0.74942)	Top-1 acc 52.344 (51.014)	Top-5 acc 75.781 (74.129)	lr 0.02109
Train [32][200/3239]	Time 0.611 (0.993)	Data Time 0.001 (0.124)	Loss 3.1512 (3.0484)	Entropy 0.75037 (0.74946)	Top-1 acc 46.484 (51.042)	Top-5 acc 73.828 (74.127)	lr 0.02109
Train [32][210/3239]	Time 0.516 (0.985)	Data Time 0.002 (0.118)	Loss 2.9447 (3.0483)	Entropy 0.75040 (0.74951)	Top-1 acc 55.078 (51.092)	Top-5 acc 73.047 (74.148)	lr 0.02109
Train [32][220/3239]	Time 0.636 (0.979)	Data Time 0.002 (0.113)	Loss 3.3209 (3.0519)	Entropy 0.75046 (0.74955)	Top-1 acc 47.656 (50.976)	Top-5 acc 69.141 (74.054)	lr 0.02109
Train [32][230/3239]	Time 0.615 (0.975)	Data Time 0.001 (0.108)	Loss 3.0510 (3.0518)	Entropy 0.75035 (0.74959)	Top-1 acc 50.781 (50.996)	Top-5 acc 75.391 (74.063)	lr 0.02109
Train [32][240/3239]	Time 0.609 (0.970)	Data Time 0.001 (0.104)	Loss 3.0187 (3.0506)	Entropy 0.75016 (0.74962)	Top-1 acc 53.516 (51.047)	Top-5 acc 75.000 (74.081)	lr 0.02109
Train [32][250/3239]	Time 0.582 (0.966)	Data Time 0.001 (0.099)	Loss 3.1206 (3.0492)	Entropy 0.75005 (0.74964)	Top-1 acc 50.000 (51.114)	Top-5 acc 71.484 (74.125)	lr 0.02109
Train [32][260/3239]	Time 0.592 (0.962)	Data Time 0.001 (0.096)	Loss 3.0975 (3.0517)	Entropy 0.75036 (0.74966)	Top-1 acc 46.094 (51.021)	Top-5 acc 74.609 (74.069)	lr 0.02109
Train [32][270/3239]	Time 0.631 (0.958)	Data Time 0.002 (0.092)	Loss 3.2845 (3.0514)	Entropy 0.75024 (0.74969)	Top-1 acc 44.141 (50.984)	Top-5 acc 69.531 (74.086)	lr 0.02108
Train [32][280/3239]	Time 0.603 (0.955)	Data Time 0.001 (0.089)	Loss 2.8928 (3.0508)	Entropy 0.75010 (0.74971)	Top-1 acc 52.344 (50.973)	Top-5 acc 78.906 (74.117)	lr 0.02108
Train [32][290/3239]	Time 0.670 (0.952)	Data Time 0.001 (0.086)	Loss 3.0232 (3.0468)	Entropy 0.74999 (0.74972)	Top-1 acc 49.219 (51.071)	Top-5 acc 72.266 (74.200)	lr 0.02108
Train [32][300/3239]	Time 0.616 (0.949)	Data Time 0.001 (0.083)	Loss 3.1414 (3.0470)	Entropy 0.75006 (0.74973)	Top-1 acc 51.172 (51.054)	Top-5 acc 74.219 (74.203)	lr 0.02108
Train [32][310/3239]	Time 0.623 (0.946)	Data Time 0.001 (0.081)	Loss 2.8776 (3.0483)	Entropy 0.75030 (0.74974)	Top-1 acc 52.734 (51.029)	Top-5 acc 78.125 (74.160)	lr 0.02108
Train [32][320/3239]	Time 0.680 (0.944)	Data Time 0.001 (0.078)	Loss 3.0072 (3.0512)	Entropy 0.75031 (0.74976)	Top-1 acc 50.391 (50.976)	Top-5 acc 75.781 (74.080)	lr 0.02108
Train [32][330/3239]	Time 0.632 (0.942)	Data Time 0.001 (0.076)	Loss 2.9763 (3.0496)	Entropy 0.75055 (0.74978)	Top-1 acc 52.734 (51.017)	Top-5 acc 77.344 (74.118)	lr 0.02108
Train [32][340/3239]	Time 0.600 (0.939)	Data Time 0.001 (0.074)	Loss 3.0094 (3.0500)	Entropy 0.75077 (0.74980)	Top-1 acc 50.000 (51.012)	Top-5 acc 74.219 (74.101)	lr 0.02108
Train [32][350/3239]	Time 0.592 (0.937)	Data Time 0.001 (0.072)	Loss 3.1915 (3.0496)	Entropy 0.75059 (0.74983)	Top-1 acc 48.438 (50.997)	Top-5 acc 73.047 (74.135)	lr 0.02108
Train [32][360/3239]	Time 0.615 (0.935)	Data Time 0.001 (0.070)	Loss 3.1314 (3.0486)	Entropy 0.75042 (0.74985)	Top-1 acc 49.609 (51.012)	Top-5 acc 72.656 (74.146)	lr 0.02108
Train [32][370/3239]	Time 0.561 (0.932)	Data Time 0.001 (0.068)	Loss 2.9612 (3.0489)	Entropy 0.75005 (0.74986)	Top-1 acc 56.641 (51.027)	Top-5 acc 76.172 (74.117)	lr 0.02108
Train [32][380/3239]	Time 0.598 (0.929)	Data Time 0.001 (0.066)	Loss 2.9008 (3.0490)	Entropy 0.74955 (0.74986)	Top-1 acc 52.344 (51.001)	Top-5 acc 78.516 (74.104)	lr 0.02108
Train [32][390/3239]	Time 0.721 (0.928)	Data Time 0.001 (0.065)	Loss 3.1906 (3.0500)	Entropy 0.74932 (0.74985)	Top-1 acc 48.828 (50.979)	Top-5 acc 70.703 (74.076)	lr 0.02108
Train [32][400/3239]	Time 0.747 (0.988)	Data Time 0.004 (0.063)	Loss 2.9772 (3.0487)	Entropy 0.74880 (0.74983)	Top-1 acc 51.953 (50.998)	Top-5 acc 77.734 (74.127)	lr 0.02108
Train [32][410/3239]	Time 0.617 (0.986)	Data Time 0.002 (0.062)	Loss 3.0775 (3.0486)	Entropy 0.74835 (0.74980)	Top-1 acc 52.344 (50.986)	Top-5 acc 73.047 (74.116)	lr 0.02107
Train [32][420/3239]	Time 0.650 (0.983)	Data Time 0.002 (0.060)	Loss 3.1670 (3.0488)	Entropy 0.74862 (0.74977)	Top-1 acc 44.141 (50.963)	Top-5 acc 69.922 (74.095)	lr 0.02107
Train [32][430/3239]	Time 0.628 (0.980)	Data Time 0.001 (0.059)	Loss 3.1715 (3.0509)	Entropy 0.74926 (0.74975)	Top-1 acc 44.531 (50.887)	Top-5 acc 72.266 (74.074)	lr 0.02107
Train [32][440/3239]	Time 0.583 (0.977)	Data Time 0.001 (0.057)	Loss 3.1473 (3.0508)	Entropy 0.74910 (0.74974)	Top-1 acc 45.703 (50.872)	Top-5 acc 73.438 (74.091)	lr 0.02107
Train [32][450/3239]	Time 0.633 (0.975)	Data Time 0.001 (0.056)	Loss 3.0245 (3.0514)	Entropy 0.74934 (0.74972)	Top-1 acc 48.828 (50.845)	Top-5 acc 77.344 (74.074)	lr 0.02107
Train [32][460/3239]	Time 0.600 (0.973)	Data Time 0.001 (0.055)	Loss 3.0688 (3.0522)	Entropy 0.74940 (0.74972)	Top-1 acc 50.781 (50.846)	Top-5 acc 77.344 (74.067)	lr 0.02107
Train [32][470/3239]	Time 0.647 (0.970)	Data Time 0.002 (0.054)	Loss 2.8678 (3.0540)	Entropy 0.74962 (0.74971)	Top-1 acc 53.125 (50.797)	Top-5 acc 78.906 (74.021)	lr 0.02107
Train [32][480/3239]	Time 0.671 (0.967)	Data Time 0.001 (0.053)	Loss 3.3234 (3.0543)	Entropy 0.74950 (0.74971)	Top-1 acc 44.141 (50.774)	Top-5 acc 70.312 (74.007)	lr 0.02107
Train [32][490/3239]	Time 0.465 (0.964)	Data Time 0.001 (0.052)	Loss 3.1941 (3.0533)	Entropy 0.74931 (0.74970)	Top-1 acc 45.703 (50.784)	Top-5 acc 67.578 (74.017)	lr 0.02107
Train [32][500/3239]	Time 0.597 (0.962)	Data Time 0.001 (0.051)	Loss 3.0438 (3.0538)	Entropy 0.74921 (0.74969)	Top-1 acc 52.734 (50.774)	Top-5 acc 74.219 (74.005)	lr 0.02107
Train [32][510/3239]	Time 0.601 (0.960)	Data Time 0.001 (0.050)	Loss 3.1021 (3.0526)	Entropy 0.74927 (0.74968)	Top-1 acc 51.172 (50.803)	Top-5 acc 75.391 (74.036)	lr 0.02107
Train [32][520/3239]	Time 0.603 (0.959)	Data Time 0.001 (0.049)	Loss 2.8450 (3.0514)	Entropy 0.74892 (0.74967)	Top-1 acc 55.469 (50.828)	Top-5 acc 76.172 (74.057)	lr 0.02107
Train [32][530/3239]	Time 0.611 (0.957)	Data Time 0.001 (0.048)	Loss 3.0117 (3.0506)	Entropy 0.74877 (0.74966)	Top-1 acc 51.172 (50.845)	Top-5 acc 74.219 (74.086)	lr 0.02107
Train [32][540/3239]	Time 0.627 (0.955)	Data Time 0.001 (0.047)	Loss 2.9366 (3.0508)	Entropy 0.74869 (0.74964)	Top-1 acc 51.953 (50.846)	Top-5 acc 77.734 (74.088)	lr 0.02106
Train [32][550/3239]	Time 0.684 (0.953)	Data Time 0.001 (0.046)	Loss 3.1071 (3.0526)	Entropy 0.74862 (0.74962)	Top-1 acc 48.828 (50.826)	Top-5 acc 69.531 (74.050)	lr 0.02106
Train [32][560/3239]	Time 0.658 (0.952)	Data Time 0.001 (0.046)	Loss 3.0394 (3.0534)	Entropy 0.74861 (0.74961)	Top-1 acc 53.125 (50.816)	Top-5 acc 74.609 (74.029)	lr 0.02106
Train [32][570/3239]	Time 0.600 (0.951)	Data Time 0.001 (0.045)	Loss 2.9556 (3.0539)	Entropy 0.74857 (0.74959)	Top-1 acc 55.078 (50.819)	Top-5 acc 75.391 (74.014)	lr 0.02106
Train [32][580/3239]	Time 0.636 (0.949)	Data Time 0.002 (0.044)	Loss 2.9232 (3.0536)	Entropy 0.74882 (0.74957)	Top-1 acc 51.172 (50.815)	Top-5 acc 75.781 (74.019)	lr 0.02106
Train [32][590/3239]	Time 0.606 (0.948)	Data Time 0.001 (0.043)	Loss 2.8262 (3.0528)	Entropy 0.74861 (0.74956)	Top-1 acc 53.906 (50.836)	Top-5 acc 80.078 (74.049)	lr 0.02106
Train [32][600/3239]	Time 0.644 (0.946)	Data Time 0.001 (0.043)	Loss 3.0914 (3.0522)	Entropy 0.74773 (0.74954)	Top-1 acc 49.219 (50.856)	Top-5 acc 74.219 (74.061)	lr 0.02106
Train [32][610/3239]	Time 0.609 (0.945)	Data Time 0.001 (0.042)	Loss 2.8789 (3.0515)	Entropy 0.74772 (0.74951)	Top-1 acc 54.297 (50.870)	Top-5 acc 78.125 (74.083)	lr 0.02106
Train [32][620/3239]	Time 0.629 (0.944)	Data Time 0.001 (0.041)	Loss 3.0039 (3.0521)	Entropy 0.74764 (0.74948)	Top-1 acc 51.562 (50.857)	Top-5 acc 74.219 (74.078)	lr 0.02106
Train [32][630/3239]	Time 0.602 (0.942)	Data Time 0.001 (0.041)	Loss 3.1685 (3.0518)	Entropy 0.74750 (0.74945)	Top-1 acc 51.562 (50.866)	Top-5 acc 70.312 (74.101)	lr 0.02106
Train [32][640/3239]	Time 0.571 (0.941)	Data Time 0.001 (0.040)	Loss 3.2524 (3.0518)	Entropy 0.74784 (0.74942)	Top-1 acc 46.875 (50.871)	Top-5 acc 70.703 (74.102)	lr 0.02106
Train [32][650/3239]	Time 0.610 (0.939)	Data Time 0.001 (0.040)	Loss 3.1434 (3.0513)	Entropy 0.74763 (0.74940)	Top-1 acc 48.828 (50.892)	Top-5 acc 73.438 (74.114)	lr 0.02106
Train [32][660/3239]	Time 0.605 (0.938)	Data Time 0.001 (0.039)	Loss 2.9690 (3.0507)	Entropy 0.74724 (0.74937)	Top-1 acc 51.172 (50.894)	Top-5 acc 75.391 (74.130)	lr 0.02106
Train [32][670/3239]	Time 0.640 (0.937)	Data Time 0.001 (0.038)	Loss 2.9141 (3.0503)	Entropy 0.74682 (0.74934)	Top-1 acc 52.734 (50.910)	Top-5 acc 75.781 (74.127)	lr 0.02106
Train [32][680/3239]	Time 0.624 (0.936)	Data Time 0.001 (0.038)	Loss 3.1341 (3.0505)	Entropy 0.74720 (0.74930)	Top-1 acc 47.266 (50.900)	Top-5 acc 71.875 (74.121)	lr 0.02105
Train [32][690/3239]	Time 0.631 (0.935)	Data Time 0.001 (0.037)	Loss 3.0400 (3.0502)	Entropy 0.74729 (0.74927)	Top-1 acc 53.906 (50.904)	Top-5 acc 72.266 (74.119)	lr 0.02105
Train [32][700/3239]	Time 0.585 (0.933)	Data Time 0.001 (0.037)	Loss 3.2342 (3.0512)	Entropy 0.74690 (0.74924)	Top-1 acc 48.828 (50.873)	Top-5 acc 71.094 (74.113)	lr 0.02105
Train [32][710/3239]	Time 0.698 (0.933)	Data Time 0.001 (0.036)	Loss 2.9506 (3.0514)	Entropy 0.74696 (0.74921)	Top-1 acc 49.219 (50.859)	Top-5 acc 73.828 (74.115)	lr 0.02105
Train [32][720/3239]	Time 0.623 (0.932)	Data Time 0.001 (0.036)	Loss 3.1034 (3.0511)	Entropy 0.74689 (0.74918)	Top-1 acc 50.391 (50.869)	Top-5 acc 71.094 (74.127)	lr 0.02105
Train [32][730/3239]	Time 0.572 (0.931)	Data Time 0.001 (0.035)	Loss 3.0465 (3.0519)	Entropy 0.74645 (0.74914)	Top-1 acc 51.562 (50.837)	Top-5 acc 73.438 (74.111)	lr 0.02105
Train [32][740/3239]	Time 0.632 (0.930)	Data Time 0.001 (0.035)	Loss 2.7584 (3.0520)	Entropy 0.74665 (0.74911)	Top-1 acc 51.953 (50.832)	Top-5 acc 80.469 (74.100)	lr 0.02105
Train [32][750/3239]	Time 0.612 (0.929)	Data Time 0.001 (0.035)	Loss 2.9847 (3.0529)	Entropy 0.74698 (0.74908)	Top-1 acc 50.391 (50.804)	Top-5 acc 76.172 (74.081)	lr 0.02105
Train [32][760/3239]	Time 0.601 (0.928)	Data Time 0.001 (0.034)	Loss 2.8404 (3.0530)	Entropy 0.74733 (0.74905)	Top-1 acc 57.031 (50.811)	Top-5 acc 77.734 (74.071)	lr 0.02105
Train [32][770/3239]	Time 0.591 (0.928)	Data Time 0.001 (0.034)	Loss 3.1116 (3.0524)	Entropy 0.74737 (0.74903)	Top-1 acc 49.609 (50.826)	Top-5 acc 73.828 (74.074)	lr 0.02105
Train [32][780/3239]	Time 0.609 (0.927)	Data Time 0.001 (0.033)	Loss 2.8977 (3.0510)	Entropy 0.74733 (0.74901)	Top-1 acc 51.562 (50.853)	Top-5 acc 78.125 (74.103)	lr 0.02105
Train [32][790/3239]	Time 0.705 (0.926)	Data Time 0.001 (0.033)	Loss 3.1367 (3.0506)	Entropy 0.74715 (0.74899)	Top-1 acc 51.953 (50.865)	Top-5 acc 73.047 (74.127)	lr 0.02105
Train [32][800/3239]	Time 0.634 (0.925)	Data Time 0.001 (0.033)	Loss 3.0059 (3.0510)	Entropy 0.74714 (0.74896)	Top-1 acc 57.031 (50.856)	Top-5 acc 76.562 (74.121)	lr 0.02105
Train [32][810/3239]	Time 0.576 (0.924)	Data Time 0.001 (0.032)	Loss 3.1758 (3.0514)	Entropy 0.74683 (0.74894)	Top-1 acc 47.266 (50.844)	Top-5 acc 69.531 (74.111)	lr 0.02104
Train [32][820/3239]	Time 0.598 (0.922)	Data Time 0.001 (0.032)	Loss 3.0008 (3.0511)	Entropy 0.74720 (0.74892)	Top-1 acc 51.953 (50.864)	Top-5 acc 76.172 (74.114)	lr 0.02104
Train [32][830/3239]	Time 0.626 (0.921)	Data Time 0.001 (0.031)	Loss 2.8767 (3.0510)	Entropy 0.74707 (0.74889)	Top-1 acc 56.641 (50.859)	Top-5 acc 78.125 (74.121)	lr 0.02104
Train [32][840/3239]	Time 0.578 (0.921)	Data Time 0.001 (0.031)	Loss 2.7599 (3.0510)	Entropy 0.74650 (0.74887)	Top-1 acc 55.078 (50.856)	Top-5 acc 81.641 (74.127)	lr 0.02104
Train [32][850/3239]	Time 0.619 (0.920)	Data Time 0.001 (0.031)	Loss 3.0547 (3.0511)	Entropy 0.74650 (0.74884)	Top-1 acc 53.125 (50.852)	Top-5 acc 75.391 (74.119)	lr 0.02104
Train [32][860/3239]	Time 0.624 (0.920)	Data Time 0.001 (0.030)	Loss 3.1178 (3.0506)	Entropy 0.74638 (0.74881)	Top-1 acc 49.609 (50.857)	Top-5 acc 74.219 (74.131)	lr 0.02104
Train [32][870/3239]	Time 0.694 (0.919)	Data Time 0.001 (0.030)	Loss 3.0590 (3.0504)	Entropy 0.74649 (0.74879)	Top-1 acc 52.344 (50.866)	Top-5 acc 75.000 (74.138)	lr 0.02104
Train [32][880/3239]	Time 0.602 (0.918)	Data Time 0.001 (0.030)	Loss 3.4110 (3.0509)	Entropy 0.74653 (0.74876)	Top-1 acc 42.578 (50.855)	Top-5 acc 69.141 (74.128)	lr 0.02104
Train [32][890/3239]	Time 0.554 (0.918)	Data Time 0.001 (0.029)	Loss 2.8613 (3.0509)	Entropy 0.74628 (0.74873)	Top-1 acc 55.078 (50.851)	Top-5 acc 80.859 (74.135)	lr 0.02104
Train [32][900/3239]	Time 0.601 (0.917)	Data Time 0.001 (0.029)	Loss 2.7739 (3.0507)	Entropy 0.74667 (0.74871)	Top-1 acc 57.812 (50.850)	Top-5 acc 80.469 (74.142)	lr 0.02104
Train [32][910/3239]	Time 0.642 (0.917)	Data Time 0.001 (0.029)	Loss 3.1296 (3.0502)	Entropy 0.74656 (0.74869)	Top-1 acc 47.656 (50.865)	Top-5 acc 75.391 (74.142)	lr 0.02104
Train [32][920/3239]	Time 0.606 (0.916)	Data Time 0.001 (0.029)	Loss 2.9636 (3.0502)	Entropy 0.74635 (0.74866)	Top-1 acc 53.125 (50.867)	Top-5 acc 79.297 (74.146)	lr 0.02104
Train [32][930/3239]	Time 0.620 (0.916)	Data Time 0.001 (0.028)	Loss 3.0206 (3.0502)	Entropy 0.74613 (0.74864)	Top-1 acc 51.562 (50.872)	Top-5 acc 75.781 (74.156)	lr 0.02104
Train [32][940/3239]	Time 0.628 (0.915)	Data Time 0.001 (0.028)	Loss 2.9350 (3.0501)	Entropy 0.74611 (0.74861)	Top-1 acc 52.344 (50.875)	Top-5 acc 76.172 (74.144)	lr 0.02104
Train [32][950/3239]	Time 0.635 (0.915)	Data Time 0.001 (0.028)	Loss 2.9898 (3.0494)	Entropy 0.74658 (0.74858)	Top-1 acc 55.078 (50.907)	Top-5 acc 76.562 (74.152)	lr 0.02103
Train [32][960/3239]	Time 0.631 (0.914)	Data Time 0.003 (0.027)	Loss 2.9971 (3.0495)	Entropy 0.74666 (0.74856)	Top-1 acc 50.391 (50.901)	Top-5 acc 74.609 (74.141)	lr 0.02103
Train [32][970/3239]	Time 0.605 (0.914)	Data Time 0.001 (0.027)	Loss 3.0342 (3.0502)	Entropy 0.74688 (0.74855)	Top-1 acc 51.562 (50.891)	Top-5 acc 75.000 (74.122)	lr 0.02103
Train [32][980/3239]	Time 0.610 (0.913)	Data Time 0.002 (0.027)	Loss 2.9402 (3.0502)	Entropy 0.74703 (0.74853)	Top-1 acc 53.125 (50.890)	Top-5 acc 77.734 (74.120)	lr 0.02103
Train [32][990/3239]	Time 0.613 (0.912)	Data Time 0.001 (0.027)	Loss 3.0085 (3.0502)	Entropy 0.74668 (0.74851)	Top-1 acc 55.469 (50.891)	Top-5 acc 73.047 (74.119)	lr 0.02103
Train [32][1000/3239]	Time 0.631 (0.911)	Data Time 0.001 (0.026)	Loss 3.2009 (3.0502)	Entropy 0.74693 (0.74850)	Top-1 acc 49.219 (50.896)	Top-5 acc 69.141 (74.111)	lr 0.02103
Train [32][1010/3239]	Time 0.584 (0.911)	Data Time 0.001 (0.026)	Loss 2.9784 (3.0508)	Entropy 0.74690 (0.74848)	Top-1 acc 55.859 (50.881)	Top-5 acc 75.000 (74.101)	lr 0.02103
Train [32][1020/3239]	Time 0.653 (0.910)	Data Time 0.001 (0.026)	Loss 3.2359 (3.0509)	Entropy 0.74682 (0.74846)	Top-1 acc 46.094 (50.886)	Top-5 acc 68.750 (74.103)	lr 0.02103
Train [32][1030/3239]	Time 0.709 (0.910)	Data Time 0.002 (0.026)	Loss 3.2481 (3.0512)	Entropy 0.74661 (0.74845)	Top-1 acc 48.047 (50.880)	Top-5 acc 73.438 (74.094)	lr 0.02103
Train [32][1040/3239]	Time 0.594 (0.909)	Data Time 0.001 (0.025)	Loss 3.1500 (3.0517)	Entropy 0.74635 (0.74843)	Top-1 acc 48.828 (50.870)	Top-5 acc 71.875 (74.086)	lr 0.02103
Train [32][1050/3239]	Time 0.606 (0.909)	Data Time 0.001 (0.025)	Loss 2.9043 (3.0518)	Entropy 0.74611 (0.74841)	Top-1 acc 52.344 (50.863)	Top-5 acc 78.125 (74.087)	lr 0.02103
Train [32][1060/3239]	Time 0.618 (0.933)	Data Time 0.002 (0.025)	Loss 3.1159 (3.0515)	Entropy 0.74635 (0.74839)	Top-1 acc 53.516 (50.882)	Top-5 acc 71.094 (74.093)	lr 0.02103
Train [32][1070/3239]	Time 0.599 (0.932)	Data Time 0.002 (0.025)	Loss 3.0087 (3.0520)	Entropy 0.74600 (0.74837)	Top-1 acc 51.172 (50.867)	Top-5 acc 75.391 (74.087)	lr 0.02103
Train [32][1080/3239]	Time 0.579 (0.932)	Data Time 0.002 (0.025)	Loss 3.2009 (3.0527)	Entropy 0.74604 (0.74835)	Top-1 acc 46.875 (50.843)	Top-5 acc 71.094 (74.071)	lr 0.02102
Train [32][1090/3239]	Time 0.545 (0.931)	Data Time 0.001 (0.024)	Loss 3.1415 (3.0528)	Entropy 0.74579 (0.74832)	Top-1 acc 48.438 (50.832)	Top-5 acc 74.219 (74.079)	lr 0.02102
Train [32][1100/3239]	Time 0.598 (0.930)	Data Time 0.002 (0.024)	Loss 3.0906 (3.0524)	Entropy 0.74590 (0.74830)	Top-1 acc 50.000 (50.834)	Top-5 acc 76.172 (74.088)	lr 0.02102
Train [32][1110/3239]	Time 0.615 (0.929)	Data Time 0.001 (0.024)	Loss 3.0197 (3.0522)	Entropy 0.74614 (0.74828)	Top-1 acc 54.688 (50.844)	Top-5 acc 75.781 (74.100)	lr 0.02102
Train [32][1120/3239]	Time 0.616 (0.929)	Data Time 0.001 (0.024)	Loss 3.0538 (3.0520)	Entropy 0.74633 (0.74826)	Top-1 acc 52.344 (50.850)	Top-5 acc 73.047 (74.103)	lr 0.02102
Train [32][1130/3239]	Time 0.636 (0.928)	Data Time 0.001 (0.024)	Loss 3.1390 (3.0522)	Entropy 0.74586 (0.74824)	Top-1 acc 48.828 (50.853)	Top-5 acc 71.484 (74.094)	lr 0.02102
Train [32][1140/3239]	Time 0.576 (0.928)	Data Time 0.001 (0.023)	Loss 3.1199 (3.0524)	Entropy 0.74618 (0.74822)	Top-1 acc 49.219 (50.845)	Top-5 acc 73.828 (74.091)	lr 0.02102
Train [32][1150/3239]	Time 0.582 (0.927)	Data Time 0.001 (0.023)	Loss 3.1855 (3.0522)	Entropy 0.74529 (0.74820)	Top-1 acc 48.438 (50.845)	Top-5 acc 71.484 (74.093)	lr 0.02102
Train [32][1160/3239]	Time 0.604 (0.927)	Data Time 0.001 (0.023)	Loss 2.9512 (3.0519)	Entropy 0.74552 (0.74818)	Top-1 acc 52.344 (50.852)	Top-5 acc 73.438 (74.093)	lr 0.02102
Train [32][1170/3239]	Time 0.581 (0.926)	Data Time 0.001 (0.023)	Loss 3.2430 (3.0521)	Entropy 0.74512 (0.74815)	Top-1 acc 46.094 (50.851)	Top-5 acc 70.312 (74.086)	lr 0.02102
Train [32][1180/3239]	Time 0.587 (0.926)	Data Time 0.001 (0.023)	Loss 3.0674 (3.0525)	Entropy 0.74529 (0.74813)	Top-1 acc 46.484 (50.844)	Top-5 acc 74.609 (74.074)	lr 0.02102
Train [32][1190/3239]	Time 0.701 (0.925)	Data Time 0.001 (0.023)	Loss 3.0610 (3.0524)	Entropy 0.74555 (0.74811)	Top-1 acc 50.781 (50.842)	Top-5 acc 72.656 (74.073)	lr 0.02102
Train [32][1200/3239]	Time 0.616 (0.925)	Data Time 0.001 (0.022)	Loss 3.0234 (3.0523)	Entropy 0.74562 (0.74809)	Top-1 acc 54.297 (50.845)	Top-5 acc 72.266 (74.080)	lr 0.02102
Train [32][1210/3239]	Time 0.591 (0.924)	Data Time 0.001 (0.022)	Loss 3.0250 (3.0526)	Entropy 0.74549 (0.74807)	Top-1 acc 50.781 (50.838)	Top-5 acc 73.828 (74.070)	lr 0.02102
Train [32][1220/3239]	Time 0.598 (0.924)	Data Time 0.001 (0.022)	Loss 3.2587 (3.0526)	Entropy 0.74555 (0.74804)	Top-1 acc 44.531 (50.829)	Top-5 acc 69.922 (74.076)	lr 0.02101
Train [32][1230/3239]	Time 0.615 (0.923)	Data Time 0.001 (0.022)	Loss 3.0912 (3.0527)	Entropy 0.74568 (0.74802)	Top-1 acc 47.656 (50.815)	Top-5 acc 74.609 (74.073)	lr 0.02101
Train [32][1240/3239]	Time 0.614 (0.923)	Data Time 0.001 (0.022)	Loss 2.8366 (3.0529)	Entropy 0.74541 (0.74800)	Top-1 acc 58.203 (50.809)	Top-5 acc 78.906 (74.076)	lr 0.02101
Train [32][1250/3239]	Time 0.620 (0.922)	Data Time 0.001 (0.022)	Loss 3.1719 (3.0530)	Entropy 0.74499 (0.74798)	Top-1 acc 51.172 (50.803)	Top-5 acc 71.875 (74.075)	lr 0.02101
Train [32][1260/3239]	Time 0.717 (0.921)	Data Time 0.001 (0.021)	Loss 3.0596 (3.0527)	Entropy 0.74526 (0.74796)	Top-1 acc 51.562 (50.813)	Top-5 acc 74.609 (74.077)	lr 0.02101
Train [32][1270/3239]	Time 0.615 (0.921)	Data Time 0.001 (0.021)	Loss 2.9740 (3.0530)	Entropy 0.74515 (0.74794)	Top-1 acc 54.688 (50.816)	Top-5 acc 76.562 (74.074)	lr 0.02101
Train [32][1280/3239]	Time 0.573 (0.920)	Data Time 0.001 (0.021)	Loss 3.1397 (3.0529)	Entropy 0.74503 (0.74792)	Top-1 acc 52.734 (50.825)	Top-5 acc 71.484 (74.073)	lr 0.02101
Train [32][1290/3239]	Time 0.608 (0.920)	Data Time 0.001 (0.021)	Loss 3.1018 (3.0528)	Entropy 0.74529 (0.74790)	Top-1 acc 49.609 (50.825)	Top-5 acc 73.438 (74.077)	lr 0.02101
Train [32][1300/3239]	Time 0.602 (0.919)	Data Time 0.001 (0.021)	Loss 3.1644 (3.0525)	Entropy 0.74496 (0.74787)	Top-1 acc 47.656 (50.826)	Top-5 acc 72.266 (74.077)	lr 0.02101
Train [32][1310/3239]	Time 0.617 (0.919)	Data Time 0.001 (0.021)	Loss 3.0867 (3.0525)	Entropy 0.74476 (0.74785)	Top-1 acc 51.953 (50.824)	Top-5 acc 71.484 (74.070)	lr 0.02101
Train [32][1320/3239]	Time 0.602 (0.919)	Data Time 0.001 (0.020)	Loss 3.1688 (3.0528)	Entropy 0.74469 (0.74783)	Top-1 acc 50.391 (50.820)	Top-5 acc 73.828 (74.071)	lr 0.02101
Train [32][1330/3239]	Time 0.619 (0.918)	Data Time 0.001 (0.020)	Loss 2.9358 (3.0532)	Entropy 0.74476 (0.74780)	Top-1 acc 53.906 (50.809)	Top-5 acc 76.172 (74.063)	lr 0.02101
Train [32][1340/3239]	Time 0.609 (0.918)	Data Time 0.001 (0.020)	Loss 3.1273 (3.0532)	Entropy 0.74479 (0.74778)	Top-1 acc 49.219 (50.811)	Top-5 acc 73.828 (74.064)	lr 0.02101
Train [32][1350/3239]	Time 0.698 (0.918)	Data Time 0.001 (0.020)	Loss 3.1412 (3.0533)	Entropy 0.74467 (0.74776)	Top-1 acc 46.484 (50.802)	Top-5 acc 72.266 (74.066)	lr 0.02101
Train [32][1360/3239]	Time 0.611 (0.917)	Data Time 0.001 (0.020)	Loss 3.0958 (3.0535)	Entropy 0.74414 (0.74774)	Top-1 acc 51.953 (50.798)	Top-5 acc 71.875 (74.059)	lr 0.02100
Train [32][1370/3239]	Time 0.599 (0.917)	Data Time 0.001 (0.020)	Loss 3.0994 (3.0537)	Entropy 0.74394 (0.74771)	Top-1 acc 49.609 (50.793)	Top-5 acc 73.047 (74.047)	lr 0.02100
Train [32][1380/3239]	Time 0.592 (0.916)	Data Time 0.001 (0.020)	Loss 3.0196 (3.0536)	Entropy 0.74423 (0.74768)	Top-1 acc 50.781 (50.792)	Top-5 acc 74.609 (74.050)	lr 0.02100
Train [32][1390/3239]	Time 0.586 (0.916)	Data Time 0.001 (0.020)	Loss 3.2120 (3.0540)	Entropy 0.74422 (0.74766)	Top-1 acc 44.922 (50.785)	Top-5 acc 69.531 (74.038)	lr 0.02100
Train [32][1400/3239]	Time 0.601 (0.916)	Data Time 0.001 (0.019)	Loss 3.0799 (3.0541)	Entropy 0.74409 (0.74763)	Top-1 acc 51.172 (50.780)	Top-5 acc 73.047 (74.037)	lr 0.02100
Train [32][1410/3239]	Time 0.559 (0.915)	Data Time 0.001 (0.019)	Loss 2.9343 (3.0540)	Entropy 0.74354 (0.74761)	Top-1 acc 55.859 (50.775)	Top-5 acc 73.438 (74.035)	lr 0.02100
Train [32][1420/3239]	Time 0.674 (0.915)	Data Time 0.001 (0.019)	Loss 2.8807 (3.0536)	Entropy 0.74354 (0.74758)	Top-1 acc 54.297 (50.788)	Top-5 acc 76.953 (74.043)	lr 0.02100
Train [32][1430/3239]	Time 0.610 (0.914)	Data Time 0.001 (0.019)	Loss 3.0267 (3.0536)	Entropy 0.74398 (0.74755)	Top-1 acc 50.000 (50.780)	Top-5 acc 75.391 (74.039)	lr 0.02100
Train [32][1440/3239]	Time 0.636 (0.914)	Data Time 0.001 (0.019)	Loss 3.1631 (3.0538)	Entropy 0.74385 (0.74753)	Top-1 acc 51.172 (50.775)	Top-5 acc 72.266 (74.035)	lr 0.02100
Train [32][1450/3239]	Time 0.586 (0.913)	Data Time 0.001 (0.019)	Loss 3.3507 (3.0542)	Entropy 0.74397 (0.74750)	Top-1 acc 44.531 (50.765)	Top-5 acc 68.750 (74.036)	lr 0.02100
Train [32][1460/3239]	Time 0.582 (0.913)	Data Time 0.001 (0.019)	Loss 3.1662 (3.0541)	Entropy 0.74388 (0.74748)	Top-1 acc 49.219 (50.767)	Top-5 acc 70.312 (74.030)	lr 0.02100
Train [32][1470/3239]	Time 0.603 (0.913)	Data Time 0.001 (0.019)	Loss 3.0384 (3.0537)	Entropy 0.74398 (0.74745)	Top-1 acc 53.906 (50.774)	Top-5 acc 73.047 (74.039)	lr 0.02100
Train [32][1480/3239]	Time 0.611 (0.912)	Data Time 0.001 (0.018)	Loss 3.0497 (3.0537)	Entropy 0.74393 (0.74743)	Top-1 acc 51.172 (50.773)	Top-5 acc 75.391 (74.039)	lr 0.02100
Train [32][1490/3239]	Time 0.589 (0.912)	Data Time 0.001 (0.018)	Loss 3.2148 (3.0540)	Entropy 0.74351 (0.74740)	Top-1 acc 47.656 (50.759)	Top-5 acc 72.266 (74.036)	lr 0.02099
Train [32][1500/3239]	Time 0.581 (0.912)	Data Time 0.001 (0.018)	Loss 2.8517 (3.0540)	Entropy 0.74342 (0.74738)	Top-1 acc 53.906 (50.760)	Top-5 acc 75.781 (74.037)	lr 0.02099
Train [32][1510/3239]	Time 0.579 (0.911)	Data Time 0.001 (0.018)	Loss 3.0449 (3.0537)	Entropy 0.74337 (0.74735)	Top-1 acc 49.609 (50.768)	Top-5 acc 71.875 (74.037)	lr 0.02099
Train [32][1520/3239]	Time 0.588 (0.911)	Data Time 0.001 (0.018)	Loss 3.1697 (3.0537)	Entropy 0.74374 (0.74733)	Top-1 acc 51.172 (50.768)	Top-5 acc 75.781 (74.035)	lr 0.02099
Train [32][1530/3239]	Time 0.566 (0.911)	Data Time 0.001 (0.018)	Loss 3.3187 (3.0540)	Entropy 0.74356 (0.74730)	Top-1 acc 44.531 (50.761)	Top-5 acc 67.969 (74.032)	lr 0.02099
Train [32][1540/3239]	Time 0.596 (0.910)	Data Time 0.001 (0.018)	Loss 3.3398 (3.0536)	Entropy 0.74357 (0.74728)	Top-1 acc 49.219 (50.779)	Top-5 acc 68.359 (74.035)	lr 0.02099
Train [32][1550/3239]	Time 0.600 (0.910)	Data Time 0.001 (0.018)	Loss 3.2448 (3.0537)	Entropy 0.74371 (0.74726)	Top-1 acc 48.438 (50.782)	Top-5 acc 71.875 (74.038)	lr 0.02099
Train [32][1560/3239]	Time 0.615 (0.910)	Data Time 0.001 (0.018)	Loss 3.1567 (3.0539)	Entropy 0.74366 (0.74723)	Top-1 acc 47.266 (50.777)	Top-5 acc 72.656 (74.037)	lr 0.02099
Train [32][1570/3239]	Time 0.610 (0.909)	Data Time 0.001 (0.018)	Loss 3.1025 (3.0536)	Entropy 0.74352 (0.74721)	Top-1 acc 50.000 (50.785)	Top-5 acc 70.703 (74.039)	lr 0.02099
Train [32][1580/3239]	Time 0.705 (0.909)	Data Time 0.001 (0.017)	Loss 3.0388 (3.0537)	Entropy 0.74387 (0.74719)	Top-1 acc 50.391 (50.784)	Top-5 acc 73.828 (74.039)	lr 0.02099
Train [32][1590/3239]	Time 0.582 (0.908)	Data Time 0.001 (0.017)	Loss 3.0892 (3.0538)	Entropy 0.74399 (0.74717)	Top-1 acc 50.000 (50.784)	Top-5 acc 73.438 (74.033)	lr 0.02099
Train [32][1600/3239]	Time 0.620 (0.908)	Data Time 0.001 (0.017)	Loss 2.9359 (3.0537)	Entropy 0.74399 (0.74715)	Top-1 acc 52.734 (50.781)	Top-5 acc 78.906 (74.033)	lr 0.02099
Train [32][1610/3239]	Time 0.612 (0.908)	Data Time 0.001 (0.017)	Loss 3.1040 (3.0534)	Entropy 0.74411 (0.74713)	Top-1 acc 53.516 (50.790)	Top-5 acc 73.438 (74.036)	lr 0.02099
Train [32][1620/3239]	Time 0.618 (0.908)	Data Time 0.001 (0.017)	Loss 3.0015 (3.0530)	Entropy 0.74455 (0.74711)	Top-1 acc 52.344 (50.802)	Top-5 acc 72.266 (74.044)	lr 0.02099
Train [32][1630/3239]	Time 0.642 (0.907)	Data Time 0.001 (0.017)	Loss 3.0207 (3.0527)	Entropy 0.74413 (0.74709)	Top-1 acc 51.172 (50.807)	Top-5 acc 76.953 (74.052)	lr 0.02098
Train [32][1640/3239]	Time 0.629 (0.907)	Data Time 0.001 (0.017)	Loss 3.1182 (3.0531)	Entropy 0.74408 (0.74708)	Top-1 acc 48.438 (50.793)	Top-5 acc 73.438 (74.046)	lr 0.02098
Train [32][1650/3239]	Time 0.691 (0.907)	Data Time 0.001 (0.017)	Loss 3.3155 (3.0530)	Entropy 0.74408 (0.74706)	Top-1 acc 47.656 (50.800)	Top-5 acc 69.141 (74.050)	lr 0.02098
Train [32][1660/3239]	Time 0.647 (0.907)	Data Time 0.001 (0.017)	Loss 3.1559 (3.0529)	Entropy 0.74409 (0.74704)	Top-1 acc 48.047 (50.795)	Top-5 acc 71.875 (74.052)	lr 0.02098
Train [32][1670/3239]	Time 0.619 (0.906)	Data Time 0.001 (0.017)	Loss 3.1129 (3.0530)	Entropy 0.74398 (0.74702)	Top-1 acc 51.562 (50.791)	Top-5 acc 72.266 (74.053)	lr 0.02098
Train [32][1680/3239]	Time 0.586 (0.906)	Data Time 0.001 (0.016)	Loss 3.0814 (3.0528)	Entropy 0.74426 (0.74700)	Top-1 acc 50.391 (50.796)	Top-5 acc 75.000 (74.053)	lr 0.02098
Train [32][1690/3239]	Time 0.587 (0.906)	Data Time 0.001 (0.016)	Loss 2.9358 (3.0528)	Entropy 0.74394 (0.74699)	Top-1 acc 53.906 (50.793)	Top-5 acc 77.734 (74.049)	lr 0.02098
Train [32][1700/3239]	Time 0.620 (0.906)	Data Time 0.001 (0.016)	Loss 3.0804 (3.0527)	Entropy 0.74429 (0.74697)	Top-1 acc 51.172 (50.799)	Top-5 acc 71.875 (74.052)	lr 0.02098
Train [32][1710/3239]	Time 0.739 (0.921)	Data Time 0.004 (0.016)	Loss 3.0597 (3.0525)	Entropy 0.74402 (0.74695)	Top-1 acc 51.172 (50.799)	Top-5 acc 75.000 (74.058)	lr 0.02098
Train [32][1720/3239]	Time 0.628 (0.921)	Data Time 0.002 (0.016)	Loss 3.0769 (3.0527)	Entropy 0.74422 (0.74694)	Top-1 acc 49.219 (50.794)	Top-5 acc 75.391 (74.057)	lr 0.02098
Train [32][1730/3239]	Time 0.655 (0.920)	Data Time 0.001 (0.016)	Loss 3.0251 (3.0530)	Entropy 0.74430 (0.74692)	Top-1 acc 49.609 (50.791)	Top-5 acc 72.656 (74.049)	lr 0.02098
Train [32][1740/3239]	Time 0.744 (0.920)	Data Time 0.001 (0.016)	Loss 2.8738 (3.0531)	Entropy 0.74415 (0.74691)	Top-1 acc 55.078 (50.788)	Top-5 acc 78.516 (74.049)	lr 0.02098
Train [32][1750/3239]	Time 0.612 (0.920)	Data Time 0.001 (0.016)	Loss 2.9446 (3.0529)	Entropy 0.74403 (0.74689)	Top-1 acc 53.125 (50.796)	Top-5 acc 77.344 (74.051)	lr 0.02098
Train [32][1760/3239]	Time 0.605 (0.919)	Data Time 0.001 (0.016)	Loss 2.9907 (3.0531)	Entropy 0.74419 (0.74687)	Top-1 acc 51.953 (50.790)	Top-5 acc 75.781 (74.050)	lr 0.02097
Train [32][1770/3239]	Time 0.585 (0.919)	Data Time 0.001 (0.016)	Loss 2.9406 (3.0531)	Entropy 0.74431 (0.74686)	Top-1 acc 52.734 (50.795)	Top-5 acc 74.609 (74.051)	lr 0.02097
Train [32][1780/3239]	Time 0.646 (0.919)	Data Time 0.001 (0.016)	Loss 3.0503 (3.0532)	Entropy 0.74435 (0.74684)	Top-1 acc 49.219 (50.793)	Top-5 acc 70.312 (74.046)	lr 0.02097
Train [32][1790/3239]	Time 0.594 (0.919)	Data Time 0.001 (0.016)	Loss 3.1184 (3.0534)	Entropy 0.74459 (0.74683)	Top-1 acc 48.438 (50.789)	Top-5 acc 73.047 (74.043)	lr 0.02097
Train [32][1800/3239]	Time 0.572 (0.918)	Data Time 0.001 (0.016)	Loss 3.1655 (3.0535)	Entropy 0.74460 (0.74682)	Top-1 acc 50.391 (50.790)	Top-5 acc 69.922 (74.039)	lr 0.02097
Train [32][1810/3239]	Time 0.692 (0.918)	Data Time 0.001 (0.015)	Loss 2.8818 (3.0529)	Entropy 0.74457 (0.74681)	Top-1 acc 51.953 (50.800)	Top-5 acc 79.297 (74.049)	lr 0.02097
Train [32][1820/3239]	Time 0.627 (0.918)	Data Time 0.001 (0.015)	Loss 3.1162 (3.0533)	Entropy 0.74451 (0.74679)	Top-1 acc 50.391 (50.788)	Top-5 acc 70.703 (74.038)	lr 0.02097
Train [32][1830/3239]	Time 0.615 (0.917)	Data Time 0.001 (0.015)	Loss 3.0599 (3.0537)	Entropy 0.74509 (0.74678)	Top-1 acc 51.562 (50.787)	Top-5 acc 75.000 (74.031)	lr 0.02097
Train [32][1840/3239]	Time 0.618 (0.917)	Data Time 0.001 (0.015)	Loss 3.0628 (3.0540)	Entropy 0.74522 (0.74677)	Top-1 acc 50.000 (50.778)	Top-5 acc 71.875 (74.025)	lr 0.02097
Train [32][1850/3239]	Time 0.491 (0.917)	Data Time 0.001 (0.015)	Loss 3.1241 (3.0542)	Entropy 0.74526 (0.74677)	Top-1 acc 50.391 (50.772)	Top-5 acc 72.656 (74.022)	lr 0.02097
Train [32][1860/3239]	Time 0.594 (0.916)	Data Time 0.001 (0.015)	Loss 3.1523 (3.0545)	Entropy 0.74514 (0.74676)	Top-1 acc 51.172 (50.769)	Top-5 acc 71.094 (74.012)	lr 0.02097
Train [32][1870/3239]	Time 0.622 (0.916)	Data Time 0.001 (0.015)	Loss 3.3317 (3.0548)	Entropy 0.74540 (0.74675)	Top-1 acc 44.922 (50.764)	Top-5 acc 69.141 (74.008)	lr 0.02097
Train [32][1880/3239]	Time 0.611 (0.916)	Data Time 0.001 (0.015)	Loss 2.8519 (3.0545)	Entropy 0.74563 (0.74674)	Top-1 acc 55.469 (50.770)	Top-5 acc 78.125 (74.014)	lr 0.02097
Train [32][1890/3239]	Time 0.585 (0.915)	Data Time 0.001 (0.015)	Loss 2.9933 (3.0546)	Entropy 0.74520 (0.74674)	Top-1 acc 53.906 (50.769)	Top-5 acc 77.734 (74.016)	lr 0.02096
Train [32][1900/3239]	Time 0.682 (0.915)	Data Time 0.001 (0.015)	Loss 2.9889 (3.0545)	Entropy 0.74539 (0.74673)	Top-1 acc 51.953 (50.781)	Top-5 acc 75.000 (74.017)	lr 0.02096
Train [32][1910/3239]	Time 0.599 (0.915)	Data Time 0.001 (0.015)	Loss 2.8789 (3.0547)	Entropy 0.74539 (0.74672)	Top-1 acc 55.859 (50.783)	Top-5 acc 80.469 (74.016)	lr 0.02096
Train [32][1920/3239]	Time 0.585 (0.914)	Data Time 0.001 (0.015)	Loss 3.0832 (3.0551)	Entropy 0.74533 (0.74671)	Top-1 acc 51.562 (50.777)	Top-5 acc 71.484 (74.010)	lr 0.02096
Train [32][1930/3239]	Time 0.657 (0.914)	Data Time 0.001 (0.015)	Loss 3.0427 (3.0550)	Entropy 0.74561 (0.74671)	Top-1 acc 48.047 (50.776)	Top-5 acc 73.438 (74.009)	lr 0.02096
Train [32][1940/3239]	Time 0.612 (0.914)	Data Time 0.002 (0.015)	Loss 3.1909 (3.0550)	Entropy 0.74558 (0.74670)	Top-1 acc 48.828 (50.776)	Top-5 acc 69.531 (74.008)	lr 0.02096
Train [32][1950/3239]	Time 0.626 (0.914)	Data Time 0.003 (0.014)	Loss 3.0841 (3.0548)	Entropy 0.74550 (0.74669)	Top-1 acc 49.219 (50.785)	Top-5 acc 71.875 (74.010)	lr 0.02096
Train [32][1960/3239]	Time 0.650 (0.913)	Data Time 0.001 (0.014)	Loss 2.9150 (3.0550)	Entropy 0.74546 (0.74669)	Top-1 acc 55.859 (50.782)	Top-5 acc 78.516 (74.010)	lr 0.02096
Train [32][1970/3239]	Time 0.663 (0.913)	Data Time 0.001 (0.014)	Loss 3.0182 (3.0550)	Entropy 0.74569 (0.74668)	Top-1 acc 50.000 (50.783)	Top-5 acc 73.438 (74.008)	lr 0.02096
Train [32][1980/3239]	Time 0.617 (0.913)	Data Time 0.001 (0.014)	Loss 2.9300 (3.0552)	Entropy 0.74598 (0.74668)	Top-1 acc 54.688 (50.784)	Top-5 acc 75.781 (74.003)	lr 0.02096
Train [32][1990/3239]	Time 0.582 (0.913)	Data Time 0.001 (0.014)	Loss 3.2041 (3.0556)	Entropy 0.74624 (0.74667)	Top-1 acc 46.484 (50.770)	Top-5 acc 69.922 (73.999)	lr 0.02096
Train [32][2000/3239]	Time 0.618 (0.912)	Data Time 0.001 (0.014)	Loss 3.1910 (3.0554)	Entropy 0.74644 (0.74667)	Top-1 acc 46.875 (50.770)	Top-5 acc 70.312 (74.006)	lr 0.02096
Train [32][2010/3239]	Time 0.563 (0.912)	Data Time 0.001 (0.014)	Loss 3.0946 (3.0553)	Entropy 0.74601 (0.74667)	Top-1 acc 52.344 (50.778)	Top-5 acc 73.047 (74.003)	lr 0.02096
Train [32][2020/3239]	Time 0.602 (0.912)	Data Time 0.001 (0.014)	Loss 3.2256 (3.0558)	Entropy 0.74560 (0.74667)	Top-1 acc 45.703 (50.766)	Top-5 acc 71.094 (73.995)	lr 0.02096
Train [32][2030/3239]	Time 0.615 (0.911)	Data Time 0.001 (0.014)	Loss 2.9207 (3.0560)	Entropy 0.74551 (0.74666)	Top-1 acc 55.469 (50.763)	Top-5 acc 75.391 (73.990)	lr 0.02095
Train [32][2040/3239]	Time 0.585 (0.911)	Data Time 0.001 (0.014)	Loss 3.0542 (3.0560)	Entropy 0.74546 (0.74665)	Top-1 acc 55.469 (50.765)	Top-5 acc 74.219 (73.989)	lr 0.02095
Train [32][2050/3239]	Time 0.601 (0.911)	Data Time 0.001 (0.014)	Loss 2.9926 (3.0563)	Entropy 0.74543 (0.74665)	Top-1 acc 50.391 (50.758)	Top-5 acc 73.828 (73.982)	lr 0.02095
Train [32][2060/3239]	Time 0.564 (0.911)	Data Time 0.001 (0.014)	Loss 3.0502 (3.0564)	Entropy 0.74515 (0.74664)	Top-1 acc 49.219 (50.752)	Top-5 acc 76.562 (73.982)	lr 0.02095
Train [32][2070/3239]	Time 0.586 (0.911)	Data Time 0.001 (0.014)	Loss 3.2358 (3.0566)	Entropy 0.74496 (0.74663)	Top-1 acc 44.922 (50.749)	Top-5 acc 71.484 (73.978)	lr 0.02095
Train [32][2080/3239]	Time 0.624 (0.910)	Data Time 0.001 (0.014)	Loss 2.8599 (3.0567)	Entropy 0.74506 (0.74663)	Top-1 acc 49.609 (50.741)	Top-5 acc 80.859 (73.980)	lr 0.02095
Train [32][2090/3239]	Time 0.614 (0.910)	Data Time 0.001 (0.014)	Loss 3.1101 (3.0570)	Entropy 0.74507 (0.74662)	Top-1 acc 48.828 (50.734)	Top-5 acc 72.656 (73.971)	lr 0.02095
Train [32][2100/3239]	Time 0.598 (0.910)	Data Time 0.001 (0.014)	Loss 3.0496 (3.0572)	Entropy 0.74543 (0.74661)	Top-1 acc 48.438 (50.730)	Top-5 acc 73.438 (73.966)	lr 0.02095
Train [32][2110/3239]	Time 0.581 (0.910)	Data Time 0.001 (0.014)	Loss 2.8203 (3.0573)	Entropy 0.74527 (0.74661)	Top-1 acc 52.734 (50.729)	Top-5 acc 80.078 (73.964)	lr 0.02095
Train [32][2120/3239]	Time 0.606 (0.910)	Data Time 0.001 (0.013)	Loss 3.1762 (3.0575)	Entropy 0.74518 (0.74660)	Top-1 acc 48.047 (50.722)	Top-5 acc 71.484 (73.965)	lr 0.02095
Train [32][2130/3239]	Time 0.699 (0.909)	Data Time 0.001 (0.013)	Loss 2.8785 (3.0574)	Entropy 0.74529 (0.74659)	Top-1 acc 56.250 (50.718)	Top-5 acc 75.781 (73.965)	lr 0.02095
Train [32][2140/3239]	Time 0.591 (0.909)	Data Time 0.001 (0.013)	Loss 3.3758 (3.0575)	Entropy 0.74570 (0.74659)	Top-1 acc 45.312 (50.716)	Top-5 acc 66.016 (73.958)	lr 0.02095
Train [32][2150/3239]	Time 0.594 (0.909)	Data Time 0.001 (0.013)	Loss 2.9991 (3.0576)	Entropy 0.74588 (0.74658)	Top-1 acc 49.609 (50.717)	Top-5 acc 77.734 (73.960)	lr 0.02095
Train [32][2160/3239]	Time 0.630 (0.909)	Data Time 0.001 (0.013)	Loss 3.0110 (3.0578)	Entropy 0.74602 (0.74658)	Top-1 acc 50.391 (50.711)	Top-5 acc 73.438 (73.956)	lr 0.02094
Train [32][2170/3239]	Time 0.610 (0.909)	Data Time 0.001 (0.013)	Loss 2.8829 (3.0581)	Entropy 0.74590 (0.74658)	Top-1 acc 52.344 (50.701)	Top-5 acc 75.781 (73.947)	lr 0.02094
Train [32][2180/3239]	Time 0.614 (0.908)	Data Time 0.002 (0.013)	Loss 2.7702 (3.0581)	Entropy 0.74605 (0.74657)	Top-1 acc 58.984 (50.701)	Top-5 acc 80.859 (73.946)	lr 0.02094
Train [32][2190/3239]	Time 0.544 (0.908)	Data Time 0.001 (0.013)	Loss 3.1495 (3.0583)	Entropy 0.74540 (0.74657)	Top-1 acc 46.094 (50.698)	Top-5 acc 72.266 (73.941)	lr 0.02094
Train [32][2200/3239]	Time 0.705 (0.908)	Data Time 0.001 (0.013)	Loss 2.9605 (3.0584)	Entropy 0.74543 (0.74657)	Top-1 acc 50.781 (50.693)	Top-5 acc 79.297 (73.939)	lr 0.02094
Train [32][2210/3239]	Time 0.599 (0.907)	Data Time 0.001 (0.013)	Loss 3.0208 (3.0585)	Entropy 0.74543 (0.74656)	Top-1 acc 48.828 (50.687)	Top-5 acc 77.344 (73.941)	lr 0.02094
Train [32][2220/3239]	Time 0.633 (0.907)	Data Time 0.001 (0.013)	Loss 3.1829 (3.0584)	Entropy 0.74527 (0.74656)	Top-1 acc 50.781 (50.691)	Top-5 acc 71.875 (73.943)	lr 0.02094
Train [32][2230/3239]	Time 0.588 (0.907)	Data Time 0.001 (0.013)	Loss 2.9784 (3.0584)	Entropy 0.74515 (0.74655)	Top-1 acc 47.656 (50.691)	Top-5 acc 78.906 (73.941)	lr 0.02094
Train [32][2240/3239]	Time 0.615 (0.907)	Data Time 0.001 (0.013)	Loss 3.0679 (3.0582)	Entropy 0.74554 (0.74654)	Top-1 acc 49.609 (50.693)	Top-5 acc 74.219 (73.946)	lr 0.02094
Train [32][2250/3239]	Time 0.611 (0.907)	Data Time 0.001 (0.013)	Loss 3.0786 (3.0582)	Entropy 0.74498 (0.74654)	Top-1 acc 47.656 (50.692)	Top-5 acc 69.922 (73.942)	lr 0.02094
Train [32][2260/3239]	Time 0.620 (0.906)	Data Time 0.001 (0.013)	Loss 2.7529 (3.0578)	Entropy 0.74498 (0.74653)	Top-1 acc 58.594 (50.698)	Top-5 acc 78.906 (73.949)	lr 0.02094
Train [32][2270/3239]	Time 0.606 (0.906)	Data Time 0.001 (0.013)	Loss 3.1106 (3.0579)	Entropy 0.74457 (0.74652)	Top-1 acc 51.562 (50.697)	Top-5 acc 72.266 (73.948)	lr 0.02094
Train [32][2280/3239]	Time 0.594 (0.906)	Data Time 0.001 (0.013)	Loss 3.3973 (3.0582)	Entropy 0.74438 (0.74651)	Top-1 acc 46.094 (50.688)	Top-5 acc 67.969 (73.942)	lr 0.02094
Train [32][2290/3239]	Time 0.676 (0.906)	Data Time 0.001 (0.013)	Loss 3.0444 (3.0581)	Entropy 0.74458 (0.74651)	Top-1 acc 47.266 (50.685)	Top-5 acc 73.047 (73.943)	lr 0.02094
Train [32][2300/3239]	Time 0.627 (0.906)	Data Time 0.001 (0.013)	Loss 2.9080 (3.0580)	Entropy 0.74425 (0.74650)	Top-1 acc 52.344 (50.686)	Top-5 acc 75.781 (73.945)	lr 0.02093
Train [32][2310/3239]	Time 0.612 (0.905)	Data Time 0.001 (0.013)	Loss 2.9988 (3.0584)	Entropy 0.74432 (0.74649)	Top-1 acc 50.000 (50.679)	Top-5 acc 75.391 (73.936)	lr 0.02093
Train [32][2320/3239]	Time 0.604 (0.905)	Data Time 0.001 (0.012)	Loss 2.9889 (3.0583)	Entropy 0.74504 (0.74648)	Top-1 acc 51.953 (50.683)	Top-5 acc 76.562 (73.940)	lr 0.02093
Train [32][2330/3239]	Time 0.491 (0.905)	Data Time 0.001 (0.012)	Loss 3.0536 (3.0581)	Entropy 0.74520 (0.74647)	Top-1 acc 51.562 (50.687)	Top-5 acc 77.734 (73.945)	lr 0.02093
Train [32][2340/3239]	Time 0.617 (0.905)	Data Time 0.001 (0.012)	Loss 3.0889 (3.0580)	Entropy 0.74551 (0.74647)	Top-1 acc 48.047 (50.688)	Top-5 acc 73.047 (73.950)	lr 0.02093
Train [32][2350/3239]	Time 0.581 (0.905)	Data Time 0.001 (0.012)	Loss 3.0103 (3.0581)	Entropy 0.74555 (0.74646)	Top-1 acc 52.344 (50.682)	Top-5 acc 74.219 (73.946)	lr 0.02093
Train [32][2360/3239]	Time 0.692 (0.904)	Data Time 0.001 (0.012)	Loss 2.9958 (3.0581)	Entropy 0.74511 (0.74646)	Top-1 acc 53.125 (50.682)	Top-5 acc 75.391 (73.944)	lr 0.02093
Train [32][2370/3239]	Time 0.606 (0.915)	Data Time 0.002 (0.012)	Loss 2.9125 (3.0578)	Entropy 0.74497 (0.74645)	Top-1 acc 54.297 (50.689)	Top-5 acc 78.125 (73.952)	lr 0.02093
Train [32][2380/3239]	Time 0.595 (0.914)	Data Time 0.002 (0.012)	Loss 3.3145 (3.0580)	Entropy 0.74472 (0.74644)	Top-1 acc 46.484 (50.686)	Top-5 acc 67.188 (73.948)	lr 0.02093
Train [32][2390/3239]	Time 0.594 (0.914)	Data Time 0.001 (0.012)	Loss 3.0784 (3.0578)	Entropy 0.74438 (0.74644)	Top-1 acc 50.781 (50.688)	Top-5 acc 72.656 (73.951)	lr 0.02093
Train [32][2400/3239]	Time 0.597 (0.914)	Data Time 0.001 (0.012)	Loss 2.9949 (3.0580)	Entropy 0.74430 (0.74643)	Top-1 acc 54.688 (50.685)	Top-5 acc 75.781 (73.947)	lr 0.02093
Train [32][2410/3239]	Time 0.624 (0.914)	Data Time 0.001 (0.012)	Loss 2.9835 (3.0579)	Entropy 0.74403 (0.74642)	Top-1 acc 53.516 (50.689)	Top-5 acc 75.000 (73.947)	lr 0.02093
Train [32][2420/3239]	Time 0.590 (0.914)	Data Time 0.001 (0.012)	Loss 3.2834 (3.0579)	Entropy 0.74405 (0.74641)	Top-1 acc 42.969 (50.689)	Top-5 acc 67.969 (73.945)	lr 0.02093
Train [32][2430/3239]	Time 0.644 (0.914)	Data Time 0.001 (0.012)	Loss 2.9908 (3.0577)	Entropy 0.74381 (0.74640)	Top-1 acc 51.562 (50.692)	Top-5 acc 75.391 (73.949)	lr 0.02092
Train [32][2440/3239]	Time 0.549 (0.913)	Data Time 0.001 (0.012)	Loss 3.2639 (3.0578)	Entropy 0.74405 (0.74639)	Top-1 acc 48.438 (50.690)	Top-5 acc 67.969 (73.947)	lr 0.02092
Train [32][2450/3239]	Time 0.721 (0.913)	Data Time 0.001 (0.012)	Loss 3.0430 (3.0579)	Entropy 0.74403 (0.74638)	Top-1 acc 54.297 (50.690)	Top-5 acc 72.656 (73.943)	lr 0.02092
Train [32][2460/3239]	Time 0.612 (0.913)	Data Time 0.001 (0.012)	Loss 3.1524 (3.0579)	Entropy 0.74431 (0.74637)	Top-1 acc 45.312 (50.688)	Top-5 acc 70.703 (73.943)	lr 0.02092
Train [32][2470/3239]	Time 0.446 (0.912)	Data Time 0.001 (0.012)	Loss 3.1469 (3.0579)	Entropy 0.74437 (0.74636)	Top-1 acc 47.266 (50.685)	Top-5 acc 73.828 (73.945)	lr 0.02092
Train [32][2480/3239]	Time 0.592 (0.912)	Data Time 0.001 (0.012)	Loss 3.1746 (3.0579)	Entropy 0.74484 (0.74635)	Top-1 acc 52.344 (50.689)	Top-5 acc 70.312 (73.943)	lr 0.02092
Train [32][2490/3239]	Time 0.612 (0.912)	Data Time 0.001 (0.012)	Loss 3.1010 (3.0579)	Entropy 0.74456 (0.74635)	Top-1 acc 52.734 (50.690)	Top-5 acc 75.000 (73.943)	lr 0.02092
Train [32][2500/3239]	Time 0.590 (0.912)	Data Time 0.001 (0.012)	Loss 3.2720 (3.0581)	Entropy 0.74439 (0.74634)	Top-1 acc 49.219 (50.685)	Top-5 acc 70.312 (73.941)	lr 0.02092
Train [32][2510/3239]	Time 0.627 (0.912)	Data Time 0.001 (0.012)	Loss 3.0503 (3.0579)	Entropy 0.74459 (0.74633)	Top-1 acc 50.781 (50.687)	Top-5 acc 75.781 (73.946)	lr 0.02092
Train [32][2520/3239]	Time 0.665 (0.912)	Data Time 0.001 (0.012)	Loss 3.2889 (3.0579)	Entropy 0.74505 (0.74633)	Top-1 acc 47.266 (50.690)	Top-5 acc 68.359 (73.944)	lr 0.02092
Train [32][2530/3239]	Time 0.608 (0.911)	Data Time 0.001 (0.012)	Loss 2.9018 (3.0577)	Entropy 0.74497 (0.74632)	Top-1 acc 51.562 (50.694)	Top-5 acc 77.344 (73.950)	lr 0.02092
Train [32][2540/3239]	Time 0.609 (0.911)	Data Time 0.001 (0.012)	Loss 3.0463 (3.0576)	Entropy 0.74519 (0.74632)	Top-1 acc 51.953 (50.695)	Top-5 acc 75.391 (73.950)	lr 0.02092
Train [32][2550/3239]	Time 0.674 (0.911)	Data Time 0.001 (0.012)	Loss 3.0034 (3.0575)	Entropy 0.74486 (0.74631)	Top-1 acc 50.391 (50.694)	Top-5 acc 74.219 (73.950)	lr 0.02092
Train [32][2560/3239]	Time 0.550 (0.911)	Data Time 0.001 (0.012)	Loss 3.1120 (3.0574)	Entropy 0.74448 (0.74631)	Top-1 acc 48.828 (50.696)	Top-5 acc 71.484 (73.950)	lr 0.02092
Train [32][2570/3239]	Time 0.597 (0.911)	Data Time 0.001 (0.011)	Loss 3.1928 (3.0574)	Entropy 0.74436 (0.74630)	Top-1 acc 47.266 (50.698)	Top-5 acc 72.266 (73.952)	lr 0.02091
Train [32][2580/3239]	Time 0.631 (0.911)	Data Time 0.001 (0.011)	Loss 3.0131 (3.0574)	Entropy 0.74415 (0.74629)	Top-1 acc 51.562 (50.701)	Top-5 acc 77.344 (73.953)	lr 0.02091
Train [32][2590/3239]	Time 0.620 (0.910)	Data Time 0.001 (0.011)	Loss 3.0532 (3.0575)	Entropy 0.74382 (0.74628)	Top-1 acc 50.391 (50.696)	Top-5 acc 75.000 (73.953)	lr 0.02091
Train [32][2600/3239]	Time 0.582 (0.910)	Data Time 0.001 (0.011)	Loss 2.9996 (3.0574)	Entropy 0.74398 (0.74627)	Top-1 acc 53.125 (50.697)	Top-5 acc 75.000 (73.955)	lr 0.02091
Train [32][2610/3239]	Time 0.674 (0.910)	Data Time 0.001 (0.011)	Loss 3.2784 (3.0571)	Entropy 0.74392 (0.74626)	Top-1 acc 46.094 (50.702)	Top-5 acc 66.406 (73.961)	lr 0.02091
Train [32][2620/3239]	Time 0.631 (0.910)	Data Time 0.002 (0.011)	Loss 3.0745 (3.0575)	Entropy 0.74418 (0.74625)	Top-1 acc 50.000 (50.695)	Top-5 acc 73.047 (73.952)	lr 0.02091
Train [32][2630/3239]	Time 0.559 (0.910)	Data Time 0.001 (0.011)	Loss 3.1882 (3.0573)	Entropy 0.74422 (0.74625)	Top-1 acc 48.438 (50.695)	Top-5 acc 74.219 (73.955)	lr 0.02091
Train [32][2640/3239]	Time 0.590 (0.909)	Data Time 0.001 (0.011)	Loss 3.3410 (3.0574)	Entropy 0.74410 (0.74624)	Top-1 acc 45.703 (50.692)	Top-5 acc 68.359 (73.952)	lr 0.02091
Train [32][2650/3239]	Time 0.629 (0.909)	Data Time 0.001 (0.011)	Loss 3.0340 (3.0574)	Entropy 0.74429 (0.74623)	Top-1 acc 51.953 (50.694)	Top-5 acc 74.219 (73.954)	lr 0.02091
Train [32][2660/3239]	Time 0.653 (0.909)	Data Time 0.001 (0.011)	Loss 2.9450 (3.0571)	Entropy 0.74396 (0.74622)	Top-1 acc 54.297 (50.698)	Top-5 acc 72.266 (73.959)	lr 0.02091
Train [32][2670/3239]	Time 0.572 (0.909)	Data Time 0.001 (0.011)	Loss 3.2029 (3.0571)	Entropy 0.74408 (0.74621)	Top-1 acc 49.219 (50.696)	Top-5 acc 69.141 (73.958)	lr 0.02091
Train [32][2680/3239]	Time 0.733 (0.908)	Data Time 0.001 (0.011)	Loss 3.1493 (3.0573)	Entropy 0.74412 (0.74621)	Top-1 acc 48.828 (50.691)	Top-5 acc 71.484 (73.951)	lr 0.02091
Train [32][2690/3239]	Time 0.634 (0.908)	Data Time 0.001 (0.011)	Loss 2.9268 (3.0570)	Entropy 0.74379 (0.74620)	Top-1 acc 56.250 (50.701)	Top-5 acc 78.906 (73.962)	lr 0.02091
Train [32][2700/3239]	Time 0.616 (0.908)	Data Time 0.001 (0.011)	Loss 3.2575 (3.0570)	Entropy 0.74386 (0.74619)	Top-1 acc 46.484 (50.697)	Top-5 acc 66.016 (73.957)	lr 0.02090
Train [32][2710/3239]	Time 0.595 (0.908)	Data Time 0.001 (0.011)	Loss 2.9778 (3.0568)	Entropy 0.74349 (0.74618)	Top-1 acc 53.906 (50.705)	Top-5 acc 75.000 (73.962)	lr 0.02090
Train [32][2720/3239]	Time 0.612 (0.908)	Data Time 0.001 (0.011)	Loss 2.9015 (3.0567)	Entropy 0.74322 (0.74617)	Top-1 acc 49.609 (50.704)	Top-5 acc 76.172 (73.965)	lr 0.02090
Train [32][2730/3239]	Time 0.637 (0.908)	Data Time 0.001 (0.011)	Loss 2.8265 (3.0565)	Entropy 0.74297 (0.74616)	Top-1 acc 55.859 (50.709)	Top-5 acc 78.906 (73.972)	lr 0.02090
Train [32][2740/3239]	Time 0.614 (0.908)	Data Time 0.001 (0.011)	Loss 3.0888 (3.0567)	Entropy 0.74313 (0.74615)	Top-1 acc 48.438 (50.701)	Top-5 acc 71.094 (73.966)	lr 0.02090
Train [32][2750/3239]	Time 0.704 (0.907)	Data Time 0.001 (0.011)	Loss 3.3328 (3.0567)	Entropy 0.74346 (0.74614)	Top-1 acc 41.797 (50.700)	Top-5 acc 69.531 (73.966)	lr 0.02090
Train [32][2760/3239]	Time 0.600 (0.907)	Data Time 0.001 (0.011)	Loss 3.1016 (3.0566)	Entropy 0.74334 (0.74613)	Top-1 acc 48.047 (50.703)	Top-5 acc 73.828 (73.965)	lr 0.02090
Train [32][2770/3239]	Time 0.610 (0.907)	Data Time 0.001 (0.011)	Loss 2.7635 (3.0565)	Entropy 0.74303 (0.74612)	Top-1 acc 59.375 (50.705)	Top-5 acc 82.812 (73.968)	lr 0.02090
Train [32][2780/3239]	Time 0.613 (0.907)	Data Time 0.001 (0.011)	Loss 2.8530 (3.0565)	Entropy 0.74306 (0.74611)	Top-1 acc 52.344 (50.705)	Top-5 acc 77.344 (73.968)	lr 0.02090
Train [32][2790/3239]	Time 0.577 (0.907)	Data Time 0.001 (0.011)	Loss 3.2116 (3.0564)	Entropy 0.74308 (0.74609)	Top-1 acc 50.000 (50.707)	Top-5 acc 72.266 (73.970)	lr 0.02090
Train [32][2800/3239]	Time 0.635 (0.906)	Data Time 0.001 (0.011)	Loss 3.0690 (3.0566)	Entropy 0.74282 (0.74608)	Top-1 acc 47.656 (50.701)	Top-5 acc 74.609 (73.965)	lr 0.02090
Train [32][2810/3239]	Time 0.651 (0.906)	Data Time 0.001 (0.011)	Loss 3.0443 (3.0567)	Entropy 0.74301 (0.74607)	Top-1 acc 51.172 (50.699)	Top-5 acc 73.828 (73.967)	lr 0.02090
Train [32][2820/3239]	Time 0.571 (0.906)	Data Time 0.001 (0.011)	Loss 3.1669 (3.0570)	Entropy 0.74332 (0.74606)	Top-1 acc 49.219 (50.691)	Top-5 acc 72.266 (73.959)	lr 0.02090
Train [32][2830/3239]	Time 0.612 (0.906)	Data Time 0.001 (0.011)	Loss 3.0113 (3.0569)	Entropy 0.74355 (0.74605)	Top-1 acc 54.297 (50.699)	Top-5 acc 74.609 (73.963)	lr 0.02089
Train [32][2840/3239]	Time 0.712 (0.906)	Data Time 0.001 (0.011)	Loss 3.1348 (3.0568)	Entropy 0.74342 (0.74604)	Top-1 acc 46.484 (50.703)	Top-5 acc 70.703 (73.963)	lr 0.02089
Train [32][2850/3239]	Time 0.628 (0.906)	Data Time 0.001 (0.011)	Loss 3.0484 (3.0569)	Entropy 0.74325 (0.74603)	Top-1 acc 52.344 (50.701)	Top-5 acc 75.000 (73.961)	lr 0.02089
Train [32][2860/3239]	Time 0.603 (0.906)	Data Time 0.001 (0.011)	Loss 3.0873 (3.0568)	Entropy 0.74327 (0.74602)	Top-1 acc 50.000 (50.705)	Top-5 acc 70.312 (73.964)	lr 0.02089
Train [32][2870/3239]	Time 0.626 (0.905)	Data Time 0.001 (0.010)	Loss 3.1635 (3.0568)	Entropy 0.74329 (0.74601)	Top-1 acc 46.094 (50.707)	Top-5 acc 71.484 (73.966)	lr 0.02089
Train [32][2880/3239]	Time 0.604 (0.905)	Data Time 0.001 (0.010)	Loss 3.2351 (3.0569)	Entropy 0.74313 (0.74600)	Top-1 acc 50.000 (50.705)	Top-5 acc 71.484 (73.964)	lr 0.02089
Train [32][2890/3239]	Time 0.601 (0.905)	Data Time 0.001 (0.010)	Loss 3.1230 (3.0568)	Entropy 0.74263 (0.74599)	Top-1 acc 47.656 (50.702)	Top-5 acc 73.438 (73.965)	lr 0.02089
Train [32][2900/3239]	Time 0.615 (0.905)	Data Time 0.001 (0.010)	Loss 3.2517 (3.0569)	Entropy 0.74290 (0.74598)	Top-1 acc 47.266 (50.698)	Top-5 acc 71.875 (73.966)	lr 0.02089
Train [32][2910/3239]	Time 0.742 (0.905)	Data Time 0.002 (0.010)	Loss 2.9527 (3.0570)	Entropy 0.74307 (0.74597)	Top-1 acc 52.344 (50.694)	Top-5 acc 72.656 (73.960)	lr 0.02089
Train [32][2920/3239]	Time 0.585 (0.905)	Data Time 0.001 (0.010)	Loss 2.8274 (3.0567)	Entropy 0.74266 (0.74596)	Top-1 acc 54.688 (50.698)	Top-5 acc 80.469 (73.967)	lr 0.02089
Train [32][2930/3239]	Time 0.616 (0.905)	Data Time 0.001 (0.010)	Loss 2.9067 (3.0565)	Entropy 0.74282 (0.74595)	Top-1 acc 55.078 (50.705)	Top-5 acc 75.391 (73.972)	lr 0.02089
Train [32][2940/3239]	Time 0.621 (0.904)	Data Time 0.001 (0.010)	Loss 2.9900 (3.0564)	Entropy 0.74229 (0.74594)	Top-1 acc 51.953 (50.701)	Top-5 acc 76.172 (73.973)	lr 0.02089
Train [32][2950/3239]	Time 0.577 (0.904)	Data Time 0.002 (0.010)	Loss 3.0633 (3.0561)	Entropy 0.74216 (0.74593)	Top-1 acc 46.875 (50.707)	Top-5 acc 75.781 (73.978)	lr 0.02089
Train [32][2960/3239]	Time 0.603 (0.904)	Data Time 0.001 (0.010)	Loss 3.0846 (3.0562)	Entropy 0.74193 (0.74591)	Top-1 acc 50.000 (50.706)	Top-5 acc 71.094 (73.976)	lr 0.02089
Train [32][2970/3239]	Time 0.617 (0.904)	Data Time 0.001 (0.010)	Loss 2.9817 (3.0564)	Entropy 0.74204 (0.74590)	Top-1 acc 50.391 (50.703)	Top-5 acc 78.125 (73.972)	lr 0.02088
Train [32][2980/3239]	Time 0.584 (0.904)	Data Time 0.001 (0.010)	Loss 2.9742 (3.0563)	Entropy 0.74165 (0.74589)	Top-1 acc 54.297 (50.704)	Top-5 acc 75.000 (73.972)	lr 0.02088
Train [32][2990/3239]	Time 0.600 (0.904)	Data Time 0.001 (0.010)	Loss 3.0413 (3.0562)	Entropy 0.74154 (0.74587)	Top-1 acc 50.391 (50.708)	Top-5 acc 73.438 (73.974)	lr 0.02088
Train [32][3000/3239]	Time 0.727 (0.903)	Data Time 0.001 (0.010)	Loss 3.0503 (3.0562)	Entropy 0.74160 (0.74586)	Top-1 acc 48.047 (50.707)	Top-5 acc 75.391 (73.975)	lr 0.02088
Train [32][3010/3239]	Time 0.612 (0.903)	Data Time 0.001 (0.010)	Loss 2.9700 (3.0562)	Entropy 0.74165 (0.74584)	Top-1 acc 51.562 (50.705)	Top-5 acc 76.172 (73.974)	lr 0.02088
Train [32][3020/3239]	Time 0.822 (0.911)	Data Time 0.050 (0.010)	Loss 3.0498 (3.0560)	Entropy 0.74124 (0.74583)	Top-1 acc 49.609 (50.705)	Top-5 acc 74.609 (73.979)	lr 0.02088
Train [32][3030/3239]	Time 0.612 (0.911)	Data Time 0.002 (0.010)	Loss 3.2189 (3.0562)	Entropy 0.74153 (0.74581)	Top-1 acc 46.875 (50.700)	Top-5 acc 73.438 (73.977)	lr 0.02088
Train [32][3040/3239]	Time 0.586 (0.911)	Data Time 0.001 (0.010)	Loss 3.0680 (3.0563)	Entropy 0.74154 (0.74580)	Top-1 acc 46.875 (50.698)	Top-5 acc 75.391 (73.973)	lr 0.02088
Train [32][3050/3239]	Time 0.499 (0.911)	Data Time 0.001 (0.010)	Loss 3.1055 (3.0563)	Entropy 0.74150 (0.74579)	Top-1 acc 46.094 (50.695)	Top-5 acc 74.219 (73.973)	lr 0.02088
Train [32][3060/3239]	Time 0.258 (0.910)	Data Time 0.002 (0.010)	Loss 3.1920 (3.0564)	Entropy 0.74100 (0.74577)	Top-1 acc 50.000 (50.696)	Top-5 acc 70.312 (73.969)	lr 0.02088
Train [32][3070/3239]	Time 0.350 (0.909)	Data Time 0.001 (0.010)	Loss 3.1143 (3.0566)	Entropy 0.74063 (0.74575)	Top-1 acc 50.000 (50.692)	Top-5 acc 69.922 (73.964)	lr 0.02088
Train [32][3080/3239]	Time 0.266 (0.908)	Data Time 0.001 (0.010)	Loss 3.0552 (3.0566)	Entropy 0.74058 (0.74574)	Top-1 acc 50.000 (50.689)	Top-5 acc 73.438 (73.963)	lr 0.02088
Train [32][3090/3239]	Time 0.253 (0.906)	Data Time 0.001 (0.010)	Loss 3.0071 (3.0566)	Entropy 0.74055 (0.74572)	Top-1 acc 49.609 (50.690)	Top-5 acc 69.922 (73.962)	lr 0.02088
Train [32][3100/3239]	Time 0.311 (0.905)	Data Time 0.004 (0.010)	Loss 2.7446 (3.0566)	Entropy 0.74033 (0.74570)	Top-1 acc 57.422 (50.691)	Top-5 acc 80.859 (73.963)	lr 0.02087
Train [32][3110/3239]	Time 0.501 (0.904)	Data Time 0.001 (0.010)	Loss 3.0405 (3.0566)	Entropy 0.74041 (0.74569)	Top-1 acc 51.953 (50.694)	Top-5 acc 73.438 (73.966)	lr 0.02087
Train [32][3120/3239]	Time 0.312 (0.902)	Data Time 0.001 (0.010)	Loss 3.0481 (3.0564)	Entropy 0.74037 (0.74567)	Top-1 acc 54.688 (50.698)	Top-5 acc 73.047 (73.970)	lr 0.02087
Train [32][3130/3239]	Time 0.254 (0.901)	Data Time 0.001 (0.010)	Loss 3.1245 (3.0563)	Entropy 0.74046 (0.74565)	Top-1 acc 50.000 (50.701)	Top-5 acc 70.703 (73.972)	lr 0.02087
Train [32][3140/3239]	Time 0.236 (0.900)	Data Time 0.001 (0.010)	Loss 3.1436 (3.0563)	Entropy 0.74020 (0.74564)	Top-1 acc 49.219 (50.702)	Top-5 acc 71.094 (73.970)	lr 0.02087
Train [32][3150/3239]	Time 0.297 (0.898)	Data Time 0.001 (0.010)	Loss 2.9754 (3.0563)	Entropy 0.73980 (0.74562)	Top-1 acc 51.172 (50.700)	Top-5 acc 74.219 (73.970)	lr 0.02087
Train [32][3160/3239]	Time 0.349 (0.897)	Data Time 0.001 (0.010)	Loss 3.2110 (3.0563)	Entropy 0.74009 (0.74560)	Top-1 acc 45.312 (50.694)	Top-5 acc 66.406 (73.969)	lr 0.02087
Train [32][3170/3239]	Time 0.235 (0.895)	Data Time 0.001 (0.010)	Loss 2.9738 (3.0562)	Entropy 0.73969 (0.74558)	Top-1 acc 52.344 (50.698)	Top-5 acc 76.953 (73.972)	lr 0.02087
Train [32][3180/3239]	Time 0.239 (0.894)	Data Time 0.000 (0.010)	Loss 3.2120 (3.0561)	Entropy 0.73925 (0.74556)	Top-1 acc 44.531 (50.699)	Top-5 acc 74.609 (73.972)	lr 0.02087
Train [32][3190/3239]	Time 0.231 (0.892)	Data Time 0.000 (0.010)	Loss 3.2377 (3.0561)	Entropy 0.73925 (0.74554)	Top-1 acc 41.406 (50.694)	Top-5 acc 70.703 (73.974)	lr 0.02087
Train [32][3200/3239]	Time 0.233 (0.891)	Data Time 0.000 (0.010)	Loss 3.1605 (3.0563)	Entropy 0.73915 (0.74552)	Top-1 acc 49.219 (50.690)	Top-5 acc 75.000 (73.972)	lr 0.02087
Train [32][3210/3239]	Time 0.224 (0.889)	Data Time 0.000 (0.010)	Loss 3.0313 (3.0563)	Entropy 0.73950 (0.74550)	Top-1 acc 48.828 (50.691)	Top-5 acc 74.219 (73.975)	lr 0.02087
Train [32][3220/3239]	Time 0.223 (0.888)	Data Time 0.000 (0.010)	Loss 2.9749 (3.0561)	Entropy 0.73952 (0.74549)	Top-1 acc 50.391 (50.695)	Top-5 acc 80.078 (73.979)	lr 0.02087
Train [32][3230/3239]	Time 0.346 (0.886)	Data Time 0.000 (0.010)	Loss 2.8521 (3.0560)	Entropy 0.74011 (0.74547)	Top-1 acc 53.125 (50.700)	Top-5 acc 77.734 (73.979)	lr 0.02086
Train [32][3239/3239]	Time 0.951 (0.885)	Data Time 0.000 (0.009)	Loss 3.3338 (3.0558)	Entropy 0.74002 (0.74545)	Top-1 acc 43.210 (50.703)	Top-5 acc 66.667 (73.982)	lr 0.02086
==========Valid [32/120]	loss 1.772	top-1 acc 59.985 (59.985)	top-5 acc 82.074	Train top-1 50.703	top-5 73.982	Entropy 0.74002	Latency-None: 0.000ms	Flops: 539.76M
Train [33][0/3239]	Time 23.576 (23.576)	Data Time 22.103 (22.103)	Loss 3.1487 (3.1487)	Entropy 0.74003 (0.74003)	Top-1 acc 48.438 (48.438)	Top-5 acc 70.312 (70.312)	lr 0.02086
Train [33][10/3239]	Time 0.280 (2.743)	Data Time 0.003 (2.156)	Loss 2.8849 (3.0292)	Entropy 0.73970 (0.73993)	Top-1 acc 53.125 (51.740)	Top-5 acc 78.516 (73.438)	lr 0.02086
Train [33][20/3239]	Time 0.224 (1.638)	Data Time 0.001 (1.130)	Loss 2.8763 (3.0159)	Entropy 0.73962 (0.73983)	Top-1 acc 53.125 (51.786)	Top-5 acc 76.172 (73.772)	lr 0.02086
Train [33][30/3239]	Time 0.237 (1.238)	Data Time 0.001 (0.766)	Loss 3.1352 (3.0053)	Entropy 0.73954 (0.73975)	Top-1 acc 50.000 (51.764)	Top-5 acc 70.703 (74.546)	lr 0.02086
Train [33][40/3239]	Time 0.245 (1.042)	Data Time 0.001 (0.580)	Loss 2.8275 (2.9971)	Entropy 0.73970 (0.73969)	Top-1 acc 59.766 (52.248)	Top-5 acc 77.344 (74.752)	lr 0.02086
Train [33][50/3239]	Time 0.247 (0.919)	Data Time 0.001 (0.466)	Loss 2.7486 (3.0084)	Entropy 0.73956 (0.73968)	Top-1 acc 58.594 (52.206)	Top-5 acc 80.078 (74.686)	lr 0.02086
Train [33][60/3239]	Time 0.381 (0.843)	Data Time 0.001 (0.390)	Loss 3.1812 (3.0092)	Entropy 0.73955 (0.73966)	Top-1 acc 48.828 (52.094)	Top-5 acc 72.266 (74.680)	lr 0.02086
Train [33][70/3239]	Time 0.265 (0.784)	Data Time 0.001 (0.335)	Loss 3.1200 (3.0122)	Entropy 0.73959 (0.73963)	Top-1 acc 53.516 (52.014)	Top-5 acc 71.875 (74.719)	lr 0.02086
Train [33][80/3239]	Time 0.230 (0.738)	Data Time 0.001 (0.294)	Loss 3.0523 (3.0205)	Entropy 0.73937 (0.73961)	Top-1 acc 50.781 (51.915)	Top-5 acc 75.781 (74.547)	lr 0.02086
Train [33][90/3239]	Time 0.223 (0.703)	Data Time 0.001 (0.262)	Loss 3.1135 (3.0271)	Entropy 0.73931 (0.73958)	Top-1 acc 50.000 (51.747)	Top-5 acc 75.781 (74.438)	lr 0.02086
Train [33][100/3239]	Time 0.225 (0.684)	Data Time 0.002 (0.236)	Loss 3.0879 (3.0270)	Entropy 0.73921 (0.73955)	Top-1 acc 51.172 (51.717)	Top-5 acc 75.000 (74.478)	lr 0.02086
Train [33][110/3239]	Time 0.245 (0.660)	Data Time 0.002 (0.215)	Loss 3.0736 (3.0297)	Entropy 0.73938 (0.73952)	Top-1 acc 51.562 (51.643)	Top-5 acc 73.438 (74.391)	lr 0.02086
Train [33][120/3239]	Time 0.235 (0.639)	Data Time 0.001 (0.198)	Loss 2.8697 (3.0275)	Entropy 0.73969 (0.73953)	Top-1 acc 53.125 (51.601)	Top-5 acc 77.344 (74.432)	lr 0.02086
Train [33][130/3239]	Time 0.330 (0.622)	Data Time 0.001 (0.183)	Loss 3.0376 (3.0291)	Entropy 0.74013 (0.73955)	Top-1 acc 50.391 (51.518)	Top-5 acc 72.656 (74.407)	lr 0.02085
Train [33][140/3239]	Time 0.229 (0.606)	Data Time 0.001 (0.170)	Loss 3.2103 (3.0357)	Entropy 0.74004 (0.73959)	Top-1 acc 43.750 (51.297)	Top-5 acc 69.531 (74.307)	lr 0.02085
Train [33][150/3239]	Time 0.230 (0.592)	Data Time 0.001 (0.159)	Loss 2.8181 (3.0325)	Entropy 0.73990 (0.73961)	Top-1 acc 53.125 (51.337)	Top-5 acc 80.859 (74.405)	lr 0.02085
Train [33][160/3239]	Time 0.234 (0.580)	Data Time 0.001 (0.149)	Loss 2.9180 (3.0357)	Entropy 0.74023 (0.73963)	Top-1 acc 53.516 (51.228)	Top-5 acc 76.172 (74.415)	lr 0.02085
Train [33][170/3239]	Time 0.253 (0.570)	Data Time 0.001 (0.141)	Loss 2.9590 (3.0367)	Entropy 0.74029 (0.73967)	Top-1 acc 51.953 (51.227)	Top-5 acc 73.828 (74.386)	lr 0.02085
Train [33][180/3239]	Time 0.246 (0.561)	Data Time 0.001 (0.133)	Loss 2.8973 (3.0370)	Entropy 0.74017 (0.73970)	Top-1 acc 52.734 (51.226)	Top-5 acc 76.562 (74.400)	lr 0.02085
Train [33][190/3239]	Time 0.220 (0.553)	Data Time 0.001 (0.126)	Loss 2.9237 (3.0359)	Entropy 0.74039 (0.73972)	Top-1 acc 56.641 (51.284)	Top-5 acc 73.438 (74.403)	lr 0.02085
Train [33][200/3239]	Time 0.233 (0.546)	Data Time 0.001 (0.120)	Loss 3.1182 (3.0385)	Entropy 0.74082 (0.73976)	Top-1 acc 51.172 (51.222)	Top-5 acc 70.312 (74.361)	lr 0.02085
Train [33][210/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.114)	Loss 2.9856 (3.0372)	Entropy 0.74073 (0.73981)	Top-1 acc 53.906 (51.279)	Top-5 acc 76.562 (74.361)	lr 0.02085
Train [33][220/3239]	Time 0.300 (0.533)	Data Time 0.001 (0.109)	Loss 3.1635 (3.0361)	Entropy 0.74047 (0.73984)	Top-1 acc 48.438 (51.292)	Top-5 acc 72.656 (74.337)	lr 0.02085
Train [33][230/3239]	Time 0.235 (0.527)	Data Time 0.001 (0.104)	Loss 3.2591 (3.0352)	Entropy 0.74057 (0.73987)	Top-1 acc 45.703 (51.297)	Top-5 acc 67.969 (74.347)	lr 0.02085
Train [33][240/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.100)	Loss 3.0394 (3.0353)	Entropy 0.74063 (0.73990)	Top-1 acc 50.781 (51.264)	Top-5 acc 73.438 (74.352)	lr 0.02085
Train [33][250/3239]	Time 0.251 (0.518)	Data Time 0.001 (0.096)	Loss 3.0069 (3.0370)	Entropy 0.74047 (0.73993)	Top-1 acc 50.391 (51.208)	Top-5 acc 76.172 (74.363)	lr 0.02085
Train [33][260/3239]	Time 0.236 (0.513)	Data Time 0.001 (0.093)	Loss 3.0052 (3.0373)	Entropy 0.74063 (0.73996)	Top-1 acc 50.391 (51.187)	Top-5 acc 76.953 (74.368)	lr 0.02084
Train [33][270/3239]	Time 0.239 (0.509)	Data Time 0.001 (0.089)	Loss 2.9679 (3.0357)	Entropy 0.74049 (0.73998)	Top-1 acc 55.469 (51.251)	Top-5 acc 73.047 (74.390)	lr 0.02084
Train [33][280/3239]	Time 0.240 (0.506)	Data Time 0.001 (0.086)	Loss 2.7628 (3.0363)	Entropy 0.74015 (0.74000)	Top-1 acc 53.516 (51.236)	Top-5 acc 79.688 (74.395)	lr 0.02084
Train [33][290/3239]	Time 0.321 (0.502)	Data Time 0.001 (0.083)	Loss 3.0313 (3.0365)	Entropy 0.74005 (0.74000)	Top-1 acc 52.344 (51.204)	Top-5 acc 73.828 (74.395)	lr 0.02084
Train [33][300/3239]	Time 0.218 (0.499)	Data Time 0.001 (0.081)	Loss 2.9699 (3.0375)	Entropy 0.73974 (0.74000)	Top-1 acc 50.000 (51.182)	Top-5 acc 73.438 (74.352)	lr 0.02084
Train [33][310/3239]	Time 0.236 (0.495)	Data Time 0.001 (0.078)	Loss 2.9093 (3.0375)	Entropy 0.74017 (0.73999)	Top-1 acc 52.344 (51.158)	Top-5 acc 77.734 (74.338)	lr 0.02084
Train [33][320/3239]	Time 0.227 (0.493)	Data Time 0.001 (0.076)	Loss 3.1526 (3.0359)	Entropy 0.73978 (0.74000)	Top-1 acc 48.438 (51.177)	Top-5 acc 73.438 (74.357)	lr 0.02084
Train [33][330/3239]	Time 0.237 (0.490)	Data Time 0.001 (0.073)	Loss 3.0525 (3.0344)	Entropy 0.73945 (0.73999)	Top-1 acc 51.172 (51.201)	Top-5 acc 72.656 (74.408)	lr 0.02084
Train [33][340/3239]	Time 0.234 (0.487)	Data Time 0.001 (0.071)	Loss 3.0855 (3.0345)	Entropy 0.73984 (0.73998)	Top-1 acc 51.172 (51.189)	Top-5 acc 73.047 (74.372)	lr 0.02084
Train [33][350/3239]	Time 0.251 (0.485)	Data Time 0.001 (0.069)	Loss 3.1252 (3.0351)	Entropy 0.73990 (0.73997)	Top-1 acc 49.609 (51.209)	Top-5 acc 76.953 (74.370)	lr 0.02084
Train [33][360/3239]	Time 0.277 (0.483)	Data Time 0.001 (0.067)	Loss 2.8582 (3.0340)	Entropy 0.74008 (0.73997)	Top-1 acc 56.641 (51.216)	Top-5 acc 76.953 (74.388)	lr 0.02084
Train [33][370/3239]	Time 0.227 (0.481)	Data Time 0.001 (0.066)	Loss 2.9678 (3.0346)	Entropy 0.74039 (0.73998)	Top-1 acc 51.953 (51.198)	Top-5 acc 76.562 (74.383)	lr 0.02084
Train [33][380/3239]	Time 0.307 (0.479)	Data Time 0.001 (0.064)	Loss 2.9965 (3.0341)	Entropy 0.74055 (0.73999)	Top-1 acc 51.172 (51.190)	Top-5 acc 75.391 (74.387)	lr 0.02084
Train [33][390/3239]	Time 0.239 (0.478)	Data Time 0.001 (0.062)	Loss 3.0627 (3.0341)	Entropy 0.74043 (0.74001)	Top-1 acc 50.391 (51.160)	Top-5 acc 71.094 (74.378)	lr 0.02083
Train [33][400/3239]	Time 0.266 (0.476)	Data Time 0.001 (0.061)	Loss 3.1117 (3.0347)	Entropy 0.74029 (0.74002)	Top-1 acc 46.484 (51.132)	Top-5 acc 72.656 (74.355)	lr 0.02083
Train [33][410/3239]	Time 0.232 (0.475)	Data Time 0.001 (0.060)	Loss 2.9402 (3.0332)	Entropy 0.73995 (0.74002)	Top-1 acc 51.562 (51.173)	Top-5 acc 76.953 (74.375)	lr 0.02083
Train [33][420/3239]	Time 0.226 (0.473)	Data Time 0.001 (0.058)	Loss 2.9105 (3.0322)	Entropy 0.73999 (0.74002)	Top-1 acc 54.297 (51.193)	Top-5 acc 75.391 (74.380)	lr 0.02083
Train [33][430/3239]	Time 0.229 (0.472)	Data Time 0.001 (0.057)	Loss 2.9361 (3.0316)	Entropy 0.74024 (0.74002)	Top-1 acc 53.516 (51.202)	Top-5 acc 76.562 (74.397)	lr 0.02083
Train [33][440/3239]	Time 0.382 (0.531)	Data Time 0.006 (0.056)	Loss 3.1458 (3.0315)	Entropy 0.73996 (0.74002)	Top-1 acc 48.828 (51.208)	Top-5 acc 73.828 (74.410)	lr 0.02083
Train [33][450/3239]	Time 0.312 (0.528)	Data Time 0.002 (0.054)	Loss 2.8850 (3.0311)	Entropy 0.74015 (0.74002)	Top-1 acc 54.688 (51.205)	Top-5 acc 75.781 (74.426)	lr 0.02083
Train [33][460/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.053)	Loss 3.0537 (3.0316)	Entropy 0.74040 (0.74003)	Top-1 acc 53.125 (51.182)	Top-5 acc 71.875 (74.420)	lr 0.02083
Train [33][470/3239]	Time 0.250 (0.523)	Data Time 0.002 (0.052)	Loss 2.9918 (3.0326)	Entropy 0.74046 (0.74004)	Top-1 acc 50.781 (51.161)	Top-5 acc 75.781 (74.404)	lr 0.02083
Train [33][480/3239]	Time 0.238 (0.521)	Data Time 0.001 (0.051)	Loss 2.9842 (3.0316)	Entropy 0.74018 (0.74004)	Top-1 acc 50.391 (51.169)	Top-5 acc 76.953 (74.436)	lr 0.02083
Train [33][490/3239]	Time 0.276 (0.519)	Data Time 0.003 (0.050)	Loss 2.8493 (3.0299)	Entropy 0.74029 (0.74005)	Top-1 acc 55.469 (51.222)	Top-5 acc 76.562 (74.467)	lr 0.02083
Train [33][500/3239]	Time 0.239 (0.518)	Data Time 0.001 (0.049)	Loss 3.1510 (3.0307)	Entropy 0.74039 (0.74005)	Top-1 acc 50.391 (51.213)	Top-5 acc 72.266 (74.451)	lr 0.02083
Train [33][510/3239]	Time 0.265 (0.516)	Data Time 0.001 (0.048)	Loss 3.0279 (3.0303)	Entropy 0.74060 (0.74006)	Top-1 acc 50.781 (51.236)	Top-5 acc 73.828 (74.463)	lr 0.02083
Train [33][520/3239]	Time 0.270 (0.514)	Data Time 0.001 (0.047)	Loss 3.1825 (3.0316)	Entropy 0.74092 (0.74007)	Top-1 acc 48.828 (51.220)	Top-5 acc 74.219 (74.442)	lr 0.02083
Train [33][530/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.047)	Loss 2.8555 (3.0313)	Entropy 0.74097 (0.74009)	Top-1 acc 53.906 (51.212)	Top-5 acc 77.734 (74.448)	lr 0.02082
Train [33][540/3239]	Time 0.242 (0.510)	Data Time 0.001 (0.046)	Loss 2.9813 (3.0306)	Entropy 0.74035 (0.74010)	Top-1 acc 48.828 (51.209)	Top-5 acc 73.438 (74.451)	lr 0.02082
Train [33][550/3239]	Time 0.236 (0.508)	Data Time 0.001 (0.045)	Loss 2.9705 (3.0305)	Entropy 0.74042 (0.74010)	Top-1 acc 54.297 (51.212)	Top-5 acc 76.562 (74.452)	lr 0.02082
Train [33][560/3239]	Time 0.212 (0.506)	Data Time 0.001 (0.044)	Loss 3.3688 (3.0301)	Entropy 0.74068 (0.74011)	Top-1 acc 42.578 (51.237)	Top-5 acc 65.625 (74.462)	lr 0.02082
Train [33][570/3239]	Time 0.262 (0.505)	Data Time 0.001 (0.043)	Loss 2.9764 (3.0293)	Entropy 0.74076 (0.74012)	Top-1 acc 53.516 (51.244)	Top-5 acc 74.609 (74.483)	lr 0.02082
Train [33][580/3239]	Time 0.234 (0.503)	Data Time 0.001 (0.043)	Loss 2.9918 (3.0281)	Entropy 0.74105 (0.74013)	Top-1 acc 51.953 (51.279)	Top-5 acc 76.172 (74.511)	lr 0.02082
Train [33][590/3239]	Time 0.262 (0.501)	Data Time 0.001 (0.042)	Loss 2.9867 (3.0281)	Entropy 0.74055 (0.74015)	Top-1 acc 49.219 (51.280)	Top-5 acc 75.000 (74.516)	lr 0.02082
Train [33][600/3239]	Time 0.227 (0.500)	Data Time 0.001 (0.041)	Loss 3.0773 (3.0290)	Entropy 0.74056 (0.74015)	Top-1 acc 51.172 (51.268)	Top-5 acc 73.438 (74.488)	lr 0.02082
Train [33][610/3239]	Time 0.315 (0.498)	Data Time 0.001 (0.041)	Loss 3.2005 (3.0297)	Entropy 0.74036 (0.74016)	Top-1 acc 48.438 (51.249)	Top-5 acc 69.922 (74.480)	lr 0.02082
Train [33][620/3239]	Time 0.217 (0.496)	Data Time 0.001 (0.040)	Loss 2.9389 (3.0295)	Entropy 0.74017 (0.74016)	Top-1 acc 50.391 (51.249)	Top-5 acc 76.953 (74.476)	lr 0.02082
Train [33][630/3239]	Time 0.225 (0.495)	Data Time 0.001 (0.039)	Loss 2.9272 (3.0290)	Entropy 0.74027 (0.74016)	Top-1 acc 53.906 (51.255)	Top-5 acc 75.391 (74.487)	lr 0.02082
Train [33][640/3239]	Time 0.242 (0.494)	Data Time 0.001 (0.039)	Loss 2.8986 (3.0297)	Entropy 0.74012 (0.74016)	Top-1 acc 51.562 (51.241)	Top-5 acc 74.609 (74.463)	lr 0.02082
Train [33][650/3239]	Time 0.234 (0.492)	Data Time 0.001 (0.038)	Loss 2.8100 (3.0287)	Entropy 0.73979 (0.74016)	Top-1 acc 55.469 (51.270)	Top-5 acc 78.516 (74.474)	lr 0.02082
Train [33][660/3239]	Time 0.219 (0.491)	Data Time 0.001 (0.038)	Loss 2.8983 (3.0293)	Entropy 0.73966 (0.74015)	Top-1 acc 54.297 (51.267)	Top-5 acc 78.516 (74.459)	lr 0.02081
Train [33][670/3239]	Time 0.275 (0.490)	Data Time 0.004 (0.037)	Loss 3.4082 (3.0295)	Entropy 0.73954 (0.74014)	Top-1 acc 40.234 (51.262)	Top-5 acc 64.453 (74.448)	lr 0.02081
Train [33][680/3239]	Time 0.392 (0.489)	Data Time 0.002 (0.037)	Loss 2.9490 (3.0296)	Entropy 0.73976 (0.74013)	Top-1 acc 54.688 (51.265)	Top-5 acc 74.219 (74.440)	lr 0.02081
Train [33][690/3239]	Time 0.220 (0.488)	Data Time 0.001 (0.036)	Loss 3.1430 (3.0299)	Entropy 0.73998 (0.74013)	Top-1 acc 48.047 (51.254)	Top-5 acc 74.219 (74.429)	lr 0.02081
Train [33][700/3239]	Time 0.233 (0.487)	Data Time 0.001 (0.036)	Loss 2.9559 (3.0305)	Entropy 0.73964 (0.74013)	Top-1 acc 49.609 (51.244)	Top-5 acc 73.438 (74.405)	lr 0.02081
Train [33][710/3239]	Time 0.237 (0.486)	Data Time 0.001 (0.035)	Loss 3.0124 (3.0310)	Entropy 0.73986 (0.74012)	Top-1 acc 51.953 (51.236)	Top-5 acc 75.391 (74.398)	lr 0.02081
Train [33][720/3239]	Time 0.232 (0.485)	Data Time 0.001 (0.035)	Loss 3.1243 (3.0307)	Entropy 0.73954 (0.74012)	Top-1 acc 46.094 (51.254)	Top-5 acc 71.484 (74.392)	lr 0.02081
Train [33][730/3239]	Time 0.258 (0.484)	Data Time 0.002 (0.034)	Loss 3.0069 (3.0305)	Entropy 0.73951 (0.74011)	Top-1 acc 53.516 (51.263)	Top-5 acc 75.391 (74.390)	lr 0.02081
Train [33][740/3239]	Time 0.229 (0.483)	Data Time 0.001 (0.034)	Loss 2.8941 (3.0300)	Entropy 0.73952 (0.74010)	Top-1 acc 56.250 (51.270)	Top-5 acc 76.953 (74.408)	lr 0.02081
Train [33][750/3239]	Time 0.231 (0.482)	Data Time 0.001 (0.033)	Loss 3.1005 (3.0311)	Entropy 0.73947 (0.74010)	Top-1 acc 51.172 (51.244)	Top-5 acc 73.047 (74.394)	lr 0.02081
Train [33][760/3239]	Time 0.225 (0.481)	Data Time 0.001 (0.033)	Loss 2.9071 (3.0297)	Entropy 0.73976 (0.74009)	Top-1 acc 53.125 (51.263)	Top-5 acc 76.953 (74.418)	lr 0.02081
Train [33][770/3239]	Time 0.322 (0.480)	Data Time 0.001 (0.033)	Loss 2.9898 (3.0303)	Entropy 0.73909 (0.74008)	Top-1 acc 50.781 (51.248)	Top-5 acc 76.953 (74.401)	lr 0.02081
Train [33][780/3239]	Time 0.234 (0.479)	Data Time 0.001 (0.032)	Loss 3.0954 (3.0295)	Entropy 0.73905 (0.74007)	Top-1 acc 49.609 (51.262)	Top-5 acc 72.656 (74.418)	lr 0.02081
Train [33][790/3239]	Time 0.261 (0.479)	Data Time 0.001 (0.032)	Loss 2.7559 (3.0299)	Entropy 0.73902 (0.74006)	Top-1 acc 58.594 (51.263)	Top-5 acc 77.734 (74.413)	lr 0.02080
Train [33][800/3239]	Time 0.228 (0.478)	Data Time 0.001 (0.031)	Loss 3.0499 (3.0304)	Entropy 0.73905 (0.74004)	Top-1 acc 55.078 (51.252)	Top-5 acc 73.047 (74.410)	lr 0.02080
Train [33][810/3239]	Time 0.226 (0.477)	Data Time 0.001 (0.031)	Loss 3.0481 (3.0311)	Entropy 0.73892 (0.74003)	Top-1 acc 48.047 (51.235)	Top-5 acc 77.344 (74.403)	lr 0.02080
Train [33][820/3239]	Time 0.234 (0.476)	Data Time 0.001 (0.031)	Loss 3.1794 (3.0309)	Entropy 0.73900 (0.74002)	Top-1 acc 44.922 (51.244)	Top-5 acc 75.391 (74.411)	lr 0.02080
Train [33][830/3239]	Time 0.231 (0.475)	Data Time 0.001 (0.030)	Loss 3.0937 (3.0304)	Entropy 0.73871 (0.74001)	Top-1 acc 49.219 (51.252)	Top-5 acc 74.219 (74.419)	lr 0.02080
Train [33][840/3239]	Time 0.325 (0.474)	Data Time 0.001 (0.030)	Loss 3.1158 (3.0299)	Entropy 0.73840 (0.73999)	Top-1 acc 49.609 (51.278)	Top-5 acc 73.438 (74.429)	lr 0.02080
Train [33][850/3239]	Time 0.231 (0.473)	Data Time 0.001 (0.030)	Loss 3.0921 (3.0297)	Entropy 0.73844 (0.73997)	Top-1 acc 50.391 (51.291)	Top-5 acc 74.219 (74.424)	lr 0.02080
Train [33][860/3239]	Time 0.222 (0.472)	Data Time 0.001 (0.029)	Loss 3.2615 (3.0306)	Entropy 0.73792 (0.73995)	Top-1 acc 48.828 (51.268)	Top-5 acc 73.047 (74.417)	lr 0.02080
Train [33][870/3239]	Time 0.231 (0.471)	Data Time 0.001 (0.029)	Loss 2.9077 (3.0301)	Entropy 0.73806 (0.73993)	Top-1 acc 53.125 (51.281)	Top-5 acc 76.953 (74.416)	lr 0.02080
Train [33][880/3239]	Time 0.213 (0.470)	Data Time 0.001 (0.029)	Loss 3.1168 (3.0305)	Entropy 0.73823 (0.73991)	Top-1 acc 49.219 (51.269)	Top-5 acc 73.828 (74.410)	lr 0.02080
Train [33][890/3239]	Time 0.255 (0.470)	Data Time 0.002 (0.028)	Loss 3.1662 (3.0313)	Entropy 0.73780 (0.73989)	Top-1 acc 46.875 (51.245)	Top-5 acc 72.656 (74.398)	lr 0.02080
Train [33][900/3239]	Time 0.217 (0.469)	Data Time 0.001 (0.028)	Loss 3.2749 (3.0310)	Entropy 0.73771 (0.73986)	Top-1 acc 48.047 (51.244)	Top-5 acc 69.531 (74.404)	lr 0.02080
Train [33][910/3239]	Time 0.226 (0.468)	Data Time 0.001 (0.028)	Loss 3.1452 (3.0314)	Entropy 0.73800 (0.73984)	Top-1 acc 53.906 (51.246)	Top-5 acc 71.875 (74.410)	lr 0.02080
Train [33][920/3239]	Time 0.221 (0.468)	Data Time 0.001 (0.028)	Loss 3.2389 (3.0315)	Entropy 0.73807 (0.73982)	Top-1 acc 50.781 (51.243)	Top-5 acc 69.922 (74.418)	lr 0.02079
Train [33][930/3239]	Time 0.307 (0.467)	Data Time 0.001 (0.027)	Loss 2.9608 (3.0316)	Entropy 0.73768 (0.73980)	Top-1 acc 56.250 (51.248)	Top-5 acc 75.781 (74.411)	lr 0.02079
Train [33][940/3239]	Time 0.220 (0.466)	Data Time 0.001 (0.027)	Loss 2.8538 (3.0316)	Entropy 0.73735 (0.73978)	Top-1 acc 55.469 (51.244)	Top-5 acc 76.562 (74.409)	lr 0.02079
Train [33][950/3239]	Time 0.220 (0.465)	Data Time 0.001 (0.027)	Loss 2.7271 (3.0312)	Entropy 0.73720 (0.73975)	Top-1 acc 58.984 (51.245)	Top-5 acc 81.250 (74.420)	lr 0.02079
Train [33][960/3239]	Time 0.231 (0.465)	Data Time 0.001 (0.026)	Loss 2.8530 (3.0313)	Entropy 0.73708 (0.73973)	Top-1 acc 58.203 (51.248)	Top-5 acc 77.734 (74.420)	lr 0.02079
Train [33][970/3239]	Time 0.228 (0.464)	Data Time 0.001 (0.026)	Loss 3.1675 (3.0314)	Entropy 0.73710 (0.73970)	Top-1 acc 47.656 (51.244)	Top-5 acc 73.438 (74.422)	lr 0.02079
Train [33][980/3239]	Time 0.222 (0.463)	Data Time 0.001 (0.026)	Loss 3.0080 (3.0315)	Entropy 0.73693 (0.73967)	Top-1 acc 52.344 (51.247)	Top-5 acc 72.266 (74.421)	lr 0.02079
Train [33][990/3239]	Time 0.249 (0.463)	Data Time 0.001 (0.026)	Loss 3.1636 (3.0317)	Entropy 0.73658 (0.73964)	Top-1 acc 50.781 (51.251)	Top-5 acc 70.703 (74.415)	lr 0.02079
Train [33][1000/3239]	Time 0.313 (0.462)	Data Time 0.001 (0.025)	Loss 2.9045 (3.0307)	Entropy 0.73698 (0.73961)	Top-1 acc 52.344 (51.280)	Top-5 acc 76.172 (74.426)	lr 0.02079
Train [33][1010/3239]	Time 0.229 (0.462)	Data Time 0.001 (0.025)	Loss 2.9471 (3.0312)	Entropy 0.73712 (0.73958)	Top-1 acc 53.516 (51.267)	Top-5 acc 76.172 (74.416)	lr 0.02079
Train [33][1020/3239]	Time 0.214 (0.461)	Data Time 0.001 (0.025)	Loss 2.8103 (3.0310)	Entropy 0.73742 (0.73956)	Top-1 acc 55.469 (51.271)	Top-5 acc 77.734 (74.411)	lr 0.02079
Train [33][1030/3239]	Time 0.220 (0.460)	Data Time 0.001 (0.025)	Loss 2.8868 (3.0313)	Entropy 0.73752 (0.73954)	Top-1 acc 55.469 (51.270)	Top-5 acc 74.609 (74.407)	lr 0.02079
Train [33][1040/3239]	Time 0.224 (0.460)	Data Time 0.001 (0.025)	Loss 3.0741 (3.0312)	Entropy 0.73777 (0.73952)	Top-1 acc 50.391 (51.270)	Top-5 acc 74.609 (74.419)	lr 0.02079
Train [33][1050/3239]	Time 0.240 (0.459)	Data Time 0.001 (0.024)	Loss 2.7697 (3.0308)	Entropy 0.73764 (0.73951)	Top-1 acc 56.641 (51.278)	Top-5 acc 82.812 (74.428)	lr 0.02079
Train [33][1060/3239]	Time 0.232 (0.459)	Data Time 0.001 (0.024)	Loss 3.0465 (3.0315)	Entropy 0.73783 (0.73949)	Top-1 acc 51.562 (51.253)	Top-5 acc 73.828 (74.413)	lr 0.02078
Train [33][1070/3239]	Time 0.229 (0.458)	Data Time 0.001 (0.024)	Loss 2.8586 (3.0320)	Entropy 0.73784 (0.73947)	Top-1 acc 54.688 (51.241)	Top-5 acc 78.906 (74.412)	lr 0.02078
Train [33][1080/3239]	Time 0.230 (0.457)	Data Time 0.001 (0.024)	Loss 3.1157 (3.0326)	Entropy 0.73779 (0.73946)	Top-1 acc 48.438 (51.231)	Top-5 acc 76.953 (74.402)	lr 0.02078
Train [33][1090/3239]	Time 0.482 (0.481)	Data Time 0.005 (0.024)	Loss 3.0553 (3.0328)	Entropy 0.73753 (0.73944)	Top-1 acc 54.688 (51.241)	Top-5 acc 70.312 (74.396)	lr 0.02078
Train [33][1100/3239]	Time 0.267 (0.481)	Data Time 0.004 (0.023)	Loss 2.9101 (3.0328)	Entropy 0.73746 (0.73942)	Top-1 acc 54.688 (51.245)	Top-5 acc 75.391 (74.397)	lr 0.02078
Train [33][1110/3239]	Time 0.236 (0.480)	Data Time 0.002 (0.023)	Loss 2.8730 (3.0333)	Entropy 0.73746 (0.73941)	Top-1 acc 55.859 (51.236)	Top-5 acc 76.562 (74.383)	lr 0.02078
Train [33][1120/3239]	Time 0.226 (0.480)	Data Time 0.001 (0.023)	Loss 2.9080 (3.0334)	Entropy 0.73737 (0.73939)	Top-1 acc 53.906 (51.235)	Top-5 acc 77.344 (74.380)	lr 0.02078
Train [33][1130/3239]	Time 0.231 (0.479)	Data Time 0.001 (0.023)	Loss 3.0722 (3.0337)	Entropy 0.73749 (0.73937)	Top-1 acc 50.000 (51.232)	Top-5 acc 73.828 (74.370)	lr 0.02078
Train [33][1140/3239]	Time 0.221 (0.479)	Data Time 0.001 (0.023)	Loss 2.9260 (3.0331)	Entropy 0.73727 (0.73935)	Top-1 acc 54.297 (51.243)	Top-5 acc 73.047 (74.377)	lr 0.02078
Train [33][1150/3239]	Time 0.218 (0.478)	Data Time 0.001 (0.022)	Loss 3.0279 (3.0332)	Entropy 0.73733 (0.73934)	Top-1 acc 51.562 (51.236)	Top-5 acc 73.047 (74.377)	lr 0.02078
Train [33][1160/3239]	Time 0.326 (0.477)	Data Time 0.001 (0.022)	Loss 3.1492 (3.0332)	Entropy 0.73730 (0.73932)	Top-1 acc 51.562 (51.239)	Top-5 acc 74.219 (74.374)	lr 0.02078
Train [33][1170/3239]	Time 0.221 (0.477)	Data Time 0.001 (0.022)	Loss 2.9724 (3.0334)	Entropy 0.73714 (0.73930)	Top-1 acc 51.562 (51.242)	Top-5 acc 75.391 (74.365)	lr 0.02078
Train [33][1180/3239]	Time 0.248 (0.476)	Data Time 0.001 (0.022)	Loss 3.1643 (3.0334)	Entropy 0.73690 (0.73928)	Top-1 acc 47.656 (51.240)	Top-5 acc 72.656 (74.363)	lr 0.02078
Train [33][1190/3239]	Time 0.217 (0.476)	Data Time 0.001 (0.022)	Loss 2.7973 (3.0336)	Entropy 0.73651 (0.73926)	Top-1 acc 51.953 (51.225)	Top-5 acc 80.469 (74.360)	lr 0.02077
Train [33][1200/3239]	Time 0.248 (0.475)	Data Time 0.001 (0.022)	Loss 3.1390 (3.0337)	Entropy 0.73673 (0.73924)	Top-1 acc 50.000 (51.217)	Top-5 acc 68.750 (74.356)	lr 0.02077
Train [33][1210/3239]	Time 0.239 (0.475)	Data Time 0.001 (0.021)	Loss 3.1258 (3.0343)	Entropy 0.73654 (0.73922)	Top-1 acc 49.609 (51.206)	Top-5 acc 71.484 (74.337)	lr 0.02077
Train [33][1220/3239]	Time 0.232 (0.475)	Data Time 0.001 (0.021)	Loss 2.9666 (3.0341)	Entropy 0.73643 (0.73920)	Top-1 acc 50.781 (51.207)	Top-5 acc 76.172 (74.340)	lr 0.02077
Train [33][1230/3239]	Time 0.237 (0.474)	Data Time 0.001 (0.021)	Loss 3.3636 (3.0346)	Entropy 0.73630 (0.73917)	Top-1 acc 44.922 (51.195)	Top-5 acc 69.531 (74.333)	lr 0.02077
Train [33][1240/3239]	Time 0.248 (0.474)	Data Time 0.002 (0.021)	Loss 2.7909 (3.0347)	Entropy 0.73608 (0.73915)	Top-1 acc 55.078 (51.191)	Top-5 acc 80.078 (74.329)	lr 0.02077
Train [33][1250/3239]	Time 0.255 (0.473)	Data Time 0.001 (0.021)	Loss 3.1207 (3.0351)	Entropy 0.73623 (0.73912)	Top-1 acc 46.875 (51.178)	Top-5 acc 72.266 (74.319)	lr 0.02077
Train [33][1260/3239]	Time 0.254 (0.473)	Data Time 0.001 (0.021)	Loss 2.9715 (3.0349)	Entropy 0.73629 (0.73910)	Top-1 acc 52.734 (51.188)	Top-5 acc 76.172 (74.323)	lr 0.02077
Train [33][1270/3239]	Time 0.225 (0.472)	Data Time 0.001 (0.020)	Loss 3.2004 (3.0354)	Entropy 0.73639 (0.73908)	Top-1 acc 46.484 (51.179)	Top-5 acc 69.531 (74.310)	lr 0.02077
Train [33][1280/3239]	Time 0.232 (0.472)	Data Time 0.001 (0.020)	Loss 3.0907 (3.0350)	Entropy 0.73633 (0.73906)	Top-1 acc 51.953 (51.184)	Top-5 acc 71.875 (74.308)	lr 0.02077
Train [33][1290/3239]	Time 0.223 (0.471)	Data Time 0.001 (0.020)	Loss 3.1520 (3.0353)	Entropy 0.73609 (0.73904)	Top-1 acc 47.266 (51.176)	Top-5 acc 71.484 (74.307)	lr 0.02077
Train [33][1300/3239]	Time 0.239 (0.471)	Data Time 0.001 (0.020)	Loss 3.0133 (3.0354)	Entropy 0.73558 (0.73901)	Top-1 acc 51.953 (51.176)	Top-5 acc 75.391 (74.312)	lr 0.02077
Train [33][1310/3239]	Time 0.220 (0.470)	Data Time 0.001 (0.020)	Loss 3.0351 (3.0354)	Entropy 0.73545 (0.73898)	Top-1 acc 49.219 (51.167)	Top-5 acc 74.609 (74.305)	lr 0.02077
Train [33][1320/3239]	Time 0.319 (0.470)	Data Time 0.001 (0.020)	Loss 3.1442 (3.0361)	Entropy 0.73525 (0.73896)	Top-1 acc 51.172 (51.148)	Top-5 acc 73.828 (74.295)	lr 0.02076
Train [33][1330/3239]	Time 0.230 (0.469)	Data Time 0.001 (0.020)	Loss 2.9050 (3.0353)	Entropy 0.73540 (0.73893)	Top-1 acc 55.469 (51.168)	Top-5 acc 77.344 (74.308)	lr 0.02076
Train [33][1340/3239]	Time 0.225 (0.469)	Data Time 0.001 (0.019)	Loss 3.0033 (3.0352)	Entropy 0.73552 (0.73890)	Top-1 acc 48.047 (51.174)	Top-5 acc 75.000 (74.312)	lr 0.02076
Train [33][1350/3239]	Time 0.225 (0.468)	Data Time 0.001 (0.019)	Loss 3.0033 (3.0350)	Entropy 0.73526 (0.73888)	Top-1 acc 51.953 (51.180)	Top-5 acc 75.781 (74.319)	lr 0.02076
Train [33][1360/3239]	Time 0.230 (0.468)	Data Time 0.001 (0.019)	Loss 2.7421 (3.0348)	Entropy 0.73551 (0.73885)	Top-1 acc 56.641 (51.179)	Top-5 acc 80.859 (74.328)	lr 0.02076
Train [33][1370/3239]	Time 0.227 (0.467)	Data Time 0.001 (0.019)	Loss 3.0469 (3.0350)	Entropy 0.73606 (0.73883)	Top-1 acc 51.562 (51.173)	Top-5 acc 73.438 (74.326)	lr 0.02076
Train [33][1380/3239]	Time 0.232 (0.467)	Data Time 0.001 (0.019)	Loss 3.0038 (3.0349)	Entropy 0.73644 (0.73881)	Top-1 acc 54.688 (51.174)	Top-5 acc 79.297 (74.336)	lr 0.02076
Train [33][1390/3239]	Time 0.312 (0.467)	Data Time 0.001 (0.019)	Loss 2.9944 (3.0346)	Entropy 0.73647 (0.73879)	Top-1 acc 51.953 (51.185)	Top-5 acc 76.172 (74.345)	lr 0.02076
Train [33][1400/3239]	Time 0.263 (0.466)	Data Time 0.001 (0.019)	Loss 2.8007 (3.0344)	Entropy 0.73631 (0.73878)	Top-1 acc 57.031 (51.193)	Top-5 acc 77.344 (74.343)	lr 0.02076
Train [33][1410/3239]	Time 0.227 (0.466)	Data Time 0.001 (0.019)	Loss 3.3184 (3.0348)	Entropy 0.73652 (0.73876)	Top-1 acc 44.922 (51.180)	Top-5 acc 68.359 (74.331)	lr 0.02076
Train [33][1420/3239]	Time 0.221 (0.465)	Data Time 0.001 (0.018)	Loss 3.0195 (3.0350)	Entropy 0.73684 (0.73874)	Top-1 acc 52.344 (51.182)	Top-5 acc 72.656 (74.333)	lr 0.02076
Train [33][1430/3239]	Time 0.221 (0.465)	Data Time 0.001 (0.018)	Loss 3.0264 (3.0350)	Entropy 0.73629 (0.73873)	Top-1 acc 52.344 (51.183)	Top-5 acc 72.266 (74.335)	lr 0.02076
Train [33][1440/3239]	Time 0.227 (0.464)	Data Time 0.001 (0.018)	Loss 2.9620 (3.0346)	Entropy 0.73613 (0.73871)	Top-1 acc 53.906 (51.188)	Top-5 acc 74.609 (74.337)	lr 0.02076
Train [33][1450/3239]	Time 0.222 (0.464)	Data Time 0.001 (0.018)	Loss 3.0928 (3.0347)	Entropy 0.73628 (0.73869)	Top-1 acc 55.078 (51.193)	Top-5 acc 73.828 (74.337)	lr 0.02075
Train [33][1460/3239]	Time 0.233 (0.464)	Data Time 0.001 (0.018)	Loss 3.0586 (3.0344)	Entropy 0.73632 (0.73868)	Top-1 acc 48.828 (51.204)	Top-5 acc 71.875 (74.338)	lr 0.02075
Train [33][1470/3239]	Time 0.237 (0.463)	Data Time 0.001 (0.018)	Loss 3.0194 (3.0342)	Entropy 0.73624 (0.73866)	Top-1 acc 52.344 (51.205)	Top-5 acc 75.781 (74.337)	lr 0.02075
Train [33][1480/3239]	Time 0.332 (0.463)	Data Time 0.001 (0.018)	Loss 3.0679 (3.0342)	Entropy 0.73603 (0.73864)	Top-1 acc 51.953 (51.214)	Top-5 acc 73.047 (74.340)	lr 0.02075
Train [33][1490/3239]	Time 0.224 (0.462)	Data Time 0.001 (0.018)	Loss 2.9211 (3.0343)	Entropy 0.73588 (0.73863)	Top-1 acc 56.641 (51.208)	Top-5 acc 78.516 (74.343)	lr 0.02075
Train [33][1500/3239]	Time 0.226 (0.462)	Data Time 0.001 (0.018)	Loss 3.1513 (3.0344)	Entropy 0.73554 (0.73861)	Top-1 acc 48.438 (51.202)	Top-5 acc 71.484 (74.341)	lr 0.02075
Train [33][1510/3239]	Time 0.223 (0.462)	Data Time 0.001 (0.017)	Loss 3.0305 (3.0339)	Entropy 0.73511 (0.73859)	Top-1 acc 53.516 (51.217)	Top-5 acc 76.172 (74.353)	lr 0.02075
Train [33][1520/3239]	Time 0.230 (0.461)	Data Time 0.001 (0.017)	Loss 3.0746 (3.0339)	Entropy 0.73491 (0.73856)	Top-1 acc 49.219 (51.213)	Top-5 acc 69.922 (74.355)	lr 0.02075
Train [33][1530/3239]	Time 0.220 (0.461)	Data Time 0.001 (0.017)	Loss 2.9244 (3.0340)	Entropy 0.73451 (0.73854)	Top-1 acc 55.078 (51.204)	Top-5 acc 75.000 (74.353)	lr 0.02075
Train [33][1540/3239]	Time 0.232 (0.460)	Data Time 0.001 (0.017)	Loss 3.0362 (3.0338)	Entropy 0.73488 (0.73851)	Top-1 acc 50.781 (51.205)	Top-5 acc 73.828 (74.357)	lr 0.02075
Train [33][1550/3239]	Time 0.316 (0.460)	Data Time 0.001 (0.017)	Loss 3.3478 (3.0345)	Entropy 0.73506 (0.73849)	Top-1 acc 41.797 (51.184)	Top-5 acc 68.750 (74.344)	lr 0.02075
Train [33][1560/3239]	Time 0.223 (0.460)	Data Time 0.001 (0.017)	Loss 3.1412 (3.0352)	Entropy 0.73525 (0.73847)	Top-1 acc 51.562 (51.178)	Top-5 acc 71.875 (74.328)	lr 0.02075
Train [33][1570/3239]	Time 0.221 (0.459)	Data Time 0.001 (0.017)	Loss 2.7894 (3.0349)	Entropy 0.73496 (0.73845)	Top-1 acc 57.031 (51.186)	Top-5 acc 78.125 (74.331)	lr 0.02075
Train [33][1580/3239]	Time 0.224 (0.459)	Data Time 0.001 (0.017)	Loss 3.0742 (3.0350)	Entropy 0.73478 (0.73842)	Top-1 acc 49.219 (51.181)	Top-5 acc 73.438 (74.332)	lr 0.02074
Train [33][1590/3239]	Time 0.225 (0.459)	Data Time 0.001 (0.017)	Loss 2.8794 (3.0346)	Entropy 0.73444 (0.73840)	Top-1 acc 53.906 (51.184)	Top-5 acc 74.609 (74.335)	lr 0.02074
Train [33][1600/3239]	Time 0.227 (0.458)	Data Time 0.001 (0.017)	Loss 2.8427 (3.0345)	Entropy 0.73468 (0.73838)	Top-1 acc 55.469 (51.187)	Top-5 acc 78.125 (74.341)	lr 0.02074
Train [33][1610/3239]	Time 0.232 (0.458)	Data Time 0.001 (0.016)	Loss 2.8561 (3.0346)	Entropy 0.73435 (0.73835)	Top-1 acc 53.125 (51.180)	Top-5 acc 80.469 (74.343)	lr 0.02074
Train [33][1620/3239]	Time 0.232 (0.458)	Data Time 0.001 (0.016)	Loss 3.0624 (3.0347)	Entropy 0.73409 (0.73833)	Top-1 acc 48.828 (51.170)	Top-5 acc 74.609 (74.341)	lr 0.02074
Train [33][1630/3239]	Time 0.217 (0.457)	Data Time 0.001 (0.016)	Loss 3.1796 (3.0346)	Entropy 0.73429 (0.73830)	Top-1 acc 47.656 (51.175)	Top-5 acc 71.484 (74.338)	lr 0.02074
Train [33][1640/3239]	Time 0.239 (0.457)	Data Time 0.001 (0.016)	Loss 2.9665 (3.0346)	Entropy 0.73419 (0.73828)	Top-1 acc 51.172 (51.181)	Top-5 acc 78.125 (74.344)	lr 0.02074
Train [33][1650/3239]	Time 0.222 (0.456)	Data Time 0.001 (0.016)	Loss 3.2909 (3.0347)	Entropy 0.73454 (0.73825)	Top-1 acc 46.484 (51.177)	Top-5 acc 67.969 (74.342)	lr 0.02074
Train [33][1660/3239]	Time 0.232 (0.456)	Data Time 0.001 (0.016)	Loss 3.1627 (3.0346)	Entropy 0.73466 (0.73823)	Top-1 acc 48.047 (51.178)	Top-5 acc 73.047 (74.345)	lr 0.02074
Train [33][1670/3239]	Time 0.225 (0.456)	Data Time 0.001 (0.016)	Loss 3.1755 (3.0347)	Entropy 0.73514 (0.73821)	Top-1 acc 47.656 (51.172)	Top-5 acc 71.484 (74.346)	lr 0.02074
Train [33][1680/3239]	Time 0.223 (0.455)	Data Time 0.001 (0.016)	Loss 3.3216 (3.0351)	Entropy 0.73507 (0.73819)	Top-1 acc 46.875 (51.171)	Top-5 acc 71.875 (74.341)	lr 0.02074
Train [33][1690/3239]	Time 0.228 (0.455)	Data Time 0.001 (0.016)	Loss 3.1103 (3.0351)	Entropy 0.73524 (0.73818)	Top-1 acc 47.266 (51.165)	Top-5 acc 76.172 (74.344)	lr 0.02074
Train [33][1700/3239]	Time 0.226 (0.455)	Data Time 0.001 (0.016)	Loss 3.2258 (3.0348)	Entropy 0.73519 (0.73816)	Top-1 acc 47.266 (51.167)	Top-5 acc 73.047 (74.353)	lr 0.02074
Train [33][1710/3239]	Time 0.326 (0.455)	Data Time 0.001 (0.016)	Loss 2.9449 (3.0346)	Entropy 0.73507 (0.73814)	Top-1 acc 52.344 (51.174)	Top-5 acc 74.609 (74.357)	lr 0.02073
Train [33][1720/3239]	Time 0.246 (0.454)	Data Time 0.001 (0.016)	Loss 3.0806 (3.0346)	Entropy 0.73512 (0.73812)	Top-1 acc 51.953 (51.176)	Top-5 acc 72.266 (74.356)	lr 0.02073
Train [33][1730/3239]	Time 0.229 (0.454)	Data Time 0.001 (0.015)	Loss 3.1601 (3.0346)	Entropy 0.73520 (0.73811)	Top-1 acc 50.391 (51.176)	Top-5 acc 73.828 (74.355)	lr 0.02073
Train [33][1740/3239]	Time 0.227 (0.454)	Data Time 0.001 (0.015)	Loss 3.0180 (3.0346)	Entropy 0.73500 (0.73809)	Top-1 acc 52.344 (51.174)	Top-5 acc 75.000 (74.355)	lr 0.02073
Train [33][1750/3239]	Time 0.238 (0.469)	Data Time 0.002 (0.015)	Loss 3.0108 (3.0342)	Entropy 0.73507 (0.73807)	Top-1 acc 50.781 (51.181)	Top-5 acc 73.438 (74.361)	lr 0.02073
Train [33][1760/3239]	Time 0.230 (0.469)	Data Time 0.002 (0.015)	Loss 3.0933 (3.0345)	Entropy 0.73498 (0.73805)	Top-1 acc 55.078 (51.175)	Top-5 acc 73.047 (74.354)	lr 0.02073
Train [33][1770/3239]	Time 0.235 (0.468)	Data Time 0.001 (0.015)	Loss 3.1041 (3.0345)	Entropy 0.73494 (0.73804)	Top-1 acc 50.391 (51.173)	Top-5 acc 74.609 (74.357)	lr 0.02073
Train [33][1780/3239]	Time 0.259 (0.468)	Data Time 0.001 (0.015)	Loss 3.2127 (3.0345)	Entropy 0.73488 (0.73802)	Top-1 acc 53.125 (51.169)	Top-5 acc 70.703 (74.355)	lr 0.02073
Train [33][1790/3239]	Time 0.235 (0.468)	Data Time 0.001 (0.015)	Loss 2.7976 (3.0342)	Entropy 0.73520 (0.73800)	Top-1 acc 56.641 (51.176)	Top-5 acc 77.344 (74.362)	lr 0.02073
Train [33][1800/3239]	Time 0.316 (0.468)	Data Time 0.001 (0.015)	Loss 2.8206 (3.0343)	Entropy 0.73535 (0.73799)	Top-1 acc 56.250 (51.183)	Top-5 acc 80.469 (74.363)	lr 0.02073
Train [33][1810/3239]	Time 0.241 (0.468)	Data Time 0.001 (0.015)	Loss 3.0011 (3.0344)	Entropy 0.73561 (0.73797)	Top-1 acc 50.781 (51.176)	Top-5 acc 75.781 (74.362)	lr 0.02073
Train [33][1820/3239]	Time 0.233 (0.467)	Data Time 0.001 (0.015)	Loss 2.9918 (3.0341)	Entropy 0.73531 (0.73796)	Top-1 acc 48.047 (51.181)	Top-5 acc 76.172 (74.373)	lr 0.02073
Train [33][1830/3239]	Time 0.234 (0.467)	Data Time 0.001 (0.015)	Loss 2.9749 (3.0342)	Entropy 0.73485 (0.73794)	Top-1 acc 50.391 (51.178)	Top-5 acc 78.516 (74.368)	lr 0.02073
Train [33][1840/3239]	Time 0.225 (0.467)	Data Time 0.001 (0.015)	Loss 2.9397 (3.0346)	Entropy 0.73456 (0.73793)	Top-1 acc 55.859 (51.167)	Top-5 acc 76.562 (74.358)	lr 0.02073
Train [33][1850/3239]	Time 0.238 (0.466)	Data Time 0.001 (0.015)	Loss 2.9733 (3.0343)	Entropy 0.73438 (0.73791)	Top-1 acc 53.906 (51.178)	Top-5 acc 73.047 (74.361)	lr 0.02072
Train [33][1860/3239]	Time 0.215 (0.466)	Data Time 0.001 (0.015)	Loss 3.0337 (3.0342)	Entropy 0.73439 (0.73789)	Top-1 acc 51.172 (51.182)	Top-5 acc 73.047 (74.361)	lr 0.02072
Train [33][1870/3239]	Time 0.317 (0.466)	Data Time 0.001 (0.014)	Loss 2.9777 (3.0342)	Entropy 0.73400 (0.73787)	Top-1 acc 55.078 (51.184)	Top-5 acc 75.391 (74.360)	lr 0.02072
Train [33][1880/3239]	Time 0.229 (0.465)	Data Time 0.001 (0.014)	Loss 3.0299 (3.0340)	Entropy 0.73407 (0.73785)	Top-1 acc 50.781 (51.190)	Top-5 acc 74.219 (74.361)	lr 0.02072
Train [33][1890/3239]	Time 0.240 (0.465)	Data Time 0.001 (0.014)	Loss 2.9505 (3.0338)	Entropy 0.73461 (0.73783)	Top-1 acc 55.078 (51.197)	Top-5 acc 75.000 (74.362)	lr 0.02072
Train [33][1900/3239]	Time 0.241 (0.465)	Data Time 0.001 (0.014)	Loss 3.0549 (3.0335)	Entropy 0.73423 (0.73781)	Top-1 acc 51.562 (51.205)	Top-5 acc 73.828 (74.364)	lr 0.02072
Train [33][1910/3239]	Time 0.237 (0.465)	Data Time 0.001 (0.014)	Loss 3.3028 (3.0336)	Entropy 0.73421 (0.73779)	Top-1 acc 44.922 (51.208)	Top-5 acc 67.188 (74.361)	lr 0.02072
Train [33][1920/3239]	Time 0.289 (0.465)	Data Time 0.002 (0.014)	Loss 2.9761 (3.0332)	Entropy 0.73399 (0.73777)	Top-1 acc 50.391 (51.215)	Top-5 acc 74.609 (74.376)	lr 0.02072
Train [33][1930/3239]	Time 0.227 (0.464)	Data Time 0.001 (0.014)	Loss 3.3961 (3.0332)	Entropy 0.73349 (0.73775)	Top-1 acc 44.531 (51.215)	Top-5 acc 66.406 (74.374)	lr 0.02072
Train [33][1940/3239]	Time 0.322 (0.464)	Data Time 0.001 (0.014)	Loss 2.9947 (3.0332)	Entropy 0.73340 (0.73773)	Top-1 acc 54.688 (51.213)	Top-5 acc 75.391 (74.374)	lr 0.02072
Train [33][1950/3239]	Time 0.232 (0.464)	Data Time 0.001 (0.014)	Loss 2.8734 (3.0332)	Entropy 0.73356 (0.73771)	Top-1 acc 54.688 (51.215)	Top-5 acc 80.078 (74.375)	lr 0.02072
Train [33][1960/3239]	Time 0.261 (0.464)	Data Time 0.001 (0.014)	Loss 3.1363 (3.0336)	Entropy 0.73379 (0.73769)	Top-1 acc 46.484 (51.210)	Top-5 acc 69.141 (74.368)	lr 0.02072
Train [33][1970/3239]	Time 0.231 (0.463)	Data Time 0.001 (0.014)	Loss 3.0959 (3.0336)	Entropy 0.73379 (0.73767)	Top-1 acc 48.438 (51.209)	Top-5 acc 73.828 (74.368)	lr 0.02072
Train [33][1980/3239]	Time 0.226 (0.463)	Data Time 0.001 (0.014)	Loss 3.0665 (3.0338)	Entropy 0.73410 (0.73765)	Top-1 acc 51.562 (51.202)	Top-5 acc 73.828 (74.365)	lr 0.02071
Train [33][1990/3239]	Time 0.230 (0.463)	Data Time 0.001 (0.014)	Loss 3.0892 (3.0340)	Entropy 0.73438 (0.73763)	Top-1 acc 50.000 (51.199)	Top-5 acc 75.391 (74.362)	lr 0.02071
Train [33][2000/3239]	Time 0.242 (0.463)	Data Time 0.001 (0.014)	Loss 3.1473 (3.0342)	Entropy 0.73481 (0.73762)	Top-1 acc 49.219 (51.192)	Top-5 acc 72.656 (74.356)	lr 0.02071
Train [33][2010/3239]	Time 0.233 (0.462)	Data Time 0.001 (0.014)	Loss 2.8379 (3.0341)	Entropy 0.73521 (0.73760)	Top-1 acc 57.812 (51.196)	Top-5 acc 79.688 (74.358)	lr 0.02071
Train [33][2020/3239]	Time 0.226 (0.462)	Data Time 0.001 (0.013)	Loss 3.1442 (3.0340)	Entropy 0.73479 (0.73759)	Top-1 acc 50.391 (51.203)	Top-5 acc 68.750 (74.360)	lr 0.02071
Train [33][2030/3239]	Time 0.340 (0.462)	Data Time 0.001 (0.013)	Loss 2.9554 (3.0341)	Entropy 0.73454 (0.73758)	Top-1 acc 56.641 (51.200)	Top-5 acc 77.734 (74.359)	lr 0.02071
Train [33][2040/3239]	Time 0.234 (0.462)	Data Time 0.001 (0.013)	Loss 2.9176 (3.0339)	Entropy 0.73424 (0.73756)	Top-1 acc 53.125 (51.207)	Top-5 acc 75.391 (74.361)	lr 0.02071
Train [33][2050/3239]	Time 0.228 (0.461)	Data Time 0.001 (0.013)	Loss 2.8596 (3.0338)	Entropy 0.73414 (0.73754)	Top-1 acc 53.516 (51.215)	Top-5 acc 77.734 (74.361)	lr 0.02071
Train [33][2060/3239]	Time 0.223 (0.461)	Data Time 0.001 (0.013)	Loss 2.9393 (3.0337)	Entropy 0.73442 (0.73753)	Top-1 acc 53.906 (51.218)	Top-5 acc 75.391 (74.360)	lr 0.02071
Train [33][2070/3239]	Time 0.262 (0.461)	Data Time 0.001 (0.013)	Loss 3.2222 (3.0341)	Entropy 0.73437 (0.73751)	Top-1 acc 47.656 (51.217)	Top-5 acc 67.188 (74.355)	lr 0.02071
Train [33][2080/3239]	Time 0.229 (0.461)	Data Time 0.001 (0.013)	Loss 3.2049 (3.0344)	Entropy 0.73478 (0.73750)	Top-1 acc 48.438 (51.207)	Top-5 acc 70.703 (74.348)	lr 0.02071
Train [33][2090/3239]	Time 0.237 (0.460)	Data Time 0.001 (0.013)	Loss 2.8152 (3.0343)	Entropy 0.73434 (0.73749)	Top-1 acc 56.250 (51.206)	Top-5 acc 76.172 (74.350)	lr 0.02071
Train [33][2100/3239]	Time 0.354 (0.460)	Data Time 0.001 (0.013)	Loss 2.9437 (3.0343)	Entropy 0.73451 (0.73747)	Top-1 acc 52.344 (51.195)	Top-5 acc 75.391 (74.355)	lr 0.02071
Train [33][2110/3239]	Time 0.226 (0.460)	Data Time 0.001 (0.013)	Loss 2.9788 (3.0345)	Entropy 0.73444 (0.73746)	Top-1 acc 53.906 (51.195)	Top-5 acc 75.000 (74.349)	lr 0.02070
Train [33][2120/3239]	Time 0.231 (0.460)	Data Time 0.001 (0.013)	Loss 3.1191 (3.0342)	Entropy 0.73418 (0.73744)	Top-1 acc 53.125 (51.191)	Top-5 acc 70.312 (74.357)	lr 0.02070
Train [33][2130/3239]	Time 0.240 (0.459)	Data Time 0.001 (0.013)	Loss 3.1412 (3.0341)	Entropy 0.73449 (0.73743)	Top-1 acc 47.266 (51.193)	Top-5 acc 71.484 (74.358)	lr 0.02070
Train [33][2140/3239]	Time 0.234 (0.459)	Data Time 0.001 (0.013)	Loss 2.8923 (3.0342)	Entropy 0.73442 (0.73741)	Top-1 acc 52.734 (51.190)	Top-5 acc 76.172 (74.357)	lr 0.02070
Train [33][2150/3239]	Time 0.226 (0.459)	Data Time 0.001 (0.013)	Loss 3.0769 (3.0342)	Entropy 0.73420 (0.73740)	Top-1 acc 49.609 (51.190)	Top-5 acc 74.219 (74.355)	lr 0.02070
Train [33][2160/3239]	Time 0.236 (0.458)	Data Time 0.001 (0.013)	Loss 3.0844 (3.0343)	Entropy 0.73424 (0.73738)	Top-1 acc 47.266 (51.187)	Top-5 acc 73.828 (74.356)	lr 0.02070
Train [33][2170/3239]	Time 0.229 (0.458)	Data Time 0.001 (0.013)	Loss 2.9109 (3.0341)	Entropy 0.73414 (0.73737)	Top-1 acc 52.734 (51.188)	Top-5 acc 75.391 (74.358)	lr 0.02070
Train [33][2180/3239]	Time 0.228 (0.458)	Data Time 0.001 (0.013)	Loss 3.1773 (3.0343)	Entropy 0.73449 (0.73736)	Top-1 acc 45.312 (51.178)	Top-5 acc 71.094 (74.359)	lr 0.02070
Train [33][2190/3239]	Time 0.326 (0.458)	Data Time 0.001 (0.013)	Loss 3.1943 (3.0342)	Entropy 0.73435 (0.73734)	Top-1 acc 44.531 (51.176)	Top-5 acc 68.750 (74.361)	lr 0.02070
Train [33][2200/3239]	Time 0.258 (0.457)	Data Time 0.001 (0.013)	Loss 3.1672 (3.0343)	Entropy 0.73445 (0.73733)	Top-1 acc 45.703 (51.174)	Top-5 acc 73.438 (74.363)	lr 0.02070
Train [33][2210/3239]	Time 0.233 (0.457)	Data Time 0.001 (0.012)	Loss 2.8402 (3.0340)	Entropy 0.73407 (0.73732)	Top-1 acc 52.734 (51.181)	Top-5 acc 78.906 (74.372)	lr 0.02070
Train [33][2220/3239]	Time 0.248 (0.457)	Data Time 0.001 (0.012)	Loss 3.1252 (3.0340)	Entropy 0.73398 (0.73730)	Top-1 acc 49.219 (51.186)	Top-5 acc 72.656 (74.374)	lr 0.02070
Train [33][2230/3239]	Time 0.231 (0.457)	Data Time 0.001 (0.012)	Loss 2.8314 (3.0337)	Entropy 0.73394 (0.73729)	Top-1 acc 53.516 (51.194)	Top-5 acc 76.172 (74.377)	lr 0.02070
Train [33][2240/3239]	Time 0.230 (0.456)	Data Time 0.001 (0.012)	Loss 2.9247 (3.0336)	Entropy 0.73386 (0.73727)	Top-1 acc 51.953 (51.202)	Top-5 acc 75.000 (74.381)	lr 0.02069
Train [33][2250/3239]	Time 0.247 (0.456)	Data Time 0.001 (0.012)	Loss 3.1681 (3.0338)	Entropy 0.73337 (0.73726)	Top-1 acc 47.656 (51.201)	Top-5 acc 75.000 (74.373)	lr 0.02069
Train [33][2260/3239]	Time 0.322 (0.456)	Data Time 0.001 (0.012)	Loss 3.0183 (3.0340)	Entropy 0.73312 (0.73724)	Top-1 acc 51.562 (51.198)	Top-5 acc 71.875 (74.369)	lr 0.02069
Train [33][2270/3239]	Time 0.247 (0.456)	Data Time 0.001 (0.012)	Loss 3.0056 (3.0339)	Entropy 0.73290 (0.73722)	Top-1 acc 52.344 (51.201)	Top-5 acc 75.000 (74.372)	lr 0.02069
Train [33][2280/3239]	Time 0.252 (0.455)	Data Time 0.001 (0.012)	Loss 3.0404 (3.0341)	Entropy 0.73285 (0.73720)	Top-1 acc 48.828 (51.197)	Top-5 acc 73.438 (74.368)	lr 0.02069
Train [33][2290/3239]	Time 0.218 (0.455)	Data Time 0.001 (0.012)	Loss 3.1402 (3.0341)	Entropy 0.73267 (0.73718)	Top-1 acc 49.609 (51.195)	Top-5 acc 71.875 (74.366)	lr 0.02069
Train [33][2300/3239]	Time 0.218 (0.455)	Data Time 0.001 (0.012)	Loss 2.9526 (3.0342)	Entropy 0.73238 (0.73716)	Top-1 acc 53.125 (51.193)	Top-5 acc 76.172 (74.365)	lr 0.02069
Train [33][2310/3239]	Time 0.228 (0.455)	Data Time 0.001 (0.012)	Loss 3.1073 (3.0343)	Entropy 0.73260 (0.73714)	Top-1 acc 51.562 (51.195)	Top-5 acc 74.609 (74.365)	lr 0.02069
Train [33][2320/3239]	Time 0.224 (0.454)	Data Time 0.001 (0.012)	Loss 2.8897 (3.0343)	Entropy 0.73202 (0.73712)	Top-1 acc 55.078 (51.198)	Top-5 acc 75.781 (74.360)	lr 0.02069
Train [33][2330/3239]	Time 0.244 (0.454)	Data Time 0.001 (0.012)	Loss 3.1848 (3.0343)	Entropy 0.73218 (0.73710)	Top-1 acc 47.656 (51.194)	Top-5 acc 71.484 (74.361)	lr 0.02069
Train [33][2340/3239]	Time 0.223 (0.454)	Data Time 0.001 (0.012)	Loss 3.0892 (3.0341)	Entropy 0.73253 (0.73708)	Top-1 acc 49.609 (51.197)	Top-5 acc 74.609 (74.368)	lr 0.02069
Train [33][2350/3239]	Time 0.243 (0.454)	Data Time 0.001 (0.012)	Loss 3.0223 (3.0343)	Entropy 0.73218 (0.73706)	Top-1 acc 54.688 (51.193)	Top-5 acc 74.219 (74.363)	lr 0.02069
Train [33][2360/3239]	Time 0.233 (0.454)	Data Time 0.001 (0.012)	Loss 2.8739 (3.0340)	Entropy 0.73240 (0.73704)	Top-1 acc 57.422 (51.201)	Top-5 acc 76.953 (74.366)	lr 0.02069
Train [33][2370/3239]	Time 0.223 (0.453)	Data Time 0.001 (0.012)	Loss 3.2159 (3.0342)	Entropy 0.73232 (0.73702)	Top-1 acc 49.219 (51.201)	Top-5 acc 72.266 (74.362)	lr 0.02068
Train [33][2380/3239]	Time 0.243 (0.453)	Data Time 0.002 (0.012)	Loss 3.3939 (3.0345)	Entropy 0.73230 (0.73700)	Top-1 acc 46.484 (51.193)	Top-5 acc 67.188 (74.361)	lr 0.02068
Train [33][2390/3239]	Time 0.248 (0.453)	Data Time 0.001 (0.012)	Loss 3.0710 (3.0344)	Entropy 0.73204 (0.73698)	Top-1 acc 50.781 (51.190)	Top-5 acc 74.219 (74.365)	lr 0.02068
Train [33][2400/3239]	Time 0.332 (0.464)	Data Time 0.030 (0.012)	Loss 3.0078 (3.0345)	Entropy 0.73147 (0.73696)	Top-1 acc 52.734 (51.187)	Top-5 acc 76.172 (74.363)	lr 0.02068
Train [33][2410/3239]	Time 0.235 (0.464)	Data Time 0.002 (0.012)	Loss 2.9024 (3.0342)	Entropy 0.73161 (0.73694)	Top-1 acc 52.734 (51.192)	Top-5 acc 76.172 (74.366)	lr 0.02068
Train [33][2420/3239]	Time 0.335 (0.464)	Data Time 0.002 (0.012)	Loss 3.2379 (3.0341)	Entropy 0.73197 (0.73691)	Top-1 acc 45.312 (51.196)	Top-5 acc 70.312 (74.366)	lr 0.02068
Train [33][2430/3239]	Time 0.259 (0.464)	Data Time 0.001 (0.012)	Loss 2.9299 (3.0340)	Entropy 0.73208 (0.73689)	Top-1 acc 54.688 (51.200)	Top-5 acc 78.906 (74.368)	lr 0.02068
Train [33][2440/3239]	Time 0.245 (0.463)	Data Time 0.001 (0.011)	Loss 3.3172 (3.0342)	Entropy 0.73250 (0.73688)	Top-1 acc 43.750 (51.192)	Top-5 acc 67.578 (74.363)	lr 0.02068
Train [33][2450/3239]	Time 0.256 (0.463)	Data Time 0.001 (0.011)	Loss 2.8594 (3.0342)	Entropy 0.73283 (0.73686)	Top-1 acc 55.078 (51.191)	Top-5 acc 76.953 (74.364)	lr 0.02068
Train [33][2460/3239]	Time 0.236 (0.463)	Data Time 0.001 (0.011)	Loss 3.0122 (3.0343)	Entropy 0.73280 (0.73684)	Top-1 acc 53.125 (51.190)	Top-5 acc 75.000 (74.363)	lr 0.02068
Train [33][2470/3239]	Time 0.266 (0.463)	Data Time 0.003 (0.011)	Loss 3.0203 (3.0342)	Entropy 0.73233 (0.73683)	Top-1 acc 50.781 (51.191)	Top-5 acc 73.828 (74.363)	lr 0.02068
Train [33][2480/3239]	Time 0.233 (0.463)	Data Time 0.001 (0.011)	Loss 3.0668 (3.0342)	Entropy 0.73233 (0.73681)	Top-1 acc 52.344 (51.190)	Top-5 acc 72.266 (74.362)	lr 0.02068
Train [33][2490/3239]	Time 0.258 (0.463)	Data Time 0.001 (0.011)	Loss 3.1412 (3.0342)	Entropy 0.73171 (0.73679)	Top-1 acc 46.875 (51.194)	Top-5 acc 73.438 (74.363)	lr 0.02068
Train [33][2500/3239]	Time 0.231 (0.462)	Data Time 0.001 (0.011)	Loss 2.8210 (3.0342)	Entropy 0.73180 (0.73677)	Top-1 acc 55.859 (51.196)	Top-5 acc 78.125 (74.365)	lr 0.02067
Train [33][2510/3239]	Time 0.237 (0.462)	Data Time 0.001 (0.011)	Loss 3.0290 (3.0338)	Entropy 0.73172 (0.73675)	Top-1 acc 49.609 (51.196)	Top-5 acc 76.953 (74.373)	lr 0.02067
Train [33][2520/3239]	Time 0.234 (0.462)	Data Time 0.001 (0.011)	Loss 3.0573 (3.0339)	Entropy 0.73117 (0.73673)	Top-1 acc 52.734 (51.195)	Top-5 acc 76.562 (74.371)	lr 0.02067
Train [33][2530/3239]	Time 0.252 (0.462)	Data Time 0.001 (0.011)	Loss 3.0660 (3.0339)	Entropy 0.73087 (0.73670)	Top-1 acc 51.172 (51.201)	Top-5 acc 74.219 (74.369)	lr 0.02067
Train [33][2540/3239]	Time 0.226 (0.461)	Data Time 0.001 (0.011)	Loss 3.1526 (3.0340)	Entropy 0.73056 (0.73668)	Top-1 acc 51.562 (51.200)	Top-5 acc 71.875 (74.369)	lr 0.02067
Train [33][2550/3239]	Time 0.236 (0.461)	Data Time 0.001 (0.011)	Loss 2.9976 (3.0340)	Entropy 0.73075 (0.73666)	Top-1 acc 53.125 (51.198)	Top-5 acc 69.531 (74.365)	lr 0.02067
Train [33][2560/3239]	Time 0.222 (0.461)	Data Time 0.001 (0.011)	Loss 3.1521 (3.0341)	Entropy 0.73049 (0.73663)	Top-1 acc 47.266 (51.199)	Top-5 acc 73.047 (74.361)	lr 0.02067
Train [33][2570/3239]	Time 0.245 (0.461)	Data Time 0.001 (0.011)	Loss 2.9243 (3.0340)	Entropy 0.73013 (0.73661)	Top-1 acc 56.641 (51.203)	Top-5 acc 77.734 (74.362)	lr 0.02067
Train [33][2580/3239]	Time 0.325 (0.461)	Data Time 0.001 (0.011)	Loss 2.9483 (3.0339)	Entropy 0.73031 (0.73658)	Top-1 acc 55.469 (51.205)	Top-5 acc 73.828 (74.365)	lr 0.02067
Train [33][2590/3239]	Time 0.229 (0.460)	Data Time 0.001 (0.011)	Loss 3.2074 (3.0341)	Entropy 0.73028 (0.73656)	Top-1 acc 46.875 (51.200)	Top-5 acc 69.531 (74.361)	lr 0.02067
Train [33][2600/3239]	Time 0.237 (0.460)	Data Time 0.001 (0.011)	Loss 3.0886 (3.0339)	Entropy 0.72979 (0.73654)	Top-1 acc 51.562 (51.202)	Top-5 acc 73.828 (74.367)	lr 0.02067
Train [33][2610/3239]	Time 0.226 (0.460)	Data Time 0.001 (0.011)	Loss 3.0819 (3.0341)	Entropy 0.72964 (0.73651)	Top-1 acc 49.609 (51.196)	Top-5 acc 75.000 (74.363)	lr 0.02067
Train [33][2620/3239]	Time 0.228 (0.460)	Data Time 0.001 (0.011)	Loss 3.0303 (3.0343)	Entropy 0.72959 (0.73648)	Top-1 acc 52.734 (51.193)	Top-5 acc 74.609 (74.358)	lr 0.02067
Train [33][2630/3239]	Time 0.244 (0.460)	Data Time 0.001 (0.011)	Loss 3.0205 (3.0341)	Entropy 0.72963 (0.73646)	Top-1 acc 51.172 (51.197)	Top-5 acc 73.438 (74.362)	lr 0.02066
Train [33][2640/3239]	Time 0.219 (0.460)	Data Time 0.001 (0.011)	Loss 3.0886 (3.0340)	Entropy 0.72958 (0.73643)	Top-1 acc 49.219 (51.197)	Top-5 acc 71.875 (74.364)	lr 0.02066
Train [33][2650/3239]	Time 0.328 (0.459)	Data Time 0.001 (0.011)	Loss 2.9246 (3.0339)	Entropy 0.72963 (0.73641)	Top-1 acc 55.078 (51.200)	Top-5 acc 75.000 (74.364)	lr 0.02066
Train [33][2660/3239]	Time 0.211 (0.459)	Data Time 0.001 (0.011)	Loss 3.1331 (3.0340)	Entropy 0.72942 (0.73638)	Top-1 acc 47.656 (51.194)	Top-5 acc 73.828 (74.364)	lr 0.02066
Train [33][2670/3239]	Time 0.238 (0.459)	Data Time 0.001 (0.011)	Loss 2.9183 (3.0342)	Entropy 0.72961 (0.73635)	Top-1 acc 52.734 (51.191)	Top-5 acc 76.953 (74.360)	lr 0.02066
Train [33][2680/3239]	Time 0.263 (0.459)	Data Time 0.001 (0.011)	Loss 3.1259 (3.0343)	Entropy 0.72956 (0.73633)	Top-1 acc 46.875 (51.190)	Top-5 acc 74.219 (74.359)	lr 0.02066
Train [33][2690/3239]	Time 0.224 (0.459)	Data Time 0.001 (0.011)	Loss 2.9403 (3.0340)	Entropy 0.72993 (0.73630)	Top-1 acc 51.953 (51.196)	Top-5 acc 76.562 (74.367)	lr 0.02066
Train [33][2700/3239]	Time 0.270 (0.459)	Data Time 0.001 (0.011)	Loss 3.0925 (3.0342)	Entropy 0.72985 (0.73628)	Top-1 acc 48.828 (51.190)	Top-5 acc 72.656 (74.362)	lr 0.02066
Train [33][2710/3239]	Time 0.227 (0.458)	Data Time 0.001 (0.011)	Loss 3.2092 (3.0345)	Entropy 0.73023 (0.73626)	Top-1 acc 48.828 (51.181)	Top-5 acc 68.750 (74.358)	lr 0.02066
Train [33][2720/3239]	Time 0.224 (0.458)	Data Time 0.001 (0.010)	Loss 3.2318 (3.0344)	Entropy 0.73035 (0.73624)	Top-1 acc 48.828 (51.184)	Top-5 acc 72.656 (74.361)	lr 0.02066
Train [33][2730/3239]	Time 0.231 (0.458)	Data Time 0.001 (0.010)	Loss 2.7874 (3.0346)	Entropy 0.73044 (0.73621)	Top-1 acc 54.688 (51.181)	Top-5 acc 81.250 (74.361)	lr 0.02066
Train [33][2740/3239]	Time 0.395 (0.458)	Data Time 0.002 (0.010)	Loss 2.9277 (3.0343)	Entropy 0.73004 (0.73619)	Top-1 acc 51.172 (51.187)	Top-5 acc 78.516 (74.366)	lr 0.02066
Train [33][2750/3239]	Time 0.249 (0.458)	Data Time 0.001 (0.010)	Loss 3.2775 (3.0346)	Entropy 0.72997 (0.73617)	Top-1 acc 45.703 (51.181)	Top-5 acc 68.750 (74.360)	lr 0.02066
Train [33][2760/3239]	Time 0.226 (0.458)	Data Time 0.001 (0.010)	Loss 2.8884 (3.0346)	Entropy 0.72993 (0.73615)	Top-1 acc 51.172 (51.178)	Top-5 acc 78.516 (74.361)	lr 0.02065
Train [33][2770/3239]	Time 0.229 (0.457)	Data Time 0.001 (0.010)	Loss 3.1126 (3.0346)	Entropy 0.72986 (0.73612)	Top-1 acc 50.781 (51.178)	Top-5 acc 72.656 (74.360)	lr 0.02065
Train [33][2780/3239]	Time 0.243 (0.457)	Data Time 0.001 (0.010)	Loss 2.9765 (3.0348)	Entropy 0.72965 (0.73610)	Top-1 acc 56.641 (51.177)	Top-5 acc 73.828 (74.356)	lr 0.02065
Train [33][2790/3239]	Time 0.255 (0.457)	Data Time 0.001 (0.010)	Loss 3.0270 (3.0347)	Entropy 0.72968 (0.73608)	Top-1 acc 49.219 (51.182)	Top-5 acc 73.047 (74.358)	lr 0.02065
Train [33][2800/3239]	Time 0.239 (0.457)	Data Time 0.001 (0.010)	Loss 3.0393 (3.0344)	Entropy 0.72981 (0.73606)	Top-1 acc 53.906 (51.186)	Top-5 acc 74.609 (74.361)	lr 0.02065
Train [33][2810/3239]	Time 0.316 (0.457)	Data Time 0.001 (0.010)	Loss 3.3640 (3.0344)	Entropy 0.72995 (0.73603)	Top-1 acc 40.234 (51.188)	Top-5 acc 69.141 (74.363)	lr 0.02065
Train [33][2820/3239]	Time 0.230 (0.457)	Data Time 0.001 (0.010)	Loss 3.3035 (3.0343)	Entropy 0.73020 (0.73601)	Top-1 acc 46.484 (51.191)	Top-5 acc 71.875 (74.362)	lr 0.02065
Train [33][2830/3239]	Time 0.234 (0.456)	Data Time 0.001 (0.010)	Loss 3.0342 (3.0345)	Entropy 0.72984 (0.73599)	Top-1 acc 53.516 (51.187)	Top-5 acc 72.656 (74.357)	lr 0.02065
Train [33][2840/3239]	Time 0.229 (0.456)	Data Time 0.001 (0.010)	Loss 3.0385 (3.0344)	Entropy 0.73015 (0.73597)	Top-1 acc 53.516 (51.190)	Top-5 acc 73.438 (74.359)	lr 0.02065
Train [33][2850/3239]	Time 0.280 (0.456)	Data Time 0.003 (0.010)	Loss 2.9013 (3.0343)	Entropy 0.72998 (0.73595)	Top-1 acc 55.078 (51.192)	Top-5 acc 77.734 (74.362)	lr 0.02065
Train [33][2860/3239]	Time 0.225 (0.456)	Data Time 0.001 (0.010)	Loss 3.1413 (3.0343)	Entropy 0.73001 (0.73593)	Top-1 acc 46.484 (51.190)	Top-5 acc 71.875 (74.363)	lr 0.02065
Train [33][2870/3239]	Time 0.215 (0.456)	Data Time 0.001 (0.010)	Loss 3.3430 (3.0346)	Entropy 0.73061 (0.73591)	Top-1 acc 41.016 (51.180)	Top-5 acc 70.312 (74.357)	lr 0.02065
Train [33][2880/3239]	Time 0.239 (0.456)	Data Time 0.001 (0.010)	Loss 3.2013 (3.0345)	Entropy 0.73064 (0.73589)	Top-1 acc 48.828 (51.184)	Top-5 acc 72.656 (74.360)	lr 0.02065
Train [33][2890/3239]	Time 0.223 (0.455)	Data Time 0.001 (0.010)	Loss 3.1804 (3.0345)	Entropy 0.73043 (0.73587)	Top-1 acc 49.609 (51.183)	Top-5 acc 71.484 (74.360)	lr 0.02064
Train [33][2900/3239]	Time 0.242 (0.455)	Data Time 0.001 (0.010)	Loss 3.0445 (3.0346)	Entropy 0.73023 (0.73585)	Top-1 acc 50.000 (51.183)	Top-5 acc 76.172 (74.360)	lr 0.02064
Train [33][2910/3239]	Time 0.236 (0.455)	Data Time 0.001 (0.010)	Loss 2.9081 (3.0347)	Entropy 0.73008 (0.73583)	Top-1 acc 52.734 (51.179)	Top-5 acc 74.609 (74.357)	lr 0.02064
Train [33][2920/3239]	Time 0.232 (0.455)	Data Time 0.001 (0.010)	Loss 3.0508 (3.0348)	Entropy 0.73010 (0.73581)	Top-1 acc 53.125 (51.177)	Top-5 acc 73.828 (74.353)	lr 0.02064
Train [33][2930/3239]	Time 0.229 (0.455)	Data Time 0.001 (0.010)	Loss 3.0645 (3.0346)	Entropy 0.72987 (0.73579)	Top-1 acc 49.219 (51.184)	Top-5 acc 75.391 (74.355)	lr 0.02064
Train [33][2940/3239]	Time 0.248 (0.454)	Data Time 0.002 (0.010)	Loss 2.9887 (3.0344)	Entropy 0.72981 (0.73577)	Top-1 acc 53.516 (51.188)	Top-5 acc 73.438 (74.359)	lr 0.02064
Train [33][2950/3239]	Time 0.262 (0.454)	Data Time 0.001 (0.010)	Loss 2.9201 (3.0344)	Entropy 0.72997 (0.73575)	Top-1 acc 49.219 (51.189)	Top-5 acc 78.516 (74.358)	lr 0.02064
Train [33][2960/3239]	Time 0.222 (0.454)	Data Time 0.001 (0.010)	Loss 2.8543 (3.0344)	Entropy 0.72963 (0.73573)	Top-1 acc 57.422 (51.192)	Top-5 acc 78.125 (74.360)	lr 0.02064
Train [33][2970/3239]	Time 0.324 (0.454)	Data Time 0.001 (0.010)	Loss 2.9888 (3.0342)	Entropy 0.72956 (0.73571)	Top-1 acc 53.516 (51.194)	Top-5 acc 74.219 (74.364)	lr 0.02064
Train [33][2980/3239]	Time 0.233 (0.454)	Data Time 0.001 (0.010)	Loss 3.1755 (3.0344)	Entropy 0.72958 (0.73569)	Top-1 acc 49.219 (51.194)	Top-5 acc 73.047 (74.360)	lr 0.02064
Train [33][2990/3239]	Time 0.225 (0.454)	Data Time 0.001 (0.010)	Loss 2.9782 (3.0346)	Entropy 0.72973 (0.73567)	Top-1 acc 53.516 (51.192)	Top-5 acc 75.000 (74.357)	lr 0.02064
Train [33][3000/3239]	Time 0.235 (0.454)	Data Time 0.001 (0.010)	Loss 3.0881 (3.0346)	Entropy 0.72960 (0.73565)	Top-1 acc 46.094 (51.192)	Top-5 acc 74.219 (74.356)	lr 0.02064
Train [33][3010/3239]	Time 0.229 (0.453)	Data Time 0.001 (0.010)	Loss 2.9606 (3.0344)	Entropy 0.72928 (0.73563)	Top-1 acc 54.297 (51.198)	Top-5 acc 76.562 (74.359)	lr 0.02064
Train [33][3020/3239]	Time 0.252 (0.453)	Data Time 0.001 (0.010)	Loss 2.8421 (3.0343)	Entropy 0.72953 (0.73561)	Top-1 acc 55.859 (51.199)	Top-5 acc 77.734 (74.362)	lr 0.02063
Train [33][3030/3239]	Time 0.234 (0.453)	Data Time 0.001 (0.010)	Loss 2.9131 (3.0344)	Entropy 0.72974 (0.73559)	Top-1 acc 53.516 (51.197)	Top-5 acc 76.172 (74.358)	lr 0.02063
Train [33][3040/3239]	Time 0.332 (0.453)	Data Time 0.001 (0.010)	Loss 3.2357 (3.0346)	Entropy 0.72943 (0.73557)	Top-1 acc 50.391 (51.197)	Top-5 acc 67.578 (74.355)	lr 0.02063
Train [33][3050/3239]	Time 0.230 (0.453)	Data Time 0.001 (0.010)	Loss 3.0906 (3.0345)	Entropy 0.72974 (0.73555)	Top-1 acc 50.781 (51.198)	Top-5 acc 73.828 (74.357)	lr 0.02063
Train [33][3060/3239]	Time 0.427 (0.462)	Data Time 0.032 (0.010)	Loss 2.8771 (3.0343)	Entropy 0.72911 (0.73553)	Top-1 acc 56.641 (51.203)	Top-5 acc 75.000 (74.359)	lr 0.02063
Train [33][3070/3239]	Time 0.274 (0.462)	Data Time 0.002 (0.010)	Loss 3.1122 (3.0344)	Entropy 0.72903 (0.73551)	Top-1 acc 45.312 (51.198)	Top-5 acc 71.875 (74.360)	lr 0.02063
Train [33][3080/3239]	Time 0.241 (0.461)	Data Time 0.002 (0.009)	Loss 3.1998 (3.0344)	Entropy 0.72873 (0.73549)	Top-1 acc 45.703 (51.199)	Top-5 acc 68.750 (74.361)	lr 0.02063
Train [33][3090/3239]	Time 0.266 (0.461)	Data Time 0.001 (0.009)	Loss 2.7780 (3.0342)	Entropy 0.72862 (0.73547)	Top-1 acc 57.422 (51.199)	Top-5 acc 79.688 (74.364)	lr 0.02063
Train [33][3100/3239]	Time 0.239 (0.461)	Data Time 0.002 (0.009)	Loss 3.2539 (3.0342)	Entropy 0.72897 (0.73545)	Top-1 acc 44.922 (51.196)	Top-5 acc 68.750 (74.363)	lr 0.02063
Train [33][3110/3239]	Time 0.229 (0.461)	Data Time 0.001 (0.009)	Loss 2.6578 (3.0342)	Entropy 0.72870 (0.73543)	Top-1 acc 61.719 (51.204)	Top-5 acc 80.859 (74.366)	lr 0.02063
Train [33][3120/3239]	Time 0.233 (0.461)	Data Time 0.001 (0.009)	Loss 2.8906 (3.0340)	Entropy 0.72875 (0.73540)	Top-1 acc 53.516 (51.205)	Top-5 acc 77.734 (74.372)	lr 0.02063
Train [33][3130/3239]	Time 0.370 (0.461)	Data Time 0.001 (0.009)	Loss 3.2987 (3.0342)	Entropy 0.72862 (0.73538)	Top-1 acc 43.750 (51.197)	Top-5 acc 66.797 (74.367)	lr 0.02063
Train [33][3140/3239]	Time 0.235 (0.461)	Data Time 0.001 (0.009)	Loss 2.9879 (3.0341)	Entropy 0.72878 (0.73536)	Top-1 acc 52.344 (51.200)	Top-5 acc 75.391 (74.368)	lr 0.02063
Train [33][3150/3239]	Time 0.233 (0.461)	Data Time 0.001 (0.009)	Loss 3.0220 (3.0342)	Entropy 0.72901 (0.73534)	Top-1 acc 52.734 (51.198)	Top-5 acc 70.703 (74.362)	lr 0.02063
Train [33][3160/3239]	Time 0.228 (0.460)	Data Time 0.001 (0.009)	Loss 3.1592 (3.0344)	Entropy 0.72872 (0.73532)	Top-1 acc 47.656 (51.197)	Top-5 acc 71.875 (74.360)	lr 0.02062
Train [33][3170/3239]	Time 0.216 (0.460)	Data Time 0.001 (0.009)	Loss 3.2378 (3.0344)	Entropy 0.72881 (0.73530)	Top-1 acc 46.094 (51.194)	Top-5 acc 67.969 (74.359)	lr 0.02062
Train [33][3180/3239]	Time 0.230 (0.460)	Data Time 0.000 (0.009)	Loss 3.1043 (3.0344)	Entropy 0.72873 (0.73528)	Top-1 acc 53.906 (51.197)	Top-5 acc 70.703 (74.359)	lr 0.02062
Train [33][3190/3239]	Time 0.250 (0.460)	Data Time 0.000 (0.009)	Loss 3.0889 (3.0343)	Entropy 0.72861 (0.73526)	Top-1 acc 51.562 (51.200)	Top-5 acc 73.438 (74.361)	lr 0.02062
Train [33][3200/3239]	Time 0.231 (0.460)	Data Time 0.000 (0.009)	Loss 3.1616 (3.0343)	Entropy 0.72904 (0.73524)	Top-1 acc 49.609 (51.200)	Top-5 acc 71.484 (74.363)	lr 0.02062
Train [33][3210/3239]	Time 0.233 (0.460)	Data Time 0.000 (0.009)	Loss 3.2538 (3.0344)	Entropy 0.72901 (0.73522)	Top-1 acc 46.875 (51.199)	Top-5 acc 68.750 (74.361)	lr 0.02062
Train [33][3220/3239]	Time 0.228 (0.459)	Data Time 0.000 (0.009)	Loss 2.9554 (3.0344)	Entropy 0.72886 (0.73520)	Top-1 acc 53.516 (51.202)	Top-5 acc 75.000 (74.362)	lr 0.02062
Train [33][3230/3239]	Time 0.230 (0.459)	Data Time 0.000 (0.009)	Loss 2.8202 (3.0344)	Entropy 0.72888 (0.73518)	Top-1 acc 58.594 (51.201)	Top-5 acc 77.734 (74.361)	lr 0.02062
Train [33][3239/3239]	Time 0.859 (0.459)	Data Time 0.000 (0.009)	Loss 3.1382 (3.0346)	Entropy 0.72882 (0.73516)	Top-1 acc 46.914 (51.198)	Top-5 acc 72.840 (74.358)	lr 0.02062
==========Valid [33/120]	loss 1.744	top-1 acc 60.677 (60.677)	top-5 acc 82.374	Train top-1 51.198	top-5 74.358	Entropy 0.72882	Latency-None: 0.000ms	Flops: 539.76M
Train [34][0/3239]	Time 31.138 (31.138)	Data Time 30.382 (30.382)	Loss 2.9434 (2.9434)	Entropy 0.72908 (0.72908)	Top-1 acc 51.562 (51.562)	Top-5 acc 79.688 (79.688)	lr 0.02062
Train [34][10/3239]	Time 0.271 (3.328)	Data Time 0.003 (2.764)	Loss 2.7109 (2.9405)	Entropy 0.72960 (0.72919)	Top-1 acc 58.203 (52.912)	Top-5 acc 80.078 (76.882)	lr 0.02062
Train [34][20/3239]	Time 0.225 (1.938)	Data Time 0.001 (1.449)	Loss 2.8627 (2.9423)	Entropy 0.72945 (0.72930)	Top-1 acc 53.906 (52.604)	Top-5 acc 77.344 (76.618)	lr 0.02062
Train [34][30/3239]	Time 0.318 (1.446)	Data Time 0.001 (0.982)	Loss 2.9888 (2.9521)	Entropy 0.72947 (0.72936)	Top-1 acc 51.953 (52.722)	Top-5 acc 75.781 (76.323)	lr 0.02062
Train [34][40/3239]	Time 0.229 (1.193)	Data Time 0.001 (0.743)	Loss 2.8389 (2.9578)	Entropy 0.72943 (0.72937)	Top-1 acc 54.297 (52.506)	Top-5 acc 78.516 (76.372)	lr 0.02062
Train [34][50/3239]	Time 0.226 (1.036)	Data Time 0.001 (0.597)	Loss 2.9513 (2.9713)	Entropy 0.72953 (0.72939)	Top-1 acc 53.125 (52.298)	Top-5 acc 75.781 (76.026)	lr 0.02061
Train [34][60/3239]	Time 0.224 (0.934)	Data Time 0.001 (0.500)	Loss 3.0570 (2.9787)	Entropy 0.72888 (0.72939)	Top-1 acc 48.438 (51.960)	Top-5 acc 73.047 (75.800)	lr 0.02061
Train [34][70/3239]	Time 0.227 (0.860)	Data Time 0.001 (0.430)	Loss 3.0398 (2.9796)	Entropy 0.72898 (0.72931)	Top-1 acc 46.875 (52.019)	Top-5 acc 73.828 (75.759)	lr 0.02061
Train [34][80/3239]	Time 0.248 (0.805)	Data Time 0.001 (0.377)	Loss 2.9748 (2.9780)	Entropy 0.72912 (0.72929)	Top-1 acc 50.000 (51.977)	Top-5 acc 77.344 (75.887)	lr 0.02061
Train [34][90/3239]	Time 0.222 (0.760)	Data Time 0.001 (0.335)	Loss 2.9413 (2.9789)	Entropy 0.72935 (0.72927)	Top-1 acc 52.344 (51.992)	Top-5 acc 77.344 (75.846)	lr 0.02061
Train [34][100/3239]	Time 0.227 (0.725)	Data Time 0.001 (0.302)	Loss 2.9879 (2.9804)	Entropy 0.72969 (0.72930)	Top-1 acc 50.000 (52.015)	Top-5 acc 74.609 (75.715)	lr 0.02061
Train [34][110/3239]	Time 0.282 (0.702)	Data Time 0.001 (0.275)	Loss 3.0317 (2.9838)	Entropy 0.72949 (0.72934)	Top-1 acc 51.562 (51.978)	Top-5 acc 76.953 (75.637)	lr 0.02061
Train [34][120/3239]	Time 0.311 (0.677)	Data Time 0.001 (0.253)	Loss 3.2425 (2.9904)	Entropy 0.73002 (0.72937)	Top-1 acc 42.969 (51.905)	Top-5 acc 71.094 (75.497)	lr 0.02061
Train [34][130/3239]	Time 0.232 (0.657)	Data Time 0.001 (0.233)	Loss 3.0107 (2.9852)	Entropy 0.72990 (0.72941)	Top-1 acc 53.516 (51.998)	Top-5 acc 71.484 (75.555)	lr 0.02061
Train [34][140/3239]	Time 0.246 (0.642)	Data Time 0.001 (0.217)	Loss 2.9628 (2.9902)	Entropy 0.72982 (0.72945)	Top-1 acc 54.688 (51.961)	Top-5 acc 74.609 (75.463)	lr 0.02061
Train [34][150/3239]	Time 0.219 (0.626)	Data Time 0.001 (0.203)	Loss 2.8546 (2.9927)	Entropy 0.73011 (0.72948)	Top-1 acc 55.469 (51.932)	Top-5 acc 76.562 (75.378)	lr 0.02061
Train [34][160/3239]	Time 0.224 (0.610)	Data Time 0.001 (0.190)	Loss 2.6288 (2.9916)	Entropy 0.72984 (0.72951)	Top-1 acc 57.422 (51.980)	Top-5 acc 85.156 (75.425)	lr 0.02061
Train [34][170/3239]	Time 0.216 (0.598)	Data Time 0.001 (0.179)	Loss 2.9739 (2.9902)	Entropy 0.72973 (0.72952)	Top-1 acc 53.125 (52.060)	Top-5 acc 75.000 (75.434)	lr 0.02061
Train [34][180/3239]	Time 0.228 (0.586)	Data Time 0.001 (0.170)	Loss 2.9341 (2.9918)	Entropy 0.72908 (0.72951)	Top-1 acc 55.469 (51.983)	Top-5 acc 74.609 (75.358)	lr 0.02060
Train [34][190/3239]	Time 0.306 (0.576)	Data Time 0.001 (0.161)	Loss 2.9968 (2.9906)	Entropy 0.72894 (0.72948)	Top-1 acc 49.219 (52.002)	Top-5 acc 73.828 (75.384)	lr 0.02060
Train [34][200/3239]	Time 0.221 (0.567)	Data Time 0.001 (0.153)	Loss 2.9279 (2.9878)	Entropy 0.72880 (0.72945)	Top-1 acc 49.219 (52.068)	Top-5 acc 75.391 (75.396)	lr 0.02060
Train [34][210/3239]	Time 0.226 (0.558)	Data Time 0.001 (0.146)	Loss 3.0515 (2.9862)	Entropy 0.72876 (0.72941)	Top-1 acc 51.562 (52.101)	Top-5 acc 76.172 (75.442)	lr 0.02060
Train [34][220/3239]	Time 0.222 (0.551)	Data Time 0.001 (0.139)	Loss 3.0134 (2.9842)	Entropy 0.72874 (0.72939)	Top-1 acc 50.781 (52.135)	Top-5 acc 74.609 (75.438)	lr 0.02060
Train [34][230/3239]	Time 0.222 (0.545)	Data Time 0.001 (0.133)	Loss 3.0666 (2.9834)	Entropy 0.72901 (0.72936)	Top-1 acc 50.781 (52.185)	Top-5 acc 74.219 (75.441)	lr 0.02060
Train [34][240/3239]	Time 0.226 (0.539)	Data Time 0.001 (0.128)	Loss 2.9339 (2.9849)	Entropy 0.72891 (0.72935)	Top-1 acc 51.172 (52.164)	Top-5 acc 78.125 (75.426)	lr 0.02060
Train [34][250/3239]	Time 0.225 (0.533)	Data Time 0.001 (0.123)	Loss 2.9641 (2.9836)	Entropy 0.72870 (0.72933)	Top-1 acc 53.906 (52.168)	Top-5 acc 73.438 (75.478)	lr 0.02060
Train [34][260/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.118)	Loss 3.0020 (2.9834)	Entropy 0.72853 (0.72930)	Top-1 acc 51.562 (52.200)	Top-5 acc 75.781 (75.483)	lr 0.02060
Train [34][270/3239]	Time 0.225 (0.523)	Data Time 0.001 (0.114)	Loss 3.1835 (2.9846)	Entropy 0.72813 (0.72926)	Top-1 acc 47.656 (52.155)	Top-5 acc 68.359 (75.461)	lr 0.02060
Train [34][280/3239]	Time 0.229 (0.518)	Data Time 0.001 (0.110)	Loss 2.9525 (2.9864)	Entropy 0.72778 (0.72922)	Top-1 acc 52.344 (52.085)	Top-5 acc 76.562 (75.456)	lr 0.02060
Train [34][290/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.106)	Loss 2.9068 (2.9868)	Entropy 0.72724 (0.72916)	Top-1 acc 53.516 (52.098)	Top-5 acc 77.734 (75.450)	lr 0.02060
Train [34][300/3239]	Time 0.219 (0.509)	Data Time 0.001 (0.103)	Loss 3.0392 (2.9881)	Entropy 0.72747 (0.72910)	Top-1 acc 50.781 (52.061)	Top-5 acc 72.656 (75.407)	lr 0.02060
Train [34][310/3239]	Time 0.225 (0.506)	Data Time 0.001 (0.099)	Loss 3.1344 (2.9893)	Entropy 0.72748 (0.72905)	Top-1 acc 45.703 (52.044)	Top-5 acc 72.656 (75.362)	lr 0.02059
Train [34][320/3239]	Time 0.227 (0.502)	Data Time 0.001 (0.096)	Loss 3.2444 (2.9894)	Entropy 0.72761 (0.72900)	Top-1 acc 43.750 (52.046)	Top-5 acc 71.484 (75.350)	lr 0.02059
Train [34][330/3239]	Time 0.255 (0.499)	Data Time 0.002 (0.093)	Loss 3.1389 (2.9904)	Entropy 0.72776 (0.72896)	Top-1 acc 50.391 (51.998)	Top-5 acc 74.219 (75.330)	lr 0.02059
Train [34][340/3239]	Time 0.229 (0.496)	Data Time 0.001 (0.091)	Loss 2.9131 (2.9923)	Entropy 0.72817 (0.72893)	Top-1 acc 53.125 (51.991)	Top-5 acc 75.391 (75.284)	lr 0.02059
Train [34][350/3239]	Time 0.317 (0.493)	Data Time 0.001 (0.088)	Loss 2.9461 (2.9944)	Entropy 0.72799 (0.72890)	Top-1 acc 55.469 (51.941)	Top-5 acc 76.172 (75.267)	lr 0.02059
Train [34][360/3239]	Time 0.232 (0.491)	Data Time 0.001 (0.086)	Loss 3.2360 (2.9951)	Entropy 0.72820 (0.72888)	Top-1 acc 49.219 (51.923)	Top-5 acc 72.656 (75.263)	lr 0.02059
Train [34][370/3239]	Time 0.225 (0.488)	Data Time 0.001 (0.083)	Loss 3.0423 (2.9952)	Entropy 0.72829 (0.72886)	Top-1 acc 48.438 (51.919)	Top-5 acc 73.047 (75.246)	lr 0.02059
Train [34][380/3239]	Time 0.224 (0.485)	Data Time 0.001 (0.081)	Loss 3.0325 (2.9945)	Entropy 0.72794 (0.72884)	Top-1 acc 52.734 (51.933)	Top-5 acc 72.266 (75.243)	lr 0.02059
Train [34][390/3239]	Time 0.223 (0.483)	Data Time 0.001 (0.079)	Loss 2.9987 (2.9954)	Entropy 0.72816 (0.72882)	Top-1 acc 50.000 (51.925)	Top-5 acc 75.781 (75.213)	lr 0.02059
Train [34][400/3239]	Time 0.213 (0.480)	Data Time 0.001 (0.077)	Loss 2.7593 (2.9951)	Entropy 0.72832 (0.72880)	Top-1 acc 57.031 (51.920)	Top-5 acc 79.688 (75.205)	lr 0.02059
Train [34][410/3239]	Time 0.229 (0.478)	Data Time 0.001 (0.076)	Loss 2.9766 (2.9932)	Entropy 0.72831 (0.72878)	Top-1 acc 54.297 (51.985)	Top-5 acc 77.344 (75.239)	lr 0.02059
Train [34][420/3239]	Time 0.306 (0.476)	Data Time 0.001 (0.074)	Loss 2.9027 (2.9933)	Entropy 0.72818 (0.72877)	Top-1 acc 54.688 (51.996)	Top-5 acc 76.562 (75.221)	lr 0.02059
Train [34][430/3239]	Time 0.220 (0.474)	Data Time 0.001 (0.072)	Loss 3.0839 (2.9941)	Entropy 0.72845 (0.72876)	Top-1 acc 49.219 (51.981)	Top-5 acc 75.000 (75.210)	lr 0.02059
Train [34][440/3239]	Time 0.223 (0.472)	Data Time 0.001 (0.070)	Loss 2.9840 (2.9953)	Entropy 0.72880 (0.72876)	Top-1 acc 48.828 (51.939)	Top-5 acc 76.172 (75.198)	lr 0.02058
Train [34][450/3239]	Time 0.227 (0.471)	Data Time 0.001 (0.069)	Loss 2.8725 (2.9954)	Entropy 0.72895 (0.72876)	Top-1 acc 55.078 (51.946)	Top-5 acc 78.516 (75.193)	lr 0.02058
Train [34][460/3239]	Time 0.210 (0.469)	Data Time 0.001 (0.068)	Loss 3.1102 (2.9975)	Entropy 0.72889 (0.72876)	Top-1 acc 50.000 (51.921)	Top-5 acc 71.875 (75.134)	lr 0.02058
Train [34][470/3239]	Time 0.319 (0.522)	Data Time 0.007 (0.066)	Loss 3.4046 (2.9989)	Entropy 0.72853 (0.72876)	Top-1 acc 45.703 (51.898)	Top-5 acc 67.188 (75.115)	lr 0.02058
Train [34][480/3239]	Time 0.253 (0.522)	Data Time 0.002 (0.065)	Loss 3.0234 (2.9990)	Entropy 0.72857 (0.72876)	Top-1 acc 53.125 (51.907)	Top-5 acc 72.266 (75.118)	lr 0.02058
Train [34][490/3239]	Time 0.237 (0.520)	Data Time 0.001 (0.064)	Loss 2.8496 (2.9980)	Entropy 0.72842 (0.72875)	Top-1 acc 51.172 (51.917)	Top-5 acc 79.688 (75.146)	lr 0.02058
Train [34][500/3239]	Time 0.219 (0.517)	Data Time 0.001 (0.062)	Loss 2.7516 (2.9981)	Entropy 0.72872 (0.72875)	Top-1 acc 58.594 (51.933)	Top-5 acc 82.812 (75.140)	lr 0.02058
Train [34][510/3239]	Time 0.315 (0.515)	Data Time 0.001 (0.061)	Loss 3.0918 (2.9993)	Entropy 0.72848 (0.72875)	Top-1 acc 51.172 (51.926)	Top-5 acc 73.047 (75.111)	lr 0.02058
Train [34][520/3239]	Time 0.233 (0.513)	Data Time 0.001 (0.060)	Loss 2.9964 (3.0002)	Entropy 0.72831 (0.72874)	Top-1 acc 53.516 (51.922)	Top-5 acc 77.344 (75.085)	lr 0.02058
Train [34][530/3239]	Time 0.226 (0.511)	Data Time 0.001 (0.059)	Loss 2.8848 (2.9994)	Entropy 0.72781 (0.72873)	Top-1 acc 55.078 (51.930)	Top-5 acc 76.172 (75.089)	lr 0.02058
Train [34][540/3239]	Time 0.249 (0.509)	Data Time 0.001 (0.058)	Loss 3.1315 (2.9992)	Entropy 0.72768 (0.72871)	Top-1 acc 48.047 (51.954)	Top-5 acc 74.219 (75.109)	lr 0.02058
Train [34][550/3239]	Time 0.224 (0.507)	Data Time 0.001 (0.057)	Loss 3.1634 (2.9999)	Entropy 0.72826 (0.72870)	Top-1 acc 49.219 (51.929)	Top-5 acc 71.094 (75.081)	lr 0.02058
Train [34][560/3239]	Time 0.233 (0.505)	Data Time 0.001 (0.056)	Loss 3.0153 (2.9999)	Entropy 0.72815 (0.72869)	Top-1 acc 51.562 (51.925)	Top-5 acc 74.609 (75.075)	lr 0.02058
Train [34][570/3239]	Time 0.228 (0.503)	Data Time 0.001 (0.055)	Loss 3.0514 (3.0002)	Entropy 0.72823 (0.72868)	Top-1 acc 50.000 (51.931)	Top-5 acc 73.047 (75.052)	lr 0.02057
Train [34][580/3239]	Time 0.318 (0.501)	Data Time 0.001 (0.054)	Loss 3.0815 (3.0019)	Entropy 0.72820 (0.72867)	Top-1 acc 51.172 (51.891)	Top-5 acc 70.312 (75.015)	lr 0.02057
Train [34][590/3239]	Time 0.226 (0.500)	Data Time 0.001 (0.053)	Loss 2.9542 (3.0026)	Entropy 0.72825 (0.72867)	Top-1 acc 53.906 (51.868)	Top-5 acc 72.656 (74.991)	lr 0.02057
Train [34][600/3239]	Time 0.241 (0.498)	Data Time 0.002 (0.052)	Loss 3.1830 (3.0034)	Entropy 0.72847 (0.72866)	Top-1 acc 45.312 (51.852)	Top-5 acc 72.266 (74.976)	lr 0.02057
Train [34][610/3239]	Time 0.215 (0.496)	Data Time 0.001 (0.051)	Loss 3.1779 (3.0036)	Entropy 0.72844 (0.72866)	Top-1 acc 44.141 (51.836)	Top-5 acc 72.266 (74.987)	lr 0.02057
Train [34][620/3239]	Time 0.221 (0.495)	Data Time 0.001 (0.051)	Loss 2.8514 (3.0041)	Entropy 0.72860 (0.72865)	Top-1 acc 56.250 (51.819)	Top-5 acc 77.734 (74.967)	lr 0.02057
Train [34][630/3239]	Time 0.223 (0.493)	Data Time 0.001 (0.050)	Loss 2.9409 (3.0046)	Entropy 0.72897 (0.72865)	Top-1 acc 55.469 (51.831)	Top-5 acc 77.734 (74.955)	lr 0.02057
Train [34][640/3239]	Time 0.231 (0.492)	Data Time 0.001 (0.049)	Loss 3.3138 (3.0049)	Entropy 0.72890 (0.72866)	Top-1 acc 45.312 (51.826)	Top-5 acc 70.703 (74.952)	lr 0.02057
Train [34][650/3239]	Time 0.251 (0.490)	Data Time 0.001 (0.048)	Loss 3.0192 (3.0052)	Entropy 0.72941 (0.72866)	Top-1 acc 53.906 (51.816)	Top-5 acc 72.266 (74.939)	lr 0.02057
Train [34][660/3239]	Time 0.214 (0.489)	Data Time 0.001 (0.048)	Loss 2.8969 (3.0056)	Entropy 0.72921 (0.72868)	Top-1 acc 56.250 (51.802)	Top-5 acc 75.781 (74.918)	lr 0.02057
Train [34][670/3239]	Time 0.306 (0.488)	Data Time 0.001 (0.047)	Loss 3.1562 (3.0052)	Entropy 0.72900 (0.72868)	Top-1 acc 46.875 (51.792)	Top-5 acc 73.828 (74.936)	lr 0.02057
Train [34][680/3239]	Time 0.221 (0.487)	Data Time 0.001 (0.046)	Loss 3.0758 (3.0055)	Entropy 0.72883 (0.72868)	Top-1 acc 52.344 (51.778)	Top-5 acc 72.656 (74.921)	lr 0.02057
Train [34][690/3239]	Time 0.233 (0.485)	Data Time 0.001 (0.046)	Loss 3.0155 (3.0055)	Entropy 0.72897 (0.72869)	Top-1 acc 47.656 (51.765)	Top-5 acc 76.953 (74.929)	lr 0.02056
Train [34][700/3239]	Time 0.223 (0.484)	Data Time 0.001 (0.045)	Loss 2.9947 (3.0051)	Entropy 0.72896 (0.72869)	Top-1 acc 48.828 (51.770)	Top-5 acc 74.219 (74.928)	lr 0.02056
Train [34][710/3239]	Time 0.229 (0.483)	Data Time 0.001 (0.044)	Loss 2.9006 (3.0054)	Entropy 0.72908 (0.72870)	Top-1 acc 55.859 (51.752)	Top-5 acc 76.562 (74.927)	lr 0.02056
Train [34][720/3239]	Time 0.229 (0.482)	Data Time 0.001 (0.044)	Loss 3.0150 (3.0061)	Entropy 0.72943 (0.72870)	Top-1 acc 50.391 (51.735)	Top-5 acc 73.828 (74.908)	lr 0.02056
Train [34][730/3239]	Time 0.218 (0.481)	Data Time 0.001 (0.043)	Loss 2.9403 (3.0065)	Entropy 0.72989 (0.72872)	Top-1 acc 55.078 (51.735)	Top-5 acc 75.391 (74.888)	lr 0.02056
Train [34][740/3239]	Time 0.323 (0.479)	Data Time 0.001 (0.043)	Loss 3.0626 (3.0070)	Entropy 0.73007 (0.72873)	Top-1 acc 53.906 (51.732)	Top-5 acc 76.172 (74.871)	lr 0.02056
Train [34][750/3239]	Time 0.232 (0.478)	Data Time 0.002 (0.042)	Loss 3.0325 (3.0073)	Entropy 0.72991 (0.72875)	Top-1 acc 51.562 (51.723)	Top-5 acc 75.391 (74.864)	lr 0.02056
Train [34][760/3239]	Time 0.226 (0.477)	Data Time 0.001 (0.042)	Loss 2.9253 (3.0085)	Entropy 0.73012 (0.72876)	Top-1 acc 56.250 (51.706)	Top-5 acc 75.781 (74.823)	lr 0.02056
Train [34][770/3239]	Time 0.224 (0.476)	Data Time 0.001 (0.041)	Loss 2.9983 (3.0089)	Entropy 0.73046 (0.72878)	Top-1 acc 52.344 (51.695)	Top-5 acc 74.609 (74.806)	lr 0.02056
Train [34][780/3239]	Time 0.230 (0.475)	Data Time 0.001 (0.041)	Loss 2.7586 (3.0088)	Entropy 0.73053 (0.72881)	Top-1 acc 58.984 (51.709)	Top-5 acc 77.344 (74.809)	lr 0.02056
Train [34][790/3239]	Time 0.255 (0.475)	Data Time 0.001 (0.040)	Loss 3.2263 (3.0091)	Entropy 0.73068 (0.72883)	Top-1 acc 52.344 (51.704)	Top-5 acc 70.312 (74.813)	lr 0.02056
Train [34][800/3239]	Time 0.230 (0.474)	Data Time 0.001 (0.040)	Loss 3.0848 (3.0093)	Entropy 0.73029 (0.72885)	Top-1 acc 48.828 (51.711)	Top-5 acc 75.000 (74.810)	lr 0.02056
Train [34][810/3239]	Time 0.218 (0.473)	Data Time 0.001 (0.039)	Loss 3.0738 (3.0098)	Entropy 0.73045 (0.72887)	Top-1 acc 51.562 (51.705)	Top-5 acc 73.828 (74.798)	lr 0.02056
Train [34][820/3239]	Time 0.218 (0.472)	Data Time 0.001 (0.039)	Loss 3.1132 (3.0092)	Entropy 0.73041 (0.72889)	Top-1 acc 48.047 (51.719)	Top-5 acc 72.656 (74.812)	lr 0.02055
Train [34][830/3239]	Time 0.232 (0.471)	Data Time 0.001 (0.038)	Loss 2.9416 (3.0094)	Entropy 0.73041 (0.72890)	Top-1 acc 50.391 (51.711)	Top-5 acc 74.609 (74.803)	lr 0.02055
Train [34][840/3239]	Time 0.234 (0.470)	Data Time 0.001 (0.038)	Loss 3.0519 (3.0089)	Entropy 0.73041 (0.72892)	Top-1 acc 50.391 (51.718)	Top-5 acc 74.219 (74.816)	lr 0.02055
Train [34][850/3239]	Time 0.220 (0.469)	Data Time 0.001 (0.037)	Loss 3.0739 (3.0094)	Entropy 0.73030 (0.72894)	Top-1 acc 48.828 (51.705)	Top-5 acc 75.391 (74.808)	lr 0.02055
Train [34][860/3239]	Time 0.226 (0.468)	Data Time 0.001 (0.037)	Loss 2.8854 (3.0094)	Entropy 0.73025 (0.72896)	Top-1 acc 55.469 (51.709)	Top-5 acc 77.734 (74.807)	lr 0.02055
Train [34][870/3239]	Time 0.230 (0.467)	Data Time 0.001 (0.037)	Loss 3.0420 (3.0091)	Entropy 0.73047 (0.72897)	Top-1 acc 54.297 (51.712)	Top-5 acc 75.781 (74.817)	lr 0.02055
Train [34][880/3239]	Time 0.228 (0.466)	Data Time 0.001 (0.036)	Loss 3.1563 (3.0091)	Entropy 0.73057 (0.72899)	Top-1 acc 50.000 (51.720)	Top-5 acc 69.531 (74.821)	lr 0.02055
Train [34][890/3239]	Time 0.227 (0.466)	Data Time 0.001 (0.036)	Loss 2.9400 (3.0090)	Entropy 0.73079 (0.72901)	Top-1 acc 57.422 (51.714)	Top-5 acc 77.344 (74.829)	lr 0.02055
Train [34][900/3239]	Time 0.325 (0.465)	Data Time 0.001 (0.035)	Loss 3.0503 (3.0089)	Entropy 0.73060 (0.72903)	Top-1 acc 50.781 (51.728)	Top-5 acc 73.047 (74.821)	lr 0.02055
Train [34][910/3239]	Time 0.231 (0.464)	Data Time 0.001 (0.035)	Loss 2.9412 (3.0084)	Entropy 0.73064 (0.72904)	Top-1 acc 55.859 (51.743)	Top-5 acc 74.609 (74.830)	lr 0.02055
Train [34][920/3239]	Time 0.228 (0.463)	Data Time 0.001 (0.035)	Loss 2.8846 (3.0089)	Entropy 0.73076 (0.72906)	Top-1 acc 51.562 (51.743)	Top-5 acc 75.391 (74.813)	lr 0.02055
Train [34][930/3239]	Time 0.231 (0.462)	Data Time 0.001 (0.034)	Loss 2.9054 (3.0096)	Entropy 0.73089 (0.72908)	Top-1 acc 55.078 (51.729)	Top-5 acc 77.344 (74.796)	lr 0.02055
Train [34][940/3239]	Time 0.230 (0.462)	Data Time 0.001 (0.034)	Loss 2.9227 (3.0095)	Entropy 0.73113 (0.72910)	Top-1 acc 49.609 (51.743)	Top-5 acc 76.953 (74.795)	lr 0.02055
Train [34][950/3239]	Time 0.234 (0.461)	Data Time 0.001 (0.034)	Loss 2.9521 (3.0094)	Entropy 0.73077 (0.72912)	Top-1 acc 54.688 (51.737)	Top-5 acc 78.906 (74.804)	lr 0.02054
Train [34][960/3239]	Time 0.245 (0.461)	Data Time 0.001 (0.033)	Loss 2.8783 (3.0092)	Entropy 0.73028 (0.72914)	Top-1 acc 56.250 (51.744)	Top-5 acc 78.516 (74.808)	lr 0.02054
Train [34][970/3239]	Time 0.320 (0.460)	Data Time 0.001 (0.033)	Loss 3.0087 (3.0092)	Entropy 0.73039 (0.72915)	Top-1 acc 48.828 (51.744)	Top-5 acc 73.828 (74.815)	lr 0.02054
Train [34][980/3239]	Time 0.231 (0.459)	Data Time 0.001 (0.033)	Loss 2.9609 (3.0094)	Entropy 0.73063 (0.72916)	Top-1 acc 52.734 (51.735)	Top-5 acc 74.609 (74.813)	lr 0.02054
Train [34][990/3239]	Time 0.229 (0.459)	Data Time 0.001 (0.032)	Loss 2.9106 (3.0095)	Entropy 0.73105 (0.72918)	Top-1 acc 53.516 (51.736)	Top-5 acc 77.344 (74.814)	lr 0.02054
Train [34][1000/3239]	Time 0.228 (0.458)	Data Time 0.001 (0.032)	Loss 3.1069 (3.0090)	Entropy 0.73120 (0.72920)	Top-1 acc 44.922 (51.744)	Top-5 acc 71.484 (74.820)	lr 0.02054
Train [34][1010/3239]	Time 0.236 (0.457)	Data Time 0.001 (0.032)	Loss 2.9898 (3.0097)	Entropy 0.73110 (0.72922)	Top-1 acc 51.953 (51.728)	Top-5 acc 75.781 (74.805)	lr 0.02054
Train [34][1020/3239]	Time 0.227 (0.457)	Data Time 0.001 (0.031)	Loss 2.9762 (3.0098)	Entropy 0.73134 (0.72924)	Top-1 acc 51.953 (51.724)	Top-5 acc 73.438 (74.801)	lr 0.02054
Train [34][1030/3239]	Time 0.211 (0.456)	Data Time 0.001 (0.031)	Loss 3.1445 (3.0098)	Entropy 0.73167 (0.72926)	Top-1 acc 46.875 (51.719)	Top-5 acc 72.266 (74.803)	lr 0.02054
Train [34][1040/3239]	Time 0.225 (0.456)	Data Time 0.001 (0.031)	Loss 3.0223 (3.0104)	Entropy 0.73182 (0.72928)	Top-1 acc 49.609 (51.708)	Top-5 acc 75.781 (74.797)	lr 0.02054
Train [34][1050/3239]	Time 0.231 (0.455)	Data Time 0.001 (0.031)	Loss 3.1120 (3.0107)	Entropy 0.73232 (0.72931)	Top-1 acc 44.922 (51.694)	Top-5 acc 75.391 (74.803)	lr 0.02054
Train [34][1060/3239]	Time 0.306 (0.455)	Data Time 0.001 (0.030)	Loss 2.8873 (3.0098)	Entropy 0.73230 (0.72933)	Top-1 acc 55.859 (51.719)	Top-5 acc 74.219 (74.810)	lr 0.02054
Train [34][1070/3239]	Time 0.229 (0.454)	Data Time 0.001 (0.030)	Loss 2.9120 (3.0096)	Entropy 0.73203 (0.72936)	Top-1 acc 53.516 (51.725)	Top-5 acc 76.562 (74.820)	lr 0.02054
Train [34][1080/3239]	Time 0.219 (0.453)	Data Time 0.001 (0.030)	Loss 3.1173 (3.0098)	Entropy 0.73221 (0.72938)	Top-1 acc 49.219 (51.727)	Top-5 acc 73.438 (74.817)	lr 0.02053
Train [34][1090/3239]	Time 0.226 (0.453)	Data Time 0.001 (0.029)	Loss 3.2807 (3.0107)	Entropy 0.73221 (0.72941)	Top-1 acc 47.656 (51.716)	Top-5 acc 67.578 (74.794)	lr 0.02053
Train [34][1100/3239]	Time 0.219 (0.452)	Data Time 0.001 (0.029)	Loss 3.0813 (3.0105)	Entropy 0.73267 (0.72944)	Top-1 acc 52.344 (51.721)	Top-5 acc 73.438 (74.797)	lr 0.02053
Train [34][1110/3239]	Time 0.226 (0.452)	Data Time 0.001 (0.029)	Loss 2.9649 (3.0105)	Entropy 0.73268 (0.72947)	Top-1 acc 56.641 (51.729)	Top-5 acc 74.219 (74.793)	lr 0.02053
Train [34][1120/3239]	Time 0.232 (0.451)	Data Time 0.001 (0.029)	Loss 2.9608 (3.0107)	Entropy 0.73278 (0.72950)	Top-1 acc 51.562 (51.724)	Top-5 acc 76.953 (74.790)	lr 0.02053
Train [34][1130/3239]	Time 0.385 (0.475)	Data Time 0.002 (0.029)	Loss 2.9104 (3.0112)	Entropy 0.73248 (0.72953)	Top-1 acc 55.859 (51.717)	Top-5 acc 76.953 (74.782)	lr 0.02053
Train [34][1140/3239]	Time 0.242 (0.475)	Data Time 0.002 (0.028)	Loss 2.9271 (3.0113)	Entropy 0.73245 (0.72955)	Top-1 acc 53.906 (51.712)	Top-5 acc 73.828 (74.780)	lr 0.02053
Train [34][1150/3239]	Time 0.237 (0.474)	Data Time 0.002 (0.028)	Loss 2.7570 (3.0111)	Entropy 0.73198 (0.72958)	Top-1 acc 53.516 (51.719)	Top-5 acc 80.469 (74.781)	lr 0.02053
Train [34][1160/3239]	Time 0.241 (0.474)	Data Time 0.001 (0.028)	Loss 3.0828 (3.0113)	Entropy 0.73218 (0.72960)	Top-1 acc 50.391 (51.717)	Top-5 acc 75.391 (74.780)	lr 0.02053
Train [34][1170/3239]	Time 0.238 (0.473)	Data Time 0.001 (0.028)	Loss 3.1563 (3.0117)	Entropy 0.73188 (0.72962)	Top-1 acc 51.562 (51.723)	Top-5 acc 69.531 (74.764)	lr 0.02053
Train [34][1180/3239]	Time 0.241 (0.473)	Data Time 0.001 (0.027)	Loss 3.0390 (3.0110)	Entropy 0.73187 (0.72964)	Top-1 acc 51.562 (51.740)	Top-5 acc 75.391 (74.788)	lr 0.02053
Train [34][1190/3239]	Time 0.234 (0.472)	Data Time 0.001 (0.027)	Loss 3.0412 (3.0113)	Entropy 0.73146 (0.72966)	Top-1 acc 53.125 (51.731)	Top-5 acc 72.656 (74.782)	lr 0.02053
Train [34][1200/3239]	Time 0.227 (0.471)	Data Time 0.001 (0.027)	Loss 3.0574 (3.0113)	Entropy 0.73139 (0.72967)	Top-1 acc 52.734 (51.733)	Top-5 acc 74.219 (74.784)	lr 0.02053
Train [34][1210/3239]	Time 0.233 (0.471)	Data Time 0.001 (0.027)	Loss 3.0571 (3.0113)	Entropy 0.73165 (0.72969)	Top-1 acc 55.078 (51.739)	Top-5 acc 72.656 (74.775)	lr 0.02052
Train [34][1220/3239]	Time 0.356 (0.470)	Data Time 0.001 (0.027)	Loss 3.1453 (3.0119)	Entropy 0.73198 (0.72970)	Top-1 acc 45.703 (51.725)	Top-5 acc 74.219 (74.771)	lr 0.02052
Train [34][1230/3239]	Time 0.229 (0.470)	Data Time 0.001 (0.026)	Loss 3.0820 (3.0124)	Entropy 0.73213 (0.72972)	Top-1 acc 50.000 (51.720)	Top-5 acc 74.219 (74.764)	lr 0.02052
Train [34][1240/3239]	Time 0.233 (0.469)	Data Time 0.001 (0.026)	Loss 3.0415 (3.0125)	Entropy 0.73163 (0.72974)	Top-1 acc 50.391 (51.711)	Top-5 acc 75.000 (74.760)	lr 0.02052
Train [34][1250/3239]	Time 0.223 (0.469)	Data Time 0.001 (0.026)	Loss 2.8088 (3.0129)	Entropy 0.73103 (0.72975)	Top-1 acc 57.422 (51.705)	Top-5 acc 77.734 (74.749)	lr 0.02052
Train [34][1260/3239]	Time 0.236 (0.468)	Data Time 0.001 (0.026)	Loss 2.9509 (3.0131)	Entropy 0.73116 (0.72977)	Top-1 acc 52.734 (51.698)	Top-5 acc 78.516 (74.746)	lr 0.02052
Train [34][1270/3239]	Time 0.231 (0.468)	Data Time 0.001 (0.026)	Loss 3.2005 (3.0135)	Entropy 0.73126 (0.72978)	Top-1 acc 46.094 (51.685)	Top-5 acc 71.484 (74.740)	lr 0.02052
Train [34][1280/3239]	Time 0.231 (0.468)	Data Time 0.001 (0.025)	Loss 2.9578 (3.0131)	Entropy 0.73080 (0.72979)	Top-1 acc 53.516 (51.691)	Top-5 acc 79.297 (74.755)	lr 0.02052
Train [34][1290/3239]	Time 0.328 (0.467)	Data Time 0.001 (0.025)	Loss 2.8930 (3.0130)	Entropy 0.73094 (0.72980)	Top-1 acc 50.781 (51.685)	Top-5 acc 77.734 (74.765)	lr 0.02052
Train [34][1300/3239]	Time 0.229 (0.467)	Data Time 0.001 (0.025)	Loss 3.1281 (3.0134)	Entropy 0.73108 (0.72981)	Top-1 acc 48.047 (51.683)	Top-5 acc 72.656 (74.759)	lr 0.02052
Train [34][1310/3239]	Time 0.228 (0.466)	Data Time 0.001 (0.025)	Loss 2.9832 (3.0133)	Entropy 0.73127 (0.72982)	Top-1 acc 57.422 (51.681)	Top-5 acc 74.219 (74.757)	lr 0.02052
Train [34][1320/3239]	Time 0.224 (0.466)	Data Time 0.001 (0.025)	Loss 2.8009 (3.0133)	Entropy 0.73124 (0.72983)	Top-1 acc 54.688 (51.684)	Top-5 acc 80.469 (74.754)	lr 0.02052
Train [34][1330/3239]	Time 0.231 (0.465)	Data Time 0.001 (0.025)	Loss 2.9769 (3.0134)	Entropy 0.73114 (0.72984)	Top-1 acc 48.047 (51.680)	Top-5 acc 75.000 (74.757)	lr 0.02052
Train [34][1340/3239]	Time 0.219 (0.465)	Data Time 0.001 (0.024)	Loss 3.4704 (3.0135)	Entropy 0.73119 (0.72985)	Top-1 acc 43.359 (51.675)	Top-5 acc 63.672 (74.759)	lr 0.02051
Train [34][1350/3239]	Time 0.226 (0.464)	Data Time 0.001 (0.024)	Loss 3.1953 (3.0137)	Entropy 0.73128 (0.72986)	Top-1 acc 49.219 (51.673)	Top-5 acc 72.656 (74.758)	lr 0.02051
Train [34][1360/3239]	Time 0.266 (0.464)	Data Time 0.002 (0.024)	Loss 2.8569 (3.0142)	Entropy 0.73125 (0.72987)	Top-1 acc 54.688 (51.667)	Top-5 acc 77.344 (74.749)	lr 0.02051
Train [34][1370/3239]	Time 0.238 (0.464)	Data Time 0.001 (0.024)	Loss 2.8599 (3.0139)	Entropy 0.73156 (0.72988)	Top-1 acc 55.859 (51.666)	Top-5 acc 77.734 (74.756)	lr 0.02051
Train [34][1380/3239]	Time 0.247 (0.463)	Data Time 0.001 (0.024)	Loss 2.9912 (3.0141)	Entropy 0.73184 (0.72989)	Top-1 acc 51.172 (51.664)	Top-5 acc 74.219 (74.753)	lr 0.02051
Train [34][1390/3239]	Time 0.227 (0.463)	Data Time 0.001 (0.024)	Loss 3.0349 (3.0139)	Entropy 0.73155 (0.72991)	Top-1 acc 51.172 (51.670)	Top-5 acc 76.953 (74.757)	lr 0.02051
Train [34][1400/3239]	Time 0.237 (0.462)	Data Time 0.001 (0.023)	Loss 2.7504 (3.0134)	Entropy 0.73157 (0.72992)	Top-1 acc 56.641 (51.694)	Top-5 acc 78.906 (74.769)	lr 0.02051
Train [34][1410/3239]	Time 0.225 (0.462)	Data Time 0.001 (0.023)	Loss 2.9772 (3.0135)	Entropy 0.73145 (0.72993)	Top-1 acc 53.906 (51.686)	Top-5 acc 77.344 (74.769)	lr 0.02051
Train [34][1420/3239]	Time 0.235 (0.462)	Data Time 0.001 (0.023)	Loss 2.8654 (3.0136)	Entropy 0.73120 (0.72994)	Top-1 acc 52.734 (51.679)	Top-5 acc 77.344 (74.767)	lr 0.02051
Train [34][1430/3239]	Time 0.265 (0.461)	Data Time 0.001 (0.023)	Loss 2.9690 (3.0138)	Entropy 0.73129 (0.72995)	Top-1 acc 52.344 (51.676)	Top-5 acc 75.391 (74.760)	lr 0.02051
Train [34][1440/3239]	Time 0.222 (0.461)	Data Time 0.001 (0.023)	Loss 2.9739 (3.0139)	Entropy 0.73103 (0.72996)	Top-1 acc 51.953 (51.675)	Top-5 acc 75.000 (74.757)	lr 0.02051
Train [34][1450/3239]	Time 0.319 (0.461)	Data Time 0.001 (0.023)	Loss 3.1629 (3.0139)	Entropy 0.73094 (0.72996)	Top-1 acc 50.391 (51.684)	Top-5 acc 70.703 (74.754)	lr 0.02051
Train [34][1460/3239]	Time 0.223 (0.460)	Data Time 0.001 (0.022)	Loss 2.9218 (3.0139)	Entropy 0.73092 (0.72997)	Top-1 acc 52.344 (51.680)	Top-5 acc 77.734 (74.760)	lr 0.02051
Train [34][1470/3239]	Time 0.225 (0.460)	Data Time 0.001 (0.022)	Loss 3.0775 (3.0135)	Entropy 0.73048 (0.72998)	Top-1 acc 49.609 (51.692)	Top-5 acc 71.875 (74.767)	lr 0.02050
Train [34][1480/3239]	Time 0.226 (0.459)	Data Time 0.001 (0.022)	Loss 3.1028 (3.0132)	Entropy 0.73042 (0.72998)	Top-1 acc 47.266 (51.698)	Top-5 acc 71.484 (74.770)	lr 0.02050
Train [34][1490/3239]	Time 0.233 (0.459)	Data Time 0.001 (0.022)	Loss 3.0792 (3.0134)	Entropy 0.73033 (0.72998)	Top-1 acc 51.562 (51.690)	Top-5 acc 72.656 (74.766)	lr 0.02050
Train [34][1500/3239]	Time 0.237 (0.458)	Data Time 0.001 (0.022)	Loss 3.1017 (3.0138)	Entropy 0.73004 (0.72998)	Top-1 acc 49.609 (51.680)	Top-5 acc 75.000 (74.762)	lr 0.02050
Train [34][1510/3239]	Time 0.230 (0.458)	Data Time 0.001 (0.022)	Loss 2.9615 (3.0137)	Entropy 0.73018 (0.72998)	Top-1 acc 52.734 (51.683)	Top-5 acc 73.438 (74.762)	lr 0.02050
Train [34][1520/3239]	Time 0.317 (0.458)	Data Time 0.001 (0.022)	Loss 2.9865 (3.0134)	Entropy 0.72982 (0.72998)	Top-1 acc 51.562 (51.695)	Top-5 acc 74.219 (74.764)	lr 0.02050
Train [34][1530/3239]	Time 0.238 (0.457)	Data Time 0.001 (0.022)	Loss 3.1966 (3.0134)	Entropy 0.72951 (0.72998)	Top-1 acc 46.484 (51.695)	Top-5 acc 71.484 (74.769)	lr 0.02050
Train [34][1540/3239]	Time 0.229 (0.457)	Data Time 0.001 (0.021)	Loss 3.0235 (3.0136)	Entropy 0.72914 (0.72998)	Top-1 acc 50.000 (51.693)	Top-5 acc 73.047 (74.768)	lr 0.02050
Train [34][1550/3239]	Time 0.231 (0.456)	Data Time 0.001 (0.021)	Loss 2.8466 (3.0136)	Entropy 0.72946 (0.72997)	Top-1 acc 55.859 (51.682)	Top-5 acc 76.172 (74.766)	lr 0.02050
Train [34][1560/3239]	Time 0.212 (0.456)	Data Time 0.001 (0.021)	Loss 3.0599 (3.0136)	Entropy 0.72918 (0.72997)	Top-1 acc 52.344 (51.689)	Top-5 acc 75.000 (74.769)	lr 0.02050
Train [34][1570/3239]	Time 0.254 (0.456)	Data Time 0.001 (0.021)	Loss 2.7945 (3.0135)	Entropy 0.72921 (0.72996)	Top-1 acc 57.812 (51.699)	Top-5 acc 79.688 (74.768)	lr 0.02050
Train [34][1580/3239]	Time 0.225 (0.455)	Data Time 0.001 (0.021)	Loss 2.9286 (3.0134)	Entropy 0.72902 (0.72996)	Top-1 acc 53.906 (51.700)	Top-5 acc 74.609 (74.772)	lr 0.02050
Train [34][1590/3239]	Time 0.246 (0.455)	Data Time 0.001 (0.021)	Loss 3.1163 (3.0133)	Entropy 0.72884 (0.72995)	Top-1 acc 49.219 (51.697)	Top-5 acc 72.266 (74.770)	lr 0.02050
Train [34][1600/3239]	Time 0.226 (0.454)	Data Time 0.001 (0.021)	Loss 2.8609 (3.0132)	Entropy 0.72820 (0.72994)	Top-1 acc 54.688 (51.697)	Top-5 acc 77.734 (74.769)	lr 0.02049
Train [34][1610/3239]	Time 0.320 (0.454)	Data Time 0.001 (0.021)	Loss 2.9136 (3.0133)	Entropy 0.72808 (0.72993)	Top-1 acc 54.688 (51.700)	Top-5 acc 79.297 (74.766)	lr 0.02049
Train [34][1620/3239]	Time 0.217 (0.454)	Data Time 0.001 (0.020)	Loss 3.0588 (3.0139)	Entropy 0.72754 (0.72992)	Top-1 acc 51.172 (51.688)	Top-5 acc 74.219 (74.752)	lr 0.02049
Train [34][1630/3239]	Time 0.228 (0.453)	Data Time 0.001 (0.020)	Loss 3.0121 (3.0138)	Entropy 0.72798 (0.72991)	Top-1 acc 51.562 (51.688)	Top-5 acc 73.438 (74.755)	lr 0.02049
Train [34][1640/3239]	Time 0.234 (0.453)	Data Time 0.001 (0.020)	Loss 2.8654 (3.0139)	Entropy 0.72763 (0.72989)	Top-1 acc 51.953 (51.684)	Top-5 acc 77.734 (74.745)	lr 0.02049
Train [34][1650/3239]	Time 0.233 (0.453)	Data Time 0.001 (0.020)	Loss 2.9702 (3.0141)	Entropy 0.72755 (0.72988)	Top-1 acc 51.172 (51.682)	Top-5 acc 75.000 (74.743)	lr 0.02049
Train [34][1660/3239]	Time 0.222 (0.452)	Data Time 0.001 (0.020)	Loss 2.9199 (3.0143)	Entropy 0.72749 (0.72987)	Top-1 acc 51.172 (51.675)	Top-5 acc 75.000 (74.743)	lr 0.02049
Train [34][1670/3239]	Time 0.233 (0.452)	Data Time 0.001 (0.020)	Loss 2.8740 (3.0140)	Entropy 0.72759 (0.72985)	Top-1 acc 56.250 (51.683)	Top-5 acc 75.781 (74.748)	lr 0.02049
Train [34][1680/3239]	Time 0.319 (0.452)	Data Time 0.001 (0.020)	Loss 2.7954 (3.0138)	Entropy 0.72767 (0.72984)	Top-1 acc 53.906 (51.688)	Top-5 acc 78.125 (74.750)	lr 0.02049
Train [34][1690/3239]	Time 0.220 (0.451)	Data Time 0.001 (0.020)	Loss 3.2334 (3.0139)	Entropy 0.72765 (0.72983)	Top-1 acc 48.047 (51.686)	Top-5 acc 72.266 (74.752)	lr 0.02049
Train [34][1700/3239]	Time 0.230 (0.451)	Data Time 0.001 (0.020)	Loss 2.8435 (3.0141)	Entropy 0.72773 (0.72981)	Top-1 acc 58.984 (51.681)	Top-5 acc 76.953 (74.752)	lr 0.02049
Train [34][1710/3239]	Time 0.228 (0.451)	Data Time 0.001 (0.019)	Loss 3.1429 (3.0138)	Entropy 0.72798 (0.72980)	Top-1 acc 49.219 (51.688)	Top-5 acc 71.484 (74.756)	lr 0.02049
Train [34][1720/3239]	Time 0.223 (0.450)	Data Time 0.001 (0.019)	Loss 2.9023 (3.0138)	Entropy 0.72789 (0.72979)	Top-1 acc 53.125 (51.688)	Top-5 acc 76.172 (74.755)	lr 0.02049
Train [34][1730/3239]	Time 0.219 (0.450)	Data Time 0.001 (0.019)	Loss 2.8043 (3.0135)	Entropy 0.72784 (0.72978)	Top-1 acc 55.859 (51.693)	Top-5 acc 78.125 (74.755)	lr 0.02048
Train [34][1740/3239]	Time 0.232 (0.450)	Data Time 0.001 (0.019)	Loss 2.8734 (3.0134)	Entropy 0.72773 (0.72977)	Top-1 acc 54.297 (51.700)	Top-5 acc 78.125 (74.757)	lr 0.02048
Train [34][1750/3239]	Time 0.234 (0.450)	Data Time 0.001 (0.019)	Loss 2.9588 (3.0133)	Entropy 0.72717 (0.72976)	Top-1 acc 51.562 (51.705)	Top-5 acc 75.000 (74.762)	lr 0.02048
Train [34][1760/3239]	Time 0.237 (0.449)	Data Time 0.001 (0.019)	Loss 2.9605 (3.0131)	Entropy 0.72687 (0.72974)	Top-1 acc 57.812 (51.708)	Top-5 acc 76.562 (74.763)	lr 0.02048
Train [34][1770/3239]	Time 0.321 (0.449)	Data Time 0.001 (0.019)	Loss 2.8844 (3.0128)	Entropy 0.72671 (0.72972)	Top-1 acc 53.906 (51.715)	Top-5 acc 77.734 (74.772)	lr 0.02048
Train [34][1780/3239]	Time 0.324 (0.464)	Data Time 0.006 (0.019)	Loss 3.2111 (3.0129)	Entropy 0.72657 (0.72971)	Top-1 acc 45.312 (51.707)	Top-5 acc 70.703 (74.768)	lr 0.02048
Train [34][1790/3239]	Time 0.245 (0.464)	Data Time 0.002 (0.019)	Loss 2.8925 (3.0126)	Entropy 0.72627 (0.72969)	Top-1 acc 55.469 (51.712)	Top-5 acc 79.297 (74.774)	lr 0.02048
Train [34][1800/3239]	Time 0.235 (0.464)	Data Time 0.002 (0.019)	Loss 3.0006 (3.0131)	Entropy 0.72627 (0.72967)	Top-1 acc 51.953 (51.701)	Top-5 acc 74.219 (74.764)	lr 0.02048
Train [34][1810/3239]	Time 0.262 (0.463)	Data Time 0.003 (0.018)	Loss 3.0932 (3.0132)	Entropy 0.72564 (0.72965)	Top-1 acc 49.219 (51.697)	Top-5 acc 72.656 (74.757)	lr 0.02048
Train [34][1820/3239]	Time 0.276 (0.463)	Data Time 0.001 (0.018)	Loss 3.0684 (3.0134)	Entropy 0.72556 (0.72963)	Top-1 acc 51.172 (51.696)	Top-5 acc 73.438 (74.755)	lr 0.02048
Train [34][1830/3239]	Time 0.247 (0.463)	Data Time 0.001 (0.018)	Loss 2.9534 (3.0130)	Entropy 0.72541 (0.72960)	Top-1 acc 50.391 (51.704)	Top-5 acc 74.219 (74.761)	lr 0.02048
Train [34][1840/3239]	Time 0.327 (0.463)	Data Time 0.001 (0.018)	Loss 2.9443 (3.0129)	Entropy 0.72568 (0.72958)	Top-1 acc 50.000 (51.709)	Top-5 acc 79.688 (74.763)	lr 0.02048
Train [34][1850/3239]	Time 0.235 (0.462)	Data Time 0.001 (0.018)	Loss 3.0741 (3.0129)	Entropy 0.72587 (0.72956)	Top-1 acc 50.781 (51.707)	Top-5 acc 73.047 (74.760)	lr 0.02048
Train [34][1860/3239]	Time 0.236 (0.462)	Data Time 0.001 (0.018)	Loss 2.9909 (3.0130)	Entropy 0.72566 (0.72954)	Top-1 acc 50.781 (51.705)	Top-5 acc 75.781 (74.754)	lr 0.02047
Train [34][1870/3239]	Time 0.234 (0.462)	Data Time 0.001 (0.018)	Loss 3.1634 (3.0128)	Entropy 0.72573 (0.72952)	Top-1 acc 50.781 (51.708)	Top-5 acc 71.484 (74.757)	lr 0.02047
Train [34][1880/3239]	Time 0.230 (0.461)	Data Time 0.001 (0.018)	Loss 3.2215 (3.0132)	Entropy 0.72564 (0.72950)	Top-1 acc 42.578 (51.694)	Top-5 acc 69.922 (74.745)	lr 0.02047
Train [34][1890/3239]	Time 0.232 (0.461)	Data Time 0.001 (0.018)	Loss 2.8870 (3.0129)	Entropy 0.72589 (0.72948)	Top-1 acc 55.859 (51.698)	Top-5 acc 76.172 (74.747)	lr 0.02047
Train [34][1900/3239]	Time 0.225 (0.461)	Data Time 0.001 (0.018)	Loss 2.9991 (3.0131)	Entropy 0.72596 (0.72946)	Top-1 acc 48.828 (51.686)	Top-5 acc 74.609 (74.743)	lr 0.02047
Train [34][1910/3239]	Time 0.241 (0.461)	Data Time 0.001 (0.018)	Loss 2.9257 (3.0128)	Entropy 0.72598 (0.72944)	Top-1 acc 51.562 (51.694)	Top-5 acc 78.125 (74.753)	lr 0.02047
Train [34][1920/3239]	Time 0.223 (0.460)	Data Time 0.001 (0.018)	Loss 3.1450 (3.0127)	Entropy 0.72570 (0.72942)	Top-1 acc 45.312 (51.694)	Top-5 acc 74.219 (74.752)	lr 0.02047
Train [34][1930/3239]	Time 0.330 (0.460)	Data Time 0.001 (0.017)	Loss 2.8607 (3.0128)	Entropy 0.72559 (0.72940)	Top-1 acc 50.000 (51.688)	Top-5 acc 80.469 (74.756)	lr 0.02047
Train [34][1940/3239]	Time 0.249 (0.460)	Data Time 0.001 (0.017)	Loss 3.1874 (3.0126)	Entropy 0.72606 (0.72939)	Top-1 acc 50.000 (51.692)	Top-5 acc 70.312 (74.759)	lr 0.02047
Train [34][1950/3239]	Time 0.219 (0.460)	Data Time 0.001 (0.017)	Loss 2.8425 (3.0125)	Entropy 0.72566 (0.72937)	Top-1 acc 54.297 (51.693)	Top-5 acc 76.172 (74.762)	lr 0.02047
Train [34][1960/3239]	Time 0.255 (0.459)	Data Time 0.001 (0.017)	Loss 3.1457 (3.0124)	Entropy 0.72570 (0.72935)	Top-1 acc 44.922 (51.692)	Top-5 acc 74.219 (74.766)	lr 0.02047
Train [34][1970/3239]	Time 0.233 (0.459)	Data Time 0.001 (0.017)	Loss 3.0734 (3.0125)	Entropy 0.72584 (0.72933)	Top-1 acc 51.953 (51.691)	Top-5 acc 74.219 (74.757)	lr 0.02047
Train [34][1980/3239]	Time 0.221 (0.459)	Data Time 0.001 (0.017)	Loss 3.1430 (3.0127)	Entropy 0.72602 (0.72931)	Top-1 acc 52.344 (51.687)	Top-5 acc 71.484 (74.754)	lr 0.02046
Train [34][1990/3239]	Time 0.227 (0.459)	Data Time 0.001 (0.017)	Loss 2.9347 (3.0129)	Entropy 0.72589 (0.72930)	Top-1 acc 56.250 (51.683)	Top-5 acc 75.781 (74.744)	lr 0.02046
Train [34][2000/3239]	Time 0.330 (0.458)	Data Time 0.001 (0.017)	Loss 2.9756 (3.0128)	Entropy 0.72580 (0.72928)	Top-1 acc 54.297 (51.691)	Top-5 acc 75.000 (74.748)	lr 0.02046
Train [34][2010/3239]	Time 0.226 (0.458)	Data Time 0.001 (0.017)	Loss 2.8630 (3.0124)	Entropy 0.72575 (0.72926)	Top-1 acc 54.688 (51.694)	Top-5 acc 77.734 (74.758)	lr 0.02046
Train [34][2020/3239]	Time 0.226 (0.458)	Data Time 0.001 (0.017)	Loss 3.2188 (3.0127)	Entropy 0.72555 (0.72924)	Top-1 acc 47.266 (51.688)	Top-5 acc 72.656 (74.751)	lr 0.02046
Train [34][2030/3239]	Time 0.234 (0.457)	Data Time 0.001 (0.017)	Loss 3.0401 (3.0127)	Entropy 0.72547 (0.72923)	Top-1 acc 52.344 (51.686)	Top-5 acc 71.875 (74.749)	lr 0.02046
Train [34][2040/3239]	Time 0.223 (0.457)	Data Time 0.001 (0.017)	Loss 3.0262 (3.0128)	Entropy 0.72562 (0.72921)	Top-1 acc 48.828 (51.683)	Top-5 acc 71.875 (74.742)	lr 0.02046
Train [34][2050/3239]	Time 0.251 (0.457)	Data Time 0.001 (0.017)	Loss 3.2112 (3.0130)	Entropy 0.72572 (0.72919)	Top-1 acc 47.266 (51.682)	Top-5 acc 70.703 (74.735)	lr 0.02046
Train [34][2060/3239]	Time 0.265 (0.457)	Data Time 0.001 (0.016)	Loss 3.1789 (3.0133)	Entropy 0.72560 (0.72917)	Top-1 acc 46.875 (51.676)	Top-5 acc 73.047 (74.731)	lr 0.02046
Train [34][2070/3239]	Time 0.231 (0.457)	Data Time 0.001 (0.016)	Loss 2.9853 (3.0133)	Entropy 0.72584 (0.72916)	Top-1 acc 50.000 (51.675)	Top-5 acc 73.438 (74.728)	lr 0.02046
Train [34][2080/3239]	Time 0.226 (0.456)	Data Time 0.001 (0.016)	Loss 3.1770 (3.0134)	Entropy 0.72543 (0.72914)	Top-1 acc 48.438 (51.669)	Top-5 acc 67.969 (74.726)	lr 0.02046
Train [34][2090/3239]	Time 0.276 (0.456)	Data Time 0.002 (0.016)	Loss 3.1799 (3.0136)	Entropy 0.72543 (0.72912)	Top-1 acc 50.781 (51.666)	Top-5 acc 73.047 (74.724)	lr 0.02046
Train [34][2100/3239]	Time 0.232 (0.456)	Data Time 0.001 (0.016)	Loss 2.9607 (3.0135)	Entropy 0.72532 (0.72911)	Top-1 acc 53.516 (51.666)	Top-5 acc 78.516 (74.730)	lr 0.02046
Train [34][2110/3239]	Time 0.230 (0.456)	Data Time 0.001 (0.016)	Loss 3.0637 (3.0139)	Entropy 0.72554 (0.72909)	Top-1 acc 53.906 (51.657)	Top-5 acc 73.047 (74.721)	lr 0.02045
Train [34][2120/3239]	Time 0.225 (0.456)	Data Time 0.001 (0.016)	Loss 2.9273 (3.0140)	Entropy 0.72569 (0.72907)	Top-1 acc 51.953 (51.651)	Top-5 acc 77.344 (74.716)	lr 0.02045
Train [34][2130/3239]	Time 0.229 (0.456)	Data Time 0.001 (0.016)	Loss 2.9226 (3.0140)	Entropy 0.72551 (0.72906)	Top-1 acc 53.125 (51.650)	Top-5 acc 77.734 (74.722)	lr 0.02045
Train [34][2140/3239]	Time 0.224 (0.455)	Data Time 0.001 (0.016)	Loss 3.0884 (3.0139)	Entropy 0.72541 (0.72904)	Top-1 acc 49.609 (51.653)	Top-5 acc 74.609 (74.722)	lr 0.02045
Train [34][2150/3239]	Time 0.220 (0.455)	Data Time 0.001 (0.016)	Loss 3.0164 (3.0141)	Entropy 0.72525 (0.72902)	Top-1 acc 51.172 (51.649)	Top-5 acc 75.000 (74.717)	lr 0.02045
Train [34][2160/3239]	Time 0.321 (0.455)	Data Time 0.001 (0.016)	Loss 2.8652 (3.0141)	Entropy 0.72490 (0.72900)	Top-1 acc 57.812 (51.650)	Top-5 acc 76.172 (74.715)	lr 0.02045
Train [34][2170/3239]	Time 0.223 (0.455)	Data Time 0.001 (0.016)	Loss 3.1233 (3.0142)	Entropy 0.72472 (0.72898)	Top-1 acc 50.000 (51.649)	Top-5 acc 70.312 (74.715)	lr 0.02045
Train [34][2180/3239]	Time 0.229 (0.454)	Data Time 0.001 (0.016)	Loss 2.7540 (3.0140)	Entropy 0.72461 (0.72896)	Top-1 acc 60.547 (51.653)	Top-5 acc 79.297 (74.722)	lr 0.02045
Train [34][2190/3239]	Time 0.228 (0.454)	Data Time 0.001 (0.016)	Loss 2.9524 (3.0140)	Entropy 0.72501 (0.72895)	Top-1 acc 55.078 (51.648)	Top-5 acc 75.781 (74.721)	lr 0.02045
Train [34][2200/3239]	Time 0.229 (0.454)	Data Time 0.001 (0.015)	Loss 2.9931 (3.0141)	Entropy 0.72513 (0.72893)	Top-1 acc 49.609 (51.647)	Top-5 acc 73.438 (74.720)	lr 0.02045
Train [34][2210/3239]	Time 0.235 (0.454)	Data Time 0.001 (0.015)	Loss 3.0598 (3.0141)	Entropy 0.72479 (0.72891)	Top-1 acc 53.516 (51.648)	Top-5 acc 72.266 (74.721)	lr 0.02045
Train [34][2220/3239]	Time 0.242 (0.453)	Data Time 0.001 (0.015)	Loss 2.8713 (3.0145)	Entropy 0.72495 (0.72889)	Top-1 acc 55.859 (51.635)	Top-5 acc 76.953 (74.710)	lr 0.02045
Train [34][2230/3239]	Time 0.318 (0.453)	Data Time 0.001 (0.015)	Loss 2.8011 (3.0143)	Entropy 0.72533 (0.72887)	Top-1 acc 57.422 (51.641)	Top-5 acc 78.516 (74.717)	lr 0.02045
Train [34][2240/3239]	Time 0.221 (0.453)	Data Time 0.001 (0.015)	Loss 2.9110 (3.0143)	Entropy 0.72542 (0.72886)	Top-1 acc 51.953 (51.643)	Top-5 acc 75.781 (74.715)	lr 0.02044
Train [34][2250/3239]	Time 0.232 (0.453)	Data Time 0.001 (0.015)	Loss 3.1185 (3.0143)	Entropy 0.72531 (0.72884)	Top-1 acc 48.828 (51.641)	Top-5 acc 73.438 (74.717)	lr 0.02044
Train [34][2260/3239]	Time 0.231 (0.452)	Data Time 0.001 (0.015)	Loss 2.9428 (3.0139)	Entropy 0.72504 (0.72883)	Top-1 acc 55.859 (51.651)	Top-5 acc 75.391 (74.725)	lr 0.02044
Train [34][2270/3239]	Time 0.243 (0.452)	Data Time 0.001 (0.015)	Loss 3.1032 (3.0140)	Entropy 0.72518 (0.72881)	Top-1 acc 48.047 (51.647)	Top-5 acc 73.438 (74.721)	lr 0.02044
Train [34][2280/3239]	Time 0.225 (0.452)	Data Time 0.001 (0.015)	Loss 2.8893 (3.0140)	Entropy 0.72513 (0.72880)	Top-1 acc 57.031 (51.650)	Top-5 acc 78.125 (74.717)	lr 0.02044
Train [34][2290/3239]	Time 0.231 (0.452)	Data Time 0.001 (0.015)	Loss 3.1096 (3.0141)	Entropy 0.72490 (0.72878)	Top-1 acc 50.781 (51.649)	Top-5 acc 72.266 (74.712)	lr 0.02044
Train [34][2300/3239]	Time 0.211 (0.451)	Data Time 0.001 (0.015)	Loss 3.1889 (3.0142)	Entropy 0.72523 (0.72876)	Top-1 acc 45.703 (51.650)	Top-5 acc 73.047 (74.711)	lr 0.02044
Train [34][2310/3239]	Time 0.235 (0.451)	Data Time 0.001 (0.015)	Loss 2.7944 (3.0141)	Entropy 0.72490 (0.72875)	Top-1 acc 54.688 (51.654)	Top-5 acc 76.953 (74.711)	lr 0.02044
Train [34][2320/3239]	Time 0.327 (0.451)	Data Time 0.001 (0.015)	Loss 3.0425 (3.0143)	Entropy 0.72484 (0.72873)	Top-1 acc 51.172 (51.647)	Top-5 acc 73.047 (74.707)	lr 0.02044
Train [34][2330/3239]	Time 0.219 (0.451)	Data Time 0.001 (0.015)	Loss 3.1711 (3.0144)	Entropy 0.72450 (0.72871)	Top-1 acc 51.953 (51.647)	Top-5 acc 70.703 (74.701)	lr 0.02044
Train [34][2340/3239]	Time 0.230 (0.450)	Data Time 0.001 (0.015)	Loss 3.0483 (3.0142)	Entropy 0.72442 (0.72870)	Top-1 acc 49.219 (51.650)	Top-5 acc 76.562 (74.704)	lr 0.02044
Train [34][2350/3239]	Time 0.244 (0.450)	Data Time 0.001 (0.015)	Loss 3.0728 (3.0141)	Entropy 0.72448 (0.72868)	Top-1 acc 51.953 (51.649)	Top-5 acc 70.703 (74.704)	lr 0.02044
Train [34][2360/3239]	Time 0.227 (0.450)	Data Time 0.001 (0.015)	Loss 2.8179 (3.0139)	Entropy 0.72453 (0.72866)	Top-1 acc 56.250 (51.656)	Top-5 acc 78.516 (74.711)	lr 0.02044
Train [34][2370/3239]	Time 0.236 (0.450)	Data Time 0.001 (0.015)	Loss 2.8089 (3.0136)	Entropy 0.72453 (0.72864)	Top-1 acc 56.250 (51.661)	Top-5 acc 78.125 (74.716)	lr 0.02043
Train [34][2380/3239]	Time 0.226 (0.450)	Data Time 0.001 (0.014)	Loss 3.0380 (3.0134)	Entropy 0.72445 (0.72862)	Top-1 acc 51.172 (51.667)	Top-5 acc 72.266 (74.719)	lr 0.02043
Train [34][2390/3239]	Time 0.329 (0.449)	Data Time 0.002 (0.014)	Loss 3.0956 (3.0134)	Entropy 0.72461 (0.72861)	Top-1 acc 48.438 (51.663)	Top-5 acc 74.609 (74.715)	lr 0.02043
Train [34][2400/3239]	Time 0.232 (0.449)	Data Time 0.001 (0.014)	Loss 2.8983 (3.0131)	Entropy 0.72456 (0.72859)	Top-1 acc 50.391 (51.671)	Top-5 acc 78.125 (74.722)	lr 0.02043
Train [34][2410/3239]	Time 0.233 (0.449)	Data Time 0.001 (0.014)	Loss 2.9085 (3.0131)	Entropy 0.72419 (0.72857)	Top-1 acc 57.031 (51.676)	Top-5 acc 75.781 (74.721)	lr 0.02043
Train [34][2420/3239]	Time 0.233 (0.449)	Data Time 0.001 (0.014)	Loss 2.9743 (3.0132)	Entropy 0.72379 (0.72855)	Top-1 acc 54.688 (51.674)	Top-5 acc 74.609 (74.719)	lr 0.02043
Train [34][2430/3239]	Time 0.218 (0.448)	Data Time 0.001 (0.014)	Loss 3.0190 (3.0133)	Entropy 0.72361 (0.72853)	Top-1 acc 50.391 (51.671)	Top-5 acc 74.219 (74.718)	lr 0.02043
Train [34][2440/3239]	Time 0.227 (0.460)	Data Time 0.002 (0.014)	Loss 3.1151 (3.0136)	Entropy 0.72382 (0.72851)	Top-1 acc 44.531 (51.658)	Top-5 acc 73.438 (74.714)	lr 0.02043
Train [34][2450/3239]	Time 0.230 (0.459)	Data Time 0.002 (0.014)	Loss 3.1067 (3.0139)	Entropy 0.72333 (0.72849)	Top-1 acc 48.828 (51.657)	Top-5 acc 76.562 (74.711)	lr 0.02043
Train [34][2460/3239]	Time 0.236 (0.459)	Data Time 0.002 (0.014)	Loss 2.9794 (3.0138)	Entropy 0.72327 (0.72847)	Top-1 acc 48.828 (51.657)	Top-5 acc 77.734 (74.713)	lr 0.02043
Train [34][2470/3239]	Time 0.234 (0.459)	Data Time 0.001 (0.014)	Loss 2.8610 (3.0141)	Entropy 0.72350 (0.72845)	Top-1 acc 51.172 (51.645)	Top-5 acc 77.734 (74.707)	lr 0.02043
Train [34][2480/3239]	Time 0.348 (0.459)	Data Time 0.001 (0.014)	Loss 3.0286 (3.0138)	Entropy 0.72328 (0.72843)	Top-1 acc 49.609 (51.649)	Top-5 acc 75.781 (74.712)	lr 0.02043
Train [34][2490/3239]	Time 0.225 (0.458)	Data Time 0.001 (0.014)	Loss 2.8104 (3.0137)	Entropy 0.72365 (0.72841)	Top-1 acc 58.594 (51.655)	Top-5 acc 76.172 (74.719)	lr 0.02043
Train [34][2500/3239]	Time 0.267 (0.458)	Data Time 0.001 (0.014)	Loss 2.9097 (3.0136)	Entropy 0.72340 (0.72839)	Top-1 acc 55.859 (51.655)	Top-5 acc 78.125 (74.722)	lr 0.02042
Train [34][2510/3239]	Time 0.231 (0.458)	Data Time 0.001 (0.014)	Loss 2.9169 (3.0137)	Entropy 0.72288 (0.72837)	Top-1 acc 52.734 (51.654)	Top-5 acc 78.906 (74.722)	lr 0.02042
Train [34][2520/3239]	Time 0.229 (0.458)	Data Time 0.001 (0.014)	Loss 2.9765 (3.0139)	Entropy 0.72276 (0.72835)	Top-1 acc 53.125 (51.652)	Top-5 acc 76.172 (74.721)	lr 0.02042
Train [34][2530/3239]	Time 0.223 (0.458)	Data Time 0.001 (0.014)	Loss 2.9738 (3.0139)	Entropy 0.72239 (0.72833)	Top-1 acc 51.953 (51.647)	Top-5 acc 76.562 (74.722)	lr 0.02042
Train [34][2540/3239]	Time 0.238 (0.457)	Data Time 0.001 (0.014)	Loss 2.8735 (3.0139)	Entropy 0.72269 (0.72830)	Top-1 acc 57.812 (51.655)	Top-5 acc 77.734 (74.725)	lr 0.02042
Train [34][2550/3239]	Time 0.327 (0.457)	Data Time 0.001 (0.014)	Loss 2.8350 (3.0141)	Entropy 0.72228 (0.72828)	Top-1 acc 57.031 (51.653)	Top-5 acc 79.297 (74.721)	lr 0.02042
Train [34][2560/3239]	Time 0.218 (0.457)	Data Time 0.001 (0.014)	Loss 2.9558 (3.0142)	Entropy 0.72251 (0.72826)	Top-1 acc 52.734 (51.652)	Top-5 acc 76.172 (74.721)	lr 0.02042
Train [34][2570/3239]	Time 0.244 (0.457)	Data Time 0.001 (0.014)	Loss 2.9959 (3.0141)	Entropy 0.72271 (0.72824)	Top-1 acc 55.078 (51.661)	Top-5 acc 76.172 (74.724)	lr 0.02042
Train [34][2580/3239]	Time 0.232 (0.457)	Data Time 0.001 (0.013)	Loss 2.8467 (3.0139)	Entropy 0.72260 (0.72821)	Top-1 acc 58.203 (51.663)	Top-5 acc 80.469 (74.727)	lr 0.02042
Train [34][2590/3239]	Time 0.217 (0.456)	Data Time 0.001 (0.013)	Loss 2.9964 (3.0139)	Entropy 0.72278 (0.72819)	Top-1 acc 50.000 (51.664)	Top-5 acc 77.734 (74.729)	lr 0.02042
Train [34][2600/3239]	Time 0.228 (0.456)	Data Time 0.001 (0.013)	Loss 3.0594 (3.0139)	Entropy 0.72286 (0.72817)	Top-1 acc 51.562 (51.667)	Top-5 acc 76.562 (74.727)	lr 0.02042
Train [34][2610/3239]	Time 0.221 (0.456)	Data Time 0.001 (0.013)	Loss 3.2087 (3.0138)	Entropy 0.72289 (0.72815)	Top-1 acc 48.828 (51.668)	Top-5 acc 72.656 (74.730)	lr 0.02042
Train [34][2620/3239]	Time 0.248 (0.456)	Data Time 0.002 (0.013)	Loss 2.8790 (3.0137)	Entropy 0.72320 (0.72813)	Top-1 acc 51.172 (51.673)	Top-5 acc 74.609 (74.732)	lr 0.02042
Train [34][2630/3239]	Time 0.231 (0.456)	Data Time 0.001 (0.013)	Loss 3.0206 (3.0138)	Entropy 0.72332 (0.72811)	Top-1 acc 50.391 (51.671)	Top-5 acc 76.562 (74.731)	lr 0.02041
Train [34][2640/3239]	Time 0.247 (0.456)	Data Time 0.001 (0.013)	Loss 3.1410 (3.0140)	Entropy 0.72322 (0.72810)	Top-1 acc 46.875 (51.668)	Top-5 acc 73.047 (74.728)	lr 0.02041
Train [34][2650/3239]	Time 0.223 (0.455)	Data Time 0.001 (0.013)	Loss 3.0747 (3.0141)	Entropy 0.72323 (0.72808)	Top-1 acc 50.000 (51.663)	Top-5 acc 75.391 (74.730)	lr 0.02041
Train [34][2660/3239]	Time 0.214 (0.455)	Data Time 0.001 (0.013)	Loss 2.7898 (3.0138)	Entropy 0.72295 (0.72806)	Top-1 acc 56.641 (51.672)	Top-5 acc 78.516 (74.734)	lr 0.02041
Train [34][2670/3239]	Time 0.231 (0.455)	Data Time 0.001 (0.013)	Loss 2.9937 (3.0137)	Entropy 0.72303 (0.72804)	Top-1 acc 49.609 (51.678)	Top-5 acc 78.516 (74.739)	lr 0.02041
Train [34][2680/3239]	Time 0.222 (0.455)	Data Time 0.001 (0.013)	Loss 2.9807 (3.0136)	Entropy 0.72319 (0.72802)	Top-1 acc 48.828 (51.675)	Top-5 acc 78.125 (74.740)	lr 0.02041
Train [34][2690/3239]	Time 0.283 (0.455)	Data Time 0.001 (0.013)	Loss 3.1852 (3.0137)	Entropy 0.72307 (0.72800)	Top-1 acc 51.172 (51.675)	Top-5 acc 71.094 (74.739)	lr 0.02041
Train [34][2700/3239]	Time 0.261 (0.454)	Data Time 0.001 (0.013)	Loss 2.8772 (3.0134)	Entropy 0.72319 (0.72798)	Top-1 acc 59.375 (51.679)	Top-5 acc 76.172 (74.744)	lr 0.02041
Train [34][2710/3239]	Time 0.348 (0.454)	Data Time 0.001 (0.013)	Loss 3.2611 (3.0138)	Entropy 0.72319 (0.72797)	Top-1 acc 45.312 (51.672)	Top-5 acc 67.578 (74.737)	lr 0.02041
Train [34][2720/3239]	Time 0.225 (0.454)	Data Time 0.001 (0.013)	Loss 2.9225 (3.0138)	Entropy 0.72290 (0.72795)	Top-1 acc 54.688 (51.672)	Top-5 acc 74.609 (74.732)	lr 0.02041
Train [34][2730/3239]	Time 0.246 (0.454)	Data Time 0.001 (0.013)	Loss 3.2029 (3.0135)	Entropy 0.72250 (0.72793)	Top-1 acc 45.312 (51.674)	Top-5 acc 70.703 (74.736)	lr 0.02041
Train [34][2740/3239]	Time 0.230 (0.454)	Data Time 0.001 (0.013)	Loss 2.9643 (3.0136)	Entropy 0.72238 (0.72791)	Top-1 acc 47.656 (51.668)	Top-5 acc 76.172 (74.734)	lr 0.02041
Train [34][2750/3239]	Time 0.227 (0.454)	Data Time 0.001 (0.013)	Loss 3.0304 (3.0136)	Entropy 0.72248 (0.72789)	Top-1 acc 53.125 (51.670)	Top-5 acc 75.781 (74.735)	lr 0.02040
Train [34][2760/3239]	Time 0.233 (0.454)	Data Time 0.001 (0.013)	Loss 3.0616 (3.0137)	Entropy 0.72279 (0.72787)	Top-1 acc 51.562 (51.668)	Top-5 acc 71.094 (74.733)	lr 0.02040
Train [34][2770/3239]	Time 0.227 (0.453)	Data Time 0.001 (0.013)	Loss 3.0441 (3.0138)	Entropy 0.72294 (0.72785)	Top-1 acc 50.391 (51.671)	Top-5 acc 74.609 (74.733)	lr 0.02040
Train [34][2780/3239]	Time 0.325 (0.453)	Data Time 0.001 (0.013)	Loss 2.8931 (3.0139)	Entropy 0.72272 (0.72784)	Top-1 acc 49.609 (51.663)	Top-5 acc 77.344 (74.730)	lr 0.02040
Train [34][2790/3239]	Time 0.215 (0.453)	Data Time 0.001 (0.013)	Loss 3.0344 (3.0138)	Entropy 0.72266 (0.72782)	Top-1 acc 52.734 (51.670)	Top-5 acc 75.781 (74.734)	lr 0.02040
Train [34][2800/3239]	Time 0.221 (0.453)	Data Time 0.001 (0.013)	Loss 3.1337 (3.0137)	Entropy 0.72277 (0.72780)	Top-1 acc 45.312 (51.671)	Top-5 acc 75.391 (74.739)	lr 0.02040
Train [34][2810/3239]	Time 0.221 (0.453)	Data Time 0.001 (0.013)	Loss 3.1060 (3.0138)	Entropy 0.72287 (0.72778)	Top-1 acc 52.344 (51.668)	Top-5 acc 73.047 (74.739)	lr 0.02040
Train [34][2820/3239]	Time 0.236 (0.453)	Data Time 0.001 (0.012)	Loss 2.9251 (3.0135)	Entropy 0.72323 (0.72776)	Top-1 acc 52.734 (51.677)	Top-5 acc 78.516 (74.748)	lr 0.02040
Train [34][2830/3239]	Time 0.228 (0.452)	Data Time 0.001 (0.012)	Loss 2.8616 (3.0131)	Entropy 0.72346 (0.72775)	Top-1 acc 55.469 (51.682)	Top-5 acc 76.562 (74.756)	lr 0.02040
Train [34][2840/3239]	Time 0.225 (0.452)	Data Time 0.001 (0.012)	Loss 2.8934 (3.0130)	Entropy 0.72333 (0.72773)	Top-1 acc 53.906 (51.683)	Top-5 acc 76.172 (74.758)	lr 0.02040
Train [34][2850/3239]	Time 0.232 (0.452)	Data Time 0.001 (0.012)	Loss 3.0995 (3.0130)	Entropy 0.72331 (0.72772)	Top-1 acc 49.219 (51.684)	Top-5 acc 73.047 (74.756)	lr 0.02040
Train [34][2860/3239]	Time 0.229 (0.452)	Data Time 0.001 (0.012)	Loss 2.9231 (3.0130)	Entropy 0.72301 (0.72770)	Top-1 acc 54.297 (51.686)	Top-5 acc 76.562 (74.758)	lr 0.02040
Train [34][2870/3239]	Time 0.313 (0.452)	Data Time 0.001 (0.012)	Loss 2.9147 (3.0130)	Entropy 0.72289 (0.72769)	Top-1 acc 54.297 (51.683)	Top-5 acc 76.562 (74.757)	lr 0.02040
Train [34][2880/3239]	Time 0.227 (0.451)	Data Time 0.001 (0.012)	Loss 2.7548 (3.0129)	Entropy 0.72296 (0.72767)	Top-1 acc 52.734 (51.681)	Top-5 acc 82.422 (74.757)	lr 0.02039
Train [34][2890/3239]	Time 0.227 (0.451)	Data Time 0.001 (0.012)	Loss 2.8427 (3.0130)	Entropy 0.72257 (0.72765)	Top-1 acc 50.781 (51.682)	Top-5 acc 76.953 (74.754)	lr 0.02039
Train [34][2900/3239]	Time 0.222 (0.451)	Data Time 0.001 (0.012)	Loss 2.8925 (3.0131)	Entropy 0.72178 (0.72763)	Top-1 acc 55.469 (51.680)	Top-5 acc 75.000 (74.749)	lr 0.02039
Train [34][2910/3239]	Time 0.222 (0.451)	Data Time 0.001 (0.012)	Loss 2.9650 (3.0130)	Entropy 0.72119 (0.72761)	Top-1 acc 52.344 (51.678)	Top-5 acc 77.344 (74.752)	lr 0.02039
Train [34][2920/3239]	Time 0.230 (0.451)	Data Time 0.001 (0.012)	Loss 2.9221 (3.0128)	Entropy 0.72119 (0.72759)	Top-1 acc 52.734 (51.680)	Top-5 acc 76.172 (74.757)	lr 0.02039
Train [34][2930/3239]	Time 0.230 (0.450)	Data Time 0.001 (0.012)	Loss 2.8549 (3.0128)	Entropy 0.72081 (0.72757)	Top-1 acc 52.734 (51.679)	Top-5 acc 77.344 (74.756)	lr 0.02039
Train [34][2940/3239]	Time 0.311 (0.450)	Data Time 0.001 (0.012)	Loss 3.0330 (3.0129)	Entropy 0.72092 (0.72755)	Top-1 acc 49.219 (51.677)	Top-5 acc 73.828 (74.755)	lr 0.02039
Train [34][2950/3239]	Time 0.230 (0.450)	Data Time 0.001 (0.012)	Loss 3.1262 (3.0130)	Entropy 0.72118 (0.72752)	Top-1 acc 48.438 (51.673)	Top-5 acc 72.266 (74.750)	lr 0.02039
Train [34][2960/3239]	Time 0.218 (0.450)	Data Time 0.001 (0.012)	Loss 3.1082 (3.0132)	Entropy 0.72088 (0.72750)	Top-1 acc 51.562 (51.672)	Top-5 acc 71.094 (74.747)	lr 0.02039
Train [34][2970/3239]	Time 0.233 (0.450)	Data Time 0.001 (0.012)	Loss 2.8787 (3.0130)	Entropy 0.72102 (0.72748)	Top-1 acc 53.125 (51.678)	Top-5 acc 78.906 (74.753)	lr 0.02039
Train [34][2980/3239]	Time 0.234 (0.450)	Data Time 0.001 (0.012)	Loss 2.9241 (3.0128)	Entropy 0.72101 (0.72746)	Top-1 acc 51.172 (51.679)	Top-5 acc 78.906 (74.757)	lr 0.02039
Train [34][2990/3239]	Time 0.224 (0.449)	Data Time 0.001 (0.012)	Loss 3.0106 (3.0128)	Entropy 0.72095 (0.72744)	Top-1 acc 50.781 (51.680)	Top-5 acc 74.609 (74.759)	lr 0.02039
Train [34][3000/3239]	Time 0.228 (0.449)	Data Time 0.001 (0.012)	Loss 3.1998 (3.0128)	Entropy 0.72057 (0.72741)	Top-1 acc 47.656 (51.678)	Top-5 acc 68.359 (74.755)	lr 0.02039
Train [34][3010/3239]	Time 0.224 (0.449)	Data Time 0.001 (0.012)	Loss 3.1369 (3.0131)	Entropy 0.72063 (0.72739)	Top-1 acc 47.656 (51.673)	Top-5 acc 70.703 (74.747)	lr 0.02038
Train [34][3020/3239]	Time 0.224 (0.449)	Data Time 0.001 (0.012)	Loss 2.9654 (3.0129)	Entropy 0.72053 (0.72737)	Top-1 acc 54.297 (51.676)	Top-5 acc 76.172 (74.748)	lr 0.02038
Train [34][3030/3239]	Time 0.317 (0.449)	Data Time 0.001 (0.012)	Loss 3.0619 (3.0131)	Entropy 0.72049 (0.72735)	Top-1 acc 52.344 (51.672)	Top-5 acc 72.656 (74.746)	lr 0.02038
Train [34][3040/3239]	Time 0.233 (0.448)	Data Time 0.001 (0.012)	Loss 2.8657 (3.0131)	Entropy 0.72057 (0.72732)	Top-1 acc 53.906 (51.670)	Top-5 acc 80.078 (74.745)	lr 0.02038
Train [34][3050/3239]	Time 0.229 (0.448)	Data Time 0.002 (0.012)	Loss 2.8854 (3.0130)	Entropy 0.72040 (0.72730)	Top-1 acc 56.641 (51.673)	Top-5 acc 77.734 (74.747)	lr 0.02038
Train [34][3060/3239]	Time 0.222 (0.448)	Data Time 0.001 (0.012)	Loss 3.0806 (3.0132)	Entropy 0.72048 (0.72728)	Top-1 acc 50.000 (51.665)	Top-5 acc 75.000 (74.744)	lr 0.02038
Train [34][3070/3239]	Time 0.224 (0.448)	Data Time 0.001 (0.012)	Loss 2.9172 (3.0131)	Entropy 0.72038 (0.72726)	Top-1 acc 53.516 (51.669)	Top-5 acc 78.516 (74.747)	lr 0.02038
Train [34][3080/3239]	Time 0.242 (0.448)	Data Time 0.001 (0.012)	Loss 2.8835 (3.0130)	Entropy 0.72039 (0.72724)	Top-1 acc 54.688 (51.670)	Top-5 acc 75.391 (74.750)	lr 0.02038
Train [34][3090/3239]	Time 0.305 (0.456)	Data Time 0.004 (0.012)	Loss 2.9189 (3.0129)	Entropy 0.72013 (0.72721)	Top-1 acc 53.906 (51.676)	Top-5 acc 77.734 (74.752)	lr 0.02038
Train [34][3100/3239]	Time 0.340 (0.456)	Data Time 0.002 (0.011)	Loss 2.8304 (3.0126)	Entropy 0.72007 (0.72719)	Top-1 acc 57.031 (51.682)	Top-5 acc 78.516 (74.759)	lr 0.02038
Train [34][3110/3239]	Time 0.231 (0.456)	Data Time 0.001 (0.011)	Loss 2.9969 (3.0128)	Entropy 0.72028 (0.72717)	Top-1 acc 51.562 (51.675)	Top-5 acc 76.562 (74.757)	lr 0.02038
Train [34][3120/3239]	Time 0.233 (0.456)	Data Time 0.001 (0.011)	Loss 2.9899 (3.0127)	Entropy 0.72052 (0.72715)	Top-1 acc 53.516 (51.681)	Top-5 acc 76.953 (74.759)	lr 0.02038
Train [34][3130/3239]	Time 0.233 (0.456)	Data Time 0.002 (0.011)	Loss 3.1857 (3.0127)	Entropy 0.72072 (0.72713)	Top-1 acc 48.828 (51.679)	Top-5 acc 72.266 (74.759)	lr 0.02038
Train [34][3140/3239]	Time 0.240 (0.456)	Data Time 0.001 (0.011)	Loss 3.0233 (3.0127)	Entropy 0.72055 (0.72711)	Top-1 acc 50.000 (51.677)	Top-5 acc 73.438 (74.757)	lr 0.02037
Train [34][3150/3239]	Time 0.236 (0.456)	Data Time 0.001 (0.011)	Loss 2.9153 (3.0128)	Entropy 0.72028 (0.72708)	Top-1 acc 53.516 (51.675)	Top-5 acc 75.391 (74.753)	lr 0.02037
Train [34][3160/3239]	Time 0.255 (0.456)	Data Time 0.001 (0.011)	Loss 2.8486 (3.0128)	Entropy 0.72031 (0.72706)	Top-1 acc 55.078 (51.678)	Top-5 acc 77.344 (74.751)	lr 0.02037
Train [34][3170/3239]	Time 0.245 (0.456)	Data Time 0.001 (0.011)	Loss 3.2810 (3.0130)	Entropy 0.72010 (0.72704)	Top-1 acc 47.656 (51.678)	Top-5 acc 71.875 (74.749)	lr 0.02037
Train [34][3180/3239]	Time 0.227 (0.455)	Data Time 0.000 (0.011)	Loss 3.2028 (3.0128)	Entropy 0.72029 (0.72702)	Top-1 acc 46.875 (51.682)	Top-5 acc 68.359 (74.752)	lr 0.02037
Train [34][3190/3239]	Time 0.352 (0.455)	Data Time 0.000 (0.011)	Loss 2.7023 (3.0127)	Entropy 0.72041 (0.72700)	Top-1 acc 60.547 (51.684)	Top-5 acc 81.641 (74.754)	lr 0.02037
Train [34][3200/3239]	Time 0.245 (0.455)	Data Time 0.000 (0.011)	Loss 3.2559 (3.0128)	Entropy 0.72037 (0.72698)	Top-1 acc 44.531 (51.684)	Top-5 acc 68.359 (74.752)	lr 0.02037
Train [34][3210/3239]	Time 0.239 (0.455)	Data Time 0.000 (0.011)	Loss 2.8956 (3.0129)	Entropy 0.72007 (0.72696)	Top-1 acc 57.422 (51.686)	Top-5 acc 76.953 (74.748)	lr 0.02037
Train [34][3220/3239]	Time 0.244 (0.455)	Data Time 0.000 (0.011)	Loss 2.7406 (3.0132)	Entropy 0.71989 (0.72694)	Top-1 acc 62.891 (51.679)	Top-5 acc 80.859 (74.745)	lr 0.02037
Train [34][3230/3239]	Time 0.246 (0.455)	Data Time 0.000 (0.011)	Loss 2.9284 (3.0132)	Entropy 0.71958 (0.72691)	Top-1 acc 55.859 (51.676)	Top-5 acc 75.000 (74.744)	lr 0.02037
Train [34][3239/3239]	Time 1.060 (0.455)	Data Time 0.000 (0.011)	Loss 2.9352 (3.0130)	Entropy 0.71970 (0.72689)	Top-1 acc 56.790 (51.682)	Top-5 acc 74.074 (74.748)	lr 0.02037
==========Valid [34/120]	loss 1.727	top-1 acc 60.970 (60.970)	top-5 acc 82.674	Train top-1 51.682	top-5 74.748	Entropy 0.71970	Latency-None: 0.000ms	Flops: 539.76M
Train [35][0/3239]	Time 28.308 (28.308)	Data Time 25.762 (25.762)	Loss 3.1859 (3.1859)	Entropy 0.71993 (0.71993)	Top-1 acc 48.828 (48.828)	Top-5 acc 68.750 (68.750)	lr 0.02037
Train [35][10/3239]	Time 0.227 (3.137)	Data Time 0.001 (2.346)	Loss 2.9041 (3.0318)	Entropy 0.71977 (0.71997)	Top-1 acc 53.906 (50.036)	Top-5 acc 76.953 (74.574)	lr 0.02037
Train [35][20/3239]	Time 0.240 (1.835)	Data Time 0.001 (1.230)	Loss 3.0029 (3.0523)	Entropy 0.71982 (0.71988)	Top-1 acc 52.344 (49.833)	Top-5 acc 72.656 (73.828)	lr 0.02036
Train [35][30/3239]	Time 0.262 (1.379)	Data Time 0.001 (0.834)	Loss 2.8119 (3.0382)	Entropy 0.71967 (0.71987)	Top-1 acc 57.422 (50.743)	Top-5 acc 78.125 (74.055)	lr 0.02036
Train [35][40/3239]	Time 0.250 (1.146)	Data Time 0.001 (0.631)	Loss 3.0347 (3.0255)	Entropy 0.71975 (0.71981)	Top-1 acc 49.609 (51.086)	Top-5 acc 76.172 (74.276)	lr 0.02036
Train [35][50/3239]	Time 0.269 (1.004)	Data Time 0.002 (0.507)	Loss 2.9411 (3.0213)	Entropy 0.71981 (0.71980)	Top-1 acc 54.688 (51.287)	Top-5 acc 76.172 (74.395)	lr 0.02036
Train [35][60/3239]	Time 0.251 (0.910)	Data Time 0.001 (0.425)	Loss 3.1251 (3.0281)	Entropy 0.72002 (0.71982)	Top-1 acc 49.219 (51.050)	Top-5 acc 70.703 (74.321)	lr 0.02036
Train [35][70/3239]	Time 0.281 (0.844)	Data Time 0.001 (0.365)	Loss 2.9130 (3.0212)	Entropy 0.72037 (0.71987)	Top-1 acc 55.469 (51.238)	Top-5 acc 75.391 (74.532)	lr 0.02036
Train [35][80/3239]	Time 0.234 (0.791)	Data Time 0.001 (0.320)	Loss 3.0837 (3.0220)	Entropy 0.72039 (0.71993)	Top-1 acc 46.484 (51.254)	Top-5 acc 75.781 (74.537)	lr 0.02036
Train [35][90/3239]	Time 0.342 (0.750)	Data Time 0.001 (0.285)	Loss 3.0276 (3.0214)	Entropy 0.72045 (0.71999)	Top-1 acc 51.562 (51.361)	Top-5 acc 72.266 (74.554)	lr 0.02036
Train [35][100/3239]	Time 0.236 (0.716)	Data Time 0.001 (0.257)	Loss 2.8494 (3.0115)	Entropy 0.72042 (0.72003)	Top-1 acc 54.688 (51.725)	Top-5 acc 80.469 (74.752)	lr 0.02036
Train [35][110/3239]	Time 0.229 (0.689)	Data Time 0.001 (0.234)	Loss 2.8238 (3.0109)	Entropy 0.72047 (0.72007)	Top-1 acc 53.906 (51.735)	Top-5 acc 80.078 (74.722)	lr 0.02036
Train [35][120/3239]	Time 0.225 (0.667)	Data Time 0.001 (0.215)	Loss 2.9612 (3.0076)	Entropy 0.72024 (0.72009)	Top-1 acc 51.172 (51.740)	Top-5 acc 78.516 (74.748)	lr 0.02036
Train [35][130/3239]	Time 0.228 (0.648)	Data Time 0.001 (0.199)	Loss 3.0267 (3.0046)	Entropy 0.72007 (0.72010)	Top-1 acc 55.859 (51.804)	Top-5 acc 75.391 (74.788)	lr 0.02036
Train [35][140/3239]	Time 0.232 (0.631)	Data Time 0.001 (0.185)	Loss 2.8362 (3.0024)	Entropy 0.71976 (0.72008)	Top-1 acc 55.078 (51.801)	Top-5 acc 80.078 (74.850)	lr 0.02036
Train [35][150/3239]	Time 0.231 (0.617)	Data Time 0.001 (0.173)	Loss 2.9554 (3.0016)	Entropy 0.71951 (0.72006)	Top-1 acc 53.906 (51.829)	Top-5 acc 76.172 (74.873)	lr 0.02035
Train [35][160/3239]	Time 0.336 (0.604)	Data Time 0.001 (0.162)	Loss 2.9730 (3.0002)	Entropy 0.71958 (0.72002)	Top-1 acc 55.469 (51.856)	Top-5 acc 75.391 (74.944)	lr 0.02035
Train [35][170/3239]	Time 0.232 (0.593)	Data Time 0.001 (0.153)	Loss 3.0648 (2.9986)	Entropy 0.71957 (0.72000)	Top-1 acc 53.125 (51.898)	Top-5 acc 74.609 (75.027)	lr 0.02035
Train [35][180/3239]	Time 0.233 (0.583)	Data Time 0.001 (0.144)	Loss 3.0373 (2.9988)	Entropy 0.71990 (0.71998)	Top-1 acc 52.734 (51.903)	Top-5 acc 73.828 (75.006)	lr 0.02035
Train [35][190/3239]	Time 0.238 (0.575)	Data Time 0.001 (0.137)	Loss 3.2037 (2.9984)	Entropy 0.71946 (0.71997)	Top-1 acc 46.094 (51.935)	Top-5 acc 70.703 (74.961)	lr 0.02035
Train [35][200/3239]	Time 0.237 (0.566)	Data Time 0.002 (0.130)	Loss 3.0778 (2.9982)	Entropy 0.71976 (0.71995)	Top-1 acc 51.172 (51.980)	Top-5 acc 70.703 (74.938)	lr 0.02035
Train [35][210/3239]	Time 0.273 (0.560)	Data Time 0.003 (0.124)	Loss 3.1604 (2.9980)	Entropy 0.71965 (0.71994)	Top-1 acc 49.219 (51.979)	Top-5 acc 71.875 (74.930)	lr 0.02035
Train [35][220/3239]	Time 0.248 (0.553)	Data Time 0.001 (0.118)	Loss 2.8951 (3.0005)	Entropy 0.72004 (0.71993)	Top-1 acc 55.859 (51.921)	Top-5 acc 77.344 (74.862)	lr 0.02035
Train [35][230/3239]	Time 0.263 (0.548)	Data Time 0.001 (0.113)	Loss 2.8739 (2.9995)	Entropy 0.71967 (0.71993)	Top-1 acc 54.688 (51.928)	Top-5 acc 75.391 (74.850)	lr 0.02035
Train [35][240/3239]	Time 0.248 (0.543)	Data Time 0.001 (0.109)	Loss 2.7554 (2.9999)	Entropy 0.71983 (0.71992)	Top-1 acc 53.516 (51.887)	Top-5 acc 81.641 (74.846)	lr 0.02035
Train [35][250/3239]	Time 0.337 (0.538)	Data Time 0.001 (0.105)	Loss 2.9388 (2.9979)	Entropy 0.71989 (0.71992)	Top-1 acc 54.297 (51.955)	Top-5 acc 76.562 (74.894)	lr 0.02035
Train [35][260/3239]	Time 0.231 (0.533)	Data Time 0.001 (0.101)	Loss 3.0898 (2.9969)	Entropy 0.71988 (0.71992)	Top-1 acc 49.219 (51.977)	Top-5 acc 72.656 (74.943)	lr 0.02035
Train [35][270/3239]	Time 0.238 (0.528)	Data Time 0.001 (0.097)	Loss 2.9295 (2.9941)	Entropy 0.71973 (0.71992)	Top-1 acc 54.297 (52.055)	Top-5 acc 78.516 (75.029)	lr 0.02035
Train [35][280/3239]	Time 0.218 (0.524)	Data Time 0.001 (0.094)	Loss 3.0557 (2.9927)	Entropy 0.71959 (0.71991)	Top-1 acc 50.391 (52.113)	Top-5 acc 76.562 (75.078)	lr 0.02034
Train [35][290/3239]	Time 0.237 (0.520)	Data Time 0.001 (0.090)	Loss 3.0920 (2.9938)	Entropy 0.71984 (0.71990)	Top-1 acc 48.438 (52.102)	Top-5 acc 75.000 (75.056)	lr 0.02034
Train [35][300/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.087)	Loss 3.1340 (2.9932)	Entropy 0.71953 (0.71989)	Top-1 acc 48.438 (52.106)	Top-5 acc 69.531 (75.047)	lr 0.02034
Train [35][310/3239]	Time 0.236 (0.512)	Data Time 0.001 (0.085)	Loss 2.9931 (2.9918)	Entropy 0.71947 (0.71988)	Top-1 acc 51.562 (52.137)	Top-5 acc 74.609 (75.055)	lr 0.02034
Train [35][320/3239]	Time 0.329 (0.509)	Data Time 0.001 (0.082)	Loss 2.9020 (2.9929)	Entropy 0.71972 (0.71987)	Top-1 acc 55.859 (52.108)	Top-5 acc 74.219 (75.001)	lr 0.02034
Train [35][330/3239]	Time 0.239 (0.506)	Data Time 0.001 (0.080)	Loss 3.0358 (2.9947)	Entropy 0.72014 (0.71987)	Top-1 acc 49.609 (52.061)	Top-5 acc 74.609 (74.986)	lr 0.02034
Train [35][340/3239]	Time 0.264 (0.503)	Data Time 0.001 (0.077)	Loss 2.9441 (2.9952)	Entropy 0.72000 (0.71988)	Top-1 acc 52.734 (52.038)	Top-5 acc 73.828 (74.973)	lr 0.02034
Train [35][350/3239]	Time 0.221 (0.501)	Data Time 0.001 (0.075)	Loss 2.8642 (2.9967)	Entropy 0.71961 (0.71988)	Top-1 acc 57.031 (52.010)	Top-5 acc 77.344 (74.905)	lr 0.02034
Train [35][360/3239]	Time 0.237 (0.498)	Data Time 0.001 (0.073)	Loss 3.1341 (2.9981)	Entropy 0.71961 (0.71987)	Top-1 acc 47.266 (51.980)	Top-5 acc 68.359 (74.859)	lr 0.02034
Train [35][370/3239]	Time 0.222 (0.496)	Data Time 0.001 (0.071)	Loss 2.8816 (2.9971)	Entropy 0.71968 (0.71987)	Top-1 acc 55.859 (52.043)	Top-5 acc 76.953 (74.884)	lr 0.02034
Train [35][380/3239]	Time 0.235 (0.493)	Data Time 0.001 (0.069)	Loss 3.0353 (2.9968)	Entropy 0.71957 (0.71986)	Top-1 acc 51.953 (52.022)	Top-5 acc 73.828 (74.904)	lr 0.02034
Train [35][390/3239]	Time 0.257 (0.491)	Data Time 0.001 (0.068)	Loss 2.9048 (2.9976)	Entropy 0.71974 (0.71985)	Top-1 acc 55.469 (52.010)	Top-5 acc 76.953 (74.886)	lr 0.02034
Train [35][400/3239]	Time 0.232 (0.489)	Data Time 0.001 (0.066)	Loss 3.1056 (2.9977)	Entropy 0.71978 (0.71985)	Top-1 acc 48.047 (52.018)	Top-5 acc 73.438 (74.884)	lr 0.02034
Train [35][410/3239]	Time 0.260 (0.487)	Data Time 0.001 (0.064)	Loss 2.9640 (2.9974)	Entropy 0.71990 (0.71985)	Top-1 acc 50.391 (51.999)	Top-5 acc 74.609 (74.880)	lr 0.02033
Train [35][420/3239]	Time 0.236 (0.485)	Data Time 0.001 (0.063)	Loss 2.9179 (2.9974)	Entropy 0.72010 (0.71985)	Top-1 acc 55.469 (52.020)	Top-5 acc 77.734 (74.880)	lr 0.02033
Train [35][430/3239]	Time 0.236 (0.483)	Data Time 0.001 (0.062)	Loss 3.2431 (2.9971)	Entropy 0.71988 (0.71986)	Top-1 acc 48.438 (52.046)	Top-5 acc 69.141 (74.893)	lr 0.02033
Train [35][440/3239]	Time 0.227 (0.482)	Data Time 0.001 (0.060)	Loss 2.9347 (2.9968)	Entropy 0.72013 (0.71986)	Top-1 acc 52.734 (52.057)	Top-5 acc 75.781 (74.923)	lr 0.02033
Train [35][450/3239]	Time 0.242 (0.480)	Data Time 0.001 (0.059)	Loss 2.8986 (2.9956)	Entropy 0.71999 (0.71987)	Top-1 acc 54.297 (52.100)	Top-5 acc 77.344 (74.955)	lr 0.02033
Train [35][460/3239]	Time 0.232 (0.478)	Data Time 0.001 (0.058)	Loss 3.2466 (2.9956)	Entropy 0.71997 (0.71987)	Top-1 acc 44.531 (52.080)	Top-5 acc 74.609 (74.963)	lr 0.02033
Train [35][470/3239]	Time 0.236 (0.477)	Data Time 0.001 (0.056)	Loss 2.7050 (2.9950)	Entropy 0.72005 (0.71987)	Top-1 acc 60.156 (52.081)	Top-5 acc 80.078 (74.980)	lr 0.02033
Train [35][480/3239]	Time 0.321 (0.475)	Data Time 0.001 (0.055)	Loss 3.2893 (2.9974)	Entropy 0.72002 (0.71987)	Top-1 acc 41.797 (52.014)	Top-5 acc 70.703 (74.940)	lr 0.02033
Train [35][490/3239]	Time 0.223 (0.474)	Data Time 0.001 (0.054)	Loss 3.0364 (2.9978)	Entropy 0.72012 (0.71988)	Top-1 acc 49.609 (52.000)	Top-5 acc 75.000 (74.922)	lr 0.02033
Train [35][500/3239]	Time 0.238 (0.472)	Data Time 0.003 (0.053)	Loss 3.0341 (2.9969)	Entropy 0.72030 (0.71989)	Top-1 acc 50.781 (52.023)	Top-5 acc 73.828 (74.945)	lr 0.02033
Train [35][510/3239]	Time 0.272 (0.527)	Data Time 0.002 (0.052)	Loss 3.0109 (2.9981)	Entropy 0.71976 (0.71989)	Top-1 acc 53.125 (52.001)	Top-5 acc 72.266 (74.911)	lr 0.02033
Train [35][520/3239]	Time 0.272 (0.525)	Data Time 0.002 (0.051)	Loss 3.0701 (2.9983)	Entropy 0.72001 (0.71989)	Top-1 acc 50.000 (51.994)	Top-5 acc 75.000 (74.918)	lr 0.02033
Train [35][530/3239]	Time 0.232 (0.523)	Data Time 0.001 (0.050)	Loss 2.9402 (2.9987)	Entropy 0.71990 (0.71989)	Top-1 acc 51.172 (51.966)	Top-5 acc 73.828 (74.912)	lr 0.02032
Train [35][540/3239]	Time 0.230 (0.521)	Data Time 0.002 (0.049)	Loss 2.9136 (2.9976)	Entropy 0.71962 (0.71989)	Top-1 acc 46.875 (51.979)	Top-5 acc 79.297 (74.941)	lr 0.02032
Train [35][550/3239]	Time 0.254 (0.519)	Data Time 0.001 (0.049)	Loss 2.8150 (2.9981)	Entropy 0.71955 (0.71988)	Top-1 acc 57.422 (51.962)	Top-5 acc 80.078 (74.945)	lr 0.02032
Train [35][560/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.048)	Loss 3.0112 (2.9984)	Entropy 0.71956 (0.71988)	Top-1 acc 53.906 (51.975)	Top-5 acc 71.484 (74.930)	lr 0.02032
Train [35][570/3239]	Time 0.240 (0.514)	Data Time 0.001 (0.047)	Loss 3.0492 (2.9983)	Entropy 0.71955 (0.71987)	Top-1 acc 49.219 (51.983)	Top-5 acc 73.828 (74.916)	lr 0.02032
Train [35][580/3239]	Time 0.229 (0.512)	Data Time 0.001 (0.046)	Loss 3.0339 (2.9977)	Entropy 0.71939 (0.71986)	Top-1 acc 50.781 (51.982)	Top-5 acc 71.484 (74.935)	lr 0.02032
Train [35][590/3239]	Time 0.234 (0.511)	Data Time 0.001 (0.045)	Loss 3.1570 (2.9990)	Entropy 0.71921 (0.71986)	Top-1 acc 51.172 (51.966)	Top-5 acc 72.266 (74.900)	lr 0.02032
Train [35][600/3239]	Time 0.231 (0.509)	Data Time 0.001 (0.045)	Loss 2.9801 (2.9983)	Entropy 0.71911 (0.71985)	Top-1 acc 53.516 (51.983)	Top-5 acc 74.219 (74.919)	lr 0.02032
Train [35][610/3239]	Time 0.230 (0.507)	Data Time 0.001 (0.044)	Loss 3.0319 (2.9994)	Entropy 0.71891 (0.71983)	Top-1 acc 53.125 (51.970)	Top-5 acc 73.438 (74.897)	lr 0.02032
Train [35][620/3239]	Time 0.265 (0.506)	Data Time 0.001 (0.043)	Loss 3.0006 (2.9991)	Entropy 0.71880 (0.71982)	Top-1 acc 53.125 (51.978)	Top-5 acc 75.781 (74.919)	lr 0.02032
Train [35][630/3239]	Time 0.235 (0.504)	Data Time 0.001 (0.043)	Loss 2.8236 (2.9996)	Entropy 0.71854 (0.71980)	Top-1 acc 55.469 (51.961)	Top-5 acc 79.688 (74.920)	lr 0.02032
Train [35][640/3239]	Time 0.324 (0.502)	Data Time 0.002 (0.042)	Loss 3.0348 (2.9992)	Entropy 0.71868 (0.71978)	Top-1 acc 54.297 (51.975)	Top-5 acc 71.484 (74.937)	lr 0.02032
Train [35][650/3239]	Time 0.225 (0.501)	Data Time 0.001 (0.041)	Loss 2.8058 (2.9982)	Entropy 0.71889 (0.71977)	Top-1 acc 55.078 (51.993)	Top-5 acc 78.906 (74.959)	lr 0.02032
Train [35][660/3239]	Time 0.235 (0.499)	Data Time 0.001 (0.041)	Loss 3.0960 (2.9980)	Entropy 0.71912 (0.71976)	Top-1 acc 51.172 (52.005)	Top-5 acc 71.875 (74.962)	lr 0.02031
Train [35][670/3239]	Time 0.235 (0.498)	Data Time 0.001 (0.040)	Loss 2.9868 (2.9979)	Entropy 0.71920 (0.71975)	Top-1 acc 53.125 (52.004)	Top-5 acc 75.391 (74.973)	lr 0.02031
Train [35][680/3239]	Time 0.224 (0.497)	Data Time 0.001 (0.040)	Loss 2.9190 (2.9977)	Entropy 0.71873 (0.71974)	Top-1 acc 54.688 (51.993)	Top-5 acc 79.297 (74.974)	lr 0.02031
Train [35][690/3239]	Time 0.227 (0.496)	Data Time 0.001 (0.039)	Loss 3.0095 (2.9981)	Entropy 0.71857 (0.71972)	Top-1 acc 52.734 (51.980)	Top-5 acc 74.609 (74.973)	lr 0.02031
Train [35][700/3239]	Time 0.227 (0.494)	Data Time 0.001 (0.038)	Loss 3.0104 (2.9981)	Entropy 0.71846 (0.71971)	Top-1 acc 52.734 (51.967)	Top-5 acc 76.172 (74.970)	lr 0.02031
Train [35][710/3239]	Time 0.321 (0.493)	Data Time 0.001 (0.038)	Loss 3.0126 (2.9982)	Entropy 0.71843 (0.71969)	Top-1 acc 50.000 (51.963)	Top-5 acc 75.391 (74.979)	lr 0.02031
Train [35][720/3239]	Time 0.225 (0.492)	Data Time 0.001 (0.037)	Loss 2.8463 (2.9979)	Entropy 0.71837 (0.71967)	Top-1 acc 58.594 (51.967)	Top-5 acc 78.125 (74.979)	lr 0.02031
Train [35][730/3239]	Time 0.237 (0.491)	Data Time 0.001 (0.037)	Loss 3.0102 (2.9975)	Entropy 0.71837 (0.71965)	Top-1 acc 48.438 (51.971)	Top-5 acc 73.828 (74.990)	lr 0.02031
Train [35][740/3239]	Time 0.220 (0.490)	Data Time 0.001 (0.036)	Loss 3.1890 (2.9973)	Entropy 0.71823 (0.71963)	Top-1 acc 51.172 (51.987)	Top-5 acc 70.703 (74.992)	lr 0.02031
Train [35][750/3239]	Time 0.231 (0.488)	Data Time 0.001 (0.036)	Loss 3.1256 (2.9977)	Entropy 0.71823 (0.71962)	Top-1 acc 48.438 (51.969)	Top-5 acc 71.875 (74.990)	lr 0.02031
Train [35][760/3239]	Time 0.215 (0.487)	Data Time 0.001 (0.036)	Loss 3.0184 (2.9984)	Entropy 0.71814 (0.71960)	Top-1 acc 50.391 (51.955)	Top-5 acc 75.391 (74.980)	lr 0.02031
Train [35][770/3239]	Time 0.231 (0.486)	Data Time 0.001 (0.035)	Loss 2.7685 (2.9982)	Entropy 0.71740 (0.71958)	Top-1 acc 55.078 (51.959)	Top-5 acc 80.078 (74.993)	lr 0.02031
Train [35][780/3239]	Time 0.266 (0.485)	Data Time 0.001 (0.035)	Loss 3.3852 (2.9994)	Entropy 0.71676 (0.71954)	Top-1 acc 41.797 (51.939)	Top-5 acc 68.359 (74.969)	lr 0.02031
Train [35][790/3239]	Time 0.223 (0.484)	Data Time 0.001 (0.034)	Loss 2.9379 (2.9995)	Entropy 0.71700 (0.71951)	Top-1 acc 55.078 (51.941)	Top-5 acc 76.953 (74.967)	lr 0.02030
Train [35][800/3239]	Time 0.320 (0.483)	Data Time 0.001 (0.034)	Loss 2.9958 (2.9990)	Entropy 0.71693 (0.71948)	Top-1 acc 51.953 (51.946)	Top-5 acc 74.219 (74.978)	lr 0.02030
Train [35][810/3239]	Time 0.236 (0.482)	Data Time 0.001 (0.033)	Loss 2.9866 (2.9989)	Entropy 0.71705 (0.71945)	Top-1 acc 50.781 (51.938)	Top-5 acc 73.438 (74.982)	lr 0.02030
Train [35][820/3239]	Time 0.223 (0.481)	Data Time 0.001 (0.033)	Loss 3.0966 (2.9977)	Entropy 0.71714 (0.71942)	Top-1 acc 50.781 (51.971)	Top-5 acc 73.828 (75.005)	lr 0.02030
Train [35][830/3239]	Time 0.242 (0.480)	Data Time 0.001 (0.033)	Loss 2.8616 (2.9971)	Entropy 0.71730 (0.71939)	Top-1 acc 58.984 (51.984)	Top-5 acc 78.125 (75.026)	lr 0.02030
Train [35][840/3239]	Time 0.217 (0.479)	Data Time 0.001 (0.032)	Loss 2.9559 (2.9972)	Entropy 0.71715 (0.71936)	Top-1 acc 54.688 (51.985)	Top-5 acc 76.953 (75.028)	lr 0.02030
Train [35][850/3239]	Time 0.227 (0.478)	Data Time 0.001 (0.032)	Loss 3.0484 (2.9975)	Entropy 0.71709 (0.71934)	Top-1 acc 47.266 (51.964)	Top-5 acc 76.172 (75.022)	lr 0.02030
Train [35][860/3239]	Time 0.236 (0.477)	Data Time 0.001 (0.032)	Loss 2.8986 (2.9974)	Entropy 0.71717 (0.71931)	Top-1 acc 54.297 (51.973)	Top-5 acc 77.734 (75.029)	lr 0.02030
Train [35][870/3239]	Time 0.310 (0.477)	Data Time 0.001 (0.031)	Loss 2.8391 (2.9968)	Entropy 0.71710 (0.71929)	Top-1 acc 51.172 (51.971)	Top-5 acc 80.078 (75.040)	lr 0.02030
Train [35][880/3239]	Time 0.237 (0.476)	Data Time 0.001 (0.031)	Loss 2.7948 (2.9962)	Entropy 0.71726 (0.71926)	Top-1 acc 53.516 (51.984)	Top-5 acc 77.734 (75.044)	lr 0.02030
Train [35][890/3239]	Time 0.219 (0.475)	Data Time 0.001 (0.031)	Loss 2.9202 (2.9959)	Entropy 0.71704 (0.71924)	Top-1 acc 57.031 (51.999)	Top-5 acc 75.781 (75.053)	lr 0.02030
Train [35][900/3239]	Time 0.231 (0.474)	Data Time 0.001 (0.030)	Loss 2.8973 (2.9960)	Entropy 0.71653 (0.71921)	Top-1 acc 53.516 (51.988)	Top-5 acc 77.344 (75.040)	lr 0.02030
Train [35][910/3239]	Time 0.222 (0.473)	Data Time 0.001 (0.030)	Loss 2.9003 (2.9951)	Entropy 0.71658 (0.71919)	Top-1 acc 53.516 (52.004)	Top-5 acc 70.312 (75.051)	lr 0.02029
Train [35][920/3239]	Time 0.234 (0.472)	Data Time 0.001 (0.030)	Loss 3.1834 (2.9943)	Entropy 0.71665 (0.71916)	Top-1 acc 43.750 (52.008)	Top-5 acc 69.141 (75.072)	lr 0.02029
Train [35][930/3239]	Time 0.229 (0.471)	Data Time 0.001 (0.029)	Loss 3.1192 (2.9945)	Entropy 0.71662 (0.71913)	Top-1 acc 50.781 (52.008)	Top-5 acc 72.656 (75.068)	lr 0.02029
Train [35][940/3239]	Time 0.237 (0.471)	Data Time 0.001 (0.029)	Loss 2.9547 (2.9946)	Entropy 0.71639 (0.71910)	Top-1 acc 56.641 (52.011)	Top-5 acc 76.172 (75.064)	lr 0.02029
Train [35][950/3239]	Time 0.226 (0.470)	Data Time 0.001 (0.029)	Loss 3.1202 (2.9950)	Entropy 0.71622 (0.71907)	Top-1 acc 48.828 (52.000)	Top-5 acc 73.438 (75.060)	lr 0.02029
Train [35][960/3239]	Time 0.310 (0.469)	Data Time 0.001 (0.029)	Loss 2.7009 (2.9947)	Entropy 0.71608 (0.71904)	Top-1 acc 60.547 (52.005)	Top-5 acc 80.469 (75.070)	lr 0.02029
Train [35][970/3239]	Time 0.232 (0.468)	Data Time 0.001 (0.028)	Loss 2.9983 (2.9946)	Entropy 0.71599 (0.71901)	Top-1 acc 53.906 (52.002)	Top-5 acc 76.562 (75.074)	lr 0.02029
Train [35][980/3239]	Time 0.217 (0.467)	Data Time 0.001 (0.028)	Loss 2.9045 (2.9945)	Entropy 0.71606 (0.71898)	Top-1 acc 55.078 (52.012)	Top-5 acc 79.297 (75.076)	lr 0.02029
Train [35][990/3239]	Time 0.230 (0.467)	Data Time 0.001 (0.028)	Loss 3.0749 (2.9946)	Entropy 0.71568 (0.71895)	Top-1 acc 47.266 (52.000)	Top-5 acc 75.781 (75.081)	lr 0.02029
Train [35][1000/3239]	Time 0.228 (0.466)	Data Time 0.001 (0.027)	Loss 3.0846 (2.9940)	Entropy 0.71599 (0.71892)	Top-1 acc 49.219 (52.017)	Top-5 acc 72.266 (75.092)	lr 0.02029
Train [35][1010/3239]	Time 0.240 (0.465)	Data Time 0.001 (0.027)	Loss 2.6891 (2.9929)	Entropy 0.71588 (0.71889)	Top-1 acc 56.250 (52.035)	Top-5 acc 82.422 (75.114)	lr 0.02029
Train [35][1020/3239]	Time 0.229 (0.465)	Data Time 0.001 (0.027)	Loss 2.8666 (2.9925)	Entropy 0.71572 (0.71886)	Top-1 acc 58.984 (52.052)	Top-5 acc 78.906 (75.125)	lr 0.02029
Train [35][1030/3239]	Time 0.315 (0.464)	Data Time 0.001 (0.027)	Loss 3.0394 (2.9931)	Entropy 0.71509 (0.71883)	Top-1 acc 55.078 (52.040)	Top-5 acc 74.609 (75.117)	lr 0.02029
Train [35][1040/3239]	Time 0.230 (0.463)	Data Time 0.001 (0.026)	Loss 3.0397 (2.9937)	Entropy 0.71525 (0.71879)	Top-1 acc 52.344 (52.027)	Top-5 acc 73.828 (75.102)	lr 0.02028
Train [35][1050/3239]	Time 0.233 (0.463)	Data Time 0.001 (0.026)	Loss 2.9420 (2.9938)	Entropy 0.71512 (0.71876)	Top-1 acc 53.906 (52.017)	Top-5 acc 75.781 (75.103)	lr 0.02028
Train [35][1060/3239]	Time 0.224 (0.462)	Data Time 0.001 (0.026)	Loss 2.9627 (2.9938)	Entropy 0.71504 (0.71872)	Top-1 acc 55.078 (52.025)	Top-5 acc 76.953 (75.100)	lr 0.02028
Train [35][1070/3239]	Time 0.218 (0.461)	Data Time 0.001 (0.026)	Loss 3.0306 (2.9938)	Entropy 0.71472 (0.71869)	Top-1 acc 51.562 (52.031)	Top-5 acc 73.438 (75.100)	lr 0.02028
Train [35][1080/3239]	Time 0.236 (0.461)	Data Time 0.001 (0.026)	Loss 2.9599 (2.9938)	Entropy 0.71475 (0.71865)	Top-1 acc 51.172 (52.031)	Top-5 acc 74.219 (75.097)	lr 0.02028
Train [35][1090/3239]	Time 0.225 (0.460)	Data Time 0.001 (0.025)	Loss 2.8533 (2.9941)	Entropy 0.71478 (0.71861)	Top-1 acc 54.688 (52.035)	Top-5 acc 76.953 (75.089)	lr 0.02028
Train [35][1100/3239]	Time 0.264 (0.460)	Data Time 0.001 (0.025)	Loss 2.9323 (2.9936)	Entropy 0.71443 (0.71858)	Top-1 acc 53.906 (52.046)	Top-5 acc 71.875 (75.093)	lr 0.02028
Train [35][1110/3239]	Time 0.259 (0.459)	Data Time 0.001 (0.025)	Loss 3.0016 (2.9940)	Entropy 0.71419 (0.71854)	Top-1 acc 50.000 (52.039)	Top-5 acc 76.172 (75.091)	lr 0.02028
Train [35][1120/3239]	Time 0.228 (0.459)	Data Time 0.001 (0.025)	Loss 3.0629 (2.9942)	Entropy 0.71419 (0.71850)	Top-1 acc 45.703 (52.020)	Top-5 acc 76.953 (75.089)	lr 0.02028
Train [35][1130/3239]	Time 0.233 (0.458)	Data Time 0.001 (0.024)	Loss 2.8561 (2.9944)	Entropy 0.71415 (0.71846)	Top-1 acc 60.938 (52.025)	Top-5 acc 82.031 (75.093)	lr 0.02028
Train [35][1140/3239]	Time 0.235 (0.458)	Data Time 0.001 (0.024)	Loss 2.8926 (2.9937)	Entropy 0.71406 (0.71843)	Top-1 acc 59.375 (52.041)	Top-5 acc 76.172 (75.100)	lr 0.02028
Train [35][1150/3239]	Time 0.234 (0.457)	Data Time 0.001 (0.024)	Loss 3.0217 (2.9939)	Entropy 0.71406 (0.71839)	Top-1 acc 50.781 (52.044)	Top-5 acc 73.438 (75.095)	lr 0.02028
Train [35][1160/3239]	Time 0.286 (0.481)	Data Time 0.003 (0.024)	Loss 3.1754 (2.9942)	Entropy 0.71350 (0.71835)	Top-1 acc 48.047 (52.033)	Top-5 acc 70.703 (75.085)	lr 0.02028
Train [35][1170/3239]	Time 0.245 (0.481)	Data Time 0.002 (0.024)	Loss 3.0259 (2.9944)	Entropy 0.71354 (0.71831)	Top-1 acc 53.125 (52.021)	Top-5 acc 71.875 (75.084)	lr 0.02027
Train [35][1180/3239]	Time 0.236 (0.480)	Data Time 0.001 (0.024)	Loss 3.1267 (2.9939)	Entropy 0.71359 (0.71827)	Top-1 acc 49.609 (52.037)	Top-5 acc 75.391 (75.096)	lr 0.02027
Train [35][1190/3239]	Time 0.323 (0.479)	Data Time 0.001 (0.023)	Loss 3.0342 (2.9937)	Entropy 0.71355 (0.71823)	Top-1 acc 49.219 (52.043)	Top-5 acc 73.047 (75.102)	lr 0.02027
Train [35][1200/3239]	Time 0.230 (0.479)	Data Time 0.001 (0.023)	Loss 2.8876 (2.9933)	Entropy 0.71359 (0.71819)	Top-1 acc 54.297 (52.054)	Top-5 acc 77.734 (75.118)	lr 0.02027
Train [35][1210/3239]	Time 0.231 (0.478)	Data Time 0.001 (0.023)	Loss 3.1434 (2.9936)	Entropy 0.71399 (0.71815)	Top-1 acc 51.172 (52.057)	Top-5 acc 72.266 (75.115)	lr 0.02027
Train [35][1220/3239]	Time 0.244 (0.478)	Data Time 0.001 (0.023)	Loss 2.9032 (2.9936)	Entropy 0.71389 (0.71812)	Top-1 acc 55.078 (52.056)	Top-5 acc 79.688 (75.122)	lr 0.02027
Train [35][1230/3239]	Time 0.230 (0.477)	Data Time 0.001 (0.023)	Loss 2.7860 (2.9931)	Entropy 0.71413 (0.71809)	Top-1 acc 53.125 (52.066)	Top-5 acc 78.516 (75.134)	lr 0.02027
Train [35][1240/3239]	Time 0.247 (0.477)	Data Time 0.001 (0.022)	Loss 2.8633 (2.9930)	Entropy 0.71393 (0.71805)	Top-1 acc 56.641 (52.071)	Top-5 acc 79.688 (75.144)	lr 0.02027
Train [35][1250/3239]	Time 0.235 (0.476)	Data Time 0.001 (0.022)	Loss 3.1552 (2.9932)	Entropy 0.71407 (0.71802)	Top-1 acc 48.828 (52.063)	Top-5 acc 70.703 (75.142)	lr 0.02027
Train [35][1260/3239]	Time 0.231 (0.475)	Data Time 0.001 (0.022)	Loss 3.3783 (2.9936)	Entropy 0.71410 (0.71799)	Top-1 acc 46.484 (52.066)	Top-5 acc 64.453 (75.132)	lr 0.02027
Train [35][1270/3239]	Time 0.224 (0.475)	Data Time 0.001 (0.022)	Loss 2.9906 (2.9933)	Entropy 0.71361 (0.71796)	Top-1 acc 51.172 (52.069)	Top-5 acc 74.609 (75.136)	lr 0.02027
Train [35][1280/3239]	Time 0.248 (0.474)	Data Time 0.001 (0.022)	Loss 3.0911 (2.9934)	Entropy 0.71386 (0.71792)	Top-1 acc 50.781 (52.070)	Top-5 acc 71.875 (75.131)	lr 0.02027
Train [35][1290/3239]	Time 0.227 (0.474)	Data Time 0.001 (0.022)	Loss 3.1963 (2.9934)	Entropy 0.71405 (0.71789)	Top-1 acc 47.266 (52.067)	Top-5 acc 71.484 (75.133)	lr 0.02026
Train [35][1300/3239]	Time 0.233 (0.473)	Data Time 0.001 (0.021)	Loss 2.8897 (2.9938)	Entropy 0.71393 (0.71786)	Top-1 acc 51.562 (52.056)	Top-5 acc 76.562 (75.124)	lr 0.02026
Train [35][1310/3239]	Time 0.232 (0.473)	Data Time 0.001 (0.021)	Loss 2.8190 (2.9934)	Entropy 0.71368 (0.71783)	Top-1 acc 55.078 (52.065)	Top-5 acc 80.859 (75.134)	lr 0.02026
Train [35][1320/3239]	Time 0.226 (0.472)	Data Time 0.001 (0.021)	Loss 2.9901 (2.9931)	Entropy 0.71349 (0.71780)	Top-1 acc 51.953 (52.075)	Top-5 acc 75.781 (75.135)	lr 0.02026
Train [35][1330/3239]	Time 0.227 (0.472)	Data Time 0.001 (0.021)	Loss 3.0047 (2.9934)	Entropy 0.71297 (0.71777)	Top-1 acc 55.078 (52.073)	Top-5 acc 75.781 (75.130)	lr 0.02026
Train [35][1340/3239]	Time 0.236 (0.471)	Data Time 0.001 (0.021)	Loss 2.6730 (2.9931)	Entropy 0.71287 (0.71773)	Top-1 acc 59.766 (52.079)	Top-5 acc 82.422 (75.140)	lr 0.02026
Train [35][1350/3239]	Time 0.322 (0.471)	Data Time 0.001 (0.021)	Loss 2.8995 (2.9927)	Entropy 0.71278 (0.71770)	Top-1 acc 53.906 (52.086)	Top-5 acc 75.781 (75.147)	lr 0.02026
Train [35][1360/3239]	Time 0.230 (0.470)	Data Time 0.001 (0.021)	Loss 2.8234 (2.9926)	Entropy 0.71301 (0.71766)	Top-1 acc 53.906 (52.088)	Top-5 acc 78.125 (75.150)	lr 0.02026
Train [35][1370/3239]	Time 0.225 (0.470)	Data Time 0.001 (0.020)	Loss 3.0443 (2.9926)	Entropy 0.71291 (0.71763)	Top-1 acc 50.391 (52.087)	Top-5 acc 72.656 (75.149)	lr 0.02026
Train [35][1380/3239]	Time 0.235 (0.469)	Data Time 0.001 (0.020)	Loss 3.0131 (2.9924)	Entropy 0.71286 (0.71759)	Top-1 acc 51.953 (52.091)	Top-5 acc 75.781 (75.159)	lr 0.02026
Train [35][1390/3239]	Time 0.235 (0.469)	Data Time 0.001 (0.020)	Loss 3.2594 (2.9929)	Entropy 0.71300 (0.71756)	Top-1 acc 48.047 (52.076)	Top-5 acc 68.750 (75.152)	lr 0.02026
Train [35][1400/3239]	Time 0.226 (0.468)	Data Time 0.001 (0.020)	Loss 2.9374 (2.9926)	Entropy 0.71324 (0.71753)	Top-1 acc 58.594 (52.095)	Top-5 acc 73.438 (75.158)	lr 0.02026
Train [35][1410/3239]	Time 0.242 (0.468)	Data Time 0.001 (0.020)	Loss 3.1273 (2.9930)	Entropy 0.71293 (0.71750)	Top-1 acc 49.609 (52.085)	Top-5 acc 75.391 (75.149)	lr 0.02026
Train [35][1420/3239]	Time 0.318 (0.468)	Data Time 0.001 (0.020)	Loss 2.9546 (2.9930)	Entropy 0.71279 (0.71746)	Top-1 acc 53.906 (52.088)	Top-5 acc 77.344 (75.152)	lr 0.02025
Train [35][1430/3239]	Time 0.230 (0.467)	Data Time 0.001 (0.020)	Loss 2.9308 (2.9931)	Entropy 0.71290 (0.71743)	Top-1 acc 52.344 (52.089)	Top-5 acc 76.562 (75.150)	lr 0.02025
Train [35][1440/3239]	Time 0.231 (0.467)	Data Time 0.001 (0.020)	Loss 2.9528 (2.9931)	Entropy 0.71326 (0.71740)	Top-1 acc 50.391 (52.094)	Top-5 acc 76.172 (75.156)	lr 0.02025
Train [35][1450/3239]	Time 0.227 (0.466)	Data Time 0.001 (0.019)	Loss 3.1751 (2.9934)	Entropy 0.71327 (0.71737)	Top-1 acc 49.219 (52.090)	Top-5 acc 73.047 (75.145)	lr 0.02025
Train [35][1460/3239]	Time 0.236 (0.466)	Data Time 0.001 (0.019)	Loss 3.0633 (2.9932)	Entropy 0.71307 (0.71734)	Top-1 acc 49.219 (52.090)	Top-5 acc 73.438 (75.152)	lr 0.02025
Train [35][1470/3239]	Time 0.235 (0.466)	Data Time 0.001 (0.019)	Loss 3.0517 (2.9932)	Entropy 0.71253 (0.71731)	Top-1 acc 53.906 (52.098)	Top-5 acc 73.828 (75.150)	lr 0.02025
Train [35][1480/3239]	Time 0.228 (0.465)	Data Time 0.001 (0.019)	Loss 3.0993 (2.9935)	Entropy 0.71210 (0.71728)	Top-1 acc 50.391 (52.087)	Top-5 acc 73.047 (75.140)	lr 0.02025
Train [35][1490/3239]	Time 0.247 (0.465)	Data Time 0.001 (0.019)	Loss 3.0283 (2.9940)	Entropy 0.71215 (0.71725)	Top-1 acc 50.391 (52.074)	Top-5 acc 73.438 (75.128)	lr 0.02025
Train [35][1500/3239]	Time 0.224 (0.464)	Data Time 0.001 (0.019)	Loss 3.0409 (2.9935)	Entropy 0.71255 (0.71721)	Top-1 acc 52.734 (52.090)	Top-5 acc 74.609 (75.139)	lr 0.02025
Train [35][1510/3239]	Time 0.321 (0.464)	Data Time 0.001 (0.019)	Loss 3.0216 (2.9936)	Entropy 0.71244 (0.71718)	Top-1 acc 49.219 (52.087)	Top-5 acc 74.219 (75.138)	lr 0.02025
Train [35][1520/3239]	Time 0.238 (0.463)	Data Time 0.001 (0.019)	Loss 2.8519 (2.9933)	Entropy 0.71230 (0.71715)	Top-1 acc 55.078 (52.098)	Top-5 acc 76.562 (75.144)	lr 0.02025
Train [35][1530/3239]	Time 0.219 (0.463)	Data Time 0.001 (0.018)	Loss 2.9740 (2.9933)	Entropy 0.71234 (0.71712)	Top-1 acc 52.344 (52.096)	Top-5 acc 75.391 (75.144)	lr 0.02025
Train [35][1540/3239]	Time 0.234 (0.463)	Data Time 0.001 (0.018)	Loss 2.8051 (2.9933)	Entropy 0.71229 (0.71709)	Top-1 acc 51.172 (52.091)	Top-5 acc 78.516 (75.145)	lr 0.02025
Train [35][1550/3239]	Time 0.249 (0.462)	Data Time 0.001 (0.018)	Loss 3.0034 (2.9935)	Entropy 0.71190 (0.71706)	Top-1 acc 50.391 (52.087)	Top-5 acc 74.219 (75.148)	lr 0.02024
Train [35][1560/3239]	Time 0.251 (0.462)	Data Time 0.001 (0.018)	Loss 2.8690 (2.9936)	Entropy 0.71197 (0.71702)	Top-1 acc 53.125 (52.086)	Top-5 acc 76.562 (75.151)	lr 0.02024
Train [35][1570/3239]	Time 0.231 (0.461)	Data Time 0.001 (0.018)	Loss 2.7743 (2.9933)	Entropy 0.71181 (0.71699)	Top-1 acc 58.203 (52.099)	Top-5 acc 78.516 (75.158)	lr 0.02024
Train [35][1580/3239]	Time 0.316 (0.461)	Data Time 0.001 (0.018)	Loss 3.1107 (2.9933)	Entropy 0.71157 (0.71696)	Top-1 acc 49.609 (52.096)	Top-5 acc 70.703 (75.156)	lr 0.02024
Train [35][1590/3239]	Time 0.225 (0.461)	Data Time 0.001 (0.018)	Loss 3.1806 (2.9936)	Entropy 0.71145 (0.71692)	Top-1 acc 44.531 (52.091)	Top-5 acc 72.266 (75.151)	lr 0.02024
Train [35][1600/3239]	Time 0.223 (0.460)	Data Time 0.001 (0.018)	Loss 2.9419 (2.9938)	Entropy 0.71201 (0.71689)	Top-1 acc 52.734 (52.093)	Top-5 acc 76.562 (75.147)	lr 0.02024
Train [35][1610/3239]	Time 0.224 (0.460)	Data Time 0.001 (0.018)	Loss 2.7848 (2.9941)	Entropy 0.71208 (0.71686)	Top-1 acc 60.547 (52.096)	Top-5 acc 77.344 (75.144)	lr 0.02024
Train [35][1620/3239]	Time 0.225 (0.459)	Data Time 0.001 (0.018)	Loss 2.8028 (2.9935)	Entropy 0.71229 (0.71683)	Top-1 acc 54.297 (52.111)	Top-5 acc 79.297 (75.150)	lr 0.02024
Train [35][1630/3239]	Time 0.235 (0.459)	Data Time 0.001 (0.017)	Loss 2.9455 (2.9936)	Entropy 0.71235 (0.71680)	Top-1 acc 53.516 (52.111)	Top-5 acc 75.391 (75.148)	lr 0.02024
Train [35][1640/3239]	Time 0.226 (0.459)	Data Time 0.001 (0.017)	Loss 2.8408 (2.9938)	Entropy 0.71195 (0.71678)	Top-1 acc 57.031 (52.106)	Top-5 acc 78.125 (75.147)	lr 0.02024
Train [35][1650/3239]	Time 0.232 (0.458)	Data Time 0.001 (0.017)	Loss 2.9976 (2.9941)	Entropy 0.71204 (0.71675)	Top-1 acc 53.125 (52.099)	Top-5 acc 74.609 (75.144)	lr 0.02024
Train [35][1660/3239]	Time 0.223 (0.458)	Data Time 0.001 (0.017)	Loss 3.1938 (2.9949)	Entropy 0.71215 (0.71672)	Top-1 acc 47.266 (52.082)	Top-5 acc 74.219 (75.126)	lr 0.02024
Train [35][1670/3239]	Time 0.237 (0.458)	Data Time 0.001 (0.017)	Loss 2.6597 (2.9951)	Entropy 0.71203 (0.71669)	Top-1 acc 56.641 (52.072)	Top-5 acc 82.812 (75.119)	lr 0.02023
Train [35][1680/3239]	Time 0.235 (0.457)	Data Time 0.001 (0.017)	Loss 2.9988 (2.9952)	Entropy 0.71180 (0.71666)	Top-1 acc 50.000 (52.068)	Top-5 acc 71.875 (75.114)	lr 0.02023
Train [35][1690/3239]	Time 0.246 (0.457)	Data Time 0.001 (0.017)	Loss 2.9394 (2.9949)	Entropy 0.71188 (0.71663)	Top-1 acc 52.734 (52.079)	Top-5 acc 76.562 (75.120)	lr 0.02023
Train [35][1700/3239]	Time 0.233 (0.457)	Data Time 0.001 (0.017)	Loss 2.8951 (2.9949)	Entropy 0.71236 (0.71661)	Top-1 acc 56.641 (52.076)	Top-5 acc 77.344 (75.119)	lr 0.02023
Train [35][1710/3239]	Time 0.226 (0.456)	Data Time 0.001 (0.017)	Loss 3.0786 (2.9950)	Entropy 0.71220 (0.71658)	Top-1 acc 48.438 (52.071)	Top-5 acc 73.047 (75.120)	lr 0.02023
Train [35][1720/3239]	Time 0.223 (0.456)	Data Time 0.001 (0.017)	Loss 2.8746 (2.9948)	Entropy 0.71213 (0.71656)	Top-1 acc 55.469 (52.072)	Top-5 acc 76.953 (75.123)	lr 0.02023
Train [35][1730/3239]	Time 0.225 (0.456)	Data Time 0.001 (0.017)	Loss 2.9038 (2.9946)	Entropy 0.71212 (0.71653)	Top-1 acc 52.344 (52.079)	Top-5 acc 75.000 (75.127)	lr 0.02023
Train [35][1740/3239]	Time 0.324 (0.456)	Data Time 0.001 (0.016)	Loss 3.0740 (2.9946)	Entropy 0.71184 (0.71650)	Top-1 acc 51.172 (52.083)	Top-5 acc 75.000 (75.131)	lr 0.02023
Train [35][1750/3239]	Time 0.229 (0.455)	Data Time 0.001 (0.016)	Loss 2.9988 (2.9944)	Entropy 0.71186 (0.71648)	Top-1 acc 51.562 (52.086)	Top-5 acc 74.609 (75.135)	lr 0.02023
Train [35][1760/3239]	Time 0.230 (0.455)	Data Time 0.001 (0.016)	Loss 2.9891 (2.9947)	Entropy 0.71154 (0.71645)	Top-1 acc 50.391 (52.078)	Top-5 acc 74.609 (75.132)	lr 0.02023
Train [35][1770/3239]	Time 0.231 (0.455)	Data Time 0.001 (0.016)	Loss 2.8739 (2.9947)	Entropy 0.71147 (0.71642)	Top-1 acc 51.562 (52.075)	Top-5 acc 76.562 (75.130)	lr 0.02023
Train [35][1780/3239]	Time 0.234 (0.454)	Data Time 0.001 (0.016)	Loss 3.0208 (2.9948)	Entropy 0.71115 (0.71639)	Top-1 acc 51.953 (52.079)	Top-5 acc 74.609 (75.127)	lr 0.02023
Train [35][1790/3239]	Time 0.224 (0.454)	Data Time 0.001 (0.016)	Loss 2.9610 (2.9949)	Entropy 0.71094 (0.71636)	Top-1 acc 54.297 (52.073)	Top-5 acc 73.828 (75.122)	lr 0.02023
Train [35][1800/3239]	Time 0.237 (0.454)	Data Time 0.001 (0.016)	Loss 2.8396 (2.9947)	Entropy 0.71097 (0.71633)	Top-1 acc 58.594 (52.079)	Top-5 acc 76.953 (75.129)	lr 0.02022
Train [35][1810/3239]	Time 0.327 (0.453)	Data Time 0.001 (0.016)	Loss 2.8646 (2.9944)	Entropy 0.71125 (0.71631)	Top-1 acc 53.906 (52.077)	Top-5 acc 76.172 (75.131)	lr 0.02022
Train [35][1820/3239]	Time 0.233 (0.469)	Data Time 0.002 (0.016)	Loss 2.8844 (2.9943)	Entropy 0.71139 (0.71628)	Top-1 acc 52.734 (52.085)	Top-5 acc 76.953 (75.130)	lr 0.02022
Train [35][1830/3239]	Time 0.361 (0.469)	Data Time 0.002 (0.016)	Loss 2.9991 (2.9942)	Entropy 0.71166 (0.71625)	Top-1 acc 56.250 (52.085)	Top-5 acc 75.781 (75.133)	lr 0.02022
Train [35][1840/3239]	Time 0.238 (0.468)	Data Time 0.001 (0.016)	Loss 3.1465 (2.9945)	Entropy 0.71147 (0.71623)	Top-1 acc 50.000 (52.076)	Top-5 acc 72.656 (75.126)	lr 0.02022
Train [35][1850/3239]	Time 0.230 (0.468)	Data Time 0.001 (0.016)	Loss 2.8472 (2.9945)	Entropy 0.71145 (0.71620)	Top-1 acc 52.734 (52.068)	Top-5 acc 80.078 (75.129)	lr 0.02022
Train [35][1860/3239]	Time 0.238 (0.468)	Data Time 0.001 (0.015)	Loss 2.8635 (2.9944)	Entropy 0.71125 (0.71618)	Top-1 acc 53.906 (52.070)	Top-5 acc 76.562 (75.129)	lr 0.02022
Train [35][1870/3239]	Time 0.228 (0.467)	Data Time 0.001 (0.015)	Loss 3.1494 (2.9945)	Entropy 0.71082 (0.71615)	Top-1 acc 46.094 (52.066)	Top-5 acc 72.266 (75.125)	lr 0.02022
Train [35][1880/3239]	Time 0.238 (0.467)	Data Time 0.001 (0.015)	Loss 2.8223 (2.9942)	Entropy 0.71040 (0.71612)	Top-1 acc 58.203 (52.070)	Top-5 acc 76.172 (75.131)	lr 0.02022
Train [35][1890/3239]	Time 0.239 (0.467)	Data Time 0.001 (0.015)	Loss 2.8690 (2.9941)	Entropy 0.71048 (0.71609)	Top-1 acc 57.031 (52.075)	Top-5 acc 77.734 (75.132)	lr 0.02022
Train [35][1900/3239]	Time 0.308 (0.467)	Data Time 0.001 (0.015)	Loss 3.1639 (2.9942)	Entropy 0.70985 (0.71606)	Top-1 acc 46.094 (52.066)	Top-5 acc 71.875 (75.126)	lr 0.02022
Train [35][1910/3239]	Time 0.231 (0.466)	Data Time 0.001 (0.015)	Loss 3.0620 (2.9941)	Entropy 0.70974 (0.71603)	Top-1 acc 53.516 (52.071)	Top-5 acc 72.266 (75.129)	lr 0.02022
Train [35][1920/3239]	Time 0.243 (0.466)	Data Time 0.001 (0.015)	Loss 3.1229 (2.9944)	Entropy 0.70989 (0.71599)	Top-1 acc 48.438 (52.070)	Top-5 acc 71.875 (75.120)	lr 0.02021
Train [35][1930/3239]	Time 0.226 (0.466)	Data Time 0.001 (0.015)	Loss 3.0543 (2.9944)	Entropy 0.71001 (0.71596)	Top-1 acc 47.266 (52.073)	Top-5 acc 74.219 (75.118)	lr 0.02021
Train [35][1940/3239]	Time 0.230 (0.465)	Data Time 0.001 (0.015)	Loss 3.2038 (2.9944)	Entropy 0.70992 (0.71593)	Top-1 acc 46.875 (52.071)	Top-5 acc 71.484 (75.119)	lr 0.02021
Train [35][1950/3239]	Time 0.235 (0.465)	Data Time 0.001 (0.015)	Loss 3.0239 (2.9943)	Entropy 0.70936 (0.71590)	Top-1 acc 53.125 (52.076)	Top-5 acc 72.656 (75.118)	lr 0.02021
Train [35][1960/3239]	Time 0.268 (0.465)	Data Time 0.001 (0.015)	Loss 2.9437 (2.9943)	Entropy 0.70940 (0.71587)	Top-1 acc 55.078 (52.073)	Top-5 acc 79.297 (75.116)	lr 0.02021
Train [35][1970/3239]	Time 0.229 (0.465)	Data Time 0.001 (0.015)	Loss 2.9868 (2.9940)	Entropy 0.70932 (0.71583)	Top-1 acc 50.391 (52.076)	Top-5 acc 75.391 (75.122)	lr 0.02021
Train [35][1980/3239]	Time 0.236 (0.465)	Data Time 0.001 (0.015)	Loss 2.7866 (2.9937)	Entropy 0.70925 (0.71580)	Top-1 acc 55.078 (52.085)	Top-5 acc 76.953 (75.127)	lr 0.02021
Train [35][1990/3239]	Time 0.264 (0.464)	Data Time 0.001 (0.015)	Loss 3.0121 (2.9936)	Entropy 0.70945 (0.71577)	Top-1 acc 53.125 (52.087)	Top-5 acc 74.219 (75.127)	lr 0.02021
Train [35][2000/3239]	Time 0.223 (0.464)	Data Time 0.001 (0.014)	Loss 3.1628 (2.9935)	Entropy 0.70930 (0.71574)	Top-1 acc 43.750 (52.086)	Top-5 acc 71.484 (75.126)	lr 0.02021
Train [35][2010/3239]	Time 0.231 (0.464)	Data Time 0.001 (0.014)	Loss 2.8660 (2.9935)	Entropy 0.70887 (0.71570)	Top-1 acc 54.688 (52.084)	Top-5 acc 76.562 (75.128)	lr 0.02021
Train [35][2020/3239]	Time 0.227 (0.464)	Data Time 0.001 (0.014)	Loss 2.7648 (2.9932)	Entropy 0.70861 (0.71567)	Top-1 acc 56.250 (52.089)	Top-5 acc 80.859 (75.133)	lr 0.02021
Train [35][2030/3239]	Time 0.252 (0.463)	Data Time 0.001 (0.014)	Loss 3.3346 (2.9932)	Entropy 0.70893 (0.71563)	Top-1 acc 46.484 (52.093)	Top-5 acc 67.969 (75.133)	lr 0.02021
Train [35][2040/3239]	Time 0.235 (0.463)	Data Time 0.001 (0.014)	Loss 2.9717 (2.9928)	Entropy 0.70893 (0.71560)	Top-1 acc 53.516 (52.101)	Top-5 acc 76.953 (75.141)	lr 0.02021
Train [35][2050/3239]	Time 0.227 (0.463)	Data Time 0.001 (0.014)	Loss 2.9929 (2.9930)	Entropy 0.70918 (0.71557)	Top-1 acc 53.125 (52.099)	Top-5 acc 73.828 (75.136)	lr 0.02020
Train [35][2060/3239]	Time 0.369 (0.463)	Data Time 0.001 (0.014)	Loss 3.0565 (2.9929)	Entropy 0.70947 (0.71554)	Top-1 acc 52.344 (52.098)	Top-5 acc 71.484 (75.136)	lr 0.02020
Train [35][2070/3239]	Time 0.219 (0.462)	Data Time 0.001 (0.014)	Loss 3.4805 (2.9931)	Entropy 0.70951 (0.71551)	Top-1 acc 41.016 (52.091)	Top-5 acc 67.969 (75.129)	lr 0.02020
Train [35][2080/3239]	Time 0.239 (0.462)	Data Time 0.001 (0.014)	Loss 3.0097 (2.9933)	Entropy 0.70911 (0.71548)	Top-1 acc 49.609 (52.088)	Top-5 acc 74.219 (75.124)	lr 0.02020
Train [35][2090/3239]	Time 0.255 (0.462)	Data Time 0.001 (0.014)	Loss 2.8969 (2.9934)	Entropy 0.70927 (0.71545)	Top-1 acc 52.344 (52.082)	Top-5 acc 75.391 (75.122)	lr 0.02020
Train [35][2100/3239]	Time 0.225 (0.462)	Data Time 0.001 (0.014)	Loss 3.3733 (2.9941)	Entropy 0.70900 (0.71542)	Top-1 acc 44.141 (52.066)	Top-5 acc 68.359 (75.106)	lr 0.02020
Train [35][2110/3239]	Time 0.220 (0.462)	Data Time 0.001 (0.014)	Loss 2.9388 (2.9937)	Entropy 0.70932 (0.71539)	Top-1 acc 53.906 (52.073)	Top-5 acc 76.172 (75.116)	lr 0.02020
Train [35][2120/3239]	Time 0.226 (0.461)	Data Time 0.001 (0.014)	Loss 3.0169 (2.9935)	Entropy 0.70952 (0.71536)	Top-1 acc 51.562 (52.073)	Top-5 acc 72.656 (75.119)	lr 0.02020
Train [35][2130/3239]	Time 0.324 (0.461)	Data Time 0.001 (0.014)	Loss 3.0266 (2.9934)	Entropy 0.70932 (0.71533)	Top-1 acc 53.516 (52.079)	Top-5 acc 74.219 (75.121)	lr 0.02020
Train [35][2140/3239]	Time 0.232 (0.461)	Data Time 0.001 (0.014)	Loss 3.0473 (2.9932)	Entropy 0.70936 (0.71531)	Top-1 acc 53.125 (52.092)	Top-5 acc 74.609 (75.124)	lr 0.02020
Train [35][2150/3239]	Time 0.234 (0.461)	Data Time 0.001 (0.014)	Loss 3.0196 (2.9931)	Entropy 0.70978 (0.71528)	Top-1 acc 53.516 (52.092)	Top-5 acc 75.391 (75.129)	lr 0.02020
Train [35][2160/3239]	Time 0.229 (0.460)	Data Time 0.001 (0.014)	Loss 3.0589 (2.9931)	Entropy 0.70979 (0.71525)	Top-1 acc 52.734 (52.095)	Top-5 acc 74.219 (75.130)	lr 0.02020
Train [35][2170/3239]	Time 0.231 (0.460)	Data Time 0.001 (0.013)	Loss 2.9560 (2.9932)	Entropy 0.70947 (0.71523)	Top-1 acc 52.734 (52.090)	Top-5 acc 72.266 (75.127)	lr 0.02019
Train [35][2180/3239]	Time 0.225 (0.460)	Data Time 0.001 (0.013)	Loss 2.9301 (2.9930)	Entropy 0.70951 (0.71520)	Top-1 acc 53.906 (52.094)	Top-5 acc 78.125 (75.130)	lr 0.02019
Train [35][2190/3239]	Time 0.230 (0.460)	Data Time 0.001 (0.013)	Loss 2.8554 (2.9932)	Entropy 0.70962 (0.71518)	Top-1 acc 53.125 (52.086)	Top-5 acc 77.734 (75.128)	lr 0.02019
Train [35][2200/3239]	Time 0.238 (0.459)	Data Time 0.001 (0.013)	Loss 2.9268 (2.9929)	Entropy 0.70931 (0.71515)	Top-1 acc 54.297 (52.091)	Top-5 acc 76.953 (75.134)	lr 0.02019
Train [35][2210/3239]	Time 0.227 (0.459)	Data Time 0.001 (0.013)	Loss 2.9847 (2.9931)	Entropy 0.70939 (0.71512)	Top-1 acc 54.297 (52.086)	Top-5 acc 72.656 (75.129)	lr 0.02019
Train [35][2220/3239]	Time 0.327 (0.459)	Data Time 0.001 (0.013)	Loss 2.9028 (2.9930)	Entropy 0.70890 (0.71510)	Top-1 acc 50.391 (52.088)	Top-5 acc 77.344 (75.130)	lr 0.02019
Train [35][2230/3239]	Time 0.237 (0.459)	Data Time 0.001 (0.013)	Loss 2.8837 (2.9928)	Entropy 0.70861 (0.71507)	Top-1 acc 57.031 (52.093)	Top-5 acc 76.562 (75.133)	lr 0.02019
Train [35][2240/3239]	Time 0.237 (0.458)	Data Time 0.001 (0.013)	Loss 2.9864 (2.9928)	Entropy 0.70776 (0.71504)	Top-1 acc 54.297 (52.097)	Top-5 acc 75.781 (75.134)	lr 0.02019
Train [35][2250/3239]	Time 0.228 (0.458)	Data Time 0.001 (0.013)	Loss 2.8637 (2.9926)	Entropy 0.70798 (0.71501)	Top-1 acc 53.125 (52.104)	Top-5 acc 77.344 (75.139)	lr 0.02019
Train [35][2260/3239]	Time 0.235 (0.458)	Data Time 0.001 (0.013)	Loss 3.1150 (2.9928)	Entropy 0.70826 (0.71498)	Top-1 acc 48.828 (52.103)	Top-5 acc 69.922 (75.136)	lr 0.02019
Train [35][2270/3239]	Time 0.228 (0.458)	Data Time 0.001 (0.013)	Loss 2.9279 (2.9926)	Entropy 0.70853 (0.71495)	Top-1 acc 53.125 (52.108)	Top-5 acc 78.516 (75.138)	lr 0.02019
Train [35][2280/3239]	Time 0.237 (0.457)	Data Time 0.001 (0.013)	Loss 2.9074 (2.9925)	Entropy 0.70857 (0.71492)	Top-1 acc 54.688 (52.112)	Top-5 acc 76.172 (75.138)	lr 0.02019
Train [35][2290/3239]	Time 0.319 (0.457)	Data Time 0.001 (0.013)	Loss 3.2870 (2.9928)	Entropy 0.70852 (0.71489)	Top-1 acc 47.656 (52.105)	Top-5 acc 73.047 (75.137)	lr 0.02019
Train [35][2300/3239]	Time 0.224 (0.457)	Data Time 0.001 (0.013)	Loss 2.8377 (2.9925)	Entropy 0.70849 (0.71486)	Top-1 acc 54.688 (52.111)	Top-5 acc 77.734 (75.144)	lr 0.02018
Train [35][2310/3239]	Time 0.234 (0.457)	Data Time 0.001 (0.013)	Loss 3.2820 (2.9925)	Entropy 0.70855 (0.71484)	Top-1 acc 46.875 (52.114)	Top-5 acc 69.531 (75.145)	lr 0.02018
Train [35][2320/3239]	Time 0.235 (0.457)	Data Time 0.001 (0.013)	Loss 2.9217 (2.9924)	Entropy 0.70862 (0.71481)	Top-1 acc 53.906 (52.117)	Top-5 acc 74.609 (75.148)	lr 0.02018
Train [35][2330/3239]	Time 0.221 (0.456)	Data Time 0.001 (0.013)	Loss 2.9053 (2.9923)	Entropy 0.70887 (0.71478)	Top-1 acc 53.516 (52.119)	Top-5 acc 74.219 (75.145)	lr 0.02018
Train [35][2340/3239]	Time 0.225 (0.456)	Data Time 0.001 (0.013)	Loss 2.9344 (2.9921)	Entropy 0.70876 (0.71476)	Top-1 acc 52.734 (52.118)	Top-5 acc 75.000 (75.149)	lr 0.02018
Train [35][2350/3239]	Time 0.233 (0.456)	Data Time 0.001 (0.013)	Loss 2.7877 (2.9918)	Entropy 0.70897 (0.71473)	Top-1 acc 59.375 (52.124)	Top-5 acc 79.688 (75.158)	lr 0.02018
Train [35][2360/3239]	Time 0.226 (0.456)	Data Time 0.001 (0.013)	Loss 3.1284 (2.9919)	Entropy 0.70853 (0.71471)	Top-1 acc 48.047 (52.119)	Top-5 acc 73.438 (75.160)	lr 0.02018
Train [35][2370/3239]	Time 0.225 (0.455)	Data Time 0.001 (0.012)	Loss 2.8487 (2.9920)	Entropy 0.70843 (0.71468)	Top-1 acc 54.297 (52.115)	Top-5 acc 80.469 (75.158)	lr 0.02018
Train [35][2380/3239]	Time 0.248 (0.455)	Data Time 0.001 (0.012)	Loss 2.9458 (2.9919)	Entropy 0.70882 (0.71466)	Top-1 acc 53.516 (52.116)	Top-5 acc 76.172 (75.161)	lr 0.02018
Train [35][2390/3239]	Time 0.219 (0.455)	Data Time 0.001 (0.012)	Loss 3.1227 (2.9922)	Entropy 0.70934 (0.71463)	Top-1 acc 50.391 (52.110)	Top-5 acc 73.438 (75.153)	lr 0.02018
Train [35][2400/3239]	Time 0.240 (0.455)	Data Time 0.001 (0.012)	Loss 3.1074 (2.9925)	Entropy 0.70922 (0.71461)	Top-1 acc 51.172 (52.101)	Top-5 acc 74.219 (75.146)	lr 0.02018
Train [35][2410/3239]	Time 0.238 (0.455)	Data Time 0.001 (0.012)	Loss 3.2405 (2.9926)	Entropy 0.70899 (0.71459)	Top-1 acc 48.047 (52.098)	Top-5 acc 71.094 (75.142)	lr 0.02018
Train [35][2420/3239]	Time 0.232 (0.454)	Data Time 0.001 (0.012)	Loss 2.9096 (2.9926)	Entropy 0.70902 (0.71457)	Top-1 acc 51.562 (52.095)	Top-5 acc 78.125 (75.145)	lr 0.02018
Train [35][2430/3239]	Time 0.247 (0.454)	Data Time 0.001 (0.012)	Loss 2.8711 (2.9925)	Entropy 0.70892 (0.71454)	Top-1 acc 52.734 (52.092)	Top-5 acc 78.516 (75.150)	lr 0.02017
Train [35][2440/3239]	Time 0.228 (0.454)	Data Time 0.001 (0.012)	Loss 3.1805 (2.9925)	Entropy 0.70830 (0.71452)	Top-1 acc 49.219 (52.091)	Top-5 acc 72.266 (75.151)	lr 0.02017
Train [35][2450/3239]	Time 0.338 (0.454)	Data Time 0.001 (0.012)	Loss 3.2761 (2.9927)	Entropy 0.70808 (0.71449)	Top-1 acc 41.797 (52.086)	Top-5 acc 72.656 (75.150)	lr 0.02017
Train [35][2460/3239]	Time 0.232 (0.454)	Data Time 0.001 (0.012)	Loss 3.1289 (2.9928)	Entropy 0.70806 (0.71447)	Top-1 acc 50.781 (52.086)	Top-5 acc 70.312 (75.146)	lr 0.02017
Train [35][2470/3239]	Time 0.327 (0.465)	Data Time 0.004 (0.012)	Loss 3.0560 (2.9929)	Entropy 0.70805 (0.71444)	Top-1 acc 48.047 (52.083)	Top-5 acc 74.219 (75.147)	lr 0.02017
Train [35][2480/3239]	Time 0.241 (0.465)	Data Time 0.002 (0.012)	Loss 2.9148 (2.9929)	Entropy 0.70804 (0.71442)	Top-1 acc 55.078 (52.082)	Top-5 acc 75.391 (75.146)	lr 0.02017
Train [35][2490/3239]	Time 0.231 (0.465)	Data Time 0.002 (0.012)	Loss 3.0074 (2.9929)	Entropy 0.70804 (0.71439)	Top-1 acc 51.172 (52.079)	Top-5 acc 75.391 (75.150)	lr 0.02017
Train [35][2500/3239]	Time 0.217 (0.464)	Data Time 0.001 (0.012)	Loss 2.9580 (2.9929)	Entropy 0.70775 (0.71436)	Top-1 acc 53.125 (52.076)	Top-5 acc 75.781 (75.146)	lr 0.02017
Train [35][2510/3239]	Time 0.226 (0.464)	Data Time 0.001 (0.012)	Loss 2.7567 (2.9930)	Entropy 0.70786 (0.71434)	Top-1 acc 54.688 (52.075)	Top-5 acc 80.859 (75.146)	lr 0.02017
Train [35][2520/3239]	Time 0.241 (0.464)	Data Time 0.001 (0.012)	Loss 3.0665 (2.9930)	Entropy 0.70778 (0.71431)	Top-1 acc 51.562 (52.070)	Top-5 acc 75.000 (75.147)	lr 0.02017
Train [35][2530/3239]	Time 0.235 (0.464)	Data Time 0.001 (0.012)	Loss 3.0036 (2.9930)	Entropy 0.70767 (0.71429)	Top-1 acc 55.469 (52.074)	Top-5 acc 75.781 (75.145)	lr 0.02017
Train [35][2540/3239]	Time 0.268 (0.464)	Data Time 0.002 (0.012)	Loss 3.0981 (2.9930)	Entropy 0.70730 (0.71426)	Top-1 acc 51.172 (52.074)	Top-5 acc 71.875 (75.143)	lr 0.02017
Train [35][2550/3239]	Time 0.237 (0.464)	Data Time 0.001 (0.012)	Loss 3.0921 (2.9929)	Entropy 0.70699 (0.71423)	Top-1 acc 48.438 (52.076)	Top-5 acc 75.000 (75.142)	lr 0.02016
Train [35][2560/3239]	Time 0.236 (0.463)	Data Time 0.001 (0.012)	Loss 2.8724 (2.9927)	Entropy 0.70672 (0.71420)	Top-1 acc 55.469 (52.084)	Top-5 acc 78.125 (75.145)	lr 0.02016
Train [35][2570/3239]	Time 0.253 (0.463)	Data Time 0.002 (0.012)	Loss 2.7682 (2.9929)	Entropy 0.70717 (0.71417)	Top-1 acc 56.250 (52.084)	Top-5 acc 80.469 (75.141)	lr 0.02016
Train [35][2580/3239]	Time 0.255 (0.463)	Data Time 0.001 (0.012)	Loss 3.1497 (2.9929)	Entropy 0.70726 (0.71415)	Top-1 acc 48.047 (52.083)	Top-5 acc 72.656 (75.143)	lr 0.02016
Train [35][2590/3239]	Time 0.234 (0.463)	Data Time 0.001 (0.012)	Loss 2.9272 (2.9928)	Entropy 0.70726 (0.71412)	Top-1 acc 52.344 (52.084)	Top-5 acc 75.781 (75.147)	lr 0.02016
Train [35][2600/3239]	Time 0.238 (0.463)	Data Time 0.001 (0.012)	Loss 2.9832 (2.9929)	Entropy 0.70713 (0.71409)	Top-1 acc 52.734 (52.079)	Top-5 acc 78.906 (75.145)	lr 0.02016
Train [35][2610/3239]	Time 0.341 (0.463)	Data Time 0.001 (0.011)	Loss 2.9848 (2.9929)	Entropy 0.70741 (0.71407)	Top-1 acc 50.391 (52.078)	Top-5 acc 78.125 (75.148)	lr 0.02016
Train [35][2620/3239]	Time 0.241 (0.462)	Data Time 0.001 (0.011)	Loss 3.0217 (2.9927)	Entropy 0.70685 (0.71404)	Top-1 acc 51.562 (52.083)	Top-5 acc 77.344 (75.149)	lr 0.02016
Train [35][2630/3239]	Time 0.251 (0.462)	Data Time 0.001 (0.011)	Loss 3.0306 (2.9928)	Entropy 0.70647 (0.71401)	Top-1 acc 50.391 (52.083)	Top-5 acc 77.344 (75.152)	lr 0.02016
Train [35][2640/3239]	Time 0.232 (0.462)	Data Time 0.001 (0.011)	Loss 2.7505 (2.9927)	Entropy 0.70625 (0.71398)	Top-1 acc 60.156 (52.084)	Top-5 acc 78.906 (75.151)	lr 0.02016
Train [35][2650/3239]	Time 0.229 (0.462)	Data Time 0.001 (0.011)	Loss 3.0393 (2.9926)	Entropy 0.70608 (0.71395)	Top-1 acc 54.297 (52.088)	Top-5 acc 73.438 (75.153)	lr 0.02016
Train [35][2660/3239]	Time 0.248 (0.462)	Data Time 0.001 (0.011)	Loss 3.1590 (2.9927)	Entropy 0.70648 (0.71393)	Top-1 acc 50.781 (52.089)	Top-5 acc 72.656 (75.150)	lr 0.02016
Train [35][2670/3239]	Time 0.234 (0.462)	Data Time 0.001 (0.011)	Loss 3.0851 (2.9926)	Entropy 0.70594 (0.71390)	Top-1 acc 51.953 (52.092)	Top-5 acc 74.609 (75.152)	lr 0.02016
Train [35][2680/3239]	Time 0.355 (0.462)	Data Time 0.001 (0.011)	Loss 3.1740 (2.9929)	Entropy 0.70541 (0.71387)	Top-1 acc 47.266 (52.085)	Top-5 acc 73.828 (75.147)	lr 0.02015
Train [35][2690/3239]	Time 0.238 (0.461)	Data Time 0.001 (0.011)	Loss 3.1805 (2.9931)	Entropy 0.70537 (0.71384)	Top-1 acc 48.047 (52.077)	Top-5 acc 72.266 (75.144)	lr 0.02015
Train [35][2700/3239]	Time 0.234 (0.461)	Data Time 0.001 (0.011)	Loss 3.0081 (2.9931)	Entropy 0.70514 (0.71380)	Top-1 acc 50.391 (52.079)	Top-5 acc 72.656 (75.143)	lr 0.02015
Train [35][2710/3239]	Time 0.243 (0.461)	Data Time 0.001 (0.011)	Loss 3.0777 (2.9933)	Entropy 0.70502 (0.71377)	Top-1 acc 52.734 (52.074)	Top-5 acc 73.047 (75.141)	lr 0.02015
Train [35][2720/3239]	Time 0.251 (0.461)	Data Time 0.001 (0.011)	Loss 3.0004 (2.9930)	Entropy 0.70510 (0.71374)	Top-1 acc 53.906 (52.079)	Top-5 acc 71.875 (75.147)	lr 0.02015
Train [35][2730/3239]	Time 0.239 (0.461)	Data Time 0.001 (0.011)	Loss 2.9242 (2.9930)	Entropy 0.70531 (0.71371)	Top-1 acc 53.906 (52.079)	Top-5 acc 75.391 (75.149)	lr 0.02015
Train [35][2740/3239]	Time 0.235 (0.460)	Data Time 0.001 (0.011)	Loss 2.9397 (2.9932)	Entropy 0.70531 (0.71368)	Top-1 acc 53.906 (52.075)	Top-5 acc 78.125 (75.146)	lr 0.02015
Train [35][2750/3239]	Time 0.248 (0.460)	Data Time 0.001 (0.011)	Loss 2.9025 (2.9931)	Entropy 0.70546 (0.71365)	Top-1 acc 50.781 (52.078)	Top-5 acc 73.438 (75.145)	lr 0.02015
Train [35][2760/3239]	Time 0.237 (0.460)	Data Time 0.001 (0.011)	Loss 2.9037 (2.9931)	Entropy 0.70492 (0.71362)	Top-1 acc 55.469 (52.077)	Top-5 acc 76.562 (75.145)	lr 0.02015
Train [35][2770/3239]	Time 0.335 (0.460)	Data Time 0.001 (0.011)	Loss 3.1252 (2.9931)	Entropy 0.70528 (0.71359)	Top-1 acc 50.000 (52.076)	Top-5 acc 71.094 (75.146)	lr 0.02015
Train [35][2780/3239]	Time 0.237 (0.460)	Data Time 0.001 (0.011)	Loss 2.9822 (2.9933)	Entropy 0.70542 (0.71356)	Top-1 acc 51.953 (52.067)	Top-5 acc 73.438 (75.142)	lr 0.02015
Train [35][2790/3239]	Time 0.247 (0.460)	Data Time 0.001 (0.011)	Loss 2.8598 (2.9932)	Entropy 0.70543 (0.71353)	Top-1 acc 53.906 (52.071)	Top-5 acc 76.562 (75.142)	lr 0.02015
Train [35][2800/3239]	Time 0.233 (0.460)	Data Time 0.001 (0.011)	Loss 2.9805 (2.9930)	Entropy 0.70578 (0.71350)	Top-1 acc 52.734 (52.074)	Top-5 acc 75.781 (75.144)	lr 0.02014
Train [35][2810/3239]	Time 0.227 (0.459)	Data Time 0.001 (0.011)	Loss 3.2631 (2.9929)	Entropy 0.70555 (0.71347)	Top-1 acc 48.047 (52.076)	Top-5 acc 69.141 (75.145)	lr 0.02014
Train [35][2820/3239]	Time 0.238 (0.459)	Data Time 0.001 (0.011)	Loss 2.8533 (2.9928)	Entropy 0.70529 (0.71344)	Top-1 acc 53.125 (52.076)	Top-5 acc 78.516 (75.147)	lr 0.02014
Train [35][2830/3239]	Time 0.230 (0.459)	Data Time 0.001 (0.011)	Loss 2.8413 (2.9928)	Entropy 0.70544 (0.71341)	Top-1 acc 56.641 (52.075)	Top-5 acc 77.734 (75.144)	lr 0.02014
Train [35][2840/3239]	Time 0.354 (0.459)	Data Time 0.001 (0.011)	Loss 3.0168 (2.9930)	Entropy 0.70555 (0.71338)	Top-1 acc 53.125 (52.071)	Top-5 acc 75.000 (75.143)	lr 0.02014
Train [35][2850/3239]	Time 0.228 (0.459)	Data Time 0.001 (0.011)	Loss 2.8312 (2.9928)	Entropy 0.70554 (0.71336)	Top-1 acc 50.781 (52.076)	Top-5 acc 79.297 (75.147)	lr 0.02014
Train [35][2860/3239]	Time 0.230 (0.459)	Data Time 0.001 (0.011)	Loss 3.1007 (2.9928)	Entropy 0.70560 (0.71333)	Top-1 acc 50.000 (52.076)	Top-5 acc 71.875 (75.147)	lr 0.02014
Train [35][2870/3239]	Time 0.242 (0.458)	Data Time 0.001 (0.011)	Loss 2.9008 (2.9929)	Entropy 0.70580 (0.71330)	Top-1 acc 55.078 (52.072)	Top-5 acc 76.562 (75.143)	lr 0.02014
Train [35][2880/3239]	Time 0.238 (0.458)	Data Time 0.001 (0.011)	Loss 2.8460 (2.9928)	Entropy 0.70582 (0.71328)	Top-1 acc 57.422 (52.077)	Top-5 acc 76.953 (75.143)	lr 0.02014
Train [35][2890/3239]	Time 0.233 (0.458)	Data Time 0.001 (0.011)	Loss 2.8148 (2.9927)	Entropy 0.70575 (0.71325)	Top-1 acc 53.125 (52.078)	Top-5 acc 80.469 (75.145)	lr 0.02014
Train [35][2900/3239]	Time 0.235 (0.458)	Data Time 0.001 (0.010)	Loss 3.0294 (2.9926)	Entropy 0.70597 (0.71322)	Top-1 acc 44.922 (52.077)	Top-5 acc 73.438 (75.146)	lr 0.02014
Train [35][2910/3239]	Time 0.231 (0.458)	Data Time 0.001 (0.010)	Loss 3.2014 (2.9926)	Entropy 0.70561 (0.71320)	Top-1 acc 47.266 (52.077)	Top-5 acc 72.266 (75.145)	lr 0.02014
Train [35][2920/3239]	Time 0.237 (0.458)	Data Time 0.001 (0.010)	Loss 3.1673 (2.9926)	Entropy 0.70547 (0.71317)	Top-1 acc 46.875 (52.080)	Top-5 acc 73.047 (75.144)	lr 0.02014
Train [35][2930/3239]	Time 0.329 (0.457)	Data Time 0.001 (0.010)	Loss 3.1227 (2.9928)	Entropy 0.70500 (0.71315)	Top-1 acc 51.562 (52.077)	Top-5 acc 71.875 (75.144)	lr 0.02013
Train [35][2940/3239]	Time 0.235 (0.457)	Data Time 0.001 (0.010)	Loss 3.0137 (2.9931)	Entropy 0.70495 (0.71312)	Top-1 acc 52.734 (52.071)	Top-5 acc 75.781 (75.135)	lr 0.02013
Train [35][2950/3239]	Time 0.250 (0.457)	Data Time 0.001 (0.010)	Loss 2.9834 (2.9931)	Entropy 0.70494 (0.71309)	Top-1 acc 53.125 (52.071)	Top-5 acc 75.391 (75.137)	lr 0.02013
Train [35][2960/3239]	Time 0.232 (0.457)	Data Time 0.001 (0.010)	Loss 3.0409 (2.9931)	Entropy 0.70514 (0.71306)	Top-1 acc 53.516 (52.074)	Top-5 acc 74.609 (75.132)	lr 0.02013
Train [35][2970/3239]	Time 0.228 (0.457)	Data Time 0.001 (0.010)	Loss 3.1311 (2.9932)	Entropy 0.70512 (0.71304)	Top-1 acc 48.828 (52.073)	Top-5 acc 73.047 (75.129)	lr 0.02013
Train [35][2980/3239]	Time 0.241 (0.456)	Data Time 0.001 (0.010)	Loss 3.1374 (2.9932)	Entropy 0.70513 (0.71301)	Top-1 acc 51.172 (52.070)	Top-5 acc 72.266 (75.129)	lr 0.02013
Train [35][2990/3239]	Time 0.236 (0.456)	Data Time 0.001 (0.010)	Loss 2.8590 (2.9933)	Entropy 0.70451 (0.71298)	Top-1 acc 52.344 (52.067)	Top-5 acc 77.734 (75.125)	lr 0.02013
Train [35][3000/3239]	Time 0.349 (0.456)	Data Time 0.001 (0.010)	Loss 3.1116 (2.9931)	Entropy 0.70437 (0.71295)	Top-1 acc 51.562 (52.067)	Top-5 acc 72.656 (75.126)	lr 0.02013
Train [35][3010/3239]	Time 0.231 (0.456)	Data Time 0.001 (0.010)	Loss 2.9011 (2.9931)	Entropy 0.70400 (0.71293)	Top-1 acc 53.125 (52.067)	Top-5 acc 75.781 (75.125)	lr 0.02013
Train [35][3020/3239]	Time 0.235 (0.456)	Data Time 0.001 (0.010)	Loss 2.7502 (2.9931)	Entropy 0.70425 (0.71290)	Top-1 acc 57.422 (52.066)	Top-5 acc 80.859 (75.126)	lr 0.02013
Train [35][3030/3239]	Time 0.236 (0.456)	Data Time 0.001 (0.010)	Loss 3.1319 (2.9931)	Entropy 0.70453 (0.71287)	Top-1 acc 46.484 (52.067)	Top-5 acc 74.609 (75.125)	lr 0.02013
Train [35][3040/3239]	Time 0.233 (0.455)	Data Time 0.001 (0.010)	Loss 3.1697 (2.9929)	Entropy 0.70450 (0.71284)	Top-1 acc 50.000 (52.070)	Top-5 acc 73.047 (75.131)	lr 0.02013
Train [35][3050/3239]	Time 0.230 (0.455)	Data Time 0.001 (0.010)	Loss 2.9912 (2.9930)	Entropy 0.70419 (0.71281)	Top-1 acc 49.219 (52.066)	Top-5 acc 77.734 (75.128)	lr 0.02012
Train [35][3060/3239]	Time 0.229 (0.455)	Data Time 0.001 (0.010)	Loss 3.2414 (2.9930)	Entropy 0.70392 (0.71278)	Top-1 acc 50.000 (52.069)	Top-5 acc 71.094 (75.128)	lr 0.02012
Train [35][3070/3239]	Time 0.239 (0.455)	Data Time 0.001 (0.010)	Loss 2.9091 (2.9928)	Entropy 0.70350 (0.71276)	Top-1 acc 54.297 (52.075)	Top-5 acc 75.000 (75.132)	lr 0.02012
Train [35][3080/3239]	Time 0.232 (0.455)	Data Time 0.001 (0.010)	Loss 2.6871 (2.9927)	Entropy 0.70308 (0.71272)	Top-1 acc 59.766 (52.080)	Top-5 acc 81.641 (75.135)	lr 0.02012
Train [35][3090/3239]	Time 0.224 (0.455)	Data Time 0.001 (0.010)	Loss 3.0605 (2.9928)	Entropy 0.70318 (0.71269)	Top-1 acc 51.562 (52.081)	Top-5 acc 73.438 (75.134)	lr 0.02012
Train [35][3100/3239]	Time 0.233 (0.455)	Data Time 0.001 (0.010)	Loss 2.9034 (2.9927)	Entropy 0.70285 (0.71266)	Top-1 acc 53.906 (52.081)	Top-5 acc 77.344 (75.135)	lr 0.02012
Train [35][3110/3239]	Time 0.231 (0.454)	Data Time 0.001 (0.010)	Loss 2.7533 (2.9924)	Entropy 0.70256 (0.71263)	Top-1 acc 58.984 (52.088)	Top-5 acc 78.516 (75.142)	lr 0.02012
Train [35][3120/3239]	Time 0.233 (0.454)	Data Time 0.001 (0.010)	Loss 2.8912 (2.9923)	Entropy 0.70177 (0.71260)	Top-1 acc 49.219 (52.089)	Top-5 acc 77.344 (75.146)	lr 0.02012
Train [35][3130/3239]	Time 0.229 (0.463)	Data Time 0.002 (0.010)	Loss 2.9927 (2.9922)	Entropy 0.70170 (0.71256)	Top-1 acc 53.906 (52.087)	Top-5 acc 74.609 (75.148)	lr 0.02012
Train [35][3140/3239]	Time 0.237 (0.463)	Data Time 0.002 (0.010)	Loss 3.1397 (2.9923)	Entropy 0.70177 (0.71253)	Top-1 acc 49.609 (52.083)	Top-5 acc 75.000 (75.146)	lr 0.02012
Train [35][3150/3239]	Time 0.234 (0.463)	Data Time 0.002 (0.010)	Loss 3.0958 (2.9925)	Entropy 0.70171 (0.71249)	Top-1 acc 48.438 (52.080)	Top-5 acc 72.266 (75.143)	lr 0.02012
Train [35][3160/3239]	Time 0.350 (0.463)	Data Time 0.002 (0.010)	Loss 3.0036 (2.9928)	Entropy 0.70159 (0.71246)	Top-1 acc 51.172 (52.075)	Top-5 acc 75.391 (75.140)	lr 0.02012
Train [35][3170/3239]	Time 0.236 (0.463)	Data Time 0.001 (0.010)	Loss 2.7389 (2.9928)	Entropy 0.70186 (0.71243)	Top-1 acc 58.984 (52.080)	Top-5 acc 80.859 (75.137)	lr 0.02012
Train [35][3180/3239]	Time 0.225 (0.463)	Data Time 0.000 (0.010)	Loss 2.9315 (2.9928)	Entropy 0.70193 (0.71239)	Top-1 acc 53.125 (52.081)	Top-5 acc 76.562 (75.139)	lr 0.02011
Train [35][3190/3239]	Time 0.230 (0.462)	Data Time 0.000 (0.010)	Loss 3.0342 (2.9929)	Entropy 0.70174 (0.71236)	Top-1 acc 50.781 (52.075)	Top-5 acc 75.391 (75.137)	lr 0.02011
Train [35][3200/3239]	Time 0.238 (0.462)	Data Time 0.000 (0.010)	Loss 2.9034 (2.9928)	Entropy 0.70201 (0.71233)	Top-1 acc 54.688 (52.078)	Top-5 acc 75.391 (75.138)	lr 0.02011
Train [35][3210/3239]	Time 0.232 (0.462)	Data Time 0.000 (0.010)	Loss 2.9750 (2.9928)	Entropy 0.70177 (0.71229)	Top-1 acc 48.438 (52.080)	Top-5 acc 75.000 (75.135)	lr 0.02011
Train [35][3220/3239]	Time 0.233 (0.462)	Data Time 0.000 (0.010)	Loss 3.1791 (2.9928)	Entropy 0.70172 (0.71226)	Top-1 acc 44.531 (52.080)	Top-5 acc 71.094 (75.138)	lr 0.02011
Train [35][3230/3239]	Time 0.231 (0.462)	Data Time 0.000 (0.010)	Loss 3.0005 (2.9926)	Entropy 0.70152 (0.71223)	Top-1 acc 50.391 (52.087)	Top-5 acc 77.734 (75.142)	lr 0.02011
Train [35][3239/3239]	Time 0.946 (0.461)	Data Time 0.000 (0.010)	Loss 3.4338 (2.9927)	Entropy 0.70167 (0.71220)	Top-1 acc 39.506 (52.084)	Top-5 acc 66.667 (75.139)	lr 0.02011
==========Valid [35/120]	loss 1.703	top-1 acc 61.588 (61.588)	top-5 acc 83.184	Train top-1 52.084	top-5 75.139	Entropy 0.70167	Latency-None: 0.000ms	Flops: 539.76M
Train [36][0/3239]	Time 27.286 (27.286)	Data Time 25.922 (25.922)	Loss 2.9565 (2.9565)	Entropy 0.70164 (0.70164)	Top-1 acc 53.516 (53.516)	Top-5 acc 75.781 (75.781)	lr 0.02011
Train [36][10/3239]	Time 0.246 (2.943)	Data Time 0.001 (2.358)	Loss 2.8805 (2.9781)	Entropy 0.70172 (0.70170)	Top-1 acc 54.297 (53.089)	Top-5 acc 75.781 (74.893)	lr 0.02011
Train [36][20/3239]	Time 0.248 (1.751)	Data Time 0.001 (1.236)	Loss 2.7991 (2.9459)	Entropy 0.70167 (0.70167)	Top-1 acc 55.078 (53.311)	Top-5 acc 79.688 (75.744)	lr 0.02011
Train [36][30/3239]	Time 0.232 (1.318)	Data Time 0.001 (0.838)	Loss 2.8483 (2.9515)	Entropy 0.70149 (0.70163)	Top-1 acc 55.078 (53.163)	Top-5 acc 78.906 (76.084)	lr 0.02011
Train [36][40/3239]	Time 0.232 (1.116)	Data Time 0.001 (0.634)	Loss 3.0424 (2.9678)	Entropy 0.70134 (0.70161)	Top-1 acc 52.734 (52.887)	Top-5 acc 73.438 (75.781)	lr 0.02011
Train [36][50/3239]	Time 0.237 (0.990)	Data Time 0.001 (0.510)	Loss 2.9696 (2.9646)	Entropy 0.70163 (0.70157)	Top-1 acc 48.438 (52.788)	Top-5 acc 76.562 (75.957)	lr 0.02011
Train [36][60/3239]	Time 0.319 (0.896)	Data Time 0.001 (0.426)	Loss 2.9243 (2.9701)	Entropy 0.70147 (0.70157)	Top-1 acc 51.953 (52.517)	Top-5 acc 76.172 (75.884)	lr 0.02010
Train [36][70/3239]	Time 0.233 (0.827)	Data Time 0.001 (0.367)	Loss 2.9247 (2.9690)	Entropy 0.70159 (0.70157)	Top-1 acc 48.828 (52.448)	Top-5 acc 75.781 (75.825)	lr 0.02010
Train [36][80/3239]	Time 0.236 (0.774)	Data Time 0.001 (0.321)	Loss 2.7465 (2.9722)	Entropy 0.70187 (0.70158)	Top-1 acc 54.688 (52.387)	Top-5 acc 78.906 (75.815)	lr 0.02010
Train [36][90/3239]	Time 0.226 (0.734)	Data Time 0.001 (0.286)	Loss 3.1379 (2.9753)	Entropy 0.70224 (0.70164)	Top-1 acc 50.391 (52.434)	Top-5 acc 72.656 (75.725)	lr 0.02010
Train [36][100/3239]	Time 0.222 (0.702)	Data Time 0.001 (0.258)	Loss 2.7922 (2.9711)	Entropy 0.70245 (0.70171)	Top-1 acc 55.859 (52.468)	Top-5 acc 80.078 (75.890)	lr 0.02010
Train [36][110/3239]	Time 0.230 (0.677)	Data Time 0.001 (0.235)	Loss 3.0451 (2.9716)	Entropy 0.70244 (0.70177)	Top-1 acc 54.688 (52.509)	Top-5 acc 71.484 (75.883)	lr 0.02010
Train [36][120/3239]	Time 0.230 (0.654)	Data Time 0.001 (0.216)	Loss 2.9309 (2.9694)	Entropy 0.70230 (0.70182)	Top-1 acc 49.219 (52.479)	Top-5 acc 79.297 (75.920)	lr 0.02010
Train [36][130/3239]	Time 0.233 (0.636)	Data Time 0.001 (0.199)	Loss 2.8545 (2.9709)	Entropy 0.70217 (0.70186)	Top-1 acc 55.469 (52.502)	Top-5 acc 78.125 (75.844)	lr 0.02010
Train [36][140/3239]	Time 0.247 (0.620)	Data Time 0.001 (0.185)	Loss 3.0866 (2.9717)	Entropy 0.70171 (0.70187)	Top-1 acc 53.906 (52.524)	Top-5 acc 75.781 (75.773)	lr 0.02010
Train [36][150/3239]	Time 0.320 (0.606)	Data Time 0.001 (0.173)	Loss 2.7369 (2.9709)	Entropy 0.70193 (0.70187)	Top-1 acc 58.984 (52.540)	Top-5 acc 81.250 (75.797)	lr 0.02010
Train [36][160/3239]	Time 0.226 (0.593)	Data Time 0.001 (0.162)	Loss 2.9508 (2.9695)	Entropy 0.70201 (0.70188)	Top-1 acc 55.469 (52.615)	Top-5 acc 72.656 (75.796)	lr 0.02010
Train [36][170/3239]	Time 0.224 (0.582)	Data Time 0.001 (0.153)	Loss 3.0652 (2.9712)	Entropy 0.70179 (0.70188)	Top-1 acc 48.828 (52.586)	Top-5 acc 76.172 (75.729)	lr 0.02010
Train [36][180/3239]	Time 0.223 (0.572)	Data Time 0.001 (0.145)	Loss 2.9261 (2.9729)	Entropy 0.70119 (0.70187)	Top-1 acc 52.344 (52.488)	Top-5 acc 76.172 (75.691)	lr 0.02010
Train [36][190/3239]	Time 0.234 (0.563)	Data Time 0.001 (0.137)	Loss 2.9500 (2.9749)	Entropy 0.70121 (0.70183)	Top-1 acc 57.031 (52.493)	Top-5 acc 75.000 (75.659)	lr 0.02009
Train [36][200/3239]	Time 0.221 (0.555)	Data Time 0.001 (0.130)	Loss 3.2384 (2.9783)	Entropy 0.70133 (0.70181)	Top-1 acc 46.875 (52.420)	Top-5 acc 68.750 (75.618)	lr 0.02009
Train [36][210/3239]	Time 0.227 (0.548)	Data Time 0.001 (0.124)	Loss 2.7715 (2.9761)	Entropy 0.70149 (0.70179)	Top-1 acc 54.688 (52.488)	Top-5 acc 81.250 (75.665)	lr 0.02009
Train [36][220/3239]	Time 0.338 (0.542)	Data Time 0.001 (0.119)	Loss 3.2482 (2.9768)	Entropy 0.70148 (0.70177)	Top-1 acc 45.703 (52.478)	Top-5 acc 67.578 (75.619)	lr 0.02009
Train [36][230/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.114)	Loss 3.0950 (2.9787)	Entropy 0.70136 (0.70176)	Top-1 acc 50.391 (52.486)	Top-5 acc 73.438 (75.565)	lr 0.02009
Train [36][240/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.109)	Loss 2.8478 (2.9764)	Entropy 0.70133 (0.70175)	Top-1 acc 53.125 (52.532)	Top-5 acc 80.078 (75.593)	lr 0.02009
Train [36][250/3239]	Time 0.225 (0.525)	Data Time 0.001 (0.105)	Loss 3.3654 (2.9750)	Entropy 0.70168 (0.70174)	Top-1 acc 42.969 (52.566)	Top-5 acc 67.969 (75.609)	lr 0.02009
Train [36][260/3239]	Time 0.227 (0.520)	Data Time 0.001 (0.101)	Loss 3.0205 (2.9732)	Entropy 0.70184 (0.70174)	Top-1 acc 51.172 (52.624)	Top-5 acc 76.562 (75.629)	lr 0.02009
Train [36][270/3239]	Time 0.230 (0.516)	Data Time 0.001 (0.097)	Loss 3.0328 (2.9746)	Entropy 0.70185 (0.70174)	Top-1 acc 52.734 (52.537)	Top-5 acc 71.875 (75.608)	lr 0.02009
Train [36][280/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.094)	Loss 3.0609 (2.9722)	Entropy 0.70186 (0.70175)	Top-1 acc 50.781 (52.595)	Top-5 acc 72.656 (75.635)	lr 0.02009
Train [36][290/3239]	Time 0.236 (0.508)	Data Time 0.001 (0.091)	Loss 2.8578 (2.9722)	Entropy 0.70170 (0.70175)	Top-1 acc 55.859 (52.575)	Top-5 acc 76.953 (75.640)	lr 0.02009
Train [36][300/3239]	Time 0.222 (0.504)	Data Time 0.001 (0.088)	Loss 2.7863 (2.9717)	Entropy 0.70184 (0.70175)	Top-1 acc 57.422 (52.583)	Top-5 acc 76.562 (75.646)	lr 0.02009
Train [36][310/3239]	Time 0.239 (0.501)	Data Time 0.001 (0.085)	Loss 2.7991 (2.9719)	Entropy 0.70147 (0.70175)	Top-1 acc 53.125 (52.548)	Top-5 acc 78.516 (75.651)	lr 0.02008
Train [36][320/3239]	Time 0.225 (0.497)	Data Time 0.002 (0.082)	Loss 3.2880 (2.9732)	Entropy 0.70116 (0.70174)	Top-1 acc 45.312 (52.532)	Top-5 acc 67.188 (75.600)	lr 0.02008
Train [36][330/3239]	Time 0.234 (0.494)	Data Time 0.001 (0.080)	Loss 3.1427 (2.9731)	Entropy 0.70112 (0.70172)	Top-1 acc 51.172 (52.547)	Top-5 acc 71.484 (75.594)	lr 0.02008
Train [36][340/3239]	Time 0.236 (0.492)	Data Time 0.001 (0.077)	Loss 2.8571 (2.9739)	Entropy 0.70163 (0.70171)	Top-1 acc 53.516 (52.505)	Top-5 acc 78.906 (75.573)	lr 0.02008
Train [36][350/3239]	Time 0.232 (0.489)	Data Time 0.001 (0.075)	Loss 3.1962 (2.9754)	Entropy 0.70168 (0.70170)	Top-1 acc 48.828 (52.486)	Top-5 acc 68.750 (75.553)	lr 0.02008
Train [36][360/3239]	Time 0.236 (0.487)	Data Time 0.001 (0.073)	Loss 2.8766 (2.9744)	Entropy 0.70177 (0.70170)	Top-1 acc 57.812 (52.515)	Top-5 acc 78.516 (75.561)	lr 0.02008
Train [36][370/3239]	Time 0.213 (0.484)	Data Time 0.001 (0.071)	Loss 3.1254 (2.9747)	Entropy 0.70178 (0.70170)	Top-1 acc 48.828 (52.496)	Top-5 acc 73.047 (75.568)	lr 0.02008
Train [36][380/3239]	Time 0.317 (0.482)	Data Time 0.001 (0.070)	Loss 2.9748 (2.9747)	Entropy 0.70193 (0.70171)	Top-1 acc 51.562 (52.491)	Top-5 acc 74.609 (75.573)	lr 0.02008
Train [36][390/3239]	Time 0.230 (0.480)	Data Time 0.001 (0.068)	Loss 2.8088 (2.9755)	Entropy 0.70185 (0.70171)	Top-1 acc 58.203 (52.489)	Top-5 acc 81.250 (75.579)	lr 0.02008
Train [36][400/3239]	Time 0.232 (0.477)	Data Time 0.001 (0.066)	Loss 2.7668 (2.9758)	Entropy 0.70192 (0.70172)	Top-1 acc 55.859 (52.476)	Top-5 acc 80.859 (75.568)	lr 0.02008
Train [36][410/3239]	Time 0.231 (0.476)	Data Time 0.001 (0.065)	Loss 2.9493 (2.9764)	Entropy 0.70184 (0.70172)	Top-1 acc 48.828 (52.450)	Top-5 acc 75.000 (75.565)	lr 0.02008
Train [36][420/3239]	Time 0.214 (0.474)	Data Time 0.001 (0.063)	Loss 3.1651 (2.9774)	Entropy 0.70208 (0.70173)	Top-1 acc 48.828 (52.444)	Top-5 acc 74.609 (75.534)	lr 0.02008
Train [36][430/3239]	Time 0.240 (0.472)	Data Time 0.001 (0.062)	Loss 2.8139 (2.9763)	Entropy 0.70222 (0.70174)	Top-1 acc 56.641 (52.454)	Top-5 acc 78.125 (75.563)	lr 0.02008
Train [36][440/3239]	Time 0.228 (0.471)	Data Time 0.001 (0.060)	Loss 2.9448 (2.9742)	Entropy 0.70171 (0.70175)	Top-1 acc 55.078 (52.522)	Top-5 acc 76.562 (75.608)	lr 0.02007
Train [36][450/3239]	Time 0.318 (0.469)	Data Time 0.001 (0.059)	Loss 2.8678 (2.9731)	Entropy 0.70134 (0.70174)	Top-1 acc 56.250 (52.567)	Top-5 acc 78.906 (75.626)	lr 0.02007
Train [36][460/3239]	Time 0.246 (0.468)	Data Time 0.001 (0.058)	Loss 3.1081 (2.9745)	Entropy 0.70096 (0.70173)	Top-1 acc 50.000 (52.535)	Top-5 acc 70.312 (75.597)	lr 0.02007
Train [36][470/3239]	Time 0.237 (0.466)	Data Time 0.001 (0.056)	Loss 3.1949 (2.9748)	Entropy 0.70109 (0.70172)	Top-1 acc 48.438 (52.543)	Top-5 acc 70.312 (75.571)	lr 0.02007
Train [36][480/3239]	Time 0.228 (0.465)	Data Time 0.001 (0.055)	Loss 3.1031 (2.9754)	Entropy 0.70105 (0.70170)	Top-1 acc 53.125 (52.535)	Top-5 acc 75.391 (75.592)	lr 0.02007
Train [36][490/3239]	Time 0.226 (0.464)	Data Time 0.001 (0.054)	Loss 3.0059 (2.9752)	Entropy 0.70143 (0.70169)	Top-1 acc 51.953 (52.567)	Top-5 acc 75.391 (75.593)	lr 0.02007
Train [36][500/3239]	Time 0.261 (0.463)	Data Time 0.001 (0.053)	Loss 2.9590 (2.9746)	Entropy 0.70165 (0.70169)	Top-1 acc 52.344 (52.585)	Top-5 acc 76.172 (75.613)	lr 0.02007
Train [36][510/3239]	Time 0.223 (0.461)	Data Time 0.001 (0.052)	Loss 3.1061 (2.9748)	Entropy 0.70168 (0.70169)	Top-1 acc 49.219 (52.591)	Top-5 acc 75.391 (75.610)	lr 0.02007
Train [36][520/3239]	Time 0.263 (0.460)	Data Time 0.001 (0.051)	Loss 2.9994 (2.9749)	Entropy 0.70193 (0.70169)	Top-1 acc 50.000 (52.572)	Top-5 acc 75.781 (75.602)	lr 0.02007
Train [36][530/3239]	Time 0.220 (0.459)	Data Time 0.001 (0.050)	Loss 3.0064 (2.9755)	Entropy 0.70195 (0.70170)	Top-1 acc 50.000 (52.577)	Top-5 acc 73.438 (75.594)	lr 0.02007
Train [36][540/3239]	Time 0.642 (0.506)	Data Time 0.005 (0.049)	Loss 2.9123 (2.9756)	Entropy 0.70175 (0.70170)	Top-1 acc 51.562 (52.574)	Top-5 acc 78.125 (75.587)	lr 0.02007
Train [36][550/3239]	Time 0.242 (0.508)	Data Time 0.002 (0.049)	Loss 2.8549 (2.9759)	Entropy 0.70175 (0.70170)	Top-1 acc 56.641 (52.571)	Top-5 acc 76.953 (75.581)	lr 0.02007
Train [36][560/3239]	Time 0.230 (0.506)	Data Time 0.001 (0.048)	Loss 2.8097 (2.9749)	Entropy 0.70168 (0.70170)	Top-1 acc 56.250 (52.592)	Top-5 acc 78.125 (75.591)	lr 0.02006
Train [36][570/3239]	Time 0.239 (0.505)	Data Time 0.001 (0.047)	Loss 3.0347 (2.9753)	Entropy 0.70138 (0.70170)	Top-1 acc 50.391 (52.591)	Top-5 acc 75.391 (75.584)	lr 0.02006
Train [36][580/3239]	Time 0.233 (0.503)	Data Time 0.001 (0.046)	Loss 2.9075 (2.9769)	Entropy 0.70179 (0.70170)	Top-1 acc 54.297 (52.553)	Top-5 acc 78.906 (75.571)	lr 0.02006
Train [36][590/3239]	Time 0.224 (0.502)	Data Time 0.001 (0.045)	Loss 3.0432 (2.9778)	Entropy 0.70159 (0.70170)	Top-1 acc 49.609 (52.541)	Top-5 acc 73.828 (75.554)	lr 0.02006
Train [36][600/3239]	Time 0.234 (0.501)	Data Time 0.001 (0.045)	Loss 2.9629 (2.9772)	Entropy 0.70153 (0.70169)	Top-1 acc 53.125 (52.573)	Top-5 acc 75.000 (75.549)	lr 0.02006
Train [36][610/3239]	Time 0.345 (0.500)	Data Time 0.001 (0.044)	Loss 2.8168 (2.9777)	Entropy 0.70204 (0.70170)	Top-1 acc 57.422 (52.559)	Top-5 acc 80.469 (75.538)	lr 0.02006
Train [36][620/3239]	Time 0.228 (0.499)	Data Time 0.001 (0.043)	Loss 2.9012 (2.9780)	Entropy 0.70228 (0.70170)	Top-1 acc 58.203 (52.553)	Top-5 acc 76.953 (75.523)	lr 0.02006
Train [36][630/3239]	Time 0.230 (0.497)	Data Time 0.001 (0.043)	Loss 3.0821 (2.9784)	Entropy 0.70227 (0.70171)	Top-1 acc 50.391 (52.555)	Top-5 acc 73.438 (75.505)	lr 0.02006
Train [36][640/3239]	Time 0.225 (0.496)	Data Time 0.001 (0.042)	Loss 3.2194 (2.9782)	Entropy 0.70221 (0.70172)	Top-1 acc 49.609 (52.559)	Top-5 acc 71.484 (75.513)	lr 0.02006
Train [36][650/3239]	Time 0.228 (0.495)	Data Time 0.001 (0.041)	Loss 2.9129 (2.9782)	Entropy 0.70205 (0.70172)	Top-1 acc 55.859 (52.566)	Top-5 acc 77.344 (75.525)	lr 0.02006
Train [36][660/3239]	Time 0.244 (0.493)	Data Time 0.001 (0.041)	Loss 2.9538 (2.9778)	Entropy 0.70213 (0.70173)	Top-1 acc 50.000 (52.562)	Top-5 acc 75.000 (75.534)	lr 0.02006
Train [36][670/3239]	Time 0.234 (0.492)	Data Time 0.001 (0.040)	Loss 2.7839 (2.9769)	Entropy 0.70221 (0.70174)	Top-1 acc 56.250 (52.595)	Top-5 acc 78.906 (75.541)	lr 0.02006
Train [36][680/3239]	Time 0.228 (0.491)	Data Time 0.001 (0.040)	Loss 3.1552 (2.9769)	Entropy 0.70187 (0.70174)	Top-1 acc 51.172 (52.608)	Top-5 acc 72.266 (75.531)	lr 0.02005
Train [36][690/3239]	Time 0.239 (0.490)	Data Time 0.001 (0.039)	Loss 3.0974 (2.9770)	Entropy 0.70140 (0.70174)	Top-1 acc 48.828 (52.596)	Top-5 acc 71.875 (75.524)	lr 0.02005
Train [36][700/3239]	Time 0.318 (0.489)	Data Time 0.001 (0.039)	Loss 2.9113 (2.9771)	Entropy 0.70118 (0.70173)	Top-1 acc 51.172 (52.597)	Top-5 acc 75.391 (75.523)	lr 0.02005
Train [36][710/3239]	Time 0.230 (0.488)	Data Time 0.001 (0.038)	Loss 3.0107 (2.9765)	Entropy 0.70126 (0.70172)	Top-1 acc 50.000 (52.614)	Top-5 acc 76.172 (75.537)	lr 0.02005
Train [36][720/3239]	Time 0.239 (0.487)	Data Time 0.001 (0.038)	Loss 3.0717 (2.9761)	Entropy 0.70108 (0.70172)	Top-1 acc 51.953 (52.623)	Top-5 acc 73.438 (75.540)	lr 0.02005
Train [36][730/3239]	Time 0.225 (0.486)	Data Time 0.001 (0.037)	Loss 3.0736 (2.9760)	Entropy 0.70113 (0.70171)	Top-1 acc 50.000 (52.623)	Top-5 acc 74.219 (75.543)	lr 0.02005
Train [36][740/3239]	Time 0.231 (0.485)	Data Time 0.001 (0.037)	Loss 3.0639 (2.9762)	Entropy 0.70129 (0.70170)	Top-1 acc 53.516 (52.616)	Top-5 acc 74.609 (75.531)	lr 0.02005
Train [36][750/3239]	Time 0.227 (0.484)	Data Time 0.001 (0.036)	Loss 3.1948 (2.9771)	Entropy 0.70120 (0.70169)	Top-1 acc 48.047 (52.605)	Top-5 acc 69.922 (75.506)	lr 0.02005
Train [36][760/3239]	Time 0.218 (0.483)	Data Time 0.001 (0.036)	Loss 2.9128 (2.9768)	Entropy 0.70103 (0.70169)	Top-1 acc 52.734 (52.606)	Top-5 acc 77.734 (75.518)	lr 0.02005
Train [36][770/3239]	Time 0.321 (0.482)	Data Time 0.001 (0.035)	Loss 2.8619 (2.9776)	Entropy 0.70069 (0.70168)	Top-1 acc 57.031 (52.586)	Top-5 acc 78.125 (75.497)	lr 0.02005
Train [36][780/3239]	Time 0.238 (0.481)	Data Time 0.001 (0.035)	Loss 2.7493 (2.9765)	Entropy 0.70060 (0.70166)	Top-1 acc 56.250 (52.605)	Top-5 acc 80.859 (75.511)	lr 0.02005
Train [36][790/3239]	Time 0.229 (0.480)	Data Time 0.001 (0.034)	Loss 2.9860 (2.9769)	Entropy 0.70049 (0.70165)	Top-1 acc 46.875 (52.584)	Top-5 acc 75.391 (75.502)	lr 0.02005
Train [36][800/3239]	Time 0.232 (0.479)	Data Time 0.001 (0.034)	Loss 3.1245 (2.9774)	Entropy 0.70025 (0.70163)	Top-1 acc 49.219 (52.583)	Top-5 acc 71.484 (75.486)	lr 0.02005
Train [36][810/3239]	Time 0.234 (0.478)	Data Time 0.001 (0.034)	Loss 3.0891 (2.9768)	Entropy 0.69999 (0.70161)	Top-1 acc 49.219 (52.608)	Top-5 acc 71.875 (75.498)	lr 0.02004
Train [36][820/3239]	Time 0.223 (0.477)	Data Time 0.001 (0.033)	Loss 2.7727 (2.9761)	Entropy 0.70012 (0.70160)	Top-1 acc 56.641 (52.623)	Top-5 acc 77.344 (75.514)	lr 0.02004
Train [36][830/3239]	Time 0.229 (0.477)	Data Time 0.001 (0.033)	Loss 2.9844 (2.9760)	Entropy 0.69963 (0.70158)	Top-1 acc 50.391 (52.619)	Top-5 acc 72.656 (75.514)	lr 0.02004
Train [36][840/3239]	Time 0.231 (0.476)	Data Time 0.001 (0.032)	Loss 3.0262 (2.9756)	Entropy 0.69955 (0.70155)	Top-1 acc 50.391 (52.626)	Top-5 acc 73.828 (75.510)	lr 0.02004
Train [36][850/3239]	Time 0.235 (0.475)	Data Time 0.001 (0.032)	Loss 3.0530 (2.9753)	Entropy 0.69948 (0.70153)	Top-1 acc 51.562 (52.618)	Top-5 acc 72.656 (75.517)	lr 0.02004
Train [36][860/3239]	Time 0.272 (0.475)	Data Time 0.001 (0.032)	Loss 3.2290 (2.9758)	Entropy 0.69933 (0.70150)	Top-1 acc 47.656 (52.606)	Top-5 acc 70.703 (75.507)	lr 0.02004
Train [36][870/3239]	Time 0.236 (0.474)	Data Time 0.001 (0.031)	Loss 2.9980 (2.9764)	Entropy 0.69938 (0.70148)	Top-1 acc 49.609 (52.581)	Top-5 acc 74.609 (75.487)	lr 0.02004
Train [36][880/3239]	Time 0.230 (0.473)	Data Time 0.001 (0.031)	Loss 3.1715 (2.9766)	Entropy 0.69946 (0.70145)	Top-1 acc 50.000 (52.578)	Top-5 acc 71.484 (75.490)	lr 0.02004
Train [36][890/3239]	Time 0.231 (0.472)	Data Time 0.001 (0.031)	Loss 3.0400 (2.9762)	Entropy 0.69969 (0.70143)	Top-1 acc 50.781 (52.587)	Top-5 acc 73.047 (75.490)	lr 0.02004
Train [36][900/3239]	Time 0.234 (0.471)	Data Time 0.001 (0.030)	Loss 3.2295 (2.9764)	Entropy 0.69988 (0.70141)	Top-1 acc 43.359 (52.565)	Top-5 acc 68.750 (75.490)	lr 0.02004
Train [36][910/3239]	Time 0.221 (0.471)	Data Time 0.001 (0.030)	Loss 3.0889 (2.9764)	Entropy 0.70013 (0.70140)	Top-1 acc 53.125 (52.580)	Top-5 acc 71.484 (75.484)	lr 0.02004
Train [36][920/3239]	Time 0.224 (0.470)	Data Time 0.001 (0.030)	Loss 2.7776 (2.9764)	Entropy 0.70040 (0.70138)	Top-1 acc 53.516 (52.573)	Top-5 acc 80.859 (75.484)	lr 0.02004
Train [36][930/3239]	Time 0.323 (0.469)	Data Time 0.001 (0.029)	Loss 2.8993 (2.9755)	Entropy 0.70078 (0.70137)	Top-1 acc 53.125 (52.596)	Top-5 acc 77.734 (75.501)	lr 0.02003
Train [36][940/3239]	Time 0.229 (0.468)	Data Time 0.001 (0.029)	Loss 2.7173 (2.9757)	Entropy 0.70081 (0.70137)	Top-1 acc 59.766 (52.588)	Top-5 acc 82.422 (75.494)	lr 0.02003
Train [36][950/3239]	Time 0.232 (0.467)	Data Time 0.001 (0.029)	Loss 2.7077 (2.9758)	Entropy 0.70074 (0.70136)	Top-1 acc 60.547 (52.596)	Top-5 acc 79.688 (75.496)	lr 0.02003
Train [36][960/3239]	Time 0.227 (0.467)	Data Time 0.001 (0.029)	Loss 2.7954 (2.9758)	Entropy 0.70068 (0.70135)	Top-1 acc 55.859 (52.592)	Top-5 acc 77.734 (75.494)	lr 0.02003
Train [36][970/3239]	Time 0.233 (0.466)	Data Time 0.001 (0.028)	Loss 2.9900 (2.9758)	Entropy 0.70076 (0.70135)	Top-1 acc 55.469 (52.600)	Top-5 acc 73.438 (75.485)	lr 0.02003
Train [36][980/3239]	Time 0.233 (0.465)	Data Time 0.001 (0.028)	Loss 3.0000 (2.9761)	Entropy 0.70063 (0.70134)	Top-1 acc 53.906 (52.601)	Top-5 acc 75.781 (75.478)	lr 0.02003
Train [36][990/3239]	Time 0.225 (0.465)	Data Time 0.001 (0.028)	Loss 2.9911 (2.9762)	Entropy 0.70059 (0.70133)	Top-1 acc 55.078 (52.593)	Top-5 acc 75.391 (75.473)	lr 0.02003
Train [36][1000/3239]	Time 0.333 (0.464)	Data Time 0.001 (0.027)	Loss 2.9129 (2.9772)	Entropy 0.70059 (0.70133)	Top-1 acc 50.781 (52.560)	Top-5 acc 77.734 (75.454)	lr 0.02003
Train [36][1010/3239]	Time 0.233 (0.463)	Data Time 0.001 (0.027)	Loss 2.9279 (2.9773)	Entropy 0.70062 (0.70132)	Top-1 acc 56.641 (52.569)	Top-5 acc 73.828 (75.447)	lr 0.02003
Train [36][1020/3239]	Time 0.229 (0.463)	Data Time 0.001 (0.027)	Loss 3.1346 (2.9777)	Entropy 0.70040 (0.70131)	Top-1 acc 51.172 (52.563)	Top-5 acc 71.875 (75.431)	lr 0.02003
Train [36][1030/3239]	Time 0.231 (0.462)	Data Time 0.001 (0.027)	Loss 2.9863 (2.9774)	Entropy 0.70070 (0.70131)	Top-1 acc 50.781 (52.566)	Top-5 acc 74.219 (75.441)	lr 0.02003
Train [36][1040/3239]	Time 0.234 (0.462)	Data Time 0.001 (0.026)	Loss 3.0731 (2.9774)	Entropy 0.70069 (0.70130)	Top-1 acc 50.391 (52.567)	Top-5 acc 74.609 (75.446)	lr 0.02003
Train [36][1050/3239]	Time 0.226 (0.461)	Data Time 0.001 (0.026)	Loss 3.2253 (2.9776)	Entropy 0.70048 (0.70129)	Top-1 acc 49.219 (52.560)	Top-5 acc 68.359 (75.436)	lr 0.02003
Train [36][1060/3239]	Time 0.226 (0.460)	Data Time 0.001 (0.026)	Loss 2.8499 (2.9775)	Entropy 0.69991 (0.70128)	Top-1 acc 52.344 (52.560)	Top-5 acc 77.344 (75.438)	lr 0.02002
Train [36][1070/3239]	Time 0.219 (0.460)	Data Time 0.001 (0.026)	Loss 2.9345 (2.9774)	Entropy 0.69995 (0.70127)	Top-1 acc 47.656 (52.563)	Top-5 acc 73.438 (75.438)	lr 0.02002
Train [36][1080/3239]	Time 0.231 (0.459)	Data Time 0.001 (0.026)	Loss 2.8951 (2.9770)	Entropy 0.70028 (0.70126)	Top-1 acc 54.688 (52.571)	Top-5 acc 76.953 (75.444)	lr 0.02002
Train [36][1090/3239]	Time 0.319 (0.459)	Data Time 0.001 (0.025)	Loss 2.9144 (2.9767)	Entropy 0.70020 (0.70125)	Top-1 acc 53.906 (52.575)	Top-5 acc 78.125 (75.451)	lr 0.02002
Train [36][1100/3239]	Time 0.236 (0.458)	Data Time 0.001 (0.025)	Loss 2.9337 (2.9763)	Entropy 0.70025 (0.70124)	Top-1 acc 51.172 (52.585)	Top-5 acc 76.953 (75.457)	lr 0.02002
Train [36][1110/3239]	Time 0.218 (0.458)	Data Time 0.001 (0.025)	Loss 3.0750 (2.9770)	Entropy 0.70028 (0.70123)	Top-1 acc 52.734 (52.568)	Top-5 acc 71.094 (75.439)	lr 0.02002
Train [36][1120/3239]	Time 0.224 (0.457)	Data Time 0.001 (0.025)	Loss 2.8546 (2.9770)	Entropy 0.70023 (0.70122)	Top-1 acc 56.250 (52.571)	Top-5 acc 78.125 (75.436)	lr 0.02002
Train [36][1130/3239]	Time 0.233 (0.457)	Data Time 0.001 (0.024)	Loss 3.0601 (2.9767)	Entropy 0.70039 (0.70122)	Top-1 acc 52.734 (52.569)	Top-5 acc 72.656 (75.432)	lr 0.02002
Train [36][1140/3239]	Time 0.231 (0.456)	Data Time 0.001 (0.024)	Loss 3.0509 (2.9768)	Entropy 0.70047 (0.70121)	Top-1 acc 50.781 (52.555)	Top-5 acc 73.047 (75.427)	lr 0.02002
Train [36][1150/3239]	Time 0.234 (0.456)	Data Time 0.001 (0.024)	Loss 2.9794 (2.9773)	Entropy 0.70013 (0.70120)	Top-1 acc 48.828 (52.529)	Top-5 acc 74.219 (75.418)	lr 0.02002
Train [36][1160/3239]	Time 0.327 (0.455)	Data Time 0.001 (0.024)	Loss 2.9719 (2.9776)	Entropy 0.70042 (0.70119)	Top-1 acc 50.781 (52.524)	Top-5 acc 75.391 (75.416)	lr 0.02002
Train [36][1170/3239]	Time 0.228 (0.455)	Data Time 0.001 (0.024)	Loss 3.0173 (2.9773)	Entropy 0.70002 (0.70119)	Top-1 acc 51.562 (52.534)	Top-5 acc 75.781 (75.429)	lr 0.02002
Train [36][1180/3239]	Time 0.223 (0.454)	Data Time 0.001 (0.024)	Loss 3.1535 (2.9777)	Entropy 0.69988 (0.70118)	Top-1 acc 51.953 (52.532)	Top-5 acc 73.828 (75.416)	lr 0.02001
Train [36][1190/3239]	Time 0.236 (0.454)	Data Time 0.001 (0.023)	Loss 2.8415 (2.9777)	Entropy 0.69952 (0.70117)	Top-1 acc 54.688 (52.528)	Top-5 acc 77.344 (75.407)	lr 0.02001
Train [36][1200/3239]	Time 0.269 (0.477)	Data Time 0.004 (0.023)	Loss 3.1578 (2.9780)	Entropy 0.69978 (0.70115)	Top-1 acc 47.656 (52.521)	Top-5 acc 70.312 (75.407)	lr 0.02001
Train [36][1210/3239]	Time 0.237 (0.477)	Data Time 0.002 (0.023)	Loss 3.0195 (2.9784)	Entropy 0.69998 (0.70114)	Top-1 acc 51.562 (52.517)	Top-5 acc 75.391 (75.397)	lr 0.02001
Train [36][1220/3239]	Time 0.260 (0.476)	Data Time 0.001 (0.023)	Loss 2.8183 (2.9790)	Entropy 0.69930 (0.70113)	Top-1 acc 59.375 (52.489)	Top-5 acc 78.906 (75.384)	lr 0.02001
Train [36][1230/3239]	Time 0.271 (0.476)	Data Time 0.001 (0.023)	Loss 2.8612 (2.9784)	Entropy 0.69917 (0.70112)	Top-1 acc 52.734 (52.501)	Top-5 acc 77.344 (75.395)	lr 0.02001
Train [36][1240/3239]	Time 0.250 (0.476)	Data Time 0.001 (0.023)	Loss 2.8515 (2.9777)	Entropy 0.69900 (0.70110)	Top-1 acc 57.812 (52.523)	Top-5 acc 78.516 (75.408)	lr 0.02001
Train [36][1250/3239]	Time 0.346 (0.476)	Data Time 0.001 (0.022)	Loss 2.8960 (2.9777)	Entropy 0.69923 (0.70108)	Top-1 acc 53.906 (52.526)	Top-5 acc 76.172 (75.400)	lr 0.02001
Train [36][1260/3239]	Time 0.232 (0.475)	Data Time 0.001 (0.022)	Loss 2.7973 (2.9776)	Entropy 0.69910 (0.70107)	Top-1 acc 56.250 (52.531)	Top-5 acc 77.734 (75.402)	lr 0.02001
Train [36][1270/3239]	Time 0.231 (0.475)	Data Time 0.001 (0.022)	Loss 2.9835 (2.9775)	Entropy 0.69886 (0.70105)	Top-1 acc 55.078 (52.528)	Top-5 acc 76.172 (75.406)	lr 0.02001
Train [36][1280/3239]	Time 0.225 (0.475)	Data Time 0.001 (0.022)	Loss 2.9537 (2.9774)	Entropy 0.69855 (0.70104)	Top-1 acc 53.906 (52.527)	Top-5 acc 76.953 (75.409)	lr 0.02001
Train [36][1290/3239]	Time 0.232 (0.474)	Data Time 0.001 (0.022)	Loss 3.0869 (2.9768)	Entropy 0.69825 (0.70102)	Top-1 acc 47.656 (52.544)	Top-5 acc 70.703 (75.418)	lr 0.02001
Train [36][1300/3239]	Time 0.244 (0.474)	Data Time 0.001 (0.022)	Loss 2.8561 (2.9764)	Entropy 0.69818 (0.70099)	Top-1 acc 52.734 (52.552)	Top-5 acc 78.906 (75.424)	lr 0.02000
Train [36][1310/3239]	Time 0.239 (0.474)	Data Time 0.001 (0.021)	Loss 2.8930 (2.9762)	Entropy 0.69820 (0.70097)	Top-1 acc 53.516 (52.551)	Top-5 acc 80.078 (75.437)	lr 0.02000
Train [36][1320/3239]	Time 0.346 (0.473)	Data Time 0.001 (0.021)	Loss 2.9777 (2.9760)	Entropy 0.69827 (0.70095)	Top-1 acc 50.000 (52.545)	Top-5 acc 73.828 (75.441)	lr 0.02000
Train [36][1330/3239]	Time 0.231 (0.473)	Data Time 0.001 (0.021)	Loss 3.2318 (2.9761)	Entropy 0.69804 (0.70093)	Top-1 acc 48.438 (52.531)	Top-5 acc 72.656 (75.442)	lr 0.02000
Train [36][1340/3239]	Time 0.233 (0.473)	Data Time 0.001 (0.021)	Loss 3.1250 (2.9762)	Entropy 0.69773 (0.70091)	Top-1 acc 49.609 (52.526)	Top-5 acc 70.703 (75.439)	lr 0.02000
Train [36][1350/3239]	Time 0.238 (0.472)	Data Time 0.003 (0.021)	Loss 2.8204 (2.9761)	Entropy 0.69771 (0.70088)	Top-1 acc 57.812 (52.527)	Top-5 acc 77.344 (75.440)	lr 0.02000
Train [36][1360/3239]	Time 0.227 (0.472)	Data Time 0.001 (0.021)	Loss 2.9575 (2.9761)	Entropy 0.69754 (0.70086)	Top-1 acc 52.344 (52.531)	Top-5 acc 76.562 (75.445)	lr 0.02000
Train [36][1370/3239]	Time 0.287 (0.472)	Data Time 0.001 (0.021)	Loss 3.2084 (2.9766)	Entropy 0.69773 (0.70084)	Top-1 acc 50.391 (52.523)	Top-5 acc 71.875 (75.437)	lr 0.02000
Train [36][1380/3239]	Time 0.233 (0.471)	Data Time 0.001 (0.020)	Loss 2.6952 (2.9768)	Entropy 0.69741 (0.70081)	Top-1 acc 58.594 (52.517)	Top-5 acc 79.688 (75.432)	lr 0.02000
Train [36][1390/3239]	Time 0.235 (0.471)	Data Time 0.001 (0.020)	Loss 2.9388 (2.9764)	Entropy 0.69726 (0.70079)	Top-1 acc 54.297 (52.527)	Top-5 acc 75.781 (75.442)	lr 0.02000
Train [36][1400/3239]	Time 0.230 (0.471)	Data Time 0.001 (0.020)	Loss 2.9079 (2.9762)	Entropy 0.69748 (0.70076)	Top-1 acc 52.734 (52.529)	Top-5 acc 76.172 (75.449)	lr 0.02000
Train [36][1410/3239]	Time 0.250 (0.470)	Data Time 0.001 (0.020)	Loss 2.8079 (2.9760)	Entropy 0.69759 (0.70074)	Top-1 acc 57.422 (52.539)	Top-5 acc 75.781 (75.450)	lr 0.02000
Train [36][1420/3239]	Time 0.257 (0.470)	Data Time 0.001 (0.020)	Loss 2.9998 (2.9760)	Entropy 0.69799 (0.70072)	Top-1 acc 50.000 (52.533)	Top-5 acc 74.609 (75.451)	lr 0.02000
Train [36][1430/3239]	Time 0.233 (0.470)	Data Time 0.001 (0.020)	Loss 2.9631 (2.9759)	Entropy 0.69799 (0.70070)	Top-1 acc 53.906 (52.539)	Top-5 acc 76.562 (75.456)	lr 0.01999
Train [36][1440/3239]	Time 0.264 (0.469)	Data Time 0.001 (0.020)	Loss 3.0578 (2.9758)	Entropy 0.69802 (0.70068)	Top-1 acc 49.219 (52.545)	Top-5 acc 76.953 (75.459)	lr 0.01999
Train [36][1450/3239]	Time 0.237 (0.469)	Data Time 0.001 (0.020)	Loss 2.8770 (2.9757)	Entropy 0.69798 (0.70066)	Top-1 acc 55.078 (52.550)	Top-5 acc 76.953 (75.462)	lr 0.01999
Train [36][1460/3239]	Time 0.233 (0.469)	Data Time 0.001 (0.019)	Loss 2.9620 (2.9756)	Entropy 0.69773 (0.70064)	Top-1 acc 51.953 (52.553)	Top-5 acc 79.297 (75.466)	lr 0.01999
Train [36][1470/3239]	Time 0.244 (0.468)	Data Time 0.001 (0.019)	Loss 2.9482 (2.9753)	Entropy 0.69767 (0.70062)	Top-1 acc 51.562 (52.560)	Top-5 acc 75.781 (75.481)	lr 0.01999
Train [36][1480/3239]	Time 0.331 (0.468)	Data Time 0.001 (0.019)	Loss 2.9288 (2.9754)	Entropy 0.69762 (0.70060)	Top-1 acc 53.125 (52.561)	Top-5 acc 73.047 (75.473)	lr 0.01999
Train [36][1490/3239]	Time 0.230 (0.468)	Data Time 0.001 (0.019)	Loss 2.8960 (2.9750)	Entropy 0.69739 (0.70058)	Top-1 acc 52.344 (52.570)	Top-5 acc 76.562 (75.482)	lr 0.01999
Train [36][1500/3239]	Time 0.234 (0.467)	Data Time 0.001 (0.019)	Loss 2.8667 (2.9749)	Entropy 0.69744 (0.70056)	Top-1 acc 52.734 (52.571)	Top-5 acc 78.125 (75.481)	lr 0.01999
Train [36][1510/3239]	Time 0.228 (0.467)	Data Time 0.001 (0.019)	Loss 3.0156 (2.9746)	Entropy 0.69740 (0.70054)	Top-1 acc 50.391 (52.572)	Top-5 acc 75.781 (75.491)	lr 0.01999
Train [36][1520/3239]	Time 0.230 (0.467)	Data Time 0.001 (0.019)	Loss 2.7975 (2.9745)	Entropy 0.69727 (0.70052)	Top-1 acc 54.297 (52.572)	Top-5 acc 77.734 (75.498)	lr 0.01999
Train [36][1530/3239]	Time 0.221 (0.466)	Data Time 0.001 (0.019)	Loss 2.8463 (2.9744)	Entropy 0.69708 (0.70050)	Top-1 acc 56.641 (52.576)	Top-5 acc 78.906 (75.499)	lr 0.01999
Train [36][1540/3239]	Time 0.233 (0.466)	Data Time 0.001 (0.018)	Loss 2.8198 (2.9741)	Entropy 0.69710 (0.70048)	Top-1 acc 57.812 (52.585)	Top-5 acc 78.906 (75.505)	lr 0.01999
Train [36][1550/3239]	Time 0.328 (0.466)	Data Time 0.001 (0.018)	Loss 2.9931 (2.9740)	Entropy 0.69739 (0.70045)	Top-1 acc 50.391 (52.583)	Top-5 acc 73.438 (75.511)	lr 0.01998
Train [36][1560/3239]	Time 0.235 (0.465)	Data Time 0.001 (0.018)	Loss 2.9772 (2.9739)	Entropy 0.69770 (0.70044)	Top-1 acc 54.297 (52.587)	Top-5 acc 73.438 (75.509)	lr 0.01998
Train [36][1570/3239]	Time 0.229 (0.465)	Data Time 0.001 (0.018)	Loss 2.8985 (2.9741)	Entropy 0.69748 (0.70042)	Top-1 acc 54.297 (52.585)	Top-5 acc 76.953 (75.505)	lr 0.01998
Train [36][1580/3239]	Time 0.231 (0.464)	Data Time 0.001 (0.018)	Loss 2.8853 (2.9738)	Entropy 0.69737 (0.70040)	Top-1 acc 54.688 (52.596)	Top-5 acc 74.609 (75.512)	lr 0.01998
Train [36][1590/3239]	Time 0.247 (0.464)	Data Time 0.001 (0.018)	Loss 3.0848 (2.9739)	Entropy 0.69739 (0.70038)	Top-1 acc 50.781 (52.596)	Top-5 acc 74.609 (75.511)	lr 0.01998
Train [36][1600/3239]	Time 0.235 (0.464)	Data Time 0.001 (0.018)	Loss 2.7998 (2.9736)	Entropy 0.69724 (0.70036)	Top-1 acc 55.078 (52.602)	Top-5 acc 76.953 (75.516)	lr 0.01998
Train [36][1610/3239]	Time 0.229 (0.463)	Data Time 0.001 (0.018)	Loss 2.9375 (2.9734)	Entropy 0.69752 (0.70034)	Top-1 acc 49.609 (52.604)	Top-5 acc 76.172 (75.516)	lr 0.01998
Train [36][1620/3239]	Time 0.224 (0.463)	Data Time 0.001 (0.018)	Loss 2.9665 (2.9737)	Entropy 0.69743 (0.70032)	Top-1 acc 51.172 (52.590)	Top-5 acc 76.953 (75.505)	lr 0.01998
Train [36][1630/3239]	Time 0.229 (0.462)	Data Time 0.001 (0.018)	Loss 2.9963 (2.9736)	Entropy 0.69744 (0.70031)	Top-1 acc 51.562 (52.591)	Top-5 acc 72.656 (75.507)	lr 0.01998
Train [36][1640/3239]	Time 0.325 (0.462)	Data Time 0.001 (0.017)	Loss 2.8933 (2.9733)	Entropy 0.69754 (0.70029)	Top-1 acc 55.469 (52.600)	Top-5 acc 76.562 (75.511)	lr 0.01998
Train [36][1650/3239]	Time 0.226 (0.462)	Data Time 0.001 (0.017)	Loss 3.0989 (2.9731)	Entropy 0.69758 (0.70027)	Top-1 acc 51.172 (52.601)	Top-5 acc 69.531 (75.517)	lr 0.01998
Train [36][1660/3239]	Time 0.230 (0.461)	Data Time 0.001 (0.017)	Loss 3.0038 (2.9734)	Entropy 0.69764 (0.70026)	Top-1 acc 53.906 (52.598)	Top-5 acc 78.125 (75.512)	lr 0.01998
Train [36][1670/3239]	Time 0.235 (0.461)	Data Time 0.001 (0.017)	Loss 2.8578 (2.9732)	Entropy 0.69772 (0.70024)	Top-1 acc 53.906 (52.603)	Top-5 acc 76.562 (75.510)	lr 0.01998
Train [36][1680/3239]	Time 0.263 (0.461)	Data Time 0.001 (0.017)	Loss 2.8760 (2.9731)	Entropy 0.69805 (0.70023)	Top-1 acc 53.906 (52.605)	Top-5 acc 77.734 (75.511)	lr 0.01997
Train [36][1690/3239]	Time 0.243 (0.460)	Data Time 0.001 (0.017)	Loss 3.2325 (2.9736)	Entropy 0.69779 (0.70021)	Top-1 acc 50.000 (52.593)	Top-5 acc 69.922 (75.507)	lr 0.01997
Train [36][1700/3239]	Time 0.231 (0.460)	Data Time 0.001 (0.017)	Loss 3.1582 (2.9742)	Entropy 0.69761 (0.70020)	Top-1 acc 46.875 (52.576)	Top-5 acc 72.656 (75.497)	lr 0.01997
Train [36][1710/3239]	Time 0.328 (0.460)	Data Time 0.001 (0.017)	Loss 3.2024 (2.9742)	Entropy 0.69771 (0.70018)	Top-1 acc 49.219 (52.576)	Top-5 acc 71.094 (75.496)	lr 0.01997
Train [36][1720/3239]	Time 0.234 (0.460)	Data Time 0.001 (0.017)	Loss 3.0510 (2.9743)	Entropy 0.69758 (0.70017)	Top-1 acc 50.000 (52.572)	Top-5 acc 73.047 (75.493)	lr 0.01997
Train [36][1730/3239]	Time 0.231 (0.459)	Data Time 0.001 (0.017)	Loss 2.8687 (2.9740)	Entropy 0.69740 (0.70015)	Top-1 acc 53.906 (52.582)	Top-5 acc 80.859 (75.496)	lr 0.01997
Train [36][1740/3239]	Time 0.221 (0.459)	Data Time 0.001 (0.017)	Loss 3.2061 (2.9741)	Entropy 0.69735 (0.70014)	Top-1 acc 46.094 (52.577)	Top-5 acc 71.484 (75.494)	lr 0.01997
Train [36][1750/3239]	Time 0.235 (0.459)	Data Time 0.001 (0.016)	Loss 3.1210 (2.9743)	Entropy 0.69738 (0.70012)	Top-1 acc 49.609 (52.570)	Top-5 acc 71.484 (75.490)	lr 0.01997
Train [36][1760/3239]	Time 0.231 (0.459)	Data Time 0.001 (0.016)	Loss 2.8715 (2.9741)	Entropy 0.69714 (0.70010)	Top-1 acc 58.203 (52.577)	Top-5 acc 77.734 (75.495)	lr 0.01997
Train [36][1770/3239]	Time 0.232 (0.458)	Data Time 0.001 (0.016)	Loss 3.1417 (2.9742)	Entropy 0.69697 (0.70009)	Top-1 acc 48.438 (52.569)	Top-5 acc 71.094 (75.491)	lr 0.01997
Train [36][1780/3239]	Time 0.237 (0.458)	Data Time 0.001 (0.016)	Loss 2.8337 (2.9743)	Entropy 0.69661 (0.70007)	Top-1 acc 60.156 (52.565)	Top-5 acc 79.297 (75.491)	lr 0.01997
Train [36][1790/3239]	Time 0.234 (0.458)	Data Time 0.001 (0.016)	Loss 2.9281 (2.9740)	Entropy 0.69642 (0.70005)	Top-1 acc 55.469 (52.569)	Top-5 acc 75.391 (75.495)	lr 0.01997
Train [36][1800/3239]	Time 0.341 (0.458)	Data Time 0.001 (0.016)	Loss 3.0149 (2.9742)	Entropy 0.69619 (0.70003)	Top-1 acc 52.344 (52.564)	Top-5 acc 73.828 (75.492)	lr 0.01996
Train [36][1810/3239]	Time 0.227 (0.457)	Data Time 0.001 (0.016)	Loss 2.7019 (2.9742)	Entropy 0.69652 (0.70001)	Top-1 acc 58.203 (52.561)	Top-5 acc 82.031 (75.493)	lr 0.01996
Train [36][1820/3239]	Time 0.226 (0.457)	Data Time 0.001 (0.016)	Loss 3.1901 (2.9743)	Entropy 0.69667 (0.69999)	Top-1 acc 49.219 (52.557)	Top-5 acc 73.438 (75.491)	lr 0.01996
Train [36][1830/3239]	Time 0.235 (0.457)	Data Time 0.001 (0.016)	Loss 2.9253 (2.9741)	Entropy 0.69670 (0.69997)	Top-1 acc 51.953 (52.558)	Top-5 acc 77.734 (75.500)	lr 0.01996
Train [36][1840/3239]	Time 0.223 (0.456)	Data Time 0.001 (0.016)	Loss 3.2345 (2.9742)	Entropy 0.69611 (0.69995)	Top-1 acc 45.312 (52.559)	Top-5 acc 68.359 (75.496)	lr 0.01996
Train [36][1850/3239]	Time 0.416 (0.471)	Data Time 0.004 (0.016)	Loss 3.1135 (2.9739)	Entropy 0.69603 (0.69993)	Top-1 acc 49.219 (52.560)	Top-5 acc 73.828 (75.502)	lr 0.01996
Train [36][1860/3239]	Time 0.238 (0.471)	Data Time 0.002 (0.016)	Loss 3.0098 (2.9739)	Entropy 0.69589 (0.69991)	Top-1 acc 54.688 (52.558)	Top-5 acc 75.391 (75.502)	lr 0.01996
Train [36][1870/3239]	Time 0.332 (0.471)	Data Time 0.001 (0.015)	Loss 3.3921 (2.9740)	Entropy 0.69566 (0.69989)	Top-1 acc 40.234 (52.550)	Top-5 acc 68.750 (75.497)	lr 0.01996
Train [36][1880/3239]	Time 0.246 (0.471)	Data Time 0.001 (0.015)	Loss 2.9347 (2.9741)	Entropy 0.69620 (0.69987)	Top-1 acc 53.906 (52.549)	Top-5 acc 74.609 (75.490)	lr 0.01996
Train [36][1890/3239]	Time 0.235 (0.470)	Data Time 0.001 (0.015)	Loss 3.0046 (2.9741)	Entropy 0.69615 (0.69985)	Top-1 acc 52.734 (52.546)	Top-5 acc 73.828 (75.490)	lr 0.01996
Train [36][1900/3239]	Time 0.240 (0.470)	Data Time 0.001 (0.015)	Loss 3.0757 (2.9743)	Entropy 0.69599 (0.69983)	Top-1 acc 50.391 (52.538)	Top-5 acc 75.000 (75.491)	lr 0.01996
Train [36][1910/3239]	Time 0.232 (0.470)	Data Time 0.001 (0.015)	Loss 3.2946 (2.9744)	Entropy 0.69574 (0.69981)	Top-1 acc 47.656 (52.538)	Top-5 acc 67.578 (75.488)	lr 0.01996
Train [36][1920/3239]	Time 0.232 (0.469)	Data Time 0.001 (0.015)	Loss 2.9865 (2.9744)	Entropy 0.69563 (0.69979)	Top-1 acc 56.250 (52.538)	Top-5 acc 73.438 (75.487)	lr 0.01995
Train [36][1930/3239]	Time 0.230 (0.469)	Data Time 0.001 (0.015)	Loss 3.0290 (2.9745)	Entropy 0.69590 (0.69977)	Top-1 acc 52.734 (52.538)	Top-5 acc 76.172 (75.485)	lr 0.01995
Train [36][1940/3239]	Time 0.237 (0.469)	Data Time 0.001 (0.015)	Loss 3.1641 (2.9746)	Entropy 0.69593 (0.69975)	Top-1 acc 46.484 (52.533)	Top-5 acc 73.438 (75.486)	lr 0.01995
Train [36][1950/3239]	Time 0.235 (0.469)	Data Time 0.001 (0.015)	Loss 2.9270 (2.9744)	Entropy 0.69579 (0.69973)	Top-1 acc 53.516 (52.539)	Top-5 acc 75.781 (75.485)	lr 0.01995
Train [36][1960/3239]	Time 0.338 (0.468)	Data Time 0.001 (0.015)	Loss 2.9317 (2.9745)	Entropy 0.69553 (0.69971)	Top-1 acc 54.297 (52.532)	Top-5 acc 74.219 (75.484)	lr 0.01995
Train [36][1970/3239]	Time 0.239 (0.468)	Data Time 0.001 (0.015)	Loss 3.0410 (2.9744)	Entropy 0.69550 (0.69969)	Top-1 acc 51.562 (52.537)	Top-5 acc 74.609 (75.487)	lr 0.01995
Train [36][1980/3239]	Time 0.218 (0.468)	Data Time 0.001 (0.015)	Loss 3.1695 (2.9745)	Entropy 0.69565 (0.69966)	Top-1 acc 44.531 (52.533)	Top-5 acc 71.094 (75.483)	lr 0.01995
Train [36][1990/3239]	Time 0.233 (0.467)	Data Time 0.001 (0.015)	Loss 2.9397 (2.9746)	Entropy 0.69566 (0.69964)	Top-1 acc 53.125 (52.528)	Top-5 acc 77.734 (75.486)	lr 0.01995
Train [36][2000/3239]	Time 0.225 (0.467)	Data Time 0.001 (0.015)	Loss 2.8700 (2.9746)	Entropy 0.69574 (0.69962)	Top-1 acc 54.688 (52.524)	Top-5 acc 78.516 (75.485)	lr 0.01995
Train [36][2010/3239]	Time 0.234 (0.467)	Data Time 0.001 (0.015)	Loss 3.0684 (2.9747)	Entropy 0.69592 (0.69961)	Top-1 acc 49.219 (52.525)	Top-5 acc 74.219 (75.484)	lr 0.01995
Train [36][2020/3239]	Time 0.228 (0.467)	Data Time 0.001 (0.014)	Loss 2.9979 (2.9748)	Entropy 0.69595 (0.69959)	Top-1 acc 51.172 (52.518)	Top-5 acc 76.562 (75.485)	lr 0.01995
Train [36][2030/3239]	Time 0.322 (0.466)	Data Time 0.001 (0.014)	Loss 3.0666 (2.9746)	Entropy 0.69642 (0.69957)	Top-1 acc 51.172 (52.525)	Top-5 acc 72.266 (75.490)	lr 0.01995
Train [36][2040/3239]	Time 0.237 (0.466)	Data Time 0.001 (0.014)	Loss 3.0126 (2.9748)	Entropy 0.69642 (0.69955)	Top-1 acc 52.734 (52.527)	Top-5 acc 71.094 (75.483)	lr 0.01995
Train [36][2050/3239]	Time 0.245 (0.466)	Data Time 0.001 (0.014)	Loss 2.8850 (2.9750)	Entropy 0.69636 (0.69954)	Top-1 acc 50.391 (52.522)	Top-5 acc 76.172 (75.484)	lr 0.01994
Train [36][2060/3239]	Time 0.236 (0.466)	Data Time 0.001 (0.014)	Loss 3.2073 (2.9751)	Entropy 0.69634 (0.69952)	Top-1 acc 48.438 (52.521)	Top-5 acc 71.094 (75.482)	lr 0.01994
Train [36][2070/3239]	Time 0.243 (0.466)	Data Time 0.001 (0.014)	Loss 3.2227 (2.9750)	Entropy 0.69587 (0.69951)	Top-1 acc 46.094 (52.522)	Top-5 acc 72.266 (75.485)	lr 0.01994
Train [36][2080/3239]	Time 0.235 (0.465)	Data Time 0.001 (0.014)	Loss 3.1084 (2.9751)	Entropy 0.69579 (0.69949)	Top-1 acc 48.828 (52.522)	Top-5 acc 73.828 (75.482)	lr 0.01994
Train [36][2090/3239]	Time 0.229 (0.465)	Data Time 0.001 (0.014)	Loss 3.1980 (2.9749)	Entropy 0.69594 (0.69947)	Top-1 acc 51.953 (52.526)	Top-5 acc 72.656 (75.488)	lr 0.01994
Train [36][2100/3239]	Time 0.236 (0.465)	Data Time 0.001 (0.014)	Loss 3.0798 (2.9750)	Entropy 0.69594 (0.69945)	Top-1 acc 48.828 (52.526)	Top-5 acc 74.609 (75.484)	lr 0.01994
Train [36][2110/3239]	Time 0.251 (0.465)	Data Time 0.001 (0.014)	Loss 2.8694 (2.9748)	Entropy 0.69589 (0.69944)	Top-1 acc 54.297 (52.530)	Top-5 acc 78.906 (75.491)	lr 0.01994
Train [36][2120/3239]	Time 0.285 (0.465)	Data Time 0.001 (0.014)	Loss 3.0472 (2.9745)	Entropy 0.69612 (0.69942)	Top-1 acc 53.125 (52.535)	Top-5 acc 73.047 (75.497)	lr 0.01994
Train [36][2130/3239]	Time 0.234 (0.465)	Data Time 0.001 (0.014)	Loss 2.7765 (2.9745)	Entropy 0.69549 (0.69941)	Top-1 acc 51.953 (52.532)	Top-5 acc 80.859 (75.497)	lr 0.01994
Train [36][2140/3239]	Time 0.242 (0.464)	Data Time 0.001 (0.014)	Loss 3.0092 (2.9743)	Entropy 0.69539 (0.69939)	Top-1 acc 51.953 (52.536)	Top-5 acc 74.219 (75.503)	lr 0.01994
Train [36][2150/3239]	Time 0.243 (0.464)	Data Time 0.001 (0.014)	Loss 2.9158 (2.9744)	Entropy 0.69527 (0.69937)	Top-1 acc 50.781 (52.539)	Top-5 acc 74.609 (75.500)	lr 0.01994
Train [36][2160/3239]	Time 0.237 (0.464)	Data Time 0.001 (0.014)	Loss 2.7982 (2.9747)	Entropy 0.69519 (0.69935)	Top-1 acc 59.766 (52.536)	Top-5 acc 81.641 (75.497)	lr 0.01994
Train [36][2170/3239]	Time 0.246 (0.464)	Data Time 0.001 (0.014)	Loss 3.0606 (2.9751)	Entropy 0.69537 (0.69933)	Top-1 acc 48.828 (52.529)	Top-5 acc 72.266 (75.486)	lr 0.01993
Train [36][2180/3239]	Time 0.245 (0.464)	Data Time 0.001 (0.014)	Loss 2.8960 (2.9749)	Entropy 0.69556 (0.69931)	Top-1 acc 50.000 (52.529)	Top-5 acc 76.172 (75.492)	lr 0.01993
Train [36][2190/3239]	Time 0.332 (0.464)	Data Time 0.001 (0.013)	Loss 2.7509 (2.9747)	Entropy 0.69543 (0.69930)	Top-1 acc 57.812 (52.531)	Top-5 acc 80.859 (75.499)	lr 0.01993
Train [36][2200/3239]	Time 0.223 (0.463)	Data Time 0.001 (0.013)	Loss 2.9636 (2.9748)	Entropy 0.69515 (0.69928)	Top-1 acc 51.172 (52.524)	Top-5 acc 75.391 (75.501)	lr 0.01993
Train [36][2210/3239]	Time 0.231 (0.463)	Data Time 0.001 (0.013)	Loss 3.0691 (2.9748)	Entropy 0.69544 (0.69926)	Top-1 acc 49.609 (52.523)	Top-5 acc 74.219 (75.500)	lr 0.01993
Train [36][2220/3239]	Time 0.228 (0.463)	Data Time 0.001 (0.013)	Loss 2.9613 (2.9746)	Entropy 0.69515 (0.69924)	Top-1 acc 53.906 (52.531)	Top-5 acc 76.562 (75.500)	lr 0.01993
Train [36][2230/3239]	Time 0.220 (0.463)	Data Time 0.001 (0.013)	Loss 2.9679 (2.9746)	Entropy 0.69545 (0.69922)	Top-1 acc 53.125 (52.533)	Top-5 acc 75.391 (75.500)	lr 0.01993
Train [36][2240/3239]	Time 0.244 (0.463)	Data Time 0.001 (0.013)	Loss 2.9610 (2.9746)	Entropy 0.69518 (0.69921)	Top-1 acc 49.609 (52.536)	Top-5 acc 76.562 (75.499)	lr 0.01993
Train [36][2250/3239]	Time 0.228 (0.462)	Data Time 0.002 (0.013)	Loss 3.0987 (2.9747)	Entropy 0.69534 (0.69919)	Top-1 acc 47.266 (52.531)	Top-5 acc 75.781 (75.500)	lr 0.01993
Train [36][2260/3239]	Time 0.323 (0.462)	Data Time 0.001 (0.013)	Loss 3.0393 (2.9746)	Entropy 0.69557 (0.69917)	Top-1 acc 51.953 (52.533)	Top-5 acc 73.047 (75.497)	lr 0.01993
Train [36][2270/3239]	Time 0.220 (0.462)	Data Time 0.001 (0.013)	Loss 3.2195 (2.9747)	Entropy 0.69560 (0.69916)	Top-1 acc 46.484 (52.530)	Top-5 acc 71.094 (75.498)	lr 0.01993
Train [36][2280/3239]	Time 0.219 (0.461)	Data Time 0.001 (0.013)	Loss 3.1380 (2.9744)	Entropy 0.69548 (0.69914)	Top-1 acc 46.484 (52.534)	Top-5 acc 73.438 (75.504)	lr 0.01993
Train [36][2290/3239]	Time 0.224 (0.461)	Data Time 0.001 (0.013)	Loss 2.8437 (2.9744)	Entropy 0.69535 (0.69913)	Top-1 acc 57.031 (52.536)	Top-5 acc 79.688 (75.507)	lr 0.01992
Train [36][2300/3239]	Time 0.228 (0.461)	Data Time 0.001 (0.013)	Loss 2.8695 (2.9744)	Entropy 0.69542 (0.69911)	Top-1 acc 57.031 (52.536)	Top-5 acc 78.516 (75.507)	lr 0.01992
Train [36][2310/3239]	Time 0.228 (0.461)	Data Time 0.001 (0.013)	Loss 2.9734 (2.9744)	Entropy 0.69583 (0.69909)	Top-1 acc 53.516 (52.532)	Top-5 acc 76.172 (75.505)	lr 0.01992
Train [36][2320/3239]	Time 0.240 (0.460)	Data Time 0.001 (0.013)	Loss 2.8582 (2.9745)	Entropy 0.69571 (0.69908)	Top-1 acc 55.859 (52.530)	Top-5 acc 76.953 (75.504)	lr 0.01992
Train [36][2330/3239]	Time 0.230 (0.460)	Data Time 0.001 (0.013)	Loss 3.0492 (2.9744)	Entropy 0.69528 (0.69906)	Top-1 acc 49.609 (52.531)	Top-5 acc 72.656 (75.505)	lr 0.01992
Train [36][2340/3239]	Time 0.232 (0.460)	Data Time 0.001 (0.013)	Loss 3.0132 (2.9745)	Entropy 0.69546 (0.69905)	Top-1 acc 51.953 (52.532)	Top-5 acc 75.000 (75.504)	lr 0.01992
Train [36][2350/3239]	Time 0.326 (0.460)	Data Time 0.001 (0.013)	Loss 2.8736 (2.9742)	Entropy 0.69513 (0.69903)	Top-1 acc 57.422 (52.535)	Top-5 acc 78.516 (75.502)	lr 0.01992
Train [36][2360/3239]	Time 0.251 (0.459)	Data Time 0.001 (0.013)	Loss 3.1142 (2.9742)	Entropy 0.69532 (0.69902)	Top-1 acc 46.094 (52.535)	Top-5 acc 71.484 (75.502)	lr 0.01992
Train [36][2370/3239]	Time 0.222 (0.459)	Data Time 0.001 (0.013)	Loss 2.8855 (2.9742)	Entropy 0.69456 (0.69900)	Top-1 acc 55.469 (52.530)	Top-5 acc 75.391 (75.502)	lr 0.01992
Train [36][2380/3239]	Time 0.228 (0.459)	Data Time 0.001 (0.013)	Loss 3.0367 (2.9741)	Entropy 0.69471 (0.69898)	Top-1 acc 46.875 (52.530)	Top-5 acc 74.609 (75.502)	lr 0.01992
Train [36][2390/3239]	Time 0.233 (0.459)	Data Time 0.001 (0.012)	Loss 2.8111 (2.9739)	Entropy 0.69476 (0.69896)	Top-1 acc 57.031 (52.539)	Top-5 acc 78.516 (75.507)	lr 0.01992
Train [36][2400/3239]	Time 0.231 (0.458)	Data Time 0.001 (0.012)	Loss 3.1553 (2.9740)	Entropy 0.69496 (0.69895)	Top-1 acc 50.000 (52.543)	Top-5 acc 70.312 (75.505)	lr 0.01992
Train [36][2410/3239]	Time 0.230 (0.458)	Data Time 0.001 (0.012)	Loss 3.0069 (2.9739)	Entropy 0.69511 (0.69893)	Top-1 acc 55.859 (52.545)	Top-5 acc 76.953 (75.507)	lr 0.01991
Train [36][2420/3239]	Time 0.326 (0.458)	Data Time 0.001 (0.012)	Loss 3.1204 (2.9742)	Entropy 0.69535 (0.69892)	Top-1 acc 47.266 (52.538)	Top-5 acc 73.828 (75.501)	lr 0.01991
Train [36][2430/3239]	Time 0.214 (0.458)	Data Time 0.001 (0.012)	Loss 3.0507 (2.9744)	Entropy 0.69528 (0.69890)	Top-1 acc 49.219 (52.532)	Top-5 acc 76.953 (75.499)	lr 0.01991
Train [36][2440/3239]	Time 0.241 (0.458)	Data Time 0.001 (0.012)	Loss 3.1069 (2.9745)	Entropy 0.69522 (0.69889)	Top-1 acc 49.609 (52.530)	Top-5 acc 70.703 (75.498)	lr 0.01991
Train [36][2450/3239]	Time 0.228 (0.457)	Data Time 0.001 (0.012)	Loss 2.8952 (2.9745)	Entropy 0.69572 (0.69887)	Top-1 acc 55.469 (52.532)	Top-5 acc 76.562 (75.497)	lr 0.01991
Train [36][2460/3239]	Time 0.228 (0.457)	Data Time 0.001 (0.012)	Loss 2.7595 (2.9742)	Entropy 0.69563 (0.69886)	Top-1 acc 56.641 (52.541)	Top-5 acc 78.125 (75.499)	lr 0.01991
Train [36][2470/3239]	Time 0.232 (0.457)	Data Time 0.001 (0.012)	Loss 3.0529 (2.9746)	Entropy 0.69554 (0.69884)	Top-1 acc 52.734 (52.536)	Top-5 acc 74.219 (75.494)	lr 0.01991
Train [36][2480/3239]	Time 0.221 (0.457)	Data Time 0.001 (0.012)	Loss 3.0644 (2.9747)	Entropy 0.69540 (0.69883)	Top-1 acc 50.781 (52.535)	Top-5 acc 70.703 (75.490)	lr 0.01991
Train [36][2490/3239]	Time 0.229 (0.456)	Data Time 0.001 (0.012)	Loss 3.0474 (2.9744)	Entropy 0.69558 (0.69882)	Top-1 acc 51.953 (52.540)	Top-5 acc 73.047 (75.497)	lr 0.01991
Train [36][2500/3239]	Time 0.236 (0.456)	Data Time 0.001 (0.012)	Loss 2.9898 (2.9744)	Entropy 0.69529 (0.69880)	Top-1 acc 52.734 (52.539)	Top-5 acc 76.172 (75.499)	lr 0.01991
Train [36][2510/3239]	Time 0.367 (0.467)	Data Time 0.003 (0.012)	Loss 2.7893 (2.9743)	Entropy 0.69539 (0.69879)	Top-1 acc 56.250 (52.542)	Top-5 acc 78.516 (75.503)	lr 0.01991
Train [36][2520/3239]	Time 0.247 (0.467)	Data Time 0.002 (0.012)	Loss 2.8884 (2.9741)	Entropy 0.69532 (0.69878)	Top-1 acc 56.250 (52.544)	Top-5 acc 75.000 (75.506)	lr 0.01991
Train [36][2530/3239]	Time 0.245 (0.467)	Data Time 0.001 (0.012)	Loss 2.7491 (2.9740)	Entropy 0.69539 (0.69876)	Top-1 acc 57.422 (52.545)	Top-5 acc 80.078 (75.506)	lr 0.01991
Train [36][2540/3239]	Time 0.289 (0.467)	Data Time 0.002 (0.012)	Loss 2.9233 (2.9741)	Entropy 0.69524 (0.69875)	Top-1 acc 51.562 (52.541)	Top-5 acc 76.562 (75.507)	lr 0.01990
Train [36][2550/3239]	Time 0.238 (0.467)	Data Time 0.001 (0.012)	Loss 3.1274 (2.9740)	Entropy 0.69524 (0.69874)	Top-1 acc 49.219 (52.539)	Top-5 acc 67.969 (75.505)	lr 0.01990
Train [36][2560/3239]	Time 0.255 (0.467)	Data Time 0.002 (0.012)	Loss 2.9399 (2.9738)	Entropy 0.69564 (0.69872)	Top-1 acc 54.688 (52.542)	Top-5 acc 75.391 (75.507)	lr 0.01990
Train [36][2570/3239]	Time 0.246 (0.467)	Data Time 0.001 (0.012)	Loss 2.9773 (2.9738)	Entropy 0.69542 (0.69871)	Top-1 acc 48.828 (52.540)	Top-5 acc 75.391 (75.505)	lr 0.01990
Train [36][2580/3239]	Time 0.409 (0.467)	Data Time 0.002 (0.012)	Loss 2.8401 (2.9738)	Entropy 0.69546 (0.69870)	Top-1 acc 57.031 (52.539)	Top-5 acc 77.344 (75.505)	lr 0.01990
Train [36][2590/3239]	Time 0.243 (0.467)	Data Time 0.001 (0.012)	Loss 2.8047 (2.9740)	Entropy 0.69542 (0.69869)	Top-1 acc 58.594 (52.540)	Top-5 acc 80.078 (75.500)	lr 0.01990
Train [36][2600/3239]	Time 0.250 (0.467)	Data Time 0.001 (0.012)	Loss 2.9827 (2.9739)	Entropy 0.69513 (0.69867)	Top-1 acc 53.125 (52.540)	Top-5 acc 75.781 (75.499)	lr 0.01990
Train [36][2610/3239]	Time 0.253 (0.467)	Data Time 0.003 (0.012)	Loss 3.1007 (2.9738)	Entropy 0.69509 (0.69866)	Top-1 acc 49.219 (52.539)	Top-5 acc 71.875 (75.501)	lr 0.01990
Train [36][2620/3239]	Time 0.244 (0.467)	Data Time 0.001 (0.012)	Loss 2.9728 (2.9738)	Entropy 0.69523 (0.69865)	Top-1 acc 52.344 (52.539)	Top-5 acc 77.344 (75.502)	lr 0.01990
Train [36][2630/3239]	Time 0.240 (0.467)	Data Time 0.001 (0.012)	Loss 2.6731 (2.9740)	Entropy 0.69503 (0.69863)	Top-1 acc 56.250 (52.535)	Top-5 acc 80.859 (75.498)	lr 0.01990
Train [36][2640/3239]	Time 0.278 (0.467)	Data Time 0.001 (0.011)	Loss 2.7288 (2.9737)	Entropy 0.69552 (0.69862)	Top-1 acc 60.547 (52.546)	Top-5 acc 81.250 (75.502)	lr 0.01990
Train [36][2650/3239]	Time 0.270 (0.467)	Data Time 0.001 (0.011)	Loss 3.0743 (2.9738)	Entropy 0.69517 (0.69861)	Top-1 acc 48.438 (52.546)	Top-5 acc 72.656 (75.501)	lr 0.01990
Train [36][2660/3239]	Time 0.245 (0.466)	Data Time 0.001 (0.011)	Loss 2.8810 (2.9741)	Entropy 0.69542 (0.69860)	Top-1 acc 55.469 (52.542)	Top-5 acc 80.078 (75.495)	lr 0.01989
Train [36][2670/3239]	Time 0.354 (0.466)	Data Time 0.001 (0.011)	Loss 3.1030 (2.9742)	Entropy 0.69545 (0.69858)	Top-1 acc 49.609 (52.545)	Top-5 acc 70.312 (75.490)	lr 0.01989
Train [36][2680/3239]	Time 0.236 (0.466)	Data Time 0.001 (0.011)	Loss 2.8023 (2.9742)	Entropy 0.69556 (0.69857)	Top-1 acc 55.469 (52.542)	Top-5 acc 80.078 (75.491)	lr 0.01989
Train [36][2690/3239]	Time 0.249 (0.466)	Data Time 0.001 (0.011)	Loss 2.8283 (2.9743)	Entropy 0.69570 (0.69856)	Top-1 acc 55.859 (52.543)	Top-5 acc 77.344 (75.489)	lr 0.01989
Train [36][2700/3239]	Time 0.227 (0.466)	Data Time 0.001 (0.011)	Loss 2.9925 (2.9742)	Entropy 0.69600 (0.69855)	Top-1 acc 51.562 (52.546)	Top-5 acc 75.000 (75.491)	lr 0.01989
Train [36][2710/3239]	Time 0.241 (0.466)	Data Time 0.001 (0.011)	Loss 3.0019 (2.9741)	Entropy 0.69604 (0.69854)	Top-1 acc 51.562 (52.548)	Top-5 acc 75.781 (75.490)	lr 0.01989
Train [36][2720/3239]	Time 0.270 (0.466)	Data Time 0.001 (0.011)	Loss 2.9299 (2.9742)	Entropy 0.69614 (0.69853)	Top-1 acc 52.344 (52.545)	Top-5 acc 76.172 (75.488)	lr 0.01989
Train [36][2730/3239]	Time 0.229 (0.466)	Data Time 0.001 (0.011)	Loss 3.1905 (2.9740)	Entropy 0.69614 (0.69852)	Top-1 acc 49.609 (52.551)	Top-5 acc 70.703 (75.493)	lr 0.01989
Train [36][2740/3239]	Time 0.334 (0.466)	Data Time 0.001 (0.011)	Loss 3.2196 (2.9741)	Entropy 0.69639 (0.69852)	Top-1 acc 46.094 (52.548)	Top-5 acc 69.531 (75.493)	lr 0.01989
Train [36][2750/3239]	Time 0.237 (0.466)	Data Time 0.001 (0.011)	Loss 3.0474 (2.9741)	Entropy 0.69652 (0.69851)	Top-1 acc 48.438 (52.548)	Top-5 acc 73.828 (75.492)	lr 0.01989
Train [36][2760/3239]	Time 0.241 (0.465)	Data Time 0.001 (0.011)	Loss 2.9545 (2.9740)	Entropy 0.69662 (0.69850)	Top-1 acc 52.344 (52.552)	Top-5 acc 75.000 (75.492)	lr 0.01989
Train [36][2770/3239]	Time 0.233 (0.465)	Data Time 0.001 (0.011)	Loss 3.0292 (2.9742)	Entropy 0.69665 (0.69849)	Top-1 acc 52.344 (52.545)	Top-5 acc 72.656 (75.489)	lr 0.01989
Train [36][2780/3239]	Time 0.234 (0.465)	Data Time 0.001 (0.011)	Loss 2.9637 (2.9741)	Entropy 0.69687 (0.69849)	Top-1 acc 49.609 (52.547)	Top-5 acc 76.562 (75.491)	lr 0.01988
Train [36][2790/3239]	Time 0.227 (0.465)	Data Time 0.001 (0.011)	Loss 2.9172 (2.9742)	Entropy 0.69713 (0.69848)	Top-1 acc 54.297 (52.545)	Top-5 acc 74.609 (75.489)	lr 0.01988
Train [36][2800/3239]	Time 0.244 (0.465)	Data Time 0.001 (0.011)	Loss 2.9219 (2.9743)	Entropy 0.69690 (0.69848)	Top-1 acc 55.469 (52.546)	Top-5 acc 76.953 (75.487)	lr 0.01988
Train [36][2810/3239]	Time 0.238 (0.465)	Data Time 0.001 (0.011)	Loss 2.9499 (2.9742)	Entropy 0.69696 (0.69847)	Top-1 acc 53.516 (52.546)	Top-5 acc 75.391 (75.488)	lr 0.01988
Train [36][2820/3239]	Time 0.218 (0.465)	Data Time 0.001 (0.011)	Loss 2.9186 (2.9742)	Entropy 0.69671 (0.69847)	Top-1 acc 55.469 (52.543)	Top-5 acc 76.953 (75.487)	lr 0.01988
Train [36][2830/3239]	Time 0.235 (0.465)	Data Time 0.002 (0.011)	Loss 3.0637 (2.9739)	Entropy 0.69656 (0.69846)	Top-1 acc 49.609 (52.551)	Top-5 acc 76.953 (75.491)	lr 0.01988
Train [36][2840/3239]	Time 0.228 (0.465)	Data Time 0.001 (0.011)	Loss 3.1036 (2.9740)	Entropy 0.69634 (0.69845)	Top-1 acc 47.656 (52.544)	Top-5 acc 73.047 (75.485)	lr 0.01988
Train [36][2850/3239]	Time 0.227 (0.464)	Data Time 0.001 (0.011)	Loss 2.9264 (2.9742)	Entropy 0.69642 (0.69844)	Top-1 acc 53.516 (52.540)	Top-5 acc 77.344 (75.480)	lr 0.01988
Train [36][2860/3239]	Time 0.233 (0.464)	Data Time 0.001 (0.011)	Loss 3.0240 (2.9742)	Entropy 0.69647 (0.69844)	Top-1 acc 51.172 (52.538)	Top-5 acc 75.391 (75.480)	lr 0.01988
Train [36][2870/3239]	Time 0.234 (0.464)	Data Time 0.001 (0.011)	Loss 2.7446 (2.9741)	Entropy 0.69634 (0.69843)	Top-1 acc 59.375 (52.541)	Top-5 acc 80.078 (75.482)	lr 0.01988
Train [36][2880/3239]	Time 0.232 (0.464)	Data Time 0.001 (0.011)	Loss 2.9739 (2.9740)	Entropy 0.69655 (0.69842)	Top-1 acc 53.516 (52.544)	Top-5 acc 77.344 (75.485)	lr 0.01988
Train [36][2890/3239]	Time 0.226 (0.464)	Data Time 0.001 (0.011)	Loss 3.1578 (2.9740)	Entropy 0.69621 (0.69842)	Top-1 acc 48.438 (52.542)	Top-5 acc 72.656 (75.484)	lr 0.01988
Train [36][2900/3239]	Time 0.335 (0.463)	Data Time 0.001 (0.011)	Loss 2.7926 (2.9737)	Entropy 0.69640 (0.69841)	Top-1 acc 57.031 (52.547)	Top-5 acc 76.562 (75.489)	lr 0.01988
Train [36][2910/3239]	Time 0.230 (0.463)	Data Time 0.001 (0.011)	Loss 2.9399 (2.9736)	Entropy 0.69644 (0.69840)	Top-1 acc 53.125 (52.548)	Top-5 acc 76.953 (75.491)	lr 0.01987
Train [36][2920/3239]	Time 0.233 (0.463)	Data Time 0.001 (0.011)	Loss 2.8212 (2.9738)	Entropy 0.69645 (0.69840)	Top-1 acc 54.688 (52.542)	Top-5 acc 80.469 (75.490)	lr 0.01987
Train [36][2930/3239]	Time 0.239 (0.463)	Data Time 0.001 (0.010)	Loss 2.9038 (2.9737)	Entropy 0.69654 (0.69839)	Top-1 acc 52.734 (52.545)	Top-5 acc 80.469 (75.493)	lr 0.01987
Train [36][2940/3239]	Time 0.234 (0.463)	Data Time 0.001 (0.010)	Loss 3.0051 (2.9738)	Entropy 0.69666 (0.69838)	Top-1 acc 50.781 (52.540)	Top-5 acc 72.656 (75.489)	lr 0.01987
Train [36][2950/3239]	Time 0.244 (0.463)	Data Time 0.001 (0.010)	Loss 3.0860 (2.9739)	Entropy 0.69642 (0.69838)	Top-1 acc 51.953 (52.539)	Top-5 acc 72.656 (75.487)	lr 0.01987
Train [36][2960/3239]	Time 0.246 (0.463)	Data Time 0.001 (0.010)	Loss 3.0887 (2.9740)	Entropy 0.69622 (0.69837)	Top-1 acc 48.047 (52.539)	Top-5 acc 73.828 (75.486)	lr 0.01987
Train [36][2970/3239]	Time 0.344 (0.462)	Data Time 0.002 (0.010)	Loss 2.9447 (2.9740)	Entropy 0.69591 (0.69836)	Top-1 acc 52.734 (52.540)	Top-5 acc 74.219 (75.486)	lr 0.01987
Train [36][2980/3239]	Time 0.228 (0.462)	Data Time 0.001 (0.010)	Loss 2.9229 (2.9740)	Entropy 0.69603 (0.69836)	Top-1 acc 52.734 (52.537)	Top-5 acc 80.859 (75.488)	lr 0.01987
Train [36][2990/3239]	Time 0.231 (0.462)	Data Time 0.001 (0.010)	Loss 2.9633 (2.9738)	Entropy 0.69594 (0.69835)	Top-1 acc 53.516 (52.541)	Top-5 acc 76.172 (75.492)	lr 0.01987
Train [36][3000/3239]	Time 0.234 (0.462)	Data Time 0.001 (0.010)	Loss 2.9441 (2.9736)	Entropy 0.69621 (0.69834)	Top-1 acc 54.297 (52.547)	Top-5 acc 75.000 (75.495)	lr 0.01987
Train [36][3010/3239]	Time 0.234 (0.462)	Data Time 0.001 (0.010)	Loss 2.7887 (2.9735)	Entropy 0.69606 (0.69833)	Top-1 acc 58.984 (52.548)	Top-5 acc 80.078 (75.501)	lr 0.01987
Train [36][3020/3239]	Time 0.232 (0.462)	Data Time 0.001 (0.010)	Loss 2.9808 (2.9733)	Entropy 0.69621 (0.69833)	Top-1 acc 48.047 (52.552)	Top-5 acc 75.000 (75.505)	lr 0.01987
Train [36][3030/3239]	Time 0.240 (0.462)	Data Time 0.001 (0.010)	Loss 2.9914 (2.9734)	Entropy 0.69631 (0.69832)	Top-1 acc 54.297 (52.551)	Top-5 acc 75.391 (75.505)	lr 0.01986
Train [36][3040/3239]	Time 0.245 (0.461)	Data Time 0.001 (0.010)	Loss 2.8719 (2.9732)	Entropy 0.69667 (0.69831)	Top-1 acc 53.516 (52.556)	Top-5 acc 77.344 (75.510)	lr 0.01986
Train [36][3050/3239]	Time 0.234 (0.461)	Data Time 0.001 (0.010)	Loss 2.9871 (2.9733)	Entropy 0.69699 (0.69831)	Top-1 acc 54.297 (52.553)	Top-5 acc 75.391 (75.510)	lr 0.01986
Train [36][3060/3239]	Time 0.356 (0.461)	Data Time 0.001 (0.010)	Loss 2.9414 (2.9734)	Entropy 0.69655 (0.69830)	Top-1 acc 55.078 (52.552)	Top-5 acc 77.344 (75.508)	lr 0.01986
Train [36][3070/3239]	Time 0.238 (0.461)	Data Time 0.001 (0.010)	Loss 3.0940 (2.9733)	Entropy 0.69674 (0.69830)	Top-1 acc 50.000 (52.554)	Top-5 acc 73.047 (75.512)	lr 0.01986
Train [36][3080/3239]	Time 0.234 (0.461)	Data Time 0.001 (0.010)	Loss 2.9296 (2.9733)	Entropy 0.69675 (0.69829)	Top-1 acc 55.078 (52.555)	Top-5 acc 77.734 (75.512)	lr 0.01986
Train [36][3090/3239]	Time 0.235 (0.461)	Data Time 0.001 (0.010)	Loss 3.0261 (2.9732)	Entropy 0.69672 (0.69829)	Top-1 acc 52.734 (52.558)	Top-5 acc 71.875 (75.518)	lr 0.01986
Train [36][3100/3239]	Time 0.236 (0.461)	Data Time 0.001 (0.010)	Loss 3.1402 (2.9731)	Entropy 0.69694 (0.69828)	Top-1 acc 50.391 (52.559)	Top-5 acc 73.047 (75.519)	lr 0.01986
Train [36][3110/3239]	Time 0.241 (0.460)	Data Time 0.001 (0.010)	Loss 2.8911 (2.9732)	Entropy 0.69661 (0.69828)	Top-1 acc 53.906 (52.555)	Top-5 acc 76.953 (75.518)	lr 0.01986
Train [36][3120/3239]	Time 0.234 (0.460)	Data Time 0.001 (0.010)	Loss 2.6961 (2.9733)	Entropy 0.69678 (0.69827)	Top-1 acc 60.156 (52.553)	Top-5 acc 80.078 (75.517)	lr 0.01986
Train [36][3130/3239]	Time 0.320 (0.460)	Data Time 0.001 (0.010)	Loss 3.0129 (2.9734)	Entropy 0.69671 (0.69827)	Top-1 acc 52.344 (52.550)	Top-5 acc 74.219 (75.515)	lr 0.01986
Train [36][3140/3239]	Time 0.237 (0.460)	Data Time 0.002 (0.010)	Loss 3.1386 (2.9734)	Entropy 0.69684 (0.69826)	Top-1 acc 50.000 (52.551)	Top-5 acc 75.000 (75.513)	lr 0.01986
Train [36][3150/3239]	Time 0.244 (0.460)	Data Time 0.002 (0.010)	Loss 2.9446 (2.9733)	Entropy 0.69600 (0.69826)	Top-1 acc 57.031 (52.553)	Top-5 acc 75.781 (75.513)	lr 0.01985
Train [36][3160/3239]	Time 0.420 (0.468)	Data Time 0.005 (0.010)	Loss 2.9889 (2.9737)	Entropy 0.69574 (0.69825)	Top-1 acc 50.781 (52.546)	Top-5 acc 75.781 (75.509)	lr 0.01985
Train [36][3170/3239]	Time 0.272 (0.468)	Data Time 0.003 (0.010)	Loss 2.8928 (2.9737)	Entropy 0.69589 (0.69824)	Top-1 acc 56.250 (52.547)	Top-5 acc 77.734 (75.508)	lr 0.01985
Train [36][3180/3239]	Time 0.239 (0.468)	Data Time 0.000 (0.010)	Loss 2.8618 (2.9736)	Entropy 0.69586 (0.69823)	Top-1 acc 52.734 (52.548)	Top-5 acc 79.688 (75.509)	lr 0.01985
Train [36][3190/3239]	Time 0.237 (0.468)	Data Time 0.000 (0.010)	Loss 2.9979 (2.9739)	Entropy 0.69626 (0.69823)	Top-1 acc 52.734 (52.546)	Top-5 acc 74.219 (75.505)	lr 0.01985
Train [36][3200/3239]	Time 0.242 (0.468)	Data Time 0.000 (0.010)	Loss 2.9684 (2.9737)	Entropy 0.69618 (0.69822)	Top-1 acc 51.172 (52.545)	Top-5 acc 75.391 (75.506)	lr 0.01985
Train [36][3210/3239]	Time 0.247 (0.468)	Data Time 0.000 (0.010)	Loss 2.8896 (2.9737)	Entropy 0.69588 (0.69821)	Top-1 acc 57.031 (52.545)	Top-5 acc 75.781 (75.508)	lr 0.01985
Train [36][3220/3239]	Time 0.358 (0.468)	Data Time 0.000 (0.010)	Loss 3.1804 (2.9737)	Entropy 0.69588 (0.69821)	Top-1 acc 48.438 (52.543)	Top-5 acc 71.484 (75.507)	lr 0.01985
Train [36][3230/3239]	Time 0.252 (0.468)	Data Time 0.000 (0.010)	Loss 2.8278 (2.9736)	Entropy 0.69584 (0.69820)	Top-1 acc 58.594 (52.546)	Top-5 acc 75.781 (75.508)	lr 0.01985
Train [36][3239/3239]	Time 0.922 (0.467)	Data Time 0.000 (0.010)	Loss 3.2154 (2.9737)	Entropy 0.69582 (0.69819)	Top-1 acc 48.148 (52.545)	Top-5 acc 75.309 (75.506)	lr 0.01985
==========Valid [36/120]	loss 1.682	top-1 acc 61.688 (61.688)	top-5 acc 83.424	Train top-1 52.545	top-5 75.506	Entropy 0.69582	Latency-None: 0.000ms	Flops: 539.76M
Train [37][0/3239]	Time 26.312 (26.312)	Data Time 24.916 (24.916)	Loss 2.7593 (2.7593)	Entropy 0.69584 (0.69584)	Top-1 acc 57.031 (57.031)	Top-5 acc 81.250 (81.250)	lr 0.01985
Train [37][10/3239]	Time 0.238 (2.916)	Data Time 0.001 (2.299)	Loss 3.0287 (2.9788)	Entropy 0.69602 (0.69591)	Top-1 acc 51.562 (52.983)	Top-5 acc 75.000 (75.746)	lr 0.01985
Train [37][20/3239]	Time 0.239 (1.726)	Data Time 0.001 (1.205)	Loss 2.9601 (2.9668)	Entropy 0.69598 (0.69591)	Top-1 acc 55.078 (53.069)	Top-5 acc 76.172 (75.911)	lr 0.01985
Train [37][30/3239]	Time 0.239 (1.311)	Data Time 0.001 (0.817)	Loss 2.9009 (2.9395)	Entropy 0.69602 (0.69594)	Top-1 acc 55.859 (53.793)	Top-5 acc 77.734 (76.373)	lr 0.01984
Train [37][40/3239]	Time 0.232 (1.092)	Data Time 0.001 (0.618)	Loss 2.8436 (2.9312)	Entropy 0.69621 (0.69600)	Top-1 acc 56.250 (53.897)	Top-5 acc 77.344 (76.467)	lr 0.01984
Train [37][50/3239]	Time 0.232 (0.963)	Data Time 0.001 (0.497)	Loss 3.0884 (2.9447)	Entropy 0.69579 (0.69601)	Top-1 acc 47.266 (53.577)	Top-5 acc 71.875 (76.118)	lr 0.01984
Train [37][60/3239]	Time 0.224 (0.873)	Data Time 0.001 (0.416)	Loss 2.9111 (2.9469)	Entropy 0.69553 (0.69598)	Top-1 acc 53.906 (53.356)	Top-5 acc 76.172 (76.005)	lr 0.01984
Train [37][70/3239]	Time 0.274 (0.810)	Data Time 0.001 (0.357)	Loss 3.1491 (2.9528)	Entropy 0.69546 (0.69590)	Top-1 acc 48.438 (53.042)	Top-5 acc 71.484 (75.875)	lr 0.01984
Train [37][80/3239]	Time 0.236 (0.767)	Data Time 0.001 (0.314)	Loss 3.0046 (2.9563)	Entropy 0.69520 (0.69583)	Top-1 acc 46.094 (52.956)	Top-5 acc 74.609 (75.810)	lr 0.01984
Train [37][90/3239]	Time 0.229 (0.728)	Data Time 0.001 (0.279)	Loss 2.9785 (2.9478)	Entropy 0.69492 (0.69576)	Top-1 acc 55.469 (53.189)	Top-5 acc 76.953 (75.962)	lr 0.01984
Train [37][100/3239]	Time 0.261 (0.700)	Data Time 0.001 (0.252)	Loss 2.7829 (2.9471)	Entropy 0.69454 (0.69568)	Top-1 acc 55.859 (53.098)	Top-5 acc 82.422 (76.013)	lr 0.01984
Train [37][110/3239]	Time 0.246 (0.675)	Data Time 0.002 (0.229)	Loss 2.9671 (2.9515)	Entropy 0.69421 (0.69557)	Top-1 acc 55.078 (53.026)	Top-5 acc 76.562 (75.841)	lr 0.01984
Train [37][120/3239]	Time 0.338 (0.654)	Data Time 0.001 (0.211)	Loss 3.0870 (2.9517)	Entropy 0.69388 (0.69544)	Top-1 acc 52.344 (53.057)	Top-5 acc 73.828 (75.859)	lr 0.01984
Train [37][130/3239]	Time 0.242 (0.636)	Data Time 0.001 (0.195)	Loss 2.7973 (2.9558)	Entropy 0.69385 (0.69532)	Top-1 acc 60.156 (52.979)	Top-5 acc 78.516 (75.868)	lr 0.01984
Train [37][140/3239]	Time 0.229 (0.620)	Data Time 0.001 (0.181)	Loss 2.9374 (2.9592)	Entropy 0.69395 (0.69522)	Top-1 acc 56.250 (52.912)	Top-5 acc 75.391 (75.792)	lr 0.01984
Train [37][150/3239]	Time 0.231 (0.607)	Data Time 0.001 (0.169)	Loss 2.9802 (2.9565)	Entropy 0.69447 (0.69515)	Top-1 acc 52.344 (52.954)	Top-5 acc 75.391 (75.797)	lr 0.01984
Train [37][160/3239]	Time 0.242 (0.595)	Data Time 0.002 (0.159)	Loss 2.8707 (2.9583)	Entropy 0.69429 (0.69510)	Top-1 acc 54.688 (52.962)	Top-5 acc 77.734 (75.806)	lr 0.01983
Train [37][170/3239]	Time 0.286 (0.586)	Data Time 0.003 (0.149)	Loss 3.1337 (2.9559)	Entropy 0.69400 (0.69505)	Top-1 acc 48.438 (53.027)	Top-5 acc 75.781 (75.900)	lr 0.01983
Train [37][180/3239]	Time 0.219 (0.577)	Data Time 0.001 (0.141)	Loss 3.1095 (2.9567)	Entropy 0.69405 (0.69499)	Top-1 acc 50.391 (52.946)	Top-5 acc 70.703 (75.872)	lr 0.01983
Train [37][190/3239]	Time 0.335 (0.569)	Data Time 0.001 (0.134)	Loss 2.9464 (2.9581)	Entropy 0.69446 (0.69494)	Top-1 acc 52.734 (52.939)	Top-5 acc 74.609 (75.804)	lr 0.01983
Train [37][200/3239]	Time 0.237 (0.562)	Data Time 0.001 (0.127)	Loss 2.7425 (2.9562)	Entropy 0.69458 (0.69492)	Top-1 acc 55.859 (52.981)	Top-5 acc 80.859 (75.836)	lr 0.01983
Train [37][210/3239]	Time 0.255 (0.555)	Data Time 0.001 (0.121)	Loss 2.9253 (2.9586)	Entropy 0.69427 (0.69490)	Top-1 acc 53.906 (52.899)	Top-5 acc 75.391 (75.768)	lr 0.01983
Train [37][220/3239]	Time 0.247 (0.550)	Data Time 0.001 (0.116)	Loss 2.8922 (2.9583)	Entropy 0.69385 (0.69486)	Top-1 acc 53.906 (52.909)	Top-5 acc 75.391 (75.792)	lr 0.01983
Train [37][230/3239]	Time 0.241 (0.544)	Data Time 0.001 (0.111)	Loss 2.9471 (2.9568)	Entropy 0.69405 (0.69482)	Top-1 acc 55.859 (52.985)	Top-5 acc 77.734 (75.862)	lr 0.01983
Train [37][240/3239]	Time 0.223 (0.540)	Data Time 0.001 (0.107)	Loss 2.9467 (2.9546)	Entropy 0.69411 (0.69479)	Top-1 acc 55.469 (53.047)	Top-5 acc 77.734 (75.919)	lr 0.01983
Train [37][250/3239]	Time 0.236 (0.534)	Data Time 0.001 (0.102)	Loss 2.9801 (2.9553)	Entropy 0.69421 (0.69477)	Top-1 acc 57.422 (53.071)	Top-5 acc 75.000 (75.898)	lr 0.01983
Train [37][260/3239]	Time 0.236 (0.530)	Data Time 0.001 (0.098)	Loss 2.7919 (2.9526)	Entropy 0.69422 (0.69474)	Top-1 acc 55.859 (53.170)	Top-5 acc 78.906 (75.967)	lr 0.01983
Train [37][270/3239]	Time 0.250 (0.526)	Data Time 0.003 (0.095)	Loss 2.8812 (2.9529)	Entropy 0.69414 (0.69473)	Top-1 acc 56.250 (53.164)	Top-5 acc 78.125 (75.956)	lr 0.01983
Train [37][280/3239]	Time 0.319 (0.522)	Data Time 0.001 (0.092)	Loss 2.8374 (2.9527)	Entropy 0.69409 (0.69471)	Top-1 acc 55.469 (53.186)	Top-5 acc 80.078 (75.966)	lr 0.01982
Train [37][290/3239]	Time 0.256 (0.518)	Data Time 0.001 (0.089)	Loss 2.9371 (2.9517)	Entropy 0.69404 (0.69469)	Top-1 acc 53.906 (53.196)	Top-5 acc 76.562 (75.980)	lr 0.01982
Train [37][300/3239]	Time 0.239 (0.514)	Data Time 0.001 (0.086)	Loss 2.8770 (2.9516)	Entropy 0.69376 (0.69466)	Top-1 acc 53.516 (53.169)	Top-5 acc 73.828 (75.959)	lr 0.01982
Train [37][310/3239]	Time 0.237 (0.511)	Data Time 0.001 (0.083)	Loss 3.2018 (2.9505)	Entropy 0.69390 (0.69463)	Top-1 acc 47.656 (53.193)	Top-5 acc 71.094 (75.962)	lr 0.01982
Train [37][320/3239]	Time 0.237 (0.508)	Data Time 0.001 (0.080)	Loss 2.7820 (2.9486)	Entropy 0.69376 (0.69461)	Top-1 acc 57.812 (53.233)	Top-5 acc 77.734 (75.980)	lr 0.01982
Train [37][330/3239]	Time 0.236 (0.505)	Data Time 0.001 (0.078)	Loss 2.9339 (2.9492)	Entropy 0.69399 (0.69458)	Top-1 acc 54.297 (53.219)	Top-5 acc 75.391 (75.956)	lr 0.01982
Train [37][340/3239]	Time 0.222 (0.502)	Data Time 0.001 (0.076)	Loss 3.0032 (2.9479)	Entropy 0.69375 (0.69456)	Top-1 acc 51.562 (53.259)	Top-5 acc 76.562 (75.983)	lr 0.01982
Train [37][350/3239]	Time 0.319 (0.499)	Data Time 0.001 (0.074)	Loss 2.7872 (2.9476)	Entropy 0.69337 (0.69453)	Top-1 acc 55.078 (53.259)	Top-5 acc 80.078 (76.006)	lr 0.01982
Train [37][360/3239]	Time 0.234 (0.496)	Data Time 0.006 (0.072)	Loss 3.0150 (2.9491)	Entropy 0.69312 (0.69450)	Top-1 acc 54.297 (53.245)	Top-5 acc 73.828 (75.958)	lr 0.01982
Train [37][370/3239]	Time 0.227 (0.494)	Data Time 0.001 (0.070)	Loss 3.0523 (2.9501)	Entropy 0.69324 (0.69446)	Top-1 acc 52.344 (53.237)	Top-5 acc 72.656 (75.936)	lr 0.01982
Train [37][380/3239]	Time 0.219 (0.492)	Data Time 0.001 (0.068)	Loss 3.0192 (2.9498)	Entropy 0.69333 (0.69443)	Top-1 acc 51.562 (53.239)	Top-5 acc 73.438 (75.942)	lr 0.01982
Train [37][390/3239]	Time 0.229 (0.490)	Data Time 0.001 (0.066)	Loss 2.9264 (2.9502)	Entropy 0.69366 (0.69441)	Top-1 acc 54.297 (53.235)	Top-5 acc 76.953 (75.942)	lr 0.01982
Train [37][400/3239]	Time 0.236 (0.488)	Data Time 0.001 (0.065)	Loss 3.0135 (2.9497)	Entropy 0.69402 (0.69439)	Top-1 acc 51.562 (53.237)	Top-5 acc 74.219 (75.951)	lr 0.01981
Train [37][410/3239]	Time 0.251 (0.486)	Data Time 0.001 (0.063)	Loss 2.8625 (2.9490)	Entropy 0.69421 (0.69438)	Top-1 acc 56.641 (53.261)	Top-5 acc 78.516 (75.955)	lr 0.01981
Train [37][420/3239]	Time 0.236 (0.484)	Data Time 0.001 (0.062)	Loss 2.9572 (2.9500)	Entropy 0.69416 (0.69438)	Top-1 acc 53.125 (53.247)	Top-5 acc 78.125 (75.957)	lr 0.01981
Train [37][430/3239]	Time 0.230 (0.482)	Data Time 0.001 (0.060)	Loss 2.9490 (2.9506)	Entropy 0.69410 (0.69437)	Top-1 acc 50.781 (53.235)	Top-5 acc 75.781 (75.954)	lr 0.01981
Train [37][440/3239]	Time 0.274 (0.481)	Data Time 0.002 (0.059)	Loss 2.9117 (2.9498)	Entropy 0.69396 (0.69436)	Top-1 acc 48.438 (53.252)	Top-5 acc 77.344 (75.957)	lr 0.01981
Train [37][450/3239]	Time 0.237 (0.479)	Data Time 0.001 (0.058)	Loss 2.9770 (2.9513)	Entropy 0.69402 (0.69435)	Top-1 acc 50.391 (53.199)	Top-5 acc 75.781 (75.913)	lr 0.01981
Train [37][460/3239]	Time 0.236 (0.477)	Data Time 0.001 (0.056)	Loss 3.1256 (2.9514)	Entropy 0.69423 (0.69435)	Top-1 acc 49.609 (53.180)	Top-5 acc 76.562 (75.930)	lr 0.01981
Train [37][470/3239]	Time 0.239 (0.476)	Data Time 0.001 (0.055)	Loss 2.8924 (2.9516)	Entropy 0.69396 (0.69434)	Top-1 acc 57.812 (53.190)	Top-5 acc 78.125 (75.932)	lr 0.01981
Train [37][480/3239]	Time 0.223 (0.474)	Data Time 0.001 (0.054)	Loss 3.0227 (2.9530)	Entropy 0.69414 (0.69434)	Top-1 acc 51.172 (53.157)	Top-5 acc 74.609 (75.913)	lr 0.01981
Train [37][490/3239]	Time 0.226 (0.473)	Data Time 0.001 (0.053)	Loss 2.8656 (2.9535)	Entropy 0.69438 (0.69433)	Top-1 acc 53.906 (53.156)	Top-5 acc 78.516 (75.893)	lr 0.01981
Train [37][500/3239]	Time 0.233 (0.471)	Data Time 0.001 (0.052)	Loss 2.8723 (2.9530)	Entropy 0.69434 (0.69433)	Top-1 acc 55.078 (53.161)	Top-5 acc 77.734 (75.912)	lr 0.01981
Train [37][510/3239]	Time 0.325 (0.470)	Data Time 0.001 (0.051)	Loss 3.0769 (2.9528)	Entropy 0.69447 (0.69434)	Top-1 acc 50.000 (53.167)	Top-5 acc 69.922 (75.926)	lr 0.01981
Train [37][520/3239]	Time 0.238 (0.469)	Data Time 0.001 (0.050)	Loss 2.8252 (2.9522)	Entropy 0.69445 (0.69434)	Top-1 acc 56.641 (53.200)	Top-5 acc 78.516 (75.936)	lr 0.01980
Train [37][530/3239]	Time 0.230 (0.468)	Data Time 0.001 (0.049)	Loss 2.9540 (2.9521)	Entropy 0.69426 (0.69434)	Top-1 acc 50.391 (53.196)	Top-5 acc 74.219 (75.935)	lr 0.01980
Train [37][540/3239]	Time 0.218 (0.467)	Data Time 0.001 (0.048)	Loss 3.1756 (2.9541)	Entropy 0.69435 (0.69434)	Top-1 acc 51.562 (53.163)	Top-5 acc 69.922 (75.896)	lr 0.01980
Train [37][550/3239]	Time 0.228 (0.465)	Data Time 0.001 (0.047)	Loss 2.8143 (2.9549)	Entropy 0.69448 (0.69434)	Top-1 acc 55.078 (53.160)	Top-5 acc 78.906 (75.873)	lr 0.01980
Train [37][560/3239]	Time 0.220 (0.464)	Data Time 0.001 (0.047)	Loss 2.9981 (2.9539)	Entropy 0.69463 (0.69434)	Top-1 acc 53.516 (53.183)	Top-5 acc 73.828 (75.880)	lr 0.01980
Train [37][570/3239]	Time 0.227 (0.463)	Data Time 0.001 (0.046)	Loss 2.9881 (2.9543)	Entropy 0.69479 (0.69435)	Top-1 acc 51.172 (53.169)	Top-5 acc 75.391 (75.863)	lr 0.01980
Train [37][580/3239]	Time 0.314 (0.521)	Data Time 0.004 (0.045)	Loss 2.9304 (2.9543)	Entropy 0.69460 (0.69436)	Top-1 acc 53.125 (53.161)	Top-5 acc 77.344 (75.866)	lr 0.01980
Train [37][590/3239]	Time 0.240 (0.519)	Data Time 0.002 (0.045)	Loss 3.1651 (2.9549)	Entropy 0.69438 (0.69436)	Top-1 acc 49.609 (53.149)	Top-5 acc 71.094 (75.863)	lr 0.01980
Train [37][600/3239]	Time 0.274 (0.517)	Data Time 0.001 (0.044)	Loss 3.1593 (2.9557)	Entropy 0.69429 (0.69436)	Top-1 acc 49.609 (53.128)	Top-5 acc 69.141 (75.854)	lr 0.01980
Train [37][610/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.043)	Loss 2.8876 (2.9551)	Entropy 0.69420 (0.69436)	Top-1 acc 56.641 (53.139)	Top-5 acc 77.344 (75.870)	lr 0.01980
Train [37][620/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.042)	Loss 2.6191 (2.9545)	Entropy 0.69385 (0.69436)	Top-1 acc 60.938 (53.152)	Top-5 acc 80.469 (75.877)	lr 0.01980
Train [37][630/3239]	Time 0.232 (0.512)	Data Time 0.001 (0.042)	Loss 2.9312 (2.9544)	Entropy 0.69379 (0.69435)	Top-1 acc 51.172 (53.155)	Top-5 acc 76.953 (75.886)	lr 0.01980
Train [37][640/3239]	Time 0.226 (0.511)	Data Time 0.001 (0.041)	Loss 2.7205 (2.9539)	Entropy 0.69364 (0.69434)	Top-1 acc 59.766 (53.166)	Top-5 acc 78.906 (75.891)	lr 0.01979
Train [37][650/3239]	Time 0.267 (0.509)	Data Time 0.001 (0.041)	Loss 2.9774 (2.9539)	Entropy 0.69364 (0.69433)	Top-1 acc 53.516 (53.176)	Top-5 acc 76.953 (75.894)	lr 0.01979
Train [37][660/3239]	Time 0.228 (0.508)	Data Time 0.001 (0.040)	Loss 3.2553 (2.9560)	Entropy 0.69359 (0.69432)	Top-1 acc 44.922 (53.114)	Top-5 acc 67.188 (75.859)	lr 0.01979
Train [37][670/3239]	Time 0.335 (0.507)	Data Time 0.001 (0.039)	Loss 3.0050 (2.9564)	Entropy 0.69371 (0.69431)	Top-1 acc 52.734 (53.106)	Top-5 acc 77.734 (75.850)	lr 0.01979
Train [37][680/3239]	Time 0.224 (0.505)	Data Time 0.001 (0.039)	Loss 2.9357 (2.9560)	Entropy 0.69363 (0.69430)	Top-1 acc 51.562 (53.104)	Top-5 acc 77.734 (75.855)	lr 0.01979
Train [37][690/3239]	Time 0.229 (0.504)	Data Time 0.001 (0.038)	Loss 3.0733 (2.9560)	Entropy 0.69336 (0.69429)	Top-1 acc 50.781 (53.114)	Top-5 acc 70.703 (75.842)	lr 0.01979
Train [37][700/3239]	Time 0.227 (0.502)	Data Time 0.001 (0.038)	Loss 3.0976 (2.9558)	Entropy 0.69342 (0.69427)	Top-1 acc 48.438 (53.128)	Top-5 acc 71.094 (75.830)	lr 0.01979
Train [37][710/3239]	Time 0.243 (0.501)	Data Time 0.001 (0.037)	Loss 2.8065 (2.9552)	Entropy 0.69324 (0.69426)	Top-1 acc 56.641 (53.141)	Top-5 acc 77.734 (75.838)	lr 0.01979
Train [37][720/3239]	Time 0.228 (0.500)	Data Time 0.001 (0.037)	Loss 2.9063 (2.9548)	Entropy 0.69334 (0.69425)	Top-1 acc 54.688 (53.148)	Top-5 acc 76.562 (75.840)	lr 0.01979
Train [37][730/3239]	Time 0.258 (0.498)	Data Time 0.001 (0.036)	Loss 2.9525 (2.9554)	Entropy 0.69315 (0.69423)	Top-1 acc 52.734 (53.131)	Top-5 acc 75.781 (75.820)	lr 0.01979
Train [37][740/3239]	Time 0.359 (0.497)	Data Time 0.001 (0.036)	Loss 2.9135 (2.9556)	Entropy 0.69302 (0.69422)	Top-1 acc 52.344 (53.138)	Top-5 acc 76.172 (75.812)	lr 0.01979
Train [37][750/3239]	Time 0.227 (0.496)	Data Time 0.001 (0.035)	Loss 2.8853 (2.9554)	Entropy 0.69320 (0.69420)	Top-1 acc 54.688 (53.122)	Top-5 acc 76.172 (75.815)	lr 0.01979
Train [37][760/3239]	Time 0.220 (0.495)	Data Time 0.001 (0.035)	Loss 2.8383 (2.9550)	Entropy 0.69339 (0.69419)	Top-1 acc 53.906 (53.121)	Top-5 acc 77.344 (75.829)	lr 0.01979
Train [37][770/3239]	Time 0.231 (0.494)	Data Time 0.001 (0.035)	Loss 3.1282 (2.9540)	Entropy 0.69359 (0.69418)	Top-1 acc 50.000 (53.136)	Top-5 acc 73.438 (75.843)	lr 0.01978
Train [37][780/3239]	Time 0.226 (0.492)	Data Time 0.001 (0.034)	Loss 2.9149 (2.9540)	Entropy 0.69279 (0.69417)	Top-1 acc 53.516 (53.138)	Top-5 acc 73.828 (75.828)	lr 0.01978
Train [37][790/3239]	Time 0.252 (0.491)	Data Time 0.001 (0.034)	Loss 3.0579 (2.9548)	Entropy 0.69277 (0.69415)	Top-1 acc 52.734 (53.135)	Top-5 acc 73.438 (75.809)	lr 0.01978
Train [37][800/3239]	Time 0.258 (0.490)	Data Time 0.001 (0.033)	Loss 2.9954 (2.9550)	Entropy 0.69269 (0.69413)	Top-1 acc 52.734 (53.144)	Top-5 acc 74.609 (75.799)	lr 0.01978
Train [37][810/3239]	Time 0.237 (0.489)	Data Time 0.001 (0.033)	Loss 2.8403 (2.9546)	Entropy 0.69225 (0.69411)	Top-1 acc 55.469 (53.151)	Top-5 acc 78.516 (75.806)	lr 0.01978
Train [37][820/3239]	Time 0.230 (0.488)	Data Time 0.001 (0.033)	Loss 3.0064 (2.9547)	Entropy 0.69218 (0.69409)	Top-1 acc 53.516 (53.147)	Top-5 acc 75.000 (75.806)	lr 0.01978
Train [37][830/3239]	Time 0.334 (0.487)	Data Time 0.001 (0.032)	Loss 2.7388 (2.9547)	Entropy 0.69240 (0.69407)	Top-1 acc 57.031 (53.151)	Top-5 acc 81.641 (75.806)	lr 0.01978
Train [37][840/3239]	Time 0.230 (0.486)	Data Time 0.001 (0.032)	Loss 2.8242 (2.9548)	Entropy 0.69228 (0.69405)	Top-1 acc 55.859 (53.151)	Top-5 acc 77.344 (75.809)	lr 0.01978
Train [37][850/3239]	Time 0.221 (0.485)	Data Time 0.001 (0.031)	Loss 3.2108 (2.9559)	Entropy 0.69219 (0.69403)	Top-1 acc 44.531 (53.136)	Top-5 acc 71.094 (75.776)	lr 0.01978
Train [37][860/3239]	Time 0.238 (0.485)	Data Time 0.001 (0.031)	Loss 2.8332 (2.9555)	Entropy 0.69158 (0.69400)	Top-1 acc 53.906 (53.141)	Top-5 acc 78.516 (75.778)	lr 0.01978
Train [37][870/3239]	Time 0.232 (0.484)	Data Time 0.001 (0.031)	Loss 2.9230 (2.9552)	Entropy 0.69128 (0.69397)	Top-1 acc 51.172 (53.145)	Top-5 acc 75.781 (75.790)	lr 0.01978
Train [37][880/3239]	Time 0.260 (0.483)	Data Time 0.001 (0.030)	Loss 3.0286 (2.9547)	Entropy 0.69165 (0.69394)	Top-1 acc 51.172 (53.160)	Top-5 acc 73.438 (75.803)	lr 0.01978
Train [37][890/3239]	Time 0.232 (0.482)	Data Time 0.001 (0.030)	Loss 2.8149 (2.9546)	Entropy 0.69116 (0.69392)	Top-1 acc 53.906 (53.168)	Top-5 acc 78.516 (75.797)	lr 0.01977
Train [37][900/3239]	Time 0.317 (0.481)	Data Time 0.001 (0.030)	Loss 2.8175 (2.9536)	Entropy 0.69124 (0.69389)	Top-1 acc 56.250 (53.174)	Top-5 acc 81.250 (75.824)	lr 0.01977
Train [37][910/3239]	Time 0.223 (0.480)	Data Time 0.001 (0.029)	Loss 2.9201 (2.9530)	Entropy 0.69133 (0.69386)	Top-1 acc 55.859 (53.198)	Top-5 acc 77.344 (75.840)	lr 0.01977
Train [37][920/3239]	Time 0.237 (0.479)	Data Time 0.001 (0.029)	Loss 2.8694 (2.9535)	Entropy 0.69137 (0.69383)	Top-1 acc 57.422 (53.190)	Top-5 acc 77.734 (75.836)	lr 0.01977
Train [37][930/3239]	Time 0.230 (0.478)	Data Time 0.001 (0.029)	Loss 3.2405 (2.9546)	Entropy 0.69137 (0.69380)	Top-1 acc 45.312 (53.155)	Top-5 acc 72.266 (75.816)	lr 0.01977
Train [37][940/3239]	Time 0.226 (0.477)	Data Time 0.001 (0.029)	Loss 2.9367 (2.9536)	Entropy 0.69139 (0.69378)	Top-1 acc 48.438 (53.169)	Top-5 acc 75.391 (75.833)	lr 0.01977
Train [37][950/3239]	Time 0.218 (0.477)	Data Time 0.001 (0.028)	Loss 2.9990 (2.9534)	Entropy 0.69149 (0.69375)	Top-1 acc 48.828 (53.166)	Top-5 acc 76.953 (75.834)	lr 0.01977
Train [37][960/3239]	Time 0.226 (0.476)	Data Time 0.001 (0.028)	Loss 2.8694 (2.9533)	Entropy 0.69173 (0.69373)	Top-1 acc 55.078 (53.173)	Top-5 acc 76.172 (75.829)	lr 0.01977
Train [37][970/3239]	Time 0.250 (0.475)	Data Time 0.001 (0.028)	Loss 3.0435 (2.9529)	Entropy 0.69179 (0.69371)	Top-1 acc 54.297 (53.176)	Top-5 acc 73.047 (75.840)	lr 0.01977
Train [37][980/3239]	Time 0.235 (0.474)	Data Time 0.001 (0.028)	Loss 2.8627 (2.9531)	Entropy 0.69161 (0.69369)	Top-1 acc 53.516 (53.166)	Top-5 acc 76.953 (75.840)	lr 0.01977
Train [37][990/3239]	Time 0.307 (0.474)	Data Time 0.001 (0.027)	Loss 2.9225 (2.9536)	Entropy 0.69153 (0.69367)	Top-1 acc 54.688 (53.153)	Top-5 acc 76.562 (75.823)	lr 0.01977
Train [37][1000/3239]	Time 0.233 (0.473)	Data Time 0.001 (0.027)	Loss 2.8855 (2.9533)	Entropy 0.69161 (0.69365)	Top-1 acc 54.297 (53.172)	Top-5 acc 75.781 (75.830)	lr 0.01977
Train [37][1010/3239]	Time 0.230 (0.472)	Data Time 0.001 (0.027)	Loss 2.9050 (2.9533)	Entropy 0.69174 (0.69363)	Top-1 acc 56.641 (53.176)	Top-5 acc 78.516 (75.833)	lr 0.01976
Train [37][1020/3239]	Time 0.228 (0.471)	Data Time 0.001 (0.027)	Loss 3.3376 (2.9530)	Entropy 0.69170 (0.69361)	Top-1 acc 42.578 (53.185)	Top-5 acc 69.141 (75.835)	lr 0.01976
Train [37][1030/3239]	Time 0.234 (0.471)	Data Time 0.001 (0.026)	Loss 2.9781 (2.9521)	Entropy 0.69191 (0.69359)	Top-1 acc 52.344 (53.202)	Top-5 acc 73.828 (75.854)	lr 0.01976
Train [37][1040/3239]	Time 0.232 (0.470)	Data Time 0.001 (0.026)	Loss 2.7718 (2.9520)	Entropy 0.69190 (0.69358)	Top-1 acc 60.156 (53.204)	Top-5 acc 77.734 (75.868)	lr 0.01976
Train [37][1050/3239]	Time 0.222 (0.469)	Data Time 0.001 (0.026)	Loss 3.0577 (2.9525)	Entropy 0.69219 (0.69356)	Top-1 acc 52.344 (53.192)	Top-5 acc 74.219 (75.855)	lr 0.01976
Train [37][1060/3239]	Time 0.318 (0.468)	Data Time 0.001 (0.026)	Loss 2.8067 (2.9528)	Entropy 0.69211 (0.69355)	Top-1 acc 58.984 (53.186)	Top-5 acc 80.469 (75.859)	lr 0.01976
Train [37][1070/3239]	Time 0.222 (0.468)	Data Time 0.001 (0.025)	Loss 2.9798 (2.9527)	Entropy 0.69236 (0.69353)	Top-1 acc 54.297 (53.179)	Top-5 acc 71.875 (75.859)	lr 0.01976
Train [37][1080/3239]	Time 0.232 (0.467)	Data Time 0.001 (0.025)	Loss 2.8738 (2.9523)	Entropy 0.69242 (0.69352)	Top-1 acc 56.641 (53.181)	Top-5 acc 76.172 (75.862)	lr 0.01976
Train [37][1090/3239]	Time 0.243 (0.466)	Data Time 0.001 (0.025)	Loss 2.8673 (2.9519)	Entropy 0.69246 (0.69351)	Top-1 acc 54.297 (53.192)	Top-5 acc 76.172 (75.864)	lr 0.01976
Train [37][1100/3239]	Time 0.237 (0.466)	Data Time 0.002 (0.025)	Loss 3.0459 (2.9520)	Entropy 0.69239 (0.69350)	Top-1 acc 50.000 (53.198)	Top-5 acc 73.438 (75.863)	lr 0.01976
Train [37][1110/3239]	Time 0.259 (0.465)	Data Time 0.001 (0.025)	Loss 3.0972 (2.9525)	Entropy 0.69213 (0.69349)	Top-1 acc 51.172 (53.185)	Top-5 acc 71.484 (75.853)	lr 0.01976
Train [37][1120/3239]	Time 0.239 (0.465)	Data Time 0.001 (0.024)	Loss 2.6186 (2.9522)	Entropy 0.69175 (0.69348)	Top-1 acc 60.547 (53.194)	Top-5 acc 81.250 (75.857)	lr 0.01976
Train [37][1130/3239]	Time 0.230 (0.464)	Data Time 0.001 (0.024)	Loss 2.7979 (2.9519)	Entropy 0.69110 (0.69346)	Top-1 acc 57.812 (53.206)	Top-5 acc 78.125 (75.858)	lr 0.01975
Train [37][1140/3239]	Time 0.229 (0.463)	Data Time 0.001 (0.024)	Loss 2.7947 (2.9517)	Entropy 0.69121 (0.69344)	Top-1 acc 57.812 (53.210)	Top-5 acc 78.516 (75.857)	lr 0.01975
Train [37][1150/3239]	Time 0.224 (0.463)	Data Time 0.001 (0.024)	Loss 3.1207 (2.9521)	Entropy 0.69150 (0.69342)	Top-1 acc 47.266 (53.201)	Top-5 acc 71.484 (75.852)	lr 0.01975
Train [37][1160/3239]	Time 0.215 (0.462)	Data Time 0.001 (0.024)	Loss 3.4004 (2.9522)	Entropy 0.69138 (0.69340)	Top-1 acc 43.359 (53.196)	Top-5 acc 64.453 (75.846)	lr 0.01975
Train [37][1170/3239]	Time 0.232 (0.462)	Data Time 0.001 (0.023)	Loss 2.8039 (2.9529)	Entropy 0.69139 (0.69339)	Top-1 acc 58.203 (53.182)	Top-5 acc 80.469 (75.836)	lr 0.01975
Train [37][1180/3239]	Time 0.262 (0.461)	Data Time 0.001 (0.023)	Loss 2.9319 (2.9531)	Entropy 0.69114 (0.69337)	Top-1 acc 55.469 (53.180)	Top-5 acc 76.953 (75.836)	lr 0.01975
Train [37][1190/3239]	Time 0.233 (0.461)	Data Time 0.001 (0.023)	Loss 3.1295 (2.9532)	Entropy 0.69069 (0.69335)	Top-1 acc 48.047 (53.171)	Top-5 acc 72.656 (75.831)	lr 0.01975
Train [37][1200/3239]	Time 0.231 (0.460)	Data Time 0.001 (0.023)	Loss 2.9599 (2.9527)	Entropy 0.69062 (0.69333)	Top-1 acc 49.609 (53.172)	Top-5 acc 76.172 (75.844)	lr 0.01975
Train [37][1210/3239]	Time 0.225 (0.460)	Data Time 0.001 (0.023)	Loss 3.1484 (2.9533)	Entropy 0.69062 (0.69330)	Top-1 acc 51.562 (53.160)	Top-5 acc 70.703 (75.830)	lr 0.01975
Train [37][1220/3239]	Time 0.314 (0.459)	Data Time 0.001 (0.022)	Loss 3.0750 (2.9533)	Entropy 0.69051 (0.69328)	Top-1 acc 49.609 (53.157)	Top-5 acc 73.438 (75.836)	lr 0.01975
Train [37][1230/3239]	Time 0.358 (0.485)	Data Time 0.005 (0.022)	Loss 3.0458 (2.9535)	Entropy 0.69061 (0.69326)	Top-1 acc 49.609 (53.156)	Top-5 acc 74.609 (75.836)	lr 0.01975
Train [37][1240/3239]	Time 0.279 (0.485)	Data Time 0.003 (0.022)	Loss 3.0904 (2.9538)	Entropy 0.69047 (0.69324)	Top-1 acc 53.125 (53.152)	Top-5 acc 74.219 (75.835)	lr 0.01975
Train [37][1250/3239]	Time 0.238 (0.485)	Data Time 0.002 (0.022)	Loss 2.9358 (2.9545)	Entropy 0.68988 (0.69321)	Top-1 acc 53.906 (53.134)	Top-5 acc 75.781 (75.825)	lr 0.01974
Train [37][1260/3239]	Time 0.240 (0.484)	Data Time 0.001 (0.022)	Loss 2.9172 (2.9539)	Entropy 0.68998 (0.69319)	Top-1 acc 52.344 (53.140)	Top-5 acc 76.172 (75.830)	lr 0.01974
Train [37][1270/3239]	Time 0.233 (0.483)	Data Time 0.001 (0.022)	Loss 2.9668 (2.9539)	Entropy 0.68990 (0.69316)	Top-1 acc 58.984 (53.142)	Top-5 acc 74.609 (75.830)	lr 0.01974
Train [37][1280/3239]	Time 0.237 (0.483)	Data Time 0.001 (0.022)	Loss 2.8453 (2.9540)	Entropy 0.68989 (0.69314)	Top-1 acc 55.859 (53.137)	Top-5 acc 76.953 (75.829)	lr 0.01974
Train [37][1290/3239]	Time 0.226 (0.482)	Data Time 0.001 (0.021)	Loss 2.6509 (2.9533)	Entropy 0.69003 (0.69311)	Top-1 acc 60.156 (53.151)	Top-5 acc 82.812 (75.845)	lr 0.01974
Train [37][1300/3239]	Time 0.228 (0.482)	Data Time 0.001 (0.021)	Loss 2.9468 (2.9536)	Entropy 0.69028 (0.69309)	Top-1 acc 51.953 (53.144)	Top-5 acc 75.391 (75.837)	lr 0.01974
Train [37][1310/3239]	Time 0.227 (0.481)	Data Time 0.001 (0.021)	Loss 3.0362 (2.9536)	Entropy 0.69037 (0.69307)	Top-1 acc 46.484 (53.141)	Top-5 acc 75.000 (75.841)	lr 0.01974
Train [37][1320/3239]	Time 0.228 (0.481)	Data Time 0.001 (0.021)	Loss 3.0405 (2.9533)	Entropy 0.69000 (0.69305)	Top-1 acc 51.172 (53.146)	Top-5 acc 73.438 (75.845)	lr 0.01974
Train [37][1330/3239]	Time 0.231 (0.480)	Data Time 0.002 (0.021)	Loss 2.8484 (2.9526)	Entropy 0.68999 (0.69303)	Top-1 acc 52.734 (53.161)	Top-5 acc 77.344 (75.857)	lr 0.01974
Train [37][1340/3239]	Time 0.228 (0.479)	Data Time 0.001 (0.021)	Loss 2.7981 (2.9523)	Entropy 0.68989 (0.69300)	Top-1 acc 53.906 (53.162)	Top-5 acc 79.688 (75.858)	lr 0.01974
Train [37][1350/3239]	Time 0.226 (0.479)	Data Time 0.001 (0.021)	Loss 2.8196 (2.9522)	Entropy 0.69014 (0.69298)	Top-1 acc 54.688 (53.157)	Top-5 acc 78.125 (75.861)	lr 0.01974
Train [37][1360/3239]	Time 0.253 (0.478)	Data Time 0.001 (0.020)	Loss 3.0507 (2.9521)	Entropy 0.69003 (0.69296)	Top-1 acc 51.562 (53.154)	Top-5 acc 75.391 (75.863)	lr 0.01974
Train [37][1370/3239]	Time 0.225 (0.478)	Data Time 0.001 (0.020)	Loss 2.8064 (2.9519)	Entropy 0.69011 (0.69294)	Top-1 acc 59.766 (53.165)	Top-5 acc 81.250 (75.867)	lr 0.01973
Train [37][1380/3239]	Time 0.319 (0.477)	Data Time 0.001 (0.020)	Loss 2.8658 (2.9523)	Entropy 0.69031 (0.69292)	Top-1 acc 54.297 (53.156)	Top-5 acc 76.562 (75.863)	lr 0.01973
Train [37][1390/3239]	Time 0.220 (0.477)	Data Time 0.001 (0.020)	Loss 2.9353 (2.9527)	Entropy 0.69047 (0.69290)	Top-1 acc 54.688 (53.147)	Top-5 acc 76.172 (75.857)	lr 0.01973
Train [37][1400/3239]	Time 0.234 (0.476)	Data Time 0.001 (0.020)	Loss 2.7853 (2.9522)	Entropy 0.69000 (0.69288)	Top-1 acc 56.641 (53.157)	Top-5 acc 78.906 (75.869)	lr 0.01973
Train [37][1410/3239]	Time 0.228 (0.476)	Data Time 0.002 (0.020)	Loss 3.1715 (2.9520)	Entropy 0.69037 (0.69286)	Top-1 acc 48.047 (53.167)	Top-5 acc 72.266 (75.873)	lr 0.01973
Train [37][1420/3239]	Time 0.244 (0.475)	Data Time 0.001 (0.020)	Loss 2.9330 (2.9524)	Entropy 0.68990 (0.69284)	Top-1 acc 51.562 (53.155)	Top-5 acc 77.734 (75.862)	lr 0.01973
Train [37][1430/3239]	Time 0.230 (0.475)	Data Time 0.001 (0.019)	Loss 2.8233 (2.9524)	Entropy 0.68963 (0.69282)	Top-1 acc 57.422 (53.158)	Top-5 acc 78.516 (75.864)	lr 0.01973
Train [37][1440/3239]	Time 0.234 (0.474)	Data Time 0.001 (0.019)	Loss 2.9464 (2.9526)	Entropy 0.68940 (0.69280)	Top-1 acc 53.906 (53.154)	Top-5 acc 74.609 (75.857)	lr 0.01973
Train [37][1450/3239]	Time 0.320 (0.474)	Data Time 0.001 (0.019)	Loss 3.1444 (2.9531)	Entropy 0.68922 (0.69278)	Top-1 acc 49.609 (53.137)	Top-5 acc 71.094 (75.852)	lr 0.01973
Train [37][1460/3239]	Time 0.226 (0.473)	Data Time 0.001 (0.019)	Loss 2.9598 (2.9530)	Entropy 0.68924 (0.69275)	Top-1 acc 53.906 (53.132)	Top-5 acc 75.391 (75.857)	lr 0.01973
Train [37][1470/3239]	Time 0.228 (0.473)	Data Time 0.001 (0.019)	Loss 3.0471 (2.9530)	Entropy 0.68916 (0.69273)	Top-1 acc 53.125 (53.128)	Top-5 acc 76.172 (75.864)	lr 0.01973
Train [37][1480/3239]	Time 0.230 (0.472)	Data Time 0.001 (0.019)	Loss 3.1580 (2.9529)	Entropy 0.68858 (0.69270)	Top-1 acc 50.000 (53.125)	Top-5 acc 70.703 (75.862)	lr 0.01973
Train [37][1490/3239]	Time 0.223 (0.472)	Data Time 0.001 (0.019)	Loss 3.3679 (2.9536)	Entropy 0.68870 (0.69267)	Top-1 acc 43.750 (53.109)	Top-5 acc 67.969 (75.849)	lr 0.01973
Train [37][1500/3239]	Time 0.240 (0.472)	Data Time 0.001 (0.019)	Loss 2.6947 (2.9535)	Entropy 0.68888 (0.69265)	Top-1 acc 59.766 (53.106)	Top-5 acc 82.422 (75.858)	lr 0.01972
Train [37][1510/3239]	Time 0.225 (0.471)	Data Time 0.001 (0.019)	Loss 3.0503 (2.9539)	Entropy 0.68824 (0.69262)	Top-1 acc 46.484 (53.095)	Top-5 acc 72.266 (75.846)	lr 0.01972
Train [37][1520/3239]	Time 0.248 (0.471)	Data Time 0.001 (0.018)	Loss 2.9365 (2.9544)	Entropy 0.68848 (0.69259)	Top-1 acc 53.906 (53.079)	Top-5 acc 73.438 (75.832)	lr 0.01972
Train [37][1530/3239]	Time 0.240 (0.470)	Data Time 0.001 (0.018)	Loss 2.9867 (2.9547)	Entropy 0.68847 (0.69257)	Top-1 acc 52.734 (53.080)	Top-5 acc 76.172 (75.823)	lr 0.01972
Train [37][1540/3239]	Time 0.331 (0.470)	Data Time 0.001 (0.018)	Loss 2.8969 (2.9544)	Entropy 0.68812 (0.69254)	Top-1 acc 51.562 (53.087)	Top-5 acc 75.391 (75.830)	lr 0.01972
Train [37][1550/3239]	Time 0.254 (0.470)	Data Time 0.001 (0.018)	Loss 2.9379 (2.9548)	Entropy 0.68763 (0.69251)	Top-1 acc 53.125 (53.076)	Top-5 acc 73.438 (75.819)	lr 0.01972
Train [37][1560/3239]	Time 0.221 (0.469)	Data Time 0.001 (0.018)	Loss 2.8549 (2.9550)	Entropy 0.68761 (0.69248)	Top-1 acc 54.688 (53.069)	Top-5 acc 79.297 (75.816)	lr 0.01972
Train [37][1570/3239]	Time 0.245 (0.469)	Data Time 0.001 (0.018)	Loss 2.9207 (2.9548)	Entropy 0.68773 (0.69245)	Top-1 acc 55.859 (53.075)	Top-5 acc 76.953 (75.822)	lr 0.01972
Train [37][1580/3239]	Time 0.239 (0.468)	Data Time 0.001 (0.018)	Loss 2.8475 (2.9548)	Entropy 0.68797 (0.69242)	Top-1 acc 55.859 (53.075)	Top-5 acc 77.344 (75.822)	lr 0.01972
Train [37][1590/3239]	Time 0.271 (0.468)	Data Time 0.001 (0.018)	Loss 2.9372 (2.9549)	Entropy 0.68742 (0.69239)	Top-1 acc 51.953 (53.074)	Top-5 acc 77.344 (75.823)	lr 0.01972
Train [37][1600/3239]	Time 0.234 (0.467)	Data Time 0.001 (0.018)	Loss 2.9570 (2.9552)	Entropy 0.68671 (0.69235)	Top-1 acc 52.344 (53.064)	Top-5 acc 73.438 (75.815)	lr 0.01972
Train [37][1610/3239]	Time 0.316 (0.467)	Data Time 0.001 (0.017)	Loss 2.9848 (2.9554)	Entropy 0.68695 (0.69232)	Top-1 acc 49.609 (53.053)	Top-5 acc 75.391 (75.813)	lr 0.01972
Train [37][1620/3239]	Time 0.230 (0.466)	Data Time 0.001 (0.017)	Loss 2.9366 (2.9552)	Entropy 0.68712 (0.69229)	Top-1 acc 53.125 (53.057)	Top-5 acc 75.000 (75.818)	lr 0.01971
Train [37][1630/3239]	Time 0.223 (0.466)	Data Time 0.001 (0.017)	Loss 3.0914 (2.9554)	Entropy 0.68736 (0.69226)	Top-1 acc 49.609 (53.052)	Top-5 acc 73.828 (75.813)	lr 0.01971
Train [37][1640/3239]	Time 0.224 (0.466)	Data Time 0.001 (0.017)	Loss 3.0071 (2.9557)	Entropy 0.68709 (0.69223)	Top-1 acc 50.781 (53.047)	Top-5 acc 74.609 (75.808)	lr 0.01971
Train [37][1650/3239]	Time 0.230 (0.465)	Data Time 0.001 (0.017)	Loss 2.8979 (2.9558)	Entropy 0.68726 (0.69219)	Top-1 acc 53.516 (53.037)	Top-5 acc 77.734 (75.802)	lr 0.01971
Train [37][1660/3239]	Time 0.239 (0.465)	Data Time 0.001 (0.017)	Loss 3.0670 (2.9559)	Entropy 0.68742 (0.69217)	Top-1 acc 51.953 (53.037)	Top-5 acc 76.172 (75.796)	lr 0.01971
Train [37][1670/3239]	Time 0.232 (0.464)	Data Time 0.001 (0.017)	Loss 2.9069 (2.9559)	Entropy 0.68760 (0.69214)	Top-1 acc 55.078 (53.037)	Top-5 acc 76.562 (75.792)	lr 0.01971
Train [37][1680/3239]	Time 0.237 (0.464)	Data Time 0.001 (0.017)	Loss 3.0403 (2.9559)	Entropy 0.68774 (0.69211)	Top-1 acc 50.000 (53.041)	Top-5 acc 73.047 (75.794)	lr 0.01971
Train [37][1690/3239]	Time 0.221 (0.464)	Data Time 0.001 (0.017)	Loss 3.0440 (2.9561)	Entropy 0.68751 (0.69208)	Top-1 acc 51.562 (53.037)	Top-5 acc 74.219 (75.793)	lr 0.01971
Train [37][1700/3239]	Time 0.248 (0.463)	Data Time 0.001 (0.017)	Loss 2.9821 (2.9562)	Entropy 0.68769 (0.69206)	Top-1 acc 50.781 (53.034)	Top-5 acc 76.562 (75.792)	lr 0.01971
Train [37][1710/3239]	Time 0.230 (0.463)	Data Time 0.001 (0.017)	Loss 2.8048 (2.9560)	Entropy 0.68784 (0.69203)	Top-1 acc 58.594 (53.037)	Top-5 acc 78.906 (75.795)	lr 0.01971
Train [37][1720/3239]	Time 0.257 (0.462)	Data Time 0.001 (0.016)	Loss 2.8686 (2.9559)	Entropy 0.68766 (0.69201)	Top-1 acc 56.641 (53.043)	Top-5 acc 76.953 (75.794)	lr 0.01971
Train [37][1730/3239]	Time 0.239 (0.462)	Data Time 0.001 (0.016)	Loss 2.8611 (2.9559)	Entropy 0.68730 (0.69198)	Top-1 acc 57.422 (53.044)	Top-5 acc 78.516 (75.795)	lr 0.01971
Train [37][1740/3239]	Time 0.236 (0.462)	Data Time 0.001 (0.016)	Loss 2.8668 (2.9559)	Entropy 0.68740 (0.69195)	Top-1 acc 52.344 (53.047)	Top-5 acc 75.391 (75.793)	lr 0.01970
Train [37][1750/3239]	Time 0.250 (0.461)	Data Time 0.001 (0.016)	Loss 3.0229 (2.9559)	Entropy 0.68756 (0.69193)	Top-1 acc 53.125 (53.051)	Top-5 acc 74.609 (75.791)	lr 0.01970
Train [37][1760/3239]	Time 0.236 (0.461)	Data Time 0.001 (0.016)	Loss 3.0467 (2.9562)	Entropy 0.68744 (0.69190)	Top-1 acc 50.000 (53.043)	Top-5 acc 74.219 (75.782)	lr 0.01970
Train [37][1770/3239]	Time 0.318 (0.461)	Data Time 0.001 (0.016)	Loss 2.9731 (2.9564)	Entropy 0.68710 (0.69188)	Top-1 acc 52.344 (53.036)	Top-5 acc 76.172 (75.781)	lr 0.01970
Train [37][1780/3239]	Time 0.220 (0.460)	Data Time 0.001 (0.016)	Loss 2.9792 (2.9562)	Entropy 0.68708 (0.69185)	Top-1 acc 53.906 (53.037)	Top-5 acc 74.609 (75.785)	lr 0.01970
Train [37][1790/3239]	Time 0.231 (0.460)	Data Time 0.001 (0.016)	Loss 2.9001 (2.9562)	Entropy 0.68673 (0.69182)	Top-1 acc 53.125 (53.035)	Top-5 acc 77.734 (75.782)	lr 0.01970
Train [37][1800/3239]	Time 0.251 (0.460)	Data Time 0.001 (0.016)	Loss 2.8622 (2.9563)	Entropy 0.68651 (0.69179)	Top-1 acc 54.688 (53.038)	Top-5 acc 77.734 (75.782)	lr 0.01970
Train [37][1810/3239]	Time 0.234 (0.459)	Data Time 0.001 (0.016)	Loss 3.0701 (2.9566)	Entropy 0.68639 (0.69176)	Top-1 acc 53.906 (53.029)	Top-5 acc 69.922 (75.775)	lr 0.01970
Train [37][1820/3239]	Time 0.223 (0.459)	Data Time 0.001 (0.016)	Loss 2.9008 (2.9564)	Entropy 0.68626 (0.69174)	Top-1 acc 57.031 (53.045)	Top-5 acc 75.391 (75.775)	lr 0.01970
Train [37][1830/3239]	Time 0.251 (0.459)	Data Time 0.001 (0.016)	Loss 3.0597 (2.9566)	Entropy 0.68611 (0.69171)	Top-1 acc 53.906 (53.041)	Top-5 acc 75.000 (75.774)	lr 0.01970
Train [37][1840/3239]	Time 0.322 (0.458)	Data Time 0.001 (0.016)	Loss 2.8402 (2.9563)	Entropy 0.68595 (0.69168)	Top-1 acc 55.078 (53.053)	Top-5 acc 77.344 (75.774)	lr 0.01970
Train [37][1850/3239]	Time 0.227 (0.458)	Data Time 0.001 (0.015)	Loss 2.9490 (2.9565)	Entropy 0.68626 (0.69164)	Top-1 acc 58.203 (53.056)	Top-5 acc 75.000 (75.765)	lr 0.01970
Train [37][1860/3239]	Time 0.222 (0.458)	Data Time 0.001 (0.015)	Loss 3.1196 (2.9566)	Entropy 0.68623 (0.69162)	Top-1 acc 51.953 (53.057)	Top-5 acc 71.094 (75.760)	lr 0.01969
Train [37][1870/3239]	Time 0.221 (0.457)	Data Time 0.001 (0.015)	Loss 2.9040 (2.9567)	Entropy 0.68626 (0.69159)	Top-1 acc 52.344 (53.053)	Top-5 acc 76.953 (75.760)	lr 0.01969
Train [37][1880/3239]	Time 0.233 (0.457)	Data Time 0.001 (0.015)	Loss 2.8340 (2.9566)	Entropy 0.68633 (0.69156)	Top-1 acc 53.125 (53.062)	Top-5 acc 79.688 (75.767)	lr 0.01969
Train [37][1890/3239]	Time 0.316 (0.474)	Data Time 0.003 (0.015)	Loss 2.9185 (2.9564)	Entropy 0.68687 (0.69153)	Top-1 acc 55.469 (53.069)	Top-5 acc 75.781 (75.767)	lr 0.01969
Train [37][1900/3239]	Time 0.242 (0.474)	Data Time 0.002 (0.015)	Loss 2.8845 (2.9564)	Entropy 0.68587 (0.69151)	Top-1 acc 54.688 (53.068)	Top-5 acc 76.562 (75.763)	lr 0.01969
Train [37][1910/3239]	Time 0.237 (0.474)	Data Time 0.002 (0.015)	Loss 2.8409 (2.9564)	Entropy 0.68571 (0.69148)	Top-1 acc 55.469 (53.061)	Top-5 acc 78.906 (75.764)	lr 0.01969
Train [37][1920/3239]	Time 0.232 (0.473)	Data Time 0.001 (0.015)	Loss 2.9743 (2.9564)	Entropy 0.68565 (0.69145)	Top-1 acc 53.516 (53.060)	Top-5 acc 76.172 (75.766)	lr 0.01969
Train [37][1930/3239]	Time 0.336 (0.473)	Data Time 0.001 (0.015)	Loss 3.0106 (2.9563)	Entropy 0.68571 (0.69142)	Top-1 acc 50.781 (53.064)	Top-5 acc 73.828 (75.770)	lr 0.01969
Train [37][1940/3239]	Time 0.230 (0.473)	Data Time 0.001 (0.015)	Loss 2.7963 (2.9562)	Entropy 0.68547 (0.69139)	Top-1 acc 55.469 (53.070)	Top-5 acc 79.297 (75.771)	lr 0.01969
Train [37][1950/3239]	Time 0.223 (0.472)	Data Time 0.001 (0.015)	Loss 2.9514 (2.9562)	Entropy 0.68547 (0.69136)	Top-1 acc 53.906 (53.068)	Top-5 acc 73.047 (75.771)	lr 0.01969
Train [37][1960/3239]	Time 0.236 (0.472)	Data Time 0.001 (0.015)	Loss 2.7268 (2.9560)	Entropy 0.68540 (0.69133)	Top-1 acc 58.594 (53.067)	Top-5 acc 79.297 (75.772)	lr 0.01969
Train [37][1970/3239]	Time 0.233 (0.472)	Data Time 0.002 (0.015)	Loss 2.8146 (2.9559)	Entropy 0.68509 (0.69130)	Top-1 acc 55.469 (53.062)	Top-5 acc 74.219 (75.775)	lr 0.01969
Train [37][1980/3239]	Time 0.236 (0.471)	Data Time 0.001 (0.015)	Loss 2.7877 (2.9557)	Entropy 0.68508 (0.69126)	Top-1 acc 56.641 (53.064)	Top-5 acc 80.078 (75.777)	lr 0.01968
Train [37][1990/3239]	Time 0.227 (0.471)	Data Time 0.001 (0.014)	Loss 3.0480 (2.9560)	Entropy 0.68471 (0.69123)	Top-1 acc 49.219 (53.054)	Top-5 acc 75.781 (75.775)	lr 0.01968
Train [37][2000/3239]	Time 0.309 (0.471)	Data Time 0.001 (0.014)	Loss 2.8603 (2.9559)	Entropy 0.68478 (0.69120)	Top-1 acc 53.125 (53.051)	Top-5 acc 79.297 (75.776)	lr 0.01968
Train [37][2010/3239]	Time 0.238 (0.470)	Data Time 0.001 (0.014)	Loss 3.0623 (2.9564)	Entropy 0.68494 (0.69117)	Top-1 acc 50.781 (53.039)	Top-5 acc 73.047 (75.765)	lr 0.01968
Train [37][2020/3239]	Time 0.238 (0.470)	Data Time 0.001 (0.014)	Loss 2.7500 (2.9562)	Entropy 0.68528 (0.69114)	Top-1 acc 56.641 (53.047)	Top-5 acc 82.422 (75.768)	lr 0.01968
Train [37][2030/3239]	Time 0.263 (0.470)	Data Time 0.001 (0.014)	Loss 2.9722 (2.9563)	Entropy 0.68528 (0.69111)	Top-1 acc 53.516 (53.043)	Top-5 acc 71.094 (75.762)	lr 0.01968
Train [37][2040/3239]	Time 0.258 (0.470)	Data Time 0.001 (0.014)	Loss 2.7978 (2.9564)	Entropy 0.68552 (0.69108)	Top-1 acc 57.422 (53.043)	Top-5 acc 82.422 (75.763)	lr 0.01968
Train [37][2050/3239]	Time 0.248 (0.469)	Data Time 0.001 (0.014)	Loss 2.8943 (2.9563)	Entropy 0.68533 (0.69105)	Top-1 acc 56.250 (53.043)	Top-5 acc 75.391 (75.764)	lr 0.01968
Train [37][2060/3239]	Time 0.239 (0.469)	Data Time 0.001 (0.014)	Loss 3.1010 (2.9565)	Entropy 0.68510 (0.69103)	Top-1 acc 50.781 (53.043)	Top-5 acc 69.922 (75.761)	lr 0.01968
Train [37][2070/3239]	Time 0.248 (0.469)	Data Time 0.001 (0.014)	Loss 2.7503 (2.9566)	Entropy 0.68482 (0.69100)	Top-1 acc 58.984 (53.042)	Top-5 acc 79.688 (75.761)	lr 0.01968
Train [37][2080/3239]	Time 0.230 (0.468)	Data Time 0.001 (0.014)	Loss 2.8349 (2.9567)	Entropy 0.68501 (0.69097)	Top-1 acc 52.344 (53.036)	Top-5 acc 78.906 (75.758)	lr 0.01968
Train [37][2090/3239]	Time 0.350 (0.468)	Data Time 0.002 (0.014)	Loss 2.9740 (2.9568)	Entropy 0.68504 (0.69094)	Top-1 acc 49.609 (53.035)	Top-5 acc 81.641 (75.759)	lr 0.01968
Train [37][2100/3239]	Time 0.226 (0.468)	Data Time 0.001 (0.014)	Loss 2.6945 (2.9568)	Entropy 0.68482 (0.69091)	Top-1 acc 58.984 (53.036)	Top-5 acc 82.031 (75.760)	lr 0.01967
Train [37][2110/3239]	Time 0.238 (0.468)	Data Time 0.001 (0.014)	Loss 2.9064 (2.9568)	Entropy 0.68471 (0.69088)	Top-1 acc 53.516 (53.035)	Top-5 acc 75.781 (75.758)	lr 0.01967
Train [37][2120/3239]	Time 0.217 (0.467)	Data Time 0.001 (0.014)	Loss 3.0521 (2.9570)	Entropy 0.68451 (0.69085)	Top-1 acc 52.734 (53.030)	Top-5 acc 73.047 (75.754)	lr 0.01967
Train [37][2130/3239]	Time 0.224 (0.467)	Data Time 0.001 (0.014)	Loss 3.0874 (2.9573)	Entropy 0.68455 (0.69082)	Top-1 acc 49.219 (53.022)	Top-5 acc 71.094 (75.751)	lr 0.01967
Train [37][2140/3239]	Time 0.227 (0.467)	Data Time 0.001 (0.014)	Loss 3.0322 (2.9572)	Entropy 0.68460 (0.69079)	Top-1 acc 50.000 (53.022)	Top-5 acc 74.609 (75.752)	lr 0.01967
Train [37][2150/3239]	Time 0.227 (0.467)	Data Time 0.001 (0.014)	Loss 3.1956 (2.9571)	Entropy 0.68425 (0.69076)	Top-1 acc 45.312 (53.021)	Top-5 acc 71.484 (75.751)	lr 0.01967
Train [37][2160/3239]	Time 0.319 (0.466)	Data Time 0.001 (0.014)	Loss 2.9500 (2.9573)	Entropy 0.68448 (0.69073)	Top-1 acc 52.734 (53.019)	Top-5 acc 75.000 (75.745)	lr 0.01967
Train [37][2170/3239]	Time 0.226 (0.466)	Data Time 0.001 (0.013)	Loss 2.8964 (2.9570)	Entropy 0.68442 (0.69070)	Top-1 acc 51.562 (53.018)	Top-5 acc 79.688 (75.755)	lr 0.01967
Train [37][2180/3239]	Time 0.238 (0.466)	Data Time 0.001 (0.013)	Loss 2.9311 (2.9573)	Entropy 0.68447 (0.69068)	Top-1 acc 55.078 (53.012)	Top-5 acc 73.047 (75.750)	lr 0.01967
Train [37][2190/3239]	Time 0.213 (0.465)	Data Time 0.001 (0.013)	Loss 2.8319 (2.9572)	Entropy 0.68421 (0.69065)	Top-1 acc 60.156 (53.023)	Top-5 acc 78.906 (75.753)	lr 0.01967
Train [37][2200/3239]	Time 0.237 (0.465)	Data Time 0.001 (0.013)	Loss 3.0396 (2.9575)	Entropy 0.68402 (0.69062)	Top-1 acc 51.953 (53.015)	Top-5 acc 75.391 (75.750)	lr 0.01967
Train [37][2210/3239]	Time 0.259 (0.465)	Data Time 0.001 (0.013)	Loss 2.9757 (2.9574)	Entropy 0.68418 (0.69059)	Top-1 acc 49.609 (53.014)	Top-5 acc 76.562 (75.755)	lr 0.01967
Train [37][2220/3239]	Time 0.226 (0.465)	Data Time 0.001 (0.013)	Loss 2.8130 (2.9573)	Entropy 0.68410 (0.69056)	Top-1 acc 58.203 (53.018)	Top-5 acc 77.344 (75.754)	lr 0.01966
Train [37][2230/3239]	Time 0.224 (0.464)	Data Time 0.001 (0.013)	Loss 3.2052 (2.9576)	Entropy 0.68402 (0.69053)	Top-1 acc 46.484 (53.012)	Top-5 acc 69.922 (75.749)	lr 0.01966
Train [37][2240/3239]	Time 0.236 (0.464)	Data Time 0.001 (0.013)	Loss 2.9862 (2.9576)	Entropy 0.68431 (0.69050)	Top-1 acc 52.734 (53.007)	Top-5 acc 77.734 (75.749)	lr 0.01966
Train [37][2250/3239]	Time 0.250 (0.464)	Data Time 0.001 (0.013)	Loss 2.8657 (2.9575)	Entropy 0.68457 (0.69047)	Top-1 acc 50.000 (53.009)	Top-5 acc 81.250 (75.753)	lr 0.01966
Train [37][2260/3239]	Time 0.228 (0.463)	Data Time 0.001 (0.013)	Loss 2.9095 (2.9577)	Entropy 0.68435 (0.69045)	Top-1 acc 53.906 (53.007)	Top-5 acc 76.172 (75.748)	lr 0.01966
Train [37][2270/3239]	Time 0.253 (0.463)	Data Time 0.001 (0.013)	Loss 2.9245 (2.9576)	Entropy 0.68459 (0.69042)	Top-1 acc 56.250 (53.005)	Top-5 acc 74.609 (75.752)	lr 0.01966
Train [37][2280/3239]	Time 0.246 (0.463)	Data Time 0.001 (0.013)	Loss 2.8755 (2.9575)	Entropy 0.68416 (0.69039)	Top-1 acc 48.047 (53.005)	Top-5 acc 78.906 (75.753)	lr 0.01966
Train [37][2290/3239]	Time 0.245 (0.463)	Data Time 0.001 (0.013)	Loss 2.9337 (2.9574)	Entropy 0.68437 (0.69037)	Top-1 acc 55.078 (53.008)	Top-5 acc 77.344 (75.753)	lr 0.01966
Train [37][2300/3239]	Time 0.233 (0.463)	Data Time 0.001 (0.013)	Loss 2.8796 (2.9574)	Entropy 0.68426 (0.69034)	Top-1 acc 52.734 (53.005)	Top-5 acc 77.734 (75.750)	lr 0.01966
Train [37][2310/3239]	Time 0.217 (0.462)	Data Time 0.001 (0.013)	Loss 3.1401 (2.9574)	Entropy 0.68402 (0.69031)	Top-1 acc 49.609 (53.007)	Top-5 acc 69.922 (75.752)	lr 0.01966
Train [37][2320/3239]	Time 0.333 (0.462)	Data Time 0.001 (0.013)	Loss 2.8791 (2.9574)	Entropy 0.68405 (0.69029)	Top-1 acc 51.953 (53.004)	Top-5 acc 77.734 (75.753)	lr 0.01966
Train [37][2330/3239]	Time 0.222 (0.462)	Data Time 0.001 (0.013)	Loss 2.9738 (2.9575)	Entropy 0.68403 (0.69026)	Top-1 acc 50.391 (52.997)	Top-5 acc 75.391 (75.748)	lr 0.01966
Train [37][2340/3239]	Time 0.237 (0.462)	Data Time 0.001 (0.013)	Loss 2.9070 (2.9577)	Entropy 0.68402 (0.69023)	Top-1 acc 53.906 (52.995)	Top-5 acc 77.344 (75.743)	lr 0.01965
Train [37][2350/3239]	Time 0.232 (0.461)	Data Time 0.001 (0.013)	Loss 3.0381 (2.9575)	Entropy 0.68347 (0.69021)	Top-1 acc 53.906 (52.997)	Top-5 acc 72.266 (75.747)	lr 0.01965
Train [37][2360/3239]	Time 0.223 (0.461)	Data Time 0.001 (0.012)	Loss 3.0037 (2.9574)	Entropy 0.68344 (0.69018)	Top-1 acc 51.562 (52.997)	Top-5 acc 76.562 (75.748)	lr 0.01965
Train [37][2370/3239]	Time 0.238 (0.461)	Data Time 0.001 (0.012)	Loss 2.9158 (2.9572)	Entropy 0.68323 (0.69015)	Top-1 acc 50.000 (52.999)	Top-5 acc 76.172 (75.750)	lr 0.01965
Train [37][2380/3239]	Time 0.230 (0.461)	Data Time 0.001 (0.012)	Loss 2.9698 (2.9570)	Entropy 0.68327 (0.69012)	Top-1 acc 55.078 (53.009)	Top-5 acc 76.562 (75.757)	lr 0.01965
Train [37][2390/3239]	Time 0.349 (0.460)	Data Time 0.001 (0.012)	Loss 2.7198 (2.9567)	Entropy 0.68305 (0.69009)	Top-1 acc 58.984 (53.017)	Top-5 acc 81.641 (75.763)	lr 0.01965
Train [37][2400/3239]	Time 0.225 (0.460)	Data Time 0.001 (0.012)	Loss 2.8641 (2.9565)	Entropy 0.68328 (0.69006)	Top-1 acc 52.344 (53.019)	Top-5 acc 75.781 (75.763)	lr 0.01965
Train [37][2410/3239]	Time 0.233 (0.460)	Data Time 0.001 (0.012)	Loss 2.8610 (2.9565)	Entropy 0.68326 (0.69003)	Top-1 acc 52.734 (53.025)	Top-5 acc 77.734 (75.764)	lr 0.01965
Train [37][2420/3239]	Time 0.227 (0.460)	Data Time 0.001 (0.012)	Loss 2.8753 (2.9562)	Entropy 0.68334 (0.69001)	Top-1 acc 53.516 (53.029)	Top-5 acc 77.344 (75.769)	lr 0.01965
Train [37][2430/3239]	Time 0.229 (0.459)	Data Time 0.001 (0.012)	Loss 2.9290 (2.9561)	Entropy 0.68337 (0.68998)	Top-1 acc 48.828 (53.026)	Top-5 acc 77.734 (75.775)	lr 0.01965
Train [37][2440/3239]	Time 0.229 (0.459)	Data Time 0.001 (0.012)	Loss 3.0746 (2.9563)	Entropy 0.68324 (0.68995)	Top-1 acc 51.953 (53.016)	Top-5 acc 74.219 (75.772)	lr 0.01965
Train [37][2450/3239]	Time 0.224 (0.459)	Data Time 0.001 (0.012)	Loss 2.8528 (2.9563)	Entropy 0.68305 (0.68992)	Top-1 acc 54.688 (53.019)	Top-5 acc 78.516 (75.773)	lr 0.01965
Train [37][2460/3239]	Time 0.232 (0.458)	Data Time 0.001 (0.012)	Loss 2.7927 (2.9563)	Entropy 0.68307 (0.68990)	Top-1 acc 54.297 (53.018)	Top-5 acc 80.078 (75.773)	lr 0.01964
Train [37][2470/3239]	Time 0.229 (0.458)	Data Time 0.001 (0.012)	Loss 3.1317 (2.9563)	Entropy 0.68296 (0.68987)	Top-1 acc 46.484 (53.014)	Top-5 acc 72.656 (75.776)	lr 0.01964
Train [37][2480/3239]	Time 0.321 (0.458)	Data Time 0.001 (0.012)	Loss 2.8825 (2.9563)	Entropy 0.68261 (0.68984)	Top-1 acc 54.297 (53.012)	Top-5 acc 74.609 (75.774)	lr 0.01964
Train [37][2490/3239]	Time 0.229 (0.458)	Data Time 0.001 (0.012)	Loss 3.0444 (2.9564)	Entropy 0.68261 (0.68981)	Top-1 acc 49.219 (53.008)	Top-5 acc 74.609 (75.775)	lr 0.01964
Train [37][2500/3239]	Time 0.239 (0.458)	Data Time 0.001 (0.012)	Loss 2.9673 (2.9565)	Entropy 0.68224 (0.68978)	Top-1 acc 53.125 (53.012)	Top-5 acc 73.828 (75.770)	lr 0.01964
Train [37][2510/3239]	Time 0.238 (0.457)	Data Time 0.001 (0.012)	Loss 2.8841 (2.9563)	Entropy 0.68228 (0.68975)	Top-1 acc 57.031 (53.016)	Top-5 acc 77.344 (75.772)	lr 0.01964
Train [37][2520/3239]	Time 0.224 (0.457)	Data Time 0.001 (0.012)	Loss 2.8597 (2.9561)	Entropy 0.68170 (0.68972)	Top-1 acc 53.516 (53.019)	Top-5 acc 76.562 (75.773)	lr 0.01964
Train [37][2530/3239]	Time 0.243 (0.457)	Data Time 0.001 (0.012)	Loss 3.2180 (2.9563)	Entropy 0.68143 (0.68969)	Top-1 acc 48.438 (53.015)	Top-5 acc 70.312 (75.770)	lr 0.01964
Train [37][2540/3239]	Time 0.326 (0.470)	Data Time 0.006 (0.012)	Loss 2.7278 (2.9564)	Entropy 0.68151 (0.68966)	Top-1 acc 56.250 (53.009)	Top-5 acc 80.469 (75.770)	lr 0.01964
Train [37][2550/3239]	Time 0.328 (0.470)	Data Time 0.002 (0.012)	Loss 2.9476 (2.9564)	Entropy 0.68157 (0.68963)	Top-1 acc 54.688 (53.010)	Top-5 acc 75.000 (75.769)	lr 0.01964
Train [37][2560/3239]	Time 0.232 (0.470)	Data Time 0.002 (0.012)	Loss 3.0351 (2.9564)	Entropy 0.68172 (0.68959)	Top-1 acc 46.484 (53.009)	Top-5 acc 74.219 (75.770)	lr 0.01964
Train [37][2570/3239]	Time 0.242 (0.469)	Data Time 0.001 (0.012)	Loss 2.9389 (2.9567)	Entropy 0.68165 (0.68956)	Top-1 acc 53.516 (53.002)	Top-5 acc 77.734 (75.763)	lr 0.01964
Train [37][2580/3239]	Time 0.258 (0.469)	Data Time 0.001 (0.012)	Loss 3.0886 (2.9567)	Entropy 0.68187 (0.68953)	Top-1 acc 49.219 (53.000)	Top-5 acc 73.438 (75.762)	lr 0.01963
Train [37][2590/3239]	Time 0.230 (0.469)	Data Time 0.001 (0.012)	Loss 3.0482 (2.9567)	Entropy 0.68159 (0.68950)	Top-1 acc 50.781 (52.998)	Top-5 acc 76.562 (75.763)	lr 0.01963
Train [37][2600/3239]	Time 0.267 (0.469)	Data Time 0.003 (0.011)	Loss 2.9032 (2.9564)	Entropy 0.68151 (0.68947)	Top-1 acc 56.641 (53.003)	Top-5 acc 76.172 (75.765)	lr 0.01963
Train [37][2610/3239]	Time 0.231 (0.468)	Data Time 0.001 (0.011)	Loss 3.0059 (2.9565)	Entropy 0.68135 (0.68944)	Top-1 acc 53.906 (53.004)	Top-5 acc 76.953 (75.765)	lr 0.01963
Train [37][2620/3239]	Time 0.228 (0.468)	Data Time 0.001 (0.011)	Loss 2.9641 (2.9563)	Entropy 0.68134 (0.68941)	Top-1 acc 50.391 (53.007)	Top-5 acc 75.000 (75.768)	lr 0.01963
Train [37][2630/3239]	Time 0.220 (0.468)	Data Time 0.001 (0.011)	Loss 2.9348 (2.9564)	Entropy 0.68155 (0.68938)	Top-1 acc 52.344 (53.004)	Top-5 acc 79.297 (75.768)	lr 0.01963
Train [37][2640/3239]	Time 0.325 (0.468)	Data Time 0.001 (0.011)	Loss 2.8175 (2.9562)	Entropy 0.68139 (0.68935)	Top-1 acc 54.297 (53.007)	Top-5 acc 79.688 (75.773)	lr 0.01963
Train [37][2650/3239]	Time 0.232 (0.468)	Data Time 0.001 (0.011)	Loss 2.6822 (2.9562)	Entropy 0.68179 (0.68932)	Top-1 acc 59.766 (53.008)	Top-5 acc 80.859 (75.774)	lr 0.01963
Train [37][2660/3239]	Time 0.235 (0.467)	Data Time 0.001 (0.011)	Loss 3.0340 (2.9559)	Entropy 0.68186 (0.68929)	Top-1 acc 51.172 (53.007)	Top-5 acc 75.781 (75.782)	lr 0.01963
Train [37][2670/3239]	Time 0.239 (0.467)	Data Time 0.001 (0.011)	Loss 2.9062 (2.9557)	Entropy 0.68179 (0.68927)	Top-1 acc 56.250 (53.011)	Top-5 acc 76.172 (75.786)	lr 0.01963
Train [37][2680/3239]	Time 0.239 (0.467)	Data Time 0.001 (0.011)	Loss 2.8602 (2.9556)	Entropy 0.68218 (0.68924)	Top-1 acc 56.641 (53.014)	Top-5 acc 76.953 (75.790)	lr 0.01963
Train [37][2690/3239]	Time 0.234 (0.467)	Data Time 0.001 (0.011)	Loss 2.8624 (2.9557)	Entropy 0.68215 (0.68921)	Top-1 acc 55.469 (53.010)	Top-5 acc 79.297 (75.789)	lr 0.01963
Train [37][2700/3239]	Time 0.220 (0.467)	Data Time 0.001 (0.011)	Loss 3.1119 (2.9557)	Entropy 0.68204 (0.68919)	Top-1 acc 48.047 (53.009)	Top-5 acc 72.266 (75.787)	lr 0.01962
Train [37][2710/3239]	Time 0.329 (0.466)	Data Time 0.001 (0.011)	Loss 2.7087 (2.9556)	Entropy 0.68215 (0.68916)	Top-1 acc 59.766 (53.012)	Top-5 acc 80.859 (75.788)	lr 0.01962
Train [37][2720/3239]	Time 0.234 (0.466)	Data Time 0.001 (0.011)	Loss 3.0853 (2.9558)	Entropy 0.68204 (0.68913)	Top-1 acc 48.047 (53.004)	Top-5 acc 72.656 (75.787)	lr 0.01962
Train [37][2730/3239]	Time 0.230 (0.466)	Data Time 0.001 (0.011)	Loss 3.1857 (2.9561)	Entropy 0.68227 (0.68911)	Top-1 acc 49.609 (52.998)	Top-5 acc 70.312 (75.779)	lr 0.01962
Train [37][2740/3239]	Time 0.234 (0.466)	Data Time 0.001 (0.011)	Loss 2.7823 (2.9562)	Entropy 0.68245 (0.68908)	Top-1 acc 56.641 (52.999)	Top-5 acc 77.734 (75.776)	lr 0.01962
Train [37][2750/3239]	Time 0.224 (0.465)	Data Time 0.001 (0.011)	Loss 2.8008 (2.9562)	Entropy 0.68208 (0.68906)	Top-1 acc 53.906 (52.996)	Top-5 acc 79.688 (75.780)	lr 0.01962
Train [37][2760/3239]	Time 0.229 (0.465)	Data Time 0.001 (0.011)	Loss 3.0908 (2.9562)	Entropy 0.68204 (0.68903)	Top-1 acc 53.125 (52.999)	Top-5 acc 73.438 (75.780)	lr 0.01962
Train [37][2770/3239]	Time 0.231 (0.465)	Data Time 0.001 (0.011)	Loss 2.8857 (2.9562)	Entropy 0.68255 (0.68901)	Top-1 acc 55.469 (53.000)	Top-5 acc 75.391 (75.777)	lr 0.01962
Train [37][2780/3239]	Time 0.238 (0.465)	Data Time 0.001 (0.011)	Loss 2.8673 (2.9560)	Entropy 0.68272 (0.68899)	Top-1 acc 51.172 (53.005)	Top-5 acc 75.391 (75.780)	lr 0.01962
Train [37][2790/3239]	Time 0.233 (0.465)	Data Time 0.001 (0.011)	Loss 2.8370 (2.9561)	Entropy 0.68244 (0.68896)	Top-1 acc 53.516 (52.999)	Top-5 acc 76.953 (75.776)	lr 0.01962
Train [37][2800/3239]	Time 0.323 (0.464)	Data Time 0.001 (0.011)	Loss 2.8981 (2.9560)	Entropy 0.68224 (0.68894)	Top-1 acc 51.953 (53.000)	Top-5 acc 74.219 (75.777)	lr 0.01962
Train [37][2810/3239]	Time 0.230 (0.464)	Data Time 0.001 (0.011)	Loss 2.8767 (2.9561)	Entropy 0.68189 (0.68892)	Top-1 acc 57.812 (52.999)	Top-5 acc 78.125 (75.775)	lr 0.01962
Train [37][2820/3239]	Time 0.254 (0.464)	Data Time 0.001 (0.011)	Loss 2.9318 (2.9560)	Entropy 0.68163 (0.68889)	Top-1 acc 52.734 (53.004)	Top-5 acc 76.953 (75.775)	lr 0.01961
Train [37][2830/3239]	Time 0.228 (0.464)	Data Time 0.002 (0.011)	Loss 2.8638 (2.9560)	Entropy 0.68159 (0.68887)	Top-1 acc 60.156 (53.010)	Top-5 acc 75.781 (75.774)	lr 0.01961
Train [37][2840/3239]	Time 0.227 (0.464)	Data Time 0.001 (0.011)	Loss 2.8522 (2.9559)	Entropy 0.68161 (0.68884)	Top-1 acc 56.250 (53.012)	Top-5 acc 76.172 (75.776)	lr 0.01961
Train [37][2850/3239]	Time 0.267 (0.463)	Data Time 0.001 (0.011)	Loss 3.1072 (2.9562)	Entropy 0.68194 (0.68882)	Top-1 acc 51.953 (53.003)	Top-5 acc 72.266 (75.772)	lr 0.01961
Train [37][2860/3239]	Time 0.259 (0.463)	Data Time 0.001 (0.011)	Loss 2.8809 (2.9563)	Entropy 0.68182 (0.68879)	Top-1 acc 54.297 (52.997)	Top-5 acc 76.953 (75.770)	lr 0.01961
Train [37][2870/3239]	Time 0.342 (0.463)	Data Time 0.001 (0.011)	Loss 2.9744 (2.9565)	Entropy 0.68153 (0.68877)	Top-1 acc 52.734 (52.995)	Top-5 acc 75.000 (75.765)	lr 0.01961
Train [37][2880/3239]	Time 0.235 (0.463)	Data Time 0.001 (0.011)	Loss 2.8477 (2.9565)	Entropy 0.68153 (0.68874)	Top-1 acc 57.031 (52.992)	Top-5 acc 76.562 (75.764)	lr 0.01961
Train [37][2890/3239]	Time 0.219 (0.463)	Data Time 0.001 (0.011)	Loss 2.8559 (2.9561)	Entropy 0.68172 (0.68872)	Top-1 acc 53.516 (53.000)	Top-5 acc 77.734 (75.772)	lr 0.01961
Train [37][2900/3239]	Time 0.240 (0.463)	Data Time 0.001 (0.010)	Loss 3.0928 (2.9562)	Entropy 0.68150 (0.68869)	Top-1 acc 49.219 (52.993)	Top-5 acc 73.438 (75.772)	lr 0.01961
Train [37][2910/3239]	Time 0.220 (0.462)	Data Time 0.001 (0.010)	Loss 3.0897 (2.9561)	Entropy 0.68153 (0.68867)	Top-1 acc 51.953 (52.997)	Top-5 acc 71.094 (75.775)	lr 0.01961
Train [37][2920/3239]	Time 0.229 (0.462)	Data Time 0.001 (0.010)	Loss 3.1198 (2.9562)	Entropy 0.68152 (0.68864)	Top-1 acc 53.516 (52.998)	Top-5 acc 70.312 (75.773)	lr 0.01961
Train [37][2930/3239]	Time 0.219 (0.462)	Data Time 0.001 (0.010)	Loss 2.8586 (2.9561)	Entropy 0.68159 (0.68862)	Top-1 acc 52.344 (53.000)	Top-5 acc 78.906 (75.773)	lr 0.01961
Train [37][2940/3239]	Time 0.229 (0.462)	Data Time 0.001 (0.010)	Loss 2.7727 (2.9562)	Entropy 0.68148 (0.68859)	Top-1 acc 57.812 (52.999)	Top-5 acc 80.078 (75.770)	lr 0.01961
Train [37][2950/3239]	Time 0.234 (0.462)	Data Time 0.001 (0.010)	Loss 2.8500 (2.9559)	Entropy 0.68198 (0.68857)	Top-1 acc 50.391 (53.002)	Top-5 acc 77.344 (75.777)	lr 0.01960
Train [37][2960/3239]	Time 0.224 (0.461)	Data Time 0.001 (0.010)	Loss 2.8790 (2.9560)	Entropy 0.68191 (0.68855)	Top-1 acc 55.078 (53.003)	Top-5 acc 76.172 (75.773)	lr 0.01960
Train [37][2970/3239]	Time 0.236 (0.461)	Data Time 0.001 (0.010)	Loss 2.9650 (2.9561)	Entropy 0.68221 (0.68853)	Top-1 acc 53.125 (53.001)	Top-5 acc 75.000 (75.776)	lr 0.01960
Train [37][2980/3239]	Time 0.230 (0.461)	Data Time 0.001 (0.010)	Loss 2.7477 (2.9560)	Entropy 0.68218 (0.68851)	Top-1 acc 54.688 (53.002)	Top-5 acc 82.422 (75.775)	lr 0.01960
Train [37][2990/3239]	Time 0.230 (0.461)	Data Time 0.001 (0.010)	Loss 2.9177 (2.9559)	Entropy 0.68212 (0.68848)	Top-1 acc 55.469 (53.004)	Top-5 acc 75.781 (75.776)	lr 0.01960
Train [37][3000/3239]	Time 0.226 (0.460)	Data Time 0.002 (0.010)	Loss 2.8240 (2.9558)	Entropy 0.68173 (0.68846)	Top-1 acc 54.297 (53.004)	Top-5 acc 78.906 (75.777)	lr 0.01960
Train [37][3010/3239]	Time 0.229 (0.460)	Data Time 0.002 (0.010)	Loss 3.1034 (2.9560)	Entropy 0.68176 (0.68844)	Top-1 acc 51.562 (53.002)	Top-5 acc 72.266 (75.772)	lr 0.01960
Train [37][3020/3239]	Time 0.232 (0.460)	Data Time 0.001 (0.010)	Loss 3.1363 (2.9559)	Entropy 0.68185 (0.68842)	Top-1 acc 51.953 (53.006)	Top-5 acc 69.922 (75.774)	lr 0.01960
Train [37][3030/3239]	Time 0.339 (0.460)	Data Time 0.001 (0.010)	Loss 2.9108 (2.9559)	Entropy 0.68179 (0.68840)	Top-1 acc 57.422 (53.005)	Top-5 acc 78.125 (75.774)	lr 0.01960
Train [37][3040/3239]	Time 0.229 (0.460)	Data Time 0.001 (0.010)	Loss 2.8896 (2.9558)	Entropy 0.68190 (0.68837)	Top-1 acc 57.422 (53.008)	Top-5 acc 75.000 (75.776)	lr 0.01960
Train [37][3050/3239]	Time 0.225 (0.460)	Data Time 0.001 (0.010)	Loss 3.2084 (2.9558)	Entropy 0.68224 (0.68835)	Top-1 acc 45.312 (53.011)	Top-5 acc 73.438 (75.777)	lr 0.01960
Train [37][3060/3239]	Time 0.232 (0.459)	Data Time 0.001 (0.010)	Loss 3.0377 (2.9558)	Entropy 0.68225 (0.68833)	Top-1 acc 48.828 (53.008)	Top-5 acc 72.266 (75.777)	lr 0.01960
Train [37][3070/3239]	Time 0.220 (0.459)	Data Time 0.001 (0.010)	Loss 2.8928 (2.9556)	Entropy 0.68236 (0.68831)	Top-1 acc 52.344 (53.014)	Top-5 acc 75.781 (75.781)	lr 0.01959
Train [37][3080/3239]	Time 0.250 (0.459)	Data Time 0.001 (0.010)	Loss 2.8801 (2.9556)	Entropy 0.68226 (0.68829)	Top-1 acc 54.688 (53.014)	Top-5 acc 77.734 (75.784)	lr 0.01959
Train [37][3090/3239]	Time 0.227 (0.459)	Data Time 0.001 (0.010)	Loss 2.8752 (2.9555)	Entropy 0.68226 (0.68828)	Top-1 acc 52.734 (53.019)	Top-5 acc 79.297 (75.786)	lr 0.01959
Train [37][3100/3239]	Time 0.318 (0.459)	Data Time 0.001 (0.010)	Loss 2.8841 (2.9554)	Entropy 0.68208 (0.68826)	Top-1 acc 52.734 (53.024)	Top-5 acc 77.734 (75.789)	lr 0.01959
Train [37][3110/3239]	Time 0.233 (0.458)	Data Time 0.001 (0.010)	Loss 3.0160 (2.9554)	Entropy 0.68198 (0.68824)	Top-1 acc 55.469 (53.025)	Top-5 acc 73.438 (75.786)	lr 0.01959
Train [37][3120/3239]	Time 0.226 (0.458)	Data Time 0.001 (0.010)	Loss 3.0130 (2.9556)	Entropy 0.68165 (0.68822)	Top-1 acc 51.172 (53.019)	Top-5 acc 77.344 (75.782)	lr 0.01959
Train [37][3130/3239]	Time 0.239 (0.458)	Data Time 0.001 (0.010)	Loss 2.7895 (2.9558)	Entropy 0.68172 (0.68819)	Top-1 acc 55.078 (53.012)	Top-5 acc 78.906 (75.780)	lr 0.01959
Train [37][3140/3239]	Time 0.229 (0.458)	Data Time 0.001 (0.010)	Loss 3.0651 (2.9558)	Entropy 0.68180 (0.68817)	Top-1 acc 50.391 (53.013)	Top-5 acc 75.000 (75.780)	lr 0.01959
Train [37][3150/3239]	Time 0.233 (0.458)	Data Time 0.001 (0.010)	Loss 2.9282 (2.9557)	Entropy 0.68167 (0.68815)	Top-1 acc 50.391 (53.012)	Top-5 acc 76.562 (75.782)	lr 0.01959
Train [37][3160/3239]	Time 0.229 (0.458)	Data Time 0.001 (0.010)	Loss 3.0078 (2.9555)	Entropy 0.68128 (0.68813)	Top-1 acc 51.562 (53.019)	Top-5 acc 75.000 (75.786)	lr 0.01959
Train [37][3170/3239]	Time 0.222 (0.457)	Data Time 0.001 (0.010)	Loss 2.9332 (2.9556)	Entropy 0.68100 (0.68811)	Top-1 acc 55.469 (53.019)	Top-5 acc 74.219 (75.786)	lr 0.01959
Train [37][3180/3239]	Time 0.226 (0.457)	Data Time 0.000 (0.010)	Loss 2.8490 (2.9557)	Entropy 0.68092 (0.68809)	Top-1 acc 56.641 (53.018)	Top-5 acc 76.562 (75.784)	lr 0.01959
Train [37][3190/3239]	Time 0.321 (0.457)	Data Time 0.000 (0.010)	Loss 2.8675 (2.9557)	Entropy 0.68068 (0.68807)	Top-1 acc 53.906 (53.017)	Top-5 acc 78.125 (75.782)	lr 0.01958
Train [37][3200/3239]	Time 0.327 (0.467)	Data Time 0.000 (0.010)	Loss 2.7613 (2.9557)	Entropy 0.68033 (0.68804)	Top-1 acc 60.156 (53.016)	Top-5 acc 78.906 (75.781)	lr 0.01958
Train [37][3210/3239]	Time 0.228 (0.467)	Data Time 0.000 (0.010)	Loss 2.8400 (2.9556)	Entropy 0.68018 (0.68802)	Top-1 acc 57.812 (53.016)	Top-5 acc 79.297 (75.785)	lr 0.01958
Train [37][3220/3239]	Time 0.239 (0.467)	Data Time 0.000 (0.010)	Loss 2.9588 (2.9557)	Entropy 0.68018 (0.68799)	Top-1 acc 57.031 (53.015)	Top-5 acc 74.219 (75.786)	lr 0.01958
Train [37][3230/3239]	Time 0.233 (0.466)	Data Time 0.000 (0.010)	Loss 2.8379 (2.9553)	Entropy 0.68011 (0.68797)	Top-1 acc 55.469 (53.020)	Top-5 acc 77.734 (75.796)	lr 0.01958
Train [37][3239/3239]	Time 1.017 (0.466)	Data Time 0.000 (0.010)	Loss 3.4023 (2.9554)	Entropy 0.68027 (0.68795)	Top-1 acc 39.506 (53.018)	Top-5 acc 69.136 (75.796)	lr 0.01958
==========Valid [37/120]	loss 1.664	top-1 acc 62.371 (62.371)	top-5 acc 83.685	Train top-1 53.018	top-5 75.796	Entropy 0.68027	Latency-None: 0.000ms	Flops: 539.76M
Train [38][0/3239]	Time 32.252 (32.252)	Data Time 30.077 (30.077)	Loss 3.0449 (3.0449)	Entropy 0.68004 (0.68004)	Top-1 acc 50.781 (50.781)	Top-5 acc 74.609 (74.609)	lr 0.01958
Train [38][10/3239]	Time 0.298 (3.575)	Data Time 0.001 (2.825)	Loss 2.9877 (2.9614)	Entropy 0.67990 (0.67995)	Top-1 acc 53.516 (51.989)	Top-5 acc 71.875 (75.675)	lr 0.01958
Train [38][20/3239]	Time 0.326 (2.070)	Data Time 0.001 (1.481)	Loss 2.9879 (2.9293)	Entropy 0.67997 (0.67996)	Top-1 acc 55.078 (53.460)	Top-5 acc 73.438 (76.153)	lr 0.01958
Train [38][30/3239]	Time 0.270 (1.539)	Data Time 0.002 (1.004)	Loss 2.9180 (2.9375)	Entropy 0.68029 (0.67998)	Top-1 acc 53.125 (53.238)	Top-5 acc 75.000 (75.857)	lr 0.01958
Train [38][40/3239]	Time 0.265 (1.268)	Data Time 0.002 (0.759)	Loss 2.7849 (2.9283)	Entropy 0.68028 (0.68005)	Top-1 acc 56.250 (53.325)	Top-5 acc 80.078 (76.239)	lr 0.01958
Train [38][50/3239]	Time 0.236 (1.105)	Data Time 0.001 (0.611)	Loss 2.9352 (2.9264)	Entropy 0.68067 (0.68013)	Top-1 acc 55.469 (53.539)	Top-5 acc 72.266 (76.248)	lr 0.01958
Train [38][60/3239]	Time 0.238 (0.992)	Data Time 0.001 (0.511)	Loss 2.8596 (2.9221)	Entropy 0.67999 (0.68020)	Top-1 acc 57.422 (53.554)	Top-5 acc 76.953 (76.351)	lr 0.01958
Train [38][70/3239]	Time 0.230 (0.914)	Data Time 0.001 (0.439)	Loss 2.8168 (2.9318)	Entropy 0.67997 (0.68016)	Top-1 acc 55.078 (53.230)	Top-5 acc 76.953 (76.177)	lr 0.01957
Train [38][80/3239]	Time 0.221 (0.851)	Data Time 0.001 (0.385)	Loss 3.0183 (2.9329)	Entropy 0.67987 (0.68013)	Top-1 acc 53.516 (53.313)	Top-5 acc 76.172 (76.225)	lr 0.01957
Train [38][90/3239]	Time 0.334 (0.804)	Data Time 0.001 (0.343)	Loss 2.9756 (2.9339)	Entropy 0.67992 (0.68009)	Top-1 acc 51.562 (53.331)	Top-5 acc 75.000 (76.198)	lr 0.01957
Train [38][100/3239]	Time 0.235 (0.765)	Data Time 0.001 (0.309)	Loss 2.9795 (2.9310)	Entropy 0.67987 (0.68007)	Top-1 acc 56.641 (53.434)	Top-5 acc 75.000 (76.245)	lr 0.01957
Train [38][110/3239]	Time 0.236 (0.736)	Data Time 0.001 (0.281)	Loss 3.0529 (2.9338)	Entropy 0.67987 (0.68005)	Top-1 acc 53.906 (53.357)	Top-5 acc 74.609 (76.175)	lr 0.01957
Train [38][120/3239]	Time 0.236 (0.710)	Data Time 0.001 (0.258)	Loss 2.8338 (2.9332)	Entropy 0.68007 (0.68004)	Top-1 acc 55.078 (53.370)	Top-5 acc 76.562 (76.188)	lr 0.01957
Train [38][130/3239]	Time 0.235 (0.690)	Data Time 0.001 (0.239)	Loss 2.6744 (2.9251)	Entropy 0.68000 (0.68004)	Top-1 acc 57.422 (53.522)	Top-5 acc 81.641 (76.288)	lr 0.01957
Train [38][140/3239]	Time 0.233 (0.671)	Data Time 0.001 (0.222)	Loss 2.7653 (2.9270)	Entropy 0.67990 (0.68004)	Top-1 acc 57.812 (53.505)	Top-5 acc 78.516 (76.313)	lr 0.01957
Train [38][150/3239]	Time 0.250 (0.653)	Data Time 0.001 (0.207)	Loss 2.7951 (2.9229)	Entropy 0.67992 (0.68003)	Top-1 acc 57.031 (53.557)	Top-5 acc 75.781 (76.379)	lr 0.01957
Train [38][160/3239]	Time 0.266 (0.639)	Data Time 0.001 (0.194)	Loss 2.9565 (2.9202)	Entropy 0.67925 (0.68001)	Top-1 acc 51.172 (53.635)	Top-5 acc 73.828 (76.381)	lr 0.01957
Train [38][170/3239]	Time 0.237 (0.626)	Data Time 0.001 (0.183)	Loss 2.7316 (2.9163)	Entropy 0.67905 (0.67996)	Top-1 acc 57.422 (53.742)	Top-5 acc 78.906 (76.467)	lr 0.01957
Train [38][180/3239]	Time 0.237 (0.614)	Data Time 0.001 (0.173)	Loss 3.2617 (2.9193)	Entropy 0.67939 (0.67992)	Top-1 acc 43.750 (53.624)	Top-5 acc 71.484 (76.424)	lr 0.01957
Train [38][190/3239]	Time 0.243 (0.604)	Data Time 0.001 (0.164)	Loss 3.1211 (2.9203)	Entropy 0.67900 (0.67989)	Top-1 acc 48.828 (53.669)	Top-5 acc 73.047 (76.440)	lr 0.01956
Train [38][200/3239]	Time 0.249 (0.595)	Data Time 0.001 (0.156)	Loss 2.9116 (2.9187)	Entropy 0.67913 (0.67985)	Top-1 acc 53.125 (53.745)	Top-5 acc 77.734 (76.442)	lr 0.01956
Train [38][210/3239]	Time 0.225 (0.586)	Data Time 0.001 (0.149)	Loss 2.9104 (2.9193)	Entropy 0.67912 (0.67982)	Top-1 acc 56.250 (53.754)	Top-5 acc 76.172 (76.450)	lr 0.01956
Train [38][220/3239]	Time 0.252 (0.579)	Data Time 0.001 (0.142)	Loss 2.8842 (2.9182)	Entropy 0.67901 (0.67979)	Top-1 acc 55.078 (53.722)	Top-5 acc 77.734 (76.483)	lr 0.01956
Train [38][230/3239]	Time 0.244 (0.573)	Data Time 0.001 (0.136)	Loss 2.9087 (2.9180)	Entropy 0.67893 (0.67975)	Top-1 acc 54.688 (53.744)	Top-5 acc 77.344 (76.461)	lr 0.01956
Train [38][240/3239]	Time 0.227 (0.566)	Data Time 0.001 (0.131)	Loss 3.1870 (2.9197)	Entropy 0.67917 (0.67972)	Top-1 acc 49.609 (53.683)	Top-5 acc 72.266 (76.426)	lr 0.01956
Train [38][250/3239]	Time 0.340 (0.560)	Data Time 0.001 (0.125)	Loss 3.1167 (2.9189)	Entropy 0.67878 (0.67969)	Top-1 acc 49.219 (53.704)	Top-5 acc 73.828 (76.413)	lr 0.01956
Train [38][260/3239]	Time 0.231 (0.554)	Data Time 0.001 (0.121)	Loss 3.3096 (2.9209)	Entropy 0.67869 (0.67966)	Top-1 acc 47.656 (53.683)	Top-5 acc 66.016 (76.363)	lr 0.01956
Train [38][270/3239]	Time 0.241 (0.549)	Data Time 0.002 (0.116)	Loss 2.8358 (2.9211)	Entropy 0.67869 (0.67962)	Top-1 acc 53.516 (53.686)	Top-5 acc 78.125 (76.377)	lr 0.01956
Train [38][280/3239]	Time 0.223 (0.544)	Data Time 0.001 (0.112)	Loss 3.0583 (2.9213)	Entropy 0.67861 (0.67958)	Top-1 acc 50.391 (53.667)	Top-5 acc 74.219 (76.390)	lr 0.01956
Train [38][290/3239]	Time 0.256 (0.540)	Data Time 0.001 (0.108)	Loss 2.7167 (2.9180)	Entropy 0.67889 (0.67956)	Top-1 acc 57.812 (53.708)	Top-5 acc 78.125 (76.446)	lr 0.01956
Train [38][300/3239]	Time 0.253 (0.535)	Data Time 0.001 (0.105)	Loss 2.7365 (2.9180)	Entropy 0.67892 (0.67954)	Top-1 acc 58.594 (53.741)	Top-5 acc 79.297 (76.433)	lr 0.01956
Train [38][310/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.102)	Loss 2.6528 (2.9180)	Entropy 0.67907 (0.67952)	Top-1 acc 57.031 (53.748)	Top-5 acc 82.812 (76.426)	lr 0.01955
Train [38][320/3239]	Time 0.352 (0.527)	Data Time 0.001 (0.098)	Loss 2.8649 (2.9211)	Entropy 0.67954 (0.67951)	Top-1 acc 57.422 (53.679)	Top-5 acc 77.734 (76.350)	lr 0.01955
Train [38][330/3239]	Time 0.246 (0.523)	Data Time 0.001 (0.095)	Loss 2.7576 (2.9211)	Entropy 0.67964 (0.67951)	Top-1 acc 57.031 (53.682)	Top-5 acc 79.297 (76.371)	lr 0.01955
Train [38][340/3239]	Time 0.231 (0.519)	Data Time 0.001 (0.093)	Loss 3.0681 (2.9232)	Entropy 0.67944 (0.67951)	Top-1 acc 48.047 (53.637)	Top-5 acc 73.438 (76.349)	lr 0.01955
Train [38][350/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.090)	Loss 3.1416 (2.9244)	Entropy 0.67903 (0.67950)	Top-1 acc 50.000 (53.625)	Top-5 acc 70.703 (76.314)	lr 0.01955
Train [38][360/3239]	Time 0.244 (0.513)	Data Time 0.001 (0.088)	Loss 3.0495 (2.9253)	Entropy 0.67889 (0.67949)	Top-1 acc 53.516 (53.628)	Top-5 acc 76.172 (76.295)	lr 0.01955
Train [38][370/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.085)	Loss 2.9418 (2.9243)	Entropy 0.67904 (0.67948)	Top-1 acc 50.781 (53.623)	Top-5 acc 77.344 (76.336)	lr 0.01955
Train [38][380/3239]	Time 0.236 (0.508)	Data Time 0.001 (0.083)	Loss 2.8978 (2.9248)	Entropy 0.67871 (0.67946)	Top-1 acc 52.734 (53.608)	Top-5 acc 78.906 (76.331)	lr 0.01955
Train [38][390/3239]	Time 0.265 (0.506)	Data Time 0.001 (0.081)	Loss 2.9243 (2.9238)	Entropy 0.67839 (0.67944)	Top-1 acc 52.734 (53.625)	Top-5 acc 76.953 (76.357)	lr 0.01955
Train [38][400/3239]	Time 0.258 (0.504)	Data Time 0.001 (0.079)	Loss 3.1587 (2.9230)	Entropy 0.67822 (0.67942)	Top-1 acc 46.875 (53.635)	Top-5 acc 73.047 (76.371)	lr 0.01955
Train [38][410/3239]	Time 0.334 (0.502)	Data Time 0.001 (0.077)	Loss 2.9001 (2.9224)	Entropy 0.67798 (0.67939)	Top-1 acc 52.344 (53.647)	Top-5 acc 75.391 (76.368)	lr 0.01955
Train [38][420/3239]	Time 0.223 (0.499)	Data Time 0.001 (0.075)	Loss 2.8505 (2.9213)	Entropy 0.67778 (0.67935)	Top-1 acc 56.641 (53.663)	Top-5 acc 78.125 (76.396)	lr 0.01955
Train [38][430/3239]	Time 0.219 (0.497)	Data Time 0.001 (0.074)	Loss 2.8682 (2.9217)	Entropy 0.67759 (0.67931)	Top-1 acc 54.297 (53.652)	Top-5 acc 75.781 (76.367)	lr 0.01954
Train [38][440/3239]	Time 0.224 (0.495)	Data Time 0.001 (0.072)	Loss 2.9515 (2.9211)	Entropy 0.67786 (0.67927)	Top-1 acc 52.344 (53.670)	Top-5 acc 75.781 (76.373)	lr 0.01954
Train [38][450/3239]	Time 0.229 (0.493)	Data Time 0.001 (0.070)	Loss 3.2290 (2.9216)	Entropy 0.67816 (0.67924)	Top-1 acc 45.312 (53.655)	Top-5 acc 70.312 (76.359)	lr 0.01954
Train [38][460/3239]	Time 0.236 (0.491)	Data Time 0.001 (0.069)	Loss 2.9775 (2.9233)	Entropy 0.67836 (0.67922)	Top-1 acc 52.344 (53.633)	Top-5 acc 74.219 (76.332)	lr 0.01954
Train [38][470/3239]	Time 0.232 (0.489)	Data Time 0.001 (0.068)	Loss 2.9342 (2.9239)	Entropy 0.67836 (0.67920)	Top-1 acc 54.297 (53.640)	Top-5 acc 75.781 (76.335)	lr 0.01954
Train [38][480/3239]	Time 0.332 (0.488)	Data Time 0.001 (0.066)	Loss 3.1296 (2.9229)	Entropy 0.67832 (0.67918)	Top-1 acc 47.266 (53.666)	Top-5 acc 70.703 (76.364)	lr 0.01954
Train [38][490/3239]	Time 0.231 (0.486)	Data Time 0.001 (0.065)	Loss 2.8174 (2.9234)	Entropy 0.67846 (0.67917)	Top-1 acc 54.297 (53.638)	Top-5 acc 78.906 (76.353)	lr 0.01954
Train [38][500/3239]	Time 0.233 (0.484)	Data Time 0.001 (0.064)	Loss 2.8316 (2.9238)	Entropy 0.67828 (0.67915)	Top-1 acc 57.031 (53.627)	Top-5 acc 78.906 (76.347)	lr 0.01954
Train [38][510/3239]	Time 0.238 (0.483)	Data Time 0.001 (0.062)	Loss 3.2402 (2.9243)	Entropy 0.67829 (0.67913)	Top-1 acc 50.391 (53.628)	Top-5 acc 70.703 (76.335)	lr 0.01954
Train [38][520/3239]	Time 0.235 (0.482)	Data Time 0.001 (0.061)	Loss 2.8510 (2.9246)	Entropy 0.67833 (0.67912)	Top-1 acc 57.422 (53.636)	Top-5 acc 75.391 (76.323)	lr 0.01954
Train [38][530/3239]	Time 0.238 (0.480)	Data Time 0.001 (0.060)	Loss 2.7473 (2.9244)	Entropy 0.67811 (0.67910)	Top-1 acc 58.984 (53.633)	Top-5 acc 80.078 (76.334)	lr 0.01954
Train [38][540/3239]	Time 0.241 (0.479)	Data Time 0.001 (0.059)	Loss 2.8405 (2.9253)	Entropy 0.67833 (0.67909)	Top-1 acc 56.641 (53.611)	Top-5 acc 77.734 (76.315)	lr 0.01954
Train [38][550/3239]	Time 0.230 (0.478)	Data Time 0.001 (0.058)	Loss 2.7612 (2.9256)	Entropy 0.67869 (0.67908)	Top-1 acc 57.422 (53.613)	Top-5 acc 79.688 (76.332)	lr 0.01953
Train [38][560/3239]	Time 0.234 (0.476)	Data Time 0.001 (0.057)	Loss 2.7958 (2.9255)	Entropy 0.67824 (0.67907)	Top-1 acc 55.078 (53.627)	Top-5 acc 79.688 (76.339)	lr 0.01953
Train [38][570/3239]	Time 0.255 (0.475)	Data Time 0.001 (0.056)	Loss 3.0217 (2.9258)	Entropy 0.67842 (0.67905)	Top-1 acc 50.000 (53.631)	Top-5 acc 75.391 (76.346)	lr 0.01953
Train [38][580/3239]	Time 0.234 (0.474)	Data Time 0.001 (0.055)	Loss 3.0288 (2.9253)	Entropy 0.67842 (0.67904)	Top-1 acc 53.906 (53.642)	Top-5 acc 75.391 (76.351)	lr 0.01953
Train [38][590/3239]	Time 0.231 (0.473)	Data Time 0.001 (0.054)	Loss 2.8134 (2.9245)	Entropy 0.67852 (0.67904)	Top-1 acc 57.422 (53.654)	Top-5 acc 80.469 (76.372)	lr 0.01953
Train [38][600/3239]	Time 0.254 (0.472)	Data Time 0.001 (0.053)	Loss 2.9829 (2.9250)	Entropy 0.67849 (0.67903)	Top-1 acc 53.906 (53.659)	Top-5 acc 74.609 (76.357)	lr 0.01953
Train [38][610/3239]	Time 0.345 (0.525)	Data Time 0.004 (0.052)	Loss 2.7382 (2.9256)	Entropy 0.67873 (0.67902)	Top-1 acc 57.031 (53.653)	Top-5 acc 78.516 (76.353)	lr 0.01953
Train [38][620/3239]	Time 0.232 (0.523)	Data Time 0.002 (0.052)	Loss 2.8384 (2.9256)	Entropy 0.67851 (0.67901)	Top-1 acc 57.031 (53.662)	Top-5 acc 75.391 (76.352)	lr 0.01953
Train [38][630/3239]	Time 0.242 (0.522)	Data Time 0.002 (0.051)	Loss 3.1799 (2.9256)	Entropy 0.67865 (0.67900)	Top-1 acc 46.875 (53.650)	Top-5 acc 71.484 (76.345)	lr 0.01953
Train [38][640/3239]	Time 0.362 (0.520)	Data Time 0.001 (0.050)	Loss 2.8574 (2.9267)	Entropy 0.67846 (0.67900)	Top-1 acc 55.078 (53.619)	Top-5 acc 75.391 (76.340)	lr 0.01953
Train [38][650/3239]	Time 0.272 (0.519)	Data Time 0.001 (0.049)	Loss 2.7754 (2.9264)	Entropy 0.67845 (0.67899)	Top-1 acc 55.859 (53.618)	Top-5 acc 79.297 (76.348)	lr 0.01953
Train [38][660/3239]	Time 0.271 (0.517)	Data Time 0.002 (0.049)	Loss 2.8267 (2.9262)	Entropy 0.67856 (0.67898)	Top-1 acc 56.641 (53.614)	Top-5 acc 79.297 (76.358)	lr 0.01953
Train [38][670/3239]	Time 0.271 (0.516)	Data Time 0.001 (0.048)	Loss 2.9394 (2.9266)	Entropy 0.67834 (0.67897)	Top-1 acc 52.734 (53.609)	Top-5 acc 75.000 (76.362)	lr 0.01952
Train [38][680/3239]	Time 0.244 (0.515)	Data Time 0.001 (0.047)	Loss 3.0487 (2.9266)	Entropy 0.67807 (0.67896)	Top-1 acc 51.562 (53.598)	Top-5 acc 74.609 (76.362)	lr 0.01952
Train [38][690/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.047)	Loss 2.9596 (2.9267)	Entropy 0.67805 (0.67895)	Top-1 acc 50.781 (53.604)	Top-5 acc 76.172 (76.363)	lr 0.01952
Train [38][700/3239]	Time 0.246 (0.512)	Data Time 0.001 (0.046)	Loss 2.8697 (2.9266)	Entropy 0.67797 (0.67894)	Top-1 acc 55.469 (53.602)	Top-5 acc 78.516 (76.379)	lr 0.01952
Train [38][710/3239]	Time 0.240 (0.510)	Data Time 0.001 (0.045)	Loss 3.0222 (2.9260)	Entropy 0.67778 (0.67892)	Top-1 acc 50.391 (53.615)	Top-5 acc 76.562 (76.388)	lr 0.01952
Train [38][720/3239]	Time 0.223 (0.509)	Data Time 0.001 (0.045)	Loss 3.0273 (2.9262)	Entropy 0.67734 (0.67890)	Top-1 acc 53.125 (53.615)	Top-5 acc 74.219 (76.379)	lr 0.01952
Train [38][730/3239]	Time 0.258 (0.507)	Data Time 0.001 (0.044)	Loss 2.8633 (2.9270)	Entropy 0.67747 (0.67888)	Top-1 acc 53.516 (53.600)	Top-5 acc 79.688 (76.365)	lr 0.01952
Train [38][740/3239]	Time 0.246 (0.506)	Data Time 0.001 (0.044)	Loss 2.7948 (2.9266)	Entropy 0.67734 (0.67886)	Top-1 acc 56.641 (53.604)	Top-5 acc 78.906 (76.369)	lr 0.01952
Train [38][750/3239]	Time 0.231 (0.505)	Data Time 0.001 (0.043)	Loss 3.0185 (2.9258)	Entropy 0.67722 (0.67884)	Top-1 acc 57.031 (53.635)	Top-5 acc 73.828 (76.381)	lr 0.01952
Train [38][760/3239]	Time 0.263 (0.504)	Data Time 0.002 (0.042)	Loss 2.8410 (2.9271)	Entropy 0.67765 (0.67882)	Top-1 acc 56.641 (53.599)	Top-5 acc 77.734 (76.343)	lr 0.01952
Train [38][770/3239]	Time 0.220 (0.503)	Data Time 0.001 (0.042)	Loss 3.0008 (2.9275)	Entropy 0.67785 (0.67881)	Top-1 acc 52.344 (53.603)	Top-5 acc 73.438 (76.338)	lr 0.01952
Train [38][780/3239]	Time 0.214 (0.501)	Data Time 0.001 (0.041)	Loss 2.9961 (2.9276)	Entropy 0.67833 (0.67880)	Top-1 acc 52.734 (53.591)	Top-5 acc 76.172 (76.350)	lr 0.01952
Train [38][790/3239]	Time 0.233 (0.500)	Data Time 0.001 (0.041)	Loss 2.9747 (2.9276)	Entropy 0.67840 (0.67880)	Top-1 acc 53.125 (53.605)	Top-5 acc 72.656 (76.355)	lr 0.01951
Train [38][800/3239]	Time 0.345 (0.499)	Data Time 0.001 (0.040)	Loss 2.8538 (2.9273)	Entropy 0.67808 (0.67879)	Top-1 acc 51.172 (53.606)	Top-5 acc 79.688 (76.371)	lr 0.01951
Train [38][810/3239]	Time 0.220 (0.498)	Data Time 0.001 (0.040)	Loss 2.8846 (2.9275)	Entropy 0.67810 (0.67878)	Top-1 acc 54.297 (53.597)	Top-5 acc 77.344 (76.367)	lr 0.01951
Train [38][820/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.039)	Loss 2.8029 (2.9270)	Entropy 0.67834 (0.67877)	Top-1 acc 51.562 (53.604)	Top-5 acc 78.125 (76.377)	lr 0.01951
Train [38][830/3239]	Time 0.233 (0.496)	Data Time 0.001 (0.039)	Loss 2.9080 (2.9275)	Entropy 0.67856 (0.67877)	Top-1 acc 53.906 (53.606)	Top-5 acc 79.297 (76.355)	lr 0.01951
Train [38][840/3239]	Time 0.232 (0.495)	Data Time 0.001 (0.039)	Loss 2.8733 (2.9283)	Entropy 0.67833 (0.67876)	Top-1 acc 55.469 (53.586)	Top-5 acc 78.125 (76.338)	lr 0.01951
Train [38][850/3239]	Time 0.227 (0.494)	Data Time 0.001 (0.038)	Loss 3.1498 (2.9290)	Entropy 0.67813 (0.67876)	Top-1 acc 49.609 (53.565)	Top-5 acc 71.094 (76.318)	lr 0.01951
Train [38][860/3239]	Time 0.228 (0.493)	Data Time 0.001 (0.038)	Loss 2.8932 (2.9291)	Entropy 0.67808 (0.67875)	Top-1 acc 55.859 (53.562)	Top-5 acc 77.734 (76.318)	lr 0.01951
Train [38][870/3239]	Time 0.328 (0.492)	Data Time 0.001 (0.037)	Loss 2.9888 (2.9289)	Entropy 0.67770 (0.67874)	Top-1 acc 48.828 (53.565)	Top-5 acc 75.781 (76.331)	lr 0.01951
Train [38][880/3239]	Time 0.238 (0.491)	Data Time 0.001 (0.037)	Loss 2.9698 (2.9288)	Entropy 0.67753 (0.67873)	Top-1 acc 52.344 (53.572)	Top-5 acc 75.000 (76.339)	lr 0.01951
Train [38][890/3239]	Time 0.230 (0.490)	Data Time 0.001 (0.037)	Loss 2.9746 (2.9287)	Entropy 0.67797 (0.67872)	Top-1 acc 55.078 (53.574)	Top-5 acc 76.172 (76.337)	lr 0.01951
Train [38][900/3239]	Time 0.237 (0.489)	Data Time 0.001 (0.036)	Loss 3.0465 (2.9288)	Entropy 0.67799 (0.67871)	Top-1 acc 50.391 (53.566)	Top-5 acc 73.438 (76.336)	lr 0.01950
Train [38][910/3239]	Time 0.243 (0.489)	Data Time 0.002 (0.036)	Loss 2.8414 (2.9291)	Entropy 0.67780 (0.67870)	Top-1 acc 54.297 (53.570)	Top-5 acc 76.953 (76.331)	lr 0.01950
Train [38][920/3239]	Time 0.239 (0.488)	Data Time 0.002 (0.035)	Loss 2.8716 (2.9290)	Entropy 0.67772 (0.67869)	Top-1 acc 51.953 (53.556)	Top-5 acc 75.781 (76.328)	lr 0.01950
Train [38][930/3239]	Time 0.231 (0.487)	Data Time 0.001 (0.035)	Loss 2.9686 (2.9295)	Entropy 0.67789 (0.67868)	Top-1 acc 50.000 (53.536)	Top-5 acc 76.953 (76.320)	lr 0.01950
Train [38][940/3239]	Time 0.241 (0.487)	Data Time 0.001 (0.035)	Loss 3.0079 (2.9298)	Entropy 0.67734 (0.67867)	Top-1 acc 51.172 (53.530)	Top-5 acc 75.781 (76.307)	lr 0.01950
Train [38][950/3239]	Time 0.224 (0.486)	Data Time 0.001 (0.034)	Loss 2.8497 (2.9298)	Entropy 0.67707 (0.67866)	Top-1 acc 53.516 (53.528)	Top-5 acc 77.344 (76.313)	lr 0.01950
Train [38][960/3239]	Time 0.326 (0.485)	Data Time 0.001 (0.034)	Loss 3.0646 (2.9302)	Entropy 0.67637 (0.67864)	Top-1 acc 53.516 (53.522)	Top-5 acc 72.656 (76.313)	lr 0.01950
Train [38][970/3239]	Time 0.229 (0.484)	Data Time 0.001 (0.034)	Loss 2.9425 (2.9303)	Entropy 0.67620 (0.67861)	Top-1 acc 57.031 (53.528)	Top-5 acc 76.562 (76.311)	lr 0.01950
Train [38][980/3239]	Time 0.228 (0.483)	Data Time 0.001 (0.033)	Loss 3.1186 (2.9305)	Entropy 0.67644 (0.67859)	Top-1 acc 49.609 (53.534)	Top-5 acc 73.828 (76.313)	lr 0.01950
Train [38][990/3239]	Time 0.231 (0.483)	Data Time 0.001 (0.033)	Loss 3.0271 (2.9311)	Entropy 0.67639 (0.67857)	Top-1 acc 47.656 (53.518)	Top-5 acc 75.781 (76.307)	lr 0.01950
Train [38][1000/3239]	Time 0.234 (0.482)	Data Time 0.002 (0.033)	Loss 2.9080 (2.9305)	Entropy 0.67610 (0.67855)	Top-1 acc 53.906 (53.539)	Top-5 acc 78.516 (76.324)	lr 0.01950
Train [38][1010/3239]	Time 0.225 (0.481)	Data Time 0.001 (0.032)	Loss 2.8189 (2.9308)	Entropy 0.67610 (0.67852)	Top-1 acc 57.031 (53.536)	Top-5 acc 78.906 (76.316)	lr 0.01950
Train [38][1020/3239]	Time 0.232 (0.480)	Data Time 0.001 (0.032)	Loss 2.7016 (2.9303)	Entropy 0.67579 (0.67850)	Top-1 acc 60.547 (53.545)	Top-5 acc 80.469 (76.325)	lr 0.01949
Train [38][1030/3239]	Time 0.314 (0.480)	Data Time 0.001 (0.032)	Loss 3.1094 (2.9303)	Entropy 0.67552 (0.67847)	Top-1 acc 51.172 (53.538)	Top-5 acc 71.875 (76.333)	lr 0.01949
Train [38][1040/3239]	Time 0.231 (0.479)	Data Time 0.001 (0.031)	Loss 2.8048 (2.9302)	Entropy 0.67576 (0.67844)	Top-1 acc 57.422 (53.534)	Top-5 acc 77.734 (76.335)	lr 0.01949
Train [38][1050/3239]	Time 0.221 (0.478)	Data Time 0.001 (0.031)	Loss 2.9630 (2.9304)	Entropy 0.67572 (0.67842)	Top-1 acc 54.688 (53.541)	Top-5 acc 72.266 (76.327)	lr 0.01949
Train [38][1060/3239]	Time 0.234 (0.477)	Data Time 0.001 (0.031)	Loss 2.7350 (2.9308)	Entropy 0.67589 (0.67839)	Top-1 acc 59.375 (53.539)	Top-5 acc 81.250 (76.321)	lr 0.01949
Train [38][1070/3239]	Time 0.233 (0.476)	Data Time 0.001 (0.031)	Loss 2.9463 (2.9310)	Entropy 0.67610 (0.67837)	Top-1 acc 54.688 (53.538)	Top-5 acc 75.000 (76.319)	lr 0.01949
Train [38][1080/3239]	Time 0.234 (0.476)	Data Time 0.001 (0.030)	Loss 3.0418 (2.9308)	Entropy 0.67630 (0.67835)	Top-1 acc 47.266 (53.539)	Top-5 acc 76.562 (76.332)	lr 0.01949
Train [38][1090/3239]	Time 0.233 (0.475)	Data Time 0.001 (0.030)	Loss 3.0310 (2.9307)	Entropy 0.67601 (0.67833)	Top-1 acc 50.000 (53.538)	Top-5 acc 74.609 (76.332)	lr 0.01949
Train [38][1100/3239]	Time 0.232 (0.474)	Data Time 0.001 (0.030)	Loss 3.0030 (2.9309)	Entropy 0.67604 (0.67831)	Top-1 acc 53.125 (53.534)	Top-5 acc 72.656 (76.327)	lr 0.01949
Train [38][1110/3239]	Time 0.226 (0.474)	Data Time 0.001 (0.030)	Loss 2.9798 (2.9313)	Entropy 0.67592 (0.67828)	Top-1 acc 48.438 (53.520)	Top-5 acc 77.344 (76.321)	lr 0.01949
Train [38][1120/3239]	Time 0.316 (0.473)	Data Time 0.001 (0.029)	Loss 2.9290 (2.9316)	Entropy 0.67626 (0.67826)	Top-1 acc 55.859 (53.513)	Top-5 acc 75.391 (76.312)	lr 0.01949
Train [38][1130/3239]	Time 0.230 (0.473)	Data Time 0.001 (0.029)	Loss 2.9658 (2.9318)	Entropy 0.67631 (0.67825)	Top-1 acc 55.859 (53.512)	Top-5 acc 75.000 (76.309)	lr 0.01949
Train [38][1140/3239]	Time 0.249 (0.472)	Data Time 0.002 (0.029)	Loss 2.9876 (2.9320)	Entropy 0.67583 (0.67823)	Top-1 acc 53.516 (53.506)	Top-5 acc 75.000 (76.313)	lr 0.01948
Train [38][1150/3239]	Time 0.228 (0.471)	Data Time 0.001 (0.029)	Loss 2.9299 (2.9313)	Entropy 0.67569 (0.67821)	Top-1 acc 56.250 (53.524)	Top-5 acc 76.953 (76.328)	lr 0.01948
Train [38][1160/3239]	Time 0.221 (0.471)	Data Time 0.001 (0.028)	Loss 2.9532 (2.9310)	Entropy 0.67553 (0.67818)	Top-1 acc 53.906 (53.537)	Top-5 acc 75.391 (76.331)	lr 0.01948
Train [38][1170/3239]	Time 0.232 (0.470)	Data Time 0.001 (0.028)	Loss 2.9003 (2.9309)	Entropy 0.67535 (0.67816)	Top-1 acc 50.391 (53.539)	Top-5 acc 76.562 (76.338)	lr 0.01948
Train [38][1180/3239]	Time 0.231 (0.470)	Data Time 0.001 (0.028)	Loss 2.8362 (2.9307)	Entropy 0.67590 (0.67814)	Top-1 acc 59.375 (53.538)	Top-5 acc 76.953 (76.342)	lr 0.01948
Train [38][1190/3239]	Time 0.327 (0.469)	Data Time 0.001 (0.028)	Loss 2.9183 (2.9307)	Entropy 0.67586 (0.67812)	Top-1 acc 52.344 (53.535)	Top-5 acc 75.781 (76.341)	lr 0.01948
Train [38][1200/3239]	Time 0.227 (0.468)	Data Time 0.001 (0.027)	Loss 2.9656 (2.9306)	Entropy 0.67611 (0.67810)	Top-1 acc 52.734 (53.534)	Top-5 acc 74.609 (76.341)	lr 0.01948
Train [38][1210/3239]	Time 0.231 (0.468)	Data Time 0.001 (0.027)	Loss 2.8737 (2.9309)	Entropy 0.67625 (0.67808)	Top-1 acc 58.203 (53.522)	Top-5 acc 75.781 (76.334)	lr 0.01948
Train [38][1220/3239]	Time 0.230 (0.467)	Data Time 0.001 (0.027)	Loss 2.9089 (2.9310)	Entropy 0.67619 (0.67807)	Top-1 acc 55.859 (53.521)	Top-5 acc 77.734 (76.340)	lr 0.01948
Train [38][1230/3239]	Time 0.224 (0.467)	Data Time 0.001 (0.027)	Loss 2.8858 (2.9315)	Entropy 0.67614 (0.67805)	Top-1 acc 57.422 (53.502)	Top-5 acc 76.562 (76.335)	lr 0.01948
Train [38][1240/3239]	Time 0.233 (0.466)	Data Time 0.001 (0.027)	Loss 3.0321 (2.9318)	Entropy 0.67624 (0.67804)	Top-1 acc 49.609 (53.494)	Top-5 acc 72.266 (76.324)	lr 0.01948
Train [38][1250/3239]	Time 0.226 (0.466)	Data Time 0.001 (0.026)	Loss 3.1482 (2.9323)	Entropy 0.67610 (0.67802)	Top-1 acc 48.828 (53.481)	Top-5 acc 69.922 (76.308)	lr 0.01948
Train [38][1260/3239]	Time 0.229 (0.465)	Data Time 0.001 (0.026)	Loss 3.3881 (2.9329)	Entropy 0.67584 (0.67801)	Top-1 acc 42.578 (53.471)	Top-5 acc 65.234 (76.289)	lr 0.01947
Train [38][1270/3239]	Time 0.257 (0.491)	Data Time 0.002 (0.026)	Loss 3.2029 (2.9329)	Entropy 0.67519 (0.67799)	Top-1 acc 50.391 (53.478)	Top-5 acc 68.750 (76.289)	lr 0.01947
Train [38][1280/3239]	Time 0.330 (0.490)	Data Time 0.002 (0.026)	Loss 3.1840 (2.9332)	Entropy 0.67542 (0.67797)	Top-1 acc 50.391 (53.472)	Top-5 acc 70.312 (76.280)	lr 0.01947
Train [38][1290/3239]	Time 0.258 (0.490)	Data Time 0.001 (0.026)	Loss 2.8662 (2.9329)	Entropy 0.67546 (0.67795)	Top-1 acc 54.297 (53.481)	Top-5 acc 78.516 (76.287)	lr 0.01947
Train [38][1300/3239]	Time 0.233 (0.489)	Data Time 0.001 (0.026)	Loss 2.9564 (2.9323)	Entropy 0.67553 (0.67793)	Top-1 acc 53.516 (53.488)	Top-5 acc 76.172 (76.298)	lr 0.01947
Train [38][1310/3239]	Time 0.234 (0.489)	Data Time 0.001 (0.025)	Loss 2.8533 (2.9324)	Entropy 0.67557 (0.67791)	Top-1 acc 52.734 (53.486)	Top-5 acc 78.516 (76.296)	lr 0.01947
Train [38][1320/3239]	Time 0.234 (0.488)	Data Time 0.001 (0.025)	Loss 2.9985 (2.9328)	Entropy 0.67548 (0.67789)	Top-1 acc 53.125 (53.475)	Top-5 acc 75.391 (76.282)	lr 0.01947
Train [38][1330/3239]	Time 0.229 (0.488)	Data Time 0.001 (0.025)	Loss 3.2045 (2.9329)	Entropy 0.67551 (0.67787)	Top-1 acc 48.047 (53.471)	Top-5 acc 73.047 (76.284)	lr 0.01947
Train [38][1340/3239]	Time 0.235 (0.487)	Data Time 0.001 (0.025)	Loss 2.8218 (2.9323)	Entropy 0.67561 (0.67786)	Top-1 acc 57.422 (53.493)	Top-5 acc 77.344 (76.296)	lr 0.01947
Train [38][1350/3239]	Time 0.331 (0.486)	Data Time 0.001 (0.025)	Loss 2.8751 (2.9314)	Entropy 0.67542 (0.67784)	Top-1 acc 52.734 (53.512)	Top-5 acc 77.734 (76.318)	lr 0.01947
Train [38][1360/3239]	Time 0.233 (0.486)	Data Time 0.001 (0.024)	Loss 2.8776 (2.9319)	Entropy 0.67535 (0.67782)	Top-1 acc 53.125 (53.502)	Top-5 acc 80.078 (76.310)	lr 0.01947
Train [38][1370/3239]	Time 0.231 (0.485)	Data Time 0.001 (0.024)	Loss 3.0118 (2.9320)	Entropy 0.67522 (0.67780)	Top-1 acc 50.781 (53.495)	Top-5 acc 75.000 (76.303)	lr 0.01947
Train [38][1380/3239]	Time 0.233 (0.485)	Data Time 0.001 (0.024)	Loss 2.9532 (2.9328)	Entropy 0.67509 (0.67778)	Top-1 acc 52.734 (53.477)	Top-5 acc 74.609 (76.292)	lr 0.01946
Train [38][1390/3239]	Time 0.235 (0.484)	Data Time 0.001 (0.024)	Loss 2.8615 (2.9326)	Entropy 0.67489 (0.67776)	Top-1 acc 56.641 (53.477)	Top-5 acc 76.562 (76.296)	lr 0.01946
Train [38][1400/3239]	Time 0.235 (0.484)	Data Time 0.001 (0.024)	Loss 2.8773 (2.9321)	Entropy 0.67497 (0.67774)	Top-1 acc 54.688 (53.489)	Top-5 acc 76.172 (76.304)	lr 0.01946
Train [38][1410/3239]	Time 0.229 (0.483)	Data Time 0.001 (0.024)	Loss 2.7727 (2.9324)	Entropy 0.67499 (0.67772)	Top-1 acc 60.547 (53.486)	Top-5 acc 79.297 (76.298)	lr 0.01946
Train [38][1420/3239]	Time 0.233 (0.483)	Data Time 0.001 (0.023)	Loss 3.0315 (2.9331)	Entropy 0.67500 (0.67770)	Top-1 acc 53.516 (53.471)	Top-5 acc 76.172 (76.288)	lr 0.01946
Train [38][1430/3239]	Time 0.236 (0.482)	Data Time 0.001 (0.023)	Loss 3.0031 (2.9337)	Entropy 0.67509 (0.67768)	Top-1 acc 52.734 (53.459)	Top-5 acc 76.562 (76.279)	lr 0.01946
Train [38][1440/3239]	Time 0.262 (0.482)	Data Time 0.003 (0.023)	Loss 2.8429 (2.9339)	Entropy 0.67471 (0.67767)	Top-1 acc 55.469 (53.454)	Top-5 acc 76.562 (76.278)	lr 0.01946
Train [38][1450/3239]	Time 0.224 (0.481)	Data Time 0.001 (0.023)	Loss 3.0573 (2.9345)	Entropy 0.67495 (0.67765)	Top-1 acc 48.828 (53.441)	Top-5 acc 74.609 (76.266)	lr 0.01946
Train [38][1460/3239]	Time 0.236 (0.481)	Data Time 0.001 (0.023)	Loss 3.0137 (2.9348)	Entropy 0.67508 (0.67763)	Top-1 acc 49.219 (53.435)	Top-5 acc 75.781 (76.261)	lr 0.01946
Train [38][1470/3239]	Time 0.235 (0.480)	Data Time 0.001 (0.023)	Loss 2.8899 (2.9344)	Entropy 0.67520 (0.67761)	Top-1 acc 55.469 (53.433)	Top-5 acc 76.562 (76.270)	lr 0.01946
Train [38][1480/3239]	Time 0.222 (0.480)	Data Time 0.001 (0.023)	Loss 2.8551 (2.9344)	Entropy 0.67525 (0.67760)	Top-1 acc 54.688 (53.433)	Top-5 acc 77.734 (76.272)	lr 0.01946
Train [38][1490/3239]	Time 0.238 (0.479)	Data Time 0.001 (0.022)	Loss 3.1048 (2.9344)	Entropy 0.67552 (0.67758)	Top-1 acc 51.172 (53.433)	Top-5 acc 72.656 (76.271)	lr 0.01946
Train [38][1500/3239]	Time 0.227 (0.479)	Data Time 0.001 (0.022)	Loss 2.7181 (2.9343)	Entropy 0.67550 (0.67757)	Top-1 acc 57.422 (53.432)	Top-5 acc 80.469 (76.284)	lr 0.01945
Train [38][1510/3239]	Time 0.326 (0.478)	Data Time 0.001 (0.022)	Loss 3.0403 (2.9339)	Entropy 0.67527 (0.67755)	Top-1 acc 54.297 (53.435)	Top-5 acc 74.219 (76.289)	lr 0.01945
Train [38][1520/3239]	Time 0.229 (0.478)	Data Time 0.001 (0.022)	Loss 2.9785 (2.9341)	Entropy 0.67503 (0.67754)	Top-1 acc 50.781 (53.438)	Top-5 acc 74.609 (76.283)	lr 0.01945
Train [38][1530/3239]	Time 0.239 (0.477)	Data Time 0.001 (0.022)	Loss 2.8843 (2.9340)	Entropy 0.67454 (0.67752)	Top-1 acc 54.297 (53.438)	Top-5 acc 79.688 (76.283)	lr 0.01945
Train [38][1540/3239]	Time 0.260 (0.477)	Data Time 0.001 (0.022)	Loss 2.9433 (2.9340)	Entropy 0.67426 (0.67750)	Top-1 acc 53.906 (53.442)	Top-5 acc 75.391 (76.287)	lr 0.01945
Train [38][1550/3239]	Time 0.229 (0.476)	Data Time 0.001 (0.022)	Loss 3.1584 (2.9338)	Entropy 0.67433 (0.67748)	Top-1 acc 48.828 (53.448)	Top-5 acc 70.703 (76.283)	lr 0.01945
Train [38][1560/3239]	Time 0.233 (0.476)	Data Time 0.001 (0.022)	Loss 2.9699 (2.9341)	Entropy 0.67467 (0.67746)	Top-1 acc 52.734 (53.440)	Top-5 acc 75.000 (76.276)	lr 0.01945
Train [38][1570/3239]	Time 0.228 (0.476)	Data Time 0.001 (0.021)	Loss 2.8477 (2.9344)	Entropy 0.67434 (0.67744)	Top-1 acc 57.422 (53.438)	Top-5 acc 78.125 (76.270)	lr 0.01945
Train [38][1580/3239]	Time 0.304 (0.475)	Data Time 0.001 (0.021)	Loss 2.9251 (2.9346)	Entropy 0.67445 (0.67742)	Top-1 acc 50.781 (53.428)	Top-5 acc 76.953 (76.271)	lr 0.01945
Train [38][1590/3239]	Time 0.233 (0.475)	Data Time 0.001 (0.021)	Loss 2.9005 (2.9344)	Entropy 0.67477 (0.67741)	Top-1 acc 54.297 (53.427)	Top-5 acc 76.562 (76.273)	lr 0.01945
Train [38][1600/3239]	Time 0.224 (0.474)	Data Time 0.001 (0.021)	Loss 2.9298 (2.9342)	Entropy 0.67468 (0.67739)	Top-1 acc 53.125 (53.432)	Top-5 acc 76.953 (76.277)	lr 0.01945
Train [38][1610/3239]	Time 0.252 (0.474)	Data Time 0.001 (0.021)	Loss 2.9937 (2.9345)	Entropy 0.67435 (0.67737)	Top-1 acc 51.172 (53.427)	Top-5 acc 73.047 (76.268)	lr 0.01945
Train [38][1620/3239]	Time 0.226 (0.473)	Data Time 0.001 (0.021)	Loss 2.9768 (2.9344)	Entropy 0.67464 (0.67735)	Top-1 acc 53.125 (53.431)	Top-5 acc 75.391 (76.265)	lr 0.01944
Train [38][1630/3239]	Time 0.226 (0.473)	Data Time 0.001 (0.021)	Loss 3.0236 (2.9347)	Entropy 0.67441 (0.67734)	Top-1 acc 52.734 (53.428)	Top-5 acc 74.609 (76.266)	lr 0.01944
Train [38][1640/3239]	Time 0.226 (0.472)	Data Time 0.001 (0.021)	Loss 2.9060 (2.9348)	Entropy 0.67467 (0.67732)	Top-1 acc 52.734 (53.427)	Top-5 acc 73.828 (76.261)	lr 0.01944
Train [38][1650/3239]	Time 0.258 (0.472)	Data Time 0.001 (0.020)	Loss 2.8383 (2.9348)	Entropy 0.67475 (0.67730)	Top-1 acc 57.031 (53.429)	Top-5 acc 79.688 (76.262)	lr 0.01944
Train [38][1660/3239]	Time 0.228 (0.471)	Data Time 0.001 (0.020)	Loss 2.7870 (2.9346)	Entropy 0.67464 (0.67729)	Top-1 acc 56.250 (53.435)	Top-5 acc 77.734 (76.265)	lr 0.01944
Train [38][1670/3239]	Time 0.319 (0.471)	Data Time 0.001 (0.020)	Loss 2.9712 (2.9345)	Entropy 0.67478 (0.67727)	Top-1 acc 55.078 (53.432)	Top-5 acc 74.219 (76.267)	lr 0.01944
Train [38][1680/3239]	Time 0.229 (0.470)	Data Time 0.001 (0.020)	Loss 3.0724 (2.9345)	Entropy 0.67521 (0.67726)	Top-1 acc 50.000 (53.430)	Top-5 acc 73.438 (76.269)	lr 0.01944
Train [38][1690/3239]	Time 0.230 (0.470)	Data Time 0.001 (0.020)	Loss 2.7667 (2.9347)	Entropy 0.67503 (0.67725)	Top-1 acc 56.250 (53.426)	Top-5 acc 80.859 (76.264)	lr 0.01944
Train [38][1700/3239]	Time 0.220 (0.470)	Data Time 0.001 (0.020)	Loss 2.9790 (2.9347)	Entropy 0.67497 (0.67723)	Top-1 acc 52.344 (53.424)	Top-5 acc 76.172 (76.263)	lr 0.01944
Train [38][1710/3239]	Time 0.225 (0.469)	Data Time 0.001 (0.020)	Loss 2.9425 (2.9344)	Entropy 0.67496 (0.67722)	Top-1 acc 49.609 (53.425)	Top-5 acc 78.906 (76.273)	lr 0.01944
Train [38][1720/3239]	Time 0.221 (0.469)	Data Time 0.001 (0.020)	Loss 2.9872 (2.9345)	Entropy 0.67498 (0.67720)	Top-1 acc 53.906 (53.420)	Top-5 acc 76.562 (76.269)	lr 0.01944
Train [38][1730/3239]	Time 0.224 (0.468)	Data Time 0.001 (0.020)	Loss 2.7272 (2.9346)	Entropy 0.67479 (0.67719)	Top-1 acc 59.766 (53.422)	Top-5 acc 80.859 (76.268)	lr 0.01944
Train [38][1740/3239]	Time 0.325 (0.468)	Data Time 0.001 (0.019)	Loss 3.0333 (2.9346)	Entropy 0.67478 (0.67718)	Top-1 acc 51.562 (53.427)	Top-5 acc 74.609 (76.266)	lr 0.01943
Train [38][1750/3239]	Time 0.227 (0.468)	Data Time 0.001 (0.019)	Loss 2.8561 (2.9346)	Entropy 0.67458 (0.67716)	Top-1 acc 55.078 (53.428)	Top-5 acc 79.297 (76.266)	lr 0.01943
Train [38][1760/3239]	Time 0.241 (0.467)	Data Time 0.001 (0.019)	Loss 2.7005 (2.9350)	Entropy 0.67438 (0.67715)	Top-1 acc 56.250 (53.418)	Top-5 acc 82.422 (76.257)	lr 0.01943
Train [38][1770/3239]	Time 0.226 (0.467)	Data Time 0.001 (0.019)	Loss 2.8409 (2.9351)	Entropy 0.67440 (0.67713)	Top-1 acc 56.641 (53.413)	Top-5 acc 78.516 (76.253)	lr 0.01943
Train [38][1780/3239]	Time 0.239 (0.466)	Data Time 0.001 (0.019)	Loss 2.9262 (2.9349)	Entropy 0.67453 (0.67712)	Top-1 acc 56.250 (53.422)	Top-5 acc 76.172 (76.255)	lr 0.01943
Train [38][1790/3239]	Time 0.233 (0.466)	Data Time 0.001 (0.019)	Loss 2.7265 (2.9346)	Entropy 0.67429 (0.67710)	Top-1 acc 58.203 (53.426)	Top-5 acc 79.688 (76.263)	lr 0.01943
Train [38][1800/3239]	Time 0.236 (0.466)	Data Time 0.001 (0.019)	Loss 2.7931 (2.9344)	Entropy 0.67359 (0.67709)	Top-1 acc 57.422 (53.429)	Top-5 acc 78.516 (76.264)	lr 0.01943
Train [38][1810/3239]	Time 0.231 (0.465)	Data Time 0.001 (0.019)	Loss 2.9161 (2.9345)	Entropy 0.67364 (0.67707)	Top-1 acc 57.031 (53.428)	Top-5 acc 75.391 (76.259)	lr 0.01943
Train [38][1820/3239]	Time 0.229 (0.465)	Data Time 0.001 (0.019)	Loss 2.7994 (2.9347)	Entropy 0.67365 (0.67705)	Top-1 acc 57.031 (53.424)	Top-5 acc 78.516 (76.257)	lr 0.01943
Train [38][1830/3239]	Time 0.249 (0.464)	Data Time 0.001 (0.019)	Loss 3.0673 (2.9346)	Entropy 0.67364 (0.67703)	Top-1 acc 50.781 (53.431)	Top-5 acc 72.656 (76.258)	lr 0.01943
Train [38][1840/3239]	Time 0.222 (0.464)	Data Time 0.001 (0.018)	Loss 2.9866 (2.9345)	Entropy 0.67374 (0.67701)	Top-1 acc 53.125 (53.432)	Top-5 acc 76.172 (76.259)	lr 0.01943
Train [38][1850/3239]	Time 0.230 (0.464)	Data Time 0.001 (0.018)	Loss 2.9271 (2.9344)	Entropy 0.67365 (0.67699)	Top-1 acc 51.562 (53.436)	Top-5 acc 74.219 (76.260)	lr 0.01943
Train [38][1860/3239]	Time 0.226 (0.463)	Data Time 0.001 (0.018)	Loss 2.9825 (2.9349)	Entropy 0.67367 (0.67697)	Top-1 acc 52.344 (53.432)	Top-5 acc 75.000 (76.246)	lr 0.01942
Train [38][1870/3239]	Time 0.226 (0.463)	Data Time 0.001 (0.018)	Loss 3.1487 (2.9346)	Entropy 0.67339 (0.67696)	Top-1 acc 51.172 (53.443)	Top-5 acc 71.484 (76.255)	lr 0.01942
Train [38][1880/3239]	Time 0.245 (0.463)	Data Time 0.001 (0.018)	Loss 2.8923 (2.9346)	Entropy 0.67338 (0.67694)	Top-1 acc 55.859 (53.445)	Top-5 acc 79.688 (76.252)	lr 0.01942
Train [38][1890/3239]	Time 0.225 (0.462)	Data Time 0.001 (0.018)	Loss 2.9521 (2.9350)	Entropy 0.67339 (0.67692)	Top-1 acc 55.859 (53.443)	Top-5 acc 77.734 (76.245)	lr 0.01942
Train [38][1900/3239]	Time 0.324 (0.462)	Data Time 0.001 (0.018)	Loss 3.1116 (2.9349)	Entropy 0.67357 (0.67690)	Top-1 acc 45.703 (53.437)	Top-5 acc 74.609 (76.250)	lr 0.01942
Train [38][1910/3239]	Time 0.235 (0.462)	Data Time 0.001 (0.018)	Loss 2.6611 (2.9346)	Entropy 0.67351 (0.67688)	Top-1 acc 60.547 (53.443)	Top-5 acc 81.641 (76.253)	lr 0.01942
Train [38][1920/3239]	Time 0.307 (0.479)	Data Time 0.005 (0.018)	Loss 3.1386 (2.9346)	Entropy 0.67314 (0.67686)	Top-1 acc 48.438 (53.446)	Top-5 acc 71.875 (76.252)	lr 0.01942
Train [38][1930/3239]	Time 0.241 (0.479)	Data Time 0.002 (0.018)	Loss 2.7930 (2.9347)	Entropy 0.67312 (0.67684)	Top-1 acc 57.031 (53.448)	Top-5 acc 78.906 (76.252)	lr 0.01942
Train [38][1940/3239]	Time 0.231 (0.479)	Data Time 0.001 (0.018)	Loss 3.2494 (2.9349)	Entropy 0.67286 (0.67682)	Top-1 acc 46.875 (53.444)	Top-5 acc 71.875 (76.252)	lr 0.01942
Train [38][1950/3239]	Time 0.265 (0.478)	Data Time 0.002 (0.018)	Loss 2.8625 (2.9345)	Entropy 0.67305 (0.67680)	Top-1 acc 53.906 (53.448)	Top-5 acc 76.172 (76.263)	lr 0.01942
Train [38][1960/3239]	Time 0.234 (0.478)	Data Time 0.001 (0.017)	Loss 2.9418 (2.9347)	Entropy 0.67285 (0.67678)	Top-1 acc 51.172 (53.443)	Top-5 acc 75.391 (76.260)	lr 0.01942
Train [38][1970/3239]	Time 0.237 (0.478)	Data Time 0.001 (0.017)	Loss 2.9017 (2.9346)	Entropy 0.67282 (0.67676)	Top-1 acc 53.906 (53.441)	Top-5 acc 79.297 (76.262)	lr 0.01942
Train [38][1980/3239]	Time 0.237 (0.477)	Data Time 0.001 (0.017)	Loss 2.8214 (2.9345)	Entropy 0.67290 (0.67674)	Top-1 acc 56.641 (53.452)	Top-5 acc 78.516 (76.261)	lr 0.01941
Train [38][1990/3239]	Time 0.292 (0.477)	Data Time 0.001 (0.017)	Loss 2.9030 (2.9348)	Entropy 0.67274 (0.67673)	Top-1 acc 55.469 (53.443)	Top-5 acc 78.906 (76.254)	lr 0.01941
Train [38][2000/3239]	Time 0.239 (0.477)	Data Time 0.001 (0.017)	Loss 2.9110 (2.9351)	Entropy 0.67266 (0.67671)	Top-1 acc 51.172 (53.435)	Top-5 acc 76.953 (76.244)	lr 0.01941
Train [38][2010/3239]	Time 0.230 (0.476)	Data Time 0.001 (0.017)	Loss 2.9887 (2.9353)	Entropy 0.67199 (0.67669)	Top-1 acc 50.000 (53.431)	Top-5 acc 75.391 (76.240)	lr 0.01941
Train [38][2020/3239]	Time 0.218 (0.476)	Data Time 0.001 (0.017)	Loss 2.7015 (2.9348)	Entropy 0.67145 (0.67666)	Top-1 acc 56.641 (53.442)	Top-5 acc 81.250 (76.252)	lr 0.01941
Train [38][2030/3239]	Time 0.231 (0.476)	Data Time 0.001 (0.017)	Loss 3.0752 (2.9348)	Entropy 0.67141 (0.67664)	Top-1 acc 53.125 (53.438)	Top-5 acc 73.047 (76.255)	lr 0.01941
Train [38][2040/3239]	Time 0.245 (0.475)	Data Time 0.001 (0.017)	Loss 3.0739 (2.9348)	Entropy 0.67122 (0.67661)	Top-1 acc 47.656 (53.440)	Top-5 acc 71.875 (76.252)	lr 0.01941
Train [38][2050/3239]	Time 0.239 (0.475)	Data Time 0.001 (0.017)	Loss 2.7881 (2.9346)	Entropy 0.67127 (0.67658)	Top-1 acc 60.547 (53.443)	Top-5 acc 79.688 (76.253)	lr 0.01941
Train [38][2060/3239]	Time 0.327 (0.475)	Data Time 0.001 (0.017)	Loss 2.9485 (2.9345)	Entropy 0.67152 (0.67656)	Top-1 acc 51.953 (53.449)	Top-5 acc 74.609 (76.256)	lr 0.01941
Train [38][2070/3239]	Time 0.227 (0.474)	Data Time 0.001 (0.017)	Loss 3.1870 (2.9345)	Entropy 0.67192 (0.67653)	Top-1 acc 49.609 (53.451)	Top-5 acc 71.875 (76.252)	lr 0.01941
Train [38][2080/3239]	Time 0.226 (0.474)	Data Time 0.001 (0.017)	Loss 2.8133 (2.9346)	Entropy 0.67197 (0.67651)	Top-1 acc 55.859 (53.449)	Top-5 acc 77.734 (76.251)	lr 0.01941
Train [38][2090/3239]	Time 0.231 (0.474)	Data Time 0.001 (0.016)	Loss 2.9701 (2.9346)	Entropy 0.67176 (0.67649)	Top-1 acc 52.734 (53.451)	Top-5 acc 76.172 (76.248)	lr 0.01941
Train [38][2100/3239]	Time 0.235 (0.473)	Data Time 0.001 (0.016)	Loss 2.9593 (2.9347)	Entropy 0.67191 (0.67647)	Top-1 acc 53.125 (53.449)	Top-5 acc 75.781 (76.246)	lr 0.01940
Train [38][2110/3239]	Time 0.229 (0.473)	Data Time 0.001 (0.016)	Loss 2.8915 (2.9348)	Entropy 0.67129 (0.67644)	Top-1 acc 54.688 (53.441)	Top-5 acc 76.172 (76.243)	lr 0.01940
Train [38][2120/3239]	Time 0.226 (0.473)	Data Time 0.001 (0.016)	Loss 2.8851 (2.9345)	Entropy 0.67102 (0.67642)	Top-1 acc 51.953 (53.449)	Top-5 acc 81.250 (76.245)	lr 0.01940
Train [38][2130/3239]	Time 0.327 (0.473)	Data Time 0.001 (0.016)	Loss 2.7185 (2.9345)	Entropy 0.67125 (0.67639)	Top-1 acc 56.641 (53.449)	Top-5 acc 79.688 (76.247)	lr 0.01940
Train [38][2140/3239]	Time 0.224 (0.472)	Data Time 0.001 (0.016)	Loss 3.0050 (2.9345)	Entropy 0.67135 (0.67637)	Top-1 acc 53.125 (53.448)	Top-5 acc 76.953 (76.245)	lr 0.01940
Train [38][2150/3239]	Time 0.231 (0.472)	Data Time 0.001 (0.016)	Loss 2.7519 (2.9345)	Entropy 0.67166 (0.67635)	Top-1 acc 57.422 (53.440)	Top-5 acc 78.516 (76.245)	lr 0.01940
Train [38][2160/3239]	Time 0.222 (0.472)	Data Time 0.001 (0.016)	Loss 2.7768 (2.9344)	Entropy 0.67162 (0.67633)	Top-1 acc 55.078 (53.442)	Top-5 acc 80.078 (76.249)	lr 0.01940
Train [38][2170/3239]	Time 0.226 (0.471)	Data Time 0.001 (0.016)	Loss 2.8415 (2.9346)	Entropy 0.67139 (0.67630)	Top-1 acc 57.422 (53.436)	Top-5 acc 76.562 (76.246)	lr 0.01940
Train [38][2180/3239]	Time 0.233 (0.471)	Data Time 0.001 (0.016)	Loss 2.6977 (2.9348)	Entropy 0.67129 (0.67628)	Top-1 acc 61.328 (53.435)	Top-5 acc 80.078 (76.246)	lr 0.01940
Train [38][2190/3239]	Time 0.230 (0.471)	Data Time 0.001 (0.016)	Loss 2.9830 (2.9347)	Entropy 0.67124 (0.67626)	Top-1 acc 55.078 (53.443)	Top-5 acc 77.344 (76.250)	lr 0.01940
Train [38][2200/3239]	Time 0.298 (0.471)	Data Time 0.001 (0.016)	Loss 2.9522 (2.9344)	Entropy 0.67089 (0.67623)	Top-1 acc 55.078 (53.446)	Top-5 acc 73.828 (76.253)	lr 0.01940
Train [38][2210/3239]	Time 0.221 (0.470)	Data Time 0.001 (0.016)	Loss 2.7744 (2.9346)	Entropy 0.67108 (0.67621)	Top-1 acc 58.594 (53.441)	Top-5 acc 80.859 (76.250)	lr 0.01940
Train [38][2220/3239]	Time 0.332 (0.470)	Data Time 0.001 (0.016)	Loss 2.9743 (2.9348)	Entropy 0.67101 (0.67619)	Top-1 acc 48.047 (53.440)	Top-5 acc 76.172 (76.246)	lr 0.01939
Train [38][2230/3239]	Time 0.244 (0.470)	Data Time 0.001 (0.016)	Loss 3.1267 (2.9349)	Entropy 0.67096 (0.67616)	Top-1 acc 47.656 (53.434)	Top-5 acc 72.266 (76.243)	lr 0.01939
Train [38][2240/3239]	Time 0.234 (0.470)	Data Time 0.001 (0.015)	Loss 2.9478 (2.9349)	Entropy 0.67129 (0.67614)	Top-1 acc 50.000 (53.438)	Top-5 acc 73.828 (76.241)	lr 0.01939
Train [38][2250/3239]	Time 0.233 (0.469)	Data Time 0.001 (0.015)	Loss 2.9605 (2.9352)	Entropy 0.67145 (0.67612)	Top-1 acc 53.125 (53.435)	Top-5 acc 74.609 (76.235)	lr 0.01939
Train [38][2260/3239]	Time 0.252 (0.469)	Data Time 0.001 (0.015)	Loss 2.8672 (2.9353)	Entropy 0.67129 (0.67610)	Top-1 acc 53.516 (53.431)	Top-5 acc 77.734 (76.233)	lr 0.01939
Train [38][2270/3239]	Time 0.247 (0.469)	Data Time 0.001 (0.015)	Loss 3.0506 (2.9354)	Entropy 0.67120 (0.67608)	Top-1 acc 48.047 (53.426)	Top-5 acc 75.781 (76.233)	lr 0.01939
Train [38][2280/3239]	Time 0.234 (0.468)	Data Time 0.001 (0.015)	Loss 2.8158 (2.9354)	Entropy 0.67075 (0.67606)	Top-1 acc 58.203 (53.428)	Top-5 acc 80.469 (76.234)	lr 0.01939
Train [38][2290/3239]	Time 0.310 (0.468)	Data Time 0.001 (0.015)	Loss 3.0241 (2.9354)	Entropy 0.67050 (0.67603)	Top-1 acc 51.953 (53.425)	Top-5 acc 72.266 (76.231)	lr 0.01939
Train [38][2300/3239]	Time 0.237 (0.468)	Data Time 0.001 (0.015)	Loss 2.7240 (2.9353)	Entropy 0.67047 (0.67601)	Top-1 acc 57.422 (53.431)	Top-5 acc 80.469 (76.232)	lr 0.01939
Train [38][2310/3239]	Time 0.231 (0.468)	Data Time 0.001 (0.015)	Loss 3.1318 (2.9352)	Entropy 0.67017 (0.67598)	Top-1 acc 49.609 (53.434)	Top-5 acc 74.219 (76.234)	lr 0.01939
Train [38][2320/3239]	Time 0.235 (0.467)	Data Time 0.001 (0.015)	Loss 2.9592 (2.9352)	Entropy 0.67013 (0.67596)	Top-1 acc 52.734 (53.438)	Top-5 acc 76.562 (76.238)	lr 0.01939
Train [38][2330/3239]	Time 0.233 (0.467)	Data Time 0.001 (0.015)	Loss 2.6790 (2.9351)	Entropy 0.67002 (0.67593)	Top-1 acc 60.938 (53.442)	Top-5 acc 81.250 (76.238)	lr 0.01938
Train [38][2340/3239]	Time 0.225 (0.467)	Data Time 0.001 (0.015)	Loss 2.7146 (2.9351)	Entropy 0.67012 (0.67591)	Top-1 acc 56.641 (53.440)	Top-5 acc 78.516 (76.238)	lr 0.01938
Train [38][2350/3239]	Time 0.227 (0.466)	Data Time 0.001 (0.015)	Loss 2.7572 (2.9352)	Entropy 0.67010 (0.67588)	Top-1 acc 58.203 (53.439)	Top-5 acc 79.688 (76.237)	lr 0.01938
Train [38][2360/3239]	Time 0.235 (0.466)	Data Time 0.001 (0.015)	Loss 2.7346 (2.9351)	Entropy 0.67021 (0.67586)	Top-1 acc 57.031 (53.443)	Top-5 acc 78.125 (76.236)	lr 0.01938
Train [38][2370/3239]	Time 0.233 (0.466)	Data Time 0.001 (0.015)	Loss 2.8473 (2.9350)	Entropy 0.67014 (0.67584)	Top-1 acc 56.250 (53.445)	Top-5 acc 76.172 (76.238)	lr 0.01938
Train [38][2380/3239]	Time 0.288 (0.466)	Data Time 0.001 (0.015)	Loss 2.8355 (2.9349)	Entropy 0.66966 (0.67581)	Top-1 acc 57.422 (53.448)	Top-5 acc 76.172 (76.238)	lr 0.01938
Train [38][2390/3239]	Time 0.256 (0.466)	Data Time 0.001 (0.015)	Loss 2.6941 (2.9349)	Entropy 0.66971 (0.67579)	Top-1 acc 61.719 (53.448)	Top-5 acc 81.250 (76.243)	lr 0.01938
Train [38][2400/3239]	Time 0.222 (0.465)	Data Time 0.001 (0.015)	Loss 2.9248 (2.9348)	Entropy 0.66973 (0.67576)	Top-1 acc 54.297 (53.448)	Top-5 acc 76.953 (76.244)	lr 0.01938
Train [38][2410/3239]	Time 0.258 (0.465)	Data Time 0.001 (0.014)	Loss 3.0344 (2.9349)	Entropy 0.66961 (0.67574)	Top-1 acc 49.219 (53.449)	Top-5 acc 77.344 (76.244)	lr 0.01938
Train [38][2420/3239]	Time 0.235 (0.465)	Data Time 0.001 (0.014)	Loss 2.9523 (2.9347)	Entropy 0.66929 (0.67571)	Top-1 acc 53.906 (53.456)	Top-5 acc 77.734 (76.248)	lr 0.01938
Train [38][2430/3239]	Time 0.236 (0.464)	Data Time 0.001 (0.014)	Loss 2.8392 (2.9347)	Entropy 0.66892 (0.67568)	Top-1 acc 56.250 (53.452)	Top-5 acc 79.297 (76.247)	lr 0.01938
Train [38][2440/3239]	Time 0.231 (0.464)	Data Time 0.001 (0.014)	Loss 2.9393 (2.9347)	Entropy 0.66896 (0.67565)	Top-1 acc 51.562 (53.453)	Top-5 acc 75.000 (76.248)	lr 0.01938
Train [38][2450/3239]	Time 0.340 (0.464)	Data Time 0.001 (0.014)	Loss 2.7788 (2.9347)	Entropy 0.66910 (0.67563)	Top-1 acc 56.250 (53.453)	Top-5 acc 80.078 (76.251)	lr 0.01937
Train [38][2460/3239]	Time 0.267 (0.464)	Data Time 0.001 (0.014)	Loss 2.8325 (2.9345)	Entropy 0.66916 (0.67560)	Top-1 acc 53.906 (53.456)	Top-5 acc 78.516 (76.251)	lr 0.01937
Train [38][2470/3239]	Time 0.233 (0.463)	Data Time 0.001 (0.014)	Loss 3.0450 (2.9345)	Entropy 0.66900 (0.67557)	Top-1 acc 50.391 (53.462)	Top-5 acc 74.609 (76.250)	lr 0.01937
Train [38][2480/3239]	Time 0.234 (0.463)	Data Time 0.001 (0.014)	Loss 2.9813 (2.9346)	Entropy 0.66898 (0.67555)	Top-1 acc 49.609 (53.459)	Top-5 acc 75.000 (76.246)	lr 0.01937
Train [38][2490/3239]	Time 0.224 (0.463)	Data Time 0.001 (0.014)	Loss 2.9150 (2.9345)	Entropy 0.66899 (0.67552)	Top-1 acc 52.734 (53.457)	Top-5 acc 76.953 (76.245)	lr 0.01937
Train [38][2500/3239]	Time 0.232 (0.463)	Data Time 0.001 (0.014)	Loss 2.9290 (2.9347)	Entropy 0.66907 (0.67549)	Top-1 acc 52.734 (53.450)	Top-5 acc 75.391 (76.240)	lr 0.01937
Train [38][2510/3239]	Time 0.220 (0.462)	Data Time 0.001 (0.014)	Loss 2.9261 (2.9347)	Entropy 0.66946 (0.67547)	Top-1 acc 51.562 (53.452)	Top-5 acc 77.344 (76.240)	lr 0.01937
Train [38][2520/3239]	Time 0.317 (0.462)	Data Time 0.001 (0.014)	Loss 2.8514 (2.9348)	Entropy 0.66967 (0.67545)	Top-1 acc 55.078 (53.447)	Top-5 acc 77.734 (76.241)	lr 0.01937
Train [38][2530/3239]	Time 0.235 (0.462)	Data Time 0.001 (0.014)	Loss 2.9451 (2.9350)	Entropy 0.66966 (0.67542)	Top-1 acc 53.125 (53.442)	Top-5 acc 76.172 (76.234)	lr 0.01937
Train [38][2540/3239]	Time 0.228 (0.462)	Data Time 0.001 (0.014)	Loss 2.7845 (2.9346)	Entropy 0.66952 (0.67540)	Top-1 acc 58.203 (53.452)	Top-5 acc 79.297 (76.241)	lr 0.01937
Train [38][2550/3239]	Time 0.229 (0.462)	Data Time 0.002 (0.014)	Loss 3.0320 (2.9348)	Entropy 0.66962 (0.67538)	Top-1 acc 53.516 (53.445)	Top-5 acc 74.609 (76.235)	lr 0.01937
Train [38][2560/3239]	Time 0.229 (0.461)	Data Time 0.001 (0.014)	Loss 2.9665 (2.9346)	Entropy 0.66948 (0.67535)	Top-1 acc 53.125 (53.446)	Top-5 acc 75.391 (76.237)	lr 0.01937
Train [38][2570/3239]	Time 0.259 (0.461)	Data Time 0.001 (0.014)	Loss 2.7399 (2.9345)	Entropy 0.66949 (0.67533)	Top-1 acc 57.031 (53.453)	Top-5 acc 79.297 (76.239)	lr 0.01936
Train [38][2580/3239]	Time 0.377 (0.474)	Data Time 0.002 (0.014)	Loss 2.9087 (2.9347)	Entropy 0.66981 (0.67531)	Top-1 acc 52.734 (53.448)	Top-5 acc 78.125 (76.237)	lr 0.01936
Train [38][2590/3239]	Time 0.235 (0.474)	Data Time 0.002 (0.014)	Loss 2.9401 (2.9348)	Entropy 0.66995 (0.67529)	Top-1 acc 51.953 (53.444)	Top-5 acc 78.516 (76.237)	lr 0.01936
Train [38][2600/3239]	Time 0.233 (0.473)	Data Time 0.001 (0.014)	Loss 2.9826 (2.9351)	Entropy 0.66970 (0.67527)	Top-1 acc 52.734 (53.437)	Top-5 acc 75.000 (76.233)	lr 0.01936
Train [38][2610/3239]	Time 0.348 (0.473)	Data Time 0.002 (0.014)	Loss 2.9573 (2.9352)	Entropy 0.66980 (0.67525)	Top-1 acc 51.172 (53.438)	Top-5 acc 75.391 (76.233)	lr 0.01936
Train [38][2620/3239]	Time 0.243 (0.473)	Data Time 0.001 (0.013)	Loss 2.9914 (2.9353)	Entropy 0.66945 (0.67522)	Top-1 acc 52.734 (53.436)	Top-5 acc 75.000 (76.231)	lr 0.01936
Train [38][2630/3239]	Time 0.237 (0.473)	Data Time 0.001 (0.013)	Loss 2.8851 (2.9356)	Entropy 0.66972 (0.67520)	Top-1 acc 56.250 (53.432)	Top-5 acc 78.516 (76.227)	lr 0.01936
Train [38][2640/3239]	Time 0.247 (0.473)	Data Time 0.001 (0.013)	Loss 2.8174 (2.9353)	Entropy 0.66951 (0.67518)	Top-1 acc 55.078 (53.440)	Top-5 acc 77.734 (76.234)	lr 0.01936
Train [38][2650/3239]	Time 0.237 (0.472)	Data Time 0.002 (0.013)	Loss 2.9402 (2.9353)	Entropy 0.66921 (0.67516)	Top-1 acc 48.828 (53.439)	Top-5 acc 78.516 (76.235)	lr 0.01936
Train [38][2660/3239]	Time 0.239 (0.472)	Data Time 0.002 (0.013)	Loss 3.0841 (2.9355)	Entropy 0.66893 (0.67514)	Top-1 acc 50.391 (53.432)	Top-5 acc 74.609 (76.236)	lr 0.01936
Train [38][2670/3239]	Time 0.236 (0.472)	Data Time 0.002 (0.013)	Loss 2.9200 (2.9354)	Entropy 0.66889 (0.67511)	Top-1 acc 55.078 (53.434)	Top-5 acc 78.125 (76.235)	lr 0.01936
Train [38][2680/3239]	Time 0.328 (0.472)	Data Time 0.002 (0.013)	Loss 3.0517 (2.9355)	Entropy 0.66869 (0.67509)	Top-1 acc 54.297 (53.437)	Top-5 acc 75.000 (76.234)	lr 0.01936
Train [38][2690/3239]	Time 0.230 (0.472)	Data Time 0.002 (0.013)	Loss 2.9408 (2.9355)	Entropy 0.66884 (0.67507)	Top-1 acc 51.953 (53.435)	Top-5 acc 77.734 (76.236)	lr 0.01935
Train [38][2700/3239]	Time 0.237 (0.471)	Data Time 0.001 (0.013)	Loss 3.1624 (2.9355)	Entropy 0.66897 (0.67505)	Top-1 acc 48.438 (53.435)	Top-5 acc 71.484 (76.237)	lr 0.01935
Train [38][2710/3239]	Time 0.235 (0.471)	Data Time 0.001 (0.013)	Loss 2.8967 (2.9356)	Entropy 0.66928 (0.67502)	Top-1 acc 51.172 (53.435)	Top-5 acc 80.859 (76.235)	lr 0.01935
Train [38][2720/3239]	Time 0.226 (0.471)	Data Time 0.001 (0.013)	Loss 2.8659 (2.9357)	Entropy 0.66935 (0.67500)	Top-1 acc 52.734 (53.432)	Top-5 acc 75.781 (76.233)	lr 0.01935
Train [38][2730/3239]	Time 0.223 (0.471)	Data Time 0.001 (0.013)	Loss 2.9674 (2.9356)	Entropy 0.66957 (0.67498)	Top-1 acc 56.250 (53.436)	Top-5 acc 75.391 (76.235)	lr 0.01935
Train [38][2740/3239]	Time 0.237 (0.470)	Data Time 0.001 (0.013)	Loss 2.8060 (2.9356)	Entropy 0.66948 (0.67496)	Top-1 acc 55.469 (53.435)	Top-5 acc 76.953 (76.233)	lr 0.01935
Train [38][2750/3239]	Time 0.235 (0.470)	Data Time 0.001 (0.013)	Loss 3.0631 (2.9355)	Entropy 0.66947 (0.67494)	Top-1 acc 50.781 (53.439)	Top-5 acc 74.609 (76.236)	lr 0.01935
Train [38][2760/3239]	Time 0.226 (0.470)	Data Time 0.001 (0.013)	Loss 3.0011 (2.9357)	Entropy 0.66975 (0.67492)	Top-1 acc 53.516 (53.433)	Top-5 acc 76.953 (76.232)	lr 0.01935
Train [38][2770/3239]	Time 0.363 (0.470)	Data Time 0.001 (0.013)	Loss 2.9541 (2.9356)	Entropy 0.66982 (0.67490)	Top-1 acc 52.344 (53.435)	Top-5 acc 76.172 (76.234)	lr 0.01935
Train [38][2780/3239]	Time 0.222 (0.470)	Data Time 0.001 (0.013)	Loss 2.9653 (2.9355)	Entropy 0.66999 (0.67489)	Top-1 acc 53.516 (53.439)	Top-5 acc 76.562 (76.237)	lr 0.01935
Train [38][2790/3239]	Time 0.228 (0.469)	Data Time 0.001 (0.013)	Loss 3.0120 (2.9353)	Entropy 0.67032 (0.67487)	Top-1 acc 46.875 (53.440)	Top-5 acc 73.047 (76.238)	lr 0.01935
Train [38][2800/3239]	Time 0.227 (0.469)	Data Time 0.001 (0.013)	Loss 3.0610 (2.9353)	Entropy 0.67071 (0.67485)	Top-1 acc 48.438 (53.439)	Top-5 acc 74.219 (76.239)	lr 0.01935
Train [38][2810/3239]	Time 0.235 (0.469)	Data Time 0.001 (0.013)	Loss 2.8754 (2.9355)	Entropy 0.67095 (0.67484)	Top-1 acc 51.172 (53.433)	Top-5 acc 79.297 (76.236)	lr 0.01934
Train [38][2820/3239]	Time 0.251 (0.469)	Data Time 0.001 (0.013)	Loss 3.1338 (2.9356)	Entropy 0.67109 (0.67483)	Top-1 acc 47.266 (53.431)	Top-5 acc 71.484 (76.237)	lr 0.01934
Train [38][2830/3239]	Time 0.233 (0.469)	Data Time 0.001 (0.013)	Loss 2.7989 (2.9354)	Entropy 0.67119 (0.67481)	Top-1 acc 58.203 (53.434)	Top-5 acc 80.078 (76.241)	lr 0.01934
Train [38][2840/3239]	Time 0.328 (0.469)	Data Time 0.001 (0.013)	Loss 2.8184 (2.9355)	Entropy 0.67126 (0.67480)	Top-1 acc 57.812 (53.435)	Top-5 acc 80.078 (76.239)	lr 0.01934
Train [38][2850/3239]	Time 0.225 (0.469)	Data Time 0.001 (0.013)	Loss 3.0772 (2.9357)	Entropy 0.67176 (0.67479)	Top-1 acc 50.391 (53.431)	Top-5 acc 74.609 (76.236)	lr 0.01934
Train [38][2860/3239]	Time 0.254 (0.468)	Data Time 0.001 (0.012)	Loss 2.8756 (2.9357)	Entropy 0.67175 (0.67478)	Top-1 acc 57.422 (53.431)	Top-5 acc 78.125 (76.237)	lr 0.01934
Train [38][2870/3239]	Time 0.233 (0.468)	Data Time 0.001 (0.012)	Loss 2.8095 (2.9357)	Entropy 0.67165 (0.67477)	Top-1 acc 55.859 (53.428)	Top-5 acc 77.734 (76.236)	lr 0.01934
Train [38][2880/3239]	Time 0.234 (0.468)	Data Time 0.001 (0.012)	Loss 3.1164 (2.9358)	Entropy 0.67164 (0.67476)	Top-1 acc 49.609 (53.423)	Top-5 acc 74.219 (76.233)	lr 0.01934
Train [38][2890/3239]	Time 0.253 (0.468)	Data Time 0.001 (0.012)	Loss 3.0653 (2.9362)	Entropy 0.67136 (0.67474)	Top-1 acc 51.172 (53.415)	Top-5 acc 72.266 (76.224)	lr 0.01934
Train [38][2900/3239]	Time 0.232 (0.468)	Data Time 0.001 (0.012)	Loss 3.1624 (2.9360)	Entropy 0.67130 (0.67473)	Top-1 acc 46.094 (53.420)	Top-5 acc 73.438 (76.226)	lr 0.01934
Train [38][2910/3239]	Time 0.218 (0.467)	Data Time 0.001 (0.012)	Loss 2.9235 (2.9360)	Entropy 0.67123 (0.67472)	Top-1 acc 51.562 (53.421)	Top-5 acc 78.125 (76.225)	lr 0.01934
Train [38][2920/3239]	Time 0.231 (0.467)	Data Time 0.001 (0.012)	Loss 2.9333 (2.9361)	Entropy 0.67088 (0.67471)	Top-1 acc 52.344 (53.417)	Top-5 acc 75.391 (76.221)	lr 0.01934
Train [38][2930/3239]	Time 0.328 (0.467)	Data Time 0.001 (0.012)	Loss 3.1259 (2.9363)	Entropy 0.67059 (0.67470)	Top-1 acc 50.781 (53.413)	Top-5 acc 71.875 (76.216)	lr 0.01933
Train [38][2940/3239]	Time 0.235 (0.467)	Data Time 0.001 (0.012)	Loss 2.9593 (2.9363)	Entropy 0.67118 (0.67468)	Top-1 acc 49.219 (53.410)	Top-5 acc 75.781 (76.216)	lr 0.01933
Train [38][2950/3239]	Time 0.233 (0.467)	Data Time 0.001 (0.012)	Loss 3.0577 (2.9363)	Entropy 0.67125 (0.67467)	Top-1 acc 52.344 (53.412)	Top-5 acc 73.438 (76.219)	lr 0.01933
Train [38][2960/3239]	Time 0.226 (0.466)	Data Time 0.001 (0.012)	Loss 3.1149 (2.9364)	Entropy 0.67106 (0.67466)	Top-1 acc 47.656 (53.407)	Top-5 acc 71.484 (76.214)	lr 0.01933
Train [38][2970/3239]	Time 0.232 (0.466)	Data Time 0.001 (0.012)	Loss 2.9818 (2.9363)	Entropy 0.67126 (0.67465)	Top-1 acc 54.297 (53.411)	Top-5 acc 73.047 (76.215)	lr 0.01933
Train [38][2980/3239]	Time 0.250 (0.466)	Data Time 0.001 (0.012)	Loss 2.8906 (2.9363)	Entropy 0.67114 (0.67464)	Top-1 acc 55.859 (53.408)	Top-5 acc 78.516 (76.217)	lr 0.01933
Train [38][2990/3239]	Time 0.232 (0.466)	Data Time 0.001 (0.012)	Loss 3.0860 (2.9364)	Entropy 0.67117 (0.67462)	Top-1 acc 53.516 (53.407)	Top-5 acc 69.531 (76.215)	lr 0.01933
Train [38][3000/3239]	Time 0.430 (0.466)	Data Time 0.001 (0.012)	Loss 2.8138 (2.9364)	Entropy 0.67115 (0.67461)	Top-1 acc 60.156 (53.408)	Top-5 acc 81.641 (76.215)	lr 0.01933
Train [38][3010/3239]	Time 0.233 (0.466)	Data Time 0.001 (0.012)	Loss 2.8865 (2.9364)	Entropy 0.67137 (0.67460)	Top-1 acc 55.078 (53.406)	Top-5 acc 78.125 (76.218)	lr 0.01933
Train [38][3020/3239]	Time 0.257 (0.466)	Data Time 0.001 (0.012)	Loss 2.9991 (2.9364)	Entropy 0.67158 (0.67459)	Top-1 acc 51.172 (53.408)	Top-5 acc 75.391 (76.215)	lr 0.01933
Train [38][3030/3239]	Time 0.237 (0.465)	Data Time 0.001 (0.012)	Loss 2.9175 (2.9365)	Entropy 0.67176 (0.67458)	Top-1 acc 55.469 (53.407)	Top-5 acc 77.344 (76.213)	lr 0.01933
Train [38][3040/3239]	Time 0.236 (0.465)	Data Time 0.001 (0.012)	Loss 2.8684 (2.9363)	Entropy 0.67164 (0.67457)	Top-1 acc 53.125 (53.411)	Top-5 acc 75.000 (76.216)	lr 0.01932
Train [38][3050/3239]	Time 0.222 (0.465)	Data Time 0.001 (0.012)	Loss 2.8262 (2.9363)	Entropy 0.67139 (0.67456)	Top-1 acc 53.906 (53.409)	Top-5 acc 79.297 (76.215)	lr 0.01932
Train [38][3060/3239]	Time 0.231 (0.465)	Data Time 0.001 (0.012)	Loss 3.0895 (2.9363)	Entropy 0.67163 (0.67455)	Top-1 acc 46.094 (53.405)	Top-5 acc 75.000 (76.216)	lr 0.01932
Train [38][3070/3239]	Time 0.237 (0.465)	Data Time 0.001 (0.012)	Loss 3.0442 (2.9360)	Entropy 0.67159 (0.67454)	Top-1 acc 51.562 (53.412)	Top-5 acc 76.953 (76.223)	lr 0.01932
Train [38][3080/3239]	Time 0.232 (0.465)	Data Time 0.001 (0.012)	Loss 2.8351 (2.9361)	Entropy 0.67142 (0.67453)	Top-1 acc 55.078 (53.409)	Top-5 acc 78.125 (76.220)	lr 0.01932
Train [38][3090/3239]	Time 0.225 (0.464)	Data Time 0.001 (0.012)	Loss 2.8747 (2.9363)	Entropy 0.67130 (0.67452)	Top-1 acc 53.125 (53.404)	Top-5 acc 72.656 (76.212)	lr 0.01932
Train [38][3100/3239]	Time 0.241 (0.464)	Data Time 0.001 (0.012)	Loss 2.9895 (2.9364)	Entropy 0.67093 (0.67451)	Top-1 acc 54.297 (53.404)	Top-5 acc 76.172 (76.213)	lr 0.01932
Train [38][3110/3239]	Time 0.243 (0.464)	Data Time 0.002 (0.012)	Loss 2.7429 (2.9362)	Entropy 0.67086 (0.67450)	Top-1 acc 57.422 (53.410)	Top-5 acc 77.344 (76.214)	lr 0.01932
Train [38][3120/3239]	Time 0.236 (0.464)	Data Time 0.001 (0.012)	Loss 3.1186 (2.9362)	Entropy 0.67066 (0.67449)	Top-1 acc 50.391 (53.410)	Top-5 acc 72.656 (76.216)	lr 0.01932
Train [38][3130/3239]	Time 0.227 (0.464)	Data Time 0.001 (0.012)	Loss 3.0285 (2.9363)	Entropy 0.67088 (0.67448)	Top-1 acc 52.344 (53.407)	Top-5 acc 76.562 (76.213)	lr 0.01932
Train [38][3140/3239]	Time 0.228 (0.464)	Data Time 0.001 (0.012)	Loss 2.9646 (2.9362)	Entropy 0.67107 (0.67446)	Top-1 acc 50.000 (53.407)	Top-5 acc 78.516 (76.215)	lr 0.01932
Train [38][3150/3239]	Time 0.286 (0.464)	Data Time 0.002 (0.012)	Loss 2.9827 (2.9362)	Entropy 0.67077 (0.67445)	Top-1 acc 53.906 (53.406)	Top-5 acc 73.438 (76.213)	lr 0.01932
Train [38][3160/3239]	Time 0.376 (0.464)	Data Time 0.001 (0.011)	Loss 2.9060 (2.9360)	Entropy 0.67080 (0.67444)	Top-1 acc 52.344 (53.407)	Top-5 acc 77.734 (76.217)	lr 0.01931
Train [38][3170/3239]	Time 0.235 (0.463)	Data Time 0.001 (0.011)	Loss 2.9045 (2.9360)	Entropy 0.67093 (0.67443)	Top-1 acc 54.688 (53.410)	Top-5 acc 76.953 (76.219)	lr 0.01931
Train [38][3180/3239]	Time 0.239 (0.463)	Data Time 0.000 (0.011)	Loss 2.7554 (2.9359)	Entropy 0.67103 (0.67442)	Top-1 acc 57.031 (53.409)	Top-5 acc 78.906 (76.220)	lr 0.01931
Train [38][3190/3239]	Time 0.231 (0.463)	Data Time 0.000 (0.011)	Loss 2.9170 (2.9361)	Entropy 0.67100 (0.67441)	Top-1 acc 52.734 (53.403)	Top-5 acc 73.828 (76.217)	lr 0.01931
Train [38][3200/3239]	Time 0.221 (0.463)	Data Time 0.000 (0.011)	Loss 2.7940 (2.9362)	Entropy 0.67125 (0.67440)	Top-1 acc 56.250 (53.398)	Top-5 acc 80.078 (76.215)	lr 0.01931
Train [38][3210/3239]	Time 0.217 (0.463)	Data Time 0.000 (0.011)	Loss 3.0614 (2.9362)	Entropy 0.67088 (0.67439)	Top-1 acc 48.047 (53.398)	Top-5 acc 71.875 (76.215)	lr 0.01931
Train [38][3220/3239]	Time 0.229 (0.462)	Data Time 0.000 (0.011)	Loss 3.0705 (2.9362)	Entropy 0.67100 (0.67438)	Top-1 acc 54.297 (53.399)	Top-5 acc 72.656 (76.215)	lr 0.01931
Train [38][3230/3239]	Time 0.410 (0.472)	Data Time 0.000 (0.011)	Loss 2.8451 (2.9361)	Entropy 0.67128 (0.67437)	Top-1 acc 55.078 (53.401)	Top-5 acc 76.562 (76.217)	lr 0.01931
Train [38][3239/3239]	Time 0.952 (0.472)	Data Time 0.000 (0.011)	Loss 3.3076 (2.9363)	Entropy 0.67143 (0.67436)	Top-1 acc 40.741 (53.396)	Top-5 acc 67.901 (76.212)	lr 0.01931
==========Valid [38/120]	loss 1.654	top-1 acc 62.825 (62.825)	top-5 acc 83.816	Train top-1 53.396	top-5 76.212	Entropy 0.67143	Latency-None: 0.000ms	Flops: 539.76M
Train [39][0/3239]	Time 33.409 (33.409)	Data Time 32.439 (32.439)	Loss 2.8564 (2.8564)	Entropy 0.67143 (0.67143)	Top-1 acc 56.250 (56.250)	Top-5 acc 78.125 (78.125)	lr 0.01931
Train [39][10/3239]	Time 0.275 (3.579)	Data Time 0.001 (2.951)	Loss 2.9526 (2.9065)	Entropy 0.67147 (0.67140)	Top-1 acc 55.469 (54.439)	Top-5 acc 77.344 (77.202)	lr 0.01931
Train [39][20/3239]	Time 0.223 (2.080)	Data Time 0.001 (1.546)	Loss 2.9660 (2.9644)	Entropy 0.67130 (0.67133)	Top-1 acc 53.516 (53.051)	Top-5 acc 73.438 (75.465)	lr 0.01931
Train [39][30/3239]	Time 0.283 (1.567)	Data Time 0.001 (1.048)	Loss 2.9050 (2.9282)	Entropy 0.67107 (0.67133)	Top-1 acc 51.953 (53.717)	Top-5 acc 76.953 (76.273)	lr 0.01931
Train [39][40/3239]	Time 0.283 (1.315)	Data Time 0.001 (0.793)	Loss 2.8296 (2.9236)	Entropy 0.67116 (0.67128)	Top-1 acc 55.078 (53.887)	Top-5 acc 77.734 (76.439)	lr 0.01930
Train [39][50/3239]	Time 0.230 (1.153)	Data Time 0.001 (0.638)	Loss 3.0938 (2.9109)	Entropy 0.67165 (0.67128)	Top-1 acc 48.828 (54.220)	Top-5 acc 74.609 (76.815)	lr 0.01930
Train [39][60/3239]	Time 0.328 (1.032)	Data Time 0.001 (0.534)	Loss 2.8142 (2.9232)	Entropy 0.67182 (0.67136)	Top-1 acc 55.859 (53.957)	Top-5 acc 77.344 (76.684)	lr 0.01930
Train [39][70/3239]	Time 0.233 (0.947)	Data Time 0.001 (0.459)	Loss 2.8241 (2.9138)	Entropy 0.67194 (0.67142)	Top-1 acc 57.031 (54.104)	Top-5 acc 78.906 (76.849)	lr 0.01930
Train [39][80/3239]	Time 0.230 (0.881)	Data Time 0.001 (0.402)	Loss 3.0431 (2.9050)	Entropy 0.67170 (0.67148)	Top-1 acc 53.125 (54.302)	Top-5 acc 75.000 (76.953)	lr 0.01930
Train [39][90/3239]	Time 0.235 (0.833)	Data Time 0.001 (0.358)	Loss 3.0026 (2.9115)	Entropy 0.67141 (0.67150)	Top-1 acc 50.391 (54.087)	Top-5 acc 76.562 (76.867)	lr 0.01930
Train [39][100/3239]	Time 0.255 (0.793)	Data Time 0.001 (0.323)	Loss 2.8461 (2.9147)	Entropy 0.67154 (0.67149)	Top-1 acc 52.344 (54.018)	Top-5 acc 77.344 (76.771)	lr 0.01930
Train [39][110/3239]	Time 0.254 (0.764)	Data Time 0.001 (0.294)	Loss 2.9661 (2.9129)	Entropy 0.67136 (0.67149)	Top-1 acc 51.562 (53.970)	Top-5 acc 76.172 (76.819)	lr 0.01930
Train [39][120/3239]	Time 0.236 (0.737)	Data Time 0.001 (0.270)	Loss 2.8723 (2.9128)	Entropy 0.67084 (0.67146)	Top-1 acc 57.422 (53.945)	Top-5 acc 78.906 (76.798)	lr 0.01930
Train [39][130/3239]	Time 0.237 (0.713)	Data Time 0.001 (0.249)	Loss 2.9206 (2.9161)	Entropy 0.67071 (0.67140)	Top-1 acc 55.469 (53.844)	Top-5 acc 76.172 (76.652)	lr 0.01930
Train [39][140/3239]	Time 0.238 (0.694)	Data Time 0.002 (0.232)	Loss 3.1486 (2.9153)	Entropy 0.67061 (0.67135)	Top-1 acc 47.656 (53.870)	Top-5 acc 71.484 (76.659)	lr 0.01930
Train [39][150/3239]	Time 0.266 (0.680)	Data Time 0.001 (0.217)	Loss 2.9672 (2.9137)	Entropy 0.67061 (0.67129)	Top-1 acc 51.562 (53.917)	Top-5 acc 74.609 (76.715)	lr 0.01930
Train [39][160/3239]	Time 0.249 (0.663)	Data Time 0.001 (0.203)	Loss 2.5322 (2.9135)	Entropy 0.67052 (0.67125)	Top-1 acc 61.719 (53.977)	Top-5 acc 83.984 (76.701)	lr 0.01929
Train [39][170/3239]	Time 0.231 (0.649)	Data Time 0.001 (0.191)	Loss 2.7290 (2.9123)	Entropy 0.67062 (0.67121)	Top-1 acc 57.812 (54.036)	Top-5 acc 79.688 (76.704)	lr 0.01929
Train [39][180/3239]	Time 0.241 (0.638)	Data Time 0.001 (0.181)	Loss 3.1118 (2.9119)	Entropy 0.67076 (0.67118)	Top-1 acc 51.172 (54.027)	Top-5 acc 74.219 (76.724)	lr 0.01929
Train [39][190/3239]	Time 0.234 (0.627)	Data Time 0.001 (0.172)	Loss 2.7093 (2.9133)	Entropy 0.67052 (0.67116)	Top-1 acc 58.203 (54.033)	Top-5 acc 78.906 (76.673)	lr 0.01929
Train [39][200/3239]	Time 0.239 (0.617)	Data Time 0.001 (0.163)	Loss 2.8813 (2.9147)	Entropy 0.67043 (0.67113)	Top-1 acc 51.172 (54.025)	Top-5 acc 78.125 (76.634)	lr 0.01929
Train [39][210/3239]	Time 0.256 (0.607)	Data Time 0.001 (0.155)	Loss 2.9934 (2.9142)	Entropy 0.67040 (0.67110)	Top-1 acc 50.000 (54.004)	Top-5 acc 74.609 (76.633)	lr 0.01929
Train [39][220/3239]	Time 0.331 (0.599)	Data Time 0.001 (0.148)	Loss 2.7894 (2.9160)	Entropy 0.67060 (0.67107)	Top-1 acc 53.906 (53.936)	Top-5 acc 76.172 (76.630)	lr 0.01929
Train [39][230/3239]	Time 0.229 (0.592)	Data Time 0.001 (0.142)	Loss 3.0553 (2.9165)	Entropy 0.67039 (0.67105)	Top-1 acc 54.297 (53.891)	Top-5 acc 75.781 (76.615)	lr 0.01929
Train [39][240/3239]	Time 0.240 (0.585)	Data Time 0.001 (0.136)	Loss 2.8386 (2.9155)	Entropy 0.67006 (0.67102)	Top-1 acc 52.734 (53.885)	Top-5 acc 77.734 (76.650)	lr 0.01929
Train [39][250/3239]	Time 0.235 (0.579)	Data Time 0.001 (0.131)	Loss 2.7126 (2.9147)	Entropy 0.66997 (0.67098)	Top-1 acc 60.547 (53.931)	Top-5 acc 78.906 (76.661)	lr 0.01929
Train [39][260/3239]	Time 0.236 (0.573)	Data Time 0.001 (0.126)	Loss 2.7865 (2.9153)	Entropy 0.66985 (0.67094)	Top-1 acc 53.125 (53.887)	Top-5 acc 76.953 (76.601)	lr 0.01929
Train [39][270/3239]	Time 0.231 (0.568)	Data Time 0.001 (0.121)	Loss 2.8438 (2.9159)	Entropy 0.66987 (0.67090)	Top-1 acc 56.250 (53.877)	Top-5 acc 78.906 (76.590)	lr 0.01929
Train [39][280/3239]	Time 0.237 (0.563)	Data Time 0.001 (0.117)	Loss 2.9342 (2.9160)	Entropy 0.66966 (0.67086)	Top-1 acc 51.172 (53.878)	Top-5 acc 74.219 (76.578)	lr 0.01928
Train [39][290/3239]	Time 0.339 (0.559)	Data Time 0.001 (0.113)	Loss 3.0256 (2.9157)	Entropy 0.66964 (0.67082)	Top-1 acc 48.828 (53.910)	Top-5 acc 74.609 (76.604)	lr 0.01928
Train [39][300/3239]	Time 0.238 (0.555)	Data Time 0.001 (0.110)	Loss 2.8481 (2.9168)	Entropy 0.66978 (0.67078)	Top-1 acc 54.297 (53.882)	Top-5 acc 75.391 (76.553)	lr 0.01928
Train [39][310/3239]	Time 0.276 (0.551)	Data Time 0.001 (0.106)	Loss 2.9110 (2.9177)	Entropy 0.66972 (0.67075)	Top-1 acc 54.297 (53.876)	Top-5 acc 76.953 (76.524)	lr 0.01928
Train [39][320/3239]	Time 0.287 (0.548)	Data Time 0.001 (0.103)	Loss 2.9257 (2.9162)	Entropy 0.66948 (0.67071)	Top-1 acc 56.641 (53.894)	Top-5 acc 77.344 (76.552)	lr 0.01928
Train [39][330/3239]	Time 0.245 (0.544)	Data Time 0.001 (0.100)	Loss 3.0738 (2.9202)	Entropy 0.66926 (0.67067)	Top-1 acc 50.391 (53.800)	Top-5 acc 75.781 (76.494)	lr 0.01928
Train [39][340/3239]	Time 0.224 (0.541)	Data Time 0.001 (0.097)	Loss 3.0088 (2.9201)	Entropy 0.66912 (0.67063)	Top-1 acc 49.609 (53.795)	Top-5 acc 76.562 (76.510)	lr 0.01928
Train [39][350/3239]	Time 0.223 (0.538)	Data Time 0.001 (0.094)	Loss 3.0282 (2.9205)	Entropy 0.66887 (0.67058)	Top-1 acc 53.125 (53.788)	Top-5 acc 74.609 (76.512)	lr 0.01928
Train [39][360/3239]	Time 0.282 (0.535)	Data Time 0.001 (0.092)	Loss 2.9702 (2.9197)	Entropy 0.66858 (0.67053)	Top-1 acc 53.125 (53.818)	Top-5 acc 74.219 (76.529)	lr 0.01928
Train [39][370/3239]	Time 0.273 (0.532)	Data Time 0.001 (0.089)	Loss 3.0899 (2.9216)	Entropy 0.66859 (0.67048)	Top-1 acc 49.609 (53.767)	Top-5 acc 71.094 (76.448)	lr 0.01928
Train [39][380/3239]	Time 0.432 (0.529)	Data Time 0.005 (0.087)	Loss 2.7605 (2.9214)	Entropy 0.66856 (0.67043)	Top-1 acc 55.859 (53.760)	Top-5 acc 78.516 (76.467)	lr 0.01928
Train [39][390/3239]	Time 0.298 (0.528)	Data Time 0.002 (0.085)	Loss 2.8918 (2.9206)	Entropy 0.66845 (0.67038)	Top-1 acc 53.516 (53.784)	Top-5 acc 77.344 (76.504)	lr 0.01927
Train [39][400/3239]	Time 0.253 (0.526)	Data Time 0.001 (0.083)	Loss 3.0935 (2.9201)	Entropy 0.66810 (0.67033)	Top-1 acc 48.438 (53.790)	Top-5 acc 75.000 (76.537)	lr 0.01927
Train [39][410/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.081)	Loss 2.6585 (2.9192)	Entropy 0.66824 (0.67028)	Top-1 acc 60.938 (53.807)	Top-5 acc 78.516 (76.553)	lr 0.01927
Train [39][420/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.079)	Loss 2.9408 (2.9198)	Entropy 0.66838 (0.67023)	Top-1 acc 51.953 (53.788)	Top-5 acc 76.562 (76.520)	lr 0.01927
Train [39][430/3239]	Time 0.279 (0.519)	Data Time 0.002 (0.077)	Loss 2.9289 (2.9193)	Entropy 0.66815 (0.67018)	Top-1 acc 52.734 (53.776)	Top-5 acc 76.562 (76.536)	lr 0.01927
Train [39][440/3239]	Time 0.244 (0.517)	Data Time 0.001 (0.075)	Loss 2.8976 (2.9184)	Entropy 0.66772 (0.67013)	Top-1 acc 53.516 (53.811)	Top-5 acc 76.953 (76.548)	lr 0.01927
Train [39][450/3239]	Time 0.332 (0.515)	Data Time 0.001 (0.074)	Loss 2.9982 (2.9186)	Entropy 0.66764 (0.67008)	Top-1 acc 49.609 (53.827)	Top-5 acc 75.391 (76.559)	lr 0.01927
Train [39][460/3239]	Time 0.242 (0.513)	Data Time 0.001 (0.072)	Loss 2.8933 (2.9188)	Entropy 0.66760 (0.67003)	Top-1 acc 53.516 (53.824)	Top-5 acc 78.125 (76.535)	lr 0.01927
Train [39][470/3239]	Time 0.231 (0.510)	Data Time 0.001 (0.071)	Loss 2.9958 (2.9184)	Entropy 0.66743 (0.66998)	Top-1 acc 52.344 (53.827)	Top-5 acc 73.828 (76.545)	lr 0.01927
Train [39][480/3239]	Time 0.239 (0.509)	Data Time 0.001 (0.069)	Loss 2.8266 (2.9173)	Entropy 0.66686 (0.66992)	Top-1 acc 57.422 (53.853)	Top-5 acc 78.516 (76.559)	lr 0.01927
Train [39][490/3239]	Time 0.236 (0.507)	Data Time 0.001 (0.068)	Loss 2.9254 (2.9168)	Entropy 0.66679 (0.66986)	Top-1 acc 54.688 (53.869)	Top-5 acc 75.781 (76.568)	lr 0.01927
Train [39][500/3239]	Time 0.234 (0.505)	Data Time 0.001 (0.067)	Loss 2.5546 (2.9146)	Entropy 0.66676 (0.66980)	Top-1 acc 64.062 (53.922)	Top-5 acc 83.203 (76.615)	lr 0.01927
Train [39][510/3239]	Time 0.248 (0.504)	Data Time 0.001 (0.065)	Loss 2.8827 (2.9150)	Entropy 0.66686 (0.66974)	Top-1 acc 55.859 (53.912)	Top-5 acc 76.953 (76.607)	lr 0.01926
Train [39][520/3239]	Time 0.241 (0.503)	Data Time 0.001 (0.064)	Loss 2.6632 (2.9153)	Entropy 0.66725 (0.66969)	Top-1 acc 60.156 (53.926)	Top-5 acc 80.078 (76.601)	lr 0.01926
Train [39][530/3239]	Time 0.253 (0.501)	Data Time 0.001 (0.063)	Loss 2.8122 (2.9148)	Entropy 0.66737 (0.66964)	Top-1 acc 57.812 (53.949)	Top-5 acc 78.125 (76.610)	lr 0.01926
Train [39][540/3239]	Time 0.380 (0.501)	Data Time 0.001 (0.062)	Loss 2.8609 (2.9145)	Entropy 0.66755 (0.66960)	Top-1 acc 56.250 (53.950)	Top-5 acc 76.172 (76.610)	lr 0.01926
Train [39][550/3239]	Time 0.236 (0.499)	Data Time 0.001 (0.061)	Loss 2.9014 (2.9151)	Entropy 0.66758 (0.66957)	Top-1 acc 55.078 (53.928)	Top-5 acc 75.000 (76.612)	lr 0.01926
Train [39][560/3239]	Time 0.216 (0.498)	Data Time 0.001 (0.060)	Loss 2.9017 (2.9146)	Entropy 0.66775 (0.66953)	Top-1 acc 56.250 (53.945)	Top-5 acc 79.688 (76.615)	lr 0.01926
Train [39][570/3239]	Time 0.235 (0.496)	Data Time 0.001 (0.059)	Loss 2.9363 (2.9146)	Entropy 0.66751 (0.66950)	Top-1 acc 54.688 (53.947)	Top-5 acc 76.562 (76.613)	lr 0.01926
Train [39][580/3239]	Time 0.236 (0.495)	Data Time 0.001 (0.058)	Loss 2.9691 (2.9155)	Entropy 0.66746 (0.66947)	Top-1 acc 52.344 (53.931)	Top-5 acc 74.609 (76.595)	lr 0.01926
Train [39][590/3239]	Time 0.227 (0.494)	Data Time 0.001 (0.057)	Loss 2.8050 (2.9159)	Entropy 0.66754 (0.66943)	Top-1 acc 57.031 (53.902)	Top-5 acc 79.688 (76.595)	lr 0.01926
Train [39][600/3239]	Time 0.230 (0.493)	Data Time 0.001 (0.056)	Loss 2.9475 (2.9158)	Entropy 0.66783 (0.66940)	Top-1 acc 54.297 (53.885)	Top-5 acc 75.781 (76.592)	lr 0.01926
Train [39][610/3239]	Time 0.318 (0.492)	Data Time 0.001 (0.055)	Loss 3.0743 (2.9162)	Entropy 0.66769 (0.66938)	Top-1 acc 51.172 (53.870)	Top-5 acc 73.047 (76.589)	lr 0.01926
Train [39][620/3239]	Time 0.228 (0.490)	Data Time 0.001 (0.054)	Loss 3.1143 (2.9171)	Entropy 0.66773 (0.66935)	Top-1 acc 47.656 (53.841)	Top-5 acc 72.656 (76.565)	lr 0.01926
Train [39][630/3239]	Time 0.228 (0.489)	Data Time 0.001 (0.053)	Loss 3.0437 (2.9170)	Entropy 0.66788 (0.66932)	Top-1 acc 54.297 (53.847)	Top-5 acc 71.094 (76.571)	lr 0.01925
Train [39][640/3239]	Time 0.238 (0.488)	Data Time 0.001 (0.052)	Loss 2.7249 (2.9160)	Entropy 0.66749 (0.66930)	Top-1 acc 57.031 (53.879)	Top-5 acc 81.641 (76.584)	lr 0.01925
Train [39][650/3239]	Time 0.297 (0.533)	Data Time 0.002 (0.052)	Loss 2.6603 (2.9158)	Entropy 0.66761 (0.66927)	Top-1 acc 62.891 (53.892)	Top-5 acc 81.250 (76.596)	lr 0.01925
Train [39][660/3239]	Time 0.288 (0.534)	Data Time 0.002 (0.051)	Loss 2.8881 (2.9164)	Entropy 0.66729 (0.66925)	Top-1 acc 53.125 (53.878)	Top-5 acc 73.828 (76.574)	lr 0.01925
Train [39][670/3239]	Time 0.236 (0.533)	Data Time 0.001 (0.050)	Loss 3.0694 (2.9163)	Entropy 0.66705 (0.66922)	Top-1 acc 48.438 (53.875)	Top-5 acc 72.656 (76.572)	lr 0.01925
Train [39][680/3239]	Time 0.269 (0.531)	Data Time 0.001 (0.049)	Loss 2.9148 (2.9162)	Entropy 0.66755 (0.66919)	Top-1 acc 53.516 (53.867)	Top-5 acc 76.953 (76.569)	lr 0.01925
Train [39][690/3239]	Time 0.234 (0.530)	Data Time 0.001 (0.049)	Loss 2.9680 (2.9168)	Entropy 0.66714 (0.66916)	Top-1 acc 50.391 (53.842)	Top-5 acc 76.172 (76.560)	lr 0.01925
Train [39][700/3239]	Time 0.321 (0.528)	Data Time 0.002 (0.048)	Loss 3.2516 (2.9175)	Entropy 0.66702 (0.66913)	Top-1 acc 47.266 (53.829)	Top-5 acc 73.438 (76.545)	lr 0.01925
Train [39][710/3239]	Time 0.266 (0.527)	Data Time 0.001 (0.047)	Loss 2.9115 (2.9174)	Entropy 0.66695 (0.66910)	Top-1 acc 51.562 (53.817)	Top-5 acc 75.781 (76.550)	lr 0.01925
Train [39][720/3239]	Time 0.254 (0.526)	Data Time 0.002 (0.047)	Loss 2.9979 (2.9175)	Entropy 0.66692 (0.66907)	Top-1 acc 51.562 (53.816)	Top-5 acc 76.953 (76.542)	lr 0.01925
Train [39][730/3239]	Time 0.264 (0.526)	Data Time 0.001 (0.046)	Loss 3.1320 (2.9167)	Entropy 0.66673 (0.66904)	Top-1 acc 49.609 (53.834)	Top-5 acc 71.875 (76.557)	lr 0.01925
Train [39][740/3239]	Time 0.257 (0.525)	Data Time 0.002 (0.046)	Loss 2.7657 (2.9164)	Entropy 0.66686 (0.66901)	Top-1 acc 58.203 (53.828)	Top-5 acc 80.859 (76.561)	lr 0.01925
Train [39][750/3239]	Time 0.248 (0.524)	Data Time 0.001 (0.045)	Loss 2.7793 (2.9159)	Entropy 0.66687 (0.66898)	Top-1 acc 56.641 (53.828)	Top-5 acc 80.078 (76.579)	lr 0.01924
Train [39][760/3239]	Time 0.248 (0.523)	Data Time 0.002 (0.044)	Loss 2.8373 (2.9147)	Entropy 0.66687 (0.66895)	Top-1 acc 54.688 (53.868)	Top-5 acc 78.906 (76.600)	lr 0.01924
Train [39][770/3239]	Time 0.355 (0.522)	Data Time 0.001 (0.044)	Loss 3.1162 (2.9143)	Entropy 0.66671 (0.66892)	Top-1 acc 47.266 (53.888)	Top-5 acc 70.703 (76.604)	lr 0.01924
Train [39][780/3239]	Time 0.271 (0.522)	Data Time 0.002 (0.043)	Loss 2.8193 (2.9141)	Entropy 0.66674 (0.66890)	Top-1 acc 53.906 (53.892)	Top-5 acc 76.953 (76.602)	lr 0.01924
Train [39][790/3239]	Time 0.279 (0.521)	Data Time 0.002 (0.043)	Loss 2.8581 (2.9141)	Entropy 0.66684 (0.66887)	Top-1 acc 58.594 (53.894)	Top-5 acc 77.734 (76.597)	lr 0.01924
Train [39][800/3239]	Time 0.231 (0.521)	Data Time 0.001 (0.042)	Loss 2.8975 (2.9147)	Entropy 0.66682 (0.66884)	Top-1 acc 53.125 (53.894)	Top-5 acc 76.562 (76.595)	lr 0.01924
Train [39][810/3239]	Time 0.245 (0.519)	Data Time 0.001 (0.042)	Loss 2.9108 (2.9149)	Entropy 0.66735 (0.66882)	Top-1 acc 53.516 (53.885)	Top-5 acc 78.906 (76.598)	lr 0.01924
Train [39][820/3239]	Time 0.226 (0.518)	Data Time 0.001 (0.041)	Loss 2.9171 (2.9157)	Entropy 0.66726 (0.66880)	Top-1 acc 53.125 (53.870)	Top-5 acc 75.391 (76.575)	lr 0.01924
Train [39][830/3239]	Time 0.248 (0.517)	Data Time 0.002 (0.041)	Loss 3.0596 (2.9162)	Entropy 0.66709 (0.66878)	Top-1 acc 53.906 (53.859)	Top-5 acc 75.781 (76.570)	lr 0.01924
Train [39][840/3239]	Time 0.248 (0.517)	Data Time 0.002 (0.040)	Loss 2.9235 (2.9160)	Entropy 0.66711 (0.66876)	Top-1 acc 53.906 (53.869)	Top-5 acc 77.344 (76.581)	lr 0.01924
Train [39][850/3239]	Time 0.271 (0.516)	Data Time 0.002 (0.040)	Loss 2.6903 (2.9160)	Entropy 0.66753 (0.66875)	Top-1 acc 59.766 (53.864)	Top-5 acc 80.078 (76.579)	lr 0.01924
Train [39][860/3239]	Time 0.308 (0.515)	Data Time 0.003 (0.040)	Loss 2.8421 (2.9154)	Entropy 0.66722 (0.66873)	Top-1 acc 57.031 (53.878)	Top-5 acc 78.906 (76.591)	lr 0.01923
Train [39][870/3239]	Time 0.236 (0.514)	Data Time 0.001 (0.039)	Loss 2.7585 (2.9157)	Entropy 0.66704 (0.66872)	Top-1 acc 59.766 (53.863)	Top-5 acc 79.297 (76.593)	lr 0.01923
Train [39][880/3239]	Time 0.241 (0.514)	Data Time 0.001 (0.039)	Loss 2.8283 (2.9162)	Entropy 0.66724 (0.66870)	Top-1 acc 54.297 (53.857)	Top-5 acc 83.203 (76.591)	lr 0.01923
Train [39][890/3239]	Time 0.262 (0.513)	Data Time 0.002 (0.038)	Loss 2.7136 (2.9165)	Entropy 0.66692 (0.66868)	Top-1 acc 59.375 (53.845)	Top-5 acc 82.031 (76.584)	lr 0.01923
Train [39][900/3239]	Time 0.241 (0.512)	Data Time 0.001 (0.038)	Loss 3.0217 (2.9168)	Entropy 0.66690 (0.66866)	Top-1 acc 48.438 (53.833)	Top-5 acc 74.219 (76.569)	lr 0.01923
Train [39][910/3239]	Time 0.247 (0.512)	Data Time 0.001 (0.038)	Loss 2.8287 (2.9166)	Entropy 0.66699 (0.66864)	Top-1 acc 58.203 (53.839)	Top-5 acc 79.297 (76.570)	lr 0.01923
Train [39][920/3239]	Time 0.241 (0.511)	Data Time 0.001 (0.037)	Loss 2.8535 (2.9160)	Entropy 0.66696 (0.66862)	Top-1 acc 57.031 (53.851)	Top-5 acc 78.906 (76.587)	lr 0.01923
Train [39][930/3239]	Time 0.328 (0.510)	Data Time 0.001 (0.037)	Loss 3.0839 (2.9165)	Entropy 0.66665 (0.66860)	Top-1 acc 52.734 (53.850)	Top-5 acc 71.484 (76.568)	lr 0.01923
Train [39][940/3239]	Time 0.243 (0.510)	Data Time 0.001 (0.036)	Loss 2.7245 (2.9161)	Entropy 0.66707 (0.66858)	Top-1 acc 60.156 (53.864)	Top-5 acc 78.906 (76.566)	lr 0.01923
Train [39][950/3239]	Time 0.251 (0.509)	Data Time 0.001 (0.036)	Loss 2.7747 (2.9162)	Entropy 0.66723 (0.66857)	Top-1 acc 55.078 (53.867)	Top-5 acc 79.297 (76.558)	lr 0.01923
Train [39][960/3239]	Time 0.251 (0.508)	Data Time 0.001 (0.036)	Loss 2.8423 (2.9158)	Entropy 0.66699 (0.66856)	Top-1 acc 55.859 (53.864)	Top-5 acc 79.297 (76.564)	lr 0.01923
Train [39][970/3239]	Time 0.252 (0.507)	Data Time 0.001 (0.035)	Loss 2.9600 (2.9166)	Entropy 0.66718 (0.66854)	Top-1 acc 52.734 (53.844)	Top-5 acc 75.391 (76.552)	lr 0.01923
Train [39][980/3239]	Time 0.246 (0.507)	Data Time 0.001 (0.035)	Loss 3.0189 (2.9166)	Entropy 0.66741 (0.66853)	Top-1 acc 48.828 (53.855)	Top-5 acc 75.781 (76.553)	lr 0.01922
Train [39][990/3239]	Time 0.271 (0.506)	Data Time 0.001 (0.035)	Loss 2.7774 (2.9169)	Entropy 0.66744 (0.66852)	Top-1 acc 55.859 (53.840)	Top-5 acc 79.297 (76.548)	lr 0.01922
Train [39][1000/3239]	Time 0.389 (0.506)	Data Time 0.001 (0.034)	Loss 2.8291 (2.9167)	Entropy 0.66733 (0.66851)	Top-1 acc 55.859 (53.841)	Top-5 acc 79.297 (76.555)	lr 0.01922
Train [39][1010/3239]	Time 0.268 (0.505)	Data Time 0.001 (0.034)	Loss 2.8923 (2.9165)	Entropy 0.66746 (0.66849)	Top-1 acc 58.203 (53.848)	Top-5 acc 75.000 (76.561)	lr 0.01922
Train [39][1020/3239]	Time 0.230 (0.504)	Data Time 0.001 (0.034)	Loss 3.0482 (2.9165)	Entropy 0.66765 (0.66849)	Top-1 acc 51.562 (53.840)	Top-5 acc 75.000 (76.556)	lr 0.01922
Train [39][1030/3239]	Time 0.290 (0.504)	Data Time 0.002 (0.033)	Loss 2.9815 (2.9169)	Entropy 0.66788 (0.66848)	Top-1 acc 53.516 (53.838)	Top-5 acc 74.219 (76.539)	lr 0.01922
Train [39][1040/3239]	Time 0.314 (0.504)	Data Time 0.002 (0.033)	Loss 3.0125 (2.9169)	Entropy 0.66781 (0.66847)	Top-1 acc 52.734 (53.851)	Top-5 acc 74.219 (76.538)	lr 0.01922
Train [39][1050/3239]	Time 0.235 (0.503)	Data Time 0.001 (0.033)	Loss 2.9008 (2.9171)	Entropy 0.66763 (0.66847)	Top-1 acc 53.516 (53.851)	Top-5 acc 77.344 (76.534)	lr 0.01922
Train [39][1060/3239]	Time 0.254 (0.502)	Data Time 0.001 (0.032)	Loss 2.8307 (2.9178)	Entropy 0.66790 (0.66846)	Top-1 acc 53.125 (53.827)	Top-5 acc 80.078 (76.525)	lr 0.01922
Train [39][1070/3239]	Time 0.223 (0.502)	Data Time 0.001 (0.032)	Loss 3.1449 (2.9176)	Entropy 0.66779 (0.66845)	Top-1 acc 47.266 (53.833)	Top-5 acc 69.531 (76.530)	lr 0.01922
Train [39][1080/3239]	Time 0.229 (0.501)	Data Time 0.001 (0.032)	Loss 3.1993 (2.9177)	Entropy 0.66772 (0.66845)	Top-1 acc 46.875 (53.841)	Top-5 acc 68.750 (76.518)	lr 0.01922
Train [39][1090/3239]	Time 0.311 (0.500)	Data Time 0.001 (0.032)	Loss 2.9441 (2.9180)	Entropy 0.66753 (0.66844)	Top-1 acc 54.297 (53.839)	Top-5 acc 75.391 (76.513)	lr 0.01922
Train [39][1100/3239]	Time 0.242 (0.500)	Data Time 0.001 (0.031)	Loss 2.9607 (2.9176)	Entropy 0.66750 (0.66843)	Top-1 acc 51.562 (53.846)	Top-5 acc 74.609 (76.522)	lr 0.01921
Train [39][1110/3239]	Time 0.271 (0.499)	Data Time 0.001 (0.031)	Loss 2.8645 (2.9181)	Entropy 0.66771 (0.66843)	Top-1 acc 52.734 (53.838)	Top-5 acc 73.828 (76.509)	lr 0.01921
Train [39][1120/3239]	Time 0.232 (0.499)	Data Time 0.001 (0.031)	Loss 3.0599 (2.9182)	Entropy 0.66771 (0.66842)	Top-1 acc 50.781 (53.832)	Top-5 acc 75.000 (76.510)	lr 0.01921
Train [39][1130/3239]	Time 0.236 (0.498)	Data Time 0.001 (0.031)	Loss 2.8194 (2.9179)	Entropy 0.66782 (0.66841)	Top-1 acc 55.469 (53.838)	Top-5 acc 78.125 (76.521)	lr 0.01921
Train [39][1140/3239]	Time 0.233 (0.497)	Data Time 0.001 (0.030)	Loss 2.8519 (2.9178)	Entropy 0.66778 (0.66841)	Top-1 acc 57.031 (53.839)	Top-5 acc 74.609 (76.518)	lr 0.01921
Train [39][1150/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.030)	Loss 2.9306 (2.9172)	Entropy 0.66762 (0.66840)	Top-1 acc 52.734 (53.851)	Top-5 acc 74.219 (76.525)	lr 0.01921
Train [39][1160/3239]	Time 0.340 (0.496)	Data Time 0.001 (0.030)	Loss 2.9303 (2.9167)	Entropy 0.66772 (0.66839)	Top-1 acc 56.250 (53.857)	Top-5 acc 76.172 (76.536)	lr 0.01921
Train [39][1170/3239]	Time 0.237 (0.496)	Data Time 0.001 (0.030)	Loss 2.8559 (2.9165)	Entropy 0.66796 (0.66839)	Top-1 acc 55.859 (53.864)	Top-5 acc 76.953 (76.546)	lr 0.01921
Train [39][1180/3239]	Time 0.233 (0.495)	Data Time 0.001 (0.029)	Loss 2.9870 (2.9164)	Entropy 0.66800 (0.66839)	Top-1 acc 55.078 (53.871)	Top-5 acc 73.047 (76.544)	lr 0.01921
Train [39][1190/3239]	Time 0.230 (0.494)	Data Time 0.001 (0.029)	Loss 2.6253 (2.9159)	Entropy 0.66773 (0.66838)	Top-1 acc 59.375 (53.888)	Top-5 acc 82.812 (76.553)	lr 0.01921
Train [39][1200/3239]	Time 0.227 (0.494)	Data Time 0.001 (0.029)	Loss 2.7552 (2.9158)	Entropy 0.66766 (0.66838)	Top-1 acc 58.594 (53.899)	Top-5 acc 80.078 (76.553)	lr 0.01921
Train [39][1210/3239]	Time 0.227 (0.493)	Data Time 0.001 (0.029)	Loss 2.8795 (2.9153)	Entropy 0.66754 (0.66837)	Top-1 acc 57.422 (53.910)	Top-5 acc 78.906 (76.567)	lr 0.01921
Train [39][1220/3239]	Time 0.238 (0.492)	Data Time 0.001 (0.028)	Loss 2.8123 (2.9156)	Entropy 0.66737 (0.66836)	Top-1 acc 54.688 (53.892)	Top-5 acc 78.516 (76.558)	lr 0.01920
Train [39][1230/3239]	Time 0.254 (0.492)	Data Time 0.001 (0.028)	Loss 2.7738 (2.9155)	Entropy 0.66702 (0.66835)	Top-1 acc 56.250 (53.893)	Top-5 acc 80.469 (76.558)	lr 0.01920
Train [39][1240/3239]	Time 0.238 (0.491)	Data Time 0.001 (0.028)	Loss 2.8853 (2.9151)	Entropy 0.66711 (0.66834)	Top-1 acc 55.078 (53.896)	Top-5 acc 76.953 (76.562)	lr 0.01920
Train [39][1250/3239]	Time 0.270 (0.491)	Data Time 0.001 (0.028)	Loss 2.9465 (2.9154)	Entropy 0.66717 (0.66833)	Top-1 acc 51.953 (53.882)	Top-5 acc 76.953 (76.558)	lr 0.01920
Train [39][1260/3239]	Time 0.239 (0.491)	Data Time 0.001 (0.028)	Loss 2.9585 (2.9155)	Entropy 0.66679 (0.66832)	Top-1 acc 53.906 (53.880)	Top-5 acc 74.609 (76.554)	lr 0.01920
Train [39][1270/3239]	Time 0.285 (0.490)	Data Time 0.001 (0.027)	Loss 2.9366 (2.9156)	Entropy 0.66663 (0.66831)	Top-1 acc 57.031 (53.881)	Top-5 acc 76.562 (76.555)	lr 0.01920
Train [39][1280/3239]	Time 0.231 (0.490)	Data Time 0.001 (0.027)	Loss 3.0199 (2.9159)	Entropy 0.66679 (0.66830)	Top-1 acc 54.297 (53.872)	Top-5 acc 73.438 (76.555)	lr 0.01920
Train [39][1290/3239]	Time 0.228 (0.489)	Data Time 0.001 (0.027)	Loss 2.8586 (2.9163)	Entropy 0.66638 (0.66828)	Top-1 acc 60.156 (53.866)	Top-5 acc 76.172 (76.543)	lr 0.01920
Train [39][1300/3239]	Time 0.403 (0.511)	Data Time 0.005 (0.027)	Loss 3.0650 (2.9170)	Entropy 0.66624 (0.66827)	Top-1 acc 50.000 (53.852)	Top-5 acc 73.047 (76.535)	lr 0.01920
Train [39][1310/3239]	Time 0.239 (0.512)	Data Time 0.002 (0.027)	Loss 3.0068 (2.9166)	Entropy 0.66599 (0.66825)	Top-1 acc 51.562 (53.861)	Top-5 acc 76.953 (76.542)	lr 0.01920
Train [39][1320/3239]	Time 0.428 (0.511)	Data Time 0.002 (0.026)	Loss 3.0311 (2.9164)	Entropy 0.66612 (0.66823)	Top-1 acc 50.000 (53.861)	Top-5 acc 75.000 (76.544)	lr 0.01920
Train [39][1330/3239]	Time 0.255 (0.511)	Data Time 0.001 (0.026)	Loss 3.0315 (2.9163)	Entropy 0.66640 (0.66822)	Top-1 acc 49.609 (53.858)	Top-5 acc 75.000 (76.549)	lr 0.01919
Train [39][1340/3239]	Time 0.241 (0.510)	Data Time 0.001 (0.026)	Loss 3.3019 (2.9167)	Entropy 0.66623 (0.66820)	Top-1 acc 44.141 (53.850)	Top-5 acc 71.094 (76.543)	lr 0.01919
Train [39][1350/3239]	Time 0.237 (0.510)	Data Time 0.001 (0.026)	Loss 3.1559 (2.9170)	Entropy 0.66644 (0.66819)	Top-1 acc 51.172 (53.852)	Top-5 acc 73.438 (76.544)	lr 0.01919
Train [39][1360/3239]	Time 0.243 (0.509)	Data Time 0.001 (0.026)	Loss 3.0428 (2.9165)	Entropy 0.66658 (0.66818)	Top-1 acc 52.734 (53.870)	Top-5 acc 75.781 (76.562)	lr 0.01919
Train [39][1370/3239]	Time 0.261 (0.509)	Data Time 0.001 (0.026)	Loss 2.8564 (2.9169)	Entropy 0.66685 (0.66817)	Top-1 acc 57.812 (53.865)	Top-5 acc 77.344 (76.552)	lr 0.01919
Train [39][1380/3239]	Time 0.248 (0.509)	Data Time 0.001 (0.025)	Loss 2.8907 (2.9168)	Entropy 0.66683 (0.66816)	Top-1 acc 56.641 (53.867)	Top-5 acc 77.344 (76.560)	lr 0.01919
Train [39][1390/3239]	Time 0.266 (0.508)	Data Time 0.001 (0.025)	Loss 2.7704 (2.9169)	Entropy 0.66717 (0.66815)	Top-1 acc 57.422 (53.868)	Top-5 acc 79.688 (76.554)	lr 0.01919
Train [39][1400/3239]	Time 0.245 (0.508)	Data Time 0.001 (0.025)	Loss 3.0764 (2.9174)	Entropy 0.66703 (0.66814)	Top-1 acc 50.781 (53.853)	Top-5 acc 73.828 (76.550)	lr 0.01919
Train [39][1410/3239]	Time 0.287 (0.507)	Data Time 0.001 (0.025)	Loss 2.9472 (2.9178)	Entropy 0.66702 (0.66813)	Top-1 acc 55.859 (53.836)	Top-5 acc 76.562 (76.546)	lr 0.01919
Train [39][1420/3239]	Time 0.238 (0.507)	Data Time 0.001 (0.025)	Loss 2.9787 (2.9177)	Entropy 0.66706 (0.66813)	Top-1 acc 53.125 (53.836)	Top-5 acc 75.391 (76.551)	lr 0.01919
Train [39][1430/3239]	Time 0.245 (0.506)	Data Time 0.001 (0.025)	Loss 2.8937 (2.9179)	Entropy 0.66715 (0.66812)	Top-1 acc 55.078 (53.834)	Top-5 acc 77.344 (76.543)	lr 0.01919
Train [39][1440/3239]	Time 0.249 (0.506)	Data Time 0.001 (0.024)	Loss 2.9897 (2.9179)	Entropy 0.66699 (0.66811)	Top-1 acc 53.125 (53.835)	Top-5 acc 76.953 (76.539)	lr 0.01919
Train [39][1450/3239]	Time 0.251 (0.506)	Data Time 0.001 (0.024)	Loss 2.8126 (2.9181)	Entropy 0.66693 (0.66810)	Top-1 acc 55.469 (53.838)	Top-5 acc 80.078 (76.536)	lr 0.01918
Train [39][1460/3239]	Time 0.302 (0.505)	Data Time 0.003 (0.024)	Loss 2.8989 (2.9181)	Entropy 0.66700 (0.66809)	Top-1 acc 55.469 (53.838)	Top-5 acc 78.125 (76.534)	lr 0.01918
Train [39][1470/3239]	Time 0.277 (0.505)	Data Time 0.003 (0.024)	Loss 2.9614 (2.9179)	Entropy 0.66753 (0.66809)	Top-1 acc 51.562 (53.840)	Top-5 acc 74.609 (76.536)	lr 0.01918
Train [39][1480/3239]	Time 0.353 (0.505)	Data Time 0.001 (0.024)	Loss 2.9538 (2.9182)	Entropy 0.66754 (0.66808)	Top-1 acc 56.641 (53.834)	Top-5 acc 75.000 (76.527)	lr 0.01918
Train [39][1490/3239]	Time 0.241 (0.504)	Data Time 0.001 (0.024)	Loss 2.9827 (2.9187)	Entropy 0.66752 (0.66808)	Top-1 acc 52.344 (53.822)	Top-5 acc 75.781 (76.519)	lr 0.01918
Train [39][1500/3239]	Time 0.246 (0.504)	Data Time 0.001 (0.023)	Loss 2.8593 (2.9186)	Entropy 0.66762 (0.66808)	Top-1 acc 55.859 (53.827)	Top-5 acc 78.125 (76.519)	lr 0.01918
Train [39][1510/3239]	Time 0.229 (0.504)	Data Time 0.001 (0.023)	Loss 2.9759 (2.9182)	Entropy 0.66789 (0.66807)	Top-1 acc 53.125 (53.836)	Top-5 acc 74.609 (76.530)	lr 0.01918
Train [39][1520/3239]	Time 0.243 (0.503)	Data Time 0.001 (0.023)	Loss 2.7852 (2.9183)	Entropy 0.66787 (0.66807)	Top-1 acc 57.812 (53.833)	Top-5 acc 80.859 (76.530)	lr 0.01918
Train [39][1530/3239]	Time 0.245 (0.503)	Data Time 0.001 (0.023)	Loss 2.9472 (2.9183)	Entropy 0.66791 (0.66807)	Top-1 acc 51.562 (53.842)	Top-5 acc 75.781 (76.531)	lr 0.01918
Train [39][1540/3239]	Time 0.229 (0.502)	Data Time 0.001 (0.023)	Loss 3.1819 (2.9190)	Entropy 0.66801 (0.66807)	Top-1 acc 46.094 (53.827)	Top-5 acc 73.438 (76.522)	lr 0.01918
Train [39][1550/3239]	Time 0.364 (0.502)	Data Time 0.004 (0.023)	Loss 2.7847 (2.9186)	Entropy 0.66779 (0.66807)	Top-1 acc 54.297 (53.840)	Top-5 acc 77.734 (76.526)	lr 0.01918
Train [39][1560/3239]	Time 0.246 (0.501)	Data Time 0.001 (0.023)	Loss 2.7702 (2.9185)	Entropy 0.66772 (0.66807)	Top-1 acc 60.547 (53.844)	Top-5 acc 77.734 (76.526)	lr 0.01918
Train [39][1570/3239]	Time 0.243 (0.501)	Data Time 0.001 (0.023)	Loss 2.9373 (2.9181)	Entropy 0.66771 (0.66807)	Top-1 acc 53.125 (53.850)	Top-5 acc 76.562 (76.540)	lr 0.01917
Train [39][1580/3239]	Time 0.235 (0.501)	Data Time 0.001 (0.022)	Loss 2.8778 (2.9182)	Entropy 0.66775 (0.66806)	Top-1 acc 58.203 (53.853)	Top-5 acc 76.562 (76.537)	lr 0.01917
Train [39][1590/3239]	Time 0.246 (0.500)	Data Time 0.001 (0.022)	Loss 2.8636 (2.9181)	Entropy 0.66756 (0.66806)	Top-1 acc 53.906 (53.851)	Top-5 acc 78.906 (76.542)	lr 0.01917
Train [39][1600/3239]	Time 0.242 (0.500)	Data Time 0.001 (0.022)	Loss 2.8795 (2.9178)	Entropy 0.66735 (0.66806)	Top-1 acc 56.250 (53.853)	Top-5 acc 79.688 (76.552)	lr 0.01917
Train [39][1610/3239]	Time 0.239 (0.499)	Data Time 0.001 (0.022)	Loss 3.0157 (2.9175)	Entropy 0.66709 (0.66805)	Top-1 acc 51.172 (53.854)	Top-5 acc 75.391 (76.561)	lr 0.01917
Train [39][1620/3239]	Time 0.286 (0.499)	Data Time 0.001 (0.022)	Loss 3.0315 (2.9176)	Entropy 0.66720 (0.66805)	Top-1 acc 55.078 (53.861)	Top-5 acc 72.656 (76.560)	lr 0.01917
Train [39][1630/3239]	Time 0.275 (0.499)	Data Time 0.001 (0.022)	Loss 2.9518 (2.9178)	Entropy 0.66726 (0.66804)	Top-1 acc 50.781 (53.853)	Top-5 acc 76.953 (76.554)	lr 0.01917
Train [39][1640/3239]	Time 0.377 (0.499)	Data Time 0.001 (0.022)	Loss 3.0090 (2.9176)	Entropy 0.66714 (0.66804)	Top-1 acc 55.469 (53.866)	Top-5 acc 74.609 (76.559)	lr 0.01917
Train [39][1650/3239]	Time 0.238 (0.498)	Data Time 0.001 (0.022)	Loss 2.8902 (2.9175)	Entropy 0.66713 (0.66803)	Top-1 acc 57.031 (53.865)	Top-5 acc 78.125 (76.568)	lr 0.01917
Train [39][1660/3239]	Time 0.238 (0.498)	Data Time 0.002 (0.021)	Loss 2.5859 (2.9176)	Entropy 0.66717 (0.66802)	Top-1 acc 58.984 (53.861)	Top-5 acc 82.422 (76.566)	lr 0.01917
Train [39][1670/3239]	Time 0.234 (0.497)	Data Time 0.001 (0.021)	Loss 2.9724 (2.9172)	Entropy 0.66695 (0.66802)	Top-1 acc 53.906 (53.865)	Top-5 acc 75.781 (76.571)	lr 0.01917
Train [39][1680/3239]	Time 0.295 (0.497)	Data Time 0.002 (0.021)	Loss 2.9120 (2.9171)	Entropy 0.66702 (0.66801)	Top-1 acc 54.297 (53.869)	Top-5 acc 78.516 (76.574)	lr 0.01917
Train [39][1690/3239]	Time 0.283 (0.497)	Data Time 0.001 (0.021)	Loss 3.0395 (2.9171)	Entropy 0.66678 (0.66801)	Top-1 acc 52.734 (53.868)	Top-5 acc 75.391 (76.569)	lr 0.01916
Train [39][1700/3239]	Time 0.241 (0.496)	Data Time 0.001 (0.021)	Loss 2.9870 (2.9174)	Entropy 0.66684 (0.66800)	Top-1 acc 53.125 (53.861)	Top-5 acc 75.000 (76.562)	lr 0.01916
Train [39][1710/3239]	Time 0.340 (0.496)	Data Time 0.001 (0.021)	Loss 2.9417 (2.9173)	Entropy 0.66658 (0.66799)	Top-1 acc 51.953 (53.862)	Top-5 acc 77.734 (76.562)	lr 0.01916
Train [39][1720/3239]	Time 0.226 (0.496)	Data Time 0.001 (0.021)	Loss 3.0789 (2.9175)	Entropy 0.66634 (0.66798)	Top-1 acc 49.219 (53.860)	Top-5 acc 73.438 (76.557)	lr 0.01916
Train [39][1730/3239]	Time 0.236 (0.495)	Data Time 0.001 (0.021)	Loss 2.8305 (2.9175)	Entropy 0.66641 (0.66797)	Top-1 acc 54.688 (53.855)	Top-5 acc 78.906 (76.556)	lr 0.01916
Train [39][1740/3239]	Time 0.316 (0.495)	Data Time 0.003 (0.021)	Loss 2.7374 (2.9175)	Entropy 0.66611 (0.66796)	Top-1 acc 56.641 (53.850)	Top-5 acc 79.297 (76.559)	lr 0.01916
Train [39][1750/3239]	Time 0.229 (0.495)	Data Time 0.001 (0.020)	Loss 2.9545 (2.9172)	Entropy 0.66616 (0.66795)	Top-1 acc 53.125 (53.857)	Top-5 acc 75.781 (76.570)	lr 0.01916
Train [39][1760/3239]	Time 0.221 (0.494)	Data Time 0.001 (0.020)	Loss 2.9326 (2.9174)	Entropy 0.66607 (0.66794)	Top-1 acc 52.344 (53.849)	Top-5 acc 77.734 (76.567)	lr 0.01916
Train [39][1770/3239]	Time 0.236 (0.494)	Data Time 0.001 (0.020)	Loss 2.8260 (2.9175)	Entropy 0.66579 (0.66793)	Top-1 acc 59.766 (53.848)	Top-5 acc 78.906 (76.563)	lr 0.01916
Train [39][1780/3239]	Time 0.234 (0.494)	Data Time 0.001 (0.020)	Loss 2.8554 (2.9176)	Entropy 0.66561 (0.66792)	Top-1 acc 53.516 (53.841)	Top-5 acc 76.562 (76.557)	lr 0.01916
Train [39][1790/3239]	Time 0.247 (0.493)	Data Time 0.001 (0.020)	Loss 2.9774 (2.9173)	Entropy 0.66550 (0.66791)	Top-1 acc 52.344 (53.845)	Top-5 acc 75.781 (76.564)	lr 0.01916
Train [39][1800/3239]	Time 0.338 (0.493)	Data Time 0.001 (0.020)	Loss 3.0647 (2.9176)	Entropy 0.66563 (0.66789)	Top-1 acc 46.094 (53.837)	Top-5 acc 72.656 (76.561)	lr 0.01915
Train [39][1810/3239]	Time 0.239 (0.492)	Data Time 0.001 (0.020)	Loss 2.7288 (2.9175)	Entropy 0.66559 (0.66788)	Top-1 acc 58.594 (53.838)	Top-5 acc 80.469 (76.561)	lr 0.01915
Train [39][1820/3239]	Time 0.267 (0.492)	Data Time 0.001 (0.020)	Loss 2.9755 (2.9176)	Entropy 0.66539 (0.66787)	Top-1 acc 51.172 (53.837)	Top-5 acc 72.266 (76.556)	lr 0.01915
Train [39][1830/3239]	Time 0.257 (0.492)	Data Time 0.001 (0.020)	Loss 2.9709 (2.9177)	Entropy 0.66541 (0.66785)	Top-1 acc 51.172 (53.834)	Top-5 acc 75.000 (76.552)	lr 0.01915
Train [39][1840/3239]	Time 0.246 (0.492)	Data Time 0.002 (0.019)	Loss 2.8892 (2.9181)	Entropy 0.66527 (0.66784)	Top-1 acc 56.641 (53.827)	Top-5 acc 76.562 (76.546)	lr 0.01915
Train [39][1850/3239]	Time 0.241 (0.491)	Data Time 0.001 (0.019)	Loss 2.8676 (2.9179)	Entropy 0.66529 (0.66783)	Top-1 acc 55.078 (53.835)	Top-5 acc 75.000 (76.546)	lr 0.01915
Train [39][1860/3239]	Time 0.237 (0.491)	Data Time 0.001 (0.019)	Loss 3.0319 (2.9180)	Entropy 0.66527 (0.66781)	Top-1 acc 51.953 (53.837)	Top-5 acc 74.219 (76.546)	lr 0.01915
Train [39][1870/3239]	Time 0.377 (0.491)	Data Time 0.001 (0.019)	Loss 2.8107 (2.9178)	Entropy 0.66528 (0.66780)	Top-1 acc 58.203 (53.835)	Top-5 acc 79.297 (76.547)	lr 0.01915
Train [39][1880/3239]	Time 0.240 (0.491)	Data Time 0.001 (0.019)	Loss 2.9351 (2.9178)	Entropy 0.66528 (0.66779)	Top-1 acc 53.125 (53.835)	Top-5 acc 74.609 (76.549)	lr 0.01915
Train [39][1890/3239]	Time 0.245 (0.490)	Data Time 0.001 (0.019)	Loss 2.8329 (2.9177)	Entropy 0.66528 (0.66777)	Top-1 acc 57.031 (53.839)	Top-5 acc 77.344 (76.551)	lr 0.01915
Train [39][1900/3239]	Time 0.226 (0.490)	Data Time 0.001 (0.019)	Loss 2.7988 (2.9174)	Entropy 0.66563 (0.66776)	Top-1 acc 54.297 (53.845)	Top-5 acc 80.469 (76.552)	lr 0.01915
Train [39][1910/3239]	Time 0.238 (0.490)	Data Time 0.001 (0.019)	Loss 2.8720 (2.9175)	Entropy 0.66556 (0.66775)	Top-1 acc 49.219 (53.843)	Top-5 acc 79.297 (76.555)	lr 0.01915
Train [39][1920/3239]	Time 0.241 (0.489)	Data Time 0.001 (0.019)	Loss 3.0762 (2.9176)	Entropy 0.66528 (0.66774)	Top-1 acc 51.172 (53.839)	Top-5 acc 72.656 (76.558)	lr 0.01914
Train [39][1930/3239]	Time 0.230 (0.489)	Data Time 0.001 (0.019)	Loss 2.8840 (2.9174)	Entropy 0.66531 (0.66772)	Top-1 acc 53.906 (53.841)	Top-5 acc 76.172 (76.562)	lr 0.01914
Train [39][1940/3239]	Time 0.268 (0.489)	Data Time 0.001 (0.019)	Loss 3.1004 (2.9177)	Entropy 0.66519 (0.66771)	Top-1 acc 50.781 (53.831)	Top-5 acc 70.703 (76.557)	lr 0.01914
Train [39][1950/3239]	Time 0.237 (0.488)	Data Time 0.001 (0.018)	Loss 2.8038 (2.9175)	Entropy 0.66534 (0.66770)	Top-1 acc 57.031 (53.842)	Top-5 acc 80.469 (76.566)	lr 0.01914
Train [39][1960/3239]	Time 0.383 (0.504)	Data Time 0.002 (0.018)	Loss 3.0233 (2.9174)	Entropy 0.66519 (0.66769)	Top-1 acc 50.781 (53.843)	Top-5 acc 73.047 (76.565)	lr 0.01914
Train [39][1970/3239]	Time 0.265 (0.503)	Data Time 0.002 (0.018)	Loss 3.0125 (2.9173)	Entropy 0.66475 (0.66767)	Top-1 acc 52.734 (53.846)	Top-5 acc 76.172 (76.570)	lr 0.01914
Train [39][1980/3239]	Time 0.282 (0.503)	Data Time 0.002 (0.018)	Loss 2.8435 (2.9173)	Entropy 0.66452 (0.66766)	Top-1 acc 58.203 (53.848)	Top-5 acc 76.953 (76.565)	lr 0.01914
Train [39][1990/3239]	Time 0.307 (0.503)	Data Time 0.001 (0.018)	Loss 2.7248 (2.9172)	Entropy 0.66476 (0.66764)	Top-1 acc 57.812 (53.852)	Top-5 acc 76.562 (76.565)	lr 0.01914
Train [39][2000/3239]	Time 0.262 (0.503)	Data Time 0.001 (0.018)	Loss 3.0576 (2.9173)	Entropy 0.66465 (0.66763)	Top-1 acc 50.000 (53.854)	Top-5 acc 71.094 (76.560)	lr 0.01914
Train [39][2010/3239]	Time 0.295 (0.503)	Data Time 0.001 (0.018)	Loss 2.9139 (2.9173)	Entropy 0.66502 (0.66761)	Top-1 acc 51.172 (53.850)	Top-5 acc 74.609 (76.557)	lr 0.01914
Train [39][2020/3239]	Time 0.237 (0.502)	Data Time 0.001 (0.018)	Loss 2.9822 (2.9172)	Entropy 0.66522 (0.66760)	Top-1 acc 51.562 (53.851)	Top-5 acc 73.438 (76.556)	lr 0.01914
Train [39][2030/3239]	Time 0.355 (0.502)	Data Time 0.001 (0.018)	Loss 2.6595 (2.9166)	Entropy 0.66527 (0.66759)	Top-1 acc 59.375 (53.862)	Top-5 acc 81.641 (76.565)	lr 0.01914
Train [39][2040/3239]	Time 0.246 (0.502)	Data Time 0.001 (0.018)	Loss 2.9054 (2.9167)	Entropy 0.66533 (0.66758)	Top-1 acc 56.641 (53.863)	Top-5 acc 76.953 (76.565)	lr 0.01913
Train [39][2050/3239]	Time 0.317 (0.501)	Data Time 0.003 (0.018)	Loss 2.8759 (2.9169)	Entropy 0.66538 (0.66757)	Top-1 acc 57.422 (53.863)	Top-5 acc 74.609 (76.557)	lr 0.01913
Train [39][2060/3239]	Time 0.356 (0.501)	Data Time 0.002 (0.018)	Loss 2.9966 (2.9169)	Entropy 0.66558 (0.66756)	Top-1 acc 53.125 (53.864)	Top-5 acc 73.438 (76.554)	lr 0.01913
Train [39][2070/3239]	Time 0.254 (0.501)	Data Time 0.001 (0.018)	Loss 2.9679 (2.9172)	Entropy 0.66557 (0.66755)	Top-1 acc 50.391 (53.856)	Top-5 acc 77.734 (76.549)	lr 0.01913
Train [39][2080/3239]	Time 0.282 (0.501)	Data Time 0.001 (0.017)	Loss 2.8513 (2.9172)	Entropy 0.66543 (0.66754)	Top-1 acc 56.250 (53.857)	Top-5 acc 76.953 (76.549)	lr 0.01913
Train [39][2090/3239]	Time 0.244 (0.501)	Data Time 0.001 (0.017)	Loss 2.8746 (2.9176)	Entropy 0.66545 (0.66753)	Top-1 acc 56.250 (53.852)	Top-5 acc 77.344 (76.542)	lr 0.01913
Train [39][2100/3239]	Time 0.276 (0.501)	Data Time 0.022 (0.017)	Loss 2.8462 (2.9175)	Entropy 0.66543 (0.66752)	Top-1 acc 57.422 (53.858)	Top-5 acc 77.344 (76.544)	lr 0.01913
Train [39][2110/3239]	Time 0.239 (0.500)	Data Time 0.001 (0.017)	Loss 2.9304 (2.9179)	Entropy 0.66500 (0.66751)	Top-1 acc 53.516 (53.846)	Top-5 acc 75.391 (76.532)	lr 0.01913
Train [39][2120/3239]	Time 0.303 (0.500)	Data Time 0.001 (0.017)	Loss 2.8498 (2.9175)	Entropy 0.66447 (0.66750)	Top-1 acc 57.031 (53.861)	Top-5 acc 77.734 (76.541)	lr 0.01913
Train [39][2130/3239]	Time 0.238 (0.500)	Data Time 0.001 (0.017)	Loss 2.8662 (2.9172)	Entropy 0.66466 (0.66748)	Top-1 acc 52.344 (53.869)	Top-5 acc 77.344 (76.548)	lr 0.01913
Train [39][2140/3239]	Time 0.246 (0.500)	Data Time 0.001 (0.017)	Loss 3.2111 (2.9175)	Entropy 0.66479 (0.66747)	Top-1 acc 43.750 (53.865)	Top-5 acc 69.531 (76.542)	lr 0.01913
Train [39][2150/3239]	Time 0.228 (0.499)	Data Time 0.001 (0.017)	Loss 2.9064 (2.9174)	Entropy 0.66463 (0.66746)	Top-1 acc 55.469 (53.868)	Top-5 acc 77.734 (76.548)	lr 0.01912
Train [39][2160/3239]	Time 0.232 (0.499)	Data Time 0.001 (0.017)	Loss 3.1696 (2.9175)	Entropy 0.66455 (0.66744)	Top-1 acc 51.562 (53.862)	Top-5 acc 70.312 (76.545)	lr 0.01912
Train [39][2170/3239]	Time 0.292 (0.499)	Data Time 0.002 (0.017)	Loss 2.9113 (2.9178)	Entropy 0.66431 (0.66743)	Top-1 acc 54.297 (53.850)	Top-5 acc 76.953 (76.537)	lr 0.01912
Train [39][2180/3239]	Time 0.268 (0.499)	Data Time 0.001 (0.017)	Loss 2.8331 (2.9177)	Entropy 0.66450 (0.66742)	Top-1 acc 54.297 (53.854)	Top-5 acc 78.125 (76.538)	lr 0.01912
Train [39][2190/3239]	Time 0.396 (0.499)	Data Time 0.002 (0.017)	Loss 3.0147 (2.9178)	Entropy 0.66487 (0.66740)	Top-1 acc 52.344 (53.853)	Top-5 acc 73.047 (76.534)	lr 0.01912
Train [39][2200/3239]	Time 0.218 (0.498)	Data Time 0.001 (0.017)	Loss 2.9652 (2.9179)	Entropy 0.66503 (0.66739)	Top-1 acc 52.734 (53.854)	Top-5 acc 76.953 (76.531)	lr 0.01912
Train [39][2210/3239]	Time 0.252 (0.498)	Data Time 0.001 (0.017)	Loss 2.9006 (2.9179)	Entropy 0.66504 (0.66738)	Top-1 acc 58.203 (53.854)	Top-5 acc 76.953 (76.528)	lr 0.01912
Train [39][2220/3239]	Time 0.274 (0.498)	Data Time 0.002 (0.016)	Loss 3.0331 (2.9183)	Entropy 0.66494 (0.66737)	Top-1 acc 48.438 (53.843)	Top-5 acc 74.609 (76.517)	lr 0.01912
Train [39][2230/3239]	Time 0.224 (0.497)	Data Time 0.001 (0.016)	Loss 2.9796 (2.9184)	Entropy 0.66487 (0.66736)	Top-1 acc 52.344 (53.838)	Top-5 acc 75.000 (76.510)	lr 0.01912
Train [39][2240/3239]	Time 0.249 (0.497)	Data Time 0.001 (0.016)	Loss 3.0638 (2.9183)	Entropy 0.66502 (0.66735)	Top-1 acc 50.000 (53.843)	Top-5 acc 73.047 (76.511)	lr 0.01912
Train [39][2250/3239]	Time 0.282 (0.497)	Data Time 0.001 (0.016)	Loss 2.8828 (2.9182)	Entropy 0.66528 (0.66734)	Top-1 acc 55.078 (53.845)	Top-5 acc 76.562 (76.517)	lr 0.01912
Train [39][2260/3239]	Time 0.373 (0.497)	Data Time 0.001 (0.016)	Loss 3.0810 (2.9185)	Entropy 0.66563 (0.66733)	Top-1 acc 46.875 (53.837)	Top-5 acc 73.047 (76.510)	lr 0.01912
Train [39][2270/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.016)	Loss 2.8576 (2.9185)	Entropy 0.66544 (0.66732)	Top-1 acc 53.906 (53.837)	Top-5 acc 76.172 (76.510)	lr 0.01911
Train [39][2280/3239]	Time 0.254 (0.496)	Data Time 0.001 (0.016)	Loss 3.0502 (2.9188)	Entropy 0.66550 (0.66731)	Top-1 acc 48.438 (53.832)	Top-5 acc 75.391 (76.505)	lr 0.01911
Train [39][2290/3239]	Time 0.278 (0.496)	Data Time 0.002 (0.016)	Loss 2.9239 (2.9186)	Entropy 0.66474 (0.66730)	Top-1 acc 53.906 (53.838)	Top-5 acc 77.734 (76.505)	lr 0.01911
Train [39][2300/3239]	Time 0.247 (0.496)	Data Time 0.001 (0.016)	Loss 2.8957 (2.9186)	Entropy 0.66459 (0.66729)	Top-1 acc 53.125 (53.839)	Top-5 acc 77.344 (76.506)	lr 0.01911
Train [39][2310/3239]	Time 0.234 (0.496)	Data Time 0.002 (0.016)	Loss 2.9650 (2.9187)	Entropy 0.66469 (0.66728)	Top-1 acc 53.125 (53.836)	Top-5 acc 76.172 (76.504)	lr 0.01911
Train [39][2320/3239]	Time 0.225 (0.495)	Data Time 0.001 (0.016)	Loss 3.0445 (2.9187)	Entropy 0.66450 (0.66727)	Top-1 acc 47.266 (53.833)	Top-5 acc 76.172 (76.507)	lr 0.01911
Train [39][2330/3239]	Time 0.218 (0.495)	Data Time 0.001 (0.016)	Loss 2.9539 (2.9187)	Entropy 0.66445 (0.66726)	Top-1 acc 50.391 (53.830)	Top-5 acc 76.953 (76.503)	lr 0.01911
Train [39][2340/3239]	Time 0.246 (0.495)	Data Time 0.001 (0.016)	Loss 2.8317 (2.9188)	Entropy 0.66469 (0.66725)	Top-1 acc 54.688 (53.826)	Top-5 acc 74.609 (76.500)	lr 0.01911
Train [39][2350/3239]	Time 0.331 (0.494)	Data Time 0.001 (0.016)	Loss 3.0024 (2.9190)	Entropy 0.66481 (0.66724)	Top-1 acc 57.031 (53.828)	Top-5 acc 77.344 (76.498)	lr 0.01911
Train [39][2360/3239]	Time 0.258 (0.494)	Data Time 0.002 (0.016)	Loss 2.8214 (2.9190)	Entropy 0.66501 (0.66723)	Top-1 acc 57.031 (53.829)	Top-5 acc 78.125 (76.498)	lr 0.01911
Train [39][2370/3239]	Time 0.244 (0.494)	Data Time 0.001 (0.016)	Loss 2.7606 (2.9188)	Entropy 0.66517 (0.66722)	Top-1 acc 59.375 (53.832)	Top-5 acc 80.469 (76.504)	lr 0.01911
Train [39][2380/3239]	Time 0.241 (0.494)	Data Time 0.001 (0.015)	Loss 3.1683 (2.9187)	Entropy 0.66522 (0.66721)	Top-1 acc 47.656 (53.835)	Top-5 acc 71.484 (76.508)	lr 0.01911
Train [39][2390/3239]	Time 0.231 (0.493)	Data Time 0.001 (0.015)	Loss 3.0986 (2.9189)	Entropy 0.66543 (0.66720)	Top-1 acc 48.047 (53.831)	Top-5 acc 71.094 (76.500)	lr 0.01910
Train [39][2400/3239]	Time 0.252 (0.493)	Data Time 0.001 (0.015)	Loss 3.0139 (2.9189)	Entropy 0.66553 (0.66719)	Top-1 acc 50.781 (53.835)	Top-5 acc 73.438 (76.496)	lr 0.01910
Train [39][2410/3239]	Time 0.261 (0.493)	Data Time 0.001 (0.015)	Loss 2.8283 (2.9187)	Entropy 0.66563 (0.66719)	Top-1 acc 54.688 (53.840)	Top-5 acc 77.734 (76.502)	lr 0.01910
Train [39][2420/3239]	Time 0.401 (0.493)	Data Time 0.001 (0.015)	Loss 2.7746 (2.9187)	Entropy 0.66525 (0.66718)	Top-1 acc 54.297 (53.839)	Top-5 acc 80.859 (76.502)	lr 0.01910
Train [39][2430/3239]	Time 0.236 (0.493)	Data Time 0.001 (0.015)	Loss 2.6945 (2.9186)	Entropy 0.66510 (0.66717)	Top-1 acc 60.156 (53.839)	Top-5 acc 79.688 (76.502)	lr 0.01910
Train [39][2440/3239]	Time 0.248 (0.492)	Data Time 0.001 (0.015)	Loss 3.0944 (2.9187)	Entropy 0.66486 (0.66716)	Top-1 acc 48.438 (53.838)	Top-5 acc 71.484 (76.500)	lr 0.01910
Train [39][2450/3239]	Time 0.253 (0.492)	Data Time 0.001 (0.015)	Loss 2.7077 (2.9185)	Entropy 0.66510 (0.66716)	Top-1 acc 59.375 (53.843)	Top-5 acc 78.906 (76.500)	lr 0.01910
Train [39][2460/3239]	Time 0.234 (0.492)	Data Time 0.001 (0.015)	Loss 2.7741 (2.9186)	Entropy 0.66497 (0.66715)	Top-1 acc 58.984 (53.840)	Top-5 acc 80.469 (76.500)	lr 0.01910
Train [39][2470/3239]	Time 0.239 (0.492)	Data Time 0.001 (0.015)	Loss 2.9233 (2.9185)	Entropy 0.66507 (0.66714)	Top-1 acc 55.469 (53.846)	Top-5 acc 76.172 (76.502)	lr 0.01910
Train [39][2480/3239]	Time 0.227 (0.491)	Data Time 0.001 (0.015)	Loss 2.9321 (2.9184)	Entropy 0.66493 (0.66713)	Top-1 acc 51.562 (53.844)	Top-5 acc 78.125 (76.501)	lr 0.01910
Train [39][2490/3239]	Time 0.221 (0.491)	Data Time 0.001 (0.015)	Loss 2.9292 (2.9184)	Entropy 0.66491 (0.66712)	Top-1 acc 51.953 (53.847)	Top-5 acc 78.125 (76.498)	lr 0.01910
Train [39][2500/3239]	Time 0.238 (0.491)	Data Time 0.001 (0.015)	Loss 3.2430 (2.9187)	Entropy 0.66474 (0.66711)	Top-1 acc 49.609 (53.841)	Top-5 acc 67.578 (76.491)	lr 0.01909
Train [39][2510/3239]	Time 0.290 (0.491)	Data Time 0.001 (0.015)	Loss 2.9423 (2.9186)	Entropy 0.66474 (0.66710)	Top-1 acc 50.000 (53.843)	Top-5 acc 75.000 (76.492)	lr 0.01909
Train [39][2520/3239]	Time 0.234 (0.490)	Data Time 0.002 (0.015)	Loss 2.9035 (2.9186)	Entropy 0.66463 (0.66709)	Top-1 acc 51.953 (53.844)	Top-5 acc 77.734 (76.495)	lr 0.01909
Train [39][2530/3239]	Time 0.249 (0.490)	Data Time 0.001 (0.015)	Loss 2.9763 (2.9186)	Entropy 0.66473 (0.66708)	Top-1 acc 55.859 (53.845)	Top-5 acc 75.000 (76.492)	lr 0.01909
Train [39][2540/3239]	Time 0.278 (0.490)	Data Time 0.002 (0.015)	Loss 2.9672 (2.9188)	Entropy 0.66451 (0.66707)	Top-1 acc 48.438 (53.839)	Top-5 acc 76.172 (76.490)	lr 0.01909
Train [39][2550/3239]	Time 0.281 (0.490)	Data Time 0.002 (0.015)	Loss 2.8359 (2.9188)	Entropy 0.66466 (0.66706)	Top-1 acc 50.781 (53.835)	Top-5 acc 77.344 (76.490)	lr 0.01909
Train [39][2560/3239]	Time 0.238 (0.490)	Data Time 0.001 (0.015)	Loss 2.7337 (2.9186)	Entropy 0.66457 (0.66705)	Top-1 acc 56.641 (53.839)	Top-5 acc 80.078 (76.496)	lr 0.01909
Train [39][2570/3239]	Time 0.227 (0.490)	Data Time 0.001 (0.014)	Loss 2.8980 (2.9185)	Entropy 0.66455 (0.66704)	Top-1 acc 58.984 (53.841)	Top-5 acc 74.609 (76.498)	lr 0.01909
Train [39][2580/3239]	Time 0.327 (0.489)	Data Time 0.001 (0.014)	Loss 3.2936 (2.9188)	Entropy 0.66480 (0.66703)	Top-1 acc 46.484 (53.837)	Top-5 acc 69.922 (76.493)	lr 0.01909
Train [39][2590/3239]	Time 0.231 (0.489)	Data Time 0.001 (0.014)	Loss 2.9860 (2.9188)	Entropy 0.66462 (0.66702)	Top-1 acc 49.609 (53.834)	Top-5 acc 79.297 (76.496)	lr 0.01909
Train [39][2600/3239]	Time 0.227 (0.489)	Data Time 0.001 (0.014)	Loss 3.0238 (2.9190)	Entropy 0.66432 (0.66702)	Top-1 acc 51.172 (53.828)	Top-5 acc 74.609 (76.492)	lr 0.01909
Train [39][2610/3239]	Time 0.361 (0.501)	Data Time 0.005 (0.014)	Loss 3.0726 (2.9191)	Entropy 0.66440 (0.66700)	Top-1 acc 51.953 (53.826)	Top-5 acc 73.047 (76.489)	lr 0.01909
Train [39][2620/3239]	Time 0.249 (0.500)	Data Time 0.002 (0.014)	Loss 3.1468 (2.9190)	Entropy 0.66460 (0.66700)	Top-1 acc 50.781 (53.830)	Top-5 acc 73.828 (76.493)	lr 0.01908
Train [39][2630/3239]	Time 0.263 (0.500)	Data Time 0.002 (0.014)	Loss 2.9583 (2.9192)	Entropy 0.66420 (0.66699)	Top-1 acc 52.344 (53.828)	Top-5 acc 74.219 (76.488)	lr 0.01908
Train [39][2640/3239]	Time 0.266 (0.500)	Data Time 0.001 (0.014)	Loss 3.0387 (2.9192)	Entropy 0.66419 (0.66698)	Top-1 acc 46.484 (53.826)	Top-5 acc 76.953 (76.486)	lr 0.01908
Train [39][2650/3239]	Time 0.278 (0.500)	Data Time 0.001 (0.014)	Loss 2.5991 (2.9191)	Entropy 0.66449 (0.66697)	Top-1 acc 57.812 (53.822)	Top-5 acc 87.109 (76.493)	lr 0.01908
Train [39][2660/3239]	Time 0.248 (0.500)	Data Time 0.002 (0.014)	Loss 2.9959 (2.9192)	Entropy 0.66446 (0.66696)	Top-1 acc 51.953 (53.819)	Top-5 acc 76.562 (76.495)	lr 0.01908
Train [39][2670/3239]	Time 0.416 (0.500)	Data Time 0.001 (0.014)	Loss 2.9372 (2.9192)	Entropy 0.66458 (0.66695)	Top-1 acc 56.250 (53.824)	Top-5 acc 75.000 (76.494)	lr 0.01908
Train [39][2680/3239]	Time 0.267 (0.500)	Data Time 0.001 (0.014)	Loss 2.7421 (2.9192)	Entropy 0.66455 (0.66694)	Top-1 acc 58.984 (53.823)	Top-5 acc 78.906 (76.493)	lr 0.01908
Train [39][2690/3239]	Time 0.286 (0.499)	Data Time 0.001 (0.014)	Loss 2.7713 (2.9193)	Entropy 0.66418 (0.66693)	Top-1 acc 57.031 (53.822)	Top-5 acc 80.078 (76.490)	lr 0.01908
Train [39][2700/3239]	Time 0.241 (0.499)	Data Time 0.001 (0.014)	Loss 2.8105 (2.9192)	Entropy 0.66428 (0.66692)	Top-1 acc 55.078 (53.820)	Top-5 acc 80.078 (76.492)	lr 0.01908
Train [39][2710/3239]	Time 0.242 (0.499)	Data Time 0.001 (0.014)	Loss 3.2286 (2.9196)	Entropy 0.66444 (0.66691)	Top-1 acc 48.828 (53.806)	Top-5 acc 71.875 (76.484)	lr 0.01908
Train [39][2720/3239]	Time 0.306 (0.499)	Data Time 0.002 (0.014)	Loss 3.0009 (2.9197)	Entropy 0.66460 (0.66690)	Top-1 acc 51.953 (53.809)	Top-5 acc 74.609 (76.483)	lr 0.01908
Train [39][2730/3239]	Time 0.304 (0.499)	Data Time 0.002 (0.014)	Loss 3.0873 (2.9199)	Entropy 0.66418 (0.66689)	Top-1 acc 51.172 (53.804)	Top-5 acc 76.562 (76.483)	lr 0.01908
Train [39][2740/3239]	Time 0.365 (0.499)	Data Time 0.001 (0.014)	Loss 2.8704 (2.9198)	Entropy 0.66411 (0.66688)	Top-1 acc 54.297 (53.804)	Top-5 acc 78.125 (76.486)	lr 0.01907
Train [39][2750/3239]	Time 0.277 (0.499)	Data Time 0.004 (0.014)	Loss 2.8597 (2.9199)	Entropy 0.66428 (0.66687)	Top-1 acc 53.906 (53.805)	Top-5 acc 76.953 (76.484)	lr 0.01907
Train [39][2760/3239]	Time 0.268 (0.499)	Data Time 0.001 (0.014)	Loss 3.0926 (2.9203)	Entropy 0.66403 (0.66686)	Top-1 acc 50.000 (53.791)	Top-5 acc 72.656 (76.476)	lr 0.01907
Train [39][2770/3239]	Time 0.274 (0.499)	Data Time 0.001 (0.014)	Loss 2.9972 (2.9202)	Entropy 0.66405 (0.66685)	Top-1 acc 51.953 (53.791)	Top-5 acc 72.656 (76.478)	lr 0.01907
Train [39][2780/3239]	Time 0.254 (0.498)	Data Time 0.001 (0.014)	Loss 3.2407 (2.9203)	Entropy 0.66406 (0.66684)	Top-1 acc 50.781 (53.790)	Top-5 acc 70.703 (76.479)	lr 0.01907
Train [39][2790/3239]	Time 0.297 (0.498)	Data Time 0.001 (0.013)	Loss 2.9847 (2.9203)	Entropy 0.66424 (0.66683)	Top-1 acc 50.391 (53.787)	Top-5 acc 76.953 (76.479)	lr 0.01907
Train [39][2800/3239]	Time 0.230 (0.498)	Data Time 0.001 (0.013)	Loss 3.0344 (2.9203)	Entropy 0.66461 (0.66682)	Top-1 acc 53.516 (53.788)	Top-5 acc 75.391 (76.480)	lr 0.01907
Train [39][2810/3239]	Time 0.437 (0.498)	Data Time 0.003 (0.013)	Loss 3.1003 (2.9204)	Entropy 0.66480 (0.66682)	Top-1 acc 50.781 (53.787)	Top-5 acc 71.484 (76.476)	lr 0.01907
Train [39][2820/3239]	Time 0.234 (0.498)	Data Time 0.001 (0.013)	Loss 2.8418 (2.9203)	Entropy 0.66466 (0.66681)	Top-1 acc 56.641 (53.790)	Top-5 acc 77.344 (76.479)	lr 0.01907
Train [39][2830/3239]	Time 0.239 (0.498)	Data Time 0.001 (0.013)	Loss 3.0194 (2.9205)	Entropy 0.66449 (0.66680)	Top-1 acc 50.781 (53.787)	Top-5 acc 73.828 (76.474)	lr 0.01907
Train [39][2840/3239]	Time 0.247 (0.497)	Data Time 0.001 (0.013)	Loss 2.9044 (2.9205)	Entropy 0.66419 (0.66679)	Top-1 acc 53.906 (53.788)	Top-5 acc 78.125 (76.479)	lr 0.01907
Train [39][2850/3239]	Time 0.256 (0.497)	Data Time 0.001 (0.013)	Loss 3.0919 (2.9205)	Entropy 0.66418 (0.66678)	Top-1 acc 49.609 (53.789)	Top-5 acc 71.094 (76.477)	lr 0.01906
Train [39][2860/3239]	Time 0.238 (0.497)	Data Time 0.001 (0.013)	Loss 2.8572 (2.9205)	Entropy 0.66440 (0.66677)	Top-1 acc 53.906 (53.784)	Top-5 acc 78.906 (76.476)	lr 0.01906
Train [39][2870/3239]	Time 0.300 (0.497)	Data Time 0.001 (0.013)	Loss 3.0879 (2.9204)	Entropy 0.66435 (0.66677)	Top-1 acc 50.000 (53.785)	Top-5 acc 72.266 (76.477)	lr 0.01906
Train [39][2880/3239]	Time 0.249 (0.497)	Data Time 0.001 (0.013)	Loss 2.9058 (2.9203)	Entropy 0.66431 (0.66676)	Top-1 acc 51.953 (53.788)	Top-5 acc 75.781 (76.479)	lr 0.01906
Train [39][2890/3239]	Time 0.249 (0.497)	Data Time 0.001 (0.013)	Loss 2.8204 (2.9205)	Entropy 0.66432 (0.66675)	Top-1 acc 54.297 (53.788)	Top-5 acc 79.297 (76.478)	lr 0.01906
Train [39][2900/3239]	Time 0.435 (0.496)	Data Time 0.001 (0.013)	Loss 2.9822 (2.9205)	Entropy 0.66422 (0.66674)	Top-1 acc 53.516 (53.785)	Top-5 acc 76.562 (76.481)	lr 0.01906
Train [39][2910/3239]	Time 0.248 (0.496)	Data Time 0.001 (0.013)	Loss 2.8404 (2.9206)	Entropy 0.66411 (0.66673)	Top-1 acc 59.375 (53.784)	Top-5 acc 78.516 (76.480)	lr 0.01906
Train [39][2920/3239]	Time 0.239 (0.496)	Data Time 0.001 (0.013)	Loss 3.0713 (2.9207)	Entropy 0.66405 (0.66672)	Top-1 acc 53.125 (53.783)	Top-5 acc 73.828 (76.479)	lr 0.01906
Train [39][2930/3239]	Time 0.226 (0.496)	Data Time 0.001 (0.013)	Loss 2.9875 (2.9207)	Entropy 0.66440 (0.66671)	Top-1 acc 51.172 (53.784)	Top-5 acc 75.000 (76.476)	lr 0.01906
Train [39][2940/3239]	Time 0.244 (0.496)	Data Time 0.002 (0.013)	Loss 2.8571 (2.9207)	Entropy 0.66401 (0.66671)	Top-1 acc 54.297 (53.784)	Top-5 acc 76.953 (76.477)	lr 0.01906
Train [39][2950/3239]	Time 0.287 (0.496)	Data Time 0.003 (0.013)	Loss 2.6548 (2.9207)	Entropy 0.66391 (0.66670)	Top-1 acc 59.766 (53.785)	Top-5 acc 78.906 (76.477)	lr 0.01906
Train [39][2960/3239]	Time 0.271 (0.495)	Data Time 0.001 (0.013)	Loss 3.0681 (2.9210)	Entropy 0.66403 (0.66669)	Top-1 acc 51.562 (53.778)	Top-5 acc 73.828 (76.471)	lr 0.01906
Train [39][2970/3239]	Time 0.350 (0.495)	Data Time 0.001 (0.013)	Loss 3.1549 (2.9210)	Entropy 0.66402 (0.66668)	Top-1 acc 48.438 (53.777)	Top-5 acc 72.656 (76.473)	lr 0.01905
Train [39][2980/3239]	Time 0.238 (0.495)	Data Time 0.001 (0.013)	Loss 2.7423 (2.9209)	Entropy 0.66421 (0.66667)	Top-1 acc 58.984 (53.783)	Top-5 acc 78.516 (76.476)	lr 0.01905
Train [39][2990/3239]	Time 0.268 (0.495)	Data Time 0.001 (0.013)	Loss 2.8168 (2.9207)	Entropy 0.66417 (0.66666)	Top-1 acc 58.594 (53.787)	Top-5 acc 77.344 (76.479)	lr 0.01905
Train [39][3000/3239]	Time 0.304 (0.495)	Data Time 0.002 (0.013)	Loss 2.7915 (2.9206)	Entropy 0.66421 (0.66665)	Top-1 acc 55.469 (53.789)	Top-5 acc 79.297 (76.483)	lr 0.01905
Train [39][3010/3239]	Time 0.262 (0.494)	Data Time 0.001 (0.013)	Loss 3.0451 (2.9207)	Entropy 0.66394 (0.66665)	Top-1 acc 49.219 (53.778)	Top-5 acc 76.562 (76.485)	lr 0.01905
Train [39][3020/3239]	Time 0.260 (0.494)	Data Time 0.001 (0.013)	Loss 2.9383 (2.9208)	Entropy 0.66397 (0.66664)	Top-1 acc 51.172 (53.774)	Top-5 acc 76.953 (76.483)	lr 0.01905
Train [39][3030/3239]	Time 0.247 (0.494)	Data Time 0.001 (0.013)	Loss 2.8897 (2.9207)	Entropy 0.66378 (0.66663)	Top-1 acc 54.297 (53.776)	Top-5 acc 78.906 (76.488)	lr 0.01905
Train [39][3040/3239]	Time 0.330 (0.494)	Data Time 0.001 (0.013)	Loss 2.8103 (2.9206)	Entropy 0.66365 (0.66662)	Top-1 acc 57.422 (53.775)	Top-5 acc 78.906 (76.489)	lr 0.01905
Train [39][3050/3239]	Time 0.292 (0.494)	Data Time 0.003 (0.013)	Loss 2.8420 (2.9206)	Entropy 0.66365 (0.66661)	Top-1 acc 51.953 (53.775)	Top-5 acc 80.078 (76.488)	lr 0.01905
Train [39][3060/3239]	Time 0.357 (0.494)	Data Time 0.001 (0.012)	Loss 2.8970 (2.9205)	Entropy 0.66344 (0.66660)	Top-1 acc 52.734 (53.772)	Top-5 acc 76.172 (76.488)	lr 0.01905
Train [39][3070/3239]	Time 0.235 (0.493)	Data Time 0.001 (0.012)	Loss 3.0063 (2.9204)	Entropy 0.66373 (0.66659)	Top-1 acc 51.953 (53.774)	Top-5 acc 73.828 (76.493)	lr 0.01905
Train [39][3080/3239]	Time 0.278 (0.493)	Data Time 0.001 (0.012)	Loss 3.1230 (2.9207)	Entropy 0.66358 (0.66658)	Top-1 acc 49.219 (53.769)	Top-5 acc 75.000 (76.486)	lr 0.01905
Train [39][3090/3239]	Time 0.234 (0.493)	Data Time 0.001 (0.012)	Loss 2.8721 (2.9205)	Entropy 0.66362 (0.66657)	Top-1 acc 53.906 (53.772)	Top-5 acc 79.297 (76.490)	lr 0.01904
Train [39][3100/3239]	Time 0.243 (0.493)	Data Time 0.001 (0.012)	Loss 3.1154 (2.9206)	Entropy 0.66356 (0.66656)	Top-1 acc 46.875 (53.767)	Top-5 acc 73.438 (76.488)	lr 0.01904
Train [39][3110/3239]	Time 0.255 (0.493)	Data Time 0.001 (0.012)	Loss 2.7988 (2.9206)	Entropy 0.66371 (0.66655)	Top-1 acc 58.594 (53.770)	Top-5 acc 78.906 (76.488)	lr 0.01904
Train [39][3120/3239]	Time 0.236 (0.492)	Data Time 0.001 (0.012)	Loss 2.9704 (2.9206)	Entropy 0.66352 (0.66654)	Top-1 acc 56.250 (53.770)	Top-5 acc 75.391 (76.486)	lr 0.01904
Train [39][3130/3239]	Time 0.380 (0.492)	Data Time 0.001 (0.012)	Loss 2.9380 (2.9205)	Entropy 0.66375 (0.66653)	Top-1 acc 54.297 (53.774)	Top-5 acc 75.781 (76.488)	lr 0.01904
Train [39][3140/3239]	Time 0.273 (0.492)	Data Time 0.001 (0.012)	Loss 2.9843 (2.9204)	Entropy 0.66413 (0.66652)	Top-1 acc 50.781 (53.776)	Top-5 acc 75.781 (76.489)	lr 0.01904
Train [39][3150/3239]	Time 0.232 (0.492)	Data Time 0.001 (0.012)	Loss 2.8083 (2.9202)	Entropy 0.66411 (0.66652)	Top-1 acc 58.594 (53.784)	Top-5 acc 80.078 (76.492)	lr 0.01904
Train [39][3160/3239]	Time 0.239 (0.492)	Data Time 0.001 (0.012)	Loss 2.9043 (2.9205)	Entropy 0.66434 (0.66651)	Top-1 acc 55.469 (53.780)	Top-5 acc 73.828 (76.485)	lr 0.01904
Train [39][3170/3239]	Time 0.270 (0.492)	Data Time 0.001 (0.012)	Loss 2.9096 (2.9205)	Entropy 0.66454 (0.66650)	Top-1 acc 51.953 (53.779)	Top-5 acc 78.125 (76.486)	lr 0.01904
Train [39][3180/3239]	Time 0.231 (0.492)	Data Time 0.000 (0.012)	Loss 2.9088 (2.9205)	Entropy 0.66470 (0.66650)	Top-1 acc 51.953 (53.779)	Top-5 acc 78.906 (76.485)	lr 0.01904
Train [39][3190/3239]	Time 0.232 (0.491)	Data Time 0.000 (0.012)	Loss 2.9469 (2.9206)	Entropy 0.66482 (0.66649)	Top-1 acc 52.734 (53.779)	Top-5 acc 76.953 (76.482)	lr 0.01904
Train [39][3200/3239]	Time 0.226 (0.491)	Data Time 0.000 (0.012)	Loss 2.9415 (2.9206)	Entropy 0.66443 (0.66648)	Top-1 acc 54.688 (53.781)	Top-5 acc 76.172 (76.482)	lr 0.01903
Train [39][3210/3239]	Time 0.230 (0.491)	Data Time 0.000 (0.012)	Loss 3.3400 (2.9207)	Entropy 0.66446 (0.66648)	Top-1 acc 44.922 (53.778)	Top-5 acc 69.141 (76.482)	lr 0.01903
Train [39][3220/3239]	Time 0.231 (0.490)	Data Time 0.000 (0.012)	Loss 2.8549 (2.9206)	Entropy 0.66431 (0.66647)	Top-1 acc 55.859 (53.784)	Top-5 acc 79.688 (76.485)	lr 0.01903
Train [39][3230/3239]	Time 0.224 (0.490)	Data Time 0.000 (0.012)	Loss 3.1923 (2.9208)	Entropy 0.66408 (0.66646)	Top-1 acc 48.828 (53.775)	Top-5 acc 70.312 (76.478)	lr 0.01903
Train [39][3239/3239]	Time 0.766 (0.490)	Data Time 0.000 (0.012)	Loss 3.3055 (2.9211)	Entropy 0.66414 (0.66646)	Top-1 acc 45.679 (53.767)	Top-5 acc 69.136 (76.472)	lr 0.01903
==========Valid [39/120]	loss 1.634	top-1 acc 62.938 (62.938)	top-5 acc 84.323	Train top-1 53.767	top-5 76.472	Entropy 0.66414	Latency-None: 0.000ms	Flops: 539.76M
Train [40][0/3239]	Time 30.921 (30.921)	Data Time 29.794 (29.794)	Loss 2.9053 (2.9053)	Entropy 0.66413 (0.66413)	Top-1 acc 56.250 (56.250)	Top-5 acc 76.953 (76.953)	lr 0.01903
Train [40][10/3239]	Time 0.215 (3.284)	Data Time 0.001 (2.731)	Loss 2.8055 (2.8870)	Entropy 0.66441 (0.66424)	Top-1 acc 56.641 (54.439)	Top-5 acc 78.516 (77.770)	lr 0.01903
Train [40][20/3239]	Time 0.237 (1.930)	Data Time 0.001 (1.432)	Loss 2.9229 (2.9136)	Entropy 0.66460 (0.66436)	Top-1 acc 57.422 (53.850)	Top-5 acc 73.438 (76.618)	lr 0.01903
Train [40][30/3239]	Time 0.390 (2.444)	Data Time 0.004 (0.971)	Loss 2.9187 (2.9071)	Entropy 0.66472 (0.66442)	Top-1 acc 51.562 (53.957)	Top-5 acc 79.297 (77.167)	lr 0.01903
Train [40][40/3239]	Time 0.271 (1.967)	Data Time 0.002 (0.735)	Loss 2.9927 (2.9142)	Entropy 0.66484 (0.66450)	Top-1 acc 51.562 (53.925)	Top-5 acc 72.266 (76.820)	lr 0.01903
Train [40][50/3239]	Time 0.282 (1.671)	Data Time 0.002 (0.592)	Loss 3.0713 (2.9140)	Entropy 0.66479 (0.66455)	Top-1 acc 48.047 (53.975)	Top-5 acc 74.219 (76.700)	lr 0.01903
Train [40][60/3239]	Time 0.228 (1.467)	Data Time 0.001 (0.495)	Loss 2.7389 (2.9115)	Entropy 0.66474 (0.66458)	Top-1 acc 57.031 (53.932)	Top-5 acc 78.906 (76.627)	lr 0.01903
Train [40][70/3239]	Time 0.265 (1.326)	Data Time 0.002 (0.426)	Loss 2.9235 (2.9182)	Entropy 0.66497 (0.66462)	Top-1 acc 55.859 (53.763)	Top-5 acc 77.344 (76.540)	lr 0.01903
Train [40][80/3239]	Time 0.239 (1.219)	Data Time 0.001 (0.373)	Loss 3.0257 (2.9136)	Entropy 0.66523 (0.66468)	Top-1 acc 49.609 (53.844)	Top-5 acc 73.828 (76.606)	lr 0.01902
Train [40][90/3239]	Time 0.224 (1.134)	Data Time 0.001 (0.332)	Loss 2.8436 (2.9125)	Entropy 0.66477 (0.66471)	Top-1 acc 56.250 (54.044)	Top-5 acc 77.344 (76.520)	lr 0.01902
Train [40][100/3239]	Time 0.232 (1.064)	Data Time 0.001 (0.300)	Loss 2.7957 (2.9096)	Entropy 0.66448 (0.66471)	Top-1 acc 53.125 (53.995)	Top-5 acc 79.688 (76.667)	lr 0.01902
Train [40][110/3239]	Time 0.252 (1.006)	Data Time 0.001 (0.273)	Loss 2.5745 (2.9080)	Entropy 0.66429 (0.66468)	Top-1 acc 62.500 (54.015)	Top-5 acc 82.422 (76.658)	lr 0.01902
Train [40][120/3239]	Time 0.350 (0.959)	Data Time 0.001 (0.250)	Loss 2.9293 (2.9108)	Entropy 0.66434 (0.66466)	Top-1 acc 51.562 (53.977)	Top-5 acc 73.438 (76.575)	lr 0.01902
Train [40][130/3239]	Time 0.270 (0.919)	Data Time 0.001 (0.231)	Loss 2.9400 (2.9081)	Entropy 0.66450 (0.66463)	Top-1 acc 54.297 (54.097)	Top-5 acc 76.953 (76.613)	lr 0.01902
Train [40][140/3239]	Time 0.271 (0.884)	Data Time 0.002 (0.215)	Loss 3.0982 (2.9096)	Entropy 0.66460 (0.66462)	Top-1 acc 49.609 (54.072)	Top-5 acc 72.656 (76.601)	lr 0.01902
Train [40][150/3239]	Time 0.261 (0.856)	Data Time 0.001 (0.201)	Loss 2.8477 (2.9059)	Entropy 0.66497 (0.66463)	Top-1 acc 57.812 (54.261)	Top-5 acc 75.391 (76.645)	lr 0.01902
Train [40][160/3239]	Time 0.236 (0.830)	Data Time 0.001 (0.189)	Loss 2.8627 (2.9065)	Entropy 0.66481 (0.66464)	Top-1 acc 53.906 (54.229)	Top-5 acc 79.688 (76.635)	lr 0.01902
Train [40][170/3239]	Time 0.257 (0.808)	Data Time 0.002 (0.178)	Loss 2.8672 (2.9059)	Entropy 0.66531 (0.66467)	Top-1 acc 55.469 (54.247)	Top-5 acc 77.734 (76.674)	lr 0.01902
Train [40][180/3239]	Time 0.247 (0.786)	Data Time 0.002 (0.168)	Loss 2.8039 (2.9035)	Entropy 0.66547 (0.66470)	Top-1 acc 56.641 (54.308)	Top-5 acc 79.297 (76.739)	lr 0.01902
Train [40][190/3239]	Time 0.394 (0.769)	Data Time 0.002 (0.159)	Loss 3.1436 (2.9021)	Entropy 0.66559 (0.66475)	Top-1 acc 48.438 (54.344)	Top-5 acc 73.438 (76.802)	lr 0.01901
Train [40][200/3239]	Time 0.234 (0.753)	Data Time 0.001 (0.151)	Loss 2.8965 (2.9042)	Entropy 0.66543 (0.66478)	Top-1 acc 56.250 (54.307)	Top-5 acc 77.734 (76.803)	lr 0.01901
Train [40][210/3239]	Time 0.277 (0.738)	Data Time 0.001 (0.144)	Loss 2.8717 (2.9041)	Entropy 0.66568 (0.66482)	Top-1 acc 54.297 (54.336)	Top-5 acc 73.828 (76.794)	lr 0.01901
Train [40][220/3239]	Time 0.238 (0.725)	Data Time 0.001 (0.138)	Loss 2.9284 (2.9039)	Entropy 0.66567 (0.66486)	Top-1 acc 56.641 (54.353)	Top-5 acc 75.000 (76.801)	lr 0.01901
Train [40][230/3239]	Time 0.227 (0.713)	Data Time 0.001 (0.132)	Loss 3.1330 (2.9044)	Entropy 0.66575 (0.66489)	Top-1 acc 47.656 (54.327)	Top-5 acc 73.438 (76.782)	lr 0.01901
Train [40][240/3239]	Time 0.234 (0.701)	Data Time 0.001 (0.127)	Loss 2.9012 (2.9053)	Entropy 0.66567 (0.66493)	Top-1 acc 53.906 (54.294)	Top-5 acc 76.953 (76.759)	lr 0.01901
Train [40][250/3239]	Time 0.231 (0.690)	Data Time 0.001 (0.122)	Loss 2.9820 (2.9048)	Entropy 0.66555 (0.66496)	Top-1 acc 54.688 (54.325)	Top-5 acc 75.391 (76.746)	lr 0.01901
Train [40][260/3239]	Time 0.239 (0.681)	Data Time 0.001 (0.117)	Loss 2.8006 (2.9026)	Entropy 0.66564 (0.66498)	Top-1 acc 57.812 (54.406)	Top-5 acc 82.031 (76.820)	lr 0.01901
Train [40][270/3239]	Time 0.246 (0.672)	Data Time 0.001 (0.113)	Loss 2.7697 (2.9008)	Entropy 0.66551 (0.66501)	Top-1 acc 53.125 (54.437)	Top-5 acc 77.344 (76.826)	lr 0.01901
Train [40][280/3239]	Time 0.343 (0.663)	Data Time 0.001 (0.109)	Loss 2.9366 (2.9002)	Entropy 0.66530 (0.66502)	Top-1 acc 52.344 (54.412)	Top-5 acc 78.516 (76.884)	lr 0.01901
Train [40][290/3239]	Time 0.234 (0.655)	Data Time 0.001 (0.105)	Loss 2.9342 (2.9004)	Entropy 0.66533 (0.66503)	Top-1 acc 53.516 (54.391)	Top-5 acc 76.953 (76.890)	lr 0.01901
Train [40][300/3239]	Time 0.229 (0.647)	Data Time 0.001 (0.102)	Loss 3.0268 (2.8994)	Entropy 0.66532 (0.66505)	Top-1 acc 47.266 (54.388)	Top-5 acc 73.047 (76.906)	lr 0.01901
Train [40][310/3239]	Time 0.265 (0.641)	Data Time 0.002 (0.098)	Loss 2.8644 (2.8991)	Entropy 0.66558 (0.66505)	Top-1 acc 55.078 (54.373)	Top-5 acc 78.906 (76.895)	lr 0.01900
Train [40][320/3239]	Time 0.251 (0.634)	Data Time 0.001 (0.096)	Loss 2.7691 (2.9008)	Entropy 0.66498 (0.66506)	Top-1 acc 55.078 (54.333)	Top-5 acc 80.469 (76.862)	lr 0.01900
Train [40][330/3239]	Time 0.238 (0.628)	Data Time 0.001 (0.093)	Loss 2.7580 (2.9007)	Entropy 0.66505 (0.66506)	Top-1 acc 55.469 (54.364)	Top-5 acc 79.297 (76.873)	lr 0.01900
Train [40][340/3239]	Time 0.246 (0.623)	Data Time 0.001 (0.090)	Loss 2.9621 (2.9012)	Entropy 0.66499 (0.66506)	Top-1 acc 54.688 (54.336)	Top-5 acc 77.734 (76.860)	lr 0.01900
Train [40][350/3239]	Time 0.324 (0.617)	Data Time 0.001 (0.088)	Loss 2.8246 (2.9029)	Entropy 0.66477 (0.66505)	Top-1 acc 55.078 (54.292)	Top-5 acc 78.906 (76.813)	lr 0.01900
Train [40][360/3239]	Time 0.239 (0.612)	Data Time 0.001 (0.085)	Loss 2.9682 (2.9052)	Entropy 0.66478 (0.66505)	Top-1 acc 54.297 (54.232)	Top-5 acc 74.609 (76.746)	lr 0.01900
Train [40][370/3239]	Time 0.237 (0.607)	Data Time 0.001 (0.083)	Loss 2.7641 (2.9036)	Entropy 0.66439 (0.66504)	Top-1 acc 57.031 (54.271)	Top-5 acc 80.078 (76.779)	lr 0.01900
Train [40][380/3239]	Time 0.245 (0.602)	Data Time 0.001 (0.081)	Loss 2.8779 (2.9037)	Entropy 0.66426 (0.66501)	Top-1 acc 53.906 (54.245)	Top-5 acc 74.609 (76.772)	lr 0.01900
Train [40][390/3239]	Time 0.232 (0.597)	Data Time 0.001 (0.079)	Loss 2.6525 (2.9026)	Entropy 0.66408 (0.66499)	Top-1 acc 62.891 (54.282)	Top-5 acc 83.203 (76.800)	lr 0.01900
Train [40][400/3239]	Time 0.266 (0.594)	Data Time 0.002 (0.077)	Loss 2.8401 (2.9025)	Entropy 0.66414 (0.66497)	Top-1 acc 51.953 (54.271)	Top-5 acc 80.859 (76.815)	lr 0.01900
Train [40][410/3239]	Time 0.245 (0.590)	Data Time 0.001 (0.075)	Loss 2.7466 (2.9036)	Entropy 0.66429 (0.66495)	Top-1 acc 55.469 (54.223)	Top-5 acc 82.422 (76.781)	lr 0.01900
Train [40][420/3239]	Time 0.277 (0.586)	Data Time 0.003 (0.073)	Loss 2.9540 (2.9037)	Entropy 0.66457 (0.66494)	Top-1 acc 53.516 (54.213)	Top-5 acc 75.000 (76.768)	lr 0.01900
Train [40][430/3239]	Time 0.233 (0.582)	Data Time 0.001 (0.072)	Loss 2.7214 (2.9035)	Entropy 0.66468 (0.66493)	Top-1 acc 61.719 (54.246)	Top-5 acc 78.906 (76.773)	lr 0.01899
Train [40][440/3239]	Time 0.299 (0.578)	Data Time 0.001 (0.070)	Loss 2.9461 (2.9053)	Entropy 0.66502 (0.66492)	Top-1 acc 51.562 (54.176)	Top-5 acc 75.000 (76.741)	lr 0.01899
Train [40][450/3239]	Time 0.242 (0.575)	Data Time 0.001 (0.068)	Loss 3.0069 (2.9058)	Entropy 0.66539 (0.66493)	Top-1 acc 51.562 (54.153)	Top-5 acc 74.609 (76.742)	lr 0.01899
Train [40][460/3239]	Time 0.245 (0.572)	Data Time 0.001 (0.067)	Loss 2.9754 (2.9051)	Entropy 0.66545 (0.66494)	Top-1 acc 53.516 (54.164)	Top-5 acc 75.781 (76.763)	lr 0.01899
Train [40][470/3239]	Time 0.220 (0.569)	Data Time 0.001 (0.066)	Loss 2.9028 (2.9062)	Entropy 0.66555 (0.66495)	Top-1 acc 53.125 (54.138)	Top-5 acc 75.391 (76.749)	lr 0.01899
Train [40][480/3239]	Time 0.229 (0.566)	Data Time 0.001 (0.064)	Loss 3.0423 (2.9070)	Entropy 0.66526 (0.66496)	Top-1 acc 53.125 (54.127)	Top-5 acc 72.656 (76.735)	lr 0.01899
Train [40][490/3239]	Time 0.246 (0.563)	Data Time 0.001 (0.063)	Loss 2.9581 (2.9064)	Entropy 0.66507 (0.66497)	Top-1 acc 51.172 (54.154)	Top-5 acc 74.219 (76.743)	lr 0.01899
Train [40][500/3239]	Time 0.232 (0.560)	Data Time 0.001 (0.062)	Loss 3.1325 (2.9056)	Entropy 0.66513 (0.66497)	Top-1 acc 48.047 (54.148)	Top-5 acc 70.703 (76.759)	lr 0.01899
Train [40][510/3239]	Time 0.330 (0.557)	Data Time 0.001 (0.061)	Loss 2.7901 (2.9044)	Entropy 0.66522 (0.66498)	Top-1 acc 57.422 (54.183)	Top-5 acc 80.859 (76.798)	lr 0.01899
Train [40][520/3239]	Time 0.248 (0.554)	Data Time 0.001 (0.059)	Loss 3.0671 (2.9044)	Entropy 0.66518 (0.66498)	Top-1 acc 50.781 (54.193)	Top-5 acc 75.391 (76.788)	lr 0.01899
Train [40][530/3239]	Time 0.241 (0.552)	Data Time 0.001 (0.058)	Loss 2.8841 (2.9039)	Entropy 0.66492 (0.66498)	Top-1 acc 48.828 (54.198)	Top-5 acc 77.344 (76.802)	lr 0.01899
Train [40][540/3239]	Time 0.234 (0.550)	Data Time 0.001 (0.057)	Loss 2.9119 (2.9031)	Entropy 0.66518 (0.66499)	Top-1 acc 51.562 (54.199)	Top-5 acc 76.562 (76.813)	lr 0.01898
Train [40][550/3239]	Time 0.235 (0.548)	Data Time 0.001 (0.056)	Loss 3.1456 (2.9028)	Entropy 0.66560 (0.66499)	Top-1 acc 49.219 (54.221)	Top-5 acc 69.922 (76.813)	lr 0.01898
Train [40][560/3239]	Time 0.235 (0.545)	Data Time 0.001 (0.055)	Loss 2.8674 (2.9023)	Entropy 0.66530 (0.66500)	Top-1 acc 58.203 (54.252)	Top-5 acc 79.688 (76.822)	lr 0.01898
Train [40][570/3239]	Time 0.271 (0.544)	Data Time 0.002 (0.054)	Loss 3.0562 (2.9023)	Entropy 0.66549 (0.66501)	Top-1 acc 47.656 (54.225)	Top-5 acc 73.438 (76.830)	lr 0.01898
Train [40][580/3239]	Time 0.357 (0.542)	Data Time 0.001 (0.053)	Loss 2.9159 (2.9025)	Entropy 0.66534 (0.66501)	Top-1 acc 53.125 (54.204)	Top-5 acc 78.125 (76.844)	lr 0.01898
Train [40][590/3239]	Time 0.230 (0.540)	Data Time 0.001 (0.053)	Loss 2.8565 (2.9005)	Entropy 0.66488 (0.66502)	Top-1 acc 57.422 (54.237)	Top-5 acc 78.125 (76.886)	lr 0.01898
Train [40][600/3239]	Time 0.234 (0.538)	Data Time 0.001 (0.052)	Loss 2.8687 (2.9014)	Entropy 0.66467 (0.66502)	Top-1 acc 54.297 (54.219)	Top-5 acc 76.172 (76.858)	lr 0.01898
Train [40][610/3239]	Time 0.239 (0.536)	Data Time 0.001 (0.051)	Loss 3.0771 (2.9015)	Entropy 0.66460 (0.66501)	Top-1 acc 51.172 (54.199)	Top-5 acc 71.484 (76.858)	lr 0.01898
Train [40][620/3239]	Time 0.233 (0.534)	Data Time 0.001 (0.050)	Loss 2.6622 (2.9003)	Entropy 0.66473 (0.66500)	Top-1 acc 55.469 (54.221)	Top-5 acc 82.422 (76.884)	lr 0.01898
Train [40][630/3239]	Time 0.229 (0.532)	Data Time 0.001 (0.049)	Loss 2.7803 (2.8999)	Entropy 0.66434 (0.66500)	Top-1 acc 54.688 (54.229)	Top-5 acc 80.078 (76.884)	lr 0.01898
Train [40][640/3239]	Time 0.252 (0.531)	Data Time 0.001 (0.049)	Loss 2.9467 (2.8995)	Entropy 0.66450 (0.66499)	Top-1 acc 49.219 (54.232)	Top-5 acc 77.734 (76.893)	lr 0.01898
Train [40][650/3239]	Time 0.243 (0.529)	Data Time 0.001 (0.048)	Loss 2.8792 (2.8996)	Entropy 0.66439 (0.66498)	Top-1 acc 52.734 (54.227)	Top-5 acc 79.297 (76.893)	lr 0.01898
Train [40][660/3239]	Time 0.225 (0.528)	Data Time 0.001 (0.047)	Loss 3.0521 (2.8997)	Entropy 0.66350 (0.66497)	Top-1 acc 47.266 (54.214)	Top-5 acc 70.703 (76.899)	lr 0.01897
Train [40][670/3239]	Time 0.338 (0.526)	Data Time 0.001 (0.047)	Loss 2.8638 (2.8991)	Entropy 0.66371 (0.66495)	Top-1 acc 54.297 (54.227)	Top-5 acc 77.734 (76.914)	lr 0.01897
Train [40][680/3239]	Time 0.311 (0.568)	Data Time 0.006 (0.046)	Loss 2.8764 (2.8987)	Entropy 0.66351 (0.66493)	Top-1 acc 55.859 (54.226)	Top-5 acc 75.781 (76.919)	lr 0.01897
Train [40][690/3239]	Time 0.248 (0.568)	Data Time 0.002 (0.045)	Loss 2.8271 (2.8982)	Entropy 0.66320 (0.66490)	Top-1 acc 50.391 (54.245)	Top-5 acc 80.078 (76.938)	lr 0.01897
Train [40][700/3239]	Time 0.250 (0.566)	Data Time 0.001 (0.045)	Loss 2.8771 (2.8982)	Entropy 0.66363 (0.66488)	Top-1 acc 52.344 (54.239)	Top-5 acc 78.125 (76.940)	lr 0.01897
Train [40][710/3239]	Time 0.247 (0.565)	Data Time 0.001 (0.044)	Loss 2.7582 (2.8981)	Entropy 0.66374 (0.66486)	Top-1 acc 60.156 (54.244)	Top-5 acc 81.641 (76.936)	lr 0.01897
Train [40][720/3239]	Time 0.268 (0.563)	Data Time 0.001 (0.044)	Loss 2.9215 (2.8981)	Entropy 0.66408 (0.66485)	Top-1 acc 52.344 (54.248)	Top-5 acc 76.172 (76.934)	lr 0.01897
Train [40][730/3239]	Time 0.235 (0.561)	Data Time 0.001 (0.043)	Loss 3.0399 (2.8974)	Entropy 0.66435 (0.66484)	Top-1 acc 51.953 (54.272)	Top-5 acc 74.609 (76.937)	lr 0.01897
Train [40][740/3239]	Time 0.357 (0.559)	Data Time 0.001 (0.042)	Loss 2.8352 (2.8973)	Entropy 0.66433 (0.66483)	Top-1 acc 61.328 (54.294)	Top-5 acc 79.297 (76.943)	lr 0.01897
Train [40][750/3239]	Time 0.271 (0.558)	Data Time 0.001 (0.042)	Loss 3.0906 (2.8977)	Entropy 0.66461 (0.66483)	Top-1 acc 51.172 (54.296)	Top-5 acc 75.000 (76.932)	lr 0.01897
Train [40][760/3239]	Time 0.233 (0.556)	Data Time 0.001 (0.041)	Loss 2.7631 (2.8974)	Entropy 0.66457 (0.66482)	Top-1 acc 55.078 (54.295)	Top-5 acc 79.297 (76.940)	lr 0.01897
Train [40][770/3239]	Time 0.265 (0.555)	Data Time 0.002 (0.041)	Loss 2.8560 (2.8966)	Entropy 0.66469 (0.66482)	Top-1 acc 55.469 (54.330)	Top-5 acc 78.906 (76.958)	lr 0.01896
Train [40][780/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.040)	Loss 2.9370 (2.8971)	Entropy 0.66477 (0.66482)	Top-1 acc 52.734 (54.321)	Top-5 acc 77.734 (76.942)	lr 0.01896
Train [40][790/3239]	Time 0.268 (0.552)	Data Time 0.001 (0.040)	Loss 3.1054 (2.8979)	Entropy 0.66456 (0.66482)	Top-1 acc 50.391 (54.313)	Top-5 acc 73.047 (76.926)	lr 0.01896
Train [40][800/3239]	Time 0.231 (0.550)	Data Time 0.001 (0.039)	Loss 2.9982 (2.8983)	Entropy 0.66441 (0.66481)	Top-1 acc 56.641 (54.309)	Top-5 acc 76.172 (76.922)	lr 0.01896
Train [40][810/3239]	Time 0.282 (0.548)	Data Time 0.002 (0.039)	Loss 3.3853 (2.8991)	Entropy 0.66422 (0.66481)	Top-1 acc 44.531 (54.307)	Top-5 acc 69.141 (76.908)	lr 0.01896
Train [40][820/3239]	Time 0.230 (0.547)	Data Time 0.001 (0.038)	Loss 2.9239 (2.8990)	Entropy 0.66436 (0.66480)	Top-1 acc 55.469 (54.313)	Top-5 acc 76.172 (76.911)	lr 0.01896
Train [40][830/3239]	Time 0.326 (0.545)	Data Time 0.001 (0.038)	Loss 2.7930 (2.8986)	Entropy 0.66430 (0.66479)	Top-1 acc 55.859 (54.329)	Top-5 acc 79.297 (76.914)	lr 0.01896
Train [40][840/3239]	Time 0.273 (0.544)	Data Time 0.002 (0.038)	Loss 2.7709 (2.8988)	Entropy 0.66449 (0.66479)	Top-1 acc 58.203 (54.328)	Top-5 acc 81.250 (76.907)	lr 0.01896
Train [40][850/3239]	Time 0.236 (0.542)	Data Time 0.001 (0.037)	Loss 2.8702 (2.8989)	Entropy 0.66474 (0.66479)	Top-1 acc 55.078 (54.317)	Top-5 acc 75.000 (76.900)	lr 0.01896
Train [40][860/3239]	Time 0.232 (0.541)	Data Time 0.001 (0.037)	Loss 2.9629 (2.8988)	Entropy 0.66473 (0.66478)	Top-1 acc 53.516 (54.324)	Top-5 acc 76.172 (76.906)	lr 0.01896
Train [40][870/3239]	Time 0.232 (0.539)	Data Time 0.001 (0.036)	Loss 2.8358 (2.8981)	Entropy 0.66447 (0.66478)	Top-1 acc 55.859 (54.338)	Top-5 acc 79.297 (76.929)	lr 0.01896
Train [40][880/3239]	Time 0.303 (0.538)	Data Time 0.001 (0.036)	Loss 3.0202 (2.8982)	Entropy 0.66396 (0.66478)	Top-1 acc 51.172 (54.333)	Top-5 acc 75.000 (76.928)	lr 0.01896
Train [40][890/3239]	Time 0.271 (0.537)	Data Time 0.001 (0.036)	Loss 2.9914 (2.8986)	Entropy 0.66411 (0.66477)	Top-1 acc 49.609 (54.316)	Top-5 acc 76.172 (76.935)	lr 0.01895
Train [40][900/3239]	Time 0.330 (0.536)	Data Time 0.001 (0.035)	Loss 2.7605 (2.8979)	Entropy 0.66417 (0.66476)	Top-1 acc 53.516 (54.331)	Top-5 acc 80.859 (76.960)	lr 0.01895
Train [40][910/3239]	Time 0.235 (0.534)	Data Time 0.001 (0.035)	Loss 2.6394 (2.8972)	Entropy 0.66397 (0.66475)	Top-1 acc 59.766 (54.340)	Top-5 acc 82.031 (76.980)	lr 0.01895
Train [40][920/3239]	Time 0.243 (0.533)	Data Time 0.001 (0.034)	Loss 3.1352 (2.8977)	Entropy 0.66412 (0.66475)	Top-1 acc 48.047 (54.331)	Top-5 acc 69.531 (76.961)	lr 0.01895
Train [40][930/3239]	Time 0.258 (0.532)	Data Time 0.001 (0.034)	Loss 2.9805 (2.8980)	Entropy 0.66425 (0.66474)	Top-1 acc 50.391 (54.311)	Top-5 acc 75.000 (76.956)	lr 0.01895
Train [40][940/3239]	Time 0.245 (0.531)	Data Time 0.001 (0.034)	Loss 2.8585 (2.8982)	Entropy 0.66429 (0.66474)	Top-1 acc 55.078 (54.306)	Top-5 acc 76.953 (76.945)	lr 0.01895
Train [40][950/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.033)	Loss 3.0438 (2.8985)	Entropy 0.66447 (0.66473)	Top-1 acc 51.953 (54.292)	Top-5 acc 71.094 (76.942)	lr 0.01895
Train [40][960/3239]	Time 0.249 (0.529)	Data Time 0.001 (0.033)	Loss 2.9899 (2.8986)	Entropy 0.66495 (0.66473)	Top-1 acc 53.125 (54.292)	Top-5 acc 74.219 (76.936)	lr 0.01895
Train [40][970/3239]	Time 0.281 (0.528)	Data Time 0.001 (0.033)	Loss 2.8106 (2.8986)	Entropy 0.66501 (0.66473)	Top-1 acc 58.594 (54.290)	Top-5 acc 78.906 (76.928)	lr 0.01895
Train [40][980/3239]	Time 0.262 (0.527)	Data Time 0.001 (0.032)	Loss 2.8878 (2.8984)	Entropy 0.66525 (0.66474)	Top-1 acc 50.391 (54.288)	Top-5 acc 78.125 (76.934)	lr 0.01895
Train [40][990/3239]	Time 0.256 (0.525)	Data Time 0.001 (0.032)	Loss 2.8880 (2.8977)	Entropy 0.66474 (0.66474)	Top-1 acc 53.125 (54.316)	Top-5 acc 76.562 (76.947)	lr 0.01895
Train [40][1000/3239]	Time 0.238 (0.524)	Data Time 0.001 (0.032)	Loss 2.7681 (2.8978)	Entropy 0.66498 (0.66474)	Top-1 acc 54.297 (54.309)	Top-5 acc 81.641 (76.946)	lr 0.01894
Train [40][1010/3239]	Time 0.263 (0.523)	Data Time 0.001 (0.031)	Loss 2.7745 (2.8973)	Entropy 0.66494 (0.66474)	Top-1 acc 55.078 (54.314)	Top-5 acc 79.297 (76.954)	lr 0.01894
Train [40][1020/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.031)	Loss 2.7733 (2.8977)	Entropy 0.66536 (0.66475)	Top-1 acc 56.641 (54.316)	Top-5 acc 77.344 (76.949)	lr 0.01894
Train [40][1030/3239]	Time 0.233 (0.521)	Data Time 0.001 (0.031)	Loss 3.2600 (2.8988)	Entropy 0.66525 (0.66475)	Top-1 acc 43.750 (54.289)	Top-5 acc 69.922 (76.922)	lr 0.01894
Train [40][1040/3239]	Time 0.245 (0.520)	Data Time 0.001 (0.031)	Loss 2.9646 (2.8995)	Entropy 0.66552 (0.66476)	Top-1 acc 54.297 (54.278)	Top-5 acc 74.609 (76.896)	lr 0.01894
Train [40][1050/3239]	Time 0.218 (0.519)	Data Time 0.001 (0.030)	Loss 3.0530 (2.9002)	Entropy 0.66565 (0.66477)	Top-1 acc 46.875 (54.259)	Top-5 acc 75.000 (76.877)	lr 0.01894
Train [40][1060/3239]	Time 0.360 (0.518)	Data Time 0.001 (0.030)	Loss 2.9999 (2.8999)	Entropy 0.66558 (0.66477)	Top-1 acc 52.344 (54.271)	Top-5 acc 75.000 (76.881)	lr 0.01894
Train [40][1070/3239]	Time 0.229 (0.517)	Data Time 0.001 (0.030)	Loss 2.9966 (2.9002)	Entropy 0.66505 (0.66478)	Top-1 acc 53.906 (54.265)	Top-5 acc 74.609 (76.866)	lr 0.01894
Train [40][1080/3239]	Time 0.256 (0.516)	Data Time 0.001 (0.030)	Loss 2.8450 (2.9001)	Entropy 0.66533 (0.66478)	Top-1 acc 55.078 (54.269)	Top-5 acc 75.781 (76.871)	lr 0.01894
Train [40][1090/3239]	Time 0.225 (0.515)	Data Time 0.001 (0.029)	Loss 3.0383 (2.9001)	Entropy 0.66492 (0.66479)	Top-1 acc 54.688 (54.273)	Top-5 acc 74.219 (76.871)	lr 0.01894
Train [40][1100/3239]	Time 0.223 (0.514)	Data Time 0.001 (0.029)	Loss 2.7917 (2.9003)	Entropy 0.66530 (0.66479)	Top-1 acc 56.641 (54.272)	Top-5 acc 78.516 (76.867)	lr 0.01894
Train [40][1110/3239]	Time 0.248 (0.513)	Data Time 0.001 (0.029)	Loss 2.8948 (2.9006)	Entropy 0.66496 (0.66479)	Top-1 acc 54.688 (54.265)	Top-5 acc 75.000 (76.863)	lr 0.01894
Train [40][1120/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.029)	Loss 2.7276 (2.9008)	Entropy 0.66484 (0.66479)	Top-1 acc 56.641 (54.265)	Top-5 acc 81.641 (76.857)	lr 0.01893
Train [40][1130/3239]	Time 0.354 (0.511)	Data Time 0.001 (0.028)	Loss 2.7683 (2.9004)	Entropy 0.66464 (0.66479)	Top-1 acc 58.203 (54.269)	Top-5 acc 79.297 (76.870)	lr 0.01893
Train [40][1140/3239]	Time 0.231 (0.510)	Data Time 0.001 (0.028)	Loss 2.7782 (2.9003)	Entropy 0.66414 (0.66479)	Top-1 acc 57.031 (54.276)	Top-5 acc 77.734 (76.872)	lr 0.01893
Train [40][1150/3239]	Time 0.264 (0.509)	Data Time 0.001 (0.028)	Loss 2.6097 (2.8998)	Entropy 0.66425 (0.66479)	Top-1 acc 60.938 (54.284)	Top-5 acc 82.031 (76.884)	lr 0.01893
Train [40][1160/3239]	Time 0.236 (0.509)	Data Time 0.001 (0.028)	Loss 2.6553 (2.8998)	Entropy 0.66429 (0.66478)	Top-1 acc 60.547 (54.279)	Top-5 acc 83.203 (76.884)	lr 0.01893
Train [40][1170/3239]	Time 0.223 (0.508)	Data Time 0.001 (0.027)	Loss 2.9520 (2.8999)	Entropy 0.66400 (0.66477)	Top-1 acc 53.516 (54.281)	Top-5 acc 73.828 (76.872)	lr 0.01893
Train [40][1180/3239]	Time 0.223 (0.507)	Data Time 0.001 (0.027)	Loss 3.1384 (2.9002)	Entropy 0.66397 (0.66477)	Top-1 acc 47.266 (54.275)	Top-5 acc 73.438 (76.870)	lr 0.01893
Train [40][1190/3239]	Time 0.229 (0.506)	Data Time 0.001 (0.027)	Loss 2.9003 (2.9005)	Entropy 0.66404 (0.66476)	Top-1 acc 57.422 (54.263)	Top-5 acc 75.391 (76.862)	lr 0.01893
Train [40][1200/3239]	Time 0.229 (0.505)	Data Time 0.001 (0.027)	Loss 2.8771 (2.9005)	Entropy 0.66406 (0.66475)	Top-1 acc 55.859 (54.266)	Top-5 acc 75.000 (76.863)	lr 0.01893
Train [40][1210/3239]	Time 0.228 (0.504)	Data Time 0.001 (0.027)	Loss 2.6764 (2.9007)	Entropy 0.66455 (0.66475)	Top-1 acc 62.109 (54.268)	Top-5 acc 82.812 (76.854)	lr 0.01893
Train [40][1220/3239]	Time 0.378 (0.504)	Data Time 0.001 (0.026)	Loss 2.8965 (2.9008)	Entropy 0.66494 (0.66475)	Top-1 acc 53.906 (54.267)	Top-5 acc 78.125 (76.855)	lr 0.01893
Train [40][1230/3239]	Time 0.226 (0.503)	Data Time 0.001 (0.026)	Loss 2.9710 (2.9009)	Entropy 0.66483 (0.66475)	Top-1 acc 53.516 (54.265)	Top-5 acc 77.734 (76.851)	lr 0.01892
Train [40][1240/3239]	Time 0.226 (0.502)	Data Time 0.001 (0.026)	Loss 3.2037 (2.9014)	Entropy 0.66473 (0.66475)	Top-1 acc 46.094 (54.250)	Top-5 acc 70.312 (76.836)	lr 0.01892
Train [40][1250/3239]	Time 0.237 (0.501)	Data Time 0.001 (0.026)	Loss 2.7159 (2.9009)	Entropy 0.66482 (0.66475)	Top-1 acc 57.031 (54.270)	Top-5 acc 81.250 (76.849)	lr 0.01892
Train [40][1260/3239]	Time 0.224 (0.501)	Data Time 0.001 (0.026)	Loss 2.9606 (2.9011)	Entropy 0.66481 (0.66475)	Top-1 acc 55.859 (54.264)	Top-5 acc 75.391 (76.851)	lr 0.01892
Train [40][1270/3239]	Time 0.238 (0.500)	Data Time 0.001 (0.025)	Loss 2.7825 (2.9009)	Entropy 0.66446 (0.66475)	Top-1 acc 58.203 (54.266)	Top-5 acc 81.250 (76.850)	lr 0.01892
Train [40][1280/3239]	Time 0.246 (0.499)	Data Time 0.002 (0.025)	Loss 2.8207 (2.9008)	Entropy 0.66444 (0.66475)	Top-1 acc 55.469 (54.264)	Top-5 acc 78.125 (76.854)	lr 0.01892
Train [40][1290/3239]	Time 0.357 (0.499)	Data Time 0.002 (0.025)	Loss 2.8993 (2.9011)	Entropy 0.66425 (0.66475)	Top-1 acc 57.812 (54.266)	Top-5 acc 78.516 (76.851)	lr 0.01892
Train [40][1300/3239]	Time 0.226 (0.498)	Data Time 0.001 (0.025)	Loss 2.9264 (2.9008)	Entropy 0.66426 (0.66474)	Top-1 acc 52.344 (54.273)	Top-5 acc 73.438 (76.846)	lr 0.01892
Train [40][1310/3239]	Time 0.226 (0.497)	Data Time 0.001 (0.025)	Loss 2.8763 (2.9009)	Entropy 0.66424 (0.66474)	Top-1 acc 53.906 (54.272)	Top-5 acc 76.172 (76.842)	lr 0.01892
Train [40][1320/3239]	Time 0.284 (0.497)	Data Time 0.001 (0.025)	Loss 3.1724 (2.9012)	Entropy 0.66383 (0.66473)	Top-1 acc 45.703 (54.258)	Top-5 acc 71.484 (76.841)	lr 0.01892
Train [40][1330/3239]	Time 0.233 (0.496)	Data Time 0.001 (0.024)	Loss 2.9161 (2.9018)	Entropy 0.66365 (0.66473)	Top-1 acc 53.516 (54.243)	Top-5 acc 76.172 (76.829)	lr 0.01892
Train [40][1340/3239]	Time 0.296 (0.521)	Data Time 0.002 (0.024)	Loss 3.1434 (2.9018)	Entropy 0.66373 (0.66472)	Top-1 acc 49.219 (54.241)	Top-5 acc 73.047 (76.827)	lr 0.01892
Train [40][1350/3239]	Time 0.237 (0.521)	Data Time 0.002 (0.024)	Loss 2.9114 (2.9021)	Entropy 0.66367 (0.66471)	Top-1 acc 52.734 (54.237)	Top-5 acc 77.344 (76.822)	lr 0.01891
Train [40][1360/3239]	Time 0.273 (0.520)	Data Time 0.002 (0.024)	Loss 2.6286 (2.9012)	Entropy 0.66350 (0.66470)	Top-1 acc 62.891 (54.257)	Top-5 acc 84.766 (76.836)	lr 0.01891
Train [40][1370/3239]	Time 0.234 (0.519)	Data Time 0.001 (0.024)	Loss 2.9212 (2.9016)	Entropy 0.66313 (0.66469)	Top-1 acc 49.219 (54.244)	Top-5 acc 76.953 (76.829)	lr 0.01891
Train [40][1380/3239]	Time 0.327 (0.519)	Data Time 0.001 (0.024)	Loss 3.0655 (2.9016)	Entropy 0.66334 (0.66468)	Top-1 acc 48.047 (54.243)	Top-5 acc 75.391 (76.829)	lr 0.01891
Train [40][1390/3239]	Time 0.242 (0.518)	Data Time 0.001 (0.023)	Loss 3.1241 (2.9021)	Entropy 0.66331 (0.66467)	Top-1 acc 49.219 (54.229)	Top-5 acc 74.219 (76.820)	lr 0.01891
Train [40][1400/3239]	Time 0.278 (0.517)	Data Time 0.001 (0.023)	Loss 2.8431 (2.9018)	Entropy 0.66318 (0.66466)	Top-1 acc 55.469 (54.229)	Top-5 acc 74.219 (76.818)	lr 0.01891
Train [40][1410/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.023)	Loss 3.0608 (2.9024)	Entropy 0.66308 (0.66465)	Top-1 acc 54.688 (54.223)	Top-5 acc 73.828 (76.806)	lr 0.01891
Train [40][1420/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.023)	Loss 2.7488 (2.9021)	Entropy 0.66348 (0.66464)	Top-1 acc 56.641 (54.233)	Top-5 acc 79.688 (76.812)	lr 0.01891
Train [40][1430/3239]	Time 0.242 (0.516)	Data Time 0.001 (0.023)	Loss 2.6666 (2.9021)	Entropy 0.66366 (0.66464)	Top-1 acc 62.500 (54.233)	Top-5 acc 80.078 (76.805)	lr 0.01891
Train [40][1440/3239]	Time 0.239 (0.515)	Data Time 0.001 (0.023)	Loss 2.7616 (2.9027)	Entropy 0.66352 (0.66463)	Top-1 acc 55.469 (54.213)	Top-5 acc 79.297 (76.794)	lr 0.01891
Train [40][1450/3239]	Time 0.364 (0.514)	Data Time 0.001 (0.022)	Loss 3.0593 (2.9032)	Entropy 0.66373 (0.66462)	Top-1 acc 49.609 (54.200)	Top-5 acc 72.656 (76.779)	lr 0.01891
Train [40][1460/3239]	Time 0.239 (0.514)	Data Time 0.001 (0.022)	Loss 2.9388 (2.9036)	Entropy 0.66402 (0.66462)	Top-1 acc 53.125 (54.192)	Top-5 acc 78.906 (76.776)	lr 0.01891
Train [40][1470/3239]	Time 0.265 (0.513)	Data Time 0.001 (0.022)	Loss 2.8485 (2.9035)	Entropy 0.66404 (0.66461)	Top-1 acc 57.422 (54.198)	Top-5 acc 75.781 (76.777)	lr 0.01890
Train [40][1480/3239]	Time 0.272 (0.512)	Data Time 0.001 (0.022)	Loss 2.8411 (2.9036)	Entropy 0.66425 (0.66461)	Top-1 acc 52.734 (54.189)	Top-5 acc 77.344 (76.776)	lr 0.01890
Train [40][1490/3239]	Time 0.235 (0.512)	Data Time 0.001 (0.022)	Loss 2.8602 (2.9032)	Entropy 0.66417 (0.66461)	Top-1 acc 53.125 (54.192)	Top-5 acc 76.953 (76.786)	lr 0.01890
Train [40][1500/3239]	Time 0.270 (0.511)	Data Time 0.001 (0.022)	Loss 2.6915 (2.9035)	Entropy 0.66399 (0.66460)	Top-1 acc 56.641 (54.190)	Top-5 acc 82.031 (76.779)	lr 0.01890
Train [40][1510/3239]	Time 0.245 (0.510)	Data Time 0.001 (0.022)	Loss 3.1237 (2.9040)	Entropy 0.66396 (0.66460)	Top-1 acc 50.391 (54.181)	Top-5 acc 71.875 (76.767)	lr 0.01890
Train [40][1520/3239]	Time 0.235 (0.510)	Data Time 0.001 (0.022)	Loss 2.9849 (2.9039)	Entropy 0.66395 (0.66459)	Top-1 acc 52.734 (54.183)	Top-5 acc 76.953 (76.774)	lr 0.01890
Train [40][1530/3239]	Time 0.233 (0.509)	Data Time 0.001 (0.021)	Loss 2.8508 (2.9041)	Entropy 0.66395 (0.66459)	Top-1 acc 55.078 (54.179)	Top-5 acc 78.516 (76.773)	lr 0.01890
Train [40][1540/3239]	Time 0.393 (0.509)	Data Time 0.002 (0.021)	Loss 3.0794 (2.9039)	Entropy 0.66396 (0.66459)	Top-1 acc 50.781 (54.177)	Top-5 acc 75.391 (76.778)	lr 0.01890
Train [40][1550/3239]	Time 0.225 (0.508)	Data Time 0.001 (0.021)	Loss 3.0531 (2.9038)	Entropy 0.66422 (0.66458)	Top-1 acc 51.562 (54.180)	Top-5 acc 74.609 (76.778)	lr 0.01890
Train [40][1560/3239]	Time 0.242 (0.508)	Data Time 0.001 (0.021)	Loss 3.0644 (2.9041)	Entropy 0.66430 (0.66458)	Top-1 acc 50.391 (54.177)	Top-5 acc 74.609 (76.774)	lr 0.01890
Train [40][1570/3239]	Time 0.261 (0.507)	Data Time 0.001 (0.021)	Loss 2.9681 (2.9041)	Entropy 0.66437 (0.66458)	Top-1 acc 50.391 (54.176)	Top-5 acc 72.656 (76.774)	lr 0.01890
Train [40][1580/3239]	Time 0.293 (0.507)	Data Time 0.003 (0.021)	Loss 2.9735 (2.9042)	Entropy 0.66424 (0.66458)	Top-1 acc 50.391 (54.177)	Top-5 acc 75.391 (76.773)	lr 0.01889
Train [40][1590/3239]	Time 0.233 (0.506)	Data Time 0.001 (0.021)	Loss 3.2091 (2.9043)	Entropy 0.66417 (0.66457)	Top-1 acc 46.484 (54.174)	Top-5 acc 69.531 (76.768)	lr 0.01889
Train [40][1600/3239]	Time 0.233 (0.505)	Data Time 0.001 (0.021)	Loss 2.9591 (2.9046)	Entropy 0.66406 (0.66457)	Top-1 acc 53.516 (54.163)	Top-5 acc 75.391 (76.763)	lr 0.01889
Train [40][1610/3239]	Time 0.320 (0.505)	Data Time 0.001 (0.020)	Loss 2.9439 (2.9043)	Entropy 0.66434 (0.66457)	Top-1 acc 54.688 (54.171)	Top-5 acc 75.781 (76.771)	lr 0.01889
Train [40][1620/3239]	Time 0.232 (0.504)	Data Time 0.001 (0.020)	Loss 2.8726 (2.9039)	Entropy 0.66460 (0.66457)	Top-1 acc 58.203 (54.182)	Top-5 acc 79.297 (76.774)	lr 0.01889
Train [40][1630/3239]	Time 0.234 (0.504)	Data Time 0.001 (0.020)	Loss 2.9188 (2.9036)	Entropy 0.66446 (0.66457)	Top-1 acc 52.344 (54.183)	Top-5 acc 76.562 (76.781)	lr 0.01889
Train [40][1640/3239]	Time 0.225 (0.503)	Data Time 0.001 (0.020)	Loss 2.7708 (2.9034)	Entropy 0.66445 (0.66457)	Top-1 acc 58.203 (54.186)	Top-5 acc 79.688 (76.786)	lr 0.01889
Train [40][1650/3239]	Time 0.237 (0.503)	Data Time 0.001 (0.020)	Loss 2.9146 (2.9036)	Entropy 0.66464 (0.66457)	Top-1 acc 53.906 (54.179)	Top-5 acc 76.562 (76.781)	lr 0.01889
Train [40][1660/3239]	Time 0.236 (0.502)	Data Time 0.001 (0.020)	Loss 2.8927 (2.9036)	Entropy 0.66465 (0.66457)	Top-1 acc 56.641 (54.185)	Top-5 acc 78.516 (76.779)	lr 0.01889
Train [40][1670/3239]	Time 0.232 (0.502)	Data Time 0.001 (0.020)	Loss 2.8718 (2.9032)	Entropy 0.66470 (0.66457)	Top-1 acc 50.781 (54.194)	Top-5 acc 76.953 (76.789)	lr 0.01889
Train [40][1680/3239]	Time 0.248 (0.501)	Data Time 0.001 (0.020)	Loss 2.8784 (2.9032)	Entropy 0.66467 (0.66457)	Top-1 acc 54.297 (54.193)	Top-5 acc 77.344 (76.788)	lr 0.01889
Train [40][1690/3239]	Time 0.259 (0.501)	Data Time 0.001 (0.020)	Loss 2.7629 (2.9032)	Entropy 0.66465 (0.66457)	Top-1 acc 58.203 (54.194)	Top-5 acc 77.734 (76.780)	lr 0.01889
Train [40][1700/3239]	Time 0.250 (0.500)	Data Time 0.002 (0.019)	Loss 2.9596 (2.9036)	Entropy 0.66412 (0.66457)	Top-1 acc 52.344 (54.183)	Top-5 acc 76.172 (76.776)	lr 0.01888
Train [40][1710/3239]	Time 0.233 (0.500)	Data Time 0.001 (0.019)	Loss 2.9680 (2.9036)	Entropy 0.66432 (0.66457)	Top-1 acc 52.734 (54.180)	Top-5 acc 75.391 (76.776)	lr 0.01888
Train [40][1720/3239]	Time 0.230 (0.499)	Data Time 0.001 (0.019)	Loss 2.9191 (2.9033)	Entropy 0.66454 (0.66456)	Top-1 acc 55.078 (54.195)	Top-5 acc 76.562 (76.785)	lr 0.01888
Train [40][1730/3239]	Time 0.232 (0.499)	Data Time 0.001 (0.019)	Loss 2.9504 (2.9034)	Entropy 0.66401 (0.66456)	Top-1 acc 52.734 (54.196)	Top-5 acc 73.828 (76.782)	lr 0.01888
Train [40][1740/3239]	Time 0.220 (0.498)	Data Time 0.001 (0.019)	Loss 2.8663 (2.9034)	Entropy 0.66403 (0.66456)	Top-1 acc 54.297 (54.193)	Top-5 acc 76.172 (76.783)	lr 0.01888
Train [40][1750/3239]	Time 0.227 (0.497)	Data Time 0.001 (0.019)	Loss 3.0643 (2.9032)	Entropy 0.66409 (0.66456)	Top-1 acc 50.391 (54.199)	Top-5 acc 75.391 (76.784)	lr 0.01888
Train [40][1760/3239]	Time 0.236 (0.497)	Data Time 0.001 (0.019)	Loss 2.7859 (2.9030)	Entropy 0.66400 (0.66455)	Top-1 acc 54.688 (54.209)	Top-5 acc 78.516 (76.784)	lr 0.01888
Train [40][1770/3239]	Time 0.318 (0.496)	Data Time 0.001 (0.019)	Loss 2.8930 (2.9029)	Entropy 0.66424 (0.66455)	Top-1 acc 55.859 (54.214)	Top-5 acc 76.172 (76.785)	lr 0.01888
Train [40][1780/3239]	Time 0.240 (0.496)	Data Time 0.001 (0.019)	Loss 2.8974 (2.9031)	Entropy 0.66446 (0.66455)	Top-1 acc 53.906 (54.208)	Top-5 acc 75.781 (76.778)	lr 0.01888
Train [40][1790/3239]	Time 0.260 (0.496)	Data Time 0.001 (0.019)	Loss 3.3262 (2.9031)	Entropy 0.66420 (0.66455)	Top-1 acc 43.750 (54.198)	Top-5 acc 67.188 (76.776)	lr 0.01888
Train [40][1800/3239]	Time 0.278 (0.495)	Data Time 0.001 (0.018)	Loss 2.9772 (2.9031)	Entropy 0.66428 (0.66455)	Top-1 acc 52.344 (54.202)	Top-5 acc 76.953 (76.779)	lr 0.01888
Train [40][1810/3239]	Time 0.251 (0.495)	Data Time 0.001 (0.018)	Loss 2.9180 (2.9030)	Entropy 0.66419 (0.66454)	Top-1 acc 55.859 (54.200)	Top-5 acc 75.781 (76.780)	lr 0.01887
Train [40][1820/3239]	Time 0.239 (0.494)	Data Time 0.001 (0.018)	Loss 2.9264 (2.9029)	Entropy 0.66408 (0.66454)	Top-1 acc 52.734 (54.201)	Top-5 acc 74.219 (76.785)	lr 0.01887
Train [40][1830/3239]	Time 0.228 (0.494)	Data Time 0.001 (0.018)	Loss 2.9765 (2.9027)	Entropy 0.66444 (0.66454)	Top-1 acc 50.391 (54.198)	Top-5 acc 75.391 (76.789)	lr 0.01887
Train [40][1840/3239]	Time 0.353 (0.493)	Data Time 0.001 (0.018)	Loss 2.8587 (2.9030)	Entropy 0.66424 (0.66454)	Top-1 acc 55.469 (54.190)	Top-5 acc 74.609 (76.782)	lr 0.01887
Train [40][1850/3239]	Time 0.239 (0.493)	Data Time 0.001 (0.018)	Loss 2.7164 (2.9027)	Entropy 0.66425 (0.66454)	Top-1 acc 56.250 (54.196)	Top-5 acc 80.469 (76.789)	lr 0.01887
Train [40][1860/3239]	Time 0.236 (0.492)	Data Time 0.001 (0.018)	Loss 2.7485 (2.9022)	Entropy 0.66428 (0.66454)	Top-1 acc 55.859 (54.207)	Top-5 acc 79.297 (76.794)	lr 0.01887
Train [40][1870/3239]	Time 0.231 (0.492)	Data Time 0.001 (0.018)	Loss 2.9610 (2.9025)	Entropy 0.66446 (0.66453)	Top-1 acc 53.125 (54.205)	Top-5 acc 73.438 (76.791)	lr 0.01887
Train [40][1880/3239]	Time 0.231 (0.491)	Data Time 0.001 (0.018)	Loss 2.7753 (2.9024)	Entropy 0.66451 (0.66453)	Top-1 acc 58.203 (54.212)	Top-5 acc 81.641 (76.798)	lr 0.01887
Train [40][1890/3239]	Time 0.240 (0.491)	Data Time 0.001 (0.018)	Loss 2.6761 (2.9019)	Entropy 0.66465 (0.66453)	Top-1 acc 60.547 (54.219)	Top-5 acc 79.297 (76.805)	lr 0.01887
Train [40][1900/3239]	Time 0.238 (0.491)	Data Time 0.001 (0.018)	Loss 2.9892 (2.9023)	Entropy 0.66451 (0.66454)	Top-1 acc 51.562 (54.212)	Top-5 acc 76.172 (76.797)	lr 0.01887
Train [40][1910/3239]	Time 0.226 (0.490)	Data Time 0.001 (0.017)	Loss 2.9209 (2.9019)	Entropy 0.66452 (0.66454)	Top-1 acc 55.078 (54.215)	Top-5 acc 75.391 (76.808)	lr 0.01887
Train [40][1920/3239]	Time 0.241 (0.490)	Data Time 0.001 (0.017)	Loss 3.0069 (2.9021)	Entropy 0.66433 (0.66454)	Top-1 acc 48.438 (54.211)	Top-5 acc 77.344 (76.805)	lr 0.01887
Train [40][1930/3239]	Time 0.328 (0.489)	Data Time 0.001 (0.017)	Loss 2.7705 (2.9020)	Entropy 0.66425 (0.66453)	Top-1 acc 56.250 (54.217)	Top-5 acc 79.688 (76.811)	lr 0.01886
Train [40][1940/3239]	Time 0.259 (0.489)	Data Time 0.002 (0.017)	Loss 2.9996 (2.9021)	Entropy 0.66416 (0.66453)	Top-1 acc 52.344 (54.215)	Top-5 acc 73.828 (76.809)	lr 0.01886
Train [40][1950/3239]	Time 0.233 (0.488)	Data Time 0.001 (0.017)	Loss 2.7698 (2.9022)	Entropy 0.66422 (0.66453)	Top-1 acc 56.641 (54.214)	Top-5 acc 80.078 (76.810)	lr 0.01886
Train [40][1960/3239]	Time 0.219 (0.488)	Data Time 0.001 (0.017)	Loss 3.0526 (2.9024)	Entropy 0.66423 (0.66453)	Top-1 acc 50.781 (54.210)	Top-5 acc 76.562 (76.810)	lr 0.01886
Train [40][1970/3239]	Time 0.224 (0.488)	Data Time 0.001 (0.017)	Loss 2.9951 (2.9025)	Entropy 0.66414 (0.66453)	Top-1 acc 53.516 (54.211)	Top-5 acc 76.172 (76.805)	lr 0.01886
Train [40][1980/3239]	Time 0.237 (0.487)	Data Time 0.001 (0.017)	Loss 2.7720 (2.9025)	Entropy 0.66350 (0.66452)	Top-1 acc 58.984 (54.215)	Top-5 acc 78.906 (76.804)	lr 0.01886
Train [40][1990/3239]	Time 0.337 (0.504)	Data Time 0.029 (0.017)	Loss 3.0535 (2.9025)	Entropy 0.66368 (0.66452)	Top-1 acc 51.172 (54.220)	Top-5 acc 76.562 (76.807)	lr 0.01886
Train [40][2000/3239]	Time 0.330 (0.503)	Data Time 0.003 (0.017)	Loss 2.8082 (2.9020)	Entropy 0.66347 (0.66451)	Top-1 acc 54.688 (54.232)	Top-5 acc 78.906 (76.816)	lr 0.01886
Train [40][2010/3239]	Time 0.236 (0.503)	Data Time 0.002 (0.017)	Loss 2.9967 (2.9022)	Entropy 0.66335 (0.66451)	Top-1 acc 50.781 (54.223)	Top-5 acc 73.828 (76.809)	lr 0.01886
Train [40][2020/3239]	Time 0.234 (0.503)	Data Time 0.001 (0.017)	Loss 2.9495 (2.9021)	Entropy 0.66307 (0.66450)	Top-1 acc 52.344 (54.227)	Top-5 acc 75.391 (76.810)	lr 0.01886
Train [40][2030/3239]	Time 0.238 (0.502)	Data Time 0.001 (0.017)	Loss 2.8832 (2.9023)	Entropy 0.66308 (0.66450)	Top-1 acc 54.297 (54.222)	Top-5 acc 79.688 (76.807)	lr 0.01886
Train [40][2040/3239]	Time 0.239 (0.502)	Data Time 0.001 (0.016)	Loss 2.9824 (2.9025)	Entropy 0.66318 (0.66449)	Top-1 acc 54.688 (54.216)	Top-5 acc 73.828 (76.805)	lr 0.01885
Train [40][2050/3239]	Time 0.243 (0.501)	Data Time 0.001 (0.016)	Loss 2.7519 (2.9024)	Entropy 0.66317 (0.66448)	Top-1 acc 60.547 (54.219)	Top-5 acc 78.906 (76.806)	lr 0.01885
Train [40][2060/3239]	Time 0.283 (0.501)	Data Time 0.001 (0.016)	Loss 2.8648 (2.9025)	Entropy 0.66325 (0.66448)	Top-1 acc 55.859 (54.217)	Top-5 acc 76.172 (76.805)	lr 0.01885
Train [40][2070/3239]	Time 0.231 (0.501)	Data Time 0.002 (0.016)	Loss 3.0170 (2.9026)	Entropy 0.66303 (0.66447)	Top-1 acc 51.172 (54.216)	Top-5 acc 75.391 (76.801)	lr 0.01885
Train [40][2080/3239]	Time 0.271 (0.501)	Data Time 0.001 (0.016)	Loss 3.0577 (2.9026)	Entropy 0.66305 (0.66446)	Top-1 acc 51.953 (54.214)	Top-5 acc 74.219 (76.803)	lr 0.01885
Train [40][2090/3239]	Time 0.325 (0.500)	Data Time 0.001 (0.016)	Loss 2.8094 (2.9024)	Entropy 0.66328 (0.66446)	Top-1 acc 58.203 (54.218)	Top-5 acc 76.562 (76.808)	lr 0.01885
Train [40][2100/3239]	Time 0.245 (0.500)	Data Time 0.001 (0.016)	Loss 2.8184 (2.9023)	Entropy 0.66352 (0.66445)	Top-1 acc 56.250 (54.220)	Top-5 acc 75.781 (76.808)	lr 0.01885
Train [40][2110/3239]	Time 0.238 (0.499)	Data Time 0.001 (0.016)	Loss 2.8081 (2.9025)	Entropy 0.66358 (0.66445)	Top-1 acc 55.078 (54.213)	Top-5 acc 79.297 (76.802)	lr 0.01885
Train [40][2120/3239]	Time 0.263 (0.499)	Data Time 0.001 (0.016)	Loss 3.0260 (2.9024)	Entropy 0.66386 (0.66444)	Top-1 acc 52.344 (54.216)	Top-5 acc 74.219 (76.804)	lr 0.01885
Train [40][2130/3239]	Time 0.245 (0.499)	Data Time 0.002 (0.016)	Loss 2.9943 (2.9024)	Entropy 0.66329 (0.66444)	Top-1 acc 51.562 (54.212)	Top-5 acc 75.781 (76.803)	lr 0.01885
Train [40][2140/3239]	Time 0.278 (0.498)	Data Time 0.001 (0.016)	Loss 2.9648 (2.9022)	Entropy 0.66320 (0.66443)	Top-1 acc 54.297 (54.220)	Top-5 acc 79.688 (76.808)	lr 0.01885
Train [40][2150/3239]	Time 0.240 (0.498)	Data Time 0.001 (0.016)	Loss 2.9732 (2.9021)	Entropy 0.66302 (0.66443)	Top-1 acc 53.125 (54.224)	Top-5 acc 75.391 (76.808)	lr 0.01885
Train [40][2160/3239]	Time 0.327 (0.498)	Data Time 0.001 (0.016)	Loss 3.2223 (2.9021)	Entropy 0.66300 (0.66442)	Top-1 acc 46.094 (54.227)	Top-5 acc 68.750 (76.808)	lr 0.01884
Train [40][2170/3239]	Time 0.228 (0.497)	Data Time 0.001 (0.016)	Loss 3.2273 (2.9023)	Entropy 0.66293 (0.66442)	Top-1 acc 43.359 (54.219)	Top-5 acc 73.047 (76.808)	lr 0.01884
Train [40][2180/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.016)	Loss 2.8043 (2.9022)	Entropy 0.66241 (0.66441)	Top-1 acc 56.250 (54.223)	Top-5 acc 78.906 (76.811)	lr 0.01884
Train [40][2190/3239]	Time 0.241 (0.496)	Data Time 0.001 (0.015)	Loss 3.0034 (2.9022)	Entropy 0.66234 (0.66440)	Top-1 acc 49.609 (54.222)	Top-5 acc 76.172 (76.809)	lr 0.01884
Train [40][2200/3239]	Time 0.239 (0.496)	Data Time 0.001 (0.015)	Loss 2.9076 (2.9020)	Entropy 0.66201 (0.66439)	Top-1 acc 53.516 (54.229)	Top-5 acc 76.172 (76.812)	lr 0.01884
Train [40][2210/3239]	Time 0.323 (0.496)	Data Time 0.004 (0.015)	Loss 2.9055 (2.9015)	Entropy 0.66210 (0.66438)	Top-1 acc 56.641 (54.236)	Top-5 acc 75.000 (76.822)	lr 0.01884
Train [40][2220/3239]	Time 0.228 (0.495)	Data Time 0.001 (0.015)	Loss 3.0118 (2.9015)	Entropy 0.66189 (0.66437)	Top-1 acc 54.688 (54.235)	Top-5 acc 73.047 (76.822)	lr 0.01884
Train [40][2230/3239]	Time 0.233 (0.495)	Data Time 0.002 (0.015)	Loss 2.9888 (2.9017)	Entropy 0.66197 (0.66436)	Top-1 acc 55.859 (54.234)	Top-5 acc 78.125 (76.817)	lr 0.01884
Train [40][2240/3239]	Time 0.246 (0.495)	Data Time 0.002 (0.015)	Loss 3.0148 (2.9017)	Entropy 0.66194 (0.66435)	Top-1 acc 54.297 (54.237)	Top-5 acc 75.000 (76.816)	lr 0.01884
Train [40][2250/3239]	Time 0.292 (0.495)	Data Time 0.002 (0.015)	Loss 2.9529 (2.9016)	Entropy 0.66202 (0.66434)	Top-1 acc 55.469 (54.238)	Top-5 acc 75.391 (76.819)	lr 0.01884
Train [40][2260/3239]	Time 0.231 (0.494)	Data Time 0.001 (0.015)	Loss 2.7211 (2.9013)	Entropy 0.66180 (0.66433)	Top-1 acc 58.594 (54.243)	Top-5 acc 79.688 (76.824)	lr 0.01884
Train [40][2270/3239]	Time 0.229 (0.494)	Data Time 0.001 (0.015)	Loss 2.7179 (2.9011)	Entropy 0.66176 (0.66431)	Top-1 acc 56.641 (54.249)	Top-5 acc 80.469 (76.830)	lr 0.01883
Train [40][2280/3239]	Time 0.232 (0.493)	Data Time 0.001 (0.015)	Loss 2.8895 (2.9012)	Entropy 0.66164 (0.66430)	Top-1 acc 57.031 (54.252)	Top-5 acc 77.344 (76.827)	lr 0.01883
Train [40][2290/3239]	Time 0.218 (0.493)	Data Time 0.001 (0.015)	Loss 3.0863 (2.9012)	Entropy 0.66145 (0.66429)	Top-1 acc 51.562 (54.249)	Top-5 acc 70.703 (76.824)	lr 0.01883
Train [40][2300/3239]	Time 0.237 (0.493)	Data Time 0.001 (0.015)	Loss 2.9224 (2.9014)	Entropy 0.66169 (0.66428)	Top-1 acc 50.391 (54.242)	Top-5 acc 78.516 (76.821)	lr 0.01883
Train [40][2310/3239]	Time 0.229 (0.492)	Data Time 0.001 (0.015)	Loss 2.8690 (2.9013)	Entropy 0.66158 (0.66427)	Top-1 acc 55.078 (54.244)	Top-5 acc 79.688 (76.823)	lr 0.01883
Train [40][2320/3239]	Time 0.360 (0.492)	Data Time 0.001 (0.015)	Loss 3.0182 (2.9014)	Entropy 0.66136 (0.66426)	Top-1 acc 53.516 (54.244)	Top-5 acc 71.875 (76.820)	lr 0.01883
Train [40][2330/3239]	Time 0.224 (0.492)	Data Time 0.001 (0.015)	Loss 2.9358 (2.9017)	Entropy 0.66136 (0.66424)	Top-1 acc 55.078 (54.238)	Top-5 acc 74.609 (76.814)	lr 0.01883
Train [40][2340/3239]	Time 0.220 (0.491)	Data Time 0.001 (0.015)	Loss 2.8363 (2.9017)	Entropy 0.66144 (0.66423)	Top-1 acc 53.516 (54.235)	Top-5 acc 78.125 (76.815)	lr 0.01883
Train [40][2350/3239]	Time 0.237 (0.491)	Data Time 0.001 (0.015)	Loss 2.5538 (2.9015)	Entropy 0.66115 (0.66422)	Top-1 acc 63.672 (54.239)	Top-5 acc 83.203 (76.821)	lr 0.01883
Train [40][2360/3239]	Time 0.254 (0.490)	Data Time 0.001 (0.014)	Loss 2.8422 (2.9018)	Entropy 0.66100 (0.66421)	Top-1 acc 53.906 (54.229)	Top-5 acc 76.953 (76.810)	lr 0.01883
Train [40][2370/3239]	Time 0.224 (0.490)	Data Time 0.001 (0.014)	Loss 2.9080 (2.9017)	Entropy 0.66039 (0.66419)	Top-1 acc 54.297 (54.235)	Top-5 acc 76.953 (76.808)	lr 0.01883
Train [40][2380/3239]	Time 0.237 (0.490)	Data Time 0.001 (0.014)	Loss 2.7970 (2.9014)	Entropy 0.66076 (0.66418)	Top-1 acc 55.859 (54.244)	Top-5 acc 75.781 (76.814)	lr 0.01883
Train [40][2390/3239]	Time 0.349 (0.489)	Data Time 0.001 (0.014)	Loss 2.8396 (2.9012)	Entropy 0.66078 (0.66416)	Top-1 acc 57.031 (54.250)	Top-5 acc 78.516 (76.816)	lr 0.01882
Train [40][2400/3239]	Time 0.233 (0.489)	Data Time 0.001 (0.014)	Loss 2.8893 (2.9012)	Entropy 0.66055 (0.66415)	Top-1 acc 58.984 (54.254)	Top-5 acc 75.391 (76.816)	lr 0.01882
Train [40][2410/3239]	Time 0.236 (0.489)	Data Time 0.001 (0.014)	Loss 2.9887 (2.9012)	Entropy 0.66043 (0.66413)	Top-1 acc 52.344 (54.252)	Top-5 acc 73.828 (76.815)	lr 0.01882
Train [40][2420/3239]	Time 0.240 (0.489)	Data Time 0.002 (0.014)	Loss 2.9005 (2.9012)	Entropy 0.66002 (0.66412)	Top-1 acc 55.859 (54.248)	Top-5 acc 76.562 (76.814)	lr 0.01882
Train [40][2430/3239]	Time 0.237 (0.488)	Data Time 0.001 (0.014)	Loss 3.0428 (2.9014)	Entropy 0.65994 (0.66410)	Top-1 acc 50.391 (54.241)	Top-5 acc 71.484 (76.811)	lr 0.01882
Train [40][2440/3239]	Time 0.235 (0.488)	Data Time 0.001 (0.014)	Loss 2.8554 (2.9015)	Entropy 0.65985 (0.66408)	Top-1 acc 57.031 (54.239)	Top-5 acc 76.953 (76.809)	lr 0.01882
Train [40][2450/3239]	Time 0.233 (0.488)	Data Time 0.001 (0.014)	Loss 2.8734 (2.9016)	Entropy 0.66001 (0.66407)	Top-1 acc 55.078 (54.236)	Top-5 acc 78.516 (76.812)	lr 0.01882
Train [40][2460/3239]	Time 0.233 (0.487)	Data Time 0.001 (0.014)	Loss 3.1135 (2.9019)	Entropy 0.65998 (0.66405)	Top-1 acc 51.953 (54.231)	Top-5 acc 72.656 (76.805)	lr 0.01882
Train [40][2470/3239]	Time 0.239 (0.487)	Data Time 0.001 (0.014)	Loss 3.1324 (2.9020)	Entropy 0.65984 (0.66403)	Top-1 acc 50.781 (54.231)	Top-5 acc 74.219 (76.801)	lr 0.01882
Train [40][2480/3239]	Time 0.331 (0.487)	Data Time 0.001 (0.014)	Loss 2.6375 (2.9019)	Entropy 0.66043 (0.66402)	Top-1 acc 62.500 (54.232)	Top-5 acc 78.516 (76.801)	lr 0.01882
Train [40][2490/3239]	Time 0.233 (0.486)	Data Time 0.001 (0.014)	Loss 2.8779 (2.9017)	Entropy 0.66090 (0.66400)	Top-1 acc 57.031 (54.238)	Top-5 acc 74.219 (76.806)	lr 0.01882
Train [40][2500/3239]	Time 0.238 (0.486)	Data Time 0.001 (0.014)	Loss 2.8357 (2.9016)	Entropy 0.66095 (0.66399)	Top-1 acc 55.078 (54.242)	Top-5 acc 78.516 (76.809)	lr 0.01881
Train [40][2510/3239]	Time 0.259 (0.486)	Data Time 0.001 (0.014)	Loss 2.8118 (2.9014)	Entropy 0.66084 (0.66398)	Top-1 acc 58.984 (54.250)	Top-5 acc 80.469 (76.814)	lr 0.01881
Train [40][2520/3239]	Time 0.241 (0.485)	Data Time 0.001 (0.014)	Loss 2.6556 (2.9013)	Entropy 0.66092 (0.66397)	Top-1 acc 60.156 (54.251)	Top-5 acc 79.688 (76.816)	lr 0.01881
Train [40][2530/3239]	Time 0.225 (0.485)	Data Time 0.001 (0.014)	Loss 2.9265 (2.9012)	Entropy 0.66064 (0.66395)	Top-1 acc 51.562 (54.253)	Top-5 acc 75.391 (76.820)	lr 0.01881
Train [40][2540/3239]	Time 0.233 (0.485)	Data Time 0.001 (0.014)	Loss 2.8300 (2.9011)	Entropy 0.66071 (0.66394)	Top-1 acc 56.641 (54.257)	Top-5 acc 77.734 (76.820)	lr 0.01881
Train [40][2550/3239]	Time 0.319 (0.484)	Data Time 0.002 (0.014)	Loss 2.8412 (2.9009)	Entropy 0.66087 (0.66393)	Top-1 acc 59.375 (54.263)	Top-5 acc 74.609 (76.821)	lr 0.01881
Train [40][2560/3239]	Time 0.239 (0.484)	Data Time 0.001 (0.014)	Loss 3.1225 (2.9009)	Entropy 0.66047 (0.66391)	Top-1 acc 47.266 (54.263)	Top-5 acc 73.438 (76.821)	lr 0.01881
Train [40][2570/3239]	Time 0.222 (0.484)	Data Time 0.001 (0.013)	Loss 2.9555 (2.9012)	Entropy 0.66037 (0.66390)	Top-1 acc 48.047 (54.253)	Top-5 acc 76.172 (76.812)	lr 0.01881
Train [40][2580/3239]	Time 0.230 (0.483)	Data Time 0.001 (0.013)	Loss 2.8696 (2.9012)	Entropy 0.66027 (0.66389)	Top-1 acc 55.078 (54.255)	Top-5 acc 77.734 (76.812)	lr 0.01881
Train [40][2590/3239]	Time 0.241 (0.483)	Data Time 0.001 (0.013)	Loss 2.8601 (2.9016)	Entropy 0.66016 (0.66387)	Top-1 acc 58.984 (54.243)	Top-5 acc 76.562 (76.805)	lr 0.01881
Train [40][2600/3239]	Time 0.253 (0.483)	Data Time 0.001 (0.013)	Loss 2.8559 (2.9015)	Entropy 0.66023 (0.66386)	Top-1 acc 52.734 (54.244)	Top-5 acc 77.344 (76.806)	lr 0.01881
Train [40][2610/3239]	Time 0.232 (0.482)	Data Time 0.001 (0.013)	Loss 2.7503 (2.9014)	Entropy 0.66019 (0.66385)	Top-1 acc 58.984 (54.245)	Top-5 acc 78.516 (76.810)	lr 0.01881
Train [40][2620/3239]	Time 0.232 (0.482)	Data Time 0.001 (0.013)	Loss 2.8219 (2.9014)	Entropy 0.66053 (0.66383)	Top-1 acc 51.953 (54.244)	Top-5 acc 80.469 (76.811)	lr 0.01880
Train [40][2630/3239]	Time 0.231 (0.482)	Data Time 0.001 (0.013)	Loss 2.9101 (2.9013)	Entropy 0.66065 (0.66382)	Top-1 acc 53.516 (54.247)	Top-5 acc 78.906 (76.816)	lr 0.01880
Train [40][2640/3239]	Time 0.361 (0.482)	Data Time 0.001 (0.013)	Loss 2.7978 (2.9013)	Entropy 0.66061 (0.66381)	Top-1 acc 54.688 (54.249)	Top-5 acc 80.469 (76.815)	lr 0.01880
Train [40][2650/3239]	Time 0.318 (0.493)	Data Time 0.002 (0.013)	Loss 2.9018 (2.9014)	Entropy 0.66048 (0.66379)	Top-1 acc 52.734 (54.245)	Top-5 acc 76.562 (76.814)	lr 0.01880
Train [40][2660/3239]	Time 0.247 (0.493)	Data Time 0.002 (0.013)	Loss 2.7812 (2.9013)	Entropy 0.66012 (0.66378)	Top-1 acc 56.250 (54.246)	Top-5 acc 76.953 (76.815)	lr 0.01880
Train [40][2670/3239]	Time 0.238 (0.493)	Data Time 0.001 (0.013)	Loss 2.8761 (2.9014)	Entropy 0.66011 (0.66377)	Top-1 acc 54.688 (54.245)	Top-5 acc 75.000 (76.813)	lr 0.01880
Train [40][2680/3239]	Time 0.246 (0.492)	Data Time 0.001 (0.013)	Loss 2.8731 (2.9013)	Entropy 0.65978 (0.66375)	Top-1 acc 54.297 (54.246)	Top-5 acc 76.953 (76.814)	lr 0.01880
Train [40][2690/3239]	Time 0.246 (0.492)	Data Time 0.001 (0.013)	Loss 2.8820 (2.9012)	Entropy 0.66007 (0.66374)	Top-1 acc 57.031 (54.248)	Top-5 acc 77.344 (76.817)	lr 0.01880
Train [40][2700/3239]	Time 0.248 (0.492)	Data Time 0.001 (0.013)	Loss 2.7091 (2.9010)	Entropy 0.65985 (0.66373)	Top-1 acc 58.203 (54.251)	Top-5 acc 82.422 (76.823)	lr 0.01880
Train [40][2710/3239]	Time 0.364 (0.492)	Data Time 0.001 (0.013)	Loss 2.9596 (2.9011)	Entropy 0.65940 (0.66371)	Top-1 acc 55.078 (54.250)	Top-5 acc 76.953 (76.821)	lr 0.01880
Train [40][2720/3239]	Time 0.241 (0.492)	Data Time 0.001 (0.013)	Loss 2.8470 (2.9010)	Entropy 0.65921 (0.66369)	Top-1 acc 55.469 (54.251)	Top-5 acc 76.562 (76.824)	lr 0.01880
Train [40][2730/3239]	Time 0.287 (0.491)	Data Time 0.001 (0.013)	Loss 3.0003 (2.9010)	Entropy 0.65902 (0.66368)	Top-1 acc 47.266 (54.246)	Top-5 acc 76.172 (76.825)	lr 0.01879
Train [40][2740/3239]	Time 0.251 (0.491)	Data Time 0.001 (0.013)	Loss 2.7575 (2.9010)	Entropy 0.65929 (0.66366)	Top-1 acc 58.203 (54.244)	Top-5 acc 83.203 (76.826)	lr 0.01879
Train [40][2750/3239]	Time 0.232 (0.491)	Data Time 0.001 (0.013)	Loss 2.8717 (2.9012)	Entropy 0.65936 (0.66365)	Top-1 acc 54.297 (54.240)	Top-5 acc 78.516 (76.825)	lr 0.01879
Train [40][2760/3239]	Time 0.263 (0.491)	Data Time 0.001 (0.013)	Loss 3.0606 (2.9014)	Entropy 0.65912 (0.66363)	Top-1 acc 48.828 (54.234)	Top-5 acc 72.266 (76.821)	lr 0.01879
Train [40][2770/3239]	Time 0.238 (0.491)	Data Time 0.002 (0.013)	Loss 2.8781 (2.9014)	Entropy 0.65897 (0.66361)	Top-1 acc 55.469 (54.233)	Top-5 acc 75.391 (76.820)	lr 0.01879
Train [40][2780/3239]	Time 0.281 (0.490)	Data Time 0.002 (0.013)	Loss 2.8741 (2.9009)	Entropy 0.65873 (0.66360)	Top-1 acc 58.984 (54.242)	Top-5 acc 76.953 (76.828)	lr 0.01879
Train [40][2790/3239]	Time 0.242 (0.490)	Data Time 0.001 (0.013)	Loss 2.8979 (2.9009)	Entropy 0.65896 (0.66358)	Top-1 acc 54.688 (54.241)	Top-5 acc 78.516 (76.829)	lr 0.01879
Train [40][2800/3239]	Time 0.331 (0.490)	Data Time 0.001 (0.013)	Loss 2.8974 (2.9009)	Entropy 0.65860 (0.66356)	Top-1 acc 57.031 (54.244)	Top-5 acc 78.516 (76.828)	lr 0.01879
Train [40][2810/3239]	Time 0.227 (0.490)	Data Time 0.001 (0.012)	Loss 2.9182 (2.9012)	Entropy 0.65872 (0.66355)	Top-1 acc 53.125 (54.242)	Top-5 acc 76.953 (76.824)	lr 0.01879
Train [40][2820/3239]	Time 0.233 (0.489)	Data Time 0.001 (0.012)	Loss 3.0079 (2.9013)	Entropy 0.65846 (0.66353)	Top-1 acc 52.344 (54.239)	Top-5 acc 75.000 (76.822)	lr 0.01879
Train [40][2830/3239]	Time 0.251 (0.489)	Data Time 0.001 (0.012)	Loss 2.9186 (2.9013)	Entropy 0.65888 (0.66351)	Top-1 acc 51.953 (54.238)	Top-5 acc 78.516 (76.821)	lr 0.01879
Train [40][2840/3239]	Time 0.244 (0.489)	Data Time 0.001 (0.012)	Loss 2.8681 (2.9014)	Entropy 0.65891 (0.66349)	Top-1 acc 54.297 (54.234)	Top-5 acc 79.297 (76.822)	lr 0.01878
Train [40][2850/3239]	Time 0.312 (0.489)	Data Time 0.001 (0.012)	Loss 2.8737 (2.9013)	Entropy 0.65929 (0.66348)	Top-1 acc 51.172 (54.237)	Top-5 acc 76.172 (76.826)	lr 0.01878
Train [40][2860/3239]	Time 0.235 (0.488)	Data Time 0.001 (0.012)	Loss 2.8410 (2.9012)	Entropy 0.65959 (0.66346)	Top-1 acc 57.812 (54.239)	Top-5 acc 77.344 (76.823)	lr 0.01878
Train [40][2870/3239]	Time 0.377 (0.488)	Data Time 0.001 (0.012)	Loss 3.0318 (2.9012)	Entropy 0.65991 (0.66345)	Top-1 acc 50.781 (54.238)	Top-5 acc 74.609 (76.820)	lr 0.01878
Train [40][2880/3239]	Time 0.241 (0.488)	Data Time 0.001 (0.012)	Loss 2.9198 (2.9011)	Entropy 0.66014 (0.66344)	Top-1 acc 54.688 (54.239)	Top-5 acc 76.953 (76.821)	lr 0.01878
Train [40][2890/3239]	Time 0.229 (0.488)	Data Time 0.001 (0.012)	Loss 2.8073 (2.9012)	Entropy 0.66042 (0.66343)	Top-1 acc 57.812 (54.238)	Top-5 acc 79.297 (76.819)	lr 0.01878
Train [40][2900/3239]	Time 0.228 (0.488)	Data Time 0.001 (0.012)	Loss 2.7953 (2.9011)	Entropy 0.66050 (0.66342)	Top-1 acc 56.250 (54.241)	Top-5 acc 79.688 (76.820)	lr 0.01878
Train [40][2910/3239]	Time 0.263 (0.487)	Data Time 0.002 (0.012)	Loss 3.0092 (2.9013)	Entropy 0.66041 (0.66341)	Top-1 acc 50.000 (54.235)	Top-5 acc 76.562 (76.816)	lr 0.01878
Train [40][2920/3239]	Time 0.248 (0.487)	Data Time 0.001 (0.012)	Loss 2.9487 (2.9011)	Entropy 0.66046 (0.66340)	Top-1 acc 55.469 (54.242)	Top-5 acc 74.219 (76.817)	lr 0.01878
Train [40][2930/3239]	Time 0.239 (0.487)	Data Time 0.001 (0.012)	Loss 2.8855 (2.9012)	Entropy 0.66008 (0.66339)	Top-1 acc 55.469 (54.242)	Top-5 acc 76.172 (76.818)	lr 0.01878
Train [40][2940/3239]	Time 0.236 (0.487)	Data Time 0.001 (0.012)	Loss 2.7862 (2.9011)	Entropy 0.65980 (0.66338)	Top-1 acc 58.594 (54.243)	Top-5 acc 76.953 (76.821)	lr 0.01878
Train [40][2950/3239]	Time 0.250 (0.486)	Data Time 0.001 (0.012)	Loss 2.9476 (2.9010)	Entropy 0.65966 (0.66336)	Top-1 acc 51.953 (54.244)	Top-5 acc 74.219 (76.823)	lr 0.01878
Train [40][2960/3239]	Time 0.257 (0.486)	Data Time 0.001 (0.012)	Loss 2.9316 (2.9010)	Entropy 0.65996 (0.66335)	Top-1 acc 52.344 (54.246)	Top-5 acc 77.734 (76.824)	lr 0.01877
Train [40][2970/3239]	Time 0.236 (0.486)	Data Time 0.001 (0.012)	Loss 2.9129 (2.9010)	Entropy 0.65982 (0.66334)	Top-1 acc 57.031 (54.247)	Top-5 acc 76.562 (76.822)	lr 0.01877
Train [40][2980/3239]	Time 0.225 (0.486)	Data Time 0.001 (0.012)	Loss 2.9305 (2.9009)	Entropy 0.65994 (0.66333)	Top-1 acc 53.906 (54.249)	Top-5 acc 75.000 (76.825)	lr 0.01877
Train [40][2990/3239]	Time 0.234 (0.485)	Data Time 0.001 (0.012)	Loss 2.8016 (2.9010)	Entropy 0.65983 (0.66332)	Top-1 acc 56.250 (54.242)	Top-5 acc 78.516 (76.824)	lr 0.01877
Train [40][3000/3239]	Time 0.235 (0.485)	Data Time 0.001 (0.012)	Loss 2.9241 (2.9011)	Entropy 0.65979 (0.66331)	Top-1 acc 51.562 (54.238)	Top-5 acc 74.219 (76.821)	lr 0.01877
Train [40][3010/3239]	Time 0.223 (0.485)	Data Time 0.001 (0.012)	Loss 3.0609 (2.9011)	Entropy 0.66024 (0.66329)	Top-1 acc 49.219 (54.236)	Top-5 acc 73.828 (76.818)	lr 0.01877
Train [40][3020/3239]	Time 0.223 (0.485)	Data Time 0.001 (0.012)	Loss 3.1685 (2.9013)	Entropy 0.66011 (0.66328)	Top-1 acc 48.828 (54.231)	Top-5 acc 72.656 (76.816)	lr 0.01877
Train [40][3030/3239]	Time 0.327 (0.484)	Data Time 0.001 (0.012)	Loss 3.0493 (2.9014)	Entropy 0.65984 (0.66327)	Top-1 acc 53.906 (54.229)	Top-5 acc 73.047 (76.815)	lr 0.01877
Train [40][3040/3239]	Time 0.238 (0.484)	Data Time 0.001 (0.012)	Loss 3.0778 (2.9013)	Entropy 0.65968 (0.66326)	Top-1 acc 52.344 (54.229)	Top-5 acc 71.094 (76.815)	lr 0.01877
Train [40][3050/3239]	Time 0.263 (0.484)	Data Time 0.001 (0.012)	Loss 2.8576 (2.9015)	Entropy 0.65932 (0.66325)	Top-1 acc 57.812 (54.229)	Top-5 acc 78.125 (76.813)	lr 0.01877
Train [40][3060/3239]	Time 0.235 (0.484)	Data Time 0.001 (0.012)	Loss 2.8735 (2.9014)	Entropy 0.65932 (0.66324)	Top-1 acc 53.906 (54.230)	Top-5 acc 75.781 (76.812)	lr 0.01877
Train [40][3070/3239]	Time 0.236 (0.483)	Data Time 0.001 (0.012)	Loss 3.0016 (2.9016)	Entropy 0.65943 (0.66322)	Top-1 acc 51.172 (54.225)	Top-5 acc 76.562 (76.807)	lr 0.01876
Train [40][3080/3239]	Time 0.231 (0.483)	Data Time 0.001 (0.012)	Loss 2.9655 (2.9017)	Entropy 0.65939 (0.66321)	Top-1 acc 54.297 (54.220)	Top-5 acc 74.609 (76.805)	lr 0.01876
Train [40][3090/3239]	Time 0.238 (0.483)	Data Time 0.001 (0.011)	Loss 3.0903 (2.9018)	Entropy 0.65883 (0.66320)	Top-1 acc 49.609 (54.218)	Top-5 acc 73.047 (76.804)	lr 0.01876
Train [40][3100/3239]	Time 0.335 (0.483)	Data Time 0.001 (0.011)	Loss 2.9759 (2.9018)	Entropy 0.65858 (0.66319)	Top-1 acc 50.000 (54.214)	Top-5 acc 73.047 (76.804)	lr 0.01876
Train [40][3110/3239]	Time 0.240 (0.482)	Data Time 0.001 (0.011)	Loss 2.7649 (2.9018)	Entropy 0.65851 (0.66317)	Top-1 acc 57.031 (54.211)	Top-5 acc 79.297 (76.801)	lr 0.01876
Train [40][3120/3239]	Time 0.233 (0.482)	Data Time 0.001 (0.011)	Loss 3.0559 (2.9018)	Entropy 0.65898 (0.66316)	Top-1 acc 50.000 (54.211)	Top-5 acc 71.094 (76.799)	lr 0.01876
Train [40][3130/3239]	Time 0.235 (0.482)	Data Time 0.001 (0.011)	Loss 2.6973 (2.9017)	Entropy 0.65855 (0.66314)	Top-1 acc 60.156 (54.213)	Top-5 acc 79.688 (76.798)	lr 0.01876
Train [40][3140/3239]	Time 0.239 (0.482)	Data Time 0.001 (0.011)	Loss 2.9199 (2.9015)	Entropy 0.65844 (0.66313)	Top-1 acc 57.422 (54.216)	Top-5 acc 75.781 (76.803)	lr 0.01876
Train [40][3150/3239]	Time 0.239 (0.481)	Data Time 0.001 (0.011)	Loss 2.9216 (2.9016)	Entropy 0.65854 (0.66311)	Top-1 acc 53.125 (54.214)	Top-5 acc 75.391 (76.801)	lr 0.01876
Train [40][3160/3239]	Time 0.277 (0.481)	Data Time 0.001 (0.011)	Loss 2.8388 (2.9016)	Entropy 0.65822 (0.66310)	Top-1 acc 54.688 (54.212)	Top-5 acc 77.344 (76.803)	lr 0.01876
Train [40][3170/3239]	Time 0.238 (0.481)	Data Time 0.001 (0.011)	Loss 3.1472 (2.9017)	Entropy 0.65817 (0.66308)	Top-1 acc 45.312 (54.211)	Top-5 acc 73.047 (76.800)	lr 0.01876
Train [40][3180/3239]	Time 0.233 (0.481)	Data Time 0.000 (0.011)	Loss 2.7271 (2.9018)	Entropy 0.65836 (0.66307)	Top-1 acc 57.031 (54.209)	Top-5 acc 78.906 (76.801)	lr 0.01876
Train [40][3190/3239]	Time 0.334 (0.481)	Data Time 0.000 (0.011)	Loss 2.8533 (2.9016)	Entropy 0.65820 (0.66305)	Top-1 acc 53.906 (54.208)	Top-5 acc 78.516 (76.804)	lr 0.01875
Train [40][3200/3239]	Time 0.230 (0.480)	Data Time 0.000 (0.011)	Loss 2.7884 (2.9016)	Entropy 0.65805 (0.66304)	Top-1 acc 57.031 (54.213)	Top-5 acc 78.906 (76.804)	lr 0.01875
Train [40][3210/3239]	Time 0.232 (0.480)	Data Time 0.000 (0.011)	Loss 2.8824 (2.9017)	Entropy 0.65795 (0.66302)	Top-1 acc 58.594 (54.211)	Top-5 acc 76.953 (76.803)	lr 0.01875
Train [40][3220/3239]	Time 0.224 (0.480)	Data Time 0.000 (0.011)	Loss 2.8418 (2.9017)	Entropy 0.65817 (0.66301)	Top-1 acc 54.688 (54.213)	Top-5 acc 79.688 (76.804)	lr 0.01875
Train [40][3230/3239]	Time 0.235 (0.479)	Data Time 0.000 (0.011)	Loss 2.7962 (2.9015)	Entropy 0.65781 (0.66299)	Top-1 acc 56.250 (54.218)	Top-5 acc 80.859 (76.811)	lr 0.01875
Train [40][3239/3239]	Time 0.930 (0.479)	Data Time 0.000 (0.011)	Loss 2.6982 (2.9014)	Entropy 0.65775 (0.66298)	Top-1 acc 53.086 (54.218)	Top-5 acc 82.716 (76.811)	lr 0.01875
==========Valid [40/120]	loss 1.611	top-1 acc 63.460 (63.460)	top-5 acc 84.377	Train top-1 54.218	top-5 76.811	Entropy 0.65775	Latency-None: 0.000ms	Flops: 539.76M
Train [41][0/3239]	Time 32.894 (32.894)	Data Time 32.380 (32.380)	Loss 2.8720 (2.8720)	Entropy 0.65754 (0.65754)	Top-1 acc 58.203 (58.203)	Top-5 acc 76.172 (76.172)	lr 0.01875
Train [41][10/3239]	Time 0.235 (3.528)	Data Time 0.001 (2.946)	Loss 2.8932 (2.8797)	Entropy 0.65750 (0.65761)	Top-1 acc 53.906 (53.622)	Top-5 acc 77.344 (77.166)	lr 0.01875
Train [41][20/3239]	Time 0.244 (2.036)	Data Time 0.001 (1.544)	Loss 2.7925 (2.8713)	Entropy 0.65751 (0.65752)	Top-1 acc 55.078 (54.111)	Top-5 acc 78.516 (77.307)	lr 0.01875
Train [41][30/3239]	Time 0.237 (1.519)	Data Time 0.002 (1.046)	Loss 2.9385 (2.8469)	Entropy 0.65764 (0.65755)	Top-1 acc 50.000 (54.700)	Top-5 acc 78.516 (77.797)	lr 0.01875
Train [41][40/3239]	Time 0.240 (1.249)	Data Time 0.001 (0.791)	Loss 3.1447 (2.8598)	Entropy 0.65735 (0.65756)	Top-1 acc 46.484 (54.526)	Top-5 acc 70.703 (77.449)	lr 0.01875
Train [41][50/3239]	Time 0.265 (1.087)	Data Time 0.001 (0.637)	Loss 2.8420 (2.8620)	Entropy 0.65739 (0.65752)	Top-1 acc 53.125 (54.672)	Top-5 acc 77.344 (77.382)	lr 0.01875
Train [41][60/3239]	Time 0.278 (1.497)	Data Time 0.005 (0.532)	Loss 2.7961 (2.8544)	Entropy 0.65694 (0.65749)	Top-1 acc 56.250 (55.014)	Top-5 acc 78.906 (77.600)	lr 0.01874
Train [41][70/3239]	Time 0.248 (1.349)	Data Time 0.002 (0.458)	Loss 2.6733 (2.8475)	Entropy 0.65675 (0.65740)	Top-1 acc 60.156 (55.177)	Top-5 acc 80.078 (77.833)	lr 0.01874
Train [41][80/3239]	Time 0.273 (1.235)	Data Time 0.001 (0.402)	Loss 2.9699 (2.8444)	Entropy 0.65660 (0.65732)	Top-1 acc 54.297 (55.194)	Top-5 acc 75.391 (77.937)	lr 0.01874
Train [41][90/3239]	Time 0.309 (1.144)	Data Time 0.001 (0.358)	Loss 3.1531 (2.8623)	Entropy 0.65631 (0.65724)	Top-1 acc 51.953 (54.932)	Top-5 acc 72.656 (77.674)	lr 0.01874
Train [41][100/3239]	Time 0.237 (1.071)	Data Time 0.001 (0.322)	Loss 2.7742 (2.8649)	Entropy 0.65592 (0.65715)	Top-1 acc 59.375 (54.889)	Top-5 acc 78.906 (77.591)	lr 0.01874
Train [41][110/3239]	Time 0.225 (1.010)	Data Time 0.001 (0.294)	Loss 3.0365 (2.8619)	Entropy 0.65604 (0.65704)	Top-1 acc 53.906 (55.053)	Top-5 acc 73.438 (77.597)	lr 0.01874
Train [41][120/3239]	Time 0.221 (0.961)	Data Time 0.001 (0.269)	Loss 2.8372 (2.8608)	Entropy 0.65636 (0.65697)	Top-1 acc 53.906 (55.139)	Top-5 acc 78.516 (77.654)	lr 0.01874
Train [41][130/3239]	Time 0.232 (0.919)	Data Time 0.001 (0.249)	Loss 2.8074 (2.8608)	Entropy 0.65639 (0.65692)	Top-1 acc 59.375 (55.159)	Top-5 acc 79.688 (77.708)	lr 0.01874
Train [41][140/3239]	Time 0.231 (0.883)	Data Time 0.001 (0.232)	Loss 2.8643 (2.8658)	Entropy 0.65630 (0.65688)	Top-1 acc 55.859 (54.934)	Top-5 acc 75.391 (77.621)	lr 0.01874
Train [41][150/3239]	Time 0.230 (0.851)	Data Time 0.001 (0.216)	Loss 2.8596 (2.8684)	Entropy 0.65620 (0.65683)	Top-1 acc 54.688 (54.848)	Top-5 acc 79.297 (77.540)	lr 0.01874
Train [41][160/3239]	Time 0.244 (0.824)	Data Time 0.003 (0.203)	Loss 3.0768 (2.8711)	Entropy 0.65591 (0.65679)	Top-1 acc 50.000 (54.826)	Top-5 acc 72.656 (77.484)	lr 0.01874
Train [41][170/3239]	Time 0.238 (0.801)	Data Time 0.001 (0.191)	Loss 2.9956 (2.8739)	Entropy 0.65572 (0.65673)	Top-1 acc 53.516 (54.788)	Top-5 acc 75.781 (77.394)	lr 0.01874
Train [41][180/3239]	Time 0.301 (0.781)	Data Time 0.008 (0.181)	Loss 3.0345 (2.8749)	Entropy 0.65564 (0.65667)	Top-1 acc 50.000 (54.720)	Top-5 acc 77.734 (77.348)	lr 0.01873
Train [41][190/3239]	Time 0.236 (0.762)	Data Time 0.001 (0.171)	Loss 2.7951 (2.8784)	Entropy 0.65561 (0.65662)	Top-1 acc 57.422 (54.675)	Top-5 acc 77.734 (77.282)	lr 0.01873
Train [41][200/3239]	Time 0.233 (0.745)	Data Time 0.001 (0.163)	Loss 3.0120 (2.8836)	Entropy 0.65599 (0.65658)	Top-1 acc 53.125 (54.559)	Top-5 acc 77.734 (77.194)	lr 0.01873
Train [41][210/3239]	Time 0.261 (0.729)	Data Time 0.001 (0.155)	Loss 2.7636 (2.8811)	Entropy 0.65636 (0.65656)	Top-1 acc 57.422 (54.652)	Top-5 acc 81.641 (77.259)	lr 0.01873
Train [41][220/3239]	Time 0.251 (0.715)	Data Time 0.001 (0.148)	Loss 2.7633 (2.8804)	Entropy 0.65638 (0.65655)	Top-1 acc 57.422 (54.590)	Top-5 acc 79.688 (77.289)	lr 0.01873
Train [41][230/3239]	Time 0.263 (0.703)	Data Time 0.001 (0.142)	Loss 2.9344 (2.8809)	Entropy 0.65642 (0.65654)	Top-1 acc 56.250 (54.610)	Top-5 acc 75.781 (77.264)	lr 0.01873
Train [41][240/3239]	Time 0.239 (0.691)	Data Time 0.001 (0.136)	Loss 2.7457 (2.8831)	Entropy 0.65644 (0.65654)	Top-1 acc 60.156 (54.576)	Top-5 acc 78.516 (77.234)	lr 0.01873
Train [41][250/3239]	Time 0.328 (0.680)	Data Time 0.001 (0.131)	Loss 3.0080 (2.8848)	Entropy 0.65641 (0.65653)	Top-1 acc 48.828 (54.487)	Top-5 acc 75.391 (77.204)	lr 0.01873
Train [41][260/3239]	Time 0.269 (0.671)	Data Time 0.001 (0.126)	Loss 2.7295 (2.8832)	Entropy 0.65657 (0.65653)	Top-1 acc 57.422 (54.523)	Top-5 acc 79.297 (77.233)	lr 0.01873
Train [41][270/3239]	Time 0.236 (0.661)	Data Time 0.001 (0.121)	Loss 2.7800 (2.8834)	Entropy 0.65667 (0.65654)	Top-1 acc 58.203 (54.512)	Top-5 acc 78.516 (77.198)	lr 0.01873
Train [41][280/3239]	Time 0.264 (0.653)	Data Time 0.001 (0.117)	Loss 2.9106 (2.8847)	Entropy 0.65653 (0.65654)	Top-1 acc 51.172 (54.469)	Top-5 acc 76.953 (77.159)	lr 0.01873
Train [41][290/3239]	Time 0.234 (0.645)	Data Time 0.001 (0.113)	Loss 2.7003 (2.8821)	Entropy 0.65645 (0.65654)	Top-1 acc 55.469 (54.512)	Top-5 acc 80.469 (77.212)	lr 0.01872
Train [41][300/3239]	Time 0.237 (0.638)	Data Time 0.001 (0.109)	Loss 2.8179 (2.8841)	Entropy 0.65612 (0.65653)	Top-1 acc 52.344 (54.480)	Top-5 acc 79.688 (77.193)	lr 0.01872
Train [41][310/3239]	Time 0.227 (0.631)	Data Time 0.001 (0.106)	Loss 3.0008 (2.8853)	Entropy 0.65591 (0.65651)	Top-1 acc 50.000 (54.405)	Top-5 acc 73.047 (77.173)	lr 0.01872
Train [41][320/3239]	Time 0.350 (0.625)	Data Time 0.001 (0.103)	Loss 2.9153 (2.8826)	Entropy 0.65590 (0.65649)	Top-1 acc 54.297 (54.499)	Top-5 acc 75.781 (77.233)	lr 0.01872
Train [41][330/3239]	Time 0.251 (0.618)	Data Time 0.001 (0.100)	Loss 2.7755 (2.8794)	Entropy 0.65585 (0.65648)	Top-1 acc 54.297 (54.568)	Top-5 acc 78.125 (77.300)	lr 0.01872
Train [41][340/3239]	Time 0.254 (0.612)	Data Time 0.001 (0.097)	Loss 2.9052 (2.8807)	Entropy 0.65555 (0.65645)	Top-1 acc 55.078 (54.556)	Top-5 acc 76.172 (77.277)	lr 0.01872
Train [41][350/3239]	Time 0.223 (0.607)	Data Time 0.001 (0.094)	Loss 2.9443 (2.8805)	Entropy 0.65574 (0.65643)	Top-1 acc 50.781 (54.564)	Top-5 acc 76.172 (77.280)	lr 0.01872
Train [41][360/3239]	Time 0.223 (0.601)	Data Time 0.001 (0.091)	Loss 2.9596 (2.8811)	Entropy 0.65626 (0.65642)	Top-1 acc 55.469 (54.572)	Top-5 acc 78.516 (77.258)	lr 0.01872
Train [41][370/3239]	Time 0.270 (0.597)	Data Time 0.002 (0.089)	Loss 2.9172 (2.8816)	Entropy 0.65644 (0.65641)	Top-1 acc 54.688 (54.538)	Top-5 acc 76.562 (77.257)	lr 0.01872
Train [41][380/3239]	Time 0.226 (0.592)	Data Time 0.001 (0.087)	Loss 3.0413 (2.8812)	Entropy 0.65644 (0.65641)	Top-1 acc 51.562 (54.561)	Top-5 acc 73.047 (77.246)	lr 0.01872
Train [41][390/3239]	Time 0.227 (0.587)	Data Time 0.001 (0.085)	Loss 2.7191 (2.8828)	Entropy 0.65630 (0.65641)	Top-1 acc 55.469 (54.516)	Top-5 acc 80.469 (77.209)	lr 0.01872
Train [41][400/3239]	Time 0.253 (0.583)	Data Time 0.001 (0.082)	Loss 2.9724 (2.8841)	Entropy 0.65629 (0.65641)	Top-1 acc 50.000 (54.511)	Top-5 acc 76.172 (77.187)	lr 0.01871
Train [41][410/3239]	Time 0.328 (0.578)	Data Time 0.001 (0.080)	Loss 3.2334 (2.8858)	Entropy 0.65616 (0.65641)	Top-1 acc 46.875 (54.448)	Top-5 acc 70.703 (77.163)	lr 0.01871
Train [41][420/3239]	Time 0.230 (0.574)	Data Time 0.001 (0.079)	Loss 2.8164 (2.8854)	Entropy 0.65621 (0.65640)	Top-1 acc 57.812 (54.469)	Top-5 acc 80.078 (77.180)	lr 0.01871
Train [41][430/3239]	Time 0.236 (0.570)	Data Time 0.001 (0.077)	Loss 2.8503 (2.8863)	Entropy 0.65595 (0.65639)	Top-1 acc 55.469 (54.448)	Top-5 acc 77.734 (77.176)	lr 0.01871
Train [41][440/3239]	Time 0.245 (0.566)	Data Time 0.001 (0.075)	Loss 2.9514 (2.8858)	Entropy 0.65548 (0.65638)	Top-1 acc 55.078 (54.455)	Top-5 acc 76.562 (77.173)	lr 0.01871
Train [41][450/3239]	Time 0.228 (0.563)	Data Time 0.001 (0.073)	Loss 2.8987 (2.8863)	Entropy 0.65531 (0.65636)	Top-1 acc 50.781 (54.426)	Top-5 acc 81.250 (77.177)	lr 0.01871
Train [41][460/3239]	Time 0.238 (0.559)	Data Time 0.001 (0.072)	Loss 2.8032 (2.8858)	Entropy 0.65554 (0.65634)	Top-1 acc 58.203 (54.438)	Top-5 acc 78.125 (77.187)	lr 0.01871
Train [41][470/3239]	Time 0.232 (0.556)	Data Time 0.001 (0.070)	Loss 2.8935 (2.8871)	Entropy 0.65573 (0.65632)	Top-1 acc 55.469 (54.408)	Top-5 acc 76.953 (77.173)	lr 0.01871
Train [41][480/3239]	Time 0.326 (0.553)	Data Time 0.001 (0.069)	Loss 2.6712 (2.8865)	Entropy 0.65625 (0.65631)	Top-1 acc 57.812 (54.441)	Top-5 acc 81.250 (77.174)	lr 0.01871
Train [41][490/3239]	Time 0.243 (0.550)	Data Time 0.001 (0.068)	Loss 2.7736 (2.8865)	Entropy 0.65619 (0.65631)	Top-1 acc 55.469 (54.456)	Top-5 acc 80.469 (77.156)	lr 0.01871
Train [41][500/3239]	Time 0.232 (0.546)	Data Time 0.001 (0.066)	Loss 2.9832 (2.8878)	Entropy 0.65615 (0.65631)	Top-1 acc 53.906 (54.449)	Top-5 acc 77.344 (77.128)	lr 0.01871
Train [41][510/3239]	Time 0.255 (0.544)	Data Time 0.001 (0.065)	Loss 3.0039 (2.8877)	Entropy 0.65617 (0.65630)	Top-1 acc 51.562 (54.469)	Top-5 acc 75.000 (77.124)	lr 0.01871
Train [41][520/3239]	Time 0.233 (0.541)	Data Time 0.001 (0.064)	Loss 2.7436 (2.8879)	Entropy 0.65574 (0.65630)	Top-1 acc 55.859 (54.467)	Top-5 acc 80.859 (77.119)	lr 0.01870
Train [41][530/3239]	Time 0.234 (0.539)	Data Time 0.001 (0.063)	Loss 2.8250 (2.8874)	Entropy 0.65575 (0.65629)	Top-1 acc 55.469 (54.479)	Top-5 acc 78.516 (77.119)	lr 0.01870
Train [41][540/3239]	Time 0.231 (0.536)	Data Time 0.001 (0.062)	Loss 2.8449 (2.8880)	Entropy 0.65556 (0.65628)	Top-1 acc 54.688 (54.468)	Top-5 acc 78.906 (77.113)	lr 0.01870
Train [41][550/3239]	Time 0.244 (0.534)	Data Time 0.001 (0.060)	Loss 2.8103 (2.8875)	Entropy 0.65520 (0.65626)	Top-1 acc 55.078 (54.478)	Top-5 acc 79.297 (77.118)	lr 0.01870
Train [41][560/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.059)	Loss 2.8804 (2.8867)	Entropy 0.65531 (0.65624)	Top-1 acc 54.297 (54.502)	Top-5 acc 78.125 (77.148)	lr 0.01870
Train [41][570/3239]	Time 0.359 (0.530)	Data Time 0.001 (0.058)	Loss 2.8719 (2.8874)	Entropy 0.65531 (0.65623)	Top-1 acc 51.172 (54.510)	Top-5 acc 76.562 (77.123)	lr 0.01870
Train [41][580/3239]	Time 0.225 (0.527)	Data Time 0.001 (0.057)	Loss 2.9158 (2.8868)	Entropy 0.65538 (0.65621)	Top-1 acc 51.172 (54.501)	Top-5 acc 77.734 (77.149)	lr 0.01870
Train [41][590/3239]	Time 0.239 (0.525)	Data Time 0.001 (0.056)	Loss 2.6829 (2.8864)	Entropy 0.65556 (0.65620)	Top-1 acc 58.984 (54.494)	Top-5 acc 80.469 (77.165)	lr 0.01870
Train [41][600/3239]	Time 0.264 (0.523)	Data Time 0.001 (0.056)	Loss 2.8155 (2.8852)	Entropy 0.65520 (0.65619)	Top-1 acc 58.594 (54.517)	Top-5 acc 79.297 (77.188)	lr 0.01870
Train [41][610/3239]	Time 0.235 (0.521)	Data Time 0.001 (0.055)	Loss 3.0231 (2.8852)	Entropy 0.65511 (0.65617)	Top-1 acc 51.172 (54.526)	Top-5 acc 73.438 (77.189)	lr 0.01870
Train [41][620/3239]	Time 0.242 (0.520)	Data Time 0.001 (0.054)	Loss 2.9425 (2.8864)	Entropy 0.65542 (0.65616)	Top-1 acc 53.906 (54.487)	Top-5 acc 75.000 (77.173)	lr 0.01870
Train [41][630/3239]	Time 0.238 (0.518)	Data Time 0.002 (0.053)	Loss 2.6576 (2.8863)	Entropy 0.65588 (0.65615)	Top-1 acc 61.328 (54.480)	Top-5 acc 81.250 (77.167)	lr 0.01869
Train [41][640/3239]	Time 0.341 (0.517)	Data Time 0.002 (0.052)	Loss 3.0454 (2.8860)	Entropy 0.65565 (0.65614)	Top-1 acc 51.172 (54.480)	Top-5 acc 73.438 (77.175)	lr 0.01869
Train [41][650/3239]	Time 0.254 (0.515)	Data Time 0.001 (0.051)	Loss 2.7686 (2.8858)	Entropy 0.65569 (0.65613)	Top-1 acc 57.031 (54.495)	Top-5 acc 77.734 (77.175)	lr 0.01869
Train [41][660/3239]	Time 0.233 (0.514)	Data Time 0.001 (0.051)	Loss 3.0189 (2.8860)	Entropy 0.65540 (0.65612)	Top-1 acc 48.438 (54.487)	Top-5 acc 76.172 (77.174)	lr 0.01869
Train [41][670/3239]	Time 0.233 (0.512)	Data Time 0.001 (0.050)	Loss 2.9843 (2.8862)	Entropy 0.65545 (0.65611)	Top-1 acc 52.734 (54.506)	Top-5 acc 76.172 (77.170)	lr 0.01869
Train [41][680/3239]	Time 0.236 (0.511)	Data Time 0.001 (0.049)	Loss 2.8483 (2.8848)	Entropy 0.65558 (0.65610)	Top-1 acc 56.250 (54.551)	Top-5 acc 76.562 (77.191)	lr 0.01869
Train [41][690/3239]	Time 0.229 (0.510)	Data Time 0.001 (0.049)	Loss 2.8625 (2.8844)	Entropy 0.65556 (0.65610)	Top-1 acc 60.156 (54.561)	Top-5 acc 75.000 (77.191)	lr 0.01869
Train [41][700/3239]	Time 0.232 (0.508)	Data Time 0.001 (0.048)	Loss 2.7297 (2.8847)	Entropy 0.65532 (0.65609)	Top-1 acc 60.156 (54.548)	Top-5 acc 79.688 (77.179)	lr 0.01869
Train [41][710/3239]	Time 0.239 (0.507)	Data Time 0.001 (0.047)	Loss 2.8218 (2.8849)	Entropy 0.65511 (0.65608)	Top-1 acc 54.297 (54.542)	Top-5 acc 80.078 (77.172)	lr 0.01869
Train [41][720/3239]	Time 0.297 (0.552)	Data Time 0.003 (0.047)	Loss 2.6093 (2.8849)	Entropy 0.65522 (0.65606)	Top-1 acc 63.672 (54.550)	Top-5 acc 83.594 (77.171)	lr 0.01869
Train [41][730/3239]	Time 0.345 (0.551)	Data Time 0.002 (0.046)	Loss 2.8707 (2.8850)	Entropy 0.65501 (0.65605)	Top-1 acc 56.641 (54.546)	Top-5 acc 77.344 (77.166)	lr 0.01869
Train [41][740/3239]	Time 0.253 (0.549)	Data Time 0.001 (0.045)	Loss 3.0066 (2.8854)	Entropy 0.65467 (0.65603)	Top-1 acc 50.000 (54.535)	Top-5 acc 76.562 (77.159)	lr 0.01869
Train [41][750/3239]	Time 0.237 (0.547)	Data Time 0.001 (0.045)	Loss 2.8638 (2.8861)	Entropy 0.65490 (0.65602)	Top-1 acc 55.859 (54.513)	Top-5 acc 78.125 (77.148)	lr 0.01868
Train [41][760/3239]	Time 0.223 (0.545)	Data Time 0.001 (0.044)	Loss 2.8745 (2.8860)	Entropy 0.65510 (0.65600)	Top-1 acc 57.422 (54.525)	Top-5 acc 81.250 (77.166)	lr 0.01868
Train [41][770/3239]	Time 0.218 (0.544)	Data Time 0.001 (0.044)	Loss 2.7530 (2.8865)	Entropy 0.65522 (0.65599)	Top-1 acc 58.203 (54.518)	Top-5 acc 79.297 (77.149)	lr 0.01868
Train [41][780/3239]	Time 0.229 (0.542)	Data Time 0.001 (0.043)	Loss 2.8744 (2.8865)	Entropy 0.65554 (0.65598)	Top-1 acc 51.562 (54.528)	Top-5 acc 75.000 (77.142)	lr 0.01868
Train [41][790/3239]	Time 0.250 (0.540)	Data Time 0.001 (0.043)	Loss 2.9981 (2.8856)	Entropy 0.65505 (0.65597)	Top-1 acc 55.469 (54.554)	Top-5 acc 73.438 (77.157)	lr 0.01868
Train [41][800/3239]	Time 0.330 (0.539)	Data Time 0.001 (0.042)	Loss 2.8438 (2.8850)	Entropy 0.65525 (0.65596)	Top-1 acc 56.250 (54.569)	Top-5 acc 81.641 (77.170)	lr 0.01868
Train [41][810/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.042)	Loss 2.7614 (2.8853)	Entropy 0.65538 (0.65596)	Top-1 acc 56.250 (54.563)	Top-5 acc 78.516 (77.168)	lr 0.01868
Train [41][820/3239]	Time 0.226 (0.536)	Data Time 0.001 (0.041)	Loss 3.1132 (2.8852)	Entropy 0.65548 (0.65595)	Top-1 acc 50.781 (54.559)	Top-5 acc 72.656 (77.168)	lr 0.01868
Train [41][830/3239]	Time 0.235 (0.534)	Data Time 0.001 (0.041)	Loss 3.0457 (2.8857)	Entropy 0.65496 (0.65594)	Top-1 acc 50.781 (54.550)	Top-5 acc 74.219 (77.150)	lr 0.01868
Train [41][840/3239]	Time 0.245 (0.533)	Data Time 0.001 (0.040)	Loss 2.7900 (2.8851)	Entropy 0.65471 (0.65593)	Top-1 acc 58.203 (54.579)	Top-5 acc 78.516 (77.168)	lr 0.01868
Train [41][850/3239]	Time 0.238 (0.532)	Data Time 0.001 (0.040)	Loss 3.0829 (2.8855)	Entropy 0.65493 (0.65591)	Top-1 acc 46.094 (54.564)	Top-5 acc 75.781 (77.162)	lr 0.01868
Train [41][860/3239]	Time 0.238 (0.531)	Data Time 0.001 (0.039)	Loss 2.7604 (2.8840)	Entropy 0.65531 (0.65590)	Top-1 acc 55.078 (54.594)	Top-5 acc 80.469 (77.184)	lr 0.01867
Train [41][870/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.039)	Loss 2.6962 (2.8836)	Entropy 0.65545 (0.65590)	Top-1 acc 58.203 (54.604)	Top-5 acc 82.031 (77.191)	lr 0.01867
Train [41][880/3239]	Time 0.223 (0.528)	Data Time 0.001 (0.039)	Loss 2.8545 (2.8836)	Entropy 0.65566 (0.65589)	Top-1 acc 58.984 (54.614)	Top-5 acc 75.781 (77.199)	lr 0.01867
Train [41][890/3239]	Time 0.228 (0.527)	Data Time 0.001 (0.038)	Loss 2.9679 (2.8836)	Entropy 0.65585 (0.65589)	Top-1 acc 54.688 (54.611)	Top-5 acc 76.172 (77.199)	lr 0.01867
Train [41][900/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.038)	Loss 3.2615 (2.8840)	Entropy 0.65595 (0.65589)	Top-1 acc 42.969 (54.605)	Top-5 acc 67.578 (77.191)	lr 0.01867
Train [41][910/3239]	Time 0.244 (0.524)	Data Time 0.001 (0.037)	Loss 2.9002 (2.8845)	Entropy 0.65571 (0.65589)	Top-1 acc 53.516 (54.596)	Top-5 acc 75.781 (77.180)	lr 0.01867
Train [41][920/3239]	Time 0.231 (0.523)	Data Time 0.001 (0.037)	Loss 2.9164 (2.8848)	Entropy 0.65586 (0.65589)	Top-1 acc 53.516 (54.581)	Top-5 acc 76.953 (77.175)	lr 0.01867
Train [41][930/3239]	Time 0.253 (0.522)	Data Time 0.001 (0.037)	Loss 2.9276 (2.8846)	Entropy 0.65599 (0.65589)	Top-1 acc 50.000 (54.581)	Top-5 acc 79.297 (77.179)	lr 0.01867
Train [41][940/3239]	Time 0.233 (0.521)	Data Time 0.001 (0.036)	Loss 2.9151 (2.8841)	Entropy 0.65609 (0.65589)	Top-1 acc 58.203 (54.591)	Top-5 acc 75.391 (77.194)	lr 0.01867
Train [41][950/3239]	Time 0.239 (0.520)	Data Time 0.001 (0.036)	Loss 2.8823 (2.8840)	Entropy 0.65611 (0.65590)	Top-1 acc 55.469 (54.586)	Top-5 acc 76.562 (77.195)	lr 0.01867
Train [41][960/3239]	Time 0.323 (0.519)	Data Time 0.001 (0.035)	Loss 2.7249 (2.8845)	Entropy 0.65608 (0.65590)	Top-1 acc 59.375 (54.581)	Top-5 acc 78.516 (77.187)	lr 0.01867
Train [41][970/3239]	Time 0.238 (0.518)	Data Time 0.001 (0.035)	Loss 2.8061 (2.8849)	Entropy 0.65617 (0.65590)	Top-1 acc 57.031 (54.576)	Top-5 acc 74.609 (77.166)	lr 0.01866
Train [41][980/3239]	Time 0.241 (0.517)	Data Time 0.001 (0.035)	Loss 2.8202 (2.8853)	Entropy 0.65633 (0.65591)	Top-1 acc 56.250 (54.562)	Top-5 acc 78.125 (77.147)	lr 0.01866
Train [41][990/3239]	Time 0.236 (0.516)	Data Time 0.001 (0.034)	Loss 2.8295 (2.8855)	Entropy 0.65604 (0.65591)	Top-1 acc 53.906 (54.555)	Top-5 acc 77.734 (77.143)	lr 0.01866
Train [41][1000/3239]	Time 0.237 (0.515)	Data Time 0.001 (0.034)	Loss 2.8333 (2.8849)	Entropy 0.65607 (0.65591)	Top-1 acc 57.031 (54.565)	Top-5 acc 78.125 (77.153)	lr 0.01866
Train [41][1010/3239]	Time 0.234 (0.514)	Data Time 0.001 (0.034)	Loss 2.8312 (2.8850)	Entropy 0.65614 (0.65591)	Top-1 acc 57.031 (54.565)	Top-5 acc 77.734 (77.152)	lr 0.01866
Train [41][1020/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.033)	Loss 3.1303 (2.8851)	Entropy 0.65628 (0.65591)	Top-1 acc 48.047 (54.564)	Top-5 acc 71.875 (77.144)	lr 0.01866
Train [41][1030/3239]	Time 0.320 (0.513)	Data Time 0.001 (0.033)	Loss 2.9108 (2.8847)	Entropy 0.65608 (0.65592)	Top-1 acc 51.953 (54.581)	Top-5 acc 73.828 (77.145)	lr 0.01866
Train [41][1040/3239]	Time 0.234 (0.512)	Data Time 0.002 (0.033)	Loss 2.8214 (2.8850)	Entropy 0.65583 (0.65592)	Top-1 acc 55.469 (54.573)	Top-5 acc 78.906 (77.141)	lr 0.01866
Train [41][1050/3239]	Time 0.264 (0.511)	Data Time 0.001 (0.033)	Loss 2.7863 (2.8844)	Entropy 0.65596 (0.65592)	Top-1 acc 55.859 (54.584)	Top-5 acc 77.344 (77.148)	lr 0.01866
Train [41][1060/3239]	Time 0.224 (0.510)	Data Time 0.001 (0.032)	Loss 2.7433 (2.8840)	Entropy 0.65592 (0.65592)	Top-1 acc 59.766 (54.582)	Top-5 acc 79.688 (77.153)	lr 0.01866
Train [41][1070/3239]	Time 0.258 (0.509)	Data Time 0.001 (0.032)	Loss 3.0788 (2.8838)	Entropy 0.65577 (0.65592)	Top-1 acc 49.219 (54.584)	Top-5 acc 75.000 (77.156)	lr 0.01866
Train [41][1080/3239]	Time 0.231 (0.508)	Data Time 0.001 (0.032)	Loss 2.7994 (2.8835)	Entropy 0.65600 (0.65591)	Top-1 acc 54.297 (54.579)	Top-5 acc 80.859 (77.163)	lr 0.01866
Train [41][1090/3239]	Time 0.226 (0.507)	Data Time 0.001 (0.031)	Loss 3.0170 (2.8841)	Entropy 0.65616 (0.65592)	Top-1 acc 49.609 (54.557)	Top-5 acc 74.219 (77.146)	lr 0.01865
Train [41][1100/3239]	Time 0.227 (0.506)	Data Time 0.001 (0.031)	Loss 2.7541 (2.8841)	Entropy 0.65588 (0.65592)	Top-1 acc 57.812 (54.554)	Top-5 acc 79.688 (77.146)	lr 0.01865
Train [41][1110/3239]	Time 0.226 (0.505)	Data Time 0.001 (0.031)	Loss 2.8671 (2.8845)	Entropy 0.65569 (0.65592)	Top-1 acc 56.641 (54.544)	Top-5 acc 80.078 (77.139)	lr 0.01865
Train [41][1120/3239]	Time 0.345 (0.505)	Data Time 0.001 (0.031)	Loss 2.7773 (2.8844)	Entropy 0.65562 (0.65591)	Top-1 acc 62.891 (54.556)	Top-5 acc 79.297 (77.144)	lr 0.01865
Train [41][1130/3239]	Time 0.243 (0.504)	Data Time 0.001 (0.030)	Loss 2.8282 (2.8839)	Entropy 0.65515 (0.65591)	Top-1 acc 57.422 (54.564)	Top-5 acc 78.906 (77.153)	lr 0.01865
Train [41][1140/3239]	Time 0.240 (0.503)	Data Time 0.001 (0.030)	Loss 2.7192 (2.8840)	Entropy 0.65495 (0.65590)	Top-1 acc 56.641 (54.566)	Top-5 acc 81.641 (77.158)	lr 0.01865
Train [41][1150/3239]	Time 0.231 (0.502)	Data Time 0.001 (0.030)	Loss 3.0112 (2.8843)	Entropy 0.65479 (0.65589)	Top-1 acc 55.078 (54.561)	Top-5 acc 74.609 (77.150)	lr 0.01865
Train [41][1160/3239]	Time 0.266 (0.501)	Data Time 0.001 (0.030)	Loss 2.8398 (2.8845)	Entropy 0.65481 (0.65588)	Top-1 acc 54.688 (54.558)	Top-5 acc 80.078 (77.150)	lr 0.01865
Train [41][1170/3239]	Time 0.233 (0.500)	Data Time 0.001 (0.029)	Loss 2.6952 (2.8838)	Entropy 0.65519 (0.65588)	Top-1 acc 61.328 (54.575)	Top-5 acc 80.078 (77.170)	lr 0.01865
Train [41][1180/3239]	Time 0.233 (0.500)	Data Time 0.001 (0.029)	Loss 2.7876 (2.8835)	Entropy 0.65531 (0.65587)	Top-1 acc 61.719 (54.586)	Top-5 acc 77.344 (77.176)	lr 0.01865
Train [41][1190/3239]	Time 0.325 (0.499)	Data Time 0.001 (0.029)	Loss 2.8213 (2.8833)	Entropy 0.65546 (0.65587)	Top-1 acc 53.516 (54.589)	Top-5 acc 79.688 (77.184)	lr 0.01865
Train [41][1200/3239]	Time 0.237 (0.498)	Data Time 0.001 (0.029)	Loss 2.9243 (2.8826)	Entropy 0.65541 (0.65586)	Top-1 acc 56.250 (54.608)	Top-5 acc 78.516 (77.200)	lr 0.01864
Train [41][1210/3239]	Time 0.227 (0.497)	Data Time 0.001 (0.028)	Loss 2.8467 (2.8822)	Entropy 0.65501 (0.65586)	Top-1 acc 52.734 (54.616)	Top-5 acc 76.562 (77.208)	lr 0.01864
Train [41][1220/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.028)	Loss 2.9649 (2.8818)	Entropy 0.65500 (0.65585)	Top-1 acc 50.391 (54.621)	Top-5 acc 75.000 (77.213)	lr 0.01864
Train [41][1230/3239]	Time 0.227 (0.496)	Data Time 0.001 (0.028)	Loss 2.8015 (2.8818)	Entropy 0.65503 (0.65584)	Top-1 acc 56.641 (54.627)	Top-5 acc 79.688 (77.217)	lr 0.01864
Train [41][1240/3239]	Time 0.239 (0.495)	Data Time 0.001 (0.028)	Loss 3.0859 (2.8820)	Entropy 0.65492 (0.65583)	Top-1 acc 51.953 (54.625)	Top-5 acc 73.047 (77.215)	lr 0.01864
Train [41][1250/3239]	Time 0.282 (0.495)	Data Time 0.001 (0.028)	Loss 2.8585 (2.8822)	Entropy 0.65487 (0.65583)	Top-1 acc 52.344 (54.611)	Top-5 acc 79.297 (77.210)	lr 0.01864
Train [41][1260/3239]	Time 0.249 (0.494)	Data Time 0.001 (0.027)	Loss 2.9322 (2.8822)	Entropy 0.65513 (0.65582)	Top-1 acc 54.688 (54.613)	Top-5 acc 76.562 (77.216)	lr 0.01864
Train [41][1270/3239]	Time 0.235 (0.494)	Data Time 0.001 (0.027)	Loss 3.1182 (2.8825)	Entropy 0.65479 (0.65581)	Top-1 acc 48.438 (54.609)	Top-5 acc 71.875 (77.210)	lr 0.01864
Train [41][1280/3239]	Time 0.253 (0.493)	Data Time 0.001 (0.027)	Loss 2.9381 (2.8823)	Entropy 0.65490 (0.65581)	Top-1 acc 53.516 (54.609)	Top-5 acc 79.297 (77.220)	lr 0.01864
Train [41][1290/3239]	Time 0.246 (0.492)	Data Time 0.002 (0.027)	Loss 3.0402 (2.8821)	Entropy 0.65422 (0.65580)	Top-1 acc 54.688 (54.619)	Top-5 acc 75.781 (77.225)	lr 0.01864
Train [41][1300/3239]	Time 0.235 (0.492)	Data Time 0.002 (0.027)	Loss 2.9391 (2.8824)	Entropy 0.65455 (0.65579)	Top-1 acc 53.125 (54.614)	Top-5 acc 75.000 (77.210)	lr 0.01864
Train [41][1310/3239]	Time 0.249 (0.491)	Data Time 0.001 (0.026)	Loss 3.0109 (2.8821)	Entropy 0.65448 (0.65578)	Top-1 acc 50.781 (54.622)	Top-5 acc 76.172 (77.221)	lr 0.01864
Train [41][1320/3239]	Time 0.241 (0.490)	Data Time 0.001 (0.026)	Loss 2.9376 (2.8822)	Entropy 0.65391 (0.65577)	Top-1 acc 55.078 (54.626)	Top-5 acc 72.266 (77.218)	lr 0.01863
Train [41][1330/3239]	Time 0.229 (0.490)	Data Time 0.001 (0.026)	Loss 2.8652 (2.8822)	Entropy 0.65430 (0.65575)	Top-1 acc 55.078 (54.621)	Top-5 acc 78.906 (77.216)	lr 0.01863
Train [41][1340/3239]	Time 0.236 (0.489)	Data Time 0.001 (0.026)	Loss 2.7023 (2.8826)	Entropy 0.65441 (0.65574)	Top-1 acc 62.109 (54.611)	Top-5 acc 81.250 (77.211)	lr 0.01863
Train [41][1350/3239]	Time 0.329 (0.488)	Data Time 0.002 (0.026)	Loss 2.9439 (2.8824)	Entropy 0.65411 (0.65573)	Top-1 acc 57.031 (54.615)	Top-5 acc 73.047 (77.216)	lr 0.01863
Train [41][1360/3239]	Time 0.231 (0.488)	Data Time 0.002 (0.026)	Loss 2.9374 (2.8827)	Entropy 0.65404 (0.65572)	Top-1 acc 51.562 (54.606)	Top-5 acc 77.734 (77.212)	lr 0.01863
Train [41][1370/3239]	Time 0.423 (0.512)	Data Time 0.006 (0.025)	Loss 2.8687 (2.8827)	Entropy 0.65413 (0.65571)	Top-1 acc 55.859 (54.610)	Top-5 acc 78.906 (77.213)	lr 0.01863
Train [41][1380/3239]	Time 0.241 (0.512)	Data Time 0.002 (0.025)	Loss 2.7431 (2.8829)	Entropy 0.65420 (0.65570)	Top-1 acc 55.859 (54.601)	Top-5 acc 77.344 (77.212)	lr 0.01863
Train [41][1390/3239]	Time 0.245 (0.511)	Data Time 0.002 (0.025)	Loss 2.9024 (2.8831)	Entropy 0.65396 (0.65568)	Top-1 acc 54.688 (54.595)	Top-5 acc 79.688 (77.212)	lr 0.01863
Train [41][1400/3239]	Time 0.267 (0.510)	Data Time 0.001 (0.025)	Loss 2.9738 (2.8837)	Entropy 0.65357 (0.65567)	Top-1 acc 51.562 (54.581)	Top-5 acc 76.172 (77.197)	lr 0.01863
Train [41][1410/3239]	Time 0.239 (0.510)	Data Time 0.001 (0.025)	Loss 2.9645 (2.8839)	Entropy 0.65357 (0.65566)	Top-1 acc 50.391 (54.569)	Top-5 acc 76.172 (77.191)	lr 0.01863
Train [41][1420/3239]	Time 0.266 (0.509)	Data Time 0.003 (0.025)	Loss 2.7800 (2.8840)	Entropy 0.65342 (0.65564)	Top-1 acc 56.641 (54.565)	Top-5 acc 80.859 (77.192)	lr 0.01863
Train [41][1430/3239]	Time 0.237 (0.509)	Data Time 0.001 (0.024)	Loss 3.0444 (2.8841)	Entropy 0.65332 (0.65563)	Top-1 acc 50.781 (54.563)	Top-5 acc 71.484 (77.186)	lr 0.01862
Train [41][1440/3239]	Time 0.274 (0.508)	Data Time 0.002 (0.024)	Loss 2.8223 (2.8842)	Entropy 0.65318 (0.65561)	Top-1 acc 57.031 (54.559)	Top-5 acc 80.859 (77.182)	lr 0.01862
Train [41][1450/3239]	Time 0.235 (0.507)	Data Time 0.001 (0.024)	Loss 3.0174 (2.8848)	Entropy 0.65314 (0.65559)	Top-1 acc 53.125 (54.539)	Top-5 acc 79.297 (77.174)	lr 0.01862
Train [41][1460/3239]	Time 0.229 (0.507)	Data Time 0.001 (0.024)	Loss 2.8816 (2.8848)	Entropy 0.65284 (0.65558)	Top-1 acc 52.344 (54.530)	Top-5 acc 77.734 (77.178)	lr 0.01862
Train [41][1470/3239]	Time 0.238 (0.506)	Data Time 0.001 (0.024)	Loss 2.8928 (2.8848)	Entropy 0.65251 (0.65556)	Top-1 acc 55.469 (54.533)	Top-5 acc 76.953 (77.174)	lr 0.01862
Train [41][1480/3239]	Time 0.265 (0.505)	Data Time 0.001 (0.024)	Loss 2.8462 (2.8849)	Entropy 0.65230 (0.65553)	Top-1 acc 55.078 (54.531)	Top-5 acc 78.125 (77.177)	lr 0.01862
Train [41][1490/3239]	Time 0.241 (0.505)	Data Time 0.001 (0.023)	Loss 2.8949 (2.8850)	Entropy 0.65215 (0.65551)	Top-1 acc 53.516 (54.525)	Top-5 acc 77.344 (77.176)	lr 0.01862
Train [41][1500/3239]	Time 0.241 (0.504)	Data Time 0.001 (0.023)	Loss 2.8058 (2.8851)	Entropy 0.65207 (0.65549)	Top-1 acc 55.078 (54.527)	Top-5 acc 79.688 (77.175)	lr 0.01862
Train [41][1510/3239]	Time 0.346 (0.504)	Data Time 0.002 (0.023)	Loss 2.8878 (2.8853)	Entropy 0.65196 (0.65547)	Top-1 acc 57.031 (54.525)	Top-5 acc 77.734 (77.175)	lr 0.01862
Train [41][1520/3239]	Time 0.226 (0.503)	Data Time 0.001 (0.023)	Loss 2.8546 (2.8852)	Entropy 0.65188 (0.65544)	Top-1 acc 56.250 (54.536)	Top-5 acc 75.781 (77.172)	lr 0.01862
Train [41][1530/3239]	Time 0.224 (0.502)	Data Time 0.001 (0.023)	Loss 2.7470 (2.8849)	Entropy 0.65205 (0.65542)	Top-1 acc 57.422 (54.535)	Top-5 acc 81.250 (77.182)	lr 0.01862
Train [41][1540/3239]	Time 0.230 (0.502)	Data Time 0.001 (0.023)	Loss 2.9129 (2.8849)	Entropy 0.65191 (0.65540)	Top-1 acc 50.781 (54.531)	Top-5 acc 77.344 (77.183)	lr 0.01861
Train [41][1550/3239]	Time 0.229 (0.501)	Data Time 0.002 (0.023)	Loss 3.0178 (2.8853)	Entropy 0.65184 (0.65538)	Top-1 acc 51.562 (54.523)	Top-5 acc 75.781 (77.173)	lr 0.01861
Train [41][1560/3239]	Time 0.222 (0.501)	Data Time 0.001 (0.022)	Loss 2.6925 (2.8854)	Entropy 0.65153 (0.65535)	Top-1 acc 57.031 (54.521)	Top-5 acc 81.250 (77.173)	lr 0.01861
Train [41][1570/3239]	Time 0.234 (0.500)	Data Time 0.001 (0.022)	Loss 2.7615 (2.8853)	Entropy 0.65151 (0.65533)	Top-1 acc 56.641 (54.522)	Top-5 acc 77.734 (77.174)	lr 0.01861
Train [41][1580/3239]	Time 0.325 (0.499)	Data Time 0.001 (0.022)	Loss 2.7282 (2.8853)	Entropy 0.65136 (0.65531)	Top-1 acc 60.547 (54.523)	Top-5 acc 80.078 (77.170)	lr 0.01861
Train [41][1590/3239]	Time 0.276 (0.499)	Data Time 0.001 (0.022)	Loss 2.9363 (2.8852)	Entropy 0.65147 (0.65528)	Top-1 acc 55.078 (54.525)	Top-5 acc 75.000 (77.173)	lr 0.01861
Train [41][1600/3239]	Time 0.233 (0.498)	Data Time 0.001 (0.022)	Loss 2.8802 (2.8854)	Entropy 0.65134 (0.65526)	Top-1 acc 50.781 (54.515)	Top-5 acc 77.344 (77.168)	lr 0.01861
Train [41][1610/3239]	Time 0.237 (0.498)	Data Time 0.001 (0.022)	Loss 2.9107 (2.8853)	Entropy 0.65137 (0.65523)	Top-1 acc 51.562 (54.510)	Top-5 acc 74.219 (77.169)	lr 0.01861
Train [41][1620/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.022)	Loss 2.9521 (2.8857)	Entropy 0.65112 (0.65521)	Top-1 acc 51.562 (54.501)	Top-5 acc 76.562 (77.165)	lr 0.01861
Train [41][1630/3239]	Time 0.232 (0.497)	Data Time 0.001 (0.022)	Loss 2.8175 (2.8859)	Entropy 0.65136 (0.65518)	Top-1 acc 55.469 (54.500)	Top-5 acc 76.953 (77.163)	lr 0.01861
Train [41][1640/3239]	Time 0.236 (0.496)	Data Time 0.001 (0.021)	Loss 2.9276 (2.8864)	Entropy 0.65129 (0.65516)	Top-1 acc 50.391 (54.486)	Top-5 acc 74.219 (77.152)	lr 0.01861
Train [41][1650/3239]	Time 0.243 (0.496)	Data Time 0.001 (0.021)	Loss 2.9373 (2.8859)	Entropy 0.65112 (0.65514)	Top-1 acc 52.734 (54.493)	Top-5 acc 75.000 (77.158)	lr 0.01861
Train [41][1660/3239]	Time 0.236 (0.495)	Data Time 0.001 (0.021)	Loss 3.0012 (2.8863)	Entropy 0.65101 (0.65511)	Top-1 acc 54.688 (54.481)	Top-5 acc 77.734 (77.149)	lr 0.01860
Train [41][1670/3239]	Time 0.340 (0.495)	Data Time 0.001 (0.021)	Loss 2.7607 (2.8860)	Entropy 0.65081 (0.65509)	Top-1 acc 58.594 (54.485)	Top-5 acc 80.469 (77.148)	lr 0.01860
Train [41][1680/3239]	Time 0.238 (0.494)	Data Time 0.001 (0.021)	Loss 2.7464 (2.8856)	Entropy 0.65076 (0.65506)	Top-1 acc 57.812 (54.492)	Top-5 acc 82.812 (77.158)	lr 0.01860
Train [41][1690/3239]	Time 0.229 (0.494)	Data Time 0.001 (0.021)	Loss 2.8222 (2.8854)	Entropy 0.65065 (0.65504)	Top-1 acc 53.125 (54.501)	Top-5 acc 77.344 (77.158)	lr 0.01860
Train [41][1700/3239]	Time 0.278 (0.494)	Data Time 0.001 (0.021)	Loss 2.8597 (2.8853)	Entropy 0.65093 (0.65501)	Top-1 acc 55.469 (54.511)	Top-5 acc 76.953 (77.156)	lr 0.01860
Train [41][1710/3239]	Time 0.233 (0.493)	Data Time 0.001 (0.021)	Loss 2.8157 (2.8852)	Entropy 0.65108 (0.65499)	Top-1 acc 56.250 (54.514)	Top-5 acc 75.781 (77.157)	lr 0.01860
Train [41][1720/3239]	Time 0.218 (0.493)	Data Time 0.001 (0.021)	Loss 2.9439 (2.8853)	Entropy 0.65106 (0.65497)	Top-1 acc 54.688 (54.518)	Top-5 acc 75.391 (77.151)	lr 0.01860
Train [41][1730/3239]	Time 0.226 (0.492)	Data Time 0.001 (0.020)	Loss 2.8646 (2.8850)	Entropy 0.65094 (0.65494)	Top-1 acc 54.688 (54.524)	Top-5 acc 77.734 (77.154)	lr 0.01860
Train [41][1740/3239]	Time 0.322 (0.491)	Data Time 0.001 (0.020)	Loss 3.1474 (2.8857)	Entropy 0.65081 (0.65492)	Top-1 acc 52.734 (54.508)	Top-5 acc 71.875 (77.135)	lr 0.01860
Train [41][1750/3239]	Time 0.228 (0.491)	Data Time 0.001 (0.020)	Loss 2.7284 (2.8855)	Entropy 0.65073 (0.65490)	Top-1 acc 55.469 (54.509)	Top-5 acc 80.469 (77.138)	lr 0.01860
Train [41][1760/3239]	Time 0.224 (0.490)	Data Time 0.001 (0.020)	Loss 2.8810 (2.8854)	Entropy 0.65063 (0.65487)	Top-1 acc 53.125 (54.508)	Top-5 acc 77.344 (77.139)	lr 0.01860
Train [41][1770/3239]	Time 0.233 (0.490)	Data Time 0.001 (0.020)	Loss 2.9512 (2.8857)	Entropy 0.65079 (0.65485)	Top-1 acc 55.078 (54.505)	Top-5 acc 75.000 (77.130)	lr 0.01859
Train [41][1780/3239]	Time 0.230 (0.489)	Data Time 0.001 (0.020)	Loss 2.8258 (2.8857)	Entropy 0.65075 (0.65483)	Top-1 acc 56.641 (54.507)	Top-5 acc 79.297 (77.131)	lr 0.01859
Train [41][1790/3239]	Time 0.243 (0.489)	Data Time 0.001 (0.020)	Loss 2.6819 (2.8852)	Entropy 0.65069 (0.65480)	Top-1 acc 57.812 (54.518)	Top-5 acc 80.078 (77.139)	lr 0.01859
Train [41][1800/3239]	Time 0.231 (0.489)	Data Time 0.001 (0.020)	Loss 2.8530 (2.8854)	Entropy 0.65062 (0.65478)	Top-1 acc 54.297 (54.516)	Top-5 acc 77.734 (77.134)	lr 0.01859
Train [41][1810/3239]	Time 0.227 (0.488)	Data Time 0.001 (0.020)	Loss 2.8933 (2.8854)	Entropy 0.65054 (0.65476)	Top-1 acc 55.469 (54.515)	Top-5 acc 80.859 (77.134)	lr 0.01859
Train [41][1820/3239]	Time 0.237 (0.488)	Data Time 0.001 (0.020)	Loss 3.0579 (2.8855)	Entropy 0.65055 (0.65473)	Top-1 acc 50.000 (54.514)	Top-5 acc 71.484 (77.132)	lr 0.01859
Train [41][1830/3239]	Time 0.254 (0.487)	Data Time 0.001 (0.019)	Loss 2.8394 (2.8852)	Entropy 0.65049 (0.65471)	Top-1 acc 55.469 (54.518)	Top-5 acc 77.344 (77.142)	lr 0.01859
Train [41][1840/3239]	Time 0.231 (0.487)	Data Time 0.001 (0.019)	Loss 2.9653 (2.8852)	Entropy 0.65031 (0.65469)	Top-1 acc 53.906 (54.518)	Top-5 acc 73.828 (77.141)	lr 0.01859
Train [41][1850/3239]	Time 0.246 (0.486)	Data Time 0.001 (0.019)	Loss 2.9253 (2.8852)	Entropy 0.65018 (0.65466)	Top-1 acc 53.125 (54.517)	Top-5 acc 74.609 (77.142)	lr 0.01859
Train [41][1860/3239]	Time 0.262 (0.486)	Data Time 0.001 (0.019)	Loss 2.7940 (2.8852)	Entropy 0.65043 (0.65464)	Top-1 acc 58.594 (54.515)	Top-5 acc 79.297 (77.141)	lr 0.01859
Train [41][1870/3239]	Time 0.266 (0.485)	Data Time 0.001 (0.019)	Loss 2.7350 (2.8847)	Entropy 0.65015 (0.65462)	Top-1 acc 56.641 (54.523)	Top-5 acc 78.516 (77.147)	lr 0.01859
Train [41][1880/3239]	Time 0.239 (0.485)	Data Time 0.001 (0.019)	Loss 2.8023 (2.8845)	Entropy 0.64971 (0.65459)	Top-1 acc 56.250 (54.530)	Top-5 acc 78.125 (77.149)	lr 0.01858
Train [41][1890/3239]	Time 0.229 (0.485)	Data Time 0.001 (0.019)	Loss 2.6351 (2.8846)	Entropy 0.64965 (0.65457)	Top-1 acc 62.500 (54.534)	Top-5 acc 81.250 (77.148)	lr 0.01858
Train [41][1900/3239]	Time 0.314 (0.484)	Data Time 0.001 (0.019)	Loss 2.8324 (2.8847)	Entropy 0.64939 (0.65454)	Top-1 acc 55.859 (54.530)	Top-5 acc 76.953 (77.147)	lr 0.01858
Train [41][1910/3239]	Time 0.232 (0.484)	Data Time 0.001 (0.019)	Loss 2.7737 (2.8850)	Entropy 0.64941 (0.65451)	Top-1 acc 53.516 (54.525)	Top-5 acc 79.688 (77.144)	lr 0.01858
Train [41][1920/3239]	Time 0.249 (0.483)	Data Time 0.001 (0.019)	Loss 2.6410 (2.8849)	Entropy 0.64959 (0.65449)	Top-1 acc 60.547 (54.533)	Top-5 acc 82.031 (77.146)	lr 0.01858
Train [41][1930/3239]	Time 0.238 (0.483)	Data Time 0.002 (0.018)	Loss 2.9584 (2.8848)	Entropy 0.64976 (0.65446)	Top-1 acc 53.906 (54.537)	Top-5 acc 76.562 (77.150)	lr 0.01858
Train [41][1940/3239]	Time 0.239 (0.483)	Data Time 0.001 (0.018)	Loss 2.9477 (2.8846)	Entropy 0.65004 (0.65444)	Top-1 acc 53.125 (54.537)	Top-5 acc 75.781 (77.154)	lr 0.01858
Train [41][1950/3239]	Time 0.245 (0.482)	Data Time 0.001 (0.018)	Loss 2.7346 (2.8848)	Entropy 0.65008 (0.65442)	Top-1 acc 56.641 (54.531)	Top-5 acc 81.250 (77.149)	lr 0.01858
Train [41][1960/3239]	Time 0.234 (0.482)	Data Time 0.001 (0.018)	Loss 2.7612 (2.8847)	Entropy 0.65034 (0.65439)	Top-1 acc 57.031 (54.534)	Top-5 acc 77.344 (77.153)	lr 0.01858
Train [41][1970/3239]	Time 0.324 (0.482)	Data Time 0.001 (0.018)	Loss 3.0169 (2.8845)	Entropy 0.65034 (0.65437)	Top-1 acc 53.125 (54.537)	Top-5 acc 77.344 (77.157)	lr 0.01858
Train [41][1980/3239]	Time 0.233 (0.481)	Data Time 0.001 (0.018)	Loss 2.8201 (2.8844)	Entropy 0.65059 (0.65435)	Top-1 acc 55.859 (54.535)	Top-5 acc 79.297 (77.158)	lr 0.01858
Train [41][1990/3239]	Time 0.229 (0.481)	Data Time 0.001 (0.018)	Loss 3.2832 (2.8848)	Entropy 0.65052 (0.65433)	Top-1 acc 44.922 (54.520)	Top-5 acc 70.703 (77.152)	lr 0.01858
Train [41][2000/3239]	Time 0.249 (0.480)	Data Time 0.001 (0.018)	Loss 2.8547 (2.8850)	Entropy 0.65032 (0.65431)	Top-1 acc 57.031 (54.518)	Top-5 acc 77.344 (77.145)	lr 0.01857
Train [41][2010/3239]	Time 0.227 (0.480)	Data Time 0.001 (0.018)	Loss 2.9935 (2.8853)	Entropy 0.65022 (0.65430)	Top-1 acc 51.562 (54.513)	Top-5 acc 75.000 (77.143)	lr 0.01857
Train [41][2020/3239]	Time 0.233 (0.480)	Data Time 0.001 (0.018)	Loss 2.8855 (2.8852)	Entropy 0.64998 (0.65427)	Top-1 acc 54.688 (54.510)	Top-5 acc 77.734 (77.142)	lr 0.01857
Train [41][2030/3239]	Time 0.231 (0.496)	Data Time 0.002 (0.018)	Loss 2.9659 (2.8850)	Entropy 0.65022 (0.65425)	Top-1 acc 54.688 (54.517)	Top-5 acc 73.828 (77.144)	lr 0.01857
Train [41][2040/3239]	Time 0.235 (0.496)	Data Time 0.002 (0.018)	Loss 2.8904 (2.8853)	Entropy 0.64979 (0.65423)	Top-1 acc 54.688 (54.509)	Top-5 acc 78.516 (77.137)	lr 0.01857
Train [41][2050/3239]	Time 0.239 (0.495)	Data Time 0.001 (0.018)	Loss 2.6698 (2.8853)	Entropy 0.64978 (0.65421)	Top-1 acc 60.156 (54.509)	Top-5 acc 80.859 (77.139)	lr 0.01857
Train [41][2060/3239]	Time 0.370 (0.495)	Data Time 0.001 (0.017)	Loss 2.6892 (2.8853)	Entropy 0.65013 (0.65419)	Top-1 acc 58.594 (54.502)	Top-5 acc 82.031 (77.141)	lr 0.01857
Train [41][2070/3239]	Time 0.238 (0.495)	Data Time 0.001 (0.017)	Loss 2.8328 (2.8851)	Entropy 0.65024 (0.65417)	Top-1 acc 54.297 (54.508)	Top-5 acc 82.422 (77.146)	lr 0.01857
Train [41][2080/3239]	Time 0.242 (0.494)	Data Time 0.001 (0.017)	Loss 2.7745 (2.8854)	Entropy 0.65026 (0.65415)	Top-1 acc 59.766 (54.498)	Top-5 acc 78.906 (77.140)	lr 0.01857
Train [41][2090/3239]	Time 0.237 (0.494)	Data Time 0.001 (0.017)	Loss 2.7448 (2.8852)	Entropy 0.65001 (0.65413)	Top-1 acc 59.766 (54.499)	Top-5 acc 77.344 (77.142)	lr 0.01857
Train [41][2100/3239]	Time 0.241 (0.494)	Data Time 0.001 (0.017)	Loss 2.8828 (2.8851)	Entropy 0.65004 (0.65411)	Top-1 acc 56.250 (54.499)	Top-5 acc 78.516 (77.144)	lr 0.01857
Train [41][2110/3239]	Time 0.234 (0.493)	Data Time 0.001 (0.017)	Loss 2.9102 (2.8852)	Entropy 0.65008 (0.65410)	Top-1 acc 54.297 (54.495)	Top-5 acc 76.172 (77.144)	lr 0.01856
Train [41][2120/3239]	Time 0.237 (0.493)	Data Time 0.001 (0.017)	Loss 2.8105 (2.8852)	Entropy 0.64989 (0.65408)	Top-1 acc 58.984 (54.499)	Top-5 acc 78.125 (77.144)	lr 0.01856
Train [41][2130/3239]	Time 0.376 (0.493)	Data Time 0.001 (0.017)	Loss 2.7144 (2.8851)	Entropy 0.64979 (0.65406)	Top-1 acc 56.250 (54.498)	Top-5 acc 80.859 (77.145)	lr 0.01856
Train [41][2140/3239]	Time 0.271 (0.492)	Data Time 0.001 (0.017)	Loss 2.9439 (2.8853)	Entropy 0.64954 (0.65404)	Top-1 acc 54.297 (54.493)	Top-5 acc 75.781 (77.138)	lr 0.01856
Train [41][2150/3239]	Time 0.240 (0.492)	Data Time 0.001 (0.017)	Loss 2.7855 (2.8852)	Entropy 0.64989 (0.65402)	Top-1 acc 56.641 (54.498)	Top-5 acc 80.859 (77.141)	lr 0.01856
Train [41][2160/3239]	Time 0.262 (0.492)	Data Time 0.002 (0.017)	Loss 2.8934 (2.8855)	Entropy 0.64934 (0.65400)	Top-1 acc 56.250 (54.493)	Top-5 acc 75.781 (77.128)	lr 0.01856
Train [41][2170/3239]	Time 0.243 (0.492)	Data Time 0.001 (0.017)	Loss 2.9115 (2.8854)	Entropy 0.64934 (0.65397)	Top-1 acc 53.516 (54.494)	Top-5 acc 76.953 (77.126)	lr 0.01856
Train [41][2180/3239]	Time 0.278 (0.491)	Data Time 0.002 (0.017)	Loss 2.9171 (2.8854)	Entropy 0.64944 (0.65395)	Top-1 acc 52.344 (54.496)	Top-5 acc 77.344 (77.122)	lr 0.01856
Train [41][2190/3239]	Time 0.286 (0.491)	Data Time 0.001 (0.017)	Loss 2.7593 (2.8852)	Entropy 0.64955 (0.65393)	Top-1 acc 57.031 (54.499)	Top-5 acc 78.516 (77.126)	lr 0.01856
Train [41][2200/3239]	Time 0.231 (0.491)	Data Time 0.001 (0.016)	Loss 2.6573 (2.8853)	Entropy 0.64935 (0.65391)	Top-1 acc 58.984 (54.497)	Top-5 acc 82.031 (77.128)	lr 0.01856
Train [41][2210/3239]	Time 0.242 (0.491)	Data Time 0.001 (0.016)	Loss 3.0898 (2.8856)	Entropy 0.64934 (0.65389)	Top-1 acc 50.391 (54.490)	Top-5 acc 74.219 (77.122)	lr 0.01856
Train [41][2220/3239]	Time 0.339 (0.490)	Data Time 0.002 (0.016)	Loss 2.9396 (2.8858)	Entropy 0.64940 (0.65387)	Top-1 acc 53.906 (54.487)	Top-5 acc 77.344 (77.119)	lr 0.01855
Train [41][2230/3239]	Time 0.270 (0.490)	Data Time 0.001 (0.016)	Loss 3.0304 (2.8856)	Entropy 0.64974 (0.65385)	Top-1 acc 53.906 (54.493)	Top-5 acc 78.906 (77.124)	lr 0.01855
Train [41][2240/3239]	Time 0.241 (0.490)	Data Time 0.001 (0.016)	Loss 2.5641 (2.8858)	Entropy 0.65006 (0.65383)	Top-1 acc 60.938 (54.491)	Top-5 acc 82.031 (77.123)	lr 0.01855
Train [41][2250/3239]	Time 0.289 (0.489)	Data Time 0.002 (0.016)	Loss 2.9877 (2.8859)	Entropy 0.64999 (0.65382)	Top-1 acc 52.734 (54.489)	Top-5 acc 74.609 (77.123)	lr 0.01855
Train [41][2260/3239]	Time 0.223 (0.489)	Data Time 0.001 (0.016)	Loss 2.7053 (2.8858)	Entropy 0.64938 (0.65380)	Top-1 acc 56.250 (54.488)	Top-5 acc 83.984 (77.122)	lr 0.01855
Train [41][2270/3239]	Time 0.225 (0.489)	Data Time 0.001 (0.016)	Loss 3.0622 (2.8862)	Entropy 0.64936 (0.65378)	Top-1 acc 52.734 (54.483)	Top-5 acc 75.781 (77.116)	lr 0.01855
Train [41][2280/3239]	Time 0.231 (0.489)	Data Time 0.001 (0.016)	Loss 2.8484 (2.8864)	Entropy 0.64947 (0.65376)	Top-1 acc 59.766 (54.483)	Top-5 acc 75.781 (77.113)	lr 0.01855
Train [41][2290/3239]	Time 0.322 (0.488)	Data Time 0.001 (0.016)	Loss 2.7576 (2.8859)	Entropy 0.64915 (0.65374)	Top-1 acc 57.422 (54.496)	Top-5 acc 79.297 (77.123)	lr 0.01855
Train [41][2300/3239]	Time 0.297 (0.488)	Data Time 0.001 (0.016)	Loss 2.8115 (2.8858)	Entropy 0.64921 (0.65372)	Top-1 acc 51.953 (54.497)	Top-5 acc 78.516 (77.123)	lr 0.01855
Train [41][2310/3239]	Time 0.238 (0.488)	Data Time 0.001 (0.016)	Loss 2.8007 (2.8855)	Entropy 0.64945 (0.65370)	Top-1 acc 57.812 (54.503)	Top-5 acc 78.125 (77.130)	lr 0.01855
Train [41][2320/3239]	Time 0.233 (0.488)	Data Time 0.001 (0.016)	Loss 2.7857 (2.8854)	Entropy 0.64950 (0.65368)	Top-1 acc 60.547 (54.508)	Top-5 acc 78.516 (77.134)	lr 0.01855
Train [41][2330/3239]	Time 0.238 (0.487)	Data Time 0.001 (0.016)	Loss 2.9299 (2.8854)	Entropy 0.64963 (0.65367)	Top-1 acc 52.734 (54.509)	Top-5 acc 76.172 (77.134)	lr 0.01855
Train [41][2340/3239]	Time 0.221 (0.487)	Data Time 0.001 (0.016)	Loss 2.7980 (2.8852)	Entropy 0.64968 (0.65365)	Top-1 acc 57.812 (54.513)	Top-5 acc 78.516 (77.136)	lr 0.01854
Train [41][2350/3239]	Time 0.242 (0.487)	Data Time 0.001 (0.016)	Loss 2.9565 (2.8853)	Entropy 0.64938 (0.65363)	Top-1 acc 58.203 (54.512)	Top-5 acc 75.781 (77.132)	lr 0.01854
Train [41][2360/3239]	Time 0.252 (0.486)	Data Time 0.001 (0.015)	Loss 2.8502 (2.8848)	Entropy 0.64943 (0.65361)	Top-1 acc 54.688 (54.522)	Top-5 acc 76.172 (77.142)	lr 0.01854
Train [41][2370/3239]	Time 0.231 (0.486)	Data Time 0.001 (0.015)	Loss 2.6846 (2.8846)	Entropy 0.64939 (0.65360)	Top-1 acc 57.031 (54.525)	Top-5 acc 81.641 (77.145)	lr 0.01854
Train [41][2380/3239]	Time 0.329 (0.486)	Data Time 0.001 (0.015)	Loss 2.6608 (2.8843)	Entropy 0.64970 (0.65358)	Top-1 acc 61.328 (54.535)	Top-5 acc 80.078 (77.150)	lr 0.01854
Train [41][2390/3239]	Time 0.226 (0.485)	Data Time 0.001 (0.015)	Loss 2.8724 (2.8845)	Entropy 0.64996 (0.65356)	Top-1 acc 53.125 (54.532)	Top-5 acc 76.953 (77.143)	lr 0.01854
Train [41][2400/3239]	Time 0.233 (0.485)	Data Time 0.001 (0.015)	Loss 2.7517 (2.8847)	Entropy 0.65013 (0.65355)	Top-1 acc 55.078 (54.528)	Top-5 acc 81.250 (77.142)	lr 0.01854
Train [41][2410/3239]	Time 0.236 (0.485)	Data Time 0.001 (0.015)	Loss 2.7661 (2.8849)	Entropy 0.65034 (0.65353)	Top-1 acc 58.203 (54.525)	Top-5 acc 80.469 (77.139)	lr 0.01854
Train [41][2420/3239]	Time 0.255 (0.484)	Data Time 0.001 (0.015)	Loss 2.7029 (2.8848)	Entropy 0.65001 (0.65352)	Top-1 acc 56.641 (54.525)	Top-5 acc 80.469 (77.139)	lr 0.01854
Train [41][2430/3239]	Time 0.223 (0.484)	Data Time 0.001 (0.015)	Loss 2.9387 (2.8847)	Entropy 0.65012 (0.65351)	Top-1 acc 53.125 (54.523)	Top-5 acc 76.953 (77.142)	lr 0.01854
Train [41][2440/3239]	Time 0.229 (0.484)	Data Time 0.001 (0.015)	Loss 2.6910 (2.8848)	Entropy 0.64986 (0.65349)	Top-1 acc 53.516 (54.518)	Top-5 acc 80.859 (77.139)	lr 0.01854
Train [41][2450/3239]	Time 0.353 (0.484)	Data Time 0.001 (0.015)	Loss 2.9139 (2.8847)	Entropy 0.65004 (0.65348)	Top-1 acc 52.344 (54.516)	Top-5 acc 77.344 (77.142)	lr 0.01853
Train [41][2460/3239]	Time 0.231 (0.483)	Data Time 0.001 (0.015)	Loss 2.7079 (2.8850)	Entropy 0.64996 (0.65346)	Top-1 acc 57.031 (54.512)	Top-5 acc 80.469 (77.138)	lr 0.01853
Train [41][2470/3239]	Time 0.256 (0.483)	Data Time 0.002 (0.015)	Loss 2.9574 (2.8852)	Entropy 0.64985 (0.65345)	Top-1 acc 50.781 (54.510)	Top-5 acc 76.172 (77.132)	lr 0.01853
Train [41][2480/3239]	Time 0.233 (0.483)	Data Time 0.001 (0.015)	Loss 2.9734 (2.8853)	Entropy 0.64954 (0.65343)	Top-1 acc 46.094 (54.508)	Top-5 acc 79.297 (77.130)	lr 0.01853
Train [41][2490/3239]	Time 0.239 (0.483)	Data Time 0.001 (0.015)	Loss 2.9723 (2.8855)	Entropy 0.64960 (0.65342)	Top-1 acc 53.125 (54.501)	Top-5 acc 73.438 (77.123)	lr 0.01853
Train [41][2500/3239]	Time 0.236 (0.482)	Data Time 0.001 (0.015)	Loss 2.9447 (2.8855)	Entropy 0.64961 (0.65340)	Top-1 acc 55.469 (54.502)	Top-5 acc 75.781 (77.121)	lr 0.01853
Train [41][2510/3239]	Time 0.247 (0.482)	Data Time 0.001 (0.015)	Loss 3.1166 (2.8856)	Entropy 0.64952 (0.65339)	Top-1 acc 45.703 (54.501)	Top-5 acc 75.391 (77.123)	lr 0.01853
Train [41][2520/3239]	Time 0.230 (0.482)	Data Time 0.001 (0.015)	Loss 2.9986 (2.8852)	Entropy 0.64941 (0.65337)	Top-1 acc 54.688 (54.510)	Top-5 acc 76.172 (77.128)	lr 0.01853
Train [41][2530/3239]	Time 0.236 (0.482)	Data Time 0.001 (0.015)	Loss 2.9013 (2.8852)	Entropy 0.64947 (0.65336)	Top-1 acc 54.297 (54.512)	Top-5 acc 75.000 (77.125)	lr 0.01853
Train [41][2540/3239]	Time 0.254 (0.481)	Data Time 0.001 (0.014)	Loss 2.9082 (2.8853)	Entropy 0.64945 (0.65334)	Top-1 acc 55.078 (54.508)	Top-5 acc 77.344 (77.122)	lr 0.01853
Train [41][2550/3239]	Time 0.249 (0.481)	Data Time 0.001 (0.014)	Loss 2.7563 (2.8854)	Entropy 0.64928 (0.65333)	Top-1 acc 58.203 (54.508)	Top-5 acc 77.734 (77.121)	lr 0.01853
Train [41][2560/3239]	Time 0.231 (0.481)	Data Time 0.001 (0.014)	Loss 2.8659 (2.8855)	Entropy 0.64892 (0.65331)	Top-1 acc 53.125 (54.502)	Top-5 acc 78.516 (77.119)	lr 0.01852
Train [41][2570/3239]	Time 0.255 (0.480)	Data Time 0.001 (0.014)	Loss 2.8629 (2.8856)	Entropy 0.64874 (0.65329)	Top-1 acc 60.547 (54.507)	Top-5 acc 78.516 (77.114)	lr 0.01852
Train [41][2580/3239]	Time 0.228 (0.480)	Data Time 0.001 (0.014)	Loss 2.9258 (2.8855)	Entropy 0.64890 (0.65328)	Top-1 acc 53.906 (54.508)	Top-5 acc 78.516 (77.115)	lr 0.01852
Train [41][2590/3239]	Time 0.251 (0.480)	Data Time 0.001 (0.014)	Loss 2.7686 (2.8853)	Entropy 0.64899 (0.65326)	Top-1 acc 58.594 (54.515)	Top-5 acc 76.953 (77.117)	lr 0.01852
Train [41][2600/3239]	Time 0.236 (0.480)	Data Time 0.001 (0.014)	Loss 2.7839 (2.8853)	Entropy 0.64842 (0.65324)	Top-1 acc 53.516 (54.516)	Top-5 acc 80.859 (77.119)	lr 0.01852
Train [41][2610/3239]	Time 0.321 (0.479)	Data Time 0.001 (0.014)	Loss 2.9734 (2.8855)	Entropy 0.64835 (0.65322)	Top-1 acc 51.172 (54.513)	Top-5 acc 75.000 (77.113)	lr 0.01852
Train [41][2620/3239]	Time 0.239 (0.479)	Data Time 0.001 (0.014)	Loss 2.8497 (2.8856)	Entropy 0.64839 (0.65320)	Top-1 acc 53.125 (54.511)	Top-5 acc 79.297 (77.110)	lr 0.01852
Train [41][2630/3239]	Time 0.242 (0.479)	Data Time 0.001 (0.014)	Loss 2.8824 (2.8857)	Entropy 0.64847 (0.65319)	Top-1 acc 56.641 (54.505)	Top-5 acc 74.219 (77.108)	lr 0.01852
Train [41][2640/3239]	Time 0.224 (0.478)	Data Time 0.001 (0.014)	Loss 2.8377 (2.8859)	Entropy 0.64872 (0.65317)	Top-1 acc 54.297 (54.500)	Top-5 acc 78.906 (77.104)	lr 0.01852
Train [41][2650/3239]	Time 0.229 (0.478)	Data Time 0.001 (0.014)	Loss 2.7281 (2.8858)	Entropy 0.64906 (0.65315)	Top-1 acc 58.203 (54.500)	Top-5 acc 78.125 (77.102)	lr 0.01852
Train [41][2660/3239]	Time 0.223 (0.478)	Data Time 0.001 (0.014)	Loss 2.7901 (2.8859)	Entropy 0.64886 (0.65314)	Top-1 acc 54.688 (54.497)	Top-5 acc 78.516 (77.103)	lr 0.01852
Train [41][2670/3239]	Time 0.230 (0.478)	Data Time 0.001 (0.014)	Loss 2.6725 (2.8858)	Entropy 0.64869 (0.65312)	Top-1 acc 59.766 (54.496)	Top-5 acc 82.422 (77.106)	lr 0.01852
Train [41][2680/3239]	Time 0.334 (0.490)	Data Time 0.004 (0.014)	Loss 2.8382 (2.8859)	Entropy 0.64863 (0.65310)	Top-1 acc 55.469 (54.494)	Top-5 acc 78.516 (77.105)	lr 0.01851
Train [41][2690/3239]	Time 0.238 (0.490)	Data Time 0.002 (0.014)	Loss 2.7681 (2.8856)	Entropy 0.64879 (0.65309)	Top-1 acc 56.641 (54.501)	Top-5 acc 78.516 (77.109)	lr 0.01851
Train [41][2700/3239]	Time 0.290 (0.490)	Data Time 0.001 (0.014)	Loss 3.0060 (2.8855)	Entropy 0.64890 (0.65307)	Top-1 acc 49.219 (54.504)	Top-5 acc 73.047 (77.112)	lr 0.01851
Train [41][2710/3239]	Time 0.233 (0.490)	Data Time 0.001 (0.014)	Loss 2.8007 (2.8856)	Entropy 0.64877 (0.65306)	Top-1 acc 54.688 (54.500)	Top-5 acc 76.953 (77.110)	lr 0.01851
Train [41][2720/3239]	Time 0.269 (0.489)	Data Time 0.001 (0.014)	Loss 2.9294 (2.8854)	Entropy 0.64847 (0.65304)	Top-1 acc 53.516 (54.502)	Top-5 acc 75.391 (77.112)	lr 0.01851
Train [41][2730/3239]	Time 0.231 (0.489)	Data Time 0.001 (0.014)	Loss 2.8042 (2.8853)	Entropy 0.64828 (0.65302)	Top-1 acc 53.906 (54.504)	Top-5 acc 78.906 (77.114)	lr 0.01851
Train [41][2740/3239]	Time 0.277 (0.489)	Data Time 0.003 (0.014)	Loss 2.8662 (2.8850)	Entropy 0.64866 (0.65301)	Top-1 acc 55.469 (54.511)	Top-5 acc 76.562 (77.120)	lr 0.01851
Train [41][2750/3239]	Time 0.251 (0.489)	Data Time 0.001 (0.014)	Loss 2.6473 (2.8847)	Entropy 0.64871 (0.65299)	Top-1 acc 60.547 (54.518)	Top-5 acc 83.594 (77.126)	lr 0.01851
Train [41][2760/3239]	Time 0.238 (0.488)	Data Time 0.001 (0.013)	Loss 2.8432 (2.8847)	Entropy 0.64901 (0.65298)	Top-1 acc 53.516 (54.522)	Top-5 acc 77.734 (77.126)	lr 0.01851
Train [41][2770/3239]	Time 0.350 (0.488)	Data Time 0.001 (0.013)	Loss 2.9526 (2.8845)	Entropy 0.64962 (0.65296)	Top-1 acc 53.125 (54.525)	Top-5 acc 77.344 (77.128)	lr 0.01851
Train [41][2780/3239]	Time 0.261 (0.488)	Data Time 0.002 (0.013)	Loss 2.9804 (2.8846)	Entropy 0.64968 (0.65295)	Top-1 acc 51.953 (54.522)	Top-5 acc 73.828 (77.126)	lr 0.01851
Train [41][2790/3239]	Time 0.241 (0.488)	Data Time 0.002 (0.013)	Loss 2.9462 (2.8849)	Entropy 0.64957 (0.65294)	Top-1 acc 53.906 (54.516)	Top-5 acc 76.562 (77.120)	lr 0.01850
Train [41][2800/3239]	Time 0.236 (0.488)	Data Time 0.002 (0.013)	Loss 2.8576 (2.8849)	Entropy 0.64974 (0.65293)	Top-1 acc 54.297 (54.517)	Top-5 acc 76.953 (77.121)	lr 0.01850
Train [41][2810/3239]	Time 0.235 (0.487)	Data Time 0.001 (0.013)	Loss 2.9114 (2.8851)	Entropy 0.64937 (0.65291)	Top-1 acc 57.031 (54.516)	Top-5 acc 77.344 (77.117)	lr 0.01850
Train [41][2820/3239]	Time 0.263 (0.487)	Data Time 0.003 (0.013)	Loss 2.9207 (2.8852)	Entropy 0.64950 (0.65290)	Top-1 acc 54.688 (54.515)	Top-5 acc 76.562 (77.117)	lr 0.01850
Train [41][2830/3239]	Time 0.222 (0.487)	Data Time 0.001 (0.013)	Loss 3.2295 (2.8854)	Entropy 0.64972 (0.65289)	Top-1 acc 44.922 (54.511)	Top-5 acc 73.438 (77.113)	lr 0.01850
Train [41][2840/3239]	Time 0.337 (0.487)	Data Time 0.001 (0.013)	Loss 2.7080 (2.8852)	Entropy 0.64966 (0.65288)	Top-1 acc 58.203 (54.515)	Top-5 acc 80.859 (77.118)	lr 0.01850
Train [41][2850/3239]	Time 0.237 (0.486)	Data Time 0.001 (0.013)	Loss 3.0151 (2.8853)	Entropy 0.64995 (0.65287)	Top-1 acc 48.047 (54.507)	Top-5 acc 76.953 (77.118)	lr 0.01850
Train [41][2860/3239]	Time 0.227 (0.486)	Data Time 0.001 (0.013)	Loss 3.0262 (2.8852)	Entropy 0.64970 (0.65286)	Top-1 acc 50.781 (54.509)	Top-5 acc 75.781 (77.118)	lr 0.01850
Train [41][2870/3239]	Time 0.258 (0.486)	Data Time 0.001 (0.013)	Loss 2.9141 (2.8854)	Entropy 0.64992 (0.65285)	Top-1 acc 54.688 (54.506)	Top-5 acc 74.609 (77.113)	lr 0.01850
Train [41][2880/3239]	Time 0.230 (0.486)	Data Time 0.001 (0.013)	Loss 2.9070 (2.8855)	Entropy 0.64953 (0.65284)	Top-1 acc 53.516 (54.502)	Top-5 acc 77.344 (77.112)	lr 0.01850
Train [41][2890/3239]	Time 0.231 (0.485)	Data Time 0.001 (0.013)	Loss 2.9432 (2.8853)	Entropy 0.64983 (0.65283)	Top-1 acc 51.953 (54.506)	Top-5 acc 75.000 (77.115)	lr 0.01850
Train [41][2900/3239]	Time 0.225 (0.485)	Data Time 0.001 (0.013)	Loss 3.0642 (2.8851)	Entropy 0.64965 (0.65282)	Top-1 acc 53.516 (54.512)	Top-5 acc 71.484 (77.121)	lr 0.01849
Train [41][2910/3239]	Time 0.235 (0.485)	Data Time 0.001 (0.013)	Loss 2.9441 (2.8850)	Entropy 0.64923 (0.65280)	Top-1 acc 53.125 (54.511)	Top-5 acc 73.828 (77.122)	lr 0.01849
Train [41][2920/3239]	Time 0.235 (0.485)	Data Time 0.001 (0.013)	Loss 2.8565 (2.8849)	Entropy 0.64907 (0.65279)	Top-1 acc 51.953 (54.516)	Top-5 acc 78.125 (77.123)	lr 0.01849
Train [41][2930/3239]	Time 0.319 (0.484)	Data Time 0.001 (0.013)	Loss 2.9667 (2.8850)	Entropy 0.64928 (0.65278)	Top-1 acc 55.078 (54.515)	Top-5 acc 78.906 (77.122)	lr 0.01849
Train [41][2940/3239]	Time 0.278 (0.484)	Data Time 0.001 (0.013)	Loss 2.9182 (2.8850)	Entropy 0.64959 (0.65277)	Top-1 acc 51.562 (54.513)	Top-5 acc 78.516 (77.123)	lr 0.01849
Train [41][2950/3239]	Time 0.252 (0.484)	Data Time 0.002 (0.013)	Loss 2.7841 (2.8851)	Entropy 0.64958 (0.65276)	Top-1 acc 55.859 (54.515)	Top-5 acc 82.031 (77.125)	lr 0.01849
Train [41][2960/3239]	Time 0.233 (0.484)	Data Time 0.002 (0.013)	Loss 2.7589 (2.8851)	Entropy 0.64975 (0.65275)	Top-1 acc 55.078 (54.514)	Top-5 acc 78.906 (77.124)	lr 0.01849
Train [41][2970/3239]	Time 0.237 (0.484)	Data Time 0.001 (0.013)	Loss 2.7588 (2.8850)	Entropy 0.64974 (0.65274)	Top-1 acc 57.812 (54.516)	Top-5 acc 80.078 (77.127)	lr 0.01849
Train [41][2980/3239]	Time 0.235 (0.483)	Data Time 0.001 (0.013)	Loss 3.0273 (2.8849)	Entropy 0.65014 (0.65273)	Top-1 acc 51.953 (54.517)	Top-5 acc 73.047 (77.128)	lr 0.01849
Train [41][2990/3239]	Time 0.240 (0.483)	Data Time 0.002 (0.013)	Loss 2.7773 (2.8851)	Entropy 0.64976 (0.65272)	Top-1 acc 53.906 (54.510)	Top-5 acc 78.906 (77.127)	lr 0.01849
Train [41][3000/3239]	Time 0.339 (0.483)	Data Time 0.002 (0.013)	Loss 2.8628 (2.8852)	Entropy 0.64984 (0.65271)	Top-1 acc 57.422 (54.506)	Top-5 acc 78.125 (77.126)	lr 0.01849
Train [41][3010/3239]	Time 0.227 (0.483)	Data Time 0.002 (0.012)	Loss 2.9726 (2.8853)	Entropy 0.64959 (0.65270)	Top-1 acc 55.078 (54.506)	Top-5 acc 74.609 (77.126)	lr 0.01848
Train [41][3020/3239]	Time 0.231 (0.483)	Data Time 0.002 (0.012)	Loss 2.9566 (2.8852)	Entropy 0.64940 (0.65269)	Top-1 acc 53.125 (54.504)	Top-5 acc 75.000 (77.127)	lr 0.01848
Train [41][3030/3239]	Time 0.233 (0.482)	Data Time 0.002 (0.012)	Loss 2.8293 (2.8855)	Entropy 0.64931 (0.65268)	Top-1 acc 55.859 (54.502)	Top-5 acc 78.906 (77.122)	lr 0.01848
Train [41][3040/3239]	Time 0.234 (0.482)	Data Time 0.001 (0.012)	Loss 2.9330 (2.8857)	Entropy 0.64927 (0.65266)	Top-1 acc 55.078 (54.496)	Top-5 acc 76.953 (77.119)	lr 0.01848
Train [41][3050/3239]	Time 0.262 (0.482)	Data Time 0.001 (0.012)	Loss 3.0232 (2.8858)	Entropy 0.64936 (0.65265)	Top-1 acc 50.000 (54.492)	Top-5 acc 73.828 (77.116)	lr 0.01848
Train [41][3060/3239]	Time 0.235 (0.482)	Data Time 0.001 (0.012)	Loss 3.0288 (2.8857)	Entropy 0.64958 (0.65264)	Top-1 acc 50.391 (54.496)	Top-5 acc 75.000 (77.119)	lr 0.01848
Train [41][3070/3239]	Time 0.236 (0.481)	Data Time 0.001 (0.012)	Loss 2.8764 (2.8857)	Entropy 0.64955 (0.65263)	Top-1 acc 54.297 (54.496)	Top-5 acc 78.516 (77.120)	lr 0.01848
Train [41][3080/3239]	Time 0.227 (0.481)	Data Time 0.001 (0.012)	Loss 2.8166 (2.8856)	Entropy 0.64939 (0.65262)	Top-1 acc 56.641 (54.499)	Top-5 acc 77.734 (77.121)	lr 0.01848
Train [41][3090/3239]	Time 0.270 (0.481)	Data Time 0.001 (0.012)	Loss 2.8834 (2.8855)	Entropy 0.64937 (0.65261)	Top-1 acc 52.344 (54.503)	Top-5 acc 79.297 (77.123)	lr 0.01848
Train [41][3100/3239]	Time 0.230 (0.481)	Data Time 0.001 (0.012)	Loss 3.1765 (2.8856)	Entropy 0.64915 (0.65260)	Top-1 acc 48.828 (54.503)	Top-5 acc 71.484 (77.122)	lr 0.01848
Train [41][3110/3239]	Time 0.281 (0.480)	Data Time 0.001 (0.012)	Loss 2.8583 (2.8856)	Entropy 0.64925 (0.65259)	Top-1 acc 52.344 (54.499)	Top-5 acc 78.125 (77.122)	lr 0.01848
Train [41][3120/3239]	Time 0.223 (0.480)	Data Time 0.001 (0.012)	Loss 2.8018 (2.8855)	Entropy 0.64938 (0.65258)	Top-1 acc 57.812 (54.507)	Top-5 acc 79.688 (77.125)	lr 0.01848
Train [41][3130/3239]	Time 0.238 (0.480)	Data Time 0.001 (0.012)	Loss 2.9540 (2.8857)	Entropy 0.64929 (0.65257)	Top-1 acc 53.516 (54.503)	Top-5 acc 72.266 (77.120)	lr 0.01847
Train [41][3140/3239]	Time 0.267 (0.480)	Data Time 0.004 (0.012)	Loss 3.0160 (2.8858)	Entropy 0.64921 (0.65256)	Top-1 acc 55.469 (54.502)	Top-5 acc 74.219 (77.119)	lr 0.01847
Train [41][3150/3239]	Time 0.226 (0.480)	Data Time 0.001 (0.012)	Loss 2.8699 (2.8860)	Entropy 0.64936 (0.65255)	Top-1 acc 55.078 (54.497)	Top-5 acc 78.516 (77.118)	lr 0.01847
Train [41][3160/3239]	Time 0.322 (0.479)	Data Time 0.001 (0.012)	Loss 2.6852 (2.8862)	Entropy 0.64945 (0.65254)	Top-1 acc 56.641 (54.492)	Top-5 acc 82.422 (77.111)	lr 0.01847
Train [41][3170/3239]	Time 0.237 (0.479)	Data Time 0.001 (0.012)	Loss 3.0027 (2.8863)	Entropy 0.64940 (0.65253)	Top-1 acc 52.344 (54.488)	Top-5 acc 73.828 (77.111)	lr 0.01847
Train [41][3180/3239]	Time 0.231 (0.479)	Data Time 0.000 (0.012)	Loss 2.8262 (2.8861)	Entropy 0.64899 (0.65252)	Top-1 acc 55.078 (54.492)	Top-5 acc 78.125 (77.116)	lr 0.01847
Train [41][3190/3239]	Time 0.215 (0.479)	Data Time 0.000 (0.012)	Loss 2.7150 (2.8859)	Entropy 0.64890 (0.65251)	Top-1 acc 58.984 (54.495)	Top-5 acc 80.859 (77.122)	lr 0.01847
Train [41][3200/3239]	Time 0.228 (0.478)	Data Time 0.000 (0.012)	Loss 2.8293 (2.8857)	Entropy 0.64857 (0.65250)	Top-1 acc 54.688 (54.500)	Top-5 acc 76.172 (77.124)	lr 0.01847
Train [41][3210/3239]	Time 0.221 (0.478)	Data Time 0.000 (0.012)	Loss 2.8763 (2.8858)	Entropy 0.64840 (0.65248)	Top-1 acc 56.250 (54.496)	Top-5 acc 75.781 (77.122)	lr 0.01847
Train [41][3220/3239]	Time 0.222 (0.478)	Data Time 0.000 (0.012)	Loss 2.8171 (2.8860)	Entropy 0.64824 (0.65247)	Top-1 acc 55.078 (54.493)	Top-5 acc 78.906 (77.118)	lr 0.01847
Train [41][3230/3239]	Time 0.323 (0.477)	Data Time 0.000 (0.012)	Loss 3.0848 (2.8861)	Entropy 0.64783 (0.65246)	Top-1 acc 50.391 (54.494)	Top-5 acc 71.875 (77.114)	lr 0.01847
Train [41][3239/3239]	Time 0.888 (0.477)	Data Time 0.000 (0.012)	Loss 3.0646 (2.8862)	Entropy 0.64775 (0.65244)	Top-1 acc 41.975 (54.490)	Top-5 acc 77.778 (77.112)	lr 0.01846
==========Valid [41/120]	loss 1.605	top-1 acc 63.706 (63.706)	top-5 acc 84.591	Train top-1 54.490	top-5 77.112	Entropy 0.64775	Latency-None: 0.000ms	Flops: 539.76M
Train [42][0/3239]	Time 32.594 (32.594)	Data Time 31.443 (31.443)	Loss 3.1113 (3.1113)	Entropy 0.64763 (0.64763)	Top-1 acc 50.000 (50.000)	Top-5 acc 74.609 (74.609)	lr 0.01846
Train [42][10/3239]	Time 0.253 (3.460)	Data Time 0.001 (2.860)	Loss 2.8337 (2.9070)	Entropy 0.64783 (0.64772)	Top-1 acc 54.688 (54.261)	Top-5 acc 77.734 (77.486)	lr 0.01846
Train [42][20/3239]	Time 0.236 (2.008)	Data Time 0.001 (1.499)	Loss 2.7609 (2.8677)	Entropy 0.64732 (0.64767)	Top-1 acc 54.688 (54.669)	Top-5 acc 80.469 (77.939)	lr 0.01846
Train [42][30/3239]	Time 0.235 (1.487)	Data Time 0.001 (1.016)	Loss 2.9933 (2.8604)	Entropy 0.64751 (0.64758)	Top-1 acc 57.031 (55.091)	Top-5 acc 71.094 (77.898)	lr 0.01846
Train [42][40/3239]	Time 0.235 (1.222)	Data Time 0.001 (0.768)	Loss 2.8283 (2.8470)	Entropy 0.64775 (0.64757)	Top-1 acc 53.906 (55.564)	Top-5 acc 77.734 (78.249)	lr 0.01846
Train [42][50/3239]	Time 0.260 (1.062)	Data Time 0.001 (0.618)	Loss 2.7401 (2.8625)	Entropy 0.64771 (0.64761)	Top-1 acc 58.984 (55.277)	Top-5 acc 81.250 (77.872)	lr 0.01846
Train [42][60/3239]	Time 0.334 (0.956)	Data Time 0.001 (0.517)	Loss 2.9046 (2.8600)	Entropy 0.64719 (0.64759)	Top-1 acc 52.344 (55.206)	Top-5 acc 75.781 (77.882)	lr 0.01846
Train [42][70/3239]	Time 0.235 (0.880)	Data Time 0.001 (0.444)	Loss 2.9442 (2.8641)	Entropy 0.64756 (0.64755)	Top-1 acc 54.297 (55.144)	Top-5 acc 75.781 (77.756)	lr 0.01846
Train [42][80/3239]	Time 0.239 (0.821)	Data Time 0.001 (0.390)	Loss 2.8928 (2.8700)	Entropy 0.64797 (0.64757)	Top-1 acc 54.688 (54.991)	Top-5 acc 79.297 (77.643)	lr 0.01846
Train [42][90/3239]	Time 0.246 (0.777)	Data Time 0.001 (0.347)	Loss 2.9165 (2.8653)	Entropy 0.64789 (0.64760)	Top-1 acc 52.734 (55.121)	Top-5 acc 76.562 (77.640)	lr 0.01846
Train [42][100/3239]	Time 0.285 (1.081)	Data Time 0.003 (0.313)	Loss 2.9372 (2.8746)	Entropy 0.64820 (0.64764)	Top-1 acc 58.203 (54.989)	Top-5 acc 75.000 (77.452)	lr 0.01846
Train [42][110/3239]	Time 0.247 (1.022)	Data Time 0.002 (0.285)	Loss 2.8145 (2.8709)	Entropy 0.64792 (0.64769)	Top-1 acc 54.688 (55.046)	Top-5 acc 78.125 (77.520)	lr 0.01845
Train [42][120/3239]	Time 0.249 (0.972)	Data Time 0.002 (0.262)	Loss 2.8302 (2.8734)	Entropy 0.64791 (0.64770)	Top-1 acc 57.812 (54.965)	Top-5 acc 78.516 (77.466)	lr 0.01845
Train [42][130/3239]	Time 0.235 (0.932)	Data Time 0.001 (0.242)	Loss 2.8732 (2.8732)	Entropy 0.64778 (0.64771)	Top-1 acc 52.344 (54.881)	Top-5 acc 77.344 (77.517)	lr 0.01845
Train [42][140/3239]	Time 0.238 (0.895)	Data Time 0.001 (0.225)	Loss 3.0785 (2.8716)	Entropy 0.64783 (0.64772)	Top-1 acc 49.609 (54.945)	Top-5 acc 74.219 (77.510)	lr 0.01845
Train [42][150/3239]	Time 0.338 (0.864)	Data Time 0.001 (0.210)	Loss 2.7408 (2.8692)	Entropy 0.64758 (0.64772)	Top-1 acc 60.156 (55.006)	Top-5 acc 75.781 (77.499)	lr 0.01845
Train [42][160/3239]	Time 0.249 (0.836)	Data Time 0.001 (0.197)	Loss 2.7586 (2.8692)	Entropy 0.64745 (0.64770)	Top-1 acc 60.547 (55.071)	Top-5 acc 80.469 (77.451)	lr 0.01845
Train [42][170/3239]	Time 0.232 (0.812)	Data Time 0.001 (0.186)	Loss 2.8702 (2.8751)	Entropy 0.64770 (0.64769)	Top-1 acc 57.031 (54.909)	Top-5 acc 75.000 (77.287)	lr 0.01845
Train [42][180/3239]	Time 0.265 (0.791)	Data Time 0.001 (0.175)	Loss 2.9280 (2.8750)	Entropy 0.64786 (0.64770)	Top-1 acc 53.906 (54.899)	Top-5 acc 76.172 (77.275)	lr 0.01845
Train [42][190/3239]	Time 0.231 (0.771)	Data Time 0.001 (0.166)	Loss 2.7686 (2.8733)	Entropy 0.64775 (0.64770)	Top-1 acc 58.594 (54.941)	Top-5 acc 80.469 (77.319)	lr 0.01845
Train [42][200/3239]	Time 0.243 (0.754)	Data Time 0.001 (0.158)	Loss 2.9194 (2.8749)	Entropy 0.64770 (0.64770)	Top-1 acc 52.344 (54.870)	Top-5 acc 74.609 (77.285)	lr 0.01845
Train [42][210/3239]	Time 0.230 (0.737)	Data Time 0.001 (0.151)	Loss 2.9399 (2.8719)	Entropy 0.64796 (0.64770)	Top-1 acc 51.953 (54.899)	Top-5 acc 75.391 (77.327)	lr 0.01845
Train [42][220/3239]	Time 0.345 (0.723)	Data Time 0.002 (0.144)	Loss 2.6631 (2.8704)	Entropy 0.64765 (0.64772)	Top-1 acc 59.375 (54.868)	Top-5 acc 83.594 (77.377)	lr 0.01844
Train [42][230/3239]	Time 0.261 (0.710)	Data Time 0.001 (0.138)	Loss 3.0662 (2.8715)	Entropy 0.64801 (0.64772)	Top-1 acc 51.953 (54.877)	Top-5 acc 74.219 (77.367)	lr 0.01844
Train [42][240/3239]	Time 0.245 (0.698)	Data Time 0.001 (0.132)	Loss 3.0616 (2.8713)	Entropy 0.64800 (0.64773)	Top-1 acc 52.344 (54.910)	Top-5 acc 72.656 (77.362)	lr 0.01844
Train [42][250/3239]	Time 0.231 (0.687)	Data Time 0.001 (0.127)	Loss 2.7569 (2.8706)	Entropy 0.64803 (0.64774)	Top-1 acc 57.812 (54.943)	Top-5 acc 78.906 (77.390)	lr 0.01844
Train [42][260/3239]	Time 0.228 (0.676)	Data Time 0.001 (0.122)	Loss 2.6793 (2.8719)	Entropy 0.64841 (0.64776)	Top-1 acc 60.156 (54.890)	Top-5 acc 80.469 (77.341)	lr 0.01844
Train [42][270/3239]	Time 0.234 (0.667)	Data Time 0.001 (0.118)	Loss 2.8003 (2.8690)	Entropy 0.64877 (0.64778)	Top-1 acc 58.984 (54.954)	Top-5 acc 78.516 (77.403)	lr 0.01844
Train [42][280/3239]	Time 0.242 (0.658)	Data Time 0.001 (0.114)	Loss 2.8089 (2.8669)	Entropy 0.64875 (0.64782)	Top-1 acc 58.203 (54.971)	Top-5 acc 80.859 (77.452)	lr 0.01844
Train [42][290/3239]	Time 0.237 (0.650)	Data Time 0.001 (0.110)	Loss 2.8294 (2.8679)	Entropy 0.64911 (0.64786)	Top-1 acc 54.297 (54.940)	Top-5 acc 78.125 (77.428)	lr 0.01844
Train [42][300/3239]	Time 0.241 (0.642)	Data Time 0.001 (0.106)	Loss 2.8772 (2.8657)	Entropy 0.64889 (0.64790)	Top-1 acc 50.391 (54.987)	Top-5 acc 76.953 (77.474)	lr 0.01844
Train [42][310/3239]	Time 0.251 (0.634)	Data Time 0.001 (0.103)	Loss 2.8667 (2.8656)	Entropy 0.64886 (0.64793)	Top-1 acc 57.031 (55.009)	Top-5 acc 75.391 (77.493)	lr 0.01844
Train [42][320/3239]	Time 0.231 (0.628)	Data Time 0.001 (0.100)	Loss 2.6136 (2.8653)	Entropy 0.64902 (0.64796)	Top-1 acc 59.375 (54.987)	Top-5 acc 83.594 (77.518)	lr 0.01844
Train [42][330/3239]	Time 0.229 (0.621)	Data Time 0.001 (0.097)	Loss 2.7953 (2.8631)	Entropy 0.64921 (0.64799)	Top-1 acc 57.031 (55.036)	Top-5 acc 76.562 (77.564)	lr 0.01844
Train [42][340/3239]	Time 0.228 (0.615)	Data Time 0.001 (0.094)	Loss 2.7821 (2.8636)	Entropy 0.64933 (0.64803)	Top-1 acc 57.422 (55.012)	Top-5 acc 79.297 (77.567)	lr 0.01843
Train [42][350/3239]	Time 0.240 (0.609)	Data Time 0.001 (0.091)	Loss 2.6625 (2.8622)	Entropy 0.64928 (0.64807)	Top-1 acc 58.984 (55.035)	Top-5 acc 82.031 (77.575)	lr 0.01843
Train [42][360/3239]	Time 0.236 (0.604)	Data Time 0.001 (0.089)	Loss 2.8946 (2.8634)	Entropy 0.64917 (0.64810)	Top-1 acc 53.125 (54.997)	Top-5 acc 74.609 (77.528)	lr 0.01843
Train [42][370/3239]	Time 0.231 (0.599)	Data Time 0.001 (0.086)	Loss 2.6203 (2.8617)	Entropy 0.64886 (0.64813)	Top-1 acc 63.672 (55.037)	Top-5 acc 82.031 (77.570)	lr 0.01843
Train [42][380/3239]	Time 0.320 (0.594)	Data Time 0.002 (0.084)	Loss 3.1318 (2.8639)	Entropy 0.64894 (0.64815)	Top-1 acc 49.609 (54.988)	Top-5 acc 71.875 (77.530)	lr 0.01843
Train [42][390/3239]	Time 0.242 (0.589)	Data Time 0.002 (0.082)	Loss 2.7789 (2.8628)	Entropy 0.64909 (0.64817)	Top-1 acc 58.594 (55.038)	Top-5 acc 79.688 (77.566)	lr 0.01843
Train [42][400/3239]	Time 0.248 (0.585)	Data Time 0.002 (0.080)	Loss 2.7796 (2.8642)	Entropy 0.64941 (0.64819)	Top-1 acc 53.516 (54.994)	Top-5 acc 80.859 (77.554)	lr 0.01843
Train [42][410/3239]	Time 0.219 (0.581)	Data Time 0.001 (0.078)	Loss 2.8469 (2.8633)	Entropy 0.64898 (0.64822)	Top-1 acc 55.469 (55.012)	Top-5 acc 78.516 (77.560)	lr 0.01843
Train [42][420/3239]	Time 0.229 (0.577)	Data Time 0.001 (0.076)	Loss 2.9457 (2.8632)	Entropy 0.64888 (0.64824)	Top-1 acc 51.172 (55.011)	Top-5 acc 77.734 (77.560)	lr 0.01843
Train [42][430/3239]	Time 0.230 (0.574)	Data Time 0.002 (0.075)	Loss 2.7296 (2.8635)	Entropy 0.64872 (0.64825)	Top-1 acc 59.375 (54.995)	Top-5 acc 80.859 (77.566)	lr 0.01843
Train [42][440/3239]	Time 0.231 (0.570)	Data Time 0.001 (0.073)	Loss 2.9992 (2.8639)	Entropy 0.64888 (0.64826)	Top-1 acc 52.344 (54.987)	Top-5 acc 73.828 (77.549)	lr 0.01843
Train [42][450/3239]	Time 0.338 (0.566)	Data Time 0.001 (0.071)	Loss 2.6339 (2.8641)	Entropy 0.64866 (0.64827)	Top-1 acc 60.156 (54.991)	Top-5 acc 81.250 (77.527)	lr 0.01842
Train [42][460/3239]	Time 0.236 (0.563)	Data Time 0.001 (0.070)	Loss 2.9042 (2.8639)	Entropy 0.64846 (0.64828)	Top-1 acc 58.594 (54.997)	Top-5 acc 75.781 (77.545)	lr 0.01842
Train [42][470/3239]	Time 0.232 (0.559)	Data Time 0.001 (0.068)	Loss 2.8138 (2.8629)	Entropy 0.64837 (0.64828)	Top-1 acc 52.344 (55.042)	Top-5 acc 80.078 (77.564)	lr 0.01842
Train [42][480/3239]	Time 0.236 (0.556)	Data Time 0.001 (0.067)	Loss 2.8262 (2.8628)	Entropy 0.64875 (0.64829)	Top-1 acc 54.688 (55.042)	Top-5 acc 79.688 (77.557)	lr 0.01842
Train [42][490/3239]	Time 0.228 (0.552)	Data Time 0.001 (0.066)	Loss 2.9047 (2.8623)	Entropy 0.64865 (0.64829)	Top-1 acc 50.781 (55.057)	Top-5 acc 77.344 (77.572)	lr 0.01842
Train [42][500/3239]	Time 0.251 (0.550)	Data Time 0.001 (0.064)	Loss 2.7807 (2.8616)	Entropy 0.64882 (0.64830)	Top-1 acc 59.375 (55.077)	Top-5 acc 82.031 (77.599)	lr 0.01842
Train [42][510/3239]	Time 0.227 (0.547)	Data Time 0.001 (0.063)	Loss 2.7257 (2.8610)	Entropy 0.64900 (0.64831)	Top-1 acc 57.422 (55.080)	Top-5 acc 81.250 (77.616)	lr 0.01842
Train [42][520/3239]	Time 0.257 (0.545)	Data Time 0.001 (0.062)	Loss 2.8241 (2.8613)	Entropy 0.64918 (0.64833)	Top-1 acc 55.078 (55.075)	Top-5 acc 78.906 (77.599)	lr 0.01842
Train [42][530/3239]	Time 0.230 (0.542)	Data Time 0.001 (0.061)	Loss 2.6585 (2.8605)	Entropy 0.64895 (0.64834)	Top-1 acc 59.766 (55.110)	Top-5 acc 78.125 (77.623)	lr 0.01842
Train [42][540/3239]	Time 0.349 (0.540)	Data Time 0.001 (0.060)	Loss 3.0839 (2.8617)	Entropy 0.64879 (0.64835)	Top-1 acc 49.219 (55.082)	Top-5 acc 76.953 (77.607)	lr 0.01842
Train [42][550/3239]	Time 0.227 (0.537)	Data Time 0.001 (0.059)	Loss 2.9071 (2.8599)	Entropy 0.64877 (0.64836)	Top-1 acc 55.469 (55.120)	Top-5 acc 74.609 (77.639)	lr 0.01842
Train [42][560/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.058)	Loss 2.7468 (2.8593)	Entropy 0.64862 (0.64837)	Top-1 acc 55.469 (55.124)	Top-5 acc 82.031 (77.652)	lr 0.01841
Train [42][570/3239]	Time 0.244 (0.533)	Data Time 0.001 (0.057)	Loss 2.8515 (2.8597)	Entropy 0.64853 (0.64837)	Top-1 acc 53.125 (55.108)	Top-5 acc 75.000 (77.644)	lr 0.01841
Train [42][580/3239]	Time 0.233 (0.531)	Data Time 0.001 (0.056)	Loss 2.8528 (2.8592)	Entropy 0.64874 (0.64838)	Top-1 acc 57.812 (55.128)	Top-5 acc 75.391 (77.648)	lr 0.01841
Train [42][590/3239]	Time 0.241 (0.529)	Data Time 0.001 (0.055)	Loss 3.0485 (2.8591)	Entropy 0.64833 (0.64838)	Top-1 acc 51.172 (55.133)	Top-5 acc 74.219 (77.641)	lr 0.01841
Train [42][600/3239]	Time 0.236 (0.527)	Data Time 0.002 (0.054)	Loss 2.8734 (2.8594)	Entropy 0.64841 (0.64838)	Top-1 acc 51.562 (55.128)	Top-5 acc 79.688 (77.641)	lr 0.01841
Train [42][610/3239]	Time 0.366 (0.525)	Data Time 0.001 (0.053)	Loss 2.9088 (2.8584)	Entropy 0.64822 (0.64838)	Top-1 acc 50.781 (55.154)	Top-5 acc 79.688 (77.660)	lr 0.01841
Train [42][620/3239]	Time 0.280 (0.524)	Data Time 0.002 (0.052)	Loss 2.8988 (2.8577)	Entropy 0.64836 (0.64838)	Top-1 acc 53.906 (55.158)	Top-5 acc 78.516 (77.658)	lr 0.01841
Train [42][630/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.051)	Loss 2.8407 (2.8580)	Entropy 0.64869 (0.64838)	Top-1 acc 54.297 (55.157)	Top-5 acc 76.953 (77.655)	lr 0.01841
Train [42][640/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.051)	Loss 3.1695 (2.8584)	Entropy 0.64861 (0.64839)	Top-1 acc 47.266 (55.126)	Top-5 acc 73.047 (77.661)	lr 0.01841
Train [42][650/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.050)	Loss 2.7234 (2.8578)	Entropy 0.64851 (0.64839)	Top-1 acc 60.156 (55.148)	Top-5 acc 78.516 (77.672)	lr 0.01841
Train [42][660/3239]	Time 0.263 (0.516)	Data Time 0.001 (0.049)	Loss 2.8749 (2.8574)	Entropy 0.64843 (0.64839)	Top-1 acc 56.250 (55.168)	Top-5 acc 73.828 (77.681)	lr 0.01841
Train [42][670/3239]	Time 0.241 (0.515)	Data Time 0.001 (0.049)	Loss 2.8550 (2.8574)	Entropy 0.64858 (0.64839)	Top-1 acc 56.250 (55.170)	Top-5 acc 79.297 (77.683)	lr 0.01840
Train [42][680/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.048)	Loss 3.0545 (2.8580)	Entropy 0.64873 (0.64839)	Top-1 acc 50.391 (55.166)	Top-5 acc 75.781 (77.678)	lr 0.01840
Train [42][690/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.047)	Loss 2.7481 (2.8574)	Entropy 0.64872 (0.64840)	Top-1 acc 58.984 (55.182)	Top-5 acc 78.125 (77.681)	lr 0.01840
Train [42][700/3239]	Time 0.325 (0.510)	Data Time 0.001 (0.047)	Loss 2.6738 (2.8565)	Entropy 0.64882 (0.64841)	Top-1 acc 60.156 (55.206)	Top-5 acc 79.297 (77.700)	lr 0.01840
Train [42][710/3239]	Time 0.232 (0.509)	Data Time 0.001 (0.046)	Loss 2.9308 (2.8569)	Entropy 0.64866 (0.64841)	Top-1 acc 55.078 (55.203)	Top-5 acc 76.953 (77.684)	lr 0.01840
Train [42][720/3239]	Time 0.228 (0.507)	Data Time 0.001 (0.045)	Loss 2.9655 (2.8575)	Entropy 0.64857 (0.64841)	Top-1 acc 51.953 (55.194)	Top-5 acc 76.172 (77.670)	lr 0.01840
Train [42][730/3239]	Time 0.238 (0.506)	Data Time 0.001 (0.045)	Loss 2.8499 (2.8572)	Entropy 0.64843 (0.64841)	Top-1 acc 55.078 (55.198)	Top-5 acc 76.172 (77.682)	lr 0.01840
Train [42][740/3239]	Time 0.233 (0.505)	Data Time 0.001 (0.044)	Loss 2.9661 (2.8581)	Entropy 0.64870 (0.64842)	Top-1 acc 51.562 (55.184)	Top-5 acc 77.734 (77.671)	lr 0.01840
Train [42][750/3239]	Time 0.405 (0.544)	Data Time 0.005 (0.044)	Loss 3.0226 (2.8596)	Entropy 0.64881 (0.64842)	Top-1 acc 51.953 (55.159)	Top-5 acc 75.391 (77.642)	lr 0.01840
Train [42][760/3239]	Time 0.239 (0.543)	Data Time 0.002 (0.043)	Loss 2.8576 (2.8592)	Entropy 0.64887 (0.64843)	Top-1 acc 58.203 (55.167)	Top-5 acc 78.906 (77.657)	lr 0.01840
Train [42][770/3239]	Time 0.311 (0.541)	Data Time 0.001 (0.042)	Loss 2.8164 (2.8591)	Entropy 0.64914 (0.64843)	Top-1 acc 55.859 (55.163)	Top-5 acc 81.250 (77.660)	lr 0.01840
Train [42][780/3239]	Time 0.227 (0.540)	Data Time 0.001 (0.042)	Loss 3.1009 (2.8593)	Entropy 0.64906 (0.64844)	Top-1 acc 46.484 (55.145)	Top-5 acc 71.484 (77.649)	lr 0.01840
Train [42][790/3239]	Time 0.239 (0.538)	Data Time 0.001 (0.041)	Loss 2.7886 (2.8600)	Entropy 0.64897 (0.64845)	Top-1 acc 58.594 (55.142)	Top-5 acc 76.953 (77.640)	lr 0.01839
Train [42][800/3239]	Time 0.231 (0.537)	Data Time 0.001 (0.041)	Loss 2.7549 (2.8596)	Entropy 0.64942 (0.64846)	Top-1 acc 60.156 (55.162)	Top-5 acc 80.078 (77.643)	lr 0.01839
Train [42][810/3239]	Time 0.257 (0.535)	Data Time 0.001 (0.040)	Loss 2.8526 (2.8599)	Entropy 0.64925 (0.64847)	Top-1 acc 56.641 (55.154)	Top-5 acc 77.734 (77.639)	lr 0.01839
Train [42][820/3239]	Time 0.271 (0.534)	Data Time 0.001 (0.040)	Loss 3.0010 (2.8602)	Entropy 0.64947 (0.64848)	Top-1 acc 54.297 (55.154)	Top-5 acc 73.438 (77.634)	lr 0.01839
Train [42][830/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.040)	Loss 2.8186 (2.8603)	Entropy 0.64929 (0.64849)	Top-1 acc 58.594 (55.156)	Top-5 acc 77.734 (77.631)	lr 0.01839
Train [42][840/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.039)	Loss 2.9062 (2.8597)	Entropy 0.64939 (0.64850)	Top-1 acc 56.250 (55.178)	Top-5 acc 77.734 (77.644)	lr 0.01839
Train [42][850/3239]	Time 0.237 (0.530)	Data Time 0.001 (0.039)	Loss 2.7961 (2.8600)	Entropy 0.64950 (0.64851)	Top-1 acc 56.641 (55.159)	Top-5 acc 80.078 (77.632)	lr 0.01839
Train [42][860/3239]	Time 0.320 (0.529)	Data Time 0.001 (0.038)	Loss 2.6395 (2.8601)	Entropy 0.64929 (0.64852)	Top-1 acc 57.812 (55.159)	Top-5 acc 82.031 (77.638)	lr 0.01839
Train [42][870/3239]	Time 0.262 (0.527)	Data Time 0.028 (0.038)	Loss 3.0071 (2.8601)	Entropy 0.64910 (0.64853)	Top-1 acc 49.219 (55.166)	Top-5 acc 77.734 (77.636)	lr 0.01839
Train [42][880/3239]	Time 0.230 (0.526)	Data Time 0.001 (0.037)	Loss 2.6508 (2.8605)	Entropy 0.64901 (0.64854)	Top-1 acc 64.062 (55.154)	Top-5 acc 80.469 (77.620)	lr 0.01839
Train [42][890/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.037)	Loss 2.9479 (2.8608)	Entropy 0.64901 (0.64854)	Top-1 acc 54.688 (55.138)	Top-5 acc 75.781 (77.609)	lr 0.01839
Train [42][900/3239]	Time 0.228 (0.523)	Data Time 0.001 (0.037)	Loss 2.8362 (2.8610)	Entropy 0.64880 (0.64855)	Top-1 acc 53.516 (55.137)	Top-5 acc 79.688 (77.606)	lr 0.01838
Train [42][910/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.036)	Loss 2.8370 (2.8612)	Entropy 0.64874 (0.64855)	Top-1 acc 55.469 (55.138)	Top-5 acc 77.344 (77.594)	lr 0.01838
Train [42][920/3239]	Time 0.229 (0.521)	Data Time 0.001 (0.036)	Loss 2.7342 (2.8605)	Entropy 0.64841 (0.64855)	Top-1 acc 57.812 (55.152)	Top-5 acc 81.250 (77.610)	lr 0.01838
Train [42][930/3239]	Time 0.324 (0.520)	Data Time 0.001 (0.036)	Loss 2.9067 (2.8611)	Entropy 0.64842 (0.64855)	Top-1 acc 55.469 (55.144)	Top-5 acc 76.953 (77.593)	lr 0.01838
Train [42][940/3239]	Time 0.235 (0.519)	Data Time 0.001 (0.035)	Loss 2.6781 (2.8612)	Entropy 0.64823 (0.64855)	Top-1 acc 60.547 (55.152)	Top-5 acc 82.422 (77.582)	lr 0.01838
Train [42][950/3239]	Time 0.229 (0.518)	Data Time 0.001 (0.035)	Loss 3.0475 (2.8614)	Entropy 0.64771 (0.64854)	Top-1 acc 55.078 (55.151)	Top-5 acc 69.922 (77.579)	lr 0.01838
Train [42][960/3239]	Time 0.230 (0.517)	Data Time 0.001 (0.034)	Loss 2.7570 (2.8612)	Entropy 0.64797 (0.64853)	Top-1 acc 56.250 (55.147)	Top-5 acc 79.297 (77.588)	lr 0.01838
Train [42][970/3239]	Time 0.273 (0.516)	Data Time 0.001 (0.034)	Loss 2.7124 (2.8622)	Entropy 0.64786 (0.64853)	Top-1 acc 59.766 (55.129)	Top-5 acc 81.250 (77.568)	lr 0.01838
Train [42][980/3239]	Time 0.236 (0.515)	Data Time 0.001 (0.034)	Loss 2.8777 (2.8622)	Entropy 0.64780 (0.64852)	Top-1 acc 53.125 (55.122)	Top-5 acc 75.781 (77.567)	lr 0.01838
Train [42][990/3239]	Time 0.259 (0.514)	Data Time 0.001 (0.033)	Loss 2.9122 (2.8619)	Entropy 0.64779 (0.64851)	Top-1 acc 54.688 (55.124)	Top-5 acc 75.391 (77.574)	lr 0.01838
Train [42][1000/3239]	Time 0.238 (0.513)	Data Time 0.001 (0.033)	Loss 2.8343 (2.8614)	Entropy 0.64758 (0.64850)	Top-1 acc 56.641 (55.135)	Top-5 acc 78.125 (77.582)	lr 0.01838
Train [42][1010/3239]	Time 0.222 (0.512)	Data Time 0.001 (0.033)	Loss 2.7262 (2.8615)	Entropy 0.64798 (0.64850)	Top-1 acc 57.031 (55.133)	Top-5 acc 78.906 (77.575)	lr 0.01837
Train [42][1020/3239]	Time 0.269 (0.511)	Data Time 0.001 (0.033)	Loss 2.9073 (2.8616)	Entropy 0.64754 (0.64849)	Top-1 acc 55.469 (55.133)	Top-5 acc 76.172 (77.568)	lr 0.01837
Train [42][1030/3239]	Time 0.224 (0.510)	Data Time 0.001 (0.032)	Loss 2.9259 (2.8621)	Entropy 0.64736 (0.64848)	Top-1 acc 53.516 (55.122)	Top-5 acc 75.391 (77.559)	lr 0.01837
Train [42][1040/3239]	Time 0.222 (0.509)	Data Time 0.001 (0.032)	Loss 2.9160 (2.8620)	Entropy 0.64714 (0.64847)	Top-1 acc 53.516 (55.127)	Top-5 acc 75.781 (77.567)	lr 0.01837
Train [42][1050/3239]	Time 0.237 (0.508)	Data Time 0.001 (0.032)	Loss 3.1397 (2.8624)	Entropy 0.64712 (0.64846)	Top-1 acc 48.438 (55.129)	Top-5 acc 69.531 (77.554)	lr 0.01837
Train [42][1060/3239]	Time 0.234 (0.507)	Data Time 0.001 (0.031)	Loss 2.9152 (2.8629)	Entropy 0.64721 (0.64844)	Top-1 acc 52.734 (55.115)	Top-5 acc 77.734 (77.545)	lr 0.01837
Train [42][1070/3239]	Time 0.232 (0.507)	Data Time 0.001 (0.031)	Loss 2.8114 (2.8632)	Entropy 0.64689 (0.64843)	Top-1 acc 53.906 (55.107)	Top-5 acc 81.250 (77.544)	lr 0.01837
Train [42][1080/3239]	Time 0.237 (0.506)	Data Time 0.001 (0.031)	Loss 2.8265 (2.8629)	Entropy 0.64685 (0.64841)	Top-1 acc 57.422 (55.113)	Top-5 acc 79.297 (77.549)	lr 0.01837
Train [42][1090/3239]	Time 0.320 (0.505)	Data Time 0.001 (0.031)	Loss 2.8355 (2.8630)	Entropy 0.64671 (0.64840)	Top-1 acc 57.031 (55.104)	Top-5 acc 78.125 (77.552)	lr 0.01837
Train [42][1100/3239]	Time 0.226 (0.504)	Data Time 0.001 (0.030)	Loss 2.8773 (2.8631)	Entropy 0.64637 (0.64838)	Top-1 acc 53.125 (55.096)	Top-5 acc 76.172 (77.553)	lr 0.01837
Train [42][1110/3239]	Time 0.236 (0.503)	Data Time 0.001 (0.030)	Loss 2.8834 (2.8631)	Entropy 0.64642 (0.64837)	Top-1 acc 53.125 (55.102)	Top-5 acc 78.906 (77.554)	lr 0.01837
Train [42][1120/3239]	Time 0.228 (0.502)	Data Time 0.001 (0.030)	Loss 2.8526 (2.8639)	Entropy 0.64628 (0.64835)	Top-1 acc 56.641 (55.082)	Top-5 acc 77.734 (77.541)	lr 0.01836
Train [42][1130/3239]	Time 0.233 (0.502)	Data Time 0.001 (0.029)	Loss 2.9424 (2.8640)	Entropy 0.64602 (0.64833)	Top-1 acc 53.906 (55.085)	Top-5 acc 74.219 (77.535)	lr 0.01836
Train [42][1140/3239]	Time 0.248 (0.501)	Data Time 0.001 (0.029)	Loss 2.7972 (2.8640)	Entropy 0.64592 (0.64831)	Top-1 acc 55.859 (55.087)	Top-5 acc 78.125 (77.534)	lr 0.01836
Train [42][1150/3239]	Time 0.224 (0.500)	Data Time 0.001 (0.029)	Loss 2.7359 (2.8636)	Entropy 0.64579 (0.64829)	Top-1 acc 55.859 (55.099)	Top-5 acc 80.469 (77.544)	lr 0.01836
Train [42][1160/3239]	Time 0.323 (0.499)	Data Time 0.001 (0.029)	Loss 2.6365 (2.8632)	Entropy 0.64536 (0.64826)	Top-1 acc 65.625 (55.107)	Top-5 acc 80.078 (77.553)	lr 0.01836
Train [42][1170/3239]	Time 0.233 (0.498)	Data Time 0.001 (0.029)	Loss 2.7698 (2.8625)	Entropy 0.64562 (0.64824)	Top-1 acc 55.469 (55.118)	Top-5 acc 80.469 (77.570)	lr 0.01836
Train [42][1180/3239]	Time 0.230 (0.498)	Data Time 0.001 (0.028)	Loss 3.0805 (2.8626)	Entropy 0.64540 (0.64822)	Top-1 acc 51.172 (55.119)	Top-5 acc 75.391 (77.564)	lr 0.01836
Train [42][1190/3239]	Time 0.229 (0.497)	Data Time 0.001 (0.028)	Loss 2.8227 (2.8624)	Entropy 0.64548 (0.64819)	Top-1 acc 56.250 (55.127)	Top-5 acc 78.906 (77.578)	lr 0.01836
Train [42][1200/3239]	Time 0.266 (0.496)	Data Time 0.002 (0.028)	Loss 2.8469 (2.8624)	Entropy 0.64520 (0.64817)	Top-1 acc 55.859 (55.125)	Top-5 acc 78.906 (77.575)	lr 0.01836
Train [42][1210/3239]	Time 0.230 (0.495)	Data Time 0.001 (0.028)	Loss 2.8427 (2.8623)	Entropy 0.64520 (0.64815)	Top-1 acc 54.297 (55.117)	Top-5 acc 77.344 (77.579)	lr 0.01836
Train [42][1220/3239]	Time 0.226 (0.495)	Data Time 0.001 (0.027)	Loss 2.6733 (2.8627)	Entropy 0.64526 (0.64812)	Top-1 acc 61.719 (55.109)	Top-5 acc 80.859 (77.565)	lr 0.01836
Train [42][1230/3239]	Time 0.245 (0.494)	Data Time 0.001 (0.027)	Loss 2.9776 (2.8628)	Entropy 0.64526 (0.64810)	Top-1 acc 50.781 (55.107)	Top-5 acc 76.172 (77.567)	lr 0.01836
Train [42][1240/3239]	Time 0.231 (0.493)	Data Time 0.001 (0.027)	Loss 3.0397 (2.8631)	Entropy 0.64494 (0.64808)	Top-1 acc 51.953 (55.095)	Top-5 acc 69.922 (77.562)	lr 0.01835
Train [42][1250/3239]	Time 0.364 (0.492)	Data Time 0.001 (0.027)	Loss 2.7918 (2.8639)	Entropy 0.64489 (0.64805)	Top-1 acc 54.688 (55.077)	Top-5 acc 77.734 (77.541)	lr 0.01835
Train [42][1260/3239]	Time 0.258 (0.492)	Data Time 0.002 (0.027)	Loss 2.7364 (2.8637)	Entropy 0.64487 (0.64803)	Top-1 acc 59.375 (55.083)	Top-5 acc 79.688 (77.546)	lr 0.01835
Train [42][1270/3239]	Time 0.233 (0.491)	Data Time 0.001 (0.026)	Loss 3.1414 (2.8641)	Entropy 0.64491 (0.64800)	Top-1 acc 48.438 (55.067)	Top-5 acc 72.656 (77.538)	lr 0.01835
Train [42][1280/3239]	Time 0.235 (0.491)	Data Time 0.001 (0.026)	Loss 2.8319 (2.8637)	Entropy 0.64487 (0.64798)	Top-1 acc 57.422 (55.079)	Top-5 acc 78.906 (77.550)	lr 0.01835
Train [42][1290/3239]	Time 0.223 (0.490)	Data Time 0.001 (0.026)	Loss 3.0855 (2.8640)	Entropy 0.64482 (0.64795)	Top-1 acc 49.609 (55.068)	Top-5 acc 74.219 (77.542)	lr 0.01835
Train [42][1300/3239]	Time 0.228 (0.489)	Data Time 0.001 (0.026)	Loss 2.8847 (2.8644)	Entropy 0.64471 (0.64793)	Top-1 acc 54.297 (55.051)	Top-5 acc 76.172 (77.531)	lr 0.01835
Train [42][1310/3239]	Time 0.232 (0.489)	Data Time 0.001 (0.026)	Loss 2.9677 (2.8640)	Entropy 0.64461 (0.64790)	Top-1 acc 55.078 (55.064)	Top-5 acc 73.047 (77.542)	lr 0.01835
Train [42][1320/3239]	Time 0.317 (0.488)	Data Time 0.001 (0.025)	Loss 2.7371 (2.8642)	Entropy 0.64453 (0.64788)	Top-1 acc 62.500 (55.059)	Top-5 acc 78.516 (77.533)	lr 0.01835
Train [42][1330/3239]	Time 0.238 (0.487)	Data Time 0.001 (0.025)	Loss 2.9098 (2.8644)	Entropy 0.64407 (0.64785)	Top-1 acc 54.297 (55.054)	Top-5 acc 79.297 (77.533)	lr 0.01835
Train [42][1340/3239]	Time 0.235 (0.487)	Data Time 0.001 (0.025)	Loss 2.7260 (2.8650)	Entropy 0.64424 (0.64782)	Top-1 acc 60.547 (55.035)	Top-5 acc 79.297 (77.522)	lr 0.01835
Train [42][1350/3239]	Time 0.230 (0.486)	Data Time 0.001 (0.025)	Loss 2.8015 (2.8648)	Entropy 0.64415 (0.64780)	Top-1 acc 55.469 (55.038)	Top-5 acc 78.906 (77.529)	lr 0.01834
Train [42][1360/3239]	Time 0.228 (0.486)	Data Time 0.001 (0.025)	Loss 3.1159 (2.8649)	Entropy 0.64401 (0.64777)	Top-1 acc 52.734 (55.039)	Top-5 acc 73.828 (77.529)	lr 0.01834
Train [42][1370/3239]	Time 0.234 (0.485)	Data Time 0.001 (0.025)	Loss 2.7803 (2.8646)	Entropy 0.64419 (0.64774)	Top-1 acc 53.125 (55.042)	Top-5 acc 76.562 (77.527)	lr 0.01834
Train [42][1380/3239]	Time 0.226 (0.484)	Data Time 0.001 (0.024)	Loss 2.6751 (2.8645)	Entropy 0.64437 (0.64772)	Top-1 acc 60.938 (55.043)	Top-5 acc 80.859 (77.532)	lr 0.01834
Train [42][1390/3239]	Time 0.236 (0.484)	Data Time 0.001 (0.024)	Loss 2.7577 (2.8646)	Entropy 0.64476 (0.64770)	Top-1 acc 55.859 (55.038)	Top-5 acc 80.859 (77.527)	lr 0.01834
Train [42][1400/3239]	Time 0.239 (0.483)	Data Time 0.001 (0.024)	Loss 2.8076 (2.8643)	Entropy 0.64474 (0.64768)	Top-1 acc 57.812 (55.047)	Top-5 acc 77.734 (77.527)	lr 0.01834
Train [42][1410/3239]	Time 0.377 (0.506)	Data Time 0.002 (0.024)	Loss 2.9036 (2.8643)	Entropy 0.64482 (0.64766)	Top-1 acc 54.688 (55.047)	Top-5 acc 77.734 (77.529)	lr 0.01834
Train [42][1420/3239]	Time 0.290 (0.506)	Data Time 0.002 (0.024)	Loss 2.7361 (2.8643)	Entropy 0.64453 (0.64764)	Top-1 acc 58.594 (55.041)	Top-5 acc 82.031 (77.536)	lr 0.01834
Train [42][1430/3239]	Time 0.281 (0.505)	Data Time 0.002 (0.024)	Loss 3.1007 (2.8646)	Entropy 0.64452 (0.64761)	Top-1 acc 48.047 (55.035)	Top-5 acc 71.875 (77.526)	lr 0.01834
Train [42][1440/3239]	Time 0.246 (0.505)	Data Time 0.002 (0.024)	Loss 3.0352 (2.8641)	Entropy 0.64477 (0.64759)	Top-1 acc 49.219 (55.046)	Top-5 acc 72.656 (77.537)	lr 0.01834
Train [42][1450/3239]	Time 0.239 (0.505)	Data Time 0.002 (0.023)	Loss 2.8866 (2.8638)	Entropy 0.64427 (0.64757)	Top-1 acc 58.984 (55.066)	Top-5 acc 79.297 (77.546)	lr 0.01834
Train [42][1460/3239]	Time 0.239 (0.504)	Data Time 0.001 (0.023)	Loss 2.9253 (2.8640)	Entropy 0.64417 (0.64755)	Top-1 acc 52.734 (55.064)	Top-5 acc 79.688 (77.538)	lr 0.01833
Train [42][1470/3239]	Time 0.238 (0.504)	Data Time 0.001 (0.023)	Loss 2.7344 (2.8640)	Entropy 0.64430 (0.64753)	Top-1 acc 57.031 (55.061)	Top-5 acc 82.031 (77.543)	lr 0.01833
Train [42][1480/3239]	Time 0.341 (0.503)	Data Time 0.001 (0.023)	Loss 2.6558 (2.8641)	Entropy 0.64437 (0.64750)	Top-1 acc 63.281 (55.060)	Top-5 acc 82.031 (77.544)	lr 0.01833
Train [42][1490/3239]	Time 0.243 (0.503)	Data Time 0.001 (0.023)	Loss 2.9223 (2.8642)	Entropy 0.64436 (0.64748)	Top-1 acc 53.125 (55.060)	Top-5 acc 73.828 (77.546)	lr 0.01833
Train [42][1500/3239]	Time 0.250 (0.502)	Data Time 0.001 (0.023)	Loss 2.9311 (2.8644)	Entropy 0.64432 (0.64746)	Top-1 acc 51.562 (55.057)	Top-5 acc 75.781 (77.539)	lr 0.01833
Train [42][1510/3239]	Time 0.308 (0.502)	Data Time 0.001 (0.023)	Loss 2.8696 (2.8646)	Entropy 0.64414 (0.64744)	Top-1 acc 54.297 (55.053)	Top-5 acc 80.469 (77.540)	lr 0.01833
Train [42][1520/3239]	Time 0.316 (0.503)	Data Time 0.002 (0.022)	Loss 3.1180 (2.8652)	Entropy 0.64394 (0.64742)	Top-1 acc 50.391 (55.034)	Top-5 acc 71.875 (77.532)	lr 0.01833
Train [42][1530/3239]	Time 0.240 (0.502)	Data Time 0.001 (0.022)	Loss 2.8361 (2.8649)	Entropy 0.64390 (0.64740)	Top-1 acc 53.906 (55.039)	Top-5 acc 78.906 (77.539)	lr 0.01833
Train [42][1540/3239]	Time 0.230 (0.502)	Data Time 0.001 (0.022)	Loss 2.8865 (2.8652)	Entropy 0.64412 (0.64737)	Top-1 acc 53.125 (55.024)	Top-5 acc 76.562 (77.531)	lr 0.01833
Train [42][1550/3239]	Time 0.283 (0.501)	Data Time 0.001 (0.022)	Loss 2.8641 (2.8650)	Entropy 0.64428 (0.64735)	Top-1 acc 56.641 (55.030)	Top-5 acc 77.344 (77.536)	lr 0.01833
Train [42][1560/3239]	Time 0.311 (0.501)	Data Time 0.001 (0.022)	Loss 2.8881 (2.8649)	Entropy 0.64431 (0.64733)	Top-1 acc 56.250 (55.037)	Top-5 acc 75.391 (77.534)	lr 0.01833
Train [42][1570/3239]	Time 0.270 (0.501)	Data Time 0.001 (0.022)	Loss 2.9677 (2.8646)	Entropy 0.64393 (0.64731)	Top-1 acc 51.953 (55.040)	Top-5 acc 75.781 (77.542)	lr 0.01832
Train [42][1580/3239]	Time 0.234 (0.500)	Data Time 0.001 (0.022)	Loss 3.0497 (2.8653)	Entropy 0.64438 (0.64729)	Top-1 acc 48.438 (55.026)	Top-5 acc 75.391 (77.525)	lr 0.01832
Train [42][1590/3239]	Time 0.239 (0.500)	Data Time 0.001 (0.021)	Loss 2.7644 (2.8657)	Entropy 0.64425 (0.64728)	Top-1 acc 56.641 (55.014)	Top-5 acc 80.078 (77.518)	lr 0.01832
Train [42][1600/3239]	Time 0.296 (0.500)	Data Time 0.001 (0.021)	Loss 2.7780 (2.8654)	Entropy 0.64403 (0.64726)	Top-1 acc 57.812 (55.018)	Top-5 acc 78.125 (77.520)	lr 0.01832
Train [42][1610/3239]	Time 0.248 (0.499)	Data Time 0.001 (0.021)	Loss 2.8637 (2.8659)	Entropy 0.64369 (0.64724)	Top-1 acc 53.906 (55.007)	Top-5 acc 78.516 (77.516)	lr 0.01832
Train [42][1620/3239]	Time 0.232 (0.499)	Data Time 0.001 (0.021)	Loss 2.9766 (2.8658)	Entropy 0.64356 (0.64721)	Top-1 acc 52.734 (55.013)	Top-5 acc 76.562 (77.519)	lr 0.01832
Train [42][1630/3239]	Time 0.249 (0.499)	Data Time 0.002 (0.021)	Loss 2.7938 (2.8660)	Entropy 0.64350 (0.64719)	Top-1 acc 54.688 (55.006)	Top-5 acc 77.734 (77.517)	lr 0.01832
Train [42][1640/3239]	Time 0.347 (0.498)	Data Time 0.001 (0.021)	Loss 2.8300 (2.8663)	Entropy 0.64375 (0.64717)	Top-1 acc 57.031 (54.999)	Top-5 acc 79.297 (77.510)	lr 0.01832
Train [42][1650/3239]	Time 0.232 (0.498)	Data Time 0.002 (0.021)	Loss 2.7397 (2.8665)	Entropy 0.64372 (0.64715)	Top-1 acc 55.469 (54.989)	Top-5 acc 78.516 (77.509)	lr 0.01832
Train [42][1660/3239]	Time 0.240 (0.498)	Data Time 0.001 (0.021)	Loss 2.9071 (2.8666)	Entropy 0.64353 (0.64713)	Top-1 acc 54.688 (54.987)	Top-5 acc 78.125 (77.511)	lr 0.01832
Train [42][1670/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.021)	Loss 2.7300 (2.8668)	Entropy 0.64356 (0.64710)	Top-1 acc 55.469 (54.982)	Top-5 acc 77.734 (77.505)	lr 0.01832
Train [42][1680/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.020)	Loss 2.9050 (2.8672)	Entropy 0.64328 (0.64708)	Top-1 acc 51.953 (54.975)	Top-5 acc 77.734 (77.495)	lr 0.01831
Train [42][1690/3239]	Time 0.233 (0.496)	Data Time 0.001 (0.020)	Loss 2.9339 (2.8672)	Entropy 0.64342 (0.64706)	Top-1 acc 51.953 (54.980)	Top-5 acc 76.953 (77.495)	lr 0.01831
Train [42][1700/3239]	Time 0.269 (0.496)	Data Time 0.003 (0.020)	Loss 2.8017 (2.8675)	Entropy 0.64334 (0.64704)	Top-1 acc 59.375 (54.984)	Top-5 acc 78.516 (77.487)	lr 0.01831
Train [42][1710/3239]	Time 0.332 (0.495)	Data Time 0.001 (0.020)	Loss 3.1468 (2.8678)	Entropy 0.64326 (0.64702)	Top-1 acc 50.000 (54.977)	Top-5 acc 73.047 (77.480)	lr 0.01831
Train [42][1720/3239]	Time 0.259 (0.495)	Data Time 0.001 (0.020)	Loss 2.7538 (2.8678)	Entropy 0.64341 (0.64700)	Top-1 acc 56.641 (54.977)	Top-5 acc 80.469 (77.482)	lr 0.01831
Train [42][1730/3239]	Time 0.225 (0.494)	Data Time 0.001 (0.020)	Loss 3.1414 (2.8681)	Entropy 0.64348 (0.64698)	Top-1 acc 50.000 (54.966)	Top-5 acc 71.875 (77.474)	lr 0.01831
Train [42][1740/3239]	Time 0.227 (0.494)	Data Time 0.001 (0.020)	Loss 2.6632 (2.8683)	Entropy 0.64357 (0.64696)	Top-1 acc 59.766 (54.963)	Top-5 acc 83.984 (77.473)	lr 0.01831
Train [42][1750/3239]	Time 0.284 (0.493)	Data Time 0.002 (0.020)	Loss 2.9999 (2.8683)	Entropy 0.64347 (0.64694)	Top-1 acc 50.391 (54.967)	Top-5 acc 76.953 (77.470)	lr 0.01831
Train [42][1760/3239]	Time 0.224 (0.493)	Data Time 0.001 (0.020)	Loss 3.0541 (2.8684)	Entropy 0.64349 (0.64692)	Top-1 acc 51.562 (54.965)	Top-5 acc 75.781 (77.468)	lr 0.01831
Train [42][1770/3239]	Time 0.215 (0.492)	Data Time 0.001 (0.019)	Loss 3.0092 (2.8686)	Entropy 0.64357 (0.64690)	Top-1 acc 53.516 (54.962)	Top-5 acc 76.953 (77.466)	lr 0.01831
Train [42][1780/3239]	Time 0.240 (0.492)	Data Time 0.001 (0.019)	Loss 2.8612 (2.8686)	Entropy 0.64347 (0.64688)	Top-1 acc 54.297 (54.958)	Top-5 acc 75.781 (77.468)	lr 0.01831
Train [42][1790/3239]	Time 0.236 (0.491)	Data Time 0.003 (0.019)	Loss 3.1741 (2.8695)	Entropy 0.64363 (0.64686)	Top-1 acc 48.438 (54.937)	Top-5 acc 71.094 (77.454)	lr 0.01830
Train [42][1800/3239]	Time 0.329 (0.491)	Data Time 0.001 (0.019)	Loss 2.9263 (2.8698)	Entropy 0.64388 (0.64684)	Top-1 acc 54.688 (54.931)	Top-5 acc 75.781 (77.443)	lr 0.01830
Train [42][1810/3239]	Time 0.264 (0.491)	Data Time 0.001 (0.019)	Loss 3.1283 (2.8700)	Entropy 0.64363 (0.64683)	Top-1 acc 45.312 (54.925)	Top-5 acc 74.219 (77.440)	lr 0.01830
Train [42][1820/3239]	Time 0.233 (0.490)	Data Time 0.001 (0.019)	Loss 2.7227 (2.8696)	Entropy 0.64346 (0.64681)	Top-1 acc 58.594 (54.936)	Top-5 acc 79.688 (77.445)	lr 0.01830
Train [42][1830/3239]	Time 0.237 (0.490)	Data Time 0.001 (0.019)	Loss 2.7375 (2.8695)	Entropy 0.64348 (0.64679)	Top-1 acc 58.594 (54.934)	Top-5 acc 81.641 (77.447)	lr 0.01830
Train [42][1840/3239]	Time 0.232 (0.489)	Data Time 0.001 (0.019)	Loss 2.8286 (2.8695)	Entropy 0.64349 (0.64677)	Top-1 acc 57.031 (54.936)	Top-5 acc 76.953 (77.445)	lr 0.01830
Train [42][1850/3239]	Time 0.240 (0.489)	Data Time 0.001 (0.019)	Loss 3.0394 (2.8697)	Entropy 0.64382 (0.64676)	Top-1 acc 52.734 (54.935)	Top-5 acc 72.656 (77.439)	lr 0.01830
Train [42][1860/3239]	Time 0.230 (0.488)	Data Time 0.001 (0.019)	Loss 2.9071 (2.8695)	Entropy 0.64332 (0.64674)	Top-1 acc 51.172 (54.930)	Top-5 acc 73.438 (77.443)	lr 0.01830
Train [42][1870/3239]	Time 0.394 (0.488)	Data Time 0.001 (0.019)	Loss 2.9430 (2.8691)	Entropy 0.64362 (0.64672)	Top-1 acc 54.688 (54.941)	Top-5 acc 75.391 (77.453)	lr 0.01830
Train [42][1880/3239]	Time 0.236 (0.488)	Data Time 0.001 (0.018)	Loss 2.9074 (2.8692)	Entropy 0.64386 (0.64670)	Top-1 acc 54.297 (54.933)	Top-5 acc 75.000 (77.453)	lr 0.01830
Train [42][1890/3239]	Time 0.275 (0.487)	Data Time 0.001 (0.018)	Loss 2.9082 (2.8692)	Entropy 0.64414 (0.64669)	Top-1 acc 54.297 (54.934)	Top-5 acc 74.609 (77.454)	lr 0.01830
Train [42][1900/3239]	Time 0.231 (0.487)	Data Time 0.001 (0.018)	Loss 2.8121 (2.8689)	Entropy 0.64406 (0.64668)	Top-1 acc 56.250 (54.943)	Top-5 acc 77.344 (77.460)	lr 0.01830
Train [42][1910/3239]	Time 0.238 (0.486)	Data Time 0.001 (0.018)	Loss 2.9413 (2.8692)	Entropy 0.64421 (0.64666)	Top-1 acc 51.172 (54.928)	Top-5 acc 71.094 (77.456)	lr 0.01829
Train [42][1920/3239]	Time 0.230 (0.486)	Data Time 0.001 (0.018)	Loss 2.9740 (2.8691)	Entropy 0.64430 (0.64665)	Top-1 acc 52.344 (54.933)	Top-5 acc 75.000 (77.458)	lr 0.01829
Train [42][1930/3239]	Time 0.229 (0.486)	Data Time 0.001 (0.018)	Loss 2.8653 (2.8693)	Entropy 0.64427 (0.64664)	Top-1 acc 52.344 (54.927)	Top-5 acc 77.734 (77.454)	lr 0.01829
Train [42][1940/3239]	Time 0.231 (0.486)	Data Time 0.001 (0.018)	Loss 2.7062 (2.8691)	Entropy 0.64441 (0.64663)	Top-1 acc 59.375 (54.935)	Top-5 acc 80.859 (77.459)	lr 0.01829
Train [42][1950/3239]	Time 0.229 (0.485)	Data Time 0.001 (0.018)	Loss 2.9486 (2.8691)	Entropy 0.64419 (0.64662)	Top-1 acc 54.297 (54.936)	Top-5 acc 73.047 (77.460)	lr 0.01829
Train [42][1960/3239]	Time 0.352 (0.485)	Data Time 0.001 (0.018)	Loss 2.8100 (2.8693)	Entropy 0.64413 (0.64660)	Top-1 acc 58.594 (54.936)	Top-5 acc 76.953 (77.457)	lr 0.01829
Train [42][1970/3239]	Time 0.240 (0.484)	Data Time 0.002 (0.018)	Loss 2.8946 (2.8691)	Entropy 0.64439 (0.64659)	Top-1 acc 55.469 (54.944)	Top-5 acc 77.344 (77.461)	lr 0.01829
Train [42][1980/3239]	Time 0.232 (0.484)	Data Time 0.001 (0.018)	Loss 2.7061 (2.8686)	Entropy 0.64462 (0.64658)	Top-1 acc 60.938 (54.959)	Top-5 acc 80.078 (77.473)	lr 0.01829
Train [42][1990/3239]	Time 0.232 (0.484)	Data Time 0.001 (0.018)	Loss 2.5016 (2.8687)	Entropy 0.64443 (0.64657)	Top-1 acc 64.844 (54.955)	Top-5 acc 84.375 (77.469)	lr 0.01829
Train [42][2000/3239]	Time 0.244 (0.483)	Data Time 0.001 (0.017)	Loss 3.0110 (2.8691)	Entropy 0.64478 (0.64656)	Top-1 acc 50.000 (54.946)	Top-5 acc 75.781 (77.459)	lr 0.01829
Train [42][2010/3239]	Time 0.236 (0.483)	Data Time 0.001 (0.017)	Loss 2.9983 (2.8692)	Entropy 0.64450 (0.64655)	Top-1 acc 51.172 (54.938)	Top-5 acc 73.047 (77.460)	lr 0.01829
Train [42][2020/3239]	Time 0.230 (0.483)	Data Time 0.001 (0.017)	Loss 3.0069 (2.8694)	Entropy 0.64486 (0.64654)	Top-1 acc 53.906 (54.934)	Top-5 acc 75.781 (77.459)	lr 0.01828
Train [42][2030/3239]	Time 0.323 (0.482)	Data Time 0.001 (0.017)	Loss 2.8513 (2.8694)	Entropy 0.64470 (0.64653)	Top-1 acc 53.125 (54.934)	Top-5 acc 76.953 (77.460)	lr 0.01828
Train [42][2040/3239]	Time 0.232 (0.482)	Data Time 0.001 (0.017)	Loss 2.8528 (2.8694)	Entropy 0.64460 (0.64652)	Top-1 acc 55.078 (54.928)	Top-5 acc 78.906 (77.463)	lr 0.01828
Train [42][2050/3239]	Time 0.235 (0.481)	Data Time 0.001 (0.017)	Loss 2.8041 (2.8694)	Entropy 0.64441 (0.64651)	Top-1 acc 55.859 (54.931)	Top-5 acc 79.688 (77.465)	lr 0.01828
Train [42][2060/3239]	Time 0.362 (0.497)	Data Time 0.005 (0.017)	Loss 2.7401 (2.8694)	Entropy 0.64447 (0.64650)	Top-1 acc 62.891 (54.934)	Top-5 acc 82.031 (77.464)	lr 0.01828
Train [42][2070/3239]	Time 0.246 (0.497)	Data Time 0.002 (0.017)	Loss 2.7300 (2.8692)	Entropy 0.64457 (0.64649)	Top-1 acc 53.906 (54.940)	Top-5 acc 78.125 (77.463)	lr 0.01828
Train [42][2080/3239]	Time 0.271 (0.497)	Data Time 0.001 (0.017)	Loss 3.0081 (2.8692)	Entropy 0.64458 (0.64648)	Top-1 acc 48.828 (54.932)	Top-5 acc 73.828 (77.462)	lr 0.01828
Train [42][2090/3239]	Time 0.242 (0.496)	Data Time 0.001 (0.017)	Loss 2.9374 (2.8691)	Entropy 0.64415 (0.64647)	Top-1 acc 53.125 (54.934)	Top-5 acc 76.172 (77.462)	lr 0.01828
Train [42][2100/3239]	Time 0.238 (0.496)	Data Time 0.001 (0.017)	Loss 3.0164 (2.8690)	Entropy 0.64394 (0.64646)	Top-1 acc 52.344 (54.941)	Top-5 acc 74.609 (77.465)	lr 0.01828
Train [42][2110/3239]	Time 0.238 (0.496)	Data Time 0.001 (0.017)	Loss 3.0339 (2.8689)	Entropy 0.64403 (0.64645)	Top-1 acc 53.516 (54.945)	Top-5 acc 75.000 (77.467)	lr 0.01828
Train [42][2120/3239]	Time 0.328 (0.495)	Data Time 0.001 (0.017)	Loss 2.9802 (2.8690)	Entropy 0.64393 (0.64644)	Top-1 acc 53.516 (54.943)	Top-5 acc 74.609 (77.461)	lr 0.01828
Train [42][2130/3239]	Time 0.287 (0.495)	Data Time 0.001 (0.016)	Loss 2.9065 (2.8689)	Entropy 0.64340 (0.64643)	Top-1 acc 51.172 (54.939)	Top-5 acc 77.734 (77.463)	lr 0.01827
Train [42][2140/3239]	Time 0.260 (0.495)	Data Time 0.001 (0.016)	Loss 3.0072 (2.8692)	Entropy 0.64320 (0.64641)	Top-1 acc 50.391 (54.936)	Top-5 acc 76.953 (77.461)	lr 0.01827
Train [42][2150/3239]	Time 0.274 (0.495)	Data Time 0.001 (0.016)	Loss 2.6827 (2.8691)	Entropy 0.64322 (0.64640)	Top-1 acc 59.375 (54.936)	Top-5 acc 80.859 (77.459)	lr 0.01827
Train [42][2160/3239]	Time 0.291 (0.494)	Data Time 0.001 (0.016)	Loss 3.0470 (2.8691)	Entropy 0.64351 (0.64638)	Top-1 acc 49.609 (54.939)	Top-5 acc 71.875 (77.457)	lr 0.01827
Train [42][2170/3239]	Time 0.257 (0.494)	Data Time 0.001 (0.016)	Loss 2.5997 (2.8690)	Entropy 0.64365 (0.64637)	Top-1 acc 61.719 (54.937)	Top-5 acc 84.375 (77.459)	lr 0.01827
Train [42][2180/3239]	Time 0.237 (0.494)	Data Time 0.001 (0.016)	Loss 2.8513 (2.8691)	Entropy 0.64373 (0.64636)	Top-1 acc 56.250 (54.934)	Top-5 acc 79.688 (77.456)	lr 0.01827
Train [42][2190/3239]	Time 0.345 (0.493)	Data Time 0.001 (0.016)	Loss 2.9919 (2.8691)	Entropy 0.64359 (0.64635)	Top-1 acc 48.438 (54.927)	Top-5 acc 73.828 (77.455)	lr 0.01827
Train [42][2200/3239]	Time 0.260 (0.493)	Data Time 0.001 (0.016)	Loss 2.9297 (2.8691)	Entropy 0.64333 (0.64633)	Top-1 acc 51.953 (54.926)	Top-5 acc 73.828 (77.456)	lr 0.01827
Train [42][2210/3239]	Time 0.298 (0.493)	Data Time 0.001 (0.016)	Loss 2.6806 (2.8690)	Entropy 0.64298 (0.64632)	Top-1 acc 59.375 (54.930)	Top-5 acc 82.812 (77.459)	lr 0.01827
Train [42][2220/3239]	Time 0.226 (0.492)	Data Time 0.001 (0.016)	Loss 2.9112 (2.8690)	Entropy 0.64329 (0.64631)	Top-1 acc 51.562 (54.927)	Top-5 acc 75.781 (77.456)	lr 0.01827
Train [42][2230/3239]	Time 0.228 (0.492)	Data Time 0.001 (0.016)	Loss 2.8552 (2.8693)	Entropy 0.64324 (0.64629)	Top-1 acc 60.156 (54.920)	Top-5 acc 77.734 (77.453)	lr 0.01827
Train [42][2240/3239]	Time 0.261 (0.492)	Data Time 0.001 (0.016)	Loss 3.0596 (2.8691)	Entropy 0.64305 (0.64628)	Top-1 acc 49.609 (54.925)	Top-5 acc 76.172 (77.460)	lr 0.01826
Train [42][2250/3239]	Time 0.230 (0.491)	Data Time 0.001 (0.016)	Loss 2.7332 (2.8691)	Entropy 0.64293 (0.64626)	Top-1 acc 56.641 (54.924)	Top-5 acc 82.031 (77.461)	lr 0.01826
Train [42][2260/3239]	Time 0.285 (0.491)	Data Time 0.001 (0.016)	Loss 2.8162 (2.8688)	Entropy 0.64285 (0.64625)	Top-1 acc 53.125 (54.928)	Top-5 acc 79.688 (77.468)	lr 0.01826
Train [42][2270/3239]	Time 0.238 (0.491)	Data Time 0.001 (0.016)	Loss 2.9288 (2.8690)	Entropy 0.64280 (0.64623)	Top-1 acc 55.078 (54.920)	Top-5 acc 74.219 (77.466)	lr 0.01826
Train [42][2280/3239]	Time 0.233 (0.490)	Data Time 0.001 (0.015)	Loss 2.9223 (2.8690)	Entropy 0.64297 (0.64622)	Top-1 acc 51.953 (54.921)	Top-5 acc 79.688 (77.469)	lr 0.01826
Train [42][2290/3239]	Time 0.256 (0.490)	Data Time 0.001 (0.015)	Loss 2.8938 (2.8689)	Entropy 0.64299 (0.64620)	Top-1 acc 55.859 (54.925)	Top-5 acc 78.906 (77.470)	lr 0.01826
Train [42][2300/3239]	Time 0.237 (0.490)	Data Time 0.001 (0.015)	Loss 2.9082 (2.8686)	Entropy 0.64252 (0.64619)	Top-1 acc 55.078 (54.933)	Top-5 acc 76.172 (77.470)	lr 0.01826
Train [42][2310/3239]	Time 0.227 (0.490)	Data Time 0.001 (0.015)	Loss 2.9702 (2.8687)	Entropy 0.64246 (0.64617)	Top-1 acc 54.688 (54.934)	Top-5 acc 74.219 (77.470)	lr 0.01826
Train [42][2320/3239]	Time 0.278 (0.489)	Data Time 0.001 (0.015)	Loss 2.7009 (2.8683)	Entropy 0.64246 (0.64616)	Top-1 acc 59.766 (54.942)	Top-5 acc 79.688 (77.474)	lr 0.01826
Train [42][2330/3239]	Time 0.229 (0.489)	Data Time 0.001 (0.015)	Loss 2.7946 (2.8684)	Entropy 0.64243 (0.64614)	Top-1 acc 57.031 (54.944)	Top-5 acc 77.734 (77.471)	lr 0.01826
Train [42][2340/3239]	Time 0.237 (0.489)	Data Time 0.001 (0.015)	Loss 2.6901 (2.8686)	Entropy 0.64268 (0.64613)	Top-1 acc 59.375 (54.939)	Top-5 acc 80.078 (77.465)	lr 0.01826
Train [42][2350/3239]	Time 0.337 (0.489)	Data Time 0.001 (0.015)	Loss 2.9094 (2.8683)	Entropy 0.64280 (0.64611)	Top-1 acc 55.469 (54.947)	Top-5 acc 75.391 (77.469)	lr 0.01825
Train [42][2360/3239]	Time 0.228 (0.488)	Data Time 0.001 (0.015)	Loss 2.9486 (2.8683)	Entropy 0.64258 (0.64610)	Top-1 acc 54.688 (54.954)	Top-5 acc 76.953 (77.469)	lr 0.01825
Train [42][2370/3239]	Time 0.247 (0.488)	Data Time 0.001 (0.015)	Loss 2.9464 (2.8683)	Entropy 0.64279 (0.64608)	Top-1 acc 50.391 (54.950)	Top-5 acc 73.828 (77.467)	lr 0.01825
Train [42][2380/3239]	Time 0.235 (0.488)	Data Time 0.001 (0.015)	Loss 2.8216 (2.8685)	Entropy 0.64272 (0.64607)	Top-1 acc 55.078 (54.945)	Top-5 acc 77.344 (77.463)	lr 0.01825
Train [42][2390/3239]	Time 0.274 (0.487)	Data Time 0.001 (0.015)	Loss 2.9912 (2.8686)	Entropy 0.64269 (0.64606)	Top-1 acc 53.906 (54.948)	Top-5 acc 77.344 (77.463)	lr 0.01825
Train [42][2400/3239]	Time 0.245 (0.487)	Data Time 0.001 (0.015)	Loss 2.8921 (2.8687)	Entropy 0.64292 (0.64604)	Top-1 acc 53.906 (54.945)	Top-5 acc 78.906 (77.460)	lr 0.01825
Train [42][2410/3239]	Time 0.235 (0.487)	Data Time 0.001 (0.015)	Loss 2.7041 (2.8687)	Entropy 0.64300 (0.64603)	Top-1 acc 58.594 (54.946)	Top-5 acc 82.812 (77.464)	lr 0.01825
Train [42][2420/3239]	Time 0.333 (0.487)	Data Time 0.001 (0.015)	Loss 2.9551 (2.8687)	Entropy 0.64314 (0.64602)	Top-1 acc 53.125 (54.948)	Top-5 acc 73.438 (77.462)	lr 0.01825
Train [42][2430/3239]	Time 0.262 (0.486)	Data Time 0.001 (0.015)	Loss 2.9532 (2.8685)	Entropy 0.64335 (0.64601)	Top-1 acc 53.906 (54.954)	Top-5 acc 75.781 (77.466)	lr 0.01825
Train [42][2440/3239]	Time 0.234 (0.486)	Data Time 0.001 (0.015)	Loss 2.8148 (2.8688)	Entropy 0.64312 (0.64599)	Top-1 acc 55.078 (54.947)	Top-5 acc 76.172 (77.457)	lr 0.01825
Train [42][2450/3239]	Time 0.241 (0.486)	Data Time 0.001 (0.015)	Loss 2.8244 (2.8686)	Entropy 0.64339 (0.64598)	Top-1 acc 55.469 (54.952)	Top-5 acc 75.000 (77.456)	lr 0.01825
Train [42][2460/3239]	Time 0.229 (0.486)	Data Time 0.001 (0.014)	Loss 2.8905 (2.8687)	Entropy 0.64316 (0.64597)	Top-1 acc 53.906 (54.950)	Top-5 acc 77.344 (77.456)	lr 0.01824
Train [42][2470/3239]	Time 0.233 (0.485)	Data Time 0.001 (0.014)	Loss 2.9812 (2.8686)	Entropy 0.64308 (0.64596)	Top-1 acc 53.516 (54.953)	Top-5 acc 74.219 (77.456)	lr 0.01824
Train [42][2480/3239]	Time 0.227 (0.485)	Data Time 0.001 (0.014)	Loss 2.8714 (2.8684)	Entropy 0.64310 (0.64595)	Top-1 acc 57.031 (54.954)	Top-5 acc 76.562 (77.461)	lr 0.01824
Train [42][2490/3239]	Time 0.230 (0.485)	Data Time 0.001 (0.014)	Loss 2.9946 (2.8682)	Entropy 0.64294 (0.64594)	Top-1 acc 51.172 (54.960)	Top-5 acc 72.266 (77.461)	lr 0.01824
Train [42][2500/3239]	Time 0.240 (0.484)	Data Time 0.001 (0.014)	Loss 3.0071 (2.8682)	Entropy 0.64278 (0.64593)	Top-1 acc 49.609 (54.963)	Top-5 acc 74.219 (77.462)	lr 0.01824
Train [42][2510/3239]	Time 0.326 (0.484)	Data Time 0.001 (0.014)	Loss 2.9068 (2.8681)	Entropy 0.64262 (0.64591)	Top-1 acc 56.641 (54.967)	Top-5 acc 75.391 (77.463)	lr 0.01824
Train [42][2520/3239]	Time 0.229 (0.484)	Data Time 0.001 (0.014)	Loss 2.9754 (2.8683)	Entropy 0.64239 (0.64590)	Top-1 acc 54.688 (54.964)	Top-5 acc 73.828 (77.457)	lr 0.01824
Train [42][2530/3239]	Time 0.237 (0.483)	Data Time 0.001 (0.014)	Loss 2.6853 (2.8682)	Entropy 0.64211 (0.64588)	Top-1 acc 58.984 (54.968)	Top-5 acc 79.297 (77.456)	lr 0.01824
Train [42][2540/3239]	Time 0.234 (0.483)	Data Time 0.001 (0.014)	Loss 2.7663 (2.8682)	Entropy 0.64181 (0.64587)	Top-1 acc 56.250 (54.963)	Top-5 acc 78.906 (77.453)	lr 0.01824
Train [42][2550/3239]	Time 0.235 (0.483)	Data Time 0.001 (0.014)	Loss 2.7858 (2.8684)	Entropy 0.64202 (0.64585)	Top-1 acc 54.297 (54.958)	Top-5 acc 81.250 (77.450)	lr 0.01824
Train [42][2560/3239]	Time 0.257 (0.483)	Data Time 0.001 (0.014)	Loss 2.7058 (2.8685)	Entropy 0.64239 (0.64584)	Top-1 acc 58.594 (54.952)	Top-5 acc 80.078 (77.448)	lr 0.01824
Train [42][2570/3239]	Time 0.224 (0.482)	Data Time 0.001 (0.014)	Loss 2.6966 (2.8684)	Entropy 0.64197 (0.64583)	Top-1 acc 58.594 (54.954)	Top-5 acc 78.125 (77.452)	lr 0.01824
Train [42][2580/3239]	Time 0.326 (0.482)	Data Time 0.001 (0.014)	Loss 2.7739 (2.8682)	Entropy 0.64199 (0.64581)	Top-1 acc 57.422 (54.958)	Top-5 acc 78.516 (77.456)	lr 0.01823
Train [42][2590/3239]	Time 0.229 (0.482)	Data Time 0.001 (0.014)	Loss 2.8703 (2.8681)	Entropy 0.64237 (0.64580)	Top-1 acc 54.297 (54.955)	Top-5 acc 76.953 (77.458)	lr 0.01823
Train [42][2600/3239]	Time 0.226 (0.481)	Data Time 0.001 (0.014)	Loss 3.1996 (2.8680)	Entropy 0.64217 (0.64578)	Top-1 acc 45.703 (54.956)	Top-5 acc 70.312 (77.459)	lr 0.01823
Train [42][2610/3239]	Time 0.234 (0.481)	Data Time 0.001 (0.014)	Loss 2.8893 (2.8681)	Entropy 0.64220 (0.64577)	Top-1 acc 56.641 (54.954)	Top-5 acc 77.344 (77.455)	lr 0.01823
Train [42][2620/3239]	Time 0.228 (0.481)	Data Time 0.001 (0.014)	Loss 2.8496 (2.8680)	Entropy 0.64217 (0.64575)	Top-1 acc 55.078 (54.953)	Top-5 acc 77.734 (77.455)	lr 0.01823
Train [42][2630/3239]	Time 0.234 (0.481)	Data Time 0.001 (0.014)	Loss 2.7071 (2.8678)	Entropy 0.64219 (0.64574)	Top-1 acc 57.422 (54.958)	Top-5 acc 81.641 (77.461)	lr 0.01823
Train [42][2640/3239]	Time 0.234 (0.480)	Data Time 0.001 (0.014)	Loss 2.6796 (2.8676)	Entropy 0.64231 (0.64573)	Top-1 acc 61.719 (54.965)	Top-5 acc 81.641 (77.463)	lr 0.01823
Train [42][2650/3239]	Time 0.233 (0.480)	Data Time 0.001 (0.014)	Loss 2.8900 (2.8677)	Entropy 0.64228 (0.64571)	Top-1 acc 55.859 (54.962)	Top-5 acc 74.609 (77.461)	lr 0.01823
Train [42][2660/3239]	Time 0.241 (0.480)	Data Time 0.001 (0.014)	Loss 2.7333 (2.8677)	Entropy 0.64224 (0.64570)	Top-1 acc 56.641 (54.963)	Top-5 acc 82.422 (77.459)	lr 0.01823
Train [42][2670/3239]	Time 0.258 (0.479)	Data Time 0.001 (0.013)	Loss 2.8264 (2.8677)	Entropy 0.64228 (0.64569)	Top-1 acc 56.250 (54.963)	Top-5 acc 76.953 (77.461)	lr 0.01823
Train [42][2680/3239]	Time 0.237 (0.479)	Data Time 0.001 (0.013)	Loss 2.7895 (2.8677)	Entropy 0.64232 (0.64568)	Top-1 acc 61.328 (54.967)	Top-5 acc 80.078 (77.461)	lr 0.01823
Train [42][2690/3239]	Time 0.231 (0.479)	Data Time 0.001 (0.013)	Loss 2.9463 (2.8677)	Entropy 0.64224 (0.64566)	Top-1 acc 51.562 (54.967)	Top-5 acc 74.219 (77.463)	lr 0.01822
Train [42][2700/3239]	Time 0.268 (0.479)	Data Time 0.002 (0.013)	Loss 2.9235 (2.8675)	Entropy 0.64245 (0.64565)	Top-1 acc 56.641 (54.971)	Top-5 acc 75.391 (77.466)	lr 0.01822
Train [42][2710/3239]	Time 0.256 (0.479)	Data Time 0.001 (0.013)	Loss 3.0253 (2.8677)	Entropy 0.64219 (0.64564)	Top-1 acc 49.219 (54.971)	Top-5 acc 75.391 (77.464)	lr 0.01822
Train [42][2720/3239]	Time 0.441 (0.490)	Data Time 0.025 (0.013)	Loss 2.8006 (2.8675)	Entropy 0.64199 (0.64563)	Top-1 acc 55.078 (54.977)	Top-5 acc 80.078 (77.465)	lr 0.01822
Train [42][2730/3239]	Time 0.257 (0.491)	Data Time 0.002 (0.013)	Loss 2.8533 (2.8676)	Entropy 0.64207 (0.64561)	Top-1 acc 50.000 (54.970)	Top-5 acc 79.688 (77.463)	lr 0.01822
Train [42][2740/3239]	Time 0.415 (0.491)	Data Time 0.001 (0.013)	Loss 2.9604 (2.8676)	Entropy 0.64238 (0.64560)	Top-1 acc 52.344 (54.970)	Top-5 acc 73.828 (77.463)	lr 0.01822
Train [42][2750/3239]	Time 0.229 (0.490)	Data Time 0.001 (0.013)	Loss 2.7969 (2.8677)	Entropy 0.64236 (0.64559)	Top-1 acc 56.250 (54.970)	Top-5 acc 77.344 (77.459)	lr 0.01822
Train [42][2760/3239]	Time 0.244 (0.490)	Data Time 0.001 (0.013)	Loss 2.9405 (2.8676)	Entropy 0.64262 (0.64558)	Top-1 acc 51.953 (54.973)	Top-5 acc 79.297 (77.460)	lr 0.01822
Train [42][2770/3239]	Time 0.242 (0.490)	Data Time 0.001 (0.013)	Loss 2.8098 (2.8677)	Entropy 0.64258 (0.64557)	Top-1 acc 57.031 (54.973)	Top-5 acc 80.078 (77.459)	lr 0.01822
Train [42][2780/3239]	Time 0.334 (0.490)	Data Time 0.002 (0.013)	Loss 2.8412 (2.8678)	Entropy 0.64264 (0.64555)	Top-1 acc 53.906 (54.975)	Top-5 acc 77.344 (77.461)	lr 0.01822
Train [42][2790/3239]	Time 0.315 (0.491)	Data Time 0.003 (0.013)	Loss 2.7630 (2.8677)	Entropy 0.64271 (0.64554)	Top-1 acc 55.469 (54.975)	Top-5 acc 79.297 (77.460)	lr 0.01822
Train [42][2800/3239]	Time 0.247 (0.491)	Data Time 0.001 (0.013)	Loss 2.6612 (2.8675)	Entropy 0.64271 (0.64553)	Top-1 acc 62.500 (54.980)	Top-5 acc 78.906 (77.462)	lr 0.01821
Train [42][2810/3239]	Time 0.297 (0.491)	Data Time 0.002 (0.013)	Loss 2.7836 (2.8679)	Entropy 0.64287 (0.64552)	Top-1 acc 55.078 (54.972)	Top-5 acc 79.688 (77.457)	lr 0.01821
Train [42][2820/3239]	Time 0.341 (0.491)	Data Time 0.002 (0.013)	Loss 2.7216 (2.8676)	Entropy 0.64282 (0.64551)	Top-1 acc 57.031 (54.978)	Top-5 acc 80.078 (77.460)	lr 0.01821
Train [42][2830/3239]	Time 0.381 (0.491)	Data Time 0.002 (0.013)	Loss 2.7427 (2.8678)	Entropy 0.64272 (0.64551)	Top-1 acc 56.641 (54.973)	Top-5 acc 78.125 (77.456)	lr 0.01821
Train [42][2840/3239]	Time 0.249 (0.491)	Data Time 0.001 (0.013)	Loss 2.8736 (2.8679)	Entropy 0.64278 (0.64550)	Top-1 acc 56.641 (54.972)	Top-5 acc 79.297 (77.456)	lr 0.01821
Train [42][2850/3239]	Time 0.239 (0.491)	Data Time 0.001 (0.013)	Loss 2.6254 (2.8680)	Entropy 0.64251 (0.64549)	Top-1 acc 59.375 (54.969)	Top-5 acc 81.250 (77.452)	lr 0.01821
Train [42][2860/3239]	Time 0.284 (0.491)	Data Time 0.001 (0.013)	Loss 3.0107 (2.8681)	Entropy 0.64248 (0.64548)	Top-1 acc 48.828 (54.966)	Top-5 acc 75.781 (77.450)	lr 0.01821
Train [42][2870/3239]	Time 0.250 (0.491)	Data Time 0.001 (0.013)	Loss 2.8869 (2.8682)	Entropy 0.64231 (0.64546)	Top-1 acc 52.734 (54.967)	Top-5 acc 74.219 (77.446)	lr 0.01821
Train [42][2880/3239]	Time 0.251 (0.491)	Data Time 0.001 (0.013)	Loss 2.7405 (2.8678)	Entropy 0.64216 (0.64545)	Top-1 acc 59.766 (54.976)	Top-5 acc 80.469 (77.455)	lr 0.01821
Train [42][2890/3239]	Time 0.261 (0.491)	Data Time 0.001 (0.013)	Loss 2.8206 (2.8678)	Entropy 0.64197 (0.64544)	Top-1 acc 55.078 (54.974)	Top-5 acc 77.344 (77.456)	lr 0.01821
Train [42][2900/3239]	Time 0.387 (0.491)	Data Time 0.001 (0.013)	Loss 2.9111 (2.8677)	Entropy 0.64206 (0.64543)	Top-1 acc 53.125 (54.978)	Top-5 acc 75.391 (77.455)	lr 0.01821
Train [42][2910/3239]	Time 0.241 (0.491)	Data Time 0.001 (0.013)	Loss 2.7389 (2.8675)	Entropy 0.64237 (0.64542)	Top-1 acc 59.375 (54.980)	Top-5 acc 80.859 (77.457)	lr 0.01820
Train [42][2920/3239]	Time 0.277 (0.491)	Data Time 0.001 (0.013)	Loss 2.9803 (2.8677)	Entropy 0.64251 (0.64541)	Top-1 acc 48.828 (54.977)	Top-5 acc 76.562 (77.457)	lr 0.01820
Train [42][2930/3239]	Time 0.253 (0.491)	Data Time 0.002 (0.012)	Loss 2.8976 (2.8678)	Entropy 0.64278 (0.64540)	Top-1 acc 52.734 (54.972)	Top-5 acc 76.172 (77.453)	lr 0.01820
Train [42][2940/3239]	Time 0.243 (0.491)	Data Time 0.001 (0.012)	Loss 2.8533 (2.8678)	Entropy 0.64235 (0.64539)	Top-1 acc 54.688 (54.971)	Top-5 acc 76.562 (77.452)	lr 0.01820
Train [42][2950/3239]	Time 0.250 (0.491)	Data Time 0.002 (0.012)	Loss 2.8790 (2.8677)	Entropy 0.64254 (0.64538)	Top-1 acc 54.688 (54.971)	Top-5 acc 79.688 (77.454)	lr 0.01820
Train [42][2960/3239]	Time 0.270 (0.491)	Data Time 0.001 (0.012)	Loss 2.7508 (2.8674)	Entropy 0.64248 (0.64537)	Top-1 acc 60.156 (54.980)	Top-5 acc 78.516 (77.461)	lr 0.01820
Train [42][2970/3239]	Time 0.395 (0.491)	Data Time 0.002 (0.012)	Loss 2.6606 (2.8672)	Entropy 0.64213 (0.64536)	Top-1 acc 59.375 (54.983)	Top-5 acc 82.031 (77.464)	lr 0.01820
Train [42][2980/3239]	Time 0.274 (0.491)	Data Time 0.001 (0.012)	Loss 2.8793 (2.8673)	Entropy 0.64230 (0.64535)	Top-1 acc 52.344 (54.981)	Top-5 acc 80.469 (77.466)	lr 0.01820
Train [42][2990/3239]	Time 0.242 (0.491)	Data Time 0.001 (0.012)	Loss 2.8214 (2.8672)	Entropy 0.64250 (0.64534)	Top-1 acc 55.078 (54.982)	Top-5 acc 78.125 (77.469)	lr 0.01820
Train [42][3000/3239]	Time 0.234 (0.491)	Data Time 0.001 (0.012)	Loss 2.7962 (2.8673)	Entropy 0.64230 (0.64533)	Top-1 acc 56.250 (54.979)	Top-5 acc 80.859 (77.468)	lr 0.01820
Train [42][3010/3239]	Time 0.242 (0.491)	Data Time 0.001 (0.012)	Loss 2.8973 (2.8673)	Entropy 0.64222 (0.64532)	Top-1 acc 54.297 (54.980)	Top-5 acc 76.562 (77.468)	lr 0.01820
Train [42][3020/3239]	Time 0.249 (0.491)	Data Time 0.001 (0.012)	Loss 3.1307 (2.8675)	Entropy 0.64220 (0.64531)	Top-1 acc 51.172 (54.975)	Top-5 acc 73.047 (77.466)	lr 0.01819
Train [42][3030/3239]	Time 0.245 (0.491)	Data Time 0.003 (0.012)	Loss 2.9448 (2.8675)	Entropy 0.64214 (0.64530)	Top-1 acc 56.641 (54.975)	Top-5 acc 75.391 (77.467)	lr 0.01819
Train [42][3040/3239]	Time 0.241 (0.490)	Data Time 0.001 (0.012)	Loss 2.7932 (2.8676)	Entropy 0.64228 (0.64529)	Top-1 acc 53.906 (54.971)	Top-5 acc 78.906 (77.469)	lr 0.01819
Train [42][3050/3239]	Time 0.229 (0.490)	Data Time 0.001 (0.012)	Loss 2.7441 (2.8675)	Entropy 0.64212 (0.64528)	Top-1 acc 57.031 (54.973)	Top-5 acc 79.688 (77.470)	lr 0.01819
Train [42][3060/3239]	Time 0.362 (0.490)	Data Time 0.001 (0.012)	Loss 2.9078 (2.8676)	Entropy 0.64196 (0.64527)	Top-1 acc 52.734 (54.972)	Top-5 acc 76.172 (77.468)	lr 0.01819
Train [42][3070/3239]	Time 0.233 (0.490)	Data Time 0.001 (0.012)	Loss 2.8143 (2.8677)	Entropy 0.64191 (0.64526)	Top-1 acc 55.078 (54.969)	Top-5 acc 78.516 (77.466)	lr 0.01819
Train [42][3080/3239]	Time 0.236 (0.490)	Data Time 0.001 (0.012)	Loss 2.7865 (2.8678)	Entropy 0.64228 (0.64525)	Top-1 acc 57.812 (54.968)	Top-5 acc 81.250 (77.466)	lr 0.01819
Train [42][3090/3239]	Time 0.234 (0.490)	Data Time 0.001 (0.012)	Loss 2.9793 (2.8678)	Entropy 0.64239 (0.64524)	Top-1 acc 50.391 (54.962)	Top-5 acc 76.562 (77.464)	lr 0.01819
Train [42][3100/3239]	Time 0.241 (0.489)	Data Time 0.001 (0.012)	Loss 3.0459 (2.8679)	Entropy 0.64242 (0.64523)	Top-1 acc 50.391 (54.962)	Top-5 acc 72.266 (77.460)	lr 0.01819
Train [42][3110/3239]	Time 0.243 (0.489)	Data Time 0.001 (0.012)	Loss 2.8623 (2.8680)	Entropy 0.64232 (0.64522)	Top-1 acc 58.594 (54.959)	Top-5 acc 77.734 (77.458)	lr 0.01819
Train [42][3120/3239]	Time 0.232 (0.489)	Data Time 0.001 (0.012)	Loss 2.8548 (2.8677)	Entropy 0.64235 (0.64521)	Top-1 acc 51.953 (54.963)	Top-5 acc 78.906 (77.464)	lr 0.01819
Train [42][3130/3239]	Time 0.328 (0.489)	Data Time 0.001 (0.012)	Loss 3.0461 (2.8679)	Entropy 0.64209 (0.64520)	Top-1 acc 50.391 (54.959)	Top-5 acc 74.609 (77.459)	lr 0.01818
Train [42][3140/3239]	Time 0.251 (0.489)	Data Time 0.001 (0.012)	Loss 2.8387 (2.8682)	Entropy 0.64191 (0.64519)	Top-1 acc 53.906 (54.951)	Top-5 acc 77.344 (77.452)	lr 0.01818
Train [42][3150/3239]	Time 0.239 (0.489)	Data Time 0.001 (0.012)	Loss 2.8658 (2.8682)	Entropy 0.64184 (0.64518)	Top-1 acc 51.562 (54.951)	Top-5 acc 78.125 (77.455)	lr 0.01818
Train [42][3160/3239]	Time 0.228 (0.488)	Data Time 0.001 (0.012)	Loss 2.9926 (2.8683)	Entropy 0.64163 (0.64517)	Top-1 acc 48.828 (54.948)	Top-5 acc 77.344 (77.453)	lr 0.01818
Train [42][3170/3239]	Time 0.246 (0.488)	Data Time 0.002 (0.012)	Loss 3.0332 (2.8684)	Entropy 0.64127 (0.64516)	Top-1 acc 50.781 (54.948)	Top-5 acc 74.219 (77.452)	lr 0.01818
Train [42][3180/3239]	Time 0.236 (0.488)	Data Time 0.000 (0.012)	Loss 2.9643 (2.8686)	Entropy 0.64130 (0.64514)	Top-1 acc 50.781 (54.942)	Top-5 acc 74.219 (77.448)	lr 0.01818
Train [42][3190/3239]	Time 0.239 (0.488)	Data Time 0.000 (0.012)	Loss 2.8401 (2.8685)	Entropy 0.64095 (0.64513)	Top-1 acc 57.812 (54.945)	Top-5 acc 78.125 (77.446)	lr 0.01818
Train [42][3200/3239]	Time 0.239 (0.488)	Data Time 0.000 (0.012)	Loss 3.1397 (2.8685)	Entropy 0.64103 (0.64512)	Top-1 acc 44.922 (54.941)	Top-5 acc 75.781 (77.449)	lr 0.01818
Train [42][3210/3239]	Time 0.236 (0.487)	Data Time 0.000 (0.012)	Loss 2.8029 (2.8687)	Entropy 0.64098 (0.64511)	Top-1 acc 55.078 (54.940)	Top-5 acc 76.953 (77.441)	lr 0.01818
Train [42][3220/3239]	Time 0.258 (0.487)	Data Time 0.000 (0.012)	Loss 2.8784 (2.8688)	Entropy 0.64123 (0.64509)	Top-1 acc 52.734 (54.938)	Top-5 acc 77.344 (77.438)	lr 0.01818
Train [42][3230/3239]	Time 0.220 (0.487)	Data Time 0.000 (0.011)	Loss 2.9007 (2.8688)	Entropy 0.64148 (0.64508)	Top-1 acc 52.344 (54.935)	Top-5 acc 77.734 (77.438)	lr 0.01818
Train [42][3239/3239]	Time 0.902 (0.487)	Data Time 0.000 (0.011)	Loss 2.7874 (2.8689)	Entropy 0.64157 (0.64507)	Top-1 acc 53.086 (54.934)	Top-5 acc 82.716 (77.437)	lr 0.01817
==========Valid [42/120]	loss 1.574	top-1 acc 63.947 (63.947)	top-5 acc 85.065	Train top-1 54.934	top-5 77.437	Entropy 0.64157	Latency-None: 0.000ms	Flops: 539.76M
Train [43][0/3239]	Time 35.679 (35.679)	Data Time 33.793 (33.793)	Loss 3.0023 (3.0023)	Entropy 0.64177 (0.64177)	Top-1 acc 52.344 (52.344)	Top-5 acc 76.562 (76.562)	lr 0.01817
Train [43][10/3239]	Time 0.283 (3.787)	Data Time 0.002 (3.080)	Loss 2.8898 (2.9284)	Entropy 0.64197 (0.64177)	Top-1 acc 53.906 (52.344)	Top-5 acc 79.688 (76.634)	lr 0.01817
Train [43][20/3239]	Time 0.256 (2.198)	Data Time 0.001 (1.614)	Loss 2.7583 (2.9031)	Entropy 0.64218 (0.64190)	Top-1 acc 58.203 (53.925)	Top-5 acc 78.125 (76.972)	lr 0.01817
Train [43][30/3239]	Time 0.430 (1.646)	Data Time 0.002 (1.094)	Loss 2.7344 (2.8814)	Entropy 0.64208 (0.64196)	Top-1 acc 58.203 (54.700)	Top-5 acc 78.906 (77.331)	lr 0.01817
Train [43][40/3239]	Time 0.278 (1.354)	Data Time 0.002 (0.828)	Loss 2.8644 (2.8624)	Entropy 0.64189 (0.64194)	Top-1 acc 55.859 (55.145)	Top-5 acc 75.781 (77.458)	lr 0.01817
Train [43][50/3239]	Time 0.259 (1.182)	Data Time 0.001 (0.666)	Loss 2.6753 (2.8490)	Entropy 0.64206 (0.64194)	Top-1 acc 57.031 (55.400)	Top-5 acc 78.125 (77.642)	lr 0.01817
Train [43][60/3239]	Time 0.250 (1.068)	Data Time 0.002 (0.558)	Loss 2.6756 (2.8461)	Entropy 0.64218 (0.64197)	Top-1 acc 58.594 (55.507)	Top-5 acc 81.250 (77.766)	lr 0.01817
Train [43][70/3239]	Time 0.224 (0.981)	Data Time 0.001 (0.479)	Loss 2.7596 (2.8438)	Entropy 0.64188 (0.64200)	Top-1 acc 53.906 (55.546)	Top-5 acc 80.859 (77.899)	lr 0.01817
Train [43][80/3239]	Time 0.250 (0.914)	Data Time 0.001 (0.420)	Loss 2.8084 (2.8475)	Entropy 0.64174 (0.64198)	Top-1 acc 56.641 (55.498)	Top-5 acc 78.906 (77.816)	lr 0.01817
Train [43][90/3239]	Time 0.248 (0.862)	Data Time 0.001 (0.374)	Loss 2.9069 (2.8510)	Entropy 0.64157 (0.64195)	Top-1 acc 53.906 (55.529)	Top-5 acc 73.438 (77.661)	lr 0.01817
Train [43][100/3239]	Time 0.282 (0.824)	Data Time 0.001 (0.337)	Loss 2.7342 (2.8481)	Entropy 0.64130 (0.64191)	Top-1 acc 59.766 (55.635)	Top-5 acc 80.469 (77.734)	lr 0.01817
Train [43][110/3239]	Time 0.249 (0.789)	Data Time 0.001 (0.307)	Loss 2.7563 (2.8421)	Entropy 0.64114 (0.64184)	Top-1 acc 55.469 (55.828)	Top-5 acc 80.859 (77.903)	lr 0.01816
Train [43][120/3239]	Time 0.375 (0.762)	Data Time 0.001 (0.282)	Loss 2.8934 (2.8434)	Entropy 0.64104 (0.64178)	Top-1 acc 53.906 (55.834)	Top-5 acc 80.078 (77.844)	lr 0.01816
Train [43][130/3239]	Time 0.487 (1.011)	Data Time 0.006 (0.261)	Loss 2.8420 (2.8452)	Entropy 0.64060 (0.64172)	Top-1 acc 58.594 (55.809)	Top-5 acc 77.344 (77.836)	lr 0.01816
Train [43][140/3239]	Time 0.292 (0.982)	Data Time 0.002 (0.242)	Loss 2.9025 (2.8451)	Entropy 0.64071 (0.64164)	Top-1 acc 52.734 (55.740)	Top-5 acc 76.953 (77.809)	lr 0.01816
Train [43][150/3239]	Time 0.250 (0.948)	Data Time 0.002 (0.226)	Loss 2.8201 (2.8445)	Entropy 0.64038 (0.64157)	Top-1 acc 52.734 (55.715)	Top-5 acc 78.125 (77.833)	lr 0.01816
Train [43][160/3239]	Time 0.254 (0.918)	Data Time 0.002 (0.213)	Loss 2.8866 (2.8493)	Entropy 0.64020 (0.64149)	Top-1 acc 54.688 (55.539)	Top-5 acc 74.609 (77.744)	lr 0.01816
Train [43][170/3239]	Time 0.297 (0.891)	Data Time 0.003 (0.200)	Loss 2.9291 (2.8517)	Entropy 0.63998 (0.64140)	Top-1 acc 51.953 (55.505)	Top-5 acc 76.172 (77.718)	lr 0.01816
Train [43][180/3239]	Time 0.249 (0.867)	Data Time 0.002 (0.189)	Loss 2.6922 (2.8503)	Entropy 0.63984 (0.64132)	Top-1 acc 58.203 (55.490)	Top-5 acc 81.250 (77.747)	lr 0.01816
Train [43][190/3239]	Time 0.375 (0.845)	Data Time 0.001 (0.180)	Loss 2.8547 (2.8497)	Entropy 0.63985 (0.64124)	Top-1 acc 55.469 (55.463)	Top-5 acc 76.562 (77.745)	lr 0.01816
Train [43][200/3239]	Time 0.303 (0.826)	Data Time 0.002 (0.171)	Loss 2.6821 (2.8482)	Entropy 0.63941 (0.64116)	Top-1 acc 61.328 (55.488)	Top-5 acc 77.734 (77.750)	lr 0.01816
Train [43][210/3239]	Time 0.272 (0.809)	Data Time 0.001 (0.163)	Loss 3.0920 (2.8514)	Entropy 0.63969 (0.64108)	Top-1 acc 48.438 (55.432)	Top-5 acc 71.875 (77.705)	lr 0.01816
Train [43][220/3239]	Time 0.240 (0.793)	Data Time 0.001 (0.156)	Loss 2.8280 (2.8526)	Entropy 0.63973 (0.64102)	Top-1 acc 53.906 (55.439)	Top-5 acc 78.516 (77.729)	lr 0.01816
Train [43][230/3239]	Time 0.254 (0.779)	Data Time 0.001 (0.149)	Loss 2.9450 (2.8533)	Entropy 0.63995 (0.64097)	Top-1 acc 51.953 (55.426)	Top-5 acc 73.828 (77.701)	lr 0.01815
Train [43][240/3239]	Time 0.267 (0.767)	Data Time 0.001 (0.143)	Loss 2.6929 (2.8523)	Entropy 0.64031 (0.64093)	Top-1 acc 59.375 (55.456)	Top-5 acc 80.078 (77.744)	lr 0.01815
Train [43][250/3239]	Time 0.308 (0.755)	Data Time 0.002 (0.137)	Loss 3.1527 (2.8567)	Entropy 0.64040 (0.64091)	Top-1 acc 48.047 (55.332)	Top-5 acc 71.875 (77.706)	lr 0.01815
Train [43][260/3239]	Time 0.273 (0.743)	Data Time 0.001 (0.132)	Loss 2.5607 (2.8540)	Entropy 0.64014 (0.64088)	Top-1 acc 60.938 (55.389)	Top-5 acc 85.547 (77.772)	lr 0.01815
Train [43][270/3239]	Time 0.239 (0.733)	Data Time 0.001 (0.127)	Loss 2.9134 (2.8531)	Entropy 0.64006 (0.64086)	Top-1 acc 56.250 (55.427)	Top-5 acc 75.781 (77.769)	lr 0.01815
Train [43][280/3239]	Time 0.401 (0.724)	Data Time 0.001 (0.123)	Loss 2.7336 (2.8514)	Entropy 0.64010 (0.64083)	Top-1 acc 59.766 (55.488)	Top-5 acc 82.031 (77.789)	lr 0.01815
Train [43][290/3239]	Time 0.294 (0.715)	Data Time 0.002 (0.119)	Loss 2.7327 (2.8525)	Entropy 0.64033 (0.64081)	Top-1 acc 60.547 (55.478)	Top-5 acc 80.078 (77.793)	lr 0.01815
Train [43][300/3239]	Time 0.235 (0.706)	Data Time 0.001 (0.115)	Loss 2.6112 (2.8497)	Entropy 0.64048 (0.64080)	Top-1 acc 58.203 (55.508)	Top-5 acc 82.031 (77.842)	lr 0.01815
Train [43][310/3239]	Time 0.243 (0.698)	Data Time 0.001 (0.111)	Loss 2.9018 (2.8497)	Entropy 0.64060 (0.64079)	Top-1 acc 56.250 (55.516)	Top-5 acc 78.516 (77.850)	lr 0.01815
Train [43][320/3239]	Time 0.251 (0.690)	Data Time 0.001 (0.108)	Loss 2.6716 (2.8487)	Entropy 0.64061 (0.64078)	Top-1 acc 60.156 (55.577)	Top-5 acc 81.641 (77.856)	lr 0.01815
Train [43][330/3239]	Time 0.249 (0.682)	Data Time 0.001 (0.104)	Loss 3.2859 (2.8485)	Entropy 0.64045 (0.64078)	Top-1 acc 41.406 (55.555)	Top-5 acc 73.047 (77.875)	lr 0.01815
Train [43][340/3239]	Time 0.282 (0.675)	Data Time 0.001 (0.101)	Loss 2.9888 (2.8503)	Entropy 0.64078 (0.64077)	Top-1 acc 48.438 (55.485)	Top-5 acc 74.219 (77.859)	lr 0.01814
Train [43][350/3239]	Time 0.339 (0.668)	Data Time 0.001 (0.099)	Loss 2.8561 (2.8513)	Entropy 0.64013 (0.64076)	Top-1 acc 55.469 (55.455)	Top-5 acc 74.609 (77.829)	lr 0.01814
Train [43][360/3239]	Time 0.229 (0.662)	Data Time 0.001 (0.096)	Loss 2.6323 (2.8507)	Entropy 0.63977 (0.64074)	Top-1 acc 55.078 (55.450)	Top-5 acc 82.031 (77.843)	lr 0.01814
Train [43][370/3239]	Time 0.238 (0.656)	Data Time 0.002 (0.093)	Loss 2.9403 (2.8523)	Entropy 0.63976 (0.64072)	Top-1 acc 53.906 (55.428)	Top-5 acc 76.953 (77.799)	lr 0.01814
Train [43][380/3239]	Time 0.268 (0.651)	Data Time 0.001 (0.091)	Loss 2.9544 (2.8532)	Entropy 0.63936 (0.64069)	Top-1 acc 52.344 (55.435)	Top-5 acc 76.172 (77.785)	lr 0.01814
Train [43][390/3239]	Time 0.250 (0.645)	Data Time 0.001 (0.089)	Loss 3.0286 (2.8570)	Entropy 0.63974 (0.64066)	Top-1 acc 53.906 (55.381)	Top-5 acc 72.656 (77.678)	lr 0.01814
Train [43][400/3239]	Time 0.233 (0.640)	Data Time 0.001 (0.086)	Loss 3.1297 (2.8577)	Entropy 0.63961 (0.64063)	Top-1 acc 48.438 (55.341)	Top-5 acc 72.266 (77.687)	lr 0.01814
Train [43][410/3239]	Time 0.240 (0.635)	Data Time 0.001 (0.084)	Loss 2.7164 (2.8575)	Entropy 0.63935 (0.64061)	Top-1 acc 57.031 (55.334)	Top-5 acc 80.078 (77.705)	lr 0.01814
Train [43][420/3239]	Time 0.256 (0.631)	Data Time 0.001 (0.082)	Loss 2.7533 (2.8565)	Entropy 0.63899 (0.64057)	Top-1 acc 57.031 (55.360)	Top-5 acc 80.078 (77.724)	lr 0.01814
Train [43][430/3239]	Time 0.277 (0.627)	Data Time 0.002 (0.081)	Loss 2.9745 (2.8579)	Entropy 0.63910 (0.64053)	Top-1 acc 52.344 (55.327)	Top-5 acc 75.391 (77.694)	lr 0.01814
Train [43][440/3239]	Time 0.288 (0.623)	Data Time 0.001 (0.079)	Loss 2.9835 (2.8589)	Entropy 0.63893 (0.64050)	Top-1 acc 51.172 (55.275)	Top-5 acc 73.828 (77.665)	lr 0.01814
Train [43][450/3239]	Time 0.243 (0.619)	Data Time 0.001 (0.077)	Loss 2.7666 (2.8566)	Entropy 0.63913 (0.64046)	Top-1 acc 56.641 (55.345)	Top-5 acc 78.516 (77.727)	lr 0.01813
Train [43][460/3239]	Time 0.263 (0.615)	Data Time 0.001 (0.075)	Loss 2.7336 (2.8564)	Entropy 0.63880 (0.64043)	Top-1 acc 55.078 (55.347)	Top-5 acc 78.125 (77.729)	lr 0.01813
Train [43][470/3239]	Time 0.234 (0.611)	Data Time 0.001 (0.074)	Loss 2.7896 (2.8575)	Entropy 0.63907 (0.64040)	Top-1 acc 54.688 (55.306)	Top-5 acc 78.906 (77.716)	lr 0.01813
Train [43][480/3239]	Time 0.235 (0.607)	Data Time 0.001 (0.072)	Loss 2.9669 (2.8567)	Entropy 0.63889 (0.64037)	Top-1 acc 54.688 (55.296)	Top-5 acc 75.391 (77.726)	lr 0.01813
Train [43][490/3239]	Time 0.250 (0.604)	Data Time 0.001 (0.071)	Loss 3.1160 (2.8578)	Entropy 0.63854 (0.64033)	Top-1 acc 48.438 (55.271)	Top-5 acc 71.484 (77.701)	lr 0.01813
Train [43][500/3239]	Time 0.246 (0.601)	Data Time 0.002 (0.070)	Loss 2.6229 (2.8574)	Entropy 0.63865 (0.64030)	Top-1 acc 57.812 (55.270)	Top-5 acc 82.422 (77.701)	lr 0.01813
Train [43][510/3239]	Time 0.378 (0.598)	Data Time 0.001 (0.068)	Loss 2.7636 (2.8562)	Entropy 0.63862 (0.64026)	Top-1 acc 55.078 (55.272)	Top-5 acc 77.734 (77.717)	lr 0.01813
Train [43][520/3239]	Time 0.240 (0.594)	Data Time 0.001 (0.067)	Loss 2.7631 (2.8567)	Entropy 0.63835 (0.64023)	Top-1 acc 61.719 (55.271)	Top-5 acc 76.562 (77.705)	lr 0.01813
Train [43][530/3239]	Time 0.256 (0.591)	Data Time 0.001 (0.066)	Loss 2.8407 (2.8565)	Entropy 0.63816 (0.64019)	Top-1 acc 56.641 (55.259)	Top-5 acc 77.344 (77.705)	lr 0.01813
Train [43][540/3239]	Time 0.271 (0.588)	Data Time 0.001 (0.065)	Loss 2.7733 (2.8557)	Entropy 0.63797 (0.64015)	Top-1 acc 58.203 (55.274)	Top-5 acc 80.078 (77.718)	lr 0.01813
Train [43][550/3239]	Time 0.259 (0.585)	Data Time 0.001 (0.063)	Loss 2.7437 (2.8563)	Entropy 0.63759 (0.64011)	Top-1 acc 55.859 (55.239)	Top-5 acc 78.906 (77.718)	lr 0.01813
Train [43][560/3239]	Time 0.239 (0.583)	Data Time 0.001 (0.062)	Loss 2.7276 (2.8544)	Entropy 0.63722 (0.64006)	Top-1 acc 55.469 (55.273)	Top-5 acc 76.172 (77.750)	lr 0.01812
Train [43][570/3239]	Time 0.222 (0.580)	Data Time 0.001 (0.061)	Loss 2.8289 (2.8548)	Entropy 0.63712 (0.64001)	Top-1 acc 55.469 (55.264)	Top-5 acc 77.344 (77.731)	lr 0.01812
Train [43][580/3239]	Time 0.351 (0.578)	Data Time 0.001 (0.060)	Loss 2.8432 (2.8554)	Entropy 0.63715 (0.63997)	Top-1 acc 57.422 (55.254)	Top-5 acc 78.125 (77.708)	lr 0.01812
Train [43][590/3239]	Time 0.218 (0.576)	Data Time 0.001 (0.059)	Loss 2.9807 (2.8551)	Entropy 0.63673 (0.63992)	Top-1 acc 52.344 (55.257)	Top-5 acc 73.828 (77.733)	lr 0.01812
Train [43][600/3239]	Time 0.257 (0.573)	Data Time 0.001 (0.058)	Loss 2.7626 (2.8553)	Entropy 0.63707 (0.63987)	Top-1 acc 59.375 (55.261)	Top-5 acc 78.516 (77.721)	lr 0.01812
Train [43][610/3239]	Time 0.293 (0.571)	Data Time 0.002 (0.057)	Loss 3.0036 (2.8546)	Entropy 0.63701 (0.63982)	Top-1 acc 48.828 (55.254)	Top-5 acc 73.438 (77.731)	lr 0.01812
Train [43][620/3239]	Time 0.246 (0.569)	Data Time 0.001 (0.056)	Loss 2.8792 (2.8543)	Entropy 0.63694 (0.63977)	Top-1 acc 54.688 (55.263)	Top-5 acc 79.297 (77.747)	lr 0.01812
Train [43][630/3239]	Time 0.218 (0.567)	Data Time 0.001 (0.056)	Loss 3.2795 (2.8556)	Entropy 0.63721 (0.63973)	Top-1 acc 48.047 (55.226)	Top-5 acc 69.922 (77.702)	lr 0.01812
Train [43][640/3239]	Time 0.240 (0.565)	Data Time 0.001 (0.055)	Loss 2.9282 (2.8562)	Entropy 0.63746 (0.63969)	Top-1 acc 55.859 (55.229)	Top-5 acc 77.734 (77.687)	lr 0.01812
Train [43][650/3239]	Time 0.229 (0.563)	Data Time 0.001 (0.054)	Loss 2.7126 (2.8550)	Entropy 0.63751 (0.63966)	Top-1 acc 58.594 (55.262)	Top-5 acc 79.688 (77.698)	lr 0.01812
Train [43][660/3239]	Time 0.251 (0.561)	Data Time 0.001 (0.053)	Loss 2.5896 (2.8547)	Entropy 0.63715 (0.63962)	Top-1 acc 61.719 (55.266)	Top-5 acc 82.031 (77.701)	lr 0.01812
Train [43][670/3239]	Time 0.408 (0.559)	Data Time 0.001 (0.052)	Loss 2.8534 (2.8552)	Entropy 0.63731 (0.63959)	Top-1 acc 55.469 (55.245)	Top-5 acc 77.734 (77.697)	lr 0.01811
Train [43][680/3239]	Time 0.228 (0.557)	Data Time 0.001 (0.052)	Loss 2.7711 (2.8546)	Entropy 0.63736 (0.63955)	Top-1 acc 59.766 (55.243)	Top-5 acc 79.688 (77.701)	lr 0.01811
Train [43][690/3239]	Time 0.259 (0.555)	Data Time 0.001 (0.051)	Loss 2.8067 (2.8543)	Entropy 0.63722 (0.63952)	Top-1 acc 54.297 (55.236)	Top-5 acc 79.297 (77.704)	lr 0.01811
Train [43][700/3239]	Time 0.268 (0.553)	Data Time 0.002 (0.050)	Loss 2.9326 (2.8540)	Entropy 0.63734 (0.63949)	Top-1 acc 51.562 (55.249)	Top-5 acc 75.781 (77.709)	lr 0.01811
Train [43][710/3239]	Time 0.234 (0.552)	Data Time 0.001 (0.050)	Loss 2.7270 (2.8537)	Entropy 0.63749 (0.63946)	Top-1 acc 58.594 (55.269)	Top-5 acc 81.250 (77.706)	lr 0.01811
Train [43][720/3239]	Time 0.233 (0.550)	Data Time 0.001 (0.049)	Loss 2.8093 (2.8543)	Entropy 0.63777 (0.63943)	Top-1 acc 52.734 (55.250)	Top-5 acc 81.250 (77.703)	lr 0.01811
Train [43][730/3239]	Time 0.234 (0.548)	Data Time 0.001 (0.048)	Loss 3.0174 (2.8542)	Entropy 0.63783 (0.63941)	Top-1 acc 48.438 (55.243)	Top-5 acc 75.391 (77.708)	lr 0.01811
Train [43][740/3239]	Time 0.322 (0.546)	Data Time 0.001 (0.048)	Loss 2.8753 (2.8543)	Entropy 0.63814 (0.63939)	Top-1 acc 55.469 (55.240)	Top-5 acc 76.953 (77.708)	lr 0.01811
Train [43][750/3239]	Time 0.243 (0.545)	Data Time 0.001 (0.047)	Loss 2.6773 (2.8535)	Entropy 0.63842 (0.63937)	Top-1 acc 63.672 (55.271)	Top-5 acc 81.250 (77.732)	lr 0.01811
Train [43][760/3239]	Time 0.235 (0.543)	Data Time 0.002 (0.046)	Loss 2.8486 (2.8535)	Entropy 0.63857 (0.63936)	Top-1 acc 58.203 (55.275)	Top-5 acc 75.781 (77.728)	lr 0.01811
Train [43][770/3239]	Time 0.345 (0.543)	Data Time 0.001 (0.046)	Loss 2.8132 (2.8542)	Entropy 0.63866 (0.63935)	Top-1 acc 56.250 (55.263)	Top-5 acc 79.297 (77.715)	lr 0.01811
Train [43][780/3239]	Time 0.236 (0.542)	Data Time 0.001 (0.045)	Loss 2.7774 (2.8537)	Entropy 0.63904 (0.63935)	Top-1 acc 55.859 (55.272)	Top-5 acc 76.953 (77.724)	lr 0.01810
Train [43][790/3239]	Time 0.245 (0.585)	Data Time 0.002 (0.045)	Loss 2.5738 (2.8523)	Entropy 0.63866 (0.63934)	Top-1 acc 57.812 (55.304)	Top-5 acc 83.984 (77.751)	lr 0.01810
Train [43][800/3239]	Time 0.242 (0.583)	Data Time 0.002 (0.044)	Loss 2.8992 (2.8530)	Entropy 0.63891 (0.63933)	Top-1 acc 56.250 (55.303)	Top-5 acc 78.516 (77.749)	lr 0.01810
Train [43][810/3239]	Time 0.249 (0.581)	Data Time 0.002 (0.044)	Loss 2.8876 (2.8533)	Entropy 0.63866 (0.63933)	Top-1 acc 56.641 (55.299)	Top-5 acc 73.438 (77.731)	lr 0.01810
Train [43][820/3239]	Time 0.241 (0.579)	Data Time 0.001 (0.043)	Loss 2.9136 (2.8535)	Entropy 0.63878 (0.63932)	Top-1 acc 54.297 (55.286)	Top-5 acc 77.734 (77.725)	lr 0.01810
Train [43][830/3239]	Time 0.341 (0.577)	Data Time 0.001 (0.043)	Loss 2.8862 (2.8534)	Entropy 0.63876 (0.63931)	Top-1 acc 51.953 (55.287)	Top-5 acc 76.562 (77.727)	lr 0.01810
Train [43][840/3239]	Time 0.238 (0.575)	Data Time 0.001 (0.042)	Loss 2.8766 (2.8529)	Entropy 0.63828 (0.63930)	Top-1 acc 55.859 (55.308)	Top-5 acc 76.562 (77.739)	lr 0.01810
Train [43][850/3239]	Time 0.239 (0.574)	Data Time 0.001 (0.042)	Loss 2.9132 (2.8535)	Entropy 0.63806 (0.63929)	Top-1 acc 52.344 (55.287)	Top-5 acc 76.172 (77.723)	lr 0.01810
Train [43][860/3239]	Time 0.230 (0.573)	Data Time 0.001 (0.041)	Loss 2.8050 (2.8526)	Entropy 0.63802 (0.63928)	Top-1 acc 55.859 (55.315)	Top-5 acc 80.469 (77.737)	lr 0.01810
Train [43][870/3239]	Time 0.236 (0.571)	Data Time 0.001 (0.041)	Loss 2.8759 (2.8525)	Entropy 0.63786 (0.63926)	Top-1 acc 51.953 (55.311)	Top-5 acc 76.953 (77.741)	lr 0.01810
Train [43][880/3239]	Time 0.239 (0.569)	Data Time 0.002 (0.040)	Loss 2.8464 (2.8517)	Entropy 0.63794 (0.63925)	Top-1 acc 56.641 (55.331)	Top-5 acc 78.516 (77.757)	lr 0.01810
Train [43][890/3239]	Time 0.219 (0.568)	Data Time 0.001 (0.040)	Loss 2.7928 (2.8513)	Entropy 0.63787 (0.63923)	Top-1 acc 57.812 (55.349)	Top-5 acc 78.125 (77.758)	lr 0.01809
Train [43][900/3239]	Time 0.343 (0.566)	Data Time 0.001 (0.039)	Loss 2.9182 (2.8502)	Entropy 0.63766 (0.63921)	Top-1 acc 51.172 (55.365)	Top-5 acc 76.953 (77.765)	lr 0.01809
Train [43][910/3239]	Time 0.232 (0.564)	Data Time 0.001 (0.039)	Loss 2.9187 (2.8507)	Entropy 0.63787 (0.63920)	Top-1 acc 53.516 (55.358)	Top-5 acc 76.953 (77.764)	lr 0.01809
Train [43][920/3239]	Time 0.246 (0.563)	Data Time 0.001 (0.039)	Loss 2.8359 (2.8515)	Entropy 0.63817 (0.63918)	Top-1 acc 54.297 (55.332)	Top-5 acc 77.344 (77.744)	lr 0.01809
Train [43][930/3239]	Time 0.267 (0.562)	Data Time 0.001 (0.038)	Loss 2.8521 (2.8516)	Entropy 0.63820 (0.63917)	Top-1 acc 58.203 (55.342)	Top-5 acc 80.078 (77.744)	lr 0.01809
Train [43][940/3239]	Time 0.234 (0.561)	Data Time 0.001 (0.038)	Loss 2.9289 (2.8517)	Entropy 0.63843 (0.63916)	Top-1 acc 53.516 (55.345)	Top-5 acc 75.781 (77.739)	lr 0.01809
Train [43][950/3239]	Time 0.234 (0.559)	Data Time 0.001 (0.037)	Loss 2.8089 (2.8518)	Entropy 0.63860 (0.63916)	Top-1 acc 56.250 (55.347)	Top-5 acc 78.125 (77.744)	lr 0.01809
Train [43][960/3239]	Time 0.269 (0.558)	Data Time 0.001 (0.037)	Loss 2.8387 (2.8517)	Entropy 0.63855 (0.63915)	Top-1 acc 56.641 (55.353)	Top-5 acc 76.953 (77.743)	lr 0.01809
Train [43][970/3239]	Time 0.268 (0.557)	Data Time 0.002 (0.037)	Loss 2.7198 (2.8513)	Entropy 0.63867 (0.63914)	Top-1 acc 57.422 (55.358)	Top-5 acc 78.906 (77.742)	lr 0.01809
Train [43][980/3239]	Time 0.236 (0.556)	Data Time 0.001 (0.036)	Loss 2.7710 (2.8514)	Entropy 0.63874 (0.63914)	Top-1 acc 58.203 (55.365)	Top-5 acc 79.297 (77.750)	lr 0.01809
Train [43][990/3239]	Time 0.352 (0.555)	Data Time 0.001 (0.036)	Loss 2.7792 (2.8519)	Entropy 0.63887 (0.63914)	Top-1 acc 61.328 (55.360)	Top-5 acc 78.516 (77.741)	lr 0.01809
Train [43][1000/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.036)	Loss 2.7684 (2.8518)	Entropy 0.63919 (0.63913)	Top-1 acc 55.859 (55.367)	Top-5 acc 78.906 (77.744)	lr 0.01808
Train [43][1010/3239]	Time 0.233 (0.552)	Data Time 0.001 (0.035)	Loss 2.7381 (2.8519)	Entropy 0.63946 (0.63914)	Top-1 acc 59.375 (55.367)	Top-5 acc 78.906 (77.739)	lr 0.01808
Train [43][1020/3239]	Time 0.242 (0.551)	Data Time 0.001 (0.035)	Loss 2.8900 (2.8520)	Entropy 0.63942 (0.63914)	Top-1 acc 55.469 (55.370)	Top-5 acc 77.344 (77.745)	lr 0.01808
Train [43][1030/3239]	Time 0.238 (0.550)	Data Time 0.001 (0.035)	Loss 2.8536 (2.8529)	Entropy 0.63959 (0.63914)	Top-1 acc 58.594 (55.355)	Top-5 acc 80.078 (77.731)	lr 0.01808
Train [43][1040/3239]	Time 0.248 (0.548)	Data Time 0.001 (0.034)	Loss 2.7966 (2.8527)	Entropy 0.63961 (0.63915)	Top-1 acc 53.516 (55.363)	Top-5 acc 79.297 (77.735)	lr 0.01808
Train [43][1050/3239]	Time 0.254 (0.547)	Data Time 0.001 (0.034)	Loss 2.9858 (2.8529)	Entropy 0.64001 (0.63915)	Top-1 acc 53.906 (55.348)	Top-5 acc 76.953 (77.731)	lr 0.01808
Train [43][1060/3239]	Time 0.330 (0.546)	Data Time 0.001 (0.034)	Loss 3.0099 (2.8529)	Entropy 0.64010 (0.63916)	Top-1 acc 50.391 (55.343)	Top-5 acc 75.391 (77.724)	lr 0.01808
Train [43][1070/3239]	Time 0.234 (0.545)	Data Time 0.001 (0.033)	Loss 2.8728 (2.8531)	Entropy 0.64011 (0.63917)	Top-1 acc 51.953 (55.331)	Top-5 acc 76.172 (77.715)	lr 0.01808
Train [43][1080/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.033)	Loss 3.0001 (2.8533)	Entropy 0.64015 (0.63918)	Top-1 acc 50.391 (55.323)	Top-5 acc 77.344 (77.712)	lr 0.01808
Train [43][1090/3239]	Time 0.248 (0.543)	Data Time 0.002 (0.033)	Loss 2.7551 (2.8530)	Entropy 0.64039 (0.63919)	Top-1 acc 57.031 (55.329)	Top-5 acc 76.562 (77.717)	lr 0.01808
Train [43][1100/3239]	Time 0.206 (0.542)	Data Time 0.001 (0.033)	Loss 3.3273 (2.8534)	Entropy 0.64043 (0.63920)	Top-1 acc 44.531 (55.315)	Top-5 acc 66.797 (77.707)	lr 0.01808
Train [43][1110/3239]	Time 0.296 (0.541)	Data Time 0.038 (0.032)	Loss 2.9660 (2.8528)	Entropy 0.64041 (0.63921)	Top-1 acc 52.344 (55.324)	Top-5 acc 73.438 (77.722)	lr 0.01807
Train [43][1120/3239]	Time 0.248 (0.540)	Data Time 0.001 (0.032)	Loss 2.7966 (2.8525)	Entropy 0.64035 (0.63922)	Top-1 acc 57.422 (55.335)	Top-5 acc 78.906 (77.730)	lr 0.01807
Train [43][1130/3239]	Time 0.228 (0.539)	Data Time 0.001 (0.032)	Loss 2.9742 (2.8528)	Entropy 0.63978 (0.63923)	Top-1 acc 50.000 (55.327)	Top-5 acc 76.562 (77.728)	lr 0.01807
Train [43][1140/3239]	Time 0.231 (0.538)	Data Time 0.001 (0.032)	Loss 2.9806 (2.8532)	Entropy 0.63958 (0.63923)	Top-1 acc 53.906 (55.319)	Top-5 acc 76.172 (77.719)	lr 0.01807
Train [43][1150/3239]	Time 0.286 (0.537)	Data Time 0.001 (0.031)	Loss 2.8381 (2.8527)	Entropy 0.63955 (0.63924)	Top-1 acc 57.422 (55.335)	Top-5 acc 74.609 (77.725)	lr 0.01807
Train [43][1160/3239]	Time 0.230 (0.536)	Data Time 0.001 (0.031)	Loss 2.9763 (2.8529)	Entropy 0.63919 (0.63924)	Top-1 acc 53.125 (55.329)	Top-5 acc 75.781 (77.719)	lr 0.01807
Train [43][1170/3239]	Time 0.225 (0.535)	Data Time 0.001 (0.031)	Loss 2.7351 (2.8528)	Entropy 0.63919 (0.63924)	Top-1 acc 60.156 (55.328)	Top-5 acc 79.297 (77.719)	lr 0.01807
Train [43][1180/3239]	Time 0.239 (0.534)	Data Time 0.001 (0.031)	Loss 2.9791 (2.8530)	Entropy 0.63933 (0.63924)	Top-1 acc 50.000 (55.324)	Top-5 acc 75.781 (77.720)	lr 0.01807
Train [43][1190/3239]	Time 0.229 (0.532)	Data Time 0.001 (0.030)	Loss 3.1558 (2.8530)	Entropy 0.63947 (0.63924)	Top-1 acc 49.609 (55.326)	Top-5 acc 71.875 (77.722)	lr 0.01807
Train [43][1200/3239]	Time 0.243 (0.532)	Data Time 0.001 (0.030)	Loss 2.6800 (2.8533)	Entropy 0.63941 (0.63924)	Top-1 acc 58.594 (55.319)	Top-5 acc 81.641 (77.716)	lr 0.01807
Train [43][1210/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.030)	Loss 2.7271 (2.8530)	Entropy 0.63963 (0.63924)	Top-1 acc 59.375 (55.319)	Top-5 acc 80.859 (77.726)	lr 0.01807
Train [43][1220/3239]	Time 0.336 (0.530)	Data Time 0.001 (0.030)	Loss 2.8648 (2.8533)	Entropy 0.63971 (0.63925)	Top-1 acc 53.906 (55.310)	Top-5 acc 77.734 (77.721)	lr 0.01806
Train [43][1230/3239]	Time 0.243 (0.529)	Data Time 0.001 (0.029)	Loss 3.1484 (2.8530)	Entropy 0.63977 (0.63925)	Top-1 acc 50.781 (55.321)	Top-5 acc 72.656 (77.730)	lr 0.01806
Train [43][1240/3239]	Time 0.225 (0.528)	Data Time 0.001 (0.029)	Loss 2.8472 (2.8526)	Entropy 0.63970 (0.63926)	Top-1 acc 56.641 (55.330)	Top-5 acc 76.172 (77.737)	lr 0.01806
Train [43][1250/3239]	Time 0.225 (0.527)	Data Time 0.001 (0.029)	Loss 3.0265 (2.8526)	Entropy 0.63971 (0.63926)	Top-1 acc 52.344 (55.331)	Top-5 acc 74.219 (77.739)	lr 0.01806
Train [43][1260/3239]	Time 0.235 (0.526)	Data Time 0.001 (0.029)	Loss 2.8031 (2.8526)	Entropy 0.63951 (0.63926)	Top-1 acc 55.469 (55.337)	Top-5 acc 78.125 (77.742)	lr 0.01806
Train [43][1270/3239]	Time 0.251 (0.525)	Data Time 0.001 (0.029)	Loss 2.7010 (2.8524)	Entropy 0.63931 (0.63926)	Top-1 acc 58.203 (55.342)	Top-5 acc 79.688 (77.740)	lr 0.01806
Train [43][1280/3239]	Time 0.230 (0.524)	Data Time 0.001 (0.028)	Loss 2.7682 (2.8522)	Entropy 0.63930 (0.63926)	Top-1 acc 57.422 (55.342)	Top-5 acc 79.688 (77.745)	lr 0.01806
Train [43][1290/3239]	Time 0.342 (0.523)	Data Time 0.001 (0.028)	Loss 2.8040 (2.8526)	Entropy 0.63925 (0.63927)	Top-1 acc 57.422 (55.331)	Top-5 acc 78.516 (77.744)	lr 0.01806
Train [43][1300/3239]	Time 0.235 (0.522)	Data Time 0.001 (0.028)	Loss 2.8215 (2.8522)	Entropy 0.63980 (0.63927)	Top-1 acc 55.859 (55.335)	Top-5 acc 77.344 (77.748)	lr 0.01806
Train [43][1310/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.028)	Loss 2.7450 (2.8524)	Entropy 0.63941 (0.63927)	Top-1 acc 58.594 (55.331)	Top-5 acc 78.516 (77.744)	lr 0.01806
Train [43][1320/3239]	Time 0.227 (0.520)	Data Time 0.001 (0.027)	Loss 2.8493 (2.8527)	Entropy 0.63923 (0.63927)	Top-1 acc 55.469 (55.321)	Top-5 acc 76.172 (77.742)	lr 0.01806
Train [43][1330/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.027)	Loss 2.9812 (2.8521)	Entropy 0.63920 (0.63927)	Top-1 acc 50.781 (55.336)	Top-5 acc 75.781 (77.754)	lr 0.01805
Train [43][1340/3239]	Time 0.236 (0.519)	Data Time 0.001 (0.027)	Loss 2.8768 (2.8524)	Entropy 0.63919 (0.63927)	Top-1 acc 54.688 (55.333)	Top-5 acc 78.125 (77.748)	lr 0.01805
Train [43][1350/3239]	Time 0.226 (0.518)	Data Time 0.001 (0.027)	Loss 2.8637 (2.8524)	Entropy 0.63944 (0.63927)	Top-1 acc 50.391 (55.326)	Top-5 acc 77.344 (77.747)	lr 0.01805
Train [43][1360/3239]	Time 0.221 (0.517)	Data Time 0.001 (0.027)	Loss 3.0003 (2.8522)	Entropy 0.63931 (0.63927)	Top-1 acc 53.906 (55.326)	Top-5 acc 75.781 (77.753)	lr 0.01805
Train [43][1370/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.027)	Loss 2.9537 (2.8525)	Entropy 0.63924 (0.63927)	Top-1 acc 55.859 (55.323)	Top-5 acc 77.734 (77.749)	lr 0.01805
Train [43][1380/3239]	Time 0.329 (0.516)	Data Time 0.001 (0.026)	Loss 2.9232 (2.8526)	Entropy 0.63923 (0.63927)	Top-1 acc 54.688 (55.326)	Top-5 acc 75.391 (77.742)	lr 0.01805
Train [43][1390/3239]	Time 0.219 (0.515)	Data Time 0.001 (0.026)	Loss 3.0037 (2.8526)	Entropy 0.63925 (0.63927)	Top-1 acc 53.906 (55.322)	Top-5 acc 76.562 (77.739)	lr 0.01805
Train [43][1400/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.026)	Loss 2.9152 (2.8525)	Entropy 0.63942 (0.63927)	Top-1 acc 51.953 (55.317)	Top-5 acc 76.953 (77.746)	lr 0.01805
Train [43][1410/3239]	Time 0.226 (0.513)	Data Time 0.001 (0.026)	Loss 2.9182 (2.8525)	Entropy 0.63959 (0.63927)	Top-1 acc 53.516 (55.311)	Top-5 acc 78.125 (77.750)	lr 0.01805
Train [43][1420/3239]	Time 0.227 (0.513)	Data Time 0.001 (0.026)	Loss 3.0293 (2.8528)	Entropy 0.63915 (0.63927)	Top-1 acc 53.125 (55.314)	Top-5 acc 72.656 (77.741)	lr 0.01805
Train [43][1430/3239]	Time 0.238 (0.512)	Data Time 0.001 (0.025)	Loss 2.8238 (2.8527)	Entropy 0.63927 (0.63927)	Top-1 acc 54.688 (55.315)	Top-5 acc 78.516 (77.740)	lr 0.01805
Train [43][1440/3239]	Time 0.355 (0.533)	Data Time 0.004 (0.025)	Loss 2.8339 (2.8526)	Entropy 0.63942 (0.63927)	Top-1 acc 56.250 (55.318)	Top-5 acc 76.953 (77.740)	lr 0.01804
Train [43][1450/3239]	Time 0.341 (0.533)	Data Time 0.002 (0.025)	Loss 2.7363 (2.8525)	Entropy 0.63927 (0.63927)	Top-1 acc 55.078 (55.319)	Top-5 acc 81.250 (77.740)	lr 0.01804
Train [43][1460/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.025)	Loss 2.9018 (2.8525)	Entropy 0.63931 (0.63927)	Top-1 acc 52.734 (55.323)	Top-5 acc 76.562 (77.741)	lr 0.01804
Train [43][1470/3239]	Time 0.244 (0.531)	Data Time 0.001 (0.025)	Loss 2.9335 (2.8523)	Entropy 0.63904 (0.63927)	Top-1 acc 57.031 (55.330)	Top-5 acc 75.781 (77.744)	lr 0.01804
Train [43][1480/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.025)	Loss 2.9478 (2.8524)	Entropy 0.63909 (0.63927)	Top-1 acc 57.422 (55.324)	Top-5 acc 74.609 (77.742)	lr 0.01804
Train [43][1490/3239]	Time 0.236 (0.530)	Data Time 0.001 (0.025)	Loss 2.8087 (2.8528)	Entropy 0.63895 (0.63927)	Top-1 acc 55.859 (55.317)	Top-5 acc 81.641 (77.734)	lr 0.01804
Train [43][1500/3239]	Time 0.261 (0.529)	Data Time 0.001 (0.024)	Loss 2.9901 (2.8532)	Entropy 0.63838 (0.63927)	Top-1 acc 50.781 (55.307)	Top-5 acc 73.438 (77.726)	lr 0.01804
Train [43][1510/3239]	Time 0.229 (0.528)	Data Time 0.001 (0.024)	Loss 2.8317 (2.8529)	Entropy 0.63804 (0.63926)	Top-1 acc 57.422 (55.319)	Top-5 acc 80.469 (77.733)	lr 0.01804
Train [43][1520/3239]	Time 0.236 (0.528)	Data Time 0.001 (0.024)	Loss 2.8272 (2.8530)	Entropy 0.63768 (0.63925)	Top-1 acc 54.297 (55.316)	Top-5 acc 82.031 (77.733)	lr 0.01804
Train [43][1530/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.024)	Loss 3.1125 (2.8530)	Entropy 0.63786 (0.63924)	Top-1 acc 49.609 (55.313)	Top-5 acc 72.656 (77.732)	lr 0.01804
Train [43][1540/3239]	Time 0.336 (0.526)	Data Time 0.001 (0.024)	Loss 2.6445 (2.8532)	Entropy 0.63786 (0.63923)	Top-1 acc 64.453 (55.312)	Top-5 acc 83.203 (77.735)	lr 0.01804
Train [43][1550/3239]	Time 0.227 (0.525)	Data Time 0.001 (0.024)	Loss 2.8345 (2.8533)	Entropy 0.63794 (0.63923)	Top-1 acc 57.812 (55.309)	Top-5 acc 77.734 (77.739)	lr 0.01803
Train [43][1560/3239]	Time 0.298 (0.525)	Data Time 0.001 (0.024)	Loss 2.6478 (2.8532)	Entropy 0.63791 (0.63922)	Top-1 acc 62.109 (55.310)	Top-5 acc 80.469 (77.740)	lr 0.01803
Train [43][1570/3239]	Time 0.224 (0.524)	Data Time 0.001 (0.023)	Loss 3.0937 (2.8536)	Entropy 0.63766 (0.63921)	Top-1 acc 49.609 (55.307)	Top-5 acc 72.266 (77.733)	lr 0.01803
Train [43][1580/3239]	Time 0.240 (0.523)	Data Time 0.001 (0.023)	Loss 2.7062 (2.8536)	Entropy 0.63791 (0.63920)	Top-1 acc 60.156 (55.310)	Top-5 acc 78.516 (77.737)	lr 0.01803
Train [43][1590/3239]	Time 0.281 (0.523)	Data Time 0.001 (0.023)	Loss 2.8197 (2.8536)	Entropy 0.63798 (0.63919)	Top-1 acc 57.031 (55.313)	Top-5 acc 77.734 (77.733)	lr 0.01803
Train [43][1600/3239]	Time 0.235 (0.522)	Data Time 0.001 (0.023)	Loss 2.8896 (2.8537)	Entropy 0.63795 (0.63918)	Top-1 acc 55.859 (55.314)	Top-5 acc 79.297 (77.734)	lr 0.01803
Train [43][1610/3239]	Time 0.338 (0.521)	Data Time 0.001 (0.023)	Loss 2.8838 (2.8536)	Entropy 0.63779 (0.63918)	Top-1 acc 54.297 (55.315)	Top-5 acc 75.391 (77.735)	lr 0.01803
Train [43][1620/3239]	Time 0.268 (0.521)	Data Time 0.001 (0.023)	Loss 2.9016 (2.8540)	Entropy 0.63768 (0.63917)	Top-1 acc 54.297 (55.307)	Top-5 acc 76.562 (77.725)	lr 0.01803
Train [43][1630/3239]	Time 0.224 (0.520)	Data Time 0.001 (0.023)	Loss 2.9267 (2.8540)	Entropy 0.63784 (0.63916)	Top-1 acc 53.516 (55.304)	Top-5 acc 74.609 (77.717)	lr 0.01803
Train [43][1640/3239]	Time 0.241 (0.520)	Data Time 0.001 (0.022)	Loss 3.1221 (2.8547)	Entropy 0.63782 (0.63915)	Top-1 acc 49.219 (55.284)	Top-5 acc 74.609 (77.706)	lr 0.01803
Train [43][1650/3239]	Time 0.230 (0.519)	Data Time 0.001 (0.022)	Loss 2.8823 (2.8544)	Entropy 0.63780 (0.63914)	Top-1 acc 58.594 (55.295)	Top-5 acc 76.562 (77.706)	lr 0.01803
Train [43][1660/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.022)	Loss 2.6789 (2.8541)	Entropy 0.63796 (0.63913)	Top-1 acc 58.203 (55.299)	Top-5 acc 80.078 (77.711)	lr 0.01802
Train [43][1670/3239]	Time 0.229 (0.518)	Data Time 0.002 (0.022)	Loss 2.9454 (2.8543)	Entropy 0.63786 (0.63913)	Top-1 acc 53.906 (55.296)	Top-5 acc 75.781 (77.707)	lr 0.01802
Train [43][1680/3239]	Time 0.217 (0.517)	Data Time 0.001 (0.022)	Loss 2.7282 (2.8540)	Entropy 0.63789 (0.63912)	Top-1 acc 58.984 (55.303)	Top-5 acc 78.906 (77.713)	lr 0.01802
Train [43][1690/3239]	Time 0.252 (0.516)	Data Time 0.001 (0.022)	Loss 2.5698 (2.8539)	Entropy 0.63811 (0.63911)	Top-1 acc 62.891 (55.303)	Top-5 acc 83.594 (77.712)	lr 0.01802
Train [43][1700/3239]	Time 0.258 (0.516)	Data Time 0.001 (0.022)	Loss 2.9845 (2.8538)	Entropy 0.63803 (0.63911)	Top-1 acc 55.078 (55.312)	Top-5 acc 75.391 (77.710)	lr 0.01802
Train [43][1710/3239]	Time 0.237 (0.515)	Data Time 0.001 (0.022)	Loss 3.0080 (2.8539)	Entropy 0.63795 (0.63910)	Top-1 acc 50.781 (55.306)	Top-5 acc 76.172 (77.710)	lr 0.01802
Train [43][1720/3239]	Time 0.244 (0.514)	Data Time 0.001 (0.021)	Loss 2.6254 (2.8535)	Entropy 0.63824 (0.63909)	Top-1 acc 57.422 (55.318)	Top-5 acc 81.641 (77.719)	lr 0.01802
Train [43][1730/3239]	Time 0.238 (0.514)	Data Time 0.001 (0.021)	Loss 2.7749 (2.8536)	Entropy 0.63814 (0.63909)	Top-1 acc 59.375 (55.322)	Top-5 acc 79.688 (77.717)	lr 0.01802
Train [43][1740/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.021)	Loss 2.8914 (2.8532)	Entropy 0.63821 (0.63908)	Top-1 acc 51.953 (55.334)	Top-5 acc 78.516 (77.727)	lr 0.01802
Train [43][1750/3239]	Time 0.233 (0.513)	Data Time 0.001 (0.021)	Loss 2.7507 (2.8531)	Entropy 0.63784 (0.63908)	Top-1 acc 57.422 (55.334)	Top-5 acc 80.078 (77.723)	lr 0.01802
Train [43][1760/3239]	Time 0.226 (0.512)	Data Time 0.001 (0.021)	Loss 2.9612 (2.8531)	Entropy 0.63776 (0.63907)	Top-1 acc 50.781 (55.329)	Top-5 acc 76.953 (77.727)	lr 0.01802
Train [43][1770/3239]	Time 0.348 (0.512)	Data Time 0.001 (0.021)	Loss 2.7566 (2.8529)	Entropy 0.63775 (0.63906)	Top-1 acc 55.078 (55.338)	Top-5 acc 78.125 (77.729)	lr 0.01802
Train [43][1780/3239]	Time 0.229 (0.511)	Data Time 0.001 (0.021)	Loss 2.7973 (2.8529)	Entropy 0.63821 (0.63905)	Top-1 acc 58.203 (55.341)	Top-5 acc 78.516 (77.728)	lr 0.01801
Train [43][1790/3239]	Time 0.229 (0.510)	Data Time 0.001 (0.021)	Loss 2.8638 (2.8529)	Entropy 0.63821 (0.63905)	Top-1 acc 56.250 (55.347)	Top-5 acc 77.344 (77.728)	lr 0.01801
Train [43][1800/3239]	Time 0.233 (0.510)	Data Time 0.001 (0.021)	Loss 2.9540 (2.8533)	Entropy 0.63815 (0.63905)	Top-1 acc 51.953 (55.342)	Top-5 acc 74.219 (77.718)	lr 0.01801
Train [43][1810/3239]	Time 0.222 (0.509)	Data Time 0.001 (0.020)	Loss 2.7843 (2.8535)	Entropy 0.63815 (0.63904)	Top-1 acc 56.250 (55.340)	Top-5 acc 75.391 (77.715)	lr 0.01801
Train [43][1820/3239]	Time 0.229 (0.509)	Data Time 0.001 (0.020)	Loss 2.8561 (2.8535)	Entropy 0.63822 (0.63904)	Top-1 acc 55.859 (55.339)	Top-5 acc 78.516 (77.716)	lr 0.01801
Train [43][1830/3239]	Time 0.243 (0.508)	Data Time 0.001 (0.020)	Loss 2.7793 (2.8532)	Entropy 0.63835 (0.63903)	Top-1 acc 57.812 (55.350)	Top-5 acc 79.688 (77.722)	lr 0.01801
Train [43][1840/3239]	Time 0.346 (0.508)	Data Time 0.001 (0.020)	Loss 3.1438 (2.8535)	Entropy 0.63840 (0.63903)	Top-1 acc 49.609 (55.343)	Top-5 acc 71.875 (77.721)	lr 0.01801
Train [43][1850/3239]	Time 0.227 (0.507)	Data Time 0.001 (0.020)	Loss 2.8001 (2.8538)	Entropy 0.63872 (0.63902)	Top-1 acc 56.250 (55.335)	Top-5 acc 78.125 (77.717)	lr 0.01801
Train [43][1860/3239]	Time 0.227 (0.507)	Data Time 0.001 (0.020)	Loss 2.8711 (2.8538)	Entropy 0.63885 (0.63902)	Top-1 acc 56.250 (55.331)	Top-5 acc 76.953 (77.717)	lr 0.01801
Train [43][1870/3239]	Time 0.226 (0.506)	Data Time 0.001 (0.020)	Loss 2.8831 (2.8535)	Entropy 0.63915 (0.63902)	Top-1 acc 55.078 (55.331)	Top-5 acc 79.297 (77.725)	lr 0.01801
Train [43][1880/3239]	Time 0.236 (0.506)	Data Time 0.001 (0.020)	Loss 2.7640 (2.8536)	Entropy 0.63933 (0.63902)	Top-1 acc 56.250 (55.329)	Top-5 acc 80.469 (77.718)	lr 0.01801
Train [43][1890/3239]	Time 0.230 (0.505)	Data Time 0.001 (0.020)	Loss 2.8627 (2.8535)	Entropy 0.63949 (0.63903)	Top-1 acc 55.078 (55.331)	Top-5 acc 79.297 (77.719)	lr 0.01800
Train [43][1900/3239]	Time 0.238 (0.505)	Data Time 0.001 (0.020)	Loss 2.8980 (2.8536)	Entropy 0.63952 (0.63903)	Top-1 acc 52.734 (55.326)	Top-5 acc 77.344 (77.714)	lr 0.01800
Train [43][1910/3239]	Time 0.231 (0.504)	Data Time 0.001 (0.019)	Loss 3.1265 (2.8537)	Entropy 0.63936 (0.63903)	Top-1 acc 48.438 (55.324)	Top-5 acc 72.266 (77.713)	lr 0.01800
Train [43][1920/3239]	Time 0.230 (0.504)	Data Time 0.001 (0.019)	Loss 2.5737 (2.8534)	Entropy 0.63954 (0.63903)	Top-1 acc 63.672 (55.328)	Top-5 acc 82.422 (77.712)	lr 0.01800
Train [43][1930/3239]	Time 0.317 (0.503)	Data Time 0.001 (0.019)	Loss 2.7448 (2.8533)	Entropy 0.63967 (0.63903)	Top-1 acc 58.984 (55.327)	Top-5 acc 79.688 (77.710)	lr 0.01800
Train [43][1940/3239]	Time 0.237 (0.503)	Data Time 0.001 (0.019)	Loss 2.9765 (2.8531)	Entropy 0.63977 (0.63904)	Top-1 acc 52.344 (55.331)	Top-5 acc 73.828 (77.714)	lr 0.01800
Train [43][1950/3239]	Time 0.227 (0.502)	Data Time 0.001 (0.019)	Loss 3.0629 (2.8534)	Entropy 0.64002 (0.63904)	Top-1 acc 50.781 (55.325)	Top-5 acc 75.781 (77.704)	lr 0.01800
Train [43][1960/3239]	Time 0.227 (0.502)	Data Time 0.001 (0.019)	Loss 3.0059 (2.8533)	Entropy 0.64016 (0.63905)	Top-1 acc 52.344 (55.329)	Top-5 acc 75.391 (77.709)	lr 0.01800
Train [43][1970/3239]	Time 0.231 (0.501)	Data Time 0.001 (0.019)	Loss 3.0251 (2.8534)	Entropy 0.64013 (0.63905)	Top-1 acc 51.953 (55.329)	Top-5 acc 74.219 (77.708)	lr 0.01800
Train [43][1980/3239]	Time 0.229 (0.501)	Data Time 0.001 (0.019)	Loss 2.9405 (2.8534)	Entropy 0.63993 (0.63906)	Top-1 acc 51.172 (55.332)	Top-5 acc 75.781 (77.708)	lr 0.01800
Train [43][1990/3239]	Time 0.232 (0.500)	Data Time 0.001 (0.019)	Loss 2.7062 (2.8532)	Entropy 0.64012 (0.63906)	Top-1 acc 60.938 (55.334)	Top-5 acc 79.688 (77.708)	lr 0.01800
Train [43][2000/3239]	Time 0.314 (0.500)	Data Time 0.001 (0.019)	Loss 2.8843 (2.8531)	Entropy 0.64030 (0.63907)	Top-1 acc 53.906 (55.340)	Top-5 acc 80.469 (77.712)	lr 0.01799
Train [43][2010/3239]	Time 0.229 (0.499)	Data Time 0.001 (0.019)	Loss 2.9546 (2.8532)	Entropy 0.64045 (0.63907)	Top-1 acc 51.562 (55.338)	Top-5 acc 78.125 (77.710)	lr 0.01799
Train [43][2020/3239]	Time 0.236 (0.499)	Data Time 0.001 (0.019)	Loss 2.9415 (2.8532)	Entropy 0.64066 (0.63908)	Top-1 acc 57.031 (55.339)	Top-5 acc 73.438 (77.708)	lr 0.01799
Train [43][2030/3239]	Time 0.235 (0.498)	Data Time 0.001 (0.018)	Loss 2.8349 (2.8534)	Entropy 0.64053 (0.63909)	Top-1 acc 54.297 (55.334)	Top-5 acc 81.250 (77.706)	lr 0.01799
Train [43][2040/3239]	Time 0.228 (0.498)	Data Time 0.001 (0.018)	Loss 2.9962 (2.8536)	Entropy 0.64050 (0.63910)	Top-1 acc 52.344 (55.324)	Top-5 acc 76.172 (77.704)	lr 0.01799
Train [43][2050/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.018)	Loss 3.0975 (2.8539)	Entropy 0.64045 (0.63910)	Top-1 acc 50.391 (55.315)	Top-5 acc 72.266 (77.700)	lr 0.01799
Train [43][2060/3239]	Time 0.234 (0.497)	Data Time 0.001 (0.018)	Loss 2.7246 (2.8537)	Entropy 0.64037 (0.63911)	Top-1 acc 55.859 (55.315)	Top-5 acc 81.250 (77.704)	lr 0.01799
Train [43][2070/3239]	Time 0.273 (0.497)	Data Time 0.001 (0.018)	Loss 2.8565 (2.8538)	Entropy 0.64032 (0.63911)	Top-1 acc 53.906 (55.310)	Top-5 acc 79.688 (77.700)	lr 0.01799
Train [43][2080/3239]	Time 0.221 (0.496)	Data Time 0.001 (0.018)	Loss 2.8348 (2.8539)	Entropy 0.64013 (0.63912)	Top-1 acc 55.469 (55.314)	Top-5 acc 79.688 (77.699)	lr 0.01799
Train [43][2090/3239]	Time 0.321 (0.496)	Data Time 0.001 (0.018)	Loss 2.9772 (2.8536)	Entropy 0.63997 (0.63912)	Top-1 acc 54.297 (55.318)	Top-5 acc 75.000 (77.704)	lr 0.01799
Train [43][2100/3239]	Time 0.318 (0.510)	Data Time 0.006 (0.018)	Loss 2.8055 (2.8534)	Entropy 0.63981 (0.63913)	Top-1 acc 58.984 (55.324)	Top-5 acc 77.344 (77.706)	lr 0.01799
Train [43][2110/3239]	Time 0.237 (0.509)	Data Time 0.002 (0.018)	Loss 2.9756 (2.8537)	Entropy 0.63976 (0.63913)	Top-1 acc 53.906 (55.316)	Top-5 acc 75.781 (77.699)	lr 0.01798
Train [43][2120/3239]	Time 0.234 (0.509)	Data Time 0.001 (0.018)	Loss 2.9143 (2.8536)	Entropy 0.63980 (0.63913)	Top-1 acc 52.734 (55.318)	Top-5 acc 73.047 (77.696)	lr 0.01798
Train [43][2130/3239]	Time 0.227 (0.508)	Data Time 0.001 (0.018)	Loss 2.8047 (2.8534)	Entropy 0.63964 (0.63914)	Top-1 acc 53.906 (55.327)	Top-5 acc 80.469 (77.701)	lr 0.01798
Train [43][2140/3239]	Time 0.245 (0.508)	Data Time 0.001 (0.018)	Loss 2.6959 (2.8533)	Entropy 0.63976 (0.63914)	Top-1 acc 62.500 (55.337)	Top-5 acc 82.031 (77.704)	lr 0.01798
Train [43][2150/3239]	Time 0.233 (0.508)	Data Time 0.001 (0.018)	Loss 2.9617 (2.8530)	Entropy 0.63977 (0.63914)	Top-1 acc 51.953 (55.340)	Top-5 acc 75.781 (77.709)	lr 0.01798
Train [43][2160/3239]	Time 0.344 (0.507)	Data Time 0.002 (0.017)	Loss 2.8761 (2.8531)	Entropy 0.63996 (0.63914)	Top-1 acc 53.516 (55.338)	Top-5 acc 77.344 (77.707)	lr 0.01798
Train [43][2170/3239]	Time 0.251 (0.507)	Data Time 0.001 (0.017)	Loss 2.5972 (2.8530)	Entropy 0.64015 (0.63915)	Top-1 acc 59.375 (55.339)	Top-5 acc 80.469 (77.708)	lr 0.01798
Train [43][2180/3239]	Time 0.233 (0.507)	Data Time 0.001 (0.017)	Loss 3.1023 (2.8534)	Entropy 0.64039 (0.63915)	Top-1 acc 51.172 (55.332)	Top-5 acc 71.484 (77.703)	lr 0.01798
Train [43][2190/3239]	Time 0.237 (0.506)	Data Time 0.001 (0.017)	Loss 2.6467 (2.8536)	Entropy 0.64029 (0.63916)	Top-1 acc 59.375 (55.327)	Top-5 acc 80.859 (77.701)	lr 0.01798
Train [43][2200/3239]	Time 0.229 (0.506)	Data Time 0.001 (0.017)	Loss 2.8418 (2.8535)	Entropy 0.64065 (0.63916)	Top-1 acc 55.469 (55.327)	Top-5 acc 78.906 (77.704)	lr 0.01798
Train [43][2210/3239]	Time 0.236 (0.505)	Data Time 0.001 (0.017)	Loss 2.9519 (2.8536)	Entropy 0.64039 (0.63917)	Top-1 acc 55.078 (55.322)	Top-5 acc 73.438 (77.701)	lr 0.01798
Train [43][2220/3239]	Time 0.229 (0.505)	Data Time 0.001 (0.017)	Loss 3.0142 (2.8538)	Entropy 0.64007 (0.63918)	Top-1 acc 52.344 (55.318)	Top-5 acc 75.781 (77.697)	lr 0.01797
Train [43][2230/3239]	Time 0.235 (0.505)	Data Time 0.001 (0.017)	Loss 2.8243 (2.8540)	Entropy 0.64062 (0.63918)	Top-1 acc 55.078 (55.312)	Top-5 acc 79.688 (77.696)	lr 0.01797
Train [43][2240/3239]	Time 0.224 (0.504)	Data Time 0.001 (0.017)	Loss 2.8552 (2.8541)	Entropy 0.64055 (0.63919)	Top-1 acc 53.125 (55.306)	Top-5 acc 79.297 (77.694)	lr 0.01797
Train [43][2250/3239]	Time 0.329 (0.504)	Data Time 0.001 (0.017)	Loss 2.8586 (2.8541)	Entropy 0.64069 (0.63919)	Top-1 acc 56.250 (55.303)	Top-5 acc 76.562 (77.694)	lr 0.01797
Train [43][2260/3239]	Time 0.239 (0.503)	Data Time 0.001 (0.017)	Loss 2.7118 (2.8540)	Entropy 0.64050 (0.63920)	Top-1 acc 57.422 (55.309)	Top-5 acc 78.906 (77.698)	lr 0.01797
Train [43][2270/3239]	Time 0.270 (0.503)	Data Time 0.001 (0.017)	Loss 2.8958 (2.8541)	Entropy 0.64052 (0.63921)	Top-1 acc 55.078 (55.306)	Top-5 acc 76.562 (77.694)	lr 0.01797
Train [43][2280/3239]	Time 0.228 (0.503)	Data Time 0.001 (0.017)	Loss 2.7874 (2.8542)	Entropy 0.64044 (0.63921)	Top-1 acc 57.031 (55.304)	Top-5 acc 78.125 (77.697)	lr 0.01797
Train [43][2290/3239]	Time 0.239 (0.502)	Data Time 0.001 (0.017)	Loss 2.8642 (2.8543)	Entropy 0.64052 (0.63922)	Top-1 acc 57.422 (55.304)	Top-5 acc 75.000 (77.698)	lr 0.01797
Train [43][2300/3239]	Time 0.227 (0.502)	Data Time 0.001 (0.016)	Loss 3.0783 (2.8547)	Entropy 0.64071 (0.63922)	Top-1 acc 48.438 (55.291)	Top-5 acc 71.875 (77.693)	lr 0.01797
Train [43][2310/3239]	Time 0.230 (0.502)	Data Time 0.001 (0.016)	Loss 2.8504 (2.8549)	Entropy 0.64051 (0.63923)	Top-1 acc 53.125 (55.279)	Top-5 acc 76.172 (77.684)	lr 0.01797
Train [43][2320/3239]	Time 0.323 (0.501)	Data Time 0.001 (0.016)	Loss 2.8008 (2.8549)	Entropy 0.64066 (0.63923)	Top-1 acc 56.250 (55.280)	Top-5 acc 78.516 (77.686)	lr 0.01797
Train [43][2330/3239]	Time 0.246 (0.501)	Data Time 0.001 (0.016)	Loss 2.6550 (2.8549)	Entropy 0.64023 (0.63924)	Top-1 acc 58.984 (55.280)	Top-5 acc 80.859 (77.686)	lr 0.01796
Train [43][2340/3239]	Time 0.265 (0.500)	Data Time 0.001 (0.016)	Loss 3.0062 (2.8550)	Entropy 0.64034 (0.63924)	Top-1 acc 53.516 (55.278)	Top-5 acc 76.562 (77.684)	lr 0.01796
Train [43][2350/3239]	Time 0.221 (0.500)	Data Time 0.001 (0.016)	Loss 2.8182 (2.8548)	Entropy 0.64054 (0.63925)	Top-1 acc 59.375 (55.282)	Top-5 acc 78.125 (77.687)	lr 0.01796
Train [43][2360/3239]	Time 0.234 (0.500)	Data Time 0.001 (0.016)	Loss 2.8591 (2.8549)	Entropy 0.64072 (0.63925)	Top-1 acc 57.422 (55.278)	Top-5 acc 76.953 (77.684)	lr 0.01796
Train [43][2370/3239]	Time 0.270 (0.499)	Data Time 0.001 (0.016)	Loss 2.8319 (2.8551)	Entropy 0.64076 (0.63926)	Top-1 acc 58.203 (55.276)	Top-5 acc 76.562 (77.677)	lr 0.01796
Train [43][2380/3239]	Time 0.221 (0.499)	Data Time 0.001 (0.016)	Loss 2.9746 (2.8553)	Entropy 0.64062 (0.63927)	Top-1 acc 54.297 (55.275)	Top-5 acc 76.953 (77.678)	lr 0.01796
Train [43][2390/3239]	Time 0.238 (0.499)	Data Time 0.001 (0.016)	Loss 2.8292 (2.8553)	Entropy 0.64063 (0.63927)	Top-1 acc 55.469 (55.275)	Top-5 acc 79.688 (77.680)	lr 0.01796
Train [43][2400/3239]	Time 0.229 (0.498)	Data Time 0.001 (0.016)	Loss 2.9737 (2.8552)	Entropy 0.64106 (0.63928)	Top-1 acc 51.953 (55.273)	Top-5 acc 73.438 (77.683)	lr 0.01796
Train [43][2410/3239]	Time 0.237 (0.498)	Data Time 0.001 (0.016)	Loss 2.8020 (2.8552)	Entropy 0.64098 (0.63929)	Top-1 acc 55.078 (55.270)	Top-5 acc 76.562 (77.683)	lr 0.01796
Train [43][2420/3239]	Time 0.233 (0.498)	Data Time 0.001 (0.016)	Loss 2.9163 (2.8551)	Entropy 0.64030 (0.63929)	Top-1 acc 52.344 (55.270)	Top-5 acc 77.344 (77.682)	lr 0.01796
Train [43][2430/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.016)	Loss 2.9013 (2.8553)	Entropy 0.64027 (0.63930)	Top-1 acc 53.125 (55.269)	Top-5 acc 80.859 (77.680)	lr 0.01796
Train [43][2440/3239]	Time 0.230 (0.497)	Data Time 0.001 (0.016)	Loss 2.7238 (2.8553)	Entropy 0.64021 (0.63930)	Top-1 acc 57.812 (55.270)	Top-5 acc 80.469 (77.677)	lr 0.01795
Train [43][2450/3239]	Time 0.233 (0.497)	Data Time 0.001 (0.016)	Loss 2.7908 (2.8552)	Entropy 0.64025 (0.63930)	Top-1 acc 53.516 (55.272)	Top-5 acc 80.078 (77.681)	lr 0.01795
Train [43][2460/3239]	Time 0.227 (0.496)	Data Time 0.001 (0.015)	Loss 2.8068 (2.8553)	Entropy 0.64014 (0.63931)	Top-1 acc 59.375 (55.268)	Top-5 acc 77.344 (77.677)	lr 0.01795
Train [43][2470/3239]	Time 0.229 (0.496)	Data Time 0.001 (0.015)	Loss 2.8593 (2.8554)	Entropy 0.64021 (0.63931)	Top-1 acc 56.641 (55.267)	Top-5 acc 77.344 (77.676)	lr 0.01795
Train [43][2480/3239]	Time 0.318 (0.496)	Data Time 0.001 (0.015)	Loss 3.0885 (2.8552)	Entropy 0.64013 (0.63932)	Top-1 acc 51.172 (55.270)	Top-5 acc 74.609 (77.681)	lr 0.01795
Train [43][2490/3239]	Time 0.247 (0.495)	Data Time 0.001 (0.015)	Loss 3.0016 (2.8553)	Entropy 0.64039 (0.63932)	Top-1 acc 49.609 (55.273)	Top-5 acc 74.609 (77.679)	lr 0.01795
Train [43][2500/3239]	Time 0.244 (0.495)	Data Time 0.001 (0.015)	Loss 2.9759 (2.8551)	Entropy 0.64009 (0.63932)	Top-1 acc 52.344 (55.280)	Top-5 acc 74.609 (77.680)	lr 0.01795
Train [43][2510/3239]	Time 0.229 (0.495)	Data Time 0.001 (0.015)	Loss 2.8529 (2.8549)	Entropy 0.64044 (0.63933)	Top-1 acc 56.250 (55.287)	Top-5 acc 79.688 (77.684)	lr 0.01795
Train [43][2520/3239]	Time 0.249 (0.494)	Data Time 0.001 (0.015)	Loss 2.6321 (2.8549)	Entropy 0.64070 (0.63933)	Top-1 acc 59.766 (55.286)	Top-5 acc 80.469 (77.684)	lr 0.01795
Train [43][2530/3239]	Time 0.227 (0.494)	Data Time 0.002 (0.015)	Loss 2.7753 (2.8548)	Entropy 0.64062 (0.63934)	Top-1 acc 56.641 (55.285)	Top-5 acc 77.734 (77.684)	lr 0.01795
Train [43][2540/3239]	Time 0.234 (0.494)	Data Time 0.001 (0.015)	Loss 2.5138 (2.8545)	Entropy 0.64035 (0.63934)	Top-1 acc 62.500 (55.295)	Top-5 acc 83.984 (77.692)	lr 0.01795
Train [43][2550/3239]	Time 0.323 (0.493)	Data Time 0.001 (0.015)	Loss 3.1858 (2.8546)	Entropy 0.64004 (0.63934)	Top-1 acc 46.875 (55.294)	Top-5 acc 73.047 (77.691)	lr 0.01794
Train [43][2560/3239]	Time 0.233 (0.493)	Data Time 0.001 (0.015)	Loss 2.5322 (2.8544)	Entropy 0.63999 (0.63935)	Top-1 acc 59.766 (55.297)	Top-5 acc 85.547 (77.695)	lr 0.01794
Train [43][2570/3239]	Time 0.242 (0.493)	Data Time 0.001 (0.015)	Loss 2.8881 (2.8546)	Entropy 0.63984 (0.63935)	Top-1 acc 51.562 (55.288)	Top-5 acc 80.469 (77.691)	lr 0.01794
Train [43][2580/3239]	Time 0.226 (0.492)	Data Time 0.001 (0.015)	Loss 3.1666 (2.8547)	Entropy 0.64000 (0.63935)	Top-1 acc 50.000 (55.290)	Top-5 acc 71.875 (77.692)	lr 0.01794
Train [43][2590/3239]	Time 0.224 (0.492)	Data Time 0.001 (0.015)	Loss 2.7511 (2.8548)	Entropy 0.63988 (0.63935)	Top-1 acc 55.859 (55.284)	Top-5 acc 80.859 (77.690)	lr 0.01794
Train [43][2600/3239]	Time 0.235 (0.492)	Data Time 0.002 (0.015)	Loss 2.7789 (2.8547)	Entropy 0.64023 (0.63936)	Top-1 acc 59.766 (55.287)	Top-5 acc 76.953 (77.693)	lr 0.01794
Train [43][2610/3239]	Time 0.237 (0.491)	Data Time 0.001 (0.015)	Loss 2.8100 (2.8548)	Entropy 0.64010 (0.63936)	Top-1 acc 57.422 (55.288)	Top-5 acc 79.297 (77.691)	lr 0.01794
Train [43][2620/3239]	Time 0.227 (0.491)	Data Time 0.001 (0.015)	Loss 2.8660 (2.8548)	Entropy 0.63999 (0.63936)	Top-1 acc 56.250 (55.282)	Top-5 acc 74.609 (77.687)	lr 0.01794
Train [43][2630/3239]	Time 0.239 (0.491)	Data Time 0.001 (0.015)	Loss 2.8850 (2.8545)	Entropy 0.63992 (0.63936)	Top-1 acc 55.469 (55.285)	Top-5 acc 78.125 (77.694)	lr 0.01794
Train [43][2640/3239]	Time 0.320 (0.491)	Data Time 0.001 (0.015)	Loss 2.9077 (2.8545)	Entropy 0.63988 (0.63937)	Top-1 acc 50.000 (55.284)	Top-5 acc 79.297 (77.693)	lr 0.01794
Train [43][2650/3239]	Time 0.239 (0.490)	Data Time 0.001 (0.014)	Loss 2.9282 (2.8544)	Entropy 0.63953 (0.63937)	Top-1 acc 55.078 (55.292)	Top-5 acc 75.391 (77.693)	lr 0.01794
Train [43][2660/3239]	Time 0.227 (0.490)	Data Time 0.001 (0.014)	Loss 2.9529 (2.8543)	Entropy 0.63939 (0.63937)	Top-1 acc 49.219 (55.290)	Top-5 acc 76.562 (77.697)	lr 0.01793
Train [43][2670/3239]	Time 0.229 (0.490)	Data Time 0.001 (0.014)	Loss 3.0878 (2.8545)	Entropy 0.63946 (0.63937)	Top-1 acc 46.484 (55.289)	Top-5 acc 71.875 (77.692)	lr 0.01793
Train [43][2680/3239]	Time 0.229 (0.489)	Data Time 0.001 (0.014)	Loss 2.7085 (2.8545)	Entropy 0.63927 (0.63937)	Top-1 acc 59.375 (55.295)	Top-5 acc 79.688 (77.691)	lr 0.01793
Train [43][2690/3239]	Time 0.230 (0.489)	Data Time 0.001 (0.014)	Loss 2.8117 (2.8547)	Entropy 0.63956 (0.63937)	Top-1 acc 57.422 (55.294)	Top-5 acc 78.906 (77.689)	lr 0.01793
Train [43][2700/3239]	Time 0.223 (0.489)	Data Time 0.001 (0.014)	Loss 3.0635 (2.8546)	Entropy 0.63975 (0.63937)	Top-1 acc 53.516 (55.293)	Top-5 acc 73.438 (77.688)	lr 0.01793
Train [43][2710/3239]	Time 0.327 (0.489)	Data Time 0.001 (0.014)	Loss 2.7552 (2.8545)	Entropy 0.63928 (0.63937)	Top-1 acc 60.156 (55.294)	Top-5 acc 79.688 (77.687)	lr 0.01793
Train [43][2720/3239]	Time 0.239 (0.488)	Data Time 0.001 (0.014)	Loss 2.9239 (2.8545)	Entropy 0.63926 (0.63937)	Top-1 acc 51.562 (55.297)	Top-5 acc 76.172 (77.690)	lr 0.01793
Train [43][2730/3239]	Time 0.232 (0.488)	Data Time 0.001 (0.014)	Loss 3.0144 (2.8545)	Entropy 0.63944 (0.63937)	Top-1 acc 51.562 (55.294)	Top-5 acc 75.781 (77.690)	lr 0.01793
Train [43][2740/3239]	Time 0.229 (0.488)	Data Time 0.001 (0.014)	Loss 2.7260 (2.8545)	Entropy 0.63965 (0.63937)	Top-1 acc 61.719 (55.294)	Top-5 acc 79.297 (77.690)	lr 0.01793
Train [43][2750/3239]	Time 0.356 (0.498)	Data Time 0.005 (0.014)	Loss 2.8524 (2.8543)	Entropy 0.63930 (0.63937)	Top-1 acc 55.078 (55.301)	Top-5 acc 76.953 (77.694)	lr 0.01793
Train [43][2760/3239]	Time 0.239 (0.498)	Data Time 0.002 (0.014)	Loss 2.7024 (2.8542)	Entropy 0.63919 (0.63937)	Top-1 acc 55.469 (55.302)	Top-5 acc 79.297 (77.697)	lr 0.01793
Train [43][2770/3239]	Time 0.237 (0.498)	Data Time 0.001 (0.014)	Loss 2.7652 (2.8541)	Entropy 0.63901 (0.63937)	Top-1 acc 60.547 (55.306)	Top-5 acc 79.688 (77.700)	lr 0.01792
Train [43][2780/3239]	Time 0.242 (0.497)	Data Time 0.001 (0.014)	Loss 2.8045 (2.8541)	Entropy 0.63905 (0.63937)	Top-1 acc 59.375 (55.304)	Top-5 acc 78.906 (77.699)	lr 0.01792
Train [43][2790/3239]	Time 0.240 (0.497)	Data Time 0.001 (0.014)	Loss 2.7386 (2.8541)	Entropy 0.63891 (0.63937)	Top-1 acc 56.641 (55.304)	Top-5 acc 80.469 (77.698)	lr 0.01792
Train [43][2800/3239]	Time 0.324 (0.497)	Data Time 0.001 (0.014)	Loss 2.8600 (2.8541)	Entropy 0.63898 (0.63937)	Top-1 acc 57.031 (55.304)	Top-5 acc 75.781 (77.695)	lr 0.01792
Train [43][2810/3239]	Time 0.225 (0.497)	Data Time 0.001 (0.014)	Loss 3.0782 (2.8541)	Entropy 0.63902 (0.63936)	Top-1 acc 52.344 (55.306)	Top-5 acc 76.172 (77.702)	lr 0.01792
Train [43][2820/3239]	Time 0.240 (0.496)	Data Time 0.001 (0.014)	Loss 2.8336 (2.8541)	Entropy 0.63932 (0.63936)	Top-1 acc 52.734 (55.303)	Top-5 acc 75.391 (77.698)	lr 0.01792
Train [43][2830/3239]	Time 0.239 (0.496)	Data Time 0.001 (0.014)	Loss 2.8483 (2.8542)	Entropy 0.63961 (0.63936)	Top-1 acc 54.688 (55.305)	Top-5 acc 74.609 (77.698)	lr 0.01792
Train [43][2840/3239]	Time 0.242 (0.496)	Data Time 0.001 (0.014)	Loss 2.5961 (2.8540)	Entropy 0.63967 (0.63936)	Top-1 acc 60.547 (55.305)	Top-5 acc 83.594 (77.704)	lr 0.01792
Train [43][2850/3239]	Time 0.242 (0.496)	Data Time 0.001 (0.014)	Loss 2.6244 (2.8540)	Entropy 0.63983 (0.63937)	Top-1 acc 60.547 (55.307)	Top-5 acc 83.594 (77.706)	lr 0.01792
Train [43][2860/3239]	Time 0.235 (0.495)	Data Time 0.001 (0.014)	Loss 2.8787 (2.8540)	Entropy 0.63971 (0.63937)	Top-1 acc 54.297 (55.305)	Top-5 acc 76.172 (77.706)	lr 0.01792
Train [43][2870/3239]	Time 0.324 (0.495)	Data Time 0.001 (0.014)	Loss 2.5410 (2.8537)	Entropy 0.63981 (0.63937)	Top-1 acc 60.938 (55.315)	Top-5 acc 84.375 (77.711)	lr 0.01792
Train [43][2880/3239]	Time 0.235 (0.495)	Data Time 0.001 (0.013)	Loss 2.7661 (2.8535)	Entropy 0.64012 (0.63937)	Top-1 acc 57.422 (55.319)	Top-5 acc 80.469 (77.714)	lr 0.01791
Train [43][2890/3239]	Time 0.234 (0.494)	Data Time 0.001 (0.013)	Loss 3.1303 (2.8537)	Entropy 0.64001 (0.63937)	Top-1 acc 48.047 (55.310)	Top-5 acc 71.094 (77.715)	lr 0.01791
Train [43][2900/3239]	Time 0.235 (0.494)	Data Time 0.001 (0.013)	Loss 3.1536 (2.8538)	Entropy 0.63989 (0.63937)	Top-1 acc 46.875 (55.309)	Top-5 acc 72.266 (77.714)	lr 0.01791
Train [43][2910/3239]	Time 0.245 (0.494)	Data Time 0.001 (0.013)	Loss 2.7669 (2.8538)	Entropy 0.63972 (0.63938)	Top-1 acc 56.250 (55.310)	Top-5 acc 81.641 (77.713)	lr 0.01791
Train [43][2920/3239]	Time 0.235 (0.494)	Data Time 0.001 (0.013)	Loss 2.6832 (2.8537)	Entropy 0.63983 (0.63938)	Top-1 acc 61.328 (55.315)	Top-5 acc 80.859 (77.717)	lr 0.01791
Train [43][2930/3239]	Time 0.234 (0.493)	Data Time 0.001 (0.013)	Loss 3.0459 (2.8537)	Entropy 0.63980 (0.63938)	Top-1 acc 51.172 (55.317)	Top-5 acc 71.875 (77.714)	lr 0.01791
Train [43][2940/3239]	Time 0.232 (0.493)	Data Time 0.001 (0.013)	Loss 2.8939 (2.8538)	Entropy 0.63982 (0.63938)	Top-1 acc 53.125 (55.319)	Top-5 acc 75.000 (77.715)	lr 0.01791
Train [43][2950/3239]	Time 0.219 (0.493)	Data Time 0.001 (0.013)	Loss 2.8454 (2.8538)	Entropy 0.63982 (0.63938)	Top-1 acc 55.469 (55.317)	Top-5 acc 78.906 (77.715)	lr 0.01791
Train [43][2960/3239]	Time 0.277 (0.493)	Data Time 0.001 (0.013)	Loss 2.8215 (2.8537)	Entropy 0.63991 (0.63938)	Top-1 acc 56.641 (55.317)	Top-5 acc 78.125 (77.716)	lr 0.01791
Train [43][2970/3239]	Time 0.268 (0.493)	Data Time 0.001 (0.013)	Loss 2.8050 (2.8537)	Entropy 0.63994 (0.63939)	Top-1 acc 60.938 (55.316)	Top-5 acc 76.953 (77.714)	lr 0.01791
Train [43][2980/3239]	Time 0.236 (0.492)	Data Time 0.001 (0.013)	Loss 2.7829 (2.8539)	Entropy 0.64008 (0.63939)	Top-1 acc 59.375 (55.312)	Top-5 acc 78.125 (77.712)	lr 0.01791
Train [43][2990/3239]	Time 0.254 (0.492)	Data Time 0.001 (0.013)	Loss 2.8600 (2.8538)	Entropy 0.64023 (0.63939)	Top-1 acc 57.812 (55.316)	Top-5 acc 77.344 (77.713)	lr 0.01790
Train [43][3000/3239]	Time 0.229 (0.492)	Data Time 0.001 (0.013)	Loss 2.9247 (2.8538)	Entropy 0.64040 (0.63939)	Top-1 acc 54.297 (55.312)	Top-5 acc 74.609 (77.713)	lr 0.01790
Train [43][3010/3239]	Time 0.236 (0.492)	Data Time 0.001 (0.013)	Loss 2.7803 (2.8538)	Entropy 0.64015 (0.63940)	Top-1 acc 58.594 (55.309)	Top-5 acc 76.562 (77.712)	lr 0.01790
Train [43][3020/3239]	Time 0.220 (0.491)	Data Time 0.001 (0.013)	Loss 3.0289 (2.8537)	Entropy 0.64011 (0.63940)	Top-1 acc 49.609 (55.308)	Top-5 acc 75.781 (77.713)	lr 0.01790
Train [43][3030/3239]	Time 0.322 (0.491)	Data Time 0.001 (0.013)	Loss 2.8828 (2.8535)	Entropy 0.64005 (0.63940)	Top-1 acc 51.953 (55.311)	Top-5 acc 78.906 (77.715)	lr 0.01790
Train [43][3040/3239]	Time 0.233 (0.491)	Data Time 0.001 (0.013)	Loss 2.7302 (2.8535)	Entropy 0.64007 (0.63940)	Top-1 acc 58.984 (55.312)	Top-5 acc 80.078 (77.715)	lr 0.01790
Train [43][3050/3239]	Time 0.236 (0.491)	Data Time 0.001 (0.013)	Loss 2.8940 (2.8536)	Entropy 0.64003 (0.63940)	Top-1 acc 56.641 (55.312)	Top-5 acc 77.344 (77.714)	lr 0.01790
Train [43][3060/3239]	Time 0.231 (0.490)	Data Time 0.001 (0.013)	Loss 2.7297 (2.8535)	Entropy 0.63961 (0.63941)	Top-1 acc 56.641 (55.314)	Top-5 acc 81.250 (77.712)	lr 0.01790
Train [43][3070/3239]	Time 0.229 (0.490)	Data Time 0.001 (0.013)	Loss 2.9070 (2.8535)	Entropy 0.63972 (0.63941)	Top-1 acc 51.953 (55.318)	Top-5 acc 76.953 (77.710)	lr 0.01790
Train [43][3080/3239]	Time 0.242 (0.490)	Data Time 0.001 (0.013)	Loss 3.0578 (2.8537)	Entropy 0.63990 (0.63941)	Top-1 acc 49.609 (55.317)	Top-5 acc 73.438 (77.709)	lr 0.01790
Train [43][3090/3239]	Time 0.226 (0.490)	Data Time 0.001 (0.013)	Loss 2.7806 (2.8537)	Entropy 0.63941 (0.63941)	Top-1 acc 58.594 (55.316)	Top-5 acc 78.125 (77.710)	lr 0.01790
Train [43][3100/3239]	Time 0.331 (0.490)	Data Time 0.001 (0.013)	Loss 3.0208 (2.8538)	Entropy 0.63921 (0.63941)	Top-1 acc 48.438 (55.311)	Top-5 acc 72.266 (77.706)	lr 0.01789
Train [43][3110/3239]	Time 0.226 (0.489)	Data Time 0.001 (0.013)	Loss 3.0455 (2.8537)	Entropy 0.63897 (0.63941)	Top-1 acc 51.953 (55.313)	Top-5 acc 72.656 (77.709)	lr 0.01789
Train [43][3120/3239]	Time 0.226 (0.489)	Data Time 0.001 (0.013)	Loss 2.7529 (2.8538)	Entropy 0.63920 (0.63940)	Top-1 acc 55.859 (55.313)	Top-5 acc 78.516 (77.707)	lr 0.01789
Train [43][3130/3239]	Time 0.230 (0.489)	Data Time 0.001 (0.013)	Loss 3.0064 (2.8537)	Entropy 0.63944 (0.63940)	Top-1 acc 49.609 (55.318)	Top-5 acc 73.047 (77.708)	lr 0.01789
Train [43][3140/3239]	Time 0.231 (0.488)	Data Time 0.001 (0.012)	Loss 3.0228 (2.8537)	Entropy 0.63946 (0.63940)	Top-1 acc 50.781 (55.316)	Top-5 acc 71.484 (77.708)	lr 0.01789
Train [43][3150/3239]	Time 0.246 (0.488)	Data Time 0.001 (0.012)	Loss 2.7795 (2.8535)	Entropy 0.63913 (0.63940)	Top-1 acc 55.859 (55.318)	Top-5 acc 81.250 (77.709)	lr 0.01789
Train [43][3160/3239]	Time 0.243 (0.488)	Data Time 0.001 (0.012)	Loss 2.8140 (2.8534)	Entropy 0.63907 (0.63940)	Top-1 acc 59.375 (55.322)	Top-5 acc 78.906 (77.710)	lr 0.01789
Train [43][3170/3239]	Time 0.226 (0.488)	Data Time 0.001 (0.012)	Loss 2.8592 (2.8535)	Entropy 0.63932 (0.63940)	Top-1 acc 55.078 (55.318)	Top-5 acc 77.344 (77.709)	lr 0.01789
Train [43][3180/3239]	Time 0.228 (0.488)	Data Time 0.000 (0.012)	Loss 2.7730 (2.8536)	Entropy 0.63930 (0.63940)	Top-1 acc 57.812 (55.321)	Top-5 acc 78.125 (77.706)	lr 0.01789
Train [43][3190/3239]	Time 0.314 (0.487)	Data Time 0.000 (0.012)	Loss 3.0040 (2.8536)	Entropy 0.63907 (0.63940)	Top-1 acc 55.078 (55.319)	Top-5 acc 74.219 (77.705)	lr 0.01789
Train [43][3200/3239]	Time 0.232 (0.487)	Data Time 0.000 (0.012)	Loss 2.9471 (2.8537)	Entropy 0.63935 (0.63940)	Top-1 acc 51.172 (55.314)	Top-5 acc 75.391 (77.705)	lr 0.01789
Train [43][3210/3239]	Time 0.225 (0.487)	Data Time 0.000 (0.012)	Loss 2.7449 (2.8538)	Entropy 0.63912 (0.63940)	Top-1 acc 58.203 (55.314)	Top-5 acc 78.906 (77.704)	lr 0.01788
Train [43][3220/3239]	Time 0.234 (0.486)	Data Time 0.000 (0.012)	Loss 2.8201 (2.8537)	Entropy 0.63919 (0.63940)	Top-1 acc 57.031 (55.312)	Top-5 acc 77.734 (77.706)	lr 0.01788
Train [43][3230/3239]	Time 0.226 (0.486)	Data Time 0.000 (0.012)	Loss 2.7532 (2.8536)	Entropy 0.63879 (0.63940)	Top-1 acc 59.375 (55.314)	Top-5 acc 78.516 (77.705)	lr 0.01788
Train [43][3239/3239]	Time 0.914 (0.486)	Data Time 0.000 (0.012)	Loss 3.2239 (2.8536)	Entropy 0.63867 (0.63940)	Top-1 acc 45.679 (55.315)	Top-5 acc 71.605 (77.704)	lr 0.01788
==========Valid [43/120]	loss 1.575	top-1 acc 63.935 (63.947)	top-5 acc 85.089	Train top-1 55.315	top-5 77.704	Entropy 0.63867	Latency-None: 0.000ms	Flops: 539.76M
Train [44][0/3239]	Time 32.968 (32.968)	Data Time 31.124 (31.124)	Loss 2.7655 (2.7655)	Entropy 0.63872 (0.63872)	Top-1 acc 58.984 (58.984)	Top-5 acc 80.078 (80.078)	lr 0.01788
Train [44][10/3239]	Time 0.232 (3.476)	Data Time 0.001 (2.831)	Loss 2.8325 (2.8421)	Entropy 0.63873 (0.63863)	Top-1 acc 57.812 (55.824)	Top-5 acc 76.953 (78.161)	lr 0.01788
Train [44][20/3239]	Time 0.397 (2.029)	Data Time 0.001 (1.484)	Loss 2.7395 (2.8083)	Entropy 0.63885 (0.63873)	Top-1 acc 58.594 (56.287)	Top-5 acc 81.250 (78.646)	lr 0.01788
Train [44][30/3239]	Time 0.234 (1.509)	Data Time 0.001 (1.006)	Loss 2.9000 (2.8171)	Entropy 0.63886 (0.63879)	Top-1 acc 51.562 (55.910)	Top-5 acc 76.172 (78.352)	lr 0.01788
Train [44][40/3239]	Time 0.232 (1.245)	Data Time 0.001 (0.761)	Loss 2.9068 (2.8243)	Entropy 0.63874 (0.63879)	Top-1 acc 53.125 (55.859)	Top-5 acc 76.172 (78.230)	lr 0.01788
Train [44][50/3239]	Time 0.237 (1.085)	Data Time 0.001 (0.612)	Loss 2.7449 (2.8293)	Entropy 0.63883 (0.63877)	Top-1 acc 57.031 (55.722)	Top-5 acc 78.125 (78.163)	lr 0.01788
Train [44][60/3239]	Time 0.226 (0.978)	Data Time 0.001 (0.512)	Loss 2.8394 (2.8199)	Entropy 0.63901 (0.63879)	Top-1 acc 55.859 (55.789)	Top-5 acc 75.781 (78.356)	lr 0.01788
Train [44][70/3239]	Time 0.232 (0.900)	Data Time 0.001 (0.440)	Loss 2.7110 (2.8201)	Entropy 0.63935 (0.63884)	Top-1 acc 56.641 (55.837)	Top-5 acc 80.469 (78.257)	lr 0.01788
Train [44][80/3239]	Time 0.233 (0.841)	Data Time 0.001 (0.386)	Loss 3.0144 (2.8293)	Entropy 0.63903 (0.63889)	Top-1 acc 51.953 (55.724)	Top-5 acc 70.703 (78.038)	lr 0.01787
Train [44][90/3239]	Time 0.322 (0.796)	Data Time 0.001 (0.344)	Loss 2.7737 (2.8258)	Entropy 0.63898 (0.63890)	Top-1 acc 58.203 (55.812)	Top-5 acc 79.297 (78.177)	lr 0.01787
Train [44][100/3239]	Time 0.235 (0.759)	Data Time 0.001 (0.310)	Loss 2.6998 (2.8231)	Entropy 0.63858 (0.63890)	Top-1 acc 57.031 (55.856)	Top-5 acc 80.078 (78.206)	lr 0.01787
Train [44][110/3239]	Time 0.246 (0.728)	Data Time 0.001 (0.282)	Loss 2.8238 (2.8208)	Entropy 0.63857 (0.63888)	Top-1 acc 56.641 (55.902)	Top-5 acc 78.125 (78.269)	lr 0.01787
Train [44][120/3239]	Time 0.240 (0.703)	Data Time 0.001 (0.259)	Loss 2.8340 (2.8190)	Entropy 0.63859 (0.63886)	Top-1 acc 55.469 (55.956)	Top-5 acc 79.297 (78.315)	lr 0.01787
Train [44][130/3239]	Time 0.228 (0.682)	Data Time 0.001 (0.240)	Loss 3.0018 (2.8225)	Entropy 0.63849 (0.63883)	Top-1 acc 51.562 (55.937)	Top-5 acc 76.562 (78.286)	lr 0.01787
Train [44][140/3239]	Time 0.242 (0.663)	Data Time 0.001 (0.223)	Loss 2.8162 (2.8213)	Entropy 0.63842 (0.63880)	Top-1 acc 55.859 (55.981)	Top-5 acc 82.031 (78.286)	lr 0.01787
Train [44][150/3239]	Time 0.240 (0.648)	Data Time 0.001 (0.208)	Loss 3.0992 (2.8244)	Entropy 0.63833 (0.63877)	Top-1 acc 47.266 (55.890)	Top-5 acc 75.781 (78.244)	lr 0.01787
Train [44][160/3239]	Time 0.236 (0.635)	Data Time 0.001 (0.195)	Loss 2.8670 (2.8255)	Entropy 0.63809 (0.63875)	Top-1 acc 52.344 (55.872)	Top-5 acc 78.125 (78.210)	lr 0.01787
Train [44][170/3239]	Time 0.272 (0.810)	Data Time 0.002 (0.184)	Loss 2.7593 (2.8269)	Entropy 0.63806 (0.63871)	Top-1 acc 55.469 (55.839)	Top-5 acc 78.125 (78.109)	lr 0.01787
Train [44][180/3239]	Time 0.383 (0.790)	Data Time 0.002 (0.174)	Loss 2.8238 (2.8275)	Entropy 0.63818 (0.63867)	Top-1 acc 55.859 (55.857)	Top-5 acc 74.609 (78.114)	lr 0.01786
Train [44][190/3239]	Time 0.247 (0.772)	Data Time 0.001 (0.165)	Loss 2.9148 (2.8290)	Entropy 0.63820 (0.63865)	Top-1 acc 53.125 (55.786)	Top-5 acc 73.438 (78.039)	lr 0.01786
Train [44][200/3239]	Time 0.245 (0.755)	Data Time 0.001 (0.157)	Loss 2.7023 (2.8293)	Entropy 0.63830 (0.63863)	Top-1 acc 56.641 (55.780)	Top-5 acc 80.469 (78.024)	lr 0.01786
Train [44][210/3239]	Time 0.276 (0.741)	Data Time 0.002 (0.150)	Loss 3.0807 (2.8315)	Entropy 0.63792 (0.63861)	Top-1 acc 50.000 (55.717)	Top-5 acc 74.609 (77.977)	lr 0.01786
Train [44][220/3239]	Time 0.291 (0.729)	Data Time 0.001 (0.143)	Loss 2.8280 (2.8329)	Entropy 0.63812 (0.63858)	Top-1 acc 58.984 (55.693)	Top-5 acc 79.688 (77.959)	lr 0.01786
Train [44][230/3239]	Time 0.238 (0.716)	Data Time 0.001 (0.137)	Loss 2.7352 (2.8336)	Entropy 0.63768 (0.63856)	Top-1 acc 62.500 (55.716)	Top-5 acc 76.562 (77.932)	lr 0.01786
Train [44][240/3239]	Time 0.237 (0.705)	Data Time 0.002 (0.131)	Loss 2.9067 (2.8321)	Entropy 0.63779 (0.63852)	Top-1 acc 55.078 (55.777)	Top-5 acc 78.516 (77.969)	lr 0.01786
Train [44][250/3239]	Time 0.349 (0.694)	Data Time 0.003 (0.126)	Loss 2.9525 (2.8349)	Entropy 0.63803 (0.63849)	Top-1 acc 52.734 (55.702)	Top-5 acc 76.172 (77.924)	lr 0.01786
Train [44][260/3239]	Time 0.223 (0.684)	Data Time 0.001 (0.121)	Loss 2.8710 (2.8378)	Entropy 0.63829 (0.63848)	Top-1 acc 53.906 (55.644)	Top-5 acc 76.953 (77.857)	lr 0.01786
Train [44][270/3239]	Time 0.268 (0.675)	Data Time 0.001 (0.117)	Loss 2.7725 (2.8348)	Entropy 0.63833 (0.63847)	Top-1 acc 58.203 (55.743)	Top-5 acc 79.688 (77.906)	lr 0.01786
Train [44][280/3239]	Time 0.242 (0.667)	Data Time 0.001 (0.113)	Loss 2.8109 (2.8322)	Entropy 0.63840 (0.63847)	Top-1 acc 53.516 (55.783)	Top-5 acc 79.297 (77.935)	lr 0.01786
Train [44][290/3239]	Time 0.239 (0.658)	Data Time 0.001 (0.109)	Loss 2.5962 (2.8323)	Entropy 0.63821 (0.63846)	Top-1 acc 58.594 (55.775)	Top-5 acc 81.250 (77.933)	lr 0.01785
Train [44][300/3239]	Time 0.226 (0.651)	Data Time 0.001 (0.105)	Loss 2.7835 (2.8334)	Entropy 0.63808 (0.63845)	Top-1 acc 53.906 (55.718)	Top-5 acc 81.250 (77.929)	lr 0.01785
Train [44][310/3239]	Time 0.244 (0.644)	Data Time 0.001 (0.102)	Loss 2.7584 (2.8349)	Entropy 0.63828 (0.63844)	Top-1 acc 58.203 (55.660)	Top-5 acc 78.906 (77.894)	lr 0.01785
Train [44][320/3239]	Time 0.247 (0.638)	Data Time 0.001 (0.099)	Loss 2.5714 (2.8323)	Entropy 0.63849 (0.63844)	Top-1 acc 60.547 (55.729)	Top-5 acc 84.375 (77.950)	lr 0.01785
Train [44][330/3239]	Time 0.233 (0.632)	Data Time 0.001 (0.096)	Loss 2.7145 (2.8309)	Entropy 0.63872 (0.63844)	Top-1 acc 59.375 (55.760)	Top-5 acc 82.422 (77.982)	lr 0.01785
Train [44][340/3239]	Time 0.340 (0.626)	Data Time 0.001 (0.093)	Loss 2.6185 (2.8287)	Entropy 0.63847 (0.63845)	Top-1 acc 61.328 (55.801)	Top-5 acc 83.594 (78.041)	lr 0.01785
Train [44][350/3239]	Time 0.236 (0.620)	Data Time 0.005 (0.091)	Loss 2.8147 (2.8284)	Entropy 0.63879 (0.63845)	Top-1 acc 57.422 (55.826)	Top-5 acc 79.688 (78.054)	lr 0.01785
Train [44][360/3239]	Time 0.252 (0.615)	Data Time 0.001 (0.088)	Loss 2.5446 (2.8271)	Entropy 0.63885 (0.63846)	Top-1 acc 63.672 (55.854)	Top-5 acc 80.859 (78.063)	lr 0.01785
Train [44][370/3239]	Time 0.240 (0.611)	Data Time 0.001 (0.086)	Loss 2.7161 (2.8281)	Entropy 0.63887 (0.63847)	Top-1 acc 58.203 (55.793)	Top-5 acc 83.203 (78.072)	lr 0.01785
Train [44][380/3239]	Time 0.233 (0.606)	Data Time 0.001 (0.084)	Loss 2.8593 (2.8275)	Entropy 0.63892 (0.63848)	Top-1 acc 55.078 (55.804)	Top-5 acc 72.266 (78.075)	lr 0.01785
Train [44][390/3239]	Time 0.255 (0.601)	Data Time 0.001 (0.082)	Loss 2.8913 (2.8286)	Entropy 0.63905 (0.63849)	Top-1 acc 54.297 (55.791)	Top-5 acc 79.297 (78.062)	lr 0.01785
Train [44][400/3239]	Time 0.237 (0.597)	Data Time 0.001 (0.080)	Loss 2.7711 (2.8288)	Entropy 0.63903 (0.63851)	Top-1 acc 58.984 (55.821)	Top-5 acc 79.688 (78.067)	lr 0.01784
Train [44][410/3239]	Time 0.418 (0.594)	Data Time 0.001 (0.078)	Loss 2.8082 (2.8291)	Entropy 0.63894 (0.63852)	Top-1 acc 51.172 (55.776)	Top-5 acc 77.734 (78.068)	lr 0.01784
Train [44][420/3239]	Time 0.267 (0.591)	Data Time 0.002 (0.076)	Loss 2.7793 (2.8282)	Entropy 0.63899 (0.63853)	Top-1 acc 57.422 (55.796)	Top-5 acc 78.906 (78.088)	lr 0.01784
Train [44][430/3239]	Time 0.257 (0.587)	Data Time 0.001 (0.074)	Loss 2.6317 (2.8273)	Entropy 0.63902 (0.63854)	Top-1 acc 59.375 (55.811)	Top-5 acc 80.078 (78.103)	lr 0.01784
Train [44][440/3239]	Time 0.239 (0.584)	Data Time 0.001 (0.072)	Loss 2.7216 (2.8278)	Entropy 0.63924 (0.63856)	Top-1 acc 59.375 (55.809)	Top-5 acc 79.297 (78.089)	lr 0.01784
Train [44][450/3239]	Time 0.239 (0.581)	Data Time 0.001 (0.071)	Loss 2.7244 (2.8275)	Entropy 0.63924 (0.63857)	Top-1 acc 57.812 (55.817)	Top-5 acc 78.516 (78.096)	lr 0.01784
Train [44][460/3239]	Time 0.278 (0.578)	Data Time 0.001 (0.069)	Loss 2.8398 (2.8280)	Entropy 0.63923 (0.63858)	Top-1 acc 57.812 (55.817)	Top-5 acc 76.562 (78.106)	lr 0.01784
Train [44][470/3239]	Time 0.256 (0.574)	Data Time 0.001 (0.068)	Loss 2.6432 (2.8276)	Entropy 0.63936 (0.63860)	Top-1 acc 60.547 (55.833)	Top-5 acc 78.906 (78.106)	lr 0.01784
Train [44][480/3239]	Time 0.341 (0.572)	Data Time 0.001 (0.067)	Loss 2.8424 (2.8270)	Entropy 0.63915 (0.63861)	Top-1 acc 55.078 (55.867)	Top-5 acc 78.906 (78.127)	lr 0.01784
Train [44][490/3239]	Time 0.230 (0.569)	Data Time 0.001 (0.065)	Loss 2.7112 (2.8274)	Entropy 0.63916 (0.63862)	Top-1 acc 55.469 (55.855)	Top-5 acc 78.906 (78.119)	lr 0.01784
Train [44][500/3239]	Time 0.243 (0.566)	Data Time 0.002 (0.064)	Loss 2.8586 (2.8267)	Entropy 0.63932 (0.63863)	Top-1 acc 55.078 (55.878)	Top-5 acc 78.516 (78.117)	lr 0.01784
Train [44][510/3239]	Time 0.265 (0.564)	Data Time 0.001 (0.063)	Loss 3.0123 (2.8285)	Entropy 0.63910 (0.63865)	Top-1 acc 53.516 (55.854)	Top-5 acc 73.828 (78.079)	lr 0.01783
Train [44][520/3239]	Time 0.273 (0.561)	Data Time 0.001 (0.062)	Loss 2.7423 (2.8290)	Entropy 0.63895 (0.63866)	Top-1 acc 58.203 (55.849)	Top-5 acc 80.078 (78.058)	lr 0.01783
Train [44][530/3239]	Time 0.237 (0.559)	Data Time 0.001 (0.060)	Loss 2.9767 (2.8300)	Entropy 0.63888 (0.63866)	Top-1 acc 52.344 (55.818)	Top-5 acc 77.734 (78.038)	lr 0.01783
Train [44][540/3239]	Time 0.240 (0.557)	Data Time 0.001 (0.059)	Loss 2.8356 (2.8295)	Entropy 0.63888 (0.63866)	Top-1 acc 54.297 (55.829)	Top-5 acc 78.125 (78.054)	lr 0.01783
Train [44][550/3239]	Time 0.280 (0.555)	Data Time 0.002 (0.058)	Loss 2.8341 (2.8287)	Entropy 0.63906 (0.63867)	Top-1 acc 54.297 (55.848)	Top-5 acc 79.688 (78.073)	lr 0.01783
Train [44][560/3239]	Time 0.250 (0.553)	Data Time 0.001 (0.057)	Loss 2.7298 (2.8285)	Entropy 0.63871 (0.63867)	Top-1 acc 60.938 (55.871)	Top-5 acc 78.125 (78.079)	lr 0.01783
Train [44][570/3239]	Time 0.344 (0.551)	Data Time 0.001 (0.056)	Loss 2.8507 (2.8288)	Entropy 0.63886 (0.63867)	Top-1 acc 57.031 (55.854)	Top-5 acc 78.125 (78.080)	lr 0.01783
Train [44][580/3239]	Time 0.260 (0.549)	Data Time 0.001 (0.055)	Loss 2.9132 (2.8290)	Entropy 0.63861 (0.63867)	Top-1 acc 51.172 (55.841)	Top-5 acc 77.734 (78.086)	lr 0.01783
Train [44][590/3239]	Time 0.249 (0.548)	Data Time 0.001 (0.054)	Loss 2.9650 (2.8290)	Entropy 0.63849 (0.63867)	Top-1 acc 54.688 (55.859)	Top-5 acc 72.656 (78.077)	lr 0.01783
Train [44][600/3239]	Time 0.304 (0.546)	Data Time 0.001 (0.054)	Loss 2.8439 (2.8286)	Entropy 0.63826 (0.63867)	Top-1 acc 55.859 (55.864)	Top-5 acc 78.906 (78.094)	lr 0.01783
Train [44][610/3239]	Time 0.249 (0.545)	Data Time 0.001 (0.053)	Loss 2.6922 (2.8286)	Entropy 0.63810 (0.63866)	Top-1 acc 59.375 (55.873)	Top-5 acc 79.297 (78.090)	lr 0.01783
Train [44][620/3239]	Time 0.266 (0.543)	Data Time 0.001 (0.052)	Loss 2.8233 (2.8284)	Entropy 0.63818 (0.63865)	Top-1 acc 57.812 (55.864)	Top-5 acc 76.172 (78.090)	lr 0.01782
Train [44][630/3239]	Time 0.227 (0.542)	Data Time 0.001 (0.051)	Loss 2.8909 (2.8283)	Entropy 0.63850 (0.63865)	Top-1 acc 54.688 (55.875)	Top-5 acc 80.469 (78.092)	lr 0.01782
Train [44][640/3239]	Time 0.451 (0.542)	Data Time 0.001 (0.050)	Loss 2.7283 (2.8272)	Entropy 0.63866 (0.63864)	Top-1 acc 58.203 (55.915)	Top-5 acc 80.469 (78.122)	lr 0.01782
Train [44][650/3239]	Time 0.256 (0.540)	Data Time 0.001 (0.050)	Loss 2.8422 (2.8267)	Entropy 0.63853 (0.63864)	Top-1 acc 55.859 (55.928)	Top-5 acc 77.734 (78.127)	lr 0.01782
Train [44][660/3239]	Time 0.250 (0.539)	Data Time 0.001 (0.049)	Loss 2.9787 (2.8274)	Entropy 0.63840 (0.63864)	Top-1 acc 50.781 (55.907)	Top-5 acc 75.781 (78.111)	lr 0.01782
Train [44][670/3239]	Time 0.242 (0.538)	Data Time 0.001 (0.048)	Loss 2.9693 (2.8281)	Entropy 0.63832 (0.63864)	Top-1 acc 50.391 (55.896)	Top-5 acc 76.562 (78.094)	lr 0.01782
Train [44][680/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.048)	Loss 3.0041 (2.8274)	Entropy 0.63840 (0.63863)	Top-1 acc 51.953 (55.918)	Top-5 acc 73.047 (78.119)	lr 0.01782
Train [44][690/3239]	Time 0.227 (0.535)	Data Time 0.001 (0.047)	Loss 2.9448 (2.8276)	Entropy 0.63840 (0.63863)	Top-1 acc 54.297 (55.906)	Top-5 acc 76.562 (78.131)	lr 0.01782
Train [44][700/3239]	Time 0.247 (0.533)	Data Time 0.002 (0.046)	Loss 2.8190 (2.8275)	Entropy 0.63829 (0.63863)	Top-1 acc 53.516 (55.907)	Top-5 acc 79.688 (78.127)	lr 0.01782
Train [44][710/3239]	Time 0.267 (0.532)	Data Time 0.002 (0.046)	Loss 2.8620 (2.8275)	Entropy 0.63848 (0.63862)	Top-1 acc 56.250 (55.917)	Top-5 acc 77.344 (78.128)	lr 0.01782
Train [44][720/3239]	Time 0.240 (0.531)	Data Time 0.001 (0.045)	Loss 2.7387 (2.8270)	Entropy 0.63846 (0.63862)	Top-1 acc 58.203 (55.927)	Top-5 acc 81.641 (78.140)	lr 0.01782
Train [44][730/3239]	Time 0.302 (0.530)	Data Time 0.001 (0.044)	Loss 2.8738 (2.8277)	Entropy 0.63868 (0.63862)	Top-1 acc 52.344 (55.914)	Top-5 acc 76.953 (78.134)	lr 0.01781
Train [44][740/3239]	Time 0.254 (0.529)	Data Time 0.001 (0.044)	Loss 2.7415 (2.8280)	Entropy 0.63879 (0.63862)	Top-1 acc 60.547 (55.901)	Top-5 acc 80.859 (78.136)	lr 0.01781
Train [44][750/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.043)	Loss 2.9487 (2.8274)	Entropy 0.63910 (0.63862)	Top-1 acc 54.688 (55.912)	Top-5 acc 72.656 (78.146)	lr 0.01781
Train [44][760/3239]	Time 0.238 (0.526)	Data Time 0.001 (0.043)	Loss 3.0654 (2.8279)	Entropy 0.63914 (0.63863)	Top-1 acc 53.906 (55.915)	Top-5 acc 71.875 (78.134)	lr 0.01781
Train [44][770/3239]	Time 0.277 (0.525)	Data Time 0.001 (0.042)	Loss 3.0691 (2.8284)	Entropy 0.63896 (0.63863)	Top-1 acc 51.172 (55.911)	Top-5 acc 73.047 (78.127)	lr 0.01781
Train [44][780/3239]	Time 0.239 (0.524)	Data Time 0.001 (0.042)	Loss 2.9874 (2.8284)	Entropy 0.63911 (0.63864)	Top-1 acc 52.344 (55.903)	Top-5 acc 72.266 (78.119)	lr 0.01781
Train [44][790/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.041)	Loss 2.9347 (2.8289)	Entropy 0.63926 (0.63864)	Top-1 acc 52.734 (55.892)	Top-5 acc 76.172 (78.114)	lr 0.01781
Train [44][800/3239]	Time 0.377 (0.522)	Data Time 0.001 (0.041)	Loss 2.8890 (2.8296)	Entropy 0.63938 (0.63865)	Top-1 acc 57.812 (55.879)	Top-5 acc 77.344 (78.111)	lr 0.01781
Train [44][810/3239]	Time 0.258 (0.521)	Data Time 0.001 (0.040)	Loss 2.8033 (2.8297)	Entropy 0.63952 (0.63866)	Top-1 acc 57.422 (55.873)	Top-5 acc 78.516 (78.106)	lr 0.01781
Train [44][820/3239]	Time 0.425 (0.560)	Data Time 0.044 (0.040)	Loss 2.6326 (2.8293)	Entropy 0.63929 (0.63867)	Top-1 acc 58.203 (55.880)	Top-5 acc 80.078 (78.118)	lr 0.01781
Train [44][830/3239]	Time 0.255 (0.559)	Data Time 0.002 (0.039)	Loss 2.9305 (2.8296)	Entropy 0.63891 (0.63868)	Top-1 acc 55.078 (55.865)	Top-5 acc 75.391 (78.117)	lr 0.01781
Train [44][840/3239]	Time 0.340 (0.558)	Data Time 0.003 (0.039)	Loss 2.7688 (2.8295)	Entropy 0.63868 (0.63868)	Top-1 acc 60.156 (55.880)	Top-5 acc 78.125 (78.117)	lr 0.01780
Train [44][850/3239]	Time 0.267 (0.557)	Data Time 0.002 (0.038)	Loss 2.5910 (2.8298)	Entropy 0.63866 (0.63868)	Top-1 acc 59.766 (55.866)	Top-5 acc 83.594 (78.112)	lr 0.01780
Train [44][860/3239]	Time 0.271 (0.556)	Data Time 0.001 (0.038)	Loss 2.6803 (2.8291)	Entropy 0.63894 (0.63868)	Top-1 acc 59.766 (55.873)	Top-5 acc 76.953 (78.122)	lr 0.01780
Train [44][870/3239]	Time 0.318 (0.555)	Data Time 0.002 (0.038)	Loss 2.6908 (2.8283)	Entropy 0.63864 (0.63868)	Top-1 acc 56.250 (55.886)	Top-5 acc 77.734 (78.129)	lr 0.01780
Train [44][880/3239]	Time 0.239 (0.554)	Data Time 0.001 (0.037)	Loss 3.2193 (2.8286)	Entropy 0.63872 (0.63868)	Top-1 acc 46.094 (55.864)	Top-5 acc 70.312 (78.125)	lr 0.01780
Train [44][890/3239]	Time 0.381 (0.553)	Data Time 0.001 (0.037)	Loss 2.7731 (2.8286)	Entropy 0.63889 (0.63868)	Top-1 acc 57.422 (55.852)	Top-5 acc 80.078 (78.124)	lr 0.01780
Train [44][900/3239]	Time 0.248 (0.552)	Data Time 0.001 (0.036)	Loss 2.8904 (2.8288)	Entropy 0.63847 (0.63868)	Top-1 acc 54.688 (55.848)	Top-5 acc 75.781 (78.124)	lr 0.01780
Train [44][910/3239]	Time 0.258 (0.551)	Data Time 0.009 (0.036)	Loss 2.6232 (2.8285)	Entropy 0.63813 (0.63868)	Top-1 acc 62.891 (55.863)	Top-5 acc 81.250 (78.134)	lr 0.01780
Train [44][920/3239]	Time 0.291 (0.550)	Data Time 0.003 (0.036)	Loss 2.9850 (2.8280)	Entropy 0.63831 (0.63868)	Top-1 acc 50.781 (55.881)	Top-5 acc 75.000 (78.138)	lr 0.01780
Train [44][930/3239]	Time 0.241 (0.549)	Data Time 0.001 (0.035)	Loss 2.8952 (2.8278)	Entropy 0.63831 (0.63867)	Top-1 acc 55.078 (55.888)	Top-5 acc 78.125 (78.149)	lr 0.01780
Train [44][940/3239]	Time 0.260 (0.548)	Data Time 0.001 (0.035)	Loss 2.7416 (2.8275)	Entropy 0.63799 (0.63867)	Top-1 acc 55.859 (55.893)	Top-5 acc 80.859 (78.156)	lr 0.01780
Train [44][950/3239]	Time 0.267 (0.547)	Data Time 0.001 (0.035)	Loss 2.9003 (2.8275)	Entropy 0.63771 (0.63866)	Top-1 acc 56.641 (55.902)	Top-5 acc 73.047 (78.149)	lr 0.01779
Train [44][960/3239]	Time 0.370 (0.547)	Data Time 0.001 (0.034)	Loss 2.9472 (2.8276)	Entropy 0.63785 (0.63865)	Top-1 acc 54.297 (55.908)	Top-5 acc 74.609 (78.144)	lr 0.01779
Train [44][970/3239]	Time 0.276 (0.546)	Data Time 0.001 (0.034)	Loss 2.9388 (2.8271)	Entropy 0.63786 (0.63864)	Top-1 acc 55.859 (55.916)	Top-5 acc 75.781 (78.160)	lr 0.01779
Train [44][980/3239]	Time 0.238 (0.546)	Data Time 0.001 (0.034)	Loss 2.7042 (2.8277)	Entropy 0.63764 (0.63863)	Top-1 acc 57.031 (55.909)	Top-5 acc 80.469 (78.142)	lr 0.01779
Train [44][990/3239]	Time 0.263 (0.545)	Data Time 0.003 (0.033)	Loss 3.2103 (2.8287)	Entropy 0.63762 (0.63862)	Top-1 acc 52.344 (55.891)	Top-5 acc 69.531 (78.122)	lr 0.01779
Train [44][1000/3239]	Time 0.316 (0.544)	Data Time 0.001 (0.033)	Loss 2.8355 (2.8288)	Entropy 0.63755 (0.63861)	Top-1 acc 52.734 (55.880)	Top-5 acc 75.781 (78.130)	lr 0.01779
Train [44][1010/3239]	Time 0.247 (0.543)	Data Time 0.001 (0.033)	Loss 2.8726 (2.8294)	Entropy 0.63756 (0.63860)	Top-1 acc 55.078 (55.871)	Top-5 acc 74.609 (78.120)	lr 0.01779
Train [44][1020/3239]	Time 0.255 (0.543)	Data Time 0.001 (0.032)	Loss 2.7866 (2.8292)	Entropy 0.63735 (0.63859)	Top-1 acc 56.641 (55.869)	Top-5 acc 79.688 (78.123)	lr 0.01779
Train [44][1030/3239]	Time 0.295 (0.542)	Data Time 0.001 (0.032)	Loss 2.9337 (2.8296)	Entropy 0.63759 (0.63858)	Top-1 acc 53.125 (55.864)	Top-5 acc 76.953 (78.114)	lr 0.01779
Train [44][1040/3239]	Time 0.250 (0.541)	Data Time 0.001 (0.032)	Loss 2.7779 (2.8298)	Entropy 0.63770 (0.63857)	Top-1 acc 58.203 (55.870)	Top-5 acc 78.125 (78.108)	lr 0.01779
Train [44][1050/3239]	Time 0.297 (0.541)	Data Time 0.002 (0.032)	Loss 2.7662 (2.8296)	Entropy 0.63760 (0.63856)	Top-1 acc 58.984 (55.885)	Top-5 acc 78.125 (78.113)	lr 0.01779
Train [44][1060/3239]	Time 0.254 (0.540)	Data Time 0.002 (0.031)	Loss 2.8792 (2.8291)	Entropy 0.63786 (0.63856)	Top-1 acc 54.297 (55.902)	Top-5 acc 78.125 (78.125)	lr 0.01778
Train [44][1070/3239]	Time 0.233 (0.540)	Data Time 0.001 (0.031)	Loss 2.7074 (2.8294)	Entropy 0.63751 (0.63855)	Top-1 acc 60.547 (55.897)	Top-5 acc 78.906 (78.123)	lr 0.01778
Train [44][1080/3239]	Time 0.256 (0.539)	Data Time 0.001 (0.031)	Loss 2.8239 (2.8296)	Entropy 0.63771 (0.63854)	Top-1 acc 56.250 (55.886)	Top-5 acc 80.469 (78.124)	lr 0.01778
Train [44][1090/3239]	Time 0.252 (0.538)	Data Time 0.002 (0.030)	Loss 2.8818 (2.8301)	Entropy 0.63746 (0.63853)	Top-1 acc 55.469 (55.870)	Top-5 acc 76.562 (78.116)	lr 0.01778
Train [44][1100/3239]	Time 0.279 (0.538)	Data Time 0.002 (0.030)	Loss 2.7547 (2.8295)	Entropy 0.63733 (0.63852)	Top-1 acc 55.859 (55.883)	Top-5 acc 80.078 (78.131)	lr 0.01778
Train [44][1110/3239]	Time 0.249 (0.538)	Data Time 0.001 (0.030)	Loss 2.7134 (2.8292)	Entropy 0.63764 (0.63851)	Top-1 acc 57.422 (55.879)	Top-5 acc 80.469 (78.130)	lr 0.01778
Train [44][1120/3239]	Time 0.348 (0.537)	Data Time 0.001 (0.030)	Loss 2.6801 (2.8296)	Entropy 0.63753 (0.63850)	Top-1 acc 61.328 (55.876)	Top-5 acc 81.250 (78.123)	lr 0.01778
Train [44][1130/3239]	Time 0.239 (0.536)	Data Time 0.001 (0.029)	Loss 2.8178 (2.8294)	Entropy 0.63755 (0.63849)	Top-1 acc 53.516 (55.878)	Top-5 acc 77.734 (78.131)	lr 0.01778
Train [44][1140/3239]	Time 0.242 (0.535)	Data Time 0.001 (0.029)	Loss 3.0569 (2.8300)	Entropy 0.63753 (0.63848)	Top-1 acc 50.391 (55.870)	Top-5 acc 71.094 (78.114)	lr 0.01778
Train [44][1150/3239]	Time 0.253 (0.535)	Data Time 0.001 (0.029)	Loss 3.0078 (2.8302)	Entropy 0.63777 (0.63848)	Top-1 acc 50.000 (55.864)	Top-5 acc 77.734 (78.115)	lr 0.01778
Train [44][1160/3239]	Time 0.284 (0.534)	Data Time 0.001 (0.029)	Loss 2.9026 (2.8307)	Entropy 0.63741 (0.63847)	Top-1 acc 53.516 (55.849)	Top-5 acc 75.781 (78.104)	lr 0.01778
Train [44][1170/3239]	Time 0.292 (0.534)	Data Time 0.003 (0.028)	Loss 2.7286 (2.8301)	Entropy 0.63763 (0.63846)	Top-1 acc 59.375 (55.857)	Top-5 acc 79.688 (78.117)	lr 0.01777
Train [44][1180/3239]	Time 0.266 (0.533)	Data Time 0.001 (0.028)	Loss 2.6817 (2.8297)	Entropy 0.63772 (0.63845)	Top-1 acc 59.375 (55.869)	Top-5 acc 80.469 (78.126)	lr 0.01777
Train [44][1190/3239]	Time 0.350 (0.532)	Data Time 0.001 (0.028)	Loss 2.7631 (2.8296)	Entropy 0.63801 (0.63845)	Top-1 acc 56.250 (55.878)	Top-5 acc 79.297 (78.131)	lr 0.01777
Train [44][1200/3239]	Time 0.236 (0.532)	Data Time 0.001 (0.028)	Loss 2.9935 (2.8298)	Entropy 0.63770 (0.63844)	Top-1 acc 51.172 (55.875)	Top-5 acc 74.609 (78.126)	lr 0.01777
Train [44][1210/3239]	Time 0.247 (0.531)	Data Time 0.001 (0.028)	Loss 2.9605 (2.8302)	Entropy 0.63749 (0.63844)	Top-1 acc 55.469 (55.862)	Top-5 acc 75.781 (78.126)	lr 0.01777
Train [44][1220/3239]	Time 0.239 (0.530)	Data Time 0.001 (0.027)	Loss 2.7080 (2.8302)	Entropy 0.63770 (0.63843)	Top-1 acc 58.984 (55.865)	Top-5 acc 80.469 (78.128)	lr 0.01777
Train [44][1230/3239]	Time 0.287 (0.530)	Data Time 0.001 (0.027)	Loss 2.8445 (2.8301)	Entropy 0.63773 (0.63842)	Top-1 acc 59.766 (55.868)	Top-5 acc 75.781 (78.131)	lr 0.01777
Train [44][1240/3239]	Time 0.254 (0.529)	Data Time 0.001 (0.027)	Loss 2.7956 (2.8299)	Entropy 0.63762 (0.63842)	Top-1 acc 56.641 (55.868)	Top-5 acc 78.906 (78.137)	lr 0.01777
Train [44][1250/3239]	Time 0.240 (0.529)	Data Time 0.001 (0.027)	Loss 2.9158 (2.8299)	Entropy 0.63757 (0.63841)	Top-1 acc 50.391 (55.864)	Top-5 acc 75.781 (78.137)	lr 0.01777
Train [44][1260/3239]	Time 0.230 (0.528)	Data Time 0.001 (0.027)	Loss 2.9939 (2.8297)	Entropy 0.63748 (0.63840)	Top-1 acc 51.953 (55.871)	Top-5 acc 75.781 (78.131)	lr 0.01777
Train [44][1270/3239]	Time 0.244 (0.527)	Data Time 0.001 (0.026)	Loss 2.6646 (2.8294)	Entropy 0.63746 (0.63840)	Top-1 acc 61.719 (55.890)	Top-5 acc 78.906 (78.132)	lr 0.01777
Train [44][1280/3239]	Time 0.354 (0.526)	Data Time 0.001 (0.026)	Loss 2.8386 (2.8289)	Entropy 0.63748 (0.63839)	Top-1 acc 55.078 (55.894)	Top-5 acc 77.734 (78.147)	lr 0.01776
Train [44][1290/3239]	Time 0.224 (0.526)	Data Time 0.001 (0.026)	Loss 2.8772 (2.8294)	Entropy 0.63748 (0.63838)	Top-1 acc 55.078 (55.883)	Top-5 acc 79.688 (78.133)	lr 0.01776
Train [44][1300/3239]	Time 0.265 (0.525)	Data Time 0.001 (0.026)	Loss 2.8920 (2.8289)	Entropy 0.63758 (0.63838)	Top-1 acc 55.859 (55.895)	Top-5 acc 76.562 (78.142)	lr 0.01776
Train [44][1310/3239]	Time 0.277 (0.525)	Data Time 0.001 (0.026)	Loss 2.9999 (2.8296)	Entropy 0.63738 (0.63837)	Top-1 acc 53.906 (55.881)	Top-5 acc 75.000 (78.126)	lr 0.01776
Train [44][1320/3239]	Time 0.245 (0.524)	Data Time 0.001 (0.025)	Loss 2.8350 (2.8295)	Entropy 0.63756 (0.63836)	Top-1 acc 52.734 (55.883)	Top-5 acc 79.688 (78.126)	lr 0.01776
Train [44][1330/3239]	Time 0.269 (0.524)	Data Time 0.001 (0.025)	Loss 2.7063 (2.8289)	Entropy 0.63737 (0.63835)	Top-1 acc 52.734 (55.883)	Top-5 acc 80.859 (78.140)	lr 0.01776
Train [44][1340/3239]	Time 0.270 (0.523)	Data Time 0.001 (0.025)	Loss 2.8297 (2.8287)	Entropy 0.63711 (0.63835)	Top-1 acc 55.469 (55.889)	Top-5 acc 77.344 (78.134)	lr 0.01776
Train [44][1350/3239]	Time 0.390 (0.523)	Data Time 0.001 (0.025)	Loss 2.9442 (2.8289)	Entropy 0.63725 (0.63834)	Top-1 acc 53.125 (55.883)	Top-5 acc 79.297 (78.131)	lr 0.01776
Train [44][1360/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.025)	Loss 2.9264 (2.8293)	Entropy 0.63722 (0.63833)	Top-1 acc 53.516 (55.864)	Top-5 acc 74.609 (78.121)	lr 0.01776
Train [44][1370/3239]	Time 0.276 (0.522)	Data Time 0.002 (0.025)	Loss 2.6606 (2.8297)	Entropy 0.63734 (0.63832)	Top-1 acc 61.328 (55.861)	Top-5 acc 80.859 (78.117)	lr 0.01776
Train [44][1380/3239]	Time 0.246 (0.521)	Data Time 0.001 (0.024)	Loss 2.9541 (2.8299)	Entropy 0.63713 (0.63831)	Top-1 acc 54.297 (55.865)	Top-5 acc 75.000 (78.108)	lr 0.01776
Train [44][1390/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.024)	Loss 3.3825 (2.8299)	Entropy 0.63740 (0.63831)	Top-1 acc 42.188 (55.863)	Top-5 acc 67.188 (78.108)	lr 0.01775
Train [44][1400/3239]	Time 0.275 (0.520)	Data Time 0.002 (0.024)	Loss 2.7655 (2.8298)	Entropy 0.63764 (0.63830)	Top-1 acc 60.547 (55.862)	Top-5 acc 76.953 (78.112)	lr 0.01775
Train [44][1410/3239]	Time 0.247 (0.520)	Data Time 0.001 (0.024)	Loss 2.9339 (2.8298)	Entropy 0.63737 (0.63829)	Top-1 acc 53.125 (55.865)	Top-5 acc 74.609 (78.115)	lr 0.01775
Train [44][1420/3239]	Time 0.247 (0.519)	Data Time 0.001 (0.024)	Loss 2.7324 (2.8300)	Entropy 0.63715 (0.63829)	Top-1 acc 57.422 (55.852)	Top-5 acc 76.953 (78.108)	lr 0.01775
Train [44][1430/3239]	Time 0.264 (0.519)	Data Time 0.002 (0.024)	Loss 2.9288 (2.8299)	Entropy 0.63708 (0.63828)	Top-1 acc 55.469 (55.856)	Top-5 acc 75.000 (78.110)	lr 0.01775
Train [44][1440/3239]	Time 0.273 (0.518)	Data Time 0.001 (0.023)	Loss 2.7273 (2.8298)	Entropy 0.63729 (0.63827)	Top-1 acc 60.547 (55.860)	Top-5 acc 80.859 (78.117)	lr 0.01775
Train [44][1450/3239]	Time 0.237 (0.518)	Data Time 0.001 (0.023)	Loss 3.0489 (2.8298)	Entropy 0.63746 (0.63826)	Top-1 acc 50.000 (55.861)	Top-5 acc 75.000 (78.117)	lr 0.01775
Train [44][1460/3239]	Time 0.273 (0.517)	Data Time 0.001 (0.023)	Loss 2.8342 (2.8302)	Entropy 0.63734 (0.63826)	Top-1 acc 55.078 (55.853)	Top-5 acc 77.734 (78.109)	lr 0.01775
Train [44][1470/3239]	Time 0.255 (0.517)	Data Time 0.001 (0.023)	Loss 2.6927 (2.8304)	Entropy 0.63757 (0.63825)	Top-1 acc 61.719 (55.851)	Top-5 acc 78.906 (78.104)	lr 0.01775
Train [44][1480/3239]	Time 0.366 (0.540)	Data Time 0.003 (0.023)	Loss 2.8936 (2.8305)	Entropy 0.63732 (0.63825)	Top-1 acc 55.469 (55.850)	Top-5 acc 76.953 (78.102)	lr 0.01775
Train [44][1490/3239]	Time 0.242 (0.539)	Data Time 0.002 (0.023)	Loss 2.8793 (2.8308)	Entropy 0.63730 (0.63824)	Top-1 acc 51.562 (55.843)	Top-5 acc 76.172 (78.097)	lr 0.01775
Train [44][1500/3239]	Time 0.276 (0.539)	Data Time 0.001 (0.023)	Loss 2.7772 (2.8307)	Entropy 0.63735 (0.63823)	Top-1 acc 59.375 (55.846)	Top-5 acc 80.469 (78.100)	lr 0.01774
Train [44][1510/3239]	Time 0.384 (0.538)	Data Time 0.002 (0.023)	Loss 2.9104 (2.8308)	Entropy 0.63726 (0.63823)	Top-1 acc 56.641 (55.853)	Top-5 acc 78.125 (78.098)	lr 0.01774
Train [44][1520/3239]	Time 0.240 (0.538)	Data Time 0.001 (0.022)	Loss 2.9704 (2.8309)	Entropy 0.63719 (0.63822)	Top-1 acc 53.516 (55.849)	Top-5 acc 77.344 (78.096)	lr 0.01774
Train [44][1530/3239]	Time 0.256 (0.537)	Data Time 0.001 (0.022)	Loss 2.7931 (2.8312)	Entropy 0.63731 (0.63822)	Top-1 acc 53.516 (55.841)	Top-5 acc 78.906 (78.094)	lr 0.01774
Train [44][1540/3239]	Time 0.326 (0.537)	Data Time 0.002 (0.022)	Loss 2.9753 (2.8316)	Entropy 0.63713 (0.63821)	Top-1 acc 53.906 (55.827)	Top-5 acc 76.953 (78.084)	lr 0.01774
Train [44][1550/3239]	Time 0.255 (0.536)	Data Time 0.001 (0.022)	Loss 2.8213 (2.8315)	Entropy 0.63703 (0.63820)	Top-1 acc 56.250 (55.828)	Top-5 acc 79.297 (78.085)	lr 0.01774
Train [44][1560/3239]	Time 0.303 (0.536)	Data Time 0.001 (0.022)	Loss 2.8866 (2.8316)	Entropy 0.63737 (0.63819)	Top-1 acc 54.297 (55.829)	Top-5 acc 79.297 (78.086)	lr 0.01774
Train [44][1570/3239]	Time 0.240 (0.536)	Data Time 0.002 (0.022)	Loss 2.8063 (2.8316)	Entropy 0.63752 (0.63819)	Top-1 acc 56.641 (55.822)	Top-5 acc 80.078 (78.090)	lr 0.01774
Train [44][1580/3239]	Time 0.248 (0.535)	Data Time 0.001 (0.022)	Loss 2.7113 (2.8316)	Entropy 0.63715 (0.63818)	Top-1 acc 60.547 (55.818)	Top-5 acc 83.594 (78.096)	lr 0.01774
Train [44][1590/3239]	Time 0.269 (0.535)	Data Time 0.001 (0.022)	Loss 2.8934 (2.8318)	Entropy 0.63757 (0.63818)	Top-1 acc 51.953 (55.815)	Top-5 acc 76.562 (78.092)	lr 0.01774
Train [44][1600/3239]	Time 0.299 (0.534)	Data Time 0.001 (0.021)	Loss 3.2264 (2.8316)	Entropy 0.63760 (0.63817)	Top-1 acc 46.484 (55.821)	Top-5 acc 68.359 (78.095)	lr 0.01774
Train [44][1610/3239]	Time 0.239 (0.534)	Data Time 0.001 (0.021)	Loss 2.7240 (2.8319)	Entropy 0.63770 (0.63817)	Top-1 acc 56.641 (55.808)	Top-5 acc 82.422 (78.094)	lr 0.01773
Train [44][1620/3239]	Time 0.254 (0.533)	Data Time 0.001 (0.021)	Loss 2.8719 (2.8319)	Entropy 0.63759 (0.63817)	Top-1 acc 53.125 (55.810)	Top-5 acc 76.953 (78.099)	lr 0.01773
Train [44][1630/3239]	Time 0.244 (0.533)	Data Time 0.001 (0.021)	Loss 3.0213 (2.8321)	Entropy 0.63757 (0.63816)	Top-1 acc 54.688 (55.801)	Top-5 acc 76.562 (78.103)	lr 0.01773
Train [44][1640/3239]	Time 0.269 (0.533)	Data Time 0.002 (0.021)	Loss 2.8948 (2.8323)	Entropy 0.63780 (0.63816)	Top-1 acc 53.906 (55.800)	Top-5 acc 77.344 (78.102)	lr 0.01773
Train [44][1650/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.021)	Loss 2.9329 (2.8325)	Entropy 0.63796 (0.63816)	Top-1 acc 55.469 (55.796)	Top-5 acc 75.000 (78.096)	lr 0.01773
Train [44][1660/3239]	Time 0.261 (0.532)	Data Time 0.001 (0.021)	Loss 2.7894 (2.8329)	Entropy 0.63776 (0.63816)	Top-1 acc 57.422 (55.792)	Top-5 acc 79.297 (78.084)	lr 0.01773
Train [44][1670/3239]	Time 0.367 (0.531)	Data Time 0.001 (0.021)	Loss 2.8206 (2.8335)	Entropy 0.63781 (0.63816)	Top-1 acc 54.297 (55.777)	Top-5 acc 78.906 (78.071)	lr 0.01773
Train [44][1680/3239]	Time 0.260 (0.531)	Data Time 0.002 (0.020)	Loss 2.8199 (2.8336)	Entropy 0.63772 (0.63815)	Top-1 acc 57.031 (55.770)	Top-5 acc 76.953 (78.067)	lr 0.01773
Train [44][1690/3239]	Time 0.251 (0.530)	Data Time 0.001 (0.020)	Loss 2.9169 (2.8338)	Entropy 0.63764 (0.63815)	Top-1 acc 53.125 (55.768)	Top-5 acc 77.734 (78.065)	lr 0.01773
Train [44][1700/3239]	Time 0.252 (0.530)	Data Time 0.001 (0.020)	Loss 2.6234 (2.8332)	Entropy 0.63726 (0.63815)	Top-1 acc 60.547 (55.787)	Top-5 acc 82.031 (78.072)	lr 0.01773
Train [44][1710/3239]	Time 0.248 (0.530)	Data Time 0.001 (0.020)	Loss 2.7590 (2.8334)	Entropy 0.63735 (0.63814)	Top-1 acc 53.516 (55.779)	Top-5 acc 80.078 (78.071)	lr 0.01772
Train [44][1720/3239]	Time 0.256 (0.529)	Data Time 0.001 (0.020)	Loss 2.7275 (2.8338)	Entropy 0.63716 (0.63814)	Top-1 acc 55.469 (55.767)	Top-5 acc 80.078 (78.064)	lr 0.01772
Train [44][1730/3239]	Time 0.240 (0.529)	Data Time 0.001 (0.020)	Loss 2.7494 (2.8337)	Entropy 0.63675 (0.63813)	Top-1 acc 56.641 (55.770)	Top-5 acc 81.641 (78.067)	lr 0.01772
Train [44][1740/3239]	Time 0.375 (0.528)	Data Time 0.001 (0.020)	Loss 2.8278 (2.8341)	Entropy 0.63669 (0.63812)	Top-1 acc 58.594 (55.772)	Top-5 acc 75.781 (78.059)	lr 0.01772
Train [44][1750/3239]	Time 0.248 (0.528)	Data Time 0.001 (0.020)	Loss 2.8845 (2.8340)	Entropy 0.63670 (0.63812)	Top-1 acc 53.125 (55.769)	Top-5 acc 75.000 (78.062)	lr 0.01772
Train [44][1760/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.020)	Loss 2.8083 (2.8341)	Entropy 0.63640 (0.63811)	Top-1 acc 55.078 (55.764)	Top-5 acc 79.688 (78.058)	lr 0.01772
Train [44][1770/3239]	Time 0.248 (0.527)	Data Time 0.001 (0.020)	Loss 3.0217 (2.8343)	Entropy 0.63676 (0.63810)	Top-1 acc 53.516 (55.764)	Top-5 acc 75.391 (78.055)	lr 0.01772
Train [44][1780/3239]	Time 0.235 (0.527)	Data Time 0.001 (0.019)	Loss 2.8232 (2.8342)	Entropy 0.63671 (0.63809)	Top-1 acc 57.422 (55.768)	Top-5 acc 79.688 (78.061)	lr 0.01772
Train [44][1790/3239]	Time 0.261 (0.527)	Data Time 0.001 (0.019)	Loss 2.6998 (2.8340)	Entropy 0.63641 (0.63808)	Top-1 acc 55.859 (55.776)	Top-5 acc 81.641 (78.063)	lr 0.01772
Train [44][1800/3239]	Time 0.258 (0.526)	Data Time 0.001 (0.019)	Loss 2.9680 (2.8340)	Entropy 0.63641 (0.63807)	Top-1 acc 48.438 (55.774)	Top-5 acc 77.344 (78.062)	lr 0.01772
Train [44][1810/3239]	Time 0.262 (0.526)	Data Time 0.002 (0.019)	Loss 2.7596 (2.8338)	Entropy 0.63631 (0.63806)	Top-1 acc 58.594 (55.772)	Top-5 acc 78.516 (78.067)	lr 0.01772
Train [44][1820/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.019)	Loss 2.7585 (2.8339)	Entropy 0.63624 (0.63805)	Top-1 acc 58.594 (55.775)	Top-5 acc 80.469 (78.071)	lr 0.01771
Train [44][1830/3239]	Time 0.358 (0.525)	Data Time 0.001 (0.019)	Loss 3.0400 (2.8343)	Entropy 0.63652 (0.63804)	Top-1 acc 51.562 (55.767)	Top-5 acc 76.172 (78.072)	lr 0.01771
Train [44][1840/3239]	Time 0.275 (0.524)	Data Time 0.001 (0.019)	Loss 2.6962 (2.8342)	Entropy 0.63657 (0.63804)	Top-1 acc 60.156 (55.769)	Top-5 acc 80.469 (78.077)	lr 0.01771
Train [44][1850/3239]	Time 0.259 (0.524)	Data Time 0.002 (0.019)	Loss 2.8795 (2.8341)	Entropy 0.63668 (0.63803)	Top-1 acc 52.734 (55.773)	Top-5 acc 80.078 (78.084)	lr 0.01771
Train [44][1860/3239]	Time 0.249 (0.524)	Data Time 0.001 (0.019)	Loss 2.8982 (2.8341)	Entropy 0.63667 (0.63802)	Top-1 acc 54.297 (55.774)	Top-5 acc 76.953 (78.085)	lr 0.01771
Train [44][1870/3239]	Time 0.238 (0.523)	Data Time 0.001 (0.019)	Loss 2.8999 (2.8343)	Entropy 0.63658 (0.63801)	Top-1 acc 55.469 (55.766)	Top-5 acc 76.562 (78.080)	lr 0.01771
Train [44][1880/3239]	Time 0.243 (0.523)	Data Time 0.001 (0.018)	Loss 2.9120 (2.8341)	Entropy 0.63636 (0.63800)	Top-1 acc 55.078 (55.771)	Top-5 acc 75.781 (78.084)	lr 0.01771
Train [44][1890/3239]	Time 0.246 (0.522)	Data Time 0.001 (0.018)	Loss 2.8191 (2.8345)	Entropy 0.63690 (0.63800)	Top-1 acc 53.516 (55.760)	Top-5 acc 80.078 (78.075)	lr 0.01771
Train [44][1900/3239]	Time 0.346 (0.522)	Data Time 0.001 (0.018)	Loss 2.7440 (2.8343)	Entropy 0.63681 (0.63799)	Top-1 acc 59.766 (55.762)	Top-5 acc 78.906 (78.079)	lr 0.01771
Train [44][1910/3239]	Time 0.291 (0.522)	Data Time 0.002 (0.018)	Loss 2.8223 (2.8343)	Entropy 0.63678 (0.63799)	Top-1 acc 53.125 (55.761)	Top-5 acc 78.516 (78.083)	lr 0.01771
Train [44][1920/3239]	Time 0.234 (0.522)	Data Time 0.001 (0.018)	Loss 2.6472 (2.8344)	Entropy 0.63653 (0.63798)	Top-1 acc 58.203 (55.763)	Top-5 acc 83.594 (78.082)	lr 0.01771
Train [44][1930/3239]	Time 0.262 (0.521)	Data Time 0.001 (0.018)	Loss 2.7091 (2.8343)	Entropy 0.63649 (0.63797)	Top-1 acc 57.422 (55.760)	Top-5 acc 79.688 (78.090)	lr 0.01770
Train [44][1940/3239]	Time 0.255 (0.521)	Data Time 0.001 (0.018)	Loss 2.7810 (2.8342)	Entropy 0.63645 (0.63796)	Top-1 acc 59.375 (55.761)	Top-5 acc 77.734 (78.086)	lr 0.01770
Train [44][1950/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.018)	Loss 2.9446 (2.8344)	Entropy 0.63645 (0.63796)	Top-1 acc 51.953 (55.754)	Top-5 acc 75.781 (78.082)	lr 0.01770
Train [44][1960/3239]	Time 0.240 (0.520)	Data Time 0.001 (0.018)	Loss 2.8477 (2.8345)	Entropy 0.63673 (0.63795)	Top-1 acc 54.688 (55.755)	Top-5 acc 78.125 (78.081)	lr 0.01770
Train [44][1970/3239]	Time 0.269 (0.520)	Data Time 0.001 (0.018)	Loss 2.8922 (2.8346)	Entropy 0.63688 (0.63794)	Top-1 acc 54.688 (55.753)	Top-5 acc 80.078 (78.083)	lr 0.01770
Train [44][1980/3239]	Time 0.240 (0.520)	Data Time 0.001 (0.018)	Loss 2.9764 (2.8345)	Entropy 0.63707 (0.63794)	Top-1 acc 50.391 (55.753)	Top-5 acc 77.344 (78.085)	lr 0.01770
Train [44][1990/3239]	Time 0.314 (0.519)	Data Time 0.001 (0.018)	Loss 2.9488 (2.8347)	Entropy 0.63701 (0.63793)	Top-1 acc 54.297 (55.750)	Top-5 acc 75.391 (78.082)	lr 0.01770
Train [44][2000/3239]	Time 0.259 (0.519)	Data Time 0.001 (0.017)	Loss 2.7591 (2.8350)	Entropy 0.63682 (0.63793)	Top-1 acc 56.641 (55.738)	Top-5 acc 80.859 (78.076)	lr 0.01770
Train [44][2010/3239]	Time 0.256 (0.519)	Data Time 0.002 (0.017)	Loss 2.9188 (2.8348)	Entropy 0.63668 (0.63792)	Top-1 acc 52.344 (55.740)	Top-5 acc 76.562 (78.078)	lr 0.01770
Train [44][2020/3239]	Time 0.245 (0.518)	Data Time 0.001 (0.017)	Loss 2.9941 (2.8350)	Entropy 0.63705 (0.63792)	Top-1 acc 53.516 (55.738)	Top-5 acc 72.266 (78.074)	lr 0.01770
Train [44][2030/3239]	Time 0.257 (0.518)	Data Time 0.001 (0.017)	Loss 2.7431 (2.8350)	Entropy 0.63686 (0.63791)	Top-1 acc 60.547 (55.743)	Top-5 acc 80.859 (78.073)	lr 0.01770
Train [44][2040/3239]	Time 0.260 (0.518)	Data Time 0.002 (0.017)	Loss 2.8272 (2.8351)	Entropy 0.63658 (0.63791)	Top-1 acc 56.641 (55.746)	Top-5 acc 78.516 (78.069)	lr 0.01769
Train [44][2050/3239]	Time 0.250 (0.517)	Data Time 0.001 (0.017)	Loss 2.8697 (2.8352)	Entropy 0.63655 (0.63790)	Top-1 acc 57.031 (55.747)	Top-5 acc 76.953 (78.074)	lr 0.01769
Train [44][2060/3239]	Time 0.366 (0.517)	Data Time 0.002 (0.017)	Loss 2.9577 (2.8354)	Entropy 0.63648 (0.63790)	Top-1 acc 54.688 (55.740)	Top-5 acc 73.047 (78.069)	lr 0.01769
Train [44][2070/3239]	Time 0.235 (0.517)	Data Time 0.001 (0.017)	Loss 2.9737 (2.8353)	Entropy 0.63674 (0.63789)	Top-1 acc 55.859 (55.746)	Top-5 acc 75.781 (78.073)	lr 0.01769
Train [44][2080/3239]	Time 0.248 (0.517)	Data Time 0.001 (0.017)	Loss 2.9339 (2.8357)	Entropy 0.63666 (0.63788)	Top-1 acc 57.422 (55.735)	Top-5 acc 75.000 (78.066)	lr 0.01769
Train [44][2090/3239]	Time 0.248 (0.516)	Data Time 0.001 (0.017)	Loss 2.8709 (2.8360)	Entropy 0.63672 (0.63788)	Top-1 acc 51.953 (55.730)	Top-5 acc 75.781 (78.063)	lr 0.01769
Train [44][2100/3239]	Time 0.244 (0.516)	Data Time 0.001 (0.017)	Loss 2.6609 (2.8358)	Entropy 0.63672 (0.63787)	Top-1 acc 60.156 (55.733)	Top-5 acc 82.812 (78.070)	lr 0.01769
Train [44][2110/3239]	Time 0.294 (0.516)	Data Time 0.002 (0.017)	Loss 2.6768 (2.8357)	Entropy 0.63683 (0.63787)	Top-1 acc 61.719 (55.740)	Top-5 acc 81.641 (78.073)	lr 0.01769
Train [44][2120/3239]	Time 0.270 (0.515)	Data Time 0.001 (0.017)	Loss 2.8231 (2.8356)	Entropy 0.63669 (0.63786)	Top-1 acc 53.125 (55.734)	Top-5 acc 82.031 (78.074)	lr 0.01769
Train [44][2130/3239]	Time 0.353 (0.529)	Data Time 0.004 (0.017)	Loss 2.9046 (2.8355)	Entropy 0.63688 (0.63786)	Top-1 acc 55.469 (55.738)	Top-5 acc 77.734 (78.076)	lr 0.01769
Train [44][2140/3239]	Time 0.276 (0.530)	Data Time 0.003 (0.016)	Loss 3.0033 (2.8355)	Entropy 0.63675 (0.63785)	Top-1 acc 51.953 (55.729)	Top-5 acc 76.172 (78.069)	lr 0.01769
Train [44][2150/3239]	Time 0.286 (0.529)	Data Time 0.002 (0.016)	Loss 3.0116 (2.8356)	Entropy 0.63629 (0.63785)	Top-1 acc 55.469 (55.729)	Top-5 acc 74.609 (78.068)	lr 0.01768
Train [44][2160/3239]	Time 0.247 (0.529)	Data Time 0.002 (0.016)	Loss 2.9519 (2.8357)	Entropy 0.63651 (0.63784)	Top-1 acc 56.641 (55.728)	Top-5 acc 75.781 (78.064)	lr 0.01768
Train [44][2170/3239]	Time 0.257 (0.529)	Data Time 0.001 (0.016)	Loss 2.7922 (2.8358)	Entropy 0.63665 (0.63783)	Top-1 acc 53.125 (55.722)	Top-5 acc 82.031 (78.063)	lr 0.01768
Train [44][2180/3239]	Time 0.249 (0.528)	Data Time 0.001 (0.016)	Loss 2.7294 (2.8360)	Entropy 0.63648 (0.63783)	Top-1 acc 59.766 (55.721)	Top-5 acc 80.469 (78.061)	lr 0.01768
Train [44][2190/3239]	Time 0.246 (0.528)	Data Time 0.002 (0.016)	Loss 3.0593 (2.8360)	Entropy 0.63659 (0.63782)	Top-1 acc 51.562 (55.726)	Top-5 acc 73.438 (78.060)	lr 0.01768
Train [44][2200/3239]	Time 0.251 (0.528)	Data Time 0.001 (0.016)	Loss 2.7551 (2.8355)	Entropy 0.63657 (0.63782)	Top-1 acc 60.156 (55.739)	Top-5 acc 77.734 (78.069)	lr 0.01768
Train [44][2210/3239]	Time 0.253 (0.528)	Data Time 0.001 (0.016)	Loss 2.7121 (2.8353)	Entropy 0.63656 (0.63781)	Top-1 acc 57.031 (55.741)	Top-5 acc 80.859 (78.073)	lr 0.01768
Train [44][2220/3239]	Time 0.353 (0.527)	Data Time 0.001 (0.016)	Loss 2.8332 (2.8357)	Entropy 0.63679 (0.63780)	Top-1 acc 57.031 (55.732)	Top-5 acc 77.344 (78.064)	lr 0.01768
Train [44][2230/3239]	Time 0.242 (0.527)	Data Time 0.001 (0.016)	Loss 3.0578 (2.8361)	Entropy 0.63678 (0.63780)	Top-1 acc 49.219 (55.718)	Top-5 acc 72.656 (78.057)	lr 0.01768
Train [44][2240/3239]	Time 0.253 (0.527)	Data Time 0.001 (0.016)	Loss 2.6431 (2.8362)	Entropy 0.63685 (0.63780)	Top-1 acc 60.156 (55.716)	Top-5 acc 81.250 (78.053)	lr 0.01768
Train [44][2250/3239]	Time 0.261 (0.527)	Data Time 0.001 (0.016)	Loss 2.7266 (2.8362)	Entropy 0.63643 (0.63779)	Top-1 acc 60.156 (55.718)	Top-5 acc 78.125 (78.050)	lr 0.01768
Train [44][2260/3239]	Time 0.249 (0.526)	Data Time 0.001 (0.016)	Loss 3.0006 (2.8364)	Entropy 0.63653 (0.63779)	Top-1 acc 50.781 (55.712)	Top-5 acc 73.438 (78.046)	lr 0.01767
Train [44][2270/3239]	Time 0.254 (0.526)	Data Time 0.001 (0.016)	Loss 2.6708 (2.8363)	Entropy 0.63650 (0.63778)	Top-1 acc 61.328 (55.715)	Top-5 acc 83.203 (78.044)	lr 0.01767
Train [44][2280/3239]	Time 0.376 (0.526)	Data Time 0.002 (0.016)	Loss 2.7235 (2.8362)	Entropy 0.63642 (0.63777)	Top-1 acc 58.203 (55.719)	Top-5 acc 80.078 (78.047)	lr 0.01767
Train [44][2290/3239]	Time 0.413 (0.526)	Data Time 0.001 (0.016)	Loss 2.8071 (2.8361)	Entropy 0.63640 (0.63777)	Top-1 acc 56.250 (55.722)	Top-5 acc 76.172 (78.049)	lr 0.01767
Train [44][2300/3239]	Time 0.250 (0.526)	Data Time 0.001 (0.016)	Loss 2.9026 (2.8365)	Entropy 0.63615 (0.63776)	Top-1 acc 56.250 (55.715)	Top-5 acc 78.906 (78.045)	lr 0.01767
Train [44][2310/3239]	Time 0.253 (0.525)	Data Time 0.001 (0.015)	Loss 2.6804 (2.8361)	Entropy 0.63625 (0.63776)	Top-1 acc 58.984 (55.720)	Top-5 acc 81.641 (78.053)	lr 0.01767
Train [44][2320/3239]	Time 0.241 (0.525)	Data Time 0.001 (0.015)	Loss 2.7118 (2.8361)	Entropy 0.63606 (0.63775)	Top-1 acc 57.422 (55.717)	Top-5 acc 80.859 (78.054)	lr 0.01767
Train [44][2330/3239]	Time 0.262 (0.525)	Data Time 0.001 (0.015)	Loss 2.7294 (2.8361)	Entropy 0.63582 (0.63774)	Top-1 acc 56.641 (55.718)	Top-5 acc 82.031 (78.056)	lr 0.01767
Train [44][2340/3239]	Time 0.262 (0.524)	Data Time 0.002 (0.015)	Loss 2.8892 (2.8362)	Entropy 0.63619 (0.63773)	Top-1 acc 53.906 (55.712)	Top-5 acc 78.516 (78.056)	lr 0.01767
Train [44][2350/3239]	Time 0.267 (0.524)	Data Time 0.001 (0.015)	Loss 2.8662 (2.8360)	Entropy 0.63599 (0.63773)	Top-1 acc 56.641 (55.719)	Top-5 acc 77.734 (78.061)	lr 0.01767
Train [44][2360/3239]	Time 0.266 (0.524)	Data Time 0.001 (0.015)	Loss 2.6428 (2.8362)	Entropy 0.63631 (0.63772)	Top-1 acc 58.984 (55.711)	Top-5 acc 81.641 (78.058)	lr 0.01767
Train [44][2370/3239]	Time 0.252 (0.524)	Data Time 0.001 (0.015)	Loss 2.8295 (2.8364)	Entropy 0.63641 (0.63771)	Top-1 acc 57.422 (55.706)	Top-5 acc 80.078 (78.058)	lr 0.01766
Train [44][2380/3239]	Time 0.386 (0.523)	Data Time 0.001 (0.015)	Loss 2.8816 (2.8362)	Entropy 0.63634 (0.63771)	Top-1 acc 56.250 (55.716)	Top-5 acc 77.734 (78.062)	lr 0.01766
Train [44][2390/3239]	Time 0.248 (0.523)	Data Time 0.002 (0.015)	Loss 3.0320 (2.8362)	Entropy 0.63670 (0.63770)	Top-1 acc 53.125 (55.717)	Top-5 acc 72.266 (78.058)	lr 0.01766
Train [44][2400/3239]	Time 0.231 (0.523)	Data Time 0.001 (0.015)	Loss 2.9607 (2.8362)	Entropy 0.63679 (0.63770)	Top-1 acc 54.297 (55.718)	Top-5 acc 75.000 (78.056)	lr 0.01766
Train [44][2410/3239]	Time 0.240 (0.523)	Data Time 0.001 (0.015)	Loss 2.8489 (2.8363)	Entropy 0.63663 (0.63769)	Top-1 acc 53.516 (55.717)	Top-5 acc 77.344 (78.057)	lr 0.01766
Train [44][2420/3239]	Time 0.257 (0.522)	Data Time 0.002 (0.015)	Loss 2.9940 (2.8362)	Entropy 0.63642 (0.63769)	Top-1 acc 56.250 (55.719)	Top-5 acc 73.828 (78.058)	lr 0.01766
Train [44][2430/3239]	Time 0.264 (0.522)	Data Time 0.001 (0.015)	Loss 2.8854 (2.8364)	Entropy 0.63643 (0.63768)	Top-1 acc 53.516 (55.715)	Top-5 acc 75.391 (78.051)	lr 0.01766
Train [44][2440/3239]	Time 0.231 (0.522)	Data Time 0.001 (0.015)	Loss 3.0562 (2.8366)	Entropy 0.63640 (0.63768)	Top-1 acc 50.781 (55.711)	Top-5 acc 71.484 (78.046)	lr 0.01766
Train [44][2450/3239]	Time 0.395 (0.522)	Data Time 0.001 (0.015)	Loss 2.7871 (2.8365)	Entropy 0.63677 (0.63768)	Top-1 acc 56.641 (55.717)	Top-5 acc 77.734 (78.047)	lr 0.01766
Train [44][2460/3239]	Time 0.238 (0.522)	Data Time 0.002 (0.015)	Loss 2.9319 (2.8364)	Entropy 0.63713 (0.63767)	Top-1 acc 53.516 (55.716)	Top-5 acc 75.781 (78.048)	lr 0.01766
Train [44][2470/3239]	Time 0.261 (0.521)	Data Time 0.001 (0.015)	Loss 2.9634 (2.8364)	Entropy 0.63729 (0.63767)	Top-1 acc 55.469 (55.717)	Top-5 acc 78.125 (78.048)	lr 0.01766
Train [44][2480/3239]	Time 0.244 (0.521)	Data Time 0.001 (0.015)	Loss 2.6888 (2.8364)	Entropy 0.63756 (0.63767)	Top-1 acc 60.938 (55.716)	Top-5 acc 80.469 (78.046)	lr 0.01765
Train [44][2490/3239]	Time 0.229 (0.520)	Data Time 0.001 (0.014)	Loss 2.8576 (2.8364)	Entropy 0.63788 (0.63767)	Top-1 acc 57.812 (55.714)	Top-5 acc 78.125 (78.042)	lr 0.01765
Train [44][2500/3239]	Time 0.248 (0.520)	Data Time 0.001 (0.014)	Loss 2.7855 (2.8365)	Entropy 0.63808 (0.63767)	Top-1 acc 59.766 (55.714)	Top-5 acc 80.078 (78.040)	lr 0.01765
Train [44][2510/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.014)	Loss 2.8247 (2.8365)	Entropy 0.63806 (0.63767)	Top-1 acc 58.984 (55.718)	Top-5 acc 79.297 (78.038)	lr 0.01765
Train [44][2520/3239]	Time 0.223 (0.520)	Data Time 0.001 (0.014)	Loss 2.9518 (2.8364)	Entropy 0.63806 (0.63767)	Top-1 acc 48.828 (55.717)	Top-5 acc 76.953 (78.039)	lr 0.01765
Train [44][2530/3239]	Time 0.258 (0.519)	Data Time 0.001 (0.014)	Loss 2.5983 (2.8362)	Entropy 0.63780 (0.63767)	Top-1 acc 62.500 (55.720)	Top-5 acc 82.812 (78.046)	lr 0.01765
Train [44][2540/3239]	Time 0.370 (0.519)	Data Time 0.001 (0.014)	Loss 2.9362 (2.8361)	Entropy 0.63798 (0.63768)	Top-1 acc 50.391 (55.716)	Top-5 acc 75.000 (78.047)	lr 0.01765
Train [44][2550/3239]	Time 0.230 (0.519)	Data Time 0.001 (0.014)	Loss 2.8543 (2.8359)	Entropy 0.63803 (0.63768)	Top-1 acc 55.078 (55.721)	Top-5 acc 74.219 (78.050)	lr 0.01765
Train [44][2560/3239]	Time 0.297 (0.518)	Data Time 0.001 (0.014)	Loss 3.0539 (2.8358)	Entropy 0.63814 (0.63768)	Top-1 acc 51.172 (55.723)	Top-5 acc 73.438 (78.053)	lr 0.01765
Train [44][2570/3239]	Time 0.250 (0.518)	Data Time 0.001 (0.014)	Loss 2.9574 (2.8357)	Entropy 0.63825 (0.63768)	Top-1 acc 56.250 (55.725)	Top-5 acc 76.562 (78.053)	lr 0.01765
Train [44][2580/3239]	Time 0.268 (0.518)	Data Time 0.001 (0.014)	Loss 3.0068 (2.8361)	Entropy 0.63831 (0.63768)	Top-1 acc 50.781 (55.719)	Top-5 acc 75.000 (78.048)	lr 0.01765
Train [44][2590/3239]	Time 0.261 (0.518)	Data Time 0.001 (0.014)	Loss 2.7094 (2.8363)	Entropy 0.63840 (0.63768)	Top-1 acc 60.156 (55.717)	Top-5 acc 81.641 (78.043)	lr 0.01764
Train [44][2600/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.014)	Loss 3.1035 (2.8364)	Entropy 0.63811 (0.63769)	Top-1 acc 49.609 (55.717)	Top-5 acc 72.656 (78.040)	lr 0.01764
Train [44][2610/3239]	Time 0.354 (0.517)	Data Time 0.001 (0.014)	Loss 2.9712 (2.8364)	Entropy 0.63837 (0.63769)	Top-1 acc 55.469 (55.717)	Top-5 acc 73.828 (78.039)	lr 0.01764
Train [44][2620/3239]	Time 0.267 (0.517)	Data Time 0.001 (0.014)	Loss 2.8192 (2.8364)	Entropy 0.63853 (0.63769)	Top-1 acc 57.812 (55.719)	Top-5 acc 76.953 (78.040)	lr 0.01764
Train [44][2630/3239]	Time 0.242 (0.517)	Data Time 0.001 (0.014)	Loss 2.8493 (2.8363)	Entropy 0.63810 (0.63769)	Top-1 acc 55.469 (55.724)	Top-5 acc 77.344 (78.039)	lr 0.01764
Train [44][2640/3239]	Time 0.232 (0.516)	Data Time 0.002 (0.014)	Loss 2.7905 (2.8362)	Entropy 0.63778 (0.63769)	Top-1 acc 57.812 (55.724)	Top-5 acc 77.734 (78.040)	lr 0.01764
Train [44][2650/3239]	Time 0.254 (0.516)	Data Time 0.001 (0.014)	Loss 2.9389 (2.8360)	Entropy 0.63795 (0.63770)	Top-1 acc 55.859 (55.728)	Top-5 acc 76.953 (78.042)	lr 0.01764
Train [44][2660/3239]	Time 0.265 (0.516)	Data Time 0.001 (0.014)	Loss 2.8362 (2.8359)	Entropy 0.63818 (0.63770)	Top-1 acc 59.766 (55.734)	Top-5 acc 79.297 (78.043)	lr 0.01764
Train [44][2670/3239]	Time 0.296 (0.516)	Data Time 0.001 (0.014)	Loss 2.8396 (2.8360)	Entropy 0.63810 (0.63770)	Top-1 acc 54.688 (55.727)	Top-5 acc 76.953 (78.040)	lr 0.01764
Train [44][2680/3239]	Time 0.251 (0.516)	Data Time 0.001 (0.014)	Loss 2.8697 (2.8362)	Entropy 0.63832 (0.63770)	Top-1 acc 53.516 (55.720)	Top-5 acc 75.000 (78.036)	lr 0.01764
Train [44][2690/3239]	Time 0.246 (0.515)	Data Time 0.002 (0.014)	Loss 2.7980 (2.8359)	Entropy 0.63785 (0.63770)	Top-1 acc 57.812 (55.726)	Top-5 acc 79.688 (78.040)	lr 0.01763
Train [44][2700/3239]	Time 0.283 (0.515)	Data Time 0.001 (0.013)	Loss 2.9117 (2.8360)	Entropy 0.63769 (0.63770)	Top-1 acc 52.344 (55.721)	Top-5 acc 76.562 (78.036)	lr 0.01763
Train [44][2710/3239]	Time 0.271 (0.515)	Data Time 0.002 (0.013)	Loss 2.8831 (2.8361)	Entropy 0.63763 (0.63770)	Top-1 acc 54.688 (55.720)	Top-5 acc 79.688 (78.034)	lr 0.01763
Train [44][2720/3239]	Time 0.252 (0.515)	Data Time 0.001 (0.013)	Loss 2.6962 (2.8358)	Entropy 0.63767 (0.63770)	Top-1 acc 59.375 (55.727)	Top-5 acc 80.859 (78.037)	lr 0.01763
Train [44][2730/3239]	Time 0.288 (0.515)	Data Time 0.003 (0.013)	Loss 2.8603 (2.8357)	Entropy 0.63745 (0.63770)	Top-1 acc 55.078 (55.731)	Top-5 acc 77.734 (78.040)	lr 0.01763
Train [44][2740/3239]	Time 0.247 (0.515)	Data Time 0.001 (0.013)	Loss 2.8882 (2.8355)	Entropy 0.63735 (0.63770)	Top-1 acc 57.812 (55.737)	Top-5 acc 76.953 (78.040)	lr 0.01763
Train [44][2750/3239]	Time 0.253 (0.515)	Data Time 0.001 (0.013)	Loss 3.0241 (2.8355)	Entropy 0.63714 (0.63770)	Top-1 acc 48.438 (55.737)	Top-5 acc 74.219 (78.042)	lr 0.01763
Train [44][2760/3239]	Time 0.268 (0.514)	Data Time 0.001 (0.013)	Loss 2.7343 (2.8355)	Entropy 0.63695 (0.63770)	Top-1 acc 58.594 (55.738)	Top-5 acc 78.125 (78.042)	lr 0.01763
Train [44][2770/3239]	Time 0.399 (0.514)	Data Time 0.002 (0.013)	Loss 2.8980 (2.8358)	Entropy 0.63725 (0.63769)	Top-1 acc 52.734 (55.731)	Top-5 acc 79.688 (78.038)	lr 0.01763
Train [44][2780/3239]	Time 0.250 (0.514)	Data Time 0.002 (0.013)	Loss 2.8024 (2.8357)	Entropy 0.63731 (0.63769)	Top-1 acc 58.984 (55.733)	Top-5 acc 77.344 (78.041)	lr 0.01763
Train [44][2790/3239]	Time 0.267 (0.525)	Data Time 0.002 (0.013)	Loss 2.9338 (2.8358)	Entropy 0.63702 (0.63769)	Top-1 acc 52.734 (55.731)	Top-5 acc 74.219 (78.040)	lr 0.01763
Train [44][2800/3239]	Time 0.259 (0.525)	Data Time 0.002 (0.013)	Loss 2.8406 (2.8356)	Entropy 0.63683 (0.63769)	Top-1 acc 55.078 (55.736)	Top-5 acc 78.906 (78.040)	lr 0.01762
Train [44][2810/3239]	Time 0.351 (0.525)	Data Time 0.002 (0.013)	Loss 2.8707 (2.8356)	Entropy 0.63691 (0.63768)	Top-1 acc 57.422 (55.733)	Top-5 acc 79.688 (78.042)	lr 0.01762
Train [44][2820/3239]	Time 0.260 (0.525)	Data Time 0.002 (0.013)	Loss 2.9239 (2.8358)	Entropy 0.63722 (0.63768)	Top-1 acc 54.688 (55.734)	Top-5 acc 77.344 (78.042)	lr 0.01762
Train [44][2830/3239]	Time 0.264 (0.525)	Data Time 0.001 (0.013)	Loss 2.6257 (2.8357)	Entropy 0.63725 (0.63768)	Top-1 acc 60.547 (55.734)	Top-5 acc 80.469 (78.043)	lr 0.01762
Train [44][2840/3239]	Time 0.366 (0.525)	Data Time 0.001 (0.013)	Loss 2.9445 (2.8358)	Entropy 0.63750 (0.63768)	Top-1 acc 51.562 (55.731)	Top-5 acc 75.391 (78.042)	lr 0.01762
Train [44][2850/3239]	Time 0.267 (0.524)	Data Time 0.001 (0.013)	Loss 2.9310 (2.8358)	Entropy 0.63747 (0.63768)	Top-1 acc 53.125 (55.731)	Top-5 acc 77.344 (78.043)	lr 0.01762
Train [44][2860/3239]	Time 0.250 (0.524)	Data Time 0.002 (0.013)	Loss 2.7531 (2.8358)	Entropy 0.63730 (0.63768)	Top-1 acc 60.156 (55.732)	Top-5 acc 78.906 (78.044)	lr 0.01762
Train [44][2870/3239]	Time 0.289 (0.524)	Data Time 0.001 (0.013)	Loss 2.9703 (2.8356)	Entropy 0.63707 (0.63768)	Top-1 acc 51.953 (55.732)	Top-5 acc 76.953 (78.049)	lr 0.01762
Train [44][2880/3239]	Time 0.268 (0.524)	Data Time 0.001 (0.013)	Loss 3.0222 (2.8357)	Entropy 0.63712 (0.63767)	Top-1 acc 51.562 (55.734)	Top-5 acc 73.828 (78.049)	lr 0.01762
Train [44][2890/3239]	Time 0.267 (0.524)	Data Time 0.001 (0.013)	Loss 2.6688 (2.8355)	Entropy 0.63757 (0.63767)	Top-1 acc 59.766 (55.737)	Top-5 acc 81.250 (78.051)	lr 0.01762
Train [44][2900/3239]	Time 0.250 (0.524)	Data Time 0.001 (0.013)	Loss 2.8584 (2.8355)	Entropy 0.63724 (0.63767)	Top-1 acc 54.688 (55.737)	Top-5 acc 78.125 (78.052)	lr 0.01762
Train [44][2910/3239]	Time 0.269 (0.524)	Data Time 0.002 (0.013)	Loss 2.9481 (2.8356)	Entropy 0.63758 (0.63767)	Top-1 acc 51.172 (55.733)	Top-5 acc 74.609 (78.048)	lr 0.01761
Train [44][2920/3239]	Time 0.252 (0.523)	Data Time 0.001 (0.013)	Loss 2.7450 (2.8357)	Entropy 0.63733 (0.63767)	Top-1 acc 56.250 (55.732)	Top-5 acc 78.906 (78.046)	lr 0.01761
Train [44][2930/3239]	Time 0.354 (0.523)	Data Time 0.001 (0.013)	Loss 2.9014 (2.8358)	Entropy 0.63776 (0.63767)	Top-1 acc 54.297 (55.729)	Top-5 acc 75.781 (78.046)	lr 0.01761
Train [44][2940/3239]	Time 0.295 (0.523)	Data Time 0.001 (0.013)	Loss 2.9788 (2.8360)	Entropy 0.63780 (0.63767)	Top-1 acc 51.172 (55.726)	Top-5 acc 77.344 (78.044)	lr 0.01761
Train [44][2950/3239]	Time 0.243 (0.523)	Data Time 0.001 (0.013)	Loss 2.5691 (2.8358)	Entropy 0.63741 (0.63767)	Top-1 acc 61.328 (55.730)	Top-5 acc 82.812 (78.048)	lr 0.01761
Train [44][2960/3239]	Time 0.255 (0.522)	Data Time 0.001 (0.012)	Loss 2.9807 (2.8357)	Entropy 0.63744 (0.63767)	Top-1 acc 53.125 (55.733)	Top-5 acc 73.047 (78.049)	lr 0.01761
Train [44][2970/3239]	Time 0.246 (0.522)	Data Time 0.001 (0.012)	Loss 2.7821 (2.8357)	Entropy 0.63744 (0.63767)	Top-1 acc 58.594 (55.737)	Top-5 acc 79.297 (78.048)	lr 0.01761
Train [44][2980/3239]	Time 0.253 (0.522)	Data Time 0.002 (0.012)	Loss 2.8180 (2.8359)	Entropy 0.63747 (0.63767)	Top-1 acc 58.984 (55.735)	Top-5 acc 78.906 (78.046)	lr 0.01761
Train [44][2990/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.012)	Loss 2.9840 (2.8358)	Entropy 0.63703 (0.63767)	Top-1 acc 55.859 (55.735)	Top-5 acc 75.781 (78.044)	lr 0.01761
Train [44][3000/3239]	Time 0.350 (0.522)	Data Time 0.001 (0.012)	Loss 2.8350 (2.8359)	Entropy 0.63722 (0.63766)	Top-1 acc 55.078 (55.737)	Top-5 acc 77.734 (78.044)	lr 0.01761
Train [44][3010/3239]	Time 0.253 (0.521)	Data Time 0.001 (0.012)	Loss 2.8181 (2.8358)	Entropy 0.63735 (0.63766)	Top-1 acc 53.906 (55.738)	Top-5 acc 77.734 (78.045)	lr 0.01761
Train [44][3020/3239]	Time 0.271 (0.521)	Data Time 0.002 (0.012)	Loss 2.8610 (2.8360)	Entropy 0.63766 (0.63766)	Top-1 acc 52.344 (55.731)	Top-5 acc 77.734 (78.042)	lr 0.01760
Train [44][3030/3239]	Time 0.266 (0.521)	Data Time 0.001 (0.012)	Loss 2.7674 (2.8357)	Entropy 0.63778 (0.63766)	Top-1 acc 59.375 (55.738)	Top-5 acc 79.688 (78.045)	lr 0.01760
Train [44][3040/3239]	Time 0.247 (0.521)	Data Time 0.001 (0.012)	Loss 2.9852 (2.8358)	Entropy 0.63761 (0.63766)	Top-1 acc 49.219 (55.735)	Top-5 acc 75.000 (78.043)	lr 0.01760
Train [44][3050/3239]	Time 0.289 (0.521)	Data Time 0.001 (0.012)	Loss 3.0344 (2.8359)	Entropy 0.63778 (0.63766)	Top-1 acc 50.781 (55.734)	Top-5 acc 77.734 (78.042)	lr 0.01760
Train [44][3060/3239]	Time 0.336 (0.521)	Data Time 0.003 (0.012)	Loss 3.0104 (2.8361)	Entropy 0.63773 (0.63766)	Top-1 acc 49.219 (55.728)	Top-5 acc 75.781 (78.039)	lr 0.01760
Train [44][3070/3239]	Time 0.251 (0.520)	Data Time 0.001 (0.012)	Loss 2.8374 (2.8362)	Entropy 0.63779 (0.63766)	Top-1 acc 58.203 (55.726)	Top-5 acc 76.953 (78.038)	lr 0.01760
Train [44][3080/3239]	Time 0.242 (0.520)	Data Time 0.001 (0.012)	Loss 2.8020 (2.8360)	Entropy 0.63777 (0.63766)	Top-1 acc 58.594 (55.731)	Top-5 acc 79.297 (78.039)	lr 0.01760
Train [44][3090/3239]	Time 0.444 (0.520)	Data Time 0.002 (0.012)	Loss 2.7357 (2.8360)	Entropy 0.63752 (0.63766)	Top-1 acc 55.078 (55.729)	Top-5 acc 80.469 (78.040)	lr 0.01760
Train [44][3100/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.012)	Loss 2.8448 (2.8361)	Entropy 0.63755 (0.63766)	Top-1 acc 54.688 (55.727)	Top-5 acc 76.953 (78.039)	lr 0.01760
Train [44][3110/3239]	Time 0.256 (0.520)	Data Time 0.002 (0.012)	Loss 2.9193 (2.8363)	Entropy 0.63747 (0.63766)	Top-1 acc 53.125 (55.724)	Top-5 acc 77.734 (78.035)	lr 0.01760
Train [44][3120/3239]	Time 0.268 (0.520)	Data Time 0.002 (0.012)	Loss 2.7706 (2.8360)	Entropy 0.63755 (0.63766)	Top-1 acc 57.812 (55.727)	Top-5 acc 79.297 (78.040)	lr 0.01760
Train [44][3130/3239]	Time 0.270 (0.520)	Data Time 0.002 (0.012)	Loss 2.8002 (2.8361)	Entropy 0.63699 (0.63766)	Top-1 acc 52.734 (55.724)	Top-5 acc 78.516 (78.040)	lr 0.01759
Train [44][3140/3239]	Time 0.295 (0.519)	Data Time 0.001 (0.012)	Loss 2.9742 (2.8362)	Entropy 0.63684 (0.63766)	Top-1 acc 54.688 (55.724)	Top-5 acc 73.828 (78.037)	lr 0.01759
Train [44][3150/3239]	Time 0.273 (0.519)	Data Time 0.001 (0.012)	Loss 2.6990 (2.8361)	Entropy 0.63676 (0.63766)	Top-1 acc 62.891 (55.726)	Top-5 acc 80.859 (78.038)	lr 0.01759
Train [44][3160/3239]	Time 0.348 (0.519)	Data Time 0.001 (0.012)	Loss 3.1920 (2.8362)	Entropy 0.63653 (0.63765)	Top-1 acc 51.562 (55.727)	Top-5 acc 69.141 (78.035)	lr 0.01759
Train [44][3170/3239]	Time 0.255 (0.519)	Data Time 0.001 (0.012)	Loss 2.9427 (2.8365)	Entropy 0.63663 (0.63765)	Top-1 acc 52.734 (55.721)	Top-5 acc 76.953 (78.031)	lr 0.01759
Train [44][3180/3239]	Time 0.304 (0.519)	Data Time 0.000 (0.012)	Loss 2.6605 (2.8363)	Entropy 0.63667 (0.63765)	Top-1 acc 62.891 (55.725)	Top-5 acc 83.203 (78.038)	lr 0.01759
Train [44][3190/3239]	Time 0.238 (0.518)	Data Time 0.000 (0.012)	Loss 2.7890 (2.8364)	Entropy 0.63676 (0.63764)	Top-1 acc 53.906 (55.719)	Top-5 acc 79.297 (78.034)	lr 0.01759
Train [44][3200/3239]	Time 0.238 (0.518)	Data Time 0.000 (0.012)	Loss 2.6254 (2.8365)	Entropy 0.63680 (0.63764)	Top-1 acc 59.766 (55.713)	Top-5 acc 81.641 (78.032)	lr 0.01759
Train [44][3210/3239]	Time 0.229 (0.518)	Data Time 0.000 (0.012)	Loss 2.8517 (2.8365)	Entropy 0.63701 (0.63764)	Top-1 acc 57.422 (55.714)	Top-5 acc 79.688 (78.033)	lr 0.01759
Train [44][3220/3239]	Time 0.244 (0.517)	Data Time 0.000 (0.012)	Loss 2.7945 (2.8363)	Entropy 0.63700 (0.63764)	Top-1 acc 58.594 (55.718)	Top-5 acc 82.422 (78.037)	lr 0.01759
Train [44][3230/3239]	Time 0.236 (0.517)	Data Time 0.000 (0.012)	Loss 2.7791 (2.8361)	Entropy 0.63688 (0.63763)	Top-1 acc 58.984 (55.722)	Top-5 acc 80.078 (78.042)	lr 0.01759
Train [44][3239/3239]	Time 1.084 (0.517)	Data Time 0.000 (0.012)	Loss 2.8244 (2.8361)	Entropy 0.63707 (0.63763)	Top-1 acc 53.086 (55.720)	Top-5 acc 77.778 (78.042)	lr 0.01758
==========Valid [44/120]	loss 1.567	top-1 acc 64.131 (64.131)	top-5 acc 85.131	Train top-1 55.720	top-5 78.042	Entropy 0.63707	Latency-None: 0.000ms	Flops: 539.76M
Train [45][0/3239]	Time 31.594 (31.594)	Data Time 29.863 (29.863)	Loss 2.7207 (2.7207)	Entropy 0.63705 (0.63705)	Top-1 acc 57.422 (57.422)	Top-5 acc 80.078 (80.078)	lr 0.01758
Train [45][10/3239]	Time 0.268 (3.426)	Data Time 0.001 (2.754)	Loss 2.8178 (2.8238)	Entropy 0.63711 (0.63706)	Top-1 acc 58.984 (55.611)	Top-5 acc 77.734 (78.622)	lr 0.01758
Train [45][20/3239]	Time 0.250 (2.027)	Data Time 0.001 (1.444)	Loss 2.7958 (2.8562)	Entropy 0.63741 (0.63713)	Top-1 acc 55.859 (55.153)	Top-5 acc 80.469 (77.920)	lr 0.01758
Train [45][30/3239]	Time 0.227 (1.518)	Data Time 0.001 (0.979)	Loss 3.0830 (2.8574)	Entropy 0.63737 (0.63722)	Top-1 acc 52.344 (55.154)	Top-5 acc 74.219 (77.734)	lr 0.01758
Train [45][40/3239]	Time 0.256 (1.257)	Data Time 0.001 (0.740)	Loss 2.8834 (2.8538)	Entropy 0.63712 (0.63724)	Top-1 acc 53.906 (55.259)	Top-5 acc 76.562 (77.706)	lr 0.01758
Train [45][50/3239]	Time 0.260 (1.097)	Data Time 0.002 (0.595)	Loss 2.7516 (2.8364)	Entropy 0.63682 (0.63719)	Top-1 acc 54.688 (55.584)	Top-5 acc 80.469 (78.056)	lr 0.01758
Train [45][60/3239]	Time 0.338 (0.994)	Data Time 0.002 (0.498)	Loss 2.8922 (2.8385)	Entropy 0.63693 (0.63715)	Top-1 acc 52.344 (55.501)	Top-5 acc 76.562 (78.029)	lr 0.01758
Train [45][70/3239]	Time 0.235 (0.917)	Data Time 0.001 (0.428)	Loss 2.6912 (2.8339)	Entropy 0.63711 (0.63713)	Top-1 acc 62.500 (55.755)	Top-5 acc 81.641 (78.075)	lr 0.01758
Train [45][80/3239]	Time 0.305 (0.860)	Data Time 0.001 (0.376)	Loss 2.8243 (2.8259)	Entropy 0.63708 (0.63711)	Top-1 acc 57.031 (55.903)	Top-5 acc 77.344 (78.183)	lr 0.01758
Train [45][90/3239]	Time 0.282 (0.816)	Data Time 0.001 (0.335)	Loss 2.9479 (2.8236)	Entropy 0.63707 (0.63711)	Top-1 acc 52.734 (55.919)	Top-5 acc 76.172 (78.254)	lr 0.01758
Train [45][100/3239]	Time 0.245 (0.779)	Data Time 0.001 (0.302)	Loss 3.1177 (2.8242)	Entropy 0.63686 (0.63710)	Top-1 acc 51.172 (55.917)	Top-5 acc 72.266 (78.183)	lr 0.01757
Train [45][110/3239]	Time 0.253 (0.752)	Data Time 0.001 (0.275)	Loss 2.6522 (2.8188)	Entropy 0.63687 (0.63708)	Top-1 acc 57.031 (56.025)	Top-5 acc 82.422 (78.378)	lr 0.01757
Train [45][120/3239]	Time 0.304 (0.726)	Data Time 0.002 (0.252)	Loss 2.7179 (2.8242)	Entropy 0.63665 (0.63705)	Top-1 acc 57.812 (55.969)	Top-5 acc 78.125 (78.193)	lr 0.01757
Train [45][130/3239]	Time 0.260 (0.707)	Data Time 0.001 (0.233)	Loss 2.6592 (2.8190)	Entropy 0.63642 (0.63702)	Top-1 acc 58.203 (56.125)	Top-5 acc 82.812 (78.292)	lr 0.01757
Train [45][140/3239]	Time 0.291 (0.693)	Data Time 0.002 (0.217)	Loss 2.9654 (2.8124)	Entropy 0.63666 (0.63699)	Top-1 acc 55.469 (56.297)	Top-5 acc 75.000 (78.438)	lr 0.01757
Train [45][150/3239]	Time 0.361 (0.678)	Data Time 0.001 (0.203)	Loss 2.9178 (2.8137)	Entropy 0.63645 (0.63696)	Top-1 acc 52.734 (56.250)	Top-5 acc 76.562 (78.415)	lr 0.01757
Train [45][160/3239]	Time 0.260 (0.664)	Data Time 0.001 (0.190)	Loss 2.8626 (2.8164)	Entropy 0.63670 (0.63693)	Top-1 acc 51.172 (56.175)	Top-5 acc 79.688 (78.377)	lr 0.01757
Train [45][170/3239]	Time 0.257 (0.652)	Data Time 0.001 (0.179)	Loss 2.8378 (2.8166)	Entropy 0.63684 (0.63692)	Top-1 acc 53.125 (56.197)	Top-5 acc 79.297 (78.358)	lr 0.01757
Train [45][180/3239]	Time 0.252 (0.642)	Data Time 0.001 (0.169)	Loss 2.9000 (2.8189)	Entropy 0.63718 (0.63692)	Top-1 acc 54.688 (56.129)	Top-5 acc 76.953 (78.341)	lr 0.01757
Train [45][190/3239]	Time 0.254 (0.633)	Data Time 0.001 (0.160)	Loss 2.6804 (2.8219)	Entropy 0.63711 (0.63693)	Top-1 acc 58.594 (56.035)	Top-5 acc 80.078 (78.260)	lr 0.01757
Train [45][200/3239]	Time 0.411 (0.786)	Data Time 0.006 (0.153)	Loss 2.5283 (2.8213)	Entropy 0.63695 (0.63694)	Top-1 acc 61.328 (56.067)	Top-5 acc 84.375 (78.255)	lr 0.01757
Train [45][210/3239]	Time 0.256 (0.773)	Data Time 0.002 (0.146)	Loss 2.7291 (2.8208)	Entropy 0.63720 (0.63694)	Top-1 acc 57.422 (56.083)	Top-5 acc 78.906 (78.295)	lr 0.01756
Train [45][220/3239]	Time 0.377 (0.760)	Data Time 0.002 (0.139)	Loss 2.8918 (2.8193)	Entropy 0.63738 (0.63696)	Top-1 acc 50.391 (56.064)	Top-5 acc 77.734 (78.321)	lr 0.01756
Train [45][230/3239]	Time 0.253 (0.747)	Data Time 0.002 (0.133)	Loss 2.9392 (2.8200)	Entropy 0.63737 (0.63698)	Top-1 acc 53.516 (56.027)	Top-5 acc 76.953 (78.319)	lr 0.01756
Train [45][240/3239]	Time 0.266 (0.735)	Data Time 0.002 (0.128)	Loss 2.9138 (2.8177)	Entropy 0.63742 (0.63699)	Top-1 acc 50.781 (56.106)	Top-5 acc 76.562 (78.349)	lr 0.01756
Train [45][250/3239]	Time 0.317 (0.725)	Data Time 0.003 (0.123)	Loss 2.6814 (2.8163)	Entropy 0.63741 (0.63701)	Top-1 acc 60.938 (56.146)	Top-5 acc 80.859 (78.385)	lr 0.01756
Train [45][260/3239]	Time 0.247 (0.715)	Data Time 0.002 (0.118)	Loss 3.2438 (2.8164)	Entropy 0.63686 (0.63701)	Top-1 acc 49.219 (56.121)	Top-5 acc 72.266 (78.385)	lr 0.01756
Train [45][270/3239]	Time 0.252 (0.705)	Data Time 0.002 (0.114)	Loss 2.7828 (2.8160)	Entropy 0.63699 (0.63701)	Top-1 acc 57.422 (56.145)	Top-5 acc 76.953 (78.402)	lr 0.01756
Train [45][280/3239]	Time 0.223 (0.696)	Data Time 0.001 (0.110)	Loss 2.9005 (2.8176)	Entropy 0.63733 (0.63701)	Top-1 acc 53.516 (56.097)	Top-5 acc 76.953 (78.360)	lr 0.01756
Train [45][290/3239]	Time 0.292 (0.689)	Data Time 0.002 (0.106)	Loss 2.9444 (2.8195)	Entropy 0.63743 (0.63702)	Top-1 acc 53.516 (56.023)	Top-5 acc 77.344 (78.344)	lr 0.01756
Train [45][300/3239]	Time 0.287 (0.681)	Data Time 0.002 (0.103)	Loss 2.8345 (2.8209)	Entropy 0.63743 (0.63704)	Top-1 acc 55.469 (55.985)	Top-5 acc 78.516 (78.305)	lr 0.01756
Train [45][310/3239]	Time 0.346 (0.674)	Data Time 0.001 (0.099)	Loss 2.5969 (2.8218)	Entropy 0.63739 (0.63705)	Top-1 acc 59.375 (55.969)	Top-5 acc 81.641 (78.279)	lr 0.01756
Train [45][320/3239]	Time 0.239 (0.667)	Data Time 0.001 (0.096)	Loss 2.4812 (2.8232)	Entropy 0.63704 (0.63706)	Top-1 acc 62.109 (55.912)	Top-5 acc 85.547 (78.255)	lr 0.01755
Train [45][330/3239]	Time 0.246 (0.661)	Data Time 0.001 (0.094)	Loss 2.6690 (2.8209)	Entropy 0.63667 (0.63706)	Top-1 acc 58.594 (55.981)	Top-5 acc 80.469 (78.291)	lr 0.01755
Train [45][340/3239]	Time 0.242 (0.655)	Data Time 0.001 (0.091)	Loss 2.9119 (2.8182)	Entropy 0.63650 (0.63704)	Top-1 acc 58.203 (56.079)	Top-5 acc 77.344 (78.333)	lr 0.01755
Train [45][350/3239]	Time 0.238 (0.649)	Data Time 0.001 (0.088)	Loss 2.7353 (2.8165)	Entropy 0.63622 (0.63702)	Top-1 acc 55.078 (56.091)	Top-5 acc 82.031 (78.401)	lr 0.01755
Train [45][360/3239]	Time 0.243 (0.644)	Data Time 0.001 (0.086)	Loss 2.8500 (2.8157)	Entropy 0.63650 (0.63700)	Top-1 acc 56.641 (56.121)	Top-5 acc 78.125 (78.391)	lr 0.01755
Train [45][370/3239]	Time 0.264 (0.639)	Data Time 0.002 (0.084)	Loss 2.7876 (2.8151)	Entropy 0.63651 (0.63699)	Top-1 acc 57.812 (56.146)	Top-5 acc 78.516 (78.409)	lr 0.01755
Train [45][380/3239]	Time 0.401 (0.635)	Data Time 0.001 (0.081)	Loss 2.7912 (2.8140)	Entropy 0.63657 (0.63698)	Top-1 acc 52.734 (56.182)	Top-5 acc 80.859 (78.433)	lr 0.01755
Train [45][390/3239]	Time 0.267 (0.631)	Data Time 0.002 (0.079)	Loss 2.8374 (2.8145)	Entropy 0.63676 (0.63697)	Top-1 acc 56.250 (56.163)	Top-5 acc 76.562 (78.430)	lr 0.01755
Train [45][400/3239]	Time 0.258 (0.626)	Data Time 0.001 (0.078)	Loss 2.7346 (2.8137)	Entropy 0.63650 (0.63696)	Top-1 acc 62.500 (56.194)	Top-5 acc 79.297 (78.447)	lr 0.01755
Train [45][410/3239]	Time 0.260 (0.622)	Data Time 0.001 (0.076)	Loss 2.7236 (2.8131)	Entropy 0.63646 (0.63695)	Top-1 acc 58.203 (56.218)	Top-5 acc 82.031 (78.447)	lr 0.01755
Train [45][420/3239]	Time 0.244 (0.618)	Data Time 0.001 (0.074)	Loss 2.8062 (2.8131)	Entropy 0.63616 (0.63693)	Top-1 acc 57.422 (56.225)	Top-5 acc 79.688 (78.447)	lr 0.01755
Train [45][430/3239]	Time 0.304 (0.615)	Data Time 0.001 (0.072)	Loss 2.7270 (2.8127)	Entropy 0.63594 (0.63691)	Top-1 acc 58.203 (56.236)	Top-5 acc 78.906 (78.462)	lr 0.01754
Train [45][440/3239]	Time 0.244 (0.611)	Data Time 0.001 (0.071)	Loss 2.8923 (2.8126)	Entropy 0.63599 (0.63689)	Top-1 acc 56.250 (56.255)	Top-5 acc 78.125 (78.473)	lr 0.01754
Train [45][450/3239]	Time 0.291 (0.609)	Data Time 0.001 (0.069)	Loss 2.8752 (2.8129)	Entropy 0.63587 (0.63687)	Top-1 acc 51.953 (56.232)	Top-5 acc 79.297 (78.474)	lr 0.01754
Train [45][460/3239]	Time 0.252 (0.605)	Data Time 0.001 (0.068)	Loss 2.8485 (2.8140)	Entropy 0.63564 (0.63685)	Top-1 acc 56.250 (56.194)	Top-5 acc 78.125 (78.463)	lr 0.01754
Train [45][470/3239]	Time 0.284 (0.602)	Data Time 0.001 (0.066)	Loss 2.6031 (2.8124)	Entropy 0.63580 (0.63682)	Top-1 acc 57.031 (56.222)	Top-5 acc 82.422 (78.501)	lr 0.01754
Train [45][480/3239]	Time 0.274 (0.599)	Data Time 0.002 (0.065)	Loss 2.8831 (2.8133)	Entropy 0.63571 (0.63680)	Top-1 acc 55.078 (56.198)	Top-5 acc 74.609 (78.480)	lr 0.01754
Train [45][490/3239]	Time 0.385 (0.597)	Data Time 0.003 (0.064)	Loss 2.8563 (2.8143)	Entropy 0.63579 (0.63678)	Top-1 acc 57.422 (56.170)	Top-5 acc 75.391 (78.449)	lr 0.01754
Train [45][500/3239]	Time 0.240 (0.595)	Data Time 0.001 (0.062)	Loss 2.9272 (2.8152)	Entropy 0.63549 (0.63676)	Top-1 acc 51.953 (56.135)	Top-5 acc 76.172 (78.443)	lr 0.01754
Train [45][510/3239]	Time 0.246 (0.593)	Data Time 0.002 (0.061)	Loss 2.5777 (2.8163)	Entropy 0.63585 (0.63673)	Top-1 acc 60.938 (56.104)	Top-5 acc 84.375 (78.425)	lr 0.01754
Train [45][520/3239]	Time 0.243 (0.590)	Data Time 0.001 (0.060)	Loss 2.6900 (2.8156)	Entropy 0.63588 (0.63672)	Top-1 acc 57.031 (56.100)	Top-5 acc 79.688 (78.436)	lr 0.01754
Train [45][530/3239]	Time 0.233 (0.587)	Data Time 0.001 (0.059)	Loss 2.9599 (2.8153)	Entropy 0.63553 (0.63670)	Top-1 acc 55.078 (56.121)	Top-5 acc 76.172 (78.446)	lr 0.01754
Train [45][540/3239]	Time 0.456 (0.585)	Data Time 0.005 (0.058)	Loss 2.7312 (2.8155)	Entropy 0.63545 (0.63668)	Top-1 acc 57.812 (56.099)	Top-5 acc 80.078 (78.441)	lr 0.01753
Train [45][550/3239]	Time 0.286 (0.583)	Data Time 0.003 (0.057)	Loss 2.9462 (2.8164)	Entropy 0.63514 (0.63665)	Top-1 acc 56.250 (56.071)	Top-5 acc 76.953 (78.431)	lr 0.01753
Train [45][560/3239]	Time 0.314 (0.580)	Data Time 0.004 (0.056)	Loss 2.7656 (2.8158)	Entropy 0.63559 (0.63663)	Top-1 acc 55.859 (56.088)	Top-5 acc 81.641 (78.453)	lr 0.01753
Train [45][570/3239]	Time 0.255 (0.578)	Data Time 0.002 (0.055)	Loss 2.9957 (2.8143)	Entropy 0.63594 (0.63661)	Top-1 acc 52.734 (56.126)	Top-5 acc 75.781 (78.481)	lr 0.01753
Train [45][580/3239]	Time 0.249 (0.576)	Data Time 0.001 (0.054)	Loss 2.8586 (2.8139)	Entropy 0.63601 (0.63660)	Top-1 acc 53.516 (56.148)	Top-5 acc 77.734 (78.485)	lr 0.01753
Train [45][590/3239]	Time 0.248 (0.573)	Data Time 0.001 (0.053)	Loss 2.8835 (2.8149)	Entropy 0.63623 (0.63659)	Top-1 acc 59.375 (56.135)	Top-5 acc 77.344 (78.471)	lr 0.01753
Train [45][600/3239]	Time 0.241 (0.571)	Data Time 0.001 (0.052)	Loss 2.8890 (2.8151)	Entropy 0.63651 (0.63659)	Top-1 acc 55.469 (56.145)	Top-5 acc 78.125 (78.464)	lr 0.01753
Train [45][610/3239]	Time 0.351 (0.569)	Data Time 0.001 (0.052)	Loss 3.0881 (2.8161)	Entropy 0.63706 (0.63659)	Top-1 acc 51.562 (56.120)	Top-5 acc 74.219 (78.438)	lr 0.01753
Train [45][620/3239]	Time 0.265 (0.568)	Data Time 0.002 (0.051)	Loss 2.8471 (2.8166)	Entropy 0.63663 (0.63659)	Top-1 acc 55.859 (56.113)	Top-5 acc 75.781 (78.430)	lr 0.01753
Train [45][630/3239]	Time 0.288 (0.566)	Data Time 0.002 (0.050)	Loss 2.7688 (2.8165)	Entropy 0.63677 (0.63659)	Top-1 acc 57.812 (56.108)	Top-5 acc 80.078 (78.442)	lr 0.01753
Train [45][640/3239]	Time 0.248 (0.564)	Data Time 0.002 (0.049)	Loss 2.6630 (2.8164)	Entropy 0.63702 (0.63660)	Top-1 acc 58.203 (56.124)	Top-5 acc 82.812 (78.444)	lr 0.01753
Train [45][650/3239]	Time 0.262 (0.562)	Data Time 0.001 (0.049)	Loss 2.7024 (2.8154)	Entropy 0.63702 (0.63660)	Top-1 acc 60.547 (56.133)	Top-5 acc 79.688 (78.464)	lr 0.01752
Train [45][660/3239]	Time 0.286 (0.561)	Data Time 0.001 (0.048)	Loss 2.7530 (2.8154)	Entropy 0.63709 (0.63661)	Top-1 acc 60.156 (56.127)	Top-5 acc 82.422 (78.471)	lr 0.01752
Train [45][670/3239]	Time 0.250 (0.559)	Data Time 0.001 (0.047)	Loss 2.9471 (2.8163)	Entropy 0.63732 (0.63662)	Top-1 acc 53.516 (56.110)	Top-5 acc 75.781 (78.440)	lr 0.01752
Train [45][680/3239]	Time 0.234 (0.557)	Data Time 0.001 (0.046)	Loss 2.8748 (2.8169)	Entropy 0.63742 (0.63663)	Top-1 acc 56.641 (56.089)	Top-5 acc 76.953 (78.435)	lr 0.01752
Train [45][690/3239]	Time 0.249 (0.555)	Data Time 0.001 (0.046)	Loss 2.9641 (2.8179)	Entropy 0.63718 (0.63664)	Top-1 acc 50.000 (56.064)	Top-5 acc 78.906 (78.410)	lr 0.01752
Train [45][700/3239]	Time 0.323 (0.554)	Data Time 0.001 (0.045)	Loss 2.6975 (2.8178)	Entropy 0.63711 (0.63665)	Top-1 acc 57.812 (56.061)	Top-5 acc 82.812 (78.409)	lr 0.01752
Train [45][710/3239]	Time 0.276 (0.552)	Data Time 0.001 (0.045)	Loss 3.1341 (2.8184)	Entropy 0.63693 (0.63665)	Top-1 acc 49.219 (56.046)	Top-5 acc 68.750 (78.393)	lr 0.01752
Train [45][720/3239]	Time 0.270 (0.551)	Data Time 0.002 (0.044)	Loss 2.8808 (2.8186)	Entropy 0.63691 (0.63666)	Top-1 acc 53.125 (56.037)	Top-5 acc 75.391 (78.386)	lr 0.01752
Train [45][730/3239]	Time 0.239 (0.550)	Data Time 0.001 (0.043)	Loss 2.6282 (2.8185)	Entropy 0.63718 (0.63666)	Top-1 acc 62.109 (56.043)	Top-5 acc 82.812 (78.395)	lr 0.01752
Train [45][740/3239]	Time 0.233 (0.548)	Data Time 0.001 (0.043)	Loss 2.9409 (2.8189)	Entropy 0.63687 (0.63667)	Top-1 acc 51.953 (56.036)	Top-5 acc 75.391 (78.389)	lr 0.01752
Train [45][750/3239]	Time 0.284 (0.547)	Data Time 0.001 (0.042)	Loss 2.7143 (2.8190)	Entropy 0.63704 (0.63667)	Top-1 acc 58.594 (56.041)	Top-5 acc 79.688 (78.388)	lr 0.01751
Train [45][760/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.042)	Loss 2.9608 (2.8192)	Entropy 0.63717 (0.63668)	Top-1 acc 57.422 (56.039)	Top-5 acc 73.828 (78.380)	lr 0.01751
Train [45][770/3239]	Time 0.360 (0.544)	Data Time 0.001 (0.041)	Loss 2.8617 (2.8188)	Entropy 0.63684 (0.63668)	Top-1 acc 56.641 (56.051)	Top-5 acc 79.688 (78.396)	lr 0.01751
Train [45][780/3239]	Time 0.287 (0.542)	Data Time 0.001 (0.041)	Loss 2.7725 (2.8194)	Entropy 0.63703 (0.63668)	Top-1 acc 53.516 (56.028)	Top-5 acc 78.906 (78.382)	lr 0.01751
Train [45][790/3239]	Time 0.239 (0.541)	Data Time 0.002 (0.040)	Loss 2.7347 (2.8199)	Entropy 0.63647 (0.63669)	Top-1 acc 56.250 (56.000)	Top-5 acc 78.906 (78.371)	lr 0.01751
Train [45][800/3239]	Time 0.238 (0.540)	Data Time 0.002 (0.040)	Loss 2.7127 (2.8198)	Entropy 0.63620 (0.63668)	Top-1 acc 58.203 (56.006)	Top-5 acc 80.469 (78.369)	lr 0.01751
Train [45][810/3239]	Time 0.220 (0.539)	Data Time 0.001 (0.039)	Loss 2.9741 (2.8204)	Entropy 0.63632 (0.63668)	Top-1 acc 53.125 (55.988)	Top-5 acc 76.562 (78.360)	lr 0.01751
Train [45][820/3239]	Time 0.266 (0.538)	Data Time 0.001 (0.039)	Loss 2.9459 (2.8204)	Entropy 0.63650 (0.63667)	Top-1 acc 53.516 (55.988)	Top-5 acc 75.391 (78.359)	lr 0.01751
Train [45][830/3239]	Time 0.259 (0.537)	Data Time 0.002 (0.038)	Loss 2.7736 (2.8205)	Entropy 0.63621 (0.63667)	Top-1 acc 56.641 (55.989)	Top-5 acc 79.688 (78.354)	lr 0.01751
Train [45][840/3239]	Time 0.272 (0.536)	Data Time 0.001 (0.038)	Loss 2.9881 (2.8203)	Entropy 0.63628 (0.63666)	Top-1 acc 50.391 (56.008)	Top-5 acc 75.781 (78.357)	lr 0.01751
Train [45][850/3239]	Time 0.244 (0.535)	Data Time 0.001 (0.038)	Loss 2.8409 (2.8200)	Entropy 0.63623 (0.63666)	Top-1 acc 53.125 (56.022)	Top-5 acc 77.344 (78.355)	lr 0.01751
Train [45][860/3239]	Time 0.340 (0.574)	Data Time 0.002 (0.037)	Loss 2.8885 (2.8203)	Entropy 0.63622 (0.63665)	Top-1 acc 55.859 (56.020)	Top-5 acc 79.688 (78.359)	lr 0.01750
Train [45][870/3239]	Time 0.235 (0.572)	Data Time 0.002 (0.037)	Loss 3.1082 (2.8201)	Entropy 0.63634 (0.63665)	Top-1 acc 50.391 (56.037)	Top-5 acc 72.266 (78.364)	lr 0.01750
Train [45][880/3239]	Time 0.300 (0.571)	Data Time 0.004 (0.036)	Loss 2.8667 (2.8208)	Entropy 0.63629 (0.63665)	Top-1 acc 54.688 (56.014)	Top-5 acc 76.953 (78.348)	lr 0.01750
Train [45][890/3239]	Time 0.267 (0.570)	Data Time 0.002 (0.036)	Loss 3.0103 (2.8205)	Entropy 0.63599 (0.63664)	Top-1 acc 51.562 (56.035)	Top-5 acc 74.609 (78.360)	lr 0.01750
Train [45][900/3239]	Time 0.247 (0.569)	Data Time 0.001 (0.036)	Loss 2.9644 (2.8204)	Entropy 0.63621 (0.63663)	Top-1 acc 50.000 (56.045)	Top-5 acc 76.172 (78.367)	lr 0.01750
Train [45][910/3239]	Time 0.259 (0.568)	Data Time 0.001 (0.035)	Loss 2.8497 (2.8202)	Entropy 0.63614 (0.63663)	Top-1 acc 57.031 (56.042)	Top-5 acc 76.172 (78.362)	lr 0.01750
Train [45][920/3239]	Time 0.250 (0.567)	Data Time 0.001 (0.035)	Loss 2.8103 (2.8200)	Entropy 0.63627 (0.63662)	Top-1 acc 55.859 (56.055)	Top-5 acc 80.469 (78.369)	lr 0.01750
Train [45][930/3239]	Time 0.372 (0.566)	Data Time 0.001 (0.035)	Loss 2.6695 (2.8202)	Entropy 0.63618 (0.63662)	Top-1 acc 58.984 (56.053)	Top-5 acc 80.078 (78.365)	lr 0.01750
Train [45][940/3239]	Time 0.279 (0.565)	Data Time 0.001 (0.034)	Loss 2.9958 (2.8209)	Entropy 0.63644 (0.63662)	Top-1 acc 51.172 (56.045)	Top-5 acc 72.266 (78.352)	lr 0.01750
Train [45][950/3239]	Time 0.256 (0.564)	Data Time 0.001 (0.034)	Loss 2.6572 (2.8206)	Entropy 0.63661 (0.63662)	Top-1 acc 58.594 (56.039)	Top-5 acc 80.469 (78.359)	lr 0.01750
Train [45][960/3239]	Time 0.260 (0.563)	Data Time 0.001 (0.034)	Loss 2.8535 (2.8207)	Entropy 0.63638 (0.63662)	Top-1 acc 53.516 (56.035)	Top-5 acc 75.391 (78.355)	lr 0.01750
Train [45][970/3239]	Time 0.291 (0.562)	Data Time 0.001 (0.033)	Loss 2.8303 (2.8210)	Entropy 0.63619 (0.63661)	Top-1 acc 55.859 (56.028)	Top-5 acc 76.953 (78.353)	lr 0.01749
Train [45][980/3239]	Time 0.244 (0.561)	Data Time 0.001 (0.033)	Loss 2.6786 (2.8208)	Entropy 0.63607 (0.63661)	Top-1 acc 59.375 (56.031)	Top-5 acc 81.250 (78.347)	lr 0.01749
Train [45][990/3239]	Time 0.234 (0.560)	Data Time 0.001 (0.033)	Loss 2.9262 (2.8212)	Entropy 0.63630 (0.63660)	Top-1 acc 54.297 (56.023)	Top-5 acc 75.781 (78.331)	lr 0.01749
Train [45][1000/3239]	Time 0.286 (0.559)	Data Time 0.001 (0.032)	Loss 2.8848 (2.8203)	Entropy 0.63614 (0.63660)	Top-1 acc 50.781 (56.040)	Top-5 acc 76.562 (78.350)	lr 0.01749
Train [45][1010/3239]	Time 0.260 (0.558)	Data Time 0.002 (0.032)	Loss 2.9755 (2.8200)	Entropy 0.63609 (0.63660)	Top-1 acc 51.172 (56.045)	Top-5 acc 74.609 (78.354)	lr 0.01749
Train [45][1020/3239]	Time 0.347 (0.557)	Data Time 0.001 (0.032)	Loss 2.8308 (2.8204)	Entropy 0.63578 (0.63659)	Top-1 acc 55.078 (56.038)	Top-5 acc 78.125 (78.355)	lr 0.01749
Train [45][1030/3239]	Time 0.238 (0.557)	Data Time 0.001 (0.031)	Loss 2.7795 (2.8211)	Entropy 0.63585 (0.63658)	Top-1 acc 58.594 (56.017)	Top-5 acc 78.125 (78.339)	lr 0.01749
Train [45][1040/3239]	Time 0.247 (0.555)	Data Time 0.001 (0.031)	Loss 2.9203 (2.8216)	Entropy 0.63571 (0.63658)	Top-1 acc 53.125 (56.005)	Top-5 acc 78.906 (78.332)	lr 0.01749
Train [45][1050/3239]	Time 0.241 (0.555)	Data Time 0.001 (0.031)	Loss 2.9540 (2.8219)	Entropy 0.63493 (0.63657)	Top-1 acc 54.297 (56.006)	Top-5 acc 76.172 (78.331)	lr 0.01749
Train [45][1060/3239]	Time 0.246 (0.553)	Data Time 0.001 (0.031)	Loss 2.8008 (2.8222)	Entropy 0.63505 (0.63655)	Top-1 acc 56.641 (55.997)	Top-5 acc 78.125 (78.325)	lr 0.01749
Train [45][1070/3239]	Time 0.267 (0.553)	Data Time 0.001 (0.030)	Loss 2.8122 (2.8223)	Entropy 0.63496 (0.63654)	Top-1 acc 57.812 (55.999)	Top-5 acc 80.859 (78.324)	lr 0.01749
Train [45][1080/3239]	Time 0.255 (0.552)	Data Time 0.001 (0.030)	Loss 2.8433 (2.8220)	Entropy 0.63515 (0.63652)	Top-1 acc 57.422 (56.004)	Top-5 acc 75.391 (78.328)	lr 0.01748
Train [45][1090/3239]	Time 0.339 (0.551)	Data Time 0.001 (0.030)	Loss 2.8708 (2.8219)	Entropy 0.63525 (0.63651)	Top-1 acc 54.297 (56.002)	Top-5 acc 76.562 (78.326)	lr 0.01748
Train [45][1100/3239]	Time 0.273 (0.550)	Data Time 0.001 (0.030)	Loss 2.8902 (2.8227)	Entropy 0.63487 (0.63650)	Top-1 acc 54.297 (55.986)	Top-5 acc 77.734 (78.310)	lr 0.01748
Train [45][1110/3239]	Time 0.241 (0.549)	Data Time 0.001 (0.029)	Loss 2.9597 (2.8227)	Entropy 0.63462 (0.63648)	Top-1 acc 51.953 (55.980)	Top-5 acc 76.562 (78.311)	lr 0.01748
Train [45][1120/3239]	Time 0.255 (0.548)	Data Time 0.001 (0.029)	Loss 2.7753 (2.8232)	Entropy 0.63435 (0.63647)	Top-1 acc 54.297 (55.963)	Top-5 acc 79.688 (78.305)	lr 0.01748
Train [45][1130/3239]	Time 0.271 (0.547)	Data Time 0.001 (0.029)	Loss 2.7475 (2.8230)	Entropy 0.63435 (0.63645)	Top-1 acc 57.031 (55.972)	Top-5 acc 78.516 (78.308)	lr 0.01748
Train [45][1140/3239]	Time 0.250 (0.547)	Data Time 0.001 (0.029)	Loss 2.7532 (2.8229)	Entropy 0.63437 (0.63643)	Top-1 acc 57.031 (55.976)	Top-5 acc 80.078 (78.305)	lr 0.01748
Train [45][1150/3239]	Time 0.243 (0.546)	Data Time 0.001 (0.028)	Loss 2.9294 (2.8237)	Entropy 0.63437 (0.63641)	Top-1 acc 53.125 (55.959)	Top-5 acc 76.172 (78.283)	lr 0.01748
Train [45][1160/3239]	Time 0.238 (0.545)	Data Time 0.002 (0.028)	Loss 2.6842 (2.8234)	Entropy 0.63409 (0.63639)	Top-1 acc 55.078 (55.970)	Top-5 acc 82.031 (78.293)	lr 0.01748
Train [45][1170/3239]	Time 0.249 (0.545)	Data Time 0.001 (0.028)	Loss 2.8840 (2.8236)	Entropy 0.63397 (0.63637)	Top-1 acc 57.031 (55.962)	Top-5 acc 73.438 (78.283)	lr 0.01748
Train [45][1180/3239]	Time 0.254 (0.544)	Data Time 0.001 (0.028)	Loss 2.9272 (2.8235)	Entropy 0.63413 (0.63635)	Top-1 acc 53.125 (55.963)	Top-5 acc 74.219 (78.281)	lr 0.01748
Train [45][1190/3239]	Time 0.315 (0.543)	Data Time 0.001 (0.027)	Loss 2.8159 (2.8235)	Entropy 0.63404 (0.63633)	Top-1 acc 56.250 (55.949)	Top-5 acc 78.516 (78.290)	lr 0.01747
Train [45][1200/3239]	Time 0.239 (0.542)	Data Time 0.001 (0.027)	Loss 2.9408 (2.8233)	Entropy 0.63421 (0.63631)	Top-1 acc 54.297 (55.956)	Top-5 acc 75.391 (78.293)	lr 0.01747
Train [45][1210/3239]	Time 0.260 (0.542)	Data Time 0.001 (0.027)	Loss 2.9049 (2.8235)	Entropy 0.63436 (0.63630)	Top-1 acc 53.125 (55.953)	Top-5 acc 75.781 (78.290)	lr 0.01747
Train [45][1220/3239]	Time 0.284 (0.541)	Data Time 0.001 (0.027)	Loss 2.7517 (2.8235)	Entropy 0.63459 (0.63628)	Top-1 acc 56.250 (55.945)	Top-5 acc 80.078 (78.292)	lr 0.01747
Train [45][1230/3239]	Time 0.248 (0.540)	Data Time 0.001 (0.027)	Loss 3.0157 (2.8231)	Entropy 0.63440 (0.63627)	Top-1 acc 50.781 (55.949)	Top-5 acc 75.391 (78.301)	lr 0.01747
Train [45][1240/3239]	Time 0.239 (0.540)	Data Time 0.001 (0.026)	Loss 3.0316 (2.8234)	Entropy 0.63454 (0.63625)	Top-1 acc 51.562 (55.946)	Top-5 acc 76.172 (78.295)	lr 0.01747
Train [45][1250/3239]	Time 0.376 (0.539)	Data Time 0.001 (0.026)	Loss 2.9533 (2.8239)	Entropy 0.63459 (0.63624)	Top-1 acc 51.562 (55.935)	Top-5 acc 74.609 (78.278)	lr 0.01747
Train [45][1260/3239]	Time 0.265 (0.538)	Data Time 0.002 (0.026)	Loss 2.8370 (2.8233)	Entropy 0.63466 (0.63622)	Top-1 acc 58.594 (55.950)	Top-5 acc 77.344 (78.288)	lr 0.01747
Train [45][1270/3239]	Time 0.241 (0.537)	Data Time 0.001 (0.026)	Loss 2.9416 (2.8234)	Entropy 0.63504 (0.63621)	Top-1 acc 53.906 (55.946)	Top-5 acc 78.125 (78.286)	lr 0.01747
Train [45][1280/3239]	Time 0.282 (0.537)	Data Time 0.002 (0.026)	Loss 2.6669 (2.8230)	Entropy 0.63508 (0.63620)	Top-1 acc 58.594 (55.962)	Top-5 acc 79.688 (78.291)	lr 0.01747
Train [45][1290/3239]	Time 0.231 (0.537)	Data Time 0.001 (0.025)	Loss 2.9345 (2.8233)	Entropy 0.63530 (0.63620)	Top-1 acc 52.734 (55.960)	Top-5 acc 76.172 (78.284)	lr 0.01746
Train [45][1300/3239]	Time 0.254 (0.536)	Data Time 0.001 (0.025)	Loss 2.9048 (2.8234)	Entropy 0.63544 (0.63619)	Top-1 acc 57.422 (55.954)	Top-5 acc 75.391 (78.284)	lr 0.01746
Train [45][1310/3239]	Time 0.243 (0.535)	Data Time 0.002 (0.025)	Loss 2.9184 (2.8238)	Entropy 0.63530 (0.63618)	Top-1 acc 53.516 (55.943)	Top-5 acc 76.172 (78.278)	lr 0.01746
Train [45][1320/3239]	Time 0.356 (0.535)	Data Time 0.001 (0.025)	Loss 2.9116 (2.8241)	Entropy 0.63548 (0.63618)	Top-1 acc 52.734 (55.945)	Top-5 acc 77.344 (78.271)	lr 0.01746
Train [45][1330/3239]	Time 0.242 (0.534)	Data Time 0.002 (0.025)	Loss 3.0288 (2.8246)	Entropy 0.63561 (0.63617)	Top-1 acc 51.562 (55.935)	Top-5 acc 73.828 (78.259)	lr 0.01746
Train [45][1340/3239]	Time 0.251 (0.533)	Data Time 0.001 (0.025)	Loss 2.5712 (2.8246)	Entropy 0.63572 (0.63617)	Top-1 acc 58.984 (55.933)	Top-5 acc 81.641 (78.261)	lr 0.01746
Train [45][1350/3239]	Time 0.254 (0.533)	Data Time 0.002 (0.024)	Loss 2.7817 (2.8253)	Entropy 0.63603 (0.63617)	Top-1 acc 57.422 (55.925)	Top-5 acc 79.297 (78.242)	lr 0.01746
Train [45][1360/3239]	Time 0.289 (0.532)	Data Time 0.002 (0.024)	Loss 2.7734 (2.8255)	Entropy 0.63572 (0.63616)	Top-1 acc 58.594 (55.923)	Top-5 acc 80.469 (78.238)	lr 0.01746
Train [45][1370/3239]	Time 0.243 (0.532)	Data Time 0.001 (0.024)	Loss 2.9341 (2.8261)	Entropy 0.63593 (0.63616)	Top-1 acc 53.516 (55.914)	Top-5 acc 76.953 (78.228)	lr 0.01746
Train [45][1380/3239]	Time 0.244 (0.531)	Data Time 0.002 (0.024)	Loss 2.6886 (2.8259)	Entropy 0.63545 (0.63616)	Top-1 acc 62.500 (55.925)	Top-5 acc 81.641 (78.234)	lr 0.01746
Train [45][1390/3239]	Time 0.242 (0.531)	Data Time 0.001 (0.024)	Loss 2.9108 (2.8256)	Entropy 0.63571 (0.63615)	Top-1 acc 53.125 (55.943)	Top-5 acc 75.391 (78.235)	lr 0.01746
Train [45][1400/3239]	Time 0.290 (0.530)	Data Time 0.003 (0.024)	Loss 2.9712 (2.8259)	Entropy 0.63594 (0.63615)	Top-1 acc 53.906 (55.942)	Top-5 acc 77.734 (78.233)	lr 0.01745
Train [45][1410/3239]	Time 0.360 (0.530)	Data Time 0.001 (0.023)	Loss 2.7656 (2.8260)	Entropy 0.63611 (0.63615)	Top-1 acc 55.469 (55.937)	Top-5 acc 81.641 (78.231)	lr 0.01745
Train [45][1420/3239]	Time 0.274 (0.529)	Data Time 0.001 (0.023)	Loss 2.8273 (2.8263)	Entropy 0.63574 (0.63615)	Top-1 acc 55.469 (55.939)	Top-5 acc 78.516 (78.229)	lr 0.01745
Train [45][1430/3239]	Time 0.308 (0.528)	Data Time 0.048 (0.023)	Loss 2.7745 (2.8263)	Entropy 0.63576 (0.63615)	Top-1 acc 53.516 (55.937)	Top-5 acc 79.688 (78.227)	lr 0.01745
Train [45][1440/3239]	Time 0.286 (0.528)	Data Time 0.001 (0.023)	Loss 2.8402 (2.8263)	Entropy 0.63603 (0.63614)	Top-1 acc 55.469 (55.934)	Top-5 acc 75.391 (78.223)	lr 0.01745
Train [45][1450/3239]	Time 0.281 (0.528)	Data Time 0.002 (0.023)	Loss 2.9097 (2.8270)	Entropy 0.63588 (0.63614)	Top-1 acc 50.000 (55.910)	Top-5 acc 77.344 (78.208)	lr 0.01745
Train [45][1460/3239]	Time 0.253 (0.527)	Data Time 0.001 (0.023)	Loss 2.8045 (2.8269)	Entropy 0.63563 (0.63614)	Top-1 acc 55.078 (55.916)	Top-5 acc 76.562 (78.205)	lr 0.01745
Train [45][1470/3239]	Time 0.240 (0.526)	Data Time 0.001 (0.023)	Loss 2.7330 (2.8269)	Entropy 0.63549 (0.63614)	Top-1 acc 57.422 (55.913)	Top-5 acc 81.641 (78.205)	lr 0.01745
Train [45][1480/3239]	Time 0.350 (0.526)	Data Time 0.001 (0.022)	Loss 2.9146 (2.8269)	Entropy 0.63527 (0.63613)	Top-1 acc 58.984 (55.919)	Top-5 acc 76.953 (78.203)	lr 0.01745
Train [45][1490/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.022)	Loss 2.8894 (2.8277)	Entropy 0.63521 (0.63613)	Top-1 acc 55.078 (55.913)	Top-5 acc 76.953 (78.184)	lr 0.01745
Train [45][1500/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.022)	Loss 3.0158 (2.8282)	Entropy 0.63521 (0.63612)	Top-1 acc 51.562 (55.900)	Top-5 acc 75.781 (78.177)	lr 0.01745
Train [45][1510/3239]	Time 0.389 (0.545)	Data Time 0.005 (0.022)	Loss 2.8848 (2.8278)	Entropy 0.63526 (0.63611)	Top-1 acc 55.859 (55.910)	Top-5 acc 76.562 (78.180)	lr 0.01744
Train [45][1520/3239]	Time 0.248 (0.545)	Data Time 0.002 (0.022)	Loss 2.9741 (2.8278)	Entropy 0.63547 (0.63611)	Top-1 acc 53.906 (55.911)	Top-5 acc 76.953 (78.180)	lr 0.01744
Train [45][1530/3239]	Time 0.252 (0.544)	Data Time 0.003 (0.022)	Loss 2.7522 (2.8279)	Entropy 0.63522 (0.63610)	Top-1 acc 58.203 (55.910)	Top-5 acc 77.344 (78.177)	lr 0.01744
Train [45][1540/3239]	Time 0.275 (0.544)	Data Time 0.002 (0.022)	Loss 2.7851 (2.8276)	Entropy 0.63532 (0.63610)	Top-1 acc 55.859 (55.913)	Top-5 acc 76.172 (78.182)	lr 0.01744
Train [45][1550/3239]	Time 0.243 (0.543)	Data Time 0.001 (0.022)	Loss 2.8202 (2.8277)	Entropy 0.63535 (0.63609)	Top-1 acc 57.422 (55.918)	Top-5 acc 76.953 (78.180)	lr 0.01744
Train [45][1560/3239]	Time 0.277 (0.543)	Data Time 0.001 (0.021)	Loss 2.6852 (2.8278)	Entropy 0.63548 (0.63609)	Top-1 acc 57.422 (55.920)	Top-5 acc 82.422 (78.180)	lr 0.01744
Train [45][1570/3239]	Time 0.413 (0.543)	Data Time 0.002 (0.021)	Loss 2.8332 (2.8275)	Entropy 0.63528 (0.63608)	Top-1 acc 56.641 (55.927)	Top-5 acc 77.734 (78.185)	lr 0.01744
Train [45][1580/3239]	Time 0.239 (0.542)	Data Time 0.001 (0.021)	Loss 2.8614 (2.8272)	Entropy 0.63518 (0.63608)	Top-1 acc 58.203 (55.935)	Top-5 acc 78.125 (78.192)	lr 0.01744
Train [45][1590/3239]	Time 0.256 (0.542)	Data Time 0.001 (0.021)	Loss 2.8075 (2.8270)	Entropy 0.63527 (0.63607)	Top-1 acc 58.984 (55.935)	Top-5 acc 77.734 (78.191)	lr 0.01744
Train [45][1600/3239]	Time 0.292 (0.541)	Data Time 0.001 (0.021)	Loss 2.7484 (2.8269)	Entropy 0.63437 (0.63607)	Top-1 acc 58.203 (55.940)	Top-5 acc 76.172 (78.194)	lr 0.01744
Train [45][1610/3239]	Time 0.233 (0.541)	Data Time 0.001 (0.021)	Loss 2.6763 (2.8267)	Entropy 0.63452 (0.63606)	Top-1 acc 58.984 (55.944)	Top-5 acc 80.859 (78.200)	lr 0.01744
Train [45][1620/3239]	Time 0.249 (0.540)	Data Time 0.001 (0.021)	Loss 2.8744 (2.8266)	Entropy 0.63466 (0.63605)	Top-1 acc 55.078 (55.943)	Top-5 acc 76.953 (78.205)	lr 0.01743
Train [45][1630/3239]	Time 0.243 (0.540)	Data Time 0.001 (0.021)	Loss 2.7640 (2.8263)	Entropy 0.63487 (0.63604)	Top-1 acc 59.766 (55.956)	Top-5 acc 77.734 (78.210)	lr 0.01743
Train [45][1640/3239]	Time 0.398 (0.539)	Data Time 0.001 (0.021)	Loss 2.7275 (2.8262)	Entropy 0.63522 (0.63603)	Top-1 acc 57.031 (55.955)	Top-5 acc 81.250 (78.216)	lr 0.01743
Train [45][1650/3239]	Time 0.307 (0.539)	Data Time 0.001 (0.020)	Loss 2.8209 (2.8260)	Entropy 0.63556 (0.63603)	Top-1 acc 55.469 (55.958)	Top-5 acc 77.344 (78.220)	lr 0.01743
Train [45][1660/3239]	Time 0.252 (0.539)	Data Time 0.004 (0.020)	Loss 2.6958 (2.8258)	Entropy 0.63509 (0.63602)	Top-1 acc 58.594 (55.966)	Top-5 acc 80.078 (78.225)	lr 0.01743
Train [45][1670/3239]	Time 0.256 (0.538)	Data Time 0.001 (0.020)	Loss 2.8111 (2.8257)	Entropy 0.63503 (0.63602)	Top-1 acc 58.203 (55.965)	Top-5 acc 80.078 (78.225)	lr 0.01743
Train [45][1680/3239]	Time 0.260 (0.538)	Data Time 0.001 (0.020)	Loss 2.7503 (2.8259)	Entropy 0.63507 (0.63601)	Top-1 acc 62.109 (55.962)	Top-5 acc 79.688 (78.219)	lr 0.01743
Train [45][1690/3239]	Time 0.252 (0.537)	Data Time 0.001 (0.020)	Loss 2.8884 (2.8257)	Entropy 0.63493 (0.63601)	Top-1 acc 54.688 (55.960)	Top-5 acc 76.953 (78.221)	lr 0.01743
Train [45][1700/3239]	Time 0.260 (0.537)	Data Time 0.001 (0.020)	Loss 2.8514 (2.8259)	Entropy 0.63485 (0.63600)	Top-1 acc 54.297 (55.948)	Top-5 acc 78.516 (78.218)	lr 0.01743
Train [45][1710/3239]	Time 0.251 (0.536)	Data Time 0.001 (0.020)	Loss 2.7764 (2.8262)	Entropy 0.63477 (0.63599)	Top-1 acc 55.469 (55.941)	Top-5 acc 78.906 (78.213)	lr 0.01743
Train [45][1720/3239]	Time 0.237 (0.536)	Data Time 0.001 (0.020)	Loss 2.7879 (2.8260)	Entropy 0.63457 (0.63599)	Top-1 acc 55.078 (55.937)	Top-5 acc 80.078 (78.213)	lr 0.01743
Train [45][1730/3239]	Time 0.326 (0.535)	Data Time 0.002 (0.020)	Loss 2.7051 (2.8261)	Entropy 0.63490 (0.63598)	Top-1 acc 60.938 (55.940)	Top-5 acc 79.297 (78.214)	lr 0.01742
Train [45][1740/3239]	Time 0.242 (0.536)	Data Time 0.001 (0.019)	Loss 2.9703 (2.8259)	Entropy 0.63501 (0.63597)	Top-1 acc 52.734 (55.948)	Top-5 acc 74.609 (78.217)	lr 0.01742
Train [45][1750/3239]	Time 0.247 (0.535)	Data Time 0.001 (0.019)	Loss 2.7647 (2.8260)	Entropy 0.63495 (0.63597)	Top-1 acc 53.906 (55.943)	Top-5 acc 82.812 (78.215)	lr 0.01742
Train [45][1760/3239]	Time 0.231 (0.534)	Data Time 0.001 (0.019)	Loss 2.7906 (2.8257)	Entropy 0.63477 (0.63596)	Top-1 acc 52.734 (55.946)	Top-5 acc 82.812 (78.225)	lr 0.01742
Train [45][1770/3239]	Time 0.256 (0.534)	Data Time 0.001 (0.019)	Loss 2.9237 (2.8257)	Entropy 0.63485 (0.63595)	Top-1 acc 52.344 (55.947)	Top-5 acc 76.953 (78.224)	lr 0.01742
Train [45][1780/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.019)	Loss 2.6300 (2.8257)	Entropy 0.63529 (0.63595)	Top-1 acc 60.547 (55.950)	Top-5 acc 84.766 (78.224)	lr 0.01742
Train [45][1790/3239]	Time 0.243 (0.533)	Data Time 0.001 (0.019)	Loss 2.8409 (2.8260)	Entropy 0.63536 (0.63595)	Top-1 acc 56.250 (55.940)	Top-5 acc 76.172 (78.221)	lr 0.01742
Train [45][1800/3239]	Time 0.368 (0.532)	Data Time 0.001 (0.019)	Loss 2.9264 (2.8261)	Entropy 0.63538 (0.63594)	Top-1 acc 52.734 (55.934)	Top-5 acc 75.781 (78.221)	lr 0.01742
Train [45][1810/3239]	Time 0.233 (0.532)	Data Time 0.001 (0.019)	Loss 2.8058 (2.8259)	Entropy 0.63533 (0.63594)	Top-1 acc 57.812 (55.940)	Top-5 acc 78.125 (78.223)	lr 0.01742
Train [45][1820/3239]	Time 0.319 (0.531)	Data Time 0.002 (0.019)	Loss 2.9330 (2.8260)	Entropy 0.63480 (0.63593)	Top-1 acc 54.688 (55.943)	Top-5 acc 77.344 (78.223)	lr 0.01742
Train [45][1830/3239]	Time 0.286 (0.531)	Data Time 0.002 (0.019)	Loss 2.7662 (2.8261)	Entropy 0.63449 (0.63593)	Top-1 acc 55.859 (55.939)	Top-5 acc 81.641 (78.223)	lr 0.01741
Train [45][1840/3239]	Time 0.270 (0.530)	Data Time 0.001 (0.018)	Loss 2.8404 (2.8261)	Entropy 0.63435 (0.63592)	Top-1 acc 55.469 (55.938)	Top-5 acc 78.906 (78.226)	lr 0.01741
Train [45][1850/3239]	Time 0.275 (0.530)	Data Time 0.001 (0.018)	Loss 2.7416 (2.8260)	Entropy 0.63432 (0.63591)	Top-1 acc 57.422 (55.938)	Top-5 acc 80.078 (78.228)	lr 0.01741
Train [45][1860/3239]	Time 0.226 (0.529)	Data Time 0.001 (0.018)	Loss 3.0216 (2.8264)	Entropy 0.63411 (0.63590)	Top-1 acc 50.781 (55.930)	Top-5 acc 72.656 (78.221)	lr 0.01741
Train [45][1870/3239]	Time 0.331 (0.530)	Data Time 0.001 (0.019)	Loss 2.7824 (2.8267)	Entropy 0.63374 (0.63589)	Top-1 acc 55.859 (55.919)	Top-5 acc 78.516 (78.219)	lr 0.01741
Train [45][1880/3239]	Time 0.243 (0.531)	Data Time 0.001 (0.020)	Loss 2.7585 (2.8266)	Entropy 0.63362 (0.63588)	Top-1 acc 57.422 (55.926)	Top-5 acc 79.297 (78.220)	lr 0.01741
Train [45][1890/3239]	Time 0.254 (0.531)	Data Time 0.002 (0.021)	Loss 3.0353 (2.8270)	Entropy 0.63384 (0.63587)	Top-1 acc 51.172 (55.915)	Top-5 acc 73.438 (78.206)	lr 0.01741
Train [45][1900/3239]	Time 0.250 (0.531)	Data Time 0.001 (0.022)	Loss 2.9667 (2.8272)	Entropy 0.63377 (0.63586)	Top-1 acc 52.344 (55.907)	Top-5 acc 78.125 (78.205)	lr 0.01741
Train [45][1910/3239]	Time 0.878 (0.531)	Data Time 0.637 (0.022)	Loss 2.5533 (2.8268)	Entropy 0.63341 (0.63584)	Top-1 acc 60.156 (55.914)	Top-5 acc 85.547 (78.212)	lr 0.01741
Train [45][1920/3239]	Time 0.240 (0.534)	Data Time 0.001 (0.025)	Loss 2.7424 (2.8267)	Entropy 0.63380 (0.63583)	Top-1 acc 57.422 (55.912)	Top-5 acc 76.953 (78.211)	lr 0.01741
Train [45][1930/3239]	Time 0.242 (0.533)	Data Time 0.001 (0.025)	Loss 2.6365 (2.8267)	Entropy 0.63345 (0.63582)	Top-1 acc 59.766 (55.917)	Top-5 acc 81.641 (78.214)	lr 0.01741
Train [45][1940/3239]	Time 0.251 (0.534)	Data Time 0.001 (0.026)	Loss 3.0304 (2.8267)	Entropy 0.63353 (0.63581)	Top-1 acc 46.875 (55.915)	Top-5 acc 73.438 (78.210)	lr 0.01740
Train [45][1950/3239]	Time 0.269 (0.534)	Data Time 0.002 (0.027)	Loss 2.8796 (2.8269)	Entropy 0.63309 (0.63580)	Top-1 acc 53.906 (55.914)	Top-5 acc 76.562 (78.204)	lr 0.01740
Train [45][1960/3239]	Time 0.355 (0.536)	Data Time 0.001 (0.029)	Loss 2.7400 (2.8270)	Entropy 0.63293 (0.63578)	Top-1 acc 58.203 (55.907)	Top-5 acc 79.688 (78.202)	lr 0.01740
Train [45][1970/3239]	Time 0.238 (0.535)	Data Time 0.001 (0.029)	Loss 3.0410 (2.8272)	Entropy 0.63280 (0.63577)	Top-1 acc 50.391 (55.902)	Top-5 acc 76.172 (78.202)	lr 0.01740
Train [45][1980/3239]	Time 0.242 (0.537)	Data Time 0.001 (0.030)	Loss 2.8346 (2.8268)	Entropy 0.63319 (0.63575)	Top-1 acc 55.859 (55.908)	Top-5 acc 80.859 (78.210)	lr 0.01740
Train [45][1990/3239]	Time 0.235 (0.539)	Data Time 0.001 (0.032)	Loss 2.9236 (2.8272)	Entropy 0.63348 (0.63574)	Top-1 acc 55.859 (55.896)	Top-5 acc 78.125 (78.205)	lr 0.01740
Train [45][2000/3239]	Time 0.296 (0.538)	Data Time 0.001 (0.032)	Loss 3.0310 (2.8272)	Entropy 0.63336 (0.63573)	Top-1 acc 48.438 (55.890)	Top-5 acc 75.391 (78.203)	lr 0.01740
Train [45][2010/3239]	Time 0.274 (0.540)	Data Time 0.002 (0.035)	Loss 2.8512 (2.8276)	Entropy 0.63359 (0.63572)	Top-1 acc 53.125 (55.880)	Top-5 acc 76.953 (78.201)	lr 0.01740
Train [45][2020/3239]	Time 3.050 (0.541)	Data Time 2.776 (0.036)	Loss 2.8316 (2.8277)	Entropy 0.63351 (0.63571)	Top-1 acc 53.516 (55.874)	Top-5 acc 78.516 (78.198)	lr 0.01740
Train [45][2030/3239]	Time 0.420 (0.541)	Data Time 0.002 (0.036)	Loss 2.8437 (2.8276)	Entropy 0.63344 (0.63570)	Top-1 acc 54.297 (55.873)	Top-5 acc 78.906 (78.201)	lr 0.01740
Train [45][2040/3239]	Time 0.442 (0.543)	Data Time 0.182 (0.039)	Loss 2.8958 (2.8278)	Entropy 0.63321 (0.63568)	Top-1 acc 56.641 (55.864)	Top-5 acc 77.734 (78.195)	lr 0.01740
Train [45][2050/3239]	Time 0.313 (0.544)	Data Time 0.002 (0.040)	Loss 2.8470 (2.8280)	Entropy 0.63301 (0.63567)	Top-1 acc 56.641 (55.857)	Top-5 acc 77.734 (78.193)	lr 0.01739
Train [45][2060/3239]	Time 0.260 (0.544)	Data Time 0.001 (0.040)	Loss 2.8569 (2.8283)	Entropy 0.63275 (0.63566)	Top-1 acc 55.078 (55.847)	Top-5 acc 75.391 (78.187)	lr 0.01739
Train [45][2070/3239]	Time 3.698 (0.545)	Data Time 3.416 (0.042)	Loss 2.9640 (2.8287)	Entropy 0.63273 (0.63565)	Top-1 acc 56.250 (55.839)	Top-5 acc 75.781 (78.178)	lr 0.01739
Train [45][2080/3239]	Time 0.268 (0.547)	Data Time 0.001 (0.043)	Loss 2.6484 (2.8290)	Entropy 0.63316 (0.63563)	Top-1 acc 58.203 (55.833)	Top-5 acc 84.375 (78.173)	lr 0.01739
Train [45][2090/3239]	Time 0.236 (0.546)	Data Time 0.001 (0.043)	Loss 3.0709 (2.8288)	Entropy 0.63270 (0.63562)	Top-1 acc 50.391 (55.843)	Top-5 acc 74.609 (78.177)	lr 0.01739
Train [45][2100/3239]	Time 1.957 (0.547)	Data Time 1.697 (0.045)	Loss 2.8414 (2.8287)	Entropy 0.63272 (0.63560)	Top-1 acc 53.125 (55.843)	Top-5 acc 77.734 (78.179)	lr 0.01739
Train [45][2110/3239]	Time 0.234 (0.549)	Data Time 0.001 (0.047)	Loss 3.3470 (2.8290)	Entropy 0.63273 (0.63559)	Top-1 acc 46.875 (55.844)	Top-5 acc 66.016 (78.175)	lr 0.01739
Train [45][2120/3239]	Time 0.284 (0.549)	Data Time 0.001 (0.047)	Loss 2.8762 (2.8296)	Entropy 0.63254 (0.63558)	Top-1 acc 55.469 (55.832)	Top-5 acc 75.000 (78.159)	lr 0.01739
Train [45][2130/3239]	Time 0.234 (0.550)	Data Time 0.001 (0.048)	Loss 2.7991 (2.8297)	Entropy 0.63259 (0.63556)	Top-1 acc 55.078 (55.828)	Top-5 acc 79.297 (78.160)	lr 0.01739
Train [45][2140/3239]	Time 0.226 (0.551)	Data Time 0.001 (0.050)	Loss 2.8802 (2.8298)	Entropy 0.63278 (0.63555)	Top-1 acc 57.812 (55.827)	Top-5 acc 76.172 (78.156)	lr 0.01739
Train [45][2150/3239]	Time 0.237 (0.551)	Data Time 0.001 (0.050)	Loss 2.6635 (2.8298)	Entropy 0.63260 (0.63554)	Top-1 acc 61.719 (55.829)	Top-5 acc 82.031 (78.156)	lr 0.01739
Train [45][2160/3239]	Time 0.242 (0.554)	Data Time 0.001 (0.054)	Loss 3.1231 (2.8298)	Entropy 0.63260 (0.63552)	Top-1 acc 49.219 (55.828)	Top-5 acc 73.438 (78.158)	lr 0.01738
Train [45][2170/3239]	Time 0.298 (0.571)	Data Time 0.002 (0.054)	Loss 2.9020 (2.8297)	Entropy 0.63248 (0.63551)	Top-1 acc 54.297 (55.827)	Top-5 acc 76.562 (78.162)	lr 0.01738
Train [45][2180/3239]	Time 0.264 (0.570)	Data Time 0.002 (0.054)	Loss 2.7635 (2.8298)	Entropy 0.63275 (0.63550)	Top-1 acc 56.250 (55.832)	Top-5 acc 83.984 (78.161)	lr 0.01738
Train [45][2190/3239]	Time 0.374 (0.570)	Data Time 0.001 (0.053)	Loss 2.7070 (2.8298)	Entropy 0.63272 (0.63548)	Top-1 acc 58.203 (55.831)	Top-5 acc 80.078 (78.161)	lr 0.01738
Train [45][2200/3239]	Time 0.254 (0.569)	Data Time 0.002 (0.053)	Loss 2.7483 (2.8299)	Entropy 0.63284 (0.63547)	Top-1 acc 57.812 (55.827)	Top-5 acc 80.859 (78.162)	lr 0.01738
Train [45][2210/3239]	Time 0.247 (0.568)	Data Time 0.001 (0.053)	Loss 2.9276 (2.8297)	Entropy 0.63272 (0.63546)	Top-1 acc 55.469 (55.831)	Top-5 acc 76.172 (78.168)	lr 0.01738
Train [45][2220/3239]	Time 0.309 (0.568)	Data Time 0.003 (0.053)	Loss 2.9456 (2.8297)	Entropy 0.63298 (0.63545)	Top-1 acc 51.953 (55.829)	Top-5 acc 74.609 (78.168)	lr 0.01738
Train [45][2230/3239]	Time 0.269 (0.567)	Data Time 0.001 (0.052)	Loss 2.5654 (2.8293)	Entropy 0.63255 (0.63544)	Top-1 acc 62.500 (55.837)	Top-5 acc 84.766 (78.175)	lr 0.01738
Train [45][2240/3239]	Time 0.292 (0.567)	Data Time 0.001 (0.052)	Loss 2.7357 (2.8293)	Entropy 0.63243 (0.63542)	Top-1 acc 59.766 (55.837)	Top-5 acc 80.469 (78.177)	lr 0.01738
Train [45][2250/3239]	Time 0.246 (0.566)	Data Time 0.001 (0.052)	Loss 2.9049 (2.8294)	Entropy 0.63216 (0.63541)	Top-1 acc 59.766 (55.836)	Top-5 acc 77.344 (78.176)	lr 0.01738
Train [45][2260/3239]	Time 0.256 (0.566)	Data Time 0.001 (0.052)	Loss 2.7244 (2.8292)	Entropy 0.63231 (0.63540)	Top-1 acc 59.375 (55.836)	Top-5 acc 79.688 (78.178)	lr 0.01737
Train [45][2270/3239]	Time 0.251 (0.566)	Data Time 0.001 (0.053)	Loss 2.7430 (2.8294)	Entropy 0.63261 (0.63538)	Top-1 acc 60.938 (55.833)	Top-5 acc 82.422 (78.175)	lr 0.01737
Train [45][2280/3239]	Time 0.271 (0.566)	Data Time 0.001 (0.053)	Loss 2.8186 (2.8296)	Entropy 0.63240 (0.63537)	Top-1 acc 56.641 (55.828)	Top-5 acc 79.297 (78.171)	lr 0.01737
Train [45][2290/3239]	Time 0.268 (0.567)	Data Time 0.001 (0.054)	Loss 3.1026 (2.8300)	Entropy 0.63245 (0.63536)	Top-1 acc 46.875 (55.818)	Top-5 acc 71.875 (78.164)	lr 0.01737
Train [45][2300/3239]	Time 0.249 (0.570)	Data Time 0.002 (0.057)	Loss 2.9403 (2.8300)	Entropy 0.63239 (0.63534)	Top-1 acc 52.734 (55.819)	Top-5 acc 74.609 (78.162)	lr 0.01737
Train [45][2310/3239]	Time 0.267 (0.572)	Data Time 0.001 (0.059)	Loss 2.7165 (2.8300)	Entropy 0.63216 (0.63533)	Top-1 acc 60.156 (55.820)	Top-5 acc 79.688 (78.162)	lr 0.01737
Train [45][2320/3239]	Time 0.242 (0.572)	Data Time 0.001 (0.060)	Loss 2.6654 (2.8301)	Entropy 0.63195 (0.63532)	Top-1 acc 60.156 (55.818)	Top-5 acc 79.688 (78.158)	lr 0.01737
Train [45][2330/3239]	Time 0.268 (0.575)	Data Time 0.001 (0.063)	Loss 2.7544 (2.8300)	Entropy 0.63183 (0.63530)	Top-1 acc 56.641 (55.822)	Top-5 acc 78.125 (78.160)	lr 0.01737
Train [45][2340/3239]	Time 0.254 (0.575)	Data Time 0.003 (0.063)	Loss 2.5925 (2.8298)	Entropy 0.63197 (0.63529)	Top-1 acc 62.891 (55.827)	Top-5 acc 79.688 (78.162)	lr 0.01737
Train [45][2350/3239]	Time 0.349 (0.575)	Data Time 0.001 (0.064)	Loss 2.9413 (2.8300)	Entropy 0.63178 (0.63527)	Top-1 acc 56.250 (55.824)	Top-5 acc 76.172 (78.155)	lr 0.01737
Train [45][2360/3239]	Time 0.240 (0.579)	Data Time 0.001 (0.068)	Loss 2.7568 (2.8302)	Entropy 0.63179 (0.63526)	Top-1 acc 53.125 (55.822)	Top-5 acc 78.906 (78.153)	lr 0.01737
Train [45][2370/3239]	Time 0.279 (0.578)	Data Time 0.002 (0.068)	Loss 2.7955 (2.8304)	Entropy 0.63181 (0.63524)	Top-1 acc 57.812 (55.815)	Top-5 acc 78.125 (78.150)	lr 0.01736
Train [45][2380/3239]	Time 0.242 (0.582)	Data Time 0.001 (0.072)	Loss 2.9369 (2.8306)	Entropy 0.63176 (0.63523)	Top-1 acc 55.078 (55.809)	Top-5 acc 76.172 (78.147)	lr 0.01736
Train [45][2390/3239]	Time 0.227 (0.581)	Data Time 0.001 (0.072)	Loss 2.9484 (2.8306)	Entropy 0.63173 (0.63521)	Top-1 acc 53.125 (55.814)	Top-5 acc 76.953 (78.151)	lr 0.01736
Train [45][2400/3239]	Time 0.251 (0.582)	Data Time 0.001 (0.073)	Loss 2.7242 (2.8304)	Entropy 0.63157 (0.63520)	Top-1 acc 58.203 (55.819)	Top-5 acc 80.859 (78.152)	lr 0.01736
Train [45][2410/3239]	Time 10.764 (0.586)	Data Time 10.491 (0.077)	Loss 2.8655 (2.8303)	Entropy 0.63147 (0.63518)	Top-1 acc 54.297 (55.820)	Top-5 acc 76.953 (78.150)	lr 0.01736
Train [45][2420/3239]	Time 0.342 (0.586)	Data Time 0.001 (0.077)	Loss 2.9193 (2.8301)	Entropy 0.63164 (0.63517)	Top-1 acc 57.812 (55.832)	Top-5 acc 76.953 (78.155)	lr 0.01736
Train [45][2430/3239]	Time 0.240 (0.586)	Data Time 0.001 (0.078)	Loss 2.7951 (2.8297)	Entropy 0.63156 (0.63516)	Top-1 acc 56.250 (55.840)	Top-5 acc 77.734 (78.161)	lr 0.01736
Train [45][2440/3239]	Time 0.230 (0.586)	Data Time 0.001 (0.078)	Loss 2.7270 (2.8294)	Entropy 0.63156 (0.63514)	Top-1 acc 59.766 (55.849)	Top-5 acc 76.953 (78.164)	lr 0.01736
Train [45][2450/3239]	Time 0.236 (0.592)	Data Time 0.001 (0.084)	Loss 3.0052 (2.8293)	Entropy 0.63144 (0.63513)	Top-1 acc 51.562 (55.853)	Top-5 acc 72.266 (78.165)	lr 0.01736
Train [45][2460/3239]	Time 0.234 (0.591)	Data Time 0.001 (0.083)	Loss 2.6403 (2.8294)	Entropy 0.63141 (0.63511)	Top-1 acc 62.500 (55.850)	Top-5 acc 80.859 (78.161)	lr 0.01736
Train [45][2470/3239]	Time 0.227 (0.590)	Data Time 0.001 (0.083)	Loss 2.7531 (2.8292)	Entropy 0.63156 (0.63510)	Top-1 acc 55.078 (55.851)	Top-5 acc 82.031 (78.166)	lr 0.01736
Train [45][2480/3239]	Time 0.265 (0.596)	Data Time 0.001 (0.089)	Loss 2.9066 (2.8292)	Entropy 0.63162 (0.63508)	Top-1 acc 55.469 (55.852)	Top-5 acc 76.953 (78.169)	lr 0.01735
Train [45][2490/3239]	Time 0.286 (0.599)	Data Time 0.002 (0.092)	Loss 2.8432 (2.8292)	Entropy 0.63191 (0.63507)	Top-1 acc 56.641 (55.852)	Top-5 acc 77.734 (78.170)	lr 0.01735
Train [45][2500/3239]	Time 0.228 (0.598)	Data Time 0.001 (0.092)	Loss 3.0037 (2.8292)	Entropy 0.63212 (0.63506)	Top-1 acc 51.953 (55.850)	Top-5 acc 75.781 (78.171)	lr 0.01735
Train [45][2510/3239]	Time 0.354 (0.601)	Data Time 0.001 (0.095)	Loss 2.9326 (2.8292)	Entropy 0.63205 (0.63504)	Top-1 acc 51.562 (55.848)	Top-5 acc 75.000 (78.170)	lr 0.01735
Train [45][2520/3239]	Time 0.241 (0.603)	Data Time 0.001 (0.097)	Loss 2.9527 (2.8293)	Entropy 0.63236 (0.63503)	Top-1 acc 53.906 (55.848)	Top-5 acc 75.391 (78.164)	lr 0.01735
Train [45][2530/3239]	Time 0.238 (0.602)	Data Time 0.001 (0.096)	Loss 2.8158 (2.8293)	Entropy 0.63212 (0.63502)	Top-1 acc 58.984 (55.846)	Top-5 acc 79.297 (78.162)	lr 0.01735
Train [45][2540/3239]	Time 0.260 (0.608)	Data Time 0.002 (0.103)	Loss 2.7393 (2.8293)	Entropy 0.63248 (0.63501)	Top-1 acc 57.422 (55.847)	Top-5 acc 80.078 (78.160)	lr 0.01735
Train [45][2550/3239]	Time 0.240 (0.608)	Data Time 0.001 (0.102)	Loss 2.8285 (2.8294)	Entropy 0.63245 (0.63500)	Top-1 acc 57.422 (55.846)	Top-5 acc 75.391 (78.157)	lr 0.01735
Train [45][2560/3239]	Time 0.254 (0.607)	Data Time 0.001 (0.102)	Loss 2.7326 (2.8291)	Entropy 0.63220 (0.63499)	Top-1 acc 59.375 (55.850)	Top-5 acc 78.906 (78.161)	lr 0.01735
Train [45][2570/3239]	Time 10.581 (0.610)	Data Time 10.322 (0.106)	Loss 2.7681 (2.8290)	Entropy 0.63206 (0.63498)	Top-1 acc 57.812 (55.850)	Top-5 acc 78.125 (78.162)	lr 0.01735
Train [45][2580/3239]	Time 0.341 (0.609)	Data Time 0.001 (0.105)	Loss 2.6804 (2.8290)	Entropy 0.63238 (0.63497)	Top-1 acc 60.156 (55.851)	Top-5 acc 80.859 (78.164)	lr 0.01735
Train [45][2590/3239]	Time 0.265 (0.609)	Data Time 0.002 (0.105)	Loss 2.8946 (2.8289)	Entropy 0.63266 (0.63496)	Top-1 acc 56.250 (55.856)	Top-5 acc 74.609 (78.164)	lr 0.01734
Train [45][2600/3239]	Time 0.236 (0.608)	Data Time 0.001 (0.104)	Loss 2.7837 (2.8289)	Entropy 0.63297 (0.63495)	Top-1 acc 57.422 (55.855)	Top-5 acc 78.906 (78.162)	lr 0.01734
Train [45][2610/3239]	Time 0.258 (0.612)	Data Time 0.001 (0.109)	Loss 2.8458 (2.8287)	Entropy 0.63284 (0.63494)	Top-1 acc 52.344 (55.860)	Top-5 acc 78.906 (78.168)	lr 0.01734
Train [45][2620/3239]	Time 0.236 (0.611)	Data Time 0.001 (0.109)	Loss 2.9674 (2.8288)	Entropy 0.63258 (0.63493)	Top-1 acc 53.516 (55.858)	Top-5 acc 73.047 (78.167)	lr 0.01734
Train [45][2630/3239]	Time 0.220 (0.611)	Data Time 0.001 (0.108)	Loss 3.0288 (2.8290)	Entropy 0.63243 (0.63493)	Top-1 acc 52.344 (55.857)	Top-5 acc 74.219 (78.163)	lr 0.01734
Train [45][2640/3239]	Time 0.262 (0.615)	Data Time 0.001 (0.113)	Loss 2.9599 (2.8293)	Entropy 0.63262 (0.63492)	Top-1 acc 53.516 (55.849)	Top-5 acc 75.391 (78.155)	lr 0.01734
Train [45][2650/3239]	Time 0.235 (0.614)	Data Time 0.001 (0.112)	Loss 2.7120 (2.8294)	Entropy 0.63197 (0.63491)	Top-1 acc 55.078 (55.842)	Top-5 acc 80.859 (78.155)	lr 0.01734
Train [45][2660/3239]	Time 0.226 (0.613)	Data Time 0.001 (0.112)	Loss 3.1058 (2.8294)	Entropy 0.63221 (0.63490)	Top-1 acc 51.953 (55.841)	Top-5 acc 72.266 (78.157)	lr 0.01734
Train [45][2670/3239]	Time 0.347 (0.618)	Data Time 0.001 (0.117)	Loss 2.8255 (2.8296)	Entropy 0.63185 (0.63489)	Top-1 acc 56.641 (55.838)	Top-5 acc 79.297 (78.156)	lr 0.01734
Train [45][2680/3239]	Time 0.236 (0.617)	Data Time 0.001 (0.116)	Loss 2.8833 (2.8294)	Entropy 0.63150 (0.63487)	Top-1 acc 55.078 (55.840)	Top-5 acc 75.000 (78.161)	lr 0.01734
Train [45][2690/3239]	Time 0.226 (0.619)	Data Time 0.001 (0.118)	Loss 2.9221 (2.8294)	Entropy 0.63167 (0.63486)	Top-1 acc 56.641 (55.843)	Top-5 acc 80.078 (78.161)	lr 0.01733
Train [45][2700/3239]	Time 0.242 (0.627)	Data Time 0.001 (0.127)	Loss 2.8377 (2.8293)	Entropy 0.63189 (0.63485)	Top-1 acc 55.078 (55.847)	Top-5 acc 78.516 (78.164)	lr 0.01733
Train [45][2710/3239]	Time 0.264 (0.627)	Data Time 0.001 (0.126)	Loss 2.9747 (2.8295)	Entropy 0.63190 (0.63484)	Top-1 acc 50.781 (55.844)	Top-5 acc 76.172 (78.162)	lr 0.01733
Train [45][2720/3239]	Time 0.232 (0.626)	Data Time 0.001 (0.126)	Loss 2.8064 (2.8294)	Entropy 0.63219 (0.63483)	Top-1 acc 57.031 (55.847)	Top-5 acc 81.250 (78.164)	lr 0.01733
Train [45][2730/3239]	Time 25.774 (0.634)	Data Time 25.495 (0.135)	Loss 2.8608 (2.8295)	Entropy 0.63197 (0.63482)	Top-1 acc 51.562 (55.840)	Top-5 acc 79.688 (78.167)	lr 0.01733
Train [45][2740/3239]	Time 0.345 (0.634)	Data Time 0.001 (0.134)	Loss 2.9401 (2.8298)	Entropy 0.63172 (0.63481)	Top-1 acc 53.906 (55.833)	Top-5 acc 75.391 (78.160)	lr 0.01733
Train [45][2750/3239]	Time 0.240 (0.633)	Data Time 0.001 (0.134)	Loss 2.6255 (2.8296)	Entropy 0.63185 (0.63480)	Top-1 acc 64.062 (55.840)	Top-5 acc 81.641 (78.163)	lr 0.01733
Train [45][2760/3239]	Time 0.226 (0.632)	Data Time 0.001 (0.133)	Loss 2.7314 (2.8295)	Entropy 0.63170 (0.63479)	Top-1 acc 58.594 (55.841)	Top-5 acc 80.859 (78.165)	lr 0.01733
Train [45][2770/3239]	Time 0.230 (0.641)	Data Time 0.001 (0.143)	Loss 2.7487 (2.8294)	Entropy 0.63189 (0.63478)	Top-1 acc 58.203 (55.848)	Top-5 acc 78.516 (78.167)	lr 0.01733
Train [45][2780/3239]	Time 0.238 (0.641)	Data Time 0.001 (0.143)	Loss 2.8308 (2.8292)	Entropy 0.63204 (0.63477)	Top-1 acc 57.031 (55.854)	Top-5 acc 80.078 (78.169)	lr 0.01733
Train [45][2790/3239]	Time 0.240 (0.640)	Data Time 0.001 (0.142)	Loss 3.0145 (2.8291)	Entropy 0.63204 (0.63476)	Top-1 acc 51.172 (55.853)	Top-5 acc 73.438 (78.171)	lr 0.01733
Train [45][2800/3239]	Time 0.237 (0.649)	Data Time 0.001 (0.152)	Loss 2.7684 (2.8292)	Entropy 0.63202 (0.63475)	Top-1 acc 58.203 (55.856)	Top-5 acc 77.734 (78.170)	lr 0.01732
Train [45][2810/3239]	Time 0.231 (0.648)	Data Time 0.001 (0.151)	Loss 2.9912 (2.8293)	Entropy 0.63220 (0.63474)	Top-1 acc 54.688 (55.856)	Top-5 acc 76.172 (78.171)	lr 0.01732
Train [45][2820/3239]	Time 0.335 (0.660)	Data Time 0.006 (0.151)	Loss 2.8346 (2.8296)	Entropy 0.63214 (0.63473)	Top-1 acc 58.594 (55.850)	Top-5 acc 77.734 (78.163)	lr 0.01732
Train [45][2830/3239]	Time 0.341 (0.659)	Data Time 0.002 (0.150)	Loss 2.8778 (2.8296)	Entropy 0.63207 (0.63472)	Top-1 acc 53.906 (55.848)	Top-5 acc 76.562 (78.161)	lr 0.01732
Train [45][2840/3239]	Time 0.284 (0.659)	Data Time 0.002 (0.150)	Loss 2.8771 (2.8298)	Entropy 0.63212 (0.63471)	Top-1 acc 56.641 (55.843)	Top-5 acc 79.297 (78.158)	lr 0.01732
Train [45][2850/3239]	Time 0.265 (0.658)	Data Time 0.001 (0.149)	Loss 2.7295 (2.8298)	Entropy 0.63209 (0.63470)	Top-1 acc 56.641 (55.840)	Top-5 acc 79.688 (78.160)	lr 0.01732
Train [45][2860/3239]	Time 0.273 (0.657)	Data Time 0.001 (0.149)	Loss 2.9097 (2.8297)	Entropy 0.63232 (0.63469)	Top-1 acc 57.422 (55.846)	Top-5 acc 75.781 (78.161)	lr 0.01732
Train [45][2870/3239]	Time 0.269 (0.656)	Data Time 0.002 (0.148)	Loss 2.9962 (2.8296)	Entropy 0.63270 (0.63468)	Top-1 acc 53.516 (55.847)	Top-5 acc 74.609 (78.164)	lr 0.01732
Train [45][2880/3239]	Time 0.279 (0.656)	Data Time 0.001 (0.148)	Loss 2.8355 (2.8295)	Entropy 0.63277 (0.63468)	Top-1 acc 57.812 (55.851)	Top-5 acc 77.344 (78.164)	lr 0.01732
Train [45][2890/3239]	Time 0.247 (0.655)	Data Time 0.001 (0.147)	Loss 2.7766 (2.8294)	Entropy 0.63294 (0.63467)	Top-1 acc 58.984 (55.856)	Top-5 acc 77.734 (78.166)	lr 0.01732
Train [45][2900/3239]	Time 0.345 (0.654)	Data Time 0.001 (0.147)	Loss 2.7918 (2.8292)	Entropy 0.63292 (0.63466)	Top-1 acc 55.469 (55.857)	Top-5 acc 79.297 (78.169)	lr 0.01732
Train [45][2910/3239]	Time 0.251 (0.655)	Data Time 0.001 (0.147)	Loss 2.8178 (2.8293)	Entropy 0.63276 (0.63466)	Top-1 acc 57.031 (55.860)	Top-5 acc 76.172 (78.168)	lr 0.01731
Train [45][2920/3239]	Time 0.258 (0.656)	Data Time 0.001 (0.149)	Loss 2.6442 (2.8292)	Entropy 0.63300 (0.63465)	Top-1 acc 58.594 (55.862)	Top-5 acc 80.859 (78.169)	lr 0.01731
Train [45][2930/3239]	Time 0.543 (0.656)	Data Time 0.294 (0.149)	Loss 2.8494 (2.8291)	Entropy 0.63270 (0.63465)	Top-1 acc 56.641 (55.865)	Top-5 acc 76.953 (78.170)	lr 0.01731
Train [45][2940/3239]	Time 0.238 (0.659)	Data Time 0.001 (0.152)	Loss 2.9596 (2.8291)	Entropy 0.63288 (0.63464)	Top-1 acc 54.688 (55.865)	Top-5 acc 76.562 (78.169)	lr 0.01731
Train [45][2950/3239]	Time 2.100 (0.659)	Data Time 1.866 (0.152)	Loss 2.8657 (2.8290)	Entropy 0.63259 (0.63463)	Top-1 acc 52.344 (55.866)	Top-5 acc 77.734 (78.171)	lr 0.01731
Train [45][2960/3239]	Time 0.311 (0.658)	Data Time 0.071 (0.152)	Loss 2.7802 (2.8289)	Entropy 0.63250 (0.63463)	Top-1 acc 57.422 (55.866)	Top-5 acc 78.516 (78.175)	lr 0.01731
Train [45][2970/3239]	Time 0.237 (0.662)	Data Time 0.001 (0.155)	Loss 2.6591 (2.8289)	Entropy 0.63227 (0.63462)	Top-1 acc 60.547 (55.869)	Top-5 acc 81.641 (78.179)	lr 0.01731
Train [45][2980/3239]	Time 0.239 (0.661)	Data Time 0.001 (0.156)	Loss 2.8041 (2.8288)	Entropy 0.63224 (0.63461)	Top-1 acc 58.594 (55.870)	Top-5 acc 78.906 (78.180)	lr 0.01731
Train [45][2990/3239]	Time 0.237 (0.662)	Data Time 0.002 (0.157)	Loss 3.0317 (2.8288)	Entropy 0.63218 (0.63460)	Top-1 acc 51.172 (55.867)	Top-5 acc 75.000 (78.180)	lr 0.01731
Train [45][3000/3239]	Time 2.069 (0.665)	Data Time 1.799 (0.159)	Loss 2.8278 (2.8289)	Entropy 0.63240 (0.63459)	Top-1 acc 58.203 (55.869)	Top-5 acc 76.562 (78.179)	lr 0.01731
Train [45][3010/3239]	Time 0.224 (0.665)	Data Time 0.001 (0.160)	Loss 2.7452 (2.8288)	Entropy 0.63250 (0.63459)	Top-1 acc 57.812 (55.866)	Top-5 acc 79.688 (78.182)	lr 0.01730
Train [45][3020/3239]	Time 0.233 (0.666)	Data Time 0.001 (0.161)	Loss 2.9839 (2.8289)	Entropy 0.63240 (0.63458)	Top-1 acc 54.688 (55.862)	Top-5 acc 76.562 (78.183)	lr 0.01730
Train [45][3030/3239]	Time 0.250 (0.668)	Data Time 0.002 (0.164)	Loss 3.0268 (2.8291)	Entropy 0.63256 (0.63457)	Top-1 acc 51.562 (55.857)	Top-5 acc 74.609 (78.181)	lr 0.01730
Train [45][3040/3239]	Time 0.238 (0.669)	Data Time 0.001 (0.164)	Loss 2.7536 (2.8292)	Entropy 0.63244 (0.63457)	Top-1 acc 57.422 (55.857)	Top-5 acc 77.734 (78.179)	lr 0.01730
Train [45][3050/3239]	Time 0.250 (0.670)	Data Time 0.001 (0.166)	Loss 2.7827 (2.8293)	Entropy 0.63236 (0.63456)	Top-1 acc 57.031 (55.852)	Top-5 acc 76.953 (78.176)	lr 0.01730
Train [45][3060/3239]	Time 0.372 (0.671)	Data Time 0.001 (0.167)	Loss 2.8561 (2.8293)	Entropy 0.63228 (0.63455)	Top-1 acc 56.641 (55.852)	Top-5 acc 77.344 (78.175)	lr 0.01730
Train [45][3070/3239]	Time 2.927 (0.672)	Data Time 2.686 (0.169)	Loss 2.8789 (2.8293)	Entropy 0.63229 (0.63454)	Top-1 acc 52.734 (55.851)	Top-5 acc 76.172 (78.174)	lr 0.01730
Train [45][3080/3239]	Time 2.004 (0.673)	Data Time 1.720 (0.169)	Loss 2.8313 (2.8292)	Entropy 0.63217 (0.63454)	Top-1 acc 57.031 (55.853)	Top-5 acc 76.172 (78.178)	lr 0.01730
Train [45][3090/3239]	Time 1.329 (0.673)	Data Time 1.094 (0.170)	Loss 2.9895 (2.8294)	Entropy 0.63231 (0.63453)	Top-1 acc 50.391 (55.851)	Top-5 acc 73.828 (78.173)	lr 0.01730
Train [45][3100/3239]	Time 0.237 (0.675)	Data Time 0.001 (0.173)	Loss 2.7986 (2.8291)	Entropy 0.63227 (0.63452)	Top-1 acc 54.688 (55.858)	Top-5 acc 79.297 (78.181)	lr 0.01730
Train [45][3110/3239]	Time 0.916 (0.675)	Data Time 0.682 (0.172)	Loss 2.8071 (2.8292)	Entropy 0.63255 (0.63452)	Top-1 acc 56.641 (55.856)	Top-5 acc 78.906 (78.177)	lr 0.01730
Train [45][3120/3239]	Time 0.249 (0.674)	Data Time 0.001 (0.172)	Loss 2.8315 (2.8292)	Entropy 0.63266 (0.63451)	Top-1 acc 52.734 (55.854)	Top-5 acc 78.516 (78.177)	lr 0.01729
Train [45][3130/3239]	Time 0.361 (0.679)	Data Time 0.001 (0.177)	Loss 2.7718 (2.8291)	Entropy 0.63252 (0.63450)	Top-1 acc 57.031 (55.852)	Top-5 acc 78.906 (78.178)	lr 0.01729
Train [45][3140/3239]	Time 0.259 (0.679)	Data Time 0.001 (0.177)	Loss 2.8666 (2.8291)	Entropy 0.63248 (0.63450)	Top-1 acc 56.250 (55.853)	Top-5 acc 78.906 (78.177)	lr 0.01729
Train [45][3150/3239]	Time 0.232 (0.678)	Data Time 0.001 (0.177)	Loss 2.8112 (2.8291)	Entropy 0.63240 (0.63449)	Top-1 acc 55.078 (55.853)	Top-5 acc 76.953 (78.177)	lr 0.01729
Train [45][3160/3239]	Time 0.241 (0.681)	Data Time 0.001 (0.180)	Loss 3.2070 (2.8292)	Entropy 0.63235 (0.63448)	Top-1 acc 46.484 (55.850)	Top-5 acc 70.312 (78.175)	lr 0.01729
Train [45][3170/3239]	Time 0.234 (0.682)	Data Time 0.001 (0.180)	Loss 2.5610 (2.8291)	Entropy 0.63252 (0.63448)	Top-1 acc 64.453 (55.850)	Top-5 acc 81.250 (78.173)	lr 0.01729
Train [45][3180/3239]	Time 0.226 (0.681)	Data Time 0.000 (0.180)	Loss 2.7872 (2.8293)	Entropy 0.63265 (0.63447)	Top-1 acc 58.203 (55.848)	Top-5 acc 78.125 (78.172)	lr 0.01729
Train [45][3190/3239]	Time 0.229 (0.683)	Data Time 0.000 (0.183)	Loss 2.7698 (2.8293)	Entropy 0.63293 (0.63447)	Top-1 acc 59.766 (55.848)	Top-5 acc 78.125 (78.170)	lr 0.01729
Train [45][3200/3239]	Time 0.331 (0.684)	Data Time 0.000 (0.184)	Loss 2.8135 (2.8294)	Entropy 0.63270 (0.63446)	Top-1 acc 58.203 (55.844)	Top-5 acc 78.516 (78.165)	lr 0.01729
Train [45][3210/3239]	Time 0.248 (0.684)	Data Time 0.000 (0.184)	Loss 2.8680 (2.8292)	Entropy 0.63284 (0.63446)	Top-1 acc 55.078 (55.854)	Top-5 acc 78.906 (78.170)	lr 0.01729
Train [45][3220/3239]	Time 0.339 (0.685)	Data Time 0.000 (0.185)	Loss 2.7582 (2.8293)	Entropy 0.63279 (0.63445)	Top-1 acc 54.688 (55.849)	Top-5 acc 82.422 (78.166)	lr 0.01729
Train [45][3230/3239]	Time 0.236 (0.685)	Data Time 0.000 (0.186)	Loss 2.9426 (2.8293)	Entropy 0.63311 (0.63445)	Top-1 acc 55.859 (55.846)	Top-5 acc 75.781 (78.166)	lr 0.01728
Train [45][3239/3239]	Time 0.843 (0.685)	Data Time 0.000 (0.185)	Loss 3.1683 (2.8294)	Entropy 0.63347 (0.63444)	Top-1 acc 55.556 (55.846)	Top-5 acc 69.136 (78.162)	lr 0.01728
==========Valid [45/120]	loss 1.545	top-1 acc 64.561 (64.561)	top-5 acc 85.362	Train top-1 55.846	top-5 78.162	Entropy 0.63347	Latency-None: 0.000ms	Flops: 539.76M
Train [46][0/3239]	Time 45.050 (45.050)	Data Time 43.837 (43.837)	Loss 2.9523 (2.9523)	Entropy 0.63345 (0.63345)	Top-1 acc 54.297 (54.297)	Top-5 acc 75.781 (75.781)	lr 0.01728
Train [46][10/3239]	Time 0.242 (4.759)	Data Time 0.001 (4.205)	Loss 2.8282 (2.8289)	Entropy 0.63348 (0.63344)	Top-1 acc 56.641 (56.179)	Top-5 acc 79.297 (78.303)	lr 0.01728
Train [46][20/3239]	Time 0.261 (2.701)	Data Time 0.001 (2.204)	Loss 2.7305 (2.8092)	Entropy 0.63328 (0.63345)	Top-1 acc 58.594 (56.138)	Top-5 acc 80.469 (78.497)	lr 0.01728
Train [46][30/3239]	Time 0.275 (1.986)	Data Time 0.001 (1.493)	Loss 2.7537 (2.8019)	Entropy 0.63331 (0.63338)	Top-1 acc 60.156 (56.363)	Top-5 acc 79.297 (78.591)	lr 0.01728
Train [46][40/3239]	Time 0.257 (1.653)	Data Time 0.001 (1.162)	Loss 2.9340 (2.8210)	Entropy 0.63318 (0.63334)	Top-1 acc 57.031 (56.098)	Top-5 acc 77.344 (78.306)	lr 0.01728
Train [46][50/3239]	Time 0.251 (1.415)	Data Time 0.001 (0.935)	Loss 2.7238 (2.8195)	Entropy 0.63333 (0.63332)	Top-1 acc 60.547 (56.196)	Top-5 acc 79.297 (78.370)	lr 0.01728
Train [46][60/3239]	Time 0.309 (1.257)	Data Time 0.002 (0.782)	Loss 2.7521 (2.8168)	Entropy 0.63344 (0.63333)	Top-1 acc 56.641 (56.224)	Top-5 acc 77.344 (78.388)	lr 0.01728
Train [46][70/3239]	Time 0.250 (1.172)	Data Time 0.001 (0.700)	Loss 2.8842 (2.8144)	Entropy 0.63350 (0.63335)	Top-1 acc 57.031 (56.344)	Top-5 acc 76.562 (78.318)	lr 0.01728
Train [46][80/3239]	Time 0.243 (1.082)	Data Time 0.001 (0.614)	Loss 2.9466 (2.8145)	Entropy 0.63323 (0.63335)	Top-1 acc 55.078 (56.443)	Top-5 acc 76.172 (78.371)	lr 0.01728
Train [46][90/3239]	Time 0.254 (1.011)	Data Time 0.001 (0.547)	Loss 2.8540 (2.8149)	Entropy 0.63318 (0.63333)	Top-1 acc 54.688 (56.417)	Top-5 acc 80.469 (78.357)	lr 0.01728
Train [46][100/3239]	Time 0.232 (1.020)	Data Time 0.001 (0.552)	Loss 2.8126 (2.8188)	Entropy 0.63317 (0.63331)	Top-1 acc 57.422 (56.300)	Top-5 acc 77.344 (78.226)	lr 0.01727
Train [46][110/3239]	Time 0.246 (0.968)	Data Time 0.001 (0.502)	Loss 2.6149 (2.8086)	Entropy 0.63320 (0.63330)	Top-1 acc 63.672 (56.641)	Top-5 acc 80.859 (78.421)	lr 0.01727
Train [46][120/3239]	Time 0.373 (0.926)	Data Time 0.001 (0.461)	Loss 2.7369 (2.8111)	Entropy 0.63309 (0.63329)	Top-1 acc 59.375 (56.605)	Top-5 acc 78.906 (78.361)	lr 0.01727
Train [46][130/3239]	Time 0.242 (0.890)	Data Time 0.001 (0.426)	Loss 2.7839 (2.8109)	Entropy 0.63301 (0.63327)	Top-1 acc 55.469 (56.542)	Top-5 acc 81.641 (78.435)	lr 0.01727
Train [46][140/3239]	Time 0.286 (0.866)	Data Time 0.001 (0.404)	Loss 2.9838 (2.8104)	Entropy 0.63334 (0.63326)	Top-1 acc 50.000 (56.494)	Top-5 acc 74.609 (78.441)	lr 0.01727
Train [46][150/3239]	Time 0.278 (0.842)	Data Time 0.001 (0.378)	Loss 2.8027 (2.8130)	Entropy 0.63351 (0.63327)	Top-1 acc 59.375 (56.436)	Top-5 acc 76.172 (78.391)	lr 0.01727
Train [46][160/3239]	Time 0.281 (0.819)	Data Time 0.001 (0.354)	Loss 2.7870 (2.8161)	Entropy 0.63368 (0.63329)	Top-1 acc 57.031 (56.376)	Top-5 acc 80.469 (78.339)	lr 0.01727
Train [46][170/3239]	Time 0.256 (0.797)	Data Time 0.001 (0.334)	Loss 2.7916 (2.8101)	Entropy 0.63323 (0.63331)	Top-1 acc 59.375 (56.488)	Top-5 acc 80.078 (78.449)	lr 0.01727
Train [46][180/3239]	Time 0.258 (0.779)	Data Time 0.002 (0.315)	Loss 2.8338 (2.8074)	Entropy 0.63346 (0.63331)	Top-1 acc 55.469 (56.552)	Top-5 acc 77.734 (78.490)	lr 0.01727
Train [46][190/3239]	Time 0.471 (0.763)	Data Time 0.001 (0.299)	Loss 2.9786 (2.8098)	Entropy 0.63340 (0.63332)	Top-1 acc 52.344 (56.448)	Top-5 acc 76.953 (78.465)	lr 0.01727
Train [46][200/3239]	Time 0.232 (0.747)	Data Time 0.001 (0.284)	Loss 3.1355 (2.8117)	Entropy 0.63352 (0.63332)	Top-1 acc 48.828 (56.452)	Top-5 acc 75.781 (78.477)	lr 0.01726
Train [46][210/3239]	Time 0.246 (0.731)	Data Time 0.001 (0.271)	Loss 2.6544 (2.8112)	Entropy 0.63387 (0.63334)	Top-1 acc 58.984 (56.461)	Top-5 acc 80.859 (78.497)	lr 0.01726
Train [46][220/3239]	Time 0.259 (0.719)	Data Time 0.002 (0.259)	Loss 2.7712 (2.8119)	Entropy 0.63391 (0.63336)	Top-1 acc 58.594 (56.397)	Top-5 acc 79.688 (78.484)	lr 0.01726
Train [46][230/3239]	Time 0.280 (0.710)	Data Time 0.001 (0.250)	Loss 2.7378 (2.8138)	Entropy 0.63379 (0.63338)	Top-1 acc 59.375 (56.343)	Top-5 acc 80.859 (78.475)	lr 0.01726
Train [46][240/3239]	Time 0.250 (0.862)	Data Time 0.002 (0.240)	Loss 2.7124 (2.8129)	Entropy 0.63383 (0.63340)	Top-1 acc 55.078 (56.354)	Top-5 acc 83.594 (78.512)	lr 0.01726
Train [46][250/3239]	Time 0.253 (0.844)	Data Time 0.002 (0.231)	Loss 2.8317 (2.8124)	Entropy 0.63378 (0.63341)	Top-1 acc 55.859 (56.334)	Top-5 acc 77.734 (78.519)	lr 0.01726
Train [46][260/3239]	Time 0.251 (0.829)	Data Time 0.002 (0.222)	Loss 2.8242 (2.8105)	Entropy 0.63354 (0.63343)	Top-1 acc 55.859 (56.373)	Top-5 acc 76.953 (78.543)	lr 0.01726
Train [46][270/3239]	Time 0.249 (0.814)	Data Time 0.001 (0.214)	Loss 2.8708 (2.8097)	Entropy 0.63326 (0.63342)	Top-1 acc 55.469 (56.351)	Top-5 acc 76.953 (78.579)	lr 0.01726
Train [46][280/3239]	Time 0.370 (0.802)	Data Time 0.001 (0.206)	Loss 2.8545 (2.8096)	Entropy 0.63345 (0.63343)	Top-1 acc 55.859 (56.333)	Top-5 acc 78.516 (78.592)	lr 0.01726
Train [46][290/3239]	Time 0.271 (0.790)	Data Time 0.001 (0.199)	Loss 2.7038 (2.8099)	Entropy 0.63321 (0.63342)	Top-1 acc 58.984 (56.331)	Top-5 acc 80.859 (78.556)	lr 0.01726
Train [46][300/3239]	Time 0.261 (0.779)	Data Time 0.001 (0.193)	Loss 2.6815 (2.8116)	Entropy 0.63283 (0.63341)	Top-1 acc 58.203 (56.281)	Top-5 acc 82.031 (78.529)	lr 0.01726
Train [46][310/3239]	Time 0.301 (0.769)	Data Time 0.001 (0.187)	Loss 2.7892 (2.8110)	Entropy 0.63268 (0.63339)	Top-1 acc 54.297 (56.274)	Top-5 acc 80.469 (78.532)	lr 0.01725
Train [46][320/3239]	Time 0.240 (0.760)	Data Time 0.001 (0.181)	Loss 2.7553 (2.8104)	Entropy 0.63237 (0.63337)	Top-1 acc 56.250 (56.289)	Top-5 acc 81.250 (78.547)	lr 0.01725
Train [46][330/3239]	Time 0.251 (0.751)	Data Time 0.001 (0.175)	Loss 2.8095 (2.8112)	Entropy 0.63250 (0.63334)	Top-1 acc 55.469 (56.258)	Top-5 acc 81.250 (78.532)	lr 0.01725
Train [46][340/3239]	Time 0.289 (0.743)	Data Time 0.002 (0.170)	Loss 2.8081 (2.8103)	Entropy 0.63265 (0.63331)	Top-1 acc 58.984 (56.314)	Top-5 acc 78.516 (78.520)	lr 0.01725
Train [46][350/3239]	Time 0.353 (0.735)	Data Time 0.001 (0.165)	Loss 2.8221 (2.8095)	Entropy 0.63300 (0.63330)	Top-1 acc 56.641 (56.333)	Top-5 acc 78.906 (78.521)	lr 0.01725
Train [46][360/3239]	Time 0.270 (0.727)	Data Time 0.001 (0.161)	Loss 2.9237 (2.8111)	Entropy 0.63322 (0.63329)	Top-1 acc 53.125 (56.274)	Top-5 acc 76.562 (78.499)	lr 0.01725
Train [46][370/3239]	Time 0.290 (0.720)	Data Time 0.002 (0.157)	Loss 2.9120 (2.8122)	Entropy 0.63321 (0.63329)	Top-1 acc 55.469 (56.270)	Top-5 acc 78.516 (78.498)	lr 0.01725
Train [46][380/3239]	Time 0.233 (0.714)	Data Time 0.001 (0.153)	Loss 2.7281 (2.8129)	Entropy 0.63297 (0.63329)	Top-1 acc 53.125 (56.205)	Top-5 acc 81.250 (78.502)	lr 0.01725
Train [46][390/3239]	Time 0.263 (0.707)	Data Time 0.001 (0.149)	Loss 2.9074 (2.8127)	Entropy 0.63308 (0.63328)	Top-1 acc 55.078 (56.195)	Top-5 acc 77.344 (78.503)	lr 0.01725
Train [46][400/3239]	Time 0.248 (0.701)	Data Time 0.002 (0.145)	Loss 2.7216 (2.8119)	Entropy 0.63284 (0.63327)	Top-1 acc 58.594 (56.198)	Top-5 acc 82.422 (78.506)	lr 0.01725
Train [46][410/3239]	Time 0.254 (0.695)	Data Time 0.001 (0.142)	Loss 2.7685 (2.8113)	Entropy 0.63300 (0.63326)	Top-1 acc 55.078 (56.190)	Top-5 acc 81.641 (78.516)	lr 0.01725
Train [46][420/3239]	Time 0.305 (0.689)	Data Time 0.001 (0.138)	Loss 2.7845 (2.8112)	Entropy 0.63254 (0.63325)	Top-1 acc 57.812 (56.192)	Top-5 acc 77.344 (78.499)	lr 0.01724
Train [46][430/3239]	Time 0.244 (0.684)	Data Time 0.001 (0.135)	Loss 2.9201 (2.8128)	Entropy 0.63280 (0.63324)	Top-1 acc 49.219 (56.144)	Top-5 acc 76.953 (78.468)	lr 0.01724
Train [46][440/3239]	Time 0.361 (0.679)	Data Time 0.001 (0.132)	Loss 2.6882 (2.8114)	Entropy 0.63266 (0.63323)	Top-1 acc 57.812 (56.176)	Top-5 acc 79.297 (78.496)	lr 0.01724
Train [46][450/3239]	Time 0.244 (0.673)	Data Time 0.002 (0.129)	Loss 2.9526 (2.8113)	Entropy 0.63286 (0.63322)	Top-1 acc 52.734 (56.183)	Top-5 acc 73.828 (78.512)	lr 0.01724
Train [46][460/3239]	Time 0.246 (0.669)	Data Time 0.001 (0.126)	Loss 2.7361 (2.8108)	Entropy 0.63269 (0.63321)	Top-1 acc 57.422 (56.184)	Top-5 acc 79.297 (78.511)	lr 0.01724
Train [46][470/3239]	Time 0.285 (0.665)	Data Time 0.002 (0.124)	Loss 2.9127 (2.8097)	Entropy 0.63218 (0.63320)	Top-1 acc 53.906 (56.213)	Top-5 acc 75.000 (78.515)	lr 0.01724
Train [46][480/3239]	Time 0.283 (0.661)	Data Time 0.002 (0.121)	Loss 2.7824 (2.8100)	Entropy 0.63171 (0.63317)	Top-1 acc 53.516 (56.202)	Top-5 acc 77.344 (78.511)	lr 0.01724
Train [46][490/3239]	Time 0.280 (0.657)	Data Time 0.001 (0.119)	Loss 2.8330 (2.8103)	Entropy 0.63143 (0.63314)	Top-1 acc 54.688 (56.194)	Top-5 acc 78.906 (78.501)	lr 0.01724
Train [46][500/3239]	Time 0.253 (0.654)	Data Time 0.001 (0.117)	Loss 2.7440 (2.8102)	Entropy 0.63145 (0.63311)	Top-1 acc 55.859 (56.205)	Top-5 acc 77.344 (78.502)	lr 0.01724
Train [46][510/3239]	Time 0.374 (0.653)	Data Time 0.002 (0.117)	Loss 2.8142 (2.8103)	Entropy 0.63163 (0.63307)	Top-1 acc 56.250 (56.202)	Top-5 acc 77.344 (78.506)	lr 0.01724
Train [46][520/3239]	Time 0.256 (0.650)	Data Time 0.001 (0.115)	Loss 2.7840 (2.8102)	Entropy 0.63150 (0.63305)	Top-1 acc 57.031 (56.189)	Top-5 acc 79.297 (78.513)	lr 0.01723
Train [46][530/3239]	Time 0.268 (0.646)	Data Time 0.001 (0.113)	Loss 2.6428 (2.8105)	Entropy 0.63174 (0.63302)	Top-1 acc 61.328 (56.198)	Top-5 acc 83.594 (78.514)	lr 0.01723
Train [46][540/3239]	Time 0.236 (0.646)	Data Time 0.001 (0.115)	Loss 2.8202 (2.8112)	Entropy 0.63195 (0.63300)	Top-1 acc 55.469 (56.187)	Top-5 acc 79.688 (78.513)	lr 0.01723
Train [46][550/3239]	Time 0.302 (0.643)	Data Time 0.002 (0.113)	Loss 2.7524 (2.8114)	Entropy 0.63230 (0.63298)	Top-1 acc 58.984 (56.171)	Top-5 acc 79.297 (78.511)	lr 0.01723
Train [46][560/3239]	Time 0.237 (0.644)	Data Time 0.001 (0.116)	Loss 2.6903 (2.8107)	Entropy 0.63235 (0.63297)	Top-1 acc 57.031 (56.180)	Top-5 acc 80.078 (78.514)	lr 0.01723
Train [46][570/3239]	Time 0.281 (0.643)	Data Time 0.001 (0.115)	Loss 2.6495 (2.8110)	Entropy 0.63223 (0.63296)	Top-1 acc 60.156 (56.173)	Top-5 acc 82.031 (78.501)	lr 0.01723
Train [46][580/3239]	Time 0.277 (0.640)	Data Time 0.003 (0.114)	Loss 3.0679 (2.8120)	Entropy 0.63172 (0.63294)	Top-1 acc 49.219 (56.154)	Top-5 acc 76.953 (78.483)	lr 0.01723
Train [46][590/3239]	Time 0.243 (0.638)	Data Time 0.001 (0.113)	Loss 2.9417 (2.8122)	Entropy 0.63188 (0.63292)	Top-1 acc 54.688 (56.152)	Top-5 acc 76.562 (78.476)	lr 0.01723
Train [46][600/3239]	Time 0.273 (0.636)	Data Time 0.001 (0.112)	Loss 2.8817 (2.8124)	Entropy 0.63206 (0.63291)	Top-1 acc 51.172 (56.143)	Top-5 acc 76.172 (78.464)	lr 0.01723
Train [46][610/3239]	Time 0.266 (0.635)	Data Time 0.001 (0.113)	Loss 2.8123 (2.8122)	Entropy 0.63208 (0.63289)	Top-1 acc 55.078 (56.126)	Top-5 acc 79.297 (78.464)	lr 0.01723
Train [46][620/3239]	Time 0.265 (0.635)	Data Time 0.001 (0.113)	Loss 2.6877 (2.8130)	Entropy 0.63205 (0.63288)	Top-1 acc 60.938 (56.131)	Top-5 acc 80.859 (78.455)	lr 0.01723
Train [46][630/3239]	Time 0.260 (0.632)	Data Time 0.002 (0.112)	Loss 2.7912 (2.8124)	Entropy 0.63203 (0.63287)	Top-1 acc 58.984 (56.170)	Top-5 acc 80.859 (78.475)	lr 0.01722
Train [46][640/3239]	Time 0.270 (0.633)	Data Time 0.001 (0.114)	Loss 2.7688 (2.8125)	Entropy 0.63196 (0.63285)	Top-1 acc 55.469 (56.171)	Top-5 acc 78.125 (78.473)	lr 0.01722
Train [46][650/3239]	Time 0.252 (0.633)	Data Time 0.001 (0.115)	Loss 2.7153 (2.8127)	Entropy 0.63214 (0.63284)	Top-1 acc 57.812 (56.181)	Top-5 acc 81.250 (78.466)	lr 0.01722
Train [46][660/3239]	Time 0.258 (0.630)	Data Time 0.001 (0.113)	Loss 2.8290 (2.8124)	Entropy 0.63200 (0.63283)	Top-1 acc 54.688 (56.194)	Top-5 acc 78.906 (78.471)	lr 0.01722
Train [46][670/3239]	Time 0.377 (0.636)	Data Time 0.001 (0.120)	Loss 2.6774 (2.8119)	Entropy 0.63187 (0.63282)	Top-1 acc 58.984 (56.208)	Top-5 acc 81.250 (78.485)	lr 0.01722
Train [46][680/3239]	Time 0.265 (0.633)	Data Time 0.002 (0.118)	Loss 2.9851 (2.8116)	Entropy 0.63215 (0.63281)	Top-1 acc 53.516 (56.217)	Top-5 acc 75.391 (78.497)	lr 0.01722
Train [46][690/3239]	Time 0.270 (0.631)	Data Time 0.003 (0.116)	Loss 2.6251 (2.8104)	Entropy 0.63206 (0.63280)	Top-1 acc 62.500 (56.246)	Top-5 acc 83.203 (78.517)	lr 0.01722
Train [46][700/3239]	Time 0.282 (0.634)	Data Time 0.001 (0.120)	Loss 2.8696 (2.8099)	Entropy 0.63187 (0.63279)	Top-1 acc 57.422 (56.253)	Top-5 acc 77.734 (78.525)	lr 0.01722
Train [46][710/3239]	Time 0.296 (0.631)	Data Time 0.002 (0.118)	Loss 2.7203 (2.8090)	Entropy 0.63176 (0.63277)	Top-1 acc 62.109 (56.275)	Top-5 acc 78.906 (78.538)	lr 0.01722
Train [46][720/3239]	Time 0.238 (0.628)	Data Time 0.001 (0.117)	Loss 2.6424 (2.8086)	Entropy 0.63168 (0.63276)	Top-1 acc 59.375 (56.279)	Top-5 acc 79.297 (78.543)	lr 0.01722
Train [46][730/3239]	Time 0.308 (0.634)	Data Time 0.001 (0.123)	Loss 3.1358 (2.8092)	Entropy 0.63133 (0.63274)	Top-1 acc 47.656 (56.253)	Top-5 acc 68.359 (78.525)	lr 0.01722
Train [46][740/3239]	Time 0.371 (0.631)	Data Time 0.022 (0.122)	Loss 2.5775 (2.8093)	Entropy 0.63144 (0.63272)	Top-1 acc 60.938 (56.247)	Top-5 acc 83.594 (78.526)	lr 0.01721
Train [46][750/3239]	Time 0.238 (0.630)	Data Time 0.001 (0.121)	Loss 2.6822 (2.8090)	Entropy 0.63116 (0.63270)	Top-1 acc 60.156 (56.244)	Top-5 acc 82.812 (78.539)	lr 0.01721
Train [46][760/3239]	Time 0.253 (0.627)	Data Time 0.001 (0.120)	Loss 2.7667 (2.8093)	Entropy 0.63060 (0.63268)	Top-1 acc 54.688 (56.227)	Top-5 acc 80.469 (78.534)	lr 0.01721
Train [46][770/3239]	Time 0.243 (0.628)	Data Time 0.001 (0.121)	Loss 2.5877 (2.8085)	Entropy 0.63034 (0.63265)	Top-1 acc 63.281 (56.246)	Top-5 acc 83.594 (78.550)	lr 0.01721
Train [46][780/3239]	Time 0.236 (0.630)	Data Time 0.001 (0.124)	Loss 2.9416 (2.8083)	Entropy 0.63053 (0.63263)	Top-1 acc 52.344 (56.253)	Top-5 acc 72.656 (78.545)	lr 0.01721
Train [46][790/3239]	Time 0.245 (0.628)	Data Time 0.001 (0.123)	Loss 2.9204 (2.8089)	Entropy 0.63029 (0.63260)	Top-1 acc 55.469 (56.236)	Top-5 acc 77.734 (78.541)	lr 0.01721
Train [46][800/3239]	Time 0.249 (0.629)	Data Time 0.001 (0.125)	Loss 2.6812 (2.8089)	Entropy 0.63063 (0.63257)	Top-1 acc 60.547 (56.246)	Top-5 acc 83.203 (78.537)	lr 0.01721
Train [46][810/3239]	Time 0.245 (0.630)	Data Time 0.001 (0.126)	Loss 2.6694 (2.8086)	Entropy 0.63116 (0.63255)	Top-1 acc 55.859 (56.249)	Top-5 acc 80.859 (78.543)	lr 0.01721
Train [46][820/3239]	Time 0.247 (0.627)	Data Time 0.002 (0.125)	Loss 2.5914 (2.8096)	Entropy 0.63138 (0.63253)	Top-1 acc 60.547 (56.236)	Top-5 acc 81.250 (78.527)	lr 0.01721
Train [46][830/3239]	Time 0.387 (0.634)	Data Time 0.002 (0.131)	Loss 2.9526 (2.8105)	Entropy 0.63130 (0.63252)	Top-1 acc 53.516 (56.219)	Top-5 acc 76.172 (78.506)	lr 0.01721
Train [46][840/3239]	Time 0.278 (0.632)	Data Time 0.002 (0.130)	Loss 2.6631 (2.8108)	Entropy 0.63172 (0.63251)	Top-1 acc 58.203 (56.216)	Top-5 acc 81.250 (78.493)	lr 0.01721
Train [46][850/3239]	Time 0.238 (0.630)	Data Time 0.001 (0.128)	Loss 2.8170 (2.8109)	Entropy 0.63172 (0.63250)	Top-1 acc 55.859 (56.212)	Top-5 acc 77.734 (78.486)	lr 0.01720
Train [46][860/3239]	Time 0.298 (0.635)	Data Time 0.001 (0.134)	Loss 2.7939 (2.8104)	Entropy 0.63177 (0.63249)	Top-1 acc 59.766 (56.224)	Top-5 acc 76.953 (78.491)	lr 0.01720
Train [46][870/3239]	Time 0.259 (0.632)	Data Time 0.001 (0.132)	Loss 2.7542 (2.8102)	Entropy 0.63141 (0.63248)	Top-1 acc 58.594 (56.220)	Top-5 acc 78.516 (78.488)	lr 0.01720
Train [46][880/3239]	Time 0.247 (0.630)	Data Time 0.001 (0.131)	Loss 2.6268 (2.8101)	Entropy 0.63175 (0.63247)	Top-1 acc 61.328 (56.214)	Top-5 acc 84.375 (78.504)	lr 0.01720
Train [46][890/3239]	Time 0.320 (0.678)	Data Time 0.004 (0.140)	Loss 2.9398 (2.8098)	Entropy 0.63173 (0.63246)	Top-1 acc 56.641 (56.217)	Top-5 acc 74.609 (78.498)	lr 0.01720
Train [46][900/3239]	Time 0.253 (0.675)	Data Time 0.002 (0.139)	Loss 2.6450 (2.8094)	Entropy 0.63202 (0.63245)	Top-1 acc 56.641 (56.220)	Top-5 acc 83.594 (78.507)	lr 0.01720
Train [46][910/3239]	Time 0.244 (0.672)	Data Time 0.001 (0.137)	Loss 2.7815 (2.8091)	Entropy 0.63215 (0.63245)	Top-1 acc 57.031 (56.223)	Top-5 acc 80.078 (78.508)	lr 0.01720
Train [46][920/3239]	Time 0.251 (0.670)	Data Time 0.002 (0.136)	Loss 2.7681 (2.8094)	Entropy 0.63234 (0.63244)	Top-1 acc 57.031 (56.223)	Top-5 acc 78.125 (78.502)	lr 0.01720
Train [46][930/3239]	Time 0.233 (0.667)	Data Time 0.002 (0.134)	Loss 2.5765 (2.8096)	Entropy 0.63257 (0.63244)	Top-1 acc 57.031 (56.206)	Top-5 acc 83.984 (78.498)	lr 0.01720
Train [46][940/3239]	Time 0.264 (0.665)	Data Time 0.001 (0.133)	Loss 2.7695 (2.8092)	Entropy 0.63246 (0.63244)	Top-1 acc 55.469 (56.218)	Top-5 acc 75.391 (78.503)	lr 0.01720
Train [46][950/3239]	Time 0.246 (0.663)	Data Time 0.001 (0.132)	Loss 2.9031 (2.8097)	Entropy 0.63282 (0.63245)	Top-1 acc 57.031 (56.208)	Top-5 acc 77.734 (78.493)	lr 0.01719
Train [46][960/3239]	Time 0.247 (0.660)	Data Time 0.001 (0.130)	Loss 2.7164 (2.8095)	Entropy 0.63266 (0.63245)	Top-1 acc 58.594 (56.209)	Top-5 acc 81.641 (78.491)	lr 0.01719
Train [46][970/3239]	Time 0.250 (0.658)	Data Time 0.002 (0.129)	Loss 2.9648 (2.8096)	Entropy 0.63257 (0.63245)	Top-1 acc 53.125 (56.214)	Top-5 acc 76.172 (78.492)	lr 0.01719
Train [46][980/3239]	Time 0.248 (0.656)	Data Time 0.001 (0.128)	Loss 2.7288 (2.8098)	Entropy 0.63262 (0.63245)	Top-1 acc 57.422 (56.219)	Top-5 acc 78.906 (78.492)	lr 0.01719
Train [46][990/3239]	Time 0.339 (0.656)	Data Time 0.001 (0.129)	Loss 2.7405 (2.8093)	Entropy 0.63286 (0.63246)	Top-1 acc 60.547 (56.229)	Top-5 acc 80.078 (78.497)	lr 0.01719
Train [46][1000/3239]	Time 0.245 (0.656)	Data Time 0.001 (0.129)	Loss 2.9331 (2.8088)	Entropy 0.63281 (0.63246)	Top-1 acc 53.125 (56.243)	Top-5 acc 75.781 (78.502)	lr 0.01719
Train [46][1010/3239]	Time 0.265 (0.656)	Data Time 0.002 (0.130)	Loss 2.6082 (2.8085)	Entropy 0.63276 (0.63246)	Top-1 acc 62.891 (56.244)	Top-5 acc 82.031 (78.508)	lr 0.01719
Train [46][1020/3239]	Time 0.251 (0.656)	Data Time 0.001 (0.131)	Loss 2.7200 (2.8086)	Entropy 0.63263 (0.63246)	Top-1 acc 61.328 (56.238)	Top-5 acc 80.469 (78.506)	lr 0.01719
Train [46][1030/3239]	Time 0.257 (0.655)	Data Time 0.001 (0.131)	Loss 2.7635 (2.8090)	Entropy 0.63255 (0.63247)	Top-1 acc 57.422 (56.233)	Top-5 acc 78.906 (78.495)	lr 0.01719
Train [46][1040/3239]	Time 0.253 (0.657)	Data Time 0.001 (0.134)	Loss 2.8912 (2.8093)	Entropy 0.63228 (0.63247)	Top-1 acc 53.906 (56.227)	Top-5 acc 78.125 (78.492)	lr 0.01719
Train [46][1050/3239]	Time 2.349 (0.657)	Data Time 2.058 (0.135)	Loss 2.6315 (2.8085)	Entropy 0.63207 (0.63246)	Top-1 acc 60.547 (56.240)	Top-5 acc 82.422 (78.517)	lr 0.01719
Train [46][1060/3239]	Time 0.366 (0.655)	Data Time 0.002 (0.133)	Loss 2.7225 (2.8088)	Entropy 0.63201 (0.63246)	Top-1 acc 60.156 (56.242)	Top-5 acc 78.906 (78.512)	lr 0.01718
Train [46][1070/3239]	Time 0.242 (0.660)	Data Time 0.001 (0.139)	Loss 2.6149 (2.8086)	Entropy 0.63219 (0.63246)	Top-1 acc 63.281 (56.253)	Top-5 acc 80.469 (78.514)	lr 0.01718
Train [46][1080/3239]	Time 0.277 (0.658)	Data Time 0.002 (0.138)	Loss 2.5525 (2.8084)	Entropy 0.63231 (0.63245)	Top-1 acc 60.547 (56.254)	Top-5 acc 82.031 (78.508)	lr 0.01718
Train [46][1090/3239]	Time 0.256 (0.657)	Data Time 0.001 (0.137)	Loss 2.6213 (2.8086)	Entropy 0.63239 (0.63245)	Top-1 acc 56.250 (56.250)	Top-5 acc 80.078 (78.508)	lr 0.01718
Train [46][1100/3239]	Time 0.256 (0.664)	Data Time 0.001 (0.145)	Loss 2.8780 (2.8088)	Entropy 0.63253 (0.63245)	Top-1 acc 54.297 (56.235)	Top-5 acc 77.734 (78.507)	lr 0.01718
Train [46][1110/3239]	Time 0.299 (0.662)	Data Time 0.002 (0.143)	Loss 2.9084 (2.8086)	Entropy 0.63281 (0.63245)	Top-1 acc 55.469 (56.239)	Top-5 acc 75.781 (78.519)	lr 0.01718
Train [46][1120/3239]	Time 0.242 (0.661)	Data Time 0.001 (0.142)	Loss 2.7093 (2.8080)	Entropy 0.63244 (0.63246)	Top-1 acc 60.547 (56.265)	Top-5 acc 78.906 (78.530)	lr 0.01718
Train [46][1130/3239]	Time 0.264 (0.661)	Data Time 0.002 (0.143)	Loss 2.8854 (2.8082)	Entropy 0.63237 (0.63246)	Top-1 acc 51.172 (56.263)	Top-5 acc 78.125 (78.527)	lr 0.01718
Train [46][1140/3239]	Time 0.245 (0.666)	Data Time 0.001 (0.149)	Loss 2.7654 (2.8082)	Entropy 0.63243 (0.63246)	Top-1 acc 60.938 (56.277)	Top-5 acc 78.906 (78.531)	lr 0.01718
Train [46][1150/3239]	Time 0.346 (0.665)	Data Time 0.001 (0.148)	Loss 2.9668 (2.8084)	Entropy 0.63247 (0.63246)	Top-1 acc 50.781 (56.273)	Top-5 acc 75.781 (78.524)	lr 0.01718
Train [46][1160/3239]	Time 0.230 (0.663)	Data Time 0.001 (0.147)	Loss 2.7154 (2.8082)	Entropy 0.63237 (0.63246)	Top-1 acc 58.984 (56.275)	Top-5 acc 82.422 (78.531)	lr 0.01718
Train [46][1170/3239]	Time 0.268 (0.670)	Data Time 0.001 (0.155)	Loss 2.9035 (2.8086)	Entropy 0.63218 (0.63246)	Top-1 acc 53.516 (56.266)	Top-5 acc 74.609 (78.517)	lr 0.01717
Train [46][1180/3239]	Time 0.261 (0.668)	Data Time 0.001 (0.153)	Loss 2.7652 (2.8084)	Entropy 0.63201 (0.63245)	Top-1 acc 55.469 (56.269)	Top-5 acc 78.906 (78.519)	lr 0.01717
Train [46][1190/3239]	Time 0.268 (0.667)	Data Time 0.001 (0.152)	Loss 2.8035 (2.8085)	Entropy 0.63217 (0.63245)	Top-1 acc 58.984 (56.264)	Top-5 acc 77.344 (78.513)	lr 0.01717
Train [46][1200/3239]	Time 0.243 (0.672)	Data Time 0.001 (0.158)	Loss 2.9889 (2.8090)	Entropy 0.63197 (0.63245)	Top-1 acc 52.734 (56.256)	Top-5 acc 76.562 (78.511)	lr 0.01717
Train [46][1210/3239]	Time 0.243 (0.670)	Data Time 0.001 (0.157)	Loss 2.7098 (2.8086)	Entropy 0.63176 (0.63244)	Top-1 acc 55.859 (56.262)	Top-5 acc 78.906 (78.523)	lr 0.01717
Train [46][1220/3239]	Time 0.351 (0.668)	Data Time 0.001 (0.155)	Loss 2.7564 (2.8082)	Entropy 0.63204 (0.63244)	Top-1 acc 59.766 (56.272)	Top-5 acc 80.469 (78.531)	lr 0.01717
Train [46][1230/3239]	Time 0.256 (0.675)	Data Time 0.001 (0.163)	Loss 2.6706 (2.8079)	Entropy 0.63221 (0.63244)	Top-1 acc 58.594 (56.283)	Top-5 acc 82.422 (78.539)	lr 0.01717
Train [46][1240/3239]	Time 0.244 (0.673)	Data Time 0.001 (0.162)	Loss 2.7433 (2.8079)	Entropy 0.63219 (0.63243)	Top-1 acc 60.156 (56.284)	Top-5 acc 79.297 (78.540)	lr 0.01717
Train [46][1250/3239]	Time 0.239 (0.672)	Data Time 0.001 (0.160)	Loss 2.9802 (2.8078)	Entropy 0.63182 (0.63243)	Top-1 acc 54.297 (56.273)	Top-5 acc 74.609 (78.537)	lr 0.01717
Train [46][1260/3239]	Time 0.260 (0.674)	Data Time 0.001 (0.163)	Loss 2.8623 (2.8078)	Entropy 0.63180 (0.63243)	Top-1 acc 54.297 (56.266)	Top-5 acc 76.562 (78.540)	lr 0.01717
Train [46][1270/3239]	Time 0.244 (0.678)	Data Time 0.001 (0.168)	Loss 2.8583 (2.8076)	Entropy 0.63165 (0.63242)	Top-1 acc 56.641 (56.275)	Top-5 acc 77.344 (78.543)	lr 0.01716
Train [46][1280/3239]	Time 0.244 (0.676)	Data Time 0.001 (0.167)	Loss 2.9813 (2.8082)	Entropy 0.63111 (0.63241)	Top-1 acc 52.734 (56.255)	Top-5 acc 75.000 (78.528)	lr 0.01716
Train [46][1290/3239]	Time 0.271 (0.674)	Data Time 0.001 (0.165)	Loss 2.9457 (2.8088)	Entropy 0.63105 (0.63240)	Top-1 acc 51.953 (56.249)	Top-5 acc 77.344 (78.523)	lr 0.01716
Train [46][1300/3239]	Time 0.267 (0.680)	Data Time 0.001 (0.172)	Loss 2.9165 (2.8093)	Entropy 0.63098 (0.63239)	Top-1 acc 53.516 (56.242)	Top-5 acc 79.688 (78.518)	lr 0.01716
Train [46][1310/3239]	Time 0.271 (0.678)	Data Time 0.001 (0.170)	Loss 2.8947 (2.8093)	Entropy 0.63083 (0.63238)	Top-1 acc 53.906 (56.246)	Top-5 acc 79.297 (78.525)	lr 0.01716
Train [46][1320/3239]	Time 0.231 (0.677)	Data Time 0.001 (0.169)	Loss 2.9508 (2.8095)	Entropy 0.63086 (0.63237)	Top-1 acc 51.562 (56.237)	Top-5 acc 78.516 (78.520)	lr 0.01716
Train [46][1330/3239]	Time 0.245 (0.683)	Data Time 0.002 (0.176)	Loss 2.9716 (2.8103)	Entropy 0.63111 (0.63236)	Top-1 acc 54.688 (56.222)	Top-5 acc 73.438 (78.509)	lr 0.01716
Train [46][1340/3239]	Time 0.245 (0.681)	Data Time 0.002 (0.174)	Loss 2.9056 (2.8102)	Entropy 0.63116 (0.63235)	Top-1 acc 52.344 (56.226)	Top-5 acc 76.172 (78.510)	lr 0.01716
Train [46][1350/3239]	Time 0.250 (0.679)	Data Time 0.001 (0.173)	Loss 2.6851 (2.8104)	Entropy 0.63131 (0.63234)	Top-1 acc 60.156 (56.226)	Top-5 acc 77.344 (78.497)	lr 0.01716
Train [46][1360/3239]	Time 0.245 (0.684)	Data Time 0.001 (0.178)	Loss 2.9327 (2.8100)	Entropy 0.63137 (0.63233)	Top-1 acc 53.906 (56.243)	Top-5 acc 75.391 (78.505)	lr 0.01716
Train [46][1370/3239]	Time 0.278 (0.682)	Data Time 0.002 (0.176)	Loss 3.0238 (2.8104)	Entropy 0.63136 (0.63232)	Top-1 acc 51.562 (56.232)	Top-5 acc 74.219 (78.497)	lr 0.01716
Train [46][1380/3239]	Time 0.352 (0.680)	Data Time 0.002 (0.175)	Loss 2.8388 (2.8100)	Entropy 0.63106 (0.63232)	Top-1 acc 56.641 (56.244)	Top-5 acc 77.734 (78.503)	lr 0.01715
Train [46][1390/3239]	Time 0.244 (0.687)	Data Time 0.002 (0.183)	Loss 2.9048 (2.8101)	Entropy 0.63130 (0.63231)	Top-1 acc 54.688 (56.239)	Top-5 acc 75.391 (78.500)	lr 0.01715
Train [46][1400/3239]	Time 0.251 (0.686)	Data Time 0.001 (0.182)	Loss 2.6321 (2.8097)	Entropy 0.63094 (0.63230)	Top-1 acc 58.594 (56.256)	Top-5 acc 81.641 (78.505)	lr 0.01715
Train [46][1410/3239]	Time 0.255 (0.684)	Data Time 0.001 (0.180)	Loss 2.7303 (2.8097)	Entropy 0.63123 (0.63229)	Top-1 acc 62.109 (56.256)	Top-5 acc 78.125 (78.509)	lr 0.01715
Train [46][1420/3239]	Time 0.246 (0.685)	Data Time 0.001 (0.182)	Loss 2.7191 (2.8096)	Entropy 0.63092 (0.63228)	Top-1 acc 58.203 (56.254)	Top-5 acc 81.641 (78.510)	lr 0.01715
Train [46][1430/3239]	Time 0.244 (0.688)	Data Time 0.001 (0.185)	Loss 2.9445 (2.8096)	Entropy 0.63110 (0.63227)	Top-1 acc 51.172 (56.257)	Top-5 acc 75.781 (78.515)	lr 0.01715
Train [46][1440/3239]	Time 0.228 (0.686)	Data Time 0.001 (0.184)	Loss 2.7993 (2.8100)	Entropy 0.63090 (0.63227)	Top-1 acc 56.641 (56.253)	Top-5 acc 78.516 (78.510)	lr 0.01715
Train [46][1450/3239]	Time 0.329 (0.684)	Data Time 0.001 (0.183)	Loss 2.8452 (2.8099)	Entropy 0.63084 (0.63226)	Top-1 acc 56.250 (56.260)	Top-5 acc 77.344 (78.510)	lr 0.01715
Train [46][1460/3239]	Time 0.236 (0.692)	Data Time 0.001 (0.192)	Loss 2.7476 (2.8102)	Entropy 0.63082 (0.63225)	Top-1 acc 59.766 (56.258)	Top-5 acc 77.734 (78.503)	lr 0.01715
Train [46][1470/3239]	Time 0.258 (0.691)	Data Time 0.001 (0.190)	Loss 2.5872 (2.8099)	Entropy 0.63100 (0.63224)	Top-1 acc 62.109 (56.271)	Top-5 acc 80.469 (78.507)	lr 0.01715
Train [46][1480/3239]	Time 0.251 (0.689)	Data Time 0.001 (0.189)	Loss 2.8700 (2.8100)	Entropy 0.63087 (0.63223)	Top-1 acc 52.344 (56.266)	Top-5 acc 76.562 (78.502)	lr 0.01715
Train [46][1490/3239]	Time 0.278 (0.694)	Data Time 0.001 (0.194)	Loss 2.6303 (2.8100)	Entropy 0.63097 (0.63222)	Top-1 acc 59.375 (56.266)	Top-5 acc 81.250 (78.499)	lr 0.01714
Train [46][1500/3239]	Time 0.239 (0.692)	Data Time 0.001 (0.193)	Loss 2.5593 (2.8101)	Entropy 0.63078 (0.63221)	Top-1 acc 63.281 (56.267)	Top-5 acc 83.984 (78.499)	lr 0.01714
Train [46][1510/3239]	Time 0.237 (0.691)	Data Time 0.001 (0.192)	Loss 2.7431 (2.8101)	Entropy 0.63107 (0.63220)	Top-1 acc 57.812 (56.268)	Top-5 acc 79.688 (78.500)	lr 0.01714
Train [46][1520/3239]	Time 0.271 (0.696)	Data Time 0.002 (0.198)	Loss 2.7730 (2.8103)	Entropy 0.63109 (0.63219)	Top-1 acc 57.422 (56.263)	Top-5 acc 77.734 (78.498)	lr 0.01714
Train [46][1530/3239]	Time 0.235 (0.694)	Data Time 0.001 (0.196)	Loss 2.6244 (2.8102)	Entropy 0.63119 (0.63219)	Top-1 acc 59.375 (56.262)	Top-5 acc 84.766 (78.498)	lr 0.01714
Train [46][1540/3239]	Time 0.373 (0.693)	Data Time 0.001 (0.195)	Loss 2.8634 (2.8103)	Entropy 0.63147 (0.63218)	Top-1 acc 55.078 (56.260)	Top-5 acc 78.516 (78.501)	lr 0.01714
Train [46][1550/3239]	Time 0.373 (0.713)	Data Time 0.004 (0.194)	Loss 2.8955 (2.8103)	Entropy 0.63185 (0.63218)	Top-1 acc 55.469 (56.263)	Top-5 acc 76.953 (78.504)	lr 0.01714
Train [46][1560/3239]	Time 0.247 (0.711)	Data Time 0.002 (0.193)	Loss 2.7235 (2.8106)	Entropy 0.63209 (0.63218)	Top-1 acc 61.328 (56.257)	Top-5 acc 78.125 (78.496)	lr 0.01714
Train [46][1570/3239]	Time 0.251 (0.709)	Data Time 0.002 (0.191)	Loss 2.8311 (2.8109)	Entropy 0.63237 (0.63218)	Top-1 acc 57.812 (56.253)	Top-5 acc 79.297 (78.492)	lr 0.01714
Train [46][1580/3239]	Time 0.251 (0.708)	Data Time 0.001 (0.190)	Loss 2.8115 (2.8108)	Entropy 0.63199 (0.63218)	Top-1 acc 61.719 (56.260)	Top-5 acc 81.250 (78.494)	lr 0.01714
Train [46][1590/3239]	Time 0.229 (0.706)	Data Time 0.001 (0.189)	Loss 2.9187 (2.8110)	Entropy 0.63192 (0.63218)	Top-1 acc 58.984 (56.262)	Top-5 acc 75.781 (78.484)	lr 0.01713
Train [46][1600/3239]	Time 0.248 (0.704)	Data Time 0.001 (0.188)	Loss 2.7315 (2.8112)	Entropy 0.63176 (0.63217)	Top-1 acc 59.766 (56.255)	Top-5 acc 78.516 (78.480)	lr 0.01713
Train [46][1610/3239]	Time 0.439 (0.703)	Data Time 0.001 (0.187)	Loss 2.4313 (2.8111)	Entropy 0.63172 (0.63217)	Top-1 acc 62.109 (56.259)	Top-5 acc 87.109 (78.486)	lr 0.01713
Train [46][1620/3239]	Time 0.269 (0.702)	Data Time 0.001 (0.187)	Loss 2.7279 (2.8110)	Entropy 0.63187 (0.63217)	Top-1 acc 59.766 (56.260)	Top-5 acc 82.422 (78.487)	lr 0.01713
Train [46][1630/3239]	Time 0.250 (0.701)	Data Time 0.001 (0.186)	Loss 2.8401 (2.8109)	Entropy 0.63201 (0.63217)	Top-1 acc 54.688 (56.264)	Top-5 acc 80.469 (78.485)	lr 0.01713
Train [46][1640/3239]	Time 1.302 (0.700)	Data Time 1.064 (0.185)	Loss 2.6754 (2.8108)	Entropy 0.63226 (0.63217)	Top-1 acc 57.812 (56.272)	Top-5 acc 78.906 (78.488)	lr 0.01713
Train [46][1650/3239]	Time 0.259 (0.708)	Data Time 0.001 (0.194)	Loss 2.8378 (2.8114)	Entropy 0.63218 (0.63217)	Top-1 acc 55.469 (56.253)	Top-5 acc 76.953 (78.473)	lr 0.01713
Train [46][1660/3239]	Time 0.242 (0.706)	Data Time 0.001 (0.193)	Loss 2.7543 (2.8116)	Entropy 0.63217 (0.63217)	Top-1 acc 58.594 (56.246)	Top-5 acc 78.906 (78.466)	lr 0.01713
Train [46][1670/3239]	Time 0.231 (0.705)	Data Time 0.001 (0.192)	Loss 2.6984 (2.8114)	Entropy 0.63176 (0.63217)	Top-1 acc 58.984 (56.251)	Top-5 acc 82.812 (78.468)	lr 0.01713
Train [46][1680/3239]	Time 0.233 (0.710)	Data Time 0.001 (0.197)	Loss 2.7711 (2.8112)	Entropy 0.63148 (0.63216)	Top-1 acc 59.375 (56.258)	Top-5 acc 79.688 (78.472)	lr 0.01713
Train [46][1690/3239]	Time 0.241 (0.708)	Data Time 0.001 (0.196)	Loss 2.8254 (2.8112)	Entropy 0.63154 (0.63216)	Top-1 acc 54.688 (56.256)	Top-5 acc 78.516 (78.475)	lr 0.01713
Train [46][1700/3239]	Time 0.350 (0.708)	Data Time 0.001 (0.196)	Loss 2.6060 (2.8115)	Entropy 0.63108 (0.63215)	Top-1 acc 59.375 (56.246)	Top-5 acc 82.031 (78.470)	lr 0.01712
Train [46][1710/3239]	Time 0.243 (0.713)	Data Time 0.001 (0.202)	Loss 2.8194 (2.8114)	Entropy 0.63107 (0.63215)	Top-1 acc 53.906 (56.247)	Top-5 acc 78.516 (78.469)	lr 0.01712
Train [46][1720/3239]	Time 0.289 (0.712)	Data Time 0.003 (0.201)	Loss 2.7893 (2.8115)	Entropy 0.63117 (0.63214)	Top-1 acc 62.109 (56.252)	Top-5 acc 78.516 (78.466)	lr 0.01712
Train [46][1730/3239]	Time 0.250 (0.712)	Data Time 0.001 (0.201)	Loss 2.7070 (2.8114)	Entropy 0.63129 (0.63214)	Top-1 acc 57.422 (56.250)	Top-5 acc 79.297 (78.472)	lr 0.01712
Train [46][1740/3239]	Time 2.801 (0.713)	Data Time 2.479 (0.203)	Loss 2.7710 (2.8114)	Entropy 0.63132 (0.63213)	Top-1 acc 56.250 (56.254)	Top-5 acc 78.906 (78.475)	lr 0.01712
Train [46][1750/3239]	Time 0.249 (0.716)	Data Time 0.001 (0.207)	Loss 2.8218 (2.8112)	Entropy 0.63118 (0.63213)	Top-1 acc 58.594 (56.255)	Top-5 acc 81.250 (78.478)	lr 0.01712
Train [46][1760/3239]	Time 0.235 (0.716)	Data Time 0.001 (0.206)	Loss 2.8736 (2.8114)	Entropy 0.63113 (0.63212)	Top-1 acc 54.688 (56.246)	Top-5 acc 76.953 (78.476)	lr 0.01712
Train [46][1770/3239]	Time 1.048 (0.716)	Data Time 0.682 (0.207)	Loss 2.8157 (2.8111)	Entropy 0.63116 (0.63211)	Top-1 acc 56.641 (56.253)	Top-5 acc 80.469 (78.479)	lr 0.01712
Train [46][1780/3239]	Time 0.250 (0.720)	Data Time 0.001 (0.212)	Loss 2.9849 (2.8115)	Entropy 0.63100 (0.63211)	Top-1 acc 48.828 (56.241)	Top-5 acc 76.953 (78.473)	lr 0.01712
Train [46][1790/3239]	Time 0.252 (0.718)	Data Time 0.001 (0.211)	Loss 2.8746 (2.8118)	Entropy 0.63106 (0.63210)	Top-1 acc 54.688 (56.241)	Top-5 acc 74.219 (78.468)	lr 0.01712
Train [46][1800/3239]	Time 0.247 (0.718)	Data Time 0.001 (0.210)	Loss 2.8309 (2.8119)	Entropy 0.63095 (0.63210)	Top-1 acc 55.859 (56.241)	Top-5 acc 76.172 (78.467)	lr 0.01712
Train [46][1810/3239]	Time 0.255 (0.725)	Data Time 0.001 (0.218)	Loss 2.9420 (2.8118)	Entropy 0.63131 (0.63209)	Top-1 acc 52.734 (56.241)	Top-5 acc 76.172 (78.468)	lr 0.01711
Train [46][1820/3239]	Time 0.243 (0.724)	Data Time 0.001 (0.217)	Loss 2.7396 (2.8119)	Entropy 0.63112 (0.63209)	Top-1 acc 55.859 (56.233)	Top-5 acc 79.688 (78.461)	lr 0.01711
Train [46][1830/3239]	Time 0.248 (0.722)	Data Time 0.001 (0.216)	Loss 3.1472 (2.8120)	Entropy 0.63086 (0.63208)	Top-1 acc 49.219 (56.229)	Top-5 acc 71.094 (78.461)	lr 0.01711
Train [46][1840/3239]	Time 0.279 (0.729)	Data Time 0.001 (0.223)	Loss 2.7445 (2.8120)	Entropy 0.63096 (0.63207)	Top-1 acc 56.641 (56.222)	Top-5 acc 81.250 (78.463)	lr 0.01711
Train [46][1850/3239]	Time 0.246 (0.727)	Data Time 0.001 (0.222)	Loss 2.9290 (2.8118)	Entropy 0.63088 (0.63207)	Top-1 acc 50.781 (56.219)	Top-5 acc 76.172 (78.464)	lr 0.01711
Train [46][1860/3239]	Time 0.330 (0.726)	Data Time 0.001 (0.221)	Loss 2.8651 (2.8117)	Entropy 0.63075 (0.63206)	Top-1 acc 57.031 (56.234)	Top-5 acc 77.344 (78.465)	lr 0.01711
Train [46][1870/3239]	Time 0.269 (0.733)	Data Time 0.002 (0.228)	Loss 2.7626 (2.8115)	Entropy 0.63083 (0.63205)	Top-1 acc 55.469 (56.237)	Top-5 acc 81.250 (78.469)	lr 0.01711
Train [46][1880/3239]	Time 0.243 (0.732)	Data Time 0.001 (0.228)	Loss 2.9195 (2.8114)	Entropy 0.63095 (0.63205)	Top-1 acc 53.516 (56.239)	Top-5 acc 77.344 (78.472)	lr 0.01711
Train [46][1890/3239]	Time 0.233 (0.730)	Data Time 0.001 (0.226)	Loss 2.7462 (2.8111)	Entropy 0.63098 (0.63204)	Top-1 acc 55.469 (56.243)	Top-5 acc 78.516 (78.477)	lr 0.01711
Train [46][1900/3239]	Time 3.802 (0.734)	Data Time 3.546 (0.231)	Loss 2.9845 (2.8114)	Entropy 0.63106 (0.63204)	Top-1 acc 51.172 (56.238)	Top-5 acc 76.172 (78.468)	lr 0.01711
Train [46][1910/3239]	Time 0.255 (0.736)	Data Time 0.001 (0.233)	Loss 2.7781 (2.8113)	Entropy 0.63121 (0.63203)	Top-1 acc 54.688 (56.239)	Top-5 acc 77.344 (78.469)	lr 0.01710
Train [46][1920/3239]	Time 0.286 (0.735)	Data Time 0.002 (0.232)	Loss 2.8471 (2.8116)	Entropy 0.63144 (0.63203)	Top-1 acc 59.375 (56.233)	Top-5 acc 77.344 (78.463)	lr 0.01710
Train [46][1930/3239]	Time 4.466 (0.737)	Data Time 4.122 (0.234)	Loss 2.8451 (2.8116)	Entropy 0.63145 (0.63202)	Top-1 acc 58.203 (56.238)	Top-5 acc 76.953 (78.465)	lr 0.01710
Train [46][1940/3239]	Time 0.266 (0.739)	Data Time 0.001 (0.237)	Loss 3.0040 (2.8115)	Entropy 0.63140 (0.63202)	Top-1 acc 50.391 (56.243)	Top-5 acc 75.781 (78.465)	lr 0.01710
Train [46][1950/3239]	Time 0.249 (0.740)	Data Time 0.002 (0.239)	Loss 2.8542 (2.8112)	Entropy 0.63099 (0.63202)	Top-1 acc 54.688 (56.248)	Top-5 acc 77.344 (78.471)	lr 0.01710
Train [46][1960/3239]	Time 0.235 (0.739)	Data Time 0.001 (0.237)	Loss 2.8197 (2.8113)	Entropy 0.63087 (0.63201)	Top-1 acc 54.297 (56.244)	Top-5 acc 80.859 (78.474)	lr 0.01710
Train [46][1970/3239]	Time 0.292 (0.744)	Data Time 0.003 (0.243)	Loss 2.8476 (2.8114)	Entropy 0.63074 (0.63201)	Top-1 acc 55.469 (56.241)	Top-5 acc 77.344 (78.471)	lr 0.01710
Train [46][1980/3239]	Time 0.239 (0.745)	Data Time 0.001 (0.245)	Loss 2.9070 (2.8116)	Entropy 0.63076 (0.63200)	Top-1 acc 55.859 (56.244)	Top-5 acc 77.734 (78.471)	lr 0.01710
Train [46][1990/3239]	Time 0.244 (0.744)	Data Time 0.001 (0.243)	Loss 2.7928 (2.8117)	Entropy 0.63109 (0.63200)	Top-1 acc 54.688 (56.239)	Top-5 acc 78.125 (78.465)	lr 0.01710
Train [46][2000/3239]	Time 0.244 (0.748)	Data Time 0.001 (0.248)	Loss 2.6217 (2.8116)	Entropy 0.63160 (0.63199)	Top-1 acc 64.453 (56.244)	Top-5 acc 81.250 (78.466)	lr 0.01710
Train [46][2010/3239]	Time 0.253 (0.749)	Data Time 0.001 (0.249)	Loss 2.8846 (2.8117)	Entropy 0.63184 (0.63199)	Top-1 acc 53.516 (56.242)	Top-5 acc 75.000 (78.463)	lr 0.01710
Train [46][2020/3239]	Time 0.246 (0.748)	Data Time 0.001 (0.249)	Loss 2.7557 (2.8116)	Entropy 0.63151 (0.63199)	Top-1 acc 59.375 (56.242)	Top-5 acc 80.078 (78.468)	lr 0.01709
Train [46][2030/3239]	Time 0.233 (0.753)	Data Time 0.002 (0.254)	Loss 3.1330 (2.8119)	Entropy 0.63143 (0.63199)	Top-1 acc 50.781 (56.232)	Top-5 acc 71.484 (78.466)	lr 0.01709
Train [46][2040/3239]	Time 0.236 (0.754)	Data Time 0.001 (0.255)	Loss 2.6565 (2.8121)	Entropy 0.63169 (0.63198)	Top-1 acc 62.109 (56.227)	Top-5 acc 82.422 (78.464)	lr 0.01709
Train [46][2050/3239]	Time 0.237 (0.755)	Data Time 0.001 (0.257)	Loss 2.8283 (2.8122)	Entropy 0.63192 (0.63198)	Top-1 acc 58.594 (56.224)	Top-5 acc 76.172 (78.459)	lr 0.01709
Train [46][2060/3239]	Time 5.605 (0.757)	Data Time 5.362 (0.259)	Loss 2.9200 (2.8122)	Entropy 0.63147 (0.63198)	Top-1 acc 52.734 (56.222)	Top-5 acc 77.734 (78.460)	lr 0.01709
Train [46][2070/3239]	Time 0.257 (0.760)	Data Time 0.002 (0.263)	Loss 2.8237 (2.8123)	Entropy 0.63147 (0.63198)	Top-1 acc 53.906 (56.222)	Top-5 acc 79.688 (78.461)	lr 0.01709
Train [46][2080/3239]	Time 0.236 (0.762)	Data Time 0.001 (0.264)	Loss 2.8918 (2.8124)	Entropy 0.63166 (0.63198)	Top-1 acc 55.859 (56.219)	Top-5 acc 75.781 (78.453)	lr 0.01709
Train [46][2090/3239]	Time 0.321 (0.760)	Data Time 0.001 (0.263)	Loss 2.6725 (2.8122)	Entropy 0.63161 (0.63198)	Top-1 acc 57.812 (56.225)	Top-5 acc 81.641 (78.458)	lr 0.01709
Train [46][2100/3239]	Time 0.259 (0.761)	Data Time 0.001 (0.264)	Loss 2.8998 (2.8124)	Entropy 0.63122 (0.63197)	Top-1 acc 54.297 (56.214)	Top-5 acc 78.125 (78.453)	lr 0.01709
Train [46][2110/3239]	Time 0.250 (0.765)	Data Time 0.002 (0.269)	Loss 2.6620 (2.8125)	Entropy 0.63167 (0.63197)	Top-1 acc 58.594 (56.204)	Top-5 acc 83.203 (78.454)	lr 0.01709
Train [46][2120/3239]	Time 0.257 (0.764)	Data Time 0.002 (0.268)	Loss 3.0171 (2.8126)	Entropy 0.63168 (0.63197)	Top-1 acc 51.172 (56.201)	Top-5 acc 75.391 (78.451)	lr 0.01709
Train [46][2130/3239]	Time 0.228 (0.765)	Data Time 0.001 (0.269)	Loss 2.6219 (2.8123)	Entropy 0.63182 (0.63197)	Top-1 acc 61.719 (56.212)	Top-5 acc 83.594 (78.458)	lr 0.01708
Train [46][2140/3239]	Time 0.244 (0.771)	Data Time 0.001 (0.276)	Loss 2.5113 (2.8123)	Entropy 0.63164 (0.63197)	Top-1 acc 63.281 (56.220)	Top-5 acc 82.812 (78.449)	lr 0.01708
Train [46][2150/3239]	Time 0.240 (0.770)	Data Time 0.001 (0.274)	Loss 2.6568 (2.8121)	Entropy 0.63193 (0.63197)	Top-1 acc 60.547 (56.229)	Top-5 acc 80.859 (78.454)	lr 0.01708
Train [46][2160/3239]	Time 1.407 (0.771)	Data Time 1.053 (0.276)	Loss 2.9301 (2.8122)	Entropy 0.63213 (0.63197)	Top-1 acc 52.344 (56.228)	Top-5 acc 76.562 (78.452)	lr 0.01708
Train [46][2170/3239]	Time 0.236 (0.776)	Data Time 0.001 (0.282)	Loss 2.8157 (2.8119)	Entropy 0.63214 (0.63197)	Top-1 acc 54.688 (56.230)	Top-5 acc 77.734 (78.461)	lr 0.01708
Train [46][2180/3239]	Time 0.250 (0.775)	Data Time 0.002 (0.280)	Loss 2.7391 (2.8119)	Entropy 0.63225 (0.63197)	Top-1 acc 58.594 (56.232)	Top-5 acc 76.562 (78.460)	lr 0.01708
Train [46][2190/3239]	Time 0.266 (0.777)	Data Time 0.001 (0.283)	Loss 2.6324 (2.8117)	Entropy 0.63215 (0.63197)	Top-1 acc 59.375 (56.241)	Top-5 acc 80.859 (78.465)	lr 0.01708
Train [46][2200/3239]	Time 0.377 (0.794)	Data Time 0.004 (0.285)	Loss 2.7657 (2.8119)	Entropy 0.63262 (0.63197)	Top-1 acc 57.031 (56.237)	Top-5 acc 79.688 (78.464)	lr 0.01708
Train [46][2210/3239]	Time 0.325 (0.793)	Data Time 0.002 (0.284)	Loss 2.8158 (2.8116)	Entropy 0.63260 (0.63197)	Top-1 acc 57.422 (56.241)	Top-5 acc 82.031 (78.473)	lr 0.01708
Train [46][2220/3239]	Time 0.305 (0.791)	Data Time 0.004 (0.283)	Loss 2.7941 (2.8116)	Entropy 0.63276 (0.63198)	Top-1 acc 57.422 (56.244)	Top-5 acc 80.469 (78.470)	lr 0.01708
Train [46][2230/3239]	Time 0.256 (0.790)	Data Time 0.002 (0.281)	Loss 2.8189 (2.8115)	Entropy 0.63289 (0.63198)	Top-1 acc 58.594 (56.245)	Top-5 acc 77.734 (78.470)	lr 0.01707
Train [46][2240/3239]	Time 0.248 (0.788)	Data Time 0.001 (0.280)	Loss 2.7688 (2.8116)	Entropy 0.63298 (0.63199)	Top-1 acc 57.422 (56.242)	Top-5 acc 78.516 (78.463)	lr 0.01707
Train [46][2250/3239]	Time 0.331 (0.787)	Data Time 0.002 (0.279)	Loss 3.0151 (2.8116)	Entropy 0.63286 (0.63199)	Top-1 acc 49.609 (56.239)	Top-5 acc 76.172 (78.463)	lr 0.01707
Train [46][2260/3239]	Time 0.246 (0.785)	Data Time 0.001 (0.278)	Loss 2.7527 (2.8117)	Entropy 0.63258 (0.63199)	Top-1 acc 55.469 (56.234)	Top-5 acc 80.078 (78.462)	lr 0.01707
Train [46][2270/3239]	Time 0.264 (0.786)	Data Time 0.001 (0.279)	Loss 2.9816 (2.8119)	Entropy 0.63248 (0.63200)	Top-1 acc 53.516 (56.231)	Top-5 acc 76.562 (78.455)	lr 0.01707
Train [46][2280/3239]	Time 0.256 (0.785)	Data Time 0.001 (0.278)	Loss 2.8760 (2.8118)	Entropy 0.63232 (0.63200)	Top-1 acc 55.078 (56.235)	Top-5 acc 74.609 (78.458)	lr 0.01707
Train [46][2290/3239]	Time 0.247 (0.787)	Data Time 0.001 (0.281)	Loss 2.6773 (2.8117)	Entropy 0.63238 (0.63200)	Top-1 acc 58.203 (56.233)	Top-5 acc 82.812 (78.462)	lr 0.01707
Train [46][2300/3239]	Time 4.208 (0.788)	Data Time 3.896 (0.282)	Loss 3.0081 (2.8119)	Entropy 0.63247 (0.63200)	Top-1 acc 50.391 (56.228)	Top-5 acc 75.000 (78.460)	lr 0.01707
Train [46][2310/3239]	Time 0.240 (0.788)	Data Time 0.001 (0.282)	Loss 2.9255 (2.8118)	Entropy 0.63251 (0.63200)	Top-1 acc 53.906 (56.229)	Top-5 acc 78.125 (78.463)	lr 0.01707
Train [46][2320/3239]	Time 0.367 (0.791)	Data Time 0.001 (0.285)	Loss 2.7862 (2.8122)	Entropy 0.63220 (0.63200)	Top-1 acc 56.641 (56.217)	Top-5 acc 78.125 (78.455)	lr 0.01707
Train [46][2330/3239]	Time 0.231 (0.790)	Data Time 0.001 (0.284)	Loss 2.6760 (2.8121)	Entropy 0.63241 (0.63201)	Top-1 acc 59.766 (56.220)	Top-5 acc 82.422 (78.456)	lr 0.01707
Train [46][2340/3239]	Time 0.248 (0.792)	Data Time 0.001 (0.287)	Loss 2.8870 (2.8121)	Entropy 0.63230 (0.63201)	Top-1 acc 53.906 (56.221)	Top-5 acc 76.172 (78.457)	lr 0.01706
Train [46][2350/3239]	Time 0.244 (0.794)	Data Time 0.001 (0.289)	Loss 2.8270 (2.8121)	Entropy 0.63245 (0.63201)	Top-1 acc 55.078 (56.217)	Top-5 acc 76.562 (78.454)	lr 0.01706
Train [46][2360/3239]	Time 0.255 (0.793)	Data Time 0.001 (0.288)	Loss 2.8815 (2.8122)	Entropy 0.63223 (0.63201)	Top-1 acc 51.953 (56.214)	Top-5 acc 77.734 (78.452)	lr 0.01706
Train [46][2370/3239]	Time 0.270 (0.796)	Data Time 0.001 (0.291)	Loss 2.8899 (2.8121)	Entropy 0.63227 (0.63201)	Top-1 acc 52.734 (56.220)	Top-5 acc 79.688 (78.453)	lr 0.01706
Train [46][2380/3239]	Time 0.265 (0.797)	Data Time 0.001 (0.293)	Loss 2.7931 (2.8121)	Entropy 0.63250 (0.63201)	Top-1 acc 55.469 (56.220)	Top-5 acc 79.688 (78.455)	lr 0.01706
Train [46][2390/3239]	Time 0.260 (0.797)	Data Time 0.001 (0.293)	Loss 2.9902 (2.8121)	Entropy 0.63239 (0.63202)	Top-1 acc 48.828 (56.223)	Top-5 acc 74.609 (78.456)	lr 0.01706
Train [46][2400/3239]	Time 0.269 (0.800)	Data Time 0.002 (0.296)	Loss 2.8603 (2.8122)	Entropy 0.63218 (0.63202)	Top-1 acc 55.078 (56.224)	Top-5 acc 79.688 (78.456)	lr 0.01706
Train [46][2410/3239]	Time 3.360 (0.800)	Data Time 2.967 (0.297)	Loss 2.8599 (2.8121)	Entropy 0.63179 (0.63202)	Top-1 acc 50.781 (56.225)	Top-5 acc 78.516 (78.458)	lr 0.01706
Train [46][2420/3239]	Time 2.758 (0.800)	Data Time 2.493 (0.297)	Loss 2.8257 (2.8122)	Entropy 0.63213 (0.63202)	Top-1 acc 55.469 (56.223)	Top-5 acc 76.953 (78.461)	lr 0.01706
Train [46][2430/3239]	Time 4.395 (0.802)	Data Time 4.148 (0.300)	Loss 2.7546 (2.8122)	Entropy 0.63211 (0.63202)	Top-1 acc 52.344 (56.216)	Top-5 acc 80.469 (78.459)	lr 0.01706
Train [46][2440/3239]	Time 3.854 (0.803)	Data Time 3.598 (0.300)	Loss 2.8636 (2.8125)	Entropy 0.63227 (0.63202)	Top-1 acc 53.906 (56.208)	Top-5 acc 75.781 (78.453)	lr 0.01705
Train [46][2450/3239]	Time 0.252 (0.803)	Data Time 0.001 (0.300)	Loss 2.6900 (2.8125)	Entropy 0.63229 (0.63202)	Top-1 acc 57.812 (56.209)	Top-5 acc 79.297 (78.454)	lr 0.01705
Train [46][2460/3239]	Time 0.228 (0.804)	Data Time 0.001 (0.301)	Loss 2.6472 (2.8125)	Entropy 0.63187 (0.63202)	Top-1 acc 62.109 (56.212)	Top-5 acc 81.250 (78.452)	lr 0.01705
Train [46][2470/3239]	Time 0.242 (0.805)	Data Time 0.001 (0.303)	Loss 2.7276 (2.8124)	Entropy 0.63134 (0.63202)	Top-1 acc 58.594 (56.216)	Top-5 acc 78.516 (78.452)	lr 0.01705
Train [46][2480/3239]	Time 3.219 (0.806)	Data Time 2.878 (0.304)	Loss 2.8825 (2.8126)	Entropy 0.63149 (0.63202)	Top-1 acc 54.297 (56.208)	Top-5 acc 75.391 (78.448)	lr 0.01705
Train [46][2490/3239]	Time 0.241 (0.807)	Data Time 0.001 (0.305)	Loss 2.7416 (2.8129)	Entropy 0.63133 (0.63201)	Top-1 acc 58.984 (56.203)	Top-5 acc 82.422 (78.443)	lr 0.01705
Train [46][2500/3239]	Time 0.240 (0.808)	Data Time 0.001 (0.307)	Loss 2.9125 (2.8130)	Entropy 0.63100 (0.63201)	Top-1 acc 54.688 (56.203)	Top-5 acc 74.609 (78.437)	lr 0.01705
Train [46][2510/3239]	Time 0.240 (0.809)	Data Time 0.001 (0.308)	Loss 2.9889 (2.8133)	Entropy 0.63094 (0.63201)	Top-1 acc 48.438 (56.192)	Top-5 acc 77.344 (78.434)	lr 0.01705
Train [46][2520/3239]	Time 0.248 (0.808)	Data Time 0.001 (0.308)	Loss 2.6420 (2.8136)	Entropy 0.63116 (0.63200)	Top-1 acc 60.547 (56.188)	Top-5 acc 83.594 (78.428)	lr 0.01705
Train [46][2530/3239]	Time 0.234 (0.809)	Data Time 0.001 (0.309)	Loss 2.8270 (2.8134)	Entropy 0.63117 (0.63200)	Top-1 acc 53.906 (56.189)	Top-5 acc 76.953 (78.429)	lr 0.01705
Train [46][2540/3239]	Time 0.239 (0.809)	Data Time 0.001 (0.309)	Loss 2.8383 (2.8135)	Entropy 0.63126 (0.63200)	Top-1 acc 55.469 (56.187)	Top-5 acc 78.516 (78.428)	lr 0.01705
Train [46][2550/3239]	Time 0.239 (0.808)	Data Time 0.001 (0.308)	Loss 3.0317 (2.8137)	Entropy 0.63139 (0.63199)	Top-1 acc 51.953 (56.179)	Top-5 acc 75.000 (78.427)	lr 0.01704
Train [46][2560/3239]	Time 0.228 (0.807)	Data Time 0.001 (0.308)	Loss 2.8319 (2.8137)	Entropy 0.63111 (0.63199)	Top-1 acc 55.078 (56.178)	Top-5 acc 76.562 (78.431)	lr 0.01704
Train [46][2570/3239]	Time 8.182 (0.809)	Data Time 7.917 (0.309)	Loss 2.7859 (2.8137)	Entropy 0.63159 (0.63199)	Top-1 acc 58.203 (56.178)	Top-5 acc 77.344 (78.431)	lr 0.01704
Train [46][2580/3239]	Time 1.321 (0.808)	Data Time 1.079 (0.309)	Loss 2.7988 (2.8140)	Entropy 0.63153 (0.63198)	Top-1 acc 56.250 (56.170)	Top-5 acc 79.688 (78.427)	lr 0.01704
Train [46][2590/3239]	Time 4.950 (0.810)	Data Time 4.702 (0.312)	Loss 2.6360 (2.8139)	Entropy 0.63135 (0.63198)	Top-1 acc 60.547 (56.171)	Top-5 acc 81.641 (78.429)	lr 0.01704
Train [46][2600/3239]	Time 0.934 (0.809)	Data Time 0.703 (0.311)	Loss 2.8448 (2.8143)	Entropy 0.63163 (0.63198)	Top-1 acc 58.203 (56.166)	Top-5 acc 77.734 (78.421)	lr 0.01704
Train [46][2610/3239]	Time 0.231 (0.811)	Data Time 0.001 (0.313)	Loss 3.0766 (2.8145)	Entropy 0.63185 (0.63198)	Top-1 acc 51.953 (56.164)	Top-5 acc 75.781 (78.416)	lr 0.01704
Train [46][2620/3239]	Time 0.228 (0.812)	Data Time 0.001 (0.315)	Loss 2.6617 (2.8147)	Entropy 0.63190 (0.63198)	Top-1 acc 60.156 (56.158)	Top-5 acc 83.594 (78.409)	lr 0.01704
Train [46][2630/3239]	Time 0.233 (0.812)	Data Time 0.001 (0.315)	Loss 2.7149 (2.8147)	Entropy 0.63198 (0.63198)	Top-1 acc 57.812 (56.160)	Top-5 acc 78.516 (78.411)	lr 0.01704
Train [46][2640/3239]	Time 1.001 (0.815)	Data Time 0.639 (0.318)	Loss 2.8896 (2.8149)	Entropy 0.63200 (0.63198)	Top-1 acc 54.297 (56.153)	Top-5 acc 76.562 (78.408)	lr 0.01704
Train [46][2650/3239]	Time 0.863 (0.816)	Data Time 0.622 (0.319)	Loss 2.7153 (2.8147)	Entropy 0.63244 (0.63198)	Top-1 acc 59.766 (56.160)	Top-5 acc 80.078 (78.411)	lr 0.01704
Train [46][2660/3239]	Time 0.250 (0.817)	Data Time 0.001 (0.320)	Loss 2.8855 (2.8149)	Entropy 0.63227 (0.63198)	Top-1 acc 52.344 (56.152)	Top-5 acc 77.344 (78.408)	lr 0.01703
Train [46][2670/3239]	Time 0.246 (0.818)	Data Time 0.001 (0.321)	Loss 2.9259 (2.8150)	Entropy 0.63228 (0.63198)	Top-1 acc 53.125 (56.148)	Top-5 acc 75.781 (78.408)	lr 0.01703
Train [46][2680/3239]	Time 0.235 (0.818)	Data Time 0.001 (0.322)	Loss 2.6038 (2.8150)	Entropy 0.63254 (0.63198)	Top-1 acc 65.234 (56.152)	Top-5 acc 82.031 (78.410)	lr 0.01703
Train [46][2690/3239]	Time 0.242 (0.820)	Data Time 0.001 (0.324)	Loss 2.9535 (2.8151)	Entropy 0.63251 (0.63199)	Top-1 acc 50.391 (56.146)	Top-5 acc 75.781 (78.406)	lr 0.01703
Train [46][2700/3239]	Time 0.240 (0.821)	Data Time 0.001 (0.326)	Loss 2.7209 (2.8150)	Entropy 0.63246 (0.63199)	Top-1 acc 58.203 (56.148)	Top-5 acc 79.297 (78.410)	lr 0.01703
Train [46][2710/3239]	Time 0.351 (0.821)	Data Time 0.001 (0.326)	Loss 3.1250 (2.8151)	Entropy 0.63275 (0.63199)	Top-1 acc 51.562 (56.148)	Top-5 acc 72.266 (78.408)	lr 0.01703
Train [46][2720/3239]	Time 0.276 (0.821)	Data Time 0.002 (0.326)	Loss 2.9289 (2.8152)	Entropy 0.63264 (0.63199)	Top-1 acc 52.734 (56.149)	Top-5 acc 76.172 (78.406)	lr 0.01703
Train [46][2730/3239]	Time 3.524 (0.821)	Data Time 3.263 (0.326)	Loss 2.9562 (2.8151)	Entropy 0.63272 (0.63199)	Top-1 acc 54.297 (56.155)	Top-5 acc 76.953 (78.408)	lr 0.01703
Train [46][2740/3239]	Time 0.248 (0.821)	Data Time 0.001 (0.326)	Loss 3.0053 (2.8151)	Entropy 0.63278 (0.63200)	Top-1 acc 55.469 (56.156)	Top-5 acc 72.266 (78.408)	lr 0.01703
Train [46][2750/3239]	Time 0.292 (0.820)	Data Time 0.044 (0.326)	Loss 2.6780 (2.8153)	Entropy 0.63289 (0.63200)	Top-1 acc 57.422 (56.153)	Top-5 acc 79.297 (78.403)	lr 0.01703
Train [46][2760/3239]	Time 0.239 (0.819)	Data Time 0.001 (0.325)	Loss 2.8893 (2.8155)	Entropy 0.63321 (0.63200)	Top-1 acc 55.469 (56.150)	Top-5 acc 76.172 (78.396)	lr 0.01702
Train [46][2770/3239]	Time 0.237 (0.820)	Data Time 0.001 (0.326)	Loss 2.7247 (2.8156)	Entropy 0.63268 (0.63201)	Top-1 acc 54.688 (56.144)	Top-5 acc 79.688 (78.392)	lr 0.01702
Train [46][2780/3239]	Time 0.238 (0.820)	Data Time 0.001 (0.326)	Loss 2.7909 (2.8156)	Entropy 0.63277 (0.63201)	Top-1 acc 55.859 (56.144)	Top-5 acc 79.688 (78.393)	lr 0.01702
Train [46][2790/3239]	Time 0.266 (0.818)	Data Time 0.001 (0.325)	Loss 2.6980 (2.8154)	Entropy 0.63321 (0.63201)	Top-1 acc 54.297 (56.148)	Top-5 acc 82.031 (78.396)	lr 0.01702
Train [46][2800/3239]	Time 7.207 (0.820)	Data Time 6.850 (0.327)	Loss 2.9305 (2.8154)	Entropy 0.63318 (0.63202)	Top-1 acc 52.734 (56.146)	Top-5 acc 75.781 (78.396)	lr 0.01702
Train [46][2810/3239]	Time 4.053 (0.819)	Data Time 3.811 (0.327)	Loss 2.7400 (2.8156)	Entropy 0.63371 (0.63202)	Top-1 acc 58.984 (56.141)	Top-5 acc 78.516 (78.394)	lr 0.01702
Train [46][2820/3239]	Time 0.236 (0.818)	Data Time 0.001 (0.326)	Loss 2.8425 (2.8154)	Entropy 0.63374 (0.63203)	Top-1 acc 54.297 (56.147)	Top-5 acc 77.734 (78.396)	lr 0.01702
Train [46][2830/3239]	Time 0.249 (0.817)	Data Time 0.001 (0.325)	Loss 2.5615 (2.8152)	Entropy 0.63397 (0.63204)	Top-1 acc 59.375 (56.150)	Top-5 acc 82.812 (78.398)	lr 0.01702
Train [46][2840/3239]	Time 0.239 (0.816)	Data Time 0.001 (0.325)	Loss 2.6757 (2.8151)	Entropy 0.63379 (0.63204)	Top-1 acc 58.594 (56.149)	Top-5 acc 80.859 (78.398)	lr 0.01702
Train [46][2850/3239]	Time 0.261 (0.817)	Data Time 0.001 (0.326)	Loss 2.9654 (2.8152)	Entropy 0.63383 (0.63205)	Top-1 acc 53.125 (56.151)	Top-5 acc 75.391 (78.397)	lr 0.01702
Train [46][2860/3239]	Time 0.304 (0.828)	Data Time 0.028 (0.325)	Loss 2.9345 (2.8153)	Entropy 0.63384 (0.63205)	Top-1 acc 53.906 (56.149)	Top-5 acc 75.781 (78.393)	lr 0.01702
Train [46][2870/3239]	Time 0.356 (0.826)	Data Time 0.002 (0.323)	Loss 2.7891 (2.8155)	Entropy 0.63379 (0.63206)	Top-1 acc 58.594 (56.146)	Top-5 acc 79.688 (78.391)	lr 0.01701
Train [46][2880/3239]	Time 0.244 (0.825)	Data Time 0.002 (0.322)	Loss 2.6985 (2.8153)	Entropy 0.63375 (0.63207)	Top-1 acc 57.422 (56.151)	Top-5 acc 83.984 (78.397)	lr 0.01701
Train [46][2890/3239]	Time 0.271 (0.824)	Data Time 0.001 (0.321)	Loss 2.9025 (2.8154)	Entropy 0.63369 (0.63207)	Top-1 acc 53.516 (56.149)	Top-5 acc 75.391 (78.396)	lr 0.01701
Train [46][2900/3239]	Time 0.243 (0.822)	Data Time 0.002 (0.320)	Loss 2.6882 (2.8157)	Entropy 0.63348 (0.63208)	Top-1 acc 60.156 (56.147)	Top-5 acc 81.641 (78.391)	lr 0.01701
Train [46][2910/3239]	Time 0.237 (0.826)	Data Time 0.001 (0.324)	Loss 2.8042 (2.8156)	Entropy 0.63308 (0.63208)	Top-1 acc 53.906 (56.145)	Top-5 acc 75.781 (78.389)	lr 0.01701
Train [46][2920/3239]	Time 0.267 (0.825)	Data Time 0.001 (0.324)	Loss 2.9743 (2.8156)	Entropy 0.63284 (0.63209)	Top-1 acc 50.391 (56.144)	Top-5 acc 75.000 (78.391)	lr 0.01701
Train [46][2930/3239]	Time 0.239 (0.825)	Data Time 0.001 (0.324)	Loss 2.7575 (2.8152)	Entropy 0.63252 (0.63209)	Top-1 acc 59.766 (56.151)	Top-5 acc 80.078 (78.399)	lr 0.01701
Train [46][2940/3239]	Time 0.253 (0.830)	Data Time 0.001 (0.329)	Loss 2.6865 (2.8152)	Entropy 0.63212 (0.63209)	Top-1 acc 59.766 (56.153)	Top-5 acc 79.297 (78.398)	lr 0.01701
Train [46][2950/3239]	Time 4.365 (0.830)	Data Time 4.084 (0.329)	Loss 3.0130 (2.8150)	Entropy 0.63244 (0.63209)	Top-1 acc 49.609 (56.159)	Top-5 acc 74.609 (78.405)	lr 0.01701
Train [46][2960/3239]	Time 1.434 (0.829)	Data Time 1.106 (0.328)	Loss 2.8325 (2.8148)	Entropy 0.63269 (0.63209)	Top-1 acc 57.031 (56.161)	Top-5 acc 79.297 (78.407)	lr 0.01701
Train [46][2970/3239]	Time 3.253 (0.834)	Data Time 3.002 (0.334)	Loss 2.9338 (2.8148)	Entropy 0.63306 (0.63209)	Top-1 acc 55.469 (56.165)	Top-5 acc 77.344 (78.404)	lr 0.01701
Train [46][2980/3239]	Time 0.248 (0.833)	Data Time 0.001 (0.333)	Loss 2.6173 (2.8145)	Entropy 0.63318 (0.63210)	Top-1 acc 61.719 (56.174)	Top-5 acc 82.422 (78.411)	lr 0.01700
Train [46][2990/3239]	Time 0.243 (0.833)	Data Time 0.001 (0.333)	Loss 2.7535 (2.8146)	Entropy 0.63308 (0.63210)	Top-1 acc 60.156 (56.175)	Top-5 acc 77.734 (78.408)	lr 0.01700
Train [46][3000/3239]	Time 0.252 (0.838)	Data Time 0.001 (0.338)	Loss 2.7955 (2.8149)	Entropy 0.63308 (0.63210)	Top-1 acc 60.156 (56.167)	Top-5 acc 79.688 (78.404)	lr 0.01700
Train [46][3010/3239]	Time 0.250 (0.838)	Data Time 0.001 (0.339)	Loss 2.9129 (2.8149)	Entropy 0.63333 (0.63211)	Top-1 acc 55.859 (56.166)	Top-5 acc 76.172 (78.403)	lr 0.01700
Train [46][3020/3239]	Time 0.248 (0.838)	Data Time 0.001 (0.338)	Loss 2.9269 (2.8148)	Entropy 0.63300 (0.63211)	Top-1 acc 50.000 (56.168)	Top-5 acc 76.562 (78.407)	lr 0.01700
Train [46][3030/3239]	Time 0.337 (0.842)	Data Time 0.001 (0.343)	Loss 2.8720 (2.8149)	Entropy 0.63277 (0.63211)	Top-1 acc 56.641 (56.168)	Top-5 acc 78.516 (78.408)	lr 0.01700
Train [46][3040/3239]	Time 0.238 (0.842)	Data Time 0.001 (0.343)	Loss 2.6762 (2.8150)	Entropy 0.63270 (0.63211)	Top-1 acc 58.594 (56.166)	Top-5 acc 82.031 (78.406)	lr 0.01700
Train [46][3050/3239]	Time 3.374 (0.843)	Data Time 3.129 (0.344)	Loss 2.7489 (2.8150)	Entropy 0.63222 (0.63212)	Top-1 acc 61.719 (56.167)	Top-5 acc 77.734 (78.403)	lr 0.01700
Train [46][3060/3239]	Time 2.101 (0.843)	Data Time 1.841 (0.345)	Loss 2.8796 (2.8149)	Entropy 0.63229 (0.63212)	Top-1 acc 57.422 (56.169)	Top-5 acc 76.953 (78.407)	lr 0.01700
Train [46][3070/3239]	Time 0.240 (0.847)	Data Time 0.001 (0.348)	Loss 2.8028 (2.8151)	Entropy 0.63227 (0.63212)	Top-1 acc 56.641 (56.163)	Top-5 acc 81.641 (78.405)	lr 0.01700
Train [46][3080/3239]	Time 3.787 (0.847)	Data Time 3.543 (0.349)	Loss 2.6646 (2.8153)	Entropy 0.63171 (0.63212)	Top-1 acc 63.281 (56.161)	Top-5 acc 82.422 (78.401)	lr 0.01699
Train [46][3090/3239]	Time 0.235 (0.848)	Data Time 0.001 (0.350)	Loss 3.1107 (2.8154)	Entropy 0.63207 (0.63212)	Top-1 acc 47.266 (56.156)	Top-5 acc 71.875 (78.397)	lr 0.01699
Train [46][3100/3239]	Time 0.234 (0.851)	Data Time 0.001 (0.354)	Loss 2.8728 (2.8155)	Entropy 0.63211 (0.63212)	Top-1 acc 50.391 (56.152)	Top-5 acc 80.859 (78.396)	lr 0.01699
Train [46][3110/3239]	Time 6.233 (0.852)	Data Time 5.938 (0.355)	Loss 2.7798 (2.8156)	Entropy 0.63184 (0.63212)	Top-1 acc 58.594 (56.151)	Top-5 acc 78.906 (78.394)	lr 0.01699
Train [46][3120/3239]	Time 0.344 (0.853)	Data Time 0.001 (0.356)	Loss 2.6469 (2.8157)	Entropy 0.63179 (0.63211)	Top-1 acc 58.594 (56.150)	Top-5 acc 80.469 (78.392)	lr 0.01699
Train [46][3130/3239]	Time 7.023 (0.856)	Data Time 6.774 (0.359)	Loss 2.6449 (2.8157)	Entropy 0.63182 (0.63211)	Top-1 acc 60.156 (56.150)	Top-5 acc 80.469 (78.391)	lr 0.01699
Train [46][3140/3239]	Time 0.227 (0.855)	Data Time 0.001 (0.358)	Loss 2.6376 (2.8156)	Entropy 0.63146 (0.63211)	Top-1 acc 57.422 (56.153)	Top-5 acc 82.031 (78.394)	lr 0.01699
Train [46][3150/3239]	Time 0.240 (0.857)	Data Time 0.001 (0.361)	Loss 2.8780 (2.8157)	Entropy 0.63172 (0.63211)	Top-1 acc 57.422 (56.155)	Top-5 acc 75.781 (78.395)	lr 0.01699
Train [46][3160/3239]	Time 0.253 (0.859)	Data Time 0.002 (0.363)	Loss 3.1016 (2.8156)	Entropy 0.63213 (0.63211)	Top-1 acc 49.609 (56.157)	Top-5 acc 73.828 (78.395)	lr 0.01699
Train [46][3170/3239]	Time 0.245 (0.861)	Data Time 0.001 (0.365)	Loss 2.9688 (2.8156)	Entropy 0.63214 (0.63211)	Top-1 acc 50.781 (56.156)	Top-5 acc 73.828 (78.394)	lr 0.01699
Train [46][3180/3239]	Time 0.234 (0.862)	Data Time 0.000 (0.367)	Loss 2.6453 (2.8157)	Entropy 0.63204 (0.63211)	Top-1 acc 58.594 (56.153)	Top-5 acc 82.422 (78.394)	lr 0.01699
Train [46][3190/3239]	Time 0.337 (0.863)	Data Time 0.000 (0.368)	Loss 2.7493 (2.8159)	Entropy 0.63214 (0.63211)	Top-1 acc 58.203 (56.150)	Top-5 acc 80.078 (78.392)	lr 0.01698
Train [46][3200/3239]	Time 0.230 (0.867)	Data Time 0.000 (0.372)	Loss 2.5849 (2.8159)	Entropy 0.63243 (0.63211)	Top-1 acc 63.281 (56.150)	Top-5 acc 82.031 (78.392)	lr 0.01698
Train [46][3210/3239]	Time 5.182 (0.867)	Data Time 4.914 (0.372)	Loss 2.8663 (2.8159)	Entropy 0.63243 (0.63211)	Top-1 acc 55.859 (56.152)	Top-5 acc 76.562 (78.391)	lr 0.01698
Train [46][3220/3239]	Time 0.235 (0.866)	Data Time 0.000 (0.371)	Loss 2.8767 (2.8159)	Entropy 0.63259 (0.63211)	Top-1 acc 55.078 (56.150)	Top-5 acc 76.953 (78.388)	lr 0.01698
Train [46][3230/3239]	Time 0.242 (0.867)	Data Time 0.000 (0.373)	Loss 2.9673 (2.8161)	Entropy 0.63246 (0.63211)	Top-1 acc 49.219 (56.148)	Top-5 acc 76.562 (78.384)	lr 0.01698
Train [46][3239/3239]	Time 0.930 (0.866)	Data Time 0.000 (0.372)	Loss 2.9772 (2.8161)	Entropy 0.63271 (0.63212)	Top-1 acc 48.148 (56.149)	Top-5 acc 74.074 (78.382)	lr 0.01698
==========Valid [46/120]	loss 1.558	top-1 acc 64.335 (64.561)	top-5 acc 85.436	Train top-1 56.149	top-5 78.382	Entropy 0.63271	Latency-None: 0.000ms	Flops: 538.40M
Train [47][0/3239]	Time 46.910 (46.910)	Data Time 44.448 (44.448)	Loss 2.7505 (2.7505)	Entropy 0.63273 (0.63273)	Top-1 acc 56.250 (56.250)	Top-5 acc 78.125 (78.125)	lr 0.01698
Train [47][10/3239]	Time 0.229 (4.657)	Data Time 0.001 (4.043)	Loss 3.1287 (2.8498)	Entropy 0.63241 (0.63266)	Top-1 acc 45.703 (55.788)	Top-5 acc 71.094 (77.060)	lr 0.01698
Train [47][20/3239]	Time 0.388 (2.661)	Data Time 0.002 (2.119)	Loss 2.8723 (2.8158)	Entropy 0.63223 (0.63250)	Top-1 acc 54.688 (56.101)	Top-5 acc 76.953 (77.939)	lr 0.01698
Train [47][30/3239]	Time 0.238 (1.961)	Data Time 0.001 (1.436)	Loss 2.8038 (2.8032)	Entropy 0.63250 (0.63246)	Top-1 acc 56.641 (56.401)	Top-5 acc 79.297 (78.251)	lr 0.01698
Train [47][40/3239]	Time 0.320 (1.596)	Data Time 0.002 (1.086)	Loss 2.7825 (2.7947)	Entropy 0.63252 (0.63249)	Top-1 acc 61.328 (56.679)	Top-5 acc 79.297 (78.620)	lr 0.01698
Train [47][50/3239]	Time 0.254 (1.389)	Data Time 0.002 (0.873)	Loss 2.8161 (2.8004)	Entropy 0.63243 (0.63250)	Top-1 acc 58.203 (56.472)	Top-5 acc 78.516 (78.699)	lr 0.01697
Train [47][60/3239]	Time 0.268 (1.242)	Data Time 0.001 (0.731)	Loss 2.9043 (2.8005)	Entropy 0.63237 (0.63249)	Top-1 acc 53.516 (56.513)	Top-5 acc 78.125 (78.772)	lr 0.01697
Train [47][70/3239]	Time 0.239 (1.131)	Data Time 0.001 (0.628)	Loss 2.7402 (2.7989)	Entropy 0.63234 (0.63246)	Top-1 acc 59.375 (56.531)	Top-5 acc 78.516 (78.686)	lr 0.01697
Train [47][80/3239]	Time 0.266 (1.049)	Data Time 0.001 (0.551)	Loss 2.7022 (2.8005)	Entropy 0.63233 (0.63244)	Top-1 acc 61.328 (56.506)	Top-5 acc 83.203 (78.655)	lr 0.01697
Train [47][90/3239]	Time 0.363 (0.987)	Data Time 0.001 (0.490)	Loss 2.9349 (2.8006)	Entropy 0.63192 (0.63242)	Top-1 acc 53.516 (56.520)	Top-5 acc 76.172 (78.700)	lr 0.01697
Train [47][100/3239]	Time 0.261 (0.931)	Data Time 0.001 (0.442)	Loss 2.6148 (2.8020)	Entropy 0.63172 (0.63236)	Top-1 acc 58.594 (56.416)	Top-5 acc 83.203 (78.697)	lr 0.01697
Train [47][110/3239]	Time 0.275 (0.890)	Data Time 0.002 (0.402)	Loss 2.7904 (2.8043)	Entropy 0.63168 (0.63230)	Top-1 acc 55.078 (56.433)	Top-5 acc 79.688 (78.699)	lr 0.01697
Train [47][120/3239]	Time 0.245 (0.856)	Data Time 0.001 (0.369)	Loss 2.6143 (2.8003)	Entropy 0.63154 (0.63225)	Top-1 acc 59.375 (56.431)	Top-5 acc 83.203 (78.826)	lr 0.01697
Train [47][130/3239]	Time 0.300 (0.826)	Data Time 0.001 (0.341)	Loss 2.8502 (2.7989)	Entropy 0.63172 (0.63220)	Top-1 acc 57.812 (56.447)	Top-5 acc 76.953 (78.829)	lr 0.01697
Train [47][140/3239]	Time 0.282 (0.802)	Data Time 0.003 (0.317)	Loss 2.7173 (2.7932)	Entropy 0.63161 (0.63216)	Top-1 acc 56.250 (56.491)	Top-5 acc 80.078 (78.956)	lr 0.01697
Train [47][150/3239]	Time 0.322 (0.780)	Data Time 0.001 (0.296)	Loss 2.8935 (2.7939)	Entropy 0.63153 (0.63212)	Top-1 acc 53.516 (56.501)	Top-5 acc 76.172 (78.917)	lr 0.01697
Train [47][160/3239]	Time 0.267 (0.762)	Data Time 0.002 (0.278)	Loss 2.4912 (2.7900)	Entropy 0.63162 (0.63209)	Top-1 acc 64.453 (56.614)	Top-5 acc 85.156 (78.960)	lr 0.01696
Train [47][170/3239]	Time 0.243 (0.744)	Data Time 0.001 (0.262)	Loss 2.8336 (2.7883)	Entropy 0.63180 (0.63207)	Top-1 acc 58.594 (56.650)	Top-5 acc 78.125 (78.988)	lr 0.01696
Train [47][180/3239]	Time 0.405 (0.728)	Data Time 0.001 (0.248)	Loss 2.8063 (2.7904)	Entropy 0.63216 (0.63206)	Top-1 acc 54.297 (56.602)	Top-5 acc 78.516 (78.932)	lr 0.01696
Train [47][190/3239]	Time 0.255 (0.713)	Data Time 0.003 (0.235)	Loss 2.6878 (2.7921)	Entropy 0.63239 (0.63207)	Top-1 acc 57.422 (56.559)	Top-5 acc 82.031 (78.906)	lr 0.01696
Train [47][200/3239]	Time 0.295 (0.701)	Data Time 0.001 (0.223)	Loss 2.8000 (2.7917)	Entropy 0.63245 (0.63209)	Top-1 acc 57.031 (56.586)	Top-5 acc 79.297 (78.887)	lr 0.01696
Train [47][210/3239]	Time 0.245 (0.691)	Data Time 0.001 (0.213)	Loss 2.6248 (2.7913)	Entropy 0.63281 (0.63211)	Top-1 acc 62.500 (56.605)	Top-5 acc 81.250 (78.928)	lr 0.01696
Train [47][220/3239]	Time 0.247 (0.679)	Data Time 0.001 (0.203)	Loss 2.8768 (2.7897)	Entropy 0.63263 (0.63214)	Top-1 acc 55.859 (56.680)	Top-5 acc 77.344 (78.894)	lr 0.01696
Train [47][230/3239]	Time 0.248 (0.670)	Data Time 0.001 (0.194)	Loss 2.6581 (2.7881)	Entropy 0.63285 (0.63216)	Top-1 acc 58.203 (56.745)	Top-5 acc 79.688 (78.918)	lr 0.01696
Train [47][240/3239]	Time 0.259 (0.662)	Data Time 0.001 (0.186)	Loss 2.7278 (2.7900)	Entropy 0.63273 (0.63219)	Top-1 acc 63.281 (56.743)	Top-5 acc 80.859 (78.918)	lr 0.01696
Train [47][250/3239]	Time 0.358 (0.654)	Data Time 0.001 (0.179)	Loss 2.7234 (2.7877)	Entropy 0.63271 (0.63221)	Top-1 acc 58.984 (56.793)	Top-5 acc 79.297 (78.986)	lr 0.01696
Train [47][260/3239]	Time 0.254 (0.648)	Data Time 0.001 (0.172)	Loss 2.9551 (2.7878)	Entropy 0.63212 (0.63222)	Top-1 acc 56.641 (56.781)	Top-5 acc 76.562 (78.968)	lr 0.01696
Train [47][270/3239]	Time 0.382 (0.785)	Data Time 0.004 (0.166)	Loss 2.6158 (2.7891)	Entropy 0.63187 (0.63221)	Top-1 acc 59.375 (56.779)	Top-5 acc 82.031 (78.921)	lr 0.01695
Train [47][280/3239]	Time 0.249 (0.776)	Data Time 0.002 (0.160)	Loss 2.9592 (2.7889)	Entropy 0.63171 (0.63220)	Top-1 acc 54.297 (56.814)	Top-5 acc 75.391 (78.894)	lr 0.01695
Train [47][290/3239]	Time 0.262 (0.764)	Data Time 0.002 (0.155)	Loss 2.7492 (2.7895)	Entropy 0.63166 (0.63218)	Top-1 acc 57.422 (56.779)	Top-5 acc 78.516 (78.901)	lr 0.01695
Train [47][300/3239]	Time 0.313 (0.755)	Data Time 0.002 (0.150)	Loss 2.9421 (2.7942)	Entropy 0.63155 (0.63216)	Top-1 acc 57.812 (56.680)	Top-5 acc 75.000 (78.822)	lr 0.01695
Train [47][310/3239]	Time 0.276 (0.746)	Data Time 0.001 (0.145)	Loss 2.9333 (2.7939)	Entropy 0.63153 (0.63214)	Top-1 acc 55.469 (56.693)	Top-5 acc 74.609 (78.808)	lr 0.01695
Train [47][320/3239]	Time 0.257 (0.738)	Data Time 0.001 (0.140)	Loss 2.7881 (2.7944)	Entropy 0.63117 (0.63212)	Top-1 acc 59.375 (56.677)	Top-5 acc 79.297 (78.816)	lr 0.01695
Train [47][330/3239]	Time 0.265 (0.731)	Data Time 0.001 (0.136)	Loss 2.8076 (2.7966)	Entropy 0.63123 (0.63209)	Top-1 acc 57.812 (56.641)	Top-5 acc 78.906 (78.787)	lr 0.01695
Train [47][340/3239]	Time 0.386 (0.725)	Data Time 0.001 (0.132)	Loss 2.8419 (2.7954)	Entropy 0.63099 (0.63207)	Top-1 acc 55.078 (56.712)	Top-5 acc 76.172 (78.812)	lr 0.01695
Train [47][350/3239]	Time 0.257 (0.718)	Data Time 0.001 (0.129)	Loss 2.8902 (2.7958)	Entropy 0.63115 (0.63204)	Top-1 acc 52.344 (56.693)	Top-5 acc 78.516 (78.822)	lr 0.01695
Train [47][360/3239]	Time 0.249 (0.711)	Data Time 0.001 (0.125)	Loss 2.6357 (2.7958)	Entropy 0.63084 (0.63201)	Top-1 acc 62.109 (56.722)	Top-5 acc 82.812 (78.846)	lr 0.01695
Train [47][370/3239]	Time 0.262 (0.706)	Data Time 0.001 (0.122)	Loss 2.8214 (2.7953)	Entropy 0.63085 (0.63198)	Top-1 acc 57.812 (56.739)	Top-5 acc 78.906 (78.838)	lr 0.01694
Train [47][380/3239]	Time 0.246 (0.700)	Data Time 0.001 (0.119)	Loss 2.8299 (2.7955)	Entropy 0.63093 (0.63195)	Top-1 acc 53.125 (56.729)	Top-5 acc 78.906 (78.844)	lr 0.01694
Train [47][390/3239]	Time 0.312 (0.695)	Data Time 0.001 (0.116)	Loss 2.6272 (2.7953)	Entropy 0.63073 (0.63192)	Top-1 acc 60.938 (56.710)	Top-5 acc 80.078 (78.857)	lr 0.01694
Train [47][400/3239]	Time 0.256 (0.689)	Data Time 0.001 (0.113)	Loss 2.5225 (2.7936)	Entropy 0.63051 (0.63189)	Top-1 acc 62.500 (56.767)	Top-5 acc 83.984 (78.886)	lr 0.01694
Train [47][410/3239]	Time 0.373 (0.685)	Data Time 0.001 (0.110)	Loss 2.8292 (2.7936)	Entropy 0.63038 (0.63186)	Top-1 acc 57.812 (56.782)	Top-5 acc 78.516 (78.887)	lr 0.01694
Train [47][420/3239]	Time 0.270 (0.681)	Data Time 0.001 (0.108)	Loss 3.0224 (2.7939)	Entropy 0.63013 (0.63182)	Top-1 acc 53.516 (56.759)	Top-5 acc 71.875 (78.877)	lr 0.01694
Train [47][430/3239]	Time 0.250 (0.677)	Data Time 0.001 (0.105)	Loss 2.6254 (2.7937)	Entropy 0.63037 (0.63178)	Top-1 acc 59.375 (56.743)	Top-5 acc 83.203 (78.875)	lr 0.01694
Train [47][440/3239]	Time 0.255 (0.673)	Data Time 0.001 (0.103)	Loss 2.6654 (2.7921)	Entropy 0.63039 (0.63175)	Top-1 acc 59.375 (56.784)	Top-5 acc 82.422 (78.887)	lr 0.01694
Train [47][450/3239]	Time 0.294 (0.669)	Data Time 0.001 (0.100)	Loss 2.8950 (2.7911)	Entropy 0.63018 (0.63172)	Top-1 acc 54.297 (56.817)	Top-5 acc 77.344 (78.898)	lr 0.01694
Train [47][460/3239]	Time 0.320 (0.665)	Data Time 0.001 (0.098)	Loss 2.8572 (2.7907)	Entropy 0.63033 (0.63169)	Top-1 acc 55.469 (56.819)	Top-5 acc 78.125 (78.895)	lr 0.01694
Train [47][470/3239]	Time 0.254 (0.662)	Data Time 0.002 (0.096)	Loss 2.6476 (2.7904)	Entropy 0.63042 (0.63166)	Top-1 acc 58.984 (56.831)	Top-5 acc 80.859 (78.892)	lr 0.01694
Train [47][480/3239]	Time 0.255 (0.658)	Data Time 0.001 (0.094)	Loss 2.5948 (2.7903)	Entropy 0.63045 (0.63163)	Top-1 acc 62.500 (56.821)	Top-5 acc 80.078 (78.879)	lr 0.01693
Train [47][490/3239]	Time 0.342 (0.655)	Data Time 0.002 (0.092)	Loss 2.8059 (2.7891)	Entropy 0.63088 (0.63161)	Top-1 acc 58.984 (56.849)	Top-5 acc 76.953 (78.906)	lr 0.01693
Train [47][500/3239]	Time 0.447 (0.652)	Data Time 0.002 (0.091)	Loss 2.8357 (2.7898)	Entropy 0.63126 (0.63160)	Top-1 acc 54.688 (56.828)	Top-5 acc 78.125 (78.907)	lr 0.01693
Train [47][510/3239]	Time 0.270 (0.649)	Data Time 0.001 (0.089)	Loss 2.8700 (2.7886)	Entropy 0.63150 (0.63160)	Top-1 acc 58.203 (56.860)	Top-5 acc 76.172 (78.925)	lr 0.01693
Train [47][520/3239]	Time 0.229 (0.645)	Data Time 0.001 (0.087)	Loss 2.7667 (2.7890)	Entropy 0.63141 (0.63159)	Top-1 acc 56.250 (56.849)	Top-5 acc 80.078 (78.906)	lr 0.01693
Train [47][530/3239]	Time 0.229 (0.641)	Data Time 0.001 (0.086)	Loss 2.7732 (2.7880)	Entropy 0.63126 (0.63159)	Top-1 acc 56.250 (56.867)	Top-5 acc 80.078 (78.923)	lr 0.01693
Train [47][540/3239]	Time 0.244 (0.638)	Data Time 0.001 (0.084)	Loss 3.0714 (2.7894)	Entropy 0.63064 (0.63158)	Top-1 acc 51.953 (56.841)	Top-5 acc 76.562 (78.912)	lr 0.01693
Train [47][550/3239]	Time 0.320 (0.635)	Data Time 0.044 (0.083)	Loss 2.7756 (2.7894)	Entropy 0.63079 (0.63156)	Top-1 acc 55.469 (56.843)	Top-5 acc 80.859 (78.913)	lr 0.01693
Train [47][560/3239]	Time 0.256 (0.632)	Data Time 0.002 (0.081)	Loss 2.7894 (2.7900)	Entropy 0.63107 (0.63155)	Top-1 acc 58.594 (56.812)	Top-5 acc 78.906 (78.908)	lr 0.01693
Train [47][570/3239]	Time 0.432 (0.630)	Data Time 0.001 (0.080)	Loss 2.7585 (2.7907)	Entropy 0.63012 (0.63154)	Top-1 acc 58.594 (56.792)	Top-5 acc 80.859 (78.906)	lr 0.01693
Train [47][580/3239]	Time 0.306 (0.627)	Data Time 0.001 (0.078)	Loss 2.8626 (2.7907)	Entropy 0.63029 (0.63152)	Top-1 acc 54.297 (56.783)	Top-5 acc 75.391 (78.909)	lr 0.01692
Train [47][590/3239]	Time 0.250 (0.624)	Data Time 0.001 (0.077)	Loss 2.8184 (2.7905)	Entropy 0.63028 (0.63150)	Top-1 acc 54.297 (56.791)	Top-5 acc 76.953 (78.908)	lr 0.01692
Train [47][600/3239]	Time 0.296 (0.622)	Data Time 0.001 (0.076)	Loss 2.8627 (2.7911)	Entropy 0.63053 (0.63148)	Top-1 acc 54.297 (56.786)	Top-5 acc 79.297 (78.902)	lr 0.01692
Train [47][610/3239]	Time 0.266 (0.619)	Data Time 0.001 (0.075)	Loss 2.8926 (2.7916)	Entropy 0.63071 (0.63146)	Top-1 acc 47.656 (56.761)	Top-5 acc 74.609 (78.894)	lr 0.01692
Train [47][620/3239]	Time 0.283 (0.617)	Data Time 0.002 (0.074)	Loss 2.7797 (2.7918)	Entropy 0.63049 (0.63145)	Top-1 acc 55.859 (56.756)	Top-5 acc 77.734 (78.897)	lr 0.01692
Train [47][630/3239]	Time 0.266 (0.615)	Data Time 0.002 (0.072)	Loss 2.7663 (2.7904)	Entropy 0.63037 (0.63143)	Top-1 acc 55.469 (56.790)	Top-5 acc 81.250 (78.923)	lr 0.01692
Train [47][640/3239]	Time 0.288 (0.613)	Data Time 0.001 (0.071)	Loss 2.6865 (2.7904)	Entropy 0.63023 (0.63141)	Top-1 acc 56.641 (56.781)	Top-5 acc 83.203 (78.926)	lr 0.01692
Train [47][650/3239]	Time 0.264 (0.611)	Data Time 0.001 (0.070)	Loss 3.1323 (2.7909)	Entropy 0.63045 (0.63140)	Top-1 acc 44.922 (56.759)	Top-5 acc 73.047 (78.918)	lr 0.01692
Train [47][660/3239]	Time 0.260 (0.609)	Data Time 0.001 (0.069)	Loss 3.0204 (2.7911)	Entropy 0.63076 (0.63139)	Top-1 acc 50.000 (56.743)	Top-5 acc 73.828 (78.913)	lr 0.01692
Train [47][670/3239]	Time 0.274 (0.607)	Data Time 0.001 (0.068)	Loss 2.8462 (2.7912)	Entropy 0.63071 (0.63138)	Top-1 acc 58.594 (56.744)	Top-5 acc 80.859 (78.912)	lr 0.01692
Train [47][680/3239]	Time 0.263 (0.604)	Data Time 0.001 (0.067)	Loss 2.8629 (2.7918)	Entropy 0.63063 (0.63137)	Top-1 acc 60.156 (56.744)	Top-5 acc 78.516 (78.907)	lr 0.01692
Train [47][690/3239]	Time 0.256 (0.603)	Data Time 0.001 (0.066)	Loss 3.1144 (2.7928)	Entropy 0.63036 (0.63136)	Top-1 acc 47.266 (56.713)	Top-5 acc 75.000 (78.889)	lr 0.01691
Train [47][700/3239]	Time 0.262 (0.601)	Data Time 0.002 (0.065)	Loss 2.9208 (2.7927)	Entropy 0.63053 (0.63134)	Top-1 acc 52.344 (56.740)	Top-5 acc 77.344 (78.886)	lr 0.01691
Train [47][710/3239]	Time 0.297 (0.600)	Data Time 0.002 (0.064)	Loss 2.7510 (2.7926)	Entropy 0.63086 (0.63133)	Top-1 acc 58.984 (56.749)	Top-5 acc 79.688 (78.885)	lr 0.01691
Train [47][720/3239]	Time 0.314 (0.598)	Data Time 0.002 (0.064)	Loss 3.0089 (2.7927)	Entropy 0.63098 (0.63133)	Top-1 acc 51.172 (56.741)	Top-5 acc 75.000 (78.879)	lr 0.01691
Train [47][730/3239]	Time 0.417 (0.597)	Data Time 0.002 (0.063)	Loss 2.7441 (2.7930)	Entropy 0.63083 (0.63132)	Top-1 acc 59.766 (56.732)	Top-5 acc 80.469 (78.878)	lr 0.01691
Train [47][740/3239]	Time 0.234 (0.595)	Data Time 0.001 (0.062)	Loss 2.7720 (2.7928)	Entropy 0.63120 (0.63132)	Top-1 acc 55.469 (56.737)	Top-5 acc 80.859 (78.881)	lr 0.01691
Train [47][750/3239]	Time 0.238 (0.593)	Data Time 0.001 (0.061)	Loss 2.7742 (2.7929)	Entropy 0.63108 (0.63132)	Top-1 acc 58.984 (56.739)	Top-5 acc 77.734 (78.870)	lr 0.01691
Train [47][760/3239]	Time 0.267 (0.591)	Data Time 0.002 (0.060)	Loss 2.8484 (2.7923)	Entropy 0.63111 (0.63131)	Top-1 acc 53.516 (56.748)	Top-5 acc 78.516 (78.876)	lr 0.01691
Train [47][770/3239]	Time 0.304 (0.590)	Data Time 0.003 (0.060)	Loss 2.8512 (2.7918)	Entropy 0.63118 (0.63131)	Top-1 acc 55.469 (56.759)	Top-5 acc 79.297 (78.887)	lr 0.01691
Train [47][780/3239]	Time 0.264 (0.589)	Data Time 0.002 (0.059)	Loss 2.8243 (2.7923)	Entropy 0.63090 (0.63131)	Top-1 acc 53.516 (56.740)	Top-5 acc 76.953 (78.876)	lr 0.01691
Train [47][790/3239]	Time 0.254 (0.587)	Data Time 0.001 (0.058)	Loss 2.8316 (2.7926)	Entropy 0.63101 (0.63130)	Top-1 acc 55.469 (56.732)	Top-5 acc 78.516 (78.865)	lr 0.01691
Train [47][800/3239]	Time 0.439 (0.586)	Data Time 0.001 (0.057)	Loss 2.7466 (2.7916)	Entropy 0.63096 (0.63130)	Top-1 acc 62.109 (56.775)	Top-5 acc 78.125 (78.876)	lr 0.01690
Train [47][810/3239]	Time 0.245 (0.584)	Data Time 0.001 (0.057)	Loss 2.8586 (2.7917)	Entropy 0.63126 (0.63130)	Top-1 acc 51.953 (56.776)	Top-5 acc 78.516 (78.871)	lr 0.01690
Train [47][820/3239]	Time 0.273 (0.583)	Data Time 0.001 (0.056)	Loss 2.7237 (2.7920)	Entropy 0.63075 (0.63129)	Top-1 acc 55.859 (56.767)	Top-5 acc 79.297 (78.862)	lr 0.01690
Train [47][830/3239]	Time 0.230 (0.581)	Data Time 0.001 (0.055)	Loss 2.8323 (2.7927)	Entropy 0.63062 (0.63129)	Top-1 acc 56.641 (56.758)	Top-5 acc 79.297 (78.850)	lr 0.01690
Train [47][840/3239]	Time 0.303 (0.580)	Data Time 0.001 (0.055)	Loss 2.7337 (2.7927)	Entropy 0.63075 (0.63128)	Top-1 acc 61.328 (56.756)	Top-5 acc 79.297 (78.847)	lr 0.01690
Train [47][850/3239]	Time 0.248 (0.578)	Data Time 0.002 (0.054)	Loss 2.8099 (2.7920)	Entropy 0.63077 (0.63127)	Top-1 acc 55.469 (56.759)	Top-5 acc 78.906 (78.870)	lr 0.01690
Train [47][860/3239]	Time 0.261 (0.577)	Data Time 0.002 (0.054)	Loss 3.0303 (2.7924)	Entropy 0.63061 (0.63127)	Top-1 acc 49.219 (56.752)	Top-5 acc 75.781 (78.868)	lr 0.01690
Train [47][870/3239]	Time 0.336 (0.576)	Data Time 0.002 (0.053)	Loss 2.7448 (2.7923)	Entropy 0.63063 (0.63126)	Top-1 acc 56.641 (56.751)	Top-5 acc 81.250 (78.872)	lr 0.01690
Train [47][880/3239]	Time 0.299 (0.575)	Data Time 0.001 (0.052)	Loss 2.6852 (2.7920)	Entropy 0.63050 (0.63125)	Top-1 acc 60.938 (56.762)	Top-5 acc 80.469 (78.880)	lr 0.01690
Train [47][890/3239]	Time 0.365 (0.574)	Data Time 0.001 (0.052)	Loss 2.9551 (2.7921)	Entropy 0.63049 (0.63124)	Top-1 acc 56.641 (56.754)	Top-5 acc 76.562 (78.881)	lr 0.01690
Train [47][900/3239]	Time 0.269 (0.573)	Data Time 0.001 (0.051)	Loss 2.8645 (2.7917)	Entropy 0.63048 (0.63124)	Top-1 acc 56.250 (56.757)	Top-5 acc 78.125 (78.886)	lr 0.01689
Train [47][910/3239]	Time 0.303 (0.572)	Data Time 0.001 (0.051)	Loss 2.6687 (2.7917)	Entropy 0.63035 (0.63123)	Top-1 acc 59.375 (56.762)	Top-5 acc 83.203 (78.884)	lr 0.01689
Train [47][920/3239]	Time 0.254 (0.571)	Data Time 0.002 (0.050)	Loss 2.9680 (2.7924)	Entropy 0.63014 (0.63122)	Top-1 acc 54.688 (56.734)	Top-5 acc 76.172 (78.872)	lr 0.01689
Train [47][930/3239]	Time 0.349 (0.611)	Data Time 0.003 (0.050)	Loss 2.7429 (2.7926)	Entropy 0.63047 (0.63121)	Top-1 acc 55.469 (56.728)	Top-5 acc 77.734 (78.863)	lr 0.01689
Train [47][940/3239]	Time 0.249 (0.609)	Data Time 0.002 (0.049)	Loss 2.6400 (2.7923)	Entropy 0.63013 (0.63120)	Top-1 acc 60.156 (56.721)	Top-5 acc 81.641 (78.864)	lr 0.01689
Train [47][950/3239]	Time 0.246 (0.608)	Data Time 0.001 (0.049)	Loss 2.8363 (2.7923)	Entropy 0.62993 (0.63119)	Top-1 acc 54.297 (56.712)	Top-5 acc 77.734 (78.870)	lr 0.01689
Train [47][960/3239]	Time 0.349 (0.606)	Data Time 0.001 (0.048)	Loss 2.8442 (2.7916)	Entropy 0.62933 (0.63117)	Top-1 acc 54.688 (56.723)	Top-5 acc 77.344 (78.884)	lr 0.01689
Train [47][970/3239]	Time 0.235 (0.604)	Data Time 0.001 (0.048)	Loss 2.7642 (2.7908)	Entropy 0.62956 (0.63115)	Top-1 acc 56.641 (56.738)	Top-5 acc 79.688 (78.886)	lr 0.01689
Train [47][980/3239]	Time 0.306 (0.603)	Data Time 0.001 (0.047)	Loss 2.8750 (2.7900)	Entropy 0.62980 (0.63114)	Top-1 acc 55.078 (56.776)	Top-5 acc 79.297 (78.906)	lr 0.01689
Train [47][990/3239]	Time 0.294 (0.602)	Data Time 0.003 (0.047)	Loss 2.8244 (2.7900)	Entropy 0.62971 (0.63112)	Top-1 acc 55.469 (56.788)	Top-5 acc 76.953 (78.905)	lr 0.01689
Train [47][1000/3239]	Time 0.252 (0.601)	Data Time 0.001 (0.046)	Loss 2.5335 (2.7903)	Entropy 0.62946 (0.63111)	Top-1 acc 62.500 (56.781)	Top-5 acc 85.156 (78.905)	lr 0.01689
Train [47][1010/3239]	Time 0.254 (0.599)	Data Time 0.001 (0.046)	Loss 2.7466 (2.7905)	Entropy 0.62971 (0.63109)	Top-1 acc 58.594 (56.784)	Top-5 acc 80.859 (78.898)	lr 0.01688
Train [47][1020/3239]	Time 0.275 (0.598)	Data Time 0.002 (0.045)	Loss 2.7897 (2.7914)	Entropy 0.62955 (0.63108)	Top-1 acc 56.250 (56.755)	Top-5 acc 79.297 (78.884)	lr 0.01688
Train [47][1030/3239]	Time 0.251 (0.597)	Data Time 0.001 (0.045)	Loss 2.8010 (2.7917)	Entropy 0.62943 (0.63107)	Top-1 acc 53.516 (56.738)	Top-5 acc 81.250 (78.881)	lr 0.01688
Train [47][1040/3239]	Time 0.284 (0.596)	Data Time 0.001 (0.045)	Loss 2.6951 (2.7919)	Entropy 0.62940 (0.63105)	Top-1 acc 60.547 (56.736)	Top-5 acc 80.859 (78.874)	lr 0.01688
Train [47][1050/3239]	Time 0.398 (0.595)	Data Time 0.002 (0.044)	Loss 2.9453 (2.7924)	Entropy 0.62956 (0.63103)	Top-1 acc 53.906 (56.715)	Top-5 acc 75.781 (78.864)	lr 0.01688
Train [47][1060/3239]	Time 0.252 (0.593)	Data Time 0.001 (0.044)	Loss 2.7631 (2.7925)	Entropy 0.62967 (0.63102)	Top-1 acc 57.031 (56.718)	Top-5 acc 78.125 (78.862)	lr 0.01688
Train [47][1070/3239]	Time 0.255 (0.592)	Data Time 0.002 (0.043)	Loss 2.8385 (2.7923)	Entropy 0.62967 (0.63101)	Top-1 acc 54.297 (56.727)	Top-5 acc 76.953 (78.858)	lr 0.01688
Train [47][1080/3239]	Time 0.249 (0.591)	Data Time 0.001 (0.043)	Loss 2.6158 (2.7927)	Entropy 0.62965 (0.63100)	Top-1 acc 60.156 (56.724)	Top-5 acc 80.469 (78.848)	lr 0.01688
Train [47][1090/3239]	Time 0.251 (0.590)	Data Time 0.001 (0.043)	Loss 2.5124 (2.7922)	Entropy 0.62928 (0.63098)	Top-1 acc 64.453 (56.741)	Top-5 acc 81.641 (78.847)	lr 0.01688
Train [47][1100/3239]	Time 0.248 (0.588)	Data Time 0.001 (0.042)	Loss 2.7692 (2.7922)	Entropy 0.62902 (0.63096)	Top-1 acc 60.156 (56.744)	Top-5 acc 80.859 (78.850)	lr 0.01688
Train [47][1110/3239]	Time 0.233 (0.587)	Data Time 0.001 (0.042)	Loss 2.8141 (2.7924)	Entropy 0.62862 (0.63095)	Top-1 acc 55.469 (56.746)	Top-5 acc 73.438 (78.840)	lr 0.01687
Train [47][1120/3239]	Time 0.372 (0.586)	Data Time 0.001 (0.042)	Loss 2.9674 (2.7920)	Entropy 0.62831 (0.63092)	Top-1 acc 55.078 (56.758)	Top-5 acc 76.562 (78.837)	lr 0.01687
Train [47][1130/3239]	Time 0.223 (0.584)	Data Time 0.001 (0.041)	Loss 2.8527 (2.7921)	Entropy 0.62843 (0.63090)	Top-1 acc 54.297 (56.757)	Top-5 acc 75.000 (78.834)	lr 0.01687
Train [47][1140/3239]	Time 0.266 (0.583)	Data Time 0.001 (0.041)	Loss 2.8646 (2.7915)	Entropy 0.62855 (0.63088)	Top-1 acc 53.516 (56.771)	Top-5 acc 74.219 (78.841)	lr 0.01687
Train [47][1150/3239]	Time 0.230 (0.582)	Data Time 0.001 (0.041)	Loss 2.7670 (2.7921)	Entropy 0.62829 (0.63086)	Top-1 acc 55.469 (56.758)	Top-5 acc 80.078 (78.824)	lr 0.01687
Train [47][1160/3239]	Time 0.279 (0.581)	Data Time 0.001 (0.040)	Loss 2.8336 (2.7922)	Entropy 0.62819 (0.63083)	Top-1 acc 55.078 (56.744)	Top-5 acc 79.688 (78.826)	lr 0.01687
Train [47][1170/3239]	Time 0.234 (0.579)	Data Time 0.001 (0.040)	Loss 2.6943 (2.7926)	Entropy 0.62827 (0.63081)	Top-1 acc 56.641 (56.739)	Top-5 acc 81.250 (78.817)	lr 0.01687
Train [47][1180/3239]	Time 0.241 (0.578)	Data Time 0.001 (0.040)	Loss 3.1245 (2.7928)	Entropy 0.62834 (0.63079)	Top-1 acc 46.875 (56.725)	Top-5 acc 73.047 (78.816)	lr 0.01687
Train [47][1190/3239]	Time 0.252 (0.577)	Data Time 0.002 (0.039)	Loss 2.7510 (2.7930)	Entropy 0.62848 (0.63077)	Top-1 acc 61.328 (56.715)	Top-5 acc 79.297 (78.811)	lr 0.01687
Train [47][1200/3239]	Time 0.233 (0.576)	Data Time 0.001 (0.039)	Loss 3.1220 (2.7932)	Entropy 0.62866 (0.63075)	Top-1 acc 47.656 (56.716)	Top-5 acc 73.047 (78.808)	lr 0.01687
Train [47][1210/3239]	Time 0.289 (0.575)	Data Time 0.002 (0.039)	Loss 2.8529 (2.7932)	Entropy 0.62848 (0.63073)	Top-1 acc 57.422 (56.720)	Top-5 acc 78.125 (78.807)	lr 0.01687
Train [47][1220/3239]	Time 0.236 (0.574)	Data Time 0.001 (0.038)	Loss 2.9295 (2.7931)	Entropy 0.62886 (0.63072)	Top-1 acc 53.516 (56.727)	Top-5 acc 75.391 (78.811)	lr 0.01686
Train [47][1230/3239]	Time 0.277 (0.573)	Data Time 0.001 (0.038)	Loss 2.6131 (2.7927)	Entropy 0.62881 (0.63070)	Top-1 acc 62.500 (56.732)	Top-5 acc 80.859 (78.816)	lr 0.01686
Train [47][1240/3239]	Time 0.360 (0.573)	Data Time 0.001 (0.038)	Loss 2.8620 (2.7930)	Entropy 0.62873 (0.63069)	Top-1 acc 53.125 (56.726)	Top-5 acc 78.516 (78.815)	lr 0.01686
Train [47][1250/3239]	Time 0.242 (0.571)	Data Time 0.001 (0.037)	Loss 2.8603 (2.7927)	Entropy 0.62906 (0.63067)	Top-1 acc 55.469 (56.739)	Top-5 acc 77.734 (78.826)	lr 0.01686
Train [47][1260/3239]	Time 0.230 (0.570)	Data Time 0.001 (0.037)	Loss 3.0627 (2.7930)	Entropy 0.62885 (0.63066)	Top-1 acc 50.781 (56.737)	Top-5 acc 74.219 (78.825)	lr 0.01686
Train [47][1270/3239]	Time 0.228 (0.569)	Data Time 0.001 (0.037)	Loss 2.9035 (2.7931)	Entropy 0.62872 (0.63064)	Top-1 acc 53.516 (56.738)	Top-5 acc 74.609 (78.819)	lr 0.01686
Train [47][1280/3239]	Time 0.402 (0.569)	Data Time 0.001 (0.037)	Loss 2.7063 (2.7930)	Entropy 0.62842 (0.63063)	Top-1 acc 59.766 (56.739)	Top-5 acc 82.422 (78.815)	lr 0.01686
Train [47][1290/3239]	Time 0.244 (0.568)	Data Time 0.001 (0.036)	Loss 2.7424 (2.7931)	Entropy 0.62839 (0.63061)	Top-1 acc 59.375 (56.743)	Top-5 acc 80.469 (78.818)	lr 0.01686
Train [47][1300/3239]	Time 0.231 (0.567)	Data Time 0.002 (0.036)	Loss 2.9108 (2.7930)	Entropy 0.62806 (0.63059)	Top-1 acc 59.375 (56.750)	Top-5 acc 75.781 (78.821)	lr 0.01686
Train [47][1310/3239]	Time 0.269 (0.566)	Data Time 0.001 (0.036)	Loss 2.8552 (2.7928)	Entropy 0.62807 (0.63058)	Top-1 acc 52.344 (56.757)	Top-5 acc 80.469 (78.829)	lr 0.01686
Train [47][1320/3239]	Time 0.240 (0.564)	Data Time 0.001 (0.036)	Loss 2.7563 (2.7932)	Entropy 0.62804 (0.63056)	Top-1 acc 62.109 (56.743)	Top-5 acc 79.297 (78.817)	lr 0.01685
Train [47][1330/3239]	Time 0.271 (0.564)	Data Time 0.001 (0.035)	Loss 2.8496 (2.7936)	Entropy 0.62808 (0.63054)	Top-1 acc 51.172 (56.728)	Top-5 acc 78.516 (78.809)	lr 0.01685
Train [47][1340/3239]	Time 0.245 (0.563)	Data Time 0.001 (0.035)	Loss 2.5698 (2.7929)	Entropy 0.62788 (0.63052)	Top-1 acc 62.109 (56.748)	Top-5 acc 80.859 (78.820)	lr 0.01685
Train [47][1350/3239]	Time 0.405 (0.562)	Data Time 0.001 (0.035)	Loss 2.9022 (2.7928)	Entropy 0.62829 (0.63050)	Top-1 acc 55.078 (56.750)	Top-5 acc 75.391 (78.820)	lr 0.01685
Train [47][1360/3239]	Time 0.263 (0.561)	Data Time 0.001 (0.035)	Loss 2.7138 (2.7925)	Entropy 0.62803 (0.63048)	Top-1 acc 53.906 (56.756)	Top-5 acc 82.812 (78.832)	lr 0.01685
Train [47][1370/3239]	Time 0.226 (0.560)	Data Time 0.001 (0.034)	Loss 2.7990 (2.7924)	Entropy 0.62805 (0.63047)	Top-1 acc 53.516 (56.757)	Top-5 acc 77.734 (78.836)	lr 0.01685
Train [47][1380/3239]	Time 0.240 (0.562)	Data Time 0.001 (0.037)	Loss 3.0960 (2.7924)	Entropy 0.62808 (0.63045)	Top-1 acc 51.172 (56.751)	Top-5 acc 72.266 (78.839)	lr 0.01685
Train [47][1390/3239]	Time 0.263 (0.561)	Data Time 0.001 (0.036)	Loss 2.8695 (2.7924)	Entropy 0.62821 (0.63043)	Top-1 acc 55.078 (56.756)	Top-5 acc 80.859 (78.839)	lr 0.01685
Train [47][1400/3239]	Time 0.232 (0.560)	Data Time 0.001 (0.036)	Loss 2.5860 (2.7921)	Entropy 0.62822 (0.63042)	Top-1 acc 60.547 (56.757)	Top-5 acc 83.203 (78.852)	lr 0.01685
Train [47][1410/3239]	Time 0.268 (0.559)	Data Time 0.001 (0.036)	Loss 2.7997 (2.7922)	Entropy 0.62789 (0.63040)	Top-1 acc 57.031 (56.750)	Top-5 acc 77.734 (78.849)	lr 0.01685
Train [47][1420/3239]	Time 0.261 (0.558)	Data Time 0.001 (0.036)	Loss 2.7013 (2.7919)	Entropy 0.62730 (0.63038)	Top-1 acc 56.641 (56.762)	Top-5 acc 80.859 (78.858)	lr 0.01685
Train [47][1430/3239]	Time 0.238 (0.557)	Data Time 0.001 (0.035)	Loss 3.0205 (2.7922)	Entropy 0.62690 (0.63036)	Top-1 acc 52.344 (56.757)	Top-5 acc 72.656 (78.857)	lr 0.01684
Train [47][1440/3239]	Time 0.396 (0.557)	Data Time 0.001 (0.036)	Loss 2.7673 (2.7923)	Entropy 0.62722 (0.63033)	Top-1 acc 57.812 (56.759)	Top-5 acc 81.641 (78.852)	lr 0.01684
Train [47][1450/3239]	Time 0.238 (0.556)	Data Time 0.001 (0.036)	Loss 2.5949 (2.7920)	Entropy 0.62692 (0.63031)	Top-1 acc 58.594 (56.759)	Top-5 acc 84.375 (78.852)	lr 0.01684
Train [47][1460/3239]	Time 0.239 (0.556)	Data Time 0.001 (0.036)	Loss 2.7553 (2.7916)	Entropy 0.62709 (0.63029)	Top-1 acc 60.547 (56.766)	Top-5 acc 80.078 (78.868)	lr 0.01684
Train [47][1470/3239]	Time 1.276 (0.556)	Data Time 1.012 (0.036)	Loss 2.9256 (2.7915)	Entropy 0.62709 (0.63027)	Top-1 acc 55.469 (56.770)	Top-5 acc 76.953 (78.867)	lr 0.01684
Train [47][1480/3239]	Time 0.222 (0.554)	Data Time 0.001 (0.036)	Loss 2.9743 (2.7922)	Entropy 0.62707 (0.63025)	Top-1 acc 52.344 (56.757)	Top-5 acc 75.391 (78.859)	lr 0.01684
Train [47][1490/3239]	Time 0.257 (0.554)	Data Time 0.001 (0.036)	Loss 2.8025 (2.7919)	Entropy 0.62679 (0.63022)	Top-1 acc 55.078 (56.765)	Top-5 acc 78.516 (78.862)	lr 0.01684
Train [47][1500/3239]	Time 0.261 (0.553)	Data Time 0.001 (0.036)	Loss 2.7000 (2.7918)	Entropy 0.62707 (0.63020)	Top-1 acc 61.328 (56.776)	Top-5 acc 78.906 (78.858)	lr 0.01684
Train [47][1510/3239]	Time 0.365 (0.554)	Data Time 0.001 (0.037)	Loss 3.1012 (2.7915)	Entropy 0.62704 (0.63018)	Top-1 acc 50.781 (56.788)	Top-5 acc 72.656 (78.861)	lr 0.01684
Train [47][1520/3239]	Time 0.261 (0.553)	Data Time 0.001 (0.037)	Loss 2.7536 (2.7916)	Entropy 0.62647 (0.63016)	Top-1 acc 58.203 (56.780)	Top-5 acc 80.859 (78.857)	lr 0.01684
Train [47][1530/3239]	Time 0.236 (0.552)	Data Time 0.001 (0.037)	Loss 2.7287 (2.7918)	Entropy 0.62628 (0.63014)	Top-1 acc 59.375 (56.777)	Top-5 acc 79.688 (78.850)	lr 0.01683
Train [47][1540/3239]	Time 0.275 (0.552)	Data Time 0.001 (0.038)	Loss 3.0174 (2.7920)	Entropy 0.62596 (0.63011)	Top-1 acc 53.125 (56.770)	Top-5 acc 75.391 (78.851)	lr 0.01683
Train [47][1550/3239]	Time 0.236 (0.552)	Data Time 0.002 (0.037)	Loss 3.0028 (2.7923)	Entropy 0.62626 (0.63008)	Top-1 acc 51.562 (56.768)	Top-5 acc 74.609 (78.844)	lr 0.01683
Train [47][1560/3239]	Time 0.238 (0.552)	Data Time 0.001 (0.039)	Loss 2.8976 (2.7919)	Entropy 0.62582 (0.63006)	Top-1 acc 54.297 (56.772)	Top-5 acc 75.391 (78.848)	lr 0.01683
Train [47][1570/3239]	Time 0.234 (0.552)	Data Time 0.001 (0.038)	Loss 2.9250 (2.7925)	Entropy 0.62570 (0.63003)	Top-1 acc 57.031 (56.766)	Top-5 acc 76.562 (78.837)	lr 0.01683
Train [47][1580/3239]	Time 0.320 (0.575)	Data Time 0.005 (0.038)	Loss 2.8763 (2.7924)	Entropy 0.62593 (0.63001)	Top-1 acc 55.859 (56.770)	Top-5 acc 73.047 (78.832)	lr 0.01683
Train [47][1590/3239]	Time 0.288 (0.575)	Data Time 0.003 (0.038)	Loss 2.7026 (2.7920)	Entropy 0.62573 (0.62998)	Top-1 acc 62.891 (56.783)	Top-5 acc 78.125 (78.840)	lr 0.01683
Train [47][1600/3239]	Time 0.422 (0.574)	Data Time 0.002 (0.038)	Loss 2.8875 (2.7920)	Entropy 0.62570 (0.62995)	Top-1 acc 53.125 (56.782)	Top-5 acc 78.906 (78.840)	lr 0.01683
Train [47][1610/3239]	Time 0.284 (0.574)	Data Time 0.003 (0.037)	Loss 2.9953 (2.7921)	Entropy 0.62586 (0.62993)	Top-1 acc 51.172 (56.774)	Top-5 acc 74.219 (78.837)	lr 0.01683
Train [47][1620/3239]	Time 0.266 (0.573)	Data Time 0.001 (0.037)	Loss 2.6762 (2.7923)	Entropy 0.62571 (0.62990)	Top-1 acc 64.062 (56.768)	Top-5 acc 80.859 (78.833)	lr 0.01683
Train [47][1630/3239]	Time 0.249 (0.572)	Data Time 0.001 (0.037)	Loss 2.7364 (2.7921)	Entropy 0.62564 (0.62988)	Top-1 acc 56.250 (56.768)	Top-5 acc 82.031 (78.841)	lr 0.01683
Train [47][1640/3239]	Time 0.274 (0.571)	Data Time 0.001 (0.037)	Loss 2.9669 (2.7923)	Entropy 0.62581 (0.62985)	Top-1 acc 50.391 (56.765)	Top-5 acc 75.000 (78.833)	lr 0.01682
Train [47][1650/3239]	Time 0.239 (0.571)	Data Time 0.001 (0.037)	Loss 2.7995 (2.7926)	Entropy 0.62594 (0.62983)	Top-1 acc 57.812 (56.760)	Top-5 acc 78.906 (78.827)	lr 0.01682
Train [47][1660/3239]	Time 0.242 (0.570)	Data Time 0.001 (0.036)	Loss 2.7477 (2.7923)	Entropy 0.62621 (0.62980)	Top-1 acc 56.250 (56.763)	Top-5 acc 79.297 (78.832)	lr 0.01682
Train [47][1670/3239]	Time 0.339 (0.569)	Data Time 0.001 (0.036)	Loss 2.8740 (2.7922)	Entropy 0.62609 (0.62978)	Top-1 acc 50.781 (56.763)	Top-5 acc 77.344 (78.828)	lr 0.01682
Train [47][1680/3239]	Time 0.245 (0.568)	Data Time 0.001 (0.036)	Loss 3.0065 (2.7924)	Entropy 0.62595 (0.62976)	Top-1 acc 48.828 (56.759)	Top-5 acc 76.562 (78.824)	lr 0.01682
Train [47][1690/3239]	Time 0.248 (0.568)	Data Time 0.001 (0.036)	Loss 2.8633 (2.7927)	Entropy 0.62549 (0.62974)	Top-1 acc 55.859 (56.757)	Top-5 acc 76.953 (78.817)	lr 0.01682
Train [47][1700/3239]	Time 0.267 (0.567)	Data Time 0.001 (0.036)	Loss 2.7675 (2.7926)	Entropy 0.62555 (0.62971)	Top-1 acc 61.328 (56.759)	Top-5 acc 78.906 (78.820)	lr 0.01682
Train [47][1710/3239]	Time 0.295 (0.567)	Data Time 0.003 (0.036)	Loss 2.8900 (2.7927)	Entropy 0.62599 (0.62969)	Top-1 acc 52.344 (56.755)	Top-5 acc 78.125 (78.813)	lr 0.01682
Train [47][1720/3239]	Time 0.259 (0.567)	Data Time 0.002 (0.036)	Loss 2.7557 (2.7931)	Entropy 0.62628 (0.62967)	Top-1 acc 56.250 (56.744)	Top-5 acc 77.734 (78.802)	lr 0.01682
Train [47][1730/3239]	Time 0.275 (0.568)	Data Time 0.001 (0.038)	Loss 2.8263 (2.7935)	Entropy 0.62607 (0.62965)	Top-1 acc 58.203 (56.731)	Top-5 acc 77.734 (78.800)	lr 0.01682
Train [47][1740/3239]	Time 1.140 (0.567)	Data Time 0.867 (0.038)	Loss 2.9795 (2.7936)	Entropy 0.62590 (0.62963)	Top-1 acc 51.953 (56.730)	Top-5 acc 75.391 (78.800)	lr 0.01682
Train [47][1750/3239]	Time 0.233 (0.567)	Data Time 0.001 (0.038)	Loss 2.7611 (2.7939)	Entropy 0.62539 (0.62960)	Top-1 acc 58.984 (56.725)	Top-5 acc 78.125 (78.796)	lr 0.01681
Train [47][1760/3239]	Time 0.354 (0.568)	Data Time 0.001 (0.040)	Loss 3.0059 (2.7942)	Entropy 0.62528 (0.62958)	Top-1 acc 49.609 (56.722)	Top-5 acc 74.219 (78.792)	lr 0.01681
Train [47][1770/3239]	Time 0.244 (0.568)	Data Time 0.001 (0.040)	Loss 2.8085 (2.7941)	Entropy 0.62551 (0.62956)	Top-1 acc 58.203 (56.726)	Top-5 acc 78.125 (78.793)	lr 0.01681
Train [47][1780/3239]	Time 0.244 (0.570)	Data Time 0.001 (0.042)	Loss 2.8666 (2.7943)	Entropy 0.62560 (0.62953)	Top-1 acc 54.688 (56.724)	Top-5 acc 78.516 (78.790)	lr 0.01681
Train [47][1790/3239]	Time 0.297 (0.569)	Data Time 0.001 (0.042)	Loss 2.9001 (2.7945)	Entropy 0.62563 (0.62951)	Top-1 acc 55.078 (56.724)	Top-5 acc 75.391 (78.787)	lr 0.01681
Train [47][1800/3239]	Time 0.241 (0.570)	Data Time 0.001 (0.044)	Loss 3.0760 (2.7946)	Entropy 0.62552 (0.62949)	Top-1 acc 51.172 (56.722)	Top-5 acc 72.656 (78.785)	lr 0.01681
Train [47][1810/3239]	Time 0.234 (0.570)	Data Time 0.001 (0.044)	Loss 2.8468 (2.7947)	Entropy 0.62572 (0.62947)	Top-1 acc 58.984 (56.722)	Top-5 acc 76.562 (78.783)	lr 0.01681
Train [47][1820/3239]	Time 0.239 (0.569)	Data Time 0.001 (0.044)	Loss 2.7809 (2.7946)	Entropy 0.62565 (0.62945)	Top-1 acc 56.641 (56.721)	Top-5 acc 81.250 (78.784)	lr 0.01681
Train [47][1830/3239]	Time 0.396 (0.572)	Data Time 0.001 (0.047)	Loss 2.8787 (2.7945)	Entropy 0.62575 (0.62943)	Top-1 acc 57.031 (56.723)	Top-5 acc 75.391 (78.781)	lr 0.01681
Train [47][1840/3239]	Time 0.236 (0.571)	Data Time 0.001 (0.047)	Loss 2.6455 (2.7947)	Entropy 0.62578 (0.62941)	Top-1 acc 57.422 (56.718)	Top-5 acc 82.422 (78.778)	lr 0.01681
Train [47][1850/3239]	Time 0.244 (0.570)	Data Time 0.001 (0.046)	Loss 2.8207 (2.7948)	Entropy 0.62565 (0.62939)	Top-1 acc 57.031 (56.715)	Top-5 acc 75.781 (78.780)	lr 0.01680
Train [47][1860/3239]	Time 0.286 (0.573)	Data Time 0.001 (0.049)	Loss 2.9376 (2.7950)	Entropy 0.62562 (0.62937)	Top-1 acc 57.812 (56.711)	Top-5 acc 76.953 (78.774)	lr 0.01680
Train [47][1870/3239]	Time 0.231 (0.572)	Data Time 0.001 (0.049)	Loss 2.6571 (2.7951)	Entropy 0.62591 (0.62935)	Top-1 acc 58.203 (56.707)	Top-5 acc 82.812 (78.772)	lr 0.01680
Train [47][1880/3239]	Time 0.236 (0.572)	Data Time 0.001 (0.049)	Loss 2.8452 (2.7954)	Entropy 0.62609 (0.62933)	Top-1 acc 57.031 (56.700)	Top-5 acc 75.000 (78.766)	lr 0.01680
Train [47][1890/3239]	Time 0.268 (0.574)	Data Time 0.001 (0.052)	Loss 2.8176 (2.7955)	Entropy 0.62633 (0.62931)	Top-1 acc 55.859 (56.695)	Top-5 acc 76.953 (78.762)	lr 0.01680
Train [47][1900/3239]	Time 0.227 (0.573)	Data Time 0.001 (0.052)	Loss 3.0728 (2.7955)	Entropy 0.62655 (0.62930)	Top-1 acc 50.391 (56.695)	Top-5 acc 72.656 (78.762)	lr 0.01680
Train [47][1910/3239]	Time 0.237 (0.572)	Data Time 0.001 (0.051)	Loss 3.0218 (2.7959)	Entropy 0.62658 (0.62928)	Top-1 acc 55.469 (56.694)	Top-5 acc 75.781 (78.751)	lr 0.01680
Train [47][1920/3239]	Time 0.304 (0.576)	Data Time 0.001 (0.055)	Loss 2.8877 (2.7960)	Entropy 0.62653 (0.62927)	Top-1 acc 55.078 (56.690)	Top-5 acc 77.344 (78.748)	lr 0.01680
Train [47][1930/3239]	Time 0.285 (0.575)	Data Time 0.001 (0.055)	Loss 2.7023 (2.7958)	Entropy 0.62674 (0.62925)	Top-1 acc 60.547 (56.694)	Top-5 acc 82.812 (78.754)	lr 0.01680
Train [47][1940/3239]	Time 0.282 (0.575)	Data Time 0.001 (0.054)	Loss 2.8340 (2.7958)	Entropy 0.62649 (0.62924)	Top-1 acc 55.469 (56.692)	Top-5 acc 78.516 (78.757)	lr 0.01680
Train [47][1950/3239]	Time 0.233 (0.574)	Data Time 0.001 (0.054)	Loss 2.8188 (2.7957)	Entropy 0.62644 (0.62923)	Top-1 acc 53.125 (56.688)	Top-5 acc 78.906 (78.757)	lr 0.01680
Train [47][1960/3239]	Time 0.233 (0.577)	Data Time 0.001 (0.057)	Loss 2.6843 (2.7960)	Entropy 0.62594 (0.62921)	Top-1 acc 58.594 (56.679)	Top-5 acc 78.906 (78.751)	lr 0.01679
Train [47][1970/3239]	Time 0.238 (0.576)	Data Time 0.001 (0.057)	Loss 2.7860 (2.7961)	Entropy 0.62653 (0.62920)	Top-1 acc 56.641 (56.677)	Top-5 acc 80.469 (78.751)	lr 0.01679
Train [47][1980/3239]	Time 0.246 (0.576)	Data Time 0.001 (0.057)	Loss 2.7595 (2.7961)	Entropy 0.62643 (0.62918)	Top-1 acc 57.031 (56.678)	Top-5 acc 79.688 (78.750)	lr 0.01679
Train [47][1990/3239]	Time 0.333 (0.578)	Data Time 0.001 (0.059)	Loss 2.7176 (2.7960)	Entropy 0.62624 (0.62917)	Top-1 acc 58.984 (56.678)	Top-5 acc 82.812 (78.752)	lr 0.01679
Train [47][2000/3239]	Time 0.235 (0.577)	Data Time 0.001 (0.059)	Loss 2.7717 (2.7962)	Entropy 0.62652 (0.62915)	Top-1 acc 58.203 (56.674)	Top-5 acc 77.344 (78.747)	lr 0.01679
Train [47][2010/3239]	Time 0.247 (0.576)	Data Time 0.002 (0.059)	Loss 2.9460 (2.7968)	Entropy 0.62653 (0.62914)	Top-1 acc 55.859 (56.664)	Top-5 acc 78.906 (78.735)	lr 0.01679
Train [47][2020/3239]	Time 0.234 (0.578)	Data Time 0.001 (0.061)	Loss 2.7227 (2.7966)	Entropy 0.62635 (0.62913)	Top-1 acc 57.422 (56.665)	Top-5 acc 82.031 (78.742)	lr 0.01679
Train [47][2030/3239]	Time 0.352 (0.578)	Data Time 0.002 (0.061)	Loss 2.9243 (2.7968)	Entropy 0.62641 (0.62911)	Top-1 acc 55.078 (56.660)	Top-5 acc 75.391 (78.740)	lr 0.01679
Train [47][2040/3239]	Time 0.239 (0.578)	Data Time 0.001 (0.061)	Loss 2.7077 (2.7971)	Entropy 0.62645 (0.62910)	Top-1 acc 57.031 (56.656)	Top-5 acc 79.688 (78.735)	lr 0.01679
Train [47][2050/3239]	Time 0.245 (0.581)	Data Time 0.001 (0.065)	Loss 2.8430 (2.7971)	Entropy 0.62640 (0.62909)	Top-1 acc 53.516 (56.654)	Top-5 acc 75.781 (78.732)	lr 0.01679
Train [47][2060/3239]	Time 0.349 (0.580)	Data Time 0.001 (0.064)	Loss 2.9502 (2.7977)	Entropy 0.62664 (0.62908)	Top-1 acc 55.078 (56.641)	Top-5 acc 73.438 (78.718)	lr 0.01678
Train [47][2070/3239]	Time 0.231 (0.579)	Data Time 0.001 (0.064)	Loss 2.7190 (2.7973)	Entropy 0.62691 (0.62906)	Top-1 acc 60.156 (56.650)	Top-5 acc 79.297 (78.723)	lr 0.01678
Train [47][2080/3239]	Time 0.229 (0.582)	Data Time 0.001 (0.068)	Loss 2.6616 (2.7971)	Entropy 0.62715 (0.62905)	Top-1 acc 58.203 (56.649)	Top-5 acc 83.203 (78.725)	lr 0.01678
Train [47][2090/3239]	Time 0.236 (0.582)	Data Time 0.001 (0.068)	Loss 2.7467 (2.7974)	Entropy 0.62730 (0.62904)	Top-1 acc 58.594 (56.639)	Top-5 acc 80.469 (78.719)	lr 0.01678
Train [47][2100/3239]	Time 0.225 (0.581)	Data Time 0.001 (0.067)	Loss 2.9451 (2.7978)	Entropy 0.62723 (0.62904)	Top-1 acc 53.516 (56.637)	Top-5 acc 76.562 (78.711)	lr 0.01678
Train [47][2110/3239]	Time 0.227 (0.580)	Data Time 0.001 (0.067)	Loss 2.8827 (2.7978)	Entropy 0.62782 (0.62903)	Top-1 acc 52.734 (56.637)	Top-5 acc 76.562 (78.708)	lr 0.01678
Train [47][2120/3239]	Time 0.270 (0.582)	Data Time 0.002 (0.069)	Loss 2.6486 (2.7977)	Entropy 0.62789 (0.62902)	Top-1 acc 62.891 (56.641)	Top-5 acc 82.031 (78.706)	lr 0.01678
Train [47][2130/3239]	Time 0.231 (0.581)	Data Time 0.001 (0.069)	Loss 2.8896 (2.7978)	Entropy 0.62816 (0.62902)	Top-1 acc 56.250 (56.640)	Top-5 acc 76.953 (78.704)	lr 0.01678
Train [47][2140/3239]	Time 0.278 (0.581)	Data Time 0.002 (0.069)	Loss 2.9941 (2.7981)	Entropy 0.62812 (0.62901)	Top-1 acc 56.641 (56.637)	Top-5 acc 76.562 (78.700)	lr 0.01678
Train [47][2150/3239]	Time 0.330 (0.583)	Data Time 0.001 (0.071)	Loss 2.9853 (2.7983)	Entropy 0.62813 (0.62901)	Top-1 acc 57.812 (56.638)	Top-5 acc 74.609 (78.699)	lr 0.01678
Train [47][2160/3239]	Time 0.261 (0.582)	Data Time 0.001 (0.071)	Loss 2.9513 (2.7980)	Entropy 0.62823 (0.62901)	Top-1 acc 53.516 (56.647)	Top-5 acc 74.219 (78.706)	lr 0.01678
Train [47][2170/3239]	Time 0.242 (0.581)	Data Time 0.001 (0.071)	Loss 2.6911 (2.7981)	Entropy 0.62814 (0.62900)	Top-1 acc 58.203 (56.647)	Top-5 acc 81.641 (78.705)	lr 0.01677
Train [47][2180/3239]	Time 0.264 (0.585)	Data Time 0.001 (0.075)	Loss 2.6766 (2.7979)	Entropy 0.62836 (0.62900)	Top-1 acc 57.812 (56.646)	Top-5 acc 80.469 (78.708)	lr 0.01677
Train [47][2190/3239]	Time 0.272 (0.584)	Data Time 0.001 (0.075)	Loss 2.7557 (2.7979)	Entropy 0.62821 (0.62900)	Top-1 acc 59.766 (56.650)	Top-5 acc 80.078 (78.708)	lr 0.01677
Train [47][2200/3239]	Time 0.238 (0.583)	Data Time 0.001 (0.074)	Loss 2.7299 (2.7978)	Entropy 0.62827 (0.62899)	Top-1 acc 58.594 (56.653)	Top-5 acc 80.859 (78.710)	lr 0.01677
Train [47][2210/3239]	Time 0.235 (0.588)	Data Time 0.001 (0.079)	Loss 2.7945 (2.7982)	Entropy 0.62829 (0.62899)	Top-1 acc 59.375 (56.644)	Top-5 acc 78.906 (78.700)	lr 0.01677
Train [47][2220/3239]	Time 0.346 (0.587)	Data Time 0.001 (0.079)	Loss 2.9265 (2.7979)	Entropy 0.62817 (0.62899)	Top-1 acc 50.781 (56.649)	Top-5 acc 75.391 (78.705)	lr 0.01677
Train [47][2230/3239]	Time 0.234 (0.586)	Data Time 0.001 (0.078)	Loss 2.9909 (2.7978)	Entropy 0.62836 (0.62898)	Top-1 acc 50.000 (56.647)	Top-5 acc 78.906 (78.709)	lr 0.01677
Train [47][2240/3239]	Time 0.344 (0.602)	Data Time 0.003 (0.078)	Loss 2.8681 (2.7982)	Entropy 0.62842 (0.62898)	Top-1 acc 57.031 (56.644)	Top-5 acc 76.172 (78.701)	lr 0.01677
Train [47][2250/3239]	Time 0.257 (0.601)	Data Time 0.002 (0.078)	Loss 2.6819 (2.7981)	Entropy 0.62827 (0.62898)	Top-1 acc 60.156 (56.648)	Top-5 acc 81.641 (78.703)	lr 0.01677
Train [47][2260/3239]	Time 0.253 (0.600)	Data Time 0.002 (0.077)	Loss 2.9092 (2.7977)	Entropy 0.62797 (0.62897)	Top-1 acc 49.219 (56.650)	Top-5 acc 75.000 (78.710)	lr 0.01677
Train [47][2270/3239]	Time 0.230 (0.599)	Data Time 0.001 (0.077)	Loss 2.9947 (2.7979)	Entropy 0.62805 (0.62897)	Top-1 acc 50.781 (56.647)	Top-5 acc 75.781 (78.707)	lr 0.01676
Train [47][2280/3239]	Time 0.246 (0.599)	Data Time 0.001 (0.077)	Loss 2.7627 (2.7978)	Entropy 0.62834 (0.62896)	Top-1 acc 56.641 (56.649)	Top-5 acc 79.688 (78.706)	lr 0.01676
Train [47][2290/3239]	Time 0.292 (0.598)	Data Time 0.002 (0.076)	Loss 2.7244 (2.7978)	Entropy 0.62863 (0.62896)	Top-1 acc 57.812 (56.650)	Top-5 acc 81.250 (78.706)	lr 0.01676
Train [47][2300/3239]	Time 0.231 (0.598)	Data Time 0.001 (0.076)	Loss 2.8987 (2.7979)	Entropy 0.62854 (0.62896)	Top-1 acc 54.297 (56.642)	Top-5 acc 78.516 (78.706)	lr 0.01676
Train [47][2310/3239]	Time 1.216 (0.597)	Data Time 0.859 (0.076)	Loss 2.8985 (2.7978)	Entropy 0.62869 (0.62896)	Top-1 acc 56.641 (56.650)	Top-5 acc 75.781 (78.709)	lr 0.01676
Train [47][2320/3239]	Time 0.234 (0.597)	Data Time 0.001 (0.076)	Loss 2.7576 (2.7976)	Entropy 0.62866 (0.62896)	Top-1 acc 61.328 (56.651)	Top-5 acc 80.078 (78.714)	lr 0.01676
Train [47][2330/3239]	Time 0.235 (0.596)	Data Time 0.001 (0.076)	Loss 2.9531 (2.7979)	Entropy 0.62842 (0.62896)	Top-1 acc 51.172 (56.646)	Top-5 acc 76.172 (78.706)	lr 0.01676
Train [47][2340/3239]	Time 0.262 (0.601)	Data Time 0.001 (0.080)	Loss 2.6723 (2.7980)	Entropy 0.62842 (0.62895)	Top-1 acc 57.812 (56.644)	Top-5 acc 80.469 (78.705)	lr 0.01676
Train [47][2350/3239]	Time 0.623 (0.602)	Data Time 0.343 (0.082)	Loss 2.7869 (2.7982)	Entropy 0.62859 (0.62895)	Top-1 acc 62.109 (56.641)	Top-5 acc 77.344 (78.701)	lr 0.01676
Train [47][2360/3239]	Time 0.236 (0.601)	Data Time 0.001 (0.081)	Loss 2.8035 (2.7984)	Entropy 0.62898 (0.62895)	Top-1 acc 53.906 (56.638)	Top-5 acc 80.078 (78.699)	lr 0.01676
Train [47][2370/3239]	Time 1.709 (0.604)	Data Time 1.444 (0.085)	Loss 2.8112 (2.7985)	Entropy 0.62907 (0.62895)	Top-1 acc 52.734 (56.633)	Top-5 acc 76.562 (78.693)	lr 0.01676
Train [47][2380/3239]	Time 0.356 (0.604)	Data Time 0.001 (0.085)	Loss 2.7696 (2.7987)	Entropy 0.62929 (0.62895)	Top-1 acc 53.516 (56.630)	Top-5 acc 82.812 (78.693)	lr 0.01675
Train [47][2390/3239]	Time 0.230 (0.605)	Data Time 0.001 (0.087)	Loss 3.0685 (2.7988)	Entropy 0.62950 (0.62895)	Top-1 acc 52.734 (56.624)	Top-5 acc 75.000 (78.691)	lr 0.01675
Train [47][2400/3239]	Time 0.239 (0.608)	Data Time 0.001 (0.090)	Loss 2.5510 (2.7989)	Entropy 0.62933 (0.62896)	Top-1 acc 65.625 (56.625)	Top-5 acc 82.031 (78.687)	lr 0.01675
Train [47][2410/3239]	Time 0.229 (0.608)	Data Time 0.001 (0.091)	Loss 3.1757 (2.7990)	Entropy 0.62982 (0.62896)	Top-1 acc 47.266 (56.623)	Top-5 acc 71.484 (78.688)	lr 0.01675
Train [47][2420/3239]	Time 0.235 (0.609)	Data Time 0.001 (0.092)	Loss 2.6489 (2.7987)	Entropy 0.63005 (0.62896)	Top-1 acc 60.547 (56.630)	Top-5 acc 80.469 (78.691)	lr 0.01675
Train [47][2430/3239]	Time 0.274 (0.612)	Data Time 0.041 (0.095)	Loss 2.8476 (2.7988)	Entropy 0.62984 (0.62897)	Top-1 acc 57.812 (56.628)	Top-5 acc 77.344 (78.690)	lr 0.01675
Train [47][2440/3239]	Time 0.243 (0.613)	Data Time 0.001 (0.096)	Loss 2.9081 (2.7993)	Entropy 0.62988 (0.62897)	Top-1 acc 55.078 (56.617)	Top-5 acc 75.781 (78.683)	lr 0.01675
Train [47][2450/3239]	Time 0.235 (0.612)	Data Time 0.001 (0.096)	Loss 3.0165 (2.7993)	Entropy 0.63005 (0.62897)	Top-1 acc 49.219 (56.614)	Top-5 acc 72.656 (78.681)	lr 0.01675
Train [47][2460/3239]	Time 0.229 (0.615)	Data Time 0.001 (0.100)	Loss 2.7459 (2.7992)	Entropy 0.63039 (0.62898)	Top-1 acc 57.422 (56.616)	Top-5 acc 78.516 (78.685)	lr 0.01675
Train [47][2470/3239]	Time 0.349 (0.618)	Data Time 0.001 (0.103)	Loss 3.0044 (2.7993)	Entropy 0.63004 (0.62898)	Top-1 acc 48.828 (56.614)	Top-5 acc 72.266 (78.683)	lr 0.01675
Train [47][2480/3239]	Time 0.323 (0.617)	Data Time 0.079 (0.102)	Loss 2.7909 (2.7993)	Entropy 0.63008 (0.62899)	Top-1 acc 57.422 (56.615)	Top-5 acc 80.859 (78.685)	lr 0.01674
Train [47][2490/3239]	Time 0.228 (0.618)	Data Time 0.001 (0.104)	Loss 2.7681 (2.7990)	Entropy 0.63046 (0.62899)	Top-1 acc 59.766 (56.620)	Top-5 acc 81.250 (78.692)	lr 0.01674
Train [47][2500/3239]	Time 0.237 (0.621)	Data Time 0.001 (0.107)	Loss 2.6161 (2.7987)	Entropy 0.63042 (0.62900)	Top-1 acc 62.891 (56.624)	Top-5 acc 79.688 (78.695)	lr 0.01674
Train [47][2510/3239]	Time 0.217 (0.620)	Data Time 0.001 (0.107)	Loss 3.0205 (2.7989)	Entropy 0.63083 (0.62900)	Top-1 acc 51.172 (56.617)	Top-5 acc 74.609 (78.690)	lr 0.01674
Train [47][2520/3239]	Time 0.294 (0.623)	Data Time 0.002 (0.109)	Loss 2.7353 (2.7987)	Entropy 0.63140 (0.62901)	Top-1 acc 54.688 (56.617)	Top-5 acc 77.734 (78.693)	lr 0.01674
Train [47][2530/3239]	Time 0.249 (0.625)	Data Time 0.001 (0.112)	Loss 2.9116 (2.7990)	Entropy 0.63147 (0.62902)	Top-1 acc 55.469 (56.611)	Top-5 acc 75.781 (78.691)	lr 0.01674
Train [47][2540/3239]	Time 0.373 (0.625)	Data Time 0.001 (0.112)	Loss 2.8852 (2.7989)	Entropy 0.63129 (0.62903)	Top-1 acc 58.984 (56.616)	Top-5 acc 75.391 (78.695)	lr 0.01674
Train [47][2550/3239]	Time 0.263 (0.626)	Data Time 0.001 (0.113)	Loss 2.8202 (2.7988)	Entropy 0.63098 (0.62904)	Top-1 acc 55.469 (56.616)	Top-5 acc 78.125 (78.695)	lr 0.01674
Train [47][2560/3239]	Time 0.301 (0.630)	Data Time 0.070 (0.118)	Loss 2.8476 (2.7990)	Entropy 0.63060 (0.62905)	Top-1 acc 57.031 (56.612)	Top-5 acc 79.297 (78.692)	lr 0.01674
Train [47][2570/3239]	Time 0.236 (0.629)	Data Time 0.001 (0.117)	Loss 2.6378 (2.7989)	Entropy 0.63038 (0.62905)	Top-1 acc 62.109 (56.612)	Top-5 acc 81.250 (78.694)	lr 0.01674
Train [47][2580/3239]	Time 0.233 (0.630)	Data Time 0.001 (0.118)	Loss 2.6446 (2.7986)	Entropy 0.63064 (0.62906)	Top-1 acc 59.766 (56.617)	Top-5 acc 80.078 (78.700)	lr 0.01674
Train [47][2590/3239]	Time 0.224 (0.634)	Data Time 0.001 (0.123)	Loss 2.9161 (2.7990)	Entropy 0.63038 (0.62906)	Top-1 acc 53.125 (56.608)	Top-5 acc 78.125 (78.689)	lr 0.01673
Train [47][2600/3239]	Time 0.234 (0.634)	Data Time 0.001 (0.123)	Loss 2.8660 (2.7991)	Entropy 0.63045 (0.62907)	Top-1 acc 55.078 (56.604)	Top-5 acc 78.125 (78.688)	lr 0.01673
Train [47][2610/3239]	Time 0.227 (0.634)	Data Time 0.001 (0.124)	Loss 2.9164 (2.7994)	Entropy 0.63025 (0.62907)	Top-1 acc 54.688 (56.596)	Top-5 acc 78.906 (78.682)	lr 0.01673
Train [47][2620/3239]	Time 0.237 (0.639)	Data Time 0.001 (0.129)	Loss 2.9878 (2.7995)	Entropy 0.63013 (0.62908)	Top-1 acc 55.078 (56.591)	Top-5 acc 75.391 (78.678)	lr 0.01673
Train [47][2630/3239]	Time 0.246 (0.638)	Data Time 0.001 (0.128)	Loss 2.9530 (2.7996)	Entropy 0.63029 (0.62908)	Top-1 acc 54.297 (56.590)	Top-5 acc 76.172 (78.675)	lr 0.01673
Train [47][2640/3239]	Time 3.102 (0.638)	Data Time 2.855 (0.129)	Loss 2.8421 (2.7997)	Entropy 0.63023 (0.62909)	Top-1 acc 54.297 (56.591)	Top-5 acc 76.953 (78.672)	lr 0.01673
Train [47][2650/3239]	Time 0.227 (0.639)	Data Time 0.001 (0.130)	Loss 2.7047 (2.7996)	Entropy 0.63010 (0.62909)	Top-1 acc 53.906 (56.595)	Top-5 acc 81.641 (78.679)	lr 0.01673
Train [47][2660/3239]	Time 0.294 (0.642)	Data Time 0.001 (0.134)	Loss 2.7632 (2.7995)	Entropy 0.63038 (0.62910)	Top-1 acc 59.375 (56.599)	Top-5 acc 80.078 (78.679)	lr 0.01673
Train [47][2670/3239]	Time 0.240 (0.642)	Data Time 0.001 (0.134)	Loss 3.1608 (2.7997)	Entropy 0.63027 (0.62910)	Top-1 acc 47.656 (56.593)	Top-5 acc 71.875 (78.677)	lr 0.01673
Train [47][2680/3239]	Time 0.251 (0.645)	Data Time 0.001 (0.137)	Loss 2.7146 (2.7996)	Entropy 0.62989 (0.62910)	Top-1 acc 60.156 (56.596)	Top-5 acc 78.906 (78.678)	lr 0.01673
Train [47][2690/3239]	Time 0.231 (0.646)	Data Time 0.001 (0.139)	Loss 2.6678 (2.7997)	Entropy 0.63006 (0.62911)	Top-1 acc 60.938 (56.590)	Top-5 acc 82.422 (78.676)	lr 0.01672
Train [47][2700/3239]	Time 0.361 (0.645)	Data Time 0.001 (0.139)	Loss 2.6811 (2.7997)	Entropy 0.63013 (0.62911)	Top-1 acc 58.984 (56.591)	Top-5 acc 80.469 (78.679)	lr 0.01672
Train [47][2710/3239]	Time 0.234 (0.646)	Data Time 0.001 (0.140)	Loss 2.6616 (2.7998)	Entropy 0.63004 (0.62911)	Top-1 acc 58.203 (56.585)	Top-5 acc 80.859 (78.677)	lr 0.01672
Train [47][2720/3239]	Time 0.239 (0.647)	Data Time 0.001 (0.140)	Loss 2.6886 (2.7998)	Entropy 0.62988 (0.62912)	Top-1 acc 58.984 (56.587)	Top-5 acc 80.859 (78.680)	lr 0.01672
Train [47][2730/3239]	Time 0.322 (0.646)	Data Time 0.002 (0.140)	Loss 2.8660 (2.7997)	Entropy 0.62997 (0.62912)	Top-1 acc 55.859 (56.589)	Top-5 acc 75.391 (78.685)	lr 0.01672
Train [47][2740/3239]	Time 0.223 (0.645)	Data Time 0.001 (0.139)	Loss 2.7871 (2.7997)	Entropy 0.63002 (0.62912)	Top-1 acc 54.297 (56.589)	Top-5 acc 80.859 (78.684)	lr 0.01672
Train [47][2750/3239]	Time 0.225 (0.648)	Data Time 0.001 (0.142)	Loss 3.0030 (2.7997)	Entropy 0.63016 (0.62913)	Top-1 acc 50.781 (56.588)	Top-5 acc 75.781 (78.684)	lr 0.01672
Train [47][2760/3239]	Time 0.225 (0.648)	Data Time 0.001 (0.143)	Loss 2.8209 (2.7996)	Entropy 0.63029 (0.62913)	Top-1 acc 56.641 (56.591)	Top-5 acc 78.516 (78.684)	lr 0.01672
Train [47][2770/3239]	Time 0.336 (0.648)	Data Time 0.001 (0.143)	Loss 2.7899 (2.7996)	Entropy 0.63001 (0.62914)	Top-1 acc 56.250 (56.591)	Top-5 acc 79.688 (78.687)	lr 0.01672
Train [47][2780/3239]	Time 0.238 (0.653)	Data Time 0.001 (0.149)	Loss 2.8732 (2.7997)	Entropy 0.63011 (0.62914)	Top-1 acc 51.562 (56.589)	Top-5 acc 77.344 (78.686)	lr 0.01672
Train [47][2790/3239]	Time 0.238 (0.653)	Data Time 0.001 (0.148)	Loss 2.6153 (2.7995)	Entropy 0.62994 (0.62914)	Top-1 acc 60.547 (56.594)	Top-5 acc 80.469 (78.690)	lr 0.01672
Train [47][2800/3239]	Time 0.221 (0.652)	Data Time 0.001 (0.148)	Loss 2.6844 (2.7994)	Entropy 0.63001 (0.62914)	Top-1 acc 57.812 (56.594)	Top-5 acc 78.516 (78.690)	lr 0.01671
Train [47][2810/3239]	Time 0.228 (0.656)	Data Time 0.001 (0.152)	Loss 2.8138 (2.7993)	Entropy 0.63005 (0.62915)	Top-1 acc 58.594 (56.597)	Top-5 acc 77.344 (78.693)	lr 0.01671
Train [47][2820/3239]	Time 0.230 (0.656)	Data Time 0.001 (0.153)	Loss 2.8607 (2.7993)	Entropy 0.63023 (0.62915)	Top-1 acc 56.250 (56.596)	Top-5 acc 75.000 (78.691)	lr 0.01671
Train [47][2830/3239]	Time 3.576 (0.657)	Data Time 3.311 (0.154)	Loss 2.6255 (2.7994)	Entropy 0.63004 (0.62915)	Top-1 acc 58.203 (56.593)	Top-5 acc 84.375 (78.691)	lr 0.01671
Train [47][2840/3239]	Time 0.224 (0.659)	Data Time 0.001 (0.156)	Loss 2.7317 (2.7993)	Entropy 0.62979 (0.62916)	Top-1 acc 56.250 (56.599)	Top-5 acc 77.344 (78.693)	lr 0.01671
Train [47][2850/3239]	Time 0.223 (0.660)	Data Time 0.001 (0.158)	Loss 2.7615 (2.7993)	Entropy 0.62948 (0.62916)	Top-1 acc 57.812 (56.600)	Top-5 acc 80.078 (78.689)	lr 0.01671
Train [47][2860/3239]	Time 3.751 (0.660)	Data Time 3.411 (0.158)	Loss 2.8329 (2.7993)	Entropy 0.62922 (0.62916)	Top-1 acc 54.688 (56.598)	Top-5 acc 77.344 (78.692)	lr 0.01671
Train [47][2870/3239]	Time 0.245 (0.661)	Data Time 0.001 (0.159)	Loss 2.7495 (2.7995)	Entropy 0.62877 (0.62916)	Top-1 acc 58.594 (56.589)	Top-5 acc 77.344 (78.684)	lr 0.01671
Train [47][2880/3239]	Time 0.252 (0.662)	Data Time 0.001 (0.160)	Loss 2.6603 (2.7996)	Entropy 0.62903 (0.62916)	Top-1 acc 59.375 (56.582)	Top-5 acc 82.031 (78.682)	lr 0.01671
Train [47][2890/3239]	Time 0.304 (0.674)	Data Time 0.005 (0.160)	Loss 3.0507 (2.7997)	Entropy 0.62905 (0.62916)	Top-1 acc 48.438 (56.576)	Top-5 acc 74.219 (78.683)	lr 0.01671
Train [47][2900/3239]	Time 0.284 (0.673)	Data Time 0.002 (0.159)	Loss 2.7284 (2.7998)	Entropy 0.62931 (0.62916)	Top-1 acc 53.125 (56.570)	Top-5 acc 83.984 (78.686)	lr 0.01670
Train [47][2910/3239]	Time 0.263 (0.672)	Data Time 0.002 (0.159)	Loss 2.9493 (2.7999)	Entropy 0.62920 (0.62916)	Top-1 acc 53.906 (56.568)	Top-5 acc 78.125 (78.685)	lr 0.01670
Train [47][2920/3239]	Time 0.249 (0.672)	Data Time 0.001 (0.158)	Loss 2.8693 (2.8000)	Entropy 0.62907 (0.62916)	Top-1 acc 52.734 (56.563)	Top-5 acc 77.734 (78.684)	lr 0.01670
Train [47][2930/3239]	Time 0.549 (0.671)	Data Time 0.002 (0.158)	Loss 2.7202 (2.7997)	Entropy 0.62916 (0.62916)	Top-1 acc 60.547 (56.564)	Top-5 acc 78.906 (78.689)	lr 0.01670
Train [47][2940/3239]	Time 0.254 (0.671)	Data Time 0.001 (0.157)	Loss 2.7176 (2.7999)	Entropy 0.62888 (0.62916)	Top-1 acc 57.812 (56.560)	Top-5 acc 78.906 (78.687)	lr 0.01670
Train [47][2950/3239]	Time 0.253 (0.670)	Data Time 0.001 (0.157)	Loss 2.4909 (2.7999)	Entropy 0.62903 (0.62916)	Top-1 acc 64.453 (56.562)	Top-5 acc 83.984 (78.686)	lr 0.01670
Train [47][2960/3239]	Time 0.254 (0.669)	Data Time 0.001 (0.156)	Loss 2.8850 (2.8000)	Entropy 0.62933 (0.62916)	Top-1 acc 53.516 (56.561)	Top-5 acc 79.688 (78.680)	lr 0.01670
Train [47][2970/3239]	Time 0.275 (0.668)	Data Time 0.002 (0.156)	Loss 2.6754 (2.7999)	Entropy 0.62952 (0.62916)	Top-1 acc 57.812 (56.561)	Top-5 acc 83.203 (78.684)	lr 0.01670
Train [47][2980/3239]	Time 0.249 (0.668)	Data Time 0.001 (0.155)	Loss 2.7254 (2.8000)	Entropy 0.62955 (0.62916)	Top-1 acc 60.156 (56.560)	Top-5 acc 79.688 (78.682)	lr 0.01670
Train [47][2990/3239]	Time 0.261 (0.670)	Data Time 0.001 (0.157)	Loss 2.6803 (2.8000)	Entropy 0.62934 (0.62916)	Top-1 acc 60.156 (56.560)	Top-5 acc 81.250 (78.686)	lr 0.01670
Train [47][3000/3239]	Time 0.275 (0.672)	Data Time 0.001 (0.159)	Loss 2.6760 (2.8000)	Entropy 0.62939 (0.62916)	Top-1 acc 60.547 (56.562)	Top-5 acc 79.688 (78.686)	lr 0.01670
Train [47][3010/3239]	Time 0.306 (0.673)	Data Time 0.003 (0.161)	Loss 2.9203 (2.8002)	Entropy 0.62955 (0.62916)	Top-1 acc 50.781 (56.557)	Top-5 acc 75.781 (78.679)	lr 0.01669
Train [47][3020/3239]	Time 6.647 (0.675)	Data Time 6.239 (0.163)	Loss 2.7065 (2.8002)	Entropy 0.62957 (0.62917)	Top-1 acc 59.375 (56.557)	Top-5 acc 81.641 (78.678)	lr 0.01669
Train [47][3030/3239]	Time 1.864 (0.676)	Data Time 1.597 (0.164)	Loss 2.6918 (2.8002)	Entropy 0.62960 (0.62917)	Top-1 acc 61.328 (56.558)	Top-5 acc 80.078 (78.678)	lr 0.01669
Train [47][3040/3239]	Time 0.256 (0.678)	Data Time 0.001 (0.167)	Loss 2.7197 (2.8000)	Entropy 0.62956 (0.62917)	Top-1 acc 60.547 (56.565)	Top-5 acc 80.078 (78.681)	lr 0.01669
Train [47][3050/3239]	Time 0.251 (0.678)	Data Time 0.002 (0.167)	Loss 2.8795 (2.8000)	Entropy 0.62960 (0.62917)	Top-1 acc 57.812 (56.565)	Top-5 acc 75.781 (78.680)	lr 0.01669
Train [47][3060/3239]	Time 3.195 (0.681)	Data Time 2.932 (0.169)	Loss 2.7446 (2.7999)	Entropy 0.62951 (0.62917)	Top-1 acc 60.156 (56.569)	Top-5 acc 78.516 (78.681)	lr 0.01669
Train [47][3070/3239]	Time 0.255 (0.683)	Data Time 0.001 (0.171)	Loss 2.8830 (2.7996)	Entropy 0.62909 (0.62917)	Top-1 acc 54.297 (56.571)	Top-5 acc 79.688 (78.687)	lr 0.01669
Train [47][3080/3239]	Time 0.267 (0.683)	Data Time 0.001 (0.172)	Loss 2.7283 (2.7995)	Entropy 0.62894 (0.62917)	Top-1 acc 62.109 (56.575)	Top-5 acc 76.953 (78.688)	lr 0.01669
Train [47][3090/3239]	Time 0.370 (0.684)	Data Time 0.001 (0.174)	Loss 2.8006 (2.7995)	Entropy 0.62901 (0.62917)	Top-1 acc 55.859 (56.577)	Top-5 acc 77.734 (78.687)	lr 0.01669
Train [47][3100/3239]	Time 1.753 (0.687)	Data Time 1.495 (0.177)	Loss 2.7883 (2.7993)	Entropy 0.62923 (0.62917)	Top-1 acc 51.562 (56.579)	Top-5 acc 78.906 (78.690)	lr 0.01669
Train [47][3110/3239]	Time 0.236 (0.688)	Data Time 0.001 (0.178)	Loss 2.7916 (2.7991)	Entropy 0.62928 (0.62917)	Top-1 acc 57.422 (56.582)	Top-5 acc 77.344 (78.694)	lr 0.01668
Train [47][3120/3239]	Time 0.242 (0.690)	Data Time 0.001 (0.180)	Loss 2.8472 (2.7995)	Entropy 0.62967 (0.62917)	Top-1 acc 54.688 (56.571)	Top-5 acc 78.125 (78.689)	lr 0.01668
Train [47][3130/3239]	Time 0.293 (0.692)	Data Time 0.005 (0.182)	Loss 2.8604 (2.7997)	Entropy 0.62960 (0.62917)	Top-1 acc 54.297 (56.565)	Top-5 acc 77.734 (78.686)	lr 0.01668
Train [47][3140/3239]	Time 0.239 (0.693)	Data Time 0.001 (0.183)	Loss 2.7577 (2.7995)	Entropy 0.62975 (0.62917)	Top-1 acc 55.469 (56.568)	Top-5 acc 80.078 (78.690)	lr 0.01668
Train [47][3150/3239]	Time 0.246 (0.694)	Data Time 0.001 (0.184)	Loss 2.7721 (2.7994)	Entropy 0.62994 (0.62917)	Top-1 acc 53.906 (56.567)	Top-5 acc 76.953 (78.689)	lr 0.01668
Train [47][3160/3239]	Time 1.508 (0.696)	Data Time 1.253 (0.187)	Loss 2.7683 (2.7996)	Entropy 0.63010 (0.62918)	Top-1 acc 56.250 (56.564)	Top-5 acc 77.344 (78.685)	lr 0.01668
Train [47][3170/3239]	Time 0.251 (0.698)	Data Time 0.002 (0.189)	Loss 2.5859 (2.7994)	Entropy 0.63002 (0.62918)	Top-1 acc 57.031 (56.568)	Top-5 acc 84.375 (78.685)	lr 0.01668
Train [47][3180/3239]	Time 5.171 (0.699)	Data Time 4.832 (0.190)	Loss 2.7862 (2.7993)	Entropy 0.63040 (0.62918)	Top-1 acc 55.859 (56.570)	Top-5 acc 79.688 (78.688)	lr 0.01668
Train [47][3190/3239]	Time 2.708 (0.700)	Data Time 2.429 (0.192)	Loss 2.7254 (2.7992)	Entropy 0.63045 (0.62919)	Top-1 acc 57.031 (56.571)	Top-5 acc 80.078 (78.688)	lr 0.01668
Train [47][3200/3239]	Time 0.317 (0.703)	Data Time 0.000 (0.194)	Loss 2.7199 (2.7991)	Entropy 0.63077 (0.62919)	Top-1 acc 56.250 (56.573)	Top-5 acc 81.250 (78.693)	lr 0.01668
Train [47][3210/3239]	Time 0.258 (0.702)	Data Time 0.000 (0.193)	Loss 2.7315 (2.7992)	Entropy 0.63067 (0.62920)	Top-1 acc 58.984 (56.571)	Top-5 acc 83.203 (78.693)	lr 0.01668
Train [47][3220/3239]	Time 0.246 (0.703)	Data Time 0.000 (0.195)	Loss 2.7769 (2.7992)	Entropy 0.63061 (0.62920)	Top-1 acc 58.203 (56.569)	Top-5 acc 78.906 (78.694)	lr 0.01667
Train [47][3230/3239]	Time 0.257 (0.704)	Data Time 0.000 (0.196)	Loss 2.9175 (2.7992)	Entropy 0.63056 (0.62921)	Top-1 acc 52.344 (56.569)	Top-5 acc 77.734 (78.691)	lr 0.01667
Train [47][3239/3239]	Time 1.022 (0.704)	Data Time 0.000 (0.196)	Loss 2.9448 (2.7992)	Entropy 0.63063 (0.62921)	Top-1 acc 53.086 (56.568)	Top-5 acc 82.716 (78.692)	lr 0.01667
==========Valid [47/120]	loss 1.545	top-1 acc 64.864 (64.864)	top-5 acc 85.475	Train top-1 56.568	top-5 78.692	Entropy 0.63063	Latency-None: 0.000ms	Flops: 538.40M
Train [48][0/3239]	Time 42.246 (42.246)	Data Time 40.371 (40.371)	Loss 2.4227 (2.4227)	Entropy 0.63087 (0.63087)	Top-1 acc 66.406 (66.406)	Top-5 acc 85.547 (85.547)	lr 0.01667
Train [48][10/3239]	Time 0.281 (4.275)	Data Time 0.003 (3.675)	Loss 2.7407 (2.8103)	Entropy 0.63127 (0.63099)	Top-1 acc 56.641 (56.143)	Top-5 acc 77.734 (78.054)	lr 0.01667
Train [48][20/3239]	Time 0.238 (2.481)	Data Time 0.001 (1.926)	Loss 2.8050 (2.8022)	Entropy 0.63142 (0.63112)	Top-1 acc 54.688 (56.306)	Top-5 acc 77.734 (77.995)	lr 0.01667
Train [48][30/3239]	Time 0.271 (1.831)	Data Time 0.001 (1.305)	Loss 2.9280 (2.8037)	Entropy 0.63182 (0.63125)	Top-1 acc 57.422 (56.363)	Top-5 acc 78.516 (78.100)	lr 0.01667
Train [48][40/3239]	Time 0.260 (1.502)	Data Time 0.001 (0.987)	Loss 2.7049 (2.8064)	Entropy 0.63180 (0.63139)	Top-1 acc 58.984 (56.193)	Top-5 acc 80.859 (78.268)	lr 0.01667
Train [48][50/3239]	Time 0.238 (1.298)	Data Time 0.001 (0.794)	Loss 2.8165 (2.8031)	Entropy 0.63174 (0.63147)	Top-1 acc 58.984 (56.441)	Top-5 acc 78.516 (78.500)	lr 0.01667
Train [48][60/3239]	Time 0.246 (1.161)	Data Time 0.001 (0.664)	Loss 2.7768 (2.7878)	Entropy 0.63167 (0.63150)	Top-1 acc 56.250 (56.660)	Top-5 acc 75.781 (78.836)	lr 0.01667
Train [48][70/3239]	Time 0.296 (1.063)	Data Time 0.002 (0.571)	Loss 2.8805 (2.7849)	Entropy 0.63210 (0.63155)	Top-1 acc 57.812 (56.877)	Top-5 acc 75.391 (78.840)	lr 0.01667
Train [48][80/3239]	Time 0.357 (0.987)	Data Time 0.001 (0.501)	Loss 2.9498 (2.7896)	Entropy 0.63238 (0.63162)	Top-1 acc 55.078 (56.805)	Top-5 acc 77.344 (78.766)	lr 0.01666
Train [48][90/3239]	Time 0.246 (0.929)	Data Time 0.001 (0.446)	Loss 2.6553 (2.7914)	Entropy 0.63193 (0.63169)	Top-1 acc 58.594 (56.791)	Top-5 acc 80.078 (78.795)	lr 0.01666
Train [48][100/3239]	Time 0.240 (0.879)	Data Time 0.001 (0.402)	Loss 2.6277 (2.7904)	Entropy 0.63211 (0.63172)	Top-1 acc 60.547 (56.795)	Top-5 acc 79.688 (78.852)	lr 0.01666
Train [48][110/3239]	Time 0.234 (0.842)	Data Time 0.001 (0.366)	Loss 2.9190 (2.7943)	Entropy 0.63240 (0.63177)	Top-1 acc 53.125 (56.834)	Top-5 acc 75.781 (78.868)	lr 0.01666
Train [48][120/3239]	Time 0.243 (0.810)	Data Time 0.001 (0.336)	Loss 2.8625 (2.7911)	Entropy 0.63215 (0.63182)	Top-1 acc 58.984 (56.909)	Top-5 acc 78.516 (78.948)	lr 0.01666
Train [48][130/3239]	Time 0.234 (0.781)	Data Time 0.001 (0.310)	Loss 2.7990 (2.7874)	Entropy 0.63220 (0.63185)	Top-1 acc 57.031 (57.064)	Top-5 acc 79.688 (79.026)	lr 0.01666
Train [48][140/3239]	Time 0.239 (0.757)	Data Time 0.001 (0.288)	Loss 2.8755 (2.7882)	Entropy 0.63227 (0.63188)	Top-1 acc 51.953 (56.990)	Top-5 acc 78.906 (79.025)	lr 0.01666
Train [48][150/3239]	Time 0.382 (0.736)	Data Time 0.001 (0.269)	Loss 2.7455 (2.7873)	Entropy 0.63231 (0.63190)	Top-1 acc 57.422 (57.000)	Top-5 acc 81.250 (79.041)	lr 0.01666
Train [48][160/3239]	Time 0.247 (0.719)	Data Time 0.001 (0.253)	Loss 2.7513 (2.7894)	Entropy 0.63259 (0.63193)	Top-1 acc 57.812 (56.985)	Top-5 acc 78.125 (78.989)	lr 0.01666
Train [48][170/3239]	Time 0.271 (0.702)	Data Time 0.001 (0.238)	Loss 2.8804 (2.7873)	Entropy 0.63286 (0.63198)	Top-1 acc 55.469 (57.043)	Top-5 acc 76.953 (79.007)	lr 0.01666
Train [48][180/3239]	Time 0.234 (0.690)	Data Time 0.001 (0.225)	Loss 2.8622 (2.7877)	Entropy 0.63315 (0.63203)	Top-1 acc 54.688 (56.969)	Top-5 acc 76.953 (78.965)	lr 0.01666
Train [48][190/3239]	Time 0.239 (0.678)	Data Time 0.003 (0.213)	Loss 2.7133 (2.7874)	Entropy 0.63328 (0.63209)	Top-1 acc 57.031 (56.921)	Top-5 acc 80.469 (78.966)	lr 0.01665
Train [48][200/3239]	Time 0.298 (0.668)	Data Time 0.002 (0.203)	Loss 2.6407 (2.7906)	Entropy 0.63283 (0.63214)	Top-1 acc 62.500 (56.849)	Top-5 acc 85.938 (78.947)	lr 0.01665
Train [48][210/3239]	Time 0.257 (0.659)	Data Time 0.002 (0.193)	Loss 2.8561 (2.7878)	Entropy 0.63271 (0.63218)	Top-1 acc 53.906 (56.905)	Top-5 acc 75.781 (78.956)	lr 0.01665
Train [48][220/3239]	Time 0.254 (0.650)	Data Time 0.001 (0.185)	Loss 2.8441 (2.7861)	Entropy 0.63272 (0.63220)	Top-1 acc 57.031 (56.953)	Top-5 acc 77.734 (78.966)	lr 0.01665
Train [48][230/3239]	Time 0.268 (0.641)	Data Time 0.001 (0.177)	Loss 2.7210 (2.7871)	Entropy 0.63282 (0.63222)	Top-1 acc 60.156 (56.938)	Top-5 acc 80.859 (78.938)	lr 0.01665
Train [48][240/3239]	Time 0.279 (0.632)	Data Time 0.001 (0.169)	Loss 2.5541 (2.7854)	Entropy 0.63314 (0.63225)	Top-1 acc 61.719 (56.970)	Top-5 acc 83.984 (78.978)	lr 0.01665
Train [48][250/3239]	Time 0.238 (0.626)	Data Time 0.001 (0.163)	Loss 2.8642 (2.7848)	Entropy 0.63256 (0.63227)	Top-1 acc 54.688 (56.966)	Top-5 acc 77.734 (78.992)	lr 0.01665
Train [48][260/3239]	Time 0.245 (0.619)	Data Time 0.001 (0.157)	Loss 2.8568 (2.7855)	Entropy 0.63263 (0.63228)	Top-1 acc 53.906 (56.968)	Top-5 acc 77.734 (78.950)	lr 0.01665
Train [48][270/3239]	Time 0.243 (0.613)	Data Time 0.001 (0.151)	Loss 2.8052 (2.7819)	Entropy 0.63271 (0.63230)	Top-1 acc 55.469 (57.034)	Top-5 acc 77.734 (79.003)	lr 0.01665
Train [48][280/3239]	Time 0.245 (0.607)	Data Time 0.001 (0.146)	Loss 2.4450 (2.7821)	Entropy 0.63240 (0.63231)	Top-1 acc 62.109 (57.035)	Top-5 acc 84.375 (79.001)	lr 0.01665
Train [48][290/3239]	Time 0.243 (0.603)	Data Time 0.001 (0.141)	Loss 2.7371 (2.7818)	Entropy 0.63252 (0.63232)	Top-1 acc 62.109 (57.030)	Top-5 acc 76.953 (78.985)	lr 0.01664
Train [48][300/3239]	Time 0.307 (0.598)	Data Time 0.002 (0.136)	Loss 2.8695 (2.7820)	Entropy 0.63211 (0.63232)	Top-1 acc 50.781 (57.035)	Top-5 acc 79.297 (78.991)	lr 0.01664
Train [48][310/3239]	Time 0.431 (0.715)	Data Time 0.003 (0.132)	Loss 2.7263 (2.7805)	Entropy 0.63219 (0.63231)	Top-1 acc 59.766 (57.039)	Top-5 acc 77.734 (79.000)	lr 0.01664
Train [48][320/3239]	Time 0.243 (0.706)	Data Time 0.002 (0.128)	Loss 2.7907 (2.7812)	Entropy 0.63190 (0.63231)	Top-1 acc 59.766 (57.030)	Top-5 acc 76.562 (78.965)	lr 0.01664
Train [48][330/3239]	Time 0.241 (0.698)	Data Time 0.002 (0.124)	Loss 2.9024 (2.7806)	Entropy 0.63204 (0.63230)	Top-1 acc 52.344 (57.049)	Top-5 acc 76.953 (78.985)	lr 0.01664
Train [48][340/3239]	Time 0.234 (0.691)	Data Time 0.001 (0.120)	Loss 2.6323 (2.7797)	Entropy 0.63187 (0.63229)	Top-1 acc 63.281 (57.098)	Top-5 acc 80.469 (78.969)	lr 0.01664
Train [48][350/3239]	Time 0.250 (0.684)	Data Time 0.001 (0.117)	Loss 2.8579 (2.7792)	Entropy 0.63185 (0.63228)	Top-1 acc 57.812 (57.109)	Top-5 acc 78.906 (78.972)	lr 0.01664
Train [48][360/3239]	Time 0.278 (0.678)	Data Time 0.001 (0.114)	Loss 2.9345 (2.7798)	Entropy 0.63155 (0.63226)	Top-1 acc 55.469 (57.094)	Top-5 acc 78.516 (78.982)	lr 0.01664
Train [48][370/3239]	Time 0.270 (0.673)	Data Time 0.001 (0.111)	Loss 2.8896 (2.7802)	Entropy 0.63178 (0.63224)	Top-1 acc 51.562 (57.057)	Top-5 acc 76.172 (78.994)	lr 0.01664
Train [48][380/3239]	Time 0.258 (0.668)	Data Time 0.001 (0.108)	Loss 2.9057 (2.7808)	Entropy 0.63178 (0.63223)	Top-1 acc 54.297 (57.028)	Top-5 acc 78.906 (78.991)	lr 0.01664
Train [48][390/3239]	Time 0.318 (0.662)	Data Time 0.001 (0.105)	Loss 2.8382 (2.7818)	Entropy 0.63194 (0.63222)	Top-1 acc 56.641 (57.004)	Top-5 acc 76.172 (78.970)	lr 0.01664
Train [48][400/3239]	Time 0.347 (0.657)	Data Time 0.001 (0.103)	Loss 3.0163 (2.7839)	Entropy 0.63218 (0.63222)	Top-1 acc 52.734 (56.951)	Top-5 acc 75.000 (78.932)	lr 0.01663
Train [48][410/3239]	Time 0.229 (0.652)	Data Time 0.001 (0.100)	Loss 2.9047 (2.7835)	Entropy 0.63202 (0.63221)	Top-1 acc 52.734 (56.962)	Top-5 acc 75.000 (78.937)	lr 0.01663
Train [48][420/3239]	Time 0.310 (0.647)	Data Time 0.001 (0.098)	Loss 2.6645 (2.7818)	Entropy 0.63188 (0.63221)	Top-1 acc 60.156 (56.997)	Top-5 acc 79.688 (78.967)	lr 0.01663
Train [48][430/3239]	Time 0.241 (0.643)	Data Time 0.001 (0.096)	Loss 2.6114 (2.7823)	Entropy 0.63194 (0.63220)	Top-1 acc 60.938 (56.980)	Top-5 acc 82.812 (78.981)	lr 0.01663
Train [48][440/3239]	Time 0.281 (0.639)	Data Time 0.003 (0.094)	Loss 2.6073 (2.7822)	Entropy 0.63186 (0.63220)	Top-1 acc 58.984 (56.973)	Top-5 acc 81.641 (78.984)	lr 0.01663
Train [48][450/3239]	Time 0.262 (0.636)	Data Time 0.001 (0.092)	Loss 2.7655 (2.7813)	Entropy 0.63192 (0.63219)	Top-1 acc 55.859 (56.975)	Top-5 acc 78.516 (79.011)	lr 0.01663
Train [48][460/3239]	Time 0.245 (0.632)	Data Time 0.001 (0.090)	Loss 2.7349 (2.7817)	Entropy 0.63156 (0.63218)	Top-1 acc 56.641 (56.980)	Top-5 acc 80.859 (79.003)	lr 0.01663
Train [48][470/3239]	Time 0.497 (0.629)	Data Time 0.001 (0.088)	Loss 2.6601 (2.7815)	Entropy 0.63154 (0.63217)	Top-1 acc 58.594 (56.985)	Top-5 acc 77.344 (78.996)	lr 0.01663
Train [48][480/3239]	Time 0.232 (0.626)	Data Time 0.001 (0.086)	Loss 2.9231 (2.7803)	Entropy 0.63154 (0.63215)	Top-1 acc 50.781 (57.009)	Top-5 acc 76.953 (79.029)	lr 0.01663
Train [48][490/3239]	Time 0.315 (0.622)	Data Time 0.001 (0.084)	Loss 2.8987 (2.7808)	Entropy 0.63183 (0.63214)	Top-1 acc 53.906 (56.990)	Top-5 acc 75.781 (79.018)	lr 0.01663
Train [48][500/3239]	Time 0.256 (0.619)	Data Time 0.002 (0.083)	Loss 3.1071 (2.7820)	Entropy 0.63209 (0.63214)	Top-1 acc 46.094 (56.969)	Top-5 acc 74.219 (78.997)	lr 0.01662
Train [48][510/3239]	Time 0.295 (0.616)	Data Time 0.002 (0.081)	Loss 2.6857 (2.7826)	Entropy 0.63209 (0.63214)	Top-1 acc 58.594 (56.962)	Top-5 acc 80.078 (78.983)	lr 0.01662
Train [48][520/3239]	Time 0.242 (0.613)	Data Time 0.001 (0.079)	Loss 2.7554 (2.7825)	Entropy 0.63229 (0.63214)	Top-1 acc 56.641 (56.968)	Top-5 acc 79.297 (78.999)	lr 0.01662
Train [48][530/3239]	Time 0.255 (0.610)	Data Time 0.001 (0.078)	Loss 2.9276 (2.7828)	Entropy 0.63274 (0.63214)	Top-1 acc 51.953 (56.970)	Top-5 acc 76.172 (78.987)	lr 0.01662
Train [48][540/3239]	Time 0.239 (0.607)	Data Time 0.001 (0.077)	Loss 2.7335 (2.7828)	Entropy 0.63246 (0.63216)	Top-1 acc 58.594 (56.964)	Top-5 acc 78.125 (78.985)	lr 0.01662
Train [48][550/3239]	Time 0.281 (0.605)	Data Time 0.001 (0.075)	Loss 2.9450 (2.7830)	Entropy 0.63215 (0.63216)	Top-1 acc 53.516 (56.972)	Top-5 acc 78.125 (78.976)	lr 0.01662
Train [48][560/3239]	Time 0.299 (0.603)	Data Time 0.001 (0.074)	Loss 2.6946 (2.7825)	Entropy 0.63226 (0.63216)	Top-1 acc 60.156 (56.989)	Top-5 acc 80.469 (78.994)	lr 0.01662
Train [48][570/3239]	Time 0.240 (0.600)	Data Time 0.001 (0.073)	Loss 2.7553 (2.7827)	Entropy 0.63223 (0.63216)	Top-1 acc 57.031 (56.987)	Top-5 acc 78.125 (78.991)	lr 0.01662
Train [48][580/3239]	Time 0.255 (0.598)	Data Time 0.001 (0.071)	Loss 3.0453 (2.7830)	Entropy 0.63231 (0.63216)	Top-1 acc 52.734 (56.972)	Top-5 acc 76.172 (78.996)	lr 0.01662
Train [48][590/3239]	Time 0.268 (0.597)	Data Time 0.001 (0.070)	Loss 2.6436 (2.7844)	Entropy 0.63244 (0.63217)	Top-1 acc 58.984 (56.933)	Top-5 acc 81.641 (78.978)	lr 0.01662
Train [48][600/3239]	Time 0.280 (0.595)	Data Time 0.001 (0.069)	Loss 2.8343 (2.7842)	Entropy 0.63258 (0.63217)	Top-1 acc 56.250 (56.926)	Top-5 acc 80.078 (78.987)	lr 0.01662
Train [48][610/3239]	Time 0.243 (0.592)	Data Time 0.001 (0.068)	Loss 2.6569 (2.7845)	Entropy 0.63275 (0.63218)	Top-1 acc 60.938 (56.914)	Top-5 acc 80.078 (78.976)	lr 0.01661
Train [48][620/3239]	Time 0.246 (0.590)	Data Time 0.001 (0.067)	Loss 2.9612 (2.7853)	Entropy 0.63272 (0.63219)	Top-1 acc 53.516 (56.893)	Top-5 acc 73.438 (78.958)	lr 0.01661
Train [48][630/3239]	Time 0.368 (0.588)	Data Time 0.001 (0.066)	Loss 2.7648 (2.7855)	Entropy 0.63297 (0.63220)	Top-1 acc 51.562 (56.873)	Top-5 acc 83.203 (78.956)	lr 0.01661
Train [48][640/3239]	Time 0.261 (0.586)	Data Time 0.001 (0.065)	Loss 2.5597 (2.7856)	Entropy 0.63337 (0.63221)	Top-1 acc 58.203 (56.865)	Top-5 acc 85.547 (78.962)	lr 0.01661
Train [48][650/3239]	Time 0.298 (0.584)	Data Time 0.002 (0.064)	Loss 2.6635 (2.7856)	Entropy 0.63314 (0.63223)	Top-1 acc 63.281 (56.878)	Top-5 acc 80.859 (78.952)	lr 0.01661
Train [48][660/3239]	Time 0.261 (0.582)	Data Time 0.001 (0.063)	Loss 2.9580 (2.7852)	Entropy 0.63345 (0.63225)	Top-1 acc 50.781 (56.891)	Top-5 acc 74.609 (78.948)	lr 0.01661
Train [48][670/3239]	Time 0.250 (0.580)	Data Time 0.001 (0.062)	Loss 3.0855 (2.7858)	Entropy 0.63365 (0.63226)	Top-1 acc 48.438 (56.879)	Top-5 acc 72.266 (78.935)	lr 0.01661
Train [48][680/3239]	Time 0.253 (0.579)	Data Time 0.001 (0.061)	Loss 3.0172 (2.7861)	Entropy 0.63356 (0.63229)	Top-1 acc 52.344 (56.874)	Top-5 acc 72.656 (78.910)	lr 0.01661
Train [48][690/3239]	Time 0.250 (0.577)	Data Time 0.001 (0.060)	Loss 2.9586 (2.7863)	Entropy 0.63387 (0.63231)	Top-1 acc 56.641 (56.876)	Top-5 acc 73.438 (78.906)	lr 0.01661
Train [48][700/3239]	Time 0.365 (0.575)	Data Time 0.001 (0.060)	Loss 2.7871 (2.7862)	Entropy 0.63379 (0.63233)	Top-1 acc 56.641 (56.886)	Top-5 acc 77.734 (78.913)	lr 0.01661
Train [48][710/3239]	Time 0.237 (0.573)	Data Time 0.001 (0.059)	Loss 2.7206 (2.7858)	Entropy 0.63367 (0.63235)	Top-1 acc 59.766 (56.901)	Top-5 acc 80.078 (78.920)	lr 0.01660
Train [48][720/3239]	Time 0.250 (0.571)	Data Time 0.001 (0.058)	Loss 2.6506 (2.7859)	Entropy 0.63336 (0.63236)	Top-1 acc 59.766 (56.904)	Top-5 acc 82.812 (78.920)	lr 0.01660
Train [48][730/3239]	Time 0.274 (0.570)	Data Time 0.001 (0.057)	Loss 2.7062 (2.7860)	Entropy 0.63330 (0.63238)	Top-1 acc 58.594 (56.902)	Top-5 acc 81.641 (78.917)	lr 0.01660
Train [48][740/3239]	Time 0.239 (0.570)	Data Time 0.001 (0.058)	Loss 2.6484 (2.7861)	Entropy 0.63314 (0.63239)	Top-1 acc 62.500 (56.903)	Top-5 acc 79.688 (78.910)	lr 0.01660
Train [48][750/3239]	Time 0.236 (0.568)	Data Time 0.001 (0.057)	Loss 2.8428 (2.7853)	Entropy 0.63316 (0.63240)	Top-1 acc 59.375 (56.921)	Top-5 acc 79.688 (78.929)	lr 0.01660
Train [48][760/3239]	Time 0.246 (0.567)	Data Time 0.001 (0.056)	Loss 2.7537 (2.7845)	Entropy 0.63321 (0.63241)	Top-1 acc 57.422 (56.938)	Top-5 acc 80.469 (78.941)	lr 0.01660
Train [48][770/3239]	Time 0.270 (0.572)	Data Time 0.001 (0.062)	Loss 2.6844 (2.7842)	Entropy 0.63317 (0.63242)	Top-1 acc 60.547 (56.950)	Top-5 acc 80.469 (78.941)	lr 0.01660
Train [48][780/3239]	Time 0.283 (0.570)	Data Time 0.002 (0.061)	Loss 2.7899 (2.7850)	Entropy 0.63296 (0.63243)	Top-1 acc 53.906 (56.924)	Top-5 acc 76.953 (78.920)	lr 0.01660
Train [48][790/3239]	Time 0.387 (0.568)	Data Time 0.001 (0.061)	Loss 2.7615 (2.7848)	Entropy 0.63304 (0.63244)	Top-1 acc 56.250 (56.931)	Top-5 acc 82.031 (78.924)	lr 0.01660
Train [48][800/3239]	Time 1.344 (0.568)	Data Time 1.103 (0.061)	Loss 2.6421 (2.7837)	Entropy 0.63314 (0.63244)	Top-1 acc 57.812 (56.962)	Top-5 acc 82.422 (78.949)	lr 0.01660
Train [48][810/3239]	Time 0.258 (0.571)	Data Time 0.001 (0.065)	Loss 2.8673 (2.7839)	Entropy 0.63373 (0.63245)	Top-1 acc 55.078 (56.947)	Top-5 acc 74.609 (78.945)	lr 0.01660
Train [48][820/3239]	Time 0.269 (0.570)	Data Time 0.001 (0.064)	Loss 2.9564 (2.7848)	Entropy 0.63368 (0.63247)	Top-1 acc 53.906 (56.933)	Top-5 acc 76.172 (78.924)	lr 0.01659
Train [48][830/3239]	Time 0.249 (0.569)	Data Time 0.001 (0.063)	Loss 2.6435 (2.7845)	Entropy 0.63375 (0.63248)	Top-1 acc 58.203 (56.928)	Top-5 acc 81.250 (78.931)	lr 0.01659
Train [48][840/3239]	Time 0.256 (0.569)	Data Time 0.001 (0.065)	Loss 2.8509 (2.7844)	Entropy 0.63392 (0.63250)	Top-1 acc 56.641 (56.928)	Top-5 acc 77.734 (78.945)	lr 0.01659
Train [48][850/3239]	Time 0.240 (0.568)	Data Time 0.002 (0.064)	Loss 2.8238 (2.7849)	Entropy 0.63394 (0.63252)	Top-1 acc 56.641 (56.922)	Top-5 acc 77.734 (78.934)	lr 0.01659
Train [48][860/3239]	Time 1.245 (0.568)	Data Time 0.866 (0.064)	Loss 2.8121 (2.7846)	Entropy 0.63407 (0.63253)	Top-1 acc 55.469 (56.923)	Top-5 acc 80.469 (78.939)	lr 0.01659
Train [48][870/3239]	Time 0.229 (0.570)	Data Time 0.001 (0.068)	Loss 2.8766 (2.7852)	Entropy 0.63449 (0.63255)	Top-1 acc 57.031 (56.916)	Top-5 acc 78.125 (78.927)	lr 0.01659
Train [48][880/3239]	Time 0.258 (0.569)	Data Time 0.001 (0.067)	Loss 2.7998 (2.7843)	Entropy 0.63468 (0.63257)	Top-1 acc 58.203 (56.944)	Top-5 acc 78.125 (78.943)	lr 0.01659
Train [48][890/3239]	Time 0.282 (0.568)	Data Time 0.001 (0.066)	Loss 2.9775 (2.7847)	Entropy 0.63459 (0.63260)	Top-1 acc 53.516 (56.943)	Top-5 acc 73.828 (78.929)	lr 0.01659
Train [48][900/3239]	Time 0.254 (0.571)	Data Time 0.001 (0.070)	Loss 2.8109 (2.7844)	Entropy 0.63450 (0.63262)	Top-1 acc 55.859 (56.952)	Top-5 acc 75.391 (78.935)	lr 0.01659
Train [48][910/3239]	Time 0.229 (0.569)	Data Time 0.002 (0.069)	Loss 2.7877 (2.7846)	Entropy 0.63465 (0.63264)	Top-1 acc 50.000 (56.931)	Top-5 acc 80.078 (78.935)	lr 0.01659
Train [48][920/3239]	Time 0.255 (0.568)	Data Time 0.001 (0.068)	Loss 2.5474 (2.7847)	Entropy 0.63435 (0.63266)	Top-1 acc 63.281 (56.926)	Top-5 acc 83.594 (78.935)	lr 0.01658
Train [48][930/3239]	Time 0.273 (0.575)	Data Time 0.002 (0.076)	Loss 2.6880 (2.7844)	Entropy 0.63445 (0.63268)	Top-1 acc 62.109 (56.936)	Top-5 acc 78.125 (78.937)	lr 0.01658
Train [48][940/3239]	Time 0.235 (0.574)	Data Time 0.001 (0.075)	Loss 2.8264 (2.7835)	Entropy 0.63426 (0.63269)	Top-1 acc 55.859 (56.947)	Top-5 acc 77.344 (78.955)	lr 0.01658
Train [48][950/3239]	Time 0.363 (0.572)	Data Time 0.001 (0.074)	Loss 2.6332 (2.7834)	Entropy 0.63451 (0.63271)	Top-1 acc 61.719 (56.944)	Top-5 acc 81.250 (78.957)	lr 0.01658
Train [48][960/3239]	Time 0.353 (0.612)	Data Time 0.052 (0.076)	Loss 2.6532 (2.7836)	Entropy 0.63400 (0.63273)	Top-1 acc 60.938 (56.942)	Top-5 acc 82.031 (78.955)	lr 0.01658
Train [48][970/3239]	Time 0.240 (0.612)	Data Time 0.002 (0.075)	Loss 2.9595 (2.7837)	Entropy 0.63438 (0.63274)	Top-1 acc 53.906 (56.943)	Top-5 acc 78.516 (78.957)	lr 0.01658
Train [48][980/3239]	Time 0.247 (0.610)	Data Time 0.001 (0.075)	Loss 2.8952 (2.7839)	Entropy 0.63447 (0.63276)	Top-1 acc 53.125 (56.937)	Top-5 acc 76.562 (78.957)	lr 0.01658
Train [48][990/3239]	Time 0.239 (0.608)	Data Time 0.001 (0.074)	Loss 2.6828 (2.7831)	Entropy 0.63468 (0.63278)	Top-1 acc 56.250 (56.947)	Top-5 acc 81.250 (78.977)	lr 0.01658
Train [48][1000/3239]	Time 0.246 (0.607)	Data Time 0.002 (0.073)	Loss 2.7794 (2.7842)	Entropy 0.63453 (0.63280)	Top-1 acc 57.812 (56.918)	Top-5 acc 77.344 (78.955)	lr 0.01658
Train [48][1010/3239]	Time 0.246 (0.605)	Data Time 0.001 (0.072)	Loss 2.8259 (2.7852)	Entropy 0.63443 (0.63281)	Top-1 acc 54.297 (56.896)	Top-5 acc 76.953 (78.936)	lr 0.01658
Train [48][1020/3239]	Time 0.396 (0.604)	Data Time 0.001 (0.072)	Loss 2.8051 (2.7854)	Entropy 0.63446 (0.63283)	Top-1 acc 56.250 (56.892)	Top-5 acc 79.297 (78.933)	lr 0.01658
Train [48][1030/3239]	Time 0.231 (0.602)	Data Time 0.001 (0.071)	Loss 2.5077 (2.7856)	Entropy 0.63458 (0.63284)	Top-1 acc 64.844 (56.887)	Top-5 acc 83.984 (78.936)	lr 0.01657
Train [48][1040/3239]	Time 0.239 (0.600)	Data Time 0.001 (0.070)	Loss 2.5884 (2.7851)	Entropy 0.63471 (0.63286)	Top-1 acc 60.156 (56.898)	Top-5 acc 83.594 (78.947)	lr 0.01657
Train [48][1050/3239]	Time 0.335 (0.599)	Data Time 0.002 (0.070)	Loss 2.8036 (2.7853)	Entropy 0.63462 (0.63288)	Top-1 acc 53.516 (56.904)	Top-5 acc 77.734 (78.947)	lr 0.01657
Train [48][1060/3239]	Time 0.310 (0.601)	Data Time 0.001 (0.073)	Loss 2.7090 (2.7857)	Entropy 0.63474 (0.63290)	Top-1 acc 59.766 (56.898)	Top-5 acc 77.734 (78.930)	lr 0.01657
Train [48][1070/3239]	Time 0.245 (0.600)	Data Time 0.001 (0.072)	Loss 2.7331 (2.7859)	Entropy 0.63500 (0.63291)	Top-1 acc 57.031 (56.895)	Top-5 acc 79.688 (78.926)	lr 0.01657
Train [48][1080/3239]	Time 0.241 (0.599)	Data Time 0.001 (0.071)	Loss 2.8683 (2.7865)	Entropy 0.63498 (0.63293)	Top-1 acc 53.125 (56.874)	Top-5 acc 76.953 (78.912)	lr 0.01657
Train [48][1090/3239]	Time 0.246 (0.597)	Data Time 0.001 (0.071)	Loss 3.2223 (2.7873)	Entropy 0.63473 (0.63295)	Top-1 acc 48.828 (56.858)	Top-5 acc 68.750 (78.895)	lr 0.01657
Train [48][1100/3239]	Time 0.248 (0.601)	Data Time 0.001 (0.075)	Loss 2.8267 (2.7875)	Entropy 0.63410 (0.63296)	Top-1 acc 55.859 (56.852)	Top-5 acc 79.688 (78.894)	lr 0.01657
Train [48][1110/3239]	Time 0.287 (0.600)	Data Time 0.001 (0.074)	Loss 2.6340 (2.7872)	Entropy 0.63435 (0.63298)	Top-1 acc 57.422 (56.853)	Top-5 acc 80.469 (78.899)	lr 0.01657
Train [48][1120/3239]	Time 0.258 (0.598)	Data Time 0.001 (0.074)	Loss 2.5632 (2.7865)	Entropy 0.63456 (0.63299)	Top-1 acc 62.109 (56.871)	Top-5 acc 83.594 (78.909)	lr 0.01657
Train [48][1130/3239]	Time 0.240 (0.605)	Data Time 0.001 (0.081)	Loss 2.7403 (2.7863)	Entropy 0.63447 (0.63300)	Top-1 acc 56.250 (56.884)	Top-5 acc 78.516 (78.915)	lr 0.01656
Train [48][1140/3239]	Time 0.252 (0.604)	Data Time 0.001 (0.080)	Loss 2.8835 (2.7869)	Entropy 0.63436 (0.63301)	Top-1 acc 53.125 (56.865)	Top-5 acc 73.828 (78.898)	lr 0.01656
Train [48][1150/3239]	Time 0.264 (0.602)	Data Time 0.001 (0.080)	Loss 3.0107 (2.7871)	Entropy 0.63426 (0.63302)	Top-1 acc 50.000 (56.849)	Top-5 acc 75.391 (78.894)	lr 0.01656
Train [48][1160/3239]	Time 0.236 (0.609)	Data Time 0.001 (0.087)	Loss 2.8450 (2.7866)	Entropy 0.63436 (0.63304)	Top-1 acc 58.984 (56.856)	Top-5 acc 78.125 (78.905)	lr 0.01656
Train [48][1170/3239]	Time 0.240 (0.607)	Data Time 0.001 (0.086)	Loss 2.9535 (2.7862)	Entropy 0.63393 (0.63305)	Top-1 acc 53.125 (56.868)	Top-5 acc 75.000 (78.913)	lr 0.01656
Train [48][1180/3239]	Time 0.348 (0.606)	Data Time 0.001 (0.085)	Loss 2.7378 (2.7856)	Entropy 0.63376 (0.63305)	Top-1 acc 58.203 (56.887)	Top-5 acc 80.078 (78.923)	lr 0.01656
Train [48][1190/3239]	Time 0.243 (0.613)	Data Time 0.001 (0.093)	Loss 2.7743 (2.7852)	Entropy 0.63364 (0.63306)	Top-1 acc 52.344 (56.891)	Top-5 acc 80.078 (78.929)	lr 0.01656
Train [48][1200/3239]	Time 0.238 (0.612)	Data Time 0.001 (0.092)	Loss 2.7888 (2.7848)	Entropy 0.63301 (0.63306)	Top-1 acc 57.031 (56.898)	Top-5 acc 78.516 (78.941)	lr 0.01656
Train [48][1210/3239]	Time 0.236 (0.610)	Data Time 0.001 (0.092)	Loss 2.7438 (2.7844)	Entropy 0.63296 (0.63306)	Top-1 acc 55.078 (56.907)	Top-5 acc 81.250 (78.942)	lr 0.01656
Train [48][1220/3239]	Time 0.251 (0.617)	Data Time 0.001 (0.099)	Loss 2.7432 (2.7845)	Entropy 0.63305 (0.63306)	Top-1 acc 60.938 (56.905)	Top-5 acc 77.344 (78.932)	lr 0.01656
Train [48][1230/3239]	Time 0.241 (0.615)	Data Time 0.001 (0.098)	Loss 2.7008 (2.7842)	Entropy 0.63312 (0.63306)	Top-1 acc 57.422 (56.911)	Top-5 acc 79.297 (78.940)	lr 0.01656
Train [48][1240/3239]	Time 0.254 (0.616)	Data Time 0.001 (0.099)	Loss 2.7351 (2.7843)	Entropy 0.63307 (0.63306)	Top-1 acc 57.812 (56.908)	Top-5 acc 79.297 (78.937)	lr 0.01655
Train [48][1250/3239]	Time 0.356 (0.615)	Data Time 0.001 (0.098)	Loss 2.9324 (2.7844)	Entropy 0.63331 (0.63306)	Top-1 acc 50.000 (56.902)	Top-5 acc 75.781 (78.934)	lr 0.01655
Train [48][1260/3239]	Time 0.243 (0.620)	Data Time 0.001 (0.104)	Loss 2.7930 (2.7851)	Entropy 0.63308 (0.63306)	Top-1 acc 57.031 (56.885)	Top-5 acc 78.516 (78.925)	lr 0.01655
Train [48][1270/3239]	Time 0.230 (0.619)	Data Time 0.001 (0.104)	Loss 2.5720 (2.7851)	Entropy 0.63308 (0.63306)	Top-1 acc 62.500 (56.889)	Top-5 acc 82.422 (78.933)	lr 0.01655
Train [48][1280/3239]	Time 0.254 (0.618)	Data Time 0.001 (0.103)	Loss 2.7301 (2.7851)	Entropy 0.63319 (0.63306)	Top-1 acc 59.766 (56.892)	Top-5 acc 78.125 (78.923)	lr 0.01655
Train [48][1290/3239]	Time 0.259 (0.627)	Data Time 0.001 (0.112)	Loss 2.8710 (2.7853)	Entropy 0.63315 (0.63306)	Top-1 acc 56.641 (56.894)	Top-5 acc 78.516 (78.925)	lr 0.01655
Train [48][1300/3239]	Time 0.240 (0.626)	Data Time 0.001 (0.112)	Loss 2.7345 (2.7854)	Entropy 0.63327 (0.63307)	Top-1 acc 57.031 (56.891)	Top-5 acc 80.469 (78.921)	lr 0.01655
Train [48][1310/3239]	Time 0.228 (0.626)	Data Time 0.001 (0.113)	Loss 2.7141 (2.7854)	Entropy 0.63318 (0.63307)	Top-1 acc 61.328 (56.898)	Top-5 acc 80.859 (78.927)	lr 0.01655
Train [48][1320/3239]	Time 0.242 (0.634)	Data Time 0.001 (0.122)	Loss 2.9786 (2.7855)	Entropy 0.63329 (0.63307)	Top-1 acc 55.469 (56.892)	Top-5 acc 75.781 (78.927)	lr 0.01655
Train [48][1330/3239]	Time 0.239 (0.635)	Data Time 0.001 (0.122)	Loss 2.7615 (2.7850)	Entropy 0.63367 (0.63307)	Top-1 acc 53.516 (56.901)	Top-5 acc 81.250 (78.934)	lr 0.01655
Train [48][1340/3239]	Time 0.374 (0.635)	Data Time 0.001 (0.124)	Loss 2.6886 (2.7848)	Entropy 0.63338 (0.63307)	Top-1 acc 58.984 (56.895)	Top-5 acc 79.297 (78.941)	lr 0.01654
Train [48][1350/3239]	Time 0.223 (0.640)	Data Time 0.001 (0.129)	Loss 2.8338 (2.7854)	Entropy 0.63378 (0.63308)	Top-1 acc 55.078 (56.880)	Top-5 acc 76.953 (78.933)	lr 0.01654
Train [48][1360/3239]	Time 0.243 (0.641)	Data Time 0.001 (0.131)	Loss 2.6728 (2.7851)	Entropy 0.63398 (0.63308)	Top-1 acc 57.812 (56.884)	Top-5 acc 80.859 (78.936)	lr 0.01654
Train [48][1370/3239]	Time 0.234 (0.640)	Data Time 0.001 (0.130)	Loss 2.7731 (2.7845)	Entropy 0.63418 (0.63309)	Top-1 acc 61.328 (56.907)	Top-5 acc 78.906 (78.946)	lr 0.01654
Train [48][1380/3239]	Time 0.242 (0.638)	Data Time 0.002 (0.129)	Loss 2.6964 (2.7842)	Entropy 0.63412 (0.63310)	Top-1 acc 60.156 (56.918)	Top-5 acc 79.688 (78.949)	lr 0.01654
Train [48][1390/3239]	Time 0.277 (0.646)	Data Time 0.002 (0.137)	Loss 2.8485 (2.7845)	Entropy 0.63384 (0.63310)	Top-1 acc 52.734 (56.908)	Top-5 acc 75.391 (78.943)	lr 0.01654
Train [48][1400/3239]	Time 0.254 (0.644)	Data Time 0.001 (0.136)	Loss 2.8016 (2.7838)	Entropy 0.63381 (0.63311)	Top-1 acc 55.469 (56.921)	Top-5 acc 77.344 (78.952)	lr 0.01654
Train [48][1410/3239]	Time 0.345 (0.643)	Data Time 0.001 (0.135)	Loss 2.6872 (2.7838)	Entropy 0.63405 (0.63311)	Top-1 acc 58.594 (56.919)	Top-5 acc 78.125 (78.945)	lr 0.01654
Train [48][1420/3239]	Time 0.239 (0.649)	Data Time 0.001 (0.141)	Loss 2.7689 (2.7836)	Entropy 0.63410 (0.63312)	Top-1 acc 55.859 (56.925)	Top-5 acc 78.906 (78.946)	lr 0.01654
Train [48][1430/3239]	Time 0.243 (0.647)	Data Time 0.002 (0.140)	Loss 2.7444 (2.7835)	Entropy 0.63419 (0.63313)	Top-1 acc 62.500 (56.931)	Top-5 acc 77.734 (78.943)	lr 0.01654
Train [48][1440/3239]	Time 0.245 (0.646)	Data Time 0.001 (0.139)	Loss 2.6649 (2.7835)	Entropy 0.63411 (0.63313)	Top-1 acc 58.984 (56.927)	Top-5 acc 80.469 (78.943)	lr 0.01654
Train [48][1450/3239]	Time 0.243 (0.652)	Data Time 0.002 (0.146)	Loss 2.8775 (2.7835)	Entropy 0.63401 (0.63314)	Top-1 acc 56.641 (56.924)	Top-5 acc 74.219 (78.940)	lr 0.01653
Train [48][1460/3239]	Time 0.242 (0.651)	Data Time 0.001 (0.145)	Loss 2.9461 (2.7838)	Entropy 0.63434 (0.63315)	Top-1 acc 55.078 (56.925)	Top-5 acc 73.828 (78.936)	lr 0.01653
Train [48][1470/3239]	Time 0.239 (0.649)	Data Time 0.001 (0.144)	Loss 2.8476 (2.7844)	Entropy 0.63443 (0.63316)	Top-1 acc 55.469 (56.897)	Top-5 acc 76.562 (78.920)	lr 0.01653
Train [48][1480/3239]	Time 0.260 (0.657)	Data Time 0.002 (0.152)	Loss 2.5956 (2.7844)	Entropy 0.63440 (0.63316)	Top-1 acc 61.719 (56.895)	Top-5 acc 83.203 (78.921)	lr 0.01653
Train [48][1490/3239]	Time 0.249 (0.656)	Data Time 0.001 (0.151)	Loss 3.0097 (2.7843)	Entropy 0.63434 (0.63317)	Top-1 acc 53.516 (56.893)	Top-5 acc 73.438 (78.918)	lr 0.01653
Train [48][1500/3239]	Time 0.353 (0.655)	Data Time 0.001 (0.151)	Loss 2.8165 (2.7839)	Entropy 0.63458 (0.63318)	Top-1 acc 58.594 (56.905)	Top-5 acc 78.906 (78.924)	lr 0.01653
Train [48][1510/3239]	Time 0.238 (0.658)	Data Time 0.001 (0.154)	Loss 2.8368 (2.7842)	Entropy 0.63458 (0.63319)	Top-1 acc 55.859 (56.900)	Top-5 acc 76.953 (78.919)	lr 0.01653
Train [48][1520/3239]	Time 0.252 (0.661)	Data Time 0.001 (0.158)	Loss 2.8053 (2.7841)	Entropy 0.63475 (0.63320)	Top-1 acc 53.516 (56.905)	Top-5 acc 77.734 (78.928)	lr 0.01653
Train [48][1530/3239]	Time 0.233 (0.660)	Data Time 0.001 (0.157)	Loss 2.9723 (2.7843)	Entropy 0.63483 (0.63321)	Top-1 acc 57.812 (56.902)	Top-5 acc 73.438 (78.924)	lr 0.01653
Train [48][1540/3239]	Time 0.252 (0.659)	Data Time 0.011 (0.156)	Loss 3.0177 (2.7849)	Entropy 0.63452 (0.63322)	Top-1 acc 48.828 (56.884)	Top-5 acc 74.219 (78.910)	lr 0.01653
Train [48][1550/3239]	Time 0.273 (0.663)	Data Time 0.002 (0.160)	Loss 2.8856 (2.7848)	Entropy 0.63470 (0.63323)	Top-1 acc 52.344 (56.880)	Top-5 acc 76.562 (78.911)	lr 0.01652
Train [48][1560/3239]	Time 0.238 (0.665)	Data Time 0.001 (0.163)	Loss 2.8305 (2.7849)	Entropy 0.63470 (0.63324)	Top-1 acc 53.906 (56.882)	Top-5 acc 77.734 (78.902)	lr 0.01652
Train [48][1570/3239]	Time 0.344 (0.663)	Data Time 0.001 (0.162)	Loss 2.9719 (2.7850)	Entropy 0.63459 (0.63325)	Top-1 acc 52.734 (56.881)	Top-5 acc 77.734 (78.901)	lr 0.01652
Train [48][1580/3239]	Time 0.258 (0.668)	Data Time 0.001 (0.167)	Loss 2.7674 (2.7854)	Entropy 0.63467 (0.63326)	Top-1 acc 55.078 (56.876)	Top-5 acc 80.078 (78.895)	lr 0.01652
Train [48][1590/3239]	Time 0.254 (0.671)	Data Time 0.001 (0.170)	Loss 2.7787 (2.7852)	Entropy 0.63470 (0.63327)	Top-1 acc 54.688 (56.882)	Top-5 acc 80.859 (78.898)	lr 0.01652
Train [48][1600/3239]	Time 0.235 (0.670)	Data Time 0.001 (0.169)	Loss 2.9775 (2.7851)	Entropy 0.63476 (0.63327)	Top-1 acc 50.391 (56.881)	Top-5 acc 75.781 (78.900)	lr 0.01652
Train [48][1610/3239]	Time 0.247 (0.675)	Data Time 0.001 (0.175)	Loss 3.0136 (2.7854)	Entropy 0.63490 (0.63328)	Top-1 acc 51.562 (56.873)	Top-5 acc 74.609 (78.896)	lr 0.01652
Train [48][1620/3239]	Time 0.326 (0.696)	Data Time 0.004 (0.174)	Loss 2.6658 (2.7857)	Entropy 0.63489 (0.63329)	Top-1 acc 60.938 (56.871)	Top-5 acc 80.469 (78.889)	lr 0.01652
Train [48][1630/3239]	Time 0.248 (0.695)	Data Time 0.002 (0.173)	Loss 2.9230 (2.7859)	Entropy 0.63508 (0.63330)	Top-1 acc 54.688 (56.867)	Top-5 acc 78.125 (78.886)	lr 0.01652
Train [48][1640/3239]	Time 0.245 (0.693)	Data Time 0.001 (0.172)	Loss 3.1959 (2.7860)	Entropy 0.63520 (0.63332)	Top-1 acc 49.219 (56.865)	Top-5 acc 71.875 (78.891)	lr 0.01652
Train [48][1650/3239]	Time 0.256 (0.692)	Data Time 0.001 (0.171)	Loss 2.6873 (2.7856)	Entropy 0.63497 (0.63333)	Top-1 acc 60.547 (56.873)	Top-5 acc 81.641 (78.897)	lr 0.01652
Train [48][1660/3239]	Time 0.352 (0.690)	Data Time 0.001 (0.170)	Loss 2.6881 (2.7858)	Entropy 0.63506 (0.63334)	Top-1 acc 58.203 (56.869)	Top-5 acc 79.688 (78.889)	lr 0.01651
Train [48][1670/3239]	Time 0.241 (0.688)	Data Time 0.001 (0.169)	Loss 2.9809 (2.7858)	Entropy 0.63489 (0.63335)	Top-1 acc 55.078 (56.867)	Top-5 acc 69.922 (78.882)	lr 0.01651
Train [48][1680/3239]	Time 0.235 (0.687)	Data Time 0.001 (0.168)	Loss 2.6425 (2.7854)	Entropy 0.63521 (0.63336)	Top-1 acc 63.281 (56.876)	Top-5 acc 80.859 (78.892)	lr 0.01651
Train [48][1690/3239]	Time 0.227 (0.689)	Data Time 0.001 (0.170)	Loss 2.9538 (2.7854)	Entropy 0.63526 (0.63337)	Top-1 acc 55.078 (56.883)	Top-5 acc 76.953 (78.895)	lr 0.01651
Train [48][1700/3239]	Time 0.244 (0.689)	Data Time 0.001 (0.171)	Loss 2.7850 (2.7854)	Entropy 0.63521 (0.63338)	Top-1 acc 54.297 (56.884)	Top-5 acc 78.516 (78.890)	lr 0.01651
Train [48][1710/3239]	Time 0.263 (0.688)	Data Time 0.001 (0.170)	Loss 2.8092 (2.7855)	Entropy 0.63497 (0.63339)	Top-1 acc 57.812 (56.880)	Top-5 acc 78.125 (78.886)	lr 0.01651
Train [48][1720/3239]	Time 2.760 (0.696)	Data Time 2.504 (0.178)	Loss 2.8748 (2.7855)	Entropy 0.63505 (0.63340)	Top-1 acc 54.297 (56.880)	Top-5 acc 79.688 (78.890)	lr 0.01651
Train [48][1730/3239]	Time 0.361 (0.696)	Data Time 0.001 (0.179)	Loss 2.8280 (2.7855)	Entropy 0.63525 (0.63341)	Top-1 acc 55.078 (56.881)	Top-5 acc 76.172 (78.887)	lr 0.01651
Train [48][1740/3239]	Time 0.252 (0.697)	Data Time 0.001 (0.180)	Loss 2.8947 (2.7860)	Entropy 0.63493 (0.63342)	Top-1 acc 53.516 (56.873)	Top-5 acc 76.953 (78.877)	lr 0.01651
Train [48][1750/3239]	Time 1.442 (0.703)	Data Time 1.181 (0.187)	Loss 2.7281 (2.7856)	Entropy 0.63490 (0.63343)	Top-1 acc 57.812 (56.884)	Top-5 acc 80.859 (78.884)	lr 0.01651
Train [48][1760/3239]	Time 0.269 (0.703)	Data Time 0.001 (0.186)	Loss 2.8313 (2.7856)	Entropy 0.63450 (0.63343)	Top-1 acc 56.641 (56.878)	Top-5 acc 76.953 (78.891)	lr 0.01650
Train [48][1770/3239]	Time 0.261 (0.704)	Data Time 0.001 (0.189)	Loss 2.9116 (2.7862)	Entropy 0.63473 (0.63344)	Top-1 acc 55.469 (56.870)	Top-5 acc 76.562 (78.882)	lr 0.01650
Train [48][1780/3239]	Time 3.489 (0.709)	Data Time 3.203 (0.194)	Loss 3.0220 (2.7863)	Entropy 0.63508 (0.63345)	Top-1 acc 49.609 (56.867)	Top-5 acc 72.266 (78.874)	lr 0.01650
Train [48][1790/3239]	Time 0.243 (0.710)	Data Time 0.001 (0.195)	Loss 2.7684 (2.7861)	Entropy 0.63522 (0.63346)	Top-1 acc 59.375 (56.867)	Top-5 acc 78.906 (78.877)	lr 0.01650
Train [48][1800/3239]	Time 0.236 (0.711)	Data Time 0.001 (0.196)	Loss 2.7439 (2.7863)	Entropy 0.63550 (0.63347)	Top-1 acc 58.594 (56.863)	Top-5 acc 78.906 (78.873)	lr 0.01650
Train [48][1810/3239]	Time 0.246 (0.714)	Data Time 0.001 (0.200)	Loss 2.8206 (2.7864)	Entropy 0.63579 (0.63348)	Top-1 acc 53.125 (56.859)	Top-5 acc 80.078 (78.875)	lr 0.01650
Train [48][1820/3239]	Time 0.277 (0.717)	Data Time 0.001 (0.203)	Loss 2.8928 (2.7863)	Entropy 0.63589 (0.63349)	Top-1 acc 52.734 (56.855)	Top-5 acc 80.078 (78.878)	lr 0.01650
Train [48][1830/3239]	Time 0.243 (0.718)	Data Time 0.001 (0.204)	Loss 2.7517 (2.7862)	Entropy 0.63540 (0.63351)	Top-1 acc 59.766 (56.862)	Top-5 acc 80.859 (78.879)	lr 0.01650
Train [48][1840/3239]	Time 1.935 (0.721)	Data Time 1.676 (0.208)	Loss 2.7970 (2.7863)	Entropy 0.63557 (0.63352)	Top-1 acc 54.688 (56.859)	Top-5 acc 78.906 (78.873)	lr 0.01650
Train [48][1850/3239]	Time 0.242 (0.726)	Data Time 0.001 (0.213)	Loss 2.7236 (2.7861)	Entropy 0.63582 (0.63353)	Top-1 acc 52.344 (56.856)	Top-5 acc 80.078 (78.881)	lr 0.01650
Train [48][1860/3239]	Time 0.852 (0.725)	Data Time 0.600 (0.213)	Loss 2.9021 (2.7863)	Entropy 0.63605 (0.63354)	Top-1 acc 55.078 (56.851)	Top-5 acc 77.734 (78.876)	lr 0.01650
Train [48][1870/3239]	Time 0.249 (0.724)	Data Time 0.001 (0.212)	Loss 2.6972 (2.7863)	Entropy 0.63592 (0.63355)	Top-1 acc 60.938 (56.854)	Top-5 acc 81.250 (78.877)	lr 0.01649
Train [48][1880/3239]	Time 0.235 (0.734)	Data Time 0.001 (0.222)	Loss 2.9731 (2.7865)	Entropy 0.63635 (0.63357)	Top-1 acc 54.688 (56.851)	Top-5 acc 75.000 (78.872)	lr 0.01649
Train [48][1890/3239]	Time 0.369 (0.732)	Data Time 0.001 (0.221)	Loss 2.6980 (2.7867)	Entropy 0.63629 (0.63358)	Top-1 acc 57.422 (56.849)	Top-5 acc 82.031 (78.872)	lr 0.01649
Train [48][1900/3239]	Time 0.234 (0.732)	Data Time 0.001 (0.221)	Loss 2.6838 (2.7869)	Entropy 0.63614 (0.63360)	Top-1 acc 57.422 (56.845)	Top-5 acc 81.250 (78.869)	lr 0.01649
Train [48][1910/3239]	Time 3.378 (0.743)	Data Time 3.129 (0.232)	Loss 2.8164 (2.7870)	Entropy 0.63599 (0.63361)	Top-1 acc 56.641 (56.843)	Top-5 acc 76.562 (78.867)	lr 0.01649
Train [48][1920/3239]	Time 0.288 (0.741)	Data Time 0.001 (0.231)	Loss 2.8643 (2.7871)	Entropy 0.63614 (0.63362)	Top-1 acc 54.688 (56.838)	Top-5 acc 81.250 (78.868)	lr 0.01649
Train [48][1930/3239]	Time 0.234 (0.741)	Data Time 0.001 (0.232)	Loss 3.0306 (2.7873)	Entropy 0.63624 (0.63363)	Top-1 acc 50.391 (56.831)	Top-5 acc 73.828 (78.866)	lr 0.01649
Train [48][1940/3239]	Time 7.728 (0.749)	Data Time 7.481 (0.240)	Loss 2.8201 (2.7875)	Entropy 0.63603 (0.63365)	Top-1 acc 60.938 (56.832)	Top-5 acc 75.000 (78.860)	lr 0.01649
Train [48][1950/3239]	Time 0.230 (0.750)	Data Time 0.001 (0.241)	Loss 2.6756 (2.7873)	Entropy 0.63606 (0.63366)	Top-1 acc 57.812 (56.834)	Top-5 acc 81.250 (78.863)	lr 0.01649
Train [48][1960/3239]	Time 0.404 (0.749)	Data Time 0.001 (0.241)	Loss 2.7051 (2.7872)	Entropy 0.63576 (0.63367)	Top-1 acc 62.891 (56.836)	Top-5 acc 78.125 (78.862)	lr 0.01649
Train [48][1970/3239]	Time 0.236 (0.754)	Data Time 0.001 (0.246)	Loss 2.6612 (2.7871)	Entropy 0.63577 (0.63368)	Top-1 acc 60.547 (56.842)	Top-5 acc 82.422 (78.863)	lr 0.01648
Train [48][1980/3239]	Time 0.249 (0.757)	Data Time 0.001 (0.250)	Loss 2.8702 (2.7871)	Entropy 0.63600 (0.63369)	Top-1 acc 51.953 (56.835)	Top-5 acc 78.906 (78.867)	lr 0.01648
Train [48][1990/3239]	Time 6.149 (0.759)	Data Time 5.891 (0.252)	Loss 2.7259 (2.7870)	Entropy 0.63646 (0.63370)	Top-1 acc 56.641 (56.834)	Top-5 acc 80.859 (78.873)	lr 0.01648
Train [48][2000/3239]	Time 0.287 (0.763)	Data Time 0.001 (0.256)	Loss 2.7599 (2.7871)	Entropy 0.63673 (0.63372)	Top-1 acc 56.250 (56.830)	Top-5 acc 77.734 (78.869)	lr 0.01648
Train [48][2010/3239]	Time 0.250 (0.766)	Data Time 0.001 (0.259)	Loss 2.6478 (2.7875)	Entropy 0.63681 (0.63373)	Top-1 acc 58.594 (56.825)	Top-5 acc 78.906 (78.864)	lr 0.01648
Train [48][2020/3239]	Time 0.235 (0.764)	Data Time 0.001 (0.258)	Loss 2.8555 (2.7876)	Entropy 0.63630 (0.63375)	Top-1 acc 52.344 (56.822)	Top-5 acc 76.562 (78.860)	lr 0.01648
Train [48][2030/3239]	Time 0.253 (0.764)	Data Time 0.001 (0.258)	Loss 2.8809 (2.7877)	Entropy 0.63618 (0.63376)	Top-1 acc 53.516 (56.820)	Top-5 acc 78.125 (78.856)	lr 0.01648
Train [48][2040/3239]	Time 0.279 (0.774)	Data Time 0.001 (0.269)	Loss 2.9491 (2.7878)	Entropy 0.63609 (0.63377)	Top-1 acc 49.609 (56.819)	Top-5 acc 74.609 (78.857)	lr 0.01648
Train [48][2050/3239]	Time 0.355 (0.773)	Data Time 0.001 (0.268)	Loss 2.7133 (2.7877)	Entropy 0.63558 (0.63378)	Top-1 acc 58.594 (56.821)	Top-5 acc 80.859 (78.859)	lr 0.01648
Train [48][2060/3239]	Time 0.244 (0.773)	Data Time 0.001 (0.268)	Loss 2.8393 (2.7876)	Entropy 0.63572 (0.63379)	Top-1 acc 57.812 (56.827)	Top-5 acc 75.391 (78.861)	lr 0.01648
Train [48][2070/3239]	Time 3.195 (0.782)	Data Time 2.950 (0.278)	Loss 2.9020 (2.7877)	Entropy 0.63588 (0.63380)	Top-1 acc 55.078 (56.826)	Top-5 acc 75.391 (78.862)	lr 0.01647
Train [48][2080/3239]	Time 0.283 (0.781)	Data Time 0.001 (0.276)	Loss 3.0049 (2.7879)	Entropy 0.63591 (0.63381)	Top-1 acc 48.047 (56.822)	Top-5 acc 75.391 (78.856)	lr 0.01647
Train [48][2090/3239]	Time 0.240 (0.781)	Data Time 0.001 (0.277)	Loss 2.5585 (2.7877)	Entropy 0.63595 (0.63382)	Top-1 acc 58.203 (56.825)	Top-5 acc 83.984 (78.862)	lr 0.01647
Train [48][2100/3239]	Time 0.241 (0.789)	Data Time 0.002 (0.285)	Loss 2.6293 (2.7880)	Entropy 0.63626 (0.63383)	Top-1 acc 60.156 (56.817)	Top-5 acc 82.422 (78.858)	lr 0.01647
Train [48][2110/3239]	Time 0.273 (0.787)	Data Time 0.001 (0.284)	Loss 2.7718 (2.7882)	Entropy 0.63617 (0.63385)	Top-1 acc 58.984 (56.808)	Top-5 acc 80.078 (78.848)	lr 0.01647
Train [48][2120/3239]	Time 0.357 (0.788)	Data Time 0.001 (0.285)	Loss 2.6753 (2.7880)	Entropy 0.63635 (0.63386)	Top-1 acc 58.594 (56.813)	Top-5 acc 82.031 (78.853)	lr 0.01647
Train [48][2130/3239]	Time 0.266 (0.797)	Data Time 0.001 (0.294)	Loss 2.8151 (2.7879)	Entropy 0.63659 (0.63387)	Top-1 acc 55.078 (56.820)	Top-5 acc 76.562 (78.852)	lr 0.01647
Train [48][2140/3239]	Time 0.247 (0.795)	Data Time 0.001 (0.293)	Loss 2.9290 (2.7881)	Entropy 0.63681 (0.63388)	Top-1 acc 57.031 (56.817)	Top-5 acc 74.219 (78.848)	lr 0.01647
Train [48][2150/3239]	Time 1.452 (0.794)	Data Time 1.198 (0.292)	Loss 2.7444 (2.7883)	Entropy 0.63706 (0.63390)	Top-1 acc 58.984 (56.808)	Top-5 acc 77.734 (78.841)	lr 0.01647
Train [48][2160/3239]	Time 0.263 (0.803)	Data Time 0.010 (0.302)	Loss 2.8549 (2.7885)	Entropy 0.63687 (0.63391)	Top-1 acc 53.906 (56.803)	Top-5 acc 76.953 (78.837)	lr 0.01647
Train [48][2170/3239]	Time 0.253 (0.803)	Data Time 0.001 (0.301)	Loss 3.1259 (2.7889)	Entropy 0.63667 (0.63392)	Top-1 acc 46.094 (56.795)	Top-5 acc 69.922 (78.829)	lr 0.01647
Train [48][2180/3239]	Time 0.254 (0.801)	Data Time 0.001 (0.300)	Loss 2.7746 (2.7887)	Entropy 0.63671 (0.63394)	Top-1 acc 57.422 (56.797)	Top-5 acc 80.078 (78.831)	lr 0.01646
Train [48][2190/3239]	Time 0.251 (0.802)	Data Time 0.002 (0.302)	Loss 2.8797 (2.7887)	Entropy 0.63679 (0.63395)	Top-1 acc 51.953 (56.795)	Top-5 acc 78.125 (78.831)	lr 0.01646
Train [48][2200/3239]	Time 0.241 (0.809)	Data Time 0.001 (0.309)	Loss 2.5842 (2.7887)	Entropy 0.63684 (0.63396)	Top-1 acc 60.938 (56.796)	Top-5 acc 82.812 (78.832)	lr 0.01646
Train [48][2210/3239]	Time 0.612 (0.809)	Data Time 0.333 (0.309)	Loss 2.8027 (2.7887)	Entropy 0.63696 (0.63398)	Top-1 acc 56.250 (56.796)	Top-5 acc 80.078 (78.836)	lr 0.01646
Train [48][2220/3239]	Time 0.247 (0.810)	Data Time 0.001 (0.310)	Loss 2.7022 (2.7884)	Entropy 0.63690 (0.63399)	Top-1 acc 56.250 (56.798)	Top-5 acc 79.688 (78.841)	lr 0.01646
Train [48][2230/3239]	Time 0.565 (0.816)	Data Time 0.288 (0.317)	Loss 2.7899 (2.7883)	Entropy 0.63672 (0.63400)	Top-1 acc 58.203 (56.801)	Top-5 acc 78.125 (78.843)	lr 0.01646
Train [48][2240/3239]	Time 0.253 (0.815)	Data Time 0.001 (0.315)	Loss 2.6297 (2.7882)	Entropy 0.63668 (0.63401)	Top-1 acc 58.594 (56.801)	Top-5 acc 82.812 (78.843)	lr 0.01646
Train [48][2250/3239]	Time 0.261 (0.816)	Data Time 0.001 (0.317)	Loss 2.9988 (2.7882)	Entropy 0.63683 (0.63403)	Top-1 acc 53.906 (56.804)	Top-5 acc 74.609 (78.845)	lr 0.01646
Train [48][2260/3239]	Time 0.235 (0.824)	Data Time 0.001 (0.325)	Loss 2.5694 (2.7884)	Entropy 0.63680 (0.63404)	Top-1 acc 65.625 (56.803)	Top-5 acc 82.812 (78.844)	lr 0.01646
Train [48][2270/3239]	Time 0.370 (0.838)	Data Time 0.004 (0.324)	Loss 2.8613 (2.7884)	Entropy 0.63693 (0.63405)	Top-1 acc 53.516 (56.800)	Top-5 acc 75.781 (78.843)	lr 0.01646
Train [48][2280/3239]	Time 0.379 (0.837)	Data Time 0.002 (0.322)	Loss 2.7481 (2.7884)	Entropy 0.63631 (0.63406)	Top-1 acc 57.031 (56.802)	Top-5 acc 82.422 (78.847)	lr 0.01645
Train [48][2290/3239]	Time 0.270 (0.835)	Data Time 0.002 (0.321)	Loss 2.6399 (2.7883)	Entropy 0.63619 (0.63407)	Top-1 acc 60.938 (56.805)	Top-5 acc 81.250 (78.847)	lr 0.01645
Train [48][2300/3239]	Time 0.260 (0.834)	Data Time 0.002 (0.319)	Loss 2.8880 (2.7884)	Entropy 0.63608 (0.63408)	Top-1 acc 53.906 (56.806)	Top-5 acc 77.344 (78.847)	lr 0.01645
Train [48][2310/3239]	Time 0.255 (0.832)	Data Time 0.001 (0.318)	Loss 2.6623 (2.7886)	Entropy 0.63632 (0.63409)	Top-1 acc 56.250 (56.803)	Top-5 acc 79.297 (78.842)	lr 0.01645
Train [48][2320/3239]	Time 0.239 (0.838)	Data Time 0.001 (0.324)	Loss 2.7099 (2.7885)	Entropy 0.63625 (0.63410)	Top-1 acc 59.375 (56.808)	Top-5 acc 78.516 (78.842)	lr 0.01645
Train [48][2330/3239]	Time 0.238 (0.836)	Data Time 0.001 (0.323)	Loss 2.7471 (2.7884)	Entropy 0.63642 (0.63411)	Top-1 acc 60.156 (56.813)	Top-5 acc 80.469 (78.845)	lr 0.01645
Train [48][2340/3239]	Time 0.228 (0.835)	Data Time 0.001 (0.322)	Loss 2.8972 (2.7888)	Entropy 0.63677 (0.63412)	Top-1 acc 58.594 (56.802)	Top-5 acc 73.828 (78.837)	lr 0.01645
Train [48][2350/3239]	Time 0.254 (0.834)	Data Time 0.001 (0.321)	Loss 2.8273 (2.7887)	Entropy 0.63671 (0.63413)	Top-1 acc 56.250 (56.807)	Top-5 acc 77.734 (78.839)	lr 0.01645
Train [48][2360/3239]	Time 0.243 (0.841)	Data Time 0.001 (0.329)	Loss 2.9323 (2.7889)	Entropy 0.63676 (0.63414)	Top-1 acc 57.422 (56.808)	Top-5 acc 76.172 (78.835)	lr 0.01645
Train [48][2370/3239]	Time 3.166 (0.841)	Data Time 2.798 (0.328)	Loss 2.6390 (2.7888)	Entropy 0.63667 (0.63415)	Top-1 acc 61.328 (56.812)	Top-5 acc 80.469 (78.837)	lr 0.01645
Train [48][2380/3239]	Time 0.240 (0.839)	Data Time 0.001 (0.327)	Loss 2.5481 (2.7888)	Entropy 0.63650 (0.63416)	Top-1 acc 62.500 (56.815)	Top-5 acc 82.812 (78.836)	lr 0.01645
Train [48][2390/3239]	Time 0.242 (0.846)	Data Time 0.001 (0.335)	Loss 2.6496 (2.7893)	Entropy 0.63625 (0.63417)	Top-1 acc 60.547 (56.802)	Top-5 acc 77.344 (78.825)	lr 0.01644
Train [48][2400/3239]	Time 0.262 (0.845)	Data Time 0.001 (0.333)	Loss 2.6506 (2.7894)	Entropy 0.63673 (0.63418)	Top-1 acc 57.812 (56.793)	Top-5 acc 83.984 (78.825)	lr 0.01644
Train [48][2410/3239]	Time 0.239 (0.844)	Data Time 0.001 (0.333)	Loss 2.6609 (2.7894)	Entropy 0.63677 (0.63419)	Top-1 acc 63.281 (56.794)	Top-5 acc 81.250 (78.823)	lr 0.01644
Train [48][2420/3239]	Time 0.240 (0.851)	Data Time 0.001 (0.340)	Loss 2.8516 (2.7896)	Entropy 0.63656 (0.63420)	Top-1 acc 57.422 (56.794)	Top-5 acc 77.344 (78.825)	lr 0.01644
Train [48][2430/3239]	Time 0.259 (0.850)	Data Time 0.001 (0.340)	Loss 2.8680 (2.7895)	Entropy 0.63673 (0.63421)	Top-1 acc 57.031 (56.797)	Top-5 acc 76.953 (78.823)	lr 0.01644
Train [48][2440/3239]	Time 0.381 (0.849)	Data Time 0.002 (0.339)	Loss 2.6646 (2.7892)	Entropy 0.63678 (0.63422)	Top-1 acc 58.984 (56.803)	Top-5 acc 78.906 (78.828)	lr 0.01644
Train [48][2450/3239]	Time 0.243 (0.856)	Data Time 0.001 (0.346)	Loss 2.7976 (2.7892)	Entropy 0.63649 (0.63423)	Top-1 acc 58.203 (56.803)	Top-5 acc 79.297 (78.830)	lr 0.01644
Train [48][2460/3239]	Time 0.256 (0.857)	Data Time 0.001 (0.347)	Loss 2.8256 (2.7889)	Entropy 0.63618 (0.63424)	Top-1 acc 52.734 (56.806)	Top-5 acc 79.688 (78.836)	lr 0.01644
Train [48][2470/3239]	Time 0.247 (0.855)	Data Time 0.001 (0.346)	Loss 2.7699 (2.7889)	Entropy 0.63635 (0.63425)	Top-1 acc 58.203 (56.806)	Top-5 acc 79.297 (78.836)	lr 0.01644
Train [48][2480/3239]	Time 0.244 (0.862)	Data Time 0.001 (0.353)	Loss 2.8197 (2.7892)	Entropy 0.63610 (0.63426)	Top-1 acc 58.594 (56.804)	Top-5 acc 78.906 (78.833)	lr 0.01644
Train [48][2490/3239]	Time 0.274 (0.861)	Data Time 0.002 (0.352)	Loss 2.8205 (2.7894)	Entropy 0.63614 (0.63427)	Top-1 acc 56.641 (56.800)	Top-5 acc 78.125 (78.829)	lr 0.01643
Train [48][2500/3239]	Time 0.253 (0.859)	Data Time 0.001 (0.351)	Loss 2.7399 (2.7894)	Entropy 0.63624 (0.63427)	Top-1 acc 57.422 (56.802)	Top-5 acc 79.688 (78.832)	lr 0.01643
Train [48][2510/3239]	Time 0.247 (0.858)	Data Time 0.001 (0.350)	Loss 2.9506 (2.7893)	Entropy 0.63666 (0.63428)	Top-1 acc 51.562 (56.806)	Top-5 acc 77.344 (78.831)	lr 0.01643
Train [48][2520/3239]	Time 0.233 (0.866)	Data Time 0.001 (0.358)	Loss 2.4605 (2.7893)	Entropy 0.63637 (0.63429)	Top-1 acc 62.891 (56.804)	Top-5 acc 85.938 (78.831)	lr 0.01643
Train [48][2530/3239]	Time 0.234 (0.864)	Data Time 0.001 (0.356)	Loss 2.9299 (2.7895)	Entropy 0.63617 (0.63430)	Top-1 acc 53.906 (56.798)	Top-5 acc 72.266 (78.828)	lr 0.01643
Train [48][2540/3239]	Time 0.253 (0.864)	Data Time 0.001 (0.356)	Loss 2.7485 (2.7897)	Entropy 0.63640 (0.63431)	Top-1 acc 56.641 (56.789)	Top-5 acc 78.906 (78.824)	lr 0.01643
Train [48][2550/3239]	Time 0.231 (0.871)	Data Time 0.001 (0.364)	Loss 2.7242 (2.7897)	Entropy 0.63632 (0.63432)	Top-1 acc 60.547 (56.788)	Top-5 acc 80.078 (78.825)	lr 0.01643
Train [48][2560/3239]	Time 0.246 (0.869)	Data Time 0.002 (0.363)	Loss 2.8026 (2.7896)	Entropy 0.63643 (0.63432)	Top-1 acc 55.859 (56.790)	Top-5 acc 79.297 (78.828)	lr 0.01643
Train [48][2570/3239]	Time 0.282 (0.869)	Data Time 0.001 (0.363)	Loss 2.6398 (2.7894)	Entropy 0.63635 (0.63433)	Top-1 acc 58.984 (56.792)	Top-5 acc 84.375 (78.832)	lr 0.01643
Train [48][2580/3239]	Time 0.235 (0.876)	Data Time 0.001 (0.370)	Loss 2.7951 (2.7896)	Entropy 0.63669 (0.63434)	Top-1 acc 57.031 (56.789)	Top-5 acc 78.906 (78.830)	lr 0.01643
Train [48][2590/3239]	Time 0.231 (0.874)	Data Time 0.001 (0.369)	Loss 2.7230 (2.7898)	Entropy 0.63700 (0.63435)	Top-1 acc 58.203 (56.787)	Top-5 acc 80.469 (78.825)	lr 0.01643
Train [48][2600/3239]	Time 0.370 (0.873)	Data Time 0.002 (0.368)	Loss 2.8083 (2.7896)	Entropy 0.63689 (0.63436)	Top-1 acc 56.250 (56.790)	Top-5 acc 79.297 (78.828)	lr 0.01642
Train [48][2610/3239]	Time 0.257 (0.881)	Data Time 0.001 (0.376)	Loss 2.6674 (2.7894)	Entropy 0.63708 (0.63437)	Top-1 acc 60.156 (56.793)	Top-5 acc 79.688 (78.829)	lr 0.01642
Train [48][2620/3239]	Time 0.233 (0.879)	Data Time 0.001 (0.375)	Loss 2.7395 (2.7895)	Entropy 0.63728 (0.63438)	Top-1 acc 54.297 (56.793)	Top-5 acc 82.031 (78.827)	lr 0.01642
Train [48][2630/3239]	Time 0.309 (0.879)	Data Time 0.002 (0.374)	Loss 2.7016 (2.7895)	Entropy 0.63737 (0.63439)	Top-1 acc 58.984 (56.790)	Top-5 acc 81.250 (78.825)	lr 0.01642
Train [48][2640/3239]	Time 0.241 (0.886)	Data Time 0.001 (0.382)	Loss 3.0286 (2.7895)	Entropy 0.63763 (0.63440)	Top-1 acc 54.688 (56.792)	Top-5 acc 74.609 (78.825)	lr 0.01642
Train [48][2650/3239]	Time 0.248 (0.884)	Data Time 0.001 (0.380)	Loss 3.0757 (2.7898)	Entropy 0.63763 (0.63442)	Top-1 acc 51.953 (56.783)	Top-5 acc 74.219 (78.820)	lr 0.01642
Train [48][2660/3239]	Time 1.250 (0.883)	Data Time 0.993 (0.379)	Loss 2.7448 (2.7899)	Entropy 0.63786 (0.63443)	Top-1 acc 57.031 (56.781)	Top-5 acc 77.734 (78.820)	lr 0.01642
Train [48][2670/3239]	Time 0.342 (0.881)	Data Time 0.001 (0.378)	Loss 2.5116 (2.7897)	Entropy 0.63807 (0.63444)	Top-1 acc 63.672 (56.784)	Top-5 acc 87.500 (78.826)	lr 0.01642
Train [48][2680/3239]	Time 0.247 (0.889)	Data Time 0.001 (0.386)	Loss 2.9361 (2.7897)	Entropy 0.63816 (0.63445)	Top-1 acc 55.469 (56.786)	Top-5 acc 76.953 (78.830)	lr 0.01642
Train [48][2690/3239]	Time 0.250 (0.887)	Data Time 0.001 (0.384)	Loss 2.7700 (2.7895)	Entropy 0.63810 (0.63447)	Top-1 acc 59.375 (56.792)	Top-5 acc 79.297 (78.835)	lr 0.01642
Train [48][2700/3239]	Time 0.230 (0.887)	Data Time 0.001 (0.384)	Loss 2.9466 (2.7895)	Entropy 0.63831 (0.63448)	Top-1 acc 52.734 (56.793)	Top-5 acc 77.734 (78.839)	lr 0.01641
Train [48][2710/3239]	Time 0.240 (0.895)	Data Time 0.001 (0.393)	Loss 3.0532 (2.7896)	Entropy 0.63812 (0.63450)	Top-1 acc 52.734 (56.793)	Top-5 acc 74.219 (78.835)	lr 0.01641
Train [48][2720/3239]	Time 0.235 (0.893)	Data Time 0.001 (0.391)	Loss 2.7240 (2.7894)	Entropy 0.63801 (0.63451)	Top-1 acc 58.594 (56.796)	Top-5 acc 80.469 (78.840)	lr 0.01641
Train [48][2730/3239]	Time 0.240 (0.892)	Data Time 0.001 (0.391)	Loss 2.7335 (2.7895)	Entropy 0.63808 (0.63452)	Top-1 acc 57.031 (56.795)	Top-5 acc 82.422 (78.838)	lr 0.01641
Train [48][2740/3239]	Time 0.240 (0.900)	Data Time 0.001 (0.399)	Loss 2.4845 (2.7894)	Entropy 0.63795 (0.63453)	Top-1 acc 62.891 (56.794)	Top-5 acc 85.156 (78.844)	lr 0.01641
Train [48][2750/3239]	Time 0.232 (0.898)	Data Time 0.001 (0.398)	Loss 2.7456 (2.7894)	Entropy 0.63806 (0.63455)	Top-1 acc 57.031 (56.793)	Top-5 acc 78.516 (78.841)	lr 0.01641
Train [48][2760/3239]	Time 0.374 (0.897)	Data Time 0.002 (0.396)	Loss 2.6948 (2.7892)	Entropy 0.63821 (0.63456)	Top-1 acc 61.328 (56.797)	Top-5 acc 79.297 (78.844)	lr 0.01641
Train [48][2770/3239]	Time 0.233 (0.904)	Data Time 0.001 (0.404)	Loss 2.6163 (2.7892)	Entropy 0.63833 (0.63457)	Top-1 acc 63.281 (56.801)	Top-5 acc 84.375 (78.843)	lr 0.01641
Train [48][2780/3239]	Time 0.275 (0.902)	Data Time 0.002 (0.402)	Loss 2.8117 (2.7891)	Entropy 0.63881 (0.63459)	Top-1 acc 54.688 (56.802)	Top-5 acc 76.953 (78.844)	lr 0.01641
Train [48][2790/3239]	Time 0.245 (0.900)	Data Time 0.001 (0.401)	Loss 2.9809 (2.7892)	Entropy 0.63897 (0.63460)	Top-1 acc 55.469 (56.803)	Top-5 acc 74.609 (78.843)	lr 0.01641
Train [48][2800/3239]	Time 0.232 (0.905)	Data Time 0.001 (0.406)	Loss 2.8110 (2.7891)	Entropy 0.63916 (0.63462)	Top-1 acc 55.469 (56.803)	Top-5 acc 80.859 (78.847)	lr 0.01640
Train [48][2810/3239]	Time 0.243 (0.903)	Data Time 0.001 (0.404)	Loss 2.6763 (2.7890)	Entropy 0.63958 (0.63463)	Top-1 acc 58.984 (56.806)	Top-5 acc 80.859 (78.849)	lr 0.01640
Train [48][2820/3239]	Time 0.233 (0.901)	Data Time 0.001 (0.403)	Loss 2.8951 (2.7890)	Entropy 0.63946 (0.63465)	Top-1 acc 50.781 (56.804)	Top-5 acc 73.828 (78.852)	lr 0.01640
Train [48][2830/3239]	Time 0.328 (0.900)	Data Time 0.001 (0.401)	Loss 2.9031 (2.7890)	Entropy 0.63956 (0.63467)	Top-1 acc 57.031 (56.805)	Top-5 acc 75.781 (78.850)	lr 0.01640
Train [48][2840/3239]	Time 0.233 (0.902)	Data Time 0.002 (0.404)	Loss 2.6798 (2.7891)	Entropy 0.63977 (0.63469)	Top-1 acc 57.812 (56.797)	Top-5 acc 81.250 (78.849)	lr 0.01640
Train [48][2850/3239]	Time 0.227 (0.900)	Data Time 0.001 (0.403)	Loss 2.6549 (2.7892)	Entropy 0.64012 (0.63470)	Top-1 acc 60.938 (56.794)	Top-5 acc 80.469 (78.846)	lr 0.01640
Train [48][2860/3239]	Time 0.224 (0.900)	Data Time 0.001 (0.402)	Loss 2.7086 (2.7893)	Entropy 0.64065 (0.63472)	Top-1 acc 57.422 (56.792)	Top-5 acc 79.688 (78.845)	lr 0.01640
Train [48][2870/3239]	Time 0.251 (0.906)	Data Time 0.001 (0.409)	Loss 2.7031 (2.7892)	Entropy 0.64064 (0.63474)	Top-1 acc 57.422 (56.792)	Top-5 acc 80.469 (78.849)	lr 0.01640
Train [48][2880/3239]	Time 0.229 (0.904)	Data Time 0.001 (0.408)	Loss 2.9616 (2.7893)	Entropy 0.64053 (0.63477)	Top-1 acc 57.031 (56.793)	Top-5 acc 76.562 (78.850)	lr 0.01640
Train [48][2890/3239]	Time 0.235 (0.904)	Data Time 0.001 (0.407)	Loss 2.7014 (2.7892)	Entropy 0.64046 (0.63479)	Top-1 acc 60.938 (56.796)	Top-5 acc 79.297 (78.849)	lr 0.01640
Train [48][2900/3239]	Time 0.244 (0.910)	Data Time 0.001 (0.414)	Loss 2.8048 (2.7892)	Entropy 0.64037 (0.63480)	Top-1 acc 54.297 (56.797)	Top-5 acc 82.031 (78.851)	lr 0.01640
Train [48][2910/3239]	Time 0.226 (0.908)	Data Time 0.001 (0.412)	Loss 2.7739 (2.7891)	Entropy 0.63993 (0.63482)	Top-1 acc 58.984 (56.800)	Top-5 acc 76.953 (78.853)	lr 0.01639
Train [48][2920/3239]	Time 0.292 (0.907)	Data Time 0.001 (0.411)	Loss 2.7869 (2.7892)	Entropy 0.64000 (0.63484)	Top-1 acc 53.906 (56.799)	Top-5 acc 76.562 (78.852)	lr 0.01639
Train [48][2930/3239]	Time 0.366 (0.917)	Data Time 0.031 (0.410)	Loss 2.6690 (2.7891)	Entropy 0.64003 (0.63486)	Top-1 acc 57.812 (56.802)	Top-5 acc 82.031 (78.854)	lr 0.01639
Train [48][2940/3239]	Time 0.249 (0.915)	Data Time 0.002 (0.409)	Loss 2.8572 (2.7890)	Entropy 0.63979 (0.63488)	Top-1 acc 54.297 (56.801)	Top-5 acc 78.906 (78.857)	lr 0.01639
Train [48][2950/3239]	Time 0.296 (0.914)	Data Time 0.001 (0.407)	Loss 2.8110 (2.7889)	Entropy 0.63992 (0.63489)	Top-1 acc 57.422 (56.801)	Top-5 acc 78.906 (78.857)	lr 0.01639
Train [48][2960/3239]	Time 0.275 (0.917)	Data Time 0.003 (0.411)	Loss 2.9398 (2.7890)	Entropy 0.63984 (0.63491)	Top-1 acc 53.516 (56.799)	Top-5 acc 76.172 (78.855)	lr 0.01639
Train [48][2970/3239]	Time 0.275 (0.915)	Data Time 0.001 (0.409)	Loss 2.6262 (2.7889)	Entropy 0.64022 (0.63493)	Top-1 acc 64.453 (56.802)	Top-5 acc 80.469 (78.856)	lr 0.01639
Train [48][2980/3239]	Time 0.251 (0.914)	Data Time 0.001 (0.408)	Loss 2.7210 (2.7889)	Entropy 0.64022 (0.63494)	Top-1 acc 55.859 (56.799)	Top-5 acc 82.422 (78.860)	lr 0.01639
Train [48][2990/3239]	Time 0.334 (0.912)	Data Time 0.001 (0.406)	Loss 2.7894 (2.7888)	Entropy 0.64008 (0.63496)	Top-1 acc 54.297 (56.799)	Top-5 acc 78.516 (78.863)	lr 0.01639
Train [48][3000/3239]	Time 0.242 (0.914)	Data Time 0.001 (0.409)	Loss 2.8064 (2.7886)	Entropy 0.64014 (0.63498)	Top-1 acc 55.859 (56.805)	Top-5 acc 76.172 (78.867)	lr 0.01639
Train [48][3010/3239]	Time 0.284 (0.913)	Data Time 0.002 (0.408)	Loss 2.6304 (2.7886)	Entropy 0.64008 (0.63500)	Top-1 acc 59.766 (56.803)	Top-5 acc 82.031 (78.866)	lr 0.01638
Train [48][3020/3239]	Time 0.248 (0.911)	Data Time 0.001 (0.406)	Loss 2.6576 (2.7885)	Entropy 0.64005 (0.63501)	Top-1 acc 64.453 (56.805)	Top-5 acc 81.250 (78.869)	lr 0.01638
Train [48][3030/3239]	Time 0.239 (0.914)	Data Time 0.001 (0.409)	Loss 2.7551 (2.7883)	Entropy 0.64030 (0.63503)	Top-1 acc 54.688 (56.808)	Top-5 acc 79.297 (78.874)	lr 0.01638
Train [48][3040/3239]	Time 0.236 (0.912)	Data Time 0.001 (0.408)	Loss 2.7053 (2.7884)	Entropy 0.64071 (0.63505)	Top-1 acc 61.719 (56.810)	Top-5 acc 80.859 (78.872)	lr 0.01638
Train [48][3050/3239]	Time 0.226 (0.910)	Data Time 0.001 (0.406)	Loss 2.8354 (2.7882)	Entropy 0.64093 (0.63507)	Top-1 acc 55.469 (56.812)	Top-5 acc 76.953 (78.873)	lr 0.01638
Train [48][3060/3239]	Time 0.226 (0.912)	Data Time 0.001 (0.408)	Loss 2.9600 (2.7884)	Entropy 0.64107 (0.63508)	Top-1 acc 50.000 (56.807)	Top-5 acc 76.172 (78.871)	lr 0.01638
Train [48][3070/3239]	Time 0.267 (0.911)	Data Time 0.002 (0.407)	Loss 2.7728 (2.7884)	Entropy 0.64130 (0.63510)	Top-1 acc 58.203 (56.810)	Top-5 acc 80.859 (78.872)	lr 0.01638
Train [48][3080/3239]	Time 0.284 (0.909)	Data Time 0.001 (0.406)	Loss 2.6130 (2.7882)	Entropy 0.64132 (0.63512)	Top-1 acc 57.031 (56.810)	Top-5 acc 83.203 (78.876)	lr 0.01638
Train [48][3090/3239]	Time 0.279 (0.911)	Data Time 0.002 (0.408)	Loss 2.6988 (2.7882)	Entropy 0.64107 (0.63514)	Top-1 acc 58.203 (56.812)	Top-5 acc 80.078 (78.874)	lr 0.01638
Train [48][3100/3239]	Time 0.241 (0.910)	Data Time 0.001 (0.407)	Loss 2.7436 (2.7885)	Entropy 0.64119 (0.63516)	Top-1 acc 56.641 (56.804)	Top-5 acc 81.250 (78.872)	lr 0.01638
Train [48][3110/3239]	Time 0.262 (0.908)	Data Time 0.001 (0.405)	Loss 2.6415 (2.7885)	Entropy 0.64120 (0.63518)	Top-1 acc 55.859 (56.804)	Top-5 acc 82.812 (78.873)	lr 0.01638
Train [48][3120/3239]	Time 0.256 (0.913)	Data Time 0.001 (0.410)	Loss 2.6177 (2.7885)	Entropy 0.64111 (0.63520)	Top-1 acc 62.500 (56.807)	Top-5 acc 81.641 (78.871)	lr 0.01637
Train [48][3130/3239]	Time 0.243 (0.911)	Data Time 0.001 (0.409)	Loss 2.6301 (2.7883)	Entropy 0.64124 (0.63522)	Top-1 acc 55.078 (56.810)	Top-5 acc 84.766 (78.875)	lr 0.01637
Train [48][3140/3239]	Time 0.230 (0.910)	Data Time 0.001 (0.408)	Loss 2.6137 (2.7883)	Entropy 0.64145 (0.63524)	Top-1 acc 61.328 (56.808)	Top-5 acc 82.031 (78.874)	lr 0.01637
Train [48][3150/3239]	Time 0.346 (0.909)	Data Time 0.001 (0.407)	Loss 2.9240 (2.7885)	Entropy 0.64154 (0.63526)	Top-1 acc 52.734 (56.805)	Top-5 acc 78.125 (78.870)	lr 0.01637
Train [48][3160/3239]	Time 0.242 (0.914)	Data Time 0.001 (0.413)	Loss 2.6685 (2.7885)	Entropy 0.64155 (0.63528)	Top-1 acc 57.812 (56.806)	Top-5 acc 81.641 (78.874)	lr 0.01637
Train [48][3170/3239]	Time 0.233 (0.914)	Data Time 0.001 (0.413)	Loss 3.0547 (2.7885)	Entropy 0.64139 (0.63530)	Top-1 acc 53.516 (56.804)	Top-5 acc 72.656 (78.875)	lr 0.01637
Train [48][3180/3239]	Time 0.265 (0.913)	Data Time 0.000 (0.412)	Loss 2.8051 (2.7884)	Entropy 0.64176 (0.63532)	Top-1 acc 55.859 (56.806)	Top-5 acc 78.125 (78.879)	lr 0.01637
Train [48][3190/3239]	Time 0.232 (0.917)	Data Time 0.000 (0.416)	Loss 2.9543 (2.7884)	Entropy 0.64174 (0.63534)	Top-1 acc 48.828 (56.804)	Top-5 acc 76.172 (78.880)	lr 0.01637
Train [48][3200/3239]	Time 7.160 (0.918)	Data Time 6.886 (0.417)	Loss 2.8867 (2.7884)	Entropy 0.64208 (0.63536)	Top-1 acc 53.125 (56.805)	Top-5 acc 77.344 (78.880)	lr 0.01637
Train [48][3210/3239]	Time 0.256 (0.916)	Data Time 0.000 (0.416)	Loss 2.8103 (2.7883)	Entropy 0.64219 (0.63538)	Top-1 acc 56.641 (56.805)	Top-5 acc 77.734 (78.880)	lr 0.01637
Train [48][3220/3239]	Time 0.325 (0.918)	Data Time 0.000 (0.418)	Loss 2.8499 (2.7882)	Entropy 0.64229 (0.63540)	Top-1 acc 55.078 (56.805)	Top-5 acc 80.078 (78.882)	lr 0.01636
Train [48][3230/3239]	Time 0.228 (0.917)	Data Time 0.000 (0.417)	Loss 2.8403 (2.7882)	Entropy 0.64214 (0.63542)	Top-1 acc 58.594 (56.809)	Top-5 acc 76.562 (78.881)	lr 0.01636
Train [48][3239/3239]	Time 0.842 (0.916)	Data Time 0.000 (0.417)	Loss 2.7810 (2.7881)	Entropy 0.64194 (0.63544)	Top-1 acc 56.790 (56.811)	Top-5 acc 80.247 (78.882)	lr 0.01636
==========Valid [48/120]	loss 1.532	top-1 acc 64.792 (64.864)	top-5 acc 85.721	Train top-1 56.811	top-5 78.882	Entropy 0.64194	Latency-None: 0.000ms	Flops: 538.40M
Train [49][0/3239]	Time 36.227 (36.227)	Data Time 35.617 (35.617)	Loss 2.7310 (2.7310)	Entropy 0.64173 (0.64173)	Top-1 acc 59.375 (59.375)	Top-5 acc 79.688 (79.688)	lr 0.01636
Train [49][10/3239]	Time 0.242 (3.793)	Data Time 0.001 (3.325)	Loss 2.8175 (2.7588)	Entropy 0.64162 (0.64164)	Top-1 acc 54.688 (57.422)	Top-5 acc 77.344 (79.865)	lr 0.01636
Train [49][20/3239]	Time 0.239 (2.187)	Data Time 0.001 (1.743)	Loss 2.8890 (2.7593)	Entropy 0.64154 (0.64164)	Top-1 acc 54.688 (57.850)	Top-5 acc 78.906 (79.594)	lr 0.01636
Train [49][30/3239]	Time 0.274 (1.640)	Data Time 0.001 (1.181)	Loss 2.8450 (2.7485)	Entropy 0.64164 (0.64162)	Top-1 acc 54.297 (58.443)	Top-5 acc 80.859 (79.952)	lr 0.01636
Train [49][40/3239]	Time 0.223 (1.340)	Data Time 0.001 (0.893)	Loss 2.7098 (2.7528)	Entropy 0.64167 (0.64163)	Top-1 acc 58.203 (58.260)	Top-5 acc 81.641 (79.783)	lr 0.01636
Train [49][50/3239]	Time 0.390 (1.168)	Data Time 0.001 (0.719)	Loss 2.7782 (2.7498)	Entropy 0.64147 (0.64163)	Top-1 acc 57.422 (58.540)	Top-5 acc 79.297 (79.787)	lr 0.01636
Train [49][60/3239]	Time 0.242 (1.055)	Data Time 0.001 (0.601)	Loss 2.6088 (2.7384)	Entropy 0.64121 (0.64158)	Top-1 acc 60.938 (58.677)	Top-5 acc 82.422 (79.950)	lr 0.01636
Train [49][70/3239]	Time 0.233 (0.970)	Data Time 0.001 (0.517)	Loss 2.8269 (2.7459)	Entropy 0.64128 (0.64154)	Top-1 acc 57.422 (58.544)	Top-5 acc 77.344 (79.765)	lr 0.01636
Train [49][80/3239]	Time 0.243 (0.909)	Data Time 0.001 (0.453)	Loss 2.8107 (2.7536)	Entropy 0.64167 (0.64153)	Top-1 acc 53.125 (58.309)	Top-5 acc 79.297 (79.625)	lr 0.01636
Train [49][90/3239]	Time 0.286 (0.856)	Data Time 0.001 (0.403)	Loss 2.7931 (2.7568)	Entropy 0.64168 (0.64153)	Top-1 acc 57.031 (58.100)	Top-5 acc 79.688 (79.533)	lr 0.01635
Train [49][100/3239]	Time 0.255 (0.813)	Data Time 0.001 (0.364)	Loss 2.7203 (2.7578)	Entropy 0.64191 (0.64155)	Top-1 acc 57.812 (58.056)	Top-5 acc 80.469 (79.483)	lr 0.01635
Train [49][110/3239]	Time 0.337 (0.777)	Data Time 0.001 (0.331)	Loss 2.6371 (2.7582)	Entropy 0.64155 (0.64158)	Top-1 acc 61.328 (58.126)	Top-5 acc 80.469 (79.431)	lr 0.01635
Train [49][120/3239]	Time 0.241 (0.748)	Data Time 0.001 (0.304)	Loss 2.8001 (2.7543)	Entropy 0.64129 (0.64157)	Top-1 acc 57.031 (58.271)	Top-5 acc 78.125 (79.513)	lr 0.01635
Train [49][130/3239]	Time 0.311 (0.725)	Data Time 0.001 (0.281)	Loss 2.7011 (2.7611)	Entropy 0.64093 (0.64154)	Top-1 acc 57.031 (57.977)	Top-5 acc 81.250 (79.452)	lr 0.01635
Train [49][140/3239]	Time 0.307 (0.705)	Data Time 0.001 (0.261)	Loss 2.7975 (2.7696)	Entropy 0.64058 (0.64150)	Top-1 acc 57.031 (57.765)	Top-5 acc 80.078 (79.297)	lr 0.01635
Train [49][150/3239]	Time 0.234 (0.688)	Data Time 0.001 (0.244)	Loss 2.7171 (2.7691)	Entropy 0.64081 (0.64144)	Top-1 acc 57.812 (57.737)	Top-5 acc 80.469 (79.333)	lr 0.01635
Train [49][160/3239]	Time 0.265 (0.670)	Data Time 0.001 (0.229)	Loss 2.6050 (2.7657)	Entropy 0.64071 (0.64140)	Top-1 acc 61.719 (57.800)	Top-5 acc 80.469 (79.416)	lr 0.01635
Train [49][170/3239]	Time 0.238 (0.656)	Data Time 0.001 (0.215)	Loss 2.6438 (2.7623)	Entropy 0.64041 (0.64136)	Top-1 acc 60.938 (57.906)	Top-5 acc 81.250 (79.512)	lr 0.01635
Train [49][180/3239]	Time 0.226 (0.645)	Data Time 0.001 (0.204)	Loss 2.8617 (2.7612)	Entropy 0.64006 (0.64130)	Top-1 acc 58.594 (57.892)	Top-5 acc 77.344 (79.577)	lr 0.01635
Train [49][190/3239]	Time 0.235 (0.633)	Data Time 0.001 (0.193)	Loss 2.7611 (2.7619)	Entropy 0.64003 (0.64123)	Top-1 acc 58.203 (57.843)	Top-5 acc 81.250 (79.567)	lr 0.01634
Train [49][200/3239]	Time 0.222 (0.623)	Data Time 0.001 (0.183)	Loss 2.7313 (2.7597)	Entropy 0.63978 (0.64117)	Top-1 acc 58.594 (57.898)	Top-5 acc 80.469 (79.598)	lr 0.01634
Train [49][210/3239]	Time 0.400 (0.614)	Data Time 0.001 (0.175)	Loss 2.7495 (2.7622)	Entropy 0.64008 (0.64111)	Top-1 acc 57.031 (57.887)	Top-5 acc 83.203 (79.560)	lr 0.01634
Train [49][220/3239]	Time 0.251 (0.606)	Data Time 0.001 (0.167)	Loss 2.7819 (2.7599)	Entropy 0.64023 (0.64107)	Top-1 acc 54.688 (57.910)	Top-5 acc 78.516 (79.611)	lr 0.01634
Train [49][230/3239]	Time 0.294 (0.598)	Data Time 0.002 (0.160)	Loss 2.8562 (2.7641)	Entropy 0.64003 (0.64103)	Top-1 acc 56.250 (57.802)	Top-5 acc 79.297 (79.517)	lr 0.01634
Train [49][240/3239]	Time 0.251 (0.592)	Data Time 0.001 (0.153)	Loss 2.9575 (2.7643)	Entropy 0.63971 (0.64098)	Top-1 acc 52.734 (57.751)	Top-5 acc 73.828 (79.488)	lr 0.01634
Train [49][250/3239]	Time 0.235 (0.586)	Data Time 0.001 (0.147)	Loss 3.0089 (2.7666)	Entropy 0.63971 (0.64093)	Top-1 acc 50.391 (57.679)	Top-5 acc 75.000 (79.437)	lr 0.01634
Train [49][260/3239]	Time 0.227 (0.581)	Data Time 0.001 (0.142)	Loss 2.7917 (2.7684)	Entropy 0.63993 (0.64088)	Top-1 acc 54.297 (57.607)	Top-5 acc 79.297 (79.397)	lr 0.01634
Train [49][270/3239]	Time 0.228 (0.575)	Data Time 0.001 (0.136)	Loss 2.9171 (2.7690)	Entropy 0.63994 (0.64084)	Top-1 acc 54.688 (57.605)	Top-5 acc 75.781 (79.373)	lr 0.01634
Train [49][280/3239]	Time 0.352 (0.570)	Data Time 0.001 (0.132)	Loss 2.7046 (2.7692)	Entropy 0.63996 (0.64081)	Top-1 acc 58.203 (57.594)	Top-5 acc 77.344 (79.347)	lr 0.01634
Train [49][290/3239]	Time 0.236 (0.566)	Data Time 0.001 (0.127)	Loss 2.7855 (2.7694)	Entropy 0.63996 (0.64078)	Top-1 acc 55.469 (57.555)	Top-5 acc 76.953 (79.341)	lr 0.01633
Train [49][300/3239]	Time 0.301 (0.561)	Data Time 0.002 (0.123)	Loss 2.6874 (2.7716)	Entropy 0.64003 (0.64075)	Top-1 acc 57.812 (57.479)	Top-5 acc 80.859 (79.289)	lr 0.01633
Train [49][310/3239]	Time 0.244 (0.557)	Data Time 0.001 (0.119)	Loss 2.6732 (2.7729)	Entropy 0.63985 (0.64073)	Top-1 acc 59.766 (57.461)	Top-5 acc 80.469 (79.254)	lr 0.01633
Train [49][320/3239]	Time 0.298 (0.553)	Data Time 0.001 (0.115)	Loss 2.6126 (2.7728)	Entropy 0.63959 (0.64070)	Top-1 acc 62.109 (57.446)	Top-5 acc 82.422 (79.242)	lr 0.01633
Train [49][330/3239]	Time 0.307 (0.551)	Data Time 0.003 (0.112)	Loss 3.0552 (2.7733)	Entropy 0.63957 (0.64066)	Top-1 acc 53.125 (57.430)	Top-5 acc 73.438 (79.231)	lr 0.01633
Train [49][340/3239]	Time 0.365 (0.649)	Data Time 0.006 (0.109)	Loss 2.8730 (2.7745)	Entropy 0.63944 (0.64063)	Top-1 acc 55.469 (57.408)	Top-5 acc 78.516 (79.203)	lr 0.01633
Train [49][350/3239]	Time 0.234 (0.643)	Data Time 0.002 (0.106)	Loss 2.8126 (2.7738)	Entropy 0.63932 (0.64059)	Top-1 acc 55.469 (57.409)	Top-5 acc 75.000 (79.182)	lr 0.01633
Train [49][360/3239]	Time 0.243 (0.637)	Data Time 0.001 (0.103)	Loss 2.7237 (2.7742)	Entropy 0.63933 (0.64056)	Top-1 acc 58.203 (57.388)	Top-5 acc 78.906 (79.170)	lr 0.01633
Train [49][370/3239]	Time 0.328 (0.631)	Data Time 0.001 (0.100)	Loss 2.7410 (2.7725)	Entropy 0.63957 (0.64052)	Top-1 acc 57.031 (57.390)	Top-5 acc 81.250 (79.209)	lr 0.01633
Train [49][380/3239]	Time 0.229 (0.626)	Data Time 0.001 (0.098)	Loss 2.9103 (2.7719)	Entropy 0.63988 (0.64050)	Top-1 acc 55.078 (57.392)	Top-5 acc 76.953 (79.221)	lr 0.01633
Train [49][390/3239]	Time 0.247 (0.621)	Data Time 0.001 (0.095)	Loss 2.7241 (2.7704)	Entropy 0.63996 (0.64049)	Top-1 acc 57.422 (57.395)	Top-5 acc 82.031 (79.243)	lr 0.01633
Train [49][400/3239]	Time 0.281 (0.617)	Data Time 0.001 (0.093)	Loss 2.6555 (2.7693)	Entropy 0.63988 (0.64047)	Top-1 acc 60.547 (57.403)	Top-5 acc 82.422 (79.262)	lr 0.01632
Train [49][410/3239]	Time 0.236 (0.612)	Data Time 0.001 (0.091)	Loss 2.6011 (2.7700)	Entropy 0.64015 (0.64046)	Top-1 acc 57.422 (57.379)	Top-5 acc 82.031 (79.247)	lr 0.01632
Train [49][420/3239]	Time 0.224 (0.609)	Data Time 0.001 (0.088)	Loss 2.8856 (2.7686)	Entropy 0.63995 (0.64045)	Top-1 acc 51.562 (57.395)	Top-5 acc 77.734 (79.288)	lr 0.01632
Train [49][430/3239]	Time 0.260 (0.605)	Data Time 0.001 (0.086)	Loss 2.8627 (2.7684)	Entropy 0.64004 (0.64043)	Top-1 acc 55.078 (57.399)	Top-5 acc 76.172 (79.298)	lr 0.01632
Train [49][440/3239]	Time 0.233 (0.601)	Data Time 0.001 (0.085)	Loss 2.8516 (2.7684)	Entropy 0.64006 (0.64043)	Top-1 acc 54.297 (57.394)	Top-5 acc 73.828 (79.289)	lr 0.01632
Train [49][450/3239]	Time 0.232 (0.597)	Data Time 0.001 (0.083)	Loss 2.7301 (2.7678)	Entropy 0.64034 (0.64042)	Top-1 acc 55.469 (57.392)	Top-5 acc 80.469 (79.308)	lr 0.01632
Train [49][460/3239]	Time 0.249 (0.594)	Data Time 0.001 (0.081)	Loss 2.6264 (2.7676)	Entropy 0.64038 (0.64042)	Top-1 acc 62.891 (57.393)	Top-5 acc 79.688 (79.313)	lr 0.01632
Train [49][470/3239]	Time 0.246 (0.591)	Data Time 0.002 (0.079)	Loss 2.6619 (2.7679)	Entropy 0.64067 (0.64042)	Top-1 acc 62.891 (57.401)	Top-5 acc 78.906 (79.299)	lr 0.01632
Train [49][480/3239]	Time 0.245 (0.588)	Data Time 0.002 (0.078)	Loss 2.8004 (2.7684)	Entropy 0.64094 (0.64043)	Top-1 acc 56.641 (57.367)	Top-5 acc 77.344 (79.296)	lr 0.01632
Train [49][490/3239]	Time 0.246 (0.585)	Data Time 0.001 (0.076)	Loss 2.8711 (2.7701)	Entropy 0.64089 (0.64044)	Top-1 acc 55.469 (57.349)	Top-5 acc 76.953 (79.257)	lr 0.01632
Train [49][500/3239]	Time 0.227 (0.581)	Data Time 0.001 (0.075)	Loss 2.9274 (2.7703)	Entropy 0.64095 (0.64045)	Top-1 acc 53.516 (57.347)	Top-5 acc 75.391 (79.259)	lr 0.01631
Train [49][510/3239]	Time 0.251 (0.579)	Data Time 0.001 (0.073)	Loss 2.7313 (2.7700)	Entropy 0.64123 (0.64046)	Top-1 acc 57.422 (57.335)	Top-5 acc 80.469 (79.255)	lr 0.01631
Train [49][520/3239]	Time 0.266 (0.576)	Data Time 0.002 (0.072)	Loss 2.8033 (2.7707)	Entropy 0.64086 (0.64047)	Top-1 acc 57.422 (57.297)	Top-5 acc 79.688 (79.244)	lr 0.01631
Train [49][530/3239]	Time 0.344 (0.574)	Data Time 0.001 (0.071)	Loss 2.8375 (2.7715)	Entropy 0.64089 (0.64048)	Top-1 acc 55.469 (57.270)	Top-5 acc 78.125 (79.231)	lr 0.01631
Train [49][540/3239]	Time 0.324 (0.572)	Data Time 0.001 (0.069)	Loss 2.6593 (2.7712)	Entropy 0.64064 (0.64048)	Top-1 acc 59.766 (57.268)	Top-5 acc 82.031 (79.239)	lr 0.01631
Train [49][550/3239]	Time 0.244 (0.570)	Data Time 0.001 (0.068)	Loss 2.8798 (2.7731)	Entropy 0.64038 (0.64048)	Top-1 acc 54.297 (57.235)	Top-5 acc 77.734 (79.199)	lr 0.01631
Train [49][560/3239]	Time 0.279 (0.568)	Data Time 0.002 (0.067)	Loss 2.7215 (2.7727)	Entropy 0.64028 (0.64048)	Top-1 acc 57.031 (57.221)	Top-5 acc 79.688 (79.208)	lr 0.01631
Train [49][570/3239]	Time 0.252 (0.566)	Data Time 0.001 (0.066)	Loss 2.7138 (2.7729)	Entropy 0.64036 (0.64048)	Top-1 acc 59.375 (57.210)	Top-5 acc 81.641 (79.196)	lr 0.01631
Train [49][580/3239]	Time 0.229 (0.563)	Data Time 0.001 (0.065)	Loss 2.7041 (2.7731)	Entropy 0.64018 (0.64048)	Top-1 acc 59.375 (57.209)	Top-5 acc 79.688 (79.196)	lr 0.01631
Train [49][590/3239]	Time 0.243 (0.561)	Data Time 0.001 (0.064)	Loss 2.7626 (2.7732)	Entropy 0.64033 (0.64047)	Top-1 acc 59.375 (57.207)	Top-5 acc 76.953 (79.194)	lr 0.01631
Train [49][600/3239]	Time 0.419 (0.559)	Data Time 0.001 (0.062)	Loss 2.5200 (2.7736)	Entropy 0.64027 (0.64047)	Top-1 acc 60.938 (57.200)	Top-5 acc 81.250 (79.173)	lr 0.01631
Train [49][610/3239]	Time 0.253 (0.557)	Data Time 0.001 (0.061)	Loss 2.8560 (2.7736)	Entropy 0.64012 (0.64046)	Top-1 acc 53.125 (57.212)	Top-5 acc 77.734 (79.170)	lr 0.01630
Train [49][620/3239]	Time 0.275 (0.555)	Data Time 0.001 (0.061)	Loss 2.6579 (2.7740)	Entropy 0.63998 (0.64046)	Top-1 acc 60.547 (57.194)	Top-5 acc 82.031 (79.162)	lr 0.01630
Train [49][630/3239]	Time 0.242 (0.554)	Data Time 0.001 (0.060)	Loss 2.7845 (2.7736)	Entropy 0.63953 (0.64045)	Top-1 acc 59.375 (57.195)	Top-5 acc 79.297 (79.170)	lr 0.01630
Train [49][640/3239]	Time 0.273 (0.552)	Data Time 0.001 (0.059)	Loss 3.1181 (2.7734)	Entropy 0.63942 (0.64043)	Top-1 acc 50.391 (57.206)	Top-5 acc 73.047 (79.177)	lr 0.01630
Train [49][650/3239]	Time 0.244 (0.550)	Data Time 0.001 (0.058)	Loss 2.6645 (2.7735)	Entropy 0.63959 (0.64042)	Top-1 acc 58.203 (57.203)	Top-5 acc 82.422 (79.166)	lr 0.01630
Train [49][660/3239]	Time 0.243 (0.548)	Data Time 0.001 (0.057)	Loss 2.9137 (2.7742)	Entropy 0.63949 (0.64041)	Top-1 acc 53.516 (57.181)	Top-5 acc 76.172 (79.150)	lr 0.01630
Train [49][670/3239]	Time 0.257 (0.547)	Data Time 0.001 (0.056)	Loss 2.7270 (2.7732)	Entropy 0.63949 (0.64039)	Top-1 acc 56.641 (57.208)	Top-5 acc 78.906 (79.164)	lr 0.01630
Train [49][680/3239]	Time 0.247 (0.545)	Data Time 0.001 (0.055)	Loss 2.8369 (2.7723)	Entropy 0.63949 (0.64038)	Top-1 acc 54.688 (57.222)	Top-5 acc 78.516 (79.182)	lr 0.01630
Train [49][690/3239]	Time 0.350 (0.544)	Data Time 0.001 (0.055)	Loss 2.7831 (2.7737)	Entropy 0.63934 (0.64037)	Top-1 acc 57.422 (57.190)	Top-5 acc 79.688 (79.155)	lr 0.01630
Train [49][700/3239]	Time 0.305 (0.542)	Data Time 0.022 (0.054)	Loss 2.8421 (2.7737)	Entropy 0.63919 (0.64035)	Top-1 acc 58.594 (57.205)	Top-5 acc 76.953 (79.147)	lr 0.01630
Train [49][710/3239]	Time 0.232 (0.541)	Data Time 0.001 (0.053)	Loss 2.8304 (2.7735)	Entropy 0.63954 (0.64034)	Top-1 acc 53.516 (57.197)	Top-5 acc 79.297 (79.153)	lr 0.01629
Train [49][720/3239]	Time 0.248 (0.539)	Data Time 0.001 (0.052)	Loss 2.5981 (2.7728)	Entropy 0.63951 (0.64032)	Top-1 acc 58.984 (57.209)	Top-5 acc 82.031 (79.164)	lr 0.01629
Train [49][730/3239]	Time 0.242 (0.537)	Data Time 0.001 (0.052)	Loss 2.9410 (2.7725)	Entropy 0.63965 (0.64031)	Top-1 acc 49.219 (57.215)	Top-5 acc 77.734 (79.172)	lr 0.01629
Train [49][740/3239]	Time 0.252 (0.536)	Data Time 0.001 (0.051)	Loss 2.7050 (2.7723)	Entropy 0.63928 (0.64030)	Top-1 acc 62.109 (57.228)	Top-5 acc 80.078 (79.167)	lr 0.01629
Train [49][750/3239]	Time 0.246 (0.535)	Data Time 0.001 (0.050)	Loss 2.5605 (2.7723)	Entropy 0.63969 (0.64029)	Top-1 acc 63.281 (57.222)	Top-5 acc 82.422 (79.174)	lr 0.01629
Train [49][760/3239]	Time 0.412 (0.534)	Data Time 0.002 (0.050)	Loss 2.8212 (2.7730)	Entropy 0.63986 (0.64029)	Top-1 acc 54.297 (57.200)	Top-5 acc 75.781 (79.152)	lr 0.01629
Train [49][770/3239]	Time 0.252 (0.533)	Data Time 0.001 (0.049)	Loss 2.8621 (2.7729)	Entropy 0.63993 (0.64028)	Top-1 acc 57.422 (57.207)	Top-5 acc 76.172 (79.149)	lr 0.01629
Train [49][780/3239]	Time 0.310 (0.532)	Data Time 0.001 (0.049)	Loss 2.6298 (2.7729)	Entropy 0.63971 (0.64028)	Top-1 acc 62.500 (57.218)	Top-5 acc 83.203 (79.150)	lr 0.01629
Train [49][790/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.048)	Loss 2.6496 (2.7723)	Entropy 0.63984 (0.64027)	Top-1 acc 60.547 (57.238)	Top-5 acc 82.422 (79.169)	lr 0.01629
Train [49][800/3239]	Time 0.274 (0.530)	Data Time 0.001 (0.047)	Loss 2.8622 (2.7720)	Entropy 0.63943 (0.64026)	Top-1 acc 54.297 (57.251)	Top-5 acc 78.516 (79.176)	lr 0.01629
Train [49][810/3239]	Time 0.226 (0.528)	Data Time 0.001 (0.047)	Loss 2.7323 (2.7709)	Entropy 0.63979 (0.64025)	Top-1 acc 57.422 (57.270)	Top-5 acc 80.469 (79.201)	lr 0.01628
Train [49][820/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.046)	Loss 2.6819 (2.7706)	Entropy 0.63985 (0.64025)	Top-1 acc 60.547 (57.278)	Top-5 acc 78.906 (79.207)	lr 0.01628
Train [49][830/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.046)	Loss 2.7635 (2.7718)	Entropy 0.63976 (0.64024)	Top-1 acc 54.688 (57.242)	Top-5 acc 82.422 (79.199)	lr 0.01628
Train [49][840/3239]	Time 0.266 (0.525)	Data Time 0.002 (0.045)	Loss 2.7289 (2.7723)	Entropy 0.63975 (0.64024)	Top-1 acc 55.469 (57.231)	Top-5 acc 79.297 (79.197)	lr 0.01628
Train [49][850/3239]	Time 0.347 (0.524)	Data Time 0.001 (0.045)	Loss 3.0057 (2.7721)	Entropy 0.63998 (0.64023)	Top-1 acc 50.000 (57.227)	Top-5 acc 75.000 (79.197)	lr 0.01628
Train [49][860/3239]	Time 0.254 (0.523)	Data Time 0.001 (0.044)	Loss 3.2318 (2.7723)	Entropy 0.64011 (0.64023)	Top-1 acc 48.828 (57.223)	Top-5 acc 71.875 (79.198)	lr 0.01628
Train [49][870/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.044)	Loss 2.6280 (2.7721)	Entropy 0.64034 (0.64023)	Top-1 acc 61.328 (57.238)	Top-5 acc 83.984 (79.207)	lr 0.01628
Train [49][880/3239]	Time 0.242 (0.521)	Data Time 0.001 (0.043)	Loss 2.8544 (2.7721)	Entropy 0.64000 (0.64023)	Top-1 acc 54.297 (57.235)	Top-5 acc 78.125 (79.206)	lr 0.01628
Train [49][890/3239]	Time 0.245 (0.520)	Data Time 0.001 (0.043)	Loss 2.6317 (2.7717)	Entropy 0.63968 (0.64023)	Top-1 acc 62.891 (57.242)	Top-5 acc 82.422 (79.209)	lr 0.01628
Train [49][900/3239]	Time 0.254 (0.519)	Data Time 0.001 (0.042)	Loss 3.0520 (2.7724)	Entropy 0.63956 (0.64022)	Top-1 acc 48.438 (57.219)	Top-5 acc 74.219 (79.194)	lr 0.01628
Train [49][910/3239]	Time 0.283 (0.519)	Data Time 0.003 (0.042)	Loss 2.8184 (2.7723)	Entropy 0.63928 (0.64021)	Top-1 acc 53.516 (57.222)	Top-5 acc 78.906 (79.203)	lr 0.01628
Train [49][920/3239]	Time 0.375 (0.518)	Data Time 0.001 (0.041)	Loss 2.7484 (2.7721)	Entropy 0.63947 (0.64020)	Top-1 acc 58.984 (57.223)	Top-5 acc 80.078 (79.203)	lr 0.01627
Train [49][930/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.041)	Loss 2.6767 (2.7728)	Entropy 0.63925 (0.64019)	Top-1 acc 59.766 (57.203)	Top-5 acc 80.469 (79.187)	lr 0.01627
Train [49][940/3239]	Time 0.240 (0.516)	Data Time 0.001 (0.041)	Loss 2.8416 (2.7741)	Entropy 0.63847 (0.64018)	Top-1 acc 55.859 (57.166)	Top-5 acc 77.734 (79.157)	lr 0.01627
Train [49][950/3239]	Time 0.289 (0.515)	Data Time 0.001 (0.040)	Loss 2.5984 (2.7733)	Entropy 0.63806 (0.64016)	Top-1 acc 61.328 (57.179)	Top-5 acc 84.766 (79.166)	lr 0.01627
Train [49][960/3239]	Time 0.229 (0.514)	Data Time 0.001 (0.040)	Loss 2.7189 (2.7730)	Entropy 0.63841 (0.64014)	Top-1 acc 57.031 (57.178)	Top-5 acc 80.469 (79.161)	lr 0.01627
Train [49][970/3239]	Time 0.254 (0.513)	Data Time 0.001 (0.039)	Loss 2.9259 (2.7738)	Entropy 0.63771 (0.64012)	Top-1 acc 52.344 (57.161)	Top-5 acc 75.000 (79.151)	lr 0.01627
Train [49][980/3239]	Time 0.245 (0.513)	Data Time 0.001 (0.039)	Loss 2.6276 (2.7739)	Entropy 0.63778 (0.64009)	Top-1 acc 61.719 (57.160)	Top-5 acc 81.641 (79.153)	lr 0.01627
Train [49][990/3239]	Time 0.417 (0.512)	Data Time 0.001 (0.039)	Loss 2.9262 (2.7742)	Entropy 0.63792 (0.64007)	Top-1 acc 54.297 (57.149)	Top-5 acc 75.781 (79.146)	lr 0.01627
Train [49][1000/3239]	Time 0.333 (0.546)	Data Time 0.003 (0.038)	Loss 2.7691 (2.7740)	Entropy 0.63804 (0.64005)	Top-1 acc 55.859 (57.148)	Top-5 acc 78.125 (79.138)	lr 0.01627
Train [49][1010/3239]	Time 0.290 (0.544)	Data Time 0.002 (0.038)	Loss 2.8858 (2.7738)	Entropy 0.63802 (0.64003)	Top-1 acc 57.812 (57.149)	Top-5 acc 74.609 (79.143)	lr 0.01627
Train [49][1020/3239]	Time 0.241 (0.543)	Data Time 0.002 (0.038)	Loss 2.5907 (2.7730)	Entropy 0.63781 (0.64001)	Top-1 acc 62.500 (57.163)	Top-5 acc 82.422 (79.160)	lr 0.01626
Train [49][1030/3239]	Time 0.240 (0.542)	Data Time 0.001 (0.037)	Loss 2.6514 (2.7724)	Entropy 0.63771 (0.63999)	Top-1 acc 62.500 (57.185)	Top-5 acc 82.422 (79.170)	lr 0.01626
Train [49][1040/3239]	Time 0.243 (0.541)	Data Time 0.001 (0.037)	Loss 2.8418 (2.7723)	Entropy 0.63787 (0.63997)	Top-1 acc 54.688 (57.185)	Top-5 acc 77.734 (79.170)	lr 0.01626
Train [49][1050/3239]	Time 0.244 (0.540)	Data Time 0.001 (0.037)	Loss 2.6298 (2.7724)	Entropy 0.63777 (0.63995)	Top-1 acc 60.156 (57.193)	Top-5 acc 82.031 (79.171)	lr 0.01626
Train [49][1060/3239]	Time 0.337 (0.539)	Data Time 0.001 (0.036)	Loss 2.7427 (2.7728)	Entropy 0.63772 (0.63993)	Top-1 acc 57.422 (57.182)	Top-5 acc 79.297 (79.161)	lr 0.01626
Train [49][1070/3239]	Time 0.248 (0.538)	Data Time 0.002 (0.036)	Loss 2.7059 (2.7724)	Entropy 0.63757 (0.63990)	Top-1 acc 55.469 (57.181)	Top-5 acc 79.688 (79.167)	lr 0.01626
Train [49][1080/3239]	Time 0.350 (0.537)	Data Time 0.001 (0.036)	Loss 2.6151 (2.7724)	Entropy 0.63678 (0.63988)	Top-1 acc 61.328 (57.178)	Top-5 acc 82.422 (79.172)	lr 0.01626
Train [49][1090/3239]	Time 0.230 (0.536)	Data Time 0.001 (0.035)	Loss 2.9201 (2.7724)	Entropy 0.63692 (0.63985)	Top-1 acc 54.297 (57.182)	Top-5 acc 78.516 (79.173)	lr 0.01626
Train [49][1100/3239]	Time 0.228 (0.535)	Data Time 0.001 (0.035)	Loss 2.6652 (2.7721)	Entropy 0.63711 (0.63983)	Top-1 acc 59.375 (57.181)	Top-5 acc 81.641 (79.182)	lr 0.01626
Train [49][1110/3239]	Time 0.242 (0.534)	Data Time 0.001 (0.035)	Loss 2.9342 (2.7728)	Entropy 0.63720 (0.63980)	Top-1 acc 51.562 (57.171)	Top-5 acc 77.344 (79.165)	lr 0.01626
Train [49][1120/3239]	Time 0.256 (0.533)	Data Time 0.001 (0.034)	Loss 2.7754 (2.7727)	Entropy 0.63742 (0.63978)	Top-1 acc 56.250 (57.166)	Top-5 acc 79.297 (79.171)	lr 0.01625
Train [49][1130/3239]	Time 0.325 (0.533)	Data Time 0.001 (0.034)	Loss 2.6279 (2.7727)	Entropy 0.63721 (0.63976)	Top-1 acc 61.719 (57.166)	Top-5 acc 82.812 (79.164)	lr 0.01625
Train [49][1140/3239]	Time 0.244 (0.532)	Data Time 0.001 (0.034)	Loss 2.8127 (2.7731)	Entropy 0.63726 (0.63974)	Top-1 acc 57.031 (57.164)	Top-5 acc 78.906 (79.154)	lr 0.01625
Train [49][1150/3239]	Time 0.351 (0.531)	Data Time 0.001 (0.033)	Loss 2.8789 (2.7736)	Entropy 0.63732 (0.63972)	Top-1 acc 53.906 (57.150)	Top-5 acc 76.562 (79.152)	lr 0.01625
Train [49][1160/3239]	Time 0.241 (0.531)	Data Time 0.001 (0.033)	Loss 2.9807 (2.7742)	Entropy 0.63733 (0.63969)	Top-1 acc 51.562 (57.138)	Top-5 acc 71.875 (79.139)	lr 0.01625
Train [49][1170/3239]	Time 0.249 (0.530)	Data Time 0.001 (0.033)	Loss 2.9649 (2.7745)	Entropy 0.63696 (0.63967)	Top-1 acc 56.250 (57.122)	Top-5 acc 74.219 (79.130)	lr 0.01625
Train [49][1180/3239]	Time 0.254 (0.529)	Data Time 0.001 (0.033)	Loss 2.7646 (2.7747)	Entropy 0.63711 (0.63965)	Top-1 acc 57.031 (57.122)	Top-5 acc 79.688 (79.129)	lr 0.01625
Train [49][1190/3239]	Time 0.248 (0.531)	Data Time 0.001 (0.035)	Loss 2.9543 (2.7744)	Entropy 0.63706 (0.63963)	Top-1 acc 54.688 (57.126)	Top-5 acc 75.000 (79.136)	lr 0.01625
Train [49][1200/3239]	Time 0.284 (0.531)	Data Time 0.001 (0.035)	Loss 2.7611 (2.7736)	Entropy 0.63724 (0.63961)	Top-1 acc 59.375 (57.146)	Top-5 acc 78.516 (79.151)	lr 0.01625
Train [49][1210/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.035)	Loss 2.7170 (2.7733)	Entropy 0.63697 (0.63959)	Top-1 acc 57.422 (57.156)	Top-5 acc 83.203 (79.163)	lr 0.01625
Train [49][1220/3239]	Time 4.747 (0.533)	Data Time 4.447 (0.038)	Loss 2.6901 (2.7735)	Entropy 0.63699 (0.63957)	Top-1 acc 58.984 (57.153)	Top-5 acc 82.422 (79.155)	lr 0.01625
Train [49][1230/3239]	Time 0.251 (0.532)	Data Time 0.001 (0.038)	Loss 2.7027 (2.7734)	Entropy 0.63683 (0.63955)	Top-1 acc 58.984 (57.162)	Top-5 acc 78.125 (79.154)	lr 0.01624
Train [49][1240/3239]	Time 0.438 (0.532)	Data Time 0.003 (0.037)	Loss 2.5964 (2.7738)	Entropy 0.63670 (0.63952)	Top-1 acc 56.641 (57.153)	Top-5 acc 83.594 (79.145)	lr 0.01624
Train [49][1250/3239]	Time 0.221 (0.531)	Data Time 0.001 (0.037)	Loss 2.6518 (2.7738)	Entropy 0.63645 (0.63950)	Top-1 acc 60.547 (57.156)	Top-5 acc 82.031 (79.145)	lr 0.01624
Train [49][1260/3239]	Time 0.243 (0.532)	Data Time 0.001 (0.039)	Loss 2.7456 (2.7738)	Entropy 0.63686 (0.63948)	Top-1 acc 61.328 (57.159)	Top-5 acc 79.688 (79.144)	lr 0.01624
Train [49][1270/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.039)	Loss 2.9683 (2.7740)	Entropy 0.63668 (0.63946)	Top-1 acc 50.781 (57.163)	Top-5 acc 74.609 (79.143)	lr 0.01624
Train [49][1280/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.039)	Loss 3.1083 (2.7741)	Entropy 0.63683 (0.63944)	Top-1 acc 50.391 (57.149)	Top-5 acc 73.438 (79.147)	lr 0.01624
Train [49][1290/3239]	Time 0.235 (0.533)	Data Time 0.001 (0.041)	Loss 2.8635 (2.7745)	Entropy 0.63739 (0.63942)	Top-1 acc 55.469 (57.147)	Top-5 acc 75.000 (79.135)	lr 0.01624
Train [49][1300/3239]	Time 0.242 (0.535)	Data Time 0.001 (0.043)	Loss 2.7888 (2.7749)	Entropy 0.63733 (0.63940)	Top-1 acc 56.641 (57.140)	Top-5 acc 78.516 (79.121)	lr 0.01624
Train [49][1310/3239]	Time 0.341 (0.534)	Data Time 0.001 (0.043)	Loss 2.6716 (2.7749)	Entropy 0.63750 (0.63939)	Top-1 acc 58.594 (57.141)	Top-5 acc 81.641 (79.126)	lr 0.01624
Train [49][1320/3239]	Time 0.249 (0.533)	Data Time 0.001 (0.043)	Loss 2.7316 (2.7753)	Entropy 0.63744 (0.63937)	Top-1 acc 56.641 (57.129)	Top-5 acc 78.906 (79.117)	lr 0.01624
Train [49][1330/3239]	Time 5.055 (0.537)	Data Time 4.797 (0.047)	Loss 2.9199 (2.7758)	Entropy 0.63738 (0.63936)	Top-1 acc 50.391 (57.111)	Top-5 acc 76.562 (79.103)	lr 0.01623
Train [49][1340/3239]	Time 0.248 (0.536)	Data Time 0.002 (0.046)	Loss 2.8528 (2.7761)	Entropy 0.63763 (0.63934)	Top-1 acc 56.250 (57.111)	Top-5 acc 80.469 (79.103)	lr 0.01623
Train [49][1350/3239]	Time 0.282 (0.535)	Data Time 0.002 (0.046)	Loss 2.7749 (2.7757)	Entropy 0.63759 (0.63933)	Top-1 acc 55.469 (57.120)	Top-5 acc 81.641 (79.103)	lr 0.01623
Train [49][1360/3239]	Time 0.251 (0.536)	Data Time 0.001 (0.047)	Loss 2.7370 (2.7758)	Entropy 0.63753 (0.63932)	Top-1 acc 59.375 (57.117)	Top-5 acc 79.688 (79.101)	lr 0.01623
Train [49][1370/3239]	Time 0.236 (0.536)	Data Time 0.002 (0.048)	Loss 2.7493 (2.7762)	Entropy 0.63726 (0.63930)	Top-1 acc 58.594 (57.108)	Top-5 acc 78.125 (79.092)	lr 0.01623
Train [49][1380/3239]	Time 0.268 (0.536)	Data Time 0.001 (0.047)	Loss 2.8572 (2.7762)	Entropy 0.63737 (0.63929)	Top-1 acc 60.547 (57.108)	Top-5 acc 76.953 (79.089)	lr 0.01623
Train [49][1390/3239]	Time 0.253 (0.536)	Data Time 0.001 (0.048)	Loss 2.7300 (2.7760)	Entropy 0.63757 (0.63928)	Top-1 acc 57.031 (57.111)	Top-5 acc 79.688 (79.094)	lr 0.01623
Train [49][1400/3239]	Time 0.348 (0.541)	Data Time 0.001 (0.053)	Loss 2.7491 (2.7761)	Entropy 0.63775 (0.63927)	Top-1 acc 59.375 (57.108)	Top-5 acc 77.344 (79.097)	lr 0.01623
Train [49][1410/3239]	Time 0.278 (0.540)	Data Time 0.001 (0.053)	Loss 2.8808 (2.7759)	Entropy 0.63747 (0.63925)	Top-1 acc 53.906 (57.109)	Top-5 acc 79.297 (79.103)	lr 0.01623
Train [49][1420/3239]	Time 0.253 (0.539)	Data Time 0.001 (0.053)	Loss 2.7701 (2.7758)	Entropy 0.63727 (0.63924)	Top-1 acc 57.422 (57.103)	Top-5 acc 79.297 (79.109)	lr 0.01623
Train [49][1430/3239]	Time 0.239 (0.542)	Data Time 0.001 (0.056)	Loss 2.8966 (2.7758)	Entropy 0.63682 (0.63922)	Top-1 acc 53.125 (57.101)	Top-5 acc 77.734 (79.112)	lr 0.01623
Train [49][1440/3239]	Time 0.257 (0.542)	Data Time 0.002 (0.056)	Loss 2.8444 (2.7758)	Entropy 0.63689 (0.63921)	Top-1 acc 57.422 (57.104)	Top-5 acc 76.562 (79.108)	lr 0.01622
Train [49][1450/3239]	Time 0.223 (0.541)	Data Time 0.001 (0.055)	Loss 2.6126 (2.7753)	Entropy 0.63675 (0.63919)	Top-1 acc 59.375 (57.115)	Top-5 acc 80.078 (79.117)	lr 0.01622
Train [49][1460/3239]	Time 0.259 (0.546)	Data Time 0.001 (0.061)	Loss 2.7067 (2.7750)	Entropy 0.63664 (0.63917)	Top-1 acc 62.109 (57.121)	Top-5 acc 82.031 (79.123)	lr 0.01622
Train [49][1470/3239]	Time 0.392 (0.545)	Data Time 0.002 (0.060)	Loss 2.7891 (2.7748)	Entropy 0.63659 (0.63916)	Top-1 acc 57.031 (57.122)	Top-5 acc 77.734 (79.125)	lr 0.01622
Train [49][1480/3239]	Time 0.230 (0.545)	Data Time 0.001 (0.061)	Loss 2.6732 (2.7747)	Entropy 0.63654 (0.63914)	Top-1 acc 59.375 (57.120)	Top-5 acc 81.250 (79.130)	lr 0.01622
Train [49][1490/3239]	Time 4.263 (0.547)	Data Time 4.018 (0.063)	Loss 2.6824 (2.7746)	Entropy 0.63696 (0.63912)	Top-1 acc 58.594 (57.116)	Top-5 acc 78.516 (79.129)	lr 0.01622
Train [49][1500/3239]	Time 0.238 (0.546)	Data Time 0.001 (0.063)	Loss 2.8216 (2.7744)	Entropy 0.63744 (0.63911)	Top-1 acc 57.812 (57.121)	Top-5 acc 78.906 (79.134)	lr 0.01622
Train [49][1510/3239]	Time 0.236 (0.548)	Data Time 0.001 (0.064)	Loss 3.0187 (2.7745)	Entropy 0.63727 (0.63910)	Top-1 acc 51.953 (57.117)	Top-5 acc 77.734 (79.138)	lr 0.01622
Train [49][1520/3239]	Time 0.232 (0.547)	Data Time 0.001 (0.064)	Loss 2.7723 (2.7745)	Entropy 0.63711 (0.63909)	Top-1 acc 58.594 (57.116)	Top-5 acc 78.125 (79.136)	lr 0.01622
Train [49][1530/3239]	Time 0.238 (0.548)	Data Time 0.001 (0.066)	Loss 2.9295 (2.7748)	Entropy 0.63730 (0.63907)	Top-1 acc 46.484 (57.111)	Top-5 acc 76.172 (79.137)	lr 0.01622
Train [49][1540/3239]	Time 0.276 (0.550)	Data Time 0.001 (0.068)	Loss 2.6335 (2.7747)	Entropy 0.63742 (0.63906)	Top-1 acc 57.422 (57.111)	Top-5 acc 79.297 (79.132)	lr 0.01621
Train [49][1550/3239]	Time 0.249 (0.550)	Data Time 0.001 (0.068)	Loss 2.8200 (2.7749)	Entropy 0.63733 (0.63905)	Top-1 acc 55.469 (57.106)	Top-5 acc 77.734 (79.127)	lr 0.01621
Train [49][1560/3239]	Time 0.241 (0.551)	Data Time 0.001 (0.069)	Loss 2.6075 (2.7747)	Entropy 0.63706 (0.63904)	Top-1 acc 57.812 (57.100)	Top-5 acc 82.422 (79.129)	lr 0.01621
Train [49][1570/3239]	Time 1.508 (0.554)	Data Time 1.267 (0.073)	Loss 2.7326 (2.7748)	Entropy 0.63728 (0.63903)	Top-1 acc 61.719 (57.106)	Top-5 acc 78.516 (79.125)	lr 0.01621
Train [49][1580/3239]	Time 0.244 (0.553)	Data Time 0.001 (0.072)	Loss 2.8162 (2.7748)	Entropy 0.63753 (0.63901)	Top-1 acc 57.422 (57.101)	Top-5 acc 77.734 (79.125)	lr 0.01621
Train [49][1590/3239]	Time 0.257 (0.555)	Data Time 0.001 (0.075)	Loss 2.7033 (2.7745)	Entropy 0.63757 (0.63901)	Top-1 acc 57.812 (57.110)	Top-5 acc 79.688 (79.129)	lr 0.01621
Train [49][1600/3239]	Time 0.232 (0.555)	Data Time 0.001 (0.074)	Loss 2.7439 (2.7747)	Entropy 0.63770 (0.63900)	Top-1 acc 53.906 (57.104)	Top-5 acc 78.516 (79.124)	lr 0.01621
Train [49][1610/3239]	Time 0.231 (0.557)	Data Time 0.001 (0.078)	Loss 2.8481 (2.7748)	Entropy 0.63817 (0.63899)	Top-1 acc 56.641 (57.103)	Top-5 acc 77.734 (79.126)	lr 0.01621
Train [49][1620/3239]	Time 0.240 (0.558)	Data Time 0.001 (0.079)	Loss 3.0442 (2.7753)	Entropy 0.63811 (0.63898)	Top-1 acc 55.469 (57.102)	Top-5 acc 72.266 (79.115)	lr 0.01621
Train [49][1630/3239]	Time 0.364 (0.557)	Data Time 0.002 (0.078)	Loss 2.7570 (2.7753)	Entropy 0.63824 (0.63898)	Top-1 acc 57.422 (57.103)	Top-5 acc 80.859 (79.118)	lr 0.01621
Train [49][1640/3239]	Time 0.229 (0.562)	Data Time 0.001 (0.084)	Loss 2.6927 (2.7756)	Entropy 0.63805 (0.63897)	Top-1 acc 56.250 (57.095)	Top-5 acc 80.859 (79.115)	lr 0.01620
Train [49][1650/3239]	Time 0.379 (0.582)	Data Time 0.006 (0.084)	Loss 2.7811 (2.7754)	Entropy 0.63798 (0.63897)	Top-1 acc 56.250 (57.100)	Top-5 acc 79.688 (79.121)	lr 0.01620
Train [49][1660/3239]	Time 0.234 (0.581)	Data Time 0.002 (0.083)	Loss 2.7427 (2.7752)	Entropy 0.63826 (0.63896)	Top-1 acc 58.984 (57.106)	Top-5 acc 77.734 (79.128)	lr 0.01620
Train [49][1670/3239]	Time 0.243 (0.580)	Data Time 0.001 (0.083)	Loss 2.5679 (2.7748)	Entropy 0.63795 (0.63896)	Top-1 acc 61.328 (57.117)	Top-5 acc 83.203 (79.138)	lr 0.01620
Train [49][1680/3239]	Time 0.246 (0.579)	Data Time 0.001 (0.082)	Loss 3.0200 (2.7746)	Entropy 0.63817 (0.63895)	Top-1 acc 52.344 (57.127)	Top-5 acc 73.047 (79.141)	lr 0.01620
Train [49][1690/3239]	Time 0.231 (0.578)	Data Time 0.001 (0.082)	Loss 2.9483 (2.7749)	Entropy 0.63826 (0.63895)	Top-1 acc 53.516 (57.123)	Top-5 acc 73.438 (79.135)	lr 0.01620
Train [49][1700/3239]	Time 0.258 (0.577)	Data Time 0.002 (0.081)	Loss 2.8378 (2.7750)	Entropy 0.63822 (0.63894)	Top-1 acc 55.078 (57.122)	Top-5 acc 80.078 (79.134)	lr 0.01620
Train [49][1710/3239]	Time 0.237 (0.577)	Data Time 0.001 (0.081)	Loss 2.7918 (2.7754)	Entropy 0.63830 (0.63894)	Top-1 acc 53.516 (57.109)	Top-5 acc 78.516 (79.123)	lr 0.01620
Train [49][1720/3239]	Time 0.294 (0.576)	Data Time 0.001 (0.080)	Loss 2.7656 (2.7760)	Entropy 0.63812 (0.63893)	Top-1 acc 55.469 (57.094)	Top-5 acc 78.906 (79.104)	lr 0.01620
Train [49][1730/3239]	Time 0.241 (0.575)	Data Time 0.001 (0.080)	Loss 2.8077 (2.7757)	Entropy 0.63824 (0.63893)	Top-1 acc 56.250 (57.092)	Top-5 acc 74.219 (79.102)	lr 0.01620
Train [49][1740/3239]	Time 0.233 (0.575)	Data Time 0.001 (0.081)	Loss 3.1037 (2.7757)	Entropy 0.63826 (0.63893)	Top-1 acc 47.266 (57.093)	Top-5 acc 75.391 (79.109)	lr 0.01620
Train [49][1750/3239]	Time 0.239 (0.579)	Data Time 0.001 (0.085)	Loss 2.7308 (2.7757)	Entropy 0.63805 (0.63892)	Top-1 acc 56.641 (57.091)	Top-5 acc 79.688 (79.109)	lr 0.01619
Train [49][1760/3239]	Time 0.245 (0.579)	Data Time 0.001 (0.085)	Loss 2.7568 (2.7759)	Entropy 0.63767 (0.63892)	Top-1 acc 56.641 (57.089)	Top-5 acc 77.344 (79.103)	lr 0.01619
Train [49][1770/3239]	Time 0.262 (0.580)	Data Time 0.002 (0.086)	Loss 2.8205 (2.7761)	Entropy 0.63765 (0.63891)	Top-1 acc 58.594 (57.083)	Top-5 acc 79.297 (79.098)	lr 0.01619
Train [49][1780/3239]	Time 0.252 (0.580)	Data Time 0.002 (0.087)	Loss 2.5767 (2.7762)	Entropy 0.63767 (0.63890)	Top-1 acc 64.062 (57.089)	Top-5 acc 85.547 (79.094)	lr 0.01619
Train [49][1790/3239]	Time 0.383 (0.585)	Data Time 0.001 (0.093)	Loss 2.7450 (2.7761)	Entropy 0.63756 (0.63889)	Top-1 acc 58.594 (57.097)	Top-5 acc 82.422 (79.098)	lr 0.01619
Train [49][1800/3239]	Time 0.281 (0.585)	Data Time 0.002 (0.093)	Loss 2.7567 (2.7762)	Entropy 0.63770 (0.63889)	Top-1 acc 58.984 (57.093)	Top-5 acc 78.125 (79.095)	lr 0.01619
Train [49][1810/3239]	Time 2.462 (0.585)	Data Time 2.202 (0.094)	Loss 2.7233 (2.7765)	Entropy 0.63783 (0.63888)	Top-1 acc 56.641 (57.087)	Top-5 acc 79.688 (79.088)	lr 0.01619
Train [49][1820/3239]	Time 0.259 (0.587)	Data Time 0.002 (0.095)	Loss 2.7064 (2.7768)	Entropy 0.63799 (0.63888)	Top-1 acc 56.641 (57.076)	Top-5 acc 82.422 (79.084)	lr 0.01619
Train [49][1830/3239]	Time 0.247 (0.590)	Data Time 0.001 (0.099)	Loss 2.6923 (2.7768)	Entropy 0.63812 (0.63887)	Top-1 acc 57.812 (57.079)	Top-5 acc 79.688 (79.081)	lr 0.01619
Train [49][1840/3239]	Time 0.239 (0.589)	Data Time 0.001 (0.099)	Loss 2.9876 (2.7771)	Entropy 0.63785 (0.63887)	Top-1 acc 50.000 (57.072)	Top-5 acc 73.438 (79.075)	lr 0.01619
Train [49][1850/3239]	Time 0.268 (0.591)	Data Time 0.001 (0.101)	Loss 2.6938 (2.7769)	Entropy 0.63791 (0.63886)	Top-1 acc 60.547 (57.081)	Top-5 acc 78.906 (79.073)	lr 0.01618
Train [49][1860/3239]	Time 0.355 (0.596)	Data Time 0.001 (0.106)	Loss 2.7805 (2.7773)	Entropy 0.63780 (0.63886)	Top-1 acc 55.469 (57.066)	Top-5 acc 79.297 (79.065)	lr 0.01618
Train [49][1870/3239]	Time 0.238 (0.595)	Data Time 0.001 (0.106)	Loss 3.0767 (2.7774)	Entropy 0.63737 (0.63885)	Top-1 acc 49.609 (57.063)	Top-5 acc 74.219 (79.065)	lr 0.01618
Train [49][1880/3239]	Time 0.251 (0.597)	Data Time 0.001 (0.108)	Loss 2.7587 (2.7770)	Entropy 0.63768 (0.63884)	Top-1 acc 59.375 (57.075)	Top-5 acc 79.688 (79.072)	lr 0.01618
Train [49][1890/3239]	Time 0.264 (0.600)	Data Time 0.001 (0.111)	Loss 2.9737 (2.7770)	Entropy 0.63776 (0.63884)	Top-1 acc 51.953 (57.079)	Top-5 acc 76.562 (79.076)	lr 0.01618
Train [49][1900/3239]	Time 0.229 (0.599)	Data Time 0.001 (0.110)	Loss 2.9536 (2.7770)	Entropy 0.63808 (0.63883)	Top-1 acc 51.172 (57.076)	Top-5 acc 75.391 (79.077)	lr 0.01618
Train [49][1910/3239]	Time 0.232 (0.603)	Data Time 0.001 (0.115)	Loss 3.0974 (2.7770)	Entropy 0.63802 (0.63883)	Top-1 acc 50.391 (57.072)	Top-5 acc 69.922 (79.072)	lr 0.01618
Train [49][1920/3239]	Time 0.244 (0.604)	Data Time 0.001 (0.117)	Loss 2.7938 (2.7771)	Entropy 0.63821 (0.63882)	Top-1 acc 55.078 (57.068)	Top-5 acc 78.516 (79.066)	lr 0.01618
Train [49][1930/3239]	Time 0.238 (0.603)	Data Time 0.001 (0.116)	Loss 2.7561 (2.7769)	Entropy 0.63816 (0.63882)	Top-1 acc 58.984 (57.074)	Top-5 acc 78.125 (79.071)	lr 0.01618
Train [49][1940/3239]	Time 0.237 (0.606)	Data Time 0.001 (0.119)	Loss 2.7439 (2.7772)	Entropy 0.63814 (0.63882)	Top-1 acc 58.594 (57.067)	Top-5 acc 78.906 (79.069)	lr 0.01618
Train [49][1950/3239]	Time 0.351 (0.608)	Data Time 0.001 (0.121)	Loss 2.6425 (2.7772)	Entropy 0.63767 (0.63881)	Top-1 acc 57.422 (57.070)	Top-5 acc 82.422 (79.071)	lr 0.01617
Train [49][1960/3239]	Time 0.262 (0.608)	Data Time 0.001 (0.122)	Loss 2.7864 (2.7773)	Entropy 0.63805 (0.63881)	Top-1 acc 58.594 (57.068)	Top-5 acc 77.344 (79.068)	lr 0.01617
Train [49][1970/3239]	Time 8.324 (0.611)	Data Time 8.079 (0.126)	Loss 2.8116 (2.7774)	Entropy 0.63842 (0.63880)	Top-1 acc 56.641 (57.063)	Top-5 acc 74.609 (79.067)	lr 0.01617
Train [49][1980/3239]	Time 0.251 (0.613)	Data Time 0.001 (0.127)	Loss 2.8057 (2.7777)	Entropy 0.63812 (0.63880)	Top-1 acc 58.984 (57.058)	Top-5 acc 78.906 (79.064)	lr 0.01617
Train [49][1990/3239]	Time 0.232 (0.614)	Data Time 0.001 (0.129)	Loss 2.7685 (2.7777)	Entropy 0.63829 (0.63880)	Top-1 acc 53.906 (57.061)	Top-5 acc 78.516 (79.062)	lr 0.01617
Train [49][2000/3239]	Time 0.252 (0.613)	Data Time 0.001 (0.128)	Loss 2.7112 (2.7775)	Entropy 0.63808 (0.63880)	Top-1 acc 58.594 (57.067)	Top-5 acc 81.641 (79.064)	lr 0.01617
Train [49][2010/3239]	Time 0.234 (0.617)	Data Time 0.001 (0.132)	Loss 3.0325 (2.7776)	Entropy 0.63811 (0.63879)	Top-1 acc 49.609 (57.063)	Top-5 acc 75.391 (79.060)	lr 0.01617
Train [49][2020/3239]	Time 0.827 (0.619)	Data Time 0.469 (0.135)	Loss 2.9570 (2.7774)	Entropy 0.63843 (0.63879)	Top-1 acc 50.391 (57.068)	Top-5 acc 73.828 (79.064)	lr 0.01617
Train [49][2030/3239]	Time 0.239 (0.618)	Data Time 0.001 (0.134)	Loss 2.6907 (2.7773)	Entropy 0.63874 (0.63879)	Top-1 acc 59.766 (57.070)	Top-5 acc 79.297 (79.067)	lr 0.01617
Train [49][2040/3239]	Time 0.264 (0.623)	Data Time 0.001 (0.140)	Loss 2.8769 (2.7775)	Entropy 0.63868 (0.63879)	Top-1 acc 55.859 (57.061)	Top-5 acc 78.906 (79.062)	lr 0.01617
Train [49][2050/3239]	Time 0.229 (0.623)	Data Time 0.001 (0.140)	Loss 2.7029 (2.7774)	Entropy 0.63872 (0.63879)	Top-1 acc 58.984 (57.064)	Top-5 acc 80.078 (79.062)	lr 0.01617
Train [49][2060/3239]	Time 0.232 (0.624)	Data Time 0.001 (0.141)	Loss 2.9039 (2.7775)	Entropy 0.63906 (0.63879)	Top-1 acc 53.125 (57.064)	Top-5 acc 78.516 (79.060)	lr 0.01616
Train [49][2070/3239]	Time 0.236 (0.628)	Data Time 0.001 (0.146)	Loss 2.8245 (2.7775)	Entropy 0.63881 (0.63879)	Top-1 acc 56.641 (57.065)	Top-5 acc 78.906 (79.060)	lr 0.01616
Train [49][2080/3239]	Time 0.317 (0.628)	Data Time 0.001 (0.146)	Loss 2.8782 (2.7774)	Entropy 0.63873 (0.63879)	Top-1 acc 57.812 (57.068)	Top-5 acc 76.562 (79.062)	lr 0.01616
Train [49][2090/3239]	Time 0.250 (0.630)	Data Time 0.001 (0.148)	Loss 2.8822 (2.7774)	Entropy 0.63874 (0.63879)	Top-1 acc 55.859 (57.069)	Top-5 acc 82.812 (79.065)	lr 0.01616
Train [49][2100/3239]	Time 0.254 (0.629)	Data Time 0.002 (0.148)	Loss 2.5922 (2.7773)	Entropy 0.63856 (0.63879)	Top-1 acc 58.203 (57.069)	Top-5 acc 80.078 (79.068)	lr 0.01616
Train [49][2110/3239]	Time 0.253 (0.633)	Data Time 0.001 (0.151)	Loss 2.5978 (2.7772)	Entropy 0.63849 (0.63879)	Top-1 acc 58.594 (57.070)	Top-5 acc 81.641 (79.070)	lr 0.01616
Train [49][2120/3239]	Time 0.234 (0.634)	Data Time 0.001 (0.153)	Loss 2.6382 (2.7770)	Entropy 0.63849 (0.63879)	Top-1 acc 58.594 (57.069)	Top-5 acc 80.469 (79.071)	lr 0.01616
Train [49][2130/3239]	Time 3.576 (0.635)	Data Time 3.339 (0.154)	Loss 2.8409 (2.7771)	Entropy 0.63868 (0.63878)	Top-1 acc 54.688 (57.068)	Top-5 acc 77.344 (79.069)	lr 0.01616
Train [49][2140/3239]	Time 0.238 (0.638)	Data Time 0.001 (0.157)	Loss 2.8303 (2.7772)	Entropy 0.63799 (0.63878)	Top-1 acc 55.859 (57.064)	Top-5 acc 77.734 (79.067)	lr 0.01616
Train [49][2150/3239]	Time 0.231 (0.640)	Data Time 0.001 (0.160)	Loss 2.7930 (2.7772)	Entropy 0.63865 (0.63878)	Top-1 acc 55.859 (57.062)	Top-5 acc 78.516 (79.069)	lr 0.01616
Train [49][2160/3239]	Time 2.048 (0.640)	Data Time 1.810 (0.160)	Loss 2.8622 (2.7772)	Entropy 0.63891 (0.63878)	Top-1 acc 58.594 (57.065)	Top-5 acc 76.953 (79.069)	lr 0.01615
Train [49][2170/3239]	Time 0.239 (0.644)	Data Time 0.001 (0.165)	Loss 2.7102 (2.7773)	Entropy 0.63906 (0.63878)	Top-1 acc 59.375 (57.062)	Top-5 acc 80.078 (79.068)	lr 0.01615
Train [49][2180/3239]	Time 0.463 (0.646)	Data Time 0.132 (0.166)	Loss 2.8462 (2.7776)	Entropy 0.63914 (0.63878)	Top-1 acc 56.250 (57.056)	Top-5 acc 75.781 (79.061)	lr 0.01615
Train [49][2190/3239]	Time 0.228 (0.645)	Data Time 0.001 (0.166)	Loss 2.7179 (2.7777)	Entropy 0.63890 (0.63878)	Top-1 acc 56.250 (57.052)	Top-5 acc 79.688 (79.059)	lr 0.01615
Train [49][2200/3239]	Time 0.235 (0.649)	Data Time 0.001 (0.170)	Loss 2.8702 (2.7780)	Entropy 0.63906 (0.63879)	Top-1 acc 54.297 (57.040)	Top-5 acc 75.781 (79.049)	lr 0.01615
Train [49][2210/3239]	Time 0.251 (0.651)	Data Time 0.001 (0.173)	Loss 3.0614 (2.7778)	Entropy 0.63899 (0.63879)	Top-1 acc 49.609 (57.045)	Top-5 acc 74.219 (79.052)	lr 0.01615
Train [49][2220/3239]	Time 0.430 (0.650)	Data Time 0.179 (0.172)	Loss 2.5372 (2.7780)	Entropy 0.63910 (0.63879)	Top-1 acc 62.500 (57.040)	Top-5 acc 82.422 (79.050)	lr 0.01615
Train [49][2230/3239]	Time 0.231 (0.657)	Data Time 0.001 (0.179)	Loss 2.6777 (2.7779)	Entropy 0.63910 (0.63879)	Top-1 acc 58.984 (57.045)	Top-5 acc 80.469 (79.048)	lr 0.01615
Train [49][2240/3239]	Time 0.229 (0.659)	Data Time 0.001 (0.181)	Loss 2.5858 (2.7780)	Entropy 0.63926 (0.63879)	Top-1 acc 62.109 (57.039)	Top-5 acc 81.250 (79.048)	lr 0.01615
Train [49][2250/3239]	Time 0.329 (0.658)	Data Time 0.001 (0.180)	Loss 2.6795 (2.7777)	Entropy 0.63959 (0.63879)	Top-1 acc 59.375 (57.045)	Top-5 acc 81.250 (79.052)	lr 0.01615
Train [49][2260/3239]	Time 0.226 (0.663)	Data Time 0.001 (0.186)	Loss 2.9768 (2.7777)	Entropy 0.63956 (0.63880)	Top-1 acc 53.516 (57.051)	Top-5 acc 75.781 (79.052)	lr 0.01614
Train [49][2270/3239]	Time 5.625 (0.666)	Data Time 5.386 (0.189)	Loss 2.7462 (2.7776)	Entropy 0.63976 (0.63880)	Top-1 acc 55.078 (57.053)	Top-5 acc 78.125 (79.053)	lr 0.01614
Train [49][2280/3239]	Time 0.242 (0.665)	Data Time 0.001 (0.188)	Loss 2.8193 (2.7774)	Entropy 0.64002 (0.63880)	Top-1 acc 55.859 (57.059)	Top-5 acc 79.688 (79.057)	lr 0.01614
Train [49][2290/3239]	Time 13.585 (0.669)	Data Time 13.350 (0.193)	Loss 2.7463 (2.7775)	Entropy 0.64005 (0.63881)	Top-1 acc 56.641 (57.054)	Top-5 acc 78.906 (79.056)	lr 0.01614
Train [49][2300/3239]	Time 0.230 (0.671)	Data Time 0.001 (0.195)	Loss 2.7119 (2.7777)	Entropy 0.63999 (0.63882)	Top-1 acc 57.031 (57.049)	Top-5 acc 81.641 (79.056)	lr 0.01614
Train [49][2310/3239]	Time 0.327 (0.686)	Data Time 0.027 (0.195)	Loss 2.6691 (2.7776)	Entropy 0.64016 (0.63882)	Top-1 acc 57.031 (57.051)	Top-5 acc 81.641 (79.056)	lr 0.01614
Train [49][2320/3239]	Time 0.273 (0.685)	Data Time 0.002 (0.195)	Loss 2.9499 (2.7777)	Entropy 0.64008 (0.63883)	Top-1 acc 54.297 (57.053)	Top-5 acc 77.734 (79.054)	lr 0.01614
Train [49][2330/3239]	Time 0.248 (0.684)	Data Time 0.002 (0.194)	Loss 2.7359 (2.7777)	Entropy 0.64027 (0.63883)	Top-1 acc 58.203 (57.054)	Top-5 acc 80.469 (79.049)	lr 0.01614
Train [49][2340/3239]	Time 0.332 (0.683)	Data Time 0.001 (0.193)	Loss 2.7636 (2.7778)	Entropy 0.64009 (0.63884)	Top-1 acc 56.641 (57.052)	Top-5 acc 78.125 (79.048)	lr 0.01614
Train [49][2350/3239]	Time 0.275 (0.682)	Data Time 0.001 (0.192)	Loss 3.0834 (2.7779)	Entropy 0.63959 (0.63884)	Top-1 acc 46.484 (57.042)	Top-5 acc 74.219 (79.044)	lr 0.01614
Train [49][2360/3239]	Time 0.236 (0.681)	Data Time 0.001 (0.191)	Loss 3.0126 (2.7780)	Entropy 0.63952 (0.63884)	Top-1 acc 49.609 (57.041)	Top-5 acc 74.609 (79.044)	lr 0.01614
Train [49][2370/3239]	Time 0.249 (0.683)	Data Time 0.002 (0.193)	Loss 2.9211 (2.7777)	Entropy 0.63934 (0.63885)	Top-1 acc 56.250 (57.047)	Top-5 acc 75.391 (79.052)	lr 0.01613
Train [49][2380/3239]	Time 0.231 (0.684)	Data Time 0.001 (0.195)	Loss 2.7383 (2.7775)	Entropy 0.63940 (0.63885)	Top-1 acc 60.156 (57.050)	Top-5 acc 78.516 (79.056)	lr 0.01613
Train [49][2390/3239]	Time 0.239 (0.688)	Data Time 0.001 (0.199)	Loss 2.6153 (2.7775)	Entropy 0.63919 (0.63885)	Top-1 acc 60.547 (57.053)	Top-5 acc 80.469 (79.054)	lr 0.01613
Train [49][2400/3239]	Time 0.260 (0.689)	Data Time 0.001 (0.201)	Loss 2.8106 (2.7776)	Entropy 0.63973 (0.63885)	Top-1 acc 56.250 (57.051)	Top-5 acc 79.688 (79.053)	lr 0.01613
Train [49][2410/3239]	Time 1.578 (0.692)	Data Time 1.327 (0.203)	Loss 2.7069 (2.7777)	Entropy 0.63945 (0.63886)	Top-1 acc 56.641 (57.047)	Top-5 acc 79.688 (79.051)	lr 0.01613
Train [49][2420/3239]	Time 0.240 (0.695)	Data Time 0.001 (0.206)	Loss 2.8313 (2.7778)	Entropy 0.63935 (0.63886)	Top-1 acc 51.562 (57.041)	Top-5 acc 75.391 (79.048)	lr 0.01613
Train [49][2430/3239]	Time 4.962 (0.695)	Data Time 4.715 (0.208)	Loss 2.8446 (2.7777)	Entropy 0.63950 (0.63886)	Top-1 acc 54.688 (57.043)	Top-5 acc 78.125 (79.051)	lr 0.01613
Train [49][2440/3239]	Time 0.241 (0.699)	Data Time 0.002 (0.211)	Loss 3.0140 (2.7776)	Entropy 0.63965 (0.63887)	Top-1 acc 50.000 (57.038)	Top-5 acc 74.609 (79.057)	lr 0.01613
Train [49][2450/3239]	Time 6.829 (0.701)	Data Time 6.570 (0.213)	Loss 2.7114 (2.7776)	Entropy 0.63975 (0.63887)	Top-1 acc 58.984 (57.037)	Top-5 acc 82.031 (79.057)	lr 0.01613
Train [49][2460/3239]	Time 0.224 (0.700)	Data Time 0.001 (0.213)	Loss 2.5727 (2.7774)	Entropy 0.63987 (0.63887)	Top-1 acc 60.547 (57.036)	Top-5 acc 85.156 (79.061)	lr 0.01613
Train [49][2470/3239]	Time 6.901 (0.706)	Data Time 6.655 (0.219)	Loss 2.8677 (2.7773)	Entropy 0.64002 (0.63888)	Top-1 acc 53.906 (57.034)	Top-5 acc 73.828 (79.061)	lr 0.01612
Train [49][2480/3239]	Time 0.241 (0.705)	Data Time 0.001 (0.218)	Loss 2.7132 (2.7777)	Entropy 0.64006 (0.63888)	Top-1 acc 56.641 (57.021)	Top-5 acc 79.297 (79.054)	lr 0.01612
Train [49][2490/3239]	Time 0.234 (0.707)	Data Time 0.001 (0.221)	Loss 2.8575 (2.7778)	Entropy 0.64021 (0.63889)	Top-1 acc 56.641 (57.018)	Top-5 acc 77.734 (79.054)	lr 0.01612
Train [49][2500/3239]	Time 0.380 (0.710)	Data Time 0.001 (0.224)	Loss 2.9295 (2.7778)	Entropy 0.64058 (0.63889)	Top-1 acc 53.125 (57.017)	Top-5 acc 76.562 (79.054)	lr 0.01612
Train [49][2510/3239]	Time 0.229 (0.712)	Data Time 0.001 (0.226)	Loss 2.9020 (2.7779)	Entropy 0.64053 (0.63890)	Top-1 acc 54.297 (57.014)	Top-5 acc 75.000 (79.047)	lr 0.01612
Train [49][2520/3239]	Time 0.239 (0.714)	Data Time 0.001 (0.229)	Loss 2.7246 (2.7780)	Entropy 0.64046 (0.63891)	Top-1 acc 56.250 (57.013)	Top-5 acc 79.297 (79.047)	lr 0.01612
Train [49][2530/3239]	Time 5.867 (0.719)	Data Time 5.625 (0.234)	Loss 2.9231 (2.7780)	Entropy 0.64075 (0.63891)	Top-1 acc 52.734 (57.016)	Top-5 acc 74.609 (79.044)	lr 0.01612
Train [49][2540/3239]	Time 0.228 (0.720)	Data Time 0.001 (0.235)	Loss 2.7350 (2.7780)	Entropy 0.64066 (0.63892)	Top-1 acc 57.812 (57.018)	Top-5 acc 80.078 (79.042)	lr 0.01612
Train [49][2550/3239]	Time 0.253 (0.720)	Data Time 0.001 (0.236)	Loss 2.7506 (2.7780)	Entropy 0.64078 (0.63893)	Top-1 acc 58.984 (57.019)	Top-5 acc 77.344 (79.042)	lr 0.01612
Train [49][2560/3239]	Time 0.262 (0.725)	Data Time 0.001 (0.241)	Loss 2.6251 (2.7778)	Entropy 0.64103 (0.63893)	Top-1 acc 58.594 (57.023)	Top-5 acc 80.469 (79.047)	lr 0.01612
Train [49][2570/3239]	Time 0.331 (0.726)	Data Time 0.001 (0.242)	Loss 2.6147 (2.7776)	Entropy 0.64078 (0.63894)	Top-1 acc 57.812 (57.025)	Top-5 acc 81.641 (79.052)	lr 0.01612
Train [49][2580/3239]	Time 0.228 (0.727)	Data Time 0.001 (0.243)	Loss 2.8694 (2.7775)	Entropy 0.64104 (0.63895)	Top-1 acc 53.516 (57.028)	Top-5 acc 78.906 (79.053)	lr 0.01611
Train [49][2590/3239]	Time 12.583 (0.732)	Data Time 12.343 (0.249)	Loss 2.7992 (2.7774)	Entropy 0.64133 (0.63896)	Top-1 acc 58.203 (57.032)	Top-5 acc 80.078 (79.057)	lr 0.01611
Train [49][2600/3239]	Time 0.231 (0.733)	Data Time 0.001 (0.250)	Loss 2.7944 (2.7774)	Entropy 0.64070 (0.63897)	Top-1 acc 55.078 (57.033)	Top-5 acc 82.031 (79.056)	lr 0.01611
Train [49][2610/3239]	Time 3.134 (0.733)	Data Time 2.882 (0.250)	Loss 2.7037 (2.7773)	Entropy 0.64100 (0.63897)	Top-1 acc 61.719 (57.038)	Top-5 acc 80.859 (79.058)	lr 0.01611
Train [49][2620/3239]	Time 0.239 (0.735)	Data Time 0.001 (0.252)	Loss 2.8612 (2.7775)	Entropy 0.64108 (0.63898)	Top-1 acc 58.984 (57.039)	Top-5 acc 78.906 (79.058)	lr 0.01611
Train [49][2630/3239]	Time 2.293 (0.739)	Data Time 2.015 (0.257)	Loss 2.7506 (2.7776)	Entropy 0.64094 (0.63899)	Top-1 acc 57.031 (57.031)	Top-5 acc 78.125 (79.053)	lr 0.01611
Train [49][2640/3239]	Time 0.245 (0.739)	Data Time 0.001 (0.257)	Loss 2.7301 (2.7776)	Entropy 0.64112 (0.63900)	Top-1 acc 59.375 (57.035)	Top-5 acc 81.641 (79.054)	lr 0.01611
Train [49][2650/3239]	Time 0.246 (0.741)	Data Time 0.001 (0.259)	Loss 2.9050 (2.7776)	Entropy 0.64135 (0.63901)	Top-1 acc 57.031 (57.033)	Top-5 acc 76.562 (79.052)	lr 0.01611
Train [49][2660/3239]	Time 0.330 (0.746)	Data Time 0.001 (0.264)	Loss 2.7546 (2.7776)	Entropy 0.64151 (0.63901)	Top-1 acc 59.766 (57.036)	Top-5 acc 78.906 (79.053)	lr 0.01611
Train [49][2670/3239]	Time 0.236 (0.745)	Data Time 0.001 (0.264)	Loss 2.7454 (2.7777)	Entropy 0.64134 (0.63902)	Top-1 acc 58.984 (57.036)	Top-5 acc 80.859 (79.046)	lr 0.01611
Train [49][2680/3239]	Time 0.225 (0.748)	Data Time 0.001 (0.267)	Loss 2.6145 (2.7776)	Entropy 0.64159 (0.63903)	Top-1 acc 62.109 (57.039)	Top-5 acc 83.984 (79.049)	lr 0.01610
Train [49][2690/3239]	Time 7.480 (0.753)	Data Time 7.193 (0.272)	Loss 2.7514 (2.7775)	Entropy 0.64147 (0.63904)	Top-1 acc 58.594 (57.047)	Top-5 acc 79.688 (79.054)	lr 0.01610
Train [49][2700/3239]	Time 0.232 (0.752)	Data Time 0.001 (0.272)	Loss 2.6123 (2.7775)	Entropy 0.64152 (0.63905)	Top-1 acc 61.719 (57.047)	Top-5 acc 83.203 (79.056)	lr 0.01610
Train [49][2710/3239]	Time 0.235 (0.756)	Data Time 0.001 (0.275)	Loss 2.7099 (2.7775)	Entropy 0.64161 (0.63906)	Top-1 acc 55.859 (57.042)	Top-5 acc 80.469 (79.052)	lr 0.01610
Train [49][2720/3239]	Time 0.232 (0.757)	Data Time 0.001 (0.277)	Loss 3.0787 (2.7776)	Entropy 0.64171 (0.63907)	Top-1 acc 49.609 (57.041)	Top-5 acc 73.047 (79.051)	lr 0.01610
Train [49][2730/3239]	Time 0.393 (0.760)	Data Time 0.001 (0.280)	Loss 2.7339 (2.7775)	Entropy 0.64177 (0.63908)	Top-1 acc 59.766 (57.045)	Top-5 acc 82.031 (79.051)	lr 0.01610
Train [49][2740/3239]	Time 0.233 (0.763)	Data Time 0.001 (0.283)	Loss 2.6715 (2.7774)	Entropy 0.64185 (0.63909)	Top-1 acc 58.594 (57.048)	Top-5 acc 80.078 (79.053)	lr 0.01610
Train [49][2750/3239]	Time 4.204 (0.763)	Data Time 3.922 (0.284)	Loss 2.7243 (2.7774)	Entropy 0.64190 (0.63910)	Top-1 acc 56.641 (57.047)	Top-5 acc 79.297 (79.052)	lr 0.01610
Train [49][2760/3239]	Time 0.228 (0.768)	Data Time 0.001 (0.289)	Loss 2.7424 (2.7775)	Entropy 0.64185 (0.63911)	Top-1 acc 58.984 (57.044)	Top-5 acc 78.906 (79.052)	lr 0.01610
Train [49][2770/3239]	Time 12.476 (0.772)	Data Time 12.218 (0.292)	Loss 2.5747 (2.7772)	Entropy 0.64192 (0.63912)	Top-1 acc 62.500 (57.052)	Top-5 acc 82.812 (79.055)	lr 0.01610
Train [49][2780/3239]	Time 0.276 (0.770)	Data Time 0.001 (0.291)	Loss 2.7829 (2.7772)	Entropy 0.64237 (0.63913)	Top-1 acc 59.375 (57.054)	Top-5 acc 78.906 (79.055)	lr 0.01609
Train [49][2790/3239]	Time 7.849 (0.774)	Data Time 7.603 (0.296)	Loss 2.8234 (2.7771)	Entropy 0.64241 (0.63914)	Top-1 acc 54.688 (57.058)	Top-5 acc 77.734 (79.058)	lr 0.01609
Train [49][2800/3239]	Time 0.246 (0.773)	Data Time 0.001 (0.295)	Loss 2.7021 (2.7772)	Entropy 0.64273 (0.63915)	Top-1 acc 58.984 (57.059)	Top-5 acc 81.641 (79.057)	lr 0.01609
Train [49][2810/3239]	Time 0.236 (0.776)	Data Time 0.001 (0.298)	Loss 2.7326 (2.7773)	Entropy 0.64235 (0.63917)	Top-1 acc 59.375 (57.057)	Top-5 acc 81.250 (79.054)	lr 0.01609
Train [49][2820/3239]	Time 0.264 (0.779)	Data Time 0.001 (0.301)	Loss 2.7555 (2.7774)	Entropy 0.64241 (0.63918)	Top-1 acc 56.641 (57.054)	Top-5 acc 82.031 (79.052)	lr 0.01609
Train [49][2830/3239]	Time 0.231 (0.781)	Data Time 0.001 (0.303)	Loss 2.9938 (2.7776)	Entropy 0.64245 (0.63919)	Top-1 acc 51.172 (57.050)	Top-5 acc 75.000 (79.047)	lr 0.01609
Train [49][2840/3239]	Time 0.230 (0.783)	Data Time 0.001 (0.306)	Loss 2.7867 (2.7777)	Entropy 0.64248 (0.63920)	Top-1 acc 58.203 (57.047)	Top-5 acc 78.516 (79.045)	lr 0.01609
Train [49][2850/3239]	Time 4.534 (0.785)	Data Time 4.279 (0.308)	Loss 2.8989 (2.7778)	Entropy 0.64220 (0.63921)	Top-1 acc 55.078 (57.044)	Top-5 acc 75.781 (79.042)	lr 0.01609
Train [49][2860/3239]	Time 0.231 (0.785)	Data Time 0.001 (0.308)	Loss 2.7309 (2.7780)	Entropy 0.64211 (0.63922)	Top-1 acc 57.422 (57.038)	Top-5 acc 79.297 (79.036)	lr 0.01609
Train [49][2870/3239]	Time 0.231 (0.789)	Data Time 0.001 (0.312)	Loss 2.8145 (2.7781)	Entropy 0.64226 (0.63923)	Top-1 acc 57.812 (57.033)	Top-5 acc 76.562 (79.037)	lr 0.01609
Train [49][2880/3239]	Time 0.228 (0.788)	Data Time 0.001 (0.311)	Loss 3.0178 (2.7780)	Entropy 0.64242 (0.63924)	Top-1 acc 50.391 (57.031)	Top-5 acc 72.266 (79.035)	lr 0.01609
Train [49][2890/3239]	Time 0.323 (0.790)	Data Time 0.001 (0.314)	Loss 2.8999 (2.7780)	Entropy 0.64269 (0.63925)	Top-1 acc 53.516 (57.035)	Top-5 acc 75.391 (79.034)	lr 0.01608
Train [49][2900/3239]	Time 0.251 (0.794)	Data Time 0.001 (0.318)	Loss 2.6439 (2.7779)	Entropy 0.64265 (0.63927)	Top-1 acc 59.766 (57.042)	Top-5 acc 80.859 (79.034)	lr 0.01608
Train [49][2910/3239]	Time 0.368 (0.793)	Data Time 0.146 (0.317)	Loss 2.8978 (2.7780)	Entropy 0.64254 (0.63928)	Top-1 acc 57.031 (57.041)	Top-5 acc 79.297 (79.037)	lr 0.01608
Train [49][2920/3239]	Time 0.216 (0.796)	Data Time 0.001 (0.320)	Loss 2.8790 (2.7780)	Entropy 0.64275 (0.63929)	Top-1 acc 56.641 (57.044)	Top-5 acc 77.734 (79.036)	lr 0.01608
Train [49][2930/3239]	Time 12.675 (0.799)	Data Time 12.413 (0.323)	Loss 2.9088 (2.7780)	Entropy 0.64289 (0.63930)	Top-1 acc 58.203 (57.046)	Top-5 acc 76.953 (79.036)	lr 0.01608
Train [49][2940/3239]	Time 0.229 (0.798)	Data Time 0.001 (0.322)	Loss 2.9269 (2.7781)	Entropy 0.64287 (0.63931)	Top-1 acc 51.562 (57.041)	Top-5 acc 75.000 (79.034)	lr 0.01608
Train [49][2950/3239]	Time 7.375 (0.800)	Data Time 7.149 (0.325)	Loss 3.0550 (2.7782)	Entropy 0.64288 (0.63932)	Top-1 acc 50.781 (57.038)	Top-5 acc 72.266 (79.029)	lr 0.01608
Train [49][2960/3239]	Time 0.393 (0.811)	Data Time 0.007 (0.325)	Loss 2.8106 (2.7784)	Entropy 0.64278 (0.63934)	Top-1 acc 57.031 (57.033)	Top-5 acc 76.172 (79.025)	lr 0.01608
Train [49][2970/3239]	Time 0.236 (0.810)	Data Time 0.002 (0.323)	Loss 2.6630 (2.7784)	Entropy 0.64298 (0.63935)	Top-1 acc 60.938 (57.033)	Top-5 acc 82.422 (79.026)	lr 0.01608
Train [49][2980/3239]	Time 0.316 (0.808)	Data Time 0.002 (0.322)	Loss 3.2638 (2.7785)	Entropy 0.64303 (0.63936)	Top-1 acc 47.266 (57.034)	Top-5 acc 67.969 (79.025)	lr 0.01608
Train [49][2990/3239]	Time 0.237 (0.807)	Data Time 0.001 (0.321)	Loss 2.9555 (2.7785)	Entropy 0.64277 (0.63937)	Top-1 acc 52.344 (57.031)	Top-5 acc 75.000 (79.023)	lr 0.01607
Train [49][3000/3239]	Time 0.232 (0.808)	Data Time 0.001 (0.322)	Loss 2.6104 (2.7785)	Entropy 0.64226 (0.63938)	Top-1 acc 60.156 (57.030)	Top-5 acc 83.203 (79.026)	lr 0.01607
Train [49][3010/3239]	Time 5.550 (0.808)	Data Time 5.252 (0.323)	Loss 2.8125 (2.7786)	Entropy 0.64223 (0.63939)	Top-1 acc 56.250 (57.024)	Top-5 acc 79.688 (79.021)	lr 0.01607
Train [49][3020/3239]	Time 0.255 (0.809)	Data Time 0.001 (0.324)	Loss 2.6900 (2.7785)	Entropy 0.64196 (0.63940)	Top-1 acc 59.766 (57.027)	Top-5 acc 80.859 (79.026)	lr 0.01607
Train [49][3030/3239]	Time 0.237 (0.811)	Data Time 0.001 (0.326)	Loss 2.8150 (2.7784)	Entropy 0.64185 (0.63941)	Top-1 acc 53.516 (57.026)	Top-5 acc 77.734 (79.029)	lr 0.01607
Train [49][3040/3239]	Time 0.236 (0.812)	Data Time 0.001 (0.327)	Loss 2.9973 (2.7784)	Entropy 0.64179 (0.63942)	Top-1 acc 50.781 (57.025)	Top-5 acc 75.000 (79.027)	lr 0.01607
Train [49][3050/3239]	Time 0.348 (0.814)	Data Time 0.001 (0.330)	Loss 2.6191 (2.7784)	Entropy 0.64164 (0.63943)	Top-1 acc 60.938 (57.027)	Top-5 acc 80.469 (79.027)	lr 0.01607
Train [49][3060/3239]	Time 0.234 (0.816)	Data Time 0.001 (0.331)	Loss 2.9166 (2.7782)	Entropy 0.64165 (0.63943)	Top-1 acc 52.734 (57.028)	Top-5 acc 76.172 (79.030)	lr 0.01607
Train [49][3070/3239]	Time 0.232 (0.814)	Data Time 0.001 (0.330)	Loss 2.7868 (2.7782)	Entropy 0.64195 (0.63944)	Top-1 acc 58.984 (57.027)	Top-5 acc 77.734 (79.028)	lr 0.01607
Train [49][3080/3239]	Time 0.250 (0.817)	Data Time 0.001 (0.333)	Loss 2.6527 (2.7783)	Entropy 0.64175 (0.63945)	Top-1 acc 57.422 (57.025)	Top-5 acc 81.641 (79.027)	lr 0.01607
Train [49][3090/3239]	Time 3.943 (0.817)	Data Time 3.707 (0.333)	Loss 2.7925 (2.7782)	Entropy 0.64171 (0.63946)	Top-1 acc 58.984 (57.029)	Top-5 acc 78.125 (79.028)	lr 0.01606
Train [49][3100/3239]	Time 0.237 (0.816)	Data Time 0.001 (0.332)	Loss 2.8129 (2.7781)	Entropy 0.64176 (0.63946)	Top-1 acc 57.422 (57.029)	Top-5 acc 79.688 (79.031)	lr 0.01606
Train [49][3110/3239]	Time 3.200 (0.817)	Data Time 2.921 (0.333)	Loss 2.5264 (2.7780)	Entropy 0.64172 (0.63947)	Top-1 acc 63.281 (57.030)	Top-5 acc 81.250 (79.037)	lr 0.01606
Train [49][3120/3239]	Time 0.326 (0.815)	Data Time 0.001 (0.332)	Loss 2.7267 (2.7780)	Entropy 0.64137 (0.63948)	Top-1 acc 58.594 (57.032)	Top-5 acc 80.078 (79.037)	lr 0.01606
Train [49][3130/3239]	Time 0.233 (0.818)	Data Time 0.001 (0.335)	Loss 2.9792 (2.7779)	Entropy 0.64114 (0.63948)	Top-1 acc 54.297 (57.033)	Top-5 acc 75.391 (79.039)	lr 0.01606
Train [49][3140/3239]	Time 0.248 (0.820)	Data Time 0.001 (0.337)	Loss 2.8518 (2.7779)	Entropy 0.64096 (0.63949)	Top-1 acc 57.812 (57.034)	Top-5 acc 77.344 (79.041)	lr 0.01606
Train [49][3150/3239]	Time 0.225 (0.821)	Data Time 0.001 (0.338)	Loss 3.0222 (2.7780)	Entropy 0.64100 (0.63949)	Top-1 acc 47.656 (57.030)	Top-5 acc 73.828 (79.042)	lr 0.01606
Train [49][3160/3239]	Time 0.274 (0.823)	Data Time 0.002 (0.340)	Loss 2.9120 (2.7778)	Entropy 0.64096 (0.63950)	Top-1 acc 53.125 (57.036)	Top-5 acc 77.344 (79.044)	lr 0.01606
Train [49][3170/3239]	Time 2.208 (0.824)	Data Time 1.924 (0.341)	Loss 2.7978 (2.7777)	Entropy 0.64131 (0.63950)	Top-1 acc 58.984 (57.041)	Top-5 acc 78.516 (79.045)	lr 0.01606
Train [49][3180/3239]	Time 0.246 (0.825)	Data Time 0.000 (0.343)	Loss 2.8965 (2.7777)	Entropy 0.64135 (0.63951)	Top-1 acc 53.906 (57.040)	Top-5 acc 75.391 (79.044)	lr 0.01606
Train [49][3190/3239]	Time 0.262 (0.827)	Data Time 0.000 (0.344)	Loss 2.7276 (2.7776)	Entropy 0.64136 (0.63952)	Top-1 acc 63.281 (57.045)	Top-5 acc 80.859 (79.043)	lr 0.01606
Train [49][3200/3239]	Time 0.233 (0.829)	Data Time 0.000 (0.347)	Loss 2.8267 (2.7778)	Entropy 0.64175 (0.63952)	Top-1 acc 57.422 (57.040)	Top-5 acc 77.344 (79.039)	lr 0.01605
Train [49][3210/3239]	Time 0.341 (0.829)	Data Time 0.000 (0.347)	Loss 2.7052 (2.7778)	Entropy 0.64149 (0.63953)	Top-1 acc 60.156 (57.041)	Top-5 acc 79.297 (79.041)	lr 0.01605
Train [49][3220/3239]	Time 0.219 (0.829)	Data Time 0.000 (0.348)	Loss 2.9035 (2.7780)	Entropy 0.64172 (0.63954)	Top-1 acc 52.734 (57.040)	Top-5 acc 77.344 (79.042)	lr 0.01605
Train [49][3230/3239]	Time 0.224 (0.828)	Data Time 0.000 (0.347)	Loss 2.5473 (2.7778)	Entropy 0.64174 (0.63954)	Top-1 acc 61.719 (57.042)	Top-5 acc 83.594 (79.044)	lr 0.01605
Train [49][3239/3239]	Time 0.959 (0.829)	Data Time 0.000 (0.347)	Loss 2.8688 (2.7777)	Entropy 0.64189 (0.63955)	Top-1 acc 64.198 (57.040)	Top-5 acc 75.309 (79.047)	lr 0.01605
==========Valid [49/120]	loss 1.510	top-1 acc 65.564 (65.564)	top-5 acc 85.917	Train top-1 57.040	top-5 79.047	Entropy 0.64189	Latency-None: 0.000ms	Flops: 538.40M
Train [50][0/3239]	Time 33.996 (33.996)	Data Time 32.994 (32.994)	Loss 2.6551 (2.6551)	Entropy 0.64204 (0.64204)	Top-1 acc 60.547 (60.547)	Top-5 acc 83.203 (83.203)	lr 0.01605
Train [50][10/3239]	Time 0.300 (3.667)	Data Time 0.002 (3.164)	Loss 2.6583 (2.7358)	Entropy 0.64209 (0.64212)	Top-1 acc 61.328 (58.736)	Top-5 acc 80.469 (80.575)	lr 0.01605
Train [50][20/3239]	Time 0.232 (2.150)	Data Time 0.002 (1.658)	Loss 2.9039 (2.7444)	Entropy 0.64228 (0.64210)	Top-1 acc 52.734 (57.719)	Top-5 acc 76.562 (80.394)	lr 0.01605
Train [50][30/3239]	Time 0.267 (1.618)	Data Time 0.001 (1.124)	Loss 3.0615 (2.7714)	Entropy 0.64219 (0.64220)	Top-1 acc 49.219 (57.359)	Top-5 acc 72.266 (79.574)	lr 0.01605
Train [50][40/3239]	Time 0.375 (1.333)	Data Time 0.001 (0.850)	Loss 2.8004 (2.7870)	Entropy 0.64213 (0.64218)	Top-1 acc 58.984 (56.764)	Top-5 acc 79.297 (79.440)	lr 0.01605
Train [50][50/3239]	Time 0.343 (1.157)	Data Time 0.001 (0.684)	Loss 2.6541 (2.7806)	Entropy 0.64212 (0.64215)	Top-1 acc 60.547 (57.008)	Top-5 acc 81.641 (79.435)	lr 0.01605
Train [50][60/3239]	Time 0.224 (1.035)	Data Time 0.001 (0.572)	Loss 2.6102 (2.7753)	Entropy 0.64163 (0.64211)	Top-1 acc 55.469 (57.038)	Top-5 acc 82.812 (79.438)	lr 0.01604
Train [50][70/3239]	Time 0.251 (0.949)	Data Time 0.001 (0.491)	Loss 2.9417 (2.7762)	Entropy 0.64180 (0.64204)	Top-1 acc 54.688 (57.004)	Top-5 acc 75.781 (79.429)	lr 0.01604
Train [50][80/3239]	Time 0.258 (0.883)	Data Time 0.003 (0.431)	Loss 2.6931 (2.7796)	Entropy 0.64149 (0.64201)	Top-1 acc 58.984 (56.973)	Top-5 acc 83.203 (79.335)	lr 0.01604
Train [50][90/3239]	Time 0.342 (0.834)	Data Time 0.001 (0.384)	Loss 2.5187 (2.7803)	Entropy 0.64108 (0.64195)	Top-1 acc 61.719 (56.937)	Top-5 acc 83.984 (79.383)	lr 0.01604
Train [50][100/3239]	Time 0.266 (0.797)	Data Time 0.001 (0.346)	Loss 2.7205 (2.7769)	Entropy 0.64102 (0.64186)	Top-1 acc 62.109 (57.132)	Top-5 acc 82.031 (79.366)	lr 0.01604
Train [50][110/3239]	Time 0.336 (0.767)	Data Time 0.002 (0.315)	Loss 2.8364 (2.7699)	Entropy 0.64104 (0.64178)	Top-1 acc 58.203 (57.278)	Top-5 acc 80.078 (79.526)	lr 0.01604
Train [50][120/3239]	Time 0.265 (0.741)	Data Time 0.001 (0.289)	Loss 2.9527 (2.7718)	Entropy 0.64097 (0.64171)	Top-1 acc 50.000 (57.173)	Top-5 acc 75.781 (79.449)	lr 0.01604
Train [50][130/3239]	Time 0.333 (0.722)	Data Time 0.002 (0.267)	Loss 2.8173 (2.7704)	Entropy 0.64132 (0.64166)	Top-1 acc 55.859 (57.210)	Top-5 acc 78.125 (79.407)	lr 0.01604
Train [50][140/3239]	Time 0.221 (0.702)	Data Time 0.001 (0.248)	Loss 2.7312 (2.7718)	Entropy 0.64087 (0.64164)	Top-1 acc 58.203 (57.256)	Top-5 acc 83.203 (79.438)	lr 0.01604
Train [50][150/3239]	Time 0.238 (0.683)	Data Time 0.001 (0.232)	Loss 2.6980 (2.7716)	Entropy 0.64062 (0.64158)	Top-1 acc 60.938 (57.298)	Top-5 acc 80.469 (79.403)	lr 0.01604
Train [50][160/3239]	Time 0.250 (0.668)	Data Time 0.001 (0.218)	Loss 2.8467 (2.7735)	Entropy 0.64087 (0.64153)	Top-1 acc 58.984 (57.254)	Top-5 acc 75.000 (79.319)	lr 0.01603
Train [50][170/3239]	Time 0.240 (0.653)	Data Time 0.002 (0.205)	Loss 2.6263 (2.7734)	Entropy 0.64095 (0.64149)	Top-1 acc 62.109 (57.237)	Top-5 acc 82.422 (79.311)	lr 0.01603
Train [50][180/3239]	Time 0.262 (0.641)	Data Time 0.002 (0.194)	Loss 2.5253 (2.7718)	Entropy 0.64070 (0.64145)	Top-1 acc 64.062 (57.258)	Top-5 acc 83.203 (79.308)	lr 0.01603
Train [50][190/3239]	Time 0.267 (0.629)	Data Time 0.001 (0.184)	Loss 2.6828 (2.7681)	Entropy 0.64074 (0.64141)	Top-1 acc 56.250 (57.363)	Top-5 acc 81.250 (79.368)	lr 0.01603
Train [50][200/3239]	Time 0.253 (0.618)	Data Time 0.002 (0.175)	Loss 2.7605 (2.7679)	Entropy 0.64062 (0.64137)	Top-1 acc 61.719 (57.416)	Top-5 acc 79.297 (79.328)	lr 0.01603
Train [50][210/3239]	Time 0.307 (0.610)	Data Time 0.001 (0.166)	Loss 2.8117 (2.7641)	Entropy 0.64051 (0.64134)	Top-1 acc 54.297 (57.522)	Top-5 acc 78.516 (79.425)	lr 0.01603
Train [50][220/3239]	Time 0.222 (0.602)	Data Time 0.001 (0.159)	Loss 3.0236 (2.7638)	Entropy 0.64019 (0.64129)	Top-1 acc 49.609 (57.494)	Top-5 acc 73.438 (79.421)	lr 0.01603
Train [50][230/3239]	Time 0.275 (0.595)	Data Time 0.001 (0.152)	Loss 2.5827 (2.7633)	Entropy 0.64011 (0.64124)	Top-1 acc 61.719 (57.522)	Top-5 acc 83.594 (79.392)	lr 0.01603
Train [50][240/3239]	Time 0.220 (0.587)	Data Time 0.001 (0.146)	Loss 2.7339 (2.7632)	Entropy 0.64055 (0.64120)	Top-1 acc 59.375 (57.475)	Top-5 acc 81.641 (79.423)	lr 0.01603
Train [50][250/3239]	Time 0.233 (0.581)	Data Time 0.001 (0.140)	Loss 2.6656 (2.7623)	Entropy 0.64044 (0.64118)	Top-1 acc 61.719 (57.490)	Top-5 acc 79.688 (79.437)	lr 0.01603
Train [50][260/3239]	Time 0.225 (0.574)	Data Time 0.001 (0.135)	Loss 2.7742 (2.7615)	Entropy 0.64086 (0.64115)	Top-1 acc 55.859 (57.521)	Top-5 acc 76.953 (79.450)	lr 0.01603
Train [50][270/3239]	Time 0.325 (0.569)	Data Time 0.001 (0.130)	Loss 2.6421 (2.7597)	Entropy 0.64086 (0.64114)	Top-1 acc 59.766 (57.556)	Top-5 acc 81.250 (79.480)	lr 0.01602
Train [50][280/3239]	Time 0.231 (0.564)	Data Time 0.001 (0.125)	Loss 2.5150 (2.7561)	Entropy 0.64089 (0.64113)	Top-1 acc 62.500 (57.610)	Top-5 acc 83.594 (79.569)	lr 0.01602
Train [50][290/3239]	Time 0.264 (0.559)	Data Time 0.002 (0.121)	Loss 2.7744 (2.7567)	Entropy 0.64070 (0.64112)	Top-1 acc 61.719 (57.611)	Top-5 acc 78.125 (79.551)	lr 0.01602
Train [50][300/3239]	Time 0.285 (0.555)	Data Time 0.001 (0.117)	Loss 2.8841 (2.7571)	Entropy 0.64101 (0.64111)	Top-1 acc 52.344 (57.574)	Top-5 acc 78.516 (79.553)	lr 0.01602
Train [50][310/3239]	Time 0.240 (0.550)	Data Time 0.001 (0.113)	Loss 2.9890 (2.7591)	Entropy 0.64121 (0.64111)	Top-1 acc 52.734 (57.545)	Top-5 acc 74.219 (79.514)	lr 0.01602
Train [50][320/3239]	Time 0.275 (0.546)	Data Time 0.001 (0.110)	Loss 2.4858 (2.7579)	Entropy 0.64109 (0.64111)	Top-1 acc 64.453 (57.563)	Top-5 acc 85.156 (79.510)	lr 0.01602
Train [50][330/3239]	Time 0.230 (0.543)	Data Time 0.001 (0.107)	Loss 2.6324 (2.7594)	Entropy 0.64106 (0.64111)	Top-1 acc 59.766 (57.541)	Top-5 acc 82.812 (79.469)	lr 0.01602
Train [50][340/3239]	Time 0.324 (0.539)	Data Time 0.001 (0.104)	Loss 2.5291 (2.7594)	Entropy 0.64127 (0.64111)	Top-1 acc 66.797 (57.555)	Top-5 acc 85.156 (79.465)	lr 0.01602
Train [50][350/3239]	Time 0.254 (0.535)	Data Time 0.001 (0.101)	Loss 2.8205 (2.7586)	Entropy 0.64149 (0.64112)	Top-1 acc 51.953 (57.565)	Top-5 acc 78.906 (79.485)	lr 0.01602
Train [50][360/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.098)	Loss 2.8702 (2.7582)	Entropy 0.64133 (0.64112)	Top-1 acc 57.812 (57.582)	Top-5 acc 76.562 (79.497)	lr 0.01602
Train [50][370/3239]	Time 0.229 (0.529)	Data Time 0.001 (0.095)	Loss 2.9085 (2.7595)	Entropy 0.64091 (0.64113)	Top-1 acc 52.734 (57.535)	Top-5 acc 75.391 (79.471)	lr 0.01601
Train [50][380/3239]	Time 0.311 (0.617)	Data Time 0.002 (0.093)	Loss 2.5948 (2.7590)	Entropy 0.64086 (0.64112)	Top-1 acc 65.625 (57.530)	Top-5 acc 80.469 (79.476)	lr 0.01601
Train [50][390/3239]	Time 0.224 (0.611)	Data Time 0.002 (0.091)	Loss 2.7583 (2.7579)	Entropy 0.64118 (0.64112)	Top-1 acc 56.250 (57.551)	Top-5 acc 80.469 (79.498)	lr 0.01601
Train [50][400/3239]	Time 0.242 (0.606)	Data Time 0.001 (0.088)	Loss 2.7414 (2.7581)	Entropy 0.64127 (0.64112)	Top-1 acc 58.203 (57.539)	Top-5 acc 77.344 (79.481)	lr 0.01601
Train [50][410/3239]	Time 0.266 (0.602)	Data Time 0.001 (0.086)	Loss 2.8181 (2.7575)	Entropy 0.64102 (0.64112)	Top-1 acc 57.812 (57.533)	Top-5 acc 78.125 (79.494)	lr 0.01601
Train [50][420/3239]	Time 0.245 (0.599)	Data Time 0.001 (0.084)	Loss 2.8840 (2.7584)	Entropy 0.64113 (0.64112)	Top-1 acc 51.562 (57.508)	Top-5 acc 77.734 (79.486)	lr 0.01601
Train [50][430/3239]	Time 0.381 (0.595)	Data Time 0.001 (0.082)	Loss 2.7827 (2.7578)	Entropy 0.64108 (0.64112)	Top-1 acc 54.688 (57.524)	Top-5 acc 80.078 (79.506)	lr 0.01601
Train [50][440/3239]	Time 0.263 (0.592)	Data Time 0.001 (0.081)	Loss 2.6815 (2.7568)	Entropy 0.64091 (0.64111)	Top-1 acc 62.109 (57.537)	Top-5 acc 79.688 (79.522)	lr 0.01601
Train [50][450/3239]	Time 0.263 (0.589)	Data Time 0.002 (0.079)	Loss 2.6220 (2.7559)	Entropy 0.64067 (0.64110)	Top-1 acc 61.719 (57.550)	Top-5 acc 80.469 (79.534)	lr 0.01601
Train [50][460/3239]	Time 0.320 (0.586)	Data Time 0.001 (0.077)	Loss 2.9739 (2.7559)	Entropy 0.64047 (0.64109)	Top-1 acc 54.297 (57.561)	Top-5 acc 75.391 (79.533)	lr 0.01601
Train [50][470/3239]	Time 0.260 (0.583)	Data Time 0.001 (0.076)	Loss 3.0016 (2.7562)	Entropy 0.64029 (0.64108)	Top-1 acc 51.953 (57.553)	Top-5 acc 73.438 (79.530)	lr 0.01600
Train [50][480/3239]	Time 0.245 (0.580)	Data Time 0.001 (0.074)	Loss 2.8306 (2.7559)	Entropy 0.64032 (0.64106)	Top-1 acc 56.641 (57.556)	Top-5 acc 77.734 (79.532)	lr 0.01600
Train [50][490/3239]	Time 0.238 (0.577)	Data Time 0.001 (0.073)	Loss 2.6808 (2.7548)	Entropy 0.64062 (0.64105)	Top-1 acc 59.375 (57.592)	Top-5 acc 82.031 (79.552)	lr 0.01600
Train [50][500/3239]	Time 0.338 (0.575)	Data Time 0.001 (0.071)	Loss 2.9315 (2.7546)	Entropy 0.64078 (0.64104)	Top-1 acc 57.031 (57.609)	Top-5 acc 77.734 (79.562)	lr 0.01600
Train [50][510/3239]	Time 0.312 (0.572)	Data Time 0.002 (0.070)	Loss 2.8937 (2.7547)	Entropy 0.64068 (0.64103)	Top-1 acc 55.078 (57.602)	Top-5 acc 77.344 (79.561)	lr 0.01600
Train [50][520/3239]	Time 0.245 (0.570)	Data Time 0.001 (0.069)	Loss 2.8340 (2.7554)	Entropy 0.64083 (0.64103)	Top-1 acc 58.203 (57.582)	Top-5 acc 78.516 (79.557)	lr 0.01600
Train [50][530/3239]	Time 0.319 (0.568)	Data Time 0.002 (0.067)	Loss 2.7440 (2.7563)	Entropy 0.64102 (0.64103)	Top-1 acc 56.250 (57.546)	Top-5 acc 79.688 (79.534)	lr 0.01600
Train [50][540/3239]	Time 0.258 (0.566)	Data Time 0.002 (0.066)	Loss 2.7704 (2.7568)	Entropy 0.64078 (0.64102)	Top-1 acc 56.250 (57.524)	Top-5 acc 78.906 (79.518)	lr 0.01600
Train [50][550/3239]	Time 0.288 (0.565)	Data Time 0.002 (0.065)	Loss 2.6648 (2.7569)	Entropy 0.64059 (0.64102)	Top-1 acc 59.766 (57.526)	Top-5 acc 80.859 (79.512)	lr 0.01600
Train [50][560/3239]	Time 0.298 (0.563)	Data Time 0.001 (0.064)	Loss 2.7567 (2.7569)	Entropy 0.64024 (0.64101)	Top-1 acc 55.078 (57.526)	Top-5 acc 80.469 (79.510)	lr 0.01600
Train [50][570/3239]	Time 0.243 (0.561)	Data Time 0.002 (0.063)	Loss 2.7059 (2.7560)	Entropy 0.64004 (0.64099)	Top-1 acc 60.547 (57.559)	Top-5 acc 79.688 (79.532)	lr 0.01599
Train [50][580/3239]	Time 0.347 (0.560)	Data Time 0.004 (0.062)	Loss 2.6730 (2.7554)	Entropy 0.64001 (0.64098)	Top-1 acc 58.594 (57.564)	Top-5 acc 84.766 (79.559)	lr 0.01599
Train [50][590/3239]	Time 0.348 (0.558)	Data Time 0.001 (0.061)	Loss 3.1374 (2.7570)	Entropy 0.63957 (0.64096)	Top-1 acc 53.516 (57.543)	Top-5 acc 72.656 (79.524)	lr 0.01599
Train [50][600/3239]	Time 0.259 (0.556)	Data Time 0.001 (0.060)	Loss 2.7519 (2.7579)	Entropy 0.63949 (0.64093)	Top-1 acc 58.594 (57.530)	Top-5 acc 78.125 (79.491)	lr 0.01599
Train [50][610/3239]	Time 0.273 (0.554)	Data Time 0.001 (0.059)	Loss 2.7044 (2.7574)	Entropy 0.63988 (0.64091)	Top-1 acc 58.594 (57.538)	Top-5 acc 80.859 (79.498)	lr 0.01599
Train [50][620/3239]	Time 0.263 (0.553)	Data Time 0.001 (0.058)	Loss 2.6198 (2.7572)	Entropy 0.63965 (0.64089)	Top-1 acc 61.719 (57.523)	Top-5 acc 81.250 (79.496)	lr 0.01599
Train [50][630/3239]	Time 0.250 (0.551)	Data Time 0.001 (0.057)	Loss 2.7605 (2.7573)	Entropy 0.63999 (0.64088)	Top-1 acc 56.641 (57.514)	Top-5 acc 82.422 (79.504)	lr 0.01599
Train [50][640/3239]	Time 0.310 (0.551)	Data Time 0.003 (0.056)	Loss 2.8495 (2.7585)	Entropy 0.64016 (0.64086)	Top-1 acc 55.469 (57.490)	Top-5 acc 77.344 (79.483)	lr 0.01599
Train [50][650/3239]	Time 0.257 (0.550)	Data Time 0.001 (0.055)	Loss 2.8635 (2.7588)	Entropy 0.63990 (0.64085)	Top-1 acc 55.859 (57.479)	Top-5 acc 75.000 (79.482)	lr 0.01599
Train [50][660/3239]	Time 0.339 (0.548)	Data Time 0.001 (0.054)	Loss 2.9703 (2.7596)	Entropy 0.64008 (0.64084)	Top-1 acc 52.734 (57.468)	Top-5 acc 76.562 (79.469)	lr 0.01599
Train [50][670/3239]	Time 0.236 (0.547)	Data Time 0.001 (0.054)	Loss 2.8924 (2.7598)	Entropy 0.63982 (0.64083)	Top-1 acc 57.031 (57.473)	Top-5 acc 78.516 (79.469)	lr 0.01599
Train [50][680/3239]	Time 0.259 (0.545)	Data Time 0.001 (0.053)	Loss 2.8462 (2.7607)	Entropy 0.63936 (0.64081)	Top-1 acc 54.688 (57.444)	Top-5 acc 76.953 (79.446)	lr 0.01598
Train [50][690/3239]	Time 0.313 (0.544)	Data Time 0.001 (0.052)	Loss 2.7729 (2.7608)	Entropy 0.63932 (0.64079)	Top-1 acc 55.859 (57.436)	Top-5 acc 78.125 (79.438)	lr 0.01598
Train [50][700/3239]	Time 0.257 (0.543)	Data Time 0.001 (0.051)	Loss 2.7445 (2.7602)	Entropy 0.63918 (0.64077)	Top-1 acc 60.156 (57.455)	Top-5 acc 78.516 (79.443)	lr 0.01598
Train [50][710/3239]	Time 0.249 (0.542)	Data Time 0.001 (0.051)	Loss 2.5789 (2.7603)	Entropy 0.63965 (0.64075)	Top-1 acc 61.328 (57.461)	Top-5 acc 83.203 (79.441)	lr 0.01598
Train [50][720/3239]	Time 0.246 (0.540)	Data Time 0.001 (0.050)	Loss 2.7755 (2.7608)	Entropy 0.63927 (0.64073)	Top-1 acc 56.641 (57.437)	Top-5 acc 76.172 (79.431)	lr 0.01598
Train [50][730/3239]	Time 0.243 (0.539)	Data Time 0.001 (0.049)	Loss 2.6946 (2.7610)	Entropy 0.63925 (0.64071)	Top-1 acc 61.328 (57.435)	Top-5 acc 80.078 (79.425)	lr 0.01598
Train [50][740/3239]	Time 0.263 (0.538)	Data Time 0.028 (0.049)	Loss 2.9089 (2.7612)	Entropy 0.63959 (0.64069)	Top-1 acc 53.125 (57.428)	Top-5 acc 75.781 (79.410)	lr 0.01598
Train [50][750/3239]	Time 0.374 (0.537)	Data Time 0.001 (0.048)	Loss 2.7116 (2.7626)	Entropy 0.63978 (0.64068)	Top-1 acc 58.984 (57.394)	Top-5 acc 81.250 (79.390)	lr 0.01598
Train [50][760/3239]	Time 0.249 (0.536)	Data Time 0.001 (0.048)	Loss 2.6240 (2.7618)	Entropy 0.64002 (0.64067)	Top-1 acc 58.984 (57.404)	Top-5 acc 82.031 (79.397)	lr 0.01598
Train [50][770/3239]	Time 0.232 (0.534)	Data Time 0.001 (0.047)	Loss 2.8780 (2.7619)	Entropy 0.64038 (0.64066)	Top-1 acc 57.031 (57.400)	Top-5 acc 76.953 (79.392)	lr 0.01598
Train [50][780/3239]	Time 0.229 (0.533)	Data Time 0.001 (0.046)	Loss 2.7860 (2.7615)	Entropy 0.64052 (0.64066)	Top-1 acc 58.594 (57.425)	Top-5 acc 77.734 (79.387)	lr 0.01597
Train [50][790/3239]	Time 0.244 (0.532)	Data Time 0.001 (0.046)	Loss 2.7611 (2.7610)	Entropy 0.64070 (0.64065)	Top-1 acc 55.078 (57.437)	Top-5 acc 80.078 (79.389)	lr 0.01597
Train [50][800/3239]	Time 0.296 (0.531)	Data Time 0.003 (0.045)	Loss 2.7075 (2.7610)	Entropy 0.64049 (0.64065)	Top-1 acc 60.156 (57.418)	Top-5 acc 80.469 (79.390)	lr 0.01597
Train [50][810/3239]	Time 0.259 (0.530)	Data Time 0.001 (0.045)	Loss 2.5287 (2.7610)	Entropy 0.64059 (0.64065)	Top-1 acc 59.375 (57.406)	Top-5 acc 84.766 (79.384)	lr 0.01597
Train [50][820/3239]	Time 0.374 (0.529)	Data Time 0.002 (0.044)	Loss 2.7446 (2.7610)	Entropy 0.64049 (0.64065)	Top-1 acc 57.422 (57.401)	Top-5 acc 81.250 (79.385)	lr 0.01597
Train [50][830/3239]	Time 0.243 (0.528)	Data Time 0.001 (0.044)	Loss 2.8128 (2.7599)	Entropy 0.64045 (0.64065)	Top-1 acc 55.469 (57.434)	Top-5 acc 79.297 (79.405)	lr 0.01597
Train [50][840/3239]	Time 0.246 (0.527)	Data Time 0.001 (0.043)	Loss 2.8356 (2.7598)	Entropy 0.64044 (0.64064)	Top-1 acc 51.953 (57.427)	Top-5 acc 75.000 (79.400)	lr 0.01597
Train [50][850/3239]	Time 0.246 (0.526)	Data Time 0.001 (0.043)	Loss 2.8652 (2.7598)	Entropy 0.64051 (0.64064)	Top-1 acc 55.078 (57.423)	Top-5 acc 77.734 (79.401)	lr 0.01597
Train [50][860/3239]	Time 0.317 (0.525)	Data Time 0.001 (0.042)	Loss 2.8142 (2.7604)	Entropy 0.64023 (0.64064)	Top-1 acc 55.078 (57.410)	Top-5 acc 78.516 (79.389)	lr 0.01597
Train [50][870/3239]	Time 0.251 (0.524)	Data Time 0.001 (0.042)	Loss 2.5446 (2.7610)	Entropy 0.64050 (0.64063)	Top-1 acc 64.062 (57.402)	Top-5 acc 83.203 (79.372)	lr 0.01597
Train [50][880/3239]	Time 0.262 (0.523)	Data Time 0.001 (0.041)	Loss 2.9987 (2.7615)	Entropy 0.64054 (0.64063)	Top-1 acc 51.172 (57.387)	Top-5 acc 76.562 (79.367)	lr 0.01596
Train [50][890/3239]	Time 0.331 (0.523)	Data Time 0.001 (0.041)	Loss 2.8618 (2.7613)	Entropy 0.64045 (0.64063)	Top-1 acc 52.734 (57.396)	Top-5 acc 78.516 (79.376)	lr 0.01596
Train [50][900/3239]	Time 0.251 (0.522)	Data Time 0.002 (0.040)	Loss 2.5956 (2.7607)	Entropy 0.64071 (0.64063)	Top-1 acc 61.328 (57.406)	Top-5 acc 83.984 (79.386)	lr 0.01596
Train [50][910/3239]	Time 0.255 (0.521)	Data Time 0.001 (0.040)	Loss 2.8289 (2.7607)	Entropy 0.64099 (0.64063)	Top-1 acc 51.562 (57.409)	Top-5 acc 77.344 (79.384)	lr 0.01596
Train [50][920/3239]	Time 0.238 (0.520)	Data Time 0.001 (0.040)	Loss 2.6752 (2.7599)	Entropy 0.64118 (0.64063)	Top-1 acc 58.984 (57.429)	Top-5 acc 81.250 (79.391)	lr 0.01596
Train [50][930/3239]	Time 0.251 (0.519)	Data Time 0.002 (0.039)	Loss 2.2764 (2.7594)	Entropy 0.64073 (0.64064)	Top-1 acc 67.188 (57.457)	Top-5 acc 86.328 (79.392)	lr 0.01596
Train [50][940/3239]	Time 0.240 (0.518)	Data Time 0.001 (0.039)	Loss 2.6923 (2.7600)	Entropy 0.64073 (0.64064)	Top-1 acc 57.812 (57.446)	Top-5 acc 80.859 (79.389)	lr 0.01596
Train [50][950/3239]	Time 0.270 (0.517)	Data Time 0.002 (0.038)	Loss 2.7585 (2.7604)	Entropy 0.64064 (0.64064)	Top-1 acc 57.812 (57.424)	Top-5 acc 78.125 (79.384)	lr 0.01596
Train [50][960/3239]	Time 0.244 (0.517)	Data Time 0.002 (0.038)	Loss 2.8272 (2.7609)	Entropy 0.64085 (0.64064)	Top-1 acc 56.641 (57.428)	Top-5 acc 80.078 (79.374)	lr 0.01596
Train [50][970/3239]	Time 0.257 (0.516)	Data Time 0.002 (0.038)	Loss 2.7952 (2.7616)	Entropy 0.64118 (0.64065)	Top-1 acc 56.641 (57.408)	Top-5 acc 78.906 (79.367)	lr 0.01596
Train [50][980/3239]	Time 0.360 (0.515)	Data Time 0.001 (0.037)	Loss 2.7386 (2.7612)	Entropy 0.64089 (0.64065)	Top-1 acc 56.641 (57.418)	Top-5 acc 78.906 (79.375)	lr 0.01596
Train [50][990/3239]	Time 0.219 (0.517)	Data Time 0.001 (0.040)	Loss 2.7959 (2.7612)	Entropy 0.64115 (0.64065)	Top-1 acc 59.766 (57.425)	Top-5 acc 79.688 (79.376)	lr 0.01595
Train [50][1000/3239]	Time 0.238 (0.517)	Data Time 0.001 (0.040)	Loss 2.8091 (2.7615)	Entropy 0.64099 (0.64066)	Top-1 acc 55.469 (57.422)	Top-5 acc 76.172 (79.365)	lr 0.01595
Train [50][1010/3239]	Time 0.251 (0.516)	Data Time 0.001 (0.039)	Loss 2.6876 (2.7613)	Entropy 0.64113 (0.64066)	Top-1 acc 62.891 (57.423)	Top-5 acc 81.250 (79.373)	lr 0.01595
Train [50][1020/3239]	Time 0.245 (0.519)	Data Time 0.002 (0.043)	Loss 2.7468 (2.7612)	Entropy 0.64107 (0.64067)	Top-1 acc 55.469 (57.428)	Top-5 acc 81.250 (79.372)	lr 0.01595
Train [50][1030/3239]	Time 0.361 (0.552)	Data Time 0.005 (0.043)	Loss 2.8854 (2.7607)	Entropy 0.64066 (0.64067)	Top-1 acc 52.344 (57.435)	Top-5 acc 77.734 (79.383)	lr 0.01595
Train [50][1040/3239]	Time 0.229 (0.552)	Data Time 0.002 (0.042)	Loss 2.7443 (2.7608)	Entropy 0.64077 (0.64067)	Top-1 acc 55.469 (57.428)	Top-5 acc 80.078 (79.377)	lr 0.01595
Train [50][1050/3239]	Time 0.319 (0.550)	Data Time 0.001 (0.042)	Loss 2.8680 (2.7610)	Entropy 0.64086 (0.64067)	Top-1 acc 51.953 (57.422)	Top-5 acc 74.609 (79.371)	lr 0.01595
Train [50][1060/3239]	Time 0.246 (0.549)	Data Time 0.001 (0.041)	Loss 2.5660 (2.7608)	Entropy 0.64093 (0.64067)	Top-1 acc 65.625 (57.417)	Top-5 acc 82.422 (79.371)	lr 0.01595
Train [50][1070/3239]	Time 0.263 (0.548)	Data Time 0.001 (0.041)	Loss 2.8143 (2.7610)	Entropy 0.64114 (0.64068)	Top-1 acc 57.812 (57.410)	Top-5 acc 75.781 (79.365)	lr 0.01595
Train [50][1080/3239]	Time 0.232 (0.547)	Data Time 0.001 (0.041)	Loss 2.7506 (2.7605)	Entropy 0.64155 (0.64068)	Top-1 acc 59.766 (57.425)	Top-5 acc 81.641 (79.379)	lr 0.01595
Train [50][1090/3239]	Time 0.217 (0.546)	Data Time 0.001 (0.040)	Loss 2.8137 (2.7608)	Entropy 0.64164 (0.64069)	Top-1 acc 58.984 (57.422)	Top-5 acc 79.297 (79.377)	lr 0.01594
Train [50][1100/3239]	Time 0.294 (0.545)	Data Time 0.001 (0.040)	Loss 2.6241 (2.7614)	Entropy 0.64123 (0.64070)	Top-1 acc 62.109 (57.409)	Top-5 acc 81.250 (79.363)	lr 0.01594
Train [50][1110/3239]	Time 0.271 (0.545)	Data Time 0.001 (0.040)	Loss 2.7812 (2.7610)	Entropy 0.64158 (0.64070)	Top-1 acc 55.078 (57.409)	Top-5 acc 79.297 (79.370)	lr 0.01594
Train [50][1120/3239]	Time 0.249 (0.544)	Data Time 0.001 (0.039)	Loss 2.7372 (2.7604)	Entropy 0.64158 (0.64071)	Top-1 acc 58.594 (57.426)	Top-5 acc 77.344 (79.381)	lr 0.01594
Train [50][1130/3239]	Time 0.246 (0.543)	Data Time 0.001 (0.039)	Loss 2.6108 (2.7597)	Entropy 0.64187 (0.64072)	Top-1 acc 57.422 (57.439)	Top-5 acc 81.641 (79.396)	lr 0.01594
Train [50][1140/3239]	Time 0.390 (0.542)	Data Time 0.003 (0.039)	Loss 2.4465 (2.7600)	Entropy 0.64156 (0.64073)	Top-1 acc 63.672 (57.432)	Top-5 acc 84.375 (79.387)	lr 0.01594
Train [50][1150/3239]	Time 0.277 (0.541)	Data Time 0.003 (0.038)	Loss 2.6957 (2.7598)	Entropy 0.64152 (0.64073)	Top-1 acc 61.719 (57.426)	Top-5 acc 79.688 (79.389)	lr 0.01594
Train [50][1160/3239]	Time 0.244 (0.540)	Data Time 0.001 (0.038)	Loss 2.6583 (2.7598)	Entropy 0.64178 (0.64074)	Top-1 acc 60.938 (57.419)	Top-5 acc 82.031 (79.392)	lr 0.01594
Train [50][1170/3239]	Time 0.288 (0.541)	Data Time 0.002 (0.039)	Loss 2.7390 (2.7596)	Entropy 0.64209 (0.64075)	Top-1 acc 57.422 (57.425)	Top-5 acc 82.422 (79.399)	lr 0.01594
Train [50][1180/3239]	Time 0.245 (0.542)	Data Time 0.001 (0.040)	Loss 2.8259 (2.7597)	Entropy 0.64182 (0.64076)	Top-1 acc 57.422 (57.421)	Top-5 acc 78.125 (79.398)	lr 0.01594
Train [50][1190/3239]	Time 0.226 (0.542)	Data Time 0.001 (0.041)	Loss 2.9133 (2.7590)	Entropy 0.64140 (0.64077)	Top-1 acc 54.297 (57.431)	Top-5 acc 78.906 (79.414)	lr 0.01593
Train [50][1200/3239]	Time 0.827 (0.542)	Data Time 0.545 (0.041)	Loss 2.7745 (2.7595)	Entropy 0.64110 (0.64077)	Top-1 acc 61.328 (57.419)	Top-5 acc 80.078 (79.407)	lr 0.01593
Train [50][1210/3239]	Time 0.418 (0.545)	Data Time 0.033 (0.044)	Loss 2.6841 (2.7590)	Entropy 0.64114 (0.64078)	Top-1 acc 58.594 (57.432)	Top-5 acc 80.469 (79.412)	lr 0.01593
Train [50][1220/3239]	Time 0.253 (0.546)	Data Time 0.002 (0.046)	Loss 2.7130 (2.7592)	Entropy 0.64094 (0.64078)	Top-1 acc 60.156 (57.433)	Top-5 acc 81.641 (79.409)	lr 0.01593
Train [50][1230/3239]	Time 0.260 (0.545)	Data Time 0.002 (0.045)	Loss 2.7595 (2.7590)	Entropy 0.64077 (0.64078)	Top-1 acc 59.766 (57.426)	Top-5 acc 81.250 (79.415)	lr 0.01593
Train [50][1240/3239]	Time 0.261 (0.544)	Data Time 0.001 (0.045)	Loss 2.7786 (2.7595)	Entropy 0.64046 (0.64078)	Top-1 acc 54.688 (57.409)	Top-5 acc 78.906 (79.412)	lr 0.01593
Train [50][1250/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.046)	Loss 2.8856 (2.7597)	Entropy 0.64075 (0.64078)	Top-1 acc 52.734 (57.400)	Top-5 acc 77.344 (79.411)	lr 0.01593
Train [50][1260/3239]	Time 0.264 (0.546)	Data Time 0.001 (0.047)	Loss 2.7618 (2.7594)	Entropy 0.64117 (0.64078)	Top-1 acc 57.422 (57.399)	Top-5 acc 77.734 (79.415)	lr 0.01593
Train [50][1270/3239]	Time 0.236 (0.545)	Data Time 0.001 (0.047)	Loss 2.6937 (2.7591)	Entropy 0.64087 (0.64078)	Top-1 acc 61.719 (57.410)	Top-5 acc 81.250 (79.421)	lr 0.01593
Train [50][1280/3239]	Time 0.262 (0.545)	Data Time 0.001 (0.047)	Loss 2.9719 (2.7591)	Entropy 0.64090 (0.64078)	Top-1 acc 52.344 (57.416)	Top-5 acc 74.219 (79.423)	lr 0.01593
Train [50][1290/3239]	Time 0.248 (0.547)	Data Time 0.001 (0.049)	Loss 2.7952 (2.7596)	Entropy 0.64116 (0.64078)	Top-1 acc 58.594 (57.409)	Top-5 acc 77.734 (79.411)	lr 0.01593
Train [50][1300/3239]	Time 0.354 (0.546)	Data Time 0.001 (0.048)	Loss 2.6867 (2.7595)	Entropy 0.64113 (0.64078)	Top-1 acc 55.469 (57.405)	Top-5 acc 81.250 (79.415)	lr 0.01592
Train [50][1310/3239]	Time 0.233 (0.548)	Data Time 0.001 (0.050)	Loss 2.8216 (2.7596)	Entropy 0.64116 (0.64079)	Top-1 acc 56.250 (57.406)	Top-5 acc 75.000 (79.410)	lr 0.01592
Train [50][1320/3239]	Time 0.240 (0.550)	Data Time 0.001 (0.054)	Loss 2.7868 (2.7592)	Entropy 0.64102 (0.64079)	Top-1 acc 58.984 (57.420)	Top-5 acc 77.734 (79.420)	lr 0.01592
Train [50][1330/3239]	Time 0.250 (0.550)	Data Time 0.001 (0.053)	Loss 2.7003 (2.7589)	Entropy 0.64117 (0.64079)	Top-1 acc 58.594 (57.428)	Top-5 acc 80.078 (79.430)	lr 0.01592
Train [50][1340/3239]	Time 0.243 (0.552)	Data Time 0.001 (0.056)	Loss 2.7845 (2.7589)	Entropy 0.64113 (0.64079)	Top-1 acc 55.859 (57.419)	Top-5 acc 77.344 (79.429)	lr 0.01592
Train [50][1350/3239]	Time 0.310 (0.551)	Data Time 0.002 (0.056)	Loss 2.6926 (2.7591)	Entropy 0.64125 (0.64080)	Top-1 acc 60.156 (57.418)	Top-5 acc 79.297 (79.430)	lr 0.01592
Train [50][1360/3239]	Time 0.265 (0.554)	Data Time 0.001 (0.058)	Loss 2.8046 (2.7595)	Entropy 0.64161 (0.64080)	Top-1 acc 54.688 (57.420)	Top-5 acc 79.297 (79.421)	lr 0.01592
Train [50][1370/3239]	Time 0.338 (0.555)	Data Time 0.001 (0.060)	Loss 2.9236 (2.7599)	Entropy 0.64123 (0.64081)	Top-1 acc 53.906 (57.420)	Top-5 acc 77.344 (79.411)	lr 0.01592
Train [50][1380/3239]	Time 0.233 (0.554)	Data Time 0.001 (0.059)	Loss 2.6780 (2.7596)	Entropy 0.64155 (0.64081)	Top-1 acc 58.594 (57.428)	Top-5 acc 83.203 (79.417)	lr 0.01592
Train [50][1390/3239]	Time 0.260 (0.557)	Data Time 0.001 (0.063)	Loss 2.5914 (2.7599)	Entropy 0.64184 (0.64082)	Top-1 acc 62.109 (57.414)	Top-5 acc 80.469 (79.415)	lr 0.01592
Train [50][1400/3239]	Time 0.845 (0.557)	Data Time 0.598 (0.063)	Loss 2.9089 (2.7593)	Entropy 0.64187 (0.64082)	Top-1 acc 53.516 (57.423)	Top-5 acc 76.562 (79.431)	lr 0.01591
Train [50][1410/3239]	Time 0.246 (0.556)	Data Time 0.001 (0.063)	Loss 2.7719 (2.7593)	Entropy 0.64183 (0.64083)	Top-1 acc 57.812 (57.420)	Top-5 acc 81.250 (79.431)	lr 0.01591
Train [50][1420/3239]	Time 0.256 (0.562)	Data Time 0.001 (0.069)	Loss 2.8756 (2.7593)	Entropy 0.64182 (0.64084)	Top-1 acc 55.469 (57.414)	Top-5 acc 76.562 (79.430)	lr 0.01591
Train [50][1430/3239]	Time 0.231 (0.561)	Data Time 0.001 (0.069)	Loss 2.7123 (2.7593)	Entropy 0.64151 (0.64084)	Top-1 acc 62.891 (57.419)	Top-5 acc 80.859 (79.423)	lr 0.01591
Train [50][1440/3239]	Time 0.238 (0.560)	Data Time 0.001 (0.069)	Loss 2.8664 (2.7598)	Entropy 0.64192 (0.64085)	Top-1 acc 56.641 (57.405)	Top-5 acc 77.344 (79.418)	lr 0.01591
Train [50][1450/3239]	Time 0.236 (0.568)	Data Time 0.001 (0.077)	Loss 2.8140 (2.7598)	Entropy 0.64146 (0.64086)	Top-1 acc 53.906 (57.407)	Top-5 acc 74.609 (79.415)	lr 0.01591
Train [50][1460/3239]	Time 0.239 (0.567)	Data Time 0.001 (0.077)	Loss 2.7474 (2.7594)	Entropy 0.64152 (0.64086)	Top-1 acc 58.594 (57.419)	Top-5 acc 77.734 (79.421)	lr 0.01591
Train [50][1470/3239]	Time 0.224 (0.566)	Data Time 0.001 (0.076)	Loss 2.8472 (2.7599)	Entropy 0.64188 (0.64087)	Top-1 acc 57.422 (57.411)	Top-5 acc 76.562 (79.408)	lr 0.01591
Train [50][1480/3239]	Time 0.256 (0.573)	Data Time 0.001 (0.083)	Loss 2.7007 (2.7597)	Entropy 0.64191 (0.64087)	Top-1 acc 58.984 (57.413)	Top-5 acc 80.859 (79.412)	lr 0.01591
Train [50][1490/3239]	Time 0.248 (0.572)	Data Time 0.001 (0.083)	Loss 2.7352 (2.7595)	Entropy 0.64182 (0.64088)	Top-1 acc 58.984 (57.418)	Top-5 acc 77.344 (79.411)	lr 0.01591
Train [50][1500/3239]	Time 0.255 (0.571)	Data Time 0.001 (0.082)	Loss 2.7912 (2.7597)	Entropy 0.64189 (0.64089)	Top-1 acc 57.031 (57.413)	Top-5 acc 80.078 (79.411)	lr 0.01590
Train [50][1510/3239]	Time 0.230 (0.570)	Data Time 0.001 (0.082)	Loss 2.6115 (2.7597)	Entropy 0.64223 (0.64089)	Top-1 acc 60.156 (57.410)	Top-5 acc 80.469 (79.409)	lr 0.01590
Train [50][1520/3239]	Time 0.232 (0.578)	Data Time 0.001 (0.090)	Loss 2.7665 (2.7597)	Entropy 0.64212 (0.64090)	Top-1 acc 58.594 (57.415)	Top-5 acc 79.688 (79.403)	lr 0.01590
Train [50][1530/3239]	Time 0.330 (0.577)	Data Time 0.001 (0.090)	Loss 2.5888 (2.7597)	Entropy 0.64245 (0.64091)	Top-1 acc 62.500 (57.414)	Top-5 acc 83.203 (79.407)	lr 0.01590
Train [50][1540/3239]	Time 0.258 (0.576)	Data Time 0.001 (0.089)	Loss 2.6049 (2.7598)	Entropy 0.64269 (0.64092)	Top-1 acc 59.375 (57.410)	Top-5 acc 83.594 (79.402)	lr 0.01590
Train [50][1550/3239]	Time 0.221 (0.584)	Data Time 0.001 (0.098)	Loss 2.8398 (2.7593)	Entropy 0.64308 (0.64093)	Top-1 acc 55.078 (57.421)	Top-5 acc 79.688 (79.416)	lr 0.01590
Train [50][1560/3239]	Time 0.233 (0.583)	Data Time 0.001 (0.097)	Loss 2.8593 (2.7595)	Entropy 0.64293 (0.64095)	Top-1 acc 53.906 (57.414)	Top-5 acc 79.297 (79.412)	lr 0.01590
Train [50][1570/3239]	Time 0.259 (0.582)	Data Time 0.001 (0.097)	Loss 2.6604 (2.7594)	Entropy 0.64289 (0.64096)	Top-1 acc 62.500 (57.423)	Top-5 acc 81.250 (79.414)	lr 0.01590
Train [50][1580/3239]	Time 0.250 (0.591)	Data Time 0.001 (0.106)	Loss 3.0284 (2.7595)	Entropy 0.64293 (0.64097)	Top-1 acc 51.562 (57.417)	Top-5 acc 72.266 (79.406)	lr 0.01590
Train [50][1590/3239]	Time 0.248 (0.591)	Data Time 0.001 (0.106)	Loss 2.6666 (2.7595)	Entropy 0.64312 (0.64098)	Top-1 acc 57.812 (57.410)	Top-5 acc 80.469 (79.409)	lr 0.01590
Train [50][1600/3239]	Time 0.334 (0.589)	Data Time 0.001 (0.105)	Loss 2.8449 (2.7595)	Entropy 0.64240 (0.64100)	Top-1 acc 54.297 (57.405)	Top-5 acc 79.688 (79.409)	lr 0.01589
Train [50][1610/3239]	Time 0.248 (0.599)	Data Time 0.001 (0.115)	Loss 2.7406 (2.7596)	Entropy 0.64270 (0.64101)	Top-1 acc 57.422 (57.400)	Top-5 acc 80.859 (79.411)	lr 0.01589
Train [50][1620/3239]	Time 0.260 (0.598)	Data Time 0.001 (0.114)	Loss 2.7126 (2.7593)	Entropy 0.64269 (0.64102)	Top-1 acc 58.594 (57.407)	Top-5 acc 80.469 (79.419)	lr 0.01589
Train [50][1630/3239]	Time 0.221 (0.597)	Data Time 0.001 (0.114)	Loss 3.0921 (2.7593)	Entropy 0.64254 (0.64103)	Top-1 acc 49.609 (57.410)	Top-5 acc 74.219 (79.421)	lr 0.01589
Train [50][1640/3239]	Time 0.247 (0.606)	Data Time 0.001 (0.124)	Loss 2.6030 (2.7590)	Entropy 0.64240 (0.64103)	Top-1 acc 59.375 (57.418)	Top-5 acc 82.031 (79.430)	lr 0.01589
Train [50][1650/3239]	Time 0.236 (0.605)	Data Time 0.001 (0.123)	Loss 2.7436 (2.7587)	Entropy 0.64263 (0.64104)	Top-1 acc 53.516 (57.422)	Top-5 acc 82.031 (79.443)	lr 0.01589
Train [50][1660/3239]	Time 0.237 (0.604)	Data Time 0.001 (0.122)	Loss 2.8546 (2.7588)	Entropy 0.64241 (0.64105)	Top-1 acc 55.078 (57.416)	Top-5 acc 78.906 (79.438)	lr 0.01589
Train [50][1670/3239]	Time 0.229 (0.603)	Data Time 0.002 (0.122)	Loss 2.6572 (2.7587)	Entropy 0.64224 (0.64106)	Top-1 acc 59.766 (57.420)	Top-5 acc 82.422 (79.441)	lr 0.01589
Train [50][1680/3239]	Time 1.977 (0.613)	Data Time 1.727 (0.132)	Loss 2.8374 (2.7588)	Entropy 0.64174 (0.64107)	Top-1 acc 57.812 (57.424)	Top-5 acc 76.172 (79.441)	lr 0.01589
Train [50][1690/3239]	Time 0.463 (0.632)	Data Time 0.006 (0.131)	Loss 2.7802 (2.7587)	Entropy 0.64173 (0.64107)	Top-1 acc 55.859 (57.428)	Top-5 acc 77.734 (79.444)	lr 0.01589
Train [50][1700/3239]	Time 0.234 (0.630)	Data Time 0.001 (0.130)	Loss 2.7287 (2.7586)	Entropy 0.64188 (0.64107)	Top-1 acc 57.031 (57.430)	Top-5 acc 82.422 (79.446)	lr 0.01589
Train [50][1710/3239]	Time 0.240 (0.629)	Data Time 0.001 (0.129)	Loss 2.7663 (2.7584)	Entropy 0.64197 (0.64108)	Top-1 acc 57.031 (57.436)	Top-5 acc 78.906 (79.447)	lr 0.01588
Train [50][1720/3239]	Time 0.247 (0.628)	Data Time 0.002 (0.129)	Loss 2.7919 (2.7587)	Entropy 0.64206 (0.64108)	Top-1 acc 60.156 (57.433)	Top-5 acc 76.562 (79.442)	lr 0.01588
Train [50][1730/3239]	Time 0.242 (0.627)	Data Time 0.001 (0.128)	Loss 2.7476 (2.7588)	Entropy 0.64223 (0.64109)	Top-1 acc 55.469 (57.431)	Top-5 acc 79.688 (79.440)	lr 0.01588
Train [50][1740/3239]	Time 0.252 (0.626)	Data Time 0.001 (0.127)	Loss 2.9200 (2.7591)	Entropy 0.64188 (0.64110)	Top-1 acc 54.297 (57.428)	Top-5 acc 76.953 (79.435)	lr 0.01588
Train [50][1750/3239]	Time 1.098 (0.627)	Data Time 0.836 (0.129)	Loss 2.5890 (2.7588)	Entropy 0.64163 (0.64110)	Top-1 acc 62.891 (57.438)	Top-5 acc 84.766 (79.439)	lr 0.01588
Train [50][1760/3239]	Time 1.202 (0.628)	Data Time 0.848 (0.130)	Loss 2.7955 (2.7591)	Entropy 0.64174 (0.64110)	Top-1 acc 58.984 (57.435)	Top-5 acc 76.953 (79.429)	lr 0.01588
Train [50][1770/3239]	Time 0.252 (0.629)	Data Time 0.001 (0.131)	Loss 2.5647 (2.7586)	Entropy 0.64190 (0.64111)	Top-1 acc 63.281 (57.449)	Top-5 acc 83.203 (79.434)	lr 0.01588
Train [50][1780/3239]	Time 0.236 (0.631)	Data Time 0.001 (0.134)	Loss 2.7370 (2.7587)	Entropy 0.64188 (0.64111)	Top-1 acc 59.375 (57.445)	Top-5 acc 77.734 (79.431)	lr 0.01588
Train [50][1790/3239]	Time 0.243 (0.635)	Data Time 0.001 (0.138)	Loss 2.7049 (2.7587)	Entropy 0.64164 (0.64111)	Top-1 acc 55.078 (57.448)	Top-5 acc 80.859 (79.431)	lr 0.01588
Train [50][1800/3239]	Time 0.259 (0.636)	Data Time 0.001 (0.139)	Loss 2.7749 (2.7588)	Entropy 0.64152 (0.64112)	Top-1 acc 53.516 (57.446)	Top-5 acc 79.297 (79.428)	lr 0.01588
Train [50][1810/3239]	Time 0.253 (0.638)	Data Time 0.001 (0.142)	Loss 2.4869 (2.7586)	Entropy 0.64153 (0.64112)	Top-1 acc 63.672 (57.447)	Top-5 acc 83.594 (79.434)	lr 0.01587
Train [50][1820/3239]	Time 4.272 (0.641)	Data Time 3.993 (0.146)	Loss 2.8991 (2.7586)	Entropy 0.64158 (0.64112)	Top-1 acc 51.953 (57.446)	Top-5 acc 78.906 (79.435)	lr 0.01587
Train [50][1830/3239]	Time 0.233 (0.641)	Data Time 0.001 (0.146)	Loss 2.8874 (2.7588)	Entropy 0.64138 (0.64112)	Top-1 acc 56.641 (57.443)	Top-5 acc 77.344 (79.432)	lr 0.01587
Train [50][1840/3239]	Time 8.210 (0.646)	Data Time 7.951 (0.151)	Loss 2.9174 (2.7591)	Entropy 0.64148 (0.64112)	Top-1 acc 51.562 (57.433)	Top-5 acc 79.688 (79.428)	lr 0.01587
Train [50][1850/3239]	Time 1.741 (0.646)	Data Time 1.362 (0.151)	Loss 2.7553 (2.7591)	Entropy 0.64163 (0.64113)	Top-1 acc 57.812 (57.436)	Top-5 acc 78.906 (79.428)	lr 0.01587
Train [50][1860/3239]	Time 0.269 (0.649)	Data Time 0.001 (0.155)	Loss 2.6679 (2.7594)	Entropy 0.64153 (0.64113)	Top-1 acc 57.812 (57.426)	Top-5 acc 83.594 (79.423)	lr 0.01587
Train [50][1870/3239]	Time 1.779 (0.650)	Data Time 1.510 (0.156)	Loss 2.7802 (2.7596)	Entropy 0.64144 (0.64113)	Top-1 acc 55.469 (57.422)	Top-5 acc 76.172 (79.416)	lr 0.01587
Train [50][1880/3239]	Time 0.930 (0.654)	Data Time 0.677 (0.161)	Loss 3.0501 (2.7596)	Entropy 0.64130 (0.64113)	Top-1 acc 51.953 (57.424)	Top-5 acc 73.438 (79.411)	lr 0.01587
Train [50][1890/3239]	Time 0.248 (0.658)	Data Time 0.002 (0.165)	Loss 2.9881 (2.7601)	Entropy 0.64152 (0.64113)	Top-1 acc 54.688 (57.410)	Top-5 acc 75.781 (79.402)	lr 0.01587
Train [50][1900/3239]	Time 0.246 (0.657)	Data Time 0.001 (0.165)	Loss 2.7165 (2.7601)	Entropy 0.64154 (0.64114)	Top-1 acc 58.984 (57.406)	Top-5 acc 81.641 (79.403)	lr 0.01587
Train [50][1910/3239]	Time 5.303 (0.662)	Data Time 5.015 (0.170)	Loss 2.5995 (2.7603)	Entropy 0.64134 (0.64114)	Top-1 acc 63.281 (57.407)	Top-5 acc 84.766 (79.406)	lr 0.01586
Train [50][1920/3239]	Time 5.036 (0.667)	Data Time 4.671 (0.174)	Loss 2.7315 (2.7599)	Entropy 0.64171 (0.64114)	Top-1 acc 57.812 (57.416)	Top-5 acc 80.859 (79.414)	lr 0.01586
Train [50][1930/3239]	Time 0.229 (0.665)	Data Time 0.001 (0.174)	Loss 2.6885 (2.7600)	Entropy 0.64158 (0.64114)	Top-1 acc 62.109 (57.421)	Top-5 acc 83.203 (79.416)	lr 0.01586
Train [50][1940/3239]	Time 0.242 (0.666)	Data Time 0.001 (0.175)	Loss 2.7586 (2.7602)	Entropy 0.64156 (0.64114)	Top-1 acc 55.469 (57.419)	Top-5 acc 78.125 (79.409)	lr 0.01586
Train [50][1950/3239]	Time 0.260 (0.676)	Data Time 0.001 (0.185)	Loss 2.5935 (2.7601)	Entropy 0.64168 (0.64115)	Top-1 acc 56.250 (57.417)	Top-5 acc 83.203 (79.409)	lr 0.01586
Train [50][1960/3239]	Time 0.243 (0.674)	Data Time 0.001 (0.184)	Loss 2.7949 (2.7604)	Entropy 0.64153 (0.64115)	Top-1 acc 54.688 (57.415)	Top-5 acc 75.781 (79.404)	lr 0.01586
Train [50][1970/3239]	Time 0.264 (0.675)	Data Time 0.002 (0.185)	Loss 2.6172 (2.7606)	Entropy 0.64147 (0.64115)	Top-1 acc 61.719 (57.410)	Top-5 acc 82.422 (79.399)	lr 0.01586
Train [50][1980/3239]	Time 4.254 (0.683)	Data Time 3.996 (0.193)	Loss 2.7675 (2.7608)	Entropy 0.64168 (0.64115)	Top-1 acc 60.547 (57.409)	Top-5 acc 82.422 (79.402)	lr 0.01586
Train [50][1990/3239]	Time 0.224 (0.682)	Data Time 0.001 (0.192)	Loss 2.7710 (2.7610)	Entropy 0.64162 (0.64116)	Top-1 acc 57.031 (57.403)	Top-5 acc 80.469 (79.394)	lr 0.01586
Train [50][2000/3239]	Time 1.490 (0.683)	Data Time 1.245 (0.194)	Loss 2.7290 (2.7608)	Entropy 0.64143 (0.64116)	Top-1 acc 60.156 (57.409)	Top-5 acc 79.688 (79.396)	lr 0.01586
Train [50][2010/3239]	Time 0.328 (0.689)	Data Time 0.001 (0.200)	Loss 2.5446 (2.7607)	Entropy 0.64119 (0.64116)	Top-1 acc 64.844 (57.413)	Top-5 acc 82.422 (79.393)	lr 0.01586
Train [50][2020/3239]	Time 0.256 (0.691)	Data Time 0.001 (0.202)	Loss 2.9038 (2.7610)	Entropy 0.64146 (0.64116)	Top-1 acc 54.688 (57.405)	Top-5 acc 77.344 (79.391)	lr 0.01585
Train [50][2030/3239]	Time 3.313 (0.691)	Data Time 3.065 (0.203)	Loss 2.6686 (2.7609)	Entropy 0.64162 (0.64116)	Top-1 acc 57.812 (57.409)	Top-5 acc 82.031 (79.389)	lr 0.01585
Train [50][2040/3239]	Time 0.225 (0.696)	Data Time 0.001 (0.208)	Loss 3.2262 (2.7610)	Entropy 0.64205 (0.64116)	Top-1 acc 45.703 (57.404)	Top-5 acc 74.219 (79.390)	lr 0.01585
Train [50][2050/3239]	Time 0.242 (0.699)	Data Time 0.001 (0.211)	Loss 2.7029 (2.7608)	Entropy 0.64239 (0.64117)	Top-1 acc 60.547 (57.410)	Top-5 acc 80.078 (79.392)	lr 0.01585
Train [50][2060/3239]	Time 0.239 (0.697)	Data Time 0.001 (0.210)	Loss 2.8398 (2.7607)	Entropy 0.64265 (0.64118)	Top-1 acc 52.734 (57.417)	Top-5 acc 79.688 (79.394)	lr 0.01585
Train [50][2070/3239]	Time 6.640 (0.703)	Data Time 6.409 (0.216)	Loss 2.7816 (2.7608)	Entropy 0.64262 (0.64118)	Top-1 acc 58.984 (57.416)	Top-5 acc 80.469 (79.392)	lr 0.01585
Train [50][2080/3239]	Time 0.345 (0.708)	Data Time 0.001 (0.222)	Loss 2.6266 (2.7608)	Entropy 0.64242 (0.64119)	Top-1 acc 56.641 (57.416)	Top-5 acc 83.203 (79.395)	lr 0.01585
Train [50][2090/3239]	Time 0.246 (0.706)	Data Time 0.001 (0.220)	Loss 2.8044 (2.7613)	Entropy 0.64242 (0.64120)	Top-1 acc 53.516 (57.406)	Top-5 acc 79.688 (79.388)	lr 0.01585
Train [50][2100/3239]	Time 0.231 (0.709)	Data Time 0.001 (0.223)	Loss 2.7217 (2.7611)	Entropy 0.64221 (0.64120)	Top-1 acc 56.641 (57.411)	Top-5 acc 79.688 (79.390)	lr 0.01585
Train [50][2110/3239]	Time 0.235 (0.717)	Data Time 0.001 (0.231)	Loss 2.9307 (2.7612)	Entropy 0.64200 (0.64121)	Top-1 acc 53.516 (57.411)	Top-5 acc 75.781 (79.387)	lr 0.01585
Train [50][2120/3239]	Time 0.238 (0.715)	Data Time 0.001 (0.230)	Loss 2.8561 (2.7612)	Entropy 0.64204 (0.64121)	Top-1 acc 58.984 (57.408)	Top-5 acc 78.516 (79.391)	lr 0.01584
Train [50][2130/3239]	Time 0.255 (0.716)	Data Time 0.001 (0.232)	Loss 2.6000 (2.7613)	Entropy 0.64211 (0.64121)	Top-1 acc 57.812 (57.405)	Top-5 acc 83.594 (79.390)	lr 0.01584
Train [50][2140/3239]	Time 14.542 (0.726)	Data Time 14.315 (0.242)	Loss 2.7240 (2.7615)	Entropy 0.64237 (0.64122)	Top-1 acc 61.328 (57.404)	Top-5 acc 80.469 (79.384)	lr 0.01584
Train [50][2150/3239]	Time 0.245 (0.725)	Data Time 0.001 (0.241)	Loss 2.6675 (2.7616)	Entropy 0.64242 (0.64122)	Top-1 acc 60.547 (57.401)	Top-5 acc 81.250 (79.380)	lr 0.01584
Train [50][2160/3239]	Time 1.827 (0.725)	Data Time 1.576 (0.242)	Loss 2.9366 (2.7620)	Entropy 0.64196 (0.64123)	Top-1 acc 49.609 (57.395)	Top-5 acc 76.953 (79.370)	lr 0.01584
Train [50][2170/3239]	Time 0.246 (0.729)	Data Time 0.001 (0.246)	Loss 2.6709 (2.7620)	Entropy 0.64192 (0.64123)	Top-1 acc 60.938 (57.392)	Top-5 acc 81.641 (79.370)	lr 0.01584
Train [50][2180/3239]	Time 0.238 (0.732)	Data Time 0.001 (0.249)	Loss 2.7360 (2.7617)	Entropy 0.64199 (0.64123)	Top-1 acc 56.641 (57.398)	Top-5 acc 80.469 (79.376)	lr 0.01584
Train [50][2190/3239]	Time 4.898 (0.733)	Data Time 4.646 (0.250)	Loss 3.1508 (2.7621)	Entropy 0.64179 (0.64124)	Top-1 acc 49.219 (57.392)	Top-5 acc 73.438 (79.366)	lr 0.01584
Train [50][2200/3239]	Time 9.385 (0.736)	Data Time 9.097 (0.253)	Loss 2.6647 (2.7623)	Entropy 0.64184 (0.64124)	Top-1 acc 60.938 (57.390)	Top-5 acc 80.469 (79.364)	lr 0.01584
Train [50][2210/3239]	Time 0.243 (0.741)	Data Time 0.001 (0.260)	Loss 2.5278 (2.7622)	Entropy 0.64197 (0.64124)	Top-1 acc 63.281 (57.396)	Top-5 acc 82.031 (79.365)	lr 0.01584
Train [50][2220/3239]	Time 0.233 (0.740)	Data Time 0.001 (0.258)	Loss 2.5792 (2.7621)	Entropy 0.64169 (0.64124)	Top-1 acc 63.281 (57.398)	Top-5 acc 83.984 (79.368)	lr 0.01583
Train [50][2230/3239]	Time 0.220 (0.740)	Data Time 0.001 (0.259)	Loss 3.0375 (2.7623)	Entropy 0.64213 (0.64125)	Top-1 acc 47.266 (57.394)	Top-5 acc 76.172 (79.367)	lr 0.01583
Train [50][2240/3239]	Time 0.334 (0.749)	Data Time 0.001 (0.268)	Loss 2.7286 (2.7624)	Entropy 0.64213 (0.64125)	Top-1 acc 58.594 (57.393)	Top-5 acc 77.734 (79.362)	lr 0.01583
Train [50][2250/3239]	Time 0.227 (0.748)	Data Time 0.001 (0.267)	Loss 2.9006 (2.7626)	Entropy 0.64184 (0.64126)	Top-1 acc 53.906 (57.385)	Top-5 acc 79.297 (79.356)	lr 0.01583
Train [50][2260/3239]	Time 0.273 (0.750)	Data Time 0.001 (0.270)	Loss 2.6643 (2.7625)	Entropy 0.64214 (0.64126)	Top-1 acc 58.594 (57.387)	Top-5 acc 80.859 (79.361)	lr 0.01583
Train [50][2270/3239]	Time 0.251 (0.757)	Data Time 0.001 (0.277)	Loss 2.8408 (2.7626)	Entropy 0.64189 (0.64126)	Top-1 acc 53.906 (57.385)	Top-5 acc 76.172 (79.354)	lr 0.01583
Train [50][2280/3239]	Time 0.239 (0.755)	Data Time 0.001 (0.276)	Loss 2.7238 (2.7625)	Entropy 0.64196 (0.64126)	Top-1 acc 55.469 (57.386)	Top-5 acc 79.688 (79.357)	lr 0.01583
Train [50][2290/3239]	Time 0.261 (0.757)	Data Time 0.002 (0.277)	Loss 2.9906 (2.7628)	Entropy 0.64210 (0.64127)	Top-1 acc 54.297 (57.379)	Top-5 acc 71.094 (79.348)	lr 0.01583
Train [50][2300/3239]	Time 15.059 (0.765)	Data Time 14.809 (0.286)	Loss 2.6394 (2.7627)	Entropy 0.64199 (0.64127)	Top-1 acc 57.812 (57.380)	Top-5 acc 80.859 (79.349)	lr 0.01583
Train [50][2310/3239]	Time 0.317 (0.763)	Data Time 0.001 (0.284)	Loss 2.7271 (2.7628)	Entropy 0.64206 (0.64127)	Top-1 acc 60.156 (57.382)	Top-5 acc 81.250 (79.349)	lr 0.01583
Train [50][2320/3239]	Time 0.238 (0.766)	Data Time 0.001 (0.288)	Loss 2.7623 (2.7630)	Entropy 0.64221 (0.64128)	Top-1 acc 57.422 (57.377)	Top-5 acc 77.734 (79.340)	lr 0.01582
Train [50][2330/3239]	Time 0.238 (0.766)	Data Time 0.001 (0.288)	Loss 2.8615 (2.7629)	Entropy 0.64264 (0.64128)	Top-1 acc 55.078 (57.376)	Top-5 acc 75.781 (79.338)	lr 0.01582
Train [50][2340/3239]	Time 0.381 (0.785)	Data Time 0.007 (0.294)	Loss 2.7608 (2.7630)	Entropy 0.64170 (0.64129)	Top-1 acc 59.375 (57.373)	Top-5 acc 79.688 (79.336)	lr 0.01582
Train [50][2350/3239]	Time 0.233 (0.784)	Data Time 0.002 (0.292)	Loss 2.9508 (2.7631)	Entropy 0.64176 (0.64129)	Top-1 acc 55.859 (57.372)	Top-5 acc 75.000 (79.337)	lr 0.01582
Train [50][2360/3239]	Time 0.231 (0.783)	Data Time 0.001 (0.291)	Loss 2.7463 (2.7630)	Entropy 0.64148 (0.64129)	Top-1 acc 55.859 (57.373)	Top-5 acc 78.516 (79.338)	lr 0.01582
Train [50][2370/3239]	Time 0.285 (0.781)	Data Time 0.004 (0.290)	Loss 2.9105 (2.7628)	Entropy 0.64174 (0.64129)	Top-1 acc 49.219 (57.379)	Top-5 acc 76.953 (79.341)	lr 0.01582
Train [50][2380/3239]	Time 0.230 (0.780)	Data Time 0.001 (0.289)	Loss 2.9140 (2.7630)	Entropy 0.64182 (0.64129)	Top-1 acc 53.906 (57.377)	Top-5 acc 76.562 (79.334)	lr 0.01582
Train [50][2390/3239]	Time 0.231 (0.778)	Data Time 0.001 (0.288)	Loss 2.8232 (2.7627)	Entropy 0.64191 (0.64130)	Top-1 acc 54.297 (57.383)	Top-5 acc 78.125 (79.338)	lr 0.01582
Train [50][2400/3239]	Time 0.337 (0.783)	Data Time 0.001 (0.293)	Loss 2.6161 (2.7627)	Entropy 0.64176 (0.64130)	Top-1 acc 63.281 (57.385)	Top-5 acc 79.688 (79.337)	lr 0.01582
Train [50][2410/3239]	Time 0.251 (0.782)	Data Time 0.001 (0.292)	Loss 2.6294 (2.7625)	Entropy 0.64180 (0.64130)	Top-1 acc 59.375 (57.394)	Top-5 acc 82.031 (79.340)	lr 0.01582
Train [50][2420/3239]	Time 0.258 (0.783)	Data Time 0.001 (0.293)	Loss 2.6514 (2.7624)	Entropy 0.64183 (0.64130)	Top-1 acc 61.719 (57.399)	Top-5 acc 79.297 (79.341)	lr 0.01582
Train [50][2430/3239]	Time 0.249 (0.789)	Data Time 0.001 (0.299)	Loss 2.7654 (2.7622)	Entropy 0.64144 (0.64130)	Top-1 acc 55.859 (57.405)	Top-5 acc 81.250 (79.346)	lr 0.01581
Train [50][2440/3239]	Time 0.254 (0.787)	Data Time 0.001 (0.298)	Loss 2.9206 (2.7621)	Entropy 0.64170 (0.64130)	Top-1 acc 54.297 (57.410)	Top-5 acc 75.391 (79.347)	lr 0.01581
Train [50][2450/3239]	Time 0.237 (0.790)	Data Time 0.001 (0.300)	Loss 2.6422 (2.7620)	Entropy 0.64151 (0.64131)	Top-1 acc 57.031 (57.410)	Top-5 acc 81.641 (79.348)	lr 0.01581
Train [50][2460/3239]	Time 6.515 (0.794)	Data Time 6.273 (0.305)	Loss 2.8621 (2.7619)	Entropy 0.64147 (0.64131)	Top-1 acc 52.344 (57.414)	Top-5 acc 74.609 (79.344)	lr 0.01581
Train [50][2470/3239]	Time 0.394 (0.794)	Data Time 0.001 (0.305)	Loss 3.0371 (2.7620)	Entropy 0.64146 (0.64131)	Top-1 acc 53.906 (57.420)	Top-5 acc 73.047 (79.344)	lr 0.01581
Train [50][2480/3239]	Time 7.959 (0.798)	Data Time 7.704 (0.310)	Loss 2.7407 (2.7618)	Entropy 0.64130 (0.64131)	Top-1 acc 57.422 (57.420)	Top-5 acc 79.297 (79.346)	lr 0.01581
Train [50][2490/3239]	Time 0.231 (0.797)	Data Time 0.001 (0.309)	Loss 2.7559 (2.7618)	Entropy 0.64138 (0.64131)	Top-1 acc 59.375 (57.423)	Top-5 acc 79.297 (79.346)	lr 0.01581
Train [50][2500/3239]	Time 0.260 (0.800)	Data Time 0.001 (0.312)	Loss 2.7242 (2.7617)	Entropy 0.64178 (0.64131)	Top-1 acc 58.203 (57.427)	Top-5 acc 76.953 (79.345)	lr 0.01581
Train [50][2510/3239]	Time 1.479 (0.800)	Data Time 1.220 (0.312)	Loss 2.6772 (2.7616)	Entropy 0.64196 (0.64131)	Top-1 acc 59.375 (57.431)	Top-5 acc 79.688 (79.345)	lr 0.01581
Train [50][2520/3239]	Time 0.271 (0.803)	Data Time 0.001 (0.315)	Loss 2.7842 (2.7615)	Entropy 0.64214 (0.64131)	Top-1 acc 58.203 (57.434)	Top-5 acc 80.469 (79.346)	lr 0.01581
Train [50][2530/3239]	Time 0.230 (0.805)	Data Time 0.001 (0.318)	Loss 2.9089 (2.7613)	Entropy 0.64208 (0.64132)	Top-1 acc 52.734 (57.437)	Top-5 acc 74.609 (79.348)	lr 0.01580
Train [50][2540/3239]	Time 0.237 (0.806)	Data Time 0.001 (0.319)	Loss 2.8979 (2.7616)	Entropy 0.64240 (0.64132)	Top-1 acc 53.906 (57.436)	Top-5 acc 77.734 (79.345)	lr 0.01580
Train [50][2550/3239]	Time 0.254 (0.808)	Data Time 0.001 (0.321)	Loss 2.8385 (2.7616)	Entropy 0.64248 (0.64132)	Top-1 acc 55.078 (57.434)	Top-5 acc 77.734 (79.347)	lr 0.01580
Train [50][2560/3239]	Time 0.330 (0.810)	Data Time 0.002 (0.323)	Loss 2.9283 (2.7620)	Entropy 0.64161 (0.64133)	Top-1 acc 51.172 (57.426)	Top-5 acc 78.516 (79.340)	lr 0.01580
Train [50][2570/3239]	Time 0.234 (0.811)	Data Time 0.001 (0.325)	Loss 2.8844 (2.7621)	Entropy 0.64154 (0.64133)	Top-1 acc 58.594 (57.425)	Top-5 acc 75.781 (79.334)	lr 0.01580
Train [50][2580/3239]	Time 0.277 (0.812)	Data Time 0.003 (0.326)	Loss 2.6532 (2.7621)	Entropy 0.64166 (0.64133)	Top-1 acc 57.031 (57.425)	Top-5 acc 82.031 (79.333)	lr 0.01580
Train [50][2590/3239]	Time 0.239 (0.816)	Data Time 0.001 (0.330)	Loss 2.6229 (2.7622)	Entropy 0.64141 (0.64133)	Top-1 acc 62.109 (57.419)	Top-5 acc 83.594 (79.332)	lr 0.01580
Train [50][2600/3239]	Time 0.233 (0.816)	Data Time 0.001 (0.331)	Loss 2.8106 (2.7623)	Entropy 0.64139 (0.64133)	Top-1 acc 52.734 (57.419)	Top-5 acc 77.734 (79.328)	lr 0.01580
Train [50][2610/3239]	Time 0.257 (0.818)	Data Time 0.001 (0.332)	Loss 2.8979 (2.7623)	Entropy 0.64158 (0.64133)	Top-1 acc 55.469 (57.419)	Top-5 acc 78.125 (79.328)	lr 0.01580
Train [50][2620/3239]	Time 2.318 (0.820)	Data Time 2.051 (0.335)	Loss 2.5723 (2.7624)	Entropy 0.64176 (0.64133)	Top-1 acc 59.375 (57.415)	Top-5 acc 85.156 (79.329)	lr 0.01580
Train [50][2630/3239]	Time 0.342 (0.821)	Data Time 0.001 (0.336)	Loss 2.6574 (2.7626)	Entropy 0.64188 (0.64133)	Top-1 acc 59.375 (57.413)	Top-5 acc 78.906 (79.323)	lr 0.01579
Train [50][2640/3239]	Time 6.586 (0.822)	Data Time 6.289 (0.338)	Loss 2.6035 (2.7625)	Entropy 0.64215 (0.64134)	Top-1 acc 59.766 (57.413)	Top-5 acc 80.469 (79.325)	lr 0.01579
Train [50][2650/3239]	Time 0.265 (0.825)	Data Time 0.001 (0.341)	Loss 2.9569 (2.7625)	Entropy 0.64235 (0.64134)	Top-1 acc 48.828 (57.411)	Top-5 acc 76.953 (79.325)	lr 0.01579
Train [50][2660/3239]	Time 0.278 (0.826)	Data Time 0.001 (0.342)	Loss 2.9590 (2.7629)	Entropy 0.64238 (0.64134)	Top-1 acc 50.781 (57.401)	Top-5 acc 73.047 (79.315)	lr 0.01579
Train [50][2670/3239]	Time 0.234 (0.824)	Data Time 0.001 (0.341)	Loss 2.7864 (2.7629)	Entropy 0.64242 (0.64135)	Top-1 acc 62.109 (57.405)	Top-5 acc 79.297 (79.314)	lr 0.01579
Train [50][2680/3239]	Time 8.177 (0.829)	Data Time 7.932 (0.345)	Loss 2.7564 (2.7630)	Entropy 0.64245 (0.64135)	Top-1 acc 58.203 (57.405)	Top-5 acc 76.953 (79.312)	lr 0.01579
Train [50][2690/3239]	Time 0.221 (0.832)	Data Time 0.001 (0.348)	Loss 3.0136 (2.7631)	Entropy 0.64270 (0.64136)	Top-1 acc 51.172 (57.406)	Top-5 acc 76.562 (79.309)	lr 0.01579
Train [50][2700/3239]	Time 0.239 (0.830)	Data Time 0.001 (0.347)	Loss 2.6360 (2.7629)	Entropy 0.64278 (0.64136)	Top-1 acc 58.984 (57.407)	Top-5 acc 83.594 (79.314)	lr 0.01579
Train [50][2710/3239]	Time 0.250 (0.830)	Data Time 0.001 (0.348)	Loss 2.7873 (2.7629)	Entropy 0.64313 (0.64137)	Top-1 acc 53.906 (57.404)	Top-5 acc 80.469 (79.316)	lr 0.01579
Train [50][2720/3239]	Time 0.286 (0.833)	Data Time 0.001 (0.350)	Loss 2.8905 (2.7628)	Entropy 0.64312 (0.64137)	Top-1 acc 53.906 (57.408)	Top-5 acc 76.953 (79.318)	lr 0.01579
Train [50][2730/3239]	Time 0.231 (0.837)	Data Time 0.001 (0.354)	Loss 2.7860 (2.7629)	Entropy 0.64299 (0.64138)	Top-1 acc 55.078 (57.407)	Top-5 acc 78.516 (79.316)	lr 0.01578
Train [50][2740/3239]	Time 0.239 (0.835)	Data Time 0.001 (0.353)	Loss 2.8405 (2.7630)	Entropy 0.64306 (0.64139)	Top-1 acc 58.984 (57.402)	Top-5 acc 78.516 (79.314)	lr 0.01578
Train [50][2750/3239]	Time 0.240 (0.838)	Data Time 0.001 (0.356)	Loss 2.7856 (2.7629)	Entropy 0.64279 (0.64139)	Top-1 acc 56.641 (57.404)	Top-5 acc 78.516 (79.317)	lr 0.01578
Train [50][2760/3239]	Time 0.234 (0.842)	Data Time 0.001 (0.361)	Loss 2.6356 (2.7629)	Entropy 0.64282 (0.64140)	Top-1 acc 62.891 (57.405)	Top-5 acc 79.688 (79.315)	lr 0.01578
Train [50][2770/3239]	Time 0.249 (0.841)	Data Time 0.001 (0.359)	Loss 2.7254 (2.7631)	Entropy 0.64281 (0.64140)	Top-1 acc 58.203 (57.403)	Top-5 acc 80.469 (79.314)	lr 0.01578
Train [50][2780/3239]	Time 5.237 (0.843)	Data Time 4.987 (0.362)	Loss 2.6962 (2.7633)	Entropy 0.64271 (0.64141)	Top-1 acc 57.422 (57.396)	Top-5 acc 79.688 (79.310)	lr 0.01578
Train [50][2790/3239]	Time 0.350 (0.848)	Data Time 0.001 (0.367)	Loss 2.8071 (2.7631)	Entropy 0.64263 (0.64141)	Top-1 acc 57.812 (57.401)	Top-5 acc 76.172 (79.311)	lr 0.01578
Train [50][2800/3239]	Time 0.233 (0.846)	Data Time 0.001 (0.366)	Loss 2.5438 (2.7631)	Entropy 0.64271 (0.64142)	Top-1 acc 60.938 (57.402)	Top-5 acc 82.812 (79.310)	lr 0.01578
Train [50][2810/3239]	Time 0.247 (0.847)	Data Time 0.001 (0.367)	Loss 2.7534 (2.7632)	Entropy 0.64266 (0.64142)	Top-1 acc 56.250 (57.400)	Top-5 acc 78.906 (79.308)	lr 0.01578
Train [50][2820/3239]	Time 0.251 (0.852)	Data Time 0.001 (0.372)	Loss 2.7893 (2.7633)	Entropy 0.64267 (0.64142)	Top-1 acc 57.812 (57.397)	Top-5 acc 77.734 (79.306)	lr 0.01578
Train [50][2830/3239]	Time 0.231 (0.851)	Data Time 0.001 (0.371)	Loss 2.6362 (2.7635)	Entropy 0.64255 (0.64143)	Top-1 acc 58.594 (57.396)	Top-5 acc 81.641 (79.305)	lr 0.01578
Train [50][2840/3239]	Time 7.660 (0.852)	Data Time 7.418 (0.372)	Loss 2.6243 (2.7634)	Entropy 0.64263 (0.64143)	Top-1 acc 58.984 (57.397)	Top-5 acc 83.594 (79.307)	lr 0.01577
Train [50][2850/3239]	Time 0.231 (0.857)	Data Time 0.001 (0.377)	Loss 2.8607 (2.7634)	Entropy 0.64300 (0.64144)	Top-1 acc 55.078 (57.398)	Top-5 acc 79.688 (79.306)	lr 0.01577
Train [50][2860/3239]	Time 0.354 (0.855)	Data Time 0.001 (0.376)	Loss 2.7952 (2.7633)	Entropy 0.64302 (0.64144)	Top-1 acc 59.375 (57.403)	Top-5 acc 78.906 (79.308)	lr 0.01577
Train [50][2870/3239]	Time 0.251 (0.855)	Data Time 0.001 (0.375)	Loss 2.7113 (2.7630)	Entropy 0.64318 (0.64145)	Top-1 acc 56.250 (57.412)	Top-5 acc 80.859 (79.314)	lr 0.01577
Train [50][2880/3239]	Time 0.238 (0.856)	Data Time 0.001 (0.377)	Loss 2.8038 (2.7630)	Entropy 0.64344 (0.64145)	Top-1 acc 56.250 (57.412)	Top-5 acc 78.125 (79.315)	lr 0.01577
Train [50][2890/3239]	Time 0.232 (0.861)	Data Time 0.001 (0.382)	Loss 2.6428 (2.7631)	Entropy 0.64355 (0.64146)	Top-1 acc 57.812 (57.407)	Top-5 acc 84.375 (79.313)	lr 0.01577
Train [50][2900/3239]	Time 0.230 (0.859)	Data Time 0.001 (0.381)	Loss 2.7886 (2.7631)	Entropy 0.64360 (0.64147)	Top-1 acc 53.516 (57.406)	Top-5 acc 78.125 (79.315)	lr 0.01577
Train [50][2910/3239]	Time 0.239 (0.860)	Data Time 0.001 (0.382)	Loss 2.8273 (2.7631)	Entropy 0.64327 (0.64148)	Top-1 acc 54.688 (57.408)	Top-5 acc 79.688 (79.316)	lr 0.01577
Train [50][2920/3239]	Time 0.264 (0.864)	Data Time 0.002 (0.386)	Loss 2.8758 (2.7629)	Entropy 0.64323 (0.64148)	Top-1 acc 54.688 (57.416)	Top-5 acc 76.953 (79.319)	lr 0.01577
Train [50][2930/3239]	Time 0.268 (0.863)	Data Time 0.001 (0.385)	Loss 2.7924 (2.7628)	Entropy 0.64335 (0.64149)	Top-1 acc 59.375 (57.423)	Top-5 acc 79.688 (79.323)	lr 0.01577
Train [50][2940/3239]	Time 0.270 (0.862)	Data Time 0.002 (0.384)	Loss 2.8656 (2.7627)	Entropy 0.64286 (0.64150)	Top-1 acc 58.984 (57.426)	Top-5 acc 78.125 (79.326)	lr 0.01576
Train [50][2950/3239]	Time 0.371 (0.864)	Data Time 0.001 (0.387)	Loss 2.7807 (2.7628)	Entropy 0.64321 (0.64150)	Top-1 acc 58.984 (57.424)	Top-5 acc 79.688 (79.325)	lr 0.01576
Train [50][2960/3239]	Time 0.280 (0.863)	Data Time 0.002 (0.386)	Loss 2.7361 (2.7627)	Entropy 0.64284 (0.64151)	Top-1 acc 61.328 (57.427)	Top-5 acc 78.906 (79.328)	lr 0.01576
Train [50][2970/3239]	Time 0.236 (0.861)	Data Time 0.001 (0.384)	Loss 2.7688 (2.7627)	Entropy 0.64263 (0.64151)	Top-1 acc 59.766 (57.428)	Top-5 acc 78.906 (79.327)	lr 0.01576
Train [50][2980/3239]	Time 0.250 (0.867)	Data Time 0.001 (0.390)	Loss 2.8222 (2.7626)	Entropy 0.64266 (0.64151)	Top-1 acc 56.250 (57.432)	Top-5 acc 78.906 (79.328)	lr 0.01576
Train [50][2990/3239]	Time 0.237 (0.865)	Data Time 0.001 (0.388)	Loss 2.7909 (2.7628)	Entropy 0.64280 (0.64152)	Top-1 acc 57.812 (57.427)	Top-5 acc 78.906 (79.322)	lr 0.01576
Train [50][3000/3239]	Time 0.266 (0.875)	Data Time 0.002 (0.387)	Loss 2.8256 (2.7627)	Entropy 0.64305 (0.64152)	Top-1 acc 57.031 (57.431)	Top-5 acc 78.125 (79.323)	lr 0.01576
Train [50][3010/3239]	Time 0.239 (0.874)	Data Time 0.001 (0.386)	Loss 2.7306 (2.7628)	Entropy 0.64337 (0.64153)	Top-1 acc 57.422 (57.427)	Top-5 acc 80.469 (79.325)	lr 0.01576
Train [50][3020/3239]	Time 0.249 (0.872)	Data Time 0.001 (0.384)	Loss 2.6594 (2.7627)	Entropy 0.64275 (0.64153)	Top-1 acc 56.641 (57.424)	Top-5 acc 83.984 (79.328)	lr 0.01576
Train [50][3030/3239]	Time 0.259 (0.871)	Data Time 0.001 (0.383)	Loss 2.6907 (2.7629)	Entropy 0.64259 (0.64154)	Top-1 acc 58.594 (57.420)	Top-5 acc 80.859 (79.328)	lr 0.01576
Train [50][3040/3239]	Time 0.299 (0.869)	Data Time 0.001 (0.382)	Loss 2.5493 (2.7626)	Entropy 0.64238 (0.64154)	Top-1 acc 60.938 (57.428)	Top-5 acc 86.328 (79.335)	lr 0.01575
Train [50][3050/3239]	Time 0.239 (0.874)	Data Time 0.002 (0.386)	Loss 2.6656 (2.7625)	Entropy 0.64255 (0.64154)	Top-1 acc 60.156 (57.431)	Top-5 acc 82.812 (79.337)	lr 0.01575
Train [50][3060/3239]	Time 0.233 (0.872)	Data Time 0.001 (0.385)	Loss 2.6823 (2.7624)	Entropy 0.64273 (0.64155)	Top-1 acc 59.375 (57.434)	Top-5 acc 80.078 (79.339)	lr 0.01575
Train [50][3070/3239]	Time 0.277 (0.872)	Data Time 0.001 (0.385)	Loss 2.6805 (2.7626)	Entropy 0.64274 (0.64155)	Top-1 acc 55.469 (57.429)	Top-5 acc 80.078 (79.334)	lr 0.01575
Train [50][3080/3239]	Time 0.258 (0.879)	Data Time 0.001 (0.392)	Loss 2.6454 (2.7625)	Entropy 0.64251 (0.64155)	Top-1 acc 57.422 (57.431)	Top-5 acc 84.375 (79.333)	lr 0.01575
Train [50][3090/3239]	Time 0.251 (0.877)	Data Time 0.001 (0.390)	Loss 2.7730 (2.7624)	Entropy 0.64247 (0.64156)	Top-1 acc 57.031 (57.432)	Top-5 acc 76.172 (79.333)	lr 0.01575
Train [50][3100/3239]	Time 2.113 (0.876)	Data Time 1.815 (0.390)	Loss 2.8258 (2.7625)	Entropy 0.64267 (0.64156)	Top-1 acc 56.250 (57.433)	Top-5 acc 80.078 (79.330)	lr 0.01575
Train [50][3110/3239]	Time 0.397 (0.879)	Data Time 0.001 (0.392)	Loss 2.8393 (2.7626)	Entropy 0.64284 (0.64156)	Top-1 acc 53.906 (57.433)	Top-5 acc 78.125 (79.328)	lr 0.01575
Train [50][3120/3239]	Time 0.248 (0.877)	Data Time 0.001 (0.391)	Loss 2.6793 (2.7626)	Entropy 0.64306 (0.64157)	Top-1 acc 58.984 (57.432)	Top-5 acc 82.812 (79.326)	lr 0.01575
Train [50][3130/3239]	Time 0.242 (0.876)	Data Time 0.001 (0.390)	Loss 2.6133 (2.7624)	Entropy 0.64289 (0.64157)	Top-1 acc 59.766 (57.434)	Top-5 acc 83.203 (79.330)	lr 0.01575
Train [50][3140/3239]	Time 0.248 (0.879)	Data Time 0.001 (0.392)	Loss 2.8482 (2.7624)	Entropy 0.64285 (0.64158)	Top-1 acc 53.516 (57.434)	Top-5 acc 78.125 (79.330)	lr 0.01574
Train [50][3150/3239]	Time 0.253 (0.877)	Data Time 0.001 (0.391)	Loss 2.9225 (2.7624)	Entropy 0.64269 (0.64158)	Top-1 acc 53.516 (57.432)	Top-5 acc 79.688 (79.335)	lr 0.01574
Train [50][3160/3239]	Time 0.239 (0.876)	Data Time 0.001 (0.390)	Loss 2.8507 (2.7622)	Entropy 0.64264 (0.64158)	Top-1 acc 56.641 (57.435)	Top-5 acc 80.078 (79.340)	lr 0.01574
Train [50][3170/3239]	Time 0.238 (0.878)	Data Time 0.001 (0.392)	Loss 2.7691 (2.7621)	Entropy 0.64228 (0.64159)	Top-1 acc 59.766 (57.440)	Top-5 acc 77.734 (79.342)	lr 0.01574
Train [50][3180/3239]	Time 0.430 (0.877)	Data Time 0.000 (0.391)	Loss 2.7769 (2.7622)	Entropy 0.64249 (0.64159)	Top-1 acc 57.812 (57.436)	Top-5 acc 76.953 (79.341)	lr 0.01574
Train [50][3190/3239]	Time 0.249 (0.876)	Data Time 0.000 (0.390)	Loss 2.7183 (2.7622)	Entropy 0.64274 (0.64159)	Top-1 acc 54.688 (57.435)	Top-5 acc 80.859 (79.340)	lr 0.01574
Train [50][3200/3239]	Time 0.264 (0.874)	Data Time 0.000 (0.389)	Loss 2.7578 (2.7621)	Entropy 0.64291 (0.64160)	Top-1 acc 57.812 (57.439)	Top-5 acc 78.125 (79.341)	lr 0.01574
Train [50][3210/3239]	Time 0.253 (0.876)	Data Time 0.000 (0.391)	Loss 2.8156 (2.7622)	Entropy 0.64282 (0.64160)	Top-1 acc 57.031 (57.436)	Top-5 acc 79.297 (79.341)	lr 0.01574
Train [50][3220/3239]	Time 0.255 (0.875)	Data Time 0.000 (0.390)	Loss 2.4694 (2.7621)	Entropy 0.64293 (0.64160)	Top-1 acc 62.500 (57.436)	Top-5 acc 82.422 (79.339)	lr 0.01574
Train [50][3230/3239]	Time 0.223 (0.874)	Data Time 0.000 (0.389)	Loss 2.9162 (2.7623)	Entropy 0.64274 (0.64161)	Top-1 acc 53.125 (57.431)	Top-5 acc 75.781 (79.337)	lr 0.01574
Train [50][3239/3239]	Time 0.916 (0.872)	Data Time 0.000 (0.388)	Loss 2.7624 (2.7625)	Entropy 0.64264 (0.64161)	Top-1 acc 55.556 (57.428)	Top-5 acc 82.716 (79.336)	lr 0.01574
==========Valid [50/120]	loss 1.503	top-1 acc 65.742 (65.742)	top-5 acc 85.991	Train top-1 57.428	top-5 79.336	Entropy 0.64264	Latency-None: 0.000ms	Flops: 538.40M
Train [51][0/3239]	Time 46.491 (46.491)	Data Time 45.386 (45.386)	Loss 2.7011 (2.7011)	Entropy 0.64283 (0.64283)	Top-1 acc 58.984 (58.984)	Top-5 acc 81.250 (81.250)	lr 0.01574
Train [51][10/3239]	Time 0.332 (4.987)	Data Time 0.001 (4.398)	Loss 2.6413 (2.7119)	Entropy 0.64256 (0.64272)	Top-1 acc 60.547 (58.310)	Top-5 acc 81.641 (80.398)	lr 0.01573
Train [51][20/3239]	Time 0.253 (2.825)	Data Time 0.002 (2.304)	Loss 2.7117 (2.7134)	Entropy 0.64210 (0.64263)	Top-1 acc 60.547 (58.780)	Top-5 acc 81.641 (80.097)	lr 0.01573
Train [51][30/3239]	Time 0.270 (2.058)	Data Time 0.002 (1.562)	Loss 2.7968 (2.7447)	Entropy 0.64239 (0.64248)	Top-1 acc 53.906 (57.863)	Top-5 acc 77.344 (79.700)	lr 0.01573
Train [51][40/3239]	Time 0.259 (1.780)	Data Time 0.001 (1.285)	Loss 2.5909 (2.7500)	Entropy 0.64246 (0.64247)	Top-1 acc 61.719 (57.755)	Top-5 acc 83.984 (79.535)	lr 0.01573
Train [51][50/3239]	Time 0.263 (1.520)	Data Time 0.002 (1.034)	Loss 2.7548 (2.7323)	Entropy 0.64246 (0.64246)	Top-1 acc 55.859 (58.264)	Top-5 acc 80.469 (79.833)	lr 0.01573
Train [51][60/3239]	Time 0.264 (1.345)	Data Time 0.002 (0.865)	Loss 2.7381 (2.7384)	Entropy 0.64259 (0.64247)	Top-1 acc 55.469 (57.928)	Top-5 acc 78.125 (79.649)	lr 0.01573
Train [51][70/3239]	Time 0.290 (1.334)	Data Time 0.001 (0.845)	Loss 2.5452 (2.7415)	Entropy 0.64253 (0.64246)	Top-1 acc 61.328 (57.884)	Top-5 acc 84.766 (79.682)	lr 0.01573
Train [51][80/3239]	Time 0.256 (1.226)	Data Time 0.001 (0.741)	Loss 2.6877 (2.7414)	Entropy 0.64271 (0.64248)	Top-1 acc 58.594 (57.779)	Top-5 acc 82.031 (79.716)	lr 0.01573
Train [51][90/3239]	Time 0.258 (1.138)	Data Time 0.001 (0.660)	Loss 3.0581 (2.7442)	Entropy 0.64276 (0.64251)	Top-1 acc 49.219 (57.757)	Top-5 acc 70.703 (79.705)	lr 0.01573
Train [51][100/3239]	Time 0.350 (1.148)	Data Time 0.001 (0.672)	Loss 2.9941 (2.7552)	Entropy 0.64227 (0.64252)	Top-1 acc 53.125 (57.526)	Top-5 acc 73.828 (79.490)	lr 0.01573
Train [51][110/3239]	Time 0.246 (1.084)	Data Time 0.001 (0.612)	Loss 2.9491 (2.7578)	Entropy 0.64231 (0.64250)	Top-1 acc 53.125 (57.436)	Top-5 acc 76.172 (79.448)	lr 0.01572
Train [51][120/3239]	Time 0.241 (1.028)	Data Time 0.001 (0.561)	Loss 2.6033 (2.7556)	Entropy 0.64242 (0.64249)	Top-1 acc 59.766 (57.503)	Top-5 acc 83.594 (79.494)	lr 0.01572
Train [51][130/3239]	Time 0.266 (1.054)	Data Time 0.001 (0.591)	Loss 2.6349 (2.7499)	Entropy 0.64215 (0.64247)	Top-1 acc 59.766 (57.702)	Top-5 acc 80.859 (79.574)	lr 0.01572
Train [51][140/3239]	Time 0.245 (1.012)	Data Time 0.001 (0.550)	Loss 2.8369 (2.7481)	Entropy 0.64202 (0.64245)	Top-1 acc 58.203 (57.713)	Top-5 acc 78.125 (79.555)	lr 0.01572
Train [51][150/3239]	Time 0.242 (0.974)	Data Time 0.001 (0.514)	Loss 2.7336 (2.7466)	Entropy 0.64171 (0.64241)	Top-1 acc 57.812 (57.732)	Top-5 acc 81.641 (79.587)	lr 0.01572
Train [51][160/3239]	Time 8.011 (0.988)	Data Time 7.745 (0.530)	Loss 2.9415 (2.7475)	Entropy 0.64194 (0.64237)	Top-1 acc 53.516 (57.662)	Top-5 acc 76.562 (79.624)	lr 0.01572
Train [51][170/3239]	Time 0.358 (0.975)	Data Time 0.001 (0.518)	Loss 2.5867 (2.7430)	Entropy 0.64195 (0.64235)	Top-1 acc 60.938 (57.792)	Top-5 acc 82.031 (79.699)	lr 0.01572
Train [51][180/3239]	Time 0.234 (0.945)	Data Time 0.001 (0.489)	Loss 2.8807 (2.7441)	Entropy 0.64213 (0.64233)	Top-1 acc 57.812 (57.756)	Top-5 acc 75.781 (79.677)	lr 0.01572
Train [51][190/3239]	Time 0.252 (0.918)	Data Time 0.001 (0.464)	Loss 2.7214 (2.7432)	Entropy 0.64226 (0.64233)	Top-1 acc 53.906 (57.741)	Top-5 acc 81.641 (79.683)	lr 0.01572
Train [51][200/3239]	Time 0.297 (0.953)	Data Time 0.001 (0.496)	Loss 2.7862 (2.7443)	Entropy 0.64216 (0.64232)	Top-1 acc 57.812 (57.779)	Top-5 acc 79.688 (79.670)	lr 0.01572
Train [51][210/3239]	Time 0.268 (0.931)	Data Time 0.001 (0.475)	Loss 2.6422 (2.7433)	Entropy 0.64194 (0.64231)	Top-1 acc 60.156 (57.814)	Top-5 acc 81.250 (79.676)	lr 0.01571
Train [51][220/3239]	Time 0.263 (0.908)	Data Time 0.001 (0.453)	Loss 2.7813 (2.7447)	Entropy 0.64167 (0.64229)	Top-1 acc 58.984 (57.768)	Top-5 acc 78.125 (79.622)	lr 0.01571
Train [51][230/3239]	Time 0.289 (0.941)	Data Time 0.001 (0.488)	Loss 2.7197 (2.7430)	Entropy 0.64157 (0.64226)	Top-1 acc 56.641 (57.789)	Top-5 acc 77.344 (79.649)	lr 0.01571
Train [51][240/3239]	Time 0.318 (0.924)	Data Time 0.001 (0.472)	Loss 2.4983 (2.7368)	Entropy 0.64162 (0.64223)	Top-1 acc 65.234 (57.934)	Top-5 acc 83.594 (79.762)	lr 0.01571
Train [51][250/3239]	Time 0.231 (0.909)	Data Time 0.001 (0.459)	Loss 2.7040 (2.7368)	Entropy 0.64147 (0.64221)	Top-1 acc 61.328 (57.956)	Top-5 acc 80.078 (79.803)	lr 0.01571
Train [51][260/3239]	Time 0.240 (0.932)	Data Time 0.001 (0.482)	Loss 2.9117 (2.7383)	Entropy 0.64147 (0.64218)	Top-1 acc 53.906 (57.955)	Top-5 acc 76.953 (79.782)	lr 0.01571
Train [51][270/3239]	Time 0.231 (0.923)	Data Time 0.001 (0.474)	Loss 2.7915 (2.7390)	Entropy 0.64123 (0.64215)	Top-1 acc 58.203 (57.954)	Top-5 acc 76.562 (79.778)	lr 0.01571
Train [51][280/3239]	Time 0.255 (0.905)	Data Time 0.001 (0.457)	Loss 2.6445 (2.7382)	Entropy 0.64130 (0.64211)	Top-1 acc 61.719 (57.947)	Top-5 acc 80.859 (79.821)	lr 0.01571
Train [51][290/3239]	Time 0.266 (0.941)	Data Time 0.001 (0.494)	Loss 2.6318 (2.7371)	Entropy 0.64112 (0.64208)	Top-1 acc 57.812 (57.962)	Top-5 acc 81.250 (79.834)	lr 0.01571
Train [51][300/3239]	Time 0.239 (0.930)	Data Time 0.001 (0.484)	Loss 2.9106 (2.7389)	Entropy 0.64121 (0.64205)	Top-1 acc 58.594 (57.954)	Top-5 acc 73.828 (79.807)	lr 0.01571
Train [51][310/3239]	Time 0.239 (0.914)	Data Time 0.001 (0.469)	Loss 2.5157 (2.7385)	Entropy 0.64098 (0.64202)	Top-1 acc 60.938 (57.966)	Top-5 acc 83.594 (79.807)	lr 0.01570
Train [51][320/3239]	Time 13.446 (0.940)	Data Time 13.206 (0.495)	Loss 2.7126 (2.7400)	Entropy 0.64105 (0.64199)	Top-1 acc 57.031 (57.955)	Top-5 acc 81.641 (79.770)	lr 0.01570
Train [51][330/3239]	Time 0.401 (0.944)	Data Time 0.002 (0.500)	Loss 2.8752 (2.7412)	Entropy 0.64129 (0.64196)	Top-1 acc 53.516 (57.921)	Top-5 acc 77.344 (79.785)	lr 0.01570
Train [51][340/3239]	Time 0.253 (0.929)	Data Time 0.002 (0.485)	Loss 2.8245 (2.7399)	Entropy 0.64135 (0.64194)	Top-1 acc 56.250 (57.955)	Top-5 acc 79.688 (79.827)	lr 0.01570
Train [51][350/3239]	Time 0.244 (0.915)	Data Time 0.001 (0.472)	Loss 2.8691 (2.7397)	Entropy 0.64152 (0.64193)	Top-1 acc 54.688 (57.976)	Top-5 acc 77.734 (79.843)	lr 0.01570
Train [51][360/3239]	Time 0.227 (0.925)	Data Time 0.001 (0.481)	Loss 2.6529 (2.7392)	Entropy 0.64087 (0.64191)	Top-1 acc 59.375 (57.953)	Top-5 acc 81.250 (79.873)	lr 0.01570
Train [51][370/3239]	Time 0.243 (0.927)	Data Time 0.001 (0.485)	Loss 2.6730 (2.7385)	Entropy 0.64081 (0.64189)	Top-1 acc 62.500 (57.969)	Top-5 acc 78.125 (79.871)	lr 0.01570
Train [51][380/3239]	Time 0.263 (0.914)	Data Time 0.002 (0.472)	Loss 2.7906 (2.7374)	Entropy 0.64090 (0.64186)	Top-1 acc 56.250 (57.989)	Top-5 acc 77.344 (79.901)	lr 0.01570
Train [51][390/3239]	Time 0.236 (0.929)	Data Time 0.001 (0.488)	Loss 2.8533 (2.7388)	Entropy 0.64141 (0.64184)	Top-1 acc 59.375 (57.973)	Top-5 acc 77.344 (79.873)	lr 0.01570
Train [51][400/3239]	Time 0.345 (0.930)	Data Time 0.001 (0.489)	Loss 2.7565 (2.7401)	Entropy 0.64159 (0.64183)	Top-1 acc 55.859 (57.937)	Top-5 acc 81.250 (79.850)	lr 0.01570
Train [51][410/3239]	Time 0.560 (1.003)	Data Time 0.006 (0.478)	Loss 2.7191 (2.7390)	Entropy 0.64121 (0.64183)	Top-1 acc 58.984 (57.973)	Top-5 acc 80.859 (79.879)	lr 0.01570
Train [51][420/3239]	Time 0.286 (0.994)	Data Time 0.002 (0.466)	Loss 2.8073 (2.7387)	Entropy 0.64129 (0.64181)	Top-1 acc 53.125 (57.973)	Top-5 acc 80.859 (79.894)	lr 0.01569
Train [51][430/3239]	Time 0.246 (0.981)	Data Time 0.002 (0.456)	Loss 2.9104 (2.7385)	Entropy 0.64128 (0.64180)	Top-1 acc 53.516 (57.969)	Top-5 acc 75.781 (79.890)	lr 0.01569
Train [51][440/3239]	Time 0.242 (0.968)	Data Time 0.001 (0.445)	Loss 2.9047 (2.7384)	Entropy 0.64159 (0.64179)	Top-1 acc 54.297 (57.985)	Top-5 acc 77.344 (79.886)	lr 0.01569
Train [51][450/3239]	Time 0.251 (0.957)	Data Time 0.002 (0.435)	Loss 2.9702 (2.7381)	Entropy 0.64070 (0.64178)	Top-1 acc 55.469 (57.999)	Top-5 acc 76.953 (79.894)	lr 0.01569
Train [51][460/3239]	Time 0.236 (0.945)	Data Time 0.001 (0.426)	Loss 2.7502 (2.7389)	Entropy 0.64078 (0.64176)	Top-1 acc 58.594 (57.988)	Top-5 acc 77.344 (79.872)	lr 0.01569
Train [51][470/3239]	Time 0.242 (0.934)	Data Time 0.001 (0.417)	Loss 2.7993 (2.7390)	Entropy 0.64087 (0.64174)	Top-1 acc 55.859 (57.994)	Top-5 acc 80.469 (79.872)	lr 0.01569
Train [51][480/3239]	Time 2.704 (0.939)	Data Time 2.460 (0.424)	Loss 2.7685 (2.7395)	Entropy 0.64077 (0.64172)	Top-1 acc 58.984 (57.965)	Top-5 acc 79.688 (79.852)	lr 0.01569
Train [51][490/3239]	Time 0.389 (0.949)	Data Time 0.001 (0.436)	Loss 2.7531 (2.7387)	Entropy 0.64073 (0.64170)	Top-1 acc 55.859 (57.969)	Top-5 acc 78.906 (79.858)	lr 0.01569
Train [51][500/3239]	Time 0.238 (0.939)	Data Time 0.001 (0.427)	Loss 2.6123 (2.7402)	Entropy 0.64072 (0.64168)	Top-1 acc 60.938 (57.921)	Top-5 acc 82.031 (79.836)	lr 0.01569
Train [51][510/3239]	Time 0.743 (0.946)	Data Time 0.463 (0.437)	Loss 2.6460 (2.7397)	Entropy 0.64045 (0.64166)	Top-1 acc 60.547 (57.937)	Top-5 acc 82.031 (79.844)	lr 0.01569
Train [51][520/3239]	Time 0.276 (0.941)	Data Time 0.001 (0.432)	Loss 2.6897 (2.7388)	Entropy 0.64075 (0.64164)	Top-1 acc 60.156 (57.949)	Top-5 acc 80.859 (79.861)	lr 0.01568
Train [51][530/3239]	Time 0.242 (0.950)	Data Time 0.001 (0.442)	Loss 2.8460 (2.7393)	Entropy 0.64084 (0.64162)	Top-1 acc 52.734 (57.935)	Top-5 acc 80.469 (79.846)	lr 0.01568
Train [51][540/3239]	Time 1.028 (0.952)	Data Time 0.806 (0.446)	Loss 2.7368 (2.7393)	Entropy 0.64131 (0.64161)	Top-1 acc 58.203 (57.943)	Top-5 acc 78.906 (79.843)	lr 0.01568
Train [51][550/3239]	Time 1.077 (0.953)	Data Time 0.816 (0.447)	Loss 2.7792 (2.7392)	Entropy 0.64135 (0.64160)	Top-1 acc 55.859 (57.959)	Top-5 acc 81.250 (79.855)	lr 0.01568
Train [51][560/3239]	Time 0.336 (0.961)	Data Time 0.001 (0.457)	Loss 2.6705 (2.7379)	Entropy 0.64133 (0.64160)	Top-1 acc 57.031 (57.991)	Top-5 acc 81.641 (79.893)	lr 0.01568
Train [51][570/3239]	Time 0.234 (0.952)	Data Time 0.001 (0.450)	Loss 3.0730 (2.7387)	Entropy 0.64135 (0.64160)	Top-1 acc 53.125 (57.977)	Top-5 acc 74.219 (79.872)	lr 0.01568
Train [51][580/3239]	Time 0.253 (0.965)	Data Time 0.002 (0.463)	Loss 2.6806 (2.7387)	Entropy 0.64142 (0.64159)	Top-1 acc 60.156 (57.955)	Top-5 acc 80.078 (79.872)	lr 0.01568
Train [51][590/3239]	Time 0.242 (0.971)	Data Time 0.001 (0.471)	Loss 2.6904 (2.7391)	Entropy 0.64145 (0.64159)	Top-1 acc 57.031 (57.931)	Top-5 acc 81.641 (79.868)	lr 0.01568
Train [51][600/3239]	Time 0.245 (0.964)	Data Time 0.001 (0.465)	Loss 2.9571 (2.7397)	Entropy 0.64144 (0.64159)	Top-1 acc 53.516 (57.927)	Top-5 acc 78.125 (79.862)	lr 0.01568
Train [51][610/3239]	Time 1.607 (0.978)	Data Time 1.343 (0.481)	Loss 2.7677 (2.7399)	Entropy 0.64101 (0.64158)	Top-1 acc 53.125 (57.929)	Top-5 acc 79.688 (79.849)	lr 0.01568
Train [51][620/3239]	Time 0.235 (0.988)	Data Time 0.001 (0.492)	Loss 3.0603 (2.7404)	Entropy 0.64080 (0.64157)	Top-1 acc 49.609 (57.911)	Top-5 acc 76.953 (79.852)	lr 0.01567
Train [51][630/3239]	Time 0.227 (0.979)	Data Time 0.001 (0.484)	Loss 2.7410 (2.7399)	Entropy 0.64055 (0.64156)	Top-1 acc 59.766 (57.928)	Top-5 acc 81.641 (79.865)	lr 0.01567
Train [51][640/3239]	Time 3.478 (0.985)	Data Time 3.237 (0.491)	Loss 2.6173 (2.7403)	Entropy 0.64048 (0.64155)	Top-1 acc 59.766 (57.913)	Top-5 acc 78.906 (79.861)	lr 0.01567
Train [51][650/3239]	Time 0.351 (0.997)	Data Time 0.001 (0.505)	Loss 2.9894 (2.7411)	Entropy 0.64051 (0.64153)	Top-1 acc 51.172 (57.888)	Top-5 acc 78.125 (79.840)	lr 0.01567
Train [51][660/3239]	Time 0.245 (0.989)	Data Time 0.001 (0.497)	Loss 2.7408 (2.7413)	Entropy 0.64054 (0.64152)	Top-1 acc 55.859 (57.876)	Top-5 acc 80.859 (79.836)	lr 0.01567
Train [51][670/3239]	Time 0.825 (0.995)	Data Time 0.586 (0.504)	Loss 2.8673 (2.7415)	Entropy 0.64042 (0.64150)	Top-1 acc 56.250 (57.861)	Top-5 acc 79.688 (79.837)	lr 0.01567
Train [51][680/3239]	Time 0.261 (0.995)	Data Time 0.002 (0.505)	Loss 2.8504 (2.7421)	Entropy 0.64006 (0.64148)	Top-1 acc 55.859 (57.853)	Top-5 acc 78.906 (79.834)	lr 0.01567
Train [51][690/3239]	Time 0.247 (1.000)	Data Time 0.001 (0.511)	Loss 2.8076 (2.7417)	Entropy 0.63974 (0.64146)	Top-1 acc 52.734 (57.865)	Top-5 acc 81.250 (79.847)	lr 0.01567
Train [51][700/3239]	Time 5.607 (1.005)	Data Time 5.354 (0.517)	Loss 2.6623 (2.7412)	Entropy 0.63959 (0.64143)	Top-1 acc 57.812 (57.880)	Top-5 acc 81.641 (79.847)	lr 0.01567
Train [51][710/3239]	Time 0.250 (1.006)	Data Time 0.001 (0.518)	Loss 2.6242 (2.7406)	Entropy 0.63962 (0.64141)	Top-1 acc 62.109 (57.910)	Top-5 acc 82.812 (79.864)	lr 0.01567
Train [51][720/3239]	Time 0.348 (1.013)	Data Time 0.001 (0.527)	Loss 2.6516 (2.7401)	Entropy 0.63972 (0.64138)	Top-1 acc 59.766 (57.926)	Top-5 acc 80.859 (79.868)	lr 0.01566
Train [51][730/3239]	Time 0.256 (1.005)	Data Time 0.001 (0.519)	Loss 2.8761 (2.7416)	Entropy 0.63966 (0.64136)	Top-1 acc 53.906 (57.899)	Top-5 acc 75.000 (79.832)	lr 0.01566
Train [51][740/3239]	Time 0.243 (1.022)	Data Time 0.001 (0.537)	Loss 2.6254 (2.7407)	Entropy 0.63956 (0.64134)	Top-1 acc 63.281 (57.909)	Top-5 acc 83.203 (79.845)	lr 0.01566
Train [51][750/3239]	Time 0.266 (1.023)	Data Time 0.001 (0.539)	Loss 2.9584 (2.7401)	Entropy 0.63942 (0.64131)	Top-1 acc 56.250 (57.920)	Top-5 acc 78.906 (79.863)	lr 0.01566
Train [51][760/3239]	Time 0.239 (1.016)	Data Time 0.001 (0.533)	Loss 2.8068 (2.7403)	Entropy 0.63939 (0.64129)	Top-1 acc 56.250 (57.905)	Top-5 acc 79.297 (79.857)	lr 0.01566
Train [51][770/3239]	Time 0.238 (1.036)	Data Time 0.002 (0.553)	Loss 2.7657 (2.7399)	Entropy 0.63958 (0.64126)	Top-1 acc 57.422 (57.923)	Top-5 acc 76.562 (79.867)	lr 0.01566
Train [51][780/3239]	Time 0.257 (1.037)	Data Time 0.001 (0.556)	Loss 2.6442 (2.7398)	Entropy 0.63940 (0.64124)	Top-1 acc 59.375 (57.933)	Top-5 acc 82.812 (79.868)	lr 0.01566
Train [51][790/3239]	Time 0.228 (1.030)	Data Time 0.001 (0.549)	Loss 2.8188 (2.7401)	Entropy 0.63957 (0.64122)	Top-1 acc 56.641 (57.927)	Top-5 acc 80.469 (79.862)	lr 0.01566
Train [51][800/3239]	Time 0.220 (1.048)	Data Time 0.001 (0.568)	Loss 2.7242 (2.7412)	Entropy 0.63938 (0.64120)	Top-1 acc 56.250 (57.898)	Top-5 acc 80.469 (79.841)	lr 0.01566
Train [51][810/3239]	Time 0.243 (1.047)	Data Time 0.001 (0.568)	Loss 2.8600 (2.7406)	Entropy 0.63950 (0.64118)	Top-1 acc 53.125 (57.913)	Top-5 acc 78.906 (79.852)	lr 0.01566
Train [51][820/3239]	Time 0.244 (1.039)	Data Time 0.001 (0.561)	Loss 2.7448 (2.7402)	Entropy 0.63971 (0.64116)	Top-1 acc 56.250 (57.911)	Top-5 acc 77.734 (79.853)	lr 0.01566
Train [51][830/3239]	Time 15.586 (1.063)	Data Time 15.288 (0.585)	Loss 2.7901 (2.7408)	Entropy 0.63923 (0.64114)	Top-1 acc 55.469 (57.891)	Top-5 acc 79.688 (79.846)	lr 0.01565
Train [51][840/3239]	Time 0.249 (1.058)	Data Time 0.001 (0.581)	Loss 2.5919 (2.7405)	Entropy 0.63915 (0.64111)	Top-1 acc 58.984 (57.882)	Top-5 acc 83.984 (79.853)	lr 0.01565
Train [51][850/3239]	Time 0.244 (1.059)	Data Time 0.001 (0.583)	Loss 2.6766 (2.7404)	Entropy 0.63918 (0.64109)	Top-1 acc 62.109 (57.894)	Top-5 acc 80.078 (79.859)	lr 0.01565
Train [51][860/3239]	Time 0.249 (1.061)	Data Time 0.001 (0.586)	Loss 2.5638 (2.7407)	Entropy 0.63890 (0.64106)	Top-1 acc 62.500 (57.886)	Top-5 acc 81.641 (79.849)	lr 0.01565
Train [51][870/3239]	Time 0.238 (1.069)	Data Time 0.001 (0.594)	Loss 2.7956 (2.7410)	Entropy 0.63903 (0.64104)	Top-1 acc 57.422 (57.875)	Top-5 acc 80.469 (79.859)	lr 0.01565
Train [51][880/3239]	Time 0.323 (1.072)	Data Time 0.002 (0.598)	Loss 2.7786 (2.7423)	Entropy 0.63914 (0.64102)	Top-1 acc 57.031 (57.842)	Top-5 acc 80.078 (79.837)	lr 0.01565
Train [51][890/3239]	Time 0.254 (1.066)	Data Time 0.002 (0.592)	Loss 2.8476 (2.7429)	Entropy 0.63898 (0.64100)	Top-1 acc 55.078 (57.820)	Top-5 acc 76.172 (79.816)	lr 0.01565
Train [51][900/3239]	Time 0.253 (1.088)	Data Time 0.001 (0.614)	Loss 2.8928 (2.7428)	Entropy 0.63899 (0.64097)	Top-1 acc 55.078 (57.830)	Top-5 acc 76.562 (79.815)	lr 0.01565
Train [51][910/3239]	Time 0.255 (1.086)	Data Time 0.001 (0.613)	Loss 2.7284 (2.7429)	Entropy 0.63881 (0.64095)	Top-1 acc 58.594 (57.832)	Top-5 acc 80.859 (79.817)	lr 0.01565
Train [51][920/3239]	Time 0.260 (1.087)	Data Time 0.001 (0.614)	Loss 2.6837 (2.7426)	Entropy 0.63863 (0.64093)	Top-1 acc 58.984 (57.843)	Top-5 acc 80.469 (79.825)	lr 0.01565
Train [51][930/3239]	Time 1.858 (1.098)	Data Time 1.610 (0.626)	Loss 2.6949 (2.7419)	Entropy 0.63912 (0.64091)	Top-1 acc 58.594 (57.853)	Top-5 acc 80.859 (79.843)	lr 0.01564
Train [51][940/3239]	Time 0.244 (1.100)	Data Time 0.001 (0.629)	Loss 2.5782 (2.7419)	Entropy 0.63896 (0.64089)	Top-1 acc 60.547 (57.847)	Top-5 acc 86.719 (79.842)	lr 0.01564
Train [51][950/3239]	Time 0.338 (1.105)	Data Time 0.001 (0.634)	Loss 2.8322 (2.7421)	Entropy 0.63899 (0.64086)	Top-1 acc 61.328 (57.849)	Top-5 acc 76.953 (79.832)	lr 0.01564
Train [51][960/3239]	Time 0.243 (1.105)	Data Time 0.001 (0.635)	Loss 2.6744 (2.7421)	Entropy 0.63904 (0.64084)	Top-1 acc 60.547 (57.845)	Top-5 acc 78.516 (79.819)	lr 0.01564
Train [51][970/3239]	Time 0.241 (1.120)	Data Time 0.001 (0.651)	Loss 2.8747 (2.7429)	Entropy 0.63905 (0.64083)	Top-1 acc 52.734 (57.823)	Top-5 acc 77.344 (79.803)	lr 0.01564
Train [51][980/3239]	Time 0.237 (1.115)	Data Time 0.001 (0.646)	Loss 2.7648 (2.7428)	Entropy 0.63924 (0.64081)	Top-1 acc 57.031 (57.835)	Top-5 acc 79.688 (79.803)	lr 0.01564
Train [51][990/3239]	Time 4.802 (1.113)	Data Time 4.519 (0.644)	Loss 2.8188 (2.7429)	Entropy 0.63940 (0.64080)	Top-1 acc 53.906 (57.831)	Top-5 acc 79.688 (79.792)	lr 0.01564
Train [51][1000/3239]	Time 0.224 (1.114)	Data Time 0.001 (0.646)	Loss 3.0171 (2.7439)	Entropy 0.63937 (0.64078)	Top-1 acc 53.516 (57.824)	Top-5 acc 75.000 (79.768)	lr 0.01564
Train [51][1010/3239]	Time 0.281 (1.121)	Data Time 0.001 (0.653)	Loss 2.8675 (2.7439)	Entropy 0.63959 (0.64077)	Top-1 acc 51.172 (57.820)	Top-5 acc 78.906 (79.770)	lr 0.01564
Train [51][1020/3239]	Time 0.228 (1.114)	Data Time 0.001 (0.647)	Loss 2.7071 (2.7440)	Entropy 0.63961 (0.64076)	Top-1 acc 57.812 (57.812)	Top-5 acc 80.469 (79.772)	lr 0.01564
Train [51][1030/3239]	Time 0.238 (1.118)	Data Time 0.001 (0.651)	Loss 2.7893 (2.7445)	Entropy 0.63983 (0.64075)	Top-1 acc 57.812 (57.796)	Top-5 acc 80.078 (79.759)	lr 0.01563
Train [51][1040/3239]	Time 0.339 (1.125)	Data Time 0.001 (0.659)	Loss 2.6536 (2.7446)	Entropy 0.64003 (0.64074)	Top-1 acc 59.375 (57.803)	Top-5 acc 81.250 (79.767)	lr 0.01563
Train [51][1050/3239]	Time 0.234 (1.119)	Data Time 0.001 (0.653)	Loss 2.9492 (2.7445)	Entropy 0.63956 (0.64073)	Top-1 acc 54.688 (57.799)	Top-5 acc 73.828 (79.759)	lr 0.01563
Train [51][1060/3239]	Time 0.275 (1.122)	Data Time 0.001 (0.657)	Loss 2.6274 (2.7447)	Entropy 0.63908 (0.64072)	Top-1 acc 57.031 (57.798)	Top-5 acc 82.812 (79.756)	lr 0.01563
Train [51][1070/3239]	Time 0.299 (1.148)	Data Time 0.003 (0.651)	Loss 2.7429 (2.7445)	Entropy 0.63895 (0.64070)	Top-1 acc 58.984 (57.804)	Top-5 acc 78.516 (79.764)	lr 0.01563
Train [51][1080/3239]	Time 0.258 (1.142)	Data Time 0.002 (0.645)	Loss 2.9101 (2.7439)	Entropy 0.63891 (0.64069)	Top-1 acc 53.906 (57.819)	Top-5 acc 75.781 (79.771)	lr 0.01563
Train [51][1090/3239]	Time 0.230 (1.135)	Data Time 0.001 (0.639)	Loss 2.6160 (2.7437)	Entropy 0.63893 (0.64067)	Top-1 acc 63.281 (57.836)	Top-5 acc 81.641 (79.769)	lr 0.01563
Train [51][1100/3239]	Time 0.236 (1.136)	Data Time 0.002 (0.641)	Loss 2.7596 (2.7441)	Entropy 0.63833 (0.64065)	Top-1 acc 60.938 (57.824)	Top-5 acc 78.906 (79.758)	lr 0.01563
Train [51][1110/3239]	Time 0.347 (1.129)	Data Time 0.001 (0.635)	Loss 2.9468 (2.7440)	Entropy 0.63871 (0.64063)	Top-1 acc 55.078 (57.834)	Top-5 acc 76.562 (79.755)	lr 0.01563
Train [51][1120/3239]	Time 4.492 (1.130)	Data Time 4.233 (0.636)	Loss 2.5822 (2.7445)	Entropy 0.63855 (0.64062)	Top-1 acc 58.984 (57.820)	Top-5 acc 82.031 (79.739)	lr 0.01563
Train [51][1130/3239]	Time 0.248 (1.136)	Data Time 0.001 (0.643)	Loss 2.8706 (2.7451)	Entropy 0.63864 (0.64060)	Top-1 acc 54.297 (57.806)	Top-5 acc 75.781 (79.728)	lr 0.01562
Train [51][1140/3239]	Time 0.252 (1.136)	Data Time 0.001 (0.643)	Loss 2.7542 (2.7454)	Entropy 0.63857 (0.64058)	Top-1 acc 60.156 (57.810)	Top-5 acc 78.906 (79.720)	lr 0.01562
Train [51][1150/3239]	Time 0.311 (1.129)	Data Time 0.002 (0.637)	Loss 2.7859 (2.7453)	Entropy 0.63841 (0.64056)	Top-1 acc 55.078 (57.808)	Top-5 acc 77.734 (79.715)	lr 0.01562
Train [51][1160/3239]	Time 0.245 (1.132)	Data Time 0.001 (0.640)	Loss 2.9325 (2.7451)	Entropy 0.63830 (0.64054)	Top-1 acc 56.250 (57.819)	Top-5 acc 75.000 (79.715)	lr 0.01562
Train [51][1170/3239]	Time 0.227 (1.140)	Data Time 0.001 (0.649)	Loss 2.6337 (2.7446)	Entropy 0.63879 (0.64052)	Top-1 acc 61.328 (57.834)	Top-5 acc 81.641 (79.721)	lr 0.01562
Train [51][1180/3239]	Time 0.244 (1.134)	Data Time 0.001 (0.643)	Loss 2.6526 (2.7441)	Entropy 0.63914 (0.64051)	Top-1 acc 58.594 (57.848)	Top-5 acc 81.641 (79.730)	lr 0.01562
Train [51][1190/3239]	Time 0.263 (1.137)	Data Time 0.001 (0.647)	Loss 2.7929 (2.7442)	Entropy 0.63913 (0.64050)	Top-1 acc 58.594 (57.846)	Top-5 acc 77.734 (79.720)	lr 0.01562
Train [51][1200/3239]	Time 0.326 (1.142)	Data Time 0.001 (0.653)	Loss 2.7229 (2.7446)	Entropy 0.63895 (0.64049)	Top-1 acc 58.594 (57.835)	Top-5 acc 78.906 (79.709)	lr 0.01562
Train [51][1210/3239]	Time 0.242 (1.137)	Data Time 0.001 (0.648)	Loss 2.9403 (2.7444)	Entropy 0.63892 (0.64048)	Top-1 acc 53.516 (57.839)	Top-5 acc 73.047 (79.707)	lr 0.01562
Train [51][1220/3239]	Time 0.228 (1.144)	Data Time 0.001 (0.656)	Loss 2.7232 (2.7448)	Entropy 0.63874 (0.64046)	Top-1 acc 60.547 (57.835)	Top-5 acc 79.297 (79.701)	lr 0.01562
Train [51][1230/3239]	Time 0.236 (1.147)	Data Time 0.001 (0.659)	Loss 2.7016 (2.7447)	Entropy 0.63858 (0.64045)	Top-1 acc 62.500 (57.838)	Top-5 acc 79.688 (79.704)	lr 0.01562
Train [51][1240/3239]	Time 0.253 (1.141)	Data Time 0.001 (0.654)	Loss 2.6663 (2.7451)	Entropy 0.63803 (0.64043)	Top-1 acc 62.500 (57.832)	Top-5 acc 82.031 (79.700)	lr 0.01561
Train [51][1250/3239]	Time 0.234 (1.149)	Data Time 0.001 (0.663)	Loss 2.8440 (2.7456)	Entropy 0.63781 (0.64041)	Top-1 acc 55.078 (57.817)	Top-5 acc 76.172 (79.693)	lr 0.01561
Train [51][1260/3239]	Time 0.238 (1.153)	Data Time 0.001 (0.667)	Loss 2.7814 (2.7458)	Entropy 0.63785 (0.64039)	Top-1 acc 55.078 (57.805)	Top-5 acc 79.688 (79.692)	lr 0.01561
Train [51][1270/3239]	Time 0.339 (1.148)	Data Time 0.001 (0.663)	Loss 2.8606 (2.7458)	Entropy 0.63737 (0.64037)	Top-1 acc 56.250 (57.807)	Top-5 acc 75.781 (79.692)	lr 0.01561
Train [51][1280/3239]	Time 17.741 (1.156)	Data Time 17.437 (0.672)	Loss 2.6948 (2.7457)	Entropy 0.63729 (0.64035)	Top-1 acc 60.156 (57.817)	Top-5 acc 76.172 (79.686)	lr 0.01561
Train [51][1290/3239]	Time 0.246 (1.159)	Data Time 0.001 (0.675)	Loss 2.6924 (2.7451)	Entropy 0.63743 (0.64032)	Top-1 acc 61.719 (57.835)	Top-5 acc 80.859 (79.694)	lr 0.01561
Train [51][1300/3239]	Time 0.237 (1.154)	Data Time 0.001 (0.670)	Loss 2.6503 (2.7450)	Entropy 0.63702 (0.64030)	Top-1 acc 59.375 (57.840)	Top-5 acc 81.641 (79.689)	lr 0.01561
Train [51][1310/3239]	Time 0.228 (1.148)	Data Time 0.001 (0.665)	Loss 2.7062 (2.7455)	Entropy 0.63649 (0.64027)	Top-1 acc 61.328 (57.838)	Top-5 acc 78.516 (79.672)	lr 0.01561
Train [51][1320/3239]	Time 0.240 (1.158)	Data Time 0.001 (0.675)	Loss 2.7119 (2.7461)	Entropy 0.63696 (0.64025)	Top-1 acc 55.859 (57.820)	Top-5 acc 80.469 (79.663)	lr 0.01561
Train [51][1330/3239]	Time 0.236 (1.159)	Data Time 0.001 (0.677)	Loss 2.8977 (2.7465)	Entropy 0.63692 (0.64022)	Top-1 acc 54.297 (57.815)	Top-5 acc 77.734 (79.656)	lr 0.01561
Train [51][1340/3239]	Time 0.229 (1.154)	Data Time 0.001 (0.672)	Loss 2.8568 (2.7468)	Entropy 0.63696 (0.64020)	Top-1 acc 57.812 (57.810)	Top-5 acc 78.125 (79.646)	lr 0.01560
Train [51][1350/3239]	Time 0.241 (1.161)	Data Time 0.001 (0.680)	Loss 2.6489 (2.7475)	Entropy 0.63680 (0.64017)	Top-1 acc 59.766 (57.802)	Top-5 acc 80.859 (79.635)	lr 0.01560
Train [51][1360/3239]	Time 0.330 (1.167)	Data Time 0.001 (0.687)	Loss 2.9059 (2.7477)	Entropy 0.63666 (0.64015)	Top-1 acc 53.906 (57.789)	Top-5 acc 76.953 (79.634)	lr 0.01560
Train [51][1370/3239]	Time 0.248 (1.162)	Data Time 0.001 (0.682)	Loss 2.8699 (2.7479)	Entropy 0.63663 (0.64012)	Top-1 acc 52.734 (57.775)	Top-5 acc 77.344 (79.630)	lr 0.01560
Train [51][1380/3239]	Time 0.227 (1.172)	Data Time 0.001 (0.693)	Loss 2.6017 (2.7482)	Entropy 0.63650 (0.64010)	Top-1 acc 62.500 (57.768)	Top-5 acc 82.422 (79.621)	lr 0.01560
Train [51][1390/3239]	Time 0.230 (1.175)	Data Time 0.001 (0.696)	Loss 2.7497 (2.7482)	Entropy 0.63647 (0.64007)	Top-1 acc 56.641 (57.773)	Top-5 acc 79.688 (79.619)	lr 0.01560
Train [51][1400/3239]	Time 0.238 (1.171)	Data Time 0.001 (0.693)	Loss 3.0156 (2.7488)	Entropy 0.63648 (0.64004)	Top-1 acc 52.344 (57.756)	Top-5 acc 74.219 (79.603)	lr 0.01560
Train [51][1410/3239]	Time 0.247 (1.179)	Data Time 0.001 (0.701)	Loss 2.8496 (2.7488)	Entropy 0.63582 (0.64002)	Top-1 acc 59.766 (57.757)	Top-5 acc 77.734 (79.609)	lr 0.01560
Train [51][1420/3239]	Time 0.281 (1.186)	Data Time 0.003 (0.709)	Loss 2.7481 (2.7484)	Entropy 0.63570 (0.63999)	Top-1 acc 56.641 (57.768)	Top-5 acc 78.516 (79.613)	lr 0.01560
Train [51][1430/3239]	Time 0.346 (1.181)	Data Time 0.002 (0.704)	Loss 2.6399 (2.7482)	Entropy 0.63527 (0.63996)	Top-1 acc 60.156 (57.778)	Top-5 acc 83.203 (79.618)	lr 0.01560
Train [51][1440/3239]	Time 14.153 (1.185)	Data Time 13.883 (0.708)	Loss 2.6637 (2.7479)	Entropy 0.63520 (0.63992)	Top-1 acc 62.500 (57.788)	Top-5 acc 81.641 (79.626)	lr 0.01559
Train [51][1450/3239]	Time 0.286 (1.195)	Data Time 0.001 (0.718)	Loss 2.5616 (2.7477)	Entropy 0.63519 (0.63989)	Top-1 acc 62.109 (57.794)	Top-5 acc 81.250 (79.628)	lr 0.01559
Train [51][1460/3239]	Time 0.255 (1.189)	Data Time 0.001 (0.713)	Loss 2.9136 (2.7478)	Entropy 0.63501 (0.63986)	Top-1 acc 52.344 (57.795)	Top-5 acc 76.172 (79.629)	lr 0.01559
Train [51][1470/3239]	Time 0.250 (1.184)	Data Time 0.001 (0.708)	Loss 2.6438 (2.7478)	Entropy 0.63489 (0.63982)	Top-1 acc 59.766 (57.787)	Top-5 acc 80.859 (79.627)	lr 0.01559
Train [51][1480/3239]	Time 0.269 (1.185)	Data Time 0.001 (0.710)	Loss 2.7166 (2.7473)	Entropy 0.63473 (0.63979)	Top-1 acc 53.516 (57.791)	Top-5 acc 81.250 (79.638)	lr 0.01559
Train [51][1490/3239]	Time 0.238 (1.194)	Data Time 0.001 (0.719)	Loss 2.8228 (2.7474)	Entropy 0.63505 (0.63976)	Top-1 acc 58.203 (57.787)	Top-5 acc 78.125 (79.637)	lr 0.01559
Train [51][1500/3239]	Time 0.281 (1.189)	Data Time 0.002 (0.714)	Loss 2.8908 (2.7476)	Entropy 0.63513 (0.63973)	Top-1 acc 53.125 (57.778)	Top-5 acc 78.516 (79.630)	lr 0.01559
Train [51][1510/3239]	Time 0.228 (1.191)	Data Time 0.001 (0.717)	Loss 2.7094 (2.7477)	Entropy 0.63540 (0.63970)	Top-1 acc 56.641 (57.772)	Top-5 acc 79.688 (79.624)	lr 0.01559
Train [51][1520/3239]	Time 0.256 (1.205)	Data Time 0.001 (0.732)	Loss 2.6553 (2.7478)	Entropy 0.63521 (0.63967)	Top-1 acc 58.203 (57.774)	Top-5 acc 81.641 (79.621)	lr 0.01559
Train [51][1530/3239]	Time 0.231 (1.200)	Data Time 0.001 (0.727)	Loss 2.7661 (2.7480)	Entropy 0.63503 (0.63964)	Top-1 acc 56.641 (57.759)	Top-5 acc 78.125 (79.621)	lr 0.01559
Train [51][1540/3239]	Time 0.249 (1.200)	Data Time 0.001 (0.727)	Loss 2.7548 (2.7479)	Entropy 0.63466 (0.63961)	Top-1 acc 56.641 (57.764)	Top-5 acc 81.641 (79.624)	lr 0.01558
Train [51][1550/3239]	Time 0.242 (1.213)	Data Time 0.001 (0.740)	Loss 2.7466 (2.7478)	Entropy 0.63478 (0.63958)	Top-1 acc 60.156 (57.771)	Top-5 acc 79.297 (79.625)	lr 0.01558
Train [51][1560/3239]	Time 0.236 (1.208)	Data Time 0.001 (0.735)	Loss 2.9198 (2.7481)	Entropy 0.63465 (0.63955)	Top-1 acc 53.516 (57.757)	Top-5 acc 75.000 (79.611)	lr 0.01558
Train [51][1570/3239]	Time 0.236 (1.210)	Data Time 0.001 (0.738)	Loss 2.8226 (2.7482)	Entropy 0.63481 (0.63951)	Top-1 acc 55.078 (57.750)	Top-5 acc 78.125 (79.616)	lr 0.01558
Train [51][1580/3239]	Time 0.261 (1.224)	Data Time 0.001 (0.752)	Loss 2.5826 (2.7480)	Entropy 0.63488 (0.63949)	Top-1 acc 65.234 (57.757)	Top-5 acc 85.156 (79.620)	lr 0.01558
Train [51][1590/3239]	Time 0.356 (1.219)	Data Time 0.001 (0.748)	Loss 2.7071 (2.7479)	Entropy 0.63460 (0.63946)	Top-1 acc 54.688 (57.757)	Top-5 acc 82.812 (79.627)	lr 0.01558
Train [51][1600/3239]	Time 3.014 (1.216)	Data Time 2.726 (0.745)	Loss 3.0874 (2.7482)	Entropy 0.63481 (0.63943)	Top-1 acc 50.391 (57.750)	Top-5 acc 75.391 (79.624)	lr 0.01558
Train [51][1610/3239]	Time 0.243 (1.230)	Data Time 0.001 (0.759)	Loss 2.8259 (2.7480)	Entropy 0.63456 (0.63940)	Top-1 acc 54.297 (57.760)	Top-5 acc 78.125 (79.624)	lr 0.01558
Train [51][1620/3239]	Time 0.225 (1.225)	Data Time 0.001 (0.754)	Loss 2.8736 (2.7481)	Entropy 0.63461 (0.63937)	Top-1 acc 55.078 (57.759)	Top-5 acc 76.172 (79.622)	lr 0.01558
Train [51][1630/3239]	Time 0.241 (1.220)	Data Time 0.001 (0.750)	Loss 2.8199 (2.7478)	Entropy 0.63486 (0.63934)	Top-1 acc 55.859 (57.766)	Top-5 acc 77.344 (79.624)	lr 0.01558
Train [51][1640/3239]	Time 0.238 (1.218)	Data Time 0.001 (0.748)	Loss 2.6604 (2.7475)	Entropy 0.63455 (0.63931)	Top-1 acc 59.375 (57.777)	Top-5 acc 80.078 (79.630)	lr 0.01557
Train [51][1650/3239]	Time 0.246 (1.233)	Data Time 0.001 (0.764)	Loss 2.6881 (2.7471)	Entropy 0.63408 (0.63928)	Top-1 acc 59.766 (57.786)	Top-5 acc 79.297 (79.640)	lr 0.01557
Train [51][1660/3239]	Time 0.314 (1.229)	Data Time 0.001 (0.759)	Loss 2.6100 (2.7469)	Entropy 0.63426 (0.63925)	Top-1 acc 58.984 (57.791)	Top-5 acc 80.859 (79.644)	lr 0.01557
Train [51][1670/3239]	Time 0.253 (1.229)	Data Time 0.001 (0.760)	Loss 2.7897 (2.7469)	Entropy 0.63412 (0.63922)	Top-1 acc 57.422 (57.793)	Top-5 acc 76.953 (79.646)	lr 0.01557
Train [51][1680/3239]	Time 0.232 (1.240)	Data Time 0.001 (0.772)	Loss 2.8823 (2.7466)	Entropy 0.63382 (0.63919)	Top-1 acc 56.250 (57.800)	Top-5 acc 76.172 (79.646)	lr 0.01557
Train [51][1690/3239]	Time 0.242 (1.236)	Data Time 0.001 (0.767)	Loss 2.6710 (2.7466)	Entropy 0.63388 (0.63916)	Top-1 acc 60.547 (57.799)	Top-5 acc 84.375 (79.650)	lr 0.01557
Train [51][1700/3239]	Time 0.231 (1.237)	Data Time 0.001 (0.769)	Loss 2.7743 (2.7464)	Entropy 0.63404 (0.63912)	Top-1 acc 59.766 (57.810)	Top-5 acc 79.688 (79.650)	lr 0.01557
Train [51][1710/3239]	Time 0.237 (1.248)	Data Time 0.001 (0.780)	Loss 2.6214 (2.7462)	Entropy 0.63396 (0.63909)	Top-1 acc 62.500 (57.816)	Top-5 acc 83.984 (79.658)	lr 0.01557
Train [51][1720/3239]	Time 0.295 (1.261)	Data Time 0.031 (0.775)	Loss 2.8823 (2.7466)	Entropy 0.63410 (0.63907)	Top-1 acc 56.641 (57.813)	Top-5 acc 77.344 (79.647)	lr 0.01557
Train [51][1730/3239]	Time 0.273 (1.257)	Data Time 0.004 (0.771)	Loss 2.7111 (2.7467)	Entropy 0.63415 (0.63904)	Top-1 acc 58.203 (57.809)	Top-5 acc 81.250 (79.642)	lr 0.01557
Train [51][1740/3239]	Time 0.235 (1.255)	Data Time 0.001 (0.769)	Loss 2.9497 (2.7469)	Entropy 0.63418 (0.63901)	Top-1 acc 53.516 (57.807)	Top-5 acc 76.172 (79.637)	lr 0.01557
Train [51][1750/3239]	Time 0.334 (1.251)	Data Time 0.001 (0.766)	Loss 2.9066 (2.7466)	Entropy 0.63435 (0.63898)	Top-1 acc 48.047 (57.806)	Top-5 acc 78.125 (79.640)	lr 0.01556
Train [51][1760/3239]	Time 13.659 (1.254)	Data Time 13.397 (0.769)	Loss 2.6933 (2.7468)	Entropy 0.63416 (0.63895)	Top-1 acc 56.250 (57.803)	Top-5 acc 81.641 (79.637)	lr 0.01556
Train [51][1770/3239]	Time 0.228 (1.262)	Data Time 0.001 (0.777)	Loss 2.6868 (2.7466)	Entropy 0.63439 (0.63893)	Top-1 acc 58.984 (57.808)	Top-5 acc 79.688 (79.641)	lr 0.01556
Train [51][1780/3239]	Time 0.278 (1.257)	Data Time 0.001 (0.772)	Loss 2.6353 (2.7464)	Entropy 0.63442 (0.63890)	Top-1 acc 61.328 (57.805)	Top-5 acc 82.031 (79.645)	lr 0.01556
Train [51][1790/3239]	Time 0.239 (1.252)	Data Time 0.002 (0.768)	Loss 2.7055 (2.7464)	Entropy 0.63446 (0.63888)	Top-1 acc 61.328 (57.805)	Top-5 acc 81.250 (79.649)	lr 0.01556
Train [51][1800/3239]	Time 0.254 (1.253)	Data Time 0.001 (0.769)	Loss 2.5175 (2.7464)	Entropy 0.63468 (0.63885)	Top-1 acc 63.672 (57.808)	Top-5 acc 84.375 (79.649)	lr 0.01556
Train [51][1810/3239]	Time 0.224 (1.262)	Data Time 0.001 (0.778)	Loss 2.7635 (2.7463)	Entropy 0.63472 (0.63883)	Top-1 acc 56.641 (57.815)	Top-5 acc 81.641 (79.647)	lr 0.01556
Train [51][1820/3239]	Time 0.375 (1.257)	Data Time 0.001 (0.774)	Loss 2.7941 (2.7461)	Entropy 0.63500 (0.63881)	Top-1 acc 59.375 (57.819)	Top-5 acc 78.906 (79.650)	lr 0.01556
Train [51][1830/3239]	Time 0.268 (1.256)	Data Time 0.001 (0.773)	Loss 2.8823 (2.7458)	Entropy 0.63502 (0.63879)	Top-1 acc 55.078 (57.824)	Top-5 acc 77.344 (79.655)	lr 0.01556
Train [51][1840/3239]	Time 0.236 (1.261)	Data Time 0.001 (0.779)	Loss 3.0275 (2.7461)	Entropy 0.63491 (0.63877)	Top-1 acc 52.734 (57.816)	Top-5 acc 75.781 (79.653)	lr 0.01556
Train [51][1850/3239]	Time 0.266 (1.257)	Data Time 0.002 (0.775)	Loss 2.6932 (2.7462)	Entropy 0.63530 (0.63875)	Top-1 acc 57.031 (57.818)	Top-5 acc 82.031 (79.651)	lr 0.01555
Train [51][1860/3239]	Time 0.252 (1.257)	Data Time 0.001 (0.775)	Loss 2.9132 (2.7461)	Entropy 0.63506 (0.63873)	Top-1 acc 55.859 (57.819)	Top-5 acc 74.219 (79.648)	lr 0.01555
Train [51][1870/3239]	Time 0.227 (1.261)	Data Time 0.001 (0.779)	Loss 2.8547 (2.7462)	Entropy 0.63499 (0.63871)	Top-1 acc 58.203 (57.824)	Top-5 acc 76.172 (79.644)	lr 0.01555
Train [51][1880/3239]	Time 0.260 (1.256)	Data Time 0.002 (0.775)	Loss 2.7506 (2.7461)	Entropy 0.63492 (0.63869)	Top-1 acc 57.031 (57.822)	Top-5 acc 75.781 (79.645)	lr 0.01555
Train [51][1890/3239]	Time 0.237 (1.257)	Data Time 0.001 (0.776)	Loss 2.6652 (2.7464)	Entropy 0.63510 (0.63867)	Top-1 acc 58.984 (57.811)	Top-5 acc 80.078 (79.639)	lr 0.01555
Train [51][1900/3239]	Time 0.230 (1.264)	Data Time 0.001 (0.783)	Loss 2.8449 (2.7460)	Entropy 0.63478 (0.63865)	Top-1 acc 51.953 (57.815)	Top-5 acc 78.516 (79.645)	lr 0.01555
Train [51][1910/3239]	Time 0.327 (1.260)	Data Time 0.001 (0.779)	Loss 2.8339 (2.7461)	Entropy 0.63461 (0.63863)	Top-1 acc 60.547 (57.819)	Top-5 acc 78.125 (79.646)	lr 0.01555
Train [51][1920/3239]	Time 6.633 (1.258)	Data Time 6.379 (0.779)	Loss 2.8203 (2.7462)	Entropy 0.63434 (0.63861)	Top-1 acc 55.859 (57.815)	Top-5 acc 76.562 (79.643)	lr 0.01555
Train [51][1930/3239]	Time 0.287 (1.264)	Data Time 0.001 (0.784)	Loss 2.7108 (2.7464)	Entropy 0.63442 (0.63859)	Top-1 acc 56.250 (57.814)	Top-5 acc 81.250 (79.641)	lr 0.01555
Train [51][1940/3239]	Time 0.244 (1.260)	Data Time 0.001 (0.780)	Loss 2.8600 (2.7468)	Entropy 0.63456 (0.63856)	Top-1 acc 53.516 (57.802)	Top-5 acc 80.078 (79.636)	lr 0.01555
Train [51][1950/3239]	Time 0.228 (1.255)	Data Time 0.001 (0.776)	Loss 2.7263 (2.7468)	Entropy 0.63462 (0.63854)	Top-1 acc 58.594 (57.801)	Top-5 acc 81.250 (79.635)	lr 0.01554
Train [51][1960/3239]	Time 0.241 (1.256)	Data Time 0.001 (0.777)	Loss 2.7966 (2.7469)	Entropy 0.63434 (0.63852)	Top-1 acc 56.250 (57.802)	Top-5 acc 78.125 (79.634)	lr 0.01554
Train [51][1970/3239]	Time 0.238 (1.263)	Data Time 0.001 (0.784)	Loss 2.7762 (2.7467)	Entropy 0.63463 (0.63850)	Top-1 acc 57.422 (57.803)	Top-5 acc 78.125 (79.636)	lr 0.01554
Train [51][1980/3239]	Time 0.351 (1.258)	Data Time 0.001 (0.780)	Loss 2.7254 (2.7467)	Entropy 0.63468 (0.63848)	Top-1 acc 57.031 (57.804)	Top-5 acc 81.641 (79.638)	lr 0.01554
Train [51][1990/3239]	Time 0.251 (1.256)	Data Time 0.001 (0.778)	Loss 2.6217 (2.7467)	Entropy 0.63444 (0.63846)	Top-1 acc 60.547 (57.803)	Top-5 acc 81.641 (79.642)	lr 0.01554
Train [51][2000/3239]	Time 0.240 (1.264)	Data Time 0.001 (0.786)	Loss 2.7369 (2.7467)	Entropy 0.63440 (0.63844)	Top-1 acc 56.641 (57.804)	Top-5 acc 84.766 (79.645)	lr 0.01554
Train [51][2010/3239]	Time 0.241 (1.260)	Data Time 0.001 (0.782)	Loss 2.8838 (2.7469)	Entropy 0.63443 (0.63842)	Top-1 acc 57.422 (57.795)	Top-5 acc 75.781 (79.645)	lr 0.01554
Train [51][2020/3239]	Time 0.247 (1.258)	Data Time 0.001 (0.781)	Loss 2.5838 (2.7468)	Entropy 0.63459 (0.63840)	Top-1 acc 60.156 (57.798)	Top-5 acc 82.031 (79.645)	lr 0.01554
Train [51][2030/3239]	Time 0.244 (1.264)	Data Time 0.001 (0.787)	Loss 2.6704 (2.7470)	Entropy 0.63454 (0.63839)	Top-1 acc 60.156 (57.800)	Top-5 acc 81.250 (79.647)	lr 0.01554
Train [51][2040/3239]	Time 0.233 (1.260)	Data Time 0.001 (0.783)	Loss 2.7907 (2.7472)	Entropy 0.63464 (0.63837)	Top-1 acc 55.859 (57.792)	Top-5 acc 79.297 (79.647)	lr 0.01554
Train [51][2050/3239]	Time 0.239 (1.258)	Data Time 0.001 (0.781)	Loss 2.8341 (2.7473)	Entropy 0.63435 (0.63835)	Top-1 acc 51.953 (57.789)	Top-5 acc 80.078 (79.644)	lr 0.01553
Train [51][2060/3239]	Time 0.230 (1.265)	Data Time 0.001 (0.789)	Loss 2.8972 (2.7477)	Entropy 0.63438 (0.63833)	Top-1 acc 53.516 (57.781)	Top-5 acc 76.562 (79.634)	lr 0.01553
Train [51][2070/3239]	Time 0.330 (1.261)	Data Time 0.001 (0.785)	Loss 2.6900 (2.7476)	Entropy 0.63402 (0.63831)	Top-1 acc 60.156 (57.783)	Top-5 acc 80.859 (79.636)	lr 0.01553
Train [51][2080/3239]	Time 1.836 (1.258)	Data Time 1.583 (0.782)	Loss 2.7695 (2.7478)	Entropy 0.63390 (0.63829)	Top-1 acc 53.906 (57.780)	Top-5 acc 76.562 (79.629)	lr 0.01553
Train [51][2090/3239]	Time 0.254 (1.266)	Data Time 0.001 (0.791)	Loss 2.8600 (2.7481)	Entropy 0.63416 (0.63827)	Top-1 acc 56.641 (57.779)	Top-5 acc 75.781 (79.620)	lr 0.01553
Train [51][2100/3239]	Time 0.225 (1.262)	Data Time 0.001 (0.787)	Loss 2.8498 (2.7480)	Entropy 0.63434 (0.63825)	Top-1 acc 55.078 (57.780)	Top-5 acc 77.344 (79.622)	lr 0.01553
Train [51][2110/3239]	Time 0.246 (1.258)	Data Time 0.001 (0.783)	Loss 2.6708 (2.7479)	Entropy 0.63467 (0.63823)	Top-1 acc 60.547 (57.780)	Top-5 acc 82.422 (79.622)	lr 0.01553
Train [51][2120/3239]	Time 0.246 (1.254)	Data Time 0.001 (0.780)	Loss 2.5856 (2.7481)	Entropy 0.63500 (0.63821)	Top-1 acc 62.109 (57.773)	Top-5 acc 82.422 (79.619)	lr 0.01553
Train [51][2130/3239]	Time 0.232 (1.262)	Data Time 0.001 (0.787)	Loss 2.7795 (2.7478)	Entropy 0.63535 (0.63820)	Top-1 acc 57.031 (57.779)	Top-5 acc 79.297 (79.626)	lr 0.01553
Train [51][2140/3239]	Time 0.323 (1.258)	Data Time 0.001 (0.784)	Loss 2.6541 (2.7479)	Entropy 0.63538 (0.63819)	Top-1 acc 58.594 (57.776)	Top-5 acc 82.422 (79.628)	lr 0.01553
Train [51][2150/3239]	Time 0.225 (1.255)	Data Time 0.001 (0.781)	Loss 2.7111 (2.7481)	Entropy 0.63544 (0.63817)	Top-1 acc 58.984 (57.774)	Top-5 acc 77.344 (79.620)	lr 0.01553
Train [51][2160/3239]	Time 0.229 (1.263)	Data Time 0.001 (0.789)	Loss 2.8479 (2.7479)	Entropy 0.63552 (0.63816)	Top-1 acc 54.688 (57.780)	Top-5 acc 76.953 (79.624)	lr 0.01552
Train [51][2170/3239]	Time 0.232 (1.259)	Data Time 0.001 (0.786)	Loss 2.5805 (2.7478)	Entropy 0.63571 (0.63815)	Top-1 acc 61.328 (57.782)	Top-5 acc 81.641 (79.625)	lr 0.01552
Train [51][2180/3239]	Time 0.242 (1.256)	Data Time 0.001 (0.783)	Loss 2.8488 (2.7477)	Entropy 0.63544 (0.63814)	Top-1 acc 52.734 (57.784)	Top-5 acc 75.391 (79.630)	lr 0.01552
Train [51][2190/3239]	Time 0.235 (1.263)	Data Time 0.001 (0.791)	Loss 2.5965 (2.7476)	Entropy 0.63526 (0.63813)	Top-1 acc 62.500 (57.785)	Top-5 acc 83.594 (79.633)	lr 0.01552
Train [51][2200/3239]	Time 0.246 (1.260)	Data Time 0.001 (0.787)	Loss 2.8636 (2.7474)	Entropy 0.63520 (0.63811)	Top-1 acc 53.516 (57.780)	Top-5 acc 76.953 (79.638)	lr 0.01552
Train [51][2210/3239]	Time 0.231 (1.256)	Data Time 0.001 (0.784)	Loss 2.5523 (2.7474)	Entropy 0.63512 (0.63810)	Top-1 acc 61.328 (57.782)	Top-5 acc 84.375 (79.641)	lr 0.01552
Train [51][2220/3239]	Time 0.244 (1.263)	Data Time 0.001 (0.791)	Loss 2.8851 (2.7475)	Entropy 0.63529 (0.63809)	Top-1 acc 55.859 (57.781)	Top-5 acc 77.734 (79.642)	lr 0.01552
Train [51][2230/3239]	Time 0.257 (1.259)	Data Time 0.001 (0.788)	Loss 2.6819 (2.7476)	Entropy 0.63543 (0.63807)	Top-1 acc 58.984 (57.775)	Top-5 acc 80.469 (79.641)	lr 0.01552
Train [51][2240/3239]	Time 1.547 (1.256)	Data Time 1.294 (0.785)	Loss 2.8245 (2.7477)	Entropy 0.63552 (0.63806)	Top-1 acc 56.250 (57.774)	Top-5 acc 77.734 (79.638)	lr 0.01552
Train [51][2250/3239]	Time 0.245 (1.263)	Data Time 0.001 (0.792)	Loss 2.9921 (2.7478)	Entropy 0.63552 (0.63805)	Top-1 acc 51.953 (57.768)	Top-5 acc 78.125 (79.636)	lr 0.01552
Train [51][2260/3239]	Time 0.236 (1.260)	Data Time 0.001 (0.789)	Loss 2.6866 (2.7478)	Entropy 0.63548 (0.63804)	Top-1 acc 58.203 (57.768)	Top-5 acc 81.250 (79.636)	lr 0.01551
Train [51][2270/3239]	Time 0.228 (1.256)	Data Time 0.001 (0.786)	Loss 2.7535 (2.7477)	Entropy 0.63532 (0.63803)	Top-1 acc 58.203 (57.774)	Top-5 acc 80.078 (79.639)	lr 0.01551
Train [51][2280/3239]	Time 0.229 (1.254)	Data Time 0.001 (0.784)	Loss 2.8299 (2.7476)	Entropy 0.63535 (0.63802)	Top-1 acc 53.125 (57.776)	Top-5 acc 78.906 (79.638)	lr 0.01551
Train [51][2290/3239]	Time 0.238 (1.261)	Data Time 0.001 (0.791)	Loss 2.8727 (2.7473)	Entropy 0.63515 (0.63800)	Top-1 acc 51.562 (57.785)	Top-5 acc 79.297 (79.645)	lr 0.01551
Train [51][2300/3239]	Time 0.345 (1.258)	Data Time 0.001 (0.788)	Loss 2.9944 (2.7472)	Entropy 0.63516 (0.63799)	Top-1 acc 55.859 (57.788)	Top-5 acc 74.219 (79.649)	lr 0.01551
Train [51][2310/3239]	Time 0.234 (1.256)	Data Time 0.001 (0.787)	Loss 2.7873 (2.7473)	Entropy 0.63552 (0.63798)	Top-1 acc 61.328 (57.788)	Top-5 acc 78.906 (79.645)	lr 0.01551
Train [51][2320/3239]	Time 0.248 (1.263)	Data Time 0.002 (0.794)	Loss 2.8074 (2.7474)	Entropy 0.63541 (0.63797)	Top-1 acc 57.031 (57.786)	Top-5 acc 78.516 (79.639)	lr 0.01551
Train [51][2330/3239]	Time 0.238 (1.260)	Data Time 0.001 (0.791)	Loss 3.0167 (2.7475)	Entropy 0.63563 (0.63796)	Top-1 acc 48.438 (57.782)	Top-5 acc 77.344 (79.641)	lr 0.01551
Train [51][2340/3239]	Time 0.238 (1.257)	Data Time 0.001 (0.789)	Loss 2.8530 (2.7478)	Entropy 0.63568 (0.63795)	Top-1 acc 55.859 (57.779)	Top-5 acc 75.391 (79.632)	lr 0.01551
Train [51][2350/3239]	Time 0.240 (1.264)	Data Time 0.001 (0.795)	Loss 2.6919 (2.7478)	Entropy 0.63522 (0.63794)	Top-1 acc 59.375 (57.776)	Top-5 acc 80.469 (79.633)	lr 0.01551
Train [51][2360/3239]	Time 0.249 (1.260)	Data Time 0.001 (0.792)	Loss 2.7143 (2.7476)	Entropy 0.63501 (0.63793)	Top-1 acc 57.422 (57.780)	Top-5 acc 79.688 (79.637)	lr 0.01550
Train [51][2370/3239]	Time 0.363 (1.258)	Data Time 0.001 (0.790)	Loss 2.6694 (2.7477)	Entropy 0.63515 (0.63791)	Top-1 acc 58.203 (57.780)	Top-5 acc 83.203 (79.638)	lr 0.01550
Train [51][2380/3239]	Time 0.244 (1.270)	Data Time 0.002 (0.788)	Loss 2.9266 (2.7478)	Entropy 0.63535 (0.63790)	Top-1 acc 55.859 (57.775)	Top-5 acc 78.125 (79.637)	lr 0.01550
Train [51][2390/3239]	Time 0.348 (1.267)	Data Time 0.002 (0.784)	Loss 2.6459 (2.7474)	Entropy 0.63566 (0.63789)	Top-1 acc 60.547 (57.784)	Top-5 acc 81.641 (79.645)	lr 0.01550
Train [51][2400/3239]	Time 0.254 (1.263)	Data Time 0.001 (0.781)	Loss 2.6727 (2.7475)	Entropy 0.63544 (0.63788)	Top-1 acc 55.469 (57.782)	Top-5 acc 77.734 (79.645)	lr 0.01550
Train [51][2410/3239]	Time 0.255 (1.267)	Data Time 0.002 (0.785)	Loss 3.0143 (2.7475)	Entropy 0.63523 (0.63787)	Top-1 acc 50.781 (57.779)	Top-5 acc 73.828 (79.650)	lr 0.01550
Train [51][2420/3239]	Time 0.255 (1.264)	Data Time 0.002 (0.782)	Loss 2.9040 (2.7476)	Entropy 0.63518 (0.63786)	Top-1 acc 51.172 (57.772)	Top-5 acc 77.734 (79.646)	lr 0.01550
Train [51][2430/3239]	Time 0.262 (1.260)	Data Time 0.001 (0.779)	Loss 2.7053 (2.7478)	Entropy 0.63507 (0.63785)	Top-1 acc 59.375 (57.765)	Top-5 acc 80.859 (79.642)	lr 0.01550
Train [51][2440/3239]	Time 0.252 (1.261)	Data Time 0.001 (0.780)	Loss 2.6833 (2.7477)	Entropy 0.63543 (0.63784)	Top-1 acc 64.062 (57.767)	Top-5 acc 82.031 (79.643)	lr 0.01550
Train [51][2450/3239]	Time 0.245 (1.265)	Data Time 0.001 (0.784)	Loss 2.7808 (2.7478)	Entropy 0.63535 (0.63783)	Top-1 acc 58.594 (57.764)	Top-5 acc 77.734 (79.640)	lr 0.01550
Train [51][2460/3239]	Time 0.330 (1.262)	Data Time 0.001 (0.781)	Loss 2.6950 (2.7479)	Entropy 0.63534 (0.63782)	Top-1 acc 60.156 (57.763)	Top-5 acc 79.297 (79.634)	lr 0.01549
Train [51][2470/3239]	Time 0.249 (1.262)	Data Time 0.001 (0.782)	Loss 2.9830 (2.7481)	Entropy 0.63544 (0.63781)	Top-1 acc 53.516 (57.752)	Top-5 acc 73.828 (79.629)	lr 0.01549
Train [51][2480/3239]	Time 0.235 (1.267)	Data Time 0.001 (0.786)	Loss 2.8100 (2.7483)	Entropy 0.63561 (0.63780)	Top-1 acc 55.078 (57.746)	Top-5 acc 76.562 (79.627)	lr 0.01549
Train [51][2490/3239]	Time 0.232 (1.263)	Data Time 0.001 (0.783)	Loss 2.7443 (2.7483)	Entropy 0.63507 (0.63779)	Top-1 acc 57.422 (57.746)	Top-5 acc 77.734 (79.624)	lr 0.01549
Train [51][2500/3239]	Time 0.246 (1.263)	Data Time 0.002 (0.784)	Loss 2.7848 (2.7483)	Entropy 0.63518 (0.63778)	Top-1 acc 57.031 (57.748)	Top-5 acc 80.469 (79.625)	lr 0.01549
Train [51][2510/3239]	Time 0.245 (1.267)	Data Time 0.001 (0.787)	Loss 2.7002 (2.7486)	Entropy 0.63518 (0.63777)	Top-1 acc 58.984 (57.745)	Top-5 acc 80.078 (79.622)	lr 0.01549
Train [51][2520/3239]	Time 0.249 (1.264)	Data Time 0.001 (0.784)	Loss 2.5833 (2.7485)	Entropy 0.63512 (0.63776)	Top-1 acc 60.156 (57.745)	Top-5 acc 82.422 (79.623)	lr 0.01549
Train [51][2530/3239]	Time 0.269 (1.263)	Data Time 0.002 (0.784)	Loss 2.7787 (2.7486)	Entropy 0.63485 (0.63775)	Top-1 acc 59.766 (57.743)	Top-5 acc 79.688 (79.621)	lr 0.01549
Train [51][2540/3239]	Time 0.246 (1.264)	Data Time 0.001 (0.785)	Loss 2.7758 (2.7487)	Entropy 0.63513 (0.63774)	Top-1 acc 57.031 (57.740)	Top-5 acc 78.906 (79.622)	lr 0.01549
Train [51][2550/3239]	Time 0.270 (1.261)	Data Time 0.001 (0.782)	Loss 2.7188 (2.7490)	Entropy 0.63530 (0.63773)	Top-1 acc 55.859 (57.729)	Top-5 acc 80.078 (79.614)	lr 0.01549
Train [51][2560/3239]	Time 6.507 (1.260)	Data Time 6.249 (0.781)	Loss 2.8727 (2.7489)	Entropy 0.63524 (0.63772)	Top-1 acc 52.734 (57.732)	Top-5 acc 78.516 (79.615)	lr 0.01548
Train [51][2570/3239]	Time 0.281 (1.266)	Data Time 0.001 (0.787)	Loss 2.8338 (2.7489)	Entropy 0.63526 (0.63771)	Top-1 acc 55.859 (57.732)	Top-5 acc 78.125 (79.615)	lr 0.01548
Train [51][2580/3239]	Time 0.223 (1.262)	Data Time 0.001 (0.784)	Loss 2.7890 (2.7487)	Entropy 0.63521 (0.63770)	Top-1 acc 56.641 (57.737)	Top-5 acc 80.078 (79.620)	lr 0.01548
Train [51][2590/3239]	Time 0.273 (1.259)	Data Time 0.001 (0.781)	Loss 2.7405 (2.7488)	Entropy 0.63525 (0.63769)	Top-1 acc 60.547 (57.739)	Top-5 acc 79.688 (79.617)	lr 0.01548
Train [51][2600/3239]	Time 0.285 (1.259)	Data Time 0.001 (0.781)	Loss 2.5790 (2.7488)	Entropy 0.63516 (0.63768)	Top-1 acc 59.766 (57.732)	Top-5 acc 83.594 (79.615)	lr 0.01548
Train [51][2610/3239]	Time 0.231 (1.263)	Data Time 0.001 (0.786)	Loss 2.9079 (2.7487)	Entropy 0.63512 (0.63767)	Top-1 acc 52.734 (57.730)	Top-5 acc 77.344 (79.617)	lr 0.01548
Train [51][2620/3239]	Time 0.343 (1.260)	Data Time 0.002 (0.783)	Loss 2.7182 (2.7490)	Entropy 0.63503 (0.63766)	Top-1 acc 58.984 (57.722)	Top-5 acc 83.203 (79.612)	lr 0.01548
Train [51][2630/3239]	Time 0.244 (1.261)	Data Time 0.001 (0.784)	Loss 2.9241 (2.7492)	Entropy 0.63473 (0.63765)	Top-1 acc 53.125 (57.718)	Top-5 acc 75.391 (79.606)	lr 0.01548
Train [51][2640/3239]	Time 0.238 (1.266)	Data Time 0.001 (0.789)	Loss 2.7567 (2.7489)	Entropy 0.63456 (0.63764)	Top-1 acc 60.938 (57.730)	Top-5 acc 79.688 (79.609)	lr 0.01548
Train [51][2650/3239]	Time 0.240 (1.263)	Data Time 0.001 (0.786)	Loss 2.8067 (2.7490)	Entropy 0.63464 (0.63763)	Top-1 acc 56.641 (57.724)	Top-5 acc 78.125 (79.608)	lr 0.01548
Train [51][2660/3239]	Time 0.247 (1.263)	Data Time 0.001 (0.786)	Loss 2.6714 (2.7490)	Entropy 0.63478 (0.63762)	Top-1 acc 61.328 (57.723)	Top-5 acc 80.469 (79.607)	lr 0.01547
Train [51][2670/3239]	Time 0.238 (1.266)	Data Time 0.001 (0.790)	Loss 2.8593 (2.7491)	Entropy 0.63462 (0.63760)	Top-1 acc 54.688 (57.719)	Top-5 acc 78.516 (79.605)	lr 0.01547
Train [51][2680/3239]	Time 0.275 (1.263)	Data Time 0.001 (0.787)	Loss 2.6392 (2.7493)	Entropy 0.63466 (0.63759)	Top-1 acc 58.594 (57.720)	Top-5 acc 81.250 (79.602)	lr 0.01547
Train [51][2690/3239]	Time 0.343 (1.262)	Data Time 0.001 (0.786)	Loss 2.9897 (2.7494)	Entropy 0.63490 (0.63758)	Top-1 acc 51.172 (57.718)	Top-5 acc 76.562 (79.600)	lr 0.01547
Train [51][2700/3239]	Time 0.282 (1.262)	Data Time 0.001 (0.786)	Loss 2.9777 (2.7495)	Entropy 0.63526 (0.63757)	Top-1 acc 52.734 (57.719)	Top-5 acc 75.781 (79.597)	lr 0.01547
Train [51][2710/3239]	Time 0.246 (1.259)	Data Time 0.001 (0.783)	Loss 2.6410 (2.7494)	Entropy 0.63542 (0.63757)	Top-1 acc 62.500 (57.725)	Top-5 acc 81.641 (79.598)	lr 0.01547
Train [51][2720/3239]	Time 3.804 (1.257)	Data Time 3.554 (0.781)	Loss 2.7923 (2.7493)	Entropy 0.63530 (0.63756)	Top-1 acc 56.250 (57.726)	Top-5 acc 78.516 (79.599)	lr 0.01547
Train [51][2730/3239]	Time 0.239 (1.257)	Data Time 0.001 (0.782)	Loss 2.7697 (2.7494)	Entropy 0.63565 (0.63755)	Top-1 acc 57.031 (57.726)	Top-5 acc 78.516 (79.597)	lr 0.01547
Train [51][2740/3239]	Time 0.240 (1.254)	Data Time 0.001 (0.779)	Loss 2.7637 (2.7492)	Entropy 0.63565 (0.63754)	Top-1 acc 57.422 (57.729)	Top-5 acc 80.469 (79.603)	lr 0.01547
Train [51][2750/3239]	Time 0.279 (1.251)	Data Time 0.001 (0.776)	Loss 2.6968 (2.7491)	Entropy 0.63593 (0.63754)	Top-1 acc 57.812 (57.729)	Top-5 acc 80.469 (79.606)	lr 0.01547
Train [51][2760/3239]	Time 0.251 (1.249)	Data Time 0.001 (0.774)	Loss 2.8136 (2.7493)	Entropy 0.63572 (0.63753)	Top-1 acc 57.031 (57.723)	Top-5 acc 78.516 (79.602)	lr 0.01547
Train [51][2770/3239]	Time 0.239 (1.249)	Data Time 0.001 (0.774)	Loss 2.8155 (2.7495)	Entropy 0.63578 (0.63752)	Top-1 acc 54.688 (57.719)	Top-5 acc 79.688 (79.602)	lr 0.01546
Train [51][2780/3239]	Time 0.341 (1.246)	Data Time 0.001 (0.772)	Loss 2.7592 (2.7496)	Entropy 0.63581 (0.63752)	Top-1 acc 56.641 (57.717)	Top-5 acc 77.344 (79.593)	lr 0.01546
Train [51][2790/3239]	Time 0.250 (1.245)	Data Time 0.001 (0.770)	Loss 2.5869 (2.7498)	Entropy 0.63573 (0.63751)	Top-1 acc 64.453 (57.713)	Top-5 acc 81.641 (79.588)	lr 0.01546
Train [51][2800/3239]	Time 0.246 (1.244)	Data Time 0.001 (0.770)	Loss 2.7466 (2.7501)	Entropy 0.63575 (0.63751)	Top-1 acc 53.125 (57.703)	Top-5 acc 80.859 (79.584)	lr 0.01546
Train [51][2810/3239]	Time 0.253 (1.241)	Data Time 0.002 (0.767)	Loss 2.7704 (2.7504)	Entropy 0.63572 (0.63750)	Top-1 acc 56.641 (57.695)	Top-5 acc 78.125 (79.581)	lr 0.01546
Train [51][2820/3239]	Time 0.243 (1.240)	Data Time 0.001 (0.766)	Loss 2.7461 (2.7505)	Entropy 0.63573 (0.63749)	Top-1 acc 56.250 (57.687)	Top-5 acc 80.078 (79.580)	lr 0.01546
Train [51][2830/3239]	Time 0.232 (1.241)	Data Time 0.001 (0.767)	Loss 2.9031 (2.7506)	Entropy 0.63574 (0.63749)	Top-1 acc 57.031 (57.685)	Top-5 acc 76.562 (79.578)	lr 0.01546
Train [51][2840/3239]	Time 0.224 (1.238)	Data Time 0.001 (0.764)	Loss 2.8297 (2.7504)	Entropy 0.63606 (0.63748)	Top-1 acc 57.812 (57.691)	Top-5 acc 76.562 (79.579)	lr 0.01546
Train [51][2850/3239]	Time 0.330 (1.239)	Data Time 0.001 (0.765)	Loss 2.7845 (2.7503)	Entropy 0.63596 (0.63748)	Top-1 acc 60.547 (57.696)	Top-5 acc 79.688 (79.579)	lr 0.01546
Train [51][2860/3239]	Time 0.237 (1.240)	Data Time 0.001 (0.767)	Loss 2.8424 (2.7503)	Entropy 0.63592 (0.63747)	Top-1 acc 58.984 (57.694)	Top-5 acc 79.297 (79.581)	lr 0.01546
Train [51][2870/3239]	Time 0.239 (1.237)	Data Time 0.001 (0.764)	Loss 2.6352 (2.7503)	Entropy 0.63568 (0.63747)	Top-1 acc 62.109 (57.696)	Top-5 acc 80.859 (79.581)	lr 0.01545
Train [51][2880/3239]	Time 11.194 (1.238)	Data Time 10.929 (0.765)	Loss 2.8335 (2.7502)	Entropy 0.63570 (0.63746)	Top-1 acc 56.250 (57.699)	Top-5 acc 79.297 (79.584)	lr 0.01545
Train [51][2890/3239]	Time 0.236 (1.240)	Data Time 0.001 (0.768)	Loss 2.7916 (2.7500)	Entropy 0.63589 (0.63745)	Top-1 acc 56.250 (57.702)	Top-5 acc 80.469 (79.589)	lr 0.01545
Train [51][2900/3239]	Time 0.241 (1.238)	Data Time 0.001 (0.765)	Loss 2.7847 (2.7499)	Entropy 0.63576 (0.63745)	Top-1 acc 56.250 (57.701)	Top-5 acc 76.953 (79.589)	lr 0.01545
Train [51][2910/3239]	Time 0.264 (1.235)	Data Time 0.002 (0.763)	Loss 2.9298 (2.7499)	Entropy 0.63574 (0.63744)	Top-1 acc 53.906 (57.699)	Top-5 acc 76.562 (79.587)	lr 0.01545
Train [51][2920/3239]	Time 0.264 (1.236)	Data Time 0.001 (0.764)	Loss 2.8085 (2.7499)	Entropy 0.63595 (0.63744)	Top-1 acc 55.469 (57.698)	Top-5 acc 76.172 (79.586)	lr 0.01545
Train [51][2930/3239]	Time 0.227 (1.237)	Data Time 0.001 (0.765)	Loss 2.7055 (2.7500)	Entropy 0.63586 (0.63743)	Top-1 acc 59.375 (57.697)	Top-5 acc 81.641 (79.585)	lr 0.01545
Train [51][2940/3239]	Time 0.259 (1.234)	Data Time 0.002 (0.762)	Loss 2.6982 (2.7499)	Entropy 0.63595 (0.63743)	Top-1 acc 57.422 (57.697)	Top-5 acc 81.250 (79.587)	lr 0.01545
Train [51][2950/3239]	Time 0.229 (1.236)	Data Time 0.001 (0.765)	Loss 3.0099 (2.7501)	Entropy 0.63582 (0.63742)	Top-1 acc 55.859 (57.692)	Top-5 acc 72.656 (79.585)	lr 0.01545
Train [51][2960/3239]	Time 0.242 (1.237)	Data Time 0.001 (0.766)	Loss 2.6627 (2.7501)	Entropy 0.63628 (0.63742)	Top-1 acc 60.938 (57.695)	Top-5 acc 80.469 (79.583)	lr 0.01545
Train [51][2970/3239]	Time 0.240 (1.235)	Data Time 0.001 (0.763)	Loss 2.8946 (2.7502)	Entropy 0.63601 (0.63741)	Top-1 acc 57.422 (57.694)	Top-5 acc 77.734 (79.582)	lr 0.01544
Train [51][2980/3239]	Time 0.231 (1.237)	Data Time 0.001 (0.766)	Loss 2.8060 (2.7505)	Entropy 0.63608 (0.63741)	Top-1 acc 57.812 (57.693)	Top-5 acc 76.562 (79.577)	lr 0.01544
Train [51][2990/3239]	Time 0.225 (1.238)	Data Time 0.001 (0.767)	Loss 2.8319 (2.7503)	Entropy 0.63602 (0.63740)	Top-1 acc 57.422 (57.698)	Top-5 acc 80.078 (79.577)	lr 0.01544
Train [51][3000/3239]	Time 0.254 (1.235)	Data Time 0.001 (0.764)	Loss 3.2576 (2.7504)	Entropy 0.63593 (0.63740)	Top-1 acc 42.578 (57.696)	Top-5 acc 71.094 (79.572)	lr 0.01544
Train [51][3010/3239]	Time 0.375 (1.237)	Data Time 0.001 (0.767)	Loss 2.9852 (2.7504)	Entropy 0.63587 (0.63739)	Top-1 acc 51.562 (57.690)	Top-5 acc 76.172 (79.571)	lr 0.01544
Train [51][3020/3239]	Time 0.221 (1.238)	Data Time 0.001 (0.768)	Loss 2.7630 (2.7506)	Entropy 0.63526 (0.63739)	Top-1 acc 57.422 (57.684)	Top-5 acc 79.297 (79.568)	lr 0.01544
Train [51][3030/3239]	Time 0.337 (1.246)	Data Time 0.006 (0.765)	Loss 2.9074 (2.7506)	Entropy 0.63539 (0.63738)	Top-1 acc 54.297 (57.684)	Top-5 acc 78.516 (79.567)	lr 0.01544
Train [51][3040/3239]	Time 0.248 (1.244)	Data Time 0.002 (0.763)	Loss 2.8747 (2.7505)	Entropy 0.63540 (0.63737)	Top-1 acc 54.297 (57.688)	Top-5 acc 74.609 (79.569)	lr 0.01544
Train [51][3050/3239]	Time 0.260 (1.241)	Data Time 0.002 (0.760)	Loss 2.7698 (2.7503)	Entropy 0.63511 (0.63737)	Top-1 acc 58.984 (57.694)	Top-5 acc 77.344 (79.571)	lr 0.01544
Train [51][3060/3239]	Time 0.242 (1.238)	Data Time 0.001 (0.758)	Loss 2.6343 (2.7504)	Entropy 0.63548 (0.63736)	Top-1 acc 60.938 (57.692)	Top-5 acc 81.641 (79.568)	lr 0.01544
Train [51][3070/3239]	Time 0.242 (1.236)	Data Time 0.001 (0.755)	Loss 2.7246 (2.7503)	Entropy 0.63471 (0.63735)	Top-1 acc 56.250 (57.695)	Top-5 acc 80.078 (79.570)	lr 0.01543
Train [51][3080/3239]	Time 0.250 (1.234)	Data Time 0.001 (0.754)	Loss 2.8366 (2.7503)	Entropy 0.63506 (0.63735)	Top-1 acc 54.688 (57.697)	Top-5 acc 78.125 (79.570)	lr 0.01543
Train [51][3090/3239]	Time 0.299 (1.234)	Data Time 0.002 (0.754)	Loss 2.8353 (2.7502)	Entropy 0.63518 (0.63734)	Top-1 acc 58.594 (57.701)	Top-5 acc 78.516 (79.573)	lr 0.01543
Train [51][3100/3239]	Time 0.326 (1.231)	Data Time 0.003 (0.752)	Loss 2.9395 (2.7502)	Entropy 0.63518 (0.63733)	Top-1 acc 51.953 (57.700)	Top-5 acc 73.438 (79.571)	lr 0.01543
Train [51][3110/3239]	Time 0.244 (1.235)	Data Time 0.001 (0.755)	Loss 2.6946 (2.7502)	Entropy 0.63530 (0.63732)	Top-1 acc 60.547 (57.703)	Top-5 acc 79.297 (79.571)	lr 0.01543
Train [51][3120/3239]	Time 0.258 (1.234)	Data Time 0.001 (0.755)	Loss 2.6772 (2.7502)	Entropy 0.63550 (0.63732)	Top-1 acc 60.156 (57.699)	Top-5 acc 80.469 (79.572)	lr 0.01543
Train [51][3130/3239]	Time 0.312 (1.232)	Data Time 0.001 (0.752)	Loss 2.6581 (2.7500)	Entropy 0.63529 (0.63731)	Top-1 acc 59.766 (57.702)	Top-5 acc 81.641 (79.576)	lr 0.01543
Train [51][3140/3239]	Time 0.243 (1.235)	Data Time 0.001 (0.756)	Loss 2.7185 (2.7499)	Entropy 0.63514 (0.63731)	Top-1 acc 61.719 (57.705)	Top-5 acc 78.906 (79.577)	lr 0.01543
Train [51][3150/3239]	Time 0.248 (1.234)	Data Time 0.001 (0.755)	Loss 2.4564 (2.7499)	Entropy 0.63523 (0.63730)	Top-1 acc 63.281 (57.703)	Top-5 acc 87.500 (79.579)	lr 0.01543
Train [51][3160/3239]	Time 0.253 (1.232)	Data Time 0.001 (0.753)	Loss 2.6430 (2.7497)	Entropy 0.63570 (0.63729)	Top-1 acc 58.203 (57.709)	Top-5 acc 81.641 (79.582)	lr 0.01543
Train [51][3170/3239]	Time 0.338 (1.236)	Data Time 0.001 (0.757)	Loss 2.5486 (2.7498)	Entropy 0.63565 (0.63729)	Top-1 acc 61.719 (57.705)	Top-5 acc 83.203 (79.584)	lr 0.01542
Train [51][3180/3239]	Time 0.236 (1.234)	Data Time 0.000 (0.756)	Loss 2.6154 (2.7498)	Entropy 0.63594 (0.63728)	Top-1 acc 62.891 (57.702)	Top-5 acc 80.078 (79.584)	lr 0.01542
Train [51][3190/3239]	Time 0.255 (1.232)	Data Time 0.000 (0.753)	Loss 2.7576 (2.7497)	Entropy 0.63571 (0.63728)	Top-1 acc 58.984 (57.708)	Top-5 acc 79.297 (79.587)	lr 0.01542
Train [51][3200/3239]	Time 19.107 (1.235)	Data Time 18.844 (0.757)	Loss 2.5959 (2.7497)	Entropy 0.63569 (0.63727)	Top-1 acc 58.203 (57.709)	Top-5 acc 80.078 (79.588)	lr 0.01542
Train [51][3210/3239]	Time 0.223 (1.234)	Data Time 0.000 (0.756)	Loss 2.7905 (2.7496)	Entropy 0.63548 (0.63727)	Top-1 acc 56.250 (57.709)	Top-5 acc 80.078 (79.589)	lr 0.01542
Train [51][3220/3239]	Time 0.223 (1.232)	Data Time 0.000 (0.754)	Loss 2.7070 (2.7496)	Entropy 0.63534 (0.63726)	Top-1 acc 60.547 (57.707)	Top-5 acc 80.859 (79.590)	lr 0.01542
Train [51][3230/3239]	Time 0.232 (1.229)	Data Time 0.000 (0.751)	Loss 2.5801 (2.7495)	Entropy 0.63553 (0.63726)	Top-1 acc 62.109 (57.709)	Top-5 acc 83.984 (79.591)	lr 0.01542
Train [51][3239/3239]	Time 0.830 (1.229)	Data Time 0.000 (0.751)	Loss 3.3390 (2.7495)	Entropy 0.63552 (0.63725)	Top-1 acc 43.210 (57.712)	Top-5 acc 70.370 (79.592)	lr 0.01542
==========Valid [51/120]	loss 1.478	top-1 acc 66.027 (66.027)	top-5 acc 86.312	Train top-1 57.712	top-5 79.592	Entropy 0.63552	Latency-None: 0.000ms	Flops: 538.40M
Train [52][0/3239]	Time 48.337 (48.337)	Data Time 46.732 (46.732)	Loss 2.9283 (2.9283)	Entropy 0.63578 (0.63578)	Top-1 acc 53.906 (53.906)	Top-5 acc 77.344 (77.344)	lr 0.01542
Train [52][10/3239]	Time 0.229 (4.806)	Data Time 0.001 (4.250)	Loss 2.7336 (2.7574)	Entropy 0.63594 (0.63582)	Top-1 acc 58.594 (58.274)	Top-5 acc 78.516 (79.048)	lr 0.01542
Train [52][20/3239]	Time 0.235 (2.715)	Data Time 0.001 (2.227)	Loss 2.7810 (2.7683)	Entropy 0.63546 (0.63576)	Top-1 acc 56.250 (58.036)	Top-5 acc 80.078 (79.315)	lr 0.01542
Train [52][30/3239]	Time 0.230 (1.978)	Data Time 0.001 (1.509)	Loss 2.7422 (2.7687)	Entropy 0.63509 (0.63562)	Top-1 acc 59.766 (57.825)	Top-5 acc 78.125 (79.423)	lr 0.01542
Train [52][40/3239]	Time 0.247 (1.804)	Data Time 0.001 (1.350)	Loss 2.7414 (2.7502)	Entropy 0.63503 (0.63548)	Top-1 acc 59.766 (58.422)	Top-5 acc 78.516 (79.773)	lr 0.01541
Train [52][50/3239]	Time 0.272 (1.533)	Data Time 0.001 (1.085)	Loss 2.7704 (2.7442)	Entropy 0.63479 (0.63539)	Top-1 acc 56.641 (58.272)	Top-5 acc 77.344 (79.810)	lr 0.01541
Train [52][60/3239]	Time 0.279 (1.352)	Data Time 0.002 (0.908)	Loss 2.8183 (2.7371)	Entropy 0.63492 (0.63531)	Top-1 acc 52.734 (58.459)	Top-5 acc 78.125 (79.860)	lr 0.01541
Train [52][70/3239]	Time 0.339 (1.340)	Data Time 0.001 (0.896)	Loss 2.7636 (2.7396)	Entropy 0.63477 (0.63524)	Top-1 acc 60.156 (58.429)	Top-5 acc 79.297 (79.699)	lr 0.01541
Train [52][80/3239]	Time 0.230 (1.229)	Data Time 0.001 (0.786)	Loss 2.7418 (2.7327)	Entropy 0.63438 (0.63518)	Top-1 acc 55.078 (58.517)	Top-5 acc 82.031 (79.769)	lr 0.01541
Train [52][90/3239]	Time 0.278 (1.142)	Data Time 0.001 (0.699)	Loss 2.6958 (2.7402)	Entropy 0.63402 (0.63507)	Top-1 acc 60.547 (58.358)	Top-5 acc 79.688 (79.580)	lr 0.01541
Train [52][100/3239]	Time 0.275 (1.109)	Data Time 0.001 (0.665)	Loss 2.5931 (2.7381)	Entropy 0.63345 (0.63494)	Top-1 acc 57.812 (58.308)	Top-5 acc 85.547 (79.707)	lr 0.01541
Train [52][110/3239]	Time 0.228 (1.069)	Data Time 0.001 (0.615)	Loss 2.6970 (2.7377)	Entropy 0.63342 (0.63480)	Top-1 acc 58.203 (58.305)	Top-5 acc 79.297 (79.666)	lr 0.01541
Train [52][120/3239]	Time 0.244 (1.018)	Data Time 0.001 (0.565)	Loss 2.7453 (2.7327)	Entropy 0.63290 (0.63467)	Top-1 acc 58.594 (58.432)	Top-5 acc 80.078 (79.720)	lr 0.01541
Train [52][130/3239]	Time 0.273 (1.010)	Data Time 0.001 (0.558)	Loss 2.7159 (2.7316)	Entropy 0.63307 (0.63454)	Top-1 acc 56.250 (58.394)	Top-5 acc 80.469 (79.711)	lr 0.01541
Train [52][140/3239]	Time 0.235 (0.972)	Data Time 0.001 (0.522)	Loss 2.9071 (2.7340)	Entropy 0.63286 (0.63444)	Top-1 acc 56.250 (58.314)	Top-5 acc 76.562 (79.796)	lr 0.01540
Train [52][150/3239]	Time 0.237 (0.935)	Data Time 0.001 (0.487)	Loss 2.7943 (2.7361)	Entropy 0.63293 (0.63433)	Top-1 acc 55.859 (58.294)	Top-5 acc 77.734 (79.786)	lr 0.01540
Train [52][160/3239]	Time 0.355 (0.905)	Data Time 0.002 (0.457)	Loss 2.9664 (2.7376)	Entropy 0.63304 (0.63424)	Top-1 acc 50.781 (58.191)	Top-5 acc 76.953 (79.809)	lr 0.01540
Train [52][170/3239]	Time 0.241 (0.908)	Data Time 0.001 (0.461)	Loss 2.6035 (2.7314)	Entropy 0.63276 (0.63416)	Top-1 acc 62.500 (58.313)	Top-5 acc 83.984 (79.927)	lr 0.01540
Train [52][180/3239]	Time 0.244 (0.881)	Data Time 0.001 (0.436)	Loss 2.6093 (2.7301)	Entropy 0.63267 (0.63408)	Top-1 acc 56.641 (58.309)	Top-5 acc 82.031 (79.901)	lr 0.01540
Train [52][190/3239]	Time 0.260 (0.859)	Data Time 0.001 (0.413)	Loss 2.7814 (2.7296)	Entropy 0.63250 (0.63401)	Top-1 acc 57.422 (58.324)	Top-5 acc 76.953 (79.941)	lr 0.01540
Train [52][200/3239]	Time 0.235 (0.866)	Data Time 0.001 (0.423)	Loss 2.7794 (2.7303)	Entropy 0.63241 (0.63394)	Top-1 acc 54.688 (58.267)	Top-5 acc 80.859 (79.927)	lr 0.01540
Train [52][210/3239]	Time 0.246 (0.845)	Data Time 0.001 (0.403)	Loss 2.6911 (2.7309)	Entropy 0.63248 (0.63386)	Top-1 acc 53.906 (58.201)	Top-5 acc 82.031 (79.941)	lr 0.01540
Train [52][220/3239]	Time 0.225 (0.827)	Data Time 0.001 (0.385)	Loss 2.7196 (2.7298)	Entropy 0.63240 (0.63380)	Top-1 acc 57.422 (58.242)	Top-5 acc 80.078 (79.954)	lr 0.01540
Train [52][230/3239]	Time 0.333 (0.830)	Data Time 0.001 (0.389)	Loss 2.8014 (2.7287)	Entropy 0.63265 (0.63374)	Top-1 acc 60.156 (58.300)	Top-5 acc 79.297 (79.989)	lr 0.01540
Train [52][240/3239]	Time 0.287 (0.813)	Data Time 0.001 (0.373)	Loss 2.6695 (2.7296)	Entropy 0.63285 (0.63370)	Top-1 acc 60.547 (58.270)	Top-5 acc 78.516 (79.948)	lr 0.01539
Train [52][250/3239]	Time 0.281 (0.797)	Data Time 0.001 (0.358)	Loss 2.7101 (2.7278)	Entropy 0.63302 (0.63367)	Top-1 acc 59.766 (58.332)	Top-5 acc 80.859 (79.986)	lr 0.01539
Train [52][260/3239]	Time 0.271 (0.818)	Data Time 0.001 (0.380)	Loss 2.8162 (2.7286)	Entropy 0.63298 (0.63365)	Top-1 acc 54.297 (58.308)	Top-5 acc 77.734 (79.973)	lr 0.01539
Train [52][270/3239]	Time 0.242 (0.804)	Data Time 0.001 (0.366)	Loss 2.7915 (2.7269)	Entropy 0.63305 (0.63363)	Top-1 acc 60.156 (58.347)	Top-5 acc 79.297 (80.005)	lr 0.01539
Train [52][280/3239]	Time 0.245 (0.791)	Data Time 0.001 (0.353)	Loss 2.8569 (2.7290)	Entropy 0.63322 (0.63360)	Top-1 acc 55.078 (58.281)	Top-5 acc 76.562 (79.966)	lr 0.01539
Train [52][290/3239]	Time 0.237 (0.792)	Data Time 0.001 (0.354)	Loss 2.8328 (2.7302)	Entropy 0.63356 (0.63359)	Top-1 acc 58.594 (58.262)	Top-5 acc 76.172 (79.934)	lr 0.01539
Train [52][300/3239]	Time 0.235 (0.780)	Data Time 0.001 (0.343)	Loss 2.7467 (2.7294)	Entropy 0.63377 (0.63359)	Top-1 acc 58.203 (58.273)	Top-5 acc 78.125 (79.951)	lr 0.01539
Train [52][310/3239]	Time 0.263 (0.769)	Data Time 0.001 (0.332)	Loss 2.9795 (2.7329)	Entropy 0.63370 (0.63360)	Top-1 acc 54.688 (58.175)	Top-5 acc 76.562 (79.882)	lr 0.01539
Train [52][320/3239]	Time 0.246 (0.758)	Data Time 0.001 (0.321)	Loss 2.7752 (2.7332)	Entropy 0.63358 (0.63360)	Top-1 acc 56.641 (58.128)	Top-5 acc 78.906 (79.888)	lr 0.01539
Train [52][330/3239]	Time 0.256 (0.764)	Data Time 0.001 (0.328)	Loss 2.8767 (2.7341)	Entropy 0.63337 (0.63360)	Top-1 acc 57.812 (58.117)	Top-5 acc 76.172 (79.873)	lr 0.01539
Train [52][340/3239]	Time 0.288 (0.754)	Data Time 0.001 (0.319)	Loss 2.5426 (2.7332)	Entropy 0.63328 (0.63359)	Top-1 acc 59.375 (58.141)	Top-5 acc 83.203 (79.901)	lr 0.01538
Train [52][350/3239]	Time 0.251 (0.745)	Data Time 0.001 (0.310)	Loss 2.5235 (2.7339)	Entropy 0.63360 (0.63359)	Top-1 acc 63.672 (58.110)	Top-5 acc 82.812 (79.881)	lr 0.01538
Train [52][360/3239]	Time 0.240 (0.750)	Data Time 0.001 (0.315)	Loss 2.9409 (2.7351)	Entropy 0.63374 (0.63359)	Top-1 acc 54.297 (58.093)	Top-5 acc 75.391 (79.844)	lr 0.01538
Train [52][370/3239]	Time 0.238 (0.741)	Data Time 0.001 (0.307)	Loss 2.7006 (2.7355)	Entropy 0.63337 (0.63359)	Top-1 acc 59.766 (58.107)	Top-5 acc 80.078 (79.831)	lr 0.01538
Train [52][380/3239]	Time 0.257 (0.733)	Data Time 0.001 (0.299)	Loss 2.6294 (2.7345)	Entropy 0.63329 (0.63359)	Top-1 acc 59.375 (58.147)	Top-5 acc 83.594 (79.842)	lr 0.01538
Train [52][390/3239]	Time 0.379 (0.738)	Data Time 0.001 (0.303)	Loss 2.7988 (2.7359)	Entropy 0.63346 (0.63358)	Top-1 acc 52.344 (58.093)	Top-5 acc 78.125 (79.828)	lr 0.01538
Train [52][400/3239]	Time 0.238 (0.730)	Data Time 0.001 (0.295)	Loss 2.6837 (2.7363)	Entropy 0.63382 (0.63358)	Top-1 acc 58.594 (58.098)	Top-5 acc 79.688 (79.820)	lr 0.01538
Train [52][410/3239]	Time 0.267 (0.722)	Data Time 0.001 (0.288)	Loss 2.8780 (2.7349)	Entropy 0.63407 (0.63359)	Top-1 acc 55.078 (58.152)	Top-5 acc 78.906 (79.833)	lr 0.01538
Train [52][420/3239]	Time 0.233 (0.735)	Data Time 0.001 (0.300)	Loss 2.5083 (2.7332)	Entropy 0.63404 (0.63360)	Top-1 acc 58.984 (58.150)	Top-5 acc 83.984 (79.871)	lr 0.01538
Train [52][430/3239]	Time 0.274 (0.729)	Data Time 0.001 (0.295)	Loss 2.8317 (2.7322)	Entropy 0.63418 (0.63361)	Top-1 acc 55.078 (58.188)	Top-5 acc 75.781 (79.886)	lr 0.01538
Train [52][440/3239]	Time 0.252 (0.723)	Data Time 0.001 (0.289)	Loss 2.7477 (2.7329)	Entropy 0.63398 (0.63362)	Top-1 acc 56.641 (58.190)	Top-5 acc 78.906 (79.859)	lr 0.01537
Train [52][450/3239]	Time 0.292 (0.790)	Data Time 0.003 (0.282)	Loss 2.7258 (2.7318)	Entropy 0.63378 (0.63363)	Top-1 acc 62.891 (58.225)	Top-5 acc 77.344 (79.878)	lr 0.01537
Train [52][460/3239]	Time 0.239 (0.782)	Data Time 0.001 (0.276)	Loss 2.7634 (2.7314)	Entropy 0.63402 (0.63363)	Top-1 acc 58.984 (58.225)	Top-5 acc 79.297 (79.891)	lr 0.01537
Train [52][470/3239]	Time 0.249 (0.775)	Data Time 0.002 (0.270)	Loss 2.8142 (2.7306)	Entropy 0.63417 (0.63364)	Top-1 acc 56.641 (58.238)	Top-5 acc 78.906 (79.902)	lr 0.01537
Train [52][480/3239]	Time 0.282 (0.768)	Data Time 0.001 (0.265)	Loss 2.7926 (2.7310)	Entropy 0.63407 (0.63365)	Top-1 acc 57.031 (58.241)	Top-5 acc 78.125 (79.892)	lr 0.01537
Train [52][490/3239]	Time 0.242 (0.761)	Data Time 0.001 (0.259)	Loss 2.7935 (2.7302)	Entropy 0.63382 (0.63366)	Top-1 acc 60.547 (58.280)	Top-5 acc 78.906 (79.902)	lr 0.01537
Train [52][500/3239]	Time 0.253 (0.754)	Data Time 0.001 (0.254)	Loss 2.5555 (2.7297)	Entropy 0.63366 (0.63366)	Top-1 acc 60.938 (58.275)	Top-5 acc 83.984 (79.916)	lr 0.01537
Train [52][510/3239]	Time 0.247 (0.748)	Data Time 0.002 (0.249)	Loss 2.6837 (2.7289)	Entropy 0.63382 (0.63366)	Top-1 acc 60.156 (58.301)	Top-5 acc 80.859 (79.927)	lr 0.01537
Train [52][520/3239]	Time 0.241 (0.742)	Data Time 0.001 (0.245)	Loss 2.8514 (2.7302)	Entropy 0.63368 (0.63366)	Top-1 acc 54.297 (58.277)	Top-5 acc 77.344 (79.898)	lr 0.01537
Train [52][530/3239]	Time 0.270 (0.736)	Data Time 0.001 (0.240)	Loss 2.8225 (2.7305)	Entropy 0.63364 (0.63366)	Top-1 acc 56.641 (58.244)	Top-5 acc 76.953 (79.880)	lr 0.01537
Train [52][540/3239]	Time 0.237 (0.731)	Data Time 0.001 (0.236)	Loss 2.5841 (2.7301)	Entropy 0.63382 (0.63366)	Top-1 acc 62.891 (58.267)	Top-5 acc 83.594 (79.886)	lr 0.01537
Train [52][550/3239]	Time 0.320 (0.725)	Data Time 0.001 (0.231)	Loss 2.4716 (2.7308)	Entropy 0.63381 (0.63367)	Top-1 acc 65.234 (58.264)	Top-5 acc 85.547 (79.875)	lr 0.01536
Train [52][560/3239]	Time 0.246 (0.724)	Data Time 0.001 (0.230)	Loss 2.7898 (2.7315)	Entropy 0.63406 (0.63367)	Top-1 acc 52.734 (58.239)	Top-5 acc 78.906 (79.862)	lr 0.01536
Train [52][570/3239]	Time 0.283 (0.719)	Data Time 0.001 (0.226)	Loss 2.9343 (2.7312)	Entropy 0.63407 (0.63368)	Top-1 acc 55.078 (58.246)	Top-5 acc 75.781 (79.872)	lr 0.01536
Train [52][580/3239]	Time 0.283 (0.714)	Data Time 0.001 (0.222)	Loss 2.7099 (2.7316)	Entropy 0.63382 (0.63368)	Top-1 acc 57.422 (58.209)	Top-5 acc 78.516 (79.867)	lr 0.01536
Train [52][590/3239]	Time 0.244 (0.718)	Data Time 0.001 (0.227)	Loss 2.6814 (2.7334)	Entropy 0.63397 (0.63368)	Top-1 acc 62.500 (58.169)	Top-5 acc 82.422 (79.830)	lr 0.01536
Train [52][600/3239]	Time 0.253 (0.716)	Data Time 0.001 (0.226)	Loss 2.8534 (2.7344)	Entropy 0.63409 (0.63369)	Top-1 acc 52.734 (58.139)	Top-5 acc 78.125 (79.816)	lr 0.01536
Train [52][610/3239]	Time 0.229 (0.711)	Data Time 0.001 (0.222)	Loss 2.7719 (2.7349)	Entropy 0.63438 (0.63370)	Top-1 acc 56.641 (58.132)	Top-5 acc 78.906 (79.807)	lr 0.01536
Train [52][620/3239]	Time 0.332 (0.710)	Data Time 0.001 (0.222)	Loss 2.6052 (2.7354)	Entropy 0.63438 (0.63371)	Top-1 acc 58.984 (58.107)	Top-5 acc 81.250 (79.789)	lr 0.01536
Train [52][630/3239]	Time 0.249 (0.713)	Data Time 0.001 (0.225)	Loss 2.7189 (2.7353)	Entropy 0.63433 (0.63372)	Top-1 acc 57.422 (58.105)	Top-5 acc 80.859 (79.793)	lr 0.01536
Train [52][640/3239]	Time 0.261 (0.709)	Data Time 0.003 (0.222)	Loss 2.8398 (2.7355)	Entropy 0.63422 (0.63373)	Top-1 acc 53.125 (58.093)	Top-5 acc 75.781 (79.783)	lr 0.01536
Train [52][650/3239]	Time 0.227 (0.706)	Data Time 0.001 (0.220)	Loss 2.6976 (2.7344)	Entropy 0.63423 (0.63373)	Top-1 acc 58.203 (58.102)	Top-5 acc 82.422 (79.798)	lr 0.01535
Train [52][660/3239]	Time 0.254 (0.707)	Data Time 0.001 (0.222)	Loss 2.7419 (2.7347)	Entropy 0.63426 (0.63374)	Top-1 acc 58.984 (58.099)	Top-5 acc 78.125 (79.794)	lr 0.01535
Train [52][670/3239]	Time 0.263 (0.705)	Data Time 0.001 (0.219)	Loss 2.8056 (2.7342)	Entropy 0.63464 (0.63375)	Top-1 acc 57.812 (58.117)	Top-5 acc 76.562 (79.814)	lr 0.01535
Train [52][680/3239]	Time 0.264 (0.702)	Data Time 0.002 (0.217)	Loss 2.9486 (2.7347)	Entropy 0.63449 (0.63377)	Top-1 acc 50.000 (58.113)	Top-5 acc 76.953 (79.813)	lr 0.01535
Train [52][690/3239]	Time 0.245 (0.706)	Data Time 0.001 (0.221)	Loss 2.5063 (2.7341)	Entropy 0.63441 (0.63378)	Top-1 acc 64.844 (58.133)	Top-5 acc 83.984 (79.828)	lr 0.01535
Train [52][700/3239]	Time 0.280 (0.702)	Data Time 0.001 (0.218)	Loss 2.6300 (2.7346)	Entropy 0.63426 (0.63378)	Top-1 acc 63.672 (58.126)	Top-5 acc 80.078 (79.817)	lr 0.01535
Train [52][710/3239]	Time 0.385 (0.699)	Data Time 0.001 (0.215)	Loss 2.6821 (2.7345)	Entropy 0.63417 (0.63379)	Top-1 acc 58.203 (58.126)	Top-5 acc 80.469 (79.816)	lr 0.01535
Train [52][720/3239]	Time 0.306 (0.703)	Data Time 0.001 (0.220)	Loss 2.6437 (2.7337)	Entropy 0.63446 (0.63380)	Top-1 acc 57.422 (58.141)	Top-5 acc 84.375 (79.836)	lr 0.01535
Train [52][730/3239]	Time 0.274 (0.699)	Data Time 0.001 (0.217)	Loss 2.7973 (2.7333)	Entropy 0.63466 (0.63381)	Top-1 acc 56.641 (58.144)	Top-5 acc 78.516 (79.841)	lr 0.01535
Train [52][740/3239]	Time 0.240 (0.696)	Data Time 0.001 (0.214)	Loss 2.9111 (2.7333)	Entropy 0.63499 (0.63382)	Top-1 acc 52.344 (58.142)	Top-5 acc 76.953 (79.851)	lr 0.01535
Train [52][750/3239]	Time 0.228 (0.692)	Data Time 0.001 (0.211)	Loss 2.6726 (2.7325)	Entropy 0.63507 (0.63384)	Top-1 acc 57.031 (58.154)	Top-5 acc 82.031 (79.873)	lr 0.01534
Train [52][760/3239]	Time 0.273 (0.696)	Data Time 0.001 (0.215)	Loss 2.7808 (2.7320)	Entropy 0.63520 (0.63385)	Top-1 acc 56.641 (58.168)	Top-5 acc 80.859 (79.877)	lr 0.01534
Train [52][770/3239]	Time 0.227 (0.692)	Data Time 0.001 (0.212)	Loss 2.7282 (2.7318)	Entropy 0.63541 (0.63387)	Top-1 acc 57.812 (58.160)	Top-5 acc 81.250 (79.885)	lr 0.01534
Train [52][780/3239]	Time 0.366 (0.690)	Data Time 0.001 (0.210)	Loss 2.8408 (2.7313)	Entropy 0.63527 (0.63389)	Top-1 acc 52.344 (58.169)	Top-5 acc 77.734 (79.900)	lr 0.01534
Train [52][790/3239]	Time 0.363 (0.695)	Data Time 0.002 (0.216)	Loss 2.7179 (2.7310)	Entropy 0.63566 (0.63391)	Top-1 acc 59.375 (58.179)	Top-5 acc 81.641 (79.905)	lr 0.01534
Train [52][800/3239]	Time 0.243 (0.692)	Data Time 0.001 (0.214)	Loss 2.5630 (2.7306)	Entropy 0.63584 (0.63393)	Top-1 acc 66.797 (58.202)	Top-5 acc 84.375 (79.909)	lr 0.01534
Train [52][810/3239]	Time 0.225 (0.692)	Data Time 0.001 (0.214)	Loss 2.8214 (2.7314)	Entropy 0.63605 (0.63396)	Top-1 acc 52.734 (58.165)	Top-5 acc 80.078 (79.884)	lr 0.01534
Train [52][820/3239]	Time 0.236 (0.692)	Data Time 0.001 (0.215)	Loss 2.5977 (2.7315)	Entropy 0.63617 (0.63398)	Top-1 acc 59.766 (58.165)	Top-5 acc 83.984 (79.879)	lr 0.01534
Train [52][830/3239]	Time 0.288 (0.689)	Data Time 0.003 (0.212)	Loss 2.8237 (2.7323)	Entropy 0.63595 (0.63401)	Top-1 acc 55.469 (58.145)	Top-5 acc 78.516 (79.868)	lr 0.01534
Train [52][840/3239]	Time 0.231 (0.692)	Data Time 0.001 (0.216)	Loss 2.7808 (2.7322)	Entropy 0.63581 (0.63403)	Top-1 acc 54.688 (58.141)	Top-5 acc 79.688 (79.870)	lr 0.01534
Train [52][850/3239]	Time 0.237 (0.689)	Data Time 0.001 (0.214)	Loss 2.6525 (2.7332)	Entropy 0.63605 (0.63405)	Top-1 acc 60.547 (58.115)	Top-5 acc 80.078 (79.849)	lr 0.01533
Train [52][860/3239]	Time 0.238 (0.686)	Data Time 0.001 (0.211)	Loss 2.6471 (2.7336)	Entropy 0.63591 (0.63407)	Top-1 acc 60.156 (58.102)	Top-5 acc 80.859 (79.846)	lr 0.01533
Train [52][870/3239]	Time 0.265 (0.684)	Data Time 0.001 (0.210)	Loss 2.7249 (2.7334)	Entropy 0.63585 (0.63410)	Top-1 acc 58.984 (58.093)	Top-5 acc 80.859 (79.844)	lr 0.01533
Train [52][880/3239]	Time 0.253 (0.689)	Data Time 0.001 (0.215)	Loss 2.8683 (2.7340)	Entropy 0.63642 (0.63412)	Top-1 acc 54.297 (58.088)	Top-5 acc 79.688 (79.829)	lr 0.01533
Train [52][890/3239]	Time 0.242 (0.686)	Data Time 0.001 (0.213)	Loss 2.6429 (2.7345)	Entropy 0.63631 (0.63414)	Top-1 acc 61.719 (58.079)	Top-5 acc 81.250 (79.819)	lr 0.01533
Train [52][900/3239]	Time 0.241 (0.683)	Data Time 0.001 (0.210)	Loss 2.7583 (2.7336)	Entropy 0.63680 (0.63417)	Top-1 acc 59.766 (58.105)	Top-5 acc 80.469 (79.839)	lr 0.01533
Train [52][910/3239]	Time 0.234 (0.687)	Data Time 0.001 (0.214)	Loss 2.8907 (2.7337)	Entropy 0.63683 (0.63420)	Top-1 acc 56.641 (58.115)	Top-5 acc 74.609 (79.839)	lr 0.01533
Train [52][920/3239]	Time 0.239 (0.686)	Data Time 0.001 (0.214)	Loss 2.8635 (2.7336)	Entropy 0.63695 (0.63423)	Top-1 acc 55.859 (58.110)	Top-5 acc 77.344 (79.833)	lr 0.01533
Train [52][930/3239]	Time 0.233 (0.683)	Data Time 0.001 (0.211)	Loss 2.6583 (2.7339)	Entropy 0.63627 (0.63425)	Top-1 acc 62.891 (58.113)	Top-5 acc 80.859 (79.830)	lr 0.01533
Train [52][940/3239]	Time 0.358 (0.685)	Data Time 0.001 (0.213)	Loss 2.8354 (2.7345)	Entropy 0.63596 (0.63428)	Top-1 acc 54.297 (58.096)	Top-5 acc 78.125 (79.817)	lr 0.01533
Train [52][950/3239]	Time 0.268 (0.683)	Data Time 0.001 (0.212)	Loss 2.7442 (2.7341)	Entropy 0.63577 (0.63429)	Top-1 acc 57.031 (58.110)	Top-5 acc 81.641 (79.829)	lr 0.01532
Train [52][960/3239]	Time 0.277 (0.680)	Data Time 0.002 (0.210)	Loss 2.8093 (2.7343)	Entropy 0.63559 (0.63431)	Top-1 acc 58.594 (58.100)	Top-5 acc 77.344 (79.829)	lr 0.01532
Train [52][970/3239]	Time 0.229 (0.686)	Data Time 0.001 (0.215)	Loss 2.6649 (2.7343)	Entropy 0.63577 (0.63432)	Top-1 acc 60.156 (58.117)	Top-5 acc 80.078 (79.821)	lr 0.01532
Train [52][980/3239]	Time 0.310 (0.683)	Data Time 0.001 (0.213)	Loss 2.5984 (2.7342)	Entropy 0.63577 (0.63434)	Top-1 acc 62.891 (58.128)	Top-5 acc 80.469 (79.818)	lr 0.01532
Train [52][990/3239]	Time 0.253 (0.681)	Data Time 0.002 (0.211)	Loss 2.5911 (2.7339)	Entropy 0.63567 (0.63435)	Top-1 acc 57.422 (58.129)	Top-5 acc 84.375 (79.827)	lr 0.01532
Train [52][1000/3239]	Time 0.261 (0.686)	Data Time 0.001 (0.216)	Loss 2.6255 (2.7342)	Entropy 0.63600 (0.63437)	Top-1 acc 59.766 (58.114)	Top-5 acc 80.469 (79.817)	lr 0.01532
Train [52][1010/3239]	Time 0.358 (0.683)	Data Time 0.001 (0.214)	Loss 2.5912 (2.7341)	Entropy 0.63569 (0.63438)	Top-1 acc 61.328 (58.126)	Top-5 acc 81.641 (79.819)	lr 0.01532
Train [52][1020/3239]	Time 0.259 (0.681)	Data Time 0.001 (0.212)	Loss 2.7288 (2.7341)	Entropy 0.63503 (0.63439)	Top-1 acc 60.547 (58.130)	Top-5 acc 79.688 (79.817)	lr 0.01532
Train [52][1030/3239]	Time 0.227 (0.678)	Data Time 0.001 (0.210)	Loss 2.7888 (2.7335)	Entropy 0.63489 (0.63440)	Top-1 acc 59.766 (58.140)	Top-5 acc 79.688 (79.837)	lr 0.01532
Train [52][1040/3239]	Time 0.243 (0.681)	Data Time 0.001 (0.213)	Loss 2.9073 (2.7333)	Entropy 0.63470 (0.63440)	Top-1 acc 55.469 (58.134)	Top-5 acc 76.172 (79.843)	lr 0.01532
Train [52][1050/3239]	Time 0.263 (0.679)	Data Time 0.001 (0.211)	Loss 2.6953 (2.7336)	Entropy 0.63485 (0.63441)	Top-1 acc 58.203 (58.126)	Top-5 acc 78.906 (79.832)	lr 0.01531
Train [52][1060/3239]	Time 0.224 (0.676)	Data Time 0.001 (0.209)	Loss 2.7727 (2.7340)	Entropy 0.63509 (0.63441)	Top-1 acc 56.250 (58.117)	Top-5 acc 80.078 (79.827)	lr 0.01531
Train [52][1070/3239]	Time 0.244 (0.680)	Data Time 0.001 (0.214)	Loss 2.8179 (2.7342)	Entropy 0.63528 (0.63442)	Top-1 acc 58.203 (58.122)	Top-5 acc 77.734 (79.825)	lr 0.01531
Train [52][1080/3239]	Time 0.231 (0.678)	Data Time 0.001 (0.212)	Loss 2.6989 (2.7345)	Entropy 0.63509 (0.63443)	Top-1 acc 58.594 (58.122)	Top-5 acc 77.734 (79.814)	lr 0.01531
Train [52][1090/3239]	Time 0.214 (0.676)	Data Time 0.001 (0.210)	Loss 2.6533 (2.7346)	Entropy 0.63518 (0.63443)	Top-1 acc 62.109 (58.113)	Top-5 acc 85.156 (79.810)	lr 0.01531
Train [52][1100/3239]	Time 0.628 (0.708)	Data Time 0.006 (0.213)	Loss 2.8168 (2.7349)	Entropy 0.63492 (0.63444)	Top-1 acc 54.297 (58.108)	Top-5 acc 75.391 (79.796)	lr 0.01531
Train [52][1110/3239]	Time 0.215 (0.706)	Data Time 0.002 (0.211)	Loss 2.7379 (2.7351)	Entropy 0.63477 (0.63444)	Top-1 acc 58.984 (58.102)	Top-5 acc 76.953 (79.788)	lr 0.01531
Train [52][1120/3239]	Time 0.243 (0.703)	Data Time 0.001 (0.209)	Loss 2.4468 (2.7351)	Entropy 0.63484 (0.63445)	Top-1 acc 65.234 (58.093)	Top-5 acc 85.547 (79.789)	lr 0.01531
Train [52][1130/3239]	Time 0.241 (0.701)	Data Time 0.002 (0.207)	Loss 2.5790 (2.7350)	Entropy 0.63504 (0.63445)	Top-1 acc 64.844 (58.099)	Top-5 acc 84.375 (79.790)	lr 0.01531
Train [52][1140/3239]	Time 0.265 (0.698)	Data Time 0.001 (0.205)	Loss 2.6790 (2.7347)	Entropy 0.63502 (0.63446)	Top-1 acc 57.812 (58.105)	Top-5 acc 78.906 (79.792)	lr 0.01531
Train [52][1150/3239]	Time 0.228 (0.696)	Data Time 0.001 (0.204)	Loss 2.8088 (2.7348)	Entropy 0.63517 (0.63446)	Top-1 acc 55.469 (58.090)	Top-5 acc 82.422 (79.793)	lr 0.01530
Train [52][1160/3239]	Time 0.280 (0.694)	Data Time 0.001 (0.202)	Loss 2.9955 (2.7354)	Entropy 0.63535 (0.63447)	Top-1 acc 52.734 (58.076)	Top-5 acc 73.438 (79.772)	lr 0.01530
Train [52][1170/3239]	Time 0.252 (0.692)	Data Time 0.001 (0.200)	Loss 2.8430 (2.7354)	Entropy 0.63551 (0.63448)	Top-1 acc 57.031 (58.069)	Top-5 acc 77.344 (79.777)	lr 0.01530
Train [52][1180/3239]	Time 0.281 (0.689)	Data Time 0.001 (0.199)	Loss 2.6902 (2.7356)	Entropy 0.63574 (0.63449)	Top-1 acc 56.250 (58.066)	Top-5 acc 81.641 (79.779)	lr 0.01530
Train [52][1190/3239]	Time 0.243 (0.687)	Data Time 0.001 (0.197)	Loss 2.5769 (2.7353)	Entropy 0.63532 (0.63449)	Top-1 acc 62.500 (58.069)	Top-5 acc 82.031 (79.787)	lr 0.01530
Train [52][1200/3239]	Time 0.232 (0.686)	Data Time 0.001 (0.195)	Loss 2.7484 (2.7352)	Entropy 0.63521 (0.63450)	Top-1 acc 55.078 (58.066)	Top-5 acc 80.078 (79.792)	lr 0.01530
Train [52][1210/3239]	Time 0.267 (0.684)	Data Time 0.001 (0.194)	Loss 2.8608 (2.7356)	Entropy 0.63503 (0.63451)	Top-1 acc 53.516 (58.063)	Top-5 acc 76.562 (79.785)	lr 0.01530
Train [52][1220/3239]	Time 0.230 (0.684)	Data Time 0.001 (0.195)	Loss 2.6322 (2.7360)	Entropy 0.63545 (0.63451)	Top-1 acc 59.375 (58.058)	Top-5 acc 82.422 (79.778)	lr 0.01530
Train [52][1230/3239]	Time 0.217 (0.682)	Data Time 0.001 (0.193)	Loss 2.6988 (2.7362)	Entropy 0.63535 (0.63452)	Top-1 acc 61.328 (58.053)	Top-5 acc 80.469 (79.770)	lr 0.01530
Train [52][1240/3239]	Time 0.306 (0.685)	Data Time 0.003 (0.197)	Loss 2.8163 (2.7360)	Entropy 0.63532 (0.63453)	Top-1 acc 54.688 (58.048)	Top-5 acc 79.297 (79.772)	lr 0.01530
Train [52][1250/3239]	Time 0.242 (0.684)	Data Time 0.001 (0.196)	Loss 2.7048 (2.7359)	Entropy 0.63550 (0.63453)	Top-1 acc 55.859 (58.057)	Top-5 acc 78.516 (79.771)	lr 0.01530
Train [52][1260/3239]	Time 0.345 (0.682)	Data Time 0.001 (0.194)	Loss 2.7839 (2.7360)	Entropy 0.63535 (0.63454)	Top-1 acc 57.812 (58.058)	Top-5 acc 78.906 (79.770)	lr 0.01529
Train [52][1270/3239]	Time 0.253 (0.681)	Data Time 0.001 (0.194)	Loss 2.9250 (2.7356)	Entropy 0.63531 (0.63455)	Top-1 acc 54.688 (58.076)	Top-5 acc 75.781 (79.777)	lr 0.01529
Train [52][1280/3239]	Time 0.251 (0.683)	Data Time 0.002 (0.196)	Loss 2.9193 (2.7354)	Entropy 0.63566 (0.63455)	Top-1 acc 52.734 (58.088)	Top-5 acc 75.781 (79.777)	lr 0.01529
Train [52][1290/3239]	Time 0.271 (0.681)	Data Time 0.001 (0.194)	Loss 2.7410 (2.7355)	Entropy 0.63557 (0.63456)	Top-1 acc 56.641 (58.082)	Top-5 acc 81.250 (79.769)	lr 0.01529
Train [52][1300/3239]	Time 0.245 (0.683)	Data Time 0.001 (0.196)	Loss 2.7989 (2.7357)	Entropy 0.63569 (0.63457)	Top-1 acc 58.984 (58.081)	Top-5 acc 76.562 (79.761)	lr 0.01529
Train [52][1310/3239]	Time 0.293 (0.681)	Data Time 0.001 (0.195)	Loss 2.6778 (2.7358)	Entropy 0.63512 (0.63458)	Top-1 acc 58.594 (58.082)	Top-5 acc 80.469 (79.757)	lr 0.01529
Train [52][1320/3239]	Time 0.259 (0.679)	Data Time 0.001 (0.194)	Loss 2.5700 (2.7357)	Entropy 0.63507 (0.63458)	Top-1 acc 58.594 (58.092)	Top-5 acc 83.594 (79.762)	lr 0.01529
Train [52][1330/3239]	Time 0.359 (0.679)	Data Time 0.001 (0.193)	Loss 2.9403 (2.7358)	Entropy 0.63558 (0.63459)	Top-1 acc 51.562 (58.096)	Top-5 acc 75.000 (79.762)	lr 0.01529
Train [52][1340/3239]	Time 0.259 (0.680)	Data Time 0.001 (0.195)	Loss 2.5974 (2.7355)	Entropy 0.63554 (0.63460)	Top-1 acc 63.672 (58.092)	Top-5 acc 82.812 (79.770)	lr 0.01529
Train [52][1350/3239]	Time 0.252 (0.679)	Data Time 0.001 (0.194)	Loss 2.7488 (2.7353)	Entropy 0.63564 (0.63460)	Top-1 acc 57.812 (58.092)	Top-5 acc 81.250 (79.776)	lr 0.01529
Train [52][1360/3239]	Time 0.910 (0.677)	Data Time 0.637 (0.193)	Loss 2.6512 (2.7350)	Entropy 0.63573 (0.63461)	Top-1 acc 62.500 (58.089)	Top-5 acc 82.812 (79.784)	lr 0.01528
Train [52][1370/3239]	Time 0.276 (0.679)	Data Time 0.001 (0.195)	Loss 2.5127 (2.7349)	Entropy 0.63551 (0.63462)	Top-1 acc 61.328 (58.100)	Top-5 acc 82.812 (79.781)	lr 0.01528
Train [52][1380/3239]	Time 0.242 (0.678)	Data Time 0.001 (0.195)	Loss 2.6286 (2.7350)	Entropy 0.63553 (0.63462)	Top-1 acc 64.453 (58.097)	Top-5 acc 82.422 (79.783)	lr 0.01528
Train [52][1390/3239]	Time 0.332 (0.677)	Data Time 0.002 (0.193)	Loss 2.7327 (2.7353)	Entropy 0.63521 (0.63463)	Top-1 acc 61.328 (58.095)	Top-5 acc 80.078 (79.774)	lr 0.01528
Train [52][1400/3239]	Time 3.204 (0.679)	Data Time 2.951 (0.196)	Loss 2.6375 (2.7353)	Entropy 0.63554 (0.63464)	Top-1 acc 62.500 (58.091)	Top-5 acc 81.250 (79.778)	lr 0.01528
Train [52][1410/3239]	Time 0.248 (0.678)	Data Time 0.001 (0.196)	Loss 2.7904 (2.7353)	Entropy 0.63525 (0.63464)	Top-1 acc 55.078 (58.087)	Top-5 acc 82.812 (79.783)	lr 0.01528
Train [52][1420/3239]	Time 0.332 (0.677)	Data Time 0.001 (0.194)	Loss 2.9288 (2.7354)	Entropy 0.63498 (0.63465)	Top-1 acc 55.469 (58.088)	Top-5 acc 74.219 (79.778)	lr 0.01528
Train [52][1430/3239]	Time 0.251 (0.679)	Data Time 0.001 (0.197)	Loss 2.6450 (2.7352)	Entropy 0.63537 (0.63465)	Top-1 acc 61.719 (58.091)	Top-5 acc 80.859 (79.787)	lr 0.01528
Train [52][1440/3239]	Time 0.261 (0.680)	Data Time 0.001 (0.198)	Loss 2.9152 (2.7352)	Entropy 0.63561 (0.63465)	Top-1 acc 52.734 (58.094)	Top-5 acc 77.734 (79.786)	lr 0.01528
Train [52][1450/3239]	Time 0.233 (0.678)	Data Time 0.001 (0.196)	Loss 2.5640 (2.7352)	Entropy 0.63561 (0.63466)	Top-1 acc 62.891 (58.098)	Top-5 acc 81.250 (79.784)	lr 0.01528
Train [52][1460/3239]	Time 0.254 (0.681)	Data Time 0.001 (0.200)	Loss 2.6740 (2.7350)	Entropy 0.63568 (0.63467)	Top-1 acc 60.547 (58.104)	Top-5 acc 81.250 (79.790)	lr 0.01527
Train [52][1470/3239]	Time 0.248 (0.682)	Data Time 0.001 (0.201)	Loss 2.6559 (2.7353)	Entropy 0.63590 (0.63467)	Top-1 acc 59.766 (58.094)	Top-5 acc 80.469 (79.789)	lr 0.01527
Train [52][1480/3239]	Time 0.239 (0.680)	Data Time 0.001 (0.199)	Loss 2.7119 (2.7354)	Entropy 0.63606 (0.63468)	Top-1 acc 57.812 (58.094)	Top-5 acc 80.078 (79.784)	lr 0.01527
Train [52][1490/3239]	Time 0.364 (0.682)	Data Time 0.001 (0.202)	Loss 2.7376 (2.7354)	Entropy 0.63587 (0.63469)	Top-1 acc 55.859 (58.093)	Top-5 acc 81.250 (79.782)	lr 0.01527
Train [52][1500/3239]	Time 0.230 (0.680)	Data Time 0.001 (0.200)	Loss 2.7737 (2.7351)	Entropy 0.63603 (0.63470)	Top-1 acc 58.203 (58.095)	Top-5 acc 79.297 (79.794)	lr 0.01527
Train [52][1510/3239]	Time 0.240 (0.682)	Data Time 0.001 (0.203)	Loss 2.8822 (2.7351)	Entropy 0.63614 (0.63471)	Top-1 acc 55.078 (58.093)	Top-5 acc 77.344 (79.793)	lr 0.01527
Train [52][1520/3239]	Time 2.693 (0.682)	Data Time 2.446 (0.203)	Loss 2.8350 (2.7350)	Entropy 0.63620 (0.63472)	Top-1 acc 54.688 (58.089)	Top-5 acc 78.516 (79.792)	lr 0.01527
Train [52][1530/3239]	Time 0.233 (0.680)	Data Time 0.001 (0.202)	Loss 2.5809 (2.7354)	Entropy 0.63588 (0.63473)	Top-1 acc 63.672 (58.081)	Top-5 acc 84.375 (79.787)	lr 0.01527
Train [52][1540/3239]	Time 0.219 (0.683)	Data Time 0.001 (0.205)	Loss 2.7920 (2.7354)	Entropy 0.63591 (0.63473)	Top-1 acc 54.688 (58.075)	Top-5 acc 76.562 (79.782)	lr 0.01527
Train [52][1550/3239]	Time 0.253 (0.682)	Data Time 0.001 (0.204)	Loss 2.7788 (2.7353)	Entropy 0.63612 (0.63474)	Top-1 acc 56.641 (58.068)	Top-5 acc 78.516 (79.788)	lr 0.01527
Train [52][1560/3239]	Time 0.263 (0.682)	Data Time 0.002 (0.204)	Loss 2.7998 (2.7357)	Entropy 0.63596 (0.63475)	Top-1 acc 56.250 (58.064)	Top-5 acc 78.906 (79.784)	lr 0.01526
Train [52][1570/3239]	Time 0.240 (0.682)	Data Time 0.001 (0.205)	Loss 2.7979 (2.7360)	Entropy 0.63619 (0.63476)	Top-1 acc 58.203 (58.061)	Top-5 acc 78.516 (79.780)	lr 0.01526
Train [52][1580/3239]	Time 0.288 (0.680)	Data Time 0.002 (0.204)	Loss 2.7682 (2.7361)	Entropy 0.63646 (0.63477)	Top-1 acc 56.250 (58.057)	Top-5 acc 78.125 (79.782)	lr 0.01526
Train [52][1590/3239]	Time 0.236 (0.684)	Data Time 0.001 (0.207)	Loss 2.7056 (2.7360)	Entropy 0.63666 (0.63478)	Top-1 acc 55.859 (58.056)	Top-5 acc 79.297 (79.781)	lr 0.01526
Train [52][1600/3239]	Time 0.245 (0.685)	Data Time 0.001 (0.209)	Loss 2.5381 (2.7357)	Entropy 0.63710 (0.63479)	Top-1 acc 62.500 (58.068)	Top-5 acc 85.156 (79.790)	lr 0.01526
Train [52][1610/3239]	Time 0.234 (0.683)	Data Time 0.001 (0.207)	Loss 2.9542 (2.7358)	Entropy 0.63686 (0.63481)	Top-1 acc 55.078 (58.064)	Top-5 acc 77.344 (79.792)	lr 0.01526
Train [52][1620/3239]	Time 0.246 (0.686)	Data Time 0.001 (0.211)	Loss 2.7086 (2.7360)	Entropy 0.63690 (0.63482)	Top-1 acc 57.031 (58.060)	Top-5 acc 82.031 (79.791)	lr 0.01526
Train [52][1630/3239]	Time 0.245 (0.686)	Data Time 0.001 (0.211)	Loss 2.5914 (2.7359)	Entropy 0.63660 (0.63483)	Top-1 acc 58.594 (58.057)	Top-5 acc 83.203 (79.790)	lr 0.01526
Train [52][1640/3239]	Time 0.256 (0.685)	Data Time 0.001 (0.210)	Loss 2.6095 (2.7359)	Entropy 0.63687 (0.63484)	Top-1 acc 61.719 (58.052)	Top-5 acc 82.812 (79.789)	lr 0.01526
Train [52][1650/3239]	Time 0.344 (0.690)	Data Time 0.001 (0.215)	Loss 2.4291 (2.7359)	Entropy 0.63692 (0.63485)	Top-1 acc 66.406 (58.050)	Top-5 acc 87.109 (79.788)	lr 0.01526
Train [52][1660/3239]	Time 0.241 (0.688)	Data Time 0.001 (0.213)	Loss 2.7464 (2.7360)	Entropy 0.63689 (0.63487)	Top-1 acc 58.594 (58.054)	Top-5 acc 78.516 (79.792)	lr 0.01525
Train [52][1670/3239]	Time 0.273 (0.687)	Data Time 0.001 (0.213)	Loss 2.7035 (2.7359)	Entropy 0.63680 (0.63488)	Top-1 acc 58.594 (58.056)	Top-5 acc 79.688 (79.794)	lr 0.01525
Train [52][1680/3239]	Time 8.014 (0.693)	Data Time 7.772 (0.219)	Loss 2.7398 (2.7359)	Entropy 0.63692 (0.63489)	Top-1 acc 60.547 (58.051)	Top-5 acc 79.688 (79.798)	lr 0.01525
Train [52][1690/3239]	Time 0.250 (0.691)	Data Time 0.002 (0.217)	Loss 2.8209 (2.7355)	Entropy 0.63663 (0.63490)	Top-1 acc 56.641 (58.063)	Top-5 acc 78.125 (79.802)	lr 0.01525
Train [52][1700/3239]	Time 0.249 (0.690)	Data Time 0.001 (0.216)	Loss 2.6719 (2.7356)	Entropy 0.63653 (0.63491)	Top-1 acc 58.984 (58.063)	Top-5 acc 82.031 (79.806)	lr 0.01525
Train [52][1710/3239]	Time 1.216 (0.690)	Data Time 0.954 (0.217)	Loss 2.7451 (2.7359)	Entropy 0.63603 (0.63492)	Top-1 acc 58.984 (58.052)	Top-5 acc 76.953 (79.798)	lr 0.01525
Train [52][1720/3239]	Time 0.333 (0.694)	Data Time 0.001 (0.221)	Loss 2.5936 (2.7357)	Entropy 0.63562 (0.63493)	Top-1 acc 58.203 (58.056)	Top-5 acc 85.547 (79.806)	lr 0.01525
Train [52][1730/3239]	Time 0.233 (0.692)	Data Time 0.001 (0.220)	Loss 2.8388 (2.7354)	Entropy 0.63547 (0.63493)	Top-1 acc 57.812 (58.063)	Top-5 acc 77.734 (79.814)	lr 0.01525
Train [52][1740/3239]	Time 0.245 (0.694)	Data Time 0.001 (0.222)	Loss 2.7431 (2.7352)	Entropy 0.63567 (0.63493)	Top-1 acc 56.641 (58.058)	Top-5 acc 77.734 (79.817)	lr 0.01525
Train [52][1750/3239]	Time 0.245 (0.697)	Data Time 0.001 (0.225)	Loss 3.0625 (2.7352)	Entropy 0.63560 (0.63494)	Top-1 acc 48.047 (58.056)	Top-5 acc 75.000 (79.816)	lr 0.01525
Train [52][1760/3239]	Time 0.274 (0.716)	Data Time 0.004 (0.225)	Loss 2.7330 (2.7349)	Entropy 0.63569 (0.63494)	Top-1 acc 57.422 (58.062)	Top-5 acc 80.469 (79.824)	lr 0.01524
Train [52][1770/3239]	Time 0.247 (0.714)	Data Time 0.002 (0.223)	Loss 2.9426 (2.7356)	Entropy 0.63587 (0.63495)	Top-1 acc 57.031 (58.050)	Top-5 acc 72.266 (79.809)	lr 0.01524
Train [52][1780/3239]	Time 0.247 (0.713)	Data Time 0.002 (0.222)	Loss 2.7694 (2.7356)	Entropy 0.63523 (0.63495)	Top-1 acc 58.203 (58.049)	Top-5 acc 80.469 (79.811)	lr 0.01524
Train [52][1790/3239]	Time 0.261 (0.711)	Data Time 0.002 (0.221)	Loss 2.8344 (2.7353)	Entropy 0.63521 (0.63495)	Top-1 acc 55.469 (58.054)	Top-5 acc 76.562 (79.815)	lr 0.01524
Train [52][1800/3239]	Time 0.242 (0.710)	Data Time 0.001 (0.220)	Loss 2.6130 (2.7355)	Entropy 0.63556 (0.63495)	Top-1 acc 58.594 (58.051)	Top-5 acc 82.031 (79.813)	lr 0.01524
Train [52][1810/3239]	Time 0.348 (0.708)	Data Time 0.001 (0.219)	Loss 2.7540 (2.7354)	Entropy 0.63578 (0.63496)	Top-1 acc 58.203 (58.055)	Top-5 acc 80.078 (79.811)	lr 0.01524
Train [52][1820/3239]	Time 0.235 (0.707)	Data Time 0.001 (0.217)	Loss 2.5575 (2.7356)	Entropy 0.63579 (0.63496)	Top-1 acc 63.281 (58.043)	Top-5 acc 84.766 (79.807)	lr 0.01524
Train [52][1830/3239]	Time 0.267 (0.706)	Data Time 0.001 (0.216)	Loss 2.7873 (2.7362)	Entropy 0.63585 (0.63497)	Top-1 acc 60.156 (58.029)	Top-5 acc 78.516 (79.796)	lr 0.01524
Train [52][1840/3239]	Time 0.246 (0.705)	Data Time 0.001 (0.216)	Loss 2.7926 (2.7365)	Entropy 0.63602 (0.63497)	Top-1 acc 56.641 (58.024)	Top-5 acc 77.734 (79.788)	lr 0.01524
Train [52][1850/3239]	Time 0.267 (0.704)	Data Time 0.001 (0.215)	Loss 2.8215 (2.7368)	Entropy 0.63610 (0.63498)	Top-1 acc 56.250 (58.010)	Top-5 acc 78.906 (79.787)	lr 0.01524
Train [52][1860/3239]	Time 0.242 (0.709)	Data Time 0.001 (0.221)	Loss 2.7660 (2.7370)	Entropy 0.63612 (0.63498)	Top-1 acc 55.859 (58.004)	Top-5 acc 76.172 (79.780)	lr 0.01524
Train [52][1870/3239]	Time 0.235 (0.708)	Data Time 0.001 (0.220)	Loss 2.6509 (2.7373)	Entropy 0.63612 (0.63499)	Top-1 acc 59.766 (57.998)	Top-5 acc 82.031 (79.777)	lr 0.01523
Train [52][1880/3239]	Time 0.620 (0.707)	Data Time 0.276 (0.219)	Loss 2.8970 (2.7376)	Entropy 0.63629 (0.63500)	Top-1 acc 53.906 (57.993)	Top-5 acc 78.906 (79.771)	lr 0.01523
Train [52][1890/3239]	Time 0.251 (0.712)	Data Time 0.001 (0.225)	Loss 2.7415 (2.7376)	Entropy 0.63575 (0.63500)	Top-1 acc 54.688 (57.996)	Top-5 acc 78.125 (79.769)	lr 0.01523
Train [52][1900/3239]	Time 0.226 (0.711)	Data Time 0.001 (0.224)	Loss 3.0657 (2.7378)	Entropy 0.63597 (0.63501)	Top-1 acc 53.516 (57.995)	Top-5 acc 73.438 (79.767)	lr 0.01523
Train [52][1910/3239]	Time 1.857 (0.711)	Data Time 1.604 (0.224)	Loss 2.7285 (2.7377)	Entropy 0.63609 (0.63501)	Top-1 acc 60.547 (58.000)	Top-5 acc 80.078 (79.767)	lr 0.01523
Train [52][1920/3239]	Time 0.240 (0.715)	Data Time 0.001 (0.229)	Loss 2.6801 (2.7380)	Entropy 0.63585 (0.63502)	Top-1 acc 57.031 (57.990)	Top-5 acc 80.469 (79.757)	lr 0.01523
Train [52][1930/3239]	Time 2.118 (0.716)	Data Time 1.870 (0.230)	Loss 2.7367 (2.7381)	Entropy 0.63591 (0.63502)	Top-1 acc 54.688 (57.990)	Top-5 acc 84.766 (79.760)	lr 0.01523
Train [52][1940/3239]	Time 0.260 (0.715)	Data Time 0.001 (0.228)	Loss 2.8015 (2.7379)	Entropy 0.63617 (0.63503)	Top-1 acc 55.078 (57.985)	Top-5 acc 79.688 (79.765)	lr 0.01523
Train [52][1950/3239]	Time 0.257 (0.720)	Data Time 0.001 (0.234)	Loss 2.7188 (2.7376)	Entropy 0.63633 (0.63503)	Top-1 acc 60.547 (57.988)	Top-5 acc 78.906 (79.768)	lr 0.01523
Train [52][1960/3239]	Time 0.244 (0.719)	Data Time 0.001 (0.233)	Loss 2.9741 (2.7377)	Entropy 0.63616 (0.63504)	Top-1 acc 51.953 (57.988)	Top-5 acc 77.734 (79.764)	lr 0.01523
Train [52][1970/3239]	Time 0.349 (0.719)	Data Time 0.001 (0.233)	Loss 2.6764 (2.7379)	Entropy 0.63610 (0.63504)	Top-1 acc 59.766 (57.987)	Top-5 acc 80.469 (79.759)	lr 0.01522
Train [52][1980/3239]	Time 0.257 (0.724)	Data Time 0.001 (0.239)	Loss 2.6862 (2.7377)	Entropy 0.63588 (0.63505)	Top-1 acc 56.641 (57.987)	Top-5 acc 81.641 (79.765)	lr 0.01522
Train [52][1990/3239]	Time 0.238 (0.727)	Data Time 0.001 (0.242)	Loss 2.5646 (2.7376)	Entropy 0.63609 (0.63505)	Top-1 acc 60.547 (57.991)	Top-5 acc 84.766 (79.767)	lr 0.01522
Train [52][2000/3239]	Time 0.242 (0.725)	Data Time 0.001 (0.240)	Loss 2.7229 (2.7378)	Entropy 0.63605 (0.63506)	Top-1 acc 59.375 (57.986)	Top-5 acc 80.859 (79.764)	lr 0.01522
Train [52][2010/3239]	Time 0.238 (0.725)	Data Time 0.001 (0.240)	Loss 2.6792 (2.7379)	Entropy 0.63587 (0.63506)	Top-1 acc 58.203 (57.981)	Top-5 acc 79.688 (79.762)	lr 0.01522
Train [52][2020/3239]	Time 0.249 (0.732)	Data Time 0.001 (0.247)	Loss 2.8074 (2.7379)	Entropy 0.63595 (0.63507)	Top-1 acc 54.688 (57.979)	Top-5 acc 78.516 (79.764)	lr 0.01522
Train [52][2030/3239]	Time 0.239 (0.730)	Data Time 0.001 (0.246)	Loss 2.6448 (2.7379)	Entropy 0.63578 (0.63507)	Top-1 acc 60.156 (57.980)	Top-5 acc 82.031 (79.768)	lr 0.01522
Train [52][2040/3239]	Time 2.243 (0.730)	Data Time 1.876 (0.246)	Loss 2.5686 (2.7379)	Entropy 0.63541 (0.63507)	Top-1 acc 65.234 (57.983)	Top-5 acc 80.859 (79.770)	lr 0.01522
Train [52][2050/3239]	Time 0.245 (0.731)	Data Time 0.001 (0.247)	Loss 2.6074 (2.7374)	Entropy 0.63534 (0.63508)	Top-1 acc 61.328 (57.998)	Top-5 acc 80.859 (79.777)	lr 0.01522
Train [52][2060/3239]	Time 0.282 (0.735)	Data Time 0.001 (0.252)	Loss 2.5939 (2.7376)	Entropy 0.63509 (0.63508)	Top-1 acc 58.203 (57.986)	Top-5 acc 82.812 (79.781)	lr 0.01522
Train [52][2070/3239]	Time 0.252 (0.734)	Data Time 0.001 (0.251)	Loss 2.7454 (2.7374)	Entropy 0.63506 (0.63508)	Top-1 acc 60.938 (57.990)	Top-5 acc 80.859 (79.782)	lr 0.01521
Train [52][2080/3239]	Time 0.230 (0.736)	Data Time 0.001 (0.253)	Loss 2.6540 (2.7375)	Entropy 0.63532 (0.63508)	Top-1 acc 58.203 (57.988)	Top-5 acc 78.906 (79.780)	lr 0.01521
Train [52][2090/3239]	Time 0.234 (0.741)	Data Time 0.001 (0.259)	Loss 2.5991 (2.7374)	Entropy 0.63525 (0.63508)	Top-1 acc 63.672 (57.996)	Top-5 acc 80.859 (79.783)	lr 0.01521
Train [52][2100/3239]	Time 0.256 (0.740)	Data Time 0.001 (0.257)	Loss 2.9886 (2.7378)	Entropy 0.63546 (0.63508)	Top-1 acc 53.516 (57.986)	Top-5 acc 75.000 (79.775)	lr 0.01521
Train [52][2110/3239]	Time 0.255 (0.741)	Data Time 0.001 (0.260)	Loss 2.9878 (2.7378)	Entropy 0.63519 (0.63508)	Top-1 acc 53.906 (57.988)	Top-5 acc 76.953 (79.774)	lr 0.01521
Train [52][2120/3239]	Time 0.222 (0.746)	Data Time 0.001 (0.264)	Loss 2.6316 (2.7375)	Entropy 0.63534 (0.63508)	Top-1 acc 57.812 (57.991)	Top-5 acc 82.422 (79.784)	lr 0.01521
Train [52][2130/3239]	Time 0.345 (0.744)	Data Time 0.001 (0.263)	Loss 2.6676 (2.7378)	Entropy 0.63537 (0.63508)	Top-1 acc 62.891 (57.989)	Top-5 acc 80.859 (79.782)	lr 0.01521
Train [52][2140/3239]	Time 0.227 (0.746)	Data Time 0.001 (0.266)	Loss 2.6894 (2.7377)	Entropy 0.63526 (0.63508)	Top-1 acc 57.031 (57.993)	Top-5 acc 79.688 (79.783)	lr 0.01521
Train [52][2150/3239]	Time 0.242 (0.752)	Data Time 0.001 (0.271)	Loss 2.7892 (2.7377)	Entropy 0.63526 (0.63508)	Top-1 acc 60.156 (57.995)	Top-5 acc 79.688 (79.783)	lr 0.01521
Train [52][2160/3239]	Time 0.246 (0.750)	Data Time 0.002 (0.270)	Loss 2.6265 (2.7375)	Entropy 0.63490 (0.63508)	Top-1 acc 60.547 (58.005)	Top-5 acc 77.734 (79.785)	lr 0.01521
Train [52][2170/3239]	Time 0.226 (0.753)	Data Time 0.001 (0.273)	Loss 2.7403 (2.7373)	Entropy 0.63495 (0.63508)	Top-1 acc 58.594 (58.011)	Top-5 acc 81.250 (79.785)	lr 0.01520
Train [52][2180/3239]	Time 0.250 (0.759)	Data Time 0.001 (0.279)	Loss 2.6137 (2.7372)	Entropy 0.63502 (0.63508)	Top-1 acc 62.109 (58.016)	Top-5 acc 80.078 (79.784)	lr 0.01520
Train [52][2190/3239]	Time 0.252 (0.757)	Data Time 0.002 (0.278)	Loss 2.6359 (2.7370)	Entropy 0.63502 (0.63508)	Top-1 acc 59.375 (58.022)	Top-5 acc 84.375 (79.789)	lr 0.01520
Train [52][2200/3239]	Time 1.429 (0.759)	Data Time 1.084 (0.280)	Loss 2.7738 (2.7371)	Entropy 0.63513 (0.63508)	Top-1 acc 57.422 (58.018)	Top-5 acc 75.000 (79.786)	lr 0.01520
Train [52][2210/3239]	Time 0.239 (0.759)	Data Time 0.001 (0.281)	Loss 2.8807 (2.7371)	Entropy 0.63519 (0.63508)	Top-1 acc 53.125 (58.017)	Top-5 acc 79.297 (79.785)	lr 0.01520
Train [52][2220/3239]	Time 0.232 (0.762)	Data Time 0.001 (0.284)	Loss 2.7087 (2.7369)	Entropy 0.63531 (0.63508)	Top-1 acc 59.766 (58.024)	Top-5 acc 79.688 (79.791)	lr 0.01520
Train [52][2230/3239]	Time 0.228 (0.761)	Data Time 0.001 (0.283)	Loss 3.2418 (2.7370)	Entropy 0.63514 (0.63509)	Top-1 acc 49.219 (58.019)	Top-5 acc 70.703 (79.790)	lr 0.01520
Train [52][2240/3239]	Time 0.265 (0.764)	Data Time 0.001 (0.286)	Loss 2.7405 (2.7369)	Entropy 0.63541 (0.63509)	Top-1 acc 56.250 (58.024)	Top-5 acc 80.469 (79.795)	lr 0.01520
Train [52][2250/3239]	Time 0.231 (0.767)	Data Time 0.001 (0.289)	Loss 2.9365 (2.7370)	Entropy 0.63525 (0.63509)	Top-1 acc 54.297 (58.017)	Top-5 acc 73.828 (79.791)	lr 0.01520
Train [52][2260/3239]	Time 0.237 (0.765)	Data Time 0.001 (0.288)	Loss 2.6562 (2.7372)	Entropy 0.63499 (0.63509)	Top-1 acc 57.812 (58.018)	Top-5 acc 80.859 (79.789)	lr 0.01520
Train [52][2270/3239]	Time 0.350 (0.766)	Data Time 0.001 (0.289)	Loss 2.6542 (2.7371)	Entropy 0.63512 (0.63509)	Top-1 acc 57.422 (58.017)	Top-5 acc 84.766 (79.792)	lr 0.01519
Train [52][2280/3239]	Time 0.221 (0.767)	Data Time 0.001 (0.290)	Loss 3.0073 (2.7371)	Entropy 0.63493 (0.63509)	Top-1 acc 53.125 (58.017)	Top-5 acc 75.781 (79.794)	lr 0.01519
Train [52][2290/3239]	Time 0.242 (0.765)	Data Time 0.001 (0.289)	Loss 2.7817 (2.7367)	Entropy 0.63483 (0.63509)	Top-1 acc 58.203 (58.030)	Top-5 acc 80.859 (79.802)	lr 0.01519
Train [52][2300/3239]	Time 0.248 (0.768)	Data Time 0.001 (0.291)	Loss 2.8228 (2.7366)	Entropy 0.63479 (0.63508)	Top-1 acc 55.469 (58.032)	Top-5 acc 78.125 (79.805)	lr 0.01519
Train [52][2310/3239]	Time 0.237 (0.773)	Data Time 0.002 (0.297)	Loss 2.6088 (2.7362)	Entropy 0.63479 (0.63508)	Top-1 acc 59.375 (58.040)	Top-5 acc 82.031 (79.811)	lr 0.01519
Train [52][2320/3239]	Time 0.243 (0.772)	Data Time 0.001 (0.296)	Loss 2.9491 (2.7360)	Entropy 0.63492 (0.63508)	Top-1 acc 53.906 (58.048)	Top-5 acc 74.219 (79.812)	lr 0.01519
Train [52][2330/3239]	Time 0.276 (0.774)	Data Time 0.002 (0.298)	Loss 2.6783 (2.7359)	Entropy 0.63497 (0.63508)	Top-1 acc 58.203 (58.048)	Top-5 acc 82.031 (79.815)	lr 0.01519
Train [52][2340/3239]	Time 0.238 (0.781)	Data Time 0.001 (0.305)	Loss 2.7526 (2.7360)	Entropy 0.63513 (0.63508)	Top-1 acc 55.078 (58.047)	Top-5 acc 80.469 (79.811)	lr 0.01519
Train [52][2350/3239]	Time 0.256 (0.779)	Data Time 0.002 (0.304)	Loss 2.9306 (2.7357)	Entropy 0.63504 (0.63508)	Top-1 acc 52.344 (58.052)	Top-5 acc 76.172 (79.818)	lr 0.01519
Train [52][2360/3239]	Time 2.356 (0.780)	Data Time 2.010 (0.305)	Loss 2.5892 (2.7355)	Entropy 0.63490 (0.63508)	Top-1 acc 58.984 (58.055)	Top-5 acc 82.812 (79.822)	lr 0.01519
Train [52][2370/3239]	Time 0.241 (0.781)	Data Time 0.001 (0.306)	Loss 2.7566 (2.7356)	Entropy 0.63500 (0.63508)	Top-1 acc 58.594 (58.058)	Top-5 acc 81.641 (79.821)	lr 0.01518
Train [52][2380/3239]	Time 0.256 (0.786)	Data Time 0.001 (0.312)	Loss 2.7903 (2.7355)	Entropy 0.63509 (0.63508)	Top-1 acc 57.031 (58.060)	Top-5 acc 78.125 (79.823)	lr 0.01518
Train [52][2390/3239]	Time 0.252 (0.785)	Data Time 0.001 (0.310)	Loss 2.6373 (2.7355)	Entropy 0.63503 (0.63508)	Top-1 acc 62.109 (58.060)	Top-5 acc 80.859 (79.824)	lr 0.01518
Train [52][2400/3239]	Time 0.231 (0.788)	Data Time 0.001 (0.314)	Loss 2.6889 (2.7357)	Entropy 0.63507 (0.63508)	Top-1 acc 61.719 (58.057)	Top-5 acc 83.594 (79.824)	lr 0.01518
Train [52][2410/3239]	Time 0.399 (0.806)	Data Time 0.038 (0.317)	Loss 2.7171 (2.7356)	Entropy 0.63499 (0.63508)	Top-1 acc 58.203 (58.059)	Top-5 acc 81.641 (79.827)	lr 0.01518
Train [52][2420/3239]	Time 0.241 (0.804)	Data Time 0.002 (0.316)	Loss 2.6658 (2.7359)	Entropy 0.63501 (0.63508)	Top-1 acc 65.625 (58.053)	Top-5 acc 82.422 (79.821)	lr 0.01518
Train [52][2430/3239]	Time 0.243 (0.803)	Data Time 0.002 (0.315)	Loss 2.4250 (2.7357)	Entropy 0.63500 (0.63508)	Top-1 acc 66.797 (58.053)	Top-5 acc 83.984 (79.824)	lr 0.01518
Train [52][2440/3239]	Time 0.252 (0.801)	Data Time 0.002 (0.313)	Loss 2.7369 (2.7359)	Entropy 0.63462 (0.63508)	Top-1 acc 58.594 (58.046)	Top-5 acc 79.297 (79.819)	lr 0.01518
Train [52][2450/3239]	Time 0.283 (0.800)	Data Time 0.001 (0.312)	Loss 2.8244 (2.7359)	Entropy 0.63458 (0.63507)	Top-1 acc 58.594 (58.047)	Top-5 acc 77.344 (79.819)	lr 0.01518
Train [52][2460/3239]	Time 0.239 (0.798)	Data Time 0.001 (0.311)	Loss 2.7210 (2.7359)	Entropy 0.63467 (0.63507)	Top-1 acc 57.422 (58.048)	Top-5 acc 80.859 (79.820)	lr 0.01518
Train [52][2470/3239]	Time 0.267 (0.797)	Data Time 0.001 (0.310)	Loss 2.5687 (2.7360)	Entropy 0.63454 (0.63507)	Top-1 acc 62.500 (58.045)	Top-5 acc 83.203 (79.818)	lr 0.01517
Train [52][2480/3239]	Time 0.239 (0.796)	Data Time 0.001 (0.308)	Loss 2.8591 (2.7361)	Entropy 0.63454 (0.63507)	Top-1 acc 58.203 (58.040)	Top-5 acc 76.953 (79.816)	lr 0.01517
Train [52][2490/3239]	Time 0.244 (0.794)	Data Time 0.001 (0.307)	Loss 2.8058 (2.7361)	Entropy 0.63472 (0.63507)	Top-1 acc 57.812 (58.037)	Top-5 acc 79.297 (79.819)	lr 0.01517
Train [52][2500/3239]	Time 0.276 (0.794)	Data Time 0.001 (0.307)	Loss 2.7413 (2.7363)	Entropy 0.63486 (0.63507)	Top-1 acc 61.719 (58.035)	Top-5 acc 78.516 (79.816)	lr 0.01517
Train [52][2510/3239]	Time 0.239 (0.794)	Data Time 0.001 (0.307)	Loss 2.8631 (2.7366)	Entropy 0.63512 (0.63507)	Top-1 acc 55.859 (58.030)	Top-5 acc 75.781 (79.807)	lr 0.01517
Train [52][2520/3239]	Time 0.346 (0.797)	Data Time 0.001 (0.310)	Loss 2.8898 (2.7368)	Entropy 0.63534 (0.63507)	Top-1 acc 50.781 (58.024)	Top-5 acc 78.125 (79.805)	lr 0.01517
Train [52][2530/3239]	Time 0.482 (0.798)	Data Time 0.220 (0.311)	Loss 2.7982 (2.7366)	Entropy 0.63504 (0.63507)	Top-1 acc 57.812 (58.030)	Top-5 acc 79.297 (79.806)	lr 0.01517
Train [52][2540/3239]	Time 0.253 (0.798)	Data Time 0.001 (0.312)	Loss 2.8563 (2.7369)	Entropy 0.63533 (0.63507)	Top-1 acc 59.766 (58.029)	Top-5 acc 77.344 (79.799)	lr 0.01517
Train [52][2550/3239]	Time 0.243 (0.802)	Data Time 0.001 (0.316)	Loss 3.0340 (2.7370)	Entropy 0.63562 (0.63507)	Top-1 acc 52.734 (58.020)	Top-5 acc 73.438 (79.798)	lr 0.01517
Train [52][2560/3239]	Time 0.243 (0.802)	Data Time 0.001 (0.317)	Loss 2.7078 (2.7370)	Entropy 0.63552 (0.63507)	Top-1 acc 57.031 (58.021)	Top-5 acc 79.688 (79.798)	lr 0.01517
Train [52][2570/3239]	Time 0.656 (0.802)	Data Time 0.411 (0.316)	Loss 2.7296 (2.7372)	Entropy 0.63547 (0.63507)	Top-1 acc 57.422 (58.015)	Top-5 acc 79.297 (79.792)	lr 0.01517
Train [52][2580/3239]	Time 0.249 (0.805)	Data Time 0.001 (0.320)	Loss 2.6680 (2.7374)	Entropy 0.63549 (0.63507)	Top-1 acc 58.203 (58.012)	Top-5 acc 81.250 (79.787)	lr 0.01516
Train [52][2590/3239]	Time 5.277 (0.808)	Data Time 4.903 (0.323)	Loss 2.9600 (2.7373)	Entropy 0.63561 (0.63508)	Top-1 acc 50.391 (58.010)	Top-5 acc 74.219 (79.789)	lr 0.01516
Train [52][2600/3239]	Time 0.240 (0.807)	Data Time 0.001 (0.322)	Loss 2.6337 (2.7372)	Entropy 0.63552 (0.63508)	Top-1 acc 60.938 (58.010)	Top-5 acc 82.812 (79.793)	lr 0.01516
Train [52][2610/3239]	Time 0.266 (0.809)	Data Time 0.001 (0.324)	Loss 2.7262 (2.7373)	Entropy 0.63544 (0.63508)	Top-1 acc 59.375 (58.009)	Top-5 acc 79.297 (79.791)	lr 0.01516
Train [52][2620/3239]	Time 0.235 (0.811)	Data Time 0.001 (0.326)	Loss 2.8167 (2.7375)	Entropy 0.63541 (0.63508)	Top-1 acc 57.422 (58.006)	Top-5 acc 76.562 (79.786)	lr 0.01516
Train [52][2630/3239]	Time 0.233 (0.812)	Data Time 0.001 (0.328)	Loss 2.6627 (2.7373)	Entropy 0.63536 (0.63508)	Top-1 acc 57.812 (58.012)	Top-5 acc 81.641 (79.787)	lr 0.01516
Train [52][2640/3239]	Time 3.885 (0.813)	Data Time 3.630 (0.329)	Loss 2.6803 (2.7372)	Entropy 0.63521 (0.63508)	Top-1 acc 62.500 (58.018)	Top-5 acc 81.641 (79.789)	lr 0.01516
Train [52][2650/3239]	Time 0.242 (0.815)	Data Time 0.001 (0.331)	Loss 2.6813 (2.7371)	Entropy 0.63555 (0.63508)	Top-1 acc 64.062 (58.022)	Top-5 acc 82.031 (79.790)	lr 0.01516
Train [52][2660/3239]	Time 0.230 (0.816)	Data Time 0.001 (0.333)	Loss 2.6806 (2.7372)	Entropy 0.63533 (0.63509)	Top-1 acc 62.891 (58.020)	Top-5 acc 81.250 (79.787)	lr 0.01516
Train [52][2670/3239]	Time 0.241 (0.817)	Data Time 0.001 (0.334)	Loss 2.4171 (2.7372)	Entropy 0.63537 (0.63509)	Top-1 acc 68.359 (58.022)	Top-5 acc 85.547 (79.786)	lr 0.01516
Train [52][2680/3239]	Time 0.364 (0.819)	Data Time 0.001 (0.336)	Loss 2.8932 (2.7374)	Entropy 0.63553 (0.63509)	Top-1 acc 53.906 (58.014)	Top-5 acc 78.906 (79.784)	lr 0.01515
Train [52][2690/3239]	Time 0.236 (0.820)	Data Time 0.002 (0.337)	Loss 2.6473 (2.7372)	Entropy 0.63564 (0.63509)	Top-1 acc 60.156 (58.019)	Top-5 acc 80.859 (79.788)	lr 0.01515
Train [52][2700/3239]	Time 0.260 (0.823)	Data Time 0.001 (0.340)	Loss 2.7715 (2.7373)	Entropy 0.63564 (0.63509)	Top-1 acc 55.859 (58.014)	Top-5 acc 78.125 (79.785)	lr 0.01515
Train [52][2710/3239]	Time 0.243 (0.823)	Data Time 0.001 (0.341)	Loss 2.6318 (2.7375)	Entropy 0.63590 (0.63509)	Top-1 acc 62.500 (58.008)	Top-5 acc 82.422 (79.784)	lr 0.01515
Train [52][2720/3239]	Time 0.295 (0.825)	Data Time 0.001 (0.343)	Loss 2.7402 (2.7375)	Entropy 0.63560 (0.63510)	Top-1 acc 58.594 (58.009)	Top-5 acc 80.859 (79.786)	lr 0.01515
Train [52][2730/3239]	Time 5.345 (0.826)	Data Time 5.089 (0.344)	Loss 2.6435 (2.7375)	Entropy 0.63579 (0.63510)	Top-1 acc 61.719 (58.008)	Top-5 acc 83.594 (79.789)	lr 0.01515
Train [52][2740/3239]	Time 0.244 (0.829)	Data Time 0.002 (0.347)	Loss 2.6568 (2.7377)	Entropy 0.63575 (0.63510)	Top-1 acc 61.719 (58.004)	Top-5 acc 79.297 (79.782)	lr 0.01515
Train [52][2750/3239]	Time 0.890 (0.830)	Data Time 0.536 (0.348)	Loss 2.5478 (2.7377)	Entropy 0.63565 (0.63510)	Top-1 acc 62.891 (58.004)	Top-5 acc 85.547 (79.785)	lr 0.01515
Train [52][2760/3239]	Time 0.237 (0.830)	Data Time 0.001 (0.349)	Loss 2.9381 (2.7379)	Entropy 0.63553 (0.63510)	Top-1 acc 52.734 (57.999)	Top-5 acc 75.391 (79.783)	lr 0.01515
Train [52][2770/3239]	Time 3.036 (0.831)	Data Time 2.758 (0.349)	Loss 2.8318 (2.7379)	Entropy 0.63600 (0.63511)	Top-1 acc 55.469 (57.996)	Top-5 acc 77.344 (79.782)	lr 0.01515
Train [52][2780/3239]	Time 0.249 (0.835)	Data Time 0.001 (0.354)	Loss 2.7702 (2.7380)	Entropy 0.63625 (0.63511)	Top-1 acc 56.641 (57.993)	Top-5 acc 80.078 (79.780)	lr 0.01514
Train [52][2790/3239]	Time 3.632 (0.835)	Data Time 3.374 (0.354)	Loss 2.7675 (2.7379)	Entropy 0.63616 (0.63511)	Top-1 acc 57.812 (57.995)	Top-5 acc 80.078 (79.782)	lr 0.01514
Train [52][2800/3239]	Time 2.119 (0.834)	Data Time 1.842 (0.353)	Loss 2.8011 (2.7382)	Entropy 0.63635 (0.63512)	Top-1 acc 55.078 (57.993)	Top-5 acc 79.688 (79.778)	lr 0.01514
Train [52][2810/3239]	Time 0.231 (0.839)	Data Time 0.001 (0.358)	Loss 2.6795 (2.7382)	Entropy 0.63577 (0.63512)	Top-1 acc 62.500 (57.989)	Top-5 acc 81.641 (79.774)	lr 0.01514
Train [52][2820/3239]	Time 0.246 (0.839)	Data Time 0.001 (0.358)	Loss 2.7959 (2.7382)	Entropy 0.63599 (0.63512)	Top-1 acc 57.812 (57.990)	Top-5 acc 78.125 (79.773)	lr 0.01514
Train [52][2830/3239]	Time 0.229 (0.839)	Data Time 0.001 (0.359)	Loss 2.6054 (2.7382)	Entropy 0.63585 (0.63513)	Top-1 acc 60.156 (57.991)	Top-5 acc 82.812 (79.772)	lr 0.01514
Train [52][2840/3239]	Time 0.275 (0.842)	Data Time 0.001 (0.361)	Loss 2.8119 (2.7384)	Entropy 0.63582 (0.63513)	Top-1 acc 57.812 (57.990)	Top-5 acc 78.516 (79.769)	lr 0.01514
Train [52][2850/3239]	Time 0.224 (0.843)	Data Time 0.001 (0.363)	Loss 2.6772 (2.7384)	Entropy 0.63570 (0.63513)	Top-1 acc 58.594 (57.989)	Top-5 acc 81.250 (79.769)	lr 0.01514
Train [52][2860/3239]	Time 0.266 (0.845)	Data Time 0.002 (0.365)	Loss 2.8626 (2.7386)	Entropy 0.63553 (0.63513)	Top-1 acc 50.391 (57.978)	Top-5 acc 78.125 (79.765)	lr 0.01514
Train [52][2870/3239]	Time 0.239 (0.845)	Data Time 0.001 (0.366)	Loss 2.6399 (2.7384)	Entropy 0.63598 (0.63513)	Top-1 acc 59.375 (57.981)	Top-5 acc 82.812 (79.768)	lr 0.01514
Train [52][2880/3239]	Time 0.275 (0.846)	Data Time 0.001 (0.367)	Loss 2.7338 (2.7385)	Entropy 0.63633 (0.63514)	Top-1 acc 59.375 (57.979)	Top-5 acc 80.859 (79.765)	lr 0.01513
Train [52][2890/3239]	Time 0.242 (0.849)	Data Time 0.001 (0.370)	Loss 3.0120 (2.7382)	Entropy 0.63663 (0.63514)	Top-1 acc 50.391 (57.984)	Top-5 acc 75.000 (79.772)	lr 0.01513
Train [52][2900/3239]	Time 0.248 (0.850)	Data Time 0.001 (0.371)	Loss 2.5774 (2.7382)	Entropy 0.63639 (0.63515)	Top-1 acc 66.406 (57.981)	Top-5 acc 82.422 (79.772)	lr 0.01513
Train [52][2910/3239]	Time 1.834 (0.851)	Data Time 1.475 (0.372)	Loss 2.6597 (2.7383)	Entropy 0.63635 (0.63515)	Top-1 acc 58.203 (57.976)	Top-5 acc 81.641 (79.771)	lr 0.01513
Train [52][2920/3239]	Time 0.238 (0.854)	Data Time 0.001 (0.376)	Loss 2.6647 (2.7384)	Entropy 0.63637 (0.63516)	Top-1 acc 60.547 (57.972)	Top-5 acc 83.594 (79.771)	lr 0.01513
Train [52][2930/3239]	Time 0.271 (0.853)	Data Time 0.001 (0.375)	Loss 2.8628 (2.7387)	Entropy 0.63619 (0.63516)	Top-1 acc 55.859 (57.961)	Top-5 acc 78.516 (79.766)	lr 0.01513
Train [52][2940/3239]	Time 0.278 (0.854)	Data Time 0.022 (0.376)	Loss 2.8149 (2.7385)	Entropy 0.63625 (0.63516)	Top-1 acc 56.641 (57.966)	Top-5 acc 79.297 (79.770)	lr 0.01513
Train [52][2950/3239]	Time 7.397 (0.859)	Data Time 7.133 (0.381)	Loss 2.7724 (2.7385)	Entropy 0.63650 (0.63517)	Top-1 acc 53.516 (57.965)	Top-5 acc 80.859 (79.767)	lr 0.01513
Train [52][2960/3239]	Time 1.532 (0.858)	Data Time 1.249 (0.380)	Loss 2.6388 (2.7383)	Entropy 0.63633 (0.63517)	Top-1 acc 60.156 (57.969)	Top-5 acc 79.688 (79.770)	lr 0.01513
Train [52][2970/3239]	Time 0.235 (0.858)	Data Time 0.001 (0.381)	Loss 2.8725 (2.7383)	Entropy 0.63667 (0.63518)	Top-1 acc 55.469 (57.968)	Top-5 acc 75.781 (79.769)	lr 0.01513
Train [52][2980/3239]	Time 0.331 (0.862)	Data Time 0.001 (0.385)	Loss 2.6308 (2.7382)	Entropy 0.63688 (0.63518)	Top-1 acc 58.594 (57.969)	Top-5 acc 81.250 (79.770)	lr 0.01512
Train [52][2990/3239]	Time 0.234 (0.863)	Data Time 0.001 (0.386)	Loss 2.6851 (2.7381)	Entropy 0.63684 (0.63519)	Top-1 acc 58.984 (57.968)	Top-5 acc 81.250 (79.774)	lr 0.01512
Train [52][3000/3239]	Time 0.243 (0.863)	Data Time 0.001 (0.386)	Loss 2.6391 (2.7379)	Entropy 0.63698 (0.63519)	Top-1 acc 58.594 (57.970)	Top-5 acc 83.594 (79.777)	lr 0.01512
Train [52][3010/3239]	Time 0.219 (0.867)	Data Time 0.001 (0.390)	Loss 2.7921 (2.7383)	Entropy 0.63726 (0.63520)	Top-1 acc 56.641 (57.963)	Top-5 acc 78.516 (79.769)	lr 0.01512
Train [52][3020/3239]	Time 0.250 (0.868)	Data Time 0.001 (0.391)	Loss 2.8050 (2.7383)	Entropy 0.63687 (0.63520)	Top-1 acc 55.469 (57.964)	Top-5 acc 80.859 (79.768)	lr 0.01512
Train [52][3030/3239]	Time 0.238 (0.867)	Data Time 0.001 (0.391)	Loss 2.5901 (2.7379)	Entropy 0.63655 (0.63521)	Top-1 acc 55.469 (57.969)	Top-5 acc 82.031 (79.773)	lr 0.01512
Train [52][3040/3239]	Time 0.226 (0.867)	Data Time 0.001 (0.391)	Loss 2.8922 (2.7382)	Entropy 0.63707 (0.63521)	Top-1 acc 53.906 (57.964)	Top-5 acc 75.781 (79.770)	lr 0.01512
Train [52][3050/3239]	Time 0.244 (0.871)	Data Time 0.001 (0.395)	Loss 2.5829 (2.7383)	Entropy 0.63720 (0.63522)	Top-1 acc 63.672 (57.960)	Top-5 acc 84.375 (79.770)	lr 0.01512
Train [52][3060/3239]	Time 0.230 (0.873)	Data Time 0.001 (0.397)	Loss 2.6214 (2.7381)	Entropy 0.63710 (0.63523)	Top-1 acc 61.719 (57.968)	Top-5 acc 81.641 (79.774)	lr 0.01512
Train [52][3070/3239]	Time 0.363 (0.884)	Data Time 0.003 (0.396)	Loss 2.6315 (2.7381)	Entropy 0.63703 (0.63523)	Top-1 acc 60.547 (57.967)	Top-5 acc 82.031 (79.776)	lr 0.01512
Train [52][3080/3239]	Time 0.248 (0.882)	Data Time 0.002 (0.395)	Loss 2.5849 (2.7379)	Entropy 0.63715 (0.63524)	Top-1 acc 62.891 (57.969)	Top-5 acc 82.422 (79.780)	lr 0.01511
Train [52][3090/3239]	Time 0.252 (0.881)	Data Time 0.002 (0.393)	Loss 2.9014 (2.7379)	Entropy 0.63704 (0.63524)	Top-1 acc 55.078 (57.967)	Top-5 acc 76.953 (79.781)	lr 0.01511
Train [52][3100/3239]	Time 0.233 (0.879)	Data Time 0.001 (0.392)	Loss 2.6712 (2.7379)	Entropy 0.63724 (0.63525)	Top-1 acc 60.156 (57.968)	Top-5 acc 79.688 (79.781)	lr 0.01511
Train [52][3110/3239]	Time 1.845 (0.880)	Data Time 1.584 (0.393)	Loss 2.7613 (2.7381)	Entropy 0.63722 (0.63526)	Top-1 acc 60.938 (57.965)	Top-5 acc 76.953 (79.777)	lr 0.01511
Train [52][3120/3239]	Time 3.694 (0.882)	Data Time 3.390 (0.395)	Loss 2.6110 (2.7382)	Entropy 0.63729 (0.63526)	Top-1 acc 59.375 (57.961)	Top-5 acc 83.594 (79.774)	lr 0.01511
Train [52][3130/3239]	Time 0.250 (0.882)	Data Time 0.001 (0.395)	Loss 2.8687 (2.7381)	Entropy 0.63712 (0.63527)	Top-1 acc 57.422 (57.967)	Top-5 acc 79.297 (79.773)	lr 0.01511
Train [52][3140/3239]	Time 2.375 (0.884)	Data Time 2.023 (0.397)	Loss 2.9375 (2.7383)	Entropy 0.63687 (0.63528)	Top-1 acc 57.031 (57.964)	Top-5 acc 74.609 (79.775)	lr 0.01511
Train [52][3150/3239]	Time 0.310 (0.887)	Data Time 0.001 (0.401)	Loss 2.5955 (2.7382)	Entropy 0.63670 (0.63528)	Top-1 acc 61.328 (57.963)	Top-5 acc 82.422 (79.776)	lr 0.01511
Train [52][3160/3239]	Time 0.236 (0.886)	Data Time 0.001 (0.400)	Loss 2.6582 (2.7381)	Entropy 0.63672 (0.63529)	Top-1 acc 60.156 (57.961)	Top-5 acc 84.766 (79.778)	lr 0.01511
Train [52][3170/3239]	Time 0.238 (0.888)	Data Time 0.001 (0.402)	Loss 2.6970 (2.7381)	Entropy 0.63673 (0.63529)	Top-1 acc 57.812 (57.963)	Top-5 acc 83.203 (79.782)	lr 0.01511
Train [52][3180/3239]	Time 0.254 (0.892)	Data Time 0.000 (0.406)	Loss 2.5918 (2.7379)	Entropy 0.63650 (0.63529)	Top-1 acc 64.453 (57.969)	Top-5 acc 82.031 (79.786)	lr 0.01510
Train [52][3190/3239]	Time 0.238 (0.891)	Data Time 0.000 (0.406)	Loss 2.5610 (2.7380)	Entropy 0.63588 (0.63530)	Top-1 acc 61.328 (57.968)	Top-5 acc 81.250 (79.783)	lr 0.01510
Train [52][3200/3239]	Time 0.257 (0.892)	Data Time 0.000 (0.406)	Loss 2.8087 (2.7381)	Entropy 0.63584 (0.63530)	Top-1 acc 52.344 (57.967)	Top-5 acc 78.125 (79.781)	lr 0.01510
Train [52][3210/3239]	Time 0.237 (0.894)	Data Time 0.000 (0.409)	Loss 2.5388 (2.7382)	Entropy 0.63574 (0.63530)	Top-1 acc 64.062 (57.966)	Top-5 acc 80.469 (79.780)	lr 0.01510
Train [52][3220/3239]	Time 0.225 (0.895)	Data Time 0.000 (0.409)	Loss 2.5381 (2.7379)	Entropy 0.63561 (0.63530)	Top-1 acc 64.062 (57.969)	Top-5 acc 80.859 (79.784)	lr 0.01510
Train [52][3230/3239]	Time 5.258 (0.895)	Data Time 4.908 (0.410)	Loss 2.5823 (2.7379)	Entropy 0.63569 (0.63530)	Top-1 acc 62.500 (57.969)	Top-5 acc 82.422 (79.784)	lr 0.01510
Train [52][3239/3239]	Time 1.063 (0.896)	Data Time 0.000 (0.411)	Loss 2.7496 (2.7379)	Entropy 0.63576 (0.63530)	Top-1 acc 55.556 (57.970)	Top-5 acc 82.716 (79.785)	lr 0.01510
==========Valid [52/120]	loss 1.483	top-1 acc 65.988 (66.027)	top-5 acc 86.392	Train top-1 57.970	top-5 79.785	Entropy 0.63576	Latency-None: 0.000ms	Flops: 538.40M
Train [53][0/3239]	Time 46.210 (46.210)	Data Time 45.197 (45.197)	Loss 2.8329 (2.8329)	Entropy 0.63558 (0.63558)	Top-1 acc 55.469 (55.469)	Top-5 acc 77.344 (77.344)	lr 0.01510
Train [53][10/3239]	Time 0.230 (4.636)	Data Time 0.001 (4.124)	Loss 2.8834 (2.7539)	Entropy 0.63547 (0.63556)	Top-1 acc 56.250 (57.067)	Top-5 acc 77.734 (79.261)	lr 0.01510
Train [53][20/3239]	Time 0.257 (2.652)	Data Time 0.001 (2.161)	Loss 2.7470 (2.7621)	Entropy 0.63554 (0.63553)	Top-1 acc 57.812 (57.403)	Top-5 acc 78.906 (79.036)	lr 0.01510
Train [53][30/3239]	Time 0.238 (1.957)	Data Time 0.001 (1.465)	Loss 2.6370 (2.7327)	Entropy 0.63522 (0.63553)	Top-1 acc 63.281 (58.216)	Top-5 acc 82.422 (79.688)	lr 0.01510
Train [53][40/3239]	Time 0.245 (1.629)	Data Time 0.001 (1.143)	Loss 2.8881 (2.7360)	Entropy 0.63531 (0.63546)	Top-1 acc 56.641 (58.070)	Top-5 acc 75.781 (79.697)	lr 0.01509
Train [53][50/3239]	Time 0.261 (1.395)	Data Time 0.002 (0.920)	Loss 2.5685 (2.7322)	Entropy 0.63502 (0.63541)	Top-1 acc 60.156 (58.218)	Top-5 acc 84.766 (79.841)	lr 0.01509
Train [53][60/3239]	Time 0.412 (1.245)	Data Time 0.007 (0.769)	Loss 2.6941 (2.7226)	Entropy 0.63505 (0.63534)	Top-1 acc 58.203 (58.440)	Top-5 acc 82.031 (80.053)	lr 0.01509
Train [53][70/3239]	Time 0.267 (1.206)	Data Time 0.001 (0.729)	Loss 2.7270 (2.7211)	Entropy 0.63522 (0.63531)	Top-1 acc 58.984 (58.407)	Top-5 acc 79.297 (79.985)	lr 0.01509
Train [53][80/3239]	Time 0.258 (1.112)	Data Time 0.002 (0.639)	Loss 2.8382 (2.7197)	Entropy 0.63488 (0.63529)	Top-1 acc 53.516 (58.488)	Top-5 acc 79.297 (80.006)	lr 0.01509
Train [53][90/3239]	Time 0.266 (1.046)	Data Time 0.001 (0.569)	Loss 2.7467 (2.7182)	Entropy 0.63451 (0.63524)	Top-1 acc 57.812 (58.521)	Top-5 acc 79.297 (80.001)	lr 0.01509
Train [53][100/3239]	Time 0.243 (0.987)	Data Time 0.001 (0.513)	Loss 2.7368 (2.7232)	Entropy 0.63450 (0.63517)	Top-1 acc 58.984 (58.385)	Top-5 acc 78.516 (79.943)	lr 0.01509
Train [53][110/3239]	Time 0.249 (0.946)	Data Time 0.002 (0.475)	Loss 2.8014 (2.7250)	Entropy 0.63439 (0.63512)	Top-1 acc 56.641 (58.340)	Top-5 acc 78.125 (79.892)	lr 0.01509
Train [53][120/3239]	Time 0.279 (0.906)	Data Time 0.003 (0.436)	Loss 2.8013 (2.7280)	Entropy 0.63458 (0.63506)	Top-1 acc 64.062 (58.342)	Top-5 acc 78.125 (79.813)	lr 0.01509
Train [53][130/3239]	Time 0.390 (0.876)	Data Time 0.002 (0.403)	Loss 2.7337 (2.7311)	Entropy 0.63441 (0.63502)	Top-1 acc 53.516 (58.155)	Top-5 acc 80.469 (79.741)	lr 0.01509
Train [53][140/3239]	Time 0.242 (0.849)	Data Time 0.001 (0.377)	Loss 2.6838 (2.7303)	Entropy 0.63445 (0.63498)	Top-1 acc 58.594 (58.228)	Top-5 acc 83.594 (79.801)	lr 0.01509
Train [53][150/3239]	Time 0.270 (0.822)	Data Time 0.002 (0.352)	Loss 2.7040 (2.7224)	Entropy 0.63461 (0.63494)	Top-1 acc 56.641 (58.423)	Top-5 acc 80.469 (79.962)	lr 0.01508
Train [53][160/3239]	Time 0.243 (0.802)	Data Time 0.002 (0.330)	Loss 2.7065 (2.7232)	Entropy 0.63453 (0.63492)	Top-1 acc 55.078 (58.324)	Top-5 acc 81.250 (79.979)	lr 0.01508
Train [53][170/3239]	Time 0.280 (0.799)	Data Time 0.001 (0.330)	Loss 2.9466 (2.7260)	Entropy 0.63478 (0.63490)	Top-1 acc 53.125 (58.274)	Top-5 acc 74.609 (79.955)	lr 0.01508
Train [53][180/3239]	Time 0.243 (0.779)	Data Time 0.001 (0.312)	Loss 2.8190 (2.7296)	Entropy 0.63505 (0.63490)	Top-1 acc 55.078 (58.203)	Top-5 acc 75.391 (79.875)	lr 0.01508
Train [53][190/3239]	Time 0.245 (0.763)	Data Time 0.001 (0.296)	Loss 2.7908 (2.7310)	Entropy 0.63497 (0.63491)	Top-1 acc 55.469 (58.158)	Top-5 acc 78.125 (79.908)	lr 0.01508
Train [53][200/3239]	Time 1.750 (0.755)	Data Time 1.501 (0.289)	Loss 2.7712 (2.7271)	Entropy 0.63494 (0.63491)	Top-1 acc 58.594 (58.281)	Top-5 acc 80.859 (80.047)	lr 0.01508
Train [53][210/3239]	Time 0.243 (0.740)	Data Time 0.001 (0.275)	Loss 2.5304 (2.7289)	Entropy 0.63490 (0.63492)	Top-1 acc 60.547 (58.172)	Top-5 acc 85.938 (80.047)	lr 0.01508
Train [53][220/3239]	Time 0.349 (0.727)	Data Time 0.001 (0.263)	Loss 2.9591 (2.7291)	Entropy 0.63507 (0.63492)	Top-1 acc 52.734 (58.150)	Top-5 acc 75.000 (80.037)	lr 0.01508
Train [53][230/3239]	Time 0.270 (0.715)	Data Time 0.001 (0.251)	Loss 2.9309 (2.7294)	Entropy 0.63523 (0.63493)	Top-1 acc 51.953 (58.130)	Top-5 acc 77.344 (80.076)	lr 0.01508
Train [53][240/3239]	Time 0.224 (0.715)	Data Time 0.001 (0.252)	Loss 2.8777 (2.7301)	Entropy 0.63541 (0.63495)	Top-1 acc 54.297 (58.096)	Top-5 acc 77.344 (80.031)	lr 0.01508
Train [53][250/3239]	Time 0.237 (0.706)	Data Time 0.001 (0.242)	Loss 2.6826 (2.7299)	Entropy 0.63565 (0.63497)	Top-1 acc 58.984 (58.082)	Top-5 acc 80.469 (80.007)	lr 0.01507
Train [53][260/3239]	Time 0.260 (0.696)	Data Time 0.002 (0.233)	Loss 2.9305 (2.7313)	Entropy 0.63578 (0.63500)	Top-1 acc 54.297 (58.025)	Top-5 acc 78.125 (79.981)	lr 0.01507
Train [53][270/3239]	Time 0.263 (0.687)	Data Time 0.001 (0.225)	Loss 2.4696 (2.7298)	Entropy 0.63555 (0.63502)	Top-1 acc 61.328 (58.040)	Top-5 acc 85.156 (80.033)	lr 0.01507
Train [53][280/3239]	Time 0.272 (0.679)	Data Time 0.001 (0.217)	Loss 2.6085 (2.7276)	Entropy 0.63527 (0.63504)	Top-1 acc 64.062 (58.132)	Top-5 acc 80.859 (80.088)	lr 0.01507
Train [53][290/3239]	Time 0.400 (0.672)	Data Time 0.002 (0.209)	Loss 2.9127 (2.7266)	Entropy 0.63521 (0.63505)	Top-1 acc 55.469 (58.129)	Top-5 acc 79.688 (80.124)	lr 0.01507
Train [53][300/3239]	Time 0.289 (0.680)	Data Time 0.001 (0.217)	Loss 2.5069 (2.7261)	Entropy 0.63517 (0.63506)	Top-1 acc 64.062 (58.128)	Top-5 acc 85.156 (80.149)	lr 0.01507
Train [53][310/3239]	Time 0.242 (0.672)	Data Time 0.001 (0.211)	Loss 2.5515 (2.7265)	Entropy 0.63540 (0.63507)	Top-1 acc 62.500 (58.106)	Top-5 acc 85.156 (80.153)	lr 0.01507
Train [53][320/3239]	Time 0.256 (0.666)	Data Time 0.001 (0.204)	Loss 2.8413 (2.7259)	Entropy 0.63551 (0.63508)	Top-1 acc 56.641 (58.108)	Top-5 acc 77.734 (80.150)	lr 0.01507
Train [53][330/3239]	Time 0.227 (0.659)	Data Time 0.001 (0.198)	Loss 2.6915 (2.7235)	Entropy 0.63555 (0.63509)	Top-1 acc 56.250 (58.161)	Top-5 acc 80.078 (80.186)	lr 0.01507
Train [53][340/3239]	Time 0.263 (0.655)	Data Time 0.001 (0.194)	Loss 2.5461 (2.7232)	Entropy 0.63542 (0.63510)	Top-1 acc 65.625 (58.179)	Top-5 acc 83.203 (80.164)	lr 0.01507
Train [53][350/3239]	Time 0.243 (0.650)	Data Time 0.001 (0.189)	Loss 2.6437 (2.7238)	Entropy 0.63545 (0.63511)	Top-1 acc 59.766 (58.155)	Top-5 acc 80.469 (80.145)	lr 0.01506
Train [53][360/3239]	Time 1.039 (0.646)	Data Time 0.692 (0.185)	Loss 2.6055 (2.7226)	Entropy 0.63536 (0.63512)	Top-1 acc 60.547 (58.203)	Top-5 acc 84.375 (80.163)	lr 0.01506
Train [53][370/3239]	Time 0.276 (0.641)	Data Time 0.002 (0.181)	Loss 2.6589 (2.7200)	Entropy 0.63516 (0.63513)	Top-1 acc 57.031 (58.256)	Top-5 acc 82.422 (80.234)	lr 0.01506
Train [53][380/3239]	Time 0.251 (0.636)	Data Time 0.001 (0.176)	Loss 2.5882 (2.7193)	Entropy 0.63531 (0.63513)	Top-1 acc 62.500 (58.274)	Top-5 acc 84.766 (80.247)	lr 0.01506
Train [53][390/3239]	Time 0.312 (0.634)	Data Time 0.001 (0.172)	Loss 2.8897 (2.7184)	Entropy 0.63564 (0.63514)	Top-1 acc 52.344 (58.312)	Top-5 acc 76.953 (80.264)	lr 0.01506
Train [53][400/3239]	Time 0.247 (0.630)	Data Time 0.001 (0.168)	Loss 2.8925 (2.7180)	Entropy 0.63578 (0.63515)	Top-1 acc 52.344 (58.327)	Top-5 acc 73.828 (80.251)	lr 0.01506
Train [53][410/3239]	Time 0.263 (0.626)	Data Time 0.002 (0.164)	Loss 2.7193 (2.7193)	Entropy 0.63581 (0.63517)	Top-1 acc 54.688 (58.296)	Top-5 acc 80.469 (80.226)	lr 0.01506
Train [53][420/3239]	Time 0.247 (0.622)	Data Time 0.001 (0.160)	Loss 2.6753 (2.7189)	Entropy 0.63548 (0.63518)	Top-1 acc 62.500 (58.338)	Top-5 acc 78.516 (80.209)	lr 0.01506
Train [53][430/3239]	Time 0.237 (0.621)	Data Time 0.001 (0.160)	Loss 2.6832 (2.7195)	Entropy 0.63559 (0.63519)	Top-1 acc 63.281 (58.345)	Top-5 acc 80.078 (80.194)	lr 0.01506
Train [53][440/3239]	Time 0.266 (0.617)	Data Time 0.001 (0.156)	Loss 2.7834 (2.7212)	Entropy 0.63579 (0.63520)	Top-1 acc 57.422 (58.307)	Top-5 acc 79.297 (80.157)	lr 0.01506
Train [53][450/3239]	Time 0.423 (0.617)	Data Time 0.003 (0.156)	Loss 2.7083 (2.7203)	Entropy 0.63612 (0.63521)	Top-1 acc 58.594 (58.320)	Top-5 acc 81.641 (80.177)	lr 0.01505
Train [53][460/3239]	Time 0.259 (0.623)	Data Time 0.001 (0.163)	Loss 2.9296 (2.7191)	Entropy 0.63603 (0.63523)	Top-1 acc 55.469 (58.354)	Top-5 acc 73.438 (80.171)	lr 0.01505
Train [53][470/3239]	Time 0.243 (0.620)	Data Time 0.001 (0.159)	Loss 3.0123 (2.7205)	Entropy 0.63638 (0.63525)	Top-1 acc 50.781 (58.316)	Top-5 acc 75.391 (80.145)	lr 0.01505
Train [53][480/3239]	Time 0.364 (0.692)	Data Time 0.007 (0.156)	Loss 2.8506 (2.7199)	Entropy 0.63639 (0.63527)	Top-1 acc 60.547 (58.367)	Top-5 acc 78.906 (80.157)	lr 0.01505
Train [53][490/3239]	Time 0.236 (0.687)	Data Time 0.002 (0.153)	Loss 2.8484 (2.7207)	Entropy 0.63629 (0.63530)	Top-1 acc 56.641 (58.340)	Top-5 acc 75.781 (80.130)	lr 0.01505
Train [53][500/3239]	Time 0.241 (0.682)	Data Time 0.002 (0.150)	Loss 2.7049 (2.7217)	Entropy 0.63644 (0.63532)	Top-1 acc 58.984 (58.318)	Top-5 acc 80.469 (80.105)	lr 0.01505
Train [53][510/3239]	Time 0.254 (0.677)	Data Time 0.001 (0.147)	Loss 2.7130 (2.7226)	Entropy 0.63659 (0.63534)	Top-1 acc 58.594 (58.293)	Top-5 acc 80.469 (80.097)	lr 0.01505
Train [53][520/3239]	Time 0.391 (0.673)	Data Time 0.001 (0.144)	Loss 2.7444 (2.7223)	Entropy 0.63635 (0.63536)	Top-1 acc 55.469 (58.309)	Top-5 acc 79.297 (80.107)	lr 0.01505
Train [53][530/3239]	Time 0.273 (0.669)	Data Time 0.003 (0.142)	Loss 2.6695 (2.7216)	Entropy 0.63606 (0.63538)	Top-1 acc 59.375 (58.328)	Top-5 acc 80.469 (80.113)	lr 0.01505
Train [53][540/3239]	Time 0.246 (0.664)	Data Time 0.003 (0.139)	Loss 2.6934 (2.7209)	Entropy 0.63601 (0.63539)	Top-1 acc 62.109 (58.340)	Top-5 acc 80.078 (80.116)	lr 0.01505
Train [53][550/3239]	Time 0.239 (0.661)	Data Time 0.001 (0.137)	Loss 2.7127 (2.7222)	Entropy 0.63568 (0.63540)	Top-1 acc 55.078 (58.298)	Top-5 acc 79.297 (80.094)	lr 0.01504
Train [53][560/3239]	Time 0.263 (0.657)	Data Time 0.002 (0.134)	Loss 2.6136 (2.7227)	Entropy 0.63562 (0.63541)	Top-1 acc 61.328 (58.312)	Top-5 acc 82.812 (80.080)	lr 0.01504
Train [53][570/3239]	Time 0.241 (0.653)	Data Time 0.001 (0.132)	Loss 2.8568 (2.7237)	Entropy 0.63585 (0.63541)	Top-1 acc 57.812 (58.312)	Top-5 acc 78.906 (80.053)	lr 0.01504
Train [53][580/3239]	Time 0.325 (0.650)	Data Time 0.002 (0.130)	Loss 2.7566 (2.7238)	Entropy 0.63564 (0.63542)	Top-1 acc 55.078 (58.310)	Top-5 acc 78.906 (80.059)	lr 0.01504
Train [53][590/3239]	Time 0.245 (0.647)	Data Time 0.001 (0.127)	Loss 2.7978 (2.7247)	Entropy 0.63558 (0.63542)	Top-1 acc 57.422 (58.300)	Top-5 acc 78.906 (80.033)	lr 0.01504
Train [53][600/3239]	Time 0.259 (0.643)	Data Time 0.002 (0.125)	Loss 2.5694 (2.7239)	Entropy 0.63576 (0.63543)	Top-1 acc 60.938 (58.318)	Top-5 acc 85.156 (80.051)	lr 0.01504
Train [53][610/3239]	Time 2.916 (0.645)	Data Time 2.549 (0.127)	Loss 2.6843 (2.7247)	Entropy 0.63530 (0.63543)	Top-1 acc 56.250 (58.301)	Top-5 acc 81.641 (80.049)	lr 0.01504
Train [53][620/3239]	Time 0.267 (0.645)	Data Time 0.001 (0.129)	Loss 2.7456 (2.7248)	Entropy 0.63524 (0.63542)	Top-1 acc 59.375 (58.298)	Top-5 acc 80.859 (80.050)	lr 0.01504
Train [53][630/3239]	Time 0.265 (0.646)	Data Time 0.001 (0.132)	Loss 2.7098 (2.7244)	Entropy 0.63530 (0.63542)	Top-1 acc 59.766 (58.311)	Top-5 acc 80.078 (80.059)	lr 0.01504
Train [53][640/3239]	Time 0.256 (0.643)	Data Time 0.001 (0.130)	Loss 2.6823 (2.7244)	Entropy 0.63511 (0.63542)	Top-1 acc 58.594 (58.306)	Top-5 acc 80.078 (80.072)	lr 0.01504
Train [53][650/3239]	Time 0.287 (0.644)	Data Time 0.001 (0.131)	Loss 2.6257 (2.7247)	Entropy 0.63519 (0.63542)	Top-1 acc 60.938 (58.279)	Top-5 acc 83.203 (80.068)	lr 0.01503
Train [53][660/3239]	Time 0.234 (0.645)	Data Time 0.001 (0.133)	Loss 2.8120 (2.7248)	Entropy 0.63489 (0.63541)	Top-1 acc 57.031 (58.278)	Top-5 acc 75.781 (80.060)	lr 0.01503
Train [53][670/3239]	Time 0.252 (0.642)	Data Time 0.001 (0.131)	Loss 2.5397 (2.7245)	Entropy 0.63473 (0.63540)	Top-1 acc 61.328 (58.281)	Top-5 acc 86.719 (80.075)	lr 0.01503
Train [53][680/3239]	Time 0.356 (0.647)	Data Time 0.001 (0.137)	Loss 2.6330 (2.7238)	Entropy 0.63483 (0.63539)	Top-1 acc 60.156 (58.289)	Top-5 acc 81.250 (80.090)	lr 0.01503
Train [53][690/3239]	Time 0.252 (0.645)	Data Time 0.002 (0.136)	Loss 2.6760 (2.7243)	Entropy 0.63482 (0.63538)	Top-1 acc 58.203 (58.285)	Top-5 acc 81.641 (80.079)	lr 0.01503
Train [53][700/3239]	Time 0.360 (0.644)	Data Time 0.001 (0.135)	Loss 2.8186 (2.7241)	Entropy 0.63522 (0.63538)	Top-1 acc 58.203 (58.299)	Top-5 acc 80.859 (80.071)	lr 0.01503
Train [53][710/3239]	Time 0.251 (0.643)	Data Time 0.001 (0.136)	Loss 2.6101 (2.7236)	Entropy 0.63547 (0.63538)	Top-1 acc 60.938 (58.315)	Top-5 acc 82.422 (80.080)	lr 0.01503
Train [53][720/3239]	Time 0.248 (0.644)	Data Time 0.001 (0.138)	Loss 2.6342 (2.7225)	Entropy 0.63550 (0.63538)	Top-1 acc 60.156 (58.348)	Top-5 acc 81.641 (80.104)	lr 0.01503
Train [53][730/3239]	Time 0.262 (0.643)	Data Time 0.001 (0.136)	Loss 2.7008 (2.7217)	Entropy 0.63505 (0.63538)	Top-1 acc 61.719 (58.351)	Top-5 acc 79.297 (80.123)	lr 0.01503
Train [53][740/3239]	Time 0.253 (0.644)	Data Time 0.001 (0.138)	Loss 2.7079 (2.7214)	Entropy 0.63539 (0.63537)	Top-1 acc 59.375 (58.367)	Top-5 acc 77.734 (80.125)	lr 0.01503
Train [53][750/3239]	Time 0.253 (0.645)	Data Time 0.001 (0.139)	Loss 2.7108 (2.7214)	Entropy 0.63562 (0.63538)	Top-1 acc 59.766 (58.375)	Top-5 acc 78.906 (80.115)	lr 0.01502
Train [53][760/3239]	Time 0.259 (0.642)	Data Time 0.001 (0.138)	Loss 2.6963 (2.7220)	Entropy 0.63586 (0.63538)	Top-1 acc 57.812 (58.354)	Top-5 acc 82.031 (80.116)	lr 0.01502
Train [53][770/3239]	Time 0.428 (0.651)	Data Time 0.001 (0.146)	Loss 2.7183 (2.7219)	Entropy 0.63581 (0.63539)	Top-1 acc 57.031 (58.355)	Top-5 acc 81.641 (80.123)	lr 0.01502
Train [53][780/3239]	Time 0.338 (0.648)	Data Time 0.100 (0.144)	Loss 2.7081 (2.7230)	Entropy 0.63626 (0.63539)	Top-1 acc 55.469 (58.326)	Top-5 acc 81.641 (80.108)	lr 0.01502
Train [53][790/3239]	Time 0.233 (0.645)	Data Time 0.001 (0.143)	Loss 2.6650 (2.7232)	Entropy 0.63624 (0.63541)	Top-1 acc 59.375 (58.330)	Top-5 acc 82.422 (80.105)	lr 0.01502
Train [53][800/3239]	Time 0.272 (0.652)	Data Time 0.001 (0.150)	Loss 2.6299 (2.7224)	Entropy 0.63612 (0.63542)	Top-1 acc 60.547 (58.351)	Top-5 acc 78.906 (80.118)	lr 0.01502
Train [53][810/3239]	Time 0.250 (0.650)	Data Time 0.001 (0.149)	Loss 2.8466 (2.7223)	Entropy 0.63626 (0.63543)	Top-1 acc 52.344 (58.353)	Top-5 acc 79.688 (80.121)	lr 0.01502
Train [53][820/3239]	Time 0.243 (0.647)	Data Time 0.001 (0.147)	Loss 2.9239 (2.7228)	Entropy 0.63648 (0.63544)	Top-1 acc 50.391 (58.343)	Top-5 acc 77.734 (80.106)	lr 0.01502
Train [53][830/3239]	Time 0.223 (0.645)	Data Time 0.001 (0.145)	Loss 2.8585 (2.7227)	Entropy 0.63657 (0.63545)	Top-1 acc 57.031 (58.343)	Top-5 acc 81.250 (80.123)	lr 0.01502
Train [53][840/3239]	Time 0.329 (0.653)	Data Time 0.001 (0.154)	Loss 2.6837 (2.7227)	Entropy 0.63691 (0.63546)	Top-1 acc 60.938 (58.347)	Top-5 acc 80.469 (80.132)	lr 0.01502
Train [53][850/3239]	Time 0.234 (0.651)	Data Time 0.001 (0.152)	Loss 2.5438 (2.7230)	Entropy 0.63721 (0.63548)	Top-1 acc 64.062 (58.342)	Top-5 acc 82.812 (80.124)	lr 0.01501
Train [53][860/3239]	Time 0.230 (0.648)	Data Time 0.001 (0.151)	Loss 2.7173 (2.7227)	Entropy 0.63722 (0.63550)	Top-1 acc 58.984 (58.356)	Top-5 acc 80.078 (80.132)	lr 0.01501
Train [53][870/3239]	Time 0.247 (0.661)	Data Time 0.001 (0.164)	Loss 2.7586 (2.7226)	Entropy 0.63680 (0.63552)	Top-1 acc 60.156 (58.355)	Top-5 acc 80.859 (80.142)	lr 0.01501
Train [53][880/3239]	Time 0.245 (0.658)	Data Time 0.001 (0.163)	Loss 2.6794 (2.7230)	Entropy 0.63707 (0.63554)	Top-1 acc 58.203 (58.341)	Top-5 acc 79.297 (80.130)	lr 0.01501
Train [53][890/3239]	Time 0.238 (0.656)	Data Time 0.002 (0.161)	Loss 2.7650 (2.7229)	Entropy 0.63721 (0.63555)	Top-1 acc 57.422 (58.337)	Top-5 acc 79.297 (80.138)	lr 0.01501
Train [53][900/3239]	Time 0.231 (0.665)	Data Time 0.001 (0.171)	Loss 2.5901 (2.7233)	Entropy 0.63730 (0.63557)	Top-1 acc 58.203 (58.322)	Top-5 acc 82.812 (80.129)	lr 0.01501
Train [53][910/3239]	Time 0.238 (0.663)	Data Time 0.001 (0.169)	Loss 2.5589 (2.7233)	Entropy 0.63740 (0.63559)	Top-1 acc 63.281 (58.323)	Top-5 acc 81.250 (80.128)	lr 0.01501
Train [53][920/3239]	Time 0.233 (0.660)	Data Time 0.001 (0.167)	Loss 2.6800 (2.7229)	Entropy 0.63765 (0.63561)	Top-1 acc 60.547 (58.340)	Top-5 acc 81.641 (80.134)	lr 0.01501
Train [53][930/3239]	Time 0.253 (0.670)	Data Time 0.001 (0.178)	Loss 2.9408 (2.7225)	Entropy 0.63721 (0.63563)	Top-1 acc 54.688 (58.358)	Top-5 acc 76.172 (80.143)	lr 0.01501
Train [53][940/3239]	Time 0.247 (0.667)	Data Time 0.001 (0.176)	Loss 2.4447 (2.7226)	Entropy 0.63737 (0.63565)	Top-1 acc 67.188 (58.374)	Top-5 acc 84.375 (80.134)	lr 0.01501
Train [53][950/3239]	Time 0.242 (0.665)	Data Time 0.001 (0.174)	Loss 2.9310 (2.7229)	Entropy 0.63734 (0.63567)	Top-1 acc 53.906 (58.371)	Top-5 acc 75.391 (80.127)	lr 0.01500
Train [53][960/3239]	Time 0.241 (0.676)	Data Time 0.001 (0.186)	Loss 2.7399 (2.7229)	Entropy 0.63688 (0.63568)	Top-1 acc 60.156 (58.376)	Top-5 acc 76.562 (80.122)	lr 0.01500
Train [53][970/3239]	Time 0.257 (0.674)	Data Time 0.002 (0.184)	Loss 2.8039 (2.7227)	Entropy 0.63669 (0.63569)	Top-1 acc 51.953 (58.373)	Top-5 acc 79.297 (80.120)	lr 0.01500
Train [53][980/3239]	Time 0.281 (0.671)	Data Time 0.001 (0.182)	Loss 2.6863 (2.7227)	Entropy 0.63683 (0.63570)	Top-1 acc 59.766 (58.381)	Top-5 acc 80.078 (80.116)	lr 0.01500
Train [53][990/3239]	Time 0.260 (0.669)	Data Time 0.001 (0.180)	Loss 2.7411 (2.7237)	Entropy 0.63678 (0.63571)	Top-1 acc 58.984 (58.359)	Top-5 acc 78.906 (80.101)	lr 0.01500
Train [53][1000/3239]	Time 0.332 (0.678)	Data Time 0.001 (0.191)	Loss 2.6977 (2.7233)	Entropy 0.63729 (0.63573)	Top-1 acc 57.812 (58.374)	Top-5 acc 81.250 (80.110)	lr 0.01500
Train [53][1010/3239]	Time 0.231 (0.676)	Data Time 0.001 (0.189)	Loss 2.9143 (2.7230)	Entropy 0.63739 (0.63574)	Top-1 acc 57.422 (58.392)	Top-5 acc 76.953 (80.116)	lr 0.01500
Train [53][1020/3239]	Time 0.283 (0.674)	Data Time 0.001 (0.187)	Loss 2.6431 (2.7234)	Entropy 0.63743 (0.63576)	Top-1 acc 59.766 (58.371)	Top-5 acc 78.516 (80.106)	lr 0.01500
Train [53][1030/3239]	Time 0.234 (0.685)	Data Time 0.001 (0.198)	Loss 2.6373 (2.7229)	Entropy 0.63729 (0.63578)	Top-1 acc 62.891 (58.383)	Top-5 acc 81.641 (80.117)	lr 0.01500
Train [53][1040/3239]	Time 0.238 (0.682)	Data Time 0.001 (0.196)	Loss 2.6860 (2.7228)	Entropy 0.63734 (0.63579)	Top-1 acc 61.328 (58.381)	Top-5 acc 80.859 (80.121)	lr 0.01500
Train [53][1050/3239]	Time 0.237 (0.680)	Data Time 0.001 (0.194)	Loss 2.7577 (2.7227)	Entropy 0.63739 (0.63581)	Top-1 acc 57.422 (58.388)	Top-5 acc 79.297 (80.120)	lr 0.01500
Train [53][1060/3239]	Time 0.246 (0.688)	Data Time 0.001 (0.203)	Loss 2.6879 (2.7229)	Entropy 0.63754 (0.63582)	Top-1 acc 62.891 (58.391)	Top-5 acc 81.641 (80.123)	lr 0.01499
Train [53][1070/3239]	Time 0.316 (0.685)	Data Time 0.001 (0.201)	Loss 3.0591 (2.7232)	Entropy 0.63775 (0.63584)	Top-1 acc 51.172 (58.387)	Top-5 acc 73.047 (80.115)	lr 0.01499
Train [53][1080/3239]	Time 0.231 (0.683)	Data Time 0.001 (0.199)	Loss 2.8953 (2.7236)	Entropy 0.63765 (0.63586)	Top-1 acc 53.125 (58.385)	Top-5 acc 78.125 (80.105)	lr 0.01499
Train [53][1090/3239]	Time 0.236 (0.696)	Data Time 0.001 (0.213)	Loss 2.8713 (2.7232)	Entropy 0.63718 (0.63587)	Top-1 acc 55.859 (58.394)	Top-5 acc 78.906 (80.116)	lr 0.01499
Train [53][1100/3239]	Time 0.234 (0.694)	Data Time 0.001 (0.211)	Loss 2.7750 (2.7233)	Entropy 0.63686 (0.63588)	Top-1 acc 59.375 (58.392)	Top-5 acc 76.953 (80.111)	lr 0.01499
Train [53][1110/3239]	Time 0.248 (0.692)	Data Time 0.001 (0.210)	Loss 2.8251 (2.7236)	Entropy 0.63648 (0.63589)	Top-1 acc 53.906 (58.381)	Top-5 acc 78.125 (80.106)	lr 0.01499
Train [53][1120/3239]	Time 0.247 (0.700)	Data Time 0.001 (0.218)	Loss 2.9890 (2.7241)	Entropy 0.63629 (0.63589)	Top-1 acc 51.172 (58.369)	Top-5 acc 76.562 (80.102)	lr 0.01499
Train [53][1130/3239]	Time 0.246 (0.697)	Data Time 0.001 (0.217)	Loss 2.5090 (2.7241)	Entropy 0.63671 (0.63590)	Top-1 acc 62.891 (58.364)	Top-5 acc 80.859 (80.097)	lr 0.01499
Train [53][1140/3239]	Time 0.245 (0.726)	Data Time 0.002 (0.215)	Loss 2.8593 (2.7244)	Entropy 0.63700 (0.63590)	Top-1 acc 55.078 (58.351)	Top-5 acc 77.344 (80.083)	lr 0.01499
Train [53][1150/3239]	Time 0.241 (0.724)	Data Time 0.002 (0.213)	Loss 2.8843 (2.7247)	Entropy 0.63716 (0.63592)	Top-1 acc 57.812 (58.357)	Top-5 acc 75.391 (80.075)	lr 0.01499
Train [53][1160/3239]	Time 0.354 (0.721)	Data Time 0.002 (0.211)	Loss 2.6974 (2.7246)	Entropy 0.63732 (0.63593)	Top-1 acc 59.766 (58.363)	Top-5 acc 80.078 (80.074)	lr 0.01498
Train [53][1170/3239]	Time 0.257 (0.719)	Data Time 0.002 (0.209)	Loss 2.7288 (2.7249)	Entropy 0.63708 (0.63594)	Top-1 acc 58.984 (58.354)	Top-5 acc 80.078 (80.068)	lr 0.01498
Train [53][1180/3239]	Time 0.269 (0.716)	Data Time 0.002 (0.207)	Loss 2.7337 (2.7246)	Entropy 0.63721 (0.63595)	Top-1 acc 62.891 (58.369)	Top-5 acc 79.688 (80.073)	lr 0.01498
Train [53][1190/3239]	Time 0.262 (0.714)	Data Time 0.002 (0.206)	Loss 2.6975 (2.7248)	Entropy 0.63704 (0.63596)	Top-1 acc 58.984 (58.356)	Top-5 acc 78.516 (80.069)	lr 0.01498
Train [53][1200/3239]	Time 0.240 (0.713)	Data Time 0.001 (0.205)	Loss 2.7837 (2.7250)	Entropy 0.63651 (0.63596)	Top-1 acc 58.203 (58.356)	Top-5 acc 75.781 (80.063)	lr 0.01498
Train [53][1210/3239]	Time 0.787 (0.712)	Data Time 0.534 (0.205)	Loss 2.5735 (2.7250)	Entropy 0.63630 (0.63597)	Top-1 acc 60.547 (58.353)	Top-5 acc 85.156 (80.064)	lr 0.01498
Train [53][1220/3239]	Time 0.242 (0.709)	Data Time 0.002 (0.203)	Loss 2.7599 (2.7254)	Entropy 0.63640 (0.63597)	Top-1 acc 57.422 (58.344)	Top-5 acc 78.906 (80.048)	lr 0.01498
Train [53][1230/3239]	Time 0.347 (0.712)	Data Time 0.001 (0.207)	Loss 2.8991 (2.7259)	Entropy 0.63633 (0.63597)	Top-1 acc 56.250 (58.343)	Top-5 acc 77.734 (80.045)	lr 0.01498
Train [53][1240/3239]	Time 0.253 (0.720)	Data Time 0.001 (0.215)	Loss 2.6686 (2.7256)	Entropy 0.63644 (0.63598)	Top-1 acc 60.547 (58.347)	Top-5 acc 83.594 (80.054)	lr 0.01498
Train [53][1250/3239]	Time 0.254 (0.718)	Data Time 0.001 (0.213)	Loss 2.6172 (2.7255)	Entropy 0.63616 (0.63598)	Top-1 acc 62.891 (58.350)	Top-5 acc 84.766 (80.052)	lr 0.01498
Train [53][1260/3239]	Time 0.258 (0.716)	Data Time 0.001 (0.212)	Loss 2.7952 (2.7253)	Entropy 0.63606 (0.63598)	Top-1 acc 57.031 (58.363)	Top-5 acc 78.125 (80.055)	lr 0.01497
Train [53][1270/3239]	Time 0.278 (0.721)	Data Time 0.002 (0.218)	Loss 2.6612 (2.7248)	Entropy 0.63612 (0.63598)	Top-1 acc 61.328 (58.375)	Top-5 acc 81.641 (80.069)	lr 0.01497
Train [53][1280/3239]	Time 0.249 (0.720)	Data Time 0.001 (0.218)	Loss 2.7375 (2.7250)	Entropy 0.63620 (0.63598)	Top-1 acc 60.156 (58.378)	Top-5 acc 79.297 (80.065)	lr 0.01497
Train [53][1290/3239]	Time 0.246 (0.723)	Data Time 0.001 (0.221)	Loss 2.6292 (2.7246)	Entropy 0.63620 (0.63598)	Top-1 acc 61.719 (58.385)	Top-5 acc 81.641 (80.070)	lr 0.01497
Train [53][1300/3239]	Time 0.249 (0.727)	Data Time 0.001 (0.225)	Loss 2.7742 (2.7241)	Entropy 0.63627 (0.63599)	Top-1 acc 53.906 (58.390)	Top-5 acc 79.297 (80.085)	lr 0.01497
Train [53][1310/3239]	Time 0.243 (0.727)	Data Time 0.001 (0.225)	Loss 2.6673 (2.7243)	Entropy 0.63591 (0.63599)	Top-1 acc 59.766 (58.383)	Top-5 acc 80.469 (80.082)	lr 0.01497
Train [53][1320/3239]	Time 0.409 (0.725)	Data Time 0.003 (0.224)	Loss 2.8001 (2.7249)	Entropy 0.63589 (0.63599)	Top-1 acc 58.594 (58.374)	Top-5 acc 75.391 (80.069)	lr 0.01497
Train [53][1330/3239]	Time 0.235 (0.731)	Data Time 0.001 (0.230)	Loss 2.6865 (2.7246)	Entropy 0.63588 (0.63598)	Top-1 acc 58.984 (58.378)	Top-5 acc 79.688 (80.072)	lr 0.01497
Train [53][1340/3239]	Time 0.234 (0.731)	Data Time 0.001 (0.231)	Loss 2.6649 (2.7249)	Entropy 0.63601 (0.63598)	Top-1 acc 60.156 (58.369)	Top-5 acc 81.250 (80.063)	lr 0.01497
Train [53][1350/3239]	Time 3.983 (0.731)	Data Time 3.747 (0.232)	Loss 2.6195 (2.7248)	Entropy 0.63586 (0.63598)	Top-1 acc 60.547 (58.368)	Top-5 acc 83.594 (80.066)	lr 0.01497
Train [53][1360/3239]	Time 0.252 (0.737)	Data Time 0.001 (0.238)	Loss 2.7022 (2.7248)	Entropy 0.63571 (0.63598)	Top-1 acc 62.109 (58.375)	Top-5 acc 81.641 (80.064)	lr 0.01496
Train [53][1370/3239]	Time 0.272 (0.735)	Data Time 0.002 (0.236)	Loss 2.5713 (2.7254)	Entropy 0.63571 (0.63598)	Top-1 acc 63.672 (58.357)	Top-5 acc 84.766 (80.054)	lr 0.01496
Train [53][1380/3239]	Time 0.226 (0.735)	Data Time 0.001 (0.236)	Loss 2.9451 (2.7252)	Entropy 0.63546 (0.63598)	Top-1 acc 53.516 (58.357)	Top-5 acc 75.391 (80.055)	lr 0.01496
Train [53][1390/3239]	Time 0.322 (0.738)	Data Time 0.001 (0.240)	Loss 2.7687 (2.7255)	Entropy 0.63577 (0.63597)	Top-1 acc 59.375 (58.344)	Top-5 acc 81.250 (80.053)	lr 0.01496
Train [53][1400/3239]	Time 0.234 (0.743)	Data Time 0.001 (0.246)	Loss 2.7656 (2.7253)	Entropy 0.63600 (0.63597)	Top-1 acc 54.297 (58.350)	Top-5 acc 80.078 (80.055)	lr 0.01496
Train [53][1410/3239]	Time 0.255 (0.741)	Data Time 0.001 (0.244)	Loss 3.0042 (2.7255)	Entropy 0.63611 (0.63597)	Top-1 acc 52.734 (58.343)	Top-5 acc 73.828 (80.049)	lr 0.01496
Train [53][1420/3239]	Time 0.233 (0.744)	Data Time 0.001 (0.248)	Loss 2.7017 (2.7260)	Entropy 0.63615 (0.63597)	Top-1 acc 60.547 (58.337)	Top-5 acc 79.297 (80.037)	lr 0.01496
Train [53][1430/3239]	Time 0.243 (0.753)	Data Time 0.002 (0.257)	Loss 2.8691 (2.7261)	Entropy 0.63635 (0.63598)	Top-1 acc 55.078 (58.335)	Top-5 acc 78.125 (80.035)	lr 0.01496
Train [53][1440/3239]	Time 0.303 (0.751)	Data Time 0.001 (0.255)	Loss 2.6470 (2.7259)	Entropy 0.63618 (0.63598)	Top-1 acc 61.328 (58.338)	Top-5 acc 80.469 (80.038)	lr 0.01496
Train [53][1450/3239]	Time 0.253 (0.749)	Data Time 0.001 (0.254)	Loss 2.8647 (2.7257)	Entropy 0.63628 (0.63598)	Top-1 acc 54.688 (58.343)	Top-5 acc 77.344 (80.049)	lr 0.01496
Train [53][1460/3239]	Time 0.257 (0.759)	Data Time 0.001 (0.264)	Loss 2.5457 (2.7254)	Entropy 0.63647 (0.63598)	Top-1 acc 60.156 (58.346)	Top-5 acc 82.031 (80.055)	lr 0.01495
Train [53][1470/3239]	Time 0.264 (0.756)	Data Time 0.002 (0.262)	Loss 2.7546 (2.7254)	Entropy 0.63669 (0.63599)	Top-1 acc 52.344 (58.343)	Top-5 acc 78.906 (80.051)	lr 0.01495
Train [53][1480/3239]	Time 0.268 (0.754)	Data Time 0.001 (0.260)	Loss 2.7840 (2.7253)	Entropy 0.63682 (0.63599)	Top-1 acc 60.547 (58.353)	Top-5 acc 78.906 (80.052)	lr 0.01495
Train [53][1490/3239]	Time 0.242 (0.762)	Data Time 0.001 (0.269)	Loss 2.7971 (2.7256)	Entropy 0.63652 (0.63600)	Top-1 acc 56.641 (58.344)	Top-5 acc 78.906 (80.044)	lr 0.01495
Train [53][1500/3239]	Time 0.232 (0.760)	Data Time 0.002 (0.267)	Loss 2.6431 (2.7253)	Entropy 0.63655 (0.63600)	Top-1 acc 59.766 (58.346)	Top-5 acc 83.203 (80.048)	lr 0.01495
Train [53][1510/3239]	Time 0.238 (0.758)	Data Time 0.001 (0.265)	Loss 2.7705 (2.7250)	Entropy 0.63684 (0.63601)	Top-1 acc 58.203 (58.362)	Top-5 acc 76.562 (80.048)	lr 0.01495
Train [53][1520/3239]	Time 0.276 (0.767)	Data Time 0.001 (0.275)	Loss 2.4747 (2.7247)	Entropy 0.63670 (0.63601)	Top-1 acc 61.719 (58.371)	Top-5 acc 86.328 (80.048)	lr 0.01495
Train [53][1530/3239]	Time 0.280 (0.765)	Data Time 0.002 (0.273)	Loss 2.7657 (2.7247)	Entropy 0.63707 (0.63602)	Top-1 acc 61.328 (58.376)	Top-5 acc 79.297 (80.049)	lr 0.01495
Train [53][1540/3239]	Time 0.243 (0.763)	Data Time 0.001 (0.272)	Loss 2.7313 (2.7247)	Entropy 0.63717 (0.63602)	Top-1 acc 58.984 (58.370)	Top-5 acc 81.641 (80.050)	lr 0.01495
Train [53][1550/3239]	Time 0.380 (0.761)	Data Time 0.001 (0.270)	Loss 2.5728 (2.7246)	Entropy 0.63746 (0.63603)	Top-1 acc 64.844 (58.376)	Top-5 acc 82.031 (80.046)	lr 0.01495
Train [53][1560/3239]	Time 0.268 (0.769)	Data Time 0.001 (0.279)	Loss 2.7272 (2.7250)	Entropy 0.63748 (0.63604)	Top-1 acc 57.812 (58.366)	Top-5 acc 81.250 (80.040)	lr 0.01494
Train [53][1570/3239]	Time 0.238 (0.767)	Data Time 0.002 (0.277)	Loss 2.8205 (2.7249)	Entropy 0.63772 (0.63605)	Top-1 acc 57.031 (58.369)	Top-5 acc 78.906 (80.043)	lr 0.01494
Train [53][1580/3239]	Time 0.256 (0.766)	Data Time 0.001 (0.275)	Loss 2.6192 (2.7251)	Entropy 0.63781 (0.63606)	Top-1 acc 59.766 (58.364)	Top-5 acc 82.422 (80.039)	lr 0.01494
Train [53][1590/3239]	Time 0.238 (0.777)	Data Time 0.002 (0.287)	Loss 2.6019 (2.7251)	Entropy 0.63806 (0.63607)	Top-1 acc 59.375 (58.357)	Top-5 acc 81.641 (80.038)	lr 0.01494
Train [53][1600/3239]	Time 0.242 (0.775)	Data Time 0.001 (0.285)	Loss 2.6613 (2.7250)	Entropy 0.63778 (0.63608)	Top-1 acc 60.938 (58.360)	Top-5 acc 79.688 (80.040)	lr 0.01494
Train [53][1610/3239]	Time 0.243 (0.772)	Data Time 0.001 (0.283)	Loss 2.6608 (2.7252)	Entropy 0.63799 (0.63609)	Top-1 acc 57.031 (58.351)	Top-5 acc 83.594 (80.042)	lr 0.01494
Train [53][1620/3239]	Time 0.239 (0.779)	Data Time 0.001 (0.290)	Loss 2.6961 (2.7248)	Entropy 0.63791 (0.63611)	Top-1 acc 56.250 (58.362)	Top-5 acc 80.859 (80.050)	lr 0.01494
Train [53][1630/3239]	Time 0.235 (0.777)	Data Time 0.001 (0.288)	Loss 2.7697 (2.7249)	Entropy 0.63753 (0.63612)	Top-1 acc 54.688 (58.358)	Top-5 acc 81.641 (80.048)	lr 0.01494
Train [53][1640/3239]	Time 0.237 (0.776)	Data Time 0.001 (0.288)	Loss 2.7579 (2.7249)	Entropy 0.63726 (0.63612)	Top-1 acc 56.250 (58.355)	Top-5 acc 78.906 (80.044)	lr 0.01494
Train [53][1650/3239]	Time 0.269 (0.783)	Data Time 0.001 (0.295)	Loss 2.7089 (2.7254)	Entropy 0.63697 (0.63613)	Top-1 acc 61.328 (58.350)	Top-5 acc 81.250 (80.033)	lr 0.01494
Train [53][1660/3239]	Time 0.245 (0.781)	Data Time 0.001 (0.294)	Loss 3.0232 (2.7260)	Entropy 0.63677 (0.63613)	Top-1 acc 50.391 (58.332)	Top-5 acc 73.047 (80.021)	lr 0.01493
Train [53][1670/3239]	Time 3.144 (0.781)	Data Time 2.887 (0.294)	Loss 2.8023 (2.7264)	Entropy 0.63699 (0.63614)	Top-1 acc 58.203 (58.330)	Top-5 acc 76.562 (80.014)	lr 0.01493
Train [53][1680/3239]	Time 0.235 (0.787)	Data Time 0.001 (0.300)	Loss 2.5890 (2.7264)	Entropy 0.63732 (0.63614)	Top-1 acc 61.328 (58.331)	Top-5 acc 82.812 (80.014)	lr 0.01493
Train [53][1690/3239]	Time 0.254 (0.785)	Data Time 0.001 (0.299)	Loss 2.6487 (2.7264)	Entropy 0.63713 (0.63615)	Top-1 acc 57.812 (58.325)	Top-5 acc 81.641 (80.017)	lr 0.01493
Train [53][1700/3239]	Time 0.242 (0.783)	Data Time 0.001 (0.297)	Loss 2.4857 (2.7270)	Entropy 0.63712 (0.63616)	Top-1 acc 60.938 (58.309)	Top-5 acc 83.594 (80.007)	lr 0.01493
Train [53][1710/3239]	Time 0.348 (0.783)	Data Time 0.001 (0.297)	Loss 2.7037 (2.7273)	Entropy 0.63725 (0.63616)	Top-1 acc 58.203 (58.299)	Top-5 acc 81.250 (80.003)	lr 0.01493
Train [53][1720/3239]	Time 0.254 (0.789)	Data Time 0.002 (0.303)	Loss 2.6897 (2.7271)	Entropy 0.63738 (0.63617)	Top-1 acc 58.594 (58.296)	Top-5 acc 80.078 (80.005)	lr 0.01493
Train [53][1730/3239]	Time 0.239 (0.787)	Data Time 0.001 (0.302)	Loss 2.9514 (2.7275)	Entropy 0.63735 (0.63618)	Top-1 acc 51.562 (58.290)	Top-5 acc 77.734 (80.001)	lr 0.01493
Train [53][1740/3239]	Time 0.240 (0.786)	Data Time 0.001 (0.301)	Loss 2.7400 (2.7276)	Entropy 0.63728 (0.63618)	Top-1 acc 61.719 (58.290)	Top-5 acc 79.297 (79.996)	lr 0.01493
Train [53][1750/3239]	Time 0.253 (0.795)	Data Time 0.001 (0.310)	Loss 2.7006 (2.7274)	Entropy 0.63756 (0.63619)	Top-1 acc 62.891 (58.295)	Top-5 acc 80.859 (79.999)	lr 0.01493
Train [53][1760/3239]	Time 0.252 (0.793)	Data Time 0.001 (0.309)	Loss 2.6444 (2.7278)	Entropy 0.63760 (0.63620)	Top-1 acc 61.328 (58.289)	Top-5 acc 81.641 (79.994)	lr 0.01492
Train [53][1770/3239]	Time 0.238 (0.791)	Data Time 0.001 (0.307)	Loss 2.7527 (2.7281)	Entropy 0.63759 (0.63620)	Top-1 acc 59.766 (58.284)	Top-5 acc 78.906 (79.987)	lr 0.01492
Train [53][1780/3239]	Time 0.397 (0.799)	Data Time 0.001 (0.316)	Loss 2.5819 (2.7283)	Entropy 0.63733 (0.63621)	Top-1 acc 61.719 (58.282)	Top-5 acc 82.031 (79.984)	lr 0.01492
Train [53][1790/3239]	Time 0.421 (0.817)	Data Time 0.004 (0.314)	Loss 3.0027 (2.7285)	Entropy 0.63716 (0.63622)	Top-1 acc 51.562 (58.276)	Top-5 acc 74.609 (79.979)	lr 0.01492
Train [53][1800/3239]	Time 0.265 (0.815)	Data Time 0.002 (0.312)	Loss 2.4820 (2.7282)	Entropy 0.63735 (0.63622)	Top-1 acc 66.406 (58.288)	Top-5 acc 85.156 (79.984)	lr 0.01492
Train [53][1810/3239]	Time 0.242 (0.813)	Data Time 0.001 (0.311)	Loss 2.6815 (2.7280)	Entropy 0.63728 (0.63623)	Top-1 acc 58.594 (58.293)	Top-5 acc 76.953 (79.984)	lr 0.01492
Train [53][1820/3239]	Time 0.241 (0.810)	Data Time 0.001 (0.309)	Loss 2.7092 (2.7276)	Entropy 0.63717 (0.63623)	Top-1 acc 60.547 (58.300)	Top-5 acc 80.469 (79.991)	lr 0.01492
Train [53][1830/3239]	Time 0.237 (0.808)	Data Time 0.001 (0.307)	Loss 2.8361 (2.7278)	Entropy 0.63708 (0.63624)	Top-1 acc 50.781 (58.297)	Top-5 acc 76.562 (79.987)	lr 0.01492
Train [53][1840/3239]	Time 0.244 (0.806)	Data Time 0.001 (0.306)	Loss 2.8721 (2.7283)	Entropy 0.63682 (0.63624)	Top-1 acc 53.516 (58.284)	Top-5 acc 78.125 (79.979)	lr 0.01492
Train [53][1850/3239]	Time 0.236 (0.804)	Data Time 0.001 (0.304)	Loss 2.8387 (2.7282)	Entropy 0.63674 (0.63625)	Top-1 acc 53.906 (58.280)	Top-5 acc 78.906 (79.978)	lr 0.01492
Train [53][1860/3239]	Time 1.068 (0.806)	Data Time 0.822 (0.307)	Loss 2.7277 (2.7284)	Entropy 0.63691 (0.63625)	Top-1 acc 59.375 (58.272)	Top-5 acc 79.688 (79.976)	lr 0.01491
Train [53][1870/3239]	Time 0.364 (0.805)	Data Time 0.001 (0.306)	Loss 2.6245 (2.7284)	Entropy 0.63718 (0.63625)	Top-1 acc 58.594 (58.270)	Top-5 acc 82.422 (79.979)	lr 0.01491
Train [53][1880/3239]	Time 0.667 (0.808)	Data Time 0.420 (0.309)	Loss 2.6168 (2.7282)	Entropy 0.63697 (0.63626)	Top-1 acc 62.891 (58.274)	Top-5 acc 81.641 (79.980)	lr 0.01491
Train [53][1890/3239]	Time 0.508 (0.810)	Data Time 0.275 (0.312)	Loss 2.7184 (2.7281)	Entropy 0.63723 (0.63626)	Top-1 acc 60.938 (58.283)	Top-5 acc 79.688 (79.985)	lr 0.01491
Train [53][1900/3239]	Time 0.243 (0.810)	Data Time 0.001 (0.312)	Loss 2.8109 (2.7280)	Entropy 0.63715 (0.63627)	Top-1 acc 56.250 (58.288)	Top-5 acc 78.125 (79.983)	lr 0.01491
Train [53][1910/3239]	Time 0.223 (0.812)	Data Time 0.001 (0.314)	Loss 2.6599 (2.7280)	Entropy 0.63676 (0.63627)	Top-1 acc 60.547 (58.288)	Top-5 acc 80.859 (79.985)	lr 0.01491
Train [53][1920/3239]	Time 0.237 (0.815)	Data Time 0.001 (0.318)	Loss 2.7415 (2.7280)	Entropy 0.63677 (0.63627)	Top-1 acc 58.984 (58.285)	Top-5 acc 80.859 (79.989)	lr 0.01491
Train [53][1930/3239]	Time 0.235 (0.815)	Data Time 0.001 (0.318)	Loss 2.7620 (2.7282)	Entropy 0.63624 (0.63627)	Top-1 acc 59.766 (58.280)	Top-5 acc 80.859 (79.985)	lr 0.01491
Train [53][1940/3239]	Time 0.324 (0.817)	Data Time 0.001 (0.321)	Loss 2.6839 (2.7283)	Entropy 0.63641 (0.63627)	Top-1 acc 58.984 (58.274)	Top-5 acc 80.859 (79.983)	lr 0.01491
Train [53][1950/3239]	Time 9.027 (0.821)	Data Time 8.777 (0.325)	Loss 2.6693 (2.7287)	Entropy 0.63642 (0.63627)	Top-1 acc 60.156 (58.268)	Top-5 acc 82.812 (79.975)	lr 0.01491
Train [53][1960/3239]	Time 0.252 (0.821)	Data Time 0.001 (0.326)	Loss 2.7977 (2.7286)	Entropy 0.63622 (0.63627)	Top-1 acc 54.297 (58.270)	Top-5 acc 80.078 (79.977)	lr 0.01490
Train [53][1970/3239]	Time 0.284 (0.823)	Data Time 0.001 (0.328)	Loss 2.6570 (2.7285)	Entropy 0.63588 (0.63627)	Top-1 acc 58.203 (58.274)	Top-5 acc 80.859 (79.976)	lr 0.01490
Train [53][1980/3239]	Time 0.246 (0.822)	Data Time 0.001 (0.327)	Loss 2.7053 (2.7285)	Entropy 0.63582 (0.63627)	Top-1 acc 58.594 (58.274)	Top-5 acc 80.078 (79.977)	lr 0.01490
Train [53][1990/3239]	Time 0.257 (0.827)	Data Time 0.001 (0.332)	Loss 2.7135 (2.7284)	Entropy 0.63586 (0.63627)	Top-1 acc 58.203 (58.274)	Top-5 acc 77.734 (79.977)	lr 0.01490
Train [53][2000/3239]	Time 0.770 (0.828)	Data Time 0.532 (0.334)	Loss 2.7617 (2.7282)	Entropy 0.63582 (0.63627)	Top-1 acc 55.078 (58.278)	Top-5 acc 79.297 (79.978)	lr 0.01490
Train [53][2010/3239]	Time 0.236 (0.829)	Data Time 0.001 (0.335)	Loss 2.8450 (2.7281)	Entropy 0.63583 (0.63626)	Top-1 acc 51.953 (58.271)	Top-5 acc 79.297 (79.975)	lr 0.01490
Train [53][2020/3239]	Time 7.513 (0.832)	Data Time 7.259 (0.338)	Loss 2.5652 (2.7280)	Entropy 0.63574 (0.63626)	Top-1 acc 61.328 (58.274)	Top-5 acc 84.766 (79.980)	lr 0.01490
Train [53][2030/3239]	Time 4.139 (0.832)	Data Time 3.794 (0.339)	Loss 2.6634 (2.7277)	Entropy 0.63552 (0.63626)	Top-1 acc 61.719 (58.279)	Top-5 acc 80.078 (79.988)	lr 0.01490
Train [53][2040/3239]	Time 6.362 (0.836)	Data Time 6.104 (0.343)	Loss 2.5251 (2.7276)	Entropy 0.63551 (0.63626)	Top-1 acc 62.109 (58.281)	Top-5 acc 83.203 (79.987)	lr 0.01490
Train [53][2050/3239]	Time 0.275 (0.834)	Data Time 0.001 (0.341)	Loss 2.6966 (2.7278)	Entropy 0.63553 (0.63625)	Top-1 acc 60.938 (58.278)	Top-5 acc 80.859 (79.987)	lr 0.01490
Train [53][2060/3239]	Time 0.230 (0.836)	Data Time 0.001 (0.344)	Loss 2.5780 (2.7275)	Entropy 0.63537 (0.63625)	Top-1 acc 64.453 (58.289)	Top-5 acc 82.031 (79.992)	lr 0.01490
Train [53][2070/3239]	Time 0.235 (0.839)	Data Time 0.001 (0.347)	Loss 2.7867 (2.7271)	Entropy 0.63531 (0.63624)	Top-1 acc 58.203 (58.299)	Top-5 acc 78.906 (80.000)	lr 0.01489
Train [53][2080/3239]	Time 0.227 (0.840)	Data Time 0.001 (0.348)	Loss 2.6694 (2.7271)	Entropy 0.63533 (0.63624)	Top-1 acc 60.156 (58.300)	Top-5 acc 79.688 (79.997)	lr 0.01489
Train [53][2090/3239]	Time 0.283 (0.841)	Data Time 0.001 (0.350)	Loss 2.5763 (2.7269)	Entropy 0.63550 (0.63624)	Top-1 acc 59.766 (58.305)	Top-5 acc 81.641 (80.003)	lr 0.01489
Train [53][2100/3239]	Time 0.339 (0.844)	Data Time 0.001 (0.353)	Loss 2.7783 (2.7268)	Entropy 0.63544 (0.63623)	Top-1 acc 58.984 (58.305)	Top-5 acc 77.734 (80.004)	lr 0.01489
Train [53][2110/3239]	Time 0.920 (0.845)	Data Time 0.639 (0.354)	Loss 2.6828 (2.7267)	Entropy 0.63541 (0.63623)	Top-1 acc 56.250 (58.298)	Top-5 acc 79.297 (80.005)	lr 0.01489
Train [53][2120/3239]	Time 0.292 (0.847)	Data Time 0.001 (0.356)	Loss 2.7808 (2.7264)	Entropy 0.63533 (0.63622)	Top-1 acc 55.859 (58.301)	Top-5 acc 78.516 (80.013)	lr 0.01489
Train [53][2130/3239]	Time 0.245 (0.848)	Data Time 0.001 (0.357)	Loss 2.5784 (2.7265)	Entropy 0.63538 (0.63622)	Top-1 acc 61.719 (58.293)	Top-5 acc 83.594 (80.013)	lr 0.01489
Train [53][2140/3239]	Time 0.242 (0.846)	Data Time 0.001 (0.356)	Loss 2.9680 (2.7267)	Entropy 0.63549 (0.63622)	Top-1 acc 51.562 (58.286)	Top-5 acc 77.344 (80.007)	lr 0.01489
Train [53][2150/3239]	Time 0.233 (0.848)	Data Time 0.001 (0.358)	Loss 2.5695 (2.7264)	Entropy 0.63518 (0.63621)	Top-1 acc 66.016 (58.301)	Top-5 acc 82.031 (80.009)	lr 0.01489
Train [53][2160/3239]	Time 0.232 (0.847)	Data Time 0.001 (0.358)	Loss 2.6017 (2.7260)	Entropy 0.63523 (0.63621)	Top-1 acc 59.766 (58.310)	Top-5 acc 82.812 (80.018)	lr 0.01489
Train [53][2170/3239]	Time 0.244 (0.845)	Data Time 0.001 (0.356)	Loss 2.7624 (2.7263)	Entropy 0.63587 (0.63620)	Top-1 acc 57.031 (58.301)	Top-5 acc 78.516 (80.012)	lr 0.01488
Train [53][2180/3239]	Time 4.402 (0.846)	Data Time 4.157 (0.357)	Loss 2.6777 (2.7263)	Entropy 0.63539 (0.63620)	Top-1 acc 58.594 (58.307)	Top-5 acc 80.859 (80.010)	lr 0.01488
Train [53][2190/3239]	Time 3.204 (0.845)	Data Time 2.915 (0.357)	Loss 2.7338 (2.7264)	Entropy 0.63551 (0.63620)	Top-1 acc 52.344 (58.305)	Top-5 acc 80.078 (80.006)	lr 0.01488
Train [53][2200/3239]	Time 1.345 (0.845)	Data Time 1.094 (0.357)	Loss 2.6532 (2.7266)	Entropy 0.63551 (0.63619)	Top-1 acc 57.422 (58.300)	Top-5 acc 82.812 (80.004)	lr 0.01488
Train [53][2210/3239]	Time 0.241 (0.846)	Data Time 0.001 (0.358)	Loss 2.7721 (2.7268)	Entropy 0.63532 (0.63619)	Top-1 acc 57.031 (58.294)	Top-5 acc 81.250 (80.005)	lr 0.01488
Train [53][2220/3239]	Time 0.242 (0.849)	Data Time 0.001 (0.361)	Loss 2.6041 (2.7264)	Entropy 0.63515 (0.63619)	Top-1 acc 62.109 (58.304)	Top-5 acc 82.031 (80.015)	lr 0.01488
Train [53][2230/3239]	Time 0.234 (0.849)	Data Time 0.001 (0.362)	Loss 2.6510 (2.7265)	Entropy 0.63532 (0.63618)	Top-1 acc 61.719 (58.299)	Top-5 acc 79.688 (80.015)	lr 0.01488
Train [53][2240/3239]	Time 0.237 (0.851)	Data Time 0.001 (0.364)	Loss 2.7206 (2.7265)	Entropy 0.63542 (0.63618)	Top-1 acc 57.812 (58.298)	Top-5 acc 79.297 (80.013)	lr 0.01488
Train [53][2250/3239]	Time 0.281 (0.854)	Data Time 0.001 (0.367)	Loss 2.7604 (2.7265)	Entropy 0.63546 (0.63618)	Top-1 acc 57.031 (58.295)	Top-5 acc 79.688 (80.016)	lr 0.01488
Train [53][2260/3239]	Time 0.325 (0.854)	Data Time 0.001 (0.368)	Loss 2.7617 (2.7265)	Entropy 0.63543 (0.63617)	Top-1 acc 56.641 (58.302)	Top-5 acc 81.250 (80.017)	lr 0.01488
Train [53][2270/3239]	Time 1.509 (0.855)	Data Time 1.245 (0.369)	Loss 2.7839 (2.7266)	Entropy 0.63538 (0.63617)	Top-1 acc 57.422 (58.297)	Top-5 acc 78.906 (80.014)	lr 0.01487
Train [53][2280/3239]	Time 0.242 (0.860)	Data Time 0.001 (0.374)	Loss 2.7132 (2.7268)	Entropy 0.63548 (0.63617)	Top-1 acc 61.719 (58.292)	Top-5 acc 82.422 (80.009)	lr 0.01487
Train [53][2290/3239]	Time 0.236 (0.859)	Data Time 0.001 (0.374)	Loss 2.7725 (2.7269)	Entropy 0.63541 (0.63616)	Top-1 acc 54.297 (58.286)	Top-5 acc 78.516 (80.008)	lr 0.01487
Train [53][2300/3239]	Time 0.240 (0.857)	Data Time 0.001 (0.372)	Loss 2.7494 (2.7268)	Entropy 0.63520 (0.63616)	Top-1 acc 58.594 (58.284)	Top-5 acc 76.562 (80.010)	lr 0.01487
Train [53][2310/3239]	Time 0.229 (0.859)	Data Time 0.001 (0.375)	Loss 2.7887 (2.7269)	Entropy 0.63505 (0.63616)	Top-1 acc 53.906 (58.281)	Top-5 acc 78.516 (80.006)	lr 0.01487
Train [53][2320/3239]	Time 0.243 (0.858)	Data Time 0.001 (0.374)	Loss 2.8464 (2.7271)	Entropy 0.63509 (0.63615)	Top-1 acc 57.031 (58.276)	Top-5 acc 76.562 (80.002)	lr 0.01487
Train [53][2330/3239]	Time 0.366 (0.856)	Data Time 0.002 (0.372)	Loss 2.6964 (2.7273)	Entropy 0.63503 (0.63615)	Top-1 acc 61.328 (58.276)	Top-5 acc 79.297 (79.997)	lr 0.01487
Train [53][2340/3239]	Time 9.957 (0.859)	Data Time 9.675 (0.375)	Loss 2.8680 (2.7275)	Entropy 0.63492 (0.63614)	Top-1 acc 55.469 (58.272)	Top-5 acc 76.953 (79.993)	lr 0.01487
Train [53][2350/3239]	Time 0.241 (0.857)	Data Time 0.001 (0.373)	Loss 2.8791 (2.7273)	Entropy 0.63517 (0.63614)	Top-1 acc 57.031 (58.279)	Top-5 acc 77.734 (79.991)	lr 0.01487
Train [53][2360/3239]	Time 0.232 (0.856)	Data Time 0.001 (0.372)	Loss 2.5704 (2.7274)	Entropy 0.63539 (0.63613)	Top-1 acc 61.719 (58.278)	Top-5 acc 82.422 (79.992)	lr 0.01487
Train [53][2370/3239]	Time 0.224 (0.855)	Data Time 0.001 (0.371)	Loss 2.6935 (2.7271)	Entropy 0.63544 (0.63613)	Top-1 acc 63.672 (58.285)	Top-5 acc 78.516 (79.996)	lr 0.01486
Train [53][2380/3239]	Time 0.245 (0.856)	Data Time 0.001 (0.373)	Loss 2.5803 (2.7271)	Entropy 0.63554 (0.63613)	Top-1 acc 62.109 (58.284)	Top-5 acc 83.594 (80.001)	lr 0.01486
Train [53][2390/3239]	Time 0.266 (0.855)	Data Time 0.001 (0.373)	Loss 2.5596 (2.7271)	Entropy 0.63584 (0.63612)	Top-1 acc 61.328 (58.283)	Top-5 acc 84.375 (80.001)	lr 0.01486
Train [53][2400/3239]	Time 0.366 (0.854)	Data Time 0.001 (0.371)	Loss 2.7028 (2.7269)	Entropy 0.63595 (0.63612)	Top-1 acc 59.375 (58.287)	Top-5 acc 79.688 (80.005)	lr 0.01486
Train [53][2410/3239]	Time 0.229 (0.856)	Data Time 0.001 (0.373)	Loss 2.6920 (2.7269)	Entropy 0.63561 (0.63612)	Top-1 acc 56.250 (58.287)	Top-5 acc 80.859 (80.004)	lr 0.01486
Train [53][2420/3239]	Time 0.349 (0.858)	Data Time 0.001 (0.376)	Loss 2.6016 (2.7269)	Entropy 0.63567 (0.63612)	Top-1 acc 62.891 (58.284)	Top-5 acc 82.031 (80.006)	lr 0.01486
Train [53][2430/3239]	Time 1.908 (0.857)	Data Time 1.656 (0.375)	Loss 2.6874 (2.7270)	Entropy 0.63585 (0.63612)	Top-1 acc 58.984 (58.279)	Top-5 acc 81.250 (80.004)	lr 0.01486
Train [53][2440/3239]	Time 0.243 (0.862)	Data Time 0.001 (0.380)	Loss 2.9504 (2.7272)	Entropy 0.63567 (0.63612)	Top-1 acc 50.000 (58.271)	Top-5 acc 76.172 (80.001)	lr 0.01486
Train [53][2450/3239]	Time 0.287 (0.876)	Data Time 0.002 (0.379)	Loss 2.8272 (2.7274)	Entropy 0.63550 (0.63611)	Top-1 acc 56.250 (58.265)	Top-5 acc 78.516 (79.994)	lr 0.01486
Train [53][2460/3239]	Time 0.263 (0.874)	Data Time 0.002 (0.377)	Loss 2.7484 (2.7275)	Entropy 0.63562 (0.63611)	Top-1 acc 55.078 (58.259)	Top-5 acc 79.688 (79.990)	lr 0.01486
Train [53][2470/3239]	Time 0.250 (0.872)	Data Time 0.002 (0.376)	Loss 2.6918 (2.7276)	Entropy 0.63583 (0.63611)	Top-1 acc 58.984 (58.258)	Top-5 acc 79.297 (79.989)	lr 0.01485
Train [53][2480/3239]	Time 0.240 (0.871)	Data Time 0.001 (0.374)	Loss 2.6346 (2.7275)	Entropy 0.63594 (0.63611)	Top-1 acc 55.469 (58.262)	Top-5 acc 83.984 (79.989)	lr 0.01485
Train [53][2490/3239]	Time 0.365 (0.869)	Data Time 0.001 (0.373)	Loss 2.4962 (2.7273)	Entropy 0.63561 (0.63611)	Top-1 acc 63.672 (58.265)	Top-5 acc 82.812 (79.992)	lr 0.01485
Train [53][2500/3239]	Time 13.650 (0.875)	Data Time 13.404 (0.379)	Loss 2.8718 (2.7272)	Entropy 0.63586 (0.63611)	Top-1 acc 51.953 (58.268)	Top-5 acc 77.734 (79.994)	lr 0.01485
Train [53][2510/3239]	Time 3.979 (0.875)	Data Time 3.725 (0.379)	Loss 2.7129 (2.7272)	Entropy 0.63574 (0.63611)	Top-1 acc 59.766 (58.267)	Top-5 acc 83.594 (79.993)	lr 0.01485
Train [53][2520/3239]	Time 0.243 (0.874)	Data Time 0.001 (0.379)	Loss 2.7271 (2.7271)	Entropy 0.63581 (0.63611)	Top-1 acc 58.203 (58.269)	Top-5 acc 79.297 (79.998)	lr 0.01485
Train [53][2530/3239]	Time 0.245 (0.877)	Data Time 0.001 (0.382)	Loss 2.7337 (2.7272)	Entropy 0.63600 (0.63610)	Top-1 acc 59.766 (58.267)	Top-5 acc 79.688 (79.993)	lr 0.01485
Train [53][2540/3239]	Time 0.255 (0.879)	Data Time 0.001 (0.384)	Loss 2.5492 (2.7271)	Entropy 0.63618 (0.63610)	Top-1 acc 60.156 (58.266)	Top-5 acc 82.812 (79.993)	lr 0.01485
Train [53][2550/3239]	Time 0.271 (0.882)	Data Time 0.001 (0.388)	Loss 2.6160 (2.7270)	Entropy 0.63584 (0.63610)	Top-1 acc 60.156 (58.269)	Top-5 acc 83.203 (79.993)	lr 0.01485
Train [53][2560/3239]	Time 0.265 (0.883)	Data Time 0.002 (0.389)	Loss 2.6961 (2.7269)	Entropy 0.63588 (0.63610)	Top-1 acc 59.375 (58.269)	Top-5 acc 81.641 (79.995)	lr 0.01485
Train [53][2570/3239]	Time 0.241 (0.884)	Data Time 0.002 (0.390)	Loss 2.8396 (2.7270)	Entropy 0.63606 (0.63610)	Top-1 acc 56.641 (58.268)	Top-5 acc 76.172 (79.995)	lr 0.01484
Train [53][2580/3239]	Time 0.382 (0.887)	Data Time 0.001 (0.393)	Loss 2.9311 (2.7269)	Entropy 0.63584 (0.63610)	Top-1 acc 51.172 (58.266)	Top-5 acc 78.906 (79.997)	lr 0.01484
Train [53][2590/3239]	Time 0.258 (0.885)	Data Time 0.001 (0.391)	Loss 2.6678 (2.7272)	Entropy 0.63581 (0.63610)	Top-1 acc 64.062 (58.258)	Top-5 acc 80.859 (79.993)	lr 0.01484
Train [53][2600/3239]	Time 0.266 (0.889)	Data Time 0.002 (0.395)	Loss 2.9397 (2.7273)	Entropy 0.63592 (0.63610)	Top-1 acc 51.172 (58.257)	Top-5 acc 74.609 (79.988)	lr 0.01484
Train [53][2610/3239]	Time 0.262 (0.891)	Data Time 0.001 (0.397)	Loss 2.7262 (2.7271)	Entropy 0.63629 (0.63610)	Top-1 acc 59.375 (58.256)	Top-5 acc 80.859 (79.994)	lr 0.01484
Train [53][2620/3239]	Time 0.258 (0.890)	Data Time 0.001 (0.396)	Loss 2.5762 (2.7273)	Entropy 0.63636 (0.63610)	Top-1 acc 61.328 (58.251)	Top-5 acc 84.375 (79.988)	lr 0.01484
Train [53][2630/3239]	Time 0.290 (0.894)	Data Time 0.001 (0.401)	Loss 2.8959 (2.7272)	Entropy 0.63634 (0.63610)	Top-1 acc 51.562 (58.254)	Top-5 acc 77.344 (79.992)	lr 0.01484
Train [53][2640/3239]	Time 0.238 (0.896)	Data Time 0.001 (0.402)	Loss 2.7504 (2.7273)	Entropy 0.63640 (0.63610)	Top-1 acc 57.422 (58.256)	Top-5 acc 78.906 (79.991)	lr 0.01484
Train [53][2650/3239]	Time 0.382 (0.894)	Data Time 0.001 (0.401)	Loss 2.7080 (2.7274)	Entropy 0.63629 (0.63610)	Top-1 acc 62.109 (58.252)	Top-5 acc 78.906 (79.988)	lr 0.01484
Train [53][2660/3239]	Time 10.206 (0.899)	Data Time 9.924 (0.406)	Loss 2.7691 (2.7274)	Entropy 0.63657 (0.63610)	Top-1 acc 55.469 (58.252)	Top-5 acc 76.562 (79.983)	lr 0.01484
Train [53][2670/3239]	Time 0.251 (0.897)	Data Time 0.001 (0.405)	Loss 2.5776 (2.7274)	Entropy 0.63616 (0.63611)	Top-1 acc 63.672 (58.252)	Top-5 acc 83.203 (79.982)	lr 0.01483
Train [53][2680/3239]	Time 0.245 (0.898)	Data Time 0.002 (0.406)	Loss 2.7241 (2.7273)	Entropy 0.63618 (0.63611)	Top-1 acc 58.203 (58.250)	Top-5 acc 81.250 (79.987)	lr 0.01483
Train [53][2690/3239]	Time 0.237 (0.899)	Data Time 0.001 (0.407)	Loss 2.8750 (2.7274)	Entropy 0.63632 (0.63611)	Top-1 acc 55.469 (58.245)	Top-5 acc 77.734 (79.987)	lr 0.01483
Train [53][2700/3239]	Time 0.238 (0.902)	Data Time 0.001 (0.410)	Loss 2.6082 (2.7275)	Entropy 0.63632 (0.63611)	Top-1 acc 61.328 (58.247)	Top-5 acc 82.031 (79.988)	lr 0.01483
Train [53][2710/3239]	Time 0.252 (0.902)	Data Time 0.001 (0.410)	Loss 2.7354 (2.7275)	Entropy 0.63616 (0.63611)	Top-1 acc 55.078 (58.242)	Top-5 acc 81.250 (79.986)	lr 0.01483
Train [53][2720/3239]	Time 0.262 (0.902)	Data Time 0.001 (0.411)	Loss 2.6534 (2.7274)	Entropy 0.63633 (0.63611)	Top-1 acc 60.547 (58.247)	Top-5 acc 80.859 (79.987)	lr 0.01483
Train [53][2730/3239]	Time 0.238 (0.906)	Data Time 0.001 (0.415)	Loss 2.6746 (2.7275)	Entropy 0.63640 (0.63611)	Top-1 acc 61.328 (58.244)	Top-5 acc 80.469 (79.986)	lr 0.01483
Train [53][2740/3239]	Time 0.387 (0.906)	Data Time 0.002 (0.415)	Loss 2.7090 (2.7276)	Entropy 0.63648 (0.63611)	Top-1 acc 57.812 (58.242)	Top-5 acc 79.297 (79.983)	lr 0.01483
Train [53][2750/3239]	Time 0.240 (0.905)	Data Time 0.001 (0.414)	Loss 2.6809 (2.7275)	Entropy 0.63661 (0.63611)	Top-1 acc 58.594 (58.243)	Top-5 acc 79.688 (79.984)	lr 0.01483
Train [53][2760/3239]	Time 0.234 (0.910)	Data Time 0.001 (0.419)	Loss 2.8164 (2.7275)	Entropy 0.63659 (0.63611)	Top-1 acc 56.641 (58.243)	Top-5 acc 76.953 (79.987)	lr 0.01483
Train [53][2770/3239]	Time 0.253 (0.911)	Data Time 0.001 (0.421)	Loss 2.8287 (2.7275)	Entropy 0.63661 (0.63612)	Top-1 acc 54.297 (58.238)	Top-5 acc 77.734 (79.987)	lr 0.01482
Train [53][2780/3239]	Time 0.268 (0.910)	Data Time 0.001 (0.419)	Loss 2.7537 (2.7277)	Entropy 0.63648 (0.63612)	Top-1 acc 57.031 (58.231)	Top-5 acc 76.562 (79.980)	lr 0.01482
Train [53][2790/3239]	Time 0.250 (0.914)	Data Time 0.002 (0.424)	Loss 3.0164 (2.7280)	Entropy 0.63666 (0.63612)	Top-1 acc 50.000 (58.229)	Top-5 acc 75.391 (79.974)	lr 0.01482
Train [53][2800/3239]	Time 0.242 (0.915)	Data Time 0.002 (0.425)	Loss 2.7414 (2.7279)	Entropy 0.63642 (0.63612)	Top-1 acc 60.547 (58.231)	Top-5 acc 80.469 (79.975)	lr 0.01482
Train [53][2810/3239]	Time 0.382 (0.914)	Data Time 0.001 (0.424)	Loss 2.8571 (2.7280)	Entropy 0.63661 (0.63612)	Top-1 acc 58.984 (58.229)	Top-5 acc 78.516 (79.975)	lr 0.01482
Train [53][2820/3239]	Time 8.606 (0.917)	Data Time 8.317 (0.427)	Loss 2.7978 (2.7282)	Entropy 0.63652 (0.63612)	Top-1 acc 58.984 (58.228)	Top-5 acc 78.125 (79.970)	lr 0.01482
Train [53][2830/3239]	Time 0.254 (0.916)	Data Time 0.001 (0.427)	Loss 2.5329 (2.7281)	Entropy 0.63640 (0.63612)	Top-1 acc 65.234 (58.229)	Top-5 acc 84.766 (79.973)	lr 0.01482
Train [53][2840/3239]	Time 0.245 (0.917)	Data Time 0.001 (0.428)	Loss 2.6945 (2.7280)	Entropy 0.63579 (0.63612)	Top-1 acc 57.812 (58.233)	Top-5 acc 80.469 (79.977)	lr 0.01482
Train [53][2850/3239]	Time 0.245 (0.915)	Data Time 0.001 (0.426)	Loss 2.5996 (2.7279)	Entropy 0.63548 (0.63612)	Top-1 acc 59.375 (58.231)	Top-5 acc 83.594 (79.978)	lr 0.01482
Train [53][2860/3239]	Time 0.275 (0.919)	Data Time 0.001 (0.430)	Loss 2.7802 (2.7281)	Entropy 0.63556 (0.63612)	Top-1 acc 59.766 (58.225)	Top-5 acc 77.734 (79.973)	lr 0.01482
Train [53][2870/3239]	Time 0.243 (0.920)	Data Time 0.001 (0.432)	Loss 2.6764 (2.7281)	Entropy 0.63559 (0.63612)	Top-1 acc 58.203 (58.223)	Top-5 acc 82.031 (79.971)	lr 0.01481
Train [53][2880/3239]	Time 0.254 (0.919)	Data Time 0.001 (0.430)	Loss 2.7031 (2.7278)	Entropy 0.63566 (0.63612)	Top-1 acc 59.766 (58.233)	Top-5 acc 77.734 (79.978)	lr 0.01481
Train [53][2890/3239]	Time 0.231 (0.924)	Data Time 0.001 (0.435)	Loss 2.7424 (2.7278)	Entropy 0.63525 (0.63612)	Top-1 acc 57.422 (58.231)	Top-5 acc 80.859 (79.979)	lr 0.01481
Train [53][2900/3239]	Time 0.248 (0.924)	Data Time 0.001 (0.436)	Loss 3.0321 (2.7280)	Entropy 0.63489 (0.63611)	Top-1 acc 49.609 (58.227)	Top-5 acc 74.609 (79.974)	lr 0.01481
Train [53][2910/3239]	Time 0.250 (0.922)	Data Time 0.001 (0.434)	Loss 2.6366 (2.7279)	Entropy 0.63493 (0.63611)	Top-1 acc 59.375 (58.228)	Top-5 acc 82.812 (79.974)	lr 0.01481
Train [53][2920/3239]	Time 0.253 (0.928)	Data Time 0.001 (0.440)	Loss 2.6211 (2.7281)	Entropy 0.63500 (0.63610)	Top-1 acc 62.891 (58.225)	Top-5 acc 80.859 (79.968)	lr 0.01481
Train [53][2930/3239]	Time 0.237 (0.928)	Data Time 0.001 (0.440)	Loss 2.6528 (2.7281)	Entropy 0.63480 (0.63610)	Top-1 acc 60.547 (58.223)	Top-5 acc 81.250 (79.969)	lr 0.01481
Train [53][2940/3239]	Time 0.243 (0.926)	Data Time 0.001 (0.439)	Loss 2.7565 (2.7281)	Entropy 0.63463 (0.63610)	Top-1 acc 56.250 (58.220)	Top-5 acc 81.641 (79.970)	lr 0.01481
Train [53][2950/3239]	Time 0.277 (0.931)	Data Time 0.002 (0.444)	Loss 2.6406 (2.7282)	Entropy 0.63423 (0.63609)	Top-1 acc 58.594 (58.218)	Top-5 acc 83.203 (79.968)	lr 0.01481
Train [53][2960/3239]	Time 0.245 (0.933)	Data Time 0.001 (0.446)	Loss 2.7714 (2.7283)	Entropy 0.63430 (0.63608)	Top-1 acc 56.250 (58.215)	Top-5 acc 78.125 (79.967)	lr 0.01481
Train [53][2970/3239]	Time 0.340 (0.931)	Data Time 0.001 (0.444)	Loss 2.7271 (2.7281)	Entropy 0.63440 (0.63608)	Top-1 acc 58.594 (58.222)	Top-5 acc 76.953 (79.971)	lr 0.01480
Train [53][2980/3239]	Time 4.371 (0.934)	Data Time 4.120 (0.447)	Loss 2.8879 (2.7281)	Entropy 0.63452 (0.63607)	Top-1 acc 55.469 (58.223)	Top-5 acc 78.125 (79.972)	lr 0.01480
Train [53][2990/3239]	Time 0.236 (0.935)	Data Time 0.001 (0.449)	Loss 2.8476 (2.7281)	Entropy 0.63461 (0.63607)	Top-1 acc 55.078 (58.225)	Top-5 acc 79.297 (79.974)	lr 0.01480
Train [53][3000/3239]	Time 0.251 (0.935)	Data Time 0.002 (0.449)	Loss 2.8696 (2.7282)	Entropy 0.63457 (0.63606)	Top-1 acc 51.562 (58.226)	Top-5 acc 78.516 (79.973)	lr 0.01480
Train [53][3010/3239]	Time 0.237 (0.933)	Data Time 0.001 (0.447)	Loss 2.8159 (2.7281)	Entropy 0.63481 (0.63606)	Top-1 acc 58.984 (58.231)	Top-5 acc 78.125 (79.974)	lr 0.01480
Train [53][3020/3239]	Time 0.239 (0.938)	Data Time 0.001 (0.452)	Loss 3.0442 (2.7282)	Entropy 0.63439 (0.63605)	Top-1 acc 51.953 (58.229)	Top-5 acc 75.000 (79.969)	lr 0.01480
Train [53][3030/3239]	Time 0.232 (0.937)	Data Time 0.001 (0.452)	Loss 2.5156 (2.7284)	Entropy 0.63455 (0.63605)	Top-1 acc 65.234 (58.225)	Top-5 acc 83.984 (79.969)	lr 0.01480
Train [53][3040/3239]	Time 0.350 (0.935)	Data Time 0.001 (0.450)	Loss 2.5724 (2.7284)	Entropy 0.63454 (0.63604)	Top-1 acc 63.281 (58.224)	Top-5 acc 83.984 (79.970)	lr 0.01480
Train [53][3050/3239]	Time 0.259 (0.943)	Data Time 0.001 (0.458)	Loss 2.5249 (2.7282)	Entropy 0.63431 (0.63604)	Top-1 acc 62.500 (58.228)	Top-5 acc 83.203 (79.972)	lr 0.01480
Train [53][3060/3239]	Time 0.288 (0.941)	Data Time 0.003 (0.456)	Loss 2.6868 (2.7282)	Entropy 0.63431 (0.63603)	Top-1 acc 58.984 (58.230)	Top-5 acc 81.641 (79.973)	lr 0.01480
Train [53][3070/3239]	Time 0.276 (0.939)	Data Time 0.001 (0.455)	Loss 2.9309 (2.7280)	Entropy 0.63436 (0.63603)	Top-1 acc 53.906 (58.237)	Top-5 acc 75.781 (79.978)	lr 0.01479
Train [53][3080/3239]	Time 0.234 (0.942)	Data Time 0.001 (0.458)	Loss 2.6728 (2.7281)	Entropy 0.63416 (0.63602)	Top-1 acc 55.469 (58.233)	Top-5 acc 81.641 (79.975)	lr 0.01479
Train [53][3090/3239]	Time 0.253 (0.945)	Data Time 0.001 (0.460)	Loss 3.0429 (2.7278)	Entropy 0.63425 (0.63601)	Top-1 acc 51.562 (58.237)	Top-5 acc 75.000 (79.979)	lr 0.01479
Train [53][3100/3239]	Time 0.394 (0.954)	Data Time 0.004 (0.459)	Loss 2.5823 (2.7277)	Entropy 0.63441 (0.63601)	Top-1 acc 58.594 (58.240)	Top-5 acc 84.766 (79.982)	lr 0.01479
Train [53][3110/3239]	Time 0.260 (0.953)	Data Time 0.002 (0.458)	Loss 2.7464 (2.7278)	Entropy 0.63437 (0.63600)	Top-1 acc 57.812 (58.239)	Top-5 acc 78.125 (79.979)	lr 0.01479
Train [53][3120/3239]	Time 0.232 (0.951)	Data Time 0.002 (0.456)	Loss 2.6731 (2.7276)	Entropy 0.63447 (0.63600)	Top-1 acc 60.547 (58.244)	Top-5 acc 80.859 (79.981)	lr 0.01479
Train [53][3130/3239]	Time 0.369 (0.950)	Data Time 0.001 (0.455)	Loss 2.6059 (2.7275)	Entropy 0.63444 (0.63599)	Top-1 acc 61.328 (58.248)	Top-5 acc 81.641 (79.985)	lr 0.01479
Train [53][3140/3239]	Time 2.455 (0.950)	Data Time 2.194 (0.456)	Loss 2.4866 (2.7277)	Entropy 0.63451 (0.63599)	Top-1 acc 60.938 (58.243)	Top-5 acc 84.375 (79.981)	lr 0.01479
Train [53][3150/3239]	Time 0.246 (0.952)	Data Time 0.001 (0.458)	Loss 2.5217 (2.7276)	Entropy 0.63459 (0.63598)	Top-1 acc 61.719 (58.245)	Top-5 acc 83.984 (79.980)	lr 0.01479
Train [53][3160/3239]	Time 0.248 (0.951)	Data Time 0.001 (0.456)	Loss 2.6802 (2.7275)	Entropy 0.63429 (0.63598)	Top-1 acc 60.156 (58.246)	Top-5 acc 79.297 (79.982)	lr 0.01479
Train [53][3170/3239]	Time 0.281 (0.950)	Data Time 0.002 (0.456)	Loss 2.7342 (2.7274)	Entropy 0.63394 (0.63597)	Top-1 acc 53.906 (58.248)	Top-5 acc 81.250 (79.984)	lr 0.01478
Train [53][3180/3239]	Time 0.245 (0.954)	Data Time 0.000 (0.460)	Loss 2.6705 (2.7273)	Entropy 0.63387 (0.63597)	Top-1 acc 58.594 (58.249)	Top-5 acc 81.641 (79.988)	lr 0.01478
Train [53][3190/3239]	Time 0.257 (0.953)	Data Time 0.000 (0.459)	Loss 2.7932 (2.7271)	Entropy 0.63366 (0.63596)	Top-1 acc 59.375 (58.253)	Top-5 acc 80.078 (79.992)	lr 0.01478
Train [53][3200/3239]	Time 0.350 (0.952)	Data Time 0.000 (0.458)	Loss 2.5186 (2.7270)	Entropy 0.63372 (0.63595)	Top-1 acc 62.891 (58.257)	Top-5 acc 83.203 (79.992)	lr 0.01478
Train [53][3210/3239]	Time 0.258 (0.958)	Data Time 0.000 (0.464)	Loss 2.9467 (2.7270)	Entropy 0.63330 (0.63595)	Top-1 acc 56.250 (58.258)	Top-5 acc 75.000 (79.995)	lr 0.01478
Train [53][3220/3239]	Time 0.245 (0.957)	Data Time 0.000 (0.463)	Loss 2.8807 (2.7271)	Entropy 0.63306 (0.63594)	Top-1 acc 54.688 (58.254)	Top-5 acc 76.562 (79.993)	lr 0.01478
Train [53][3230/3239]	Time 0.232 (0.955)	Data Time 0.000 (0.462)	Loss 2.7283 (2.7270)	Entropy 0.63314 (0.63593)	Top-1 acc 58.594 (58.254)	Top-5 acc 81.250 (79.995)	lr 0.01478
Train [53][3239/3239]	Time 0.982 (0.956)	Data Time 0.000 (0.463)	Loss 2.9983 (2.7271)	Entropy 0.63325 (0.63592)	Top-1 acc 50.617 (58.253)	Top-5 acc 77.778 (79.993)	lr 0.01478
==========Valid [53/120]	loss 1.471	top-1 acc 66.255 (66.255)	top-5 acc 86.427	Train top-1 58.253	top-5 79.993	Entropy 0.63325	Latency-None: 0.000ms	Flops: 538.40M
Train [54][0/3239]	Time 52.318 (52.318)	Data Time 51.357 (51.357)	Loss 2.8656 (2.8656)	Entropy 0.63320 (0.63320)	Top-1 acc 56.250 (56.250)	Top-5 acc 76.953 (76.953)	lr 0.01478
Train [54][10/3239]	Time 0.245 (5.255)	Data Time 0.002 (4.671)	Loss 3.0769 (2.7223)	Entropy 0.63337 (0.63325)	Top-1 acc 51.562 (57.457)	Top-5 acc 73.047 (79.688)	lr 0.01478
Train [54][20/3239]	Time 0.231 (2.954)	Data Time 0.001 (2.447)	Loss 2.7181 (2.7432)	Entropy 0.63327 (0.63331)	Top-1 acc 58.203 (57.850)	Top-5 acc 81.250 (79.315)	lr 0.01478
Train [54][30/3239]	Time 0.402 (2.141)	Data Time 0.001 (1.658)	Loss 2.8142 (2.7410)	Entropy 0.63317 (0.63327)	Top-1 acc 55.859 (57.964)	Top-5 acc 77.734 (79.473)	lr 0.01477
Train [54][40/3239]	Time 0.251 (1.867)	Data Time 0.001 (1.388)	Loss 2.8664 (2.7232)	Entropy 0.63309 (0.63325)	Top-1 acc 56.250 (58.260)	Top-5 acc 79.297 (80.145)	lr 0.01477
Train [54][50/3239]	Time 0.256 (1.587)	Data Time 0.001 (1.116)	Loss 2.6803 (2.7213)	Entropy 0.63315 (0.63321)	Top-1 acc 59.375 (58.257)	Top-5 acc 80.078 (80.086)	lr 0.01477
Train [54][60/3239]	Time 0.243 (1.402)	Data Time 0.001 (0.934)	Loss 2.6472 (2.7154)	Entropy 0.63302 (0.63320)	Top-1 acc 61.719 (58.440)	Top-5 acc 83.203 (80.219)	lr 0.01477
Train [54][70/3239]	Time 0.244 (1.382)	Data Time 0.001 (0.917)	Loss 2.6515 (2.7105)	Entropy 0.63300 (0.63317)	Top-1 acc 60.156 (58.429)	Top-5 acc 80.078 (80.403)	lr 0.01477
Train [54][80/3239]	Time 0.245 (1.267)	Data Time 0.001 (0.804)	Loss 2.6407 (2.7113)	Entropy 0.63272 (0.63315)	Top-1 acc 58.984 (58.280)	Top-5 acc 83.984 (80.445)	lr 0.01477
Train [54][90/3239]	Time 0.229 (1.176)	Data Time 0.001 (0.716)	Loss 2.8677 (2.7103)	Entropy 0.63258 (0.63309)	Top-1 acc 56.250 (58.285)	Top-5 acc 76.172 (80.473)	lr 0.01477
Train [54][100/3239]	Time 0.234 (1.162)	Data Time 0.001 (0.701)	Loss 2.8071 (2.7115)	Entropy 0.63275 (0.63305)	Top-1 acc 55.859 (58.222)	Top-5 acc 77.344 (80.364)	lr 0.01477
Train [54][110/3239]	Time 0.251 (1.124)	Data Time 0.002 (0.665)	Loss 2.7408 (2.7163)	Entropy 0.63281 (0.63302)	Top-1 acc 59.766 (58.164)	Top-5 acc 77.734 (80.282)	lr 0.01477
Train [54][120/3239]	Time 0.302 (1.067)	Data Time 0.001 (0.610)	Loss 2.7344 (2.7184)	Entropy 0.63300 (0.63301)	Top-1 acc 57.812 (58.171)	Top-5 acc 78.125 (80.198)	lr 0.01477
Train [54][130/3239]	Time 0.582 (1.032)	Data Time 0.335 (0.576)	Loss 2.7936 (2.7144)	Entropy 0.63292 (0.63301)	Top-1 acc 56.250 (58.242)	Top-5 acc 80.078 (80.305)	lr 0.01477
Train [54][140/3239]	Time 0.254 (1.025)	Data Time 0.001 (0.570)	Loss 2.6510 (2.7169)	Entropy 0.63303 (0.63300)	Top-1 acc 58.984 (58.181)	Top-5 acc 80.859 (80.233)	lr 0.01476
Train [54][150/3239]	Time 0.239 (0.985)	Data Time 0.001 (0.532)	Loss 2.6297 (2.7149)	Entropy 0.63275 (0.63300)	Top-1 acc 57.031 (58.291)	Top-5 acc 82.812 (80.241)	lr 0.01476
Train [54][160/3239]	Time 4.496 (0.976)	Data Time 4.170 (0.525)	Loss 2.5495 (2.7099)	Entropy 0.63275 (0.63299)	Top-1 acc 65.625 (58.421)	Top-5 acc 82.812 (80.294)	lr 0.01476
Train [54][170/3239]	Time 0.237 (0.966)	Data Time 0.001 (0.514)	Loss 2.7298 (2.7105)	Entropy 0.63266 (0.63296)	Top-1 acc 57.812 (58.400)	Top-5 acc 81.250 (80.300)	lr 0.01476
Train [54][180/3239]	Time 0.256 (0.938)	Data Time 0.001 (0.486)	Loss 2.7228 (2.7126)	Entropy 0.63273 (0.63295)	Top-1 acc 58.594 (58.302)	Top-5 acc 81.250 (80.275)	lr 0.01476
Train [54][190/3239]	Time 0.366 (0.912)	Data Time 0.001 (0.461)	Loss 2.5952 (2.7114)	Entropy 0.63267 (0.63294)	Top-1 acc 62.109 (58.326)	Top-5 acc 81.641 (80.297)	lr 0.01476
Train [54][200/3239]	Time 0.257 (0.940)	Data Time 0.001 (0.489)	Loss 2.6842 (2.7148)	Entropy 0.63311 (0.63293)	Top-1 acc 59.375 (58.263)	Top-5 acc 78.906 (80.202)	lr 0.01476
Train [54][210/3239]	Time 0.240 (0.917)	Data Time 0.001 (0.466)	Loss 2.6757 (2.7143)	Entropy 0.63336 (0.63294)	Top-1 acc 59.766 (58.283)	Top-5 acc 82.422 (80.213)	lr 0.01476
Train [54][220/3239]	Time 0.249 (0.895)	Data Time 0.001 (0.445)	Loss 2.6312 (2.7141)	Entropy 0.63339 (0.63296)	Top-1 acc 57.422 (58.323)	Top-5 acc 82.812 (80.232)	lr 0.01476
Train [54][230/3239]	Time 0.224 (0.908)	Data Time 0.001 (0.458)	Loss 2.6526 (2.7140)	Entropy 0.63324 (0.63298)	Top-1 acc 61.719 (58.335)	Top-5 acc 83.984 (80.225)	lr 0.01476
Train [54][240/3239]	Time 0.224 (0.889)	Data Time 0.001 (0.439)	Loss 2.5919 (2.7129)	Entropy 0.63351 (0.63300)	Top-1 acc 62.500 (58.415)	Top-5 acc 82.812 (80.226)	lr 0.01475
Train [54][250/3239]	Time 0.249 (0.870)	Data Time 0.001 (0.422)	Loss 2.7884 (2.7124)	Entropy 0.63336 (0.63301)	Top-1 acc 57.031 (58.421)	Top-5 acc 80.078 (80.248)	lr 0.01475
Train [54][260/3239]	Time 0.377 (0.891)	Data Time 0.002 (0.443)	Loss 2.9669 (2.7150)	Entropy 0.63323 (0.63302)	Top-1 acc 56.250 (58.366)	Top-5 acc 74.609 (80.180)	lr 0.01475
Train [54][270/3239]	Time 0.254 (0.874)	Data Time 0.001 (0.427)	Loss 2.8794 (2.7161)	Entropy 0.63333 (0.63303)	Top-1 acc 56.641 (58.354)	Top-5 acc 76.562 (80.156)	lr 0.01475
Train [54][280/3239]	Time 0.236 (0.858)	Data Time 0.001 (0.411)	Loss 2.8090 (2.7171)	Entropy 0.63329 (0.63304)	Top-1 acc 56.250 (58.359)	Top-5 acc 77.734 (80.159)	lr 0.01475
Train [54][290/3239]	Time 5.630 (0.870)	Data Time 5.339 (0.423)	Loss 2.5208 (2.7167)	Entropy 0.63387 (0.63306)	Top-1 acc 62.500 (58.351)	Top-5 acc 84.375 (80.147)	lr 0.01475
Train [54][300/3239]	Time 0.234 (0.864)	Data Time 0.002 (0.419)	Loss 2.8404 (2.7169)	Entropy 0.63370 (0.63309)	Top-1 acc 56.641 (58.389)	Top-5 acc 79.297 (80.151)	lr 0.01475
Train [54][310/3239]	Time 0.235 (0.850)	Data Time 0.001 (0.405)	Loss 2.7902 (2.7181)	Entropy 0.63334 (0.63310)	Top-1 acc 57.812 (58.385)	Top-5 acc 80.078 (80.115)	lr 0.01475
Train [54][320/3239]	Time 0.256 (0.837)	Data Time 0.001 (0.393)	Loss 2.8033 (2.7191)	Entropy 0.63374 (0.63311)	Top-1 acc 54.688 (58.348)	Top-5 acc 80.078 (80.121)	lr 0.01475
Train [54][330/3239]	Time 0.238 (0.850)	Data Time 0.002 (0.406)	Loss 2.7005 (2.7171)	Entropy 0.63371 (0.63313)	Top-1 acc 57.031 (58.365)	Top-5 acc 81.641 (80.161)	lr 0.01475
Train [54][340/3239]	Time 0.252 (0.839)	Data Time 0.001 (0.394)	Loss 2.6863 (2.7145)	Entropy 0.63364 (0.63314)	Top-1 acc 58.594 (58.439)	Top-5 acc 79.688 (80.184)	lr 0.01474
Train [54][350/3239]	Time 0.357 (0.827)	Data Time 0.001 (0.383)	Loss 3.0176 (2.7148)	Entropy 0.63335 (0.63315)	Top-1 acc 51.172 (58.415)	Top-5 acc 73.828 (80.169)	lr 0.01474
Train [54][360/3239]	Time 0.256 (0.831)	Data Time 0.002 (0.386)	Loss 2.7864 (2.7149)	Entropy 0.63333 (0.63316)	Top-1 acc 58.594 (58.410)	Top-5 acc 80.078 (80.186)	lr 0.01474
Train [54][370/3239]	Time 0.247 (0.822)	Data Time 0.001 (0.377)	Loss 2.6947 (2.7151)	Entropy 0.63342 (0.63316)	Top-1 acc 61.328 (58.435)	Top-5 acc 79.297 (80.194)	lr 0.01474
Train [54][380/3239]	Time 0.342 (0.812)	Data Time 0.002 (0.367)	Loss 2.7043 (2.7150)	Entropy 0.63337 (0.63317)	Top-1 acc 59.375 (58.410)	Top-5 acc 78.906 (80.179)	lr 0.01474
Train [54][390/3239]	Time 0.243 (0.816)	Data Time 0.001 (0.371)	Loss 2.7939 (2.7151)	Entropy 0.63363 (0.63317)	Top-1 acc 56.250 (58.426)	Top-5 acc 78.906 (80.190)	lr 0.01474
Train [54][400/3239]	Time 0.229 (0.810)	Data Time 0.001 (0.366)	Loss 2.6880 (2.7155)	Entropy 0.63378 (0.63319)	Top-1 acc 58.594 (58.442)	Top-5 acc 80.078 (80.195)	lr 0.01474
Train [54][410/3239]	Time 0.288 (0.802)	Data Time 0.001 (0.357)	Loss 2.5638 (2.7154)	Entropy 0.63351 (0.63320)	Top-1 acc 61.328 (58.457)	Top-5 acc 80.859 (80.185)	lr 0.01474
Train [54][420/3239]	Time 2.712 (0.803)	Data Time 2.330 (0.357)	Loss 2.9676 (2.7157)	Entropy 0.63344 (0.63320)	Top-1 acc 51.953 (58.457)	Top-5 acc 76.172 (80.185)	lr 0.01474
Train [54][430/3239]	Time 0.248 (0.801)	Data Time 0.001 (0.355)	Loss 2.7381 (2.7163)	Entropy 0.63302 (0.63321)	Top-1 acc 56.250 (58.426)	Top-5 acc 80.469 (80.171)	lr 0.01474
Train [54][440/3239]	Time 0.257 (0.793)	Data Time 0.002 (0.347)	Loss 2.6404 (2.7169)	Entropy 0.63309 (0.63320)	Top-1 acc 57.812 (58.393)	Top-5 acc 80.859 (80.150)	lr 0.01473
Train [54][450/3239]	Time 0.238 (0.786)	Data Time 0.001 (0.340)	Loss 2.6436 (2.7164)	Entropy 0.63331 (0.63320)	Top-1 acc 62.109 (58.395)	Top-5 acc 82.031 (80.142)	lr 0.01473
Train [54][460/3239]	Time 0.250 (0.790)	Data Time 0.001 (0.345)	Loss 2.5254 (2.7169)	Entropy 0.63293 (0.63320)	Top-1 acc 63.672 (58.381)	Top-5 acc 84.766 (80.151)	lr 0.01473
Train [54][470/3239]	Time 0.226 (0.783)	Data Time 0.001 (0.337)	Loss 2.6917 (2.7170)	Entropy 0.63283 (0.63319)	Top-1 acc 60.938 (58.391)	Top-5 acc 78.906 (80.154)	lr 0.01473
Train [54][480/3239]	Time 0.281 (0.776)	Data Time 0.002 (0.330)	Loss 2.7215 (2.7172)	Entropy 0.63248 (0.63319)	Top-1 acc 56.250 (58.378)	Top-5 acc 80.078 (80.146)	lr 0.01473
Train [54][490/3239]	Time 0.443 (0.778)	Data Time 0.177 (0.332)	Loss 2.5233 (2.7170)	Entropy 0.63215 (0.63317)	Top-1 acc 62.109 (58.361)	Top-5 acc 83.594 (80.151)	lr 0.01473
Train [54][500/3239]	Time 0.246 (0.771)	Data Time 0.001 (0.326)	Loss 2.6077 (2.7170)	Entropy 0.63190 (0.63315)	Top-1 acc 60.938 (58.354)	Top-5 acc 81.250 (80.148)	lr 0.01473
Train [54][510/3239]	Time 0.275 (0.765)	Data Time 0.001 (0.319)	Loss 2.7290 (2.7163)	Entropy 0.63172 (0.63312)	Top-1 acc 58.594 (58.364)	Top-5 acc 77.734 (80.164)	lr 0.01473
Train [54][520/3239]	Time 0.233 (0.827)	Data Time 0.003 (0.313)	Loss 2.6781 (2.7160)	Entropy 0.63161 (0.63310)	Top-1 acc 60.547 (58.376)	Top-5 acc 80.078 (80.151)	lr 0.01473
Train [54][530/3239]	Time 0.238 (0.819)	Data Time 0.001 (0.307)	Loss 2.5391 (2.7158)	Entropy 0.63196 (0.63307)	Top-1 acc 63.672 (58.372)	Top-5 acc 84.375 (80.153)	lr 0.01473
Train [54][540/3239]	Time 0.225 (0.812)	Data Time 0.001 (0.302)	Loss 2.6304 (2.7155)	Entropy 0.63218 (0.63305)	Top-1 acc 64.062 (58.394)	Top-5 acc 83.984 (80.162)	lr 0.01472
Train [54][550/3239]	Time 0.240 (0.805)	Data Time 0.001 (0.296)	Loss 2.7226 (2.7151)	Entropy 0.63249 (0.63304)	Top-1 acc 62.500 (58.431)	Top-5 acc 82.812 (80.180)	lr 0.01472
Train [54][560/3239]	Time 0.280 (0.799)	Data Time 0.001 (0.291)	Loss 2.8371 (2.7153)	Entropy 0.63192 (0.63303)	Top-1 acc 58.203 (58.430)	Top-5 acc 77.734 (80.172)	lr 0.01472
Train [54][570/3239]	Time 0.282 (0.793)	Data Time 0.001 (0.286)	Loss 2.7459 (2.7161)	Entropy 0.63219 (0.63301)	Top-1 acc 56.641 (58.408)	Top-5 acc 80.469 (80.159)	lr 0.01472
Train [54][580/3239]	Time 0.435 (0.788)	Data Time 0.003 (0.281)	Loss 2.9175 (2.7153)	Entropy 0.63178 (0.63299)	Top-1 acc 53.516 (58.430)	Top-5 acc 76.172 (80.174)	lr 0.01472
Train [54][590/3239]	Time 0.248 (0.782)	Data Time 0.001 (0.276)	Loss 2.6424 (2.7150)	Entropy 0.63204 (0.63297)	Top-1 acc 62.500 (58.453)	Top-5 acc 78.516 (80.166)	lr 0.01472
Train [54][600/3239]	Time 0.300 (0.776)	Data Time 0.001 (0.272)	Loss 2.6792 (2.7160)	Entropy 0.63204 (0.63296)	Top-1 acc 57.812 (58.435)	Top-5 acc 80.859 (80.146)	lr 0.01472
Train [54][610/3239]	Time 0.242 (0.771)	Data Time 0.001 (0.267)	Loss 2.8489 (2.7167)	Entropy 0.63233 (0.63295)	Top-1 acc 54.688 (58.425)	Top-5 acc 76.562 (80.134)	lr 0.01472
Train [54][620/3239]	Time 0.332 (0.765)	Data Time 0.001 (0.263)	Loss 2.6429 (2.7166)	Entropy 0.63256 (0.63294)	Top-1 acc 59.375 (58.426)	Top-5 acc 80.859 (80.133)	lr 0.01472
Train [54][630/3239]	Time 0.255 (0.760)	Data Time 0.001 (0.259)	Loss 2.5627 (2.7158)	Entropy 0.63286 (0.63293)	Top-1 acc 60.156 (58.448)	Top-5 acc 82.031 (80.149)	lr 0.01472
Train [54][640/3239]	Time 0.329 (0.758)	Data Time 0.002 (0.257)	Loss 2.8912 (2.7163)	Entropy 0.63301 (0.63293)	Top-1 acc 52.734 (58.443)	Top-5 acc 78.125 (80.148)	lr 0.01471
Train [54][650/3239]	Time 0.271 (0.753)	Data Time 0.001 (0.253)	Loss 2.7217 (2.7164)	Entropy 0.63337 (0.63293)	Top-1 acc 58.594 (58.447)	Top-5 acc 80.859 (80.148)	lr 0.01471
Train [54][660/3239]	Time 0.287 (0.755)	Data Time 0.001 (0.256)	Loss 2.7413 (2.7169)	Entropy 0.63336 (0.63294)	Top-1 acc 57.422 (58.417)	Top-5 acc 77.734 (80.136)	lr 0.01471
Train [54][670/3239]	Time 0.393 (0.752)	Data Time 0.002 (0.254)	Loss 2.3938 (2.7159)	Entropy 0.63343 (0.63295)	Top-1 acc 67.188 (58.444)	Top-5 acc 87.109 (80.157)	lr 0.01471
Train [54][680/3239]	Time 0.236 (0.749)	Data Time 0.001 (0.251)	Loss 2.4064 (2.7155)	Entropy 0.63297 (0.63295)	Top-1 acc 67.969 (58.435)	Top-5 acc 85.938 (80.170)	lr 0.01471
Train [54][690/3239]	Time 0.255 (0.747)	Data Time 0.002 (0.250)	Loss 2.7811 (2.7158)	Entropy 0.63312 (0.63295)	Top-1 acc 53.906 (58.430)	Top-5 acc 80.859 (80.171)	lr 0.01471
Train [54][700/3239]	Time 0.243 (0.752)	Data Time 0.002 (0.256)	Loss 2.6492 (2.7149)	Entropy 0.63285 (0.63295)	Top-1 acc 58.984 (58.460)	Top-5 acc 80.859 (80.177)	lr 0.01471
Train [54][710/3239]	Time 0.244 (0.748)	Data Time 0.001 (0.252)	Loss 2.6616 (2.7148)	Entropy 0.63293 (0.63295)	Top-1 acc 58.203 (58.467)	Top-5 acc 82.031 (80.180)	lr 0.01471
Train [54][720/3239]	Time 0.250 (0.744)	Data Time 0.001 (0.249)	Loss 2.7158 (2.7154)	Entropy 0.63306 (0.63295)	Top-1 acc 55.859 (58.451)	Top-5 acc 78.125 (80.166)	lr 0.01471
Train [54][730/3239]	Time 0.246 (0.747)	Data Time 0.001 (0.253)	Loss 2.8857 (2.7152)	Entropy 0.63295 (0.63295)	Top-1 acc 52.734 (58.457)	Top-5 acc 76.172 (80.165)	lr 0.01471
Train [54][740/3239]	Time 0.329 (0.743)	Data Time 0.001 (0.250)	Loss 2.6501 (2.7150)	Entropy 0.63286 (0.63295)	Top-1 acc 61.719 (58.454)	Top-5 acc 81.250 (80.180)	lr 0.01470
Train [54][750/3239]	Time 0.272 (0.739)	Data Time 0.001 (0.246)	Loss 2.5537 (2.7142)	Entropy 0.63270 (0.63295)	Top-1 acc 62.500 (58.473)	Top-5 acc 85.547 (80.209)	lr 0.01470
Train [54][760/3239]	Time 0.286 (0.741)	Data Time 0.002 (0.250)	Loss 2.9801 (2.7147)	Entropy 0.63280 (0.63295)	Top-1 acc 54.297 (58.462)	Top-5 acc 76.562 (80.203)	lr 0.01470
Train [54][770/3239]	Time 0.243 (0.740)	Data Time 0.001 (0.249)	Loss 2.6885 (2.7147)	Entropy 0.63287 (0.63295)	Top-1 acc 61.328 (58.459)	Top-5 acc 81.250 (80.202)	lr 0.01470
Train [54][780/3239]	Time 0.261 (0.736)	Data Time 0.001 (0.246)	Loss 2.9930 (2.7150)	Entropy 0.63279 (0.63294)	Top-1 acc 50.781 (58.448)	Top-5 acc 73.047 (80.201)	lr 0.01470
Train [54][790/3239]	Time 0.227 (0.735)	Data Time 0.001 (0.245)	Loss 2.6706 (2.7157)	Entropy 0.63242 (0.63294)	Top-1 acc 55.469 (58.425)	Top-5 acc 81.641 (80.186)	lr 0.01470
Train [54][800/3239]	Time 0.254 (0.741)	Data Time 0.002 (0.251)	Loss 2.7042 (2.7156)	Entropy 0.63259 (0.63293)	Top-1 acc 57.031 (58.436)	Top-5 acc 82.422 (80.192)	lr 0.01470
Train [54][810/3239]	Time 0.237 (0.737)	Data Time 0.001 (0.248)	Loss 2.8361 (2.7153)	Entropy 0.63240 (0.63293)	Top-1 acc 54.688 (58.441)	Top-5 acc 80.859 (80.211)	lr 0.01470
Train [54][820/3239]	Time 0.338 (0.734)	Data Time 0.098 (0.245)	Loss 2.7444 (2.7151)	Entropy 0.63223 (0.63292)	Top-1 acc 53.906 (58.449)	Top-5 acc 79.297 (80.218)	lr 0.01470
Train [54][830/3239]	Time 0.235 (0.738)	Data Time 0.001 (0.250)	Loss 2.6792 (2.7145)	Entropy 0.63231 (0.63291)	Top-1 acc 60.156 (58.462)	Top-5 acc 83.203 (80.225)	lr 0.01470
Train [54][840/3239]	Time 0.238 (0.735)	Data Time 0.001 (0.247)	Loss 2.6562 (2.7143)	Entropy 0.63231 (0.63291)	Top-1 acc 60.156 (58.451)	Top-5 acc 78.906 (80.229)	lr 0.01469
Train [54][850/3239]	Time 0.241 (0.731)	Data Time 0.001 (0.245)	Loss 2.6808 (2.7145)	Entropy 0.63245 (0.63290)	Top-1 acc 59.375 (58.429)	Top-5 acc 80.859 (80.225)	lr 0.01469
Train [54][860/3239]	Time 0.238 (0.741)	Data Time 0.001 (0.255)	Loss 2.7352 (2.7155)	Entropy 0.63213 (0.63289)	Top-1 acc 57.422 (58.404)	Top-5 acc 80.469 (80.192)	lr 0.01469
Train [54][870/3239]	Time 0.254 (0.737)	Data Time 0.001 (0.252)	Loss 2.7140 (2.7154)	Entropy 0.63199 (0.63288)	Top-1 acc 57.031 (58.404)	Top-5 acc 77.734 (80.185)	lr 0.01469
Train [54][880/3239]	Time 0.285 (0.734)	Data Time 0.002 (0.249)	Loss 2.7966 (2.7160)	Entropy 0.63201 (0.63287)	Top-1 acc 56.250 (58.392)	Top-5 acc 79.297 (80.170)	lr 0.01469
Train [54][890/3239]	Time 0.239 (0.734)	Data Time 0.001 (0.250)	Loss 2.7381 (2.7163)	Entropy 0.63174 (0.63286)	Top-1 acc 55.469 (58.375)	Top-5 acc 80.078 (80.160)	lr 0.01469
Train [54][900/3239]	Time 0.351 (0.737)	Data Time 0.001 (0.254)	Loss 2.5885 (2.7159)	Entropy 0.63193 (0.63285)	Top-1 acc 58.594 (58.380)	Top-5 acc 84.375 (80.167)	lr 0.01469
Train [54][910/3239]	Time 0.263 (0.734)	Data Time 0.001 (0.251)	Loss 2.6680 (2.7154)	Entropy 0.63195 (0.63284)	Top-1 acc 60.156 (58.407)	Top-5 acc 80.469 (80.177)	lr 0.01469
Train [54][920/3239]	Time 0.285 (0.732)	Data Time 0.001 (0.250)	Loss 2.7316 (2.7159)	Entropy 0.63172 (0.63283)	Top-1 acc 57.812 (58.390)	Top-5 acc 77.734 (80.168)	lr 0.01469
Train [54][930/3239]	Time 0.234 (0.739)	Data Time 0.001 (0.257)	Loss 2.7880 (2.7153)	Entropy 0.63164 (0.63282)	Top-1 acc 58.203 (58.405)	Top-5 acc 79.688 (80.182)	lr 0.01469
Train [54][940/3239]	Time 0.266 (0.736)	Data Time 0.003 (0.255)	Loss 2.9430 (2.7158)	Entropy 0.63131 (0.63280)	Top-1 acc 55.469 (58.396)	Top-5 acc 75.781 (80.178)	lr 0.01468
Train [54][950/3239]	Time 0.250 (0.733)	Data Time 0.001 (0.252)	Loss 2.6127 (2.7151)	Entropy 0.63131 (0.63279)	Top-1 acc 60.547 (58.408)	Top-5 acc 80.078 (80.191)	lr 0.01468
Train [54][960/3239]	Time 0.257 (0.742)	Data Time 0.001 (0.262)	Loss 2.5871 (2.7147)	Entropy 0.63154 (0.63277)	Top-1 acc 61.719 (58.427)	Top-5 acc 86.719 (80.195)	lr 0.01468
Train [54][970/3239]	Time 0.330 (0.739)	Data Time 0.001 (0.259)	Loss 2.5607 (2.7147)	Entropy 0.63161 (0.63276)	Top-1 acc 62.891 (58.428)	Top-5 acc 85.156 (80.194)	lr 0.01468
Train [54][980/3239]	Time 0.233 (0.736)	Data Time 0.001 (0.257)	Loss 2.6825 (2.7147)	Entropy 0.63182 (0.63275)	Top-1 acc 58.203 (58.428)	Top-5 acc 81.250 (80.192)	lr 0.01468
Train [54][990/3239]	Time 0.245 (0.741)	Data Time 0.001 (0.263)	Loss 2.5910 (2.7146)	Entropy 0.63200 (0.63274)	Top-1 acc 60.156 (58.433)	Top-5 acc 83.203 (80.200)	lr 0.01468
Train [54][1000/3239]	Time 0.241 (0.738)	Data Time 0.001 (0.260)	Loss 2.7304 (2.7147)	Entropy 0.63186 (0.63273)	Top-1 acc 57.031 (58.429)	Top-5 acc 78.516 (80.200)	lr 0.01468
Train [54][1010/3239]	Time 0.237 (0.736)	Data Time 0.001 (0.258)	Loss 2.5602 (2.7141)	Entropy 0.63188 (0.63272)	Top-1 acc 60.547 (58.442)	Top-5 acc 84.375 (80.218)	lr 0.01468
Train [54][1020/3239]	Time 0.220 (0.742)	Data Time 0.001 (0.265)	Loss 2.7963 (2.7146)	Entropy 0.63189 (0.63271)	Top-1 acc 55.469 (58.435)	Top-5 acc 78.125 (80.205)	lr 0.01468
Train [54][1030/3239]	Time 0.247 (0.739)	Data Time 0.001 (0.262)	Loss 2.6294 (2.7145)	Entropy 0.63195 (0.63271)	Top-1 acc 61.328 (58.449)	Top-5 acc 82.031 (80.201)	lr 0.01468
Train [54][1040/3239]	Time 1.259 (0.737)	Data Time 1.008 (0.261)	Loss 2.7176 (2.7143)	Entropy 0.63167 (0.63270)	Top-1 acc 59.375 (58.450)	Top-5 acc 78.516 (80.202)	lr 0.01467
Train [54][1050/3239]	Time 0.255 (0.736)	Data Time 0.001 (0.260)	Loss 2.5919 (2.7142)	Entropy 0.63181 (0.63269)	Top-1 acc 61.719 (58.455)	Top-5 acc 82.422 (80.204)	lr 0.01467
Train [54][1060/3239]	Time 0.350 (0.738)	Data Time 0.002 (0.263)	Loss 2.5268 (2.7144)	Entropy 0.63147 (0.63268)	Top-1 acc 64.844 (58.454)	Top-5 acc 83.594 (80.198)	lr 0.01467
Train [54][1070/3239]	Time 0.245 (0.736)	Data Time 0.001 (0.260)	Loss 2.8351 (2.7148)	Entropy 0.63172 (0.63267)	Top-1 acc 57.812 (58.451)	Top-5 acc 79.297 (80.192)	lr 0.01467
Train [54][1080/3239]	Time 0.285 (0.739)	Data Time 0.001 (0.265)	Loss 2.7745 (2.7146)	Entropy 0.63166 (0.63266)	Top-1 acc 57.812 (58.455)	Top-5 acc 79.688 (80.193)	lr 0.01467
Train [54][1090/3239]	Time 0.259 (0.741)	Data Time 0.001 (0.266)	Loss 2.4644 (2.7141)	Entropy 0.63186 (0.63265)	Top-1 acc 70.312 (58.470)	Top-5 acc 84.375 (80.204)	lr 0.01467
Train [54][1100/3239]	Time 0.261 (0.738)	Data Time 0.001 (0.264)	Loss 2.6126 (2.7137)	Entropy 0.63207 (0.63264)	Top-1 acc 60.156 (58.476)	Top-5 acc 82.812 (80.214)	lr 0.01467
Train [54][1110/3239]	Time 0.242 (0.739)	Data Time 0.001 (0.265)	Loss 2.8454 (2.7132)	Entropy 0.63213 (0.63264)	Top-1 acc 58.203 (58.499)	Top-5 acc 77.344 (80.218)	lr 0.01467
Train [54][1120/3239]	Time 0.227 (0.740)	Data Time 0.001 (0.266)	Loss 2.7739 (2.7134)	Entropy 0.63178 (0.63263)	Top-1 acc 59.375 (58.496)	Top-5 acc 76.562 (80.216)	lr 0.01467
Train [54][1130/3239]	Time 0.325 (0.737)	Data Time 0.001 (0.264)	Loss 2.8909 (2.7139)	Entropy 0.63183 (0.63263)	Top-1 acc 54.297 (58.491)	Top-5 acc 77.344 (80.206)	lr 0.01467
Train [54][1140/3239]	Time 0.249 (0.738)	Data Time 0.001 (0.266)	Loss 2.4919 (2.7137)	Entropy 0.63205 (0.63262)	Top-1 acc 62.891 (58.491)	Top-5 acc 83.203 (80.204)	lr 0.01466
Train [54][1150/3239]	Time 0.252 (0.743)	Data Time 0.001 (0.271)	Loss 2.5269 (2.7138)	Entropy 0.63202 (0.63262)	Top-1 acc 61.328 (58.477)	Top-5 acc 82.812 (80.195)	lr 0.01466
Train [54][1160/3239]	Time 0.239 (0.740)	Data Time 0.001 (0.269)	Loss 2.8049 (2.7142)	Entropy 0.63224 (0.63261)	Top-1 acc 54.297 (58.463)	Top-5 acc 79.297 (80.191)	lr 0.01466
Train [54][1170/3239]	Time 0.368 (0.771)	Data Time 0.004 (0.270)	Loss 2.6357 (2.7148)	Entropy 0.63246 (0.63261)	Top-1 acc 58.594 (58.445)	Top-5 acc 80.469 (80.177)	lr 0.01466
Train [54][1180/3239]	Time 0.224 (0.769)	Data Time 0.002 (0.268)	Loss 2.7240 (2.7144)	Entropy 0.63252 (0.63261)	Top-1 acc 55.078 (58.442)	Top-5 acc 78.125 (80.185)	lr 0.01466
Train [54][1190/3239]	Time 0.236 (0.766)	Data Time 0.001 (0.266)	Loss 2.7581 (2.7144)	Entropy 0.63231 (0.63261)	Top-1 acc 57.812 (58.441)	Top-5 acc 77.344 (80.190)	lr 0.01466
Train [54][1200/3239]	Time 0.245 (0.763)	Data Time 0.002 (0.264)	Loss 2.8961 (2.7147)	Entropy 0.63262 (0.63261)	Top-1 acc 54.688 (58.427)	Top-5 acc 78.906 (80.189)	lr 0.01466
Train [54][1210/3239]	Time 0.267 (0.760)	Data Time 0.001 (0.262)	Loss 2.6441 (2.7145)	Entropy 0.63283 (0.63261)	Top-1 acc 57.812 (58.426)	Top-5 acc 82.031 (80.195)	lr 0.01466
Train [54][1220/3239]	Time 0.382 (0.757)	Data Time 0.001 (0.259)	Loss 2.7629 (2.7146)	Entropy 0.63317 (0.63261)	Top-1 acc 58.984 (58.437)	Top-5 acc 79.688 (80.191)	lr 0.01466
Train [54][1230/3239]	Time 0.286 (0.755)	Data Time 0.002 (0.257)	Loss 2.9227 (2.7145)	Entropy 0.63310 (0.63262)	Top-1 acc 50.781 (58.442)	Top-5 acc 75.391 (80.201)	lr 0.01466
Train [54][1240/3239]	Time 0.232 (0.752)	Data Time 0.001 (0.255)	Loss 2.5957 (2.7143)	Entropy 0.63308 (0.63262)	Top-1 acc 62.891 (58.453)	Top-5 acc 83.984 (80.209)	lr 0.01465
Train [54][1250/3239]	Time 0.268 (0.750)	Data Time 0.001 (0.253)	Loss 2.7712 (2.7148)	Entropy 0.63316 (0.63262)	Top-1 acc 53.906 (58.439)	Top-5 acc 79.297 (80.196)	lr 0.01465
Train [54][1260/3239]	Time 0.243 (0.747)	Data Time 0.001 (0.251)	Loss 2.5245 (2.7149)	Entropy 0.63320 (0.63263)	Top-1 acc 62.891 (58.437)	Top-5 acc 82.812 (80.193)	lr 0.01465
Train [54][1270/3239]	Time 0.296 (0.751)	Data Time 0.001 (0.255)	Loss 2.6464 (2.7152)	Entropy 0.63279 (0.63263)	Top-1 acc 60.156 (58.435)	Top-5 acc 81.250 (80.184)	lr 0.01465
Train [54][1280/3239]	Time 0.269 (0.753)	Data Time 0.002 (0.258)	Loss 2.7709 (2.7151)	Entropy 0.63310 (0.63263)	Top-1 acc 58.984 (58.445)	Top-5 acc 80.469 (80.179)	lr 0.01465
Train [54][1290/3239]	Time 0.376 (0.751)	Data Time 0.001 (0.256)	Loss 2.7131 (2.7149)	Entropy 0.63283 (0.63264)	Top-1 acc 60.547 (58.447)	Top-5 acc 79.297 (80.176)	lr 0.01465
Train [54][1300/3239]	Time 9.030 (0.756)	Data Time 8.785 (0.262)	Loss 2.9276 (2.7154)	Entropy 0.63273 (0.63264)	Top-1 acc 55.078 (58.439)	Top-5 acc 78.906 (80.164)	lr 0.01465
Train [54][1310/3239]	Time 0.644 (0.754)	Data Time 0.390 (0.261)	Loss 2.8396 (2.7152)	Entropy 0.63266 (0.63264)	Top-1 acc 53.906 (58.445)	Top-5 acc 80.078 (80.175)	lr 0.01465
Train [54][1320/3239]	Time 0.237 (0.752)	Data Time 0.001 (0.259)	Loss 2.9620 (2.7153)	Entropy 0.63262 (0.63264)	Top-1 acc 53.906 (58.445)	Top-5 acc 79.688 (80.176)	lr 0.01465
Train [54][1330/3239]	Time 0.237 (0.750)	Data Time 0.001 (0.257)	Loss 2.6540 (2.7153)	Entropy 0.63288 (0.63264)	Top-1 acc 55.859 (58.439)	Top-5 acc 80.469 (80.178)	lr 0.01465
Train [54][1340/3239]	Time 0.270 (0.758)	Data Time 0.001 (0.265)	Loss 2.5307 (2.7150)	Entropy 0.63276 (0.63264)	Top-1 acc 64.062 (58.453)	Top-5 acc 83.984 (80.185)	lr 0.01464
Train [54][1350/3239]	Time 0.247 (0.757)	Data Time 0.001 (0.265)	Loss 2.8303 (2.7147)	Entropy 0.63292 (0.63264)	Top-1 acc 53.906 (58.451)	Top-5 acc 77.734 (80.187)	lr 0.01464
Train [54][1360/3239]	Time 0.257 (0.755)	Data Time 0.001 (0.263)	Loss 2.7067 (2.7150)	Entropy 0.63260 (0.63264)	Top-1 acc 60.156 (58.441)	Top-5 acc 80.078 (80.181)	lr 0.01464
Train [54][1370/3239]	Time 0.295 (0.760)	Data Time 0.002 (0.268)	Loss 2.6987 (2.7152)	Entropy 0.63283 (0.63264)	Top-1 acc 58.984 (58.437)	Top-5 acc 81.250 (80.182)	lr 0.01464
Train [54][1380/3239]	Time 0.289 (0.760)	Data Time 0.001 (0.269)	Loss 2.8089 (2.7153)	Entropy 0.63266 (0.63264)	Top-1 acc 56.250 (58.437)	Top-5 acc 79.688 (80.181)	lr 0.01464
Train [54][1390/3239]	Time 0.239 (0.758)	Data Time 0.001 (0.267)	Loss 2.8217 (2.7152)	Entropy 0.63276 (0.63264)	Top-1 acc 55.469 (58.444)	Top-5 acc 79.688 (80.176)	lr 0.01464
Train [54][1400/3239]	Time 0.241 (0.761)	Data Time 0.001 (0.271)	Loss 2.6767 (2.7151)	Entropy 0.63296 (0.63265)	Top-1 acc 58.594 (58.446)	Top-5 acc 79.297 (80.180)	lr 0.01464
Train [54][1410/3239]	Time 0.295 (0.764)	Data Time 0.001 (0.274)	Loss 2.7063 (2.7150)	Entropy 0.63311 (0.63265)	Top-1 acc 57.812 (58.462)	Top-5 acc 79.297 (80.184)	lr 0.01464
Train [54][1420/3239]	Time 0.250 (0.761)	Data Time 0.001 (0.272)	Loss 2.5409 (2.7152)	Entropy 0.63269 (0.63265)	Top-1 acc 62.109 (58.457)	Top-5 acc 82.422 (80.180)	lr 0.01464
Train [54][1430/3239]	Time 0.295 (0.764)	Data Time 0.001 (0.275)	Loss 2.6661 (2.7153)	Entropy 0.63275 (0.63265)	Top-1 acc 59.766 (58.459)	Top-5 acc 80.078 (80.177)	lr 0.01464
Train [54][1440/3239]	Time 0.261 (0.768)	Data Time 0.001 (0.280)	Loss 2.7683 (2.7152)	Entropy 0.63307 (0.63265)	Top-1 acc 56.250 (58.469)	Top-5 acc 78.125 (80.172)	lr 0.01463
Train [54][1450/3239]	Time 0.383 (0.766)	Data Time 0.001 (0.278)	Loss 2.7558 (2.7154)	Entropy 0.63346 (0.63265)	Top-1 acc 57.422 (58.462)	Top-5 acc 78.125 (80.166)	lr 0.01463
Train [54][1460/3239]	Time 6.724 (0.768)	Data Time 6.437 (0.280)	Loss 2.6984 (2.7152)	Entropy 0.63368 (0.63266)	Top-1 acc 56.641 (58.463)	Top-5 acc 80.078 (80.167)	lr 0.01463
Train [54][1470/3239]	Time 0.239 (0.770)	Data Time 0.001 (0.283)	Loss 2.8267 (2.7152)	Entropy 0.63350 (0.63267)	Top-1 acc 60.547 (58.463)	Top-5 acc 77.734 (80.166)	lr 0.01463
Train [54][1480/3239]	Time 0.269 (0.768)	Data Time 0.001 (0.281)	Loss 2.8712 (2.7153)	Entropy 0.63330 (0.63267)	Top-1 acc 56.641 (58.463)	Top-5 acc 78.516 (80.167)	lr 0.01463
Train [54][1490/3239]	Time 0.253 (0.766)	Data Time 0.001 (0.279)	Loss 2.7206 (2.7150)	Entropy 0.63350 (0.63268)	Top-1 acc 58.203 (58.472)	Top-5 acc 78.125 (80.172)	lr 0.01463
Train [54][1500/3239]	Time 6.487 (0.776)	Data Time 6.197 (0.289)	Loss 2.7197 (2.7150)	Entropy 0.63323 (0.63268)	Top-1 acc 57.031 (58.467)	Top-5 acc 79.688 (80.177)	lr 0.01463
Train [54][1510/3239]	Time 0.232 (0.773)	Data Time 0.001 (0.287)	Loss 2.7772 (2.7151)	Entropy 0.63294 (0.63269)	Top-1 acc 61.719 (58.461)	Top-5 acc 77.734 (80.170)	lr 0.01463
Train [54][1520/3239]	Time 0.331 (0.771)	Data Time 0.001 (0.285)	Loss 2.9275 (2.7155)	Entropy 0.63268 (0.63269)	Top-1 acc 57.422 (58.451)	Top-5 acc 76.953 (80.163)	lr 0.01463
Train [54][1530/3239]	Time 0.248 (0.776)	Data Time 0.001 (0.291)	Loss 2.6983 (2.7157)	Entropy 0.63263 (0.63269)	Top-1 acc 60.938 (58.447)	Top-5 acc 78.516 (80.152)	lr 0.01463
Train [54][1540/3239]	Time 0.228 (0.778)	Data Time 0.001 (0.293)	Loss 2.7003 (2.7155)	Entropy 0.63262 (0.63269)	Top-1 acc 55.859 (58.445)	Top-5 acc 78.516 (80.150)	lr 0.01462
Train [54][1550/3239]	Time 0.250 (0.775)	Data Time 0.001 (0.291)	Loss 2.5952 (2.7154)	Entropy 0.63251 (0.63268)	Top-1 acc 63.672 (58.454)	Top-5 acc 82.812 (80.153)	lr 0.01462
Train [54][1560/3239]	Time 0.287 (0.779)	Data Time 0.001 (0.296)	Loss 2.7513 (2.7152)	Entropy 0.63264 (0.63268)	Top-1 acc 58.594 (58.461)	Top-5 acc 82.031 (80.155)	lr 0.01462
Train [54][1570/3239]	Time 0.238 (0.781)	Data Time 0.001 (0.297)	Loss 2.6241 (2.7150)	Entropy 0.63292 (0.63268)	Top-1 acc 60.547 (58.460)	Top-5 acc 83.984 (80.160)	lr 0.01462
Train [54][1580/3239]	Time 0.233 (0.778)	Data Time 0.001 (0.295)	Loss 2.7614 (2.7153)	Entropy 0.63313 (0.63269)	Top-1 acc 53.906 (58.453)	Top-5 acc 80.469 (80.154)	lr 0.01462
Train [54][1590/3239]	Time 0.245 (0.783)	Data Time 0.001 (0.301)	Loss 2.5888 (2.7157)	Entropy 0.63336 (0.63269)	Top-1 acc 62.500 (58.446)	Top-5 acc 83.594 (80.145)	lr 0.01462
Train [54][1600/3239]	Time 0.271 (0.787)	Data Time 0.002 (0.304)	Loss 2.7527 (2.7157)	Entropy 0.63333 (0.63269)	Top-1 acc 58.203 (58.447)	Top-5 acc 80.469 (80.145)	lr 0.01462
Train [54][1610/3239]	Time 0.340 (0.784)	Data Time 0.001 (0.303)	Loss 2.7941 (2.7156)	Entropy 0.63276 (0.63270)	Top-1 acc 54.688 (58.444)	Top-5 acc 77.344 (80.146)	lr 0.01462
Train [54][1620/3239]	Time 8.572 (0.787)	Data Time 8.325 (0.306)	Loss 2.7679 (2.7156)	Entropy 0.63299 (0.63270)	Top-1 acc 59.375 (58.443)	Top-5 acc 78.516 (80.146)	lr 0.01462
Train [54][1630/3239]	Time 0.246 (0.791)	Data Time 0.002 (0.310)	Loss 2.8321 (2.7160)	Entropy 0.63333 (0.63270)	Top-1 acc 56.641 (58.427)	Top-5 acc 77.344 (80.138)	lr 0.01462
Train [54][1640/3239]	Time 0.236 (0.789)	Data Time 0.002 (0.308)	Loss 2.6609 (2.7159)	Entropy 0.63344 (0.63270)	Top-1 acc 58.203 (58.424)	Top-5 acc 79.297 (80.142)	lr 0.01461
Train [54][1650/3239]	Time 0.247 (0.787)	Data Time 0.001 (0.306)	Loss 2.7540 (2.7159)	Entropy 0.63348 (0.63271)	Top-1 acc 56.250 (58.425)	Top-5 acc 80.859 (80.140)	lr 0.01461
Train [54][1660/3239]	Time 8.972 (0.797)	Data Time 8.708 (0.317)	Loss 2.7135 (2.7157)	Entropy 0.63329 (0.63271)	Top-1 acc 61.328 (58.428)	Top-5 acc 82.031 (80.143)	lr 0.01461
Train [54][1670/3239]	Time 0.233 (0.795)	Data Time 0.001 (0.315)	Loss 2.7234 (2.7162)	Entropy 0.63336 (0.63272)	Top-1 acc 58.594 (58.416)	Top-5 acc 80.078 (80.134)	lr 0.01461
Train [54][1680/3239]	Time 0.383 (0.792)	Data Time 0.001 (0.313)	Loss 2.5264 (2.7161)	Entropy 0.63321 (0.63272)	Top-1 acc 61.328 (58.419)	Top-5 acc 84.375 (80.137)	lr 0.01461
Train [54][1690/3239]	Time 0.271 (0.797)	Data Time 0.002 (0.318)	Loss 2.7137 (2.7160)	Entropy 0.63311 (0.63272)	Top-1 acc 62.500 (58.427)	Top-5 acc 82.031 (80.140)	lr 0.01461
Train [54][1700/3239]	Time 0.245 (0.799)	Data Time 0.001 (0.321)	Loss 2.4885 (2.7161)	Entropy 0.63306 (0.63272)	Top-1 acc 64.844 (58.422)	Top-5 acc 84.375 (80.140)	lr 0.01461
Train [54][1710/3239]	Time 0.252 (0.797)	Data Time 0.001 (0.319)	Loss 2.5543 (2.7160)	Entropy 0.63314 (0.63273)	Top-1 acc 60.156 (58.425)	Top-5 acc 80.859 (80.139)	lr 0.01461
Train [54][1720/3239]	Time 0.240 (0.801)	Data Time 0.001 (0.323)	Loss 2.7065 (2.7159)	Entropy 0.63287 (0.63273)	Top-1 acc 57.422 (58.429)	Top-5 acc 80.078 (80.141)	lr 0.01461
Train [54][1730/3239]	Time 0.232 (0.807)	Data Time 0.001 (0.329)	Loss 2.4977 (2.7158)	Entropy 0.63291 (0.63273)	Top-1 acc 64.453 (58.426)	Top-5 acc 83.594 (80.137)	lr 0.01461
Train [54][1740/3239]	Time 0.236 (0.805)	Data Time 0.001 (0.328)	Loss 2.6088 (2.7160)	Entropy 0.63265 (0.63273)	Top-1 acc 57.031 (58.418)	Top-5 acc 82.812 (80.137)	lr 0.01460
Train [54][1750/3239]	Time 0.234 (0.808)	Data Time 0.001 (0.332)	Loss 2.6039 (2.7159)	Entropy 0.63283 (0.63273)	Top-1 acc 61.328 (58.418)	Top-5 acc 82.031 (80.138)	lr 0.01460
Train [54][1760/3239]	Time 0.233 (0.814)	Data Time 0.001 (0.338)	Loss 2.7674 (2.7158)	Entropy 0.63267 (0.63273)	Top-1 acc 58.984 (58.422)	Top-5 acc 79.688 (80.138)	lr 0.01460
Train [54][1770/3239]	Time 0.355 (0.812)	Data Time 0.001 (0.336)	Loss 2.8288 (2.7161)	Entropy 0.63272 (0.63273)	Top-1 acc 54.297 (58.417)	Top-5 acc 77.734 (80.139)	lr 0.01460
Train [54][1780/3239]	Time 3.371 (0.811)	Data Time 3.109 (0.336)	Loss 2.4735 (2.7161)	Entropy 0.63276 (0.63273)	Top-1 acc 65.234 (58.416)	Top-5 acc 85.547 (80.139)	lr 0.01460
Train [54][1790/3239]	Time 0.227 (0.818)	Data Time 0.001 (0.343)	Loss 2.7956 (2.7161)	Entropy 0.63305 (0.63273)	Top-1 acc 61.719 (58.418)	Top-5 acc 78.906 (80.136)	lr 0.01460
Train [54][1800/3239]	Time 0.231 (0.816)	Data Time 0.001 (0.341)	Loss 2.6136 (2.7160)	Entropy 0.63324 (0.63273)	Top-1 acc 59.375 (58.417)	Top-5 acc 80.078 (80.136)	lr 0.01460
Train [54][1810/3239]	Time 0.265 (0.814)	Data Time 0.002 (0.339)	Loss 2.6173 (2.7161)	Entropy 0.63330 (0.63274)	Top-1 acc 62.891 (58.420)	Top-5 acc 83.594 (80.134)	lr 0.01460
Train [54][1820/3239]	Time 17.849 (0.822)	Data Time 17.587 (0.347)	Loss 2.6137 (2.7155)	Entropy 0.63338 (0.63274)	Top-1 acc 57.422 (58.434)	Top-5 acc 82.422 (80.142)	lr 0.01460
Train [54][1830/3239]	Time 0.328 (0.839)	Data Time 0.003 (0.345)	Loss 2.6231 (2.7154)	Entropy 0.63299 (0.63274)	Top-1 acc 62.500 (58.442)	Top-5 acc 81.641 (80.148)	lr 0.01460
Train [54][1840/3239]	Time 0.351 (0.836)	Data Time 0.002 (0.343)	Loss 2.7400 (2.7153)	Entropy 0.63282 (0.63274)	Top-1 acc 55.469 (58.446)	Top-5 acc 81.250 (80.149)	lr 0.01459
Train [54][1850/3239]	Time 0.248 (0.834)	Data Time 0.001 (0.341)	Loss 2.7347 (2.7154)	Entropy 0.63298 (0.63274)	Top-1 acc 58.594 (58.446)	Top-5 acc 78.125 (80.144)	lr 0.01459
Train [54][1860/3239]	Time 0.248 (0.832)	Data Time 0.001 (0.340)	Loss 2.8434 (2.7158)	Entropy 0.63306 (0.63274)	Top-1 acc 52.734 (58.433)	Top-5 acc 77.734 (80.140)	lr 0.01459
Train [54][1870/3239]	Time 0.242 (0.830)	Data Time 0.001 (0.338)	Loss 2.6437 (2.7161)	Entropy 0.63268 (0.63274)	Top-1 acc 60.938 (58.426)	Top-5 acc 79.297 (80.136)	lr 0.01459
Train [54][1880/3239]	Time 0.263 (0.828)	Data Time 0.002 (0.336)	Loss 2.7368 (2.7156)	Entropy 0.63239 (0.63274)	Top-1 acc 57.422 (58.437)	Top-5 acc 78.906 (80.146)	lr 0.01459
Train [54][1890/3239]	Time 0.452 (0.826)	Data Time 0.217 (0.334)	Loss 2.5657 (2.7155)	Entropy 0.63232 (0.63274)	Top-1 acc 60.938 (58.439)	Top-5 acc 86.328 (80.147)	lr 0.01459
Train [54][1900/3239]	Time 0.249 (0.827)	Data Time 0.001 (0.336)	Loss 2.7334 (2.7156)	Entropy 0.63229 (0.63274)	Top-1 acc 57.812 (58.438)	Top-5 acc 81.641 (80.146)	lr 0.01459
Train [54][1910/3239]	Time 0.263 (0.825)	Data Time 0.002 (0.334)	Loss 2.6732 (2.7159)	Entropy 0.63210 (0.63274)	Top-1 acc 60.938 (58.435)	Top-5 acc 78.906 (80.138)	lr 0.01459
Train [54][1920/3239]	Time 0.250 (0.823)	Data Time 0.001 (0.332)	Loss 2.9951 (2.7164)	Entropy 0.63181 (0.63273)	Top-1 acc 51.172 (58.419)	Top-5 acc 73.438 (80.130)	lr 0.01459
Train [54][1930/3239]	Time 0.375 (0.829)	Data Time 0.001 (0.338)	Loss 2.6877 (2.7165)	Entropy 0.63199 (0.63273)	Top-1 acc 60.547 (58.417)	Top-5 acc 81.641 (80.131)	lr 0.01459
Train [54][1940/3239]	Time 0.249 (0.828)	Data Time 0.001 (0.338)	Loss 2.4891 (2.7165)	Entropy 0.63219 (0.63273)	Top-1 acc 69.531 (58.413)	Top-5 acc 82.812 (80.131)	lr 0.01459
Train [54][1950/3239]	Time 0.237 (0.826)	Data Time 0.001 (0.336)	Loss 2.6666 (2.7163)	Entropy 0.63176 (0.63272)	Top-1 acc 59.375 (58.416)	Top-5 acc 80.078 (80.134)	lr 0.01458
Train [54][1960/3239]	Time 0.237 (0.833)	Data Time 0.001 (0.344)	Loss 2.7399 (2.7162)	Entropy 0.63158 (0.63272)	Top-1 acc 57.422 (58.424)	Top-5 acc 78.516 (80.135)	lr 0.01458
Train [54][1970/3239]	Time 0.253 (0.831)	Data Time 0.001 (0.342)	Loss 2.7290 (2.7160)	Entropy 0.63164 (0.63271)	Top-1 acc 57.422 (58.432)	Top-5 acc 78.125 (80.136)	lr 0.01458
Train [54][1980/3239]	Time 0.249 (0.829)	Data Time 0.001 (0.340)	Loss 2.5243 (2.7162)	Entropy 0.63178 (0.63271)	Top-1 acc 61.719 (58.429)	Top-5 acc 84.766 (80.135)	lr 0.01458
Train [54][1990/3239]	Time 0.240 (0.836)	Data Time 0.001 (0.347)	Loss 2.9210 (2.7163)	Entropy 0.63189 (0.63270)	Top-1 acc 57.812 (58.429)	Top-5 acc 73.828 (80.128)	lr 0.01458
Train [54][2000/3239]	Time 0.339 (0.834)	Data Time 0.001 (0.346)	Loss 2.5006 (2.7161)	Entropy 0.63183 (0.63270)	Top-1 acc 64.844 (58.429)	Top-5 acc 82.422 (80.129)	lr 0.01458
Train [54][2010/3239]	Time 0.260 (0.833)	Data Time 0.001 (0.344)	Loss 2.8150 (2.7160)	Entropy 0.63170 (0.63269)	Top-1 acc 54.688 (58.433)	Top-5 acc 81.250 (80.133)	lr 0.01458
Train [54][2020/3239]	Time 0.320 (0.836)	Data Time 0.002 (0.348)	Loss 2.7457 (2.7159)	Entropy 0.63150 (0.63269)	Top-1 acc 56.641 (58.434)	Top-5 acc 78.516 (80.136)	lr 0.01458
Train [54][2030/3239]	Time 1.646 (0.836)	Data Time 1.367 (0.348)	Loss 2.5595 (2.7159)	Entropy 0.63160 (0.63268)	Top-1 acc 60.547 (58.438)	Top-5 acc 81.250 (80.131)	lr 0.01458
Train [54][2040/3239]	Time 0.231 (0.834)	Data Time 0.001 (0.346)	Loss 2.6641 (2.7160)	Entropy 0.63193 (0.63268)	Top-1 acc 60.547 (58.433)	Top-5 acc 81.250 (80.133)	lr 0.01458
Train [54][2050/3239]	Time 5.576 (0.840)	Data Time 5.334 (0.352)	Loss 2.5991 (2.7159)	Entropy 0.63147 (0.63267)	Top-1 acc 61.719 (58.437)	Top-5 acc 83.594 (80.133)	lr 0.01457
Train [54][2060/3239]	Time 0.253 (0.839)	Data Time 0.001 (0.351)	Loss 2.7782 (2.7162)	Entropy 0.63175 (0.63267)	Top-1 acc 54.688 (58.431)	Top-5 acc 78.906 (80.126)	lr 0.01457
Train [54][2070/3239]	Time 0.214 (0.838)	Data Time 0.001 (0.351)	Loss 2.5560 (2.7163)	Entropy 0.63175 (0.63266)	Top-1 acc 60.547 (58.434)	Top-5 acc 84.766 (80.125)	lr 0.01457
Train [54][2080/3239]	Time 0.235 (0.836)	Data Time 0.001 (0.349)	Loss 2.6447 (2.7162)	Entropy 0.63180 (0.63266)	Top-1 acc 60.156 (58.436)	Top-5 acc 83.984 (80.128)	lr 0.01457
Train [54][2090/3239]	Time 0.296 (0.842)	Data Time 0.001 (0.355)	Loss 2.5408 (2.7164)	Entropy 0.63184 (0.63265)	Top-1 acc 63.672 (58.439)	Top-5 acc 83.984 (80.124)	lr 0.01457
Train [54][2100/3239]	Time 0.242 (0.840)	Data Time 0.002 (0.354)	Loss 2.6636 (2.7162)	Entropy 0.63196 (0.63265)	Top-1 acc 62.109 (58.445)	Top-5 acc 81.250 (80.125)	lr 0.01457
Train [54][2110/3239]	Time 0.249 (0.838)	Data Time 0.001 (0.352)	Loss 2.8290 (2.7163)	Entropy 0.63212 (0.63265)	Top-1 acc 58.203 (58.445)	Top-5 acc 78.906 (80.125)	lr 0.01457
Train [54][2120/3239]	Time 0.247 (0.846)	Data Time 0.001 (0.360)	Loss 2.5479 (2.7161)	Entropy 0.63202 (0.63265)	Top-1 acc 62.891 (58.447)	Top-5 acc 83.203 (80.129)	lr 0.01457
Train [54][2130/3239]	Time 0.240 (0.844)	Data Time 0.001 (0.359)	Loss 2.7132 (2.7161)	Entropy 0.63195 (0.63264)	Top-1 acc 60.547 (58.442)	Top-5 acc 81.641 (80.132)	lr 0.01457
Train [54][2140/3239]	Time 0.252 (0.843)	Data Time 0.001 (0.357)	Loss 2.8777 (2.7165)	Entropy 0.63207 (0.63264)	Top-1 acc 53.516 (58.433)	Top-5 acc 76.562 (80.126)	lr 0.01457
Train [54][2150/3239]	Time 0.236 (0.851)	Data Time 0.001 (0.366)	Loss 2.6140 (2.7165)	Entropy 0.63194 (0.63264)	Top-1 acc 60.547 (58.436)	Top-5 acc 82.422 (80.126)	lr 0.01456
Train [54][2160/3239]	Time 1.860 (0.850)	Data Time 1.510 (0.365)	Loss 2.5874 (2.7164)	Entropy 0.63190 (0.63263)	Top-1 acc 64.844 (58.442)	Top-5 acc 82.031 (80.127)	lr 0.01456
Train [54][2170/3239]	Time 0.238 (0.848)	Data Time 0.001 (0.363)	Loss 2.7481 (2.7161)	Entropy 0.63188 (0.63263)	Top-1 acc 56.641 (58.453)	Top-5 acc 78.125 (80.130)	lr 0.01456
Train [54][2180/3239]	Time 0.255 (0.853)	Data Time 0.001 (0.369)	Loss 2.6723 (2.7165)	Entropy 0.63192 (0.63263)	Top-1 acc 59.375 (58.448)	Top-5 acc 80.469 (80.117)	lr 0.01456
Train [54][2190/3239]	Time 0.233 (0.854)	Data Time 0.001 (0.370)	Loss 2.6592 (2.7164)	Entropy 0.63206 (0.63262)	Top-1 acc 57.031 (58.451)	Top-5 acc 82.422 (80.120)	lr 0.01456
Train [54][2200/3239]	Time 0.234 (0.852)	Data Time 0.001 (0.369)	Loss 2.5617 (2.7164)	Entropy 0.63207 (0.63262)	Top-1 acc 62.891 (58.449)	Top-5 acc 83.203 (80.121)	lr 0.01456
Train [54][2210/3239]	Time 1.091 (0.856)	Data Time 0.842 (0.373)	Loss 2.7397 (2.7162)	Entropy 0.63177 (0.63262)	Top-1 acc 58.984 (58.454)	Top-5 acc 79.297 (80.125)	lr 0.01456
Train [54][2220/3239]	Time 0.254 (0.858)	Data Time 0.001 (0.375)	Loss 3.0707 (2.7163)	Entropy 0.63182 (0.63261)	Top-1 acc 47.266 (58.451)	Top-5 acc 73.438 (80.126)	lr 0.01456
Train [54][2230/3239]	Time 0.317 (0.857)	Data Time 0.001 (0.375)	Loss 2.7490 (2.7165)	Entropy 0.63175 (0.63261)	Top-1 acc 58.594 (58.448)	Top-5 acc 79.688 (80.120)	lr 0.01456
Train [54][2240/3239]	Time 0.248 (0.855)	Data Time 0.001 (0.373)	Loss 2.6800 (2.7166)	Entropy 0.63168 (0.63261)	Top-1 acc 60.938 (58.444)	Top-5 acc 81.250 (80.118)	lr 0.01456
Train [54][2250/3239]	Time 0.269 (0.862)	Data Time 0.001 (0.380)	Loss 2.7856 (2.7165)	Entropy 0.63209 (0.63260)	Top-1 acc 58.984 (58.448)	Top-5 acc 77.344 (80.120)	lr 0.01455
Train [54][2260/3239]	Time 0.247 (0.863)	Data Time 0.001 (0.381)	Loss 2.6462 (2.7162)	Entropy 0.63204 (0.63260)	Top-1 acc 59.375 (58.450)	Top-5 acc 80.078 (80.124)	lr 0.01455
Train [54][2270/3239]	Time 0.241 (0.861)	Data Time 0.001 (0.379)	Loss 2.7103 (2.7162)	Entropy 0.63192 (0.63260)	Top-1 acc 60.156 (58.454)	Top-5 acc 79.297 (80.123)	lr 0.01455
Train [54][2280/3239]	Time 0.267 (0.866)	Data Time 0.001 (0.385)	Loss 2.6438 (2.7164)	Entropy 0.63183 (0.63259)	Top-1 acc 58.984 (58.451)	Top-5 acc 82.031 (80.121)	lr 0.01455
Train [54][2290/3239]	Time 0.273 (0.866)	Data Time 0.002 (0.385)	Loss 2.5923 (2.7161)	Entropy 0.63181 (0.63259)	Top-1 acc 60.938 (58.454)	Top-5 acc 83.203 (80.126)	lr 0.01455
Train [54][2300/3239]	Time 0.248 (0.864)	Data Time 0.001 (0.383)	Loss 2.7674 (2.7162)	Entropy 0.63152 (0.63259)	Top-1 acc 57.031 (58.455)	Top-5 acc 78.906 (80.122)	lr 0.01455
Train [54][2310/3239]	Time 0.243 (0.870)	Data Time 0.001 (0.390)	Loss 2.7544 (2.7164)	Entropy 0.63171 (0.63258)	Top-1 acc 55.469 (58.450)	Top-5 acc 81.250 (80.119)	lr 0.01455
Train [54][2320/3239]	Time 3.893 (0.870)	Data Time 3.557 (0.389)	Loss 2.8828 (2.7165)	Entropy 0.63168 (0.63258)	Top-1 acc 48.047 (58.441)	Top-5 acc 78.516 (80.115)	lr 0.01455
Train [54][2330/3239]	Time 0.252 (0.869)	Data Time 0.001 (0.388)	Loss 2.7123 (2.7168)	Entropy 0.63184 (0.63258)	Top-1 acc 59.375 (58.432)	Top-5 acc 80.859 (80.111)	lr 0.01455
Train [54][2340/3239]	Time 0.248 (0.876)	Data Time 0.001 (0.396)	Loss 2.6342 (2.7169)	Entropy 0.63190 (0.63257)	Top-1 acc 61.719 (58.438)	Top-5 acc 82.812 (80.109)	lr 0.01455
Train [54][2350/3239]	Time 0.242 (0.875)	Data Time 0.001 (0.395)	Loss 2.7156 (2.7167)	Entropy 0.63201 (0.63257)	Top-1 acc 60.938 (58.439)	Top-5 acc 80.469 (80.108)	lr 0.01454
Train [54][2360/3239]	Time 0.235 (0.874)	Data Time 0.001 (0.394)	Loss 2.5294 (2.7165)	Entropy 0.63185 (0.63257)	Top-1 acc 60.156 (58.442)	Top-5 acc 86.719 (80.116)	lr 0.01454
Train [54][2370/3239]	Time 0.252 (0.880)	Data Time 0.001 (0.400)	Loss 2.6070 (2.7166)	Entropy 0.63178 (0.63257)	Top-1 acc 60.547 (58.438)	Top-5 acc 82.812 (80.112)	lr 0.01454
Train [54][2380/3239]	Time 0.235 (0.882)	Data Time 0.001 (0.403)	Loss 2.7126 (2.7163)	Entropy 0.63196 (0.63256)	Top-1 acc 56.250 (58.443)	Top-5 acc 79.688 (80.118)	lr 0.01454
Train [54][2390/3239]	Time 0.328 (0.880)	Data Time 0.001 (0.401)	Loss 2.7700 (2.7162)	Entropy 0.63204 (0.63256)	Top-1 acc 60.156 (58.446)	Top-5 acc 78.516 (80.120)	lr 0.01454
Train [54][2400/3239]	Time 0.255 (0.878)	Data Time 0.001 (0.399)	Loss 2.5937 (2.7161)	Entropy 0.63212 (0.63256)	Top-1 acc 60.156 (58.446)	Top-5 acc 82.812 (80.123)	lr 0.01454
Train [54][2410/3239]	Time 0.253 (0.887)	Data Time 0.001 (0.409)	Loss 2.6931 (2.7160)	Entropy 0.63180 (0.63256)	Top-1 acc 62.891 (58.454)	Top-5 acc 79.297 (80.126)	lr 0.01454
Train [54][2420/3239]	Time 0.246 (0.885)	Data Time 0.001 (0.408)	Loss 2.7603 (2.7160)	Entropy 0.63170 (0.63255)	Top-1 acc 59.766 (58.454)	Top-5 acc 80.078 (80.125)	lr 0.01454
Train [54][2430/3239]	Time 0.242 (0.884)	Data Time 0.001 (0.406)	Loss 2.5416 (2.7157)	Entropy 0.63172 (0.63255)	Top-1 acc 58.984 (58.461)	Top-5 acc 83.594 (80.133)	lr 0.01454
Train [54][2440/3239]	Time 0.248 (0.894)	Data Time 0.001 (0.417)	Loss 2.8995 (2.7158)	Entropy 0.63133 (0.63255)	Top-1 acc 57.031 (58.459)	Top-5 acc 78.125 (80.133)	lr 0.01454
Train [54][2450/3239]	Time 0.231 (0.892)	Data Time 0.001 (0.415)	Loss 2.7465 (2.7160)	Entropy 0.63146 (0.63254)	Top-1 acc 56.250 (58.451)	Top-5 acc 79.297 (80.128)	lr 0.01453
Train [54][2460/3239]	Time 0.223 (0.890)	Data Time 0.001 (0.413)	Loss 2.7248 (2.7161)	Entropy 0.63165 (0.63254)	Top-1 acc 57.031 (58.442)	Top-5 acc 78.516 (80.123)	lr 0.01453
Train [54][2470/3239]	Time 0.241 (0.898)	Data Time 0.001 (0.422)	Loss 2.8552 (2.7162)	Entropy 0.63173 (0.63253)	Top-1 acc 54.297 (58.444)	Top-5 acc 75.781 (80.122)	lr 0.01453
Train [54][2480/3239]	Time 0.534 (0.910)	Data Time 0.004 (0.420)	Loss 2.7547 (2.7163)	Entropy 0.63198 (0.63253)	Top-1 acc 56.250 (58.442)	Top-5 acc 79.297 (80.119)	lr 0.01453
Train [54][2490/3239]	Time 0.247 (0.908)	Data Time 0.002 (0.418)	Loss 2.9277 (2.7163)	Entropy 0.63198 (0.63253)	Top-1 acc 53.125 (58.441)	Top-5 acc 76.562 (80.119)	lr 0.01453
Train [54][2500/3239]	Time 0.237 (0.907)	Data Time 0.001 (0.417)	Loss 2.5848 (2.7163)	Entropy 0.63209 (0.63253)	Top-1 acc 64.062 (58.440)	Top-5 acc 83.203 (80.120)	lr 0.01453
Train [54][2510/3239]	Time 0.243 (0.905)	Data Time 0.001 (0.415)	Loss 2.5787 (2.7165)	Entropy 0.63206 (0.63252)	Top-1 acc 57.422 (58.436)	Top-5 acc 84.375 (80.117)	lr 0.01453
Train [54][2520/3239]	Time 0.239 (0.903)	Data Time 0.001 (0.413)	Loss 2.9747 (2.7164)	Entropy 0.63174 (0.63252)	Top-1 acc 54.297 (58.441)	Top-5 acc 79.297 (80.117)	lr 0.01453
Train [54][2530/3239]	Time 0.241 (0.908)	Data Time 0.001 (0.419)	Loss 2.5257 (2.7164)	Entropy 0.63170 (0.63252)	Top-1 acc 62.109 (58.442)	Top-5 acc 84.375 (80.119)	lr 0.01453
Train [54][2540/3239]	Time 0.267 (0.908)	Data Time 0.001 (0.419)	Loss 2.7794 (2.7164)	Entropy 0.63083 (0.63251)	Top-1 acc 57.422 (58.442)	Top-5 acc 78.125 (80.119)	lr 0.01453
Train [54][2550/3239]	Time 0.352 (0.906)	Data Time 0.001 (0.418)	Loss 2.6328 (2.7163)	Entropy 0.63074 (0.63251)	Top-1 acc 63.281 (58.447)	Top-5 acc 82.031 (80.117)	lr 0.01452
Train [54][2560/3239]	Time 0.252 (0.905)	Data Time 0.001 (0.416)	Loss 2.6282 (2.7166)	Entropy 0.63038 (0.63250)	Top-1 acc 59.766 (58.441)	Top-5 acc 81.641 (80.112)	lr 0.01452
Train [54][2570/3239]	Time 0.248 (0.914)	Data Time 0.001 (0.426)	Loss 2.7810 (2.7167)	Entropy 0.63034 (0.63249)	Top-1 acc 61.328 (58.437)	Top-5 acc 81.250 (80.111)	lr 0.01452
Train [54][2580/3239]	Time 0.231 (0.912)	Data Time 0.001 (0.424)	Loss 2.8355 (2.7164)	Entropy 0.62957 (0.63248)	Top-1 acc 57.031 (58.444)	Top-5 acc 80.859 (80.118)	lr 0.01452
Train [54][2590/3239]	Time 0.251 (0.912)	Data Time 0.001 (0.424)	Loss 2.8226 (2.7163)	Entropy 0.62922 (0.63247)	Top-1 acc 58.203 (58.447)	Top-5 acc 77.734 (80.119)	lr 0.01452
Train [54][2600/3239]	Time 0.259 (0.921)	Data Time 0.002 (0.433)	Loss 2.7750 (2.7162)	Entropy 0.62954 (0.63246)	Top-1 acc 58.984 (58.450)	Top-5 acc 78.516 (80.123)	lr 0.01452
Train [54][2610/3239]	Time 0.275 (0.919)	Data Time 0.001 (0.432)	Loss 2.6528 (2.7161)	Entropy 0.62968 (0.63245)	Top-1 acc 61.719 (58.453)	Top-5 acc 79.297 (80.127)	lr 0.01452
Train [54][2620/3239]	Time 0.287 (0.917)	Data Time 0.001 (0.430)	Loss 2.8020 (2.7160)	Entropy 0.62956 (0.63244)	Top-1 acc 56.641 (58.458)	Top-5 acc 80.859 (80.131)	lr 0.01452
Train [54][2630/3239]	Time 0.243 (0.924)	Data Time 0.001 (0.437)	Loss 2.6903 (2.7161)	Entropy 0.62969 (0.63243)	Top-1 acc 57.031 (58.457)	Top-5 acc 80.469 (80.132)	lr 0.01452
Train [54][2640/3239]	Time 0.330 (0.923)	Data Time 0.001 (0.436)	Loss 2.8252 (2.7162)	Entropy 0.62967 (0.63241)	Top-1 acc 57.422 (58.453)	Top-5 acc 80.859 (80.129)	lr 0.01452
Train [54][2650/3239]	Time 0.246 (0.922)	Data Time 0.001 (0.435)	Loss 2.6499 (2.7161)	Entropy 0.62946 (0.63240)	Top-1 acc 56.641 (58.456)	Top-5 acc 82.031 (80.130)	lr 0.01451
Train [54][2660/3239]	Time 0.253 (0.931)	Data Time 0.001 (0.444)	Loss 2.6775 (2.7160)	Entropy 0.62962 (0.63239)	Top-1 acc 57.812 (58.456)	Top-5 acc 81.250 (80.131)	lr 0.01451
Train [54][2670/3239]	Time 0.228 (0.931)	Data Time 0.001 (0.445)	Loss 2.7335 (2.7162)	Entropy 0.62950 (0.63238)	Top-1 acc 62.891 (58.456)	Top-5 acc 80.859 (80.129)	lr 0.01451
Train [54][2680/3239]	Time 0.238 (0.929)	Data Time 0.001 (0.443)	Loss 2.7616 (2.7163)	Entropy 0.62968 (0.63237)	Top-1 acc 55.859 (58.454)	Top-5 acc 82.422 (80.125)	lr 0.01451
Train [54][2690/3239]	Time 0.276 (0.935)	Data Time 0.003 (0.449)	Loss 2.5456 (2.7162)	Entropy 0.62944 (0.63236)	Top-1 acc 63.281 (58.457)	Top-5 acc 84.766 (80.130)	lr 0.01451
Train [54][2700/3239]	Time 0.246 (0.938)	Data Time 0.002 (0.453)	Loss 2.8127 (2.7161)	Entropy 0.62954 (0.63235)	Top-1 acc 56.250 (58.460)	Top-5 acc 76.953 (80.130)	lr 0.01451
Train [54][2710/3239]	Time 0.395 (0.936)	Data Time 0.002 (0.451)	Loss 2.5632 (2.7160)	Entropy 0.62950 (0.63234)	Top-1 acc 62.109 (58.462)	Top-5 acc 84.375 (80.130)	lr 0.01451
Train [54][2720/3239]	Time 0.237 (0.934)	Data Time 0.001 (0.449)	Loss 2.6366 (2.7159)	Entropy 0.62973 (0.63233)	Top-1 acc 61.328 (58.458)	Top-5 acc 79.688 (80.136)	lr 0.01451
Train [54][2730/3239]	Time 0.246 (0.944)	Data Time 0.001 (0.460)	Loss 2.6145 (2.7159)	Entropy 0.62956 (0.63232)	Top-1 acc 60.938 (58.460)	Top-5 acc 82.031 (80.139)	lr 0.01451
Train [54][2740/3239]	Time 0.243 (0.942)	Data Time 0.001 (0.458)	Loss 2.5656 (2.7158)	Entropy 0.62946 (0.63231)	Top-1 acc 59.766 (58.458)	Top-5 acc 83.203 (80.140)	lr 0.01451
Train [54][2750/3239]	Time 0.250 (0.941)	Data Time 0.001 (0.456)	Loss 2.5832 (2.7158)	Entropy 0.62946 (0.63230)	Top-1 acc 66.406 (58.460)	Top-5 acc 85.547 (80.142)	lr 0.01450
Train [54][2760/3239]	Time 0.233 (0.948)	Data Time 0.001 (0.464)	Loss 2.8210 (2.7159)	Entropy 0.62924 (0.63229)	Top-1 acc 53.906 (58.458)	Top-5 acc 76.953 (80.142)	lr 0.01450
Train [54][2770/3239]	Time 0.269 (0.946)	Data Time 0.001 (0.462)	Loss 2.6540 (2.7159)	Entropy 0.62916 (0.63228)	Top-1 acc 57.812 (58.454)	Top-5 acc 79.688 (80.141)	lr 0.01450
Train [54][2780/3239]	Time 0.252 (0.945)	Data Time 0.001 (0.461)	Loss 2.6582 (2.7158)	Entropy 0.62909 (0.63227)	Top-1 acc 58.984 (58.454)	Top-5 acc 80.469 (80.141)	lr 0.01450
Train [54][2790/3239]	Time 0.322 (0.949)	Data Time 0.001 (0.466)	Loss 2.6059 (2.7162)	Entropy 0.62955 (0.63226)	Top-1 acc 59.375 (58.446)	Top-5 acc 85.156 (80.136)	lr 0.01450
Train [54][2800/3239]	Time 0.231 (0.947)	Data Time 0.001 (0.464)	Loss 2.7866 (2.7160)	Entropy 0.62968 (0.63225)	Top-1 acc 59.766 (58.450)	Top-5 acc 78.906 (80.142)	lr 0.01450
Train [54][2810/3239]	Time 0.215 (0.945)	Data Time 0.001 (0.462)	Loss 2.5826 (2.7162)	Entropy 0.62960 (0.63224)	Top-1 acc 62.891 (58.447)	Top-5 acc 82.031 (80.142)	lr 0.01450
Train [54][2820/3239]	Time 0.235 (0.948)	Data Time 0.001 (0.465)	Loss 2.7658 (2.7161)	Entropy 0.62925 (0.63223)	Top-1 acc 58.984 (58.444)	Top-5 acc 78.516 (80.142)	lr 0.01450
Train [54][2830/3239]	Time 0.258 (0.946)	Data Time 0.001 (0.463)	Loss 2.8701 (2.7161)	Entropy 0.62926 (0.63222)	Top-1 acc 54.297 (58.443)	Top-5 acc 78.516 (80.144)	lr 0.01450
Train [54][2840/3239]	Time 0.237 (0.944)	Data Time 0.001 (0.462)	Loss 2.6923 (2.7160)	Entropy 0.62921 (0.63221)	Top-1 acc 56.641 (58.445)	Top-5 acc 80.078 (80.144)	lr 0.01450
Train [54][2850/3239]	Time 0.246 (0.952)	Data Time 0.001 (0.469)	Loss 3.0106 (2.7162)	Entropy 0.62933 (0.63220)	Top-1 acc 51.172 (58.438)	Top-5 acc 75.000 (80.140)	lr 0.01449
Train [54][2860/3239]	Time 0.236 (0.950)	Data Time 0.001 (0.468)	Loss 2.7517 (2.7165)	Entropy 0.62932 (0.63219)	Top-1 acc 57.812 (58.433)	Top-5 acc 78.906 (80.134)	lr 0.01449
Train [54][2870/3239]	Time 0.341 (0.948)	Data Time 0.001 (0.466)	Loss 2.6686 (2.7167)	Entropy 0.62920 (0.63218)	Top-1 acc 57.031 (58.426)	Top-5 acc 83.984 (80.130)	lr 0.01449
Train [54][2880/3239]	Time 0.257 (0.946)	Data Time 0.001 (0.465)	Loss 2.7072 (2.7168)	Entropy 0.62926 (0.63217)	Top-1 acc 62.891 (58.425)	Top-5 acc 80.469 (80.130)	lr 0.01449
Train [54][2890/3239]	Time 0.235 (0.953)	Data Time 0.001 (0.471)	Loss 2.7698 (2.7167)	Entropy 0.62929 (0.63216)	Top-1 acc 59.375 (58.428)	Top-5 acc 78.906 (80.131)	lr 0.01449
Train [54][2900/3239]	Time 0.272 (0.951)	Data Time 0.002 (0.470)	Loss 2.5521 (2.7165)	Entropy 0.62956 (0.63215)	Top-1 acc 63.281 (58.436)	Top-5 acc 83.203 (80.134)	lr 0.01449
Train [54][2910/3239]	Time 0.235 (0.949)	Data Time 0.001 (0.468)	Loss 2.5802 (2.7164)	Entropy 0.62946 (0.63214)	Top-1 acc 57.422 (58.436)	Top-5 acc 81.641 (80.136)	lr 0.01449
Train [54][2920/3239]	Time 0.254 (0.956)	Data Time 0.001 (0.475)	Loss 2.8480 (2.7165)	Entropy 0.62939 (0.63213)	Top-1 acc 54.688 (58.438)	Top-5 acc 77.734 (80.137)	lr 0.01449
Train [54][2930/3239]	Time 0.236 (0.954)	Data Time 0.001 (0.474)	Loss 2.7366 (2.7164)	Entropy 0.62929 (0.63212)	Top-1 acc 58.984 (58.439)	Top-5 acc 79.297 (80.136)	lr 0.01449
Train [54][2940/3239]	Time 0.346 (0.953)	Data Time 0.001 (0.473)	Loss 2.6718 (2.7164)	Entropy 0.62925 (0.63211)	Top-1 acc 64.062 (58.442)	Top-5 acc 78.516 (80.133)	lr 0.01449
Train [54][2950/3239]	Time 0.234 (0.959)	Data Time 0.001 (0.479)	Loss 2.8267 (2.7164)	Entropy 0.62929 (0.63210)	Top-1 acc 54.688 (58.441)	Top-5 acc 79.297 (80.134)	lr 0.01448
Train [54][2960/3239]	Time 0.256 (0.957)	Data Time 0.001 (0.477)	Loss 2.8661 (2.7165)	Entropy 0.62914 (0.63209)	Top-1 acc 55.859 (58.440)	Top-5 acc 75.000 (80.129)	lr 0.01448
Train [54][2970/3239]	Time 0.267 (0.955)	Data Time 0.001 (0.476)	Loss 2.6188 (2.7164)	Entropy 0.62876 (0.63208)	Top-1 acc 60.547 (58.444)	Top-5 acc 82.031 (80.132)	lr 0.01448
Train [54][2980/3239]	Time 0.223 (0.958)	Data Time 0.001 (0.479)	Loss 2.8129 (2.7165)	Entropy 0.62881 (0.63207)	Top-1 acc 55.469 (58.439)	Top-5 acc 76.953 (80.130)	lr 0.01448
Train [54][2990/3239]	Time 0.228 (0.956)	Data Time 0.001 (0.477)	Loss 2.6944 (2.7165)	Entropy 0.62912 (0.63206)	Top-1 acc 60.156 (58.441)	Top-5 acc 78.516 (80.130)	lr 0.01448
Train [54][3000/3239]	Time 0.273 (0.955)	Data Time 0.001 (0.476)	Loss 2.6883 (2.7164)	Entropy 0.62906 (0.63205)	Top-1 acc 60.938 (58.441)	Top-5 acc 81.641 (80.132)	lr 0.01448
Train [54][3010/3239]	Time 0.248 (0.957)	Data Time 0.001 (0.478)	Loss 2.8227 (2.7166)	Entropy 0.62937 (0.63204)	Top-1 acc 56.250 (58.439)	Top-5 acc 78.125 (80.131)	lr 0.01448
Train [54][3020/3239]	Time 0.235 (0.955)	Data Time 0.001 (0.476)	Loss 2.7958 (2.7166)	Entropy 0.62952 (0.63203)	Top-1 acc 57.031 (58.441)	Top-5 acc 77.734 (80.132)	lr 0.01448
Train [54][3030/3239]	Time 0.345 (0.953)	Data Time 0.001 (0.475)	Loss 2.6747 (2.7165)	Entropy 0.62963 (0.63202)	Top-1 acc 62.109 (58.442)	Top-5 acc 80.078 (80.133)	lr 0.01448
Train [54][3040/3239]	Time 0.230 (0.952)	Data Time 0.001 (0.473)	Loss 2.9013 (2.7163)	Entropy 0.62964 (0.63201)	Top-1 acc 50.781 (58.443)	Top-5 acc 76.562 (80.136)	lr 0.01448
Train [54][3050/3239]	Time 0.255 (0.953)	Data Time 0.001 (0.475)	Loss 2.6159 (2.7162)	Entropy 0.62944 (0.63201)	Top-1 acc 60.547 (58.446)	Top-5 acc 83.203 (80.136)	lr 0.01447
Train [54][3060/3239]	Time 0.229 (0.952)	Data Time 0.001 (0.474)	Loss 2.8987 (2.7161)	Entropy 0.62935 (0.63200)	Top-1 acc 52.734 (58.446)	Top-5 acc 74.609 (80.137)	lr 0.01447
Train [54][3070/3239]	Time 0.237 (0.950)	Data Time 0.001 (0.472)	Loss 2.8523 (2.7162)	Entropy 0.62962 (0.63199)	Top-1 acc 53.516 (58.443)	Top-5 acc 80.078 (80.137)	lr 0.01447
Train [54][3080/3239]	Time 0.243 (0.952)	Data Time 0.001 (0.474)	Loss 2.6139 (2.7162)	Entropy 0.62979 (0.63198)	Top-1 acc 60.938 (58.445)	Top-5 acc 82.031 (80.138)	lr 0.01447
Train [54][3090/3239]	Time 0.233 (0.950)	Data Time 0.001 (0.473)	Loss 2.6642 (2.7161)	Entropy 0.62990 (0.63197)	Top-1 acc 59.766 (58.446)	Top-5 acc 82.812 (80.138)	lr 0.01447
Train [54][3100/3239]	Time 0.341 (0.948)	Data Time 0.001 (0.471)	Loss 2.6463 (2.7162)	Entropy 0.63020 (0.63197)	Top-1 acc 58.984 (58.444)	Top-5 acc 81.250 (80.136)	lr 0.01447
Train [54][3110/3239]	Time 0.260 (0.952)	Data Time 0.001 (0.475)	Loss 2.7059 (2.7164)	Entropy 0.63001 (0.63196)	Top-1 acc 62.109 (58.443)	Top-5 acc 79.688 (80.133)	lr 0.01447
Train [54][3120/3239]	Time 0.252 (0.950)	Data Time 0.001 (0.473)	Loss 2.6305 (2.7166)	Entropy 0.62995 (0.63196)	Top-1 acc 62.891 (58.439)	Top-5 acc 81.641 (80.129)	lr 0.01447
Train [54][3130/3239]	Time 0.244 (0.948)	Data Time 0.001 (0.472)	Loss 2.8192 (2.7167)	Entropy 0.62953 (0.63195)	Top-1 acc 54.297 (58.435)	Top-5 acc 82.031 (80.129)	lr 0.01447
Train [54][3140/3239]	Time 0.434 (0.957)	Data Time 0.004 (0.470)	Loss 2.8456 (2.7170)	Entropy 0.62942 (0.63194)	Top-1 acc 56.250 (58.430)	Top-5 acc 78.516 (80.122)	lr 0.01447
Train [54][3150/3239]	Time 0.259 (0.956)	Data Time 0.002 (0.469)	Loss 2.7139 (2.7172)	Entropy 0.62973 (0.63193)	Top-1 acc 61.719 (58.425)	Top-5 acc 82.031 (80.123)	lr 0.01446
Train [54][3160/3239]	Time 0.245 (0.954)	Data Time 0.002 (0.467)	Loss 2.5814 (2.7171)	Entropy 0.62951 (0.63193)	Top-1 acc 60.547 (58.426)	Top-5 acc 80.859 (80.124)	lr 0.01446
Train [54][3170/3239]	Time 0.261 (0.956)	Data Time 0.001 (0.469)	Loss 2.5760 (2.7170)	Entropy 0.62972 (0.63192)	Top-1 acc 62.891 (58.433)	Top-5 acc 82.812 (80.125)	lr 0.01446
Train [54][3180/3239]	Time 0.240 (0.955)	Data Time 0.000 (0.468)	Loss 2.7197 (2.7168)	Entropy 0.62984 (0.63191)	Top-1 acc 57.812 (58.440)	Top-5 acc 79.688 (80.129)	lr 0.01446
Train [54][3190/3239]	Time 0.343 (0.953)	Data Time 0.000 (0.466)	Loss 2.8722 (2.7168)	Entropy 0.62972 (0.63191)	Top-1 acc 55.469 (58.442)	Top-5 acc 76.172 (80.129)	lr 0.01446
Train [54][3200/3239]	Time 0.275 (0.953)	Data Time 0.000 (0.467)	Loss 2.6476 (2.7170)	Entropy 0.62982 (0.63190)	Top-1 acc 56.250 (58.431)	Top-5 acc 80.469 (80.125)	lr 0.01446
Train [54][3210/3239]	Time 0.236 (0.957)	Data Time 0.000 (0.471)	Loss 2.7605 (2.7172)	Entropy 0.62969 (0.63189)	Top-1 acc 59.766 (58.429)	Top-5 acc 79.688 (80.120)	lr 0.01446
Train [54][3220/3239]	Time 0.245 (0.955)	Data Time 0.000 (0.469)	Loss 2.7893 (2.7171)	Entropy 0.62971 (0.63189)	Top-1 acc 60.547 (58.434)	Top-5 acc 78.906 (80.121)	lr 0.01446
Train [54][3230/3239]	Time 0.238 (0.954)	Data Time 0.000 (0.468)	Loss 2.7399 (2.7169)	Entropy 0.62958 (0.63188)	Top-1 acc 58.984 (58.442)	Top-5 acc 80.469 (80.125)	lr 0.01446
Train [54][3239/3239]	Time 0.989 (0.956)	Data Time 0.000 (0.470)	Loss 3.1017 (2.7170)	Entropy 0.62964 (0.63187)	Top-1 acc 53.086 (58.441)	Top-5 acc 76.543 (80.123)	lr 0.01446
==========Valid [54/120]	loss 1.459	top-1 acc 66.433 (66.433)	top-5 acc 86.680	Train top-1 58.441	top-5 80.123	Entropy 0.62964	Latency-None: 0.000ms	Flops: 538.40M
Train [55][0/3239]	Time 37.686 (37.686)	Data Time 36.195 (36.195)	Loss 2.6173 (2.6173)	Entropy 0.62962 (0.62962)	Top-1 acc 61.328 (61.328)	Top-5 acc 83.203 (83.203)	lr 0.01446
Train [55][10/3239]	Time 0.241 (3.931)	Data Time 0.001 (3.384)	Loss 2.6639 (2.6892)	Entropy 0.62961 (0.62960)	Top-1 acc 62.109 (59.233)	Top-5 acc 81.250 (81.001)	lr 0.01445
Train [55][20/3239]	Time 0.350 (2.301)	Data Time 0.001 (1.774)	Loss 2.5372 (2.6875)	Entropy 0.62951 (0.62956)	Top-1 acc 62.891 (59.859)	Top-5 acc 82.812 (80.971)	lr 0.01445
Train [55][30/3239]	Time 0.258 (1.693)	Data Time 0.002 (1.202)	Loss 2.5612 (2.6955)	Entropy 0.62952 (0.62951)	Top-1 acc 62.891 (59.400)	Top-5 acc 80.859 (80.733)	lr 0.01445
Train [55][40/3239]	Time 0.259 (1.395)	Data Time 0.001 (0.909)	Loss 2.4313 (2.6871)	Entropy 0.62918 (0.62944)	Top-1 acc 66.406 (59.747)	Top-5 acc 84.766 (80.707)	lr 0.01445
Train [55][50/3239]	Time 0.247 (1.235)	Data Time 0.001 (0.731)	Loss 2.7314 (2.6889)	Entropy 0.62919 (0.62937)	Top-1 acc 58.594 (59.505)	Top-5 acc 80.078 (80.507)	lr 0.01445
Train [55][60/3239]	Time 0.229 (1.103)	Data Time 0.001 (0.612)	Loss 2.5653 (2.6899)	Entropy 0.62904 (0.62933)	Top-1 acc 60.547 (59.253)	Top-5 acc 80.859 (80.520)	lr 0.01445
Train [55][70/3239]	Time 0.281 (1.016)	Data Time 0.002 (0.526)	Loss 2.7586 (2.6858)	Entropy 0.62917 (0.62930)	Top-1 acc 58.594 (59.369)	Top-5 acc 79.297 (80.733)	lr 0.01445
Train [55][80/3239]	Time 0.239 (0.956)	Data Time 0.001 (0.461)	Loss 2.7519 (2.6858)	Entropy 0.62875 (0.62925)	Top-1 acc 58.594 (59.365)	Top-5 acc 80.859 (80.734)	lr 0.01445
Train [55][90/3239]	Time 0.352 (0.899)	Data Time 0.002 (0.411)	Loss 2.5619 (2.6849)	Entropy 0.62886 (0.62919)	Top-1 acc 62.109 (59.323)	Top-5 acc 83.203 (80.726)	lr 0.01445
Train [55][100/3239]	Time 0.233 (0.853)	Data Time 0.001 (0.370)	Loss 2.6580 (2.6863)	Entropy 0.62910 (0.62916)	Top-1 acc 62.500 (59.329)	Top-5 acc 83.203 (80.736)	lr 0.01445
Train [55][110/3239]	Time 0.253 (0.817)	Data Time 0.001 (0.337)	Loss 2.7447 (2.6868)	Entropy 0.62898 (0.62915)	Top-1 acc 59.766 (59.280)	Top-5 acc 80.469 (80.771)	lr 0.01444
Train [55][120/3239]	Time 0.256 (0.790)	Data Time 0.002 (0.309)	Loss 2.6248 (2.6919)	Entropy 0.62862 (0.62913)	Top-1 acc 58.984 (59.175)	Top-5 acc 81.250 (80.669)	lr 0.01444
Train [55][130/3239]	Time 0.300 (0.764)	Data Time 0.001 (0.286)	Loss 3.1261 (2.6935)	Entropy 0.62839 (0.62908)	Top-1 acc 48.047 (59.095)	Top-5 acc 71.875 (80.621)	lr 0.01444
Train [55][140/3239]	Time 0.236 (0.743)	Data Time 0.001 (0.266)	Loss 2.7020 (2.6995)	Entropy 0.62851 (0.62904)	Top-1 acc 57.422 (58.971)	Top-5 acc 82.812 (80.505)	lr 0.01444
Train [55][150/3239]	Time 0.270 (0.723)	Data Time 0.001 (0.248)	Loss 2.8349 (2.6958)	Entropy 0.62859 (0.62900)	Top-1 acc 54.688 (59.039)	Top-5 acc 76.562 (80.544)	lr 0.01444
Train [55][160/3239]	Time 0.294 (0.708)	Data Time 0.001 (0.233)	Loss 2.6082 (2.6949)	Entropy 0.62843 (0.62897)	Top-1 acc 60.547 (59.026)	Top-5 acc 82.422 (80.580)	lr 0.01444
Train [55][170/3239]	Time 0.237 (0.692)	Data Time 0.001 (0.219)	Loss 2.7933 (2.6959)	Entropy 0.62812 (0.62894)	Top-1 acc 57.422 (59.019)	Top-5 acc 78.516 (80.597)	lr 0.01444
Train [55][180/3239]	Time 0.282 (0.679)	Data Time 0.001 (0.207)	Loss 2.8681 (2.6947)	Entropy 0.62801 (0.62888)	Top-1 acc 56.641 (59.021)	Top-5 acc 76.953 (80.628)	lr 0.01444
Train [55][190/3239]	Time 0.246 (0.667)	Data Time 0.001 (0.197)	Loss 2.7779 (2.6979)	Entropy 0.62813 (0.62884)	Top-1 acc 57.422 (58.903)	Top-5 acc 78.906 (80.573)	lr 0.01444
Train [55][200/3239]	Time 0.246 (0.656)	Data Time 0.001 (0.187)	Loss 2.6549 (2.6970)	Entropy 0.62826 (0.62881)	Top-1 acc 61.328 (58.953)	Top-5 acc 80.469 (80.603)	lr 0.01444
Train [55][210/3239]	Time 0.246 (0.650)	Data Time 0.002 (0.178)	Loss 2.8215 (2.6989)	Entropy 0.62825 (0.62877)	Top-1 acc 57.031 (58.914)	Top-5 acc 76.562 (80.545)	lr 0.01443
Train [55][220/3239]	Time 0.321 (0.640)	Data Time 0.001 (0.170)	Loss 2.4612 (2.6989)	Entropy 0.62835 (0.62875)	Top-1 acc 65.625 (58.935)	Top-5 acc 83.984 (80.554)	lr 0.01443
Train [55][230/3239]	Time 0.309 (0.632)	Data Time 0.001 (0.163)	Loss 2.7557 (2.6970)	Entropy 0.62835 (0.62873)	Top-1 acc 56.250 (58.956)	Top-5 acc 78.516 (80.570)	lr 0.01443
Train [55][240/3239]	Time 0.220 (0.623)	Data Time 0.001 (0.156)	Loss 2.9184 (2.6979)	Entropy 0.62823 (0.62872)	Top-1 acc 53.516 (58.945)	Top-5 acc 78.906 (80.564)	lr 0.01443
Train [55][250/3239]	Time 0.422 (0.616)	Data Time 0.001 (0.150)	Loss 2.7341 (2.7018)	Entropy 0.62805 (0.62870)	Top-1 acc 60.938 (58.877)	Top-5 acc 79.688 (80.491)	lr 0.01443
Train [55][260/3239]	Time 0.267 (0.609)	Data Time 0.001 (0.144)	Loss 2.7262 (2.7013)	Entropy 0.62826 (0.62868)	Top-1 acc 58.984 (58.874)	Top-5 acc 81.250 (80.556)	lr 0.01443
Train [55][270/3239]	Time 0.299 (0.604)	Data Time 0.002 (0.139)	Loss 2.7549 (2.7010)	Entropy 0.62852 (0.62867)	Top-1 acc 59.375 (58.889)	Top-5 acc 80.469 (80.548)	lr 0.01443
Train [55][280/3239]	Time 0.226 (0.598)	Data Time 0.001 (0.134)	Loss 2.6176 (2.7007)	Entropy 0.62869 (0.62867)	Top-1 acc 63.281 (58.897)	Top-5 acc 81.250 (80.545)	lr 0.01443
Train [55][290/3239]	Time 0.242 (0.591)	Data Time 0.001 (0.130)	Loss 2.6957 (2.7023)	Entropy 0.62884 (0.62867)	Top-1 acc 59.766 (58.865)	Top-5 acc 82.422 (80.514)	lr 0.01443
Train [55][300/3239]	Time 0.245 (0.587)	Data Time 0.001 (0.125)	Loss 2.8031 (2.7046)	Entropy 0.62904 (0.62867)	Top-1 acc 55.469 (58.801)	Top-5 acc 80.469 (80.473)	lr 0.01443
Train [55][310/3239]	Time 0.326 (0.583)	Data Time 0.038 (0.122)	Loss 2.3601 (2.7022)	Entropy 0.62883 (0.62868)	Top-1 acc 67.188 (58.841)	Top-5 acc 88.672 (80.514)	lr 0.01442
Train [55][320/3239]	Time 0.397 (0.579)	Data Time 0.001 (0.118)	Loss 2.5570 (2.7027)	Entropy 0.62901 (0.62869)	Top-1 acc 64.844 (58.841)	Top-5 acc 83.594 (80.506)	lr 0.01442
Train [55][330/3239]	Time 0.254 (0.575)	Data Time 0.001 (0.114)	Loss 2.6164 (2.7039)	Entropy 0.62892 (0.62870)	Top-1 acc 59.766 (58.840)	Top-5 acc 83.594 (80.485)	lr 0.01442
Train [55][340/3239]	Time 0.255 (0.570)	Data Time 0.001 (0.111)	Loss 2.7625 (2.7032)	Entropy 0.62823 (0.62870)	Top-1 acc 57.031 (58.860)	Top-5 acc 79.297 (80.486)	lr 0.01442
Train [55][350/3239]	Time 0.231 (0.567)	Data Time 0.001 (0.108)	Loss 2.6820 (2.7030)	Entropy 0.62850 (0.62869)	Top-1 acc 59.375 (58.850)	Top-5 acc 80.078 (80.502)	lr 0.01442
Train [55][360/3239]	Time 0.240 (0.563)	Data Time 0.001 (0.105)	Loss 2.6849 (2.7029)	Entropy 0.62857 (0.62868)	Top-1 acc 57.812 (58.846)	Top-5 acc 82.031 (80.513)	lr 0.01442
Train [55][370/3239]	Time 0.253 (0.561)	Data Time 0.001 (0.102)	Loss 2.5499 (2.7009)	Entropy 0.62895 (0.62868)	Top-1 acc 60.156 (58.871)	Top-5 acc 83.984 (80.559)	lr 0.01442
Train [55][380/3239]	Time 0.246 (0.558)	Data Time 0.001 (0.100)	Loss 2.7719 (2.7011)	Entropy 0.62899 (0.62869)	Top-1 acc 60.547 (58.867)	Top-5 acc 79.688 (80.534)	lr 0.01442
Train [55][390/3239]	Time 0.329 (0.555)	Data Time 0.002 (0.097)	Loss 2.6067 (2.7007)	Entropy 0.62882 (0.62870)	Top-1 acc 63.672 (58.878)	Top-5 acc 82.031 (80.525)	lr 0.01442
Train [55][400/3239]	Time 0.290 (0.552)	Data Time 0.001 (0.095)	Loss 2.7066 (2.6999)	Entropy 0.62920 (0.62870)	Top-1 acc 56.641 (58.877)	Top-5 acc 81.641 (80.531)	lr 0.01442
Train [55][410/3239]	Time 0.357 (0.549)	Data Time 0.001 (0.092)	Loss 2.5786 (2.7005)	Entropy 0.62917 (0.62872)	Top-1 acc 62.109 (58.876)	Top-5 acc 81.641 (80.517)	lr 0.01441
Train [55][420/3239]	Time 0.314 (0.547)	Data Time 0.002 (0.090)	Loss 2.5977 (2.7005)	Entropy 0.62919 (0.62873)	Top-1 acc 65.234 (58.881)	Top-5 acc 79.297 (80.517)	lr 0.01441
Train [55][430/3239]	Time 0.316 (0.545)	Data Time 0.003 (0.088)	Loss 2.7528 (2.6996)	Entropy 0.62839 (0.62873)	Top-1 acc 57.422 (58.889)	Top-5 acc 80.469 (80.531)	lr 0.01441
Train [55][440/3239]	Time 0.224 (0.544)	Data Time 0.002 (0.086)	Loss 2.7616 (2.6992)	Entropy 0.62854 (0.62872)	Top-1 acc 57.422 (58.912)	Top-5 acc 80.859 (80.533)	lr 0.01441
Train [55][450/3239]	Time 0.247 (0.542)	Data Time 0.001 (0.084)	Loss 2.9086 (2.6999)	Entropy 0.62838 (0.62872)	Top-1 acc 56.641 (58.894)	Top-5 acc 76.172 (80.520)	lr 0.01441
Train [55][460/3239]	Time 0.256 (0.540)	Data Time 0.001 (0.083)	Loss 2.5507 (2.6985)	Entropy 0.62843 (0.62871)	Top-1 acc 62.500 (58.920)	Top-5 acc 84.766 (80.550)	lr 0.01441
Train [55][470/3239]	Time 0.246 (0.538)	Data Time 0.001 (0.081)	Loss 2.6184 (2.6980)	Entropy 0.62848 (0.62870)	Top-1 acc 59.766 (58.942)	Top-5 acc 82.812 (80.559)	lr 0.01441
Train [55][480/3239]	Time 0.344 (0.536)	Data Time 0.001 (0.079)	Loss 2.5542 (2.6975)	Entropy 0.62844 (0.62870)	Top-1 acc 61.719 (58.966)	Top-5 acc 80.859 (80.574)	lr 0.01441
Train [55][490/3239]	Time 0.271 (0.534)	Data Time 0.001 (0.078)	Loss 2.7362 (2.6978)	Entropy 0.62817 (0.62869)	Top-1 acc 60.547 (58.941)	Top-5 acc 80.859 (80.581)	lr 0.01441
Train [55][500/3239]	Time 0.267 (0.532)	Data Time 0.001 (0.076)	Loss 2.7132 (2.6976)	Entropy 0.62836 (0.62868)	Top-1 acc 60.156 (58.962)	Top-5 acc 80.078 (80.583)	lr 0.01441
Train [55][510/3239]	Time 0.261 (0.530)	Data Time 0.001 (0.075)	Loss 2.7390 (2.6990)	Entropy 0.62820 (0.62868)	Top-1 acc 58.203 (58.934)	Top-5 acc 78.906 (80.544)	lr 0.01440
Train [55][520/3239]	Time 0.241 (0.528)	Data Time 0.001 (0.073)	Loss 2.9036 (2.7007)	Entropy 0.62839 (0.62867)	Top-1 acc 50.781 (58.878)	Top-5 acc 76.172 (80.519)	lr 0.01440
Train [55][530/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.072)	Loss 2.6054 (2.6998)	Entropy 0.62822 (0.62866)	Top-1 acc 60.156 (58.884)	Top-5 acc 83.594 (80.526)	lr 0.01440
Train [55][540/3239]	Time 0.245 (0.525)	Data Time 0.001 (0.071)	Loss 2.8080 (2.7002)	Entropy 0.62822 (0.62865)	Top-1 acc 56.250 (58.865)	Top-5 acc 76.562 (80.524)	lr 0.01440
Train [55][550/3239]	Time 0.336 (0.585)	Data Time 0.004 (0.069)	Loss 2.7310 (2.7006)	Entropy 0.62833 (0.62864)	Top-1 acc 55.859 (58.844)	Top-5 acc 79.297 (80.515)	lr 0.01440
Train [55][560/3239]	Time 0.255 (0.583)	Data Time 0.002 (0.068)	Loss 2.6177 (2.7008)	Entropy 0.62813 (0.62864)	Top-1 acc 62.891 (58.835)	Top-5 acc 80.859 (80.515)	lr 0.01440
Train [55][570/3239]	Time 0.324 (0.581)	Data Time 0.001 (0.067)	Loss 2.8195 (2.7005)	Entropy 0.62825 (0.62863)	Top-1 acc 53.906 (58.848)	Top-5 acc 78.516 (80.505)	lr 0.01440
Train [55][580/3239]	Time 0.259 (0.578)	Data Time 0.002 (0.066)	Loss 2.7326 (2.7000)	Entropy 0.62803 (0.62862)	Top-1 acc 55.859 (58.861)	Top-5 acc 79.688 (80.514)	lr 0.01440
Train [55][590/3239]	Time 0.243 (0.576)	Data Time 0.002 (0.065)	Loss 2.7349 (2.7005)	Entropy 0.62758 (0.62861)	Top-1 acc 59.766 (58.853)	Top-5 acc 79.688 (80.503)	lr 0.01440
Train [55][600/3239]	Time 0.249 (0.574)	Data Time 0.001 (0.064)	Loss 2.7315 (2.7013)	Entropy 0.62763 (0.62859)	Top-1 acc 53.125 (58.831)	Top-5 acc 80.859 (80.491)	lr 0.01440
Train [55][610/3239]	Time 0.256 (0.572)	Data Time 0.002 (0.063)	Loss 2.7355 (2.7000)	Entropy 0.62790 (0.62857)	Top-1 acc 59.375 (58.867)	Top-5 acc 81.641 (80.524)	lr 0.01439
Train [55][620/3239]	Time 0.249 (0.570)	Data Time 0.001 (0.062)	Loss 2.7392 (2.7003)	Entropy 0.62762 (0.62856)	Top-1 acc 59.375 (58.859)	Top-5 acc 76.953 (80.526)	lr 0.01439
Train [55][630/3239]	Time 0.252 (0.569)	Data Time 0.001 (0.061)	Loss 2.8246 (2.7013)	Entropy 0.62790 (0.62855)	Top-1 acc 58.203 (58.840)	Top-5 acc 80.859 (80.505)	lr 0.01439
Train [55][640/3239]	Time 0.377 (0.567)	Data Time 0.001 (0.060)	Loss 2.7566 (2.7006)	Entropy 0.62719 (0.62853)	Top-1 acc 57.812 (58.871)	Top-5 acc 80.859 (80.520)	lr 0.01439
Train [55][650/3239]	Time 0.256 (0.565)	Data Time 0.001 (0.059)	Loss 2.9887 (2.7019)	Entropy 0.62704 (0.62851)	Top-1 acc 52.344 (58.832)	Top-5 acc 74.609 (80.508)	lr 0.01439
Train [55][660/3239]	Time 0.239 (0.564)	Data Time 0.001 (0.058)	Loss 2.8603 (2.7027)	Entropy 0.62723 (0.62849)	Top-1 acc 58.594 (58.805)	Top-5 acc 75.391 (80.492)	lr 0.01439
Train [55][670/3239]	Time 0.265 (0.562)	Data Time 0.001 (0.057)	Loss 2.5653 (2.7030)	Entropy 0.62752 (0.62847)	Top-1 acc 63.281 (58.804)	Top-5 acc 80.078 (80.490)	lr 0.01439
Train [55][680/3239]	Time 0.237 (0.560)	Data Time 0.001 (0.056)	Loss 2.6388 (2.7037)	Entropy 0.62723 (0.62845)	Top-1 acc 60.938 (58.787)	Top-5 acc 80.859 (80.466)	lr 0.01439
Train [55][690/3239]	Time 0.232 (0.559)	Data Time 0.001 (0.056)	Loss 2.7613 (2.7042)	Entropy 0.62758 (0.62844)	Top-1 acc 55.469 (58.767)	Top-5 acc 81.641 (80.457)	lr 0.01439
Train [55][700/3239]	Time 0.243 (0.557)	Data Time 0.001 (0.055)	Loss 2.9535 (2.7043)	Entropy 0.62754 (0.62843)	Top-1 acc 56.641 (58.793)	Top-5 acc 76.172 (80.457)	lr 0.01439
Train [55][710/3239]	Time 0.263 (0.556)	Data Time 0.001 (0.054)	Loss 2.5469 (2.7044)	Entropy 0.62765 (0.62841)	Top-1 acc 63.281 (58.794)	Top-5 acc 83.203 (80.453)	lr 0.01438
Train [55][720/3239]	Time 0.377 (0.555)	Data Time 0.054 (0.054)	Loss 2.5297 (2.7039)	Entropy 0.62773 (0.62840)	Top-1 acc 63.281 (58.803)	Top-5 acc 86.328 (80.467)	lr 0.01438
Train [55][730/3239]	Time 0.354 (0.554)	Data Time 0.001 (0.053)	Loss 2.8753 (2.7046)	Entropy 0.62822 (0.62840)	Top-1 acc 54.688 (58.783)	Top-5 acc 77.734 (80.450)	lr 0.01438
Train [55][740/3239]	Time 0.237 (0.553)	Data Time 0.001 (0.052)	Loss 2.7298 (2.7057)	Entropy 0.62845 (0.62840)	Top-1 acc 58.203 (58.754)	Top-5 acc 80.469 (80.426)	lr 0.01438
Train [55][750/3239]	Time 0.241 (0.551)	Data Time 0.001 (0.051)	Loss 2.6591 (2.7046)	Entropy 0.62813 (0.62839)	Top-1 acc 58.203 (58.783)	Top-5 acc 82.031 (80.452)	lr 0.01438
Train [55][760/3239]	Time 0.251 (0.550)	Data Time 0.001 (0.051)	Loss 2.4584 (2.7039)	Entropy 0.62820 (0.62839)	Top-1 acc 64.062 (58.793)	Top-5 acc 84.375 (80.468)	lr 0.01438
Train [55][770/3239]	Time 0.246 (0.552)	Data Time 0.001 (0.053)	Loss 2.4150 (2.7033)	Entropy 0.62836 (0.62839)	Top-1 acc 67.188 (58.817)	Top-5 acc 84.766 (80.473)	lr 0.01438
Train [55][780/3239]	Time 0.268 (0.550)	Data Time 0.001 (0.052)	Loss 2.7072 (2.7023)	Entropy 0.62794 (0.62839)	Top-1 acc 58.594 (58.849)	Top-5 acc 78.125 (80.491)	lr 0.01438
Train [55][790/3239]	Time 0.226 (0.549)	Data Time 0.001 (0.052)	Loss 2.6267 (2.7031)	Entropy 0.62764 (0.62838)	Top-1 acc 60.938 (58.827)	Top-5 acc 82.812 (80.479)	lr 0.01438
Train [55][800/3239]	Time 0.351 (0.554)	Data Time 0.001 (0.058)	Loss 2.8755 (2.7027)	Entropy 0.62793 (0.62837)	Top-1 acc 54.297 (58.831)	Top-5 acc 78.906 (80.493)	lr 0.01438
Train [55][810/3239]	Time 0.245 (0.553)	Data Time 0.001 (0.057)	Loss 2.6738 (2.7023)	Entropy 0.62792 (0.62837)	Top-1 acc 58.203 (58.839)	Top-5 acc 79.688 (80.502)	lr 0.01437
Train [55][820/3239]	Time 0.254 (0.552)	Data Time 0.001 (0.056)	Loss 2.6722 (2.7025)	Entropy 0.62805 (0.62836)	Top-1 acc 58.203 (58.827)	Top-5 acc 80.859 (80.502)	lr 0.01437
Train [55][830/3239]	Time 0.296 (0.552)	Data Time 0.001 (0.056)	Loss 2.6580 (2.7032)	Entropy 0.62792 (0.62836)	Top-1 acc 57.031 (58.802)	Top-5 acc 83.984 (80.491)	lr 0.01437
Train [55][840/3239]	Time 0.261 (0.556)	Data Time 0.001 (0.062)	Loss 2.9834 (2.7036)	Entropy 0.62827 (0.62835)	Top-1 acc 52.344 (58.783)	Top-5 acc 76.562 (80.484)	lr 0.01437
Train [55][850/3239]	Time 0.281 (0.556)	Data Time 0.001 (0.061)	Loss 2.9663 (2.7034)	Entropy 0.62809 (0.62835)	Top-1 acc 50.391 (58.780)	Top-5 acc 79.297 (80.487)	lr 0.01437
Train [55][860/3239]	Time 0.247 (0.554)	Data Time 0.001 (0.060)	Loss 2.8498 (2.7031)	Entropy 0.62805 (0.62835)	Top-1 acc 53.516 (58.768)	Top-5 acc 76.953 (80.499)	lr 0.01437
Train [55][870/3239]	Time 0.235 (0.561)	Data Time 0.001 (0.068)	Loss 2.8594 (2.7028)	Entropy 0.62804 (0.62835)	Top-1 acc 56.250 (58.766)	Top-5 acc 77.344 (80.520)	lr 0.01437
Train [55][880/3239]	Time 0.248 (0.560)	Data Time 0.001 (0.067)	Loss 2.6549 (2.7019)	Entropy 0.62789 (0.62834)	Top-1 acc 60.547 (58.790)	Top-5 acc 79.688 (80.536)	lr 0.01437
Train [55][890/3239]	Time 0.248 (0.559)	Data Time 0.001 (0.066)	Loss 2.9064 (2.7022)	Entropy 0.62785 (0.62834)	Top-1 acc 50.781 (58.785)	Top-5 acc 75.391 (80.527)	lr 0.01437
Train [55][900/3239]	Time 0.247 (0.561)	Data Time 0.001 (0.069)	Loss 2.6484 (2.7017)	Entropy 0.62822 (0.62833)	Top-1 acc 61.719 (58.792)	Top-5 acc 81.250 (80.538)	lr 0.01437
Train [55][910/3239]	Time 0.231 (0.560)	Data Time 0.001 (0.069)	Loss 2.7275 (2.7023)	Entropy 0.62833 (0.62833)	Top-1 acc 60.938 (58.790)	Top-5 acc 80.469 (80.524)	lr 0.01436
Train [55][920/3239]	Time 0.227 (0.559)	Data Time 0.001 (0.068)	Loss 2.5940 (2.7025)	Entropy 0.62873 (0.62834)	Top-1 acc 64.062 (58.794)	Top-5 acc 80.859 (80.520)	lr 0.01436
Train [55][930/3239]	Time 0.255 (0.561)	Data Time 0.001 (0.071)	Loss 2.6848 (2.7016)	Entropy 0.62877 (0.62834)	Top-1 acc 57.812 (58.824)	Top-5 acc 82.422 (80.536)	lr 0.01436
Train [55][940/3239]	Time 0.344 (0.564)	Data Time 0.001 (0.075)	Loss 2.6376 (2.7013)	Entropy 0.62891 (0.62834)	Top-1 acc 60.156 (58.828)	Top-5 acc 80.859 (80.543)	lr 0.01436
Train [55][950/3239]	Time 0.230 (0.563)	Data Time 0.001 (0.074)	Loss 2.5756 (2.7009)	Entropy 0.62875 (0.62835)	Top-1 acc 62.891 (58.835)	Top-5 acc 81.641 (80.544)	lr 0.01436
Train [55][960/3239]	Time 0.329 (0.563)	Data Time 0.001 (0.074)	Loss 2.9052 (2.7010)	Entropy 0.62872 (0.62835)	Top-1 acc 56.641 (58.838)	Top-5 acc 76.953 (80.537)	lr 0.01436
Train [55][970/3239]	Time 0.260 (0.567)	Data Time 0.001 (0.079)	Loss 2.7699 (2.7018)	Entropy 0.62881 (0.62836)	Top-1 acc 55.859 (58.821)	Top-5 acc 78.906 (80.515)	lr 0.01436
Train [55][980/3239]	Time 0.257 (0.566)	Data Time 0.001 (0.079)	Loss 2.5697 (2.7009)	Entropy 0.62904 (0.62836)	Top-1 acc 61.719 (58.845)	Top-5 acc 83.203 (80.532)	lr 0.01436
Train [55][990/3239]	Time 0.297 (0.565)	Data Time 0.001 (0.078)	Loss 2.9250 (2.7010)	Entropy 0.62883 (0.62837)	Top-1 acc 53.906 (58.829)	Top-5 acc 76.172 (80.527)	lr 0.01436
Train [55][1000/3239]	Time 5.096 (0.568)	Data Time 4.863 (0.082)	Loss 2.7191 (2.7007)	Entropy 0.62896 (0.62837)	Top-1 acc 55.859 (58.832)	Top-5 acc 80.078 (80.534)	lr 0.01436
Train [55][1010/3239]	Time 0.277 (0.567)	Data Time 0.001 (0.081)	Loss 2.6523 (2.7007)	Entropy 0.62886 (0.62838)	Top-1 acc 62.109 (58.834)	Top-5 acc 80.078 (80.533)	lr 0.01435
Train [55][1020/3239]	Time 0.243 (0.566)	Data Time 0.001 (0.080)	Loss 2.7769 (2.7007)	Entropy 0.62872 (0.62838)	Top-1 acc 54.297 (58.831)	Top-5 acc 79.688 (80.528)	lr 0.01435
Train [55][1030/3239]	Time 0.318 (0.565)	Data Time 0.001 (0.081)	Loss 2.7304 (2.7004)	Entropy 0.62877 (0.62838)	Top-1 acc 59.375 (58.838)	Top-5 acc 80.859 (80.536)	lr 0.01435
Train [55][1040/3239]	Time 0.245 (0.568)	Data Time 0.001 (0.084)	Loss 2.9625 (2.7011)	Entropy 0.62914 (0.62839)	Top-1 acc 51.172 (58.818)	Top-5 acc 78.516 (80.525)	lr 0.01435
Train [55][1050/3239]	Time 0.235 (0.567)	Data Time 0.001 (0.084)	Loss 2.7851 (2.7018)	Entropy 0.62899 (0.62840)	Top-1 acc 57.422 (58.805)	Top-5 acc 79.297 (80.512)	lr 0.01435
Train [55][1060/3239]	Time 0.240 (0.569)	Data Time 0.001 (0.085)	Loss 2.7520 (2.7020)	Entropy 0.62931 (0.62840)	Top-1 acc 58.594 (58.792)	Top-5 acc 80.859 (80.505)	lr 0.01435
Train [55][1070/3239]	Time 0.251 (0.571)	Data Time 0.001 (0.088)	Loss 2.6089 (2.7021)	Entropy 0.62933 (0.62841)	Top-1 acc 61.328 (58.790)	Top-5 acc 80.859 (80.503)	lr 0.01435
Train [55][1080/3239]	Time 0.233 (0.570)	Data Time 0.001 (0.088)	Loss 2.8872 (2.7022)	Entropy 0.62942 (0.62842)	Top-1 acc 55.859 (58.784)	Top-5 acc 73.438 (80.505)	lr 0.01435
Train [55][1090/3239]	Time 0.246 (0.572)	Data Time 0.002 (0.091)	Loss 2.6737 (2.7022)	Entropy 0.62955 (0.62843)	Top-1 acc 59.766 (58.787)	Top-5 acc 82.812 (80.510)	lr 0.01435
Train [55][1100/3239]	Time 0.243 (0.576)	Data Time 0.001 (0.095)	Loss 2.7332 (2.7024)	Entropy 0.62985 (0.62844)	Top-1 acc 56.641 (58.786)	Top-5 acc 79.297 (80.506)	lr 0.01435
Train [55][1110/3239]	Time 0.219 (0.575)	Data Time 0.001 (0.094)	Loss 2.4623 (2.7025)	Entropy 0.62979 (0.62845)	Top-1 acc 64.453 (58.787)	Top-5 acc 85.547 (80.506)	lr 0.01434
Train [55][1120/3239]	Time 0.364 (0.574)	Data Time 0.001 (0.094)	Loss 2.6211 (2.7020)	Entropy 0.62955 (0.62846)	Top-1 acc 60.156 (58.801)	Top-5 acc 81.250 (80.515)	lr 0.01434
Train [55][1130/3239]	Time 0.226 (0.580)	Data Time 0.001 (0.101)	Loss 3.0478 (2.7026)	Entropy 0.63001 (0.62847)	Top-1 acc 50.391 (58.794)	Top-5 acc 76.172 (80.505)	lr 0.01434
Train [55][1140/3239]	Time 0.277 (0.579)	Data Time 0.001 (0.100)	Loss 2.6074 (2.7018)	Entropy 0.63002 (0.62849)	Top-1 acc 59.375 (58.807)	Top-5 acc 80.078 (80.513)	lr 0.01434
Train [55][1150/3239]	Time 0.253 (0.578)	Data Time 0.001 (0.099)	Loss 2.6434 (2.7018)	Entropy 0.63022 (0.62850)	Top-1 acc 61.719 (58.814)	Top-5 acc 81.250 (80.510)	lr 0.01434
Train [55][1160/3239]	Time 7.538 (0.583)	Data Time 7.291 (0.104)	Loss 2.8007 (2.7016)	Entropy 0.63044 (0.62852)	Top-1 acc 58.984 (58.828)	Top-5 acc 77.734 (80.510)	lr 0.01434
Train [55][1170/3239]	Time 0.237 (0.582)	Data Time 0.001 (0.103)	Loss 2.7734 (2.7016)	Entropy 0.63037 (0.62853)	Top-1 acc 58.203 (58.822)	Top-5 acc 78.516 (80.510)	lr 0.01434
Train [55][1180/3239]	Time 0.294 (0.581)	Data Time 0.001 (0.103)	Loss 2.4943 (2.7014)	Entropy 0.62996 (0.62855)	Top-1 acc 65.234 (58.828)	Top-5 acc 83.594 (80.515)	lr 0.01434
Train [55][1190/3239]	Time 0.398 (0.580)	Data Time 0.001 (0.102)	Loss 2.8485 (2.7018)	Entropy 0.62994 (0.62856)	Top-1 acc 57.812 (58.824)	Top-5 acc 78.125 (80.509)	lr 0.01434
Train [55][1200/3239]	Time 0.239 (0.582)	Data Time 0.001 (0.104)	Loss 2.5607 (2.7015)	Entropy 0.62995 (0.62857)	Top-1 acc 65.234 (58.835)	Top-5 acc 82.031 (80.519)	lr 0.01434
Train [55][1210/3239]	Time 0.236 (0.613)	Data Time 0.002 (0.103)	Loss 2.6768 (2.7014)	Entropy 0.63038 (0.62858)	Top-1 acc 59.375 (58.836)	Top-5 acc 80.859 (80.520)	lr 0.01433
Train [55][1220/3239]	Time 0.239 (0.612)	Data Time 0.002 (0.102)	Loss 2.7287 (2.7016)	Entropy 0.63057 (0.62860)	Top-1 acc 57.031 (58.836)	Top-5 acc 81.641 (80.515)	lr 0.01433
Train [55][1230/3239]	Time 0.248 (0.610)	Data Time 0.002 (0.101)	Loss 2.4770 (2.7011)	Entropy 0.63068 (0.62862)	Top-1 acc 67.969 (58.845)	Top-5 acc 85.156 (80.524)	lr 0.01433
Train [55][1240/3239]	Time 0.247 (0.609)	Data Time 0.001 (0.101)	Loss 2.4785 (2.7010)	Entropy 0.63001 (0.62863)	Top-1 acc 61.328 (58.846)	Top-5 acc 84.375 (80.527)	lr 0.01433
Train [55][1250/3239]	Time 0.245 (0.607)	Data Time 0.002 (0.100)	Loss 2.5554 (2.7004)	Entropy 0.63011 (0.62864)	Top-1 acc 61.719 (58.854)	Top-5 acc 83.984 (80.537)	lr 0.01433
Train [55][1260/3239]	Time 0.265 (0.606)	Data Time 0.002 (0.099)	Loss 2.5607 (2.7003)	Entropy 0.62968 (0.62865)	Top-1 acc 61.328 (58.850)	Top-5 acc 82.422 (80.544)	lr 0.01433
Train [55][1270/3239]	Time 0.298 (0.605)	Data Time 0.001 (0.098)	Loss 2.6575 (2.6999)	Entropy 0.62989 (0.62866)	Top-1 acc 57.812 (58.864)	Top-5 acc 82.812 (80.553)	lr 0.01433
Train [55][1280/3239]	Time 0.416 (0.604)	Data Time 0.001 (0.098)	Loss 2.7579 (2.7002)	Entropy 0.62958 (0.62867)	Top-1 acc 62.109 (58.863)	Top-5 acc 77.344 (80.544)	lr 0.01433
Train [55][1290/3239]	Time 0.233 (0.603)	Data Time 0.001 (0.097)	Loss 2.4618 (2.7003)	Entropy 0.62970 (0.62868)	Top-1 acc 62.891 (58.861)	Top-5 acc 83.203 (80.537)	lr 0.01433
Train [55][1300/3239]	Time 0.250 (0.601)	Data Time 0.002 (0.096)	Loss 2.8369 (2.7002)	Entropy 0.62946 (0.62868)	Top-1 acc 55.859 (58.863)	Top-5 acc 77.344 (80.532)	lr 0.01433
Train [55][1310/3239]	Time 0.271 (0.602)	Data Time 0.001 (0.097)	Loss 2.6178 (2.6998)	Entropy 0.62970 (0.62869)	Top-1 acc 63.281 (58.871)	Top-5 acc 80.859 (80.531)	lr 0.01432
Train [55][1320/3239]	Time 0.228 (0.601)	Data Time 0.001 (0.098)	Loss 2.9453 (2.7001)	Entropy 0.62975 (0.62870)	Top-1 acc 53.906 (58.872)	Top-5 acc 75.781 (80.525)	lr 0.01432
Train [55][1330/3239]	Time 0.286 (0.601)	Data Time 0.001 (0.097)	Loss 2.6702 (2.7004)	Entropy 0.62952 (0.62871)	Top-1 acc 59.375 (58.866)	Top-5 acc 80.078 (80.515)	lr 0.01432
Train [55][1340/3239]	Time 0.296 (0.605)	Data Time 0.001 (0.102)	Loss 2.6274 (2.7005)	Entropy 0.62965 (0.62871)	Top-1 acc 59.375 (58.859)	Top-5 acc 81.641 (80.521)	lr 0.01432
Train [55][1350/3239]	Time 2.108 (0.606)	Data Time 1.740 (0.103)	Loss 2.6742 (2.7007)	Entropy 0.62942 (0.62872)	Top-1 acc 58.984 (58.853)	Top-5 acc 81.641 (80.521)	lr 0.01432
Train [55][1360/3239]	Time 0.264 (0.606)	Data Time 0.002 (0.104)	Loss 2.9565 (2.7006)	Entropy 0.62968 (0.62872)	Top-1 acc 53.906 (58.854)	Top-5 acc 76.953 (80.518)	lr 0.01432
Train [55][1370/3239]	Time 0.280 (0.608)	Data Time 0.001 (0.107)	Loss 2.6210 (2.7009)	Entropy 0.62967 (0.62873)	Top-1 acc 63.281 (58.847)	Top-5 acc 82.031 (80.519)	lr 0.01432
Train [55][1380/3239]	Time 0.285 (0.607)	Data Time 0.002 (0.106)	Loss 2.6732 (2.7006)	Entropy 0.62941 (0.62874)	Top-1 acc 55.859 (58.846)	Top-5 acc 79.297 (80.520)	lr 0.01432
Train [55][1390/3239]	Time 0.248 (0.609)	Data Time 0.001 (0.109)	Loss 2.6865 (2.7008)	Entropy 0.62937 (0.62874)	Top-1 acc 60.938 (58.838)	Top-5 acc 82.422 (80.514)	lr 0.01432
Train [55][1400/3239]	Time 0.249 (0.610)	Data Time 0.001 (0.110)	Loss 2.7870 (2.7007)	Entropy 0.62977 (0.62874)	Top-1 acc 54.297 (58.840)	Top-5 acc 77.734 (80.517)	lr 0.01432
Train [55][1410/3239]	Time 0.274 (0.609)	Data Time 0.001 (0.110)	Loss 2.7149 (2.7009)	Entropy 0.62981 (0.62875)	Top-1 acc 59.766 (58.837)	Top-5 acc 81.250 (80.510)	lr 0.01431
Train [55][1420/3239]	Time 0.242 (0.612)	Data Time 0.001 (0.113)	Loss 2.7005 (2.7003)	Entropy 0.62966 (0.62876)	Top-1 acc 57.422 (58.847)	Top-5 acc 83.203 (80.521)	lr 0.01431
Train [55][1430/3239]	Time 1.884 (0.612)	Data Time 1.622 (0.114)	Loss 2.7293 (2.7002)	Entropy 0.62957 (0.62877)	Top-1 acc 57.031 (58.848)	Top-5 acc 78.906 (80.527)	lr 0.01431
Train [55][1440/3239]	Time 0.295 (0.611)	Data Time 0.001 (0.113)	Loss 2.6688 (2.7003)	Entropy 0.62973 (0.62877)	Top-1 acc 59.766 (58.849)	Top-5 acc 80.859 (80.519)	lr 0.01431
Train [55][1450/3239]	Time 0.233 (0.615)	Data Time 0.001 (0.118)	Loss 2.7538 (2.7008)	Entropy 0.62963 (0.62878)	Top-1 acc 55.859 (58.840)	Top-5 acc 78.906 (80.507)	lr 0.01431
Train [55][1460/3239]	Time 0.237 (0.614)	Data Time 0.001 (0.117)	Loss 2.7212 (2.7007)	Entropy 0.62954 (0.62878)	Top-1 acc 55.859 (58.847)	Top-5 acc 78.125 (80.505)	lr 0.01431
Train [55][1470/3239]	Time 0.254 (0.613)	Data Time 0.002 (0.116)	Loss 2.7319 (2.7010)	Entropy 0.62949 (0.62879)	Top-1 acc 59.375 (58.835)	Top-5 acc 80.859 (80.499)	lr 0.01431
Train [55][1480/3239]	Time 0.239 (0.618)	Data Time 0.001 (0.121)	Loss 2.6353 (2.7012)	Entropy 0.62929 (0.62879)	Top-1 acc 62.500 (58.831)	Top-5 acc 80.859 (80.498)	lr 0.01431
Train [55][1490/3239]	Time 0.271 (0.616)	Data Time 0.001 (0.121)	Loss 2.5996 (2.7014)	Entropy 0.62961 (0.62880)	Top-1 acc 61.328 (58.822)	Top-5 acc 82.031 (80.490)	lr 0.01431
Train [55][1500/3239]	Time 0.256 (0.616)	Data Time 0.001 (0.121)	Loss 2.8213 (2.7018)	Entropy 0.62961 (0.62880)	Top-1 acc 52.734 (58.811)	Top-5 acc 80.469 (80.487)	lr 0.01431
Train [55][1510/3239]	Time 5.773 (0.621)	Data Time 5.406 (0.126)	Loss 2.4306 (2.7014)	Entropy 0.62978 (0.62881)	Top-1 acc 65.625 (58.824)	Top-5 acc 84.766 (80.497)	lr 0.01430
Train [55][1520/3239]	Time 0.223 (0.619)	Data Time 0.001 (0.125)	Loss 2.5185 (2.7012)	Entropy 0.63028 (0.62882)	Top-1 acc 60.547 (58.827)	Top-5 acc 83.594 (80.501)	lr 0.01430
Train [55][1530/3239]	Time 2.276 (0.620)	Data Time 2.034 (0.127)	Loss 2.6720 (2.7013)	Entropy 0.63001 (0.62883)	Top-1 acc 58.594 (58.829)	Top-5 acc 79.688 (80.498)	lr 0.01430
Train [55][1540/3239]	Time 0.237 (0.619)	Data Time 0.001 (0.126)	Loss 2.5422 (2.7019)	Entropy 0.62999 (0.62883)	Top-1 acc 65.625 (58.814)	Top-5 acc 82.422 (80.485)	lr 0.01430
Train [55][1550/3239]	Time 0.227 (0.624)	Data Time 0.001 (0.131)	Loss 2.6354 (2.7020)	Entropy 0.62995 (0.62884)	Top-1 acc 60.547 (58.820)	Top-5 acc 80.469 (80.480)	lr 0.01430
Train [55][1560/3239]	Time 0.235 (0.623)	Data Time 0.001 (0.130)	Loss 2.7064 (2.7018)	Entropy 0.63037 (0.62885)	Top-1 acc 59.375 (58.814)	Top-5 acc 80.078 (80.485)	lr 0.01430
Train [55][1570/3239]	Time 0.265 (0.624)	Data Time 0.001 (0.132)	Loss 2.7561 (2.7020)	Entropy 0.63070 (0.62886)	Top-1 acc 57.812 (58.814)	Top-5 acc 80.078 (80.485)	lr 0.01430
Train [55][1580/3239]	Time 0.320 (0.627)	Data Time 0.001 (0.135)	Loss 2.4015 (2.7020)	Entropy 0.63021 (0.62887)	Top-1 acc 67.578 (58.816)	Top-5 acc 87.500 (80.487)	lr 0.01430
Train [55][1590/3239]	Time 0.232 (0.625)	Data Time 0.001 (0.134)	Loss 2.5261 (2.7016)	Entropy 0.63034 (0.62888)	Top-1 acc 63.281 (58.827)	Top-5 acc 83.203 (80.495)	lr 0.01430
Train [55][1600/3239]	Time 0.239 (0.626)	Data Time 0.001 (0.136)	Loss 2.8176 (2.7017)	Entropy 0.63067 (0.62889)	Top-1 acc 56.250 (58.825)	Top-5 acc 76.172 (80.490)	lr 0.01430
Train [55][1610/3239]	Time 0.263 (0.631)	Data Time 0.001 (0.141)	Loss 2.7916 (2.7016)	Entropy 0.63051 (0.62890)	Top-1 acc 57.422 (58.825)	Top-5 acc 75.391 (80.494)	lr 0.01429
Train [55][1620/3239]	Time 0.226 (0.630)	Data Time 0.001 (0.140)	Loss 2.7364 (2.7016)	Entropy 0.63058 (0.62891)	Top-1 acc 57.422 (58.828)	Top-5 acc 80.469 (80.490)	lr 0.01429
Train [55][1630/3239]	Time 0.233 (0.631)	Data Time 0.001 (0.142)	Loss 2.7204 (2.7019)	Entropy 0.63036 (0.62892)	Top-1 acc 57.422 (58.823)	Top-5 acc 81.641 (80.486)	lr 0.01429
Train [55][1640/3239]	Time 0.243 (0.636)	Data Time 0.001 (0.148)	Loss 2.8326 (2.7021)	Entropy 0.63048 (0.62893)	Top-1 acc 54.688 (58.817)	Top-5 acc 80.078 (80.484)	lr 0.01429
Train [55][1650/3239]	Time 0.274 (0.636)	Data Time 0.002 (0.147)	Loss 2.7170 (2.7017)	Entropy 0.63073 (0.62894)	Top-1 acc 57.031 (58.819)	Top-5 acc 80.078 (80.490)	lr 0.01429
Train [55][1660/3239]	Time 0.246 (0.638)	Data Time 0.001 (0.149)	Loss 2.6290 (2.7016)	Entropy 0.63068 (0.62895)	Top-1 acc 63.281 (58.823)	Top-5 acc 80.469 (80.489)	lr 0.01429
Train [55][1670/3239]	Time 0.317 (0.640)	Data Time 0.001 (0.152)	Loss 2.8738 (2.7015)	Entropy 0.63086 (0.62896)	Top-1 acc 57.422 (58.826)	Top-5 acc 78.906 (80.490)	lr 0.01429
Train [55][1680/3239]	Time 0.234 (0.641)	Data Time 0.001 (0.154)	Loss 2.6842 (2.7016)	Entropy 0.63109 (0.62897)	Top-1 acc 63.281 (58.826)	Top-5 acc 81.641 (80.486)	lr 0.01429
Train [55][1690/3239]	Time 0.237 (0.640)	Data Time 0.002 (0.153)	Loss 2.7027 (2.7014)	Entropy 0.63100 (0.62899)	Top-1 acc 57.812 (58.827)	Top-5 acc 76.953 (80.487)	lr 0.01429
Train [55][1700/3239]	Time 0.230 (0.642)	Data Time 0.001 (0.156)	Loss 2.5530 (2.7009)	Entropy 0.63126 (0.62900)	Top-1 acc 64.453 (58.839)	Top-5 acc 83.594 (80.497)	lr 0.01429
Train [55][1710/3239]	Time 7.806 (0.648)	Data Time 7.551 (0.162)	Loss 2.6800 (2.7007)	Entropy 0.63125 (0.62901)	Top-1 acc 58.594 (58.841)	Top-5 acc 80.078 (80.500)	lr 0.01428
Train [55][1720/3239]	Time 0.254 (0.647)	Data Time 0.001 (0.161)	Loss 2.7844 (2.7008)	Entropy 0.63170 (0.62903)	Top-1 acc 56.641 (58.833)	Top-5 acc 79.688 (80.501)	lr 0.01428
Train [55][1730/3239]	Time 0.232 (0.649)	Data Time 0.001 (0.163)	Loss 2.8099 (2.7010)	Entropy 0.63169 (0.62904)	Top-1 acc 58.984 (58.829)	Top-5 acc 76.562 (80.499)	lr 0.01428
Train [55][1740/3239]	Time 0.330 (0.651)	Data Time 0.001 (0.166)	Loss 2.5242 (2.7012)	Entropy 0.63162 (0.62906)	Top-1 acc 57.031 (58.819)	Top-5 acc 85.547 (80.493)	lr 0.01428
Train [55][1750/3239]	Time 0.226 (0.651)	Data Time 0.001 (0.166)	Loss 2.6586 (2.7016)	Entropy 0.63182 (0.62907)	Top-1 acc 58.203 (58.807)	Top-5 acc 80.078 (80.482)	lr 0.01428
Train [55][1760/3239]	Time 0.258 (0.650)	Data Time 0.001 (0.165)	Loss 2.9433 (2.7019)	Entropy 0.63156 (0.62909)	Top-1 acc 56.641 (58.801)	Top-5 acc 77.344 (80.477)	lr 0.01428
Train [55][1770/3239]	Time 0.235 (0.655)	Data Time 0.001 (0.171)	Loss 2.9450 (2.7021)	Entropy 0.63150 (0.62910)	Top-1 acc 51.562 (58.801)	Top-5 acc 79.297 (80.476)	lr 0.01428
Train [55][1780/3239]	Time 0.248 (0.657)	Data Time 0.001 (0.173)	Loss 2.7385 (2.7027)	Entropy 0.63123 (0.62911)	Top-1 acc 56.641 (58.789)	Top-5 acc 81.250 (80.464)	lr 0.01428
Train [55][1790/3239]	Time 0.241 (0.656)	Data Time 0.001 (0.173)	Loss 2.5946 (2.7033)	Entropy 0.63071 (0.62912)	Top-1 acc 63.281 (58.779)	Top-5 acc 84.375 (80.453)	lr 0.01428
Train [55][1800/3239]	Time 0.247 (0.661)	Data Time 0.001 (0.179)	Loss 2.5301 (2.7030)	Entropy 0.63102 (0.62913)	Top-1 acc 65.234 (58.787)	Top-5 acc 84.766 (80.463)	lr 0.01428
Train [55][1810/3239]	Time 0.297 (0.664)	Data Time 0.001 (0.181)	Loss 2.6900 (2.7031)	Entropy 0.63115 (0.62914)	Top-1 acc 58.984 (58.782)	Top-5 acc 80.469 (80.462)	lr 0.01427
Train [55][1820/3239]	Time 0.233 (0.663)	Data Time 0.001 (0.181)	Loss 2.9088 (2.7034)	Entropy 0.63117 (0.62915)	Top-1 acc 53.516 (58.771)	Top-5 acc 76.562 (80.455)	lr 0.01427
Train [55][1830/3239]	Time 3.351 (0.667)	Data Time 2.979 (0.185)	Loss 2.5200 (2.7032)	Entropy 0.63091 (0.62916)	Top-1 acc 64.844 (58.776)	Top-5 acc 83.203 (80.461)	lr 0.01427
Train [55][1840/3239]	Time 0.257 (0.669)	Data Time 0.001 (0.188)	Loss 2.7245 (2.7033)	Entropy 0.63086 (0.62917)	Top-1 acc 58.203 (58.770)	Top-5 acc 81.641 (80.459)	lr 0.01427
Train [55][1850/3239]	Time 0.248 (0.668)	Data Time 0.001 (0.187)	Loss 2.6318 (2.7035)	Entropy 0.63019 (0.62918)	Top-1 acc 62.500 (58.761)	Top-5 acc 82.031 (80.458)	lr 0.01427
Train [55][1860/3239]	Time 0.438 (0.692)	Data Time 0.005 (0.193)	Loss 2.5068 (2.7036)	Entropy 0.63036 (0.62919)	Top-1 acc 63.672 (58.757)	Top-5 acc 83.203 (80.459)	lr 0.01427
Train [55][1870/3239]	Time 0.230 (0.691)	Data Time 0.002 (0.192)	Loss 2.7324 (2.7039)	Entropy 0.63028 (0.62919)	Top-1 acc 56.250 (58.752)	Top-5 acc 81.641 (80.453)	lr 0.01427
Train [55][1880/3239]	Time 0.249 (0.690)	Data Time 0.002 (0.191)	Loss 2.7010 (2.7038)	Entropy 0.63017 (0.62920)	Top-1 acc 60.938 (58.757)	Top-5 acc 82.422 (80.456)	lr 0.01427
Train [55][1890/3239]	Time 0.238 (0.688)	Data Time 0.001 (0.190)	Loss 2.7078 (2.7036)	Entropy 0.63029 (0.62920)	Top-1 acc 57.031 (58.762)	Top-5 acc 78.516 (80.457)	lr 0.01427
Train [55][1900/3239]	Time 0.342 (0.687)	Data Time 0.001 (0.189)	Loss 2.6321 (2.7037)	Entropy 0.63025 (0.62921)	Top-1 acc 58.594 (58.762)	Top-5 acc 80.859 (80.452)	lr 0.01427
Train [55][1910/3239]	Time 0.241 (0.685)	Data Time 0.001 (0.188)	Loss 2.4245 (2.7037)	Entropy 0.63017 (0.62921)	Top-1 acc 65.234 (58.758)	Top-5 acc 85.547 (80.450)	lr 0.01426
Train [55][1920/3239]	Time 0.248 (0.684)	Data Time 0.001 (0.187)	Loss 2.5372 (2.7040)	Entropy 0.62987 (0.62922)	Top-1 acc 61.328 (58.746)	Top-5 acc 83.984 (80.447)	lr 0.01426
Train [55][1930/3239]	Time 0.255 (0.688)	Data Time 0.001 (0.191)	Loss 2.6370 (2.7037)	Entropy 0.63006 (0.62922)	Top-1 acc 62.500 (58.753)	Top-5 acc 81.250 (80.456)	lr 0.01426
Train [55][1940/3239]	Time 0.251 (0.687)	Data Time 0.001 (0.191)	Loss 2.6927 (2.7038)	Entropy 0.63034 (0.62923)	Top-1 acc 57.031 (58.748)	Top-5 acc 81.250 (80.455)	lr 0.01426
Train [55][1950/3239]	Time 0.235 (0.688)	Data Time 0.001 (0.192)	Loss 2.8273 (2.7038)	Entropy 0.63059 (0.62923)	Top-1 acc 54.297 (58.753)	Top-5 acc 80.859 (80.458)	lr 0.01426
Train [55][1960/3239]	Time 0.244 (0.693)	Data Time 0.002 (0.198)	Loss 2.8520 (2.7037)	Entropy 0.63072 (0.62924)	Top-1 acc 57.031 (58.755)	Top-5 acc 78.906 (80.458)	lr 0.01426
Train [55][1970/3239]	Time 0.258 (0.694)	Data Time 0.001 (0.199)	Loss 2.6671 (2.7036)	Entropy 0.63036 (0.62925)	Top-1 acc 59.375 (58.758)	Top-5 acc 80.469 (80.458)	lr 0.01426
Train [55][1980/3239]	Time 0.230 (0.695)	Data Time 0.001 (0.200)	Loss 2.5277 (2.7038)	Entropy 0.63043 (0.62925)	Top-1 acc 64.844 (58.751)	Top-5 acc 81.641 (80.453)	lr 0.01426
Train [55][1990/3239]	Time 2.846 (0.700)	Data Time 2.498 (0.205)	Loss 2.6501 (2.7038)	Entropy 0.63045 (0.62926)	Top-1 acc 61.719 (58.750)	Top-5 acc 81.250 (80.457)	lr 0.01426
Train [55][2000/3239]	Time 0.249 (0.703)	Data Time 0.001 (0.208)	Loss 2.5370 (2.7037)	Entropy 0.63077 (0.62927)	Top-1 acc 64.844 (58.750)	Top-5 acc 84.766 (80.464)	lr 0.01426
Train [55][2010/3239]	Time 2.964 (0.703)	Data Time 2.709 (0.209)	Loss 2.6811 (2.7040)	Entropy 0.63024 (0.62927)	Top-1 acc 61.328 (58.744)	Top-5 acc 79.297 (80.459)	lr 0.01425
Train [55][2020/3239]	Time 3.888 (0.704)	Data Time 3.595 (0.210)	Loss 2.7255 (2.7040)	Entropy 0.63018 (0.62928)	Top-1 acc 55.078 (58.743)	Top-5 acc 79.297 (80.459)	lr 0.01425
Train [55][2030/3239]	Time 0.254 (0.710)	Data Time 0.001 (0.216)	Loss 2.7804 (2.7041)	Entropy 0.63006 (0.62928)	Top-1 acc 56.250 (58.734)	Top-5 acc 81.641 (80.457)	lr 0.01425
Train [55][2040/3239]	Time 0.282 (0.708)	Data Time 0.001 (0.215)	Loss 2.5331 (2.7041)	Entropy 0.63035 (0.62929)	Top-1 acc 61.328 (58.735)	Top-5 acc 83.203 (80.457)	lr 0.01425
Train [55][2050/3239]	Time 0.258 (0.709)	Data Time 0.002 (0.216)	Loss 2.9103 (2.7043)	Entropy 0.63039 (0.62929)	Top-1 acc 53.906 (58.732)	Top-5 acc 75.391 (80.454)	lr 0.01425
Train [55][2060/3239]	Time 0.351 (0.717)	Data Time 0.001 (0.224)	Loss 2.8412 (2.7041)	Entropy 0.63041 (0.62930)	Top-1 acc 57.031 (58.735)	Top-5 acc 76.953 (80.456)	lr 0.01425
Train [55][2070/3239]	Time 0.239 (0.715)	Data Time 0.001 (0.223)	Loss 2.7276 (2.7042)	Entropy 0.63063 (0.62930)	Top-1 acc 56.641 (58.729)	Top-5 acc 80.469 (80.453)	lr 0.01425
Train [55][2080/3239]	Time 0.239 (0.716)	Data Time 0.001 (0.224)	Loss 2.7954 (2.7043)	Entropy 0.63042 (0.62931)	Top-1 acc 56.250 (58.730)	Top-5 acc 76.562 (80.447)	lr 0.01425
Train [55][2090/3239]	Time 4.552 (0.721)	Data Time 4.310 (0.230)	Loss 2.6253 (2.7042)	Entropy 0.63087 (0.62932)	Top-1 acc 62.891 (58.732)	Top-5 acc 81.250 (80.449)	lr 0.01425
Train [55][2100/3239]	Time 0.245 (0.721)	Data Time 0.001 (0.230)	Loss 2.4683 (2.7042)	Entropy 0.63107 (0.62932)	Top-1 acc 66.406 (58.735)	Top-5 acc 84.766 (80.450)	lr 0.01425
Train [55][2110/3239]	Time 0.231 (0.722)	Data Time 0.001 (0.231)	Loss 2.8539 (2.7044)	Entropy 0.63111 (0.62933)	Top-1 acc 57.031 (58.734)	Top-5 acc 76.172 (80.445)	lr 0.01424
Train [55][2120/3239]	Time 3.974 (0.726)	Data Time 3.725 (0.235)	Loss 2.7479 (2.7046)	Entropy 0.63137 (0.62934)	Top-1 acc 59.375 (58.727)	Top-5 acc 77.344 (80.439)	lr 0.01424
Train [55][2130/3239]	Time 3.910 (0.729)	Data Time 3.659 (0.239)	Loss 2.6030 (2.7050)	Entropy 0.63145 (0.62935)	Top-1 acc 59.766 (58.713)	Top-5 acc 81.641 (80.427)	lr 0.01424
Train [55][2140/3239]	Time 0.255 (0.730)	Data Time 0.001 (0.240)	Loss 2.7734 (2.7047)	Entropy 0.63147 (0.62936)	Top-1 acc 58.203 (58.721)	Top-5 acc 78.906 (80.434)	lr 0.01424
Train [55][2150/3239]	Time 3.401 (0.732)	Data Time 3.116 (0.242)	Loss 2.6976 (2.7047)	Entropy 0.63158 (0.62937)	Top-1 acc 55.078 (58.720)	Top-5 acc 80.859 (80.435)	lr 0.01424
Train [55][2160/3239]	Time 0.236 (0.735)	Data Time 0.001 (0.246)	Loss 2.7753 (2.7049)	Entropy 0.63146 (0.62938)	Top-1 acc 57.422 (58.715)	Top-5 acc 81.250 (80.426)	lr 0.01424
Train [55][2170/3239]	Time 6.083 (0.739)	Data Time 5.832 (0.250)	Loss 2.4833 (2.7049)	Entropy 0.63107 (0.62939)	Top-1 acc 61.719 (58.711)	Top-5 acc 85.156 (80.425)	lr 0.01424
Train [55][2180/3239]	Time 0.238 (0.737)	Data Time 0.001 (0.249)	Loss 2.6877 (2.7047)	Entropy 0.63112 (0.62940)	Top-1 acc 58.984 (58.713)	Top-5 acc 80.859 (80.431)	lr 0.01424
Train [55][2190/3239]	Time 7.931 (0.745)	Data Time 7.682 (0.257)	Loss 3.1777 (2.7049)	Entropy 0.63100 (0.62941)	Top-1 acc 47.656 (58.704)	Top-5 acc 71.875 (80.428)	lr 0.01424
Train [55][2200/3239]	Time 0.249 (0.744)	Data Time 0.002 (0.255)	Loss 2.5622 (2.7047)	Entropy 0.63111 (0.62941)	Top-1 acc 63.672 (58.710)	Top-5 acc 81.641 (80.428)	lr 0.01424
Train [55][2210/3239]	Time 0.233 (0.745)	Data Time 0.001 (0.257)	Loss 2.6950 (2.7043)	Entropy 0.63122 (0.62942)	Top-1 acc 58.984 (58.720)	Top-5 acc 80.859 (80.438)	lr 0.01423
Train [55][2220/3239]	Time 0.331 (0.749)	Data Time 0.001 (0.262)	Loss 2.6340 (2.7042)	Entropy 0.63107 (0.62943)	Top-1 acc 60.547 (58.724)	Top-5 acc 82.031 (80.437)	lr 0.01423
Train [55][2230/3239]	Time 0.248 (0.751)	Data Time 0.001 (0.264)	Loss 2.6245 (2.7040)	Entropy 0.63100 (0.62944)	Top-1 acc 59.375 (58.730)	Top-5 acc 81.641 (80.438)	lr 0.01423
Train [55][2240/3239]	Time 0.242 (0.753)	Data Time 0.001 (0.266)	Loss 2.8790 (2.7042)	Entropy 0.63073 (0.62944)	Top-1 acc 52.344 (58.728)	Top-5 acc 77.344 (80.434)	lr 0.01423
Train [55][2250/3239]	Time 6.305 (0.757)	Data Time 6.046 (0.270)	Loss 2.6603 (2.7043)	Entropy 0.63079 (0.62945)	Top-1 acc 58.984 (58.727)	Top-5 acc 80.859 (80.429)	lr 0.01423
Train [55][2260/3239]	Time 0.257 (0.760)	Data Time 0.001 (0.274)	Loss 2.5898 (2.7044)	Entropy 0.63058 (0.62945)	Top-1 acc 60.156 (58.723)	Top-5 acc 82.422 (80.428)	lr 0.01423
Train [55][2270/3239]	Time 0.255 (0.761)	Data Time 0.001 (0.275)	Loss 2.9512 (2.7047)	Entropy 0.63081 (0.62946)	Top-1 acc 50.391 (58.713)	Top-5 acc 77.734 (80.423)	lr 0.01423
Train [55][2280/3239]	Time 0.234 (0.763)	Data Time 0.001 (0.277)	Loss 2.5412 (2.7047)	Entropy 0.63087 (0.62947)	Top-1 acc 60.938 (58.713)	Top-5 acc 84.766 (80.423)	lr 0.01423
Train [55][2290/3239]	Time 0.348 (0.766)	Data Time 0.001 (0.281)	Loss 2.7030 (2.7048)	Entropy 0.63112 (0.62947)	Top-1 acc 58.594 (58.711)	Top-5 acc 80.859 (80.423)	lr 0.01423
Train [55][2300/3239]	Time 0.239 (0.768)	Data Time 0.001 (0.283)	Loss 2.8609 (2.7049)	Entropy 0.63098 (0.62948)	Top-1 acc 51.953 (58.708)	Top-5 acc 78.516 (80.423)	lr 0.01423
Train [55][2310/3239]	Time 0.230 (0.774)	Data Time 0.001 (0.290)	Loss 2.9475 (2.7052)	Entropy 0.63100 (0.62949)	Top-1 acc 55.078 (58.704)	Top-5 acc 73.828 (80.421)	lr 0.01422
Train [55][2320/3239]	Time 0.250 (0.775)	Data Time 0.001 (0.290)	Loss 2.8327 (2.7058)	Entropy 0.63136 (0.62949)	Top-1 acc 56.250 (58.691)	Top-5 acc 78.516 (80.408)	lr 0.01422
Train [55][2330/3239]	Time 1.465 (0.776)	Data Time 1.221 (0.292)	Loss 2.8930 (2.7057)	Entropy 0.63136 (0.62950)	Top-1 acc 52.344 (58.690)	Top-5 acc 80.078 (80.410)	lr 0.01422
Train [55][2340/3239]	Time 7.743 (0.778)	Data Time 7.481 (0.294)	Loss 2.6831 (2.7058)	Entropy 0.63143 (0.62951)	Top-1 acc 60.156 (58.685)	Top-5 acc 80.469 (80.413)	lr 0.01422
Train [55][2350/3239]	Time 2.810 (0.782)	Data Time 2.567 (0.298)	Loss 2.5246 (2.7055)	Entropy 0.63131 (0.62952)	Top-1 acc 63.672 (58.691)	Top-5 acc 82.422 (80.417)	lr 0.01422
Train [55][2360/3239]	Time 0.224 (0.782)	Data Time 0.001 (0.299)	Loss 2.7604 (2.7056)	Entropy 0.63127 (0.62952)	Top-1 acc 60.156 (58.690)	Top-5 acc 79.688 (80.418)	lr 0.01422
Train [55][2370/3239]	Time 1.024 (0.782)	Data Time 0.764 (0.300)	Loss 2.5404 (2.7053)	Entropy 0.63132 (0.62953)	Top-1 acc 61.328 (58.691)	Top-5 acc 82.031 (80.422)	lr 0.01422
Train [55][2380/3239]	Time 0.487 (0.788)	Data Time 0.001 (0.305)	Loss 2.8626 (2.7056)	Entropy 0.63138 (0.62954)	Top-1 acc 54.688 (58.688)	Top-5 acc 77.734 (80.416)	lr 0.01422
Train [55][2390/3239]	Time 0.268 (0.788)	Data Time 0.001 (0.305)	Loss 2.5719 (2.7058)	Entropy 0.63134 (0.62955)	Top-1 acc 64.062 (58.679)	Top-5 acc 84.375 (80.412)	lr 0.01422
Train [55][2400/3239]	Time 0.228 (0.788)	Data Time 0.001 (0.306)	Loss 2.8133 (2.7060)	Entropy 0.63148 (0.62955)	Top-1 acc 57.422 (58.675)	Top-5 acc 78.516 (80.408)	lr 0.01422
Train [55][2410/3239]	Time 0.503 (0.791)	Data Time 0.256 (0.309)	Loss 2.9150 (2.7060)	Entropy 0.63142 (0.62956)	Top-1 acc 58.203 (58.672)	Top-5 acc 77.734 (80.409)	lr 0.01421
Train [55][2420/3239]	Time 0.239 (0.796)	Data Time 0.001 (0.314)	Loss 2.6361 (2.7058)	Entropy 0.63159 (0.62957)	Top-1 acc 61.719 (58.679)	Top-5 acc 82.422 (80.413)	lr 0.01421
Train [55][2430/3239]	Time 0.234 (0.794)	Data Time 0.001 (0.312)	Loss 2.6536 (2.7057)	Entropy 0.63142 (0.62958)	Top-1 acc 58.594 (58.681)	Top-5 acc 82.031 (80.421)	lr 0.01421
Train [55][2440/3239]	Time 0.234 (0.797)	Data Time 0.001 (0.315)	Loss 2.7662 (2.7058)	Entropy 0.63129 (0.62959)	Top-1 acc 57.422 (58.676)	Top-5 acc 79.688 (80.419)	lr 0.01421
Train [55][2450/3239]	Time 0.359 (0.799)	Data Time 0.001 (0.317)	Loss 2.5476 (2.7054)	Entropy 0.63122 (0.62959)	Top-1 acc 60.547 (58.679)	Top-5 acc 85.156 (80.425)	lr 0.01421
Train [55][2460/3239]	Time 0.299 (0.802)	Data Time 0.001 (0.321)	Loss 2.6213 (2.7056)	Entropy 0.63138 (0.62960)	Top-1 acc 60.938 (58.671)	Top-5 acc 80.859 (80.425)	lr 0.01421
Train [55][2470/3239]	Time 0.242 (0.804)	Data Time 0.001 (0.323)	Loss 2.7974 (2.7054)	Entropy 0.63137 (0.62961)	Top-1 acc 56.250 (58.677)	Top-5 acc 80.078 (80.431)	lr 0.01421
Train [55][2480/3239]	Time 0.232 (0.804)	Data Time 0.001 (0.323)	Loss 2.6745 (2.7050)	Entropy 0.63151 (0.62961)	Top-1 acc 57.422 (58.688)	Top-5 acc 82.031 (80.438)	lr 0.01421
Train [55][2490/3239]	Time 1.378 (0.807)	Data Time 1.094 (0.327)	Loss 2.6144 (2.7049)	Entropy 0.63193 (0.62962)	Top-1 acc 61.719 (58.690)	Top-5 acc 81.641 (80.437)	lr 0.01421
Train [55][2500/3239]	Time 4.007 (0.807)	Data Time 3.752 (0.327)	Loss 2.6925 (2.7048)	Entropy 0.63160 (0.62963)	Top-1 acc 57.031 (58.691)	Top-5 acc 80.078 (80.439)	lr 0.01421
Train [55][2510/3239]	Time 0.229 (0.809)	Data Time 0.001 (0.329)	Loss 2.7769 (2.7049)	Entropy 0.63173 (0.62964)	Top-1 acc 56.641 (58.689)	Top-5 acc 76.953 (80.437)	lr 0.01420
Train [55][2520/3239]	Time 0.331 (0.823)	Data Time 0.004 (0.329)	Loss 2.7278 (2.7050)	Entropy 0.63196 (0.62965)	Top-1 acc 58.984 (58.688)	Top-5 acc 78.516 (80.436)	lr 0.01420
Train [55][2530/3239]	Time 0.271 (0.821)	Data Time 0.002 (0.328)	Loss 2.6961 (2.7049)	Entropy 0.63171 (0.62966)	Top-1 acc 60.156 (58.689)	Top-5 acc 80.469 (80.434)	lr 0.01420
Train [55][2540/3239]	Time 0.369 (0.820)	Data Time 0.001 (0.327)	Loss 2.8183 (2.7051)	Entropy 0.63149 (0.62966)	Top-1 acc 54.688 (58.683)	Top-5 acc 79.688 (80.430)	lr 0.01420
Train [55][2550/3239]	Time 0.235 (0.818)	Data Time 0.002 (0.326)	Loss 2.8086 (2.7050)	Entropy 0.63147 (0.62967)	Top-1 acc 53.906 (58.686)	Top-5 acc 80.469 (80.434)	lr 0.01420
Train [55][2560/3239]	Time 0.248 (0.818)	Data Time 0.001 (0.326)	Loss 2.6271 (2.7049)	Entropy 0.63141 (0.62968)	Top-1 acc 60.156 (58.688)	Top-5 acc 81.250 (80.435)	lr 0.01420
Train [55][2570/3239]	Time 0.247 (0.819)	Data Time 0.001 (0.327)	Loss 2.9770 (2.7047)	Entropy 0.63134 (0.62969)	Top-1 acc 46.875 (58.691)	Top-5 acc 74.219 (80.440)	lr 0.01420
Train [55][2580/3239]	Time 0.243 (0.822)	Data Time 0.002 (0.330)	Loss 2.8835 (2.7047)	Entropy 0.63134 (0.62969)	Top-1 acc 58.984 (58.692)	Top-5 acc 77.344 (80.440)	lr 0.01420
Train [55][2590/3239]	Time 0.236 (0.824)	Data Time 0.001 (0.332)	Loss 2.6662 (2.7049)	Entropy 0.63133 (0.62970)	Top-1 acc 59.766 (58.688)	Top-5 acc 82.031 (80.433)	lr 0.01420
Train [55][2600/3239]	Time 0.235 (0.825)	Data Time 0.001 (0.333)	Loss 2.8667 (2.7051)	Entropy 0.63150 (0.62970)	Top-1 acc 52.734 (58.680)	Top-5 acc 77.344 (80.428)	lr 0.01420
Train [55][2610/3239]	Time 1.730 (0.824)	Data Time 1.364 (0.333)	Loss 2.6263 (2.7051)	Entropy 0.63131 (0.62971)	Top-1 acc 58.984 (58.679)	Top-5 acc 83.984 (80.428)	lr 0.01419
Train [55][2620/3239]	Time 0.236 (0.829)	Data Time 0.001 (0.338)	Loss 2.6262 (2.7052)	Entropy 0.63121 (0.62972)	Top-1 acc 61.328 (58.680)	Top-5 acc 82.031 (80.428)	lr 0.01419
Train [55][2630/3239]	Time 7.129 (0.831)	Data Time 6.887 (0.340)	Loss 2.8231 (2.7053)	Entropy 0.63115 (0.62972)	Top-1 acc 57.422 (58.679)	Top-5 acc 76.562 (80.425)	lr 0.01419
Train [55][2640/3239]	Time 0.240 (0.829)	Data Time 0.001 (0.339)	Loss 2.5911 (2.7054)	Entropy 0.63126 (0.62973)	Top-1 acc 60.547 (58.677)	Top-5 acc 81.250 (80.421)	lr 0.01419
Train [55][2650/3239]	Time 0.785 (0.833)	Data Time 0.544 (0.343)	Loss 2.7101 (2.7052)	Entropy 0.63121 (0.62973)	Top-1 acc 59.766 (58.681)	Top-5 acc 81.641 (80.425)	lr 0.01419
Train [55][2660/3239]	Time 1.250 (0.832)	Data Time 0.999 (0.342)	Loss 2.6584 (2.7051)	Entropy 0.63138 (0.62974)	Top-1 acc 62.500 (58.681)	Top-5 acc 82.422 (80.426)	lr 0.01419
Train [55][2670/3239]	Time 0.238 (0.833)	Data Time 0.001 (0.343)	Loss 2.8200 (2.7053)	Entropy 0.63141 (0.62975)	Top-1 acc 59.375 (58.680)	Top-5 acc 79.688 (80.420)	lr 0.01419
Train [55][2680/3239]	Time 0.231 (0.837)	Data Time 0.001 (0.348)	Loss 2.6753 (2.7054)	Entropy 0.63121 (0.62975)	Top-1 acc 58.203 (58.684)	Top-5 acc 82.031 (80.418)	lr 0.01419
Train [55][2690/3239]	Time 0.264 (0.838)	Data Time 0.002 (0.349)	Loss 2.7728 (2.7052)	Entropy 0.63093 (0.62976)	Top-1 acc 57.812 (58.688)	Top-5 acc 79.297 (80.423)	lr 0.01419
Train [55][2700/3239]	Time 0.339 (0.838)	Data Time 0.001 (0.349)	Loss 2.3830 (2.7051)	Entropy 0.63076 (0.62976)	Top-1 acc 66.016 (58.692)	Top-5 acc 85.156 (80.424)	lr 0.01419
Train [55][2710/3239]	Time 0.246 (0.843)	Data Time 0.001 (0.354)	Loss 2.6089 (2.7049)	Entropy 0.63104 (0.62976)	Top-1 acc 57.422 (58.697)	Top-5 acc 80.859 (80.424)	lr 0.01418
Train [55][2720/3239]	Time 0.252 (0.843)	Data Time 0.001 (0.354)	Loss 2.6665 (2.7047)	Entropy 0.63107 (0.62977)	Top-1 acc 62.500 (58.706)	Top-5 acc 83.203 (80.430)	lr 0.01418
Train [55][2730/3239]	Time 0.233 (0.842)	Data Time 0.001 (0.354)	Loss 2.6679 (2.7045)	Entropy 0.63130 (0.62977)	Top-1 acc 60.547 (58.708)	Top-5 acc 81.250 (80.434)	lr 0.01418
Train [55][2740/3239]	Time 0.237 (0.847)	Data Time 0.001 (0.359)	Loss 2.7326 (2.7046)	Entropy 0.63133 (0.62978)	Top-1 acc 58.594 (58.706)	Top-5 acc 76.562 (80.433)	lr 0.01418
Train [55][2750/3239]	Time 0.251 (0.848)	Data Time 0.001 (0.360)	Loss 2.5522 (2.7046)	Entropy 0.63141 (0.62979)	Top-1 acc 62.109 (58.705)	Top-5 acc 83.594 (80.432)	lr 0.01418
Train [55][2760/3239]	Time 1.565 (0.848)	Data Time 1.318 (0.360)	Loss 2.7540 (2.7045)	Entropy 0.63154 (0.62979)	Top-1 acc 58.594 (58.704)	Top-5 acc 79.297 (80.429)	lr 0.01418
Train [55][2770/3239]	Time 0.358 (0.848)	Data Time 0.001 (0.361)	Loss 2.6007 (2.7045)	Entropy 0.63154 (0.62980)	Top-1 acc 61.719 (58.706)	Top-5 acc 79.688 (80.428)	lr 0.01418
Train [55][2780/3239]	Time 0.248 (0.854)	Data Time 0.001 (0.367)	Loss 2.6384 (2.7042)	Entropy 0.63144 (0.62980)	Top-1 acc 58.594 (58.709)	Top-5 acc 83.203 (80.432)	lr 0.01418
Train [55][2790/3239]	Time 0.250 (0.852)	Data Time 0.001 (0.365)	Loss 2.9165 (2.7045)	Entropy 0.63105 (0.62981)	Top-1 acc 52.344 (58.705)	Top-5 acc 76.562 (80.431)	lr 0.01418
Train [55][2800/3239]	Time 0.223 (0.851)	Data Time 0.001 (0.364)	Loss 2.8607 (2.7046)	Entropy 0.63122 (0.62981)	Top-1 acc 56.250 (58.703)	Top-5 acc 76.953 (80.426)	lr 0.01418
Train [55][2810/3239]	Time 7.103 (0.858)	Data Time 6.854 (0.372)	Loss 3.0033 (2.7049)	Entropy 0.63107 (0.62982)	Top-1 acc 52.734 (58.698)	Top-5 acc 72.266 (80.418)	lr 0.01417
Train [55][2820/3239]	Time 0.254 (0.856)	Data Time 0.001 (0.370)	Loss 2.6051 (2.7050)	Entropy 0.63130 (0.62982)	Top-1 acc 62.500 (58.697)	Top-5 acc 82.031 (80.418)	lr 0.01417
Train [55][2830/3239]	Time 0.225 (0.856)	Data Time 0.001 (0.370)	Loss 2.9428 (2.7050)	Entropy 0.63116 (0.62983)	Top-1 acc 51.562 (58.698)	Top-5 acc 75.781 (80.416)	lr 0.01417
Train [55][2840/3239]	Time 0.249 (0.860)	Data Time 0.001 (0.375)	Loss 2.6843 (2.7049)	Entropy 0.63109 (0.62983)	Top-1 acc 62.109 (58.702)	Top-5 acc 81.641 (80.419)	lr 0.01417
Train [55][2850/3239]	Time 0.237 (0.861)	Data Time 0.001 (0.375)	Loss 2.5696 (2.7047)	Entropy 0.63085 (0.62984)	Top-1 acc 60.547 (58.709)	Top-5 acc 81.641 (80.422)	lr 0.01417
Train [55][2860/3239]	Time 0.239 (0.862)	Data Time 0.001 (0.376)	Loss 2.7167 (2.7046)	Entropy 0.63102 (0.62984)	Top-1 acc 57.812 (58.710)	Top-5 acc 81.641 (80.421)	lr 0.01417
Train [55][2870/3239]	Time 2.569 (0.865)	Data Time 2.269 (0.380)	Loss 2.4505 (2.7045)	Entropy 0.63100 (0.62985)	Top-1 acc 64.453 (58.711)	Top-5 acc 83.984 (80.422)	lr 0.01417
Train [55][2880/3239]	Time 0.254 (0.865)	Data Time 0.001 (0.380)	Loss 2.6323 (2.7044)	Entropy 0.63101 (0.62985)	Top-1 acc 56.641 (58.715)	Top-5 acc 82.031 (80.423)	lr 0.01417
Train [55][2890/3239]	Time 0.255 (0.868)	Data Time 0.001 (0.383)	Loss 2.4547 (2.7045)	Entropy 0.63078 (0.62985)	Top-1 acc 63.672 (58.718)	Top-5 acc 86.719 (80.423)	lr 0.01417
Train [55][2900/3239]	Time 0.251 (0.868)	Data Time 0.001 (0.384)	Loss 2.9917 (2.7046)	Entropy 0.63094 (0.62986)	Top-1 acc 51.172 (58.712)	Top-5 acc 74.609 (80.419)	lr 0.01417
Train [55][2910/3239]	Time 0.269 (0.870)	Data Time 0.001 (0.385)	Loss 2.6153 (2.7046)	Entropy 0.63090 (0.62986)	Top-1 acc 62.500 (58.717)	Top-5 acc 82.031 (80.422)	lr 0.01416
Train [55][2920/3239]	Time 0.252 (0.872)	Data Time 0.001 (0.388)	Loss 2.6936 (2.7045)	Entropy 0.63125 (0.62986)	Top-1 acc 58.203 (58.716)	Top-5 acc 80.078 (80.423)	lr 0.01416
Train [55][2930/3239]	Time 0.346 (0.870)	Data Time 0.001 (0.386)	Loss 2.8718 (2.7047)	Entropy 0.63097 (0.62987)	Top-1 acc 52.344 (58.712)	Top-5 acc 75.391 (80.415)	lr 0.01416
Train [55][2940/3239]	Time 0.276 (0.875)	Data Time 0.001 (0.391)	Loss 2.7259 (2.7047)	Entropy 0.63093 (0.62987)	Top-1 acc 61.719 (58.714)	Top-5 acc 80.078 (80.418)	lr 0.01416
Train [55][2950/3239]	Time 0.258 (0.876)	Data Time 0.001 (0.392)	Loss 2.5219 (2.7046)	Entropy 0.63053 (0.62988)	Top-1 acc 62.500 (58.718)	Top-5 acc 83.984 (80.416)	lr 0.01416
Train [55][2960/3239]	Time 1.814 (0.875)	Data Time 1.570 (0.392)	Loss 2.7519 (2.7048)	Entropy 0.63065 (0.62988)	Top-1 acc 58.984 (58.714)	Top-5 acc 81.641 (80.416)	lr 0.01416
Train [55][2970/3239]	Time 9.395 (0.880)	Data Time 9.139 (0.397)	Loss 2.6916 (2.7047)	Entropy 0.63057 (0.62988)	Top-1 acc 61.328 (58.715)	Top-5 acc 80.859 (80.417)	lr 0.01416
Train [55][2980/3239]	Time 0.269 (0.878)	Data Time 0.001 (0.395)	Loss 2.8262 (2.7048)	Entropy 0.63077 (0.62988)	Top-1 acc 55.469 (58.715)	Top-5 acc 77.344 (80.415)	lr 0.01416
Train [55][2990/3239]	Time 0.253 (0.879)	Data Time 0.001 (0.396)	Loss 2.7930 (2.7046)	Entropy 0.63058 (0.62989)	Top-1 acc 56.250 (58.718)	Top-5 acc 78.516 (80.421)	lr 0.01416
Train [55][3000/3239]	Time 0.330 (0.881)	Data Time 0.002 (0.398)	Loss 2.5808 (2.7046)	Entropy 0.63080 (0.62989)	Top-1 acc 62.109 (58.717)	Top-5 acc 82.812 (80.423)	lr 0.01416
Train [55][3010/3239]	Time 0.235 (0.883)	Data Time 0.001 (0.401)	Loss 2.6892 (2.7045)	Entropy 0.63063 (0.62989)	Top-1 acc 59.766 (58.719)	Top-5 acc 76.172 (80.421)	lr 0.01415
Train [55][3020/3239]	Time 0.245 (0.883)	Data Time 0.001 (0.401)	Loss 2.7930 (2.7045)	Entropy 0.63082 (0.62989)	Top-1 acc 55.469 (58.721)	Top-5 acc 78.125 (80.423)	lr 0.01415
Train [55][3030/3239]	Time 0.233 (0.886)	Data Time 0.001 (0.404)	Loss 2.8414 (2.7045)	Entropy 0.63079 (0.62990)	Top-1 acc 56.250 (58.720)	Top-5 acc 77.344 (80.421)	lr 0.01415
Train [55][3040/3239]	Time 0.243 (0.888)	Data Time 0.001 (0.406)	Loss 2.7223 (2.7045)	Entropy 0.63048 (0.62990)	Top-1 acc 54.688 (58.719)	Top-5 acc 80.469 (80.422)	lr 0.01415
Train [55][3050/3239]	Time 0.252 (0.887)	Data Time 0.001 (0.405)	Loss 2.5527 (2.7043)	Entropy 0.63048 (0.62990)	Top-1 acc 61.719 (58.722)	Top-5 acc 80.859 (80.425)	lr 0.01415
Train [55][3060/3239]	Time 0.244 (0.891)	Data Time 0.001 (0.409)	Loss 2.9314 (2.7043)	Entropy 0.63007 (0.62990)	Top-1 acc 56.641 (58.724)	Top-5 acc 74.219 (80.425)	lr 0.01415
Train [55][3070/3239]	Time 0.230 (0.893)	Data Time 0.001 (0.412)	Loss 2.9598 (2.7047)	Entropy 0.63017 (0.62990)	Top-1 acc 47.656 (58.711)	Top-5 acc 76.172 (80.416)	lr 0.01415
Train [55][3080/3239]	Time 0.265 (0.892)	Data Time 0.001 (0.412)	Loss 2.5815 (2.7046)	Entropy 0.63029 (0.62991)	Top-1 acc 60.938 (58.712)	Top-5 acc 83.594 (80.418)	lr 0.01415
Train [55][3090/3239]	Time 0.375 (0.891)	Data Time 0.001 (0.410)	Loss 2.6585 (2.7046)	Entropy 0.63038 (0.62991)	Top-1 acc 59.766 (58.708)	Top-5 acc 83.984 (80.419)	lr 0.01415
Train [55][3100/3239]	Time 0.237 (0.898)	Data Time 0.001 (0.418)	Loss 2.5458 (2.7045)	Entropy 0.63080 (0.62991)	Top-1 acc 63.281 (58.712)	Top-5 acc 82.031 (80.422)	lr 0.01415
Train [55][3110/3239]	Time 0.248 (0.897)	Data Time 0.002 (0.417)	Loss 2.7335 (2.7046)	Entropy 0.63090 (0.62991)	Top-1 acc 56.250 (58.709)	Top-5 acc 79.688 (80.422)	lr 0.01414
Train [55][3120/3239]	Time 0.233 (0.895)	Data Time 0.001 (0.415)	Loss 2.7842 (2.7046)	Entropy 0.63111 (0.62992)	Top-1 acc 56.250 (58.702)	Top-5 acc 77.734 (80.422)	lr 0.01414
Train [55][3130/3239]	Time 14.479 (0.903)	Data Time 14.233 (0.423)	Loss 2.5854 (2.7048)	Entropy 0.63111 (0.62992)	Top-1 acc 62.891 (58.698)	Top-5 acc 82.422 (80.417)	lr 0.01414
Train [55][3140/3239]	Time 0.234 (0.901)	Data Time 0.001 (0.422)	Loss 2.9916 (2.7050)	Entropy 0.63129 (0.62992)	Top-1 acc 53.906 (58.694)	Top-5 acc 74.219 (80.413)	lr 0.01414
Train [55][3150/3239]	Time 0.269 (0.900)	Data Time 0.001 (0.421)	Loss 2.7252 (2.7048)	Entropy 0.63136 (0.62993)	Top-1 acc 54.688 (58.700)	Top-5 acc 80.859 (80.418)	lr 0.01414
Train [55][3160/3239]	Time 0.421 (0.903)	Data Time 0.002 (0.424)	Loss 2.5070 (2.7048)	Entropy 0.63102 (0.62993)	Top-1 acc 64.453 (58.699)	Top-5 acc 82.031 (80.421)	lr 0.01414
Train [55][3170/3239]	Time 0.443 (0.916)	Data Time 0.004 (0.426)	Loss 2.8253 (2.7051)	Entropy 0.63063 (0.62994)	Top-1 acc 59.375 (58.695)	Top-5 acc 77.344 (80.417)	lr 0.01414
Train [55][3180/3239]	Time 0.251 (0.914)	Data Time 0.000 (0.425)	Loss 2.6700 (2.7050)	Entropy 0.63093 (0.62994)	Top-1 acc 62.891 (58.700)	Top-5 acc 82.031 (80.420)	lr 0.01414
Train [55][3190/3239]	Time 0.238 (0.913)	Data Time 0.000 (0.423)	Loss 2.7456 (2.7050)	Entropy 0.63078 (0.62994)	Top-1 acc 55.078 (58.698)	Top-5 acc 79.297 (80.418)	lr 0.01414
Train [55][3200/3239]	Time 0.234 (0.912)	Data Time 0.000 (0.422)	Loss 2.6445 (2.7051)	Entropy 0.63032 (0.62994)	Top-1 acc 59.375 (58.693)	Top-5 acc 81.250 (80.415)	lr 0.01414
Train [55][3210/3239]	Time 0.239 (0.910)	Data Time 0.000 (0.421)	Loss 2.5534 (2.7049)	Entropy 0.63049 (0.62994)	Top-1 acc 64.062 (58.701)	Top-5 acc 85.156 (80.417)	lr 0.01413
Train [55][3220/3239]	Time 0.223 (0.911)	Data Time 0.000 (0.422)	Loss 2.7295 (2.7049)	Entropy 0.63072 (0.62995)	Top-1 acc 60.547 (58.702)	Top-5 acc 78.125 (80.415)	lr 0.01413
Train [55][3230/3239]	Time 0.235 (0.912)	Data Time 0.000 (0.423)	Loss 2.7137 (2.7052)	Entropy 0.63055 (0.62995)	Top-1 acc 57.812 (58.697)	Top-5 acc 80.859 (80.409)	lr 0.01413
Train [55][3239/3239]	Time 0.974 (0.911)	Data Time 0.000 (0.422)	Loss 3.0143 (2.7052)	Entropy 0.63071 (0.62995)	Top-1 acc 46.914 (58.696)	Top-5 acc 71.605 (80.408)	lr 0.01413
==========Valid [55/120]	loss 1.456	top-1 acc 66.543 (66.543)	top-5 acc 86.736	Train top-1 58.696	top-5 80.408	Entropy 0.63071	Latency-None: 0.000ms	Flops: 538.40M
Train [56][0/3239]	Time 43.996 (43.996)	Data Time 43.219 (43.219)	Loss 2.7483 (2.7483)	Entropy 0.63059 (0.63059)	Top-1 acc 59.766 (59.766)	Top-5 acc 77.734 (77.734)	lr 0.01413
Train [56][10/3239]	Time 0.244 (4.552)	Data Time 0.001 (3.931)	Loss 2.7832 (2.7503)	Entropy 0.63066 (0.63067)	Top-1 acc 55.469 (58.381)	Top-5 acc 77.734 (79.510)	lr 0.01413
Train [56][20/3239]	Time 0.262 (2.604)	Data Time 0.002 (2.060)	Loss 2.6985 (2.7081)	Entropy 0.63087 (0.63069)	Top-1 acc 58.594 (59.468)	Top-5 acc 80.859 (80.450)	lr 0.01413
Train [56][30/3239]	Time 0.243 (1.916)	Data Time 0.001 (1.396)	Loss 2.8382 (2.7222)	Entropy 0.63092 (0.63075)	Top-1 acc 57.422 (59.098)	Top-5 acc 77.344 (79.977)	lr 0.01413
Train [56][40/3239]	Time 0.256 (1.568)	Data Time 0.002 (1.056)	Loss 2.7656 (2.7165)	Entropy 0.63097 (0.63081)	Top-1 acc 57.031 (59.232)	Top-5 acc 81.250 (80.002)	lr 0.01413
Train [56][50/3239]	Time 0.283 (1.356)	Data Time 0.001 (0.849)	Loss 2.6353 (2.7090)	Entropy 0.63083 (0.63083)	Top-1 acc 60.547 (59.329)	Top-5 acc 80.859 (80.139)	lr 0.01413
Train [56][60/3239]	Time 0.264 (1.210)	Data Time 0.001 (0.710)	Loss 2.4972 (2.7050)	Entropy 0.63072 (0.63083)	Top-1 acc 58.984 (59.074)	Top-5 acc 83.984 (80.181)	lr 0.01413
Train [56][70/3239]	Time 0.241 (1.098)	Data Time 0.001 (0.610)	Loss 2.4974 (2.6981)	Entropy 0.63100 (0.63083)	Top-1 acc 65.625 (59.155)	Top-5 acc 84.766 (80.304)	lr 0.01412
Train [56][80/3239]	Time 0.286 (1.017)	Data Time 0.001 (0.535)	Loss 2.8046 (2.7038)	Entropy 0.63070 (0.63085)	Top-1 acc 57.812 (59.066)	Top-5 acc 78.125 (80.194)	lr 0.01412
Train [56][90/3239]	Time 0.325 (0.968)	Data Time 0.002 (0.477)	Loss 2.5872 (2.6935)	Entropy 0.63070 (0.63084)	Top-1 acc 65.234 (59.306)	Top-5 acc 81.641 (80.366)	lr 0.01412
Train [56][100/3239]	Time 0.239 (0.920)	Data Time 0.001 (0.430)	Loss 2.6807 (2.6949)	Entropy 0.63108 (0.63084)	Top-1 acc 58.984 (59.282)	Top-5 acc 82.812 (80.368)	lr 0.01412
Train [56][110/3239]	Time 0.233 (0.877)	Data Time 0.001 (0.391)	Loss 2.8528 (2.6959)	Entropy 0.63091 (0.63085)	Top-1 acc 54.688 (59.231)	Top-5 acc 77.734 (80.356)	lr 0.01412
Train [56][120/3239]	Time 0.249 (0.841)	Data Time 0.001 (0.359)	Loss 2.6269 (2.6987)	Entropy 0.63106 (0.63087)	Top-1 acc 58.984 (59.072)	Top-5 acc 82.422 (80.369)	lr 0.01412
Train [56][130/3239]	Time 0.316 (0.829)	Data Time 0.001 (0.346)	Loss 2.8319 (2.6955)	Entropy 0.63131 (0.63089)	Top-1 acc 53.516 (59.196)	Top-5 acc 77.344 (80.421)	lr 0.01412
Train [56][140/3239]	Time 0.230 (0.803)	Data Time 0.001 (0.324)	Loss 3.1018 (2.6971)	Entropy 0.63150 (0.63092)	Top-1 acc 48.047 (59.145)	Top-5 acc 72.266 (80.386)	lr 0.01412
Train [56][150/3239]	Time 0.335 (0.780)	Data Time 0.001 (0.303)	Loss 2.6968 (2.6978)	Entropy 0.63153 (0.63096)	Top-1 acc 55.469 (59.054)	Top-5 acc 79.688 (80.420)	lr 0.01412
Train [56][160/3239]	Time 6.608 (0.798)	Data Time 6.271 (0.323)	Loss 2.6528 (2.6950)	Entropy 0.63154 (0.63099)	Top-1 acc 62.109 (59.123)	Top-5 acc 80.078 (80.444)	lr 0.01412
Train [56][170/3239]	Time 0.256 (0.778)	Data Time 0.001 (0.304)	Loss 2.6986 (2.6936)	Entropy 0.63138 (0.63102)	Top-1 acc 62.109 (59.190)	Top-5 acc 78.516 (80.444)	lr 0.01411
Train [56][180/3239]	Time 0.273 (0.761)	Data Time 0.002 (0.288)	Loss 2.7186 (2.6931)	Entropy 0.63124 (0.63104)	Top-1 acc 55.469 (59.226)	Top-5 acc 79.688 (80.462)	lr 0.01411
Train [56][190/3239]	Time 0.276 (0.744)	Data Time 0.001 (0.273)	Loss 2.6786 (2.6925)	Entropy 0.63152 (0.63105)	Top-1 acc 57.422 (59.250)	Top-5 acc 82.031 (80.493)	lr 0.01411
Train [56][200/3239]	Time 0.244 (0.760)	Data Time 0.001 (0.288)	Loss 2.7044 (2.6893)	Entropy 0.63169 (0.63107)	Top-1 acc 58.984 (59.350)	Top-5 acc 80.469 (80.583)	lr 0.01411
Train [56][210/3239]	Time 0.249 (0.744)	Data Time 0.001 (0.275)	Loss 2.6637 (2.6905)	Entropy 0.63183 (0.63111)	Top-1 acc 56.641 (59.318)	Top-5 acc 82.031 (80.576)	lr 0.01411
Train [56][220/3239]	Time 0.351 (0.731)	Data Time 0.001 (0.263)	Loss 2.7487 (2.6931)	Entropy 0.63171 (0.63114)	Top-1 acc 55.078 (59.204)	Top-5 acc 80.469 (80.550)	lr 0.01411
Train [56][230/3239]	Time 0.259 (0.747)	Data Time 0.001 (0.279)	Loss 2.7336 (2.6941)	Entropy 0.63155 (0.63116)	Top-1 acc 61.328 (59.143)	Top-5 acc 79.688 (80.555)	lr 0.01411
Train [56][240/3239]	Time 0.245 (0.733)	Data Time 0.001 (0.267)	Loss 2.5870 (2.6946)	Entropy 0.63144 (0.63118)	Top-1 acc 60.938 (59.106)	Top-5 acc 82.812 (80.522)	lr 0.01411
Train [56][250/3239]	Time 0.250 (0.723)	Data Time 0.001 (0.257)	Loss 2.9116 (2.6954)	Entropy 0.63136 (0.63118)	Top-1 acc 48.438 (59.107)	Top-5 acc 80.078 (80.526)	lr 0.01411
Train [56][260/3239]	Time 0.276 (0.733)	Data Time 0.002 (0.267)	Loss 2.6883 (2.6939)	Entropy 0.63114 (0.63119)	Top-1 acc 60.547 (59.095)	Top-5 acc 79.297 (80.538)	lr 0.01411
Train [56][270/3239]	Time 0.240 (0.722)	Data Time 0.001 (0.257)	Loss 2.8903 (2.6954)	Entropy 0.63134 (0.63119)	Top-1 acc 51.953 (59.097)	Top-5 acc 77.344 (80.485)	lr 0.01410
Train [56][280/3239]	Time 0.249 (0.712)	Data Time 0.001 (0.248)	Loss 2.7438 (2.6953)	Entropy 0.63133 (0.63120)	Top-1 acc 54.297 (59.079)	Top-5 acc 77.734 (80.463)	lr 0.01410
Train [56][290/3239]	Time 0.302 (0.728)	Data Time 0.004 (0.264)	Loss 2.5888 (2.6943)	Entropy 0.63130 (0.63120)	Top-1 acc 64.062 (59.105)	Top-5 acc 82.812 (80.497)	lr 0.01410
Train [56][300/3239]	Time 0.236 (0.718)	Data Time 0.001 (0.256)	Loss 2.8688 (2.6949)	Entropy 0.63123 (0.63120)	Top-1 acc 56.250 (59.087)	Top-5 acc 78.125 (80.478)	lr 0.01410
Train [56][310/3239]	Time 0.326 (0.709)	Data Time 0.001 (0.247)	Loss 2.6794 (2.6931)	Entropy 0.63099 (0.63120)	Top-1 acc 62.109 (59.144)	Top-5 acc 79.688 (80.500)	lr 0.01410
Train [56][320/3239]	Time 0.304 (0.701)	Data Time 0.035 (0.240)	Loss 2.4767 (2.6927)	Entropy 0.63071 (0.63119)	Top-1 acc 66.406 (59.135)	Top-5 acc 84.375 (80.526)	lr 0.01410
Train [56][330/3239]	Time 0.233 (0.693)	Data Time 0.001 (0.233)	Loss 2.6043 (2.6926)	Entropy 0.63094 (0.63118)	Top-1 acc 60.156 (59.139)	Top-5 acc 82.812 (80.547)	lr 0.01410
Train [56][340/3239]	Time 0.266 (0.685)	Data Time 0.001 (0.226)	Loss 2.8090 (2.6932)	Entropy 0.63051 (0.63117)	Top-1 acc 58.203 (59.105)	Top-5 acc 78.906 (80.552)	lr 0.01410
Train [56][350/3239]	Time 0.282 (0.679)	Data Time 0.001 (0.220)	Loss 2.7502 (2.6928)	Entropy 0.63044 (0.63115)	Top-1 acc 59.766 (59.123)	Top-5 acc 78.516 (80.570)	lr 0.01410
Train [56][360/3239]	Time 0.226 (0.671)	Data Time 0.001 (0.214)	Loss 2.5700 (2.6924)	Entropy 0.63046 (0.63113)	Top-1 acc 64.453 (59.109)	Top-5 acc 82.031 (80.592)	lr 0.01410
Train [56][370/3239]	Time 0.238 (0.664)	Data Time 0.003 (0.208)	Loss 2.7015 (2.6929)	Entropy 0.63071 (0.63111)	Top-1 acc 57.031 (59.059)	Top-5 acc 78.906 (80.577)	lr 0.01409
Train [56][380/3239]	Time 0.354 (0.659)	Data Time 0.001 (0.202)	Loss 2.7268 (2.6940)	Entropy 0.63096 (0.63110)	Top-1 acc 58.594 (59.043)	Top-5 acc 79.297 (80.552)	lr 0.01409
Train [56][390/3239]	Time 0.241 (0.653)	Data Time 0.001 (0.197)	Loss 2.7461 (2.6929)	Entropy 0.63085 (0.63110)	Top-1 acc 57.812 (59.062)	Top-5 acc 79.688 (80.586)	lr 0.01409
Train [56][400/3239]	Time 0.250 (0.647)	Data Time 0.001 (0.192)	Loss 2.5271 (2.6926)	Entropy 0.63092 (0.63109)	Top-1 acc 61.328 (59.060)	Top-5 acc 82.812 (80.571)	lr 0.01409
Train [56][410/3239]	Time 0.286 (0.644)	Data Time 0.001 (0.188)	Loss 2.8731 (2.6939)	Entropy 0.63085 (0.63109)	Top-1 acc 54.688 (59.035)	Top-5 acc 76.562 (80.557)	lr 0.01409
Train [56][420/3239]	Time 0.242 (0.638)	Data Time 0.001 (0.183)	Loss 2.5430 (2.6929)	Entropy 0.63075 (0.63108)	Top-1 acc 65.234 (59.056)	Top-5 acc 82.812 (80.586)	lr 0.01409
Train [56][430/3239]	Time 0.288 (0.634)	Data Time 0.004 (0.179)	Loss 2.5191 (2.6923)	Entropy 0.63066 (0.63107)	Top-1 acc 66.406 (59.072)	Top-5 acc 83.203 (80.602)	lr 0.01409
Train [56][440/3239]	Time 0.232 (0.629)	Data Time 0.001 (0.175)	Loss 3.0181 (2.6915)	Entropy 0.63070 (0.63106)	Top-1 acc 48.047 (59.065)	Top-5 acc 76.953 (80.639)	lr 0.01409
Train [56][450/3239]	Time 0.230 (0.625)	Data Time 0.001 (0.171)	Loss 2.7766 (2.6920)	Entropy 0.63106 (0.63106)	Top-1 acc 57.812 (59.047)	Top-5 acc 76.172 (80.620)	lr 0.01409
Train [56][460/3239]	Time 0.232 (0.620)	Data Time 0.001 (0.168)	Loss 2.7793 (2.6928)	Entropy 0.63113 (0.63106)	Top-1 acc 58.984 (59.019)	Top-5 acc 79.297 (80.607)	lr 0.01409
Train [56][470/3239]	Time 0.261 (0.616)	Data Time 0.001 (0.164)	Loss 2.7876 (2.6931)	Entropy 0.63088 (0.63105)	Top-1 acc 57.031 (59.013)	Top-5 acc 82.422 (80.612)	lr 0.01408
Train [56][480/3239]	Time 0.267 (0.612)	Data Time 0.002 (0.161)	Loss 2.5690 (2.6934)	Entropy 0.63063 (0.63105)	Top-1 acc 60.156 (58.990)	Top-5 acc 83.203 (80.631)	lr 0.01408
Train [56][490/3239]	Time 0.310 (0.608)	Data Time 0.002 (0.157)	Loss 2.6088 (2.6938)	Entropy 0.63081 (0.63104)	Top-1 acc 58.984 (58.984)	Top-5 acc 81.250 (80.636)	lr 0.01408
Train [56][500/3239]	Time 0.291 (0.606)	Data Time 0.001 (0.154)	Loss 2.6364 (2.6929)	Entropy 0.63103 (0.63104)	Top-1 acc 63.281 (59.011)	Top-5 acc 81.641 (80.654)	lr 0.01408
Train [56][510/3239]	Time 0.318 (0.602)	Data Time 0.001 (0.151)	Loss 2.5019 (2.6931)	Entropy 0.63122 (0.63104)	Top-1 acc 66.016 (59.010)	Top-5 acc 85.156 (80.645)	lr 0.01408
Train [56][520/3239]	Time 0.235 (0.600)	Data Time 0.001 (0.149)	Loss 2.7188 (2.6928)	Entropy 0.63138 (0.63105)	Top-1 acc 60.156 (59.013)	Top-5 acc 79.297 (80.647)	lr 0.01408
Train [56][530/3239]	Time 0.258 (0.596)	Data Time 0.001 (0.146)	Loss 2.7648 (2.6940)	Entropy 0.63137 (0.63105)	Top-1 acc 57.812 (58.973)	Top-5 acc 77.734 (80.631)	lr 0.01408
Train [56][540/3239]	Time 0.320 (0.593)	Data Time 0.001 (0.143)	Loss 2.6991 (2.6943)	Entropy 0.63150 (0.63106)	Top-1 acc 60.938 (58.974)	Top-5 acc 79.688 (80.626)	lr 0.01408
Train [56][550/3239]	Time 0.255 (0.592)	Data Time 0.001 (0.141)	Loss 2.6427 (2.6933)	Entropy 0.63169 (0.63107)	Top-1 acc 61.328 (58.989)	Top-5 acc 83.984 (80.643)	lr 0.01408
Train [56][560/3239]	Time 0.253 (0.589)	Data Time 0.001 (0.138)	Loss 2.6173 (2.6944)	Entropy 0.63155 (0.63108)	Top-1 acc 62.109 (58.963)	Top-5 acc 82.031 (80.626)	lr 0.01408
Train [56][570/3239]	Time 0.239 (0.587)	Data Time 0.001 (0.136)	Loss 2.7284 (2.6949)	Entropy 0.63139 (0.63109)	Top-1 acc 61.328 (58.963)	Top-5 acc 78.516 (80.603)	lr 0.01407
Train [56][580/3239]	Time 0.278 (0.584)	Data Time 0.001 (0.133)	Loss 2.6575 (2.6949)	Entropy 0.63153 (0.63109)	Top-1 acc 60.156 (58.967)	Top-5 acc 80.469 (80.612)	lr 0.01407
Train [56][590/3239]	Time 0.334 (0.646)	Data Time 0.004 (0.131)	Loss 2.5807 (2.6950)	Entropy 0.63109 (0.63110)	Top-1 acc 64.844 (58.974)	Top-5 acc 83.984 (80.621)	lr 0.01407
Train [56][600/3239]	Time 0.239 (0.642)	Data Time 0.002 (0.129)	Loss 2.7710 (2.6961)	Entropy 0.63104 (0.63110)	Top-1 acc 61.328 (58.954)	Top-5 acc 80.859 (80.614)	lr 0.01407
Train [56][610/3239]	Time 0.275 (0.639)	Data Time 0.002 (0.127)	Loss 2.6917 (2.6961)	Entropy 0.63087 (0.63109)	Top-1 acc 58.984 (58.956)	Top-5 acc 82.422 (80.620)	lr 0.01407
Train [56][620/3239]	Time 0.253 (0.636)	Data Time 0.001 (0.125)	Loss 2.6575 (2.6962)	Entropy 0.63079 (0.63109)	Top-1 acc 60.156 (58.929)	Top-5 acc 78.906 (80.615)	lr 0.01407
Train [56][630/3239]	Time 0.369 (0.632)	Data Time 0.001 (0.123)	Loss 2.8399 (2.6967)	Entropy 0.63083 (0.63108)	Top-1 acc 57.812 (58.913)	Top-5 acc 76.172 (80.603)	lr 0.01407
Train [56][640/3239]	Time 0.269 (0.630)	Data Time 0.001 (0.121)	Loss 2.6743 (2.6972)	Entropy 0.63091 (0.63108)	Top-1 acc 53.906 (58.897)	Top-5 acc 81.250 (80.594)	lr 0.01407
Train [56][650/3239]	Time 0.264 (0.627)	Data Time 0.001 (0.119)	Loss 2.6304 (2.6977)	Entropy 0.63085 (0.63108)	Top-1 acc 60.938 (58.896)	Top-5 acc 78.906 (80.562)	lr 0.01407
Train [56][660/3239]	Time 0.241 (0.624)	Data Time 0.001 (0.117)	Loss 2.6722 (2.6982)	Entropy 0.63061 (0.63107)	Top-1 acc 60.156 (58.871)	Top-5 acc 80.469 (80.561)	lr 0.01407
Train [56][670/3239]	Time 0.290 (0.627)	Data Time 0.001 (0.121)	Loss 2.6138 (2.6972)	Entropy 0.63040 (0.63107)	Top-1 acc 58.984 (58.890)	Top-5 acc 83.984 (80.587)	lr 0.01406
Train [56][680/3239]	Time 0.238 (0.624)	Data Time 0.001 (0.120)	Loss 2.6771 (2.6967)	Entropy 0.63033 (0.63105)	Top-1 acc 60.547 (58.893)	Top-5 acc 82.031 (80.602)	lr 0.01406
Train [56][690/3239]	Time 0.236 (0.634)	Data Time 0.001 (0.130)	Loss 2.7020 (2.6961)	Entropy 0.63031 (0.63105)	Top-1 acc 56.250 (58.898)	Top-5 acc 82.031 (80.617)	lr 0.01406
Train [56][700/3239]	Time 2.177 (0.639)	Data Time 1.742 (0.136)	Loss 2.8575 (2.6961)	Entropy 0.63003 (0.63103)	Top-1 acc 52.734 (58.884)	Top-5 acc 78.906 (80.597)	lr 0.01406
Train [56][710/3239]	Time 0.245 (0.640)	Data Time 0.001 (0.138)	Loss 2.6276 (2.6952)	Entropy 0.63020 (0.63102)	Top-1 acc 57.422 (58.905)	Top-5 acc 81.250 (80.604)	lr 0.01406
Train [56][720/3239]	Time 0.250 (0.648)	Data Time 0.001 (0.147)	Loss 2.6688 (2.6957)	Entropy 0.63042 (0.63101)	Top-1 acc 60.547 (58.887)	Top-5 acc 82.031 (80.586)	lr 0.01406
Train [56][730/3239]	Time 0.234 (0.651)	Data Time 0.001 (0.151)	Loss 2.8767 (2.6963)	Entropy 0.63035 (0.63100)	Top-1 acc 54.297 (58.879)	Top-5 acc 78.125 (80.576)	lr 0.01406
Train [56][740/3239]	Time 0.249 (0.654)	Data Time 0.001 (0.155)	Loss 2.7547 (2.6962)	Entropy 0.63038 (0.63099)	Top-1 acc 57.031 (58.877)	Top-5 acc 79.688 (80.584)	lr 0.01406
Train [56][750/3239]	Time 0.232 (0.664)	Data Time 0.001 (0.166)	Loss 2.9262 (2.6967)	Entropy 0.63037 (0.63098)	Top-1 acc 55.469 (58.875)	Top-5 acc 75.781 (80.565)	lr 0.01406
Train [56][760/3239]	Time 4.673 (0.667)	Data Time 4.416 (0.170)	Loss 2.5780 (2.6972)	Entropy 0.63061 (0.63098)	Top-1 acc 62.500 (58.855)	Top-5 acc 82.031 (80.551)	lr 0.01406
Train [56][770/3239]	Time 1.779 (0.669)	Data Time 1.523 (0.172)	Loss 2.7567 (2.6973)	Entropy 0.63059 (0.63097)	Top-1 acc 58.984 (58.849)	Top-5 acc 78.125 (80.552)	lr 0.01405
Train [56][780/3239]	Time 2.113 (0.672)	Data Time 1.860 (0.176)	Loss 2.8966 (2.6975)	Entropy 0.63067 (0.63097)	Top-1 acc 55.078 (58.838)	Top-5 acc 76.562 (80.546)	lr 0.01405
Train [56][790/3239]	Time 0.251 (0.673)	Data Time 0.001 (0.178)	Loss 2.5909 (2.6971)	Entropy 0.63055 (0.63096)	Top-1 acc 60.156 (58.856)	Top-5 acc 82.812 (80.550)	lr 0.01405
Train [56][800/3239]	Time 0.227 (0.678)	Data Time 0.001 (0.184)	Loss 2.5065 (2.6964)	Entropy 0.63073 (0.63096)	Top-1 acc 62.891 (58.883)	Top-5 acc 83.984 (80.574)	lr 0.01405
Train [56][810/3239]	Time 3.538 (0.685)	Data Time 3.283 (0.192)	Loss 2.7865 (2.6968)	Entropy 0.63074 (0.63096)	Top-1 acc 56.641 (58.875)	Top-5 acc 78.516 (80.565)	lr 0.01405
Train [56][820/3239]	Time 0.232 (0.683)	Data Time 0.001 (0.190)	Loss 2.6462 (2.6968)	Entropy 0.63078 (0.63095)	Top-1 acc 58.203 (58.887)	Top-5 acc 79.297 (80.559)	lr 0.01405
Train [56][830/3239]	Time 0.249 (0.691)	Data Time 0.001 (0.199)	Loss 2.5976 (2.6969)	Entropy 0.63081 (0.63095)	Top-1 acc 62.109 (58.889)	Top-5 acc 81.250 (80.551)	lr 0.01405
Train [56][840/3239]	Time 0.283 (0.700)	Data Time 0.003 (0.208)	Loss 2.5779 (2.6971)	Entropy 0.63098 (0.63095)	Top-1 acc 63.281 (58.896)	Top-5 acc 80.859 (80.552)	lr 0.01405
Train [56][850/3239]	Time 0.238 (0.697)	Data Time 0.001 (0.206)	Loss 2.9480 (2.6972)	Entropy 0.63021 (0.63095)	Top-1 acc 52.734 (58.896)	Top-5 acc 76.562 (80.550)	lr 0.01405
Train [56][860/3239]	Time 0.333 (0.704)	Data Time 0.001 (0.214)	Loss 3.0587 (2.6977)	Entropy 0.63053 (0.63094)	Top-1 acc 49.219 (58.881)	Top-5 acc 73.438 (80.541)	lr 0.01405
Train [56][870/3239]	Time 0.260 (0.714)	Data Time 0.001 (0.224)	Loss 2.7421 (2.6982)	Entropy 0.63023 (0.63093)	Top-1 acc 58.203 (58.858)	Top-5 acc 78.516 (80.525)	lr 0.01404
Train [56][880/3239]	Time 0.248 (0.711)	Data Time 0.001 (0.222)	Loss 2.6207 (2.6982)	Entropy 0.63026 (0.63093)	Top-1 acc 62.891 (58.860)	Top-5 acc 80.859 (80.522)	lr 0.01404
Train [56][890/3239]	Time 0.249 (0.712)	Data Time 0.001 (0.224)	Loss 2.8940 (2.6982)	Entropy 0.63018 (0.63092)	Top-1 acc 54.297 (58.861)	Top-5 acc 77.734 (80.531)	lr 0.01404
Train [56][900/3239]	Time 0.248 (0.724)	Data Time 0.001 (0.236)	Loss 2.6093 (2.6976)	Entropy 0.63000 (0.63091)	Top-1 acc 60.547 (58.871)	Top-5 acc 82.812 (80.552)	lr 0.01404
Train [56][910/3239]	Time 0.281 (0.721)	Data Time 0.002 (0.233)	Loss 2.7288 (2.6980)	Entropy 0.63000 (0.63090)	Top-1 acc 57.812 (58.861)	Top-5 acc 81.250 (80.536)	lr 0.01404
Train [56][920/3239]	Time 4.155 (0.722)	Data Time 3.889 (0.235)	Loss 2.7803 (2.6976)	Entropy 0.62980 (0.63089)	Top-1 acc 57.812 (58.868)	Top-5 acc 77.734 (80.540)	lr 0.01404
Train [56][930/3239]	Time 9.765 (0.734)	Data Time 9.430 (0.248)	Loss 2.7383 (2.6975)	Entropy 0.62957 (0.63088)	Top-1 acc 59.766 (58.881)	Top-5 acc 80.078 (80.538)	lr 0.01404
Train [56][940/3239]	Time 0.233 (0.731)	Data Time 0.001 (0.245)	Loss 2.5748 (2.6978)	Entropy 0.62962 (0.63086)	Top-1 acc 62.891 (58.871)	Top-5 acc 82.422 (80.535)	lr 0.01404
Train [56][950/3239]	Time 0.226 (0.728)	Data Time 0.001 (0.243)	Loss 2.9570 (2.6982)	Entropy 0.62955 (0.63085)	Top-1 acc 52.734 (58.866)	Top-5 acc 75.391 (80.527)	lr 0.01404
Train [56][960/3239]	Time 0.239 (0.736)	Data Time 0.001 (0.252)	Loss 2.7108 (2.6978)	Entropy 0.62970 (0.63084)	Top-1 acc 60.938 (58.880)	Top-5 acc 78.516 (80.536)	lr 0.01404
Train [56][970/3239]	Time 0.252 (0.740)	Data Time 0.001 (0.257)	Loss 2.6860 (2.6972)	Entropy 0.62973 (0.63083)	Top-1 acc 60.156 (58.894)	Top-5 acc 80.859 (80.545)	lr 0.01403
Train [56][980/3239]	Time 0.232 (0.738)	Data Time 0.001 (0.256)	Loss 2.6803 (2.6975)	Entropy 0.62957 (0.63081)	Top-1 acc 59.766 (58.892)	Top-5 acc 83.203 (80.542)	lr 0.01403
Train [56][990/3239]	Time 0.240 (0.748)	Data Time 0.001 (0.266)	Loss 2.7526 (2.6977)	Entropy 0.62946 (0.63080)	Top-1 acc 57.422 (58.884)	Top-5 acc 81.641 (80.534)	lr 0.01403
Train [56][1000/3239]	Time 0.233 (0.753)	Data Time 0.001 (0.272)	Loss 2.9622 (2.6983)	Entropy 0.62924 (0.63079)	Top-1 acc 52.734 (58.864)	Top-5 acc 75.781 (80.525)	lr 0.01403
Train [56][1010/3239]	Time 0.241 (0.750)	Data Time 0.001 (0.269)	Loss 2.5535 (2.6973)	Entropy 0.62914 (0.63077)	Top-1 acc 62.109 (58.888)	Top-5 acc 84.375 (80.544)	lr 0.01403
Train [56][1020/3239]	Time 0.348 (0.760)	Data Time 0.001 (0.280)	Loss 2.6734 (2.6972)	Entropy 0.62933 (0.63075)	Top-1 acc 60.156 (58.893)	Top-5 acc 82.422 (80.541)	lr 0.01403
Train [56][1030/3239]	Time 0.235 (0.765)	Data Time 0.001 (0.286)	Loss 2.6959 (2.6968)	Entropy 0.62901 (0.63074)	Top-1 acc 57.812 (58.901)	Top-5 acc 80.469 (80.552)	lr 0.01403
Train [56][1040/3239]	Time 0.244 (0.762)	Data Time 0.001 (0.283)	Loss 2.6209 (2.6963)	Entropy 0.62913 (0.63072)	Top-1 acc 58.984 (58.915)	Top-5 acc 84.375 (80.554)	lr 0.01403
Train [56][1050/3239]	Time 0.238 (0.770)	Data Time 0.001 (0.293)	Loss 2.7505 (2.6963)	Entropy 0.62940 (0.63071)	Top-1 acc 58.984 (58.916)	Top-5 acc 78.125 (80.559)	lr 0.01403
Train [56][1060/3239]	Time 0.288 (0.775)	Data Time 0.002 (0.298)	Loss 2.6733 (2.6958)	Entropy 0.62931 (0.63070)	Top-1 acc 61.719 (58.931)	Top-5 acc 81.641 (80.563)	lr 0.01403
Train [56][1070/3239]	Time 0.236 (0.772)	Data Time 0.001 (0.295)	Loss 2.5979 (2.6955)	Entropy 0.62954 (0.63068)	Top-1 acc 60.547 (58.941)	Top-5 acc 83.984 (80.571)	lr 0.01402
Train [56][1080/3239]	Time 10.504 (0.781)	Data Time 10.273 (0.305)	Loss 2.9272 (2.6955)	Entropy 0.62945 (0.63067)	Top-1 acc 53.516 (58.935)	Top-5 acc 75.781 (80.570)	lr 0.01402
Train [56][1090/3239]	Time 10.539 (0.787)	Data Time 10.187 (0.312)	Loss 2.5142 (2.6951)	Entropy 0.62967 (0.63066)	Top-1 acc 63.281 (58.949)	Top-5 acc 84.375 (80.575)	lr 0.01402
Train [56][1100/3239]	Time 0.244 (0.784)	Data Time 0.001 (0.309)	Loss 2.6496 (2.6950)	Entropy 0.62933 (0.63065)	Top-1 acc 58.203 (58.957)	Top-5 acc 84.375 (80.578)	lr 0.01402
Train [56][1110/3239]	Time 0.245 (0.788)	Data Time 0.001 (0.314)	Loss 2.7837 (2.6955)	Entropy 0.62963 (0.63064)	Top-1 acc 59.375 (58.953)	Top-5 acc 78.906 (80.568)	lr 0.01402
Train [56][1120/3239]	Time 0.240 (0.791)	Data Time 0.001 (0.317)	Loss 2.7736 (2.6960)	Entropy 0.62950 (0.63063)	Top-1 acc 58.203 (58.943)	Top-5 acc 76.562 (80.554)	lr 0.01402
Train [56][1130/3239]	Time 0.243 (0.798)	Data Time 0.001 (0.324)	Loss 2.6025 (2.6959)	Entropy 0.62950 (0.63062)	Top-1 acc 58.594 (58.938)	Top-5 acc 83.203 (80.558)	lr 0.01402
Train [56][1140/3239]	Time 0.257 (0.801)	Data Time 0.001 (0.328)	Loss 2.6002 (2.6960)	Entropy 0.62907 (0.63061)	Top-1 acc 62.109 (58.947)	Top-5 acc 83.594 (80.563)	lr 0.01402
Train [56][1150/3239]	Time 0.408 (0.803)	Data Time 0.173 (0.330)	Loss 2.5815 (2.6960)	Entropy 0.62879 (0.63060)	Top-1 acc 60.938 (58.951)	Top-5 acc 83.984 (80.562)	lr 0.01402
Train [56][1160/3239]	Time 0.231 (0.811)	Data Time 0.001 (0.339)	Loss 2.5997 (2.6964)	Entropy 0.62864 (0.63058)	Top-1 acc 62.109 (58.942)	Top-5 acc 81.250 (80.552)	lr 0.01402
Train [56][1170/3239]	Time 6.865 (0.813)	Data Time 6.608 (0.341)	Loss 2.6715 (2.6965)	Entropy 0.62860 (0.63056)	Top-1 acc 59.375 (58.934)	Top-5 acc 81.250 (80.542)	lr 0.01401
Train [56][1180/3239]	Time 0.272 (0.817)	Data Time 0.001 (0.345)	Loss 2.9710 (2.6965)	Entropy 0.62877 (0.63055)	Top-1 acc 54.688 (58.942)	Top-5 acc 78.125 (80.553)	lr 0.01401
Train [56][1190/3239]	Time 0.242 (0.829)	Data Time 0.001 (0.358)	Loss 2.6815 (2.6966)	Entropy 0.62903 (0.63053)	Top-1 acc 55.078 (58.936)	Top-5 acc 82.031 (80.553)	lr 0.01401
Train [56][1200/3239]	Time 0.234 (0.826)	Data Time 0.001 (0.355)	Loss 2.7362 (2.6967)	Entropy 0.62878 (0.63052)	Top-1 acc 55.859 (58.926)	Top-5 acc 80.859 (80.553)	lr 0.01401
Train [56][1210/3239]	Time 0.240 (0.832)	Data Time 0.001 (0.362)	Loss 3.0142 (2.6974)	Entropy 0.62915 (0.63051)	Top-1 acc 50.391 (58.910)	Top-5 acc 73.438 (80.542)	lr 0.01401
Train [56][1220/3239]	Time 0.251 (0.842)	Data Time 0.001 (0.372)	Loss 2.6629 (2.6974)	Entropy 0.62904 (0.63050)	Top-1 acc 62.891 (58.911)	Top-5 acc 80.469 (80.540)	lr 0.01401
Train [56][1230/3239]	Time 0.243 (0.839)	Data Time 0.001 (0.369)	Loss 2.5704 (2.6974)	Entropy 0.62906 (0.63048)	Top-1 acc 61.328 (58.916)	Top-5 acc 80.469 (80.535)	lr 0.01401
Train [56][1240/3239]	Time 0.420 (0.871)	Data Time 0.006 (0.375)	Loss 2.6194 (2.6974)	Entropy 0.62905 (0.63047)	Top-1 acc 62.891 (58.918)	Top-5 acc 83.984 (80.536)	lr 0.01401
Train [56][1250/3239]	Time 0.347 (0.868)	Data Time 0.002 (0.372)	Loss 2.9001 (2.6976)	Entropy 0.62846 (0.63046)	Top-1 acc 55.078 (58.915)	Top-5 acc 75.781 (80.535)	lr 0.01401
Train [56][1260/3239]	Time 0.279 (0.865)	Data Time 0.001 (0.369)	Loss 2.8149 (2.6985)	Entropy 0.62848 (0.63044)	Top-1 acc 55.078 (58.895)	Top-5 acc 78.516 (80.518)	lr 0.01401
Train [56][1270/3239]	Time 0.264 (0.862)	Data Time 0.002 (0.366)	Loss 2.6853 (2.6978)	Entropy 0.62864 (0.63043)	Top-1 acc 59.766 (58.912)	Top-5 acc 79.688 (80.533)	lr 0.01400
Train [56][1280/3239]	Time 0.254 (0.869)	Data Time 0.001 (0.374)	Loss 2.6869 (2.6973)	Entropy 0.62869 (0.63042)	Top-1 acc 58.203 (58.922)	Top-5 acc 84.766 (80.544)	lr 0.01400
Train [56][1290/3239]	Time 0.249 (0.871)	Data Time 0.002 (0.376)	Loss 2.7067 (2.6971)	Entropy 0.62862 (0.63040)	Top-1 acc 59.375 (58.930)	Top-5 acc 81.641 (80.544)	lr 0.01400
Train [56][1300/3239]	Time 0.233 (0.868)	Data Time 0.001 (0.374)	Loss 2.4923 (2.6971)	Entropy 0.62870 (0.63039)	Top-1 acc 60.156 (58.930)	Top-5 acc 84.766 (80.550)	lr 0.01400
Train [56][1310/3239]	Time 0.231 (0.883)	Data Time 0.001 (0.389)	Loss 2.6576 (2.6967)	Entropy 0.62878 (0.63038)	Top-1 acc 61.328 (58.943)	Top-5 acc 81.641 (80.557)	lr 0.01400
Train [56][1320/3239]	Time 0.251 (0.887)	Data Time 0.001 (0.394)	Loss 2.6641 (2.6965)	Entropy 0.62864 (0.63036)	Top-1 acc 59.766 (58.937)	Top-5 acc 80.469 (80.561)	lr 0.01400
Train [56][1330/3239]	Time 0.613 (0.884)	Data Time 0.308 (0.391)	Loss 2.8213 (2.6966)	Entropy 0.62888 (0.63035)	Top-1 acc 57.031 (58.942)	Top-5 acc 76.172 (80.559)	lr 0.01400
Train [56][1340/3239]	Time 0.890 (0.895)	Data Time 0.632 (0.403)	Loss 2.6690 (2.6963)	Entropy 0.62878 (0.63034)	Top-1 acc 57.031 (58.952)	Top-5 acc 82.422 (80.565)	lr 0.01400
Train [56][1350/3239]	Time 0.235 (0.898)	Data Time 0.001 (0.407)	Loss 2.6950 (2.6966)	Entropy 0.62853 (0.63033)	Top-1 acc 62.109 (58.947)	Top-5 acc 79.688 (80.559)	lr 0.01400
Train [56][1360/3239]	Time 0.232 (0.894)	Data Time 0.001 (0.404)	Loss 2.7097 (2.6962)	Entropy 0.62860 (0.63031)	Top-1 acc 53.516 (58.951)	Top-5 acc 82.812 (80.565)	lr 0.01400
Train [56][1370/3239]	Time 0.230 (0.902)	Data Time 0.001 (0.412)	Loss 2.9134 (2.6965)	Entropy 0.62852 (0.63030)	Top-1 acc 54.688 (58.944)	Top-5 acc 77.344 (80.556)	lr 0.01399
Train [56][1380/3239]	Time 0.260 (0.905)	Data Time 0.001 (0.415)	Loss 2.5765 (2.6964)	Entropy 0.62852 (0.63029)	Top-1 acc 60.547 (58.943)	Top-5 acc 82.812 (80.553)	lr 0.01399
Train [56][1390/3239]	Time 0.252 (0.902)	Data Time 0.001 (0.413)	Loss 2.7170 (2.6967)	Entropy 0.62847 (0.63028)	Top-1 acc 56.641 (58.936)	Top-5 acc 77.344 (80.548)	lr 0.01399
Train [56][1400/3239]	Time 0.227 (0.910)	Data Time 0.001 (0.421)	Loss 2.8610 (2.6967)	Entropy 0.62852 (0.63026)	Top-1 acc 56.641 (58.936)	Top-5 acc 78.516 (80.550)	lr 0.01399
Train [56][1410/3239]	Time 0.338 (0.914)	Data Time 0.001 (0.426)	Loss 2.8034 (2.6967)	Entropy 0.62879 (0.63025)	Top-1 acc 56.641 (58.930)	Top-5 acc 77.734 (80.548)	lr 0.01399
Train [56][1420/3239]	Time 0.235 (0.911)	Data Time 0.001 (0.423)	Loss 2.5971 (2.6965)	Entropy 0.62888 (0.63024)	Top-1 acc 60.938 (58.934)	Top-5 acc 83.203 (80.555)	lr 0.01399
Train [56][1430/3239]	Time 0.262 (0.917)	Data Time 0.001 (0.430)	Loss 2.8243 (2.6963)	Entropy 0.62841 (0.63023)	Top-1 acc 55.859 (58.937)	Top-5 acc 77.344 (80.561)	lr 0.01399
Train [56][1440/3239]	Time 0.239 (0.921)	Data Time 0.001 (0.434)	Loss 2.7042 (2.6962)	Entropy 0.62854 (0.63022)	Top-1 acc 60.938 (58.952)	Top-5 acc 80.469 (80.568)	lr 0.01399
Train [56][1450/3239]	Time 0.257 (0.920)	Data Time 0.001 (0.434)	Loss 2.7073 (2.6965)	Entropy 0.62855 (0.63021)	Top-1 acc 57.812 (58.944)	Top-5 acc 83.203 (80.561)	lr 0.01399
Train [56][1460/3239]	Time 0.248 (0.916)	Data Time 0.001 (0.431)	Loss 2.4858 (2.6965)	Entropy 0.62829 (0.63020)	Top-1 acc 64.844 (58.950)	Top-5 acc 83.203 (80.555)	lr 0.01399
Train [56][1470/3239]	Time 0.522 (0.925)	Data Time 0.270 (0.440)	Loss 2.6129 (2.6961)	Entropy 0.62799 (0.63018)	Top-1 acc 59.375 (58.955)	Top-5 acc 83.203 (80.562)	lr 0.01398
Train [56][1480/3239]	Time 0.363 (0.926)	Data Time 0.001 (0.441)	Loss 2.6058 (2.6957)	Entropy 0.62819 (0.63017)	Top-1 acc 61.328 (58.966)	Top-5 acc 80.469 (80.569)	lr 0.01398
Train [56][1490/3239]	Time 0.239 (0.928)	Data Time 0.001 (0.444)	Loss 2.8002 (2.6954)	Entropy 0.62797 (0.63015)	Top-1 acc 58.984 (58.977)	Top-5 acc 79.297 (80.571)	lr 0.01398
Train [56][1500/3239]	Time 2.622 (0.932)	Data Time 2.362 (0.448)	Loss 2.6243 (2.6955)	Entropy 0.62832 (0.63014)	Top-1 acc 62.891 (58.976)	Top-5 acc 83.203 (80.569)	lr 0.01398
Train [56][1510/3239]	Time 0.231 (0.934)	Data Time 0.001 (0.450)	Loss 2.7844 (2.6958)	Entropy 0.62815 (0.63013)	Top-1 acc 57.422 (58.965)	Top-5 acc 78.516 (80.562)	lr 0.01398
Train [56][1520/3239]	Time 0.222 (0.937)	Data Time 0.001 (0.454)	Loss 2.8734 (2.6962)	Entropy 0.62818 (0.63012)	Top-1 acc 54.297 (58.955)	Top-5 acc 76.562 (80.558)	lr 0.01398
Train [56][1530/3239]	Time 0.250 (0.939)	Data Time 0.002 (0.457)	Loss 2.8383 (2.6965)	Entropy 0.62834 (0.63010)	Top-1 acc 56.641 (58.946)	Top-5 acc 79.688 (80.559)	lr 0.01398
Train [56][1540/3239]	Time 0.252 (0.942)	Data Time 0.001 (0.460)	Loss 2.6701 (2.6964)	Entropy 0.62842 (0.63009)	Top-1 acc 57.812 (58.945)	Top-5 acc 82.422 (80.558)	lr 0.01398
Train [56][1550/3239]	Time 0.234 (0.945)	Data Time 0.001 (0.463)	Loss 2.7010 (2.6963)	Entropy 0.62870 (0.63008)	Top-1 acc 59.375 (58.954)	Top-5 acc 79.688 (80.557)	lr 0.01398
Train [56][1560/3239]	Time 0.282 (0.948)	Data Time 0.001 (0.467)	Loss 2.7069 (2.6965)	Entropy 0.62837 (0.63007)	Top-1 acc 58.984 (58.949)	Top-5 acc 79.688 (80.549)	lr 0.01398
Train [56][1570/3239]	Time 0.334 (0.951)	Data Time 0.001 (0.470)	Loss 2.7132 (2.6966)	Entropy 0.62817 (0.63006)	Top-1 acc 57.422 (58.950)	Top-5 acc 78.906 (80.548)	lr 0.01397
Train [56][1580/3239]	Time 0.232 (0.954)	Data Time 0.001 (0.474)	Loss 2.5517 (2.6967)	Entropy 0.62843 (0.63005)	Top-1 acc 62.109 (58.956)	Top-5 acc 83.203 (80.545)	lr 0.01397
Train [56][1590/3239]	Time 0.265 (0.957)	Data Time 0.001 (0.478)	Loss 2.7956 (2.6961)	Entropy 0.62854 (0.63004)	Top-1 acc 54.297 (58.972)	Top-5 acc 79.297 (80.555)	lr 0.01397
Train [56][1600/3239]	Time 0.229 (0.959)	Data Time 0.001 (0.479)	Loss 2.8849 (2.6968)	Entropy 0.62839 (0.63003)	Top-1 acc 53.906 (58.952)	Top-5 acc 75.000 (80.541)	lr 0.01397
Train [56][1610/3239]	Time 0.228 (0.962)	Data Time 0.001 (0.483)	Loss 2.7752 (2.6969)	Entropy 0.62821 (0.63002)	Top-1 acc 61.328 (58.956)	Top-5 acc 76.172 (80.537)	lr 0.01397
Train [56][1620/3239]	Time 0.243 (0.959)	Data Time 0.001 (0.480)	Loss 3.0244 (2.6972)	Entropy 0.62830 (0.63001)	Top-1 acc 47.266 (58.945)	Top-5 acc 74.609 (80.534)	lr 0.01397
Train [56][1630/3239]	Time 0.233 (0.964)	Data Time 0.001 (0.485)	Loss 2.8200 (2.6974)	Entropy 0.62805 (0.63000)	Top-1 acc 55.859 (58.941)	Top-5 acc 76.953 (80.527)	lr 0.01397
Train [56][1640/3239]	Time 0.331 (0.964)	Data Time 0.001 (0.486)	Loss 2.7818 (2.6974)	Entropy 0.62803 (0.62998)	Top-1 acc 55.859 (58.938)	Top-5 acc 83.203 (80.531)	lr 0.01397
Train [56][1650/3239]	Time 0.239 (0.969)	Data Time 0.001 (0.491)	Loss 2.8912 (2.6974)	Entropy 0.62795 (0.62997)	Top-1 acc 59.766 (58.942)	Top-5 acc 75.000 (80.526)	lr 0.01397
Train [56][1660/3239]	Time 0.251 (0.974)	Data Time 0.001 (0.497)	Loss 2.6608 (2.6975)	Entropy 0.62799 (0.62996)	Top-1 acc 58.594 (58.937)	Top-5 acc 79.297 (80.521)	lr 0.01397
Train [56][1670/3239]	Time 0.227 (0.972)	Data Time 0.001 (0.495)	Loss 2.7274 (2.6971)	Entropy 0.62776 (0.62995)	Top-1 acc 59.375 (58.942)	Top-5 acc 77.734 (80.527)	lr 0.01396
Train [56][1680/3239]	Time 0.251 (0.980)	Data Time 0.001 (0.503)	Loss 2.6058 (2.6973)	Entropy 0.62791 (0.62994)	Top-1 acc 61.719 (58.940)	Top-5 acc 82.422 (80.523)	lr 0.01396
Train [56][1690/3239]	Time 0.227 (0.981)	Data Time 0.001 (0.504)	Loss 2.9465 (2.6977)	Entropy 0.62790 (0.62992)	Top-1 acc 53.125 (58.922)	Top-5 acc 75.000 (80.516)	lr 0.01396
Train [56][1700/3239]	Time 0.246 (0.982)	Data Time 0.001 (0.506)	Loss 2.6954 (2.6979)	Entropy 0.62804 (0.62991)	Top-1 acc 60.156 (58.912)	Top-5 acc 82.812 (80.514)	lr 0.01396
Train [56][1710/3239]	Time 0.242 (0.982)	Data Time 0.001 (0.506)	Loss 2.7081 (2.6981)	Entropy 0.62801 (0.62990)	Top-1 acc 59.766 (58.913)	Top-5 acc 79.688 (80.512)	lr 0.01396
Train [56][1720/3239]	Time 0.234 (0.990)	Data Time 0.001 (0.515)	Loss 2.6985 (2.6984)	Entropy 0.62800 (0.62989)	Top-1 acc 59.375 (58.904)	Top-5 acc 77.344 (80.506)	lr 0.01396
Train [56][1730/3239]	Time 0.259 (0.991)	Data Time 0.001 (0.516)	Loss 2.7936 (2.6984)	Entropy 0.62785 (0.62988)	Top-1 acc 54.688 (58.905)	Top-5 acc 81.641 (80.505)	lr 0.01396
Train [56][1740/3239]	Time 0.256 (0.990)	Data Time 0.001 (0.515)	Loss 2.5779 (2.6980)	Entropy 0.62780 (0.62987)	Top-1 acc 63.281 (58.910)	Top-5 acc 82.031 (80.510)	lr 0.01396
Train [56][1750/3239]	Time 0.242 (0.997)	Data Time 0.001 (0.523)	Loss 2.7846 (2.6981)	Entropy 0.62767 (0.62985)	Top-1 acc 56.250 (58.901)	Top-5 acc 77.734 (80.510)	lr 0.01396
Train [56][1760/3239]	Time 0.222 (0.997)	Data Time 0.001 (0.522)	Loss 3.0358 (2.6981)	Entropy 0.62762 (0.62984)	Top-1 acc 50.391 (58.901)	Top-5 acc 76.953 (80.515)	lr 0.01396
Train [56][1770/3239]	Time 0.242 (0.997)	Data Time 0.002 (0.523)	Loss 2.7527 (2.6980)	Entropy 0.62751 (0.62983)	Top-1 acc 55.859 (58.905)	Top-5 acc 76.562 (80.517)	lr 0.01395
Train [56][1780/3239]	Time 0.251 (1.003)	Data Time 0.001 (0.530)	Loss 2.6531 (2.6978)	Entropy 0.62795 (0.62982)	Top-1 acc 61.719 (58.907)	Top-5 acc 80.469 (80.520)	lr 0.01395
Train [56][1790/3239]	Time 1.978 (1.004)	Data Time 1.729 (0.531)	Loss 2.6851 (2.6979)	Entropy 0.62779 (0.62981)	Top-1 acc 59.375 (58.904)	Top-5 acc 80.469 (80.517)	lr 0.01395
Train [56][1800/3239]	Time 0.340 (1.001)	Data Time 0.001 (0.528)	Loss 2.7488 (2.6978)	Entropy 0.62774 (0.62979)	Top-1 acc 56.250 (58.908)	Top-5 acc 79.297 (80.521)	lr 0.01395
Train [56][1810/3239]	Time 0.288 (1.014)	Data Time 0.033 (0.541)	Loss 2.7055 (2.6978)	Entropy 0.62805 (0.62978)	Top-1 acc 58.594 (58.911)	Top-5 acc 80.078 (80.524)	lr 0.01395
Train [56][1820/3239]	Time 0.241 (1.014)	Data Time 0.001 (0.541)	Loss 2.5567 (2.6979)	Entropy 0.62789 (0.62977)	Top-1 acc 61.328 (58.914)	Top-5 acc 81.641 (80.521)	lr 0.01395
Train [56][1830/3239]	Time 0.252 (1.011)	Data Time 0.001 (0.539)	Loss 2.7211 (2.6975)	Entropy 0.62778 (0.62976)	Top-1 acc 58.594 (58.920)	Top-5 acc 77.344 (80.525)	lr 0.01395
Train [56][1840/3239]	Time 0.266 (1.022)	Data Time 0.001 (0.550)	Loss 2.7339 (2.6974)	Entropy 0.62776 (0.62975)	Top-1 acc 56.250 (58.918)	Top-5 acc 80.469 (80.528)	lr 0.01395
Train [56][1850/3239]	Time 0.245 (1.024)	Data Time 0.002 (0.552)	Loss 2.5638 (2.6974)	Entropy 0.62807 (0.62974)	Top-1 acc 63.672 (58.913)	Top-5 acc 84.375 (80.529)	lr 0.01395
Train [56][1860/3239]	Time 0.279 (1.022)	Data Time 0.001 (0.550)	Loss 2.5860 (2.6970)	Entropy 0.62809 (0.62973)	Top-1 acc 63.281 (58.924)	Top-5 acc 80.078 (80.534)	lr 0.01395
Train [56][1870/3239]	Time 0.356 (1.022)	Data Time 0.001 (0.550)	Loss 3.0281 (2.6970)	Entropy 0.62809 (0.62972)	Top-1 acc 48.438 (58.926)	Top-5 acc 75.000 (80.535)	lr 0.01394
Train [56][1880/3239]	Time 0.237 (1.035)	Data Time 0.001 (0.563)	Loss 2.6164 (2.6968)	Entropy 0.62803 (0.62972)	Top-1 acc 58.984 (58.928)	Top-5 acc 82.422 (80.539)	lr 0.01394
Train [56][1890/3239]	Time 0.234 (1.033)	Data Time 0.001 (0.561)	Loss 2.6098 (2.6970)	Entropy 0.62800 (0.62971)	Top-1 acc 62.109 (58.933)	Top-5 acc 81.250 (80.534)	lr 0.01394
Train [56][1900/3239]	Time 0.328 (1.048)	Data Time 0.002 (0.559)	Loss 2.6124 (2.6972)	Entropy 0.62767 (0.62970)	Top-1 acc 64.453 (58.938)	Top-5 acc 82.031 (80.527)	lr 0.01394
Train [56][1910/3239]	Time 0.274 (1.045)	Data Time 0.002 (0.556)	Loss 2.6319 (2.6971)	Entropy 0.62738 (0.62969)	Top-1 acc 58.594 (58.937)	Top-5 acc 82.031 (80.525)	lr 0.01394
Train [56][1920/3239]	Time 0.264 (1.042)	Data Time 0.002 (0.553)	Loss 2.4434 (2.6972)	Entropy 0.62735 (0.62967)	Top-1 acc 64.062 (58.936)	Top-5 acc 83.594 (80.523)	lr 0.01394
Train [56][1930/3239]	Time 0.250 (1.040)	Data Time 0.001 (0.551)	Loss 2.5963 (2.6968)	Entropy 0.62758 (0.62966)	Top-1 acc 61.719 (58.946)	Top-5 acc 80.859 (80.529)	lr 0.01394
Train [56][1940/3239]	Time 0.236 (1.046)	Data Time 0.001 (0.558)	Loss 2.7146 (2.6969)	Entropy 0.62784 (0.62965)	Top-1 acc 57.031 (58.942)	Top-5 acc 80.469 (80.530)	lr 0.01394
Train [56][1950/3239]	Time 2.544 (1.048)	Data Time 2.252 (0.560)	Loss 2.7353 (2.6970)	Entropy 0.62791 (0.62964)	Top-1 acc 60.156 (58.943)	Top-5 acc 81.250 (80.528)	lr 0.01394
Train [56][1960/3239]	Time 0.337 (1.045)	Data Time 0.002 (0.557)	Loss 2.7928 (2.6971)	Entropy 0.62795 (0.62963)	Top-1 acc 57.422 (58.944)	Top-5 acc 81.250 (80.528)	lr 0.01394
Train [56][1970/3239]	Time 0.234 (1.055)	Data Time 0.002 (0.568)	Loss 2.6624 (2.6970)	Entropy 0.62772 (0.62962)	Top-1 acc 57.422 (58.945)	Top-5 acc 78.906 (80.526)	lr 0.01393
Train [56][1980/3239]	Time 0.264 (1.057)	Data Time 0.002 (0.570)	Loss 2.6371 (2.6967)	Entropy 0.62763 (0.62961)	Top-1 acc 60.156 (58.953)	Top-5 acc 82.812 (80.531)	lr 0.01393
Train [56][1990/3239]	Time 0.240 (1.055)	Data Time 0.001 (0.568)	Loss 2.5551 (2.6967)	Entropy 0.62761 (0.62961)	Top-1 acc 60.547 (58.951)	Top-5 acc 83.984 (80.526)	lr 0.01393
Train [56][2000/3239]	Time 0.225 (1.063)	Data Time 0.001 (0.577)	Loss 2.7161 (2.6965)	Entropy 0.62777 (0.62960)	Top-1 acc 59.766 (58.960)	Top-5 acc 77.734 (80.530)	lr 0.01393
Train [56][2010/3239]	Time 0.240 (1.068)	Data Time 0.001 (0.581)	Loss 2.5069 (2.6964)	Entropy 0.62790 (0.62959)	Top-1 acc 64.453 (58.967)	Top-5 acc 85.156 (80.533)	lr 0.01393
Train [56][2020/3239]	Time 0.256 (1.065)	Data Time 0.001 (0.579)	Loss 2.6102 (2.6962)	Entropy 0.62782 (0.62958)	Top-1 acc 60.547 (58.963)	Top-5 acc 80.469 (80.538)	lr 0.01393
Train [56][2030/3239]	Time 0.239 (1.068)	Data Time 0.001 (0.582)	Loss 2.6192 (2.6964)	Entropy 0.62790 (0.62957)	Top-1 acc 60.938 (58.953)	Top-5 acc 79.688 (80.534)	lr 0.01393
Train [56][2040/3239]	Time 0.240 (1.077)	Data Time 0.001 (0.592)	Loss 2.7602 (2.6963)	Entropy 0.62813 (0.62956)	Top-1 acc 59.766 (58.956)	Top-5 acc 79.688 (80.536)	lr 0.01393
Train [56][2050/3239]	Time 0.243 (1.074)	Data Time 0.001 (0.589)	Loss 2.6480 (2.6959)	Entropy 0.62804 (0.62956)	Top-1 acc 59.766 (58.963)	Top-5 acc 81.641 (80.543)	lr 0.01393
Train [56][2060/3239]	Time 0.241 (1.075)	Data Time 0.001 (0.590)	Loss 2.6803 (2.6959)	Entropy 0.62816 (0.62955)	Top-1 acc 62.891 (58.964)	Top-5 acc 81.250 (80.543)	lr 0.01393
Train [56][2070/3239]	Time 0.261 (1.087)	Data Time 0.001 (0.602)	Loss 2.4961 (2.6959)	Entropy 0.62843 (0.62954)	Top-1 acc 64.844 (58.967)	Top-5 acc 85.547 (80.540)	lr 0.01392
Train [56][2080/3239]	Time 0.235 (1.084)	Data Time 0.001 (0.599)	Loss 2.6731 (2.6960)	Entropy 0.62825 (0.62954)	Top-1 acc 57.031 (58.961)	Top-5 acc 83.594 (80.540)	lr 0.01392
Train [56][2090/3239]	Time 0.245 (1.084)	Data Time 0.001 (0.600)	Loss 2.8189 (2.6959)	Entropy 0.62821 (0.62953)	Top-1 acc 54.297 (58.966)	Top-5 acc 81.250 (80.547)	lr 0.01392
Train [56][2100/3239]	Time 0.240 (1.087)	Data Time 0.001 (0.603)	Loss 2.6536 (2.6959)	Entropy 0.62829 (0.62952)	Top-1 acc 59.766 (58.964)	Top-5 acc 83.203 (80.546)	lr 0.01392
Train [56][2110/3239]	Time 0.229 (1.092)	Data Time 0.001 (0.609)	Loss 2.8391 (2.6962)	Entropy 0.62815 (0.62952)	Top-1 acc 57.422 (58.955)	Top-5 acc 76.562 (80.538)	lr 0.01392
Train [56][2120/3239]	Time 0.348 (1.089)	Data Time 0.001 (0.606)	Loss 2.6821 (2.6964)	Entropy 0.62816 (0.62951)	Top-1 acc 57.812 (58.947)	Top-5 acc 80.469 (80.536)	lr 0.01392
Train [56][2130/3239]	Time 0.243 (1.095)	Data Time 0.002 (0.612)	Loss 2.9155 (2.6966)	Entropy 0.62818 (0.62950)	Top-1 acc 54.297 (58.947)	Top-5 acc 73.828 (80.535)	lr 0.01392
Train [56][2140/3239]	Time 0.248 (1.101)	Data Time 0.001 (0.618)	Loss 2.6048 (2.6968)	Entropy 0.62791 (0.62950)	Top-1 acc 62.109 (58.937)	Top-5 acc 82.422 (80.531)	lr 0.01392
Train [56][2150/3239]	Time 0.250 (1.097)	Data Time 0.001 (0.615)	Loss 2.7249 (2.6966)	Entropy 0.62797 (0.62949)	Top-1 acc 61.328 (58.942)	Top-5 acc 80.469 (80.536)	lr 0.01392
Train [56][2160/3239]	Time 0.237 (1.104)	Data Time 0.001 (0.622)	Loss 2.6286 (2.6967)	Entropy 0.62775 (0.62948)	Top-1 acc 60.938 (58.939)	Top-5 acc 80.078 (80.534)	lr 0.01392
Train [56][2170/3239]	Time 0.290 (1.108)	Data Time 0.001 (0.626)	Loss 2.6629 (2.6969)	Entropy 0.62766 (0.62948)	Top-1 acc 60.156 (58.937)	Top-5 acc 80.469 (80.534)	lr 0.01391
Train [56][2180/3239]	Time 0.235 (1.105)	Data Time 0.001 (0.624)	Loss 2.6102 (2.6970)	Entropy 0.62804 (0.62947)	Top-1 acc 60.156 (58.932)	Top-5 acc 82.812 (80.531)	lr 0.01391
Train [56][2190/3239]	Time 0.353 (1.109)	Data Time 0.001 (0.628)	Loss 2.7024 (2.6968)	Entropy 0.62803 (0.62946)	Top-1 acc 55.859 (58.935)	Top-5 acc 80.469 (80.537)	lr 0.01391
Train [56][2200/3239]	Time 0.253 (1.114)	Data Time 0.001 (0.633)	Loss 2.6323 (2.6967)	Entropy 0.62830 (0.62946)	Top-1 acc 64.453 (58.942)	Top-5 acc 79.688 (80.534)	lr 0.01391
Train [56][2210/3239]	Time 0.250 (1.115)	Data Time 0.001 (0.634)	Loss 2.8144 (2.6969)	Entropy 0.62807 (0.62945)	Top-1 acc 51.953 (58.935)	Top-5 acc 80.859 (80.533)	lr 0.01391
Train [56][2220/3239]	Time 0.269 (1.117)	Data Time 0.001 (0.636)	Loss 2.7395 (2.6968)	Entropy 0.62808 (0.62944)	Top-1 acc 59.766 (58.935)	Top-5 acc 79.297 (80.532)	lr 0.01391
Train [56][2230/3239]	Time 0.277 (1.119)	Data Time 0.002 (0.638)	Loss 2.6942 (2.6967)	Entropy 0.62839 (0.62944)	Top-1 acc 60.938 (58.939)	Top-5 acc 78.906 (80.539)	lr 0.01391
Train [56][2240/3239]	Time 0.247 (1.120)	Data Time 0.001 (0.640)	Loss 2.5924 (2.6967)	Entropy 0.62787 (0.62943)	Top-1 acc 62.500 (58.937)	Top-5 acc 82.031 (80.538)	lr 0.01391
Train [56][2250/3239]	Time 0.255 (1.121)	Data Time 0.001 (0.641)	Loss 2.6797 (2.6965)	Entropy 0.62790 (0.62943)	Top-1 acc 61.719 (58.945)	Top-5 acc 82.031 (80.537)	lr 0.01391
Train [56][2260/3239]	Time 0.233 (1.119)	Data Time 0.001 (0.639)	Loss 2.8319 (2.6965)	Entropy 0.62787 (0.62942)	Top-1 acc 55.859 (58.947)	Top-5 acc 76.953 (80.539)	lr 0.01391
Train [56][2270/3239]	Time 0.244 (1.122)	Data Time 0.001 (0.643)	Loss 2.4464 (2.6964)	Entropy 0.62802 (0.62941)	Top-1 acc 67.578 (58.952)	Top-5 acc 83.203 (80.535)	lr 0.01390
Train [56][2280/3239]	Time 0.353 (1.119)	Data Time 0.002 (0.640)	Loss 2.7743 (2.6969)	Entropy 0.62825 (0.62941)	Top-1 acc 54.297 (58.942)	Top-5 acc 78.906 (80.524)	lr 0.01390
Train [56][2290/3239]	Time 0.227 (1.121)	Data Time 0.001 (0.642)	Loss 2.4922 (2.6967)	Entropy 0.62850 (0.62940)	Top-1 acc 64.453 (58.951)	Top-5 acc 83.203 (80.524)	lr 0.01390
Train [56][2300/3239]	Time 13.559 (1.124)	Data Time 13.312 (0.646)	Loss 2.7911 (2.6964)	Entropy 0.62883 (0.62940)	Top-1 acc 51.562 (58.959)	Top-5 acc 80.859 (80.532)	lr 0.01390
Train [56][2310/3239]	Time 0.232 (1.121)	Data Time 0.001 (0.643)	Loss 2.8561 (2.6963)	Entropy 0.62864 (0.62940)	Top-1 acc 56.641 (58.958)	Top-5 acc 77.734 (80.536)	lr 0.01390
Train [56][2320/3239]	Time 0.260 (1.124)	Data Time 0.029 (0.646)	Loss 2.8165 (2.6963)	Entropy 0.62867 (0.62939)	Top-1 acc 54.297 (58.955)	Top-5 acc 78.125 (80.540)	lr 0.01390
Train [56][2330/3239]	Time 0.231 (1.121)	Data Time 0.001 (0.643)	Loss 2.4651 (2.6962)	Entropy 0.62851 (0.62939)	Top-1 acc 64.062 (58.958)	Top-5 acc 84.375 (80.538)	lr 0.01390
Train [56][2340/3239]	Time 0.227 (1.122)	Data Time 0.001 (0.645)	Loss 2.8979 (2.6963)	Entropy 0.62835 (0.62938)	Top-1 acc 53.906 (58.957)	Top-5 acc 79.688 (80.535)	lr 0.01390
Train [56][2350/3239]	Time 0.335 (1.124)	Data Time 0.001 (0.647)	Loss 2.7509 (2.6962)	Entropy 0.62838 (0.62938)	Top-1 acc 55.078 (58.955)	Top-5 acc 79.297 (80.541)	lr 0.01390
Train [56][2360/3239]	Time 0.241 (1.123)	Data Time 0.001 (0.646)	Loss 2.6464 (2.6962)	Entropy 0.62856 (0.62938)	Top-1 acc 59.766 (58.954)	Top-5 acc 81.641 (80.543)	lr 0.01389
Train [56][2370/3239]	Time 0.239 (1.125)	Data Time 0.001 (0.648)	Loss 2.7922 (2.6958)	Entropy 0.62856 (0.62937)	Top-1 acc 50.781 (58.958)	Top-5 acc 77.734 (80.549)	lr 0.01389
Train [56][2380/3239]	Time 0.245 (1.127)	Data Time 0.001 (0.650)	Loss 2.7107 (2.6955)	Entropy 0.62862 (0.62937)	Top-1 acc 57.422 (58.962)	Top-5 acc 79.297 (80.555)	lr 0.01389
Train [56][2390/3239]	Time 0.218 (1.126)	Data Time 0.001 (0.650)	Loss 2.7233 (2.6952)	Entropy 0.62900 (0.62937)	Top-1 acc 57.422 (58.969)	Top-5 acc 81.641 (80.568)	lr 0.01389
Train [56][2400/3239]	Time 0.248 (1.127)	Data Time 0.002 (0.651)	Loss 2.6424 (2.6953)	Entropy 0.62900 (0.62936)	Top-1 acc 60.547 (58.972)	Top-5 acc 80.859 (80.565)	lr 0.01389
Train [56][2410/3239]	Time 0.224 (1.128)	Data Time 0.001 (0.653)	Loss 2.8240 (2.6953)	Entropy 0.62908 (0.62936)	Top-1 acc 58.594 (58.969)	Top-5 acc 78.516 (80.566)	lr 0.01389
Train [56][2420/3239]	Time 0.237 (1.127)	Data Time 0.001 (0.652)	Loss 2.5651 (2.6952)	Entropy 0.62940 (0.62936)	Top-1 acc 60.156 (58.972)	Top-5 acc 82.812 (80.568)	lr 0.01389
Train [56][2430/3239]	Time 0.223 (1.129)	Data Time 0.001 (0.654)	Loss 2.7311 (2.6952)	Entropy 0.62895 (0.62936)	Top-1 acc 57.812 (58.970)	Top-5 acc 80.469 (80.569)	lr 0.01389
Train [56][2440/3239]	Time 0.862 (1.126)	Data Time 0.554 (0.652)	Loss 2.6546 (2.6952)	Entropy 0.62881 (0.62936)	Top-1 acc 60.547 (58.970)	Top-5 acc 82.031 (80.573)	lr 0.01389
Train [56][2450/3239]	Time 0.232 (1.129)	Data Time 0.001 (0.655)	Loss 2.6250 (2.6955)	Entropy 0.62906 (0.62936)	Top-1 acc 64.453 (58.965)	Top-5 acc 82.812 (80.568)	lr 0.01389
Train [56][2460/3239]	Time 10.383 (1.130)	Data Time 10.139 (0.656)	Loss 2.6486 (2.6956)	Entropy 0.62916 (0.62936)	Top-1 acc 60.547 (58.962)	Top-5 acc 78.516 (80.565)	lr 0.01388
Train [56][2470/3239]	Time 0.231 (1.127)	Data Time 0.001 (0.653)	Loss 2.5994 (2.6960)	Entropy 0.62902 (0.62936)	Top-1 acc 64.062 (58.956)	Top-5 acc 83.203 (80.556)	lr 0.01388
Train [56][2480/3239]	Time 0.247 (1.132)	Data Time 0.001 (0.659)	Loss 2.5901 (2.6958)	Entropy 0.62898 (0.62936)	Top-1 acc 62.891 (58.961)	Top-5 acc 80.859 (80.559)	lr 0.01388
Train [56][2490/3239]	Time 0.236 (1.130)	Data Time 0.001 (0.656)	Loss 2.5728 (2.6959)	Entropy 0.62912 (0.62935)	Top-1 acc 60.938 (58.957)	Top-5 acc 83.203 (80.557)	lr 0.01388
Train [56][2500/3239]	Time 0.239 (1.128)	Data Time 0.001 (0.655)	Loss 2.4827 (2.6955)	Entropy 0.62862 (0.62935)	Top-1 acc 63.672 (58.967)	Top-5 acc 83.984 (80.564)	lr 0.01388
Train [56][2510/3239]	Time 0.330 (1.132)	Data Time 0.001 (0.659)	Loss 2.8107 (2.6952)	Entropy 0.62887 (0.62935)	Top-1 acc 55.859 (58.970)	Top-5 acc 77.734 (80.572)	lr 0.01388
Train [56][2520/3239]	Time 0.241 (1.131)	Data Time 0.001 (0.658)	Loss 2.7548 (2.6954)	Entropy 0.62862 (0.62935)	Top-1 acc 57.031 (58.965)	Top-5 acc 79.297 (80.569)	lr 0.01388
Train [56][2530/3239]	Time 0.251 (1.131)	Data Time 0.001 (0.659)	Loss 2.7783 (2.6952)	Entropy 0.62859 (0.62934)	Top-1 acc 59.375 (58.969)	Top-5 acc 77.734 (80.570)	lr 0.01388
Train [56][2540/3239]	Time 0.259 (1.134)	Data Time 0.001 (0.661)	Loss 2.6731 (2.6954)	Entropy 0.62792 (0.62934)	Top-1 acc 58.594 (58.965)	Top-5 acc 80.859 (80.562)	lr 0.01388
Train [56][2550/3239]	Time 0.422 (1.145)	Data Time 0.005 (0.661)	Loss 2.6525 (2.6956)	Entropy 0.62814 (0.62933)	Top-1 acc 57.422 (58.959)	Top-5 acc 85.547 (80.562)	lr 0.01388
Train [56][2560/3239]	Time 0.242 (1.143)	Data Time 0.002 (0.658)	Loss 2.5595 (2.6956)	Entropy 0.62842 (0.62933)	Top-1 acc 62.500 (58.963)	Top-5 acc 83.203 (80.560)	lr 0.01387
Train [56][2570/3239]	Time 0.272 (1.140)	Data Time 0.030 (0.655)	Loss 2.5872 (2.6959)	Entropy 0.62819 (0.62933)	Top-1 acc 64.062 (58.952)	Top-5 acc 79.297 (80.551)	lr 0.01387
Train [56][2580/3239]	Time 0.266 (1.138)	Data Time 0.002 (0.653)	Loss 2.7285 (2.6960)	Entropy 0.62825 (0.62932)	Top-1 acc 56.250 (58.945)	Top-5 acc 80.469 (80.548)	lr 0.01387
Train [56][2590/3239]	Time 0.239 (1.136)	Data Time 0.001 (0.651)	Loss 2.8645 (2.6960)	Entropy 0.62843 (0.62932)	Top-1 acc 55.469 (58.944)	Top-5 acc 77.344 (80.551)	lr 0.01387
Train [56][2600/3239]	Time 0.246 (1.133)	Data Time 0.001 (0.649)	Loss 2.5862 (2.6960)	Entropy 0.62856 (0.62932)	Top-1 acc 66.016 (58.947)	Top-5 acc 81.641 (80.550)	lr 0.01387
Train [56][2610/3239]	Time 0.236 (1.135)	Data Time 0.001 (0.651)	Loss 2.6020 (2.6961)	Entropy 0.62849 (0.62931)	Top-1 acc 61.719 (58.946)	Top-5 acc 83.984 (80.552)	lr 0.01387
Train [56][2620/3239]	Time 12.126 (1.137)	Data Time 11.875 (0.654)	Loss 2.6535 (2.6962)	Entropy 0.62876 (0.62931)	Top-1 acc 58.984 (58.939)	Top-5 acc 82.422 (80.548)	lr 0.01387
Train [56][2630/3239]	Time 0.227 (1.135)	Data Time 0.001 (0.651)	Loss 2.5914 (2.6962)	Entropy 0.62860 (0.62931)	Top-1 acc 58.594 (58.939)	Top-5 acc 82.031 (80.549)	lr 0.01387
Train [56][2640/3239]	Time 0.254 (1.137)	Data Time 0.001 (0.654)	Loss 2.5757 (2.6963)	Entropy 0.62845 (0.62930)	Top-1 acc 63.281 (58.940)	Top-5 acc 82.031 (80.545)	lr 0.01387
Train [56][2650/3239]	Time 0.256 (1.134)	Data Time 0.001 (0.651)	Loss 2.6904 (2.6966)	Entropy 0.62833 (0.62930)	Top-1 acc 57.031 (58.935)	Top-5 acc 78.906 (80.535)	lr 0.01387
Train [56][2660/3239]	Time 0.230 (1.136)	Data Time 0.001 (0.654)	Loss 2.8733 (2.6965)	Entropy 0.62834 (0.62930)	Top-1 acc 57.031 (58.939)	Top-5 acc 74.609 (80.538)	lr 0.01386
Train [56][2670/3239]	Time 2.472 (1.139)	Data Time 2.135 (0.657)	Loss 2.5124 (2.6964)	Entropy 0.62797 (0.62929)	Top-1 acc 65.625 (58.942)	Top-5 acc 84.375 (80.540)	lr 0.01386
Train [56][2680/3239]	Time 0.253 (1.137)	Data Time 0.001 (0.655)	Loss 2.6265 (2.6963)	Entropy 0.62806 (0.62929)	Top-1 acc 61.328 (58.944)	Top-5 acc 83.984 (80.541)	lr 0.01386
Train [56][2690/3239]	Time 0.239 (1.139)	Data Time 0.001 (0.657)	Loss 2.6536 (2.6962)	Entropy 0.62816 (0.62928)	Top-1 acc 59.375 (58.949)	Top-5 acc 83.203 (80.545)	lr 0.01386
Train [56][2700/3239]	Time 0.221 (1.140)	Data Time 0.001 (0.659)	Loss 2.8895 (2.6963)	Entropy 0.62842 (0.62928)	Top-1 acc 56.250 (58.951)	Top-5 acc 77.344 (80.539)	lr 0.01386
Train [56][2710/3239]	Time 0.671 (1.139)	Data Time 0.395 (0.657)	Loss 2.5951 (2.6963)	Entropy 0.62854 (0.62928)	Top-1 acc 60.938 (58.948)	Top-5 acc 80.469 (80.541)	lr 0.01386
Train [56][2720/3239]	Time 0.238 (1.141)	Data Time 0.001 (0.660)	Loss 2.7896 (2.6963)	Entropy 0.62830 (0.62927)	Top-1 acc 56.641 (58.944)	Top-5 acc 79.688 (80.541)	lr 0.01386
Train [56][2730/3239]	Time 0.231 (1.143)	Data Time 0.001 (0.662)	Loss 2.8037 (2.6964)	Entropy 0.62858 (0.62927)	Top-1 acc 55.469 (58.942)	Top-5 acc 78.906 (80.539)	lr 0.01386
Train [56][2740/3239]	Time 0.347 (1.140)	Data Time 0.002 (0.660)	Loss 2.5748 (2.6963)	Entropy 0.62854 (0.62927)	Top-1 acc 63.281 (58.948)	Top-5 acc 82.031 (80.541)	lr 0.01386
Train [56][2750/3239]	Time 0.227 (1.143)	Data Time 0.001 (0.662)	Loss 2.5925 (2.6961)	Entropy 0.62858 (0.62927)	Top-1 acc 60.156 (58.955)	Top-5 acc 84.375 (80.545)	lr 0.01386
Train [56][2760/3239]	Time 0.233 (1.140)	Data Time 0.001 (0.660)	Loss 2.7507 (2.6960)	Entropy 0.62874 (0.62926)	Top-1 acc 57.422 (58.957)	Top-5 acc 78.125 (80.545)	lr 0.01385
Train [56][2770/3239]	Time 0.228 (1.142)	Data Time 0.001 (0.662)	Loss 2.7923 (2.6962)	Entropy 0.62881 (0.62926)	Top-1 acc 57.422 (58.954)	Top-5 acc 76.953 (80.542)	lr 0.01385
Train [56][2780/3239]	Time 11.261 (1.144)	Data Time 11.008 (0.664)	Loss 2.5375 (2.6963)	Entropy 0.62911 (0.62926)	Top-1 acc 63.672 (58.952)	Top-5 acc 83.984 (80.535)	lr 0.01385
Train [56][2790/3239]	Time 0.233 (1.142)	Data Time 0.001 (0.662)	Loss 2.5661 (2.6963)	Entropy 0.62920 (0.62926)	Top-1 acc 60.547 (58.954)	Top-5 acc 83.984 (80.536)	lr 0.01385
Train [56][2800/3239]	Time 0.229 (1.146)	Data Time 0.001 (0.667)	Loss 2.9377 (2.6962)	Entropy 0.62935 (0.62926)	Top-1 acc 53.516 (58.955)	Top-5 acc 75.000 (80.536)	lr 0.01385
Train [56][2810/3239]	Time 0.294 (1.144)	Data Time 0.002 (0.665)	Loss 2.6635 (2.6964)	Entropy 0.62946 (0.62926)	Top-1 acc 59.766 (58.953)	Top-5 acc 79.297 (80.530)	lr 0.01385
Train [56][2820/3239]	Time 0.246 (1.145)	Data Time 0.001 (0.666)	Loss 2.7926 (2.6963)	Entropy 0.62916 (0.62926)	Top-1 acc 56.641 (58.956)	Top-5 acc 77.734 (80.532)	lr 0.01385
Train [56][2830/3239]	Time 0.329 (1.148)	Data Time 0.001 (0.669)	Loss 2.4512 (2.6962)	Entropy 0.62933 (0.62926)	Top-1 acc 65.625 (58.956)	Top-5 acc 83.984 (80.535)	lr 0.01385
Train [56][2840/3239]	Time 0.305 (1.146)	Data Time 0.001 (0.667)	Loss 2.7477 (2.6960)	Entropy 0.62960 (0.62926)	Top-1 acc 59.375 (58.961)	Top-5 acc 78.906 (80.539)	lr 0.01385
Train [56][2850/3239]	Time 0.260 (1.148)	Data Time 0.001 (0.669)	Loss 2.6859 (2.6960)	Entropy 0.62945 (0.62926)	Top-1 acc 61.719 (58.958)	Top-5 acc 80.859 (80.542)	lr 0.01385
Train [56][2860/3239]	Time 0.255 (1.150)	Data Time 0.001 (0.672)	Loss 2.6456 (2.6961)	Entropy 0.62978 (0.62926)	Top-1 acc 58.594 (58.956)	Top-5 acc 82.422 (80.538)	lr 0.01384
Train [56][2870/3239]	Time 0.245 (1.148)	Data Time 0.001 (0.670)	Loss 2.7416 (2.6963)	Entropy 0.63012 (0.62926)	Top-1 acc 57.422 (58.951)	Top-5 acc 79.688 (80.534)	lr 0.01384
Train [56][2880/3239]	Time 0.256 (1.149)	Data Time 0.001 (0.671)	Loss 2.8908 (2.6966)	Entropy 0.63040 (0.62927)	Top-1 acc 57.031 (58.948)	Top-5 acc 76.953 (80.528)	lr 0.01384
Train [56][2890/3239]	Time 0.228 (1.152)	Data Time 0.001 (0.674)	Loss 2.6497 (2.6965)	Entropy 0.63066 (0.62927)	Top-1 acc 59.766 (58.946)	Top-5 acc 81.250 (80.530)	lr 0.01384
Train [56][2900/3239]	Time 0.342 (1.149)	Data Time 0.001 (0.672)	Loss 2.7301 (2.6964)	Entropy 0.63095 (0.62928)	Top-1 acc 55.859 (58.950)	Top-5 acc 79.297 (80.532)	lr 0.01384
Train [56][2910/3239]	Time 0.233 (1.152)	Data Time 0.001 (0.674)	Loss 2.6059 (2.6962)	Entropy 0.63095 (0.62928)	Top-1 acc 62.500 (58.953)	Top-5 acc 82.422 (80.534)	lr 0.01384
Train [56][2920/3239]	Time 0.251 (1.149)	Data Time 0.001 (0.672)	Loss 2.6955 (2.6962)	Entropy 0.63074 (0.62929)	Top-1 acc 58.594 (58.956)	Top-5 acc 80.859 (80.533)	lr 0.01384
Train [56][2930/3239]	Time 0.236 (1.151)	Data Time 0.001 (0.674)	Loss 2.7772 (2.6962)	Entropy 0.63078 (0.62929)	Top-1 acc 58.594 (58.956)	Top-5 acc 77.734 (80.531)	lr 0.01384
Train [56][2940/3239]	Time 12.923 (1.155)	Data Time 12.653 (0.678)	Loss 2.6061 (2.6961)	Entropy 0.63093 (0.62930)	Top-1 acc 60.547 (58.958)	Top-5 acc 80.078 (80.533)	lr 0.01384
Train [56][2950/3239]	Time 0.239 (1.152)	Data Time 0.001 (0.676)	Loss 2.5820 (2.6961)	Entropy 0.63064 (0.62930)	Top-1 acc 58.594 (58.955)	Top-5 acc 82.812 (80.535)	lr 0.01384
Train [56][2960/3239]	Time 0.286 (1.155)	Data Time 0.003 (0.679)	Loss 2.5695 (2.6961)	Entropy 0.63084 (0.62931)	Top-1 acc 60.938 (58.956)	Top-5 acc 84.766 (80.535)	lr 0.01383
Train [56][2970/3239]	Time 0.233 (1.153)	Data Time 0.001 (0.677)	Loss 2.8029 (2.6963)	Entropy 0.63084 (0.62931)	Top-1 acc 55.469 (58.950)	Top-5 acc 79.688 (80.532)	lr 0.01383
Train [56][2980/3239]	Time 0.229 (1.154)	Data Time 0.001 (0.678)	Loss 3.1520 (2.6964)	Entropy 0.63069 (0.62932)	Top-1 acc 50.000 (58.951)	Top-5 acc 75.391 (80.529)	lr 0.01383
Train [56][2990/3239]	Time 0.325 (1.158)	Data Time 0.001 (0.683)	Loss 2.5429 (2.6963)	Entropy 0.63099 (0.62932)	Top-1 acc 62.891 (58.955)	Top-5 acc 85.156 (80.534)	lr 0.01383
Train [56][3000/3239]	Time 0.240 (1.156)	Data Time 0.001 (0.680)	Loss 2.7510 (2.6965)	Entropy 0.63133 (0.62933)	Top-1 acc 56.641 (58.949)	Top-5 acc 80.469 (80.530)	lr 0.01383
Train [56][3010/3239]	Time 0.269 (1.157)	Data Time 0.001 (0.682)	Loss 2.5293 (2.6963)	Entropy 0.63164 (0.62934)	Top-1 acc 61.719 (58.952)	Top-5 acc 84.375 (80.533)	lr 0.01383
Train [56][3020/3239]	Time 0.227 (1.161)	Data Time 0.001 (0.686)	Loss 2.9197 (2.6965)	Entropy 0.63146 (0.62934)	Top-1 acc 55.469 (58.947)	Top-5 acc 78.516 (80.530)	lr 0.01383
Train [56][3030/3239]	Time 0.237 (1.159)	Data Time 0.001 (0.684)	Loss 2.9639 (2.6965)	Entropy 0.63162 (0.62935)	Top-1 acc 51.953 (58.946)	Top-5 acc 77.344 (80.532)	lr 0.01383
Train [56][3040/3239]	Time 0.234 (1.159)	Data Time 0.001 (0.684)	Loss 2.7612 (2.6966)	Entropy 0.63142 (0.62936)	Top-1 acc 54.688 (58.942)	Top-5 acc 80.469 (80.531)	lr 0.01383
Train [56][3050/3239]	Time 0.229 (1.165)	Data Time 0.001 (0.690)	Loss 2.7098 (2.6966)	Entropy 0.63132 (0.62937)	Top-1 acc 60.938 (58.944)	Top-5 acc 81.641 (80.531)	lr 0.01383
Train [56][3060/3239]	Time 0.379 (1.162)	Data Time 0.001 (0.688)	Loss 2.6003 (2.6964)	Entropy 0.63141 (0.62937)	Top-1 acc 58.984 (58.946)	Top-5 acc 82.422 (80.534)	lr 0.01382
Train [56][3070/3239]	Time 0.243 (1.164)	Data Time 0.001 (0.690)	Loss 2.6951 (2.6965)	Entropy 0.63140 (0.62938)	Top-1 acc 58.203 (58.944)	Top-5 acc 80.078 (80.533)	lr 0.01382
Train [56][3080/3239]	Time 0.236 (1.161)	Data Time 0.002 (0.687)	Loss 2.6225 (2.6965)	Entropy 0.63161 (0.62939)	Top-1 acc 61.328 (58.944)	Top-5 acc 81.641 (80.536)	lr 0.01382
Train [56][3090/3239]	Time 0.233 (1.167)	Data Time 0.001 (0.693)	Loss 2.6339 (2.6968)	Entropy 0.63181 (0.62939)	Top-1 acc 60.156 (58.936)	Top-5 acc 78.906 (80.530)	lr 0.01382
Train [56][3100/3239]	Time 5.153 (1.168)	Data Time 4.918 (0.694)	Loss 2.5334 (2.6968)	Entropy 0.63211 (0.62940)	Top-1 acc 64.062 (58.939)	Top-5 acc 82.812 (80.528)	lr 0.01382
Train [56][3110/3239]	Time 0.227 (1.166)	Data Time 0.001 (0.692)	Loss 2.5827 (2.6968)	Entropy 0.63182 (0.62941)	Top-1 acc 59.766 (58.935)	Top-5 acc 82.422 (80.529)	lr 0.01382
Train [56][3120/3239]	Time 0.236 (1.171)	Data Time 0.001 (0.698)	Loss 2.5654 (2.6969)	Entropy 0.63167 (0.62942)	Top-1 acc 58.203 (58.931)	Top-5 acc 82.422 (80.525)	lr 0.01382
Train [56][3130/3239]	Time 0.234 (1.169)	Data Time 0.001 (0.696)	Loss 2.8412 (2.6969)	Entropy 0.63149 (0.62942)	Top-1 acc 55.469 (58.931)	Top-5 acc 75.781 (80.524)	lr 0.01382
Train [56][3140/3239]	Time 0.232 (1.169)	Data Time 0.001 (0.696)	Loss 2.8055 (2.6970)	Entropy 0.63153 (0.62943)	Top-1 acc 55.859 (58.929)	Top-5 acc 78.125 (80.525)	lr 0.01382
Train [56][3150/3239]	Time 0.241 (1.170)	Data Time 0.001 (0.698)	Loss 2.7971 (2.6969)	Entropy 0.63147 (0.62944)	Top-1 acc 59.375 (58.933)	Top-5 acc 77.734 (80.525)	lr 0.01382
Train [56][3160/3239]	Time 0.227 (1.171)	Data Time 0.001 (0.699)	Loss 2.7739 (2.6971)	Entropy 0.63112 (0.62944)	Top-1 acc 55.859 (58.929)	Top-5 acc 80.859 (80.521)	lr 0.01381
Train [56][3170/3239]	Time 0.226 (1.170)	Data Time 0.001 (0.698)	Loss 2.7105 (2.6971)	Entropy 0.63144 (0.62945)	Top-1 acc 57.422 (58.929)	Top-5 acc 80.859 (80.521)	lr 0.01381
Train [56][3180/3239]	Time 0.232 (1.171)	Data Time 0.000 (0.699)	Loss 2.9256 (2.6972)	Entropy 0.63157 (0.62945)	Top-1 acc 55.078 (58.925)	Top-5 acc 73.438 (80.518)	lr 0.01381
Train [56][3190/3239]	Time 0.232 (1.174)	Data Time 0.000 (0.702)	Loss 2.7325 (2.6972)	Entropy 0.63149 (0.62946)	Top-1 acc 58.594 (58.922)	Top-5 acc 81.641 (80.519)	lr 0.01381
Train [56][3200/3239]	Time 0.229 (1.171)	Data Time 0.000 (0.700)	Loss 2.6847 (2.6973)	Entropy 0.63146 (0.62947)	Top-1 acc 60.547 (58.924)	Top-5 acc 79.297 (80.517)	lr 0.01381
Train [56][3210/3239]	Time 0.229 (1.180)	Data Time 0.000 (0.697)	Loss 2.8189 (2.6975)	Entropy 0.63152 (0.62947)	Top-1 acc 55.469 (58.918)	Top-5 acc 79.297 (80.515)	lr 0.01381
Train [56][3220/3239]	Time 0.328 (1.177)	Data Time 0.000 (0.695)	Loss 2.7882 (2.6975)	Entropy 0.63135 (0.62948)	Top-1 acc 59.375 (58.916)	Top-5 acc 78.906 (80.516)	lr 0.01381
Train [56][3230/3239]	Time 0.230 (1.175)	Data Time 0.000 (0.693)	Loss 2.7081 (2.6974)	Entropy 0.63124 (0.62949)	Top-1 acc 60.156 (58.919)	Top-5 acc 78.906 (80.518)	lr 0.01381
Train [56][3239/3239]	Time 0.868 (1.173)	Data Time 0.000 (0.691)	Loss 2.8312 (2.6974)	Entropy 0.63101 (0.62949)	Top-1 acc 53.086 (58.920)	Top-5 acc 80.247 (80.520)	lr 0.01381
==========Valid [56/120]	loss 1.448	top-1 acc 66.748 (66.748)	top-5 acc 86.813	Train top-1 58.920	top-5 80.520	Entropy 0.63101	Latency-None: 0.000ms	Flops: 538.40M
Train [57][0/3239]	Time 45.445 (45.445)	Data Time 43.803 (43.803)	Loss 2.6443 (2.6443)	Entropy 0.63056 (0.63056)	Top-1 acc 58.984 (58.984)	Top-5 acc 81.641 (81.641)	lr 0.01381
Train [57][10/3239]	Time 0.245 (4.786)	Data Time 0.001 (4.151)	Loss 2.8703 (2.7303)	Entropy 0.63051 (0.63058)	Top-1 acc 57.812 (57.741)	Top-5 acc 76.953 (79.368)	lr 0.01381
Train [57][20/3239]	Time 0.228 (2.697)	Data Time 0.002 (2.175)	Loss 2.5784 (2.6961)	Entropy 0.63065 (0.63058)	Top-1 acc 57.031 (58.333)	Top-5 acc 85.547 (80.264)	lr 0.01380
Train [57][30/3239]	Time 0.249 (1.965)	Data Time 0.001 (1.474)	Loss 2.6785 (2.6856)	Entropy 0.63039 (0.63057)	Top-1 acc 55.859 (58.569)	Top-5 acc 78.906 (80.507)	lr 0.01380
Train [57][40/3239]	Time 0.258 (1.781)	Data Time 0.001 (1.284)	Loss 2.5863 (2.6661)	Entropy 0.63040 (0.63054)	Top-1 acc 57.422 (58.946)	Top-5 acc 83.984 (81.050)	lr 0.01380
Train [57][50/3239]	Time 0.327 (1.516)	Data Time 0.001 (1.032)	Loss 2.4815 (2.6761)	Entropy 0.63025 (0.63050)	Top-1 acc 66.797 (59.015)	Top-5 acc 87.109 (80.836)	lr 0.01380
Train [57][60/3239]	Time 0.243 (1.333)	Data Time 0.001 (0.863)	Loss 2.7425 (2.6758)	Entropy 0.63040 (0.63046)	Top-1 acc 58.203 (59.036)	Top-5 acc 78.516 (80.815)	lr 0.01380
Train [57][70/3239]	Time 0.243 (1.335)	Data Time 0.001 (0.869)	Loss 2.8234 (2.6765)	Entropy 0.62996 (0.63046)	Top-1 acc 56.250 (59.056)	Top-5 acc 77.734 (80.788)	lr 0.01380
Train [57][80/3239]	Time 0.251 (1.223)	Data Time 0.001 (0.762)	Loss 2.7220 (2.6868)	Entropy 0.62995 (0.63039)	Top-1 acc 59.375 (58.898)	Top-5 acc 78.906 (80.618)	lr 0.01380
Train [57][90/3239]	Time 0.239 (1.134)	Data Time 0.001 (0.678)	Loss 2.7605 (2.6842)	Entropy 0.62976 (0.63035)	Top-1 acc 60.938 (59.002)	Top-5 acc 76.953 (80.713)	lr 0.01380
Train [57][100/3239]	Time 0.247 (1.127)	Data Time 0.001 (0.674)	Loss 2.7201 (2.6840)	Entropy 0.62979 (0.63030)	Top-1 acc 58.203 (59.008)	Top-5 acc 81.641 (80.840)	lr 0.01380
Train [57][110/3239]	Time 0.240 (1.064)	Data Time 0.001 (0.613)	Loss 2.6376 (2.6845)	Entropy 0.62989 (0.63026)	Top-1 acc 62.500 (59.058)	Top-5 acc 82.422 (80.842)	lr 0.01380
Train [57][120/3239]	Time 0.340 (1.016)	Data Time 0.001 (0.563)	Loss 2.7502 (2.6845)	Entropy 0.62983 (0.63023)	Top-1 acc 60.938 (59.049)	Top-5 acc 78.125 (80.827)	lr 0.01379
Train [57][130/3239]	Time 0.234 (1.022)	Data Time 0.001 (0.572)	Loss 2.8173 (2.6852)	Entropy 0.62982 (0.63020)	Top-1 acc 58.203 (59.038)	Top-5 acc 80.078 (80.862)	lr 0.01379
Train [57][140/3239]	Time 0.236 (0.981)	Data Time 0.001 (0.534)	Loss 2.8271 (2.6819)	Entropy 0.62975 (0.63017)	Top-1 acc 55.469 (59.181)	Top-5 acc 78.125 (80.868)	lr 0.01379
Train [57][150/3239]	Time 0.225 (0.943)	Data Time 0.001 (0.498)	Loss 2.6484 (2.6845)	Entropy 0.62949 (0.63014)	Top-1 acc 60.156 (59.083)	Top-5 acc 82.422 (80.870)	lr 0.01379
Train [57][160/3239]	Time 3.681 (0.934)	Data Time 3.371 (0.488)	Loss 2.6610 (2.6846)	Entropy 0.62938 (0.63009)	Top-1 acc 59.766 (59.081)	Top-5 acc 82.031 (80.835)	lr 0.01379
Train [57][170/3239]	Time 0.233 (0.935)	Data Time 0.001 (0.491)	Loss 2.8082 (2.6818)	Entropy 0.62933 (0.63005)	Top-1 acc 58.203 (59.192)	Top-5 acc 80.469 (80.882)	lr 0.01379
Train [57][180/3239]	Time 0.231 (0.906)	Data Time 0.001 (0.464)	Loss 2.5164 (2.6755)	Entropy 0.62930 (0.63000)	Top-1 acc 63.672 (59.340)	Top-5 acc 82.422 (80.954)	lr 0.01379
Train [57][190/3239]	Time 0.246 (0.882)	Data Time 0.001 (0.439)	Loss 2.4577 (2.6755)	Entropy 0.62926 (0.62997)	Top-1 acc 65.234 (59.338)	Top-5 acc 83.984 (80.972)	lr 0.01379
Train [57][200/3239]	Time 0.245 (0.904)	Data Time 0.001 (0.462)	Loss 2.4915 (2.6762)	Entropy 0.62914 (0.62993)	Top-1 acc 61.328 (59.305)	Top-5 acc 82.422 (80.953)	lr 0.01379
Train [57][210/3239]	Time 0.323 (0.881)	Data Time 0.001 (0.441)	Loss 2.4771 (2.6755)	Entropy 0.62905 (0.62989)	Top-1 acc 66.406 (59.331)	Top-5 acc 83.984 (80.987)	lr 0.01379
Train [57][220/3239]	Time 0.222 (0.860)	Data Time 0.001 (0.421)	Loss 2.8263 (2.6754)	Entropy 0.62871 (0.62985)	Top-1 acc 56.250 (59.352)	Top-5 acc 75.000 (80.985)	lr 0.01378
Train [57][230/3239]	Time 0.230 (0.883)	Data Time 0.001 (0.445)	Loss 2.6710 (2.6753)	Entropy 0.62871 (0.62980)	Top-1 acc 60.547 (59.367)	Top-5 acc 79.297 (80.979)	lr 0.01378
Train [57][240/3239]	Time 0.276 (0.864)	Data Time 0.001 (0.426)	Loss 2.5132 (2.6760)	Entropy 0.62884 (0.62975)	Top-1 acc 60.156 (59.313)	Top-5 acc 83.984 (80.961)	lr 0.01378
Train [57][250/3239]	Time 0.240 (0.847)	Data Time 0.001 (0.409)	Loss 2.5800 (2.6764)	Entropy 0.62875 (0.62971)	Top-1 acc 61.719 (59.319)	Top-5 acc 84.375 (80.951)	lr 0.01378
Train [57][260/3239]	Time 0.235 (0.852)	Data Time 0.001 (0.414)	Loss 2.7263 (2.6766)	Entropy 0.62854 (0.62968)	Top-1 acc 57.422 (59.317)	Top-5 acc 79.688 (80.964)	lr 0.01378
Train [57][270/3239]	Time 0.242 (0.835)	Data Time 0.001 (0.399)	Loss 2.7915 (2.6794)	Entropy 0.62839 (0.62963)	Top-1 acc 59.766 (59.273)	Top-5 acc 78.906 (80.906)	lr 0.01378
Train [57][280/3239]	Time 0.315 (0.821)	Data Time 0.001 (0.385)	Loss 2.9403 (2.6812)	Entropy 0.62851 (0.62959)	Top-1 acc 48.828 (59.230)	Top-5 acc 75.391 (80.852)	lr 0.01378
Train [57][290/3239]	Time 7.048 (0.832)	Data Time 6.800 (0.395)	Loss 2.5461 (2.6796)	Entropy 0.62854 (0.62955)	Top-1 acc 59.375 (59.230)	Top-5 acc 84.766 (80.892)	lr 0.01378
Train [57][300/3239]	Time 0.250 (0.818)	Data Time 0.002 (0.382)	Loss 2.5945 (2.6791)	Entropy 0.62842 (0.62951)	Top-1 acc 61.328 (59.256)	Top-5 acc 82.031 (80.893)	lr 0.01378
Train [57][310/3239]	Time 0.225 (0.805)	Data Time 0.001 (0.370)	Loss 2.6017 (2.6791)	Entropy 0.62860 (0.62948)	Top-1 acc 62.109 (59.298)	Top-5 acc 82.422 (80.891)	lr 0.01378
Train [57][320/3239]	Time 0.319 (0.794)	Data Time 0.003 (0.358)	Loss 2.6912 (2.6804)	Entropy 0.62823 (0.62945)	Top-1 acc 59.375 (59.278)	Top-5 acc 80.469 (80.856)	lr 0.01377
Train [57][330/3239]	Time 0.248 (0.795)	Data Time 0.001 (0.359)	Loss 2.5972 (2.6817)	Entropy 0.62841 (0.62941)	Top-1 acc 62.891 (59.263)	Top-5 acc 82.812 (80.832)	lr 0.01377
Train [57][340/3239]	Time 0.234 (0.784)	Data Time 0.001 (0.348)	Loss 2.7485 (2.6825)	Entropy 0.62787 (0.62938)	Top-1 acc 61.328 (59.230)	Top-5 acc 80.859 (80.838)	lr 0.01377
Train [57][350/3239]	Time 0.243 (0.774)	Data Time 0.001 (0.339)	Loss 2.7401 (2.6820)	Entropy 0.62785 (0.62934)	Top-1 acc 56.250 (59.264)	Top-5 acc 79.297 (80.857)	lr 0.01377
Train [57][360/3239]	Time 0.235 (0.786)	Data Time 0.001 (0.351)	Loss 2.6479 (2.6804)	Entropy 0.62781 (0.62929)	Top-1 acc 62.891 (59.288)	Top-5 acc 82.422 (80.886)	lr 0.01377
Train [57][370/3239]	Time 0.265 (0.776)	Data Time 0.001 (0.341)	Loss 2.6211 (2.6809)	Entropy 0.62771 (0.62925)	Top-1 acc 57.812 (59.229)	Top-5 acc 83.203 (80.880)	lr 0.01377
Train [57][380/3239]	Time 0.272 (0.766)	Data Time 0.001 (0.333)	Loss 2.6070 (2.6819)	Entropy 0.62786 (0.62921)	Top-1 acc 62.109 (59.214)	Top-5 acc 82.812 (80.854)	lr 0.01377
Train [57][390/3239]	Time 0.267 (0.781)	Data Time 0.001 (0.347)	Loss 2.6586 (2.6809)	Entropy 0.62757 (0.62917)	Top-1 acc 62.891 (59.225)	Top-5 acc 81.250 (80.890)	lr 0.01377
Train [57][400/3239]	Time 0.252 (0.772)	Data Time 0.001 (0.338)	Loss 2.6760 (2.6813)	Entropy 0.62767 (0.62914)	Top-1 acc 57.422 (59.213)	Top-5 acc 82.422 (80.898)	lr 0.01377
Train [57][410/3239]	Time 0.226 (0.763)	Data Time 0.001 (0.330)	Loss 2.5952 (2.6809)	Entropy 0.62755 (0.62910)	Top-1 acc 64.062 (59.223)	Top-5 acc 82.812 (80.879)	lr 0.01377
Train [57][420/3239]	Time 1.648 (0.770)	Data Time 1.361 (0.337)	Loss 2.6326 (2.6801)	Entropy 0.62775 (0.62906)	Top-1 acc 57.031 (59.201)	Top-5 acc 82.031 (80.892)	lr 0.01376
Train [57][430/3239]	Time 0.533 (0.762)	Data Time 0.305 (0.330)	Loss 2.6438 (2.6811)	Entropy 0.62774 (0.62903)	Top-1 acc 61.719 (59.176)	Top-5 acc 78.906 (80.877)	lr 0.01376
Train [57][440/3239]	Time 0.358 (0.754)	Data Time 0.001 (0.323)	Loss 2.8047 (2.6825)	Entropy 0.62744 (0.62900)	Top-1 acc 56.641 (59.138)	Top-5 acc 79.297 (80.869)	lr 0.01376
Train [57][450/3239]	Time 4.873 (0.762)	Data Time 4.602 (0.331)	Loss 2.8242 (2.6825)	Entropy 0.62740 (0.62897)	Top-1 acc 55.469 (59.139)	Top-5 acc 76.562 (80.861)	lr 0.01376
Train [57][460/3239]	Time 0.231 (0.759)	Data Time 0.001 (0.328)	Loss 2.6005 (2.6823)	Entropy 0.62726 (0.62893)	Top-1 acc 62.109 (59.153)	Top-5 acc 82.422 (80.875)	lr 0.01376
Train [57][470/3239]	Time 0.262 (0.752)	Data Time 0.001 (0.321)	Loss 2.5117 (2.6820)	Entropy 0.62775 (0.62890)	Top-1 acc 64.453 (59.164)	Top-5 acc 84.375 (80.888)	lr 0.01376
Train [57][480/3239]	Time 1.762 (0.748)	Data Time 1.516 (0.318)	Loss 2.6981 (2.6806)	Entropy 0.62773 (0.62888)	Top-1 acc 57.812 (59.203)	Top-5 acc 80.859 (80.924)	lr 0.01376
Train [57][490/3239]	Time 0.248 (0.762)	Data Time 0.001 (0.331)	Loss 2.6495 (2.6803)	Entropy 0.62766 (0.62885)	Top-1 acc 59.375 (59.213)	Top-5 acc 82.031 (80.918)	lr 0.01376
Train [57][500/3239]	Time 0.220 (0.754)	Data Time 0.001 (0.325)	Loss 2.7935 (2.6808)	Entropy 0.62765 (0.62883)	Top-1 acc 56.250 (59.193)	Top-5 acc 79.297 (80.912)	lr 0.01376
Train [57][510/3239]	Time 0.338 (0.748)	Data Time 0.001 (0.318)	Loss 2.7675 (2.6817)	Entropy 0.62785 (0.62881)	Top-1 acc 57.812 (59.169)	Top-5 acc 80.078 (80.898)	lr 0.01376
Train [57][520/3239]	Time 0.244 (0.758)	Data Time 0.001 (0.328)	Loss 2.5871 (2.6804)	Entropy 0.62783 (0.62879)	Top-1 acc 60.938 (59.197)	Top-5 acc 82.031 (80.913)	lr 0.01375
Train [57][530/3239]	Time 0.269 (0.754)	Data Time 0.003 (0.325)	Loss 2.7703 (2.6812)	Entropy 0.62763 (0.62877)	Top-1 acc 57.031 (59.169)	Top-5 acc 77.734 (80.896)	lr 0.01375
Train [57][540/3239]	Time 0.253 (0.748)	Data Time 0.002 (0.319)	Loss 2.4510 (2.6813)	Entropy 0.62758 (0.62875)	Top-1 acc 65.625 (59.180)	Top-5 acc 86.719 (80.897)	lr 0.01375
Train [57][550/3239]	Time 0.232 (0.754)	Data Time 0.001 (0.325)	Loss 2.6959 (2.6801)	Entropy 0.62745 (0.62873)	Top-1 acc 57.812 (59.211)	Top-5 acc 82.031 (80.912)	lr 0.01375
Train [57][560/3239]	Time 0.243 (0.751)	Data Time 0.002 (0.322)	Loss 2.6821 (2.6794)	Entropy 0.62734 (0.62870)	Top-1 acc 61.328 (59.235)	Top-5 acc 83.203 (80.927)	lr 0.01375
Train [57][570/3239]	Time 0.249 (0.746)	Data Time 0.001 (0.317)	Loss 2.6048 (2.6791)	Entropy 0.62763 (0.62868)	Top-1 acc 58.594 (59.241)	Top-5 acc 80.859 (80.920)	lr 0.01375
Train [57][580/3239]	Time 0.255 (0.748)	Data Time 0.002 (0.319)	Loss 2.5192 (2.6785)	Entropy 0.62749 (0.62866)	Top-1 acc 64.062 (59.265)	Top-5 acc 83.203 (80.935)	lr 0.01375
Train [57][590/3239]	Time 0.248 (0.743)	Data Time 0.001 (0.313)	Loss 2.6540 (2.6796)	Entropy 0.62762 (0.62864)	Top-1 acc 58.594 (59.230)	Top-5 acc 84.375 (80.920)	lr 0.01375
Train [57][600/3239]	Time 0.333 (0.738)	Data Time 0.001 (0.308)	Loss 2.4645 (2.6783)	Entropy 0.62785 (0.62863)	Top-1 acc 64.844 (59.249)	Top-5 acc 86.719 (80.935)	lr 0.01375
Train [57][610/3239]	Time 0.264 (0.733)	Data Time 0.001 (0.303)	Loss 2.5839 (2.6782)	Entropy 0.62796 (0.62861)	Top-1 acc 59.766 (59.244)	Top-5 acc 84.375 (80.928)	lr 0.01375
Train [57][620/3239]	Time 0.346 (0.784)	Data Time 0.005 (0.298)	Loss 2.6659 (2.6792)	Entropy 0.62762 (0.62860)	Top-1 acc 60.547 (59.215)	Top-5 acc 83.203 (80.916)	lr 0.01374
Train [57][630/3239]	Time 0.253 (0.780)	Data Time 0.003 (0.294)	Loss 2.6272 (2.6800)	Entropy 0.62779 (0.62859)	Top-1 acc 61.328 (59.191)	Top-5 acc 82.422 (80.910)	lr 0.01374
Train [57][640/3239]	Time 0.247 (0.774)	Data Time 0.002 (0.289)	Loss 2.4837 (2.6788)	Entropy 0.62799 (0.62857)	Top-1 acc 67.188 (59.227)	Top-5 acc 83.594 (80.939)	lr 0.01374
Train [57][650/3239]	Time 0.244 (0.769)	Data Time 0.001 (0.285)	Loss 2.6429 (2.6792)	Entropy 0.62813 (0.62857)	Top-1 acc 60.938 (59.223)	Top-5 acc 80.859 (80.931)	lr 0.01374
Train [57][660/3239]	Time 0.270 (0.764)	Data Time 0.001 (0.280)	Loss 2.5511 (2.6785)	Entropy 0.62834 (0.62856)	Top-1 acc 58.203 (59.238)	Top-5 acc 83.203 (80.940)	lr 0.01374
Train [57][670/3239]	Time 0.360 (0.759)	Data Time 0.001 (0.276)	Loss 2.5042 (2.6791)	Entropy 0.62775 (0.62855)	Top-1 acc 62.500 (59.210)	Top-5 acc 83.594 (80.924)	lr 0.01374
Train [57][680/3239]	Time 0.236 (0.754)	Data Time 0.001 (0.272)	Loss 2.8504 (2.6793)	Entropy 0.62777 (0.62854)	Top-1 acc 53.516 (59.211)	Top-5 acc 75.781 (80.908)	lr 0.01374
Train [57][690/3239]	Time 0.242 (0.750)	Data Time 0.001 (0.268)	Loss 2.6022 (2.6793)	Entropy 0.62734 (0.62853)	Top-1 acc 62.891 (59.201)	Top-5 acc 80.078 (80.909)	lr 0.01374
Train [57][700/3239]	Time 0.239 (0.745)	Data Time 0.001 (0.265)	Loss 2.9559 (2.6797)	Entropy 0.62700 (0.62851)	Top-1 acc 52.734 (59.191)	Top-5 acc 77.344 (80.902)	lr 0.01374
Train [57][710/3239]	Time 0.264 (0.741)	Data Time 0.001 (0.261)	Loss 2.4016 (2.6791)	Entropy 0.62712 (0.62849)	Top-1 acc 64.844 (59.201)	Top-5 acc 85.938 (80.913)	lr 0.01374
Train [57][720/3239]	Time 0.233 (0.743)	Data Time 0.001 (0.263)	Loss 2.6525 (2.6786)	Entropy 0.62712 (0.62847)	Top-1 acc 57.422 (59.206)	Top-5 acc 80.859 (80.925)	lr 0.01373
Train [57][730/3239]	Time 0.254 (0.745)	Data Time 0.002 (0.266)	Loss 2.6989 (2.6783)	Entropy 0.62732 (0.62845)	Top-1 acc 58.984 (59.223)	Top-5 acc 79.297 (80.938)	lr 0.01373
Train [57][740/3239]	Time 0.242 (0.741)	Data Time 0.001 (0.263)	Loss 2.5095 (2.6776)	Entropy 0.62739 (0.62844)	Top-1 acc 63.672 (59.237)	Top-5 acc 84.766 (80.946)	lr 0.01373
Train [57][750/3239]	Time 0.248 (0.740)	Data Time 0.001 (0.263)	Loss 2.7505 (2.6787)	Entropy 0.62714 (0.62842)	Top-1 acc 55.078 (59.211)	Top-5 acc 79.297 (80.917)	lr 0.01373
Train [57][760/3239]	Time 0.325 (0.744)	Data Time 0.001 (0.267)	Loss 2.6495 (2.6784)	Entropy 0.62727 (0.62841)	Top-1 acc 60.547 (59.221)	Top-5 acc 81.250 (80.913)	lr 0.01373
Train [57][770/3239]	Time 0.255 (0.746)	Data Time 0.001 (0.269)	Loss 2.8917 (2.6781)	Entropy 0.62696 (0.62839)	Top-1 acc 54.688 (59.227)	Top-5 acc 76.953 (80.920)	lr 0.01373
Train [57][780/3239]	Time 0.249 (0.742)	Data Time 0.001 (0.266)	Loss 2.5743 (2.6777)	Entropy 0.62702 (0.62837)	Top-1 acc 65.625 (59.245)	Top-5 acc 82.812 (80.935)	lr 0.01373
Train [57][790/3239]	Time 0.229 (0.743)	Data Time 0.002 (0.267)	Loss 2.7545 (2.6773)	Entropy 0.62738 (0.62836)	Top-1 acc 58.984 (59.255)	Top-5 acc 76.953 (80.938)	lr 0.01373
Train [57][800/3239]	Time 0.233 (0.746)	Data Time 0.001 (0.271)	Loss 2.8824 (2.6775)	Entropy 0.62744 (0.62834)	Top-1 acc 53.906 (59.252)	Top-5 acc 78.125 (80.941)	lr 0.01373
Train [57][810/3239]	Time 0.286 (0.743)	Data Time 0.001 (0.268)	Loss 2.5964 (2.6788)	Entropy 0.62714 (0.62833)	Top-1 acc 57.812 (59.215)	Top-5 acc 81.250 (80.910)	lr 0.01373
Train [57][820/3239]	Time 0.253 (0.741)	Data Time 0.001 (0.266)	Loss 2.6513 (2.6785)	Entropy 0.62728 (0.62832)	Top-1 acc 61.719 (59.211)	Top-5 acc 80.078 (80.916)	lr 0.01372
Train [57][830/3239]	Time 0.731 (0.738)	Data Time 0.375 (0.264)	Loss 2.6681 (2.6783)	Entropy 0.62757 (0.62831)	Top-1 acc 62.500 (59.217)	Top-5 acc 80.469 (80.918)	lr 0.01372
Train [57][840/3239]	Time 0.229 (0.735)	Data Time 0.001 (0.261)	Loss 2.6001 (2.6779)	Entropy 0.62716 (0.62829)	Top-1 acc 61.719 (59.226)	Top-5 acc 83.203 (80.935)	lr 0.01372
Train [57][850/3239]	Time 0.274 (0.731)	Data Time 0.001 (0.258)	Loss 2.5262 (2.6784)	Entropy 0.62674 (0.62828)	Top-1 acc 63.672 (59.221)	Top-5 acc 83.203 (80.917)	lr 0.01372
Train [57][860/3239]	Time 0.221 (0.728)	Data Time 0.001 (0.255)	Loss 2.7294 (2.6793)	Entropy 0.62673 (0.62826)	Top-1 acc 58.594 (59.204)	Top-5 acc 78.125 (80.900)	lr 0.01372
Train [57][870/3239]	Time 0.263 (0.726)	Data Time 0.001 (0.253)	Loss 2.6886 (2.6791)	Entropy 0.62665 (0.62824)	Top-1 acc 61.328 (59.208)	Top-5 acc 81.250 (80.906)	lr 0.01372
Train [57][880/3239]	Time 0.273 (0.724)	Data Time 0.001 (0.250)	Loss 2.5146 (2.6790)	Entropy 0.62662 (0.62822)	Top-1 acc 62.500 (59.205)	Top-5 acc 85.156 (80.911)	lr 0.01372
Train [57][890/3239]	Time 0.258 (0.721)	Data Time 0.001 (0.247)	Loss 2.6176 (2.6794)	Entropy 0.62644 (0.62821)	Top-1 acc 59.766 (59.194)	Top-5 acc 83.594 (80.903)	lr 0.01372
Train [57][900/3239]	Time 0.243 (0.719)	Data Time 0.001 (0.246)	Loss 2.7177 (2.6795)	Entropy 0.62658 (0.62819)	Top-1 acc 59.375 (59.194)	Top-5 acc 80.078 (80.901)	lr 0.01372
Train [57][910/3239]	Time 0.280 (0.716)	Data Time 0.001 (0.243)	Loss 2.8889 (2.6798)	Entropy 0.62656 (0.62817)	Top-1 acc 56.250 (59.197)	Top-5 acc 75.391 (80.897)	lr 0.01372
Train [57][920/3239]	Time 0.353 (0.713)	Data Time 0.001 (0.240)	Loss 2.6380 (2.6799)	Entropy 0.62662 (0.62815)	Top-1 acc 57.812 (59.191)	Top-5 acc 83.203 (80.896)	lr 0.01371
Train [57][930/3239]	Time 0.236 (0.710)	Data Time 0.001 (0.238)	Loss 2.7615 (2.6797)	Entropy 0.62647 (0.62813)	Top-1 acc 55.469 (59.199)	Top-5 acc 81.641 (80.898)	lr 0.01371
Train [57][940/3239]	Time 0.242 (0.707)	Data Time 0.001 (0.235)	Loss 2.8823 (2.6798)	Entropy 0.62651 (0.62812)	Top-1 acc 55.078 (59.206)	Top-5 acc 77.734 (80.894)	lr 0.01371
Train [57][950/3239]	Time 0.236 (0.705)	Data Time 0.001 (0.233)	Loss 2.8400 (2.6800)	Entropy 0.62677 (0.62810)	Top-1 acc 52.734 (59.200)	Top-5 acc 77.734 (80.885)	lr 0.01371
Train [57][960/3239]	Time 0.289 (0.703)	Data Time 0.001 (0.231)	Loss 3.0433 (2.6803)	Entropy 0.62675 (0.62809)	Top-1 acc 53.125 (59.205)	Top-5 acc 73.047 (80.881)	lr 0.01371
Train [57][970/3239]	Time 0.239 (0.700)	Data Time 0.001 (0.228)	Loss 2.6220 (2.6801)	Entropy 0.62652 (0.62807)	Top-1 acc 59.766 (59.207)	Top-5 acc 82.422 (80.888)	lr 0.01371
Train [57][980/3239]	Time 0.238 (0.697)	Data Time 0.001 (0.226)	Loss 2.4983 (2.6799)	Entropy 0.62647 (0.62806)	Top-1 acc 60.547 (59.210)	Top-5 acc 83.203 (80.893)	lr 0.01371
Train [57][990/3239]	Time 0.339 (0.695)	Data Time 0.001 (0.224)	Loss 2.4877 (2.6794)	Entropy 0.62547 (0.62804)	Top-1 acc 62.109 (59.222)	Top-5 acc 85.156 (80.897)	lr 0.01371
Train [57][1000/3239]	Time 0.245 (0.692)	Data Time 0.001 (0.222)	Loss 2.7390 (2.6795)	Entropy 0.62553 (0.62801)	Top-1 acc 57.812 (59.223)	Top-5 acc 82.422 (80.893)	lr 0.01371
Train [57][1010/3239]	Time 0.246 (0.690)	Data Time 0.001 (0.220)	Loss 2.6628 (2.6798)	Entropy 0.62555 (0.62799)	Top-1 acc 60.156 (59.220)	Top-5 acc 82.422 (80.888)	lr 0.01371
Train [57][1020/3239]	Time 0.232 (0.687)	Data Time 0.001 (0.217)	Loss 2.6439 (2.6793)	Entropy 0.62538 (0.62796)	Top-1 acc 61.328 (59.230)	Top-5 acc 81.250 (80.899)	lr 0.01370
Train [57][1030/3239]	Time 0.233 (0.685)	Data Time 0.001 (0.215)	Loss 2.7883 (2.6792)	Entropy 0.62556 (0.62794)	Top-1 acc 55.859 (59.232)	Top-5 acc 80.078 (80.896)	lr 0.01370
Train [57][1040/3239]	Time 0.234 (0.683)	Data Time 0.001 (0.213)	Loss 2.7313 (2.6796)	Entropy 0.62568 (0.62792)	Top-1 acc 60.547 (59.219)	Top-5 acc 76.953 (80.891)	lr 0.01370
Train [57][1050/3239]	Time 0.268 (0.681)	Data Time 0.001 (0.211)	Loss 2.5784 (2.6800)	Entropy 0.62587 (0.62789)	Top-1 acc 59.766 (59.213)	Top-5 acc 82.812 (80.885)	lr 0.01370
Train [57][1060/3239]	Time 0.252 (0.679)	Data Time 0.001 (0.209)	Loss 2.6068 (2.6801)	Entropy 0.62607 (0.62788)	Top-1 acc 60.156 (59.218)	Top-5 acc 80.469 (80.873)	lr 0.01370
Train [57][1070/3239]	Time 0.243 (0.676)	Data Time 0.001 (0.207)	Loss 2.8828 (2.6805)	Entropy 0.62616 (0.62786)	Top-1 acc 55.469 (59.217)	Top-5 acc 75.000 (80.860)	lr 0.01370
Train [57][1080/3239]	Time 0.247 (0.678)	Data Time 0.001 (0.209)	Loss 2.8735 (2.6811)	Entropy 0.62639 (0.62785)	Top-1 acc 55.859 (59.207)	Top-5 acc 76.172 (80.849)	lr 0.01370
Train [57][1090/3239]	Time 0.291 (0.677)	Data Time 0.001 (0.209)	Loss 2.5827 (2.6811)	Entropy 0.62672 (0.62783)	Top-1 acc 60.156 (59.207)	Top-5 acc 82.422 (80.844)	lr 0.01370
Train [57][1100/3239]	Time 3.165 (0.678)	Data Time 2.898 (0.210)	Loss 2.5394 (2.6809)	Entropy 0.62634 (0.62782)	Top-1 acc 61.328 (59.222)	Top-5 acc 85.938 (80.851)	lr 0.01370
Train [57][1110/3239]	Time 0.242 (0.680)	Data Time 0.001 (0.212)	Loss 2.8371 (2.6807)	Entropy 0.62642 (0.62781)	Top-1 acc 55.078 (59.224)	Top-5 acc 76.953 (80.853)	lr 0.01370
Train [57][1120/3239]	Time 0.245 (0.677)	Data Time 0.001 (0.210)	Loss 2.6442 (2.6801)	Entropy 0.62644 (0.62780)	Top-1 acc 62.500 (59.239)	Top-5 acc 80.859 (80.870)	lr 0.01369
Train [57][1130/3239]	Time 0.256 (0.676)	Data Time 0.001 (0.209)	Loss 2.7619 (2.6799)	Entropy 0.62649 (0.62778)	Top-1 acc 59.766 (59.244)	Top-5 acc 80.078 (80.871)	lr 0.01369
Train [57][1140/3239]	Time 0.250 (0.680)	Data Time 0.001 (0.213)	Loss 2.7115 (2.6799)	Entropy 0.62660 (0.62777)	Top-1 acc 60.156 (59.245)	Top-5 acc 78.906 (80.867)	lr 0.01369
Train [57][1150/3239]	Time 0.345 (0.682)	Data Time 0.001 (0.215)	Loss 2.6075 (2.6798)	Entropy 0.62678 (0.62776)	Top-1 acc 60.547 (59.241)	Top-5 acc 82.422 (80.868)	lr 0.01369
Train [57][1160/3239]	Time 0.238 (0.680)	Data Time 0.001 (0.213)	Loss 2.7709 (2.6803)	Entropy 0.62667 (0.62775)	Top-1 acc 58.594 (59.235)	Top-5 acc 78.125 (80.858)	lr 0.01369
Train [57][1170/3239]	Time 0.241 (0.681)	Data Time 0.001 (0.214)	Loss 2.6578 (2.6799)	Entropy 0.62651 (0.62774)	Top-1 acc 64.844 (59.240)	Top-5 acc 81.250 (80.864)	lr 0.01369
Train [57][1180/3239]	Time 0.298 (0.682)	Data Time 0.002 (0.216)	Loss 2.6708 (2.6794)	Entropy 0.62666 (0.62773)	Top-1 acc 57.031 (59.246)	Top-5 acc 81.250 (80.882)	lr 0.01369
Train [57][1190/3239]	Time 0.242 (0.685)	Data Time 0.001 (0.219)	Loss 2.7930 (2.6794)	Entropy 0.62707 (0.62773)	Top-1 acc 60.156 (59.245)	Top-5 acc 75.781 (80.879)	lr 0.01369
Train [57][1200/3239]	Time 0.250 (0.683)	Data Time 0.001 (0.217)	Loss 2.5648 (2.6789)	Entropy 0.62726 (0.62772)	Top-1 acc 62.500 (59.254)	Top-5 acc 80.859 (80.892)	lr 0.01369
Train [57][1210/3239]	Time 0.298 (0.685)	Data Time 0.003 (0.219)	Loss 2.8812 (2.6788)	Entropy 0.62726 (0.62772)	Top-1 acc 53.125 (59.257)	Top-5 acc 77.734 (80.896)	lr 0.01369
Train [57][1220/3239]	Time 0.389 (0.688)	Data Time 0.001 (0.223)	Loss 2.7885 (2.6787)	Entropy 0.62719 (0.62771)	Top-1 acc 55.859 (59.262)	Top-5 acc 78.125 (80.897)	lr 0.01368
Train [57][1230/3239]	Time 0.264 (0.686)	Data Time 0.001 (0.221)	Loss 2.7249 (2.6787)	Entropy 0.62751 (0.62771)	Top-1 acc 57.031 (59.266)	Top-5 acc 79.688 (80.896)	lr 0.01368
Train [57][1240/3239]	Time 0.235 (0.685)	Data Time 0.001 (0.220)	Loss 2.5643 (2.6788)	Entropy 0.62765 (0.62771)	Top-1 acc 61.328 (59.258)	Top-5 acc 84.375 (80.898)	lr 0.01368
Train [57][1250/3239]	Time 0.240 (0.689)	Data Time 0.001 (0.224)	Loss 2.5206 (2.6783)	Entropy 0.62768 (0.62771)	Top-1 acc 60.156 (59.264)	Top-5 acc 83.594 (80.901)	lr 0.01368
Train [57][1260/3239]	Time 0.271 (0.687)	Data Time 0.001 (0.222)	Loss 2.7565 (2.6784)	Entropy 0.62787 (0.62771)	Top-1 acc 55.859 (59.259)	Top-5 acc 80.469 (80.906)	lr 0.01368
Train [57][1270/3239]	Time 0.237 (0.687)	Data Time 0.001 (0.223)	Loss 2.4840 (2.6785)	Entropy 0.62824 (0.62771)	Top-1 acc 62.109 (59.251)	Top-5 acc 85.938 (80.903)	lr 0.01368
Train [57][1280/3239]	Time 0.294 (0.714)	Data Time 0.002 (0.223)	Loss 2.6899 (2.6782)	Entropy 0.62836 (0.62771)	Top-1 acc 58.984 (59.259)	Top-5 acc 79.297 (80.909)	lr 0.01368
Train [57][1290/3239]	Time 0.238 (0.712)	Data Time 0.002 (0.221)	Loss 2.6668 (2.6782)	Entropy 0.62872 (0.62772)	Top-1 acc 60.938 (59.255)	Top-5 acc 82.812 (80.906)	lr 0.01368
Train [57][1300/3239]	Time 0.243 (0.709)	Data Time 0.001 (0.220)	Loss 2.5706 (2.6781)	Entropy 0.62870 (0.62773)	Top-1 acc 64.062 (59.261)	Top-5 acc 81.641 (80.909)	lr 0.01368
Train [57][1310/3239]	Time 0.362 (0.707)	Data Time 0.001 (0.218)	Loss 2.6458 (2.6780)	Entropy 0.62849 (0.62773)	Top-1 acc 62.500 (59.267)	Top-5 acc 81.250 (80.911)	lr 0.01367
Train [57][1320/3239]	Time 0.258 (0.705)	Data Time 0.001 (0.216)	Loss 2.8862 (2.6780)	Entropy 0.62876 (0.62774)	Top-1 acc 59.375 (59.269)	Top-5 acc 76.562 (80.907)	lr 0.01367
Train [57][1330/3239]	Time 0.257 (0.703)	Data Time 0.001 (0.215)	Loss 2.6270 (2.6787)	Entropy 0.62835 (0.62775)	Top-1 acc 59.375 (59.257)	Top-5 acc 81.250 (80.903)	lr 0.01367
Train [57][1340/3239]	Time 0.242 (0.701)	Data Time 0.001 (0.213)	Loss 2.5424 (2.6785)	Entropy 0.62798 (0.62775)	Top-1 acc 61.719 (59.263)	Top-5 acc 85.547 (80.908)	lr 0.01367
Train [57][1350/3239]	Time 0.248 (0.699)	Data Time 0.002 (0.212)	Loss 2.5689 (2.6783)	Entropy 0.62814 (0.62775)	Top-1 acc 61.719 (59.266)	Top-5 acc 82.422 (80.911)	lr 0.01367
Train [57][1360/3239]	Time 0.323 (0.698)	Data Time 0.001 (0.210)	Loss 2.5645 (2.6784)	Entropy 0.62812 (0.62776)	Top-1 acc 59.766 (59.259)	Top-5 acc 80.859 (80.907)	lr 0.01367
Train [57][1370/3239]	Time 0.233 (0.695)	Data Time 0.001 (0.209)	Loss 2.6191 (2.6784)	Entropy 0.62707 (0.62776)	Top-1 acc 61.328 (59.264)	Top-5 acc 80.859 (80.904)	lr 0.01367
Train [57][1380/3239]	Time 0.318 (0.700)	Data Time 0.001 (0.214)	Loss 2.7756 (2.6784)	Entropy 0.62703 (0.62775)	Top-1 acc 56.250 (59.267)	Top-5 acc 77.344 (80.900)	lr 0.01367
Train [57][1390/3239]	Time 0.231 (0.699)	Data Time 0.001 (0.213)	Loss 2.6915 (2.6789)	Entropy 0.62702 (0.62775)	Top-1 acc 61.328 (59.258)	Top-5 acc 80.078 (80.888)	lr 0.01367
Train [57][1400/3239]	Time 0.289 (0.697)	Data Time 0.001 (0.212)	Loss 2.8289 (2.6791)	Entropy 0.62677 (0.62774)	Top-1 acc 55.078 (59.255)	Top-5 acc 79.688 (80.885)	lr 0.01367
Train [57][1410/3239]	Time 0.284 (0.704)	Data Time 0.001 (0.219)	Loss 2.7799 (2.6789)	Entropy 0.62686 (0.62773)	Top-1 acc 56.250 (59.259)	Top-5 acc 78.125 (80.885)	lr 0.01366
Train [57][1420/3239]	Time 0.250 (0.702)	Data Time 0.001 (0.217)	Loss 2.5260 (2.6791)	Entropy 0.62716 (0.62773)	Top-1 acc 64.844 (59.252)	Top-5 acc 83.203 (80.876)	lr 0.01366
Train [57][1430/3239]	Time 0.318 (0.700)	Data Time 0.002 (0.216)	Loss 2.4946 (2.6786)	Entropy 0.62736 (0.62773)	Top-1 acc 63.672 (59.263)	Top-5 acc 84.375 (80.886)	lr 0.01366
Train [57][1440/3239]	Time 11.129 (0.707)	Data Time 10.815 (0.223)	Loss 2.6566 (2.6787)	Entropy 0.62758 (0.62772)	Top-1 acc 62.891 (59.266)	Top-5 acc 78.516 (80.886)	lr 0.01366
Train [57][1450/3239]	Time 0.262 (0.705)	Data Time 0.001 (0.221)	Loss 2.5801 (2.6788)	Entropy 0.62734 (0.62772)	Top-1 acc 63.281 (59.264)	Top-5 acc 82.422 (80.885)	lr 0.01366
Train [57][1460/3239]	Time 0.249 (0.704)	Data Time 0.001 (0.220)	Loss 2.6757 (2.6792)	Entropy 0.62737 (0.62772)	Top-1 acc 59.375 (59.259)	Top-5 acc 80.469 (80.875)	lr 0.01366
Train [57][1470/3239]	Time 0.371 (0.702)	Data Time 0.001 (0.219)	Loss 2.7443 (2.6793)	Entropy 0.62729 (0.62772)	Top-1 acc 55.859 (59.252)	Top-5 acc 80.078 (80.881)	lr 0.01366
Train [57][1480/3239]	Time 0.301 (0.707)	Data Time 0.001 (0.224)	Loss 2.6575 (2.6793)	Entropy 0.62707 (0.62771)	Top-1 acc 62.109 (59.255)	Top-5 acc 78.906 (80.885)	lr 0.01366
Train [57][1490/3239]	Time 0.247 (0.705)	Data Time 0.001 (0.222)	Loss 2.7493 (2.6794)	Entropy 0.62672 (0.62771)	Top-1 acc 54.297 (59.255)	Top-5 acc 83.594 (80.887)	lr 0.01366
Train [57][1500/3239]	Time 0.228 (0.703)	Data Time 0.001 (0.221)	Loss 2.5909 (2.6791)	Entropy 0.62644 (0.62770)	Top-1 acc 62.891 (59.258)	Top-5 acc 82.812 (80.894)	lr 0.01366
Train [57][1510/3239]	Time 0.263 (0.711)	Data Time 0.001 (0.229)	Loss 2.7055 (2.6794)	Entropy 0.62626 (0.62769)	Top-1 acc 56.641 (59.251)	Top-5 acc 82.422 (80.886)	lr 0.01365
Train [57][1520/3239]	Time 0.239 (0.709)	Data Time 0.001 (0.228)	Loss 2.6154 (2.6792)	Entropy 0.62634 (0.62768)	Top-1 acc 59.766 (59.260)	Top-5 acc 80.469 (80.889)	lr 0.01365
Train [57][1530/3239]	Time 0.249 (0.708)	Data Time 0.001 (0.226)	Loss 2.6960 (2.6792)	Entropy 0.62633 (0.62767)	Top-1 acc 57.812 (59.267)	Top-5 acc 80.859 (80.887)	lr 0.01365
Train [57][1540/3239]	Time 0.326 (0.713)	Data Time 0.001 (0.231)	Loss 2.7700 (2.6793)	Entropy 0.62681 (0.62767)	Top-1 acc 59.375 (59.262)	Top-5 acc 80.078 (80.883)	lr 0.01365
Train [57][1550/3239]	Time 0.229 (0.711)	Data Time 0.001 (0.230)	Loss 2.6821 (2.6792)	Entropy 0.62706 (0.62766)	Top-1 acc 57.422 (59.265)	Top-5 acc 78.906 (80.884)	lr 0.01365
Train [57][1560/3239]	Time 0.266 (0.709)	Data Time 0.002 (0.229)	Loss 2.7923 (2.6796)	Entropy 0.62702 (0.62766)	Top-1 acc 58.594 (59.254)	Top-5 acc 77.734 (80.878)	lr 0.01365
Train [57][1570/3239]	Time 0.253 (0.714)	Data Time 0.001 (0.233)	Loss 2.5190 (2.6793)	Entropy 0.62714 (0.62765)	Top-1 acc 62.109 (59.262)	Top-5 acc 83.203 (80.882)	lr 0.01365
Train [57][1580/3239]	Time 0.264 (0.715)	Data Time 0.001 (0.235)	Loss 2.7067 (2.6793)	Entropy 0.62731 (0.62765)	Top-1 acc 56.250 (59.266)	Top-5 acc 81.641 (80.881)	lr 0.01365
Train [57][1590/3239]	Time 0.250 (0.713)	Data Time 0.001 (0.234)	Loss 2.7164 (2.6796)	Entropy 0.62723 (0.62765)	Top-1 acc 59.375 (59.262)	Top-5 acc 79.297 (80.875)	lr 0.01365
Train [57][1600/3239]	Time 8.786 (0.717)	Data Time 8.544 (0.237)	Loss 2.8012 (2.6800)	Entropy 0.62738 (0.62765)	Top-1 acc 57.422 (59.248)	Top-5 acc 79.297 (80.869)	lr 0.01365
Train [57][1610/3239]	Time 0.234 (0.717)	Data Time 0.001 (0.238)	Loss 2.6066 (2.6800)	Entropy 0.62754 (0.62765)	Top-1 acc 61.328 (59.253)	Top-5 acc 81.250 (80.868)	lr 0.01364
Train [57][1620/3239]	Time 0.241 (0.715)	Data Time 0.001 (0.237)	Loss 2.8788 (2.6800)	Entropy 0.62787 (0.62765)	Top-1 acc 54.297 (59.253)	Top-5 acc 74.219 (80.865)	lr 0.01364
Train [57][1630/3239]	Time 0.239 (0.714)	Data Time 0.001 (0.235)	Loss 2.6501 (2.6796)	Entropy 0.62822 (0.62765)	Top-1 acc 59.766 (59.261)	Top-5 acc 81.250 (80.874)	lr 0.01364
Train [57][1640/3239]	Time 0.230 (0.722)	Data Time 0.001 (0.244)	Loss 2.5324 (2.6794)	Entropy 0.62795 (0.62765)	Top-1 acc 60.547 (59.262)	Top-5 acc 84.766 (80.879)	lr 0.01364
Train [57][1650/3239]	Time 0.232 (0.720)	Data Time 0.001 (0.242)	Loss 2.8541 (2.6796)	Entropy 0.62813 (0.62765)	Top-1 acc 52.344 (59.259)	Top-5 acc 77.734 (80.876)	lr 0.01364
Train [57][1660/3239]	Time 0.240 (0.718)	Data Time 0.001 (0.241)	Loss 2.7622 (2.6799)	Entropy 0.62814 (0.62766)	Top-1 acc 55.078 (59.252)	Top-5 acc 78.516 (80.872)	lr 0.01364
Train [57][1670/3239]	Time 7.191 (0.726)	Data Time 6.930 (0.249)	Loss 2.6479 (2.6796)	Entropy 0.62848 (0.62766)	Top-1 acc 58.984 (59.252)	Top-5 acc 83.594 (80.879)	lr 0.01364
Train [57][1680/3239]	Time 0.235 (0.724)	Data Time 0.001 (0.248)	Loss 2.4448 (2.6794)	Entropy 0.62869 (0.62766)	Top-1 acc 66.016 (59.254)	Top-5 acc 86.328 (80.885)	lr 0.01364
Train [57][1690/3239]	Time 0.237 (0.723)	Data Time 0.001 (0.246)	Loss 2.5133 (2.6793)	Entropy 0.62865 (0.62767)	Top-1 acc 63.672 (59.258)	Top-5 acc 83.594 (80.889)	lr 0.01364
Train [57][1700/3239]	Time 0.333 (0.725)	Data Time 0.001 (0.249)	Loss 2.6960 (2.6794)	Entropy 0.62865 (0.62768)	Top-1 acc 57.031 (59.252)	Top-5 acc 84.375 (80.893)	lr 0.01364
Train [57][1710/3239]	Time 0.246 (0.729)	Data Time 0.001 (0.253)	Loss 2.6996 (2.6794)	Entropy 0.62870 (0.62768)	Top-1 acc 59.766 (59.252)	Top-5 acc 80.469 (80.894)	lr 0.01363
Train [57][1720/3239]	Time 0.281 (0.727)	Data Time 0.001 (0.252)	Loss 2.8982 (2.6799)	Entropy 0.62833 (0.62769)	Top-1 acc 54.688 (59.239)	Top-5 acc 76.172 (80.887)	lr 0.01363
Train [57][1730/3239]	Time 0.231 (0.732)	Data Time 0.001 (0.257)	Loss 2.6651 (2.6797)	Entropy 0.62876 (0.62769)	Top-1 acc 63.672 (59.252)	Top-5 acc 80.078 (80.893)	lr 0.01363
Train [57][1740/3239]	Time 0.293 (0.734)	Data Time 0.001 (0.259)	Loss 2.6330 (2.6797)	Entropy 0.62878 (0.62770)	Top-1 acc 63.281 (59.260)	Top-5 acc 80.859 (80.893)	lr 0.01363
Train [57][1750/3239]	Time 0.232 (0.732)	Data Time 0.001 (0.258)	Loss 2.6975 (2.6799)	Entropy 0.62852 (0.62770)	Top-1 acc 59.375 (59.258)	Top-5 acc 82.031 (80.892)	lr 0.01363
Train [57][1760/3239]	Time 14.078 (0.738)	Data Time 13.832 (0.264)	Loss 2.7366 (2.6799)	Entropy 0.62889 (0.62771)	Top-1 acc 58.203 (59.261)	Top-5 acc 78.516 (80.890)	lr 0.01363
Train [57][1770/3239]	Time 0.315 (0.740)	Data Time 0.001 (0.266)	Loss 2.6191 (2.6801)	Entropy 0.62923 (0.62772)	Top-1 acc 62.891 (59.258)	Top-5 acc 80.078 (80.882)	lr 0.01363
Train [57][1780/3239]	Time 0.223 (0.738)	Data Time 0.001 (0.265)	Loss 2.7939 (2.6802)	Entropy 0.62923 (0.62772)	Top-1 acc 55.078 (59.255)	Top-5 acc 78.125 (80.874)	lr 0.01363
Train [57][1790/3239]	Time 0.234 (0.736)	Data Time 0.001 (0.263)	Loss 2.6627 (2.6802)	Entropy 0.62941 (0.62773)	Top-1 acc 57.812 (59.249)	Top-5 acc 82.031 (80.875)	lr 0.01363
Train [57][1800/3239]	Time 0.231 (0.746)	Data Time 0.001 (0.273)	Loss 2.6553 (2.6807)	Entropy 0.62908 (0.62774)	Top-1 acc 58.594 (59.238)	Top-5 acc 80.469 (80.862)	lr 0.01363
Train [57][1810/3239]	Time 0.247 (0.744)	Data Time 0.001 (0.272)	Loss 2.6722 (2.6810)	Entropy 0.62906 (0.62775)	Top-1 acc 58.984 (59.231)	Top-5 acc 80.469 (80.855)	lr 0.01362
Train [57][1820/3239]	Time 0.229 (0.742)	Data Time 0.001 (0.270)	Loss 2.8758 (2.6816)	Entropy 0.62899 (0.62776)	Top-1 acc 55.859 (59.218)	Top-5 acc 73.828 (80.842)	lr 0.01362
Train [57][1830/3239]	Time 4.057 (0.750)	Data Time 3.812 (0.278)	Loss 2.7031 (2.6817)	Entropy 0.62922 (0.62776)	Top-1 acc 55.469 (59.216)	Top-5 acc 82.031 (80.841)	lr 0.01362
Train [57][1840/3239]	Time 0.232 (0.748)	Data Time 0.001 (0.276)	Loss 2.7391 (2.6818)	Entropy 0.62918 (0.62777)	Top-1 acc 56.641 (59.218)	Top-5 acc 80.078 (80.840)	lr 0.01362
Train [57][1850/3239]	Time 0.246 (0.746)	Data Time 0.001 (0.275)	Loss 2.6629 (2.6822)	Entropy 0.62898 (0.62778)	Top-1 acc 61.719 (59.206)	Top-5 acc 78.516 (80.831)	lr 0.01362
Train [57][1860/3239]	Time 0.374 (0.754)	Data Time 0.001 (0.283)	Loss 2.6883 (2.6822)	Entropy 0.62892 (0.62778)	Top-1 acc 59.766 (59.208)	Top-5 acc 79.297 (80.834)	lr 0.01362
Train [57][1870/3239]	Time 0.239 (0.754)	Data Time 0.001 (0.283)	Loss 2.7134 (2.6822)	Entropy 0.62886 (0.62779)	Top-1 acc 56.641 (59.208)	Top-5 acc 82.031 (80.834)	lr 0.01362
Train [57][1880/3239]	Time 0.237 (0.752)	Data Time 0.001 (0.282)	Loss 2.5508 (2.6818)	Entropy 0.62878 (0.62780)	Top-1 acc 63.281 (59.212)	Top-5 acc 85.938 (80.843)	lr 0.01362
Train [57][1890/3239]	Time 0.235 (0.759)	Data Time 0.001 (0.289)	Loss 2.6821 (2.6818)	Entropy 0.62866 (0.62780)	Top-1 acc 58.984 (59.223)	Top-5 acc 79.297 (80.845)	lr 0.01362
Train [57][1900/3239]	Time 0.235 (0.761)	Data Time 0.001 (0.291)	Loss 2.6638 (2.6816)	Entropy 0.62891 (0.62781)	Top-1 acc 62.109 (59.226)	Top-5 acc 80.469 (80.848)	lr 0.01362
Train [57][1910/3239]	Time 0.267 (0.759)	Data Time 0.001 (0.289)	Loss 2.5717 (2.6816)	Entropy 0.62902 (0.62781)	Top-1 acc 61.328 (59.229)	Top-5 acc 83.984 (80.846)	lr 0.01361
Train [57][1920/3239]	Time 13.183 (0.764)	Data Time 12.942 (0.294)	Loss 2.6846 (2.6818)	Entropy 0.62903 (0.62782)	Top-1 acc 58.203 (59.227)	Top-5 acc 84.375 (80.847)	lr 0.01361
Train [57][1930/3239]	Time 0.431 (0.785)	Data Time 0.006 (0.299)	Loss 2.6781 (2.6818)	Entropy 0.62918 (0.62783)	Top-1 acc 59.766 (59.227)	Top-5 acc 80.469 (80.846)	lr 0.01361
Train [57][1940/3239]	Time 0.242 (0.784)	Data Time 0.002 (0.298)	Loss 2.7763 (2.6819)	Entropy 0.62902 (0.62783)	Top-1 acc 55.078 (59.227)	Top-5 acc 80.078 (80.840)	lr 0.01361
Train [57][1950/3239]	Time 0.253 (0.782)	Data Time 0.001 (0.296)	Loss 2.7345 (2.6817)	Entropy 0.62898 (0.62784)	Top-1 acc 57.031 (59.231)	Top-5 acc 77.734 (80.843)	lr 0.01361
Train [57][1960/3239]	Time 0.237 (0.780)	Data Time 0.001 (0.295)	Loss 2.9308 (2.6821)	Entropy 0.62934 (0.62784)	Top-1 acc 55.859 (59.226)	Top-5 acc 76.562 (80.833)	lr 0.01361
Train [57][1970/3239]	Time 0.235 (0.778)	Data Time 0.001 (0.293)	Loss 2.6623 (2.6825)	Entropy 0.62939 (0.62785)	Top-1 acc 59.766 (59.212)	Top-5 acc 80.859 (80.824)	lr 0.01361
Train [57][1980/3239]	Time 0.241 (0.776)	Data Time 0.001 (0.292)	Loss 2.6504 (2.6825)	Entropy 0.62909 (0.62786)	Top-1 acc 61.719 (59.210)	Top-5 acc 80.859 (80.823)	lr 0.01361
Train [57][1990/3239]	Time 4.035 (0.776)	Data Time 3.772 (0.292)	Loss 2.5747 (2.6822)	Entropy 0.62896 (0.62787)	Top-1 acc 61.328 (59.218)	Top-5 acc 84.766 (80.829)	lr 0.01361
Train [57][2000/3239]	Time 0.243 (0.779)	Data Time 0.001 (0.295)	Loss 2.7812 (2.6824)	Entropy 0.62890 (0.62787)	Top-1 acc 56.250 (59.216)	Top-5 acc 81.250 (80.829)	lr 0.01361
Train [57][2010/3239]	Time 0.270 (0.778)	Data Time 0.001 (0.294)	Loss 2.6139 (2.6824)	Entropy 0.62898 (0.62788)	Top-1 acc 62.891 (59.222)	Top-5 acc 82.812 (80.836)	lr 0.01360
Train [57][2020/3239]	Time 0.342 (0.778)	Data Time 0.001 (0.294)	Loss 2.7667 (2.6824)	Entropy 0.62868 (0.62788)	Top-1 acc 54.688 (59.221)	Top-5 acc 80.469 (80.835)	lr 0.01360
Train [57][2030/3239]	Time 0.267 (0.783)	Data Time 0.001 (0.300)	Loss 2.7747 (2.6826)	Entropy 0.62862 (0.62788)	Top-1 acc 54.688 (59.208)	Top-5 acc 76.562 (80.826)	lr 0.01360
Train [57][2040/3239]	Time 0.262 (0.785)	Data Time 0.001 (0.302)	Loss 2.5689 (2.6827)	Entropy 0.62892 (0.62789)	Top-1 acc 62.500 (59.206)	Top-5 acc 81.641 (80.823)	lr 0.01360
Train [57][2050/3239]	Time 0.241 (0.785)	Data Time 0.001 (0.302)	Loss 2.7120 (2.6827)	Entropy 0.62892 (0.62789)	Top-1 acc 54.297 (59.204)	Top-5 acc 81.250 (80.820)	lr 0.01360
Train [57][2060/3239]	Time 0.254 (0.790)	Data Time 0.001 (0.307)	Loss 2.7492 (2.6828)	Entropy 0.62897 (0.62790)	Top-1 acc 58.984 (59.210)	Top-5 acc 78.906 (80.815)	lr 0.01360
Train [57][2070/3239]	Time 0.240 (0.792)	Data Time 0.001 (0.309)	Loss 2.4635 (2.6829)	Entropy 0.62936 (0.62790)	Top-1 acc 64.844 (59.209)	Top-5 acc 83.594 (80.808)	lr 0.01360
Train [57][2080/3239]	Time 3.530 (0.792)	Data Time 3.277 (0.310)	Loss 2.6688 (2.6828)	Entropy 0.62937 (0.62791)	Top-1 acc 58.203 (59.212)	Top-5 acc 82.031 (80.808)	lr 0.01360
Train [57][2090/3239]	Time 7.172 (0.798)	Data Time 6.778 (0.316)	Loss 2.8182 (2.6830)	Entropy 0.62938 (0.62792)	Top-1 acc 55.859 (59.207)	Top-5 acc 81.250 (80.805)	lr 0.01360
Train [57][2100/3239]	Time 2.239 (0.800)	Data Time 1.988 (0.318)	Loss 2.8270 (2.6832)	Entropy 0.62904 (0.62792)	Top-1 acc 53.906 (59.197)	Top-5 acc 78.906 (80.802)	lr 0.01360
Train [57][2110/3239]	Time 0.249 (0.799)	Data Time 0.001 (0.318)	Loss 2.8488 (2.6832)	Entropy 0.62917 (0.62793)	Top-1 acc 55.469 (59.193)	Top-5 acc 80.078 (80.804)	lr 0.01359
Train [57][2120/3239]	Time 0.259 (0.804)	Data Time 0.001 (0.323)	Loss 2.6880 (2.6834)	Entropy 0.62938 (0.62794)	Top-1 acc 59.375 (59.187)	Top-5 acc 80.469 (80.798)	lr 0.01359
Train [57][2130/3239]	Time 0.292 (0.807)	Data Time 0.002 (0.326)	Loss 2.6753 (2.6831)	Entropy 0.62942 (0.62794)	Top-1 acc 60.156 (59.196)	Top-5 acc 79.688 (80.801)	lr 0.01359
Train [57][2140/3239]	Time 0.244 (0.806)	Data Time 0.001 (0.325)	Loss 2.5637 (2.6830)	Entropy 0.62910 (0.62795)	Top-1 acc 62.109 (59.199)	Top-5 acc 81.641 (80.803)	lr 0.01359
Train [57][2150/3239]	Time 11.919 (0.811)	Data Time 11.647 (0.330)	Loss 2.4493 (2.6831)	Entropy 0.62892 (0.62795)	Top-1 acc 67.188 (59.201)	Top-5 acc 85.547 (80.802)	lr 0.01359
Train [57][2160/3239]	Time 0.241 (0.815)	Data Time 0.001 (0.335)	Loss 2.7885 (2.6834)	Entropy 0.62894 (0.62796)	Top-1 acc 58.203 (59.198)	Top-5 acc 76.953 (80.791)	lr 0.01359
Train [57][2170/3239]	Time 0.256 (0.814)	Data Time 0.001 (0.334)	Loss 2.6022 (2.6831)	Entropy 0.62911 (0.62796)	Top-1 acc 65.625 (59.211)	Top-5 acc 83.203 (80.796)	lr 0.01359
Train [57][2180/3239]	Time 0.438 (0.813)	Data Time 0.001 (0.333)	Loss 2.6676 (2.6831)	Entropy 0.62923 (0.62797)	Top-1 acc 59.375 (59.214)	Top-5 acc 83.203 (80.798)	lr 0.01359
Train [57][2190/3239]	Time 0.238 (0.820)	Data Time 0.001 (0.340)	Loss 2.6888 (2.6831)	Entropy 0.62944 (0.62798)	Top-1 acc 61.328 (59.212)	Top-5 acc 80.859 (80.796)	lr 0.01359
Train [57][2200/3239]	Time 0.242 (0.820)	Data Time 0.001 (0.341)	Loss 2.6157 (2.6831)	Entropy 0.62921 (0.62798)	Top-1 acc 60.156 (59.211)	Top-5 acc 81.641 (80.794)	lr 0.01359
Train [57][2210/3239]	Time 0.231 (0.821)	Data Time 0.001 (0.342)	Loss 2.8753 (2.6832)	Entropy 0.62855 (0.62799)	Top-1 acc 55.469 (59.209)	Top-5 acc 76.562 (80.793)	lr 0.01358
Train [57][2220/3239]	Time 0.236 (0.827)	Data Time 0.001 (0.348)	Loss 2.8207 (2.6834)	Entropy 0.62873 (0.62799)	Top-1 acc 53.516 (59.205)	Top-5 acc 80.469 (80.789)	lr 0.01358
Train [57][2230/3239]	Time 0.227 (0.829)	Data Time 0.001 (0.350)	Loss 2.9510 (2.6835)	Entropy 0.62831 (0.62799)	Top-1 acc 56.250 (59.202)	Top-5 acc 77.344 (80.791)	lr 0.01358
Train [57][2240/3239]	Time 0.233 (0.829)	Data Time 0.001 (0.350)	Loss 2.6619 (2.6835)	Entropy 0.62835 (0.62799)	Top-1 acc 61.719 (59.202)	Top-5 acc 81.250 (80.790)	lr 0.01358
Train [57][2250/3239]	Time 7.820 (0.835)	Data Time 7.455 (0.357)	Loss 2.7148 (2.6837)	Entropy 0.62855 (0.62800)	Top-1 acc 57.812 (59.200)	Top-5 acc 80.078 (80.788)	lr 0.01358
Train [57][2260/3239]	Time 0.227 (0.837)	Data Time 0.001 (0.360)	Loss 2.6398 (2.6836)	Entropy 0.62851 (0.62800)	Top-1 acc 57.812 (59.199)	Top-5 acc 82.812 (80.791)	lr 0.01358
Train [57][2270/3239]	Time 0.233 (0.838)	Data Time 0.001 (0.360)	Loss 2.5522 (2.6836)	Entropy 0.62871 (0.62800)	Top-1 acc 65.234 (59.201)	Top-5 acc 82.812 (80.792)	lr 0.01358
Train [57][2280/3239]	Time 0.241 (0.840)	Data Time 0.001 (0.363)	Loss 2.7134 (2.6837)	Entropy 0.62869 (0.62800)	Top-1 acc 59.375 (59.200)	Top-5 acc 77.734 (80.790)	lr 0.01358
Train [57][2290/3239]	Time 0.229 (0.846)	Data Time 0.001 (0.369)	Loss 2.8971 (2.6838)	Entropy 0.62863 (0.62801)	Top-1 acc 52.344 (59.203)	Top-5 acc 76.953 (80.792)	lr 0.01358
Train [57][2300/3239]	Time 0.234 (0.847)	Data Time 0.001 (0.370)	Loss 2.8100 (2.6838)	Entropy 0.62892 (0.62801)	Top-1 acc 57.031 (59.203)	Top-5 acc 80.078 (80.795)	lr 0.01358
Train [57][2310/3239]	Time 7.543 (0.848)	Data Time 7.284 (0.371)	Loss 2.7437 (2.6837)	Entropy 0.62922 (0.62801)	Top-1 acc 58.594 (59.201)	Top-5 acc 78.516 (80.791)	lr 0.01357
Train [57][2320/3239]	Time 0.238 (0.854)	Data Time 0.001 (0.377)	Loss 2.6903 (2.6838)	Entropy 0.62898 (0.62802)	Top-1 acc 60.547 (59.203)	Top-5 acc 81.250 (80.788)	lr 0.01357
Train [57][2330/3239]	Time 0.279 (0.854)	Data Time 0.001 (0.378)	Loss 2.5261 (2.6839)	Entropy 0.62892 (0.62802)	Top-1 acc 64.062 (59.199)	Top-5 acc 84.375 (80.786)	lr 0.01357
Train [57][2340/3239]	Time 0.254 (0.852)	Data Time 0.001 (0.376)	Loss 2.5893 (2.6839)	Entropy 0.62840 (0.62803)	Top-1 acc 58.984 (59.194)	Top-5 acc 81.250 (80.787)	lr 0.01357
Train [57][2350/3239]	Time 0.227 (0.856)	Data Time 0.001 (0.380)	Loss 2.7177 (2.6841)	Entropy 0.62847 (0.62803)	Top-1 acc 57.031 (59.190)	Top-5 acc 78.906 (80.784)	lr 0.01357
Train [57][2360/3239]	Time 0.248 (0.862)	Data Time 0.001 (0.387)	Loss 2.8217 (2.6839)	Entropy 0.62817 (0.62803)	Top-1 acc 53.125 (59.194)	Top-5 acc 79.688 (80.785)	lr 0.01357
Train [57][2370/3239]	Time 0.234 (0.860)	Data Time 0.001 (0.385)	Loss 2.4292 (2.6838)	Entropy 0.62841 (0.62803)	Top-1 acc 64.844 (59.197)	Top-5 acc 86.328 (80.786)	lr 0.01357
Train [57][2380/3239]	Time 0.249 (0.865)	Data Time 0.001 (0.390)	Loss 2.5695 (2.6841)	Entropy 0.62826 (0.62803)	Top-1 acc 59.375 (59.195)	Top-5 acc 83.594 (80.779)	lr 0.01357
Train [57][2390/3239]	Time 0.285 (0.872)	Data Time 0.001 (0.397)	Loss 2.7078 (2.6841)	Entropy 0.62820 (0.62803)	Top-1 acc 62.109 (59.195)	Top-5 acc 80.859 (80.783)	lr 0.01357
Train [57][2400/3239]	Time 0.247 (0.870)	Data Time 0.001 (0.395)	Loss 2.6914 (2.6840)	Entropy 0.62831 (0.62803)	Top-1 acc 63.281 (59.200)	Top-5 acc 80.469 (80.783)	lr 0.01357
Train [57][2410/3239]	Time 12.470 (0.874)	Data Time 12.116 (0.399)	Loss 2.5051 (2.6842)	Entropy 0.62814 (0.62803)	Top-1 acc 63.281 (59.194)	Top-5 acc 85.156 (80.779)	lr 0.01356
Train [57][2420/3239]	Time 0.235 (0.880)	Data Time 0.001 (0.406)	Loss 2.5643 (2.6840)	Entropy 0.62788 (0.62803)	Top-1 acc 62.500 (59.201)	Top-5 acc 82.031 (80.780)	lr 0.01356
Train [57][2430/3239]	Time 0.256 (0.878)	Data Time 0.001 (0.405)	Loss 2.8317 (2.6842)	Entropy 0.62819 (0.62803)	Top-1 acc 55.859 (59.202)	Top-5 acc 76.562 (80.774)	lr 0.01356
Train [57][2440/3239]	Time 0.247 (0.876)	Data Time 0.001 (0.403)	Loss 2.6792 (2.6841)	Entropy 0.62809 (0.62803)	Top-1 acc 61.719 (59.207)	Top-5 acc 82.812 (80.773)	lr 0.01356
Train [57][2450/3239]	Time 0.232 (0.885)	Data Time 0.001 (0.412)	Loss 2.6319 (2.6842)	Entropy 0.62821 (0.62804)	Top-1 acc 63.281 (59.213)	Top-5 acc 83.203 (80.767)	lr 0.01356
Train [57][2460/3239]	Time 0.230 (0.883)	Data Time 0.001 (0.410)	Loss 2.8186 (2.6843)	Entropy 0.62872 (0.62804)	Top-1 acc 52.734 (59.214)	Top-5 acc 78.516 (80.764)	lr 0.01356
Train [57][2470/3239]	Time 0.234 (0.881)	Data Time 0.001 (0.409)	Loss 2.7315 (2.6845)	Entropy 0.62853 (0.62804)	Top-1 acc 55.859 (59.209)	Top-5 acc 81.641 (80.764)	lr 0.01356
Train [57][2480/3239]	Time 0.329 (0.890)	Data Time 0.001 (0.418)	Loss 2.9019 (2.6845)	Entropy 0.62857 (0.62804)	Top-1 acc 52.734 (59.207)	Top-5 acc 76.562 (80.763)	lr 0.01356
Train [57][2490/3239]	Time 0.241 (0.888)	Data Time 0.001 (0.416)	Loss 2.6702 (2.6848)	Entropy 0.62877 (0.62804)	Top-1 acc 65.625 (59.200)	Top-5 acc 77.734 (80.757)	lr 0.01356
Train [57][2500/3239]	Time 0.233 (0.886)	Data Time 0.001 (0.414)	Loss 3.0141 (2.6849)	Entropy 0.62853 (0.62805)	Top-1 acc 51.953 (59.201)	Top-5 acc 75.391 (80.756)	lr 0.01356
Train [57][2510/3239]	Time 0.232 (0.889)	Data Time 0.001 (0.418)	Loss 2.6684 (2.6847)	Entropy 0.62814 (0.62805)	Top-1 acc 60.938 (59.208)	Top-5 acc 80.469 (80.758)	lr 0.01355
Train [57][2520/3239]	Time 0.253 (0.894)	Data Time 0.001 (0.422)	Loss 2.7156 (2.6846)	Entropy 0.62770 (0.62805)	Top-1 acc 60.547 (59.209)	Top-5 acc 79.297 (80.761)	lr 0.01355
Train [57][2530/3239]	Time 0.245 (0.892)	Data Time 0.001 (0.421)	Loss 2.5801 (2.6847)	Entropy 0.62787 (0.62804)	Top-1 acc 62.500 (59.208)	Top-5 acc 81.250 (80.762)	lr 0.01355
Train [57][2540/3239]	Time 11.778 (0.894)	Data Time 11.524 (0.424)	Loss 2.8261 (2.6849)	Entropy 0.62815 (0.62804)	Top-1 acc 54.688 (59.200)	Top-5 acc 79.297 (80.759)	lr 0.01355
Train [57][2550/3239]	Time 0.224 (0.898)	Data Time 0.001 (0.428)	Loss 2.6534 (2.6851)	Entropy 0.62811 (0.62804)	Top-1 acc 61.719 (59.196)	Top-5 acc 80.859 (80.759)	lr 0.01355
Train [57][2560/3239]	Time 0.243 (0.897)	Data Time 0.001 (0.426)	Loss 2.6312 (2.6849)	Entropy 0.62833 (0.62805)	Top-1 acc 60.547 (59.199)	Top-5 acc 81.641 (80.762)	lr 0.01355
Train [57][2570/3239]	Time 0.355 (0.895)	Data Time 0.001 (0.425)	Loss 2.5711 (2.6849)	Entropy 0.62842 (0.62805)	Top-1 acc 63.672 (59.198)	Top-5 acc 83.984 (80.763)	lr 0.01355
Train [57][2580/3239]	Time 0.229 (0.903)	Data Time 0.001 (0.433)	Loss 2.8040 (2.6849)	Entropy 0.62825 (0.62805)	Top-1 acc 58.984 (59.200)	Top-5 acc 78.516 (80.764)	lr 0.01355
Train [57][2590/3239]	Time 0.264 (0.915)	Data Time 0.002 (0.431)	Loss 2.8695 (2.6847)	Entropy 0.62814 (0.62805)	Top-1 acc 57.031 (59.204)	Top-5 acc 79.297 (80.767)	lr 0.01355
Train [57][2600/3239]	Time 0.246 (0.913)	Data Time 0.002 (0.430)	Loss 2.7012 (2.6847)	Entropy 0.62821 (0.62805)	Top-1 acc 57.422 (59.207)	Top-5 acc 81.250 (80.768)	lr 0.01355
Train [57][2610/3239]	Time 0.256 (0.911)	Data Time 0.002 (0.428)	Loss 2.7043 (2.6849)	Entropy 0.62843 (0.62805)	Top-1 acc 58.594 (59.199)	Top-5 acc 80.078 (80.766)	lr 0.01354
Train [57][2620/3239]	Time 0.233 (0.909)	Data Time 0.001 (0.426)	Loss 2.6848 (2.6849)	Entropy 0.62863 (0.62805)	Top-1 acc 57.031 (59.197)	Top-5 acc 82.031 (80.768)	lr 0.01354
Train [57][2630/3239]	Time 0.260 (0.907)	Data Time 0.001 (0.425)	Loss 2.6643 (2.6849)	Entropy 0.62869 (0.62805)	Top-1 acc 60.547 (59.194)	Top-5 acc 79.688 (80.771)	lr 0.01354
Train [57][2640/3239]	Time 0.265 (0.909)	Data Time 0.001 (0.427)	Loss 2.8563 (2.6849)	Entropy 0.62840 (0.62806)	Top-1 acc 57.031 (59.193)	Top-5 acc 78.125 (80.770)	lr 0.01354
Train [57][2650/3239]	Time 0.235 (0.910)	Data Time 0.001 (0.427)	Loss 2.6743 (2.6847)	Entropy 0.62844 (0.62806)	Top-1 acc 60.938 (59.198)	Top-5 acc 79.688 (80.774)	lr 0.01354
Train [57][2660/3239]	Time 0.264 (0.908)	Data Time 0.001 (0.426)	Loss 2.6687 (2.6849)	Entropy 0.62823 (0.62806)	Top-1 acc 60.938 (59.192)	Top-5 acc 80.859 (80.773)	lr 0.01354
Train [57][2670/3239]	Time 0.253 (0.912)	Data Time 0.001 (0.430)	Loss 2.6537 (2.6851)	Entropy 0.62840 (0.62806)	Top-1 acc 58.984 (59.186)	Top-5 acc 80.078 (80.766)	lr 0.01354
Train [57][2680/3239]	Time 0.246 (0.912)	Data Time 0.001 (0.430)	Loss 2.5840 (2.6850)	Entropy 0.62827 (0.62806)	Top-1 acc 59.375 (59.189)	Top-5 acc 81.641 (80.768)	lr 0.01354
Train [57][2690/3239]	Time 0.267 (0.911)	Data Time 0.001 (0.430)	Loss 2.8262 (2.6852)	Entropy 0.62828 (0.62806)	Top-1 acc 51.953 (59.180)	Top-5 acc 80.859 (80.764)	lr 0.01354
Train [57][2700/3239]	Time 16.011 (0.917)	Data Time 15.768 (0.435)	Loss 2.7382 (2.6853)	Entropy 0.62817 (0.62806)	Top-1 acc 55.469 (59.179)	Top-5 acc 78.516 (80.762)	lr 0.01354
Train [57][2710/3239]	Time 0.250 (0.915)	Data Time 0.001 (0.434)	Loss 2.6746 (2.6853)	Entropy 0.62833 (0.62806)	Top-1 acc 61.719 (59.184)	Top-5 acc 79.688 (80.761)	lr 0.01353
Train [57][2720/3239]	Time 0.234 (0.916)	Data Time 0.001 (0.435)	Loss 2.7556 (2.6852)	Entropy 0.62841 (0.62806)	Top-1 acc 56.641 (59.185)	Top-5 acc 79.297 (80.763)	lr 0.01353
Train [57][2730/3239]	Time 0.361 (0.915)	Data Time 0.001 (0.434)	Loss 2.5808 (2.6852)	Entropy 0.62865 (0.62807)	Top-1 acc 61.719 (59.184)	Top-5 acc 80.859 (80.760)	lr 0.01353
Train [57][2740/3239]	Time 0.266 (0.920)	Data Time 0.001 (0.440)	Loss 2.8799 (2.6851)	Entropy 0.62881 (0.62807)	Top-1 acc 52.734 (59.189)	Top-5 acc 79.297 (80.764)	lr 0.01353
Train [57][2750/3239]	Time 0.235 (0.920)	Data Time 0.001 (0.439)	Loss 2.6184 (2.6850)	Entropy 0.62850 (0.62807)	Top-1 acc 63.672 (59.191)	Top-5 acc 81.250 (80.768)	lr 0.01353
Train [57][2760/3239]	Time 0.252 (0.919)	Data Time 0.001 (0.439)	Loss 2.5439 (2.6849)	Entropy 0.62895 (0.62807)	Top-1 acc 63.281 (59.191)	Top-5 acc 80.859 (80.768)	lr 0.01353
Train [57][2770/3239]	Time 0.235 (0.925)	Data Time 0.001 (0.445)	Loss 2.7244 (2.6850)	Entropy 0.62897 (0.62808)	Top-1 acc 60.938 (59.192)	Top-5 acc 78.516 (80.767)	lr 0.01353
Train [57][2780/3239]	Time 0.299 (0.924)	Data Time 0.002 (0.444)	Loss 2.8147 (2.6849)	Entropy 0.62906 (0.62808)	Top-1 acc 55.469 (59.195)	Top-5 acc 78.125 (80.768)	lr 0.01353
Train [57][2790/3239]	Time 0.256 (0.923)	Data Time 0.002 (0.444)	Loss 2.7930 (2.6847)	Entropy 0.62916 (0.62808)	Top-1 acc 56.250 (59.198)	Top-5 acc 75.781 (80.770)	lr 0.01353
Train [57][2800/3239]	Time 0.325 (0.929)	Data Time 0.001 (0.450)	Loss 2.6127 (2.6847)	Entropy 0.62918 (0.62809)	Top-1 acc 62.500 (59.196)	Top-5 acc 83.203 (80.774)	lr 0.01353
Train [57][2810/3239]	Time 0.229 (0.928)	Data Time 0.001 (0.449)	Loss 2.7622 (2.6848)	Entropy 0.62899 (0.62809)	Top-1 acc 55.469 (59.198)	Top-5 acc 81.641 (80.773)	lr 0.01352
Train [57][2820/3239]	Time 0.238 (0.928)	Data Time 0.001 (0.448)	Loss 2.7589 (2.6849)	Entropy 0.62911 (0.62809)	Top-1 acc 57.031 (59.196)	Top-5 acc 78.125 (80.770)	lr 0.01352
Train [57][2830/3239]	Time 0.232 (0.935)	Data Time 0.001 (0.456)	Loss 2.7213 (2.6849)	Entropy 0.62911 (0.62810)	Top-1 acc 56.250 (59.196)	Top-5 acc 78.906 (80.770)	lr 0.01352
Train [57][2840/3239]	Time 0.235 (0.933)	Data Time 0.001 (0.454)	Loss 2.6162 (2.6849)	Entropy 0.62879 (0.62810)	Top-1 acc 61.328 (59.197)	Top-5 acc 80.469 (80.770)	lr 0.01352
Train [57][2850/3239]	Time 0.232 (0.932)	Data Time 0.001 (0.453)	Loss 2.6257 (2.6849)	Entropy 0.62861 (0.62810)	Top-1 acc 57.422 (59.196)	Top-5 acc 84.766 (80.769)	lr 0.01352
Train [57][2860/3239]	Time 24.401 (0.939)	Data Time 24.144 (0.461)	Loss 2.4947 (2.6846)	Entropy 0.62878 (0.62810)	Top-1 acc 64.453 (59.203)	Top-5 acc 84.375 (80.775)	lr 0.01352
Train [57][2870/3239]	Time 0.268 (0.938)	Data Time 0.001 (0.459)	Loss 2.6904 (2.6845)	Entropy 0.62867 (0.62811)	Top-1 acc 61.328 (59.207)	Top-5 acc 80.078 (80.777)	lr 0.01352
Train [57][2880/3239]	Time 0.236 (0.936)	Data Time 0.001 (0.458)	Loss 2.6244 (2.6845)	Entropy 0.62868 (0.62811)	Top-1 acc 60.938 (59.205)	Top-5 acc 81.641 (80.777)	lr 0.01352
Train [57][2890/3239]	Time 0.362 (0.935)	Data Time 0.001 (0.457)	Loss 2.5655 (2.6843)	Entropy 0.62886 (0.62811)	Top-1 acc 63.672 (59.208)	Top-5 acc 84.766 (80.782)	lr 0.01352
Train [57][2900/3239]	Time 0.255 (0.943)	Data Time 0.001 (0.465)	Loss 2.5626 (2.6843)	Entropy 0.62904 (0.62811)	Top-1 acc 63.672 (59.207)	Top-5 acc 82.812 (80.781)	lr 0.01351
Train [57][2910/3239]	Time 0.255 (0.941)	Data Time 0.001 (0.463)	Loss 2.6633 (2.6843)	Entropy 0.62930 (0.62812)	Top-1 acc 61.719 (59.205)	Top-5 acc 80.859 (80.778)	lr 0.01351
Train [57][2920/3239]	Time 0.229 (0.939)	Data Time 0.001 (0.462)	Loss 2.5777 (2.6843)	Entropy 0.62944 (0.62812)	Top-1 acc 64.453 (59.208)	Top-5 acc 82.031 (80.781)	lr 0.01351
Train [57][2930/3239]	Time 0.233 (0.946)	Data Time 0.001 (0.469)	Loss 2.6178 (2.6843)	Entropy 0.62943 (0.62812)	Top-1 acc 61.328 (59.208)	Top-5 acc 79.297 (80.778)	lr 0.01351
Train [57][2940/3239]	Time 0.247 (0.944)	Data Time 0.001 (0.467)	Loss 2.7133 (2.6844)	Entropy 0.62938 (0.62813)	Top-1 acc 63.281 (59.210)	Top-5 acc 81.250 (80.778)	lr 0.01351
Train [57][2950/3239]	Time 0.237 (0.943)	Data Time 0.001 (0.466)	Loss 2.9108 (2.6845)	Entropy 0.62880 (0.62813)	Top-1 acc 55.078 (59.204)	Top-5 acc 77.734 (80.775)	lr 0.01351
Train [57][2960/3239]	Time 0.322 (0.951)	Data Time 0.001 (0.474)	Loss 2.4902 (2.6843)	Entropy 0.62860 (0.62813)	Top-1 acc 59.375 (59.205)	Top-5 acc 82.812 (80.780)	lr 0.01351
Train [57][2970/3239]	Time 0.231 (0.949)	Data Time 0.001 (0.472)	Loss 2.6760 (2.6846)	Entropy 0.62861 (0.62814)	Top-1 acc 59.766 (59.194)	Top-5 acc 82.031 (80.774)	lr 0.01351
Train [57][2980/3239]	Time 0.234 (0.948)	Data Time 0.001 (0.471)	Loss 2.5634 (2.6845)	Entropy 0.62855 (0.62814)	Top-1 acc 62.109 (59.198)	Top-5 acc 82.812 (80.777)	lr 0.01351
Train [57][2990/3239]	Time 0.238 (0.955)	Data Time 0.001 (0.478)	Loss 2.6418 (2.6846)	Entropy 0.62893 (0.62814)	Top-1 acc 62.109 (59.194)	Top-5 acc 81.250 (80.775)	lr 0.01351
Train [57][3000/3239]	Time 0.233 (0.953)	Data Time 0.001 (0.477)	Loss 2.7031 (2.6846)	Entropy 0.62892 (0.62814)	Top-1 acc 59.766 (59.197)	Top-5 acc 81.641 (80.776)	lr 0.01350
Train [57][3010/3239]	Time 0.232 (0.953)	Data Time 0.001 (0.477)	Loss 2.8669 (2.6845)	Entropy 0.62901 (0.62815)	Top-1 acc 54.688 (59.196)	Top-5 acc 75.391 (80.778)	lr 0.01350
Train [57][3020/3239]	Time 23.837 (0.959)	Data Time 23.590 (0.483)	Loss 2.7733 (2.6848)	Entropy 0.62932 (0.62815)	Top-1 acc 55.078 (59.186)	Top-5 acc 77.734 (80.771)	lr 0.01350
Train [57][3030/3239]	Time 0.252 (0.957)	Data Time 0.001 (0.482)	Loss 2.5654 (2.6847)	Entropy 0.62944 (0.62815)	Top-1 acc 58.203 (59.189)	Top-5 acc 83.594 (80.774)	lr 0.01350
Train [57][3040/3239]	Time 0.240 (0.955)	Data Time 0.001 (0.480)	Loss 2.6098 (2.6848)	Entropy 0.62920 (0.62816)	Top-1 acc 59.375 (59.187)	Top-5 acc 81.641 (80.774)	lr 0.01350
Train [57][3050/3239]	Time 0.286 (0.955)	Data Time 0.001 (0.480)	Loss 2.7746 (2.6849)	Entropy 0.62923 (0.62816)	Top-1 acc 56.250 (59.182)	Top-5 acc 77.734 (80.770)	lr 0.01350
Train [57][3060/3239]	Time 0.229 (0.962)	Data Time 0.002 (0.487)	Loss 2.6717 (2.6849)	Entropy 0.62914 (0.62816)	Top-1 acc 53.516 (59.182)	Top-5 acc 83.984 (80.771)	lr 0.01350
Train [57][3070/3239]	Time 0.256 (0.960)	Data Time 0.001 (0.485)	Loss 2.6441 (2.6848)	Entropy 0.62913 (0.62817)	Top-1 acc 61.328 (59.185)	Top-5 acc 80.469 (80.771)	lr 0.01350
Train [57][3080/3239]	Time 0.245 (0.959)	Data Time 0.001 (0.485)	Loss 2.8119 (2.6849)	Entropy 0.62919 (0.62817)	Top-1 acc 54.688 (59.182)	Top-5 acc 80.078 (80.770)	lr 0.01350
Train [57][3090/3239]	Time 0.234 (0.966)	Data Time 0.001 (0.492)	Loss 2.6812 (2.6848)	Entropy 0.62897 (0.62817)	Top-1 acc 58.984 (59.180)	Top-5 acc 82.031 (80.773)	lr 0.01350
Train [57][3100/3239]	Time 0.238 (0.964)	Data Time 0.001 (0.490)	Loss 2.7610 (2.6849)	Entropy 0.62908 (0.62818)	Top-1 acc 59.375 (59.178)	Top-5 acc 78.125 (80.770)	lr 0.01349
Train [57][3110/3239]	Time 0.240 (0.964)	Data Time 0.001 (0.490)	Loss 2.8059 (2.6848)	Entropy 0.62872 (0.62818)	Top-1 acc 55.078 (59.181)	Top-5 acc 78.125 (80.774)	lr 0.01349
Train [57][3120/3239]	Time 0.344 (0.970)	Data Time 0.002 (0.497)	Loss 2.6818 (2.6849)	Entropy 0.62860 (0.62818)	Top-1 acc 57.031 (59.175)	Top-5 acc 80.078 (80.771)	lr 0.01349
Train [57][3130/3239]	Time 0.232 (0.969)	Data Time 0.001 (0.495)	Loss 2.6163 (2.6849)	Entropy 0.62834 (0.62818)	Top-1 acc 62.891 (59.176)	Top-5 acc 82.812 (80.771)	lr 0.01349
Train [57][3140/3239]	Time 1.660 (0.968)	Data Time 1.408 (0.495)	Loss 2.7171 (2.6850)	Entropy 0.62846 (0.62818)	Top-1 acc 55.078 (59.172)	Top-5 acc 81.641 (80.771)	lr 0.01349
Train [57][3150/3239]	Time 0.235 (0.976)	Data Time 0.001 (0.503)	Loss 2.6696 (2.6851)	Entropy 0.62821 (0.62818)	Top-1 acc 55.078 (59.169)	Top-5 acc 80.469 (80.765)	lr 0.01349
Train [57][3160/3239]	Time 0.231 (0.974)	Data Time 0.001 (0.501)	Loss 2.5029 (2.6851)	Entropy 0.62833 (0.62818)	Top-1 acc 63.672 (59.171)	Top-5 acc 84.375 (80.768)	lr 0.01349
Train [57][3170/3239]	Time 0.228 (0.972)	Data Time 0.001 (0.499)	Loss 2.6743 (2.6851)	Entropy 0.62842 (0.62818)	Top-1 acc 60.156 (59.166)	Top-5 acc 80.859 (80.766)	lr 0.01349
Train [57][3180/3239]	Time 27.015 (0.980)	Data Time 26.763 (0.508)	Loss 2.7218 (2.6853)	Entropy 0.62838 (0.62818)	Top-1 acc 57.031 (59.157)	Top-5 acc 79.688 (80.761)	lr 0.01349
Train [57][3190/3239]	Time 0.343 (0.978)	Data Time 0.000 (0.506)	Loss 2.8036 (2.6853)	Entropy 0.62832 (0.62818)	Top-1 acc 54.688 (59.156)	Top-5 acc 81.250 (80.757)	lr 0.01349
Train [57][3200/3239]	Time 0.242 (0.977)	Data Time 0.000 (0.504)	Loss 2.4858 (2.6852)	Entropy 0.62822 (0.62818)	Top-1 acc 60.156 (59.159)	Top-5 acc 82.812 (80.757)	lr 0.01348
Train [57][3210/3239]	Time 0.233 (0.975)	Data Time 0.000 (0.503)	Loss 2.7668 (2.6850)	Entropy 0.62808 (0.62818)	Top-1 acc 60.938 (59.161)	Top-5 acc 77.344 (80.761)	lr 0.01348
Train [57][3220/3239]	Time 0.234 (0.981)	Data Time 0.000 (0.509)	Loss 2.7107 (2.6850)	Entropy 0.62784 (0.62818)	Top-1 acc 57.422 (59.162)	Top-5 acc 78.906 (80.757)	lr 0.01348
Train [57][3230/3239]	Time 0.240 (0.979)	Data Time 0.000 (0.508)	Loss 2.5960 (2.6850)	Entropy 0.62790 (0.62818)	Top-1 acc 63.281 (59.167)	Top-5 acc 83.984 (80.757)	lr 0.01348
Train [57][3239/3239]	Time 33.891 (0.988)	Data Time 0.000 (0.506)	Loss 2.6936 (2.6852)	Entropy 0.62807 (0.62818)	Top-1 acc 60.494 (59.164)	Top-5 acc 81.481 (80.752)	lr 0.01348
==========Valid [57/120]	loss 1.429	top-1 acc 66.988 (66.988)	top-5 acc 86.976	Train top-1 59.164	top-5 80.752	Entropy 0.62807	Latency-None: 0.000ms	Flops: 538.40M
Train [58][0/3239]	Time 48.394 (48.394)	Data Time 46.031 (46.031)	Loss 2.4633 (2.4633)	Entropy 0.62833 (0.62833)	Top-1 acc 64.453 (64.453)	Top-5 acc 86.719 (86.719)	lr 0.01348
Train [58][10/3239]	Time 0.306 (4.852)	Data Time 0.002 (4.187)	Loss 2.6264 (2.6499)	Entropy 0.62830 (0.62835)	Top-1 acc 60.938 (60.547)	Top-5 acc 82.422 (81.143)	lr 0.01348
Train [58][20/3239]	Time 0.366 (2.760)	Data Time 0.001 (2.194)	Loss 2.8475 (2.6739)	Entropy 0.62853 (0.62839)	Top-1 acc 54.688 (59.542)	Top-5 acc 76.562 (80.915)	lr 0.01348
Train [58][30/3239]	Time 0.241 (2.019)	Data Time 0.002 (1.487)	Loss 2.8536 (2.6837)	Entropy 0.62851 (0.62845)	Top-1 acc 55.078 (59.211)	Top-5 acc 79.688 (80.985)	lr 0.01348
Train [58][40/3239]	Time 0.248 (1.683)	Data Time 0.001 (1.171)	Loss 2.8174 (2.6790)	Entropy 0.62874 (0.62848)	Top-1 acc 53.125 (59.318)	Top-5 acc 80.078 (81.012)	lr 0.01348
Train [58][50/3239]	Time 0.252 (1.441)	Data Time 0.001 (0.942)	Loss 2.6041 (2.6758)	Entropy 0.62886 (0.62853)	Top-1 acc 59.766 (59.283)	Top-5 acc 82.031 (81.059)	lr 0.01348
Train [58][60/3239]	Time 0.259 (1.281)	Data Time 0.001 (0.788)	Loss 2.6362 (2.6805)	Entropy 0.62856 (0.62859)	Top-1 acc 58.594 (59.426)	Top-5 acc 79.688 (80.821)	lr 0.01347
Train [58][70/3239]	Time 0.240 (1.212)	Data Time 0.002 (0.722)	Loss 2.6545 (2.6818)	Entropy 0.62872 (0.62859)	Top-1 acc 62.109 (59.425)	Top-5 acc 81.250 (80.804)	lr 0.01347
Train [58][80/3239]	Time 0.248 (1.115)	Data Time 0.001 (0.633)	Loss 2.8067 (2.6811)	Entropy 0.62860 (0.62861)	Top-1 acc 57.031 (59.341)	Top-5 acc 77.344 (80.782)	lr 0.01347
Train [58][90/3239]	Time 0.240 (1.042)	Data Time 0.001 (0.564)	Loss 2.4106 (2.6766)	Entropy 0.62894 (0.62863)	Top-1 acc 64.453 (59.474)	Top-5 acc 85.156 (80.851)	lr 0.01347
Train [58][100/3239]	Time 0.250 (1.004)	Data Time 0.001 (0.529)	Loss 2.6669 (2.6805)	Entropy 0.62924 (0.62867)	Top-1 acc 57.812 (59.394)	Top-5 acc 83.984 (80.763)	lr 0.01347
Train [58][110/3239]	Time 0.363 (0.954)	Data Time 0.001 (0.481)	Loss 2.7493 (2.6865)	Entropy 0.62912 (0.62871)	Top-1 acc 60.156 (59.266)	Top-5 acc 83.203 (80.659)	lr 0.01347
Train [58][120/3239]	Time 0.238 (0.911)	Data Time 0.001 (0.442)	Loss 2.6037 (2.6836)	Entropy 0.62912 (0.62875)	Top-1 acc 59.766 (59.307)	Top-5 acc 82.031 (80.717)	lr 0.01347
Train [58][130/3239]	Time 0.243 (0.895)	Data Time 0.001 (0.427)	Loss 2.6705 (2.6804)	Entropy 0.62934 (0.62878)	Top-1 acc 60.938 (59.396)	Top-5 acc 82.812 (80.749)	lr 0.01347
Train [58][140/3239]	Time 0.262 (0.876)	Data Time 0.001 (0.406)	Loss 2.5980 (2.6812)	Entropy 0.62929 (0.62882)	Top-1 acc 62.891 (59.350)	Top-5 acc 82.031 (80.793)	lr 0.01347
Train [58][150/3239]	Time 0.324 (0.848)	Data Time 0.002 (0.379)	Loss 2.6599 (2.6815)	Entropy 0.62900 (0.62884)	Top-1 acc 58.984 (59.287)	Top-5 acc 80.859 (80.769)	lr 0.01347
Train [58][160/3239]	Time 0.689 (0.826)	Data Time 0.376 (0.358)	Loss 2.5614 (2.6867)	Entropy 0.62944 (0.62886)	Top-1 acc 60.938 (59.154)	Top-5 acc 82.812 (80.656)	lr 0.01346
Train [58][170/3239]	Time 0.893 (0.820)	Data Time 0.654 (0.355)	Loss 2.6993 (2.6847)	Entropy 0.62919 (0.62889)	Top-1 acc 56.250 (59.153)	Top-5 acc 80.078 (80.695)	lr 0.01346
Train [58][180/3239]	Time 0.335 (0.800)	Data Time 0.001 (0.335)	Loss 2.5157 (2.6810)	Entropy 0.62951 (0.62891)	Top-1 acc 62.500 (59.278)	Top-5 acc 86.719 (80.769)	lr 0.01346
Train [58][190/3239]	Time 0.254 (0.782)	Data Time 0.001 (0.318)	Loss 2.6472 (2.6778)	Entropy 0.62958 (0.62894)	Top-1 acc 60.938 (59.357)	Top-5 acc 80.078 (80.814)	lr 0.01346
Train [58][200/3239]	Time 0.265 (0.775)	Data Time 0.002 (0.312)	Loss 2.6359 (2.6766)	Entropy 0.62949 (0.62898)	Top-1 acc 57.031 (59.412)	Top-5 acc 82.812 (80.867)	lr 0.01346
Train [58][210/3239]	Time 0.274 (0.760)	Data Time 0.001 (0.297)	Loss 2.6455 (2.6768)	Entropy 0.62946 (0.62900)	Top-1 acc 60.156 (59.453)	Top-5 acc 80.078 (80.870)	lr 0.01346
Train [58][220/3239]	Time 0.234 (0.745)	Data Time 0.001 (0.284)	Loss 2.6738 (2.6774)	Entropy 0.62969 (0.62902)	Top-1 acc 58.594 (59.433)	Top-5 acc 80.078 (80.888)	lr 0.01346
Train [58][230/3239]	Time 0.240 (0.745)	Data Time 0.001 (0.284)	Loss 2.5770 (2.6765)	Entropy 0.62940 (0.62905)	Top-1 acc 60.938 (59.441)	Top-5 acc 82.031 (80.871)	lr 0.01346
Train [58][240/3239]	Time 0.233 (0.731)	Data Time 0.001 (0.272)	Loss 2.5532 (2.6752)	Entropy 0.62940 (0.62906)	Top-1 acc 61.328 (59.450)	Top-5 acc 83.984 (80.942)	lr 0.01346
Train [58][250/3239]	Time 0.237 (0.720)	Data Time 0.001 (0.262)	Loss 2.5536 (2.6740)	Entropy 0.62942 (0.62907)	Top-1 acc 63.281 (59.484)	Top-5 acc 81.250 (80.931)	lr 0.01346
Train [58][260/3239]	Time 4.761 (0.731)	Data Time 4.470 (0.272)	Loss 2.6521 (2.6755)	Entropy 0.62958 (0.62909)	Top-1 acc 60.547 (59.471)	Top-5 acc 82.031 (80.888)	lr 0.01345
Train [58][270/3239]	Time 0.400 (0.721)	Data Time 0.001 (0.262)	Loss 2.6147 (2.6758)	Entropy 0.62960 (0.62911)	Top-1 acc 61.719 (59.428)	Top-5 acc 82.031 (80.910)	lr 0.01345
Train [58][280/3239]	Time 0.232 (0.711)	Data Time 0.001 (0.253)	Loss 2.8282 (2.6752)	Entropy 0.62974 (0.62913)	Top-1 acc 57.812 (59.439)	Top-5 acc 80.078 (80.902)	lr 0.01345
Train [58][290/3239]	Time 0.240 (0.701)	Data Time 0.001 (0.244)	Loss 2.5397 (2.6731)	Entropy 0.63016 (0.62915)	Top-1 acc 62.891 (59.478)	Top-5 acc 83.984 (80.928)	lr 0.01345
Train [58][300/3239]	Time 0.262 (0.707)	Data Time 0.001 (0.249)	Loss 2.5649 (2.6744)	Entropy 0.63013 (0.62918)	Top-1 acc 63.672 (59.478)	Top-5 acc 84.375 (80.913)	lr 0.01345
Train [58][310/3239]	Time 0.293 (0.699)	Data Time 0.003 (0.242)	Loss 2.7428 (2.6768)	Entropy 0.63022 (0.62921)	Top-1 acc 56.641 (59.414)	Top-5 acc 79.688 (80.858)	lr 0.01345
Train [58][320/3239]	Time 0.228 (0.691)	Data Time 0.001 (0.234)	Loss 2.8327 (2.6755)	Entropy 0.63014 (0.62924)	Top-1 acc 50.391 (59.443)	Top-5 acc 77.734 (80.904)	lr 0.01345
Train [58][330/3239]	Time 0.226 (0.695)	Data Time 0.001 (0.238)	Loss 2.7095 (2.6747)	Entropy 0.63005 (0.62927)	Top-1 acc 57.812 (59.481)	Top-5 acc 82.422 (80.929)	lr 0.01345
Train [58][340/3239]	Time 0.323 (0.687)	Data Time 0.001 (0.231)	Loss 2.6375 (2.6750)	Entropy 0.62999 (0.62929)	Top-1 acc 58.984 (59.478)	Top-5 acc 80.078 (80.924)	lr 0.01345
Train [58][350/3239]	Time 0.243 (0.680)	Data Time 0.001 (0.224)	Loss 2.5016 (2.6733)	Entropy 0.63005 (0.62931)	Top-1 acc 64.453 (59.532)	Top-5 acc 83.203 (80.938)	lr 0.01345
Train [58][360/3239]	Time 0.239 (0.681)	Data Time 0.001 (0.226)	Loss 2.5811 (2.6731)	Entropy 0.62993 (0.62933)	Top-1 acc 63.672 (59.544)	Top-5 acc 83.203 (80.941)	lr 0.01344
Train [58][370/3239]	Time 0.239 (0.674)	Data Time 0.001 (0.220)	Loss 2.6184 (2.6749)	Entropy 0.62997 (0.62935)	Top-1 acc 62.500 (59.530)	Top-5 acc 83.594 (80.923)	lr 0.01344
Train [58][380/3239]	Time 0.253 (0.668)	Data Time 0.001 (0.215)	Loss 2.6123 (2.6737)	Entropy 0.62946 (0.62936)	Top-1 acc 58.984 (59.573)	Top-5 acc 82.422 (80.957)	lr 0.01344
Train [58][390/3239]	Time 0.263 (0.679)	Data Time 0.001 (0.225)	Loss 2.5816 (2.6742)	Entropy 0.62964 (0.62937)	Top-1 acc 61.328 (59.553)	Top-5 acc 84.766 (80.942)	lr 0.01344
Train [58][400/3239]	Time 0.285 (0.672)	Data Time 0.001 (0.220)	Loss 2.6800 (2.6730)	Entropy 0.62963 (0.62937)	Top-1 acc 60.156 (59.583)	Top-5 acc 80.859 (80.969)	lr 0.01344
Train [58][410/3239]	Time 0.249 (0.667)	Data Time 0.001 (0.215)	Loss 2.8748 (2.6740)	Entropy 0.62957 (0.62938)	Top-1 acc 52.344 (59.525)	Top-5 acc 77.734 (80.958)	lr 0.01344
Train [58][420/3239]	Time 1.000 (0.664)	Data Time 0.758 (0.211)	Loss 2.6596 (2.6753)	Entropy 0.62934 (0.62938)	Top-1 acc 61.719 (59.466)	Top-5 acc 78.906 (80.923)	lr 0.01344
Train [58][430/3239]	Time 0.254 (0.658)	Data Time 0.001 (0.206)	Loss 2.4236 (2.6751)	Entropy 0.62908 (0.62937)	Top-1 acc 64.844 (59.447)	Top-5 acc 83.203 (80.933)	lr 0.01344
Train [58][440/3239]	Time 0.266 (0.653)	Data Time 0.001 (0.202)	Loss 2.6587 (2.6762)	Entropy 0.62914 (0.62937)	Top-1 acc 62.109 (59.445)	Top-5 acc 81.641 (80.910)	lr 0.01344
Train [58][450/3239]	Time 0.294 (0.650)	Data Time 0.001 (0.199)	Loss 2.8584 (2.6762)	Entropy 0.62933 (0.62936)	Top-1 acc 54.297 (59.434)	Top-5 acc 75.391 (80.907)	lr 0.01344
Train [58][460/3239]	Time 0.250 (0.653)	Data Time 0.001 (0.203)	Loss 2.5913 (2.6766)	Entropy 0.62937 (0.62936)	Top-1 acc 60.938 (59.428)	Top-5 acc 83.594 (80.907)	lr 0.01343
Train [58][470/3239]	Time 0.357 (0.649)	Data Time 0.001 (0.199)	Loss 2.6294 (2.6757)	Entropy 0.62940 (0.62936)	Top-1 acc 61.328 (59.458)	Top-5 acc 82.031 (80.915)	lr 0.01343
Train [58][480/3239]	Time 0.234 (0.645)	Data Time 0.001 (0.195)	Loss 2.6240 (2.6757)	Entropy 0.62971 (0.62937)	Top-1 acc 62.109 (59.452)	Top-5 acc 82.031 (80.915)	lr 0.01343
Train [58][490/3239]	Time 0.251 (0.650)	Data Time 0.001 (0.200)	Loss 2.5591 (2.6747)	Entropy 0.62978 (0.62937)	Top-1 acc 63.672 (59.475)	Top-5 acc 83.203 (80.931)	lr 0.01343
Train [58][500/3239]	Time 0.403 (0.646)	Data Time 0.002 (0.196)	Loss 2.6409 (2.6736)	Entropy 0.62975 (0.62938)	Top-1 acc 60.938 (59.501)	Top-5 acc 82.422 (80.947)	lr 0.01343
Train [58][510/3239]	Time 0.299 (0.643)	Data Time 0.003 (0.192)	Loss 2.6272 (2.6739)	Entropy 0.62968 (0.62939)	Top-1 acc 56.641 (59.477)	Top-5 acc 81.641 (80.950)	lr 0.01343
Train [58][520/3239]	Time 0.275 (0.638)	Data Time 0.001 (0.189)	Loss 2.6532 (2.6731)	Entropy 0.62971 (0.62940)	Top-1 acc 59.766 (59.496)	Top-5 acc 80.859 (80.949)	lr 0.01343
Train [58][530/3239]	Time 0.244 (0.634)	Data Time 0.001 (0.185)	Loss 2.5477 (2.6717)	Entropy 0.62969 (0.62940)	Top-1 acc 65.625 (59.520)	Top-5 acc 82.812 (80.968)	lr 0.01343
Train [58][540/3239]	Time 0.308 (0.631)	Data Time 0.034 (0.182)	Loss 2.5608 (2.6725)	Entropy 0.62943 (0.62941)	Top-1 acc 60.547 (59.506)	Top-5 acc 82.812 (80.964)	lr 0.01343
Train [58][550/3239]	Time 0.270 (0.634)	Data Time 0.001 (0.185)	Loss 2.6668 (2.6722)	Entropy 0.62962 (0.62941)	Top-1 acc 56.641 (59.513)	Top-5 acc 81.641 (80.957)	lr 0.01343
Train [58][560/3239]	Time 0.241 (0.630)	Data Time 0.001 (0.182)	Loss 2.4980 (2.6714)	Entropy 0.62963 (0.62941)	Top-1 acc 65.625 (59.541)	Top-5 acc 82.812 (80.971)	lr 0.01342
Train [58][570/3239]	Time 0.403 (0.627)	Data Time 0.001 (0.179)	Loss 2.6385 (2.6722)	Entropy 0.62963 (0.62942)	Top-1 acc 61.328 (59.534)	Top-5 acc 83.203 (80.954)	lr 0.01342
Train [58][580/3239]	Time 1.121 (0.629)	Data Time 0.835 (0.181)	Loss 2.5323 (2.6725)	Entropy 0.62932 (0.62942)	Top-1 acc 62.500 (59.507)	Top-5 acc 84.375 (80.945)	lr 0.01342
Train [58][590/3239]	Time 0.249 (0.626)	Data Time 0.001 (0.178)	Loss 2.6138 (2.6728)	Entropy 0.62951 (0.62942)	Top-1 acc 63.281 (59.510)	Top-5 acc 80.078 (80.941)	lr 0.01342
Train [58][600/3239]	Time 0.250 (0.623)	Data Time 0.001 (0.175)	Loss 2.7159 (2.6724)	Entropy 0.62926 (0.62942)	Top-1 acc 60.938 (59.511)	Top-5 acc 79.297 (80.948)	lr 0.01342
Train [58][610/3239]	Time 0.236 (0.624)	Data Time 0.001 (0.177)	Loss 2.8583 (2.6726)	Entropy 0.62920 (0.62941)	Top-1 acc 54.688 (59.493)	Top-5 acc 78.516 (80.947)	lr 0.01342
Train [58][620/3239]	Time 0.237 (0.623)	Data Time 0.001 (0.175)	Loss 2.6508 (2.6722)	Entropy 0.62936 (0.62941)	Top-1 acc 60.156 (59.501)	Top-5 acc 82.422 (80.956)	lr 0.01342
Train [58][630/3239]	Time 0.225 (0.620)	Data Time 0.001 (0.172)	Loss 2.6328 (2.6731)	Entropy 0.62957 (0.62941)	Top-1 acc 58.594 (59.485)	Top-5 acc 82.422 (80.941)	lr 0.01342
Train [58][640/3239]	Time 1.013 (0.618)	Data Time 0.763 (0.171)	Loss 2.8008 (2.6727)	Entropy 0.63000 (0.62942)	Top-1 acc 54.297 (59.486)	Top-5 acc 80.469 (80.943)	lr 0.01342
Train [58][650/3239]	Time 0.247 (0.624)	Data Time 0.001 (0.177)	Loss 2.4916 (2.6723)	Entropy 0.62952 (0.62942)	Top-1 acc 60.938 (59.475)	Top-5 acc 86.328 (80.966)	lr 0.01342
Train [58][660/3239]	Time 0.347 (0.679)	Data Time 0.003 (0.174)	Loss 2.6558 (2.6719)	Entropy 0.62953 (0.62943)	Top-1 acc 58.594 (59.473)	Top-5 acc 82.812 (80.970)	lr 0.01341
Train [58][670/3239]	Time 0.246 (0.675)	Data Time 0.001 (0.172)	Loss 2.7334 (2.6726)	Entropy 0.62979 (0.62943)	Top-1 acc 57.422 (59.454)	Top-5 acc 80.078 (80.957)	lr 0.01341
Train [58][680/3239]	Time 0.255 (0.671)	Data Time 0.002 (0.169)	Loss 2.6010 (2.6727)	Entropy 0.62977 (0.62943)	Top-1 acc 62.891 (59.451)	Top-5 acc 83.984 (80.953)	lr 0.01341
Train [58][690/3239]	Time 0.235 (0.668)	Data Time 0.001 (0.167)	Loss 2.5077 (2.6723)	Entropy 0.62988 (0.62944)	Top-1 acc 65.625 (59.472)	Top-5 acc 83.594 (80.962)	lr 0.01341
Train [58][700/3239]	Time 0.233 (0.665)	Data Time 0.001 (0.164)	Loss 2.6779 (2.6724)	Entropy 0.62981 (0.62944)	Top-1 acc 58.203 (59.471)	Top-5 acc 80.078 (80.951)	lr 0.01341
Train [58][710/3239]	Time 0.300 (0.662)	Data Time 0.002 (0.162)	Loss 2.6477 (2.6731)	Entropy 0.62968 (0.62945)	Top-1 acc 57.031 (59.454)	Top-5 acc 83.203 (80.937)	lr 0.01341
Train [58][720/3239]	Time 0.229 (0.659)	Data Time 0.001 (0.160)	Loss 2.5553 (2.6729)	Entropy 0.62961 (0.62945)	Top-1 acc 62.500 (59.463)	Top-5 acc 79.688 (80.936)	lr 0.01341
Train [58][730/3239]	Time 0.439 (0.656)	Data Time 0.001 (0.158)	Loss 2.7425 (2.6727)	Entropy 0.62936 (0.62945)	Top-1 acc 58.203 (59.469)	Top-5 acc 82.812 (80.938)	lr 0.01341
Train [58][740/3239]	Time 0.290 (0.653)	Data Time 0.003 (0.156)	Loss 2.5684 (2.6737)	Entropy 0.62950 (0.62945)	Top-1 acc 65.625 (59.461)	Top-5 acc 83.594 (80.924)	lr 0.01341
Train [58][750/3239]	Time 0.244 (0.650)	Data Time 0.001 (0.154)	Loss 2.7481 (2.6742)	Entropy 0.62932 (0.62945)	Top-1 acc 58.984 (59.443)	Top-5 acc 76.172 (80.916)	lr 0.01341
Train [58][760/3239]	Time 0.243 (0.649)	Data Time 0.001 (0.153)	Loss 2.7658 (2.6739)	Entropy 0.62939 (0.62945)	Top-1 acc 55.469 (59.440)	Top-5 acc 80.469 (80.920)	lr 0.01340
Train [58][770/3239]	Time 0.281 (0.647)	Data Time 0.001 (0.151)	Loss 2.6007 (2.6750)	Entropy 0.62928 (0.62945)	Top-1 acc 58.984 (59.421)	Top-5 acc 81.641 (80.889)	lr 0.01340
Train [58][780/3239]	Time 0.252 (0.648)	Data Time 0.002 (0.153)	Loss 2.6581 (2.6748)	Entropy 0.62951 (0.62945)	Top-1 acc 58.984 (59.433)	Top-5 acc 82.031 (80.890)	lr 0.01340
Train [58][790/3239]	Time 0.269 (0.652)	Data Time 0.001 (0.158)	Loss 2.7827 (2.6755)	Entropy 0.62939 (0.62945)	Top-1 acc 50.781 (59.410)	Top-5 acc 77.734 (80.873)	lr 0.01340
Train [58][800/3239]	Time 0.239 (0.649)	Data Time 0.001 (0.156)	Loss 2.7379 (2.6757)	Entropy 0.62907 (0.62945)	Top-1 acc 58.203 (59.421)	Top-5 acc 80.469 (80.861)	lr 0.01340
Train [58][810/3239]	Time 0.242 (0.647)	Data Time 0.001 (0.154)	Loss 2.6928 (2.6751)	Entropy 0.62903 (0.62944)	Top-1 acc 61.328 (59.445)	Top-5 acc 80.859 (80.872)	lr 0.01340
Train [58][820/3239]	Time 0.403 (0.657)	Data Time 0.002 (0.164)	Loss 2.8576 (2.6754)	Entropy 0.62869 (0.62944)	Top-1 acc 57.031 (59.438)	Top-5 acc 78.125 (80.861)	lr 0.01340
Train [58][830/3239]	Time 0.234 (0.654)	Data Time 0.001 (0.162)	Loss 2.5365 (2.6751)	Entropy 0.62866 (0.62943)	Top-1 acc 61.719 (59.439)	Top-5 acc 83.594 (80.870)	lr 0.01340
Train [58][840/3239]	Time 0.263 (0.651)	Data Time 0.001 (0.160)	Loss 2.6817 (2.6748)	Entropy 0.62838 (0.62942)	Top-1 acc 60.547 (59.436)	Top-5 acc 80.469 (80.877)	lr 0.01340
Train [58][850/3239]	Time 0.255 (0.658)	Data Time 0.001 (0.167)	Loss 2.7554 (2.6749)	Entropy 0.62839 (0.62941)	Top-1 acc 56.250 (59.430)	Top-5 acc 79.688 (80.875)	lr 0.01340
Train [58][860/3239]	Time 0.237 (0.655)	Data Time 0.001 (0.165)	Loss 2.7973 (2.6749)	Entropy 0.62835 (0.62939)	Top-1 acc 57.422 (59.427)	Top-5 acc 78.125 (80.878)	lr 0.01339
Train [58][870/3239]	Time 0.271 (0.654)	Data Time 0.001 (0.164)	Loss 2.8344 (2.6756)	Entropy 0.62837 (0.62938)	Top-1 acc 58.594 (59.419)	Top-5 acc 76.562 (80.864)	lr 0.01339
Train [58][880/3239]	Time 3.268 (0.655)	Data Time 3.020 (0.166)	Loss 2.7770 (2.6754)	Entropy 0.62825 (0.62937)	Top-1 acc 60.547 (59.431)	Top-5 acc 82.422 (80.861)	lr 0.01339
Train [58][890/3239]	Time 0.354 (0.656)	Data Time 0.002 (0.168)	Loss 2.7286 (2.6747)	Entropy 0.62807 (0.62936)	Top-1 acc 58.594 (59.435)	Top-5 acc 79.688 (80.873)	lr 0.01339
Train [58][900/3239]	Time 0.234 (0.654)	Data Time 0.001 (0.166)	Loss 2.8153 (2.6746)	Entropy 0.62805 (0.62934)	Top-1 acc 55.859 (59.437)	Top-5 acc 78.125 (80.867)	lr 0.01339
Train [58][910/3239]	Time 0.230 (0.654)	Data Time 0.001 (0.168)	Loss 2.5749 (2.6737)	Entropy 0.62813 (0.62933)	Top-1 acc 60.547 (59.458)	Top-5 acc 83.984 (80.887)	lr 0.01339
Train [58][920/3239]	Time 0.228 (0.658)	Data Time 0.001 (0.172)	Loss 2.7215 (2.6738)	Entropy 0.62797 (0.62931)	Top-1 acc 60.938 (59.464)	Top-5 acc 78.906 (80.884)	lr 0.01339
Train [58][930/3239]	Time 0.237 (0.658)	Data Time 0.001 (0.172)	Loss 2.8608 (2.6748)	Entropy 0.62821 (0.62930)	Top-1 acc 56.250 (59.451)	Top-5 acc 76.172 (80.867)	lr 0.01339
Train [58][940/3239]	Time 0.258 (0.656)	Data Time 0.001 (0.170)	Loss 2.6701 (2.6750)	Entropy 0.62823 (0.62929)	Top-1 acc 60.547 (59.442)	Top-5 acc 79.688 (80.862)	lr 0.01339
Train [58][950/3239]	Time 0.240 (0.658)	Data Time 0.003 (0.173)	Loss 2.7554 (2.6749)	Entropy 0.62765 (0.62928)	Top-1 acc 58.594 (59.453)	Top-5 acc 80.078 (80.861)	lr 0.01339
Train [58][960/3239]	Time 0.231 (0.659)	Data Time 0.001 (0.175)	Loss 2.4880 (2.6746)	Entropy 0.62776 (0.62926)	Top-1 acc 62.500 (59.462)	Top-5 acc 86.328 (80.874)	lr 0.01338
Train [58][970/3239]	Time 0.239 (0.658)	Data Time 0.001 (0.174)	Loss 2.6015 (2.6749)	Entropy 0.62741 (0.62924)	Top-1 acc 59.375 (59.455)	Top-5 acc 82.031 (80.869)	lr 0.01338
Train [58][980/3239]	Time 0.261 (0.660)	Data Time 0.001 (0.177)	Loss 2.5511 (2.6746)	Entropy 0.62781 (0.62923)	Top-1 acc 58.984 (59.457)	Top-5 acc 83.594 (80.870)	lr 0.01338
Train [58][990/3239]	Time 0.244 (0.662)	Data Time 0.001 (0.179)	Loss 2.6093 (2.6744)	Entropy 0.62779 (0.62921)	Top-1 acc 59.766 (59.449)	Top-5 acc 82.422 (80.870)	lr 0.01338
Train [58][1000/3239]	Time 0.250 (0.660)	Data Time 0.001 (0.178)	Loss 2.8211 (2.6747)	Entropy 0.62770 (0.62919)	Top-1 acc 55.859 (59.451)	Top-5 acc 75.391 (80.866)	lr 0.01338
Train [58][1010/3239]	Time 0.281 (0.660)	Data Time 0.001 (0.178)	Loss 2.8913 (2.6748)	Entropy 0.62778 (0.62918)	Top-1 acc 53.906 (59.438)	Top-5 acc 76.172 (80.868)	lr 0.01338
Train [58][1020/3239]	Time 0.253 (0.670)	Data Time 0.002 (0.188)	Loss 2.5954 (2.6743)	Entropy 0.62780 (0.62917)	Top-1 acc 66.406 (59.460)	Top-5 acc 81.250 (80.880)	lr 0.01338
Train [58][1030/3239]	Time 0.223 (0.668)	Data Time 0.001 (0.187)	Loss 2.8783 (2.6750)	Entropy 0.62794 (0.62915)	Top-1 acc 55.078 (59.427)	Top-5 acc 77.344 (80.868)	lr 0.01338
Train [58][1040/3239]	Time 0.257 (0.665)	Data Time 0.001 (0.185)	Loss 2.6477 (2.6747)	Entropy 0.62797 (0.62914)	Top-1 acc 57.422 (59.443)	Top-5 acc 80.078 (80.873)	lr 0.01338
Train [58][1050/3239]	Time 0.335 (0.663)	Data Time 0.001 (0.183)	Loss 2.5851 (2.6745)	Entropy 0.62808 (0.62913)	Top-1 acc 61.328 (59.450)	Top-5 acc 82.031 (80.876)	lr 0.01337
Train [58][1060/3239]	Time 0.232 (0.670)	Data Time 0.001 (0.191)	Loss 2.9148 (2.6742)	Entropy 0.62794 (0.62912)	Top-1 acc 53.906 (59.461)	Top-5 acc 75.391 (80.880)	lr 0.01337
Train [58][1070/3239]	Time 0.224 (0.667)	Data Time 0.001 (0.189)	Loss 2.8699 (2.6742)	Entropy 0.62822 (0.62911)	Top-1 acc 55.469 (59.467)	Top-5 acc 78.906 (80.883)	lr 0.01337
Train [58][1080/3239]	Time 0.241 (0.667)	Data Time 0.001 (0.189)	Loss 2.6749 (2.6740)	Entropy 0.62825 (0.62910)	Top-1 acc 58.203 (59.475)	Top-5 acc 80.469 (80.884)	lr 0.01337
Train [58][1090/3239]	Time 0.247 (0.673)	Data Time 0.001 (0.195)	Loss 2.6889 (2.6741)	Entropy 0.62824 (0.62909)	Top-1 acc 58.594 (59.472)	Top-5 acc 80.078 (80.887)	lr 0.01337
Train [58][1100/3239]	Time 0.276 (0.670)	Data Time 0.001 (0.193)	Loss 2.6757 (2.6746)	Entropy 0.62818 (0.62909)	Top-1 acc 58.594 (59.458)	Top-5 acc 80.469 (80.877)	lr 0.01337
Train [58][1110/3239]	Time 0.253 (0.672)	Data Time 0.001 (0.195)	Loss 2.6823 (2.6747)	Entropy 0.62826 (0.62908)	Top-1 acc 59.375 (59.451)	Top-5 acc 80.859 (80.877)	lr 0.01337
Train [58][1120/3239]	Time 0.380 (0.675)	Data Time 0.001 (0.198)	Loss 2.5904 (2.6748)	Entropy 0.62825 (0.62907)	Top-1 acc 60.938 (59.458)	Top-5 acc 82.812 (80.876)	lr 0.01337
Train [58][1130/3239]	Time 0.237 (0.672)	Data Time 0.001 (0.197)	Loss 2.5655 (2.6743)	Entropy 0.62794 (0.62906)	Top-1 acc 64.844 (59.474)	Top-5 acc 81.641 (80.883)	lr 0.01337
Train [58][1140/3239]	Time 0.239 (0.673)	Data Time 0.001 (0.198)	Loss 2.5772 (2.6740)	Entropy 0.62800 (0.62905)	Top-1 acc 63.281 (59.481)	Top-5 acc 83.984 (80.892)	lr 0.01337
Train [58][1150/3239]	Time 0.226 (0.681)	Data Time 0.001 (0.206)	Loss 2.6382 (2.6748)	Entropy 0.62790 (0.62905)	Top-1 acc 61.328 (59.465)	Top-5 acc 80.078 (80.875)	lr 0.01336
Train [58][1160/3239]	Time 0.258 (0.679)	Data Time 0.001 (0.205)	Loss 2.6058 (2.6749)	Entropy 0.62740 (0.62903)	Top-1 acc 60.156 (59.462)	Top-5 acc 80.078 (80.869)	lr 0.01336
Train [58][1170/3239]	Time 0.249 (0.677)	Data Time 0.001 (0.203)	Loss 2.6277 (2.6744)	Entropy 0.62759 (0.62902)	Top-1 acc 59.766 (59.472)	Top-5 acc 80.859 (80.875)	lr 0.01336
Train [58][1180/3239]	Time 0.230 (0.686)	Data Time 0.001 (0.213)	Loss 2.7182 (2.6743)	Entropy 0.62746 (0.62901)	Top-1 acc 55.859 (59.476)	Top-5 acc 79.688 (80.879)	lr 0.01336
Train [58][1190/3239]	Time 0.298 (0.684)	Data Time 0.001 (0.211)	Loss 2.7608 (2.6745)	Entropy 0.62750 (0.62900)	Top-1 acc 56.641 (59.470)	Top-5 acc 77.344 (80.874)	lr 0.01336
Train [58][1200/3239]	Time 0.245 (0.682)	Data Time 0.001 (0.210)	Loss 2.7642 (2.6748)	Entropy 0.62733 (0.62898)	Top-1 acc 57.031 (59.464)	Top-5 acc 78.906 (80.867)	lr 0.01336
Train [58][1210/3239]	Time 0.411 (0.681)	Data Time 0.002 (0.209)	Loss 2.5004 (2.6746)	Entropy 0.62728 (0.62897)	Top-1 acc 63.281 (59.476)	Top-5 acc 83.203 (80.872)	lr 0.01336
Train [58][1220/3239]	Time 0.251 (0.688)	Data Time 0.001 (0.217)	Loss 2.8345 (2.6749)	Entropy 0.62748 (0.62895)	Top-1 acc 52.734 (59.462)	Top-5 acc 76.562 (80.865)	lr 0.01336
Train [58][1230/3239]	Time 0.229 (0.686)	Data Time 0.001 (0.215)	Loss 2.6309 (2.6742)	Entropy 0.62754 (0.62894)	Top-1 acc 62.891 (59.479)	Top-5 acc 82.031 (80.874)	lr 0.01336
Train [58][1240/3239]	Time 0.249 (0.686)	Data Time 0.001 (0.215)	Loss 2.6395 (2.6740)	Entropy 0.62692 (0.62893)	Top-1 acc 62.891 (59.498)	Top-5 acc 83.984 (80.881)	lr 0.01336
Train [58][1250/3239]	Time 0.233 (0.695)	Data Time 0.001 (0.225)	Loss 2.8636 (2.6746)	Entropy 0.62677 (0.62891)	Top-1 acc 52.734 (59.486)	Top-5 acc 79.297 (80.867)	lr 0.01335
Train [58][1260/3239]	Time 0.224 (0.692)	Data Time 0.001 (0.223)	Loss 2.5243 (2.6744)	Entropy 0.62723 (0.62890)	Top-1 acc 60.938 (59.491)	Top-5 acc 84.766 (80.876)	lr 0.01335
Train [58][1270/3239]	Time 0.264 (0.692)	Data Time 0.001 (0.222)	Loss 2.5498 (2.6745)	Entropy 0.62758 (0.62889)	Top-1 acc 62.109 (59.485)	Top-5 acc 84.375 (80.877)	lr 0.01335
Train [58][1280/3239]	Time 0.327 (0.699)	Data Time 0.001 (0.231)	Loss 2.3994 (2.6745)	Entropy 0.62774 (0.62888)	Top-1 acc 63.672 (59.476)	Top-5 acc 86.328 (80.876)	lr 0.01335
Train [58][1290/3239]	Time 0.236 (0.697)	Data Time 0.001 (0.229)	Loss 2.6851 (2.6740)	Entropy 0.62771 (0.62887)	Top-1 acc 58.203 (59.488)	Top-5 acc 79.297 (80.883)	lr 0.01335
Train [58][1300/3239]	Time 0.260 (0.700)	Data Time 0.001 (0.232)	Loss 2.6910 (2.6744)	Entropy 0.62786 (0.62886)	Top-1 acc 56.250 (59.470)	Top-5 acc 80.859 (80.875)	lr 0.01335
Train [58][1310/3239]	Time 0.359 (0.731)	Data Time 0.004 (0.237)	Loss 2.7891 (2.6747)	Entropy 0.62758 (0.62885)	Top-1 acc 57.812 (59.464)	Top-5 acc 76.562 (80.864)	lr 0.01335
Train [58][1320/3239]	Time 0.258 (0.729)	Data Time 0.002 (0.235)	Loss 2.5494 (2.6749)	Entropy 0.62764 (0.62884)	Top-1 acc 64.062 (59.462)	Top-5 acc 83.984 (80.858)	lr 0.01335
Train [58][1330/3239]	Time 0.250 (0.727)	Data Time 0.001 (0.234)	Loss 2.6000 (2.6748)	Entropy 0.62784 (0.62883)	Top-1 acc 60.156 (59.465)	Top-5 acc 81.250 (80.859)	lr 0.01335
Train [58][1340/3239]	Time 0.256 (0.725)	Data Time 0.002 (0.232)	Loss 2.8866 (2.6748)	Entropy 0.62808 (0.62882)	Top-1 acc 53.516 (59.468)	Top-5 acc 75.781 (80.855)	lr 0.01335
Train [58][1350/3239]	Time 0.227 (0.722)	Data Time 0.001 (0.230)	Loss 2.8739 (2.6750)	Entropy 0.62832 (0.62882)	Top-1 acc 55.469 (59.455)	Top-5 acc 76.562 (80.851)	lr 0.01334
Train [58][1360/3239]	Time 0.252 (0.720)	Data Time 0.001 (0.228)	Loss 2.7512 (2.6751)	Entropy 0.62804 (0.62881)	Top-1 acc 60.938 (59.456)	Top-5 acc 78.516 (80.852)	lr 0.01334
Train [58][1370/3239]	Time 0.324 (0.718)	Data Time 0.001 (0.227)	Loss 2.8186 (2.6744)	Entropy 0.62830 (0.62881)	Top-1 acc 59.766 (59.473)	Top-5 acc 77.344 (80.865)	lr 0.01334
Train [58][1380/3239]	Time 0.228 (0.717)	Data Time 0.001 (0.227)	Loss 2.5455 (2.6748)	Entropy 0.62789 (0.62880)	Top-1 acc 63.672 (59.473)	Top-5 acc 82.422 (80.855)	lr 0.01334
Train [58][1390/3239]	Time 0.260 (0.719)	Data Time 0.001 (0.229)	Loss 2.6144 (2.6749)	Entropy 0.62791 (0.62880)	Top-1 acc 62.500 (59.468)	Top-5 acc 80.469 (80.851)	lr 0.01334
Train [58][1400/3239]	Time 0.244 (0.717)	Data Time 0.001 (0.227)	Loss 2.5790 (2.6749)	Entropy 0.62785 (0.62879)	Top-1 acc 62.500 (59.468)	Top-5 acc 83.594 (80.853)	lr 0.01334
Train [58][1410/3239]	Time 3.607 (0.725)	Data Time 3.325 (0.235)	Loss 2.7182 (2.6747)	Entropy 0.62786 (0.62878)	Top-1 acc 60.938 (59.474)	Top-5 acc 79.297 (80.856)	lr 0.01334
Train [58][1420/3239]	Time 0.231 (0.723)	Data Time 0.001 (0.234)	Loss 2.6487 (2.6739)	Entropy 0.62767 (0.62878)	Top-1 acc 59.766 (59.490)	Top-5 acc 80.859 (80.870)	lr 0.01334
Train [58][1430/3239]	Time 0.224 (0.724)	Data Time 0.001 (0.236)	Loss 2.5635 (2.6736)	Entropy 0.62781 (0.62877)	Top-1 acc 60.938 (59.497)	Top-5 acc 83.594 (80.872)	lr 0.01334
Train [58][1440/3239]	Time 0.327 (0.727)	Data Time 0.001 (0.239)	Loss 2.6059 (2.6733)	Entropy 0.62777 (0.62876)	Top-1 acc 62.500 (59.502)	Top-5 acc 82.422 (80.876)	lr 0.01334
Train [58][1450/3239]	Time 0.242 (0.730)	Data Time 0.001 (0.243)	Loss 2.8243 (2.6734)	Entropy 0.62769 (0.62876)	Top-1 acc 55.469 (59.496)	Top-5 acc 75.781 (80.871)	lr 0.01333
Train [58][1460/3239]	Time 0.245 (0.729)	Data Time 0.001 (0.242)	Loss 2.7910 (2.6734)	Entropy 0.62814 (0.62875)	Top-1 acc 54.688 (59.497)	Top-5 acc 78.906 (80.874)	lr 0.01333
Train [58][1470/3239]	Time 2.407 (0.734)	Data Time 2.162 (0.247)	Loss 2.5820 (2.6736)	Entropy 0.62822 (0.62875)	Top-1 acc 62.500 (59.492)	Top-5 acc 81.641 (80.873)	lr 0.01333
Train [58][1480/3239]	Time 0.248 (0.736)	Data Time 0.001 (0.250)	Loss 2.6908 (2.6740)	Entropy 0.62810 (0.62874)	Top-1 acc 59.375 (59.485)	Top-5 acc 82.812 (80.867)	lr 0.01333
Train [58][1490/3239]	Time 0.240 (0.737)	Data Time 0.001 (0.251)	Loss 2.6057 (2.6739)	Entropy 0.62809 (0.62874)	Top-1 acc 58.594 (59.477)	Top-5 acc 81.250 (80.867)	lr 0.01333
Train [58][1500/3239]	Time 1.191 (0.736)	Data Time 0.930 (0.250)	Loss 2.8769 (2.6743)	Entropy 0.62842 (0.62873)	Top-1 acc 55.078 (59.468)	Top-5 acc 76.172 (80.855)	lr 0.01333
Train [58][1510/3239]	Time 0.230 (0.740)	Data Time 0.001 (0.254)	Loss 2.5668 (2.6745)	Entropy 0.62823 (0.62873)	Top-1 acc 60.156 (59.464)	Top-5 acc 82.031 (80.851)	lr 0.01333
Train [58][1520/3239]	Time 0.268 (0.740)	Data Time 0.001 (0.255)	Loss 2.5674 (2.6741)	Entropy 0.62862 (0.62873)	Top-1 acc 59.766 (59.470)	Top-5 acc 81.641 (80.858)	lr 0.01333
Train [58][1530/3239]	Time 0.340 (0.738)	Data Time 0.001 (0.253)	Loss 2.5475 (2.6740)	Entropy 0.62897 (0.62873)	Top-1 acc 64.453 (59.474)	Top-5 acc 82.422 (80.860)	lr 0.01333
Train [58][1540/3239]	Time 0.262 (0.743)	Data Time 0.001 (0.258)	Loss 3.0141 (2.6746)	Entropy 0.62865 (0.62873)	Top-1 acc 53.906 (59.459)	Top-5 acc 77.734 (80.854)	lr 0.01333
Train [58][1550/3239]	Time 0.243 (0.741)	Data Time 0.001 (0.257)	Loss 2.8635 (2.6751)	Entropy 0.62884 (0.62873)	Top-1 acc 55.859 (59.444)	Top-5 acc 79.688 (80.849)	lr 0.01332
Train [58][1560/3239]	Time 0.245 (0.740)	Data Time 0.001 (0.256)	Loss 2.8547 (2.6753)	Entropy 0.62869 (0.62873)	Top-1 acc 53.906 (59.433)	Top-5 acc 76.172 (80.848)	lr 0.01332
Train [58][1570/3239]	Time 0.236 (0.743)	Data Time 0.001 (0.260)	Loss 2.6695 (2.6750)	Entropy 0.62873 (0.62873)	Top-1 acc 64.062 (59.444)	Top-5 acc 79.688 (80.853)	lr 0.01332
Train [58][1580/3239]	Time 0.245 (0.742)	Data Time 0.001 (0.258)	Loss 2.6053 (2.6752)	Entropy 0.62866 (0.62873)	Top-1 acc 60.547 (59.437)	Top-5 acc 84.766 (80.855)	lr 0.01332
Train [58][1590/3239]	Time 0.240 (0.740)	Data Time 0.001 (0.257)	Loss 2.6231 (2.6751)	Entropy 0.62860 (0.62873)	Top-1 acc 62.500 (59.438)	Top-5 acc 80.469 (80.858)	lr 0.01332
Train [58][1600/3239]	Time 0.381 (0.746)	Data Time 0.002 (0.264)	Loss 2.8733 (2.6751)	Entropy 0.62855 (0.62873)	Top-1 acc 52.734 (59.438)	Top-5 acc 76.172 (80.856)	lr 0.01332
Train [58][1610/3239]	Time 0.264 (0.746)	Data Time 0.001 (0.264)	Loss 2.6155 (2.6754)	Entropy 0.62826 (0.62873)	Top-1 acc 56.641 (59.429)	Top-5 acc 81.250 (80.850)	lr 0.01332
Train [58][1620/3239]	Time 0.242 (0.745)	Data Time 0.002 (0.263)	Loss 2.5095 (2.6750)	Entropy 0.62832 (0.62872)	Top-1 acc 67.188 (59.442)	Top-5 acc 83.984 (80.854)	lr 0.01332
Train [58][1630/3239]	Time 10.588 (0.750)	Data Time 10.329 (0.269)	Loss 2.7740 (2.6753)	Entropy 0.62827 (0.62872)	Top-1 acc 55.859 (59.431)	Top-5 acc 79.297 (80.851)	lr 0.01332
Train [58][1640/3239]	Time 0.278 (0.752)	Data Time 0.002 (0.271)	Loss 2.4836 (2.6754)	Entropy 0.62827 (0.62872)	Top-1 acc 65.234 (59.427)	Top-5 acc 83.203 (80.851)	lr 0.01332
Train [58][1650/3239]	Time 0.249 (0.751)	Data Time 0.001 (0.271)	Loss 2.6755 (2.6755)	Entropy 0.62883 (0.62872)	Top-1 acc 60.547 (59.428)	Top-5 acc 78.125 (80.849)	lr 0.01331
Train [58][1660/3239]	Time 0.237 (0.749)	Data Time 0.001 (0.269)	Loss 2.5263 (2.6754)	Entropy 0.62882 (0.62872)	Top-1 acc 65.625 (59.437)	Top-5 acc 85.938 (80.853)	lr 0.01331
Train [58][1670/3239]	Time 0.244 (0.755)	Data Time 0.001 (0.275)	Loss 2.4718 (2.6755)	Entropy 0.62864 (0.62872)	Top-1 acc 66.797 (59.439)	Top-5 acc 83.203 (80.848)	lr 0.01331
Train [58][1680/3239]	Time 0.242 (0.753)	Data Time 0.001 (0.273)	Loss 2.9337 (2.6758)	Entropy 0.62839 (0.62872)	Top-1 acc 52.344 (59.433)	Top-5 acc 78.125 (80.842)	lr 0.01331
Train [58][1690/3239]	Time 0.237 (0.751)	Data Time 0.001 (0.272)	Loss 2.6708 (2.6761)	Entropy 0.62800 (0.62872)	Top-1 acc 58.984 (59.428)	Top-5 acc 80.078 (80.838)	lr 0.01331
Train [58][1700/3239]	Time 0.247 (0.760)	Data Time 0.001 (0.281)	Loss 2.5889 (2.6759)	Entropy 0.62798 (0.62871)	Top-1 acc 58.594 (59.433)	Top-5 acc 83.203 (80.840)	lr 0.01331
Train [58][1710/3239]	Time 0.236 (0.758)	Data Time 0.001 (0.279)	Loss 2.6726 (2.6759)	Entropy 0.62812 (0.62871)	Top-1 acc 57.422 (59.427)	Top-5 acc 78.125 (80.834)	lr 0.01331
Train [58][1720/3239]	Time 0.237 (0.758)	Data Time 0.001 (0.279)	Loss 2.5041 (2.6757)	Entropy 0.62830 (0.62870)	Top-1 acc 64.453 (59.427)	Top-5 acc 83.984 (80.837)	lr 0.01331
Train [58][1730/3239]	Time 0.241 (0.765)	Data Time 0.001 (0.287)	Loss 2.4457 (2.6756)	Entropy 0.62813 (0.62870)	Top-1 acc 63.281 (59.432)	Top-5 acc 83.203 (80.840)	lr 0.01331
Train [58][1740/3239]	Time 0.239 (0.764)	Data Time 0.001 (0.286)	Loss 2.7112 (2.6755)	Entropy 0.62823 (0.62870)	Top-1 acc 60.156 (59.432)	Top-5 acc 82.031 (80.848)	lr 0.01331
Train [58][1750/3239]	Time 0.231 (0.762)	Data Time 0.001 (0.284)	Loss 2.5716 (2.6755)	Entropy 0.62820 (0.62869)	Top-1 acc 60.938 (59.429)	Top-5 acc 84.375 (80.848)	lr 0.01330
Train [58][1760/3239]	Time 0.353 (0.764)	Data Time 0.001 (0.287)	Loss 2.7745 (2.6754)	Entropy 0.62822 (0.62869)	Top-1 acc 57.812 (59.430)	Top-5 acc 79.297 (80.848)	lr 0.01330
Train [58][1770/3239]	Time 0.242 (0.763)	Data Time 0.001 (0.286)	Loss 2.3904 (2.6753)	Entropy 0.62826 (0.62869)	Top-1 acc 64.844 (59.431)	Top-5 acc 86.328 (80.852)	lr 0.01330
Train [58][1780/3239]	Time 0.238 (0.761)	Data Time 0.001 (0.285)	Loss 2.5272 (2.6754)	Entropy 0.62813 (0.62869)	Top-1 acc 63.672 (59.432)	Top-5 acc 82.812 (80.850)	lr 0.01330
Train [58][1790/3239]	Time 2.742 (0.761)	Data Time 2.486 (0.284)	Loss 2.5184 (2.6751)	Entropy 0.62792 (0.62868)	Top-1 acc 64.844 (59.440)	Top-5 acc 83.203 (80.857)	lr 0.01330
Train [58][1800/3239]	Time 0.242 (0.762)	Data Time 0.001 (0.286)	Loss 2.5846 (2.6755)	Entropy 0.62811 (0.62868)	Top-1 acc 64.453 (59.428)	Top-5 acc 83.203 (80.849)	lr 0.01330
Train [58][1810/3239]	Time 0.246 (0.761)	Data Time 0.001 (0.284)	Loss 2.7856 (2.6757)	Entropy 0.62744 (0.62867)	Top-1 acc 52.734 (59.424)	Top-5 acc 80.078 (80.845)	lr 0.01330
Train [58][1820/3239]	Time 0.245 (0.759)	Data Time 0.001 (0.283)	Loss 2.6398 (2.6760)	Entropy 0.62720 (0.62867)	Top-1 acc 57.031 (59.422)	Top-5 acc 82.031 (80.837)	lr 0.01330
Train [58][1830/3239]	Time 0.337 (0.761)	Data Time 0.001 (0.285)	Loss 2.6374 (2.6761)	Entropy 0.62726 (0.62866)	Top-1 acc 60.156 (59.411)	Top-5 acc 85.938 (80.836)	lr 0.01330
Train [58][1840/3239]	Time 0.239 (0.759)	Data Time 0.001 (0.283)	Loss 2.5189 (2.6759)	Entropy 0.62775 (0.62865)	Top-1 acc 64.062 (59.417)	Top-5 acc 85.547 (80.838)	lr 0.01330
Train [58][1850/3239]	Time 0.240 (0.757)	Data Time 0.001 (0.282)	Loss 2.8267 (2.6761)	Entropy 0.62734 (0.62865)	Top-1 acc 59.766 (59.416)	Top-5 acc 78.906 (80.840)	lr 0.01329
Train [58][1860/3239]	Time 0.245 (0.760)	Data Time 0.001 (0.285)	Loss 2.6513 (2.6760)	Entropy 0.62740 (0.62864)	Top-1 acc 62.109 (59.416)	Top-5 acc 81.250 (80.837)	lr 0.01329
Train [58][1870/3239]	Time 0.237 (0.758)	Data Time 0.001 (0.283)	Loss 2.6478 (2.6759)	Entropy 0.62762 (0.62863)	Top-1 acc 58.984 (59.414)	Top-5 acc 81.250 (80.841)	lr 0.01329
Train [58][1880/3239]	Time 0.232 (0.756)	Data Time 0.001 (0.282)	Loss 2.7662 (2.6759)	Entropy 0.62711 (0.62863)	Top-1 acc 55.078 (59.409)	Top-5 acc 79.297 (80.838)	lr 0.01329
Train [58][1890/3239]	Time 0.233 (0.759)	Data Time 0.001 (0.285)	Loss 2.7834 (2.6758)	Entropy 0.62700 (0.62862)	Top-1 acc 56.250 (59.413)	Top-5 acc 76.562 (80.841)	lr 0.01329
Train [58][1900/3239]	Time 0.249 (0.757)	Data Time 0.001 (0.283)	Loss 2.9228 (2.6760)	Entropy 0.62694 (0.62861)	Top-1 acc 53.906 (59.408)	Top-5 acc 75.781 (80.835)	lr 0.01329
Train [58][1910/3239]	Time 0.279 (0.755)	Data Time 0.001 (0.282)	Loss 2.6573 (2.6761)	Entropy 0.62713 (0.62860)	Top-1 acc 57.422 (59.401)	Top-5 acc 81.641 (80.835)	lr 0.01329
Train [58][1920/3239]	Time 0.378 (0.761)	Data Time 0.002 (0.287)	Loss 2.5414 (2.6761)	Entropy 0.62735 (0.62859)	Top-1 acc 61.719 (59.404)	Top-5 acc 86.328 (80.836)	lr 0.01329
Train [58][1930/3239]	Time 0.236 (0.759)	Data Time 0.001 (0.286)	Loss 2.6251 (2.6766)	Entropy 0.62783 (0.62859)	Top-1 acc 60.547 (59.395)	Top-5 acc 82.031 (80.822)	lr 0.01329
Train [58][1940/3239]	Time 0.243 (0.759)	Data Time 0.001 (0.286)	Loss 2.7127 (2.6766)	Entropy 0.62793 (0.62858)	Top-1 acc 60.547 (59.399)	Top-5 acc 80.859 (80.820)	lr 0.01329
Train [58][1950/3239]	Time 1.265 (0.757)	Data Time 1.025 (0.285)	Loss 2.7979 (2.6767)	Entropy 0.62769 (0.62858)	Top-1 acc 57.031 (59.391)	Top-5 acc 77.734 (80.823)	lr 0.01328
Train [58][1960/3239]	Time 0.222 (0.766)	Data Time 0.001 (0.294)	Loss 2.5851 (2.6764)	Entropy 0.62739 (0.62858)	Top-1 acc 57.422 (59.404)	Top-5 acc 82.422 (80.830)	lr 0.01328
Train [58][1970/3239]	Time 0.314 (0.781)	Data Time 0.027 (0.293)	Loss 2.8291 (2.6767)	Entropy 0.62721 (0.62857)	Top-1 acc 53.125 (59.398)	Top-5 acc 76.953 (80.825)	lr 0.01328
Train [58][1980/3239]	Time 0.247 (0.780)	Data Time 0.002 (0.292)	Loss 2.7995 (2.6769)	Entropy 0.62718 (0.62856)	Top-1 acc 56.250 (59.393)	Top-5 acc 80.859 (80.826)	lr 0.01328
Train [58][1990/3239]	Time 0.383 (0.778)	Data Time 0.001 (0.290)	Loss 2.5832 (2.6768)	Entropy 0.62696 (0.62855)	Top-1 acc 59.375 (59.397)	Top-5 acc 83.203 (80.828)	lr 0.01328
Train [58][2000/3239]	Time 0.244 (0.776)	Data Time 0.001 (0.289)	Loss 2.6041 (2.6765)	Entropy 0.62674 (0.62855)	Top-1 acc 59.766 (59.402)	Top-5 acc 80.078 (80.829)	lr 0.01328
Train [58][2010/3239]	Time 0.236 (0.774)	Data Time 0.001 (0.287)	Loss 2.4860 (2.6766)	Entropy 0.62706 (0.62854)	Top-1 acc 64.453 (59.396)	Top-5 acc 83.203 (80.825)	lr 0.01328
Train [58][2020/3239]	Time 0.321 (0.780)	Data Time 0.001 (0.293)	Loss 2.6944 (2.6765)	Entropy 0.62702 (0.62853)	Top-1 acc 57.031 (59.394)	Top-5 acc 80.859 (80.827)	lr 0.01328
Train [58][2030/3239]	Time 0.244 (0.778)	Data Time 0.001 (0.291)	Loss 2.7215 (2.6769)	Entropy 0.62700 (0.62852)	Top-1 acc 58.203 (59.388)	Top-5 acc 81.250 (80.820)	lr 0.01328
Train [58][2040/3239]	Time 0.243 (0.776)	Data Time 0.001 (0.290)	Loss 2.6160 (2.6766)	Entropy 0.62728 (0.62852)	Top-1 acc 62.109 (59.391)	Top-5 acc 81.641 (80.822)	lr 0.01328
Train [58][2050/3239]	Time 0.243 (0.785)	Data Time 0.001 (0.299)	Loss 2.6843 (2.6764)	Entropy 0.62729 (0.62851)	Top-1 acc 60.938 (59.396)	Top-5 acc 80.469 (80.826)	lr 0.01327
Train [58][2060/3239]	Time 0.235 (0.783)	Data Time 0.001 (0.298)	Loss 2.8106 (2.6765)	Entropy 0.62711 (0.62850)	Top-1 acc 57.422 (59.393)	Top-5 acc 78.906 (80.826)	lr 0.01327
Train [58][2070/3239]	Time 0.243 (0.783)	Data Time 0.001 (0.297)	Loss 2.8671 (2.6763)	Entropy 0.62714 (0.62850)	Top-1 acc 54.297 (59.397)	Top-5 acc 76.562 (80.827)	lr 0.01327
Train [58][2080/3239]	Time 0.362 (0.788)	Data Time 0.001 (0.303)	Loss 2.6560 (2.6764)	Entropy 0.62731 (0.62849)	Top-1 acc 62.891 (59.399)	Top-5 acc 82.812 (80.826)	lr 0.01327
Train [58][2090/3239]	Time 0.287 (0.790)	Data Time 0.002 (0.305)	Loss 2.6766 (2.6765)	Entropy 0.62741 (0.62848)	Top-1 acc 59.766 (59.396)	Top-5 acc 82.812 (80.828)	lr 0.01327
Train [58][2100/3239]	Time 0.245 (0.790)	Data Time 0.001 (0.306)	Loss 2.5951 (2.6762)	Entropy 0.62724 (0.62848)	Top-1 acc 62.109 (59.400)	Top-5 acc 83.984 (80.835)	lr 0.01327
Train [58][2110/3239]	Time 0.241 (0.789)	Data Time 0.001 (0.304)	Loss 2.5693 (2.6763)	Entropy 0.62743 (0.62847)	Top-1 acc 59.766 (59.399)	Top-5 acc 80.469 (80.831)	lr 0.01327
Train [58][2120/3239]	Time 0.241 (0.796)	Data Time 0.001 (0.312)	Loss 2.8001 (2.6762)	Entropy 0.62718 (0.62847)	Top-1 acc 55.078 (59.401)	Top-5 acc 78.125 (80.835)	lr 0.01327
Train [58][2130/3239]	Time 0.260 (0.795)	Data Time 0.001 (0.311)	Loss 2.6155 (2.6760)	Entropy 0.62749 (0.62846)	Top-1 acc 61.328 (59.403)	Top-5 acc 82.422 (80.841)	lr 0.01327
Train [58][2140/3239]	Time 0.241 (0.793)	Data Time 0.001 (0.310)	Loss 2.8048 (2.6761)	Entropy 0.62714 (0.62846)	Top-1 acc 55.469 (59.399)	Top-5 acc 78.516 (80.838)	lr 0.01327
Train [58][2150/3239]	Time 0.363 (0.801)	Data Time 0.002 (0.318)	Loss 2.5509 (2.6762)	Entropy 0.62712 (0.62845)	Top-1 acc 64.844 (59.396)	Top-5 acc 81.641 (80.838)	lr 0.01326
Train [58][2160/3239]	Time 0.238 (0.802)	Data Time 0.001 (0.319)	Loss 2.5793 (2.6760)	Entropy 0.62698 (0.62844)	Top-1 acc 65.625 (59.408)	Top-5 acc 82.812 (80.839)	lr 0.01326
Train [58][2170/3239]	Time 0.249 (0.800)	Data Time 0.001 (0.317)	Loss 2.6220 (2.6760)	Entropy 0.62690 (0.62844)	Top-1 acc 59.375 (59.406)	Top-5 acc 80.469 (80.840)	lr 0.01326
Train [58][2180/3239]	Time 0.237 (0.806)	Data Time 0.001 (0.323)	Loss 2.6152 (2.6756)	Entropy 0.62711 (0.62843)	Top-1 acc 57.812 (59.412)	Top-5 acc 82.422 (80.848)	lr 0.01326
Train [58][2190/3239]	Time 6.192 (0.807)	Data Time 5.929 (0.324)	Loss 2.7422 (2.6758)	Entropy 0.62699 (0.62842)	Top-1 acc 57.812 (59.408)	Top-5 acc 77.734 (80.848)	lr 0.01326
Train [58][2200/3239]	Time 0.249 (0.805)	Data Time 0.001 (0.323)	Loss 2.6764 (2.6760)	Entropy 0.62726 (0.62842)	Top-1 acc 60.938 (59.404)	Top-5 acc 81.250 (80.846)	lr 0.01326
Train [58][2210/3239]	Time 0.234 (0.811)	Data Time 0.001 (0.329)	Loss 2.8198 (2.6759)	Entropy 0.62731 (0.62841)	Top-1 acc 51.953 (59.406)	Top-5 acc 78.125 (80.846)	lr 0.01326
Train [58][2220/3239]	Time 0.252 (0.810)	Data Time 0.001 (0.328)	Loss 2.7996 (2.6762)	Entropy 0.62708 (0.62841)	Top-1 acc 58.203 (59.403)	Top-5 acc 77.344 (80.840)	lr 0.01326
Train [58][2230/3239]	Time 0.238 (0.810)	Data Time 0.001 (0.329)	Loss 2.6179 (2.6762)	Entropy 0.62711 (0.62840)	Top-1 acc 63.672 (59.402)	Top-5 acc 81.250 (80.840)	lr 0.01326
Train [58][2240/3239]	Time 0.373 (0.815)	Data Time 0.001 (0.334)	Loss 2.4627 (2.6761)	Entropy 0.62712 (0.62840)	Top-1 acc 64.844 (59.402)	Top-5 acc 86.328 (80.839)	lr 0.01326
Train [58][2250/3239]	Time 0.237 (0.814)	Data Time 0.001 (0.333)	Loss 2.5987 (2.6762)	Entropy 0.62701 (0.62839)	Top-1 acc 58.984 (59.395)	Top-5 acc 83.594 (80.836)	lr 0.01325
Train [58][2260/3239]	Time 0.242 (0.816)	Data Time 0.001 (0.336)	Loss 2.7218 (2.6764)	Entropy 0.62691 (0.62838)	Top-1 acc 59.375 (59.389)	Top-5 acc 79.688 (80.833)	lr 0.01325
Train [58][2270/3239]	Time 0.226 (0.815)	Data Time 0.001 (0.334)	Loss 2.6167 (2.6765)	Entropy 0.62697 (0.62838)	Top-1 acc 62.109 (59.385)	Top-5 acc 82.031 (80.834)	lr 0.01325
Train [58][2280/3239]	Time 0.239 (0.821)	Data Time 0.001 (0.340)	Loss 2.8201 (2.6763)	Entropy 0.62732 (0.62837)	Top-1 acc 55.859 (59.390)	Top-5 acc 76.953 (80.838)	lr 0.01325
Train [58][2290/3239]	Time 0.237 (0.821)	Data Time 0.001 (0.341)	Loss 2.5943 (2.6762)	Entropy 0.62751 (0.62837)	Top-1 acc 60.156 (59.387)	Top-5 acc 80.859 (80.840)	lr 0.01325
Train [58][2300/3239]	Time 0.241 (0.821)	Data Time 0.001 (0.341)	Loss 2.5163 (2.6762)	Entropy 0.62749 (0.62836)	Top-1 acc 59.766 (59.386)	Top-5 acc 84.766 (80.842)	lr 0.01325
Train [58][2310/3239]	Time 0.368 (0.827)	Data Time 0.002 (0.347)	Loss 2.6938 (2.6762)	Entropy 0.62689 (0.62836)	Top-1 acc 59.375 (59.389)	Top-5 acc 78.906 (80.840)	lr 0.01325
Train [58][2320/3239]	Time 0.224 (0.827)	Data Time 0.001 (0.348)	Loss 2.7377 (2.6762)	Entropy 0.62661 (0.62835)	Top-1 acc 58.203 (59.386)	Top-5 acc 81.250 (80.841)	lr 0.01325
Train [58][2330/3239]	Time 0.238 (0.826)	Data Time 0.001 (0.346)	Loss 2.6236 (2.6762)	Entropy 0.62694 (0.62835)	Top-1 acc 61.719 (59.387)	Top-5 acc 80.078 (80.841)	lr 0.01325
Train [58][2340/3239]	Time 0.246 (0.832)	Data Time 0.001 (0.353)	Loss 2.7843 (2.6761)	Entropy 0.62674 (0.62834)	Top-1 acc 58.203 (59.392)	Top-5 acc 77.344 (80.840)	lr 0.01324
Train [58][2350/3239]	Time 4.494 (0.832)	Data Time 4.245 (0.353)	Loss 2.7816 (2.6762)	Entropy 0.62656 (0.62833)	Top-1 acc 58.984 (59.391)	Top-5 acc 80.078 (80.838)	lr 0.01324
Train [58][2360/3239]	Time 0.228 (0.830)	Data Time 0.001 (0.351)	Loss 2.6047 (2.6762)	Entropy 0.62676 (0.62833)	Top-1 acc 60.938 (59.389)	Top-5 acc 82.422 (80.836)	lr 0.01324
Train [58][2370/3239]	Time 0.237 (0.836)	Data Time 0.001 (0.358)	Loss 2.5661 (2.6761)	Entropy 0.62685 (0.62832)	Top-1 acc 58.594 (59.392)	Top-5 acc 83.984 (80.843)	lr 0.01324
Train [58][2380/3239]	Time 0.234 (0.834)	Data Time 0.001 (0.356)	Loss 2.7225 (2.6760)	Entropy 0.62650 (0.62831)	Top-1 acc 58.984 (59.396)	Top-5 acc 80.469 (80.845)	lr 0.01324
Train [58][2390/3239]	Time 0.245 (0.836)	Data Time 0.001 (0.358)	Loss 2.5895 (2.6760)	Entropy 0.62641 (0.62830)	Top-1 acc 58.594 (59.397)	Top-5 acc 81.250 (80.837)	lr 0.01324
Train [58][2400/3239]	Time 0.250 (0.841)	Data Time 0.001 (0.364)	Loss 2.7382 (2.6760)	Entropy 0.62618 (0.62830)	Top-1 acc 53.516 (59.396)	Top-5 acc 82.812 (80.838)	lr 0.01324
Train [58][2410/3239]	Time 0.240 (0.839)	Data Time 0.001 (0.362)	Loss 2.7617 (2.6762)	Entropy 0.62609 (0.62829)	Top-1 acc 58.203 (59.389)	Top-5 acc 80.078 (80.832)	lr 0.01324
Train [58][2420/3239]	Time 0.254 (0.841)	Data Time 0.001 (0.364)	Loss 2.4974 (2.6761)	Entropy 0.62600 (0.62828)	Top-1 acc 61.719 (59.395)	Top-5 acc 83.984 (80.832)	lr 0.01324
Train [58][2430/3239]	Time 0.246 (0.839)	Data Time 0.001 (0.362)	Loss 2.7262 (2.6764)	Entropy 0.62537 (0.62827)	Top-1 acc 56.250 (59.391)	Top-5 acc 81.250 (80.829)	lr 0.01324
Train [58][2440/3239]	Time 0.278 (0.844)	Data Time 0.001 (0.367)	Loss 2.5319 (2.6761)	Entropy 0.62536 (0.62825)	Top-1 acc 62.891 (59.400)	Top-5 acc 85.156 (80.833)	lr 0.01323
Train [58][2450/3239]	Time 0.256 (0.844)	Data Time 0.002 (0.368)	Loss 2.6713 (2.6761)	Entropy 0.62483 (0.62824)	Top-1 acc 58.203 (59.398)	Top-5 acc 78.906 (80.833)	lr 0.01323
Train [58][2460/3239]	Time 0.240 (0.843)	Data Time 0.001 (0.366)	Loss 2.6806 (2.6765)	Entropy 0.62480 (0.62823)	Top-1 acc 55.469 (59.385)	Top-5 acc 79.688 (80.827)	lr 0.01323
Train [58][2470/3239]	Time 0.367 (0.849)	Data Time 0.002 (0.372)	Loss 2.6289 (2.6765)	Entropy 0.62418 (0.62821)	Top-1 acc 59.375 (59.387)	Top-5 acc 83.203 (80.827)	lr 0.01323
Train [58][2480/3239]	Time 0.245 (0.850)	Data Time 0.002 (0.374)	Loss 2.8293 (2.6767)	Entropy 0.62408 (0.62820)	Top-1 acc 55.859 (59.384)	Top-5 acc 75.781 (80.821)	lr 0.01323
Train [58][2490/3239]	Time 0.277 (0.848)	Data Time 0.001 (0.372)	Loss 2.6699 (2.6764)	Entropy 0.62435 (0.62818)	Top-1 acc 57.031 (59.386)	Top-5 acc 80.859 (80.826)	lr 0.01323
Train [58][2500/3239]	Time 0.293 (0.854)	Data Time 0.002 (0.379)	Loss 2.6224 (2.6765)	Entropy 0.62423 (0.62817)	Top-1 acc 60.547 (59.381)	Top-5 acc 83.203 (80.825)	lr 0.01323
Train [58][2510/3239]	Time 1.377 (0.853)	Data Time 1.124 (0.378)	Loss 2.5798 (2.6765)	Entropy 0.62421 (0.62815)	Top-1 acc 62.109 (59.383)	Top-5 acc 83.594 (80.826)	lr 0.01323
Train [58][2520/3239]	Time 0.253 (0.851)	Data Time 0.001 (0.376)	Loss 2.5454 (2.6765)	Entropy 0.62414 (0.62813)	Top-1 acc 60.938 (59.381)	Top-5 acc 85.156 (80.825)	lr 0.01323
Train [58][2530/3239]	Time 0.247 (0.859)	Data Time 0.001 (0.384)	Loss 2.6992 (2.6764)	Entropy 0.62393 (0.62812)	Top-1 acc 60.156 (59.383)	Top-5 acc 81.250 (80.826)	lr 0.01323
Train [58][2540/3239]	Time 0.339 (0.857)	Data Time 0.001 (0.383)	Loss 2.7802 (2.6767)	Entropy 0.62428 (0.62810)	Top-1 acc 56.250 (59.376)	Top-5 acc 78.516 (80.819)	lr 0.01322
Train [58][2550/3239]	Time 0.242 (0.856)	Data Time 0.001 (0.382)	Loss 2.8954 (2.6768)	Entropy 0.62424 (0.62809)	Top-1 acc 53.906 (59.378)	Top-5 acc 75.781 (80.818)	lr 0.01322
Train [58][2560/3239]	Time 0.246 (0.864)	Data Time 0.001 (0.390)	Loss 2.6933 (2.6772)	Entropy 0.62418 (0.62807)	Top-1 acc 57.812 (59.370)	Top-5 acc 80.469 (80.808)	lr 0.01322
Train [58][2570/3239]	Time 0.220 (0.863)	Data Time 0.001 (0.389)	Loss 2.7665 (2.6773)	Entropy 0.62389 (0.62806)	Top-1 acc 57.812 (59.368)	Top-5 acc 82.031 (80.810)	lr 0.01322
Train [58][2580/3239]	Time 0.235 (0.862)	Data Time 0.001 (0.388)	Loss 3.0889 (2.6774)	Entropy 0.62410 (0.62804)	Top-1 acc 50.000 (59.364)	Top-5 acc 73.828 (80.808)	lr 0.01322
Train [58][2590/3239]	Time 0.236 (0.861)	Data Time 0.001 (0.387)	Loss 2.5865 (2.6776)	Entropy 0.62417 (0.62803)	Top-1 acc 62.500 (59.363)	Top-5 acc 84.766 (80.807)	lr 0.01322
Train [58][2600/3239]	Time 0.246 (0.867)	Data Time 0.001 (0.394)	Loss 2.7828 (2.6779)	Entropy 0.62426 (0.62801)	Top-1 acc 56.641 (59.354)	Top-5 acc 78.125 (80.800)	lr 0.01322
Train [58][2610/3239]	Time 0.276 (0.868)	Data Time 0.001 (0.395)	Loss 2.6439 (2.6777)	Entropy 0.62423 (0.62800)	Top-1 acc 57.422 (59.359)	Top-5 acc 80.469 (80.803)	lr 0.01322
Train [58][2620/3239]	Time 0.444 (0.879)	Data Time 0.045 (0.393)	Loss 2.6263 (2.6776)	Entropy 0.62453 (0.62798)	Top-1 acc 58.203 (59.356)	Top-5 acc 82.812 (80.805)	lr 0.01322
Train [58][2630/3239]	Time 0.357 (0.878)	Data Time 0.002 (0.392)	Loss 2.7944 (2.6778)	Entropy 0.62463 (0.62797)	Top-1 acc 55.078 (59.353)	Top-5 acc 80.078 (80.802)	lr 0.01322
Train [58][2640/3239]	Time 0.264 (0.876)	Data Time 0.002 (0.390)	Loss 2.8635 (2.6779)	Entropy 0.62481 (0.62796)	Top-1 acc 53.906 (59.351)	Top-5 acc 75.781 (80.800)	lr 0.01321
Train [58][2650/3239]	Time 0.233 (0.874)	Data Time 0.001 (0.389)	Loss 2.7344 (2.6778)	Entropy 0.62491 (0.62794)	Top-1 acc 53.516 (59.351)	Top-5 acc 79.688 (80.800)	lr 0.01321
Train [58][2660/3239]	Time 0.238 (0.876)	Data Time 0.001 (0.391)	Loss 2.9134 (2.6781)	Entropy 0.62487 (0.62793)	Top-1 acc 54.688 (59.347)	Top-5 acc 74.609 (80.794)	lr 0.01321
Train [58][2670/3239]	Time 3.756 (0.876)	Data Time 3.483 (0.391)	Loss 2.6268 (2.6780)	Entropy 0.62486 (0.62792)	Top-1 acc 61.328 (59.345)	Top-5 acc 81.641 (80.794)	lr 0.01321
Train [58][2680/3239]	Time 0.297 (0.874)	Data Time 0.001 (0.389)	Loss 2.7999 (2.6782)	Entropy 0.62489 (0.62791)	Top-1 acc 55.469 (59.339)	Top-5 acc 78.906 (80.789)	lr 0.01321
Train [58][2690/3239]	Time 0.258 (0.881)	Data Time 0.001 (0.396)	Loss 2.6041 (2.6785)	Entropy 0.62503 (0.62790)	Top-1 acc 61.328 (59.331)	Top-5 acc 82.422 (80.785)	lr 0.01321
Train [58][2700/3239]	Time 0.330 (0.879)	Data Time 0.001 (0.394)	Loss 2.4140 (2.6783)	Entropy 0.62516 (0.62789)	Top-1 acc 65.625 (59.331)	Top-5 acc 87.109 (80.792)	lr 0.01321
Train [58][2710/3239]	Time 0.232 (0.879)	Data Time 0.001 (0.395)	Loss 2.6631 (2.6783)	Entropy 0.62542 (0.62788)	Top-1 acc 60.938 (59.332)	Top-5 acc 83.203 (80.792)	lr 0.01321
Train [58][2720/3239]	Time 0.257 (0.885)	Data Time 0.001 (0.401)	Loss 2.7710 (2.6781)	Entropy 0.62562 (0.62787)	Top-1 acc 60.938 (59.341)	Top-5 acc 77.344 (80.797)	lr 0.01321
Train [58][2730/3239]	Time 0.243 (0.884)	Data Time 0.001 (0.400)	Loss 2.7301 (2.6782)	Entropy 0.62532 (0.62786)	Top-1 acc 55.859 (59.339)	Top-5 acc 80.078 (80.795)	lr 0.01321
Train [58][2740/3239]	Time 0.236 (0.883)	Data Time 0.001 (0.399)	Loss 2.6011 (2.6780)	Entropy 0.62568 (0.62785)	Top-1 acc 60.156 (59.346)	Top-5 acc 82.422 (80.800)	lr 0.01320
Train [58][2750/3239]	Time 0.240 (0.881)	Data Time 0.001 (0.398)	Loss 2.7853 (2.6781)	Entropy 0.62604 (0.62785)	Top-1 acc 54.297 (59.345)	Top-5 acc 80.078 (80.796)	lr 0.01320
Train [58][2760/3239]	Time 0.235 (0.888)	Data Time 0.001 (0.404)	Loss 2.6983 (2.6781)	Entropy 0.62596 (0.62784)	Top-1 acc 55.859 (59.346)	Top-5 acc 80.078 (80.795)	lr 0.01320
Train [58][2770/3239]	Time 0.247 (0.888)	Data Time 0.001 (0.405)	Loss 2.5036 (2.6779)	Entropy 0.62597 (0.62783)	Top-1 acc 64.453 (59.352)	Top-5 acc 85.547 (80.803)	lr 0.01320
Train [58][2780/3239]	Time 0.232 (0.887)	Data Time 0.001 (0.404)	Loss 2.7337 (2.6778)	Entropy 0.62559 (0.62783)	Top-1 acc 57.812 (59.353)	Top-5 acc 79.688 (80.802)	lr 0.01320
Train [58][2790/3239]	Time 0.347 (0.892)	Data Time 0.001 (0.410)	Loss 2.7479 (2.6776)	Entropy 0.62532 (0.62782)	Top-1 acc 54.688 (59.356)	Top-5 acc 81.641 (80.807)	lr 0.01320
Train [58][2800/3239]	Time 0.232 (0.892)	Data Time 0.001 (0.410)	Loss 2.6616 (2.6773)	Entropy 0.62559 (0.62781)	Top-1 acc 60.156 (59.361)	Top-5 acc 79.688 (80.811)	lr 0.01320
Train [58][2810/3239]	Time 0.232 (0.891)	Data Time 0.001 (0.408)	Loss 2.5529 (2.6772)	Entropy 0.62592 (0.62780)	Top-1 acc 65.625 (59.365)	Top-5 acc 79.688 (80.812)	lr 0.01320
Train [58][2820/3239]	Time 0.289 (0.896)	Data Time 0.001 (0.414)	Loss 2.8213 (2.6771)	Entropy 0.62614 (0.62780)	Top-1 acc 55.859 (59.373)	Top-5 acc 80.078 (80.812)	lr 0.01320
Train [58][2830/3239]	Time 5.303 (0.896)	Data Time 5.052 (0.415)	Loss 2.9434 (2.6770)	Entropy 0.62648 (0.62779)	Top-1 acc 47.266 (59.372)	Top-5 acc 76.562 (80.816)	lr 0.01320
Train [58][2840/3239]	Time 0.239 (0.895)	Data Time 0.001 (0.413)	Loss 2.3215 (2.6772)	Entropy 0.62647 (0.62779)	Top-1 acc 68.750 (59.368)	Top-5 acc 87.500 (80.815)	lr 0.01319
Train [58][2850/3239]	Time 0.245 (0.900)	Data Time 0.003 (0.419)	Loss 2.7192 (2.6772)	Entropy 0.62646 (0.62778)	Top-1 acc 58.594 (59.367)	Top-5 acc 80.859 (80.815)	lr 0.01319
Train [58][2860/3239]	Time 0.322 (0.898)	Data Time 0.001 (0.417)	Loss 2.8903 (2.6772)	Entropy 0.62658 (0.62778)	Top-1 acc 54.297 (59.369)	Top-5 acc 73.828 (80.817)	lr 0.01319
Train [58][2870/3239]	Time 0.229 (0.898)	Data Time 0.001 (0.418)	Loss 2.6200 (2.6772)	Entropy 0.62655 (0.62777)	Top-1 acc 61.328 (59.366)	Top-5 acc 81.641 (80.813)	lr 0.01319
Train [58][2880/3239]	Time 0.244 (0.904)	Data Time 0.001 (0.423)	Loss 2.5949 (2.6769)	Entropy 0.62646 (0.62777)	Top-1 acc 63.672 (59.373)	Top-5 acc 82.812 (80.818)	lr 0.01319
Train [58][2890/3239]	Time 0.242 (0.902)	Data Time 0.001 (0.422)	Loss 2.5295 (2.6768)	Entropy 0.62660 (0.62776)	Top-1 acc 60.156 (59.377)	Top-5 acc 83.984 (80.821)	lr 0.01319
Train [58][2900/3239]	Time 0.247 (0.903)	Data Time 0.001 (0.422)	Loss 2.7507 (2.6766)	Entropy 0.62665 (0.62776)	Top-1 acc 60.938 (59.381)	Top-5 acc 79.297 (80.822)	lr 0.01319
Train [58][2910/3239]	Time 0.240 (0.901)	Data Time 0.001 (0.421)	Loss 2.7260 (2.6766)	Entropy 0.62659 (0.62775)	Top-1 acc 58.203 (59.385)	Top-5 acc 80.469 (80.821)	lr 0.01319
Train [58][2920/3239]	Time 0.232 (0.906)	Data Time 0.001 (0.427)	Loss 2.7846 (2.6767)	Entropy 0.62658 (0.62775)	Top-1 acc 60.156 (59.385)	Top-5 acc 77.734 (80.819)	lr 0.01319
Train [58][2930/3239]	Time 0.277 (0.905)	Data Time 0.001 (0.426)	Loss 2.6125 (2.6767)	Entropy 0.62669 (0.62775)	Top-1 acc 55.859 (59.377)	Top-5 acc 82.031 (80.823)	lr 0.01319
Train [58][2940/3239]	Time 0.233 (0.904)	Data Time 0.001 (0.424)	Loss 2.7748 (2.6766)	Entropy 0.62659 (0.62774)	Top-1 acc 57.812 (59.378)	Top-5 acc 78.516 (80.824)	lr 0.01318
Train [58][2950/3239]	Time 0.265 (0.911)	Data Time 0.001 (0.432)	Loss 2.6569 (2.6767)	Entropy 0.62643 (0.62774)	Top-1 acc 59.375 (59.378)	Top-5 acc 80.859 (80.821)	lr 0.01318
Train [58][2960/3239]	Time 0.233 (0.910)	Data Time 0.001 (0.431)	Loss 2.8475 (2.6769)	Entropy 0.62657 (0.62774)	Top-1 acc 58.594 (59.375)	Top-5 acc 74.219 (80.817)	lr 0.01318
Train [58][2970/3239]	Time 0.240 (0.908)	Data Time 0.001 (0.429)	Loss 2.6202 (2.6768)	Entropy 0.62652 (0.62773)	Top-1 acc 61.328 (59.379)	Top-5 acc 80.859 (80.816)	lr 0.01318
Train [58][2980/3239]	Time 0.226 (0.915)	Data Time 0.001 (0.437)	Loss 2.7435 (2.6768)	Entropy 0.62654 (0.62773)	Top-1 acc 56.641 (59.377)	Top-5 acc 80.469 (80.817)	lr 0.01318
Train [58][2990/3239]	Time 0.223 (0.914)	Data Time 0.001 (0.435)	Loss 2.4360 (2.6766)	Entropy 0.62674 (0.62772)	Top-1 acc 65.234 (59.383)	Top-5 acc 86.719 (80.823)	lr 0.01318
Train [58][3000/3239]	Time 0.274 (0.912)	Data Time 0.001 (0.434)	Loss 2.7921 (2.6766)	Entropy 0.62700 (0.62772)	Top-1 acc 60.156 (59.384)	Top-5 acc 78.516 (80.824)	lr 0.01318
Train [58][3010/3239]	Time 0.249 (0.919)	Data Time 0.001 (0.441)	Loss 2.6779 (2.6768)	Entropy 0.62682 (0.62772)	Top-1 acc 61.328 (59.380)	Top-5 acc 79.688 (80.820)	lr 0.01318
Train [58][3020/3239]	Time 0.330 (0.918)	Data Time 0.001 (0.440)	Loss 2.8084 (2.6768)	Entropy 0.62687 (0.62771)	Top-1 acc 53.906 (59.383)	Top-5 acc 78.906 (80.823)	lr 0.01318
Train [58][3030/3239]	Time 0.230 (0.916)	Data Time 0.001 (0.438)	Loss 2.8820 (2.6770)	Entropy 0.62714 (0.62771)	Top-1 acc 53.906 (59.375)	Top-5 acc 77.344 (80.820)	lr 0.01318
Train [58][3040/3239]	Time 0.251 (0.925)	Data Time 0.001 (0.447)	Loss 2.7465 (2.6770)	Entropy 0.62722 (0.62771)	Top-1 acc 60.547 (59.375)	Top-5 acc 80.469 (80.823)	lr 0.01317
Train [58][3050/3239]	Time 0.240 (0.923)	Data Time 0.001 (0.446)	Loss 2.5804 (2.6772)	Entropy 0.62702 (0.62771)	Top-1 acc 60.938 (59.369)	Top-5 acc 84.766 (80.821)	lr 0.01317
Train [58][3060/3239]	Time 0.224 (0.921)	Data Time 0.001 (0.444)	Loss 2.6889 (2.6771)	Entropy 0.62746 (0.62771)	Top-1 acc 57.031 (59.368)	Top-5 acc 80.469 (80.818)	lr 0.01317
Train [58][3070/3239]	Time 0.237 (0.920)	Data Time 0.001 (0.443)	Loss 2.6731 (2.6771)	Entropy 0.62740 (0.62771)	Top-1 acc 61.719 (59.372)	Top-5 acc 80.078 (80.820)	lr 0.01317
Train [58][3080/3239]	Time 0.237 (0.926)	Data Time 0.001 (0.450)	Loss 2.7420 (2.6770)	Entropy 0.62704 (0.62770)	Top-1 acc 57.031 (59.377)	Top-5 acc 81.250 (80.821)	lr 0.01317
Train [58][3090/3239]	Time 0.338 (0.925)	Data Time 0.001 (0.448)	Loss 2.7710 (2.6771)	Entropy 0.62682 (0.62770)	Top-1 acc 57.422 (59.368)	Top-5 acc 78.906 (80.819)	lr 0.01317
Train [58][3100/3239]	Time 0.224 (0.923)	Data Time 0.001 (0.447)	Loss 2.7258 (2.6770)	Entropy 0.62683 (0.62770)	Top-1 acc 57.812 (59.373)	Top-5 acc 76.953 (80.822)	lr 0.01317
Train [58][3110/3239]	Time 0.241 (0.930)	Data Time 0.001 (0.454)	Loss 2.9521 (2.6772)	Entropy 0.62679 (0.62770)	Top-1 acc 51.562 (59.367)	Top-5 acc 75.391 (80.819)	lr 0.01317
Train [58][3120/3239]	Time 0.253 (0.928)	Data Time 0.001 (0.452)	Loss 2.5361 (2.6770)	Entropy 0.62716 (0.62769)	Top-1 acc 60.938 (59.373)	Top-5 acc 83.203 (80.820)	lr 0.01317
Train [58][3130/3239]	Time 0.250 (0.926)	Data Time 0.001 (0.451)	Loss 2.8245 (2.6769)	Entropy 0.62719 (0.62769)	Top-1 acc 57.422 (59.378)	Top-5 acc 77.344 (80.819)	lr 0.01317
Train [58][3140/3239]	Time 0.231 (0.932)	Data Time 0.001 (0.456)	Loss 2.7625 (2.6773)	Entropy 0.62744 (0.62769)	Top-1 acc 55.859 (59.373)	Top-5 acc 80.078 (80.814)	lr 0.01316
Train [58][3150/3239]	Time 0.262 (0.930)	Data Time 0.001 (0.455)	Loss 2.7012 (2.6773)	Entropy 0.62769 (0.62769)	Top-1 acc 60.938 (59.371)	Top-5 acc 75.000 (80.810)	lr 0.01316
Train [58][3160/3239]	Time 0.239 (0.928)	Data Time 0.001 (0.453)	Loss 2.8733 (2.6773)	Entropy 0.62795 (0.62769)	Top-1 acc 52.734 (59.373)	Top-5 acc 73.828 (80.809)	lr 0.01316
Train [58][3170/3239]	Time 0.227 (0.935)	Data Time 0.001 (0.460)	Loss 2.7527 (2.6772)	Entropy 0.62769 (0.62769)	Top-1 acc 58.984 (59.379)	Top-5 acc 80.078 (80.809)	lr 0.01316
Train [58][3180/3239]	Time 0.329 (0.934)	Data Time 0.000 (0.459)	Loss 2.6413 (2.6770)	Entropy 0.62745 (0.62769)	Top-1 acc 62.109 (59.385)	Top-5 acc 82.812 (80.813)	lr 0.01316
Train [58][3190/3239]	Time 0.231 (0.932)	Data Time 0.000 (0.457)	Loss 2.8240 (2.6771)	Entropy 0.62758 (0.62769)	Top-1 acc 55.469 (59.381)	Top-5 acc 81.250 (80.812)	lr 0.01316
Train [58][3200/3239]	Time 0.226 (0.937)	Data Time 0.000 (0.463)	Loss 2.5851 (2.6771)	Entropy 0.62756 (0.62769)	Top-1 acc 60.547 (59.384)	Top-5 acc 82.422 (80.810)	lr 0.01316
Train [58][3210/3239]	Time 0.235 (0.936)	Data Time 0.000 (0.462)	Loss 2.6181 (2.6771)	Entropy 0.62754 (0.62769)	Top-1 acc 59.766 (59.385)	Top-5 acc 83.203 (80.809)	lr 0.01316
Train [58][3220/3239]	Time 0.249 (0.934)	Data Time 0.000 (0.460)	Loss 2.5592 (2.6772)	Entropy 0.62751 (0.62769)	Top-1 acc 60.156 (59.384)	Top-5 acc 83.203 (80.808)	lr 0.01316
Train [58][3230/3239]	Time 0.215 (0.932)	Data Time 0.000 (0.459)	Loss 2.6590 (2.6775)	Entropy 0.62766 (0.62769)	Top-1 acc 60.938 (59.378)	Top-5 acc 81.641 (80.803)	lr 0.01316
Train [58][3239/3239]	Time 0.892 (0.934)	Data Time 0.000 (0.461)	Loss 2.7322 (2.6775)	Entropy 0.62777 (0.62769)	Top-1 acc 56.790 (59.375)	Top-5 acc 80.247 (80.802)	lr 0.01315
==========Valid [58/120]	loss 1.420	top-1 acc 67.240 (67.240)	top-5 acc 87.047	Train top-1 59.375	top-5 80.802	Entropy 0.62777	Latency-None: 0.000ms	Flops: 538.40M
Train [59][0/3239]	Time 40.294 (40.294)	Data Time 39.089 (39.089)	Loss 2.3874 (2.3874)	Entropy 0.62798 (0.62798)	Top-1 acc 67.578 (67.578)	Top-5 acc 84.766 (84.766)	lr 0.01315
Train [59][10/3239]	Time 0.266 (4.101)	Data Time 0.001 (3.555)	Loss 2.6747 (2.6363)	Entropy 0.62823 (0.62801)	Top-1 acc 63.672 (60.653)	Top-5 acc 78.906 (81.250)	lr 0.01315
Train [59][20/3239]	Time 0.239 (2.351)	Data Time 0.001 (1.863)	Loss 2.5942 (2.6394)	Entropy 0.62827 (0.62814)	Top-1 acc 60.156 (60.603)	Top-5 acc 81.641 (81.455)	lr 0.01315
Train [59][30/3239]	Time 0.339 (1.747)	Data Time 0.001 (1.263)	Loss 2.5578 (2.6471)	Entropy 0.62811 (0.62815)	Top-1 acc 63.672 (60.282)	Top-5 acc 83.203 (81.250)	lr 0.01315
Train [59][40/3239]	Time 0.230 (2.366)	Data Time 0.002 (0.965)	Loss 2.7519 (2.6504)	Entropy 0.62800 (0.62815)	Top-1 acc 56.250 (59.823)	Top-5 acc 81.250 (81.421)	lr 0.01315
Train [59][50/3239]	Time 0.233 (1.982)	Data Time 0.002 (0.777)	Loss 2.4248 (2.6627)	Entropy 0.62809 (0.62812)	Top-1 acc 65.234 (59.712)	Top-5 acc 83.984 (81.005)	lr 0.01315
Train [59][60/3239]	Time 0.263 (1.731)	Data Time 0.002 (0.650)	Loss 2.4786 (2.6557)	Entropy 0.62817 (0.62813)	Top-1 acc 64.062 (59.810)	Top-5 acc 84.375 (81.212)	lr 0.01315
Train [59][70/3239]	Time 0.251 (1.550)	Data Time 0.002 (0.558)	Loss 2.5643 (2.6501)	Entropy 0.62807 (0.62812)	Top-1 acc 62.500 (60.008)	Top-5 acc 83.203 (81.156)	lr 0.01315
Train [59][80/3239]	Time 0.353 (1.413)	Data Time 0.002 (0.490)	Loss 2.5911 (2.6591)	Entropy 0.62805 (0.62812)	Top-1 acc 59.375 (59.848)	Top-5 acc 83.594 (81.019)	lr 0.01315
Train [59][90/3239]	Time 0.260 (1.309)	Data Time 0.001 (0.436)	Loss 2.7369 (2.6616)	Entropy 0.62790 (0.62812)	Top-1 acc 58.203 (59.783)	Top-5 acc 79.297 (80.967)	lr 0.01315
Train [59][100/3239]	Time 0.282 (1.223)	Data Time 0.002 (0.393)	Loss 2.7577 (2.6624)	Entropy 0.62772 (0.62808)	Top-1 acc 57.812 (59.754)	Top-5 acc 77.344 (80.952)	lr 0.01314
Train [59][110/3239]	Time 0.263 (1.156)	Data Time 0.001 (0.358)	Loss 2.8268 (2.6612)	Entropy 0.62776 (0.62805)	Top-1 acc 57.422 (59.776)	Top-5 acc 79.297 (80.990)	lr 0.01314
Train [59][120/3239]	Time 0.272 (1.097)	Data Time 0.001 (0.328)	Loss 2.7437 (2.6613)	Entropy 0.62801 (0.62804)	Top-1 acc 57.812 (59.798)	Top-5 acc 79.297 (80.979)	lr 0.01314
Train [59][130/3239]	Time 0.253 (1.048)	Data Time 0.001 (0.303)	Loss 2.6146 (2.6623)	Entropy 0.62805 (0.62804)	Top-1 acc 63.672 (59.819)	Top-5 acc 82.031 (81.014)	lr 0.01314
Train [59][140/3239]	Time 0.296 (1.012)	Data Time 0.001 (0.288)	Loss 2.6460 (2.6613)	Entropy 0.62796 (0.62804)	Top-1 acc 58.984 (59.824)	Top-5 acc 83.594 (81.034)	lr 0.01314
Train [59][150/3239]	Time 0.227 (0.975)	Data Time 0.002 (0.269)	Loss 2.5849 (2.6578)	Entropy 0.62817 (0.62803)	Top-1 acc 59.766 (59.872)	Top-5 acc 80.859 (81.134)	lr 0.01314
Train [59][160/3239]	Time 0.244 (0.940)	Data Time 0.001 (0.252)	Loss 2.6073 (2.6530)	Entropy 0.62830 (0.62804)	Top-1 acc 60.938 (59.943)	Top-5 acc 80.469 (81.228)	lr 0.01314
Train [59][170/3239]	Time 0.344 (0.950)	Data Time 0.001 (0.276)	Loss 2.7978 (2.6510)	Entropy 0.62812 (0.62805)	Top-1 acc 55.859 (60.005)	Top-5 acc 78.516 (81.273)	lr 0.01314
Train [59][180/3239]	Time 0.250 (0.925)	Data Time 0.001 (0.263)	Loss 2.6867 (2.6498)	Entropy 0.62829 (0.62806)	Top-1 acc 61.328 (60.031)	Top-5 acc 77.734 (81.276)	lr 0.01314
Train [59][190/3239]	Time 0.259 (0.920)	Data Time 0.002 (0.269)	Loss 2.8413 (2.6535)	Entropy 0.62831 (0.62808)	Top-1 acc 59.375 (59.989)	Top-5 acc 79.297 (81.268)	lr 0.01314
Train [59][200/3239]	Time 4.403 (0.916)	Data Time 4.123 (0.276)	Loss 2.8304 (2.6559)	Entropy 0.62863 (0.62809)	Top-1 acc 55.859 (59.989)	Top-5 acc 76.953 (81.219)	lr 0.01313
Train [59][210/3239]	Time 0.248 (0.897)	Data Time 0.001 (0.267)	Loss 2.6156 (2.6554)	Entropy 0.62851 (0.62811)	Top-1 acc 60.547 (59.980)	Top-5 acc 81.641 (81.231)	lr 0.01313
Train [59][220/3239]	Time 3.395 (0.898)	Data Time 3.152 (0.277)	Loss 2.7502 (2.6559)	Entropy 0.62849 (0.62813)	Top-1 acc 58.203 (59.990)	Top-5 acc 79.297 (81.218)	lr 0.01313
Train [59][230/3239]	Time 0.234 (0.877)	Data Time 0.001 (0.265)	Loss 2.7859 (2.6583)	Entropy 0.62803 (0.62814)	Top-1 acc 50.781 (59.879)	Top-5 acc 77.734 (81.203)	lr 0.01313
Train [59][240/3239]	Time 0.396 (0.877)	Data Time 0.001 (0.272)	Loss 2.6773 (2.6564)	Entropy 0.62798 (0.62814)	Top-1 acc 56.641 (59.912)	Top-5 acc 80.469 (81.227)	lr 0.01313
Train [59][250/3239]	Time 0.246 (0.878)	Data Time 0.001 (0.280)	Loss 2.8637 (2.6560)	Entropy 0.62799 (0.62813)	Top-1 acc 54.688 (59.893)	Top-5 acc 76.172 (81.216)	lr 0.01313
Train [59][260/3239]	Time 0.245 (0.861)	Data Time 0.001 (0.269)	Loss 2.6671 (2.6581)	Entropy 0.62796 (0.62813)	Top-1 acc 59.375 (59.815)	Top-5 acc 83.594 (81.187)	lr 0.01313
Train [59][270/3239]	Time 0.224 (0.861)	Data Time 0.001 (0.275)	Loss 2.5803 (2.6575)	Entropy 0.62756 (0.62811)	Top-1 acc 64.844 (59.845)	Top-5 acc 82.422 (81.204)	lr 0.01313
Train [59][280/3239]	Time 0.251 (0.879)	Data Time 0.002 (0.299)	Loss 2.5440 (2.6576)	Entropy 0.62776 (0.62810)	Top-1 acc 63.672 (59.852)	Top-5 acc 82.422 (81.197)	lr 0.01313
Train [59][290/3239]	Time 0.235 (0.865)	Data Time 0.001 (0.289)	Loss 2.4308 (2.6558)	Entropy 0.62770 (0.62808)	Top-1 acc 65.625 (59.885)	Top-5 acc 85.547 (81.254)	lr 0.01312
Train [59][300/3239]	Time 0.245 (0.858)	Data Time 0.001 (0.287)	Loss 2.5462 (2.6533)	Entropy 0.62721 (0.62806)	Top-1 acc 64.844 (59.969)	Top-5 acc 82.422 (81.292)	lr 0.01312
Train [59][310/3239]	Time 0.243 (0.867)	Data Time 0.001 (0.300)	Loss 2.6276 (2.6543)	Entropy 0.62707 (0.62804)	Top-1 acc 62.109 (59.936)	Top-5 acc 81.641 (81.264)	lr 0.01312
Train [59][320/3239]	Time 0.258 (0.861)	Data Time 0.001 (0.298)	Loss 2.5472 (2.6532)	Entropy 0.62719 (0.62800)	Top-1 acc 63.672 (59.955)	Top-5 acc 84.766 (81.291)	lr 0.01312
Train [59][330/3239]	Time 0.279 (0.848)	Data Time 0.002 (0.289)	Loss 2.5340 (2.6534)	Entropy 0.62725 (0.62798)	Top-1 acc 63.281 (59.939)	Top-5 acc 81.641 (81.291)	lr 0.01312
Train [59][340/3239]	Time 1.544 (0.848)	Data Time 1.271 (0.292)	Loss 2.5784 (2.6524)	Entropy 0.62712 (0.62795)	Top-1 acc 60.547 (59.976)	Top-5 acc 80.859 (81.297)	lr 0.01312
Train [59][350/3239]	Time 0.216 (0.859)	Data Time 0.001 (0.307)	Loss 2.5660 (2.6513)	Entropy 0.62721 (0.62793)	Top-1 acc 60.938 (59.986)	Top-5 acc 83.594 (81.312)	lr 0.01312
Train [59][360/3239]	Time 0.280 (0.848)	Data Time 0.001 (0.299)	Loss 2.6101 (2.6526)	Entropy 0.62723 (0.62791)	Top-1 acc 62.500 (59.961)	Top-5 acc 82.031 (81.302)	lr 0.01312
Train [59][370/3239]	Time 0.265 (0.840)	Data Time 0.001 (0.293)	Loss 2.6676 (2.6528)	Entropy 0.62743 (0.62790)	Top-1 acc 62.500 (59.976)	Top-5 acc 81.250 (81.307)	lr 0.01312
Train [59][380/3239]	Time 1.955 (0.856)	Data Time 1.701 (0.313)	Loss 2.6237 (2.6526)	Entropy 0.62772 (0.62789)	Top-1 acc 58.203 (59.964)	Top-5 acc 80.078 (81.326)	lr 0.01312
Train [59][390/3239]	Time 0.299 (0.845)	Data Time 0.001 (0.305)	Loss 2.6261 (2.6509)	Entropy 0.62722 (0.62788)	Top-1 acc 63.281 (60.010)	Top-5 acc 80.859 (81.361)	lr 0.01311
Train [59][400/3239]	Time 0.354 (0.846)	Data Time 0.002 (0.308)	Loss 2.7120 (2.6513)	Entropy 0.62710 (0.62786)	Top-1 acc 57.812 (60.006)	Top-5 acc 79.297 (81.352)	lr 0.01311
Train [59][410/3239]	Time 0.227 (0.846)	Data Time 0.001 (0.312)	Loss 2.5641 (2.6521)	Entropy 0.62726 (0.62784)	Top-1 acc 58.984 (59.961)	Top-5 acc 84.766 (81.351)	lr 0.01311
Train [59][420/3239]	Time 0.252 (0.850)	Data Time 0.001 (0.319)	Loss 2.5519 (2.6514)	Entropy 0.62755 (0.62783)	Top-1 acc 60.156 (59.972)	Top-5 acc 83.594 (81.356)	lr 0.01311
Train [59][430/3239]	Time 0.242 (0.846)	Data Time 0.001 (0.317)	Loss 2.9460 (2.6515)	Entropy 0.62786 (0.62783)	Top-1 acc 51.172 (59.999)	Top-5 acc 75.000 (81.346)	lr 0.01311
Train [59][440/3239]	Time 0.235 (0.844)	Data Time 0.001 (0.317)	Loss 2.5827 (2.6516)	Entropy 0.62796 (0.62783)	Top-1 acc 58.984 (59.984)	Top-5 acc 81.250 (81.347)	lr 0.01311
Train [59][450/3239]	Time 0.248 (0.847)	Data Time 0.001 (0.323)	Loss 2.5866 (2.6526)	Entropy 0.62815 (0.62783)	Top-1 acc 59.375 (59.956)	Top-5 acc 84.766 (81.332)	lr 0.01311
Train [59][460/3239]	Time 0.233 (0.846)	Data Time 0.001 (0.324)	Loss 2.6225 (2.6532)	Entropy 0.62838 (0.62784)	Top-1 acc 59.766 (59.932)	Top-5 acc 81.250 (81.317)	lr 0.01311
Train [59][470/3239]	Time 0.345 (0.849)	Data Time 0.001 (0.329)	Loss 2.8404 (2.6549)	Entropy 0.62818 (0.62785)	Top-1 acc 55.859 (59.883)	Top-5 acc 78.906 (81.301)	lr 0.01311
Train [59][480/3239]	Time 0.234 (0.846)	Data Time 0.001 (0.329)	Loss 2.6778 (2.6542)	Entropy 0.62822 (0.62786)	Top-1 acc 58.203 (59.887)	Top-5 acc 78.906 (81.324)	lr 0.01311
Train [59][490/3239]	Time 4.690 (0.847)	Data Time 4.432 (0.332)	Loss 2.6687 (2.6535)	Entropy 0.62817 (0.62787)	Top-1 acc 61.719 (59.903)	Top-5 acc 81.250 (81.350)	lr 0.01310
Train [59][500/3239]	Time 5.884 (0.853)	Data Time 5.582 (0.340)	Loss 2.6781 (2.6540)	Entropy 0.62813 (0.62787)	Top-1 acc 58.594 (59.882)	Top-5 acc 80.469 (81.349)	lr 0.01310
Train [59][510/3239]	Time 0.233 (0.848)	Data Time 0.001 (0.336)	Loss 2.6964 (2.6529)	Entropy 0.62833 (0.62788)	Top-1 acc 57.812 (59.897)	Top-5 acc 78.906 (81.370)	lr 0.01310
Train [59][520/3239]	Time 0.252 (0.841)	Data Time 0.001 (0.331)	Loss 2.4653 (2.6525)	Entropy 0.62837 (0.62789)	Top-1 acc 66.406 (59.917)	Top-5 acc 85.547 (81.362)	lr 0.01310
Train [59][530/3239]	Time 0.244 (0.844)	Data Time 0.001 (0.335)	Loss 2.6772 (2.6528)	Entropy 0.62825 (0.62790)	Top-1 acc 62.109 (59.916)	Top-5 acc 81.641 (81.359)	lr 0.01310
Train [59][540/3239]	Time 0.241 (0.855)	Data Time 0.002 (0.347)	Loss 2.6685 (2.6530)	Entropy 0.62793 (0.62790)	Top-1 acc 61.328 (59.915)	Top-5 acc 81.641 (81.361)	lr 0.01310
Train [59][550/3239]	Time 0.263 (0.847)	Data Time 0.002 (0.341)	Loss 2.7890 (2.6526)	Entropy 0.62768 (0.62790)	Top-1 acc 55.469 (59.921)	Top-5 acc 79.297 (81.371)	lr 0.01310
Train [59][560/3239]	Time 0.338 (0.859)	Data Time 0.001 (0.354)	Loss 2.5930 (2.6528)	Entropy 0.62752 (0.62789)	Top-1 acc 61.328 (59.919)	Top-5 acc 83.984 (81.355)	lr 0.01310
Train [59][570/3239]	Time 0.250 (0.862)	Data Time 0.001 (0.358)	Loss 2.7066 (2.6522)	Entropy 0.62739 (0.62789)	Top-1 acc 58.203 (59.939)	Top-5 acc 82.031 (81.366)	lr 0.01310
Train [59][580/3239]	Time 0.243 (0.854)	Data Time 0.001 (0.352)	Loss 2.8206 (2.6533)	Entropy 0.62758 (0.62788)	Top-1 acc 53.906 (59.919)	Top-5 acc 81.641 (81.343)	lr 0.01310
Train [59][590/3239]	Time 0.247 (0.864)	Data Time 0.001 (0.363)	Loss 2.6294 (2.6544)	Entropy 0.62768 (0.62788)	Top-1 acc 61.328 (59.900)	Top-5 acc 79.688 (81.304)	lr 0.01309
Train [59][600/3239]	Time 0.229 (0.864)	Data Time 0.001 (0.365)	Loss 2.9001 (2.6555)	Entropy 0.62779 (0.62787)	Top-1 acc 54.688 (59.883)	Top-5 acc 75.781 (81.276)	lr 0.01309
Train [59][610/3239]	Time 0.231 (0.866)	Data Time 0.001 (0.368)	Loss 2.7968 (2.6553)	Entropy 0.62800 (0.62787)	Top-1 acc 56.250 (59.876)	Top-5 acc 76.562 (81.278)	lr 0.01309
Train [59][620/3239]	Time 0.219 (0.869)	Data Time 0.001 (0.373)	Loss 2.7214 (2.6557)	Entropy 0.62834 (0.62788)	Top-1 acc 56.250 (59.867)	Top-5 acc 80.469 (81.263)	lr 0.01309
Train [59][630/3239]	Time 0.316 (0.867)	Data Time 0.001 (0.372)	Loss 2.7127 (2.6556)	Entropy 0.62860 (0.62788)	Top-1 acc 56.641 (59.851)	Top-5 acc 78.516 (81.257)	lr 0.01309
Train [59][640/3239]	Time 0.227 (0.868)	Data Time 0.001 (0.375)	Loss 2.6161 (2.6558)	Entropy 0.62824 (0.62789)	Top-1 acc 61.328 (59.833)	Top-5 acc 80.469 (81.248)	lr 0.01309
Train [59][650/3239]	Time 3.212 (0.873)	Data Time 2.962 (0.380)	Loss 2.6901 (2.6555)	Entropy 0.62787 (0.62790)	Top-1 acc 60.938 (59.851)	Top-5 acc 80.469 (81.258)	lr 0.01309
Train [59][660/3239]	Time 0.237 (0.872)	Data Time 0.001 (0.381)	Loss 2.8818 (2.6553)	Entropy 0.62781 (0.62790)	Top-1 acc 55.078 (59.860)	Top-5 acc 79.688 (81.269)	lr 0.01309
Train [59][670/3239]	Time 0.246 (0.874)	Data Time 0.001 (0.383)	Loss 2.6249 (2.6551)	Entropy 0.62805 (0.62790)	Top-1 acc 65.625 (59.871)	Top-5 acc 83.594 (81.275)	lr 0.01309
Train [59][680/3239]	Time 0.235 (0.872)	Data Time 0.001 (0.383)	Loss 2.7531 (2.6550)	Entropy 0.62761 (0.62790)	Top-1 acc 58.203 (59.861)	Top-5 acc 80.469 (81.282)	lr 0.01309
Train [59][690/3239]	Time 0.329 (0.919)	Data Time 0.004 (0.380)	Loss 2.4975 (2.6545)	Entropy 0.62774 (0.62789)	Top-1 acc 64.062 (59.881)	Top-5 acc 84.375 (81.290)	lr 0.01308
Train [59][700/3239]	Time 0.260 (0.913)	Data Time 0.002 (0.375)	Loss 2.4949 (2.6546)	Entropy 0.62767 (0.62789)	Top-1 acc 67.188 (59.887)	Top-5 acc 84.375 (81.281)	lr 0.01308
Train [59][710/3239]	Time 0.243 (0.906)	Data Time 0.002 (0.369)	Loss 2.6611 (2.6557)	Entropy 0.62789 (0.62789)	Top-1 acc 59.766 (59.867)	Top-5 acc 81.641 (81.243)	lr 0.01308
Train [59][720/3239]	Time 0.372 (0.899)	Data Time 0.002 (0.364)	Loss 2.6358 (2.6550)	Entropy 0.62767 (0.62789)	Top-1 acc 60.938 (59.877)	Top-5 acc 80.469 (81.258)	lr 0.01308
Train [59][730/3239]	Time 0.235 (0.893)	Data Time 0.001 (0.359)	Loss 2.4416 (2.6553)	Entropy 0.62773 (0.62789)	Top-1 acc 65.234 (59.875)	Top-5 acc 85.938 (81.256)	lr 0.01308
Train [59][740/3239]	Time 0.239 (0.886)	Data Time 0.001 (0.355)	Loss 2.6660 (2.6559)	Entropy 0.62745 (0.62788)	Top-1 acc 60.156 (59.865)	Top-5 acc 80.859 (81.250)	lr 0.01308
Train [59][750/3239]	Time 0.227 (0.880)	Data Time 0.001 (0.350)	Loss 2.6248 (2.6570)	Entropy 0.62731 (0.62788)	Top-1 acc 60.938 (59.846)	Top-5 acc 81.641 (81.234)	lr 0.01308
Train [59][760/3239]	Time 0.216 (0.882)	Data Time 0.001 (0.354)	Loss 2.8591 (2.6579)	Entropy 0.62736 (0.62787)	Top-1 acc 53.906 (59.816)	Top-5 acc 78.516 (81.223)	lr 0.01308
Train [59][770/3239]	Time 0.238 (0.876)	Data Time 0.001 (0.349)	Loss 2.5888 (2.6579)	Entropy 0.62745 (0.62786)	Top-1 acc 60.938 (59.817)	Top-5 acc 84.766 (81.233)	lr 0.01308
Train [59][780/3239]	Time 0.243 (0.873)	Data Time 0.001 (0.348)	Loss 2.6843 (2.6573)	Entropy 0.62744 (0.62786)	Top-1 acc 56.250 (59.828)	Top-5 acc 82.422 (81.250)	lr 0.01308
Train [59][790/3239]	Time 0.393 (0.886)	Data Time 0.001 (0.362)	Loss 2.6694 (2.6573)	Entropy 0.62756 (0.62786)	Top-1 acc 54.297 (59.836)	Top-5 acc 80.469 (81.252)	lr 0.01307
Train [59][800/3239]	Time 0.228 (0.880)	Data Time 0.001 (0.357)	Loss 2.9787 (2.6581)	Entropy 0.62780 (0.62785)	Top-1 acc 53.516 (59.822)	Top-5 acc 75.391 (81.231)	lr 0.01307
Train [59][810/3239]	Time 0.227 (0.876)	Data Time 0.001 (0.354)	Loss 2.5790 (2.6582)	Entropy 0.62806 (0.62785)	Top-1 acc 60.547 (59.816)	Top-5 acc 82.422 (81.225)	lr 0.01307
Train [59][820/3239]	Time 4.655 (0.885)	Data Time 4.416 (0.364)	Loss 3.0561 (2.6577)	Entropy 0.62808 (0.62785)	Top-1 acc 47.266 (59.820)	Top-5 acc 73.828 (81.246)	lr 0.01307
Train [59][830/3239]	Time 0.252 (0.885)	Data Time 0.001 (0.366)	Loss 2.7667 (2.6578)	Entropy 0.62801 (0.62786)	Top-1 acc 56.250 (59.810)	Top-5 acc 79.688 (81.246)	lr 0.01307
Train [59][840/3239]	Time 0.262 (0.880)	Data Time 0.001 (0.362)	Loss 2.6906 (2.6574)	Entropy 0.62803 (0.62786)	Top-1 acc 59.375 (59.815)	Top-5 acc 82.031 (81.250)	lr 0.01307
Train [59][850/3239]	Time 3.739 (0.879)	Data Time 3.485 (0.362)	Loss 2.8414 (2.6578)	Entropy 0.62841 (0.62786)	Top-1 acc 55.078 (59.798)	Top-5 acc 79.297 (81.248)	lr 0.01307
Train [59][860/3239]	Time 0.241 (0.887)	Data Time 0.001 (0.371)	Loss 2.6512 (2.6573)	Entropy 0.62842 (0.62787)	Top-1 acc 55.469 (59.802)	Top-5 acc 80.859 (81.255)	lr 0.01307
Train [59][870/3239]	Time 0.243 (0.882)	Data Time 0.001 (0.367)	Loss 2.5001 (2.6570)	Entropy 0.62848 (0.62787)	Top-1 acc 62.500 (59.810)	Top-5 acc 85.156 (81.261)	lr 0.01307
Train [59][880/3239]	Time 0.269 (0.878)	Data Time 0.001 (0.364)	Loss 2.6508 (2.6570)	Entropy 0.62867 (0.62788)	Top-1 acc 59.766 (59.817)	Top-5 acc 81.250 (81.257)	lr 0.01307
Train [59][890/3239]	Time 0.261 (0.891)	Data Time 0.001 (0.378)	Loss 2.5506 (2.6569)	Entropy 0.62826 (0.62789)	Top-1 acc 61.328 (59.827)	Top-5 acc 83.984 (81.257)	lr 0.01306
Train [59][900/3239]	Time 0.236 (0.886)	Data Time 0.001 (0.374)	Loss 2.7427 (2.6561)	Entropy 0.62802 (0.62789)	Top-1 acc 58.594 (59.853)	Top-5 acc 78.516 (81.270)	lr 0.01306
Train [59][910/3239]	Time 0.231 (0.886)	Data Time 0.001 (0.375)	Loss 2.7592 (2.6561)	Entropy 0.62824 (0.62789)	Top-1 acc 59.375 (59.851)	Top-5 acc 81.641 (81.273)	lr 0.01306
Train [59][920/3239]	Time 0.493 (0.894)	Data Time 0.255 (0.384)	Loss 2.5871 (2.6557)	Entropy 0.62853 (0.62790)	Top-1 acc 60.547 (59.861)	Top-5 acc 82.422 (81.287)	lr 0.01306
Train [59][930/3239]	Time 0.244 (0.890)	Data Time 0.001 (0.381)	Loss 2.7022 (2.6562)	Entropy 0.62840 (0.62790)	Top-1 acc 60.156 (59.856)	Top-5 acc 81.250 (81.275)	lr 0.01306
Train [59][940/3239]	Time 0.247 (0.889)	Data Time 0.001 (0.381)	Loss 2.6987 (2.6561)	Entropy 0.62848 (0.62791)	Top-1 acc 60.547 (59.855)	Top-5 acc 80.078 (81.277)	lr 0.01306
Train [59][950/3239]	Time 0.364 (0.896)	Data Time 0.001 (0.388)	Loss 2.7309 (2.6560)	Entropy 0.62867 (0.62792)	Top-1 acc 60.547 (59.865)	Top-5 acc 80.469 (81.278)	lr 0.01306
Train [59][960/3239]	Time 0.232 (0.895)	Data Time 0.001 (0.388)	Loss 2.5290 (2.6560)	Entropy 0.62880 (0.62793)	Top-1 acc 63.672 (59.863)	Top-5 acc 83.594 (81.274)	lr 0.01306
Train [59][970/3239]	Time 0.258 (0.893)	Data Time 0.001 (0.387)	Loss 2.7406 (2.6565)	Entropy 0.62894 (0.62794)	Top-1 acc 58.984 (59.846)	Top-5 acc 77.734 (81.267)	lr 0.01306
Train [59][980/3239]	Time 8.344 (0.899)	Data Time 8.102 (0.394)	Loss 2.6887 (2.6564)	Entropy 0.62896 (0.62795)	Top-1 acc 56.641 (59.845)	Top-5 acc 80.469 (81.270)	lr 0.01306
Train [59][990/3239]	Time 0.234 (0.903)	Data Time 0.001 (0.399)	Loss 2.7338 (2.6570)	Entropy 0.62905 (0.62796)	Top-1 acc 58.594 (59.830)	Top-5 acc 78.516 (81.250)	lr 0.01305
Train [59][1000/3239]	Time 0.225 (0.898)	Data Time 0.001 (0.395)	Loss 2.8553 (2.6567)	Entropy 0.62876 (0.62797)	Top-1 acc 52.734 (59.825)	Top-5 acc 76.953 (81.261)	lr 0.01305
Train [59][1010/3239]	Time 0.247 (0.893)	Data Time 0.001 (0.391)	Loss 2.6510 (2.6566)	Entropy 0.62906 (0.62798)	Top-1 acc 57.422 (59.825)	Top-5 acc 80.859 (81.265)	lr 0.01305
Train [59][1020/3239]	Time 0.327 (0.910)	Data Time 0.001 (0.409)	Loss 2.6478 (2.6566)	Entropy 0.62851 (0.62799)	Top-1 acc 64.062 (59.834)	Top-5 acc 81.250 (81.258)	lr 0.01305
Train [59][1030/3239]	Time 0.245 (0.906)	Data Time 0.002 (0.405)	Loss 3.0443 (2.6564)	Entropy 0.62865 (0.62799)	Top-1 acc 50.000 (59.839)	Top-5 acc 75.391 (81.257)	lr 0.01305
Train [59][1040/3239]	Time 0.235 (0.901)	Data Time 0.001 (0.401)	Loss 2.6835 (2.6555)	Entropy 0.62879 (0.62800)	Top-1 acc 58.984 (59.849)	Top-5 acc 79.297 (81.272)	lr 0.01305
Train [59][1050/3239]	Time 0.235 (0.913)	Data Time 0.001 (0.414)	Loss 2.6696 (2.6552)	Entropy 0.62888 (0.62801)	Top-1 acc 61.719 (59.858)	Top-5 acc 83.984 (81.276)	lr 0.01305
Train [59][1060/3239]	Time 0.231 (0.909)	Data Time 0.001 (0.410)	Loss 2.7640 (2.6552)	Entropy 0.62908 (0.62801)	Top-1 acc 55.859 (59.848)	Top-5 acc 79.688 (81.276)	lr 0.01305
Train [59][1070/3239]	Time 0.234 (0.908)	Data Time 0.001 (0.410)	Loss 2.7803 (2.6556)	Entropy 0.62895 (0.62802)	Top-1 acc 58.203 (59.840)	Top-5 acc 78.516 (81.270)	lr 0.01305
Train [59][1080/3239]	Time 6.277 (0.918)	Data Time 6.024 (0.421)	Loss 2.7520 (2.6569)	Entropy 0.62883 (0.62803)	Top-1 acc 56.641 (59.805)	Top-5 acc 77.344 (81.246)	lr 0.01305
Train [59][1090/3239]	Time 0.235 (0.913)	Data Time 0.001 (0.417)	Loss 2.7318 (2.6569)	Entropy 0.62856 (0.62804)	Top-1 acc 58.203 (59.806)	Top-5 acc 80.859 (81.248)	lr 0.01304
Train [59][1100/3239]	Time 0.244 (0.914)	Data Time 0.001 (0.418)	Loss 2.6301 (2.6563)	Entropy 0.62837 (0.62804)	Top-1 acc 59.766 (59.822)	Top-5 acc 82.031 (81.257)	lr 0.01304
Train [59][1110/3239]	Time 0.335 (0.917)	Data Time 0.001 (0.422)	Loss 2.6761 (2.6564)	Entropy 0.62839 (0.62805)	Top-1 acc 57.812 (59.823)	Top-5 acc 82.422 (81.254)	lr 0.01304
Train [59][1120/3239]	Time 0.251 (0.920)	Data Time 0.001 (0.426)	Loss 2.7655 (2.6561)	Entropy 0.62869 (0.62805)	Top-1 acc 56.641 (59.830)	Top-5 acc 80.469 (81.257)	lr 0.01304
Train [59][1130/3239]	Time 0.245 (0.919)	Data Time 0.001 (0.426)	Loss 2.9296 (2.6565)	Entropy 0.62884 (0.62806)	Top-1 acc 53.906 (59.818)	Top-5 acc 77.734 (81.248)	lr 0.01304
Train [59][1140/3239]	Time 3.833 (0.923)	Data Time 3.580 (0.430)	Loss 2.5886 (2.6569)	Entropy 0.62896 (0.62806)	Top-1 acc 58.594 (59.805)	Top-5 acc 83.594 (81.244)	lr 0.01304
Train [59][1150/3239]	Time 0.231 (0.926)	Data Time 0.001 (0.434)	Loss 2.5618 (2.6568)	Entropy 0.62914 (0.62807)	Top-1 acc 64.844 (59.797)	Top-5 acc 82.422 (81.248)	lr 0.01304
Train [59][1160/3239]	Time 0.245 (0.921)	Data Time 0.001 (0.430)	Loss 2.6746 (2.6572)	Entropy 0.62931 (0.62808)	Top-1 acc 59.375 (59.795)	Top-5 acc 81.250 (81.237)	lr 0.01304
Train [59][1170/3239]	Time 7.283 (0.926)	Data Time 7.034 (0.436)	Loss 2.8240 (2.6576)	Entropy 0.62951 (0.62809)	Top-1 acc 57.812 (59.787)	Top-5 acc 80.078 (81.225)	lr 0.01304
Train [59][1180/3239]	Time 0.331 (0.933)	Data Time 0.001 (0.444)	Loss 2.5789 (2.6573)	Entropy 0.62956 (0.62811)	Top-1 acc 60.156 (59.793)	Top-5 acc 83.594 (81.236)	lr 0.01304
Train [59][1190/3239]	Time 0.259 (0.929)	Data Time 0.001 (0.440)	Loss 2.6515 (2.6579)	Entropy 0.62957 (0.62812)	Top-1 acc 61.719 (59.779)	Top-5 acc 81.641 (81.222)	lr 0.01303
Train [59][1200/3239]	Time 0.231 (0.928)	Data Time 0.001 (0.440)	Loss 2.6915 (2.6577)	Entropy 0.62911 (0.62813)	Top-1 acc 61.328 (59.786)	Top-5 acc 79.688 (81.219)	lr 0.01303
Train [59][1210/3239]	Time 0.232 (0.940)	Data Time 0.001 (0.452)	Loss 2.6386 (2.6581)	Entropy 0.62926 (0.62814)	Top-1 acc 62.500 (59.785)	Top-5 acc 80.078 (81.215)	lr 0.01303
Train [59][1220/3239]	Time 0.232 (0.935)	Data Time 0.002 (0.449)	Loss 2.8462 (2.6585)	Entropy 0.62951 (0.62815)	Top-1 acc 55.859 (59.783)	Top-5 acc 76.562 (81.209)	lr 0.01303
Train [59][1230/3239]	Time 0.258 (0.938)	Data Time 0.001 (0.451)	Loss 2.7747 (2.6585)	Entropy 0.62956 (0.62816)	Top-1 acc 60.547 (59.787)	Top-5 acc 78.125 (81.207)	lr 0.01303
Train [59][1240/3239]	Time 10.058 (0.945)	Data Time 9.765 (0.459)	Loss 2.5926 (2.6586)	Entropy 0.63014 (0.62817)	Top-1 acc 63.672 (59.789)	Top-5 acc 82.812 (81.203)	lr 0.01303
Train [59][1250/3239]	Time 0.241 (0.941)	Data Time 0.001 (0.455)	Loss 2.6099 (2.6587)	Entropy 0.62996 (0.62819)	Top-1 acc 58.203 (59.784)	Top-5 acc 84.375 (81.202)	lr 0.01303
Train [59][1260/3239]	Time 0.461 (0.944)	Data Time 0.189 (0.459)	Loss 2.7396 (2.6584)	Entropy 0.63018 (0.62820)	Top-1 acc 56.641 (59.796)	Top-5 acc 80.469 (81.206)	lr 0.01303
Train [59][1270/3239]	Time 0.353 (0.942)	Data Time 0.001 (0.458)	Loss 2.7832 (2.6581)	Entropy 0.62993 (0.62822)	Top-1 acc 56.250 (59.809)	Top-5 acc 77.734 (81.206)	lr 0.01303
Train [59][1280/3239]	Time 0.234 (0.947)	Data Time 0.001 (0.464)	Loss 2.8032 (2.6581)	Entropy 0.63013 (0.62823)	Top-1 acc 57.031 (59.809)	Top-5 acc 76.562 (81.200)	lr 0.01303
Train [59][1290/3239]	Time 0.252 (0.952)	Data Time 0.001 (0.469)	Loss 2.6649 (2.6591)	Entropy 0.63040 (0.62824)	Top-1 acc 58.984 (59.780)	Top-5 acc 82.422 (81.187)	lr 0.01302
Train [59][1300/3239]	Time 2.831 (0.950)	Data Time 2.580 (0.468)	Loss 2.9138 (2.6592)	Entropy 0.63055 (0.62826)	Top-1 acc 55.469 (59.774)	Top-5 acc 75.391 (81.179)	lr 0.01302
Train [59][1310/3239]	Time 0.233 (0.952)	Data Time 0.001 (0.470)	Loss 2.9394 (2.6592)	Entropy 0.63066 (0.62828)	Top-1 acc 51.562 (59.773)	Top-5 acc 78.125 (81.177)	lr 0.01302
Train [59][1320/3239]	Time 3.457 (0.953)	Data Time 3.194 (0.471)	Loss 2.6603 (2.6591)	Entropy 0.63071 (0.62830)	Top-1 acc 59.375 (59.777)	Top-5 acc 82.422 (81.180)	lr 0.01302
Train [59][1330/3239]	Time 0.228 (0.955)	Data Time 0.001 (0.474)	Loss 2.6815 (2.6590)	Entropy 0.63083 (0.62832)	Top-1 acc 59.766 (59.770)	Top-5 acc 79.688 (81.181)	lr 0.01302
Train [59][1340/3239]	Time 0.320 (0.958)	Data Time 0.001 (0.477)	Loss 2.5717 (2.6591)	Entropy 0.63057 (0.62833)	Top-1 acc 60.938 (59.761)	Top-5 acc 82.812 (81.176)	lr 0.01302
Train [59][1350/3239]	Time 0.317 (0.984)	Data Time 0.029 (0.479)	Loss 2.6976 (2.6595)	Entropy 0.63066 (0.62835)	Top-1 acc 53.906 (59.745)	Top-5 acc 78.906 (81.168)	lr 0.01302
Train [59][1360/3239]	Time 0.248 (0.980)	Data Time 0.002 (0.476)	Loss 2.6229 (2.6596)	Entropy 0.63098 (0.62837)	Top-1 acc 62.500 (59.746)	Top-5 acc 79.688 (81.163)	lr 0.01302
Train [59][1370/3239]	Time 0.293 (0.976)	Data Time 0.002 (0.472)	Loss 2.3516 (2.6597)	Entropy 0.63150 (0.62839)	Top-1 acc 69.531 (59.745)	Top-5 acc 89.844 (81.160)	lr 0.01302
Train [59][1380/3239]	Time 0.232 (0.972)	Data Time 0.001 (0.469)	Loss 2.6480 (2.6596)	Entropy 0.63118 (0.62841)	Top-1 acc 60.156 (59.751)	Top-5 acc 80.859 (81.154)	lr 0.01301
Train [59][1390/3239]	Time 0.244 (0.970)	Data Time 0.001 (0.467)	Loss 2.7372 (2.6593)	Entropy 0.63097 (0.62843)	Top-1 acc 55.859 (59.761)	Top-5 acc 79.688 (81.159)	lr 0.01301
Train [59][1400/3239]	Time 4.724 (0.969)	Data Time 4.477 (0.467)	Loss 2.8039 (2.6592)	Entropy 0.63068 (0.62845)	Top-1 acc 53.125 (59.759)	Top-5 acc 78.516 (81.161)	lr 0.01301
Train [59][1410/3239]	Time 0.275 (0.969)	Data Time 0.001 (0.467)	Loss 2.7077 (2.6593)	Entropy 0.63061 (0.62846)	Top-1 acc 58.203 (59.763)	Top-5 acc 79.688 (81.160)	lr 0.01301
Train [59][1420/3239]	Time 8.090 (0.977)	Data Time 7.817 (0.476)	Loss 2.6457 (2.6595)	Entropy 0.63067 (0.62848)	Top-1 acc 61.328 (59.765)	Top-5 acc 78.906 (81.158)	lr 0.01301
Train [59][1430/3239]	Time 0.332 (0.973)	Data Time 0.001 (0.473)	Loss 2.6499 (2.6597)	Entropy 0.63077 (0.62849)	Top-1 acc 62.891 (59.760)	Top-5 acc 80.859 (81.153)	lr 0.01301
Train [59][1440/3239]	Time 0.232 (0.974)	Data Time 0.001 (0.474)	Loss 2.6002 (2.6594)	Entropy 0.63092 (0.62851)	Top-1 acc 65.234 (59.761)	Top-5 acc 83.984 (81.163)	lr 0.01301
Train [59][1450/3239]	Time 0.232 (0.981)	Data Time 0.001 (0.482)	Loss 2.6309 (2.6596)	Entropy 0.63077 (0.62853)	Top-1 acc 62.109 (59.759)	Top-5 acc 81.641 (81.163)	lr 0.01301
Train [59][1460/3239]	Time 2.033 (0.979)	Data Time 1.804 (0.480)	Loss 2.8286 (2.6599)	Entropy 0.63074 (0.62854)	Top-1 acc 55.469 (59.749)	Top-5 acc 78.125 (81.159)	lr 0.01301
Train [59][1470/3239]	Time 0.238 (0.978)	Data Time 0.001 (0.480)	Loss 2.5921 (2.6599)	Entropy 0.63042 (0.62856)	Top-1 acc 60.938 (59.751)	Top-5 acc 84.375 (81.160)	lr 0.01301
Train [59][1480/3239]	Time 0.231 (0.988)	Data Time 0.001 (0.490)	Loss 2.7174 (2.6601)	Entropy 0.63020 (0.62857)	Top-1 acc 61.328 (59.746)	Top-5 acc 79.688 (81.156)	lr 0.01300
Train [59][1490/3239]	Time 0.234 (0.986)	Data Time 0.001 (0.489)	Loss 2.8069 (2.6602)	Entropy 0.63034 (0.62858)	Top-1 acc 57.031 (59.748)	Top-5 acc 79.297 (81.154)	lr 0.01300
Train [59][1500/3239]	Time 0.334 (0.985)	Data Time 0.001 (0.488)	Loss 2.6802 (2.6606)	Entropy 0.63026 (0.62859)	Top-1 acc 60.156 (59.731)	Top-5 acc 79.297 (81.149)	lr 0.01300
Train [59][1510/3239]	Time 10.567 (0.993)	Data Time 10.325 (0.497)	Loss 2.6729 (2.6610)	Entropy 0.62998 (0.62860)	Top-1 acc 59.375 (59.717)	Top-5 acc 82.031 (81.140)	lr 0.01300
Train [59][1520/3239]	Time 0.246 (0.992)	Data Time 0.001 (0.497)	Loss 2.5392 (2.6612)	Entropy 0.62969 (0.62861)	Top-1 acc 62.500 (59.717)	Top-5 acc 82.812 (81.135)	lr 0.01300
Train [59][1530/3239]	Time 0.241 (0.994)	Data Time 0.001 (0.499)	Loss 2.6268 (2.6609)	Entropy 0.62942 (0.62862)	Top-1 acc 60.938 (59.725)	Top-5 acc 82.422 (81.141)	lr 0.01300
Train [59][1540/3239]	Time 0.239 (0.995)	Data Time 0.001 (0.500)	Loss 2.6480 (2.6611)	Entropy 0.62926 (0.62862)	Top-1 acc 58.984 (59.716)	Top-5 acc 81.250 (81.140)	lr 0.01300
Train [59][1550/3239]	Time 0.235 (1.001)	Data Time 0.001 (0.507)	Loss 2.5272 (2.6607)	Entropy 0.62914 (0.62863)	Top-1 acc 61.719 (59.724)	Top-5 acc 82.031 (81.149)	lr 0.01300
Train [59][1560/3239]	Time 0.233 (1.000)	Data Time 0.001 (0.507)	Loss 2.7398 (2.6606)	Entropy 0.62893 (0.62863)	Top-1 acc 58.984 (59.723)	Top-5 acc 80.469 (81.149)	lr 0.01300
Train [59][1570/3239]	Time 0.253 (1.001)	Data Time 0.001 (0.509)	Loss 2.6099 (2.6609)	Entropy 0.62884 (0.62863)	Top-1 acc 60.547 (59.714)	Top-5 acc 80.859 (81.144)	lr 0.01300
Train [59][1580/3239]	Time 1.132 (1.006)	Data Time 0.880 (0.513)	Loss 2.5593 (2.6613)	Entropy 0.62901 (0.62863)	Top-1 acc 64.453 (59.709)	Top-5 acc 83.984 (81.135)	lr 0.01299
Train [59][1590/3239]	Time 0.255 (1.006)	Data Time 0.001 (0.514)	Loss 2.7367 (2.6615)	Entropy 0.62939 (0.62864)	Top-1 acc 57.031 (59.714)	Top-5 acc 82.031 (81.131)	lr 0.01299
Train [59][1600/3239]	Time 0.229 (1.004)	Data Time 0.001 (0.513)	Loss 2.7838 (2.6617)	Entropy 0.62949 (0.62864)	Top-1 acc 58.984 (59.714)	Top-5 acc 78.906 (81.128)	lr 0.01299
Train [59][1610/3239]	Time 0.249 (1.015)	Data Time 0.001 (0.524)	Loss 2.7131 (2.6618)	Entropy 0.62928 (0.62865)	Top-1 acc 55.859 (59.708)	Top-5 acc 78.906 (81.124)	lr 0.01299
Train [59][1620/3239]	Time 5.629 (1.016)	Data Time 5.377 (0.525)	Loss 2.6576 (2.6616)	Entropy 0.62942 (0.62865)	Top-1 acc 54.297 (59.709)	Top-5 acc 81.641 (81.126)	lr 0.01299
Train [59][1630/3239]	Time 0.239 (1.012)	Data Time 0.001 (0.522)	Loss 2.5911 (2.6619)	Entropy 0.62938 (0.62865)	Top-1 acc 59.375 (59.701)	Top-5 acc 81.641 (81.117)	lr 0.01299
Train [59][1640/3239]	Time 0.257 (1.021)	Data Time 0.001 (0.531)	Loss 2.4150 (2.6616)	Entropy 0.62970 (0.62866)	Top-1 acc 64.453 (59.704)	Top-5 acc 88.281 (81.126)	lr 0.01299
Train [59][1650/3239]	Time 0.261 (1.022)	Data Time 0.001 (0.532)	Loss 2.5730 (2.6617)	Entropy 0.63012 (0.62867)	Top-1 acc 61.719 (59.704)	Top-5 acc 83.203 (81.126)	lr 0.01299
Train [59][1660/3239]	Time 0.363 (1.019)	Data Time 0.001 (0.531)	Loss 2.7530 (2.6618)	Entropy 0.63034 (0.62868)	Top-1 acc 58.203 (59.704)	Top-5 acc 79.688 (81.122)	lr 0.01299
Train [59][1670/3239]	Time 13.500 (1.025)	Data Time 13.230 (0.537)	Loss 2.7053 (2.6617)	Entropy 0.63023 (0.62869)	Top-1 acc 58.203 (59.704)	Top-5 acc 78.125 (81.123)	lr 0.01299
Train [59][1680/3239]	Time 0.235 (1.027)	Data Time 0.001 (0.539)	Loss 2.7688 (2.6621)	Entropy 0.63038 (0.62870)	Top-1 acc 57.031 (59.699)	Top-5 acc 81.250 (81.119)	lr 0.01298
Train [59][1690/3239]	Time 0.229 (1.024)	Data Time 0.001 (0.537)	Loss 2.6053 (2.6619)	Entropy 0.63065 (0.62871)	Top-1 acc 61.719 (59.706)	Top-5 acc 82.422 (81.125)	lr 0.01298
Train [59][1700/3239]	Time 0.239 (1.021)	Data Time 0.001 (0.534)	Loss 2.6153 (2.6621)	Entropy 0.63062 (0.62872)	Top-1 acc 57.422 (59.703)	Top-5 acc 83.203 (81.117)	lr 0.01298
Train [59][1710/3239]	Time 0.236 (1.030)	Data Time 0.001 (0.544)	Loss 2.8223 (2.6623)	Entropy 0.63023 (0.62873)	Top-1 acc 55.469 (59.697)	Top-5 acc 80.469 (81.118)	lr 0.01298
Train [59][1720/3239]	Time 0.251 (1.027)	Data Time 0.001 (0.540)	Loss 2.4775 (2.6621)	Entropy 0.63016 (0.62874)	Top-1 acc 65.625 (59.695)	Top-5 acc 82.422 (81.120)	lr 0.01298
Train [59][1730/3239]	Time 0.358 (1.023)	Data Time 0.001 (0.537)	Loss 2.7199 (2.6625)	Entropy 0.62995 (0.62874)	Top-1 acc 58.984 (59.687)	Top-5 acc 80.469 (81.117)	lr 0.01298
Train [59][1740/3239]	Time 3.392 (1.027)	Data Time 3.136 (0.542)	Loss 2.5728 (2.6623)	Entropy 0.62981 (0.62875)	Top-1 acc 60.938 (59.687)	Top-5 acc 82.031 (81.120)	lr 0.01298
Train [59][1750/3239]	Time 0.257 (1.024)	Data Time 0.001 (0.538)	Loss 2.6751 (2.6624)	Entropy 0.63019 (0.62876)	Top-1 acc 58.984 (59.689)	Top-5 acc 81.641 (81.118)	lr 0.01298
Train [59][1760/3239]	Time 0.254 (1.020)	Data Time 0.001 (0.535)	Loss 2.7010 (2.6623)	Entropy 0.63039 (0.62877)	Top-1 acc 56.250 (59.696)	Top-5 acc 79.297 (81.119)	lr 0.01298
Train [59][1770/3239]	Time 0.248 (1.022)	Data Time 0.001 (0.538)	Loss 2.7086 (2.6622)	Entropy 0.63032 (0.62877)	Top-1 acc 58.984 (59.697)	Top-5 acc 79.688 (81.121)	lr 0.01298
Train [59][1780/3239]	Time 0.232 (1.022)	Data Time 0.001 (0.538)	Loss 2.7763 (2.6619)	Entropy 0.63042 (0.62878)	Top-1 acc 54.688 (59.704)	Top-5 acc 78.516 (81.124)	lr 0.01297
Train [59][1790/3239]	Time 0.233 (1.019)	Data Time 0.001 (0.535)	Loss 2.7427 (2.6620)	Entropy 0.63044 (0.62879)	Top-1 acc 57.031 (59.702)	Top-5 acc 79.688 (81.123)	lr 0.01297
Train [59][1800/3239]	Time 0.243 (1.024)	Data Time 0.001 (0.541)	Loss 2.6320 (2.6619)	Entropy 0.63057 (0.62880)	Top-1 acc 62.109 (59.706)	Top-5 acc 83.203 (81.127)	lr 0.01297
Train [59][1810/3239]	Time 0.234 (1.027)	Data Time 0.001 (0.544)	Loss 2.5256 (2.6620)	Entropy 0.63047 (0.62881)	Top-1 acc 60.156 (59.702)	Top-5 acc 84.766 (81.125)	lr 0.01297
Train [59][1820/3239]	Time 0.357 (1.023)	Data Time 0.001 (0.541)	Loss 2.6753 (2.6619)	Entropy 0.63052 (0.62882)	Top-1 acc 57.422 (59.710)	Top-5 acc 80.078 (81.123)	lr 0.01297
Train [59][1830/3239]	Time 11.890 (1.029)	Data Time 11.644 (0.547)	Loss 2.6045 (2.6621)	Entropy 0.63059 (0.62883)	Top-1 acc 61.328 (59.705)	Top-5 acc 80.469 (81.118)	lr 0.01297
Train [59][1840/3239]	Time 0.230 (1.030)	Data Time 0.001 (0.548)	Loss 2.4569 (2.6618)	Entropy 0.63049 (0.62884)	Top-1 acc 66.016 (59.720)	Top-5 acc 85.547 (81.122)	lr 0.01297
Train [59][1850/3239]	Time 0.235 (1.026)	Data Time 0.001 (0.545)	Loss 2.4849 (2.6616)	Entropy 0.63018 (0.62885)	Top-1 acc 64.453 (59.728)	Top-5 acc 84.766 (81.126)	lr 0.01297
Train [59][1860/3239]	Time 0.229 (1.027)	Data Time 0.001 (0.546)	Loss 2.7568 (2.6619)	Entropy 0.63015 (0.62886)	Top-1 acc 59.766 (59.723)	Top-5 acc 76.562 (81.116)	lr 0.01297
Train [59][1870/3239]	Time 0.231 (1.036)	Data Time 0.001 (0.555)	Loss 2.6186 (2.6618)	Entropy 0.62982 (0.62886)	Top-1 acc 63.281 (59.727)	Top-5 acc 80.078 (81.115)	lr 0.01297
Train [59][1880/3239]	Time 0.237 (1.033)	Data Time 0.001 (0.552)	Loss 2.6629 (2.6616)	Entropy 0.63011 (0.62887)	Top-1 acc 61.328 (59.731)	Top-5 acc 81.641 (81.119)	lr 0.01296
Train [59][1890/3239]	Time 0.346 (1.029)	Data Time 0.001 (0.549)	Loss 2.6812 (2.6615)	Entropy 0.62999 (0.62887)	Top-1 acc 60.156 (59.736)	Top-5 acc 83.203 (81.124)	lr 0.01296
Train [59][1900/3239]	Time 0.253 (1.036)	Data Time 0.001 (0.556)	Loss 2.6323 (2.6620)	Entropy 0.63001 (0.62888)	Top-1 acc 59.766 (59.722)	Top-5 acc 82.031 (81.115)	lr 0.01296
Train [59][1910/3239]	Time 0.258 (1.033)	Data Time 0.001 (0.553)	Loss 2.4653 (2.6618)	Entropy 0.62989 (0.62889)	Top-1 acc 62.109 (59.725)	Top-5 acc 85.547 (81.120)	lr 0.01296
Train [59][1920/3239]	Time 0.223 (1.030)	Data Time 0.001 (0.550)	Loss 2.5556 (2.6615)	Entropy 0.63020 (0.62889)	Top-1 acc 62.891 (59.733)	Top-5 acc 83.203 (81.127)	lr 0.01296
Train [59][1930/3239]	Time 0.263 (1.032)	Data Time 0.001 (0.553)	Loss 2.6557 (2.6616)	Entropy 0.63052 (0.62890)	Top-1 acc 59.375 (59.725)	Top-5 acc 81.250 (81.124)	lr 0.01296
Train [59][1940/3239]	Time 0.249 (1.029)	Data Time 0.002 (0.550)	Loss 2.7037 (2.6617)	Entropy 0.63016 (0.62891)	Top-1 acc 58.203 (59.725)	Top-5 acc 81.250 (81.126)	lr 0.01296
Train [59][1950/3239]	Time 0.241 (1.026)	Data Time 0.001 (0.547)	Loss 2.4355 (2.6617)	Entropy 0.63022 (0.62891)	Top-1 acc 65.234 (59.725)	Top-5 acc 84.375 (81.126)	lr 0.01296
Train [59][1960/3239]	Time 0.228 (1.027)	Data Time 0.001 (0.548)	Loss 2.5769 (2.6616)	Entropy 0.62985 (0.62892)	Top-1 acc 61.719 (59.723)	Top-5 acc 82.031 (81.127)	lr 0.01296
Train [59][1970/3239]	Time 0.236 (1.025)	Data Time 0.001 (0.547)	Loss 2.7294 (2.6619)	Entropy 0.62974 (0.62892)	Top-1 acc 57.812 (59.714)	Top-5 acc 80.078 (81.127)	lr 0.01296
Train [59][1980/3239]	Time 0.299 (1.022)	Data Time 0.001 (0.544)	Loss 2.6310 (2.6619)	Entropy 0.62999 (0.62893)	Top-1 acc 58.984 (59.714)	Top-5 acc 81.641 (81.121)	lr 0.01295
Train [59][1990/3239]	Time 6.765 (1.022)	Data Time 6.465 (0.545)	Loss 2.8061 (2.6620)	Entropy 0.63021 (0.62893)	Top-1 acc 59.375 (59.709)	Top-5 acc 78.906 (81.119)	lr 0.01295
Train [59][2000/3239]	Time 0.331 (1.040)	Data Time 0.004 (0.544)	Loss 2.6260 (2.6620)	Entropy 0.63040 (0.62894)	Top-1 acc 60.547 (59.705)	Top-5 acc 82.422 (81.122)	lr 0.01295
Train [59][2010/3239]	Time 0.254 (1.037)	Data Time 0.002 (0.541)	Loss 2.5461 (2.6620)	Entropy 0.63030 (0.62895)	Top-1 acc 62.891 (59.704)	Top-5 acc 85.938 (81.123)	lr 0.01295
Train [59][2020/3239]	Time 0.256 (1.034)	Data Time 0.002 (0.539)	Loss 2.5433 (2.6619)	Entropy 0.63036 (0.62896)	Top-1 acc 64.453 (59.710)	Top-5 acc 85.156 (81.125)	lr 0.01295
Train [59][2030/3239]	Time 0.288 (1.031)	Data Time 0.001 (0.536)	Loss 2.6656 (2.6621)	Entropy 0.63063 (0.62896)	Top-1 acc 57.812 (59.704)	Top-5 acc 82.812 (81.123)	lr 0.01295
Train [59][2040/3239]	Time 0.248 (1.028)	Data Time 0.001 (0.534)	Loss 2.6265 (2.6624)	Entropy 0.63041 (0.62897)	Top-1 acc 59.766 (59.696)	Top-5 acc 81.641 (81.118)	lr 0.01295
Train [59][2050/3239]	Time 0.347 (1.025)	Data Time 0.001 (0.531)	Loss 2.7240 (2.6628)	Entropy 0.63023 (0.62898)	Top-1 acc 59.375 (59.688)	Top-5 acc 78.516 (81.104)	lr 0.01295
Train [59][2060/3239]	Time 0.234 (1.022)	Data Time 0.001 (0.528)	Loss 2.5341 (2.6628)	Entropy 0.63010 (0.62898)	Top-1 acc 62.500 (59.687)	Top-5 acc 85.156 (81.107)	lr 0.01295
Train [59][2070/3239]	Time 0.249 (1.026)	Data Time 0.002 (0.532)	Loss 2.6057 (2.6627)	Entropy 0.63021 (0.62899)	Top-1 acc 62.891 (59.693)	Top-5 acc 82.812 (81.106)	lr 0.01295
Train [59][2080/3239]	Time 0.239 (1.023)	Data Time 0.001 (0.529)	Loss 2.5862 (2.6625)	Entropy 0.63050 (0.62899)	Top-1 acc 61.719 (59.694)	Top-5 acc 83.203 (81.112)	lr 0.01294
Train [59][2090/3239]	Time 0.238 (1.021)	Data Time 0.001 (0.528)	Loss 2.8400 (2.6627)	Entropy 0.63035 (0.62900)	Top-1 acc 52.344 (59.690)	Top-5 acc 77.734 (81.109)	lr 0.01294
Train [59][2100/3239]	Time 0.319 (1.028)	Data Time 0.002 (0.535)	Loss 2.6445 (2.6628)	Entropy 0.63041 (0.62901)	Top-1 acc 59.375 (59.687)	Top-5 acc 81.250 (81.105)	lr 0.01294
Train [59][2110/3239]	Time 0.248 (1.028)	Data Time 0.001 (0.535)	Loss 2.6922 (2.6625)	Entropy 0.63036 (0.62901)	Top-1 acc 56.250 (59.688)	Top-5 acc 80.469 (81.109)	lr 0.01294
Train [59][2120/3239]	Time 0.233 (1.025)	Data Time 0.001 (0.532)	Loss 2.6770 (2.6624)	Entropy 0.63024 (0.62902)	Top-1 acc 57.422 (59.693)	Top-5 acc 82.422 (81.111)	lr 0.01294
Train [59][2130/3239]	Time 0.257 (1.032)	Data Time 0.002 (0.540)	Loss 2.6843 (2.6625)	Entropy 0.63002 (0.62903)	Top-1 acc 58.203 (59.692)	Top-5 acc 82.031 (81.110)	lr 0.01294
Train [59][2140/3239]	Time 0.347 (1.032)	Data Time 0.001 (0.540)	Loss 2.6324 (2.6624)	Entropy 0.62980 (0.62903)	Top-1 acc 62.500 (59.695)	Top-5 acc 80.078 (81.109)	lr 0.01294
Train [59][2150/3239]	Time 0.250 (1.029)	Data Time 0.001 (0.537)	Loss 2.4636 (2.6620)	Entropy 0.63001 (0.62903)	Top-1 acc 64.453 (59.706)	Top-5 acc 87.500 (81.116)	lr 0.01294
Train [59][2160/3239]	Time 18.345 (1.035)	Data Time 18.079 (0.543)	Loss 2.6265 (2.6619)	Entropy 0.62990 (0.62904)	Top-1 acc 60.547 (59.709)	Top-5 acc 81.250 (81.116)	lr 0.01294
Train [59][2170/3239]	Time 0.232 (1.036)	Data Time 0.001 (0.545)	Loss 2.8254 (2.6624)	Entropy 0.62983 (0.62904)	Top-1 acc 57.812 (59.706)	Top-5 acc 77.734 (81.105)	lr 0.01294
Train [59][2180/3239]	Time 0.248 (1.033)	Data Time 0.001 (0.543)	Loss 2.3203 (2.6622)	Entropy 0.63014 (0.62905)	Top-1 acc 63.672 (59.711)	Top-5 acc 88.672 (81.109)	lr 0.01293
Train [59][2190/3239]	Time 0.224 (1.031)	Data Time 0.001 (0.541)	Loss 2.6210 (2.6621)	Entropy 0.62979 (0.62905)	Top-1 acc 61.719 (59.714)	Top-5 acc 82.031 (81.111)	lr 0.01293
Train [59][2200/3239]	Time 8.414 (1.041)	Data Time 8.137 (0.550)	Loss 2.7826 (2.6617)	Entropy 0.62990 (0.62905)	Top-1 acc 58.594 (59.728)	Top-5 acc 80.859 (81.116)	lr 0.01293
Train [59][2210/3239]	Time 0.390 (1.038)	Data Time 0.001 (0.548)	Loss 2.6975 (2.6621)	Entropy 0.62956 (0.62906)	Top-1 acc 57.422 (59.719)	Top-5 acc 80.469 (81.111)	lr 0.01293
Train [59][2220/3239]	Time 0.259 (1.035)	Data Time 0.001 (0.546)	Loss 2.7213 (2.6625)	Entropy 0.62951 (0.62906)	Top-1 acc 57.812 (59.708)	Top-5 acc 81.641 (81.108)	lr 0.01293
Train [59][2230/3239]	Time 0.239 (1.039)	Data Time 0.001 (0.549)	Loss 2.6328 (2.6623)	Entropy 0.62972 (0.62906)	Top-1 acc 60.938 (59.717)	Top-5 acc 82.812 (81.108)	lr 0.01293
Train [59][2240/3239]	Time 0.260 (1.041)	Data Time 0.001 (0.551)	Loss 2.7713 (2.6622)	Entropy 0.62957 (0.62906)	Top-1 acc 55.078 (59.720)	Top-5 acc 81.250 (81.111)	lr 0.01293
Train [59][2250/3239]	Time 0.241 (1.038)	Data Time 0.001 (0.549)	Loss 2.6661 (2.6624)	Entropy 0.62945 (0.62907)	Top-1 acc 60.547 (59.715)	Top-5 acc 80.078 (81.108)	lr 0.01293
Train [59][2260/3239]	Time 0.243 (1.043)	Data Time 0.001 (0.554)	Loss 2.5392 (2.6623)	Entropy 0.62946 (0.62907)	Top-1 acc 61.719 (59.717)	Top-5 acc 82.812 (81.110)	lr 0.01293
Train [59][2270/3239]	Time 0.276 (1.045)	Data Time 0.001 (0.557)	Loss 2.7117 (2.6625)	Entropy 0.62958 (0.62907)	Top-1 acc 60.156 (59.709)	Top-5 acc 81.250 (81.103)	lr 0.01293
Train [59][2280/3239]	Time 0.231 (1.042)	Data Time 0.001 (0.555)	Loss 2.8751 (2.6627)	Entropy 0.62950 (0.62907)	Top-1 acc 54.688 (59.703)	Top-5 acc 75.391 (81.100)	lr 0.01292
Train [59][2290/3239]	Time 0.243 (1.046)	Data Time 0.001 (0.559)	Loss 2.8145 (2.6629)	Entropy 0.62911 (0.62907)	Top-1 acc 55.859 (59.699)	Top-5 acc 80.078 (81.097)	lr 0.01292
Train [59][2300/3239]	Time 0.245 (1.048)	Data Time 0.001 (0.561)	Loss 2.7814 (2.6629)	Entropy 0.62931 (0.62907)	Top-1 acc 55.469 (59.697)	Top-5 acc 82.031 (81.100)	lr 0.01292
Train [59][2310/3239]	Time 0.256 (1.046)	Data Time 0.001 (0.559)	Loss 2.6483 (2.6627)	Entropy 0.62946 (0.62908)	Top-1 acc 60.156 (59.705)	Top-5 acc 83.203 (81.104)	lr 0.01292
Train [59][2320/3239]	Time 14.130 (1.049)	Data Time 13.817 (0.562)	Loss 2.7314 (2.6626)	Entropy 0.62918 (0.62908)	Top-1 acc 60.938 (59.705)	Top-5 acc 81.641 (81.104)	lr 0.01292
Train [59][2330/3239]	Time 0.233 (1.051)	Data Time 0.001 (0.564)	Loss 2.7184 (2.6626)	Entropy 0.62935 (0.62908)	Top-1 acc 57.812 (59.699)	Top-5 acc 80.078 (81.104)	lr 0.01292
Train [59][2340/3239]	Time 0.241 (1.048)	Data Time 0.001 (0.562)	Loss 2.7626 (2.6627)	Entropy 0.62948 (0.62908)	Top-1 acc 58.203 (59.696)	Top-5 acc 79.297 (81.106)	lr 0.01292
Train [59][2350/3239]	Time 0.263 (1.046)	Data Time 0.001 (0.560)	Loss 2.5570 (2.6626)	Entropy 0.62940 (0.62908)	Top-1 acc 64.453 (59.698)	Top-5 acc 80.859 (81.106)	lr 0.01292
Train [59][2360/3239]	Time 0.684 (1.054)	Data Time 0.434 (0.569)	Loss 2.6635 (2.6624)	Entropy 0.62915 (0.62908)	Top-1 acc 62.500 (59.707)	Top-5 acc 80.078 (81.108)	lr 0.01292
Train [59][2370/3239]	Time 0.328 (1.052)	Data Time 0.001 (0.567)	Loss 2.6513 (2.6625)	Entropy 0.62889 (0.62908)	Top-1 acc 58.984 (59.707)	Top-5 acc 83.594 (81.106)	lr 0.01292
Train [59][2380/3239]	Time 0.234 (1.049)	Data Time 0.001 (0.564)	Loss 2.5645 (2.6625)	Entropy 0.62856 (0.62908)	Top-1 acc 62.891 (59.710)	Top-5 acc 84.375 (81.107)	lr 0.01291
Train [59][2390/3239]	Time 0.256 (1.055)	Data Time 0.001 (0.571)	Loss 2.4869 (2.6624)	Entropy 0.62858 (0.62908)	Top-1 acc 63.672 (59.709)	Top-5 acc 85.156 (81.109)	lr 0.01291
Train [59][2400/3239]	Time 0.235 (1.055)	Data Time 0.001 (0.571)	Loss 2.4618 (2.6623)	Entropy 0.62851 (0.62908)	Top-1 acc 63.672 (59.712)	Top-5 acc 84.375 (81.112)	lr 0.01291
Train [59][2410/3239]	Time 0.235 (1.053)	Data Time 0.001 (0.568)	Loss 2.7071 (2.6623)	Entropy 0.62854 (0.62907)	Top-1 acc 60.156 (59.713)	Top-5 acc 80.469 (81.110)	lr 0.01291
Train [59][2420/3239]	Time 0.238 (1.059)	Data Time 0.002 (0.575)	Loss 2.8521 (2.6621)	Entropy 0.62857 (0.62907)	Top-1 acc 57.422 (59.716)	Top-5 acc 77.734 (81.114)	lr 0.01291
Train [59][2430/3239]	Time 0.242 (1.060)	Data Time 0.001 (0.577)	Loss 2.7398 (2.6623)	Entropy 0.62893 (0.62907)	Top-1 acc 60.156 (59.713)	Top-5 acc 77.734 (81.110)	lr 0.01291
Train [59][2440/3239]	Time 0.324 (1.057)	Data Time 0.001 (0.574)	Loss 2.7565 (2.6624)	Entropy 0.62904 (0.62907)	Top-1 acc 58.594 (59.712)	Top-5 acc 77.734 (81.111)	lr 0.01291
Train [59][2450/3239]	Time 0.246 (1.062)	Data Time 0.001 (0.579)	Loss 2.8873 (2.6625)	Entropy 0.62917 (0.62907)	Top-1 acc 52.344 (59.711)	Top-5 acc 76.172 (81.106)	lr 0.01291
Train [59][2460/3239]	Time 0.229 (1.064)	Data Time 0.001 (0.582)	Loss 2.6762 (2.6624)	Entropy 0.62873 (0.62907)	Top-1 acc 60.938 (59.711)	Top-5 acc 78.516 (81.105)	lr 0.01291
Train [59][2470/3239]	Time 0.233 (1.062)	Data Time 0.001 (0.580)	Loss 2.7491 (2.6625)	Entropy 0.62882 (0.62907)	Top-1 acc 57.422 (59.711)	Top-5 acc 78.125 (81.103)	lr 0.01290
Train [59][2480/3239]	Time 9.602 (1.064)	Data Time 9.363 (0.582)	Loss 2.7491 (2.6625)	Entropy 0.62872 (0.62907)	Top-1 acc 57.031 (59.710)	Top-5 acc 80.078 (81.102)	lr 0.01290
Train [59][2490/3239]	Time 0.224 (1.069)	Data Time 0.001 (0.587)	Loss 2.7949 (2.6626)	Entropy 0.62874 (0.62907)	Top-1 acc 56.641 (59.704)	Top-5 acc 78.125 (81.101)	lr 0.01290
Train [59][2500/3239]	Time 0.240 (1.066)	Data Time 0.001 (0.585)	Loss 2.6094 (2.6627)	Entropy 0.62838 (0.62906)	Top-1 acc 59.375 (59.702)	Top-5 acc 82.422 (81.100)	lr 0.01290
Train [59][2510/3239]	Time 0.263 (1.064)	Data Time 0.001 (0.583)	Loss 2.6712 (2.6628)	Entropy 0.62834 (0.62906)	Top-1 acc 57.031 (59.694)	Top-5 acc 83.203 (81.096)	lr 0.01290
Train [59][2520/3239]	Time 0.228 (1.076)	Data Time 0.001 (0.595)	Loss 2.7202 (2.6629)	Entropy 0.62856 (0.62906)	Top-1 acc 54.297 (59.688)	Top-5 acc 80.469 (81.095)	lr 0.01290
Train [59][2530/3239]	Time 0.324 (1.073)	Data Time 0.001 (0.593)	Loss 2.6418 (2.6629)	Entropy 0.62857 (0.62906)	Top-1 acc 62.109 (59.692)	Top-5 acc 85.547 (81.099)	lr 0.01290
Train [59][2540/3239]	Time 0.250 (1.071)	Data Time 0.001 (0.590)	Loss 2.6410 (2.6629)	Entropy 0.62874 (0.62906)	Top-1 acc 59.766 (59.691)	Top-5 acc 81.250 (81.099)	lr 0.01290
Train [59][2550/3239]	Time 0.240 (1.075)	Data Time 0.001 (0.595)	Loss 2.6060 (2.6630)	Entropy 0.62894 (0.62906)	Top-1 acc 61.328 (59.689)	Top-5 acc 82.031 (81.097)	lr 0.01290
Train [59][2560/3239]	Time 0.265 (1.075)	Data Time 0.002 (0.595)	Loss 2.6085 (2.6631)	Entropy 0.62905 (0.62906)	Top-1 acc 61.328 (59.687)	Top-5 acc 80.469 (81.092)	lr 0.01290
Train [59][2570/3239]	Time 0.235 (1.072)	Data Time 0.001 (0.593)	Loss 2.6740 (2.6628)	Entropy 0.62916 (0.62906)	Top-1 acc 60.547 (59.696)	Top-5 acc 80.469 (81.095)	lr 0.01289
Train [59][2580/3239]	Time 0.246 (1.075)	Data Time 0.002 (0.596)	Loss 2.7326 (2.6628)	Entropy 0.62956 (0.62906)	Top-1 acc 57.031 (59.691)	Top-5 acc 81.250 (81.096)	lr 0.01289
Train [59][2590/3239]	Time 0.242 (1.080)	Data Time 0.001 (0.601)	Loss 2.7330 (2.6630)	Entropy 0.62958 (0.62906)	Top-1 acc 61.328 (59.689)	Top-5 acc 76.562 (81.092)	lr 0.01289
Train [59][2600/3239]	Time 0.329 (1.077)	Data Time 0.001 (0.599)	Loss 2.4866 (2.6630)	Entropy 0.62958 (0.62906)	Top-1 acc 64.062 (59.690)	Top-5 acc 83.203 (81.094)	lr 0.01289
Train [59][2610/3239]	Time 0.229 (1.081)	Data Time 0.001 (0.603)	Loss 2.8124 (2.6628)	Entropy 0.62937 (0.62906)	Top-1 acc 52.344 (59.689)	Top-5 acc 79.688 (81.101)	lr 0.01289
Train [59][2620/3239]	Time 0.235 (1.084)	Data Time 0.001 (0.606)	Loss 2.6867 (2.6631)	Entropy 0.62940 (0.62906)	Top-1 acc 55.859 (59.681)	Top-5 acc 82.031 (81.096)	lr 0.01289
Train [59][2630/3239]	Time 0.230 (1.081)	Data Time 0.002 (0.604)	Loss 2.8273 (2.6632)	Entropy 0.62937 (0.62906)	Top-1 acc 55.469 (59.677)	Top-5 acc 78.125 (81.091)	lr 0.01289
Train [59][2640/3239]	Time 6.845 (1.081)	Data Time 6.596 (0.604)	Loss 2.4554 (2.6634)	Entropy 0.62877 (0.62906)	Top-1 acc 66.016 (59.675)	Top-5 acc 84.375 (81.087)	lr 0.01289
Train [59][2650/3239]	Time 0.241 (1.086)	Data Time 0.001 (0.609)	Loss 2.6914 (2.6637)	Entropy 0.62901 (0.62906)	Top-1 acc 62.891 (59.668)	Top-5 acc 78.516 (81.079)	lr 0.01289
Train [59][2660/3239]	Time 0.318 (1.096)	Data Time 0.004 (0.606)	Loss 2.6290 (2.6636)	Entropy 0.62945 (0.62906)	Top-1 acc 63.281 (59.672)	Top-5 acc 81.250 (81.079)	lr 0.01289
Train [59][2670/3239]	Time 0.238 (1.094)	Data Time 0.002 (0.604)	Loss 2.7243 (2.6636)	Entropy 0.62957 (0.62907)	Top-1 acc 53.516 (59.676)	Top-5 acc 81.641 (81.079)	lr 0.01288
Train [59][2680/3239]	Time 0.256 (1.092)	Data Time 0.002 (0.602)	Loss 2.6408 (2.6637)	Entropy 0.62966 (0.62907)	Top-1 acc 58.984 (59.666)	Top-5 acc 79.688 (81.074)	lr 0.01288
Train [59][2690/3239]	Time 0.357 (1.089)	Data Time 0.001 (0.600)	Loss 2.7596 (2.6639)	Entropy 0.62947 (0.62907)	Top-1 acc 56.641 (59.661)	Top-5 acc 79.688 (81.072)	lr 0.01288
Train [59][2700/3239]	Time 0.260 (1.087)	Data Time 0.001 (0.597)	Loss 2.6515 (2.6636)	Entropy 0.62959 (0.62907)	Top-1 acc 60.938 (59.664)	Top-5 acc 78.125 (81.077)	lr 0.01288
Train [59][2710/3239]	Time 0.240 (1.087)	Data Time 0.001 (0.598)	Loss 2.5326 (2.6634)	Entropy 0.62996 (0.62907)	Top-1 acc 60.938 (59.671)	Top-5 acc 83.984 (81.082)	lr 0.01288
Train [59][2720/3239]	Time 0.234 (1.087)	Data Time 0.001 (0.598)	Loss 2.9937 (2.6636)	Entropy 0.63042 (0.62908)	Top-1 acc 50.391 (59.665)	Top-5 acc 77.734 (81.079)	lr 0.01288
Train [59][2730/3239]	Time 1.173 (1.085)	Data Time 0.914 (0.596)	Loss 2.5620 (2.6639)	Entropy 0.63046 (0.62908)	Top-1 acc 62.109 (59.658)	Top-5 acc 84.375 (81.073)	lr 0.01288
Train [59][2740/3239]	Time 0.260 (1.086)	Data Time 0.002 (0.598)	Loss 2.4788 (2.6640)	Entropy 0.63044 (0.62909)	Top-1 acc 64.062 (59.660)	Top-5 acc 84.375 (81.076)	lr 0.01288
Train [59][2750/3239]	Time 0.244 (1.088)	Data Time 0.001 (0.600)	Loss 2.9746 (2.6642)	Entropy 0.63042 (0.62909)	Top-1 acc 56.641 (59.660)	Top-5 acc 74.609 (81.068)	lr 0.01288
Train [59][2760/3239]	Time 0.342 (1.087)	Data Time 0.001 (0.599)	Loss 2.4797 (2.6643)	Entropy 0.63032 (0.62910)	Top-1 acc 60.547 (59.656)	Top-5 acc 84.375 (81.063)	lr 0.01288
Train [59][2770/3239]	Time 0.229 (1.088)	Data Time 0.001 (0.601)	Loss 2.6552 (2.6642)	Entropy 0.63053 (0.62910)	Top-1 acc 57.812 (59.662)	Top-5 acc 81.250 (81.067)	lr 0.01287
Train [59][2780/3239]	Time 0.237 (1.090)	Data Time 0.001 (0.602)	Loss 2.6404 (2.6644)	Entropy 0.63045 (0.62911)	Top-1 acc 57.031 (59.654)	Top-5 acc 82.422 (81.061)	lr 0.01287
Train [59][2790/3239]	Time 0.249 (1.089)	Data Time 0.001 (0.602)	Loss 2.4963 (2.6644)	Entropy 0.63048 (0.62911)	Top-1 acc 60.938 (59.654)	Top-5 acc 83.594 (81.063)	lr 0.01287
Train [59][2800/3239]	Time 3.600 (1.089)	Data Time 3.351 (0.602)	Loss 2.6081 (2.6645)	Entropy 0.63037 (0.62912)	Top-1 acc 61.328 (59.651)	Top-5 acc 83.984 (81.063)	lr 0.01287
Train [59][2810/3239]	Time 0.236 (1.091)	Data Time 0.001 (0.605)	Loss 2.8217 (2.6646)	Entropy 0.63041 (0.62912)	Top-1 acc 58.203 (59.652)	Top-5 acc 79.688 (81.063)	lr 0.01287
Train [59][2820/3239]	Time 0.250 (1.091)	Data Time 0.001 (0.605)	Loss 2.6399 (2.6646)	Entropy 0.63064 (0.62913)	Top-1 acc 61.719 (59.651)	Top-5 acc 81.641 (81.059)	lr 0.01287
Train [59][2830/3239]	Time 0.951 (1.090)	Data Time 0.699 (0.604)	Loss 2.8441 (2.6645)	Entropy 0.63055 (0.62913)	Top-1 acc 57.422 (59.653)	Top-5 acc 77.344 (81.061)	lr 0.01287
Train [59][2840/3239]	Time 2.502 (1.094)	Data Time 2.236 (0.608)	Loss 2.6021 (2.6647)	Entropy 0.63055 (0.62914)	Top-1 acc 62.500 (59.651)	Top-5 acc 78.516 (81.055)	lr 0.01287
Train [59][2850/3239]	Time 2.138 (1.092)	Data Time 1.793 (0.606)	Loss 2.7140 (2.6647)	Entropy 0.63053 (0.62914)	Top-1 acc 55.859 (59.648)	Top-5 acc 82.812 (81.056)	lr 0.01287
Train [59][2860/3239]	Time 0.240 (1.092)	Data Time 0.001 (0.607)	Loss 2.6627 (2.6650)	Entropy 0.63024 (0.62915)	Top-1 acc 57.031 (59.641)	Top-5 acc 80.859 (81.055)	lr 0.01287
Train [59][2870/3239]	Time 0.246 (1.095)	Data Time 0.002 (0.609)	Loss 2.7070 (2.6652)	Entropy 0.62976 (0.62915)	Top-1 acc 58.594 (59.634)	Top-5 acc 79.297 (81.049)	lr 0.01286
Train [59][2880/3239]	Time 0.264 (1.093)	Data Time 0.037 (0.608)	Loss 2.7369 (2.6653)	Entropy 0.62995 (0.62915)	Top-1 acc 58.203 (59.636)	Top-5 acc 75.000 (81.043)	lr 0.01286
Train [59][2890/3239]	Time 0.364 (1.094)	Data Time 0.125 (0.609)	Loss 2.6494 (2.6650)	Entropy 0.62962 (0.62916)	Top-1 acc 59.766 (59.640)	Top-5 acc 80.859 (81.043)	lr 0.01286
Train [59][2900/3239]	Time 0.265 (1.093)	Data Time 0.002 (0.608)	Loss 2.5936 (2.6653)	Entropy 0.62950 (0.62916)	Top-1 acc 58.984 (59.632)	Top-5 acc 83.203 (81.039)	lr 0.01286
Train [59][2910/3239]	Time 0.228 (1.096)	Data Time 0.001 (0.611)	Loss 2.7008 (2.6653)	Entropy 0.62922 (0.62916)	Top-1 acc 57.812 (59.629)	Top-5 acc 81.641 (81.038)	lr 0.01286
Train [59][2920/3239]	Time 0.353 (1.096)	Data Time 0.001 (0.612)	Loss 2.6199 (2.6653)	Entropy 0.62875 (0.62916)	Top-1 acc 60.938 (59.629)	Top-5 acc 81.250 (81.042)	lr 0.01286
Train [59][2930/3239]	Time 0.239 (1.096)	Data Time 0.001 (0.612)	Loss 2.6488 (2.6654)	Entropy 0.62913 (0.62916)	Top-1 acc 62.891 (59.626)	Top-5 acc 80.859 (81.039)	lr 0.01286
Train [59][2940/3239]	Time 0.240 (1.097)	Data Time 0.001 (0.613)	Loss 2.6165 (2.6654)	Entropy 0.62881 (0.62916)	Top-1 acc 58.594 (59.625)	Top-5 acc 82.422 (81.038)	lr 0.01286
Train [59][2950/3239]	Time 0.235 (1.098)	Data Time 0.001 (0.614)	Loss 2.5158 (2.6654)	Entropy 0.62884 (0.62916)	Top-1 acc 62.500 (59.621)	Top-5 acc 83.984 (81.037)	lr 0.01286
Train [59][2960/3239]	Time 0.230 (1.098)	Data Time 0.001 (0.615)	Loss 2.6491 (2.6654)	Entropy 0.62892 (0.62915)	Top-1 acc 60.547 (59.621)	Top-5 acc 79.297 (81.037)	lr 0.01286
Train [59][2970/3239]	Time 0.231 (1.099)	Data Time 0.001 (0.616)	Loss 2.8034 (2.6654)	Entropy 0.62918 (0.62915)	Top-1 acc 53.125 (59.621)	Top-5 acc 79.688 (81.038)	lr 0.01285
Train [59][2980/3239]	Time 0.291 (1.100)	Data Time 0.001 (0.617)	Loss 2.4342 (2.6655)	Entropy 0.62932 (0.62915)	Top-1 acc 67.578 (59.622)	Top-5 acc 84.375 (81.036)	lr 0.01285
Train [59][2990/3239]	Time 7.407 (1.100)	Data Time 7.034 (0.617)	Loss 2.4853 (2.6652)	Entropy 0.62911 (0.62915)	Top-1 acc 62.891 (59.625)	Top-5 acc 82.422 (81.039)	lr 0.01285
Train [59][3000/3239]	Time 4.749 (1.100)	Data Time 4.494 (0.618)	Loss 2.5235 (2.6654)	Entropy 0.62893 (0.62915)	Top-1 acc 65.234 (59.625)	Top-5 acc 83.984 (81.035)	lr 0.01285
Train [59][3010/3239]	Time 0.242 (1.100)	Data Time 0.001 (0.617)	Loss 2.5669 (2.6653)	Entropy 0.62918 (0.62915)	Top-1 acc 60.547 (59.627)	Top-5 acc 83.984 (81.037)	lr 0.01285
Train [59][3020/3239]	Time 0.241 (1.100)	Data Time 0.001 (0.618)	Loss 2.6629 (2.6654)	Entropy 0.62907 (0.62915)	Top-1 acc 59.766 (59.628)	Top-5 acc 81.250 (81.036)	lr 0.01285
Train [59][3030/3239]	Time 0.257 (1.100)	Data Time 0.001 (0.619)	Loss 2.6566 (2.6655)	Entropy 0.62905 (0.62915)	Top-1 acc 57.812 (59.623)	Top-5 acc 79.297 (81.033)	lr 0.01285
Train [59][3040/3239]	Time 3.764 (1.101)	Data Time 3.500 (0.619)	Loss 2.4985 (2.6653)	Entropy 0.62880 (0.62915)	Top-1 acc 64.844 (59.626)	Top-5 acc 83.984 (81.037)	lr 0.01285
Train [59][3050/3239]	Time 0.236 (1.101)	Data Time 0.001 (0.620)	Loss 2.7080 (2.6653)	Entropy 0.62866 (0.62915)	Top-1 acc 58.984 (59.630)	Top-5 acc 79.688 (81.033)	lr 0.01285
Train [59][3060/3239]	Time 0.252 (1.101)	Data Time 0.001 (0.620)	Loss 2.7173 (2.6652)	Entropy 0.62865 (0.62915)	Top-1 acc 60.938 (59.638)	Top-5 acc 81.250 (81.033)	lr 0.01285
Train [59][3070/3239]	Time 0.247 (1.102)	Data Time 0.001 (0.621)	Loss 2.7288 (2.6652)	Entropy 0.62855 (0.62915)	Top-1 acc 59.375 (59.635)	Top-5 acc 79.688 (81.031)	lr 0.01284
Train [59][3080/3239]	Time 0.335 (1.103)	Data Time 0.001 (0.623)	Loss 2.7393 (2.6652)	Entropy 0.62883 (0.62915)	Top-1 acc 57.422 (59.635)	Top-5 acc 80.078 (81.034)	lr 0.01284
Train [59][3090/3239]	Time 0.238 (1.103)	Data Time 0.001 (0.623)	Loss 2.5898 (2.6653)	Entropy 0.62856 (0.62914)	Top-1 acc 61.719 (59.634)	Top-5 acc 83.203 (81.033)	lr 0.01284
Train [59][3100/3239]	Time 1.762 (1.104)	Data Time 1.508 (0.623)	Loss 2.6376 (2.6653)	Entropy 0.62868 (0.62914)	Top-1 acc 60.938 (59.639)	Top-5 acc 82.812 (81.033)	lr 0.01284
Train [59][3110/3239]	Time 0.270 (1.105)	Data Time 0.002 (0.625)	Loss 2.7454 (2.6653)	Entropy 0.62856 (0.62914)	Top-1 acc 58.594 (59.636)	Top-5 acc 79.297 (81.034)	lr 0.01284
Train [59][3120/3239]	Time 0.234 (1.105)	Data Time 0.001 (0.626)	Loss 2.5590 (2.6651)	Entropy 0.62881 (0.62914)	Top-1 acc 66.016 (59.643)	Top-5 acc 83.984 (81.039)	lr 0.01284
Train [59][3130/3239]	Time 0.248 (1.104)	Data Time 0.002 (0.624)	Loss 2.6790 (2.6649)	Entropy 0.62887 (0.62914)	Top-1 acc 58.203 (59.648)	Top-5 acc 78.516 (81.042)	lr 0.01284
Train [59][3140/3239]	Time 0.235 (1.107)	Data Time 0.001 (0.627)	Loss 2.4770 (2.6648)	Entropy 0.62904 (0.62914)	Top-1 acc 61.719 (59.648)	Top-5 acc 85.156 (81.042)	lr 0.01284
Train [59][3150/3239]	Time 3.836 (1.107)	Data Time 3.500 (0.628)	Loss 2.8825 (2.6650)	Entropy 0.62931 (0.62914)	Top-1 acc 58.984 (59.647)	Top-5 acc 76.172 (81.042)	lr 0.01284
Train [59][3160/3239]	Time 1.519 (1.106)	Data Time 1.278 (0.626)	Loss 2.6255 (2.6650)	Entropy 0.62947 (0.62914)	Top-1 acc 59.766 (59.647)	Top-5 acc 83.984 (81.045)	lr 0.01284
Train [59][3170/3239]	Time 0.255 (1.107)	Data Time 0.001 (0.628)	Loss 2.5895 (2.6648)	Entropy 0.62953 (0.62914)	Top-1 acc 60.938 (59.653)	Top-5 acc 81.641 (81.047)	lr 0.01283
Train [59][3180/3239]	Time 0.235 (1.108)	Data Time 0.000 (0.630)	Loss 2.6593 (2.6648)	Entropy 0.62961 (0.62914)	Top-1 acc 58.594 (59.654)	Top-5 acc 82.031 (81.046)	lr 0.01283
Train [59][3190/3239]	Time 0.227 (1.108)	Data Time 0.000 (0.630)	Loss 2.6970 (2.6648)	Entropy 0.62983 (0.62914)	Top-1 acc 60.156 (59.654)	Top-5 acc 82.812 (81.047)	lr 0.01283
Train [59][3200/3239]	Time 0.223 (1.109)	Data Time 0.000 (0.631)	Loss 2.5352 (2.6647)	Entropy 0.62975 (0.62914)	Top-1 acc 62.109 (59.655)	Top-5 acc 84.766 (81.048)	lr 0.01283
Train [59][3210/3239]	Time 7.748 (1.110)	Data Time 7.492 (0.632)	Loss 2.5748 (2.6646)	Entropy 0.62985 (0.62915)	Top-1 acc 58.594 (59.659)	Top-5 acc 82.812 (81.052)	lr 0.01283
Train [59][3220/3239]	Time 0.235 (1.109)	Data Time 0.000 (0.631)	Loss 2.6433 (2.6645)	Entropy 0.62987 (0.62915)	Top-1 acc 58.203 (59.663)	Top-5 acc 81.641 (81.054)	lr 0.01283
Train [59][3230/3239]	Time 0.236 (1.109)	Data Time 0.000 (0.631)	Loss 2.5350 (2.6645)	Entropy 0.62978 (0.62915)	Top-1 acc 60.938 (59.662)	Top-5 acc 81.641 (81.054)	lr 0.01283
Train [59][3239/3239]	Time 0.808 (1.107)	Data Time 0.000 (0.629)	Loss 2.8146 (2.6646)	Entropy 0.62981 (0.62915)	Top-1 acc 55.556 (59.662)	Top-5 acc 79.012 (81.053)	lr 0.01283
==========Valid [59/120]	loss 1.409	top-1 acc 67.653 (67.653)	top-5 acc 87.279	Train top-1 59.662	top-5 81.053	Entropy 0.62981	Latency-None: 0.000ms	Flops: 538.40M
Train [60][0/3239]	Time 49.415 (49.415)	Data Time 48.782 (48.782)	Loss 2.6305 (2.6305)	Entropy 0.62972 (0.62972)	Top-1 acc 63.672 (63.672)	Top-5 acc 82.422 (82.422)	lr 0.01283
Train [60][10/3239]	Time 0.239 (5.316)	Data Time 0.001 (4.840)	Loss 2.7600 (2.6266)	Entropy 0.62985 (0.62977)	Top-1 acc 54.688 (61.719)	Top-5 acc 77.734 (81.818)	lr 0.01283
Train [60][20/3239]	Time 0.248 (2.973)	Data Time 0.001 (2.536)	Loss 2.6137 (2.6511)	Entropy 0.62983 (0.62982)	Top-1 acc 62.500 (60.975)	Top-5 acc 81.641 (81.083)	lr 0.01283
Train [60][30/3239]	Time 0.231 (2.144)	Data Time 0.001 (1.718)	Loss 2.7758 (2.6643)	Entropy 0.62996 (0.62981)	Top-1 acc 53.906 (60.207)	Top-5 acc 82.812 (80.885)	lr 0.01282
Train [60][40/3239]	Time 0.254 (1.982)	Data Time 0.001 (1.549)	Loss 2.6012 (2.6525)	Entropy 0.62965 (0.62981)	Top-1 acc 62.500 (60.242)	Top-5 acc 81.250 (81.374)	lr 0.01282
Train [60][50/3239]	Time 0.331 (1.674)	Data Time 0.001 (1.245)	Loss 2.5514 (2.6488)	Entropy 0.62982 (0.62980)	Top-1 acc 62.500 (60.417)	Top-5 acc 83.594 (81.480)	lr 0.01282
Train [60][60/3239]	Time 0.258 (1.467)	Data Time 0.001 (1.041)	Loss 2.4409 (2.6387)	Entropy 0.63012 (0.62982)	Top-1 acc 61.328 (60.489)	Top-5 acc 85.156 (81.653)	lr 0.01282
Train [60][70/3239]	Time 0.421 (1.937)	Data Time 0.005 (1.028)	Loss 2.5716 (2.6361)	Entropy 0.63010 (0.62987)	Top-1 acc 61.719 (60.530)	Top-5 acc 83.984 (81.707)	lr 0.01282
Train [60][80/3239]	Time 0.229 (1.757)	Data Time 0.002 (0.901)	Loss 2.5382 (2.6363)	Entropy 0.62986 (0.62987)	Top-1 acc 62.891 (60.561)	Top-5 acc 84.375 (81.771)	lr 0.01282
Train [60][90/3239]	Time 0.225 (1.606)	Data Time 0.001 (0.803)	Loss 2.5018 (2.6357)	Entropy 0.62972 (0.62987)	Top-1 acc 63.672 (60.603)	Top-5 acc 86.328 (81.782)	lr 0.01282
Train [60][100/3239]	Time 0.234 (1.489)	Data Time 0.001 (0.723)	Loss 2.7685 (2.6351)	Entropy 0.62952 (0.62983)	Top-1 acc 53.516 (60.555)	Top-5 acc 80.078 (81.838)	lr 0.01282
Train [60][110/3239]	Time 0.239 (1.392)	Data Time 0.001 (0.658)	Loss 2.4813 (2.6357)	Entropy 0.62969 (0.62981)	Top-1 acc 65.625 (60.533)	Top-5 acc 85.547 (81.827)	lr 0.01282
Train [60][120/3239]	Time 0.237 (1.313)	Data Time 0.001 (0.604)	Loss 2.6155 (2.6370)	Entropy 0.62962 (0.62979)	Top-1 acc 62.500 (60.528)	Top-5 acc 80.859 (81.808)	lr 0.01282
Train [60][130/3239]	Time 0.235 (1.246)	Data Time 0.001 (0.558)	Loss 3.0646 (2.6454)	Entropy 0.62963 (0.62978)	Top-1 acc 50.000 (60.264)	Top-5 acc 74.609 (81.608)	lr 0.01281
Train [60][140/3239]	Time 0.407 (1.189)	Data Time 0.002 (0.519)	Loss 2.4589 (2.6457)	Entropy 0.62953 (0.62977)	Top-1 acc 64.453 (60.256)	Top-5 acc 85.938 (81.560)	lr 0.01281
Train [60][150/3239]	Time 0.251 (1.140)	Data Time 0.001 (0.484)	Loss 2.4581 (2.6469)	Entropy 0.62939 (0.62975)	Top-1 acc 64.062 (60.239)	Top-5 acc 85.547 (81.506)	lr 0.01281
Train [60][160/3239]	Time 0.251 (1.097)	Data Time 0.001 (0.454)	Loss 2.3886 (2.6440)	Entropy 0.62918 (0.62972)	Top-1 acc 69.531 (60.338)	Top-5 acc 85.938 (81.546)	lr 0.01281
Train [60][170/3239]	Time 0.251 (1.106)	Data Time 0.001 (0.476)	Loss 2.5114 (2.6445)	Entropy 0.62928 (0.62969)	Top-1 acc 64.453 (60.341)	Top-5 acc 83.203 (81.510)	lr 0.01281
Train [60][180/3239]	Time 0.228 (1.081)	Data Time 0.001 (0.463)	Loss 2.6472 (2.6465)	Entropy 0.62932 (0.62967)	Top-1 acc 61.328 (60.277)	Top-5 acc 80.859 (81.477)	lr 0.01281
Train [60][190/3239]	Time 0.255 (1.057)	Data Time 0.001 (0.448)	Loss 2.9805 (2.6467)	Entropy 0.62942 (0.62965)	Top-1 acc 55.859 (60.254)	Top-5 acc 76.953 (81.465)	lr 0.01281
Train [60][200/3239]	Time 0.237 (1.054)	Data Time 0.001 (0.454)	Loss 2.6706 (2.6486)	Entropy 0.62967 (0.62964)	Top-1 acc 62.500 (60.290)	Top-5 acc 79.688 (81.433)	lr 0.01281
Train [60][210/3239]	Time 0.379 (1.039)	Data Time 0.001 (0.447)	Loss 2.5947 (2.6469)	Entropy 0.62974 (0.62964)	Top-1 acc 62.500 (60.365)	Top-5 acc 83.594 (81.474)	lr 0.01281
Train [60][220/3239]	Time 0.259 (1.036)	Data Time 0.001 (0.452)	Loss 2.4997 (2.6469)	Entropy 0.62967 (0.62965)	Top-1 acc 65.234 (60.317)	Top-5 acc 84.375 (81.457)	lr 0.01280
Train [60][230/3239]	Time 0.238 (1.023)	Data Time 0.001 (0.447)	Loss 2.5539 (2.6477)	Entropy 0.62996 (0.62965)	Top-1 acc 64.062 (60.290)	Top-5 acc 82.812 (81.438)	lr 0.01280
Train [60][240/3239]	Time 0.254 (1.011)	Data Time 0.002 (0.440)	Loss 2.4782 (2.6479)	Entropy 0.62990 (0.62966)	Top-1 acc 59.375 (60.218)	Top-5 acc 85.938 (81.472)	lr 0.01280
Train [60][250/3239]	Time 0.248 (1.002)	Data Time 0.001 (0.438)	Loss 2.8641 (2.6484)	Entropy 0.63014 (0.62968)	Top-1 acc 53.125 (60.194)	Top-5 acc 77.344 (81.477)	lr 0.01280
Train [60][260/3239]	Time 0.246 (0.991)	Data Time 0.001 (0.432)	Loss 2.6727 (2.6463)	Entropy 0.63020 (0.62969)	Top-1 acc 61.328 (60.258)	Top-5 acc 81.641 (81.509)	lr 0.01280
Train [60][270/3239]	Time 0.234 (0.994)	Data Time 0.001 (0.441)	Loss 2.7669 (2.6468)	Entropy 0.63021 (0.62971)	Top-1 acc 58.203 (60.240)	Top-5 acc 80.078 (81.489)	lr 0.01280
Train [60][280/3239]	Time 0.230 (0.996)	Data Time 0.001 (0.448)	Loss 2.6356 (2.6483)	Entropy 0.63008 (0.62973)	Top-1 acc 61.719 (60.219)	Top-5 acc 79.688 (81.442)	lr 0.01280
Train [60][290/3239]	Time 0.232 (0.980)	Data Time 0.001 (0.436)	Loss 2.7349 (2.6492)	Entropy 0.62980 (0.62974)	Top-1 acc 57.422 (60.214)	Top-5 acc 78.906 (81.415)	lr 0.01280
Train [60][300/3239]	Time 0.330 (0.976)	Data Time 0.001 (0.437)	Loss 2.5729 (2.6492)	Entropy 0.62997 (0.62974)	Top-1 acc 62.500 (60.225)	Top-5 acc 83.594 (81.410)	lr 0.01280
Train [60][310/3239]	Time 0.238 (0.977)	Data Time 0.001 (0.441)	Loss 2.6812 (2.6492)	Entropy 0.62991 (0.62975)	Top-1 acc 61.719 (60.199)	Top-5 acc 81.641 (81.411)	lr 0.01280
Train [60][320/3239]	Time 0.245 (0.969)	Data Time 0.001 (0.437)	Loss 2.8866 (2.6502)	Entropy 0.62965 (0.62975)	Top-1 acc 54.688 (60.224)	Top-5 acc 75.781 (81.409)	lr 0.01279
Train [60][330/3239]	Time 0.234 (0.976)	Data Time 0.001 (0.448)	Loss 2.5292 (2.6521)	Entropy 0.62956 (0.62975)	Top-1 acc 62.500 (60.185)	Top-5 acc 82.422 (81.369)	lr 0.01279
Train [60][340/3239]	Time 0.219 (0.981)	Data Time 0.001 (0.456)	Loss 2.9319 (2.6544)	Entropy 0.62955 (0.62975)	Top-1 acc 55.469 (60.132)	Top-5 acc 73.828 (81.311)	lr 0.01279
Train [60][350/3239]	Time 0.245 (0.965)	Data Time 0.001 (0.444)	Loss 2.6080 (2.6536)	Entropy 0.63013 (0.62975)	Top-1 acc 60.547 (60.147)	Top-5 acc 82.422 (81.329)	lr 0.01279
Train [60][360/3239]	Time 0.870 (0.969)	Data Time 0.632 (0.450)	Loss 2.6780 (2.6535)	Entropy 0.63024 (0.62976)	Top-1 acc 62.891 (60.166)	Top-5 acc 79.688 (81.335)	lr 0.01279
Train [60][370/3239]	Time 0.367 (0.972)	Data Time 0.001 (0.455)	Loss 2.6282 (2.6532)	Entropy 0.63037 (0.62977)	Top-1 acc 62.500 (60.177)	Top-5 acc 80.859 (81.336)	lr 0.01279
Train [60][380/3239]	Time 0.237 (0.961)	Data Time 0.001 (0.447)	Loss 2.6843 (2.6539)	Entropy 0.62998 (0.62979)	Top-1 acc 60.938 (60.171)	Top-5 acc 80.469 (81.323)	lr 0.01279
Train [60][390/3239]	Time 0.230 (0.951)	Data Time 0.002 (0.440)	Loss 2.7225 (2.6537)	Entropy 0.62993 (0.62979)	Top-1 acc 57.031 (60.155)	Top-5 acc 77.734 (81.321)	lr 0.01279
Train [60][400/3239]	Time 0.246 (0.957)	Data Time 0.001 (0.447)	Loss 2.4289 (2.6515)	Entropy 0.62963 (0.62979)	Top-1 acc 64.844 (60.199)	Top-5 acc 86.719 (81.382)	lr 0.01279
Train [60][410/3239]	Time 0.231 (0.965)	Data Time 0.001 (0.457)	Loss 2.6718 (2.6524)	Entropy 0.62965 (0.62978)	Top-1 acc 57.422 (60.184)	Top-5 acc 79.297 (81.342)	lr 0.01279
Train [60][420/3239]	Time 0.232 (0.952)	Data Time 0.001 (0.447)	Loss 2.5544 (2.6525)	Entropy 0.62924 (0.62978)	Top-1 acc 61.719 (60.155)	Top-5 acc 82.812 (81.331)	lr 0.01278
Train [60][430/3239]	Time 0.255 (0.953)	Data Time 0.001 (0.449)	Loss 2.5259 (2.6515)	Entropy 0.62929 (0.62977)	Top-1 acc 64.453 (60.170)	Top-5 acc 84.766 (81.346)	lr 0.01278
Train [60][440/3239]	Time 0.235 (0.962)	Data Time 0.001 (0.459)	Loss 2.6262 (2.6500)	Entropy 0.62928 (0.62976)	Top-1 acc 60.547 (60.205)	Top-5 acc 82.422 (81.373)	lr 0.01278
Train [60][450/3239]	Time 0.234 (0.949)	Data Time 0.001 (0.449)	Loss 2.6088 (2.6503)	Entropy 0.62888 (0.62974)	Top-1 acc 63.281 (60.187)	Top-5 acc 81.250 (81.359)	lr 0.01278
Train [60][460/3239]	Time 6.727 (0.956)	Data Time 6.336 (0.457)	Loss 2.5413 (2.6509)	Entropy 0.62888 (0.62973)	Top-1 acc 63.672 (60.160)	Top-5 acc 83.203 (81.347)	lr 0.01278
Train [60][470/3239]	Time 0.261 (0.965)	Data Time 0.001 (0.467)	Loss 2.8071 (2.6501)	Entropy 0.62863 (0.62970)	Top-1 acc 55.859 (60.168)	Top-5 acc 75.391 (81.348)	lr 0.01278
Train [60][480/3239]	Time 0.238 (0.954)	Data Time 0.001 (0.457)	Loss 2.4910 (2.6508)	Entropy 0.62874 (0.62968)	Top-1 acc 63.672 (60.147)	Top-5 acc 85.938 (81.330)	lr 0.01278
Train [60][490/3239]	Time 0.232 (0.944)	Data Time 0.001 (0.450)	Loss 2.6200 (2.6514)	Entropy 0.62913 (0.62967)	Top-1 acc 59.375 (60.122)	Top-5 acc 82.031 (81.326)	lr 0.01278
Train [60][500/3239]	Time 0.253 (0.963)	Data Time 0.002 (0.470)	Loss 2.6021 (2.6511)	Entropy 0.62913 (0.62966)	Top-1 acc 64.453 (60.125)	Top-5 acc 81.250 (81.333)	lr 0.01278
Train [60][510/3239]	Time 0.252 (0.953)	Data Time 0.002 (0.461)	Loss 2.6103 (2.6497)	Entropy 0.62913 (0.62964)	Top-1 acc 59.766 (60.163)	Top-5 acc 83.203 (81.346)	lr 0.01278
Train [60][520/3239]	Time 0.231 (0.945)	Data Time 0.001 (0.455)	Loss 2.5691 (2.6501)	Entropy 0.62920 (0.62964)	Top-1 acc 60.938 (60.137)	Top-5 acc 83.594 (81.341)	lr 0.01277
Train [60][530/3239]	Time 0.314 (0.946)	Data Time 0.001 (0.457)	Loss 2.4045 (2.6486)	Entropy 0.62889 (0.62963)	Top-1 acc 64.453 (60.158)	Top-5 acc 84.375 (81.371)	lr 0.01277
Train [60][540/3239]	Time 0.240 (0.950)	Data Time 0.001 (0.463)	Loss 2.8256 (2.6484)	Entropy 0.62907 (0.62961)	Top-1 acc 51.172 (60.153)	Top-5 acc 80.859 (81.395)	lr 0.01277
Train [60][550/3239]	Time 0.235 (0.940)	Data Time 0.001 (0.454)	Loss 2.7484 (2.6495)	Entropy 0.62906 (0.62960)	Top-1 acc 57.812 (60.119)	Top-5 acc 80.078 (81.375)	lr 0.01277
Train [60][560/3239]	Time 0.236 (0.951)	Data Time 0.001 (0.466)	Loss 2.7020 (2.6493)	Entropy 0.62921 (0.62959)	Top-1 acc 56.641 (60.126)	Top-5 acc 79.297 (81.370)	lr 0.01277
Train [60][570/3239]	Time 0.225 (0.951)	Data Time 0.001 (0.468)	Loss 2.7090 (2.6495)	Entropy 0.62969 (0.62959)	Top-1 acc 58.984 (60.117)	Top-5 acc 79.688 (81.372)	lr 0.01277
Train [60][580/3239]	Time 0.236 (0.942)	Data Time 0.001 (0.460)	Loss 2.8106 (2.6498)	Entropy 0.62937 (0.62959)	Top-1 acc 53.125 (60.107)	Top-5 acc 79.688 (81.365)	lr 0.01277
Train [60][590/3239]	Time 0.330 (0.949)	Data Time 0.001 (0.468)	Loss 2.4655 (2.6495)	Entropy 0.62957 (0.62959)	Top-1 acc 64.062 (60.114)	Top-5 acc 85.547 (81.362)	lr 0.01277
Train [60][600/3239]	Time 0.231 (0.951)	Data Time 0.001 (0.471)	Loss 2.6902 (2.6497)	Entropy 0.62913 (0.62959)	Top-1 acc 58.984 (60.120)	Top-5 acc 81.641 (81.357)	lr 0.01277
Train [60][610/3239]	Time 0.232 (0.942)	Data Time 0.001 (0.463)	Loss 2.5586 (2.6499)	Entropy 0.62908 (0.62958)	Top-1 acc 61.328 (60.119)	Top-5 acc 83.594 (81.348)	lr 0.01277
Train [60][620/3239]	Time 9.566 (0.949)	Data Time 9.245 (0.471)	Loss 2.5809 (2.6500)	Entropy 0.62901 (0.62957)	Top-1 acc 62.109 (60.112)	Top-5 acc 80.859 (81.355)	lr 0.01276
Train [60][630/3239]	Time 0.222 (0.953)	Data Time 0.001 (0.476)	Loss 2.7578 (2.6494)	Entropy 0.62897 (0.62956)	Top-1 acc 56.641 (60.140)	Top-5 acc 79.688 (81.359)	lr 0.01276
Train [60][640/3239]	Time 0.507 (0.944)	Data Time 0.262 (0.469)	Loss 2.5252 (2.6484)	Entropy 0.62913 (0.62955)	Top-1 acc 62.891 (60.167)	Top-5 acc 85.156 (81.379)	lr 0.01276
Train [60][650/3239]	Time 0.240 (0.936)	Data Time 0.001 (0.462)	Loss 2.7163 (2.6477)	Entropy 0.62872 (0.62955)	Top-1 acc 61.328 (60.170)	Top-5 acc 81.641 (81.383)	lr 0.01276
Train [60][660/3239]	Time 0.251 (0.952)	Data Time 0.001 (0.479)	Loss 2.5748 (2.6470)	Entropy 0.62850 (0.62953)	Top-1 acc 59.375 (60.180)	Top-5 acc 82.812 (81.394)	lr 0.01276
Train [60][670/3239]	Time 0.233 (0.944)	Data Time 0.001 (0.472)	Loss 2.6881 (2.6472)	Entropy 0.62819 (0.62951)	Top-1 acc 56.641 (60.186)	Top-5 acc 82.812 (81.386)	lr 0.01276
Train [60][680/3239]	Time 0.252 (0.940)	Data Time 0.001 (0.468)	Loss 2.5888 (2.6478)	Entropy 0.62792 (0.62949)	Top-1 acc 63.672 (60.172)	Top-5 acc 81.641 (81.373)	lr 0.01276
Train [60][690/3239]	Time 4.699 (0.951)	Data Time 4.356 (0.480)	Loss 2.7227 (2.6468)	Entropy 0.62821 (0.62947)	Top-1 acc 55.469 (60.185)	Top-5 acc 80.469 (81.401)	lr 0.01276
Train [60][700/3239]	Time 0.238 (0.946)	Data Time 0.001 (0.476)	Loss 2.6375 (2.6468)	Entropy 0.62820 (0.62945)	Top-1 acc 60.156 (60.203)	Top-5 acc 81.250 (81.392)	lr 0.01276
Train [60][710/3239]	Time 0.254 (0.946)	Data Time 0.001 (0.477)	Loss 2.8158 (2.6473)	Entropy 0.62805 (0.62944)	Top-1 acc 54.297 (60.191)	Top-5 acc 78.125 (81.387)	lr 0.01276
Train [60][720/3239]	Time 0.247 (0.949)	Data Time 0.001 (0.480)	Loss 2.6075 (2.6474)	Entropy 0.62821 (0.62942)	Top-1 acc 62.891 (60.190)	Top-5 acc 83.203 (81.390)	lr 0.01275
Train [60][730/3239]	Time 0.276 (0.998)	Data Time 0.004 (0.482)	Loss 2.5627 (2.6474)	Entropy 0.62813 (0.62940)	Top-1 acc 64.062 (60.203)	Top-5 acc 83.203 (81.386)	lr 0.01275
Train [60][740/3239]	Time 0.245 (0.990)	Data Time 0.001 (0.476)	Loss 2.4688 (2.6470)	Entropy 0.62764 (0.62938)	Top-1 acc 63.281 (60.204)	Top-5 acc 83.594 (81.399)	lr 0.01275
Train [60][750/3239]	Time 0.237 (0.982)	Data Time 0.001 (0.470)	Loss 2.6247 (2.6465)	Entropy 0.62713 (0.62935)	Top-1 acc 59.766 (60.221)	Top-5 acc 81.641 (81.404)	lr 0.01275
Train [60][760/3239]	Time 0.259 (0.975)	Data Time 0.001 (0.463)	Loss 2.6483 (2.6464)	Entropy 0.62747 (0.62933)	Top-1 acc 60.938 (60.218)	Top-5 acc 81.641 (81.404)	lr 0.01275
Train [60][770/3239]	Time 0.248 (0.968)	Data Time 0.001 (0.458)	Loss 2.6410 (2.6462)	Entropy 0.62750 (0.62930)	Top-1 acc 62.891 (60.230)	Top-5 acc 83.203 (81.413)	lr 0.01275
Train [60][780/3239]	Time 0.256 (0.961)	Data Time 0.001 (0.452)	Loss 2.5698 (2.6464)	Entropy 0.62742 (0.62928)	Top-1 acc 61.328 (60.215)	Top-5 acc 81.250 (81.402)	lr 0.01275
Train [60][790/3239]	Time 0.232 (0.958)	Data Time 0.001 (0.450)	Loss 2.6770 (2.6469)	Entropy 0.62754 (0.62926)	Top-1 acc 57.031 (60.216)	Top-5 acc 82.031 (81.393)	lr 0.01275
Train [60][800/3239]	Time 0.272 (0.956)	Data Time 0.001 (0.450)	Loss 2.6778 (2.6475)	Entropy 0.62745 (0.62924)	Top-1 acc 59.766 (60.211)	Top-5 acc 80.859 (81.382)	lr 0.01275
Train [60][810/3239]	Time 0.231 (0.950)	Data Time 0.001 (0.444)	Loss 2.3969 (2.6482)	Entropy 0.62743 (0.62921)	Top-1 acc 62.891 (60.192)	Top-5 acc 85.156 (81.366)	lr 0.01275
Train [60][820/3239]	Time 0.254 (0.955)	Data Time 0.001 (0.450)	Loss 2.8837 (2.6487)	Entropy 0.62738 (0.62919)	Top-1 acc 53.516 (60.174)	Top-5 acc 76.562 (81.355)	lr 0.01274
Train [60][830/3239]	Time 0.238 (0.960)	Data Time 0.001 (0.457)	Loss 2.5020 (2.6485)	Entropy 0.62729 (0.62917)	Top-1 acc 64.844 (60.172)	Top-5 acc 83.984 (81.351)	lr 0.01274
Train [60][840/3239]	Time 0.295 (0.954)	Data Time 0.003 (0.451)	Loss 2.6652 (2.6492)	Entropy 0.62734 (0.62915)	Top-1 acc 61.719 (60.153)	Top-5 acc 80.078 (81.351)	lr 0.01274
Train [60][850/3239]	Time 4.908 (0.956)	Data Time 4.547 (0.453)	Loss 2.4818 (2.6492)	Entropy 0.62721 (0.62913)	Top-1 acc 66.797 (60.150)	Top-5 acc 85.547 (81.356)	lr 0.01274
Train [60][860/3239]	Time 0.242 (0.967)	Data Time 0.001 (0.464)	Loss 2.5337 (2.6484)	Entropy 0.62731 (0.62910)	Top-1 acc 61.328 (60.169)	Top-5 acc 82.422 (81.372)	lr 0.01274
Train [60][870/3239]	Time 0.230 (0.961)	Data Time 0.001 (0.459)	Loss 2.5423 (2.6481)	Entropy 0.62702 (0.62908)	Top-1 acc 62.109 (60.177)	Top-5 acc 83.594 (81.375)	lr 0.01274
Train [60][880/3239]	Time 0.243 (0.955)	Data Time 0.001 (0.455)	Loss 2.6528 (2.6487)	Entropy 0.62694 (0.62906)	Top-1 acc 60.938 (60.167)	Top-5 acc 83.594 (81.359)	lr 0.01274
Train [60][890/3239]	Time 0.245 (0.960)	Data Time 0.001 (0.460)	Loss 2.3093 (2.6488)	Entropy 0.62727 (0.62904)	Top-1 acc 69.531 (60.172)	Top-5 acc 88.281 (81.358)	lr 0.01274
Train [60][900/3239]	Time 0.238 (0.968)	Data Time 0.001 (0.469)	Loss 2.7270 (2.6496)	Entropy 0.62679 (0.62901)	Top-1 acc 57.031 (60.155)	Top-5 acc 81.250 (81.355)	lr 0.01274
Train [60][910/3239]	Time 0.236 (0.962)	Data Time 0.001 (0.464)	Loss 2.6885 (2.6500)	Entropy 0.62689 (0.62899)	Top-1 acc 60.156 (60.146)	Top-5 acc 80.859 (81.342)	lr 0.01274
Train [60][920/3239]	Time 0.349 (0.965)	Data Time 0.002 (0.468)	Loss 2.7109 (2.6498)	Entropy 0.62680 (0.62897)	Top-1 acc 58.594 (60.144)	Top-5 acc 80.859 (81.346)	lr 0.01273
Train [60][930/3239]	Time 0.239 (0.972)	Data Time 0.001 (0.475)	Loss 2.5924 (2.6495)	Entropy 0.62673 (0.62894)	Top-1 acc 62.109 (60.158)	Top-5 acc 81.250 (81.345)	lr 0.01273
Train [60][940/3239]	Time 0.236 (0.966)	Data Time 0.001 (0.470)	Loss 2.7104 (2.6496)	Entropy 0.62685 (0.62892)	Top-1 acc 62.109 (60.148)	Top-5 acc 80.469 (81.336)	lr 0.01273
Train [60][950/3239]	Time 1.113 (0.967)	Data Time 0.854 (0.472)	Loss 2.7878 (2.6499)	Entropy 0.62674 (0.62890)	Top-1 acc 57.031 (60.135)	Top-5 acc 80.078 (81.334)	lr 0.01273
Train [60][960/3239]	Time 0.253 (0.975)	Data Time 0.001 (0.481)	Loss 2.6543 (2.6500)	Entropy 0.62689 (0.62888)	Top-1 acc 57.031 (60.120)	Top-5 acc 83.203 (81.337)	lr 0.01273
Train [60][970/3239]	Time 0.249 (0.970)	Data Time 0.001 (0.476)	Loss 2.6758 (2.6496)	Entropy 0.62718 (0.62886)	Top-1 acc 58.594 (60.130)	Top-5 acc 82.031 (81.352)	lr 0.01273
Train [60][980/3239]	Time 0.244 (0.969)	Data Time 0.001 (0.476)	Loss 2.4777 (2.6492)	Entropy 0.62694 (0.62884)	Top-1 acc 65.234 (60.125)	Top-5 acc 85.547 (81.360)	lr 0.01273
Train [60][990/3239]	Time 0.244 (0.984)	Data Time 0.001 (0.491)	Loss 2.4335 (2.6493)	Entropy 0.62728 (0.62882)	Top-1 acc 65.234 (60.115)	Top-5 acc 85.547 (81.356)	lr 0.01273
Train [60][1000/3239]	Time 0.230 (0.978)	Data Time 0.001 (0.487)	Loss 2.8139 (2.6498)	Entropy 0.62665 (0.62880)	Top-1 acc 57.812 (60.107)	Top-5 acc 80.078 (81.348)	lr 0.01273
Train [60][1010/3239]	Time 0.325 (0.973)	Data Time 0.001 (0.482)	Loss 2.8431 (2.6500)	Entropy 0.62683 (0.62878)	Top-1 acc 53.906 (60.098)	Top-5 acc 76.562 (81.343)	lr 0.01273
Train [60][1020/3239]	Time 0.237 (0.991)	Data Time 0.001 (0.501)	Loss 2.6527 (2.6499)	Entropy 0.62669 (0.62876)	Top-1 acc 58.594 (60.099)	Top-5 acc 79.297 (81.340)	lr 0.01272
Train [60][1030/3239]	Time 0.229 (0.985)	Data Time 0.001 (0.496)	Loss 2.7078 (2.6504)	Entropy 0.62691 (0.62874)	Top-1 acc 55.078 (60.084)	Top-5 acc 78.906 (81.330)	lr 0.01272
Train [60][1040/3239]	Time 0.247 (0.980)	Data Time 0.001 (0.491)	Loss 2.6866 (2.6506)	Entropy 0.62685 (0.62872)	Top-1 acc 60.938 (60.086)	Top-5 acc 80.859 (81.324)	lr 0.01272
Train [60][1050/3239]	Time 0.243 (0.979)	Data Time 0.001 (0.491)	Loss 2.5448 (2.6505)	Entropy 0.62707 (0.62871)	Top-1 acc 64.062 (60.087)	Top-5 acc 82.812 (81.322)	lr 0.01272
Train [60][1060/3239]	Time 0.258 (0.988)	Data Time 0.001 (0.500)	Loss 2.7577 (2.6509)	Entropy 0.62707 (0.62869)	Top-1 acc 60.156 (60.076)	Top-5 acc 76.953 (81.311)	lr 0.01272
Train [60][1070/3239]	Time 0.249 (0.982)	Data Time 0.001 (0.495)	Loss 2.6837 (2.6512)	Entropy 0.62692 (0.62868)	Top-1 acc 58.203 (60.068)	Top-5 acc 82.422 (81.309)	lr 0.01272
Train [60][1080/3239]	Time 0.374 (0.985)	Data Time 0.001 (0.498)	Loss 2.5660 (2.6506)	Entropy 0.62687 (0.62866)	Top-1 acc 60.547 (60.080)	Top-5 acc 82.812 (81.323)	lr 0.01272
Train [60][1090/3239]	Time 0.260 (0.993)	Data Time 0.004 (0.507)	Loss 2.5394 (2.6506)	Entropy 0.62707 (0.62865)	Top-1 acc 65.234 (60.076)	Top-5 acc 81.641 (81.314)	lr 0.01272
Train [60][1100/3239]	Time 0.239 (0.987)	Data Time 0.001 (0.503)	Loss 2.7603 (2.6505)	Entropy 0.62684 (0.62863)	Top-1 acc 54.688 (60.079)	Top-5 acc 79.688 (81.313)	lr 0.01272
Train [60][1110/3239]	Time 8.194 (0.992)	Data Time 7.911 (0.508)	Loss 2.7231 (2.6507)	Entropy 0.62685 (0.62861)	Top-1 acc 56.250 (60.068)	Top-5 acc 80.469 (81.315)	lr 0.01272
Train [60][1120/3239]	Time 0.235 (0.996)	Data Time 0.001 (0.512)	Loss 2.7711 (2.6508)	Entropy 0.62692 (0.62860)	Top-1 acc 59.375 (60.070)	Top-5 acc 79.688 (81.311)	lr 0.01271
Train [60][1130/3239]	Time 0.250 (0.991)	Data Time 0.002 (0.508)	Loss 2.6544 (2.6514)	Entropy 0.62724 (0.62859)	Top-1 acc 62.109 (60.064)	Top-5 acc 78.516 (81.291)	lr 0.01271
Train [60][1140/3239]	Time 0.256 (0.989)	Data Time 0.001 (0.507)	Loss 2.6132 (2.6515)	Entropy 0.62710 (0.62857)	Top-1 acc 61.719 (60.061)	Top-5 acc 83.203 (81.289)	lr 0.01271
Train [60][1150/3239]	Time 0.233 (1.001)	Data Time 0.001 (0.520)	Loss 2.4933 (2.6510)	Entropy 0.62729 (0.62856)	Top-1 acc 67.188 (60.075)	Top-5 acc 85.156 (81.299)	lr 0.01271
Train [60][1160/3239]	Time 0.235 (0.996)	Data Time 0.001 (0.515)	Loss 2.7283 (2.6511)	Entropy 0.62743 (0.62855)	Top-1 acc 59.766 (60.070)	Top-5 acc 80.078 (81.302)	lr 0.01271
Train [60][1170/3239]	Time 0.254 (0.991)	Data Time 0.001 (0.511)	Loss 2.5885 (2.6515)	Entropy 0.62776 (0.62854)	Top-1 acc 62.891 (60.065)	Top-5 acc 82.812 (81.288)	lr 0.01271
Train [60][1180/3239]	Time 0.225 (1.006)	Data Time 0.001 (0.526)	Loss 2.5025 (2.6513)	Entropy 0.62781 (0.62854)	Top-1 acc 61.719 (60.065)	Top-5 acc 82.031 (81.294)	lr 0.01271
Train [60][1190/3239]	Time 0.226 (1.001)	Data Time 0.001 (0.522)	Loss 2.7169 (2.6510)	Entropy 0.62795 (0.62853)	Top-1 acc 58.203 (60.072)	Top-5 acc 80.078 (81.299)	lr 0.01271
Train [60][1200/3239]	Time 0.248 (0.996)	Data Time 0.001 (0.518)	Loss 2.7065 (2.6510)	Entropy 0.62798 (0.62853)	Top-1 acc 57.422 (60.076)	Top-5 acc 79.688 (81.294)	lr 0.01271
Train [60][1210/3239]	Time 0.232 (1.004)	Data Time 0.001 (0.526)	Loss 2.6118 (2.6508)	Entropy 0.62783 (0.62852)	Top-1 acc 60.156 (60.084)	Top-5 acc 81.250 (81.306)	lr 0.01271
Train [60][1220/3239]	Time 0.236 (1.007)	Data Time 0.001 (0.530)	Loss 2.5746 (2.6506)	Entropy 0.62772 (0.62851)	Top-1 acc 63.672 (60.091)	Top-5 acc 82.422 (81.306)	lr 0.01270
Train [60][1230/3239]	Time 0.244 (1.002)	Data Time 0.001 (0.525)	Loss 2.4797 (2.6508)	Entropy 0.62760 (0.62851)	Top-1 acc 64.062 (60.088)	Top-5 acc 82.812 (81.302)	lr 0.01270
Train [60][1240/3239]	Time 0.339 (1.009)	Data Time 0.001 (0.533)	Loss 2.9930 (2.6509)	Entropy 0.62766 (0.62850)	Top-1 acc 50.000 (60.083)	Top-5 acc 73.438 (81.302)	lr 0.01270
Train [60][1250/3239]	Time 0.237 (1.010)	Data Time 0.001 (0.534)	Loss 2.8451 (2.6513)	Entropy 0.62793 (0.62849)	Top-1 acc 53.906 (60.070)	Top-5 acc 76.562 (81.297)	lr 0.01270
Train [60][1260/3239]	Time 3.772 (1.008)	Data Time 3.544 (0.533)	Loss 2.8073 (2.6512)	Entropy 0.62783 (0.62849)	Top-1 acc 54.688 (60.069)	Top-5 acc 81.250 (81.304)	lr 0.01270
Train [60][1270/3239]	Time 12.208 (1.014)	Data Time 11.963 (0.539)	Loss 2.5725 (2.6510)	Entropy 0.62787 (0.62848)	Top-1 acc 58.203 (60.071)	Top-5 acc 82.031 (81.303)	lr 0.01270
Train [60][1280/3239]	Time 0.243 (1.016)	Data Time 0.001 (0.542)	Loss 2.6335 (2.6510)	Entropy 0.62800 (0.62848)	Top-1 acc 60.938 (60.065)	Top-5 acc 79.688 (81.310)	lr 0.01270
Train [60][1290/3239]	Time 0.231 (1.012)	Data Time 0.001 (0.538)	Loss 2.6054 (2.6509)	Entropy 0.62833 (0.62848)	Top-1 acc 62.500 (60.069)	Top-5 acc 85.547 (81.316)	lr 0.01270
Train [60][1300/3239]	Time 0.227 (1.013)	Data Time 0.001 (0.540)	Loss 2.8557 (2.6512)	Entropy 0.62831 (0.62848)	Top-1 acc 52.734 (60.056)	Top-5 acc 75.391 (81.310)	lr 0.01270
Train [60][1310/3239]	Time 0.331 (1.024)	Data Time 0.001 (0.552)	Loss 2.5800 (2.6510)	Entropy 0.62848 (0.62848)	Top-1 acc 58.594 (60.060)	Top-5 acc 83.203 (81.312)	lr 0.01269
Train [60][1320/3239]	Time 0.251 (1.019)	Data Time 0.001 (0.547)	Loss 2.7261 (2.6505)	Entropy 0.62836 (0.62848)	Top-1 acc 55.078 (60.070)	Top-5 acc 79.688 (81.321)	lr 0.01269
Train [60][1330/3239]	Time 0.242 (1.020)	Data Time 0.001 (0.549)	Loss 2.5965 (2.6510)	Entropy 0.62852 (0.62848)	Top-1 acc 62.109 (60.059)	Top-5 acc 84.766 (81.317)	lr 0.01269
Train [60][1340/3239]	Time 0.238 (1.030)	Data Time 0.001 (0.559)	Loss 2.7746 (2.6510)	Entropy 0.62852 (0.62848)	Top-1 acc 60.938 (60.064)	Top-5 acc 77.734 (81.311)	lr 0.01269
Train [60][1350/3239]	Time 0.233 (1.028)	Data Time 0.001 (0.557)	Loss 2.8198 (2.6511)	Entropy 0.62877 (0.62848)	Top-1 acc 58.203 (60.065)	Top-5 acc 75.781 (81.309)	lr 0.01269
Train [60][1360/3239]	Time 0.243 (1.028)	Data Time 0.002 (0.558)	Loss 2.6366 (2.6514)	Entropy 0.62873 (0.62848)	Top-1 acc 57.812 (60.053)	Top-5 acc 80.469 (81.305)	lr 0.01269
Train [60][1370/3239]	Time 0.251 (1.037)	Data Time 0.001 (0.568)	Loss 2.7268 (2.6515)	Entropy 0.62869 (0.62848)	Top-1 acc 58.594 (60.050)	Top-5 acc 77.734 (81.308)	lr 0.01269
Train [60][1380/3239]	Time 0.405 (1.063)	Data Time 0.006 (0.569)	Loss 2.8054 (2.6515)	Entropy 0.62883 (0.62848)	Top-1 acc 53.125 (60.052)	Top-5 acc 78.125 (81.308)	lr 0.01269
Train [60][1390/3239]	Time 0.234 (1.059)	Data Time 0.002 (0.565)	Loss 2.8057 (2.6519)	Entropy 0.62904 (0.62849)	Top-1 acc 58.594 (60.037)	Top-5 acc 78.125 (81.292)	lr 0.01269
Train [60][1400/3239]	Time 0.345 (1.055)	Data Time 0.004 (0.561)	Loss 2.7826 (2.6521)	Entropy 0.62904 (0.62849)	Top-1 acc 55.859 (60.037)	Top-5 acc 79.297 (81.289)	lr 0.01269
Train [60][1410/3239]	Time 0.233 (1.050)	Data Time 0.001 (0.557)	Loss 2.7590 (2.6519)	Entropy 0.62926 (0.62849)	Top-1 acc 58.594 (60.035)	Top-5 acc 80.078 (81.294)	lr 0.01268
Train [60][1420/3239]	Time 0.241 (1.046)	Data Time 0.001 (0.553)	Loss 2.6358 (2.6519)	Entropy 0.62903 (0.62850)	Top-1 acc 62.500 (60.029)	Top-5 acc 83.203 (81.292)	lr 0.01268
Train [60][1430/3239]	Time 11.639 (1.049)	Data Time 11.379 (0.557)	Loss 2.3122 (2.6519)	Entropy 0.62899 (0.62850)	Top-1 acc 67.188 (60.031)	Top-5 acc 88.672 (81.288)	lr 0.01268
Train [60][1440/3239]	Time 0.283 (1.050)	Data Time 0.001 (0.558)	Loss 2.4296 (2.6519)	Entropy 0.62906 (0.62851)	Top-1 acc 63.672 (60.030)	Top-5 acc 86.328 (81.291)	lr 0.01268
Train [60][1450/3239]	Time 0.241 (1.046)	Data Time 0.001 (0.554)	Loss 2.7035 (2.6517)	Entropy 0.62943 (0.62851)	Top-1 acc 61.719 (60.039)	Top-5 acc 80.078 (81.297)	lr 0.01268
Train [60][1460/3239]	Time 0.232 (1.049)	Data Time 0.001 (0.558)	Loss 2.6795 (2.6517)	Entropy 0.62906 (0.62852)	Top-1 acc 58.984 (60.043)	Top-5 acc 82.031 (81.297)	lr 0.01268
Train [60][1470/3239]	Time 0.232 (1.056)	Data Time 0.001 (0.565)	Loss 2.5741 (2.6516)	Entropy 0.62868 (0.62852)	Top-1 acc 64.062 (60.044)	Top-5 acc 77.734 (81.296)	lr 0.01268
Train [60][1480/3239]	Time 0.257 (1.053)	Data Time 0.002 (0.563)	Loss 2.5080 (2.6515)	Entropy 0.62836 (0.62852)	Top-1 acc 63.281 (60.053)	Top-5 acc 85.156 (81.293)	lr 0.01268
Train [60][1490/3239]	Time 0.249 (1.053)	Data Time 0.001 (0.564)	Loss 2.6486 (2.6517)	Entropy 0.62838 (0.62852)	Top-1 acc 60.156 (60.052)	Top-5 acc 80.078 (81.285)	lr 0.01268
Train [60][1500/3239]	Time 0.236 (1.059)	Data Time 0.001 (0.570)	Loss 2.9687 (2.6522)	Entropy 0.62853 (0.62852)	Top-1 acc 50.391 (60.044)	Top-5 acc 76.562 (81.274)	lr 0.01268
Train [60][1510/3239]	Time 0.238 (1.060)	Data Time 0.001 (0.571)	Loss 2.7162 (2.6519)	Entropy 0.62859 (0.62852)	Top-1 acc 60.547 (60.060)	Top-5 acc 78.906 (81.277)	lr 0.01267
Train [60][1520/3239]	Time 0.238 (1.059)	Data Time 0.001 (0.570)	Loss 2.4332 (2.6517)	Entropy 0.62889 (0.62852)	Top-1 acc 66.016 (60.066)	Top-5 acc 86.719 (81.275)	lr 0.01267
Train [60][1530/3239]	Time 0.233 (1.061)	Data Time 0.001 (0.573)	Loss 2.7195 (2.6518)	Entropy 0.62876 (0.62852)	Top-1 acc 60.156 (60.069)	Top-5 acc 80.078 (81.270)	lr 0.01267
Train [60][1540/3239]	Time 0.233 (1.063)	Data Time 0.001 (0.576)	Loss 2.6783 (2.6518)	Entropy 0.62893 (0.62852)	Top-1 acc 61.328 (60.068)	Top-5 acc 80.078 (81.275)	lr 0.01267
Train [60][1550/3239]	Time 0.243 (1.063)	Data Time 0.001 (0.576)	Loss 2.5443 (2.6517)	Entropy 0.62881 (0.62853)	Top-1 acc 58.594 (60.070)	Top-5 acc 84.375 (81.277)	lr 0.01267
Train [60][1560/3239]	Time 0.346 (1.066)	Data Time 0.001 (0.580)	Loss 2.4702 (2.6515)	Entropy 0.62861 (0.62853)	Top-1 acc 64.453 (60.070)	Top-5 acc 83.203 (81.278)	lr 0.01267
Train [60][1570/3239]	Time 0.231 (1.067)	Data Time 0.001 (0.581)	Loss 2.6585 (2.6515)	Entropy 0.62860 (0.62853)	Top-1 acc 60.547 (60.067)	Top-5 acc 80.469 (81.280)	lr 0.01267
Train [60][1580/3239]	Time 2.515 (1.064)	Data Time 2.256 (0.579)	Loss 2.7937 (2.6517)	Entropy 0.62818 (0.62853)	Top-1 acc 57.422 (60.057)	Top-5 acc 80.859 (81.275)	lr 0.01267
Train [60][1590/3239]	Time 3.619 (1.070)	Data Time 3.377 (0.585)	Loss 2.4974 (2.6518)	Entropy 0.62798 (0.62852)	Top-1 acc 64.844 (60.063)	Top-5 acc 82.422 (81.268)	lr 0.01267
Train [60][1600/3239]	Time 0.244 (1.071)	Data Time 0.001 (0.586)	Loss 2.6097 (2.6519)	Entropy 0.62836 (0.62852)	Top-1 acc 60.938 (60.060)	Top-5 acc 81.641 (81.266)	lr 0.01267
Train [60][1610/3239]	Time 0.235 (1.067)	Data Time 0.001 (0.583)	Loss 2.6206 (2.6519)	Entropy 0.62831 (0.62852)	Top-1 acc 59.766 (60.063)	Top-5 acc 84.375 (81.271)	lr 0.01266
Train [60][1620/3239]	Time 0.232 (1.069)	Data Time 0.001 (0.585)	Loss 2.7853 (2.6518)	Entropy 0.62826 (0.62852)	Top-1 acc 55.859 (60.063)	Top-5 acc 77.734 (81.269)	lr 0.01266
Train [60][1630/3239]	Time 0.336 (1.075)	Data Time 0.001 (0.591)	Loss 2.4683 (2.6519)	Entropy 0.62848 (0.62852)	Top-1 acc 62.891 (60.058)	Top-5 acc 87.500 (81.268)	lr 0.01266
Train [60][1640/3239]	Time 0.238 (1.071)	Data Time 0.001 (0.587)	Loss 2.6990 (2.6516)	Entropy 0.62850 (0.62852)	Top-1 acc 60.938 (60.058)	Top-5 acc 80.078 (81.271)	lr 0.01266
Train [60][1650/3239]	Time 0.239 (1.073)	Data Time 0.001 (0.590)	Loss 2.7793 (2.6516)	Entropy 0.62858 (0.62852)	Top-1 acc 58.203 (60.060)	Top-5 acc 78.516 (81.268)	lr 0.01266
Train [60][1660/3239]	Time 0.309 (1.077)	Data Time 0.041 (0.595)	Loss 2.6774 (2.6513)	Entropy 0.62878 (0.62852)	Top-1 acc 60.938 (60.071)	Top-5 acc 78.516 (81.274)	lr 0.01266
Train [60][1670/3239]	Time 0.252 (1.075)	Data Time 0.001 (0.593)	Loss 2.7683 (2.6515)	Entropy 0.62891 (0.62852)	Top-1 acc 56.250 (60.070)	Top-5 acc 78.906 (81.271)	lr 0.01266
Train [60][1680/3239]	Time 0.227 (1.077)	Data Time 0.001 (0.595)	Loss 2.7178 (2.6513)	Entropy 0.62897 (0.62852)	Top-1 acc 58.594 (60.073)	Top-5 acc 80.859 (81.275)	lr 0.01266
Train [60][1690/3239]	Time 0.226 (1.076)	Data Time 0.001 (0.595)	Loss 2.6930 (2.6517)	Entropy 0.62909 (0.62853)	Top-1 acc 62.109 (60.068)	Top-5 acc 82.422 (81.271)	lr 0.01266
Train [60][1700/3239]	Time 0.234 (1.079)	Data Time 0.001 (0.598)	Loss 2.6233 (2.6517)	Entropy 0.62868 (0.62853)	Top-1 acc 61.328 (60.064)	Top-5 acc 82.031 (81.271)	lr 0.01266
Train [60][1710/3239]	Time 0.244 (1.080)	Data Time 0.001 (0.600)	Loss 2.8293 (2.6519)	Entropy 0.62859 (0.62853)	Top-1 acc 55.078 (60.057)	Top-5 acc 75.391 (81.265)	lr 0.01265
Train [60][1720/3239]	Time 0.326 (1.080)	Data Time 0.001 (0.600)	Loss 2.6602 (2.6519)	Entropy 0.62855 (0.62853)	Top-1 acc 58.984 (60.054)	Top-5 acc 82.812 (81.265)	lr 0.01265
Train [60][1730/3239]	Time 0.270 (1.084)	Data Time 0.001 (0.604)	Loss 2.4733 (2.6518)	Entropy 0.62821 (0.62853)	Top-1 acc 66.406 (60.059)	Top-5 acc 84.766 (81.265)	lr 0.01265
Train [60][1740/3239]	Time 0.260 (1.080)	Data Time 0.003 (0.600)	Loss 2.5149 (2.6517)	Entropy 0.62827 (0.62853)	Top-1 acc 61.328 (60.062)	Top-5 acc 84.375 (81.269)	lr 0.01265
Train [60][1750/3239]	Time 0.236 (1.080)	Data Time 0.001 (0.600)	Loss 2.6222 (2.6517)	Entropy 0.62809 (0.62853)	Top-1 acc 60.156 (60.065)	Top-5 acc 83.594 (81.268)	lr 0.01265
Train [60][1760/3239]	Time 0.254 (1.081)	Data Time 0.001 (0.602)	Loss 2.5635 (2.6516)	Entropy 0.62782 (0.62853)	Top-1 acc 58.594 (60.067)	Top-5 acc 81.250 (81.269)	lr 0.01265
Train [60][1770/3239]	Time 0.243 (1.077)	Data Time 0.001 (0.598)	Loss 2.4663 (2.6515)	Entropy 0.62796 (0.62852)	Top-1 acc 64.453 (60.066)	Top-5 acc 85.547 (81.273)	lr 0.01265
Train [60][1780/3239]	Time 0.231 (1.075)	Data Time 0.001 (0.596)	Loss 2.6021 (2.6517)	Entropy 0.62795 (0.62852)	Top-1 acc 59.375 (60.054)	Top-5 acc 82.812 (81.272)	lr 0.01265
Train [60][1790/3239]	Time 0.346 (1.077)	Data Time 0.002 (0.599)	Loss 2.7632 (2.6518)	Entropy 0.62818 (0.62852)	Top-1 acc 58.203 (60.056)	Top-5 acc 77.734 (81.269)	lr 0.01265
Train [60][1800/3239]	Time 0.250 (1.074)	Data Time 0.001 (0.596)	Loss 2.7089 (2.6524)	Entropy 0.62810 (0.62851)	Top-1 acc 56.250 (60.044)	Top-5 acc 80.469 (81.259)	lr 0.01265
Train [60][1810/3239]	Time 0.251 (1.072)	Data Time 0.001 (0.595)	Loss 2.6442 (2.6525)	Entropy 0.62824 (0.62851)	Top-1 acc 59.766 (60.044)	Top-5 acc 80.078 (81.258)	lr 0.01264
Train [60][1820/3239]	Time 0.252 (1.080)	Data Time 0.001 (0.603)	Loss 2.6187 (2.6524)	Entropy 0.62836 (0.62851)	Top-1 acc 61.328 (60.044)	Top-5 acc 80.859 (81.258)	lr 0.01264
Train [60][1830/3239]	Time 0.222 (1.077)	Data Time 0.001 (0.600)	Loss 2.6891 (2.6530)	Entropy 0.62858 (0.62851)	Top-1 acc 58.984 (60.035)	Top-5 acc 83.594 (81.246)	lr 0.01264
Train [60][1840/3239]	Time 0.245 (1.076)	Data Time 0.001 (0.599)	Loss 2.6142 (2.6527)	Entropy 0.62891 (0.62851)	Top-1 acc 61.719 (60.040)	Top-5 acc 80.469 (81.251)	lr 0.01264
Train [60][1850/3239]	Time 0.283 (1.076)	Data Time 0.001 (0.600)	Loss 2.5779 (2.6527)	Entropy 0.62924 (0.62851)	Top-1 acc 59.766 (60.038)	Top-5 acc 85.547 (81.254)	lr 0.01264
Train [60][1860/3239]	Time 0.237 (1.080)	Data Time 0.001 (0.604)	Loss 2.5882 (2.6526)	Entropy 0.62962 (0.62852)	Top-1 acc 60.547 (60.028)	Top-5 acc 82.812 (81.256)	lr 0.01264
Train [60][1870/3239]	Time 0.254 (1.078)	Data Time 0.001 (0.602)	Loss 2.5943 (2.6524)	Entropy 0.62944 (0.62852)	Top-1 acc 60.938 (60.028)	Top-5 acc 82.422 (81.264)	lr 0.01264
Train [60][1880/3239]	Time 0.275 (1.079)	Data Time 0.001 (0.604)	Loss 2.4894 (2.6525)	Entropy 0.62944 (0.62853)	Top-1 acc 63.672 (60.029)	Top-5 acc 83.594 (81.265)	lr 0.01264
Train [60][1890/3239]	Time 0.250 (1.085)	Data Time 0.001 (0.610)	Loss 2.7907 (2.6524)	Entropy 0.62961 (0.62853)	Top-1 acc 56.250 (60.029)	Top-5 acc 79.297 (81.268)	lr 0.01264
Train [60][1900/3239]	Time 0.244 (1.081)	Data Time 0.001 (0.606)	Loss 2.8559 (2.6525)	Entropy 0.62975 (0.62854)	Top-1 acc 53.125 (60.023)	Top-5 acc 80.078 (81.268)	lr 0.01264
Train [60][1910/3239]	Time 0.264 (1.083)	Data Time 0.001 (0.609)	Loss 2.5907 (2.6528)	Entropy 0.62983 (0.62855)	Top-1 acc 62.500 (60.011)	Top-5 acc 82.812 (81.266)	lr 0.01263
Train [60][1920/3239]	Time 0.240 (1.085)	Data Time 0.001 (0.611)	Loss 2.7016 (2.6528)	Entropy 0.63004 (0.62855)	Top-1 acc 58.203 (60.017)	Top-5 acc 80.859 (81.267)	lr 0.01263
Train [60][1930/3239]	Time 0.252 (1.081)	Data Time 0.001 (0.607)	Loss 2.4380 (2.6528)	Entropy 0.62998 (0.62856)	Top-1 acc 67.969 (60.013)	Top-5 acc 85.938 (81.269)	lr 0.01263
Train [60][1940/3239]	Time 0.248 (1.078)	Data Time 0.001 (0.604)	Loss 2.5904 (2.6528)	Entropy 0.62984 (0.62857)	Top-1 acc 60.156 (60.013)	Top-5 acc 83.594 (81.268)	lr 0.01263
Train [60][1950/3239]	Time 0.346 (1.081)	Data Time 0.001 (0.607)	Loss 2.7019 (2.6527)	Entropy 0.63018 (0.62858)	Top-1 acc 58.203 (60.017)	Top-5 acc 81.250 (81.270)	lr 0.01263
Train [60][1960/3239]	Time 0.286 (1.077)	Data Time 0.001 (0.604)	Loss 2.6946 (2.6526)	Entropy 0.63026 (0.62858)	Top-1 acc 55.469 (60.019)	Top-5 acc 82.422 (81.275)	lr 0.01263
Train [60][1970/3239]	Time 0.238 (1.074)	Data Time 0.001 (0.601)	Loss 2.5140 (2.6525)	Entropy 0.63015 (0.62859)	Top-1 acc 60.938 (60.018)	Top-5 acc 82.422 (81.278)	lr 0.01263
Train [60][1980/3239]	Time 0.250 (1.076)	Data Time 0.001 (0.603)	Loss 2.5883 (2.6525)	Entropy 0.63013 (0.62860)	Top-1 acc 62.109 (60.017)	Top-5 acc 82.031 (81.275)	lr 0.01263
Train [60][1990/3239]	Time 0.238 (1.073)	Data Time 0.001 (0.600)	Loss 2.7134 (2.6527)	Entropy 0.63007 (0.62861)	Top-1 acc 58.984 (60.019)	Top-5 acc 79.688 (81.272)	lr 0.01263
Train [60][2000/3239]	Time 0.243 (1.070)	Data Time 0.001 (0.597)	Loss 2.7416 (2.6528)	Entropy 0.63003 (0.62861)	Top-1 acc 55.469 (60.018)	Top-5 acc 80.078 (81.267)	lr 0.01263
Train [60][2010/3239]	Time 0.242 (1.068)	Data Time 0.001 (0.596)	Loss 2.7146 (2.6529)	Entropy 0.63018 (0.62862)	Top-1 acc 57.812 (60.011)	Top-5 acc 81.250 (81.264)	lr 0.01262
Train [60][2020/3239]	Time 0.393 (1.069)	Data Time 0.001 (0.597)	Loss 2.7700 (2.6530)	Entropy 0.63020 (0.62863)	Top-1 acc 58.594 (60.008)	Top-5 acc 78.906 (81.265)	lr 0.01262
Train [60][2030/3239]	Time 0.254 (1.066)	Data Time 0.001 (0.594)	Loss 2.4905 (2.6530)	Entropy 0.62990 (0.62864)	Top-1 acc 65.234 (60.012)	Top-5 acc 81.641 (81.262)	lr 0.01262
Train [60][2040/3239]	Time 0.491 (1.079)	Data Time 0.002 (0.591)	Loss 2.4719 (2.6532)	Entropy 0.63018 (0.62864)	Top-1 acc 64.062 (60.008)	Top-5 acc 85.938 (81.258)	lr 0.01262
Train [60][2050/3239]	Time 0.251 (1.076)	Data Time 0.002 (0.588)	Loss 2.4140 (2.6532)	Entropy 0.63025 (0.62865)	Top-1 acc 61.328 (60.007)	Top-5 acc 85.938 (81.260)	lr 0.01262
Train [60][2060/3239]	Time 0.232 (1.074)	Data Time 0.001 (0.585)	Loss 2.5089 (2.6532)	Entropy 0.63023 (0.62866)	Top-1 acc 66.016 (60.011)	Top-5 acc 83.984 (81.263)	lr 0.01262
Train [60][2070/3239]	Time 0.230 (1.070)	Data Time 0.001 (0.582)	Loss 2.6277 (2.6533)	Entropy 0.63025 (0.62867)	Top-1 acc 58.984 (60.010)	Top-5 acc 82.422 (81.262)	lr 0.01262
Train [60][2080/3239]	Time 0.247 (1.067)	Data Time 0.002 (0.580)	Loss 2.8525 (2.6535)	Entropy 0.63047 (0.62867)	Top-1 acc 57.422 (60.007)	Top-5 acc 79.688 (81.260)	lr 0.01262
Train [60][2090/3239]	Time 0.261 (1.064)	Data Time 0.001 (0.577)	Loss 2.6862 (2.6536)	Entropy 0.63048 (0.62868)	Top-1 acc 55.078 (60.003)	Top-5 acc 81.250 (81.255)	lr 0.01262
Train [60][2100/3239]	Time 0.240 (1.064)	Data Time 0.001 (0.577)	Loss 2.5776 (2.6536)	Entropy 0.63058 (0.62869)	Top-1 acc 60.547 (60.003)	Top-5 acc 82.812 (81.259)	lr 0.01262
Train [60][2110/3239]	Time 2.897 (1.065)	Data Time 2.450 (0.579)	Loss 2.8235 (2.6540)	Entropy 0.62968 (0.62870)	Top-1 acc 53.516 (59.992)	Top-5 acc 80.078 (81.254)	lr 0.01261
Train [60][2120/3239]	Time 0.251 (1.062)	Data Time 0.001 (0.576)	Loss 2.5772 (2.6538)	Entropy 0.62972 (0.62870)	Top-1 acc 61.719 (59.997)	Top-5 acc 83.594 (81.257)	lr 0.01261
Train [60][2130/3239]	Time 0.260 (1.059)	Data Time 0.001 (0.573)	Loss 2.7029 (2.6538)	Entropy 0.62999 (0.62871)	Top-1 acc 61.719 (60.003)	Top-5 acc 80.469 (81.255)	lr 0.01261
Train [60][2140/3239]	Time 0.238 (1.069)	Data Time 0.001 (0.583)	Loss 2.7164 (2.6539)	Entropy 0.63010 (0.62871)	Top-1 acc 59.375 (60.002)	Top-5 acc 79.688 (81.253)	lr 0.01261
Train [60][2150/3239]	Time 0.274 (1.066)	Data Time 0.001 (0.580)	Loss 2.5691 (2.6542)	Entropy 0.63038 (0.62872)	Top-1 acc 61.719 (59.993)	Top-5 acc 83.594 (81.251)	lr 0.01261
Train [60][2160/3239]	Time 0.242 (1.063)	Data Time 0.001 (0.578)	Loss 2.6230 (2.6543)	Entropy 0.63018 (0.62873)	Top-1 acc 59.375 (59.990)	Top-5 acc 82.812 (81.250)	lr 0.01261
Train [60][2170/3239]	Time 0.234 (1.073)	Data Time 0.001 (0.588)	Loss 2.5964 (2.6545)	Entropy 0.62974 (0.62873)	Top-1 acc 61.328 (59.987)	Top-5 acc 82.031 (81.243)	lr 0.01261
Train [60][2180/3239]	Time 0.281 (1.070)	Data Time 0.001 (0.585)	Loss 2.5682 (2.6545)	Entropy 0.62996 (0.62874)	Top-1 acc 59.766 (59.988)	Top-5 acc 82.422 (81.242)	lr 0.01261
Train [60][2190/3239]	Time 0.243 (1.070)	Data Time 0.001 (0.586)	Loss 2.5497 (2.6547)	Entropy 0.62993 (0.62875)	Top-1 acc 61.328 (59.985)	Top-5 acc 79.688 (81.235)	lr 0.01261
Train [60][2200/3239]	Time 10.979 (1.078)	Data Time 10.655 (0.593)	Loss 2.6537 (2.6545)	Entropy 0.62987 (0.62875)	Top-1 acc 61.328 (59.990)	Top-5 acc 79.688 (81.239)	lr 0.01261
Train [60][2210/3239]	Time 0.279 (1.075)	Data Time 0.001 (0.591)	Loss 2.6459 (2.6545)	Entropy 0.62980 (0.62876)	Top-1 acc 60.938 (59.986)	Top-5 acc 82.031 (81.239)	lr 0.01260
Train [60][2220/3239]	Time 0.242 (1.075)	Data Time 0.001 (0.591)	Loss 2.7106 (2.6546)	Entropy 0.62945 (0.62876)	Top-1 acc 57.422 (59.982)	Top-5 acc 78.906 (81.235)	lr 0.01260
Train [60][2230/3239]	Time 1.854 (1.079)	Data Time 1.617 (0.595)	Loss 2.7406 (2.6547)	Entropy 0.62933 (0.62876)	Top-1 acc 61.719 (59.981)	Top-5 acc 78.516 (81.232)	lr 0.01260
Train [60][2240/3239]	Time 0.250 (1.078)	Data Time 0.001 (0.595)	Loss 2.8653 (2.6547)	Entropy 0.62941 (0.62877)	Top-1 acc 56.641 (59.982)	Top-5 acc 76.172 (81.227)	lr 0.01260
Train [60][2250/3239]	Time 0.595 (1.076)	Data Time 0.366 (0.593)	Loss 2.7064 (2.6548)	Entropy 0.62924 (0.62877)	Top-1 acc 60.156 (59.980)	Top-5 acc 79.688 (81.223)	lr 0.01260
Train [60][2260/3239]	Time 6.775 (1.083)	Data Time 6.524 (0.600)	Loss 2.5303 (2.6548)	Entropy 0.62906 (0.62877)	Top-1 acc 64.844 (59.977)	Top-5 acc 84.766 (81.224)	lr 0.01260
Train [60][2270/3239]	Time 0.357 (1.083)	Data Time 0.001 (0.600)	Loss 2.7878 (2.6547)	Entropy 0.62883 (0.62877)	Top-1 acc 58.984 (59.979)	Top-5 acc 76.953 (81.224)	lr 0.01260
Train [60][2280/3239]	Time 0.269 (1.080)	Data Time 0.001 (0.598)	Loss 2.8754 (2.6548)	Entropy 0.62881 (0.62877)	Top-1 acc 55.469 (59.979)	Top-5 acc 78.906 (81.225)	lr 0.01260
Train [60][2290/3239]	Time 0.250 (1.080)	Data Time 0.001 (0.598)	Loss 2.7431 (2.6549)	Entropy 0.62805 (0.62877)	Top-1 acc 57.812 (59.980)	Top-5 acc 78.906 (81.222)	lr 0.01260
Train [60][2300/3239]	Time 0.231 (1.087)	Data Time 0.001 (0.606)	Loss 2.5076 (2.6549)	Entropy 0.62799 (0.62877)	Top-1 acc 62.109 (59.982)	Top-5 acc 83.203 (81.218)	lr 0.01259
Train [60][2310/3239]	Time 0.247 (1.085)	Data Time 0.001 (0.603)	Loss 2.7439 (2.6548)	Entropy 0.62748 (0.62876)	Top-1 acc 60.547 (59.986)	Top-5 acc 79.297 (81.219)	lr 0.01259
Train [60][2320/3239]	Time 0.237 (1.085)	Data Time 0.001 (0.604)	Loss 2.7203 (2.6548)	Entropy 0.62758 (0.62876)	Top-1 acc 58.984 (59.982)	Top-5 acc 80.859 (81.217)	lr 0.01259
Train [60][2330/3239]	Time 0.233 (1.093)	Data Time 0.001 (0.612)	Loss 2.6561 (2.6547)	Entropy 0.62767 (0.62875)	Top-1 acc 55.859 (59.984)	Top-5 acc 79.688 (81.219)	lr 0.01259
Train [60][2340/3239]	Time 0.322 (1.091)	Data Time 0.001 (0.610)	Loss 2.7072 (2.6548)	Entropy 0.62738 (0.62875)	Top-1 acc 57.812 (59.979)	Top-5 acc 80.078 (81.216)	lr 0.01259
Train [60][2350/3239]	Time 0.239 (1.091)	Data Time 0.001 (0.611)	Loss 2.6150 (2.6545)	Entropy 0.62768 (0.62874)	Top-1 acc 60.547 (59.988)	Top-5 acc 81.641 (81.221)	lr 0.01259
Train [60][2360/3239]	Time 2.338 (1.097)	Data Time 2.076 (0.617)	Loss 2.6009 (2.6545)	Entropy 0.62775 (0.62874)	Top-1 acc 61.719 (59.990)	Top-5 acc 81.641 (81.217)	lr 0.01259
Train [60][2370/3239]	Time 0.248 (1.095)	Data Time 0.001 (0.615)	Loss 2.5926 (2.6544)	Entropy 0.62797 (0.62873)	Top-1 acc 58.984 (59.992)	Top-5 acc 81.641 (81.217)	lr 0.01259
Train [60][2380/3239]	Time 0.251 (1.095)	Data Time 0.001 (0.615)	Loss 2.7761 (2.6546)	Entropy 0.62782 (0.62873)	Top-1 acc 58.984 (59.986)	Top-5 acc 79.297 (81.215)	lr 0.01259
Train [60][2390/3239]	Time 0.235 (1.101)	Data Time 0.001 (0.621)	Loss 2.7600 (2.6545)	Entropy 0.62818 (0.62873)	Top-1 acc 58.594 (59.989)	Top-5 acc 78.125 (81.217)	lr 0.01259
Train [60][2400/3239]	Time 0.225 (1.100)	Data Time 0.001 (0.621)	Loss 2.6886 (2.6544)	Entropy 0.62817 (0.62872)	Top-1 acc 61.719 (59.994)	Top-5 acc 80.078 (81.217)	lr 0.01258
Train [60][2410/3239]	Time 0.236 (1.101)	Data Time 0.001 (0.622)	Loss 2.8358 (2.6546)	Entropy 0.62826 (0.62872)	Top-1 acc 57.031 (59.985)	Top-5 acc 78.516 (81.214)	lr 0.01258
Train [60][2420/3239]	Time 7.676 (1.104)	Data Time 7.433 (0.626)	Loss 2.5428 (2.6546)	Entropy 0.62846 (0.62872)	Top-1 acc 61.328 (59.982)	Top-5 acc 83.984 (81.215)	lr 0.01258
Train [60][2430/3239]	Time 0.608 (1.104)	Data Time 0.258 (0.625)	Loss 2.6913 (2.6547)	Entropy 0.62851 (0.62872)	Top-1 acc 57.422 (59.976)	Top-5 acc 80.469 (81.207)	lr 0.01258
Train [60][2440/3239]	Time 0.226 (1.102)	Data Time 0.001 (0.624)	Loss 2.5291 (2.6549)	Entropy 0.62867 (0.62872)	Top-1 acc 60.156 (59.969)	Top-5 acc 83.594 (81.207)	lr 0.01258
Train [60][2450/3239]	Time 0.228 (1.104)	Data Time 0.001 (0.626)	Loss 2.9614 (2.6551)	Entropy 0.62848 (0.62872)	Top-1 acc 55.078 (59.966)	Top-5 acc 78.125 (81.204)	lr 0.01258
Train [60][2460/3239]	Time 0.241 (1.110)	Data Time 0.001 (0.632)	Loss 2.6923 (2.6552)	Entropy 0.62812 (0.62872)	Top-1 acc 58.203 (59.961)	Top-5 acc 82.812 (81.205)	lr 0.01258
Train [60][2470/3239]	Time 0.242 (1.108)	Data Time 0.001 (0.630)	Loss 2.7271 (2.6554)	Entropy 0.62816 (0.62871)	Top-1 acc 56.641 (59.955)	Top-5 acc 81.641 (81.201)	lr 0.01258
Train [60][2480/3239]	Time 0.253 (1.108)	Data Time 0.001 (0.631)	Loss 2.4079 (2.6552)	Entropy 0.62835 (0.62871)	Top-1 acc 66.406 (59.963)	Top-5 acc 84.766 (81.204)	lr 0.01258
Train [60][2490/3239]	Time 0.280 (1.112)	Data Time 0.001 (0.635)	Loss 2.7825 (2.6554)	Entropy 0.62796 (0.62871)	Top-1 acc 58.594 (59.957)	Top-5 acc 78.906 (81.198)	lr 0.01258
Train [60][2500/3239]	Time 1.546 (1.110)	Data Time 1.152 (0.633)	Loss 2.5378 (2.6552)	Entropy 0.62787 (0.62871)	Top-1 acc 63.672 (59.959)	Top-5 acc 83.594 (81.205)	lr 0.01257
Train [60][2510/3239]	Time 0.237 (1.110)	Data Time 0.001 (0.633)	Loss 2.7153 (2.6550)	Entropy 0.62777 (0.62870)	Top-1 acc 60.156 (59.965)	Top-5 acc 79.297 (81.207)	lr 0.01257
Train [60][2520/3239]	Time 4.753 (1.113)	Data Time 4.478 (0.636)	Loss 2.7259 (2.6551)	Entropy 0.62779 (0.62870)	Top-1 acc 62.109 (59.965)	Top-5 acc 80.859 (81.205)	lr 0.01257
Train [60][2530/3239]	Time 0.234 (1.111)	Data Time 0.001 (0.635)	Loss 2.7204 (2.6550)	Entropy 0.62793 (0.62870)	Top-1 acc 61.719 (59.967)	Top-5 acc 80.859 (81.207)	lr 0.01257
Train [60][2540/3239]	Time 0.273 (1.110)	Data Time 0.001 (0.634)	Loss 2.5060 (2.6550)	Entropy 0.62827 (0.62869)	Top-1 acc 60.156 (59.960)	Top-5 acc 84.766 (81.208)	lr 0.01257
Train [60][2550/3239]	Time 0.259 (1.113)	Data Time 0.001 (0.637)	Loss 2.5628 (2.6548)	Entropy 0.62836 (0.62869)	Top-1 acc 60.547 (59.961)	Top-5 acc 80.859 (81.213)	lr 0.01257
Train [60][2560/3239]	Time 0.238 (1.113)	Data Time 0.001 (0.637)	Loss 2.5743 (2.6547)	Entropy 0.62818 (0.62869)	Top-1 acc 62.500 (59.966)	Top-5 acc 82.812 (81.214)	lr 0.01257
Train [60][2570/3239]	Time 0.247 (1.111)	Data Time 0.001 (0.636)	Loss 2.6473 (2.6546)	Entropy 0.62829 (0.62869)	Top-1 acc 60.547 (59.970)	Top-5 acc 80.469 (81.214)	lr 0.01257
Train [60][2580/3239]	Time 0.378 (1.114)	Data Time 0.113 (0.639)	Loss 2.6859 (2.6545)	Entropy 0.62802 (0.62869)	Top-1 acc 60.547 (59.970)	Top-5 acc 81.641 (81.216)	lr 0.01257
Train [60][2590/3239]	Time 0.290 (1.115)	Data Time 0.002 (0.640)	Loss 2.7458 (2.6543)	Entropy 0.62779 (0.62868)	Top-1 acc 57.422 (59.975)	Top-5 acc 77.734 (81.218)	lr 0.01257
Train [60][2600/3239]	Time 0.244 (1.112)	Data Time 0.001 (0.637)	Loss 2.5709 (2.6542)	Entropy 0.62810 (0.62868)	Top-1 acc 58.594 (59.974)	Top-5 acc 86.328 (81.220)	lr 0.01256
Train [60][2610/3239]	Time 0.249 (1.113)	Data Time 0.001 (0.638)	Loss 2.6177 (2.6540)	Entropy 0.62806 (0.62868)	Top-1 acc 62.109 (59.977)	Top-5 acc 82.031 (81.225)	lr 0.01256
Train [60][2620/3239]	Time 0.254 (1.116)	Data Time 0.001 (0.641)	Loss 2.5894 (2.6540)	Entropy 0.62808 (0.62868)	Top-1 acc 58.984 (59.973)	Top-5 acc 82.031 (81.225)	lr 0.01256
Train [60][2630/3239]	Time 0.248 (1.114)	Data Time 0.002 (0.640)	Loss 2.8471 (2.6542)	Entropy 0.62819 (0.62867)	Top-1 acc 57.422 (59.965)	Top-5 acc 76.953 (81.221)	lr 0.01256
Train [60][2640/3239]	Time 0.226 (1.116)	Data Time 0.001 (0.641)	Loss 2.6653 (2.6543)	Entropy 0.62816 (0.62867)	Top-1 acc 61.719 (59.964)	Top-5 acc 81.641 (81.220)	lr 0.01256
Train [60][2650/3239]	Time 0.232 (1.119)	Data Time 0.001 (0.644)	Loss 2.7233 (2.6543)	Entropy 0.62826 (0.62867)	Top-1 acc 56.641 (59.963)	Top-5 acc 80.078 (81.219)	lr 0.01256
Train [60][2660/3239]	Time 0.325 (1.116)	Data Time 0.001 (0.642)	Loss 2.4811 (2.6543)	Entropy 0.62834 (0.62867)	Top-1 acc 62.109 (59.964)	Top-5 acc 85.938 (81.221)	lr 0.01256
Train [60][2670/3239]	Time 0.241 (1.118)	Data Time 0.001 (0.644)	Loss 2.5452 (2.6546)	Entropy 0.62810 (0.62867)	Top-1 acc 64.844 (59.959)	Top-5 acc 82.812 (81.215)	lr 0.01256
Train [60][2680/3239]	Time 11.756 (1.120)	Data Time 11.498 (0.647)	Loss 2.6863 (2.6547)	Entropy 0.62794 (0.62866)	Top-1 acc 59.766 (59.959)	Top-5 acc 80.078 (81.209)	lr 0.01256
Train [60][2690/3239]	Time 0.423 (1.132)	Data Time 0.005 (0.645)	Loss 2.8252 (2.6547)	Entropy 0.62803 (0.62866)	Top-1 acc 57.812 (59.961)	Top-5 acc 78.516 (81.210)	lr 0.01256
Train [60][2700/3239]	Time 0.247 (1.129)	Data Time 0.002 (0.643)	Loss 2.6765 (2.6546)	Entropy 0.62809 (0.62866)	Top-1 acc 61.719 (59.967)	Top-5 acc 79.297 (81.216)	lr 0.01255
Train [60][2710/3239]	Time 0.244 (1.127)	Data Time 0.001 (0.640)	Loss 2.8309 (2.6548)	Entropy 0.62828 (0.62866)	Top-1 acc 53.906 (59.965)	Top-5 acc 76.953 (81.208)	lr 0.01255
Train [60][2720/3239]	Time 0.248 (1.124)	Data Time 0.001 (0.638)	Loss 2.7308 (2.6547)	Entropy 0.62841 (0.62866)	Top-1 acc 57.812 (59.964)	Top-5 acc 80.859 (81.211)	lr 0.01255
Train [60][2730/3239]	Time 0.241 (1.122)	Data Time 0.001 (0.636)	Loss 2.6208 (2.6548)	Entropy 0.62846 (0.62866)	Top-1 acc 58.594 (59.961)	Top-5 acc 82.422 (81.207)	lr 0.01255
Train [60][2740/3239]	Time 0.243 (1.120)	Data Time 0.001 (0.635)	Loss 2.4359 (2.6548)	Entropy 0.62857 (0.62866)	Top-1 acc 64.453 (59.963)	Top-5 acc 83.203 (81.208)	lr 0.01255
Train [60][2750/3239]	Time 0.326 (1.122)	Data Time 0.001 (0.636)	Loss 2.7037 (2.6550)	Entropy 0.62837 (0.62865)	Top-1 acc 57.812 (59.958)	Top-5 acc 82.031 (81.203)	lr 0.01255
Train [60][2760/3239]	Time 0.272 (1.120)	Data Time 0.001 (0.634)	Loss 2.4077 (2.6551)	Entropy 0.62861 (0.62865)	Top-1 acc 65.625 (59.955)	Top-5 acc 85.156 (81.200)	lr 0.01255
Train [60][2770/3239]	Time 0.253 (1.120)	Data Time 0.001 (0.634)	Loss 2.5485 (2.6550)	Entropy 0.62888 (0.62865)	Top-1 acc 62.891 (59.952)	Top-5 acc 82.812 (81.202)	lr 0.01255
Train [60][2780/3239]	Time 0.283 (1.124)	Data Time 0.001 (0.638)	Loss 2.6031 (2.6551)	Entropy 0.62871 (0.62866)	Top-1 acc 61.328 (59.950)	Top-5 acc 80.469 (81.202)	lr 0.01255
Train [60][2790/3239]	Time 0.236 (1.121)	Data Time 0.001 (0.636)	Loss 2.6423 (2.6551)	Entropy 0.62885 (0.62866)	Top-1 acc 61.328 (59.950)	Top-5 acc 79.688 (81.200)	lr 0.01255
Train [60][2800/3239]	Time 0.228 (1.122)	Data Time 0.001 (0.637)	Loss 2.4423 (2.6550)	Entropy 0.62890 (0.62866)	Top-1 acc 65.625 (59.953)	Top-5 acc 85.547 (81.201)	lr 0.01254
Train [60][2810/3239]	Time 0.237 (1.126)	Data Time 0.001 (0.641)	Loss 2.6881 (2.6551)	Entropy 0.62903 (0.62866)	Top-1 acc 59.766 (59.952)	Top-5 acc 80.078 (81.200)	lr 0.01254
Train [60][2820/3239]	Time 0.354 (1.123)	Data Time 0.001 (0.639)	Loss 2.6202 (2.6555)	Entropy 0.62908 (0.62866)	Top-1 acc 58.984 (59.944)	Top-5 acc 83.594 (81.194)	lr 0.01254
Train [60][2830/3239]	Time 0.240 (1.122)	Data Time 0.001 (0.638)	Loss 2.5245 (2.6554)	Entropy 0.62943 (0.62866)	Top-1 acc 60.547 (59.946)	Top-5 acc 84.766 (81.196)	lr 0.01254
Train [60][2840/3239]	Time 0.229 (1.126)	Data Time 0.001 (0.642)	Loss 2.7874 (2.6555)	Entropy 0.62916 (0.62866)	Top-1 acc 55.469 (59.941)	Top-5 acc 80.859 (81.193)	lr 0.01254
Train [60][2850/3239]	Time 0.282 (1.125)	Data Time 0.001 (0.642)	Loss 2.4881 (2.6556)	Entropy 0.62924 (0.62866)	Top-1 acc 62.109 (59.939)	Top-5 acc 83.203 (81.195)	lr 0.01254
Train [60][2860/3239]	Time 2.707 (1.124)	Data Time 2.453 (0.640)	Loss 2.5962 (2.6557)	Entropy 0.62904 (0.62867)	Top-1 acc 59.766 (59.941)	Top-5 acc 83.984 (81.191)	lr 0.01254
Train [60][2870/3239]	Time 0.240 (1.128)	Data Time 0.001 (0.645)	Loss 2.6871 (2.6557)	Entropy 0.62889 (0.62867)	Top-1 acc 56.250 (59.936)	Top-5 acc 82.031 (81.190)	lr 0.01254
Train [60][2880/3239]	Time 0.274 (1.128)	Data Time 0.001 (0.644)	Loss 2.6768 (2.6557)	Entropy 0.62879 (0.62867)	Top-1 acc 59.375 (59.935)	Top-5 acc 80.078 (81.189)	lr 0.01254
Train [60][2890/3239]	Time 0.322 (1.125)	Data Time 0.001 (0.642)	Loss 2.6727 (2.6557)	Entropy 0.62870 (0.62867)	Top-1 acc 59.375 (59.932)	Top-5 acc 77.734 (81.188)	lr 0.01254
Train [60][2900/3239]	Time 0.234 (1.130)	Data Time 0.001 (0.647)	Loss 2.5852 (2.6558)	Entropy 0.62875 (0.62867)	Top-1 acc 62.500 (59.931)	Top-5 acc 81.641 (81.184)	lr 0.01253
Train [60][2910/3239]	Time 0.239 (1.128)	Data Time 0.001 (0.645)	Loss 2.8453 (2.6559)	Entropy 0.62873 (0.62867)	Top-1 acc 57.031 (59.929)	Top-5 acc 78.125 (81.185)	lr 0.01253
Train [60][2920/3239]	Time 0.247 (1.126)	Data Time 0.001 (0.643)	Loss 2.7147 (2.6559)	Entropy 0.62890 (0.62867)	Top-1 acc 62.109 (59.931)	Top-5 acc 80.859 (81.185)	lr 0.01253
Train [60][2930/3239]	Time 0.236 (1.126)	Data Time 0.001 (0.644)	Loss 2.4751 (2.6559)	Entropy 0.62891 (0.62867)	Top-1 acc 64.844 (59.932)	Top-5 acc 84.766 (81.184)	lr 0.01253
Train [60][2940/3239]	Time 0.238 (1.131)	Data Time 0.001 (0.648)	Loss 2.7888 (2.6560)	Entropy 0.62853 (0.62867)	Top-1 acc 60.156 (59.934)	Top-5 acc 78.516 (81.184)	lr 0.01253
Train [60][2950/3239]	Time 0.236 (1.128)	Data Time 0.001 (0.646)	Loss 2.5754 (2.6563)	Entropy 0.62861 (0.62867)	Top-1 acc 60.156 (59.928)	Top-5 acc 83.594 (81.182)	lr 0.01253
Train [60][2960/3239]	Time 0.235 (1.127)	Data Time 0.001 (0.645)	Loss 2.6290 (2.6563)	Entropy 0.62863 (0.62867)	Top-1 acc 60.938 (59.927)	Top-5 acc 82.031 (81.183)	lr 0.01253
Train [60][2970/3239]	Time 0.236 (1.131)	Data Time 0.001 (0.649)	Loss 2.7633 (2.6561)	Entropy 0.62859 (0.62867)	Top-1 acc 57.031 (59.930)	Top-5 acc 80.078 (81.187)	lr 0.01253
Train [60][2980/3239]	Time 0.391 (1.129)	Data Time 0.001 (0.647)	Loss 2.4979 (2.6560)	Entropy 0.62828 (0.62867)	Top-1 acc 62.500 (59.934)	Top-5 acc 83.594 (81.192)	lr 0.01253
Train [60][2990/3239]	Time 0.237 (1.129)	Data Time 0.001 (0.648)	Loss 2.7241 (2.6561)	Entropy 0.62844 (0.62867)	Top-1 acc 58.594 (59.932)	Top-5 acc 80.859 (81.190)	lr 0.01253
Train [60][3000/3239]	Time 0.222 (1.130)	Data Time 0.001 (0.649)	Loss 2.9324 (2.6560)	Entropy 0.62853 (0.62867)	Top-1 acc 53.906 (59.933)	Top-5 acc 74.219 (81.193)	lr 0.01252
Train [60][3010/3239]	Time 0.249 (1.131)	Data Time 0.001 (0.650)	Loss 2.7408 (2.6558)	Entropy 0.62864 (0.62867)	Top-1 acc 57.812 (59.938)	Top-5 acc 76.953 (81.197)	lr 0.01252
Train [60][3020/3239]	Time 3.618 (1.130)	Data Time 3.316 (0.649)	Loss 2.7893 (2.6558)	Entropy 0.62860 (0.62867)	Top-1 acc 57.422 (59.940)	Top-5 acc 80.078 (81.194)	lr 0.01252
Train [60][3030/3239]	Time 0.240 (1.132)	Data Time 0.001 (0.651)	Loss 2.7016 (2.6559)	Entropy 0.62872 (0.62867)	Top-1 acc 63.672 (59.936)	Top-5 acc 80.469 (81.193)	lr 0.01252
Train [60][3040/3239]	Time 0.243 (1.133)	Data Time 0.001 (0.652)	Loss 2.7960 (2.6558)	Entropy 0.62854 (0.62867)	Top-1 acc 61.328 (59.941)	Top-5 acc 79.297 (81.195)	lr 0.01252
Train [60][3050/3239]	Time 0.322 (1.130)	Data Time 0.001 (0.650)	Loss 2.5818 (2.6557)	Entropy 0.62868 (0.62867)	Top-1 acc 60.938 (59.944)	Top-5 acc 83.203 (81.198)	lr 0.01252
Train [60][3060/3239]	Time 0.248 (1.132)	Data Time 0.001 (0.652)	Loss 2.6252 (2.6557)	Entropy 0.62874 (0.62867)	Top-1 acc 58.984 (59.940)	Top-5 acc 82.422 (81.198)	lr 0.01252
Train [60][3070/3239]	Time 0.235 (1.134)	Data Time 0.001 (0.654)	Loss 2.5435 (2.6556)	Entropy 0.62859 (0.62867)	Top-1 acc 62.500 (59.942)	Top-5 acc 82.812 (81.201)	lr 0.01252
Train [60][3080/3239]	Time 0.237 (1.132)	Data Time 0.001 (0.653)	Loss 2.5894 (2.6557)	Entropy 0.62873 (0.62867)	Top-1 acc 60.156 (59.941)	Top-5 acc 80.469 (81.200)	lr 0.01252
Train [60][3090/3239]	Time 0.237 (1.132)	Data Time 0.001 (0.653)	Loss 2.6023 (2.6559)	Entropy 0.62866 (0.62867)	Top-1 acc 60.547 (59.937)	Top-5 acc 82.031 (81.198)	lr 0.01252
Train [60][3100/3239]	Time 0.241 (1.136)	Data Time 0.001 (0.657)	Loss 2.4981 (2.6557)	Entropy 0.62901 (0.62867)	Top-1 acc 62.109 (59.941)	Top-5 acc 85.938 (81.204)	lr 0.01251
Train [60][3110/3239]	Time 0.235 (1.134)	Data Time 0.001 (0.655)	Loss 2.4086 (2.6555)	Entropy 0.62882 (0.62867)	Top-1 acc 66.016 (59.946)	Top-5 acc 84.375 (81.210)	lr 0.01251
Train [60][3120/3239]	Time 0.254 (1.134)	Data Time 0.001 (0.655)	Loss 2.7430 (2.6556)	Entropy 0.62853 (0.62867)	Top-1 acc 54.297 (59.944)	Top-5 acc 82.031 (81.209)	lr 0.01251
Train [60][3130/3239]	Time 0.244 (1.139)	Data Time 0.001 (0.660)	Loss 2.7352 (2.6556)	Entropy 0.62882 (0.62867)	Top-1 acc 59.766 (59.945)	Top-5 acc 79.688 (81.210)	lr 0.01251
Train [60][3140/3239]	Time 0.256 (1.136)	Data Time 0.001 (0.658)	Loss 2.6187 (2.6558)	Entropy 0.62898 (0.62867)	Top-1 acc 60.938 (59.943)	Top-5 acc 81.250 (81.207)	lr 0.01251
Train [60][3150/3239]	Time 3.357 (1.136)	Data Time 3.105 (0.658)	Loss 2.6665 (2.6560)	Entropy 0.62891 (0.62867)	Top-1 acc 55.469 (59.938)	Top-5 acc 81.641 (81.204)	lr 0.01251
Train [60][3160/3239]	Time 0.225 (1.135)	Data Time 0.001 (0.657)	Loss 2.5923 (2.6560)	Entropy 0.62910 (0.62867)	Top-1 acc 59.766 (59.936)	Top-5 acc 81.250 (81.205)	lr 0.01251
Train [60][3170/3239]	Time 0.239 (1.138)	Data Time 0.001 (0.661)	Loss 2.6446 (2.6562)	Entropy 0.62939 (0.62867)	Top-1 acc 58.984 (59.932)	Top-5 acc 80.078 (81.201)	lr 0.01251
Train [60][3180/3239]	Time 0.230 (1.136)	Data Time 0.000 (0.659)	Loss 2.6646 (2.6562)	Entropy 0.62954 (0.62868)	Top-1 acc 63.281 (59.932)	Top-5 acc 80.859 (81.202)	lr 0.01251
Train [60][3190/3239]	Time 0.228 (1.138)	Data Time 0.000 (0.660)	Loss 2.6504 (2.6562)	Entropy 0.62929 (0.62868)	Top-1 acc 61.328 (59.935)	Top-5 acc 81.250 (81.203)	lr 0.01251
Train [60][3200/3239]	Time 0.234 (1.139)	Data Time 0.000 (0.662)	Loss 2.8300 (2.6562)	Entropy 0.62884 (0.62868)	Top-1 acc 54.688 (59.930)	Top-5 acc 79.688 (81.203)	lr 0.01250
Train [60][3210/3239]	Time 0.394 (1.139)	Data Time 0.000 (0.662)	Loss 2.6460 (2.6562)	Entropy 0.62904 (0.62868)	Top-1 acc 60.938 (59.934)	Top-5 acc 79.297 (81.203)	lr 0.01250
Train [60][3220/3239]	Time 2.560 (1.138)	Data Time 2.314 (0.661)	Loss 2.4542 (2.6562)	Entropy 0.62922 (0.62868)	Top-1 acc 66.797 (59.938)	Top-5 acc 83.984 (81.203)	lr 0.01250
Train [60][3230/3239]	Time 0.241 (1.138)	Data Time 0.000 (0.662)	Loss 2.4890 (2.6561)	Entropy 0.62911 (0.62868)	Top-1 acc 62.109 (59.938)	Top-5 acc 85.547 (81.206)	lr 0.01250
Train [60][3239/3239]	Time 0.900 (1.137)	Data Time 0.000 (0.661)	Loss 2.6208 (2.6561)	Entropy 0.62898 (0.62868)	Top-1 acc 62.963 (59.941)	Top-5 acc 82.716 (81.206)	lr 0.01250
==========Valid [60/120]	loss 1.398	top-1 acc 67.769 (67.769)	top-5 acc 87.513	Train top-1 59.941	top-5 81.206	Entropy 0.62898	Latency-None: 0.000ms	Flops: 538.40M
Train [61][0/3239]	Time 58.105 (58.105)	Data Time 55.881 (55.881)	Loss 2.5828 (2.5828)	Entropy 0.62910 (0.62910)	Top-1 acc 62.500 (62.500)	Top-5 acc 82.422 (82.422)	lr 0.01250
Train [61][10/3239]	Time 0.231 (5.702)	Data Time 0.001 (5.106)	Loss 2.5907 (2.6017)	Entropy 0.62895 (0.62909)	Top-1 acc 60.547 (61.293)	Top-5 acc 83.203 (82.067)	lr 0.01250
Train [61][20/3239]	Time 0.255 (3.182)	Data Time 0.002 (2.675)	Loss 2.7094 (2.6450)	Entropy 0.62903 (0.62905)	Top-1 acc 60.156 (60.268)	Top-5 acc 81.641 (81.436)	lr 0.01250
Train [61][30/3239]	Time 0.252 (2.295)	Data Time 0.001 (1.813)	Loss 2.8004 (2.6398)	Entropy 0.62951 (0.62910)	Top-1 acc 59.766 (60.585)	Top-5 acc 78.516 (81.767)	lr 0.01250
Train [61][40/3239]	Time 0.339 (2.186)	Data Time 0.001 (1.718)	Loss 2.6404 (2.6218)	Entropy 0.62957 (0.62917)	Top-1 acc 56.250 (60.833)	Top-5 acc 82.031 (82.079)	lr 0.01250
Train [61][50/3239]	Time 0.239 (1.840)	Data Time 0.001 (1.381)	Loss 2.6633 (2.6302)	Entropy 0.62944 (0.62927)	Top-1 acc 58.203 (60.547)	Top-5 acc 82.422 (81.978)	lr 0.01249
Train [61][60/3239]	Time 0.243 (1.604)	Data Time 0.001 (1.155)	Loss 2.5774 (2.6288)	Entropy 0.62937 (0.62929)	Top-1 acc 62.109 (60.662)	Top-5 acc 84.766 (82.070)	lr 0.01249
Train [61][70/3239]	Time 0.240 (1.624)	Data Time 0.001 (1.177)	Loss 2.7945 (2.6353)	Entropy 0.62931 (0.62930)	Top-1 acc 54.688 (60.574)	Top-5 acc 77.734 (82.015)	lr 0.01249
Train [61][80/3239]	Time 0.238 (1.474)	Data Time 0.001 (1.032)	Loss 2.7258 (2.6374)	Entropy 0.62922 (0.62930)	Top-1 acc 57.422 (60.566)	Top-5 acc 79.688 (81.916)	lr 0.01249
Train [61][90/3239]	Time 0.230 (1.357)	Data Time 0.001 (0.918)	Loss 2.6213 (2.6448)	Entropy 0.62912 (0.62929)	Top-1 acc 61.719 (60.427)	Top-5 acc 83.203 (81.795)	lr 0.01249
Train [61][100/3239]	Time 0.298 (1.408)	Data Time 0.002 (0.966)	Loss 2.5420 (2.6448)	Entropy 0.62909 (0.62928)	Top-1 acc 62.500 (60.323)	Top-5 acc 83.984 (81.799)	lr 0.01249
Train [61][110/3239]	Time 0.277 (1.689)	Data Time 0.003 (0.880)	Loss 2.6570 (2.6433)	Entropy 0.62950 (0.62927)	Top-1 acc 59.375 (60.262)	Top-5 acc 82.031 (81.746)	lr 0.01249
Train [61][120/3239]	Time 0.232 (1.587)	Data Time 0.002 (0.808)	Loss 2.7158 (2.6375)	Entropy 0.62974 (0.62930)	Top-1 acc 57.422 (60.408)	Top-5 acc 83.984 (81.825)	lr 0.01249
Train [61][130/3239]	Time 0.272 (1.497)	Data Time 0.002 (0.746)	Loss 2.5055 (2.6345)	Entropy 0.62985 (0.62933)	Top-1 acc 63.281 (60.478)	Top-5 acc 84.766 (81.948)	lr 0.01249
Train [61][140/3239]	Time 0.246 (1.421)	Data Time 0.001 (0.694)	Loss 2.6832 (2.6310)	Entropy 0.62999 (0.62937)	Top-1 acc 59.375 (60.619)	Top-5 acc 83.203 (82.001)	lr 0.01249
Train [61][150/3239]	Time 0.238 (1.355)	Data Time 0.001 (0.648)	Loss 2.7597 (2.6337)	Entropy 0.63011 (0.62942)	Top-1 acc 57.031 (60.562)	Top-5 acc 80.859 (81.920)	lr 0.01248
Train [61][160/3239]	Time 0.257 (1.298)	Data Time 0.002 (0.608)	Loss 2.5994 (2.6342)	Entropy 0.62974 (0.62945)	Top-1 acc 60.938 (60.508)	Top-5 acc 82.422 (81.905)	lr 0.01248
Train [61][170/3239]	Time 0.255 (1.247)	Data Time 0.001 (0.572)	Loss 2.5432 (2.6355)	Entropy 0.62906 (0.62946)	Top-1 acc 59.375 (60.444)	Top-5 acc 83.594 (81.894)	lr 0.01248
Train [61][180/3239]	Time 0.246 (1.209)	Data Time 0.001 (0.545)	Loss 2.6192 (2.6371)	Entropy 0.62854 (0.62943)	Top-1 acc 62.109 (60.420)	Top-5 acc 82.812 (81.824)	lr 0.01248
Train [61][190/3239]	Time 0.240 (1.169)	Data Time 0.001 (0.517)	Loss 2.8676 (2.6388)	Entropy 0.62831 (0.62938)	Top-1 acc 56.641 (60.338)	Top-5 acc 76.172 (81.772)	lr 0.01248
Train [61][200/3239]	Time 0.355 (1.140)	Data Time 0.002 (0.499)	Loss 2.4756 (2.6405)	Entropy 0.62839 (0.62933)	Top-1 acc 66.406 (60.279)	Top-5 acc 82.812 (81.697)	lr 0.01248
Train [61][210/3239]	Time 0.261 (1.149)	Data Time 0.001 (0.515)	Loss 2.5983 (2.6408)	Entropy 0.62807 (0.62928)	Top-1 acc 60.938 (60.265)	Top-5 acc 80.469 (81.661)	lr 0.01248
Train [61][220/3239]	Time 0.266 (1.138)	Data Time 0.002 (0.512)	Loss 2.5995 (2.6426)	Entropy 0.62815 (0.62923)	Top-1 acc 62.109 (60.268)	Top-5 acc 81.641 (81.630)	lr 0.01248
Train [61][230/3239]	Time 0.260 (1.109)	Data Time 0.002 (0.490)	Loss 2.4824 (2.6437)	Entropy 0.62783 (0.62917)	Top-1 acc 63.672 (60.226)	Top-5 acc 84.375 (81.625)	lr 0.01248
Train [61][240/3239]	Time 0.242 (1.114)	Data Time 0.001 (0.503)	Loss 2.6380 (2.6435)	Entropy 0.62799 (0.62912)	Top-1 acc 58.984 (60.271)	Top-5 acc 79.688 (81.589)	lr 0.01248
Train [61][250/3239]	Time 0.244 (1.101)	Data Time 0.001 (0.497)	Loss 2.5678 (2.6434)	Entropy 0.62791 (0.62908)	Top-1 acc 60.547 (60.293)	Top-5 acc 82.812 (81.578)	lr 0.01247
Train [61][260/3239]	Time 0.241 (1.088)	Data Time 0.001 (0.491)	Loss 2.6251 (2.6444)	Entropy 0.62813 (0.62903)	Top-1 acc 62.109 (60.258)	Top-5 acc 82.031 (81.581)	lr 0.01247
Train [61][270/3239]	Time 0.369 (1.085)	Data Time 0.001 (0.493)	Loss 2.6221 (2.6445)	Entropy 0.62781 (0.62900)	Top-1 acc 60.547 (60.243)	Top-5 acc 82.422 (81.570)	lr 0.01247
Train [61][280/3239]	Time 0.278 (1.080)	Data Time 0.001 (0.493)	Loss 2.5466 (2.6426)	Entropy 0.62748 (0.62895)	Top-1 acc 64.062 (60.301)	Top-5 acc 80.078 (81.564)	lr 0.01247
Train [61][290/3239]	Time 0.247 (1.057)	Data Time 0.001 (0.476)	Loss 2.6956 (2.6426)	Entropy 0.62730 (0.62890)	Top-1 acc 62.109 (60.253)	Top-5 acc 78.516 (81.540)	lr 0.01247
Train [61][300/3239]	Time 1.425 (1.068)	Data Time 1.152 (0.492)	Loss 2.7674 (2.6409)	Entropy 0.62735 (0.62885)	Top-1 acc 57.812 (60.282)	Top-5 acc 76.953 (81.555)	lr 0.01247
Train [61][310/3239]	Time 0.289 (1.055)	Data Time 0.001 (0.482)	Loss 2.7493 (2.6418)	Entropy 0.62734 (0.62880)	Top-1 acc 60.156 (60.271)	Top-5 acc 78.516 (81.519)	lr 0.01247
Train [61][320/3239]	Time 0.246 (1.035)	Data Time 0.001 (0.467)	Loss 2.5226 (2.6424)	Entropy 0.62686 (0.62875)	Top-1 acc 64.062 (60.240)	Top-5 acc 84.375 (81.518)	lr 0.01247
Train [61][330/3239]	Time 5.283 (1.052)	Data Time 5.023 (0.488)	Loss 2.4498 (2.6412)	Entropy 0.62675 (0.62869)	Top-1 acc 65.234 (60.246)	Top-5 acc 86.328 (81.536)	lr 0.01247
Train [61][340/3239]	Time 0.237 (1.039)	Data Time 0.001 (0.478)	Loss 2.5811 (2.6414)	Entropy 0.62668 (0.62864)	Top-1 acc 62.109 (60.233)	Top-5 acc 81.250 (81.519)	lr 0.01247
Train [61][350/3239]	Time 0.248 (1.024)	Data Time 0.001 (0.468)	Loss 2.6370 (2.6422)	Entropy 0.62670 (0.62858)	Top-1 acc 60.156 (60.251)	Top-5 acc 79.297 (81.500)	lr 0.01246
Train [61][360/3239]	Time 0.354 (1.033)	Data Time 0.001 (0.479)	Loss 2.8233 (2.6415)	Entropy 0.62650 (0.62853)	Top-1 acc 55.859 (60.283)	Top-5 acc 78.906 (81.491)	lr 0.01246
Train [61][370/3239]	Time 0.254 (1.030)	Data Time 0.001 (0.480)	Loss 2.4669 (2.6416)	Entropy 0.62672 (0.62847)	Top-1 acc 64.453 (60.294)	Top-5 acc 85.547 (81.482)	lr 0.01246
Train [61][380/3239]	Time 0.246 (1.016)	Data Time 0.001 (0.470)	Loss 2.6650 (2.6403)	Entropy 0.62689 (0.62843)	Top-1 acc 60.156 (60.313)	Top-5 acc 82.812 (81.511)	lr 0.01246
Train [61][390/3239]	Time 0.248 (1.016)	Data Time 0.001 (0.472)	Loss 2.4803 (2.6379)	Entropy 0.62695 (0.62839)	Top-1 acc 60.547 (60.358)	Top-5 acc 84.375 (81.562)	lr 0.01246
Train [61][400/3239]	Time 1.152 (1.011)	Data Time 0.910 (0.471)	Loss 2.6132 (2.6400)	Entropy 0.62670 (0.62835)	Top-1 acc 62.109 (60.334)	Top-5 acc 83.594 (81.539)	lr 0.01246
Train [61][410/3239]	Time 0.279 (1.011)	Data Time 0.001 (0.473)	Loss 2.6198 (2.6393)	Entropy 0.62700 (0.62832)	Top-1 acc 60.156 (60.373)	Top-5 acc 82.422 (81.554)	lr 0.01246
Train [61][420/3239]	Time 0.251 (1.006)	Data Time 0.001 (0.469)	Loss 2.8487 (2.6403)	Entropy 0.62688 (0.62828)	Top-1 acc 60.547 (60.356)	Top-5 acc 76.172 (81.527)	lr 0.01246
Train [61][430/3239]	Time 0.394 (1.000)	Data Time 0.003 (0.465)	Loss 2.7743 (2.6404)	Entropy 0.62708 (0.62825)	Top-1 acc 58.984 (60.344)	Top-5 acc 77.344 (81.526)	lr 0.01246
Train [61][440/3239]	Time 0.243 (1.006)	Data Time 0.001 (0.473)	Loss 2.8079 (2.6401)	Entropy 0.62698 (0.62822)	Top-1 acc 55.859 (60.352)	Top-5 acc 78.125 (81.517)	lr 0.01246
Train [61][450/3239]	Time 0.236 (0.992)	Data Time 0.001 (0.463)	Loss 2.7639 (2.6408)	Entropy 0.62715 (0.62820)	Top-1 acc 58.203 (60.337)	Top-5 acc 77.344 (81.502)	lr 0.01245
Train [61][460/3239]	Time 0.274 (0.996)	Data Time 0.002 (0.468)	Loss 2.7552 (2.6414)	Entropy 0.62721 (0.62818)	Top-1 acc 57.031 (60.325)	Top-5 acc 79.688 (81.490)	lr 0.01245
Train [61][470/3239]	Time 3.357 (0.994)	Data Time 3.092 (0.468)	Loss 2.8104 (2.6429)	Entropy 0.62738 (0.62816)	Top-1 acc 58.594 (60.296)	Top-5 acc 76.172 (81.446)	lr 0.01245
Train [61][480/3239]	Time 0.239 (0.982)	Data Time 0.001 (0.459)	Loss 2.6948 (2.6427)	Entropy 0.62718 (0.62814)	Top-1 acc 56.250 (60.289)	Top-5 acc 79.688 (81.444)	lr 0.01245
Train [61][490/3239]	Time 4.435 (0.984)	Data Time 4.181 (0.462)	Loss 2.5706 (2.6437)	Entropy 0.62740 (0.62812)	Top-1 acc 58.203 (60.257)	Top-5 acc 83.594 (81.422)	lr 0.01245
Train [61][500/3239]	Time 0.241 (0.984)	Data Time 0.001 (0.463)	Loss 2.6236 (2.6431)	Entropy 0.62715 (0.62811)	Top-1 acc 60.156 (60.265)	Top-5 acc 80.859 (81.430)	lr 0.01245
Train [61][510/3239]	Time 0.275 (0.976)	Data Time 0.001 (0.458)	Loss 2.6949 (2.6431)	Entropy 0.62707 (0.62809)	Top-1 acc 58.203 (60.256)	Top-5 acc 82.031 (81.430)	lr 0.01245
Train [61][520/3239]	Time 0.284 (0.973)	Data Time 0.001 (0.456)	Loss 2.5452 (2.6436)	Entropy 0.62706 (0.62807)	Top-1 acc 60.938 (60.230)	Top-5 acc 84.375 (81.428)	lr 0.01245
Train [61][530/3239]	Time 0.248 (0.979)	Data Time 0.001 (0.463)	Loss 2.5996 (2.6418)	Entropy 0.62709 (0.62805)	Top-1 acc 62.500 (60.272)	Top-5 acc 84.375 (81.461)	lr 0.01245
Train [61][540/3239]	Time 0.233 (0.973)	Data Time 0.001 (0.460)	Loss 2.6804 (2.6423)	Entropy 0.62728 (0.62803)	Top-1 acc 58.984 (60.263)	Top-5 acc 80.078 (81.447)	lr 0.01245
Train [61][550/3239]	Time 0.252 (0.970)	Data Time 0.001 (0.457)	Loss 2.5269 (2.6417)	Entropy 0.62737 (0.62801)	Top-1 acc 60.938 (60.274)	Top-5 acc 83.984 (81.452)	lr 0.01244
Train [61][560/3239]	Time 1.265 (0.978)	Data Time 1.014 (0.467)	Loss 2.6698 (2.6432)	Entropy 0.62718 (0.62800)	Top-1 acc 57.422 (60.240)	Top-5 acc 79.297 (81.430)	lr 0.01244
Train [61][570/3239]	Time 0.234 (0.978)	Data Time 0.001 (0.468)	Loss 2.6084 (2.6434)	Entropy 0.62718 (0.62799)	Top-1 acc 64.062 (60.251)	Top-5 acc 80.469 (81.432)	lr 0.01244
Train [61][580/3239]	Time 0.265 (0.969)	Data Time 0.001 (0.460)	Loss 2.7638 (2.6440)	Entropy 0.62737 (0.62798)	Top-1 acc 57.031 (60.242)	Top-5 acc 79.688 (81.425)	lr 0.01244
Train [61][590/3239]	Time 0.333 (0.979)	Data Time 0.001 (0.472)	Loss 2.7582 (2.6436)	Entropy 0.62754 (0.62797)	Top-1 acc 58.594 (60.255)	Top-5 acc 80.078 (81.442)	lr 0.01244
Train [61][600/3239]	Time 0.273 (0.976)	Data Time 0.001 (0.471)	Loss 2.3655 (2.6435)	Entropy 0.62738 (0.62796)	Top-1 acc 66.406 (60.249)	Top-5 acc 86.719 (81.449)	lr 0.01244
Train [61][610/3239]	Time 0.240 (0.968)	Data Time 0.001 (0.463)	Loss 2.7801 (2.6432)	Entropy 0.62745 (0.62795)	Top-1 acc 57.031 (60.259)	Top-5 acc 78.906 (81.455)	lr 0.01244
Train [61][620/3239]	Time 0.238 (0.979)	Data Time 0.001 (0.475)	Loss 2.5894 (2.6431)	Entropy 0.62769 (0.62794)	Top-1 acc 63.672 (60.270)	Top-5 acc 81.641 (81.456)	lr 0.01244
Train [61][630/3239]	Time 0.242 (0.974)	Data Time 0.001 (0.471)	Loss 2.7137 (2.6424)	Entropy 0.62751 (0.62794)	Top-1 acc 56.641 (60.287)	Top-5 acc 78.906 (81.458)	lr 0.01244
Train [61][640/3239]	Time 0.259 (0.970)	Data Time 0.001 (0.469)	Loss 2.5314 (2.6424)	Entropy 0.62738 (0.62793)	Top-1 acc 62.500 (60.283)	Top-5 acc 83.984 (81.464)	lr 0.01244
Train [61][650/3239]	Time 12.383 (0.981)	Data Time 12.103 (0.480)	Loss 2.6817 (2.6417)	Entropy 0.62757 (0.62792)	Top-1 acc 57.812 (60.301)	Top-5 acc 80.859 (81.473)	lr 0.01243
Train [61][660/3239]	Time 0.318 (0.973)	Data Time 0.001 (0.474)	Loss 2.7325 (2.6423)	Entropy 0.62755 (0.62792)	Top-1 acc 59.766 (60.284)	Top-5 acc 80.859 (81.461)	lr 0.01243
Train [61][670/3239]	Time 0.260 (0.973)	Data Time 0.001 (0.475)	Loss 2.7481 (2.6431)	Entropy 0.62710 (0.62791)	Top-1 acc 57.031 (60.277)	Top-5 acc 77.734 (81.437)	lr 0.01243
Train [61][680/3239]	Time 0.261 (0.966)	Data Time 0.001 (0.469)	Loss 2.3711 (2.6429)	Entropy 0.62718 (0.62790)	Top-1 acc 71.875 (60.301)	Top-5 acc 85.156 (81.438)	lr 0.01243
Train [61][690/3239]	Time 0.237 (0.982)	Data Time 0.001 (0.486)	Loss 2.9264 (2.6442)	Entropy 0.62681 (0.62788)	Top-1 acc 53.125 (60.279)	Top-5 acc 76.953 (81.417)	lr 0.01243
Train [61][700/3239]	Time 0.247 (0.979)	Data Time 0.001 (0.485)	Loss 2.7724 (2.6449)	Entropy 0.62684 (0.62787)	Top-1 acc 54.297 (60.270)	Top-5 acc 81.250 (81.421)	lr 0.01243
Train [61][710/3239]	Time 0.238 (0.976)	Data Time 0.001 (0.483)	Loss 2.5535 (2.6430)	Entropy 0.62685 (0.62786)	Top-1 acc 59.766 (60.313)	Top-5 acc 80.078 (81.442)	lr 0.01243
Train [61][720/3239]	Time 4.757 (0.986)	Data Time 4.505 (0.493)	Loss 2.6498 (2.6428)	Entropy 0.62676 (0.62784)	Top-1 acc 58.594 (60.298)	Top-5 acc 80.859 (81.449)	lr 0.01243
Train [61][730/3239]	Time 0.318 (0.986)	Data Time 0.001 (0.495)	Loss 2.4902 (2.6420)	Entropy 0.62692 (0.62783)	Top-1 acc 66.797 (60.315)	Top-5 acc 81.641 (81.462)	lr 0.01243
Train [61][740/3239]	Time 0.245 (0.979)	Data Time 0.001 (0.488)	Loss 2.5360 (2.6415)	Entropy 0.62730 (0.62782)	Top-1 acc 62.891 (60.334)	Top-5 acc 82.422 (81.467)	lr 0.01243
Train [61][750/3239]	Time 1.453 (0.980)	Data Time 1.081 (0.490)	Loss 2.5421 (2.6415)	Entropy 0.62757 (0.62781)	Top-1 acc 61.719 (60.328)	Top-5 acc 83.984 (81.469)	lr 0.01242
Train [61][760/3239]	Time 0.370 (1.035)	Data Time 0.006 (0.501)	Loss 2.6684 (2.6408)	Entropy 0.62736 (0.62781)	Top-1 acc 60.547 (60.365)	Top-5 acc 82.031 (81.478)	lr 0.01242
Train [61][770/3239]	Time 0.237 (1.028)	Data Time 0.002 (0.494)	Loss 2.7372 (2.6412)	Entropy 0.62703 (0.62780)	Top-1 acc 60.547 (60.360)	Top-5 acc 78.516 (81.468)	lr 0.01242
Train [61][780/3239]	Time 0.254 (1.021)	Data Time 0.002 (0.488)	Loss 2.6693 (2.6415)	Entropy 0.62705 (0.62779)	Top-1 acc 58.594 (60.342)	Top-5 acc 82.812 (81.464)	lr 0.01242
Train [61][790/3239]	Time 0.241 (1.013)	Data Time 0.002 (0.482)	Loss 2.8966 (2.6416)	Entropy 0.62710 (0.62778)	Top-1 acc 53.125 (60.339)	Top-5 acc 75.391 (81.455)	lr 0.01242
Train [61][800/3239]	Time 0.235 (1.006)	Data Time 0.001 (0.476)	Loss 2.7856 (2.6423)	Entropy 0.62718 (0.62777)	Top-1 acc 55.859 (60.319)	Top-5 acc 76.562 (81.450)	lr 0.01242
Train [61][810/3239]	Time 0.260 (0.999)	Data Time 0.002 (0.470)	Loss 2.8453 (2.6430)	Entropy 0.62738 (0.62777)	Top-1 acc 58.984 (60.306)	Top-5 acc 76.953 (81.441)	lr 0.01242
Train [61][820/3239]	Time 0.384 (0.993)	Data Time 0.002 (0.464)	Loss 2.7706 (2.6430)	Entropy 0.62729 (0.62776)	Top-1 acc 58.203 (60.295)	Top-5 acc 75.000 (81.436)	lr 0.01242
Train [61][830/3239]	Time 0.251 (0.992)	Data Time 0.001 (0.465)	Loss 2.4518 (2.6433)	Entropy 0.62739 (0.62776)	Top-1 acc 63.281 (60.291)	Top-5 acc 84.375 (81.438)	lr 0.01242
Train [61][840/3239]	Time 0.243 (0.986)	Data Time 0.001 (0.460)	Loss 2.5618 (2.6431)	Entropy 0.62713 (0.62775)	Top-1 acc 62.891 (60.298)	Top-5 acc 81.250 (81.440)	lr 0.01242
Train [61][850/3239]	Time 0.248 (0.990)	Data Time 0.001 (0.464)	Loss 2.6739 (2.6438)	Entropy 0.62690 (0.62774)	Top-1 acc 60.156 (60.286)	Top-5 acc 80.078 (81.419)	lr 0.01241
Train [61][860/3239]	Time 0.254 (0.993)	Data Time 0.001 (0.468)	Loss 2.4608 (2.6436)	Entropy 0.62692 (0.62773)	Top-1 acc 62.891 (60.288)	Top-5 acc 84.375 (81.428)	lr 0.01241
Train [61][870/3239]	Time 0.251 (0.990)	Data Time 0.001 (0.466)	Loss 2.6829 (2.6434)	Entropy 0.62651 (0.62772)	Top-1 acc 57.031 (60.293)	Top-5 acc 78.906 (81.432)	lr 0.01241
Train [61][880/3239]	Time 0.245 (0.987)	Data Time 0.001 (0.464)	Loss 2.6711 (2.6440)	Entropy 0.62658 (0.62771)	Top-1 acc 58.984 (60.289)	Top-5 acc 77.344 (81.418)	lr 0.01241
Train [61][890/3239]	Time 0.238 (0.993)	Data Time 0.001 (0.471)	Loss 2.5067 (2.6436)	Entropy 0.62676 (0.62770)	Top-1 acc 62.109 (60.278)	Top-5 acc 84.766 (81.433)	lr 0.01241
Train [61][900/3239]	Time 0.267 (0.994)	Data Time 0.001 (0.473)	Loss 2.5828 (2.6430)	Entropy 0.62672 (0.62769)	Top-1 acc 60.547 (60.287)	Top-5 acc 82.812 (81.450)	lr 0.01241
Train [61][910/3239]	Time 0.385 (0.990)	Data Time 0.001 (0.469)	Loss 2.6067 (2.6426)	Entropy 0.62687 (0.62768)	Top-1 acc 62.500 (60.288)	Top-5 acc 83.203 (81.464)	lr 0.01241
Train [61][920/3239]	Time 1.548 (0.995)	Data Time 1.232 (0.475)	Loss 2.6539 (2.6433)	Entropy 0.62670 (0.62767)	Top-1 acc 58.984 (60.262)	Top-5 acc 80.078 (81.448)	lr 0.01241
Train [61][930/3239]	Time 0.990 (0.999)	Data Time 0.740 (0.480)	Loss 2.6982 (2.6429)	Entropy 0.62670 (0.62766)	Top-1 acc 57.031 (60.265)	Top-5 acc 80.078 (81.451)	lr 0.01241
Train [61][940/3239]	Time 0.242 (0.993)	Data Time 0.001 (0.475)	Loss 2.5589 (2.6426)	Entropy 0.62641 (0.62765)	Top-1 acc 62.891 (60.270)	Top-5 acc 83.984 (81.457)	lr 0.01241
Train [61][950/3239]	Time 0.242 (0.997)	Data Time 0.001 (0.480)	Loss 2.5345 (2.6418)	Entropy 0.62643 (0.62763)	Top-1 acc 64.844 (60.295)	Top-5 acc 82.031 (81.475)	lr 0.01240
Train [61][960/3239]	Time 0.241 (1.001)	Data Time 0.001 (0.485)	Loss 2.6173 (2.6418)	Entropy 0.62672 (0.62762)	Top-1 acc 59.766 (60.304)	Top-5 acc 81.641 (81.474)	lr 0.01240
Train [61][970/3239]	Time 3.385 (1.000)	Data Time 3.111 (0.484)	Loss 2.6758 (2.6416)	Entropy 0.62659 (0.62761)	Top-1 acc 60.938 (60.319)	Top-5 acc 80.859 (81.479)	lr 0.01240
Train [61][980/3239]	Time 0.335 (0.999)	Data Time 0.001 (0.484)	Loss 2.6226 (2.6410)	Entropy 0.62650 (0.62760)	Top-1 acc 59.375 (60.335)	Top-5 acc 80.859 (81.492)	lr 0.01240
Train [61][990/3239]	Time 0.233 (1.008)	Data Time 0.001 (0.494)	Loss 2.8311 (2.6411)	Entropy 0.62665 (0.62759)	Top-1 acc 54.297 (60.336)	Top-5 acc 78.125 (81.492)	lr 0.01240
Train [61][1000/3239]	Time 0.225 (1.003)	Data Time 0.003 (0.491)	Loss 2.5815 (2.6417)	Entropy 0.62640 (0.62758)	Top-1 acc 58.203 (60.309)	Top-5 acc 81.641 (81.478)	lr 0.01240
Train [61][1010/3239]	Time 0.240 (1.000)	Data Time 0.001 (0.488)	Loss 2.6275 (2.6412)	Entropy 0.62663 (0.62757)	Top-1 acc 61.328 (60.310)	Top-5 acc 79.688 (81.489)	lr 0.01240
Train [61][1020/3239]	Time 0.244 (1.011)	Data Time 0.001 (0.500)	Loss 2.6909 (2.6412)	Entropy 0.62621 (0.62756)	Top-1 acc 57.031 (60.306)	Top-5 acc 80.859 (81.498)	lr 0.01240
Train [61][1030/3239]	Time 0.230 (1.009)	Data Time 0.001 (0.499)	Loss 2.6750 (2.6415)	Entropy 0.62623 (0.62755)	Top-1 acc 58.203 (60.298)	Top-5 acc 79.297 (81.497)	lr 0.01240
Train [61][1040/3239]	Time 0.237 (1.004)	Data Time 0.001 (0.495)	Loss 2.7335 (2.6417)	Entropy 0.62645 (0.62754)	Top-1 acc 58.203 (60.290)	Top-5 acc 82.422 (81.503)	lr 0.01239
Train [61][1050/3239]	Time 0.235 (1.015)	Data Time 0.001 (0.506)	Loss 2.5150 (2.6418)	Entropy 0.62629 (0.62752)	Top-1 acc 60.938 (60.298)	Top-5 acc 83.203 (81.505)	lr 0.01239
Train [61][1060/3239]	Time 0.233 (1.020)	Data Time 0.001 (0.512)	Loss 2.6110 (2.6414)	Entropy 0.62611 (0.62751)	Top-1 acc 62.891 (60.310)	Top-5 acc 80.078 (81.516)	lr 0.01239
Train [61][1070/3239]	Time 0.246 (1.014)	Data Time 0.001 (0.508)	Loss 2.5350 (2.6413)	Entropy 0.62614 (0.62750)	Top-1 acc 67.969 (60.325)	Top-5 acc 84.375 (81.518)	lr 0.01239
Train [61][1080/3239]	Time 4.518 (1.018)	Data Time 4.251 (0.513)	Loss 2.7472 (2.6409)	Entropy 0.62612 (0.62749)	Top-1 acc 61.719 (60.339)	Top-5 acc 80.078 (81.522)	lr 0.01239
Train [61][1090/3239]	Time 5.590 (1.023)	Data Time 5.353 (0.518)	Loss 2.7895 (2.6410)	Entropy 0.62647 (0.62747)	Top-1 acc 54.688 (60.327)	Top-5 acc 78.125 (81.522)	lr 0.01239
Train [61][1100/3239]	Time 0.237 (1.017)	Data Time 0.001 (0.513)	Loss 2.5747 (2.6410)	Entropy 0.62644 (0.62747)	Top-1 acc 64.844 (60.333)	Top-5 acc 83.203 (81.524)	lr 0.01239
Train [61][1110/3239]	Time 0.231 (1.019)	Data Time 0.001 (0.516)	Loss 2.6158 (2.6414)	Entropy 0.62649 (0.62746)	Top-1 acc 60.938 (60.314)	Top-5 acc 83.594 (81.514)	lr 0.01239
Train [61][1120/3239]	Time 0.249 (1.022)	Data Time 0.001 (0.519)	Loss 2.8484 (2.6414)	Entropy 0.62643 (0.62745)	Top-1 acc 55.469 (60.303)	Top-5 acc 76.953 (81.511)	lr 0.01239
Train [61][1130/3239]	Time 0.254 (1.024)	Data Time 0.005 (0.521)	Loss 2.5923 (2.6417)	Entropy 0.62628 (0.62744)	Top-1 acc 60.938 (60.291)	Top-5 acc 83.203 (81.500)	lr 0.01239
Train [61][1140/3239]	Time 0.348 (1.020)	Data Time 0.001 (0.519)	Loss 2.8063 (2.6419)	Entropy 0.62653 (0.62743)	Top-1 acc 53.906 (60.290)	Top-5 acc 78.125 (81.493)	lr 0.01238
Train [61][1150/3239]	Time 0.239 (1.031)	Data Time 0.001 (0.530)	Loss 2.7406 (2.6418)	Entropy 0.62621 (0.62742)	Top-1 acc 55.469 (60.295)	Top-5 acc 81.641 (81.499)	lr 0.01238
Train [61][1160/3239]	Time 0.441 (1.029)	Data Time 0.194 (0.529)	Loss 2.8545 (2.6423)	Entropy 0.62634 (0.62741)	Top-1 acc 53.906 (60.281)	Top-5 acc 77.344 (81.490)	lr 0.01238
Train [61][1170/3239]	Time 0.234 (1.030)	Data Time 0.001 (0.531)	Loss 2.6876 (2.6422)	Entropy 0.62633 (0.62740)	Top-1 acc 57.031 (60.275)	Top-5 acc 80.078 (81.487)	lr 0.01238
Train [61][1180/3239]	Time 0.254 (1.040)	Data Time 0.001 (0.542)	Loss 2.6690 (2.6423)	Entropy 0.62641 (0.62739)	Top-1 acc 58.203 (60.268)	Top-5 acc 80.078 (81.481)	lr 0.01238
Train [61][1190/3239]	Time 0.265 (1.037)	Data Time 0.002 (0.539)	Loss 2.7177 (2.6427)	Entropy 0.62639 (0.62738)	Top-1 acc 58.203 (60.264)	Top-5 acc 79.688 (81.468)	lr 0.01238
Train [61][1200/3239]	Time 0.241 (1.043)	Data Time 0.001 (0.545)	Loss 2.6638 (2.6434)	Entropy 0.62663 (0.62737)	Top-1 acc 60.156 (60.254)	Top-5 acc 82.031 (81.459)	lr 0.01238
Train [61][1210/3239]	Time 0.358 (1.049)	Data Time 0.001 (0.552)	Loss 2.5380 (2.6431)	Entropy 0.62664 (0.62737)	Top-1 acc 61.328 (60.264)	Top-5 acc 83.594 (81.460)	lr 0.01238
Train [61][1220/3239]	Time 0.232 (1.048)	Data Time 0.001 (0.552)	Loss 2.8264 (2.6436)	Entropy 0.62675 (0.62736)	Top-1 acc 56.250 (60.262)	Top-5 acc 80.469 (81.450)	lr 0.01238
Train [61][1230/3239]	Time 0.225 (1.050)	Data Time 0.001 (0.554)	Loss 2.7928 (2.6439)	Entropy 0.62671 (0.62736)	Top-1 acc 57.812 (60.254)	Top-5 acc 76.953 (81.445)	lr 0.01238
Train [61][1240/3239]	Time 9.115 (1.056)	Data Time 8.874 (0.561)	Loss 2.7737 (2.6437)	Entropy 0.62703 (0.62735)	Top-1 acc 54.297 (60.250)	Top-5 acc 77.734 (81.447)	lr 0.01237
Train [61][1250/3239]	Time 0.980 (1.055)	Data Time 0.747 (0.560)	Loss 2.6211 (2.6443)	Entropy 0.62688 (0.62735)	Top-1 acc 62.500 (60.241)	Top-5 acc 79.297 (81.432)	lr 0.01237
Train [61][1260/3239]	Time 0.251 (1.058)	Data Time 0.001 (0.564)	Loss 2.5533 (2.6443)	Entropy 0.62688 (0.62735)	Top-1 acc 62.891 (60.243)	Top-5 acc 81.250 (81.425)	lr 0.01237
Train [61][1270/3239]	Time 0.233 (1.059)	Data Time 0.001 (0.566)	Loss 2.5965 (2.6444)	Entropy 0.62661 (0.62734)	Top-1 acc 63.281 (60.244)	Top-5 acc 81.641 (81.425)	lr 0.01237
Train [61][1280/3239]	Time 0.273 (1.064)	Data Time 0.003 (0.571)	Loss 2.6599 (2.6449)	Entropy 0.62634 (0.62734)	Top-1 acc 59.766 (60.228)	Top-5 acc 81.250 (81.413)	lr 0.01237
Train [61][1290/3239]	Time 6.749 (1.070)	Data Time 6.513 (0.578)	Loss 2.4764 (2.6447)	Entropy 0.62638 (0.62733)	Top-1 acc 65.234 (60.237)	Top-5 acc 84.766 (81.417)	lr 0.01237
Train [61][1300/3239]	Time 0.322 (1.067)	Data Time 0.001 (0.575)	Loss 2.7176 (2.6446)	Entropy 0.62637 (0.62732)	Top-1 acc 60.156 (60.241)	Top-5 acc 79.297 (81.413)	lr 0.01237
Train [61][1310/3239]	Time 0.251 (1.070)	Data Time 0.001 (0.579)	Loss 2.9377 (2.6453)	Entropy 0.62627 (0.62731)	Top-1 acc 53.906 (60.227)	Top-5 acc 75.000 (81.402)	lr 0.01237
Train [61][1320/3239]	Time 0.255 (1.070)	Data Time 0.001 (0.580)	Loss 2.4261 (2.6454)	Entropy 0.62634 (0.62731)	Top-1 acc 65.625 (60.225)	Top-5 acc 88.281 (81.403)	lr 0.01237
Train [61][1330/3239]	Time 0.242 (1.072)	Data Time 0.001 (0.582)	Loss 2.7818 (2.6454)	Entropy 0.62615 (0.62730)	Top-1 acc 54.297 (60.219)	Top-5 acc 79.297 (81.403)	lr 0.01237
Train [61][1340/3239]	Time 0.233 (1.075)	Data Time 0.001 (0.586)	Loss 2.4094 (2.6456)	Entropy 0.62605 (0.62729)	Top-1 acc 67.188 (60.218)	Top-5 acc 85.547 (81.398)	lr 0.01236
Train [61][1350/3239]	Time 0.246 (1.070)	Data Time 0.001 (0.581)	Loss 2.6490 (2.6463)	Entropy 0.62599 (0.62728)	Top-1 acc 58.203 (60.200)	Top-5 acc 79.297 (81.384)	lr 0.01236
Train [61][1360/3239]	Time 0.233 (1.076)	Data Time 0.001 (0.588)	Loss 2.7042 (2.6464)	Entropy 0.62609 (0.62727)	Top-1 acc 61.328 (60.201)	Top-5 acc 80.859 (81.386)	lr 0.01236
Train [61][1370/3239]	Time 0.324 (1.073)	Data Time 0.001 (0.586)	Loss 2.4943 (2.6467)	Entropy 0.62568 (0.62726)	Top-1 acc 64.453 (60.194)	Top-5 acc 82.812 (81.379)	lr 0.01236
Train [61][1380/3239]	Time 0.233 (1.073)	Data Time 0.001 (0.586)	Loss 2.7495 (2.6469)	Entropy 0.62562 (0.62725)	Top-1 acc 58.203 (60.186)	Top-5 acc 76.953 (81.371)	lr 0.01236
Train [61][1390/3239]	Time 0.237 (1.080)	Data Time 0.001 (0.593)	Loss 2.6045 (2.6472)	Entropy 0.62569 (0.62724)	Top-1 acc 63.672 (60.180)	Top-5 acc 78.516 (81.368)	lr 0.01236
Train [61][1400/3239]	Time 0.243 (1.075)	Data Time 0.001 (0.589)	Loss 2.4457 (2.6474)	Entropy 0.62548 (0.62723)	Top-1 acc 67.188 (60.168)	Top-5 acc 83.984 (81.357)	lr 0.01236
Train [61][1410/3239]	Time 0.241 (1.076)	Data Time 0.001 (0.591)	Loss 2.6310 (2.6476)	Entropy 0.62547 (0.62722)	Top-1 acc 60.156 (60.165)	Top-5 acc 81.641 (81.355)	lr 0.01236
Train [61][1420/3239]	Time 0.299 (1.096)	Data Time 0.003 (0.587)	Loss 2.7275 (2.6477)	Entropy 0.62589 (0.62720)	Top-1 acc 57.422 (60.166)	Top-5 acc 79.297 (81.348)	lr 0.01236
Train [61][1430/3239]	Time 0.243 (1.092)	Data Time 0.001 (0.583)	Loss 2.5853 (2.6477)	Entropy 0.62616 (0.62720)	Top-1 acc 60.156 (60.162)	Top-5 acc 82.031 (81.351)	lr 0.01236
Train [61][1440/3239]	Time 0.237 (1.087)	Data Time 0.001 (0.579)	Loss 2.5871 (2.6479)	Entropy 0.62641 (0.62719)	Top-1 acc 58.203 (60.161)	Top-5 acc 83.984 (81.347)	lr 0.01235
Train [61][1450/3239]	Time 4.439 (1.086)	Data Time 4.125 (0.578)	Loss 2.5831 (2.6478)	Entropy 0.62632 (0.62718)	Top-1 acc 63.281 (60.162)	Top-5 acc 83.984 (81.346)	lr 0.01235
Train [61][1460/3239]	Time 0.342 (1.081)	Data Time 0.001 (0.574)	Loss 2.5968 (2.6477)	Entropy 0.62654 (0.62718)	Top-1 acc 60.938 (60.165)	Top-5 acc 81.250 (81.348)	lr 0.01235
Train [61][1470/3239]	Time 4.212 (1.083)	Data Time 3.938 (0.577)	Loss 2.5976 (2.6480)	Entropy 0.62671 (0.62717)	Top-1 acc 64.062 (60.159)	Top-5 acc 83.984 (81.343)	lr 0.01235
Train [61][1480/3239]	Time 0.254 (1.081)	Data Time 0.001 (0.575)	Loss 2.6786 (2.6478)	Entropy 0.62707 (0.62717)	Top-1 acc 60.547 (60.164)	Top-5 acc 82.031 (81.352)	lr 0.01235
Train [61][1490/3239]	Time 0.248 (1.086)	Data Time 0.001 (0.580)	Loss 2.6818 (2.6479)	Entropy 0.62679 (0.62717)	Top-1 acc 59.375 (60.170)	Top-5 acc 80.469 (81.350)	lr 0.01235
Train [61][1500/3239]	Time 0.247 (1.087)	Data Time 0.001 (0.582)	Loss 2.6657 (2.6480)	Entropy 0.62676 (0.62717)	Top-1 acc 57.812 (60.172)	Top-5 acc 82.422 (81.348)	lr 0.01235
Train [61][1510/3239]	Time 0.261 (1.082)	Data Time 0.001 (0.578)	Loss 2.6654 (2.6478)	Entropy 0.62645 (0.62717)	Top-1 acc 58.594 (60.170)	Top-5 acc 82.031 (81.355)	lr 0.01235
Train [61][1520/3239]	Time 0.226 (1.088)	Data Time 0.001 (0.584)	Loss 2.5592 (2.6475)	Entropy 0.62641 (0.62716)	Top-1 acc 60.938 (60.174)	Top-5 acc 83.203 (81.359)	lr 0.01235
Train [61][1530/3239]	Time 0.328 (1.087)	Data Time 0.001 (0.583)	Loss 2.6124 (2.6480)	Entropy 0.62655 (0.62716)	Top-1 acc 61.719 (60.159)	Top-5 acc 83.594 (81.352)	lr 0.01235
Train [61][1540/3239]	Time 0.229 (1.087)	Data Time 0.001 (0.584)	Loss 2.6900 (2.6478)	Entropy 0.62668 (0.62715)	Top-1 acc 58.984 (60.163)	Top-5 acc 80.469 (81.353)	lr 0.01234
Train [61][1550/3239]	Time 0.227 (1.092)	Data Time 0.001 (0.590)	Loss 2.8233 (2.6477)	Entropy 0.62682 (0.62715)	Top-1 acc 57.031 (60.165)	Top-5 acc 78.125 (81.359)	lr 0.01234
Train [61][1560/3239]	Time 0.223 (1.090)	Data Time 0.001 (0.588)	Loss 2.7859 (2.6479)	Entropy 0.62669 (0.62715)	Top-1 acc 57.812 (60.159)	Top-5 acc 76.953 (81.352)	lr 0.01234
Train [61][1570/3239]	Time 0.233 (1.091)	Data Time 0.001 (0.590)	Loss 2.6927 (2.6479)	Entropy 0.62700 (0.62714)	Top-1 acc 59.375 (60.161)	Top-5 acc 80.469 (81.355)	lr 0.01234
Train [61][1580/3239]	Time 0.253 (1.097)	Data Time 0.001 (0.596)	Loss 2.5990 (2.6484)	Entropy 0.62746 (0.62714)	Top-1 acc 63.281 (60.147)	Top-5 acc 81.641 (81.348)	lr 0.01234
Train [61][1590/3239]	Time 0.240 (1.093)	Data Time 0.001 (0.593)	Loss 2.7018 (2.6487)	Entropy 0.62725 (0.62715)	Top-1 acc 56.641 (60.143)	Top-5 acc 80.469 (81.343)	lr 0.01234
Train [61][1600/3239]	Time 0.244 (1.095)	Data Time 0.001 (0.595)	Loss 2.5975 (2.6487)	Entropy 0.62748 (0.62715)	Top-1 acc 66.797 (60.146)	Top-5 acc 83.203 (81.345)	lr 0.01234
Train [61][1610/3239]	Time 15.685 (1.100)	Data Time 15.421 (0.601)	Loss 2.7158 (2.6492)	Entropy 0.62734 (0.62715)	Top-1 acc 57.031 (60.131)	Top-5 acc 79.688 (81.335)	lr 0.01234
Train [61][1620/3239]	Time 0.364 (1.096)	Data Time 0.001 (0.597)	Loss 2.8003 (2.6492)	Entropy 0.62710 (0.62715)	Top-1 acc 55.078 (60.134)	Top-5 acc 81.641 (81.332)	lr 0.01234
Train [61][1630/3239]	Time 0.245 (1.097)	Data Time 0.001 (0.598)	Loss 2.6565 (2.6491)	Entropy 0.62727 (0.62715)	Top-1 acc 57.031 (60.133)	Top-5 acc 78.906 (81.333)	lr 0.01234
Train [61][1640/3239]	Time 0.254 (1.094)	Data Time 0.001 (0.595)	Loss 2.8034 (2.6495)	Entropy 0.62722 (0.62715)	Top-1 acc 56.250 (60.118)	Top-5 acc 75.781 (81.330)	lr 0.01233
Train [61][1650/3239]	Time 0.241 (1.100)	Data Time 0.001 (0.602)	Loss 2.5869 (2.6495)	Entropy 0.62701 (0.62715)	Top-1 acc 66.797 (60.118)	Top-5 acc 82.031 (81.330)	lr 0.01233
Train [61][1660/3239]	Time 0.288 (1.103)	Data Time 0.001 (0.605)	Loss 2.6327 (2.6493)	Entropy 0.62743 (0.62715)	Top-1 acc 60.156 (60.123)	Top-5 acc 81.641 (81.333)	lr 0.01233
Train [61][1670/3239]	Time 0.232 (1.099)	Data Time 0.001 (0.602)	Loss 2.6417 (2.6496)	Entropy 0.62678 (0.62715)	Top-1 acc 61.719 (60.117)	Top-5 acc 79.297 (81.325)	lr 0.01233
Train [61][1680/3239]	Time 1.804 (1.104)	Data Time 1.569 (0.608)	Loss 2.5642 (2.6495)	Entropy 0.62664 (0.62715)	Top-1 acc 60.156 (60.120)	Top-5 acc 82.812 (81.326)	lr 0.01233
Train [61][1690/3239]	Time 0.319 (1.100)	Data Time 0.001 (0.604)	Loss 2.6325 (2.6492)	Entropy 0.62689 (0.62715)	Top-1 acc 60.156 (60.132)	Top-5 acc 80.859 (81.327)	lr 0.01233
Train [61][1700/3239]	Time 0.233 (1.102)	Data Time 0.001 (0.607)	Loss 2.5754 (2.6491)	Entropy 0.62705 (0.62715)	Top-1 acc 62.109 (60.134)	Top-5 acc 81.250 (81.327)	lr 0.01233
Train [61][1710/3239]	Time 0.261 (1.106)	Data Time 0.002 (0.611)	Loss 2.5666 (2.6488)	Entropy 0.62696 (0.62714)	Top-1 acc 62.500 (60.144)	Top-5 acc 84.766 (81.331)	lr 0.01233
Train [61][1720/3239]	Time 0.232 (1.104)	Data Time 0.001 (0.610)	Loss 2.7168 (2.6486)	Entropy 0.62725 (0.62714)	Top-1 acc 61.719 (60.146)	Top-5 acc 80.078 (81.339)	lr 0.01233
Train [61][1730/3239]	Time 0.234 (1.106)	Data Time 0.001 (0.612)	Loss 2.5889 (2.6486)	Entropy 0.62691 (0.62714)	Top-1 acc 60.156 (60.148)	Top-5 acc 81.641 (81.339)	lr 0.01233
Train [61][1740/3239]	Time 0.243 (1.108)	Data Time 0.001 (0.615)	Loss 2.6248 (2.6487)	Entropy 0.62688 (0.62714)	Top-1 acc 63.281 (60.148)	Top-5 acc 79.688 (81.338)	lr 0.01232
Train [61][1750/3239]	Time 0.237 (1.109)	Data Time 0.001 (0.616)	Loss 2.8458 (2.6489)	Entropy 0.62730 (0.62714)	Top-1 acc 56.641 (60.145)	Top-5 acc 77.344 (81.339)	lr 0.01232
Train [61][1760/3239]	Time 0.250 (1.111)	Data Time 0.001 (0.618)	Loss 2.5211 (2.6489)	Entropy 0.62724 (0.62714)	Top-1 acc 59.375 (60.142)	Top-5 acc 83.203 (81.338)	lr 0.01232
Train [61][1770/3239]	Time 8.273 (1.111)	Data Time 8.000 (0.619)	Loss 2.7507 (2.6487)	Entropy 0.62727 (0.62714)	Top-1 acc 59.375 (60.146)	Top-5 acc 79.297 (81.342)	lr 0.01232
Train [61][1780/3239]	Time 0.245 (1.112)	Data Time 0.002 (0.620)	Loss 2.7357 (2.6488)	Entropy 0.62749 (0.62715)	Top-1 acc 59.375 (60.144)	Top-5 acc 81.641 (81.343)	lr 0.01232
Train [61][1790/3239]	Time 0.238 (1.113)	Data Time 0.001 (0.622)	Loss 2.6045 (2.6485)	Entropy 0.62776 (0.62715)	Top-1 acc 58.984 (60.150)	Top-5 acc 85.938 (81.349)	lr 0.01232
Train [61][1800/3239]	Time 0.242 (1.109)	Data Time 0.001 (0.618)	Loss 2.7479 (2.6488)	Entropy 0.62812 (0.62715)	Top-1 acc 57.422 (60.140)	Top-5 acc 81.250 (81.346)	lr 0.01232
Train [61][1810/3239]	Time 0.245 (1.115)	Data Time 0.001 (0.624)	Loss 3.0904 (2.6492)	Entropy 0.62846 (0.62716)	Top-1 acc 49.609 (60.131)	Top-5 acc 72.266 (81.333)	lr 0.01232
Train [61][1820/3239]	Time 0.256 (1.116)	Data Time 0.001 (0.625)	Loss 2.5476 (2.6491)	Entropy 0.62844 (0.62716)	Top-1 acc 63.281 (60.133)	Top-5 acc 80.859 (81.332)	lr 0.01232
Train [61][1830/3239]	Time 0.226 (1.112)	Data Time 0.001 (0.622)	Loss 2.6585 (2.6488)	Entropy 0.62833 (0.62717)	Top-1 acc 60.938 (60.139)	Top-5 acc 83.203 (81.340)	lr 0.01232
Train [61][1840/3239]	Time 4.784 (1.119)	Data Time 4.520 (0.630)	Loss 2.5778 (2.6488)	Entropy 0.62836 (0.62718)	Top-1 acc 62.109 (60.142)	Top-5 acc 82.422 (81.335)	lr 0.01231
Train [61][1850/3239]	Time 0.343 (1.115)	Data Time 0.001 (0.626)	Loss 2.5262 (2.6489)	Entropy 0.62853 (0.62718)	Top-1 acc 63.281 (60.137)	Top-5 acc 83.203 (81.335)	lr 0.01231
Train [61][1860/3239]	Time 0.234 (1.115)	Data Time 0.001 (0.627)	Loss 2.4190 (2.6486)	Entropy 0.62882 (0.62719)	Top-1 acc 64.844 (60.141)	Top-5 acc 88.672 (81.338)	lr 0.01231
Train [61][1870/3239]	Time 0.249 (1.120)	Data Time 0.001 (0.631)	Loss 2.5288 (2.6484)	Entropy 0.62881 (0.62720)	Top-1 acc 62.109 (60.144)	Top-5 acc 83.594 (81.340)	lr 0.01231
Train [61][1880/3239]	Time 0.240 (1.117)	Data Time 0.001 (0.629)	Loss 2.7614 (2.6488)	Entropy 0.62882 (0.62721)	Top-1 acc 55.859 (60.136)	Top-5 acc 81.641 (81.331)	lr 0.01231
Train [61][1890/3239]	Time 0.250 (1.117)	Data Time 0.002 (0.629)	Loss 2.7070 (2.6490)	Entropy 0.62897 (0.62722)	Top-1 acc 58.203 (60.134)	Top-5 acc 77.344 (81.330)	lr 0.01231
Train [61][1900/3239]	Time 0.242 (1.117)	Data Time 0.001 (0.629)	Loss 2.6815 (2.6491)	Entropy 0.62890 (0.62723)	Top-1 acc 58.594 (60.133)	Top-5 acc 79.688 (81.323)	lr 0.01231
Train [61][1910/3239]	Time 0.250 (1.115)	Data Time 0.002 (0.628)	Loss 2.4599 (2.6487)	Entropy 0.62910 (0.62724)	Top-1 acc 66.406 (60.145)	Top-5 acc 83.203 (81.326)	lr 0.01231
Train [61][1920/3239]	Time 0.354 (1.113)	Data Time 0.001 (0.626)	Loss 2.6872 (2.6486)	Entropy 0.62918 (0.62725)	Top-1 acc 60.938 (60.151)	Top-5 acc 79.688 (81.327)	lr 0.01231
Train [61][1930/3239]	Time 9.837 (1.114)	Data Time 9.551 (0.628)	Loss 2.6464 (2.6488)	Entropy 0.62903 (0.62726)	Top-1 acc 59.766 (60.149)	Top-5 acc 82.812 (81.325)	lr 0.01231
Train [61][1940/3239]	Time 0.246 (1.113)	Data Time 0.001 (0.627)	Loss 2.7222 (2.6486)	Entropy 0.62905 (0.62727)	Top-1 acc 58.203 (60.153)	Top-5 acc 82.422 (81.329)	lr 0.01230
Train [61][1950/3239]	Time 0.247 (1.115)	Data Time 0.001 (0.629)	Loss 2.4918 (2.6487)	Entropy 0.62931 (0.62727)	Top-1 acc 60.938 (60.147)	Top-5 acc 83.984 (81.325)	lr 0.01230
Train [61][1960/3239]	Time 0.253 (1.111)	Data Time 0.001 (0.626)	Loss 2.5214 (2.6487)	Entropy 0.62932 (0.62728)	Top-1 acc 63.672 (60.145)	Top-5 acc 81.250 (81.322)	lr 0.01230
Train [61][1970/3239]	Time 0.231 (1.118)	Data Time 0.001 (0.633)	Loss 2.5483 (2.6487)	Entropy 0.62886 (0.62729)	Top-1 acc 63.281 (60.149)	Top-5 acc 82.812 (81.320)	lr 0.01230
Train [61][1980/3239]	Time 0.239 (1.118)	Data Time 0.001 (0.634)	Loss 2.5559 (2.6488)	Entropy 0.62893 (0.62730)	Top-1 acc 61.719 (60.148)	Top-5 acc 80.469 (81.317)	lr 0.01230
Train [61][1990/3239]	Time 0.234 (1.115)	Data Time 0.001 (0.631)	Loss 2.7887 (2.6487)	Entropy 0.62895 (0.62731)	Top-1 acc 56.641 (60.152)	Top-5 acc 78.906 (81.319)	lr 0.01230
Train [61][2000/3239]	Time 2.584 (1.120)	Data Time 2.343 (0.636)	Loss 2.6221 (2.6483)	Entropy 0.62896 (0.62732)	Top-1 acc 57.031 (60.153)	Top-5 acc 83.203 (81.330)	lr 0.01230
Train [61][2010/3239]	Time 0.329 (1.116)	Data Time 0.001 (0.633)	Loss 2.5484 (2.6483)	Entropy 0.62867 (0.62733)	Top-1 acc 61.719 (60.155)	Top-5 acc 83.594 (81.335)	lr 0.01230
Train [61][2020/3239]	Time 0.292 (1.118)	Data Time 0.001 (0.635)	Loss 2.6868 (2.6482)	Entropy 0.62885 (0.62733)	Top-1 acc 57.812 (60.156)	Top-5 acc 80.469 (81.332)	lr 0.01230
Train [61][2030/3239]	Time 0.234 (1.122)	Data Time 0.002 (0.640)	Loss 2.6153 (2.6481)	Entropy 0.62875 (0.62734)	Top-1 acc 58.984 (60.155)	Top-5 acc 82.422 (81.335)	lr 0.01229
Train [61][2040/3239]	Time 0.239 (1.120)	Data Time 0.001 (0.637)	Loss 2.6019 (2.6479)	Entropy 0.62875 (0.62735)	Top-1 acc 56.641 (60.154)	Top-5 acc 83.594 (81.338)	lr 0.01229
Train [61][2050/3239]	Time 0.223 (1.121)	Data Time 0.001 (0.639)	Loss 2.8587 (2.6486)	Entropy 0.62881 (0.62735)	Top-1 acc 55.859 (60.137)	Top-5 acc 77.344 (81.325)	lr 0.01229
Train [61][2060/3239]	Time 0.246 (1.121)	Data Time 0.001 (0.639)	Loss 2.6604 (2.6486)	Entropy 0.62850 (0.62736)	Top-1 acc 60.156 (60.139)	Top-5 acc 79.297 (81.325)	lr 0.01229
Train [61][2070/3239]	Time 0.347 (1.134)	Data Time 0.005 (0.636)	Loss 2.4288 (2.6483)	Entropy 0.62849 (0.62736)	Top-1 acc 66.016 (60.146)	Top-5 acc 85.547 (81.333)	lr 0.01229
Train [61][2080/3239]	Time 0.325 (1.131)	Data Time 0.002 (0.633)	Loss 2.5560 (2.6482)	Entropy 0.62840 (0.62737)	Top-1 acc 65.234 (60.150)	Top-5 acc 83.594 (81.331)	lr 0.01229
Train [61][2090/3239]	Time 0.248 (1.127)	Data Time 0.002 (0.630)	Loss 2.6611 (2.6482)	Entropy 0.62874 (0.62738)	Top-1 acc 60.547 (60.149)	Top-5 acc 79.688 (81.331)	lr 0.01229
Train [61][2100/3239]	Time 0.244 (1.124)	Data Time 0.001 (0.627)	Loss 2.6472 (2.6481)	Entropy 0.62872 (0.62738)	Top-1 acc 60.938 (60.150)	Top-5 acc 80.859 (81.333)	lr 0.01229
Train [61][2110/3239]	Time 0.242 (1.121)	Data Time 0.001 (0.624)	Loss 2.5991 (2.6481)	Entropy 0.62856 (0.62739)	Top-1 acc 60.938 (60.147)	Top-5 acc 83.594 (81.336)	lr 0.01229
Train [61][2120/3239]	Time 0.256 (1.117)	Data Time 0.001 (0.621)	Loss 2.5776 (2.6479)	Entropy 0.62874 (0.62739)	Top-1 acc 59.766 (60.154)	Top-5 acc 85.156 (81.341)	lr 0.01229
Train [61][2130/3239]	Time 0.240 (1.114)	Data Time 0.002 (0.618)	Loss 2.7295 (2.6479)	Entropy 0.62887 (0.62740)	Top-1 acc 63.281 (60.158)	Top-5 acc 78.125 (81.339)	lr 0.01228
Train [61][2140/3239]	Time 0.234 (1.111)	Data Time 0.001 (0.615)	Loss 2.6281 (2.6479)	Entropy 0.62916 (0.62741)	Top-1 acc 64.062 (60.157)	Top-5 acc 81.250 (81.340)	lr 0.01228
Train [61][2150/3239]	Time 0.234 (1.108)	Data Time 0.001 (0.612)	Loss 2.6489 (2.6482)	Entropy 0.62916 (0.62742)	Top-1 acc 56.641 (60.144)	Top-5 acc 81.641 (81.337)	lr 0.01228
Train [61][2160/3239]	Time 0.504 (1.105)	Data Time 0.254 (0.610)	Loss 2.5954 (2.6481)	Entropy 0.62908 (0.62742)	Top-1 acc 58.984 (60.142)	Top-5 acc 82.422 (81.338)	lr 0.01228
Train [61][2170/3239]	Time 0.374 (1.107)	Data Time 0.001 (0.611)	Loss 2.6149 (2.6483)	Entropy 0.62903 (0.62743)	Top-1 acc 60.938 (60.136)	Top-5 acc 82.422 (81.332)	lr 0.01228
Train [61][2180/3239]	Time 1.045 (1.108)	Data Time 0.790 (0.613)	Loss 2.6416 (2.6485)	Entropy 0.62907 (0.62744)	Top-1 acc 59.766 (60.137)	Top-5 acc 83.203 (81.329)	lr 0.01228
Train [61][2190/3239]	Time 1.442 (1.108)	Data Time 1.180 (0.614)	Loss 2.5744 (2.6484)	Entropy 0.62910 (0.62745)	Top-1 acc 64.453 (60.136)	Top-5 acc 83.203 (81.330)	lr 0.01228
Train [61][2200/3239]	Time 2.713 (1.108)	Data Time 2.461 (0.614)	Loss 2.8528 (2.6487)	Entropy 0.62899 (0.62746)	Top-1 acc 53.125 (60.131)	Top-5 acc 77.734 (81.328)	lr 0.01228
Train [61][2210/3239]	Time 0.239 (1.109)	Data Time 0.001 (0.616)	Loss 2.5318 (2.6487)	Entropy 0.62907 (0.62746)	Top-1 acc 61.719 (60.128)	Top-5 acc 83.594 (81.325)	lr 0.01228
Train [61][2220/3239]	Time 0.249 (1.111)	Data Time 0.001 (0.618)	Loss 2.6365 (2.6485)	Entropy 0.62893 (0.62747)	Top-1 acc 60.156 (60.130)	Top-5 acc 80.859 (81.328)	lr 0.01228
Train [61][2230/3239]	Time 0.233 (1.110)	Data Time 0.001 (0.616)	Loss 2.6413 (2.6487)	Entropy 0.62889 (0.62748)	Top-1 acc 61.719 (60.123)	Top-5 acc 80.859 (81.323)	lr 0.01227
Train [61][2240/3239]	Time 8.878 (1.113)	Data Time 8.522 (0.620)	Loss 2.6278 (2.6485)	Entropy 0.62891 (0.62748)	Top-1 acc 60.156 (60.121)	Top-5 acc 79.297 (81.328)	lr 0.01227
Train [61][2250/3239]	Time 0.247 (1.114)	Data Time 0.001 (0.621)	Loss 2.6469 (2.6486)	Entropy 0.62900 (0.62749)	Top-1 acc 61.328 (60.118)	Top-5 acc 80.078 (81.328)	lr 0.01227
Train [61][2260/3239]	Time 0.354 (1.111)	Data Time 0.114 (0.618)	Loss 2.5958 (2.6487)	Entropy 0.62916 (0.62750)	Top-1 acc 59.766 (60.114)	Top-5 acc 82.422 (81.327)	lr 0.01227
Train [61][2270/3239]	Time 0.227 (1.112)	Data Time 0.001 (0.620)	Loss 2.5173 (2.6487)	Entropy 0.62882 (0.62750)	Top-1 acc 63.672 (60.117)	Top-5 acc 83.984 (81.327)	lr 0.01227
Train [61][2280/3239]	Time 0.217 (1.116)	Data Time 0.001 (0.624)	Loss 2.5488 (2.6487)	Entropy 0.62905 (0.62751)	Top-1 acc 60.938 (60.117)	Top-5 acc 85.156 (81.331)	lr 0.01227
Train [61][2290/3239]	Time 0.240 (1.113)	Data Time 0.001 (0.622)	Loss 2.5326 (2.6484)	Entropy 0.62911 (0.62752)	Top-1 acc 60.938 (60.126)	Top-5 acc 83.203 (81.334)	lr 0.01227
Train [61][2300/3239]	Time 2.633 (1.113)	Data Time 2.324 (0.622)	Loss 2.5136 (2.6482)	Entropy 0.62937 (0.62752)	Top-1 acc 68.359 (60.129)	Top-5 acc 82.422 (81.338)	lr 0.01227
Train [61][2310/3239]	Time 3.590 (1.117)	Data Time 3.356 (0.626)	Loss 2.6026 (2.6481)	Entropy 0.62914 (0.62753)	Top-1 acc 60.547 (60.131)	Top-5 acc 81.641 (81.340)	lr 0.01227
Train [61][2320/3239]	Time 0.244 (1.115)	Data Time 0.001 (0.625)	Loss 2.7539 (2.6478)	Entropy 0.62912 (0.62754)	Top-1 acc 56.250 (60.138)	Top-5 acc 79.297 (81.346)	lr 0.01227
Train [61][2330/3239]	Time 0.259 (1.114)	Data Time 0.001 (0.624)	Loss 2.4978 (2.6478)	Entropy 0.62879 (0.62754)	Top-1 acc 64.453 (60.135)	Top-5 acc 84.375 (81.348)	lr 0.01226
Train [61][2340/3239]	Time 0.250 (1.116)	Data Time 0.001 (0.626)	Loss 2.5867 (2.6479)	Entropy 0.62878 (0.62755)	Top-1 acc 62.109 (60.134)	Top-5 acc 82.422 (81.349)	lr 0.01226
Train [61][2350/3239]	Time 0.248 (1.117)	Data Time 0.001 (0.628)	Loss 2.7295 (2.6479)	Entropy 0.62859 (0.62755)	Top-1 acc 58.594 (60.138)	Top-5 acc 80.469 (81.350)	lr 0.01226
Train [61][2360/3239]	Time 0.236 (1.115)	Data Time 0.001 (0.626)	Loss 2.9782 (2.6482)	Entropy 0.62860 (0.62756)	Top-1 acc 54.688 (60.133)	Top-5 acc 75.781 (81.344)	lr 0.01226
Train [61][2370/3239]	Time 0.234 (1.117)	Data Time 0.001 (0.628)	Loss 2.8482 (2.6483)	Entropy 0.62888 (0.62756)	Top-1 acc 54.688 (60.128)	Top-5 acc 82.031 (81.348)	lr 0.01226
Train [61][2380/3239]	Time 0.236 (1.120)	Data Time 0.001 (0.631)	Loss 2.5738 (2.6481)	Entropy 0.62917 (0.62757)	Top-1 acc 59.375 (60.133)	Top-5 acc 85.156 (81.351)	lr 0.01226
Train [61][2390/3239]	Time 0.231 (1.117)	Data Time 0.001 (0.629)	Loss 2.7358 (2.6482)	Entropy 0.62923 (0.62757)	Top-1 acc 54.688 (60.132)	Top-5 acc 80.469 (81.348)	lr 0.01226
Train [61][2400/3239]	Time 2.170 (1.119)	Data Time 1.816 (0.631)	Loss 2.5758 (2.6480)	Entropy 0.62931 (0.62758)	Top-1 acc 62.500 (60.133)	Top-5 acc 81.250 (81.350)	lr 0.01226
Train [61][2410/3239]	Time 0.234 (1.122)	Data Time 0.001 (0.634)	Loss 2.7121 (2.6481)	Entropy 0.62903 (0.62759)	Top-1 acc 60.156 (60.132)	Top-5 acc 80.469 (81.347)	lr 0.01226
Train [61][2420/3239]	Time 0.243 (1.119)	Data Time 0.001 (0.632)	Loss 2.6317 (2.6480)	Entropy 0.62931 (0.62759)	Top-1 acc 62.500 (60.138)	Top-5 acc 80.469 (81.348)	lr 0.01226
Train [61][2430/3239]	Time 4.084 (1.120)	Data Time 3.841 (0.632)	Loss 2.6017 (2.6481)	Entropy 0.62935 (0.62760)	Top-1 acc 60.547 (60.133)	Top-5 acc 83.594 (81.346)	lr 0.01225
Train [61][2440/3239]	Time 3.633 (1.122)	Data Time 3.360 (0.635)	Loss 2.6974 (2.6484)	Entropy 0.62973 (0.62761)	Top-1 acc 57.812 (60.129)	Top-5 acc 79.688 (81.336)	lr 0.01225
Train [61][2450/3239]	Time 0.231 (1.119)	Data Time 0.001 (0.633)	Loss 2.7308 (2.6486)	Entropy 0.62993 (0.62762)	Top-1 acc 58.984 (60.122)	Top-5 acc 78.516 (81.330)	lr 0.01225
Train [61][2460/3239]	Time 5.980 (1.120)	Data Time 5.686 (0.633)	Loss 2.9493 (2.6489)	Entropy 0.63007 (0.62763)	Top-1 acc 53.516 (60.117)	Top-5 acc 77.734 (81.324)	lr 0.01225
Train [61][2470/3239]	Time 0.368 (1.122)	Data Time 0.001 (0.636)	Loss 2.6641 (2.6490)	Entropy 0.63006 (0.62764)	Top-1 acc 61.328 (60.115)	Top-5 acc 78.125 (81.323)	lr 0.01225
Train [61][2480/3239]	Time 0.238 (1.122)	Data Time 0.001 (0.636)	Loss 2.6357 (2.6488)	Entropy 0.62963 (0.62765)	Top-1 acc 60.547 (60.115)	Top-5 acc 80.859 (81.324)	lr 0.01225
Train [61][2490/3239]	Time 0.244 (1.119)	Data Time 0.001 (0.633)	Loss 2.5679 (2.6489)	Entropy 0.62969 (0.62765)	Top-1 acc 60.156 (60.109)	Top-5 acc 85.156 (81.325)	lr 0.01225
Train [61][2500/3239]	Time 0.241 (1.121)	Data Time 0.001 (0.636)	Loss 2.7537 (2.6492)	Entropy 0.62964 (0.62766)	Top-1 acc 60.547 (60.106)	Top-5 acc 78.516 (81.319)	lr 0.01225
Train [61][2510/3239]	Time 0.252 (1.124)	Data Time 0.001 (0.639)	Loss 2.7325 (2.6490)	Entropy 0.62952 (0.62767)	Top-1 acc 60.156 (60.111)	Top-5 acc 79.688 (81.324)	lr 0.01225
Train [61][2520/3239]	Time 0.241 (1.121)	Data Time 0.001 (0.636)	Loss 2.9339 (2.6492)	Entropy 0.62966 (0.62768)	Top-1 acc 55.469 (60.108)	Top-5 acc 74.609 (81.316)	lr 0.01225
Train [61][2530/3239]	Time 0.243 (1.123)	Data Time 0.001 (0.638)	Loss 2.6108 (2.6493)	Entropy 0.62964 (0.62769)	Top-1 acc 63.281 (60.108)	Top-5 acc 80.078 (81.315)	lr 0.01224
Train [61][2540/3239]	Time 0.231 (1.125)	Data Time 0.001 (0.641)	Loss 2.7359 (2.6493)	Entropy 0.62955 (0.62769)	Top-1 acc 58.594 (60.107)	Top-5 acc 77.344 (81.315)	lr 0.01224
Train [61][2550/3239]	Time 0.235 (1.122)	Data Time 0.001 (0.638)	Loss 2.5891 (2.6492)	Entropy 0.62886 (0.62770)	Top-1 acc 60.547 (60.107)	Top-5 acc 82.031 (81.316)	lr 0.01224
Train [61][2560/3239]	Time 0.322 (1.123)	Data Time 0.001 (0.639)	Loss 2.5943 (2.6491)	Entropy 0.62884 (0.62770)	Top-1 acc 64.062 (60.109)	Top-5 acc 81.641 (81.317)	lr 0.01224
Train [61][2570/3239]	Time 0.223 (1.125)	Data Time 0.001 (0.642)	Loss 2.8512 (2.6493)	Entropy 0.62832 (0.62771)	Top-1 acc 58.203 (60.106)	Top-5 acc 76.172 (81.314)	lr 0.01224
Train [61][2580/3239]	Time 0.238 (1.124)	Data Time 0.001 (0.641)	Loss 2.6633 (2.6495)	Entropy 0.62788 (0.62771)	Top-1 acc 55.859 (60.098)	Top-5 acc 82.422 (81.308)	lr 0.01224
Train [61][2590/3239]	Time 0.238 (1.124)	Data Time 0.001 (0.641)	Loss 2.5019 (2.6498)	Entropy 0.62795 (0.62771)	Top-1 acc 62.891 (60.093)	Top-5 acc 85.547 (81.303)	lr 0.01224
Train [61][2600/3239]	Time 10.397 (1.128)	Data Time 10.146 (0.646)	Loss 2.7664 (2.6499)	Entropy 0.62807 (0.62771)	Top-1 acc 57.031 (60.089)	Top-5 acc 77.344 (81.302)	lr 0.01224
Train [61][2610/3239]	Time 0.244 (1.126)	Data Time 0.001 (0.643)	Loss 2.4320 (2.6498)	Entropy 0.62829 (0.62771)	Top-1 acc 61.328 (60.090)	Top-5 acc 83.984 (81.305)	lr 0.01224
Train [61][2620/3239]	Time 5.121 (1.125)	Data Time 4.857 (0.643)	Loss 2.5793 (2.6497)	Entropy 0.62824 (0.62771)	Top-1 acc 62.891 (60.091)	Top-5 acc 79.297 (81.304)	lr 0.01224
Train [61][2630/3239]	Time 0.333 (1.126)	Data Time 0.001 (0.644)	Loss 2.5769 (2.6495)	Entropy 0.62874 (0.62772)	Top-1 acc 61.328 (60.095)	Top-5 acc 81.641 (81.308)	lr 0.01223
Train [61][2640/3239]	Time 0.248 (1.127)	Data Time 0.001 (0.646)	Loss 2.5666 (2.6492)	Entropy 0.62881 (0.62772)	Top-1 acc 62.891 (60.101)	Top-5 acc 81.641 (81.314)	lr 0.01223
Train [61][2650/3239]	Time 0.243 (1.125)	Data Time 0.001 (0.643)	Loss 2.7909 (2.6493)	Entropy 0.62897 (0.62773)	Top-1 acc 60.938 (60.101)	Top-5 acc 78.906 (81.314)	lr 0.01223
Train [61][2660/3239]	Time 0.237 (1.127)	Data Time 0.001 (0.645)	Loss 2.5856 (2.6491)	Entropy 0.62914 (0.62773)	Top-1 acc 62.109 (60.105)	Top-5 acc 79.297 (81.317)	lr 0.01223
Train [61][2670/3239]	Time 0.231 (1.128)	Data Time 0.001 (0.647)	Loss 2.9425 (2.6492)	Entropy 0.62908 (0.62774)	Top-1 acc 55.469 (60.099)	Top-5 acc 76.562 (81.316)	lr 0.01223
Train [61][2680/3239]	Time 0.240 (1.125)	Data Time 0.001 (0.644)	Loss 2.7054 (2.6491)	Entropy 0.62859 (0.62774)	Top-1 acc 56.641 (60.103)	Top-5 acc 82.031 (81.320)	lr 0.01223
Train [61][2690/3239]	Time 0.247 (1.128)	Data Time 0.002 (0.647)	Loss 2.6175 (2.6491)	Entropy 0.62842 (0.62774)	Top-1 acc 63.281 (60.104)	Top-5 acc 83.594 (81.320)	lr 0.01223
Train [61][2700/3239]	Time 0.253 (1.129)	Data Time 0.001 (0.649)	Loss 2.5130 (2.6493)	Entropy 0.62885 (0.62775)	Top-1 acc 62.500 (60.104)	Top-5 acc 84.375 (81.319)	lr 0.01223
Train [61][2710/3239]	Time 0.256 (1.128)	Data Time 0.001 (0.647)	Loss 2.6498 (2.6493)	Entropy 0.62865 (0.62775)	Top-1 acc 60.938 (60.103)	Top-5 acc 79.688 (81.315)	lr 0.01223
Train [61][2720/3239]	Time 3.120 (1.126)	Data Time 2.776 (0.646)	Loss 2.6934 (2.6491)	Entropy 0.62882 (0.62775)	Top-1 acc 57.812 (60.110)	Top-5 acc 81.250 (81.321)	lr 0.01223
Train [61][2730/3239]	Time 0.394 (1.141)	Data Time 0.035 (0.649)	Loss 2.5457 (2.6491)	Entropy 0.62866 (0.62776)	Top-1 acc 62.891 (60.108)	Top-5 acc 81.250 (81.321)	lr 0.01222
Train [61][2740/3239]	Time 0.261 (1.139)	Data Time 0.002 (0.646)	Loss 2.7606 (2.6492)	Entropy 0.62862 (0.62776)	Top-1 acc 57.031 (60.109)	Top-5 acc 79.688 (81.319)	lr 0.01222
Train [61][2750/3239]	Time 0.241 (1.136)	Data Time 0.001 (0.644)	Loss 2.6818 (2.6494)	Entropy 0.62839 (0.62776)	Top-1 acc 60.547 (60.103)	Top-5 acc 82.031 (81.318)	lr 0.01222
Train [61][2760/3239]	Time 0.237 (1.134)	Data Time 0.001 (0.642)	Loss 2.6379 (2.6491)	Entropy 0.62838 (0.62777)	Top-1 acc 58.203 (60.110)	Top-5 acc 82.031 (81.326)	lr 0.01222
Train [61][2770/3239]	Time 0.254 (1.131)	Data Time 0.001 (0.639)	Loss 2.7650 (2.6492)	Entropy 0.62861 (0.62777)	Top-1 acc 57.031 (60.107)	Top-5 acc 77.344 (81.325)	lr 0.01222
Train [61][2780/3239]	Time 0.261 (1.129)	Data Time 0.001 (0.637)	Loss 2.4972 (2.6492)	Entropy 0.62871 (0.62777)	Top-1 acc 62.500 (60.107)	Top-5 acc 85.938 (81.325)	lr 0.01222
Train [61][2790/3239]	Time 0.357 (1.131)	Data Time 0.001 (0.640)	Loss 2.5643 (2.6492)	Entropy 0.62879 (0.62778)	Top-1 acc 65.234 (60.109)	Top-5 acc 82.812 (81.324)	lr 0.01222
Train [61][2800/3239]	Time 0.240 (1.130)	Data Time 0.001 (0.639)	Loss 2.6344 (2.6493)	Entropy 0.62884 (0.62778)	Top-1 acc 60.156 (60.104)	Top-5 acc 83.594 (81.322)	lr 0.01222
Train [61][2810/3239]	Time 0.243 (1.130)	Data Time 0.001 (0.639)	Loss 2.5937 (2.6495)	Entropy 0.62881 (0.62778)	Top-1 acc 60.938 (60.101)	Top-5 acc 82.812 (81.320)	lr 0.01222
Train [61][2820/3239]	Time 0.236 (1.133)	Data Time 0.001 (0.642)	Loss 2.6641 (2.6494)	Entropy 0.62909 (0.62779)	Top-1 acc 57.422 (60.099)	Top-5 acc 80.469 (81.320)	lr 0.01222
Train [61][2830/3239]	Time 0.255 (1.133)	Data Time 0.002 (0.642)	Loss 2.7386 (2.6494)	Entropy 0.62917 (0.62779)	Top-1 acc 58.203 (60.100)	Top-5 acc 79.688 (81.319)	lr 0.01221
Train [61][2840/3239]	Time 0.241 (1.132)	Data Time 0.001 (0.642)	Loss 2.7691 (2.6497)	Entropy 0.62926 (0.62780)	Top-1 acc 57.031 (60.092)	Top-5 acc 78.516 (81.312)	lr 0.01221
Train [61][2850/3239]	Time 0.247 (1.132)	Data Time 0.001 (0.643)	Loss 2.6619 (2.6498)	Entropy 0.62940 (0.62780)	Top-1 acc 60.938 (60.091)	Top-5 acc 81.250 (81.310)	lr 0.01221
Train [61][2860/3239]	Time 0.260 (1.134)	Data Time 0.001 (0.644)	Loss 2.5922 (2.6499)	Entropy 0.62919 (0.62781)	Top-1 acc 63.281 (60.089)	Top-5 acc 81.641 (81.310)	lr 0.01221
Train [61][2870/3239]	Time 0.217 (1.133)	Data Time 0.001 (0.644)	Loss 2.6302 (2.6498)	Entropy 0.62925 (0.62781)	Top-1 acc 60.938 (60.089)	Top-5 acc 82.031 (81.315)	lr 0.01221
Train [61][2880/3239]	Time 0.319 (1.131)	Data Time 0.001 (0.642)	Loss 2.7075 (2.6497)	Entropy 0.62957 (0.62782)	Top-1 acc 61.719 (60.090)	Top-5 acc 79.688 (81.317)	lr 0.01221
Train [61][2890/3239]	Time 0.237 (1.137)	Data Time 0.001 (0.648)	Loss 2.5330 (2.6497)	Entropy 0.62968 (0.62782)	Top-1 acc 58.984 (60.091)	Top-5 acc 83.203 (81.317)	lr 0.01221
Train [61][2900/3239]	Time 0.236 (1.134)	Data Time 0.001 (0.645)	Loss 2.6705 (2.6496)	Entropy 0.62983 (0.62783)	Top-1 acc 60.156 (60.093)	Top-5 acc 82.812 (81.318)	lr 0.01221
Train [61][2910/3239]	Time 0.231 (1.132)	Data Time 0.001 (0.644)	Loss 2.7199 (2.6499)	Entropy 0.62985 (0.62784)	Top-1 acc 59.375 (60.090)	Top-5 acc 82.812 (81.314)	lr 0.01221
Train [61][2920/3239]	Time 1.934 (1.136)	Data Time 1.688 (0.648)	Loss 2.6133 (2.6501)	Entropy 0.62960 (0.62784)	Top-1 acc 58.984 (60.084)	Top-5 acc 80.859 (81.309)	lr 0.01221
Train [61][2930/3239]	Time 0.258 (1.134)	Data Time 0.001 (0.646)	Loss 2.8700 (2.6502)	Entropy 0.62975 (0.62785)	Top-1 acc 57.812 (60.078)	Top-5 acc 78.125 (81.307)	lr 0.01220
Train [61][2940/3239]	Time 0.229 (1.134)	Data Time 0.001 (0.646)	Loss 2.5517 (2.6501)	Entropy 0.62949 (0.62786)	Top-1 acc 62.891 (60.080)	Top-5 acc 83.594 (81.310)	lr 0.01220
Train [61][2950/3239]	Time 0.357 (1.137)	Data Time 0.001 (0.649)	Loss 2.6374 (2.6500)	Entropy 0.62954 (0.62786)	Top-1 acc 60.156 (60.080)	Top-5 acc 81.641 (81.311)	lr 0.01220
Train [61][2960/3239]	Time 0.248 (1.137)	Data Time 0.001 (0.650)	Loss 2.6534 (2.6498)	Entropy 0.62916 (0.62787)	Top-1 acc 60.938 (60.084)	Top-5 acc 80.859 (81.315)	lr 0.01220
Train [61][2970/3239]	Time 0.242 (1.135)	Data Time 0.001 (0.648)	Loss 2.5481 (2.6499)	Entropy 0.62888 (0.62787)	Top-1 acc 60.938 (60.078)	Top-5 acc 83.594 (81.315)	lr 0.01220
Train [61][2980/3239]	Time 0.243 (1.138)	Data Time 0.001 (0.651)	Loss 2.5827 (2.6499)	Entropy 0.62895 (0.62787)	Top-1 acc 62.500 (60.083)	Top-5 acc 82.422 (81.314)	lr 0.01220
Train [61][2990/3239]	Time 0.245 (1.138)	Data Time 0.001 (0.651)	Loss 2.6090 (2.6498)	Entropy 0.62897 (0.62788)	Top-1 acc 63.281 (60.086)	Top-5 acc 80.469 (81.315)	lr 0.01220
Train [61][3000/3239]	Time 0.245 (1.137)	Data Time 0.001 (0.650)	Loss 2.8240 (2.6500)	Entropy 0.62906 (0.62788)	Top-1 acc 52.734 (60.080)	Top-5 acc 78.125 (81.314)	lr 0.01220
Train [61][3010/3239]	Time 0.233 (1.138)	Data Time 0.001 (0.651)	Loss 2.7767 (2.6499)	Entropy 0.62933 (0.62789)	Top-1 acc 57.812 (60.082)	Top-5 acc 75.391 (81.313)	lr 0.01220
Train [61][3020/3239]	Time 0.643 (1.139)	Data Time 0.390 (0.653)	Loss 2.6211 (2.6499)	Entropy 0.62921 (0.62789)	Top-1 acc 60.547 (60.083)	Top-5 acc 82.422 (81.312)	lr 0.01220
Train [61][3030/3239]	Time 0.227 (1.139)	Data Time 0.001 (0.653)	Loss 2.5580 (2.6497)	Entropy 0.62937 (0.62789)	Top-1 acc 63.672 (60.088)	Top-5 acc 83.203 (81.315)	lr 0.01219
Train [61][3040/3239]	Time 0.229 (1.136)	Data Time 0.001 (0.650)	Loss 2.8155 (2.6496)	Entropy 0.62883 (0.62790)	Top-1 acc 57.031 (60.090)	Top-5 acc 79.688 (81.320)	lr 0.01219
Train [61][3050/3239]	Time 0.263 (1.142)	Data Time 0.001 (0.656)	Loss 2.6244 (2.6496)	Entropy 0.62856 (0.62790)	Top-1 acc 59.766 (60.093)	Top-5 acc 82.031 (81.320)	lr 0.01219
Train [61][3060/3239]	Time 0.249 (1.141)	Data Time 0.002 (0.655)	Loss 2.6315 (2.6495)	Entropy 0.62830 (0.62790)	Top-1 acc 60.156 (60.093)	Top-5 acc 80.469 (81.322)	lr 0.01219
Train [61][3070/3239]	Time 0.233 (1.138)	Data Time 0.001 (0.653)	Loss 2.8807 (2.6495)	Entropy 0.62838 (0.62791)	Top-1 acc 56.250 (60.093)	Top-5 acc 76.172 (81.321)	lr 0.01219
Train [61][3080/3239]	Time 6.523 (1.142)	Data Time 6.271 (0.657)	Loss 2.4455 (2.6494)	Entropy 0.62872 (0.62791)	Top-1 acc 67.188 (60.096)	Top-5 acc 85.547 (81.322)	lr 0.01219
Train [61][3090/3239]	Time 0.238 (1.141)	Data Time 0.001 (0.656)	Loss 2.5901 (2.6494)	Entropy 0.62890 (0.62791)	Top-1 acc 61.328 (60.094)	Top-5 acc 82.031 (81.322)	lr 0.01219
Train [61][3100/3239]	Time 0.229 (1.140)	Data Time 0.001 (0.656)	Loss 3.0410 (2.6493)	Entropy 0.62906 (0.62791)	Top-1 acc 51.953 (60.094)	Top-5 acc 76.562 (81.325)	lr 0.01219
Train [61][3110/3239]	Time 0.336 (1.143)	Data Time 0.001 (0.659)	Loss 2.7216 (2.6492)	Entropy 0.62882 (0.62792)	Top-1 acc 60.156 (60.099)	Top-5 acc 80.078 (81.327)	lr 0.01219
Train [61][3120/3239]	Time 0.236 (1.143)	Data Time 0.001 (0.659)	Loss 2.6753 (2.6493)	Entropy 0.62854 (0.62792)	Top-1 acc 57.812 (60.100)	Top-5 acc 80.078 (81.326)	lr 0.01218
Train [61][3130/3239]	Time 0.247 (1.141)	Data Time 0.001 (0.657)	Loss 2.7927 (2.6494)	Entropy 0.62852 (0.62792)	Top-1 acc 56.641 (60.097)	Top-5 acc 81.250 (81.323)	lr 0.01218
Train [61][3140/3239]	Time 7.690 (1.144)	Data Time 7.425 (0.661)	Loss 2.8203 (2.6495)	Entropy 0.62851 (0.62792)	Top-1 acc 57.422 (60.092)	Top-5 acc 78.516 (81.321)	lr 0.01218
Train [61][3150/3239]	Time 0.232 (1.144)	Data Time 0.001 (0.661)	Loss 2.5346 (2.6493)	Entropy 0.62839 (0.62793)	Top-1 acc 64.062 (60.098)	Top-5 acc 84.375 (81.326)	lr 0.01218
Train [61][3160/3239]	Time 0.221 (1.142)	Data Time 0.001 (0.659)	Loss 2.7414 (2.6495)	Entropy 0.62848 (0.62793)	Top-1 acc 60.938 (60.093)	Top-5 acc 79.688 (81.322)	lr 0.01218
Train [61][3170/3239]	Time 0.245 (1.143)	Data Time 0.001 (0.660)	Loss 2.7559 (2.6496)	Entropy 0.62827 (0.62793)	Top-1 acc 63.672 (60.093)	Top-5 acc 78.906 (81.320)	lr 0.01218
Train [61][3180/3239]	Time 0.326 (1.146)	Data Time 0.000 (0.664)	Loss 2.7476 (2.6496)	Entropy 0.62798 (0.62793)	Top-1 acc 57.031 (60.095)	Top-5 acc 80.078 (81.319)	lr 0.01218
Train [61][3190/3239]	Time 0.237 (1.144)	Data Time 0.000 (0.662)	Loss 2.4404 (2.6497)	Entropy 0.62787 (0.62793)	Top-1 acc 63.672 (60.092)	Top-5 acc 85.156 (81.315)	lr 0.01218
Train [61][3200/3239]	Time 0.234 (1.142)	Data Time 0.000 (0.660)	Loss 2.8621 (2.6498)	Entropy 0.62815 (0.62793)	Top-1 acc 59.766 (60.095)	Top-5 acc 76.562 (81.313)	lr 0.01218
Train [61][3210/3239]	Time 0.231 (1.147)	Data Time 0.000 (0.666)	Loss 2.6159 (2.6497)	Entropy 0.62790 (0.62793)	Top-1 acc 60.938 (60.096)	Top-5 acc 80.078 (81.313)	lr 0.01218
Train [61][3220/3239]	Time 0.230 (1.145)	Data Time 0.000 (0.663)	Loss 2.6990 (2.6497)	Entropy 0.62836 (0.62793)	Top-1 acc 59.766 (60.096)	Top-5 acc 80.078 (81.314)	lr 0.01217
Train [61][3230/3239]	Time 0.228 (1.143)	Data Time 0.000 (0.661)	Loss 2.6740 (2.6495)	Entropy 0.62877 (0.62793)	Top-1 acc 61.719 (60.103)	Top-5 acc 81.641 (81.318)	lr 0.01217
Train [61][3239/3239]	Time 0.913 (1.142)	Data Time 0.000 (0.661)	Loss 3.4395 (2.6495)	Entropy 0.62879 (0.62793)	Top-1 acc 41.975 (60.105)	Top-5 acc 65.432 (81.320)	lr 0.01217
==========Valid [61/120]	loss 1.398	top-1 acc 67.688 (67.769)	top-5 acc 87.507	Train top-1 60.105	top-5 81.320	Entropy 0.62879	Latency-None: 0.000ms	Flops: 538.40M
Train [62][0/3239]	Time 39.541 (39.541)	Data Time 37.428 (37.428)	Loss 2.5017 (2.5017)	Entropy 0.62874 (0.62874)	Top-1 acc 62.500 (62.500)	Top-5 acc 83.203 (83.203)	lr 0.01217
Train [62][10/3239]	Time 0.332 (4.035)	Data Time 0.002 (3.420)	Loss 2.5470 (2.5893)	Entropy 0.62899 (0.62879)	Top-1 acc 59.375 (61.648)	Top-5 acc 83.594 (82.635)	lr 0.01217
Train [62][20/3239]	Time 0.330 (2.333)	Data Time 0.003 (1.792)	Loss 2.8756 (2.5966)	Entropy 0.62910 (0.62893)	Top-1 acc 53.906 (61.347)	Top-5 acc 78.516 (82.478)	lr 0.01217
Train [62][30/3239]	Time 0.266 (1.727)	Data Time 0.002 (1.215)	Loss 2.6238 (2.6177)	Entropy 0.62908 (0.62899)	Top-1 acc 64.062 (61.101)	Top-5 acc 83.594 (82.119)	lr 0.01217
Train [62][40/3239]	Time 0.251 (1.415)	Data Time 0.001 (0.919)	Loss 2.6507 (2.6180)	Entropy 0.62932 (0.62902)	Top-1 acc 57.812 (61.080)	Top-5 acc 82.031 (82.031)	lr 0.01217
Train [62][50/3239]	Time 0.232 (1.234)	Data Time 0.002 (0.740)	Loss 2.7221 (2.6313)	Entropy 0.62939 (0.62909)	Top-1 acc 58.594 (60.761)	Top-5 acc 82.812 (81.771)	lr 0.01217
Train [62][60/3239]	Time 0.235 (1.102)	Data Time 0.001 (0.619)	Loss 2.4587 (2.6340)	Entropy 0.62934 (0.62913)	Top-1 acc 65.625 (60.784)	Top-5 acc 83.203 (81.679)	lr 0.01217
Train [62][70/3239]	Time 0.266 (1.010)	Data Time 0.001 (0.532)	Loss 2.8059 (2.6384)	Entropy 0.62935 (0.62917)	Top-1 acc 60.938 (60.646)	Top-5 acc 79.688 (81.652)	lr 0.01217
Train [62][80/3239]	Time 0.361 (0.944)	Data Time 0.001 (0.466)	Loss 2.6733 (2.6329)	Entropy 0.62963 (0.62920)	Top-1 acc 62.500 (60.827)	Top-5 acc 80.469 (81.752)	lr 0.01216
Train [62][90/3239]	Time 0.244 (0.891)	Data Time 0.001 (0.415)	Loss 2.4405 (2.6364)	Entropy 0.63001 (0.62926)	Top-1 acc 62.891 (60.663)	Top-5 acc 84.375 (81.701)	lr 0.01216
Train [62][100/3239]	Time 0.270 (0.847)	Data Time 0.001 (0.374)	Loss 2.7132 (2.6357)	Entropy 0.62999 (0.62933)	Top-1 acc 58.984 (60.624)	Top-5 acc 78.516 (81.679)	lr 0.01216
Train [62][110/3239]	Time 0.248 (0.812)	Data Time 0.001 (0.341)	Loss 2.6438 (2.6355)	Entropy 0.63029 (0.62940)	Top-1 acc 60.156 (60.529)	Top-5 acc 81.250 (81.627)	lr 0.01216
Train [62][120/3239]	Time 0.322 (0.784)	Data Time 0.002 (0.313)	Loss 2.6604 (2.6389)	Entropy 0.63050 (0.62947)	Top-1 acc 55.859 (60.276)	Top-5 acc 80.859 (81.602)	lr 0.01216
Train [62][130/3239]	Time 0.223 (0.758)	Data Time 0.001 (0.289)	Loss 2.5513 (2.6372)	Entropy 0.63046 (0.62955)	Top-1 acc 60.938 (60.344)	Top-5 acc 84.375 (81.664)	lr 0.01216
Train [62][140/3239]	Time 0.390 (0.977)	Data Time 0.005 (0.269)	Loss 2.6147 (2.6411)	Entropy 0.63010 (0.62959)	Top-1 acc 61.719 (60.259)	Top-5 acc 82.812 (81.605)	lr 0.01216
Train [62][150/3239]	Time 0.241 (0.947)	Data Time 0.002 (0.251)	Loss 2.7871 (2.6407)	Entropy 0.63030 (0.62963)	Top-1 acc 58.984 (60.299)	Top-5 acc 76.953 (81.617)	lr 0.01216
Train [62][160/3239]	Time 0.227 (0.913)	Data Time 0.001 (0.236)	Loss 2.7595 (2.6422)	Entropy 0.63033 (0.62967)	Top-1 acc 57.422 (60.290)	Top-5 acc 81.641 (81.621)	lr 0.01216
Train [62][170/3239]	Time 0.459 (0.887)	Data Time 0.004 (0.222)	Loss 2.4886 (2.6400)	Entropy 0.63022 (0.62970)	Top-1 acc 64.062 (60.387)	Top-5 acc 84.766 (81.677)	lr 0.01216
Train [62][180/3239]	Time 0.265 (0.863)	Data Time 0.001 (0.210)	Loss 2.4928 (2.6388)	Entropy 0.63037 (0.62973)	Top-1 acc 65.234 (60.402)	Top-5 acc 84.375 (81.682)	lr 0.01215
Train [62][190/3239]	Time 0.266 (0.842)	Data Time 0.002 (0.199)	Loss 2.4809 (2.6347)	Entropy 0.63055 (0.62977)	Top-1 acc 62.891 (60.447)	Top-5 acc 83.984 (81.706)	lr 0.01215
Train [62][200/3239]	Time 0.237 (0.825)	Data Time 0.001 (0.189)	Loss 2.9041 (2.6374)	Entropy 0.63071 (0.62981)	Top-1 acc 51.172 (60.374)	Top-5 acc 76.172 (81.679)	lr 0.01215
Train [62][210/3239]	Time 0.285 (0.807)	Data Time 0.001 (0.181)	Loss 2.7612 (2.6354)	Entropy 0.63072 (0.62985)	Top-1 acc 57.422 (60.425)	Top-5 acc 80.469 (81.726)	lr 0.01215
Train [62][220/3239]	Time 0.263 (0.793)	Data Time 0.002 (0.172)	Loss 2.5485 (2.6343)	Entropy 0.63052 (0.62989)	Top-1 acc 62.500 (60.478)	Top-5 acc 80.859 (81.770)	lr 0.01215
Train [62][230/3239]	Time 0.331 (0.778)	Data Time 0.002 (0.165)	Loss 2.6326 (2.6347)	Entropy 0.63087 (0.62992)	Top-1 acc 58.203 (60.493)	Top-5 acc 78.906 (81.737)	lr 0.01215
Train [62][240/3239]	Time 0.392 (0.765)	Data Time 0.002 (0.158)	Loss 2.5813 (2.6328)	Entropy 0.63071 (0.62996)	Top-1 acc 60.547 (60.545)	Top-5 acc 82.031 (81.764)	lr 0.01215
Train [62][250/3239]	Time 0.250 (0.752)	Data Time 0.001 (0.152)	Loss 2.8675 (2.6323)	Entropy 0.63048 (0.62999)	Top-1 acc 55.078 (60.558)	Top-5 acc 76.562 (81.765)	lr 0.01215
Train [62][260/3239]	Time 0.245 (0.740)	Data Time 0.001 (0.146)	Loss 2.7405 (2.6347)	Entropy 0.63069 (0.63001)	Top-1 acc 58.594 (60.509)	Top-5 acc 79.688 (81.705)	lr 0.01215
Train [62][270/3239]	Time 0.248 (0.730)	Data Time 0.001 (0.141)	Loss 2.7956 (2.6334)	Entropy 0.63096 (0.63004)	Top-1 acc 52.344 (60.505)	Top-5 acc 78.125 (81.724)	lr 0.01215
Train [62][280/3239]	Time 0.307 (0.718)	Data Time 0.003 (0.136)	Loss 2.5848 (2.6326)	Entropy 0.63112 (0.63007)	Top-1 acc 59.766 (60.514)	Top-5 acc 80.859 (81.728)	lr 0.01214
Train [62][290/3239]	Time 0.231 (0.710)	Data Time 0.001 (0.131)	Loss 2.8020 (2.6337)	Entropy 0.63112 (0.63011)	Top-1 acc 59.375 (60.507)	Top-5 acc 80.469 (81.694)	lr 0.01214
Train [62][300/3239]	Time 0.285 (0.701)	Data Time 0.001 (0.127)	Loss 2.4088 (2.6333)	Entropy 0.63085 (0.63014)	Top-1 acc 67.188 (60.518)	Top-5 acc 85.938 (81.706)	lr 0.01214
Train [62][310/3239]	Time 0.275 (0.693)	Data Time 0.001 (0.123)	Loss 2.7112 (2.6337)	Entropy 0.63094 (0.63016)	Top-1 acc 56.641 (60.494)	Top-5 acc 80.859 (81.695)	lr 0.01214
Train [62][320/3239]	Time 0.283 (0.686)	Data Time 0.001 (0.119)	Loss 2.7206 (2.6341)	Entropy 0.63072 (0.63018)	Top-1 acc 53.125 (60.450)	Top-5 acc 83.203 (81.708)	lr 0.01214
Train [62][330/3239]	Time 0.363 (0.679)	Data Time 0.001 (0.116)	Loss 2.3827 (2.6343)	Entropy 0.63074 (0.63019)	Top-1 acc 67.578 (60.447)	Top-5 acc 85.156 (81.687)	lr 0.01214
Train [62][340/3239]	Time 0.248 (0.672)	Data Time 0.001 (0.112)	Loss 2.7724 (2.6343)	Entropy 0.63078 (0.63021)	Top-1 acc 55.078 (60.440)	Top-5 acc 80.469 (81.699)	lr 0.01214
Train [62][350/3239]	Time 0.286 (0.666)	Data Time 0.001 (0.109)	Loss 2.4826 (2.6329)	Entropy 0.63091 (0.63023)	Top-1 acc 64.844 (60.483)	Top-5 acc 83.203 (81.717)	lr 0.01214
Train [62][360/3239]	Time 0.298 (0.661)	Data Time 0.001 (0.106)	Loss 2.6146 (2.6355)	Entropy 0.63118 (0.63025)	Top-1 acc 60.547 (60.443)	Top-5 acc 81.641 (81.671)	lr 0.01214
Train [62][370/3239]	Time 0.236 (0.655)	Data Time 0.001 (0.103)	Loss 2.5512 (2.6336)	Entropy 0.63127 (0.63028)	Top-1 acc 60.938 (60.489)	Top-5 acc 85.938 (81.722)	lr 0.01214
Train [62][380/3239]	Time 0.226 (0.649)	Data Time 0.001 (0.101)	Loss 2.9465 (2.6354)	Entropy 0.63122 (0.63030)	Top-1 acc 53.906 (60.433)	Top-5 acc 73.438 (81.692)	lr 0.01213
Train [62][390/3239]	Time 0.264 (0.644)	Data Time 0.002 (0.098)	Loss 2.6796 (2.6343)	Entropy 0.63142 (0.63033)	Top-1 acc 58.203 (60.444)	Top-5 acc 81.250 (81.706)	lr 0.01213
Train [62][400/3239]	Time 0.313 (0.638)	Data Time 0.001 (0.096)	Loss 2.4522 (2.6336)	Entropy 0.63111 (0.63035)	Top-1 acc 65.234 (60.465)	Top-5 acc 85.156 (81.716)	lr 0.01213
Train [62][410/3239]	Time 0.257 (0.633)	Data Time 0.002 (0.094)	Loss 2.6745 (2.6334)	Entropy 0.63100 (0.63037)	Top-1 acc 58.203 (60.469)	Top-5 acc 78.906 (81.707)	lr 0.01213
Train [62][420/3239]	Time 0.226 (0.629)	Data Time 0.002 (0.091)	Loss 2.7605 (2.6339)	Entropy 0.63084 (0.63038)	Top-1 acc 58.594 (60.464)	Top-5 acc 79.688 (81.704)	lr 0.01213
Train [62][430/3239]	Time 0.284 (0.626)	Data Time 0.001 (0.089)	Loss 2.5969 (2.6339)	Entropy 0.63080 (0.63039)	Top-1 acc 62.891 (60.489)	Top-5 acc 82.812 (81.700)	lr 0.01213
Train [62][440/3239]	Time 0.234 (0.624)	Data Time 0.001 (0.087)	Loss 2.5090 (2.6330)	Entropy 0.63072 (0.63040)	Top-1 acc 63.281 (60.496)	Top-5 acc 82.812 (81.720)	lr 0.01213
Train [62][450/3239]	Time 0.228 (0.620)	Data Time 0.001 (0.085)	Loss 2.5457 (2.6333)	Entropy 0.63064 (0.63040)	Top-1 acc 62.500 (60.477)	Top-5 acc 84.766 (81.710)	lr 0.01213
Train [62][460/3239]	Time 0.236 (0.616)	Data Time 0.001 (0.084)	Loss 2.2902 (2.6327)	Entropy 0.63081 (0.63041)	Top-1 acc 70.312 (60.502)	Top-5 acc 87.500 (81.714)	lr 0.01213
Train [62][470/3239]	Time 0.241 (0.612)	Data Time 0.001 (0.082)	Loss 2.6995 (2.6333)	Entropy 0.63064 (0.63042)	Top-1 acc 61.328 (60.510)	Top-5 acc 76.953 (81.684)	lr 0.01213
Train [62][480/3239]	Time 0.276 (0.609)	Data Time 0.002 (0.080)	Loss 2.2571 (2.6309)	Entropy 0.63070 (0.63043)	Top-1 acc 71.875 (60.581)	Top-5 acc 89.062 (81.723)	lr 0.01212
Train [62][490/3239]	Time 0.378 (0.606)	Data Time 0.001 (0.079)	Loss 2.7270 (2.6302)	Entropy 0.63098 (0.63044)	Top-1 acc 60.156 (60.597)	Top-5 acc 79.688 (81.742)	lr 0.01212
Train [62][500/3239]	Time 0.250 (0.602)	Data Time 0.001 (0.077)	Loss 2.6244 (2.6307)	Entropy 0.63082 (0.63045)	Top-1 acc 62.500 (60.587)	Top-5 acc 82.031 (81.724)	lr 0.01212
Train [62][510/3239]	Time 0.257 (0.599)	Data Time 0.002 (0.076)	Loss 2.4569 (2.6296)	Entropy 0.63069 (0.63045)	Top-1 acc 68.359 (60.624)	Top-5 acc 86.719 (81.734)	lr 0.01212
Train [62][520/3239]	Time 0.239 (0.596)	Data Time 0.001 (0.074)	Loss 2.7771 (2.6303)	Entropy 0.63062 (0.63045)	Top-1 acc 57.422 (60.605)	Top-5 acc 78.906 (81.725)	lr 0.01212
Train [62][530/3239]	Time 0.236 (0.593)	Data Time 0.001 (0.073)	Loss 2.6509 (2.6292)	Entropy 0.63096 (0.63046)	Top-1 acc 58.594 (60.612)	Top-5 acc 80.859 (81.751)	lr 0.01212
Train [62][540/3239]	Time 0.245 (0.590)	Data Time 0.002 (0.072)	Loss 2.5352 (2.6281)	Entropy 0.63091 (0.63047)	Top-1 acc 62.109 (60.640)	Top-5 acc 83.984 (81.771)	lr 0.01212
Train [62][550/3239]	Time 0.232 (0.587)	Data Time 0.001 (0.070)	Loss 2.4843 (2.6280)	Entropy 0.63028 (0.63047)	Top-1 acc 66.016 (60.624)	Top-5 acc 83.594 (81.763)	lr 0.01212
Train [62][560/3239]	Time 0.352 (0.584)	Data Time 0.001 (0.069)	Loss 2.6496 (2.6277)	Entropy 0.63012 (0.63047)	Top-1 acc 62.500 (60.642)	Top-5 acc 81.250 (81.771)	lr 0.01212
Train [62][570/3239]	Time 0.302 (0.582)	Data Time 0.002 (0.068)	Loss 2.6898 (2.6280)	Entropy 0.63005 (0.63046)	Top-1 acc 56.641 (60.628)	Top-5 acc 80.469 (81.762)	lr 0.01212
Train [62][580/3239]	Time 0.232 (0.579)	Data Time 0.001 (0.067)	Loss 2.4108 (2.6266)	Entropy 0.62989 (0.63045)	Top-1 acc 64.062 (60.662)	Top-5 acc 85.938 (81.774)	lr 0.01211
Train [62][590/3239]	Time 0.331 (0.577)	Data Time 0.001 (0.066)	Loss 2.5699 (2.6260)	Entropy 0.62979 (0.63044)	Top-1 acc 62.500 (60.659)	Top-5 acc 84.375 (81.789)	lr 0.01211
Train [62][600/3239]	Time 0.253 (0.574)	Data Time 0.002 (0.065)	Loss 2.5892 (2.6257)	Entropy 0.63005 (0.63043)	Top-1 acc 57.812 (60.676)	Top-5 acc 83.203 (81.798)	lr 0.01211
Train [62][610/3239]	Time 0.242 (0.572)	Data Time 0.001 (0.064)	Loss 2.5160 (2.6252)	Entropy 0.62999 (0.63043)	Top-1 acc 61.719 (60.690)	Top-5 acc 81.641 (81.827)	lr 0.01211
Train [62][620/3239]	Time 0.267 (0.570)	Data Time 0.001 (0.063)	Loss 3.2486 (2.6263)	Entropy 0.62954 (0.63042)	Top-1 acc 45.312 (60.669)	Top-5 acc 69.922 (81.814)	lr 0.01211
Train [62][630/3239]	Time 0.247 (0.568)	Data Time 0.001 (0.062)	Loss 2.5943 (2.6269)	Entropy 0.62954 (0.63040)	Top-1 acc 60.938 (60.656)	Top-5 acc 82.422 (81.800)	lr 0.01211
Train [62][640/3239]	Time 0.244 (0.566)	Data Time 0.001 (0.061)	Loss 2.5282 (2.6266)	Entropy 0.62943 (0.63039)	Top-1 acc 64.453 (60.653)	Top-5 acc 83.984 (81.814)	lr 0.01211
Train [62][650/3239]	Time 0.240 (0.564)	Data Time 0.001 (0.060)	Loss 2.5682 (2.6272)	Entropy 0.62962 (0.63038)	Top-1 acc 63.281 (60.649)	Top-5 acc 83.594 (81.801)	lr 0.01211
Train [62][660/3239]	Time 0.244 (0.562)	Data Time 0.001 (0.059)	Loss 2.6320 (2.6272)	Entropy 0.62964 (0.63036)	Top-1 acc 64.453 (60.654)	Top-5 acc 83.203 (81.803)	lr 0.01211
Train [62][670/3239]	Time 0.238 (0.560)	Data Time 0.001 (0.058)	Loss 2.5942 (2.6264)	Entropy 0.62951 (0.63035)	Top-1 acc 62.891 (60.663)	Top-5 acc 82.422 (81.812)	lr 0.01211
Train [62][680/3239]	Time 0.254 (0.559)	Data Time 0.001 (0.057)	Loss 2.6293 (2.6261)	Entropy 0.62956 (0.63034)	Top-1 acc 59.766 (60.670)	Top-5 acc 83.203 (81.818)	lr 0.01210
Train [62][690/3239]	Time 0.259 (0.557)	Data Time 0.001 (0.056)	Loss 2.7963 (2.6265)	Entropy 0.62939 (0.63033)	Top-1 acc 54.297 (60.664)	Top-5 acc 80.469 (81.808)	lr 0.01210
Train [62][700/3239]	Time 0.240 (0.555)	Data Time 0.001 (0.056)	Loss 2.7419 (2.6272)	Entropy 0.62947 (0.63032)	Top-1 acc 58.203 (60.659)	Top-5 acc 81.641 (81.791)	lr 0.01210
Train [62][710/3239]	Time 0.263 (0.553)	Data Time 0.001 (0.055)	Loss 2.6654 (2.6272)	Entropy 0.62946 (0.63031)	Top-1 acc 61.719 (60.655)	Top-5 acc 81.250 (81.791)	lr 0.01210
Train [62][720/3239]	Time 0.324 (0.552)	Data Time 0.001 (0.054)	Loss 2.4726 (2.6266)	Entropy 0.62926 (0.63029)	Top-1 acc 65.234 (60.683)	Top-5 acc 85.156 (81.799)	lr 0.01210
Train [62][730/3239]	Time 0.246 (0.551)	Data Time 0.001 (0.053)	Loss 2.5970 (2.6266)	Entropy 0.62934 (0.63028)	Top-1 acc 63.281 (60.682)	Top-5 acc 81.250 (81.790)	lr 0.01210
Train [62][740/3239]	Time 0.245 (0.549)	Data Time 0.002 (0.053)	Loss 2.5872 (2.6269)	Entropy 0.62943 (0.63027)	Top-1 acc 62.500 (60.686)	Top-5 acc 81.250 (81.783)	lr 0.01210
Train [62][750/3239]	Time 0.277 (0.548)	Data Time 0.002 (0.052)	Loss 2.5117 (2.6276)	Entropy 0.62953 (0.63026)	Top-1 acc 62.500 (60.674)	Top-5 acc 84.766 (81.772)	lr 0.01210
Train [62][760/3239]	Time 0.251 (0.547)	Data Time 0.002 (0.051)	Loss 2.8710 (2.6281)	Entropy 0.62969 (0.63025)	Top-1 acc 54.688 (60.660)	Top-5 acc 75.391 (81.766)	lr 0.01210
Train [62][770/3239]	Time 0.286 (0.546)	Data Time 0.001 (0.051)	Loss 2.6977 (2.6278)	Entropy 0.62972 (0.63024)	Top-1 acc 57.812 (60.663)	Top-5 acc 78.906 (81.773)	lr 0.01210
Train [62][780/3239]	Time 0.236 (0.544)	Data Time 0.001 (0.050)	Loss 2.9252 (2.6284)	Entropy 0.62989 (0.63024)	Top-1 acc 54.688 (60.637)	Top-5 acc 74.219 (81.755)	lr 0.01209
Train [62][790/3239]	Time 0.376 (0.543)	Data Time 0.001 (0.050)	Loss 2.4546 (2.6286)	Entropy 0.63030 (0.63023)	Top-1 acc 62.109 (60.625)	Top-5 acc 86.328 (81.749)	lr 0.01209
Train [62][800/3239]	Time 0.228 (0.585)	Data Time 0.002 (0.049)	Loss 2.6576 (2.6288)	Entropy 0.63011 (0.63024)	Top-1 acc 62.500 (60.620)	Top-5 acc 80.859 (81.735)	lr 0.01209
Train [62][810/3239]	Time 0.251 (0.583)	Data Time 0.002 (0.048)	Loss 2.5609 (2.6290)	Entropy 0.62998 (0.63023)	Top-1 acc 62.109 (60.621)	Top-5 acc 82.031 (81.731)	lr 0.01209
Train [62][820/3239]	Time 0.237 (0.581)	Data Time 0.002 (0.048)	Loss 2.5603 (2.6294)	Entropy 0.62961 (0.63023)	Top-1 acc 62.891 (60.612)	Top-5 acc 83.203 (81.723)	lr 0.01209
Train [62][830/3239]	Time 0.245 (0.579)	Data Time 0.002 (0.047)	Loss 2.4579 (2.6299)	Entropy 0.62973 (0.63022)	Top-1 acc 64.844 (60.604)	Top-5 acc 85.156 (81.724)	lr 0.01209
Train [62][840/3239]	Time 0.246 (0.577)	Data Time 0.001 (0.047)	Loss 2.5753 (2.6300)	Entropy 0.63015 (0.63022)	Top-1 acc 60.547 (60.608)	Top-5 acc 82.031 (81.718)	lr 0.01209
Train [62][850/3239]	Time 0.255 (0.576)	Data Time 0.001 (0.046)	Loss 2.5354 (2.6303)	Entropy 0.62980 (0.63021)	Top-1 acc 62.500 (60.605)	Top-5 acc 80.469 (81.700)	lr 0.01209
Train [62][860/3239]	Time 0.262 (0.575)	Data Time 0.001 (0.046)	Loss 2.5661 (2.6299)	Entropy 0.62959 (0.63021)	Top-1 acc 60.156 (60.600)	Top-5 acc 80.859 (81.701)	lr 0.01209
Train [62][870/3239]	Time 0.287 (0.574)	Data Time 0.002 (0.045)	Loss 2.8390 (2.6309)	Entropy 0.62965 (0.63020)	Top-1 acc 56.250 (60.576)	Top-5 acc 75.781 (81.687)	lr 0.01208
Train [62][880/3239]	Time 0.334 (0.573)	Data Time 0.001 (0.045)	Loss 2.7172 (2.6315)	Entropy 0.62991 (0.63020)	Top-1 acc 60.938 (60.559)	Top-5 acc 82.031 (81.676)	lr 0.01208
Train [62][890/3239]	Time 0.238 (0.571)	Data Time 0.001 (0.044)	Loss 2.4945 (2.6310)	Entropy 0.63029 (0.63020)	Top-1 acc 65.234 (60.567)	Top-5 acc 82.422 (81.687)	lr 0.01208
Train [62][900/3239]	Time 0.247 (0.570)	Data Time 0.001 (0.044)	Loss 2.9107 (2.6310)	Entropy 0.63013 (0.63020)	Top-1 acc 52.734 (60.560)	Top-5 acc 74.219 (81.681)	lr 0.01208
Train [62][910/3239]	Time 0.265 (0.569)	Data Time 0.001 (0.043)	Loss 2.7803 (2.6312)	Entropy 0.63001 (0.63019)	Top-1 acc 58.594 (60.548)	Top-5 acc 77.734 (81.673)	lr 0.01208
Train [62][920/3239]	Time 0.243 (0.567)	Data Time 0.001 (0.043)	Loss 2.7033 (2.6315)	Entropy 0.63028 (0.63019)	Top-1 acc 59.766 (60.547)	Top-5 acc 79.297 (81.669)	lr 0.01208
Train [62][930/3239]	Time 0.229 (0.566)	Data Time 0.001 (0.042)	Loss 2.4679 (2.6305)	Entropy 0.63046 (0.63019)	Top-1 acc 66.406 (60.570)	Top-5 acc 85.156 (81.686)	lr 0.01208
Train [62][940/3239]	Time 0.242 (0.565)	Data Time 0.001 (0.042)	Loss 2.5313 (2.6306)	Entropy 0.63041 (0.63020)	Top-1 acc 58.203 (60.561)	Top-5 acc 82.812 (81.687)	lr 0.01208
Train [62][950/3239]	Time 0.345 (0.563)	Data Time 0.001 (0.041)	Loss 2.4637 (2.6304)	Entropy 0.63054 (0.63020)	Top-1 acc 65.234 (60.567)	Top-5 acc 85.547 (81.687)	lr 0.01208
Train [62][960/3239]	Time 0.237 (0.562)	Data Time 0.001 (0.041)	Loss 2.6121 (2.6301)	Entropy 0.63050 (0.63020)	Top-1 acc 60.156 (60.570)	Top-5 acc 80.078 (81.693)	lr 0.01208
Train [62][970/3239]	Time 0.246 (0.561)	Data Time 0.001 (0.041)	Loss 2.7272 (2.6300)	Entropy 0.63096 (0.63021)	Top-1 acc 58.203 (60.561)	Top-5 acc 81.641 (81.692)	lr 0.01207
Train [62][980/3239]	Time 0.249 (0.560)	Data Time 0.001 (0.040)	Loss 2.6417 (2.6301)	Entropy 0.63077 (0.63021)	Top-1 acc 60.547 (60.558)	Top-5 acc 79.688 (81.689)	lr 0.01207
Train [62][990/3239]	Time 0.237 (0.559)	Data Time 0.001 (0.040)	Loss 2.7032 (2.6304)	Entropy 0.63070 (0.63022)	Top-1 acc 61.328 (60.559)	Top-5 acc 78.516 (81.682)	lr 0.01207
Train [62][1000/3239]	Time 0.270 (0.558)	Data Time 0.001 (0.039)	Loss 2.8129 (2.6308)	Entropy 0.63088 (0.63023)	Top-1 acc 53.906 (60.554)	Top-5 acc 79.297 (81.673)	lr 0.01207
Train [62][1010/3239]	Time 0.281 (0.557)	Data Time 0.001 (0.039)	Loss 2.7009 (2.6316)	Entropy 0.63052 (0.63023)	Top-1 acc 60.156 (60.533)	Top-5 acc 81.250 (81.660)	lr 0.01207
Train [62][1020/3239]	Time 0.233 (0.556)	Data Time 0.001 (0.039)	Loss 2.7472 (2.6318)	Entropy 0.63089 (0.63024)	Top-1 acc 58.203 (60.538)	Top-5 acc 78.906 (81.656)	lr 0.01207
Train [62][1030/3239]	Time 0.231 (0.555)	Data Time 0.001 (0.038)	Loss 2.5815 (2.6317)	Entropy 0.63080 (0.63024)	Top-1 acc 60.156 (60.537)	Top-5 acc 82.031 (81.659)	lr 0.01207
Train [62][1040/3239]	Time 0.403 (0.554)	Data Time 0.001 (0.038)	Loss 2.4211 (2.6315)	Entropy 0.63109 (0.63025)	Top-1 acc 65.234 (60.526)	Top-5 acc 85.547 (81.665)	lr 0.01207
Train [62][1050/3239]	Time 0.255 (0.553)	Data Time 0.002 (0.038)	Loss 2.5759 (2.6313)	Entropy 0.63095 (0.63026)	Top-1 acc 64.844 (60.536)	Top-5 acc 82.422 (81.673)	lr 0.01207
Train [62][1060/3239]	Time 0.226 (0.552)	Data Time 0.001 (0.037)	Loss 2.5249 (2.6317)	Entropy 0.63152 (0.63026)	Top-1 acc 62.891 (60.531)	Top-5 acc 85.156 (81.671)	lr 0.01207
Train [62][1070/3239]	Time 0.253 (0.551)	Data Time 0.001 (0.037)	Loss 2.5610 (2.6315)	Entropy 0.63096 (0.63027)	Top-1 acc 61.719 (60.539)	Top-5 acc 83.594 (81.677)	lr 0.01206
Train [62][1080/3239]	Time 0.222 (0.550)	Data Time 0.001 (0.037)	Loss 2.6758 (2.6320)	Entropy 0.63045 (0.63028)	Top-1 acc 56.250 (60.527)	Top-5 acc 79.297 (81.661)	lr 0.01206
Train [62][1090/3239]	Time 0.249 (0.549)	Data Time 0.001 (0.036)	Loss 2.7473 (2.6321)	Entropy 0.63010 (0.63028)	Top-1 acc 62.500 (60.525)	Top-5 acc 80.469 (81.659)	lr 0.01206
Train [62][1100/3239]	Time 0.235 (0.548)	Data Time 0.001 (0.036)	Loss 2.6626 (2.6319)	Entropy 0.62982 (0.63028)	Top-1 acc 59.766 (60.541)	Top-5 acc 80.859 (81.653)	lr 0.01206
Train [62][1110/3239]	Time 0.388 (0.547)	Data Time 0.001 (0.036)	Loss 2.6952 (2.6314)	Entropy 0.63017 (0.63027)	Top-1 acc 59.766 (60.545)	Top-5 acc 80.859 (81.666)	lr 0.01206
Train [62][1120/3239]	Time 0.278 (0.546)	Data Time 0.002 (0.035)	Loss 2.6003 (2.6316)	Entropy 0.63034 (0.63027)	Top-1 acc 63.281 (60.544)	Top-5 acc 83.203 (81.659)	lr 0.01206
Train [62][1130/3239]	Time 0.258 (0.545)	Data Time 0.001 (0.035)	Loss 2.6473 (2.6316)	Entropy 0.63019 (0.63027)	Top-1 acc 58.203 (60.540)	Top-5 acc 82.422 (81.657)	lr 0.01206
Train [62][1140/3239]	Time 0.242 (0.544)	Data Time 0.001 (0.035)	Loss 2.4255 (2.6314)	Entropy 0.63014 (0.63027)	Top-1 acc 64.453 (60.549)	Top-5 acc 82.422 (81.655)	lr 0.01206
Train [62][1150/3239]	Time 0.230 (0.543)	Data Time 0.001 (0.035)	Loss 2.7195 (2.6311)	Entropy 0.62996 (0.63027)	Top-1 acc 58.203 (60.552)	Top-5 acc 81.250 (81.664)	lr 0.01206
Train [62][1160/3239]	Time 0.237 (0.542)	Data Time 0.001 (0.034)	Loss 2.7892 (2.6317)	Entropy 0.63016 (0.63027)	Top-1 acc 56.250 (60.534)	Top-5 acc 77.734 (81.647)	lr 0.01206
Train [62][1170/3239]	Time 0.275 (0.542)	Data Time 0.001 (0.034)	Loss 2.7976 (2.6325)	Entropy 0.63003 (0.63027)	Top-1 acc 55.078 (60.514)	Top-5 acc 78.906 (81.629)	lr 0.01205
Train [62][1180/3239]	Time 0.260 (0.541)	Data Time 0.001 (0.034)	Loss 2.5688 (2.6326)	Entropy 0.62968 (0.63027)	Top-1 acc 60.938 (60.519)	Top-5 acc 82.031 (81.627)	lr 0.01205
Train [62][1190/3239]	Time 0.287 (0.540)	Data Time 0.002 (0.033)	Loss 2.4612 (2.6329)	Entropy 0.62984 (0.63026)	Top-1 acc 64.844 (60.511)	Top-5 acc 86.719 (81.622)	lr 0.01205
Train [62][1200/3239]	Time 0.270 (0.539)	Data Time 0.001 (0.033)	Loss 2.7249 (2.6331)	Entropy 0.63010 (0.63026)	Top-1 acc 61.719 (60.504)	Top-5 acc 81.250 (81.622)	lr 0.01205
Train [62][1210/3239]	Time 0.223 (0.538)	Data Time 0.001 (0.033)	Loss 2.7957 (2.6338)	Entropy 0.63018 (0.63026)	Top-1 acc 54.688 (60.491)	Top-5 acc 80.469 (81.610)	lr 0.01205
Train [62][1220/3239]	Time 0.250 (0.537)	Data Time 0.002 (0.033)	Loss 2.4711 (2.6333)	Entropy 0.63020 (0.63026)	Top-1 acc 67.188 (60.491)	Top-5 acc 83.203 (81.619)	lr 0.01205
Train [62][1230/3239]	Time 0.245 (0.536)	Data Time 0.001 (0.032)	Loss 2.9752 (2.6341)	Entropy 0.63061 (0.63026)	Top-1 acc 50.781 (60.468)	Top-5 acc 75.000 (81.608)	lr 0.01205
Train [62][1240/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.034)	Loss 2.6476 (2.6343)	Entropy 0.63038 (0.63026)	Top-1 acc 59.375 (60.462)	Top-5 acc 81.250 (81.604)	lr 0.01205
Train [62][1250/3239]	Time 0.232 (0.536)	Data Time 0.001 (0.033)	Loss 2.7336 (2.6342)	Entropy 0.63045 (0.63026)	Top-1 acc 59.375 (60.466)	Top-5 acc 81.250 (81.608)	lr 0.01205
Train [62][1260/3239]	Time 0.226 (0.535)	Data Time 0.001 (0.033)	Loss 2.7640 (2.6346)	Entropy 0.63057 (0.63026)	Top-1 acc 56.250 (60.458)	Top-5 acc 81.250 (81.604)	lr 0.01205
Train [62][1270/3239]	Time 0.337 (0.534)	Data Time 0.002 (0.033)	Loss 2.8112 (2.6350)	Entropy 0.63082 (0.63026)	Top-1 acc 54.688 (60.451)	Top-5 acc 78.125 (81.599)	lr 0.01204
Train [62][1280/3239]	Time 0.274 (0.534)	Data Time 0.001 (0.033)	Loss 2.7305 (2.6348)	Entropy 0.63090 (0.63027)	Top-1 acc 54.297 (60.446)	Top-5 acc 78.516 (81.602)	lr 0.01204
Train [62][1290/3239]	Time 0.266 (0.534)	Data Time 0.001 (0.034)	Loss 2.6282 (2.6350)	Entropy 0.63086 (0.63027)	Top-1 acc 60.156 (60.447)	Top-5 acc 80.859 (81.596)	lr 0.01204
Train [62][1300/3239]	Time 0.256 (0.534)	Data Time 0.001 (0.034)	Loss 2.6756 (2.6353)	Entropy 0.63054 (0.63028)	Top-1 acc 58.594 (60.442)	Top-5 acc 79.688 (81.597)	lr 0.01204
Train [62][1310/3239]	Time 0.244 (0.533)	Data Time 0.001 (0.034)	Loss 2.6365 (2.6356)	Entropy 0.63033 (0.63028)	Top-1 acc 59.766 (60.438)	Top-5 acc 81.250 (81.590)	lr 0.01204
Train [62][1320/3239]	Time 0.270 (0.532)	Data Time 0.002 (0.033)	Loss 2.6447 (2.6354)	Entropy 0.63046 (0.63028)	Top-1 acc 58.984 (60.437)	Top-5 acc 81.641 (81.594)	lr 0.01204
Train [62][1330/3239]	Time 0.260 (0.532)	Data Time 0.001 (0.034)	Loss 2.7562 (2.6356)	Entropy 0.63038 (0.63028)	Top-1 acc 56.250 (60.434)	Top-5 acc 80.469 (81.583)	lr 0.01204
Train [62][1340/3239]	Time 0.370 (0.532)	Data Time 0.002 (0.035)	Loss 2.5290 (2.6357)	Entropy 0.63069 (0.63028)	Top-1 acc 65.625 (60.432)	Top-5 acc 80.859 (81.573)	lr 0.01204
Train [62][1350/3239]	Time 0.248 (0.532)	Data Time 0.001 (0.035)	Loss 2.5560 (2.6357)	Entropy 0.63051 (0.63029)	Top-1 acc 64.844 (60.436)	Top-5 acc 83.203 (81.577)	lr 0.01204
Train [62][1360/3239]	Time 0.306 (0.531)	Data Time 0.001 (0.035)	Loss 2.7569 (2.6361)	Entropy 0.63007 (0.63029)	Top-1 acc 54.688 (60.428)	Top-5 acc 80.078 (81.565)	lr 0.01204
Train [62][1370/3239]	Time 0.223 (0.532)	Data Time 0.001 (0.035)	Loss 2.4725 (2.6357)	Entropy 0.62948 (0.63028)	Top-1 acc 62.109 (60.438)	Top-5 acc 85.156 (81.571)	lr 0.01203
Train [62][1380/3239]	Time 3.050 (0.533)	Data Time 2.759 (0.037)	Loss 2.6983 (2.6356)	Entropy 0.62952 (0.63028)	Top-1 acc 55.469 (60.443)	Top-5 acc 80.859 (81.576)	lr 0.01203
Train [62][1390/3239]	Time 0.267 (0.532)	Data Time 0.001 (0.037)	Loss 2.6123 (2.6357)	Entropy 0.62986 (0.63027)	Top-1 acc 59.375 (60.436)	Top-5 acc 82.422 (81.572)	lr 0.01203
Train [62][1400/3239]	Time 0.244 (0.533)	Data Time 0.001 (0.038)	Loss 2.5458 (2.6358)	Entropy 0.62981 (0.63027)	Top-1 acc 65.234 (60.430)	Top-5 acc 83.203 (81.575)	lr 0.01203
Train [62][1410/3239]	Time 0.274 (0.532)	Data Time 0.001 (0.038)	Loss 2.5080 (2.6355)	Entropy 0.62977 (0.63027)	Top-1 acc 60.938 (60.435)	Top-5 acc 85.156 (81.585)	lr 0.01203
Train [62][1420/3239]	Time 0.245 (0.532)	Data Time 0.001 (0.038)	Loss 2.7220 (2.6356)	Entropy 0.63005 (0.63026)	Top-1 acc 57.031 (60.438)	Top-5 acc 81.641 (81.580)	lr 0.01203
Train [62][1430/3239]	Time 0.355 (0.531)	Data Time 0.001 (0.037)	Loss 2.7560 (2.6358)	Entropy 0.62987 (0.63026)	Top-1 acc 57.812 (60.437)	Top-5 acc 77.734 (81.577)	lr 0.01203
Train [62][1440/3239]	Time 0.270 (0.531)	Data Time 0.001 (0.038)	Loss 2.9028 (2.6358)	Entropy 0.62961 (0.63026)	Top-1 acc 54.297 (60.434)	Top-5 acc 74.219 (81.569)	lr 0.01203
Train [62][1450/3239]	Time 0.328 (0.555)	Data Time 0.027 (0.038)	Loss 2.6280 (2.6359)	Entropy 0.62985 (0.63025)	Top-1 acc 61.328 (60.433)	Top-5 acc 82.031 (81.564)	lr 0.01203
Train [62][1460/3239]	Time 0.228 (0.554)	Data Time 0.002 (0.038)	Loss 2.5502 (2.6363)	Entropy 0.62963 (0.63025)	Top-1 acc 63.281 (60.425)	Top-5 acc 85.938 (81.559)	lr 0.01203
Train [62][1470/3239]	Time 0.231 (0.553)	Data Time 0.001 (0.037)	Loss 2.4342 (2.6367)	Entropy 0.62957 (0.63025)	Top-1 acc 67.188 (60.414)	Top-5 acc 86.719 (81.554)	lr 0.01202
Train [62][1480/3239]	Time 0.259 (0.552)	Data Time 0.001 (0.037)	Loss 2.7411 (2.6370)	Entropy 0.62970 (0.63024)	Top-1 acc 55.469 (60.403)	Top-5 acc 82.031 (81.548)	lr 0.01202
Train [62][1490/3239]	Time 0.266 (0.551)	Data Time 0.002 (0.037)	Loss 2.5567 (2.6368)	Entropy 0.62996 (0.63024)	Top-1 acc 64.453 (60.400)	Top-5 acc 82.422 (81.550)	lr 0.01202
Train [62][1500/3239]	Time 0.245 (0.551)	Data Time 0.001 (0.037)	Loss 2.6317 (2.6371)	Entropy 0.62937 (0.63024)	Top-1 acc 60.938 (60.397)	Top-5 acc 82.031 (81.539)	lr 0.01202
Train [62][1510/3239]	Time 0.270 (0.550)	Data Time 0.001 (0.036)	Loss 2.5717 (2.6370)	Entropy 0.62953 (0.63023)	Top-1 acc 64.453 (60.403)	Top-5 acc 83.594 (81.540)	lr 0.01202
Train [62][1520/3239]	Time 0.243 (0.550)	Data Time 0.001 (0.036)	Loss 2.6029 (2.6369)	Entropy 0.62944 (0.63023)	Top-1 acc 60.156 (60.407)	Top-5 acc 81.641 (81.543)	lr 0.01202
Train [62][1530/3239]	Time 0.231 (0.549)	Data Time 0.001 (0.036)	Loss 2.6834 (2.6369)	Entropy 0.62943 (0.63022)	Top-1 acc 61.328 (60.405)	Top-5 acc 80.469 (81.541)	lr 0.01202
Train [62][1540/3239]	Time 0.240 (0.548)	Data Time 0.001 (0.036)	Loss 2.8337 (2.6372)	Entropy 0.62953 (0.63022)	Top-1 acc 57.812 (60.402)	Top-5 acc 76.562 (81.535)	lr 0.01202
Train [62][1550/3239]	Time 0.234 (0.547)	Data Time 0.001 (0.035)	Loss 2.6919 (2.6370)	Entropy 0.62996 (0.63021)	Top-1 acc 58.203 (60.405)	Top-5 acc 77.734 (81.536)	lr 0.01202
Train [62][1560/3239]	Time 0.275 (0.547)	Data Time 0.001 (0.035)	Loss 2.6128 (2.6367)	Entropy 0.62970 (0.63021)	Top-1 acc 60.547 (60.408)	Top-5 acc 82.031 (81.543)	lr 0.01202
Train [62][1570/3239]	Time 0.306 (0.546)	Data Time 0.001 (0.035)	Loss 2.5052 (2.6374)	Entropy 0.62940 (0.63021)	Top-1 acc 61.328 (60.386)	Top-5 acc 83.203 (81.528)	lr 0.01201
Train [62][1580/3239]	Time 0.239 (0.545)	Data Time 0.001 (0.035)	Loss 2.6040 (2.6376)	Entropy 0.62907 (0.63020)	Top-1 acc 60.938 (60.386)	Top-5 acc 83.594 (81.527)	lr 0.01201
Train [62][1590/3239]	Time 0.356 (0.545)	Data Time 0.001 (0.035)	Loss 2.8481 (2.6377)	Entropy 0.62911 (0.63019)	Top-1 acc 53.516 (60.385)	Top-5 acc 76.953 (81.525)	lr 0.01201
Train [62][1600/3239]	Time 0.295 (0.544)	Data Time 0.001 (0.034)	Loss 2.5391 (2.6375)	Entropy 0.62934 (0.63019)	Top-1 acc 61.719 (60.387)	Top-5 acc 83.594 (81.525)	lr 0.01201
Train [62][1610/3239]	Time 0.243 (0.544)	Data Time 0.001 (0.034)	Loss 2.7074 (2.6376)	Entropy 0.62922 (0.63018)	Top-1 acc 59.375 (60.388)	Top-5 acc 80.859 (81.523)	lr 0.01201
Train [62][1620/3239]	Time 0.272 (0.543)	Data Time 0.001 (0.034)	Loss 2.5130 (2.6372)	Entropy 0.62913 (0.63018)	Top-1 acc 62.109 (60.394)	Top-5 acc 84.375 (81.530)	lr 0.01201
Train [62][1630/3239]	Time 0.265 (0.542)	Data Time 0.001 (0.034)	Loss 2.6149 (2.6374)	Entropy 0.62929 (0.63017)	Top-1 acc 60.156 (60.385)	Top-5 acc 82.031 (81.524)	lr 0.01201
Train [62][1640/3239]	Time 0.272 (0.542)	Data Time 0.001 (0.034)	Loss 2.6459 (2.6374)	Entropy 0.62915 (0.63016)	Top-1 acc 62.109 (60.389)	Top-5 acc 82.422 (81.525)	lr 0.01201
Train [62][1650/3239]	Time 0.242 (0.541)	Data Time 0.001 (0.033)	Loss 2.7141 (2.6376)	Entropy 0.62885 (0.63016)	Top-1 acc 57.422 (60.388)	Top-5 acc 81.250 (81.524)	lr 0.01201
Train [62][1660/3239]	Time 0.413 (0.541)	Data Time 0.001 (0.033)	Loss 2.6017 (2.6377)	Entropy 0.62899 (0.63015)	Top-1 acc 60.547 (60.386)	Top-5 acc 82.422 (81.523)	lr 0.01201
Train [62][1670/3239]	Time 0.229 (0.541)	Data Time 0.001 (0.034)	Loss 2.6929 (2.6377)	Entropy 0.62922 (0.63014)	Top-1 acc 58.984 (60.386)	Top-5 acc 78.906 (81.518)	lr 0.01200
Train [62][1680/3239]	Time 0.220 (0.540)	Data Time 0.001 (0.034)	Loss 2.6601 (2.6378)	Entropy 0.62925 (0.63014)	Top-1 acc 58.203 (60.382)	Top-5 acc 82.031 (81.519)	lr 0.01200
Train [62][1690/3239]	Time 0.230 (0.540)	Data Time 0.001 (0.034)	Loss 2.7844 (2.6378)	Entropy 0.62924 (0.63013)	Top-1 acc 58.984 (60.382)	Top-5 acc 77.734 (81.515)	lr 0.01200
Train [62][1700/3239]	Time 0.261 (0.540)	Data Time 0.001 (0.034)	Loss 2.6001 (2.6379)	Entropy 0.62958 (0.63013)	Top-1 acc 56.641 (60.377)	Top-5 acc 80.859 (81.509)	lr 0.01200
Train [62][1710/3239]	Time 0.235 (0.540)	Data Time 0.001 (0.034)	Loss 2.7010 (2.6380)	Entropy 0.62986 (0.63012)	Top-1 acc 61.328 (60.377)	Top-5 acc 79.688 (81.510)	lr 0.01200
Train [62][1720/3239]	Time 0.251 (0.539)	Data Time 0.001 (0.034)	Loss 2.6930 (2.6380)	Entropy 0.62990 (0.63012)	Top-1 acc 62.109 (60.374)	Top-5 acc 80.078 (81.511)	lr 0.01200
Train [62][1730/3239]	Time 0.246 (0.540)	Data Time 0.001 (0.035)	Loss 2.5999 (2.6380)	Entropy 0.62988 (0.63012)	Top-1 acc 60.938 (60.370)	Top-5 acc 82.422 (81.514)	lr 0.01200
Train [62][1740/3239]	Time 0.282 (0.540)	Data Time 0.001 (0.036)	Loss 2.5727 (2.6379)	Entropy 0.62966 (0.63012)	Top-1 acc 64.844 (60.376)	Top-5 acc 83.594 (81.518)	lr 0.01200
Train [62][1750/3239]	Time 0.337 (0.540)	Data Time 0.001 (0.036)	Loss 2.5214 (2.6376)	Entropy 0.62964 (0.63012)	Top-1 acc 64.844 (60.380)	Top-5 acc 83.203 (81.523)	lr 0.01200
Train [62][1760/3239]	Time 0.251 (0.540)	Data Time 0.002 (0.036)	Loss 2.7198 (2.6377)	Entropy 0.62964 (0.63012)	Top-1 acc 58.984 (60.374)	Top-5 acc 80.859 (81.521)	lr 0.01200
Train [62][1770/3239]	Time 0.289 (0.541)	Data Time 0.001 (0.038)	Loss 2.6682 (2.6373)	Entropy 0.62996 (0.63011)	Top-1 acc 61.328 (60.384)	Top-5 acc 79.297 (81.526)	lr 0.01199
Train [62][1780/3239]	Time 0.272 (0.540)	Data Time 0.002 (0.037)	Loss 2.5555 (2.6370)	Entropy 0.62984 (0.63011)	Top-1 acc 64.453 (60.390)	Top-5 acc 83.203 (81.532)	lr 0.01199
Train [62][1790/3239]	Time 0.265 (0.540)	Data Time 0.001 (0.038)	Loss 2.7124 (2.6370)	Entropy 0.62946 (0.63011)	Top-1 acc 60.547 (60.389)	Top-5 acc 79.297 (81.533)	lr 0.01199
Train [62][1800/3239]	Time 0.241 (0.542)	Data Time 0.001 (0.040)	Loss 2.8115 (2.6371)	Entropy 0.62938 (0.63011)	Top-1 acc 56.641 (60.386)	Top-5 acc 75.781 (81.527)	lr 0.01199
Train [62][1810/3239]	Time 0.230 (0.541)	Data Time 0.001 (0.039)	Loss 2.8979 (2.6372)	Entropy 0.62930 (0.63010)	Top-1 acc 53.906 (60.386)	Top-5 acc 75.781 (81.525)	lr 0.01199
Train [62][1820/3239]	Time 0.331 (0.541)	Data Time 0.001 (0.039)	Loss 2.5168 (2.6369)	Entropy 0.62924 (0.63010)	Top-1 acc 61.328 (60.394)	Top-5 acc 83.203 (81.527)	lr 0.01199
Train [62][1830/3239]	Time 0.240 (0.545)	Data Time 0.001 (0.045)	Loss 2.5603 (2.6368)	Entropy 0.62913 (0.63009)	Top-1 acc 62.891 (60.397)	Top-5 acc 82.031 (81.524)	lr 0.01199
Train [62][1840/3239]	Time 0.329 (0.545)	Data Time 0.001 (0.044)	Loss 2.8179 (2.6368)	Entropy 0.62897 (0.63009)	Top-1 acc 57.812 (60.391)	Top-5 acc 76.953 (81.522)	lr 0.01199
Train [62][1850/3239]	Time 0.228 (0.544)	Data Time 0.001 (0.044)	Loss 2.6923 (2.6365)	Entropy 0.62883 (0.63008)	Top-1 acc 57.031 (60.396)	Top-5 acc 78.906 (81.526)	lr 0.01199
Train [62][1860/3239]	Time 0.284 (0.544)	Data Time 0.001 (0.044)	Loss 2.7180 (2.6367)	Entropy 0.62883 (0.63007)	Top-1 acc 61.328 (60.394)	Top-5 acc 80.859 (81.523)	lr 0.01199
Train [62][1870/3239]	Time 0.235 (0.546)	Data Time 0.001 (0.046)	Loss 2.7769 (2.6369)	Entropy 0.62857 (0.63007)	Top-1 acc 55.469 (60.391)	Top-5 acc 78.516 (81.514)	lr 0.01198
Train [62][1880/3239]	Time 0.219 (0.545)	Data Time 0.001 (0.046)	Loss 2.5029 (2.6368)	Entropy 0.62854 (0.63006)	Top-1 acc 64.844 (60.391)	Top-5 acc 83.594 (81.517)	lr 0.01198
Train [62][1890/3239]	Time 0.282 (0.545)	Data Time 0.001 (0.047)	Loss 2.7148 (2.6369)	Entropy 0.62819 (0.63005)	Top-1 acc 60.156 (60.386)	Top-5 acc 78.516 (81.516)	lr 0.01198
Train [62][1900/3239]	Time 0.238 (0.549)	Data Time 0.001 (0.050)	Loss 2.7182 (2.6370)	Entropy 0.62871 (0.63004)	Top-1 acc 57.031 (60.385)	Top-5 acc 79.688 (81.515)	lr 0.01198
Train [62][1910/3239]	Time 0.265 (0.548)	Data Time 0.001 (0.050)	Loss 2.5497 (2.6369)	Entropy 0.62905 (0.63004)	Top-1 acc 62.109 (60.391)	Top-5 acc 81.250 (81.515)	lr 0.01198
Train [62][1920/3239]	Time 0.244 (0.547)	Data Time 0.001 (0.050)	Loss 2.5532 (2.6372)	Entropy 0.62922 (0.63003)	Top-1 acc 60.547 (60.384)	Top-5 acc 86.328 (81.509)	lr 0.01198
Train [62][1930/3239]	Time 0.283 (0.550)	Data Time 0.001 (0.053)	Loss 2.5728 (2.6375)	Entropy 0.62959 (0.63003)	Top-1 acc 61.328 (60.377)	Top-5 acc 83.984 (81.507)	lr 0.01198
Train [62][1940/3239]	Time 0.264 (0.550)	Data Time 0.001 (0.053)	Loss 2.6249 (2.6375)	Entropy 0.62956 (0.63002)	Top-1 acc 64.453 (60.377)	Top-5 acc 83.984 (81.507)	lr 0.01198
Train [62][1950/3239]	Time 0.245 (0.549)	Data Time 0.001 (0.052)	Loss 2.5418 (2.6371)	Entropy 0.62922 (0.63002)	Top-1 acc 60.938 (60.382)	Top-5 acc 83.594 (81.516)	lr 0.01198
Train [62][1960/3239]	Time 0.249 (0.552)	Data Time 0.001 (0.056)	Loss 2.5678 (2.6368)	Entropy 0.62908 (0.63002)	Top-1 acc 62.500 (60.387)	Top-5 acc 81.641 (81.522)	lr 0.01197
Train [62][1970/3239]	Time 0.244 (0.552)	Data Time 0.001 (0.056)	Loss 2.9381 (2.6369)	Entropy 0.62878 (0.63001)	Top-1 acc 57.031 (60.386)	Top-5 acc 76.562 (81.522)	lr 0.01197
Train [62][1980/3239]	Time 0.354 (0.551)	Data Time 0.002 (0.055)	Loss 2.5806 (2.6370)	Entropy 0.62873 (0.63001)	Top-1 acc 61.719 (60.383)	Top-5 acc 83.984 (81.516)	lr 0.01197
Train [62][1990/3239]	Time 0.254 (0.554)	Data Time 0.001 (0.059)	Loss 2.4646 (2.6370)	Entropy 0.62869 (0.63000)	Top-1 acc 63.281 (60.382)	Top-5 acc 84.766 (81.518)	lr 0.01197
Train [62][2000/3239]	Time 0.262 (0.554)	Data Time 0.001 (0.059)	Loss 2.4954 (2.6372)	Entropy 0.62864 (0.62999)	Top-1 acc 61.328 (60.372)	Top-5 acc 85.547 (81.516)	lr 0.01197
Train [62][2010/3239]	Time 0.227 (0.553)	Data Time 0.001 (0.058)	Loss 2.5944 (2.6372)	Entropy 0.62839 (0.62998)	Top-1 acc 58.984 (60.369)	Top-5 acc 82.031 (81.512)	lr 0.01197
Train [62][2020/3239]	Time 0.236 (0.553)	Data Time 0.001 (0.059)	Loss 2.7744 (2.6371)	Entropy 0.62821 (0.62998)	Top-1 acc 58.594 (60.375)	Top-5 acc 77.734 (81.516)	lr 0.01197
Train [62][2030/3239]	Time 0.232 (0.556)	Data Time 0.001 (0.062)	Loss 2.5610 (2.6371)	Entropy 0.62767 (0.62997)	Top-1 acc 62.500 (60.372)	Top-5 acc 81.641 (81.513)	lr 0.01197
Train [62][2040/3239]	Time 0.245 (0.555)	Data Time 0.001 (0.062)	Loss 2.7785 (2.6370)	Entropy 0.62749 (0.62995)	Top-1 acc 55.469 (60.371)	Top-5 acc 81.641 (81.518)	lr 0.01197
Train [62][2050/3239]	Time 0.357 (0.556)	Data Time 0.001 (0.062)	Loss 2.6934 (2.6372)	Entropy 0.62721 (0.62994)	Top-1 acc 60.156 (60.367)	Top-5 acc 79.297 (81.516)	lr 0.01197
Train [62][2060/3239]	Time 0.239 (0.560)	Data Time 0.001 (0.067)	Loss 2.5396 (2.6369)	Entropy 0.62738 (0.62993)	Top-1 acc 64.062 (60.376)	Top-5 acc 84.766 (81.523)	lr 0.01196
Train [62][2070/3239]	Time 0.249 (0.559)	Data Time 0.001 (0.067)	Loss 2.5416 (2.6370)	Entropy 0.62750 (0.62992)	Top-1 acc 64.453 (60.378)	Top-5 acc 84.375 (81.521)	lr 0.01196
Train [62][2080/3239]	Time 0.236 (0.560)	Data Time 0.001 (0.068)	Loss 2.3896 (2.6368)	Entropy 0.62764 (0.62991)	Top-1 acc 65.625 (60.377)	Top-5 acc 84.375 (81.523)	lr 0.01196
Train [62][2090/3239]	Time 0.267 (0.561)	Data Time 0.001 (0.070)	Loss 2.6647 (2.6373)	Entropy 0.62727 (0.62989)	Top-1 acc 60.156 (60.369)	Top-5 acc 79.688 (81.516)	lr 0.01196
Train [62][2100/3239]	Time 0.228 (0.561)	Data Time 0.001 (0.069)	Loss 2.6180 (2.6373)	Entropy 0.62741 (0.62988)	Top-1 acc 66.406 (60.373)	Top-5 acc 82.031 (81.514)	lr 0.01196
Train [62][2110/3239]	Time 0.219 (0.577)	Data Time 0.002 (0.069)	Loss 2.6425 (2.6374)	Entropy 0.62729 (0.62987)	Top-1 acc 57.031 (60.372)	Top-5 acc 82.031 (81.510)	lr 0.01196
Train [62][2120/3239]	Time 0.236 (0.576)	Data Time 0.001 (0.069)	Loss 2.6124 (2.6374)	Entropy 0.62748 (0.62986)	Top-1 acc 61.719 (60.375)	Top-5 acc 83.594 (81.512)	lr 0.01196
Train [62][2130/3239]	Time 0.227 (0.576)	Data Time 0.001 (0.068)	Loss 2.6384 (2.6373)	Entropy 0.62731 (0.62985)	Top-1 acc 62.891 (60.380)	Top-5 acc 83.203 (81.517)	lr 0.01196
Train [62][2140/3239]	Time 0.329 (0.575)	Data Time 0.001 (0.068)	Loss 2.4898 (2.6374)	Entropy 0.62718 (0.62983)	Top-1 acc 65.625 (60.380)	Top-5 acc 83.594 (81.518)	lr 0.01196
Train [62][2150/3239]	Time 0.239 (0.574)	Data Time 0.001 (0.068)	Loss 2.6606 (2.6376)	Entropy 0.62717 (0.62982)	Top-1 acc 58.984 (60.376)	Top-5 acc 81.641 (81.512)	lr 0.01196
Train [62][2160/3239]	Time 0.265 (0.574)	Data Time 0.002 (0.067)	Loss 2.7616 (2.6377)	Entropy 0.62712 (0.62981)	Top-1 acc 59.375 (60.380)	Top-5 acc 79.688 (81.511)	lr 0.01195
Train [62][2170/3239]	Time 0.249 (0.573)	Data Time 0.001 (0.067)	Loss 2.7141 (2.6376)	Entropy 0.62678 (0.62980)	Top-1 acc 60.547 (60.380)	Top-5 acc 80.469 (81.511)	lr 0.01195
Train [62][2180/3239]	Time 0.236 (0.572)	Data Time 0.001 (0.067)	Loss 2.7821 (2.6376)	Entropy 0.62667 (0.62978)	Top-1 acc 55.078 (60.380)	Top-5 acc 78.516 (81.514)	lr 0.01195
Train [62][2190/3239]	Time 0.248 (0.572)	Data Time 0.001 (0.066)	Loss 2.7300 (2.6375)	Entropy 0.62668 (0.62977)	Top-1 acc 58.594 (60.382)	Top-5 acc 79.297 (81.516)	lr 0.01195
Train [62][2200/3239]	Time 0.248 (0.571)	Data Time 0.001 (0.066)	Loss 2.5619 (2.6373)	Entropy 0.62682 (0.62975)	Top-1 acc 62.500 (60.384)	Top-5 acc 82.812 (81.521)	lr 0.01195
Train [62][2210/3239]	Time 0.344 (0.575)	Data Time 0.001 (0.070)	Loss 2.4594 (2.6372)	Entropy 0.62689 (0.62974)	Top-1 acc 62.500 (60.387)	Top-5 acc 86.328 (81.521)	lr 0.01195
Train [62][2220/3239]	Time 0.242 (0.575)	Data Time 0.001 (0.071)	Loss 2.5717 (2.6372)	Entropy 0.62661 (0.62973)	Top-1 acc 59.766 (60.383)	Top-5 acc 83.594 (81.519)	lr 0.01195
Train [62][2230/3239]	Time 0.273 (0.575)	Data Time 0.002 (0.071)	Loss 2.8559 (2.6370)	Entropy 0.62643 (0.62971)	Top-1 acc 51.953 (60.392)	Top-5 acc 75.000 (81.521)	lr 0.01195
Train [62][2240/3239]	Time 0.240 (0.578)	Data Time 0.002 (0.074)	Loss 2.8833 (2.6372)	Entropy 0.62644 (0.62970)	Top-1 acc 51.953 (60.386)	Top-5 acc 78.906 (81.520)	lr 0.01195
Train [62][2250/3239]	Time 0.273 (0.579)	Data Time 0.001 (0.075)	Loss 2.5011 (2.6369)	Entropy 0.62662 (0.62969)	Top-1 acc 64.844 (60.392)	Top-5 acc 85.156 (81.525)	lr 0.01195
Train [62][2260/3239]	Time 0.240 (0.578)	Data Time 0.001 (0.075)	Loss 2.7296 (2.6367)	Entropy 0.62652 (0.62967)	Top-1 acc 58.984 (60.394)	Top-5 acc 78.516 (81.531)	lr 0.01194
Train [62][2270/3239]	Time 0.248 (0.582)	Data Time 0.001 (0.079)	Loss 2.5770 (2.6367)	Entropy 0.62653 (0.62966)	Top-1 acc 59.766 (60.395)	Top-5 acc 82.812 (81.534)	lr 0.01194
Train [62][2280/3239]	Time 0.232 (0.583)	Data Time 0.001 (0.080)	Loss 2.6681 (2.6366)	Entropy 0.62640 (0.62964)	Top-1 acc 60.938 (60.393)	Top-5 acc 80.469 (81.536)	lr 0.01194
Train [62][2290/3239]	Time 0.235 (0.582)	Data Time 0.001 (0.080)	Loss 2.5928 (2.6365)	Entropy 0.62649 (0.62963)	Top-1 acc 62.500 (60.394)	Top-5 acc 82.031 (81.537)	lr 0.01194
Train [62][2300/3239]	Time 0.323 (0.585)	Data Time 0.001 (0.084)	Loss 2.8151 (2.6367)	Entropy 0.62624 (0.62962)	Top-1 acc 57.031 (60.392)	Top-5 acc 76.172 (81.532)	lr 0.01194
Train [62][2310/3239]	Time 0.234 (0.586)	Data Time 0.001 (0.085)	Loss 2.7577 (2.6368)	Entropy 0.62610 (0.62960)	Top-1 acc 55.078 (60.386)	Top-5 acc 79.297 (81.530)	lr 0.01194
Train [62][2320/3239]	Time 0.244 (0.586)	Data Time 0.001 (0.085)	Loss 2.5626 (2.6367)	Entropy 0.62613 (0.62959)	Top-1 acc 60.547 (60.387)	Top-5 acc 84.375 (81.531)	lr 0.01194
Train [62][2330/3239]	Time 3.911 (0.589)	Data Time 3.629 (0.088)	Loss 2.5304 (2.6366)	Entropy 0.62639 (0.62957)	Top-1 acc 67.578 (60.390)	Top-5 acc 83.594 (81.529)	lr 0.01194
Train [62][2340/3239]	Time 1.240 (0.591)	Data Time 1.016 (0.090)	Loss 2.7420 (2.6369)	Entropy 0.62624 (0.62956)	Top-1 acc 58.594 (60.388)	Top-5 acc 77.344 (81.524)	lr 0.01194
Train [62][2350/3239]	Time 0.250 (0.590)	Data Time 0.001 (0.090)	Loss 2.5390 (2.6366)	Entropy 0.62645 (0.62954)	Top-1 acc 60.547 (60.394)	Top-5 acc 80.859 (81.529)	lr 0.01194
Train [62][2360/3239]	Time 0.236 (0.590)	Data Time 0.001 (0.090)	Loss 2.5373 (2.6367)	Entropy 0.62611 (0.62953)	Top-1 acc 62.500 (60.387)	Top-5 acc 86.719 (81.527)	lr 0.01193
Train [62][2370/3239]	Time 0.339 (0.594)	Data Time 0.001 (0.095)	Loss 2.6801 (2.6364)	Entropy 0.62630 (0.62952)	Top-1 acc 60.156 (60.395)	Top-5 acc 80.469 (81.531)	lr 0.01193
Train [62][2380/3239]	Time 0.229 (0.595)	Data Time 0.001 (0.096)	Loss 2.7525 (2.6364)	Entropy 0.62640 (0.62950)	Top-1 acc 55.859 (60.396)	Top-5 acc 78.125 (81.529)	lr 0.01193
Train [62][2390/3239]	Time 0.226 (0.594)	Data Time 0.001 (0.095)	Loss 2.7377 (2.6364)	Entropy 0.62646 (0.62949)	Top-1 acc 57.422 (60.394)	Top-5 acc 79.688 (81.526)	lr 0.01193
Train [62][2400/3239]	Time 0.235 (0.600)	Data Time 0.001 (0.102)	Loss 2.6282 (2.6364)	Entropy 0.62630 (0.62948)	Top-1 acc 59.375 (60.390)	Top-5 acc 77.734 (81.523)	lr 0.01193
Train [62][2410/3239]	Time 0.264 (0.599)	Data Time 0.001 (0.101)	Loss 2.6480 (2.6366)	Entropy 0.62647 (0.62946)	Top-1 acc 58.594 (60.384)	Top-5 acc 79.297 (81.522)	lr 0.01193
Train [62][2420/3239]	Time 0.247 (0.600)	Data Time 0.001 (0.102)	Loss 2.6452 (2.6368)	Entropy 0.62615 (0.62945)	Top-1 acc 62.891 (60.382)	Top-5 acc 81.641 (81.521)	lr 0.01193
Train [62][2430/3239]	Time 0.230 (0.605)	Data Time 0.001 (0.107)	Loss 2.7591 (2.6368)	Entropy 0.62639 (0.62944)	Top-1 acc 58.594 (60.382)	Top-5 acc 79.297 (81.520)	lr 0.01193
Train [62][2440/3239]	Time 0.233 (0.604)	Data Time 0.001 (0.107)	Loss 2.7199 (2.6368)	Entropy 0.62674 (0.62943)	Top-1 acc 55.469 (60.377)	Top-5 acc 82.422 (81.522)	lr 0.01193
Train [62][2450/3239]	Time 0.233 (0.606)	Data Time 0.001 (0.109)	Loss 2.6627 (2.6369)	Entropy 0.62668 (0.62941)	Top-1 acc 60.938 (60.371)	Top-5 acc 81.250 (81.518)	lr 0.01193
Train [62][2460/3239]	Time 0.267 (0.609)	Data Time 0.001 (0.113)	Loss 2.7581 (2.6372)	Entropy 0.62672 (0.62940)	Top-1 acc 55.078 (60.364)	Top-5 acc 79.688 (81.509)	lr 0.01192
Train [62][2470/3239]	Time 0.232 (0.613)	Data Time 0.001 (0.117)	Loss 2.5127 (2.6373)	Entropy 0.62682 (0.62939)	Top-1 acc 63.281 (60.360)	Top-5 acc 82.422 (81.509)	lr 0.01192
Train [62][2480/3239]	Time 0.241 (0.613)	Data Time 0.001 (0.117)	Loss 2.8365 (2.6373)	Entropy 0.62688 (0.62938)	Top-1 acc 56.641 (60.360)	Top-5 acc 76.172 (81.508)	lr 0.01192
Train [62][2490/3239]	Time 4.253 (0.617)	Data Time 3.960 (0.121)	Loss 2.5237 (2.6372)	Entropy 0.62662 (0.62937)	Top-1 acc 65.234 (60.361)	Top-5 acc 83.203 (81.508)	lr 0.01192
Train [62][2500/3239]	Time 0.226 (0.621)	Data Time 0.001 (0.126)	Loss 2.6529 (2.6375)	Entropy 0.62667 (0.62936)	Top-1 acc 58.594 (60.353)	Top-5 acc 81.250 (81.507)	lr 0.01192
Train [62][2510/3239]	Time 0.233 (0.620)	Data Time 0.001 (0.125)	Loss 2.6781 (2.6374)	Entropy 0.62688 (0.62935)	Top-1 acc 62.891 (60.356)	Top-5 acc 80.859 (81.506)	lr 0.01192
Train [62][2520/3239]	Time 0.223 (0.620)	Data Time 0.001 (0.126)	Loss 2.8383 (2.6374)	Entropy 0.62656 (0.62934)	Top-1 acc 55.859 (60.356)	Top-5 acc 79.688 (81.503)	lr 0.01192
Train [62][2530/3239]	Time 0.325 (0.626)	Data Time 0.001 (0.131)	Loss 2.4409 (2.6376)	Entropy 0.62672 (0.62933)	Top-1 acc 63.281 (60.346)	Top-5 acc 84.766 (81.500)	lr 0.01192
Train [62][2540/3239]	Time 0.233 (0.628)	Data Time 0.001 (0.134)	Loss 2.6422 (2.6376)	Entropy 0.62673 (0.62932)	Top-1 acc 64.453 (60.346)	Top-5 acc 78.516 (81.496)	lr 0.01192
Train [62][2550/3239]	Time 0.246 (0.628)	Data Time 0.001 (0.135)	Loss 2.4466 (2.6375)	Entropy 0.62700 (0.62931)	Top-1 acc 66.797 (60.348)	Top-5 acc 85.156 (81.501)	lr 0.01192
Train [62][2560/3239]	Time 0.233 (0.633)	Data Time 0.001 (0.140)	Loss 2.7082 (2.6375)	Entropy 0.62727 (0.62930)	Top-1 acc 58.594 (60.350)	Top-5 acc 82.422 (81.501)	lr 0.01191
Train [62][2570/3239]	Time 0.227 (0.634)	Data Time 0.001 (0.141)	Loss 2.6369 (2.6377)	Entropy 0.62755 (0.62929)	Top-1 acc 60.156 (60.347)	Top-5 acc 82.422 (81.500)	lr 0.01191
Train [62][2580/3239]	Time 0.226 (0.636)	Data Time 0.001 (0.143)	Loss 2.7444 (2.6380)	Entropy 0.62767 (0.62929)	Top-1 acc 60.938 (60.338)	Top-5 acc 80.078 (81.495)	lr 0.01191
Train [62][2590/3239]	Time 0.237 (0.641)	Data Time 0.001 (0.148)	Loss 2.5385 (2.6380)	Entropy 0.62722 (0.62928)	Top-1 acc 64.062 (60.345)	Top-5 acc 85.547 (81.495)	lr 0.01191
Train [62][2600/3239]	Time 0.377 (0.642)	Data Time 0.001 (0.150)	Loss 2.6465 (2.6378)	Entropy 0.62696 (0.62927)	Top-1 acc 60.938 (60.347)	Top-5 acc 80.469 (81.497)	lr 0.01191
Train [62][2610/3239]	Time 2.767 (0.642)	Data Time 2.516 (0.151)	Loss 2.6044 (2.6379)	Entropy 0.62745 (0.62927)	Top-1 acc 59.375 (60.344)	Top-5 acc 82.031 (81.496)	lr 0.01191
Train [62][2620/3239]	Time 0.236 (0.646)	Data Time 0.001 (0.155)	Loss 2.6204 (2.6376)	Entropy 0.62739 (0.62926)	Top-1 acc 61.719 (60.354)	Top-5 acc 78.516 (81.500)	lr 0.01191
Train [62][2630/3239]	Time 0.216 (0.649)	Data Time 0.001 (0.158)	Loss 2.5757 (2.6377)	Entropy 0.62755 (0.62925)	Top-1 acc 61.719 (60.353)	Top-5 acc 82.031 (81.502)	lr 0.01191
Train [62][2640/3239]	Time 0.254 (0.648)	Data Time 0.001 (0.157)	Loss 2.4795 (2.6375)	Entropy 0.62786 (0.62925)	Top-1 acc 64.844 (60.357)	Top-5 acc 82.812 (81.503)	lr 0.01191
Train [62][2650/3239]	Time 0.320 (0.648)	Data Time 0.093 (0.157)	Loss 2.7150 (2.6375)	Entropy 0.62719 (0.62924)	Top-1 acc 57.031 (60.357)	Top-5 acc 80.859 (81.502)	lr 0.01191
Train [62][2660/3239]	Time 2.921 (0.651)	Data Time 2.646 (0.160)	Loss 2.5959 (2.6376)	Entropy 0.62738 (0.62923)	Top-1 acc 59.766 (60.354)	Top-5 acc 83.594 (81.502)	lr 0.01190
Train [62][2670/3239]	Time 0.245 (0.650)	Data Time 0.002 (0.160)	Loss 2.7276 (2.6377)	Entropy 0.62761 (0.62923)	Top-1 acc 57.812 (60.351)	Top-5 acc 77.344 (81.500)	lr 0.01190
Train [62][2680/3239]	Time 0.238 (0.649)	Data Time 0.002 (0.159)	Loss 2.5851 (2.6377)	Entropy 0.62731 (0.62922)	Top-1 acc 62.500 (60.351)	Top-5 acc 82.812 (81.502)	lr 0.01190
Train [62][2690/3239]	Time 0.358 (0.650)	Data Time 0.001 (0.160)	Loss 2.5319 (2.6378)	Entropy 0.62733 (0.62921)	Top-1 acc 63.281 (60.351)	Top-5 acc 83.594 (81.496)	lr 0.01190
Train [62][2700/3239]	Time 0.225 (0.652)	Data Time 0.001 (0.162)	Loss 2.4759 (2.6376)	Entropy 0.62708 (0.62920)	Top-1 acc 64.062 (60.357)	Top-5 acc 83.594 (81.500)	lr 0.01190
Train [62][2710/3239]	Time 5.774 (0.653)	Data Time 5.534 (0.164)	Loss 2.7116 (2.6377)	Entropy 0.62735 (0.62920)	Top-1 acc 58.594 (60.360)	Top-5 acc 82.031 (81.499)	lr 0.01190
Train [62][2720/3239]	Time 0.537 (0.655)	Data Time 0.313 (0.167)	Loss 2.7445 (2.6377)	Entropy 0.62737 (0.62919)	Top-1 acc 57.812 (60.358)	Top-5 acc 81.641 (81.500)	lr 0.01190
Train [62][2730/3239]	Time 0.269 (0.658)	Data Time 0.001 (0.170)	Loss 2.7297 (2.6377)	Entropy 0.62733 (0.62918)	Top-1 acc 59.766 (60.357)	Top-5 acc 80.469 (81.500)	lr 0.01190
Train [62][2740/3239]	Time 0.256 (0.657)	Data Time 0.001 (0.169)	Loss 2.5738 (2.6378)	Entropy 0.62739 (0.62918)	Top-1 acc 63.281 (60.356)	Top-5 acc 81.641 (81.495)	lr 0.01190
Train [62][2750/3239]	Time 0.264 (0.663)	Data Time 0.002 (0.174)	Loss 2.7285 (2.6378)	Entropy 0.62713 (0.62917)	Top-1 acc 56.641 (60.355)	Top-5 acc 83.203 (81.496)	lr 0.01190
Train [62][2760/3239]	Time 0.355 (0.677)	Data Time 0.006 (0.176)	Loss 2.7262 (2.6381)	Entropy 0.62747 (0.62916)	Top-1 acc 59.766 (60.353)	Top-5 acc 80.469 (81.491)	lr 0.01189
Train [62][2770/3239]	Time 0.235 (0.676)	Data Time 0.002 (0.175)	Loss 2.7425 (2.6381)	Entropy 0.62715 (0.62916)	Top-1 acc 61.328 (60.357)	Top-5 acc 80.078 (81.491)	lr 0.01189
Train [62][2780/3239]	Time 0.235 (0.675)	Data Time 0.001 (0.175)	Loss 2.7836 (2.6382)	Entropy 0.62668 (0.62915)	Top-1 acc 56.250 (60.353)	Top-5 acc 79.297 (81.489)	lr 0.01189
Train [62][2790/3239]	Time 0.232 (0.674)	Data Time 0.002 (0.174)	Loss 2.9178 (2.6385)	Entropy 0.62660 (0.62914)	Top-1 acc 53.906 (60.349)	Top-5 acc 77.344 (81.483)	lr 0.01189
Train [62][2800/3239]	Time 0.248 (0.673)	Data Time 0.001 (0.173)	Loss 2.7914 (2.6387)	Entropy 0.62674 (0.62913)	Top-1 acc 61.328 (60.345)	Top-5 acc 77.734 (81.478)	lr 0.01189
Train [62][2810/3239]	Time 1.453 (0.673)	Data Time 1.203 (0.173)	Loss 2.8268 (2.6388)	Entropy 0.62678 (0.62912)	Top-1 acc 55.859 (60.345)	Top-5 acc 79.297 (81.477)	lr 0.01189
Train [62][2820/3239]	Time 0.290 (0.676)	Data Time 0.001 (0.176)	Loss 2.8385 (2.6386)	Entropy 0.62659 (0.62912)	Top-1 acc 55.859 (60.348)	Top-5 acc 75.000 (81.479)	lr 0.01189
Train [62][2830/3239]	Time 0.259 (0.675)	Data Time 0.001 (0.176)	Loss 2.5697 (2.6386)	Entropy 0.62638 (0.62911)	Top-1 acc 62.891 (60.348)	Top-5 acc 83.203 (81.479)	lr 0.01189
Train [62][2840/3239]	Time 0.255 (0.674)	Data Time 0.001 (0.175)	Loss 2.6394 (2.6386)	Entropy 0.62627 (0.62910)	Top-1 acc 61.719 (60.347)	Top-5 acc 80.859 (81.480)	lr 0.01189
Train [62][2850/3239]	Time 0.397 (0.677)	Data Time 0.001 (0.178)	Loss 2.5820 (2.6386)	Entropy 0.62657 (0.62909)	Top-1 acc 61.719 (60.345)	Top-5 acc 81.641 (81.481)	lr 0.01189
Train [62][2860/3239]	Time 0.245 (0.677)	Data Time 0.001 (0.178)	Loss 2.6990 (2.6387)	Entropy 0.62686 (0.62908)	Top-1 acc 60.938 (60.342)	Top-5 acc 80.859 (81.476)	lr 0.01188
Train [62][2870/3239]	Time 0.245 (0.676)	Data Time 0.002 (0.178)	Loss 2.7743 (2.6390)	Entropy 0.62697 (0.62907)	Top-1 acc 55.078 (60.334)	Top-5 acc 80.859 (81.473)	lr 0.01188
Train [62][2880/3239]	Time 0.325 (0.678)	Data Time 0.092 (0.180)	Loss 2.6045 (2.6390)	Entropy 0.62683 (0.62906)	Top-1 acc 58.594 (60.330)	Top-5 acc 81.641 (81.473)	lr 0.01188
Train [62][2890/3239]	Time 0.251 (0.678)	Data Time 0.002 (0.180)	Loss 2.6120 (2.6390)	Entropy 0.62665 (0.62906)	Top-1 acc 61.328 (60.330)	Top-5 acc 83.203 (81.473)	lr 0.01188
Train [62][2900/3239]	Time 0.266 (0.677)	Data Time 0.001 (0.179)	Loss 2.4747 (2.6390)	Entropy 0.62630 (0.62905)	Top-1 acc 65.234 (60.329)	Top-5 acc 84.766 (81.473)	lr 0.01188
Train [62][2910/3239]	Time 0.241 (0.680)	Data Time 0.001 (0.182)	Loss 2.4824 (2.6388)	Entropy 0.62618 (0.62904)	Top-1 acc 66.406 (60.333)	Top-5 acc 83.203 (81.477)	lr 0.01188
Train [62][2920/3239]	Time 0.387 (0.679)	Data Time 0.001 (0.181)	Loss 2.6572 (2.6389)	Entropy 0.62647 (0.62903)	Top-1 acc 58.203 (60.332)	Top-5 acc 81.250 (81.475)	lr 0.01188
Train [62][2930/3239]	Time 0.251 (0.678)	Data Time 0.001 (0.181)	Loss 2.7046 (2.6388)	Entropy 0.62640 (0.62902)	Top-1 acc 59.766 (60.333)	Top-5 acc 80.078 (81.477)	lr 0.01188
Train [62][2940/3239]	Time 0.243 (0.679)	Data Time 0.001 (0.181)	Loss 2.4771 (2.6386)	Entropy 0.62640 (0.62901)	Top-1 acc 62.891 (60.341)	Top-5 acc 84.375 (81.481)	lr 0.01188
Train [62][2950/3239]	Time 0.238 (0.680)	Data Time 0.001 (0.183)	Loss 2.4445 (2.6384)	Entropy 0.62688 (0.62900)	Top-1 acc 60.156 (60.343)	Top-5 acc 86.719 (81.484)	lr 0.01188
Train [62][2960/3239]	Time 0.292 (0.679)	Data Time 0.003 (0.182)	Loss 2.4751 (2.6383)	Entropy 0.62710 (0.62900)	Top-1 acc 67.578 (60.347)	Top-5 acc 82.422 (81.485)	lr 0.01187
Train [62][2970/3239]	Time 0.253 (0.680)	Data Time 0.001 (0.184)	Loss 2.4001 (2.6382)	Entropy 0.62696 (0.62899)	Top-1 acc 68.359 (60.353)	Top-5 acc 83.594 (81.486)	lr 0.01187
Train [62][2980/3239]	Time 3.280 (0.683)	Data Time 2.987 (0.187)	Loss 2.8709 (2.6382)	Entropy 0.62714 (0.62898)	Top-1 acc 55.469 (60.348)	Top-5 acc 76.562 (81.484)	lr 0.01187
Train [62][2990/3239]	Time 0.238 (0.683)	Data Time 0.001 (0.187)	Loss 2.6232 (2.6384)	Entropy 0.62752 (0.62898)	Top-1 acc 59.766 (60.346)	Top-5 acc 80.469 (81.480)	lr 0.01187
Train [62][3000/3239]	Time 0.251 (0.683)	Data Time 0.001 (0.187)	Loss 2.7268 (2.6385)	Entropy 0.62746 (0.62897)	Top-1 acc 55.859 (60.339)	Top-5 acc 78.906 (81.477)	lr 0.01187
Train [62][3010/3239]	Time 0.368 (0.689)	Data Time 0.001 (0.193)	Loss 2.5506 (2.6385)	Entropy 0.62722 (0.62897)	Top-1 acc 60.547 (60.337)	Top-5 acc 82.422 (81.476)	lr 0.01187
Train [62][3020/3239]	Time 0.248 (0.690)	Data Time 0.001 (0.194)	Loss 2.5633 (2.6386)	Entropy 0.62710 (0.62896)	Top-1 acc 60.938 (60.336)	Top-5 acc 83.984 (81.475)	lr 0.01187
Train [62][3030/3239]	Time 0.254 (0.689)	Data Time 0.001 (0.194)	Loss 2.6495 (2.6385)	Entropy 0.62724 (0.62896)	Top-1 acc 64.062 (60.336)	Top-5 acc 79.297 (81.476)	lr 0.01187
Train [62][3040/3239]	Time 7.675 (0.695)	Data Time 7.393 (0.200)	Loss 2.6573 (2.6385)	Entropy 0.62727 (0.62895)	Top-1 acc 62.500 (60.339)	Top-5 acc 82.422 (81.477)	lr 0.01187
Train [62][3050/3239]	Time 0.251 (0.696)	Data Time 0.001 (0.201)	Loss 2.4877 (2.6385)	Entropy 0.62705 (0.62894)	Top-1 acc 62.500 (60.340)	Top-5 acc 83.203 (81.474)	lr 0.01186
Train [62][3060/3239]	Time 0.294 (0.695)	Data Time 0.002 (0.200)	Loss 2.7006 (2.6384)	Entropy 0.62692 (0.62894)	Top-1 acc 56.250 (60.341)	Top-5 acc 82.812 (81.477)	lr 0.01186
Train [62][3070/3239]	Time 0.224 (0.697)	Data Time 0.001 (0.203)	Loss 2.7278 (2.6386)	Entropy 0.62702 (0.62893)	Top-1 acc 58.984 (60.335)	Top-5 acc 81.641 (81.474)	lr 0.01186
Train [62][3080/3239]	Time 0.330 (0.701)	Data Time 0.001 (0.207)	Loss 2.7139 (2.6385)	Entropy 0.62693 (0.62892)	Top-1 acc 58.594 (60.338)	Top-5 acc 80.078 (81.474)	lr 0.01186
Train [62][3090/3239]	Time 0.265 (0.700)	Data Time 0.001 (0.206)	Loss 2.3150 (2.6385)	Entropy 0.62664 (0.62892)	Top-1 acc 67.188 (60.338)	Top-5 acc 86.328 (81.473)	lr 0.01186
Train [62][3100/3239]	Time 0.251 (0.701)	Data Time 0.001 (0.207)	Loss 2.6787 (2.6388)	Entropy 0.62718 (0.62891)	Top-1 acc 60.156 (60.331)	Top-5 acc 77.734 (81.468)	lr 0.01186
Train [62][3110/3239]	Time 0.295 (0.706)	Data Time 0.001 (0.213)	Loss 2.5118 (2.6388)	Entropy 0.62709 (0.62891)	Top-1 acc 63.672 (60.333)	Top-5 acc 84.375 (81.469)	lr 0.01186
Train [62][3120/3239]	Time 0.256 (0.705)	Data Time 0.001 (0.212)	Loss 2.6549 (2.6386)	Entropy 0.62715 (0.62890)	Top-1 acc 61.719 (60.337)	Top-5 acc 81.250 (81.477)	lr 0.01186
Train [62][3130/3239]	Time 0.251 (0.707)	Data Time 0.001 (0.214)	Loss 2.6537 (2.6386)	Entropy 0.62735 (0.62889)	Top-1 acc 62.109 (60.339)	Top-5 acc 80.859 (81.477)	lr 0.01186
Train [62][3140/3239]	Time 2.105 (0.711)	Data Time 1.846 (0.218)	Loss 2.4952 (2.6383)	Entropy 0.62732 (0.62889)	Top-1 acc 67.188 (60.344)	Top-5 acc 84.375 (81.482)	lr 0.01186
Train [62][3150/3239]	Time 0.255 (0.710)	Data Time 0.001 (0.217)	Loss 2.5610 (2.6382)	Entropy 0.62711 (0.62888)	Top-1 acc 63.281 (60.345)	Top-5 acc 81.250 (81.482)	lr 0.01185
Train [62][3160/3239]	Time 0.233 (0.710)	Data Time 0.001 (0.218)	Loss 2.6863 (2.6381)	Entropy 0.62681 (0.62888)	Top-1 acc 59.375 (60.345)	Top-5 acc 81.641 (81.485)	lr 0.01185
Train [62][3170/3239]	Time 0.291 (0.716)	Data Time 0.001 (0.224)	Loss 2.7449 (2.6383)	Entropy 0.62685 (0.62887)	Top-1 acc 59.375 (60.340)	Top-5 acc 80.859 (81.482)	lr 0.01185
Train [62][3180/3239]	Time 0.237 (0.716)	Data Time 0.000 (0.224)	Loss 2.6227 (2.6383)	Entropy 0.62653 (0.62887)	Top-1 acc 59.766 (60.340)	Top-5 acc 80.078 (81.482)	lr 0.01185
Train [62][3190/3239]	Time 0.250 (0.715)	Data Time 0.000 (0.224)	Loss 2.5185 (2.6382)	Entropy 0.62691 (0.62886)	Top-1 acc 66.406 (60.341)	Top-5 acc 82.422 (81.482)	lr 0.01185
Train [62][3200/3239]	Time 10.916 (0.721)	Data Time 10.656 (0.230)	Loss 2.7103 (2.6384)	Entropy 0.62694 (0.62885)	Top-1 acc 58.203 (60.341)	Top-5 acc 80.078 (81.481)	lr 0.01185
Train [62][3210/3239]	Time 0.232 (0.721)	Data Time 0.000 (0.230)	Loss 2.7596 (2.6385)	Entropy 0.62700 (0.62885)	Top-1 acc 58.984 (60.341)	Top-5 acc 76.953 (81.477)	lr 0.01185
Train [62][3220/3239]	Time 0.248 (0.720)	Data Time 0.000 (0.230)	Loss 2.5656 (2.6384)	Entropy 0.62726 (0.62884)	Top-1 acc 62.500 (60.342)	Top-5 acc 82.422 (81.479)	lr 0.01185
Train [62][3230/3239]	Time 0.217 (0.720)	Data Time 0.000 (0.230)	Loss 2.8740 (2.6383)	Entropy 0.62720 (0.62884)	Top-1 acc 56.641 (60.344)	Top-5 acc 76.172 (81.481)	lr 0.01185
Train [62][3239/3239]	Time 0.848 (0.722)	Data Time 0.000 (0.232)	Loss 2.9721 (2.6383)	Entropy 0.62696 (0.62883)	Top-1 acc 49.383 (60.342)	Top-5 acc 70.370 (81.483)	lr 0.01185
==========Valid [62/120]	loss 1.427	top-1 acc 67.525 (67.769)	top-5 acc 87.439	Train top-1 60.342	top-5 81.483	Entropy 0.62696	Latency-None: 0.000ms	Flops: 537.50M
Train [63][0/3239]	Time 38.899 (38.899)	Data Time 37.888 (37.888)	Loss 2.6874 (2.6874)	Entropy 0.62691 (0.62691)	Top-1 acc 59.766 (59.766)	Top-5 acc 76.562 (76.562)	lr 0.01185
Train [63][10/3239]	Time 0.234 (3.964)	Data Time 0.001 (3.446)	Loss 2.5917 (2.7307)	Entropy 0.62714 (0.62700)	Top-1 acc 60.156 (58.203)	Top-5 acc 82.812 (80.149)	lr 0.01184
Train [63][20/3239]	Time 0.267 (2.274)	Data Time 0.001 (1.806)	Loss 2.6346 (2.7045)	Entropy 0.62710 (0.62709)	Top-1 acc 63.672 (59.003)	Top-5 acc 81.641 (80.469)	lr 0.01184
Train [63][30/3239]	Time 0.249 (1.695)	Data Time 0.001 (1.224)	Loss 2.4975 (2.6659)	Entropy 0.62678 (0.62705)	Top-1 acc 64.844 (59.740)	Top-5 acc 83.594 (81.326)	lr 0.01184
Train [63][40/3239]	Time 0.256 (1.391)	Data Time 0.001 (0.926)	Loss 2.4898 (2.6430)	Entropy 0.62674 (0.62700)	Top-1 acc 62.891 (60.423)	Top-5 acc 83.203 (81.688)	lr 0.01184
Train [63][50/3239]	Time 0.257 (1.212)	Data Time 0.001 (0.745)	Loss 2.6097 (2.6314)	Entropy 0.62693 (0.62696)	Top-1 acc 61.328 (60.654)	Top-5 acc 82.031 (81.832)	lr 0.01184
Train [63][60/3239]	Time 0.224 (1.086)	Data Time 0.001 (0.623)	Loss 2.7553 (2.6279)	Entropy 0.62678 (0.62694)	Top-1 acc 61.719 (60.912)	Top-5 acc 80.469 (81.839)	lr 0.01184
Train [63][70/3239]	Time 0.357 (0.997)	Data Time 0.001 (0.535)	Loss 2.5673 (2.6346)	Entropy 0.62662 (0.62693)	Top-1 acc 62.500 (60.552)	Top-5 acc 81.641 (81.602)	lr 0.01184
Train [63][80/3239]	Time 0.327 (0.928)	Data Time 0.001 (0.469)	Loss 2.8186 (2.6281)	Entropy 0.62672 (0.62690)	Top-1 acc 53.516 (60.740)	Top-5 acc 77.344 (81.776)	lr 0.01184
Train [63][90/3239]	Time 0.253 (0.870)	Data Time 0.001 (0.418)	Loss 2.5235 (2.6240)	Entropy 0.62681 (0.62688)	Top-1 acc 64.453 (60.946)	Top-5 acc 82.031 (81.821)	lr 0.01184
Train [63][100/3239]	Time 0.244 (0.851)	Data Time 0.001 (0.399)	Loss 2.4489 (2.6173)	Entropy 0.62676 (0.62687)	Top-1 acc 65.234 (61.015)	Top-5 acc 85.547 (81.911)	lr 0.01184
Train [63][110/3239]	Time 0.253 (0.811)	Data Time 0.001 (0.363)	Loss 2.6732 (2.6148)	Entropy 0.62661 (0.62685)	Top-1 acc 57.422 (60.969)	Top-5 acc 82.031 (82.014)	lr 0.01183
Train [63][120/3239]	Time 0.274 (0.781)	Data Time 0.001 (0.333)	Loss 2.7206 (2.6173)	Entropy 0.62650 (0.62683)	Top-1 acc 62.109 (60.921)	Top-5 acc 81.250 (81.960)	lr 0.01183
Train [63][130/3239]	Time 0.368 (0.756)	Data Time 0.001 (0.308)	Loss 2.6589 (2.6211)	Entropy 0.62621 (0.62680)	Top-1 acc 59.375 (60.878)	Top-5 acc 78.906 (81.843)	lr 0.01183
Train [63][140/3239]	Time 0.321 (0.749)	Data Time 0.001 (0.302)	Loss 2.8808 (2.6200)	Entropy 0.62605 (0.62676)	Top-1 acc 52.734 (60.949)	Top-5 acc 77.344 (81.868)	lr 0.01183
Train [63][150/3239]	Time 0.243 (0.728)	Data Time 0.001 (0.282)	Loss 2.5064 (2.6198)	Entropy 0.62605 (0.62671)	Top-1 acc 66.016 (60.922)	Top-5 acc 84.766 (81.897)	lr 0.01183
Train [63][160/3239]	Time 0.239 (0.709)	Data Time 0.001 (0.265)	Loss 2.5915 (2.6192)	Entropy 0.62603 (0.62667)	Top-1 acc 61.328 (60.896)	Top-5 acc 83.984 (81.905)	lr 0.01183
Train [63][170/3239]	Time 0.240 (0.708)	Data Time 0.001 (0.263)	Loss 2.5020 (2.6178)	Entropy 0.62565 (0.62663)	Top-1 acc 69.531 (60.979)	Top-5 acc 83.984 (81.919)	lr 0.01183
Train [63][180/3239]	Time 0.339 (0.892)	Data Time 0.003 (0.249)	Loss 2.6217 (2.6165)	Entropy 0.62566 (0.62657)	Top-1 acc 63.281 (61.022)	Top-5 acc 80.859 (81.917)	lr 0.01183
Train [63][190/3239]	Time 0.231 (0.868)	Data Time 0.002 (0.236)	Loss 2.4902 (2.6133)	Entropy 0.62558 (0.62652)	Top-1 acc 66.016 (61.099)	Top-5 acc 83.594 (81.996)	lr 0.01183
Train [63][200/3239]	Time 0.247 (0.845)	Data Time 0.002 (0.224)	Loss 2.5545 (2.6108)	Entropy 0.62520 (0.62646)	Top-1 acc 65.234 (61.153)	Top-5 acc 81.641 (82.027)	lr 0.01183
Train [63][210/3239]	Time 0.245 (0.825)	Data Time 0.002 (0.214)	Loss 2.7181 (2.6112)	Entropy 0.62535 (0.62641)	Top-1 acc 58.203 (61.149)	Top-5 acc 79.297 (81.996)	lr 0.01182
Train [63][220/3239]	Time 0.239 (0.807)	Data Time 0.001 (0.204)	Loss 2.9765 (2.6120)	Entropy 0.62559 (0.62636)	Top-1 acc 55.078 (61.153)	Top-5 acc 73.828 (81.973)	lr 0.01182
Train [63][230/3239]	Time 0.386 (0.792)	Data Time 0.003 (0.195)	Loss 2.4062 (2.6095)	Entropy 0.62580 (0.62633)	Top-1 acc 65.625 (61.220)	Top-5 acc 85.938 (82.024)	lr 0.01182
Train [63][240/3239]	Time 0.262 (0.779)	Data Time 0.001 (0.187)	Loss 2.4773 (2.6085)	Entropy 0.62553 (0.62630)	Top-1 acc 64.062 (61.250)	Top-5 acc 82.812 (82.036)	lr 0.01182
Train [63][250/3239]	Time 0.246 (0.765)	Data Time 0.001 (0.180)	Loss 2.6401 (2.6082)	Entropy 0.62548 (0.62627)	Top-1 acc 58.984 (61.219)	Top-5 acc 81.641 (82.023)	lr 0.01182
Train [63][260/3239]	Time 0.215 (0.752)	Data Time 0.001 (0.173)	Loss 2.6357 (2.6099)	Entropy 0.62545 (0.62624)	Top-1 acc 59.766 (61.168)	Top-5 acc 82.812 (82.012)	lr 0.01182
Train [63][270/3239]	Time 0.295 (0.741)	Data Time 0.003 (0.167)	Loss 2.6755 (2.6102)	Entropy 0.62507 (0.62620)	Top-1 acc 62.109 (61.144)	Top-5 acc 78.906 (81.985)	lr 0.01182
Train [63][280/3239]	Time 0.229 (0.731)	Data Time 0.001 (0.161)	Loss 2.6079 (2.6109)	Entropy 0.62520 (0.62616)	Top-1 acc 63.672 (61.125)	Top-5 acc 83.203 (81.962)	lr 0.01182
Train [63][290/3239]	Time 0.236 (0.721)	Data Time 0.001 (0.155)	Loss 2.5340 (2.6116)	Entropy 0.62504 (0.62613)	Top-1 acc 61.719 (61.099)	Top-5 acc 83.594 (81.936)	lr 0.01182
Train [63][300/3239]	Time 0.355 (0.711)	Data Time 0.001 (0.150)	Loss 2.4996 (2.6129)	Entropy 0.62476 (0.62609)	Top-1 acc 62.891 (61.045)	Top-5 acc 83.203 (81.917)	lr 0.01182
Train [63][310/3239]	Time 0.233 (0.708)	Data Time 0.001 (0.152)	Loss 2.5192 (2.6156)	Entropy 0.62462 (0.62605)	Top-1 acc 62.891 (60.999)	Top-5 acc 86.328 (81.869)	lr 0.01181
Train [63][320/3239]	Time 0.243 (0.701)	Data Time 0.002 (0.148)	Loss 2.7457 (2.6168)	Entropy 0.62499 (0.62601)	Top-1 acc 57.812 (60.961)	Top-5 acc 80.469 (81.855)	lr 0.01181
Train [63][330/3239]	Time 0.248 (0.697)	Data Time 0.001 (0.147)	Loss 2.5788 (2.6154)	Entropy 0.62495 (0.62598)	Top-1 acc 64.453 (60.988)	Top-5 acc 82.812 (81.894)	lr 0.01181
Train [63][340/3239]	Time 0.245 (0.709)	Data Time 0.001 (0.163)	Loss 2.5182 (2.6156)	Entropy 0.62507 (0.62595)	Top-1 acc 61.719 (60.989)	Top-5 acc 83.984 (81.898)	lr 0.01181
Train [63][350/3239]	Time 0.242 (0.702)	Data Time 0.001 (0.159)	Loss 2.5760 (2.6157)	Entropy 0.62502 (0.62593)	Top-1 acc 56.641 (60.985)	Top-5 acc 84.766 (81.897)	lr 0.01181
Train [63][360/3239]	Time 0.237 (0.695)	Data Time 0.001 (0.154)	Loss 2.6883 (2.6156)	Entropy 0.62522 (0.62590)	Top-1 acc 58.594 (60.979)	Top-5 acc 79.688 (81.897)	lr 0.01181
Train [63][370/3239]	Time 0.284 (0.697)	Data Time 0.001 (0.159)	Loss 2.7306 (2.6172)	Entropy 0.62536 (0.62588)	Top-1 acc 58.594 (60.907)	Top-5 acc 79.297 (81.861)	lr 0.01181
Train [63][380/3239]	Time 0.263 (0.693)	Data Time 0.001 (0.158)	Loss 2.8330 (2.6174)	Entropy 0.62534 (0.62587)	Top-1 acc 56.250 (60.926)	Top-5 acc 75.781 (81.847)	lr 0.01181
Train [63][390/3239]	Time 0.237 (0.699)	Data Time 0.001 (0.167)	Loss 2.7785 (2.6175)	Entropy 0.62498 (0.62585)	Top-1 acc 58.984 (60.937)	Top-5 acc 78.125 (81.845)	lr 0.01181
Train [63][400/3239]	Time 3.754 (0.701)	Data Time 3.512 (0.172)	Loss 2.6089 (2.6177)	Entropy 0.62506 (0.62583)	Top-1 acc 59.375 (60.939)	Top-5 acc 84.375 (81.853)	lr 0.01181
Train [63][410/3239]	Time 0.245 (0.704)	Data Time 0.001 (0.177)	Loss 2.5601 (2.6174)	Entropy 0.62471 (0.62581)	Top-1 acc 62.500 (60.942)	Top-5 acc 80.078 (81.860)	lr 0.01180
Train [63][420/3239]	Time 0.261 (0.699)	Data Time 0.001 (0.175)	Loss 2.7144 (2.6164)	Entropy 0.62433 (0.62578)	Top-1 acc 58.203 (60.989)	Top-5 acc 80.469 (81.869)	lr 0.01180
Train [63][430/3239]	Time 0.247 (0.695)	Data Time 0.001 (0.173)	Loss 2.7194 (2.6177)	Entropy 0.62425 (0.62575)	Top-1 acc 57.422 (60.930)	Top-5 acc 79.297 (81.845)	lr 0.01180
Train [63][440/3239]	Time 0.296 (0.706)	Data Time 0.001 (0.186)	Loss 2.4940 (2.6176)	Entropy 0.62448 (0.62572)	Top-1 acc 64.453 (60.944)	Top-5 acc 83.594 (81.837)	lr 0.01180
Train [63][450/3239]	Time 0.261 (0.702)	Data Time 0.001 (0.184)	Loss 2.9315 (2.6187)	Entropy 0.62446 (0.62569)	Top-1 acc 50.000 (60.892)	Top-5 acc 77.344 (81.813)	lr 0.01180
Train [63][460/3239]	Time 0.348 (0.697)	Data Time 0.002 (0.181)	Loss 2.6308 (2.6189)	Entropy 0.62462 (0.62566)	Top-1 acc 58.984 (60.893)	Top-5 acc 82.422 (81.817)	lr 0.01180
Train [63][470/3239]	Time 0.255 (0.699)	Data Time 0.001 (0.185)	Loss 2.4943 (2.6193)	Entropy 0.62498 (0.62564)	Top-1 acc 64.453 (60.899)	Top-5 acc 82.812 (81.810)	lr 0.01180
Train [63][480/3239]	Time 0.259 (0.708)	Data Time 0.001 (0.195)	Loss 2.6431 (2.6198)	Entropy 0.62493 (0.62563)	Top-1 acc 58.594 (60.883)	Top-5 acc 82.422 (81.801)	lr 0.01180
Train [63][490/3239]	Time 0.237 (0.703)	Data Time 0.001 (0.192)	Loss 2.5900 (2.6198)	Entropy 0.62467 (0.62561)	Top-1 acc 62.500 (60.893)	Top-5 acc 82.422 (81.816)	lr 0.01180
Train [63][500/3239]	Time 0.227 (0.704)	Data Time 0.001 (0.195)	Loss 2.4427 (2.6192)	Entropy 0.62446 (0.62559)	Top-1 acc 63.281 (60.907)	Top-5 acc 85.938 (81.828)	lr 0.01180
Train [63][510/3239]	Time 0.234 (0.713)	Data Time 0.001 (0.205)	Loss 2.4999 (2.6175)	Entropy 0.62452 (0.62557)	Top-1 acc 64.844 (60.938)	Top-5 acc 83.594 (81.871)	lr 0.01179
Train [63][520/3239]	Time 0.249 (0.707)	Data Time 0.001 (0.201)	Loss 2.7004 (2.6180)	Entropy 0.62441 (0.62555)	Top-1 acc 58.203 (60.927)	Top-5 acc 82.031 (81.869)	lr 0.01179
Train [63][530/3239]	Time 0.649 (0.704)	Data Time 0.301 (0.200)	Loss 2.4885 (2.6170)	Entropy 0.62424 (0.62553)	Top-1 acc 62.109 (60.965)	Top-5 acc 84.375 (81.875)	lr 0.01179
Train [63][540/3239]	Time 0.250 (0.717)	Data Time 0.001 (0.214)	Loss 2.5307 (2.6169)	Entropy 0.62462 (0.62551)	Top-1 acc 62.891 (60.940)	Top-5 acc 82.812 (81.869)	lr 0.01179
Train [63][550/3239]	Time 0.248 (0.715)	Data Time 0.001 (0.213)	Loss 2.7731 (2.6172)	Entropy 0.62447 (0.62549)	Top-1 acc 58.203 (60.936)	Top-5 acc 78.516 (81.864)	lr 0.01179
Train [63][560/3239]	Time 0.802 (0.710)	Data Time 0.525 (0.210)	Loss 2.7327 (2.6174)	Entropy 0.62412 (0.62547)	Top-1 acc 57.812 (60.934)	Top-5 acc 79.688 (81.859)	lr 0.01179
Train [63][570/3239]	Time 0.251 (0.724)	Data Time 0.001 (0.225)	Loss 2.5711 (2.6162)	Entropy 0.62391 (0.62545)	Top-1 acc 61.328 (60.975)	Top-5 acc 82.422 (81.892)	lr 0.01179
Train [63][580/3239]	Time 0.267 (0.719)	Data Time 0.001 (0.221)	Loss 2.5814 (2.6164)	Entropy 0.62417 (0.62542)	Top-1 acc 60.938 (60.964)	Top-5 acc 80.859 (81.870)	lr 0.01179
Train [63][590/3239]	Time 0.250 (0.713)	Data Time 0.001 (0.217)	Loss 2.5809 (2.6169)	Entropy 0.62406 (0.62540)	Top-1 acc 56.641 (60.923)	Top-5 acc 82.422 (81.865)	lr 0.01179
Train [63][600/3239]	Time 0.262 (0.730)	Data Time 0.001 (0.235)	Loss 2.5808 (2.6188)	Entropy 0.62422 (0.62538)	Top-1 acc 59.375 (60.896)	Top-5 acc 81.250 (81.820)	lr 0.01179
Train [63][610/3239]	Time 0.249 (0.725)	Data Time 0.001 (0.232)	Loss 2.8528 (2.6189)	Entropy 0.62432 (0.62536)	Top-1 acc 52.734 (60.876)	Top-5 acc 77.344 (81.810)	lr 0.01178
Train [63][620/3239]	Time 0.347 (0.721)	Data Time 0.001 (0.229)	Loss 2.6640 (2.6196)	Entropy 0.62393 (0.62535)	Top-1 acc 62.891 (60.888)	Top-5 acc 80.859 (81.796)	lr 0.01178
Train [63][630/3239]	Time 0.236 (0.716)	Data Time 0.001 (0.225)	Loss 2.4472 (2.6191)	Entropy 0.62409 (0.62532)	Top-1 acc 65.625 (60.882)	Top-5 acc 84.766 (81.817)	lr 0.01178
Train [63][640/3239]	Time 0.225 (0.731)	Data Time 0.001 (0.241)	Loss 2.7041 (2.6181)	Entropy 0.62408 (0.62530)	Top-1 acc 58.203 (60.909)	Top-5 acc 80.859 (81.844)	lr 0.01178
Train [63][650/3239]	Time 0.245 (0.727)	Data Time 0.001 (0.238)	Loss 2.5220 (2.6182)	Entropy 0.62402 (0.62528)	Top-1 acc 66.406 (60.917)	Top-5 acc 83.594 (81.839)	lr 0.01178
Train [63][660/3239]	Time 0.233 (0.722)	Data Time 0.001 (0.234)	Loss 2.6459 (2.6187)	Entropy 0.62386 (0.62526)	Top-1 acc 59.766 (60.916)	Top-5 acc 80.859 (81.830)	lr 0.01178
Train [63][670/3239]	Time 0.230 (0.734)	Data Time 0.001 (0.247)	Loss 2.6668 (2.6185)	Entropy 0.62395 (0.62524)	Top-1 acc 60.938 (60.918)	Top-5 acc 82.031 (81.827)	lr 0.01178
Train [63][680/3239]	Time 0.232 (0.731)	Data Time 0.001 (0.245)	Loss 2.8406 (2.6187)	Entropy 0.62419 (0.62523)	Top-1 acc 58.594 (60.913)	Top-5 acc 79.297 (81.819)	lr 0.01178
Train [63][690/3239]	Time 0.339 (0.726)	Data Time 0.001 (0.241)	Loss 2.6556 (2.6189)	Entropy 0.62432 (0.62521)	Top-1 acc 57.031 (60.903)	Top-5 acc 78.906 (81.809)	lr 0.01178
Train [63][700/3239]	Time 0.228 (0.738)	Data Time 0.001 (0.254)	Loss 2.7535 (2.6192)	Entropy 0.62406 (0.62520)	Top-1 acc 56.641 (60.905)	Top-5 acc 80.469 (81.812)	lr 0.01178
Train [63][710/3239]	Time 0.249 (0.740)	Data Time 0.002 (0.258)	Loss 2.5638 (2.6190)	Entropy 0.62408 (0.62518)	Top-1 acc 62.891 (60.907)	Top-5 acc 81.641 (81.812)	lr 0.01177
Train [63][720/3239]	Time 0.230 (0.735)	Data Time 0.001 (0.254)	Loss 2.8130 (2.6199)	Entropy 0.62440 (0.62517)	Top-1 acc 54.688 (60.870)	Top-5 acc 75.781 (81.796)	lr 0.01177
Train [63][730/3239]	Time 0.220 (0.744)	Data Time 0.001 (0.264)	Loss 2.4005 (2.6198)	Entropy 0.62441 (0.62516)	Top-1 acc 65.625 (60.877)	Top-5 acc 85.938 (81.794)	lr 0.01177
Train [63][740/3239]	Time 0.221 (0.739)	Data Time 0.001 (0.260)	Loss 2.6059 (2.6199)	Entropy 0.62434 (0.62515)	Top-1 acc 60.156 (60.873)	Top-5 acc 79.688 (81.791)	lr 0.01177
Train [63][750/3239]	Time 0.232 (0.737)	Data Time 0.001 (0.258)	Loss 2.5798 (2.6213)	Entropy 0.62451 (0.62514)	Top-1 acc 60.938 (60.833)	Top-5 acc 82.031 (81.764)	lr 0.01177
Train [63][760/3239]	Time 0.251 (0.747)	Data Time 0.001 (0.269)	Loss 2.7534 (2.6216)	Entropy 0.62483 (0.62513)	Top-1 acc 58.203 (60.825)	Top-5 acc 78.516 (81.748)	lr 0.01177
Train [63][770/3239]	Time 0.247 (0.748)	Data Time 0.002 (0.271)	Loss 2.4762 (2.6224)	Entropy 0.62465 (0.62512)	Top-1 acc 66.797 (60.807)	Top-5 acc 85.547 (81.735)	lr 0.01177
Train [63][780/3239]	Time 0.318 (0.744)	Data Time 0.001 (0.268)	Loss 2.7024 (2.6226)	Entropy 0.62510 (0.62512)	Top-1 acc 63.281 (60.807)	Top-5 acc 78.516 (81.734)	lr 0.01177
Train [63][790/3239]	Time 0.230 (0.742)	Data Time 0.001 (0.267)	Loss 2.4482 (2.6235)	Entropy 0.62480 (0.62512)	Top-1 acc 69.141 (60.795)	Top-5 acc 85.938 (81.716)	lr 0.01177
Train [63][800/3239]	Time 0.228 (0.756)	Data Time 0.001 (0.282)	Loss 2.5174 (2.6233)	Entropy 0.62487 (0.62511)	Top-1 acc 64.453 (60.789)	Top-5 acc 83.203 (81.715)	lr 0.01177
Train [63][810/3239]	Time 0.238 (0.752)	Data Time 0.001 (0.279)	Loss 2.7684 (2.6242)	Entropy 0.62452 (0.62511)	Top-1 acc 57.422 (60.761)	Top-5 acc 78.125 (81.702)	lr 0.01176
Train [63][820/3239]	Time 0.252 (0.748)	Data Time 0.001 (0.276)	Loss 2.7198 (2.6238)	Entropy 0.62481 (0.62510)	Top-1 acc 59.375 (60.779)	Top-5 acc 77.344 (81.710)	lr 0.01176
Train [63][830/3239]	Time 0.349 (0.808)	Data Time 0.043 (0.293)	Loss 2.5726 (2.6234)	Entropy 0.62464 (0.62510)	Top-1 acc 61.719 (60.783)	Top-5 acc 81.641 (81.719)	lr 0.01176
Train [63][840/3239]	Time 0.235 (0.804)	Data Time 0.002 (0.289)	Loss 2.5395 (2.6239)	Entropy 0.62476 (0.62509)	Top-1 acc 66.016 (60.769)	Top-5 acc 83.984 (81.712)	lr 0.01176
Train [63][850/3239]	Time 0.328 (0.800)	Data Time 0.002 (0.286)	Loss 2.7881 (2.6241)	Entropy 0.62506 (0.62509)	Top-1 acc 54.297 (60.753)	Top-5 acc 78.906 (81.713)	lr 0.01176
Train [63][860/3239]	Time 0.240 (0.796)	Data Time 0.001 (0.283)	Loss 2.5337 (2.6243)	Entropy 0.62533 (0.62509)	Top-1 acc 63.281 (60.752)	Top-5 acc 81.250 (81.710)	lr 0.01176
Train [63][870/3239]	Time 0.235 (0.791)	Data Time 0.001 (0.279)	Loss 2.6366 (2.6234)	Entropy 0.62549 (0.62509)	Top-1 acc 59.766 (60.762)	Top-5 acc 82.422 (81.728)	lr 0.01176
Train [63][880/3239]	Time 0.242 (0.787)	Data Time 0.001 (0.276)	Loss 2.8462 (2.6240)	Entropy 0.62569 (0.62510)	Top-1 acc 54.688 (60.749)	Top-5 acc 75.391 (81.707)	lr 0.01176
Train [63][890/3239]	Time 0.284 (0.783)	Data Time 0.001 (0.273)	Loss 2.5189 (2.6243)	Entropy 0.62568 (0.62511)	Top-1 acc 62.891 (60.742)	Top-5 acc 83.203 (81.708)	lr 0.01176
Train [63][900/3239]	Time 0.266 (0.781)	Data Time 0.001 (0.272)	Loss 2.6220 (2.6248)	Entropy 0.62591 (0.62511)	Top-1 acc 58.594 (60.726)	Top-5 acc 82.812 (81.700)	lr 0.01176
Train [63][910/3239]	Time 0.249 (0.779)	Data Time 0.002 (0.271)	Loss 2.5045 (2.6245)	Entropy 0.62592 (0.62512)	Top-1 acc 64.062 (60.727)	Top-5 acc 84.375 (81.706)	lr 0.01175
Train [63][920/3239]	Time 0.260 (0.779)	Data Time 0.001 (0.272)	Loss 2.8022 (2.6244)	Entropy 0.62605 (0.62513)	Top-1 acc 58.203 (60.725)	Top-5 acc 80.078 (81.712)	lr 0.01175
Train [63][930/3239]	Time 0.241 (0.789)	Data Time 0.001 (0.283)	Loss 2.4693 (2.6242)	Entropy 0.62610 (0.62514)	Top-1 acc 64.844 (60.724)	Top-5 acc 83.594 (81.708)	lr 0.01175
Train [63][940/3239]	Time 0.385 (0.789)	Data Time 0.001 (0.283)	Loss 2.7292 (2.6242)	Entropy 0.62641 (0.62515)	Top-1 acc 60.938 (60.724)	Top-5 acc 80.859 (81.712)	lr 0.01175
Train [63][950/3239]	Time 0.246 (0.790)	Data Time 0.001 (0.285)	Loss 2.7132 (2.6245)	Entropy 0.62671 (0.62517)	Top-1 acc 57.812 (60.721)	Top-5 acc 80.859 (81.708)	lr 0.01175
Train [63][960/3239]	Time 0.988 (0.793)	Data Time 0.699 (0.289)	Loss 2.6136 (2.6248)	Entropy 0.62645 (0.62518)	Top-1 acc 61.328 (60.704)	Top-5 acc 80.859 (81.698)	lr 0.01175
Train [63][970/3239]	Time 0.240 (0.796)	Data Time 0.001 (0.293)	Loss 2.5588 (2.6246)	Entropy 0.62596 (0.62520)	Top-1 acc 58.984 (60.707)	Top-5 acc 81.250 (81.700)	lr 0.01175
Train [63][980/3239]	Time 0.248 (0.797)	Data Time 0.001 (0.294)	Loss 2.7045 (2.6242)	Entropy 0.62625 (0.62520)	Top-1 acc 61.719 (60.722)	Top-5 acc 80.078 (81.709)	lr 0.01175
Train [63][990/3239]	Time 6.659 (0.800)	Data Time 6.415 (0.298)	Loss 2.5968 (2.6238)	Entropy 0.62629 (0.62521)	Top-1 acc 62.891 (60.741)	Top-5 acc 83.594 (81.718)	lr 0.01175
Train [63][1000/3239]	Time 0.235 (0.804)	Data Time 0.001 (0.303)	Loss 2.5542 (2.6241)	Entropy 0.62641 (0.62523)	Top-1 acc 61.328 (60.739)	Top-5 acc 82.031 (81.713)	lr 0.01174
Train [63][1010/3239]	Time 2.826 (0.804)	Data Time 2.478 (0.303)	Loss 2.8103 (2.6241)	Entropy 0.62622 (0.62524)	Top-1 acc 59.375 (60.740)	Top-5 acc 79.297 (81.713)	lr 0.01174
Train [63][1020/3239]	Time 0.249 (0.800)	Data Time 0.002 (0.300)	Loss 2.4491 (2.6243)	Entropy 0.62624 (0.62525)	Top-1 acc 65.625 (60.743)	Top-5 acc 83.594 (81.701)	lr 0.01174
Train [63][1030/3239]	Time 0.251 (0.810)	Data Time 0.001 (0.311)	Loss 2.5560 (2.6240)	Entropy 0.62617 (0.62526)	Top-1 acc 63.672 (60.746)	Top-5 acc 81.641 (81.703)	lr 0.01174
Train [63][1040/3239]	Time 0.262 (0.808)	Data Time 0.001 (0.309)	Loss 2.7299 (2.6239)	Entropy 0.62622 (0.62527)	Top-1 acc 56.641 (60.753)	Top-5 acc 80.469 (81.703)	lr 0.01174
Train [63][1050/3239]	Time 0.230 (0.809)	Data Time 0.001 (0.311)	Loss 2.6904 (2.6240)	Entropy 0.62599 (0.62527)	Top-1 acc 57.812 (60.751)	Top-5 acc 79.688 (81.701)	lr 0.01174
Train [63][1060/3239]	Time 2.693 (0.819)	Data Time 2.462 (0.322)	Loss 2.8263 (2.6245)	Entropy 0.62600 (0.62528)	Top-1 acc 56.641 (60.734)	Top-5 acc 75.781 (81.690)	lr 0.01174
Train [63][1070/3239]	Time 0.267 (0.818)	Data Time 0.001 (0.322)	Loss 2.6352 (2.6244)	Entropy 0.62607 (0.62529)	Top-1 acc 63.281 (60.734)	Top-5 acc 80.078 (81.686)	lr 0.01174
Train [63][1080/3239]	Time 0.240 (0.816)	Data Time 0.001 (0.320)	Loss 2.8854 (2.6251)	Entropy 0.62575 (0.62529)	Top-1 acc 53.516 (60.717)	Top-5 acc 76.172 (81.673)	lr 0.01174
Train [63][1090/3239]	Time 0.230 (0.829)	Data Time 0.001 (0.334)	Loss 2.6761 (2.6250)	Entropy 0.62593 (0.62530)	Top-1 acc 58.594 (60.709)	Top-5 acc 81.250 (81.671)	lr 0.01174
Train [63][1100/3239]	Time 3.158 (0.827)	Data Time 2.846 (0.333)	Loss 2.5518 (2.6250)	Entropy 0.62628 (0.62530)	Top-1 acc 61.719 (60.708)	Top-5 acc 84.766 (81.666)	lr 0.01173
Train [63][1110/3239]	Time 0.255 (0.825)	Data Time 0.002 (0.331)	Loss 2.6605 (2.6252)	Entropy 0.62625 (0.62531)	Top-1 acc 58.594 (60.700)	Top-5 acc 80.469 (81.664)	lr 0.01173
Train [63][1120/3239]	Time 13.616 (0.835)	Data Time 13.335 (0.342)	Loss 2.6325 (2.6252)	Entropy 0.62604 (0.62532)	Top-1 acc 57.422 (60.701)	Top-5 acc 83.203 (81.667)	lr 0.01173
Train [63][1130/3239]	Time 0.233 (0.834)	Data Time 0.001 (0.341)	Loss 2.6188 (2.6253)	Entropy 0.62612 (0.62533)	Top-1 acc 62.891 (60.698)	Top-5 acc 84.375 (81.670)	lr 0.01173
Train [63][1140/3239]	Time 1.251 (0.831)	Data Time 1.012 (0.340)	Loss 2.6148 (2.6255)	Entropy 0.62643 (0.62533)	Top-1 acc 61.719 (60.699)	Top-5 acc 82.422 (81.668)	lr 0.01173
Train [63][1150/3239]	Time 0.239 (0.831)	Data Time 0.001 (0.340)	Loss 2.7287 (2.6253)	Entropy 0.62607 (0.62534)	Top-1 acc 56.250 (60.711)	Top-5 acc 80.859 (81.673)	lr 0.01173
Train [63][1160/3239]	Time 0.239 (0.846)	Data Time 0.001 (0.356)	Loss 2.3783 (2.6252)	Entropy 0.62574 (0.62535)	Top-1 acc 65.625 (60.710)	Top-5 acc 85.938 (81.672)	lr 0.01173
Train [63][1170/3239]	Time 0.323 (0.843)	Data Time 0.001 (0.353)	Loss 2.6258 (2.6256)	Entropy 0.62640 (0.62535)	Top-1 acc 58.984 (60.697)	Top-5 acc 81.641 (81.660)	lr 0.01173
Train [63][1180/3239]	Time 0.233 (0.839)	Data Time 0.001 (0.350)	Loss 2.6459 (2.6258)	Entropy 0.62655 (0.62536)	Top-1 acc 59.766 (60.693)	Top-5 acc 81.250 (81.663)	lr 0.01173
Train [63][1190/3239]	Time 0.243 (0.855)	Data Time 0.001 (0.367)	Loss 2.3627 (2.6258)	Entropy 0.62685 (0.62537)	Top-1 acc 65.625 (60.689)	Top-5 acc 85.938 (81.657)	lr 0.01173
Train [63][1200/3239]	Time 0.254 (0.852)	Data Time 0.002 (0.364)	Loss 2.8279 (2.6260)	Entropy 0.62704 (0.62539)	Top-1 acc 55.469 (60.684)	Top-5 acc 78.516 (81.653)	lr 0.01172
Train [63][1210/3239]	Time 0.240 (0.850)	Data Time 0.001 (0.362)	Loss 2.5934 (2.6259)	Entropy 0.62665 (0.62540)	Top-1 acc 60.156 (60.694)	Top-5 acc 82.031 (81.657)	lr 0.01172
Train [63][1220/3239]	Time 0.234 (0.868)	Data Time 0.001 (0.381)	Loss 2.6297 (2.6262)	Entropy 0.62628 (0.62541)	Top-1 acc 62.500 (60.696)	Top-5 acc 81.641 (81.657)	lr 0.01172
Train [63][1230/3239]	Time 0.249 (0.864)	Data Time 0.001 (0.378)	Loss 2.7898 (2.6267)	Entropy 0.62632 (0.62542)	Top-1 acc 56.250 (60.690)	Top-5 acc 80.859 (81.651)	lr 0.01172
Train [63][1240/3239]	Time 0.341 (0.865)	Data Time 0.001 (0.379)	Loss 2.5014 (2.6265)	Entropy 0.62625 (0.62542)	Top-1 acc 66.016 (60.700)	Top-5 acc 84.766 (81.657)	lr 0.01172
Train [63][1250/3239]	Time 4.530 (0.881)	Data Time 4.286 (0.396)	Loss 2.8719 (2.6270)	Entropy 0.62626 (0.62543)	Top-1 acc 55.078 (60.693)	Top-5 acc 74.219 (81.646)	lr 0.01172
Train [63][1260/3239]	Time 0.247 (0.877)	Data Time 0.001 (0.393)	Loss 2.4743 (2.6270)	Entropy 0.62612 (0.62543)	Top-1 acc 62.891 (60.688)	Top-5 acc 83.984 (81.648)	lr 0.01172
Train [63][1270/3239]	Time 0.242 (0.879)	Data Time 0.001 (0.395)	Loss 2.6443 (2.6267)	Entropy 0.62596 (0.62544)	Top-1 acc 58.203 (60.691)	Top-5 acc 84.766 (81.661)	lr 0.01172
Train [63][1280/3239]	Time 18.443 (0.890)	Data Time 18.194 (0.406)	Loss 2.4444 (2.6267)	Entropy 0.62571 (0.62544)	Top-1 acc 64.062 (60.685)	Top-5 acc 85.156 (81.658)	lr 0.01172
Train [63][1290/3239]	Time 0.248 (0.889)	Data Time 0.001 (0.406)	Loss 2.8768 (2.6267)	Entropy 0.62562 (0.62544)	Top-1 acc 57.031 (60.685)	Top-5 acc 77.734 (81.659)	lr 0.01172
Train [63][1300/3239]	Time 0.247 (0.892)	Data Time 0.001 (0.409)	Loss 2.4895 (2.6262)	Entropy 0.62593 (0.62545)	Top-1 acc 63.281 (60.697)	Top-5 acc 82.422 (81.667)	lr 0.01171
Train [63][1310/3239]	Time 0.244 (0.888)	Data Time 0.001 (0.406)	Loss 2.5235 (2.6260)	Entropy 0.62610 (0.62545)	Top-1 acc 63.281 (60.707)	Top-5 acc 83.594 (81.671)	lr 0.01171
Train [63][1320/3239]	Time 0.228 (0.896)	Data Time 0.001 (0.415)	Loss 2.5490 (2.6265)	Entropy 0.62601 (0.62545)	Top-1 acc 62.891 (60.696)	Top-5 acc 83.203 (81.663)	lr 0.01171
Train [63][1330/3239]	Time 0.337 (0.893)	Data Time 0.001 (0.412)	Loss 2.6845 (2.6261)	Entropy 0.62608 (0.62546)	Top-1 acc 58.594 (60.692)	Top-5 acc 82.031 (81.671)	lr 0.01171
Train [63][1340/3239]	Time 0.228 (0.895)	Data Time 0.001 (0.415)	Loss 2.4280 (2.6261)	Entropy 0.62541 (0.62546)	Top-1 acc 65.625 (60.692)	Top-5 acc 83.984 (81.673)	lr 0.01171
Train [63][1350/3239]	Time 0.248 (0.906)	Data Time 0.001 (0.426)	Loss 2.5138 (2.6259)	Entropy 0.62571 (0.62546)	Top-1 acc 64.062 (60.696)	Top-5 acc 84.375 (81.685)	lr 0.01171
Train [63][1360/3239]	Time 0.229 (0.902)	Data Time 0.001 (0.423)	Loss 2.6751 (2.6263)	Entropy 0.62568 (0.62546)	Top-1 acc 60.938 (60.690)	Top-5 acc 82.031 (81.684)	lr 0.01171
Train [63][1370/3239]	Time 0.322 (0.902)	Data Time 0.001 (0.423)	Loss 2.6196 (2.6260)	Entropy 0.62550 (0.62547)	Top-1 acc 61.719 (60.692)	Top-5 acc 80.859 (81.692)	lr 0.01171
Train [63][1380/3239]	Time 0.222 (0.910)	Data Time 0.001 (0.432)	Loss 2.7041 (2.6257)	Entropy 0.62552 (0.62547)	Top-1 acc 58.594 (60.699)	Top-5 acc 80.859 (81.696)	lr 0.01171
Train [63][1390/3239]	Time 0.254 (0.907)	Data Time 0.001 (0.429)	Loss 2.6893 (2.6254)	Entropy 0.62526 (0.62547)	Top-1 acc 55.859 (60.697)	Top-5 acc 80.078 (81.698)	lr 0.01171
Train [63][1400/3239]	Time 0.319 (0.910)	Data Time 0.001 (0.433)	Loss 2.8733 (2.6259)	Entropy 0.62481 (0.62546)	Top-1 acc 55.078 (60.694)	Top-5 acc 77.734 (81.696)	lr 0.01170
Train [63][1410/3239]	Time 1.750 (0.917)	Data Time 1.474 (0.440)	Loss 2.5045 (2.6263)	Entropy 0.62460 (0.62546)	Top-1 acc 66.406 (60.684)	Top-5 acc 83.203 (81.691)	lr 0.01170
Train [63][1420/3239]	Time 0.236 (0.913)	Data Time 0.001 (0.437)	Loss 2.6512 (2.6262)	Entropy 0.62429 (0.62545)	Top-1 acc 58.594 (60.686)	Top-5 acc 80.859 (81.689)	lr 0.01170
Train [63][1430/3239]	Time 0.231 (0.916)	Data Time 0.001 (0.440)	Loss 2.5020 (2.6257)	Entropy 0.62433 (0.62544)	Top-1 acc 64.453 (60.700)	Top-5 acc 83.203 (81.697)	lr 0.01170
Train [63][1440/3239]	Time 13.800 (0.922)	Data Time 13.557 (0.446)	Loss 2.7589 (2.6253)	Entropy 0.62404 (0.62544)	Top-1 acc 56.250 (60.700)	Top-5 acc 79.688 (81.705)	lr 0.01170
Train [63][1450/3239]	Time 0.230 (0.922)	Data Time 0.001 (0.447)	Loss 2.6093 (2.6250)	Entropy 0.62432 (0.62543)	Top-1 acc 63.281 (60.704)	Top-5 acc 82.422 (81.707)	lr 0.01170
Train [63][1460/3239]	Time 0.247 (0.925)	Data Time 0.001 (0.450)	Loss 2.4239 (2.6250)	Entropy 0.62443 (0.62542)	Top-1 acc 64.844 (60.709)	Top-5 acc 83.984 (81.708)	lr 0.01170
Train [63][1470/3239]	Time 0.231 (0.921)	Data Time 0.001 (0.447)	Loss 2.6465 (2.6252)	Entropy 0.62460 (0.62541)	Top-1 acc 59.375 (60.709)	Top-5 acc 82.812 (81.705)	lr 0.01170
Train [63][1480/3239]	Time 0.230 (0.929)	Data Time 0.001 (0.455)	Loss 2.7470 (2.6247)	Entropy 0.62462 (0.62541)	Top-1 acc 56.641 (60.722)	Top-5 acc 80.859 (81.714)	lr 0.01170
Train [63][1490/3239]	Time 0.340 (0.951)	Data Time 0.002 (0.452)	Loss 2.8505 (2.6247)	Entropy 0.62447 (0.62540)	Top-1 acc 58.203 (60.728)	Top-5 acc 76.562 (81.710)	lr 0.01170
Train [63][1500/3239]	Time 0.265 (0.948)	Data Time 0.002 (0.449)	Loss 2.6194 (2.6244)	Entropy 0.62474 (0.62540)	Top-1 acc 62.500 (60.734)	Top-5 acc 80.469 (81.717)	lr 0.01169
Train [63][1510/3239]	Time 0.252 (0.944)	Data Time 0.002 (0.446)	Loss 2.5059 (2.6240)	Entropy 0.62457 (0.62539)	Top-1 acc 64.844 (60.749)	Top-5 acc 82.812 (81.723)	lr 0.01169
Train [63][1520/3239]	Time 0.240 (0.941)	Data Time 0.001 (0.444)	Loss 2.6682 (2.6242)	Entropy 0.62497 (0.62539)	Top-1 acc 55.859 (60.741)	Top-5 acc 82.422 (81.724)	lr 0.01169
Train [63][1530/3239]	Time 0.229 (0.938)	Data Time 0.001 (0.441)	Loss 2.7582 (2.6242)	Entropy 0.62557 (0.62539)	Top-1 acc 55.859 (60.736)	Top-5 acc 77.734 (81.722)	lr 0.01169
Train [63][1540/3239]	Time 0.291 (0.941)	Data Time 0.001 (0.445)	Loss 2.7573 (2.6242)	Entropy 0.62567 (0.62539)	Top-1 acc 59.375 (60.740)	Top-5 acc 80.078 (81.723)	lr 0.01169
Train [63][1550/3239]	Time 0.264 (0.939)	Data Time 0.002 (0.443)	Loss 2.6398 (2.6241)	Entropy 0.62538 (0.62539)	Top-1 acc 57.422 (60.743)	Top-5 acc 81.641 (81.726)	lr 0.01169
Train [63][1560/3239]	Time 0.330 (0.943)	Data Time 0.001 (0.447)	Loss 2.4608 (2.6243)	Entropy 0.62537 (0.62539)	Top-1 acc 62.500 (60.738)	Top-5 acc 85.547 (81.725)	lr 0.01169
Train [63][1570/3239]	Time 3.897 (0.948)	Data Time 3.607 (0.453)	Loss 2.7502 (2.6247)	Entropy 0.62537 (0.62539)	Top-1 acc 55.078 (60.730)	Top-5 acc 79.688 (81.719)	lr 0.01169
Train [63][1580/3239]	Time 0.251 (0.946)	Data Time 0.001 (0.451)	Loss 2.5977 (2.6246)	Entropy 0.62549 (0.62539)	Top-1 acc 62.891 (60.737)	Top-5 acc 82.812 (81.719)	lr 0.01169
Train [63][1590/3239]	Time 0.246 (0.949)	Data Time 0.002 (0.455)	Loss 2.8930 (2.6250)	Entropy 0.62562 (0.62539)	Top-1 acc 53.125 (60.725)	Top-5 acc 76.562 (81.714)	lr 0.01169
Train [63][1600/3239]	Time 11.258 (0.953)	Data Time 11.011 (0.459)	Loss 2.8085 (2.6251)	Entropy 0.62526 (0.62539)	Top-1 acc 58.203 (60.717)	Top-5 acc 78.125 (81.709)	lr 0.01168
Train [63][1610/3239]	Time 0.231 (0.952)	Data Time 0.001 (0.459)	Loss 2.6304 (2.6255)	Entropy 0.62498 (0.62539)	Top-1 acc 59.375 (60.713)	Top-5 acc 82.812 (81.703)	lr 0.01168
Train [63][1620/3239]	Time 0.254 (0.957)	Data Time 0.001 (0.464)	Loss 2.7076 (2.6255)	Entropy 0.62508 (0.62539)	Top-1 acc 60.156 (60.710)	Top-5 acc 80.078 (81.702)	lr 0.01168
Train [63][1630/3239]	Time 0.236 (0.954)	Data Time 0.001 (0.462)	Loss 2.5689 (2.6253)	Entropy 0.62506 (0.62538)	Top-1 acc 62.109 (60.713)	Top-5 acc 84.375 (81.704)	lr 0.01168
Train [63][1640/3239]	Time 0.278 (0.961)	Data Time 0.001 (0.469)	Loss 2.5955 (2.6253)	Entropy 0.62521 (0.62538)	Top-1 acc 63.281 (60.718)	Top-5 acc 80.859 (81.703)	lr 0.01168
Train [63][1650/3239]	Time 0.345 (0.958)	Data Time 0.001 (0.466)	Loss 2.5793 (2.6255)	Entropy 0.62540 (0.62538)	Top-1 acc 60.156 (60.712)	Top-5 acc 81.250 (81.696)	lr 0.01168
Train [63][1660/3239]	Time 0.252 (0.961)	Data Time 0.002 (0.470)	Loss 2.5661 (2.6254)	Entropy 0.62567 (0.62538)	Top-1 acc 58.984 (60.713)	Top-5 acc 82.031 (81.697)	lr 0.01168
Train [63][1670/3239]	Time 0.378 (0.967)	Data Time 0.135 (0.477)	Loss 2.5818 (2.6250)	Entropy 0.62532 (0.62538)	Top-1 acc 64.062 (60.724)	Top-5 acc 84.766 (81.707)	lr 0.01168
Train [63][1680/3239]	Time 0.230 (0.964)	Data Time 0.001 (0.474)	Loss 2.6183 (2.6247)	Entropy 0.62553 (0.62538)	Top-1 acc 62.109 (60.731)	Top-5 acc 78.516 (81.710)	lr 0.01168
Train [63][1690/3239]	Time 0.235 (0.967)	Data Time 0.001 (0.477)	Loss 2.6697 (2.6244)	Entropy 0.62560 (0.62539)	Top-1 acc 56.641 (60.735)	Top-5 acc 78.906 (81.715)	lr 0.01168
Train [63][1700/3239]	Time 0.245 (0.974)	Data Time 0.001 (0.484)	Loss 3.1247 (2.6249)	Entropy 0.62557 (0.62539)	Top-1 acc 51.562 (60.725)	Top-5 acc 71.875 (81.706)	lr 0.01167
Train [63][1710/3239]	Time 0.287 (0.973)	Data Time 0.001 (0.484)	Loss 2.4356 (2.6248)	Entropy 0.62573 (0.62539)	Top-1 acc 65.234 (60.734)	Top-5 acc 85.938 (81.708)	lr 0.01167
Train [63][1720/3239]	Time 0.344 (0.975)	Data Time 0.002 (0.486)	Loss 2.4130 (2.6246)	Entropy 0.62571 (0.62539)	Top-1 acc 66.016 (60.735)	Top-5 acc 87.109 (81.713)	lr 0.01167
Train [63][1730/3239]	Time 7.482 (0.980)	Data Time 7.235 (0.492)	Loss 2.3897 (2.6247)	Entropy 0.62586 (0.62539)	Top-1 acc 68.359 (60.737)	Top-5 acc 85.547 (81.708)	lr 0.01167
Train [63][1740/3239]	Time 0.233 (0.980)	Data Time 0.001 (0.491)	Loss 2.8859 (2.6250)	Entropy 0.62577 (0.62539)	Top-1 acc 53.125 (60.728)	Top-5 acc 76.562 (81.701)	lr 0.01167
Train [63][1750/3239]	Time 0.236 (0.982)	Data Time 0.001 (0.494)	Loss 2.5144 (2.6255)	Entropy 0.62586 (0.62540)	Top-1 acc 64.844 (60.712)	Top-5 acc 84.375 (81.689)	lr 0.01167
Train [63][1760/3239]	Time 6.409 (0.982)	Data Time 6.168 (0.495)	Loss 2.4811 (2.6256)	Entropy 0.62592 (0.62540)	Top-1 acc 66.406 (60.709)	Top-5 acc 82.031 (81.684)	lr 0.01167
Train [63][1770/3239]	Time 0.240 (0.985)	Data Time 0.001 (0.498)	Loss 2.6224 (2.6253)	Entropy 0.62616 (0.62540)	Top-1 acc 55.859 (60.715)	Top-5 acc 84.766 (81.694)	lr 0.01167
Train [63][1780/3239]	Time 0.238 (0.989)	Data Time 0.001 (0.502)	Loss 2.7260 (2.6253)	Entropy 0.62595 (0.62541)	Top-1 acc 57.812 (60.718)	Top-5 acc 79.297 (81.692)	lr 0.01167
Train [63][1790/3239]	Time 0.236 (0.986)	Data Time 0.001 (0.499)	Loss 2.6765 (2.6253)	Entropy 0.62611 (0.62541)	Top-1 acc 59.375 (60.718)	Top-5 acc 81.250 (81.693)	lr 0.01167
Train [63][1800/3239]	Time 0.253 (0.994)	Data Time 0.001 (0.508)	Loss 2.6171 (2.6252)	Entropy 0.62574 (0.62541)	Top-1 acc 62.500 (60.725)	Top-5 acc 82.422 (81.697)	lr 0.01166
Train [63][1810/3239]	Time 0.251 (0.992)	Data Time 0.001 (0.506)	Loss 2.4018 (2.6252)	Entropy 0.62571 (0.62541)	Top-1 acc 67.188 (60.726)	Top-5 acc 83.203 (81.695)	lr 0.01166
Train [63][1820/3239]	Time 0.226 (0.994)	Data Time 0.001 (0.509)	Loss 2.4776 (2.6249)	Entropy 0.62560 (0.62542)	Top-1 acc 60.156 (60.727)	Top-5 acc 84.766 (81.705)	lr 0.01166
Train [63][1830/3239]	Time 1.511 (0.999)	Data Time 1.218 (0.514)	Loss 2.5520 (2.6249)	Entropy 0.62590 (0.62542)	Top-1 acc 62.500 (60.726)	Top-5 acc 82.422 (81.705)	lr 0.01166
Train [63][1840/3239]	Time 0.279 (0.999)	Data Time 0.002 (0.515)	Loss 2.6733 (2.6252)	Entropy 0.62593 (0.62542)	Top-1 acc 57.812 (60.720)	Top-5 acc 80.859 (81.701)	lr 0.01166
Train [63][1850/3239]	Time 0.230 (1.002)	Data Time 0.001 (0.518)	Loss 3.0233 (2.6254)	Entropy 0.62576 (0.62542)	Top-1 acc 56.641 (60.718)	Top-5 acc 76.953 (81.697)	lr 0.01166
Train [63][1860/3239]	Time 0.249 (1.006)	Data Time 0.001 (0.522)	Loss 2.6047 (2.6254)	Entropy 0.62578 (0.62543)	Top-1 acc 56.641 (60.723)	Top-5 acc 84.375 (81.700)	lr 0.01166
Train [63][1870/3239]	Time 0.288 (1.006)	Data Time 0.001 (0.523)	Loss 2.7348 (2.6256)	Entropy 0.62628 (0.62543)	Top-1 acc 58.594 (60.716)	Top-5 acc 75.781 (81.695)	lr 0.01166
Train [63][1880/3239]	Time 0.354 (1.006)	Data Time 0.001 (0.523)	Loss 2.6327 (2.6254)	Entropy 0.62675 (0.62543)	Top-1 acc 60.156 (60.713)	Top-5 acc 80.078 (81.700)	lr 0.01166
Train [63][1890/3239]	Time 9.941 (1.011)	Data Time 9.677 (0.528)	Loss 2.4623 (2.6252)	Entropy 0.62697 (0.62544)	Top-1 acc 60.938 (60.720)	Top-5 acc 86.719 (81.706)	lr 0.01166
Train [63][1900/3239]	Time 0.263 (1.013)	Data Time 0.001 (0.531)	Loss 2.3341 (2.6248)	Entropy 0.62720 (0.62545)	Top-1 acc 67.578 (60.725)	Top-5 acc 89.062 (81.716)	lr 0.01165
Train [63][1910/3239]	Time 0.234 (1.013)	Data Time 0.001 (0.531)	Loss 2.6142 (2.6249)	Entropy 0.62720 (0.62546)	Top-1 acc 61.328 (60.723)	Top-5 acc 80.469 (81.715)	lr 0.01165
Train [63][1920/3239]	Time 13.070 (1.017)	Data Time 12.836 (0.535)	Loss 2.7507 (2.6254)	Entropy 0.62709 (0.62547)	Top-1 acc 56.641 (60.714)	Top-5 acc 78.906 (81.707)	lr 0.01165
Train [63][1930/3239]	Time 0.245 (1.020)	Data Time 0.001 (0.539)	Loss 2.6822 (2.6256)	Entropy 0.62709 (0.62547)	Top-1 acc 58.594 (60.715)	Top-5 acc 80.859 (81.707)	lr 0.01165
Train [63][1940/3239]	Time 0.241 (1.021)	Data Time 0.001 (0.540)	Loss 2.6819 (2.6255)	Entropy 0.62687 (0.62548)	Top-1 acc 57.422 (60.717)	Top-5 acc 81.641 (81.707)	lr 0.01165
Train [63][1950/3239]	Time 0.337 (1.018)	Data Time 0.001 (0.537)	Loss 2.5033 (2.6255)	Entropy 0.62691 (0.62549)	Top-1 acc 64.062 (60.715)	Top-5 acc 85.547 (81.706)	lr 0.01165
Train [63][1960/3239]	Time 14.685 (1.031)	Data Time 14.434 (0.551)	Loss 2.7427 (2.6259)	Entropy 0.62714 (0.62550)	Top-1 acc 55.469 (60.696)	Top-5 acc 81.250 (81.701)	lr 0.01165
Train [63][1970/3239]	Time 0.280 (1.028)	Data Time 0.001 (0.548)	Loss 2.5743 (2.6259)	Entropy 0.62723 (0.62551)	Top-1 acc 62.109 (60.692)	Top-5 acc 83.203 (81.704)	lr 0.01165
Train [63][1980/3239]	Time 0.236 (1.026)	Data Time 0.001 (0.546)	Loss 2.5623 (2.6259)	Entropy 0.62752 (0.62552)	Top-1 acc 60.547 (60.690)	Top-5 acc 82.031 (81.704)	lr 0.01165
Train [63][1990/3239]	Time 1.983 (1.032)	Data Time 1.715 (0.553)	Loss 2.6068 (2.6260)	Entropy 0.62738 (0.62553)	Top-1 acc 58.984 (60.688)	Top-5 acc 82.812 (81.706)	lr 0.01165
Train [63][2000/3239]	Time 0.229 (1.035)	Data Time 0.001 (0.556)	Loss 2.6583 (2.6260)	Entropy 0.62757 (0.62554)	Top-1 acc 60.156 (60.688)	Top-5 acc 78.906 (81.704)	lr 0.01164
Train [63][2010/3239]	Time 0.242 (1.035)	Data Time 0.001 (0.557)	Loss 2.5439 (2.6259)	Entropy 0.62743 (0.62554)	Top-1 acc 62.891 (60.690)	Top-5 acc 84.766 (81.707)	lr 0.01164
Train [63][2020/3239]	Time 0.226 (1.038)	Data Time 0.001 (0.560)	Loss 2.5604 (2.6259)	Entropy 0.62687 (0.62555)	Top-1 acc 64.062 (60.687)	Top-5 acc 83.984 (81.709)	lr 0.01164
Train [63][2030/3239]	Time 0.233 (1.043)	Data Time 0.001 (0.565)	Loss 2.6980 (2.6259)	Entropy 0.62674 (0.62556)	Top-1 acc 57.031 (60.688)	Top-5 acc 79.688 (81.707)	lr 0.01164
Train [63][2040/3239]	Time 0.358 (1.041)	Data Time 0.001 (0.563)	Loss 2.3979 (2.6258)	Entropy 0.62704 (0.62557)	Top-1 acc 69.141 (60.692)	Top-5 acc 87.500 (81.711)	lr 0.01164
Train [63][2050/3239]	Time 0.274 (1.046)	Data Time 0.001 (0.569)	Loss 2.5613 (2.6257)	Entropy 0.62709 (0.62557)	Top-1 acc 63.672 (60.696)	Top-5 acc 82.812 (81.712)	lr 0.01164
Train [63][2060/3239]	Time 0.233 (1.051)	Data Time 0.001 (0.573)	Loss 2.6956 (2.6257)	Entropy 0.62722 (0.62558)	Top-1 acc 62.109 (60.695)	Top-5 acc 83.203 (81.711)	lr 0.01164
Train [63][2070/3239]	Time 0.238 (1.051)	Data Time 0.001 (0.574)	Loss 2.5312 (2.6257)	Entropy 0.62751 (0.62559)	Top-1 acc 64.844 (60.696)	Top-5 acc 83.594 (81.712)	lr 0.01164
Train [63][2080/3239]	Time 15.705 (1.056)	Data Time 15.439 (0.579)	Loss 2.7366 (2.6258)	Entropy 0.62763 (0.62560)	Top-1 acc 59.375 (60.698)	Top-5 acc 82.031 (81.713)	lr 0.01164
Train [63][2090/3239]	Time 0.237 (1.059)	Data Time 0.001 (0.582)	Loss 2.7239 (2.6257)	Entropy 0.62766 (0.62561)	Top-1 acc 58.594 (60.703)	Top-5 acc 78.516 (81.713)	lr 0.01164
Train [63][2100/3239]	Time 0.248 (1.062)	Data Time 0.001 (0.586)	Loss 2.5028 (2.6254)	Entropy 0.62786 (0.62562)	Top-1 acc 61.328 (60.708)	Top-5 acc 83.984 (81.719)	lr 0.01163
Train [63][2110/3239]	Time 0.336 (1.059)	Data Time 0.001 (0.583)	Loss 2.6509 (2.6254)	Entropy 0.62705 (0.62563)	Top-1 acc 60.938 (60.710)	Top-5 acc 80.469 (81.716)	lr 0.01163
Train [63][2120/3239]	Time 0.237 (1.067)	Data Time 0.001 (0.591)	Loss 2.6075 (2.6252)	Entropy 0.62672 (0.62563)	Top-1 acc 60.938 (60.712)	Top-5 acc 83.203 (81.726)	lr 0.01163
Train [63][2130/3239]	Time 0.282 (1.065)	Data Time 0.002 (0.590)	Loss 2.6860 (2.6256)	Entropy 0.62717 (0.62564)	Top-1 acc 57.031 (60.701)	Top-5 acc 80.078 (81.717)	lr 0.01163
Train [63][2140/3239]	Time 0.414 (1.082)	Data Time 0.006 (0.590)	Loss 2.7629 (2.6259)	Entropy 0.62645 (0.62564)	Top-1 acc 54.688 (60.689)	Top-5 acc 80.469 (81.710)	lr 0.01163
Train [63][2150/3239]	Time 0.234 (1.080)	Data Time 0.002 (0.588)	Loss 2.7495 (2.6263)	Entropy 0.62634 (0.62565)	Top-1 acc 58.203 (60.683)	Top-5 acc 78.516 (81.702)	lr 0.01163
Train [63][2160/3239]	Time 0.257 (1.077)	Data Time 0.002 (0.585)	Loss 2.7215 (2.6263)	Entropy 0.62645 (0.62565)	Top-1 acc 58.984 (60.682)	Top-5 acc 80.859 (81.701)	lr 0.01163
Train [63][2170/3239]	Time 0.238 (1.074)	Data Time 0.001 (0.582)	Loss 2.3532 (2.6262)	Entropy 0.62660 (0.62566)	Top-1 acc 69.141 (60.688)	Top-5 acc 87.500 (81.706)	lr 0.01163
Train [63][2180/3239]	Time 0.252 (1.078)	Data Time 0.001 (0.587)	Loss 2.5235 (2.6259)	Entropy 0.62677 (0.62566)	Top-1 acc 64.844 (60.697)	Top-5 acc 82.031 (81.711)	lr 0.01163
Train [63][2190/3239]	Time 0.234 (1.077)	Data Time 0.001 (0.586)	Loss 2.6600 (2.6259)	Entropy 0.62709 (0.62567)	Top-1 acc 60.938 (60.700)	Top-5 acc 79.297 (81.711)	lr 0.01163
Train [63][2200/3239]	Time 0.343 (1.074)	Data Time 0.001 (0.584)	Loss 2.6841 (2.6257)	Entropy 0.62752 (0.62567)	Top-1 acc 58.203 (60.707)	Top-5 acc 78.125 (81.709)	lr 0.01162
Train [63][2210/3239]	Time 0.238 (1.082)	Data Time 0.001 (0.592)	Loss 2.5517 (2.6256)	Entropy 0.62751 (0.62568)	Top-1 acc 62.109 (60.708)	Top-5 acc 82.031 (81.708)	lr 0.01162
Train [63][2220/3239]	Time 0.246 (1.080)	Data Time 0.001 (0.590)	Loss 2.6999 (2.6258)	Entropy 0.62763 (0.62569)	Top-1 acc 59.766 (60.703)	Top-5 acc 78.516 (81.703)	lr 0.01162
Train [63][2230/3239]	Time 0.752 (1.078)	Data Time 0.511 (0.588)	Loss 2.6758 (2.6259)	Entropy 0.62758 (0.62570)	Top-1 acc 58.984 (60.696)	Top-5 acc 80.469 (81.703)	lr 0.01162
Train [63][2240/3239]	Time 22.169 (1.084)	Data Time 21.923 (0.595)	Loss 2.6962 (2.6261)	Entropy 0.62750 (0.62571)	Top-1 acc 60.156 (60.694)	Top-5 acc 80.859 (81.702)	lr 0.01162
Train [63][2250/3239]	Time 0.246 (1.082)	Data Time 0.001 (0.593)	Loss 2.5871 (2.6262)	Entropy 0.62789 (0.62572)	Top-1 acc 63.672 (60.690)	Top-5 acc 82.031 (81.702)	lr 0.01162
Train [63][2260/3239]	Time 0.225 (1.081)	Data Time 0.001 (0.592)	Loss 2.8301 (2.6262)	Entropy 0.62788 (0.62572)	Top-1 acc 56.250 (60.684)	Top-5 acc 76.953 (81.700)	lr 0.01162
Train [63][2270/3239]	Time 0.317 (1.079)	Data Time 0.001 (0.590)	Loss 2.4268 (2.6260)	Entropy 0.62767 (0.62573)	Top-1 acc 67.578 (60.690)	Top-5 acc 85.547 (81.702)	lr 0.01162
Train [63][2280/3239]	Time 0.240 (1.085)	Data Time 0.001 (0.597)	Loss 2.7172 (2.6265)	Entropy 0.62786 (0.62574)	Top-1 acc 55.469 (60.677)	Top-5 acc 80.859 (81.696)	lr 0.01162
Train [63][2290/3239]	Time 0.284 (1.083)	Data Time 0.003 (0.595)	Loss 2.6167 (2.6266)	Entropy 0.62783 (0.62575)	Top-1 acc 57.031 (60.676)	Top-5 acc 80.469 (81.692)	lr 0.01161
Train [63][2300/3239]	Time 0.246 (1.081)	Data Time 0.001 (0.593)	Loss 2.5204 (2.6265)	Entropy 0.62796 (0.62576)	Top-1 acc 61.719 (60.676)	Top-5 acc 85.547 (81.695)	lr 0.01161
Train [63][2310/3239]	Time 0.240 (1.089)	Data Time 0.001 (0.601)	Loss 2.9177 (2.6267)	Entropy 0.62791 (0.62577)	Top-1 acc 51.172 (60.670)	Top-5 acc 76.562 (81.689)	lr 0.01161
Train [63][2320/3239]	Time 0.248 (1.086)	Data Time 0.001 (0.599)	Loss 2.6570 (2.6270)	Entropy 0.62800 (0.62578)	Top-1 acc 61.328 (60.665)	Top-5 acc 83.594 (81.684)	lr 0.01161
Train [63][2330/3239]	Time 0.241 (1.083)	Data Time 0.001 (0.596)	Loss 2.7272 (2.6273)	Entropy 0.62832 (0.62579)	Top-1 acc 56.250 (60.659)	Top-5 acc 77.344 (81.678)	lr 0.01161
Train [63][2340/3239]	Time 0.230 (1.091)	Data Time 0.001 (0.604)	Loss 2.7081 (2.6274)	Entropy 0.62825 (0.62580)	Top-1 acc 60.938 (60.659)	Top-5 acc 78.125 (81.675)	lr 0.01161
Train [63][2350/3239]	Time 0.235 (1.088)	Data Time 0.001 (0.602)	Loss 2.9741 (2.6274)	Entropy 0.62793 (0.62581)	Top-1 acc 49.609 (60.657)	Top-5 acc 76.562 (81.676)	lr 0.01161
Train [63][2360/3239]	Time 0.248 (1.086)	Data Time 0.001 (0.600)	Loss 2.4988 (2.6274)	Entropy 0.62782 (0.62582)	Top-1 acc 62.109 (60.656)	Top-5 acc 83.594 (81.676)	lr 0.01161
Train [63][2370/3239]	Time 0.263 (1.094)	Data Time 0.002 (0.608)	Loss 2.7075 (2.6273)	Entropy 0.62761 (0.62583)	Top-1 acc 61.328 (60.659)	Top-5 acc 77.344 (81.678)	lr 0.01161
Train [63][2380/3239]	Time 0.224 (1.091)	Data Time 0.001 (0.606)	Loss 2.6394 (2.6270)	Entropy 0.62742 (0.62583)	Top-1 acc 59.375 (60.662)	Top-5 acc 81.641 (81.684)	lr 0.01161
Train [63][2390/3239]	Time 0.243 (1.089)	Data Time 0.001 (0.604)	Loss 2.5705 (2.6271)	Entropy 0.62721 (0.62584)	Top-1 acc 62.891 (60.666)	Top-5 acc 82.422 (81.681)	lr 0.01160
Train [63][2400/3239]	Time 20.907 (1.095)	Data Time 20.648 (0.611)	Loss 2.6954 (2.6271)	Entropy 0.62746 (0.62585)	Top-1 acc 59.375 (60.664)	Top-5 acc 80.859 (81.681)	lr 0.01160
Train [63][2410/3239]	Time 0.291 (1.093)	Data Time 0.003 (0.608)	Loss 2.4564 (2.6270)	Entropy 0.62734 (0.62585)	Top-1 acc 64.844 (60.667)	Top-5 acc 84.766 (81.682)	lr 0.01160
Train [63][2420/3239]	Time 0.494 (1.090)	Data Time 0.263 (0.606)	Loss 2.7048 (2.6272)	Entropy 0.62730 (0.62586)	Top-1 acc 60.156 (60.666)	Top-5 acc 78.125 (81.677)	lr 0.01160
Train [63][2430/3239]	Time 0.359 (1.090)	Data Time 0.001 (0.606)	Loss 2.5399 (2.6269)	Entropy 0.62695 (0.62587)	Top-1 acc 61.328 (60.670)	Top-5 acc 83.203 (81.682)	lr 0.01160
Train [63][2440/3239]	Time 0.242 (1.096)	Data Time 0.001 (0.612)	Loss 2.7454 (2.6270)	Entropy 0.62686 (0.62587)	Top-1 acc 56.250 (60.667)	Top-5 acc 80.469 (81.681)	lr 0.01160
Train [63][2450/3239]	Time 0.234 (1.093)	Data Time 0.001 (0.610)	Loss 2.7502 (2.6272)	Entropy 0.62698 (0.62587)	Top-1 acc 57.031 (60.666)	Top-5 acc 78.125 (81.676)	lr 0.01160
Train [63][2460/3239]	Time 0.242 (1.092)	Data Time 0.001 (0.609)	Loss 2.6342 (2.6272)	Entropy 0.62689 (0.62588)	Top-1 acc 62.891 (60.668)	Top-5 acc 80.469 (81.675)	lr 0.01160
Train [63][2470/3239]	Time 0.236 (1.099)	Data Time 0.001 (0.615)	Loss 2.7271 (2.6271)	Entropy 0.62679 (0.62588)	Top-1 acc 60.547 (60.676)	Top-5 acc 79.297 (81.675)	lr 0.01160
Train [63][2480/3239]	Time 0.236 (1.096)	Data Time 0.001 (0.613)	Loss 2.4146 (2.6271)	Entropy 0.62653 (0.62589)	Top-1 acc 68.359 (60.681)	Top-5 acc 86.719 (81.677)	lr 0.01160
Train [63][2490/3239]	Time 0.240 (1.095)	Data Time 0.001 (0.612)	Loss 2.6238 (2.6272)	Entropy 0.62673 (0.62589)	Top-1 acc 59.375 (60.678)	Top-5 acc 81.641 (81.672)	lr 0.01159
Train [63][2500/3239]	Time 0.358 (1.102)	Data Time 0.001 (0.619)	Loss 2.5804 (2.6275)	Entropy 0.62646 (0.62589)	Top-1 acc 63.672 (60.674)	Top-5 acc 80.469 (81.666)	lr 0.01159
Train [63][2510/3239]	Time 0.233 (1.099)	Data Time 0.002 (0.617)	Loss 2.6937 (2.6276)	Entropy 0.62686 (0.62589)	Top-1 acc 60.156 (60.668)	Top-5 acc 80.078 (81.665)	lr 0.01159
Train [63][2520/3239]	Time 0.560 (1.096)	Data Time 0.275 (0.614)	Loss 2.7693 (2.6276)	Entropy 0.62676 (0.62590)	Top-1 acc 59.766 (60.668)	Top-5 acc 78.516 (81.664)	lr 0.01159
Train [63][2530/3239]	Time 0.249 (1.104)	Data Time 0.001 (0.622)	Loss 2.5972 (2.6276)	Entropy 0.62639 (0.62590)	Top-1 acc 62.891 (60.673)	Top-5 acc 83.203 (81.665)	lr 0.01159
Train [63][2540/3239]	Time 0.277 (1.101)	Data Time 0.002 (0.619)	Loss 2.7733 (2.6278)	Entropy 0.62640 (0.62590)	Top-1 acc 59.766 (60.668)	Top-5 acc 77.734 (81.663)	lr 0.01159
Train [63][2550/3239]	Time 0.237 (1.098)	Data Time 0.001 (0.617)	Loss 2.6323 (2.6277)	Entropy 0.62650 (0.62590)	Top-1 acc 62.891 (60.669)	Top-5 acc 80.859 (81.663)	lr 0.01159
Train [63][2560/3239]	Time 24.150 (1.106)	Data Time 23.866 (0.625)	Loss 2.6419 (2.6278)	Entropy 0.62647 (0.62591)	Top-1 acc 61.328 (60.666)	Top-5 acc 82.812 (81.663)	lr 0.01159
Train [63][2570/3239]	Time 0.233 (1.103)	Data Time 0.001 (0.622)	Loss 2.6299 (2.6279)	Entropy 0.62652 (0.62591)	Top-1 acc 60.547 (60.664)	Top-5 acc 80.859 (81.660)	lr 0.01159
Train [63][2580/3239]	Time 0.238 (1.101)	Data Time 0.001 (0.620)	Loss 2.6513 (2.6278)	Entropy 0.62671 (0.62591)	Top-1 acc 61.328 (60.666)	Top-5 acc 80.469 (81.665)	lr 0.01159
Train [63][2590/3239]	Time 0.327 (1.099)	Data Time 0.001 (0.619)	Loss 2.7553 (2.6279)	Entropy 0.62668 (0.62591)	Top-1 acc 57.812 (60.664)	Top-5 acc 80.859 (81.664)	lr 0.01158
Train [63][2600/3239]	Time 0.249 (1.105)	Data Time 0.001 (0.625)	Loss 2.6753 (2.6278)	Entropy 0.62662 (0.62592)	Top-1 acc 60.938 (60.667)	Top-5 acc 80.469 (81.668)	lr 0.01158
Train [63][2610/3239]	Time 0.251 (1.103)	Data Time 0.001 (0.623)	Loss 2.7508 (2.6278)	Entropy 0.62676 (0.62592)	Top-1 acc 56.641 (60.666)	Top-5 acc 81.250 (81.670)	lr 0.01158
Train [63][2620/3239]	Time 0.237 (1.101)	Data Time 0.001 (0.622)	Loss 2.4857 (2.6279)	Entropy 0.62632 (0.62592)	Top-1 acc 63.281 (60.661)	Top-5 acc 88.281 (81.671)	lr 0.01158
Train [63][2630/3239]	Time 0.237 (1.107)	Data Time 0.001 (0.627)	Loss 2.7136 (2.6278)	Entropy 0.62639 (0.62593)	Top-1 acc 59.375 (60.660)	Top-5 acc 76.953 (81.668)	lr 0.01158
Train [63][2640/3239]	Time 1.708 (1.105)	Data Time 1.451 (0.626)	Loss 2.6369 (2.6278)	Entropy 0.62651 (0.62593)	Top-1 acc 59.766 (60.665)	Top-5 acc 79.688 (81.668)	lr 0.01158
Train [63][2650/3239]	Time 0.234 (1.104)	Data Time 0.001 (0.625)	Loss 2.6828 (2.6277)	Entropy 0.62642 (0.62593)	Top-1 acc 60.938 (60.667)	Top-5 acc 79.688 (81.669)	lr 0.01158
Train [63][2660/3239]	Time 0.318 (1.109)	Data Time 0.001 (0.631)	Loss 2.5132 (2.6277)	Entropy 0.62662 (0.62593)	Top-1 acc 70.312 (60.668)	Top-5 acc 82.031 (81.671)	lr 0.01158
Train [63][2670/3239]	Time 0.270 (1.107)	Data Time 0.002 (0.628)	Loss 2.4344 (2.6275)	Entropy 0.62661 (0.62593)	Top-1 acc 66.016 (60.671)	Top-5 acc 86.328 (81.676)	lr 0.01158
Train [63][2680/3239]	Time 3.909 (1.105)	Data Time 3.654 (0.627)	Loss 2.6401 (2.6275)	Entropy 0.62599 (0.62594)	Top-1 acc 59.766 (60.668)	Top-5 acc 82.031 (81.675)	lr 0.01158
Train [63][2690/3239]	Time 0.287 (1.110)	Data Time 0.001 (0.632)	Loss 2.4908 (2.6277)	Entropy 0.62607 (0.62594)	Top-1 acc 64.062 (60.668)	Top-5 acc 84.375 (81.675)	lr 0.01157
Train [63][2700/3239]	Time 0.225 (1.108)	Data Time 0.001 (0.630)	Loss 2.6235 (2.6275)	Entropy 0.62601 (0.62594)	Top-1 acc 60.156 (60.672)	Top-5 acc 80.859 (81.676)	lr 0.01157
Train [63][2710/3239]	Time 0.248 (1.106)	Data Time 0.001 (0.628)	Loss 2.7074 (2.6275)	Entropy 0.62573 (0.62594)	Top-1 acc 56.641 (60.672)	Top-5 acc 83.594 (81.674)	lr 0.01157
Train [63][2720/3239]	Time 12.534 (1.111)	Data Time 12.281 (0.634)	Loss 2.7157 (2.6276)	Entropy 0.62610 (0.62594)	Top-1 acc 58.984 (60.671)	Top-5 acc 78.906 (81.674)	lr 0.01157
Train [63][2730/3239]	Time 0.243 (1.109)	Data Time 0.001 (0.632)	Loss 2.3760 (2.6276)	Entropy 0.62637 (0.62594)	Top-1 acc 68.359 (60.669)	Top-5 acc 87.500 (81.675)	lr 0.01157
Train [63][2740/3239]	Time 0.223 (1.108)	Data Time 0.001 (0.631)	Loss 2.6855 (2.6276)	Entropy 0.62640 (0.62594)	Top-1 acc 65.625 (60.669)	Top-5 acc 78.516 (81.673)	lr 0.01157
Train [63][2750/3239]	Time 3.816 (1.107)	Data Time 3.461 (0.630)	Loss 2.6271 (2.6279)	Entropy 0.62614 (0.62594)	Top-1 acc 61.719 (60.664)	Top-5 acc 83.984 (81.666)	lr 0.01157
Train [63][2760/3239]	Time 0.239 (1.108)	Data Time 0.001 (0.632)	Loss 2.5465 (2.6278)	Entropy 0.62603 (0.62594)	Top-1 acc 60.156 (60.665)	Top-5 acc 86.719 (81.668)	lr 0.01157
Train [63][2770/3239]	Time 0.244 (1.106)	Data Time 0.001 (0.630)	Loss 2.5362 (2.6279)	Entropy 0.62620 (0.62594)	Top-1 acc 60.547 (60.668)	Top-5 acc 82.031 (81.667)	lr 0.01157
Train [63][2780/3239]	Time 0.229 (1.104)	Data Time 0.001 (0.628)	Loss 2.6760 (2.6280)	Entropy 0.62632 (0.62594)	Top-1 acc 59.766 (60.667)	Top-5 acc 81.641 (81.662)	lr 0.01157
Train [63][2790/3239]	Time 0.230 (1.106)	Data Time 0.001 (0.630)	Loss 2.6513 (2.6279)	Entropy 0.62619 (0.62594)	Top-1 acc 57.422 (60.667)	Top-5 acc 80.859 (81.667)	lr 0.01156
Train [63][2800/3239]	Time 0.256 (1.117)	Data Time 0.002 (0.628)	Loss 2.5984 (2.6277)	Entropy 0.62579 (0.62594)	Top-1 acc 60.547 (60.672)	Top-5 acc 79.688 (81.670)	lr 0.01156
Train [63][2810/3239]	Time 0.257 (1.115)	Data Time 0.002 (0.625)	Loss 2.6469 (2.6279)	Entropy 0.62597 (0.62594)	Top-1 acc 57.422 (60.664)	Top-5 acc 84.375 (81.664)	lr 0.01156
Train [63][2820/3239]	Time 0.340 (1.112)	Data Time 0.001 (0.623)	Loss 2.5652 (2.6281)	Entropy 0.62573 (0.62594)	Top-1 acc 64.453 (60.658)	Top-5 acc 82.031 (81.660)	lr 0.01156
Train [63][2830/3239]	Time 0.249 (1.110)	Data Time 0.002 (0.621)	Loss 2.6436 (2.6282)	Entropy 0.62588 (0.62594)	Top-1 acc 60.938 (60.659)	Top-5 acc 80.078 (81.658)	lr 0.01156
Train [63][2840/3239]	Time 0.224 (1.107)	Data Time 0.001 (0.619)	Loss 2.6648 (2.6281)	Entropy 0.62571 (0.62594)	Top-1 acc 61.719 (60.662)	Top-5 acc 80.469 (81.663)	lr 0.01156
Train [63][2850/3239]	Time 0.228 (1.106)	Data Time 0.001 (0.618)	Loss 2.6924 (2.6281)	Entropy 0.62565 (0.62594)	Top-1 acc 58.594 (60.661)	Top-5 acc 83.203 (81.667)	lr 0.01156
Train [63][2860/3239]	Time 2.879 (1.106)	Data Time 2.620 (0.618)	Loss 2.6935 (2.6280)	Entropy 0.62567 (0.62594)	Top-1 acc 59.375 (60.665)	Top-5 acc 79.688 (81.671)	lr 0.01156
Train [63][2870/3239]	Time 0.420 (1.105)	Data Time 0.180 (0.617)	Loss 2.5682 (2.6278)	Entropy 0.62570 (0.62594)	Top-1 acc 67.188 (60.669)	Top-5 acc 83.203 (81.675)	lr 0.01156
Train [63][2880/3239]	Time 12.388 (1.108)	Data Time 12.130 (0.620)	Loss 2.5964 (2.6277)	Entropy 0.62567 (0.62594)	Top-1 acc 63.281 (60.672)	Top-5 acc 82.031 (81.680)	lr 0.01156
Train [63][2890/3239]	Time 0.242 (1.105)	Data Time 0.001 (0.618)	Loss 2.6767 (2.6277)	Entropy 0.62564 (0.62594)	Top-1 acc 59.375 (60.675)	Top-5 acc 79.688 (81.679)	lr 0.01155
Train [63][2900/3239]	Time 0.247 (1.108)	Data Time 0.001 (0.621)	Loss 3.0561 (2.6279)	Entropy 0.62573 (0.62594)	Top-1 acc 49.609 (60.667)	Top-5 acc 75.000 (81.677)	lr 0.01155
Train [63][2910/3239]	Time 0.342 (1.106)	Data Time 0.001 (0.619)	Loss 2.8180 (2.6280)	Entropy 0.62597 (0.62594)	Top-1 acc 55.078 (60.662)	Top-5 acc 76.562 (81.674)	lr 0.01155
Train [63][2920/3239]	Time 0.235 (1.107)	Data Time 0.001 (0.621)	Loss 2.4099 (2.6278)	Entropy 0.62599 (0.62594)	Top-1 acc 65.234 (60.670)	Top-5 acc 85.547 (81.678)	lr 0.01155
Train [63][2930/3239]	Time 1.858 (1.108)	Data Time 1.581 (0.622)	Loss 2.6763 (2.6279)	Entropy 0.62585 (0.62594)	Top-1 acc 62.109 (60.667)	Top-5 acc 78.906 (81.674)	lr 0.01155
Train [63][2940/3239]	Time 0.256 (1.106)	Data Time 0.001 (0.620)	Loss 2.7849 (2.6280)	Entropy 0.62582 (0.62594)	Top-1 acc 57.812 (60.657)	Top-5 acc 76.562 (81.672)	lr 0.01155
Train [63][2950/3239]	Time 0.244 (1.105)	Data Time 0.001 (0.619)	Loss 2.5655 (2.6279)	Entropy 0.62587 (0.62594)	Top-1 acc 62.109 (60.658)	Top-5 acc 83.203 (81.674)	lr 0.01155
Train [63][2960/3239]	Time 0.251 (1.105)	Data Time 0.001 (0.619)	Loss 2.5898 (2.6279)	Entropy 0.62576 (0.62594)	Top-1 acc 59.375 (60.651)	Top-5 acc 83.984 (81.678)	lr 0.01155
Train [63][2970/3239]	Time 0.229 (1.104)	Data Time 0.001 (0.618)	Loss 2.5949 (2.6278)	Entropy 0.62589 (0.62594)	Top-1 acc 62.109 (60.650)	Top-5 acc 82.031 (81.679)	lr 0.01155
Train [63][2980/3239]	Time 0.377 (1.102)	Data Time 0.001 (0.617)	Loss 2.6624 (2.6278)	Entropy 0.62611 (0.62594)	Top-1 acc 58.984 (60.649)	Top-5 acc 79.688 (81.681)	lr 0.01155
Train [63][2990/3239]	Time 0.232 (1.101)	Data Time 0.001 (0.616)	Loss 2.7413 (2.6279)	Entropy 0.62612 (0.62594)	Top-1 acc 58.984 (60.649)	Top-5 acc 80.859 (81.683)	lr 0.01154
Train [63][3000/3239]	Time 0.249 (1.101)	Data Time 0.001 (0.615)	Loss 2.8368 (2.6282)	Entropy 0.62618 (0.62594)	Top-1 acc 55.469 (60.642)	Top-5 acc 78.125 (81.677)	lr 0.01154
Train [63][3010/3239]	Time 0.255 (1.100)	Data Time 0.001 (0.615)	Loss 2.4163 (2.6282)	Entropy 0.62609 (0.62594)	Top-1 acc 61.719 (60.640)	Top-5 acc 85.938 (81.678)	lr 0.01154
Train [63][3020/3239]	Time 0.782 (1.098)	Data Time 0.552 (0.613)	Loss 2.8351 (2.6283)	Entropy 0.62624 (0.62594)	Top-1 acc 53.906 (60.639)	Top-5 acc 78.125 (81.677)	lr 0.01154
Train [63][3030/3239]	Time 0.249 (1.098)	Data Time 0.001 (0.613)	Loss 2.6035 (2.6284)	Entropy 0.62670 (0.62594)	Top-1 acc 62.109 (60.637)	Top-5 acc 80.469 (81.675)	lr 0.01154
Train [63][3040/3239]	Time 2.481 (1.097)	Data Time 2.221 (0.612)	Loss 2.7092 (2.6286)	Entropy 0.62678 (0.62594)	Top-1 acc 62.109 (60.635)	Top-5 acc 77.734 (81.670)	lr 0.01154
Train [63][3050/3239]	Time 0.231 (1.094)	Data Time 0.001 (0.610)	Loss 2.5906 (2.6286)	Entropy 0.62676 (0.62594)	Top-1 acc 62.109 (60.635)	Top-5 acc 83.203 (81.669)	lr 0.01154
Train [63][3060/3239]	Time 0.232 (1.096)	Data Time 0.001 (0.612)	Loss 2.6504 (2.6287)	Entropy 0.62654 (0.62595)	Top-1 acc 62.109 (60.634)	Top-5 acc 78.516 (81.668)	lr 0.01154
Train [63][3070/3239]	Time 0.274 (1.093)	Data Time 0.001 (0.610)	Loss 2.5329 (2.6284)	Entropy 0.62611 (0.62595)	Top-1 acc 60.547 (60.639)	Top-5 acc 85.547 (81.674)	lr 0.01154
Train [63][3080/3239]	Time 0.254 (1.093)	Data Time 0.001 (0.609)	Loss 2.7004 (2.6285)	Entropy 0.62637 (0.62595)	Top-1 acc 60.156 (60.640)	Top-5 acc 80.469 (81.676)	lr 0.01154
Train [63][3090/3239]	Time 4.054 (1.096)	Data Time 3.801 (0.613)	Loss 2.9080 (2.6286)	Entropy 0.62639 (0.62595)	Top-1 acc 52.734 (60.634)	Top-5 acc 77.344 (81.673)	lr 0.01153
Train [63][3100/3239]	Time 0.233 (1.095)	Data Time 0.001 (0.612)	Loss 2.8894 (2.6286)	Entropy 0.62624 (0.62595)	Top-1 acc 55.078 (60.634)	Top-5 acc 77.734 (81.674)	lr 0.01153
Train [63][3110/3239]	Time 0.234 (1.095)	Data Time 0.001 (0.612)	Loss 2.4379 (2.6285)	Entropy 0.62635 (0.62595)	Top-1 acc 66.797 (60.638)	Top-5 acc 81.250 (81.675)	lr 0.01153
Train [63][3120/3239]	Time 0.237 (1.097)	Data Time 0.001 (0.614)	Loss 2.5480 (2.6284)	Entropy 0.62655 (0.62595)	Top-1 acc 65.234 (60.641)	Top-5 acc 82.812 (81.676)	lr 0.01153
Train [63][3130/3239]	Time 0.237 (1.096)	Data Time 0.001 (0.614)	Loss 2.6887 (2.6284)	Entropy 0.62635 (0.62596)	Top-1 acc 61.719 (60.643)	Top-5 acc 77.344 (81.674)	lr 0.01153
Train [63][3140/3239]	Time 0.322 (1.096)	Data Time 0.001 (0.614)	Loss 2.5073 (2.6282)	Entropy 0.62608 (0.62596)	Top-1 acc 64.453 (60.647)	Top-5 acc 83.594 (81.677)	lr 0.01153
Train [63][3150/3239]	Time 7.112 (1.098)	Data Time 6.864 (0.615)	Loss 2.4481 (2.6281)	Entropy 0.62639 (0.62596)	Top-1 acc 65.625 (60.651)	Top-5 acc 83.984 (81.679)	lr 0.01153
Train [63][3160/3239]	Time 0.233 (1.098)	Data Time 0.001 (0.616)	Loss 2.3478 (2.6281)	Entropy 0.62602 (0.62596)	Top-1 acc 65.234 (60.647)	Top-5 acc 86.328 (81.681)	lr 0.01153
Train [63][3170/3239]	Time 0.274 (1.098)	Data Time 0.002 (0.616)	Loss 2.7835 (2.6280)	Entropy 0.62609 (0.62596)	Top-1 acc 58.203 (60.645)	Top-5 acc 77.734 (81.682)	lr 0.01153
Train [63][3180/3239]	Time 3.455 (1.098)	Data Time 3.219 (0.616)	Loss 2.6758 (2.6281)	Entropy 0.62603 (0.62596)	Top-1 acc 57.812 (60.642)	Top-5 acc 82.031 (81.681)	lr 0.01153
Train [63][3190/3239]	Time 0.229 (1.100)	Data Time 0.000 (0.619)	Loss 2.5681 (2.6279)	Entropy 0.62605 (0.62596)	Top-1 acc 58.984 (60.646)	Top-5 acc 82.812 (81.683)	lr 0.01152
Train [63][3200/3239]	Time 7.330 (1.100)	Data Time 7.092 (0.619)	Loss 2.5522 (2.6281)	Entropy 0.62609 (0.62596)	Top-1 acc 61.328 (60.642)	Top-5 acc 83.203 (81.678)	lr 0.01152
Train [63][3210/3239]	Time 0.325 (1.098)	Data Time 0.000 (0.617)	Loss 2.6799 (2.6283)	Entropy 0.62571 (0.62596)	Top-1 acc 62.891 (60.639)	Top-5 acc 80.078 (81.675)	lr 0.01152
Train [63][3220/3239]	Time 0.229 (1.101)	Data Time 0.000 (0.620)	Loss 2.7197 (2.6283)	Entropy 0.62560 (0.62596)	Top-1 acc 56.250 (60.640)	Top-5 acc 80.469 (81.675)	lr 0.01152
Train [63][3230/3239]	Time 0.228 (1.099)	Data Time 0.000 (0.618)	Loss 2.5909 (2.6284)	Entropy 0.62583 (0.62596)	Top-1 acc 61.719 (60.638)	Top-5 acc 82.812 (81.673)	lr 0.01152
Train [63][3239/3239]	Time 0.949 (1.097)	Data Time 0.000 (0.617)	Loss 2.8225 (2.6286)	Entropy 0.62558 (0.62596)	Top-1 acc 55.556 (60.634)	Top-5 acc 76.543 (81.671)	lr 0.01152
==========Valid [63/120]	loss 1.366	top-1 acc 68.326 (68.326)	top-5 acc 88.027	Train top-1 60.634	top-5 81.671	Entropy 0.62558	Latency-None: 0.000ms	Flops: 539.91M
Train [64][0/3239]	Time 49.238 (49.238)	Data Time 48.682 (48.682)	Loss 2.5765 (2.5765)	Entropy 0.62555 (0.62555)	Top-1 acc 61.719 (61.719)	Top-5 acc 82.812 (82.812)	lr 0.01152
Train [64][10/3239]	Time 0.253 (4.942)	Data Time 0.002 (4.446)	Loss 2.6850 (2.5827)	Entropy 0.62544 (0.62548)	Top-1 acc 60.938 (62.749)	Top-5 acc 80.469 (82.209)	lr 0.01152
Train [64][20/3239]	Time 0.239 (2.799)	Data Time 0.001 (2.330)	Loss 2.8084 (2.6024)	Entropy 0.62562 (0.62549)	Top-1 acc 56.641 (61.663)	Top-5 acc 78.125 (82.199)	lr 0.01152
Train [64][30/3239]	Time 0.257 (2.034)	Data Time 0.002 (1.579)	Loss 2.5387 (2.5856)	Entropy 0.62541 (0.62547)	Top-1 acc 63.672 (61.731)	Top-5 acc 79.688 (82.245)	lr 0.01152
Train [64][40/3239]	Time 0.349 (1.852)	Data Time 0.001 (1.402)	Loss 2.5306 (2.5942)	Entropy 0.62539 (0.62544)	Top-1 acc 62.109 (61.719)	Top-5 acc 83.984 (82.079)	lr 0.01152
Train [64][50/3239]	Time 0.230 (1.568)	Data Time 0.001 (1.127)	Loss 2.7443 (2.5988)	Entropy 0.62541 (0.62544)	Top-1 acc 57.812 (61.627)	Top-5 acc 78.125 (82.070)	lr 0.01151
Train [64][60/3239]	Time 0.253 (1.378)	Data Time 0.001 (0.943)	Loss 2.6300 (2.5988)	Entropy 0.62546 (0.62544)	Top-1 acc 59.766 (61.642)	Top-5 acc 80.859 (82.063)	lr 0.01151
Train [64][70/3239]	Time 0.228 (1.378)	Data Time 0.001 (0.939)	Loss 2.3806 (2.6013)	Entropy 0.62563 (0.62546)	Top-1 acc 67.578 (61.394)	Top-5 acc 84.766 (82.004)	lr 0.01151
Train [64][80/3239]	Time 0.248 (1.260)	Data Time 0.001 (0.824)	Loss 2.5238 (2.6045)	Entropy 0.62553 (0.62548)	Top-1 acc 65.234 (61.309)	Top-5 acc 82.812 (81.959)	lr 0.01151
Train [64][90/3239]	Time 0.258 (1.170)	Data Time 0.001 (0.733)	Loss 2.6047 (2.6085)	Entropy 0.62521 (0.62547)	Top-1 acc 60.547 (61.234)	Top-5 acc 82.812 (81.937)	lr 0.01151
Train [64][100/3239]	Time 3.006 (1.182)	Data Time 2.723 (0.743)	Loss 2.6323 (2.6059)	Entropy 0.62528 (0.62544)	Top-1 acc 58.984 (61.355)	Top-5 acc 81.641 (81.965)	lr 0.01151
Train [64][110/3239]	Time 0.223 (1.114)	Data Time 0.001 (0.677)	Loss 2.5043 (2.6094)	Entropy 0.62472 (0.62541)	Top-1 acc 67.578 (61.226)	Top-5 acc 82.031 (81.869)	lr 0.01151
Train [64][120/3239]	Time 0.242 (1.057)	Data Time 0.001 (0.621)	Loss 2.4513 (2.6112)	Entropy 0.62498 (0.62536)	Top-1 acc 64.844 (61.122)	Top-5 acc 84.766 (81.860)	lr 0.01151
Train [64][130/3239]	Time 1.776 (1.026)	Data Time 1.412 (0.589)	Loss 2.5434 (2.6086)	Entropy 0.62492 (0.62533)	Top-1 acc 58.203 (61.155)	Top-5 acc 85.938 (81.972)	lr 0.01151
Train [64][140/3239]	Time 0.252 (1.017)	Data Time 0.001 (0.583)	Loss 2.6620 (2.6096)	Entropy 0.62511 (0.62531)	Top-1 acc 60.156 (61.115)	Top-5 acc 79.297 (81.926)	lr 0.01151
Train [64][150/3239]	Time 0.229 (0.977)	Data Time 0.001 (0.544)	Loss 2.6071 (2.6095)	Entropy 0.62509 (0.62530)	Top-1 acc 63.672 (61.093)	Top-5 acc 85.156 (81.990)	lr 0.01150
Train [64][160/3239]	Time 0.249 (0.944)	Data Time 0.001 (0.510)	Loss 2.5527 (2.6080)	Entropy 0.62504 (0.62528)	Top-1 acc 62.891 (61.122)	Top-5 acc 83.984 (81.995)	lr 0.01150
Train [64][170/3239]	Time 0.239 (0.973)	Data Time 0.001 (0.540)	Loss 2.4388 (2.6042)	Entropy 0.62531 (0.62528)	Top-1 acc 64.062 (61.202)	Top-5 acc 84.375 (82.066)	lr 0.01150
Train [64][180/3239]	Time 0.236 (0.942)	Data Time 0.001 (0.510)	Loss 2.4673 (2.6036)	Entropy 0.62552 (0.62528)	Top-1 acc 62.891 (61.177)	Top-5 acc 83.984 (82.085)	lr 0.01150
Train [64][190/3239]	Time 0.333 (0.917)	Data Time 0.002 (0.484)	Loss 2.7731 (2.6027)	Entropy 0.62562 (0.62530)	Top-1 acc 57.422 (61.234)	Top-5 acc 79.688 (82.109)	lr 0.01150
Train [64][200/3239]	Time 0.339 (0.932)	Data Time 0.001 (0.499)	Loss 2.5583 (2.6018)	Entropy 0.62577 (0.62532)	Top-1 acc 63.281 (61.295)	Top-5 acc 81.641 (82.125)	lr 0.01150
Train [64][210/3239]	Time 0.432 (1.103)	Data Time 0.004 (0.476)	Loss 2.5741 (2.6010)	Entropy 0.62575 (0.62533)	Top-1 acc 63.281 (61.323)	Top-5 acc 81.641 (82.142)	lr 0.01150
Train [64][220/3239]	Time 0.232 (1.075)	Data Time 0.002 (0.455)	Loss 2.4350 (2.6008)	Entropy 0.62548 (0.62534)	Top-1 acc 64.453 (61.346)	Top-5 acc 85.547 (82.132)	lr 0.01150
Train [64][230/3239]	Time 0.252 (1.047)	Data Time 0.002 (0.435)	Loss 2.7338 (2.6006)	Entropy 0.62528 (0.62535)	Top-1 acc 57.031 (61.306)	Top-5 acc 80.469 (82.138)	lr 0.01150
Train [64][240/3239]	Time 0.250 (1.021)	Data Time 0.001 (0.417)	Loss 2.4843 (2.6017)	Entropy 0.62541 (0.62535)	Top-1 acc 62.500 (61.273)	Top-5 acc 83.594 (82.119)	lr 0.01150
Train [64][250/3239]	Time 0.270 (0.997)	Data Time 0.001 (0.400)	Loss 2.5359 (2.6037)	Entropy 0.62510 (0.62535)	Top-1 acc 62.891 (61.238)	Top-5 acc 82.812 (82.061)	lr 0.01149
Train [64][260/3239]	Time 0.245 (0.976)	Data Time 0.001 (0.385)	Loss 2.5880 (2.6045)	Entropy 0.62504 (0.62535)	Top-1 acc 58.984 (61.198)	Top-5 acc 84.375 (82.049)	lr 0.01149
Train [64][270/3239]	Time 0.239 (0.956)	Data Time 0.001 (0.371)	Loss 2.4638 (2.6036)	Entropy 0.62477 (0.62533)	Top-1 acc 64.844 (61.203)	Top-5 acc 85.938 (82.074)	lr 0.01149
Train [64][280/3239]	Time 0.276 (0.938)	Data Time 0.002 (0.358)	Loss 2.5689 (2.6036)	Entropy 0.62487 (0.62532)	Top-1 acc 60.938 (61.218)	Top-5 acc 85.156 (82.080)	lr 0.01149
Train [64][290/3239]	Time 0.331 (0.921)	Data Time 0.001 (0.346)	Loss 2.5367 (2.6040)	Entropy 0.62496 (0.62530)	Top-1 acc 62.500 (61.197)	Top-5 acc 82.812 (82.076)	lr 0.01149
Train [64][300/3239]	Time 0.235 (0.905)	Data Time 0.001 (0.334)	Loss 2.5134 (2.6055)	Entropy 0.62521 (0.62529)	Top-1 acc 61.328 (61.175)	Top-5 acc 85.938 (82.051)	lr 0.01149
Train [64][310/3239]	Time 0.256 (0.892)	Data Time 0.001 (0.325)	Loss 2.4875 (2.6065)	Entropy 0.62506 (0.62529)	Top-1 acc 64.062 (61.182)	Top-5 acc 85.938 (82.040)	lr 0.01149
Train [64][320/3239]	Time 0.247 (0.885)	Data Time 0.001 (0.322)	Loss 2.7534 (2.6058)	Entropy 0.62535 (0.62528)	Top-1 acc 56.641 (61.181)	Top-5 acc 80.469 (82.048)	lr 0.01149
Train [64][330/3239]	Time 0.260 (0.873)	Data Time 0.001 (0.312)	Loss 2.7090 (2.6051)	Entropy 0.62533 (0.62529)	Top-1 acc 58.984 (61.207)	Top-5 acc 81.641 (82.058)	lr 0.01149
Train [64][340/3239]	Time 0.235 (0.870)	Data Time 0.001 (0.312)	Loss 2.6408 (2.6042)	Entropy 0.62568 (0.62529)	Top-1 acc 61.328 (61.233)	Top-5 acc 81.641 (82.069)	lr 0.01149
Train [64][350/3239]	Time 3.494 (0.869)	Data Time 3.238 (0.315)	Loss 2.3839 (2.6012)	Entropy 0.62536 (0.62530)	Top-1 acc 68.359 (61.311)	Top-5 acc 87.109 (82.128)	lr 0.01148
Train [64][360/3239]	Time 0.420 (0.859)	Data Time 0.002 (0.308)	Loss 2.4442 (2.6012)	Entropy 0.62527 (0.62531)	Top-1 acc 65.625 (61.310)	Top-5 acc 85.547 (82.132)	lr 0.01148
Train [64][370/3239]	Time 0.239 (0.848)	Data Time 0.001 (0.299)	Loss 2.7427 (2.6016)	Entropy 0.62519 (0.62530)	Top-1 acc 60.547 (61.333)	Top-5 acc 75.391 (82.106)	lr 0.01148
Train [64][380/3239]	Time 0.242 (0.845)	Data Time 0.001 (0.300)	Loss 2.6903 (2.6021)	Entropy 0.62510 (0.62530)	Top-1 acc 60.938 (61.335)	Top-5 acc 80.859 (82.115)	lr 0.01148
Train [64][390/3239]	Time 0.232 (0.846)	Data Time 0.001 (0.303)	Loss 2.6115 (2.6020)	Entropy 0.62538 (0.62530)	Top-1 acc 61.328 (61.339)	Top-5 acc 82.812 (82.127)	lr 0.01148
Train [64][400/3239]	Time 0.261 (0.836)	Data Time 0.001 (0.295)	Loss 2.7062 (2.6027)	Entropy 0.62568 (0.62530)	Top-1 acc 58.594 (61.318)	Top-5 acc 77.734 (82.113)	lr 0.01148
Train [64][410/3239]	Time 0.265 (0.835)	Data Time 0.001 (0.296)	Loss 2.6478 (2.6032)	Entropy 0.62577 (0.62531)	Top-1 acc 62.109 (61.302)	Top-5 acc 82.422 (82.103)	lr 0.01148
Train [64][420/3239]	Time 0.237 (0.836)	Data Time 0.001 (0.300)	Loss 2.6222 (2.6033)	Entropy 0.62577 (0.62533)	Top-1 acc 58.203 (61.285)	Top-5 acc 80.078 (82.086)	lr 0.01148
Train [64][430/3239]	Time 0.250 (0.827)	Data Time 0.001 (0.293)	Loss 2.5606 (2.6042)	Entropy 0.62611 (0.62534)	Top-1 acc 64.453 (61.264)	Top-5 acc 82.422 (82.066)	lr 0.01148
Train [64][440/3239]	Time 0.265 (0.827)	Data Time 0.001 (0.296)	Loss 2.5868 (2.6049)	Entropy 0.62637 (0.62536)	Top-1 acc 62.109 (61.240)	Top-5 acc 84.375 (82.060)	lr 0.01147
Train [64][450/3239]	Time 0.329 (0.819)	Data Time 0.001 (0.290)	Loss 2.7490 (2.6049)	Entropy 0.62620 (0.62538)	Top-1 acc 58.203 (61.248)	Top-5 acc 77.734 (82.062)	lr 0.01147
Train [64][460/3239]	Time 0.253 (0.814)	Data Time 0.002 (0.285)	Loss 2.8536 (2.6059)	Entropy 0.62609 (0.62540)	Top-1 acc 55.859 (61.215)	Top-5 acc 77.344 (82.059)	lr 0.01147
Train [64][470/3239]	Time 0.227 (0.805)	Data Time 0.001 (0.279)	Loss 2.6485 (2.6061)	Entropy 0.62619 (0.62542)	Top-1 acc 60.547 (61.211)	Top-5 acc 81.250 (82.064)	lr 0.01147
Train [64][480/3239]	Time 0.233 (0.814)	Data Time 0.001 (0.289)	Loss 2.4639 (2.6065)	Entropy 0.62632 (0.62543)	Top-1 acc 66.406 (61.202)	Top-5 acc 83.594 (82.033)	lr 0.01147
Train [64][490/3239]	Time 0.300 (0.807)	Data Time 0.002 (0.284)	Loss 2.6290 (2.6070)	Entropy 0.62644 (0.62545)	Top-1 acc 58.594 (61.176)	Top-5 acc 81.250 (82.025)	lr 0.01147
Train [64][500/3239]	Time 0.250 (0.799)	Data Time 0.001 (0.278)	Loss 2.5225 (2.6052)	Entropy 0.62659 (0.62547)	Top-1 acc 62.500 (61.228)	Top-5 acc 84.375 (82.059)	lr 0.01147
Train [64][510/3239]	Time 0.258 (0.802)	Data Time 0.001 (0.282)	Loss 2.4063 (2.6049)	Entropy 0.62648 (0.62549)	Top-1 acc 67.578 (61.243)	Top-5 acc 86.328 (82.068)	lr 0.01147
Train [64][520/3239]	Time 0.360 (0.795)	Data Time 0.001 (0.277)	Loss 2.6012 (2.6051)	Entropy 0.62645 (0.62551)	Top-1 acc 61.328 (61.237)	Top-5 acc 80.469 (82.061)	lr 0.01147
Train [64][530/3239]	Time 0.272 (0.798)	Data Time 0.002 (0.281)	Loss 2.7364 (2.6061)	Entropy 0.62648 (0.62553)	Top-1 acc 62.109 (61.191)	Top-5 acc 79.688 (82.039)	lr 0.01147
Train [64][540/3239]	Time 0.247 (0.792)	Data Time 0.001 (0.277)	Loss 2.6341 (2.6064)	Entropy 0.62613 (0.62554)	Top-1 acc 61.719 (61.184)	Top-5 acc 81.250 (82.019)	lr 0.01146
Train [64][550/3239]	Time 0.304 (0.794)	Data Time 0.001 (0.279)	Loss 2.4174 (2.6059)	Entropy 0.62622 (0.62555)	Top-1 acc 66.016 (61.193)	Top-5 acc 84.766 (82.021)	lr 0.01146
Train [64][560/3239]	Time 0.265 (0.791)	Data Time 0.001 (0.277)	Loss 2.6112 (2.6070)	Entropy 0.62588 (0.62556)	Top-1 acc 65.234 (61.169)	Top-5 acc 82.422 (81.995)	lr 0.01146
Train [64][570/3239]	Time 0.239 (0.789)	Data Time 0.001 (0.276)	Loss 2.6094 (2.6062)	Entropy 0.62602 (0.62557)	Top-1 acc 64.453 (61.200)	Top-5 acc 83.203 (82.000)	lr 0.01146
Train [64][580/3239]	Time 0.236 (0.792)	Data Time 0.001 (0.280)	Loss 2.5582 (2.6060)	Entropy 0.62596 (0.62558)	Top-1 acc 57.422 (61.206)	Top-5 acc 85.547 (81.997)	lr 0.01146
Train [64][590/3239]	Time 0.337 (0.786)	Data Time 0.001 (0.276)	Loss 2.6798 (2.6061)	Entropy 0.62608 (0.62558)	Top-1 acc 55.859 (61.197)	Top-5 acc 83.203 (81.991)	lr 0.01146
Train [64][600/3239]	Time 2.959 (0.784)	Data Time 2.731 (0.276)	Loss 2.9216 (2.6065)	Entropy 0.62618 (0.62559)	Top-1 acc 53.906 (61.186)	Top-5 acc 76.953 (81.988)	lr 0.01146
Train [64][610/3239]	Time 0.249 (0.783)	Data Time 0.001 (0.276)	Loss 2.5799 (2.6076)	Entropy 0.62630 (0.62560)	Top-1 acc 60.156 (61.162)	Top-5 acc 82.422 (81.978)	lr 0.01146
Train [64][620/3239]	Time 0.238 (0.778)	Data Time 0.002 (0.271)	Loss 2.4700 (2.6074)	Entropy 0.62604 (0.62561)	Top-1 acc 64.062 (61.149)	Top-5 acc 83.203 (81.983)	lr 0.01146
Train [64][630/3239]	Time 0.234 (0.772)	Data Time 0.001 (0.267)	Loss 2.7310 (2.6086)	Entropy 0.62552 (0.62561)	Top-1 acc 60.547 (61.137)	Top-5 acc 79.297 (81.971)	lr 0.01146
Train [64][640/3239]	Time 0.242 (0.776)	Data Time 0.001 (0.272)	Loss 2.4698 (2.6083)	Entropy 0.62544 (0.62561)	Top-1 acc 66.406 (61.139)	Top-5 acc 86.719 (81.979)	lr 0.01145
Train [64][650/3239]	Time 0.263 (0.771)	Data Time 0.001 (0.268)	Loss 2.5446 (2.6082)	Entropy 0.62521 (0.62561)	Top-1 acc 61.719 (61.122)	Top-5 acc 82.422 (81.984)	lr 0.01145
Train [64][660/3239]	Time 0.255 (0.766)	Data Time 0.002 (0.264)	Loss 2.5737 (2.6091)	Entropy 0.62501 (0.62560)	Top-1 acc 61.719 (61.102)	Top-5 acc 80.859 (81.966)	lr 0.01145
Train [64][670/3239]	Time 0.305 (0.779)	Data Time 0.001 (0.277)	Loss 2.7674 (2.6095)	Entropy 0.62538 (0.62559)	Top-1 acc 55.078 (61.074)	Top-5 acc 78.125 (81.958)	lr 0.01145
Train [64][680/3239]	Time 0.359 (0.773)	Data Time 0.001 (0.273)	Loss 2.5897 (2.6094)	Entropy 0.62490 (0.62559)	Top-1 acc 59.766 (61.058)	Top-5 acc 84.766 (81.963)	lr 0.01145
Train [64][690/3239]	Time 0.258 (0.768)	Data Time 0.001 (0.269)	Loss 2.4262 (2.6089)	Entropy 0.62463 (0.62558)	Top-1 acc 67.188 (61.064)	Top-5 acc 87.500 (81.975)	lr 0.01145
Train [64][700/3239]	Time 0.233 (0.777)	Data Time 0.001 (0.278)	Loss 2.7244 (2.6087)	Entropy 0.62472 (0.62556)	Top-1 acc 58.984 (61.060)	Top-5 acc 82.031 (81.983)	lr 0.01145
Train [64][710/3239]	Time 0.267 (0.772)	Data Time 0.001 (0.275)	Loss 2.5679 (2.6087)	Entropy 0.62440 (0.62555)	Top-1 acc 62.500 (61.058)	Top-5 acc 80.078 (81.992)	lr 0.01145
Train [64][720/3239]	Time 0.242 (0.768)	Data Time 0.001 (0.271)	Loss 2.6061 (2.6086)	Entropy 0.62434 (0.62553)	Top-1 acc 60.547 (61.062)	Top-5 acc 83.984 (82.000)	lr 0.01145
Train [64][730/3239]	Time 0.248 (0.773)	Data Time 0.001 (0.276)	Loss 2.7108 (2.6083)	Entropy 0.62408 (0.62551)	Top-1 acc 60.156 (61.074)	Top-5 acc 83.594 (82.008)	lr 0.01145
Train [64][740/3239]	Time 0.253 (0.768)	Data Time 0.002 (0.273)	Loss 2.9346 (2.6085)	Entropy 0.62400 (0.62549)	Top-1 acc 52.734 (61.065)	Top-5 acc 76.562 (82.005)	lr 0.01144
Train [64][750/3239]	Time 0.336 (0.764)	Data Time 0.001 (0.269)	Loss 2.5500 (2.6080)	Entropy 0.62411 (0.62548)	Top-1 acc 64.453 (61.079)	Top-5 acc 81.250 (82.019)	lr 0.01144
Train [64][760/3239]	Time 0.240 (0.760)	Data Time 0.001 (0.266)	Loss 2.4716 (2.6078)	Entropy 0.62431 (0.62546)	Top-1 acc 60.938 (61.071)	Top-5 acc 84.766 (82.028)	lr 0.01144
Train [64][770/3239]	Time 0.252 (0.761)	Data Time 0.001 (0.267)	Loss 2.7666 (2.6080)	Entropy 0.62400 (0.62544)	Top-1 acc 58.984 (61.086)	Top-5 acc 78.125 (82.016)	lr 0.01144
Train [64][780/3239]	Time 0.224 (0.756)	Data Time 0.001 (0.264)	Loss 2.6756 (2.6080)	Entropy 0.62397 (0.62542)	Top-1 acc 57.031 (61.083)	Top-5 acc 78.906 (82.014)	lr 0.01144
Train [64][790/3239]	Time 0.269 (0.752)	Data Time 0.001 (0.261)	Loss 2.6094 (2.6080)	Entropy 0.62398 (0.62540)	Top-1 acc 61.328 (61.086)	Top-5 acc 82.031 (82.012)	lr 0.01144
Train [64][800/3239]	Time 0.286 (0.759)	Data Time 0.002 (0.268)	Loss 2.6071 (2.6078)	Entropy 0.62402 (0.62539)	Top-1 acc 62.500 (61.107)	Top-5 acc 80.859 (82.019)	lr 0.01144
Train [64][810/3239]	Time 0.239 (0.754)	Data Time 0.001 (0.264)	Loss 2.5049 (2.6074)	Entropy 0.62432 (0.62537)	Top-1 acc 63.281 (61.107)	Top-5 acc 82.422 (82.025)	lr 0.01144
Train [64][820/3239]	Time 0.236 (0.751)	Data Time 0.001 (0.261)	Loss 2.3761 (2.6071)	Entropy 0.62417 (0.62536)	Top-1 acc 66.797 (61.127)	Top-5 acc 86.328 (82.023)	lr 0.01144
Train [64][830/3239]	Time 0.238 (0.755)	Data Time 0.001 (0.267)	Loss 2.5462 (2.6071)	Entropy 0.62445 (0.62534)	Top-1 acc 60.156 (61.119)	Top-5 acc 84.375 (82.028)	lr 0.01144
Train [64][840/3239]	Time 0.257 (0.751)	Data Time 0.001 (0.263)	Loss 2.6682 (2.6076)	Entropy 0.62469 (0.62533)	Top-1 acc 57.812 (61.109)	Top-5 acc 83.594 (82.018)	lr 0.01143
Train [64][850/3239]	Time 0.245 (0.748)	Data Time 0.001 (0.260)	Loss 2.6110 (2.6080)	Entropy 0.62483 (0.62533)	Top-1 acc 63.281 (61.094)	Top-5 acc 81.641 (82.013)	lr 0.01143
Train [64][860/3239]	Time 0.249 (0.755)	Data Time 0.001 (0.269)	Loss 2.3737 (2.6078)	Entropy 0.62476 (0.62532)	Top-1 acc 67.578 (61.099)	Top-5 acc 87.109 (82.015)	lr 0.01143
Train [64][870/3239]	Time 0.261 (0.796)	Data Time 0.004 (0.266)	Loss 2.6953 (2.6079)	Entropy 0.62502 (0.62531)	Top-1 acc 57.031 (61.102)	Top-5 acc 80.078 (82.014)	lr 0.01143
Train [64][880/3239]	Time 0.243 (0.792)	Data Time 0.001 (0.263)	Loss 2.5297 (2.6070)	Entropy 0.62506 (0.62531)	Top-1 acc 62.500 (61.113)	Top-5 acc 85.156 (82.029)	lr 0.01143
Train [64][890/3239]	Time 0.230 (0.787)	Data Time 0.001 (0.260)	Loss 2.6537 (2.6072)	Entropy 0.62496 (0.62531)	Top-1 acc 60.156 (61.106)	Top-5 acc 83.984 (82.024)	lr 0.01143
Train [64][900/3239]	Time 0.272 (0.783)	Data Time 0.001 (0.257)	Loss 2.6691 (2.6069)	Entropy 0.62463 (0.62530)	Top-1 acc 58.203 (61.124)	Top-5 acc 82.031 (82.030)	lr 0.01143
Train [64][910/3239]	Time 0.357 (0.780)	Data Time 0.001 (0.254)	Loss 2.6351 (2.6074)	Entropy 0.62474 (0.62529)	Top-1 acc 58.594 (61.110)	Top-5 acc 80.469 (82.018)	lr 0.01143
Train [64][920/3239]	Time 0.242 (0.776)	Data Time 0.001 (0.251)	Loss 2.6113 (2.6073)	Entropy 0.62456 (0.62529)	Top-1 acc 59.375 (61.107)	Top-5 acc 83.594 (82.030)	lr 0.01143
Train [64][930/3239]	Time 0.273 (0.773)	Data Time 0.002 (0.249)	Loss 2.4434 (2.6068)	Entropy 0.62441 (0.62528)	Top-1 acc 67.578 (61.128)	Top-5 acc 86.719 (82.041)	lr 0.01143
Train [64][940/3239]	Time 0.239 (0.769)	Data Time 0.001 (0.246)	Loss 2.6364 (2.6065)	Entropy 0.62413 (0.62527)	Top-1 acc 57.812 (61.133)	Top-5 acc 82.422 (82.043)	lr 0.01142
Train [64][950/3239]	Time 0.239 (0.766)	Data Time 0.001 (0.243)	Loss 2.6975 (2.6069)	Entropy 0.62389 (0.62525)	Top-1 acc 60.938 (61.116)	Top-5 acc 79.688 (82.037)	lr 0.01142
Train [64][960/3239]	Time 0.252 (0.763)	Data Time 0.002 (0.241)	Loss 2.7376 (2.6074)	Entropy 0.62350 (0.62524)	Top-1 acc 56.641 (61.108)	Top-5 acc 80.859 (82.024)	lr 0.01142
Train [64][970/3239]	Time 0.242 (0.759)	Data Time 0.001 (0.238)	Loss 2.6490 (2.6075)	Entropy 0.62355 (0.62522)	Top-1 acc 60.938 (61.102)	Top-5 acc 81.250 (82.028)	lr 0.01142
Train [64][980/3239]	Time 0.248 (0.760)	Data Time 0.001 (0.240)	Loss 2.4042 (2.6077)	Entropy 0.62389 (0.62521)	Top-1 acc 63.672 (61.101)	Top-5 acc 87.500 (82.024)	lr 0.01142
Train [64][990/3239]	Time 0.281 (0.759)	Data Time 0.001 (0.239)	Loss 2.7013 (2.6079)	Entropy 0.62388 (0.62519)	Top-1 acc 57.422 (61.090)	Top-5 acc 78.516 (82.021)	lr 0.01142
Train [64][1000/3239]	Time 0.386 (0.756)	Data Time 0.003 (0.238)	Loss 2.6450 (2.6079)	Entropy 0.62418 (0.62518)	Top-1 acc 57.812 (61.080)	Top-5 acc 82.031 (82.022)	lr 0.01142
Train [64][1010/3239]	Time 0.230 (0.755)	Data Time 0.001 (0.237)	Loss 2.5597 (2.6073)	Entropy 0.62434 (0.62517)	Top-1 acc 60.938 (61.098)	Top-5 acc 83.594 (82.041)	lr 0.01142
Train [64][1020/3239]	Time 0.251 (0.754)	Data Time 0.001 (0.237)	Loss 2.6476 (2.6079)	Entropy 0.62422 (0.62516)	Top-1 acc 60.938 (61.083)	Top-5 acc 80.859 (82.032)	lr 0.01142
Train [64][1030/3239]	Time 0.274 (0.753)	Data Time 0.002 (0.237)	Loss 2.6218 (2.6078)	Entropy 0.62420 (0.62515)	Top-1 acc 60.547 (61.096)	Top-5 acc 82.812 (82.035)	lr 0.01142
Train [64][1040/3239]	Time 0.259 (0.752)	Data Time 0.001 (0.238)	Loss 2.7609 (2.6083)	Entropy 0.62437 (0.62515)	Top-1 acc 58.984 (61.091)	Top-5 acc 79.297 (82.024)	lr 0.01141
Train [64][1050/3239]	Time 0.252 (0.752)	Data Time 0.001 (0.238)	Loss 2.6100 (2.6081)	Entropy 0.62446 (0.62514)	Top-1 acc 61.719 (61.091)	Top-5 acc 82.422 (82.027)	lr 0.01141
Train [64][1060/3239]	Time 0.295 (0.754)	Data Time 0.001 (0.240)	Loss 2.6055 (2.6084)	Entropy 0.62445 (0.62513)	Top-1 acc 63.672 (61.097)	Top-5 acc 78.906 (82.017)	lr 0.01141
Train [64][1070/3239]	Time 0.367 (0.751)	Data Time 0.001 (0.238)	Loss 2.4596 (2.6082)	Entropy 0.62419 (0.62512)	Top-1 acc 66.797 (61.104)	Top-5 acc 84.375 (82.022)	lr 0.01141
Train [64][1080/3239]	Time 0.242 (0.748)	Data Time 0.001 (0.236)	Loss 2.5824 (2.6086)	Entropy 0.62405 (0.62511)	Top-1 acc 58.984 (61.096)	Top-5 acc 83.984 (82.019)	lr 0.01141
Train [64][1090/3239]	Time 0.253 (0.753)	Data Time 0.001 (0.241)	Loss 2.5835 (2.6090)	Entropy 0.62388 (0.62510)	Top-1 acc 60.938 (61.079)	Top-5 acc 83.594 (82.018)	lr 0.01141
Train [64][1100/3239]	Time 0.244 (0.750)	Data Time 0.001 (0.238)	Loss 2.6188 (2.6088)	Entropy 0.62387 (0.62509)	Top-1 acc 59.375 (61.081)	Top-5 acc 82.031 (82.018)	lr 0.01141
Train [64][1110/3239]	Time 0.236 (0.747)	Data Time 0.001 (0.236)	Loss 2.5029 (2.6086)	Entropy 0.62396 (0.62508)	Top-1 acc 65.234 (61.088)	Top-5 acc 82.812 (82.019)	lr 0.01141
Train [64][1120/3239]	Time 0.241 (0.745)	Data Time 0.001 (0.235)	Loss 2.6162 (2.6093)	Entropy 0.62386 (0.62507)	Top-1 acc 59.766 (61.069)	Top-5 acc 81.250 (82.001)	lr 0.01141
Train [64][1130/3239]	Time 0.229 (0.749)	Data Time 0.001 (0.240)	Loss 2.5612 (2.6092)	Entropy 0.62388 (0.62506)	Top-1 acc 64.062 (61.073)	Top-5 acc 82.422 (81.993)	lr 0.01141
Train [64][1140/3239]	Time 0.254 (0.747)	Data Time 0.001 (0.238)	Loss 2.6805 (2.6094)	Entropy 0.62392 (0.62505)	Top-1 acc 59.375 (61.066)	Top-5 acc 82.031 (81.992)	lr 0.01140
Train [64][1150/3239]	Time 0.238 (0.745)	Data Time 0.001 (0.237)	Loss 2.9553 (2.6100)	Entropy 0.62371 (0.62504)	Top-1 acc 53.516 (61.056)	Top-5 acc 75.000 (81.982)	lr 0.01140
Train [64][1160/3239]	Time 0.246 (0.745)	Data Time 0.002 (0.237)	Loss 2.7542 (2.6105)	Entropy 0.62401 (0.62503)	Top-1 acc 57.812 (61.049)	Top-5 acc 79.297 (81.975)	lr 0.01140
Train [64][1170/3239]	Time 0.244 (0.744)	Data Time 0.002 (0.237)	Loss 2.6740 (2.6106)	Entropy 0.62369 (0.62502)	Top-1 acc 56.250 (61.040)	Top-5 acc 80.469 (81.974)	lr 0.01140
Train [64][1180/3239]	Time 0.260 (0.747)	Data Time 0.001 (0.241)	Loss 2.6283 (2.6106)	Entropy 0.62356 (0.62501)	Top-1 acc 58.984 (61.036)	Top-5 acc 80.859 (81.972)	lr 0.01140
Train [64][1190/3239]	Time 0.227 (0.745)	Data Time 0.001 (0.239)	Loss 2.6430 (2.6109)	Entropy 0.62364 (0.62500)	Top-1 acc 60.547 (61.027)	Top-5 acc 81.641 (81.967)	lr 0.01140
Train [64][1200/3239]	Time 0.243 (0.742)	Data Time 0.001 (0.237)	Loss 2.7750 (2.6113)	Entropy 0.62352 (0.62499)	Top-1 acc 58.203 (61.020)	Top-5 acc 78.516 (81.963)	lr 0.01140
Train [64][1210/3239]	Time 0.232 (0.741)	Data Time 0.001 (0.236)	Loss 2.3934 (2.6107)	Entropy 0.62379 (0.62497)	Top-1 acc 66.797 (61.033)	Top-5 acc 86.719 (81.976)	lr 0.01140
Train [64][1220/3239]	Time 0.256 (0.743)	Data Time 0.001 (0.238)	Loss 2.7129 (2.6107)	Entropy 0.62387 (0.62496)	Top-1 acc 57.812 (61.036)	Top-5 acc 79.297 (81.980)	lr 0.01140
Train [64][1230/3239]	Time 0.823 (0.740)	Data Time 0.453 (0.236)	Loss 2.6922 (2.6110)	Entropy 0.62382 (0.62496)	Top-1 acc 57.422 (61.028)	Top-5 acc 80.859 (81.975)	lr 0.01140
Train [64][1240/3239]	Time 0.288 (0.742)	Data Time 0.001 (0.238)	Loss 2.6740 (2.6107)	Entropy 0.62369 (0.62495)	Top-1 acc 60.156 (61.031)	Top-5 acc 80.859 (81.981)	lr 0.01139
Train [64][1250/3239]	Time 0.254 (0.743)	Data Time 0.001 (0.240)	Loss 2.8020 (2.6111)	Entropy 0.62367 (0.62494)	Top-1 acc 52.734 (61.017)	Top-5 acc 78.125 (81.969)	lr 0.01139
Train [64][1260/3239]	Time 0.253 (0.743)	Data Time 0.001 (0.240)	Loss 2.7120 (2.6110)	Entropy 0.62382 (0.62493)	Top-1 acc 56.250 (61.022)	Top-5 acc 78.125 (81.967)	lr 0.01139
Train [64][1270/3239]	Time 0.244 (0.740)	Data Time 0.001 (0.238)	Loss 2.7902 (2.6115)	Entropy 0.62414 (0.62492)	Top-1 acc 53.906 (61.009)	Top-5 acc 79.297 (81.960)	lr 0.01139
Train [64][1280/3239]	Time 0.239 (0.740)	Data Time 0.001 (0.238)	Loss 2.7090 (2.6119)	Entropy 0.62447 (0.62491)	Top-1 acc 57.812 (61.004)	Top-5 acc 79.688 (81.950)	lr 0.01139
Train [64][1290/3239]	Time 0.238 (0.742)	Data Time 0.001 (0.241)	Loss 2.4752 (2.6116)	Entropy 0.62436 (0.62491)	Top-1 acc 61.719 (61.006)	Top-5 acc 85.156 (81.956)	lr 0.01139
Train [64][1300/3239]	Time 0.342 (0.740)	Data Time 0.001 (0.239)	Loss 2.3349 (2.6115)	Entropy 0.62443 (0.62491)	Top-1 acc 70.312 (61.003)	Top-5 acc 86.328 (81.960)	lr 0.01139
Train [64][1310/3239]	Time 0.235 (0.737)	Data Time 0.001 (0.237)	Loss 2.4961 (2.6118)	Entropy 0.62440 (0.62490)	Top-1 acc 63.281 (60.991)	Top-5 acc 83.203 (81.958)	lr 0.01139
Train [64][1320/3239]	Time 0.281 (0.739)	Data Time 0.001 (0.239)	Loss 2.5051 (2.6114)	Entropy 0.62451 (0.62490)	Top-1 acc 63.672 (60.997)	Top-5 acc 83.594 (81.963)	lr 0.01139
Train [64][1330/3239]	Time 0.237 (0.739)	Data Time 0.001 (0.239)	Loss 2.5539 (2.6115)	Entropy 0.62441 (0.62490)	Top-1 acc 60.938 (61.002)	Top-5 acc 82.812 (81.963)	lr 0.01139
Train [64][1340/3239]	Time 0.249 (0.738)	Data Time 0.002 (0.238)	Loss 2.6356 (2.6112)	Entropy 0.62414 (0.62489)	Top-1 acc 60.156 (61.000)	Top-5 acc 81.641 (81.970)	lr 0.01138
Train [64][1350/3239]	Time 0.876 (0.738)	Data Time 0.626 (0.239)	Loss 2.7018 (2.6116)	Entropy 0.62418 (0.62489)	Top-1 acc 58.594 (60.987)	Top-5 acc 80.859 (81.961)	lr 0.01138
Train [64][1360/3239]	Time 1.699 (0.737)	Data Time 1.407 (0.238)	Loss 2.6962 (2.6120)	Entropy 0.62353 (0.62488)	Top-1 acc 58.984 (60.977)	Top-5 acc 79.297 (81.951)	lr 0.01138
Train [64][1370/3239]	Time 0.280 (0.735)	Data Time 0.001 (0.237)	Loss 2.6434 (2.6120)	Entropy 0.62384 (0.62487)	Top-1 acc 62.500 (60.974)	Top-5 acc 78.906 (81.948)	lr 0.01138
Train [64][1380/3239]	Time 0.460 (0.738)	Data Time 0.220 (0.240)	Loss 2.6595 (2.6120)	Entropy 0.62395 (0.62486)	Top-1 acc 62.500 (60.977)	Top-5 acc 82.031 (81.951)	lr 0.01138
Train [64][1390/3239]	Time 1.533 (0.736)	Data Time 1.168 (0.239)	Loss 2.6363 (2.6119)	Entropy 0.62409 (0.62486)	Top-1 acc 62.891 (60.979)	Top-5 acc 82.422 (81.954)	lr 0.01138
Train [64][1400/3239]	Time 0.310 (0.735)	Data Time 0.002 (0.238)	Loss 2.5265 (2.6122)	Entropy 0.62419 (0.62485)	Top-1 acc 62.891 (60.971)	Top-5 acc 82.422 (81.947)	lr 0.01138
Train [64][1410/3239]	Time 0.274 (0.737)	Data Time 0.001 (0.240)	Loss 2.6270 (2.6123)	Entropy 0.62361 (0.62485)	Top-1 acc 60.156 (60.973)	Top-5 acc 82.422 (81.946)	lr 0.01138
Train [64][1420/3239]	Time 0.221 (0.735)	Data Time 0.001 (0.238)	Loss 2.7763 (2.6124)	Entropy 0.62364 (0.62484)	Top-1 acc 57.812 (60.972)	Top-5 acc 80.859 (81.946)	lr 0.01138
Train [64][1430/3239]	Time 0.236 (0.734)	Data Time 0.001 (0.239)	Loss 2.5732 (2.6122)	Entropy 0.62371 (0.62483)	Top-1 acc 63.672 (60.979)	Top-5 acc 82.031 (81.947)	lr 0.01138
Train [64][1440/3239]	Time 0.236 (0.732)	Data Time 0.001 (0.237)	Loss 2.8226 (2.6123)	Entropy 0.62376 (0.62482)	Top-1 acc 59.375 (60.982)	Top-5 acc 77.344 (81.943)	lr 0.01137
Train [64][1450/3239]	Time 0.233 (0.735)	Data Time 0.001 (0.240)	Loss 2.5102 (2.6123)	Entropy 0.62380 (0.62481)	Top-1 acc 64.453 (60.985)	Top-5 acc 83.984 (81.937)	lr 0.01137
Train [64][1460/3239]	Time 1.457 (0.734)	Data Time 1.035 (0.240)	Loss 2.6848 (2.6120)	Entropy 0.62370 (0.62481)	Top-1 acc 57.031 (60.987)	Top-5 acc 81.641 (81.940)	lr 0.01137
Train [64][1470/3239]	Time 0.254 (0.732)	Data Time 0.001 (0.238)	Loss 2.5317 (2.6120)	Entropy 0.62337 (0.62480)	Top-1 acc 63.281 (60.990)	Top-5 acc 83.594 (81.943)	lr 0.01137
Train [64][1480/3239]	Time 0.241 (0.734)	Data Time 0.001 (0.240)	Loss 2.7467 (2.6119)	Entropy 0.62314 (0.62479)	Top-1 acc 54.688 (60.984)	Top-5 acc 82.422 (81.943)	lr 0.01137
Train [64][1490/3239]	Time 0.238 (0.732)	Data Time 0.001 (0.239)	Loss 2.6760 (2.6122)	Entropy 0.62326 (0.62478)	Top-1 acc 56.250 (60.984)	Top-5 acc 80.859 (81.940)	lr 0.01137
Train [64][1500/3239]	Time 0.259 (0.733)	Data Time 0.001 (0.241)	Loss 2.5921 (2.6121)	Entropy 0.62340 (0.62477)	Top-1 acc 63.672 (60.987)	Top-5 acc 83.984 (81.941)	lr 0.01137
Train [64][1510/3239]	Time 0.231 (0.734)	Data Time 0.001 (0.241)	Loss 2.5299 (2.6117)	Entropy 0.62358 (0.62476)	Top-1 acc 62.500 (60.998)	Top-5 acc 85.547 (81.951)	lr 0.01137
Train [64][1520/3239]	Time 0.425 (0.758)	Data Time 0.007 (0.240)	Loss 2.6981 (2.6119)	Entropy 0.62372 (0.62475)	Top-1 acc 60.547 (60.992)	Top-5 acc 80.078 (81.944)	lr 0.01137
Train [64][1530/3239]	Time 0.231 (0.756)	Data Time 0.002 (0.238)	Loss 2.4059 (2.6118)	Entropy 0.62375 (0.62475)	Top-1 acc 66.406 (61.000)	Top-5 acc 83.203 (81.946)	lr 0.01137
Train [64][1540/3239]	Time 0.264 (0.754)	Data Time 0.002 (0.237)	Loss 2.4615 (2.6119)	Entropy 0.62383 (0.62474)	Top-1 acc 64.844 (61.007)	Top-5 acc 84.375 (81.946)	lr 0.01136
Train [64][1550/3239]	Time 0.370 (0.752)	Data Time 0.001 (0.235)	Loss 2.5688 (2.6120)	Entropy 0.62390 (0.62473)	Top-1 acc 64.844 (61.002)	Top-5 acc 81.641 (81.939)	lr 0.01136
Train [64][1560/3239]	Time 0.256 (0.750)	Data Time 0.001 (0.234)	Loss 2.7258 (2.6122)	Entropy 0.62350 (0.62473)	Top-1 acc 55.469 (61.001)	Top-5 acc 78.516 (81.933)	lr 0.01136
Train [64][1570/3239]	Time 0.243 (0.748)	Data Time 0.001 (0.232)	Loss 2.6127 (2.6125)	Entropy 0.62346 (0.62472)	Top-1 acc 61.328 (60.988)	Top-5 acc 79.297 (81.924)	lr 0.01136
Train [64][1580/3239]	Time 0.248 (0.746)	Data Time 0.001 (0.231)	Loss 2.5626 (2.6122)	Entropy 0.62339 (0.62471)	Top-1 acc 57.812 (60.996)	Top-5 acc 83.984 (81.935)	lr 0.01136
Train [64][1590/3239]	Time 0.248 (0.744)	Data Time 0.002 (0.229)	Loss 2.5409 (2.6120)	Entropy 0.62337 (0.62470)	Top-1 acc 61.328 (60.997)	Top-5 acc 83.984 (81.938)	lr 0.01136
Train [64][1600/3239]	Time 0.238 (0.743)	Data Time 0.001 (0.228)	Loss 2.4614 (2.6116)	Entropy 0.62321 (0.62470)	Top-1 acc 64.844 (61.008)	Top-5 acc 85.156 (81.943)	lr 0.01136
Train [64][1610/3239]	Time 0.242 (0.741)	Data Time 0.001 (0.227)	Loss 2.8612 (2.6117)	Entropy 0.62324 (0.62469)	Top-1 acc 58.203 (61.003)	Top-5 acc 78.125 (81.940)	lr 0.01136
Train [64][1620/3239]	Time 0.425 (0.744)	Data Time 0.001 (0.230)	Loss 2.4760 (2.6119)	Entropy 0.62335 (0.62468)	Top-1 acc 62.109 (61.000)	Top-5 acc 86.328 (81.940)	lr 0.01136
Train [64][1630/3239]	Time 0.289 (0.743)	Data Time 0.002 (0.229)	Loss 2.4761 (2.6117)	Entropy 0.62337 (0.62467)	Top-1 acc 63.672 (61.002)	Top-5 acc 84.375 (81.942)	lr 0.01136
Train [64][1640/3239]	Time 0.244 (0.743)	Data Time 0.001 (0.229)	Loss 2.5393 (2.6114)	Entropy 0.62327 (0.62466)	Top-1 acc 60.547 (61.009)	Top-5 acc 83.203 (81.949)	lr 0.01135
Train [64][1650/3239]	Time 0.233 (0.745)	Data Time 0.001 (0.232)	Loss 2.8174 (2.6117)	Entropy 0.62327 (0.62465)	Top-1 acc 58.594 (61.006)	Top-5 acc 78.125 (81.946)	lr 0.01135
Train [64][1660/3239]	Time 0.302 (0.748)	Data Time 0.001 (0.235)	Loss 2.8201 (2.6117)	Entropy 0.62331 (0.62465)	Top-1 acc 56.250 (61.008)	Top-5 acc 75.391 (81.946)	lr 0.01135
Train [64][1670/3239]	Time 0.225 (0.746)	Data Time 0.001 (0.234)	Loss 2.6615 (2.6122)	Entropy 0.62336 (0.62464)	Top-1 acc 58.984 (60.998)	Top-5 acc 82.422 (81.934)	lr 0.01135
Train [64][1680/3239]	Time 4.345 (0.747)	Data Time 4.091 (0.235)	Loss 2.5084 (2.6119)	Entropy 0.62307 (0.62463)	Top-1 acc 62.891 (60.997)	Top-5 acc 84.375 (81.938)	lr 0.01135
Train [64][1690/3239]	Time 0.228 (0.749)	Data Time 0.001 (0.238)	Loss 2.6381 (2.6123)	Entropy 0.62299 (0.62462)	Top-1 acc 58.984 (60.993)	Top-5 acc 80.859 (81.929)	lr 0.01135
Train [64][1700/3239]	Time 0.236 (0.747)	Data Time 0.001 (0.236)	Loss 2.7145 (2.6125)	Entropy 0.62320 (0.62461)	Top-1 acc 57.422 (60.991)	Top-5 acc 83.203 (81.928)	lr 0.01135
Train [64][1710/3239]	Time 0.259 (0.745)	Data Time 0.001 (0.235)	Loss 2.7225 (2.6127)	Entropy 0.62301 (0.62460)	Top-1 acc 61.328 (60.991)	Top-5 acc 78.906 (81.923)	lr 0.01135
Train [64][1720/3239]	Time 0.258 (0.751)	Data Time 0.001 (0.241)	Loss 2.4919 (2.6125)	Entropy 0.62299 (0.62459)	Top-1 acc 63.281 (60.995)	Top-5 acc 83.203 (81.924)	lr 0.01135
Train [64][1730/3239]	Time 0.236 (0.750)	Data Time 0.001 (0.240)	Loss 2.4519 (2.6127)	Entropy 0.62317 (0.62458)	Top-1 acc 64.844 (60.983)	Top-5 acc 86.719 (81.923)	lr 0.01135
Train [64][1740/3239]	Time 0.253 (0.748)	Data Time 0.002 (0.239)	Loss 2.6435 (2.6126)	Entropy 0.62343 (0.62458)	Top-1 acc 62.891 (60.983)	Top-5 acc 83.203 (81.926)	lr 0.01134
Train [64][1750/3239]	Time 0.240 (0.749)	Data Time 0.002 (0.239)	Loss 2.5910 (2.6124)	Entropy 0.62334 (0.62457)	Top-1 acc 61.719 (60.991)	Top-5 acc 83.984 (81.933)	lr 0.01134
Train [64][1760/3239]	Time 0.242 (0.752)	Data Time 0.001 (0.243)	Loss 2.7817 (2.6125)	Entropy 0.62339 (0.62456)	Top-1 acc 57.422 (60.987)	Top-5 acc 78.906 (81.931)	lr 0.01134
Train [64][1770/3239]	Time 0.224 (0.750)	Data Time 0.001 (0.242)	Loss 2.9003 (2.6128)	Entropy 0.62347 (0.62456)	Top-1 acc 51.172 (60.980)	Top-5 acc 78.516 (81.929)	lr 0.01134
Train [64][1780/3239]	Time 0.327 (0.750)	Data Time 0.001 (0.243)	Loss 2.5164 (2.6127)	Entropy 0.62352 (0.62455)	Top-1 acc 62.891 (60.982)	Top-5 acc 83.594 (81.932)	lr 0.01134
Train [64][1790/3239]	Time 0.258 (0.754)	Data Time 0.001 (0.246)	Loss 2.5806 (2.6124)	Entropy 0.62369 (0.62454)	Top-1 acc 59.375 (60.986)	Top-5 acc 82.812 (81.941)	lr 0.01134
Train [64][1800/3239]	Time 0.275 (0.752)	Data Time 0.001 (0.245)	Loss 2.6235 (2.6125)	Entropy 0.62374 (0.62454)	Top-1 acc 65.625 (60.984)	Top-5 acc 82.422 (81.942)	lr 0.01134
Train [64][1810/3239]	Time 0.237 (0.750)	Data Time 0.001 (0.244)	Loss 2.5373 (2.6123)	Entropy 0.62388 (0.62454)	Top-1 acc 62.500 (60.992)	Top-5 acc 85.156 (81.951)	lr 0.01134
Train [64][1820/3239]	Time 0.270 (0.753)	Data Time 0.002 (0.247)	Loss 2.5079 (2.6123)	Entropy 0.62349 (0.62453)	Top-1 acc 61.719 (60.989)	Top-5 acc 84.766 (81.956)	lr 0.01134
Train [64][1830/3239]	Time 0.262 (0.752)	Data Time 0.001 (0.246)	Loss 2.6491 (2.6121)	Entropy 0.62368 (0.62453)	Top-1 acc 62.109 (60.994)	Top-5 acc 83.203 (81.956)	lr 0.01134
Train [64][1840/3239]	Time 0.267 (0.750)	Data Time 0.001 (0.245)	Loss 2.5278 (2.6121)	Entropy 0.62378 (0.62452)	Top-1 acc 59.766 (60.989)	Top-5 acc 85.938 (81.961)	lr 0.01133
Train [64][1850/3239]	Time 0.377 (0.756)	Data Time 0.002 (0.250)	Loss 2.8496 (2.6121)	Entropy 0.62407 (0.62452)	Top-1 acc 56.250 (60.990)	Top-5 acc 77.344 (81.958)	lr 0.01133
Train [64][1860/3239]	Time 0.248 (0.754)	Data Time 0.001 (0.249)	Loss 2.6858 (2.6120)	Entropy 0.62404 (0.62451)	Top-1 acc 59.375 (61.000)	Top-5 acc 80.859 (81.958)	lr 0.01133
Train [64][1870/3239]	Time 0.240 (0.752)	Data Time 0.001 (0.247)	Loss 2.8393 (2.6120)	Entropy 0.62413 (0.62451)	Top-1 acc 58.203 (60.996)	Top-5 acc 76.953 (81.956)	lr 0.01133
Train [64][1880/3239]	Time 0.253 (0.757)	Data Time 0.001 (0.252)	Loss 2.7743 (2.6120)	Entropy 0.62399 (0.62451)	Top-1 acc 56.641 (60.998)	Top-5 acc 80.469 (81.956)	lr 0.01133
Train [64][1890/3239]	Time 0.233 (0.755)	Data Time 0.001 (0.252)	Loss 2.5934 (2.6120)	Entropy 0.62433 (0.62451)	Top-1 acc 58.594 (60.997)	Top-5 acc 83.984 (81.958)	lr 0.01133
Train [64][1900/3239]	Time 0.231 (0.754)	Data Time 0.001 (0.250)	Loss 2.3845 (2.6119)	Entropy 0.62432 (0.62451)	Top-1 acc 67.578 (61.001)	Top-5 acc 85.156 (81.958)	lr 0.01133
Train [64][1910/3239]	Time 0.276 (0.753)	Data Time 0.001 (0.250)	Loss 2.7466 (2.6123)	Entropy 0.62421 (0.62451)	Top-1 acc 58.984 (60.992)	Top-5 acc 78.125 (81.952)	lr 0.01133
Train [64][1920/3239]	Time 0.255 (0.757)	Data Time 0.001 (0.254)	Loss 2.3613 (2.6120)	Entropy 0.62416 (0.62450)	Top-1 acc 68.359 (61.002)	Top-5 acc 84.375 (81.954)	lr 0.01133
Train [64][1930/3239]	Time 0.238 (0.756)	Data Time 0.001 (0.254)	Loss 2.7045 (2.6120)	Entropy 0.62377 (0.62450)	Top-1 acc 60.156 (60.995)	Top-5 acc 79.297 (81.955)	lr 0.01133
Train [64][1940/3239]	Time 0.333 (0.754)	Data Time 0.001 (0.253)	Loss 2.8451 (2.6122)	Entropy 0.62383 (0.62450)	Top-1 acc 55.078 (60.991)	Top-5 acc 78.516 (81.952)	lr 0.01132
Train [64][1950/3239]	Time 0.246 (0.760)	Data Time 0.001 (0.258)	Loss 2.7102 (2.6125)	Entropy 0.62361 (0.62449)	Top-1 acc 60.156 (60.983)	Top-5 acc 79.297 (81.947)	lr 0.01132
Train [64][1960/3239]	Time 0.241 (0.759)	Data Time 0.001 (0.258)	Loss 2.4894 (2.6127)	Entropy 0.62310 (0.62449)	Top-1 acc 61.719 (60.980)	Top-5 acc 87.109 (81.943)	lr 0.01132
Train [64][1970/3239]	Time 0.255 (0.758)	Data Time 0.001 (0.257)	Loss 2.6029 (2.6125)	Entropy 0.62327 (0.62448)	Top-1 acc 58.594 (60.977)	Top-5 acc 82.812 (81.946)	lr 0.01132
Train [64][1980/3239]	Time 0.229 (0.761)	Data Time 0.001 (0.261)	Loss 2.6544 (2.6127)	Entropy 0.62306 (0.62448)	Top-1 acc 60.938 (60.970)	Top-5 acc 80.469 (81.944)	lr 0.01132
Train [64][1990/3239]	Time 0.225 (0.763)	Data Time 0.001 (0.263)	Loss 2.7265 (2.6128)	Entropy 0.62324 (0.62447)	Top-1 acc 60.547 (60.967)	Top-5 acc 79.688 (81.944)	lr 0.01132
Train [64][2000/3239]	Time 0.243 (0.761)	Data Time 0.001 (0.261)	Loss 2.7059 (2.6129)	Entropy 0.62348 (0.62446)	Top-1 acc 59.375 (60.965)	Top-5 acc 79.688 (81.943)	lr 0.01132
Train [64][2010/3239]	Time 0.400 (0.764)	Data Time 0.002 (0.265)	Loss 2.5495 (2.6129)	Entropy 0.62292 (0.62446)	Top-1 acc 63.281 (60.970)	Top-5 acc 82.812 (81.947)	lr 0.01132
Train [64][2020/3239]	Time 0.232 (0.765)	Data Time 0.001 (0.266)	Loss 2.7221 (2.6129)	Entropy 0.62296 (0.62445)	Top-1 acc 61.328 (60.970)	Top-5 acc 79.688 (81.947)	lr 0.01132
Train [64][2030/3239]	Time 0.232 (0.763)	Data Time 0.001 (0.264)	Loss 2.5180 (2.6128)	Entropy 0.62271 (0.62444)	Top-1 acc 65.234 (60.981)	Top-5 acc 82.422 (81.945)	lr 0.01131
Train [64][2040/3239]	Time 0.236 (0.767)	Data Time 0.001 (0.269)	Loss 2.6300 (2.6130)	Entropy 0.62283 (0.62444)	Top-1 acc 61.328 (60.979)	Top-5 acc 81.641 (81.938)	lr 0.01131
Train [64][2050/3239]	Time 0.225 (0.767)	Data Time 0.001 (0.270)	Loss 2.8161 (2.6129)	Entropy 0.62296 (0.62443)	Top-1 acc 56.250 (60.982)	Top-5 acc 77.734 (81.941)	lr 0.01131
Train [64][2060/3239]	Time 0.228 (0.766)	Data Time 0.001 (0.268)	Loss 2.5286 (2.6130)	Entropy 0.62298 (0.62442)	Top-1 acc 60.156 (60.979)	Top-5 acc 83.594 (81.940)	lr 0.01131
Train [64][2070/3239]	Time 0.252 (0.764)	Data Time 0.001 (0.267)	Loss 2.4707 (2.6128)	Entropy 0.62251 (0.62441)	Top-1 acc 62.109 (60.982)	Top-5 acc 87.500 (81.942)	lr 0.01131
Train [64][2080/3239]	Time 0.236 (0.769)	Data Time 0.001 (0.272)	Loss 2.6376 (2.6127)	Entropy 0.62204 (0.62440)	Top-1 acc 60.547 (60.983)	Top-5 acc 80.859 (81.942)	lr 0.01131
Train [64][2090/3239]	Time 0.248 (0.771)	Data Time 0.001 (0.274)	Loss 2.5668 (2.6131)	Entropy 0.62182 (0.62439)	Top-1 acc 64.062 (60.975)	Top-5 acc 79.688 (81.936)	lr 0.01131
Train [64][2100/3239]	Time 0.309 (0.769)	Data Time 0.001 (0.273)	Loss 2.5103 (2.6132)	Entropy 0.62189 (0.62438)	Top-1 acc 64.062 (60.970)	Top-5 acc 83.984 (81.936)	lr 0.01131
Train [64][2110/3239]	Time 0.258 (0.773)	Data Time 0.002 (0.277)	Loss 2.6577 (2.6137)	Entropy 0.62164 (0.62437)	Top-1 acc 61.328 (60.962)	Top-5 acc 80.469 (81.926)	lr 0.01131
Train [64][2120/3239]	Time 0.279 (0.774)	Data Time 0.001 (0.278)	Loss 2.7251 (2.6137)	Entropy 0.62170 (0.62435)	Top-1 acc 58.203 (60.962)	Top-5 acc 77.734 (81.922)	lr 0.01131
Train [64][2130/3239]	Time 0.242 (0.772)	Data Time 0.001 (0.277)	Loss 2.6103 (2.6136)	Entropy 0.62169 (0.62434)	Top-1 acc 57.812 (60.965)	Top-5 acc 80.469 (81.921)	lr 0.01130
Train [64][2140/3239]	Time 0.249 (0.776)	Data Time 0.001 (0.281)	Loss 2.6073 (2.6137)	Entropy 0.62180 (0.62433)	Top-1 acc 63.281 (60.965)	Top-5 acc 77.344 (81.917)	lr 0.01130
Train [64][2150/3239]	Time 0.228 (0.776)	Data Time 0.001 (0.282)	Loss 2.6737 (2.6137)	Entropy 0.62184 (0.62432)	Top-1 acc 60.938 (60.965)	Top-5 acc 82.031 (81.918)	lr 0.01130
Train [64][2160/3239]	Time 0.234 (0.775)	Data Time 0.001 (0.281)	Loss 2.5973 (2.6138)	Entropy 0.62151 (0.62431)	Top-1 acc 61.328 (60.960)	Top-5 acc 82.812 (81.915)	lr 0.01130
Train [64][2170/3239]	Time 0.355 (0.779)	Data Time 0.001 (0.285)	Loss 2.6329 (2.6138)	Entropy 0.62141 (0.62429)	Top-1 acc 59.375 (60.958)	Top-5 acc 82.422 (81.916)	lr 0.01130
Train [64][2180/3239]	Time 0.279 (0.796)	Data Time 0.002 (0.285)	Loss 2.6063 (2.6138)	Entropy 0.62139 (0.62428)	Top-1 acc 61.328 (60.960)	Top-5 acc 81.641 (81.918)	lr 0.01130
Train [64][2190/3239]	Time 0.226 (0.794)	Data Time 0.001 (0.283)	Loss 2.4217 (2.6139)	Entropy 0.62143 (0.62427)	Top-1 acc 67.578 (60.957)	Top-5 acc 83.984 (81.915)	lr 0.01130
Train [64][2200/3239]	Time 0.240 (0.793)	Data Time 0.002 (0.282)	Loss 2.4722 (2.6135)	Entropy 0.62086 (0.62425)	Top-1 acc 65.625 (60.966)	Top-5 acc 84.766 (81.921)	lr 0.01130
Train [64][2210/3239]	Time 0.242 (0.791)	Data Time 0.001 (0.281)	Loss 2.5740 (2.6135)	Entropy 0.62065 (0.62424)	Top-1 acc 64.062 (60.964)	Top-5 acc 82.422 (81.921)	lr 0.01130
Train [64][2220/3239]	Time 0.258 (0.790)	Data Time 0.002 (0.280)	Loss 2.5356 (2.6134)	Entropy 0.62084 (0.62422)	Top-1 acc 62.891 (60.968)	Top-5 acc 81.250 (81.924)	lr 0.01130
Train [64][2230/3239]	Time 0.245 (0.788)	Data Time 0.001 (0.278)	Loss 2.7089 (2.6139)	Entropy 0.62069 (0.62421)	Top-1 acc 58.203 (60.956)	Top-5 acc 77.734 (81.918)	lr 0.01129
Train [64][2240/3239]	Time 2.935 (0.789)	Data Time 2.686 (0.280)	Loss 2.6117 (2.6138)	Entropy 0.62055 (0.62419)	Top-1 acc 63.281 (60.962)	Top-5 acc 82.812 (81.919)	lr 0.01129
Train [64][2250/3239]	Time 0.238 (0.789)	Data Time 0.001 (0.280)	Loss 2.5222 (2.6140)	Entropy 0.62079 (0.62417)	Top-1 acc 63.672 (60.961)	Top-5 acc 83.984 (81.916)	lr 0.01129
Train [64][2260/3239]	Time 0.333 (0.788)	Data Time 0.001 (0.279)	Loss 2.5691 (2.6141)	Entropy 0.62118 (0.62416)	Top-1 acc 61.328 (60.956)	Top-5 acc 82.812 (81.916)	lr 0.01129
Train [64][2270/3239]	Time 0.231 (0.789)	Data Time 0.001 (0.281)	Loss 2.6298 (2.6141)	Entropy 0.62111 (0.62415)	Top-1 acc 59.766 (60.955)	Top-5 acc 82.031 (81.917)	lr 0.01129
Train [64][2280/3239]	Time 0.237 (0.795)	Data Time 0.001 (0.288)	Loss 2.6171 (2.6141)	Entropy 0.62076 (0.62413)	Top-1 acc 59.375 (60.953)	Top-5 acc 82.812 (81.916)	lr 0.01129
Train [64][2290/3239]	Time 0.238 (0.794)	Data Time 0.001 (0.286)	Loss 2.5587 (2.6144)	Entropy 0.62083 (0.62412)	Top-1 acc 64.453 (60.948)	Top-5 acc 83.594 (81.910)	lr 0.01129
Train [64][2300/3239]	Time 0.237 (0.794)	Data Time 0.001 (0.287)	Loss 2.5423 (2.6144)	Entropy 0.62105 (0.62410)	Top-1 acc 63.281 (60.949)	Top-5 acc 83.984 (81.911)	lr 0.01129
Train [64][2310/3239]	Time 0.235 (0.800)	Data Time 0.001 (0.294)	Loss 2.7978 (2.6147)	Entropy 0.62113 (0.62409)	Top-1 acc 58.594 (60.943)	Top-5 acc 80.859 (81.907)	lr 0.01129
Train [64][2320/3239]	Time 0.233 (0.799)	Data Time 0.001 (0.293)	Loss 2.3629 (2.6143)	Entropy 0.62083 (0.62408)	Top-1 acc 63.672 (60.951)	Top-5 acc 86.719 (81.915)	lr 0.01129
Train [64][2330/3239]	Time 0.322 (0.799)	Data Time 0.001 (0.293)	Loss 2.7510 (2.6143)	Entropy 0.62063 (0.62406)	Top-1 acc 58.203 (60.954)	Top-5 acc 78.906 (81.912)	lr 0.01128
Train [64][2340/3239]	Time 0.235 (0.806)	Data Time 0.001 (0.300)	Loss 2.6617 (2.6144)	Entropy 0.62084 (0.62405)	Top-1 acc 59.375 (60.951)	Top-5 acc 82.031 (81.912)	lr 0.01128
Train [64][2350/3239]	Time 0.244 (0.805)	Data Time 0.001 (0.299)	Loss 2.7697 (2.6146)	Entropy 0.62098 (0.62404)	Top-1 acc 59.375 (60.946)	Top-5 acc 77.344 (81.906)	lr 0.01128
Train [64][2360/3239]	Time 0.219 (0.805)	Data Time 0.001 (0.300)	Loss 2.7316 (2.6149)	Entropy 0.62119 (0.62402)	Top-1 acc 59.766 (60.941)	Top-5 acc 79.297 (81.906)	lr 0.01128
Train [64][2370/3239]	Time 0.241 (0.811)	Data Time 0.001 (0.306)	Loss 2.6017 (2.6150)	Entropy 0.62131 (0.62401)	Top-1 acc 60.547 (60.939)	Top-5 acc 83.984 (81.907)	lr 0.01128
Train [64][2380/3239]	Time 0.223 (0.810)	Data Time 0.001 (0.306)	Loss 2.7852 (2.6152)	Entropy 0.62118 (0.62400)	Top-1 acc 59.375 (60.931)	Top-5 acc 78.906 (81.901)	lr 0.01128
Train [64][2390/3239]	Time 0.261 (0.809)	Data Time 0.001 (0.305)	Loss 2.7307 (2.6149)	Entropy 0.62114 (0.62399)	Top-1 acc 57.422 (60.938)	Top-5 acc 80.469 (81.909)	lr 0.01128
Train [64][2400/3239]	Time 4.049 (0.814)	Data Time 3.795 (0.311)	Loss 2.5369 (2.6149)	Entropy 0.62149 (0.62398)	Top-1 acc 60.938 (60.937)	Top-5 acc 83.594 (81.908)	lr 0.01128
Train [64][2410/3239]	Time 0.252 (0.816)	Data Time 0.001 (0.313)	Loss 2.6086 (2.6149)	Entropy 0.62166 (0.62397)	Top-1 acc 60.547 (60.933)	Top-5 acc 81.641 (81.907)	lr 0.01128
Train [64][2420/3239]	Time 0.254 (0.815)	Data Time 0.002 (0.312)	Loss 2.5697 (2.6151)	Entropy 0.62199 (0.62396)	Top-1 acc 59.375 (60.928)	Top-5 acc 81.641 (81.900)	lr 0.01128
Train [64][2430/3239]	Time 0.250 (0.816)	Data Time 0.001 (0.313)	Loss 2.5228 (2.6150)	Entropy 0.62217 (0.62395)	Top-1 acc 62.891 (60.933)	Top-5 acc 83.594 (81.902)	lr 0.01127
Train [64][2440/3239]	Time 0.242 (0.821)	Data Time 0.001 (0.318)	Loss 2.4512 (2.6151)	Entropy 0.62224 (0.62394)	Top-1 acc 65.234 (60.927)	Top-5 acc 85.547 (81.900)	lr 0.01127
Train [64][2450/3239]	Time 0.243 (0.820)	Data Time 0.001 (0.318)	Loss 2.4793 (2.6148)	Entropy 0.62215 (0.62394)	Top-1 acc 62.500 (60.932)	Top-5 acc 83.594 (81.905)	lr 0.01127
Train [64][2460/3239]	Time 0.250 (0.821)	Data Time 0.001 (0.319)	Loss 2.5473 (2.6149)	Entropy 0.62216 (0.62393)	Top-1 acc 62.891 (60.930)	Top-5 acc 81.641 (81.902)	lr 0.01127
Train [64][2470/3239]	Time 0.241 (0.827)	Data Time 0.001 (0.325)	Loss 2.5030 (2.6146)	Entropy 0.62209 (0.62392)	Top-1 acc 62.500 (60.936)	Top-5 acc 82.812 (81.907)	lr 0.01127
Train [64][2480/3239]	Time 0.227 (0.825)	Data Time 0.001 (0.324)	Loss 2.5940 (2.6147)	Entropy 0.62222 (0.62392)	Top-1 acc 60.547 (60.936)	Top-5 acc 83.203 (81.905)	lr 0.01127
Train [64][2490/3239]	Time 0.328 (0.825)	Data Time 0.001 (0.324)	Loss 2.5038 (2.6146)	Entropy 0.62194 (0.62391)	Top-1 acc 64.844 (60.939)	Top-5 acc 82.422 (81.906)	lr 0.01127
Train [64][2500/3239]	Time 0.236 (0.834)	Data Time 0.001 (0.333)	Loss 2.7428 (2.6149)	Entropy 0.62183 (0.62390)	Top-1 acc 57.812 (60.932)	Top-5 acc 80.078 (81.901)	lr 0.01127
Train [64][2510/3239]	Time 0.252 (0.832)	Data Time 0.001 (0.332)	Loss 2.6235 (2.6149)	Entropy 0.62200 (0.62389)	Top-1 acc 57.422 (60.928)	Top-5 acc 83.984 (81.901)	lr 0.01127
Train [64][2520/3239]	Time 0.237 (0.831)	Data Time 0.001 (0.331)	Loss 2.3302 (2.6150)	Entropy 0.62165 (0.62388)	Top-1 acc 72.656 (60.932)	Top-5 acc 84.375 (81.901)	lr 0.01127
Train [64][2530/3239]	Time 0.220 (0.836)	Data Time 0.001 (0.337)	Loss 2.6491 (2.6149)	Entropy 0.62174 (0.62388)	Top-1 acc 59.375 (60.932)	Top-5 acc 80.078 (81.901)	lr 0.01126
Train [64][2540/3239]	Time 0.254 (0.836)	Data Time 0.001 (0.337)	Loss 2.3723 (2.6148)	Entropy 0.62214 (0.62387)	Top-1 acc 66.406 (60.936)	Top-5 acc 88.672 (81.905)	lr 0.01126
Train [64][2550/3239]	Time 0.223 (0.835)	Data Time 0.001 (0.336)	Loss 2.6629 (2.6148)	Entropy 0.62230 (0.62386)	Top-1 acc 60.156 (60.939)	Top-5 acc 82.422 (81.905)	lr 0.01126
Train [64][2560/3239]	Time 10.452 (0.840)	Data Time 10.074 (0.342)	Loss 2.6308 (2.6152)	Entropy 0.62263 (0.62386)	Top-1 acc 58.594 (60.929)	Top-5 acc 80.078 (81.896)	lr 0.01126
Train [64][2570/3239]	Time 0.252 (0.842)	Data Time 0.001 (0.344)	Loss 2.6981 (2.6153)	Entropy 0.62251 (0.62385)	Top-1 acc 60.547 (60.927)	Top-5 acc 80.469 (81.892)	lr 0.01126
Train [64][2580/3239]	Time 0.273 (0.841)	Data Time 0.001 (0.343)	Loss 2.5119 (2.6154)	Entropy 0.62255 (0.62385)	Top-1 acc 62.109 (60.925)	Top-5 acc 83.984 (81.892)	lr 0.01126
Train [64][2590/3239]	Time 0.261 (0.841)	Data Time 0.001 (0.344)	Loss 2.4542 (2.6153)	Entropy 0.62243 (0.62384)	Top-1 acc 62.891 (60.927)	Top-5 acc 84.375 (81.895)	lr 0.01126
Train [64][2600/3239]	Time 0.231 (0.846)	Data Time 0.001 (0.349)	Loss 2.5980 (2.6154)	Entropy 0.62229 (0.62383)	Top-1 acc 62.109 (60.926)	Top-5 acc 80.078 (81.894)	lr 0.01126
Train [64][2610/3239]	Time 0.233 (0.847)	Data Time 0.001 (0.350)	Loss 2.4626 (2.6153)	Entropy 0.62193 (0.62383)	Top-1 acc 62.109 (60.926)	Top-5 acc 84.375 (81.898)	lr 0.01126
Train [64][2620/3239]	Time 0.243 (0.846)	Data Time 0.001 (0.349)	Loss 2.7277 (2.6153)	Entropy 0.62228 (0.62382)	Top-1 acc 59.375 (60.931)	Top-5 acc 80.469 (81.896)	lr 0.01126
Train [64][2630/3239]	Time 0.232 (0.851)	Data Time 0.001 (0.354)	Loss 3.0046 (2.6155)	Entropy 0.62235 (0.62382)	Top-1 acc 50.391 (60.922)	Top-5 acc 74.219 (81.894)	lr 0.01125
Train [64][2640/3239]	Time 0.228 (0.852)	Data Time 0.001 (0.356)	Loss 2.7343 (2.6154)	Entropy 0.62254 (0.62381)	Top-1 acc 58.984 (60.923)	Top-5 acc 78.906 (81.895)	lr 0.01125
Train [64][2650/3239]	Time 0.296 (0.850)	Data Time 0.001 (0.354)	Loss 2.8684 (2.6156)	Entropy 0.62262 (0.62381)	Top-1 acc 54.688 (60.921)	Top-5 acc 77.344 (81.889)	lr 0.01125
Train [64][2660/3239]	Time 0.261 (0.856)	Data Time 0.038 (0.360)	Loss 2.5020 (2.6161)	Entropy 0.62254 (0.62380)	Top-1 acc 63.672 (60.909)	Top-5 acc 85.156 (81.880)	lr 0.01125
Train [64][2670/3239]	Time 6.196 (0.858)	Data Time 5.934 (0.363)	Loss 2.3880 (2.6160)	Entropy 0.62243 (0.62380)	Top-1 acc 66.797 (60.912)	Top-5 acc 85.547 (81.881)	lr 0.01125
Train [64][2680/3239]	Time 0.233 (0.856)	Data Time 0.001 (0.362)	Loss 2.5822 (2.6162)	Entropy 0.62222 (0.62379)	Top-1 acc 62.109 (60.907)	Top-5 acc 82.031 (81.875)	lr 0.01125
Train [64][2690/3239]	Time 0.229 (0.858)	Data Time 0.001 (0.363)	Loss 2.6763 (2.6164)	Entropy 0.62226 (0.62379)	Top-1 acc 63.281 (60.904)	Top-5 acc 80.859 (81.871)	lr 0.01125
Train [64][2700/3239]	Time 0.224 (0.860)	Data Time 0.001 (0.366)	Loss 3.0195 (2.6167)	Entropy 0.62242 (0.62378)	Top-1 acc 54.297 (60.899)	Top-5 acc 75.000 (81.866)	lr 0.01125
Train [64][2710/3239]	Time 0.239 (0.862)	Data Time 0.001 (0.368)	Loss 2.9028 (2.6168)	Entropy 0.62266 (0.62378)	Top-1 acc 53.906 (60.897)	Top-5 acc 75.000 (81.861)	lr 0.01125
Train [64][2720/3239]	Time 1.948 (0.861)	Data Time 1.609 (0.367)	Loss 2.6139 (2.6167)	Entropy 0.62242 (0.62377)	Top-1 acc 60.156 (60.900)	Top-5 acc 81.641 (81.862)	lr 0.01125
Train [64][2730/3239]	Time 0.251 (0.864)	Data Time 0.001 (0.371)	Loss 2.7481 (2.6167)	Entropy 0.62228 (0.62377)	Top-1 acc 60.547 (60.903)	Top-5 acc 78.516 (81.860)	lr 0.01124
Train [64][2740/3239]	Time 0.288 (0.867)	Data Time 0.001 (0.373)	Loss 2.5647 (2.6167)	Entropy 0.62233 (0.62376)	Top-1 acc 65.625 (60.903)	Top-5 acc 80.469 (81.859)	lr 0.01124
Train [64][2750/3239]	Time 0.224 (0.865)	Data Time 0.001 (0.372)	Loss 2.6938 (2.6168)	Entropy 0.62252 (0.62376)	Top-1 acc 58.984 (60.901)	Top-5 acc 80.469 (81.858)	lr 0.01124
Train [64][2760/3239]	Time 0.264 (0.868)	Data Time 0.001 (0.375)	Loss 2.5503 (2.6168)	Entropy 0.62266 (0.62375)	Top-1 acc 62.109 (60.896)	Top-5 acc 82.031 (81.859)	lr 0.01124
Train [64][2770/3239]	Time 0.235 (0.871)	Data Time 0.001 (0.379)	Loss 2.6582 (2.6167)	Entropy 0.62272 (0.62375)	Top-1 acc 63.281 (60.901)	Top-5 acc 81.250 (81.860)	lr 0.01124
Train [64][2780/3239]	Time 0.256 (0.870)	Data Time 0.001 (0.377)	Loss 2.6913 (2.6168)	Entropy 0.62304 (0.62374)	Top-1 acc 59.375 (60.897)	Top-5 acc 81.250 (81.857)	lr 0.01124
Train [64][2790/3239]	Time 0.387 (0.874)	Data Time 0.001 (0.382)	Loss 2.8094 (2.6170)	Entropy 0.62329 (0.62374)	Top-1 acc 55.469 (60.891)	Top-5 acc 77.734 (81.856)	lr 0.01124
Train [64][2800/3239]	Time 0.287 (0.877)	Data Time 0.001 (0.385)	Loss 2.6838 (2.6169)	Entropy 0.62276 (0.62374)	Top-1 acc 56.250 (60.891)	Top-5 acc 78.516 (81.854)	lr 0.01124
Train [64][2810/3239]	Time 0.233 (0.875)	Data Time 0.001 (0.383)	Loss 2.8012 (2.6172)	Entropy 0.62246 (0.62374)	Top-1 acc 56.641 (60.888)	Top-5 acc 78.125 (81.850)	lr 0.01124
Train [64][2820/3239]	Time 0.236 (0.878)	Data Time 0.001 (0.386)	Loss 2.7249 (2.6171)	Entropy 0.62250 (0.62373)	Top-1 acc 57.422 (60.893)	Top-5 acc 80.859 (81.852)	lr 0.01124
Train [64][2830/3239]	Time 0.337 (0.891)	Data Time 0.006 (0.385)	Loss 2.3489 (2.6169)	Entropy 0.62260 (0.62373)	Top-1 acc 67.578 (60.895)	Top-5 acc 89.062 (81.860)	lr 0.01123
Train [64][2840/3239]	Time 0.256 (0.890)	Data Time 0.002 (0.384)	Loss 2.7320 (2.6173)	Entropy 0.62267 (0.62372)	Top-1 acc 57.422 (60.888)	Top-5 acc 80.469 (81.856)	lr 0.01123
Train [64][2850/3239]	Time 0.241 (0.888)	Data Time 0.001 (0.383)	Loss 2.5703 (2.6174)	Entropy 0.62262 (0.62372)	Top-1 acc 61.719 (60.885)	Top-5 acc 81.641 (81.855)	lr 0.01123
Train [64][2860/3239]	Time 0.266 (0.887)	Data Time 0.002 (0.381)	Loss 2.6839 (2.6175)	Entropy 0.62262 (0.62372)	Top-1 acc 56.250 (60.883)	Top-5 acc 82.031 (81.850)	lr 0.01123
Train [64][2870/3239]	Time 0.237 (0.885)	Data Time 0.001 (0.380)	Loss 2.5855 (2.6176)	Entropy 0.62285 (0.62371)	Top-1 acc 62.891 (60.880)	Top-5 acc 81.250 (81.846)	lr 0.01123
Train [64][2880/3239]	Time 0.354 (0.883)	Data Time 0.002 (0.379)	Loss 2.5290 (2.6176)	Entropy 0.62277 (0.62371)	Top-1 acc 62.891 (60.879)	Top-5 acc 84.766 (81.845)	lr 0.01123
Train [64][2890/3239]	Time 0.253 (0.884)	Data Time 0.001 (0.380)	Loss 2.4875 (2.6173)	Entropy 0.62275 (0.62371)	Top-1 acc 66.016 (60.885)	Top-5 acc 85.156 (81.849)	lr 0.01123
Train [64][2900/3239]	Time 0.250 (0.886)	Data Time 0.001 (0.382)	Loss 2.4236 (2.6173)	Entropy 0.62281 (0.62370)	Top-1 acc 69.531 (60.888)	Top-5 acc 85.938 (81.851)	lr 0.01123
Train [64][2910/3239]	Time 0.266 (0.884)	Data Time 0.001 (0.380)	Loss 2.5707 (2.6173)	Entropy 0.62287 (0.62370)	Top-1 acc 57.812 (60.889)	Top-5 acc 83.594 (81.851)	lr 0.01123
Train [64][2920/3239]	Time 0.259 (0.888)	Data Time 0.001 (0.385)	Loss 2.5458 (2.6170)	Entropy 0.62340 (0.62370)	Top-1 acc 64.844 (60.897)	Top-5 acc 81.250 (81.853)	lr 0.01123
Train [64][2930/3239]	Time 0.241 (0.890)	Data Time 0.001 (0.387)	Loss 2.6698 (2.6170)	Entropy 0.62317 (0.62370)	Top-1 acc 57.812 (60.896)	Top-5 acc 80.469 (81.853)	lr 0.01122
Train [64][2940/3239]	Time 0.260 (0.889)	Data Time 0.001 (0.386)	Loss 2.7310 (2.6171)	Entropy 0.62253 (0.62369)	Top-1 acc 61.328 (60.895)	Top-5 acc 80.469 (81.855)	lr 0.01122
Train [64][2950/3239]	Time 0.245 (0.891)	Data Time 0.001 (0.388)	Loss 2.4644 (2.6170)	Entropy 0.62249 (0.62369)	Top-1 acc 64.062 (60.900)	Top-5 acc 83.594 (81.857)	lr 0.01122
Train [64][2960/3239]	Time 0.258 (0.892)	Data Time 0.001 (0.389)	Loss 2.5815 (2.6171)	Entropy 0.62238 (0.62369)	Top-1 acc 60.938 (60.896)	Top-5 acc 82.031 (81.854)	lr 0.01122
Train [64][2970/3239]	Time 0.238 (0.891)	Data Time 0.001 (0.388)	Loss 2.9135 (2.6173)	Entropy 0.62222 (0.62368)	Top-1 acc 54.297 (60.893)	Top-5 acc 75.000 (81.850)	lr 0.01122
Train [64][2980/3239]	Time 0.251 (0.890)	Data Time 0.002 (0.387)	Loss 2.6598 (2.6174)	Entropy 0.62220 (0.62368)	Top-1 acc 60.547 (60.889)	Top-5 acc 80.078 (81.849)	lr 0.01122
Train [64][2990/3239]	Time 5.028 (0.891)	Data Time 4.776 (0.389)	Loss 2.6855 (2.6176)	Entropy 0.62235 (0.62367)	Top-1 acc 60.547 (60.883)	Top-5 acc 81.641 (81.843)	lr 0.01122
Train [64][3000/3239]	Time 0.293 (0.890)	Data Time 0.001 (0.388)	Loss 2.7899 (2.6177)	Entropy 0.62232 (0.62367)	Top-1 acc 55.469 (60.883)	Top-5 acc 78.906 (81.841)	lr 0.01122
Train [64][3010/3239]	Time 0.247 (0.888)	Data Time 0.001 (0.386)	Loss 2.3473 (2.6174)	Entropy 0.62230 (0.62366)	Top-1 acc 69.141 (60.892)	Top-5 acc 87.500 (81.845)	lr 0.01122
Train [64][3020/3239]	Time 0.260 (0.890)	Data Time 0.002 (0.389)	Loss 2.6061 (2.6174)	Entropy 0.62228 (0.62366)	Top-1 acc 61.328 (60.894)	Top-5 acc 82.422 (81.845)	lr 0.01122
Train [64][3030/3239]	Time 0.236 (0.894)	Data Time 0.001 (0.392)	Loss 2.6186 (2.6174)	Entropy 0.62262 (0.62365)	Top-1 acc 60.938 (60.896)	Top-5 acc 82.812 (81.843)	lr 0.01121
Train [64][3040/3239]	Time 0.367 (0.892)	Data Time 0.001 (0.391)	Loss 2.4327 (2.6172)	Entropy 0.62257 (0.62365)	Top-1 acc 64.844 (60.898)	Top-5 acc 85.547 (81.846)	lr 0.01121
Train [64][3050/3239]	Time 0.234 (0.895)	Data Time 0.001 (0.394)	Loss 2.5621 (2.6172)	Entropy 0.62249 (0.62365)	Top-1 acc 61.719 (60.900)	Top-5 acc 82.031 (81.848)	lr 0.01121
Train [64][3060/3239]	Time 0.242 (0.898)	Data Time 0.001 (0.397)	Loss 2.5918 (2.6173)	Entropy 0.62255 (0.62364)	Top-1 acc 60.156 (60.893)	Top-5 acc 83.203 (81.848)	lr 0.01121
Train [64][3070/3239]	Time 0.228 (0.896)	Data Time 0.001 (0.396)	Loss 2.5316 (2.6171)	Entropy 0.62233 (0.62364)	Top-1 acc 60.547 (60.895)	Top-5 acc 83.203 (81.851)	lr 0.01121
Train [64][3080/3239]	Time 0.232 (0.897)	Data Time 0.001 (0.397)	Loss 2.5444 (2.6171)	Entropy 0.62235 (0.62363)	Top-1 acc 64.062 (60.898)	Top-5 acc 82.422 (81.849)	lr 0.01121
Train [64][3090/3239]	Time 0.226 (0.901)	Data Time 0.001 (0.401)	Loss 2.7378 (2.6172)	Entropy 0.62201 (0.62363)	Top-1 acc 55.078 (60.894)	Top-5 acc 79.297 (81.846)	lr 0.01121
Train [64][3100/3239]	Time 0.245 (0.899)	Data Time 0.001 (0.400)	Loss 2.4875 (2.6170)	Entropy 0.62192 (0.62362)	Top-1 acc 69.922 (60.896)	Top-5 acc 83.203 (81.848)	lr 0.01121
Train [64][3110/3239]	Time 0.323 (0.898)	Data Time 0.001 (0.399)	Loss 2.4646 (2.6169)	Entropy 0.62194 (0.62362)	Top-1 acc 65.625 (60.898)	Top-5 acc 83.594 (81.849)	lr 0.01121
Train [64][3120/3239]	Time 0.233 (0.905)	Data Time 0.001 (0.405)	Loss 2.7538 (2.6171)	Entropy 0.62203 (0.62361)	Top-1 acc 55.859 (60.893)	Top-5 acc 80.078 (81.845)	lr 0.01121
Train [64][3130/3239]	Time 0.239 (0.903)	Data Time 0.001 (0.404)	Loss 2.6214 (2.6170)	Entropy 0.62221 (0.62361)	Top-1 acc 58.203 (60.893)	Top-5 acc 83.203 (81.847)	lr 0.01120
Train [64][3140/3239]	Time 0.259 (0.901)	Data Time 0.001 (0.403)	Loss 2.6847 (2.6171)	Entropy 0.62220 (0.62360)	Top-1 acc 57.812 (60.889)	Top-5 acc 79.688 (81.849)	lr 0.01120
Train [64][3150/3239]	Time 7.421 (0.904)	Data Time 7.190 (0.405)	Loss 2.6107 (2.6169)	Entropy 0.62173 (0.62360)	Top-1 acc 60.938 (60.892)	Top-5 acc 80.078 (81.851)	lr 0.01120
Train [64][3160/3239]	Time 0.279 (0.902)	Data Time 0.001 (0.404)	Loss 2.5174 (2.6170)	Entropy 0.62164 (0.62359)	Top-1 acc 60.938 (60.889)	Top-5 acc 80.078 (81.845)	lr 0.01120
Train [64][3170/3239]	Time 0.234 (0.901)	Data Time 0.001 (0.403)	Loss 2.5984 (2.6172)	Entropy 0.62180 (0.62359)	Top-1 acc 60.938 (60.882)	Top-5 acc 79.688 (81.840)	lr 0.01120
Train [64][3180/3239]	Time 0.268 (0.901)	Data Time 0.000 (0.403)	Loss 2.4887 (2.6172)	Entropy 0.62185 (0.62358)	Top-1 acc 64.453 (60.882)	Top-5 acc 86.328 (81.843)	lr 0.01120
Train [64][3190/3239]	Time 0.228 (0.902)	Data Time 0.000 (0.404)	Loss 2.5002 (2.6170)	Entropy 0.62163 (0.62358)	Top-1 acc 62.891 (60.889)	Top-5 acc 83.203 (81.846)	lr 0.01120
Train [64][3200/3239]	Time 0.337 (0.900)	Data Time 0.000 (0.403)	Loss 2.8735 (2.6171)	Entropy 0.62165 (0.62357)	Top-1 acc 55.859 (60.890)	Top-5 acc 76.562 (81.845)	lr 0.01120
Train [64][3210/3239]	Time 0.242 (0.900)	Data Time 0.000 (0.403)	Loss 2.6254 (2.6173)	Entropy 0.62205 (0.62356)	Top-1 acc 61.328 (60.884)	Top-5 acc 82.031 (81.839)	lr 0.01120
Train [64][3220/3239]	Time 0.223 (0.899)	Data Time 0.000 (0.403)	Loss 2.9084 (2.6175)	Entropy 0.62177 (0.62356)	Top-1 acc 53.906 (60.880)	Top-5 acc 76.172 (81.837)	lr 0.01120
Train [64][3230/3239]	Time 0.229 (0.898)	Data Time 0.000 (0.401)	Loss 2.8579 (2.6177)	Entropy 0.62166 (0.62355)	Top-1 acc 58.594 (60.876)	Top-5 acc 76.953 (81.834)	lr 0.01119
Train [64][3239/3239]	Time 0.916 (0.896)	Data Time 0.000 (0.400)	Loss 2.5886 (2.6178)	Entropy 0.62147 (0.62355)	Top-1 acc 62.963 (60.874)	Top-5 acc 80.247 (81.830)	lr 0.01119
==========Valid [64/120]	loss 1.362	top-1 acc 68.487 (68.487)	top-5 acc 87.985	Train top-1 60.874	top-5 81.830	Entropy 0.62147	Latency-None: 0.000ms	Flops: 539.91M
Train [65][0/3239]	Time 35.950 (35.950)	Data Time 34.481 (34.481)	Loss 2.6913 (2.6913)	Entropy 0.62134 (0.62134)	Top-1 acc 59.766 (59.766)	Top-5 acc 79.297 (79.297)	lr 0.01119
Train [65][10/3239]	Time 0.274 (3.779)	Data Time 0.002 (3.204)	Loss 2.5070 (2.6090)	Entropy 0.62139 (0.62141)	Top-1 acc 60.547 (60.440)	Top-5 acc 83.984 (81.250)	lr 0.01119
Train [65][20/3239]	Time 0.276 (2.226)	Data Time 0.029 (1.681)	Loss 2.6622 (2.6097)	Entropy 0.62146 (0.62145)	Top-1 acc 61.719 (61.068)	Top-5 acc 81.250 (81.901)	lr 0.01119
Train [65][30/3239]	Time 0.276 (1.656)	Data Time 0.001 (1.139)	Loss 2.7086 (2.5907)	Entropy 0.62147 (0.62142)	Top-1 acc 59.766 (61.240)	Top-5 acc 79.688 (82.308)	lr 0.01119
Train [65][40/3239]	Time 0.274 (1.364)	Data Time 0.002 (0.862)	Loss 2.3980 (2.5917)	Entropy 0.62147 (0.62144)	Top-1 acc 64.062 (61.166)	Top-5 acc 86.719 (82.384)	lr 0.01119
Train [65][50/3239]	Time 0.292 (1.183)	Data Time 0.003 (0.693)	Loss 2.5501 (2.6060)	Entropy 0.62133 (0.62146)	Top-1 acc 64.453 (61.068)	Top-5 acc 82.422 (82.039)	lr 0.01119
Train [65][60/3239]	Time 0.259 (1.067)	Data Time 0.001 (0.580)	Loss 2.5738 (2.6007)	Entropy 0.62054 (0.62142)	Top-1 acc 60.938 (61.219)	Top-5 acc 80.859 (82.102)	lr 0.01119
Train [65][70/3239]	Time 0.280 (0.978)	Data Time 0.001 (0.498)	Loss 2.6069 (2.5924)	Entropy 0.62062 (0.62129)	Top-1 acc 57.812 (61.427)	Top-5 acc 81.641 (82.295)	lr 0.01119
Train [65][80/3239]	Time 0.276 (0.913)	Data Time 0.002 (0.437)	Loss 2.5469 (2.5940)	Entropy 0.62056 (0.62121)	Top-1 acc 63.672 (61.372)	Top-5 acc 83.984 (82.268)	lr 0.01119
Train [65][90/3239]	Time 0.241 (0.862)	Data Time 0.001 (0.389)	Loss 2.6619 (2.5984)	Entropy 0.62052 (0.62112)	Top-1 acc 58.203 (61.268)	Top-5 acc 79.297 (82.169)	lr 0.01118
Train [65][100/3239]	Time 0.336 (0.821)	Data Time 0.001 (0.351)	Loss 2.6895 (2.5972)	Entropy 0.62062 (0.62106)	Top-1 acc 58.203 (61.228)	Top-5 acc 79.297 (82.159)	lr 0.01118
Train [65][110/3239]	Time 0.280 (0.788)	Data Time 0.001 (0.319)	Loss 2.6886 (2.5982)	Entropy 0.62058 (0.62102)	Top-1 acc 60.547 (61.296)	Top-5 acc 80.859 (82.105)	lr 0.01118
Train [65][120/3239]	Time 0.253 (0.760)	Data Time 0.002 (0.293)	Loss 2.6591 (2.6017)	Entropy 0.62041 (0.62098)	Top-1 acc 59.766 (61.218)	Top-5 acc 80.078 (82.076)	lr 0.01118
Train [65][130/3239]	Time 0.275 (0.738)	Data Time 0.001 (0.271)	Loss 2.8598 (2.6089)	Entropy 0.62069 (0.62094)	Top-1 acc 51.953 (61.075)	Top-5 acc 77.344 (81.930)	lr 0.01118
Train [65][140/3239]	Time 0.228 (0.716)	Data Time 0.001 (0.252)	Loss 2.7614 (2.6091)	Entropy 0.62093 (0.62092)	Top-1 acc 52.734 (61.021)	Top-5 acc 77.344 (81.912)	lr 0.01118
Train [65][150/3239]	Time 0.221 (0.700)	Data Time 0.001 (0.235)	Loss 2.6794 (2.6073)	Entropy 0.62072 (0.62092)	Top-1 acc 55.859 (61.033)	Top-5 acc 81.250 (81.980)	lr 0.01118
Train [65][160/3239]	Time 0.220 (0.682)	Data Time 0.001 (0.221)	Loss 2.8971 (2.6089)	Entropy 0.62050 (0.62091)	Top-1 acc 52.344 (60.988)	Top-5 acc 78.125 (81.934)	lr 0.01118
Train [65][170/3239]	Time 0.415 (0.670)	Data Time 0.001 (0.208)	Loss 2.5084 (2.6056)	Entropy 0.62057 (0.62089)	Top-1 acc 63.281 (61.150)	Top-5 acc 84.766 (81.990)	lr 0.01118
Train [65][180/3239]	Time 0.283 (0.658)	Data Time 0.001 (0.196)	Loss 2.7430 (2.6095)	Entropy 0.62050 (0.62087)	Top-1 acc 58.203 (61.067)	Top-5 acc 80.859 (81.923)	lr 0.01118
Train [65][190/3239]	Time 0.242 (0.646)	Data Time 0.001 (0.186)	Loss 2.5013 (2.6081)	Entropy 0.62065 (0.62085)	Top-1 acc 63.672 (61.113)	Top-5 acc 83.984 (81.964)	lr 0.01117
Train [65][200/3239]	Time 0.278 (0.638)	Data Time 0.001 (0.177)	Loss 2.5168 (2.6073)	Entropy 0.62074 (0.62084)	Top-1 acc 60.938 (61.130)	Top-5 acc 84.766 (81.996)	lr 0.01117
Train [65][210/3239]	Time 0.240 (0.628)	Data Time 0.001 (0.169)	Loss 2.6742 (2.6077)	Entropy 0.62085 (0.62083)	Top-1 acc 58.203 (61.119)	Top-5 acc 82.031 (81.978)	lr 0.01117
Train [65][220/3239]	Time 0.253 (0.619)	Data Time 0.001 (0.161)	Loss 2.5276 (2.6061)	Entropy 0.62086 (0.62083)	Top-1 acc 62.500 (61.167)	Top-5 acc 85.156 (82.026)	lr 0.01117
Train [65][230/3239]	Time 0.288 (0.611)	Data Time 0.001 (0.154)	Loss 2.5150 (2.6061)	Entropy 0.62097 (0.62083)	Top-1 acc 62.109 (61.167)	Top-5 acc 83.984 (82.028)	lr 0.01117
Train [65][240/3239]	Time 0.290 (0.605)	Data Time 0.002 (0.148)	Loss 2.3247 (2.6073)	Entropy 0.62105 (0.62084)	Top-1 acc 69.141 (61.202)	Top-5 acc 87.109 (81.996)	lr 0.01117
Train [65][250/3239]	Time 0.319 (0.786)	Data Time 0.002 (0.142)	Loss 2.7655 (2.6087)	Entropy 0.62088 (0.62085)	Top-1 acc 57.422 (61.191)	Top-5 acc 81.250 (81.989)	lr 0.01117
Train [65][260/3239]	Time 0.337 (0.773)	Data Time 0.002 (0.137)	Loss 2.5057 (2.6114)	Entropy 0.62100 (0.62085)	Top-1 acc 62.891 (61.105)	Top-5 acc 82.422 (81.912)	lr 0.01117
Train [65][270/3239]	Time 0.244 (0.761)	Data Time 0.001 (0.132)	Loss 2.7816 (2.6127)	Entropy 0.62112 (0.62086)	Top-1 acc 54.297 (61.102)	Top-5 acc 80.078 (81.896)	lr 0.01117
Train [65][280/3239]	Time 0.246 (0.751)	Data Time 0.001 (0.127)	Loss 2.5432 (2.6115)	Entropy 0.62107 (0.62087)	Top-1 acc 63.672 (61.093)	Top-5 acc 82.812 (81.924)	lr 0.01117
Train [65][290/3239]	Time 0.258 (0.743)	Data Time 0.001 (0.123)	Loss 2.6008 (2.6109)	Entropy 0.62102 (0.62088)	Top-1 acc 60.156 (61.123)	Top-5 acc 82.422 (81.956)	lr 0.01116
Train [65][300/3239]	Time 0.231 (0.733)	Data Time 0.001 (0.119)	Loss 2.5040 (2.6084)	Entropy 0.62064 (0.62087)	Top-1 acc 64.844 (61.178)	Top-5 acc 83.984 (81.983)	lr 0.01116
Train [65][310/3239]	Time 0.291 (0.724)	Data Time 0.001 (0.115)	Loss 2.7221 (2.6074)	Entropy 0.62061 (0.62087)	Top-1 acc 58.203 (61.179)	Top-5 acc 79.688 (82.022)	lr 0.01116
Train [65][320/3239]	Time 0.245 (0.717)	Data Time 0.001 (0.112)	Loss 2.6454 (2.6074)	Entropy 0.62059 (0.62086)	Top-1 acc 58.984 (61.183)	Top-5 acc 80.469 (82.008)	lr 0.01116
Train [65][330/3239]	Time 0.341 (0.709)	Data Time 0.001 (0.108)	Loss 2.4282 (2.6057)	Entropy 0.62035 (0.62085)	Top-1 acc 67.578 (61.243)	Top-5 acc 85.547 (82.049)	lr 0.01116
Train [65][340/3239]	Time 0.261 (0.702)	Data Time 0.001 (0.105)	Loss 2.6483 (2.6054)	Entropy 0.62017 (0.62084)	Top-1 acc 56.641 (61.227)	Top-5 acc 81.250 (82.056)	lr 0.01116
Train [65][350/3239]	Time 0.259 (0.695)	Data Time 0.001 (0.102)	Loss 2.4621 (2.6043)	Entropy 0.62000 (0.62082)	Top-1 acc 65.234 (61.237)	Top-5 acc 83.984 (82.096)	lr 0.01116
Train [65][360/3239]	Time 0.256 (0.689)	Data Time 0.001 (0.100)	Loss 2.9123 (2.6051)	Entropy 0.62012 (0.62079)	Top-1 acc 55.078 (61.223)	Top-5 acc 75.781 (82.073)	lr 0.01116
Train [65][370/3239]	Time 0.247 (0.683)	Data Time 0.001 (0.097)	Loss 2.8449 (2.6065)	Entropy 0.61988 (0.62077)	Top-1 acc 55.469 (61.181)	Top-5 acc 76.562 (82.066)	lr 0.01116
Train [65][380/3239]	Time 0.256 (0.677)	Data Time 0.001 (0.094)	Loss 2.5779 (2.6054)	Entropy 0.61987 (0.62075)	Top-1 acc 61.328 (61.206)	Top-5 acc 83.203 (82.087)	lr 0.01116
Train [65][390/3239]	Time 0.245 (0.671)	Data Time 0.001 (0.092)	Loss 2.5495 (2.6042)	Entropy 0.61975 (0.62072)	Top-1 acc 60.938 (61.215)	Top-5 acc 81.641 (82.107)	lr 0.01115
Train [65][400/3239]	Time 0.265 (0.666)	Data Time 0.001 (0.090)	Loss 2.6825 (2.6048)	Entropy 0.61994 (0.62070)	Top-1 acc 58.594 (61.206)	Top-5 acc 83.203 (82.113)	lr 0.01115
Train [65][410/3239]	Time 0.260 (0.661)	Data Time 0.001 (0.088)	Loss 2.5823 (2.6041)	Entropy 0.61973 (0.62068)	Top-1 acc 60.547 (61.207)	Top-5 acc 82.812 (82.138)	lr 0.01115
Train [65][420/3239]	Time 0.377 (0.657)	Data Time 0.001 (0.086)	Loss 2.5785 (2.6044)	Entropy 0.61992 (0.62066)	Top-1 acc 63.672 (61.211)	Top-5 acc 84.375 (82.132)	lr 0.01115
Train [65][430/3239]	Time 0.242 (0.653)	Data Time 0.001 (0.084)	Loss 2.4463 (2.6035)	Entropy 0.62005 (0.62064)	Top-1 acc 67.578 (61.244)	Top-5 acc 82.422 (82.131)	lr 0.01115
Train [65][440/3239]	Time 0.300 (0.649)	Data Time 0.004 (0.082)	Loss 2.8245 (2.6037)	Entropy 0.62017 (0.62063)	Top-1 acc 56.641 (61.224)	Top-5 acc 78.125 (82.126)	lr 0.01115
Train [65][450/3239]	Time 0.268 (0.646)	Data Time 0.001 (0.080)	Loss 2.5072 (2.6051)	Entropy 0.62009 (0.62062)	Top-1 acc 59.375 (61.169)	Top-5 acc 83.203 (82.103)	lr 0.01115
Train [65][460/3239]	Time 0.319 (0.642)	Data Time 0.003 (0.078)	Loss 2.4824 (2.6061)	Entropy 0.61987 (0.62061)	Top-1 acc 62.891 (61.147)	Top-5 acc 85.547 (82.089)	lr 0.01115
Train [65][470/3239]	Time 0.248 (0.638)	Data Time 0.001 (0.077)	Loss 2.9808 (2.6083)	Entropy 0.62000 (0.62059)	Top-1 acc 53.125 (61.093)	Top-5 acc 76.562 (82.069)	lr 0.01115
Train [65][480/3239]	Time 0.240 (0.634)	Data Time 0.001 (0.075)	Loss 2.7206 (2.6085)	Entropy 0.61979 (0.62058)	Top-1 acc 58.594 (61.102)	Top-5 acc 79.688 (82.065)	lr 0.01115
Train [65][490/3239]	Time 0.374 (0.631)	Data Time 0.001 (0.074)	Loss 2.7533 (2.6082)	Entropy 0.61974 (0.62056)	Top-1 acc 59.375 (61.120)	Top-5 acc 80.469 (82.057)	lr 0.01114
Train [65][500/3239]	Time 0.255 (0.628)	Data Time 0.001 (0.072)	Loss 2.5412 (2.6081)	Entropy 0.61993 (0.62054)	Top-1 acc 62.109 (61.128)	Top-5 acc 84.375 (82.053)	lr 0.01114
Train [65][510/3239]	Time 0.280 (0.625)	Data Time 0.001 (0.071)	Loss 2.3847 (2.6084)	Entropy 0.62005 (0.62053)	Top-1 acc 66.016 (61.131)	Top-5 acc 87.891 (82.055)	lr 0.01114
Train [65][520/3239]	Time 0.244 (0.622)	Data Time 0.001 (0.070)	Loss 2.6969 (2.6085)	Entropy 0.61970 (0.62052)	Top-1 acc 58.984 (61.124)	Top-5 acc 81.641 (82.060)	lr 0.01114
Train [65][530/3239]	Time 0.238 (0.619)	Data Time 0.001 (0.068)	Loss 2.5845 (2.6084)	Entropy 0.61982 (0.62051)	Top-1 acc 62.500 (61.131)	Top-5 acc 82.031 (82.060)	lr 0.01114
Train [65][540/3239]	Time 0.265 (0.616)	Data Time 0.001 (0.067)	Loss 2.5549 (2.6090)	Entropy 0.61977 (0.62050)	Top-1 acc 64.062 (61.125)	Top-5 acc 83.203 (82.046)	lr 0.01114
Train [65][550/3239]	Time 0.251 (0.614)	Data Time 0.001 (0.066)	Loss 2.4636 (2.6086)	Entropy 0.62014 (0.62049)	Top-1 acc 66.016 (61.130)	Top-5 acc 82.812 (82.046)	lr 0.01114
Train [65][560/3239]	Time 0.249 (0.612)	Data Time 0.002 (0.065)	Loss 2.6532 (2.6087)	Entropy 0.62034 (0.62048)	Top-1 acc 60.547 (61.142)	Top-5 acc 80.469 (82.042)	lr 0.01114
Train [65][570/3239]	Time 0.295 (0.609)	Data Time 0.001 (0.064)	Loss 2.6060 (2.6073)	Entropy 0.62042 (0.62048)	Top-1 acc 63.672 (61.176)	Top-5 acc 81.250 (82.058)	lr 0.01114
Train [65][580/3239]	Time 0.285 (0.607)	Data Time 0.001 (0.063)	Loss 2.8102 (2.6075)	Entropy 0.61998 (0.62047)	Top-1 acc 53.906 (61.171)	Top-5 acc 80.078 (82.062)	lr 0.01114
Train [65][590/3239]	Time 0.230 (0.604)	Data Time 0.001 (0.062)	Loss 2.6364 (2.6081)	Entropy 0.62022 (0.62047)	Top-1 acc 62.500 (61.140)	Top-5 acc 81.641 (82.056)	lr 0.01113
Train [65][600/3239]	Time 0.242 (0.601)	Data Time 0.001 (0.061)	Loss 2.7984 (2.6081)	Entropy 0.62029 (0.62046)	Top-1 acc 53.125 (61.137)	Top-5 acc 79.297 (82.053)	lr 0.01113
Train [65][610/3239]	Time 0.261 (0.599)	Data Time 0.001 (0.060)	Loss 2.5588 (2.6076)	Entropy 0.62015 (0.62046)	Top-1 acc 63.281 (61.146)	Top-5 acc 81.641 (82.059)	lr 0.01113
Train [65][620/3239]	Time 0.255 (0.597)	Data Time 0.001 (0.059)	Loss 2.5796 (2.6089)	Entropy 0.61983 (0.62045)	Top-1 acc 61.719 (61.122)	Top-5 acc 82.812 (82.042)	lr 0.01113
Train [65][630/3239]	Time 0.240 (0.595)	Data Time 0.001 (0.058)	Loss 2.6305 (2.6092)	Entropy 0.61991 (0.62044)	Top-1 acc 60.156 (61.111)	Top-5 acc 82.422 (82.034)	lr 0.01113
Train [65][640/3239]	Time 0.255 (0.592)	Data Time 0.001 (0.057)	Loss 2.7408 (2.6085)	Entropy 0.61969 (0.62043)	Top-1 acc 56.250 (61.115)	Top-5 acc 78.516 (82.044)	lr 0.01113
Train [65][650/3239]	Time 0.364 (0.590)	Data Time 0.001 (0.056)	Loss 2.5025 (2.6085)	Entropy 0.61936 (0.62042)	Top-1 acc 64.453 (61.106)	Top-5 acc 83.984 (82.044)	lr 0.01113
Train [65][660/3239]	Time 0.292 (0.588)	Data Time 0.003 (0.055)	Loss 2.5559 (2.6088)	Entropy 0.61910 (0.62041)	Top-1 acc 60.938 (61.119)	Top-5 acc 82.031 (82.027)	lr 0.01113
Train [65][670/3239]	Time 0.262 (0.586)	Data Time 0.001 (0.054)	Loss 2.6327 (2.6096)	Entropy 0.61939 (0.62039)	Top-1 acc 62.109 (61.102)	Top-5 acc 78.906 (82.007)	lr 0.01113
Train [65][680/3239]	Time 0.253 (0.585)	Data Time 0.001 (0.054)	Loss 2.6885 (2.6095)	Entropy 0.61953 (0.62037)	Top-1 acc 60.547 (61.103)	Top-5 acc 80.078 (82.020)	lr 0.01113
Train [65][690/3239]	Time 0.269 (0.583)	Data Time 0.001 (0.053)	Loss 2.6210 (2.6095)	Entropy 0.61949 (0.62036)	Top-1 acc 61.719 (61.085)	Top-5 acc 82.031 (82.021)	lr 0.01112
Train [65][700/3239]	Time 0.288 (0.581)	Data Time 0.001 (0.052)	Loss 2.6316 (2.6098)	Entropy 0.61953 (0.62035)	Top-1 acc 62.500 (61.091)	Top-5 acc 81.250 (82.001)	lr 0.01112
Train [65][710/3239]	Time 0.277 (0.580)	Data Time 0.002 (0.051)	Loss 2.5442 (2.6097)	Entropy 0.61951 (0.62034)	Top-1 acc 65.625 (61.092)	Top-5 acc 82.031 (82.004)	lr 0.01112
Train [65][720/3239]	Time 0.409 (0.578)	Data Time 0.001 (0.051)	Loss 2.7125 (2.6104)	Entropy 0.61956 (0.62033)	Top-1 acc 56.250 (61.073)	Top-5 acc 81.250 (81.986)	lr 0.01112
Train [65][730/3239]	Time 0.304 (0.576)	Data Time 0.001 (0.050)	Loss 2.5293 (2.6098)	Entropy 0.61932 (0.62032)	Top-1 acc 61.719 (61.095)	Top-5 acc 85.938 (81.992)	lr 0.01112
Train [65][740/3239]	Time 0.294 (0.575)	Data Time 0.003 (0.049)	Loss 2.4884 (2.6096)	Entropy 0.61968 (0.62030)	Top-1 acc 60.547 (61.088)	Top-5 acc 84.375 (81.996)	lr 0.01112
Train [65][750/3239]	Time 0.245 (0.573)	Data Time 0.001 (0.049)	Loss 2.5990 (2.6097)	Entropy 0.61946 (0.62029)	Top-1 acc 60.938 (61.092)	Top-5 acc 82.422 (81.990)	lr 0.01112
Train [65][760/3239]	Time 0.309 (0.572)	Data Time 0.002 (0.048)	Loss 2.5471 (2.6091)	Entropy 0.61949 (0.62028)	Top-1 acc 64.453 (61.106)	Top-5 acc 85.156 (82.008)	lr 0.01112
Train [65][770/3239]	Time 0.234 (0.571)	Data Time 0.001 (0.048)	Loss 2.8422 (2.6097)	Entropy 0.61926 (0.62027)	Top-1 acc 57.812 (61.099)	Top-5 acc 77.344 (81.998)	lr 0.01112
Train [65][780/3239]	Time 0.253 (0.569)	Data Time 0.001 (0.047)	Loss 2.4471 (2.6093)	Entropy 0.61883 (0.62026)	Top-1 acc 65.625 (61.099)	Top-5 acc 85.938 (82.006)	lr 0.01112
Train [65][790/3239]	Time 0.327 (0.568)	Data Time 0.002 (0.046)	Loss 2.5325 (2.6090)	Entropy 0.61893 (0.62024)	Top-1 acc 63.672 (61.099)	Top-5 acc 80.078 (82.014)	lr 0.01111
Train [65][800/3239]	Time 0.250 (0.566)	Data Time 0.001 (0.046)	Loss 2.3389 (2.6090)	Entropy 0.61872 (0.62022)	Top-1 acc 67.969 (61.107)	Top-5 acc 85.938 (82.003)	lr 0.01111
Train [65][810/3239]	Time 0.355 (0.565)	Data Time 0.001 (0.045)	Loss 2.3743 (2.6086)	Entropy 0.61885 (0.62020)	Top-1 acc 67.578 (61.114)	Top-5 acc 86.328 (82.011)	lr 0.01111
Train [65][820/3239]	Time 0.262 (0.564)	Data Time 0.001 (0.045)	Loss 2.6403 (2.6086)	Entropy 0.61883 (0.62019)	Top-1 acc 57.422 (61.110)	Top-5 acc 81.250 (82.010)	lr 0.01111
Train [65][830/3239]	Time 0.249 (0.563)	Data Time 0.002 (0.044)	Loss 2.5365 (2.6083)	Entropy 0.61840 (0.62017)	Top-1 acc 60.547 (61.121)	Top-5 acc 81.641 (82.004)	lr 0.01111
Train [65][840/3239]	Time 0.253 (0.562)	Data Time 0.001 (0.044)	Loss 2.7898 (2.6087)	Entropy 0.61815 (0.62015)	Top-1 acc 55.859 (61.126)	Top-5 acc 78.906 (81.998)	lr 0.01111
Train [65][850/3239]	Time 0.241 (0.560)	Data Time 0.001 (0.043)	Loss 2.6176 (2.6087)	Entropy 0.61809 (0.62013)	Top-1 acc 59.766 (61.128)	Top-5 acc 81.250 (81.996)	lr 0.01111
Train [65][860/3239]	Time 0.252 (0.559)	Data Time 0.001 (0.043)	Loss 2.7503 (2.6089)	Entropy 0.61821 (0.62010)	Top-1 acc 58.594 (61.121)	Top-5 acc 80.078 (81.995)	lr 0.01111
Train [65][870/3239]	Time 0.254 (0.558)	Data Time 0.001 (0.042)	Loss 2.8487 (2.6090)	Entropy 0.61827 (0.62008)	Top-1 acc 57.812 (61.119)	Top-5 acc 77.344 (81.996)	lr 0.01111
Train [65][880/3239]	Time 0.340 (0.557)	Data Time 0.002 (0.042)	Loss 2.6197 (2.6091)	Entropy 0.61839 (0.62006)	Top-1 acc 60.547 (61.112)	Top-5 acc 81.250 (81.992)	lr 0.01111
Train [65][890/3239]	Time 0.262 (0.556)	Data Time 0.002 (0.041)	Loss 2.4102 (2.6084)	Entropy 0.61863 (0.62004)	Top-1 acc 67.969 (61.129)	Top-5 acc 83.984 (81.999)	lr 0.01110
Train [65][900/3239]	Time 0.439 (0.598)	Data Time 0.006 (0.041)	Loss 2.6743 (2.6088)	Entropy 0.61866 (0.62003)	Top-1 acc 55.859 (61.125)	Top-5 acc 82.031 (81.986)	lr 0.01110
Train [65][910/3239]	Time 0.251 (0.598)	Data Time 0.002 (0.041)	Loss 2.5773 (2.6087)	Entropy 0.61892 (0.62001)	Top-1 acc 61.719 (61.132)	Top-5 acc 83.594 (81.990)	lr 0.01110
Train [65][920/3239]	Time 0.250 (0.596)	Data Time 0.002 (0.040)	Loss 2.7553 (2.6089)	Entropy 0.61876 (0.62000)	Top-1 acc 60.156 (61.127)	Top-5 acc 78.125 (81.986)	lr 0.01110
Train [65][930/3239]	Time 0.241 (0.594)	Data Time 0.001 (0.040)	Loss 2.6901 (2.6096)	Entropy 0.61869 (0.61999)	Top-1 acc 60.156 (61.110)	Top-5 acc 79.297 (81.969)	lr 0.01110
Train [65][940/3239]	Time 0.256 (0.592)	Data Time 0.002 (0.039)	Loss 2.7361 (2.6100)	Entropy 0.61837 (0.61997)	Top-1 acc 61.328 (61.107)	Top-5 acc 78.516 (81.965)	lr 0.01110
Train [65][950/3239]	Time 0.269 (0.591)	Data Time 0.001 (0.039)	Loss 2.6298 (2.6098)	Entropy 0.61807 (0.61995)	Top-1 acc 59.375 (61.110)	Top-5 acc 81.641 (81.969)	lr 0.01110
Train [65][960/3239]	Time 0.279 (0.590)	Data Time 0.002 (0.039)	Loss 2.4983 (2.6094)	Entropy 0.61765 (0.61993)	Top-1 acc 62.109 (61.116)	Top-5 acc 82.812 (81.980)	lr 0.01110
Train [65][970/3239]	Time 0.405 (0.588)	Data Time 0.001 (0.038)	Loss 2.6952 (2.6096)	Entropy 0.61762 (0.61991)	Top-1 acc 63.672 (61.115)	Top-5 acc 81.641 (81.979)	lr 0.01110
Train [65][980/3239]	Time 0.251 (0.587)	Data Time 0.001 (0.038)	Loss 2.5844 (2.6093)	Entropy 0.61774 (0.61989)	Top-1 acc 61.328 (61.116)	Top-5 acc 83.203 (81.984)	lr 0.01109
Train [65][990/3239]	Time 0.302 (0.586)	Data Time 0.001 (0.037)	Loss 2.4826 (2.6098)	Entropy 0.61772 (0.61986)	Top-1 acc 64.453 (61.116)	Top-5 acc 82.812 (81.978)	lr 0.01109
Train [65][1000/3239]	Time 0.242 (0.584)	Data Time 0.001 (0.037)	Loss 2.4106 (2.6092)	Entropy 0.61799 (0.61984)	Top-1 acc 66.797 (61.126)	Top-5 acc 87.109 (81.997)	lr 0.01109
Train [65][1010/3239]	Time 0.296 (0.583)	Data Time 0.002 (0.037)	Loss 2.4874 (2.6095)	Entropy 0.61821 (0.61983)	Top-1 acc 62.109 (61.114)	Top-5 acc 85.156 (81.996)	lr 0.01109
Train [65][1020/3239]	Time 0.246 (0.582)	Data Time 0.001 (0.036)	Loss 2.6171 (2.6100)	Entropy 0.61813 (0.61981)	Top-1 acc 59.766 (61.102)	Top-5 acc 80.078 (81.985)	lr 0.01109
Train [65][1030/3239]	Time 0.247 (0.581)	Data Time 0.001 (0.036)	Loss 2.6695 (2.6098)	Entropy 0.61802 (0.61979)	Top-1 acc 60.547 (61.114)	Top-5 acc 79.688 (81.985)	lr 0.01109
Train [65][1040/3239]	Time 0.371 (0.583)	Data Time 0.001 (0.039)	Loss 2.4332 (2.6099)	Entropy 0.61803 (0.61978)	Top-1 acc 67.969 (61.120)	Top-5 acc 82.812 (81.989)	lr 0.01109
Train [65][1050/3239]	Time 0.252 (0.582)	Data Time 0.003 (0.038)	Loss 2.7143 (2.6103)	Entropy 0.61794 (0.61976)	Top-1 acc 58.594 (61.123)	Top-5 acc 80.078 (81.979)	lr 0.01109
Train [65][1060/3239]	Time 0.246 (0.580)	Data Time 0.001 (0.038)	Loss 2.5579 (2.6098)	Entropy 0.61815 (0.61974)	Top-1 acc 62.500 (61.144)	Top-5 acc 82.422 (81.979)	lr 0.01109
Train [65][1070/3239]	Time 0.249 (0.587)	Data Time 0.001 (0.045)	Loss 2.5738 (2.6099)	Entropy 0.61836 (0.61973)	Top-1 acc 61.719 (61.132)	Top-5 acc 81.641 (81.982)	lr 0.01109
Train [65][1080/3239]	Time 0.265 (0.586)	Data Time 0.001 (0.045)	Loss 2.5534 (2.6104)	Entropy 0.61852 (0.61972)	Top-1 acc 61.719 (61.125)	Top-5 acc 83.203 (81.971)	lr 0.01108
Train [65][1090/3239]	Time 0.287 (0.585)	Data Time 0.002 (0.044)	Loss 2.6631 (2.6109)	Entropy 0.61880 (0.61971)	Top-1 acc 57.031 (61.109)	Top-5 acc 80.859 (81.960)	lr 0.01108
Train [65][1100/3239]	Time 0.245 (0.587)	Data Time 0.001 (0.048)	Loss 2.4888 (2.6110)	Entropy 0.61865 (0.61970)	Top-1 acc 62.500 (61.109)	Top-5 acc 84.766 (81.968)	lr 0.01108
Train [65][1110/3239]	Time 0.276 (0.586)	Data Time 0.001 (0.047)	Loss 2.2991 (2.6105)	Entropy 0.61882 (0.61969)	Top-1 acc 65.234 (61.115)	Top-5 acc 88.672 (81.973)	lr 0.01108
Train [65][1120/3239]	Time 0.257 (0.585)	Data Time 0.001 (0.047)	Loss 2.5980 (2.6108)	Entropy 0.61891 (0.61968)	Top-1 acc 62.109 (61.105)	Top-5 acc 80.078 (81.973)	lr 0.01108
Train [65][1130/3239]	Time 0.351 (0.584)	Data Time 0.002 (0.047)	Loss 2.5032 (2.6113)	Entropy 0.61899 (0.61967)	Top-1 acc 64.844 (61.090)	Top-5 acc 82.812 (81.960)	lr 0.01108
Train [65][1140/3239]	Time 0.245 (0.586)	Data Time 0.001 (0.049)	Loss 2.8150 (2.6114)	Entropy 0.61900 (0.61967)	Top-1 acc 57.422 (61.084)	Top-5 acc 76.953 (81.955)	lr 0.01108
Train [65][1150/3239]	Time 0.258 (0.585)	Data Time 0.001 (0.049)	Loss 2.6970 (2.6112)	Entropy 0.61870 (0.61966)	Top-1 acc 59.766 (61.078)	Top-5 acc 79.297 (81.949)	lr 0.01108
Train [65][1160/3239]	Time 0.249 (0.584)	Data Time 0.002 (0.048)	Loss 2.5170 (2.6107)	Entropy 0.61876 (0.61965)	Top-1 acc 62.500 (61.086)	Top-5 acc 82.422 (81.961)	lr 0.01108
Train [65][1170/3239]	Time 0.247 (0.584)	Data Time 0.001 (0.049)	Loss 2.5521 (2.6105)	Entropy 0.61848 (0.61965)	Top-1 acc 62.891 (61.092)	Top-5 acc 82.812 (81.964)	lr 0.01108
Train [65][1180/3239]	Time 0.325 (0.583)	Data Time 0.002 (0.049)	Loss 2.5347 (2.6104)	Entropy 0.61852 (0.61964)	Top-1 acc 62.109 (61.091)	Top-5 acc 82.031 (81.965)	lr 0.01107
Train [65][1190/3239]	Time 0.227 (0.582)	Data Time 0.001 (0.048)	Loss 2.6739 (2.6108)	Entropy 0.61872 (0.61963)	Top-1 acc 58.594 (61.084)	Top-5 acc 82.812 (81.961)	lr 0.01107
Train [65][1200/3239]	Time 0.406 (0.582)	Data Time 0.002 (0.049)	Loss 2.4770 (2.6108)	Entropy 0.61881 (0.61962)	Top-1 acc 65.234 (61.082)	Top-5 acc 83.203 (81.964)	lr 0.01107
Train [65][1210/3239]	Time 0.282 (0.581)	Data Time 0.001 (0.049)	Loss 2.7259 (2.6110)	Entropy 0.61852 (0.61961)	Top-1 acc 58.203 (61.077)	Top-5 acc 78.516 (81.955)	lr 0.01107
Train [65][1220/3239]	Time 0.278 (0.580)	Data Time 0.001 (0.048)	Loss 2.5575 (2.6114)	Entropy 0.61851 (0.61960)	Top-1 acc 60.156 (61.070)	Top-5 acc 85.547 (81.952)	lr 0.01107
Train [65][1230/3239]	Time 0.292 (0.579)	Data Time 0.034 (0.049)	Loss 2.4677 (2.6115)	Entropy 0.61911 (0.61960)	Top-1 acc 64.453 (61.074)	Top-5 acc 83.203 (81.952)	lr 0.01107
Train [65][1240/3239]	Time 0.237 (0.579)	Data Time 0.001 (0.049)	Loss 2.7063 (2.6119)	Entropy 0.61914 (0.61959)	Top-1 acc 59.766 (61.067)	Top-5 acc 78.906 (81.943)	lr 0.01107
Train [65][1250/3239]	Time 0.232 (0.578)	Data Time 0.001 (0.049)	Loss 2.6854 (2.6121)	Entropy 0.61962 (0.61959)	Top-1 acc 58.594 (61.062)	Top-5 acc 81.250 (81.937)	lr 0.01107
Train [65][1260/3239]	Time 0.258 (0.581)	Data Time 0.001 (0.052)	Loss 2.7471 (2.6121)	Entropy 0.61951 (0.61959)	Top-1 acc 58.984 (61.067)	Top-5 acc 79.688 (81.940)	lr 0.01107
Train [65][1270/3239]	Time 0.297 (0.580)	Data Time 0.002 (0.051)	Loss 2.5826 (2.6119)	Entropy 0.61958 (0.61959)	Top-1 acc 64.844 (61.073)	Top-5 acc 84.766 (81.944)	lr 0.01107
Train [65][1280/3239]	Time 0.248 (0.579)	Data Time 0.001 (0.051)	Loss 3.1012 (2.6119)	Entropy 0.61964 (0.61959)	Top-1 acc 51.172 (61.075)	Top-5 acc 69.141 (81.937)	lr 0.01106
Train [65][1290/3239]	Time 0.350 (0.578)	Data Time 0.002 (0.051)	Loss 2.4626 (2.6118)	Entropy 0.61956 (0.61959)	Top-1 acc 67.188 (61.077)	Top-5 acc 86.328 (81.944)	lr 0.01106
Train [65][1300/3239]	Time 0.245 (0.579)	Data Time 0.001 (0.052)	Loss 2.7245 (2.6123)	Entropy 0.61947 (0.61959)	Top-1 acc 58.594 (61.069)	Top-5 acc 78.125 (81.934)	lr 0.01106
Train [65][1310/3239]	Time 0.238 (0.578)	Data Time 0.001 (0.052)	Loss 2.4219 (2.6118)	Entropy 0.61947 (0.61959)	Top-1 acc 64.453 (61.078)	Top-5 acc 86.328 (81.940)	lr 0.01106
Train [65][1320/3239]	Time 0.259 (0.577)	Data Time 0.001 (0.052)	Loss 2.5300 (2.6115)	Entropy 0.61920 (0.61959)	Top-1 acc 60.547 (61.083)	Top-5 acc 83.203 (81.947)	lr 0.01106
Train [65][1330/3239]	Time 0.252 (0.580)	Data Time 0.001 (0.055)	Loss 2.5962 (2.6112)	Entropy 0.61919 (0.61958)	Top-1 acc 59.375 (61.086)	Top-5 acc 82.812 (81.952)	lr 0.01106
Train [65][1340/3239]	Time 0.246 (0.580)	Data Time 0.001 (0.055)	Loss 2.5338 (2.6113)	Entropy 0.61940 (0.61958)	Top-1 acc 61.328 (61.087)	Top-5 acc 83.203 (81.950)	lr 0.01106
Train [65][1350/3239]	Time 0.256 (0.579)	Data Time 0.002 (0.055)	Loss 2.4317 (2.6110)	Entropy 0.61975 (0.61958)	Top-1 acc 68.359 (61.093)	Top-5 acc 82.422 (81.955)	lr 0.01106
Train [65][1360/3239]	Time 0.345 (0.578)	Data Time 0.001 (0.054)	Loss 2.4527 (2.6106)	Entropy 0.61957 (0.61958)	Top-1 acc 63.281 (61.096)	Top-5 acc 85.547 (81.964)	lr 0.01106
Train [65][1370/3239]	Time 0.242 (0.579)	Data Time 0.001 (0.055)	Loss 2.8017 (2.6106)	Entropy 0.61950 (0.61958)	Top-1 acc 56.250 (61.098)	Top-5 acc 77.734 (81.960)	lr 0.01106
Train [65][1380/3239]	Time 0.240 (0.578)	Data Time 0.001 (0.055)	Loss 2.5845 (2.6109)	Entropy 0.61979 (0.61958)	Top-1 acc 63.672 (61.094)	Top-5 acc 83.203 (81.961)	lr 0.01105
Train [65][1390/3239]	Time 0.251 (0.577)	Data Time 0.001 (0.055)	Loss 2.6497 (2.6106)	Entropy 0.61965 (0.61958)	Top-1 acc 59.766 (61.108)	Top-5 acc 80.859 (81.967)	lr 0.01105
Train [65][1400/3239]	Time 0.230 (0.578)	Data Time 0.001 (0.057)	Loss 2.6738 (2.6104)	Entropy 0.61970 (0.61958)	Top-1 acc 56.250 (61.103)	Top-5 acc 81.641 (81.975)	lr 0.01105
Train [65][1410/3239]	Time 0.247 (0.577)	Data Time 0.001 (0.056)	Loss 2.5235 (2.6102)	Entropy 0.61986 (0.61958)	Top-1 acc 62.109 (61.109)	Top-5 acc 83.203 (81.976)	lr 0.01105
Train [65][1420/3239]	Time 0.237 (0.578)	Data Time 0.001 (0.057)	Loss 2.6731 (2.6108)	Entropy 0.61997 (0.61959)	Top-1 acc 60.156 (61.097)	Top-5 acc 79.297 (81.966)	lr 0.01105
Train [65][1430/3239]	Time 0.397 (0.579)	Data Time 0.001 (0.059)	Loss 2.4909 (2.6104)	Entropy 0.62019 (0.61959)	Top-1 acc 62.500 (61.097)	Top-5 acc 83.984 (81.970)	lr 0.01105
Train [65][1440/3239]	Time 0.283 (0.578)	Data Time 0.001 (0.059)	Loss 2.5355 (2.6100)	Entropy 0.62042 (0.61959)	Top-1 acc 64.062 (61.101)	Top-5 acc 82.422 (81.979)	lr 0.01105
Train [65][1450/3239]	Time 0.254 (0.577)	Data Time 0.001 (0.058)	Loss 2.5454 (2.6098)	Entropy 0.62057 (0.61960)	Top-1 acc 60.938 (61.108)	Top-5 acc 81.641 (81.982)	lr 0.01105
Train [65][1460/3239]	Time 0.255 (0.578)	Data Time 0.001 (0.060)	Loss 2.5505 (2.6100)	Entropy 0.62082 (0.61961)	Top-1 acc 59.375 (61.096)	Top-5 acc 82.812 (81.976)	lr 0.01105
Train [65][1470/3239]	Time 0.251 (0.578)	Data Time 0.001 (0.059)	Loss 2.4242 (2.6096)	Entropy 0.62052 (0.61961)	Top-1 acc 63.281 (61.112)	Top-5 acc 85.938 (81.983)	lr 0.01105
Train [65][1480/3239]	Time 0.254 (0.577)	Data Time 0.001 (0.059)	Loss 2.8383 (2.6097)	Entropy 0.62053 (0.61962)	Top-1 acc 55.859 (61.111)	Top-5 acc 75.391 (81.985)	lr 0.01104
Train [65][1490/3239]	Time 0.239 (0.578)	Data Time 0.002 (0.061)	Loss 2.5793 (2.6093)	Entropy 0.62025 (0.61963)	Top-1 acc 62.109 (61.119)	Top-5 acc 82.812 (81.988)	lr 0.01104
Train [65][1500/3239]	Time 0.255 (0.578)	Data Time 0.001 (0.061)	Loss 2.6226 (2.6092)	Entropy 0.62035 (0.61963)	Top-1 acc 59.375 (61.124)	Top-5 acc 80.469 (81.983)	lr 0.01104
Train [65][1510/3239]	Time 0.251 (0.577)	Data Time 0.001 (0.060)	Loss 2.6202 (2.6091)	Entropy 0.62026 (0.61963)	Top-1 acc 60.547 (61.119)	Top-5 acc 83.594 (81.984)	lr 0.01104
Train [65][1520/3239]	Time 0.401 (0.578)	Data Time 0.001 (0.062)	Loss 2.5472 (2.6093)	Entropy 0.62012 (0.61964)	Top-1 acc 62.891 (61.112)	Top-5 acc 83.984 (81.985)	lr 0.01104
Train [65][1530/3239]	Time 0.241 (0.577)	Data Time 0.001 (0.061)	Loss 2.6815 (2.6096)	Entropy 0.61978 (0.61964)	Top-1 acc 62.891 (61.103)	Top-5 acc 81.250 (81.980)	lr 0.01104
Train [65][1540/3239]	Time 0.227 (0.576)	Data Time 0.001 (0.061)	Loss 2.6494 (2.6097)	Entropy 0.61991 (0.61964)	Top-1 acc 61.719 (61.102)	Top-5 acc 82.031 (81.981)	lr 0.01104
Train [65][1550/3239]	Time 0.235 (0.578)	Data Time 0.001 (0.064)	Loss 2.6935 (2.6098)	Entropy 0.61964 (0.61964)	Top-1 acc 58.203 (61.102)	Top-5 acc 77.734 (81.978)	lr 0.01104
Train [65][1560/3239]	Time 0.319 (0.604)	Data Time 0.002 (0.064)	Loss 2.7337 (2.6095)	Entropy 0.61956 (0.61964)	Top-1 acc 57.812 (61.107)	Top-5 acc 80.078 (81.987)	lr 0.01104
Train [65][1570/3239]	Time 0.246 (0.603)	Data Time 0.002 (0.064)	Loss 2.5994 (2.6095)	Entropy 0.61974 (0.61964)	Top-1 acc 62.891 (61.110)	Top-5 acc 81.250 (81.984)	lr 0.01104
Train [65][1580/3239]	Time 0.248 (0.602)	Data Time 0.001 (0.063)	Loss 2.5554 (2.6092)	Entropy 0.61970 (0.61964)	Top-1 acc 61.719 (61.119)	Top-5 acc 83.203 (81.993)	lr 0.01103
Train [65][1590/3239]	Time 0.376 (0.601)	Data Time 0.002 (0.063)	Loss 2.5314 (2.6092)	Entropy 0.61955 (0.61964)	Top-1 acc 64.844 (61.121)	Top-5 acc 83.203 (81.995)	lr 0.01103
Train [65][1600/3239]	Time 0.259 (0.600)	Data Time 0.002 (0.062)	Loss 2.5650 (2.6097)	Entropy 0.61931 (0.61964)	Top-1 acc 61.719 (61.109)	Top-5 acc 81.641 (81.987)	lr 0.01103
Train [65][1610/3239]	Time 0.247 (0.599)	Data Time 0.002 (0.062)	Loss 2.3238 (2.6098)	Entropy 0.61918 (0.61964)	Top-1 acc 66.797 (61.110)	Top-5 acc 89.453 (81.990)	lr 0.01103
Train [65][1620/3239]	Time 0.250 (0.598)	Data Time 0.001 (0.062)	Loss 2.6284 (2.6099)	Entropy 0.61921 (0.61964)	Top-1 acc 62.500 (61.107)	Top-5 acc 82.812 (81.988)	lr 0.01103
Train [65][1630/3239]	Time 0.249 (0.597)	Data Time 0.001 (0.061)	Loss 2.4863 (2.6103)	Entropy 0.61908 (0.61963)	Top-1 acc 64.453 (61.097)	Top-5 acc 82.422 (81.977)	lr 0.01103
Train [65][1640/3239]	Time 0.286 (0.596)	Data Time 0.001 (0.061)	Loss 2.6024 (2.6103)	Entropy 0.61892 (0.61963)	Top-1 acc 64.062 (61.097)	Top-5 acc 80.078 (81.975)	lr 0.01103
Train [65][1650/3239]	Time 0.245 (0.595)	Data Time 0.001 (0.061)	Loss 2.6920 (2.6104)	Entropy 0.61911 (0.61963)	Top-1 acc 59.766 (61.092)	Top-5 acc 80.078 (81.973)	lr 0.01103
Train [65][1660/3239]	Time 0.570 (0.595)	Data Time 0.318 (0.061)	Loss 2.5818 (2.6106)	Entropy 0.61918 (0.61962)	Top-1 acc 62.109 (61.087)	Top-5 acc 79.688 (81.966)	lr 0.01103
Train [65][1670/3239]	Time 0.303 (0.596)	Data Time 0.033 (0.062)	Loss 2.6017 (2.6103)	Entropy 0.61921 (0.61962)	Top-1 acc 59.766 (61.090)	Top-5 acc 81.641 (81.972)	lr 0.01103
Train [65][1680/3239]	Time 0.373 (0.595)	Data Time 0.001 (0.062)	Loss 2.5794 (2.6102)	Entropy 0.61938 (0.61962)	Top-1 acc 60.938 (61.094)	Top-5 acc 83.594 (81.977)	lr 0.01102
Train [65][1690/3239]	Time 0.238 (0.598)	Data Time 0.002 (0.065)	Loss 2.5450 (2.6102)	Entropy 0.61947 (0.61962)	Top-1 acc 62.891 (61.094)	Top-5 acc 82.812 (81.972)	lr 0.01102
Train [65][1700/3239]	Time 0.240 (0.600)	Data Time 0.001 (0.067)	Loss 2.5167 (2.6104)	Entropy 0.61936 (0.61962)	Top-1 acc 63.672 (61.094)	Top-5 acc 85.156 (81.969)	lr 0.01102
Train [65][1710/3239]	Time 0.266 (0.599)	Data Time 0.001 (0.067)	Loss 2.7801 (2.6102)	Entropy 0.61904 (0.61961)	Top-1 acc 55.078 (61.097)	Top-5 acc 77.734 (81.973)	lr 0.01102
Train [65][1720/3239]	Time 0.645 (0.600)	Data Time 0.364 (0.069)	Loss 2.4660 (2.6099)	Entropy 0.61891 (0.61961)	Top-1 acc 64.453 (61.105)	Top-5 acc 83.594 (81.976)	lr 0.01102
Train [65][1730/3239]	Time 0.274 (0.603)	Data Time 0.001 (0.072)	Loss 2.6460 (2.6098)	Entropy 0.61896 (0.61961)	Top-1 acc 58.984 (61.110)	Top-5 acc 79.688 (81.982)	lr 0.01102
Train [65][1740/3239]	Time 0.245 (0.602)	Data Time 0.001 (0.072)	Loss 2.7184 (2.6101)	Entropy 0.61916 (0.61960)	Top-1 acc 58.984 (61.106)	Top-5 acc 80.078 (81.976)	lr 0.01102
Train [65][1750/3239]	Time 0.365 (0.603)	Data Time 0.001 (0.073)	Loss 2.5774 (2.6103)	Entropy 0.61908 (0.61960)	Top-1 acc 61.719 (61.097)	Top-5 acc 84.375 (81.973)	lr 0.01102
Train [65][1760/3239]	Time 0.256 (0.605)	Data Time 0.001 (0.075)	Loss 2.7127 (2.6106)	Entropy 0.61914 (0.61960)	Top-1 acc 59.766 (61.088)	Top-5 acc 79.297 (81.969)	lr 0.01102
Train [65][1770/3239]	Time 3.237 (0.605)	Data Time 2.985 (0.076)	Loss 2.5161 (2.6104)	Entropy 0.61951 (0.61960)	Top-1 acc 57.031 (61.093)	Top-5 acc 83.203 (81.970)	lr 0.01102
Train [65][1780/3239]	Time 0.276 (0.605)	Data Time 0.001 (0.076)	Loss 2.6506 (2.6104)	Entropy 0.61965 (0.61960)	Top-1 acc 62.891 (61.095)	Top-5 acc 80.078 (81.965)	lr 0.01101
Train [65][1790/3239]	Time 0.279 (0.609)	Data Time 0.001 (0.081)	Loss 2.6217 (2.6105)	Entropy 0.61971 (0.61960)	Top-1 acc 60.156 (61.092)	Top-5 acc 81.250 (81.961)	lr 0.01101
Train [65][1800/3239]	Time 0.258 (0.608)	Data Time 0.001 (0.080)	Loss 2.4557 (2.6102)	Entropy 0.61986 (0.61960)	Top-1 acc 67.969 (61.102)	Top-5 acc 83.203 (81.964)	lr 0.01101
Train [65][1810/3239]	Time 0.283 (0.608)	Data Time 0.001 (0.081)	Loss 2.4939 (2.6099)	Entropy 0.61996 (0.61960)	Top-1 acc 63.281 (61.107)	Top-5 acc 85.156 (81.973)	lr 0.01101
Train [65][1820/3239]	Time 0.248 (0.611)	Data Time 0.001 (0.084)	Loss 2.5400 (2.6097)	Entropy 0.61994 (0.61960)	Top-1 acc 62.109 (61.106)	Top-5 acc 82.422 (81.978)	lr 0.01101
Train [65][1830/3239]	Time 0.246 (0.611)	Data Time 0.001 (0.085)	Loss 2.7193 (2.6095)	Entropy 0.61988 (0.61960)	Top-1 acc 53.125 (61.109)	Top-5 acc 80.078 (81.986)	lr 0.01101
Train [65][1840/3239]	Time 0.327 (0.612)	Data Time 0.001 (0.086)	Loss 2.5614 (2.6098)	Entropy 0.61982 (0.61960)	Top-1 acc 61.719 (61.098)	Top-5 acc 82.422 (81.982)	lr 0.01101
Train [65][1850/3239]	Time 0.281 (0.615)	Data Time 0.001 (0.089)	Loss 2.5083 (2.6101)	Entropy 0.61973 (0.61961)	Top-1 acc 59.766 (61.094)	Top-5 acc 82.422 (81.974)	lr 0.01101
Train [65][1860/3239]	Time 0.257 (0.615)	Data Time 0.001 (0.090)	Loss 2.5260 (2.6103)	Entropy 0.61980 (0.61961)	Top-1 acc 68.750 (61.091)	Top-5 acc 83.984 (81.974)	lr 0.01101
Train [65][1870/3239]	Time 0.238 (0.615)	Data Time 0.001 (0.090)	Loss 2.6331 (2.6103)	Entropy 0.61979 (0.61961)	Top-1 acc 57.812 (61.095)	Top-5 acc 81.250 (81.976)	lr 0.01101
Train [65][1880/3239]	Time 0.258 (0.615)	Data Time 0.001 (0.091)	Loss 2.4175 (2.6103)	Entropy 0.62002 (0.61961)	Top-1 acc 64.844 (61.095)	Top-5 acc 85.156 (81.972)	lr 0.01100
Train [65][1890/3239]	Time 0.286 (0.618)	Data Time 0.001 (0.095)	Loss 2.6435 (2.6101)	Entropy 0.61996 (0.61961)	Top-1 acc 60.547 (61.104)	Top-5 acc 82.812 (81.975)	lr 0.01100
Train [65][1900/3239]	Time 0.235 (0.618)	Data Time 0.002 (0.094)	Loss 2.6300 (2.6101)	Entropy 0.62002 (0.61961)	Top-1 acc 60.156 (61.102)	Top-5 acc 81.641 (81.973)	lr 0.01100
Train [65][1910/3239]	Time 0.344 (0.620)	Data Time 0.001 (0.097)	Loss 2.5042 (2.6098)	Entropy 0.62013 (0.61961)	Top-1 acc 61.719 (61.105)	Top-5 acc 83.594 (81.976)	lr 0.01100
Train [65][1920/3239]	Time 0.252 (0.623)	Data Time 0.001 (0.100)	Loss 2.5028 (2.6096)	Entropy 0.62031 (0.61962)	Top-1 acc 63.672 (61.108)	Top-5 acc 83.203 (81.982)	lr 0.01100
Train [65][1930/3239]	Time 0.244 (0.622)	Data Time 0.001 (0.100)	Loss 2.5383 (2.6098)	Entropy 0.62062 (0.61962)	Top-1 acc 64.062 (61.107)	Top-5 acc 83.594 (81.978)	lr 0.01100
Train [65][1940/3239]	Time 0.248 (0.624)	Data Time 0.001 (0.103)	Loss 2.8811 (2.6101)	Entropy 0.62074 (0.61963)	Top-1 acc 55.859 (61.101)	Top-5 acc 78.516 (81.971)	lr 0.01100
Train [65][1950/3239]	Time 0.252 (0.625)	Data Time 0.001 (0.105)	Loss 2.6029 (2.6102)	Entropy 0.62054 (0.61963)	Top-1 acc 62.500 (61.097)	Top-5 acc 81.641 (81.970)	lr 0.01100
Train [65][1960/3239]	Time 0.253 (0.625)	Data Time 0.001 (0.104)	Loss 2.7661 (2.6103)	Entropy 0.62062 (0.61964)	Top-1 acc 59.375 (61.092)	Top-5 acc 78.906 (81.968)	lr 0.01100
Train [65][1970/3239]	Time 0.243 (0.625)	Data Time 0.001 (0.105)	Loss 2.5388 (2.6103)	Entropy 0.62061 (0.61964)	Top-1 acc 65.625 (61.092)	Top-5 acc 84.766 (81.970)	lr 0.01100
Train [65][1980/3239]	Time 0.257 (0.631)	Data Time 0.001 (0.112)	Loss 2.7058 (2.6106)	Entropy 0.62075 (0.61965)	Top-1 acc 60.547 (61.080)	Top-5 acc 81.641 (81.967)	lr 0.01099
Train [65][1990/3239]	Time 0.237 (0.630)	Data Time 0.001 (0.111)	Loss 2.5810 (2.6106)	Entropy 0.62082 (0.61965)	Top-1 acc 65.234 (61.082)	Top-5 acc 81.641 (81.958)	lr 0.01099
Train [65][2000/3239]	Time 0.252 (0.629)	Data Time 0.001 (0.111)	Loss 2.5273 (2.6105)	Entropy 0.62073 (0.61966)	Top-1 acc 60.938 (61.085)	Top-5 acc 84.375 (81.963)	lr 0.01099
Train [65][2010/3239]	Time 0.227 (0.635)	Data Time 0.001 (0.117)	Loss 2.5893 (2.6109)	Entropy 0.62066 (0.61966)	Top-1 acc 64.453 (61.078)	Top-5 acc 81.250 (81.955)	lr 0.01099
Train [65][2020/3239]	Time 0.255 (0.635)	Data Time 0.001 (0.117)	Loss 2.5771 (2.6105)	Entropy 0.62070 (0.61967)	Top-1 acc 60.156 (61.082)	Top-5 acc 82.812 (81.966)	lr 0.01099
Train [65][2030/3239]	Time 0.247 (0.634)	Data Time 0.001 (0.117)	Loss 2.6771 (2.6102)	Entropy 0.62081 (0.61967)	Top-1 acc 58.594 (61.092)	Top-5 acc 80.469 (81.969)	lr 0.01099
Train [65][2040/3239]	Time 0.259 (0.639)	Data Time 0.001 (0.122)	Loss 2.6025 (2.6104)	Entropy 0.62113 (0.61968)	Top-1 acc 59.375 (61.088)	Top-5 acc 81.641 (81.966)	lr 0.01099
Train [65][2050/3239]	Time 0.433 (0.639)	Data Time 0.194 (0.123)	Loss 2.5520 (2.6105)	Entropy 0.62137 (0.61969)	Top-1 acc 58.984 (61.077)	Top-5 acc 84.766 (81.967)	lr 0.01099
Train [65][2060/3239]	Time 0.248 (0.640)	Data Time 0.001 (0.124)	Loss 2.4825 (2.6105)	Entropy 0.62104 (0.61969)	Top-1 acc 65.625 (61.079)	Top-5 acc 83.984 (81.967)	lr 0.01099
Train [65][2070/3239]	Time 0.341 (0.646)	Data Time 0.001 (0.131)	Loss 2.5528 (2.6107)	Entropy 0.62101 (0.61970)	Top-1 acc 62.109 (61.073)	Top-5 acc 82.031 (81.962)	lr 0.01099
Train [65][2080/3239]	Time 0.254 (0.646)	Data Time 0.002 (0.131)	Loss 2.6190 (2.6106)	Entropy 0.62072 (0.61971)	Top-1 acc 62.891 (61.073)	Top-5 acc 83.594 (81.966)	lr 0.01098
Train [65][2090/3239]	Time 1.417 (0.645)	Data Time 1.180 (0.131)	Loss 2.6479 (2.6103)	Entropy 0.62043 (0.61971)	Top-1 acc 57.812 (61.078)	Top-5 acc 80.078 (81.972)	lr 0.01098
Train [65][2100/3239]	Time 0.243 (0.654)	Data Time 0.001 (0.140)	Loss 2.5781 (2.6103)	Entropy 0.62034 (0.61971)	Top-1 acc 60.938 (61.071)	Top-5 acc 82.812 (81.973)	lr 0.01098
Train [65][2110/3239]	Time 0.242 (0.652)	Data Time 0.001 (0.139)	Loss 2.6578 (2.6104)	Entropy 0.62044 (0.61972)	Top-1 acc 60.156 (61.066)	Top-5 acc 81.250 (81.971)	lr 0.01098
Train [65][2120/3239]	Time 0.255 (0.651)	Data Time 0.002 (0.138)	Loss 2.6531 (2.6104)	Entropy 0.62054 (0.61972)	Top-1 acc 61.328 (61.068)	Top-5 acc 80.469 (81.967)	lr 0.01098
Train [65][2130/3239]	Time 0.233 (0.651)	Data Time 0.001 (0.138)	Loss 2.5667 (2.6103)	Entropy 0.62086 (0.61973)	Top-1 acc 62.891 (61.071)	Top-5 acc 83.594 (81.966)	lr 0.01098
Train [65][2140/3239]	Time 0.353 (0.658)	Data Time 0.001 (0.146)	Loss 2.6235 (2.6105)	Entropy 0.62111 (0.61973)	Top-1 acc 60.938 (61.065)	Top-5 acc 84.375 (81.965)	lr 0.01098
Train [65][2150/3239]	Time 0.223 (0.657)	Data Time 0.001 (0.146)	Loss 2.5716 (2.6102)	Entropy 0.62097 (0.61974)	Top-1 acc 65.625 (61.074)	Top-5 acc 79.297 (81.967)	lr 0.01098
Train [65][2160/3239]	Time 0.246 (0.657)	Data Time 0.001 (0.146)	Loss 2.6930 (2.6103)	Entropy 0.62083 (0.61974)	Top-1 acc 57.422 (61.072)	Top-5 acc 83.594 (81.967)	lr 0.01098
Train [65][2170/3239]	Time 0.234 (0.664)	Data Time 0.001 (0.153)	Loss 2.5675 (2.6102)	Entropy 0.62078 (0.61975)	Top-1 acc 62.891 (61.076)	Top-5 acc 82.812 (81.968)	lr 0.01098
Train [65][2180/3239]	Time 0.232 (0.665)	Data Time 0.001 (0.154)	Loss 2.8151 (2.6103)	Entropy 0.62056 (0.61975)	Top-1 acc 50.781 (61.071)	Top-5 acc 75.781 (81.963)	lr 0.01097
Train [65][2190/3239]	Time 0.250 (0.664)	Data Time 0.002 (0.153)	Loss 2.6060 (2.6103)	Entropy 0.62051 (0.61976)	Top-1 acc 62.891 (61.073)	Top-5 acc 79.297 (81.963)	lr 0.01097
Train [65][2200/3239]	Time 0.245 (0.671)	Data Time 0.001 (0.161)	Loss 2.4790 (2.6100)	Entropy 0.62019 (0.61976)	Top-1 acc 64.062 (61.077)	Top-5 acc 85.547 (81.968)	lr 0.01097
Train [65][2210/3239]	Time 0.314 (0.688)	Data Time 0.006 (0.160)	Loss 2.8344 (2.6102)	Entropy 0.62015 (0.61976)	Top-1 acc 56.641 (61.074)	Top-5 acc 77.344 (81.966)	lr 0.01097
Train [65][2220/3239]	Time 0.241 (0.687)	Data Time 0.002 (0.159)	Loss 2.5108 (2.6104)	Entropy 0.61982 (0.61976)	Top-1 acc 64.844 (61.067)	Top-5 acc 84.375 (81.961)	lr 0.01097
Train [65][2230/3239]	Time 0.381 (0.686)	Data Time 0.002 (0.159)	Loss 2.7085 (2.6103)	Entropy 0.61975 (0.61976)	Top-1 acc 58.594 (61.070)	Top-5 acc 80.078 (81.964)	lr 0.01097
Train [65][2240/3239]	Time 0.243 (0.685)	Data Time 0.001 (0.158)	Loss 2.6598 (2.6106)	Entropy 0.61987 (0.61976)	Top-1 acc 62.109 (61.063)	Top-5 acc 81.641 (81.960)	lr 0.01097
Train [65][2250/3239]	Time 0.247 (0.684)	Data Time 0.001 (0.157)	Loss 2.6092 (2.6105)	Entropy 0.61982 (0.61976)	Top-1 acc 64.453 (61.069)	Top-5 acc 80.859 (81.961)	lr 0.01097
Train [65][2260/3239]	Time 0.237 (0.683)	Data Time 0.001 (0.156)	Loss 2.6185 (2.6104)	Entropy 0.61956 (0.61976)	Top-1 acc 61.719 (61.071)	Top-5 acc 80.859 (81.960)	lr 0.01097
Train [65][2270/3239]	Time 0.246 (0.681)	Data Time 0.001 (0.156)	Loss 2.6516 (2.6102)	Entropy 0.61971 (0.61976)	Top-1 acc 59.766 (61.074)	Top-5 acc 81.250 (81.964)	lr 0.01097
Train [65][2280/3239]	Time 0.243 (0.685)	Data Time 0.001 (0.160)	Loss 2.4574 (2.6099)	Entropy 0.61959 (0.61976)	Top-1 acc 64.844 (61.082)	Top-5 acc 83.984 (81.972)	lr 0.01096
Train [65][2290/3239]	Time 0.237 (0.684)	Data Time 0.001 (0.159)	Loss 2.4282 (2.6101)	Entropy 0.61962 (0.61976)	Top-1 acc 65.625 (61.076)	Top-5 acc 85.156 (81.968)	lr 0.01096
Train [65][2300/3239]	Time 0.376 (0.687)	Data Time 0.001 (0.162)	Loss 2.6900 (2.6101)	Entropy 0.61953 (0.61976)	Top-1 acc 59.766 (61.075)	Top-5 acc 82.031 (81.968)	lr 0.01096
Train [65][2310/3239]	Time 0.245 (0.691)	Data Time 0.001 (0.167)	Loss 2.5975 (2.6099)	Entropy 0.61945 (0.61976)	Top-1 acc 62.891 (61.081)	Top-5 acc 82.812 (81.972)	lr 0.01096
Train [65][2320/3239]	Time 0.265 (0.690)	Data Time 0.001 (0.166)	Loss 2.5347 (2.6099)	Entropy 0.61946 (0.61976)	Top-1 acc 64.062 (61.084)	Top-5 acc 82.031 (81.973)	lr 0.01096
Train [65][2330/3239]	Time 0.240 (0.695)	Data Time 0.001 (0.171)	Loss 2.5537 (2.6099)	Entropy 0.61961 (0.61976)	Top-1 acc 58.984 (61.086)	Top-5 acc 82.812 (81.975)	lr 0.01096
Train [65][2340/3239]	Time 0.883 (0.697)	Data Time 0.627 (0.174)	Loss 2.6885 (2.6097)	Entropy 0.61962 (0.61975)	Top-1 acc 60.156 (61.087)	Top-5 acc 79.688 (81.976)	lr 0.01096
Train [65][2350/3239]	Time 0.242 (0.697)	Data Time 0.001 (0.174)	Loss 2.6315 (2.6095)	Entropy 0.61974 (0.61975)	Top-1 acc 63.672 (61.092)	Top-5 acc 80.078 (81.981)	lr 0.01096
Train [65][2360/3239]	Time 0.240 (0.702)	Data Time 0.001 (0.180)	Loss 2.6021 (2.6092)	Entropy 0.61999 (0.61975)	Top-1 acc 60.938 (61.096)	Top-5 acc 80.469 (81.985)	lr 0.01096
Train [65][2370/3239]	Time 2.069 (0.702)	Data Time 1.777 (0.180)	Loss 2.6661 (2.6093)	Entropy 0.61955 (0.61975)	Top-1 acc 60.156 (61.096)	Top-5 acc 79.688 (81.983)	lr 0.01096
Train [65][2380/3239]	Time 0.262 (0.704)	Data Time 0.001 (0.182)	Loss 2.6620 (2.6093)	Entropy 0.61922 (0.61975)	Top-1 acc 61.719 (61.096)	Top-5 acc 80.469 (81.980)	lr 0.01095
Train [65][2390/3239]	Time 0.375 (0.710)	Data Time 0.002 (0.188)	Loss 2.5567 (2.6092)	Entropy 0.61904 (0.61975)	Top-1 acc 63.672 (61.096)	Top-5 acc 82.812 (81.984)	lr 0.01095
Train [65][2400/3239]	Time 0.296 (0.709)	Data Time 0.002 (0.188)	Loss 2.6202 (2.6091)	Entropy 0.61904 (0.61975)	Top-1 acc 61.328 (61.098)	Top-5 acc 83.594 (81.987)	lr 0.01095
Train [65][2410/3239]	Time 0.241 (0.710)	Data Time 0.001 (0.189)	Loss 2.4865 (2.6094)	Entropy 0.61917 (0.61974)	Top-1 acc 62.109 (61.090)	Top-5 acc 84.375 (81.984)	lr 0.01095
Train [65][2420/3239]	Time 0.239 (0.717)	Data Time 0.002 (0.197)	Loss 2.7127 (2.6095)	Entropy 0.61893 (0.61974)	Top-1 acc 59.766 (61.086)	Top-5 acc 79.297 (81.980)	lr 0.01095
Train [65][2430/3239]	Time 0.254 (0.716)	Data Time 0.001 (0.196)	Loss 2.7262 (2.6094)	Entropy 0.61898 (0.61974)	Top-1 acc 58.203 (61.088)	Top-5 acc 76.953 (81.982)	lr 0.01095
Train [65][2440/3239]	Time 1.730 (0.716)	Data Time 1.495 (0.196)	Loss 2.4133 (2.6095)	Entropy 0.61923 (0.61974)	Top-1 acc 66.016 (61.083)	Top-5 acc 85.156 (81.981)	lr 0.01095
Train [65][2450/3239]	Time 0.252 (0.715)	Data Time 0.001 (0.196)	Loss 2.7101 (2.6097)	Entropy 0.61941 (0.61973)	Top-1 acc 60.547 (61.079)	Top-5 acc 77.344 (81.975)	lr 0.01095
Train [65][2460/3239]	Time 0.346 (0.723)	Data Time 0.001 (0.204)	Loss 2.3999 (2.6098)	Entropy 0.61946 (0.61973)	Top-1 acc 65.234 (61.076)	Top-5 acc 85.938 (81.974)	lr 0.01095
Train [65][2470/3239]	Time 0.256 (0.723)	Data Time 0.001 (0.204)	Loss 2.6486 (2.6099)	Entropy 0.61928 (0.61973)	Top-1 acc 62.500 (61.078)	Top-5 acc 82.812 (81.973)	lr 0.01095
Train [65][2480/3239]	Time 0.241 (0.722)	Data Time 0.001 (0.204)	Loss 2.6413 (2.6098)	Entropy 0.61944 (0.61973)	Top-1 acc 61.328 (61.076)	Top-5 acc 81.641 (81.972)	lr 0.01094
Train [65][2490/3239]	Time 0.257 (0.731)	Data Time 0.001 (0.213)	Loss 2.6428 (2.6098)	Entropy 0.61965 (0.61973)	Top-1 acc 60.156 (61.079)	Top-5 acc 79.688 (81.976)	lr 0.01094
Train [65][2500/3239]	Time 0.243 (0.730)	Data Time 0.002 (0.212)	Loss 2.5743 (2.6097)	Entropy 0.61999 (0.61973)	Top-1 acc 57.812 (61.074)	Top-5 acc 83.984 (81.980)	lr 0.01094
Train [65][2510/3239]	Time 0.240 (0.729)	Data Time 0.001 (0.212)	Loss 2.5775 (2.6098)	Entropy 0.62031 (0.61973)	Top-1 acc 60.938 (61.070)	Top-5 acc 82.031 (81.981)	lr 0.01094
Train [65][2520/3239]	Time 0.244 (0.737)	Data Time 0.001 (0.220)	Loss 2.8445 (2.6100)	Entropy 0.62040 (0.61973)	Top-1 acc 56.250 (61.067)	Top-5 acc 76.172 (81.978)	lr 0.01094
Train [65][2530/3239]	Time 0.240 (0.736)	Data Time 0.001 (0.219)	Loss 2.6932 (2.6103)	Entropy 0.62053 (0.61974)	Top-1 acc 59.375 (61.061)	Top-5 acc 77.734 (81.974)	lr 0.01094
Train [65][2540/3239]	Time 0.262 (0.735)	Data Time 0.001 (0.219)	Loss 2.4109 (2.6103)	Entropy 0.62059 (0.61974)	Top-1 acc 65.625 (61.059)	Top-5 acc 85.156 (81.974)	lr 0.01094
Train [65][2550/3239]	Time 0.274 (0.745)	Data Time 0.001 (0.229)	Loss 2.6171 (2.6102)	Entropy 0.62021 (0.61974)	Top-1 acc 57.031 (61.059)	Top-5 acc 81.641 (81.972)	lr 0.01094
Train [65][2560/3239]	Time 0.244 (0.743)	Data Time 0.001 (0.228)	Loss 2.7706 (2.6104)	Entropy 0.62039 (0.61975)	Top-1 acc 60.547 (61.056)	Top-5 acc 80.859 (81.971)	lr 0.01094
Train [65][2570/3239]	Time 0.251 (0.744)	Data Time 0.002 (0.228)	Loss 2.7598 (2.6104)	Entropy 0.62048 (0.61975)	Top-1 acc 62.109 (61.058)	Top-5 acc 80.859 (81.973)	lr 0.01094
Train [65][2580/3239]	Time 0.264 (0.752)	Data Time 0.001 (0.236)	Loss 2.5158 (2.6102)	Entropy 0.62033 (0.61975)	Top-1 acc 60.547 (61.065)	Top-5 acc 84.375 (81.975)	lr 0.01093
Train [65][2590/3239]	Time 0.263 (0.751)	Data Time 0.002 (0.236)	Loss 2.6076 (2.6104)	Entropy 0.62053 (0.61975)	Top-1 acc 60.938 (61.061)	Top-5 acc 82.031 (81.971)	lr 0.01093
Train [65][2600/3239]	Time 0.624 (0.750)	Data Time 0.376 (0.235)	Loss 2.5220 (2.6103)	Entropy 0.62033 (0.61976)	Top-1 acc 60.547 (61.059)	Top-5 acc 83.203 (81.975)	lr 0.01093
Train [65][2610/3239]	Time 0.258 (0.749)	Data Time 0.002 (0.234)	Loss 2.7222 (2.6103)	Entropy 0.62022 (0.61976)	Top-1 acc 54.297 (61.057)	Top-5 acc 79.297 (81.973)	lr 0.01093
Train [65][2620/3239]	Time 0.358 (0.757)	Data Time 0.001 (0.243)	Loss 2.4914 (2.6102)	Entropy 0.62009 (0.61976)	Top-1 acc 65.625 (61.054)	Top-5 acc 85.547 (81.974)	lr 0.01093
Train [65][2630/3239]	Time 0.250 (0.755)	Data Time 0.001 (0.242)	Loss 2.5221 (2.6100)	Entropy 0.62007 (0.61976)	Top-1 acc 66.016 (61.059)	Top-5 acc 82.812 (81.979)	lr 0.01093
Train [65][2640/3239]	Time 0.279 (0.754)	Data Time 0.001 (0.241)	Loss 2.5548 (2.6101)	Entropy 0.62040 (0.61976)	Top-1 acc 61.328 (61.053)	Top-5 acc 84.766 (81.979)	lr 0.01093
Train [65][2650/3239]	Time 0.246 (0.764)	Data Time 0.001 (0.250)	Loss 2.6553 (2.6102)	Entropy 0.62026 (0.61977)	Top-1 acc 56.250 (61.052)	Top-5 acc 82.812 (81.980)	lr 0.01093
Train [65][2660/3239]	Time 0.248 (0.762)	Data Time 0.001 (0.250)	Loss 2.5735 (2.6098)	Entropy 0.62050 (0.61977)	Top-1 acc 60.547 (61.059)	Top-5 acc 82.031 (81.987)	lr 0.01093
Train [65][2670/3239]	Time 0.258 (0.761)	Data Time 0.002 (0.249)	Loss 2.8482 (2.6099)	Entropy 0.62027 (0.61977)	Top-1 acc 56.250 (61.057)	Top-5 acc 79.297 (81.988)	lr 0.01093
Train [65][2680/3239]	Time 0.263 (0.769)	Data Time 0.001 (0.257)	Loss 2.5055 (2.6099)	Entropy 0.62024 (0.61977)	Top-1 acc 63.672 (61.054)	Top-5 acc 84.766 (81.990)	lr 0.01092
Train [65][2690/3239]	Time 0.349 (0.768)	Data Time 0.001 (0.256)	Loss 2.7277 (2.6102)	Entropy 0.62023 (0.61977)	Top-1 acc 58.203 (61.043)	Top-5 acc 82.031 (81.988)	lr 0.01092
Train [65][2700/3239]	Time 0.255 (0.767)	Data Time 0.001 (0.255)	Loss 2.6074 (2.6101)	Entropy 0.62015 (0.61977)	Top-1 acc 61.328 (61.048)	Top-5 acc 82.812 (81.990)	lr 0.01092
Train [65][2710/3239]	Time 0.247 (0.776)	Data Time 0.001 (0.265)	Loss 2.4698 (2.6102)	Entropy 0.61991 (0.61978)	Top-1 acc 66.016 (61.043)	Top-5 acc 83.203 (81.988)	lr 0.01092
Train [65][2720/3239]	Time 0.245 (0.775)	Data Time 0.001 (0.264)	Loss 2.5949 (2.6104)	Entropy 0.61994 (0.61978)	Top-1 acc 62.500 (61.037)	Top-5 acc 84.375 (81.984)	lr 0.01092
Train [65][2730/3239]	Time 0.235 (0.774)	Data Time 0.001 (0.263)	Loss 2.7246 (2.6102)	Entropy 0.61994 (0.61978)	Top-1 acc 58.203 (61.043)	Top-5 acc 78.516 (81.986)	lr 0.01092
Train [65][2740/3239]	Time 0.245 (0.783)	Data Time 0.001 (0.272)	Loss 2.5724 (2.6103)	Entropy 0.62023 (0.61978)	Top-1 acc 60.156 (61.040)	Top-5 acc 82.031 (81.985)	lr 0.01092
Train [65][2750/3239]	Time 0.254 (0.781)	Data Time 0.001 (0.272)	Loss 2.5210 (2.6102)	Entropy 0.62041 (0.61978)	Top-1 acc 65.625 (61.047)	Top-5 acc 84.766 (81.990)	lr 0.01092
Train [65][2760/3239]	Time 0.258 (0.780)	Data Time 0.002 (0.271)	Loss 2.5069 (2.6103)	Entropy 0.62067 (0.61978)	Top-1 acc 64.453 (61.044)	Top-5 acc 82.031 (81.986)	lr 0.01092
Train [65][2770/3239]	Time 0.224 (0.779)	Data Time 0.001 (0.270)	Loss 2.7027 (2.6102)	Entropy 0.62088 (0.61979)	Top-1 acc 58.203 (61.044)	Top-5 acc 80.469 (81.987)	lr 0.01092
Train [65][2780/3239]	Time 0.333 (0.787)	Data Time 0.001 (0.278)	Loss 2.5459 (2.6102)	Entropy 0.62094 (0.61979)	Top-1 acc 63.281 (61.043)	Top-5 acc 82.422 (81.987)	lr 0.01091
Train [65][2790/3239]	Time 0.239 (0.786)	Data Time 0.001 (0.277)	Loss 2.7019 (2.6104)	Entropy 0.62089 (0.61979)	Top-1 acc 55.859 (61.037)	Top-5 acc 81.250 (81.982)	lr 0.01091
Train [65][2800/3239]	Time 0.249 (0.784)	Data Time 0.001 (0.276)	Loss 2.6191 (2.6106)	Entropy 0.62076 (0.61980)	Top-1 acc 60.156 (61.030)	Top-5 acc 79.688 (81.979)	lr 0.01091
Train [65][2810/3239]	Time 0.224 (0.791)	Data Time 0.001 (0.283)	Loss 2.4866 (2.6105)	Entropy 0.62096 (0.61980)	Top-1 acc 66.406 (61.034)	Top-5 acc 85.156 (81.981)	lr 0.01091
Train [65][2820/3239]	Time 0.242 (0.790)	Data Time 0.001 (0.282)	Loss 2.4918 (2.6103)	Entropy 0.62120 (0.61981)	Top-1 acc 60.156 (61.037)	Top-5 acc 85.547 (81.987)	lr 0.01091
Train [65][2830/3239]	Time 0.344 (0.789)	Data Time 0.001 (0.281)	Loss 2.7118 (2.6104)	Entropy 0.62135 (0.61981)	Top-1 acc 56.641 (61.030)	Top-5 acc 78.125 (81.981)	lr 0.01091
Train [65][2840/3239]	Time 0.239 (0.797)	Data Time 0.001 (0.289)	Loss 2.5336 (2.6103)	Entropy 0.62144 (0.61982)	Top-1 acc 64.453 (61.033)	Top-5 acc 83.203 (81.984)	lr 0.01091
Train [65][2850/3239]	Time 0.358 (0.795)	Data Time 0.001 (0.288)	Loss 2.8603 (2.6105)	Entropy 0.62128 (0.61982)	Top-1 acc 58.594 (61.027)	Top-5 acc 76.562 (81.981)	lr 0.01091
Train [65][2860/3239]	Time 0.266 (0.794)	Data Time 0.001 (0.287)	Loss 2.7353 (2.6106)	Entropy 0.62122 (0.61983)	Top-1 acc 58.594 (61.024)	Top-5 acc 78.125 (81.978)	lr 0.01091
Train [65][2870/3239]	Time 0.256 (0.807)	Data Time 0.002 (0.286)	Loss 2.8231 (2.6109)	Entropy 0.62135 (0.61983)	Top-1 acc 53.516 (61.021)	Top-5 acc 78.516 (81.972)	lr 0.01091
Train [65][2880/3239]	Time 0.246 (0.806)	Data Time 0.002 (0.285)	Loss 2.6575 (2.6109)	Entropy 0.62156 (0.61984)	Top-1 acc 62.500 (61.025)	Top-5 acc 81.641 (81.973)	lr 0.01090
Train [65][2890/3239]	Time 0.244 (0.805)	Data Time 0.002 (0.284)	Loss 2.4901 (2.6109)	Entropy 0.62176 (0.61984)	Top-1 acc 64.453 (61.025)	Top-5 acc 83.594 (81.968)	lr 0.01090
Train [65][2900/3239]	Time 0.257 (0.804)	Data Time 0.001 (0.284)	Loss 2.6450 (2.6107)	Entropy 0.62136 (0.61985)	Top-1 acc 61.719 (61.029)	Top-5 acc 79.297 (81.969)	lr 0.01090
Train [65][2910/3239]	Time 0.248 (0.803)	Data Time 0.001 (0.283)	Loss 2.5986 (2.6105)	Entropy 0.62137 (0.61985)	Top-1 acc 61.328 (61.037)	Top-5 acc 82.031 (81.977)	lr 0.01090
Train [65][2920/3239]	Time 0.260 (0.802)	Data Time 0.001 (0.282)	Loss 2.6616 (2.6105)	Entropy 0.62155 (0.61986)	Top-1 acc 59.375 (61.033)	Top-5 acc 78.516 (81.976)	lr 0.01090
Train [65][2930/3239]	Time 0.251 (0.804)	Data Time 0.001 (0.284)	Loss 2.6883 (2.6105)	Entropy 0.62155 (0.61987)	Top-1 acc 62.500 (61.035)	Top-5 acc 80.469 (81.977)	lr 0.01090
Train [65][2940/3239]	Time 0.342 (0.808)	Data Time 0.001 (0.289)	Loss 2.6398 (2.6107)	Entropy 0.62138 (0.61987)	Top-1 acc 60.156 (61.028)	Top-5 acc 81.641 (81.974)	lr 0.01090
Train [65][2950/3239]	Time 0.249 (0.807)	Data Time 0.001 (0.288)	Loss 2.5828 (2.6108)	Entropy 0.62145 (0.61988)	Top-1 acc 61.719 (61.026)	Top-5 acc 80.078 (81.973)	lr 0.01090
Train [65][2960/3239]	Time 0.239 (0.805)	Data Time 0.001 (0.287)	Loss 2.5936 (2.6107)	Entropy 0.62141 (0.61988)	Top-1 acc 61.719 (61.031)	Top-5 acc 83.984 (81.974)	lr 0.01090
Train [65][2970/3239]	Time 0.255 (0.813)	Data Time 0.001 (0.295)	Loss 2.7057 (2.6109)	Entropy 0.62094 (0.61989)	Top-1 acc 56.250 (61.025)	Top-5 acc 81.250 (81.974)	lr 0.01090
Train [65][2980/3239]	Time 0.243 (0.812)	Data Time 0.001 (0.294)	Loss 2.6046 (2.6109)	Entropy 0.62093 (0.61989)	Top-1 acc 60.156 (61.023)	Top-5 acc 82.031 (81.974)	lr 0.01089
Train [65][2990/3239]	Time 0.251 (0.810)	Data Time 0.001 (0.293)	Loss 2.7842 (2.6109)	Entropy 0.62129 (0.61989)	Top-1 acc 57.812 (61.018)	Top-5 acc 80.469 (81.974)	lr 0.01089
Train [65][3000/3239]	Time 0.234 (0.817)	Data Time 0.001 (0.300)	Loss 2.7155 (2.6110)	Entropy 0.62083 (0.61990)	Top-1 acc 57.031 (61.014)	Top-5 acc 78.516 (81.972)	lr 0.01089
Train [65][3010/3239]	Time 0.356 (0.815)	Data Time 0.001 (0.299)	Loss 2.7043 (2.6109)	Entropy 0.62075 (0.61990)	Top-1 acc 57.812 (61.015)	Top-5 acc 79.297 (81.970)	lr 0.01089
Train [65][3020/3239]	Time 0.254 (0.814)	Data Time 0.001 (0.298)	Loss 2.4922 (2.6109)	Entropy 0.62032 (0.61990)	Top-1 acc 67.578 (61.013)	Top-5 acc 85.547 (81.975)	lr 0.01089
Train [65][3030/3239]	Time 0.234 (0.821)	Data Time 0.001 (0.305)	Loss 2.5985 (2.6108)	Entropy 0.62032 (0.61990)	Top-1 acc 59.375 (61.016)	Top-5 acc 81.250 (81.976)	lr 0.01089
Train [65][3040/3239]	Time 0.250 (0.820)	Data Time 0.001 (0.304)	Loss 2.6049 (2.6107)	Entropy 0.62008 (0.61991)	Top-1 acc 58.984 (61.018)	Top-5 acc 83.594 (81.977)	lr 0.01089
Train [65][3050/3239]	Time 0.259 (0.820)	Data Time 0.001 (0.305)	Loss 2.3621 (2.6104)	Entropy 0.62031 (0.61991)	Top-1 acc 69.531 (61.028)	Top-5 acc 86.719 (81.983)	lr 0.01089
Train [65][3060/3239]	Time 0.247 (0.826)	Data Time 0.001 (0.310)	Loss 2.5656 (2.6104)	Entropy 0.62018 (0.61991)	Top-1 acc 64.844 (61.031)	Top-5 acc 83.594 (81.985)	lr 0.01089
Train [65][3070/3239]	Time 0.237 (0.824)	Data Time 0.001 (0.309)	Loss 2.5591 (2.6104)	Entropy 0.62042 (0.61991)	Top-1 acc 58.984 (61.027)	Top-5 acc 84.375 (81.985)	lr 0.01089
Train [65][3080/3239]	Time 0.235 (0.823)	Data Time 0.001 (0.308)	Loss 2.7712 (2.6105)	Entropy 0.62057 (0.61991)	Top-1 acc 53.906 (61.027)	Top-5 acc 80.859 (81.986)	lr 0.01088
Train [65][3090/3239]	Time 10.601 (0.827)	Data Time 10.328 (0.312)	Loss 2.2938 (2.6105)	Entropy 0.62028 (0.61991)	Top-1 acc 71.094 (61.027)	Top-5 acc 89.062 (81.989)	lr 0.01088
Train [65][3100/3239]	Time 0.353 (0.828)	Data Time 0.001 (0.313)	Loss 2.6352 (2.6107)	Entropy 0.62024 (0.61991)	Top-1 acc 59.375 (61.024)	Top-5 acc 80.078 (81.986)	lr 0.01088
Train [65][3110/3239]	Time 0.241 (0.826)	Data Time 0.001 (0.312)	Loss 2.5900 (2.6107)	Entropy 0.62016 (0.61991)	Top-1 acc 60.938 (61.024)	Top-5 acc 80.859 (81.988)	lr 0.01088
Train [65][3120/3239]	Time 0.232 (0.827)	Data Time 0.001 (0.314)	Loss 2.4001 (2.6108)	Entropy 0.62007 (0.61992)	Top-1 acc 66.797 (61.018)	Top-5 acc 86.328 (81.988)	lr 0.01088
Train [65][3130/3239]	Time 0.254 (0.833)	Data Time 0.002 (0.320)	Loss 2.7092 (2.6109)	Entropy 0.62024 (0.61992)	Top-1 acc 58.594 (61.017)	Top-5 acc 81.641 (81.984)	lr 0.01088
Train [65][3140/3239]	Time 0.244 (0.832)	Data Time 0.001 (0.318)	Loss 2.5626 (2.6108)	Entropy 0.62010 (0.61992)	Top-1 acc 64.062 (61.024)	Top-5 acc 82.422 (81.987)	lr 0.01088
Train [65][3150/3239]	Time 0.227 (0.830)	Data Time 0.001 (0.318)	Loss 2.6260 (2.6107)	Entropy 0.62020 (0.61992)	Top-1 acc 62.109 (61.026)	Top-5 acc 81.250 (81.987)	lr 0.01088
Train [65][3160/3239]	Time 0.237 (0.837)	Data Time 0.001 (0.324)	Loss 2.6963 (2.6107)	Entropy 0.61983 (0.61992)	Top-1 acc 58.984 (61.025)	Top-5 acc 80.469 (81.988)	lr 0.01088
Train [65][3170/3239]	Time 0.340 (0.836)	Data Time 0.001 (0.323)	Loss 2.5772 (2.6106)	Entropy 0.61991 (0.61992)	Top-1 acc 58.984 (61.027)	Top-5 acc 82.422 (81.989)	lr 0.01088
Train [65][3180/3239]	Time 0.243 (0.835)	Data Time 0.000 (0.323)	Loss 2.6747 (2.6105)	Entropy 0.62001 (0.61992)	Top-1 acc 59.766 (61.027)	Top-5 acc 78.516 (81.990)	lr 0.01087
Train [65][3190/3239]	Time 0.238 (0.841)	Data Time 0.000 (0.329)	Loss 2.5770 (2.6105)	Entropy 0.62023 (0.61992)	Top-1 acc 58.984 (61.026)	Top-5 acc 82.031 (81.991)	lr 0.01087
Train [65][3200/3239]	Time 0.253 (0.839)	Data Time 0.000 (0.328)	Loss 2.5846 (2.6106)	Entropy 0.62057 (0.61992)	Top-1 acc 64.062 (61.025)	Top-5 acc 81.641 (81.989)	lr 0.01087
Train [65][3210/3239]	Time 0.241 (0.839)	Data Time 0.000 (0.328)	Loss 2.6282 (2.6106)	Entropy 0.62056 (0.61992)	Top-1 acc 60.547 (61.023)	Top-5 acc 81.250 (81.988)	lr 0.01087
Train [65][3220/3239]	Time 0.230 (0.844)	Data Time 0.000 (0.333)	Loss 2.3181 (2.6104)	Entropy 0.62050 (0.61992)	Top-1 acc 64.453 (61.024)	Top-5 acc 87.500 (81.991)	lr 0.01087
Train [65][3230/3239]	Time 0.227 (0.842)	Data Time 0.000 (0.332)	Loss 2.7223 (2.6103)	Entropy 0.62066 (0.61993)	Top-1 acc 57.812 (61.026)	Top-5 acc 76.953 (81.993)	lr 0.01087
Train [65][3239/3239]	Time 0.915 (0.841)	Data Time 0.000 (0.331)	Loss 2.4976 (2.6102)	Entropy 0.62070 (0.61993)	Top-1 acc 64.198 (61.029)	Top-5 acc 85.185 (81.995)	lr 0.01087
==========Valid [65/120]	loss 1.357	top-1 acc 68.549 (68.549)	top-5 acc 87.929	Train top-1 61.029	top-5 81.995	Entropy 0.62070	Latency-None: 0.000ms	Flops: 538.40M
Train [66][0/3239]	Time 42.041 (42.041)	Data Time 40.217 (40.217)	Loss 2.4625 (2.4625)	Entropy 0.62092 (0.62092)	Top-1 acc 65.625 (65.625)	Top-5 acc 84.766 (84.766)	lr 0.01087
Train [66][10/3239]	Time 0.235 (4.228)	Data Time 0.001 (3.668)	Loss 2.7392 (2.5936)	Entropy 0.62080 (0.62092)	Top-1 acc 62.109 (62.749)	Top-5 acc 81.250 (82.457)	lr 0.01087
Train [66][20/3239]	Time 0.253 (2.413)	Data Time 0.002 (1.922)	Loss 2.6647 (2.5952)	Entropy 0.62057 (0.62085)	Top-1 acc 58.594 (61.998)	Top-5 acc 79.297 (82.385)	lr 0.01087
Train [66][30/3239]	Time 0.309 (1.805)	Data Time 0.001 (1.303)	Loss 2.4966 (2.6228)	Entropy 0.62026 (0.62071)	Top-1 acc 64.062 (61.139)	Top-5 acc 85.547 (82.145)	lr 0.01087
Train [66][40/3239]	Time 0.245 (1.471)	Data Time 0.001 (0.985)	Loss 2.6696 (2.6192)	Entropy 0.62038 (0.62062)	Top-1 acc 60.547 (60.966)	Top-5 acc 81.250 (82.050)	lr 0.01086
Train [66][50/3239]	Time 0.238 (1.285)	Data Time 0.001 (0.793)	Loss 2.6568 (2.6190)	Entropy 0.62048 (0.62060)	Top-1 acc 60.547 (61.106)	Top-5 acc 82.422 (81.878)	lr 0.01086
Train [66][60/3239]	Time 0.241 (1.144)	Data Time 0.001 (0.663)	Loss 2.6958 (2.6146)	Entropy 0.62018 (0.62056)	Top-1 acc 53.516 (61.162)	Top-5 acc 85.156 (81.929)	lr 0.01086
Train [66][70/3239]	Time 0.503 (1.052)	Data Time 0.002 (0.570)	Loss 2.7332 (2.6090)	Entropy 0.62025 (0.62051)	Top-1 acc 56.250 (61.251)	Top-5 acc 79.297 (82.026)	lr 0.01086
Train [66][80/3239]	Time 0.260 (0.977)	Data Time 0.002 (0.500)	Loss 2.5259 (2.6033)	Entropy 0.62042 (0.62048)	Top-1 acc 65.625 (61.478)	Top-5 acc 84.375 (82.108)	lr 0.01086
Train [66][90/3239]	Time 0.261 (0.915)	Data Time 0.002 (0.445)	Loss 2.5172 (2.6030)	Entropy 0.62057 (0.62048)	Top-1 acc 62.109 (61.461)	Top-5 acc 83.594 (82.044)	lr 0.01086
Train [66][100/3239]	Time 0.255 (0.869)	Data Time 0.001 (0.401)	Loss 2.4896 (2.5956)	Entropy 0.62061 (0.62049)	Top-1 acc 63.672 (61.634)	Top-5 acc 83.984 (82.186)	lr 0.01086
Train [66][110/3239]	Time 0.246 (0.830)	Data Time 0.001 (0.365)	Loss 2.8433 (2.6036)	Entropy 0.62057 (0.62049)	Top-1 acc 57.812 (61.532)	Top-5 acc 76.172 (82.021)	lr 0.01086
Train [66][120/3239]	Time 0.273 (0.799)	Data Time 0.003 (0.335)	Loss 2.4727 (2.5979)	Entropy 0.62054 (0.62050)	Top-1 acc 60.938 (61.693)	Top-5 acc 84.375 (82.125)	lr 0.01086
Train [66][130/3239]	Time 0.250 (0.775)	Data Time 0.002 (0.310)	Loss 2.6278 (2.5964)	Entropy 0.62065 (0.62051)	Top-1 acc 59.766 (61.668)	Top-5 acc 82.812 (82.165)	lr 0.01086
Train [66][140/3239]	Time 0.247 (0.753)	Data Time 0.001 (0.288)	Loss 2.5892 (2.5950)	Entropy 0.62032 (0.62050)	Top-1 acc 64.062 (61.672)	Top-5 acc 81.250 (82.142)	lr 0.01085
Train [66][150/3239]	Time 0.226 (0.731)	Data Time 0.001 (0.269)	Loss 2.6960 (2.5973)	Entropy 0.62028 (0.62049)	Top-1 acc 61.719 (61.644)	Top-5 acc 78.906 (82.083)	lr 0.01085
Train [66][160/3239]	Time 0.354 (0.713)	Data Time 0.001 (0.252)	Loss 2.5901 (2.5954)	Entropy 0.61997 (0.62047)	Top-1 acc 65.234 (61.694)	Top-5 acc 84.375 (82.116)	lr 0.01085
Train [66][170/3239]	Time 0.232 (0.698)	Data Time 0.001 (0.238)	Loss 2.7085 (2.5927)	Entropy 0.61988 (0.62044)	Top-1 acc 62.891 (61.762)	Top-5 acc 78.516 (82.187)	lr 0.01085
Train [66][180/3239]	Time 0.262 (0.684)	Data Time 0.002 (0.224)	Loss 2.4551 (2.5922)	Entropy 0.61972 (0.62041)	Top-1 acc 65.234 (61.768)	Top-5 acc 84.375 (82.187)	lr 0.01085
Train [66][190/3239]	Time 0.232 (0.670)	Data Time 0.001 (0.213)	Loss 2.5113 (2.5954)	Entropy 0.61983 (0.62038)	Top-1 acc 62.500 (61.678)	Top-5 acc 84.375 (82.138)	lr 0.01085
Train [66][200/3239]	Time 0.235 (0.657)	Data Time 0.001 (0.202)	Loss 2.6712 (2.5944)	Entropy 0.61974 (0.62035)	Top-1 acc 59.766 (61.645)	Top-5 acc 80.859 (82.134)	lr 0.01085
Train [66][210/3239]	Time 0.260 (0.647)	Data Time 0.001 (0.193)	Loss 2.5306 (2.5936)	Entropy 0.62006 (0.62032)	Top-1 acc 58.984 (61.639)	Top-5 acc 85.547 (82.174)	lr 0.01085
Train [66][220/3239]	Time 0.268 (0.637)	Data Time 0.001 (0.184)	Loss 2.4925 (2.5941)	Entropy 0.61973 (0.62031)	Top-1 acc 61.719 (61.627)	Top-5 acc 85.938 (82.194)	lr 0.01085
Train [66][230/3239]	Time 0.335 (0.628)	Data Time 0.001 (0.176)	Loss 2.5924 (2.5930)	Entropy 0.61938 (0.62027)	Top-1 acc 62.500 (61.633)	Top-5 acc 81.641 (82.185)	lr 0.01085
Train [66][240/3239]	Time 0.248 (0.620)	Data Time 0.001 (0.169)	Loss 2.6765 (2.5954)	Entropy 0.61931 (0.62023)	Top-1 acc 59.766 (61.578)	Top-5 acc 83.203 (82.143)	lr 0.01084
Train [66][250/3239]	Time 0.233 (0.613)	Data Time 0.001 (0.162)	Loss 2.6023 (2.5949)	Entropy 0.61939 (0.62020)	Top-1 acc 64.453 (61.576)	Top-5 acc 81.250 (82.153)	lr 0.01084
Train [66][260/3239]	Time 0.266 (0.607)	Data Time 0.001 (0.156)	Loss 2.4875 (2.5950)	Entropy 0.61932 (0.62017)	Top-1 acc 62.109 (61.545)	Top-5 acc 84.375 (82.157)	lr 0.01084
Train [66][270/3239]	Time 0.284 (0.600)	Data Time 0.003 (0.150)	Loss 2.4588 (2.5956)	Entropy 0.61951 (0.62014)	Top-1 acc 60.938 (61.521)	Top-5 acc 87.500 (82.154)	lr 0.01084
Train [66][280/3239]	Time 0.360 (0.738)	Data Time 0.006 (0.145)	Loss 2.7214 (2.5984)	Entropy 0.61944 (0.62011)	Top-1 acc 58.984 (61.442)	Top-5 acc 82.422 (82.098)	lr 0.01084
Train [66][290/3239]	Time 0.245 (0.730)	Data Time 0.002 (0.140)	Loss 2.7545 (2.5973)	Entropy 0.61928 (0.62009)	Top-1 acc 60.547 (61.473)	Top-5 acc 79.688 (82.120)	lr 0.01084
Train [66][300/3239]	Time 0.245 (0.720)	Data Time 0.003 (0.136)	Loss 2.6183 (2.5969)	Entropy 0.61914 (0.62006)	Top-1 acc 59.766 (61.493)	Top-5 acc 82.812 (82.119)	lr 0.01084
Train [66][310/3239]	Time 0.254 (0.711)	Data Time 0.001 (0.131)	Loss 2.4699 (2.5961)	Entropy 0.61899 (0.62003)	Top-1 acc 64.062 (61.506)	Top-5 acc 82.422 (82.143)	lr 0.01084
Train [66][320/3239]	Time 0.369 (0.703)	Data Time 0.002 (0.127)	Loss 2.5630 (2.5954)	Entropy 0.61879 (0.61999)	Top-1 acc 63.281 (61.506)	Top-5 acc 79.688 (82.147)	lr 0.01084
Train [66][330/3239]	Time 0.281 (0.695)	Data Time 0.002 (0.124)	Loss 2.5639 (2.5941)	Entropy 0.61885 (0.61996)	Top-1 acc 62.891 (61.549)	Top-5 acc 84.375 (82.192)	lr 0.01084
Train [66][340/3239]	Time 0.247 (0.688)	Data Time 0.001 (0.120)	Loss 2.4953 (2.5945)	Entropy 0.61871 (0.61992)	Top-1 acc 62.109 (61.543)	Top-5 acc 83.984 (82.176)	lr 0.01083
Train [66][350/3239]	Time 0.244 (0.681)	Data Time 0.001 (0.117)	Loss 2.6285 (2.5937)	Entropy 0.61864 (0.61989)	Top-1 acc 58.984 (61.565)	Top-5 acc 80.469 (82.190)	lr 0.01083
Train [66][360/3239]	Time 0.274 (0.675)	Data Time 0.001 (0.113)	Loss 2.8522 (2.5944)	Entropy 0.61851 (0.61985)	Top-1 acc 56.250 (61.553)	Top-5 acc 77.344 (82.192)	lr 0.01083
Train [66][370/3239]	Time 0.354 (0.669)	Data Time 0.001 (0.110)	Loss 2.6555 (2.5949)	Entropy 0.61869 (0.61982)	Top-1 acc 55.078 (61.528)	Top-5 acc 82.812 (82.193)	lr 0.01083
Train [66][380/3239]	Time 0.259 (0.663)	Data Time 0.001 (0.108)	Loss 2.6081 (2.5952)	Entropy 0.61866 (0.61979)	Top-1 acc 61.719 (61.501)	Top-5 acc 83.594 (82.195)	lr 0.01083
Train [66][390/3239]	Time 0.405 (0.659)	Data Time 0.001 (0.105)	Loss 2.4485 (2.5966)	Entropy 0.61847 (0.61976)	Top-1 acc 61.719 (61.442)	Top-5 acc 85.156 (82.172)	lr 0.01083
Train [66][400/3239]	Time 0.316 (0.653)	Data Time 0.002 (0.102)	Loss 2.6189 (2.5966)	Entropy 0.61864 (0.61972)	Top-1 acc 60.938 (61.424)	Top-5 acc 80.469 (82.180)	lr 0.01083
Train [66][410/3239]	Time 0.264 (0.649)	Data Time 0.002 (0.100)	Loss 2.4657 (2.5959)	Entropy 0.61894 (0.61970)	Top-1 acc 64.844 (61.448)	Top-5 acc 82.812 (82.188)	lr 0.01083
Train [66][420/3239]	Time 0.264 (0.644)	Data Time 0.001 (0.098)	Loss 2.6361 (2.5954)	Entropy 0.61881 (0.61968)	Top-1 acc 59.375 (61.458)	Top-5 acc 80.469 (82.186)	lr 0.01083
Train [66][430/3239]	Time 0.263 (0.640)	Data Time 0.001 (0.095)	Loss 2.7750 (2.5943)	Entropy 0.61916 (0.61966)	Top-1 acc 56.641 (61.461)	Top-5 acc 77.734 (82.212)	lr 0.01083
Train [66][440/3239]	Time 0.245 (0.636)	Data Time 0.001 (0.093)	Loss 2.4689 (2.5947)	Entropy 0.61887 (0.61965)	Top-1 acc 63.281 (61.443)	Top-5 acc 82.422 (82.201)	lr 0.01082
Train [66][450/3239]	Time 0.252 (0.632)	Data Time 0.001 (0.091)	Loss 2.5908 (2.5950)	Entropy 0.61842 (0.61963)	Top-1 acc 62.500 (61.427)	Top-5 acc 78.516 (82.198)	lr 0.01082
Train [66][460/3239]	Time 0.289 (0.628)	Data Time 0.001 (0.089)	Loss 2.7180 (2.5966)	Entropy 0.61833 (0.61960)	Top-1 acc 55.469 (61.385)	Top-5 acc 80.859 (82.182)	lr 0.01082
Train [66][470/3239]	Time 0.253 (0.624)	Data Time 0.001 (0.087)	Loss 2.5995 (2.5974)	Entropy 0.61822 (0.61957)	Top-1 acc 63.672 (61.360)	Top-5 acc 83.594 (82.174)	lr 0.01082
Train [66][480/3239]	Time 0.369 (0.621)	Data Time 0.001 (0.086)	Loss 2.4658 (2.5974)	Entropy 0.61827 (0.61955)	Top-1 acc 64.453 (61.371)	Top-5 acc 85.156 (82.178)	lr 0.01082
Train [66][490/3239]	Time 0.260 (0.618)	Data Time 0.001 (0.084)	Loss 2.6659 (2.5969)	Entropy 0.61853 (0.61952)	Top-1 acc 59.375 (61.385)	Top-5 acc 80.859 (82.196)	lr 0.01082
Train [66][500/3239]	Time 0.254 (0.614)	Data Time 0.001 (0.082)	Loss 2.6416 (2.5967)	Entropy 0.61830 (0.61950)	Top-1 acc 56.250 (61.372)	Top-5 acc 82.422 (82.199)	lr 0.01082
Train [66][510/3239]	Time 0.253 (0.611)	Data Time 0.001 (0.081)	Loss 2.5572 (2.5964)	Entropy 0.61816 (0.61948)	Top-1 acc 58.594 (61.373)	Top-5 acc 83.203 (82.207)	lr 0.01082
Train [66][520/3239]	Time 0.233 (0.608)	Data Time 0.001 (0.079)	Loss 2.3994 (2.5966)	Entropy 0.61790 (0.61945)	Top-1 acc 66.016 (61.369)	Top-5 acc 84.375 (82.201)	lr 0.01082
Train [66][530/3239]	Time 0.264 (0.605)	Data Time 0.002 (0.078)	Loss 2.6944 (2.5961)	Entropy 0.61803 (0.61942)	Top-1 acc 62.500 (61.394)	Top-5 acc 78.516 (82.223)	lr 0.01082
Train [66][540/3239]	Time 0.278 (0.602)	Data Time 0.001 (0.076)	Loss 2.6012 (2.5955)	Entropy 0.61819 (0.61940)	Top-1 acc 60.156 (61.397)	Top-5 acc 80.469 (82.235)	lr 0.01081
Train [66][550/3239]	Time 0.351 (0.600)	Data Time 0.001 (0.075)	Loss 2.6013 (2.5954)	Entropy 0.61830 (0.61937)	Top-1 acc 63.281 (61.409)	Top-5 acc 83.203 (82.244)	lr 0.01081
Train [66][560/3239]	Time 0.243 (0.597)	Data Time 0.001 (0.074)	Loss 2.6363 (2.5944)	Entropy 0.61825 (0.61935)	Top-1 acc 59.766 (61.414)	Top-5 acc 82.422 (82.266)	lr 0.01081
Train [66][570/3239]	Time 0.282 (0.594)	Data Time 0.001 (0.072)	Loss 2.5655 (2.5954)	Entropy 0.61823 (0.61933)	Top-1 acc 63.281 (61.399)	Top-5 acc 80.859 (82.239)	lr 0.01081
Train [66][580/3239]	Time 0.263 (0.593)	Data Time 0.002 (0.071)	Loss 2.8357 (2.5966)	Entropy 0.61830 (0.61932)	Top-1 acc 56.250 (61.376)	Top-5 acc 78.906 (82.224)	lr 0.01081
Train [66][590/3239]	Time 0.258 (0.591)	Data Time 0.001 (0.070)	Loss 2.4311 (2.5968)	Entropy 0.61819 (0.61930)	Top-1 acc 65.234 (61.379)	Top-5 acc 85.547 (82.219)	lr 0.01081
Train [66][600/3239]	Time 0.289 (0.589)	Data Time 0.002 (0.069)	Loss 2.6473 (2.5963)	Entropy 0.61845 (0.61928)	Top-1 acc 63.281 (61.402)	Top-5 acc 81.641 (82.224)	lr 0.01081
Train [66][610/3239]	Time 0.236 (0.586)	Data Time 0.001 (0.068)	Loss 2.6067 (2.5960)	Entropy 0.61855 (0.61927)	Top-1 acc 60.547 (61.404)	Top-5 acc 83.594 (82.233)	lr 0.01081
Train [66][620/3239]	Time 0.248 (0.588)	Data Time 0.001 (0.070)	Loss 2.5776 (2.5954)	Entropy 0.61890 (0.61926)	Top-1 acc 61.719 (61.426)	Top-5 acc 82.422 (82.234)	lr 0.01081
Train [66][630/3239]	Time 0.248 (0.585)	Data Time 0.001 (0.069)	Loss 2.5931 (2.5956)	Entropy 0.61930 (0.61926)	Top-1 acc 61.719 (61.401)	Top-5 acc 85.156 (82.241)	lr 0.01081
Train [66][640/3239]	Time 0.245 (0.586)	Data Time 0.001 (0.071)	Loss 2.5288 (2.5956)	Entropy 0.61916 (0.61926)	Top-1 acc 66.797 (61.397)	Top-5 acc 83.594 (82.243)	lr 0.01080
Train [66][650/3239]	Time 0.263 (0.588)	Data Time 0.001 (0.074)	Loss 2.4960 (2.5949)	Entropy 0.61950 (0.61926)	Top-1 acc 66.016 (61.418)	Top-5 acc 83.203 (82.266)	lr 0.01080
Train [66][660/3239]	Time 0.286 (0.585)	Data Time 0.001 (0.073)	Loss 2.5323 (2.5945)	Entropy 0.61996 (0.61927)	Top-1 acc 62.109 (61.429)	Top-5 acc 83.984 (82.263)	lr 0.01080
Train [66][670/3239]	Time 0.320 (0.589)	Data Time 0.001 (0.077)	Loss 2.5089 (2.5941)	Entropy 0.62008 (0.61928)	Top-1 acc 66.016 (61.431)	Top-5 acc 83.203 (82.279)	lr 0.01080
Train [66][680/3239]	Time 0.272 (0.587)	Data Time 0.002 (0.076)	Loss 2.5669 (2.5940)	Entropy 0.62039 (0.61929)	Top-1 acc 64.453 (61.424)	Top-5 acc 81.250 (82.268)	lr 0.01080
Train [66][690/3239]	Time 0.253 (0.589)	Data Time 0.001 (0.079)	Loss 2.6935 (2.5943)	Entropy 0.62061 (0.61931)	Top-1 acc 62.891 (61.435)	Top-5 acc 77.734 (82.248)	lr 0.01080
Train [66][700/3239]	Time 0.297 (0.589)	Data Time 0.025 (0.080)	Loss 2.7099 (2.5941)	Entropy 0.62012 (0.61932)	Top-1 acc 57.812 (61.431)	Top-5 acc 82.031 (82.243)	lr 0.01080
Train [66][710/3239]	Time 2.712 (0.591)	Data Time 2.343 (0.082)	Loss 2.3374 (2.5941)	Entropy 0.62040 (0.61933)	Top-1 acc 63.281 (61.427)	Top-5 acc 87.891 (82.242)	lr 0.01080
Train [66][720/3239]	Time 4.700 (0.595)	Data Time 4.443 (0.087)	Loss 2.5992 (2.5952)	Entropy 0.62028 (0.61935)	Top-1 acc 61.719 (61.403)	Top-5 acc 85.156 (82.233)	lr 0.01080
Train [66][730/3239]	Time 0.286 (0.593)	Data Time 0.002 (0.086)	Loss 2.5283 (2.5959)	Entropy 0.61976 (0.61936)	Top-1 acc 63.672 (61.407)	Top-5 acc 84.375 (82.223)	lr 0.01080
Train [66][740/3239]	Time 0.238 (0.591)	Data Time 0.001 (0.085)	Loss 2.5375 (2.5958)	Entropy 0.61945 (0.61936)	Top-1 acc 62.109 (61.420)	Top-5 acc 85.547 (82.231)	lr 0.01079
Train [66][750/3239]	Time 0.261 (0.594)	Data Time 0.001 (0.089)	Loss 2.5662 (2.5953)	Entropy 0.61949 (0.61937)	Top-1 acc 60.156 (61.423)	Top-5 acc 83.203 (82.239)	lr 0.01079
Train [66][760/3239]	Time 0.295 (0.603)	Data Time 0.002 (0.098)	Loss 2.6031 (2.5956)	Entropy 0.61921 (0.61937)	Top-1 acc 60.547 (61.406)	Top-5 acc 79.688 (82.227)	lr 0.01079
Train [66][770/3239]	Time 0.261 (0.600)	Data Time 0.002 (0.097)	Loss 2.5464 (2.5957)	Entropy 0.61903 (0.61936)	Top-1 acc 62.500 (61.404)	Top-5 acc 83.594 (82.219)	lr 0.01079
Train [66][780/3239]	Time 0.338 (0.598)	Data Time 0.001 (0.096)	Loss 2.5879 (2.5961)	Entropy 0.61921 (0.61936)	Top-1 acc 60.156 (61.389)	Top-5 acc 83.984 (82.212)	lr 0.01079
Train [66][790/3239]	Time 0.284 (0.606)	Data Time 0.001 (0.104)	Loss 2.5671 (2.5958)	Entropy 0.61926 (0.61936)	Top-1 acc 64.453 (61.389)	Top-5 acc 83.203 (82.227)	lr 0.01079
Train [66][800/3239]	Time 0.287 (0.604)	Data Time 0.002 (0.103)	Loss 2.5962 (2.5950)	Entropy 0.61978 (0.61936)	Top-1 acc 60.938 (61.412)	Top-5 acc 82.031 (82.246)	lr 0.01079
Train [66][810/3239]	Time 0.250 (0.602)	Data Time 0.001 (0.102)	Loss 2.5948 (2.5955)	Entropy 0.61985 (0.61936)	Top-1 acc 60.156 (61.401)	Top-5 acc 82.422 (82.240)	lr 0.01079
Train [66][820/3239]	Time 0.235 (0.608)	Data Time 0.001 (0.108)	Loss 2.4660 (2.5958)	Entropy 0.61988 (0.61937)	Top-1 acc 64.453 (61.401)	Top-5 acc 84.766 (82.225)	lr 0.01079
Train [66][830/3239]	Time 0.230 (0.609)	Data Time 0.001 (0.110)	Loss 2.6645 (2.5957)	Entropy 0.61975 (0.61938)	Top-1 acc 58.203 (61.401)	Top-5 acc 82.031 (82.228)	lr 0.01079
Train [66][840/3239]	Time 0.233 (0.607)	Data Time 0.003 (0.110)	Loss 2.5726 (2.5953)	Entropy 0.61988 (0.61938)	Top-1 acc 60.156 (61.410)	Top-5 acc 80.859 (82.231)	lr 0.01078
Train [66][850/3239]	Time 0.240 (0.615)	Data Time 0.001 (0.118)	Loss 2.6931 (2.5953)	Entropy 0.61982 (0.61939)	Top-1 acc 62.500 (61.422)	Top-5 acc 79.688 (82.233)	lr 0.01078
Train [66][860/3239]	Time 0.231 (0.613)	Data Time 0.001 (0.117)	Loss 2.5063 (2.5952)	Entropy 0.61981 (0.61939)	Top-1 acc 61.719 (61.415)	Top-5 acc 84.375 (82.240)	lr 0.01078
Train [66][870/3239]	Time 3.033 (0.614)	Data Time 2.685 (0.119)	Loss 2.4787 (2.5948)	Entropy 0.61983 (0.61940)	Top-1 acc 64.844 (61.426)	Top-5 acc 87.109 (82.243)	lr 0.01078
Train [66][880/3239]	Time 9.996 (0.626)	Data Time 9.728 (0.131)	Loss 2.7471 (2.5946)	Entropy 0.61961 (0.61940)	Top-1 acc 52.344 (61.424)	Top-5 acc 79.297 (82.248)	lr 0.01078
Train [66][890/3239]	Time 0.237 (0.624)	Data Time 0.001 (0.130)	Loss 2.6335 (2.5950)	Entropy 0.61937 (0.61940)	Top-1 acc 58.594 (61.417)	Top-5 acc 81.641 (82.240)	lr 0.01078
Train [66][900/3239]	Time 0.265 (0.622)	Data Time 0.001 (0.129)	Loss 2.4604 (2.5947)	Entropy 0.61965 (0.61941)	Top-1 acc 62.109 (61.424)	Top-5 acc 83.984 (82.239)	lr 0.01078
Train [66][910/3239]	Time 0.234 (0.621)	Data Time 0.001 (0.129)	Loss 2.7217 (2.5943)	Entropy 0.62015 (0.61941)	Top-1 acc 58.594 (61.426)	Top-5 acc 78.906 (82.241)	lr 0.01078
Train [66][920/3239]	Time 0.241 (0.628)	Data Time 0.001 (0.136)	Loss 2.5435 (2.5944)	Entropy 0.62016 (0.61942)	Top-1 acc 64.844 (61.434)	Top-5 acc 81.250 (82.236)	lr 0.01078
Train [66][930/3239]	Time 0.255 (0.626)	Data Time 0.001 (0.135)	Loss 2.6667 (2.5947)	Entropy 0.62006 (0.61943)	Top-1 acc 58.984 (61.429)	Top-5 acc 82.031 (82.224)	lr 0.01078
Train [66][940/3239]	Time 0.402 (0.671)	Data Time 0.003 (0.136)	Loss 2.6782 (2.5948)	Entropy 0.62029 (0.61943)	Top-1 acc 55.859 (61.425)	Top-5 acc 82.031 (82.217)	lr 0.01077
Train [66][950/3239]	Time 0.237 (0.668)	Data Time 0.002 (0.135)	Loss 2.5942 (2.5949)	Entropy 0.62040 (0.61944)	Top-1 acc 57.812 (61.421)	Top-5 acc 82.422 (82.215)	lr 0.01077
Train [66][960/3239]	Time 0.253 (0.665)	Data Time 0.001 (0.134)	Loss 2.5089 (2.5948)	Entropy 0.62030 (0.61945)	Top-1 acc 65.625 (61.432)	Top-5 acc 83.594 (82.210)	lr 0.01077
Train [66][970/3239]	Time 0.248 (0.663)	Data Time 0.001 (0.132)	Loss 2.6939 (2.5944)	Entropy 0.61998 (0.61946)	Top-1 acc 58.203 (61.444)	Top-5 acc 80.469 (82.215)	lr 0.01077
Train [66][980/3239]	Time 0.251 (0.661)	Data Time 0.001 (0.131)	Loss 2.5641 (2.5940)	Entropy 0.62007 (0.61947)	Top-1 acc 60.156 (61.454)	Top-5 acc 84.375 (82.223)	lr 0.01077
Train [66][990/3239]	Time 0.246 (0.658)	Data Time 0.001 (0.130)	Loss 2.6046 (2.5936)	Entropy 0.62009 (0.61947)	Top-1 acc 60.156 (61.458)	Top-5 acc 82.812 (82.232)	lr 0.01077
Train [66][1000/3239]	Time 0.242 (0.656)	Data Time 0.001 (0.128)	Loss 2.6018 (2.5940)	Entropy 0.62036 (0.61948)	Top-1 acc 60.938 (61.452)	Top-5 acc 85.547 (82.226)	lr 0.01077
Train [66][1010/3239]	Time 0.224 (0.654)	Data Time 0.001 (0.127)	Loss 2.5683 (2.5939)	Entropy 0.62055 (0.61949)	Top-1 acc 64.453 (61.448)	Top-5 acc 84.375 (82.233)	lr 0.01077
Train [66][1020/3239]	Time 0.237 (0.653)	Data Time 0.001 (0.126)	Loss 2.3901 (2.5930)	Entropy 0.62038 (0.61950)	Top-1 acc 68.750 (61.461)	Top-5 acc 88.281 (82.249)	lr 0.01077
Train [66][1030/3239]	Time 0.355 (0.652)	Data Time 0.001 (0.127)	Loss 2.4230 (2.5930)	Entropy 0.62016 (0.61951)	Top-1 acc 66.797 (61.471)	Top-5 acc 86.719 (82.243)	lr 0.01077
Train [66][1040/3239]	Time 0.296 (0.660)	Data Time 0.001 (0.136)	Loss 2.8354 (2.5933)	Entropy 0.62024 (0.61951)	Top-1 acc 57.812 (61.466)	Top-5 acc 76.562 (82.238)	lr 0.01076
Train [66][1050/3239]	Time 0.247 (0.658)	Data Time 0.001 (0.135)	Loss 2.7029 (2.5933)	Entropy 0.62013 (0.61952)	Top-1 acc 59.766 (61.466)	Top-5 acc 81.641 (82.243)	lr 0.01076
Train [66][1060/3239]	Time 0.244 (0.656)	Data Time 0.001 (0.133)	Loss 2.6498 (2.5928)	Entropy 0.62039 (0.61953)	Top-1 acc 61.328 (61.474)	Top-5 acc 78.906 (82.253)	lr 0.01076
Train [66][1070/3239]	Time 4.318 (0.666)	Data Time 4.065 (0.144)	Loss 2.2964 (2.5925)	Entropy 0.62053 (0.61954)	Top-1 acc 67.188 (61.481)	Top-5 acc 87.891 (82.261)	lr 0.01076
Train [66][1080/3239]	Time 0.241 (0.664)	Data Time 0.001 (0.143)	Loss 2.5477 (2.5923)	Entropy 0.62049 (0.61954)	Top-1 acc 62.109 (61.485)	Top-5 acc 82.812 (82.261)	lr 0.01076
Train [66][1090/3239]	Time 0.236 (0.663)	Data Time 0.001 (0.143)	Loss 2.6706 (2.5927)	Entropy 0.62046 (0.61955)	Top-1 acc 62.109 (61.481)	Top-5 acc 80.078 (82.260)	lr 0.01076
Train [66][1100/3239]	Time 0.323 (0.668)	Data Time 0.001 (0.148)	Loss 2.5190 (2.5918)	Entropy 0.62055 (0.61956)	Top-1 acc 64.062 (61.492)	Top-5 acc 84.766 (82.279)	lr 0.01076
Train [66][1110/3239]	Time 0.255 (0.670)	Data Time 0.002 (0.151)	Loss 2.6872 (2.5918)	Entropy 0.62053 (0.61957)	Top-1 acc 58.984 (61.482)	Top-5 acc 79.688 (82.279)	lr 0.01076
Train [66][1120/3239]	Time 0.223 (0.669)	Data Time 0.001 (0.151)	Loss 2.8267 (2.5917)	Entropy 0.62074 (0.61958)	Top-1 acc 56.250 (61.480)	Top-5 acc 75.781 (82.278)	lr 0.01076
Train [66][1130/3239]	Time 0.259 (0.674)	Data Time 0.001 (0.157)	Loss 2.6697 (2.5919)	Entropy 0.62109 (0.61959)	Top-1 acc 60.938 (61.471)	Top-5 acc 80.859 (82.272)	lr 0.01076
Train [66][1140/3239]	Time 0.254 (0.673)	Data Time 0.001 (0.157)	Loss 2.8116 (2.5924)	Entropy 0.62097 (0.61960)	Top-1 acc 58.203 (61.451)	Top-5 acc 77.734 (82.265)	lr 0.01075
Train [66][1150/3239]	Time 0.240 (0.677)	Data Time 0.001 (0.161)	Loss 2.4713 (2.5925)	Entropy 0.62112 (0.61962)	Top-1 acc 66.797 (61.449)	Top-5 acc 85.547 (82.263)	lr 0.01075
Train [66][1160/3239]	Time 2.373 (0.677)	Data Time 2.148 (0.162)	Loss 2.8886 (2.5925)	Entropy 0.62095 (0.61963)	Top-1 acc 54.688 (61.446)	Top-5 acc 76.562 (82.267)	lr 0.01075
Train [66][1170/3239]	Time 0.239 (0.678)	Data Time 0.001 (0.164)	Loss 2.5409 (2.5925)	Entropy 0.62111 (0.61964)	Top-1 acc 63.672 (61.441)	Top-5 acc 81.641 (82.265)	lr 0.01075
Train [66][1180/3239]	Time 0.241 (0.684)	Data Time 0.001 (0.170)	Loss 2.7141 (2.5925)	Entropy 0.62135 (0.61965)	Top-1 acc 55.859 (61.432)	Top-5 acc 80.469 (82.268)	lr 0.01075
Train [66][1190/3239]	Time 0.275 (0.681)	Data Time 0.001 (0.169)	Loss 2.5767 (2.5928)	Entropy 0.62126 (0.61967)	Top-1 acc 61.719 (61.420)	Top-5 acc 82.031 (82.264)	lr 0.01075
Train [66][1200/3239]	Time 0.246 (0.686)	Data Time 0.001 (0.174)	Loss 2.6182 (2.5922)	Entropy 0.62152 (0.61968)	Top-1 acc 60.156 (61.436)	Top-5 acc 81.641 (82.273)	lr 0.01075
Train [66][1210/3239]	Time 0.231 (0.685)	Data Time 0.001 (0.174)	Loss 2.5001 (2.5924)	Entropy 0.62151 (0.61970)	Top-1 acc 62.891 (61.441)	Top-5 acc 81.250 (82.266)	lr 0.01075
Train [66][1220/3239]	Time 0.249 (0.688)	Data Time 0.001 (0.177)	Loss 2.3382 (2.5918)	Entropy 0.62152 (0.61971)	Top-1 acc 66.797 (61.453)	Top-5 acc 85.156 (82.278)	lr 0.01075
Train [66][1230/3239]	Time 0.323 (0.691)	Data Time 0.001 (0.181)	Loss 2.5170 (2.5917)	Entropy 0.62165 (0.61973)	Top-1 acc 60.938 (61.457)	Top-5 acc 83.594 (82.283)	lr 0.01075
Train [66][1240/3239]	Time 0.230 (0.691)	Data Time 0.001 (0.181)	Loss 2.7546 (2.5920)	Entropy 0.62160 (0.61974)	Top-1 acc 56.641 (61.446)	Top-5 acc 78.516 (82.275)	lr 0.01074
Train [66][1250/3239]	Time 0.256 (0.694)	Data Time 0.001 (0.186)	Loss 2.5857 (2.5925)	Entropy 0.62171 (0.61976)	Top-1 acc 60.156 (61.425)	Top-5 acc 82.422 (82.263)	lr 0.01074
Train [66][1260/3239]	Time 0.348 (0.699)	Data Time 0.001 (0.190)	Loss 2.5739 (2.5923)	Entropy 0.62146 (0.61977)	Top-1 acc 57.422 (61.423)	Top-5 acc 81.641 (82.270)	lr 0.01074
Train [66][1270/3239]	Time 0.254 (0.697)	Data Time 0.001 (0.189)	Loss 2.7923 (2.5926)	Entropy 0.62137 (0.61979)	Top-1 acc 56.641 (61.409)	Top-5 acc 79.688 (82.265)	lr 0.01074
Train [66][1280/3239]	Time 0.225 (0.701)	Data Time 0.001 (0.194)	Loss 2.6396 (2.5925)	Entropy 0.62170 (0.61980)	Top-1 acc 58.203 (61.406)	Top-5 acc 82.812 (82.265)	lr 0.01074
Train [66][1290/3239]	Time 4.102 (0.706)	Data Time 3.849 (0.199)	Loss 2.6577 (2.5928)	Entropy 0.62177 (0.61981)	Top-1 acc 62.109 (61.401)	Top-5 acc 81.250 (82.266)	lr 0.01074
Train [66][1300/3239]	Time 0.315 (0.705)	Data Time 0.001 (0.199)	Loss 2.4330 (2.5931)	Entropy 0.62181 (0.61983)	Top-1 acc 63.672 (61.380)	Top-5 acc 85.156 (82.265)	lr 0.01074
Train [66][1310/3239]	Time 0.253 (0.709)	Data Time 0.002 (0.204)	Loss 2.5340 (2.5936)	Entropy 0.62218 (0.61985)	Top-1 acc 61.328 (61.366)	Top-5 acc 82.031 (82.253)	lr 0.01074
Train [66][1320/3239]	Time 0.254 (0.711)	Data Time 0.001 (0.206)	Loss 2.4432 (2.5935)	Entropy 0.62214 (0.61986)	Top-1 acc 64.062 (61.370)	Top-5 acc 87.109 (82.252)	lr 0.01074
Train [66][1330/3239]	Time 0.340 (0.712)	Data Time 0.001 (0.208)	Loss 2.6014 (2.5931)	Entropy 0.62233 (0.61988)	Top-1 acc 58.594 (61.377)	Top-5 acc 85.547 (82.267)	lr 0.01074
Train [66][1340/3239]	Time 0.234 (0.718)	Data Time 0.001 (0.214)	Loss 2.7563 (2.5935)	Entropy 0.62225 (0.61990)	Top-1 acc 57.031 (61.376)	Top-5 acc 78.125 (82.256)	lr 0.01073
Train [66][1350/3239]	Time 0.243 (0.717)	Data Time 0.001 (0.214)	Loss 2.7869 (2.5937)	Entropy 0.62248 (0.61992)	Top-1 acc 55.469 (61.368)	Top-5 acc 79.688 (82.256)	lr 0.01073
Train [66][1360/3239]	Time 0.231 (0.721)	Data Time 0.001 (0.219)	Loss 2.7715 (2.5934)	Entropy 0.62237 (0.61993)	Top-1 acc 60.938 (61.380)	Top-5 acc 78.516 (82.263)	lr 0.01073
Train [66][1370/3239]	Time 0.256 (0.720)	Data Time 0.001 (0.219)	Loss 2.8458 (2.5937)	Entropy 0.62222 (0.61995)	Top-1 acc 55.469 (61.377)	Top-5 acc 77.344 (82.261)	lr 0.01073
Train [66][1380/3239]	Time 0.249 (0.721)	Data Time 0.001 (0.220)	Loss 2.5410 (2.5942)	Entropy 0.62242 (0.61997)	Top-1 acc 62.891 (61.360)	Top-5 acc 83.203 (82.258)	lr 0.01073
Train [66][1390/3239]	Time 0.221 (0.727)	Data Time 0.001 (0.227)	Loss 2.6348 (2.5942)	Entropy 0.62264 (0.61999)	Top-1 acc 58.984 (61.360)	Top-5 acc 81.250 (82.262)	lr 0.01073
Train [66][1400/3239]	Time 0.231 (0.727)	Data Time 0.001 (0.227)	Loss 2.5517 (2.5943)	Entropy 0.62285 (0.62001)	Top-1 acc 62.891 (61.359)	Top-5 acc 82.031 (82.261)	lr 0.01073
Train [66][1410/3239]	Time 0.246 (0.730)	Data Time 0.001 (0.231)	Loss 2.6877 (2.5943)	Entropy 0.62310 (0.62003)	Top-1 acc 62.109 (61.365)	Top-5 acc 79.297 (82.261)	lr 0.01073
Train [66][1420/3239]	Time 0.376 (0.734)	Data Time 0.001 (0.236)	Loss 2.4715 (2.5941)	Entropy 0.62343 (0.62005)	Top-1 acc 62.500 (61.373)	Top-5 acc 87.109 (82.265)	lr 0.01073
Train [66][1430/3239]	Time 0.236 (0.737)	Data Time 0.001 (0.239)	Loss 2.3441 (2.5937)	Entropy 0.62384 (0.62007)	Top-1 acc 66.406 (61.384)	Top-5 acc 86.328 (82.269)	lr 0.01073
Train [66][1440/3239]	Time 0.238 (0.739)	Data Time 0.001 (0.242)	Loss 2.7175 (2.5935)	Entropy 0.62368 (0.62010)	Top-1 acc 57.422 (61.388)	Top-5 acc 80.859 (82.274)	lr 0.01072
Train [66][1450/3239]	Time 4.547 (0.743)	Data Time 4.274 (0.246)	Loss 2.6415 (2.5936)	Entropy 0.62383 (0.62013)	Top-1 acc 62.891 (61.389)	Top-5 acc 81.641 (82.272)	lr 0.01072
Train [66][1460/3239]	Time 0.251 (0.743)	Data Time 0.001 (0.247)	Loss 2.5407 (2.5931)	Entropy 0.62392 (0.62015)	Top-1 acc 60.156 (61.395)	Top-5 acc 84.766 (82.281)	lr 0.01072
Train [66][1470/3239]	Time 0.277 (0.748)	Data Time 0.002 (0.252)	Loss 2.6885 (2.5930)	Entropy 0.62378 (0.62018)	Top-1 acc 57.812 (61.395)	Top-5 acc 81.641 (82.282)	lr 0.01072
Train [66][1480/3239]	Time 0.234 (0.746)	Data Time 0.001 (0.250)	Loss 2.5708 (2.5930)	Entropy 0.62382 (0.62020)	Top-1 acc 62.500 (61.400)	Top-5 acc 82.812 (82.285)	lr 0.01072
Train [66][1490/3239]	Time 0.356 (0.752)	Data Time 0.001 (0.257)	Loss 2.6085 (2.5931)	Entropy 0.62375 (0.62023)	Top-1 acc 62.109 (61.404)	Top-5 acc 82.812 (82.280)	lr 0.01072
Train [66][1500/3239]	Time 0.234 (0.759)	Data Time 0.001 (0.264)	Loss 2.6172 (2.5934)	Entropy 0.62392 (0.62025)	Top-1 acc 61.719 (61.395)	Top-5 acc 80.469 (82.267)	lr 0.01072
Train [66][1510/3239]	Time 0.250 (0.756)	Data Time 0.001 (0.263)	Loss 2.5268 (2.5937)	Entropy 0.62389 (0.62027)	Top-1 acc 63.672 (61.390)	Top-5 acc 83.594 (82.256)	lr 0.01072
Train [66][1520/3239]	Time 0.229 (0.760)	Data Time 0.001 (0.267)	Loss 2.6274 (2.5937)	Entropy 0.62372 (0.62030)	Top-1 acc 60.547 (61.387)	Top-5 acc 81.641 (82.257)	lr 0.01072
Train [66][1530/3239]	Time 0.235 (0.761)	Data Time 0.001 (0.269)	Loss 2.6105 (2.5933)	Entropy 0.62380 (0.62032)	Top-1 acc 61.328 (61.391)	Top-5 acc 81.641 (82.264)	lr 0.01072
Train [66][1540/3239]	Time 0.239 (0.763)	Data Time 0.001 (0.271)	Loss 2.7073 (2.5936)	Entropy 0.62420 (0.62034)	Top-1 acc 60.547 (61.388)	Top-5 acc 77.344 (82.260)	lr 0.01071
Train [66][1550/3239]	Time 0.242 (0.767)	Data Time 0.001 (0.275)	Loss 2.7477 (2.5941)	Entropy 0.62448 (0.62037)	Top-1 acc 54.688 (61.378)	Top-5 acc 78.906 (82.251)	lr 0.01071
Train [66][1560/3239]	Time 0.241 (0.766)	Data Time 0.002 (0.275)	Loss 2.4891 (2.5938)	Entropy 0.62451 (0.62040)	Top-1 acc 62.891 (61.388)	Top-5 acc 84.375 (82.256)	lr 0.01071
Train [66][1570/3239]	Time 0.239 (0.771)	Data Time 0.002 (0.280)	Loss 2.6579 (2.5938)	Entropy 0.62462 (0.62042)	Top-1 acc 53.516 (61.378)	Top-5 acc 82.422 (82.259)	lr 0.01071
Train [66][1580/3239]	Time 0.329 (0.775)	Data Time 0.001 (0.285)	Loss 2.7041 (2.5944)	Entropy 0.62451 (0.62045)	Top-1 acc 57.031 (61.363)	Top-5 acc 81.250 (82.250)	lr 0.01071
Train [66][1590/3239]	Time 0.459 (0.802)	Data Time 0.040 (0.285)	Loss 2.6504 (2.5942)	Entropy 0.62471 (0.62047)	Top-1 acc 60.547 (61.362)	Top-5 acc 81.250 (82.255)	lr 0.01071
Train [66][1600/3239]	Time 0.243 (0.800)	Data Time 0.002 (0.283)	Loss 2.6650 (2.5943)	Entropy 0.62493 (0.62050)	Top-1 acc 58.203 (61.363)	Top-5 acc 81.641 (82.250)	lr 0.01071
Train [66][1610/3239]	Time 0.254 (0.798)	Data Time 0.002 (0.282)	Loss 2.5678 (2.5942)	Entropy 0.62536 (0.62053)	Top-1 acc 64.062 (61.364)	Top-5 acc 82.812 (82.254)	lr 0.01071
Train [66][1620/3239]	Time 0.244 (0.796)	Data Time 0.001 (0.280)	Loss 2.4565 (2.5940)	Entropy 0.62530 (0.62056)	Top-1 acc 63.281 (61.372)	Top-5 acc 86.719 (82.258)	lr 0.01071
Train [66][1630/3239]	Time 0.230 (0.793)	Data Time 0.001 (0.278)	Loss 2.6632 (2.5938)	Entropy 0.62519 (0.62059)	Top-1 acc 58.594 (61.379)	Top-5 acc 81.250 (82.258)	lr 0.01071
Train [66][1640/3239]	Time 0.237 (0.791)	Data Time 0.001 (0.276)	Loss 2.6304 (2.5941)	Entropy 0.62533 (0.62062)	Top-1 acc 62.891 (61.376)	Top-5 acc 82.812 (82.255)	lr 0.01070
Train [66][1650/3239]	Time 0.375 (0.789)	Data Time 0.001 (0.275)	Loss 2.7299 (2.5942)	Entropy 0.62491 (0.62064)	Top-1 acc 59.375 (61.370)	Top-5 acc 81.250 (82.260)	lr 0.01070
Train [66][1660/3239]	Time 0.256 (0.793)	Data Time 0.001 (0.279)	Loss 2.4287 (2.5945)	Entropy 0.62507 (0.62067)	Top-1 acc 62.891 (61.363)	Top-5 acc 86.328 (82.253)	lr 0.01070
Train [66][1670/3239]	Time 0.236 (0.792)	Data Time 0.001 (0.279)	Loss 2.6949 (2.5946)	Entropy 0.62505 (0.62070)	Top-1 acc 60.156 (61.363)	Top-5 acc 78.906 (82.250)	lr 0.01070
Train [66][1680/3239]	Time 2.592 (0.795)	Data Time 2.328 (0.282)	Loss 2.5422 (2.5948)	Entropy 0.62545 (0.62072)	Top-1 acc 63.672 (61.358)	Top-5 acc 80.078 (82.241)	lr 0.01070
Train [66][1690/3239]	Time 0.234 (0.801)	Data Time 0.001 (0.289)	Loss 2.5640 (2.5950)	Entropy 0.62571 (0.62075)	Top-1 acc 59.766 (61.349)	Top-5 acc 81.250 (82.241)	lr 0.01070
Train [66][1700/3239]	Time 0.252 (0.802)	Data Time 0.001 (0.290)	Loss 2.6074 (2.5950)	Entropy 0.62599 (0.62078)	Top-1 acc 59.375 (61.354)	Top-5 acc 79.297 (82.243)	lr 0.01070
Train [66][1710/3239]	Time 0.231 (0.801)	Data Time 0.002 (0.290)	Loss 2.5647 (2.5949)	Entropy 0.62601 (0.62081)	Top-1 acc 60.938 (61.353)	Top-5 acc 84.375 (82.245)	lr 0.01070
Train [66][1720/3239]	Time 5.295 (0.809)	Data Time 5.030 (0.299)	Loss 2.9179 (2.5953)	Entropy 0.62578 (0.62084)	Top-1 acc 55.859 (61.342)	Top-5 acc 76.562 (82.233)	lr 0.01070
Train [66][1730/3239]	Time 0.254 (0.810)	Data Time 0.001 (0.300)	Loss 2.5559 (2.5953)	Entropy 0.62595 (0.62087)	Top-1 acc 57.812 (61.338)	Top-5 acc 83.203 (82.233)	lr 0.01070
Train [66][1740/3239]	Time 0.336 (0.809)	Data Time 0.001 (0.299)	Loss 2.6426 (2.5952)	Entropy 0.62586 (0.62090)	Top-1 acc 60.938 (61.341)	Top-5 acc 80.469 (82.233)	lr 0.01069
Train [66][1750/3239]	Time 6.662 (0.812)	Data Time 6.391 (0.302)	Loss 2.4931 (2.5952)	Entropy 0.62559 (0.62093)	Top-1 acc 62.500 (61.339)	Top-5 acc 83.594 (82.234)	lr 0.01069
Train [66][1760/3239]	Time 1.411 (0.816)	Data Time 1.153 (0.307)	Loss 2.6663 (2.5950)	Entropy 0.62574 (0.62096)	Top-1 acc 58.594 (61.347)	Top-5 acc 81.641 (82.240)	lr 0.01069
Train [66][1770/3239]	Time 6.431 (0.818)	Data Time 6.164 (0.309)	Loss 2.4537 (2.5951)	Entropy 0.62577 (0.62098)	Top-1 acc 65.234 (61.347)	Top-5 acc 84.375 (82.239)	lr 0.01069
Train [66][1780/3239]	Time 0.230 (0.816)	Data Time 0.001 (0.308)	Loss 2.4187 (2.5947)	Entropy 0.62605 (0.62101)	Top-1 acc 68.359 (61.358)	Top-5 acc 84.375 (82.246)	lr 0.01069
Train [66][1790/3239]	Time 0.246 (0.824)	Data Time 0.001 (0.316)	Loss 2.4868 (2.5949)	Entropy 0.62596 (0.62104)	Top-1 acc 64.453 (61.358)	Top-5 acc 82.812 (82.241)	lr 0.01069
Train [66][1800/3239]	Time 0.236 (0.823)	Data Time 0.001 (0.316)	Loss 2.7525 (2.5947)	Entropy 0.62601 (0.62107)	Top-1 acc 58.203 (61.364)	Top-5 acc 78.516 (82.246)	lr 0.01069
Train [66][1810/3239]	Time 0.322 (0.826)	Data Time 0.001 (0.319)	Loss 2.7164 (2.5944)	Entropy 0.62575 (0.62109)	Top-1 acc 60.156 (61.370)	Top-5 acc 79.297 (82.253)	lr 0.01069
Train [66][1820/3239]	Time 0.244 (0.833)	Data Time 0.001 (0.326)	Loss 2.4212 (2.5944)	Entropy 0.62574 (0.62112)	Top-1 acc 63.672 (61.371)	Top-5 acc 85.938 (82.253)	lr 0.01069
Train [66][1830/3239]	Time 0.269 (0.833)	Data Time 0.001 (0.328)	Loss 2.5441 (2.5946)	Entropy 0.62565 (0.62114)	Top-1 acc 63.281 (61.367)	Top-5 acc 82.422 (82.247)	lr 0.01069
Train [66][1840/3239]	Time 0.233 (0.833)	Data Time 0.001 (0.328)	Loss 2.6858 (2.5945)	Entropy 0.62542 (0.62117)	Top-1 acc 59.766 (61.371)	Top-5 acc 80.469 (82.253)	lr 0.01068
Train [66][1850/3239]	Time 0.270 (0.840)	Data Time 0.002 (0.335)	Loss 2.5546 (2.5943)	Entropy 0.62516 (0.62119)	Top-1 acc 59.375 (61.366)	Top-5 acc 84.766 (82.261)	lr 0.01068
Train [66][1860/3239]	Time 0.237 (0.842)	Data Time 0.002 (0.338)	Loss 2.4948 (2.5944)	Entropy 0.62511 (0.62121)	Top-1 acc 64.453 (61.368)	Top-5 acc 82.422 (82.259)	lr 0.01068
Train [66][1870/3239]	Time 0.234 (0.841)	Data Time 0.001 (0.337)	Loss 2.8429 (2.5948)	Entropy 0.62521 (0.62123)	Top-1 acc 51.953 (61.349)	Top-5 acc 79.688 (82.254)	lr 0.01068
Train [66][1880/3239]	Time 2.680 (0.847)	Data Time 2.425 (0.343)	Loss 2.5441 (2.5946)	Entropy 0.62561 (0.62125)	Top-1 acc 62.500 (61.356)	Top-5 acc 83.984 (82.259)	lr 0.01068
Train [66][1890/3239]	Time 0.247 (0.847)	Data Time 0.001 (0.344)	Loss 2.7004 (2.5944)	Entropy 0.62561 (0.62128)	Top-1 acc 56.641 (61.360)	Top-5 acc 79.688 (82.263)	lr 0.01068
Train [66][1900/3239]	Time 0.281 (0.846)	Data Time 0.001 (0.343)	Loss 2.5339 (2.5944)	Entropy 0.62552 (0.62130)	Top-1 acc 61.328 (61.358)	Top-5 acc 84.766 (82.260)	lr 0.01068
Train [66][1910/3239]	Time 14.609 (0.851)	Data Time 14.345 (0.349)	Loss 2.3930 (2.5944)	Entropy 0.62523 (0.62132)	Top-1 acc 66.797 (61.363)	Top-5 acc 86.328 (82.262)	lr 0.01068
Train [66][1920/3239]	Time 9.491 (0.854)	Data Time 9.222 (0.352)	Loss 2.6314 (2.5945)	Entropy 0.62532 (0.62134)	Top-1 acc 59.375 (61.362)	Top-5 acc 80.469 (82.258)	lr 0.01068
Train [66][1930/3239]	Time 0.249 (0.852)	Data Time 0.001 (0.350)	Loss 2.5263 (2.5945)	Entropy 0.62533 (0.62136)	Top-1 acc 62.500 (61.360)	Top-5 acc 82.812 (82.254)	lr 0.01068
Train [66][1940/3239]	Time 0.225 (0.849)	Data Time 0.001 (0.348)	Loss 2.6874 (2.5947)	Entropy 0.62561 (0.62138)	Top-1 acc 58.594 (61.355)	Top-5 acc 80.859 (82.248)	lr 0.01067
Train [66][1950/3239]	Time 0.253 (0.856)	Data Time 0.001 (0.355)	Loss 2.5582 (2.5950)	Entropy 0.62549 (0.62141)	Top-1 acc 60.938 (61.350)	Top-5 acc 81.641 (82.245)	lr 0.01067
Train [66][1960/3239]	Time 0.245 (0.860)	Data Time 0.001 (0.360)	Loss 2.7274 (2.5948)	Entropy 0.62561 (0.62143)	Top-1 acc 59.375 (61.356)	Top-5 acc 80.078 (82.250)	lr 0.01067
Train [66][1970/3239]	Time 0.346 (0.858)	Data Time 0.001 (0.358)	Loss 2.7293 (2.5948)	Entropy 0.62546 (0.62145)	Top-1 acc 60.938 (61.355)	Top-5 acc 78.906 (82.247)	lr 0.01067
Train [66][1980/3239]	Time 0.240 (0.862)	Data Time 0.001 (0.362)	Loss 2.5685 (2.5950)	Entropy 0.62525 (0.62147)	Top-1 acc 64.844 (61.353)	Top-5 acc 82.031 (82.248)	lr 0.01067
Train [66][1990/3239]	Time 0.268 (0.866)	Data Time 0.001 (0.366)	Loss 2.4905 (2.5949)	Entropy 0.62560 (0.62149)	Top-1 acc 64.844 (61.354)	Top-5 acc 82.812 (82.251)	lr 0.01067
Train [66][2000/3239]	Time 0.245 (0.864)	Data Time 0.001 (0.364)	Loss 2.5405 (2.5947)	Entropy 0.62532 (0.62151)	Top-1 acc 61.719 (61.359)	Top-5 acc 83.203 (82.254)	lr 0.01067
Train [66][2010/3239]	Time 0.240 (0.866)	Data Time 0.001 (0.367)	Loss 2.4773 (2.5947)	Entropy 0.62541 (0.62153)	Top-1 acc 62.500 (61.360)	Top-5 acc 83.984 (82.257)	lr 0.01067
Train [66][2020/3239]	Time 0.242 (0.868)	Data Time 0.001 (0.370)	Loss 2.7044 (2.5946)	Entropy 0.62534 (0.62154)	Top-1 acc 57.031 (61.363)	Top-5 acc 81.250 (82.257)	lr 0.01067
Train [66][2030/3239]	Time 0.241 (0.866)	Data Time 0.001 (0.368)	Loss 2.6649 (2.5948)	Entropy 0.62515 (0.62156)	Top-1 acc 60.156 (61.363)	Top-5 acc 79.297 (82.250)	lr 0.01067
Train [66][2040/3239]	Time 0.326 (0.871)	Data Time 0.001 (0.373)	Loss 2.7796 (2.5950)	Entropy 0.62516 (0.62158)	Top-1 acc 55.859 (61.356)	Top-5 acc 78.516 (82.247)	lr 0.01066
Train [66][2050/3239]	Time 0.246 (0.873)	Data Time 0.001 (0.375)	Loss 2.6584 (2.5951)	Entropy 0.62503 (0.62160)	Top-1 acc 60.156 (61.353)	Top-5 acc 82.031 (82.245)	lr 0.01066
Train [66][2060/3239]	Time 0.248 (0.870)	Data Time 0.001 (0.373)	Loss 2.5147 (2.5952)	Entropy 0.62498 (0.62161)	Top-1 acc 62.891 (61.348)	Top-5 acc 84.375 (82.244)	lr 0.01066
Train [66][2070/3239]	Time 14.094 (0.875)	Data Time 13.834 (0.378)	Loss 2.6620 (2.5953)	Entropy 0.62506 (0.62163)	Top-1 acc 56.641 (61.338)	Top-5 acc 83.594 (82.243)	lr 0.01066
Train [66][2080/3239]	Time 8.586 (0.877)	Data Time 8.329 (0.381)	Loss 2.7152 (2.5953)	Entropy 0.62515 (0.62165)	Top-1 acc 57.031 (61.340)	Top-5 acc 80.469 (82.244)	lr 0.01066
Train [66][2090/3239]	Time 1.671 (0.875)	Data Time 1.417 (0.379)	Loss 2.6423 (2.5955)	Entropy 0.62514 (0.62166)	Top-1 acc 57.422 (61.336)	Top-5 acc 82.031 (82.242)	lr 0.01066
Train [66][2100/3239]	Time 0.249 (0.873)	Data Time 0.001 (0.378)	Loss 2.5665 (2.5955)	Entropy 0.62507 (0.62168)	Top-1 acc 58.984 (61.333)	Top-5 acc 82.812 (82.246)	lr 0.01066
Train [66][2110/3239]	Time 0.245 (0.877)	Data Time 0.001 (0.382)	Loss 2.6713 (2.5957)	Entropy 0.62499 (0.62170)	Top-1 acc 60.547 (61.326)	Top-5 acc 81.641 (82.243)	lr 0.01066
Train [66][2120/3239]	Time 0.232 (0.879)	Data Time 0.001 (0.384)	Loss 2.6776 (2.5958)	Entropy 0.62499 (0.62171)	Top-1 acc 57.031 (61.322)	Top-5 acc 81.250 (82.242)	lr 0.01066
Train [66][2130/3239]	Time 0.348 (0.880)	Data Time 0.001 (0.386)	Loss 2.6189 (2.5959)	Entropy 0.62516 (0.62173)	Top-1 acc 58.203 (61.317)	Top-5 acc 80.859 (82.239)	lr 0.01066
Train [66][2140/3239]	Time 0.235 (0.882)	Data Time 0.001 (0.388)	Loss 2.5843 (2.5965)	Entropy 0.62475 (0.62174)	Top-1 acc 66.016 (61.309)	Top-5 acc 81.250 (82.228)	lr 0.01065
Train [66][2150/3239]	Time 0.256 (0.886)	Data Time 0.001 (0.392)	Loss 2.5589 (2.5964)	Entropy 0.62503 (0.62176)	Top-1 acc 63.281 (61.314)	Top-5 acc 80.469 (82.228)	lr 0.01065
Train [66][2160/3239]	Time 0.264 (0.886)	Data Time 0.002 (0.393)	Loss 2.4393 (2.5964)	Entropy 0.62553 (0.62177)	Top-1 acc 66.797 (61.314)	Top-5 acc 85.938 (82.231)	lr 0.01065
Train [66][2170/3239]	Time 0.237 (0.886)	Data Time 0.001 (0.393)	Loss 2.6570 (2.5963)	Entropy 0.62579 (0.62179)	Top-1 acc 58.984 (61.314)	Top-5 acc 81.641 (82.229)	lr 0.01065
Train [66][2180/3239]	Time 0.235 (0.890)	Data Time 0.001 (0.397)	Loss 2.3001 (2.5963)	Entropy 0.62541 (0.62181)	Top-1 acc 68.750 (61.321)	Top-5 acc 87.500 (82.228)	lr 0.01065
Train [66][2190/3239]	Time 0.226 (0.890)	Data Time 0.001 (0.397)	Loss 2.6880 (2.5964)	Entropy 0.62554 (0.62182)	Top-1 acc 58.594 (61.319)	Top-5 acc 78.516 (82.224)	lr 0.01065
Train [66][2200/3239]	Time 3.998 (0.891)	Data Time 3.645 (0.399)	Loss 2.5593 (2.5965)	Entropy 0.62543 (0.62184)	Top-1 acc 62.500 (61.317)	Top-5 acc 85.547 (82.226)	lr 0.01065
Train [66][2210/3239]	Time 0.240 (0.894)	Data Time 0.001 (0.403)	Loss 2.7450 (2.5966)	Entropy 0.62502 (0.62186)	Top-1 acc 58.203 (61.310)	Top-5 acc 80.859 (82.225)	lr 0.01065
Train [66][2220/3239]	Time 0.249 (0.895)	Data Time 0.001 (0.403)	Loss 2.6056 (2.5968)	Entropy 0.62490 (0.62187)	Top-1 acc 62.500 (61.306)	Top-5 acc 81.641 (82.220)	lr 0.01065
Train [66][2230/3239]	Time 0.234 (0.893)	Data Time 0.001 (0.401)	Loss 2.6487 (2.5967)	Entropy 0.62486 (0.62188)	Top-1 acc 54.688 (61.304)	Top-5 acc 82.812 (82.220)	lr 0.01065
Train [66][2240/3239]	Time 10.942 (0.899)	Data Time 10.684 (0.408)	Loss 2.4965 (2.5970)	Entropy 0.62528 (0.62190)	Top-1 acc 62.500 (61.299)	Top-5 acc 83.594 (82.212)	lr 0.01064
Train [66][2250/3239]	Time 0.331 (0.915)	Data Time 0.004 (0.406)	Loss 2.5990 (2.5968)	Entropy 0.62505 (0.62191)	Top-1 acc 61.328 (61.302)	Top-5 acc 81.250 (82.213)	lr 0.01064
Train [66][2260/3239]	Time 0.249 (0.913)	Data Time 0.002 (0.404)	Loss 2.5794 (2.5967)	Entropy 0.62498 (0.62193)	Top-1 acc 59.375 (61.298)	Top-5 acc 80.469 (82.212)	lr 0.01064
Train [66][2270/3239]	Time 0.237 (0.911)	Data Time 0.001 (0.402)	Loss 2.5385 (2.5966)	Entropy 0.62486 (0.62194)	Top-1 acc 61.719 (61.301)	Top-5 acc 84.766 (82.214)	lr 0.01064
Train [66][2280/3239]	Time 0.235 (0.909)	Data Time 0.001 (0.400)	Loss 2.6938 (2.5966)	Entropy 0.62471 (0.62195)	Top-1 acc 58.984 (61.299)	Top-5 acc 79.688 (82.215)	lr 0.01064
Train [66][2290/3239]	Time 0.353 (0.907)	Data Time 0.001 (0.399)	Loss 2.5364 (2.5966)	Entropy 0.62492 (0.62197)	Top-1 acc 62.500 (61.304)	Top-5 acc 82.031 (82.215)	lr 0.01064
Train [66][2300/3239]	Time 0.244 (0.905)	Data Time 0.001 (0.397)	Loss 2.5726 (2.5966)	Entropy 0.62493 (0.62198)	Top-1 acc 64.062 (61.304)	Top-5 acc 83.594 (82.216)	lr 0.01064
Train [66][2310/3239]	Time 0.277 (0.907)	Data Time 0.001 (0.400)	Loss 2.3408 (2.5964)	Entropy 0.62493 (0.62199)	Top-1 acc 66.016 (61.309)	Top-5 acc 87.891 (82.218)	lr 0.01064
Train [66][2320/3239]	Time 0.249 (0.906)	Data Time 0.001 (0.399)	Loss 2.6196 (2.5964)	Entropy 0.62460 (0.62200)	Top-1 acc 62.109 (61.307)	Top-5 acc 84.766 (82.219)	lr 0.01064
Train [66][2330/3239]	Time 0.245 (0.904)	Data Time 0.001 (0.397)	Loss 2.7608 (2.5963)	Entropy 0.62469 (0.62201)	Top-1 acc 57.422 (61.306)	Top-5 acc 79.297 (82.216)	lr 0.01064
Train [66][2340/3239]	Time 0.228 (0.908)	Data Time 0.001 (0.401)	Loss 2.8241 (2.5963)	Entropy 0.62490 (0.62203)	Top-1 acc 55.859 (61.308)	Top-5 acc 80.078 (82.218)	lr 0.01063
Train [66][2350/3239]	Time 0.245 (0.910)	Data Time 0.001 (0.404)	Loss 2.8561 (2.5965)	Entropy 0.62474 (0.62204)	Top-1 acc 53.516 (61.301)	Top-5 acc 77.344 (82.214)	lr 0.01063
Train [66][2360/3239]	Time 0.334 (0.909)	Data Time 0.001 (0.404)	Loss 2.5738 (2.5965)	Entropy 0.62459 (0.62205)	Top-1 acc 61.719 (61.300)	Top-5 acc 82.812 (82.217)	lr 0.01063
Train [66][2370/3239]	Time 0.220 (0.912)	Data Time 0.001 (0.407)	Loss 2.4373 (2.5963)	Entropy 0.62426 (0.62206)	Top-1 acc 67.969 (61.302)	Top-5 acc 85.547 (82.221)	lr 0.01063
Train [66][2380/3239]	Time 0.233 (0.916)	Data Time 0.001 (0.411)	Loss 2.4227 (2.5962)	Entropy 0.62434 (0.62207)	Top-1 acc 67.578 (61.301)	Top-5 acc 84.375 (82.222)	lr 0.01063
Train [66][2390/3239]	Time 0.241 (0.914)	Data Time 0.001 (0.409)	Loss 2.4499 (2.5961)	Entropy 0.62439 (0.62208)	Top-1 acc 68.359 (61.307)	Top-5 acc 85.547 (82.225)	lr 0.01063
Train [66][2400/3239]	Time 11.920 (0.917)	Data Time 11.640 (0.413)	Loss 2.6175 (2.5960)	Entropy 0.62434 (0.62209)	Top-1 acc 60.156 (61.305)	Top-5 acc 81.641 (82.231)	lr 0.01063
Train [66][2410/3239]	Time 4.314 (0.921)	Data Time 4.053 (0.416)	Loss 2.6928 (2.5962)	Entropy 0.62431 (0.62210)	Top-1 acc 56.641 (61.296)	Top-5 acc 78.125 (82.224)	lr 0.01063
Train [66][2420/3239]	Time 0.246 (0.919)	Data Time 0.001 (0.415)	Loss 2.6672 (2.5960)	Entropy 0.62447 (0.62211)	Top-1 acc 58.594 (61.303)	Top-5 acc 80.469 (82.228)	lr 0.01063
Train [66][2430/3239]	Time 0.234 (0.917)	Data Time 0.001 (0.413)	Loss 2.4957 (2.5962)	Entropy 0.62454 (0.62212)	Top-1 acc 63.281 (61.300)	Top-5 acc 83.594 (82.225)	lr 0.01063
Train [66][2440/3239]	Time 0.260 (0.924)	Data Time 0.002 (0.421)	Loss 2.6515 (2.5958)	Entropy 0.62412 (0.62213)	Top-1 acc 58.203 (61.304)	Top-5 acc 81.641 (82.229)	lr 0.01062
Train [66][2450/3239]	Time 0.357 (0.923)	Data Time 0.002 (0.419)	Loss 2.4420 (2.5958)	Entropy 0.62439 (0.62213)	Top-1 acc 64.844 (61.306)	Top-5 acc 85.156 (82.226)	lr 0.01062
Train [66][2460/3239]	Time 0.231 (0.921)	Data Time 0.001 (0.418)	Loss 2.6509 (2.5957)	Entropy 0.62459 (0.62214)	Top-1 acc 57.031 (61.306)	Top-5 acc 78.906 (82.228)	lr 0.01062
Train [66][2470/3239]	Time 0.284 (0.929)	Data Time 0.001 (0.427)	Loss 2.4313 (2.5956)	Entropy 0.62430 (0.62215)	Top-1 acc 65.234 (61.307)	Top-5 acc 85.938 (82.230)	lr 0.01062
Train [66][2480/3239]	Time 0.244 (0.928)	Data Time 0.001 (0.425)	Loss 2.6868 (2.5955)	Entropy 0.62447 (0.62216)	Top-1 acc 60.547 (61.314)	Top-5 acc 80.469 (82.234)	lr 0.01062
Train [66][2490/3239]	Time 0.250 (0.926)	Data Time 0.001 (0.424)	Loss 2.7323 (2.5956)	Entropy 0.62481 (0.62217)	Top-1 acc 62.109 (61.312)	Top-5 acc 78.516 (82.234)	lr 0.01062
Train [66][2500/3239]	Time 0.241 (0.928)	Data Time 0.001 (0.426)	Loss 2.6326 (2.5956)	Entropy 0.62493 (0.62218)	Top-1 acc 60.547 (61.309)	Top-5 acc 80.859 (82.235)	lr 0.01062
Train [66][2510/3239]	Time 0.247 (0.933)	Data Time 0.001 (0.432)	Loss 2.6224 (2.5954)	Entropy 0.62475 (0.62219)	Top-1 acc 62.109 (61.314)	Top-5 acc 84.375 (82.236)	lr 0.01062
Train [66][2520/3239]	Time 0.361 (0.931)	Data Time 0.001 (0.430)	Loss 2.9434 (2.5957)	Entropy 0.62457 (0.62220)	Top-1 acc 53.906 (61.306)	Top-5 acc 75.391 (82.233)	lr 0.01062
Train [66][2530/3239]	Time 0.230 (0.932)	Data Time 0.001 (0.431)	Loss 2.6704 (2.5959)	Entropy 0.62453 (0.62221)	Top-1 acc 61.328 (61.304)	Top-5 acc 79.688 (82.228)	lr 0.01062
Train [66][2540/3239]	Time 0.266 (0.935)	Data Time 0.002 (0.434)	Loss 2.5820 (2.5956)	Entropy 0.62457 (0.62222)	Top-1 acc 61.328 (61.308)	Top-5 acc 83.594 (82.234)	lr 0.01061
Train [66][2550/3239]	Time 0.243 (0.935)	Data Time 0.002 (0.435)	Loss 2.6202 (2.5958)	Entropy 0.62448 (0.62223)	Top-1 acc 63.281 (61.301)	Top-5 acc 81.250 (82.232)	lr 0.01061
Train [66][2560/3239]	Time 7.446 (0.936)	Data Time 7.192 (0.436)	Loss 2.6085 (2.5958)	Entropy 0.62449 (0.62224)	Top-1 acc 62.500 (61.300)	Top-5 acc 83.203 (82.233)	lr 0.01061
Train [66][2570/3239]	Time 0.234 (0.939)	Data Time 0.001 (0.439)	Loss 2.5643 (2.5958)	Entropy 0.62437 (0.62225)	Top-1 acc 62.109 (61.302)	Top-5 acc 81.641 (82.234)	lr 0.01061
Train [66][2580/3239]	Time 0.245 (0.938)	Data Time 0.001 (0.439)	Loss 2.6470 (2.5959)	Entropy 0.62423 (0.62226)	Top-1 acc 61.328 (61.302)	Top-5 acc 81.250 (82.235)	lr 0.01061
Train [66][2590/3239]	Time 0.242 (0.936)	Data Time 0.001 (0.437)	Loss 2.3752 (2.5959)	Entropy 0.62448 (0.62226)	Top-1 acc 67.969 (61.301)	Top-5 acc 87.109 (82.233)	lr 0.01061
Train [66][2600/3239]	Time 0.320 (0.944)	Data Time 0.031 (0.445)	Loss 2.7344 (2.5957)	Entropy 0.62499 (0.62227)	Top-1 acc 63.281 (61.310)	Top-5 acc 78.906 (82.236)	lr 0.01061
Train [66][2610/3239]	Time 0.271 (0.943)	Data Time 0.001 (0.444)	Loss 2.4713 (2.5955)	Entropy 0.62501 (0.62228)	Top-1 acc 66.016 (61.312)	Top-5 acc 82.031 (82.239)	lr 0.01061
Train [66][2620/3239]	Time 0.243 (0.941)	Data Time 0.001 (0.442)	Loss 2.6304 (2.5956)	Entropy 0.62478 (0.62229)	Top-1 acc 59.375 (61.307)	Top-5 acc 80.469 (82.237)	lr 0.01061
Train [66][2630/3239]	Time 0.791 (0.948)	Data Time 0.543 (0.450)	Loss 2.6577 (2.5957)	Entropy 0.62468 (0.62230)	Top-1 acc 61.328 (61.308)	Top-5 acc 80.078 (82.233)	lr 0.01061
Train [66][2640/3239]	Time 0.265 (0.948)	Data Time 0.001 (0.450)	Loss 2.6743 (2.5960)	Entropy 0.62425 (0.62231)	Top-1 acc 61.719 (61.302)	Top-5 acc 78.516 (82.228)	lr 0.01060
Train [66][2650/3239]	Time 0.244 (0.946)	Data Time 0.001 (0.448)	Loss 2.5901 (2.5958)	Entropy 0.62397 (0.62232)	Top-1 acc 58.203 (61.304)	Top-5 acc 83.984 (82.234)	lr 0.01060
Train [66][2660/3239]	Time 0.245 (0.950)	Data Time 0.001 (0.452)	Loss 2.5711 (2.5958)	Entropy 0.62403 (0.62232)	Top-1 acc 62.109 (61.306)	Top-5 acc 83.203 (82.233)	lr 0.01060
Train [66][2670/3239]	Time 0.246 (0.954)	Data Time 0.001 (0.456)	Loss 2.6266 (2.5957)	Entropy 0.62423 (0.62233)	Top-1 acc 61.719 (61.309)	Top-5 acc 80.859 (82.237)	lr 0.01060
Train [66][2680/3239]	Time 0.317 (0.952)	Data Time 0.001 (0.455)	Loss 2.6051 (2.5956)	Entropy 0.62414 (0.62234)	Top-1 acc 61.328 (61.307)	Top-5 acc 82.812 (82.240)	lr 0.01060
Train [66][2690/3239]	Time 0.248 (0.954)	Data Time 0.001 (0.457)	Loss 2.3729 (2.5955)	Entropy 0.62393 (0.62235)	Top-1 acc 69.531 (61.307)	Top-5 acc 86.719 (82.242)	lr 0.01060
Train [66][2700/3239]	Time 0.224 (0.957)	Data Time 0.001 (0.461)	Loss 2.7906 (2.5957)	Entropy 0.62406 (0.62235)	Top-1 acc 56.250 (61.303)	Top-5 acc 76.953 (82.239)	lr 0.01060
Train [66][2710/3239]	Time 0.231 (0.956)	Data Time 0.001 (0.460)	Loss 2.4497 (2.5958)	Entropy 0.62375 (0.62236)	Top-1 acc 68.750 (61.300)	Top-5 acc 85.156 (82.236)	lr 0.01060
Train [66][2720/3239]	Time 15.632 (0.959)	Data Time 15.373 (0.464)	Loss 2.3854 (2.5957)	Entropy 0.62375 (0.62236)	Top-1 acc 62.109 (61.309)	Top-5 acc 86.328 (82.239)	lr 0.01060
Train [66][2730/3239]	Time 0.234 (0.961)	Data Time 0.001 (0.466)	Loss 2.4442 (2.5958)	Entropy 0.62308 (0.62237)	Top-1 acc 62.500 (61.304)	Top-5 acc 87.109 (82.239)	lr 0.01060
Train [66][2740/3239]	Time 0.222 (0.961)	Data Time 0.001 (0.466)	Loss 2.6999 (2.5960)	Entropy 0.62296 (0.62237)	Top-1 acc 62.891 (61.299)	Top-5 acc 82.031 (82.235)	lr 0.01059
Train [66][2750/3239]	Time 0.332 (0.959)	Data Time 0.001 (0.464)	Loss 2.5490 (2.5960)	Entropy 0.62284 (0.62237)	Top-1 acc 59.766 (61.300)	Top-5 acc 83.203 (82.234)	lr 0.01059
Train [66][2760/3239]	Time 0.305 (0.968)	Data Time 0.001 (0.473)	Loss 2.5631 (2.5960)	Entropy 0.62284 (0.62237)	Top-1 acc 60.938 (61.304)	Top-5 acc 80.469 (82.234)	lr 0.01059
Train [66][2770/3239]	Time 0.244 (0.966)	Data Time 0.001 (0.472)	Loss 2.7000 (2.5959)	Entropy 0.62279 (0.62238)	Top-1 acc 56.641 (61.306)	Top-5 acc 79.297 (82.234)	lr 0.01059
Train [66][2780/3239]	Time 0.237 (0.964)	Data Time 0.001 (0.470)	Loss 2.4544 (2.5961)	Entropy 0.62305 (0.62238)	Top-1 acc 65.234 (61.301)	Top-5 acc 85.938 (82.232)	lr 0.01059
Train [66][2790/3239]	Time 9.881 (0.972)	Data Time 9.605 (0.478)	Loss 2.5843 (2.5960)	Entropy 0.62298 (0.62238)	Top-1 acc 60.938 (61.304)	Top-5 acc 80.078 (82.233)	lr 0.01059
Train [66][2800/3239]	Time 0.270 (0.970)	Data Time 0.001 (0.477)	Loss 2.4580 (2.5961)	Entropy 0.62318 (0.62238)	Top-1 acc 65.625 (61.304)	Top-5 acc 86.719 (82.230)	lr 0.01059
Train [66][2810/3239]	Time 0.239 (0.968)	Data Time 0.001 (0.475)	Loss 2.6040 (2.5961)	Entropy 0.62344 (0.62238)	Top-1 acc 59.766 (61.302)	Top-5 acc 84.375 (82.231)	lr 0.01059
Train [66][2820/3239]	Time 0.241 (0.971)	Data Time 0.001 (0.478)	Loss 2.6170 (2.5962)	Entropy 0.62346 (0.62239)	Top-1 acc 62.500 (61.301)	Top-5 acc 82.031 (82.230)	lr 0.01059
Train [66][2830/3239]	Time 0.245 (0.975)	Data Time 0.001 (0.482)	Loss 2.7090 (2.5963)	Entropy 0.62361 (0.62239)	Top-1 acc 60.938 (61.298)	Top-5 acc 79.297 (82.226)	lr 0.01059
Train [66][2840/3239]	Time 0.311 (0.973)	Data Time 0.001 (0.481)	Loss 2.6293 (2.5962)	Entropy 0.62344 (0.62240)	Top-1 acc 60.547 (61.302)	Top-5 acc 80.859 (82.227)	lr 0.01058
Train [66][2850/3239]	Time 0.239 (0.974)	Data Time 0.001 (0.482)	Loss 2.8747 (2.5965)	Entropy 0.62332 (0.62240)	Top-1 acc 53.516 (61.297)	Top-5 acc 77.344 (82.223)	lr 0.01058
Train [66][2860/3239]	Time 0.244 (0.979)	Data Time 0.001 (0.487)	Loss 2.5676 (2.5964)	Entropy 0.62330 (0.62240)	Top-1 acc 65.625 (61.300)	Top-5 acc 81.641 (82.227)	lr 0.01058
Train [66][2870/3239]	Time 0.233 (0.977)	Data Time 0.001 (0.485)	Loss 2.5818 (2.5963)	Entropy 0.62341 (0.62241)	Top-1 acc 64.062 (61.304)	Top-5 acc 84.375 (82.229)	lr 0.01058
Train [66][2880/3239]	Time 7.562 (0.977)	Data Time 7.305 (0.486)	Loss 2.5864 (2.5963)	Entropy 0.62343 (0.62241)	Top-1 acc 59.375 (61.304)	Top-5 acc 83.984 (82.227)	lr 0.01058
Train [66][2890/3239]	Time 0.255 (0.982)	Data Time 0.001 (0.491)	Loss 2.6943 (2.5964)	Entropy 0.62342 (0.62241)	Top-1 acc 63.281 (61.299)	Top-5 acc 82.422 (82.226)	lr 0.01058
Train [66][2900/3239]	Time 0.376 (0.994)	Data Time 0.006 (0.489)	Loss 3.1379 (2.5967)	Entropy 0.62359 (0.62242)	Top-1 acc 44.141 (61.290)	Top-5 acc 72.266 (82.220)	lr 0.01058
Train [66][2910/3239]	Time 0.353 (0.992)	Data Time 0.002 (0.488)	Loss 2.7238 (2.5968)	Entropy 0.62356 (0.62242)	Top-1 acc 58.984 (61.289)	Top-5 acc 79.297 (82.219)	lr 0.01058
Train [66][2920/3239]	Time 0.299 (0.990)	Data Time 0.004 (0.486)	Loss 2.6561 (2.5969)	Entropy 0.62324 (0.62243)	Top-1 acc 58.203 (61.285)	Top-5 acc 80.078 (82.215)	lr 0.01058
Train [66][2930/3239]	Time 0.253 (0.988)	Data Time 0.002 (0.484)	Loss 2.6867 (2.5970)	Entropy 0.62304 (0.62243)	Top-1 acc 63.281 (61.284)	Top-5 acc 81.250 (82.215)	lr 0.01058
Train [66][2940/3239]	Time 0.260 (0.987)	Data Time 0.001 (0.483)	Loss 2.6441 (2.5972)	Entropy 0.62338 (0.62243)	Top-1 acc 57.422 (61.277)	Top-5 acc 81.250 (82.211)	lr 0.01057
Train [66][2950/3239]	Time 0.238 (0.985)	Data Time 0.001 (0.481)	Loss 2.7644 (2.5972)	Entropy 0.62357 (0.62243)	Top-1 acc 55.859 (61.276)	Top-5 acc 80.859 (82.209)	lr 0.01057
Train [66][2960/3239]	Time 0.256 (0.983)	Data Time 0.002 (0.479)	Loss 2.5974 (2.5971)	Entropy 0.62343 (0.62244)	Top-1 acc 62.500 (61.279)	Top-5 acc 83.203 (82.212)	lr 0.01057
Train [66][2970/3239]	Time 0.230 (0.982)	Data Time 0.001 (0.479)	Loss 2.6917 (2.5968)	Entropy 0.62351 (0.62244)	Top-1 acc 55.859 (61.286)	Top-5 acc 80.859 (82.217)	lr 0.01057
Train [66][2980/3239]	Time 0.268 (0.981)	Data Time 0.002 (0.477)	Loss 2.6607 (2.5968)	Entropy 0.62333 (0.62244)	Top-1 acc 57.812 (61.288)	Top-5 acc 80.078 (82.217)	lr 0.01057
Train [66][2990/3239]	Time 0.263 (0.981)	Data Time 0.001 (0.478)	Loss 2.8724 (2.5968)	Entropy 0.62317 (0.62245)	Top-1 acc 52.344 (61.286)	Top-5 acc 79.688 (82.218)	lr 0.01057
Train [66][3000/3239]	Time 1.674 (0.980)	Data Time 1.259 (0.478)	Loss 2.6249 (2.5967)	Entropy 0.62310 (0.62245)	Top-1 acc 62.500 (61.287)	Top-5 acc 80.078 (82.218)	lr 0.01057
Train [66][3010/3239]	Time 0.282 (0.979)	Data Time 0.002 (0.476)	Loss 2.6680 (2.5968)	Entropy 0.62305 (0.62245)	Top-1 acc 58.594 (61.283)	Top-5 acc 82.812 (82.218)	lr 0.01057
Train [66][3020/3239]	Time 0.239 (0.979)	Data Time 0.001 (0.477)	Loss 2.7194 (2.5968)	Entropy 0.62272 (0.62245)	Top-1 acc 59.766 (61.282)	Top-5 acc 81.250 (82.218)	lr 0.01057
Train [66][3030/3239]	Time 0.246 (0.980)	Data Time 0.001 (0.478)	Loss 2.7507 (2.5969)	Entropy 0.62263 (0.62245)	Top-1 acc 55.859 (61.279)	Top-5 acc 78.516 (82.216)	lr 0.01057
Train [66][3040/3239]	Time 3.781 (0.981)	Data Time 3.525 (0.479)	Loss 2.6668 (2.5968)	Entropy 0.62249 (0.62245)	Top-1 acc 60.547 (61.279)	Top-5 acc 81.250 (82.217)	lr 0.01056
Train [66][3050/3239]	Time 0.239 (0.982)	Data Time 0.001 (0.480)	Loss 2.4668 (2.5967)	Entropy 0.62240 (0.62245)	Top-1 acc 65.625 (61.286)	Top-5 acc 83.984 (82.220)	lr 0.01056
Train [66][3060/3239]	Time 1.784 (0.980)	Data Time 1.539 (0.479)	Loss 2.7399 (2.5969)	Entropy 0.62261 (0.62245)	Top-1 acc 54.297 (61.280)	Top-5 acc 79.688 (82.215)	lr 0.01056
Train [66][3070/3239]	Time 0.387 (0.983)	Data Time 0.002 (0.482)	Loss 2.6239 (2.5968)	Entropy 0.62279 (0.62245)	Top-1 acc 59.766 (61.285)	Top-5 acc 80.078 (82.217)	lr 0.01056
Train [66][3080/3239]	Time 0.240 (0.985)	Data Time 0.001 (0.484)	Loss 2.5256 (2.5965)	Entropy 0.62302 (0.62246)	Top-1 acc 64.453 (61.291)	Top-5 acc 82.812 (82.220)	lr 0.01056
Train [66][3090/3239]	Time 0.232 (0.983)	Data Time 0.001 (0.483)	Loss 2.7006 (2.5967)	Entropy 0.62317 (0.62246)	Top-1 acc 60.547 (61.285)	Top-5 acc 82.031 (82.218)	lr 0.01056
Train [66][3100/3239]	Time 2.911 (0.986)	Data Time 2.632 (0.486)	Loss 2.7016 (2.5966)	Entropy 0.62343 (0.62246)	Top-1 acc 60.156 (61.287)	Top-5 acc 77.734 (82.219)	lr 0.01056
Train [66][3110/3239]	Time 8.779 (0.987)	Data Time 8.527 (0.487)	Loss 2.5195 (2.5967)	Entropy 0.62334 (0.62246)	Top-1 acc 59.766 (61.284)	Top-5 acc 82.031 (82.217)	lr 0.01056
Train [66][3120/3239]	Time 0.232 (0.987)	Data Time 0.001 (0.487)	Loss 2.6361 (2.5967)	Entropy 0.62332 (0.62247)	Top-1 acc 62.891 (61.283)	Top-5 acc 79.688 (82.216)	lr 0.01056
Train [66][3130/3239]	Time 1.068 (0.989)	Data Time 0.801 (0.489)	Loss 2.6944 (2.5968)	Entropy 0.62331 (0.62247)	Top-1 acc 58.594 (61.279)	Top-5 acc 80.469 (82.215)	lr 0.01056
Train [66][3140/3239]	Time 0.249 (0.987)	Data Time 0.001 (0.488)	Loss 2.6227 (2.5968)	Entropy 0.62324 (0.62247)	Top-1 acc 59.375 (61.279)	Top-5 acc 82.031 (82.217)	lr 0.01055
Train [66][3150/3239]	Time 0.257 (0.987)	Data Time 0.001 (0.488)	Loss 2.3901 (2.5968)	Entropy 0.62339 (0.62247)	Top-1 acc 64.062 (61.280)	Top-5 acc 85.547 (82.215)	lr 0.01055
Train [66][3160/3239]	Time 0.343 (0.988)	Data Time 0.001 (0.489)	Loss 2.5318 (2.5967)	Entropy 0.62327 (0.62248)	Top-1 acc 62.500 (61.285)	Top-5 acc 84.375 (82.217)	lr 0.01055
Train [66][3170/3239]	Time 0.292 (0.987)	Data Time 0.001 (0.488)	Loss 2.8257 (2.5968)	Entropy 0.62298 (0.62248)	Top-1 acc 58.203 (61.282)	Top-5 acc 78.906 (82.215)	lr 0.01055
Train [66][3180/3239]	Time 0.237 (0.985)	Data Time 0.000 (0.487)	Loss 2.5397 (2.5968)	Entropy 0.62306 (0.62248)	Top-1 acc 59.375 (61.276)	Top-5 acc 84.375 (82.216)	lr 0.01055
Train [66][3190/3239]	Time 0.257 (0.986)	Data Time 0.000 (0.488)	Loss 2.6469 (2.5968)	Entropy 0.62316 (0.62248)	Top-1 acc 58.594 (61.278)	Top-5 acc 80.469 (82.214)	lr 0.01055
Train [66][3200/3239]	Time 0.261 (0.985)	Data Time 0.000 (0.487)	Loss 2.7075 (2.5967)	Entropy 0.62311 (0.62248)	Top-1 acc 58.984 (61.279)	Top-5 acc 79.297 (82.216)	lr 0.01055
Train [66][3210/3239]	Time 0.430 (0.983)	Data Time 0.200 (0.485)	Loss 2.6340 (2.5969)	Entropy 0.62294 (0.62249)	Top-1 acc 58.203 (61.273)	Top-5 acc 82.031 (82.214)	lr 0.01055
Train [66][3220/3239]	Time 0.231 (0.981)	Data Time 0.000 (0.484)	Loss 2.5673 (2.5967)	Entropy 0.62324 (0.62249)	Top-1 acc 64.062 (61.274)	Top-5 acc 80.859 (82.216)	lr 0.01055
Train [66][3230/3239]	Time 0.323 (0.981)	Data Time 0.000 (0.483)	Loss 2.5739 (2.5968)	Entropy 0.62306 (0.62249)	Top-1 acc 58.984 (61.273)	Top-5 acc 81.641 (82.212)	lr 0.01055
Train [66][3239/3239]	Time 0.888 (0.979)	Data Time 0.000 (0.482)	Loss 2.3343 (2.5968)	Entropy 0.62315 (0.62249)	Top-1 acc 66.667 (61.270)	Top-5 acc 88.889 (82.211)	lr 0.01054
==========Valid [66/120]	loss 1.399	top-1 acc 68.113 (68.549)	top-5 acc 87.682	Train top-1 61.270	top-5 82.211	Entropy 0.62315	Latency-None: 0.000ms	Flops: 537.50M
Train [67][0/3239]	Time 40.219 (40.219)	Data Time 38.158 (38.158)	Loss 2.6812 (2.6812)	Entropy 0.62322 (0.62322)	Top-1 acc 58.984 (58.984)	Top-5 acc 80.859 (80.859)	lr 0.01054
Train [67][10/3239]	Time 0.241 (4.121)	Data Time 0.001 (3.538)	Loss 2.4551 (2.6032)	Entropy 0.62269 (0.62306)	Top-1 acc 64.062 (61.825)	Top-5 acc 86.328 (81.854)	lr 0.01054
Train [67][20/3239]	Time 0.243 (2.353)	Data Time 0.001 (1.854)	Loss 2.6776 (2.5881)	Entropy 0.62292 (0.62292)	Top-1 acc 59.766 (61.682)	Top-5 acc 78.516 (82.775)	lr 0.01054
Train [67][30/3239]	Time 0.262 (1.742)	Data Time 0.001 (1.256)	Loss 2.4973 (2.5947)	Entropy 0.62291 (0.62294)	Top-1 acc 63.672 (61.253)	Top-5 acc 82.812 (82.359)	lr 0.01054
Train [67][40/3239]	Time 0.248 (1.427)	Data Time 0.002 (0.953)	Loss 2.8143 (2.5948)	Entropy 0.62298 (0.62295)	Top-1 acc 57.422 (61.042)	Top-5 acc 77.344 (82.403)	lr 0.01054
Train [67][50/3239]	Time 0.236 (1.226)	Data Time 0.001 (0.766)	Loss 2.5889 (2.5916)	Entropy 0.62259 (0.62292)	Top-1 acc 59.766 (61.152)	Top-5 acc 81.641 (82.460)	lr 0.01054
Train [67][60/3239]	Time 0.361 (1.095)	Data Time 0.001 (0.641)	Loss 2.6339 (2.5871)	Entropy 0.62258 (0.62288)	Top-1 acc 60.938 (61.347)	Top-5 acc 79.688 (82.441)	lr 0.01054
Train [67][70/3239]	Time 0.240 (1.030)	Data Time 0.001 (0.576)	Loss 2.4937 (2.5785)	Entropy 0.62247 (0.62282)	Top-1 acc 62.891 (61.620)	Top-5 acc 82.812 (82.548)	lr 0.01054
Train [67][80/3239]	Time 0.237 (0.953)	Data Time 0.001 (0.505)	Loss 2.8007 (2.5804)	Entropy 0.62221 (0.62275)	Top-1 acc 57.031 (61.574)	Top-5 acc 82.812 (82.523)	lr 0.01054
Train [67][90/3239]	Time 0.231 (0.894)	Data Time 0.002 (0.450)	Loss 2.4006 (2.5832)	Entropy 0.62252 (0.62270)	Top-1 acc 65.234 (61.453)	Top-5 acc 84.766 (82.512)	lr 0.01054
Train [67][100/3239]	Time 0.246 (0.876)	Data Time 0.001 (0.432)	Loss 2.7223 (2.5900)	Entropy 0.62243 (0.62268)	Top-1 acc 57.031 (61.262)	Top-5 acc 80.078 (82.387)	lr 0.01053
Train [67][110/3239]	Time 0.234 (0.835)	Data Time 0.001 (0.393)	Loss 2.4607 (2.5924)	Entropy 0.62251 (0.62266)	Top-1 acc 64.453 (61.166)	Top-5 acc 82.422 (82.295)	lr 0.01053
Train [67][120/3239]	Time 0.294 (0.802)	Data Time 0.001 (0.361)	Loss 2.6690 (2.5913)	Entropy 0.62260 (0.62266)	Top-1 acc 62.109 (61.283)	Top-5 acc 82.031 (82.280)	lr 0.01053
Train [67][130/3239]	Time 0.373 (0.794)	Data Time 0.001 (0.348)	Loss 2.5879 (2.5882)	Entropy 0.62293 (0.62266)	Top-1 acc 61.719 (61.328)	Top-5 acc 81.641 (82.326)	lr 0.01053
Train [67][140/3239]	Time 0.226 (0.767)	Data Time 0.001 (0.323)	Loss 2.5975 (2.5884)	Entropy 0.62279 (0.62266)	Top-1 acc 64.062 (61.433)	Top-5 acc 80.469 (82.289)	lr 0.01053
Train [67][150/3239]	Time 0.235 (0.744)	Data Time 0.001 (0.302)	Loss 2.7730 (2.5912)	Entropy 0.62266 (0.62267)	Top-1 acc 58.984 (61.336)	Top-5 acc 80.078 (82.192)	lr 0.01053
Train [67][160/3239]	Time 0.237 (0.729)	Data Time 0.001 (0.283)	Loss 2.7274 (2.5932)	Entropy 0.62261 (0.62267)	Top-1 acc 60.156 (61.316)	Top-5 acc 75.781 (82.092)	lr 0.01053
Train [67][170/3239]	Time 0.236 (0.709)	Data Time 0.001 (0.267)	Loss 2.7694 (2.5924)	Entropy 0.62262 (0.62266)	Top-1 acc 60.938 (61.362)	Top-5 acc 76.953 (82.148)	lr 0.01053
Train [67][180/3239]	Time 0.236 (0.693)	Data Time 0.001 (0.252)	Loss 2.5350 (2.5932)	Entropy 0.62288 (0.62266)	Top-1 acc 61.328 (61.343)	Top-5 acc 83.203 (82.169)	lr 0.01053
Train [67][190/3239]	Time 0.272 (0.682)	Data Time 0.001 (0.239)	Loss 2.5985 (2.5941)	Entropy 0.62296 (0.62268)	Top-1 acc 64.062 (61.334)	Top-5 acc 83.594 (82.140)	lr 0.01053
Train [67][200/3239]	Time 0.221 (0.677)	Data Time 0.001 (0.236)	Loss 2.6481 (2.5947)	Entropy 0.62274 (0.62268)	Top-1 acc 61.328 (61.332)	Top-5 acc 81.250 (82.138)	lr 0.01052
Train [67][210/3239]	Time 0.254 (0.664)	Data Time 0.001 (0.225)	Loss 2.6330 (2.5964)	Entropy 0.62286 (0.62269)	Top-1 acc 58.203 (61.324)	Top-5 acc 81.250 (82.100)	lr 0.01052
Train [67][220/3239]	Time 0.390 (0.656)	Data Time 0.001 (0.214)	Loss 2.5675 (2.5949)	Entropy 0.62335 (0.62270)	Top-1 acc 66.406 (61.340)	Top-5 acc 82.812 (82.143)	lr 0.01052
Train [67][230/3239]	Time 0.251 (0.656)	Data Time 0.002 (0.215)	Loss 2.6066 (2.5923)	Entropy 0.62311 (0.62273)	Top-1 acc 65.234 (61.425)	Top-5 acc 83.203 (82.167)	lr 0.01052
Train [67][240/3239]	Time 0.241 (0.647)	Data Time 0.001 (0.207)	Loss 2.5358 (2.5899)	Entropy 0.62320 (0.62274)	Top-1 acc 63.281 (61.472)	Top-5 acc 83.984 (82.219)	lr 0.01052
Train [67][250/3239]	Time 0.269 (0.640)	Data Time 0.001 (0.198)	Loss 2.8303 (2.5903)	Entropy 0.62326 (0.62276)	Top-1 acc 57.422 (61.482)	Top-5 acc 78.906 (82.238)	lr 0.01052
Train [67][260/3239]	Time 0.274 (0.633)	Data Time 0.001 (0.191)	Loss 2.4429 (2.5903)	Entropy 0.62332 (0.62278)	Top-1 acc 66.016 (61.511)	Top-5 acc 84.375 (82.236)	lr 0.01052
Train [67][270/3239]	Time 0.251 (0.625)	Data Time 0.002 (0.184)	Loss 2.5446 (2.5916)	Entropy 0.62348 (0.62280)	Top-1 acc 61.719 (61.488)	Top-5 acc 82.812 (82.194)	lr 0.01052
Train [67][280/3239]	Time 0.225 (0.620)	Data Time 0.001 (0.177)	Loss 2.4361 (2.5896)	Entropy 0.62363 (0.62283)	Top-1 acc 65.234 (61.528)	Top-5 acc 85.938 (82.223)	lr 0.01052
Train [67][290/3239]	Time 0.352 (0.617)	Data Time 0.002 (0.175)	Loss 2.7463 (2.5883)	Entropy 0.62380 (0.62286)	Top-1 acc 57.422 (61.542)	Top-5 acc 77.344 (82.234)	lr 0.01052
Train [67][300/3239]	Time 0.248 (0.610)	Data Time 0.001 (0.169)	Loss 2.7406 (2.5873)	Entropy 0.62404 (0.62289)	Top-1 acc 59.375 (61.572)	Top-5 acc 79.688 (82.257)	lr 0.01051
Train [67][310/3239]	Time 0.307 (0.604)	Data Time 0.003 (0.163)	Loss 2.8963 (2.5889)	Entropy 0.62427 (0.62293)	Top-1 acc 54.297 (61.490)	Top-5 acc 74.219 (82.237)	lr 0.01051
Train [67][320/3239]	Time 0.302 (0.730)	Data Time 0.004 (0.158)	Loss 2.4416 (2.5890)	Entropy 0.62408 (0.62297)	Top-1 acc 67.188 (61.517)	Top-5 acc 82.812 (82.221)	lr 0.01051
Train [67][330/3239]	Time 0.245 (0.721)	Data Time 0.002 (0.154)	Loss 2.5248 (2.5885)	Entropy 0.62393 (0.62300)	Top-1 acc 63.281 (61.513)	Top-5 acc 83.984 (82.253)	lr 0.01051
Train [67][340/3239]	Time 0.243 (0.712)	Data Time 0.002 (0.149)	Loss 2.6956 (2.5898)	Entropy 0.62400 (0.62303)	Top-1 acc 60.156 (61.506)	Top-5 acc 81.641 (82.224)	lr 0.01051
Train [67][350/3239]	Time 0.241 (0.704)	Data Time 0.001 (0.145)	Loss 2.6256 (2.5909)	Entropy 0.62398 (0.62306)	Top-1 acc 61.328 (61.505)	Top-5 acc 82.812 (82.217)	lr 0.01051
Train [67][360/3239]	Time 0.250 (0.697)	Data Time 0.001 (0.141)	Loss 2.7631 (2.5915)	Entropy 0.62409 (0.62308)	Top-1 acc 55.469 (61.490)	Top-5 acc 78.516 (82.205)	lr 0.01051
Train [67][370/3239]	Time 0.253 (0.690)	Data Time 0.001 (0.137)	Loss 2.4661 (2.5909)	Entropy 0.62387 (0.62311)	Top-1 acc 64.453 (61.534)	Top-5 acc 85.547 (82.217)	lr 0.01051
Train [67][380/3239]	Time 0.373 (0.684)	Data Time 0.002 (0.134)	Loss 2.6761 (2.5904)	Entropy 0.62383 (0.62312)	Top-1 acc 58.594 (61.534)	Top-5 acc 83.203 (82.233)	lr 0.01051
Train [67][390/3239]	Time 0.242 (0.678)	Data Time 0.001 (0.130)	Loss 2.5624 (2.5902)	Entropy 0.62364 (0.62314)	Top-1 acc 59.375 (61.517)	Top-5 acc 83.594 (82.237)	lr 0.01051
Train [67][400/3239]	Time 0.293 (0.673)	Data Time 0.002 (0.127)	Loss 2.7029 (2.5895)	Entropy 0.62311 (0.62314)	Top-1 acc 58.594 (61.557)	Top-5 acc 78.906 (82.250)	lr 0.01050
Train [67][410/3239]	Time 0.228 (0.668)	Data Time 0.001 (0.124)	Loss 2.5500 (2.5902)	Entropy 0.62320 (0.62314)	Top-1 acc 61.328 (61.513)	Top-5 acc 83.984 (82.239)	lr 0.01050
Train [67][420/3239]	Time 0.228 (0.662)	Data Time 0.001 (0.121)	Loss 2.6286 (2.5888)	Entropy 0.62348 (0.62314)	Top-1 acc 56.250 (61.521)	Top-5 acc 82.422 (82.264)	lr 0.01050
Train [67][430/3239]	Time 0.262 (0.657)	Data Time 0.001 (0.119)	Loss 2.3799 (2.5875)	Entropy 0.62359 (0.62315)	Top-1 acc 67.969 (61.578)	Top-5 acc 87.500 (82.301)	lr 0.01050
Train [67][440/3239]	Time 0.241 (0.653)	Data Time 0.001 (0.116)	Loss 2.3679 (2.5858)	Entropy 0.62375 (0.62316)	Top-1 acc 66.797 (61.609)	Top-5 acc 83.594 (82.335)	lr 0.01050
Train [67][450/3239]	Time 0.324 (0.649)	Data Time 0.001 (0.113)	Loss 2.5930 (2.5846)	Entropy 0.62382 (0.62318)	Top-1 acc 65.625 (61.645)	Top-5 acc 81.641 (82.379)	lr 0.01050
Train [67][460/3239]	Time 0.238 (0.645)	Data Time 0.001 (0.111)	Loss 2.4864 (2.5836)	Entropy 0.62356 (0.62319)	Top-1 acc 64.062 (61.680)	Top-5 acc 84.375 (82.408)	lr 0.01050
Train [67][470/3239]	Time 0.322 (0.641)	Data Time 0.001 (0.109)	Loss 2.7238 (2.5843)	Entropy 0.62349 (0.62320)	Top-1 acc 59.375 (61.667)	Top-5 acc 80.078 (82.397)	lr 0.01050
Train [67][480/3239]	Time 0.260 (0.637)	Data Time 0.001 (0.106)	Loss 2.8393 (2.5845)	Entropy 0.62379 (0.62320)	Top-1 acc 53.516 (61.655)	Top-5 acc 78.516 (82.404)	lr 0.01050
Train [67][490/3239]	Time 0.257 (0.633)	Data Time 0.002 (0.104)	Loss 2.7778 (2.5844)	Entropy 0.62386 (0.62322)	Top-1 acc 58.594 (61.669)	Top-5 acc 79.688 (82.417)	lr 0.01050
Train [67][500/3239]	Time 0.231 (0.629)	Data Time 0.001 (0.102)	Loss 2.9662 (2.5874)	Entropy 0.62409 (0.62323)	Top-1 acc 54.297 (61.592)	Top-5 acc 74.219 (82.367)	lr 0.01049
Train [67][510/3239]	Time 0.263 (0.626)	Data Time 0.001 (0.100)	Loss 2.8271 (2.5871)	Entropy 0.62382 (0.62325)	Top-1 acc 52.734 (61.603)	Top-5 acc 77.344 (82.377)	lr 0.01049
Train [67][520/3239]	Time 0.258 (0.623)	Data Time 0.001 (0.098)	Loss 2.6258 (2.5879)	Entropy 0.62388 (0.62326)	Top-1 acc 55.859 (61.561)	Top-5 acc 82.812 (82.363)	lr 0.01049
Train [67][530/3239]	Time 0.249 (0.620)	Data Time 0.002 (0.097)	Loss 2.6247 (2.5877)	Entropy 0.62410 (0.62328)	Top-1 acc 59.766 (61.560)	Top-5 acc 80.078 (82.371)	lr 0.01049
Train [67][540/3239]	Time 0.396 (0.617)	Data Time 0.001 (0.095)	Loss 2.5379 (2.5873)	Entropy 0.62393 (0.62329)	Top-1 acc 62.891 (61.581)	Top-5 acc 81.641 (82.366)	lr 0.01049
Train [67][550/3239]	Time 0.239 (0.614)	Data Time 0.001 (0.093)	Loss 2.5079 (2.5870)	Entropy 0.62389 (0.62330)	Top-1 acc 62.109 (61.581)	Top-5 acc 82.031 (82.373)	lr 0.01049
Train [67][560/3239]	Time 0.256 (0.612)	Data Time 0.001 (0.091)	Loss 2.5573 (2.5862)	Entropy 0.62394 (0.62331)	Top-1 acc 60.938 (61.604)	Top-5 acc 83.594 (82.397)	lr 0.01049
Train [67][570/3239]	Time 0.246 (0.609)	Data Time 0.001 (0.090)	Loss 2.5422 (2.5854)	Entropy 0.62403 (0.62333)	Top-1 acc 59.766 (61.611)	Top-5 acc 84.375 (82.417)	lr 0.01049
Train [67][580/3239]	Time 0.258 (0.606)	Data Time 0.001 (0.088)	Loss 2.7563 (2.5851)	Entropy 0.62383 (0.62334)	Top-1 acc 57.812 (61.623)	Top-5 acc 80.469 (82.417)	lr 0.01049
Train [67][590/3239]	Time 0.236 (0.603)	Data Time 0.001 (0.087)	Loss 2.7055 (2.5851)	Entropy 0.62345 (0.62334)	Top-1 acc 58.203 (61.620)	Top-5 acc 80.469 (82.415)	lr 0.01049
Train [67][600/3239]	Time 0.243 (0.600)	Data Time 0.001 (0.085)	Loss 2.4626 (2.5840)	Entropy 0.62381 (0.62335)	Top-1 acc 66.797 (61.643)	Top-5 acc 85.156 (82.432)	lr 0.01048
Train [67][610/3239]	Time 0.335 (0.598)	Data Time 0.001 (0.084)	Loss 2.4880 (2.5848)	Entropy 0.62379 (0.62335)	Top-1 acc 64.453 (61.625)	Top-5 acc 81.250 (82.414)	lr 0.01048
Train [67][620/3239]	Time 0.245 (0.598)	Data Time 0.001 (0.085)	Loss 2.9662 (2.5857)	Entropy 0.62394 (0.62336)	Top-1 acc 53.125 (61.616)	Top-5 acc 73.438 (82.392)	lr 0.01048
Train [67][630/3239]	Time 0.257 (0.595)	Data Time 0.002 (0.084)	Loss 2.4494 (2.5859)	Entropy 0.62390 (0.62337)	Top-1 acc 64.844 (61.631)	Top-5 acc 82.812 (82.380)	lr 0.01048
Train [67][640/3239]	Time 0.602 (0.594)	Data Time 0.322 (0.083)	Loss 2.5893 (2.5856)	Entropy 0.62387 (0.62338)	Top-1 acc 59.766 (61.661)	Top-5 acc 78.906 (82.383)	lr 0.01048
Train [67][650/3239]	Time 0.238 (0.599)	Data Time 0.001 (0.089)	Loss 2.6681 (2.5868)	Entropy 0.62362 (0.62338)	Top-1 acc 56.641 (61.623)	Top-5 acc 82.812 (82.363)	lr 0.01048
Train [67][660/3239]	Time 0.238 (0.597)	Data Time 0.001 (0.088)	Loss 2.6041 (2.5867)	Entropy 0.62366 (0.62339)	Top-1 acc 60.938 (61.638)	Top-5 acc 83.984 (82.366)	lr 0.01048
Train [67][670/3239]	Time 0.256 (0.594)	Data Time 0.001 (0.086)	Loss 2.4485 (2.5860)	Entropy 0.62342 (0.62339)	Top-1 acc 66.406 (61.656)	Top-5 acc 83.984 (82.374)	lr 0.01048
Train [67][680/3239]	Time 0.242 (0.593)	Data Time 0.001 (0.086)	Loss 2.6513 (2.5859)	Entropy 0.62346 (0.62339)	Top-1 acc 59.766 (61.652)	Top-5 acc 80.469 (82.373)	lr 0.01048
Train [67][690/3239]	Time 0.249 (0.591)	Data Time 0.001 (0.086)	Loss 2.5594 (2.5861)	Entropy 0.62358 (0.62339)	Top-1 acc 64.453 (61.649)	Top-5 acc 81.250 (82.363)	lr 0.01048
Train [67][700/3239]	Time 0.238 (0.589)	Data Time 0.001 (0.085)	Loss 2.5211 (2.5863)	Entropy 0.62347 (0.62339)	Top-1 acc 61.719 (61.646)	Top-5 acc 86.328 (82.362)	lr 0.01047
Train [67][710/3239]	Time 0.248 (0.593)	Data Time 0.001 (0.090)	Loss 2.5257 (2.5860)	Entropy 0.62377 (0.62340)	Top-1 acc 64.062 (61.662)	Top-5 acc 83.203 (82.359)	lr 0.01047
Train [67][720/3239]	Time 0.257 (0.592)	Data Time 0.001 (0.090)	Loss 2.8302 (2.5859)	Entropy 0.62375 (0.62340)	Top-1 acc 54.688 (61.645)	Top-5 acc 77.344 (82.361)	lr 0.01047
Train [67][730/3239]	Time 0.279 (0.590)	Data Time 0.003 (0.089)	Loss 2.6044 (2.5867)	Entropy 0.62391 (0.62341)	Top-1 acc 60.938 (61.617)	Top-5 acc 83.594 (82.344)	lr 0.01047
Train [67][740/3239]	Time 0.246 (0.588)	Data Time 0.001 (0.088)	Loss 2.6142 (2.5856)	Entropy 0.62389 (0.62341)	Top-1 acc 62.500 (61.639)	Top-5 acc 80.859 (82.377)	lr 0.01047
Train [67][750/3239]	Time 0.243 (0.589)	Data Time 0.001 (0.090)	Loss 2.6223 (2.5856)	Entropy 0.62372 (0.62342)	Top-1 acc 57.422 (61.637)	Top-5 acc 84.375 (82.383)	lr 0.01047
Train [67][760/3239]	Time 0.247 (0.587)	Data Time 0.001 (0.088)	Loss 2.3415 (2.5859)	Entropy 0.62389 (0.62342)	Top-1 acc 66.016 (61.633)	Top-5 acc 86.719 (82.371)	lr 0.01047
Train [67][770/3239]	Time 0.342 (0.586)	Data Time 0.002 (0.088)	Loss 2.3570 (2.5862)	Entropy 0.62363 (0.62343)	Top-1 acc 68.359 (61.639)	Top-5 acc 87.109 (82.377)	lr 0.01047
Train [67][780/3239]	Time 0.245 (0.585)	Data Time 0.001 (0.087)	Loss 2.6152 (2.5870)	Entropy 0.62332 (0.62343)	Top-1 acc 61.719 (61.608)	Top-5 acc 82.031 (82.361)	lr 0.01047
Train [67][790/3239]	Time 0.256 (0.583)	Data Time 0.002 (0.087)	Loss 2.7262 (2.5875)	Entropy 0.62325 (0.62343)	Top-1 acc 58.984 (61.605)	Top-5 acc 78.906 (82.357)	lr 0.01047
Train [67][800/3239]	Time 0.269 (0.587)	Data Time 0.001 (0.092)	Loss 2.4885 (2.5873)	Entropy 0.62307 (0.62343)	Top-1 acc 65.234 (61.613)	Top-5 acc 83.203 (82.360)	lr 0.01046
Train [67][810/3239]	Time 0.246 (0.585)	Data Time 0.001 (0.091)	Loss 2.5402 (2.5869)	Entropy 0.62309 (0.62342)	Top-1 acc 64.062 (61.619)	Top-5 acc 82.812 (82.374)	lr 0.01046
Train [67][820/3239]	Time 0.294 (0.587)	Data Time 0.001 (0.093)	Loss 2.5630 (2.5872)	Entropy 0.62307 (0.62342)	Top-1 acc 62.109 (61.612)	Top-5 acc 82.031 (82.366)	lr 0.01046
Train [67][830/3239]	Time 0.244 (0.585)	Data Time 0.001 (0.092)	Loss 2.7106 (2.5870)	Entropy 0.62310 (0.62341)	Top-1 acc 55.469 (61.613)	Top-5 acc 82.031 (82.373)	lr 0.01046
Train [67][840/3239]	Time 0.340 (0.588)	Data Time 0.001 (0.095)	Loss 2.4933 (2.5869)	Entropy 0.62320 (0.62341)	Top-1 acc 67.578 (61.632)	Top-5 acc 83.203 (82.381)	lr 0.01046
Train [67][850/3239]	Time 0.280 (0.587)	Data Time 0.001 (0.095)	Loss 2.5033 (2.5866)	Entropy 0.62305 (0.62341)	Top-1 acc 66.016 (61.647)	Top-5 acc 83.594 (82.386)	lr 0.01046
Train [67][860/3239]	Time 0.257 (0.586)	Data Time 0.001 (0.094)	Loss 2.6169 (2.5867)	Entropy 0.62300 (0.62340)	Top-1 acc 64.062 (61.647)	Top-5 acc 80.469 (82.378)	lr 0.01046
Train [67][870/3239]	Time 0.301 (0.585)	Data Time 0.002 (0.094)	Loss 2.5181 (2.5867)	Entropy 0.62333 (0.62340)	Top-1 acc 65.234 (61.646)	Top-5 acc 86.328 (82.377)	lr 0.01046
Train [67][880/3239]	Time 0.234 (0.585)	Data Time 0.001 (0.095)	Loss 2.7957 (2.5874)	Entropy 0.62371 (0.62340)	Top-1 acc 58.594 (61.623)	Top-5 acc 76.953 (82.361)	lr 0.01046
Train [67][890/3239]	Time 0.231 (0.583)	Data Time 0.001 (0.094)	Loss 2.9187 (2.5881)	Entropy 0.62393 (0.62340)	Top-1 acc 51.562 (61.611)	Top-5 acc 76.953 (82.360)	lr 0.01046
Train [67][900/3239]	Time 3.070 (0.586)	Data Time 2.818 (0.098)	Loss 2.6163 (2.5885)	Entropy 0.62408 (0.62341)	Top-1 acc 62.109 (61.586)	Top-5 acc 83.594 (82.357)	lr 0.01045
Train [67][910/3239]	Time 0.249 (0.585)	Data Time 0.001 (0.096)	Loss 2.5767 (2.5889)	Entropy 0.62380 (0.62342)	Top-1 acc 65.234 (61.570)	Top-5 acc 82.812 (82.346)	lr 0.01045
Train [67][920/3239]	Time 0.260 (0.584)	Data Time 0.002 (0.096)	Loss 2.4566 (2.5886)	Entropy 0.62385 (0.62342)	Top-1 acc 61.719 (61.569)	Top-5 acc 85.938 (82.360)	lr 0.01045
Train [67][930/3239]	Time 0.342 (0.582)	Data Time 0.001 (0.095)	Loss 2.4815 (2.5882)	Entropy 0.62373 (0.62342)	Top-1 acc 61.328 (61.569)	Top-5 acc 83.984 (82.374)	lr 0.01045
Train [67][940/3239]	Time 0.286 (0.585)	Data Time 0.001 (0.098)	Loss 2.7710 (2.5879)	Entropy 0.62346 (0.62343)	Top-1 acc 53.125 (61.571)	Top-5 acc 80.469 (82.386)	lr 0.01045
Train [67][950/3239]	Time 0.231 (0.583)	Data Time 0.001 (0.097)	Loss 2.7720 (2.5890)	Entropy 0.62322 (0.62343)	Top-1 acc 55.469 (61.556)	Top-5 acc 77.344 (82.365)	lr 0.01045
Train [67][960/3239]	Time 0.220 (0.583)	Data Time 0.001 (0.098)	Loss 2.7757 (2.5892)	Entropy 0.62362 (0.62343)	Top-1 acc 53.125 (61.548)	Top-5 acc 81.641 (82.373)	lr 0.01045
Train [67][970/3239]	Time 0.374 (0.628)	Data Time 0.006 (0.099)	Loss 2.6439 (2.5892)	Entropy 0.62373 (0.62343)	Top-1 acc 61.328 (61.558)	Top-5 acc 80.859 (82.374)	lr 0.01045
Train [67][980/3239]	Time 0.235 (0.627)	Data Time 0.002 (0.098)	Loss 2.5526 (2.5887)	Entropy 0.62369 (0.62343)	Top-1 acc 62.891 (61.563)	Top-5 acc 81.250 (82.382)	lr 0.01045
Train [67][990/3239]	Time 0.240 (0.625)	Data Time 0.001 (0.098)	Loss 2.5704 (2.5884)	Entropy 0.62370 (0.62343)	Top-1 acc 62.891 (61.566)	Top-5 acc 82.031 (82.388)	lr 0.01045
Train [67][1000/3239]	Time 0.339 (0.623)	Data Time 0.002 (0.097)	Loss 2.5795 (2.5883)	Entropy 0.62396 (0.62344)	Top-1 acc 60.547 (61.568)	Top-5 acc 81.641 (82.381)	lr 0.01044
Train [67][1010/3239]	Time 0.236 (0.621)	Data Time 0.001 (0.096)	Loss 2.6209 (2.5880)	Entropy 0.62405 (0.62344)	Top-1 acc 60.547 (61.572)	Top-5 acc 82.422 (82.383)	lr 0.01044
Train [67][1020/3239]	Time 0.290 (0.619)	Data Time 0.004 (0.095)	Loss 2.5791 (2.5883)	Entropy 0.62412 (0.62345)	Top-1 acc 61.328 (61.559)	Top-5 acc 83.984 (82.379)	lr 0.01044
Train [67][1030/3239]	Time 0.271 (0.618)	Data Time 0.002 (0.094)	Loss 2.5987 (2.5886)	Entropy 0.62390 (0.62346)	Top-1 acc 60.547 (61.544)	Top-5 acc 82.422 (82.379)	lr 0.01044
Train [67][1040/3239]	Time 0.238 (0.616)	Data Time 0.001 (0.093)	Loss 2.5765 (2.5882)	Entropy 0.62398 (0.62346)	Top-1 acc 60.547 (61.551)	Top-5 acc 81.641 (82.388)	lr 0.01044
Train [67][1050/3239]	Time 0.221 (0.615)	Data Time 0.001 (0.092)	Loss 3.0877 (2.5892)	Entropy 0.62386 (0.62347)	Top-1 acc 44.922 (61.526)	Top-5 acc 74.219 (82.370)	lr 0.01044
Train [67][1060/3239]	Time 0.261 (0.613)	Data Time 0.001 (0.091)	Loss 2.5996 (2.5895)	Entropy 0.62383 (0.62347)	Top-1 acc 60.547 (61.507)	Top-5 acc 82.031 (82.369)	lr 0.01044
Train [67][1070/3239]	Time 0.251 (0.611)	Data Time 0.001 (0.090)	Loss 2.4443 (2.5889)	Entropy 0.62353 (0.62347)	Top-1 acc 65.625 (61.527)	Top-5 acc 85.938 (82.386)	lr 0.01044
Train [67][1080/3239]	Time 0.298 (0.610)	Data Time 0.002 (0.090)	Loss 2.6317 (2.5889)	Entropy 0.62366 (0.62347)	Top-1 acc 63.672 (61.531)	Top-5 acc 80.469 (82.388)	lr 0.01044
Train [67][1090/3239]	Time 0.335 (0.608)	Data Time 0.001 (0.089)	Loss 2.5423 (2.5888)	Entropy 0.62367 (0.62347)	Top-1 acc 62.109 (61.538)	Top-5 acc 82.422 (82.393)	lr 0.01044
Train [67][1100/3239]	Time 0.242 (0.609)	Data Time 0.001 (0.089)	Loss 2.4802 (2.5882)	Entropy 0.62346 (0.62347)	Top-1 acc 63.672 (61.557)	Top-5 acc 83.594 (82.400)	lr 0.01043
Train [67][1110/3239]	Time 0.260 (0.610)	Data Time 0.002 (0.091)	Loss 2.5657 (2.5884)	Entropy 0.62302 (0.62347)	Top-1 acc 61.328 (61.552)	Top-5 acc 85.156 (82.393)	lr 0.01043
Train [67][1120/3239]	Time 0.256 (0.612)	Data Time 0.001 (0.094)	Loss 2.4210 (2.5882)	Entropy 0.62311 (0.62347)	Top-1 acc 65.234 (61.562)	Top-5 acc 87.500 (82.395)	lr 0.01043
Train [67][1130/3239]	Time 0.240 (0.610)	Data Time 0.001 (0.093)	Loss 2.5649 (2.5883)	Entropy 0.62306 (0.62346)	Top-1 acc 61.328 (61.556)	Top-5 acc 82.812 (82.389)	lr 0.01043
Train [67][1140/3239]	Time 0.254 (0.612)	Data Time 0.002 (0.095)	Loss 2.6253 (2.5883)	Entropy 0.62254 (0.62346)	Top-1 acc 59.766 (61.566)	Top-5 acc 80.859 (82.390)	lr 0.01043
Train [67][1150/3239]	Time 0.217 (0.611)	Data Time 0.001 (0.096)	Loss 2.8292 (2.5886)	Entropy 0.62251 (0.62345)	Top-1 acc 56.641 (61.558)	Top-5 acc 78.125 (82.383)	lr 0.01043
Train [67][1160/3239]	Time 0.313 (0.610)	Data Time 0.001 (0.095)	Loss 2.7151 (2.5891)	Entropy 0.62258 (0.62344)	Top-1 acc 58.984 (61.549)	Top-5 acc 81.250 (82.370)	lr 0.01043
Train [67][1170/3239]	Time 0.251 (0.611)	Data Time 0.001 (0.097)	Loss 2.7328 (2.5890)	Entropy 0.62250 (0.62343)	Top-1 acc 58.203 (61.556)	Top-5 acc 79.688 (82.370)	lr 0.01043
Train [67][1180/3239]	Time 0.233 (0.612)	Data Time 0.001 (0.099)	Loss 2.4947 (2.5887)	Entropy 0.62263 (0.62343)	Top-1 acc 61.719 (61.565)	Top-5 acc 83.594 (82.373)	lr 0.01043
Train [67][1190/3239]	Time 0.492 (0.611)	Data Time 0.194 (0.098)	Loss 2.5158 (2.5886)	Entropy 0.62221 (0.62342)	Top-1 acc 60.938 (61.566)	Top-5 acc 81.250 (82.370)	lr 0.01043
Train [67][1200/3239]	Time 0.229 (0.612)	Data Time 0.001 (0.100)	Loss 2.7078 (2.5885)	Entropy 0.62210 (0.62341)	Top-1 acc 57.031 (61.564)	Top-5 acc 80.078 (82.374)	lr 0.01042
Train [67][1210/3239]	Time 0.237 (0.613)	Data Time 0.001 (0.102)	Loss 2.5946 (2.5888)	Entropy 0.62203 (0.62340)	Top-1 acc 60.156 (61.556)	Top-5 acc 81.641 (82.362)	lr 0.01042
Train [67][1220/3239]	Time 0.241 (0.612)	Data Time 0.001 (0.101)	Loss 2.7406 (2.5891)	Entropy 0.62196 (0.62339)	Top-1 acc 59.375 (61.549)	Top-5 acc 78.906 (82.359)	lr 0.01042
Train [67][1230/3239]	Time 0.243 (0.613)	Data Time 0.001 (0.103)	Loss 2.4519 (2.5892)	Entropy 0.62199 (0.62337)	Top-1 acc 64.062 (61.541)	Top-5 acc 86.328 (82.353)	lr 0.01042
Train [67][1240/3239]	Time 0.257 (0.612)	Data Time 0.001 (0.102)	Loss 2.7072 (2.5896)	Entropy 0.62208 (0.62336)	Top-1 acc 57.031 (61.536)	Top-5 acc 80.859 (82.347)	lr 0.01042
Train [67][1250/3239]	Time 0.273 (0.613)	Data Time 0.001 (0.104)	Loss 2.3205 (2.5893)	Entropy 0.62200 (0.62335)	Top-1 acc 70.703 (61.548)	Top-5 acc 85.547 (82.350)	lr 0.01042
Train [67][1260/3239]	Time 0.239 (0.615)	Data Time 0.001 (0.107)	Loss 2.2849 (2.5895)	Entropy 0.62203 (0.62334)	Top-1 acc 66.406 (61.542)	Top-5 acc 86.719 (82.347)	lr 0.01042
Train [67][1270/3239]	Time 0.273 (0.614)	Data Time 0.001 (0.106)	Loss 2.4280 (2.5892)	Entropy 0.62202 (0.62333)	Top-1 acc 66.016 (61.548)	Top-5 acc 84.766 (82.351)	lr 0.01042
Train [67][1280/3239]	Time 0.229 (0.615)	Data Time 0.001 (0.108)	Loss 2.7873 (2.5897)	Entropy 0.62206 (0.62332)	Top-1 acc 55.469 (61.543)	Top-5 acc 79.688 (82.341)	lr 0.01042
Train [67][1290/3239]	Time 0.260 (0.616)	Data Time 0.002 (0.109)	Loss 2.4137 (2.5894)	Entropy 0.62212 (0.62331)	Top-1 acc 62.109 (61.549)	Top-5 acc 88.672 (82.350)	lr 0.01042
Train [67][1300/3239]	Time 0.255 (0.616)	Data Time 0.001 (0.110)	Loss 2.5384 (2.5896)	Entropy 0.62204 (0.62330)	Top-1 acc 60.547 (61.544)	Top-5 acc 84.375 (82.355)	lr 0.01041
Train [67][1310/3239]	Time 0.247 (0.615)	Data Time 0.001 (0.109)	Loss 2.5586 (2.5890)	Entropy 0.62196 (0.62329)	Top-1 acc 58.984 (61.555)	Top-5 acc 83.984 (82.371)	lr 0.01041
Train [67][1320/3239]	Time 0.355 (0.617)	Data Time 0.001 (0.112)	Loss 2.5864 (2.5890)	Entropy 0.62174 (0.62328)	Top-1 acc 56.641 (61.548)	Top-5 acc 81.250 (82.371)	lr 0.01041
Train [67][1330/3239]	Time 0.249 (0.616)	Data Time 0.001 (0.112)	Loss 2.5977 (2.5889)	Entropy 0.62192 (0.62327)	Top-1 acc 57.812 (61.549)	Top-5 acc 84.375 (82.379)	lr 0.01041
Train [67][1340/3239]	Time 0.268 (0.617)	Data Time 0.002 (0.113)	Loss 2.6646 (2.5887)	Entropy 0.62178 (0.62326)	Top-1 acc 59.766 (61.561)	Top-5 acc 81.250 (82.382)	lr 0.01041
Train [67][1350/3239]	Time 2.396 (0.617)	Data Time 2.146 (0.114)	Loss 2.5125 (2.5883)	Entropy 0.62188 (0.62325)	Top-1 acc 64.062 (61.568)	Top-5 acc 84.375 (82.391)	lr 0.01041
Train [67][1360/3239]	Time 0.248 (0.618)	Data Time 0.001 (0.115)	Loss 2.5175 (2.5879)	Entropy 0.62213 (0.62324)	Top-1 acc 62.500 (61.571)	Top-5 acc 83.594 (82.397)	lr 0.01041
Train [67][1370/3239]	Time 2.649 (0.618)	Data Time 2.395 (0.116)	Loss 2.5826 (2.5877)	Entropy 0.62196 (0.62323)	Top-1 acc 61.719 (61.576)	Top-5 acc 82.031 (82.402)	lr 0.01041
Train [67][1380/3239]	Time 0.261 (0.617)	Data Time 0.002 (0.115)	Loss 2.6881 (2.5882)	Entropy 0.62199 (0.62322)	Top-1 acc 60.938 (61.567)	Top-5 acc 80.859 (82.390)	lr 0.01041
Train [67][1390/3239]	Time 0.339 (0.618)	Data Time 0.001 (0.118)	Loss 2.5791 (2.5883)	Entropy 0.62172 (0.62321)	Top-1 acc 64.062 (61.568)	Top-5 acc 83.203 (82.386)	lr 0.01041
Train [67][1400/3239]	Time 0.259 (0.618)	Data Time 0.001 (0.117)	Loss 2.5948 (2.5883)	Entropy 0.62216 (0.62321)	Top-1 acc 60.156 (61.564)	Top-5 acc 81.641 (82.383)	lr 0.01041
Train [67][1410/3239]	Time 0.244 (0.619)	Data Time 0.002 (0.120)	Loss 2.4657 (2.5885)	Entropy 0.62237 (0.62320)	Top-1 acc 64.062 (61.557)	Top-5 acc 83.203 (82.379)	lr 0.01040
Train [67][1420/3239]	Time 0.249 (0.620)	Data Time 0.001 (0.120)	Loss 2.5184 (2.5886)	Entropy 0.62229 (0.62319)	Top-1 acc 63.281 (61.556)	Top-5 acc 83.203 (82.376)	lr 0.01040
Train [67][1430/3239]	Time 0.249 (0.623)	Data Time 0.001 (0.124)	Loss 2.3346 (2.5886)	Entropy 0.62199 (0.62318)	Top-1 acc 65.625 (61.552)	Top-5 acc 87.109 (82.379)	lr 0.01040
Train [67][1440/3239]	Time 0.241 (0.622)	Data Time 0.001 (0.123)	Loss 2.5819 (2.5887)	Entropy 0.62198 (0.62318)	Top-1 acc 62.891 (61.556)	Top-5 acc 81.250 (82.375)	lr 0.01040
Train [67][1450/3239]	Time 0.441 (0.621)	Data Time 0.189 (0.124)	Loss 2.6545 (2.5884)	Entropy 0.62182 (0.62317)	Top-1 acc 60.547 (61.561)	Top-5 acc 80.469 (82.377)	lr 0.01040
Train [67][1460/3239]	Time 0.251 (0.624)	Data Time 0.001 (0.127)	Loss 2.6208 (2.5884)	Entropy 0.62162 (0.62316)	Top-1 acc 60.547 (61.562)	Top-5 acc 83.203 (82.383)	lr 0.01040
Train [67][1470/3239]	Time 0.255 (0.623)	Data Time 0.001 (0.126)	Loss 2.6471 (2.5883)	Entropy 0.62184 (0.62315)	Top-1 acc 61.328 (61.560)	Top-5 acc 78.516 (82.387)	lr 0.01040
Train [67][1480/3239]	Time 0.330 (0.622)	Data Time 0.001 (0.125)	Loss 2.7837 (2.5883)	Entropy 0.62171 (0.62314)	Top-1 acc 58.594 (61.559)	Top-5 acc 76.562 (82.384)	lr 0.01040
Train [67][1490/3239]	Time 0.257 (0.622)	Data Time 0.002 (0.126)	Loss 2.4571 (2.5879)	Entropy 0.62157 (0.62313)	Top-1 acc 62.891 (61.571)	Top-5 acc 87.500 (82.395)	lr 0.01040
Train [67][1500/3239]	Time 0.257 (0.624)	Data Time 0.001 (0.128)	Loss 2.7711 (2.5883)	Entropy 0.62158 (0.62312)	Top-1 acc 60.938 (61.559)	Top-5 acc 76.172 (82.382)	lr 0.01040
Train [67][1510/3239]	Time 1.400 (0.623)	Data Time 1.138 (0.128)	Loss 2.3379 (2.5878)	Entropy 0.62190 (0.62311)	Top-1 acc 68.750 (61.569)	Top-5 acc 86.719 (82.388)	lr 0.01039
Train [67][1520/3239]	Time 0.232 (0.623)	Data Time 0.001 (0.128)	Loss 2.4843 (2.5878)	Entropy 0.62192 (0.62310)	Top-1 acc 62.109 (61.570)	Top-5 acc 84.766 (82.385)	lr 0.01039
Train [67][1530/3239]	Time 0.234 (0.626)	Data Time 0.001 (0.132)	Loss 2.5881 (2.5878)	Entropy 0.62169 (0.62309)	Top-1 acc 60.156 (61.573)	Top-5 acc 81.641 (82.381)	lr 0.01039
Train [67][1540/3239]	Time 0.224 (0.625)	Data Time 0.001 (0.131)	Loss 2.5985 (2.5881)	Entropy 0.62168 (0.62308)	Top-1 acc 61.328 (61.565)	Top-5 acc 83.594 (82.375)	lr 0.01039
Train [67][1550/3239]	Time 0.339 (0.627)	Data Time 0.001 (0.133)	Loss 2.5951 (2.5884)	Entropy 0.62154 (0.62307)	Top-1 acc 60.938 (61.556)	Top-5 acc 81.250 (82.367)	lr 0.01039
Train [67][1560/3239]	Time 0.267 (0.629)	Data Time 0.001 (0.136)	Loss 2.5756 (2.5883)	Entropy 0.62162 (0.62307)	Top-1 acc 62.109 (61.555)	Top-5 acc 79.297 (82.366)	lr 0.01039
Train [67][1570/3239]	Time 0.260 (0.629)	Data Time 0.001 (0.136)	Loss 2.6792 (2.5883)	Entropy 0.62144 (0.62306)	Top-1 acc 57.031 (61.559)	Top-5 acc 82.031 (82.371)	lr 0.01039
Train [67][1580/3239]	Time 0.234 (0.630)	Data Time 0.001 (0.138)	Loss 2.5717 (2.5887)	Entropy 0.62119 (0.62304)	Top-1 acc 60.156 (61.544)	Top-5 acc 85.156 (82.368)	lr 0.01039
Train [67][1590/3239]	Time 0.227 (0.631)	Data Time 0.002 (0.140)	Loss 2.7601 (2.5889)	Entropy 0.62102 (0.62303)	Top-1 acc 56.641 (61.538)	Top-5 acc 79.688 (82.365)	lr 0.01039
Train [67][1600/3239]	Time 0.231 (0.632)	Data Time 0.001 (0.141)	Loss 2.7687 (2.5891)	Entropy 0.62089 (0.62302)	Top-1 acc 55.859 (61.539)	Top-5 acc 79.297 (82.359)	lr 0.01039
Train [67][1610/3239]	Time 7.322 (0.636)	Data Time 7.080 (0.146)	Loss 2.6219 (2.5889)	Entropy 0.62081 (0.62301)	Top-1 acc 60.156 (61.546)	Top-5 acc 83.984 (82.364)	lr 0.01038
Train [67][1620/3239]	Time 0.245 (0.635)	Data Time 0.001 (0.145)	Loss 2.6589 (2.5894)	Entropy 0.62082 (0.62299)	Top-1 acc 60.938 (61.536)	Top-5 acc 81.250 (82.353)	lr 0.01038
Train [67][1630/3239]	Time 0.246 (0.661)	Data Time 0.002 (0.144)	Loss 2.5079 (2.5892)	Entropy 0.62095 (0.62298)	Top-1 acc 64.844 (61.541)	Top-5 acc 83.203 (82.356)	lr 0.01038
Train [67][1640/3239]	Time 0.320 (0.659)	Data Time 0.001 (0.143)	Loss 2.7815 (2.5896)	Entropy 0.62066 (0.62297)	Top-1 acc 53.906 (61.525)	Top-5 acc 76.953 (82.346)	lr 0.01038
Train [67][1650/3239]	Time 0.235 (0.658)	Data Time 0.001 (0.142)	Loss 2.5964 (2.5897)	Entropy 0.62037 (0.62295)	Top-1 acc 62.500 (61.524)	Top-5 acc 84.375 (82.341)	lr 0.01038
Train [67][1660/3239]	Time 0.248 (0.656)	Data Time 0.001 (0.141)	Loss 2.6968 (2.5899)	Entropy 0.62027 (0.62294)	Top-1 acc 57.812 (61.523)	Top-5 acc 82.031 (82.337)	lr 0.01038
Train [67][1670/3239]	Time 0.238 (0.655)	Data Time 0.001 (0.141)	Loss 2.5716 (2.5897)	Entropy 0.62016 (0.62292)	Top-1 acc 64.062 (61.530)	Top-5 acc 78.125 (82.340)	lr 0.01038
Train [67][1680/3239]	Time 0.252 (0.654)	Data Time 0.001 (0.140)	Loss 2.5792 (2.5897)	Entropy 0.61996 (0.62290)	Top-1 acc 63.672 (61.532)	Top-5 acc 82.812 (82.336)	lr 0.01038
Train [67][1690/3239]	Time 0.243 (0.652)	Data Time 0.001 (0.139)	Loss 2.4181 (2.5895)	Entropy 0.61999 (0.62289)	Top-1 acc 62.891 (61.531)	Top-5 acc 83.594 (82.338)	lr 0.01038
Train [67][1700/3239]	Time 0.370 (0.651)	Data Time 0.129 (0.138)	Loss 2.7469 (2.5898)	Entropy 0.62027 (0.62287)	Top-1 acc 55.469 (61.522)	Top-5 acc 78.125 (82.331)	lr 0.01038
Train [67][1710/3239]	Time 0.355 (0.651)	Data Time 0.001 (0.139)	Loss 2.4972 (2.5896)	Entropy 0.62016 (0.62285)	Top-1 acc 64.453 (61.528)	Top-5 acc 87.109 (82.334)	lr 0.01037
Train [67][1720/3239]	Time 0.240 (0.650)	Data Time 0.001 (0.138)	Loss 2.8814 (2.5899)	Entropy 0.62003 (0.62284)	Top-1 acc 54.297 (61.521)	Top-5 acc 76.953 (82.329)	lr 0.01037
Train [67][1730/3239]	Time 0.236 (0.655)	Data Time 0.001 (0.144)	Loss 2.7922 (2.5904)	Entropy 0.61953 (0.62282)	Top-1 acc 55.469 (61.505)	Top-5 acc 80.859 (82.325)	lr 0.01037
Train [67][1740/3239]	Time 0.251 (0.655)	Data Time 0.001 (0.144)	Loss 2.8131 (2.5906)	Entropy 0.61954 (0.62280)	Top-1 acc 55.469 (61.502)	Top-5 acc 76.953 (82.327)	lr 0.01037
Train [67][1750/3239]	Time 0.258 (0.655)	Data Time 0.001 (0.144)	Loss 2.2914 (2.5907)	Entropy 0.61954 (0.62278)	Top-1 acc 70.312 (61.498)	Top-5 acc 85.156 (82.325)	lr 0.01037
Train [67][1760/3239]	Time 2.406 (0.659)	Data Time 2.121 (0.149)	Loss 2.6062 (2.5907)	Entropy 0.61966 (0.62277)	Top-1 acc 63.281 (61.500)	Top-5 acc 81.250 (82.329)	lr 0.01037
Train [67][1770/3239]	Time 0.240 (0.659)	Data Time 0.001 (0.149)	Loss 2.5502 (2.5907)	Entropy 0.61952 (0.62275)	Top-1 acc 63.281 (61.495)	Top-5 acc 84.766 (82.329)	lr 0.01037
Train [67][1780/3239]	Time 0.262 (0.659)	Data Time 0.001 (0.149)	Loss 2.6388 (2.5908)	Entropy 0.61946 (0.62273)	Top-1 acc 61.328 (61.488)	Top-5 acc 79.297 (82.328)	lr 0.01037
Train [67][1790/3239]	Time 0.232 (0.662)	Data Time 0.001 (0.153)	Loss 2.7128 (2.5911)	Entropy 0.61981 (0.62271)	Top-1 acc 59.375 (61.485)	Top-5 acc 79.688 (82.323)	lr 0.01037
Train [67][1800/3239]	Time 0.366 (0.663)	Data Time 0.001 (0.154)	Loss 2.9227 (2.5911)	Entropy 0.62009 (0.62270)	Top-1 acc 54.688 (61.487)	Top-5 acc 75.781 (82.317)	lr 0.01037
Train [67][1810/3239]	Time 0.230 (0.663)	Data Time 0.001 (0.155)	Loss 2.6532 (2.5917)	Entropy 0.61987 (0.62268)	Top-1 acc 57.422 (61.471)	Top-5 acc 80.859 (82.312)	lr 0.01036
Train [67][1820/3239]	Time 0.238 (0.665)	Data Time 0.001 (0.158)	Loss 2.9182 (2.5919)	Entropy 0.62002 (0.62267)	Top-1 acc 50.391 (61.466)	Top-5 acc 77.344 (82.311)	lr 0.01036
Train [67][1830/3239]	Time 0.275 (0.668)	Data Time 0.001 (0.161)	Loss 2.4618 (2.5917)	Entropy 0.61999 (0.62265)	Top-1 acc 67.188 (61.474)	Top-5 acc 87.500 (82.318)	lr 0.01036
Train [67][1840/3239]	Time 0.232 (0.667)	Data Time 0.001 (0.161)	Loss 2.5205 (2.5916)	Entropy 0.62004 (0.62264)	Top-1 acc 62.891 (61.477)	Top-5 acc 83.594 (82.321)	lr 0.01036
Train [67][1850/3239]	Time 3.771 (0.668)	Data Time 3.524 (0.162)	Loss 2.4517 (2.5914)	Entropy 0.62012 (0.62262)	Top-1 acc 62.891 (61.476)	Top-5 acc 85.156 (82.326)	lr 0.01036
Train [67][1860/3239]	Time 0.238 (0.673)	Data Time 0.001 (0.167)	Loss 2.3498 (2.5913)	Entropy 0.62044 (0.62261)	Top-1 acc 66.406 (61.482)	Top-5 acc 86.328 (82.328)	lr 0.01036
Train [67][1870/3239]	Time 1.749 (0.673)	Data Time 1.402 (0.167)	Loss 2.4616 (2.5911)	Entropy 0.62048 (0.62260)	Top-1 acc 59.766 (61.482)	Top-5 acc 83.984 (82.331)	lr 0.01036
Train [67][1880/3239]	Time 0.237 (0.671)	Data Time 0.001 (0.166)	Loss 2.5941 (2.5912)	Entropy 0.62074 (0.62259)	Top-1 acc 58.594 (61.479)	Top-5 acc 83.984 (82.331)	lr 0.01036
Train [67][1890/3239]	Time 0.249 (0.675)	Data Time 0.001 (0.170)	Loss 2.4305 (2.5910)	Entropy 0.62085 (0.62258)	Top-1 acc 67.969 (61.487)	Top-5 acc 83.203 (82.330)	lr 0.01036
Train [67][1900/3239]	Time 0.233 (0.673)	Data Time 0.001 (0.169)	Loss 2.7693 (2.5912)	Entropy 0.62115 (0.62257)	Top-1 acc 56.250 (61.485)	Top-5 acc 81.250 (82.326)	lr 0.01036
Train [67][1910/3239]	Time 0.248 (0.675)	Data Time 0.001 (0.171)	Loss 2.5526 (2.5912)	Entropy 0.62104 (0.62256)	Top-1 acc 62.109 (61.482)	Top-5 acc 82.422 (82.326)	lr 0.01035
Train [67][1920/3239]	Time 0.237 (0.681)	Data Time 0.001 (0.177)	Loss 2.6749 (2.5912)	Entropy 0.62118 (0.62255)	Top-1 acc 57.031 (61.479)	Top-5 acc 80.078 (82.324)	lr 0.01035
Train [67][1930/3239]	Time 0.249 (0.680)	Data Time 0.001 (0.177)	Loss 2.5491 (2.5912)	Entropy 0.62117 (0.62255)	Top-1 acc 65.234 (61.485)	Top-5 acc 82.812 (82.321)	lr 0.01035
Train [67][1940/3239]	Time 0.235 (0.680)	Data Time 0.001 (0.178)	Loss 2.8024 (2.5914)	Entropy 0.62100 (0.62254)	Top-1 acc 56.250 (61.483)	Top-5 acc 82.031 (82.318)	lr 0.01035
Train [67][1950/3239]	Time 0.229 (0.685)	Data Time 0.001 (0.182)	Loss 2.6518 (2.5912)	Entropy 0.62102 (0.62253)	Top-1 acc 58.594 (61.486)	Top-5 acc 82.031 (82.321)	lr 0.01035
Train [67][1960/3239]	Time 0.256 (0.683)	Data Time 0.001 (0.182)	Loss 2.6352 (2.5912)	Entropy 0.62100 (0.62252)	Top-1 acc 61.719 (61.486)	Top-5 acc 79.688 (82.317)	lr 0.01035
Train [67][1970/3239]	Time 0.249 (0.685)	Data Time 0.001 (0.184)	Loss 2.5952 (2.5915)	Entropy 0.62124 (0.62252)	Top-1 acc 61.328 (61.481)	Top-5 acc 83.203 (82.310)	lr 0.01035
Train [67][1980/3239]	Time 0.246 (0.690)	Data Time 0.001 (0.189)	Loss 2.8385 (2.5919)	Entropy 0.62123 (0.62251)	Top-1 acc 60.156 (61.478)	Top-5 acc 78.906 (82.302)	lr 0.01035
Train [67][1990/3239]	Time 0.246 (0.689)	Data Time 0.001 (0.188)	Loss 2.5242 (2.5917)	Entropy 0.62139 (0.62250)	Top-1 acc 60.938 (61.483)	Top-5 acc 82.812 (82.300)	lr 0.01035
Train [67][2000/3239]	Time 2.100 (0.690)	Data Time 1.850 (0.190)	Loss 2.5106 (2.5917)	Entropy 0.62118 (0.62250)	Top-1 acc 64.844 (61.487)	Top-5 acc 83.984 (82.298)	lr 0.01035
Train [67][2010/3239]	Time 0.252 (0.689)	Data Time 0.001 (0.189)	Loss 2.6289 (2.5919)	Entropy 0.62109 (0.62249)	Top-1 acc 65.234 (61.486)	Top-5 acc 78.516 (82.291)	lr 0.01034
Train [67][2020/3239]	Time 0.235 (0.695)	Data Time 0.001 (0.195)	Loss 2.6001 (2.5919)	Entropy 0.62121 (0.62249)	Top-1 acc 62.109 (61.484)	Top-5 acc 84.766 (82.292)	lr 0.01034
Train [67][2030/3239]	Time 0.351 (0.695)	Data Time 0.001 (0.196)	Loss 2.6371 (2.5917)	Entropy 0.62137 (0.62248)	Top-1 acc 59.766 (61.492)	Top-5 acc 80.859 (82.296)	lr 0.01034
Train [67][2040/3239]	Time 0.238 (0.694)	Data Time 0.001 (0.195)	Loss 2.8434 (2.5914)	Entropy 0.62144 (0.62247)	Top-1 acc 57.422 (61.496)	Top-5 acc 79.688 (82.305)	lr 0.01034
Train [67][2050/3239]	Time 0.274 (0.703)	Data Time 0.002 (0.205)	Loss 2.6484 (2.5911)	Entropy 0.62123 (0.62247)	Top-1 acc 60.938 (61.503)	Top-5 acc 77.344 (82.306)	lr 0.01034
Train [67][2060/3239]	Time 0.253 (0.702)	Data Time 0.002 (0.204)	Loss 2.3729 (2.5912)	Entropy 0.62131 (0.62246)	Top-1 acc 68.359 (61.502)	Top-5 acc 85.156 (82.304)	lr 0.01034
Train [67][2070/3239]	Time 0.237 (0.701)	Data Time 0.002 (0.203)	Loss 2.8530 (2.5913)	Entropy 0.62097 (0.62245)	Top-1 acc 57.031 (61.499)	Top-5 acc 76.562 (82.301)	lr 0.01034
Train [67][2080/3239]	Time 0.233 (0.710)	Data Time 0.001 (0.212)	Loss 2.6291 (2.5913)	Entropy 0.62109 (0.62245)	Top-1 acc 58.984 (61.495)	Top-5 acc 82.812 (82.296)	lr 0.01034
Train [67][2090/3239]	Time 0.234 (0.708)	Data Time 0.001 (0.211)	Loss 2.7185 (2.5912)	Entropy 0.62088 (0.62244)	Top-1 acc 58.984 (61.495)	Top-5 acc 82.812 (82.300)	lr 0.01034
Train [67][2100/3239]	Time 0.349 (0.707)	Data Time 0.001 (0.211)	Loss 2.4467 (2.5915)	Entropy 0.62083 (0.62243)	Top-1 acc 64.062 (61.489)	Top-5 acc 86.328 (82.294)	lr 0.01034
Train [67][2110/3239]	Time 0.228 (0.717)	Data Time 0.001 (0.220)	Loss 2.5467 (2.5909)	Entropy 0.62088 (0.62243)	Top-1 acc 63.672 (61.502)	Top-5 acc 81.250 (82.303)	lr 0.01033
Train [67][2120/3239]	Time 0.237 (0.715)	Data Time 0.001 (0.219)	Loss 2.5635 (2.5909)	Entropy 0.62122 (0.62242)	Top-1 acc 60.938 (61.496)	Top-5 acc 83.203 (82.305)	lr 0.01033
Train [67][2130/3239]	Time 0.237 (0.714)	Data Time 0.001 (0.219)	Loss 2.5693 (2.5908)	Entropy 0.62094 (0.62241)	Top-1 acc 65.234 (61.496)	Top-5 acc 81.250 (82.306)	lr 0.01033
Train [67][2140/3239]	Time 0.236 (0.724)	Data Time 0.001 (0.229)	Loss 2.8275 (2.5907)	Entropy 0.62111 (0.62241)	Top-1 acc 57.812 (61.497)	Top-5 acc 75.000 (82.307)	lr 0.01033
Train [67][2150/3239]	Time 0.222 (0.722)	Data Time 0.001 (0.227)	Loss 2.8275 (2.5907)	Entropy 0.62124 (0.62240)	Top-1 acc 57.031 (61.493)	Top-5 acc 75.781 (82.306)	lr 0.01033
Train [67][2160/3239]	Time 2.227 (0.722)	Data Time 1.987 (0.227)	Loss 2.8364 (2.5912)	Entropy 0.62101 (0.62239)	Top-1 acc 55.469 (61.483)	Top-5 acc 76.953 (82.296)	lr 0.01033
Train [67][2170/3239]	Time 0.228 (0.720)	Data Time 0.001 (0.226)	Loss 2.5136 (2.5909)	Entropy 0.62113 (0.62239)	Top-1 acc 63.672 (61.492)	Top-5 acc 82.422 (82.297)	lr 0.01033
Train [67][2180/3239]	Time 0.250 (0.728)	Data Time 0.002 (0.235)	Loss 2.5307 (2.5907)	Entropy 0.62144 (0.62238)	Top-1 acc 65.234 (61.493)	Top-5 acc 86.328 (82.301)	lr 0.01033
Train [67][2190/3239]	Time 0.336 (0.727)	Data Time 0.001 (0.234)	Loss 2.5121 (2.5908)	Entropy 0.62155 (0.62238)	Top-1 acc 63.672 (61.492)	Top-5 acc 85.156 (82.299)	lr 0.01033
Train [67][2200/3239]	Time 0.235 (0.728)	Data Time 0.001 (0.235)	Loss 2.7204 (2.5908)	Entropy 0.62145 (0.62238)	Top-1 acc 60.156 (61.494)	Top-5 acc 78.516 (82.296)	lr 0.01033
Train [67][2210/3239]	Time 0.243 (0.733)	Data Time 0.001 (0.241)	Loss 2.5348 (2.5910)	Entropy 0.62136 (0.62237)	Top-1 acc 61.719 (61.490)	Top-5 acc 83.984 (82.291)	lr 0.01032
Train [67][2220/3239]	Time 0.225 (0.732)	Data Time 0.001 (0.240)	Loss 2.5419 (2.5911)	Entropy 0.62158 (0.62237)	Top-1 acc 59.766 (61.491)	Top-5 acc 86.328 (82.293)	lr 0.01032
Train [67][2230/3239]	Time 0.257 (0.735)	Data Time 0.001 (0.243)	Loss 2.5695 (2.5913)	Entropy 0.62178 (0.62236)	Top-1 acc 60.938 (61.486)	Top-5 acc 81.641 (82.285)	lr 0.01032
Train [67][2240/3239]	Time 0.230 (0.741)	Data Time 0.001 (0.250)	Loss 2.5230 (2.5911)	Entropy 0.62180 (0.62236)	Top-1 acc 67.188 (61.492)	Top-5 acc 81.250 (82.290)	lr 0.01032
Train [67][2250/3239]	Time 0.251 (0.740)	Data Time 0.001 (0.249)	Loss 2.6641 (2.5912)	Entropy 0.62200 (0.62236)	Top-1 acc 59.766 (61.487)	Top-5 acc 81.641 (82.290)	lr 0.01032
Train [67][2260/3239]	Time 0.355 (0.741)	Data Time 0.001 (0.251)	Loss 2.6567 (2.5911)	Entropy 0.62210 (0.62236)	Top-1 acc 57.812 (61.491)	Top-5 acc 78.906 (82.289)	lr 0.01032
Train [67][2270/3239]	Time 0.239 (0.750)	Data Time 0.001 (0.259)	Loss 2.4231 (2.5912)	Entropy 0.62213 (0.62236)	Top-1 acc 66.016 (61.491)	Top-5 acc 86.328 (82.289)	lr 0.01032
Train [67][2280/3239]	Time 0.552 (0.768)	Data Time 0.081 (0.258)	Loss 2.4780 (2.5912)	Entropy 0.62236 (0.62236)	Top-1 acc 66.797 (61.490)	Top-5 acc 87.109 (82.288)	lr 0.01032
Train [67][2290/3239]	Time 0.249 (0.767)	Data Time 0.002 (0.257)	Loss 2.3893 (2.5913)	Entropy 0.62240 (0.62236)	Top-1 acc 68.750 (61.490)	Top-5 acc 83.594 (82.282)	lr 0.01032
Train [67][2300/3239]	Time 0.246 (0.765)	Data Time 0.002 (0.256)	Loss 2.6211 (2.5915)	Entropy 0.62239 (0.62236)	Top-1 acc 60.938 (61.491)	Top-5 acc 81.641 (82.279)	lr 0.01032
Train [67][2310/3239]	Time 0.254 (0.764)	Data Time 0.001 (0.255)	Loss 2.3150 (2.5912)	Entropy 0.62259 (0.62236)	Top-1 acc 65.625 (61.496)	Top-5 acc 88.672 (82.284)	lr 0.01031
Train [67][2320/3239]	Time 0.221 (0.762)	Data Time 0.001 (0.254)	Loss 2.7265 (2.5914)	Entropy 0.62291 (0.62236)	Top-1 acc 56.641 (61.490)	Top-5 acc 78.906 (82.279)	lr 0.01031
Train [67][2330/3239]	Time 0.239 (0.761)	Data Time 0.001 (0.253)	Loss 2.7586 (2.5914)	Entropy 0.62306 (0.62236)	Top-1 acc 58.594 (61.491)	Top-5 acc 80.078 (82.281)	lr 0.01031
Train [67][2340/3239]	Time 0.246 (0.766)	Data Time 0.001 (0.258)	Loss 2.4864 (2.5914)	Entropy 0.62269 (0.62236)	Top-1 acc 67.188 (61.494)	Top-5 acc 83.594 (82.278)	lr 0.01031
Train [67][2350/3239]	Time 0.402 (0.766)	Data Time 0.001 (0.259)	Loss 2.6144 (2.5914)	Entropy 0.62274 (0.62236)	Top-1 acc 62.109 (61.493)	Top-5 acc 82.031 (82.277)	lr 0.01031
Train [67][2360/3239]	Time 0.240 (0.768)	Data Time 0.001 (0.261)	Loss 2.5752 (2.5912)	Entropy 0.62290 (0.62237)	Top-1 acc 60.547 (61.501)	Top-5 acc 83.984 (82.279)	lr 0.01031
Train [67][2370/3239]	Time 0.240 (0.774)	Data Time 0.001 (0.267)	Loss 2.6485 (2.5911)	Entropy 0.62264 (0.62237)	Top-1 acc 60.156 (61.508)	Top-5 acc 81.250 (82.281)	lr 0.01031
Train [67][2380/3239]	Time 0.251 (0.774)	Data Time 0.001 (0.268)	Loss 2.5959 (2.5910)	Entropy 0.62254 (0.62237)	Top-1 acc 62.891 (61.515)	Top-5 acc 82.422 (82.281)	lr 0.01031
Train [67][2390/3239]	Time 0.237 (0.776)	Data Time 0.001 (0.270)	Loss 2.5193 (2.5910)	Entropy 0.62289 (0.62237)	Top-1 acc 60.156 (61.511)	Top-5 acc 85.547 (82.281)	lr 0.01031
Train [67][2400/3239]	Time 0.241 (0.780)	Data Time 0.001 (0.274)	Loss 2.3731 (2.5907)	Entropy 0.62255 (0.62237)	Top-1 acc 65.625 (61.519)	Top-5 acc 86.719 (82.287)	lr 0.01031
Train [67][2410/3239]	Time 6.368 (0.783)	Data Time 6.114 (0.278)	Loss 2.6381 (2.5910)	Entropy 0.62222 (0.62237)	Top-1 acc 56.641 (61.511)	Top-5 acc 81.250 (82.283)	lr 0.01030
Train [67][2420/3239]	Time 0.342 (0.783)	Data Time 0.001 (0.278)	Loss 2.5993 (2.5909)	Entropy 0.62190 (0.62237)	Top-1 acc 62.500 (61.514)	Top-5 acc 80.469 (82.283)	lr 0.01030
Train [67][2430/3239]	Time 0.237 (0.789)	Data Time 0.001 (0.284)	Loss 2.6310 (2.5909)	Entropy 0.62174 (0.62237)	Top-1 acc 58.984 (61.516)	Top-5 acc 81.641 (82.285)	lr 0.01030
Train [67][2440/3239]	Time 5.397 (0.790)	Data Time 5.134 (0.286)	Loss 2.5898 (2.5910)	Entropy 0.62205 (0.62237)	Top-1 acc 60.547 (61.515)	Top-5 acc 81.250 (82.285)	lr 0.01030
Train [67][2450/3239]	Time 0.245 (0.792)	Data Time 0.001 (0.289)	Loss 2.5786 (2.5911)	Entropy 0.62193 (0.62236)	Top-1 acc 63.672 (61.513)	Top-5 acc 80.859 (82.282)	lr 0.01030
Train [67][2460/3239]	Time 0.248 (0.797)	Data Time 0.001 (0.294)	Loss 2.3929 (2.5911)	Entropy 0.62185 (0.62236)	Top-1 acc 65.625 (61.515)	Top-5 acc 85.156 (82.281)	lr 0.01030
Train [67][2470/3239]	Time 0.241 (0.798)	Data Time 0.001 (0.295)	Loss 2.5200 (2.5914)	Entropy 0.62133 (0.62236)	Top-1 acc 64.062 (61.506)	Top-5 acc 83.984 (82.273)	lr 0.01030
Train [67][2480/3239]	Time 3.029 (0.801)	Data Time 2.777 (0.299)	Loss 2.6079 (2.5915)	Entropy 0.62135 (0.62236)	Top-1 acc 59.766 (61.500)	Top-5 acc 81.641 (82.271)	lr 0.01030
Train [67][2490/3239]	Time 0.236 (0.803)	Data Time 0.001 (0.300)	Loss 2.5041 (2.5912)	Entropy 0.62112 (0.62235)	Top-1 acc 61.719 (61.510)	Top-5 acc 84.375 (82.277)	lr 0.01030
Train [67][2500/3239]	Time 7.220 (0.805)	Data Time 6.982 (0.303)	Loss 2.6155 (2.5914)	Entropy 0.62132 (0.62235)	Top-1 acc 59.375 (61.506)	Top-5 acc 82.812 (82.276)	lr 0.01030
Train [67][2510/3239]	Time 0.332 (0.806)	Data Time 0.001 (0.304)	Loss 2.5938 (2.5915)	Entropy 0.62120 (0.62234)	Top-1 acc 64.062 (61.504)	Top-5 acc 82.422 (82.274)	lr 0.01029
Train [67][2520/3239]	Time 0.232 (0.809)	Data Time 0.001 (0.308)	Loss 2.6302 (2.5914)	Entropy 0.62135 (0.62234)	Top-1 acc 59.766 (61.507)	Top-5 acc 80.859 (82.278)	lr 0.01029
Train [67][2530/3239]	Time 0.392 (0.808)	Data Time 0.158 (0.307)	Loss 2.4809 (2.5912)	Entropy 0.62132 (0.62233)	Top-1 acc 65.234 (61.510)	Top-5 acc 83.203 (82.278)	lr 0.01029
Train [67][2540/3239]	Time 0.238 (0.812)	Data Time 0.001 (0.311)	Loss 2.5031 (2.5911)	Entropy 0.62127 (0.62233)	Top-1 acc 60.547 (61.510)	Top-5 acc 83.984 (82.283)	lr 0.01029
Train [67][2550/3239]	Time 0.228 (0.816)	Data Time 0.001 (0.315)	Loss 2.5813 (2.5910)	Entropy 0.62109 (0.62233)	Top-1 acc 61.328 (61.511)	Top-5 acc 82.031 (82.281)	lr 0.01029
Train [67][2560/3239]	Time 0.230 (0.816)	Data Time 0.001 (0.316)	Loss 2.7155 (2.5908)	Entropy 0.62097 (0.62232)	Top-1 acc 57.422 (61.515)	Top-5 acc 79.688 (82.281)	lr 0.01029
Train [67][2570/3239]	Time 0.242 (0.818)	Data Time 0.001 (0.318)	Loss 2.5793 (2.5907)	Entropy 0.62045 (0.62232)	Top-1 acc 62.500 (61.515)	Top-5 acc 83.984 (82.283)	lr 0.01029
Train [67][2580/3239]	Time 0.335 (0.817)	Data Time 0.001 (0.317)	Loss 2.6032 (2.5907)	Entropy 0.62067 (0.62231)	Top-1 acc 60.156 (61.517)	Top-5 acc 81.250 (82.283)	lr 0.01029
Train [67][2590/3239]	Time 0.228 (0.822)	Data Time 0.001 (0.322)	Loss 2.3850 (2.5904)	Entropy 0.62051 (0.62230)	Top-1 acc 66.016 (61.523)	Top-5 acc 84.766 (82.286)	lr 0.01029
Train [67][2600/3239]	Time 0.239 (0.820)	Data Time 0.001 (0.321)	Loss 2.7923 (2.5904)	Entropy 0.62037 (0.62229)	Top-1 acc 55.469 (61.522)	Top-5 acc 79.688 (82.285)	lr 0.01029
Train [67][2610/3239]	Time 1.337 (0.822)	Data Time 1.082 (0.324)	Loss 2.5369 (2.5904)	Entropy 0.62044 (0.62229)	Top-1 acc 61.719 (61.520)	Top-5 acc 81.250 (82.283)	lr 0.01028
Train [67][2620/3239]	Time 0.226 (0.827)	Data Time 0.001 (0.329)	Loss 2.6063 (2.5904)	Entropy 0.61977 (0.62228)	Top-1 acc 62.109 (61.519)	Top-5 acc 80.078 (82.281)	lr 0.01028
Train [67][2630/3239]	Time 0.258 (0.826)	Data Time 0.002 (0.328)	Loss 2.5148 (2.5904)	Entropy 0.61988 (0.62227)	Top-1 acc 62.109 (61.518)	Top-5 acc 85.938 (82.281)	lr 0.01028
Train [67][2640/3239]	Time 0.226 (0.827)	Data Time 0.001 (0.329)	Loss 2.6084 (2.5905)	Entropy 0.61961 (0.62226)	Top-1 acc 61.719 (61.514)	Top-5 acc 80.859 (82.279)	lr 0.01028
Train [67][2650/3239]	Time 0.261 (0.829)	Data Time 0.001 (0.332)	Loss 2.5232 (2.5905)	Entropy 0.61971 (0.62225)	Top-1 acc 61.719 (61.517)	Top-5 acc 81.641 (82.279)	lr 0.01028
Train [67][2660/3239]	Time 0.239 (0.830)	Data Time 0.001 (0.333)	Loss 2.5585 (2.5904)	Entropy 0.61998 (0.62224)	Top-1 acc 61.328 (61.517)	Top-5 acc 81.250 (82.280)	lr 0.01028
Train [67][2670/3239]	Time 2.484 (0.832)	Data Time 2.173 (0.336)	Loss 2.6127 (2.5905)	Entropy 0.62019 (0.62223)	Top-1 acc 60.938 (61.513)	Top-5 acc 82.031 (82.280)	lr 0.01028
Train [67][2680/3239]	Time 0.231 (0.833)	Data Time 0.001 (0.337)	Loss 2.4883 (2.5907)	Entropy 0.62003 (0.62222)	Top-1 acc 65.234 (61.511)	Top-5 acc 83.984 (82.275)	lr 0.01028
Train [67][2690/3239]	Time 0.253 (0.835)	Data Time 0.001 (0.339)	Loss 2.6289 (2.5908)	Entropy 0.62029 (0.62222)	Top-1 acc 57.812 (61.507)	Top-5 acc 83.203 (82.271)	lr 0.01028
Train [67][2700/3239]	Time 0.246 (0.837)	Data Time 0.001 (0.341)	Loss 2.6145 (2.5907)	Entropy 0.62027 (0.62221)	Top-1 acc 60.938 (61.511)	Top-5 acc 81.250 (82.272)	lr 0.01028
Train [67][2710/3239]	Time 0.224 (0.837)	Data Time 0.001 (0.342)	Loss 2.4112 (2.5908)	Entropy 0.61940 (0.62220)	Top-1 acc 66.016 (61.507)	Top-5 acc 85.938 (82.271)	lr 0.01027
Train [67][2720/3239]	Time 0.249 (0.838)	Data Time 0.001 (0.343)	Loss 2.5827 (2.5908)	Entropy 0.61947 (0.62219)	Top-1 acc 61.328 (61.503)	Top-5 acc 84.766 (82.272)	lr 0.01027
Train [67][2730/3239]	Time 6.017 (0.839)	Data Time 5.738 (0.345)	Loss 2.5785 (2.5909)	Entropy 0.61942 (0.62218)	Top-1 acc 62.500 (61.503)	Top-5 acc 80.078 (82.269)	lr 0.01027
Train [67][2740/3239]	Time 0.342 (0.839)	Data Time 0.001 (0.344)	Loss 2.5492 (2.5911)	Entropy 0.61950 (0.62217)	Top-1 acc 62.109 (61.497)	Top-5 acc 85.156 (82.265)	lr 0.01027
Train [67][2750/3239]	Time 0.260 (0.839)	Data Time 0.001 (0.345)	Loss 2.4946 (2.5911)	Entropy 0.61972 (0.62216)	Top-1 acc 66.797 (61.497)	Top-5 acc 83.594 (82.265)	lr 0.01027
Train [67][2760/3239]	Time 0.234 (0.838)	Data Time 0.001 (0.344)	Loss 2.5816 (2.5908)	Entropy 0.61993 (0.62215)	Top-1 acc 63.672 (61.507)	Top-5 acc 79.297 (82.271)	lr 0.01027
Train [67][2770/3239]	Time 1.779 (0.838)	Data Time 1.554 (0.344)	Loss 2.7071 (2.5911)	Entropy 0.62004 (0.62215)	Top-1 acc 59.766 (61.497)	Top-5 acc 79.297 (82.268)	lr 0.01027
Train [67][2780/3239]	Time 0.230 (0.838)	Data Time 0.001 (0.344)	Loss 2.4572 (2.5911)	Entropy 0.61953 (0.62214)	Top-1 acc 68.359 (61.498)	Top-5 acc 84.375 (82.267)	lr 0.01027
Train [67][2790/3239]	Time 0.246 (0.838)	Data Time 0.001 (0.345)	Loss 2.6000 (2.5911)	Entropy 0.61960 (0.62213)	Top-1 acc 61.328 (61.494)	Top-5 acc 80.859 (82.269)	lr 0.01027
Train [67][2800/3239]	Time 0.226 (0.839)	Data Time 0.001 (0.346)	Loss 2.6675 (2.5911)	Entropy 0.61977 (0.62212)	Top-1 acc 59.375 (61.490)	Top-5 acc 78.906 (82.270)	lr 0.01027
Train [67][2810/3239]	Time 0.348 (0.840)	Data Time 0.001 (0.347)	Loss 2.4561 (2.5910)	Entropy 0.62029 (0.62211)	Top-1 acc 66.406 (61.494)	Top-5 acc 82.422 (82.271)	lr 0.01026
Train [67][2820/3239]	Time 4.414 (0.842)	Data Time 4.171 (0.350)	Loss 2.6506 (2.5913)	Entropy 0.62032 (0.62211)	Top-1 acc 55.859 (61.486)	Top-5 acc 83.203 (82.265)	lr 0.01026
Train [67][2830/3239]	Time 0.251 (0.844)	Data Time 0.001 (0.352)	Loss 2.6086 (2.5912)	Entropy 0.61989 (0.62210)	Top-1 acc 61.719 (61.493)	Top-5 acc 83.594 (82.263)	lr 0.01026
Train [67][2840/3239]	Time 0.237 (0.845)	Data Time 0.001 (0.352)	Loss 2.5721 (2.5913)	Entropy 0.61965 (0.62209)	Top-1 acc 63.672 (61.494)	Top-5 acc 80.859 (82.259)	lr 0.01026
Train [67][2850/3239]	Time 0.229 (0.846)	Data Time 0.001 (0.354)	Loss 2.4759 (2.5912)	Entropy 0.61933 (0.62208)	Top-1 acc 66.797 (61.497)	Top-5 acc 83.594 (82.258)	lr 0.01026
Train [67][2860/3239]	Time 0.237 (0.847)	Data Time 0.001 (0.356)	Loss 2.6151 (2.5915)	Entropy 0.61948 (0.62207)	Top-1 acc 60.547 (61.491)	Top-5 acc 81.250 (82.253)	lr 0.01026
Train [67][2870/3239]	Time 0.241 (0.850)	Data Time 0.001 (0.359)	Loss 2.5520 (2.5916)	Entropy 0.61946 (0.62206)	Top-1 acc 62.500 (61.485)	Top-5 acc 82.031 (82.250)	lr 0.01026
Train [67][2880/3239]	Time 0.236 (0.852)	Data Time 0.001 (0.361)	Loss 2.5877 (2.5917)	Entropy 0.61901 (0.62205)	Top-1 acc 58.984 (61.482)	Top-5 acc 80.859 (82.248)	lr 0.01026
Train [67][2890/3239]	Time 0.718 (0.852)	Data Time 0.466 (0.361)	Loss 2.3700 (2.5915)	Entropy 0.61918 (0.62204)	Top-1 acc 64.453 (61.486)	Top-5 acc 84.766 (82.250)	lr 0.01026
Train [67][2900/3239]	Time 0.350 (0.852)	Data Time 0.001 (0.362)	Loss 2.6434 (2.5917)	Entropy 0.61935 (0.62203)	Top-1 acc 62.500 (61.479)	Top-5 acc 82.031 (82.247)	lr 0.01026
Train [67][2910/3239]	Time 0.258 (0.855)	Data Time 0.001 (0.365)	Loss 2.4815 (2.5916)	Entropy 0.61940 (0.62202)	Top-1 acc 63.281 (61.481)	Top-5 acc 84.766 (82.251)	lr 0.01025
Train [67][2920/3239]	Time 0.263 (0.854)	Data Time 0.001 (0.364)	Loss 2.4141 (2.5914)	Entropy 0.61941 (0.62202)	Top-1 acc 68.750 (61.483)	Top-5 acc 85.156 (82.254)	lr 0.01025
Train [67][2930/3239]	Time 0.230 (0.853)	Data Time 0.001 (0.363)	Loss 2.4601 (2.5912)	Entropy 0.61943 (0.62201)	Top-1 acc 66.406 (61.487)	Top-5 acc 83.984 (82.258)	lr 0.01025
Train [67][2940/3239]	Time 0.266 (0.868)	Data Time 0.002 (0.363)	Loss 2.7161 (2.5912)	Entropy 0.61905 (0.62200)	Top-1 acc 57.031 (61.486)	Top-5 acc 79.297 (82.257)	lr 0.01025
Train [67][2950/3239]	Time 0.244 (0.867)	Data Time 0.001 (0.362)	Loss 2.4941 (2.5915)	Entropy 0.61891 (0.62199)	Top-1 acc 62.500 (61.480)	Top-5 acc 82.812 (82.252)	lr 0.01025
Train [67][2960/3239]	Time 0.231 (0.865)	Data Time 0.001 (0.361)	Loss 2.4879 (2.5913)	Entropy 0.61866 (0.62198)	Top-1 acc 64.844 (61.489)	Top-5 acc 84.375 (82.259)	lr 0.01025
Train [67][2970/3239]	Time 0.257 (0.864)	Data Time 0.001 (0.360)	Loss 2.4942 (2.5911)	Entropy 0.61860 (0.62197)	Top-1 acc 64.844 (61.494)	Top-5 acc 82.031 (82.261)	lr 0.01025
Train [67][2980/3239]	Time 0.245 (0.862)	Data Time 0.001 (0.358)	Loss 2.6522 (2.5911)	Entropy 0.61878 (0.62195)	Top-1 acc 56.641 (61.489)	Top-5 acc 78.125 (82.261)	lr 0.01025
Train [67][2990/3239]	Time 0.262 (0.861)	Data Time 0.001 (0.357)	Loss 2.5786 (2.5912)	Entropy 0.61875 (0.62194)	Top-1 acc 60.938 (61.490)	Top-5 acc 81.250 (82.259)	lr 0.01025
Train [67][3000/3239]	Time 0.248 (0.859)	Data Time 0.001 (0.356)	Loss 2.5923 (2.5912)	Entropy 0.61877 (0.62193)	Top-1 acc 61.719 (61.488)	Top-5 acc 83.203 (82.260)	lr 0.01025
Train [67][3010/3239]	Time 0.266 (0.858)	Data Time 0.002 (0.355)	Loss 2.6057 (2.5914)	Entropy 0.61885 (0.62192)	Top-1 acc 62.109 (61.482)	Top-5 acc 82.031 (82.257)	lr 0.01024
Train [67][3020/3239]	Time 0.419 (0.858)	Data Time 0.172 (0.355)	Loss 2.3147 (2.5912)	Entropy 0.61876 (0.62191)	Top-1 acc 68.359 (61.484)	Top-5 acc 85.547 (82.263)	lr 0.01024
Train [67][3030/3239]	Time 0.245 (0.858)	Data Time 0.001 (0.355)	Loss 2.4805 (2.5914)	Entropy 0.61884 (0.62190)	Top-1 acc 67.188 (61.481)	Top-5 acc 84.375 (82.261)	lr 0.01024
Train [67][3040/3239]	Time 0.261 (0.860)	Data Time 0.002 (0.358)	Loss 2.8107 (2.5914)	Entropy 0.61858 (0.62189)	Top-1 acc 54.688 (61.479)	Top-5 acc 78.516 (82.259)	lr 0.01024
Train [67][3050/3239]	Time 0.252 (0.862)	Data Time 0.001 (0.359)	Loss 2.6588 (2.5915)	Entropy 0.61858 (0.62188)	Top-1 acc 62.500 (61.480)	Top-5 acc 81.641 (82.257)	lr 0.01024
Train [67][3060/3239]	Time 0.341 (0.862)	Data Time 0.001 (0.360)	Loss 2.7750 (2.5918)	Entropy 0.61802 (0.62187)	Top-1 acc 53.906 (61.472)	Top-5 acc 77.344 (82.251)	lr 0.01024
Train [67][3070/3239]	Time 0.226 (0.863)	Data Time 0.001 (0.361)	Loss 2.6137 (2.5917)	Entropy 0.61818 (0.62186)	Top-1 acc 65.234 (61.474)	Top-5 acc 80.859 (82.250)	lr 0.01024
Train [67][3080/3239]	Time 0.274 (0.865)	Data Time 0.003 (0.364)	Loss 2.5030 (2.5917)	Entropy 0.61822 (0.62185)	Top-1 acc 62.500 (61.474)	Top-5 acc 83.203 (82.248)	lr 0.01024
Train [67][3090/3239]	Time 0.238 (0.867)	Data Time 0.001 (0.365)	Loss 2.5192 (2.5919)	Entropy 0.61835 (0.62184)	Top-1 acc 60.547 (61.470)	Top-5 acc 84.375 (82.245)	lr 0.01024
Train [67][3100/3239]	Time 0.249 (0.866)	Data Time 0.001 (0.365)	Loss 2.6065 (2.5919)	Entropy 0.61778 (0.62182)	Top-1 acc 60.938 (61.470)	Top-5 acc 83.203 (82.248)	lr 0.01024
Train [67][3110/3239]	Time 0.235 (0.868)	Data Time 0.001 (0.367)	Loss 2.6575 (2.5919)	Entropy 0.61771 (0.62181)	Top-1 acc 62.500 (61.467)	Top-5 acc 78.125 (82.246)	lr 0.01023
Train [67][3120/3239]	Time 0.224 (0.868)	Data Time 0.001 (0.367)	Loss 2.5414 (2.5919)	Entropy 0.61774 (0.62180)	Top-1 acc 62.109 (61.468)	Top-5 acc 84.375 (82.246)	lr 0.01023
Train [67][3130/3239]	Time 2.372 (0.869)	Data Time 2.018 (0.369)	Loss 2.3644 (2.5916)	Entropy 0.61817 (0.62178)	Top-1 acc 69.922 (61.478)	Top-5 acc 85.938 (82.249)	lr 0.01023
Train [67][3140/3239]	Time 0.255 (0.872)	Data Time 0.001 (0.372)	Loss 2.5374 (2.5916)	Entropy 0.61803 (0.62177)	Top-1 acc 62.109 (61.478)	Top-5 acc 81.641 (82.249)	lr 0.01023
Train [67][3150/3239]	Time 0.232 (0.871)	Data Time 0.001 (0.371)	Loss 2.9033 (2.5917)	Entropy 0.61840 (0.62176)	Top-1 acc 52.734 (61.473)	Top-5 acc 75.781 (82.249)	lr 0.01023
Train [67][3160/3239]	Time 0.228 (0.873)	Data Time 0.001 (0.373)	Loss 2.5774 (2.5917)	Entropy 0.61837 (0.62175)	Top-1 acc 60.938 (61.474)	Top-5 acc 82.031 (82.250)	lr 0.01023
Train [67][3170/3239]	Time 0.237 (0.875)	Data Time 0.001 (0.375)	Loss 2.6583 (2.5916)	Entropy 0.61860 (0.62174)	Top-1 acc 59.766 (61.474)	Top-5 acc 80.078 (82.253)	lr 0.01023
Train [67][3180/3239]	Time 0.230 (0.874)	Data Time 0.000 (0.375)	Loss 2.4608 (2.5913)	Entropy 0.61850 (0.62173)	Top-1 acc 67.188 (61.480)	Top-5 acc 83.203 (82.258)	lr 0.01023
Train [67][3190/3239]	Time 0.263 (0.875)	Data Time 0.000 (0.377)	Loss 2.6848 (2.5912)	Entropy 0.61845 (0.62172)	Top-1 acc 56.641 (61.480)	Top-5 acc 82.812 (82.258)	lr 0.01023
Train [67][3200/3239]	Time 0.234 (0.876)	Data Time 0.000 (0.378)	Loss 2.6239 (2.5913)	Entropy 0.61846 (0.62171)	Top-1 acc 57.812 (61.477)	Top-5 acc 81.250 (82.256)	lr 0.01023
Train [67][3210/3239]	Time 0.235 (0.878)	Data Time 0.000 (0.380)	Loss 2.4060 (2.5912)	Entropy 0.61822 (0.62170)	Top-1 acc 62.891 (61.480)	Top-5 acc 85.156 (82.259)	lr 0.01023
Train [67][3220/3239]	Time 0.335 (0.878)	Data Time 0.000 (0.380)	Loss 2.4071 (2.5912)	Entropy 0.61852 (0.62169)	Top-1 acc 66.016 (61.479)	Top-5 acc 85.547 (82.256)	lr 0.01022
Train [67][3230/3239]	Time 0.226 (0.879)	Data Time 0.000 (0.381)	Loss 2.7073 (2.5912)	Entropy 0.61849 (0.62168)	Top-1 acc 60.547 (61.479)	Top-5 acc 80.859 (82.255)	lr 0.01022
Train [67][3239/3239]	Time 0.841 (0.879)	Data Time 0.000 (0.381)	Loss 2.3885 (2.5913)	Entropy 0.61818 (0.62167)	Top-1 acc 72.840 (61.478)	Top-5 acc 85.185 (82.253)	lr 0.01022
==========Valid [67/120]	loss 1.375	top-1 acc 68.558 (68.558)	top-5 acc 88.068	Train top-1 61.478	top-5 82.253	Entropy 0.61818	Latency-None: 0.000ms	Flops: 539.00M
Train [68][0/3239]	Time 44.056 (44.056)	Data Time 42.209 (42.209)	Loss 2.8124 (2.8124)	Entropy 0.61828 (0.61828)	Top-1 acc 56.250 (56.250)	Top-5 acc 80.469 (80.469)	lr 0.01022
Train [68][10/3239]	Time 0.223 (4.563)	Data Time 0.001 (3.845)	Loss 2.6412 (2.6141)	Entropy 0.61807 (0.61823)	Top-1 acc 58.594 (61.009)	Top-5 acc 79.688 (82.173)	lr 0.01022
Train [68][20/3239]	Time 0.250 (2.595)	Data Time 0.001 (2.015)	Loss 2.6146 (2.6166)	Entropy 0.61798 (0.61815)	Top-1 acc 61.719 (60.658)	Top-5 acc 82.422 (82.366)	lr 0.01022
Train [68][30/3239]	Time 0.276 (1.908)	Data Time 0.003 (1.366)	Loss 2.4497 (2.6090)	Entropy 0.61776 (0.61808)	Top-1 acc 63.672 (60.597)	Top-5 acc 86.719 (82.371)	lr 0.01022
Train [68][40/3239]	Time 0.225 (1.552)	Data Time 0.001 (1.033)	Loss 2.5651 (2.6012)	Entropy 0.61760 (0.61799)	Top-1 acc 62.891 (60.985)	Top-5 acc 82.422 (82.355)	lr 0.01022
Train [68][50/3239]	Time 0.234 (1.327)	Data Time 0.001 (0.831)	Loss 2.4696 (2.5962)	Entropy 0.61762 (0.61791)	Top-1 acc 66.016 (61.083)	Top-5 acc 82.812 (82.284)	lr 0.01022
Train [68][60/3239]	Time 0.222 (1.178)	Data Time 0.001 (0.695)	Loss 2.7254 (2.6030)	Entropy 0.61763 (0.61786)	Top-1 acc 59.766 (61.098)	Top-5 acc 80.078 (82.121)	lr 0.01022
Train [68][70/3239]	Time 0.224 (1.138)	Data Time 0.001 (0.657)	Loss 2.7791 (2.6001)	Entropy 0.61765 (0.61782)	Top-1 acc 55.078 (61.147)	Top-5 acc 78.125 (82.180)	lr 0.01022
Train [68][80/3239]	Time 0.249 (1.050)	Data Time 0.001 (0.576)	Loss 2.5599 (2.5988)	Entropy 0.61775 (0.61781)	Top-1 acc 62.891 (61.304)	Top-5 acc 82.422 (82.210)	lr 0.01021
Train [68][90/3239]	Time 0.232 (0.980)	Data Time 0.001 (0.513)	Loss 2.5474 (2.5890)	Entropy 0.61773 (0.61780)	Top-1 acc 63.281 (61.500)	Top-5 acc 84.375 (82.392)	lr 0.01021
Train [68][100/3239]	Time 1.386 (0.964)	Data Time 1.116 (0.499)	Loss 2.5216 (2.5850)	Entropy 0.61784 (0.61779)	Top-1 acc 62.109 (61.514)	Top-5 acc 83.203 (82.418)	lr 0.01021
Train [68][110/3239]	Time 0.252 (0.915)	Data Time 0.001 (0.455)	Loss 2.4399 (2.5826)	Entropy 0.61767 (0.61779)	Top-1 acc 67.578 (61.624)	Top-5 acc 84.766 (82.499)	lr 0.01021
Train [68][120/3239]	Time 0.413 (0.876)	Data Time 0.001 (0.417)	Loss 2.3313 (2.5804)	Entropy 0.61763 (0.61777)	Top-1 acc 66.016 (61.716)	Top-5 acc 87.891 (82.548)	lr 0.01021
Train [68][130/3239]	Time 0.238 (0.864)	Data Time 0.001 (0.406)	Loss 2.5603 (2.5804)	Entropy 0.61767 (0.61776)	Top-1 acc 62.500 (61.734)	Top-5 acc 82.422 (82.553)	lr 0.01021
Train [68][140/3239]	Time 0.248 (0.833)	Data Time 0.001 (0.377)	Loss 2.6960 (2.5777)	Entropy 0.61747 (0.61775)	Top-1 acc 61.719 (61.824)	Top-5 acc 78.516 (82.574)	lr 0.01021
Train [68][150/3239]	Time 0.249 (0.805)	Data Time 0.001 (0.352)	Loss 2.4158 (2.5779)	Entropy 0.61720 (0.61772)	Top-1 acc 66.016 (61.877)	Top-5 acc 84.766 (82.587)	lr 0.01021
Train [68][160/3239]	Time 2.677 (0.799)	Data Time 2.400 (0.345)	Loss 2.7196 (2.5786)	Entropy 0.61752 (0.61769)	Top-1 acc 58.203 (61.813)	Top-5 acc 80.078 (82.538)	lr 0.01021
Train [68][170/3239]	Time 0.244 (0.784)	Data Time 0.001 (0.333)	Loss 2.6583 (2.5807)	Entropy 0.61756 (0.61768)	Top-1 acc 59.375 (61.799)	Top-5 acc 79.688 (82.497)	lr 0.01021
Train [68][180/3239]	Time 0.236 (0.764)	Data Time 0.001 (0.315)	Loss 2.3831 (2.5839)	Entropy 0.61777 (0.61767)	Top-1 acc 64.453 (61.673)	Top-5 acc 85.547 (82.407)	lr 0.01020
Train [68][190/3239]	Time 0.322 (0.747)	Data Time 0.001 (0.299)	Loss 2.6959 (2.5820)	Entropy 0.61800 (0.61768)	Top-1 acc 61.328 (61.723)	Top-5 acc 78.516 (82.420)	lr 0.01020
Train [68][200/3239]	Time 0.250 (0.748)	Data Time 0.003 (0.300)	Loss 2.5721 (2.5831)	Entropy 0.61837 (0.61770)	Top-1 acc 62.891 (61.754)	Top-5 acc 84.375 (82.369)	lr 0.01020
Train [68][210/3239]	Time 0.287 (0.735)	Data Time 0.002 (0.288)	Loss 2.4988 (2.5841)	Entropy 0.61866 (0.61774)	Top-1 acc 66.016 (61.730)	Top-5 acc 85.156 (82.372)	lr 0.01020
Train [68][220/3239]	Time 0.267 (0.725)	Data Time 0.001 (0.275)	Loss 2.6315 (2.5851)	Entropy 0.61866 (0.61778)	Top-1 acc 60.938 (61.676)	Top-5 acc 80.859 (82.344)	lr 0.01020
Train [68][230/3239]	Time 0.234 (0.714)	Data Time 0.001 (0.264)	Loss 2.6445 (2.5845)	Entropy 0.61820 (0.61781)	Top-1 acc 60.938 (61.693)	Top-5 acc 81.641 (82.353)	lr 0.01020
Train [68][240/3239]	Time 0.240 (0.702)	Data Time 0.001 (0.254)	Loss 2.5427 (2.5850)	Entropy 0.61817 (0.61783)	Top-1 acc 64.844 (61.688)	Top-5 acc 83.203 (82.362)	lr 0.01020
Train [68][250/3239]	Time 0.260 (0.691)	Data Time 0.002 (0.244)	Loss 2.4840 (2.5832)	Entropy 0.61827 (0.61784)	Top-1 acc 62.109 (61.722)	Top-5 acc 83.984 (82.392)	lr 0.01020
Train [68][260/3239]	Time 0.241 (0.700)	Data Time 0.001 (0.253)	Loss 2.5474 (2.5840)	Entropy 0.61831 (0.61786)	Top-1 acc 62.891 (61.681)	Top-5 acc 84.375 (82.390)	lr 0.01020
Train [68][270/3239]	Time 0.239 (0.689)	Data Time 0.001 (0.244)	Loss 2.5549 (2.5831)	Entropy 0.61860 (0.61788)	Top-1 acc 60.156 (61.723)	Top-5 acc 84.375 (82.396)	lr 0.01020
Train [68][280/3239]	Time 0.384 (0.680)	Data Time 0.001 (0.235)	Loss 2.6975 (2.5840)	Entropy 0.61828 (0.61790)	Top-1 acc 57.031 (61.662)	Top-5 acc 82.031 (82.397)	lr 0.01019
Train [68][290/3239]	Time 0.273 (0.672)	Data Time 0.001 (0.227)	Loss 2.5031 (2.5825)	Entropy 0.61836 (0.61792)	Top-1 acc 64.453 (61.728)	Top-5 acc 84.766 (82.445)	lr 0.01019
Train [68][300/3239]	Time 0.260 (0.672)	Data Time 0.001 (0.228)	Loss 2.7363 (2.5821)	Entropy 0.61805 (0.61793)	Top-1 acc 57.812 (61.742)	Top-5 acc 80.859 (82.458)	lr 0.01019
Train [68][310/3239]	Time 0.256 (0.664)	Data Time 0.001 (0.220)	Loss 2.6767 (2.5827)	Entropy 0.61802 (0.61793)	Top-1 acc 58.203 (61.735)	Top-5 acc 78.516 (82.419)	lr 0.01019
Train [68][320/3239]	Time 0.233 (0.657)	Data Time 0.001 (0.213)	Loss 2.5029 (2.5813)	Entropy 0.61813 (0.61793)	Top-1 acc 63.281 (61.754)	Top-5 acc 83.203 (82.462)	lr 0.01019
Train [68][330/3239]	Time 0.237 (0.664)	Data Time 0.001 (0.221)	Loss 2.6258 (2.5814)	Entropy 0.61819 (0.61795)	Top-1 acc 55.859 (61.749)	Top-5 acc 82.422 (82.445)	lr 0.01019
Train [68][340/3239]	Time 0.233 (0.658)	Data Time 0.001 (0.215)	Loss 2.6629 (2.5812)	Entropy 0.61831 (0.61795)	Top-1 acc 58.594 (61.736)	Top-5 acc 76.172 (82.449)	lr 0.01019
Train [68][350/3239]	Time 0.591 (0.778)	Data Time 0.004 (0.209)	Loss 2.4831 (2.5797)	Entropy 0.61866 (0.61797)	Top-1 acc 64.453 (61.789)	Top-5 acc 81.250 (82.459)	lr 0.01019
Train [68][360/3239]	Time 0.238 (0.769)	Data Time 0.002 (0.203)	Loss 2.5922 (2.5801)	Entropy 0.61862 (0.61799)	Top-1 acc 60.938 (61.767)	Top-5 acc 82.422 (82.469)	lr 0.01019
Train [68][370/3239]	Time 0.243 (0.759)	Data Time 0.001 (0.198)	Loss 2.6406 (2.5808)	Entropy 0.61856 (0.61800)	Top-1 acc 57.812 (61.751)	Top-5 acc 81.641 (82.465)	lr 0.01019
Train [68][380/3239]	Time 0.251 (0.751)	Data Time 0.002 (0.192)	Loss 2.3981 (2.5797)	Entropy 0.61871 (0.61802)	Top-1 acc 67.578 (61.778)	Top-5 acc 87.109 (82.504)	lr 0.01018
Train [68][390/3239]	Time 0.266 (0.742)	Data Time 0.001 (0.188)	Loss 2.4185 (2.5798)	Entropy 0.61832 (0.61803)	Top-1 acc 64.844 (61.758)	Top-5 acc 84.766 (82.501)	lr 0.01018
Train [68][400/3239]	Time 0.263 (0.736)	Data Time 0.002 (0.183)	Loss 2.7121 (2.5797)	Entropy 0.61848 (0.61804)	Top-1 acc 58.203 (61.776)	Top-5 acc 80.469 (82.502)	lr 0.01018
Train [68][410/3239]	Time 0.236 (0.729)	Data Time 0.001 (0.179)	Loss 2.7192 (2.5809)	Entropy 0.61843 (0.61805)	Top-1 acc 57.031 (61.765)	Top-5 acc 80.078 (82.483)	lr 0.01018
Train [68][420/3239]	Time 0.244 (0.723)	Data Time 0.001 (0.174)	Loss 2.6165 (2.5810)	Entropy 0.61805 (0.61806)	Top-1 acc 58.594 (61.741)	Top-5 acc 82.422 (82.481)	lr 0.01018
Train [68][430/3239]	Time 0.239 (0.717)	Data Time 0.001 (0.170)	Loss 2.5328 (2.5817)	Entropy 0.61772 (0.61806)	Top-1 acc 60.547 (61.697)	Top-5 acc 82.422 (82.463)	lr 0.01018
Train [68][440/3239]	Time 0.358 (0.711)	Data Time 0.002 (0.167)	Loss 2.6076 (2.5826)	Entropy 0.61736 (0.61805)	Top-1 acc 62.109 (61.662)	Top-5 acc 82.812 (82.440)	lr 0.01018
Train [68][450/3239]	Time 0.326 (0.705)	Data Time 0.001 (0.163)	Loss 2.5180 (2.5828)	Entropy 0.61736 (0.61803)	Top-1 acc 66.797 (61.635)	Top-5 acc 82.812 (82.440)	lr 0.01018
Train [68][460/3239]	Time 0.281 (0.700)	Data Time 0.001 (0.159)	Loss 2.4554 (2.5830)	Entropy 0.61746 (0.61802)	Top-1 acc 66.016 (61.648)	Top-5 acc 87.109 (82.418)	lr 0.01018
Train [68][470/3239]	Time 0.280 (0.696)	Data Time 0.002 (0.156)	Loss 2.4821 (2.5829)	Entropy 0.61783 (0.61801)	Top-1 acc 63.281 (61.644)	Top-5 acc 83.984 (82.416)	lr 0.01018
Train [68][480/3239]	Time 0.248 (0.691)	Data Time 0.001 (0.153)	Loss 2.6843 (2.5834)	Entropy 0.61823 (0.61801)	Top-1 acc 58.203 (61.617)	Top-5 acc 81.250 (82.410)	lr 0.01017
Train [68][490/3239]	Time 0.259 (0.686)	Data Time 0.001 (0.150)	Loss 2.5715 (2.5831)	Entropy 0.61780 (0.61801)	Top-1 acc 63.281 (61.644)	Top-5 acc 82.031 (82.409)	lr 0.01017
Train [68][500/3239]	Time 0.266 (0.683)	Data Time 0.002 (0.148)	Loss 2.6610 (2.5842)	Entropy 0.61781 (0.61801)	Top-1 acc 61.719 (61.622)	Top-5 acc 82.422 (82.398)	lr 0.01017
Train [68][510/3239]	Time 0.406 (0.679)	Data Time 0.001 (0.146)	Loss 2.5910 (2.5866)	Entropy 0.61760 (0.61800)	Top-1 acc 60.547 (61.583)	Top-5 acc 80.859 (82.358)	lr 0.01017
Train [68][520/3239]	Time 0.289 (0.675)	Data Time 0.001 (0.143)	Loss 2.7113 (2.5871)	Entropy 0.61784 (0.61800)	Top-1 acc 60.156 (61.579)	Top-5 acc 80.469 (82.362)	lr 0.01017
Train [68][530/3239]	Time 0.243 (0.678)	Data Time 0.001 (0.147)	Loss 2.8476 (2.5872)	Entropy 0.61753 (0.61799)	Top-1 acc 53.125 (61.578)	Top-5 acc 79.297 (82.370)	lr 0.01017
Train [68][540/3239]	Time 0.252 (0.675)	Data Time 0.003 (0.144)	Loss 2.5459 (2.5868)	Entropy 0.61795 (0.61799)	Top-1 acc 62.891 (61.591)	Top-5 acc 83.594 (82.375)	lr 0.01017
Train [68][550/3239]	Time 0.238 (0.670)	Data Time 0.001 (0.142)	Loss 2.6262 (2.5873)	Entropy 0.61802 (0.61799)	Top-1 acc 58.984 (61.583)	Top-5 acc 83.594 (82.375)	lr 0.01017
Train [68][560/3239]	Time 0.242 (0.676)	Data Time 0.001 (0.149)	Loss 2.5794 (2.5861)	Entropy 0.61794 (0.61799)	Top-1 acc 58.984 (61.592)	Top-5 acc 83.984 (82.407)	lr 0.01017
Train [68][570/3239]	Time 0.251 (0.672)	Data Time 0.001 (0.146)	Loss 2.6375 (2.5857)	Entropy 0.61785 (0.61799)	Top-1 acc 58.594 (61.603)	Top-5 acc 83.984 (82.421)	lr 0.01017
Train [68][580/3239]	Time 0.262 (0.669)	Data Time 0.001 (0.144)	Loss 2.4916 (2.5851)	Entropy 0.61804 (0.61798)	Top-1 acc 67.188 (61.619)	Top-5 acc 81.641 (82.424)	lr 0.01016
Train [68][590/3239]	Time 0.235 (0.675)	Data Time 0.001 (0.151)	Loss 2.4906 (2.5868)	Entropy 0.61792 (0.61799)	Top-1 acc 67.188 (61.594)	Top-5 acc 83.594 (82.393)	lr 0.01016
Train [68][600/3239]	Time 0.301 (0.671)	Data Time 0.001 (0.149)	Loss 2.6436 (2.5876)	Entropy 0.61747 (0.61798)	Top-1 acc 62.500 (61.573)	Top-5 acc 82.031 (82.386)	lr 0.01016
Train [68][610/3239]	Time 0.264 (0.667)	Data Time 0.001 (0.146)	Loss 2.5804 (2.5878)	Entropy 0.61764 (0.61798)	Top-1 acc 60.156 (61.565)	Top-5 acc 83.203 (82.378)	lr 0.01016
Train [68][620/3239]	Time 0.275 (0.670)	Data Time 0.001 (0.150)	Loss 2.8294 (2.5870)	Entropy 0.61741 (0.61797)	Top-1 acc 56.250 (61.589)	Top-5 acc 78.125 (82.405)	lr 0.01016
Train [68][630/3239]	Time 0.249 (0.666)	Data Time 0.001 (0.148)	Loss 2.5569 (2.5858)	Entropy 0.61755 (0.61796)	Top-1 acc 60.547 (61.615)	Top-5 acc 82.031 (82.417)	lr 0.01016
Train [68][640/3239]	Time 0.247 (0.663)	Data Time 0.001 (0.145)	Loss 2.5829 (2.5857)	Entropy 0.61721 (0.61795)	Top-1 acc 62.109 (61.611)	Top-5 acc 83.984 (82.422)	lr 0.01016
Train [68][650/3239]	Time 0.250 (0.660)	Data Time 0.002 (0.143)	Loss 2.5762 (2.5855)	Entropy 0.61685 (0.61794)	Top-1 acc 62.891 (61.615)	Top-5 acc 81.641 (82.435)	lr 0.01016
Train [68][660/3239]	Time 0.303 (0.661)	Data Time 0.001 (0.145)	Loss 2.4263 (2.5863)	Entropy 0.61706 (0.61792)	Top-1 acc 64.453 (61.605)	Top-5 acc 86.328 (82.414)	lr 0.01016
Train [68][670/3239]	Time 0.366 (0.657)	Data Time 0.001 (0.143)	Loss 2.4805 (2.5866)	Entropy 0.61726 (0.61791)	Top-1 acc 62.891 (61.577)	Top-5 acc 83.594 (82.406)	lr 0.01016
Train [68][680/3239]	Time 0.300 (0.655)	Data Time 0.002 (0.141)	Loss 2.5559 (2.5856)	Entropy 0.61703 (0.61790)	Top-1 acc 63.281 (61.599)	Top-5 acc 80.859 (82.429)	lr 0.01015
Train [68][690/3239]	Time 0.271 (0.660)	Data Time 0.001 (0.146)	Loss 2.5741 (2.5846)	Entropy 0.61698 (0.61789)	Top-1 acc 62.109 (61.633)	Top-5 acc 82.422 (82.451)	lr 0.01015
Train [68][700/3239]	Time 0.248 (0.657)	Data Time 0.002 (0.144)	Loss 2.5350 (2.5847)	Entropy 0.61682 (0.61787)	Top-1 acc 64.062 (61.647)	Top-5 acc 82.812 (82.450)	lr 0.01015
Train [68][710/3239]	Time 0.286 (0.654)	Data Time 0.001 (0.142)	Loss 2.6688 (2.5854)	Entropy 0.61669 (0.61786)	Top-1 acc 60.547 (61.634)	Top-5 acc 82.812 (82.447)	lr 0.01015
Train [68][720/3239]	Time 0.296 (0.655)	Data Time 0.001 (0.144)	Loss 2.4883 (2.5853)	Entropy 0.61682 (0.61784)	Top-1 acc 66.797 (61.630)	Top-5 acc 82.031 (82.453)	lr 0.01015
Train [68][730/3239]	Time 0.256 (0.652)	Data Time 0.001 (0.142)	Loss 2.5175 (2.5858)	Entropy 0.61683 (0.61783)	Top-1 acc 61.328 (61.602)	Top-5 acc 82.812 (82.447)	lr 0.01015
Train [68][740/3239]	Time 0.432 (0.649)	Data Time 0.001 (0.140)	Loss 2.4470 (2.5848)	Entropy 0.61677 (0.61782)	Top-1 acc 68.750 (61.625)	Top-5 acc 85.547 (82.464)	lr 0.01015
Train [68][750/3239]	Time 0.279 (0.657)	Data Time 0.004 (0.148)	Loss 2.5784 (2.5847)	Entropy 0.61691 (0.61780)	Top-1 acc 60.938 (61.614)	Top-5 acc 82.422 (82.468)	lr 0.01015
Train [68][760/3239]	Time 0.267 (0.654)	Data Time 0.001 (0.146)	Loss 2.4663 (2.5838)	Entropy 0.61704 (0.61779)	Top-1 acc 65.625 (61.632)	Top-5 acc 85.156 (82.481)	lr 0.01015
Train [68][770/3239]	Time 0.239 (0.651)	Data Time 0.001 (0.145)	Loss 2.4659 (2.5833)	Entropy 0.61703 (0.61778)	Top-1 acc 64.844 (61.645)	Top-5 acc 80.859 (82.481)	lr 0.01015
Train [68][780/3239]	Time 0.254 (0.657)	Data Time 0.001 (0.151)	Loss 2.7958 (2.5830)	Entropy 0.61715 (0.61777)	Top-1 acc 56.641 (61.648)	Top-5 acc 78.906 (82.482)	lr 0.01014
Train [68][790/3239]	Time 0.256 (0.654)	Data Time 0.002 (0.149)	Loss 2.6021 (2.5824)	Entropy 0.61723 (0.61776)	Top-1 acc 63.281 (61.664)	Top-5 acc 81.250 (82.494)	lr 0.01014
Train [68][800/3239]	Time 0.272 (0.651)	Data Time 0.001 (0.147)	Loss 2.6990 (2.5832)	Entropy 0.61733 (0.61776)	Top-1 acc 61.328 (61.653)	Top-5 acc 78.906 (82.477)	lr 0.01014
Train [68][810/3239]	Time 0.248 (0.649)	Data Time 0.001 (0.145)	Loss 2.5822 (2.5828)	Entropy 0.61749 (0.61775)	Top-1 acc 60.547 (61.657)	Top-5 acc 83.203 (82.483)	lr 0.01014
Train [68][820/3239]	Time 0.238 (0.648)	Data Time 0.001 (0.145)	Loss 2.6131 (2.5824)	Entropy 0.61745 (0.61775)	Top-1 acc 60.547 (61.660)	Top-5 acc 81.250 (82.490)	lr 0.01014
Train [68][830/3239]	Time 0.400 (0.646)	Data Time 0.001 (0.144)	Loss 2.8013 (2.5827)	Entropy 0.61714 (0.61775)	Top-1 acc 56.641 (61.653)	Top-5 acc 78.906 (82.483)	lr 0.01014
Train [68][840/3239]	Time 0.281 (0.643)	Data Time 0.001 (0.142)	Loss 2.6398 (2.5829)	Entropy 0.61722 (0.61774)	Top-1 acc 59.766 (61.651)	Top-5 acc 80.469 (82.478)	lr 0.01014
Train [68][850/3239]	Time 0.268 (0.643)	Data Time 0.001 (0.143)	Loss 2.3965 (2.5826)	Entropy 0.61717 (0.61773)	Top-1 acc 65.625 (61.665)	Top-5 acc 84.375 (82.484)	lr 0.01014
Train [68][860/3239]	Time 0.263 (0.641)	Data Time 0.001 (0.142)	Loss 2.8344 (2.5834)	Entropy 0.61753 (0.61773)	Top-1 acc 53.516 (61.638)	Top-5 acc 80.859 (82.466)	lr 0.01014
Train [68][870/3239]	Time 0.267 (0.639)	Data Time 0.002 (0.140)	Loss 2.4830 (2.5839)	Entropy 0.61786 (0.61773)	Top-1 acc 64.062 (61.631)	Top-5 acc 84.766 (82.456)	lr 0.01014
Train [68][880/3239]	Time 0.262 (0.642)	Data Time 0.001 (0.144)	Loss 2.7019 (2.5836)	Entropy 0.61807 (0.61773)	Top-1 acc 59.766 (61.645)	Top-5 acc 77.734 (82.463)	lr 0.01013
Train [68][890/3239]	Time 0.253 (0.640)	Data Time 0.001 (0.142)	Loss 2.5036 (2.5836)	Entropy 0.61802 (0.61773)	Top-1 acc 61.328 (61.644)	Top-5 acc 83.594 (82.460)	lr 0.01013
Train [68][900/3239]	Time 0.349 (0.641)	Data Time 0.001 (0.144)	Loss 2.4933 (2.5830)	Entropy 0.61799 (0.61774)	Top-1 acc 63.672 (61.667)	Top-5 acc 85.547 (82.466)	lr 0.01013
Train [68][910/3239]	Time 0.241 (0.646)	Data Time 0.001 (0.149)	Loss 2.5415 (2.5831)	Entropy 0.61786 (0.61774)	Top-1 acc 60.156 (61.666)	Top-5 acc 82.812 (82.467)	lr 0.01013
Train [68][920/3239]	Time 0.251 (0.643)	Data Time 0.001 (0.148)	Loss 2.5621 (2.5835)	Entropy 0.61787 (0.61774)	Top-1 acc 60.156 (61.651)	Top-5 acc 82.422 (82.474)	lr 0.01013
Train [68][930/3239]	Time 0.256 (0.642)	Data Time 0.002 (0.146)	Loss 2.5003 (2.5833)	Entropy 0.61798 (0.61774)	Top-1 acc 62.109 (61.670)	Top-5 acc 85.156 (82.471)	lr 0.01013
Train [68][940/3239]	Time 0.246 (0.651)	Data Time 0.002 (0.156)	Loss 2.6340 (2.5837)	Entropy 0.61801 (0.61774)	Top-1 acc 57.422 (61.666)	Top-5 acc 82.812 (82.469)	lr 0.01013
Train [68][950/3239]	Time 0.232 (0.648)	Data Time 0.001 (0.154)	Loss 2.3479 (2.5830)	Entropy 0.61816 (0.61775)	Top-1 acc 67.578 (61.678)	Top-5 acc 87.891 (82.490)	lr 0.01013
Train [68][960/3239]	Time 0.233 (0.646)	Data Time 0.001 (0.153)	Loss 2.4958 (2.5822)	Entropy 0.61825 (0.61775)	Top-1 acc 64.062 (61.689)	Top-5 acc 83.594 (82.496)	lr 0.01013
Train [68][970/3239]	Time 0.247 (0.644)	Data Time 0.001 (0.151)	Loss 2.6219 (2.5828)	Entropy 0.61841 (0.61776)	Top-1 acc 59.766 (61.676)	Top-5 acc 80.469 (82.484)	lr 0.01013
Train [68][980/3239]	Time 0.280 (0.649)	Data Time 0.002 (0.157)	Loss 2.5483 (2.5834)	Entropy 0.61842 (0.61777)	Top-1 acc 65.625 (61.655)	Top-5 acc 81.250 (82.473)	lr 0.01012
Train [68][990/3239]	Time 0.342 (0.653)	Data Time 0.001 (0.161)	Loss 2.5652 (2.5828)	Entropy 0.61848 (0.61777)	Top-1 acc 66.406 (61.672)	Top-5 acc 82.812 (82.479)	lr 0.01012
Train [68][1000/3239]	Time 0.240 (0.650)	Data Time 0.001 (0.159)	Loss 2.4973 (2.5826)	Entropy 0.61811 (0.61778)	Top-1 acc 64.453 (61.679)	Top-5 acc 84.766 (82.492)	lr 0.01012
Train [68][1010/3239]	Time 0.286 (0.691)	Data Time 0.002 (0.159)	Loss 2.3780 (2.5823)	Entropy 0.61816 (0.61778)	Top-1 acc 67.578 (61.692)	Top-5 acc 88.672 (82.500)	lr 0.01012
Train [68][1020/3239]	Time 0.239 (0.689)	Data Time 0.001 (0.157)	Loss 2.4829 (2.5822)	Entropy 0.61780 (0.61778)	Top-1 acc 62.500 (61.696)	Top-5 acc 85.156 (82.508)	lr 0.01012
Train [68][1030/3239]	Time 0.247 (0.686)	Data Time 0.001 (0.156)	Loss 2.4811 (2.5825)	Entropy 0.61760 (0.61778)	Top-1 acc 66.406 (61.687)	Top-5 acc 86.328 (82.505)	lr 0.01012
Train [68][1040/3239]	Time 0.256 (0.684)	Data Time 0.001 (0.154)	Loss 2.4163 (2.5820)	Entropy 0.61757 (0.61778)	Top-1 acc 67.578 (61.701)	Top-5 acc 85.547 (82.514)	lr 0.01012
Train [68][1050/3239]	Time 0.254 (0.681)	Data Time 0.002 (0.153)	Loss 2.8485 (2.5818)	Entropy 0.61749 (0.61778)	Top-1 acc 54.688 (61.702)	Top-5 acc 79.688 (82.520)	lr 0.01012
Train [68][1060/3239]	Time 0.349 (0.679)	Data Time 0.001 (0.151)	Loss 2.5504 (2.5813)	Entropy 0.61730 (0.61778)	Top-1 acc 63.672 (61.719)	Top-5 acc 85.547 (82.528)	lr 0.01012
Train [68][1070/3239]	Time 0.252 (0.677)	Data Time 0.002 (0.150)	Loss 2.7953 (2.5817)	Entropy 0.61751 (0.61777)	Top-1 acc 57.031 (61.709)	Top-5 acc 80.078 (82.524)	lr 0.01012
Train [68][1080/3239]	Time 0.240 (0.675)	Data Time 0.001 (0.148)	Loss 2.7191 (2.5820)	Entropy 0.61729 (0.61777)	Top-1 acc 56.641 (61.695)	Top-5 acc 80.469 (82.525)	lr 0.01011
Train [68][1090/3239]	Time 0.239 (0.673)	Data Time 0.001 (0.147)	Loss 2.6750 (2.5820)	Entropy 0.61745 (0.61777)	Top-1 acc 57.422 (61.684)	Top-5 acc 81.250 (82.526)	lr 0.01011
Train [68][1100/3239]	Time 0.242 (0.671)	Data Time 0.001 (0.146)	Loss 2.4734 (2.5825)	Entropy 0.61714 (0.61776)	Top-1 acc 63.281 (61.668)	Top-5 acc 84.375 (82.521)	lr 0.01011
Train [68][1110/3239]	Time 0.306 (0.675)	Data Time 0.001 (0.150)	Loss 2.4838 (2.5824)	Entropy 0.61734 (0.61776)	Top-1 acc 64.453 (61.666)	Top-5 acc 84.375 (82.521)	lr 0.01011
Train [68][1120/3239]	Time 0.264 (0.672)	Data Time 0.001 (0.149)	Loss 2.4257 (2.5819)	Entropy 0.61755 (0.61776)	Top-1 acc 66.797 (61.685)	Top-5 acc 85.938 (82.523)	lr 0.01011
Train [68][1130/3239]	Time 0.225 (0.670)	Data Time 0.001 (0.148)	Loss 2.5906 (2.5820)	Entropy 0.61760 (0.61775)	Top-1 acc 58.984 (61.675)	Top-5 acc 81.250 (82.522)	lr 0.01011
Train [68][1140/3239]	Time 8.018 (0.678)	Data Time 7.767 (0.156)	Loss 2.6142 (2.5819)	Entropy 0.61748 (0.61775)	Top-1 acc 60.938 (61.665)	Top-5 acc 83.203 (82.526)	lr 0.01011
Train [68][1150/3239]	Time 0.373 (0.676)	Data Time 0.001 (0.155)	Loss 2.3721 (2.5816)	Entropy 0.61770 (0.61775)	Top-1 acc 69.531 (61.671)	Top-5 acc 85.547 (82.535)	lr 0.01011
Train [68][1160/3239]	Time 0.234 (0.674)	Data Time 0.001 (0.154)	Loss 2.5138 (2.5818)	Entropy 0.61733 (0.61775)	Top-1 acc 64.844 (61.669)	Top-5 acc 83.203 (82.538)	lr 0.01011
Train [68][1170/3239]	Time 0.314 (0.672)	Data Time 0.075 (0.152)	Loss 2.6146 (2.5818)	Entropy 0.61741 (0.61775)	Top-1 acc 58.984 (61.658)	Top-5 acc 82.031 (82.536)	lr 0.01011
Train [68][1180/3239]	Time 0.247 (0.678)	Data Time 0.001 (0.159)	Loss 2.6089 (2.5818)	Entropy 0.61717 (0.61774)	Top-1 acc 57.812 (61.648)	Top-5 acc 83.594 (82.548)	lr 0.01010
Train [68][1190/3239]	Time 0.241 (0.676)	Data Time 0.001 (0.158)	Loss 2.8557 (2.5823)	Entropy 0.61743 (0.61774)	Top-1 acc 53.516 (61.635)	Top-5 acc 76.562 (82.537)	lr 0.01010
Train [68][1200/3239]	Time 0.232 (0.674)	Data Time 0.001 (0.157)	Loss 2.4374 (2.5823)	Entropy 0.61757 (0.61773)	Top-1 acc 63.281 (61.633)	Top-5 acc 87.109 (82.539)	lr 0.01010
Train [68][1210/3239]	Time 0.277 (0.680)	Data Time 0.001 (0.163)	Loss 2.5065 (2.5821)	Entropy 0.61810 (0.61773)	Top-1 acc 61.328 (61.644)	Top-5 acc 81.641 (82.543)	lr 0.01010
Train [68][1220/3239]	Time 0.324 (0.678)	Data Time 0.001 (0.162)	Loss 2.5684 (2.5818)	Entropy 0.61847 (0.61774)	Top-1 acc 62.891 (61.651)	Top-5 acc 83.203 (82.550)	lr 0.01010
Train [68][1230/3239]	Time 0.243 (0.676)	Data Time 0.001 (0.161)	Loss 2.6930 (2.5822)	Entropy 0.61865 (0.61774)	Top-1 acc 59.375 (61.643)	Top-5 acc 81.250 (82.547)	lr 0.01010
Train [68][1240/3239]	Time 0.257 (0.681)	Data Time 0.001 (0.167)	Loss 2.3937 (2.5825)	Entropy 0.61820 (0.61775)	Top-1 acc 67.578 (61.643)	Top-5 acc 84.766 (82.539)	lr 0.01010
Train [68][1250/3239]	Time 0.246 (0.679)	Data Time 0.001 (0.165)	Loss 2.5994 (2.5824)	Entropy 0.61841 (0.61776)	Top-1 acc 60.938 (61.644)	Top-5 acc 82.422 (82.544)	lr 0.01010
Train [68][1260/3239]	Time 0.241 (0.677)	Data Time 0.001 (0.164)	Loss 2.3506 (2.5824)	Entropy 0.61808 (0.61776)	Top-1 acc 68.359 (61.647)	Top-5 acc 86.328 (82.540)	lr 0.01010
Train [68][1270/3239]	Time 0.248 (0.683)	Data Time 0.001 (0.170)	Loss 2.5935 (2.5825)	Entropy 0.61827 (0.61776)	Top-1 acc 59.766 (61.642)	Top-5 acc 83.594 (82.541)	lr 0.01010
Train [68][1280/3239]	Time 0.233 (0.681)	Data Time 0.001 (0.169)	Loss 2.5696 (2.5825)	Entropy 0.61833 (0.61777)	Top-1 acc 64.062 (61.647)	Top-5 acc 83.594 (82.543)	lr 0.01010
Train [68][1290/3239]	Time 0.249 (0.679)	Data Time 0.001 (0.168)	Loss 2.5684 (2.5825)	Entropy 0.61869 (0.61777)	Top-1 acc 58.984 (61.648)	Top-5 acc 83.594 (82.543)	lr 0.01009
Train [68][1300/3239]	Time 6.894 (0.687)	Data Time 6.656 (0.176)	Loss 2.6645 (2.5822)	Entropy 0.61895 (0.61778)	Top-1 acc 57.812 (61.654)	Top-5 acc 78.906 (82.544)	lr 0.01009
Train [68][1310/3239]	Time 0.272 (0.685)	Data Time 0.001 (0.175)	Loss 2.5346 (2.5826)	Entropy 0.61903 (0.61779)	Top-1 acc 59.375 (61.649)	Top-5 acc 82.812 (82.537)	lr 0.01009
Train [68][1320/3239]	Time 0.265 (0.683)	Data Time 0.002 (0.173)	Loss 2.5999 (2.5826)	Entropy 0.61901 (0.61780)	Top-1 acc 61.719 (61.647)	Top-5 acc 81.250 (82.530)	lr 0.01009
Train [68][1330/3239]	Time 5.129 (0.685)	Data Time 4.855 (0.176)	Loss 2.5866 (2.5823)	Entropy 0.61893 (0.61781)	Top-1 acc 60.938 (61.653)	Top-5 acc 83.594 (82.534)	lr 0.01009
Train [68][1340/3239]	Time 0.287 (0.687)	Data Time 0.001 (0.179)	Loss 2.5211 (2.5823)	Entropy 0.61869 (0.61782)	Top-1 acc 61.328 (61.657)	Top-5 acc 83.594 (82.535)	lr 0.01009
Train [68][1350/3239]	Time 0.228 (0.685)	Data Time 0.001 (0.177)	Loss 2.5618 (2.5822)	Entropy 0.61892 (0.61782)	Top-1 acc 59.375 (61.653)	Top-5 acc 83.984 (82.537)	lr 0.01009
Train [68][1360/3239]	Time 0.237 (0.683)	Data Time 0.001 (0.176)	Loss 2.5674 (2.5821)	Entropy 0.61894 (0.61783)	Top-1 acc 63.281 (61.658)	Top-5 acc 82.031 (82.540)	lr 0.01009
Train [68][1370/3239]	Time 0.231 (0.690)	Data Time 0.001 (0.183)	Loss 2.7084 (2.5819)	Entropy 0.61905 (0.61784)	Top-1 acc 58.594 (61.660)	Top-5 acc 81.641 (82.545)	lr 0.01009
Train [68][1380/3239]	Time 0.319 (0.688)	Data Time 0.001 (0.182)	Loss 2.6263 (2.5823)	Entropy 0.61919 (0.61785)	Top-1 acc 62.109 (61.653)	Top-5 acc 78.125 (82.537)	lr 0.01009
Train [68][1390/3239]	Time 0.254 (0.687)	Data Time 0.001 (0.182)	Loss 2.8061 (2.5828)	Entropy 0.61907 (0.61786)	Top-1 acc 56.250 (61.640)	Top-5 acc 77.734 (82.526)	lr 0.01008
Train [68][1400/3239]	Time 0.236 (0.693)	Data Time 0.001 (0.189)	Loss 2.9548 (2.5827)	Entropy 0.61916 (0.61787)	Top-1 acc 52.344 (61.650)	Top-5 acc 75.781 (82.526)	lr 0.01008
Train [68][1410/3239]	Time 0.234 (0.695)	Data Time 0.001 (0.191)	Loss 2.6100 (2.5826)	Entropy 0.61916 (0.61788)	Top-1 acc 57.812 (61.651)	Top-5 acc 82.031 (82.527)	lr 0.01008
Train [68][1420/3239]	Time 0.286 (0.693)	Data Time 0.002 (0.189)	Loss 2.6129 (2.5826)	Entropy 0.61924 (0.61789)	Top-1 acc 62.500 (61.656)	Top-5 acc 81.641 (82.525)	lr 0.01008
Train [68][1430/3239]	Time 0.236 (0.698)	Data Time 0.002 (0.195)	Loss 2.4782 (2.5830)	Entropy 0.61925 (0.61789)	Top-1 acc 64.453 (61.648)	Top-5 acc 84.375 (82.516)	lr 0.01008
Train [68][1440/3239]	Time 0.240 (0.698)	Data Time 0.001 (0.196)	Loss 2.6118 (2.5830)	Entropy 0.61902 (0.61790)	Top-1 acc 61.328 (61.649)	Top-5 acc 79.297 (82.509)	lr 0.01008
Train [68][1450/3239]	Time 0.341 (0.696)	Data Time 0.001 (0.194)	Loss 2.4527 (2.5831)	Entropy 0.61897 (0.61791)	Top-1 acc 67.188 (61.649)	Top-5 acc 84.375 (82.510)	lr 0.01008
Train [68][1460/3239]	Time 11.215 (0.703)	Data Time 10.928 (0.201)	Loss 2.8001 (2.5834)	Entropy 0.61938 (0.61792)	Top-1 acc 57.812 (61.641)	Top-5 acc 78.516 (82.506)	lr 0.01008
Train [68][1470/3239]	Time 0.222 (0.701)	Data Time 0.001 (0.200)	Loss 2.6488 (2.5833)	Entropy 0.61941 (0.61793)	Top-1 acc 56.250 (61.639)	Top-5 acc 81.641 (82.513)	lr 0.01008
Train [68][1480/3239]	Time 0.258 (0.699)	Data Time 0.002 (0.198)	Loss 2.7480 (2.5838)	Entropy 0.61935 (0.61794)	Top-1 acc 57.422 (61.628)	Top-5 acc 82.422 (82.503)	lr 0.01008
Train [68][1490/3239]	Time 0.653 (0.697)	Data Time 0.387 (0.197)	Loss 2.4333 (2.5838)	Entropy 0.61843 (0.61795)	Top-1 acc 68.750 (61.630)	Top-5 acc 83.984 (82.505)	lr 0.01007
Train [68][1500/3239]	Time 0.573 (0.704)	Data Time 0.334 (0.205)	Loss 2.7851 (2.5837)	Entropy 0.61833 (0.61795)	Top-1 acc 55.469 (61.632)	Top-5 acc 80.469 (82.505)	lr 0.01007
Train [68][1510/3239]	Time 0.253 (0.702)	Data Time 0.001 (0.203)	Loss 2.5487 (2.5839)	Entropy 0.61838 (0.61795)	Top-1 acc 65.234 (61.623)	Top-5 acc 83.203 (82.505)	lr 0.01007
Train [68][1520/3239]	Time 0.235 (0.700)	Data Time 0.001 (0.202)	Loss 2.5986 (2.5840)	Entropy 0.61843 (0.61795)	Top-1 acc 60.938 (61.618)	Top-5 acc 83.203 (82.506)	lr 0.01007
Train [68][1530/3239]	Time 0.248 (0.706)	Data Time 0.001 (0.209)	Loss 2.6083 (2.5844)	Entropy 0.61873 (0.61796)	Top-1 acc 60.547 (61.610)	Top-5 acc 80.859 (82.499)	lr 0.01007
Train [68][1540/3239]	Time 0.349 (0.707)	Data Time 0.001 (0.209)	Loss 2.3755 (2.5841)	Entropy 0.61858 (0.61796)	Top-1 acc 64.453 (61.614)	Top-5 acc 86.328 (82.497)	lr 0.01007
Train [68][1550/3239]	Time 0.233 (0.705)	Data Time 0.001 (0.208)	Loss 2.5268 (2.5843)	Entropy 0.61864 (0.61797)	Top-1 acc 64.062 (61.611)	Top-5 acc 82.422 (82.494)	lr 0.01007
Train [68][1560/3239]	Time 0.240 (0.709)	Data Time 0.001 (0.213)	Loss 2.6555 (2.5841)	Entropy 0.61870 (0.61797)	Top-1 acc 57.812 (61.618)	Top-5 acc 78.906 (82.496)	lr 0.01007
Train [68][1570/3239]	Time 0.235 (0.711)	Data Time 0.001 (0.216)	Loss 2.5778 (2.5843)	Entropy 0.61872 (0.61798)	Top-1 acc 64.453 (61.614)	Top-5 acc 79.297 (82.497)	lr 0.01007
Train [68][1580/3239]	Time 0.263 (0.710)	Data Time 0.001 (0.214)	Loss 2.3776 (2.5840)	Entropy 0.61890 (0.61798)	Top-1 acc 65.234 (61.621)	Top-5 acc 87.109 (82.501)	lr 0.01007
Train [68][1590/3239]	Time 0.239 (0.714)	Data Time 0.001 (0.219)	Loss 2.5738 (2.5835)	Entropy 0.61913 (0.61799)	Top-1 acc 62.109 (61.628)	Top-5 acc 84.375 (82.509)	lr 0.01006
Train [68][1600/3239]	Time 0.236 (0.715)	Data Time 0.001 (0.221)	Loss 2.7181 (2.5836)	Entropy 0.61882 (0.61800)	Top-1 acc 62.109 (61.629)	Top-5 acc 79.297 (82.508)	lr 0.01006
Train [68][1610/3239]	Time 0.379 (0.713)	Data Time 0.001 (0.219)	Loss 2.5128 (2.5837)	Entropy 0.61869 (0.61800)	Top-1 acc 63.672 (61.627)	Top-5 acc 83.594 (82.504)	lr 0.01006
Train [68][1620/3239]	Time 9.862 (0.717)	Data Time 9.599 (0.224)	Loss 2.7313 (2.5836)	Entropy 0.61861 (0.61800)	Top-1 acc 58.984 (61.630)	Top-5 acc 81.250 (82.511)	lr 0.01006
Train [68][1630/3239]	Time 0.259 (0.718)	Data Time 0.001 (0.225)	Loss 2.5330 (2.5838)	Entropy 0.61855 (0.61801)	Top-1 acc 65.234 (61.624)	Top-5 acc 83.984 (82.507)	lr 0.01006
Train [68][1640/3239]	Time 0.234 (0.716)	Data Time 0.001 (0.224)	Loss 2.6256 (2.5839)	Entropy 0.61851 (0.61801)	Top-1 acc 58.203 (61.619)	Top-5 acc 83.203 (82.509)	lr 0.01006
Train [68][1650/3239]	Time 1.984 (0.715)	Data Time 1.734 (0.223)	Loss 2.6421 (2.5840)	Entropy 0.61870 (0.61802)	Top-1 acc 59.375 (61.614)	Top-5 acc 80.859 (82.510)	lr 0.01006
Train [68][1660/3239]	Time 0.318 (0.744)	Data Time 0.005 (0.227)	Loss 2.7158 (2.5842)	Entropy 0.61908 (0.61802)	Top-1 acc 59.766 (61.609)	Top-5 acc 81.250 (82.498)	lr 0.01006
Train [68][1670/3239]	Time 0.236 (0.742)	Data Time 0.002 (0.225)	Loss 2.6805 (2.5845)	Entropy 0.61918 (0.61803)	Top-1 acc 55.469 (61.607)	Top-5 acc 81.250 (82.495)	lr 0.01006
Train [68][1680/3239]	Time 0.254 (0.740)	Data Time 0.002 (0.224)	Loss 2.4121 (2.5846)	Entropy 0.61934 (0.61803)	Top-1 acc 63.672 (61.598)	Top-5 acc 85.156 (82.492)	lr 0.01006
Train [68][1690/3239]	Time 0.245 (0.738)	Data Time 0.001 (0.223)	Loss 2.4613 (2.5842)	Entropy 0.61969 (0.61804)	Top-1 acc 66.016 (61.610)	Top-5 acc 84.375 (82.499)	lr 0.01005
Train [68][1700/3239]	Time 0.361 (0.737)	Data Time 0.002 (0.221)	Loss 2.7886 (2.5843)	Entropy 0.61960 (0.61805)	Top-1 acc 56.641 (61.616)	Top-5 acc 79.688 (82.499)	lr 0.01005
Train [68][1710/3239]	Time 0.225 (0.735)	Data Time 0.001 (0.220)	Loss 2.7561 (2.5844)	Entropy 0.61941 (0.61806)	Top-1 acc 59.766 (61.612)	Top-5 acc 79.297 (82.495)	lr 0.01005
Train [68][1720/3239]	Time 0.237 (0.733)	Data Time 0.001 (0.219)	Loss 2.6158 (2.5846)	Entropy 0.61937 (0.61807)	Top-1 acc 61.719 (61.607)	Top-5 acc 80.469 (82.492)	lr 0.01005
Train [68][1730/3239]	Time 0.250 (0.733)	Data Time 0.001 (0.220)	Loss 2.6161 (2.5844)	Entropy 0.61944 (0.61808)	Top-1 acc 62.500 (61.611)	Top-5 acc 81.641 (82.493)	lr 0.01005
Train [68][1740/3239]	Time 0.251 (0.732)	Data Time 0.002 (0.218)	Loss 2.5380 (2.5842)	Entropy 0.61926 (0.61808)	Top-1 acc 60.547 (61.614)	Top-5 acc 83.594 (82.494)	lr 0.01005
Train [68][1750/3239]	Time 0.242 (0.731)	Data Time 0.001 (0.218)	Loss 2.5716 (2.5846)	Entropy 0.61864 (0.61809)	Top-1 acc 63.672 (61.610)	Top-5 acc 82.812 (82.489)	lr 0.01005
Train [68][1760/3239]	Time 0.242 (0.737)	Data Time 0.001 (0.224)	Loss 2.6635 (2.5846)	Entropy 0.61875 (0.61809)	Top-1 acc 63.672 (61.607)	Top-5 acc 80.859 (82.492)	lr 0.01005
Train [68][1770/3239]	Time 0.361 (0.736)	Data Time 0.001 (0.225)	Loss 2.8181 (2.5846)	Entropy 0.61866 (0.61810)	Top-1 acc 55.078 (61.606)	Top-5 acc 79.297 (82.495)	lr 0.01005
Train [68][1780/3239]	Time 0.249 (0.735)	Data Time 0.001 (0.224)	Loss 2.6426 (2.5845)	Entropy 0.61895 (0.61810)	Top-1 acc 59.766 (61.606)	Top-5 acc 80.078 (82.496)	lr 0.01005
Train [68][1790/3239]	Time 0.252 (0.742)	Data Time 0.001 (0.231)	Loss 2.5303 (2.5847)	Entropy 0.61881 (0.61811)	Top-1 acc 64.062 (61.602)	Top-5 acc 82.812 (82.490)	lr 0.01004
Train [68][1800/3239]	Time 0.229 (0.741)	Data Time 0.001 (0.230)	Loss 2.5867 (2.5846)	Entropy 0.61887 (0.61811)	Top-1 acc 61.328 (61.603)	Top-5 acc 82.031 (82.487)	lr 0.01004
Train [68][1810/3239]	Time 0.264 (0.739)	Data Time 0.001 (0.230)	Loss 2.3275 (2.5845)	Entropy 0.61907 (0.61811)	Top-1 acc 65.234 (61.602)	Top-5 acc 88.281 (82.489)	lr 0.01004
Train [68][1820/3239]	Time 7.694 (0.743)	Data Time 7.447 (0.234)	Loss 2.5028 (2.5844)	Entropy 0.61920 (0.61812)	Top-1 acc 64.062 (61.605)	Top-5 acc 84.375 (82.488)	lr 0.01004
Train [68][1830/3239]	Time 0.973 (0.747)	Data Time 0.731 (0.238)	Loss 2.5282 (2.5841)	Entropy 0.61906 (0.61812)	Top-1 acc 64.453 (61.617)	Top-5 acc 84.375 (82.494)	lr 0.01004
Train [68][1840/3239]	Time 0.257 (0.745)	Data Time 0.001 (0.237)	Loss 2.6968 (2.5840)	Entropy 0.61890 (0.61813)	Top-1 acc 57.031 (61.615)	Top-5 acc 79.688 (82.497)	lr 0.01004
Train [68][1850/3239]	Time 0.239 (0.744)	Data Time 0.001 (0.235)	Loss 2.5785 (2.5837)	Entropy 0.61922 (0.61813)	Top-1 acc 59.375 (61.620)	Top-5 acc 80.859 (82.501)	lr 0.01004
Train [68][1860/3239]	Time 0.329 (0.752)	Data Time 0.001 (0.244)	Loss 2.6838 (2.5837)	Entropy 0.61920 (0.61814)	Top-1 acc 55.859 (61.623)	Top-5 acc 82.812 (82.502)	lr 0.01004
Train [68][1870/3239]	Time 0.259 (0.750)	Data Time 0.001 (0.243)	Loss 2.5958 (2.5837)	Entropy 0.61904 (0.61815)	Top-1 acc 60.547 (61.624)	Top-5 acc 82.422 (82.504)	lr 0.01004
Train [68][1880/3239]	Time 0.251 (0.749)	Data Time 0.001 (0.242)	Loss 2.5191 (2.5839)	Entropy 0.61926 (0.61815)	Top-1 acc 60.938 (61.622)	Top-5 acc 82.812 (82.500)	lr 0.01004
Train [68][1890/3239]	Time 0.240 (0.757)	Data Time 0.001 (0.251)	Loss 2.6989 (2.5840)	Entropy 0.61909 (0.61816)	Top-1 acc 58.594 (61.622)	Top-5 acc 80.469 (82.495)	lr 0.01003
Train [68][1900/3239]	Time 0.251 (0.756)	Data Time 0.001 (0.251)	Loss 2.6570 (2.5842)	Entropy 0.61918 (0.61816)	Top-1 acc 58.594 (61.618)	Top-5 acc 80.469 (82.487)	lr 0.01003
Train [68][1910/3239]	Time 0.231 (0.755)	Data Time 0.001 (0.250)	Loss 2.4194 (2.5838)	Entropy 0.61915 (0.61817)	Top-1 acc 67.188 (61.628)	Top-5 acc 85.156 (82.495)	lr 0.01003
Train [68][1920/3239]	Time 0.250 (0.763)	Data Time 0.002 (0.258)	Loss 2.6468 (2.5838)	Entropy 0.61864 (0.61817)	Top-1 acc 58.984 (61.629)	Top-5 acc 84.766 (82.494)	lr 0.01003
Train [68][1930/3239]	Time 0.333 (0.761)	Data Time 0.001 (0.257)	Loss 2.4549 (2.5839)	Entropy 0.61831 (0.61817)	Top-1 acc 63.672 (61.628)	Top-5 acc 85.938 (82.491)	lr 0.01003
Train [68][1940/3239]	Time 0.223 (0.761)	Data Time 0.001 (0.257)	Loss 2.6198 (2.5838)	Entropy 0.61782 (0.61817)	Top-1 acc 62.109 (61.627)	Top-5 acc 78.516 (82.494)	lr 0.01003
Train [68][1950/3239]	Time 0.241 (0.771)	Data Time 0.001 (0.267)	Loss 2.5265 (2.5839)	Entropy 0.61774 (0.61817)	Top-1 acc 63.672 (61.618)	Top-5 acc 84.766 (82.498)	lr 0.01003
Train [68][1960/3239]	Time 0.242 (0.770)	Data Time 0.001 (0.267)	Loss 2.5950 (2.5838)	Entropy 0.61761 (0.61817)	Top-1 acc 59.766 (61.623)	Top-5 acc 82.812 (82.497)	lr 0.01003
Train [68][1970/3239]	Time 0.236 (0.769)	Data Time 0.001 (0.267)	Loss 2.4238 (2.5841)	Entropy 0.61772 (0.61816)	Top-1 acc 65.625 (61.615)	Top-5 acc 83.594 (82.488)	lr 0.01003
Train [68][1980/3239]	Time 7.183 (0.771)	Data Time 6.938 (0.269)	Loss 2.5949 (2.5843)	Entropy 0.61774 (0.61816)	Top-1 acc 60.547 (61.608)	Top-5 acc 80.078 (82.484)	lr 0.01003
Train [68][1990/3239]	Time 3.008 (0.775)	Data Time 2.742 (0.273)	Loss 2.4694 (2.5845)	Entropy 0.61798 (0.61816)	Top-1 acc 66.406 (61.603)	Top-5 acc 85.938 (82.479)	lr 0.01002
Train [68][2000/3239]	Time 2.885 (0.776)	Data Time 2.637 (0.275)	Loss 2.5976 (2.5844)	Entropy 0.61790 (0.61816)	Top-1 acc 60.938 (61.603)	Top-5 acc 82.422 (82.482)	lr 0.01002
Train [68][2010/3239]	Time 0.243 (0.774)	Data Time 0.001 (0.273)	Loss 2.4797 (2.5846)	Entropy 0.61814 (0.61816)	Top-1 acc 63.281 (61.599)	Top-5 acc 85.156 (82.479)	lr 0.01002
Train [68][2020/3239]	Time 0.490 (0.779)	Data Time 0.253 (0.278)	Loss 2.4809 (2.5845)	Entropy 0.61857 (0.61816)	Top-1 acc 64.453 (61.608)	Top-5 acc 84.766 (82.481)	lr 0.01002
Train [68][2030/3239]	Time 0.239 (0.781)	Data Time 0.001 (0.281)	Loss 2.6827 (2.5843)	Entropy 0.61831 (0.61816)	Top-1 acc 57.031 (61.608)	Top-5 acc 81.641 (82.481)	lr 0.01002
Train [68][2040/3239]	Time 0.245 (0.781)	Data Time 0.001 (0.281)	Loss 2.9166 (2.5846)	Entropy 0.61822 (0.61816)	Top-1 acc 51.172 (61.600)	Top-5 acc 76.172 (82.477)	lr 0.01002
Train [68][2050/3239]	Time 0.242 (0.786)	Data Time 0.002 (0.286)	Loss 2.3171 (2.5844)	Entropy 0.61820 (0.61816)	Top-1 acc 69.531 (61.602)	Top-5 acc 84.766 (82.478)	lr 0.01002
Train [68][2060/3239]	Time 0.239 (0.786)	Data Time 0.001 (0.287)	Loss 2.5325 (2.5841)	Entropy 0.61790 (0.61816)	Top-1 acc 63.281 (61.607)	Top-5 acc 82.812 (82.485)	lr 0.01002
Train [68][2070/3239]	Time 0.223 (0.788)	Data Time 0.001 (0.289)	Loss 3.0055 (2.5842)	Entropy 0.61781 (0.61816)	Top-1 acc 51.562 (61.605)	Top-5 acc 72.656 (82.484)	lr 0.01002
Train [68][2080/3239]	Time 0.225 (0.793)	Data Time 0.001 (0.295)	Loss 2.3230 (2.5842)	Entropy 0.61775 (0.61816)	Top-1 acc 66.797 (61.602)	Top-5 acc 86.719 (82.484)	lr 0.01002
Train [68][2090/3239]	Time 0.374 (0.793)	Data Time 0.001 (0.295)	Loss 2.3871 (2.5840)	Entropy 0.61782 (0.61816)	Top-1 acc 65.625 (61.608)	Top-5 acc 86.328 (82.489)	lr 0.01001
Train [68][2100/3239]	Time 0.244 (0.795)	Data Time 0.001 (0.297)	Loss 2.6266 (2.5839)	Entropy 0.61748 (0.61815)	Top-1 acc 59.375 (61.614)	Top-5 acc 82.422 (82.487)	lr 0.01001
Train [68][2110/3239]	Time 0.265 (0.800)	Data Time 0.001 (0.303)	Loss 2.4789 (2.5838)	Entropy 0.61773 (0.61815)	Top-1 acc 64.453 (61.613)	Top-5 acc 85.938 (82.491)	lr 0.01001
Train [68][2120/3239]	Time 0.252 (0.801)	Data Time 0.001 (0.304)	Loss 2.5285 (2.5836)	Entropy 0.61774 (0.61815)	Top-1 acc 62.109 (61.616)	Top-5 acc 84.375 (82.494)	lr 0.01001
Train [68][2130/3239]	Time 0.232 (0.802)	Data Time 0.001 (0.305)	Loss 2.4549 (2.5838)	Entropy 0.61795 (0.61815)	Top-1 acc 68.750 (61.617)	Top-5 acc 83.594 (82.492)	lr 0.01001
Train [68][2140/3239]	Time 5.110 (0.802)	Data Time 4.867 (0.306)	Loss 2.5580 (2.5839)	Entropy 0.61790 (0.61815)	Top-1 acc 61.328 (61.613)	Top-5 acc 82.031 (82.486)	lr 0.01001
Train [68][2150/3239]	Time 11.783 (0.810)	Data Time 11.539 (0.314)	Loss 2.5923 (2.5839)	Entropy 0.61801 (0.61815)	Top-1 acc 62.500 (61.618)	Top-5 acc 83.203 (82.484)	lr 0.01001
Train [68][2160/3239]	Time 0.430 (0.809)	Data Time 0.088 (0.314)	Loss 2.6735 (2.5842)	Entropy 0.61788 (0.61815)	Top-1 acc 58.203 (61.612)	Top-5 acc 80.859 (82.476)	lr 0.01001
Train [68][2170/3239]	Time 0.244 (0.807)	Data Time 0.001 (0.312)	Loss 2.7354 (2.5844)	Entropy 0.61797 (0.61814)	Top-1 acc 57.812 (61.609)	Top-5 acc 79.688 (82.475)	lr 0.01001
Train [68][2180/3239]	Time 0.247 (0.812)	Data Time 0.001 (0.317)	Loss 2.5109 (2.5841)	Entropy 0.61823 (0.61814)	Top-1 acc 62.500 (61.616)	Top-5 acc 83.984 (82.480)	lr 0.01001
Train [68][2190/3239]	Time 0.246 (0.816)	Data Time 0.001 (0.322)	Loss 2.5454 (2.5842)	Entropy 0.61822 (0.61814)	Top-1 acc 60.938 (61.618)	Top-5 acc 82.812 (82.478)	lr 0.01000
Train [68][2200/3239]	Time 0.227 (0.816)	Data Time 0.001 (0.323)	Loss 2.6896 (2.5843)	Entropy 0.61831 (0.61814)	Top-1 acc 62.500 (61.620)	Top-5 acc 80.859 (82.473)	lr 0.01000
Train [68][2210/3239]	Time 0.235 (0.821)	Data Time 0.001 (0.327)	Loss 2.5201 (2.5844)	Entropy 0.61835 (0.61815)	Top-1 acc 62.109 (61.624)	Top-5 acc 82.812 (82.472)	lr 0.01000
Train [68][2220/3239]	Time 0.229 (0.825)	Data Time 0.001 (0.331)	Loss 2.6716 (2.5845)	Entropy 0.61832 (0.61815)	Top-1 acc 57.422 (61.617)	Top-5 acc 79.688 (82.468)	lr 0.01000
Train [68][2230/3239]	Time 0.242 (0.826)	Data Time 0.001 (0.333)	Loss 2.7048 (2.5845)	Entropy 0.61831 (0.61815)	Top-1 acc 58.203 (61.617)	Top-5 acc 79.688 (82.467)	lr 0.01000
Train [68][2240/3239]	Time 0.246 (0.831)	Data Time 0.001 (0.338)	Loss 2.5997 (2.5843)	Entropy 0.61812 (0.61815)	Top-1 acc 60.547 (61.622)	Top-5 acc 80.078 (82.469)	lr 0.01000
Train [68][2250/3239]	Time 0.343 (0.831)	Data Time 0.001 (0.339)	Loss 2.6869 (2.5846)	Entropy 0.61796 (0.61815)	Top-1 acc 61.328 (61.611)	Top-5 acc 80.859 (82.460)	lr 0.01000
Train [68][2260/3239]	Time 0.226 (0.834)	Data Time 0.001 (0.343)	Loss 2.4363 (2.5843)	Entropy 0.61794 (0.61815)	Top-1 acc 65.625 (61.621)	Top-5 acc 84.375 (82.467)	lr 0.01000
Train [68][2270/3239]	Time 1.551 (0.835)	Data Time 1.308 (0.343)	Loss 2.9445 (2.5843)	Entropy 0.61813 (0.61815)	Top-1 acc 53.906 (61.623)	Top-5 acc 76.953 (82.468)	lr 0.01000
Train [68][2280/3239]	Time 0.234 (0.839)	Data Time 0.002 (0.348)	Loss 2.6876 (2.5843)	Entropy 0.61823 (0.61815)	Top-1 acc 59.375 (61.625)	Top-5 acc 78.906 (82.469)	lr 0.01000
Train [68][2290/3239]	Time 0.223 (0.841)	Data Time 0.001 (0.350)	Loss 2.5797 (2.5843)	Entropy 0.61835 (0.61815)	Top-1 acc 62.109 (61.624)	Top-5 acc 83.203 (82.470)	lr 0.01000
Train [68][2300/3239]	Time 0.256 (0.840)	Data Time 0.001 (0.350)	Loss 2.6651 (2.5841)	Entropy 0.61840 (0.61815)	Top-1 acc 59.375 (61.632)	Top-5 acc 80.078 (82.472)	lr 0.00999
Train [68][2310/3239]	Time 4.708 (0.847)	Data Time 4.460 (0.357)	Loss 2.4899 (2.5840)	Entropy 0.61831 (0.61815)	Top-1 acc 61.328 (61.628)	Top-5 acc 84.766 (82.473)	lr 0.00999
Train [68][2320/3239]	Time 0.414 (0.864)	Data Time 0.004 (0.355)	Loss 2.7473 (2.5845)	Entropy 0.61845 (0.61815)	Top-1 acc 57.031 (61.620)	Top-5 acc 76.953 (82.466)	lr 0.00999
Train [68][2330/3239]	Time 0.240 (0.862)	Data Time 0.001 (0.353)	Loss 2.5598 (2.5847)	Entropy 0.61866 (0.61815)	Top-1 acc 60.156 (61.613)	Top-5 acc 84.766 (82.465)	lr 0.00999
Train [68][2340/3239]	Time 0.240 (0.860)	Data Time 0.001 (0.352)	Loss 2.6808 (2.5850)	Entropy 0.61882 (0.61815)	Top-1 acc 61.719 (61.609)	Top-5 acc 79.297 (82.461)	lr 0.00999
Train [68][2350/3239]	Time 0.259 (0.858)	Data Time 0.001 (0.350)	Loss 2.6554 (2.5851)	Entropy 0.61838 (0.61815)	Top-1 acc 58.594 (61.609)	Top-5 acc 83.203 (82.461)	lr 0.00999
Train [68][2360/3239]	Time 0.233 (0.856)	Data Time 0.001 (0.349)	Loss 2.4619 (2.5848)	Entropy 0.61837 (0.61816)	Top-1 acc 65.234 (61.615)	Top-5 acc 84.375 (82.467)	lr 0.00999
Train [68][2370/3239]	Time 0.247 (0.856)	Data Time 0.001 (0.349)	Loss 2.5304 (2.5847)	Entropy 0.61796 (0.61816)	Top-1 acc 60.547 (61.611)	Top-5 acc 84.766 (82.470)	lr 0.00999
Train [68][2380/3239]	Time 0.255 (0.859)	Data Time 0.001 (0.353)	Loss 2.4770 (2.5845)	Entropy 0.61803 (0.61815)	Top-1 acc 62.891 (61.618)	Top-5 acc 85.156 (82.475)	lr 0.00999
Train [68][2390/3239]	Time 0.243 (0.859)	Data Time 0.001 (0.353)	Loss 2.6071 (2.5846)	Entropy 0.61833 (0.61815)	Top-1 acc 59.766 (61.619)	Top-5 acc 82.812 (82.472)	lr 0.00999
Train [68][2400/3239]	Time 0.265 (0.863)	Data Time 0.001 (0.357)	Loss 2.3534 (2.5844)	Entropy 0.61789 (0.61815)	Top-1 acc 66.406 (61.626)	Top-5 acc 86.719 (82.475)	lr 0.00998
Train [68][2410/3239]	Time 0.336 (0.864)	Data Time 0.001 (0.358)	Loss 2.5912 (2.5846)	Entropy 0.61801 (0.61815)	Top-1 acc 61.328 (61.620)	Top-5 acc 81.641 (82.472)	lr 0.00998
Train [68][2420/3239]	Time 0.249 (0.867)	Data Time 0.001 (0.362)	Loss 2.5109 (2.5846)	Entropy 0.61777 (0.61815)	Top-1 acc 62.891 (61.622)	Top-5 acc 84.766 (82.472)	lr 0.00998
Train [68][2430/3239]	Time 0.266 (0.868)	Data Time 0.001 (0.363)	Loss 2.3970 (2.5845)	Entropy 0.61758 (0.61815)	Top-1 acc 67.188 (61.627)	Top-5 acc 84.766 (82.472)	lr 0.00998
Train [68][2440/3239]	Time 0.234 (0.871)	Data Time 0.001 (0.366)	Loss 2.5975 (2.5846)	Entropy 0.61757 (0.61815)	Top-1 acc 63.281 (61.626)	Top-5 acc 80.469 (82.469)	lr 0.00998
Train [68][2450/3239]	Time 3.302 (0.874)	Data Time 3.053 (0.369)	Loss 2.8316 (2.5848)	Entropy 0.61714 (0.61815)	Top-1 acc 57.031 (61.625)	Top-5 acc 76.953 (82.467)	lr 0.00998
Train [68][2460/3239]	Time 2.771 (0.875)	Data Time 2.512 (0.371)	Loss 2.4359 (2.5849)	Entropy 0.61709 (0.61814)	Top-1 acc 66.016 (61.620)	Top-5 acc 86.328 (82.467)	lr 0.00998
Train [68][2470/3239]	Time 3.244 (0.878)	Data Time 2.961 (0.374)	Loss 2.6602 (2.5848)	Entropy 0.61707 (0.61814)	Top-1 acc 59.766 (61.625)	Top-5 acc 82.031 (82.469)	lr 0.00998
Train [68][2480/3239]	Time 0.345 (0.880)	Data Time 0.002 (0.377)	Loss 2.8966 (2.5852)	Entropy 0.61705 (0.61813)	Top-1 acc 55.078 (61.619)	Top-5 acc 78.516 (82.464)	lr 0.00998
Train [68][2490/3239]	Time 0.246 (0.882)	Data Time 0.001 (0.379)	Loss 2.7791 (2.5853)	Entropy 0.61706 (0.61813)	Top-1 acc 59.375 (61.616)	Top-5 acc 76.953 (82.459)	lr 0.00998
Train [68][2500/3239]	Time 0.239 (0.884)	Data Time 0.001 (0.381)	Loss 2.2924 (2.5853)	Entropy 0.61679 (0.61812)	Top-1 acc 67.969 (61.613)	Top-5 acc 88.281 (82.460)	lr 0.00997
Train [68][2510/3239]	Time 7.863 (0.889)	Data Time 7.621 (0.386)	Loss 2.3924 (2.5851)	Entropy 0.61664 (0.61812)	Top-1 acc 68.359 (61.618)	Top-5 acc 88.672 (82.465)	lr 0.00997
Train [68][2520/3239]	Time 0.265 (0.890)	Data Time 0.001 (0.388)	Loss 2.4149 (2.5849)	Entropy 0.61660 (0.61811)	Top-1 acc 64.844 (61.623)	Top-5 acc 84.375 (82.468)	lr 0.00997
Train [68][2530/3239]	Time 0.255 (0.892)	Data Time 0.001 (0.390)	Loss 2.7091 (2.5849)	Entropy 0.61677 (0.61811)	Top-1 acc 61.719 (61.621)	Top-5 acc 78.906 (82.470)	lr 0.00997
Train [68][2540/3239]	Time 0.233 (0.894)	Data Time 0.001 (0.393)	Loss 2.5663 (2.5848)	Entropy 0.61682 (0.61810)	Top-1 acc 62.500 (61.624)	Top-5 acc 83.984 (82.474)	lr 0.00997
Train [68][2550/3239]	Time 0.227 (0.897)	Data Time 0.001 (0.396)	Loss 2.4251 (2.5847)	Entropy 0.61652 (0.61810)	Top-1 acc 66.406 (61.625)	Top-5 acc 83.984 (82.475)	lr 0.00997
Train [68][2560/3239]	Time 0.238 (0.899)	Data Time 0.001 (0.398)	Loss 2.3998 (2.5845)	Entropy 0.61653 (0.61809)	Top-1 acc 64.453 (61.633)	Top-5 acc 85.547 (82.477)	lr 0.00997
Train [68][2570/3239]	Time 0.246 (0.898)	Data Time 0.001 (0.398)	Loss 2.5236 (2.5846)	Entropy 0.61621 (0.61808)	Top-1 acc 59.766 (61.630)	Top-5 acc 83.984 (82.475)	lr 0.00997
Train [68][2580/3239]	Time 0.244 (0.904)	Data Time 0.001 (0.404)	Loss 2.6917 (2.5846)	Entropy 0.61648 (0.61808)	Top-1 acc 60.547 (61.631)	Top-5 acc 80.469 (82.475)	lr 0.00997
Train [68][2590/3239]	Time 0.250 (0.905)	Data Time 0.001 (0.405)	Loss 2.6876 (2.5843)	Entropy 0.61654 (0.61807)	Top-1 acc 58.594 (61.638)	Top-5 acc 79.688 (82.480)	lr 0.00997
Train [68][2600/3239]	Time 0.260 (0.905)	Data Time 0.001 (0.405)	Loss 2.5102 (2.5843)	Entropy 0.61655 (0.61806)	Top-1 acc 62.891 (61.639)	Top-5 acc 86.328 (82.483)	lr 0.00996
Train [68][2610/3239]	Time 6.701 (0.910)	Data Time 6.458 (0.411)	Loss 2.7690 (2.5845)	Entropy 0.61641 (0.61806)	Top-1 acc 58.984 (61.636)	Top-5 acc 81.250 (82.479)	lr 0.00996
Train [68][2620/3239]	Time 0.246 (0.912)	Data Time 0.001 (0.414)	Loss 2.3883 (2.5845)	Entropy 0.61616 (0.61805)	Top-1 acc 67.578 (61.635)	Top-5 acc 87.109 (82.482)	lr 0.00996
Train [68][2630/3239]	Time 0.691 (0.911)	Data Time 0.465 (0.412)	Loss 2.4649 (2.5844)	Entropy 0.61608 (0.61804)	Top-1 acc 64.453 (61.639)	Top-5 acc 83.984 (82.485)	lr 0.00996
Train [68][2640/3239]	Time 0.343 (0.915)	Data Time 0.001 (0.417)	Loss 2.7351 (2.5846)	Entropy 0.61626 (0.61804)	Top-1 acc 60.938 (61.637)	Top-5 acc 77.344 (82.480)	lr 0.00996
Train [68][2650/3239]	Time 0.228 (0.921)	Data Time 0.001 (0.423)	Loss 2.5598 (2.5844)	Entropy 0.61618 (0.61803)	Top-1 acc 60.547 (61.641)	Top-5 acc 83.203 (82.486)	lr 0.00996
Train [68][2660/3239]	Time 0.231 (0.919)	Data Time 0.001 (0.421)	Loss 2.6155 (2.5843)	Entropy 0.61627 (0.61802)	Top-1 acc 62.500 (61.645)	Top-5 acc 83.594 (82.487)	lr 0.00996
Train [68][2670/3239]	Time 7.843 (0.924)	Data Time 7.595 (0.426)	Loss 2.7057 (2.5843)	Entropy 0.61636 (0.61802)	Top-1 acc 60.547 (61.648)	Top-5 acc 79.297 (82.487)	lr 0.00996
Train [68][2680/3239]	Time 0.233 (0.924)	Data Time 0.001 (0.427)	Loss 2.7030 (2.5844)	Entropy 0.61635 (0.61801)	Top-1 acc 57.812 (61.648)	Top-5 acc 80.859 (82.487)	lr 0.00996
Train [68][2690/3239]	Time 0.230 (0.929)	Data Time 0.001 (0.432)	Loss 2.7327 (2.5844)	Entropy 0.61655 (0.61800)	Top-1 acc 61.328 (61.651)	Top-5 acc 80.078 (82.485)	lr 0.00996
Train [68][2700/3239]	Time 0.224 (0.929)	Data Time 0.001 (0.433)	Loss 2.5159 (2.5844)	Entropy 0.61665 (0.61800)	Top-1 acc 62.500 (61.648)	Top-5 acc 86.328 (82.486)	lr 0.00995
Train [68][2710/3239]	Time 0.328 (0.933)	Data Time 0.001 (0.437)	Loss 2.7962 (2.5845)	Entropy 0.61657 (0.61799)	Top-1 acc 54.688 (61.642)	Top-5 acc 76.562 (82.483)	lr 0.00995
Train [68][2720/3239]	Time 0.230 (0.938)	Data Time 0.001 (0.442)	Loss 2.3607 (2.5844)	Entropy 0.61680 (0.61799)	Top-1 acc 66.797 (61.647)	Top-5 acc 84.766 (82.480)	lr 0.00995
Train [68][2730/3239]	Time 0.235 (0.936)	Data Time 0.001 (0.441)	Loss 2.4928 (2.5844)	Entropy 0.61700 (0.61798)	Top-1 acc 62.891 (61.647)	Top-5 acc 85.547 (82.481)	lr 0.00995
Train [68][2740/3239]	Time 0.236 (0.939)	Data Time 0.001 (0.443)	Loss 2.6022 (2.5841)	Entropy 0.61694 (0.61798)	Top-1 acc 60.156 (61.652)	Top-5 acc 84.766 (82.488)	lr 0.00995
Train [68][2750/3239]	Time 0.247 (0.939)	Data Time 0.001 (0.444)	Loss 2.5013 (2.5841)	Entropy 0.61683 (0.61798)	Top-1 acc 64.062 (61.653)	Top-5 acc 84.375 (82.487)	lr 0.00995
Train [68][2760/3239]	Time 0.274 (0.942)	Data Time 0.001 (0.447)	Loss 2.6800 (2.5841)	Entropy 0.61640 (0.61797)	Top-1 acc 58.594 (61.655)	Top-5 acc 82.031 (82.489)	lr 0.00995
Train [68][2770/3239]	Time 5.101 (0.943)	Data Time 4.846 (0.449)	Loss 2.5876 (2.5841)	Entropy 0.61655 (0.61797)	Top-1 acc 58.984 (61.654)	Top-5 acc 83.203 (82.490)	lr 0.00995
Train [68][2780/3239]	Time 0.256 (0.943)	Data Time 0.001 (0.449)	Loss 2.3456 (2.5839)	Entropy 0.61636 (0.61796)	Top-1 acc 65.625 (61.660)	Top-5 acc 87.891 (82.495)	lr 0.00995
Train [68][2790/3239]	Time 3.431 (0.945)	Data Time 3.191 (0.451)	Loss 2.4370 (2.5837)	Entropy 0.61611 (0.61795)	Top-1 acc 62.109 (61.660)	Top-5 acc 85.156 (82.498)	lr 0.00995
Train [68][2800/3239]	Time 0.346 (0.944)	Data Time 0.001 (0.450)	Loss 2.3742 (2.5836)	Entropy 0.61588 (0.61795)	Top-1 acc 67.969 (61.664)	Top-5 acc 87.891 (82.498)	lr 0.00994
Train [68][2810/3239]	Time 0.239 (0.947)	Data Time 0.001 (0.453)	Loss 2.5104 (2.5836)	Entropy 0.61608 (0.61794)	Top-1 acc 61.328 (61.662)	Top-5 acc 85.938 (82.499)	lr 0.00994
Train [68][2820/3239]	Time 0.250 (0.947)	Data Time 0.001 (0.454)	Loss 2.5405 (2.5837)	Entropy 0.61595 (0.61793)	Top-1 acc 64.062 (61.660)	Top-5 acc 85.547 (82.499)	lr 0.00994
Train [68][2830/3239]	Time 2.546 (0.948)	Data Time 2.291 (0.454)	Loss 2.5350 (2.5837)	Entropy 0.61595 (0.61793)	Top-1 acc 60.938 (61.661)	Top-5 acc 83.203 (82.497)	lr 0.00994
Train [68][2840/3239]	Time 0.240 (0.949)	Data Time 0.001 (0.457)	Loss 2.6599 (2.5837)	Entropy 0.61585 (0.61792)	Top-1 acc 60.547 (61.662)	Top-5 acc 80.859 (82.496)	lr 0.00994
Train [68][2850/3239]	Time 0.253 (0.952)	Data Time 0.001 (0.460)	Loss 2.8057 (2.5838)	Entropy 0.61598 (0.61791)	Top-1 acc 57.422 (61.665)	Top-5 acc 75.781 (82.494)	lr 0.00994
Train [68][2860/3239]	Time 0.275 (0.950)	Data Time 0.001 (0.458)	Loss 2.4508 (2.5836)	Entropy 0.61617 (0.61791)	Top-1 acc 63.672 (61.670)	Top-5 acc 85.938 (82.499)	lr 0.00994
Train [68][2870/3239]	Time 0.319 (0.952)	Data Time 0.001 (0.460)	Loss 2.7273 (2.5835)	Entropy 0.61628 (0.61790)	Top-1 acc 59.766 (61.672)	Top-5 acc 79.688 (82.499)	lr 0.00994
Train [68][2880/3239]	Time 6.893 (0.957)	Data Time 6.631 (0.465)	Loss 2.6793 (2.5833)	Entropy 0.61628 (0.61790)	Top-1 acc 58.984 (61.676)	Top-5 acc 80.469 (82.502)	lr 0.00994
Train [68][2890/3239]	Time 0.239 (0.955)	Data Time 0.001 (0.463)	Loss 2.3891 (2.5831)	Entropy 0.61602 (0.61789)	Top-1 acc 67.578 (61.681)	Top-5 acc 86.719 (82.507)	lr 0.00994
Train [68][2900/3239]	Time 0.229 (0.957)	Data Time 0.001 (0.466)	Loss 2.5630 (2.5831)	Entropy 0.61627 (0.61788)	Top-1 acc 59.375 (61.683)	Top-5 acc 82.422 (82.509)	lr 0.00993
Train [68][2910/3239]	Time 0.238 (0.957)	Data Time 0.001 (0.466)	Loss 2.5295 (2.5830)	Entropy 0.61604 (0.61788)	Top-1 acc 63.281 (61.684)	Top-5 acc 84.766 (82.511)	lr 0.00993
Train [68][2920/3239]	Time 0.277 (0.958)	Data Time 0.003 (0.467)	Loss 2.6606 (2.5834)	Entropy 0.61586 (0.61787)	Top-1 acc 59.766 (61.677)	Top-5 acc 81.641 (82.500)	lr 0.00993
Train [68][2930/3239]	Time 12.346 (0.961)	Data Time 12.059 (0.470)	Loss 2.4068 (2.5832)	Entropy 0.61602 (0.61786)	Top-1 acc 66.016 (61.683)	Top-5 acc 86.719 (82.503)	lr 0.00993
Train [68][2940/3239]	Time 0.247 (0.959)	Data Time 0.001 (0.469)	Loss 2.5878 (2.5833)	Entropy 0.61630 (0.61786)	Top-1 acc 60.547 (61.681)	Top-5 acc 81.641 (82.502)	lr 0.00993
Train [68][2950/3239]	Time 0.233 (0.960)	Data Time 0.001 (0.470)	Loss 2.6064 (2.5833)	Entropy 0.61611 (0.61785)	Top-1 acc 59.766 (61.680)	Top-5 acc 83.203 (82.499)	lr 0.00993
Train [68][2960/3239]	Time 0.383 (0.958)	Data Time 0.001 (0.468)	Loss 2.6463 (2.5834)	Entropy 0.61618 (0.61785)	Top-1 acc 60.938 (61.676)	Top-5 acc 80.469 (82.496)	lr 0.00993
Train [68][2970/3239]	Time 0.296 (0.973)	Data Time 0.004 (0.468)	Loss 2.5556 (2.5835)	Entropy 0.61638 (0.61784)	Top-1 acc 63.281 (61.677)	Top-5 acc 83.594 (82.494)	lr 0.00993
Train [68][2980/3239]	Time 0.241 (0.971)	Data Time 0.002 (0.467)	Loss 2.8995 (2.5836)	Entropy 0.61642 (0.61784)	Top-1 acc 56.250 (61.675)	Top-5 acc 79.297 (82.492)	lr 0.00993
Train [68][2990/3239]	Time 0.242 (0.969)	Data Time 0.002 (0.465)	Loss 2.7372 (2.5835)	Entropy 0.61606 (0.61783)	Top-1 acc 58.594 (61.676)	Top-5 acc 80.469 (82.490)	lr 0.00993
Train [68][3000/3239]	Time 0.232 (0.968)	Data Time 0.002 (0.463)	Loss 2.6169 (2.5836)	Entropy 0.61621 (0.61783)	Top-1 acc 59.766 (61.674)	Top-5 acc 81.641 (82.487)	lr 0.00992
Train [68][3010/3239]	Time 0.248 (0.966)	Data Time 0.002 (0.462)	Loss 2.6474 (2.5835)	Entropy 0.61616 (0.61782)	Top-1 acc 58.594 (61.679)	Top-5 acc 85.547 (82.491)	lr 0.00992
Train [68][3020/3239]	Time 0.245 (0.964)	Data Time 0.001 (0.460)	Loss 2.5844 (2.5835)	Entropy 0.61652 (0.61781)	Top-1 acc 57.812 (61.678)	Top-5 acc 83.594 (82.490)	lr 0.00992
Train [68][3030/3239]	Time 0.328 (0.962)	Data Time 0.001 (0.459)	Loss 2.5386 (2.5834)	Entropy 0.61651 (0.61781)	Top-1 acc 64.062 (61.680)	Top-5 acc 85.156 (82.491)	lr 0.00992
Train [68][3040/3239]	Time 0.272 (0.961)	Data Time 0.001 (0.457)	Loss 2.5788 (2.5835)	Entropy 0.61648 (0.61781)	Top-1 acc 57.031 (61.679)	Top-5 acc 80.859 (82.488)	lr 0.00992
Train [68][3050/3239]	Time 0.249 (0.960)	Data Time 0.001 (0.457)	Loss 2.4814 (2.5834)	Entropy 0.61678 (0.61780)	Top-1 acc 64.844 (61.676)	Top-5 acc 85.156 (82.491)	lr 0.00992
Train [68][3060/3239]	Time 0.290 (0.959)	Data Time 0.003 (0.456)	Loss 2.4782 (2.5835)	Entropy 0.61690 (0.61780)	Top-1 acc 64.844 (61.675)	Top-5 acc 83.594 (82.491)	lr 0.00992
Train [68][3070/3239]	Time 0.233 (0.960)	Data Time 0.001 (0.457)	Loss 2.6798 (2.5836)	Entropy 0.61705 (0.61780)	Top-1 acc 60.156 (61.673)	Top-5 acc 79.688 (82.488)	lr 0.00992
Train [68][3080/3239]	Time 0.702 (0.962)	Data Time 0.456 (0.459)	Loss 2.5820 (2.5836)	Entropy 0.61681 (0.61779)	Top-1 acc 62.109 (61.675)	Top-5 acc 80.469 (82.489)	lr 0.00992
Train [68][3090/3239]	Time 0.258 (0.962)	Data Time 0.001 (0.460)	Loss 2.5062 (2.5837)	Entropy 0.61687 (0.61779)	Top-1 acc 61.328 (61.668)	Top-5 acc 85.547 (82.489)	lr 0.00992
Train [68][3100/3239]	Time 0.228 (0.964)	Data Time 0.001 (0.462)	Loss 2.7774 (2.5839)	Entropy 0.61684 (0.61779)	Top-1 acc 58.984 (61.667)	Top-5 acc 79.688 (82.485)	lr 0.00991
Train [68][3110/3239]	Time 0.234 (0.965)	Data Time 0.001 (0.463)	Loss 2.5918 (2.5837)	Entropy 0.61707 (0.61778)	Top-1 acc 59.375 (61.668)	Top-5 acc 81.641 (82.485)	lr 0.00991
Train [68][3120/3239]	Time 0.340 (0.965)	Data Time 0.001 (0.463)	Loss 2.4998 (2.5834)	Entropy 0.61692 (0.61778)	Top-1 acc 68.750 (61.675)	Top-5 acc 85.156 (82.491)	lr 0.00991
Train [68][3130/3239]	Time 11.875 (0.967)	Data Time 11.611 (0.466)	Loss 2.6205 (2.5834)	Entropy 0.61675 (0.61778)	Top-1 acc 63.281 (61.678)	Top-5 acc 79.688 (82.489)	lr 0.00991
Train [68][3140/3239]	Time 6.001 (0.969)	Data Time 5.755 (0.468)	Loss 2.6276 (2.5835)	Entropy 0.61714 (0.61778)	Top-1 acc 62.109 (61.674)	Top-5 acc 80.469 (82.488)	lr 0.00991
Train [68][3150/3239]	Time 0.253 (0.967)	Data Time 0.002 (0.467)	Loss 2.5951 (2.5834)	Entropy 0.61675 (0.61777)	Top-1 acc 58.984 (61.675)	Top-5 acc 81.250 (82.488)	lr 0.00991
Train [68][3160/3239]	Time 0.239 (0.967)	Data Time 0.001 (0.467)	Loss 2.6410 (2.5833)	Entropy 0.61680 (0.61777)	Top-1 acc 59.766 (61.678)	Top-5 acc 82.031 (82.490)	lr 0.00991
Train [68][3170/3239]	Time 2.379 (0.970)	Data Time 2.152 (0.470)	Loss 2.4867 (2.5833)	Entropy 0.61678 (0.61777)	Top-1 acc 62.891 (61.679)	Top-5 acc 83.594 (82.492)	lr 0.00991
Train [68][3180/3239]	Time 0.272 (0.970)	Data Time 0.000 (0.470)	Loss 2.8867 (2.5834)	Entropy 0.61670 (0.61776)	Top-1 acc 54.688 (61.677)	Top-5 acc 77.734 (82.492)	lr 0.00991
Train [68][3190/3239]	Time 0.407 (0.969)	Data Time 0.000 (0.470)	Loss 2.5961 (2.5834)	Entropy 0.61668 (0.61776)	Top-1 acc 60.938 (61.675)	Top-5 acc 80.859 (82.488)	lr 0.00991
Train [68][3200/3239]	Time 2.918 (0.972)	Data Time 2.681 (0.473)	Loss 2.4554 (2.5832)	Entropy 0.61665 (0.61776)	Top-1 acc 64.453 (61.681)	Top-5 acc 85.938 (82.492)	lr 0.00991
Train [68][3210/3239]	Time 0.271 (0.973)	Data Time 0.000 (0.474)	Loss 2.6566 (2.5832)	Entropy 0.61675 (0.61775)	Top-1 acc 58.594 (61.683)	Top-5 acc 81.641 (82.492)	lr 0.00990
Train [68][3220/3239]	Time 0.317 (0.972)	Data Time 0.083 (0.473)	Loss 2.4835 (2.5832)	Entropy 0.61652 (0.61775)	Top-1 acc 62.891 (61.681)	Top-5 acc 85.938 (82.492)	lr 0.00990
Train [68][3230/3239]	Time 0.229 (0.971)	Data Time 0.000 (0.473)	Loss 2.5549 (2.5833)	Entropy 0.61656 (0.61775)	Top-1 acc 61.719 (61.681)	Top-5 acc 81.250 (82.491)	lr 0.00990
Train [68][3239/3239]	Time 0.981 (0.972)	Data Time 0.000 (0.474)	Loss 2.7275 (2.5834)	Entropy 0.61630 (0.61774)	Top-1 acc 60.494 (61.675)	Top-5 acc 77.778 (82.490)	lr 0.00990
==========Valid [68/120]	loss 1.371	top-1 acc 68.481 (68.558)	top-5 acc 88.309	Train top-1 61.675	top-5 82.490	Entropy 0.61630	Latency-None: 0.000ms	Flops: 539.00M
Train [69][0/3239]	Time 41.405 (41.405)	Data Time 40.038 (40.038)	Loss 2.6732 (2.6732)	Entropy 0.61591 (0.61591)	Top-1 acc 62.109 (62.109)	Top-5 acc 81.250 (81.250)	lr 0.00990
Train [69][10/3239]	Time 0.235 (4.223)	Data Time 0.001 (3.670)	Loss 2.5388 (2.5634)	Entropy 0.61599 (0.61599)	Top-1 acc 65.625 (62.713)	Top-5 acc 83.984 (82.599)	lr 0.00990
Train [69][20/3239]	Time 0.344 (2.426)	Data Time 0.001 (1.923)	Loss 2.5938 (2.5791)	Entropy 0.61572 (0.61597)	Top-1 acc 64.453 (62.184)	Top-5 acc 82.031 (82.310)	lr 0.00990
Train [69][30/3239]	Time 0.322 (1.798)	Data Time 0.036 (1.304)	Loss 2.4243 (2.5515)	Entropy 0.61562 (0.61587)	Top-1 acc 62.109 (62.399)	Top-5 acc 86.719 (82.825)	lr 0.00990
Train [69][40/3239]	Time 0.239 (1.488)	Data Time 0.001 (1.009)	Loss 2.4510 (2.5485)	Entropy 0.61556 (0.61580)	Top-1 acc 64.844 (62.376)	Top-5 acc 84.766 (82.955)	lr 0.00990
Train [69][50/3239]	Time 0.242 (1.304)	Data Time 0.001 (0.812)	Loss 2.5382 (2.5680)	Entropy 0.61535 (0.61572)	Top-1 acc 58.594 (61.803)	Top-5 acc 85.547 (82.613)	lr 0.00990
Train [69][60/3239]	Time 0.291 (1.171)	Data Time 0.001 (0.679)	Loss 2.9115 (2.5666)	Entropy 0.61555 (0.61567)	Top-1 acc 55.078 (62.033)	Top-5 acc 76.953 (82.652)	lr 0.00990
Train [69][70/3239]	Time 0.236 (1.069)	Data Time 0.001 (0.584)	Loss 2.9604 (2.5752)	Entropy 0.61543 (0.61565)	Top-1 acc 53.906 (61.889)	Top-5 acc 72.266 (82.416)	lr 0.00989
Train [69][80/3239]	Time 0.242 (0.988)	Data Time 0.001 (0.512)	Loss 2.6260 (2.5698)	Entropy 0.61539 (0.61563)	Top-1 acc 60.938 (62.052)	Top-5 acc 82.031 (82.480)	lr 0.00989
Train [69][90/3239]	Time 0.419 (0.932)	Data Time 0.002 (0.456)	Loss 2.2635 (2.5645)	Entropy 0.61590 (0.61563)	Top-1 acc 69.922 (62.165)	Top-5 acc 87.500 (82.667)	lr 0.00989
Train [69][100/3239]	Time 0.232 (0.907)	Data Time 0.001 (0.435)	Loss 2.4152 (2.5620)	Entropy 0.61576 (0.61566)	Top-1 acc 68.359 (62.214)	Top-5 acc 85.156 (82.785)	lr 0.00989
Train [69][110/3239]	Time 0.244 (0.863)	Data Time 0.001 (0.396)	Loss 2.5814 (2.5651)	Entropy 0.61593 (0.61568)	Top-1 acc 61.719 (62.268)	Top-5 acc 82.031 (82.707)	lr 0.00989
Train [69][120/3239]	Time 0.230 (0.834)	Data Time 0.001 (0.364)	Loss 2.4951 (2.5644)	Entropy 0.61632 (0.61571)	Top-1 acc 62.891 (62.284)	Top-5 acc 85.547 (82.751)	lr 0.00989
Train [69][130/3239]	Time 0.232 (0.801)	Data Time 0.001 (0.336)	Loss 2.4466 (2.5631)	Entropy 0.61635 (0.61576)	Top-1 acc 66.016 (62.354)	Top-5 acc 84.375 (82.738)	lr 0.00989
Train [69][140/3239]	Time 0.256 (0.782)	Data Time 0.001 (0.321)	Loss 2.5028 (2.5605)	Entropy 0.61667 (0.61582)	Top-1 acc 64.453 (62.422)	Top-5 acc 84.375 (82.829)	lr 0.00989
Train [69][150/3239]	Time 0.303 (0.758)	Data Time 0.001 (0.300)	Loss 2.6552 (2.5626)	Entropy 0.61657 (0.61587)	Top-1 acc 64.062 (62.412)	Top-5 acc 81.250 (82.841)	lr 0.00989
Train [69][160/3239]	Time 0.270 (0.739)	Data Time 0.001 (0.281)	Loss 2.5581 (2.5611)	Entropy 0.61671 (0.61593)	Top-1 acc 60.938 (62.447)	Top-5 acc 85.547 (82.866)	lr 0.00989
Train [69][170/3239]	Time 0.243 (0.742)	Data Time 0.002 (0.285)	Loss 2.4746 (2.5575)	Entropy 0.61637 (0.61596)	Top-1 acc 63.281 (62.550)	Top-5 acc 85.156 (82.963)	lr 0.00988
Train [69][180/3239]	Time 0.313 (0.726)	Data Time 0.001 (0.269)	Loss 2.6700 (2.5576)	Entropy 0.61623 (0.61598)	Top-1 acc 59.375 (62.485)	Top-5 acc 84.375 (82.992)	lr 0.00988
Train [69][190/3239]	Time 0.252 (0.710)	Data Time 0.001 (0.255)	Loss 2.6284 (2.5595)	Entropy 0.61588 (0.61599)	Top-1 acc 63.672 (62.449)	Top-5 acc 82.031 (82.915)	lr 0.00988
Train [69][200/3239]	Time 0.232 (0.694)	Data Time 0.001 (0.243)	Loss 2.6561 (2.5614)	Entropy 0.61605 (0.61599)	Top-1 acc 58.203 (62.378)	Top-5 acc 80.859 (82.917)	lr 0.00988
Train [69][210/3239]	Time 0.228 (0.681)	Data Time 0.001 (0.231)	Loss 2.6329 (2.5604)	Entropy 0.61577 (0.61598)	Top-1 acc 59.375 (62.393)	Top-5 acc 81.641 (82.972)	lr 0.00988
Train [69][220/3239]	Time 0.256 (0.669)	Data Time 0.001 (0.221)	Loss 2.8103 (2.5610)	Entropy 0.61581 (0.61597)	Top-1 acc 57.812 (62.401)	Top-5 acc 75.000 (82.966)	lr 0.00988
Train [69][230/3239]	Time 0.249 (0.659)	Data Time 0.001 (0.211)	Loss 2.6148 (2.5592)	Entropy 0.61613 (0.61597)	Top-1 acc 59.766 (62.443)	Top-5 acc 83.984 (83.032)	lr 0.00988
Train [69][240/3239]	Time 0.272 (0.649)	Data Time 0.001 (0.203)	Loss 2.5423 (2.5566)	Entropy 0.61600 (0.61597)	Top-1 acc 62.109 (62.515)	Top-5 acc 81.641 (83.085)	lr 0.00988
Train [69][250/3239]	Time 0.383 (0.641)	Data Time 0.002 (0.195)	Loss 2.3837 (2.5549)	Entropy 0.61581 (0.61596)	Top-1 acc 64.453 (62.565)	Top-5 acc 87.109 (83.125)	lr 0.00988
Train [69][260/3239]	Time 0.285 (0.636)	Data Time 0.001 (0.189)	Loss 2.5009 (2.5581)	Entropy 0.61543 (0.61595)	Top-1 acc 66.406 (62.494)	Top-5 acc 85.547 (83.070)	lr 0.00988
Train [69][270/3239]	Time 0.252 (0.627)	Data Time 0.001 (0.182)	Loss 2.5880 (2.5579)	Entropy 0.61521 (0.61593)	Top-1 acc 63.672 (62.507)	Top-5 acc 80.469 (83.065)	lr 0.00987
Train [69][280/3239]	Time 0.258 (0.621)	Data Time 0.002 (0.176)	Loss 2.3341 (2.5579)	Entropy 0.61552 (0.61591)	Top-1 acc 66.016 (62.538)	Top-5 acc 89.062 (83.059)	lr 0.00987
Train [69][290/3239]	Time 0.284 (0.616)	Data Time 0.003 (0.171)	Loss 2.5286 (2.5577)	Entropy 0.61561 (0.61590)	Top-1 acc 59.766 (62.496)	Top-5 acc 81.641 (83.045)	lr 0.00987
Train [69][300/3239]	Time 0.250 (0.610)	Data Time 0.001 (0.165)	Loss 2.5062 (2.5561)	Entropy 0.61545 (0.61589)	Top-1 acc 61.719 (62.517)	Top-5 acc 85.547 (83.064)	lr 0.00987
Train [69][310/3239]	Time 0.231 (0.604)	Data Time 0.001 (0.160)	Loss 2.5464 (2.5577)	Entropy 0.61558 (0.61588)	Top-1 acc 62.500 (62.480)	Top-5 acc 84.375 (83.018)	lr 0.00987
Train [69][320/3239]	Time 1.326 (0.603)	Data Time 1.066 (0.158)	Loss 2.5474 (2.5561)	Entropy 0.61547 (0.61587)	Top-1 acc 62.109 (62.511)	Top-5 acc 83.594 (83.042)	lr 0.00987
Train [69][330/3239]	Time 0.249 (0.598)	Data Time 0.001 (0.153)	Loss 2.5542 (2.5548)	Entropy 0.61553 (0.61585)	Top-1 acc 63.672 (62.520)	Top-5 acc 83.984 (83.078)	lr 0.00987
Train [69][340/3239]	Time 0.332 (0.592)	Data Time 0.001 (0.149)	Loss 2.4849 (2.5531)	Entropy 0.61539 (0.61585)	Top-1 acc 64.062 (62.552)	Top-5 acc 86.719 (83.114)	lr 0.00987
Train [69][350/3239]	Time 0.276 (0.588)	Data Time 0.001 (0.145)	Loss 2.5206 (2.5547)	Entropy 0.61553 (0.61583)	Top-1 acc 62.109 (62.479)	Top-5 acc 85.547 (83.090)	lr 0.00987
Train [69][360/3239]	Time 0.245 (0.586)	Data Time 0.001 (0.143)	Loss 2.6940 (2.5558)	Entropy 0.61541 (0.61582)	Top-1 acc 62.500 (62.458)	Top-5 acc 79.297 (83.048)	lr 0.00987
Train [69][370/3239]	Time 0.251 (0.582)	Data Time 0.001 (0.139)	Loss 2.6011 (2.5565)	Entropy 0.61511 (0.61581)	Top-1 acc 61.719 (62.431)	Top-5 acc 79.297 (83.025)	lr 0.00986
Train [69][380/3239]	Time 0.249 (0.579)	Data Time 0.001 (0.136)	Loss 2.6283 (2.5595)	Entropy 0.61497 (0.61579)	Top-1 acc 62.891 (62.379)	Top-5 acc 81.641 (82.953)	lr 0.00986
Train [69][390/3239]	Time 0.304 (0.694)	Data Time 0.006 (0.138)	Loss 2.5917 (2.5589)	Entropy 0.61476 (0.61577)	Top-1 acc 63.281 (62.388)	Top-5 acc 82.031 (82.978)	lr 0.00986
Train [69][400/3239]	Time 0.248 (0.688)	Data Time 0.002 (0.135)	Loss 2.7370 (2.5605)	Entropy 0.61474 (0.61574)	Top-1 acc 57.031 (62.317)	Top-5 acc 79.297 (82.952)	lr 0.00986
Train [69][410/3239]	Time 0.345 (0.682)	Data Time 0.001 (0.132)	Loss 2.4861 (2.5594)	Entropy 0.61468 (0.61572)	Top-1 acc 66.406 (62.359)	Top-5 acc 83.984 (82.971)	lr 0.00986
Train [69][420/3239]	Time 0.243 (0.676)	Data Time 0.002 (0.129)	Loss 2.5533 (2.5615)	Entropy 0.61463 (0.61569)	Top-1 acc 62.891 (62.306)	Top-5 acc 83.594 (82.938)	lr 0.00986
Train [69][430/3239]	Time 0.263 (0.671)	Data Time 0.001 (0.126)	Loss 2.4566 (2.5619)	Entropy 0.61447 (0.61567)	Top-1 acc 63.672 (62.299)	Top-5 acc 85.547 (82.919)	lr 0.00986
Train [69][440/3239]	Time 0.243 (0.666)	Data Time 0.001 (0.123)	Loss 2.7041 (2.5638)	Entropy 0.61415 (0.61564)	Top-1 acc 58.594 (62.249)	Top-5 acc 79.688 (82.881)	lr 0.00986
Train [69][450/3239]	Time 0.238 (0.661)	Data Time 0.001 (0.120)	Loss 2.6514 (2.5645)	Entropy 0.61420 (0.61560)	Top-1 acc 60.938 (62.232)	Top-5 acc 83.203 (82.880)	lr 0.00986
Train [69][460/3239]	Time 0.251 (0.657)	Data Time 0.002 (0.118)	Loss 2.4072 (2.5629)	Entropy 0.61423 (0.61557)	Top-1 acc 67.188 (62.287)	Top-5 acc 85.547 (82.897)	lr 0.00986
Train [69][470/3239]	Time 0.226 (0.652)	Data Time 0.001 (0.115)	Loss 2.5211 (2.5630)	Entropy 0.61461 (0.61555)	Top-1 acc 61.719 (62.235)	Top-5 acc 82.812 (82.903)	lr 0.00985
Train [69][480/3239]	Time 0.237 (0.648)	Data Time 0.001 (0.113)	Loss 2.9034 (2.5657)	Entropy 0.61471 (0.61553)	Top-1 acc 54.297 (62.176)	Top-5 acc 74.219 (82.833)	lr 0.00985
Train [69][490/3239]	Time 0.303 (0.644)	Data Time 0.001 (0.111)	Loss 2.4521 (2.5657)	Entropy 0.61443 (0.61551)	Top-1 acc 60.938 (62.165)	Top-5 acc 85.156 (82.824)	lr 0.00985
Train [69][500/3239]	Time 0.437 (0.640)	Data Time 0.002 (0.108)	Loss 2.5824 (2.5647)	Entropy 0.61443 (0.61549)	Top-1 acc 58.984 (62.169)	Top-5 acc 82.422 (82.841)	lr 0.00985
Train [69][510/3239]	Time 0.296 (0.636)	Data Time 0.003 (0.106)	Loss 2.5691 (2.5644)	Entropy 0.61461 (0.61547)	Top-1 acc 60.938 (62.177)	Top-5 acc 83.203 (82.829)	lr 0.00985
Train [69][520/3239]	Time 0.255 (0.633)	Data Time 0.001 (0.104)	Loss 2.5902 (2.5646)	Entropy 0.61493 (0.61545)	Top-1 acc 62.891 (62.184)	Top-5 acc 80.078 (82.815)	lr 0.00985
Train [69][530/3239]	Time 0.244 (0.630)	Data Time 0.001 (0.102)	Loss 2.5382 (2.5643)	Entropy 0.61484 (0.61544)	Top-1 acc 63.281 (62.165)	Top-5 acc 82.812 (82.825)	lr 0.00985
Train [69][540/3239]	Time 0.282 (0.626)	Data Time 0.001 (0.100)	Loss 2.5184 (2.5644)	Entropy 0.61522 (0.61544)	Top-1 acc 64.453 (62.164)	Top-5 acc 84.766 (82.829)	lr 0.00985
Train [69][550/3239]	Time 0.281 (0.624)	Data Time 0.001 (0.100)	Loss 2.5098 (2.5643)	Entropy 0.61544 (0.61543)	Top-1 acc 66.016 (62.165)	Top-5 acc 84.766 (82.825)	lr 0.00985
Train [69][560/3239]	Time 0.268 (0.623)	Data Time 0.001 (0.101)	Loss 2.4941 (2.5643)	Entropy 0.61542 (0.61543)	Top-1 acc 64.844 (62.190)	Top-5 acc 82.812 (82.808)	lr 0.00985
Train [69][570/3239]	Time 0.353 (0.624)	Data Time 0.002 (0.103)	Loss 2.5669 (2.5650)	Entropy 0.61536 (0.61543)	Top-1 acc 63.672 (62.176)	Top-5 acc 82.031 (82.801)	lr 0.00984
Train [69][580/3239]	Time 1.437 (0.623)	Data Time 1.187 (0.104)	Loss 2.5314 (2.5656)	Entropy 0.61544 (0.61543)	Top-1 acc 59.766 (62.156)	Top-5 acc 82.812 (82.790)	lr 0.00984
Train [69][590/3239]	Time 0.258 (0.623)	Data Time 0.001 (0.105)	Loss 2.4608 (2.5664)	Entropy 0.61529 (0.61543)	Top-1 acc 63.281 (62.111)	Top-5 acc 82.031 (82.766)	lr 0.00984
Train [69][600/3239]	Time 0.274 (0.627)	Data Time 0.001 (0.110)	Loss 2.5240 (2.5671)	Entropy 0.61532 (0.61543)	Top-1 acc 62.500 (62.096)	Top-5 acc 82.422 (82.758)	lr 0.00984
Train [69][610/3239]	Time 0.224 (0.624)	Data Time 0.001 (0.109)	Loss 2.4318 (2.5670)	Entropy 0.61573 (0.61543)	Top-1 acc 64.453 (62.084)	Top-5 acc 83.203 (82.756)	lr 0.00984
Train [69][620/3239]	Time 0.249 (0.621)	Data Time 0.001 (0.107)	Loss 2.5347 (2.5672)	Entropy 0.61603 (0.61544)	Top-1 acc 63.281 (62.070)	Top-5 acc 82.031 (82.757)	lr 0.00984
Train [69][630/3239]	Time 5.433 (0.629)	Data Time 5.161 (0.116)	Loss 2.3838 (2.5675)	Entropy 0.61593 (0.61544)	Top-1 acc 66.016 (62.067)	Top-5 acc 82.031 (82.750)	lr 0.00984
Train [69][640/3239]	Time 0.241 (0.626)	Data Time 0.001 (0.115)	Loss 2.5318 (2.5665)	Entropy 0.61562 (0.61545)	Top-1 acc 62.891 (62.094)	Top-5 acc 82.422 (82.767)	lr 0.00984
Train [69][650/3239]	Time 0.227 (0.627)	Data Time 0.001 (0.117)	Loss 2.6900 (2.5655)	Entropy 0.61554 (0.61545)	Top-1 acc 57.812 (62.114)	Top-5 acc 80.469 (82.780)	lr 0.00984
Train [69][660/3239]	Time 0.277 (0.625)	Data Time 0.001 (0.116)	Loss 2.7341 (2.5658)	Entropy 0.61564 (0.61545)	Top-1 acc 54.297 (62.102)	Top-5 acc 76.953 (82.762)	lr 0.00984
Train [69][670/3239]	Time 0.239 (0.630)	Data Time 0.001 (0.122)	Loss 2.5903 (2.5656)	Entropy 0.61616 (0.61546)	Top-1 acc 61.719 (62.101)	Top-5 acc 80.859 (82.765)	lr 0.00983
Train [69][680/3239]	Time 0.231 (0.627)	Data Time 0.001 (0.121)	Loss 2.4562 (2.5653)	Entropy 0.61617 (0.61547)	Top-1 acc 62.500 (62.113)	Top-5 acc 83.594 (82.774)	lr 0.00983
Train [69][690/3239]	Time 0.288 (0.628)	Data Time 0.001 (0.122)	Loss 2.6064 (2.5650)	Entropy 0.61626 (0.61548)	Top-1 acc 60.156 (62.121)	Top-5 acc 82.031 (82.782)	lr 0.00983
Train [69][700/3239]	Time 0.247 (0.632)	Data Time 0.001 (0.127)	Loss 2.6177 (2.5654)	Entropy 0.61636 (0.61549)	Top-1 acc 58.203 (62.105)	Top-5 acc 81.641 (82.768)	lr 0.00983
Train [69][710/3239]	Time 0.242 (0.629)	Data Time 0.001 (0.125)	Loss 2.5279 (2.5655)	Entropy 0.61680 (0.61550)	Top-1 acc 64.453 (62.111)	Top-5 acc 84.766 (82.762)	lr 0.00983
Train [69][720/3239]	Time 2.418 (0.629)	Data Time 2.179 (0.126)	Loss 2.6025 (2.5657)	Entropy 0.61721 (0.61552)	Top-1 acc 62.109 (62.109)	Top-5 acc 83.594 (82.756)	lr 0.00983
Train [69][730/3239]	Time 0.362 (0.633)	Data Time 0.001 (0.131)	Loss 2.5110 (2.5662)	Entropy 0.61737 (0.61555)	Top-1 acc 61.328 (62.090)	Top-5 acc 84.375 (82.747)	lr 0.00983
Train [69][740/3239]	Time 0.244 (0.630)	Data Time 0.001 (0.129)	Loss 2.6644 (2.5664)	Entropy 0.61729 (0.61557)	Top-1 acc 59.766 (62.079)	Top-5 acc 78.906 (82.740)	lr 0.00983
Train [69][750/3239]	Time 0.255 (0.630)	Data Time 0.001 (0.130)	Loss 2.5028 (2.5660)	Entropy 0.61740 (0.61560)	Top-1 acc 65.234 (62.094)	Top-5 acc 82.812 (82.736)	lr 0.00983
Train [69][760/3239]	Time 0.263 (0.635)	Data Time 0.002 (0.136)	Loss 2.2972 (2.5654)	Entropy 0.61739 (0.61562)	Top-1 acc 66.016 (62.120)	Top-5 acc 89.453 (82.742)	lr 0.00983
Train [69][770/3239]	Time 0.243 (0.632)	Data Time 0.001 (0.135)	Loss 2.5879 (2.5658)	Entropy 0.61731 (0.61564)	Top-1 acc 58.984 (62.113)	Top-5 acc 82.422 (82.731)	lr 0.00983
Train [69][780/3239]	Time 0.253 (0.630)	Data Time 0.001 (0.133)	Loss 2.1654 (2.5658)	Entropy 0.61750 (0.61566)	Top-1 acc 74.609 (62.119)	Top-5 acc 88.672 (82.733)	lr 0.00982
Train [69][790/3239]	Time 3.681 (0.636)	Data Time 3.431 (0.140)	Loss 2.5346 (2.5664)	Entropy 0.61732 (0.61569)	Top-1 acc 62.500 (62.099)	Top-5 acc 83.203 (82.708)	lr 0.00982
Train [69][800/3239]	Time 0.335 (0.633)	Data Time 0.001 (0.138)	Loss 2.5420 (2.5663)	Entropy 0.61729 (0.61571)	Top-1 acc 63.281 (62.111)	Top-5 acc 83.984 (82.717)	lr 0.00982
Train [69][810/3239]	Time 0.240 (0.632)	Data Time 0.001 (0.138)	Loss 2.4598 (2.5660)	Entropy 0.61714 (0.61573)	Top-1 acc 65.234 (62.122)	Top-5 acc 85.938 (82.727)	lr 0.00982
Train [69][820/3239]	Time 0.233 (0.633)	Data Time 0.002 (0.140)	Loss 2.5384 (2.5654)	Entropy 0.61706 (0.61574)	Top-1 acc 62.500 (62.134)	Top-5 acc 83.203 (82.737)	lr 0.00982
Train [69][830/3239]	Time 0.227 (0.638)	Data Time 0.001 (0.145)	Loss 2.6035 (2.5656)	Entropy 0.61695 (0.61576)	Top-1 acc 61.328 (62.141)	Top-5 acc 81.641 (82.729)	lr 0.00982
Train [69][840/3239]	Time 0.290 (0.639)	Data Time 0.002 (0.147)	Loss 2.5095 (2.5665)	Entropy 0.61684 (0.61577)	Top-1 acc 64.062 (62.119)	Top-5 acc 82.812 (82.708)	lr 0.00982
Train [69][850/3239]	Time 0.256 (0.637)	Data Time 0.001 (0.145)	Loss 2.4404 (2.5655)	Entropy 0.61671 (0.61578)	Top-1 acc 60.547 (62.131)	Top-5 acc 87.891 (82.730)	lr 0.00982
Train [69][860/3239]	Time 0.278 (0.640)	Data Time 0.001 (0.150)	Loss 2.4842 (2.5653)	Entropy 0.61696 (0.61579)	Top-1 acc 64.453 (62.127)	Top-5 acc 82.812 (82.734)	lr 0.00982
Train [69][870/3239]	Time 0.233 (0.638)	Data Time 0.001 (0.148)	Loss 2.6524 (2.5658)	Entropy 0.61696 (0.61581)	Top-1 acc 60.156 (62.128)	Top-5 acc 82.812 (82.729)	lr 0.00982
Train [69][880/3239]	Time 0.262 (0.638)	Data Time 0.003 (0.149)	Loss 2.5924 (2.5665)	Entropy 0.61695 (0.61582)	Top-1 acc 61.328 (62.111)	Top-5 acc 81.250 (82.720)	lr 0.00981
Train [69][890/3239]	Time 0.326 (0.644)	Data Time 0.001 (0.155)	Loss 2.3293 (2.5663)	Entropy 0.61716 (0.61584)	Top-1 acc 69.141 (62.122)	Top-5 acc 86.719 (82.721)	lr 0.00981
Train [69][900/3239]	Time 0.242 (0.642)	Data Time 0.001 (0.153)	Loss 2.5968 (2.5665)	Entropy 0.61724 (0.61585)	Top-1 acc 63.281 (62.117)	Top-5 acc 83.984 (82.723)	lr 0.00981
Train [69][910/3239]	Time 0.247 (0.645)	Data Time 0.002 (0.158)	Loss 2.5064 (2.5665)	Entropy 0.61718 (0.61587)	Top-1 acc 62.500 (62.113)	Top-5 acc 82.812 (82.724)	lr 0.00981
Train [69][920/3239]	Time 0.251 (0.646)	Data Time 0.002 (0.159)	Loss 2.6587 (2.5665)	Entropy 0.61711 (0.61588)	Top-1 acc 56.641 (62.109)	Top-5 acc 82.812 (82.718)	lr 0.00981
Train [69][930/3239]	Time 0.239 (0.644)	Data Time 0.001 (0.158)	Loss 2.6752 (2.5664)	Entropy 0.61722 (0.61589)	Top-1 acc 57.812 (62.104)	Top-5 acc 79.688 (82.724)	lr 0.00981
Train [69][940/3239]	Time 0.498 (0.644)	Data Time 0.260 (0.158)	Loss 2.6828 (2.5661)	Entropy 0.61661 (0.61591)	Top-1 acc 58.984 (62.105)	Top-5 acc 82.031 (82.732)	lr 0.00981
Train [69][950/3239]	Time 9.776 (0.653)	Data Time 9.502 (0.169)	Loss 2.5968 (2.5660)	Entropy 0.61683 (0.61591)	Top-1 acc 61.719 (62.109)	Top-5 acc 79.688 (82.741)	lr 0.00981
Train [69][960/3239]	Time 0.358 (0.651)	Data Time 0.001 (0.167)	Loss 2.5457 (2.5659)	Entropy 0.61665 (0.61592)	Top-1 acc 58.984 (62.107)	Top-5 acc 82.031 (82.744)	lr 0.00981
Train [69][970/3239]	Time 0.246 (0.649)	Data Time 0.001 (0.165)	Loss 2.4897 (2.5656)	Entropy 0.61665 (0.61593)	Top-1 acc 62.891 (62.105)	Top-5 acc 83.203 (82.753)	lr 0.00981
Train [69][980/3239]	Time 0.232 (0.650)	Data Time 0.001 (0.167)	Loss 2.5001 (2.5662)	Entropy 0.61687 (0.61594)	Top-1 acc 62.891 (62.089)	Top-5 acc 83.594 (82.748)	lr 0.00980
Train [69][990/3239]	Time 0.235 (0.656)	Data Time 0.001 (0.173)	Loss 2.7733 (2.5669)	Entropy 0.61712 (0.61595)	Top-1 acc 59.375 (62.084)	Top-5 acc 78.125 (82.731)	lr 0.00980
Train [69][1000/3239]	Time 0.228 (0.653)	Data Time 0.001 (0.172)	Loss 2.5380 (2.5669)	Entropy 0.61722 (0.61596)	Top-1 acc 62.109 (62.091)	Top-5 acc 85.547 (82.732)	lr 0.00980
Train [69][1010/3239]	Time 0.233 (0.652)	Data Time 0.001 (0.171)	Loss 2.5815 (2.5670)	Entropy 0.61737 (0.61597)	Top-1 acc 62.109 (62.087)	Top-5 acc 82.812 (82.732)	lr 0.00980
Train [69][1020/3239]	Time 0.229 (0.660)	Data Time 0.001 (0.179)	Loss 2.4871 (2.5668)	Entropy 0.61759 (0.61599)	Top-1 acc 64.062 (62.090)	Top-5 acc 83.203 (82.736)	lr 0.00980
Train [69][1030/3239]	Time 0.258 (0.657)	Data Time 0.001 (0.178)	Loss 2.6175 (2.5674)	Entropy 0.61776 (0.61600)	Top-1 acc 58.203 (62.072)	Top-5 acc 81.250 (82.720)	lr 0.00980
Train [69][1040/3239]	Time 0.315 (0.699)	Data Time 0.004 (0.176)	Loss 2.6484 (2.5677)	Entropy 0.61769 (0.61602)	Top-1 acc 61.328 (62.060)	Top-5 acc 78.125 (82.713)	lr 0.00980
Train [69][1050/3239]	Time 0.322 (0.696)	Data Time 0.002 (0.174)	Loss 2.4423 (2.5677)	Entropy 0.61800 (0.61604)	Top-1 acc 64.453 (62.047)	Top-5 acc 85.938 (82.716)	lr 0.00980
Train [69][1060/3239]	Time 0.223 (0.693)	Data Time 0.001 (0.173)	Loss 2.7590 (2.5679)	Entropy 0.61817 (0.61606)	Top-1 acc 59.766 (62.040)	Top-5 acc 76.562 (82.702)	lr 0.00980
Train [69][1070/3239]	Time 0.235 (0.691)	Data Time 0.001 (0.171)	Loss 2.6813 (2.5679)	Entropy 0.61793 (0.61607)	Top-1 acc 58.203 (62.043)	Top-5 acc 78.125 (82.695)	lr 0.00980
Train [69][1080/3239]	Time 0.259 (0.688)	Data Time 0.001 (0.170)	Loss 2.6569 (2.5687)	Entropy 0.61812 (0.61609)	Top-1 acc 61.328 (62.031)	Top-5 acc 82.031 (82.678)	lr 0.00979
Train [69][1090/3239]	Time 0.245 (0.686)	Data Time 0.001 (0.168)	Loss 2.3821 (2.5691)	Entropy 0.61824 (0.61611)	Top-1 acc 66.406 (62.016)	Top-5 acc 86.328 (82.674)	lr 0.00979
Train [69][1100/3239]	Time 0.260 (0.684)	Data Time 0.001 (0.167)	Loss 2.7665 (2.5688)	Entropy 0.61821 (0.61613)	Top-1 acc 53.906 (62.013)	Top-5 acc 78.906 (82.681)	lr 0.00979
Train [69][1110/3239]	Time 0.251 (0.682)	Data Time 0.001 (0.165)	Loss 2.5711 (2.5685)	Entropy 0.61839 (0.61615)	Top-1 acc 63.281 (62.016)	Top-5 acc 82.812 (82.686)	lr 0.00979
Train [69][1120/3239]	Time 0.445 (0.680)	Data Time 0.003 (0.164)	Loss 2.7843 (2.5686)	Entropy 0.61865 (0.61617)	Top-1 acc 57.422 (62.017)	Top-5 acc 78.906 (82.679)	lr 0.00979
Train [69][1130/3239]	Time 0.248 (0.678)	Data Time 0.001 (0.162)	Loss 2.6940 (2.5691)	Entropy 0.61883 (0.61619)	Top-1 acc 63.672 (62.010)	Top-5 acc 79.688 (82.668)	lr 0.00979
Train [69][1140/3239]	Time 0.230 (0.678)	Data Time 0.001 (0.163)	Loss 2.5303 (2.5695)	Entropy 0.61864 (0.61622)	Top-1 acc 62.109 (61.996)	Top-5 acc 84.766 (82.662)	lr 0.00979
Train [69][1150/3239]	Time 0.251 (0.679)	Data Time 0.001 (0.165)	Loss 2.6925 (2.5697)	Entropy 0.61892 (0.61624)	Top-1 acc 62.109 (61.996)	Top-5 acc 78.516 (82.657)	lr 0.00979
Train [69][1160/3239]	Time 0.277 (0.680)	Data Time 0.001 (0.167)	Loss 2.6592 (2.5705)	Entropy 0.61890 (0.61626)	Top-1 acc 60.547 (61.976)	Top-5 acc 79.688 (82.641)	lr 0.00979
Train [69][1170/3239]	Time 0.237 (0.679)	Data Time 0.001 (0.167)	Loss 2.8158 (2.5709)	Entropy 0.61916 (0.61628)	Top-1 acc 53.906 (61.969)	Top-5 acc 76.953 (82.632)	lr 0.00979
Train [69][1180/3239]	Time 0.287 (0.683)	Data Time 0.002 (0.172)	Loss 2.5161 (2.5713)	Entropy 0.61890 (0.61631)	Top-1 acc 64.453 (61.961)	Top-5 acc 83.984 (82.627)	lr 0.00978
Train [69][1190/3239]	Time 0.241 (0.681)	Data Time 0.001 (0.170)	Loss 2.7070 (2.5715)	Entropy 0.61867 (0.61633)	Top-1 acc 59.766 (61.959)	Top-5 acc 80.859 (82.625)	lr 0.00978
Train [69][1200/3239]	Time 3.307 (0.681)	Data Time 2.988 (0.171)	Loss 2.5263 (2.5717)	Entropy 0.61863 (0.61635)	Top-1 acc 63.672 (61.949)	Top-5 acc 83.594 (82.621)	lr 0.00978
Train [69][1210/3239]	Time 2.295 (0.684)	Data Time 1.940 (0.175)	Loss 2.4069 (2.5711)	Entropy 0.61847 (0.61637)	Top-1 acc 64.453 (61.956)	Top-5 acc 85.938 (82.631)	lr 0.00978
Train [69][1220/3239]	Time 0.249 (0.682)	Data Time 0.002 (0.173)	Loss 2.5428 (2.5715)	Entropy 0.61856 (0.61639)	Top-1 acc 61.719 (61.946)	Top-5 acc 86.328 (82.632)	lr 0.00978
Train [69][1230/3239]	Time 0.242 (0.680)	Data Time 0.001 (0.172)	Loss 2.3731 (2.5712)	Entropy 0.61867 (0.61640)	Top-1 acc 66.016 (61.958)	Top-5 acc 88.281 (82.638)	lr 0.00978
Train [69][1240/3239]	Time 0.238 (0.683)	Data Time 0.001 (0.176)	Loss 2.3841 (2.5710)	Entropy 0.61889 (0.61642)	Top-1 acc 66.406 (61.965)	Top-5 acc 87.500 (82.646)	lr 0.00978
Train [69][1250/3239]	Time 0.245 (0.684)	Data Time 0.001 (0.177)	Loss 2.4868 (2.5708)	Entropy 0.61858 (0.61644)	Top-1 acc 63.672 (61.965)	Top-5 acc 85.547 (82.648)	lr 0.00978
Train [69][1260/3239]	Time 0.228 (0.682)	Data Time 0.001 (0.176)	Loss 2.2779 (2.5711)	Entropy 0.61871 (0.61646)	Top-1 acc 70.703 (61.964)	Top-5 acc 86.719 (82.634)	lr 0.00978
Train [69][1270/3239]	Time 0.234 (0.684)	Data Time 0.001 (0.178)	Loss 2.4931 (2.5708)	Entropy 0.61883 (0.61648)	Top-1 acc 62.891 (61.977)	Top-5 acc 84.375 (82.632)	lr 0.00978
Train [69][1280/3239]	Time 0.427 (0.687)	Data Time 0.001 (0.182)	Loss 2.7272 (2.5712)	Entropy 0.61896 (0.61650)	Top-1 acc 60.547 (61.970)	Top-5 acc 83.203 (82.632)	lr 0.00977
Train [69][1290/3239]	Time 0.250 (0.685)	Data Time 0.001 (0.180)	Loss 2.4923 (2.5709)	Entropy 0.61884 (0.61652)	Top-1 acc 66.016 (61.979)	Top-5 acc 82.812 (82.638)	lr 0.00977
Train [69][1300/3239]	Time 0.242 (0.686)	Data Time 0.001 (0.182)	Loss 2.4066 (2.5710)	Entropy 0.61905 (0.61653)	Top-1 acc 68.750 (61.988)	Top-5 acc 85.156 (82.632)	lr 0.00977
Train [69][1310/3239]	Time 0.226 (0.689)	Data Time 0.001 (0.185)	Loss 2.7352 (2.5706)	Entropy 0.61857 (0.61655)	Top-1 acc 56.641 (61.995)	Top-5 acc 78.516 (82.633)	lr 0.00977
Train [69][1320/3239]	Time 0.256 (0.687)	Data Time 0.001 (0.184)	Loss 2.6544 (2.5706)	Entropy 0.61870 (0.61657)	Top-1 acc 60.547 (62.002)	Top-5 acc 80.859 (82.634)	lr 0.00977
Train [69][1330/3239]	Time 0.254 (0.687)	Data Time 0.001 (0.185)	Loss 2.4184 (2.5703)	Entropy 0.61858 (0.61658)	Top-1 acc 66.406 (62.012)	Top-5 acc 84.375 (82.645)	lr 0.00977
Train [69][1340/3239]	Time 0.282 (0.690)	Data Time 0.001 (0.188)	Loss 2.4858 (2.5701)	Entropy 0.61849 (0.61660)	Top-1 acc 62.109 (62.016)	Top-5 acc 87.109 (82.647)	lr 0.00977
Train [69][1350/3239]	Time 0.237 (0.688)	Data Time 0.001 (0.187)	Loss 2.6569 (2.5699)	Entropy 0.61839 (0.61661)	Top-1 acc 60.547 (62.021)	Top-5 acc 82.422 (82.652)	lr 0.00977
Train [69][1360/3239]	Time 1.745 (0.687)	Data Time 1.496 (0.187)	Loss 2.7364 (2.5704)	Entropy 0.61807 (0.61662)	Top-1 acc 59.375 (62.005)	Top-5 acc 78.516 (82.641)	lr 0.00977
Train [69][1370/3239]	Time 0.251 (0.693)	Data Time 0.002 (0.193)	Loss 2.3624 (2.5700)	Entropy 0.61818 (0.61663)	Top-1 acc 67.578 (62.009)	Top-5 acc 86.719 (82.650)	lr 0.00977
Train [69][1380/3239]	Time 0.219 (0.691)	Data Time 0.001 (0.191)	Loss 2.4780 (2.5699)	Entropy 0.61819 (0.61665)	Top-1 acc 64.062 (62.004)	Top-5 acc 83.594 (82.654)	lr 0.00976
Train [69][1390/3239]	Time 0.234 (0.689)	Data Time 0.001 (0.190)	Loss 2.6679 (2.5702)	Entropy 0.61855 (0.61666)	Top-1 acc 59.375 (61.996)	Top-5 acc 79.297 (82.650)	lr 0.00976
Train [69][1400/3239]	Time 0.243 (0.692)	Data Time 0.001 (0.194)	Loss 2.4390 (2.5700)	Entropy 0.61877 (0.61667)	Top-1 acc 65.625 (62.002)	Top-5 acc 83.984 (82.653)	lr 0.00976
Train [69][1410/3239]	Time 0.219 (0.693)	Data Time 0.001 (0.196)	Loss 2.6289 (2.5699)	Entropy 0.61908 (0.61669)	Top-1 acc 60.156 (62.003)	Top-5 acc 82.422 (82.653)	lr 0.00976
Train [69][1420/3239]	Time 0.264 (0.691)	Data Time 0.001 (0.194)	Loss 2.5158 (2.5699)	Entropy 0.61898 (0.61670)	Top-1 acc 61.719 (62.004)	Top-5 acc 82.031 (82.649)	lr 0.00976
Train [69][1430/3239]	Time 0.252 (0.691)	Data Time 0.002 (0.195)	Loss 2.7204 (2.5697)	Entropy 0.61869 (0.61672)	Top-1 acc 59.375 (62.016)	Top-5 acc 78.125 (82.649)	lr 0.00976
Train [69][1440/3239]	Time 0.328 (0.697)	Data Time 0.001 (0.201)	Loss 2.5152 (2.5699)	Entropy 0.61876 (0.61673)	Top-1 acc 64.453 (62.011)	Top-5 acc 82.422 (82.641)	lr 0.00976
Train [69][1450/3239]	Time 0.266 (0.695)	Data Time 0.001 (0.200)	Loss 2.5409 (2.5701)	Entropy 0.61887 (0.61675)	Top-1 acc 61.328 (62.006)	Top-5 acc 82.812 (82.641)	lr 0.00976
Train [69][1460/3239]	Time 0.240 (0.694)	Data Time 0.001 (0.200)	Loss 2.7172 (2.5703)	Entropy 0.61914 (0.61676)	Top-1 acc 58.984 (61.998)	Top-5 acc 82.031 (82.637)	lr 0.00976
Train [69][1470/3239]	Time 0.251 (0.699)	Data Time 0.001 (0.205)	Loss 2.5798 (2.5702)	Entropy 0.61882 (0.61678)	Top-1 acc 64.062 (61.998)	Top-5 acc 82.031 (82.644)	lr 0.00976
Train [69][1480/3239]	Time 0.230 (0.697)	Data Time 0.001 (0.204)	Loss 2.4190 (2.5702)	Entropy 0.61867 (0.61679)	Top-1 acc 64.453 (61.994)	Top-5 acc 84.375 (82.636)	lr 0.00976
Train [69][1490/3239]	Time 0.239 (0.698)	Data Time 0.001 (0.205)	Loss 2.6101 (2.5700)	Entropy 0.61872 (0.61681)	Top-1 acc 60.156 (61.994)	Top-5 acc 80.078 (82.640)	lr 0.00975
Train [69][1500/3239]	Time 0.241 (0.699)	Data Time 0.001 (0.207)	Loss 2.5015 (2.5694)	Entropy 0.61870 (0.61682)	Top-1 acc 62.109 (62.003)	Top-5 acc 83.594 (82.653)	lr 0.00975
Train [69][1510/3239]	Time 0.323 (0.699)	Data Time 0.001 (0.207)	Loss 2.7240 (2.5698)	Entropy 0.61875 (0.61683)	Top-1 acc 59.766 (61.995)	Top-5 acc 78.906 (82.645)	lr 0.00975
Train [69][1520/3239]	Time 3.983 (0.699)	Data Time 3.727 (0.208)	Loss 2.3163 (2.5694)	Entropy 0.61850 (0.61684)	Top-1 acc 65.234 (62.004)	Top-5 acc 85.156 (82.650)	lr 0.00975
Train [69][1530/3239]	Time 0.238 (0.702)	Data Time 0.001 (0.211)	Loss 2.5121 (2.5693)	Entropy 0.61831 (0.61685)	Top-1 acc 66.406 (62.007)	Top-5 acc 83.203 (82.656)	lr 0.00975
Train [69][1540/3239]	Time 0.235 (0.702)	Data Time 0.001 (0.211)	Loss 2.5875 (2.5695)	Entropy 0.61834 (0.61686)	Top-1 acc 61.719 (62.006)	Top-5 acc 81.641 (82.652)	lr 0.00975
Train [69][1550/3239]	Time 0.250 (0.700)	Data Time 0.001 (0.210)	Loss 2.4029 (2.5695)	Entropy 0.61827 (0.61687)	Top-1 acc 65.234 (62.010)	Top-5 acc 83.984 (82.648)	lr 0.00975
Train [69][1560/3239]	Time 0.243 (0.706)	Data Time 0.001 (0.216)	Loss 2.4374 (2.5696)	Entropy 0.61856 (0.61688)	Top-1 acc 63.672 (62.001)	Top-5 acc 84.766 (82.647)	lr 0.00975
Train [69][1570/3239]	Time 0.231 (0.705)	Data Time 0.001 (0.216)	Loss 2.6702 (2.5694)	Entropy 0.61856 (0.61689)	Top-1 acc 60.938 (62.011)	Top-5 acc 79.688 (82.652)	lr 0.00975
Train [69][1580/3239]	Time 0.239 (0.704)	Data Time 0.001 (0.214)	Loss 2.5278 (2.5694)	Entropy 0.61866 (0.61690)	Top-1 acc 62.891 (62.004)	Top-5 acc 83.984 (82.650)	lr 0.00975
Train [69][1590/3239]	Time 0.246 (0.706)	Data Time 0.001 (0.217)	Loss 2.5242 (2.5693)	Entropy 0.61877 (0.61691)	Top-1 acc 60.156 (62.008)	Top-5 acc 85.156 (82.654)	lr 0.00974
Train [69][1600/3239]	Time 0.330 (0.709)	Data Time 0.001 (0.221)	Loss 2.6112 (2.5693)	Entropy 0.61887 (0.61692)	Top-1 acc 59.375 (62.009)	Top-5 acc 83.984 (82.654)	lr 0.00974
Train [69][1610/3239]	Time 0.240 (0.708)	Data Time 0.001 (0.220)	Loss 2.6621 (2.5696)	Entropy 0.61872 (0.61694)	Top-1 acc 57.812 (62.000)	Top-5 acc 82.422 (82.651)	lr 0.00974
Train [69][1620/3239]	Time 0.247 (0.710)	Data Time 0.001 (0.223)	Loss 2.3234 (2.5695)	Entropy 0.61864 (0.61695)	Top-1 acc 68.750 (61.999)	Top-5 acc 86.328 (82.652)	lr 0.00974
Train [69][1630/3239]	Time 0.234 (0.714)	Data Time 0.001 (0.227)	Loss 2.5729 (2.5693)	Entropy 0.61854 (0.61696)	Top-1 acc 66.016 (62.005)	Top-5 acc 83.203 (82.658)	lr 0.00974
Train [69][1640/3239]	Time 0.250 (0.712)	Data Time 0.001 (0.225)	Loss 2.4126 (2.5693)	Entropy 0.61846 (0.61697)	Top-1 acc 65.625 (62.013)	Top-5 acc 84.375 (82.656)	lr 0.00974
Train [69][1650/3239]	Time 0.232 (0.714)	Data Time 0.001 (0.227)	Loss 2.5576 (2.5695)	Entropy 0.61867 (0.61698)	Top-1 acc 58.203 (62.004)	Top-5 acc 82.031 (82.650)	lr 0.00974
Train [69][1660/3239]	Time 0.243 (0.720)	Data Time 0.001 (0.234)	Loss 2.5283 (2.5698)	Entropy 0.61871 (0.61699)	Top-1 acc 58.984 (61.997)	Top-5 acc 82.422 (82.644)	lr 0.00974
Train [69][1670/3239]	Time 0.326 (0.718)	Data Time 0.001 (0.233)	Loss 2.5632 (2.5694)	Entropy 0.61878 (0.61700)	Top-1 acc 58.984 (62.003)	Top-5 acc 83.594 (82.651)	lr 0.00974
Train [69][1680/3239]	Time 3.471 (0.718)	Data Time 3.211 (0.233)	Loss 2.7904 (2.5703)	Entropy 0.61818 (0.61701)	Top-1 acc 56.250 (61.982)	Top-5 acc 78.516 (82.641)	lr 0.00974
Train [69][1690/3239]	Time 0.240 (0.724)	Data Time 0.001 (0.239)	Loss 2.3865 (2.5699)	Entropy 0.61850 (0.61701)	Top-1 acc 66.016 (61.989)	Top-5 acc 87.109 (82.645)	lr 0.00973
Train [69][1700/3239]	Time 0.272 (0.749)	Data Time 0.004 (0.238)	Loss 2.6973 (2.5700)	Entropy 0.61820 (0.61702)	Top-1 acc 59.375 (61.986)	Top-5 acc 80.078 (82.642)	lr 0.00973
Train [69][1710/3239]	Time 0.237 (0.747)	Data Time 0.001 (0.236)	Loss 2.4480 (2.5698)	Entropy 0.61805 (0.61703)	Top-1 acc 66.797 (61.991)	Top-5 acc 83.594 (82.642)	lr 0.00973
Train [69][1720/3239]	Time 0.245 (0.745)	Data Time 0.002 (0.235)	Loss 2.7196 (2.5698)	Entropy 0.61792 (0.61703)	Top-1 acc 53.516 (61.988)	Top-5 acc 79.297 (82.638)	lr 0.00973
Train [69][1730/3239]	Time 0.256 (0.743)	Data Time 0.002 (0.234)	Loss 2.4840 (2.5700)	Entropy 0.61796 (0.61704)	Top-1 acc 62.109 (61.981)	Top-5 acc 82.031 (82.631)	lr 0.00973
Train [69][1740/3239]	Time 0.236 (0.741)	Data Time 0.001 (0.232)	Loss 2.2592 (2.5701)	Entropy 0.61821 (0.61705)	Top-1 acc 70.312 (61.979)	Top-5 acc 88.672 (82.632)	lr 0.00973
Train [69][1750/3239]	Time 0.244 (0.739)	Data Time 0.001 (0.231)	Loss 2.6925 (2.5704)	Entropy 0.61815 (0.61705)	Top-1 acc 56.250 (61.973)	Top-5 acc 81.250 (82.628)	lr 0.00973
Train [69][1760/3239]	Time 0.399 (0.741)	Data Time 0.001 (0.233)	Loss 2.7750 (2.5706)	Entropy 0.61844 (0.61706)	Top-1 acc 58.203 (61.973)	Top-5 acc 79.688 (82.627)	lr 0.00973
Train [69][1770/3239]	Time 0.230 (0.739)	Data Time 0.001 (0.232)	Loss 2.3432 (2.5706)	Entropy 0.61843 (0.61707)	Top-1 acc 69.531 (61.966)	Top-5 acc 88.281 (82.629)	lr 0.00973
Train [69][1780/3239]	Time 0.260 (0.738)	Data Time 0.001 (0.231)	Loss 2.5400 (2.5706)	Entropy 0.61857 (0.61707)	Top-1 acc 62.109 (61.967)	Top-5 acc 83.203 (82.628)	lr 0.00973
Train [69][1790/3239]	Time 0.229 (0.737)	Data Time 0.001 (0.230)	Loss 2.5615 (2.5706)	Entropy 0.61855 (0.61708)	Top-1 acc 63.672 (61.970)	Top-5 acc 82.812 (82.628)	lr 0.00972
Train [69][1800/3239]	Time 0.235 (0.745)	Data Time 0.001 (0.239)	Loss 2.6028 (2.5707)	Entropy 0.61866 (0.61709)	Top-1 acc 59.766 (61.970)	Top-5 acc 82.812 (82.630)	lr 0.00972
Train [69][1810/3239]	Time 0.302 (0.745)	Data Time 0.002 (0.240)	Loss 2.5192 (2.5704)	Entropy 0.61867 (0.61710)	Top-1 acc 59.375 (61.973)	Top-5 acc 85.938 (82.638)	lr 0.00972
Train [69][1820/3239]	Time 0.230 (0.744)	Data Time 0.001 (0.238)	Loss 2.7647 (2.5707)	Entropy 0.61906 (0.61711)	Top-1 acc 56.641 (61.968)	Top-5 acc 79.297 (82.630)	lr 0.00972
Train [69][1830/3239]	Time 0.386 (0.751)	Data Time 0.001 (0.246)	Loss 2.4382 (2.5708)	Entropy 0.61891 (0.61712)	Top-1 acc 64.453 (61.957)	Top-5 acc 84.375 (82.631)	lr 0.00972
Train [69][1840/3239]	Time 0.234 (0.751)	Data Time 0.001 (0.247)	Loss 2.6025 (2.5708)	Entropy 0.61905 (0.61713)	Top-1 acc 63.672 (61.959)	Top-5 acc 83.203 (82.633)	lr 0.00972
Train [69][1850/3239]	Time 0.231 (0.750)	Data Time 0.001 (0.246)	Loss 2.5357 (2.5705)	Entropy 0.61913 (0.61714)	Top-1 acc 62.891 (61.968)	Top-5 acc 82.031 (82.637)	lr 0.00972
Train [69][1860/3239]	Time 0.247 (0.756)	Data Time 0.001 (0.253)	Loss 2.7340 (2.5706)	Entropy 0.61883 (0.61715)	Top-1 acc 56.250 (61.966)	Top-5 acc 81.250 (82.635)	lr 0.00972
Train [69][1870/3239]	Time 0.257 (0.755)	Data Time 0.001 (0.252)	Loss 2.3565 (2.5706)	Entropy 0.61874 (0.61716)	Top-1 acc 66.797 (61.967)	Top-5 acc 85.938 (82.635)	lr 0.00972
Train [69][1880/3239]	Time 0.247 (0.757)	Data Time 0.001 (0.254)	Loss 2.6785 (2.5704)	Entropy 0.61868 (0.61717)	Top-1 acc 59.375 (61.971)	Top-5 acc 79.688 (82.637)	lr 0.00972
Train [69][1890/3239]	Time 0.236 (0.760)	Data Time 0.001 (0.258)	Loss 2.5357 (2.5706)	Entropy 0.61891 (0.61718)	Top-1 acc 63.672 (61.969)	Top-5 acc 83.203 (82.632)	lr 0.00971
Train [69][1900/3239]	Time 0.229 (0.760)	Data Time 0.001 (0.259)	Loss 2.7850 (2.5711)	Entropy 0.61932 (0.61719)	Top-1 acc 59.375 (61.953)	Top-5 acc 76.953 (82.620)	lr 0.00971
Train [69][1910/3239]	Time 0.235 (0.763)	Data Time 0.001 (0.262)	Loss 2.6808 (2.5710)	Entropy 0.61926 (0.61720)	Top-1 acc 61.719 (61.955)	Top-5 acc 79.688 (82.620)	lr 0.00971
Train [69][1920/3239]	Time 0.361 (0.769)	Data Time 0.001 (0.268)	Loss 2.4965 (2.5711)	Entropy 0.61899 (0.61721)	Top-1 acc 63.281 (61.956)	Top-5 acc 87.500 (82.622)	lr 0.00971
Train [69][1930/3239]	Time 0.230 (0.767)	Data Time 0.001 (0.266)	Loss 2.4584 (2.5712)	Entropy 0.61903 (0.61722)	Top-1 acc 66.797 (61.954)	Top-5 acc 84.375 (82.622)	lr 0.00971
Train [69][1940/3239]	Time 0.257 (0.772)	Data Time 0.001 (0.272)	Loss 2.8074 (2.5716)	Entropy 0.61934 (0.61723)	Top-1 acc 58.984 (61.952)	Top-5 acc 79.297 (82.611)	lr 0.00971
Train [69][1950/3239]	Time 0.225 (0.770)	Data Time 0.001 (0.271)	Loss 2.4374 (2.5717)	Entropy 0.61955 (0.61724)	Top-1 acc 67.578 (61.952)	Top-5 acc 83.594 (82.608)	lr 0.00971
Train [69][1960/3239]	Time 0.251 (0.774)	Data Time 0.006 (0.275)	Loss 2.6291 (2.5716)	Entropy 0.61907 (0.61725)	Top-1 acc 58.984 (61.952)	Top-5 acc 82.812 (82.611)	lr 0.00971
Train [69][1970/3239]	Time 0.263 (0.779)	Data Time 0.001 (0.280)	Loss 2.3993 (2.5714)	Entropy 0.61908 (0.61726)	Top-1 acc 63.672 (61.956)	Top-5 acc 87.109 (82.613)	lr 0.00971
Train [69][1980/3239]	Time 0.236 (0.778)	Data Time 0.001 (0.279)	Loss 2.4224 (2.5715)	Entropy 0.61914 (0.61727)	Top-1 acc 65.234 (61.947)	Top-5 acc 85.938 (82.608)	lr 0.00971
Train [69][1990/3239]	Time 0.325 (0.781)	Data Time 0.001 (0.283)	Loss 2.4264 (2.5710)	Entropy 0.61915 (0.61728)	Top-1 acc 67.969 (61.961)	Top-5 acc 85.156 (82.618)	lr 0.00970
Train [69][2000/3239]	Time 0.242 (0.787)	Data Time 0.001 (0.289)	Loss 2.6932 (2.5713)	Entropy 0.61911 (0.61728)	Top-1 acc 61.328 (61.953)	Top-5 acc 77.344 (82.610)	lr 0.00970
Train [69][2010/3239]	Time 0.239 (0.785)	Data Time 0.001 (0.287)	Loss 2.5366 (2.5711)	Entropy 0.61959 (0.61729)	Top-1 acc 67.188 (61.951)	Top-5 acc 82.812 (82.616)	lr 0.00970
Train [69][2020/3239]	Time 0.238 (0.791)	Data Time 0.001 (0.294)	Loss 2.3799 (2.5709)	Entropy 0.61935 (0.61731)	Top-1 acc 67.188 (61.958)	Top-5 acc 84.766 (82.615)	lr 0.00970
Train [69][2030/3239]	Time 0.227 (0.790)	Data Time 0.001 (0.293)	Loss 2.5995 (2.5710)	Entropy 0.61898 (0.61732)	Top-1 acc 62.109 (61.958)	Top-5 acc 80.859 (82.611)	lr 0.00970
Train [69][2040/3239]	Time 0.239 (0.794)	Data Time 0.001 (0.298)	Loss 2.4506 (2.5712)	Entropy 0.61904 (0.61732)	Top-1 acc 65.625 (61.953)	Top-5 acc 82.422 (82.602)	lr 0.00970
Train [69][2050/3239]	Time 0.252 (0.799)	Data Time 0.001 (0.304)	Loss 2.5687 (2.5710)	Entropy 0.61913 (0.61733)	Top-1 acc 62.891 (61.958)	Top-5 acc 81.250 (82.601)	lr 0.00970
Train [69][2060/3239]	Time 0.318 (0.800)	Data Time 0.001 (0.305)	Loss 2.6502 (2.5710)	Entropy 0.61835 (0.61734)	Top-1 acc 61.719 (61.957)	Top-5 acc 80.078 (82.600)	lr 0.00970
Train [69][2070/3239]	Time 0.228 (0.805)	Data Time 0.001 (0.310)	Loss 2.6409 (2.5712)	Entropy 0.61792 (0.61734)	Top-1 acc 55.078 (61.952)	Top-5 acc 82.422 (82.599)	lr 0.00970
Train [69][2080/3239]	Time 0.228 (0.807)	Data Time 0.001 (0.313)	Loss 2.6020 (2.5710)	Entropy 0.61791 (0.61735)	Top-1 acc 64.062 (61.958)	Top-5 acc 82.031 (82.604)	lr 0.00970
Train [69][2090/3239]	Time 0.228 (0.807)	Data Time 0.001 (0.313)	Loss 2.5464 (2.5710)	Entropy 0.61769 (0.61735)	Top-1 acc 63.281 (61.961)	Top-5 acc 84.766 (82.602)	lr 0.00970
Train [69][2100/3239]	Time 0.227 (0.813)	Data Time 0.001 (0.319)	Loss 2.3877 (2.5711)	Entropy 0.61780 (0.61735)	Top-1 acc 69.141 (61.955)	Top-5 acc 88.281 (82.601)	lr 0.00969
Train [69][2110/3239]	Time 0.236 (0.811)	Data Time 0.001 (0.318)	Loss 2.5234 (2.5710)	Entropy 0.61804 (0.61735)	Top-1 acc 63.281 (61.962)	Top-5 acc 85.547 (82.602)	lr 0.00969
Train [69][2120/3239]	Time 4.274 (0.816)	Data Time 4.013 (0.323)	Loss 2.6286 (2.5710)	Entropy 0.61814 (0.61736)	Top-1 acc 68.359 (61.967)	Top-5 acc 82.812 (82.602)	lr 0.00969
Train [69][2130/3239]	Time 0.233 (0.822)	Data Time 0.001 (0.329)	Loss 2.5454 (2.5711)	Entropy 0.61827 (0.61736)	Top-1 acc 58.203 (61.962)	Top-5 acc 84.766 (82.601)	lr 0.00969
Train [69][2140/3239]	Time 0.244 (0.820)	Data Time 0.001 (0.328)	Loss 2.6437 (2.5712)	Entropy 0.61806 (0.61736)	Top-1 acc 60.938 (61.958)	Top-5 acc 81.250 (82.600)	lr 0.00969
Train [69][2150/3239]	Time 0.323 (0.823)	Data Time 0.001 (0.331)	Loss 2.4799 (2.5711)	Entropy 0.61780 (0.61737)	Top-1 acc 62.500 (61.958)	Top-5 acc 83.594 (82.597)	lr 0.00969
Train [69][2160/3239]	Time 0.240 (0.830)	Data Time 0.001 (0.338)	Loss 2.3218 (2.5709)	Entropy 0.61770 (0.61737)	Top-1 acc 70.312 (61.963)	Top-5 acc 87.500 (82.603)	lr 0.00969
Train [69][2170/3239]	Time 0.230 (0.828)	Data Time 0.001 (0.337)	Loss 2.7156 (2.5708)	Entropy 0.61787 (0.61737)	Top-1 acc 59.375 (61.966)	Top-5 acc 78.516 (82.604)	lr 0.00969
Train [69][2180/3239]	Time 0.227 (0.832)	Data Time 0.001 (0.341)	Loss 2.5759 (2.5708)	Entropy 0.61798 (0.61737)	Top-1 acc 63.281 (61.967)	Top-5 acc 82.422 (82.605)	lr 0.00969
Train [69][2190/3239]	Time 0.235 (0.833)	Data Time 0.001 (0.342)	Loss 2.5161 (2.5707)	Entropy 0.61826 (0.61738)	Top-1 acc 62.891 (61.970)	Top-5 acc 82.422 (82.606)	lr 0.00969
Train [69][2200/3239]	Time 0.241 (0.839)	Data Time 0.001 (0.348)	Loss 2.6017 (2.5706)	Entropy 0.61864 (0.61738)	Top-1 acc 58.594 (61.971)	Top-5 acc 82.422 (82.608)	lr 0.00968
Train [69][2210/3239]	Time 0.277 (0.839)	Data Time 0.001 (0.349)	Loss 2.5776 (2.5708)	Entropy 0.61872 (0.61739)	Top-1 acc 62.891 (61.968)	Top-5 acc 82.422 (82.602)	lr 0.00968
Train [69][2220/3239]	Time 1.334 (0.841)	Data Time 0.997 (0.351)	Loss 2.4639 (2.5708)	Entropy 0.61892 (0.61739)	Top-1 acc 64.453 (61.967)	Top-5 acc 83.203 (82.603)	lr 0.00968
Train [69][2230/3239]	Time 0.251 (0.844)	Data Time 0.001 (0.355)	Loss 2.7183 (2.5707)	Entropy 0.61910 (0.61740)	Top-1 acc 60.547 (61.969)	Top-5 acc 80.469 (82.605)	lr 0.00968
Train [69][2240/3239]	Time 0.261 (0.845)	Data Time 0.001 (0.356)	Loss 2.4874 (2.5706)	Entropy 0.61945 (0.61741)	Top-1 acc 66.406 (61.974)	Top-5 acc 84.375 (82.607)	lr 0.00968
Train [69][2250/3239]	Time 0.240 (0.848)	Data Time 0.001 (0.359)	Loss 2.4452 (2.5704)	Entropy 0.61945 (0.61742)	Top-1 acc 68.750 (61.976)	Top-5 acc 84.766 (82.608)	lr 0.00968
Train [69][2260/3239]	Time 0.250 (0.850)	Data Time 0.001 (0.362)	Loss 2.6496 (2.5704)	Entropy 0.61920 (0.61742)	Top-1 acc 60.547 (61.981)	Top-5 acc 78.906 (82.606)	lr 0.00968
Train [69][2270/3239]	Time 0.231 (0.848)	Data Time 0.001 (0.360)	Loss 2.5193 (2.5704)	Entropy 0.61918 (0.61743)	Top-1 acc 60.938 (61.977)	Top-5 acc 83.984 (82.605)	lr 0.00968
Train [69][2280/3239]	Time 4.269 (0.853)	Data Time 3.989 (0.366)	Loss 2.5244 (2.5702)	Entropy 0.61947 (0.61744)	Top-1 acc 61.328 (61.979)	Top-5 acc 85.156 (82.608)	lr 0.00968
Train [69][2290/3239]	Time 0.239 (0.858)	Data Time 0.001 (0.371)	Loss 2.4219 (2.5703)	Entropy 0.61919 (0.61745)	Top-1 acc 65.625 (61.979)	Top-5 acc 85.547 (82.606)	lr 0.00968
Train [69][2300/3239]	Time 0.241 (0.856)	Data Time 0.001 (0.369)	Loss 2.6737 (2.5705)	Entropy 0.61903 (0.61746)	Top-1 acc 56.250 (61.973)	Top-5 acc 82.422 (82.604)	lr 0.00967
Train [69][2310/3239]	Time 0.315 (0.859)	Data Time 0.001 (0.373)	Loss 2.7048 (2.5707)	Entropy 0.61913 (0.61746)	Top-1 acc 60.547 (61.976)	Top-5 acc 80.078 (82.599)	lr 0.00967
Train [69][2320/3239]	Time 0.240 (0.866)	Data Time 0.001 (0.379)	Loss 2.5685 (2.5706)	Entropy 0.61865 (0.61747)	Top-1 acc 62.109 (61.979)	Top-5 acc 82.812 (82.599)	lr 0.00967
Train [69][2330/3239]	Time 0.228 (0.864)	Data Time 0.001 (0.378)	Loss 2.7679 (2.5708)	Entropy 0.61859 (0.61747)	Top-1 acc 55.859 (61.976)	Top-5 acc 80.078 (82.595)	lr 0.00967
Train [69][2340/3239]	Time 0.238 (0.867)	Data Time 0.001 (0.381)	Loss 2.5803 (2.5707)	Entropy 0.61873 (0.61748)	Top-1 acc 61.328 (61.978)	Top-5 acc 83.203 (82.597)	lr 0.00967
Train [69][2350/3239]	Time 0.403 (0.887)	Data Time 0.042 (0.382)	Loss 2.6093 (2.5706)	Entropy 0.61873 (0.61748)	Top-1 acc 62.109 (61.975)	Top-5 acc 83.203 (82.601)	lr 0.00967
Train [69][2360/3239]	Time 0.257 (0.886)	Data Time 0.002 (0.381)	Loss 2.5142 (2.5707)	Entropy 0.61864 (0.61749)	Top-1 acc 64.062 (61.973)	Top-5 acc 83.203 (82.599)	lr 0.00967
Train [69][2370/3239]	Time 0.232 (0.884)	Data Time 0.001 (0.379)	Loss 2.6374 (2.5707)	Entropy 0.61871 (0.61750)	Top-1 acc 59.375 (61.968)	Top-5 acc 82.422 (82.598)	lr 0.00967
Train [69][2380/3239]	Time 0.331 (0.882)	Data Time 0.001 (0.378)	Loss 2.5331 (2.5707)	Entropy 0.61915 (0.61750)	Top-1 acc 63.672 (61.970)	Top-5 acc 84.766 (82.601)	lr 0.00967
Train [69][2390/3239]	Time 0.246 (0.880)	Data Time 0.001 (0.376)	Loss 2.6841 (2.5709)	Entropy 0.61937 (0.61751)	Top-1 acc 57.812 (61.964)	Top-5 acc 81.250 (82.596)	lr 0.00967
Train [69][2400/3239]	Time 0.253 (0.878)	Data Time 0.001 (0.374)	Loss 2.5964 (2.5709)	Entropy 0.61936 (0.61752)	Top-1 acc 60.156 (61.966)	Top-5 acc 83.594 (82.598)	lr 0.00966
Train [69][2410/3239]	Time 0.246 (0.877)	Data Time 0.001 (0.373)	Loss 2.6048 (2.5710)	Entropy 0.61975 (0.61752)	Top-1 acc 62.109 (61.962)	Top-5 acc 81.641 (82.598)	lr 0.00966
Train [69][2420/3239]	Time 0.765 (0.880)	Data Time 0.522 (0.378)	Loss 2.5172 (2.5710)	Entropy 0.61957 (0.61753)	Top-1 acc 64.062 (61.964)	Top-5 acc 85.156 (82.599)	lr 0.00966
Train [69][2430/3239]	Time 0.551 (0.880)	Data Time 0.267 (0.377)	Loss 2.7025 (2.5713)	Entropy 0.61924 (0.61754)	Top-1 acc 56.641 (61.956)	Top-5 acc 82.812 (82.596)	lr 0.00966
Train [69][2440/3239]	Time 0.240 (0.882)	Data Time 0.001 (0.380)	Loss 2.6494 (2.5716)	Entropy 0.61945 (0.61755)	Top-1 acc 59.766 (61.950)	Top-5 acc 81.250 (82.590)	lr 0.00966
Train [69][2450/3239]	Time 4.589 (0.888)	Data Time 4.326 (0.386)	Loss 2.4550 (2.5717)	Entropy 0.61928 (0.61756)	Top-1 acc 66.797 (61.949)	Top-5 acc 84.375 (82.586)	lr 0.00966
Train [69][2460/3239]	Time 0.241 (0.886)	Data Time 0.001 (0.384)	Loss 2.6573 (2.5718)	Entropy 0.61901 (0.61756)	Top-1 acc 62.109 (61.951)	Top-5 acc 78.125 (82.584)	lr 0.00966
Train [69][2470/3239]	Time 0.368 (0.889)	Data Time 0.001 (0.388)	Loss 2.4048 (2.5720)	Entropy 0.61917 (0.61757)	Top-1 acc 62.891 (61.942)	Top-5 acc 85.938 (82.579)	lr 0.00966
Train [69][2480/3239]	Time 0.238 (0.893)	Data Time 0.001 (0.392)	Loss 2.5660 (2.5717)	Entropy 0.61916 (0.61757)	Top-1 acc 60.938 (61.949)	Top-5 acc 83.203 (82.583)	lr 0.00966
Train [69][2490/3239]	Time 0.228 (0.892)	Data Time 0.001 (0.392)	Loss 2.8811 (2.5721)	Entropy 0.61927 (0.61758)	Top-1 acc 52.344 (61.942)	Top-5 acc 77.344 (82.574)	lr 0.00966
Train [69][2500/3239]	Time 0.236 (0.897)	Data Time 0.001 (0.397)	Loss 2.5945 (2.5720)	Entropy 0.61943 (0.61759)	Top-1 acc 59.766 (61.943)	Top-5 acc 80.469 (82.576)	lr 0.00965
Train [69][2510/3239]	Time 8.436 (0.898)	Data Time 8.176 (0.398)	Loss 2.5428 (2.5720)	Entropy 0.61973 (0.61760)	Top-1 acc 64.453 (61.937)	Top-5 acc 84.375 (82.578)	lr 0.00965
Train [69][2520/3239]	Time 0.264 (0.899)	Data Time 0.002 (0.399)	Loss 2.8934 (2.5721)	Entropy 0.61993 (0.61760)	Top-1 acc 52.734 (61.936)	Top-5 acc 76.172 (82.576)	lr 0.00965
Train [69][2530/3239]	Time 0.233 (0.902)	Data Time 0.001 (0.403)	Loss 2.5151 (2.5723)	Entropy 0.61997 (0.61761)	Top-1 acc 60.547 (61.935)	Top-5 acc 82.812 (82.572)	lr 0.00965
Train [69][2540/3239]	Time 0.350 (0.900)	Data Time 0.001 (0.401)	Loss 2.6445 (2.5722)	Entropy 0.61999 (0.61762)	Top-1 acc 58.203 (61.936)	Top-5 acc 82.031 (82.573)	lr 0.00965
Train [69][2550/3239]	Time 0.223 (0.905)	Data Time 0.001 (0.406)	Loss 2.6208 (2.5724)	Entropy 0.62025 (0.61763)	Top-1 acc 63.281 (61.935)	Top-5 acc 80.078 (82.570)	lr 0.00965
Train [69][2560/3239]	Time 11.604 (0.907)	Data Time 11.346 (0.409)	Loss 2.6319 (2.5725)	Entropy 0.62042 (0.61764)	Top-1 acc 59.375 (61.929)	Top-5 acc 82.031 (82.568)	lr 0.00965
Train [69][2570/3239]	Time 0.235 (0.906)	Data Time 0.001 (0.408)	Loss 2.3903 (2.5728)	Entropy 0.61992 (0.61765)	Top-1 acc 66.016 (61.926)	Top-5 acc 86.328 (82.561)	lr 0.00965
Train [69][2580/3239]	Time 0.253 (0.910)	Data Time 0.001 (0.412)	Loss 2.5630 (2.5730)	Entropy 0.61986 (0.61766)	Top-1 acc 64.453 (61.923)	Top-5 acc 80.859 (82.557)	lr 0.00965
Train [69][2590/3239]	Time 0.238 (0.908)	Data Time 0.001 (0.410)	Loss 2.5185 (2.5728)	Entropy 0.61982 (0.61767)	Top-1 acc 62.109 (61.927)	Top-5 acc 84.375 (82.561)	lr 0.00965
Train [69][2600/3239]	Time 0.237 (0.910)	Data Time 0.001 (0.413)	Loss 2.4898 (2.5726)	Entropy 0.61936 (0.61768)	Top-1 acc 63.672 (61.932)	Top-5 acc 82.031 (82.564)	lr 0.00964
Train [69][2610/3239]	Time 0.251 (0.916)	Data Time 0.001 (0.418)	Loss 2.6586 (2.5724)	Entropy 0.61977 (0.61769)	Top-1 acc 59.766 (61.938)	Top-5 acc 80.469 (82.567)	lr 0.00964
Train [69][2620/3239]	Time 0.241 (0.914)	Data Time 0.001 (0.417)	Loss 2.7785 (2.5722)	Entropy 0.61967 (0.61769)	Top-1 acc 57.812 (61.943)	Top-5 acc 77.734 (82.567)	lr 0.00964
Train [69][2630/3239]	Time 0.269 (0.917)	Data Time 0.001 (0.420)	Loss 2.5338 (2.5722)	Entropy 0.61969 (0.61770)	Top-1 acc 64.453 (61.946)	Top-5 acc 84.766 (82.569)	lr 0.00964
Train [69][2640/3239]	Time 0.235 (0.920)	Data Time 0.001 (0.424)	Loss 2.6110 (2.5722)	Entropy 0.61971 (0.61771)	Top-1 acc 62.891 (61.945)	Top-5 acc 81.641 (82.565)	lr 0.00964
Train [69][2650/3239]	Time 0.230 (0.919)	Data Time 0.001 (0.423)	Loss 2.6386 (2.5721)	Entropy 0.61951 (0.61772)	Top-1 acc 63.281 (61.944)	Top-5 acc 80.469 (82.567)	lr 0.00964
Train [69][2660/3239]	Time 0.237 (0.921)	Data Time 0.001 (0.426)	Loss 2.4826 (2.5720)	Entropy 0.61972 (0.61772)	Top-1 acc 64.844 (61.939)	Top-5 acc 83.594 (82.568)	lr 0.00964
Train [69][2670/3239]	Time 14.044 (0.926)	Data Time 13.791 (0.430)	Loss 2.5614 (2.5720)	Entropy 0.62001 (0.61773)	Top-1 acc 59.766 (61.940)	Top-5 acc 83.203 (82.570)	lr 0.00964
Train [69][2680/3239]	Time 0.238 (0.926)	Data Time 0.001 (0.430)	Loss 2.3719 (2.5721)	Entropy 0.61977 (0.61774)	Top-1 acc 66.406 (61.940)	Top-5 acc 86.328 (82.565)	lr 0.00964
Train [69][2690/3239]	Time 0.243 (0.927)	Data Time 0.001 (0.433)	Loss 2.8399 (2.5722)	Entropy 0.61971 (0.61775)	Top-1 acc 55.859 (61.943)	Top-5 acc 75.781 (82.563)	lr 0.00964
Train [69][2700/3239]	Time 0.325 (0.927)	Data Time 0.001 (0.432)	Loss 2.5846 (2.5720)	Entropy 0.61958 (0.61775)	Top-1 acc 62.500 (61.949)	Top-5 acc 82.422 (82.566)	lr 0.00963
Train [69][2710/3239]	Time 0.257 (0.930)	Data Time 0.001 (0.435)	Loss 2.6034 (2.5721)	Entropy 0.61989 (0.61776)	Top-1 acc 58.984 (61.945)	Top-5 acc 82.812 (82.564)	lr 0.00963
Train [69][2720/3239]	Time 5.029 (0.932)	Data Time 4.795 (0.437)	Loss 2.4431 (2.5720)	Entropy 0.62001 (0.61777)	Top-1 acc 67.188 (61.950)	Top-5 acc 84.766 (82.566)	lr 0.00963
Train [69][2730/3239]	Time 0.238 (0.930)	Data Time 0.001 (0.436)	Loss 2.4839 (2.5719)	Entropy 0.62007 (0.61778)	Top-1 acc 67.578 (61.950)	Top-5 acc 83.594 (82.568)	lr 0.00963
Train [69][2740/3239]	Time 0.291 (0.935)	Data Time 0.001 (0.442)	Loss 2.5325 (2.5721)	Entropy 0.62030 (0.61779)	Top-1 acc 65.234 (61.951)	Top-5 acc 85.156 (82.565)	lr 0.00963
Train [69][2750/3239]	Time 0.221 (0.934)	Data Time 0.001 (0.441)	Loss 2.6427 (2.5721)	Entropy 0.62050 (0.61780)	Top-1 acc 63.672 (61.950)	Top-5 acc 80.078 (82.565)	lr 0.00963
Train [69][2760/3239]	Time 0.245 (0.937)	Data Time 0.001 (0.444)	Loss 2.5205 (2.5722)	Entropy 0.62084 (0.61781)	Top-1 acc 60.938 (61.947)	Top-5 acc 82.812 (82.562)	lr 0.00963
Train [69][2770/3239]	Time 4.290 (0.942)	Data Time 3.911 (0.449)	Loss 2.4981 (2.5722)	Entropy 0.62109 (0.61782)	Top-1 acc 62.500 (61.947)	Top-5 acc 83.594 (82.560)	lr 0.00963
Train [69][2780/3239]	Time 0.239 (0.940)	Data Time 0.001 (0.448)	Loss 2.5427 (2.5723)	Entropy 0.62078 (0.61783)	Top-1 acc 62.891 (61.949)	Top-5 acc 81.641 (82.556)	lr 0.00963
Train [69][2790/3239]	Time 0.227 (0.943)	Data Time 0.001 (0.451)	Loss 2.6732 (2.5722)	Entropy 0.62098 (0.61784)	Top-1 acc 55.859 (61.948)	Top-5 acc 81.641 (82.558)	lr 0.00963
Train [69][2800/3239]	Time 0.233 (0.946)	Data Time 0.001 (0.454)	Loss 2.5945 (2.5723)	Entropy 0.62069 (0.61785)	Top-1 acc 59.375 (61.945)	Top-5 acc 80.859 (82.556)	lr 0.00963
Train [69][2810/3239]	Time 0.227 (0.946)	Data Time 0.001 (0.454)	Loss 2.7108 (2.5727)	Entropy 0.62027 (0.61786)	Top-1 acc 55.859 (61.936)	Top-5 acc 80.859 (82.551)	lr 0.00962
Train [69][2820/3239]	Time 0.229 (0.947)	Data Time 0.001 (0.456)	Loss 2.6953 (2.5728)	Entropy 0.62020 (0.61787)	Top-1 acc 57.031 (61.932)	Top-5 acc 79.688 (82.550)	lr 0.00962
Train [69][2830/3239]	Time 16.789 (0.951)	Data Time 16.502 (0.461)	Loss 2.5293 (2.5727)	Entropy 0.61985 (0.61788)	Top-1 acc 67.578 (61.937)	Top-5 acc 84.375 (82.552)	lr 0.00962
Train [69][2840/3239]	Time 0.231 (0.953)	Data Time 0.001 (0.462)	Loss 2.6425 (2.5725)	Entropy 0.62001 (0.61788)	Top-1 acc 58.594 (61.941)	Top-5 acc 80.859 (82.555)	lr 0.00962
Train [69][2850/3239]	Time 0.248 (0.954)	Data Time 0.001 (0.463)	Loss 2.6480 (2.5723)	Entropy 0.61988 (0.61789)	Top-1 acc 62.500 (61.951)	Top-5 acc 80.859 (82.556)	lr 0.00962
Train [69][2860/3239]	Time 0.332 (0.952)	Data Time 0.001 (0.462)	Loss 2.6570 (2.5723)	Entropy 0.62013 (0.61790)	Top-1 acc 58.984 (61.947)	Top-5 acc 83.984 (82.553)	lr 0.00962
Train [69][2870/3239]	Time 0.232 (0.958)	Data Time 0.001 (0.468)	Loss 2.7980 (2.5721)	Entropy 0.62050 (0.61791)	Top-1 acc 58.203 (61.953)	Top-5 acc 78.516 (82.558)	lr 0.00962
Train [69][2880/3239]	Time 7.846 (0.958)	Data Time 7.587 (0.469)	Loss 2.4262 (2.5722)	Entropy 0.62066 (0.61791)	Top-1 acc 62.109 (61.951)	Top-5 acc 86.719 (82.559)	lr 0.00962
Train [69][2890/3239]	Time 0.232 (0.957)	Data Time 0.001 (0.467)	Loss 2.6453 (2.5723)	Entropy 0.62074 (0.61792)	Top-1 acc 58.984 (61.944)	Top-5 acc 82.422 (82.557)	lr 0.00962
Train [69][2900/3239]	Time 0.243 (0.966)	Data Time 0.001 (0.477)	Loss 2.7020 (2.5726)	Entropy 0.62102 (0.61793)	Top-1 acc 55.859 (61.936)	Top-5 acc 80.859 (82.550)	lr 0.00962
Train [69][2910/3239]	Time 0.243 (0.964)	Data Time 0.001 (0.475)	Loss 2.6738 (2.5726)	Entropy 0.62119 (0.61795)	Top-1 acc 58.594 (61.939)	Top-5 acc 81.641 (82.550)	lr 0.00961
Train [69][2920/3239]	Time 0.224 (0.963)	Data Time 0.001 (0.474)	Loss 2.5393 (2.5728)	Entropy 0.62146 (0.61796)	Top-1 acc 63.672 (61.934)	Top-5 acc 81.641 (82.545)	lr 0.00961
Train [69][2930/3239]	Time 10.888 (0.972)	Data Time 10.538 (0.483)	Loss 2.6875 (2.5729)	Entropy 0.62129 (0.61797)	Top-1 acc 60.156 (61.933)	Top-5 acc 78.906 (82.546)	lr 0.00961
Train [69][2940/3239]	Time 0.244 (0.970)	Data Time 0.001 (0.482)	Loss 2.5243 (2.5728)	Entropy 0.62157 (0.61798)	Top-1 acc 64.062 (61.932)	Top-5 acc 83.203 (82.550)	lr 0.00961
Train [69][2950/3239]	Time 0.246 (0.969)	Data Time 0.001 (0.482)	Loss 2.6852 (2.5728)	Entropy 0.62157 (0.61799)	Top-1 acc 58.203 (61.926)	Top-5 acc 81.641 (82.550)	lr 0.00961
Train [69][2960/3239]	Time 0.225 (0.974)	Data Time 0.001 (0.486)	Loss 2.6208 (2.5729)	Entropy 0.62146 (0.61800)	Top-1 acc 60.156 (61.926)	Top-5 acc 80.078 (82.550)	lr 0.00961
Train [69][2970/3239]	Time 0.233 (0.975)	Data Time 0.001 (0.488)	Loss 2.4973 (2.5729)	Entropy 0.62147 (0.61802)	Top-1 acc 61.328 (61.927)	Top-5 acc 85.156 (82.550)	lr 0.00961
Train [69][2980/3239]	Time 0.243 (0.976)	Data Time 0.001 (0.489)	Loss 2.8921 (2.5730)	Entropy 0.62144 (0.61803)	Top-1 acc 53.516 (61.924)	Top-5 acc 76.172 (82.548)	lr 0.00961
Train [69][2990/3239]	Time 14.398 (0.978)	Data Time 14.146 (0.492)	Loss 2.6578 (2.5732)	Entropy 0.62164 (0.61804)	Top-1 acc 61.328 (61.918)	Top-5 acc 83.203 (82.549)	lr 0.00961
Train [69][3000/3239]	Time 0.231 (0.979)	Data Time 0.001 (0.492)	Loss 2.5567 (2.5734)	Entropy 0.62171 (0.61805)	Top-1 acc 60.938 (61.914)	Top-5 acc 81.250 (82.544)	lr 0.00961
Train [69][3010/3239]	Time 0.337 (0.992)	Data Time 0.002 (0.491)	Loss 2.4139 (2.5733)	Entropy 0.62127 (0.61806)	Top-1 acc 62.109 (61.916)	Top-5 acc 86.328 (82.547)	lr 0.00960
Train [69][3020/3239]	Time 0.349 (0.990)	Data Time 0.002 (0.489)	Loss 2.6581 (2.5732)	Entropy 0.62134 (0.61807)	Top-1 acc 57.422 (61.916)	Top-5 acc 80.859 (82.549)	lr 0.00960
Train [69][3030/3239]	Time 0.233 (0.989)	Data Time 0.001 (0.487)	Loss 2.7309 (2.5733)	Entropy 0.62128 (0.61808)	Top-1 acc 55.469 (61.914)	Top-5 acc 83.203 (82.549)	lr 0.00960
Train [69][3040/3239]	Time 2.924 (0.988)	Data Time 2.669 (0.487)	Loss 2.6655 (2.5732)	Entropy 0.62095 (0.61809)	Top-1 acc 59.766 (61.915)	Top-5 acc 81.641 (82.549)	lr 0.00960
Train [69][3050/3239]	Time 0.230 (0.986)	Data Time 0.001 (0.485)	Loss 2.6469 (2.5734)	Entropy 0.62134 (0.61810)	Top-1 acc 62.109 (61.910)	Top-5 acc 81.641 (82.546)	lr 0.00960
Train [69][3060/3239]	Time 0.246 (0.989)	Data Time 0.001 (0.489)	Loss 2.4168 (2.5735)	Entropy 0.62125 (0.61811)	Top-1 acc 64.453 (61.906)	Top-5 acc 85.547 (82.543)	lr 0.00960
Train [69][3070/3239]	Time 0.249 (0.988)	Data Time 0.001 (0.488)	Loss 2.8192 (2.5736)	Entropy 0.62102 (0.61812)	Top-1 acc 57.031 (61.903)	Top-5 acc 79.297 (82.543)	lr 0.00960
Train [69][3080/3239]	Time 0.268 (0.990)	Data Time 0.001 (0.490)	Loss 2.4885 (2.5737)	Entropy 0.62078 (0.61813)	Top-1 acc 67.188 (61.902)	Top-5 acc 81.641 (82.540)	lr 0.00960
Train [69][3090/3239]	Time 9.176 (0.994)	Data Time 8.757 (0.494)	Loss 2.6981 (2.5739)	Entropy 0.62105 (0.61814)	Top-1 acc 62.109 (61.897)	Top-5 acc 77.344 (82.537)	lr 0.00960
Train [69][3100/3239]	Time 0.247 (0.992)	Data Time 0.001 (0.493)	Loss 2.6051 (2.5738)	Entropy 0.62113 (0.61815)	Top-1 acc 58.594 (61.896)	Top-5 acc 79.688 (82.540)	lr 0.00960
Train [69][3110/3239]	Time 0.250 (0.994)	Data Time 0.001 (0.495)	Loss 2.4692 (2.5740)	Entropy 0.62132 (0.61816)	Top-1 acc 64.062 (61.885)	Top-5 acc 85.156 (82.538)	lr 0.00959
Train [69][3120/3239]	Time 0.272 (0.994)	Data Time 0.002 (0.495)	Loss 2.6546 (2.5743)	Entropy 0.62127 (0.61817)	Top-1 acc 57.812 (61.878)	Top-5 acc 81.250 (82.534)	lr 0.00959
Train [69][3130/3239]	Time 0.252 (0.996)	Data Time 0.001 (0.497)	Loss 2.5302 (2.5744)	Entropy 0.62126 (0.61818)	Top-1 acc 66.016 (61.876)	Top-5 acc 80.859 (82.531)	lr 0.00959
Train [69][3140/3239]	Time 0.228 (0.997)	Data Time 0.001 (0.499)	Loss 2.3682 (2.5744)	Entropy 0.62144 (0.61819)	Top-1 acc 66.797 (61.877)	Top-5 acc 84.766 (82.531)	lr 0.00959
Train [69][3150/3239]	Time 0.375 (0.996)	Data Time 0.145 (0.497)	Loss 2.4973 (2.5743)	Entropy 0.62091 (0.61820)	Top-1 acc 65.625 (61.877)	Top-5 acc 85.156 (82.534)	lr 0.00959
Train [69][3160/3239]	Time 0.238 (0.998)	Data Time 0.001 (0.500)	Loss 2.6120 (2.5743)	Entropy 0.62082 (0.61821)	Top-1 acc 61.719 (61.871)	Top-5 acc 82.031 (82.534)	lr 0.00959
Train [69][3170/3239]	Time 0.244 (1.000)	Data Time 0.001 (0.502)	Loss 2.4892 (2.5745)	Entropy 0.62082 (0.61822)	Top-1 acc 65.625 (61.867)	Top-5 acc 85.156 (82.531)	lr 0.00959
Train [69][3180/3239]	Time 0.359 (0.998)	Data Time 0.000 (0.500)	Loss 2.7199 (2.5746)	Entropy 0.62074 (0.61823)	Top-1 acc 57.812 (61.864)	Top-5 acc 82.031 (82.530)	lr 0.00959
Train [69][3190/3239]	Time 0.236 (1.002)	Data Time 0.000 (0.504)	Loss 2.4387 (2.5745)	Entropy 0.62064 (0.61823)	Top-1 acc 63.672 (61.865)	Top-5 acc 84.766 (82.532)	lr 0.00959
Train [69][3200/3239]	Time 8.116 (1.003)	Data Time 7.847 (0.506)	Loss 2.4893 (2.5744)	Entropy 0.62083 (0.61824)	Top-1 acc 61.328 (61.864)	Top-5 acc 89.062 (82.535)	lr 0.00959
Train [69][3210/3239]	Time 0.230 (1.001)	Data Time 0.000 (0.504)	Loss 2.8445 (2.5746)	Entropy 0.62063 (0.61825)	Top-1 acc 53.516 (61.859)	Top-5 acc 79.297 (82.533)	lr 0.00958
Train [69][3220/3239]	Time 2.298 (1.003)	Data Time 2.034 (0.506)	Loss 2.8659 (2.5747)	Entropy 0.62084 (0.61826)	Top-1 acc 55.078 (61.853)	Top-5 acc 77.344 (82.533)	lr 0.00958
Train [69][3230/3239]	Time 0.245 (1.001)	Data Time 0.000 (0.505)	Loss 2.6754 (2.5748)	Entropy 0.62091 (0.61826)	Top-1 acc 58.203 (61.848)	Top-5 acc 82.031 (82.533)	lr 0.00958
Train [69][3239/3239]	Time 0.994 (1.002)	Data Time 0.000 (0.505)	Loss 2.5586 (2.5749)	Entropy 0.62064 (0.61827)	Top-1 acc 64.198 (61.843)	Top-5 acc 81.481 (82.533)	lr 0.00958
==========Valid [69/120]	loss 1.357	top-1 acc 69.065 (69.065)	top-5 acc 88.344	Train top-1 61.843	top-5 82.533	Entropy 0.62064	Latency-None: 0.000ms	Flops: 539.00M
Train [70][0/3239]	Time 44.851 (44.851)	Data Time 42.248 (42.248)	Loss 2.4411 (2.4411)	Entropy 0.62063 (0.62063)	Top-1 acc 66.797 (66.797)	Top-5 acc 82.812 (82.812)	lr 0.00958
Train [70][10/3239]	Time 0.243 (4.563)	Data Time 0.001 (3.845)	Loss 2.5295 (2.5060)	Entropy 0.62091 (0.62070)	Top-1 acc 62.500 (64.631)	Top-5 acc 82.422 (83.736)	lr 0.00958
Train [70][20/3239]	Time 0.252 (2.602)	Data Time 0.001 (2.015)	Loss 2.6033 (2.5571)	Entropy 0.62093 (0.62079)	Top-1 acc 63.281 (63.095)	Top-5 acc 82.422 (82.868)	lr 0.00958
Train [70][30/3239]	Time 0.253 (1.903)	Data Time 0.001 (1.365)	Loss 2.4115 (2.5750)	Entropy 0.62070 (0.62082)	Top-1 acc 65.234 (62.261)	Top-5 acc 86.719 (82.699)	lr 0.00958
Train [70][40/3239]	Time 0.253 (1.643)	Data Time 0.001 (1.120)	Loss 2.4780 (2.5708)	Entropy 0.62072 (0.62079)	Top-1 acc 64.844 (62.462)	Top-5 acc 84.766 (82.812)	lr 0.00958
Train [70][50/3239]	Time 0.250 (1.406)	Data Time 0.002 (0.901)	Loss 2.7089 (2.5723)	Entropy 0.62078 (0.62077)	Top-1 acc 59.375 (62.224)	Top-5 acc 79.688 (82.698)	lr 0.00958
Train [70][60/3239]	Time 0.234 (1.246)	Data Time 0.001 (0.753)	Loss 2.5326 (2.5681)	Entropy 0.62108 (0.62079)	Top-1 acc 63.672 (62.372)	Top-5 acc 83.594 (82.800)	lr 0.00958
Train [70][70/3239]	Time 0.249 (1.193)	Data Time 0.001 (0.704)	Loss 2.3294 (2.5654)	Entropy 0.62060 (0.62080)	Top-1 acc 68.750 (62.467)	Top-5 acc 88.672 (82.763)	lr 0.00958
Train [70][80/3239]	Time 0.374 (1.121)	Data Time 0.001 (0.632)	Loss 2.4365 (2.5569)	Entropy 0.62043 (0.62077)	Top-1 acc 66.797 (62.563)	Top-5 acc 87.500 (82.967)	lr 0.00957
Train [70][90/3239]	Time 0.234 (1.048)	Data Time 0.001 (0.563)	Loss 2.6636 (2.5541)	Entropy 0.62063 (0.62073)	Top-1 acc 57.031 (62.466)	Top-5 acc 79.297 (83.010)	lr 0.00957
Train [70][100/3239]	Time 0.251 (1.023)	Data Time 0.001 (0.540)	Loss 2.4773 (2.5562)	Entropy 0.62045 (0.62072)	Top-1 acc 61.719 (62.427)	Top-5 acc 83.984 (82.932)	lr 0.00957
Train [70][110/3239]	Time 0.230 (0.987)	Data Time 0.001 (0.509)	Loss 2.6349 (2.5619)	Entropy 0.61997 (0.62069)	Top-1 acc 63.672 (62.310)	Top-5 acc 79.297 (82.820)	lr 0.00957
Train [70][120/3239]	Time 0.342 (0.941)	Data Time 0.003 (0.467)	Loss 2.7161 (2.5686)	Entropy 0.61967 (0.62062)	Top-1 acc 60.156 (62.174)	Top-5 acc 80.859 (82.658)	lr 0.00957
Train [70][130/3239]	Time 0.270 (0.926)	Data Time 0.002 (0.452)	Loss 2.5487 (2.5642)	Entropy 0.61921 (0.62052)	Top-1 acc 62.891 (62.321)	Top-5 acc 81.250 (82.729)	lr 0.00957
Train [70][140/3239]	Time 0.240 (0.922)	Data Time 0.001 (0.452)	Loss 2.8819 (2.5659)	Entropy 0.61943 (0.62044)	Top-1 acc 55.078 (62.265)	Top-5 acc 76.172 (82.704)	lr 0.00957
Train [70][150/3239]	Time 0.379 (0.894)	Data Time 0.001 (0.422)	Loss 2.3726 (2.5640)	Entropy 0.61968 (0.62038)	Top-1 acc 66.406 (62.285)	Top-5 acc 88.281 (82.766)	lr 0.00957
Train [70][160/3239]	Time 0.271 (0.865)	Data Time 0.001 (0.396)	Loss 2.5459 (2.5625)	Entropy 0.61977 (0.62033)	Top-1 acc 62.891 (62.320)	Top-5 acc 85.938 (82.800)	lr 0.00957
Train [70][170/3239]	Time 0.249 (0.847)	Data Time 0.001 (0.381)	Loss 2.8017 (2.5613)	Entropy 0.61973 (0.62030)	Top-1 acc 53.516 (62.329)	Top-5 acc 77.734 (82.851)	lr 0.00957
Train [70][180/3239]	Time 0.314 (0.827)	Data Time 0.001 (0.360)	Loss 2.6542 (2.5613)	Entropy 0.62001 (0.62027)	Top-1 acc 60.156 (62.308)	Top-5 acc 82.422 (82.877)	lr 0.00956
Train [70][190/3239]	Time 0.340 (0.808)	Data Time 0.003 (0.341)	Loss 2.5811 (2.5601)	Entropy 0.62040 (0.62026)	Top-1 acc 57.812 (62.320)	Top-5 acc 85.938 (82.927)	lr 0.00956
Train [70][200/3239]	Time 0.258 (0.791)	Data Time 0.001 (0.324)	Loss 2.8771 (2.5607)	Entropy 0.61997 (0.62026)	Top-1 acc 50.391 (62.284)	Top-5 acc 78.906 (82.956)	lr 0.00956
Train [70][210/3239]	Time 0.250 (0.775)	Data Time 0.002 (0.309)	Loss 2.6577 (2.5636)	Entropy 0.61993 (0.62025)	Top-1 acc 63.672 (62.193)	Top-5 acc 77.734 (82.898)	lr 0.00956
Train [70][220/3239]	Time 0.236 (0.761)	Data Time 0.001 (0.295)	Loss 2.4220 (2.5619)	Entropy 0.61994 (0.62023)	Top-1 acc 64.844 (62.274)	Top-5 acc 86.719 (82.940)	lr 0.00956
Train [70][230/3239]	Time 0.270 (0.747)	Data Time 0.001 (0.282)	Loss 2.5915 (2.5617)	Entropy 0.62031 (0.62023)	Top-1 acc 61.328 (62.246)	Top-5 acc 79.297 (82.936)	lr 0.00956
Train [70][240/3239]	Time 0.396 (0.736)	Data Time 0.001 (0.271)	Loss 2.4745 (2.5598)	Entropy 0.62005 (0.62023)	Top-1 acc 64.453 (62.255)	Top-5 acc 83.984 (82.973)	lr 0.00956
Train [70][250/3239]	Time 0.293 (0.724)	Data Time 0.002 (0.260)	Loss 2.5840 (2.5590)	Entropy 0.61986 (0.62021)	Top-1 acc 61.328 (62.335)	Top-5 acc 83.203 (82.965)	lr 0.00956
Train [70][260/3239]	Time 0.252 (0.713)	Data Time 0.001 (0.250)	Loss 2.5052 (2.5585)	Entropy 0.61994 (0.62020)	Top-1 acc 62.109 (62.323)	Top-5 acc 83.203 (82.964)	lr 0.00956
Train [70][270/3239]	Time 0.246 (0.704)	Data Time 0.001 (0.241)	Loss 2.3936 (2.5592)	Entropy 0.61988 (0.62018)	Top-1 acc 69.141 (62.359)	Top-5 acc 85.938 (82.965)	lr 0.00956
Train [70][280/3239]	Time 0.240 (0.694)	Data Time 0.001 (0.232)	Loss 2.3976 (2.5592)	Entropy 0.61998 (0.62017)	Top-1 acc 64.844 (62.361)	Top-5 acc 86.328 (82.979)	lr 0.00955
Train [70][290/3239]	Time 0.245 (0.685)	Data Time 0.001 (0.225)	Loss 2.5456 (2.5594)	Entropy 0.62010 (0.62017)	Top-1 acc 62.500 (62.381)	Top-5 acc 84.766 (82.964)	lr 0.00955
Train [70][300/3239]	Time 0.245 (0.677)	Data Time 0.001 (0.217)	Loss 2.6256 (2.5600)	Entropy 0.62006 (0.62017)	Top-1 acc 58.594 (62.357)	Top-5 acc 81.641 (82.945)	lr 0.00955
Train [70][310/3239]	Time 0.333 (0.670)	Data Time 0.001 (0.210)	Loss 2.7490 (2.5597)	Entropy 0.61996 (0.62016)	Top-1 acc 57.031 (62.363)	Top-5 acc 78.516 (82.966)	lr 0.00955
Train [70][320/3239]	Time 0.247 (0.663)	Data Time 0.001 (0.204)	Loss 2.7693 (2.5592)	Entropy 0.62020 (0.62016)	Top-1 acc 57.031 (62.364)	Top-5 acc 78.906 (82.965)	lr 0.00955
Train [70][330/3239]	Time 0.291 (0.656)	Data Time 0.001 (0.198)	Loss 2.5953 (2.5596)	Entropy 0.61998 (0.62016)	Top-1 acc 64.453 (62.350)	Top-5 acc 82.812 (82.947)	lr 0.00955
Train [70][340/3239]	Time 0.296 (0.650)	Data Time 0.002 (0.192)	Loss 2.5551 (2.5594)	Entropy 0.62013 (0.62016)	Top-1 acc 64.062 (62.356)	Top-5 acc 83.203 (82.947)	lr 0.00955
Train [70][350/3239]	Time 0.243 (0.644)	Data Time 0.001 (0.186)	Loss 2.5954 (2.5611)	Entropy 0.62037 (0.62016)	Top-1 acc 63.281 (62.325)	Top-5 acc 83.594 (82.913)	lr 0.00955
Train [70][360/3239]	Time 0.225 (0.639)	Data Time 0.001 (0.181)	Loss 2.5853 (2.5620)	Entropy 0.62049 (0.62016)	Top-1 acc 60.156 (62.266)	Top-5 acc 82.422 (82.886)	lr 0.00955
Train [70][370/3239]	Time 0.308 (0.634)	Data Time 0.028 (0.177)	Loss 2.5181 (2.5611)	Entropy 0.62053 (0.62017)	Top-1 acc 64.453 (62.272)	Top-5 acc 83.203 (82.891)	lr 0.00955
Train [70][380/3239]	Time 0.238 (0.629)	Data Time 0.001 (0.172)	Loss 2.5106 (2.5600)	Entropy 0.62017 (0.62018)	Top-1 acc 64.844 (62.280)	Top-5 acc 84.375 (82.908)	lr 0.00954
Train [70][390/3239]	Time 0.261 (0.623)	Data Time 0.001 (0.168)	Loss 2.5717 (2.5600)	Entropy 0.62011 (0.62018)	Top-1 acc 58.984 (62.268)	Top-5 acc 83.984 (82.893)	lr 0.00954
Train [70][400/3239]	Time 0.249 (0.618)	Data Time 0.001 (0.163)	Loss 2.5733 (2.5612)	Entropy 0.62002 (0.62017)	Top-1 acc 62.891 (62.252)	Top-5 acc 82.812 (82.871)	lr 0.00954
Train [70][410/3239]	Time 0.256 (0.613)	Data Time 0.001 (0.160)	Loss 2.4795 (2.5605)	Entropy 0.62005 (0.62017)	Top-1 acc 65.234 (62.266)	Top-5 acc 84.375 (82.907)	lr 0.00954
Train [70][420/3239]	Time 0.418 (0.717)	Data Time 0.006 (0.156)	Loss 2.4515 (2.5599)	Entropy 0.61989 (0.62017)	Top-1 acc 64.844 (62.303)	Top-5 acc 85.938 (82.909)	lr 0.00954
Train [70][430/3239]	Time 0.223 (0.713)	Data Time 0.002 (0.152)	Loss 2.8030 (2.5605)	Entropy 0.62003 (0.62016)	Top-1 acc 53.125 (62.269)	Top-5 acc 77.344 (82.909)	lr 0.00954
Train [70][440/3239]	Time 0.241 (0.706)	Data Time 0.001 (0.149)	Loss 2.6242 (2.5610)	Entropy 0.62041 (0.62016)	Top-1 acc 60.938 (62.253)	Top-5 acc 81.641 (82.892)	lr 0.00954
Train [70][450/3239]	Time 0.244 (0.700)	Data Time 0.002 (0.146)	Loss 2.5186 (2.5616)	Entropy 0.62053 (0.62017)	Top-1 acc 65.625 (62.229)	Top-5 acc 83.203 (82.892)	lr 0.00954
Train [70][460/3239]	Time 0.221 (0.693)	Data Time 0.001 (0.142)	Loss 2.6769 (2.5620)	Entropy 0.62045 (0.62017)	Top-1 acc 55.469 (62.209)	Top-5 acc 82.812 (82.897)	lr 0.00954
Train [70][470/3239]	Time 0.313 (0.687)	Data Time 0.001 (0.139)	Loss 2.7642 (2.5616)	Entropy 0.62015 (0.62018)	Top-1 acc 57.031 (62.198)	Top-5 acc 80.078 (82.898)	lr 0.00954
Train [70][480/3239]	Time 0.254 (0.682)	Data Time 0.001 (0.137)	Loss 2.5249 (2.5610)	Entropy 0.62010 (0.62018)	Top-1 acc 62.500 (62.227)	Top-5 acc 83.203 (82.903)	lr 0.00953
Train [70][490/3239]	Time 0.298 (0.678)	Data Time 0.002 (0.134)	Loss 2.6613 (2.5615)	Entropy 0.62034 (0.62018)	Top-1 acc 60.156 (62.229)	Top-5 acc 80.859 (82.894)	lr 0.00953
Train [70][500/3239]	Time 0.255 (0.673)	Data Time 0.001 (0.131)	Loss 2.5910 (2.5619)	Entropy 0.61998 (0.62018)	Top-1 acc 59.375 (62.213)	Top-5 acc 84.766 (82.891)	lr 0.00953
Train [70][510/3239]	Time 0.275 (0.669)	Data Time 0.001 (0.129)	Loss 2.4683 (2.5625)	Entropy 0.62021 (0.62018)	Top-1 acc 68.750 (62.203)	Top-5 acc 83.594 (82.887)	lr 0.00953
Train [70][520/3239]	Time 0.243 (0.665)	Data Time 0.001 (0.126)	Loss 2.5074 (2.5630)	Entropy 0.61932 (0.62017)	Top-1 acc 62.500 (62.169)	Top-5 acc 85.547 (82.880)	lr 0.00953
Train [70][530/3239]	Time 0.273 (0.662)	Data Time 0.002 (0.126)	Loss 2.6064 (2.5627)	Entropy 0.61935 (0.62016)	Top-1 acc 59.766 (62.188)	Top-5 acc 81.641 (82.898)	lr 0.00953
Train [70][540/3239]	Time 0.324 (0.659)	Data Time 0.004 (0.124)	Loss 2.6195 (2.5630)	Entropy 0.61975 (0.62015)	Top-1 acc 62.500 (62.200)	Top-5 acc 82.031 (82.901)	lr 0.00953
Train [70][550/3239]	Time 0.249 (0.662)	Data Time 0.001 (0.129)	Loss 2.5777 (2.5625)	Entropy 0.61917 (0.62013)	Top-1 acc 57.812 (62.199)	Top-5 acc 80.859 (82.901)	lr 0.00953
Train [70][560/3239]	Time 0.410 (0.663)	Data Time 0.001 (0.131)	Loss 2.4460 (2.5625)	Entropy 0.61918 (0.62012)	Top-1 acc 66.016 (62.200)	Top-5 acc 85.547 (82.903)	lr 0.00953
Train [70][570/3239]	Time 0.228 (0.659)	Data Time 0.002 (0.129)	Loss 2.6969 (2.5635)	Entropy 0.61932 (0.62010)	Top-1 acc 60.547 (62.187)	Top-5 acc 80.078 (82.877)	lr 0.00953
Train [70][580/3239]	Time 0.268 (0.657)	Data Time 0.001 (0.129)	Loss 2.5163 (2.5641)	Entropy 0.61957 (0.62009)	Top-1 acc 63.281 (62.169)	Top-5 acc 83.203 (82.870)	lr 0.00953
Train [70][590/3239]	Time 0.244 (0.658)	Data Time 0.002 (0.131)	Loss 2.5190 (2.5634)	Entropy 0.61975 (0.62008)	Top-1 acc 64.062 (62.193)	Top-5 acc 82.422 (82.884)	lr 0.00952
Train [70][600/3239]	Time 0.237 (0.659)	Data Time 0.001 (0.134)	Loss 2.7741 (2.5629)	Entropy 0.61985 (0.62008)	Top-1 acc 54.688 (62.200)	Top-5 acc 80.469 (82.890)	lr 0.00952
Train [70][610/3239]	Time 0.245 (0.656)	Data Time 0.001 (0.132)	Loss 2.5132 (2.5634)	Entropy 0.62030 (0.62007)	Top-1 acc 61.719 (62.194)	Top-5 acc 82.422 (82.884)	lr 0.00952
Train [70][620/3239]	Time 0.244 (0.656)	Data Time 0.001 (0.134)	Loss 2.9402 (2.5635)	Entropy 0.62001 (0.62007)	Top-1 acc 53.906 (62.189)	Top-5 acc 74.219 (82.880)	lr 0.00952
Train [70][630/3239]	Time 1.977 (0.663)	Data Time 1.623 (0.142)	Loss 2.7219 (2.5640)	Entropy 0.62039 (0.62007)	Top-1 acc 60.938 (62.185)	Top-5 acc 77.734 (82.869)	lr 0.00952
Train [70][640/3239]	Time 0.227 (0.659)	Data Time 0.001 (0.139)	Loss 2.6323 (2.5642)	Entropy 0.62051 (0.62008)	Top-1 acc 59.766 (62.175)	Top-5 acc 82.422 (82.872)	lr 0.00952
Train [70][650/3239]	Time 0.247 (0.655)	Data Time 0.001 (0.137)	Loss 2.3385 (2.5639)	Entropy 0.62073 (0.62009)	Top-1 acc 64.844 (62.179)	Top-5 acc 88.281 (82.898)	lr 0.00952
Train [70][660/3239]	Time 0.228 (0.662)	Data Time 0.001 (0.145)	Loss 2.7784 (2.5642)	Entropy 0.62103 (0.62010)	Top-1 acc 56.641 (62.160)	Top-5 acc 80.859 (82.889)	lr 0.00952
Train [70][670/3239]	Time 0.246 (0.663)	Data Time 0.001 (0.148)	Loss 2.5997 (2.5645)	Entropy 0.62070 (0.62011)	Top-1 acc 61.328 (62.148)	Top-5 acc 82.422 (82.896)	lr 0.00952
Train [70][680/3239]	Time 0.274 (0.661)	Data Time 0.001 (0.146)	Loss 2.6539 (2.5654)	Entropy 0.62099 (0.62012)	Top-1 acc 61.328 (62.116)	Top-5 acc 83.984 (82.888)	lr 0.00952
Train [70][690/3239]	Time 0.242 (0.660)	Data Time 0.001 (0.147)	Loss 2.6428 (2.5653)	Entropy 0.62109 (0.62013)	Top-1 acc 60.547 (62.127)	Top-5 acc 80.469 (82.883)	lr 0.00951
Train [70][700/3239]	Time 0.322 (0.665)	Data Time 0.001 (0.153)	Loss 2.3889 (2.5650)	Entropy 0.62137 (0.62015)	Top-1 acc 64.844 (62.113)	Top-5 acc 86.719 (82.892)	lr 0.00951
Train [70][710/3239]	Time 0.238 (0.662)	Data Time 0.001 (0.151)	Loss 2.7261 (2.5652)	Entropy 0.62137 (0.62017)	Top-1 acc 57.812 (62.113)	Top-5 acc 80.078 (82.887)	lr 0.00951
Train [70][720/3239]	Time 0.237 (0.659)	Data Time 0.001 (0.149)	Loss 2.5419 (2.5660)	Entropy 0.62138 (0.62018)	Top-1 acc 62.891 (62.086)	Top-5 acc 82.812 (82.874)	lr 0.00951
Train [70][730/3239]	Time 0.227 (0.663)	Data Time 0.001 (0.154)	Loss 2.8787 (2.5664)	Entropy 0.62143 (0.62020)	Top-1 acc 55.859 (62.084)	Top-5 acc 76.562 (82.865)	lr 0.00951
Train [70][740/3239]	Time 0.256 (0.661)	Data Time 0.001 (0.152)	Loss 2.6631 (2.5655)	Entropy 0.62142 (0.62022)	Top-1 acc 60.938 (62.106)	Top-5 acc 81.641 (82.877)	lr 0.00951
Train [70][750/3239]	Time 0.251 (0.658)	Data Time 0.001 (0.150)	Loss 2.8213 (2.5655)	Entropy 0.62171 (0.62023)	Top-1 acc 57.031 (62.105)	Top-5 acc 76.562 (82.883)	lr 0.00951
Train [70][760/3239]	Time 0.234 (0.663)	Data Time 0.001 (0.157)	Loss 2.6354 (2.5660)	Entropy 0.62181 (0.62025)	Top-1 acc 62.109 (62.095)	Top-5 acc 83.203 (82.869)	lr 0.00951
Train [70][770/3239]	Time 0.282 (0.660)	Data Time 0.001 (0.155)	Loss 2.4655 (2.5661)	Entropy 0.62112 (0.62027)	Top-1 acc 63.672 (62.089)	Top-5 acc 85.156 (82.865)	lr 0.00951
Train [70][780/3239]	Time 0.254 (0.662)	Data Time 0.001 (0.157)	Loss 2.6968 (2.5669)	Entropy 0.62084 (0.62028)	Top-1 acc 57.031 (62.079)	Top-5 acc 80.078 (82.850)	lr 0.00951
Train [70][790/3239]	Time 2.826 (0.665)	Data Time 2.488 (0.162)	Loss 2.6454 (2.5675)	Entropy 0.62041 (0.62029)	Top-1 acc 60.156 (62.060)	Top-5 acc 80.469 (82.835)	lr 0.00950
Train [70][800/3239]	Time 0.235 (0.662)	Data Time 0.001 (0.160)	Loss 2.4863 (2.5669)	Entropy 0.62022 (0.62028)	Top-1 acc 63.672 (62.075)	Top-5 acc 85.938 (82.838)	lr 0.00950
Train [70][810/3239]	Time 0.257 (0.659)	Data Time 0.001 (0.158)	Loss 2.7499 (2.5670)	Entropy 0.62018 (0.62028)	Top-1 acc 59.766 (62.078)	Top-5 acc 78.906 (82.840)	lr 0.00950
Train [70][820/3239]	Time 0.243 (0.663)	Data Time 0.001 (0.163)	Loss 2.3798 (2.5668)	Entropy 0.62036 (0.62028)	Top-1 acc 68.750 (62.088)	Top-5 acc 86.719 (82.834)	lr 0.00950
Train [70][830/3239]	Time 0.233 (0.665)	Data Time 0.001 (0.165)	Loss 2.6171 (2.5670)	Entropy 0.62043 (0.62028)	Top-1 acc 62.109 (62.086)	Top-5 acc 79.688 (82.825)	lr 0.00950
Train [70][840/3239]	Time 0.233 (0.662)	Data Time 0.001 (0.163)	Loss 2.6115 (2.5677)	Entropy 0.62077 (0.62029)	Top-1 acc 57.812 (62.080)	Top-5 acc 82.031 (82.809)	lr 0.00950
Train [70][850/3239]	Time 0.255 (0.665)	Data Time 0.001 (0.167)	Loss 2.6602 (2.5677)	Entropy 0.62066 (0.62029)	Top-1 acc 61.328 (62.092)	Top-5 acc 80.859 (82.805)	lr 0.00950
Train [70][860/3239]	Time 0.336 (0.665)	Data Time 0.001 (0.168)	Loss 2.4597 (2.5673)	Entropy 0.62037 (0.62030)	Top-1 acc 64.453 (62.102)	Top-5 acc 85.156 (82.814)	lr 0.00950
Train [70][870/3239]	Time 0.235 (0.663)	Data Time 0.001 (0.166)	Loss 2.5732 (2.5670)	Entropy 0.62024 (0.62030)	Top-1 acc 64.453 (62.101)	Top-5 acc 83.203 (82.818)	lr 0.00950
Train [70][880/3239]	Time 0.227 (0.664)	Data Time 0.001 (0.168)	Loss 2.5341 (2.5668)	Entropy 0.62018 (0.62030)	Top-1 acc 64.062 (62.096)	Top-5 acc 84.375 (82.816)	lr 0.00950
Train [70][890/3239]	Time 0.241 (0.665)	Data Time 0.001 (0.170)	Loss 2.5416 (2.5675)	Entropy 0.62044 (0.62030)	Top-1 acc 60.938 (62.084)	Top-5 acc 83.203 (82.805)	lr 0.00949
Train [70][900/3239]	Time 0.257 (0.662)	Data Time 0.001 (0.169)	Loss 2.2699 (2.5671)	Entropy 0.62054 (0.62030)	Top-1 acc 69.141 (62.083)	Top-5 acc 87.891 (82.813)	lr 0.00949
Train [70][910/3239]	Time 0.234 (0.664)	Data Time 0.001 (0.171)	Loss 2.6261 (2.5668)	Entropy 0.62030 (0.62030)	Top-1 acc 64.844 (62.081)	Top-5 acc 80.859 (82.818)	lr 0.00949
Train [70][920/3239]	Time 0.259 (0.666)	Data Time 0.001 (0.174)	Loss 2.9636 (2.5668)	Entropy 0.62022 (0.62030)	Top-1 acc 51.172 (62.092)	Top-5 acc 75.391 (82.813)	lr 0.00949
Train [70][930/3239]	Time 0.256 (0.664)	Data Time 0.001 (0.172)	Loss 2.4640 (2.5663)	Entropy 0.62038 (0.62030)	Top-1 acc 64.844 (62.102)	Top-5 acc 87.109 (82.828)	lr 0.00949
Train [70][940/3239]	Time 0.223 (0.665)	Data Time 0.001 (0.174)	Loss 2.6764 (2.5668)	Entropy 0.62069 (0.62030)	Top-1 acc 60.547 (62.087)	Top-5 acc 82.422 (82.823)	lr 0.00949
Train [70][950/3239]	Time 0.375 (0.668)	Data Time 0.001 (0.178)	Loss 2.6601 (2.5669)	Entropy 0.62075 (0.62030)	Top-1 acc 62.109 (62.094)	Top-5 acc 80.078 (82.815)	lr 0.00949
Train [70][960/3239]	Time 0.243 (0.665)	Data Time 0.001 (0.176)	Loss 2.6721 (2.5672)	Entropy 0.62006 (0.62031)	Top-1 acc 58.984 (62.087)	Top-5 acc 82.031 (82.816)	lr 0.00949
Train [70][970/3239]	Time 0.242 (0.663)	Data Time 0.001 (0.174)	Loss 2.4070 (2.5668)	Entropy 0.61951 (0.62030)	Top-1 acc 66.797 (62.093)	Top-5 acc 83.594 (82.819)	lr 0.00949
Train [70][980/3239]	Time 0.235 (0.669)	Data Time 0.001 (0.180)	Loss 2.5753 (2.5662)	Entropy 0.61950 (0.62030)	Top-1 acc 61.719 (62.103)	Top-5 acc 81.641 (82.817)	lr 0.00949
Train [70][990/3239]	Time 0.242 (0.666)	Data Time 0.001 (0.178)	Loss 2.4971 (2.5662)	Entropy 0.61976 (0.62029)	Top-1 acc 63.281 (62.102)	Top-5 acc 85.547 (82.823)	lr 0.00948
Train [70][1000/3239]	Time 0.233 (0.664)	Data Time 0.001 (0.176)	Loss 2.6994 (2.5660)	Entropy 0.61945 (0.62028)	Top-1 acc 60.156 (62.110)	Top-5 acc 81.250 (82.823)	lr 0.00948
Train [70][1010/3239]	Time 0.259 (0.669)	Data Time 0.001 (0.183)	Loss 2.5970 (2.5658)	Entropy 0.61916 (0.62027)	Top-1 acc 60.547 (62.114)	Top-5 acc 79.688 (82.820)	lr 0.00948
Train [70][1020/3239]	Time 0.371 (0.668)	Data Time 0.002 (0.181)	Loss 2.2395 (2.5652)	Entropy 0.61896 (0.62026)	Top-1 acc 70.703 (62.120)	Top-5 acc 87.109 (82.833)	lr 0.00948
Train [70][1030/3239]	Time 0.246 (0.667)	Data Time 0.001 (0.181)	Loss 2.3649 (2.5648)	Entropy 0.61886 (0.62025)	Top-1 acc 66.016 (62.128)	Top-5 acc 87.891 (82.845)	lr 0.00948
Train [70][1040/3239]	Time 0.235 (0.668)	Data Time 0.001 (0.183)	Loss 2.8324 (2.5641)	Entropy 0.61890 (0.62023)	Top-1 acc 54.688 (62.144)	Top-5 acc 77.344 (82.858)	lr 0.00948
Train [70][1050/3239]	Time 0.335 (0.668)	Data Time 0.002 (0.183)	Loss 2.4610 (2.5645)	Entropy 0.61866 (0.62022)	Top-1 acc 66.797 (62.137)	Top-5 acc 85.547 (82.844)	lr 0.00948
Train [70][1060/3239]	Time 0.285 (0.670)	Data Time 0.001 (0.186)	Loss 2.5096 (2.5647)	Entropy 0.61832 (0.62020)	Top-1 acc 64.453 (62.122)	Top-5 acc 85.547 (82.847)	lr 0.00948
Train [70][1070/3239]	Time 0.252 (0.672)	Data Time 0.001 (0.188)	Loss 2.2955 (2.5641)	Entropy 0.61864 (0.62019)	Top-1 acc 69.141 (62.145)	Top-5 acc 87.891 (82.863)	lr 0.00948
Train [70][1080/3239]	Time 0.293 (0.714)	Data Time 0.004 (0.188)	Loss 2.5657 (2.5646)	Entropy 0.61863 (0.62017)	Top-1 acc 62.500 (62.126)	Top-5 acc 82.422 (82.851)	lr 0.00948
Train [70][1090/3239]	Time 0.230 (0.711)	Data Time 0.001 (0.186)	Loss 2.5473 (2.5648)	Entropy 0.61887 (0.62016)	Top-1 acc 64.062 (62.126)	Top-5 acc 85.156 (82.855)	lr 0.00947
Train [70][1100/3239]	Time 0.256 (0.709)	Data Time 0.002 (0.185)	Loss 2.7442 (2.5650)	Entropy 0.61890 (0.62015)	Top-1 acc 56.250 (62.114)	Top-5 acc 81.641 (82.850)	lr 0.00947
Train [70][1110/3239]	Time 0.277 (0.706)	Data Time 0.002 (0.183)	Loss 2.5024 (2.5648)	Entropy 0.61876 (0.62014)	Top-1 acc 61.719 (62.113)	Top-5 acc 82.422 (82.855)	lr 0.00947
Train [70][1120/3239]	Time 0.253 (0.704)	Data Time 0.002 (0.181)	Loss 2.5285 (2.5649)	Entropy 0.61832 (0.62012)	Top-1 acc 61.328 (62.107)	Top-5 acc 82.812 (82.856)	lr 0.00947
Train [70][1130/3239]	Time 0.280 (0.701)	Data Time 0.001 (0.180)	Loss 2.4059 (2.5648)	Entropy 0.61834 (0.62011)	Top-1 acc 64.844 (62.117)	Top-5 acc 85.547 (82.860)	lr 0.00947
Train [70][1140/3239]	Time 0.244 (0.699)	Data Time 0.001 (0.178)	Loss 2.4118 (2.5644)	Entropy 0.61843 (0.62009)	Top-1 acc 62.500 (62.122)	Top-5 acc 85.547 (82.860)	lr 0.00947
Train [70][1150/3239]	Time 0.267 (0.697)	Data Time 0.001 (0.177)	Loss 2.3987 (2.5639)	Entropy 0.61844 (0.62008)	Top-1 acc 63.672 (62.137)	Top-5 acc 87.109 (82.874)	lr 0.00947
Train [70][1160/3239]	Time 0.233 (0.695)	Data Time 0.001 (0.175)	Loss 2.2899 (2.5640)	Entropy 0.61861 (0.62006)	Top-1 acc 70.703 (62.146)	Top-5 acc 85.547 (82.879)	lr 0.00947
Train [70][1170/3239]	Time 0.262 (0.693)	Data Time 0.001 (0.174)	Loss 2.5749 (2.5641)	Entropy 0.61850 (0.62005)	Top-1 acc 63.672 (62.144)	Top-5 acc 81.641 (82.869)	lr 0.00947
Train [70][1180/3239]	Time 0.333 (0.696)	Data Time 0.001 (0.177)	Loss 2.4292 (2.5640)	Entropy 0.61867 (0.62004)	Top-1 acc 65.625 (62.149)	Top-5 acc 82.422 (82.869)	lr 0.00947
Train [70][1190/3239]	Time 0.235 (0.695)	Data Time 0.001 (0.178)	Loss 2.4663 (2.5640)	Entropy 0.61809 (0.62003)	Top-1 acc 65.625 (62.150)	Top-5 acc 83.594 (82.864)	lr 0.00947
Train [70][1200/3239]	Time 0.268 (0.693)	Data Time 0.002 (0.176)	Loss 2.5803 (2.5639)	Entropy 0.61827 (0.62001)	Top-1 acc 62.500 (62.162)	Top-5 acc 82.031 (82.858)	lr 0.00946
Train [70][1210/3239]	Time 0.234 (0.698)	Data Time 0.001 (0.182)	Loss 2.4064 (2.5633)	Entropy 0.61819 (0.62000)	Top-1 acc 62.109 (62.180)	Top-5 acc 87.891 (82.871)	lr 0.00946
Train [70][1220/3239]	Time 0.240 (0.698)	Data Time 0.001 (0.183)	Loss 2.5003 (2.5636)	Entropy 0.61814 (0.61998)	Top-1 acc 61.719 (62.168)	Top-5 acc 83.984 (82.867)	lr 0.00946
Train [70][1230/3239]	Time 0.252 (0.696)	Data Time 0.001 (0.181)	Loss 2.4783 (2.5635)	Entropy 0.61758 (0.61996)	Top-1 acc 64.844 (62.168)	Top-5 acc 81.641 (82.859)	lr 0.00946
Train [70][1240/3239]	Time 0.248 (0.698)	Data Time 0.001 (0.184)	Loss 2.6593 (2.5638)	Entropy 0.61752 (0.61994)	Top-1 acc 55.859 (62.152)	Top-5 acc 80.859 (82.859)	lr 0.00946
Train [70][1250/3239]	Time 0.352 (0.699)	Data Time 0.001 (0.185)	Loss 2.6387 (2.5636)	Entropy 0.61790 (0.61993)	Top-1 acc 57.812 (62.151)	Top-5 acc 80.078 (82.864)	lr 0.00946
Train [70][1260/3239]	Time 0.239 (0.697)	Data Time 0.001 (0.184)	Loss 2.5001 (2.5637)	Entropy 0.61793 (0.61991)	Top-1 acc 65.234 (62.158)	Top-5 acc 84.766 (82.860)	lr 0.00946
Train [70][1270/3239]	Time 0.239 (0.702)	Data Time 0.001 (0.190)	Loss 2.4034 (2.5634)	Entropy 0.61802 (0.61989)	Top-1 acc 66.016 (62.168)	Top-5 acc 84.766 (82.860)	lr 0.00946
Train [70][1280/3239]	Time 0.245 (0.702)	Data Time 0.002 (0.191)	Loss 2.7142 (2.5631)	Entropy 0.61783 (0.61988)	Top-1 acc 58.984 (62.180)	Top-5 acc 80.859 (82.862)	lr 0.00946
Train [70][1290/3239]	Time 0.238 (0.700)	Data Time 0.001 (0.189)	Loss 2.4682 (2.5634)	Entropy 0.61776 (0.61986)	Top-1 acc 64.453 (62.173)	Top-5 acc 82.422 (82.852)	lr 0.00946
Train [70][1300/3239]	Time 7.609 (0.703)	Data Time 7.326 (0.193)	Loss 2.6736 (2.5640)	Entropy 0.61782 (0.61985)	Top-1 acc 59.375 (62.158)	Top-5 acc 80.469 (82.842)	lr 0.00945
Train [70][1310/3239]	Time 0.483 (0.702)	Data Time 0.234 (0.193)	Loss 2.3791 (2.5642)	Entropy 0.61799 (0.61983)	Top-1 acc 64.453 (62.149)	Top-5 acc 87.109 (82.841)	lr 0.00945
Train [70][1320/3239]	Time 0.272 (0.700)	Data Time 0.001 (0.191)	Loss 2.5998 (2.5641)	Entropy 0.61806 (0.61982)	Top-1 acc 60.938 (62.149)	Top-5 acc 81.641 (82.843)	lr 0.00945
Train [70][1330/3239]	Time 0.237 (0.698)	Data Time 0.001 (0.190)	Loss 2.5021 (2.5642)	Entropy 0.61834 (0.61980)	Top-1 acc 65.625 (62.147)	Top-5 acc 82.031 (82.842)	lr 0.00945
Train [70][1340/3239]	Time 0.346 (0.705)	Data Time 0.001 (0.196)	Loss 2.5180 (2.5642)	Entropy 0.61803 (0.61979)	Top-1 acc 59.766 (62.143)	Top-5 acc 83.594 (82.838)	lr 0.00945
Train [70][1350/3239]	Time 0.230 (0.702)	Data Time 0.001 (0.195)	Loss 2.5533 (2.5639)	Entropy 0.61802 (0.61978)	Top-1 acc 59.375 (62.147)	Top-5 acc 83.984 (82.848)	lr 0.00945
Train [70][1360/3239]	Time 0.247 (0.701)	Data Time 0.002 (0.195)	Loss 2.5654 (2.5637)	Entropy 0.61812 (0.61977)	Top-1 acc 57.422 (62.150)	Top-5 acc 83.594 (82.848)	lr 0.00945
Train [70][1370/3239]	Time 0.281 (0.706)	Data Time 0.001 (0.200)	Loss 2.5705 (2.5639)	Entropy 0.61818 (0.61975)	Top-1 acc 60.547 (62.147)	Top-5 acc 84.375 (82.843)	lr 0.00945
Train [70][1380/3239]	Time 0.245 (0.704)	Data Time 0.001 (0.198)	Loss 2.5050 (2.5638)	Entropy 0.61840 (0.61974)	Top-1 acc 63.672 (62.148)	Top-5 acc 83.203 (82.839)	lr 0.00945
Train [70][1390/3239]	Time 0.242 (0.704)	Data Time 0.002 (0.198)	Loss 2.4565 (2.5634)	Entropy 0.61832 (0.61973)	Top-1 acc 67.578 (62.149)	Top-5 acc 83.594 (82.848)	lr 0.00945
Train [70][1400/3239]	Time 0.246 (0.706)	Data Time 0.001 (0.201)	Loss 2.6414 (2.5637)	Entropy 0.61825 (0.61972)	Top-1 acc 58.594 (62.143)	Top-5 acc 82.031 (82.841)	lr 0.00944
Train [70][1410/3239]	Time 0.337 (0.705)	Data Time 0.001 (0.200)	Loss 2.6019 (2.5639)	Entropy 0.61814 (0.61971)	Top-1 acc 61.328 (62.139)	Top-5 acc 82.812 (82.841)	lr 0.00944
Train [70][1420/3239]	Time 0.241 (0.705)	Data Time 0.001 (0.201)	Loss 2.6059 (2.5639)	Entropy 0.61811 (0.61970)	Top-1 acc 62.500 (62.142)	Top-5 acc 82.422 (82.836)	lr 0.00944
Train [70][1430/3239]	Time 0.230 (0.707)	Data Time 0.001 (0.203)	Loss 2.6990 (2.5643)	Entropy 0.61806 (0.61969)	Top-1 acc 60.938 (62.133)	Top-5 acc 79.688 (82.828)	lr 0.00944
Train [70][1440/3239]	Time 0.225 (0.705)	Data Time 0.001 (0.202)	Loss 2.5742 (2.5643)	Entropy 0.61795 (0.61968)	Top-1 acc 61.719 (62.126)	Top-5 acc 82.422 (82.829)	lr 0.00944
Train [70][1450/3239]	Time 0.281 (0.706)	Data Time 0.001 (0.204)	Loss 2.4632 (2.5639)	Entropy 0.61785 (0.61967)	Top-1 acc 62.109 (62.137)	Top-5 acc 85.547 (82.831)	lr 0.00944
Train [70][1460/3239]	Time 7.834 (0.710)	Data Time 7.603 (0.208)	Loss 2.8076 (2.5643)	Entropy 0.61806 (0.61965)	Top-1 acc 58.594 (62.129)	Top-5 acc 79.297 (82.829)	lr 0.00944
Train [70][1470/3239]	Time 0.236 (0.708)	Data Time 0.001 (0.206)	Loss 2.4138 (2.5644)	Entropy 0.61830 (0.61964)	Top-1 acc 66.016 (62.128)	Top-5 acc 83.984 (82.824)	lr 0.00944
Train [70][1480/3239]	Time 2.146 (0.707)	Data Time 1.872 (0.206)	Loss 2.6966 (2.5645)	Entropy 0.61812 (0.61963)	Top-1 acc 61.328 (62.127)	Top-5 acc 79.297 (82.821)	lr 0.00944
Train [70][1490/3239]	Time 0.242 (0.705)	Data Time 0.001 (0.205)	Loss 2.7233 (2.5643)	Entropy 0.61831 (0.61962)	Top-1 acc 58.594 (62.126)	Top-5 acc 81.250 (82.825)	lr 0.00944
Train [70][1500/3239]	Time 0.351 (0.710)	Data Time 0.001 (0.210)	Loss 2.4943 (2.5643)	Entropy 0.61863 (0.61962)	Top-1 acc 63.281 (62.122)	Top-5 acc 83.984 (82.822)	lr 0.00943
Train [70][1510/3239]	Time 0.240 (0.708)	Data Time 0.002 (0.209)	Loss 2.5838 (2.5645)	Entropy 0.61812 (0.61961)	Top-1 acc 61.719 (62.120)	Top-5 acc 80.078 (82.816)	lr 0.00943
Train [70][1520/3239]	Time 0.224 (0.708)	Data Time 0.001 (0.209)	Loss 2.6127 (2.5648)	Entropy 0.61857 (0.61960)	Top-1 acc 62.891 (62.109)	Top-5 acc 79.297 (82.808)	lr 0.00943
Train [70][1530/3239]	Time 0.227 (0.712)	Data Time 0.001 (0.214)	Loss 2.6463 (2.5650)	Entropy 0.61864 (0.61959)	Top-1 acc 61.328 (62.104)	Top-5 acc 80.859 (82.796)	lr 0.00943
Train [70][1540/3239]	Time 0.238 (0.710)	Data Time 0.001 (0.212)	Loss 2.4993 (2.5647)	Entropy 0.61871 (0.61959)	Top-1 acc 64.453 (62.116)	Top-5 acc 83.984 (82.804)	lr 0.00943
Train [70][1550/3239]	Time 0.282 (0.711)	Data Time 0.023 (0.213)	Loss 2.5255 (2.5642)	Entropy 0.61863 (0.61958)	Top-1 acc 65.234 (62.133)	Top-5 acc 84.375 (82.814)	lr 0.00943
Train [70][1560/3239]	Time 0.241 (0.714)	Data Time 0.001 (0.217)	Loss 2.6624 (2.5641)	Entropy 0.61822 (0.61957)	Top-1 acc 58.203 (62.125)	Top-5 acc 80.859 (82.809)	lr 0.00943
Train [70][1570/3239]	Time 0.325 (0.712)	Data Time 0.001 (0.215)	Loss 2.4794 (2.5635)	Entropy 0.61824 (0.61956)	Top-1 acc 65.234 (62.143)	Top-5 acc 87.109 (82.818)	lr 0.00943
Train [70][1580/3239]	Time 0.244 (0.714)	Data Time 0.001 (0.218)	Loss 2.4494 (2.5636)	Entropy 0.61801 (0.61956)	Top-1 acc 64.844 (62.144)	Top-5 acc 84.375 (82.812)	lr 0.00943
Train [70][1590/3239]	Time 0.240 (0.717)	Data Time 0.001 (0.222)	Loss 2.3605 (2.5640)	Entropy 0.61827 (0.61955)	Top-1 acc 68.359 (62.130)	Top-5 acc 87.109 (82.808)	lr 0.00943
Train [70][1600/3239]	Time 0.238 (0.715)	Data Time 0.001 (0.221)	Loss 2.3268 (2.5641)	Entropy 0.61833 (0.61954)	Top-1 acc 65.625 (62.129)	Top-5 acc 87.109 (82.807)	lr 0.00943
Train [70][1610/3239]	Time 0.272 (0.717)	Data Time 0.001 (0.223)	Loss 2.5458 (2.5645)	Entropy 0.61849 (0.61953)	Top-1 acc 64.062 (62.127)	Top-5 acc 88.281 (82.805)	lr 0.00942
Train [70][1620/3239]	Time 6.686 (0.719)	Data Time 6.421 (0.225)	Loss 2.6321 (2.5646)	Entropy 0.61834 (0.61952)	Top-1 acc 60.547 (62.126)	Top-5 acc 82.812 (82.802)	lr 0.00942
Train [70][1630/3239]	Time 0.270 (0.717)	Data Time 0.001 (0.224)	Loss 2.5860 (2.5646)	Entropy 0.61827 (0.61952)	Top-1 acc 60.156 (62.126)	Top-5 acc 82.812 (82.805)	lr 0.00942
Train [70][1640/3239]	Time 3.978 (0.718)	Data Time 3.726 (0.225)	Loss 2.6097 (2.5648)	Entropy 0.61793 (0.61951)	Top-1 acc 62.109 (62.117)	Top-5 acc 83.594 (82.802)	lr 0.00942
Train [70][1650/3239]	Time 0.227 (0.716)	Data Time 0.001 (0.223)	Loss 2.4464 (2.5647)	Entropy 0.61804 (0.61950)	Top-1 acc 66.016 (62.114)	Top-5 acc 86.719 (82.806)	lr 0.00942
Train [70][1660/3239]	Time 0.273 (0.718)	Data Time 0.002 (0.226)	Loss 2.6091 (2.5648)	Entropy 0.61794 (0.61949)	Top-1 acc 63.672 (62.118)	Top-5 acc 81.641 (82.807)	lr 0.00942
Train [70][1670/3239]	Time 0.230 (0.716)	Data Time 0.001 (0.225)	Loss 2.5900 (2.5647)	Entropy 0.61773 (0.61948)	Top-1 acc 58.203 (62.119)	Top-5 acc 80.859 (82.802)	lr 0.00942
Train [70][1680/3239]	Time 0.275 (0.719)	Data Time 0.002 (0.228)	Loss 2.4505 (2.5647)	Entropy 0.61781 (0.61947)	Top-1 acc 64.844 (62.121)	Top-5 acc 84.375 (82.803)	lr 0.00942
Train [70][1690/3239]	Time 0.271 (0.720)	Data Time 0.002 (0.229)	Loss 2.6018 (2.5644)	Entropy 0.61733 (0.61946)	Top-1 acc 59.375 (62.126)	Top-5 acc 81.250 (82.806)	lr 0.00942
Train [70][1700/3239]	Time 0.251 (0.720)	Data Time 0.001 (0.229)	Loss 2.3889 (2.5642)	Entropy 0.61712 (0.61944)	Top-1 acc 64.062 (62.126)	Top-5 acc 83.984 (82.810)	lr 0.00942
Train [70][1710/3239]	Time 0.252 (0.724)	Data Time 0.001 (0.234)	Loss 2.1651 (2.5639)	Entropy 0.61716 (0.61943)	Top-1 acc 73.047 (62.136)	Top-5 acc 89.062 (82.812)	lr 0.00941
Train [70][1720/3239]	Time 0.241 (0.723)	Data Time 0.001 (0.233)	Loss 2.5164 (2.5642)	Entropy 0.61711 (0.61942)	Top-1 acc 60.547 (62.131)	Top-5 acc 83.984 (82.807)	lr 0.00941
Train [70][1730/3239]	Time 0.455 (0.748)	Data Time 0.004 (0.232)	Loss 2.6226 (2.5643)	Entropy 0.61710 (0.61940)	Top-1 acc 60.938 (62.132)	Top-5 acc 81.250 (82.805)	lr 0.00941
Train [70][1740/3239]	Time 0.238 (0.747)	Data Time 0.002 (0.231)	Loss 2.5778 (2.5645)	Entropy 0.61718 (0.61939)	Top-1 acc 59.375 (62.128)	Top-5 acc 81.641 (82.800)	lr 0.00941
Train [70][1750/3239]	Time 0.245 (0.745)	Data Time 0.001 (0.229)	Loss 2.7549 (2.5648)	Entropy 0.61718 (0.61938)	Top-1 acc 60.547 (62.121)	Top-5 acc 79.688 (82.793)	lr 0.00941
Train [70][1760/3239]	Time 0.254 (0.743)	Data Time 0.002 (0.228)	Loss 2.3516 (2.5653)	Entropy 0.61733 (0.61937)	Top-1 acc 66.406 (62.111)	Top-5 acc 86.328 (82.783)	lr 0.00941
Train [70][1770/3239]	Time 0.262 (0.741)	Data Time 0.001 (0.227)	Loss 2.5825 (2.5653)	Entropy 0.61696 (0.61935)	Top-1 acc 60.938 (62.108)	Top-5 acc 82.031 (82.782)	lr 0.00941
Train [70][1780/3239]	Time 0.236 (0.739)	Data Time 0.001 (0.225)	Loss 2.8356 (2.5655)	Entropy 0.61697 (0.61934)	Top-1 acc 56.641 (62.107)	Top-5 acc 77.344 (82.777)	lr 0.00941
Train [70][1790/3239]	Time 0.230 (0.737)	Data Time 0.001 (0.224)	Loss 2.5735 (2.5659)	Entropy 0.61708 (0.61933)	Top-1 acc 58.594 (62.094)	Top-5 acc 80.859 (82.768)	lr 0.00941
Train [70][1800/3239]	Time 0.251 (0.737)	Data Time 0.001 (0.224)	Loss 2.5466 (2.5659)	Entropy 0.61721 (0.61932)	Top-1 acc 64.062 (62.098)	Top-5 acc 82.422 (82.769)	lr 0.00941
Train [70][1810/3239]	Time 0.253 (0.737)	Data Time 0.001 (0.224)	Loss 2.7370 (2.5659)	Entropy 0.61703 (0.61930)	Top-1 acc 56.250 (62.097)	Top-5 acc 79.297 (82.770)	lr 0.00940
Train [70][1820/3239]	Time 0.261 (0.735)	Data Time 0.001 (0.223)	Loss 2.5409 (2.5660)	Entropy 0.61735 (0.61929)	Top-1 acc 64.844 (62.092)	Top-5 acc 81.641 (82.766)	lr 0.00940
Train [70][1830/3239]	Time 1.165 (0.742)	Data Time 0.885 (0.230)	Loss 2.6107 (2.5662)	Entropy 0.61741 (0.61928)	Top-1 acc 58.594 (62.087)	Top-5 acc 81.641 (82.757)	lr 0.00940
Train [70][1840/3239]	Time 0.264 (0.741)	Data Time 0.001 (0.229)	Loss 2.5965 (2.5661)	Entropy 0.61725 (0.61927)	Top-1 acc 62.109 (62.089)	Top-5 acc 82.422 (82.761)	lr 0.00940
Train [70][1850/3239]	Time 0.242 (0.739)	Data Time 0.001 (0.228)	Loss 2.6350 (2.5662)	Entropy 0.61726 (0.61926)	Top-1 acc 61.719 (62.088)	Top-5 acc 80.078 (82.760)	lr 0.00940
Train [70][1860/3239]	Time 2.629 (0.745)	Data Time 2.376 (0.234)	Loss 2.7186 (2.5664)	Entropy 0.61676 (0.61925)	Top-1 acc 57.812 (62.081)	Top-5 acc 77.734 (82.752)	lr 0.00940
Train [70][1870/3239]	Time 0.245 (0.744)	Data Time 0.001 (0.234)	Loss 2.5348 (2.5662)	Entropy 0.61703 (0.61924)	Top-1 acc 64.844 (62.089)	Top-5 acc 86.328 (82.754)	lr 0.00940
Train [70][1880/3239]	Time 0.516 (0.743)	Data Time 0.280 (0.233)	Loss 2.8907 (2.5663)	Entropy 0.61692 (0.61922)	Top-1 acc 55.469 (62.093)	Top-5 acc 78.125 (82.753)	lr 0.00940
Train [70][1890/3239]	Time 5.932 (0.744)	Data Time 5.565 (0.235)	Loss 2.5070 (2.5665)	Entropy 0.61679 (0.61921)	Top-1 acc 67.188 (62.090)	Top-5 acc 84.766 (82.750)	lr 0.00940
Train [70][1900/3239]	Time 0.233 (0.747)	Data Time 0.001 (0.238)	Loss 2.5562 (2.5666)	Entropy 0.61659 (0.61920)	Top-1 acc 57.812 (62.079)	Top-5 acc 83.203 (82.751)	lr 0.00940
Train [70][1910/3239]	Time 0.235 (0.747)	Data Time 0.001 (0.239)	Loss 2.4538 (2.5670)	Entropy 0.61694 (0.61919)	Top-1 acc 61.719 (62.069)	Top-5 acc 84.375 (82.746)	lr 0.00939
Train [70][1920/3239]	Time 0.255 (0.745)	Data Time 0.001 (0.237)	Loss 2.3536 (2.5668)	Entropy 0.61707 (0.61917)	Top-1 acc 68.359 (62.071)	Top-5 acc 87.500 (82.750)	lr 0.00939
Train [70][1930/3239]	Time 3.582 (0.752)	Data Time 3.328 (0.244)	Loss 2.4642 (2.5668)	Entropy 0.61728 (0.61916)	Top-1 acc 63.672 (62.074)	Top-5 acc 84.375 (82.748)	lr 0.00939
Train [70][1940/3239]	Time 0.250 (0.752)	Data Time 0.001 (0.245)	Loss 2.4883 (2.5667)	Entropy 0.61705 (0.61915)	Top-1 acc 60.547 (62.074)	Top-5 acc 84.375 (82.754)	lr 0.00939
Train [70][1950/3239]	Time 0.243 (0.751)	Data Time 0.001 (0.244)	Loss 2.6548 (2.5670)	Entropy 0.61730 (0.61914)	Top-1 acc 61.328 (62.065)	Top-5 acc 78.906 (82.744)	lr 0.00939
Train [70][1960/3239]	Time 0.363 (0.754)	Data Time 0.001 (0.248)	Loss 2.5131 (2.5669)	Entropy 0.61733 (0.61913)	Top-1 acc 63.672 (62.064)	Top-5 acc 84.375 (82.749)	lr 0.00939
Train [70][1970/3239]	Time 0.255 (0.756)	Data Time 0.001 (0.250)	Loss 2.6070 (2.5669)	Entropy 0.61733 (0.61912)	Top-1 acc 59.375 (62.064)	Top-5 acc 82.812 (82.749)	lr 0.00939
Train [70][1980/3239]	Time 0.242 (0.754)	Data Time 0.001 (0.248)	Loss 2.7465 (2.5666)	Entropy 0.61741 (0.61912)	Top-1 acc 60.156 (62.072)	Top-5 acc 78.125 (82.755)	lr 0.00939
Train [70][1990/3239]	Time 2.618 (0.759)	Data Time 2.389 (0.254)	Loss 2.5280 (2.5668)	Entropy 0.61740 (0.61911)	Top-1 acc 62.891 (62.071)	Top-5 acc 82.031 (82.753)	lr 0.00939
Train [70][2000/3239]	Time 0.233 (0.761)	Data Time 0.001 (0.256)	Loss 2.6418 (2.5669)	Entropy 0.61756 (0.61910)	Top-1 acc 60.938 (62.067)	Top-5 acc 79.297 (82.750)	lr 0.00939
Train [70][2010/3239]	Time 0.243 (0.760)	Data Time 0.001 (0.256)	Loss 2.7029 (2.5671)	Entropy 0.61750 (0.61909)	Top-1 acc 60.547 (62.059)	Top-5 acc 82.031 (82.751)	lr 0.00938
Train [70][2020/3239]	Time 0.279 (0.763)	Data Time 0.002 (0.259)	Loss 2.6644 (2.5672)	Entropy 0.61726 (0.61908)	Top-1 acc 58.594 (62.056)	Top-5 acc 80.469 (82.749)	lr 0.00938
Train [70][2030/3239]	Time 0.258 (0.765)	Data Time 0.001 (0.261)	Loss 2.5836 (2.5673)	Entropy 0.61673 (0.61907)	Top-1 acc 60.156 (62.054)	Top-5 acc 83.203 (82.749)	lr 0.00938
Train [70][2040/3239]	Time 0.262 (0.765)	Data Time 0.002 (0.261)	Loss 2.6414 (2.5673)	Entropy 0.61694 (0.61906)	Top-1 acc 65.234 (62.053)	Top-5 acc 82.812 (82.749)	lr 0.00938
Train [70][2050/3239]	Time 4.603 (0.765)	Data Time 4.250 (0.262)	Loss 2.5456 (2.5677)	Entropy 0.61700 (0.61905)	Top-1 acc 63.672 (62.044)	Top-5 acc 81.641 (82.742)	lr 0.00938
Train [70][2060/3239]	Time 0.220 (0.769)	Data Time 0.001 (0.266)	Loss 2.5357 (2.5675)	Entropy 0.61717 (0.61904)	Top-1 acc 66.016 (62.046)	Top-5 acc 83.203 (82.744)	lr 0.00938
Train [70][2070/3239]	Time 0.234 (0.770)	Data Time 0.001 (0.268)	Loss 2.8170 (2.5676)	Entropy 0.61732 (0.61903)	Top-1 acc 58.203 (62.046)	Top-5 acc 77.344 (82.738)	lr 0.00938
Train [70][2080/3239]	Time 0.224 (0.769)	Data Time 0.001 (0.267)	Loss 2.6120 (2.5678)	Entropy 0.61736 (0.61902)	Top-1 acc 58.984 (62.038)	Top-5 acc 82.812 (82.736)	lr 0.00938
Train [70][2090/3239]	Time 0.244 (0.773)	Data Time 0.001 (0.272)	Loss 2.5164 (2.5677)	Entropy 0.61727 (0.61901)	Top-1 acc 68.359 (62.043)	Top-5 acc 85.156 (82.740)	lr 0.00938
Train [70][2100/3239]	Time 0.235 (0.775)	Data Time 0.001 (0.274)	Loss 2.4883 (2.5677)	Entropy 0.61717 (0.61901)	Top-1 acc 64.453 (62.042)	Top-5 acc 86.328 (82.744)	lr 0.00938
Train [70][2110/3239]	Time 0.225 (0.774)	Data Time 0.001 (0.273)	Loss 2.5009 (2.5676)	Entropy 0.61710 (0.61900)	Top-1 acc 64.062 (62.041)	Top-5 acc 81.250 (82.745)	lr 0.00938
Train [70][2120/3239]	Time 0.319 (0.781)	Data Time 0.001 (0.281)	Loss 2.5936 (2.5677)	Entropy 0.61746 (0.61899)	Top-1 acc 59.766 (62.038)	Top-5 acc 83.594 (82.746)	lr 0.00937
Train [70][2130/3239]	Time 0.245 (0.781)	Data Time 0.001 (0.281)	Loss 2.4791 (2.5677)	Entropy 0.61739 (0.61898)	Top-1 acc 67.578 (62.035)	Top-5 acc 84.375 (82.746)	lr 0.00937
Train [70][2140/3239]	Time 0.260 (0.779)	Data Time 0.001 (0.280)	Loss 2.3553 (2.5675)	Entropy 0.61728 (0.61897)	Top-1 acc 68.750 (62.043)	Top-5 acc 87.500 (82.755)	lr 0.00937
Train [70][2150/3239]	Time 2.441 (0.786)	Data Time 2.179 (0.286)	Loss 2.5111 (2.5673)	Entropy 0.61726 (0.61897)	Top-1 acc 62.500 (62.044)	Top-5 acc 82.812 (82.756)	lr 0.00937
Train [70][2160/3239]	Time 0.239 (0.787)	Data Time 0.001 (0.289)	Loss 2.6121 (2.5673)	Entropy 0.61740 (0.61896)	Top-1 acc 62.109 (62.043)	Top-5 acc 81.641 (82.754)	lr 0.00937
Train [70][2170/3239]	Time 0.226 (0.786)	Data Time 0.001 (0.288)	Loss 2.4908 (2.5677)	Entropy 0.61738 (0.61895)	Top-1 acc 61.328 (62.032)	Top-5 acc 84.375 (82.747)	lr 0.00937
Train [70][2180/3239]	Time 0.230 (0.791)	Data Time 0.001 (0.293)	Loss 2.5194 (2.5676)	Entropy 0.61745 (0.61894)	Top-1 acc 61.719 (62.033)	Top-5 acc 83.203 (82.754)	lr 0.00937
Train [70][2190/3239]	Time 0.241 (0.795)	Data Time 0.001 (0.297)	Loss 2.4140 (2.5673)	Entropy 0.61756 (0.61894)	Top-1 acc 62.109 (62.039)	Top-5 acc 87.500 (82.758)	lr 0.00937
Train [70][2200/3239]	Time 0.239 (0.793)	Data Time 0.001 (0.296)	Loss 2.6272 (2.5676)	Entropy 0.61762 (0.61893)	Top-1 acc 58.203 (62.034)	Top-5 acc 78.125 (82.751)	lr 0.00937
Train [70][2210/3239]	Time 11.415 (0.796)	Data Time 11.125 (0.300)	Loss 2.5402 (2.5675)	Entropy 0.61795 (0.61893)	Top-1 acc 64.844 (62.042)	Top-5 acc 85.156 (82.754)	lr 0.00937
Train [70][2220/3239]	Time 0.242 (0.800)	Data Time 0.001 (0.304)	Loss 2.4972 (2.5673)	Entropy 0.61762 (0.61892)	Top-1 acc 64.062 (62.048)	Top-5 acc 83.203 (82.758)	lr 0.00936
Train [70][2230/3239]	Time 0.242 (0.801)	Data Time 0.001 (0.305)	Loss 2.3796 (2.5672)	Entropy 0.61787 (0.61891)	Top-1 acc 65.625 (62.052)	Top-5 acc 85.938 (82.762)	lr 0.00936
Train [70][2240/3239]	Time 0.241 (0.799)	Data Time 0.001 (0.303)	Loss 3.0785 (2.5676)	Entropy 0.61821 (0.61891)	Top-1 acc 49.219 (62.045)	Top-5 acc 72.266 (82.753)	lr 0.00936
Train [70][2250/3239]	Time 9.854 (0.808)	Data Time 9.610 (0.312)	Loss 2.6914 (2.5675)	Entropy 0.61828 (0.61891)	Top-1 acc 59.375 (62.047)	Top-5 acc 78.906 (82.753)	lr 0.00936
Train [70][2260/3239]	Time 0.243 (0.809)	Data Time 0.001 (0.314)	Loss 2.5483 (2.5674)	Entropy 0.61845 (0.61890)	Top-1 acc 63.281 (62.050)	Top-5 acc 82.031 (82.752)	lr 0.00936
Train [70][2270/3239]	Time 0.233 (0.807)	Data Time 0.001 (0.312)	Loss 2.5865 (2.5675)	Entropy 0.61828 (0.61890)	Top-1 acc 59.766 (62.044)	Top-5 acc 82.422 (82.747)	lr 0.00936
Train [70][2280/3239]	Time 0.349 (0.813)	Data Time 0.001 (0.318)	Loss 2.5561 (2.5679)	Entropy 0.61823 (0.61890)	Top-1 acc 62.891 (62.037)	Top-5 acc 82.031 (82.738)	lr 0.00936
Train [70][2290/3239]	Time 1.315 (0.817)	Data Time 1.085 (0.323)	Loss 2.7004 (2.5682)	Entropy 0.61829 (0.61890)	Top-1 acc 59.766 (62.032)	Top-5 acc 78.516 (82.734)	lr 0.00936
Train [70][2300/3239]	Time 0.242 (0.815)	Data Time 0.001 (0.322)	Loss 2.5917 (2.5683)	Entropy 0.61840 (0.61889)	Top-1 acc 66.016 (62.030)	Top-5 acc 82.422 (82.729)	lr 0.00936
Train [70][2310/3239]	Time 0.247 (0.821)	Data Time 0.001 (0.328)	Loss 2.6303 (2.5682)	Entropy 0.61806 (0.61889)	Top-1 acc 57.812 (62.027)	Top-5 acc 83.203 (82.730)	lr 0.00936
Train [70][2320/3239]	Time 0.279 (0.822)	Data Time 0.001 (0.329)	Loss 2.7672 (2.5683)	Entropy 0.61797 (0.61889)	Top-1 acc 58.984 (62.025)	Top-5 acc 78.906 (82.725)	lr 0.00935
Train [70][2330/3239]	Time 0.225 (0.826)	Data Time 0.001 (0.333)	Loss 2.6221 (2.5684)	Entropy 0.61796 (0.61888)	Top-1 acc 61.719 (62.026)	Top-5 acc 82.812 (82.724)	lr 0.00935
Train [70][2340/3239]	Time 0.249 (0.824)	Data Time 0.001 (0.332)	Loss 2.4911 (2.5681)	Entropy 0.61808 (0.61888)	Top-1 acc 64.453 (62.030)	Top-5 acc 84.375 (82.728)	lr 0.00935
Train [70][2350/3239]	Time 0.370 (0.829)	Data Time 0.001 (0.337)	Loss 2.5000 (2.5682)	Entropy 0.61723 (0.61887)	Top-1 acc 62.109 (62.029)	Top-5 acc 80.859 (82.725)	lr 0.00935
Train [70][2360/3239]	Time 5.140 (0.835)	Data Time 4.887 (0.343)	Loss 2.5797 (2.5686)	Entropy 0.61719 (0.61887)	Top-1 acc 65.625 (62.020)	Top-5 acc 81.641 (82.718)	lr 0.00935
Train [70][2370/3239]	Time 0.249 (0.833)	Data Time 0.001 (0.342)	Loss 2.5716 (2.5686)	Entropy 0.61735 (0.61886)	Top-1 acc 61.328 (62.017)	Top-5 acc 83.203 (82.717)	lr 0.00935
Train [70][2380/3239]	Time 0.271 (0.837)	Data Time 0.001 (0.346)	Loss 2.3807 (2.5685)	Entropy 0.61766 (0.61886)	Top-1 acc 69.531 (62.025)	Top-5 acc 85.938 (82.720)	lr 0.00935
Train [70][2390/3239]	Time 0.241 (0.856)	Data Time 0.002 (0.345)	Loss 2.4935 (2.5682)	Entropy 0.61746 (0.61885)	Top-1 acc 64.062 (62.035)	Top-5 acc 86.328 (82.725)	lr 0.00935
Train [70][2400/3239]	Time 0.243 (0.854)	Data Time 0.001 (0.343)	Loss 2.3637 (2.5682)	Entropy 0.61767 (0.61884)	Top-1 acc 69.531 (62.037)	Top-5 acc 85.156 (82.725)	lr 0.00935
Train [70][2410/3239]	Time 0.267 (0.852)	Data Time 0.002 (0.342)	Loss 2.5514 (2.5682)	Entropy 0.61782 (0.61884)	Top-1 acc 59.766 (62.035)	Top-5 acc 85.547 (82.725)	lr 0.00935
Train [70][2420/3239]	Time 0.264 (0.851)	Data Time 0.001 (0.340)	Loss 2.4534 (2.5681)	Entropy 0.61756 (0.61884)	Top-1 acc 63.672 (62.035)	Top-5 acc 86.328 (82.725)	lr 0.00934
Train [70][2430/3239]	Time 0.262 (0.849)	Data Time 0.001 (0.339)	Loss 2.4999 (2.5682)	Entropy 0.61792 (0.61883)	Top-1 acc 58.984 (62.030)	Top-5 acc 85.156 (82.722)	lr 0.00934
Train [70][2440/3239]	Time 0.350 (0.851)	Data Time 0.001 (0.342)	Loss 2.3913 (2.5682)	Entropy 0.61828 (0.61883)	Top-1 acc 65.625 (62.032)	Top-5 acc 88.281 (82.722)	lr 0.00934
Train [70][2450/3239]	Time 0.348 (0.854)	Data Time 0.093 (0.345)	Loss 2.5738 (2.5682)	Entropy 0.61836 (0.61883)	Top-1 acc 61.328 (62.032)	Top-5 acc 82.812 (82.722)	lr 0.00934
Train [70][2460/3239]	Time 0.266 (0.855)	Data Time 0.001 (0.346)	Loss 2.5770 (2.5683)	Entropy 0.61810 (0.61882)	Top-1 acc 57.812 (62.030)	Top-5 acc 82.812 (82.722)	lr 0.00934
Train [70][2470/3239]	Time 1.663 (0.857)	Data Time 1.410 (0.349)	Loss 2.7153 (2.5684)	Entropy 0.61797 (0.61882)	Top-1 acc 58.203 (62.029)	Top-5 acc 78.516 (82.715)	lr 0.00934
Train [70][2480/3239]	Time 0.239 (0.856)	Data Time 0.001 (0.348)	Loss 2.4914 (2.5687)	Entropy 0.61763 (0.61882)	Top-1 acc 67.188 (62.022)	Top-5 acc 83.984 (82.713)	lr 0.00934
Train [70][2490/3239]	Time 0.258 (0.860)	Data Time 0.001 (0.352)	Loss 2.4994 (2.5685)	Entropy 0.61779 (0.61881)	Top-1 acc 64.844 (62.028)	Top-5 acc 85.156 (82.714)	lr 0.00934
Train [70][2500/3239]	Time 2.362 (0.859)	Data Time 2.115 (0.351)	Loss 2.7338 (2.5687)	Entropy 0.61779 (0.61881)	Top-1 acc 61.328 (62.027)	Top-5 acc 80.859 (82.707)	lr 0.00934
Train [70][2510/3239]	Time 0.325 (0.862)	Data Time 0.001 (0.355)	Loss 2.6040 (2.5687)	Entropy 0.61784 (0.61880)	Top-1 acc 61.328 (62.027)	Top-5 acc 81.641 (82.712)	lr 0.00934
Train [70][2520/3239]	Time 2.864 (0.865)	Data Time 2.579 (0.358)	Loss 2.5566 (2.5687)	Entropy 0.61815 (0.61880)	Top-1 acc 63.281 (62.029)	Top-5 acc 80.469 (82.713)	lr 0.00934
Train [70][2530/3239]	Time 0.249 (0.863)	Data Time 0.002 (0.357)	Loss 2.5287 (2.5688)	Entropy 0.61845 (0.61880)	Top-1 acc 63.672 (62.031)	Top-5 acc 81.641 (82.708)	lr 0.00933
Train [70][2540/3239]	Time 0.234 (0.868)	Data Time 0.001 (0.362)	Loss 2.5273 (2.5683)	Entropy 0.61848 (0.61880)	Top-1 acc 63.281 (62.042)	Top-5 acc 82.812 (82.717)	lr 0.00933
Train [70][2550/3239]	Time 0.252 (0.869)	Data Time 0.001 (0.363)	Loss 2.5222 (2.5685)	Entropy 0.61831 (0.61880)	Top-1 acc 63.672 (62.036)	Top-5 acc 83.984 (82.714)	lr 0.00933
Train [70][2560/3239]	Time 0.227 (0.868)	Data Time 0.001 (0.363)	Loss 2.6704 (2.5683)	Entropy 0.61812 (0.61879)	Top-1 acc 58.984 (62.038)	Top-5 acc 82.812 (82.714)	lr 0.00933
Train [70][2570/3239]	Time 1.920 (0.873)	Data Time 1.675 (0.368)	Loss 2.3563 (2.5684)	Entropy 0.61832 (0.61879)	Top-1 acc 67.188 (62.038)	Top-5 acc 85.156 (82.710)	lr 0.00933
Train [70][2580/3239]	Time 0.239 (0.873)	Data Time 0.001 (0.368)	Loss 2.8054 (2.5683)	Entropy 0.61838 (0.61879)	Top-1 acc 57.812 (62.038)	Top-5 acc 76.172 (82.711)	lr 0.00933
Train [70][2590/3239]	Time 0.251 (0.874)	Data Time 0.001 (0.369)	Loss 2.7409 (2.5685)	Entropy 0.61837 (0.61879)	Top-1 acc 56.250 (62.031)	Top-5 acc 79.297 (82.707)	lr 0.00933
Train [70][2600/3239]	Time 0.329 (0.876)	Data Time 0.001 (0.372)	Loss 2.3642 (2.5684)	Entropy 0.61864 (0.61879)	Top-1 acc 66.406 (62.031)	Top-5 acc 85.156 (82.706)	lr 0.00933
Train [70][2610/3239]	Time 0.239 (0.878)	Data Time 0.001 (0.375)	Loss 2.4861 (2.5682)	Entropy 0.61887 (0.61879)	Top-1 acc 62.891 (62.035)	Top-5 acc 82.422 (82.711)	lr 0.00933
Train [70][2620/3239]	Time 0.275 (0.878)	Data Time 0.001 (0.375)	Loss 2.6560 (2.5681)	Entropy 0.61909 (0.61879)	Top-1 acc 58.984 (62.032)	Top-5 acc 80.859 (82.713)	lr 0.00933
Train [70][2630/3239]	Time 6.642 (0.880)	Data Time 6.385 (0.377)	Loss 2.4023 (2.5679)	Entropy 0.61915 (0.61879)	Top-1 acc 64.844 (62.043)	Top-5 acc 85.547 (82.718)	lr 0.00932
Train [70][2640/3239]	Time 0.254 (0.881)	Data Time 0.001 (0.378)	Loss 2.7334 (2.5680)	Entropy 0.61937 (0.61879)	Top-1 acc 58.203 (62.039)	Top-5 acc 79.688 (82.716)	lr 0.00932
Train [70][2650/3239]	Time 0.235 (0.883)	Data Time 0.001 (0.380)	Loss 2.5747 (2.5683)	Entropy 0.61948 (0.61879)	Top-1 acc 62.500 (62.030)	Top-5 acc 81.250 (82.710)	lr 0.00932
Train [70][2660/3239]	Time 0.961 (0.881)	Data Time 0.714 (0.379)	Loss 2.6919 (2.5684)	Entropy 0.61959 (0.61879)	Top-1 acc 59.766 (62.031)	Top-5 acc 79.297 (82.709)	lr 0.00932
Train [70][2670/3239]	Time 0.328 (0.887)	Data Time 0.001 (0.385)	Loss 2.4061 (2.5682)	Entropy 0.61930 (0.61880)	Top-1 acc 63.281 (62.035)	Top-5 acc 85.938 (82.713)	lr 0.00932
Train [70][2680/3239]	Time 0.240 (0.889)	Data Time 0.001 (0.387)	Loss 2.4774 (2.5682)	Entropy 0.61934 (0.61880)	Top-1 acc 63.672 (62.039)	Top-5 acc 84.375 (82.716)	lr 0.00932
Train [70][2690/3239]	Time 0.253 (0.887)	Data Time 0.001 (0.385)	Loss 2.7039 (2.5683)	Entropy 0.61965 (0.61880)	Top-1 acc 57.812 (62.039)	Top-5 acc 79.688 (82.714)	lr 0.00932
Train [70][2700/3239]	Time 0.244 (0.891)	Data Time 0.001 (0.390)	Loss 2.5290 (2.5683)	Entropy 0.61952 (0.61880)	Top-1 acc 64.453 (62.040)	Top-5 acc 85.156 (82.714)	lr 0.00932
Train [70][2710/3239]	Time 0.247 (0.894)	Data Time 0.001 (0.393)	Loss 2.7447 (2.5685)	Entropy 0.61967 (0.61881)	Top-1 acc 55.469 (62.035)	Top-5 acc 78.906 (82.709)	lr 0.00932
Train [70][2720/3239]	Time 0.235 (0.892)	Data Time 0.001 (0.392)	Loss 2.5237 (2.5685)	Entropy 0.61975 (0.61881)	Top-1 acc 65.234 (62.031)	Top-5 acc 83.203 (82.711)	lr 0.00932
Train [70][2730/3239]	Time 1.951 (0.895)	Data Time 1.704 (0.394)	Loss 2.5635 (2.5684)	Entropy 0.61984 (0.61881)	Top-1 acc 64.062 (62.035)	Top-5 acc 83.984 (82.714)	lr 0.00931
Train [70][2740/3239]	Time 0.246 (0.896)	Data Time 0.001 (0.396)	Loss 2.7108 (2.5683)	Entropy 0.61982 (0.61882)	Top-1 acc 58.984 (62.033)	Top-5 acc 78.125 (82.714)	lr 0.00931
Train [70][2750/3239]	Time 0.254 (0.896)	Data Time 0.001 (0.397)	Loss 2.6043 (2.5684)	Entropy 0.61983 (0.61882)	Top-1 acc 60.547 (62.031)	Top-5 acc 81.641 (82.712)	lr 0.00931
Train [70][2760/3239]	Time 0.287 (0.898)	Data Time 0.001 (0.398)	Loss 2.5071 (2.5685)	Entropy 0.61999 (0.61882)	Top-1 acc 62.500 (62.027)	Top-5 acc 84.766 (82.707)	lr 0.00931
Train [70][2770/3239]	Time 0.266 (0.901)	Data Time 0.001 (0.402)	Loss 2.6872 (2.5689)	Entropy 0.62000 (0.61883)	Top-1 acc 60.156 (62.021)	Top-5 acc 82.422 (82.701)	lr 0.00931
Train [70][2780/3239]	Time 0.241 (0.901)	Data Time 0.002 (0.403)	Loss 2.8292 (2.5690)	Entropy 0.61987 (0.61883)	Top-1 acc 56.641 (62.012)	Top-5 acc 79.297 (82.701)	lr 0.00931
Train [70][2790/3239]	Time 8.024 (0.902)	Data Time 7.766 (0.404)	Loss 2.5010 (2.5691)	Entropy 0.61992 (0.61884)	Top-1 acc 65.625 (62.013)	Top-5 acc 84.375 (82.700)	lr 0.00931
Train [70][2800/3239]	Time 0.231 (0.902)	Data Time 0.001 (0.404)	Loss 2.7487 (2.5693)	Entropy 0.61982 (0.61884)	Top-1 acc 54.688 (62.010)	Top-5 acc 79.297 (82.698)	lr 0.00931
Train [70][2810/3239]	Time 0.252 (0.905)	Data Time 0.001 (0.407)	Loss 2.6489 (2.5693)	Entropy 0.61990 (0.61884)	Top-1 acc 60.938 (62.006)	Top-5 acc 82.031 (82.699)	lr 0.00931
Train [70][2820/3239]	Time 0.271 (0.903)	Data Time 0.001 (0.405)	Loss 2.7649 (2.5693)	Entropy 0.62002 (0.61885)	Top-1 acc 55.078 (62.005)	Top-5 acc 80.859 (82.698)	lr 0.00931
Train [70][2830/3239]	Time 0.317 (0.905)	Data Time 0.001 (0.408)	Loss 2.6420 (2.5695)	Entropy 0.62024 (0.61885)	Top-1 acc 59.766 (61.999)	Top-5 acc 80.469 (82.693)	lr 0.00930
Train [70][2840/3239]	Time 0.232 (0.908)	Data Time 0.001 (0.412)	Loss 2.5878 (2.5693)	Entropy 0.62017 (0.61886)	Top-1 acc 58.594 (62.002)	Top-5 acc 82.422 (82.697)	lr 0.00930
Train [70][2850/3239]	Time 0.233 (0.907)	Data Time 0.001 (0.410)	Loss 2.6888 (2.5694)	Entropy 0.61993 (0.61886)	Top-1 acc 58.203 (62.000)	Top-5 acc 80.078 (82.695)	lr 0.00930
Train [70][2860/3239]	Time 0.224 (0.911)	Data Time 0.001 (0.415)	Loss 2.7699 (2.5695)	Entropy 0.62025 (0.61886)	Top-1 acc 57.422 (61.993)	Top-5 acc 78.125 (82.695)	lr 0.00930
Train [70][2870/3239]	Time 0.275 (0.912)	Data Time 0.002 (0.417)	Loss 2.4541 (2.5696)	Entropy 0.61977 (0.61887)	Top-1 acc 64.844 (61.988)	Top-5 acc 86.719 (82.697)	lr 0.00930
Train [70][2880/3239]	Time 0.236 (0.911)	Data Time 0.001 (0.415)	Loss 2.5663 (2.5696)	Entropy 0.61988 (0.61887)	Top-1 acc 65.625 (61.991)	Top-5 acc 81.641 (82.695)	lr 0.00930
Train [70][2890/3239]	Time 0.227 (0.916)	Data Time 0.001 (0.421)	Loss 2.5107 (2.5697)	Entropy 0.61982 (0.61888)	Top-1 acc 62.109 (61.986)	Top-5 acc 83.203 (82.693)	lr 0.00930
Train [70][2900/3239]	Time 0.360 (0.917)	Data Time 0.001 (0.422)	Loss 2.5558 (2.5697)	Entropy 0.61964 (0.61888)	Top-1 acc 58.984 (61.985)	Top-5 acc 81.250 (82.692)	lr 0.00930
Train [70][2910/3239]	Time 0.234 (0.916)	Data Time 0.001 (0.421)	Loss 2.4425 (2.5694)	Entropy 0.61949 (0.61888)	Top-1 acc 66.406 (61.991)	Top-5 acc 83.984 (82.694)	lr 0.00930
Train [70][2920/3239]	Time 0.265 (0.918)	Data Time 0.001 (0.424)	Loss 2.6366 (2.5694)	Entropy 0.61966 (0.61888)	Top-1 acc 60.156 (61.991)	Top-5 acc 78.906 (82.694)	lr 0.00930
Train [70][2930/3239]	Time 0.237 (0.922)	Data Time 0.001 (0.427)	Loss 2.3946 (2.5693)	Entropy 0.61984 (0.61889)	Top-1 acc 66.797 (61.994)	Top-5 acc 85.938 (82.696)	lr 0.00930
Train [70][2940/3239]	Time 0.238 (0.922)	Data Time 0.001 (0.428)	Loss 2.5756 (2.5692)	Entropy 0.61988 (0.61889)	Top-1 acc 64.844 (61.998)	Top-5 acc 82.422 (82.697)	lr 0.00929
Train [70][2950/3239]	Time 7.412 (0.923)	Data Time 7.161 (0.429)	Loss 2.6383 (2.5692)	Entropy 0.61919 (0.61889)	Top-1 acc 61.719 (61.999)	Top-5 acc 81.250 (82.698)	lr 0.00929
Train [70][2960/3239]	Time 0.252 (0.926)	Data Time 0.001 (0.433)	Loss 2.5709 (2.5692)	Entropy 0.61916 (0.61889)	Top-1 acc 62.500 (62.001)	Top-5 acc 84.766 (82.698)	lr 0.00929
Train [70][2970/3239]	Time 0.257 (0.927)	Data Time 0.002 (0.433)	Loss 2.4541 (2.5689)	Entropy 0.61919 (0.61889)	Top-1 acc 62.109 (62.006)	Top-5 acc 83.984 (82.702)	lr 0.00929
Train [70][2980/3239]	Time 0.242 (0.925)	Data Time 0.001 (0.432)	Loss 2.5310 (2.5691)	Entropy 0.61889 (0.61890)	Top-1 acc 61.328 (62.003)	Top-5 acc 82.422 (82.698)	lr 0.00929
Train [70][2990/3239]	Time 0.368 (0.930)	Data Time 0.001 (0.437)	Loss 2.5513 (2.5690)	Entropy 0.61891 (0.61890)	Top-1 acc 62.500 (62.007)	Top-5 acc 85.547 (82.701)	lr 0.00929
Train [70][3000/3239]	Time 2.906 (0.930)	Data Time 2.662 (0.437)	Loss 2.4068 (2.5690)	Entropy 0.61927 (0.61890)	Top-1 acc 70.312 (62.007)	Top-5 acc 85.156 (82.701)	lr 0.00929
Train [70][3010/3239]	Time 0.248 (0.929)	Data Time 0.001 (0.437)	Loss 2.4910 (2.5692)	Entropy 0.61906 (0.61890)	Top-1 acc 66.406 (62.007)	Top-5 acc 81.641 (82.695)	lr 0.00929
Train [70][3020/3239]	Time 0.228 (0.934)	Data Time 0.001 (0.442)	Loss 2.4808 (2.5693)	Entropy 0.61907 (0.61890)	Top-1 acc 60.547 (62.004)	Top-5 acc 85.547 (82.693)	lr 0.00929
Train [70][3030/3239]	Time 0.228 (0.934)	Data Time 0.001 (0.442)	Loss 2.4000 (2.5691)	Entropy 0.61906 (0.61890)	Top-1 acc 66.797 (62.007)	Top-5 acc 88.281 (82.695)	lr 0.00929
Train [70][3040/3239]	Time 0.434 (0.950)	Data Time 0.004 (0.443)	Loss 2.6102 (2.5692)	Entropy 0.61935 (0.61890)	Top-1 acc 63.281 (62.000)	Top-5 acc 82.031 (82.695)	lr 0.00928
Train [70][3050/3239]	Time 0.239 (0.949)	Data Time 0.002 (0.441)	Loss 2.4196 (2.5690)	Entropy 0.61916 (0.61890)	Top-1 acc 69.141 (62.003)	Top-5 acc 87.109 (82.698)	lr 0.00928
Train [70][3060/3239]	Time 0.238 (0.947)	Data Time 0.002 (0.440)	Loss 2.5074 (2.5691)	Entropy 0.61916 (0.61890)	Top-1 acc 61.719 (62.002)	Top-5 acc 83.594 (82.697)	lr 0.00928
Train [70][3070/3239]	Time 0.239 (0.945)	Data Time 0.001 (0.439)	Loss 2.7517 (2.5688)	Entropy 0.61892 (0.61890)	Top-1 acc 56.250 (62.009)	Top-5 acc 76.172 (82.701)	lr 0.00928
Train [70][3080/3239]	Time 0.250 (0.943)	Data Time 0.001 (0.437)	Loss 2.5647 (2.5690)	Entropy 0.61912 (0.61890)	Top-1 acc 57.422 (62.003)	Top-5 acc 82.812 (82.698)	lr 0.00928
Train [70][3090/3239]	Time 0.240 (0.942)	Data Time 0.001 (0.436)	Loss 2.5106 (2.5689)	Entropy 0.61933 (0.61890)	Top-1 acc 65.234 (62.008)	Top-5 acc 82.422 (82.701)	lr 0.00928
Train [70][3100/3239]	Time 0.249 (0.940)	Data Time 0.001 (0.434)	Loss 2.5431 (2.5691)	Entropy 0.61937 (0.61890)	Top-1 acc 61.719 (62.003)	Top-5 acc 82.031 (82.696)	lr 0.00928
Train [70][3110/3239]	Time 0.242 (0.945)	Data Time 0.001 (0.439)	Loss 2.5954 (2.5692)	Entropy 0.61908 (0.61891)	Top-1 acc 62.109 (62.001)	Top-5 acc 82.031 (82.696)	lr 0.00928
Train [70][3120/3239]	Time 0.237 (0.945)	Data Time 0.001 (0.440)	Loss 2.5319 (2.5693)	Entropy 0.61860 (0.61891)	Top-1 acc 64.453 (61.998)	Top-5 acc 83.203 (82.693)	lr 0.00928
Train [70][3130/3239]	Time 0.259 (0.944)	Data Time 0.001 (0.439)	Loss 2.4312 (2.5693)	Entropy 0.61877 (0.61890)	Top-1 acc 62.891 (61.999)	Top-5 acc 85.156 (82.693)	lr 0.00928
Train [70][3140/3239]	Time 0.257 (0.949)	Data Time 0.001 (0.444)	Loss 2.6292 (2.5696)	Entropy 0.61842 (0.61890)	Top-1 acc 60.547 (61.992)	Top-5 acc 80.078 (82.688)	lr 0.00927
Train [70][3150/3239]	Time 0.372 (0.950)	Data Time 0.001 (0.445)	Loss 2.5215 (2.5697)	Entropy 0.61831 (0.61890)	Top-1 acc 64.062 (61.990)	Top-5 acc 82.812 (82.687)	lr 0.00927
Train [70][3160/3239]	Time 0.244 (0.948)	Data Time 0.001 (0.444)	Loss 2.7264 (2.5699)	Entropy 0.61830 (0.61890)	Top-1 acc 58.594 (61.987)	Top-5 acc 78.125 (82.680)	lr 0.00927
Train [70][3170/3239]	Time 0.229 (0.954)	Data Time 0.001 (0.450)	Loss 2.7281 (2.5700)	Entropy 0.61835 (0.61890)	Top-1 acc 59.766 (61.985)	Top-5 acc 79.297 (82.677)	lr 0.00927
Train [70][3180/3239]	Time 0.243 (0.954)	Data Time 0.000 (0.451)	Loss 2.5727 (2.5699)	Entropy 0.61829 (0.61890)	Top-1 acc 61.719 (61.989)	Top-5 acc 80.469 (82.678)	lr 0.00927
Train [70][3190/3239]	Time 0.237 (0.953)	Data Time 0.000 (0.449)	Loss 2.5874 (2.5699)	Entropy 0.61781 (0.61889)	Top-1 acc 56.641 (61.991)	Top-5 acc 84.375 (82.679)	lr 0.00927
Train [70][3200/3239]	Time 5.884 (0.958)	Data Time 5.638 (0.454)	Loss 2.4851 (2.5699)	Entropy 0.61795 (0.61889)	Top-1 acc 67.578 (61.991)	Top-5 acc 83.984 (82.679)	lr 0.00927
Train [70][3210/3239]	Time 0.264 (0.959)	Data Time 0.000 (0.456)	Loss 2.5465 (2.5697)	Entropy 0.61819 (0.61889)	Top-1 acc 66.016 (61.991)	Top-5 acc 80.078 (82.682)	lr 0.00927
Train [70][3220/3239]	Time 0.328 (0.957)	Data Time 0.000 (0.454)	Loss 2.6453 (2.5696)	Entropy 0.61810 (0.61889)	Top-1 acc 60.547 (61.994)	Top-5 acc 78.906 (82.684)	lr 0.00927
Train [70][3230/3239]	Time 8.245 (0.958)	Data Time 7.983 (0.456)	Loss 2.5276 (2.5694)	Entropy 0.61841 (0.61888)	Top-1 acc 62.500 (62.003)	Top-5 acc 83.594 (82.690)	lr 0.00927
Train [70][3239/3239]	Time 0.872 (0.958)	Data Time 0.000 (0.456)	Loss 2.8142 (2.5694)	Entropy 0.61847 (0.61888)	Top-1 acc 66.667 (62.001)	Top-5 acc 82.716 (82.689)	lr 0.00926
==========Valid [70/120]	loss 1.359	top-1 acc 68.757 (69.065)	top-5 acc 88.344	Train top-1 62.001	top-5 82.689	Entropy 0.61847	Latency-None: 0.000ms	Flops: 537.50M
Train [71][0/3239]	Time 41.986 (41.986)	Data Time 40.366 (40.366)	Loss 2.7516 (2.7516)	Entropy 0.61850 (0.61850)	Top-1 acc 59.375 (59.375)	Top-5 acc 79.688 (79.688)	lr 0.00926
Train [71][10/3239]	Time 0.224 (4.371)	Data Time 0.001 (3.793)	Loss 2.7533 (2.6361)	Entropy 0.61811 (0.61834)	Top-1 acc 55.859 (59.588)	Top-5 acc 80.859 (81.996)	lr 0.00926
Train [71][20/3239]	Time 0.258 (2.491)	Data Time 0.002 (1.988)	Loss 2.4067 (2.5839)	Entropy 0.61835 (0.61826)	Top-1 acc 65.234 (60.956)	Top-5 acc 87.500 (83.017)	lr 0.00926
Train [71][30/3239]	Time 0.237 (1.823)	Data Time 0.001 (1.347)	Loss 2.3272 (2.5818)	Entropy 0.61851 (0.61834)	Top-1 acc 67.578 (61.227)	Top-5 acc 85.156 (82.661)	lr 0.00926
Train [71][40/3239]	Time 0.233 (1.670)	Data Time 0.001 (1.207)	Loss 2.4154 (2.5683)	Entropy 0.61870 (0.61841)	Top-1 acc 66.016 (61.623)	Top-5 acc 84.766 (82.898)	lr 0.00926
Train [71][50/3239]	Time 0.325 (1.424)	Data Time 0.001 (0.970)	Loss 2.7218 (2.5633)	Entropy 0.61847 (0.61847)	Top-1 acc 62.500 (61.949)	Top-5 acc 78.516 (82.904)	lr 0.00926
Train [71][60/3239]	Time 0.234 (1.258)	Data Time 0.001 (0.812)	Loss 2.5830 (2.5562)	Entropy 0.61838 (0.61847)	Top-1 acc 59.375 (62.026)	Top-5 acc 86.328 (83.088)	lr 0.00926
Train [71][70/3239]	Time 0.221 (1.238)	Data Time 0.001 (0.794)	Loss 2.6669 (2.5591)	Entropy 0.61844 (0.61845)	Top-1 acc 58.203 (61.911)	Top-5 acc 78.906 (83.066)	lr 0.00926
Train [71][80/3239]	Time 0.243 (1.138)	Data Time 0.001 (0.696)	Loss 2.5011 (2.5535)	Entropy 0.61823 (0.61844)	Top-1 acc 63.281 (62.191)	Top-5 acc 85.156 (83.087)	lr 0.00926
Train [71][90/3239]	Time 0.245 (1.060)	Data Time 0.001 (0.620)	Loss 2.6212 (2.5517)	Entropy 0.61835 (0.61842)	Top-1 acc 60.547 (62.272)	Top-5 acc 81.641 (83.070)	lr 0.00926
Train [71][100/3239]	Time 0.245 (1.027)	Data Time 0.001 (0.585)	Loss 2.7319 (2.5496)	Entropy 0.61865 (0.61843)	Top-1 acc 60.547 (62.349)	Top-5 acc 80.469 (83.103)	lr 0.00926
Train [71][110/3239]	Time 0.260 (0.972)	Data Time 0.001 (0.532)	Loss 2.5460 (2.5495)	Entropy 0.61848 (0.61845)	Top-1 acc 65.625 (62.338)	Top-5 acc 82.422 (83.129)	lr 0.00925
Train [71][120/3239]	Time 0.242 (0.932)	Data Time 0.001 (0.489)	Loss 2.4966 (2.5499)	Entropy 0.61814 (0.61845)	Top-1 acc 63.281 (62.368)	Top-5 acc 86.719 (83.145)	lr 0.00925
Train [71][130/3239]	Time 0.258 (0.910)	Data Time 0.001 (0.464)	Loss 2.5792 (2.5537)	Entropy 0.61854 (0.61844)	Top-1 acc 60.547 (62.193)	Top-5 acc 82.812 (83.051)	lr 0.00925
Train [71][140/3239]	Time 0.236 (0.876)	Data Time 0.002 (0.433)	Loss 2.4726 (2.5541)	Entropy 0.61884 (0.61845)	Top-1 acc 65.234 (62.187)	Top-5 acc 82.031 (83.009)	lr 0.00925
Train [71][150/3239]	Time 0.234 (0.846)	Data Time 0.001 (0.404)	Loss 2.3216 (2.5505)	Entropy 0.61900 (0.61848)	Top-1 acc 69.141 (62.270)	Top-5 acc 88.281 (83.076)	lr 0.00925
Train [71][160/3239]	Time 1.344 (0.828)	Data Time 1.101 (0.386)	Loss 2.4850 (2.5475)	Entropy 0.61911 (0.61851)	Top-1 acc 64.844 (62.333)	Top-5 acc 83.594 (83.099)	lr 0.00925
Train [71][170/3239]	Time 0.240 (0.821)	Data Time 0.001 (0.381)	Loss 2.4018 (2.5452)	Entropy 0.61898 (0.61854)	Top-1 acc 66.406 (62.413)	Top-5 acc 86.719 (83.098)	lr 0.00925
Train [71][180/3239]	Time 0.277 (0.800)	Data Time 0.001 (0.360)	Loss 2.5479 (2.5469)	Entropy 0.61897 (0.61857)	Top-1 acc 60.938 (62.353)	Top-5 acc 81.250 (83.037)	lr 0.00925
Train [71][190/3239]	Time 0.246 (0.783)	Data Time 0.001 (0.341)	Loss 2.4546 (2.5445)	Entropy 0.61929 (0.61860)	Top-1 acc 60.156 (62.433)	Top-5 acc 85.156 (83.062)	lr 0.00925
Train [71][200/3239]	Time 0.227 (0.778)	Data Time 0.001 (0.338)	Loss 2.6179 (2.5445)	Entropy 0.61933 (0.61863)	Top-1 acc 60.547 (62.430)	Top-5 acc 80.078 (83.071)	lr 0.00925
Train [71][210/3239]	Time 0.322 (0.761)	Data Time 0.001 (0.322)	Loss 2.4492 (2.5449)	Entropy 0.61947 (0.61867)	Top-1 acc 64.844 (62.428)	Top-5 acc 83.984 (83.094)	lr 0.00924
Train [71][220/3239]	Time 0.248 (0.747)	Data Time 0.001 (0.308)	Loss 2.6499 (2.5462)	Entropy 0.61965 (0.61871)	Top-1 acc 62.109 (62.424)	Top-5 acc 80.859 (83.063)	lr 0.00924
Train [71][230/3239]	Time 0.273 (0.750)	Data Time 0.001 (0.311)	Loss 2.5135 (2.5446)	Entropy 0.61972 (0.61875)	Top-1 acc 63.672 (62.503)	Top-5 acc 84.766 (83.098)	lr 0.00924
Train [71][240/3239]	Time 0.282 (0.737)	Data Time 0.001 (0.298)	Loss 2.4215 (2.5417)	Entropy 0.61969 (0.61879)	Top-1 acc 65.234 (62.571)	Top-5 acc 83.594 (83.129)	lr 0.00924
Train [71][250/3239]	Time 0.234 (0.725)	Data Time 0.001 (0.286)	Loss 2.4406 (2.5396)	Entropy 0.61989 (0.61883)	Top-1 acc 63.672 (62.606)	Top-5 acc 85.547 (83.181)	lr 0.00924
Train [71][260/3239]	Time 2.280 (0.724)	Data Time 2.011 (0.285)	Loss 2.9649 (2.5427)	Entropy 0.61989 (0.61887)	Top-1 acc 51.953 (62.506)	Top-5 acc 74.609 (83.137)	lr 0.00924
Train [71][270/3239]	Time 0.230 (0.713)	Data Time 0.001 (0.274)	Loss 2.6662 (2.5438)	Entropy 0.62010 (0.61891)	Top-1 acc 57.031 (62.499)	Top-5 acc 82.422 (83.109)	lr 0.00924
Train [71][280/3239]	Time 0.333 (0.703)	Data Time 0.001 (0.265)	Loss 2.6908 (2.5444)	Entropy 0.62031 (0.61896)	Top-1 acc 58.594 (62.481)	Top-5 acc 81.250 (83.096)	lr 0.00924
Train [71][290/3239]	Time 0.230 (0.694)	Data Time 0.001 (0.256)	Loss 2.7040 (2.5429)	Entropy 0.62049 (0.61901)	Top-1 acc 57.812 (62.488)	Top-5 acc 82.422 (83.136)	lr 0.00924
Train [71][300/3239]	Time 0.254 (0.692)	Data Time 0.001 (0.254)	Loss 2.4362 (2.5430)	Entropy 0.62055 (0.61906)	Top-1 acc 67.188 (62.468)	Top-5 acc 85.156 (83.142)	lr 0.00924
Train [71][310/3239]	Time 0.241 (0.684)	Data Time 0.002 (0.246)	Loss 2.4899 (2.5429)	Entropy 0.62024 (0.61910)	Top-1 acc 64.453 (62.471)	Top-5 acc 84.375 (83.142)	lr 0.00923
Train [71][320/3239]	Time 0.244 (0.675)	Data Time 0.001 (0.238)	Loss 2.5844 (2.5424)	Entropy 0.62033 (0.61914)	Top-1 acc 57.422 (62.505)	Top-5 acc 85.156 (83.148)	lr 0.00923
Train [71][330/3239]	Time 0.221 (0.679)	Data Time 0.001 (0.242)	Loss 2.8470 (2.5434)	Entropy 0.62057 (0.61918)	Top-1 acc 55.859 (62.482)	Top-5 acc 79.297 (83.144)	lr 0.00923
Train [71][340/3239]	Time 0.243 (0.672)	Data Time 0.001 (0.235)	Loss 2.6231 (2.5438)	Entropy 0.62075 (0.61922)	Top-1 acc 60.938 (62.473)	Top-5 acc 81.641 (83.136)	lr 0.00923
Train [71][350/3239]	Time 0.291 (0.665)	Data Time 0.003 (0.229)	Loss 2.5017 (2.5419)	Entropy 0.62100 (0.61927)	Top-1 acc 63.672 (62.526)	Top-5 acc 84.766 (83.170)	lr 0.00923
Train [71][360/3239]	Time 0.246 (0.665)	Data Time 0.001 (0.228)	Loss 2.3750 (2.5420)	Entropy 0.62100 (0.61932)	Top-1 acc 65.625 (62.532)	Top-5 acc 87.500 (83.176)	lr 0.00923
Train [71][370/3239]	Time 0.385 (0.659)	Data Time 0.002 (0.222)	Loss 2.4994 (2.5405)	Entropy 0.62120 (0.61936)	Top-1 acc 61.328 (62.597)	Top-5 acc 82.031 (83.202)	lr 0.00923
Train [71][380/3239]	Time 0.233 (0.653)	Data Time 0.001 (0.216)	Loss 2.6312 (2.5430)	Entropy 0.62146 (0.61941)	Top-1 acc 62.109 (62.548)	Top-5 acc 83.594 (83.165)	lr 0.00923
Train [71][390/3239]	Time 0.238 (0.647)	Data Time 0.001 (0.211)	Loss 2.4727 (2.5430)	Entropy 0.62130 (0.61947)	Top-1 acc 63.281 (62.531)	Top-5 acc 85.156 (83.170)	lr 0.00923
Train [71][400/3239]	Time 0.230 (0.643)	Data Time 0.001 (0.207)	Loss 2.7141 (2.5443)	Entropy 0.62090 (0.61951)	Top-1 acc 60.938 (62.518)	Top-5 acc 80.859 (83.122)	lr 0.00923
Train [71][410/3239]	Time 0.279 (0.637)	Data Time 0.003 (0.202)	Loss 2.4875 (2.5438)	Entropy 0.62076 (0.61954)	Top-1 acc 63.281 (62.547)	Top-5 acc 83.984 (83.129)	lr 0.00922
Train [71][420/3239]	Time 0.243 (0.637)	Data Time 0.001 (0.201)	Loss 2.7561 (2.5450)	Entropy 0.62055 (0.61957)	Top-1 acc 58.594 (62.535)	Top-5 acc 80.859 (83.113)	lr 0.00922
Train [71][430/3239]	Time 0.224 (0.631)	Data Time 0.001 (0.197)	Loss 2.4232 (2.5451)	Entropy 0.62023 (0.61959)	Top-1 acc 67.578 (62.555)	Top-5 acc 82.812 (83.103)	lr 0.00922
Train [71][440/3239]	Time 0.344 (0.626)	Data Time 0.001 (0.192)	Loss 2.4874 (2.5463)	Entropy 0.62005 (0.61960)	Top-1 acc 62.500 (62.540)	Top-5 acc 83.594 (83.072)	lr 0.00922
Train [71][450/3239]	Time 0.244 (0.624)	Data Time 0.001 (0.189)	Loss 2.4402 (2.5465)	Entropy 0.62055 (0.61962)	Top-1 acc 62.500 (62.510)	Top-5 acc 84.375 (83.063)	lr 0.00922
Train [71][460/3239]	Time 0.246 (0.732)	Data Time 0.002 (0.189)	Loss 2.4512 (2.5461)	Entropy 0.62081 (0.61964)	Top-1 acc 63.672 (62.508)	Top-5 acc 86.719 (83.089)	lr 0.00922
Train [71][470/3239]	Time 0.249 (0.725)	Data Time 0.001 (0.185)	Loss 2.4739 (2.5456)	Entropy 0.62068 (0.61966)	Top-1 acc 64.844 (62.536)	Top-5 acc 84.766 (83.099)	lr 0.00922
Train [71][480/3239]	Time 0.231 (0.718)	Data Time 0.001 (0.181)	Loss 2.7620 (2.5459)	Entropy 0.62023 (0.61968)	Top-1 acc 58.984 (62.532)	Top-5 acc 80.859 (83.103)	lr 0.00922
Train [71][490/3239]	Time 0.229 (0.712)	Data Time 0.001 (0.177)	Loss 2.3700 (2.5451)	Entropy 0.62003 (0.61969)	Top-1 acc 68.359 (62.545)	Top-5 acc 83.203 (83.107)	lr 0.00922
Train [71][500/3239]	Time 0.272 (0.707)	Data Time 0.001 (0.174)	Loss 2.5475 (2.5443)	Entropy 0.62026 (0.61970)	Top-1 acc 60.938 (62.573)	Top-5 acc 82.812 (83.117)	lr 0.00922
Train [71][510/3239]	Time 0.269 (0.702)	Data Time 0.001 (0.170)	Loss 2.3763 (2.5443)	Entropy 0.62050 (0.61971)	Top-1 acc 65.234 (62.583)	Top-5 acc 84.766 (83.117)	lr 0.00922
Train [71][520/3239]	Time 0.268 (0.696)	Data Time 0.001 (0.167)	Loss 2.6860 (2.5442)	Entropy 0.62065 (0.61973)	Top-1 acc 58.203 (62.579)	Top-5 acc 81.250 (83.126)	lr 0.00921
Train [71][530/3239]	Time 0.322 (0.691)	Data Time 0.001 (0.164)	Loss 2.4390 (2.5446)	Entropy 0.62060 (0.61975)	Top-1 acc 67.188 (62.585)	Top-5 acc 84.766 (83.130)	lr 0.00921
Train [71][540/3239]	Time 0.231 (0.686)	Data Time 0.001 (0.161)	Loss 2.4829 (2.5449)	Entropy 0.62057 (0.61976)	Top-1 acc 64.844 (62.556)	Top-5 acc 84.766 (83.124)	lr 0.00921
Train [71][550/3239]	Time 0.253 (0.682)	Data Time 0.001 (0.158)	Loss 2.5851 (2.5447)	Entropy 0.62051 (0.61978)	Top-1 acc 61.719 (62.548)	Top-5 acc 81.250 (83.135)	lr 0.00921
Train [71][560/3239]	Time 0.289 (0.678)	Data Time 0.002 (0.155)	Loss 2.5799 (2.5451)	Entropy 0.62050 (0.61979)	Top-1 acc 60.156 (62.533)	Top-5 acc 80.469 (83.127)	lr 0.00921
Train [71][570/3239]	Time 0.261 (0.674)	Data Time 0.001 (0.153)	Loss 2.9538 (2.5462)	Entropy 0.62041 (0.61981)	Top-1 acc 54.297 (62.497)	Top-5 acc 76.172 (83.117)	lr 0.00921
Train [71][580/3239]	Time 0.236 (0.670)	Data Time 0.001 (0.150)	Loss 2.3003 (2.5462)	Entropy 0.62063 (0.61982)	Top-1 acc 69.531 (62.499)	Top-5 acc 88.672 (83.111)	lr 0.00921
Train [71][590/3239]	Time 0.260 (0.666)	Data Time 0.001 (0.148)	Loss 2.7345 (2.5461)	Entropy 0.62051 (0.61983)	Top-1 acc 57.812 (62.517)	Top-5 acc 80.859 (83.102)	lr 0.00921
Train [71][600/3239]	Time 0.319 (0.662)	Data Time 0.001 (0.145)	Loss 2.3605 (2.5466)	Entropy 0.62017 (0.61984)	Top-1 acc 70.312 (62.532)	Top-5 acc 85.156 (83.095)	lr 0.00921
Train [71][610/3239]	Time 0.236 (0.658)	Data Time 0.001 (0.143)	Loss 2.8104 (2.5473)	Entropy 0.62043 (0.61985)	Top-1 acc 55.859 (62.516)	Top-5 acc 79.297 (83.093)	lr 0.00921
Train [71][620/3239]	Time 0.233 (0.655)	Data Time 0.001 (0.141)	Loss 2.4196 (2.5467)	Entropy 0.62044 (0.61986)	Top-1 acc 66.406 (62.547)	Top-5 acc 87.891 (83.108)	lr 0.00920
Train [71][630/3239]	Time 0.236 (0.651)	Data Time 0.001 (0.138)	Loss 2.6742 (2.5466)	Entropy 0.62028 (0.61986)	Top-1 acc 55.859 (62.563)	Top-5 acc 80.469 (83.113)	lr 0.00920
Train [71][640/3239]	Time 0.248 (0.652)	Data Time 0.001 (0.141)	Loss 2.5237 (2.5460)	Entropy 0.61970 (0.61986)	Top-1 acc 61.328 (62.587)	Top-5 acc 81.641 (83.120)	lr 0.00920
Train [71][650/3239]	Time 0.279 (0.649)	Data Time 0.001 (0.139)	Loss 2.6913 (2.5465)	Entropy 0.61960 (0.61986)	Top-1 acc 58.203 (62.567)	Top-5 acc 79.688 (83.110)	lr 0.00920
Train [71][660/3239]	Time 0.228 (0.648)	Data Time 0.001 (0.139)	Loss 2.6540 (2.5457)	Entropy 0.61958 (0.61986)	Top-1 acc 59.375 (62.577)	Top-5 acc 82.812 (83.122)	lr 0.00920
Train [71][670/3239]	Time 0.227 (0.648)	Data Time 0.001 (0.140)	Loss 2.5520 (2.5457)	Entropy 0.61965 (0.61985)	Top-1 acc 60.547 (62.556)	Top-5 acc 83.203 (83.118)	lr 0.00920
Train [71][680/3239]	Time 0.272 (0.644)	Data Time 0.001 (0.138)	Loss 2.4153 (2.5450)	Entropy 0.61933 (0.61985)	Top-1 acc 64.453 (62.576)	Top-5 acc 86.328 (83.135)	lr 0.00920
Train [71][690/3239]	Time 0.301 (0.641)	Data Time 0.001 (0.136)	Loss 2.7071 (2.5457)	Entropy 0.61942 (0.61984)	Top-1 acc 60.938 (62.570)	Top-5 acc 83.203 (83.120)	lr 0.00920
Train [71][700/3239]	Time 0.249 (0.641)	Data Time 0.001 (0.136)	Loss 2.6051 (2.5462)	Entropy 0.61966 (0.61984)	Top-1 acc 64.062 (62.562)	Top-5 acc 82.422 (83.110)	lr 0.00920
Train [71][710/3239]	Time 0.225 (0.637)	Data Time 0.001 (0.134)	Loss 2.5412 (2.5455)	Entropy 0.61942 (0.61983)	Top-1 acc 63.672 (62.591)	Top-5 acc 82.031 (83.116)	lr 0.00920
Train [71][720/3239]	Time 0.243 (0.634)	Data Time 0.001 (0.133)	Loss 2.6059 (2.5471)	Entropy 0.61961 (0.61983)	Top-1 acc 58.984 (62.536)	Top-5 acc 83.203 (83.088)	lr 0.00919
Train [71][730/3239]	Time 0.232 (0.636)	Data Time 0.001 (0.135)	Loss 2.4382 (2.5475)	Entropy 0.61950 (0.61983)	Top-1 acc 63.281 (62.531)	Top-5 acc 85.547 (83.075)	lr 0.00919
Train [71][740/3239]	Time 0.241 (0.634)	Data Time 0.001 (0.134)	Loss 2.6766 (2.5486)	Entropy 0.61985 (0.61982)	Top-1 acc 57.422 (62.508)	Top-5 acc 80.859 (83.045)	lr 0.00919
Train [71][750/3239]	Time 0.250 (0.631)	Data Time 0.001 (0.132)	Loss 2.5472 (2.5485)	Entropy 0.61970 (0.61982)	Top-1 acc 64.062 (62.511)	Top-5 acc 83.594 (83.046)	lr 0.00919
Train [71][760/3239]	Time 0.358 (0.634)	Data Time 0.003 (0.135)	Loss 2.5796 (2.5478)	Entropy 0.61991 (0.61982)	Top-1 acc 59.375 (62.513)	Top-5 acc 82.031 (83.061)	lr 0.00919
Train [71][770/3239]	Time 0.247 (0.632)	Data Time 0.001 (0.134)	Loss 2.5356 (2.5475)	Entropy 0.61970 (0.61982)	Top-1 acc 62.500 (62.512)	Top-5 acc 85.156 (83.076)	lr 0.00919
Train [71][780/3239]	Time 0.245 (0.629)	Data Time 0.001 (0.132)	Loss 2.3357 (2.5470)	Entropy 0.61956 (0.61982)	Top-1 acc 71.875 (62.531)	Top-5 acc 87.109 (83.086)	lr 0.00919
Train [71][790/3239]	Time 0.253 (0.627)	Data Time 0.001 (0.130)	Loss 2.6606 (2.5472)	Entropy 0.61943 (0.61981)	Top-1 acc 58.594 (62.515)	Top-5 acc 81.641 (83.080)	lr 0.00919
Train [71][800/3239]	Time 0.241 (0.626)	Data Time 0.001 (0.130)	Loss 2.3827 (2.5470)	Entropy 0.61907 (0.61981)	Top-1 acc 64.844 (62.522)	Top-5 acc 85.156 (83.082)	lr 0.00919
Train [71][810/3239]	Time 0.247 (0.624)	Data Time 0.001 (0.129)	Loss 2.4718 (2.5471)	Entropy 0.61903 (0.61980)	Top-1 acc 63.672 (62.520)	Top-5 acc 83.984 (83.085)	lr 0.00919
Train [71][820/3239]	Time 0.239 (0.624)	Data Time 0.001 (0.129)	Loss 2.6352 (2.5474)	Entropy 0.61920 (0.61979)	Top-1 acc 63.672 (62.506)	Top-5 acc 82.422 (83.084)	lr 0.00918
Train [71][830/3239]	Time 0.332 (0.624)	Data Time 0.001 (0.130)	Loss 2.5849 (2.5470)	Entropy 0.61913 (0.61978)	Top-1 acc 61.719 (62.498)	Top-5 acc 82.031 (83.093)	lr 0.00918
Train [71][840/3239]	Time 0.243 (0.621)	Data Time 0.002 (0.129)	Loss 2.5377 (2.5468)	Entropy 0.61938 (0.61978)	Top-1 acc 62.891 (62.487)	Top-5 acc 82.422 (83.095)	lr 0.00918
Train [71][850/3239]	Time 0.312 (0.621)	Data Time 0.003 (0.128)	Loss 2.6093 (2.5468)	Entropy 0.61905 (0.61977)	Top-1 acc 60.156 (62.497)	Top-5 acc 82.422 (83.092)	lr 0.00918
Train [71][860/3239]	Time 0.231 (0.619)	Data Time 0.001 (0.127)	Loss 2.5390 (2.5465)	Entropy 0.61910 (0.61976)	Top-1 acc 62.891 (62.500)	Top-5 acc 84.766 (83.101)	lr 0.00918
Train [71][870/3239]	Time 0.244 (0.616)	Data Time 0.001 (0.125)	Loss 2.5837 (2.5473)	Entropy 0.61934 (0.61976)	Top-1 acc 62.109 (62.488)	Top-5 acc 82.422 (83.086)	lr 0.00918
Train [71][880/3239]	Time 0.255 (0.615)	Data Time 0.001 (0.124)	Loss 2.5081 (2.5474)	Entropy 0.61959 (0.61975)	Top-1 acc 63.281 (62.480)	Top-5 acc 84.375 (83.080)	lr 0.00918
Train [71][890/3239]	Time 0.274 (0.613)	Data Time 0.001 (0.123)	Loss 2.3677 (2.5473)	Entropy 0.61983 (0.61975)	Top-1 acc 70.312 (62.473)	Top-5 acc 86.719 (83.086)	lr 0.00918
Train [71][900/3239]	Time 0.244 (0.612)	Data Time 0.001 (0.121)	Loss 2.5379 (2.5474)	Entropy 0.61923 (0.61975)	Top-1 acc 59.375 (62.469)	Top-5 acc 86.719 (83.084)	lr 0.00918
Train [71][910/3239]	Time 0.370 (0.612)	Data Time 0.001 (0.120)	Loss 2.4725 (2.5482)	Entropy 0.61935 (0.61975)	Top-1 acc 65.625 (62.440)	Top-5 acc 84.375 (83.066)	lr 0.00918
Train [71][920/3239]	Time 0.316 (0.610)	Data Time 0.001 (0.119)	Loss 2.6974 (2.5491)	Entropy 0.61948 (0.61974)	Top-1 acc 60.156 (62.422)	Top-5 acc 80.078 (83.052)	lr 0.00918
Train [71][930/3239]	Time 0.226 (0.608)	Data Time 0.001 (0.117)	Loss 2.4341 (2.5481)	Entropy 0.61911 (0.61974)	Top-1 acc 68.750 (62.437)	Top-5 acc 85.547 (83.072)	lr 0.00917
Train [71][940/3239]	Time 0.265 (0.606)	Data Time 0.002 (0.116)	Loss 2.6076 (2.5483)	Entropy 0.61917 (0.61973)	Top-1 acc 61.719 (62.432)	Top-5 acc 80.078 (83.067)	lr 0.00917
Train [71][950/3239]	Time 0.250 (0.604)	Data Time 0.002 (0.115)	Loss 2.4719 (2.5479)	Entropy 0.61891 (0.61972)	Top-1 acc 64.062 (62.435)	Top-5 acc 83.984 (83.078)	lr 0.00917
Train [71][960/3239]	Time 0.233 (0.602)	Data Time 0.001 (0.114)	Loss 2.5663 (2.5469)	Entropy 0.61876 (0.61972)	Top-1 acc 65.234 (62.460)	Top-5 acc 82.812 (83.102)	lr 0.00917
Train [71][970/3239]	Time 0.248 (0.600)	Data Time 0.001 (0.113)	Loss 2.4595 (2.5465)	Entropy 0.61867 (0.61971)	Top-1 acc 63.672 (62.475)	Top-5 acc 85.156 (83.108)	lr 0.00917
Train [71][980/3239]	Time 0.266 (0.599)	Data Time 0.001 (0.112)	Loss 2.4911 (2.5464)	Entropy 0.61909 (0.61970)	Top-1 acc 63.672 (62.485)	Top-5 acc 82.422 (83.101)	lr 0.00917
Train [71][990/3239]	Time 0.351 (0.597)	Data Time 0.001 (0.110)	Loss 2.5639 (2.5464)	Entropy 0.61916 (0.61969)	Top-1 acc 62.500 (62.464)	Top-5 acc 81.250 (83.105)	lr 0.00917
Train [71][1000/3239]	Time 0.255 (0.596)	Data Time 0.002 (0.109)	Loss 2.5652 (2.5468)	Entropy 0.61911 (0.61969)	Top-1 acc 62.500 (62.457)	Top-5 acc 80.078 (83.097)	lr 0.00917
Train [71][1010/3239]	Time 0.275 (0.594)	Data Time 0.002 (0.108)	Loss 2.6185 (2.5466)	Entropy 0.61939 (0.61968)	Top-1 acc 60.938 (62.463)	Top-5 acc 78.906 (83.096)	lr 0.00917
Train [71][1020/3239]	Time 0.250 (0.593)	Data Time 0.001 (0.107)	Loss 2.4904 (2.5470)	Entropy 0.61939 (0.61968)	Top-1 acc 64.062 (62.453)	Top-5 acc 81.641 (83.090)	lr 0.00917
Train [71][1030/3239]	Time 0.230 (0.591)	Data Time 0.001 (0.106)	Loss 2.7976 (2.5466)	Entropy 0.61930 (0.61967)	Top-1 acc 57.812 (62.461)	Top-5 acc 79.688 (83.096)	lr 0.00916
Train [71][1040/3239]	Time 0.295 (0.590)	Data Time 0.002 (0.105)	Loss 2.6865 (2.5467)	Entropy 0.61928 (0.61967)	Top-1 acc 58.203 (62.460)	Top-5 acc 80.859 (83.091)	lr 0.00916
Train [71][1050/3239]	Time 0.255 (0.589)	Data Time 0.001 (0.104)	Loss 2.4615 (2.5468)	Entropy 0.61960 (0.61967)	Top-1 acc 66.016 (62.464)	Top-5 acc 83.594 (83.093)	lr 0.00916
Train [71][1060/3239]	Time 0.249 (0.587)	Data Time 0.001 (0.103)	Loss 2.5629 (2.5470)	Entropy 0.61967 (0.61967)	Top-1 acc 63.672 (62.466)	Top-5 acc 80.078 (83.087)	lr 0.00916
Train [71][1070/3239]	Time 0.235 (0.586)	Data Time 0.002 (0.102)	Loss 2.3328 (2.5475)	Entropy 0.61989 (0.61967)	Top-1 acc 68.359 (62.451)	Top-5 acc 88.281 (83.077)	lr 0.00916
Train [71][1080/3239]	Time 0.339 (0.585)	Data Time 0.001 (0.101)	Loss 2.5480 (2.5475)	Entropy 0.62003 (0.61967)	Top-1 acc 64.453 (62.456)	Top-5 acc 84.766 (83.082)	lr 0.00916
Train [71][1090/3239]	Time 0.254 (0.584)	Data Time 0.001 (0.101)	Loss 2.4630 (2.5472)	Entropy 0.62020 (0.61968)	Top-1 acc 66.016 (62.468)	Top-5 acc 83.594 (83.088)	lr 0.00916
Train [71][1100/3239]	Time 0.229 (0.582)	Data Time 0.001 (0.100)	Loss 2.8528 (2.5477)	Entropy 0.62026 (0.61968)	Top-1 acc 55.859 (62.460)	Top-5 acc 76.562 (83.077)	lr 0.00916
Train [71][1110/3239]	Time 0.289 (0.624)	Data Time 0.004 (0.099)	Loss 2.7923 (2.5476)	Entropy 0.62024 (0.61969)	Top-1 acc 58.203 (62.465)	Top-5 acc 77.734 (83.082)	lr 0.00916
Train [71][1120/3239]	Time 0.231 (0.622)	Data Time 0.002 (0.098)	Loss 2.3527 (2.5479)	Entropy 0.61999 (0.61969)	Top-1 acc 69.922 (62.462)	Top-5 acc 88.281 (83.070)	lr 0.00916
Train [71][1130/3239]	Time 0.254 (0.621)	Data Time 0.002 (0.097)	Loss 2.3527 (2.5479)	Entropy 0.62003 (0.61969)	Top-1 acc 66.016 (62.463)	Top-5 acc 87.109 (83.074)	lr 0.00915
Train [71][1140/3239]	Time 0.313 (0.619)	Data Time 0.002 (0.096)	Loss 2.5904 (2.5473)	Entropy 0.62002 (0.61970)	Top-1 acc 57.422 (62.473)	Top-5 acc 82.812 (83.088)	lr 0.00915
Train [71][1150/3239]	Time 0.384 (0.618)	Data Time 0.001 (0.095)	Loss 2.4749 (2.5470)	Entropy 0.62022 (0.61970)	Top-1 acc 59.766 (62.480)	Top-5 acc 83.984 (83.090)	lr 0.00915
Train [71][1160/3239]	Time 0.243 (0.617)	Data Time 0.001 (0.095)	Loss 2.4708 (2.5466)	Entropy 0.62041 (0.61971)	Top-1 acc 63.281 (62.495)	Top-5 acc 83.984 (83.093)	lr 0.00915
Train [71][1170/3239]	Time 0.273 (0.615)	Data Time 0.001 (0.094)	Loss 2.6965 (2.5469)	Entropy 0.62052 (0.61971)	Top-1 acc 59.766 (62.482)	Top-5 acc 81.250 (83.085)	lr 0.00915
Train [71][1180/3239]	Time 0.239 (0.614)	Data Time 0.001 (0.093)	Loss 2.5778 (2.5471)	Entropy 0.62076 (0.61972)	Top-1 acc 63.281 (62.483)	Top-5 acc 83.984 (83.078)	lr 0.00915
Train [71][1190/3239]	Time 0.232 (0.612)	Data Time 0.001 (0.092)	Loss 2.7068 (2.5474)	Entropy 0.62037 (0.61973)	Top-1 acc 58.984 (62.477)	Top-5 acc 78.125 (83.072)	lr 0.00915
Train [71][1200/3239]	Time 0.232 (0.611)	Data Time 0.001 (0.091)	Loss 2.6465 (2.5473)	Entropy 0.62017 (0.61973)	Top-1 acc 59.375 (62.479)	Top-5 acc 83.203 (83.079)	lr 0.00915
Train [71][1210/3239]	Time 0.264 (0.610)	Data Time 0.002 (0.091)	Loss 2.7143 (2.5471)	Entropy 0.62020 (0.61974)	Top-1 acc 61.719 (62.488)	Top-5 acc 82.031 (83.083)	lr 0.00915
Train [71][1220/3239]	Time 0.274 (0.608)	Data Time 0.001 (0.090)	Loss 2.5322 (2.5476)	Entropy 0.62052 (0.61974)	Top-1 acc 59.375 (62.470)	Top-5 acc 83.594 (83.076)	lr 0.00915
Train [71][1230/3239]	Time 0.289 (0.607)	Data Time 0.001 (0.089)	Loss 2.7397 (2.5479)	Entropy 0.62000 (0.61975)	Top-1 acc 57.422 (62.464)	Top-5 acc 76.953 (83.070)	lr 0.00914
Train [71][1240/3239]	Time 0.335 (0.606)	Data Time 0.001 (0.089)	Loss 2.6175 (2.5479)	Entropy 0.61984 (0.61975)	Top-1 acc 64.062 (62.468)	Top-5 acc 80.469 (83.066)	lr 0.00914
Train [71][1250/3239]	Time 0.238 (0.604)	Data Time 0.001 (0.088)	Loss 2.5941 (2.5482)	Entropy 0.61977 (0.61975)	Top-1 acc 64.062 (62.462)	Top-5 acc 79.688 (83.063)	lr 0.00914
Train [71][1260/3239]	Time 0.351 (0.603)	Data Time 0.002 (0.087)	Loss 2.4446 (2.5486)	Entropy 0.62009 (0.61975)	Top-1 acc 67.578 (62.442)	Top-5 acc 84.375 (83.055)	lr 0.00914
Train [71][1270/3239]	Time 0.243 (0.603)	Data Time 0.001 (0.087)	Loss 2.5015 (2.5487)	Entropy 0.62039 (0.61975)	Top-1 acc 64.844 (62.442)	Top-5 acc 83.203 (83.053)	lr 0.00914
Train [71][1280/3239]	Time 0.237 (0.601)	Data Time 0.001 (0.086)	Loss 2.4159 (2.5488)	Entropy 0.62022 (0.61976)	Top-1 acc 65.234 (62.448)	Top-5 acc 86.328 (83.050)	lr 0.00914
Train [71][1290/3239]	Time 0.275 (0.600)	Data Time 0.002 (0.085)	Loss 2.6242 (2.5487)	Entropy 0.62021 (0.61976)	Top-1 acc 60.156 (62.456)	Top-5 acc 81.641 (83.052)	lr 0.00914
Train [71][1300/3239]	Time 0.268 (0.599)	Data Time 0.002 (0.085)	Loss 2.4909 (2.5488)	Entropy 0.62014 (0.61976)	Top-1 acc 62.109 (62.455)	Top-5 acc 82.812 (83.051)	lr 0.00914
Train [71][1310/3239]	Time 0.351 (0.598)	Data Time 0.001 (0.084)	Loss 2.5408 (2.5486)	Entropy 0.62019 (0.61976)	Top-1 acc 60.156 (62.462)	Top-5 acc 84.375 (83.052)	lr 0.00914
Train [71][1320/3239]	Time 0.257 (0.596)	Data Time 0.001 (0.083)	Loss 2.4740 (2.5486)	Entropy 0.62024 (0.61977)	Top-1 acc 63.672 (62.460)	Top-5 acc 83.984 (83.057)	lr 0.00914
Train [71][1330/3239]	Time 0.284 (0.595)	Data Time 0.001 (0.083)	Loss 3.0839 (2.5492)	Entropy 0.62008 (0.61977)	Top-1 acc 53.125 (62.458)	Top-5 acc 72.266 (83.043)	lr 0.00914
Train [71][1340/3239]	Time 0.244 (0.594)	Data Time 0.001 (0.082)	Loss 2.6809 (2.5493)	Entropy 0.62022 (0.61977)	Top-1 acc 59.766 (62.461)	Top-5 acc 81.641 (83.046)	lr 0.00913
Train [71][1350/3239]	Time 0.289 (0.593)	Data Time 0.001 (0.082)	Loss 2.6885 (2.5498)	Entropy 0.62009 (0.61978)	Top-1 acc 58.203 (62.457)	Top-5 acc 79.688 (83.032)	lr 0.00913
Train [71][1360/3239]	Time 0.307 (0.593)	Data Time 0.001 (0.081)	Loss 2.6310 (2.5499)	Entropy 0.62020 (0.61978)	Top-1 acc 57.422 (62.451)	Top-5 acc 81.641 (83.028)	lr 0.00913
Train [71][1370/3239]	Time 0.260 (0.592)	Data Time 0.001 (0.080)	Loss 2.4333 (2.5496)	Entropy 0.62002 (0.61978)	Top-1 acc 66.797 (62.462)	Top-5 acc 83.594 (83.034)	lr 0.00913
Train [71][1380/3239]	Time 0.245 (0.591)	Data Time 0.001 (0.080)	Loss 2.6951 (2.5499)	Entropy 0.61975 (0.61978)	Top-1 acc 58.594 (62.449)	Top-5 acc 81.641 (83.032)	lr 0.00913
Train [71][1390/3239]	Time 0.315 (0.590)	Data Time 0.003 (0.079)	Loss 2.4393 (2.5497)	Entropy 0.61951 (0.61978)	Top-1 acc 66.016 (62.457)	Top-5 acc 87.500 (83.039)	lr 0.00913
Train [71][1400/3239]	Time 0.333 (0.589)	Data Time 0.001 (0.079)	Loss 2.6600 (2.5497)	Entropy 0.61999 (0.61978)	Top-1 acc 61.719 (62.460)	Top-5 acc 80.078 (83.032)	lr 0.00913
Train [71][1410/3239]	Time 0.290 (0.588)	Data Time 0.001 (0.078)	Loss 2.4903 (2.5504)	Entropy 0.62029 (0.61978)	Top-1 acc 60.547 (62.440)	Top-5 acc 85.156 (83.024)	lr 0.00913
Train [71][1420/3239]	Time 0.243 (0.587)	Data Time 0.001 (0.078)	Loss 2.7646 (2.5504)	Entropy 0.61990 (0.61979)	Top-1 acc 55.469 (62.427)	Top-5 acc 79.688 (83.025)	lr 0.00913
Train [71][1430/3239]	Time 0.256 (0.586)	Data Time 0.001 (0.077)	Loss 2.6267 (2.5506)	Entropy 0.62000 (0.61979)	Top-1 acc 60.547 (62.421)	Top-5 acc 79.688 (83.018)	lr 0.00913
Train [71][1440/3239]	Time 0.260 (0.585)	Data Time 0.002 (0.077)	Loss 2.6233 (2.5511)	Entropy 0.61996 (0.61979)	Top-1 acc 62.109 (62.406)	Top-5 acc 78.906 (83.007)	lr 0.00912
Train [71][1450/3239]	Time 0.245 (0.585)	Data Time 0.001 (0.076)	Loss 2.6205 (2.5515)	Entropy 0.61998 (0.61979)	Top-1 acc 59.375 (62.399)	Top-5 acc 83.203 (83.000)	lr 0.00912
Train [71][1460/3239]	Time 0.251 (0.584)	Data Time 0.001 (0.075)	Loss 2.4666 (2.5518)	Entropy 0.62026 (0.61979)	Top-1 acc 67.188 (62.395)	Top-5 acc 83.594 (82.999)	lr 0.00912
Train [71][1470/3239]	Time 0.363 (0.583)	Data Time 0.002 (0.075)	Loss 2.5174 (2.5519)	Entropy 0.62026 (0.61980)	Top-1 acc 65.234 (62.389)	Top-5 acc 84.375 (82.990)	lr 0.00912
Train [71][1480/3239]	Time 0.268 (0.582)	Data Time 0.001 (0.074)	Loss 2.5986 (2.5522)	Entropy 0.62022 (0.61980)	Top-1 acc 64.453 (62.386)	Top-5 acc 81.250 (82.982)	lr 0.00912
Train [71][1490/3239]	Time 0.252 (0.581)	Data Time 0.001 (0.074)	Loss 2.7653 (2.5525)	Entropy 0.62010 (0.61980)	Top-1 acc 58.984 (62.380)	Top-5 acc 82.031 (82.977)	lr 0.00912
Train [71][1500/3239]	Time 0.235 (0.581)	Data Time 0.002 (0.074)	Loss 2.3752 (2.5523)	Entropy 0.61959 (0.61980)	Top-1 acc 63.672 (62.382)	Top-5 acc 88.672 (82.980)	lr 0.00912
Train [71][1510/3239]	Time 0.238 (0.580)	Data Time 0.001 (0.074)	Loss 2.4550 (2.5521)	Entropy 0.61968 (0.61980)	Top-1 acc 64.453 (62.382)	Top-5 acc 83.984 (82.984)	lr 0.00912
Train [71][1520/3239]	Time 0.229 (0.580)	Data Time 0.001 (0.075)	Loss 2.4551 (2.5521)	Entropy 0.61993 (0.61980)	Top-1 acc 61.719 (62.386)	Top-5 acc 85.156 (82.983)	lr 0.00912
Train [71][1530/3239]	Time 0.254 (0.580)	Data Time 0.001 (0.076)	Loss 2.6822 (2.5522)	Entropy 0.61995 (0.61980)	Top-1 acc 57.812 (62.381)	Top-5 acc 82.812 (82.985)	lr 0.00912
Train [71][1540/3239]	Time 0.344 (0.580)	Data Time 0.001 (0.075)	Loss 2.4871 (2.5525)	Entropy 0.62006 (0.61980)	Top-1 acc 59.766 (62.364)	Top-5 acc 83.203 (82.981)	lr 0.00911
Train [71][1550/3239]	Time 0.249 (0.579)	Data Time 0.001 (0.075)	Loss 2.7167 (2.5525)	Entropy 0.62004 (0.61981)	Top-1 acc 58.984 (62.362)	Top-5 acc 80.078 (82.978)	lr 0.00911
Train [71][1560/3239]	Time 0.250 (0.581)	Data Time 0.002 (0.077)	Loss 2.6338 (2.5526)	Entropy 0.61992 (0.61981)	Top-1 acc 62.109 (62.362)	Top-5 acc 83.594 (82.978)	lr 0.00911
Train [71][1570/3239]	Time 0.277 (0.580)	Data Time 0.001 (0.076)	Loss 2.6598 (2.5528)	Entropy 0.61996 (0.61981)	Top-1 acc 64.062 (62.364)	Top-5 acc 79.297 (82.973)	lr 0.00911
Train [71][1580/3239]	Time 0.271 (0.579)	Data Time 0.001 (0.076)	Loss 2.6001 (2.5527)	Entropy 0.62006 (0.61981)	Top-1 acc 59.766 (62.363)	Top-5 acc 83.594 (82.973)	lr 0.00911
Train [71][1590/3239]	Time 0.252 (0.580)	Data Time 0.001 (0.077)	Loss 2.7473 (2.5527)	Entropy 0.62016 (0.61981)	Top-1 acc 54.297 (62.362)	Top-5 acc 78.906 (82.966)	lr 0.00911
Train [71][1600/3239]	Time 0.245 (0.579)	Data Time 0.001 (0.077)	Loss 2.4558 (2.5530)	Entropy 0.62009 (0.61981)	Top-1 acc 63.281 (62.358)	Top-5 acc 83.594 (82.965)	lr 0.00911
Train [71][1610/3239]	Time 0.265 (0.578)	Data Time 0.001 (0.076)	Loss 2.5779 (2.5532)	Entropy 0.62056 (0.61981)	Top-1 acc 61.328 (62.353)	Top-5 acc 82.422 (82.958)	lr 0.00911
Train [71][1620/3239]	Time 0.243 (0.580)	Data Time 0.001 (0.079)	Loss 2.5588 (2.5534)	Entropy 0.62037 (0.61982)	Top-1 acc 63.672 (62.351)	Top-5 acc 82.422 (82.954)	lr 0.00911
Train [71][1630/3239]	Time 0.383 (0.580)	Data Time 0.001 (0.078)	Loss 2.6643 (2.5534)	Entropy 0.62063 (0.61982)	Top-1 acc 61.719 (62.352)	Top-5 acc 79.688 (82.950)	lr 0.00911
Train [71][1640/3239]	Time 0.250 (0.579)	Data Time 0.002 (0.078)	Loss 2.6439 (2.5538)	Entropy 0.62046 (0.61983)	Top-1 acc 60.156 (62.342)	Top-5 acc 81.250 (82.939)	lr 0.00911
Train [71][1650/3239]	Time 0.269 (0.580)	Data Time 0.001 (0.079)	Loss 2.5267 (2.5537)	Entropy 0.62056 (0.61983)	Top-1 acc 64.844 (62.349)	Top-5 acc 81.250 (82.940)	lr 0.00910
Train [71][1660/3239]	Time 0.253 (0.580)	Data Time 0.001 (0.080)	Loss 2.6934 (2.5537)	Entropy 0.62034 (0.61983)	Top-1 acc 63.281 (62.349)	Top-5 acc 79.297 (82.937)	lr 0.00910
Train [71][1670/3239]	Time 0.282 (0.579)	Data Time 0.001 (0.079)	Loss 2.5432 (2.5533)	Entropy 0.62020 (0.61984)	Top-1 acc 64.062 (62.361)	Top-5 acc 82.031 (82.943)	lr 0.00910
Train [71][1680/3239]	Time 0.244 (0.578)	Data Time 0.001 (0.079)	Loss 2.5197 (2.5536)	Entropy 0.62042 (0.61984)	Top-1 acc 65.234 (62.355)	Top-5 acc 82.812 (82.936)	lr 0.00910
Train [71][1690/3239]	Time 0.249 (0.580)	Data Time 0.002 (0.080)	Loss 2.4363 (2.5539)	Entropy 0.62062 (0.61984)	Top-1 acc 61.719 (62.342)	Top-5 acc 86.719 (82.936)	lr 0.00910
Train [71][1700/3239]	Time 0.385 (0.579)	Data Time 0.001 (0.080)	Loss 2.7375 (2.5540)	Entropy 0.62031 (0.61985)	Top-1 acc 58.984 (62.336)	Top-5 acc 80.469 (82.936)	lr 0.00910
Train [71][1710/3239]	Time 0.258 (0.579)	Data Time 0.001 (0.079)	Loss 2.5695 (2.5537)	Entropy 0.62017 (0.61985)	Top-1 acc 61.719 (62.344)	Top-5 acc 84.766 (82.944)	lr 0.00910
Train [71][1720/3239]	Time 0.243 (0.580)	Data Time 0.002 (0.081)	Loss 2.6249 (2.5536)	Entropy 0.62025 (0.61985)	Top-1 acc 61.328 (62.345)	Top-5 acc 82.422 (82.947)	lr 0.00910
Train [71][1730/3239]	Time 0.273 (0.579)	Data Time 0.001 (0.081)	Loss 2.7871 (2.5537)	Entropy 0.62037 (0.61986)	Top-1 acc 56.641 (62.338)	Top-5 acc 77.344 (82.945)	lr 0.00910
Train [71][1740/3239]	Time 0.249 (0.579)	Data Time 0.001 (0.080)	Loss 2.6065 (2.5540)	Entropy 0.62025 (0.61986)	Top-1 acc 60.938 (62.334)	Top-5 acc 80.859 (82.936)	lr 0.00910
Train [71][1750/3239]	Time 0.295 (0.581)	Data Time 0.002 (0.083)	Loss 2.5174 (2.5539)	Entropy 0.61964 (0.61986)	Top-1 acc 63.672 (62.334)	Top-5 acc 83.594 (82.938)	lr 0.00909
Train [71][1760/3239]	Time 0.268 (0.580)	Data Time 0.001 (0.083)	Loss 2.4906 (2.5541)	Entropy 0.62012 (0.61986)	Top-1 acc 65.625 (62.331)	Top-5 acc 82.422 (82.929)	lr 0.00909
Train [71][1770/3239]	Time 0.295 (0.607)	Data Time 0.004 (0.082)	Loss 2.5345 (2.5539)	Entropy 0.62032 (0.61986)	Top-1 acc 61.328 (62.335)	Top-5 acc 84.766 (82.932)	lr 0.00909
Train [71][1780/3239]	Time 0.243 (0.606)	Data Time 0.002 (0.082)	Loss 2.6110 (2.5539)	Entropy 0.62031 (0.61986)	Top-1 acc 60.547 (62.337)	Top-5 acc 81.250 (82.932)	lr 0.00909
Train [71][1790/3239]	Time 0.364 (0.605)	Data Time 0.001 (0.081)	Loss 2.5509 (2.5537)	Entropy 0.62033 (0.61987)	Top-1 acc 62.891 (62.337)	Top-5 acc 82.031 (82.937)	lr 0.00909
Train [71][1800/3239]	Time 0.283 (0.604)	Data Time 0.002 (0.081)	Loss 2.4734 (2.5538)	Entropy 0.62073 (0.61987)	Top-1 acc 65.234 (62.338)	Top-5 acc 83.594 (82.936)	lr 0.00909
Train [71][1810/3239]	Time 0.262 (0.603)	Data Time 0.001 (0.080)	Loss 2.2962 (2.5536)	Entropy 0.62089 (0.61987)	Top-1 acc 68.750 (62.341)	Top-5 acc 85.938 (82.939)	lr 0.00909
Train [71][1820/3239]	Time 0.261 (0.603)	Data Time 0.001 (0.080)	Loss 2.4542 (2.5534)	Entropy 0.62144 (0.61988)	Top-1 acc 63.672 (62.350)	Top-5 acc 84.375 (82.941)	lr 0.00909
Train [71][1830/3239]	Time 0.305 (0.602)	Data Time 0.002 (0.079)	Loss 2.4815 (2.5528)	Entropy 0.62086 (0.61989)	Top-1 acc 64.062 (62.364)	Top-5 acc 83.203 (82.953)	lr 0.00909
Train [71][1840/3239]	Time 0.253 (0.602)	Data Time 0.001 (0.079)	Loss 3.0731 (2.5533)	Entropy 0.62086 (0.61989)	Top-1 acc 50.391 (62.354)	Top-5 acc 74.609 (82.950)	lr 0.00909
Train [71][1850/3239]	Time 0.311 (0.601)	Data Time 0.003 (0.079)	Loss 2.4312 (2.5533)	Entropy 0.62093 (0.61990)	Top-1 acc 69.531 (62.356)	Top-5 acc 86.328 (82.948)	lr 0.00908
Train [71][1860/3239]	Time 0.349 (0.600)	Data Time 0.002 (0.078)	Loss 2.6866 (2.5535)	Entropy 0.62095 (0.61990)	Top-1 acc 60.938 (62.354)	Top-5 acc 81.250 (82.946)	lr 0.00908
Train [71][1870/3239]	Time 0.268 (0.599)	Data Time 0.002 (0.078)	Loss 2.5821 (2.5538)	Entropy 0.62079 (0.61991)	Top-1 acc 62.109 (62.351)	Top-5 acc 82.812 (82.946)	lr 0.00908
Train [71][1880/3239]	Time 0.257 (0.599)	Data Time 0.002 (0.077)	Loss 2.3656 (2.5536)	Entropy 0.62088 (0.61991)	Top-1 acc 69.141 (62.350)	Top-5 acc 85.547 (82.948)	lr 0.00908
Train [71][1890/3239]	Time 0.259 (0.598)	Data Time 0.002 (0.077)	Loss 2.5493 (2.5535)	Entropy 0.62069 (0.61992)	Top-1 acc 59.375 (62.348)	Top-5 acc 82.031 (82.949)	lr 0.00908
Train [71][1900/3239]	Time 0.259 (0.598)	Data Time 0.001 (0.077)	Loss 3.0156 (2.5539)	Entropy 0.62041 (0.61992)	Top-1 acc 49.219 (62.337)	Top-5 acc 74.609 (82.945)	lr 0.00908
Train [71][1910/3239]	Time 0.242 (0.597)	Data Time 0.001 (0.076)	Loss 2.4306 (2.5535)	Entropy 0.62019 (0.61992)	Top-1 acc 66.797 (62.346)	Top-5 acc 87.891 (82.950)	lr 0.00908
Train [71][1920/3239]	Time 0.296 (0.596)	Data Time 0.001 (0.076)	Loss 2.6290 (2.5535)	Entropy 0.62035 (0.61993)	Top-1 acc 57.422 (62.350)	Top-5 acc 82.812 (82.951)	lr 0.00908
Train [71][1930/3239]	Time 0.283 (0.596)	Data Time 0.001 (0.075)	Loss 2.5559 (2.5534)	Entropy 0.62003 (0.61993)	Top-1 acc 62.500 (62.359)	Top-5 acc 80.859 (82.949)	lr 0.00908
Train [71][1940/3239]	Time 0.249 (0.595)	Data Time 0.001 (0.075)	Loss 2.4817 (2.5534)	Entropy 0.62032 (0.61993)	Top-1 acc 62.500 (62.360)	Top-5 acc 85.547 (82.947)	lr 0.00908
Train [71][1950/3239]	Time 0.348 (0.594)	Data Time 0.001 (0.075)	Loss 2.6155 (2.5533)	Entropy 0.62008 (0.61993)	Top-1 acc 60.547 (62.365)	Top-5 acc 82.422 (82.950)	lr 0.00907
Train [71][1960/3239]	Time 0.274 (0.596)	Data Time 0.001 (0.076)	Loss 2.5934 (2.5531)	Entropy 0.62030 (0.61993)	Top-1 acc 60.547 (62.365)	Top-5 acc 83.203 (82.954)	lr 0.00907
Train [71][1970/3239]	Time 0.249 (0.595)	Data Time 0.002 (0.076)	Loss 2.5576 (2.5533)	Entropy 0.62043 (0.61993)	Top-1 acc 62.109 (62.363)	Top-5 acc 83.203 (82.951)	lr 0.00907
Train [71][1980/3239]	Time 0.275 (0.594)	Data Time 0.002 (0.076)	Loss 2.6673 (2.5536)	Entropy 0.62060 (0.61994)	Top-1 acc 60.156 (62.353)	Top-5 acc 80.859 (82.948)	lr 0.00907
Train [71][1990/3239]	Time 0.244 (0.595)	Data Time 0.001 (0.077)	Loss 2.3512 (2.5535)	Entropy 0.62047 (0.61994)	Top-1 acc 66.406 (62.359)	Top-5 acc 83.984 (82.942)	lr 0.00907
Train [71][2000/3239]	Time 0.235 (0.594)	Data Time 0.001 (0.076)	Loss 2.6038 (2.5538)	Entropy 0.62077 (0.61994)	Top-1 acc 62.500 (62.352)	Top-5 acc 82.031 (82.938)	lr 0.00907
Train [71][2010/3239]	Time 0.271 (0.594)	Data Time 0.001 (0.077)	Loss 2.4227 (2.5538)	Entropy 0.62084 (0.61995)	Top-1 acc 64.453 (62.351)	Top-5 acc 87.109 (82.935)	lr 0.00907
Train [71][2020/3239]	Time 1.361 (0.595)	Data Time 0.995 (0.078)	Loss 2.6083 (2.5536)	Entropy 0.62104 (0.61995)	Top-1 acc 59.766 (62.358)	Top-5 acc 82.812 (82.938)	lr 0.00907
Train [71][2030/3239]	Time 0.264 (0.594)	Data Time 0.001 (0.077)	Loss 2.6878 (2.5541)	Entropy 0.62113 (0.61996)	Top-1 acc 61.719 (62.354)	Top-5 acc 79.297 (82.931)	lr 0.00907
Train [71][2040/3239]	Time 0.279 (0.595)	Data Time 0.001 (0.078)	Loss 2.7489 (2.5542)	Entropy 0.62106 (0.61996)	Top-1 acc 60.938 (62.354)	Top-5 acc 78.906 (82.931)	lr 0.00907
Train [71][2050/3239]	Time 0.308 (0.596)	Data Time 0.001 (0.079)	Loss 2.6387 (2.5541)	Entropy 0.62075 (0.61997)	Top-1 acc 56.250 (62.350)	Top-5 acc 82.422 (82.935)	lr 0.00907
Train [71][2060/3239]	Time 0.254 (0.595)	Data Time 0.001 (0.079)	Loss 2.5904 (2.5544)	Entropy 0.62068 (0.61997)	Top-1 acc 61.328 (62.344)	Top-5 acc 81.641 (82.927)	lr 0.00906
Train [71][2070/3239]	Time 0.262 (0.595)	Data Time 0.002 (0.079)	Loss 2.3272 (2.5542)	Entropy 0.62035 (0.61997)	Top-1 acc 67.578 (62.352)	Top-5 acc 89.844 (82.933)	lr 0.00906
Train [71][2080/3239]	Time 0.322 (0.597)	Data Time 0.001 (0.081)	Loss 2.5591 (2.5544)	Entropy 0.61989 (0.61997)	Top-1 acc 62.500 (62.351)	Top-5 acc 80.859 (82.929)	lr 0.00906
Train [71][2090/3239]	Time 0.244 (0.596)	Data Time 0.001 (0.081)	Loss 2.5398 (2.5542)	Entropy 0.61982 (0.61997)	Top-1 acc 60.938 (62.357)	Top-5 acc 83.203 (82.935)	lr 0.00906
Train [71][2100/3239]	Time 0.236 (0.596)	Data Time 0.001 (0.081)	Loss 2.5289 (2.5540)	Entropy 0.61998 (0.61997)	Top-1 acc 62.109 (62.362)	Top-5 acc 84.766 (82.936)	lr 0.00906
Train [71][2110/3239]	Time 0.237 (0.597)	Data Time 0.002 (0.082)	Loss 2.7603 (2.5542)	Entropy 0.62004 (0.61997)	Top-1 acc 58.203 (62.362)	Top-5 acc 77.344 (82.928)	lr 0.00906
Train [71][2120/3239]	Time 0.243 (0.596)	Data Time 0.001 (0.082)	Loss 2.5532 (2.5541)	Entropy 0.61996 (0.61997)	Top-1 acc 61.719 (62.361)	Top-5 acc 82.422 (82.931)	lr 0.00906
Train [71][2130/3239]	Time 0.253 (0.596)	Data Time 0.001 (0.082)	Loss 2.5645 (2.5540)	Entropy 0.62005 (0.61997)	Top-1 acc 63.672 (62.363)	Top-5 acc 83.594 (82.931)	lr 0.00906
Train [71][2140/3239]	Time 0.253 (0.598)	Data Time 0.001 (0.084)	Loss 2.8487 (2.5543)	Entropy 0.62010 (0.61997)	Top-1 acc 56.641 (62.359)	Top-5 acc 76.172 (82.928)	lr 0.00906
Train [71][2150/3239]	Time 0.243 (0.597)	Data Time 0.002 (0.084)	Loss 2.4089 (2.5543)	Entropy 0.62031 (0.61997)	Top-1 acc 65.234 (62.362)	Top-5 acc 85.156 (82.927)	lr 0.00906
Train [71][2160/3239]	Time 0.298 (0.597)	Data Time 0.001 (0.083)	Loss 2.5584 (2.5546)	Entropy 0.62005 (0.61998)	Top-1 acc 60.938 (62.352)	Top-5 acc 82.812 (82.919)	lr 0.00905
Train [71][2170/3239]	Time 0.244 (0.598)	Data Time 0.001 (0.085)	Loss 2.9066 (2.5551)	Entropy 0.62005 (0.61998)	Top-1 acc 53.516 (62.338)	Top-5 acc 78.516 (82.913)	lr 0.00905
Train [71][2180/3239]	Time 0.357 (0.597)	Data Time 0.001 (0.085)	Loss 2.5389 (2.5551)	Entropy 0.62023 (0.61998)	Top-1 acc 60.156 (62.336)	Top-5 acc 83.984 (82.913)	lr 0.00905
Train [71][2190/3239]	Time 0.267 (0.597)	Data Time 0.002 (0.085)	Loss 2.7228 (2.5555)	Entropy 0.62024 (0.61998)	Top-1 acc 57.812 (62.330)	Top-5 acc 80.469 (82.905)	lr 0.00905
Train [71][2200/3239]	Time 0.245 (0.599)	Data Time 0.001 (0.087)	Loss 2.6536 (2.5559)	Entropy 0.62002 (0.61998)	Top-1 acc 62.891 (62.321)	Top-5 acc 81.250 (82.896)	lr 0.00905
Train [71][2210/3239]	Time 0.249 (0.598)	Data Time 0.001 (0.087)	Loss 2.7059 (2.5561)	Entropy 0.61997 (0.61998)	Top-1 acc 57.422 (62.318)	Top-5 acc 80.859 (82.894)	lr 0.00905
Train [71][2220/3239]	Time 0.241 (0.597)	Data Time 0.001 (0.086)	Loss 2.5800 (2.5560)	Entropy 0.62015 (0.61998)	Top-1 acc 60.938 (62.324)	Top-5 acc 83.203 (82.896)	lr 0.00905
Train [71][2230/3239]	Time 0.263 (0.597)	Data Time 0.001 (0.086)	Loss 2.5348 (2.5559)	Entropy 0.61998 (0.61998)	Top-1 acc 62.109 (62.325)	Top-5 acc 83.203 (82.896)	lr 0.00905
Train [71][2240/3239]	Time 0.280 (0.597)	Data Time 0.002 (0.087)	Loss 2.3624 (2.5558)	Entropy 0.61995 (0.61998)	Top-1 acc 67.578 (62.326)	Top-5 acc 87.500 (82.897)	lr 0.00905
Train [71][2250/3239]	Time 0.332 (0.597)	Data Time 0.001 (0.086)	Loss 2.4611 (2.5558)	Entropy 0.61944 (0.61998)	Top-1 acc 64.062 (62.324)	Top-5 acc 85.938 (82.897)	lr 0.00905
Train [71][2260/3239]	Time 0.232 (0.596)	Data Time 0.001 (0.086)	Loss 2.4265 (2.5558)	Entropy 0.61953 (0.61998)	Top-1 acc 65.625 (62.324)	Top-5 acc 86.719 (82.896)	lr 0.00904
Train [71][2270/3239]	Time 0.258 (0.597)	Data Time 0.001 (0.087)	Loss 2.6242 (2.5556)	Entropy 0.61915 (0.61997)	Top-1 acc 60.156 (62.327)	Top-5 acc 82.031 (82.899)	lr 0.00904
Train [71][2280/3239]	Time 0.265 (0.596)	Data Time 0.002 (0.087)	Loss 2.8458 (2.5559)	Entropy 0.61909 (0.61997)	Top-1 acc 56.250 (62.325)	Top-5 acc 78.125 (82.891)	lr 0.00904
Train [71][2290/3239]	Time 0.281 (0.596)	Data Time 0.001 (0.087)	Loss 2.5815 (2.5563)	Entropy 0.61857 (0.61997)	Top-1 acc 63.672 (62.318)	Top-5 acc 85.547 (82.886)	lr 0.00904
Train [71][2300/3239]	Time 0.223 (0.598)	Data Time 0.001 (0.089)	Loss 2.7266 (2.5566)	Entropy 0.61879 (0.61996)	Top-1 acc 54.688 (62.306)	Top-5 acc 81.250 (82.883)	lr 0.00904
Train [71][2310/3239]	Time 0.281 (0.597)	Data Time 0.001 (0.089)	Loss 2.6467 (2.5567)	Entropy 0.61883 (0.61995)	Top-1 acc 63.281 (62.306)	Top-5 acc 80.859 (82.880)	lr 0.00904
Train [71][2320/3239]	Time 1.241 (0.597)	Data Time 1.000 (0.089)	Loss 2.5712 (2.5570)	Entropy 0.61889 (0.61995)	Top-1 acc 63.281 (62.297)	Top-5 acc 80.469 (82.876)	lr 0.00904
Train [71][2330/3239]	Time 0.232 (0.599)	Data Time 0.001 (0.091)	Loss 2.4337 (2.5569)	Entropy 0.61896 (0.61995)	Top-1 acc 67.578 (62.294)	Top-5 acc 85.156 (82.879)	lr 0.00904
Train [71][2340/3239]	Time 0.385 (0.598)	Data Time 0.001 (0.091)	Loss 2.6182 (2.5571)	Entropy 0.61893 (0.61994)	Top-1 acc 61.719 (62.288)	Top-5 acc 81.250 (82.877)	lr 0.00904
Train [71][2350/3239]	Time 0.250 (0.598)	Data Time 0.001 (0.090)	Loss 2.6149 (2.5572)	Entropy 0.61894 (0.61994)	Top-1 acc 60.547 (62.286)	Top-5 acc 81.641 (82.875)	lr 0.00904
Train [71][2360/3239]	Time 0.246 (0.601)	Data Time 0.001 (0.094)	Loss 2.7633 (2.5572)	Entropy 0.61881 (0.61993)	Top-1 acc 56.641 (62.286)	Top-5 acc 77.734 (82.874)	lr 0.00904
Train [71][2370/3239]	Time 0.235 (0.602)	Data Time 0.001 (0.096)	Loss 2.4131 (2.5569)	Entropy 0.61850 (0.61993)	Top-1 acc 67.188 (62.291)	Top-5 acc 86.328 (82.881)	lr 0.00903
Train [71][2380/3239]	Time 0.245 (0.601)	Data Time 0.001 (0.095)	Loss 2.6017 (2.5571)	Entropy 0.61821 (0.61992)	Top-1 acc 63.672 (62.282)	Top-5 acc 80.078 (82.873)	lr 0.00903
Train [71][2390/3239]	Time 0.260 (0.604)	Data Time 0.001 (0.098)	Loss 2.5511 (2.5572)	Entropy 0.61840 (0.61991)	Top-1 acc 59.766 (62.284)	Top-5 acc 81.641 (82.870)	lr 0.00903
Train [71][2400/3239]	Time 0.242 (0.605)	Data Time 0.001 (0.100)	Loss 2.8407 (2.5574)	Entropy 0.61815 (0.61991)	Top-1 acc 57.031 (62.280)	Top-5 acc 77.734 (82.869)	lr 0.00903
Train [71][2410/3239]	Time 0.333 (0.605)	Data Time 0.002 (0.099)	Loss 2.4102 (2.5574)	Entropy 0.61806 (0.61990)	Top-1 acc 68.359 (62.285)	Top-5 acc 85.938 (82.867)	lr 0.00903
Train [71][2420/3239]	Time 0.334 (0.626)	Data Time 0.006 (0.101)	Loss 2.6536 (2.5575)	Entropy 0.61802 (0.61989)	Top-1 acc 61.328 (62.281)	Top-5 acc 82.422 (82.867)	lr 0.00903
Train [71][2430/3239]	Time 0.251 (0.625)	Data Time 0.002 (0.100)	Loss 2.4861 (2.5575)	Entropy 0.61761 (0.61988)	Top-1 acc 61.328 (62.278)	Top-5 acc 83.594 (82.866)	lr 0.00903
Train [71][2440/3239]	Time 0.240 (0.625)	Data Time 0.001 (0.100)	Loss 2.4877 (2.5575)	Entropy 0.61766 (0.61987)	Top-1 acc 62.500 (62.278)	Top-5 acc 85.547 (82.865)	lr 0.00903
Train [71][2450/3239]	Time 0.265 (0.624)	Data Time 0.002 (0.100)	Loss 2.8644 (2.5576)	Entropy 0.61786 (0.61987)	Top-1 acc 55.078 (62.276)	Top-5 acc 78.906 (82.865)	lr 0.00903
Train [71][2460/3239]	Time 0.252 (0.623)	Data Time 0.002 (0.099)	Loss 2.4336 (2.5574)	Entropy 0.61786 (0.61986)	Top-1 acc 65.234 (62.279)	Top-5 acc 86.328 (82.870)	lr 0.00903
Train [71][2470/3239]	Time 0.282 (0.623)	Data Time 0.002 (0.099)	Loss 2.4520 (2.5572)	Entropy 0.61790 (0.61985)	Top-1 acc 62.109 (62.282)	Top-5 acc 83.984 (82.872)	lr 0.00902
Train [71][2480/3239]	Time 0.265 (0.622)	Data Time 0.001 (0.098)	Loss 2.6135 (2.5572)	Entropy 0.61789 (0.61984)	Top-1 acc 58.984 (62.279)	Top-5 acc 80.859 (82.872)	lr 0.00902
Train [71][2490/3239]	Time 0.258 (0.623)	Data Time 0.001 (0.100)	Loss 2.4068 (2.5571)	Entropy 0.61804 (0.61983)	Top-1 acc 68.359 (62.283)	Top-5 acc 87.891 (82.879)	lr 0.00902
Train [71][2500/3239]	Time 0.353 (0.623)	Data Time 0.001 (0.099)	Loss 2.5670 (2.5573)	Entropy 0.61804 (0.61983)	Top-1 acc 58.984 (62.279)	Top-5 acc 82.422 (82.872)	lr 0.00902
Train [71][2510/3239]	Time 0.247 (0.622)	Data Time 0.001 (0.099)	Loss 2.5171 (2.5574)	Entropy 0.61819 (0.61982)	Top-1 acc 64.453 (62.276)	Top-5 acc 81.641 (82.870)	lr 0.00902
Train [71][2520/3239]	Time 0.256 (0.630)	Data Time 0.001 (0.108)	Loss 2.5587 (2.5573)	Entropy 0.61816 (0.61981)	Top-1 acc 64.453 (62.282)	Top-5 acc 82.422 (82.872)	lr 0.00902
Train [71][2530/3239]	Time 0.252 (0.630)	Data Time 0.001 (0.108)	Loss 2.5327 (2.5575)	Entropy 0.61819 (0.61981)	Top-1 acc 59.766 (62.278)	Top-5 acc 83.203 (82.869)	lr 0.00902
Train [71][2540/3239]	Time 0.254 (0.629)	Data Time 0.002 (0.107)	Loss 2.5831 (2.5579)	Entropy 0.61826 (0.61980)	Top-1 acc 62.500 (62.273)	Top-5 acc 81.641 (82.860)	lr 0.00902
Train [71][2550/3239]	Time 0.246 (0.638)	Data Time 0.001 (0.117)	Loss 2.5361 (2.5581)	Entropy 0.61830 (0.61979)	Top-1 acc 62.891 (62.271)	Top-5 acc 83.203 (82.852)	lr 0.00902
Train [71][2560/3239]	Time 0.251 (0.637)	Data Time 0.001 (0.116)	Loss 2.4734 (2.5581)	Entropy 0.61822 (0.61979)	Top-1 acc 65.625 (62.272)	Top-5 acc 83.984 (82.854)	lr 0.00902
Train [71][2570/3239]	Time 0.368 (0.637)	Data Time 0.002 (0.116)	Loss 2.6419 (2.5580)	Entropy 0.61847 (0.61978)	Top-1 acc 60.547 (62.273)	Top-5 acc 80.078 (82.854)	lr 0.00901
Train [71][2580/3239]	Time 5.793 (0.640)	Data Time 5.524 (0.119)	Loss 2.3974 (2.5581)	Entropy 0.61831 (0.61978)	Top-1 acc 67.969 (62.274)	Top-5 acc 86.328 (82.852)	lr 0.00901
Train [71][2590/3239]	Time 0.278 (0.646)	Data Time 0.002 (0.125)	Loss 2.4855 (2.5582)	Entropy 0.61849 (0.61977)	Top-1 acc 65.234 (62.273)	Top-5 acc 83.984 (82.852)	lr 0.00901
Train [71][2600/3239]	Time 0.225 (0.645)	Data Time 0.001 (0.125)	Loss 2.5576 (2.5582)	Entropy 0.61849 (0.61977)	Top-1 acc 58.984 (62.274)	Top-5 acc 83.594 (82.854)	lr 0.00901
Train [71][2610/3239]	Time 0.259 (0.645)	Data Time 0.001 (0.125)	Loss 2.4712 (2.5582)	Entropy 0.61878 (0.61976)	Top-1 acc 65.234 (62.275)	Top-5 acc 83.984 (82.854)	lr 0.00901
Train [71][2620/3239]	Time 0.245 (0.653)	Data Time 0.001 (0.133)	Loss 2.4256 (2.5583)	Entropy 0.61858 (0.61976)	Top-1 acc 67.578 (62.276)	Top-5 acc 83.594 (82.849)	lr 0.00901
Train [71][2630/3239]	Time 0.236 (0.652)	Data Time 0.001 (0.133)	Loss 2.5880 (2.5584)	Entropy 0.61880 (0.61975)	Top-1 acc 61.719 (62.279)	Top-5 acc 81.641 (82.847)	lr 0.00901
Train [71][2640/3239]	Time 0.237 (0.652)	Data Time 0.001 (0.133)	Loss 2.6152 (2.5582)	Entropy 0.61878 (0.61975)	Top-1 acc 64.062 (62.290)	Top-5 acc 82.422 (82.849)	lr 0.00901
Train [71][2650/3239]	Time 0.218 (0.659)	Data Time 0.001 (0.141)	Loss 2.6098 (2.5584)	Entropy 0.61880 (0.61975)	Top-1 acc 63.281 (62.288)	Top-5 acc 81.250 (82.844)	lr 0.00901
Train [71][2660/3239]	Time 0.277 (0.658)	Data Time 0.001 (0.140)	Loss 2.5660 (2.5584)	Entropy 0.61880 (0.61974)	Top-1 acc 62.500 (62.290)	Top-5 acc 83.203 (82.846)	lr 0.00901
Train [71][2670/3239]	Time 2.102 (0.659)	Data Time 1.856 (0.142)	Loss 2.4100 (2.5584)	Entropy 0.61881 (0.61974)	Top-1 acc 64.062 (62.285)	Top-5 acc 85.156 (82.848)	lr 0.00901
Train [71][2680/3239]	Time 0.240 (0.666)	Data Time 0.001 (0.149)	Loss 2.5504 (2.5585)	Entropy 0.61847 (0.61974)	Top-1 acc 64.062 (62.283)	Top-5 acc 83.984 (82.847)	lr 0.00900
Train [71][2690/3239]	Time 0.229 (0.665)	Data Time 0.001 (0.148)	Loss 2.4088 (2.5584)	Entropy 0.61883 (0.61973)	Top-1 acc 64.453 (62.289)	Top-5 acc 87.891 (82.847)	lr 0.00900
Train [71][2700/3239]	Time 0.249 (0.666)	Data Time 0.001 (0.150)	Loss 2.5744 (2.5586)	Entropy 0.61888 (0.61973)	Top-1 acc 63.281 (62.285)	Top-5 acc 82.812 (82.845)	lr 0.00900
Train [71][2710/3239]	Time 0.241 (0.673)	Data Time 0.001 (0.158)	Loss 2.4202 (2.5585)	Entropy 0.61887 (0.61973)	Top-1 acc 67.578 (62.285)	Top-5 acc 87.891 (82.848)	lr 0.00900
Train [71][2720/3239]	Time 0.231 (0.673)	Data Time 0.001 (0.157)	Loss 2.5009 (2.5583)	Entropy 0.61910 (0.61972)	Top-1 acc 64.062 (62.288)	Top-5 acc 84.375 (82.852)	lr 0.00900
Train [71][2730/3239]	Time 0.329 (0.673)	Data Time 0.001 (0.158)	Loss 2.4034 (2.5584)	Entropy 0.61856 (0.61972)	Top-1 acc 67.578 (62.287)	Top-5 acc 87.109 (82.850)	lr 0.00900
Train [71][2740/3239]	Time 3.811 (0.674)	Data Time 3.547 (0.159)	Loss 2.5606 (2.5583)	Entropy 0.61890 (0.61972)	Top-1 acc 60.547 (62.290)	Top-5 acc 80.859 (82.852)	lr 0.00900
Train [71][2750/3239]	Time 0.228 (0.680)	Data Time 0.001 (0.166)	Loss 2.6464 (2.5583)	Entropy 0.61890 (0.61971)	Top-1 acc 61.719 (62.292)	Top-5 acc 82.812 (82.853)	lr 0.00900
Train [71][2760/3239]	Time 0.230 (0.680)	Data Time 0.001 (0.166)	Loss 2.5471 (2.5585)	Entropy 0.61913 (0.61971)	Top-1 acc 58.984 (62.283)	Top-5 acc 84.375 (82.847)	lr 0.00900
Train [71][2770/3239]	Time 0.250 (0.679)	Data Time 0.001 (0.165)	Loss 2.4723 (2.5585)	Entropy 0.61914 (0.61971)	Top-1 acc 65.625 (62.286)	Top-5 acc 81.250 (82.845)	lr 0.00900
Train [71][2780/3239]	Time 0.252 (0.688)	Data Time 0.001 (0.174)	Loss 2.5359 (2.5581)	Entropy 0.61940 (0.61971)	Top-1 acc 61.719 (62.297)	Top-5 acc 82.422 (82.852)	lr 0.00899
Train [71][2790/3239]	Time 3.556 (0.688)	Data Time 3.297 (0.175)	Loss 2.6574 (2.5582)	Entropy 0.61922 (0.61970)	Top-1 acc 60.156 (62.291)	Top-5 acc 79.297 (82.849)	lr 0.00899
Train [71][2800/3239]	Time 0.351 (0.687)	Data Time 0.001 (0.175)	Loss 2.4767 (2.5581)	Entropy 0.61863 (0.61970)	Top-1 acc 62.500 (62.296)	Top-5 acc 85.938 (82.852)	lr 0.00899
Train [71][2810/3239]	Time 0.237 (0.696)	Data Time 0.001 (0.183)	Loss 2.6311 (2.5583)	Entropy 0.61864 (0.61970)	Top-1 acc 61.328 (62.293)	Top-5 acc 78.906 (82.846)	lr 0.00899
Train [71][2820/3239]	Time 0.303 (0.695)	Data Time 0.002 (0.183)	Loss 2.4708 (2.5582)	Entropy 0.61897 (0.61969)	Top-1 acc 64.062 (62.298)	Top-5 acc 84.375 (82.848)	lr 0.00899
Train [71][2830/3239]	Time 0.230 (0.694)	Data Time 0.001 (0.182)	Loss 2.6240 (2.5581)	Entropy 0.61875 (0.61969)	Top-1 acc 60.156 (62.300)	Top-5 acc 79.688 (82.850)	lr 0.00899
Train [71][2840/3239]	Time 0.254 (0.703)	Data Time 0.001 (0.192)	Loss 2.6519 (2.5582)	Entropy 0.61904 (0.61969)	Top-1 acc 61.328 (62.300)	Top-5 acc 81.250 (82.848)	lr 0.00899
Train [71][2850/3239]	Time 0.244 (0.702)	Data Time 0.001 (0.191)	Loss 2.5706 (2.5582)	Entropy 0.61896 (0.61969)	Top-1 acc 63.672 (62.299)	Top-5 acc 82.031 (82.847)	lr 0.00899
Train [71][2860/3239]	Time 0.244 (0.702)	Data Time 0.001 (0.191)	Loss 2.6482 (2.5583)	Entropy 0.61863 (0.61968)	Top-1 acc 60.938 (62.299)	Top-5 acc 84.375 (82.849)	lr 0.00899
Train [71][2870/3239]	Time 0.250 (0.711)	Data Time 0.001 (0.200)	Loss 2.5406 (2.5583)	Entropy 0.61829 (0.61968)	Top-1 acc 63.281 (62.300)	Top-5 acc 83.594 (82.848)	lr 0.00899
Train [71][2880/3239]	Time 0.228 (0.710)	Data Time 0.001 (0.200)	Loss 2.4289 (2.5583)	Entropy 0.61854 (0.61968)	Top-1 acc 66.797 (62.303)	Top-5 acc 86.328 (82.849)	lr 0.00898
Train [71][2890/3239]	Time 3.546 (0.710)	Data Time 3.175 (0.200)	Loss 2.4201 (2.5581)	Entropy 0.61881 (0.61967)	Top-1 acc 64.844 (62.309)	Top-5 acc 84.766 (82.854)	lr 0.00898
Train [71][2900/3239]	Time 0.363 (0.709)	Data Time 0.130 (0.200)	Loss 2.6167 (2.5580)	Entropy 0.61883 (0.61967)	Top-1 acc 60.156 (62.313)	Top-5 acc 82.422 (82.854)	lr 0.00898
Train [71][2910/3239]	Time 0.242 (0.717)	Data Time 0.001 (0.208)	Loss 2.6935 (2.5581)	Entropy 0.61875 (0.61967)	Top-1 acc 60.547 (62.312)	Top-5 acc 80.078 (82.852)	lr 0.00898
Train [71][2920/3239]	Time 0.242 (0.718)	Data Time 0.001 (0.209)	Loss 2.5862 (2.5580)	Entropy 0.61894 (0.61966)	Top-1 acc 58.984 (62.312)	Top-5 acc 87.109 (82.857)	lr 0.00898
Train [71][2930/3239]	Time 0.248 (0.717)	Data Time 0.001 (0.209)	Loss 2.5660 (2.5582)	Entropy 0.61886 (0.61966)	Top-1 acc 63.672 (62.311)	Top-5 acc 81.641 (82.854)	lr 0.00898
Train [71][2940/3239]	Time 0.241 (0.724)	Data Time 0.001 (0.216)	Loss 2.5435 (2.5583)	Entropy 0.61869 (0.61966)	Top-1 acc 66.016 (62.309)	Top-5 acc 81.641 (82.854)	lr 0.00898
Train [71][2950/3239]	Time 4.939 (0.725)	Data Time 4.675 (0.217)	Loss 2.5599 (2.5583)	Entropy 0.61867 (0.61965)	Top-1 acc 64.062 (62.312)	Top-5 acc 82.812 (82.854)	lr 0.00898
Train [71][2960/3239]	Time 0.349 (0.725)	Data Time 0.001 (0.218)	Loss 2.5818 (2.5583)	Entropy 0.61869 (0.61965)	Top-1 acc 61.719 (62.308)	Top-5 acc 82.031 (82.854)	lr 0.00898
Train [71][2970/3239]	Time 0.232 (0.732)	Data Time 0.001 (0.225)	Loss 2.5352 (2.5584)	Entropy 0.61879 (0.61965)	Top-1 acc 62.891 (62.304)	Top-5 acc 82.422 (82.853)	lr 0.00898
Train [71][2980/3239]	Time 0.249 (0.731)	Data Time 0.001 (0.224)	Loss 2.4623 (2.5585)	Entropy 0.61866 (0.61965)	Top-1 acc 62.891 (62.303)	Top-5 acc 85.547 (82.854)	lr 0.00897
Train [71][2990/3239]	Time 0.232 (0.731)	Data Time 0.001 (0.224)	Loss 2.5580 (2.5586)	Entropy 0.61898 (0.61964)	Top-1 acc 60.938 (62.298)	Top-5 acc 83.203 (82.849)	lr 0.00897
Train [71][3000/3239]	Time 0.232 (0.739)	Data Time 0.001 (0.232)	Loss 2.6364 (2.5587)	Entropy 0.61897 (0.61964)	Top-1 acc 59.375 (62.294)	Top-5 acc 80.469 (82.845)	lr 0.00897
Train [71][3010/3239]	Time 0.240 (0.738)	Data Time 0.001 (0.232)	Loss 2.4666 (2.5586)	Entropy 0.61868 (0.61964)	Top-1 acc 66.016 (62.299)	Top-5 acc 83.984 (82.846)	lr 0.00897
Train [71][3020/3239]	Time 0.246 (0.738)	Data Time 0.001 (0.232)	Loss 2.7396 (2.5588)	Entropy 0.61846 (0.61963)	Top-1 acc 56.641 (62.295)	Top-5 acc 80.469 (82.843)	lr 0.00897
Train [71][3030/3239]	Time 0.220 (0.746)	Data Time 0.001 (0.240)	Loss 2.4795 (2.5589)	Entropy 0.61833 (0.61963)	Top-1 acc 62.891 (62.295)	Top-5 acc 83.594 (82.841)	lr 0.00897
Train [71][3040/3239]	Time 0.241 (0.745)	Data Time 0.001 (0.240)	Loss 2.6522 (2.5589)	Entropy 0.61836 (0.61963)	Top-1 acc 63.281 (62.297)	Top-5 acc 83.594 (82.842)	lr 0.00897
Train [71][3050/3239]	Time 1.205 (0.744)	Data Time 0.882 (0.239)	Loss 2.5403 (2.5589)	Entropy 0.61837 (0.61962)	Top-1 acc 58.594 (62.298)	Top-5 acc 85.547 (82.844)	lr 0.00897
Train [71][3060/3239]	Time 0.252 (0.745)	Data Time 0.001 (0.240)	Loss 2.6368 (2.5590)	Entropy 0.61805 (0.61962)	Top-1 acc 57.812 (62.294)	Top-5 acc 82.422 (82.844)	lr 0.00897
Train [71][3070/3239]	Time 0.239 (0.751)	Data Time 0.001 (0.247)	Loss 2.5451 (2.5589)	Entropy 0.61832 (0.61961)	Top-1 acc 63.281 (62.295)	Top-5 acc 83.594 (82.845)	lr 0.00897
Train [71][3080/3239]	Time 0.314 (0.766)	Data Time 0.003 (0.246)	Loss 2.3707 (2.5590)	Entropy 0.61807 (0.61961)	Top-1 acc 64.453 (62.289)	Top-5 acc 85.547 (82.842)	lr 0.00897
Train [71][3090/3239]	Time 0.279 (0.765)	Data Time 0.002 (0.245)	Loss 2.4457 (2.5590)	Entropy 0.61827 (0.61960)	Top-1 acc 65.625 (62.292)	Top-5 acc 85.547 (82.841)	lr 0.00896
Train [71][3100/3239]	Time 0.240 (0.763)	Data Time 0.001 (0.245)	Loss 2.4078 (2.5590)	Entropy 0.61845 (0.61960)	Top-1 acc 66.406 (62.292)	Top-5 acc 84.375 (82.840)	lr 0.00896
Train [71][3110/3239]	Time 0.224 (0.762)	Data Time 0.001 (0.244)	Loss 2.7369 (2.5591)	Entropy 0.61818 (0.61959)	Top-1 acc 56.641 (62.289)	Top-5 acc 78.516 (82.838)	lr 0.00896
Train [71][3120/3239]	Time 0.348 (0.761)	Data Time 0.001 (0.243)	Loss 2.4064 (2.5592)	Entropy 0.61817 (0.61959)	Top-1 acc 63.672 (62.287)	Top-5 acc 86.328 (82.837)	lr 0.00896
Train [71][3130/3239]	Time 0.238 (0.765)	Data Time 0.001 (0.247)	Loss 2.4678 (2.5591)	Entropy 0.61833 (0.61959)	Top-1 acc 63.672 (62.289)	Top-5 acc 83.984 (82.837)	lr 0.00896
Train [71][3140/3239]	Time 2.508 (0.765)	Data Time 2.257 (0.247)	Loss 2.4716 (2.5592)	Entropy 0.61830 (0.61958)	Top-1 acc 65.234 (62.285)	Top-5 acc 87.109 (82.836)	lr 0.00896
Train [71][3150/3239]	Time 0.245 (0.764)	Data Time 0.001 (0.247)	Loss 2.3911 (2.5592)	Entropy 0.61810 (0.61958)	Top-1 acc 65.234 (62.284)	Top-5 acc 84.766 (82.836)	lr 0.00896
Train [71][3160/3239]	Time 0.246 (0.772)	Data Time 0.001 (0.255)	Loss 2.6267 (2.5593)	Entropy 0.61801 (0.61957)	Top-1 acc 55.859 (62.279)	Top-5 acc 80.469 (82.834)	lr 0.00896
Train [71][3170/3239]	Time 0.263 (0.771)	Data Time 0.001 (0.254)	Loss 2.5826 (2.5593)	Entropy 0.61800 (0.61957)	Top-1 acc 59.375 (62.278)	Top-5 acc 82.031 (82.834)	lr 0.00896
Train [71][3180/3239]	Time 0.253 (0.771)	Data Time 0.000 (0.254)	Loss 2.7411 (2.5597)	Entropy 0.61801 (0.61956)	Top-1 acc 60.547 (62.268)	Top-5 acc 78.516 (82.828)	lr 0.00896
Train [71][3190/3239]	Time 0.249 (0.778)	Data Time 0.000 (0.262)	Loss 2.6126 (2.5596)	Entropy 0.61774 (0.61956)	Top-1 acc 60.547 (62.270)	Top-5 acc 83.594 (82.830)	lr 0.00895
Train [71][3200/3239]	Time 0.228 (0.777)	Data Time 0.000 (0.261)	Loss 2.4146 (2.5596)	Entropy 0.61745 (0.61955)	Top-1 acc 64.453 (62.269)	Top-5 acc 89.453 (82.828)	lr 0.00895
Train [71][3210/3239]	Time 0.262 (0.777)	Data Time 0.000 (0.262)	Loss 2.4355 (2.5596)	Entropy 0.61712 (0.61954)	Top-1 acc 65.625 (62.268)	Top-5 acc 84.766 (82.827)	lr 0.00895
Train [71][3220/3239]	Time 0.226 (0.776)	Data Time 0.000 (0.261)	Loss 2.7695 (2.5596)	Entropy 0.61683 (0.61954)	Top-1 acc 56.250 (62.266)	Top-5 acc 78.125 (82.827)	lr 0.00895
Train [71][3230/3239]	Time 0.230 (0.780)	Data Time 0.000 (0.265)	Loss 2.6802 (2.5597)	Entropy 0.61718 (0.61953)	Top-1 acc 58.984 (62.264)	Top-5 acc 79.297 (82.825)	lr 0.00895
Train [71][3239/3239]	Time 1.072 (0.779)	Data Time 0.000 (0.265)	Loss 2.6306 (2.5597)	Entropy 0.61707 (0.61952)	Top-1 acc 65.432 (62.268)	Top-5 acc 81.481 (82.825)	lr 0.00895
==========Valid [71/120]	loss 1.349	top-1 acc 69.092 (69.092)	top-5 acc 88.552	Train top-1 62.268	top-5 82.825	Entropy 0.61707	Latency-None: 0.000ms	Flops: 539.00M
Train [72][0/3239]	Time 41.086 (41.086)	Data Time 39.251 (39.251)	Loss 2.5469 (2.5469)	Entropy 0.61705 (0.61705)	Top-1 acc 63.672 (63.672)	Top-5 acc 83.984 (83.984)	lr 0.00895
Train [72][10/3239]	Time 0.261 (4.310)	Data Time 0.002 (3.641)	Loss 2.6528 (2.5761)	Entropy 0.61737 (0.61721)	Top-1 acc 57.422 (61.967)	Top-5 acc 81.641 (82.706)	lr 0.00895
Train [72][20/3239]	Time 0.322 (2.478)	Data Time 0.001 (1.908)	Loss 2.5466 (2.5168)	Entropy 0.61775 (0.61734)	Top-1 acc 66.406 (63.318)	Top-5 acc 83.203 (83.761)	lr 0.00895
Train [72][30/3239]	Time 0.263 (1.849)	Data Time 0.001 (1.293)	Loss 2.6957 (2.5623)	Entropy 0.61817 (0.61755)	Top-1 acc 57.422 (62.185)	Top-5 acc 77.734 (82.926)	lr 0.00895
Train [72][40/3239]	Time 0.255 (1.506)	Data Time 0.001 (0.978)	Loss 2.7729 (2.5489)	Entropy 0.61830 (0.61772)	Top-1 acc 55.078 (62.224)	Top-5 acc 80.859 (83.308)	lr 0.00895
Train [72][50/3239]	Time 0.277 (1.299)	Data Time 0.001 (0.787)	Loss 2.4171 (2.5518)	Entropy 0.61843 (0.61786)	Top-1 acc 64.844 (62.002)	Top-5 acc 86.328 (83.172)	lr 0.00894
Train [72][60/3239]	Time 0.250 (1.165)	Data Time 0.001 (0.658)	Loss 2.4487 (2.5585)	Entropy 0.61825 (0.61795)	Top-1 acc 65.234 (61.898)	Top-5 acc 83.594 (83.101)	lr 0.00894
Train [72][70/3239]	Time 0.243 (1.067)	Data Time 0.001 (0.566)	Loss 2.4839 (2.5555)	Entropy 0.61796 (0.61798)	Top-1 acc 67.578 (61.972)	Top-5 acc 83.984 (83.071)	lr 0.00894
Train [72][80/3239]	Time 0.245 (0.990)	Data Time 0.001 (0.496)	Loss 2.5078 (2.5462)	Entropy 0.61808 (0.61798)	Top-1 acc 62.109 (62.196)	Top-5 acc 84.375 (83.218)	lr 0.00894
Train [72][90/3239]	Time 0.297 (0.936)	Data Time 0.001 (0.442)	Loss 2.5428 (2.5490)	Entropy 0.61771 (0.61798)	Top-1 acc 64.844 (62.109)	Top-5 acc 83.594 (83.177)	lr 0.00894
Train [72][100/3239]	Time 0.296 (0.886)	Data Time 0.001 (0.398)	Loss 2.5885 (2.5508)	Entropy 0.61774 (0.61795)	Top-1 acc 62.891 (62.094)	Top-5 acc 83.594 (83.149)	lr 0.00894
Train [72][110/3239]	Time 0.404 (0.846)	Data Time 0.011 (0.362)	Loss 2.2973 (2.5486)	Entropy 0.61784 (0.61794)	Top-1 acc 67.969 (62.236)	Top-5 acc 85.156 (83.186)	lr 0.00894
Train [72][120/3239]	Time 0.240 (0.810)	Data Time 0.001 (0.333)	Loss 2.5918 (2.5456)	Entropy 0.61799 (0.61794)	Top-1 acc 61.328 (62.319)	Top-5 acc 82.031 (83.226)	lr 0.00894
Train [72][130/3239]	Time 3.262 (0.807)	Data Time 2.991 (0.330)	Loss 2.5425 (2.5409)	Entropy 0.61833 (0.61795)	Top-1 acc 56.250 (62.363)	Top-5 acc 81.641 (83.310)	lr 0.00894
Train [72][140/3239]	Time 0.293 (0.784)	Data Time 0.001 (0.307)	Loss 2.4085 (2.5415)	Entropy 0.61842 (0.61798)	Top-1 acc 65.625 (62.384)	Top-5 acc 85.938 (83.331)	lr 0.00894
Train [72][150/3239]	Time 0.234 (0.760)	Data Time 0.001 (0.287)	Loss 2.5530 (2.5470)	Entropy 0.61845 (0.61800)	Top-1 acc 63.281 (62.322)	Top-5 acc 83.203 (83.201)	lr 0.00894
Train [72][160/3239]	Time 0.265 (0.746)	Data Time 0.002 (0.269)	Loss 2.7956 (2.5437)	Entropy 0.61859 (0.61804)	Top-1 acc 54.297 (62.410)	Top-5 acc 77.734 (83.257)	lr 0.00893
Train [72][170/3239]	Time 0.312 (0.760)	Data Time 0.001 (0.285)	Loss 2.5655 (2.5427)	Entropy 0.61886 (0.61808)	Top-1 acc 64.844 (62.443)	Top-5 acc 82.422 (83.260)	lr 0.00893
Train [72][180/3239]	Time 0.379 (0.744)	Data Time 0.001 (0.270)	Loss 2.6165 (2.5426)	Entropy 0.61884 (0.61812)	Top-1 acc 60.938 (62.470)	Top-5 acc 82.031 (83.231)	lr 0.00893
Train [72][190/3239]	Time 0.248 (0.728)	Data Time 0.001 (0.256)	Loss 2.6481 (2.5424)	Entropy 0.61922 (0.61817)	Top-1 acc 60.547 (62.473)	Top-5 acc 80.469 (83.230)	lr 0.00893
Train [72][200/3239]	Time 0.258 (0.747)	Data Time 0.001 (0.276)	Loss 2.5968 (2.5431)	Entropy 0.61895 (0.61821)	Top-1 acc 57.812 (62.407)	Top-5 acc 82.031 (83.221)	lr 0.00893
Train [72][210/3239]	Time 0.292 (0.734)	Data Time 0.001 (0.263)	Loss 2.4607 (2.5431)	Entropy 0.61903 (0.61825)	Top-1 acc 66.016 (62.407)	Top-5 acc 85.156 (83.229)	lr 0.00893
Train [72][220/3239]	Time 0.251 (0.720)	Data Time 0.001 (0.251)	Loss 2.3280 (2.5424)	Entropy 0.61886 (0.61828)	Top-1 acc 68.750 (62.397)	Top-5 acc 87.891 (83.228)	lr 0.00893
Train [72][230/3239]	Time 0.239 (0.713)	Data Time 0.001 (0.245)	Loss 2.3044 (2.5437)	Entropy 0.61911 (0.61831)	Top-1 acc 64.062 (62.341)	Top-5 acc 88.281 (83.188)	lr 0.00893
Train [72][240/3239]	Time 0.266 (0.701)	Data Time 0.001 (0.235)	Loss 2.5822 (2.5442)	Entropy 0.61879 (0.61833)	Top-1 acc 62.109 (62.340)	Top-5 acc 80.078 (83.164)	lr 0.00893
Train [72][250/3239]	Time 0.271 (0.693)	Data Time 0.001 (0.226)	Loss 2.5324 (2.5432)	Entropy 0.61840 (0.61834)	Top-1 acc 66.016 (62.346)	Top-5 acc 82.031 (83.194)	lr 0.00893
Train [72][260/3239]	Time 0.247 (0.688)	Data Time 0.001 (0.222)	Loss 2.5221 (2.5420)	Entropy 0.61828 (0.61834)	Top-1 acc 63.281 (62.385)	Top-5 acc 86.719 (83.244)	lr 0.00892
Train [72][270/3239]	Time 0.380 (0.679)	Data Time 0.003 (0.214)	Loss 2.4621 (2.5423)	Entropy 0.61817 (0.61834)	Top-1 acc 63.281 (62.386)	Top-5 acc 85.547 (83.254)	lr 0.00892
Train [72][280/3239]	Time 0.282 (0.671)	Data Time 0.001 (0.206)	Loss 2.6791 (2.5438)	Entropy 0.61826 (0.61834)	Top-1 acc 55.859 (62.362)	Top-5 acc 80.859 (83.223)	lr 0.00892
Train [72][290/3239]	Time 2.286 (0.670)	Data Time 2.029 (0.206)	Loss 2.4191 (2.5432)	Entropy 0.61810 (0.61834)	Top-1 acc 67.578 (62.426)	Top-5 acc 84.375 (83.219)	lr 0.00892
Train [72][300/3239]	Time 0.249 (0.663)	Data Time 0.001 (0.200)	Loss 2.4313 (2.5438)	Entropy 0.61841 (0.61833)	Top-1 acc 64.844 (62.423)	Top-5 acc 87.500 (83.212)	lr 0.00892
Train [72][310/3239]	Time 0.357 (0.656)	Data Time 0.002 (0.193)	Loss 2.5663 (2.5433)	Entropy 0.61831 (0.61833)	Top-1 acc 64.062 (62.403)	Top-5 acc 84.766 (83.231)	lr 0.00892
Train [72][320/3239]	Time 0.260 (0.649)	Data Time 0.002 (0.187)	Loss 2.4049 (2.5448)	Entropy 0.61852 (0.61833)	Top-1 acc 63.672 (62.398)	Top-5 acc 85.547 (83.186)	lr 0.00892
Train [72][330/3239]	Time 0.233 (0.659)	Data Time 0.001 (0.198)	Loss 2.6061 (2.5432)	Entropy 0.61833 (0.61833)	Top-1 acc 62.891 (62.470)	Top-5 acc 81.641 (83.194)	lr 0.00892
Train [72][340/3239]	Time 0.388 (0.652)	Data Time 0.002 (0.192)	Loss 2.4946 (2.5423)	Entropy 0.61844 (0.61833)	Top-1 acc 67.969 (62.501)	Top-5 acc 84.766 (83.191)	lr 0.00892
Train [72][350/3239]	Time 0.234 (0.647)	Data Time 0.001 (0.187)	Loss 2.5307 (2.5435)	Entropy 0.61870 (0.61834)	Top-1 acc 63.672 (62.500)	Top-5 acc 82.031 (83.157)	lr 0.00892
Train [72][360/3239]	Time 0.229 (0.657)	Data Time 0.001 (0.199)	Loss 2.5212 (2.5424)	Entropy 0.61854 (0.61834)	Top-1 acc 60.156 (62.527)	Top-5 acc 82.031 (83.193)	lr 0.00891
Train [72][370/3239]	Time 0.302 (0.652)	Data Time 0.024 (0.193)	Loss 2.6648 (2.5417)	Entropy 0.61850 (0.61835)	Top-1 acc 57.812 (62.540)	Top-5 acc 80.469 (83.214)	lr 0.00891
Train [72][380/3239]	Time 0.291 (0.646)	Data Time 0.002 (0.188)	Loss 2.5102 (2.5388)	Entropy 0.61860 (0.61835)	Top-1 acc 63.672 (62.612)	Top-5 acc 82.422 (83.269)	lr 0.00891
Train [72][390/3239]	Time 0.241 (0.654)	Data Time 0.001 (0.196)	Loss 2.3617 (2.5390)	Entropy 0.61856 (0.61836)	Top-1 acc 66.406 (62.599)	Top-5 acc 88.672 (83.271)	lr 0.00891
Train [72][400/3239]	Time 0.235 (0.648)	Data Time 0.001 (0.191)	Loss 2.5498 (2.5393)	Entropy 0.61892 (0.61837)	Top-1 acc 64.062 (62.611)	Top-5 acc 83.203 (83.270)	lr 0.00891
Train [72][410/3239]	Time 0.255 (0.644)	Data Time 0.001 (0.186)	Loss 2.5080 (2.5399)	Entropy 0.61889 (0.61838)	Top-1 acc 64.062 (62.607)	Top-5 acc 83.984 (83.249)	lr 0.00891
Train [72][420/3239]	Time 0.245 (0.655)	Data Time 0.001 (0.197)	Loss 2.5911 (2.5413)	Entropy 0.61880 (0.61839)	Top-1 acc 61.719 (62.576)	Top-5 acc 80.078 (83.206)	lr 0.00891
Train [72][430/3239]	Time 0.274 (0.649)	Data Time 0.001 (0.193)	Loss 2.4359 (2.5410)	Entropy 0.61895 (0.61840)	Top-1 acc 64.844 (62.601)	Top-5 acc 85.547 (83.222)	lr 0.00891
Train [72][440/3239]	Time 0.253 (0.645)	Data Time 0.001 (0.188)	Loss 2.5014 (2.5408)	Entropy 0.61928 (0.61842)	Top-1 acc 63.281 (62.609)	Top-5 acc 82.812 (83.231)	lr 0.00891
Train [72][450/3239]	Time 4.229 (0.650)	Data Time 3.990 (0.193)	Loss 2.2958 (2.5401)	Entropy 0.61904 (0.61844)	Top-1 acc 68.750 (62.616)	Top-5 acc 87.891 (83.234)	lr 0.00891
Train [72][460/3239]	Time 0.243 (0.645)	Data Time 0.001 (0.189)	Loss 2.5231 (2.5390)	Entropy 0.61904 (0.61845)	Top-1 acc 62.500 (62.639)	Top-5 acc 83.203 (83.254)	lr 0.00891
Train [72][470/3239]	Time 0.240 (0.640)	Data Time 0.001 (0.185)	Loss 2.3863 (2.5389)	Entropy 0.61948 (0.61846)	Top-1 acc 70.312 (62.651)	Top-5 acc 84.375 (83.254)	lr 0.00890
Train [72][480/3239]	Time 0.258 (0.637)	Data Time 0.001 (0.181)	Loss 2.4319 (2.5390)	Entropy 0.61939 (0.61848)	Top-1 acc 64.844 (62.641)	Top-5 acc 85.156 (83.253)	lr 0.00890
Train [72][490/3239]	Time 0.346 (0.750)	Data Time 0.007 (0.195)	Loss 2.6258 (2.5401)	Entropy 0.61948 (0.61850)	Top-1 acc 59.375 (62.624)	Top-5 acc 84.766 (83.225)	lr 0.00890
Train [72][500/3239]	Time 0.375 (0.745)	Data Time 0.002 (0.191)	Loss 2.5294 (2.5418)	Entropy 0.61949 (0.61852)	Top-1 acc 66.016 (62.587)	Top-5 acc 85.156 (83.199)	lr 0.00890
Train [72][510/3239]	Time 0.253 (0.739)	Data Time 0.002 (0.187)	Loss 2.6532 (2.5423)	Entropy 0.61969 (0.61854)	Top-1 acc 60.547 (62.569)	Top-5 acc 79.688 (83.186)	lr 0.00890
Train [72][520/3239]	Time 0.245 (0.733)	Data Time 0.001 (0.184)	Loss 2.7036 (2.5424)	Entropy 0.62004 (0.61857)	Top-1 acc 58.203 (62.564)	Top-5 acc 77.734 (83.175)	lr 0.00890
Train [72][530/3239]	Time 0.282 (0.728)	Data Time 0.002 (0.180)	Loss 2.4580 (2.5412)	Entropy 0.62016 (0.61859)	Top-1 acc 64.062 (62.596)	Top-5 acc 84.766 (83.194)	lr 0.00890
Train [72][540/3239]	Time 0.252 (0.723)	Data Time 0.001 (0.177)	Loss 2.5881 (2.5420)	Entropy 0.62003 (0.61862)	Top-1 acc 62.109 (62.582)	Top-5 acc 79.297 (83.183)	lr 0.00890
Train [72][550/3239]	Time 0.258 (0.719)	Data Time 0.001 (0.174)	Loss 2.4456 (2.5420)	Entropy 0.61995 (0.61865)	Top-1 acc 61.328 (62.574)	Top-5 acc 84.766 (83.179)	lr 0.00890
Train [72][560/3239]	Time 0.270 (0.715)	Data Time 0.002 (0.171)	Loss 2.6075 (2.5420)	Entropy 0.62007 (0.61867)	Top-1 acc 57.031 (62.579)	Top-5 acc 80.859 (83.175)	lr 0.00890
Train [72][570/3239]	Time 0.298 (0.711)	Data Time 0.001 (0.168)	Loss 2.4234 (2.5418)	Entropy 0.61977 (0.61869)	Top-1 acc 66.016 (62.581)	Top-5 acc 86.719 (83.187)	lr 0.00889
Train [72][580/3239]	Time 0.263 (0.706)	Data Time 0.001 (0.165)	Loss 2.2991 (2.5409)	Entropy 0.61937 (0.61871)	Top-1 acc 67.578 (62.585)	Top-5 acc 85.938 (83.195)	lr 0.00889
Train [72][590/3239]	Time 0.274 (0.702)	Data Time 0.001 (0.162)	Loss 2.6600 (2.5420)	Entropy 0.61935 (0.61872)	Top-1 acc 59.766 (62.563)	Top-5 acc 80.078 (83.164)	lr 0.00889
Train [72][600/3239]	Time 0.247 (0.699)	Data Time 0.001 (0.159)	Loss 2.5408 (2.5424)	Entropy 0.61959 (0.61873)	Top-1 acc 63.281 (62.560)	Top-5 acc 83.594 (83.152)	lr 0.00889
Train [72][610/3239]	Time 0.251 (0.701)	Data Time 0.001 (0.163)	Loss 2.4459 (2.5418)	Entropy 0.61868 (0.61874)	Top-1 acc 63.672 (62.581)	Top-5 acc 85.156 (83.158)	lr 0.00889
Train [72][620/3239]	Time 0.231 (0.701)	Data Time 0.001 (0.165)	Loss 2.6300 (2.5430)	Entropy 0.61863 (0.61874)	Top-1 acc 60.938 (62.565)	Top-5 acc 79.297 (83.134)	lr 0.00889
Train [72][630/3239]	Time 0.251 (0.699)	Data Time 0.001 (0.165)	Loss 2.5550 (2.5428)	Entropy 0.61896 (0.61874)	Top-1 acc 64.062 (62.563)	Top-5 acc 82.031 (83.140)	lr 0.00889
Train [72][640/3239]	Time 0.241 (0.700)	Data Time 0.001 (0.168)	Loss 2.3842 (2.5432)	Entropy 0.61917 (0.61874)	Top-1 acc 64.844 (62.559)	Top-5 acc 85.547 (83.137)	lr 0.00889
Train [72][650/3239]	Time 4.913 (0.707)	Data Time 4.659 (0.175)	Loss 2.7847 (2.5437)	Entropy 0.61918 (0.61875)	Top-1 acc 57.422 (62.550)	Top-5 acc 77.734 (83.123)	lr 0.00889
Train [72][660/3239]	Time 0.394 (0.703)	Data Time 0.001 (0.173)	Loss 3.1032 (2.5450)	Entropy 0.61909 (0.61876)	Top-1 acc 50.781 (62.517)	Top-5 acc 71.875 (83.102)	lr 0.00889
Train [72][670/3239]	Time 0.268 (0.712)	Data Time 0.001 (0.183)	Loss 2.5753 (2.5456)	Entropy 0.61876 (0.61876)	Top-1 acc 59.766 (62.497)	Top-5 acc 82.422 (83.085)	lr 0.00888
Train [72][680/3239]	Time 0.243 (0.708)	Data Time 0.001 (0.180)	Loss 2.5814 (2.5457)	Entropy 0.61876 (0.61876)	Top-1 acc 62.891 (62.487)	Top-5 acc 80.859 (83.078)	lr 0.00888
Train [72][690/3239]	Time 0.286 (0.704)	Data Time 0.001 (0.178)	Loss 2.3808 (2.5455)	Entropy 0.61885 (0.61876)	Top-1 acc 66.797 (62.484)	Top-5 acc 85.156 (83.082)	lr 0.00888
Train [72][700/3239]	Time 10.275 (0.715)	Data Time 10.021 (0.190)	Loss 2.5305 (2.5447)	Entropy 0.61908 (0.61876)	Top-1 acc 63.281 (62.512)	Top-5 acc 83.203 (83.093)	lr 0.00888
Train [72][710/3239]	Time 0.249 (0.712)	Data Time 0.001 (0.187)	Loss 2.5085 (2.5448)	Entropy 0.61906 (0.61877)	Top-1 acc 62.891 (62.509)	Top-5 acc 84.766 (83.094)	lr 0.00888
Train [72][720/3239]	Time 0.258 (0.708)	Data Time 0.001 (0.184)	Loss 2.4488 (2.5455)	Entropy 0.61924 (0.61877)	Top-1 acc 67.188 (62.491)	Top-5 acc 84.766 (83.075)	lr 0.00888
Train [72][730/3239]	Time 0.363 (0.704)	Data Time 0.001 (0.182)	Loss 2.6032 (2.5454)	Entropy 0.61929 (0.61878)	Top-1 acc 62.891 (62.487)	Top-5 acc 82.422 (83.087)	lr 0.00888
Train [72][740/3239]	Time 0.240 (0.709)	Data Time 0.001 (0.188)	Loss 2.4707 (2.5450)	Entropy 0.61914 (0.61878)	Top-1 acc 64.844 (62.507)	Top-5 acc 82.422 (83.098)	lr 0.00888
Train [72][750/3239]	Time 0.275 (0.706)	Data Time 0.002 (0.186)	Loss 2.5197 (2.5455)	Entropy 0.61918 (0.61879)	Top-1 acc 61.719 (62.499)	Top-5 acc 82.031 (83.081)	lr 0.00888
Train [72][760/3239]	Time 0.245 (0.706)	Data Time 0.001 (0.187)	Loss 2.5483 (2.5460)	Entropy 0.61921 (0.61880)	Top-1 acc 59.375 (62.485)	Top-5 acc 85.547 (83.084)	lr 0.00888
Train [72][770/3239]	Time 0.245 (0.708)	Data Time 0.001 (0.190)	Loss 2.3435 (2.5457)	Entropy 0.61876 (0.61880)	Top-1 acc 66.797 (62.496)	Top-5 acc 85.938 (83.090)	lr 0.00888
Train [72][780/3239]	Time 0.246 (0.705)	Data Time 0.001 (0.187)	Loss 2.7120 (2.5455)	Entropy 0.61852 (0.61880)	Top-1 acc 57.422 (62.509)	Top-5 acc 81.250 (83.096)	lr 0.00887
Train [72][790/3239]	Time 0.276 (0.704)	Data Time 0.001 (0.187)	Loss 2.6512 (2.5457)	Entropy 0.61851 (0.61879)	Top-1 acc 62.109 (62.513)	Top-5 acc 80.859 (83.095)	lr 0.00887
Train [72][800/3239]	Time 0.236 (0.710)	Data Time 0.001 (0.195)	Loss 2.3898 (2.5459)	Entropy 0.61891 (0.61879)	Top-1 acc 67.578 (62.502)	Top-5 acc 88.281 (83.094)	lr 0.00887
Train [72][810/3239]	Time 0.247 (0.707)	Data Time 0.001 (0.193)	Loss 2.6043 (2.5463)	Entropy 0.61891 (0.61879)	Top-1 acc 58.203 (62.486)	Top-5 acc 83.594 (83.088)	lr 0.00887
Train [72][820/3239]	Time 0.341 (0.709)	Data Time 0.001 (0.195)	Loss 2.9971 (2.5473)	Entropy 0.61876 (0.61879)	Top-1 acc 53.906 (62.473)	Top-5 acc 71.094 (83.076)	lr 0.00887
Train [72][830/3239]	Time 0.253 (0.714)	Data Time 0.001 (0.201)	Loss 2.6361 (2.5476)	Entropy 0.61856 (0.61879)	Top-1 acc 58.203 (62.462)	Top-5 acc 83.594 (83.085)	lr 0.00887
Train [72][840/3239]	Time 0.238 (0.710)	Data Time 0.001 (0.199)	Loss 2.5471 (2.5486)	Entropy 0.61822 (0.61879)	Top-1 acc 60.938 (62.439)	Top-5 acc 82.422 (83.064)	lr 0.00887
Train [72][850/3239]	Time 0.617 (0.709)	Data Time 0.358 (0.198)	Loss 2.3434 (2.5490)	Entropy 0.61798 (0.61878)	Top-1 acc 67.578 (62.417)	Top-5 acc 85.547 (83.051)	lr 0.00887
Train [72][860/3239]	Time 7.575 (0.719)	Data Time 7.319 (0.210)	Loss 2.6960 (2.5495)	Entropy 0.61779 (0.61877)	Top-1 acc 59.375 (62.412)	Top-5 acc 80.078 (83.036)	lr 0.00887
Train [72][870/3239]	Time 0.252 (0.716)	Data Time 0.002 (0.207)	Loss 2.5257 (2.5494)	Entropy 0.61769 (0.61876)	Top-1 acc 60.156 (62.407)	Top-5 acc 85.156 (83.052)	lr 0.00887
Train [72][880/3239]	Time 2.045 (0.715)	Data Time 1.784 (0.207)	Loss 2.7011 (2.5494)	Entropy 0.61786 (0.61875)	Top-1 acc 56.641 (62.407)	Top-5 acc 76.562 (83.042)	lr 0.00886
Train [72][890/3239]	Time 0.445 (0.717)	Data Time 0.002 (0.209)	Loss 2.4686 (2.5495)	Entropy 0.61792 (0.61874)	Top-1 acc 62.891 (62.390)	Top-5 acc 86.328 (83.047)	lr 0.00886
Train [72][900/3239]	Time 0.239 (0.719)	Data Time 0.001 (0.213)	Loss 2.4442 (2.5488)	Entropy 0.61764 (0.61873)	Top-1 acc 66.406 (62.411)	Top-5 acc 84.766 (83.062)	lr 0.00886
Train [72][910/3239]	Time 0.245 (0.715)	Data Time 0.002 (0.210)	Loss 2.5039 (2.5487)	Entropy 0.61752 (0.61872)	Top-1 acc 66.406 (62.418)	Top-5 acc 82.812 (83.066)	lr 0.00886
Train [72][920/3239]	Time 0.245 (0.718)	Data Time 0.001 (0.214)	Loss 2.5568 (2.5485)	Entropy 0.61781 (0.61871)	Top-1 acc 61.328 (62.420)	Top-5 acc 82.422 (83.066)	lr 0.00886
Train [72][930/3239]	Time 0.259 (0.727)	Data Time 0.001 (0.223)	Loss 2.3073 (2.5478)	Entropy 0.61767 (0.61869)	Top-1 acc 66.797 (62.433)	Top-5 acc 88.281 (83.079)	lr 0.00886
Train [72][940/3239]	Time 0.252 (0.724)	Data Time 0.001 (0.221)	Loss 2.3448 (2.5478)	Entropy 0.61756 (0.61868)	Top-1 acc 67.578 (62.429)	Top-5 acc 89.453 (83.083)	lr 0.00886
Train [72][950/3239]	Time 0.333 (0.724)	Data Time 0.001 (0.222)	Loss 2.7850 (2.5487)	Entropy 0.61753 (0.61867)	Top-1 acc 58.594 (62.396)	Top-5 acc 78.125 (83.065)	lr 0.00886
Train [72][960/3239]	Time 0.251 (0.729)	Data Time 0.001 (0.228)	Loss 2.6540 (2.5487)	Entropy 0.61734 (0.61866)	Top-1 acc 62.891 (62.409)	Top-5 acc 80.469 (83.062)	lr 0.00886
Train [72][970/3239]	Time 0.270 (0.726)	Data Time 0.001 (0.225)	Loss 2.5370 (2.5488)	Entropy 0.61730 (0.61865)	Top-1 acc 61.719 (62.409)	Top-5 acc 82.031 (83.059)	lr 0.00886
Train [72][980/3239]	Time 2.378 (0.733)	Data Time 2.103 (0.233)	Loss 2.6118 (2.5492)	Entropy 0.61764 (0.61863)	Top-1 acc 60.547 (62.397)	Top-5 acc 80.078 (83.049)	lr 0.00886
Train [72][990/3239]	Time 0.273 (0.734)	Data Time 0.001 (0.235)	Loss 2.3688 (2.5487)	Entropy 0.61754 (0.61862)	Top-1 acc 66.406 (62.403)	Top-5 acc 87.109 (83.060)	lr 0.00885
Train [72][1000/3239]	Time 0.264 (0.731)	Data Time 0.001 (0.233)	Loss 2.6301 (2.5486)	Entropy 0.61722 (0.61861)	Top-1 acc 60.156 (62.408)	Top-5 acc 82.422 (83.056)	lr 0.00885
Train [72][1010/3239]	Time 7.512 (0.738)	Data Time 7.265 (0.241)	Loss 2.3884 (2.5485)	Entropy 0.61715 (0.61860)	Top-1 acc 67.188 (62.410)	Top-5 acc 85.156 (83.052)	lr 0.00885
Train [72][1020/3239]	Time 3.629 (0.739)	Data Time 3.376 (0.242)	Loss 2.5851 (2.5484)	Entropy 0.61706 (0.61858)	Top-1 acc 61.719 (62.421)	Top-5 acc 82.422 (83.059)	lr 0.00885
Train [72][1030/3239]	Time 0.281 (0.736)	Data Time 0.001 (0.240)	Loss 2.4607 (2.5482)	Entropy 0.61691 (0.61857)	Top-1 acc 62.891 (62.419)	Top-5 acc 84.375 (83.059)	lr 0.00885
Train [72][1040/3239]	Time 0.244 (0.733)	Data Time 0.001 (0.238)	Loss 2.6573 (2.5480)	Entropy 0.61693 (0.61855)	Top-1 acc 59.375 (62.420)	Top-5 acc 80.859 (83.062)	lr 0.00885
Train [72][1050/3239]	Time 0.344 (0.741)	Data Time 0.001 (0.246)	Loss 2.4960 (2.5484)	Entropy 0.61664 (0.61853)	Top-1 acc 65.625 (62.423)	Top-5 acc 84.375 (83.049)	lr 0.00885
Train [72][1060/3239]	Time 0.237 (0.739)	Data Time 0.001 (0.245)	Loss 2.4605 (2.5481)	Entropy 0.61653 (0.61852)	Top-1 acc 64.062 (62.434)	Top-5 acc 86.328 (83.050)	lr 0.00885
Train [72][1070/3239]	Time 0.241 (0.740)	Data Time 0.001 (0.247)	Loss 2.6728 (2.5483)	Entropy 0.61672 (0.61850)	Top-1 acc 60.547 (62.442)	Top-5 acc 77.734 (83.057)	lr 0.00885
Train [72][1080/3239]	Time 0.233 (0.744)	Data Time 0.001 (0.251)	Loss 2.5978 (2.5485)	Entropy 0.61640 (0.61848)	Top-1 acc 60.547 (62.427)	Top-5 acc 81.641 (83.056)	lr 0.00885
Train [72][1090/3239]	Time 0.251 (0.743)	Data Time 0.001 (0.251)	Loss 2.6523 (2.5487)	Entropy 0.61624 (0.61846)	Top-1 acc 56.250 (62.414)	Top-5 acc 80.469 (83.051)	lr 0.00884
Train [72][1100/3239]	Time 0.250 (0.742)	Data Time 0.001 (0.251)	Loss 2.5278 (2.5483)	Entropy 0.61610 (0.61844)	Top-1 acc 60.938 (62.410)	Top-5 acc 86.328 (83.061)	lr 0.00884
Train [72][1110/3239]	Time 0.235 (0.748)	Data Time 0.001 (0.256)	Loss 2.6552 (2.5481)	Entropy 0.61622 (0.61842)	Top-1 acc 57.812 (62.410)	Top-5 acc 81.250 (83.067)	lr 0.00884
Train [72][1120/3239]	Time 0.373 (0.749)	Data Time 0.001 (0.258)	Loss 2.4976 (2.5478)	Entropy 0.61617 (0.61840)	Top-1 acc 62.500 (62.411)	Top-5 acc 82.812 (83.072)	lr 0.00884
Train [72][1130/3239]	Time 0.248 (0.752)	Data Time 0.001 (0.262)	Loss 2.6761 (2.5480)	Entropy 0.61606 (0.61838)	Top-1 acc 58.594 (62.408)	Top-5 acc 79.688 (83.065)	lr 0.00884
Train [72][1140/3239]	Time 0.260 (0.753)	Data Time 0.001 (0.264)	Loss 2.4156 (2.5482)	Entropy 0.61614 (0.61836)	Top-1 acc 66.797 (62.413)	Top-5 acc 84.375 (83.058)	lr 0.00884
Train [72][1150/3239]	Time 0.253 (0.795)	Data Time 0.002 (0.264)	Loss 2.4221 (2.5477)	Entropy 0.61636 (0.61834)	Top-1 acc 67.188 (62.429)	Top-5 acc 84.766 (83.065)	lr 0.00884
Train [72][1160/3239]	Time 0.255 (0.792)	Data Time 0.002 (0.262)	Loss 2.4919 (2.5472)	Entropy 0.61622 (0.61832)	Top-1 acc 63.672 (62.446)	Top-5 acc 84.375 (83.077)	lr 0.00884
Train [72][1170/3239]	Time 0.243 (0.789)	Data Time 0.001 (0.260)	Loss 2.5116 (2.5473)	Entropy 0.61642 (0.61831)	Top-1 acc 61.328 (62.438)	Top-5 acc 83.203 (83.077)	lr 0.00884
Train [72][1180/3239]	Time 0.240 (0.786)	Data Time 0.001 (0.258)	Loss 2.3654 (2.5473)	Entropy 0.61649 (0.61829)	Top-1 acc 69.141 (62.440)	Top-5 acc 86.328 (83.077)	lr 0.00884
Train [72][1190/3239]	Time 0.236 (0.783)	Data Time 0.001 (0.255)	Loss 2.6251 (2.5469)	Entropy 0.61627 (0.61827)	Top-1 acc 59.766 (62.446)	Top-5 acc 82.031 (83.089)	lr 0.00883
Train [72][1200/3239]	Time 0.236 (0.779)	Data Time 0.001 (0.253)	Loss 2.5707 (2.5471)	Entropy 0.61595 (0.61826)	Top-1 acc 62.109 (62.439)	Top-5 acc 81.641 (83.092)	lr 0.00883
Train [72][1210/3239]	Time 0.329 (0.777)	Data Time 0.001 (0.252)	Loss 2.4746 (2.5465)	Entropy 0.61591 (0.61824)	Top-1 acc 63.672 (62.445)	Top-5 acc 85.938 (83.102)	lr 0.00883
Train [72][1220/3239]	Time 0.278 (0.779)	Data Time 0.003 (0.255)	Loss 2.6981 (2.5469)	Entropy 0.61598 (0.61822)	Top-1 acc 58.203 (62.436)	Top-5 acc 82.812 (83.095)	lr 0.00883
Train [72][1230/3239]	Time 0.239 (0.777)	Data Time 0.001 (0.253)	Loss 2.3094 (2.5466)	Entropy 0.61595 (0.61820)	Top-1 acc 67.578 (62.448)	Top-5 acc 87.500 (83.105)	lr 0.00883
Train [72][1240/3239]	Time 0.635 (0.776)	Data Time 0.410 (0.253)	Loss 2.7326 (2.5465)	Entropy 0.61588 (0.61818)	Top-1 acc 59.375 (62.458)	Top-5 acc 80.469 (83.103)	lr 0.00883
Train [72][1250/3239]	Time 0.267 (0.784)	Data Time 0.001 (0.262)	Loss 2.3280 (2.5461)	Entropy 0.61574 (0.61816)	Top-1 acc 66.016 (62.467)	Top-5 acc 89.453 (83.114)	lr 0.00883
Train [72][1260/3239]	Time 0.229 (0.782)	Data Time 0.001 (0.260)	Loss 2.5032 (2.5468)	Entropy 0.61543 (0.61814)	Top-1 acc 65.234 (62.448)	Top-5 acc 82.031 (83.102)	lr 0.00883
Train [72][1270/3239]	Time 1.313 (0.780)	Data Time 1.068 (0.259)	Loss 2.3492 (2.5468)	Entropy 0.61530 (0.61812)	Top-1 acc 66.797 (62.446)	Top-5 acc 84.375 (83.101)	lr 0.00883
Train [72][1280/3239]	Time 0.267 (0.788)	Data Time 0.001 (0.268)	Loss 2.6992 (2.5464)	Entropy 0.61521 (0.61810)	Top-1 acc 60.156 (62.460)	Top-5 acc 79.688 (83.107)	lr 0.00883
Train [72][1290/3239]	Time 0.230 (0.789)	Data Time 0.001 (0.269)	Loss 2.4092 (2.5469)	Entropy 0.61533 (0.61808)	Top-1 acc 62.500 (62.455)	Top-5 acc 84.766 (83.094)	lr 0.00883
Train [72][1300/3239]	Time 0.246 (0.786)	Data Time 0.001 (0.267)	Loss 2.6045 (2.5467)	Entropy 0.61541 (0.61806)	Top-1 acc 64.062 (62.459)	Top-5 acc 80.469 (83.090)	lr 0.00882
Train [72][1310/3239]	Time 0.261 (0.796)	Data Time 0.001 (0.278)	Loss 2.4135 (2.5469)	Entropy 0.61583 (0.61804)	Top-1 acc 63.672 (62.451)	Top-5 acc 85.938 (83.085)	lr 0.00882
Train [72][1320/3239]	Time 0.274 (0.794)	Data Time 0.001 (0.277)	Loss 2.6481 (2.5469)	Entropy 0.61567 (0.61802)	Top-1 acc 59.766 (62.459)	Top-5 acc 78.516 (83.083)	lr 0.00882
Train [72][1330/3239]	Time 0.251 (0.792)	Data Time 0.001 (0.275)	Loss 2.8952 (2.5467)	Entropy 0.61510 (0.61800)	Top-1 acc 54.688 (62.465)	Top-5 acc 75.000 (83.083)	lr 0.00882
Train [72][1340/3239]	Time 0.251 (0.800)	Data Time 0.001 (0.284)	Loss 2.5668 (2.5472)	Entropy 0.61493 (0.61798)	Top-1 acc 63.672 (62.448)	Top-5 acc 84.375 (83.079)	lr 0.00882
Train [72][1350/3239]	Time 2.902 (0.801)	Data Time 2.618 (0.285)	Loss 2.5315 (2.5470)	Entropy 0.61455 (0.61795)	Top-1 acc 62.891 (62.450)	Top-5 acc 83.203 (83.079)	lr 0.00882
Train [72][1360/3239]	Time 0.271 (0.798)	Data Time 0.001 (0.283)	Loss 2.4723 (2.5469)	Entropy 0.61445 (0.61793)	Top-1 acc 66.406 (62.450)	Top-5 acc 85.547 (83.087)	lr 0.00882
Train [72][1370/3239]	Time 2.049 (0.805)	Data Time 1.666 (0.290)	Loss 2.6595 (2.5475)	Entropy 0.61419 (0.61790)	Top-1 acc 60.547 (62.441)	Top-5 acc 82.422 (83.077)	lr 0.00882
Train [72][1380/3239]	Time 0.246 (0.805)	Data Time 0.001 (0.291)	Loss 2.4254 (2.5473)	Entropy 0.61415 (0.61788)	Top-1 acc 66.016 (62.448)	Top-5 acc 85.938 (83.080)	lr 0.00882
Train [72][1390/3239]	Time 0.253 (0.807)	Data Time 0.001 (0.293)	Loss 2.8681 (2.5474)	Entropy 0.61412 (0.61785)	Top-1 acc 58.203 (62.449)	Top-5 acc 78.516 (83.083)	lr 0.00882
Train [72][1400/3239]	Time 0.312 (0.804)	Data Time 0.003 (0.291)	Loss 2.3872 (2.5477)	Entropy 0.61408 (0.61782)	Top-1 acc 64.453 (62.444)	Top-5 acc 84.766 (83.077)	lr 0.00881
Train [72][1410/3239]	Time 3.809 (0.810)	Data Time 3.546 (0.297)	Loss 2.4608 (2.5474)	Entropy 0.61402 (0.61780)	Top-1 acc 64.844 (62.452)	Top-5 acc 87.109 (83.088)	lr 0.00881
Train [72][1420/3239]	Time 0.272 (0.810)	Data Time 0.002 (0.297)	Loss 2.6016 (2.5475)	Entropy 0.61371 (0.61777)	Top-1 acc 61.719 (62.451)	Top-5 acc 80.469 (83.086)	lr 0.00881
Train [72][1430/3239]	Time 0.278 (0.807)	Data Time 0.001 (0.295)	Loss 2.6253 (2.5479)	Entropy 0.61356 (0.61774)	Top-1 acc 60.547 (62.456)	Top-5 acc 82.812 (83.073)	lr 0.00881
Train [72][1440/3239]	Time 0.327 (0.812)	Data Time 0.001 (0.300)	Loss 2.5868 (2.5478)	Entropy 0.61349 (0.61771)	Top-1 acc 61.719 (62.456)	Top-5 acc 83.203 (83.075)	lr 0.00881
Train [72][1450/3239]	Time 0.251 (0.815)	Data Time 0.001 (0.305)	Loss 2.4748 (2.5475)	Entropy 0.61363 (0.61768)	Top-1 acc 62.109 (62.461)	Top-5 acc 84.766 (83.078)	lr 0.00881
Train [72][1460/3239]	Time 0.277 (0.813)	Data Time 0.001 (0.302)	Loss 2.3701 (2.5475)	Entropy 0.61367 (0.61765)	Top-1 acc 66.797 (62.459)	Top-5 acc 86.328 (83.084)	lr 0.00881
Train [72][1470/3239]	Time 0.250 (0.816)	Data Time 0.001 (0.306)	Loss 2.4827 (2.5473)	Entropy 0.61365 (0.61763)	Top-1 acc 62.891 (62.456)	Top-5 acc 83.984 (83.095)	lr 0.00881
Train [72][1480/3239]	Time 0.231 (0.820)	Data Time 0.001 (0.311)	Loss 2.4825 (2.5479)	Entropy 0.61353 (0.61760)	Top-1 acc 66.016 (62.447)	Top-5 acc 86.328 (83.086)	lr 0.00881
Train [72][1490/3239]	Time 0.233 (0.817)	Data Time 0.001 (0.309)	Loss 2.4818 (2.5479)	Entropy 0.61332 (0.61757)	Top-1 acc 60.547 (62.444)	Top-5 acc 85.156 (83.085)	lr 0.00881
Train [72][1500/3239]	Time 0.246 (0.822)	Data Time 0.001 (0.314)	Loss 2.4673 (2.5476)	Entropy 0.61336 (0.61754)	Top-1 acc 65.625 (62.450)	Top-5 acc 83.594 (83.090)	lr 0.00880
Train [72][1510/3239]	Time 6.645 (0.826)	Data Time 6.407 (0.318)	Loss 2.3751 (2.5475)	Entropy 0.61370 (0.61752)	Top-1 acc 67.578 (62.453)	Top-5 acc 86.328 (83.090)	lr 0.00880
Train [72][1520/3239]	Time 0.234 (0.823)	Data Time 0.001 (0.316)	Loss 2.5579 (2.5473)	Entropy 0.61391 (0.61749)	Top-1 acc 63.281 (62.462)	Top-5 acc 83.594 (83.094)	lr 0.00880
Train [72][1530/3239]	Time 0.423 (0.825)	Data Time 0.001 (0.319)	Loss 2.6528 (2.5475)	Entropy 0.61380 (0.61747)	Top-1 acc 58.594 (62.453)	Top-5 acc 83.203 (83.085)	lr 0.00880
Train [72][1540/3239]	Time 0.240 (0.824)	Data Time 0.001 (0.319)	Loss 2.7234 (2.5479)	Entropy 0.61399 (0.61745)	Top-1 acc 58.984 (62.440)	Top-5 acc 78.125 (83.081)	lr 0.00880
Train [72][1550/3239]	Time 0.244 (0.826)	Data Time 0.001 (0.321)	Loss 2.7540 (2.5483)	Entropy 0.61405 (0.61742)	Top-1 acc 58.984 (62.427)	Top-5 acc 77.344 (83.075)	lr 0.00880
Train [72][1560/3239]	Time 0.243 (0.824)	Data Time 0.001 (0.319)	Loss 2.4030 (2.5483)	Entropy 0.61362 (0.61740)	Top-1 acc 64.453 (62.434)	Top-5 acc 85.938 (83.076)	lr 0.00880
Train [72][1570/3239]	Time 2.088 (0.830)	Data Time 1.831 (0.325)	Loss 2.7098 (2.5486)	Entropy 0.61386 (0.61738)	Top-1 acc 58.594 (62.428)	Top-5 acc 78.125 (83.066)	lr 0.00880
Train [72][1580/3239]	Time 0.243 (0.834)	Data Time 0.001 (0.330)	Loss 2.5048 (2.5487)	Entropy 0.61384 (0.61736)	Top-1 acc 62.891 (62.424)	Top-5 acc 85.156 (83.067)	lr 0.00880
Train [72][1590/3239]	Time 0.226 (0.831)	Data Time 0.001 (0.328)	Loss 2.5339 (2.5486)	Entropy 0.61389 (0.61733)	Top-1 acc 62.891 (62.428)	Top-5 acc 82.812 (83.069)	lr 0.00880
Train [72][1600/3239]	Time 2.141 (0.833)	Data Time 1.800 (0.330)	Loss 2.6176 (2.5488)	Entropy 0.61400 (0.61731)	Top-1 acc 63.281 (62.422)	Top-5 acc 82.031 (83.066)	lr 0.00880
Train [72][1610/3239]	Time 0.253 (0.839)	Data Time 0.001 (0.336)	Loss 2.5041 (2.5492)	Entropy 0.61404 (0.61729)	Top-1 acc 66.016 (62.416)	Top-5 acc 82.422 (83.055)	lr 0.00879
Train [72][1620/3239]	Time 0.230 (0.836)	Data Time 0.001 (0.334)	Loss 2.5167 (2.5494)	Entropy 0.61391 (0.61727)	Top-1 acc 62.891 (62.412)	Top-5 acc 82.422 (83.050)	lr 0.00879
Train [72][1630/3239]	Time 0.240 (0.837)	Data Time 0.001 (0.336)	Loss 2.5652 (2.5495)	Entropy 0.61367 (0.61725)	Top-1 acc 62.109 (62.410)	Top-5 acc 85.156 (83.048)	lr 0.00879
Train [72][1640/3239]	Time 0.251 (0.843)	Data Time 0.002 (0.343)	Loss 2.6058 (2.5494)	Entropy 0.61388 (0.61723)	Top-1 acc 60.938 (62.410)	Top-5 acc 83.594 (83.050)	lr 0.00879
Train [72][1650/3239]	Time 0.304 (0.844)	Data Time 0.001 (0.344)	Loss 2.6864 (2.5495)	Entropy 0.61394 (0.61721)	Top-1 acc 61.328 (62.409)	Top-5 acc 80.469 (83.046)	lr 0.00879
Train [72][1660/3239]	Time 0.237 (0.844)	Data Time 0.001 (0.344)	Loss 2.6799 (2.5495)	Entropy 0.61394 (0.61719)	Top-1 acc 60.938 (62.411)	Top-5 acc 77.734 (83.044)	lr 0.00879
Train [72][1670/3239]	Time 1.645 (0.851)	Data Time 1.384 (0.351)	Loss 2.5128 (2.5495)	Entropy 0.61402 (0.61717)	Top-1 acc 65.234 (62.410)	Top-5 acc 83.203 (83.044)	lr 0.00879
Train [72][1680/3239]	Time 0.228 (0.851)	Data Time 0.001 (0.352)	Loss 2.4385 (2.5494)	Entropy 0.61388 (0.61715)	Top-1 acc 67.188 (62.421)	Top-5 acc 85.938 (83.044)	lr 0.00879
Train [72][1690/3239]	Time 0.281 (0.850)	Data Time 0.001 (0.351)	Loss 2.9169 (2.5493)	Entropy 0.61368 (0.61713)	Top-1 acc 56.250 (62.423)	Top-5 acc 75.781 (83.041)	lr 0.00879
Train [72][1700/3239]	Time 0.236 (0.858)	Data Time 0.001 (0.359)	Loss 2.4746 (2.5488)	Entropy 0.61360 (0.61711)	Top-1 acc 66.016 (62.437)	Top-5 acc 79.688 (83.048)	lr 0.00879
Train [72][1710/3239]	Time 0.238 (0.858)	Data Time 0.001 (0.361)	Loss 2.6261 (2.5490)	Entropy 0.61339 (0.61709)	Top-1 acc 63.281 (62.435)	Top-5 acc 81.250 (83.040)	lr 0.00878
Train [72][1720/3239]	Time 0.245 (0.856)	Data Time 0.001 (0.359)	Loss 2.6132 (2.5492)	Entropy 0.61320 (0.61707)	Top-1 acc 58.984 (62.430)	Top-5 acc 83.203 (83.035)	lr 0.00878
Train [72][1730/3239]	Time 0.877 (0.864)	Data Time 0.630 (0.368)	Loss 2.6433 (2.5492)	Entropy 0.61316 (0.61705)	Top-1 acc 64.844 (62.430)	Top-5 acc 82.031 (83.035)	lr 0.00878
Train [72][1740/3239]	Time 0.250 (0.866)	Data Time 0.001 (0.369)	Loss 2.6594 (2.5492)	Entropy 0.61318 (0.61702)	Top-1 acc 58.203 (62.431)	Top-5 acc 81.250 (83.038)	lr 0.00878
Train [72][1750/3239]	Time 0.273 (0.863)	Data Time 0.001 (0.367)	Loss 2.3461 (2.5491)	Entropy 0.61314 (0.61700)	Top-1 acc 66.016 (62.431)	Top-5 acc 84.766 (83.036)	lr 0.00878
Train [72][1760/3239]	Time 7.536 (0.867)	Data Time 7.152 (0.372)	Loss 2.4489 (2.5492)	Entropy 0.61281 (0.61698)	Top-1 acc 64.453 (62.425)	Top-5 acc 82.812 (83.035)	lr 0.00878
Train [72][1770/3239]	Time 0.266 (0.868)	Data Time 0.001 (0.373)	Loss 2.5352 (2.5491)	Entropy 0.61273 (0.61695)	Top-1 acc 62.109 (62.423)	Top-5 acc 83.203 (83.036)	lr 0.00878
Train [72][1780/3239]	Time 0.244 (0.869)	Data Time 0.001 (0.373)	Loss 2.7121 (2.5491)	Entropy 0.61265 (0.61693)	Top-1 acc 61.328 (62.425)	Top-5 acc 82.031 (83.036)	lr 0.00878
Train [72][1790/3239]	Time 0.227 (0.871)	Data Time 0.001 (0.376)	Loss 2.6522 (2.5489)	Entropy 0.61258 (0.61691)	Top-1 acc 61.328 (62.431)	Top-5 acc 81.641 (83.041)	lr 0.00878
Train [72][1800/3239]	Time 0.330 (0.904)	Data Time 0.036 (0.383)	Loss 2.5561 (2.5493)	Entropy 0.61256 (0.61688)	Top-1 acc 61.719 (62.428)	Top-5 acc 83.203 (83.032)	lr 0.00878
Train [72][1810/3239]	Time 0.238 (0.901)	Data Time 0.002 (0.381)	Loss 2.6652 (2.5494)	Entropy 0.61233 (0.61686)	Top-1 acc 57.031 (62.423)	Top-5 acc 80.859 (83.029)	lr 0.00877
Train [72][1820/3239]	Time 0.252 (0.899)	Data Time 0.001 (0.379)	Loss 2.4656 (2.5491)	Entropy 0.61234 (0.61683)	Top-1 acc 60.938 (62.427)	Top-5 acc 86.328 (83.038)	lr 0.00877
Train [72][1830/3239]	Time 0.244 (0.896)	Data Time 0.001 (0.376)	Loss 2.4252 (2.5489)	Entropy 0.61233 (0.61681)	Top-1 acc 64.453 (62.436)	Top-5 acc 87.109 (83.040)	lr 0.00877
Train [72][1840/3239]	Time 0.241 (0.894)	Data Time 0.001 (0.374)	Loss 3.0322 (2.5490)	Entropy 0.61186 (0.61678)	Top-1 acc 48.438 (62.430)	Top-5 acc 76.953 (83.038)	lr 0.00877
Train [72][1850/3239]	Time 0.300 (0.891)	Data Time 0.001 (0.372)	Loss 2.5347 (2.5489)	Entropy 0.61172 (0.61676)	Top-1 acc 60.938 (62.432)	Top-5 acc 82.422 (83.035)	lr 0.00877
Train [72][1860/3239]	Time 0.235 (0.889)	Data Time 0.001 (0.370)	Loss 2.4509 (2.5489)	Entropy 0.61185 (0.61673)	Top-1 acc 64.453 (62.436)	Top-5 acc 85.938 (83.038)	lr 0.00877
Train [72][1870/3239]	Time 0.260 (0.893)	Data Time 0.001 (0.375)	Loss 2.6122 (2.5489)	Entropy 0.61172 (0.61670)	Top-1 acc 61.328 (62.434)	Top-5 acc 84.375 (83.043)	lr 0.00877
Train [72][1880/3239]	Time 0.250 (0.891)	Data Time 0.001 (0.373)	Loss 2.6927 (2.5490)	Entropy 0.61181 (0.61668)	Top-1 acc 58.594 (62.433)	Top-5 acc 81.250 (83.041)	lr 0.00877
Train [72][1890/3239]	Time 0.255 (0.889)	Data Time 0.001 (0.371)	Loss 2.5032 (2.5491)	Entropy 0.61175 (0.61665)	Top-1 acc 59.375 (62.429)	Top-5 acc 84.375 (83.041)	lr 0.00877
Train [72][1900/3239]	Time 0.265 (0.899)	Data Time 0.001 (0.382)	Loss 2.6118 (2.5491)	Entropy 0.61186 (0.61662)	Top-1 acc 60.547 (62.431)	Top-5 acc 80.469 (83.045)	lr 0.00877
Train [72][1910/3239]	Time 0.266 (0.899)	Data Time 0.001 (0.382)	Loss 2.5834 (2.5488)	Entropy 0.61197 (0.61660)	Top-1 acc 61.719 (62.438)	Top-5 acc 81.250 (83.046)	lr 0.00877
Train [72][1920/3239]	Time 0.389 (0.896)	Data Time 0.003 (0.380)	Loss 2.4146 (2.5489)	Entropy 0.61215 (0.61658)	Top-1 acc 69.141 (62.437)	Top-5 acc 86.328 (83.046)	lr 0.00876
Train [72][1930/3239]	Time 0.284 (0.900)	Data Time 0.002 (0.384)	Loss 2.5503 (2.5490)	Entropy 0.61206 (0.61655)	Top-1 acc 62.500 (62.433)	Top-5 acc 83.203 (83.044)	lr 0.00876
Train [72][1940/3239]	Time 0.274 (0.897)	Data Time 0.001 (0.382)	Loss 2.5878 (2.5491)	Entropy 0.61163 (0.61653)	Top-1 acc 58.594 (62.436)	Top-5 acc 84.375 (83.044)	lr 0.00876
Train [72][1950/3239]	Time 0.239 (0.895)	Data Time 0.001 (0.380)	Loss 2.5138 (2.5489)	Entropy 0.61145 (0.61650)	Top-1 acc 59.766 (62.437)	Top-5 acc 82.812 (83.048)	lr 0.00876
Train [72][1960/3239]	Time 11.067 (0.898)	Data Time 10.816 (0.384)	Loss 2.5866 (2.5486)	Entropy 0.61125 (0.61648)	Top-1 acc 60.938 (62.445)	Top-5 acc 82.812 (83.053)	lr 0.00876
Train [72][1970/3239]	Time 1.170 (0.897)	Data Time 0.923 (0.382)	Loss 2.5826 (2.5486)	Entropy 0.61155 (0.61645)	Top-1 acc 62.109 (62.442)	Top-5 acc 82.031 (83.053)	lr 0.00876
Train [72][1980/3239]	Time 0.249 (0.895)	Data Time 0.001 (0.380)	Loss 2.5334 (2.5490)	Entropy 0.61137 (0.61642)	Top-1 acc 64.062 (62.430)	Top-5 acc 82.422 (83.047)	lr 0.00876
Train [72][1990/3239]	Time 0.361 (0.892)	Data Time 0.001 (0.379)	Loss 2.4381 (2.5488)	Entropy 0.61166 (0.61640)	Top-1 acc 66.016 (62.439)	Top-5 acc 83.594 (83.052)	lr 0.00876
Train [72][2000/3239]	Time 0.235 (0.902)	Data Time 0.001 (0.389)	Loss 2.6196 (2.5490)	Entropy 0.61149 (0.61638)	Top-1 acc 60.938 (62.431)	Top-5 acc 81.250 (83.043)	lr 0.00876
Train [72][2010/3239]	Time 0.246 (0.900)	Data Time 0.001 (0.387)	Loss 2.7761 (2.5490)	Entropy 0.61149 (0.61635)	Top-1 acc 54.688 (62.430)	Top-5 acc 80.859 (83.045)	lr 0.00876
Train [72][2020/3239]	Time 0.248 (0.898)	Data Time 0.001 (0.385)	Loss 2.4916 (2.5489)	Entropy 0.61147 (0.61633)	Top-1 acc 64.062 (62.436)	Top-5 acc 85.547 (83.046)	lr 0.00875
Train [72][2030/3239]	Time 0.242 (0.909)	Data Time 0.001 (0.396)	Loss 2.6606 (2.5489)	Entropy 0.61156 (0.61630)	Top-1 acc 59.375 (62.432)	Top-5 acc 80.469 (83.041)	lr 0.00875
Train [72][2040/3239]	Time 0.248 (0.906)	Data Time 0.001 (0.394)	Loss 2.5437 (2.5494)	Entropy 0.61150 (0.61628)	Top-1 acc 59.766 (62.415)	Top-5 acc 84.375 (83.032)	lr 0.00875
Train [72][2050/3239]	Time 0.246 (0.904)	Data Time 0.001 (0.392)	Loss 2.6285 (2.5496)	Entropy 0.61152 (0.61626)	Top-1 acc 57.812 (62.413)	Top-5 acc 83.203 (83.027)	lr 0.00875
Train [72][2060/3239]	Time 2.997 (0.913)	Data Time 2.725 (0.402)	Loss 2.5740 (2.5498)	Entropy 0.61145 (0.61623)	Top-1 acc 62.500 (62.412)	Top-5 acc 83.984 (83.023)	lr 0.00875
Train [72][2070/3239]	Time 0.283 (0.911)	Data Time 0.001 (0.400)	Loss 2.6490 (2.5498)	Entropy 0.61142 (0.61621)	Top-1 acc 59.375 (62.411)	Top-5 acc 83.984 (83.019)	lr 0.00875
Train [72][2080/3239]	Time 0.344 (0.909)	Data Time 0.001 (0.398)	Loss 2.3482 (2.5497)	Entropy 0.61144 (0.61619)	Top-1 acc 67.578 (62.419)	Top-5 acc 85.938 (83.018)	lr 0.00875
Train [72][2090/3239]	Time 0.232 (0.917)	Data Time 0.001 (0.407)	Loss 2.5395 (2.5496)	Entropy 0.61128 (0.61617)	Top-1 acc 66.797 (62.421)	Top-5 acc 80.859 (83.019)	lr 0.00875
Train [72][2100/3239]	Time 0.237 (0.918)	Data Time 0.001 (0.408)	Loss 2.3082 (2.5495)	Entropy 0.61120 (0.61614)	Top-1 acc 67.188 (62.426)	Top-5 acc 87.500 (83.024)	lr 0.00875
Train [72][2110/3239]	Time 0.254 (0.916)	Data Time 0.001 (0.406)	Loss 2.6823 (2.5496)	Entropy 0.61090 (0.61612)	Top-1 acc 60.156 (62.427)	Top-5 acc 80.469 (83.021)	lr 0.00875
Train [72][2120/3239]	Time 8.653 (0.917)	Data Time 8.360 (0.408)	Loss 2.4986 (2.5497)	Entropy 0.61092 (0.61609)	Top-1 acc 64.062 (62.425)	Top-5 acc 83.594 (83.018)	lr 0.00875
Train [72][2130/3239]	Time 0.233 (0.915)	Data Time 0.001 (0.406)	Loss 2.5356 (2.5496)	Entropy 0.61090 (0.61607)	Top-1 acc 64.062 (62.427)	Top-5 acc 83.203 (83.021)	lr 0.00874
Train [72][2140/3239]	Time 0.238 (0.913)	Data Time 0.001 (0.404)	Loss 2.4537 (2.5493)	Entropy 0.61082 (0.61604)	Top-1 acc 63.281 (62.435)	Top-5 acc 86.328 (83.027)	lr 0.00874
Train [72][2150/3239]	Time 0.343 (0.911)	Data Time 0.001 (0.402)	Loss 2.6490 (2.5496)	Entropy 0.61079 (0.61602)	Top-1 acc 57.812 (62.426)	Top-5 acc 82.031 (83.020)	lr 0.00874
Train [72][2160/3239]	Time 0.256 (0.914)	Data Time 0.001 (0.406)	Loss 2.5151 (2.5494)	Entropy 0.61053 (0.61600)	Top-1 acc 63.281 (62.434)	Top-5 acc 81.641 (83.021)	lr 0.00874
Train [72][2170/3239]	Time 0.238 (0.912)	Data Time 0.001 (0.404)	Loss 2.5758 (2.5496)	Entropy 0.61029 (0.61597)	Top-1 acc 58.984 (62.428)	Top-5 acc 81.641 (83.018)	lr 0.00874
Train [72][2180/3239]	Time 0.251 (0.909)	Data Time 0.001 (0.402)	Loss 2.5281 (2.5496)	Entropy 0.60996 (0.61595)	Top-1 acc 63.672 (62.431)	Top-5 acc 82.812 (83.016)	lr 0.00874
Train [72][2190/3239]	Time 0.234 (0.912)	Data Time 0.001 (0.405)	Loss 2.6947 (2.5497)	Entropy 0.61030 (0.61592)	Top-1 acc 58.203 (62.427)	Top-5 acc 78.516 (83.010)	lr 0.00874
Train [72][2200/3239]	Time 0.218 (0.910)	Data Time 0.001 (0.403)	Loss 2.7771 (2.5498)	Entropy 0.61023 (0.61589)	Top-1 acc 58.594 (62.431)	Top-5 acc 79.297 (83.004)	lr 0.00874
Train [72][2210/3239]	Time 0.232 (0.910)	Data Time 0.001 (0.404)	Loss 2.5433 (2.5496)	Entropy 0.61004 (0.61587)	Top-1 acc 62.500 (62.438)	Top-5 acc 81.250 (83.007)	lr 0.00874
Train [72][2220/3239]	Time 0.280 (0.911)	Data Time 0.002 (0.405)	Loss 2.4714 (2.5498)	Entropy 0.61003 (0.61584)	Top-1 acc 65.234 (62.438)	Top-5 acc 85.547 (83.000)	lr 0.00874
Train [72][2230/3239]	Time 0.250 (0.908)	Data Time 0.002 (0.403)	Loss 2.7049 (2.5498)	Entropy 0.61021 (0.61581)	Top-1 acc 60.156 (62.433)	Top-5 acc 82.031 (83.002)	lr 0.00873
Train [72][2240/3239]	Time 0.351 (0.908)	Data Time 0.001 (0.403)	Loss 2.4947 (2.5499)	Entropy 0.61008 (0.61579)	Top-1 acc 64.844 (62.432)	Top-5 acc 83.203 (83.000)	lr 0.00873
Train [72][2250/3239]	Time 0.318 (0.909)	Data Time 0.002 (0.404)	Loss 2.4722 (2.5499)	Entropy 0.61001 (0.61576)	Top-1 acc 66.797 (62.428)	Top-5 acc 84.766 (83.001)	lr 0.00873
Train [72][2260/3239]	Time 0.254 (0.907)	Data Time 0.002 (0.402)	Loss 2.5253 (2.5498)	Entropy 0.60979 (0.61574)	Top-1 acc 62.109 (62.429)	Top-5 acc 82.812 (83.002)	lr 0.00873
Train [72][2270/3239]	Time 0.249 (0.906)	Data Time 0.001 (0.401)	Loss 2.5792 (2.5498)	Entropy 0.60978 (0.61571)	Top-1 acc 60.156 (62.430)	Top-5 acc 83.203 (83.005)	lr 0.00873
Train [72][2280/3239]	Time 7.823 (0.907)	Data Time 7.541 (0.403)	Loss 2.6716 (2.5495)	Entropy 0.60978 (0.61569)	Top-1 acc 59.375 (62.440)	Top-5 acc 80.078 (83.007)	lr 0.00873
Train [72][2290/3239]	Time 1.381 (0.907)	Data Time 1.124 (0.403)	Loss 2.6978 (2.5496)	Entropy 0.60989 (0.61566)	Top-1 acc 62.109 (62.439)	Top-5 acc 82.031 (83.009)	lr 0.00873
Train [72][2300/3239]	Time 0.226 (0.908)	Data Time 0.001 (0.404)	Loss 2.5087 (2.5499)	Entropy 0.60983 (0.61563)	Top-1 acc 63.281 (62.429)	Top-5 acc 82.031 (83.003)	lr 0.00873
Train [72][2310/3239]	Time 0.354 (0.906)	Data Time 0.001 (0.403)	Loss 2.7897 (2.5502)	Entropy 0.60993 (0.61561)	Top-1 acc 55.859 (62.421)	Top-5 acc 76.953 (82.997)	lr 0.00873
Train [72][2320/3239]	Time 0.234 (0.911)	Data Time 0.002 (0.408)	Loss 2.4929 (2.5505)	Entropy 0.60964 (0.61558)	Top-1 acc 64.453 (62.410)	Top-5 acc 84.375 (82.992)	lr 0.00873
Train [72][2330/3239]	Time 0.237 (0.912)	Data Time 0.001 (0.409)	Loss 2.6860 (2.5502)	Entropy 0.60931 (0.61556)	Top-1 acc 57.031 (62.420)	Top-5 acc 82.031 (82.995)	lr 0.00872
Train [72][2340/3239]	Time 0.241 (0.912)	Data Time 0.001 (0.410)	Loss 2.4999 (2.5503)	Entropy 0.60923 (0.61553)	Top-1 acc 63.672 (62.414)	Top-5 acc 83.984 (82.991)	lr 0.00872
Train [72][2350/3239]	Time 0.271 (0.920)	Data Time 0.001 (0.418)	Loss 2.5950 (2.5503)	Entropy 0.60900 (0.61550)	Top-1 acc 62.500 (62.416)	Top-5 acc 80.469 (82.991)	lr 0.00872
Train [72][2360/3239]	Time 0.244 (0.919)	Data Time 0.001 (0.417)	Loss 2.4833 (2.5500)	Entropy 0.60896 (0.61548)	Top-1 acc 60.938 (62.421)	Top-5 acc 83.203 (82.990)	lr 0.00872
Train [72][2370/3239]	Time 0.258 (0.919)	Data Time 0.002 (0.417)	Loss 2.6006 (2.5501)	Entropy 0.60898 (0.61545)	Top-1 acc 58.984 (62.417)	Top-5 acc 81.250 (82.992)	lr 0.00872
Train [72][2380/3239]	Time 0.542 (0.923)	Data Time 0.001 (0.421)	Loss 2.6919 (2.5500)	Entropy 0.60901 (0.61542)	Top-1 acc 57.031 (62.417)	Top-5 acc 78.906 (82.992)	lr 0.00872
Train [72][2390/3239]	Time 0.254 (0.921)	Data Time 0.001 (0.420)	Loss 2.5987 (2.5502)	Entropy 0.60914 (0.61540)	Top-1 acc 61.328 (62.413)	Top-5 acc 83.984 (82.988)	lr 0.00872
Train [72][2400/3239]	Time 0.259 (0.923)	Data Time 0.002 (0.422)	Loss 2.4638 (2.5500)	Entropy 0.60932 (0.61537)	Top-1 acc 63.672 (62.419)	Top-5 acc 82.031 (82.989)	lr 0.00872
Train [72][2410/3239]	Time 0.230 (0.928)	Data Time 0.001 (0.427)	Loss 2.5969 (2.5501)	Entropy 0.60962 (0.61535)	Top-1 acc 60.938 (62.419)	Top-5 acc 82.812 (82.987)	lr 0.00872
Train [72][2420/3239]	Time 0.237 (0.927)	Data Time 0.001 (0.426)	Loss 2.6331 (2.5503)	Entropy 0.60997 (0.61532)	Top-1 acc 60.547 (62.410)	Top-5 acc 82.422 (82.984)	lr 0.00872
Train [72][2430/3239]	Time 0.253 (0.929)	Data Time 0.001 (0.429)	Loss 2.7610 (2.5505)	Entropy 0.61033 (0.61530)	Top-1 acc 56.250 (62.405)	Top-5 acc 80.859 (82.979)	lr 0.00872
Train [72][2440/3239]	Time 17.137 (0.935)	Data Time 16.871 (0.435)	Loss 2.6514 (2.5506)	Entropy 0.61034 (0.61528)	Top-1 acc 58.203 (62.402)	Top-5 acc 81.250 (82.977)	lr 0.00871
Train [72][2450/3239]	Time 2.156 (0.934)	Data Time 1.909 (0.434)	Loss 2.7180 (2.5506)	Entropy 0.61033 (0.61526)	Top-1 acc 59.766 (62.404)	Top-5 acc 78.906 (82.978)	lr 0.00871
Train [72][2460/3239]	Time 0.344 (0.951)	Data Time 0.002 (0.433)	Loss 2.6092 (2.5507)	Entropy 0.61040 (0.61524)	Top-1 acc 60.547 (62.401)	Top-5 acc 82.812 (82.977)	lr 0.00871
Train [72][2470/3239]	Time 0.366 (0.949)	Data Time 0.002 (0.431)	Loss 2.6844 (2.5507)	Entropy 0.61017 (0.61522)	Top-1 acc 61.719 (62.402)	Top-5 acc 78.906 (82.979)	lr 0.00871
Train [72][2480/3239]	Time 0.242 (0.947)	Data Time 0.001 (0.429)	Loss 2.6120 (2.5507)	Entropy 0.61037 (0.61520)	Top-1 acc 59.766 (62.399)	Top-5 acc 83.203 (82.978)	lr 0.00871
Train [72][2490/3239]	Time 0.253 (0.945)	Data Time 0.002 (0.427)	Loss 2.4265 (2.5508)	Entropy 0.61035 (0.61518)	Top-1 acc 66.797 (62.402)	Top-5 acc 85.156 (82.976)	lr 0.00871
Train [72][2500/3239]	Time 0.259 (0.943)	Data Time 0.001 (0.426)	Loss 2.4123 (2.5507)	Entropy 0.61017 (0.61516)	Top-1 acc 66.797 (62.403)	Top-5 acc 85.547 (82.977)	lr 0.00871
Train [72][2510/3239]	Time 0.240 (0.943)	Data Time 0.001 (0.426)	Loss 2.4455 (2.5506)	Entropy 0.61027 (0.61514)	Top-1 acc 65.234 (62.405)	Top-5 acc 83.203 (82.983)	lr 0.00871
Train [72][2520/3239]	Time 0.304 (0.946)	Data Time 0.004 (0.429)	Loss 2.4692 (2.5507)	Entropy 0.61049 (0.61512)	Top-1 acc 62.500 (62.402)	Top-5 acc 85.156 (82.985)	lr 0.00871
Train [72][2530/3239]	Time 0.238 (0.945)	Data Time 0.001 (0.428)	Loss 2.6683 (2.5507)	Entropy 0.61040 (0.61510)	Top-1 acc 59.766 (62.408)	Top-5 acc 80.078 (82.986)	lr 0.00871
Train [72][2540/3239]	Time 1.924 (0.950)	Data Time 1.670 (0.433)	Loss 2.6054 (2.5508)	Entropy 0.61044 (0.61509)	Top-1 acc 62.109 (62.406)	Top-5 acc 84.375 (82.983)	lr 0.00870
Train [72][2550/3239]	Time 0.262 (0.950)	Data Time 0.001 (0.433)	Loss 2.5167 (2.5508)	Entropy 0.61052 (0.61507)	Top-1 acc 64.062 (62.406)	Top-5 acc 83.203 (82.987)	lr 0.00870
Train [72][2560/3239]	Time 0.288 (0.951)	Data Time 0.001 (0.435)	Loss 2.3109 (2.5506)	Entropy 0.61035 (0.61505)	Top-1 acc 71.094 (62.412)	Top-5 acc 88.672 (82.990)	lr 0.00870
Train [72][2570/3239]	Time 0.255 (0.953)	Data Time 0.001 (0.437)	Loss 2.5786 (2.5506)	Entropy 0.60955 (0.61503)	Top-1 acc 62.891 (62.412)	Top-5 acc 82.812 (82.989)	lr 0.00870
Train [72][2580/3239]	Time 0.239 (0.957)	Data Time 0.002 (0.442)	Loss 2.5995 (2.5507)	Entropy 0.60930 (0.61501)	Top-1 acc 60.156 (62.413)	Top-5 acc 80.859 (82.989)	lr 0.00870
Train [72][2590/3239]	Time 0.251 (0.957)	Data Time 0.001 (0.442)	Loss 2.6282 (2.5505)	Entropy 0.60907 (0.61499)	Top-1 acc 60.156 (62.417)	Top-5 acc 81.641 (82.993)	lr 0.00870
Train [72][2600/3239]	Time 8.711 (0.959)	Data Time 8.454 (0.444)	Loss 2.5929 (2.5506)	Entropy 0.60893 (0.61496)	Top-1 acc 61.719 (62.414)	Top-5 acc 81.641 (82.989)	lr 0.00870
Train [72][2610/3239]	Time 0.995 (0.961)	Data Time 0.742 (0.447)	Loss 2.6336 (2.5505)	Entropy 0.60909 (0.61494)	Top-1 acc 60.938 (62.414)	Top-5 acc 81.641 (82.991)	lr 0.00870
Train [72][2620/3239]	Time 0.231 (0.963)	Data Time 0.001 (0.449)	Loss 2.7349 (2.5503)	Entropy 0.60896 (0.61492)	Top-1 acc 56.641 (62.419)	Top-5 acc 81.250 (82.994)	lr 0.00870
Train [72][2630/3239]	Time 0.369 (0.962)	Data Time 0.001 (0.448)	Loss 2.7368 (2.5504)	Entropy 0.60857 (0.61490)	Top-1 acc 58.594 (62.418)	Top-5 acc 80.859 (82.990)	lr 0.00870
Train [72][2640/3239]	Time 0.243 (0.966)	Data Time 0.001 (0.452)	Loss 2.5886 (2.5505)	Entropy 0.60855 (0.61487)	Top-1 acc 64.453 (62.416)	Top-5 acc 83.984 (82.989)	lr 0.00869
Train [72][2650/3239]	Time 0.228 (0.971)	Data Time 0.001 (0.457)	Loss 2.4366 (2.5503)	Entropy 0.60871 (0.61485)	Top-1 acc 71.094 (62.420)	Top-5 acc 85.156 (82.996)	lr 0.00869
Train [72][2660/3239]	Time 1.767 (0.969)	Data Time 1.504 (0.456)	Loss 2.3847 (2.5502)	Entropy 0.60859 (0.61482)	Top-1 acc 65.234 (62.421)	Top-5 acc 87.109 (82.998)	lr 0.00869
Train [72][2670/3239]	Time 0.233 (0.974)	Data Time 0.001 (0.461)	Loss 2.8456 (2.5505)	Entropy 0.60858 (0.61480)	Top-1 acc 55.859 (62.419)	Top-5 acc 79.297 (82.991)	lr 0.00869
Train [72][2680/3239]	Time 0.247 (0.976)	Data Time 0.001 (0.463)	Loss 2.5936 (2.5505)	Entropy 0.60847 (0.61478)	Top-1 acc 64.062 (62.415)	Top-5 acc 82.422 (82.992)	lr 0.00869
Train [72][2690/3239]	Time 0.227 (0.975)	Data Time 0.001 (0.463)	Loss 2.6102 (2.5506)	Entropy 0.60805 (0.61475)	Top-1 acc 61.719 (62.408)	Top-5 acc 83.203 (82.992)	lr 0.00869
Train [72][2700/3239]	Time 5.081 (0.979)	Data Time 4.723 (0.467)	Loss 2.3612 (2.5504)	Entropy 0.60803 (0.61473)	Top-1 acc 67.578 (62.411)	Top-5 acc 86.328 (82.996)	lr 0.00869
Train [72][2710/3239]	Time 0.239 (0.979)	Data Time 0.001 (0.468)	Loss 2.5741 (2.5506)	Entropy 0.60761 (0.61470)	Top-1 acc 64.844 (62.406)	Top-5 acc 82.031 (82.992)	lr 0.00869
Train [72][2720/3239]	Time 0.279 (0.980)	Data Time 0.004 (0.469)	Loss 2.4372 (2.5507)	Entropy 0.60759 (0.61468)	Top-1 acc 67.969 (62.405)	Top-5 acc 85.156 (82.988)	lr 0.00869
Train [72][2730/3239]	Time 0.236 (0.983)	Data Time 0.001 (0.472)	Loss 2.4204 (2.5507)	Entropy 0.60770 (0.61465)	Top-1 acc 69.141 (62.403)	Top-5 acc 83.594 (82.985)	lr 0.00869
Train [72][2740/3239]	Time 0.277 (0.984)	Data Time 0.001 (0.473)	Loss 2.5065 (2.5508)	Entropy 0.60752 (0.61463)	Top-1 acc 65.625 (62.402)	Top-5 acc 81.250 (82.982)	lr 0.00869
Train [72][2750/3239]	Time 0.235 (0.985)	Data Time 0.002 (0.475)	Loss 2.4586 (2.5509)	Entropy 0.60706 (0.61460)	Top-1 acc 66.797 (62.401)	Top-5 acc 83.984 (82.983)	lr 0.00868
Train [72][2760/3239]	Time 11.859 (0.990)	Data Time 11.609 (0.480)	Loss 2.7933 (2.5509)	Entropy 0.60739 (0.61457)	Top-1 acc 55.469 (62.400)	Top-5 acc 78.516 (82.981)	lr 0.00868
Train [72][2770/3239]	Time 2.398 (0.989)	Data Time 2.146 (0.479)	Loss 2.5772 (2.5508)	Entropy 0.60747 (0.61455)	Top-1 acc 62.500 (62.400)	Top-5 acc 83.203 (82.985)	lr 0.00868
Train [72][2780/3239]	Time 0.928 (0.990)	Data Time 0.682 (0.480)	Loss 2.5757 (2.5509)	Entropy 0.60735 (0.61452)	Top-1 acc 60.938 (62.397)	Top-5 acc 82.812 (82.985)	lr 0.00868
Train [72][2790/3239]	Time 0.384 (0.990)	Data Time 0.001 (0.481)	Loss 2.5089 (2.5508)	Entropy 0.60744 (0.61450)	Top-1 acc 62.891 (62.400)	Top-5 acc 84.766 (82.989)	lr 0.00868
Train [72][2800/3239]	Time 0.276 (0.993)	Data Time 0.001 (0.484)	Loss 2.5555 (2.5507)	Entropy 0.60736 (0.61447)	Top-1 acc 65.625 (62.404)	Top-5 acc 82.031 (82.989)	lr 0.00868
Train [72][2810/3239]	Time 0.238 (0.995)	Data Time 0.001 (0.486)	Loss 2.5404 (2.5508)	Entropy 0.60713 (0.61445)	Top-1 acc 60.547 (62.402)	Top-5 acc 84.766 (82.988)	lr 0.00868
Train [72][2820/3239]	Time 4.000 (0.995)	Data Time 3.752 (0.487)	Loss 2.6967 (2.5508)	Entropy 0.60731 (0.61442)	Top-1 acc 59.766 (62.401)	Top-5 acc 80.078 (82.987)	lr 0.00868
Train [72][2830/3239]	Time 0.227 (1.000)	Data Time 0.001 (0.492)	Loss 2.7759 (2.5508)	Entropy 0.60726 (0.61439)	Top-1 acc 57.812 (62.402)	Top-5 acc 79.688 (82.990)	lr 0.00868
Train [72][2840/3239]	Time 0.258 (1.004)	Data Time 0.002 (0.496)	Loss 2.6615 (2.5509)	Entropy 0.60707 (0.61437)	Top-1 acc 60.547 (62.402)	Top-5 acc 79.297 (82.988)	lr 0.00868
Train [72][2850/3239]	Time 0.233 (1.002)	Data Time 0.001 (0.495)	Loss 2.6009 (2.5510)	Entropy 0.60676 (0.61434)	Top-1 acc 63.281 (62.402)	Top-5 acc 78.516 (82.985)	lr 0.00867
Train [72][2860/3239]	Time 2.383 (1.005)	Data Time 1.992 (0.498)	Loss 2.3896 (2.5509)	Entropy 0.60692 (0.61432)	Top-1 acc 66.016 (62.405)	Top-5 acc 83.984 (82.985)	lr 0.00867
Train [72][2870/3239]	Time 0.244 (1.003)	Data Time 0.001 (0.496)	Loss 2.6959 (2.5509)	Entropy 0.60695 (0.61429)	Top-1 acc 60.938 (62.403)	Top-5 acc 77.344 (82.983)	lr 0.00867
Train [72][2880/3239]	Time 0.239 (1.006)	Data Time 0.001 (0.499)	Loss 2.7111 (2.5509)	Entropy 0.60678 (0.61427)	Top-1 acc 54.297 (62.399)	Top-5 acc 77.734 (82.981)	lr 0.00867
Train [72][2890/3239]	Time 0.240 (1.008)	Data Time 0.001 (0.502)	Loss 2.4307 (2.5507)	Entropy 0.60650 (0.61424)	Top-1 acc 66.016 (62.406)	Top-5 acc 85.547 (82.982)	lr 0.00867
Train [72][2900/3239]	Time 0.233 (1.008)	Data Time 0.001 (0.502)	Loss 2.3494 (2.5505)	Entropy 0.60645 (0.61421)	Top-1 acc 68.750 (62.413)	Top-5 acc 87.500 (82.988)	lr 0.00867
Train [72][2910/3239]	Time 0.231 (1.011)	Data Time 0.001 (0.505)	Loss 2.6120 (2.5508)	Entropy 0.60659 (0.61419)	Top-1 acc 60.156 (62.407)	Top-5 acc 80.469 (82.980)	lr 0.00867
Train [72][2920/3239]	Time 17.999 (1.015)	Data Time 17.746 (0.509)	Loss 2.4103 (2.5506)	Entropy 0.60624 (0.61416)	Top-1 acc 61.328 (62.407)	Top-5 acc 85.156 (82.980)	lr 0.00867
Train [72][2930/3239]	Time 0.257 (1.015)	Data Time 0.001 (0.510)	Loss 2.5164 (2.5508)	Entropy 0.60638 (0.61413)	Top-1 acc 63.672 (62.404)	Top-5 acc 82.812 (82.977)	lr 0.00867
Train [72][2940/3239]	Time 0.232 (1.016)	Data Time 0.001 (0.511)	Loss 2.3757 (2.5505)	Entropy 0.60617 (0.61411)	Top-1 acc 66.797 (62.415)	Top-5 acc 85.156 (82.980)	lr 0.00867
Train [72][2950/3239]	Time 0.283 (1.014)	Data Time 0.001 (0.510)	Loss 2.5362 (2.5504)	Entropy 0.60616 (0.61408)	Top-1 acc 60.547 (62.417)	Top-5 acc 82.422 (82.983)	lr 0.00867
Train [72][2960/3239]	Time 0.232 (1.020)	Data Time 0.001 (0.516)	Loss 2.4424 (2.5506)	Entropy 0.60616 (0.61405)	Top-1 acc 62.109 (62.415)	Top-5 acc 83.984 (82.979)	lr 0.00866
Train [72][2970/3239]	Time 0.237 (1.022)	Data Time 0.001 (0.518)	Loss 2.5236 (2.5506)	Entropy 0.60605 (0.61402)	Top-1 acc 66.797 (62.418)	Top-5 acc 83.203 (82.980)	lr 0.00866
Train [72][2980/3239]	Time 0.242 (1.020)	Data Time 0.001 (0.516)	Loss 2.4558 (2.5504)	Entropy 0.60648 (0.61400)	Top-1 acc 64.844 (62.420)	Top-5 acc 84.766 (82.981)	lr 0.00866
Train [72][2990/3239]	Time 0.236 (1.027)	Data Time 0.001 (0.523)	Loss 2.4581 (2.5503)	Entropy 0.60676 (0.61397)	Top-1 acc 64.062 (62.425)	Top-5 acc 85.547 (82.986)	lr 0.00866
Train [72][3000/3239]	Time 0.237 (1.029)	Data Time 0.001 (0.526)	Loss 2.6022 (2.5504)	Entropy 0.60692 (0.61395)	Top-1 acc 63.281 (62.424)	Top-5 acc 82.812 (82.984)	lr 0.00866
Train [72][3010/3239]	Time 0.278 (1.027)	Data Time 0.002 (0.525)	Loss 2.8003 (2.5504)	Entropy 0.60691 (0.61393)	Top-1 acc 55.469 (62.422)	Top-5 acc 76.172 (82.983)	lr 0.00866
Train [72][3020/3239]	Time 14.513 (1.031)	Data Time 14.160 (0.529)	Loss 2.5055 (2.5505)	Entropy 0.60672 (0.61390)	Top-1 acc 59.766 (62.422)	Top-5 acc 84.375 (82.981)	lr 0.00866
Train [72][3030/3239]	Time 0.239 (1.029)	Data Time 0.001 (0.527)	Loss 2.6243 (2.5504)	Entropy 0.60678 (0.61388)	Top-1 acc 62.500 (62.420)	Top-5 acc 82.812 (82.986)	lr 0.00866
Train [72][3040/3239]	Time 0.233 (1.031)	Data Time 0.001 (0.529)	Loss 2.5419 (2.5502)	Entropy 0.60654 (0.61386)	Top-1 acc 63.281 (62.426)	Top-5 acc 85.547 (82.991)	lr 0.00866
Train [72][3050/3239]	Time 0.237 (1.031)	Data Time 0.001 (0.529)	Loss 2.6047 (2.5503)	Entropy 0.60639 (0.61383)	Top-1 acc 58.594 (62.419)	Top-5 acc 80.469 (82.986)	lr 0.00866
Train [72][3060/3239]	Time 0.228 (1.032)	Data Time 0.001 (0.531)	Loss 2.4294 (2.5504)	Entropy 0.60613 (0.61381)	Top-1 acc 64.453 (62.419)	Top-5 acc 85.547 (82.986)	lr 0.00865
Train [72][3070/3239]	Time 0.265 (1.035)	Data Time 0.001 (0.534)	Loss 2.5179 (2.5502)	Entropy 0.60591 (0.61378)	Top-1 acc 64.062 (62.423)	Top-5 acc 83.984 (82.990)	lr 0.00865
Train [72][3080/3239]	Time 4.295 (1.034)	Data Time 4.019 (0.533)	Loss 2.4936 (2.5502)	Entropy 0.60601 (0.61376)	Top-1 acc 65.234 (62.424)	Top-5 acc 85.547 (82.991)	lr 0.00865
Train [72][3090/3239]	Time 0.417 (1.037)	Data Time 0.002 (0.536)	Loss 2.3229 (2.5502)	Entropy 0.60631 (0.61373)	Top-1 acc 67.969 (62.425)	Top-5 acc 87.891 (82.992)	lr 0.00865
Train [72][3100/3239]	Time 0.235 (1.041)	Data Time 0.001 (0.540)	Loss 2.5485 (2.5503)	Entropy 0.60632 (0.61371)	Top-1 acc 60.938 (62.424)	Top-5 acc 82.031 (82.989)	lr 0.00865
Train [72][3110/3239]	Time 0.566 (1.054)	Data Time 0.004 (0.538)	Loss 2.5227 (2.5502)	Entropy 0.60632 (0.61368)	Top-1 acc 64.844 (62.424)	Top-5 acc 85.156 (82.992)	lr 0.00865
Train [72][3120/3239]	Time 0.251 (1.052)	Data Time 0.002 (0.537)	Loss 2.4968 (2.5502)	Entropy 0.60630 (0.61366)	Top-1 acc 62.500 (62.424)	Top-5 acc 83.984 (82.993)	lr 0.00865
Train [72][3130/3239]	Time 0.240 (1.050)	Data Time 0.002 (0.535)	Loss 2.7256 (2.5503)	Entropy 0.60651 (0.61364)	Top-1 acc 54.297 (62.421)	Top-5 acc 80.078 (82.994)	lr 0.00865
Train [72][3140/3239]	Time 0.240 (1.048)	Data Time 0.001 (0.533)	Loss 2.3878 (2.5503)	Entropy 0.60649 (0.61361)	Top-1 acc 68.750 (62.422)	Top-5 acc 85.547 (82.995)	lr 0.00865
Train [72][3150/3239]	Time 0.248 (1.047)	Data Time 0.001 (0.533)	Loss 2.6784 (2.5505)	Entropy 0.60632 (0.61359)	Top-1 acc 60.938 (62.419)	Top-5 acc 80.859 (82.991)	lr 0.00865
Train [72][3160/3239]	Time 0.243 (1.049)	Data Time 0.001 (0.535)	Loss 2.6053 (2.5505)	Entropy 0.60626 (0.61357)	Top-1 acc 58.594 (62.414)	Top-5 acc 85.547 (82.992)	lr 0.00864
Train [72][3170/3239]	Time 0.260 (1.047)	Data Time 0.001 (0.533)	Loss 2.4722 (2.5504)	Entropy 0.60645 (0.61355)	Top-1 acc 65.234 (62.417)	Top-5 acc 83.984 (82.991)	lr 0.00864
Train [72][3180/3239]	Time 9.769 (1.051)	Data Time 9.363 (0.537)	Loss 2.7549 (2.5503)	Entropy 0.60658 (0.61352)	Top-1 acc 58.594 (62.419)	Top-5 acc 79.688 (82.993)	lr 0.00864
Train [72][3190/3239]	Time 0.246 (1.049)	Data Time 0.000 (0.536)	Loss 2.3372 (2.5503)	Entropy 0.60671 (0.61350)	Top-1 acc 67.969 (62.419)	Top-5 acc 86.328 (82.994)	lr 0.00864
Train [72][3200/3239]	Time 0.231 (1.052)	Data Time 0.000 (0.538)	Loss 2.6294 (2.5501)	Entropy 0.60683 (0.61348)	Top-1 acc 60.156 (62.424)	Top-5 acc 83.203 (82.999)	lr 0.00864
Train [72][3210/3239]	Time 0.308 (1.052)	Data Time 0.000 (0.538)	Loss 2.4009 (2.5502)	Entropy 0.60700 (0.61346)	Top-1 acc 64.453 (62.424)	Top-5 acc 86.328 (82.999)	lr 0.00864
Train [72][3220/3239]	Time 0.234 (1.052)	Data Time 0.000 (0.539)	Loss 2.7387 (2.5501)	Entropy 0.60699 (0.61344)	Top-1 acc 59.375 (62.424)	Top-5 acc 80.078 (83.000)	lr 0.00864
Train [72][3230/3239]	Time 0.253 (1.054)	Data Time 0.000 (0.541)	Loss 2.6347 (2.5499)	Entropy 0.60683 (0.61342)	Top-1 acc 56.250 (62.426)	Top-5 acc 83.203 (83.003)	lr 0.00864
Train [72][3239/3239]	Time 0.955 (1.052)	Data Time 0.000 (0.540)	Loss 2.8923 (2.5499)	Entropy 0.60689 (0.61340)	Top-1 acc 55.556 (62.426)	Top-5 acc 75.309 (83.004)	lr 0.00864
==========Valid [72/120]	loss 1.342	top-1 acc 69.065 (69.092)	top-5 acc 88.490	Train top-1 62.426	top-5 83.004	Entropy 0.60689	Latency-None: 0.000ms	Flops: 539.00M
Train [73][0/3239]	Time 42.344 (42.344)	Data Time 41.455 (41.455)	Loss 2.5449 (2.5449)	Entropy 0.60653 (0.60653)	Top-1 acc 63.672 (63.672)	Top-5 acc 81.641 (81.641)	lr 0.00864
Train [73][10/3239]	Time 0.322 (4.342)	Data Time 0.001 (3.774)	Loss 2.5415 (2.4917)	Entropy 0.60649 (0.60658)	Top-1 acc 58.984 (63.814)	Top-5 acc 82.031 (83.771)	lr 0.00864
Train [73][20/3239]	Time 0.246 (2.475)	Data Time 0.001 (1.978)	Loss 2.4970 (2.5185)	Entropy 0.60632 (0.60649)	Top-1 acc 61.719 (62.872)	Top-5 acc 83.594 (83.426)	lr 0.00864
Train [73][30/3239]	Time 0.257 (1.955)	Data Time 0.002 (1.340)	Loss 2.6396 (2.5142)	Entropy 0.60638 (0.60645)	Top-1 acc 60.938 (63.206)	Top-5 acc 80.859 (83.531)	lr 0.00863
Train [73][40/3239]	Time 0.229 (1.585)	Data Time 0.001 (1.014)	Loss 2.5060 (2.5101)	Entropy 0.60635 (0.60644)	Top-1 acc 64.844 (63.510)	Top-5 acc 83.203 (83.546)	lr 0.00863
Train [73][50/3239]	Time 0.252 (1.355)	Data Time 0.001 (0.815)	Loss 2.5293 (2.5174)	Entropy 0.60653 (0.60643)	Top-1 acc 60.156 (63.228)	Top-5 acc 83.594 (83.165)	lr 0.00863
Train [73][60/3239]	Time 0.283 (1.207)	Data Time 0.001 (0.682)	Loss 2.5769 (2.5183)	Entropy 0.60590 (0.60642)	Top-1 acc 60.938 (63.204)	Top-5 acc 83.594 (83.197)	lr 0.00863
Train [73][70/3239]	Time 0.246 (1.104)	Data Time 0.001 (0.586)	Loss 2.8447 (2.5219)	Entropy 0.60568 (0.60634)	Top-1 acc 55.078 (63.122)	Top-5 acc 79.297 (83.231)	lr 0.00863
Train [73][80/3239]	Time 0.336 (1.022)	Data Time 0.001 (0.514)	Loss 2.5394 (2.5171)	Entropy 0.60581 (0.60627)	Top-1 acc 60.547 (63.223)	Top-5 acc 81.250 (83.295)	lr 0.00863
Train [73][90/3239]	Time 0.256 (0.958)	Data Time 0.001 (0.458)	Loss 2.6002 (2.5200)	Entropy 0.60573 (0.60621)	Top-1 acc 59.766 (63.204)	Top-5 acc 84.375 (83.336)	lr 0.00863
Train [73][100/3239]	Time 0.241 (0.912)	Data Time 0.001 (0.413)	Loss 2.5873 (2.5196)	Entropy 0.60549 (0.60616)	Top-1 acc 60.156 (63.289)	Top-5 acc 82.031 (83.404)	lr 0.00863
Train [73][110/3239]	Time 2.309 (0.892)	Data Time 2.071 (0.399)	Loss 2.4960 (2.5174)	Entropy 0.60546 (0.60609)	Top-1 acc 60.938 (63.207)	Top-5 acc 85.938 (83.499)	lr 0.00863
Train [73][120/3239]	Time 0.258 (0.852)	Data Time 0.002 (0.366)	Loss 2.4754 (2.5162)	Entropy 0.60541 (0.60604)	Top-1 acc 64.844 (63.259)	Top-5 acc 85.547 (83.532)	lr 0.00863
Train [73][130/3239]	Time 0.249 (0.835)	Data Time 0.001 (0.350)	Loss 2.4410 (2.5120)	Entropy 0.60575 (0.60600)	Top-1 acc 66.016 (63.350)	Top-5 acc 86.328 (83.600)	lr 0.00862
Train [73][140/3239]	Time 0.232 (0.823)	Data Time 0.001 (0.337)	Loss 2.4333 (2.5138)	Entropy 0.60575 (0.60599)	Top-1 acc 64.062 (63.298)	Top-5 acc 85.547 (83.580)	lr 0.00862
Train [73][150/3239]	Time 0.244 (0.800)	Data Time 0.001 (0.314)	Loss 2.5246 (2.5112)	Entropy 0.60581 (0.60597)	Top-1 acc 62.891 (63.359)	Top-5 acc 84.375 (83.669)	lr 0.00862
Train [73][160/3239]	Time 0.241 (0.781)	Data Time 0.001 (0.295)	Loss 2.5470 (2.5121)	Entropy 0.60599 (0.60596)	Top-1 acc 60.938 (63.327)	Top-5 acc 83.594 (83.659)	lr 0.00862
Train [73][170/3239]	Time 0.336 (0.770)	Data Time 0.002 (0.288)	Loss 2.5105 (2.5133)	Entropy 0.60643 (0.60597)	Top-1 acc 63.281 (63.295)	Top-5 acc 83.203 (83.610)	lr 0.00862
Train [73][180/3239]	Time 0.276 (0.759)	Data Time 0.001 (0.280)	Loss 2.5571 (2.5152)	Entropy 0.60652 (0.60599)	Top-1 acc 65.234 (63.279)	Top-5 acc 80.859 (83.574)	lr 0.00862
Train [73][190/3239]	Time 0.256 (0.744)	Data Time 0.001 (0.265)	Loss 2.5923 (2.5159)	Entropy 0.60639 (0.60602)	Top-1 acc 58.594 (63.285)	Top-5 acc 83.203 (83.596)	lr 0.00862
Train [73][200/3239]	Time 0.232 (0.730)	Data Time 0.001 (0.253)	Loss 2.5097 (2.5166)	Entropy 0.60615 (0.60603)	Top-1 acc 59.766 (63.242)	Top-5 acc 84.766 (83.637)	lr 0.00862
Train [73][210/3239]	Time 0.246 (0.716)	Data Time 0.001 (0.241)	Loss 2.5454 (2.5169)	Entropy 0.60603 (0.60604)	Top-1 acc 59.766 (63.202)	Top-5 acc 85.156 (83.629)	lr 0.00862
Train [73][220/3239]	Time 0.244 (0.704)	Data Time 0.001 (0.230)	Loss 2.4838 (2.5217)	Entropy 0.60626 (0.60604)	Top-1 acc 67.188 (63.113)	Top-5 acc 83.203 (83.516)	lr 0.00862
Train [73][230/3239]	Time 0.249 (0.706)	Data Time 0.001 (0.234)	Loss 2.5045 (2.5258)	Entropy 0.60600 (0.60604)	Top-1 acc 63.672 (63.009)	Top-5 acc 87.109 (83.438)	lr 0.00862
Train [73][240/3239]	Time 0.353 (0.700)	Data Time 0.001 (0.230)	Loss 2.5681 (2.5260)	Entropy 0.60641 (0.60604)	Top-1 acc 63.281 (62.962)	Top-5 acc 82.812 (83.424)	lr 0.00861
Train [73][250/3239]	Time 0.261 (0.690)	Data Time 0.001 (0.221)	Loss 2.4773 (2.5253)	Entropy 0.60653 (0.60606)	Top-1 acc 62.500 (63.020)	Top-5 acc 85.938 (83.438)	lr 0.00861
Train [73][260/3239]	Time 0.237 (0.681)	Data Time 0.001 (0.212)	Loss 2.5140 (2.5257)	Entropy 0.60629 (0.60608)	Top-1 acc 61.719 (62.956)	Top-5 acc 85.156 (83.465)	lr 0.00861
Train [73][270/3239]	Time 1.945 (0.679)	Data Time 1.695 (0.211)	Loss 2.3427 (2.5271)	Entropy 0.60604 (0.60608)	Top-1 acc 65.625 (62.902)	Top-5 acc 87.891 (83.457)	lr 0.00861
Train [73][280/3239]	Time 0.226 (0.670)	Data Time 0.001 (0.203)	Loss 2.5006 (2.5295)	Entropy 0.60629 (0.60608)	Top-1 acc 62.891 (62.823)	Top-5 acc 83.203 (83.448)	lr 0.00861
Train [73][290/3239]	Time 0.237 (0.675)	Data Time 0.001 (0.211)	Loss 2.5437 (2.5311)	Entropy 0.60640 (0.60609)	Top-1 acc 63.281 (62.783)	Top-5 acc 82.812 (83.415)	lr 0.00861
Train [73][300/3239]	Time 0.251 (0.667)	Data Time 0.001 (0.204)	Loss 2.4530 (2.5313)	Entropy 0.60649 (0.60611)	Top-1 acc 65.234 (62.780)	Top-5 acc 84.375 (83.422)	lr 0.00861
Train [73][310/3239]	Time 0.236 (0.669)	Data Time 0.001 (0.206)	Loss 2.4351 (2.5316)	Entropy 0.60676 (0.60612)	Top-1 acc 65.234 (62.771)	Top-5 acc 82.812 (83.400)	lr 0.00861
Train [73][320/3239]	Time 0.271 (0.662)	Data Time 0.001 (0.199)	Loss 2.4610 (2.5314)	Entropy 0.60700 (0.60614)	Top-1 acc 64.844 (62.760)	Top-5 acc 84.375 (83.377)	lr 0.00861
Train [73][330/3239]	Time 0.238 (0.654)	Data Time 0.001 (0.193)	Loss 2.6017 (2.5319)	Entropy 0.60708 (0.60617)	Top-1 acc 60.547 (62.720)	Top-5 acc 81.641 (83.346)	lr 0.00861
Train [73][340/3239]	Time 0.228 (0.658)	Data Time 0.001 (0.198)	Loss 2.5243 (2.5311)	Entropy 0.60691 (0.60620)	Top-1 acc 67.969 (62.752)	Top-5 acc 83.203 (83.358)	lr 0.00860
Train [73][350/3239]	Time 0.303 (0.653)	Data Time 0.001 (0.193)	Loss 2.5266 (2.5320)	Entropy 0.60679 (0.60621)	Top-1 acc 60.938 (62.744)	Top-5 acc 84.375 (83.356)	lr 0.00860
Train [73][360/3239]	Time 0.254 (0.647)	Data Time 0.001 (0.188)	Loss 2.4382 (2.5296)	Entropy 0.60632 (0.60623)	Top-1 acc 67.188 (62.820)	Top-5 acc 84.766 (83.387)	lr 0.00860
Train [73][370/3239]	Time 0.235 (0.643)	Data Time 0.001 (0.184)	Loss 2.5610 (2.5304)	Entropy 0.60634 (0.60623)	Top-1 acc 64.844 (62.803)	Top-5 acc 80.859 (83.348)	lr 0.00860
Train [73][380/3239]	Time 0.302 (0.639)	Data Time 0.003 (0.180)	Loss 2.5594 (2.5328)	Entropy 0.60622 (0.60623)	Top-1 acc 63.672 (62.761)	Top-5 acc 82.812 (83.313)	lr 0.00860
Train [73][390/3239]	Time 0.248 (0.637)	Data Time 0.001 (0.178)	Loss 2.7218 (2.5338)	Entropy 0.60643 (0.60623)	Top-1 acc 58.984 (62.754)	Top-5 acc 80.859 (83.290)	lr 0.00860
Train [73][400/3239]	Time 0.350 (0.640)	Data Time 0.001 (0.182)	Loss 2.5806 (2.5344)	Entropy 0.60633 (0.60624)	Top-1 acc 62.109 (62.731)	Top-5 acc 83.203 (83.279)	lr 0.00860
Train [73][410/3239]	Time 0.261 (0.635)	Data Time 0.001 (0.178)	Loss 2.5051 (2.5340)	Entropy 0.60615 (0.60623)	Top-1 acc 64.453 (62.747)	Top-5 acc 80.859 (83.275)	lr 0.00860
Train [73][420/3239]	Time 0.283 (0.639)	Data Time 0.001 (0.182)	Loss 2.7224 (2.5351)	Entropy 0.60620 (0.60623)	Top-1 acc 58.984 (62.726)	Top-5 acc 81.250 (83.270)	lr 0.00860
Train [73][430/3239]	Time 0.247 (0.635)	Data Time 0.001 (0.178)	Loss 2.5382 (2.5342)	Entropy 0.60649 (0.60623)	Top-1 acc 63.281 (62.746)	Top-5 acc 82.422 (83.271)	lr 0.00860
Train [73][440/3239]	Time 0.246 (0.630)	Data Time 0.001 (0.174)	Loss 2.5038 (2.5348)	Entropy 0.60672 (0.60624)	Top-1 acc 62.500 (62.717)	Top-5 acc 83.594 (83.247)	lr 0.00860
Train [73][450/3239]	Time 0.236 (0.633)	Data Time 0.001 (0.177)	Loss 2.8033 (2.5341)	Entropy 0.60643 (0.60625)	Top-1 acc 56.250 (62.742)	Top-5 acc 79.297 (83.258)	lr 0.00859
Train [73][460/3239]	Time 0.252 (0.628)	Data Time 0.001 (0.173)	Loss 2.6992 (2.5343)	Entropy 0.60621 (0.60625)	Top-1 acc 58.203 (62.740)	Top-5 acc 78.125 (83.251)	lr 0.00859
Train [73][470/3239]	Time 0.324 (0.626)	Data Time 0.001 (0.173)	Loss 2.5601 (2.5343)	Entropy 0.60596 (0.60625)	Top-1 acc 59.766 (62.760)	Top-5 acc 82.422 (83.245)	lr 0.00859
Train [73][480/3239]	Time 7.864 (0.638)	Data Time 7.566 (0.185)	Loss 2.5815 (2.5342)	Entropy 0.60564 (0.60624)	Top-1 acc 61.328 (62.743)	Top-5 acc 82.812 (83.240)	lr 0.00859
Train [73][490/3239]	Time 0.242 (0.634)	Data Time 0.001 (0.181)	Loss 2.6027 (2.5339)	Entropy 0.60580 (0.60622)	Top-1 acc 61.328 (62.743)	Top-5 acc 82.812 (83.242)	lr 0.00859
Train [73][500/3239]	Time 0.273 (0.630)	Data Time 0.001 (0.177)	Loss 2.6463 (2.5348)	Entropy 0.60548 (0.60622)	Top-1 acc 59.375 (62.728)	Top-5 acc 78.125 (83.219)	lr 0.00859
Train [73][510/3239]	Time 0.240 (0.627)	Data Time 0.002 (0.174)	Loss 2.5956 (2.5349)	Entropy 0.60547 (0.60620)	Top-1 acc 60.156 (62.719)	Top-5 acc 81.641 (83.215)	lr 0.00859
Train [73][520/3239]	Time 0.225 (0.631)	Data Time 0.001 (0.178)	Loss 2.6343 (2.5345)	Entropy 0.60543 (0.60619)	Top-1 acc 60.156 (62.733)	Top-5 acc 82.422 (83.217)	lr 0.00859
Train [73][530/3239]	Time 0.262 (0.720)	Data Time 0.003 (0.175)	Loss 2.6476 (2.5346)	Entropy 0.60564 (0.60618)	Top-1 acc 58.984 (62.724)	Top-5 acc 80.859 (83.213)	lr 0.00859
Train [73][540/3239]	Time 0.244 (0.715)	Data Time 0.002 (0.172)	Loss 2.4705 (2.5342)	Entropy 0.60564 (0.60617)	Top-1 acc 60.938 (62.717)	Top-5 acc 85.938 (83.217)	lr 0.00859
Train [73][550/3239]	Time 0.249 (0.710)	Data Time 0.001 (0.168)	Loss 2.5671 (2.5338)	Entropy 0.60579 (0.60616)	Top-1 acc 64.453 (62.730)	Top-5 acc 83.984 (83.232)	lr 0.00858
Train [73][560/3239]	Time 0.365 (0.705)	Data Time 0.002 (0.165)	Loss 2.6048 (2.5331)	Entropy 0.60568 (0.60615)	Top-1 acc 60.156 (62.744)	Top-5 acc 82.031 (83.250)	lr 0.00858
Train [73][570/3239]	Time 0.263 (0.701)	Data Time 0.001 (0.163)	Loss 2.4437 (2.5323)	Entropy 0.60586 (0.60614)	Top-1 acc 64.062 (62.753)	Top-5 acc 84.766 (83.254)	lr 0.00858
Train [73][580/3239]	Time 0.255 (0.697)	Data Time 0.001 (0.160)	Loss 2.7214 (2.5316)	Entropy 0.60623 (0.60614)	Top-1 acc 58.594 (62.779)	Top-5 acc 77.344 (83.266)	lr 0.00858
Train [73][590/3239]	Time 0.290 (0.693)	Data Time 0.001 (0.157)	Loss 2.4558 (2.5315)	Entropy 0.60635 (0.60614)	Top-1 acc 63.281 (62.777)	Top-5 acc 84.375 (83.271)	lr 0.00858
Train [73][600/3239]	Time 0.261 (0.689)	Data Time 0.001 (0.155)	Loss 2.7128 (2.5330)	Entropy 0.60629 (0.60614)	Top-1 acc 60.547 (62.752)	Top-5 acc 80.859 (83.247)	lr 0.00858
Train [73][610/3239]	Time 0.247 (0.686)	Data Time 0.001 (0.152)	Loss 2.5286 (2.5332)	Entropy 0.60629 (0.60615)	Top-1 acc 61.328 (62.751)	Top-5 acc 83.203 (83.245)	lr 0.00858
Train [73][620/3239]	Time 0.249 (0.682)	Data Time 0.001 (0.150)	Loss 2.5105 (2.5335)	Entropy 0.60650 (0.60615)	Top-1 acc 59.766 (62.749)	Top-5 acc 85.938 (83.246)	lr 0.00858
Train [73][630/3239]	Time 0.371 (0.678)	Data Time 0.001 (0.147)	Loss 2.6539 (2.5335)	Entropy 0.60583 (0.60615)	Top-1 acc 60.156 (62.748)	Top-5 acc 81.641 (83.250)	lr 0.00858
Train [73][640/3239]	Time 0.264 (0.675)	Data Time 0.002 (0.145)	Loss 2.4980 (2.5331)	Entropy 0.60580 (0.60615)	Top-1 acc 64.062 (62.762)	Top-5 acc 86.328 (83.249)	lr 0.00858
Train [73][650/3239]	Time 0.297 (0.671)	Data Time 0.001 (0.143)	Loss 2.3037 (2.5319)	Entropy 0.60581 (0.60614)	Top-1 acc 68.750 (62.790)	Top-5 acc 85.547 (83.266)	lr 0.00857
Train [73][660/3239]	Time 0.258 (0.674)	Data Time 0.001 (0.146)	Loss 2.4851 (2.5323)	Entropy 0.60537 (0.60613)	Top-1 acc 66.016 (62.790)	Top-5 acc 86.719 (83.268)	lr 0.00857
Train [73][670/3239]	Time 0.260 (0.671)	Data Time 0.001 (0.144)	Loss 2.6875 (2.5322)	Entropy 0.60504 (0.60612)	Top-1 acc 58.594 (62.793)	Top-5 acc 82.812 (83.283)	lr 0.00857
Train [73][680/3239]	Time 0.246 (0.672)	Data Time 0.001 (0.146)	Loss 2.7361 (2.5323)	Entropy 0.60535 (0.60611)	Top-1 acc 57.031 (62.786)	Top-5 acc 77.734 (83.274)	lr 0.00857
Train [73][690/3239]	Time 0.250 (0.673)	Data Time 0.001 (0.148)	Loss 2.6989 (2.5321)	Entropy 0.60572 (0.60610)	Top-1 acc 59.375 (62.801)	Top-5 acc 81.641 (83.277)	lr 0.00857
Train [73][700/3239]	Time 1.259 (0.672)	Data Time 1.001 (0.147)	Loss 2.3696 (2.5316)	Entropy 0.60577 (0.60609)	Top-1 acc 69.141 (62.816)	Top-5 acc 87.500 (83.289)	lr 0.00857
Train [73][710/3239]	Time 0.282 (0.679)	Data Time 0.003 (0.155)	Loss 2.6022 (2.5319)	Entropy 0.60585 (0.60609)	Top-1 acc 59.375 (62.807)	Top-5 acc 80.469 (83.288)	lr 0.00857
Train [73][720/3239]	Time 0.417 (0.677)	Data Time 0.035 (0.155)	Loss 2.6009 (2.5318)	Entropy 0.60594 (0.60608)	Top-1 acc 60.547 (62.801)	Top-5 acc 81.250 (83.295)	lr 0.00857
Train [73][730/3239]	Time 0.274 (0.675)	Data Time 0.001 (0.153)	Loss 2.5003 (2.5321)	Entropy 0.60603 (0.60608)	Top-1 acc 65.625 (62.809)	Top-5 acc 83.984 (83.284)	lr 0.00857
Train [73][740/3239]	Time 0.247 (0.679)	Data Time 0.001 (0.159)	Loss 2.5214 (2.5310)	Entropy 0.60603 (0.60608)	Top-1 acc 61.328 (62.838)	Top-5 acc 82.422 (83.305)	lr 0.00857
Train [73][750/3239]	Time 4.152 (0.682)	Data Time 3.905 (0.162)	Loss 2.4347 (2.5312)	Entropy 0.60651 (0.60608)	Top-1 acc 66.797 (62.837)	Top-5 acc 82.812 (83.307)	lr 0.00857
Train [73][760/3239]	Time 0.246 (0.678)	Data Time 0.001 (0.160)	Loss 2.3695 (2.5309)	Entropy 0.60657 (0.60609)	Top-1 acc 64.844 (62.840)	Top-5 acc 87.500 (83.324)	lr 0.00856
Train [73][770/3239]	Time 0.331 (0.679)	Data Time 0.001 (0.161)	Loss 2.4354 (2.5312)	Entropy 0.60657 (0.60610)	Top-1 acc 62.891 (62.818)	Top-5 acc 83.594 (83.318)	lr 0.00856
Train [73][780/3239]	Time 0.237 (0.676)	Data Time 0.001 (0.159)	Loss 2.3917 (2.5309)	Entropy 0.60676 (0.60610)	Top-1 acc 64.062 (62.827)	Top-5 acc 87.500 (83.321)	lr 0.00856
Train [73][790/3239]	Time 0.340 (0.677)	Data Time 0.001 (0.162)	Loss 2.4620 (2.5303)	Entropy 0.60661 (0.60611)	Top-1 acc 60.547 (62.847)	Top-5 acc 83.984 (83.332)	lr 0.00856
Train [73][800/3239]	Time 0.229 (0.681)	Data Time 0.001 (0.166)	Loss 2.5785 (2.5311)	Entropy 0.60655 (0.60612)	Top-1 acc 64.062 (62.840)	Top-5 acc 80.859 (83.310)	lr 0.00856
Train [73][810/3239]	Time 3.154 (0.682)	Data Time 2.905 (0.168)	Loss 2.5168 (2.5314)	Entropy 0.60638 (0.60612)	Top-1 acc 62.500 (62.838)	Top-5 acc 83.594 (83.309)	lr 0.00856
Train [73][820/3239]	Time 0.249 (0.679)	Data Time 0.001 (0.166)	Loss 2.4861 (2.5317)	Entropy 0.60638 (0.60612)	Top-1 acc 61.719 (62.828)	Top-5 acc 85.547 (83.300)	lr 0.00856
Train [73][830/3239]	Time 0.243 (0.680)	Data Time 0.001 (0.168)	Loss 2.3735 (2.5321)	Entropy 0.60604 (0.60613)	Top-1 acc 67.578 (62.819)	Top-5 acc 87.500 (83.296)	lr 0.00856
Train [73][840/3239]	Time 0.235 (0.677)	Data Time 0.001 (0.166)	Loss 2.5866 (2.5328)	Entropy 0.60638 (0.60613)	Top-1 acc 60.938 (62.806)	Top-5 acc 83.594 (83.287)	lr 0.00856
Train [73][850/3239]	Time 0.242 (0.681)	Data Time 0.001 (0.171)	Loss 2.5230 (2.5328)	Entropy 0.60659 (0.60613)	Top-1 acc 67.578 (62.808)	Top-5 acc 82.422 (83.291)	lr 0.00856
Train [73][860/3239]	Time 0.232 (0.680)	Data Time 0.001 (0.170)	Loss 2.6212 (2.5332)	Entropy 0.60674 (0.60614)	Top-1 acc 62.500 (62.797)	Top-5 acc 83.594 (83.282)	lr 0.00855
Train [73][870/3239]	Time 0.234 (0.677)	Data Time 0.001 (0.168)	Loss 2.5324 (2.5331)	Entropy 0.60695 (0.60614)	Top-1 acc 64.453 (62.794)	Top-5 acc 82.812 (83.288)	lr 0.00855
Train [73][880/3239]	Time 0.729 (0.683)	Data Time 0.458 (0.175)	Loss 2.3569 (2.5325)	Entropy 0.60717 (0.60615)	Top-1 acc 67.188 (62.815)	Top-5 acc 85.938 (83.298)	lr 0.00855
Train [73][890/3239]	Time 0.282 (0.682)	Data Time 0.005 (0.176)	Loss 2.4769 (2.5326)	Entropy 0.60700 (0.60616)	Top-1 acc 64.062 (62.803)	Top-5 acc 83.984 (83.299)	lr 0.00855
Train [73][900/3239]	Time 0.260 (0.680)	Data Time 0.001 (0.174)	Loss 2.9062 (2.5329)	Entropy 0.60672 (0.60617)	Top-1 acc 56.250 (62.803)	Top-5 acc 76.172 (83.294)	lr 0.00855
Train [73][910/3239]	Time 0.228 (0.685)	Data Time 0.001 (0.180)	Loss 2.6497 (2.5341)	Entropy 0.60658 (0.60618)	Top-1 acc 60.938 (62.779)	Top-5 acc 81.641 (83.281)	lr 0.00855
Train [73][920/3239]	Time 0.240 (0.682)	Data Time 0.001 (0.178)	Loss 2.4739 (2.5349)	Entropy 0.60652 (0.60619)	Top-1 acc 63.672 (62.760)	Top-5 acc 85.156 (83.272)	lr 0.00855
Train [73][930/3239]	Time 0.240 (0.685)	Data Time 0.001 (0.181)	Loss 2.4519 (2.5350)	Entropy 0.60637 (0.60619)	Top-1 acc 61.328 (62.762)	Top-5 acc 84.375 (83.266)	lr 0.00855
Train [73][940/3239]	Time 4.201 (0.691)	Data Time 3.945 (0.188)	Loss 2.5489 (2.5353)	Entropy 0.60615 (0.60619)	Top-1 acc 62.891 (62.753)	Top-5 acc 84.375 (83.259)	lr 0.00855
Train [73][950/3239]	Time 0.340 (0.690)	Data Time 0.001 (0.188)	Loss 2.4396 (2.5349)	Entropy 0.60625 (0.60619)	Top-1 acc 64.453 (62.755)	Top-5 acc 85.156 (83.270)	lr 0.00855
Train [73][960/3239]	Time 0.222 (0.691)	Data Time 0.001 (0.190)	Loss 2.6259 (2.5352)	Entropy 0.60612 (0.60619)	Top-1 acc 60.938 (62.739)	Top-5 acc 79.297 (83.254)	lr 0.00855
Train [73][970/3239]	Time 0.243 (0.690)	Data Time 0.001 (0.190)	Loss 2.4865 (2.5355)	Entropy 0.60623 (0.60619)	Top-1 acc 66.797 (62.737)	Top-5 acc 83.594 (83.251)	lr 0.00854
Train [73][980/3239]	Time 0.235 (0.690)	Data Time 0.001 (0.190)	Loss 2.6080 (2.5354)	Entropy 0.60626 (0.60619)	Top-1 acc 59.766 (62.741)	Top-5 acc 82.422 (83.255)	lr 0.00854
Train [73][990/3239]	Time 0.237 (0.694)	Data Time 0.001 (0.195)	Loss 2.5530 (2.5357)	Entropy 0.60615 (0.60619)	Top-1 acc 61.328 (62.738)	Top-5 acc 81.250 (83.249)	lr 0.00854
Train [73][1000/3239]	Time 0.289 (0.695)	Data Time 0.001 (0.197)	Loss 2.6480 (2.5362)	Entropy 0.60619 (0.60619)	Top-1 acc 62.891 (62.734)	Top-5 acc 81.250 (83.237)	lr 0.00854
Train [73][1010/3239]	Time 0.246 (0.696)	Data Time 0.001 (0.198)	Loss 2.4838 (2.5358)	Entropy 0.60622 (0.60619)	Top-1 acc 66.797 (62.755)	Top-5 acc 85.547 (83.241)	lr 0.00854
Train [73][1020/3239]	Time 0.373 (0.698)	Data Time 0.001 (0.201)	Loss 2.7455 (2.5363)	Entropy 0.60651 (0.60619)	Top-1 acc 57.812 (62.748)	Top-5 acc 77.344 (83.233)	lr 0.00854
Train [73][1030/3239]	Time 0.274 (0.695)	Data Time 0.001 (0.199)	Loss 2.3524 (2.5359)	Entropy 0.60635 (0.60619)	Top-1 acc 68.359 (62.752)	Top-5 acc 86.328 (83.250)	lr 0.00854
Train [73][1040/3239]	Time 0.244 (0.698)	Data Time 0.001 (0.203)	Loss 2.5080 (2.5358)	Entropy 0.60628 (0.60620)	Top-1 acc 61.719 (62.752)	Top-5 acc 83.203 (83.250)	lr 0.00854
Train [73][1050/3239]	Time 0.285 (0.701)	Data Time 0.001 (0.206)	Loss 2.4440 (2.5357)	Entropy 0.60649 (0.60620)	Top-1 acc 67.578 (62.758)	Top-5 acc 84.375 (83.243)	lr 0.00854
Train [73][1060/3239]	Time 0.232 (0.699)	Data Time 0.001 (0.204)	Loss 2.5410 (2.5360)	Entropy 0.60603 (0.60620)	Top-1 acc 61.328 (62.750)	Top-5 acc 83.594 (83.240)	lr 0.00854
Train [73][1070/3239]	Time 0.234 (0.707)	Data Time 0.002 (0.213)	Loss 2.5118 (2.5363)	Entropy 0.60600 (0.60620)	Top-1 acc 61.328 (62.741)	Top-5 acc 84.375 (83.232)	lr 0.00853
Train [73][1080/3239]	Time 0.242 (0.705)	Data Time 0.002 (0.211)	Loss 2.5425 (2.5367)	Entropy 0.60635 (0.60620)	Top-1 acc 60.156 (62.729)	Top-5 acc 85.156 (83.223)	lr 0.00853
Train [73][1090/3239]	Time 0.252 (0.705)	Data Time 0.001 (0.212)	Loss 2.5399 (2.5367)	Entropy 0.60637 (0.60620)	Top-1 acc 62.109 (62.730)	Top-5 acc 83.203 (83.221)	lr 0.00853
Train [73][1100/3239]	Time 0.299 (0.709)	Data Time 0.001 (0.216)	Loss 2.4737 (2.5369)	Entropy 0.60621 (0.60620)	Top-1 acc 62.500 (62.733)	Top-5 acc 85.938 (83.216)	lr 0.00853
Train [73][1110/3239]	Time 2.334 (0.708)	Data Time 1.941 (0.216)	Loss 2.3004 (2.5373)	Entropy 0.60617 (0.60620)	Top-1 acc 69.531 (62.732)	Top-5 acc 86.328 (83.212)	lr 0.00853
Train [73][1120/3239]	Time 0.236 (0.711)	Data Time 0.002 (0.220)	Loss 2.5644 (2.5376)	Entropy 0.60625 (0.60620)	Top-1 acc 66.016 (62.726)	Top-5 acc 82.422 (83.207)	lr 0.00853
Train [73][1130/3239]	Time 0.261 (0.718)	Data Time 0.001 (0.227)	Loss 2.4558 (2.5373)	Entropy 0.60614 (0.60620)	Top-1 acc 66.406 (62.730)	Top-5 acc 84.375 (83.211)	lr 0.00853
Train [73][1140/3239]	Time 0.243 (0.716)	Data Time 0.001 (0.225)	Loss 2.5681 (2.5372)	Entropy 0.60580 (0.60620)	Top-1 acc 58.594 (62.729)	Top-5 acc 82.422 (83.207)	lr 0.00853
Train [73][1150/3239]	Time 0.249 (0.714)	Data Time 0.001 (0.224)	Loss 2.4778 (2.5371)	Entropy 0.60569 (0.60620)	Top-1 acc 64.062 (62.730)	Top-5 acc 84.766 (83.208)	lr 0.00853
Train [73][1160/3239]	Time 0.235 (0.719)	Data Time 0.001 (0.229)	Loss 2.7503 (2.5371)	Entropy 0.60548 (0.60619)	Top-1 acc 60.938 (62.740)	Top-5 acc 77.734 (83.208)	lr 0.00853
Train [73][1170/3239]	Time 0.246 (0.717)	Data Time 0.002 (0.228)	Loss 2.5519 (2.5372)	Entropy 0.60574 (0.60619)	Top-1 acc 63.281 (62.733)	Top-5 acc 83.203 (83.201)	lr 0.00853
Train [73][1180/3239]	Time 0.598 (0.756)	Data Time 0.035 (0.228)	Loss 2.5702 (2.5381)	Entropy 0.60578 (0.60618)	Top-1 acc 60.547 (62.717)	Top-5 acc 83.203 (83.182)	lr 0.00852
Train [73][1190/3239]	Time 0.249 (0.754)	Data Time 0.002 (0.226)	Loss 2.5441 (2.5382)	Entropy 0.60587 (0.60618)	Top-1 acc 63.281 (62.709)	Top-5 acc 82.812 (83.177)	lr 0.00852
Train [73][1200/3239]	Time 0.239 (0.751)	Data Time 0.001 (0.224)	Loss 2.4718 (2.5381)	Entropy 0.60581 (0.60618)	Top-1 acc 65.625 (62.716)	Top-5 acc 83.594 (83.178)	lr 0.00852
Train [73][1210/3239]	Time 0.252 (0.749)	Data Time 0.002 (0.222)	Loss 2.6819 (2.5381)	Entropy 0.60599 (0.60618)	Top-1 acc 61.328 (62.712)	Top-5 acc 77.344 (83.168)	lr 0.00852
Train [73][1220/3239]	Time 0.247 (0.746)	Data Time 0.001 (0.221)	Loss 2.5403 (2.5386)	Entropy 0.60619 (0.60617)	Top-1 acc 60.938 (62.696)	Top-5 acc 86.328 (83.164)	lr 0.00852
Train [73][1230/3239]	Time 0.274 (0.743)	Data Time 0.001 (0.219)	Loss 2.5585 (2.5391)	Entropy 0.60636 (0.60618)	Top-1 acc 59.375 (62.683)	Top-5 acc 84.766 (83.157)	lr 0.00852
Train [73][1240/3239]	Time 0.279 (0.741)	Data Time 0.001 (0.217)	Loss 2.5498 (2.5388)	Entropy 0.60589 (0.60618)	Top-1 acc 64.844 (62.697)	Top-5 acc 83.203 (83.163)	lr 0.00852
Train [73][1250/3239]	Time 0.292 (0.742)	Data Time 0.002 (0.219)	Loss 2.5960 (2.5386)	Entropy 0.60607 (0.60617)	Top-1 acc 63.281 (62.708)	Top-5 acc 80.859 (83.168)	lr 0.00852
Train [73][1260/3239]	Time 0.239 (0.741)	Data Time 0.001 (0.218)	Loss 2.5479 (2.5388)	Entropy 0.60586 (0.60617)	Top-1 acc 62.109 (62.702)	Top-5 acc 85.938 (83.170)	lr 0.00852
Train [73][1270/3239]	Time 0.342 (0.738)	Data Time 0.001 (0.216)	Loss 2.6021 (2.5389)	Entropy 0.60610 (0.60617)	Top-1 acc 62.500 (62.703)	Top-5 acc 83.203 (83.167)	lr 0.00852
Train [73][1280/3239]	Time 5.435 (0.748)	Data Time 5.179 (0.227)	Loss 2.4951 (2.5393)	Entropy 0.60610 (0.60617)	Top-1 acc 61.719 (62.692)	Top-5 acc 80.859 (83.165)	lr 0.00851
Train [73][1290/3239]	Time 0.261 (0.746)	Data Time 0.003 (0.225)	Loss 2.4098 (2.5391)	Entropy 0.60622 (0.60617)	Top-1 acc 63.672 (62.703)	Top-5 acc 85.156 (83.173)	lr 0.00851
Train [73][1300/3239]	Time 0.244 (0.743)	Data Time 0.001 (0.223)	Loss 2.6312 (2.5397)	Entropy 0.60617 (0.60617)	Top-1 acc 58.984 (62.685)	Top-5 acc 81.641 (83.159)	lr 0.00851
Train [73][1310/3239]	Time 2.329 (0.747)	Data Time 2.068 (0.227)	Loss 2.6776 (2.5402)	Entropy 0.60631 (0.60617)	Top-1 acc 58.594 (62.669)	Top-5 acc 81.250 (83.146)	lr 0.00851
Train [73][1320/3239]	Time 0.249 (0.752)	Data Time 0.001 (0.233)	Loss 2.5651 (2.5406)	Entropy 0.60615 (0.60617)	Top-1 acc 63.672 (62.666)	Top-5 acc 81.641 (83.140)	lr 0.00851
Train [73][1330/3239]	Time 0.234 (0.750)	Data Time 0.001 (0.231)	Loss 2.7734 (2.5403)	Entropy 0.60609 (0.60617)	Top-1 acc 57.422 (62.668)	Top-5 acc 79.688 (83.144)	lr 0.00851
Train [73][1340/3239]	Time 3.523 (0.750)	Data Time 3.168 (0.232)	Loss 2.7768 (2.5407)	Entropy 0.60599 (0.60617)	Top-1 acc 57.422 (62.655)	Top-5 acc 77.344 (83.138)	lr 0.00851
Train [73][1350/3239]	Time 0.240 (0.760)	Data Time 0.001 (0.243)	Loss 2.4876 (2.5406)	Entropy 0.60639 (0.60617)	Top-1 acc 62.500 (62.656)	Top-5 acc 83.984 (83.142)	lr 0.00851
Train [73][1360/3239]	Time 0.246 (0.757)	Data Time 0.001 (0.241)	Loss 2.6772 (2.5401)	Entropy 0.60686 (0.60617)	Top-1 acc 58.203 (62.661)	Top-5 acc 82.422 (83.157)	lr 0.00851
Train [73][1370/3239]	Time 0.235 (0.755)	Data Time 0.001 (0.239)	Loss 2.5527 (2.5401)	Entropy 0.60667 (0.60618)	Top-1 acc 60.938 (62.669)	Top-5 acc 83.594 (83.153)	lr 0.00851
Train [73][1380/3239]	Time 0.257 (0.767)	Data Time 0.002 (0.251)	Loss 2.4259 (2.5395)	Entropy 0.60685 (0.60618)	Top-1 acc 65.234 (62.678)	Top-5 acc 87.500 (83.167)	lr 0.00850
Train [73][1390/3239]	Time 0.234 (0.764)	Data Time 0.001 (0.249)	Loss 2.6090 (2.5391)	Entropy 0.60701 (0.60619)	Top-1 acc 60.156 (62.693)	Top-5 acc 82.031 (83.175)	lr 0.00850
Train [73][1400/3239]	Time 0.255 (0.762)	Data Time 0.001 (0.248)	Loss 2.5062 (2.5390)	Entropy 0.60678 (0.60619)	Top-1 acc 64.453 (62.690)	Top-5 acc 84.766 (83.181)	lr 0.00850
Train [73][1410/3239]	Time 0.249 (0.771)	Data Time 0.001 (0.257)	Loss 2.3922 (2.5389)	Entropy 0.60697 (0.60620)	Top-1 acc 64.062 (62.687)	Top-5 acc 84.766 (83.183)	lr 0.00850
Train [73][1420/3239]	Time 0.240 (0.769)	Data Time 0.001 (0.256)	Loss 2.6663 (2.5394)	Entropy 0.60718 (0.60620)	Top-1 acc 59.766 (62.678)	Top-5 acc 78.906 (83.175)	lr 0.00850
Train [73][1430/3239]	Time 0.353 (0.766)	Data Time 0.001 (0.254)	Loss 2.6515 (2.5394)	Entropy 0.60721 (0.60621)	Top-1 acc 60.547 (62.676)	Top-5 acc 81.250 (83.177)	lr 0.00850
Train [73][1440/3239]	Time 13.561 (0.778)	Data Time 13.305 (0.266)	Loss 2.4223 (2.5391)	Entropy 0.60738 (0.60622)	Top-1 acc 66.016 (62.679)	Top-5 acc 84.375 (83.179)	lr 0.00850
Train [73][1450/3239]	Time 0.262 (0.775)	Data Time 0.001 (0.264)	Loss 2.4750 (2.5390)	Entropy 0.60760 (0.60623)	Top-1 acc 65.234 (62.681)	Top-5 acc 83.594 (83.183)	lr 0.00850
Train [73][1460/3239]	Time 0.294 (0.773)	Data Time 0.001 (0.262)	Loss 2.5782 (2.5393)	Entropy 0.60742 (0.60624)	Top-1 acc 60.547 (62.674)	Top-5 acc 83.594 (83.176)	lr 0.00850
Train [73][1470/3239]	Time 0.288 (0.774)	Data Time 0.001 (0.263)	Loss 2.5834 (2.5395)	Entropy 0.60759 (0.60624)	Top-1 acc 59.375 (62.672)	Top-5 acc 80.859 (83.173)	lr 0.00850
Train [73][1480/3239]	Time 0.243 (0.780)	Data Time 0.001 (0.270)	Loss 2.5573 (2.5397)	Entropy 0.60775 (0.60625)	Top-1 acc 60.938 (62.667)	Top-5 acc 79.688 (83.169)	lr 0.00850
Train [73][1490/3239]	Time 0.239 (0.778)	Data Time 0.001 (0.268)	Loss 2.4535 (2.5399)	Entropy 0.60808 (0.60626)	Top-1 acc 66.016 (62.656)	Top-5 acc 82.812 (83.164)	lr 0.00849
Train [73][1500/3239]	Time 0.392 (0.775)	Data Time 0.001 (0.266)	Loss 2.8889 (2.5400)	Entropy 0.60803 (0.60628)	Top-1 acc 53.906 (62.655)	Top-5 acc 77.734 (83.164)	lr 0.00849
Train [73][1510/3239]	Time 0.252 (0.788)	Data Time 0.002 (0.279)	Loss 2.5339 (2.5402)	Entropy 0.60783 (0.60629)	Top-1 acc 63.672 (62.655)	Top-5 acc 84.375 (83.166)	lr 0.00849
Train [73][1520/3239]	Time 0.246 (0.785)	Data Time 0.001 (0.277)	Loss 2.5340 (2.5404)	Entropy 0.60779 (0.60630)	Top-1 acc 62.891 (62.655)	Top-5 acc 84.766 (83.167)	lr 0.00849
Train [73][1530/3239]	Time 0.253 (0.783)	Data Time 0.001 (0.275)	Loss 2.6127 (2.5405)	Entropy 0.60773 (0.60631)	Top-1 acc 64.844 (62.655)	Top-5 acc 82.812 (83.163)	lr 0.00849
Train [73][1540/3239]	Time 0.253 (0.793)	Data Time 0.001 (0.286)	Loss 2.5862 (2.5406)	Entropy 0.60787 (0.60632)	Top-1 acc 64.062 (62.659)	Top-5 acc 82.422 (83.162)	lr 0.00849
Train [73][1550/3239]	Time 0.227 (0.791)	Data Time 0.001 (0.284)	Loss 2.6017 (2.5406)	Entropy 0.60767 (0.60633)	Top-1 acc 59.766 (62.661)	Top-5 acc 81.250 (83.161)	lr 0.00849
Train [73][1560/3239]	Time 0.239 (0.789)	Data Time 0.001 (0.283)	Loss 2.5561 (2.5406)	Entropy 0.60764 (0.60633)	Top-1 acc 56.641 (62.657)	Top-5 acc 83.594 (83.162)	lr 0.00849
Train [73][1570/3239]	Time 0.248 (0.799)	Data Time 0.001 (0.294)	Loss 2.4261 (2.5404)	Entropy 0.60737 (0.60634)	Top-1 acc 65.625 (62.665)	Top-5 acc 85.938 (83.168)	lr 0.00849
Train [73][1580/3239]	Time 0.239 (0.797)	Data Time 0.001 (0.292)	Loss 2.5072 (2.5404)	Entropy 0.60749 (0.60635)	Top-1 acc 61.328 (62.667)	Top-5 acc 83.203 (83.164)	lr 0.00849
Train [73][1590/3239]	Time 0.245 (0.794)	Data Time 0.001 (0.290)	Loss 2.7059 (2.5408)	Entropy 0.60762 (0.60636)	Top-1 acc 60.156 (62.659)	Top-5 acc 78.906 (83.156)	lr 0.00848
Train [73][1600/3239]	Time 14.003 (0.804)	Data Time 13.723 (0.301)	Loss 2.5208 (2.5409)	Entropy 0.60760 (0.60636)	Top-1 acc 62.500 (62.656)	Top-5 acc 83.203 (83.154)	lr 0.00848
Train [73][1610/3239]	Time 0.254 (0.802)	Data Time 0.001 (0.299)	Loss 2.5101 (2.5407)	Entropy 0.60769 (0.60637)	Top-1 acc 66.016 (62.660)	Top-5 acc 84.766 (83.161)	lr 0.00848
Train [73][1620/3239]	Time 0.236 (0.800)	Data Time 0.001 (0.297)	Loss 2.6727 (2.5409)	Entropy 0.60781 (0.60638)	Top-1 acc 60.938 (62.653)	Top-5 acc 81.250 (83.154)	lr 0.00848
Train [73][1630/3239]	Time 0.245 (0.800)	Data Time 0.001 (0.298)	Loss 2.6762 (2.5409)	Entropy 0.60794 (0.60639)	Top-1 acc 58.984 (62.652)	Top-5 acc 82.031 (83.156)	lr 0.00848
Train [73][1640/3239]	Time 0.246 (0.808)	Data Time 0.001 (0.306)	Loss 2.5493 (2.5412)	Entropy 0.60766 (0.60640)	Top-1 acc 63.281 (62.652)	Top-5 acc 82.812 (83.154)	lr 0.00848
Train [73][1650/3239]	Time 0.246 (0.806)	Data Time 0.001 (0.305)	Loss 2.2989 (2.5411)	Entropy 0.60756 (0.60641)	Top-1 acc 66.797 (62.653)	Top-5 acc 87.109 (83.161)	lr 0.00848
Train [73][1660/3239]	Time 0.341 (0.803)	Data Time 0.001 (0.303)	Loss 2.4812 (2.5413)	Entropy 0.60764 (0.60641)	Top-1 acc 62.109 (62.654)	Top-5 acc 82.422 (83.151)	lr 0.00848
Train [73][1670/3239]	Time 0.236 (0.814)	Data Time 0.001 (0.314)	Loss 2.5835 (2.5415)	Entropy 0.60782 (0.60642)	Top-1 acc 62.500 (62.651)	Top-5 acc 82.422 (83.148)	lr 0.00848
Train [73][1680/3239]	Time 0.243 (0.811)	Data Time 0.001 (0.312)	Loss 2.4735 (2.5416)	Entropy 0.60765 (0.60643)	Top-1 acc 61.719 (62.651)	Top-5 acc 83.594 (83.146)	lr 0.00848
Train [73][1690/3239]	Time 0.246 (0.809)	Data Time 0.001 (0.310)	Loss 2.4842 (2.5411)	Entropy 0.60741 (0.60644)	Top-1 acc 65.234 (62.660)	Top-5 acc 81.641 (83.150)	lr 0.00848
Train [73][1700/3239]	Time 0.281 (0.823)	Data Time 0.002 (0.324)	Loss 2.5423 (2.5414)	Entropy 0.60707 (0.60644)	Top-1 acc 65.625 (62.655)	Top-5 acc 82.422 (83.144)	lr 0.00847
Train [73][1710/3239]	Time 0.249 (0.820)	Data Time 0.001 (0.322)	Loss 2.6895 (2.5417)	Entropy 0.60675 (0.60645)	Top-1 acc 58.203 (62.645)	Top-5 acc 80.469 (83.143)	lr 0.00847
Train [73][1720/3239]	Time 0.222 (0.818)	Data Time 0.001 (0.321)	Loss 2.4294 (2.5419)	Entropy 0.60705 (0.60645)	Top-1 acc 60.547 (62.638)	Top-5 acc 87.109 (83.144)	lr 0.00847
Train [73][1730/3239]	Time 0.348 (0.829)	Data Time 0.001 (0.332)	Loss 2.6994 (2.5420)	Entropy 0.60723 (0.60645)	Top-1 acc 58.984 (62.638)	Top-5 acc 78.516 (83.141)	lr 0.00847
Train [73][1740/3239]	Time 0.246 (0.827)	Data Time 0.001 (0.331)	Loss 2.4450 (2.5420)	Entropy 0.60724 (0.60646)	Top-1 acc 65.625 (62.636)	Top-5 acc 83.984 (83.140)	lr 0.00847
Train [73][1750/3239]	Time 0.227 (0.825)	Data Time 0.001 (0.329)	Loss 2.5929 (2.5423)	Entropy 0.60713 (0.60646)	Top-1 acc 61.328 (62.634)	Top-5 acc 82.422 (83.134)	lr 0.00847
Train [73][1760/3239]	Time 9.212 (0.838)	Data Time 8.926 (0.342)	Loss 2.5929 (2.5424)	Entropy 0.60712 (0.60647)	Top-1 acc 64.453 (62.632)	Top-5 acc 79.688 (83.135)	lr 0.00847
Train [73][1770/3239]	Time 0.278 (0.836)	Data Time 0.002 (0.341)	Loss 2.6542 (2.5420)	Entropy 0.60667 (0.60647)	Top-1 acc 58.594 (62.635)	Top-5 acc 82.422 (83.142)	lr 0.00847
Train [73][1780/3239]	Time 0.245 (0.836)	Data Time 0.001 (0.341)	Loss 2.3553 (2.5421)	Entropy 0.60686 (0.60647)	Top-1 acc 68.750 (62.635)	Top-5 acc 87.891 (83.141)	lr 0.00847
Train [73][1790/3239]	Time 0.244 (0.840)	Data Time 0.001 (0.346)	Loss 2.5376 (2.5420)	Entropy 0.60725 (0.60647)	Top-1 acc 62.109 (62.638)	Top-5 acc 83.203 (83.140)	lr 0.00847
Train [73][1800/3239]	Time 0.240 (0.843)	Data Time 0.001 (0.349)	Loss 2.6422 (2.5420)	Entropy 0.60686 (0.60648)	Top-1 acc 62.109 (62.637)	Top-5 acc 83.203 (83.139)	lr 0.00846
Train [73][1810/3239]	Time 0.260 (0.843)	Data Time 0.001 (0.349)	Loss 2.5643 (2.5423)	Entropy 0.60673 (0.60648)	Top-1 acc 60.156 (62.628)	Top-5 acc 86.328 (83.136)	lr 0.00846
Train [73][1820/3239]	Time 0.333 (0.840)	Data Time 0.001 (0.347)	Loss 2.6195 (2.5423)	Entropy 0.60652 (0.60648)	Top-1 acc 63.281 (62.631)	Top-5 acc 80.469 (83.133)	lr 0.00846
Train [73][1830/3239]	Time 0.244 (0.853)	Data Time 0.001 (0.361)	Loss 2.6419 (2.5427)	Entropy 0.60645 (0.60648)	Top-1 acc 56.641 (62.621)	Top-5 acc 80.859 (83.124)	lr 0.00846
Train [73][1840/3239]	Time 0.378 (0.877)	Data Time 0.028 (0.359)	Loss 2.7456 (2.5430)	Entropy 0.60616 (0.60648)	Top-1 acc 59.766 (62.616)	Top-5 acc 78.125 (83.118)	lr 0.00846
Train [73][1850/3239]	Time 0.238 (0.875)	Data Time 0.001 (0.357)	Loss 2.3938 (2.5427)	Entropy 0.60628 (0.60648)	Top-1 acc 65.625 (62.622)	Top-5 acc 84.766 (83.122)	lr 0.00846
Train [73][1860/3239]	Time 0.260 (0.872)	Data Time 0.002 (0.355)	Loss 2.4387 (2.5428)	Entropy 0.60668 (0.60648)	Top-1 acc 65.234 (62.618)	Top-5 acc 84.766 (83.118)	lr 0.00846
Train [73][1870/3239]	Time 0.245 (0.870)	Data Time 0.001 (0.353)	Loss 2.3724 (2.5428)	Entropy 0.60646 (0.60648)	Top-1 acc 68.750 (62.619)	Top-5 acc 85.938 (83.118)	lr 0.00846
Train [73][1880/3239]	Time 0.247 (0.868)	Data Time 0.001 (0.351)	Loss 2.4907 (2.5422)	Entropy 0.60658 (0.60648)	Top-1 acc 65.625 (62.629)	Top-5 acc 85.938 (83.130)	lr 0.00846
Train [73][1890/3239]	Time 0.363 (0.865)	Data Time 0.001 (0.349)	Loss 2.5051 (2.5423)	Entropy 0.60638 (0.60648)	Top-1 acc 62.891 (62.631)	Top-5 acc 84.375 (83.126)	lr 0.00846
Train [73][1900/3239]	Time 0.325 (0.870)	Data Time 0.002 (0.354)	Loss 2.4794 (2.5424)	Entropy 0.60666 (0.60648)	Top-1 acc 60.547 (62.625)	Top-5 acc 84.766 (83.126)	lr 0.00846
Train [73][1910/3239]	Time 0.249 (0.869)	Data Time 0.001 (0.353)	Loss 2.5028 (2.5427)	Entropy 0.60636 (0.60648)	Top-1 acc 64.062 (62.621)	Top-5 acc 82.812 (83.119)	lr 0.00845
Train [73][1920/3239]	Time 4.109 (0.869)	Data Time 3.852 (0.354)	Loss 2.2649 (2.5423)	Entropy 0.60603 (0.60648)	Top-1 acc 69.922 (62.634)	Top-5 acc 87.109 (83.126)	lr 0.00845
Train [73][1930/3239]	Time 0.238 (0.872)	Data Time 0.004 (0.357)	Loss 2.7404 (2.5426)	Entropy 0.60598 (0.60647)	Top-1 acc 59.375 (62.623)	Top-5 acc 78.906 (83.122)	lr 0.00845
Train [73][1940/3239]	Time 0.239 (0.879)	Data Time 0.002 (0.364)	Loss 2.4872 (2.5425)	Entropy 0.60564 (0.60647)	Top-1 acc 65.625 (62.623)	Top-5 acc 83.203 (83.116)	lr 0.00845
Train [73][1950/3239]	Time 0.267 (0.877)	Data Time 0.002 (0.363)	Loss 2.6896 (2.5427)	Entropy 0.60566 (0.60647)	Top-1 acc 58.984 (62.621)	Top-5 acc 80.078 (83.112)	lr 0.00845
Train [73][1960/3239]	Time 0.849 (0.879)	Data Time 0.595 (0.365)	Loss 2.8394 (2.5426)	Entropy 0.60566 (0.60646)	Top-1 acc 57.812 (62.630)	Top-5 acc 78.125 (83.115)	lr 0.00845
Train [73][1970/3239]	Time 0.258 (0.889)	Data Time 0.002 (0.375)	Loss 2.5946 (2.5428)	Entropy 0.60547 (0.60646)	Top-1 acc 64.453 (62.628)	Top-5 acc 83.203 (83.110)	lr 0.00845
Train [73][1980/3239]	Time 0.348 (0.887)	Data Time 0.001 (0.373)	Loss 2.6585 (2.5427)	Entropy 0.60552 (0.60645)	Top-1 acc 60.938 (62.630)	Top-5 acc 80.859 (83.114)	lr 0.00845
Train [73][1990/3239]	Time 0.233 (0.886)	Data Time 0.001 (0.373)	Loss 2.6595 (2.5427)	Entropy 0.60547 (0.60645)	Top-1 acc 58.203 (62.635)	Top-5 acc 80.078 (83.115)	lr 0.00845
Train [73][2000/3239]	Time 0.229 (0.896)	Data Time 0.001 (0.384)	Loss 2.6110 (2.5433)	Entropy 0.60588 (0.60644)	Top-1 acc 61.328 (62.615)	Top-5 acc 82.812 (83.108)	lr 0.00845
Train [73][2010/3239]	Time 0.253 (0.894)	Data Time 0.001 (0.382)	Loss 2.7110 (2.5436)	Entropy 0.60601 (0.60644)	Top-1 acc 58.984 (62.603)	Top-5 acc 81.250 (83.102)	lr 0.00844
Train [73][2020/3239]	Time 0.233 (0.895)	Data Time 0.001 (0.383)	Loss 2.6619 (2.5437)	Entropy 0.60602 (0.60644)	Top-1 acc 60.156 (62.602)	Top-5 acc 80.469 (83.096)	lr 0.00844
Train [73][2030/3239]	Time 8.854 (0.904)	Data Time 8.569 (0.393)	Loss 2.7176 (2.5439)	Entropy 0.60636 (0.60644)	Top-1 acc 59.375 (62.597)	Top-5 acc 78.906 (83.092)	lr 0.00844
Train [73][2040/3239]	Time 0.260 (0.903)	Data Time 0.001 (0.392)	Loss 2.5649 (2.5437)	Entropy 0.60631 (0.60644)	Top-1 acc 56.250 (62.599)	Top-5 acc 85.156 (83.093)	lr 0.00844
Train [73][2050/3239]	Time 0.374 (0.904)	Data Time 0.002 (0.393)	Loss 2.3234 (2.5437)	Entropy 0.60663 (0.60644)	Top-1 acc 69.922 (62.599)	Top-5 acc 87.500 (83.099)	lr 0.00844
Train [73][2060/3239]	Time 2.585 (0.908)	Data Time 2.324 (0.398)	Loss 2.6085 (2.5436)	Entropy 0.60609 (0.60644)	Top-1 acc 64.453 (62.605)	Top-5 acc 81.641 (83.100)	lr 0.00844
Train [73][2070/3239]	Time 0.246 (0.910)	Data Time 0.001 (0.401)	Loss 2.5461 (2.5435)	Entropy 0.60652 (0.60644)	Top-1 acc 62.500 (62.605)	Top-5 acc 83.203 (83.104)	lr 0.00844
Train [73][2080/3239]	Time 0.492 (0.908)	Data Time 0.250 (0.399)	Loss 2.4956 (2.5435)	Entropy 0.60615 (0.60644)	Top-1 acc 65.234 (62.614)	Top-5 acc 82.812 (83.103)	lr 0.00844
Train [73][2090/3239]	Time 0.246 (0.909)	Data Time 0.001 (0.400)	Loss 2.5738 (2.5439)	Entropy 0.60620 (0.60643)	Top-1 acc 59.375 (62.605)	Top-5 acc 83.594 (83.097)	lr 0.00844
Train [73][2100/3239]	Time 0.246 (0.918)	Data Time 0.002 (0.410)	Loss 2.4362 (2.5434)	Entropy 0.60621 (0.60643)	Top-1 acc 65.234 (62.619)	Top-5 acc 86.328 (83.111)	lr 0.00844
Train [73][2110/3239]	Time 0.248 (0.916)	Data Time 0.001 (0.408)	Loss 2.5370 (2.5434)	Entropy 0.60607 (0.60643)	Top-1 acc 65.234 (62.621)	Top-5 acc 82.812 (83.108)	lr 0.00844
Train [73][2120/3239]	Time 6.422 (0.919)	Data Time 6.172 (0.411)	Loss 2.5345 (2.5438)	Entropy 0.60567 (0.60643)	Top-1 acc 60.156 (62.615)	Top-5 acc 82.031 (83.101)	lr 0.00843
Train [73][2130/3239]	Time 0.233 (0.927)	Data Time 0.001 (0.419)	Loss 2.4113 (2.5436)	Entropy 0.60587 (0.60643)	Top-1 acc 66.016 (62.617)	Top-5 acc 84.375 (83.103)	lr 0.00843
Train [73][2140/3239]	Time 0.294 (0.925)	Data Time 0.001 (0.417)	Loss 2.4345 (2.5438)	Entropy 0.60609 (0.60642)	Top-1 acc 63.672 (62.610)	Top-5 acc 85.547 (83.097)	lr 0.00843
Train [73][2150/3239]	Time 0.243 (0.924)	Data Time 0.001 (0.417)	Loss 2.4264 (2.5437)	Entropy 0.60594 (0.60642)	Top-1 acc 67.969 (62.614)	Top-5 acc 82.031 (83.101)	lr 0.00843
Train [73][2160/3239]	Time 0.248 (0.935)	Data Time 0.001 (0.429)	Loss 2.6794 (2.5437)	Entropy 0.60594 (0.60642)	Top-1 acc 60.156 (62.616)	Top-5 acc 80.469 (83.104)	lr 0.00843
Train [73][2170/3239]	Time 0.255 (0.933)	Data Time 0.001 (0.427)	Loss 2.3820 (2.5435)	Entropy 0.60570 (0.60642)	Top-1 acc 66.016 (62.614)	Top-5 acc 84.375 (83.105)	lr 0.00843
Train [73][2180/3239]	Time 0.261 (0.932)	Data Time 0.002 (0.427)	Loss 2.6646 (2.5435)	Entropy 0.60562 (0.60641)	Top-1 acc 58.594 (62.623)	Top-5 acc 80.078 (83.103)	lr 0.00843
Train [73][2190/3239]	Time 15.754 (0.943)	Data Time 15.439 (0.438)	Loss 2.6886 (2.5435)	Entropy 0.60554 (0.60641)	Top-1 acc 60.547 (62.624)	Top-5 acc 82.422 (83.102)	lr 0.00843
Train [73][2200/3239]	Time 0.248 (0.941)	Data Time 0.001 (0.436)	Loss 2.4950 (2.5433)	Entropy 0.60579 (0.60641)	Top-1 acc 64.844 (62.632)	Top-5 acc 82.422 (83.105)	lr 0.00843
Train [73][2210/3239]	Time 0.323 (0.940)	Data Time 0.001 (0.436)	Loss 2.6041 (2.5432)	Entropy 0.60589 (0.60640)	Top-1 acc 59.766 (62.636)	Top-5 acc 82.812 (83.108)	lr 0.00843
Train [73][2220/3239]	Time 11.334 (0.945)	Data Time 11.055 (0.441)	Loss 2.4269 (2.5433)	Entropy 0.60595 (0.60640)	Top-1 acc 65.625 (62.633)	Top-5 acc 83.594 (83.106)	lr 0.00842
Train [73][2230/3239]	Time 0.255 (0.948)	Data Time 0.001 (0.444)	Loss 2.6101 (2.5431)	Entropy 0.60618 (0.60640)	Top-1 acc 62.500 (62.637)	Top-5 acc 83.594 (83.109)	lr 0.00842
Train [73][2240/3239]	Time 0.229 (0.946)	Data Time 0.001 (0.442)	Loss 2.6661 (2.5432)	Entropy 0.60614 (0.60640)	Top-1 acc 62.109 (62.636)	Top-5 acc 78.516 (83.105)	lr 0.00842
Train [73][2250/3239]	Time 0.229 (0.946)	Data Time 0.001 (0.443)	Loss 2.9019 (2.5433)	Entropy 0.60630 (0.60640)	Top-1 acc 53.906 (62.638)	Top-5 acc 75.391 (83.105)	lr 0.00842
Train [73][2260/3239]	Time 0.242 (0.954)	Data Time 0.001 (0.452)	Loss 2.3380 (2.5434)	Entropy 0.60653 (0.60640)	Top-1 acc 69.531 (62.636)	Top-5 acc 84.375 (83.100)	lr 0.00842
Train [73][2270/3239]	Time 0.231 (0.953)	Data Time 0.001 (0.450)	Loss 2.6166 (2.5435)	Entropy 0.60652 (0.60640)	Top-1 acc 59.375 (62.632)	Top-5 acc 80.859 (83.095)	lr 0.00842
Train [73][2280/3239]	Time 7.037 (0.955)	Data Time 6.669 (0.453)	Loss 2.4618 (2.5434)	Entropy 0.60634 (0.60640)	Top-1 acc 60.156 (62.635)	Top-5 acc 85.156 (83.101)	lr 0.00842
Train [73][2290/3239]	Time 0.239 (0.959)	Data Time 0.001 (0.457)	Loss 2.7493 (2.5434)	Entropy 0.60665 (0.60640)	Top-1 acc 59.375 (62.630)	Top-5 acc 77.734 (83.101)	lr 0.00842
Train [73][2300/3239]	Time 0.238 (0.959)	Data Time 0.001 (0.458)	Loss 2.8510 (2.5436)	Entropy 0.60671 (0.60640)	Top-1 acc 58.984 (62.624)	Top-5 acc 77.734 (83.100)	lr 0.00842
Train [73][2310/3239]	Time 0.237 (0.957)	Data Time 0.001 (0.456)	Loss 2.3986 (2.5436)	Entropy 0.60616 (0.60640)	Top-1 acc 65.234 (62.625)	Top-5 acc 85.938 (83.098)	lr 0.00842
Train [73][2320/3239]	Time 0.252 (0.966)	Data Time 0.001 (0.465)	Loss 2.5744 (2.5438)	Entropy 0.60646 (0.60640)	Top-1 acc 63.672 (62.622)	Top-5 acc 83.203 (83.091)	lr 0.00842
Train [73][2330/3239]	Time 4.564 (0.965)	Data Time 4.293 (0.465)	Loss 2.5340 (2.5436)	Entropy 0.60670 (0.60640)	Top-1 acc 63.672 (62.633)	Top-5 acc 83.203 (83.095)	lr 0.00841
Train [73][2340/3239]	Time 0.233 (0.963)	Data Time 0.002 (0.463)	Loss 2.5466 (2.5437)	Entropy 0.60684 (0.60640)	Top-1 acc 62.500 (62.630)	Top-5 acc 81.641 (83.092)	lr 0.00841
Train [73][2350/3239]	Time 3.407 (0.966)	Data Time 3.157 (0.466)	Loss 2.2876 (2.5436)	Entropy 0.60687 (0.60640)	Top-1 acc 68.359 (62.635)	Top-5 acc 87.891 (83.095)	lr 0.00841
Train [73][2360/3239]	Time 0.221 (0.964)	Data Time 0.001 (0.465)	Loss 2.6453 (2.5439)	Entropy 0.60700 (0.60640)	Top-1 acc 62.891 (62.629)	Top-5 acc 81.250 (83.088)	lr 0.00841
Train [73][2370/3239]	Time 0.334 (0.964)	Data Time 0.001 (0.465)	Loss 2.5800 (2.5440)	Entropy 0.60670 (0.60641)	Top-1 acc 60.547 (62.627)	Top-5 acc 82.812 (83.088)	lr 0.00841
Train [73][2380/3239]	Time 0.238 (0.964)	Data Time 0.001 (0.465)	Loss 2.4668 (2.5438)	Entropy 0.60700 (0.60641)	Top-1 acc 66.406 (62.631)	Top-5 acc 83.594 (83.090)	lr 0.00841
Train [73][2390/3239]	Time 0.237 (0.964)	Data Time 0.001 (0.465)	Loss 2.3584 (2.5436)	Entropy 0.60701 (0.60641)	Top-1 acc 65.625 (62.635)	Top-5 acc 87.109 (83.093)	lr 0.00841
Train [73][2400/3239]	Time 0.231 (0.964)	Data Time 0.001 (0.466)	Loss 2.6332 (2.5438)	Entropy 0.60681 (0.60641)	Top-1 acc 62.500 (62.629)	Top-5 acc 80.859 (83.089)	lr 0.00841
Train [73][2410/3239]	Time 0.234 (0.962)	Data Time 0.001 (0.464)	Loss 2.3941 (2.5437)	Entropy 0.60689 (0.60641)	Top-1 acc 69.531 (62.631)	Top-5 acc 85.547 (83.091)	lr 0.00841
Train [73][2420/3239]	Time 0.258 (0.969)	Data Time 0.001 (0.471)	Loss 2.5119 (2.5438)	Entropy 0.60683 (0.60642)	Top-1 acc 62.891 (62.624)	Top-5 acc 83.203 (83.089)	lr 0.00841
Train [73][2430/3239]	Time 0.256 (0.969)	Data Time 0.001 (0.471)	Loss 2.6130 (2.5436)	Entropy 0.60701 (0.60642)	Top-1 acc 59.375 (62.627)	Top-5 acc 81.250 (83.093)	lr 0.00840
Train [73][2440/3239]	Time 0.362 (0.966)	Data Time 0.001 (0.469)	Loss 2.5171 (2.5436)	Entropy 0.60730 (0.60642)	Top-1 acc 62.109 (62.629)	Top-5 acc 84.375 (83.092)	lr 0.00840
Train [73][2450/3239]	Time 6.945 (0.974)	Data Time 6.654 (0.478)	Loss 2.4944 (2.5436)	Entropy 0.60715 (0.60642)	Top-1 acc 62.891 (62.628)	Top-5 acc 83.594 (83.090)	lr 0.00840
Train [73][2460/3239]	Time 0.236 (0.973)	Data Time 0.001 (0.477)	Loss 2.5419 (2.5436)	Entropy 0.60716 (0.60643)	Top-1 acc 63.672 (62.631)	Top-5 acc 82.422 (83.090)	lr 0.00840
Train [73][2470/3239]	Time 0.248 (0.972)	Data Time 0.001 (0.476)	Loss 2.4213 (2.5434)	Entropy 0.60720 (0.60643)	Top-1 acc 67.578 (62.640)	Top-5 acc 85.156 (83.094)	lr 0.00840
Train [73][2480/3239]	Time 0.251 (0.977)	Data Time 0.001 (0.482)	Loss 2.6688 (2.5435)	Entropy 0.60745 (0.60643)	Top-1 acc 58.594 (62.637)	Top-5 acc 79.688 (83.093)	lr 0.00840
Train [73][2490/3239]	Time 0.421 (0.999)	Data Time 0.039 (0.484)	Loss 2.6684 (2.5437)	Entropy 0.60754 (0.60644)	Top-1 acc 58.984 (62.633)	Top-5 acc 78.516 (83.088)	lr 0.00840
Train [73][2500/3239]	Time 0.240 (0.997)	Data Time 0.002 (0.482)	Loss 2.5675 (2.5437)	Entropy 0.60767 (0.60644)	Top-1 acc 62.500 (62.634)	Top-5 acc 82.812 (83.091)	lr 0.00840
Train [73][2510/3239]	Time 0.245 (0.995)	Data Time 0.001 (0.480)	Loss 2.4383 (2.5434)	Entropy 0.60770 (0.60645)	Top-1 acc 64.453 (62.636)	Top-5 acc 83.594 (83.091)	lr 0.00840
Train [73][2520/3239]	Time 0.239 (0.992)	Data Time 0.001 (0.478)	Loss 2.7566 (2.5436)	Entropy 0.60767 (0.60645)	Top-1 acc 59.375 (62.633)	Top-5 acc 78.516 (83.090)	lr 0.00840
Train [73][2530/3239]	Time 0.366 (0.990)	Data Time 0.002 (0.476)	Loss 2.6367 (2.5435)	Entropy 0.60811 (0.60646)	Top-1 acc 60.156 (62.635)	Top-5 acc 80.859 (83.090)	lr 0.00840
Train [73][2540/3239]	Time 0.233 (0.988)	Data Time 0.001 (0.474)	Loss 2.3406 (2.5434)	Entropy 0.60827 (0.60646)	Top-1 acc 66.406 (62.637)	Top-5 acc 86.719 (83.095)	lr 0.00839
Train [73][2550/3239]	Time 0.239 (0.986)	Data Time 0.001 (0.473)	Loss 2.4092 (2.5435)	Entropy 0.60821 (0.60647)	Top-1 acc 67.188 (62.640)	Top-5 acc 84.766 (83.093)	lr 0.00839
Train [73][2560/3239]	Time 0.239 (0.984)	Data Time 0.001 (0.471)	Loss 2.5209 (2.5436)	Entropy 0.60845 (0.60648)	Top-1 acc 63.281 (62.637)	Top-5 acc 83.594 (83.092)	lr 0.00839
Train [73][2570/3239]	Time 0.265 (0.982)	Data Time 0.001 (0.469)	Loss 2.6766 (2.5438)	Entropy 0.60842 (0.60649)	Top-1 acc 59.766 (62.632)	Top-5 acc 83.594 (83.089)	lr 0.00839
Train [73][2580/3239]	Time 0.259 (0.980)	Data Time 0.001 (0.467)	Loss 2.4613 (2.5438)	Entropy 0.60890 (0.60649)	Top-1 acc 64.453 (62.628)	Top-5 acc 85.938 (83.093)	lr 0.00839
Train [73][2590/3239]	Time 0.469 (0.980)	Data Time 0.186 (0.468)	Loss 2.4233 (2.5438)	Entropy 0.60869 (0.60650)	Top-1 acc 61.719 (62.631)	Top-5 acc 85.156 (83.092)	lr 0.00839
Train [73][2600/3239]	Time 0.334 (0.979)	Data Time 0.001 (0.467)	Loss 2.7062 (2.5439)	Entropy 0.60841 (0.60651)	Top-1 acc 58.984 (62.626)	Top-5 acc 80.859 (83.089)	lr 0.00839
Train [73][2610/3239]	Time 0.237 (0.978)	Data Time 0.001 (0.466)	Loss 2.3190 (2.5437)	Entropy 0.60839 (0.60652)	Top-1 acc 66.406 (62.625)	Top-5 acc 89.062 (83.092)	lr 0.00839
Train [73][2620/3239]	Time 0.350 (0.979)	Data Time 0.001 (0.468)	Loss 2.4497 (2.5437)	Entropy 0.60830 (0.60652)	Top-1 acc 66.406 (62.629)	Top-5 acc 86.328 (83.095)	lr 0.00839
Train [73][2630/3239]	Time 0.405 (0.978)	Data Time 0.167 (0.467)	Loss 2.9355 (2.5438)	Entropy 0.60805 (0.60653)	Top-1 acc 51.953 (62.627)	Top-5 acc 78.125 (83.092)	lr 0.00839
Train [73][2640/3239]	Time 0.242 (0.977)	Data Time 0.001 (0.466)	Loss 2.5482 (2.5436)	Entropy 0.60844 (0.60654)	Top-1 acc 60.938 (62.631)	Top-5 acc 82.031 (83.094)	lr 0.00838
Train [73][2650/3239]	Time 7.939 (0.978)	Data Time 7.693 (0.467)	Loss 2.5924 (2.5439)	Entropy 0.60819 (0.60654)	Top-1 acc 60.938 (62.627)	Top-5 acc 83.594 (83.090)	lr 0.00838
Train [73][2660/3239]	Time 0.255 (0.977)	Data Time 0.001 (0.467)	Loss 2.5436 (2.5440)	Entropy 0.60850 (0.60655)	Top-1 acc 59.375 (62.622)	Top-5 acc 84.766 (83.088)	lr 0.00838
Train [73][2670/3239]	Time 2.956 (0.978)	Data Time 2.700 (0.468)	Loss 2.4318 (2.5441)	Entropy 0.60843 (0.60656)	Top-1 acc 62.891 (62.622)	Top-5 acc 85.156 (83.086)	lr 0.00838
Train [73][2680/3239]	Time 0.250 (0.977)	Data Time 0.002 (0.467)	Loss 2.5959 (2.5442)	Entropy 0.60846 (0.60656)	Top-1 acc 61.719 (62.624)	Top-5 acc 81.250 (83.085)	lr 0.00838
Train [73][2690/3239]	Time 0.376 (0.981)	Data Time 0.001 (0.472)	Loss 2.5805 (2.5441)	Entropy 0.60794 (0.60657)	Top-1 acc 64.453 (62.626)	Top-5 acc 80.469 (83.085)	lr 0.00838
Train [73][2700/3239]	Time 0.252 (0.982)	Data Time 0.001 (0.473)	Loss 2.5633 (2.5442)	Entropy 0.60767 (0.60658)	Top-1 acc 63.672 (62.626)	Top-5 acc 83.594 (83.085)	lr 0.00838
Train [73][2710/3239]	Time 0.249 (0.981)	Data Time 0.001 (0.472)	Loss 2.5979 (2.5441)	Entropy 0.60780 (0.60658)	Top-1 acc 60.547 (62.627)	Top-5 acc 82.031 (83.085)	lr 0.00838
Train [73][2720/3239]	Time 0.225 (0.985)	Data Time 0.001 (0.476)	Loss 2.5593 (2.5445)	Entropy 0.60796 (0.60658)	Top-1 acc 60.938 (62.618)	Top-5 acc 82.031 (83.076)	lr 0.00838
Train [73][2730/3239]	Time 0.251 (0.985)	Data Time 0.001 (0.477)	Loss 2.6751 (2.5445)	Entropy 0.60821 (0.60659)	Top-1 acc 56.641 (62.617)	Top-5 acc 81.250 (83.076)	lr 0.00838
Train [73][2740/3239]	Time 0.256 (0.985)	Data Time 0.001 (0.476)	Loss 2.6048 (2.5446)	Entropy 0.60762 (0.60660)	Top-1 acc 60.938 (62.616)	Top-5 acc 83.984 (83.075)	lr 0.00838
Train [73][2750/3239]	Time 0.667 (0.989)	Data Time 0.379 (0.481)	Loss 2.5995 (2.5447)	Entropy 0.60741 (0.60660)	Top-1 acc 60.938 (62.612)	Top-5 acc 83.984 (83.077)	lr 0.00837
Train [73][2760/3239]	Time 0.364 (0.988)	Data Time 0.001 (0.481)	Loss 2.4656 (2.5445)	Entropy 0.60761 (0.60660)	Top-1 acc 64.453 (62.614)	Top-5 acc 84.766 (83.080)	lr 0.00837
Train [73][2770/3239]	Time 0.243 (0.988)	Data Time 0.001 (0.480)	Loss 2.4439 (2.5446)	Entropy 0.60766 (0.60661)	Top-1 acc 65.234 (62.614)	Top-5 acc 85.938 (83.079)	lr 0.00837
Train [73][2780/3239]	Time 0.258 (0.993)	Data Time 0.001 (0.485)	Loss 2.4223 (2.5446)	Entropy 0.60775 (0.60661)	Top-1 acc 65.625 (62.615)	Top-5 acc 84.375 (83.078)	lr 0.00837
Train [73][2790/3239]	Time 0.239 (0.992)	Data Time 0.001 (0.485)	Loss 2.4300 (2.5446)	Entropy 0.60784 (0.60661)	Top-1 acc 65.234 (62.617)	Top-5 acc 84.375 (83.076)	lr 0.00837
Train [73][2800/3239]	Time 5.869 (0.994)	Data Time 5.617 (0.487)	Loss 2.6525 (2.5445)	Entropy 0.60783 (0.60662)	Top-1 acc 59.766 (62.619)	Top-5 acc 80.469 (83.076)	lr 0.00837
Train [73][2810/3239]	Time 11.482 (0.996)	Data Time 11.242 (0.489)	Loss 2.6101 (2.5447)	Entropy 0.60800 (0.60662)	Top-1 acc 60.156 (62.614)	Top-5 acc 82.812 (83.072)	lr 0.00837
Train [73][2820/3239]	Time 0.239 (0.997)	Data Time 0.001 (0.490)	Loss 2.7347 (2.5446)	Entropy 0.60799 (0.60663)	Top-1 acc 59.766 (62.618)	Top-5 acc 79.688 (83.073)	lr 0.00837
Train [73][2830/3239]	Time 0.244 (0.995)	Data Time 0.001 (0.489)	Loss 2.5186 (2.5447)	Entropy 0.60798 (0.60663)	Top-1 acc 62.109 (62.618)	Top-5 acc 83.984 (83.071)	lr 0.00837
Train [73][2840/3239]	Time 0.277 (0.995)	Data Time 0.001 (0.489)	Loss 2.7121 (2.5449)	Entropy 0.60844 (0.60664)	Top-1 acc 60.938 (62.612)	Top-5 acc 79.297 (83.065)	lr 0.00837
Train [73][2850/3239]	Time 0.281 (1.001)	Data Time 0.001 (0.495)	Loss 2.5345 (2.5450)	Entropy 0.60834 (0.60664)	Top-1 acc 60.938 (62.613)	Top-5 acc 83.203 (83.064)	lr 0.00836
Train [73][2860/3239]	Time 0.241 (0.999)	Data Time 0.002 (0.493)	Loss 2.5717 (2.5449)	Entropy 0.60868 (0.60665)	Top-1 acc 63.281 (62.615)	Top-5 acc 84.766 (83.065)	lr 0.00836
Train [73][2870/3239]	Time 0.329 (0.999)	Data Time 0.089 (0.494)	Loss 2.6012 (2.5449)	Entropy 0.60830 (0.60666)	Top-1 acc 58.984 (62.614)	Top-5 acc 82.031 (83.068)	lr 0.00836
Train [73][2880/3239]	Time 0.270 (1.004)	Data Time 0.001 (0.499)	Loss 2.6358 (2.5449)	Entropy 0.60804 (0.60666)	Top-1 acc 60.938 (62.615)	Top-5 acc 83.203 (83.069)	lr 0.00836
Train [73][2890/3239]	Time 0.245 (1.004)	Data Time 0.001 (0.499)	Loss 2.6744 (2.5451)	Entropy 0.60813 (0.60667)	Top-1 acc 60.156 (62.609)	Top-5 acc 80.859 (83.066)	lr 0.00836
Train [73][2900/3239]	Time 0.260 (1.002)	Data Time 0.001 (0.497)	Loss 2.6021 (2.5453)	Entropy 0.60825 (0.60667)	Top-1 acc 60.547 (62.605)	Top-5 acc 80.078 (83.061)	lr 0.00836
Train [73][2910/3239]	Time 5.279 (1.008)	Data Time 5.022 (0.503)	Loss 2.4649 (2.5454)	Entropy 0.60820 (0.60668)	Top-1 acc 67.969 (62.605)	Top-5 acc 83.203 (83.062)	lr 0.00836
Train [73][2920/3239]	Time 0.413 (1.007)	Data Time 0.001 (0.503)	Loss 2.6177 (2.5454)	Entropy 0.60812 (0.60668)	Top-1 acc 59.766 (62.606)	Top-5 acc 81.250 (83.060)	lr 0.00836
Train [73][2930/3239]	Time 0.268 (1.007)	Data Time 0.001 (0.503)	Loss 2.6818 (2.5452)	Entropy 0.60812 (0.60669)	Top-1 acc 58.594 (62.608)	Top-5 acc 80.859 (83.063)	lr 0.00836
Train [73][2940/3239]	Time 0.248 (1.010)	Data Time 0.001 (0.507)	Loss 2.5823 (2.5454)	Entropy 0.60774 (0.60669)	Top-1 acc 60.156 (62.606)	Top-5 acc 83.984 (83.062)	lr 0.00836
Train [73][2950/3239]	Time 0.245 (1.011)	Data Time 0.001 (0.507)	Loss 2.3732 (2.5454)	Entropy 0.60677 (0.60669)	Top-1 acc 64.844 (62.608)	Top-5 acc 87.109 (83.062)	lr 0.00836
Train [73][2960/3239]	Time 2.749 (1.011)	Data Time 2.470 (0.508)	Loss 2.4554 (2.5452)	Entropy 0.60671 (0.60669)	Top-1 acc 58.984 (62.611)	Top-5 acc 84.375 (83.065)	lr 0.00835
Train [73][2970/3239]	Time 8.062 (1.012)	Data Time 7.805 (0.509)	Loss 2.4942 (2.5451)	Entropy 0.60672 (0.60669)	Top-1 acc 63.672 (62.616)	Top-5 acc 82.422 (83.067)	lr 0.00835
Train [73][2980/3239]	Time 0.285 (1.014)	Data Time 0.001 (0.511)	Loss 2.5527 (2.5451)	Entropy 0.60690 (0.60670)	Top-1 acc 61.328 (62.616)	Top-5 acc 83.984 (83.068)	lr 0.00835
Train [73][2990/3239]	Time 0.416 (1.013)	Data Time 0.053 (0.510)	Loss 2.5779 (2.5452)	Entropy 0.60699 (0.60670)	Top-1 acc 65.625 (62.614)	Top-5 acc 81.250 (83.067)	lr 0.00835
Train [73][3000/3239]	Time 1.958 (1.013)	Data Time 1.710 (0.511)	Loss 2.6703 (2.5451)	Entropy 0.60699 (0.60670)	Top-1 acc 58.594 (62.617)	Top-5 acc 78.516 (83.066)	lr 0.00835
Train [73][3010/3239]	Time 0.299 (1.018)	Data Time 0.002 (0.515)	Loss 2.2662 (2.5449)	Entropy 0.60684 (0.60670)	Top-1 acc 71.484 (62.625)	Top-5 acc 87.500 (83.071)	lr 0.00835
Train [73][3020/3239]	Time 0.233 (1.016)	Data Time 0.001 (0.514)	Loss 2.9456 (2.5449)	Entropy 0.60690 (0.60670)	Top-1 acc 55.469 (62.622)	Top-5 acc 76.562 (83.072)	lr 0.00835
Train [73][3030/3239]	Time 0.257 (1.016)	Data Time 0.001 (0.515)	Loss 2.4245 (2.5449)	Entropy 0.60692 (0.60670)	Top-1 acc 65.234 (62.624)	Top-5 acc 86.328 (83.074)	lr 0.00835
Train [73][3040/3239]	Time 0.248 (1.018)	Data Time 0.001 (0.517)	Loss 2.5157 (2.5447)	Entropy 0.60713 (0.60670)	Top-1 acc 64.062 (62.628)	Top-5 acc 82.422 (83.076)	lr 0.00835
Train [73][3050/3239]	Time 0.228 (1.020)	Data Time 0.001 (0.519)	Loss 2.4674 (2.5448)	Entropy 0.60738 (0.60670)	Top-1 acc 66.016 (62.623)	Top-5 acc 85.938 (83.077)	lr 0.00835
Train [73][3060/3239]	Time 0.237 (1.019)	Data Time 0.001 (0.518)	Loss 2.5292 (2.5447)	Entropy 0.60715 (0.60670)	Top-1 acc 65.234 (62.624)	Top-5 acc 83.984 (83.078)	lr 0.00834
Train [73][3070/3239]	Time 3.998 (1.022)	Data Time 3.753 (0.521)	Loss 2.5728 (2.5446)	Entropy 0.60712 (0.60670)	Top-1 acc 58.984 (62.626)	Top-5 acc 84.766 (83.080)	lr 0.00834
Train [73][3080/3239]	Time 0.357 (1.022)	Data Time 0.001 (0.522)	Loss 2.7795 (2.5445)	Entropy 0.60726 (0.60671)	Top-1 acc 58.203 (62.628)	Top-5 acc 81.641 (83.084)	lr 0.00834
Train [73][3090/3239]	Time 0.256 (1.024)	Data Time 0.001 (0.523)	Loss 2.5055 (2.5444)	Entropy 0.60749 (0.60671)	Top-1 acc 61.719 (62.629)	Top-5 acc 83.984 (83.085)	lr 0.00834
Train [73][3100/3239]	Time 2.369 (1.025)	Data Time 2.084 (0.525)	Loss 2.4105 (2.5442)	Entropy 0.60771 (0.60671)	Top-1 acc 68.359 (62.633)	Top-5 acc 84.766 (83.089)	lr 0.00834
Train [73][3110/3239]	Time 0.271 (1.027)	Data Time 0.001 (0.527)	Loss 2.7693 (2.5443)	Entropy 0.60782 (0.60671)	Top-1 acc 58.594 (62.630)	Top-5 acc 78.125 (83.090)	lr 0.00834
Train [73][3120/3239]	Time 3.942 (1.026)	Data Time 3.682 (0.527)	Loss 2.6135 (2.5445)	Entropy 0.60756 (0.60672)	Top-1 acc 63.281 (62.627)	Top-5 acc 83.203 (83.089)	lr 0.00834
Train [73][3130/3239]	Time 0.262 (1.026)	Data Time 0.002 (0.527)	Loss 2.2988 (2.5444)	Entropy 0.60766 (0.60672)	Top-1 acc 68.359 (62.625)	Top-5 acc 87.500 (83.088)	lr 0.00834
Train [73][3140/3239]	Time 0.251 (1.031)	Data Time 0.002 (0.531)	Loss 2.7108 (2.5445)	Entropy 0.60784 (0.60672)	Top-1 acc 62.891 (62.625)	Top-5 acc 79.688 (83.088)	lr 0.00834
Train [73][3150/3239]	Time 0.331 (1.045)	Data Time 0.002 (0.530)	Loss 2.4965 (2.5443)	Entropy 0.60793 (0.60673)	Top-1 acc 61.719 (62.628)	Top-5 acc 83.203 (83.092)	lr 0.00834
Train [73][3160/3239]	Time 0.263 (1.043)	Data Time 0.002 (0.528)	Loss 2.4569 (2.5441)	Entropy 0.60780 (0.60673)	Top-1 acc 63.281 (62.632)	Top-5 acc 86.328 (83.095)	lr 0.00834
Train [73][3170/3239]	Time 0.271 (1.041)	Data Time 0.003 (0.526)	Loss 2.8078 (2.5443)	Entropy 0.60809 (0.60673)	Top-1 acc 55.469 (62.627)	Top-5 acc 80.078 (83.092)	lr 0.00833
Train [73][3180/3239]	Time 0.249 (1.039)	Data Time 0.000 (0.525)	Loss 2.5125 (2.5443)	Entropy 0.60800 (0.60674)	Top-1 acc 63.281 (62.628)	Top-5 acc 82.812 (83.094)	lr 0.00833
Train [73][3190/3239]	Time 0.246 (1.037)	Data Time 0.000 (0.523)	Loss 2.5806 (2.5443)	Entropy 0.60778 (0.60674)	Top-1 acc 61.719 (62.631)	Top-5 acc 79.688 (83.091)	lr 0.00833
Train [73][3200/3239]	Time 0.254 (1.035)	Data Time 0.000 (0.522)	Loss 2.6980 (2.5444)	Entropy 0.60771 (0.60675)	Top-1 acc 60.938 (62.629)	Top-5 acc 78.516 (83.088)	lr 0.00833
Train [73][3210/3239]	Time 0.252 (1.037)	Data Time 0.000 (0.524)	Loss 2.7110 (2.5442)	Entropy 0.60776 (0.60675)	Top-1 acc 58.203 (62.636)	Top-5 acc 82.812 (83.091)	lr 0.00833
Train [73][3220/3239]	Time 0.258 (1.036)	Data Time 0.000 (0.522)	Loss 2.5273 (2.5440)	Entropy 0.60816 (0.60675)	Top-1 acc 61.328 (62.641)	Top-5 acc 83.203 (83.094)	lr 0.00833
Train [73][3230/3239]	Time 0.247 (1.034)	Data Time 0.000 (0.520)	Loss 2.4925 (2.5437)	Entropy 0.60795 (0.60676)	Top-1 acc 64.062 (62.651)	Top-5 acc 83.984 (83.099)	lr 0.00833
Train [73][3239/3239]	Time 0.979 (1.034)	Data Time 0.000 (0.521)	Loss 2.7193 (2.5441)	Entropy 0.60790 (0.60676)	Top-1 acc 51.852 (62.644)	Top-5 acc 76.543 (83.093)	lr 0.00833
==========Valid [73/120]	loss 1.342	top-1 acc 69.291 (69.291)	top-5 acc 88.555	Train top-1 62.644	top-5 83.093	Entropy 0.60790	Latency-None: 0.000ms	Flops: 539.00M
Train [74][0/3239]	Time 48.145 (48.145)	Data Time 47.768 (47.768)	Loss 2.3773 (2.3773)	Entropy 0.60778 (0.60778)	Top-1 acc 69.141 (69.141)	Top-5 acc 86.719 (86.719)	lr 0.00833
Train [74][10/3239]	Time 0.232 (4.783)	Data Time 0.001 (4.344)	Loss 2.6005 (2.4704)	Entropy 0.60742 (0.60771)	Top-1 acc 60.938 (64.773)	Top-5 acc 82.422 (84.624)	lr 0.00833
Train [74][20/3239]	Time 0.302 (2.724)	Data Time 0.003 (2.277)	Loss 2.3263 (2.4793)	Entropy 0.60731 (0.60755)	Top-1 acc 67.969 (64.249)	Top-5 acc 86.719 (84.524)	lr 0.00833
Train [74][30/3239]	Time 0.241 (2.004)	Data Time 0.001 (1.543)	Loss 2.6246 (2.5086)	Entropy 0.60700 (0.60741)	Top-1 acc 62.109 (63.458)	Top-5 acc 80.469 (84.047)	lr 0.00832
Train [74][40/3239]	Time 0.233 (1.649)	Data Time 0.001 (1.199)	Loss 2.4588 (2.5024)	Entropy 0.60712 (0.60732)	Top-1 acc 62.891 (63.758)	Top-5 acc 83.984 (84.184)	lr 0.00832
Train [74][50/3239]	Time 0.291 (1.426)	Data Time 0.002 (0.964)	Loss 2.4203 (2.5015)	Entropy 0.60705 (0.60730)	Top-1 acc 64.453 (63.802)	Top-5 acc 84.766 (84.245)	lr 0.00832
Train [74][60/3239]	Time 0.239 (1.288)	Data Time 0.001 (0.806)	Loss 2.6657 (2.5035)	Entropy 0.60741 (0.60727)	Top-1 acc 61.328 (63.877)	Top-5 acc 79.688 (84.100)	lr 0.00832
Train [74][70/3239]	Time 0.281 (1.169)	Data Time 0.001 (0.693)	Loss 2.5659 (2.5115)	Entropy 0.60726 (0.60728)	Top-1 acc 58.203 (63.474)	Top-5 acc 81.641 (83.891)	lr 0.00832
Train [74][80/3239]	Time 0.272 (1.081)	Data Time 0.002 (0.608)	Loss 2.4856 (2.5098)	Entropy 0.60667 (0.60724)	Top-1 acc 64.453 (63.489)	Top-5 acc 85.547 (83.931)	lr 0.00832
Train [74][90/3239]	Time 0.239 (1.010)	Data Time 0.001 (0.541)	Loss 2.8325 (2.5148)	Entropy 0.60654 (0.60718)	Top-1 acc 58.594 (63.483)	Top-5 acc 76.562 (83.851)	lr 0.00832
Train [74][100/3239]	Time 0.223 (0.956)	Data Time 0.001 (0.488)	Loss 2.6073 (2.5146)	Entropy 0.60637 (0.60711)	Top-1 acc 59.766 (63.428)	Top-5 acc 83.203 (83.822)	lr 0.00832
Train [74][110/3239]	Time 0.233 (0.913)	Data Time 0.001 (0.444)	Loss 2.7492 (2.5163)	Entropy 0.60614 (0.60704)	Top-1 acc 57.812 (63.464)	Top-5 acc 79.297 (83.798)	lr 0.00832
Train [74][120/3239]	Time 0.244 (0.876)	Data Time 0.001 (0.407)	Loss 2.4212 (2.5193)	Entropy 0.60616 (0.60696)	Top-1 acc 66.016 (63.465)	Top-5 acc 86.328 (83.755)	lr 0.00832
Train [74][130/3239]	Time 0.232 (0.845)	Data Time 0.001 (0.376)	Loss 2.6036 (2.5254)	Entropy 0.60610 (0.60690)	Top-1 acc 56.250 (63.278)	Top-5 acc 81.250 (83.677)	lr 0.00832
Train [74][140/3239]	Time 0.349 (0.818)	Data Time 0.001 (0.350)	Loss 2.7245 (2.5241)	Entropy 0.60616 (0.60684)	Top-1 acc 56.250 (63.265)	Top-5 acc 82.031 (83.707)	lr 0.00831
Train [74][150/3239]	Time 0.284 (0.794)	Data Time 0.001 (0.327)	Loss 2.5441 (2.5235)	Entropy 0.60612 (0.60680)	Top-1 acc 64.062 (63.227)	Top-5 acc 83.203 (83.705)	lr 0.00831
Train [74][160/3239]	Time 0.284 (0.773)	Data Time 0.001 (0.307)	Loss 2.5956 (2.5218)	Entropy 0.60648 (0.60676)	Top-1 acc 61.719 (63.235)	Top-5 acc 81.250 (83.717)	lr 0.00831
Train [74][170/3239]	Time 0.309 (0.755)	Data Time 0.001 (0.289)	Loss 2.4174 (2.5249)	Entropy 0.60649 (0.60675)	Top-1 acc 67.969 (63.188)	Top-5 acc 85.156 (83.619)	lr 0.00831
Train [74][180/3239]	Time 0.269 (0.740)	Data Time 0.001 (0.273)	Loss 2.4199 (2.5256)	Entropy 0.60631 (0.60673)	Top-1 acc 65.625 (63.186)	Top-5 acc 85.156 (83.615)	lr 0.00831
Train [74][190/3239]	Time 0.243 (0.725)	Data Time 0.001 (0.259)	Loss 2.3533 (2.5229)	Entropy 0.60612 (0.60671)	Top-1 acc 65.625 (63.275)	Top-5 acc 85.547 (83.616)	lr 0.00831
Train [74][200/3239]	Time 0.251 (0.711)	Data Time 0.002 (0.246)	Loss 2.4306 (2.5199)	Entropy 0.60620 (0.60668)	Top-1 acc 66.016 (63.332)	Top-5 acc 87.891 (83.683)	lr 0.00831
Train [74][210/3239]	Time 0.433 (0.699)	Data Time 0.001 (0.234)	Loss 2.5081 (2.5184)	Entropy 0.60595 (0.60666)	Top-1 acc 64.062 (63.378)	Top-5 acc 83.203 (83.677)	lr 0.00831
Train [74][220/3239]	Time 0.281 (0.689)	Data Time 0.001 (0.224)	Loss 2.3650 (2.5185)	Entropy 0.60612 (0.60663)	Top-1 acc 66.016 (63.354)	Top-5 acc 82.031 (83.656)	lr 0.00831
Train [74][230/3239]	Time 0.272 (0.678)	Data Time 0.001 (0.214)	Loss 2.6941 (2.5170)	Entropy 0.60573 (0.60660)	Top-1 acc 57.812 (63.403)	Top-5 acc 81.250 (83.677)	lr 0.00831
Train [74][240/3239]	Time 0.260 (0.671)	Data Time 0.001 (0.205)	Loss 2.4905 (2.5162)	Entropy 0.60544 (0.60657)	Top-1 acc 65.234 (63.469)	Top-5 acc 84.766 (83.691)	lr 0.00830
Train [74][250/3239]	Time 0.260 (0.663)	Data Time 0.001 (0.197)	Loss 2.5940 (2.5136)	Entropy 0.60528 (0.60652)	Top-1 acc 60.547 (63.538)	Top-5 acc 81.641 (83.723)	lr 0.00830
Train [74][260/3239]	Time 0.227 (0.655)	Data Time 0.001 (0.190)	Loss 2.5539 (2.5102)	Entropy 0.60529 (0.60647)	Top-1 acc 61.719 (63.609)	Top-5 acc 82.422 (83.785)	lr 0.00830
Train [74][270/3239]	Time 0.242 (0.648)	Data Time 0.001 (0.183)	Loss 2.4563 (2.5122)	Entropy 0.60545 (0.60644)	Top-1 acc 64.844 (63.597)	Top-5 acc 85.547 (83.735)	lr 0.00830
Train [74][280/3239]	Time 0.269 (0.641)	Data Time 0.001 (0.176)	Loss 2.6058 (2.5125)	Entropy 0.60569 (0.60640)	Top-1 acc 58.203 (63.559)	Top-5 acc 85.156 (83.768)	lr 0.00830
Train [74][290/3239]	Time 0.235 (0.635)	Data Time 0.001 (0.170)	Loss 2.4921 (2.5117)	Entropy 0.60573 (0.60638)	Top-1 acc 61.719 (63.546)	Top-5 acc 84.375 (83.811)	lr 0.00830
Train [74][300/3239]	Time 0.361 (0.628)	Data Time 0.001 (0.165)	Loss 2.6322 (2.5136)	Entropy 0.60583 (0.60636)	Top-1 acc 60.938 (63.495)	Top-5 acc 82.031 (83.766)	lr 0.00830
Train [74][310/3239]	Time 0.272 (0.621)	Data Time 0.001 (0.160)	Loss 2.4930 (2.5125)	Entropy 0.60577 (0.60634)	Top-1 acc 66.016 (63.507)	Top-5 acc 82.812 (83.768)	lr 0.00830
Train [74][320/3239]	Time 0.236 (0.615)	Data Time 0.001 (0.155)	Loss 2.3320 (2.5091)	Entropy 0.60586 (0.60632)	Top-1 acc 66.406 (63.573)	Top-5 acc 88.281 (83.843)	lr 0.00830
Train [74][330/3239]	Time 0.237 (0.609)	Data Time 0.001 (0.150)	Loss 2.3907 (2.5086)	Entropy 0.60609 (0.60631)	Top-1 acc 66.016 (63.585)	Top-5 acc 87.500 (83.868)	lr 0.00830
Train [74][340/3239]	Time 0.278 (0.603)	Data Time 0.002 (0.146)	Loss 2.4554 (2.5088)	Entropy 0.60589 (0.60630)	Top-1 acc 63.281 (63.599)	Top-5 acc 83.984 (83.861)	lr 0.00830
Train [74][350/3239]	Time 0.352 (0.601)	Data Time 0.002 (0.142)	Loss 2.3424 (2.5087)	Entropy 0.60625 (0.60630)	Top-1 acc 69.922 (63.612)	Top-5 acc 86.719 (83.837)	lr 0.00829
Train [74][360/3239]	Time 0.252 (0.597)	Data Time 0.001 (0.138)	Loss 2.6589 (2.5094)	Entropy 0.60641 (0.60630)	Top-1 acc 60.547 (63.582)	Top-5 acc 80.469 (83.840)	lr 0.00829
Train [74][370/3239]	Time 0.391 (0.594)	Data Time 0.001 (0.134)	Loss 2.3665 (2.5095)	Entropy 0.60662 (0.60630)	Top-1 acc 67.578 (63.583)	Top-5 acc 87.109 (83.849)	lr 0.00829
Train [74][380/3239]	Time 0.257 (0.591)	Data Time 0.001 (0.131)	Loss 2.3968 (2.5101)	Entropy 0.60651 (0.60631)	Top-1 acc 62.891 (63.589)	Top-5 acc 86.719 (83.816)	lr 0.00829
Train [74][390/3239]	Time 0.256 (0.588)	Data Time 0.001 (0.127)	Loss 2.3890 (2.5089)	Entropy 0.60636 (0.60632)	Top-1 acc 67.969 (63.643)	Top-5 acc 87.109 (83.825)	lr 0.00829
Train [74][400/3239]	Time 0.233 (0.586)	Data Time 0.001 (0.124)	Loss 2.5898 (2.5103)	Entropy 0.60627 (0.60632)	Top-1 acc 60.156 (63.574)	Top-5 acc 81.641 (83.808)	lr 0.00829
Train [74][410/3239]	Time 0.239 (0.582)	Data Time 0.001 (0.121)	Loss 2.2910 (2.5095)	Entropy 0.60636 (0.60632)	Top-1 acc 70.312 (63.583)	Top-5 acc 86.328 (83.817)	lr 0.00829
Train [74][420/3239]	Time 0.234 (0.580)	Data Time 0.001 (0.118)	Loss 2.4495 (2.5092)	Entropy 0.60662 (0.60632)	Top-1 acc 64.453 (63.585)	Top-5 acc 85.547 (83.820)	lr 0.00829
Train [74][430/3239]	Time 0.258 (0.577)	Data Time 0.001 (0.116)	Loss 2.4852 (2.5102)	Entropy 0.60653 (0.60633)	Top-1 acc 61.328 (63.575)	Top-5 acc 84.375 (83.788)	lr 0.00829
Train [74][440/3239]	Time 0.266 (0.575)	Data Time 0.001 (0.113)	Loss 2.5200 (2.5100)	Entropy 0.60658 (0.60633)	Top-1 acc 60.156 (63.562)	Top-5 acc 84.766 (83.797)	lr 0.00829
Train [74][450/3239]	Time 0.268 (0.572)	Data Time 0.001 (0.111)	Loss 2.6247 (2.5118)	Entropy 0.60667 (0.60634)	Top-1 acc 60.547 (63.549)	Top-5 acc 82.031 (83.757)	lr 0.00828
Train [74][460/3239]	Time 0.370 (0.571)	Data Time 0.001 (0.108)	Loss 2.5233 (2.5122)	Entropy 0.60618 (0.60634)	Top-1 acc 61.719 (63.545)	Top-5 acc 83.594 (83.754)	lr 0.00828
Train [74][470/3239]	Time 0.251 (0.568)	Data Time 0.001 (0.106)	Loss 2.4651 (2.5130)	Entropy 0.60596 (0.60634)	Top-1 acc 65.234 (63.544)	Top-5 acc 82.422 (83.731)	lr 0.00828
Train [74][480/3239]	Time 0.275 (0.566)	Data Time 0.001 (0.104)	Loss 2.2858 (2.5127)	Entropy 0.60629 (0.60633)	Top-1 acc 66.797 (63.541)	Top-5 acc 89.062 (83.729)	lr 0.00828
Train [74][490/3239]	Time 0.257 (0.563)	Data Time 0.001 (0.102)	Loss 2.4606 (2.5135)	Entropy 0.60614 (0.60633)	Top-1 acc 64.062 (63.505)	Top-5 acc 84.766 (83.727)	lr 0.00828
Train [74][500/3239]	Time 0.269 (0.561)	Data Time 0.001 (0.100)	Loss 2.2970 (2.5122)	Entropy 0.60637 (0.60633)	Top-1 acc 69.141 (63.544)	Top-5 acc 88.281 (83.740)	lr 0.00828
Train [74][510/3239]	Time 0.287 (0.560)	Data Time 0.002 (0.098)	Loss 2.4644 (2.5130)	Entropy 0.60611 (0.60632)	Top-1 acc 67.969 (63.521)	Top-5 acc 84.375 (83.718)	lr 0.00828
Train [74][520/3239]	Time 0.262 (0.558)	Data Time 0.001 (0.096)	Loss 2.7643 (2.5153)	Entropy 0.60578 (0.60632)	Top-1 acc 57.031 (63.448)	Top-5 acc 80.469 (83.670)	lr 0.00828
Train [74][530/3239]	Time 0.379 (0.556)	Data Time 0.002 (0.094)	Loss 2.5205 (2.5172)	Entropy 0.60599 (0.60631)	Top-1 acc 62.891 (63.395)	Top-5 acc 83.594 (83.626)	lr 0.00828
Train [74][540/3239]	Time 0.260 (0.554)	Data Time 0.001 (0.093)	Loss 2.5766 (2.5173)	Entropy 0.60617 (0.60630)	Top-1 acc 63.672 (63.387)	Top-5 acc 80.859 (83.607)	lr 0.00828
Train [74][550/3239]	Time 0.245 (0.553)	Data Time 0.001 (0.091)	Loss 2.4082 (2.5174)	Entropy 0.60627 (0.60630)	Top-1 acc 62.891 (63.373)	Top-5 acc 88.281 (83.604)	lr 0.00828
Train [74][560/3239]	Time 0.400 (0.638)	Data Time 0.005 (0.089)	Loss 2.4187 (2.5176)	Entropy 0.60634 (0.60630)	Top-1 acc 66.016 (63.365)	Top-5 acc 85.547 (83.615)	lr 0.00827
Train [74][570/3239]	Time 0.261 (0.636)	Data Time 0.002 (0.088)	Loss 2.4230 (2.5192)	Entropy 0.60651 (0.60630)	Top-1 acc 62.500 (63.320)	Top-5 acc 85.938 (83.592)	lr 0.00827
Train [74][580/3239]	Time 0.240 (0.633)	Data Time 0.002 (0.086)	Loss 2.6529 (2.5196)	Entropy 0.60676 (0.60630)	Top-1 acc 58.984 (63.320)	Top-5 acc 80.469 (83.588)	lr 0.00827
Train [74][590/3239]	Time 0.258 (0.630)	Data Time 0.002 (0.085)	Loss 2.4346 (2.5198)	Entropy 0.60684 (0.60631)	Top-1 acc 62.891 (63.322)	Top-5 acc 85.938 (83.581)	lr 0.00827
Train [74][600/3239]	Time 0.237 (0.627)	Data Time 0.001 (0.084)	Loss 2.4939 (2.5197)	Entropy 0.60693 (0.60632)	Top-1 acc 62.500 (63.333)	Top-5 acc 82.422 (83.577)	lr 0.00827
Train [74][610/3239]	Time 0.254 (0.624)	Data Time 0.001 (0.082)	Loss 2.5255 (2.5186)	Entropy 0.60688 (0.60633)	Top-1 acc 62.891 (63.369)	Top-5 acc 82.031 (83.600)	lr 0.00827
Train [74][620/3239]	Time 0.331 (0.621)	Data Time 0.002 (0.081)	Loss 2.7124 (2.5194)	Entropy 0.60674 (0.60634)	Top-1 acc 57.812 (63.349)	Top-5 acc 78.906 (83.581)	lr 0.00827
Train [74][630/3239]	Time 0.241 (0.619)	Data Time 0.001 (0.080)	Loss 2.5463 (2.5192)	Entropy 0.60690 (0.60635)	Top-1 acc 62.500 (63.340)	Top-5 acc 80.469 (83.585)	lr 0.00827
Train [74][640/3239]	Time 0.230 (0.616)	Data Time 0.001 (0.078)	Loss 2.6111 (2.5195)	Entropy 0.60720 (0.60636)	Top-1 acc 62.891 (63.331)	Top-5 acc 81.250 (83.585)	lr 0.00827
Train [74][650/3239]	Time 0.266 (0.614)	Data Time 0.001 (0.077)	Loss 2.3640 (2.5192)	Entropy 0.60682 (0.60637)	Top-1 acc 68.359 (63.335)	Top-5 acc 87.500 (83.588)	lr 0.00827
Train [74][660/3239]	Time 0.279 (0.611)	Data Time 0.001 (0.076)	Loss 2.6637 (2.5199)	Entropy 0.60705 (0.60638)	Top-1 acc 58.984 (63.308)	Top-5 acc 79.297 (83.569)	lr 0.00826
Train [74][670/3239]	Time 0.243 (0.609)	Data Time 0.001 (0.075)	Loss 2.8921 (2.5204)	Entropy 0.60718 (0.60639)	Top-1 acc 55.469 (63.294)	Top-5 acc 78.125 (83.569)	lr 0.00826
Train [74][680/3239]	Time 0.240 (0.607)	Data Time 0.001 (0.074)	Loss 2.3129 (2.5201)	Entropy 0.60702 (0.60640)	Top-1 acc 71.094 (63.311)	Top-5 acc 85.547 (83.569)	lr 0.00826
Train [74][690/3239]	Time 0.364 (0.604)	Data Time 0.001 (0.073)	Loss 2.4949 (2.5198)	Entropy 0.60677 (0.60641)	Top-1 acc 62.500 (63.307)	Top-5 acc 83.984 (83.573)	lr 0.00826
Train [74][700/3239]	Time 0.247 (0.602)	Data Time 0.001 (0.072)	Loss 2.4624 (2.5199)	Entropy 0.60674 (0.60641)	Top-1 acc 61.328 (63.294)	Top-5 acc 86.328 (83.573)	lr 0.00826
Train [74][710/3239]	Time 0.256 (0.600)	Data Time 0.001 (0.071)	Loss 2.4444 (2.5194)	Entropy 0.60677 (0.60642)	Top-1 acc 70.312 (63.302)	Top-5 acc 85.156 (83.581)	lr 0.00826
Train [74][720/3239]	Time 1.642 (0.600)	Data Time 1.352 (0.072)	Loss 2.3751 (2.5192)	Entropy 0.60682 (0.60642)	Top-1 acc 67.578 (63.296)	Top-5 acc 86.719 (83.586)	lr 0.00826
Train [74][730/3239]	Time 2.935 (0.605)	Data Time 2.584 (0.077)	Loss 2.5489 (2.5187)	Entropy 0.60681 (0.60643)	Top-1 acc 60.938 (63.304)	Top-5 acc 81.641 (83.589)	lr 0.00826
Train [74][740/3239]	Time 0.239 (0.603)	Data Time 0.001 (0.076)	Loss 2.5261 (2.5192)	Entropy 0.60681 (0.60643)	Top-1 acc 60.547 (63.300)	Top-5 acc 83.594 (83.577)	lr 0.00826
Train [74][750/3239]	Time 0.233 (0.601)	Data Time 0.001 (0.076)	Loss 2.7508 (2.5203)	Entropy 0.60709 (0.60644)	Top-1 acc 57.812 (63.271)	Top-5 acc 79.688 (83.562)	lr 0.00826
Train [74][760/3239]	Time 0.232 (0.603)	Data Time 0.001 (0.078)	Loss 2.6724 (2.5208)	Entropy 0.60762 (0.60645)	Top-1 acc 56.250 (63.247)	Top-5 acc 82.812 (83.554)	lr 0.00826
Train [74][770/3239]	Time 0.241 (0.603)	Data Time 0.001 (0.079)	Loss 2.9170 (2.5213)	Entropy 0.60748 (0.60646)	Top-1 acc 51.562 (63.223)	Top-5 acc 79.297 (83.548)	lr 0.00825
Train [74][780/3239]	Time 0.241 (0.601)	Data Time 0.001 (0.079)	Loss 2.5306 (2.5211)	Entropy 0.60773 (0.60648)	Top-1 acc 65.625 (63.219)	Top-5 acc 82.422 (83.554)	lr 0.00825
Train [74][790/3239]	Time 0.229 (0.605)	Data Time 0.001 (0.084)	Loss 2.6633 (2.5208)	Entropy 0.60786 (0.60649)	Top-1 acc 59.766 (63.234)	Top-5 acc 82.031 (83.559)	lr 0.00825
Train [74][800/3239]	Time 0.233 (0.607)	Data Time 0.001 (0.087)	Loss 2.5460 (2.5209)	Entropy 0.60762 (0.60651)	Top-1 acc 61.719 (63.214)	Top-5 acc 82.031 (83.557)	lr 0.00825
Train [74][810/3239]	Time 0.237 (0.605)	Data Time 0.001 (0.086)	Loss 2.6518 (2.5216)	Entropy 0.60809 (0.60652)	Top-1 acc 61.719 (63.196)	Top-5 acc 83.984 (83.552)	lr 0.00825
Train [74][820/3239]	Time 0.254 (0.602)	Data Time 0.001 (0.085)	Loss 2.6614 (2.5217)	Entropy 0.60759 (0.60654)	Top-1 acc 57.031 (63.206)	Top-5 acc 80.469 (83.550)	lr 0.00825
Train [74][830/3239]	Time 0.262 (0.608)	Data Time 0.001 (0.091)	Loss 2.5045 (2.5216)	Entropy 0.60764 (0.60655)	Top-1 acc 66.016 (63.210)	Top-5 acc 82.812 (83.543)	lr 0.00825
Train [74][840/3239]	Time 0.239 (0.606)	Data Time 0.001 (0.090)	Loss 2.4844 (2.5215)	Entropy 0.60793 (0.60657)	Top-1 acc 61.719 (63.216)	Top-5 acc 84.375 (83.544)	lr 0.00825
Train [74][850/3239]	Time 0.319 (0.604)	Data Time 0.001 (0.089)	Loss 2.5972 (2.5214)	Entropy 0.60778 (0.60658)	Top-1 acc 60.547 (63.218)	Top-5 acc 83.203 (83.538)	lr 0.00825
Train [74][860/3239]	Time 0.255 (0.610)	Data Time 0.001 (0.095)	Loss 2.4163 (2.5213)	Entropy 0.60746 (0.60660)	Top-1 acc 62.500 (63.211)	Top-5 acc 84.766 (83.535)	lr 0.00825
Train [74][870/3239]	Time 0.248 (0.608)	Data Time 0.001 (0.094)	Loss 2.5455 (2.5208)	Entropy 0.60726 (0.60661)	Top-1 acc 64.062 (63.217)	Top-5 acc 83.984 (83.546)	lr 0.00824
Train [74][880/3239]	Time 0.239 (0.607)	Data Time 0.001 (0.093)	Loss 2.5327 (2.5206)	Entropy 0.60713 (0.60661)	Top-1 acc 63.281 (63.226)	Top-5 acc 82.422 (83.547)	lr 0.00824
Train [74][890/3239]	Time 1.228 (0.612)	Data Time 0.990 (0.099)	Loss 2.4616 (2.5199)	Entropy 0.60712 (0.60662)	Top-1 acc 62.109 (63.233)	Top-5 acc 83.984 (83.555)	lr 0.00824
Train [74][900/3239]	Time 0.252 (0.610)	Data Time 0.001 (0.098)	Loss 2.7980 (2.5197)	Entropy 0.60723 (0.60663)	Top-1 acc 55.469 (63.241)	Top-5 acc 80.078 (83.555)	lr 0.00824
Train [74][910/3239]	Time 0.231 (0.608)	Data Time 0.001 (0.097)	Loss 2.4964 (2.5196)	Entropy 0.60719 (0.60663)	Top-1 acc 65.234 (63.241)	Top-5 acc 82.812 (83.562)	lr 0.00824
Train [74][920/3239]	Time 0.352 (0.614)	Data Time 0.001 (0.104)	Loss 2.3388 (2.5191)	Entropy 0.60681 (0.60664)	Top-1 acc 66.016 (63.255)	Top-5 acc 86.719 (83.564)	lr 0.00824
Train [74][930/3239]	Time 0.257 (0.617)	Data Time 0.001 (0.108)	Loss 2.4889 (2.5186)	Entropy 0.60667 (0.60664)	Top-1 acc 60.156 (63.267)	Top-5 acc 84.375 (83.569)	lr 0.00824
Train [74][940/3239]	Time 0.238 (0.615)	Data Time 0.001 (0.107)	Loss 2.7012 (2.5187)	Entropy 0.60635 (0.60664)	Top-1 acc 60.938 (63.256)	Top-5 acc 78.125 (83.558)	lr 0.00824
Train [74][950/3239]	Time 0.247 (0.620)	Data Time 0.002 (0.112)	Loss 2.4168 (2.5193)	Entropy 0.60648 (0.60664)	Top-1 acc 64.844 (63.231)	Top-5 acc 85.156 (83.542)	lr 0.00824
Train [74][960/3239]	Time 0.237 (0.623)	Data Time 0.001 (0.116)	Loss 2.3376 (2.5186)	Entropy 0.60629 (0.60664)	Top-1 acc 70.703 (63.243)	Top-5 acc 85.547 (83.557)	lr 0.00824
Train [74][970/3239]	Time 0.251 (0.621)	Data Time 0.001 (0.115)	Loss 2.4188 (2.5183)	Entropy 0.60623 (0.60663)	Top-1 acc 66.797 (63.260)	Top-5 acc 85.938 (83.568)	lr 0.00824
Train [74][980/3239]	Time 0.245 (0.619)	Data Time 0.001 (0.114)	Loss 2.5821 (2.5188)	Entropy 0.60630 (0.60663)	Top-1 acc 64.844 (63.249)	Top-5 acc 82.812 (83.558)	lr 0.00823
Train [74][990/3239]	Time 0.241 (0.628)	Data Time 0.001 (0.123)	Loss 2.4755 (2.5182)	Entropy 0.60634 (0.60663)	Top-1 acc 60.547 (63.256)	Top-5 acc 85.156 (83.569)	lr 0.00823
Train [74][1000/3239]	Time 0.234 (0.626)	Data Time 0.001 (0.122)	Loss 2.5364 (2.5180)	Entropy 0.60641 (0.60662)	Top-1 acc 66.016 (63.271)	Top-5 acc 85.156 (83.579)	lr 0.00823
Train [74][1010/3239]	Time 0.329 (0.624)	Data Time 0.001 (0.121)	Loss 2.4832 (2.5176)	Entropy 0.60675 (0.60662)	Top-1 acc 62.891 (63.281)	Top-5 acc 83.594 (83.579)	lr 0.00823
Train [74][1020/3239]	Time 0.241 (0.633)	Data Time 0.001 (0.131)	Loss 2.5157 (2.5176)	Entropy 0.60679 (0.60662)	Top-1 acc 62.109 (63.277)	Top-5 acc 85.547 (83.580)	lr 0.00823
Train [74][1030/3239]	Time 0.272 (0.631)	Data Time 0.002 (0.129)	Loss 2.5246 (2.5185)	Entropy 0.60653 (0.60663)	Top-1 acc 61.719 (63.263)	Top-5 acc 82.812 (83.562)	lr 0.00823
Train [74][1040/3239]	Time 0.242 (0.629)	Data Time 0.001 (0.128)	Loss 2.3911 (2.5184)	Entropy 0.60659 (0.60662)	Top-1 acc 66.797 (63.262)	Top-5 acc 83.594 (83.555)	lr 0.00823
Train [74][1050/3239]	Time 1.415 (0.636)	Data Time 1.176 (0.136)	Loss 2.6018 (2.5185)	Entropy 0.60633 (0.60662)	Top-1 acc 64.453 (63.267)	Top-5 acc 83.203 (83.549)	lr 0.00823
Train [74][1060/3239]	Time 0.319 (0.634)	Data Time 0.001 (0.135)	Loss 2.7224 (2.5183)	Entropy 0.60610 (0.60662)	Top-1 acc 58.203 (63.254)	Top-5 acc 81.250 (83.550)	lr 0.00823
Train [74][1070/3239]	Time 0.252 (0.632)	Data Time 0.001 (0.134)	Loss 2.7047 (2.5183)	Entropy 0.60605 (0.60662)	Top-1 acc 58.594 (63.255)	Top-5 acc 80.859 (83.551)	lr 0.00823
Train [74][1080/3239]	Time 0.429 (0.638)	Data Time 0.001 (0.140)	Loss 2.3527 (2.5182)	Entropy 0.60588 (0.60661)	Top-1 acc 66.797 (63.263)	Top-5 acc 85.156 (83.551)	lr 0.00822
Train [74][1090/3239]	Time 0.246 (0.644)	Data Time 0.001 (0.147)	Loss 2.3972 (2.5175)	Entropy 0.60579 (0.60660)	Top-1 acc 66.406 (63.275)	Top-5 acc 85.938 (83.566)	lr 0.00822
Train [74][1100/3239]	Time 0.236 (0.642)	Data Time 0.001 (0.145)	Loss 2.4525 (2.5176)	Entropy 0.60538 (0.60659)	Top-1 acc 64.844 (63.267)	Top-5 acc 84.375 (83.560)	lr 0.00822
Train [74][1110/3239]	Time 0.255 (0.644)	Data Time 0.001 (0.147)	Loss 2.5517 (2.5183)	Entropy 0.60506 (0.60658)	Top-1 acc 64.453 (63.251)	Top-5 acc 83.594 (83.543)	lr 0.00822
Train [74][1120/3239]	Time 0.282 (0.647)	Data Time 0.001 (0.152)	Loss 2.5262 (2.5186)	Entropy 0.60500 (0.60657)	Top-1 acc 65.625 (63.241)	Top-5 acc 82.031 (83.541)	lr 0.00822
Train [74][1130/3239]	Time 0.239 (0.645)	Data Time 0.001 (0.150)	Loss 2.4961 (2.5183)	Entropy 0.60480 (0.60655)	Top-1 acc 62.891 (63.251)	Top-5 acc 85.156 (83.549)	lr 0.00822
Train [74][1140/3239]	Time 0.233 (0.644)	Data Time 0.001 (0.149)	Loss 2.4745 (2.5181)	Entropy 0.60499 (0.60654)	Top-1 acc 65.234 (63.256)	Top-5 acc 83.203 (83.549)	lr 0.00822
Train [74][1150/3239]	Time 0.237 (0.652)	Data Time 0.001 (0.158)	Loss 2.3880 (2.5184)	Entropy 0.60519 (0.60653)	Top-1 acc 67.188 (63.253)	Top-5 acc 86.328 (83.546)	lr 0.00822
Train [74][1160/3239]	Time 0.245 (0.650)	Data Time 0.001 (0.157)	Loss 2.5450 (2.5186)	Entropy 0.60548 (0.60652)	Top-1 acc 63.672 (63.257)	Top-5 acc 81.641 (83.539)	lr 0.00822
Train [74][1170/3239]	Time 0.288 (0.648)	Data Time 0.001 (0.155)	Loss 2.6654 (2.5190)	Entropy 0.60517 (0.60651)	Top-1 acc 58.594 (63.250)	Top-5 acc 82.422 (83.530)	lr 0.00822
Train [74][1180/3239]	Time 0.238 (0.658)	Data Time 0.001 (0.166)	Loss 2.4110 (2.5193)	Entropy 0.60533 (0.60650)	Top-1 acc 66.406 (63.246)	Top-5 acc 85.938 (83.521)	lr 0.00822
Train [74][1190/3239]	Time 0.240 (0.656)	Data Time 0.001 (0.165)	Loss 2.5629 (2.5193)	Entropy 0.60531 (0.60649)	Top-1 acc 63.672 (63.250)	Top-5 acc 82.422 (83.518)	lr 0.00821
Train [74][1200/3239]	Time 0.235 (0.654)	Data Time 0.001 (0.163)	Loss 2.6479 (2.5199)	Entropy 0.60554 (0.60648)	Top-1 acc 61.328 (63.236)	Top-5 acc 76.953 (83.499)	lr 0.00821
Train [74][1210/3239]	Time 10.333 (0.664)	Data Time 10.077 (0.173)	Loss 2.4970 (2.5199)	Entropy 0.60596 (0.60647)	Top-1 acc 62.500 (63.236)	Top-5 acc 84.375 (83.499)	lr 0.00821
Train [74][1220/3239]	Time 0.356 (0.701)	Data Time 0.004 (0.171)	Loss 2.5289 (2.5202)	Entropy 0.60585 (0.60647)	Top-1 acc 63.672 (63.224)	Top-5 acc 80.859 (83.496)	lr 0.00821
Train [74][1230/3239]	Time 0.241 (0.698)	Data Time 0.002 (0.170)	Loss 2.3907 (2.5202)	Entropy 0.60567 (0.60646)	Top-1 acc 69.531 (63.224)	Top-5 acc 87.500 (83.499)	lr 0.00821
Train [74][1240/3239]	Time 0.349 (0.696)	Data Time 0.002 (0.169)	Loss 2.4909 (2.5200)	Entropy 0.60558 (0.60645)	Top-1 acc 63.672 (63.221)	Top-5 acc 82.812 (83.494)	lr 0.00821
Train [74][1250/3239]	Time 0.257 (0.694)	Data Time 0.001 (0.167)	Loss 2.5239 (2.5201)	Entropy 0.60594 (0.60645)	Top-1 acc 62.109 (63.223)	Top-5 acc 83.984 (83.495)	lr 0.00821
Train [74][1260/3239]	Time 0.255 (0.692)	Data Time 0.001 (0.166)	Loss 2.5198 (2.5205)	Entropy 0.60619 (0.60644)	Top-1 acc 63.281 (63.217)	Top-5 acc 83.203 (83.488)	lr 0.00821
Train [74][1270/3239]	Time 0.245 (0.690)	Data Time 0.002 (0.165)	Loss 2.6205 (2.5205)	Entropy 0.60589 (0.60644)	Top-1 acc 57.812 (63.221)	Top-5 acc 79.297 (83.485)	lr 0.00821
Train [74][1280/3239]	Time 0.293 (0.688)	Data Time 0.002 (0.163)	Loss 2.4737 (2.5206)	Entropy 0.60510 (0.60643)	Top-1 acc 63.281 (63.221)	Top-5 acc 83.984 (83.479)	lr 0.00821
Train [74][1290/3239]	Time 0.292 (0.688)	Data Time 0.002 (0.164)	Loss 2.4451 (2.5206)	Entropy 0.60503 (0.60642)	Top-1 acc 64.062 (63.223)	Top-5 acc 83.203 (83.481)	lr 0.00820
Train [74][1300/3239]	Time 0.245 (0.686)	Data Time 0.001 (0.163)	Loss 2.6109 (2.5203)	Entropy 0.60515 (0.60641)	Top-1 acc 64.062 (63.231)	Top-5 acc 79.688 (83.490)	lr 0.00820
Train [74][1310/3239]	Time 0.251 (0.685)	Data Time 0.001 (0.162)	Loss 2.4258 (2.5199)	Entropy 0.60516 (0.60640)	Top-1 acc 66.016 (63.237)	Top-5 acc 85.156 (83.494)	lr 0.00820
Train [74][1320/3239]	Time 0.230 (0.693)	Data Time 0.001 (0.171)	Loss 2.5882 (2.5202)	Entropy 0.60454 (0.60639)	Top-1 acc 62.109 (63.235)	Top-5 acc 83.203 (83.485)	lr 0.00820
Train [74][1330/3239]	Time 0.270 (0.693)	Data Time 0.002 (0.171)	Loss 2.5071 (2.5206)	Entropy 0.60478 (0.60638)	Top-1 acc 63.281 (63.227)	Top-5 acc 81.641 (83.476)	lr 0.00820
Train [74][1340/3239]	Time 0.237 (0.691)	Data Time 0.001 (0.170)	Loss 2.4651 (2.5208)	Entropy 0.60484 (0.60637)	Top-1 acc 65.625 (63.224)	Top-5 acc 86.328 (83.473)	lr 0.00820
Train [74][1350/3239]	Time 0.242 (0.699)	Data Time 0.001 (0.178)	Loss 2.5072 (2.5206)	Entropy 0.60478 (0.60636)	Top-1 acc 62.109 (63.232)	Top-5 acc 84.766 (83.475)	lr 0.00820
Train [74][1360/3239]	Time 0.259 (0.698)	Data Time 0.002 (0.178)	Loss 2.6923 (2.5204)	Entropy 0.60487 (0.60634)	Top-1 acc 56.641 (63.230)	Top-5 acc 78.906 (83.475)	lr 0.00820
Train [74][1370/3239]	Time 0.238 (0.696)	Data Time 0.001 (0.176)	Loss 2.3811 (2.5206)	Entropy 0.60495 (0.60633)	Top-1 acc 66.406 (63.220)	Top-5 acc 86.719 (83.478)	lr 0.00820
Train [74][1380/3239]	Time 4.167 (0.702)	Data Time 3.913 (0.183)	Loss 2.5962 (2.5204)	Entropy 0.60546 (0.60633)	Top-1 acc 64.844 (63.229)	Top-5 acc 82.812 (83.481)	lr 0.00820
Train [74][1390/3239]	Time 0.233 (0.703)	Data Time 0.001 (0.185)	Loss 2.4987 (2.5212)	Entropy 0.60528 (0.60632)	Top-1 acc 64.844 (63.211)	Top-5 acc 82.812 (83.469)	lr 0.00820
Train [74][1400/3239]	Time 0.347 (0.701)	Data Time 0.001 (0.184)	Loss 2.8515 (2.5219)	Entropy 0.60523 (0.60631)	Top-1 acc 53.906 (63.196)	Top-5 acc 76.953 (83.458)	lr 0.00819
Train [74][1410/3239]	Time 0.239 (0.705)	Data Time 0.001 (0.188)	Loss 2.5721 (2.5222)	Entropy 0.60535 (0.60630)	Top-1 acc 63.672 (63.192)	Top-5 acc 83.594 (83.456)	lr 0.00819
Train [74][1420/3239]	Time 0.290 (0.710)	Data Time 0.001 (0.194)	Loss 2.4377 (2.5216)	Entropy 0.60490 (0.60630)	Top-1 acc 66.406 (63.209)	Top-5 acc 87.109 (83.474)	lr 0.00819
Train [74][1430/3239]	Time 0.236 (0.709)	Data Time 0.001 (0.193)	Loss 2.7078 (2.5216)	Entropy 0.60493 (0.60629)	Top-1 acc 60.156 (63.221)	Top-5 acc 80.469 (83.466)	lr 0.00819
Train [74][1440/3239]	Time 0.266 (0.710)	Data Time 0.001 (0.195)	Loss 2.4860 (2.5219)	Entropy 0.60483 (0.60628)	Top-1 acc 64.453 (63.219)	Top-5 acc 82.812 (83.462)	lr 0.00819
Train [74][1450/3239]	Time 0.249 (0.716)	Data Time 0.001 (0.201)	Loss 2.5184 (2.5219)	Entropy 0.60459 (0.60626)	Top-1 acc 67.578 (63.218)	Top-5 acc 83.203 (83.467)	lr 0.00819
Train [74][1460/3239]	Time 0.283 (0.714)	Data Time 0.002 (0.200)	Loss 2.5374 (2.5222)	Entropy 0.60498 (0.60625)	Top-1 acc 63.672 (63.205)	Top-5 acc 83.203 (83.460)	lr 0.00819
Train [74][1470/3239]	Time 0.336 (0.712)	Data Time 0.001 (0.198)	Loss 2.6707 (2.5227)	Entropy 0.60487 (0.60624)	Top-1 acc 60.156 (63.198)	Top-5 acc 81.641 (83.448)	lr 0.00819
Train [74][1480/3239]	Time 0.282 (0.720)	Data Time 0.001 (0.208)	Loss 2.5965 (2.5226)	Entropy 0.60522 (0.60624)	Top-1 acc 63.672 (63.203)	Top-5 acc 80.078 (83.444)	lr 0.00819
Train [74][1490/3239]	Time 0.252 (0.718)	Data Time 0.001 (0.206)	Loss 2.4138 (2.5227)	Entropy 0.60537 (0.60623)	Top-1 acc 64.844 (63.196)	Top-5 acc 85.156 (83.444)	lr 0.00819
Train [74][1500/3239]	Time 0.252 (0.716)	Data Time 0.001 (0.205)	Loss 2.4398 (2.5230)	Entropy 0.60513 (0.60622)	Top-1 acc 63.672 (63.186)	Top-5 acc 83.984 (83.443)	lr 0.00818
Train [74][1510/3239]	Time 0.277 (0.729)	Data Time 0.002 (0.218)	Loss 2.5760 (2.5228)	Entropy 0.60531 (0.60622)	Top-1 acc 67.188 (63.190)	Top-5 acc 81.641 (83.448)	lr 0.00818
Train [74][1520/3239]	Time 0.242 (0.727)	Data Time 0.002 (0.216)	Loss 2.5370 (2.5230)	Entropy 0.60538 (0.60621)	Top-1 acc 63.281 (63.188)	Top-5 acc 87.109 (83.448)	lr 0.00818
Train [74][1530/3239]	Time 0.253 (0.725)	Data Time 0.001 (0.215)	Loss 2.3178 (2.5234)	Entropy 0.60529 (0.60621)	Top-1 acc 67.188 (63.174)	Top-5 acc 88.281 (83.443)	lr 0.00818
Train [74][1540/3239]	Time 12.843 (0.734)	Data Time 12.607 (0.224)	Loss 2.6326 (2.5231)	Entropy 0.60553 (0.60620)	Top-1 acc 58.594 (63.171)	Top-5 acc 83.203 (83.450)	lr 0.00818
Train [74][1550/3239]	Time 0.250 (0.732)	Data Time 0.001 (0.223)	Loss 2.3855 (2.5235)	Entropy 0.60545 (0.60620)	Top-1 acc 67.578 (63.169)	Top-5 acc 84.766 (83.439)	lr 0.00818
Train [74][1560/3239]	Time 0.346 (0.730)	Data Time 0.001 (0.221)	Loss 2.5296 (2.5235)	Entropy 0.60555 (0.60619)	Top-1 acc 65.234 (63.169)	Top-5 acc 80.859 (83.433)	lr 0.00818
Train [74][1570/3239]	Time 4.899 (0.732)	Data Time 4.648 (0.224)	Loss 2.5766 (2.5236)	Entropy 0.60552 (0.60619)	Top-1 acc 61.719 (63.169)	Top-5 acc 82.812 (83.432)	lr 0.00818
Train [74][1580/3239]	Time 0.281 (0.740)	Data Time 0.002 (0.232)	Loss 2.2712 (2.5234)	Entropy 0.60575 (0.60618)	Top-1 acc 70.312 (63.171)	Top-5 acc 87.500 (83.435)	lr 0.00818
Train [74][1590/3239]	Time 0.241 (0.738)	Data Time 0.001 (0.231)	Loss 2.6871 (2.5237)	Entropy 0.60518 (0.60618)	Top-1 acc 58.594 (63.159)	Top-5 acc 78.516 (83.432)	lr 0.00818
Train [74][1600/3239]	Time 0.236 (0.737)	Data Time 0.001 (0.230)	Loss 2.6020 (2.5240)	Entropy 0.60495 (0.60617)	Top-1 acc 62.500 (63.150)	Top-5 acc 80.469 (83.426)	lr 0.00818
Train [74][1610/3239]	Time 0.248 (0.747)	Data Time 0.001 (0.241)	Loss 2.4163 (2.5240)	Entropy 0.60488 (0.60617)	Top-1 acc 64.062 (63.157)	Top-5 acc 85.156 (83.424)	lr 0.00817
Train [74][1620/3239]	Time 0.230 (0.745)	Data Time 0.001 (0.239)	Loss 2.4780 (2.5240)	Entropy 0.60483 (0.60616)	Top-1 acc 62.891 (63.154)	Top-5 acc 82.812 (83.420)	lr 0.00817
Train [74][1630/3239]	Time 0.331 (0.743)	Data Time 0.001 (0.238)	Loss 2.5830 (2.5237)	Entropy 0.60471 (0.60615)	Top-1 acc 59.375 (63.160)	Top-5 acc 83.594 (83.429)	lr 0.00817
Train [74][1640/3239]	Time 0.229 (0.755)	Data Time 0.001 (0.251)	Loss 2.5756 (2.5243)	Entropy 0.60483 (0.60614)	Top-1 acc 61.328 (63.142)	Top-5 acc 82.422 (83.422)	lr 0.00817
Train [74][1650/3239]	Time 0.235 (0.753)	Data Time 0.001 (0.249)	Loss 2.6179 (2.5243)	Entropy 0.60482 (0.60613)	Top-1 acc 58.984 (63.137)	Top-5 acc 82.422 (83.425)	lr 0.00817
Train [74][1660/3239]	Time 0.244 (0.751)	Data Time 0.001 (0.248)	Loss 2.7021 (2.5244)	Entropy 0.60489 (0.60612)	Top-1 acc 59.375 (63.137)	Top-5 acc 80.078 (83.423)	lr 0.00817
Train [74][1670/3239]	Time 0.232 (0.762)	Data Time 0.002 (0.259)	Loss 2.7879 (2.5246)	Entropy 0.60460 (0.60612)	Top-1 acc 57.422 (63.130)	Top-5 acc 78.906 (83.420)	lr 0.00817
Train [74][1680/3239]	Time 0.254 (0.760)	Data Time 0.001 (0.257)	Loss 2.5449 (2.5248)	Entropy 0.60460 (0.60611)	Top-1 acc 64.062 (63.129)	Top-5 acc 83.984 (83.416)	lr 0.00817
Train [74][1690/3239]	Time 0.245 (0.758)	Data Time 0.001 (0.256)	Loss 2.6510 (2.5249)	Entropy 0.60442 (0.60610)	Top-1 acc 59.766 (63.126)	Top-5 acc 83.594 (83.412)	lr 0.00817
Train [74][1700/3239]	Time 21.272 (0.769)	Data Time 21.003 (0.267)	Loss 2.6029 (2.5249)	Entropy 0.60445 (0.60609)	Top-1 acc 59.375 (63.125)	Top-5 acc 82.422 (83.415)	lr 0.00817
Train [74][1710/3239]	Time 0.223 (0.767)	Data Time 0.001 (0.266)	Loss 2.4318 (2.5244)	Entropy 0.60460 (0.60608)	Top-1 acc 65.625 (63.138)	Top-5 acc 84.766 (83.422)	lr 0.00817
Train [74][1720/3239]	Time 0.360 (0.765)	Data Time 0.001 (0.264)	Loss 2.6107 (2.5243)	Entropy 0.60501 (0.60607)	Top-1 acc 60.156 (63.141)	Top-5 acc 84.766 (83.426)	lr 0.00816
Train [74][1730/3239]	Time 0.279 (0.767)	Data Time 0.001 (0.267)	Loss 2.5252 (2.5246)	Entropy 0.60496 (0.60606)	Top-1 acc 62.500 (63.135)	Top-5 acc 86.328 (83.420)	lr 0.00816
Train [74][1740/3239]	Time 0.255 (0.774)	Data Time 0.001 (0.274)	Loss 2.4711 (2.5245)	Entropy 0.60490 (0.60606)	Top-1 acc 63.672 (63.139)	Top-5 acc 84.766 (83.422)	lr 0.00816
Train [74][1750/3239]	Time 0.251 (0.772)	Data Time 0.001 (0.273)	Loss 2.5367 (2.5248)	Entropy 0.60490 (0.60605)	Top-1 acc 60.938 (63.128)	Top-5 acc 80.859 (83.412)	lr 0.00816
Train [74][1760/3239]	Time 0.242 (0.775)	Data Time 0.001 (0.276)	Loss 2.4590 (2.5247)	Entropy 0.60443 (0.60604)	Top-1 acc 61.328 (63.125)	Top-5 acc 83.203 (83.411)	lr 0.00816
Train [74][1770/3239]	Time 0.253 (0.781)	Data Time 0.001 (0.283)	Loss 2.5270 (2.5249)	Entropy 0.60436 (0.60603)	Top-1 acc 64.453 (63.120)	Top-5 acc 84.375 (83.410)	lr 0.00816
Train [74][1780/3239]	Time 0.229 (0.779)	Data Time 0.001 (0.281)	Loss 2.4576 (2.5252)	Entropy 0.60467 (0.60603)	Top-1 acc 67.969 (63.115)	Top-5 acc 83.594 (83.406)	lr 0.00816
Train [74][1790/3239]	Time 0.380 (0.777)	Data Time 0.002 (0.280)	Loss 2.5044 (2.5254)	Entropy 0.60456 (0.60602)	Top-1 acc 64.453 (63.114)	Top-5 acc 83.203 (83.400)	lr 0.00816
Train [74][1800/3239]	Time 0.238 (0.788)	Data Time 0.001 (0.291)	Loss 2.6142 (2.5257)	Entropy 0.60478 (0.60601)	Top-1 acc 63.672 (63.104)	Top-5 acc 80.859 (83.390)	lr 0.00816
Train [74][1810/3239]	Time 0.226 (0.786)	Data Time 0.001 (0.289)	Loss 2.5029 (2.5257)	Entropy 0.60504 (0.60600)	Top-1 acc 67.578 (63.108)	Top-5 acc 83.203 (83.393)	lr 0.00816
Train [74][1820/3239]	Time 0.235 (0.784)	Data Time 0.001 (0.288)	Loss 2.5716 (2.5255)	Entropy 0.60509 (0.60600)	Top-1 acc 62.500 (63.107)	Top-5 acc 80.859 (83.395)	lr 0.00815
Train [74][1830/3239]	Time 0.244 (0.794)	Data Time 0.001 (0.298)	Loss 2.7772 (2.5256)	Entropy 0.60510 (0.60599)	Top-1 acc 54.688 (63.108)	Top-5 acc 78.516 (83.391)	lr 0.00815
Train [74][1840/3239]	Time 0.250 (0.793)	Data Time 0.001 (0.297)	Loss 2.4081 (2.5254)	Entropy 0.60532 (0.60599)	Top-1 acc 66.797 (63.118)	Top-5 acc 82.031 (83.391)	lr 0.00815
Train [74][1850/3239]	Time 0.248 (0.791)	Data Time 0.001 (0.296)	Loss 2.6096 (2.5258)	Entropy 0.60541 (0.60599)	Top-1 acc 62.891 (63.116)	Top-5 acc 82.422 (83.382)	lr 0.00815
Train [74][1860/3239]	Time 10.114 (0.800)	Data Time 9.860 (0.305)	Loss 2.3988 (2.5259)	Entropy 0.60521 (0.60598)	Top-1 acc 67.578 (63.110)	Top-5 acc 85.938 (83.378)	lr 0.00815
Train [74][1870/3239]	Time 0.350 (0.827)	Data Time 0.005 (0.306)	Loss 2.6035 (2.5259)	Entropy 0.60515 (0.60598)	Top-1 acc 56.641 (63.110)	Top-5 acc 83.203 (83.380)	lr 0.00815
Train [74][1880/3239]	Time 0.350 (0.826)	Data Time 0.002 (0.305)	Loss 2.5227 (2.5260)	Entropy 0.60540 (0.60597)	Top-1 acc 64.844 (63.108)	Top-5 acc 84.766 (83.379)	lr 0.00815
Train [74][1890/3239]	Time 0.244 (0.824)	Data Time 0.001 (0.303)	Loss 2.4802 (2.5260)	Entropy 0.60547 (0.60597)	Top-1 acc 64.844 (63.107)	Top-5 acc 82.031 (83.377)	lr 0.00815
Train [74][1900/3239]	Time 0.245 (0.821)	Data Time 0.001 (0.301)	Loss 2.3513 (2.5260)	Entropy 0.60546 (0.60597)	Top-1 acc 64.844 (63.107)	Top-5 acc 86.719 (83.382)	lr 0.00815
Train [74][1910/3239]	Time 0.245 (0.820)	Data Time 0.001 (0.300)	Loss 2.6891 (2.5260)	Entropy 0.60530 (0.60596)	Top-1 acc 60.156 (63.107)	Top-5 acc 81.250 (83.383)	lr 0.00815
Train [74][1920/3239]	Time 0.236 (0.817)	Data Time 0.001 (0.298)	Loss 2.5805 (2.5258)	Entropy 0.60553 (0.60596)	Top-1 acc 63.672 (63.117)	Top-5 acc 82.812 (83.383)	lr 0.00815
Train [74][1930/3239]	Time 0.255 (0.815)	Data Time 0.001 (0.297)	Loss 2.5404 (2.5260)	Entropy 0.60571 (0.60596)	Top-1 acc 61.719 (63.114)	Top-5 acc 82.422 (83.382)	lr 0.00814
Train [74][1940/3239]	Time 0.246 (0.820)	Data Time 0.001 (0.302)	Loss 2.4694 (2.5261)	Entropy 0.60586 (0.60596)	Top-1 acc 66.797 (63.109)	Top-5 acc 83.594 (83.382)	lr 0.00814
Train [74][1950/3239]	Time 0.338 (0.819)	Data Time 0.001 (0.301)	Loss 2.5628 (2.5262)	Entropy 0.60597 (0.60596)	Top-1 acc 60.156 (63.101)	Top-5 acc 83.984 (83.379)	lr 0.00814
Train [74][1960/3239]	Time 0.235 (0.818)	Data Time 0.001 (0.301)	Loss 2.4879 (2.5264)	Entropy 0.60591 (0.60596)	Top-1 acc 63.672 (63.098)	Top-5 acc 82.812 (83.376)	lr 0.00814
Train [74][1970/3239]	Time 0.254 (0.827)	Data Time 0.001 (0.310)	Loss 2.4824 (2.5266)	Entropy 0.60600 (0.60596)	Top-1 acc 61.328 (63.099)	Top-5 acc 83.984 (83.374)	lr 0.00814
Train [74][1980/3239]	Time 1.530 (0.827)	Data Time 1.243 (0.310)	Loss 2.3153 (2.5262)	Entropy 0.60641 (0.60596)	Top-1 acc 67.578 (63.105)	Top-5 acc 87.500 (83.384)	lr 0.00814
Train [74][1990/3239]	Time 0.265 (0.826)	Data Time 0.001 (0.309)	Loss 2.5061 (2.5263)	Entropy 0.60632 (0.60596)	Top-1 acc 65.234 (63.097)	Top-5 acc 84.375 (83.384)	lr 0.00814
Train [74][2000/3239]	Time 0.246 (0.833)	Data Time 0.001 (0.317)	Loss 2.4646 (2.5264)	Entropy 0.60617 (0.60596)	Top-1 acc 63.281 (63.097)	Top-5 acc 85.547 (83.382)	lr 0.00814
Train [74][2010/3239]	Time 0.246 (0.833)	Data Time 0.001 (0.318)	Loss 2.4803 (2.5264)	Entropy 0.60616 (0.60596)	Top-1 acc 64.453 (63.096)	Top-5 acc 87.109 (83.386)	lr 0.00814
Train [74][2020/3239]	Time 1.658 (0.833)	Data Time 1.374 (0.318)	Loss 2.4366 (2.5265)	Entropy 0.60639 (0.60596)	Top-1 acc 65.234 (63.093)	Top-5 acc 86.719 (83.384)	lr 0.00814
Train [74][2030/3239]	Time 18.403 (0.841)	Data Time 18.150 (0.326)	Loss 2.4790 (2.5266)	Entropy 0.60654 (0.60597)	Top-1 acc 62.891 (63.087)	Top-5 acc 83.984 (83.382)	lr 0.00813
Train [74][2040/3239]	Time 0.271 (0.841)	Data Time 0.001 (0.327)	Loss 2.5129 (2.5266)	Entropy 0.60660 (0.60597)	Top-1 acc 62.500 (63.092)	Top-5 acc 83.203 (83.382)	lr 0.00813
Train [74][2050/3239]	Time 1.216 (0.840)	Data Time 0.955 (0.326)	Loss 2.4294 (2.5265)	Entropy 0.60667 (0.60597)	Top-1 acc 69.531 (63.096)	Top-5 acc 83.203 (83.385)	lr 0.00813
Train [74][2060/3239]	Time 0.250 (0.840)	Data Time 0.001 (0.326)	Loss 2.2478 (2.5266)	Entropy 0.60663 (0.60598)	Top-1 acc 69.531 (63.090)	Top-5 acc 87.891 (83.385)	lr 0.00813
Train [74][2070/3239]	Time 0.240 (0.848)	Data Time 0.001 (0.335)	Loss 2.4068 (2.5265)	Entropy 0.60635 (0.60598)	Top-1 acc 66.406 (63.093)	Top-5 acc 86.719 (83.388)	lr 0.00813
Train [74][2080/3239]	Time 0.240 (0.847)	Data Time 0.001 (0.335)	Loss 2.4263 (2.5269)	Entropy 0.60644 (0.60598)	Top-1 acc 64.453 (63.083)	Top-5 acc 86.328 (83.382)	lr 0.00813
Train [74][2090/3239]	Time 0.233 (0.847)	Data Time 0.001 (0.335)	Loss 2.5628 (2.5271)	Entropy 0.60663 (0.60598)	Top-1 acc 61.719 (63.072)	Top-5 acc 85.156 (83.378)	lr 0.00813
Train [74][2100/3239]	Time 0.258 (0.855)	Data Time 0.001 (0.344)	Loss 2.3944 (2.5270)	Entropy 0.60655 (0.60599)	Top-1 acc 66.797 (63.075)	Top-5 acc 84.375 (83.377)	lr 0.00813
Train [74][2110/3239]	Time 0.345 (0.856)	Data Time 0.001 (0.345)	Loss 2.4295 (2.5271)	Entropy 0.60665 (0.60599)	Top-1 acc 64.062 (63.074)	Top-5 acc 86.328 (83.373)	lr 0.00813
Train [74][2120/3239]	Time 0.238 (0.856)	Data Time 0.001 (0.345)	Loss 2.4646 (2.5273)	Entropy 0.60654 (0.60599)	Top-1 acc 62.891 (63.067)	Top-5 acc 83.594 (83.372)	lr 0.00813
Train [74][2130/3239]	Time 0.242 (0.862)	Data Time 0.001 (0.352)	Loss 2.7417 (2.5275)	Entropy 0.60669 (0.60600)	Top-1 acc 60.156 (63.062)	Top-5 acc 75.391 (83.368)	lr 0.00813
Train [74][2140/3239]	Time 1.541 (0.863)	Data Time 1.262 (0.353)	Loss 2.7229 (2.5277)	Entropy 0.60688 (0.60600)	Top-1 acc 59.375 (63.059)	Top-5 acc 79.688 (83.363)	lr 0.00812
Train [74][2150/3239]	Time 0.247 (0.863)	Data Time 0.001 (0.353)	Loss 2.2535 (2.5277)	Entropy 0.60670 (0.60600)	Top-1 acc 69.141 (63.062)	Top-5 acc 87.109 (83.361)	lr 0.00812
Train [74][2160/3239]	Time 0.244 (0.870)	Data Time 0.001 (0.360)	Loss 2.5883 (2.5275)	Entropy 0.60635 (0.60601)	Top-1 acc 59.766 (63.061)	Top-5 acc 81.641 (83.369)	lr 0.00812
Train [74][2170/3239]	Time 0.237 (0.870)	Data Time 0.001 (0.361)	Loss 2.6268 (2.5276)	Entropy 0.60658 (0.60601)	Top-1 acc 64.844 (63.059)	Top-5 acc 80.469 (83.365)	lr 0.00812
Train [74][2180/3239]	Time 0.334 (0.870)	Data Time 0.001 (0.361)	Loss 2.6797 (2.5278)	Entropy 0.60661 (0.60601)	Top-1 acc 58.203 (63.059)	Top-5 acc 80.859 (83.359)	lr 0.00812
Train [74][2190/3239]	Time 18.180 (0.876)	Data Time 17.904 (0.368)	Loss 2.3660 (2.5279)	Entropy 0.60694 (0.60601)	Top-1 acc 68.359 (63.053)	Top-5 acc 83.594 (83.357)	lr 0.00812
Train [74][2200/3239]	Time 0.250 (0.878)	Data Time 0.001 (0.371)	Loss 2.4948 (2.5285)	Entropy 0.60697 (0.60602)	Top-1 acc 62.891 (63.037)	Top-5 acc 83.594 (83.347)	lr 0.00812
Train [74][2210/3239]	Time 0.222 (0.876)	Data Time 0.001 (0.369)	Loss 2.5873 (2.5287)	Entropy 0.60692 (0.60602)	Top-1 acc 63.672 (63.031)	Top-5 acc 81.250 (83.344)	lr 0.00812
Train [74][2220/3239]	Time 0.232 (0.875)	Data Time 0.001 (0.368)	Loss 2.5082 (2.5288)	Entropy 0.60679 (0.60603)	Top-1 acc 62.891 (63.031)	Top-5 acc 84.766 (83.342)	lr 0.00812
Train [74][2230/3239]	Time 0.231 (0.878)	Data Time 0.001 (0.372)	Loss 2.7368 (2.5289)	Entropy 0.60670 (0.60603)	Top-1 acc 59.375 (63.033)	Top-5 acc 76.172 (83.339)	lr 0.00812
Train [74][2240/3239]	Time 0.230 (0.879)	Data Time 0.001 (0.373)	Loss 2.4359 (2.5289)	Entropy 0.60670 (0.60603)	Top-1 acc 65.234 (63.035)	Top-5 acc 84.375 (83.340)	lr 0.00811
Train [74][2250/3239]	Time 0.258 (0.877)	Data Time 0.001 (0.371)	Loss 2.4724 (2.5291)	Entropy 0.60653 (0.60603)	Top-1 acc 63.281 (63.031)	Top-5 acc 83.984 (83.335)	lr 0.00811
Train [74][2260/3239]	Time 0.277 (0.878)	Data Time 0.003 (0.373)	Loss 2.4470 (2.5294)	Entropy 0.60674 (0.60604)	Top-1 acc 64.062 (63.026)	Top-5 acc 86.719 (83.329)	lr 0.00811
Train [74][2270/3239]	Time 0.364 (0.880)	Data Time 0.002 (0.375)	Loss 2.3390 (2.5290)	Entropy 0.60674 (0.60604)	Top-1 acc 64.062 (63.033)	Top-5 acc 88.672 (83.335)	lr 0.00811
Train [74][2280/3239]	Time 0.226 (0.878)	Data Time 0.001 (0.374)	Loss 2.7067 (2.5294)	Entropy 0.60668 (0.60604)	Top-1 acc 58.203 (63.024)	Top-5 acc 81.641 (83.331)	lr 0.00811
Train [74][2290/3239]	Time 0.251 (0.882)	Data Time 0.001 (0.378)	Loss 2.6208 (2.5295)	Entropy 0.60667 (0.60605)	Top-1 acc 64.062 (63.023)	Top-5 acc 81.641 (83.326)	lr 0.00811
Train [74][2300/3239]	Time 0.232 (0.886)	Data Time 0.001 (0.382)	Loss 2.5675 (2.5296)	Entropy 0.60666 (0.60605)	Top-1 acc 61.328 (63.018)	Top-5 acc 83.984 (83.325)	lr 0.00811
Train [74][2310/3239]	Time 0.238 (0.884)	Data Time 0.001 (0.381)	Loss 2.5680 (2.5295)	Entropy 0.60668 (0.60605)	Top-1 acc 60.938 (63.020)	Top-5 acc 83.594 (83.326)	lr 0.00811
Train [74][2320/3239]	Time 0.235 (0.890)	Data Time 0.001 (0.387)	Loss 2.5345 (2.5298)	Entropy 0.60640 (0.60605)	Top-1 acc 65.234 (63.021)	Top-5 acc 83.594 (83.320)	lr 0.00811
Train [74][2330/3239]	Time 0.236 (0.892)	Data Time 0.001 (0.389)	Loss 2.9837 (2.5300)	Entropy 0.60660 (0.60605)	Top-1 acc 54.688 (63.022)	Top-5 acc 74.609 (83.317)	lr 0.00811
Train [74][2340/3239]	Time 0.384 (0.890)	Data Time 0.002 (0.388)	Loss 2.3671 (2.5300)	Entropy 0.60642 (0.60606)	Top-1 acc 63.281 (63.022)	Top-5 acc 86.328 (83.313)	lr 0.00811
Train [74][2350/3239]	Time 16.107 (0.895)	Data Time 15.857 (0.393)	Loss 2.5741 (2.5301)	Entropy 0.60650 (0.60606)	Top-1 acc 59.375 (63.021)	Top-5 acc 82.031 (83.312)	lr 0.00810
Train [74][2360/3239]	Time 0.253 (0.898)	Data Time 0.001 (0.396)	Loss 2.4766 (2.5301)	Entropy 0.60597 (0.60606)	Top-1 acc 64.844 (63.021)	Top-5 acc 83.203 (83.314)	lr 0.00810
Train [74][2370/3239]	Time 0.237 (0.896)	Data Time 0.001 (0.394)	Loss 2.5522 (2.5303)	Entropy 0.60592 (0.60606)	Top-1 acc 64.844 (63.016)	Top-5 acc 81.641 (83.308)	lr 0.00810
Train [74][2380/3239]	Time 0.232 (0.894)	Data Time 0.001 (0.392)	Loss 2.4466 (2.5301)	Entropy 0.60584 (0.60606)	Top-1 acc 66.406 (63.022)	Top-5 acc 84.375 (83.311)	lr 0.00810
Train [74][2390/3239]	Time 0.252 (0.901)	Data Time 0.001 (0.400)	Loss 2.5070 (2.5302)	Entropy 0.60612 (0.60606)	Top-1 acc 63.672 (63.022)	Top-5 acc 85.547 (83.312)	lr 0.00810
Train [74][2400/3239]	Time 0.232 (0.902)	Data Time 0.001 (0.401)	Loss 2.4743 (2.5302)	Entropy 0.60631 (0.60606)	Top-1 acc 63.672 (63.023)	Top-5 acc 85.156 (83.309)	lr 0.00810
Train [74][2410/3239]	Time 0.237 (0.900)	Data Time 0.001 (0.400)	Loss 2.5779 (2.5304)	Entropy 0.60662 (0.60606)	Top-1 acc 62.891 (63.017)	Top-5 acc 83.203 (83.306)	lr 0.00810
Train [74][2420/3239]	Time 0.283 (0.901)	Data Time 0.001 (0.402)	Loss 2.5271 (2.5301)	Entropy 0.60643 (0.60606)	Top-1 acc 58.594 (63.023)	Top-5 acc 85.938 (83.312)	lr 0.00810
Train [74][2430/3239]	Time 0.242 (0.901)	Data Time 0.001 (0.402)	Loss 2.7558 (2.5301)	Entropy 0.60565 (0.60606)	Top-1 acc 55.859 (63.019)	Top-5 acc 80.078 (83.313)	lr 0.00810
Train [74][2440/3239]	Time 0.242 (0.899)	Data Time 0.001 (0.400)	Loss 2.5468 (2.5302)	Entropy 0.60560 (0.60606)	Top-1 acc 65.234 (63.017)	Top-5 acc 84.375 (83.311)	lr 0.00810
Train [74][2450/3239]	Time 0.237 (0.903)	Data Time 0.001 (0.404)	Loss 2.5900 (2.5304)	Entropy 0.60573 (0.60606)	Top-1 acc 64.453 (63.014)	Top-5 acc 83.594 (83.311)	lr 0.00809
Train [74][2460/3239]	Time 0.254 (0.902)	Data Time 0.001 (0.404)	Loss 2.4845 (2.5303)	Entropy 0.60556 (0.60606)	Top-1 acc 62.109 (63.012)	Top-5 acc 82.422 (83.311)	lr 0.00809
Train [74][2470/3239]	Time 0.241 (0.900)	Data Time 0.001 (0.403)	Loss 2.6368 (2.5308)	Entropy 0.60543 (0.60605)	Top-1 acc 64.062 (63.001)	Top-5 acc 82.422 (83.305)	lr 0.00809
Train [74][2480/3239]	Time 0.273 (0.904)	Data Time 0.001 (0.407)	Loss 2.5371 (2.5307)	Entropy 0.60525 (0.60605)	Top-1 acc 67.188 (63.002)	Top-5 acc 84.375 (83.306)	lr 0.00809
Train [74][2490/3239]	Time 0.214 (0.904)	Data Time 0.001 (0.406)	Loss 2.7614 (2.5308)	Entropy 0.60534 (0.60605)	Top-1 acc 55.859 (63.001)	Top-5 acc 82.812 (83.304)	lr 0.00809
Train [74][2500/3239]	Time 0.354 (0.902)	Data Time 0.001 (0.405)	Loss 2.5874 (2.5306)	Entropy 0.60548 (0.60605)	Top-1 acc 60.938 (63.001)	Top-5 acc 81.250 (83.308)	lr 0.00809
Train [74][2510/3239]	Time 12.484 (0.905)	Data Time 12.232 (0.408)	Loss 2.6030 (2.5308)	Entropy 0.60540 (0.60604)	Top-1 acc 61.719 (62.997)	Top-5 acc 81.250 (83.306)	lr 0.00809
Train [74][2520/3239]	Time 0.226 (0.903)	Data Time 0.001 (0.406)	Loss 2.5309 (2.5309)	Entropy 0.60548 (0.60604)	Top-1 acc 66.406 (62.993)	Top-5 acc 83.203 (83.306)	lr 0.00809
Train [74][2530/3239]	Time 0.266 (0.923)	Data Time 0.002 (0.405)	Loss 2.4879 (2.5307)	Entropy 0.60589 (0.60604)	Top-1 acc 65.625 (62.996)	Top-5 acc 82.812 (83.309)	lr 0.00809
Train [74][2540/3239]	Time 0.226 (0.921)	Data Time 0.001 (0.404)	Loss 2.6163 (2.5306)	Entropy 0.60604 (0.60604)	Top-1 acc 60.156 (62.999)	Top-5 acc 82.031 (83.310)	lr 0.00809
Train [74][2550/3239]	Time 0.260 (0.919)	Data Time 0.002 (0.402)	Loss 2.4810 (2.5305)	Entropy 0.60609 (0.60604)	Top-1 acc 65.234 (63.004)	Top-5 acc 81.641 (83.311)	lr 0.00809
Train [74][2560/3239]	Time 0.248 (0.917)	Data Time 0.001 (0.401)	Loss 2.4922 (2.5304)	Entropy 0.60598 (0.60604)	Top-1 acc 65.625 (63.003)	Top-5 acc 83.984 (83.313)	lr 0.00808
Train [74][2570/3239]	Time 0.241 (0.915)	Data Time 0.001 (0.399)	Loss 2.6531 (2.5305)	Entropy 0.60604 (0.60604)	Top-1 acc 57.422 (62.995)	Top-5 acc 81.641 (83.309)	lr 0.00808
Train [74][2580/3239]	Time 0.247 (0.913)	Data Time 0.001 (0.398)	Loss 2.4920 (2.5304)	Entropy 0.60579 (0.60604)	Top-1 acc 64.453 (62.997)	Top-5 acc 80.859 (83.309)	lr 0.00808
Train [74][2590/3239]	Time 0.359 (0.914)	Data Time 0.001 (0.399)	Loss 2.6486 (2.5306)	Entropy 0.60599 (0.60604)	Top-1 acc 59.375 (62.990)	Top-5 acc 82.812 (83.308)	lr 0.00808
Train [74][2600/3239]	Time 0.242 (0.915)	Data Time 0.001 (0.399)	Loss 2.6164 (2.5306)	Entropy 0.60639 (0.60604)	Top-1 acc 61.328 (62.986)	Top-5 acc 81.641 (83.306)	lr 0.00808
Train [74][2610/3239]	Time 0.251 (0.913)	Data Time 0.001 (0.399)	Loss 2.5848 (2.5308)	Entropy 0.60644 (0.60604)	Top-1 acc 60.156 (62.979)	Top-5 acc 83.203 (83.305)	lr 0.00808
Train [74][2620/3239]	Time 1.934 (0.912)	Data Time 1.671 (0.398)	Loss 2.5638 (2.5305)	Entropy 0.60636 (0.60604)	Top-1 acc 62.891 (62.987)	Top-5 acc 82.422 (83.310)	lr 0.00808
Train [74][2630/3239]	Time 0.239 (0.919)	Data Time 0.001 (0.404)	Loss 2.6152 (2.5306)	Entropy 0.60636 (0.60604)	Top-1 acc 60.938 (62.985)	Top-5 acc 81.641 (83.307)	lr 0.00808
Train [74][2640/3239]	Time 0.231 (0.917)	Data Time 0.001 (0.403)	Loss 2.5863 (2.5307)	Entropy 0.60636 (0.60604)	Top-1 acc 63.672 (62.988)	Top-5 acc 83.984 (83.305)	lr 0.00808
Train [74][2650/3239]	Time 0.239 (0.916)	Data Time 0.001 (0.402)	Loss 2.5537 (2.5306)	Entropy 0.60626 (0.60605)	Top-1 acc 62.500 (62.993)	Top-5 acc 82.422 (83.307)	lr 0.00808
Train [74][2660/3239]	Time 0.472 (0.923)	Data Time 0.001 (0.410)	Loss 2.5578 (2.5307)	Entropy 0.60597 (0.60605)	Top-1 acc 60.547 (62.991)	Top-5 acc 85.547 (83.305)	lr 0.00808
Train [74][2670/3239]	Time 0.245 (0.922)	Data Time 0.001 (0.408)	Loss 2.5501 (2.5308)	Entropy 0.60569 (0.60605)	Top-1 acc 59.766 (62.981)	Top-5 acc 83.203 (83.306)	lr 0.00807
Train [74][2680/3239]	Time 0.243 (0.921)	Data Time 0.001 (0.407)	Loss 2.8287 (2.5310)	Entropy 0.60563 (0.60604)	Top-1 acc 56.641 (62.978)	Top-5 acc 76.953 (83.302)	lr 0.00807
Train [74][2690/3239]	Time 1.149 (0.927)	Data Time 0.897 (0.414)	Loss 2.6380 (2.5310)	Entropy 0.60561 (0.60604)	Top-1 acc 58.203 (62.977)	Top-5 acc 84.375 (83.301)	lr 0.00807
Train [74][2700/3239]	Time 7.461 (0.928)	Data Time 7.193 (0.415)	Loss 2.4423 (2.5310)	Entropy 0.60563 (0.60604)	Top-1 acc 62.500 (62.976)	Top-5 acc 85.938 (83.299)	lr 0.00807
Train [74][2710/3239]	Time 0.245 (0.926)	Data Time 0.001 (0.414)	Loss 2.5489 (2.5313)	Entropy 0.60571 (0.60604)	Top-1 acc 61.328 (62.970)	Top-5 acc 82.812 (83.294)	lr 0.00807
Train [74][2720/3239]	Time 0.246 (0.930)	Data Time 0.001 (0.418)	Loss 2.5210 (2.5314)	Entropy 0.60565 (0.60604)	Top-1 acc 62.500 (62.964)	Top-5 acc 82.031 (83.291)	lr 0.00807
Train [74][2730/3239]	Time 0.260 (0.931)	Data Time 0.001 (0.419)	Loss 2.6021 (2.5313)	Entropy 0.60578 (0.60604)	Top-1 acc 60.547 (62.966)	Top-5 acc 81.641 (83.293)	lr 0.00807
Train [74][2740/3239]	Time 0.242 (0.930)	Data Time 0.001 (0.418)	Loss 2.4591 (2.5314)	Entropy 0.60567 (0.60604)	Top-1 acc 65.625 (62.962)	Top-5 acc 85.938 (83.293)	lr 0.00807
Train [74][2750/3239]	Time 0.278 (0.931)	Data Time 0.001 (0.420)	Loss 2.6643 (2.5314)	Entropy 0.60587 (0.60604)	Top-1 acc 56.641 (62.959)	Top-5 acc 81.641 (83.295)	lr 0.00807
Train [74][2760/3239]	Time 0.274 (0.934)	Data Time 0.002 (0.423)	Loss 2.1497 (2.5311)	Entropy 0.60620 (0.60604)	Top-1 acc 71.094 (62.962)	Top-5 acc 91.016 (83.300)	lr 0.00807
Train [74][2770/3239]	Time 0.245 (0.934)	Data Time 0.001 (0.423)	Loss 2.5400 (2.5310)	Entropy 0.60620 (0.60604)	Top-1 acc 64.844 (62.968)	Top-5 acc 83.594 (83.303)	lr 0.00806
Train [74][2780/3239]	Time 5.191 (0.934)	Data Time 4.920 (0.423)	Loss 2.6694 (2.5310)	Entropy 0.60640 (0.60604)	Top-1 acc 60.938 (62.969)	Top-5 acc 80.469 (83.303)	lr 0.00806
Train [74][2790/3239]	Time 0.282 (0.940)	Data Time 0.002 (0.430)	Loss 2.4271 (2.5310)	Entropy 0.60602 (0.60604)	Top-1 acc 66.406 (62.969)	Top-5 acc 87.891 (83.304)	lr 0.00806
Train [74][2800/3239]	Time 0.259 (0.938)	Data Time 0.001 (0.428)	Loss 2.3580 (2.5306)	Entropy 0.60614 (0.60604)	Top-1 acc 69.531 (62.980)	Top-5 acc 85.547 (83.309)	lr 0.00806
Train [74][2810/3239]	Time 0.258 (0.937)	Data Time 0.002 (0.427)	Loss 2.5713 (2.5306)	Entropy 0.60583 (0.60604)	Top-1 acc 61.719 (62.983)	Top-5 acc 82.422 (83.311)	lr 0.00806
Train [74][2820/3239]	Time 0.360 (0.945)	Data Time 0.001 (0.435)	Loss 2.4950 (2.5306)	Entropy 0.60592 (0.60604)	Top-1 acc 64.453 (62.980)	Top-5 acc 82.031 (83.308)	lr 0.00806
Train [74][2830/3239]	Time 0.249 (0.943)	Data Time 0.001 (0.433)	Loss 2.4823 (2.5306)	Entropy 0.60567 (0.60604)	Top-1 acc 64.844 (62.975)	Top-5 acc 85.547 (83.308)	lr 0.00806
Train [74][2840/3239]	Time 0.239 (0.941)	Data Time 0.001 (0.432)	Loss 2.4687 (2.5307)	Entropy 0.60590 (0.60604)	Top-1 acc 62.500 (62.973)	Top-5 acc 83.203 (83.306)	lr 0.00806
Train [74][2850/3239]	Time 9.278 (0.949)	Data Time 9.034 (0.440)	Loss 2.6319 (2.5307)	Entropy 0.60592 (0.60603)	Top-1 acc 61.328 (62.971)	Top-5 acc 83.594 (83.308)	lr 0.00806
Train [74][2860/3239]	Time 0.255 (0.947)	Data Time 0.001 (0.438)	Loss 2.5571 (2.5308)	Entropy 0.60628 (0.60604)	Top-1 acc 60.547 (62.971)	Top-5 acc 82.031 (83.303)	lr 0.00806
Train [74][2870/3239]	Time 0.252 (0.945)	Data Time 0.001 (0.437)	Loss 2.5390 (2.5312)	Entropy 0.60627 (0.60604)	Top-1 acc 66.016 (62.963)	Top-5 acc 83.594 (83.296)	lr 0.00806
Train [74][2880/3239]	Time 0.262 (0.949)	Data Time 0.001 (0.441)	Loss 2.5863 (2.5310)	Entropy 0.60593 (0.60604)	Top-1 acc 59.375 (62.966)	Top-5 acc 82.031 (83.298)	lr 0.00805
Train [74][2890/3239]	Time 0.350 (0.950)	Data Time 0.001 (0.443)	Loss 2.7418 (2.5308)	Entropy 0.60616 (0.60604)	Top-1 acc 53.125 (62.970)	Top-5 acc 80.078 (83.303)	lr 0.00805
Train [74][2900/3239]	Time 0.244 (0.949)	Data Time 0.001 (0.441)	Loss 2.4688 (2.5308)	Entropy 0.60591 (0.60604)	Top-1 acc 65.234 (62.968)	Top-5 acc 83.203 (83.302)	lr 0.00805
Train [74][2910/3239]	Time 3.894 (0.950)	Data Time 3.629 (0.442)	Loss 2.5092 (2.5307)	Entropy 0.60622 (0.60604)	Top-1 acc 66.797 (62.969)	Top-5 acc 83.203 (83.303)	lr 0.00805
Train [74][2920/3239]	Time 0.253 (0.953)	Data Time 0.001 (0.446)	Loss 2.5609 (2.5309)	Entropy 0.60606 (0.60604)	Top-1 acc 63.672 (62.962)	Top-5 acc 82.422 (83.301)	lr 0.00805
Train [74][2930/3239]	Time 0.238 (0.951)	Data Time 0.001 (0.445)	Loss 2.4797 (2.5310)	Entropy 0.60610 (0.60604)	Top-1 acc 64.844 (62.958)	Top-5 acc 83.984 (83.299)	lr 0.00805
Train [74][2940/3239]	Time 0.227 (0.950)	Data Time 0.001 (0.443)	Loss 2.6201 (2.5310)	Entropy 0.60628 (0.60604)	Top-1 acc 63.672 (62.961)	Top-5 acc 82.812 (83.300)	lr 0.00805
Train [74][2950/3239]	Time 0.226 (0.957)	Data Time 0.001 (0.450)	Loss 2.4553 (2.5312)	Entropy 0.60635 (0.60604)	Top-1 acc 62.891 (62.956)	Top-5 acc 85.156 (83.295)	lr 0.00805
Train [74][2960/3239]	Time 0.262 (0.955)	Data Time 0.001 (0.449)	Loss 2.4964 (2.5312)	Entropy 0.60611 (0.60604)	Top-1 acc 63.281 (62.955)	Top-5 acc 80.859 (83.293)	lr 0.00805
Train [74][2970/3239]	Time 0.240 (0.953)	Data Time 0.001 (0.447)	Loss 2.4688 (2.5310)	Entropy 0.60593 (0.60604)	Top-1 acc 59.766 (62.958)	Top-5 acc 88.281 (83.297)	lr 0.00805
Train [74][2980/3239]	Time 0.351 (0.960)	Data Time 0.001 (0.455)	Loss 2.4668 (2.5309)	Entropy 0.60618 (0.60604)	Top-1 acc 64.844 (62.959)	Top-5 acc 85.156 (83.300)	lr 0.00804
Train [74][2990/3239]	Time 0.234 (0.958)	Data Time 0.001 (0.453)	Loss 2.5442 (2.5308)	Entropy 0.60601 (0.60604)	Top-1 acc 60.156 (62.960)	Top-5 acc 83.203 (83.301)	lr 0.00804
Train [74][3000/3239]	Time 0.241 (0.957)	Data Time 0.001 (0.452)	Loss 2.3995 (2.5308)	Entropy 0.60607 (0.60604)	Top-1 acc 66.406 (62.960)	Top-5 acc 85.547 (83.304)	lr 0.00804
Train [74][3010/3239]	Time 11.018 (0.964)	Data Time 10.764 (0.460)	Loss 2.5096 (2.5308)	Entropy 0.60578 (0.60604)	Top-1 acc 61.719 (62.960)	Top-5 acc 85.938 (83.309)	lr 0.00804
Train [74][3020/3239]	Time 0.244 (0.962)	Data Time 0.001 (0.458)	Loss 2.4739 (2.5309)	Entropy 0.60590 (0.60604)	Top-1 acc 64.844 (62.959)	Top-5 acc 82.812 (83.307)	lr 0.00804
Train [74][3030/3239]	Time 0.242 (0.961)	Data Time 0.001 (0.457)	Loss 2.3848 (2.5308)	Entropy 0.60541 (0.60604)	Top-1 acc 67.969 (62.964)	Top-5 acc 85.547 (83.309)	lr 0.00804
Train [74][3040/3239]	Time 0.251 (0.964)	Data Time 0.002 (0.461)	Loss 2.5467 (2.5308)	Entropy 0.60542 (0.60604)	Top-1 acc 60.547 (62.963)	Top-5 acc 82.422 (83.307)	lr 0.00804
Train [74][3050/3239]	Time 0.331 (0.966)	Data Time 0.001 (0.462)	Loss 2.6790 (2.5309)	Entropy 0.60559 (0.60603)	Top-1 acc 62.500 (62.961)	Top-5 acc 79.297 (83.306)	lr 0.00804
Train [74][3060/3239]	Time 0.251 (0.964)	Data Time 0.001 (0.461)	Loss 2.3849 (2.5311)	Entropy 0.60575 (0.60603)	Top-1 acc 68.750 (62.958)	Top-5 acc 85.156 (83.302)	lr 0.00804
Train [74][3070/3239]	Time 6.384 (0.966)	Data Time 6.122 (0.463)	Loss 2.3496 (2.5311)	Entropy 0.60543 (0.60603)	Top-1 acc 63.281 (62.956)	Top-5 acc 87.500 (83.301)	lr 0.00804
Train [74][3080/3239]	Time 0.245 (0.968)	Data Time 0.001 (0.465)	Loss 2.4292 (2.5312)	Entropy 0.60542 (0.60603)	Top-1 acc 66.016 (62.955)	Top-5 acc 85.547 (83.298)	lr 0.00804
Train [74][3090/3239]	Time 0.258 (0.967)	Data Time 0.001 (0.464)	Loss 2.5754 (2.5312)	Entropy 0.60539 (0.60603)	Top-1 acc 62.500 (62.954)	Top-5 acc 80.078 (83.298)	lr 0.00803
Train [74][3100/3239]	Time 0.248 (0.965)	Data Time 0.001 (0.463)	Loss 2.5029 (2.5310)	Entropy 0.60531 (0.60603)	Top-1 acc 62.500 (62.959)	Top-5 acc 82.422 (83.300)	lr 0.00803
Train [74][3110/3239]	Time 0.255 (0.972)	Data Time 0.001 (0.470)	Loss 2.5740 (2.5311)	Entropy 0.60522 (0.60602)	Top-1 acc 64.453 (62.958)	Top-5 acc 83.594 (83.299)	lr 0.00803
Train [74][3120/3239]	Time 0.240 (0.970)	Data Time 0.001 (0.468)	Loss 2.7696 (2.5312)	Entropy 0.60519 (0.60602)	Top-1 acc 56.250 (62.958)	Top-5 acc 80.859 (83.296)	lr 0.00803
Train [74][3130/3239]	Time 0.251 (0.968)	Data Time 0.001 (0.467)	Loss 2.5782 (2.5312)	Entropy 0.60500 (0.60602)	Top-1 acc 63.281 (62.954)	Top-5 acc 82.031 (83.295)	lr 0.00803
Train [74][3140/3239]	Time 0.333 (0.974)	Data Time 0.001 (0.472)	Loss 2.3699 (2.5312)	Entropy 0.60501 (0.60601)	Top-1 acc 67.578 (62.955)	Top-5 acc 85.547 (83.296)	lr 0.00803
Train [74][3150/3239]	Time 0.231 (0.972)	Data Time 0.001 (0.471)	Loss 2.5730 (2.5311)	Entropy 0.60508 (0.60601)	Top-1 acc 62.109 (62.955)	Top-5 acc 85.156 (83.297)	lr 0.00803
Train [74][3160/3239]	Time 0.246 (0.971)	Data Time 0.001 (0.470)	Loss 2.6064 (2.5315)	Entropy 0.60481 (0.60601)	Top-1 acc 57.031 (62.943)	Top-5 acc 81.641 (83.289)	lr 0.00803
Train [74][3170/3239]	Time 2.733 (0.976)	Data Time 2.465 (0.475)	Loss 2.4859 (2.5314)	Entropy 0.60463 (0.60600)	Top-1 acc 64.062 (62.942)	Top-5 acc 82.812 (83.292)	lr 0.00803
Train [74][3180/3239]	Time 0.377 (0.990)	Data Time 0.000 (0.474)	Loss 2.7292 (2.5314)	Entropy 0.60478 (0.60600)	Top-1 acc 59.766 (62.944)	Top-5 acc 80.469 (83.293)	lr 0.00803
Train [74][3190/3239]	Time 0.267 (0.989)	Data Time 0.000 (0.473)	Loss 2.5455 (2.5314)	Entropy 0.60472 (0.60600)	Top-1 acc 61.719 (62.941)	Top-5 acc 85.156 (83.292)	lr 0.00803
Train [74][3200/3239]	Time 0.252 (0.987)	Data Time 0.000 (0.471)	Loss 2.5781 (2.5316)	Entropy 0.60484 (0.60599)	Top-1 acc 63.281 (62.936)	Top-5 acc 79.297 (83.287)	lr 0.00802
Train [74][3210/3239]	Time 0.408 (0.986)	Data Time 0.000 (0.470)	Loss 2.4753 (2.5314)	Entropy 0.60519 (0.60599)	Top-1 acc 65.234 (62.944)	Top-5 acc 83.203 (83.290)	lr 0.00802
Train [74][3220/3239]	Time 0.249 (0.984)	Data Time 0.000 (0.469)	Loss 2.5038 (2.5311)	Entropy 0.60517 (0.60599)	Top-1 acc 63.672 (62.948)	Top-5 acc 82.812 (83.294)	lr 0.00802
Train [74][3230/3239]	Time 0.234 (0.982)	Data Time 0.000 (0.467)	Loss 2.6937 (2.5312)	Entropy 0.60487 (0.60598)	Top-1 acc 58.203 (62.948)	Top-5 acc 81.641 (83.294)	lr 0.00802
Train [74][3239/3239]	Time 1.154 (0.981)	Data Time 0.000 (0.466)	Loss 2.4700 (2.5312)	Entropy 0.60482 (0.60598)	Top-1 acc 66.667 (62.951)	Top-5 acc 82.716 (83.294)	lr 0.00802
==========Valid [74/120]	loss 1.323	top-1 acc 69.766 (69.766)	top-5 acc 88.602	Train top-1 62.951	top-5 83.294	Entropy 0.60482	Latency-None: 0.000ms	Flops: 539.00M
Train [75][0/3239]	Time 50.305 (50.305)	Data Time 47.647 (47.647)	Loss 2.3275 (2.3275)	Entropy 0.60485 (0.60485)	Top-1 acc 68.750 (68.750)	Top-5 acc 85.547 (85.547)	lr 0.00802
Train [75][10/3239]	Time 0.319 (5.095)	Data Time 0.002 (4.346)	Loss 2.7485 (2.5235)	Entropy 0.60494 (0.60488)	Top-1 acc 58.203 (62.713)	Top-5 acc 80.469 (83.239)	lr 0.00802
Train [75][20/3239]	Time 0.257 (2.891)	Data Time 0.001 (2.277)	Loss 2.5256 (2.5283)	Entropy 0.60485 (0.60491)	Top-1 acc 62.500 (62.872)	Top-5 acc 82.422 (83.445)	lr 0.00802
Train [75][30/3239]	Time 0.354 (2.121)	Data Time 0.001 (1.543)	Loss 2.3677 (2.5171)	Entropy 0.60478 (0.60489)	Top-1 acc 68.750 (62.941)	Top-5 acc 85.156 (83.556)	lr 0.00802
Train [75][40/3239]	Time 0.361 (1.758)	Data Time 0.002 (1.210)	Loss 2.5657 (2.5170)	Entropy 0.60477 (0.60486)	Top-1 acc 64.453 (63.081)	Top-5 acc 82.422 (83.622)	lr 0.00802
Train [75][50/3239]	Time 0.271 (1.502)	Data Time 0.001 (0.973)	Loss 2.7446 (2.5208)	Entropy 0.60466 (0.60483)	Top-1 acc 60.547 (63.251)	Top-5 acc 80.469 (83.686)	lr 0.00802
Train [75][60/3239]	Time 0.293 (1.331)	Data Time 0.001 (0.814)	Loss 2.4815 (2.5112)	Entropy 0.60447 (0.60479)	Top-1 acc 60.938 (63.352)	Top-5 acc 82.031 (83.747)	lr 0.00801
Train [75][70/3239]	Time 0.274 (1.281)	Data Time 0.001 (0.770)	Loss 2.7153 (2.5079)	Entropy 0.60435 (0.60475)	Top-1 acc 56.641 (63.331)	Top-5 acc 80.859 (83.819)	lr 0.00801
Train [75][80/3239]	Time 0.239 (1.176)	Data Time 0.001 (0.675)	Loss 2.7278 (2.5096)	Entropy 0.60432 (0.60469)	Top-1 acc 60.156 (63.455)	Top-5 acc 80.078 (83.700)	lr 0.00801
Train [75][90/3239]	Time 0.251 (1.094)	Data Time 0.001 (0.601)	Loss 2.5750 (2.5122)	Entropy 0.60446 (0.60464)	Top-1 acc 62.500 (63.470)	Top-5 acc 83.984 (83.757)	lr 0.00801
Train [75][100/3239]	Time 0.255 (1.084)	Data Time 0.001 (0.587)	Loss 2.4931 (2.5183)	Entropy 0.60451 (0.60463)	Top-1 acc 62.109 (63.343)	Top-5 acc 83.984 (83.609)	lr 0.00801
Train [75][110/3239]	Time 0.257 (1.032)	Data Time 0.001 (0.534)	Loss 2.4309 (2.5155)	Entropy 0.60501 (0.60462)	Top-1 acc 65.625 (63.334)	Top-5 acc 83.594 (83.611)	lr 0.00801
Train [75][120/3239]	Time 0.260 (0.986)	Data Time 0.002 (0.490)	Loss 2.4927 (2.5177)	Entropy 0.60466 (0.60465)	Top-1 acc 58.984 (63.268)	Top-5 acc 85.547 (83.600)	lr 0.00801
Train [75][130/3239]	Time 0.238 (0.983)	Data Time 0.001 (0.489)	Loss 2.6254 (2.5202)	Entropy 0.60484 (0.60466)	Top-1 acc 64.062 (63.189)	Top-5 acc 79.297 (83.537)	lr 0.00801
Train [75][140/3239]	Time 0.273 (0.945)	Data Time 0.001 (0.455)	Loss 2.2312 (2.5165)	Entropy 0.60497 (0.60467)	Top-1 acc 67.578 (63.290)	Top-5 acc 87.500 (83.580)	lr 0.00801
Train [75][150/3239]	Time 0.246 (0.913)	Data Time 0.002 (0.425)	Loss 2.5972 (2.5196)	Entropy 0.60511 (0.60469)	Top-1 acc 59.375 (63.227)	Top-5 acc 82.031 (83.516)	lr 0.00801
Train [75][160/3239]	Time 3.115 (0.902)	Data Time 2.872 (0.416)	Loss 2.5758 (2.5173)	Entropy 0.60472 (0.60471)	Top-1 acc 61.328 (63.322)	Top-5 acc 82.812 (83.548)	lr 0.00801
Train [75][170/3239]	Time 0.236 (0.874)	Data Time 0.002 (0.392)	Loss 2.5983 (2.5190)	Entropy 0.60471 (0.60471)	Top-1 acc 61.328 (63.288)	Top-5 acc 83.594 (83.498)	lr 0.00800
Train [75][180/3239]	Time 0.237 (0.850)	Data Time 0.001 (0.370)	Loss 2.3737 (2.5173)	Entropy 0.60455 (0.60471)	Top-1 acc 68.750 (63.391)	Top-5 acc 84.375 (83.516)	lr 0.00800
Train [75][190/3239]	Time 0.301 (0.828)	Data Time 0.003 (0.351)	Loss 2.5569 (2.5174)	Entropy 0.60467 (0.60470)	Top-1 acc 62.500 (63.377)	Top-5 acc 83.203 (83.526)	lr 0.00800
Train [75][200/3239]	Time 0.471 (0.830)	Data Time 0.009 (0.353)	Loss 2.3499 (2.5140)	Entropy 0.60480 (0.60470)	Top-1 acc 69.141 (63.464)	Top-5 acc 85.156 (83.576)	lr 0.00800
Train [75][210/3239]	Time 0.240 (0.823)	Data Time 0.001 (0.347)	Loss 2.5133 (2.5158)	Entropy 0.60459 (0.60470)	Top-1 acc 65.234 (63.403)	Top-5 acc 82.422 (83.522)	lr 0.00800
Train [75][220/3239]	Time 0.251 (0.807)	Data Time 0.001 (0.332)	Loss 2.6063 (2.5159)	Entropy 0.60453 (0.60469)	Top-1 acc 58.984 (63.416)	Top-5 acc 83.203 (83.542)	lr 0.00800
Train [75][230/3239]	Time 0.240 (0.801)	Data Time 0.001 (0.326)	Loss 2.5805 (2.5149)	Entropy 0.60429 (0.60468)	Top-1 acc 61.719 (63.454)	Top-5 acc 82.812 (83.541)	lr 0.00800
Train [75][240/3239]	Time 0.265 (0.804)	Data Time 0.001 (0.330)	Loss 2.5964 (2.5135)	Entropy 0.60464 (0.60467)	Top-1 acc 57.031 (63.411)	Top-5 acc 84.375 (83.623)	lr 0.00800
Train [75][250/3239]	Time 0.227 (0.790)	Data Time 0.001 (0.317)	Loss 2.4345 (2.5145)	Entropy 0.60468 (0.60467)	Top-1 acc 64.844 (63.373)	Top-5 acc 85.938 (83.602)	lr 0.00800
Train [75][260/3239]	Time 0.253 (0.779)	Data Time 0.002 (0.305)	Loss 2.2292 (2.5141)	Entropy 0.60483 (0.60467)	Top-1 acc 71.484 (63.401)	Top-5 acc 87.109 (83.574)	lr 0.00800
Train [75][270/3239]	Time 0.382 (0.786)	Data Time 0.001 (0.312)	Loss 2.5944 (2.5151)	Entropy 0.60469 (0.60467)	Top-1 acc 65.625 (63.382)	Top-5 acc 80.859 (83.575)	lr 0.00799
Train [75][280/3239]	Time 0.279 (0.774)	Data Time 0.001 (0.301)	Loss 2.5166 (2.5196)	Entropy 0.60458 (0.60467)	Top-1 acc 65.234 (63.278)	Top-5 acc 81.250 (83.495)	lr 0.00799
Train [75][290/3239]	Time 0.253 (0.769)	Data Time 0.001 (0.298)	Loss 2.3315 (2.5193)	Entropy 0.60459 (0.60467)	Top-1 acc 71.875 (63.266)	Top-5 acc 87.109 (83.529)	lr 0.00799
Train [75][300/3239]	Time 5.363 (0.778)	Data Time 5.100 (0.307)	Loss 2.5019 (2.5200)	Entropy 0.60464 (0.60466)	Top-1 acc 63.672 (63.263)	Top-5 acc 85.938 (83.546)	lr 0.00799
Train [75][310/3239]	Time 0.253 (0.767)	Data Time 0.001 (0.298)	Loss 2.6515 (2.5195)	Entropy 0.60448 (0.60466)	Top-1 acc 60.547 (63.274)	Top-5 acc 79.297 (83.570)	lr 0.00799
Train [75][320/3239]	Time 0.223 (0.758)	Data Time 0.001 (0.288)	Loss 2.5288 (2.5172)	Entropy 0.60448 (0.60466)	Top-1 acc 62.500 (63.326)	Top-5 acc 84.766 (83.618)	lr 0.00799
Train [75][330/3239]	Time 0.234 (0.750)	Data Time 0.001 (0.281)	Loss 2.4554 (2.5155)	Entropy 0.60427 (0.60465)	Top-1 acc 66.797 (63.399)	Top-5 acc 85.156 (83.644)	lr 0.00799
Train [75][340/3239]	Time 0.236 (0.748)	Data Time 0.001 (0.280)	Loss 2.7605 (2.5159)	Entropy 0.60416 (0.60463)	Top-1 acc 56.250 (63.402)	Top-5 acc 79.297 (83.619)	lr 0.00799
Train [75][350/3239]	Time 0.304 (0.739)	Data Time 0.001 (0.272)	Loss 2.7280 (2.5158)	Entropy 0.60417 (0.60462)	Top-1 acc 59.766 (63.399)	Top-5 acc 77.734 (83.622)	lr 0.00799
Train [75][360/3239]	Time 0.340 (0.750)	Data Time 0.001 (0.284)	Loss 2.3095 (2.5136)	Entropy 0.60410 (0.60460)	Top-1 acc 70.312 (63.437)	Top-5 acc 87.109 (83.637)	lr 0.00799
Train [75][370/3239]	Time 0.230 (0.741)	Data Time 0.001 (0.276)	Loss 2.5732 (2.5151)	Entropy 0.60408 (0.60459)	Top-1 acc 61.328 (63.424)	Top-5 acc 82.422 (83.616)	lr 0.00799
Train [75][380/3239]	Time 0.254 (0.732)	Data Time 0.001 (0.269)	Loss 2.5789 (2.5151)	Entropy 0.60403 (0.60458)	Top-1 acc 60.938 (63.421)	Top-5 acc 84.766 (83.638)	lr 0.00798
Train [75][390/3239]	Time 0.238 (0.743)	Data Time 0.001 (0.278)	Loss 2.4973 (2.5162)	Entropy 0.60406 (0.60456)	Top-1 acc 64.062 (63.384)	Top-5 acc 84.375 (83.631)	lr 0.00798
Train [75][400/3239]	Time 0.247 (0.734)	Data Time 0.001 (0.272)	Loss 2.4484 (2.5154)	Entropy 0.60423 (0.60455)	Top-1 acc 66.406 (63.388)	Top-5 acc 83.203 (83.635)	lr 0.00798
Train [75][410/3239]	Time 0.231 (0.727)	Data Time 0.001 (0.265)	Loss 2.6202 (2.5157)	Entropy 0.60404 (0.60454)	Top-1 acc 60.547 (63.360)	Top-5 acc 82.422 (83.637)	lr 0.00798
Train [75][420/3239]	Time 0.237 (0.732)	Data Time 0.001 (0.271)	Loss 2.4032 (2.5154)	Entropy 0.60373 (0.60453)	Top-1 acc 66.406 (63.357)	Top-5 acc 84.766 (83.648)	lr 0.00798
Train [75][430/3239]	Time 0.376 (0.740)	Data Time 0.003 (0.280)	Loss 2.6900 (2.5140)	Entropy 0.60375 (0.60451)	Top-1 acc 61.719 (63.398)	Top-5 acc 79.688 (83.665)	lr 0.00798
Train [75][440/3239]	Time 0.295 (0.734)	Data Time 0.003 (0.274)	Loss 2.4149 (2.5132)	Entropy 0.60369 (0.60449)	Top-1 acc 64.844 (63.424)	Top-5 acc 84.766 (83.671)	lr 0.00798
Train [75][450/3239]	Time 0.268 (0.727)	Data Time 0.002 (0.268)	Loss 2.4285 (2.5134)	Entropy 0.60365 (0.60448)	Top-1 acc 64.062 (63.428)	Top-5 acc 83.594 (83.667)	lr 0.00798
Train [75][460/3239]	Time 6.227 (0.734)	Data Time 5.965 (0.275)	Loss 2.5411 (2.5123)	Entropy 0.60373 (0.60446)	Top-1 acc 62.500 (63.436)	Top-5 acc 82.422 (83.678)	lr 0.00798
Train [75][470/3239]	Time 0.324 (0.728)	Data Time 0.002 (0.269)	Loss 2.5671 (2.5129)	Entropy 0.60345 (0.60444)	Top-1 acc 62.109 (63.410)	Top-5 acc 83.594 (83.659)	lr 0.00798
Train [75][480/3239]	Time 0.229 (0.722)	Data Time 0.001 (0.263)	Loss 2.4822 (2.5132)	Entropy 0.60300 (0.60442)	Top-1 acc 62.109 (63.380)	Top-5 acc 83.594 (83.667)	lr 0.00798
Train [75][490/3239]	Time 0.232 (0.718)	Data Time 0.001 (0.260)	Loss 2.4647 (2.5138)	Entropy 0.60322 (0.60439)	Top-1 acc 64.844 (63.352)	Top-5 acc 83.984 (83.659)	lr 0.00797
Train [75][500/3239]	Time 0.261 (0.723)	Data Time 0.001 (0.266)	Loss 2.4711 (2.5134)	Entropy 0.60319 (0.60437)	Top-1 acc 65.234 (63.354)	Top-5 acc 83.984 (83.671)	lr 0.00797
Train [75][510/3239]	Time 0.299 (0.725)	Data Time 0.002 (0.267)	Loss 2.4893 (2.5119)	Entropy 0.60308 (0.60435)	Top-1 acc 62.109 (63.384)	Top-5 acc 84.375 (83.708)	lr 0.00797
Train [75][520/3239]	Time 0.398 (0.721)	Data Time 0.001 (0.262)	Loss 2.5031 (2.5123)	Entropy 0.60355 (0.60433)	Top-1 acc 64.453 (63.373)	Top-5 acc 83.984 (83.704)	lr 0.00797
Train [75][530/3239]	Time 0.314 (0.719)	Data Time 0.001 (0.261)	Loss 2.4521 (2.5118)	Entropy 0.60375 (0.60431)	Top-1 acc 67.578 (63.395)	Top-5 acc 85.156 (83.717)	lr 0.00797
Train [75][540/3239]	Time 3.896 (0.721)	Data Time 3.613 (0.263)	Loss 2.5178 (2.5112)	Entropy 0.60350 (0.60430)	Top-1 acc 64.453 (63.422)	Top-5 acc 84.766 (83.730)	lr 0.00797
Train [75][550/3239]	Time 0.246 (0.717)	Data Time 0.001 (0.258)	Loss 2.6046 (2.5124)	Entropy 0.60369 (0.60429)	Top-1 acc 63.672 (63.392)	Top-5 acc 81.250 (83.701)	lr 0.00797
Train [75][560/3239]	Time 0.274 (0.717)	Data Time 0.001 (0.258)	Loss 2.4018 (2.5119)	Entropy 0.60374 (0.60428)	Top-1 acc 65.234 (63.411)	Top-5 acc 87.500 (83.716)	lr 0.00797
Train [75][570/3239]	Time 0.263 (0.712)	Data Time 0.001 (0.253)	Loss 2.4588 (2.5118)	Entropy 0.60359 (0.60427)	Top-1 acc 67.188 (63.423)	Top-5 acc 83.984 (83.712)	lr 0.00797
Train [75][580/3239]	Time 0.266 (0.715)	Data Time 0.001 (0.256)	Loss 2.5571 (2.5115)	Entropy 0.60380 (0.60426)	Top-1 acc 64.453 (63.435)	Top-5 acc 82.422 (83.728)	lr 0.00797
Train [75][590/3239]	Time 0.355 (0.714)	Data Time 0.001 (0.256)	Loss 2.6814 (2.5118)	Entropy 0.60407 (0.60425)	Top-1 acc 58.984 (63.426)	Top-5 acc 78.516 (83.714)	lr 0.00796
Train [75][600/3239]	Time 0.262 (0.797)	Data Time 0.003 (0.252)	Loss 2.4941 (2.5127)	Entropy 0.60443 (0.60425)	Top-1 acc 60.938 (63.404)	Top-5 acc 83.594 (83.691)	lr 0.00796
Train [75][610/3239]	Time 0.240 (0.791)	Data Time 0.002 (0.248)	Loss 2.7149 (2.5133)	Entropy 0.60441 (0.60425)	Top-1 acc 58.203 (63.384)	Top-5 acc 79.297 (83.672)	lr 0.00796
Train [75][620/3239]	Time 0.244 (0.785)	Data Time 0.002 (0.244)	Loss 2.5385 (2.5130)	Entropy 0.60382 (0.60425)	Top-1 acc 62.500 (63.395)	Top-5 acc 84.375 (83.683)	lr 0.00796
Train [75][630/3239]	Time 0.276 (0.780)	Data Time 0.002 (0.240)	Loss 2.6184 (2.5147)	Entropy 0.60379 (0.60425)	Top-1 acc 57.031 (63.342)	Top-5 acc 83.203 (83.647)	lr 0.00796
Train [75][640/3239]	Time 0.254 (0.775)	Data Time 0.001 (0.236)	Loss 2.7439 (2.5156)	Entropy 0.60392 (0.60424)	Top-1 acc 56.250 (63.317)	Top-5 acc 79.688 (83.633)	lr 0.00796
Train [75][650/3239]	Time 0.272 (0.770)	Data Time 0.001 (0.233)	Loss 2.4817 (2.5158)	Entropy 0.60404 (0.60424)	Top-1 acc 64.453 (63.305)	Top-5 acc 83.203 (83.612)	lr 0.00796
Train [75][660/3239]	Time 0.258 (0.766)	Data Time 0.001 (0.229)	Loss 2.4503 (2.5157)	Entropy 0.60421 (0.60423)	Top-1 acc 65.234 (63.307)	Top-5 acc 85.156 (83.611)	lr 0.00796
Train [75][670/3239]	Time 0.266 (0.761)	Data Time 0.001 (0.226)	Loss 2.5682 (2.5161)	Entropy 0.60386 (0.60423)	Top-1 acc 64.062 (63.295)	Top-5 acc 82.031 (83.601)	lr 0.00796
Train [75][680/3239]	Time 0.328 (0.757)	Data Time 0.001 (0.222)	Loss 2.5446 (2.5161)	Entropy 0.60370 (0.60423)	Top-1 acc 60.156 (63.290)	Top-5 acc 80.859 (83.589)	lr 0.00796
Train [75][690/3239]	Time 0.254 (0.752)	Data Time 0.003 (0.219)	Loss 2.4804 (2.5160)	Entropy 0.60330 (0.60422)	Top-1 acc 62.500 (63.289)	Top-5 acc 83.594 (83.594)	lr 0.00796
Train [75][700/3239]	Time 0.246 (0.750)	Data Time 0.002 (0.218)	Loss 2.5921 (2.5168)	Entropy 0.60313 (0.60420)	Top-1 acc 62.109 (63.285)	Top-5 acc 82.422 (83.584)	lr 0.00795
Train [75][710/3239]	Time 0.282 (0.749)	Data Time 0.007 (0.218)	Loss 2.7054 (2.5172)	Entropy 0.60276 (0.60419)	Top-1 acc 61.719 (63.291)	Top-5 acc 79.297 (83.568)	lr 0.00795
Train [75][720/3239]	Time 0.244 (0.747)	Data Time 0.001 (0.217)	Loss 2.3953 (2.5176)	Entropy 0.60247 (0.60416)	Top-1 acc 66.406 (63.280)	Top-5 acc 84.766 (83.563)	lr 0.00795
Train [75][730/3239]	Time 0.261 (0.752)	Data Time 0.001 (0.223)	Loss 2.5260 (2.5171)	Entropy 0.60286 (0.60414)	Top-1 acc 60.156 (63.289)	Top-5 acc 82.422 (83.572)	lr 0.00795
Train [75][740/3239]	Time 0.260 (0.748)	Data Time 0.001 (0.221)	Loss 2.5395 (2.5166)	Entropy 0.60308 (0.60413)	Top-1 acc 64.062 (63.293)	Top-5 acc 82.031 (83.579)	lr 0.00795
Train [75][750/3239]	Time 0.352 (0.750)	Data Time 0.001 (0.223)	Loss 2.4164 (2.5161)	Entropy 0.60294 (0.60411)	Top-1 acc 66.797 (63.302)	Top-5 acc 85.938 (83.597)	lr 0.00795
Train [75][760/3239]	Time 0.251 (0.753)	Data Time 0.001 (0.228)	Loss 2.3372 (2.5170)	Entropy 0.60297 (0.60409)	Top-1 acc 67.969 (63.285)	Top-5 acc 83.984 (83.569)	lr 0.00795
Train [75][770/3239]	Time 0.254 (0.749)	Data Time 0.001 (0.225)	Loss 2.8078 (2.5174)	Entropy 0.60341 (0.60408)	Top-1 acc 56.250 (63.278)	Top-5 acc 77.734 (83.563)	lr 0.00795
Train [75][780/3239]	Time 0.282 (0.748)	Data Time 0.001 (0.224)	Loss 2.6258 (2.5178)	Entropy 0.60332 (0.60407)	Top-1 acc 60.156 (63.270)	Top-5 acc 82.422 (83.558)	lr 0.00795
Train [75][790/3239]	Time 0.260 (0.754)	Data Time 0.001 (0.231)	Loss 2.4861 (2.5171)	Entropy 0.60353 (0.60406)	Top-1 acc 67.578 (63.286)	Top-5 acc 82.422 (83.575)	lr 0.00795
Train [75][800/3239]	Time 0.245 (0.751)	Data Time 0.001 (0.229)	Loss 2.6246 (2.5172)	Entropy 0.60356 (0.60406)	Top-1 acc 61.328 (63.278)	Top-5 acc 82.812 (83.574)	lr 0.00795
Train [75][810/3239]	Time 0.248 (0.748)	Data Time 0.002 (0.227)	Loss 2.3692 (2.5182)	Entropy 0.60342 (0.60405)	Top-1 acc 67.969 (63.259)	Top-5 acc 86.719 (83.559)	lr 0.00794
Train [75][820/3239]	Time 0.365 (0.749)	Data Time 0.001 (0.229)	Loss 2.4599 (2.5175)	Entropy 0.60347 (0.60404)	Top-1 acc 62.500 (63.258)	Top-5 acc 86.328 (83.569)	lr 0.00794
Train [75][830/3239]	Time 0.247 (0.751)	Data Time 0.001 (0.231)	Loss 2.4902 (2.5176)	Entropy 0.60360 (0.60404)	Top-1 acc 65.625 (63.253)	Top-5 acc 84.766 (83.566)	lr 0.00794
Train [75][840/3239]	Time 0.260 (0.750)	Data Time 0.001 (0.232)	Loss 2.4825 (2.5174)	Entropy 0.60356 (0.60403)	Top-1 acc 65.625 (63.270)	Top-5 acc 82.812 (83.564)	lr 0.00794
Train [75][850/3239]	Time 0.273 (0.748)	Data Time 0.001 (0.230)	Loss 2.5618 (2.5182)	Entropy 0.60387 (0.60403)	Top-1 acc 58.984 (63.243)	Top-5 acc 82.422 (83.552)	lr 0.00794
Train [75][860/3239]	Time 0.254 (0.753)	Data Time 0.001 (0.236)	Loss 2.5162 (2.5192)	Entropy 0.60382 (0.60403)	Top-1 acc 61.719 (63.221)	Top-5 acc 84.375 (83.536)	lr 0.00794
Train [75][870/3239]	Time 1.759 (0.753)	Data Time 1.518 (0.237)	Loss 2.4145 (2.5194)	Entropy 0.60396 (0.60403)	Top-1 acc 63.281 (63.219)	Top-5 acc 84.766 (83.540)	lr 0.00794
Train [75][880/3239]	Time 0.243 (0.750)	Data Time 0.001 (0.234)	Loss 2.6881 (2.5195)	Entropy 0.60373 (0.60402)	Top-1 acc 60.547 (63.225)	Top-5 acc 81.641 (83.545)	lr 0.00794
Train [75][890/3239]	Time 0.238 (0.754)	Data Time 0.001 (0.239)	Loss 2.5402 (2.5190)	Entropy 0.60393 (0.60402)	Top-1 acc 66.406 (63.248)	Top-5 acc 81.641 (83.550)	lr 0.00794
Train [75][900/3239]	Time 0.245 (0.752)	Data Time 0.002 (0.238)	Loss 2.6360 (2.5191)	Entropy 0.60370 (0.60402)	Top-1 acc 58.203 (63.246)	Top-5 acc 83.594 (83.543)	lr 0.00794
Train [75][910/3239]	Time 0.374 (0.757)	Data Time 0.001 (0.244)	Loss 2.4797 (2.5187)	Entropy 0.60341 (0.60401)	Top-1 acc 62.109 (63.248)	Top-5 acc 83.594 (83.550)	lr 0.00793
Train [75][920/3239]	Time 0.263 (0.757)	Data Time 0.001 (0.245)	Loss 2.4767 (2.5193)	Entropy 0.60317 (0.60401)	Top-1 acc 66.016 (63.231)	Top-5 acc 83.984 (83.544)	lr 0.00793
Train [75][930/3239]	Time 1.680 (0.756)	Data Time 1.414 (0.244)	Loss 2.5079 (2.5193)	Entropy 0.60300 (0.60400)	Top-1 acc 62.109 (63.230)	Top-5 acc 84.375 (83.541)	lr 0.00793
Train [75][940/3239]	Time 4.535 (0.760)	Data Time 4.278 (0.249)	Loss 2.5704 (2.5202)	Entropy 0.60264 (0.60398)	Top-1 acc 65.625 (63.209)	Top-5 acc 80.469 (83.524)	lr 0.00793
Train [75][950/3239]	Time 1.191 (0.760)	Data Time 0.948 (0.250)	Loss 2.6291 (2.5213)	Entropy 0.60270 (0.60397)	Top-1 acc 62.500 (63.175)	Top-5 acc 80.469 (83.506)	lr 0.00793
Train [75][960/3239]	Time 0.245 (0.760)	Data Time 0.001 (0.250)	Loss 2.4396 (2.5216)	Entropy 0.60285 (0.60396)	Top-1 acc 63.672 (63.169)	Top-5 acc 85.547 (83.506)	lr 0.00793
Train [75][970/3239]	Time 0.255 (0.757)	Data Time 0.001 (0.248)	Loss 2.5710 (2.5218)	Entropy 0.60267 (0.60394)	Top-1 acc 64.453 (63.166)	Top-5 acc 82.812 (83.499)	lr 0.00793
Train [75][980/3239]	Time 1.510 (0.759)	Data Time 1.116 (0.251)	Loss 2.5570 (2.5228)	Entropy 0.60248 (0.60393)	Top-1 acc 63.672 (63.142)	Top-5 acc 80.859 (83.487)	lr 0.00793
Train [75][990/3239]	Time 0.256 (0.764)	Data Time 0.001 (0.256)	Loss 2.4960 (2.5233)	Entropy 0.60250 (0.60392)	Top-1 acc 64.453 (63.127)	Top-5 acc 82.812 (83.462)	lr 0.00793
Train [75][1000/3239]	Time 0.246 (0.760)	Data Time 0.001 (0.253)	Loss 2.5508 (2.5235)	Entropy 0.60234 (0.60390)	Top-1 acc 62.500 (63.122)	Top-5 acc 85.547 (83.455)	lr 0.00793
Train [75][1010/3239]	Time 0.233 (0.762)	Data Time 0.001 (0.256)	Loss 2.6607 (2.5239)	Entropy 0.60211 (0.60389)	Top-1 acc 60.938 (63.117)	Top-5 acc 80.078 (83.448)	lr 0.00793
Train [75][1020/3239]	Time 0.234 (0.766)	Data Time 0.001 (0.260)	Loss 2.7566 (2.5236)	Entropy 0.60245 (0.60387)	Top-1 acc 54.688 (63.119)	Top-5 acc 79.297 (83.453)	lr 0.00792
Train [75][1030/3239]	Time 0.292 (0.764)	Data Time 0.002 (0.259)	Loss 2.5998 (2.5233)	Entropy 0.60262 (0.60386)	Top-1 acc 60.938 (63.131)	Top-5 acc 82.422 (83.454)	lr 0.00792
Train [75][1040/3239]	Time 0.253 (0.765)	Data Time 0.002 (0.260)	Loss 2.5881 (2.5229)	Entropy 0.60292 (0.60384)	Top-1 acc 58.203 (63.137)	Top-5 acc 82.812 (83.454)	lr 0.00792
Train [75][1050/3239]	Time 0.251 (0.768)	Data Time 0.001 (0.264)	Loss 2.4019 (2.5236)	Entropy 0.60300 (0.60384)	Top-1 acc 66.797 (63.119)	Top-5 acc 84.375 (83.439)	lr 0.00792
Train [75][1060/3239]	Time 0.818 (0.766)	Data Time 0.578 (0.263)	Loss 2.5031 (2.5232)	Entropy 0.60312 (0.60383)	Top-1 acc 62.891 (63.124)	Top-5 acc 86.328 (83.450)	lr 0.00792
Train [75][1070/3239]	Time 0.343 (0.769)	Data Time 0.001 (0.266)	Loss 2.5210 (2.5232)	Entropy 0.60314 (0.60382)	Top-1 acc 65.234 (63.121)	Top-5 acc 82.812 (83.453)	lr 0.00792
Train [75][1080/3239]	Time 0.231 (0.773)	Data Time 0.001 (0.271)	Loss 2.6105 (2.5227)	Entropy 0.60294 (0.60381)	Top-1 acc 59.766 (63.128)	Top-5 acc 83.984 (83.468)	lr 0.00792
Train [75][1090/3239]	Time 0.240 (0.770)	Data Time 0.001 (0.269)	Loss 2.3264 (2.5227)	Entropy 0.60302 (0.60381)	Top-1 acc 67.578 (63.129)	Top-5 acc 87.109 (83.467)	lr 0.00792
Train [75][1100/3239]	Time 4.687 (0.773)	Data Time 4.403 (0.272)	Loss 2.4408 (2.5216)	Entropy 0.60306 (0.60380)	Top-1 acc 62.109 (63.157)	Top-5 acc 84.766 (83.490)	lr 0.00792
Train [75][1110/3239]	Time 0.250 (0.776)	Data Time 0.001 (0.276)	Loss 2.4689 (2.5217)	Entropy 0.60326 (0.60379)	Top-1 acc 65.234 (63.147)	Top-5 acc 85.938 (83.488)	lr 0.00792
Train [75][1120/3239]	Time 0.242 (0.775)	Data Time 0.001 (0.275)	Loss 2.4190 (2.5215)	Entropy 0.60335 (0.60379)	Top-1 acc 66.797 (63.153)	Top-5 acc 86.328 (83.492)	lr 0.00791
Train [75][1130/3239]	Time 0.256 (0.774)	Data Time 0.001 (0.275)	Loss 2.7681 (2.5219)	Entropy 0.60342 (0.60378)	Top-1 acc 57.812 (63.145)	Top-5 acc 81.250 (83.479)	lr 0.00791
Train [75][1140/3239]	Time 7.664 (0.780)	Data Time 7.312 (0.281)	Loss 2.7559 (2.5225)	Entropy 0.60347 (0.60378)	Top-1 acc 51.172 (63.123)	Top-5 acc 81.641 (83.472)	lr 0.00791
Train [75][1150/3239]	Time 0.257 (0.779)	Data Time 0.002 (0.281)	Loss 2.3612 (2.5224)	Entropy 0.60358 (0.60378)	Top-1 acc 68.359 (63.125)	Top-5 acc 87.109 (83.474)	lr 0.00791
Train [75][1160/3239]	Time 0.255 (0.776)	Data Time 0.001 (0.279)	Loss 2.4692 (2.5226)	Entropy 0.60379 (0.60378)	Top-1 acc 62.109 (63.123)	Top-5 acc 84.375 (83.470)	lr 0.00791
Train [75][1170/3239]	Time 0.247 (0.780)	Data Time 0.001 (0.283)	Loss 2.6836 (2.5229)	Entropy 0.60384 (0.60378)	Top-1 acc 56.250 (63.114)	Top-5 acc 83.203 (83.471)	lr 0.00791
Train [75][1180/3239]	Time 0.234 (0.787)	Data Time 0.001 (0.290)	Loss 2.3914 (2.5227)	Entropy 0.60385 (0.60378)	Top-1 acc 65.625 (63.120)	Top-5 acc 87.109 (83.479)	lr 0.00791
Train [75][1190/3239]	Time 0.234 (0.784)	Data Time 0.001 (0.288)	Loss 2.3604 (2.5228)	Entropy 0.60411 (0.60378)	Top-1 acc 67.578 (63.125)	Top-5 acc 84.766 (83.479)	lr 0.00791
Train [75][1200/3239]	Time 0.237 (0.789)	Data Time 0.001 (0.293)	Loss 2.9442 (2.5237)	Entropy 0.60442 (0.60378)	Top-1 acc 52.344 (63.110)	Top-5 acc 76.562 (83.467)	lr 0.00791
Train [75][1210/3239]	Time 0.248 (0.791)	Data Time 0.001 (0.296)	Loss 2.4981 (2.5238)	Entropy 0.60428 (0.60379)	Top-1 acc 63.672 (63.111)	Top-5 acc 83.984 (83.460)	lr 0.00791
Train [75][1220/3239]	Time 0.257 (0.788)	Data Time 0.002 (0.294)	Loss 2.2433 (2.5238)	Entropy 0.60431 (0.60379)	Top-1 acc 70.312 (63.111)	Top-5 acc 89.453 (83.462)	lr 0.00791
Train [75][1230/3239]	Time 0.244 (0.795)	Data Time 0.001 (0.301)	Loss 2.3934 (2.5235)	Entropy 0.60439 (0.60380)	Top-1 acc 65.625 (63.119)	Top-5 acc 85.938 (83.464)	lr 0.00790
Train [75][1240/3239]	Time 0.249 (0.795)	Data Time 0.001 (0.301)	Loss 2.6919 (2.5235)	Entropy 0.60432 (0.60380)	Top-1 acc 64.844 (63.126)	Top-5 acc 82.031 (83.468)	lr 0.00790
Train [75][1250/3239]	Time 0.430 (0.835)	Data Time 0.033 (0.301)	Loss 2.5198 (2.5236)	Entropy 0.60435 (0.60380)	Top-1 acc 67.188 (63.120)	Top-5 acc 82.031 (83.464)	lr 0.00790
Train [75][1260/3239]	Time 0.246 (0.832)	Data Time 0.002 (0.299)	Loss 2.5684 (2.5237)	Entropy 0.60441 (0.60381)	Top-1 acc 63.672 (63.118)	Top-5 acc 81.641 (83.470)	lr 0.00790
Train [75][1270/3239]	Time 0.249 (0.829)	Data Time 0.002 (0.296)	Loss 2.5809 (2.5233)	Entropy 0.60461 (0.60381)	Top-1 acc 60.156 (63.122)	Top-5 acc 83.984 (83.476)	lr 0.00790
Train [75][1280/3239]	Time 0.251 (0.826)	Data Time 0.002 (0.294)	Loss 2.5238 (2.5237)	Entropy 0.60423 (0.60382)	Top-1 acc 62.500 (63.111)	Top-5 acc 82.422 (83.467)	lr 0.00790
Train [75][1290/3239]	Time 0.268 (0.823)	Data Time 0.001 (0.292)	Loss 2.5380 (2.5239)	Entropy 0.60421 (0.60382)	Top-1 acc 60.938 (63.095)	Top-5 acc 82.031 (83.458)	lr 0.00790
Train [75][1300/3239]	Time 0.341 (0.820)	Data Time 0.001 (0.290)	Loss 2.6594 (2.5242)	Entropy 0.60422 (0.60382)	Top-1 acc 60.938 (63.087)	Top-5 acc 81.250 (83.458)	lr 0.00790
Train [75][1310/3239]	Time 0.265 (0.817)	Data Time 0.001 (0.287)	Loss 2.5758 (2.5243)	Entropy 0.60458 (0.60383)	Top-1 acc 62.500 (63.085)	Top-5 acc 81.250 (83.458)	lr 0.00790
Train [75][1320/3239]	Time 2.915 (0.818)	Data Time 2.647 (0.288)	Loss 2.3717 (2.5239)	Entropy 0.60458 (0.60383)	Top-1 acc 67.578 (63.095)	Top-5 acc 85.938 (83.468)	lr 0.00790
Train [75][1330/3239]	Time 0.245 (0.815)	Data Time 0.001 (0.287)	Loss 2.5949 (2.5239)	Entropy 0.60429 (0.60384)	Top-1 acc 60.547 (63.096)	Top-5 acc 83.203 (83.463)	lr 0.00790
Train [75][1340/3239]	Time 0.236 (0.815)	Data Time 0.001 (0.287)	Loss 2.5258 (2.5237)	Entropy 0.60452 (0.60384)	Top-1 acc 64.844 (63.102)	Top-5 acc 83.984 (83.466)	lr 0.00789
Train [75][1350/3239]	Time 0.228 (0.818)	Data Time 0.001 (0.291)	Loss 2.6433 (2.5240)	Entropy 0.60459 (0.60385)	Top-1 acc 59.766 (63.088)	Top-5 acc 83.594 (83.462)	lr 0.00789
Train [75][1360/3239]	Time 0.241 (0.822)	Data Time 0.001 (0.295)	Loss 2.5560 (2.5238)	Entropy 0.60470 (0.60385)	Top-1 acc 64.062 (63.098)	Top-5 acc 84.375 (83.473)	lr 0.00789
Train [75][1370/3239]	Time 0.262 (0.821)	Data Time 0.001 (0.295)	Loss 2.5490 (2.5239)	Entropy 0.60476 (0.60386)	Top-1 acc 63.281 (63.099)	Top-5 acc 84.766 (83.474)	lr 0.00789
Train [75][1380/3239]	Time 0.236 (0.824)	Data Time 0.001 (0.298)	Loss 2.4770 (2.5241)	Entropy 0.60477 (0.60387)	Top-1 acc 63.672 (63.101)	Top-5 acc 83.984 (83.463)	lr 0.00789
Train [75][1390/3239]	Time 0.278 (0.825)	Data Time 0.001 (0.301)	Loss 2.5415 (2.5239)	Entropy 0.60508 (0.60387)	Top-1 acc 59.766 (63.103)	Top-5 acc 82.812 (83.469)	lr 0.00789
Train [75][1400/3239]	Time 0.248 (0.826)	Data Time 0.001 (0.303)	Loss 2.3967 (2.5236)	Entropy 0.60498 (0.60388)	Top-1 acc 67.969 (63.112)	Top-5 acc 83.203 (83.473)	lr 0.00789
Train [75][1410/3239]	Time 4.646 (0.827)	Data Time 4.387 (0.304)	Loss 2.4750 (2.5236)	Entropy 0.60503 (0.60389)	Top-1 acc 65.234 (63.104)	Top-5 acc 80.469 (83.471)	lr 0.00789
Train [75][1420/3239]	Time 4.068 (0.829)	Data Time 3.803 (0.306)	Loss 2.5650 (2.5238)	Entropy 0.60468 (0.60390)	Top-1 acc 62.109 (63.105)	Top-5 acc 80.078 (83.466)	lr 0.00789
Train [75][1430/3239]	Time 0.243 (0.829)	Data Time 0.001 (0.307)	Loss 2.4749 (2.5238)	Entropy 0.60464 (0.60390)	Top-1 acc 60.547 (63.096)	Top-5 acc 86.328 (83.471)	lr 0.00789
Train [75][1440/3239]	Time 0.247 (0.827)	Data Time 0.001 (0.305)	Loss 2.5107 (2.5235)	Entropy 0.60491 (0.60391)	Top-1 acc 64.062 (63.106)	Top-5 acc 83.203 (83.478)	lr 0.00788
Train [75][1450/3239]	Time 0.250 (0.831)	Data Time 0.001 (0.310)	Loss 2.5366 (2.5237)	Entropy 0.60462 (0.60391)	Top-1 acc 62.891 (63.099)	Top-5 acc 82.422 (83.474)	lr 0.00788
Train [75][1460/3239]	Time 0.387 (0.834)	Data Time 0.002 (0.313)	Loss 2.4135 (2.5235)	Entropy 0.60444 (0.60392)	Top-1 acc 66.406 (63.114)	Top-5 acc 84.766 (83.471)	lr 0.00788
Train [75][1470/3239]	Time 0.263 (0.831)	Data Time 0.001 (0.311)	Loss 2.5931 (2.5234)	Entropy 0.60434 (0.60392)	Top-1 acc 65.234 (63.116)	Top-5 acc 79.688 (83.471)	lr 0.00788
Train [75][1480/3239]	Time 0.257 (0.833)	Data Time 0.001 (0.314)	Loss 2.4756 (2.5236)	Entropy 0.60437 (0.60393)	Top-1 acc 63.281 (63.111)	Top-5 acc 82.031 (83.466)	lr 0.00788
Train [75][1490/3239]	Time 0.258 (0.834)	Data Time 0.001 (0.315)	Loss 2.5148 (2.5236)	Entropy 0.60458 (0.60393)	Top-1 acc 61.719 (63.103)	Top-5 acc 84.766 (83.467)	lr 0.00788
Train [75][1500/3239]	Time 0.242 (0.834)	Data Time 0.001 (0.315)	Loss 2.5088 (2.5233)	Entropy 0.60433 (0.60393)	Top-1 acc 64.453 (63.108)	Top-5 acc 83.594 (83.474)	lr 0.00788
Train [75][1510/3239]	Time 1.046 (0.835)	Data Time 0.785 (0.317)	Loss 2.7307 (2.5235)	Entropy 0.60441 (0.60394)	Top-1 acc 57.422 (63.100)	Top-5 acc 84.375 (83.476)	lr 0.00788
Train [75][1520/3239]	Time 0.252 (0.836)	Data Time 0.001 (0.318)	Loss 2.3080 (2.5235)	Entropy 0.60429 (0.60394)	Top-1 acc 68.359 (63.101)	Top-5 acc 87.500 (83.479)	lr 0.00788
Train [75][1530/3239]	Time 0.361 (0.837)	Data Time 0.002 (0.320)	Loss 2.5640 (2.5241)	Entropy 0.60448 (0.60394)	Top-1 acc 61.719 (63.091)	Top-5 acc 84.766 (83.465)	lr 0.00788
Train [75][1540/3239]	Time 3.038 (0.839)	Data Time 2.782 (0.323)	Loss 2.6055 (2.5241)	Entropy 0.60467 (0.60395)	Top-1 acc 58.594 (63.094)	Top-5 acc 82.422 (83.467)	lr 0.00788
Train [75][1550/3239]	Time 0.286 (0.839)	Data Time 0.001 (0.323)	Loss 2.4520 (2.5239)	Entropy 0.60439 (0.60395)	Top-1 acc 67.578 (63.098)	Top-5 acc 83.203 (83.471)	lr 0.00787
Train [75][1560/3239]	Time 0.238 (0.840)	Data Time 0.001 (0.325)	Loss 2.4599 (2.5239)	Entropy 0.60433 (0.60395)	Top-1 acc 66.406 (63.101)	Top-5 acc 83.984 (83.470)	lr 0.00787
Train [75][1570/3239]	Time 5.322 (0.841)	Data Time 5.014 (0.326)	Loss 2.5504 (2.5240)	Entropy 0.60447 (0.60395)	Top-1 acc 65.234 (63.102)	Top-5 acc 87.109 (83.470)	lr 0.00787
Train [75][1580/3239]	Time 0.257 (0.848)	Data Time 0.001 (0.333)	Loss 2.3735 (2.5239)	Entropy 0.60477 (0.60396)	Top-1 acc 68.750 (63.105)	Top-5 acc 84.766 (83.467)	lr 0.00787
Train [75][1590/3239]	Time 0.222 (0.845)	Data Time 0.001 (0.331)	Loss 2.5067 (2.5237)	Entropy 0.60482 (0.60396)	Top-1 acc 64.844 (63.107)	Top-5 acc 83.203 (83.473)	lr 0.00787
Train [75][1600/3239]	Time 0.243 (0.843)	Data Time 0.001 (0.329)	Loss 2.4765 (2.5239)	Entropy 0.60491 (0.60397)	Top-1 acc 64.062 (63.102)	Top-5 acc 82.422 (83.463)	lr 0.00787
Train [75][1610/3239]	Time 0.244 (0.852)	Data Time 0.001 (0.339)	Loss 2.3792 (2.5237)	Entropy 0.60516 (0.60398)	Top-1 acc 66.406 (63.105)	Top-5 acc 86.719 (83.465)	lr 0.00787
Train [75][1620/3239]	Time 0.326 (0.849)	Data Time 0.001 (0.337)	Loss 2.5869 (2.5236)	Entropy 0.60530 (0.60398)	Top-1 acc 59.375 (63.102)	Top-5 acc 82.422 (83.467)	lr 0.00787
Train [75][1630/3239]	Time 0.230 (0.847)	Data Time 0.001 (0.335)	Loss 2.5414 (2.5237)	Entropy 0.60535 (0.60399)	Top-1 acc 59.375 (63.099)	Top-5 acc 83.594 (83.463)	lr 0.00787
Train [75][1640/3239]	Time 0.253 (0.857)	Data Time 0.001 (0.345)	Loss 2.4170 (2.5238)	Entropy 0.60535 (0.60400)	Top-1 acc 66.406 (63.094)	Top-5 acc 84.375 (83.459)	lr 0.00787
Train [75][1650/3239]	Time 0.261 (0.855)	Data Time 0.001 (0.343)	Loss 2.6532 (2.5245)	Entropy 0.60514 (0.60401)	Top-1 acc 60.547 (63.069)	Top-5 acc 79.688 (83.444)	lr 0.00787
Train [75][1660/3239]	Time 0.257 (0.852)	Data Time 0.002 (0.341)	Loss 2.5503 (2.5249)	Entropy 0.60517 (0.60401)	Top-1 acc 64.453 (63.063)	Top-5 acc 83.594 (83.436)	lr 0.00786
Train [75][1670/3239]	Time 9.849 (0.860)	Data Time 9.586 (0.349)	Loss 2.5487 (2.5251)	Entropy 0.60530 (0.60402)	Top-1 acc 63.281 (63.069)	Top-5 acc 83.984 (83.432)	lr 0.00786
Train [75][1680/3239]	Time 0.265 (0.857)	Data Time 0.002 (0.347)	Loss 2.5301 (2.5255)	Entropy 0.60549 (0.60403)	Top-1 acc 59.375 (63.058)	Top-5 acc 83.203 (83.424)	lr 0.00786
Train [75][1690/3239]	Time 0.369 (0.855)	Data Time 0.002 (0.345)	Loss 2.4419 (2.5254)	Entropy 0.60541 (0.60404)	Top-1 acc 66.797 (63.063)	Top-5 acc 82.812 (83.429)	lr 0.00786
Train [75][1700/3239]	Time 4.477 (0.855)	Data Time 4.200 (0.345)	Loss 2.5416 (2.5253)	Entropy 0.60523 (0.60405)	Top-1 acc 61.328 (63.072)	Top-5 acc 83.203 (83.429)	lr 0.00786
Train [75][1710/3239]	Time 0.289 (0.858)	Data Time 0.002 (0.349)	Loss 2.5918 (2.5253)	Entropy 0.60525 (0.60405)	Top-1 acc 63.672 (63.078)	Top-5 acc 83.203 (83.429)	lr 0.00786
Train [75][1720/3239]	Time 0.244 (0.856)	Data Time 0.002 (0.347)	Loss 2.4421 (2.5252)	Entropy 0.60547 (0.60406)	Top-1 acc 65.234 (63.081)	Top-5 acc 85.156 (83.432)	lr 0.00786
Train [75][1730/3239]	Time 2.455 (0.855)	Data Time 2.161 (0.346)	Loss 2.7285 (2.5257)	Entropy 0.60576 (0.60407)	Top-1 acc 57.812 (63.069)	Top-5 acc 79.688 (83.424)	lr 0.00786
Train [75][1740/3239]	Time 0.233 (0.860)	Data Time 0.001 (0.352)	Loss 2.2410 (2.5258)	Entropy 0.60590 (0.60408)	Top-1 acc 70.703 (63.065)	Top-5 acc 91.016 (83.424)	lr 0.00786
Train [75][1750/3239]	Time 0.244 (0.858)	Data Time 0.002 (0.350)	Loss 2.5871 (2.5256)	Entropy 0.60618 (0.60409)	Top-1 acc 60.547 (63.066)	Top-5 acc 83.984 (83.426)	lr 0.00786
Train [75][1760/3239]	Time 0.238 (0.855)	Data Time 0.001 (0.348)	Loss 2.6335 (2.5263)	Entropy 0.60591 (0.60410)	Top-1 acc 59.375 (63.050)	Top-5 acc 80.078 (83.412)	lr 0.00785
Train [75][1770/3239]	Time 0.238 (0.861)	Data Time 0.001 (0.354)	Loss 2.6935 (2.5266)	Entropy 0.60612 (0.60411)	Top-1 acc 60.938 (63.039)	Top-5 acc 82.031 (83.403)	lr 0.00785
Train [75][1780/3239]	Time 0.346 (0.858)	Data Time 0.004 (0.352)	Loss 2.3570 (2.5265)	Entropy 0.60549 (0.60412)	Top-1 acc 68.750 (63.044)	Top-5 acc 85.156 (83.405)	lr 0.00785
Train [75][1790/3239]	Time 0.239 (0.856)	Data Time 0.001 (0.350)	Loss 2.4387 (2.5265)	Entropy 0.60581 (0.60413)	Top-1 acc 64.453 (63.043)	Top-5 acc 86.328 (83.405)	lr 0.00785
Train [75][1800/3239]	Time 0.261 (0.864)	Data Time 0.001 (0.358)	Loss 2.6074 (2.5265)	Entropy 0.60601 (0.60414)	Top-1 acc 60.547 (63.049)	Top-5 acc 82.422 (83.402)	lr 0.00785
Train [75][1810/3239]	Time 0.282 (0.861)	Data Time 0.003 (0.356)	Loss 2.4399 (2.5266)	Entropy 0.60611 (0.60415)	Top-1 acc 67.188 (63.045)	Top-5 acc 83.203 (83.399)	lr 0.00785
Train [75][1820/3239]	Time 0.262 (0.859)	Data Time 0.001 (0.354)	Loss 2.4060 (2.5265)	Entropy 0.60582 (0.60416)	Top-1 acc 65.625 (63.047)	Top-5 acc 85.938 (83.399)	lr 0.00785
Train [75][1830/3239]	Time 11.240 (0.864)	Data Time 10.957 (0.360)	Loss 2.3906 (2.5265)	Entropy 0.60568 (0.60417)	Top-1 acc 66.797 (63.048)	Top-5 acc 85.156 (83.400)	lr 0.00785
Train [75][1840/3239]	Time 0.239 (0.862)	Data Time 0.001 (0.358)	Loss 2.6797 (2.5268)	Entropy 0.60533 (0.60418)	Top-1 acc 60.938 (63.043)	Top-5 acc 80.859 (83.394)	lr 0.00785
Train [75][1850/3239]	Time 0.379 (0.860)	Data Time 0.001 (0.356)	Loss 2.3707 (2.5267)	Entropy 0.60524 (0.60418)	Top-1 acc 67.969 (63.048)	Top-5 acc 87.109 (83.396)	lr 0.00785
Train [75][1860/3239]	Time 2.926 (0.860)	Data Time 2.673 (0.356)	Loss 2.5138 (2.5269)	Entropy 0.60498 (0.60419)	Top-1 acc 60.938 (63.038)	Top-5 acc 81.250 (83.388)	lr 0.00785
Train [75][1870/3239]	Time 0.249 (0.865)	Data Time 0.001 (0.362)	Loss 2.3713 (2.5272)	Entropy 0.60530 (0.60419)	Top-1 acc 67.969 (63.036)	Top-5 acc 85.547 (83.385)	lr 0.00784
Train [75][1880/3239]	Time 0.284 (0.863)	Data Time 0.001 (0.360)	Loss 2.5944 (2.5270)	Entropy 0.60490 (0.60420)	Top-1 acc 59.375 (63.037)	Top-5 acc 82.031 (83.390)	lr 0.00784
Train [75][1890/3239]	Time 0.253 (0.862)	Data Time 0.001 (0.359)	Loss 2.4542 (2.5271)	Entropy 0.60498 (0.60420)	Top-1 acc 63.672 (63.033)	Top-5 acc 84.375 (83.388)	lr 0.00784
Train [75][1900/3239]	Time 0.263 (0.866)	Data Time 0.001 (0.364)	Loss 2.5039 (2.5266)	Entropy 0.60527 (0.60421)	Top-1 acc 67.969 (63.047)	Top-5 acc 82.422 (83.393)	lr 0.00784
Train [75][1910/3239]	Time 0.370 (0.890)	Data Time 0.003 (0.362)	Loss 2.3025 (2.5267)	Entropy 0.60486 (0.60421)	Top-1 acc 68.359 (63.044)	Top-5 acc 89.062 (83.392)	lr 0.00784
Train [75][1920/3239]	Time 0.258 (0.888)	Data Time 0.002 (0.360)	Loss 2.3854 (2.5266)	Entropy 0.60485 (0.60422)	Top-1 acc 64.844 (63.039)	Top-5 acc 86.328 (83.396)	lr 0.00784
Train [75][1930/3239]	Time 0.255 (0.885)	Data Time 0.002 (0.359)	Loss 2.6874 (2.5266)	Entropy 0.60508 (0.60422)	Top-1 acc 60.938 (63.034)	Top-5 acc 78.516 (83.394)	lr 0.00784
Train [75][1940/3239]	Time 0.372 (0.883)	Data Time 0.001 (0.357)	Loss 2.4687 (2.5266)	Entropy 0.60513 (0.60422)	Top-1 acc 63.281 (63.034)	Top-5 acc 82.422 (83.394)	lr 0.00784
Train [75][1950/3239]	Time 0.257 (0.881)	Data Time 0.001 (0.355)	Loss 2.5762 (2.5266)	Entropy 0.60527 (0.60423)	Top-1 acc 60.156 (63.040)	Top-5 acc 82.031 (83.396)	lr 0.00784
Train [75][1960/3239]	Time 0.264 (0.879)	Data Time 0.001 (0.353)	Loss 2.3611 (2.5269)	Entropy 0.60542 (0.60423)	Top-1 acc 64.062 (63.033)	Top-5 acc 86.719 (83.393)	lr 0.00784
Train [75][1970/3239]	Time 0.242 (0.877)	Data Time 0.002 (0.351)	Loss 2.5838 (2.5269)	Entropy 0.60516 (0.60424)	Top-1 acc 60.156 (63.029)	Top-5 acc 83.203 (83.392)	lr 0.00784
Train [75][1980/3239]	Time 0.852 (0.875)	Data Time 0.563 (0.350)	Loss 2.4953 (2.5268)	Entropy 0.60491 (0.60424)	Top-1 acc 60.938 (63.031)	Top-5 acc 84.766 (83.390)	lr 0.00783
Train [75][1990/3239]	Time 0.296 (0.874)	Data Time 0.003 (0.349)	Loss 2.5529 (2.5268)	Entropy 0.60466 (0.60424)	Top-1 acc 61.328 (63.029)	Top-5 acc 85.156 (83.389)	lr 0.00783
Train [75][2000/3239]	Time 0.246 (0.873)	Data Time 0.002 (0.348)	Loss 2.5958 (2.5269)	Entropy 0.60462 (0.60425)	Top-1 acc 64.453 (63.030)	Top-5 acc 81.250 (83.387)	lr 0.00783
Train [75][2010/3239]	Time 0.366 (0.876)	Data Time 0.001 (0.352)	Loss 2.6547 (2.5270)	Entropy 0.60437 (0.60425)	Top-1 acc 57.812 (63.026)	Top-5 acc 81.641 (83.388)	lr 0.00783
Train [75][2020/3239]	Time 0.276 (0.875)	Data Time 0.001 (0.352)	Loss 2.4874 (2.5273)	Entropy 0.60420 (0.60425)	Top-1 acc 60.156 (63.010)	Top-5 acc 84.375 (83.381)	lr 0.00783
Train [75][2030/3239]	Time 0.270 (0.875)	Data Time 0.001 (0.352)	Loss 2.3988 (2.5273)	Entropy 0.60456 (0.60425)	Top-1 acc 66.797 (63.012)	Top-5 acc 87.109 (83.382)	lr 0.00783
Train [75][2040/3239]	Time 0.242 (0.877)	Data Time 0.001 (0.354)	Loss 2.7340 (2.5272)	Entropy 0.60472 (0.60425)	Top-1 acc 56.641 (63.011)	Top-5 acc 82.031 (83.388)	lr 0.00783
Train [75][2050/3239]	Time 0.694 (0.878)	Data Time 0.420 (0.355)	Loss 2.5071 (2.5271)	Entropy 0.60462 (0.60425)	Top-1 acc 60.547 (63.009)	Top-5 acc 82.422 (83.392)	lr 0.00783
Train [75][2060/3239]	Time 0.258 (0.876)	Data Time 0.001 (0.354)	Loss 2.3929 (2.5269)	Entropy 0.60460 (0.60426)	Top-1 acc 65.234 (63.011)	Top-5 acc 87.500 (83.397)	lr 0.00783
Train [75][2070/3239]	Time 2.998 (0.880)	Data Time 2.730 (0.359)	Loss 2.6383 (2.5272)	Entropy 0.60424 (0.60426)	Top-1 acc 59.375 (63.005)	Top-5 acc 80.078 (83.394)	lr 0.00783
Train [75][2080/3239]	Time 0.300 (0.880)	Data Time 0.001 (0.358)	Loss 2.6482 (2.5270)	Entropy 0.60417 (0.60426)	Top-1 acc 58.594 (63.011)	Top-5 acc 82.422 (83.395)	lr 0.00782
Train [75][2090/3239]	Time 0.259 (0.878)	Data Time 0.001 (0.357)	Loss 2.5741 (2.5269)	Entropy 0.60405 (0.60426)	Top-1 acc 61.719 (63.012)	Top-5 acc 84.766 (83.399)	lr 0.00782
Train [75][2100/3239]	Time 0.250 (0.880)	Data Time 0.001 (0.359)	Loss 2.5041 (2.5268)	Entropy 0.60448 (0.60426)	Top-1 acc 64.844 (63.011)	Top-5 acc 84.375 (83.399)	lr 0.00782
Train [75][2110/3239]	Time 0.250 (0.883)	Data Time 0.002 (0.362)	Loss 2.4351 (2.5268)	Entropy 0.60449 (0.60426)	Top-1 acc 64.844 (63.011)	Top-5 acc 84.375 (83.396)	lr 0.00782
Train [75][2120/3239]	Time 0.235 (0.881)	Data Time 0.001 (0.361)	Loss 2.5236 (2.5267)	Entropy 0.60473 (0.60426)	Top-1 acc 63.672 (63.017)	Top-5 acc 83.203 (83.400)	lr 0.00782
Train [75][2130/3239]	Time 0.249 (0.880)	Data Time 0.001 (0.360)	Loss 2.6498 (2.5268)	Entropy 0.60486 (0.60426)	Top-1 acc 60.156 (63.016)	Top-5 acc 79.688 (83.401)	lr 0.00782
Train [75][2140/3239]	Time 0.319 (0.882)	Data Time 0.001 (0.363)	Loss 2.6620 (2.5271)	Entropy 0.60514 (0.60426)	Top-1 acc 63.672 (63.009)	Top-5 acc 79.297 (83.395)	lr 0.00782
Train [75][2150/3239]	Time 0.271 (0.881)	Data Time 0.002 (0.362)	Loss 2.5272 (2.5271)	Entropy 0.60515 (0.60427)	Top-1 acc 61.719 (63.008)	Top-5 acc 83.203 (83.396)	lr 0.00782
Train [75][2160/3239]	Time 0.229 (0.879)	Data Time 0.001 (0.361)	Loss 2.6484 (2.5273)	Entropy 0.60497 (0.60427)	Top-1 acc 61.719 (63.008)	Top-5 acc 80.469 (83.391)	lr 0.00782
Train [75][2170/3239]	Time 0.342 (0.884)	Data Time 0.001 (0.365)	Loss 2.5813 (2.5274)	Entropy 0.60500 (0.60428)	Top-1 acc 64.844 (63.002)	Top-5 acc 80.469 (83.389)	lr 0.00782
Train [75][2180/3239]	Time 0.262 (0.883)	Data Time 0.006 (0.365)	Loss 2.4139 (2.5274)	Entropy 0.60480 (0.60428)	Top-1 acc 67.188 (63.002)	Top-5 acc 82.812 (83.388)	lr 0.00782
Train [75][2190/3239]	Time 0.266 (0.881)	Data Time 0.001 (0.364)	Loss 2.4163 (2.5274)	Entropy 0.60443 (0.60428)	Top-1 acc 65.625 (63.004)	Top-5 acc 85.547 (83.386)	lr 0.00781
Train [75][2200/3239]	Time 0.247 (0.885)	Data Time 0.001 (0.368)	Loss 2.4136 (2.5274)	Entropy 0.60371 (0.60428)	Top-1 acc 66.016 (63.002)	Top-5 acc 87.500 (83.386)	lr 0.00781
Train [75][2210/3239]	Time 0.227 (0.885)	Data Time 0.002 (0.368)	Loss 2.6511 (2.5278)	Entropy 0.60339 (0.60428)	Top-1 acc 59.766 (62.994)	Top-5 acc 79.297 (83.382)	lr 0.00781
Train [75][2220/3239]	Time 2.076 (0.884)	Data Time 1.828 (0.368)	Loss 2.5551 (2.5279)	Entropy 0.60360 (0.60427)	Top-1 acc 59.766 (62.989)	Top-5 acc 84.766 (83.383)	lr 0.00781
Train [75][2230/3239]	Time 0.260 (0.887)	Data Time 0.001 (0.371)	Loss 2.6208 (2.5281)	Entropy 0.60385 (0.60427)	Top-1 acc 59.375 (62.983)	Top-5 acc 82.812 (83.382)	lr 0.00781
Train [75][2240/3239]	Time 0.361 (0.888)	Data Time 0.001 (0.372)	Loss 2.4884 (2.5282)	Entropy 0.60399 (0.60427)	Top-1 acc 63.281 (62.973)	Top-5 acc 82.812 (83.384)	lr 0.00781
Train [75][2250/3239]	Time 0.259 (0.886)	Data Time 0.001 (0.370)	Loss 2.3165 (2.5282)	Entropy 0.60398 (0.60427)	Top-1 acc 67.188 (62.975)	Top-5 acc 87.500 (83.386)	lr 0.00781
Train [75][2260/3239]	Time 0.254 (0.890)	Data Time 0.001 (0.375)	Loss 2.5184 (2.5281)	Entropy 0.60375 (0.60427)	Top-1 acc 63.672 (62.974)	Top-5 acc 84.766 (83.390)	lr 0.00781
Train [75][2270/3239]	Time 0.247 (0.890)	Data Time 0.001 (0.375)	Loss 2.5048 (2.5283)	Entropy 0.60353 (0.60426)	Top-1 acc 61.719 (62.967)	Top-5 acc 85.938 (83.386)	lr 0.00781
Train [75][2280/3239]	Time 0.256 (0.888)	Data Time 0.001 (0.373)	Loss 2.4546 (2.5283)	Entropy 0.60353 (0.60426)	Top-1 acc 64.062 (62.970)	Top-5 acc 83.594 (83.386)	lr 0.00781
Train [75][2290/3239]	Time 0.361 (0.886)	Data Time 0.094 (0.372)	Loss 2.5961 (2.5284)	Entropy 0.60347 (0.60426)	Top-1 acc 62.891 (62.966)	Top-5 acc 81.641 (83.385)	lr 0.00781
Train [75][2300/3239]	Time 0.285 (0.887)	Data Time 0.001 (0.373)	Loss 2.6091 (2.5282)	Entropy 0.60356 (0.60425)	Top-1 acc 60.938 (62.969)	Top-5 acc 81.250 (83.388)	lr 0.00780
Train [75][2310/3239]	Time 0.245 (0.885)	Data Time 0.001 (0.372)	Loss 2.3832 (2.5282)	Entropy 0.60355 (0.60425)	Top-1 acc 67.188 (62.970)	Top-5 acc 83.984 (83.384)	lr 0.00780
Train [75][2320/3239]	Time 0.246 (0.883)	Data Time 0.001 (0.370)	Loss 2.3881 (2.5280)	Entropy 0.60347 (0.60425)	Top-1 acc 63.672 (62.974)	Top-5 acc 83.984 (83.387)	lr 0.00780
Train [75][2330/3239]	Time 0.341 (0.885)	Data Time 0.001 (0.372)	Loss 2.4568 (2.5278)	Entropy 0.60364 (0.60424)	Top-1 acc 65.625 (62.982)	Top-5 acc 83.594 (83.388)	lr 0.00780
Train [75][2340/3239]	Time 0.243 (0.885)	Data Time 0.001 (0.373)	Loss 2.5542 (2.5277)	Entropy 0.60367 (0.60424)	Top-1 acc 61.719 (62.984)	Top-5 acc 83.203 (83.390)	lr 0.00780
Train [75][2350/3239]	Time 0.248 (0.885)	Data Time 0.001 (0.373)	Loss 2.4602 (2.5275)	Entropy 0.60345 (0.60424)	Top-1 acc 62.500 (62.988)	Top-5 acc 85.156 (83.394)	lr 0.00780
Train [75][2360/3239]	Time 0.226 (0.888)	Data Time 0.001 (0.376)	Loss 2.6478 (2.5276)	Entropy 0.60380 (0.60424)	Top-1 acc 60.938 (62.986)	Top-5 acc 80.078 (83.391)	lr 0.00780
Train [75][2370/3239]	Time 0.244 (0.889)	Data Time 0.001 (0.378)	Loss 2.6128 (2.5279)	Entropy 0.60393 (0.60423)	Top-1 acc 62.500 (62.980)	Top-5 acc 80.859 (83.385)	lr 0.00780
Train [75][2380/3239]	Time 0.248 (0.888)	Data Time 0.001 (0.377)	Loss 2.6466 (2.5283)	Entropy 0.60404 (0.60423)	Top-1 acc 57.812 (62.970)	Top-5 acc 80.469 (83.378)	lr 0.00780
Train [75][2390/3239]	Time 0.265 (0.891)	Data Time 0.001 (0.381)	Loss 2.4664 (2.5286)	Entropy 0.60388 (0.60423)	Top-1 acc 65.234 (62.965)	Top-5 acc 86.328 (83.371)	lr 0.00780
Train [75][2400/3239]	Time 0.338 (0.892)	Data Time 0.001 (0.382)	Loss 2.4006 (2.5286)	Entropy 0.60412 (0.60423)	Top-1 acc 65.625 (62.968)	Top-5 acc 84.766 (83.373)	lr 0.00779
Train [75][2410/3239]	Time 0.229 (0.890)	Data Time 0.001 (0.380)	Loss 2.7240 (2.5288)	Entropy 0.60418 (0.60423)	Top-1 acc 56.250 (62.964)	Top-5 acc 80.078 (83.373)	lr 0.00779
Train [75][2420/3239]	Time 0.246 (0.892)	Data Time 0.002 (0.382)	Loss 2.5358 (2.5287)	Entropy 0.60411 (0.60423)	Top-1 acc 62.109 (62.965)	Top-5 acc 83.203 (83.377)	lr 0.00779
Train [75][2430/3239]	Time 0.259 (0.895)	Data Time 0.002 (0.386)	Loss 2.4442 (2.5286)	Entropy 0.60392 (0.60423)	Top-1 acc 64.844 (62.965)	Top-5 acc 83.203 (83.376)	lr 0.00779
Train [75][2440/3239]	Time 0.225 (0.893)	Data Time 0.001 (0.385)	Loss 2.6865 (2.5287)	Entropy 0.60390 (0.60423)	Top-1 acc 57.422 (62.965)	Top-5 acc 80.859 (83.371)	lr 0.00779
Train [75][2450/3239]	Time 1.956 (0.893)	Data Time 1.720 (0.385)	Loss 2.7091 (2.5289)	Entropy 0.60410 (0.60423)	Top-1 acc 55.469 (62.959)	Top-5 acc 84.375 (83.371)	lr 0.00779
Train [75][2460/3239]	Time 0.250 (0.896)	Data Time 0.001 (0.387)	Loss 2.4535 (2.5289)	Entropy 0.60433 (0.60423)	Top-1 acc 64.453 (62.961)	Top-5 acc 83.594 (83.369)	lr 0.00779
Train [75][2470/3239]	Time 0.288 (0.894)	Data Time 0.001 (0.386)	Loss 2.5546 (2.5287)	Entropy 0.60459 (0.60423)	Top-1 acc 58.594 (62.964)	Top-5 acc 83.203 (83.373)	lr 0.00779
Train [75][2480/3239]	Time 0.313 (0.892)	Data Time 0.004 (0.384)	Loss 2.6658 (2.5288)	Entropy 0.60433 (0.60423)	Top-1 acc 59.766 (62.963)	Top-5 acc 80.469 (83.371)	lr 0.00779
Train [75][2490/3239]	Time 0.265 (0.893)	Data Time 0.001 (0.386)	Loss 2.5324 (2.5287)	Entropy 0.60403 (0.60423)	Top-1 acc 61.719 (62.965)	Top-5 acc 84.375 (83.369)	lr 0.00779
Train [75][2500/3239]	Time 0.230 (0.892)	Data Time 0.001 (0.385)	Loss 2.7232 (2.5284)	Entropy 0.60411 (0.60423)	Top-1 acc 55.859 (62.972)	Top-5 acc 78.906 (83.376)	lr 0.00779
Train [75][2510/3239]	Time 0.258 (0.890)	Data Time 0.001 (0.383)	Loss 2.4071 (2.5285)	Entropy 0.60362 (0.60423)	Top-1 acc 66.016 (62.969)	Top-5 acc 84.766 (83.374)	lr 0.00778
Train [75][2520/3239]	Time 0.252 (0.891)	Data Time 0.001 (0.384)	Loss 2.6566 (2.5285)	Entropy 0.60324 (0.60423)	Top-1 acc 61.328 (62.963)	Top-5 acc 80.078 (83.373)	lr 0.00778
Train [75][2530/3239]	Time 0.236 (0.889)	Data Time 0.001 (0.383)	Loss 2.3967 (2.5287)	Entropy 0.60336 (0.60422)	Top-1 acc 67.969 (62.960)	Top-5 acc 85.156 (83.371)	lr 0.00778
Train [75][2540/3239]	Time 0.243 (0.888)	Data Time 0.001 (0.382)	Loss 2.7299 (2.5287)	Entropy 0.60342 (0.60422)	Top-1 acc 59.375 (62.959)	Top-5 acc 80.469 (83.369)	lr 0.00778
Train [75][2550/3239]	Time 0.246 (0.889)	Data Time 0.001 (0.383)	Loss 2.6359 (2.5288)	Entropy 0.60347 (0.60422)	Top-1 acc 59.766 (62.958)	Top-5 acc 80.469 (83.367)	lr 0.00778
Train [75][2560/3239]	Time 0.663 (0.907)	Data Time 0.006 (0.382)	Loss 2.3946 (2.5288)	Entropy 0.60328 (0.60421)	Top-1 acc 67.188 (62.960)	Top-5 acc 86.719 (83.370)	lr 0.00778
Train [75][2570/3239]	Time 0.288 (0.905)	Data Time 0.002 (0.380)	Loss 2.9363 (2.5289)	Entropy 0.60349 (0.60421)	Top-1 acc 52.734 (62.953)	Top-5 acc 78.906 (83.366)	lr 0.00778
Train [75][2580/3239]	Time 0.267 (0.904)	Data Time 0.002 (0.379)	Loss 2.5436 (2.5289)	Entropy 0.60355 (0.60421)	Top-1 acc 59.375 (62.954)	Top-5 acc 82.422 (83.365)	lr 0.00778
Train [75][2590/3239]	Time 0.264 (0.902)	Data Time 0.002 (0.377)	Loss 2.3222 (2.5291)	Entropy 0.60383 (0.60420)	Top-1 acc 68.359 (62.952)	Top-5 acc 84.766 (83.361)	lr 0.00778
Train [75][2600/3239]	Time 0.256 (0.900)	Data Time 0.002 (0.376)	Loss 2.4787 (2.5290)	Entropy 0.60410 (0.60420)	Top-1 acc 65.234 (62.953)	Top-5 acc 84.375 (83.366)	lr 0.00778
Train [75][2610/3239]	Time 0.257 (0.899)	Data Time 0.002 (0.374)	Loss 2.5075 (2.5289)	Entropy 0.60449 (0.60420)	Top-1 acc 62.891 (62.956)	Top-5 acc 85.938 (83.367)	lr 0.00778
Train [75][2620/3239]	Time 0.277 (0.897)	Data Time 0.002 (0.373)	Loss 2.3306 (2.5289)	Entropy 0.60444 (0.60420)	Top-1 acc 67.188 (62.956)	Top-5 acc 87.109 (83.368)	lr 0.00777
Train [75][2630/3239]	Time 0.253 (0.896)	Data Time 0.001 (0.372)	Loss 2.5946 (2.5289)	Entropy 0.60455 (0.60421)	Top-1 acc 62.109 (62.957)	Top-5 acc 82.812 (83.368)	lr 0.00777
Train [75][2640/3239]	Time 0.353 (0.895)	Data Time 0.001 (0.372)	Loss 2.5870 (2.5287)	Entropy 0.60444 (0.60421)	Top-1 acc 59.375 (62.959)	Top-5 acc 80.859 (83.370)	lr 0.00777
Train [75][2650/3239]	Time 0.302 (0.895)	Data Time 0.001 (0.371)	Loss 2.5817 (2.5288)	Entropy 0.60444 (0.60421)	Top-1 acc 59.766 (62.960)	Top-5 acc 85.547 (83.367)	lr 0.00777
Train [75][2660/3239]	Time 0.265 (0.897)	Data Time 0.001 (0.373)	Loss 2.6920 (2.5285)	Entropy 0.60454 (0.60421)	Top-1 acc 56.250 (62.962)	Top-5 acc 82.031 (83.371)	lr 0.00777
Train [75][2670/3239]	Time 0.315 (0.897)	Data Time 0.001 (0.373)	Loss 2.5249 (2.5286)	Entropy 0.60430 (0.60421)	Top-1 acc 61.719 (62.958)	Top-5 acc 84.766 (83.371)	lr 0.00777
Train [75][2680/3239]	Time 0.642 (0.896)	Data Time 0.368 (0.373)	Loss 2.6348 (2.5288)	Entropy 0.60442 (0.60421)	Top-1 acc 62.891 (62.956)	Top-5 acc 80.469 (83.368)	lr 0.00777
Train [75][2690/3239]	Time 0.312 (0.898)	Data Time 0.001 (0.375)	Loss 2.5608 (2.5286)	Entropy 0.60469 (0.60421)	Top-1 acc 61.328 (62.960)	Top-5 acc 83.984 (83.373)	lr 0.00777
Train [75][2700/3239]	Time 0.250 (0.898)	Data Time 0.001 (0.376)	Loss 2.3919 (2.5285)	Entropy 0.60450 (0.60421)	Top-1 acc 65.234 (62.963)	Top-5 acc 87.500 (83.375)	lr 0.00777
Train [75][2710/3239]	Time 0.274 (0.899)	Data Time 0.001 (0.376)	Loss 2.3632 (2.5285)	Entropy 0.60476 (0.60421)	Top-1 acc 67.578 (62.963)	Top-5 acc 85.938 (83.372)	lr 0.00777
Train [75][2720/3239]	Time 2.657 (0.898)	Data Time 2.270 (0.376)	Loss 2.4881 (2.5284)	Entropy 0.60458 (0.60422)	Top-1 acc 66.016 (62.968)	Top-5 acc 81.641 (83.375)	lr 0.00777
Train [75][2730/3239]	Time 0.240 (0.901)	Data Time 0.001 (0.379)	Loss 2.5181 (2.5285)	Entropy 0.60459 (0.60422)	Top-1 acc 60.938 (62.964)	Top-5 acc 84.766 (83.374)	lr 0.00776
Train [75][2740/3239]	Time 0.998 (0.901)	Data Time 0.743 (0.379)	Loss 2.5480 (2.5283)	Entropy 0.60447 (0.60422)	Top-1 acc 61.719 (62.966)	Top-5 acc 84.375 (83.379)	lr 0.00776
Train [75][2750/3239]	Time 0.256 (0.899)	Data Time 0.001 (0.378)	Loss 2.6418 (2.5281)	Entropy 0.60446 (0.60422)	Top-1 acc 59.375 (62.967)	Top-5 acc 83.203 (83.384)	lr 0.00776
Train [75][2760/3239]	Time 0.250 (0.904)	Data Time 0.001 (0.382)	Loss 2.5999 (2.5283)	Entropy 0.60441 (0.60422)	Top-1 acc 56.641 (62.961)	Top-5 acc 80.859 (83.383)	lr 0.00776
Train [75][2770/3239]	Time 0.251 (0.903)	Data Time 0.001 (0.382)	Loss 2.4925 (2.5284)	Entropy 0.60424 (0.60422)	Top-1 acc 65.234 (62.959)	Top-5 acc 82.812 (83.382)	lr 0.00776
Train [75][2780/3239]	Time 0.250 (0.901)	Data Time 0.002 (0.381)	Loss 2.4989 (2.5283)	Entropy 0.60416 (0.60422)	Top-1 acc 66.406 (62.960)	Top-5 acc 81.250 (83.385)	lr 0.00776
Train [75][2790/3239]	Time 2.588 (0.905)	Data Time 2.224 (0.385)	Loss 2.3517 (2.5282)	Entropy 0.60406 (0.60422)	Top-1 acc 69.531 (62.962)	Top-5 acc 86.719 (83.384)	lr 0.00776
Train [75][2800/3239]	Time 2.575 (0.905)	Data Time 2.289 (0.384)	Loss 2.3779 (2.5282)	Entropy 0.60422 (0.60422)	Top-1 acc 65.625 (62.962)	Top-5 acc 87.891 (83.385)	lr 0.00776
Train [75][2810/3239]	Time 0.265 (0.903)	Data Time 0.002 (0.383)	Loss 2.7206 (2.5281)	Entropy 0.60394 (0.60422)	Top-1 acc 61.328 (62.964)	Top-5 acc 79.297 (83.385)	lr 0.00776
Train [75][2820/3239]	Time 0.314 (0.907)	Data Time 0.001 (0.388)	Loss 2.5550 (2.5281)	Entropy 0.60391 (0.60422)	Top-1 acc 64.062 (62.964)	Top-5 acc 84.375 (83.384)	lr 0.00776
Train [75][2830/3239]	Time 0.250 (0.907)	Data Time 0.001 (0.387)	Loss 2.5163 (2.5281)	Entropy 0.60403 (0.60422)	Top-1 acc 63.281 (62.966)	Top-5 acc 85.156 (83.382)	lr 0.00775
Train [75][2840/3239]	Time 0.247 (0.906)	Data Time 0.001 (0.387)	Loss 2.4978 (2.5278)	Entropy 0.60383 (0.60422)	Top-1 acc 61.328 (62.971)	Top-5 acc 85.547 (83.387)	lr 0.00775
Train [75][2850/3239]	Time 0.233 (0.906)	Data Time 0.001 (0.387)	Loss 2.5432 (2.5278)	Entropy 0.60408 (0.60422)	Top-1 acc 63.281 (62.972)	Top-5 acc 80.859 (83.386)	lr 0.00775
Train [75][2860/3239]	Time 0.252 (0.908)	Data Time 0.002 (0.390)	Loss 2.5713 (2.5276)	Entropy 0.60419 (0.60422)	Top-1 acc 61.719 (62.976)	Top-5 acc 78.516 (83.384)	lr 0.00775
Train [75][2870/3239]	Time 0.248 (0.908)	Data Time 0.001 (0.390)	Loss 2.7258 (2.5276)	Entropy 0.60430 (0.60422)	Top-1 acc 58.594 (62.979)	Top-5 acc 82.422 (83.384)	lr 0.00775
Train [75][2880/3239]	Time 0.370 (0.906)	Data Time 0.001 (0.388)	Loss 2.4299 (2.5276)	Entropy 0.60418 (0.60422)	Top-1 acc 66.406 (62.981)	Top-5 acc 86.328 (83.385)	lr 0.00775
Train [75][2890/3239]	Time 0.302 (0.909)	Data Time 0.001 (0.391)	Loss 2.2252 (2.5275)	Entropy 0.60422 (0.60422)	Top-1 acc 72.656 (62.985)	Top-5 acc 88.672 (83.386)	lr 0.00775
Train [75][2900/3239]	Time 0.235 (0.909)	Data Time 0.002 (0.392)	Loss 2.4596 (2.5275)	Entropy 0.60407 (0.60421)	Top-1 acc 60.547 (62.979)	Top-5 acc 82.812 (83.387)	lr 0.00775
Train [75][2910/3239]	Time 0.241 (0.908)	Data Time 0.002 (0.390)	Loss 2.6484 (2.5277)	Entropy 0.60399 (0.60421)	Top-1 acc 59.375 (62.978)	Top-5 acc 79.297 (83.385)	lr 0.00775
Train [75][2920/3239]	Time 0.232 (0.911)	Data Time 0.001 (0.394)	Loss 2.5484 (2.5278)	Entropy 0.60401 (0.60421)	Top-1 acc 63.281 (62.978)	Top-5 acc 82.422 (83.385)	lr 0.00775
Train [75][2930/3239]	Time 0.248 (0.911)	Data Time 0.001 (0.394)	Loss 2.4926 (2.5278)	Entropy 0.60396 (0.60421)	Top-1 acc 61.328 (62.980)	Top-5 acc 83.203 (83.382)	lr 0.00775
Train [75][2940/3239]	Time 0.241 (0.911)	Data Time 0.001 (0.394)	Loss 2.5636 (2.5278)	Entropy 0.60387 (0.60421)	Top-1 acc 62.109 (62.978)	Top-5 acc 81.641 (83.382)	lr 0.00774
Train [75][2950/3239]	Time 0.368 (0.913)	Data Time 0.001 (0.397)	Loss 2.3951 (2.5277)	Entropy 0.60353 (0.60421)	Top-1 acc 64.844 (62.979)	Top-5 acc 84.766 (83.386)	lr 0.00774
Train [75][2960/3239]	Time 0.266 (0.914)	Data Time 0.002 (0.398)	Loss 2.5079 (2.5278)	Entropy 0.60378 (0.60421)	Top-1 acc 60.547 (62.977)	Top-5 acc 84.375 (83.383)	lr 0.00774
Train [75][2970/3239]	Time 0.245 (0.914)	Data Time 0.001 (0.398)	Loss 2.3632 (2.5279)	Entropy 0.60385 (0.60421)	Top-1 acc 67.188 (62.977)	Top-5 acc 85.938 (83.381)	lr 0.00774
Train [75][2980/3239]	Time 0.253 (0.916)	Data Time 0.002 (0.400)	Loss 2.7744 (2.5280)	Entropy 0.60389 (0.60421)	Top-1 acc 53.516 (62.970)	Top-5 acc 79.297 (83.378)	lr 0.00774
Train [75][2990/3239]	Time 8.851 (0.917)	Data Time 8.539 (0.402)	Loss 2.6015 (2.5281)	Entropy 0.60388 (0.60421)	Top-1 acc 58.594 (62.970)	Top-5 acc 83.203 (83.376)	lr 0.00774
Train [75][3000/3239]	Time 1.487 (0.916)	Data Time 1.247 (0.401)	Loss 2.5138 (2.5280)	Entropy 0.60408 (0.60420)	Top-1 acc 66.016 (62.976)	Top-5 acc 81.250 (83.376)	lr 0.00774
Train [75][3010/3239]	Time 0.243 (0.916)	Data Time 0.001 (0.402)	Loss 2.4300 (2.5281)	Entropy 0.60391 (0.60420)	Top-1 acc 66.797 (62.976)	Top-5 acc 84.375 (83.375)	lr 0.00774
Train [75][3020/3239]	Time 2.060 (0.918)	Data Time 1.805 (0.403)	Loss 2.3887 (2.5281)	Entropy 0.60376 (0.60420)	Top-1 acc 64.453 (62.974)	Top-5 acc 86.719 (83.373)	lr 0.00774
Train [75][3030/3239]	Time 0.237 (0.918)	Data Time 0.001 (0.404)	Loss 2.2291 (2.5280)	Entropy 0.60378 (0.60420)	Top-1 acc 68.750 (62.976)	Top-5 acc 89.453 (83.375)	lr 0.00774
Train [75][3040/3239]	Time 0.376 (0.918)	Data Time 0.001 (0.404)	Loss 2.3850 (2.5279)	Entropy 0.60367 (0.60420)	Top-1 acc 66.406 (62.977)	Top-5 acc 86.328 (83.376)	lr 0.00774
Train [75][3050/3239]	Time 0.248 (0.920)	Data Time 0.001 (0.406)	Loss 2.7587 (2.5278)	Entropy 0.60389 (0.60420)	Top-1 acc 54.688 (62.980)	Top-5 acc 80.469 (83.375)	lr 0.00773
Train [75][3060/3239]	Time 0.252 (0.920)	Data Time 0.001 (0.407)	Loss 2.4303 (2.5280)	Entropy 0.60374 (0.60420)	Top-1 acc 66.016 (62.978)	Top-5 acc 83.984 (83.374)	lr 0.00773
Train [75][3070/3239]	Time 0.235 (0.920)	Data Time 0.001 (0.407)	Loss 2.5579 (2.5280)	Entropy 0.60387 (0.60420)	Top-1 acc 63.672 (62.977)	Top-5 acc 82.812 (83.372)	lr 0.00773
Train [75][3080/3239]	Time 0.258 (0.923)	Data Time 0.001 (0.410)	Loss 2.3998 (2.5280)	Entropy 0.60379 (0.60420)	Top-1 acc 65.625 (62.978)	Top-5 acc 85.938 (83.374)	lr 0.00773
Train [75][3090/3239]	Time 0.274 (0.922)	Data Time 0.001 (0.409)	Loss 2.6586 (2.5281)	Entropy 0.60396 (0.60419)	Top-1 acc 62.109 (62.978)	Top-5 acc 80.469 (83.369)	lr 0.00773
Train [75][3100/3239]	Time 0.258 (0.923)	Data Time 0.001 (0.411)	Loss 2.6724 (2.5282)	Entropy 0.60400 (0.60419)	Top-1 acc 59.766 (62.975)	Top-5 acc 79.297 (83.367)	lr 0.00773
Train [75][3110/3239]	Time 5.330 (0.926)	Data Time 4.966 (0.413)	Loss 2.3256 (2.5282)	Entropy 0.60335 (0.60419)	Top-1 acc 68.359 (62.974)	Top-5 acc 88.281 (83.368)	lr 0.00773
Train [75][3120/3239]	Time 0.252 (0.925)	Data Time 0.001 (0.413)	Loss 2.6535 (2.5284)	Entropy 0.60353 (0.60419)	Top-1 acc 62.109 (62.969)	Top-5 acc 80.469 (83.365)	lr 0.00773
Train [75][3130/3239]	Time 0.253 (0.926)	Data Time 0.001 (0.414)	Loss 2.3936 (2.5284)	Entropy 0.60356 (0.60419)	Top-1 acc 64.453 (62.968)	Top-5 acc 87.500 (83.363)	lr 0.00773
Train [75][3140/3239]	Time 0.248 (0.926)	Data Time 0.002 (0.414)	Loss 2.8139 (2.5286)	Entropy 0.60301 (0.60418)	Top-1 acc 59.375 (62.964)	Top-5 acc 76.953 (83.360)	lr 0.00773
Train [75][3150/3239]	Time 5.587 (0.928)	Data Time 5.303 (0.417)	Loss 2.5807 (2.5284)	Entropy 0.60299 (0.60418)	Top-1 acc 59.375 (62.968)	Top-5 acc 81.641 (83.364)	lr 0.00772
Train [75][3160/3239]	Time 1.821 (0.928)	Data Time 1.566 (0.417)	Loss 2.6561 (2.5284)	Entropy 0.60297 (0.60418)	Top-1 acc 64.062 (62.974)	Top-5 acc 82.031 (83.367)	lr 0.00772
Train [75][3170/3239]	Time 0.245 (0.929)	Data Time 0.001 (0.418)	Loss 2.7430 (2.5285)	Entropy 0.60283 (0.60417)	Top-1 acc 58.984 (62.968)	Top-5 acc 81.641 (83.363)	lr 0.00772
Train [75][3180/3239]	Time 0.240 (0.930)	Data Time 0.000 (0.420)	Loss 2.5613 (2.5286)	Entropy 0.60278 (0.60417)	Top-1 acc 62.500 (62.963)	Top-5 acc 83.203 (83.364)	lr 0.00772
Train [75][3190/3239]	Time 0.254 (0.930)	Data Time 0.000 (0.420)	Loss 2.5226 (2.5284)	Entropy 0.60279 (0.60417)	Top-1 acc 66.016 (62.965)	Top-5 acc 82.422 (83.366)	lr 0.00772
Train [75][3200/3239]	Time 0.260 (0.930)	Data Time 0.000 (0.419)	Loss 2.4813 (2.5284)	Entropy 0.60302 (0.60416)	Top-1 acc 63.281 (62.967)	Top-5 acc 87.109 (83.365)	lr 0.00772
Train [75][3210/3239]	Time 0.221 (0.932)	Data Time 0.000 (0.422)	Loss 2.7521 (2.5286)	Entropy 0.60323 (0.60416)	Top-1 acc 59.375 (62.962)	Top-5 acc 80.859 (83.363)	lr 0.00772
Train [75][3220/3239]	Time 0.342 (0.947)	Data Time 0.000 (0.421)	Loss 2.6187 (2.5288)	Entropy 0.60321 (0.60415)	Top-1 acc 62.891 (62.959)	Top-5 acc 82.812 (83.360)	lr 0.00772
Train [75][3230/3239]	Time 0.250 (0.945)	Data Time 0.000 (0.420)	Loss 2.3108 (2.5286)	Entropy 0.60315 (0.60415)	Top-1 acc 69.141 (62.961)	Top-5 acc 89.453 (83.363)	lr 0.00772
Train [75][3239/3239]	Time 1.046 (0.944)	Data Time 0.000 (0.419)	Loss 2.7785 (2.5286)	Entropy 0.60326 (0.60415)	Top-1 acc 62.963 (62.964)	Top-5 acc 80.247 (83.364)	lr 0.00772
==========Valid [75/120]	loss 1.320	top-1 acc 69.531 (69.766)	top-5 acc 88.795	Train top-1 62.964	top-5 83.364	Entropy 0.60326	Latency-None: 0.000ms	Flops: 539.00M
Train [76][0/3239]	Time 45.488 (45.488)	Data Time 44.662 (44.662)	Loss 2.3575 (2.3575)	Entropy 0.60325 (0.60325)	Top-1 acc 68.750 (68.750)	Top-5 acc 86.328 (86.328)	lr 0.00772
Train [76][10/3239]	Time 0.341 (5.053)	Data Time 0.001 (4.490)	Loss 2.5429 (2.4740)	Entropy 0.60298 (0.60313)	Top-1 acc 60.938 (64.382)	Top-5 acc 82.422 (84.446)	lr 0.00772
Train [76][20/3239]	Time 0.231 (2.851)	Data Time 0.001 (2.353)	Loss 2.5537 (2.4937)	Entropy 0.60309 (0.60306)	Top-1 acc 60.938 (63.653)	Top-5 acc 82.031 (84.115)	lr 0.00771
Train [76][30/3239]	Time 0.282 (2.067)	Data Time 0.001 (1.594)	Loss 2.5505 (2.4933)	Entropy 0.60301 (0.60307)	Top-1 acc 60.938 (63.584)	Top-5 acc 83.594 (84.060)	lr 0.00771
Train [76][40/3239]	Time 0.234 (1.743)	Data Time 0.001 (1.279)	Loss 2.5729 (2.5012)	Entropy 0.60313 (0.60304)	Top-1 acc 61.719 (63.453)	Top-5 acc 82.422 (83.994)	lr 0.00771
Train [76][50/3239]	Time 0.302 (1.478)	Data Time 0.003 (1.029)	Loss 2.2729 (2.4900)	Entropy 0.60259 (0.60300)	Top-1 acc 70.703 (63.664)	Top-5 acc 88.672 (84.275)	lr 0.00771
Train [76][60/3239]	Time 0.251 (1.313)	Data Time 0.001 (0.860)	Loss 2.3923 (2.4856)	Entropy 0.60246 (0.60292)	Top-1 acc 67.578 (63.800)	Top-5 acc 84.766 (84.253)	lr 0.00771
Train [76][70/3239]	Time 0.263 (1.247)	Data Time 0.001 (0.794)	Loss 2.6963 (2.4863)	Entropy 0.60256 (0.60285)	Top-1 acc 61.328 (63.952)	Top-5 acc 79.688 (84.193)	lr 0.00771
Train [76][80/3239]	Time 0.240 (1.149)	Data Time 0.001 (0.696)	Loss 2.4818 (2.4871)	Entropy 0.60269 (0.60282)	Top-1 acc 64.453 (63.749)	Top-5 acc 83.984 (84.197)	lr 0.00771
Train [76][90/3239]	Time 0.236 (1.067)	Data Time 0.001 (0.620)	Loss 2.4707 (2.4890)	Entropy 0.60227 (0.60278)	Top-1 acc 64.062 (63.620)	Top-5 acc 85.938 (84.195)	lr 0.00771
Train [76][100/3239]	Time 0.329 (1.054)	Data Time 0.001 (0.608)	Loss 2.5085 (2.4917)	Entropy 0.60222 (0.60272)	Top-1 acc 60.156 (63.645)	Top-5 acc 83.594 (84.108)	lr 0.00771
Train [76][110/3239]	Time 0.227 (1.008)	Data Time 0.001 (0.566)	Loss 2.6160 (2.4961)	Entropy 0.60249 (0.60269)	Top-1 acc 64.062 (63.450)	Top-5 acc 81.641 (84.044)	lr 0.00771
Train [76][120/3239]	Time 0.232 (0.958)	Data Time 0.001 (0.520)	Loss 2.5493 (2.4982)	Entropy 0.60260 (0.60268)	Top-1 acc 57.812 (63.427)	Top-5 acc 83.984 (83.913)	lr 0.00771
Train [76][130/3239]	Time 0.259 (0.938)	Data Time 0.001 (0.501)	Loss 2.3392 (2.4962)	Entropy 0.60225 (0.60267)	Top-1 acc 66.016 (63.406)	Top-5 acc 90.234 (83.984)	lr 0.00770
Train [76][140/3239]	Time 0.247 (0.943)	Data Time 0.001 (0.506)	Loss 2.5412 (2.4975)	Entropy 0.60187 (0.60263)	Top-1 acc 63.281 (63.403)	Top-5 acc 82.812 (83.965)	lr 0.00770
Train [76][150/3239]	Time 0.238 (0.907)	Data Time 0.001 (0.473)	Loss 2.3147 (2.4957)	Entropy 0.60196 (0.60258)	Top-1 acc 72.266 (63.468)	Top-5 acc 86.719 (84.008)	lr 0.00770
Train [76][160/3239]	Time 0.243 (0.878)	Data Time 0.001 (0.443)	Loss 2.4352 (2.4951)	Entropy 0.60227 (0.60255)	Top-1 acc 64.844 (63.502)	Top-5 acc 84.766 (83.975)	lr 0.00770
Train [76][170/3239]	Time 0.341 (0.907)	Data Time 0.001 (0.472)	Loss 2.6100 (2.4940)	Entropy 0.60214 (0.60252)	Top-1 acc 61.719 (63.537)	Top-5 acc 80.859 (83.994)	lr 0.00770
Train [76][180/3239]	Time 0.228 (0.880)	Data Time 0.001 (0.446)	Loss 2.8332 (2.4942)	Entropy 0.60222 (0.60250)	Top-1 acc 56.641 (63.570)	Top-5 acc 78.125 (84.015)	lr 0.00770
Train [76][190/3239]	Time 0.237 (0.856)	Data Time 0.001 (0.423)	Loss 2.5078 (2.4940)	Entropy 0.60212 (0.60248)	Top-1 acc 63.281 (63.541)	Top-5 acc 83.594 (84.021)	lr 0.00770
Train [76][200/3239]	Time 0.236 (0.887)	Data Time 0.001 (0.454)	Loss 2.4099 (2.4931)	Entropy 0.60178 (0.60246)	Top-1 acc 67.578 (63.561)	Top-5 acc 83.984 (84.033)	lr 0.00770
Train [76][210/3239]	Time 0.233 (0.864)	Data Time 0.002 (0.433)	Loss 2.4748 (2.4904)	Entropy 0.60206 (0.60244)	Top-1 acc 63.281 (63.661)	Top-5 acc 82.812 (84.077)	lr 0.00770
Train [76][220/3239]	Time 0.272 (0.845)	Data Time 0.001 (0.413)	Loss 2.8034 (2.4936)	Entropy 0.60196 (0.60242)	Top-1 acc 57.031 (63.591)	Top-5 acc 76.953 (83.995)	lr 0.00770
Train [76][230/3239]	Time 0.233 (0.835)	Data Time 0.001 (0.404)	Loss 2.5546 (2.4976)	Entropy 0.60227 (0.60240)	Top-1 acc 60.547 (63.526)	Top-5 acc 81.641 (83.940)	lr 0.00770
Train [76][240/3239]	Time 0.258 (0.850)	Data Time 0.002 (0.418)	Loss 2.5583 (2.5013)	Entropy 0.60215 (0.60239)	Top-1 acc 59.766 (63.463)	Top-5 acc 83.594 (83.876)	lr 0.00769
Train [76][250/3239]	Time 0.284 (0.834)	Data Time 0.001 (0.401)	Loss 2.3794 (2.5029)	Entropy 0.60194 (0.60238)	Top-1 acc 67.969 (63.485)	Top-5 acc 88.281 (83.852)	lr 0.00769
Train [76][260/3239]	Time 0.368 (0.821)	Data Time 0.001 (0.386)	Loss 2.4377 (2.5032)	Entropy 0.60178 (0.60236)	Top-1 acc 64.844 (63.422)	Top-5 acc 85.547 (83.845)	lr 0.00769
Train [76][270/3239]	Time 0.216 (0.832)	Data Time 0.001 (0.398)	Loss 2.6247 (2.5032)	Entropy 0.60168 (0.60234)	Top-1 acc 61.719 (63.425)	Top-5 acc 78.906 (83.829)	lr 0.00769
Train [76][280/3239]	Time 0.263 (0.817)	Data Time 0.003 (0.384)	Loss 2.7025 (2.5038)	Entropy 0.60163 (0.60232)	Top-1 acc 58.984 (63.416)	Top-5 acc 78.906 (83.799)	lr 0.00769
Train [76][290/3239]	Time 0.285 (0.807)	Data Time 0.001 (0.371)	Loss 2.6848 (2.5057)	Entropy 0.60189 (0.60230)	Top-1 acc 61.719 (63.393)	Top-5 acc 80.078 (83.753)	lr 0.00769
Train [76][300/3239]	Time 0.270 (0.810)	Data Time 0.002 (0.374)	Loss 2.4920 (2.5052)	Entropy 0.60168 (0.60228)	Top-1 acc 63.281 (63.424)	Top-5 acc 84.766 (83.759)	lr 0.00769
Train [76][310/3239]	Time 0.236 (0.797)	Data Time 0.001 (0.362)	Loss 2.5090 (2.5051)	Entropy 0.60148 (0.60225)	Top-1 acc 64.453 (63.443)	Top-5 acc 86.328 (83.786)	lr 0.00769
Train [76][320/3239]	Time 0.270 (0.787)	Data Time 0.001 (0.351)	Loss 2.5906 (2.5051)	Entropy 0.60156 (0.60223)	Top-1 acc 64.453 (63.456)	Top-5 acc 80.469 (83.774)	lr 0.00769
Train [76][330/3239]	Time 0.317 (0.807)	Data Time 0.001 (0.371)	Loss 2.4840 (2.5043)	Entropy 0.60182 (0.60221)	Top-1 acc 64.062 (63.482)	Top-5 acc 83.984 (83.785)	lr 0.00769
Train [76][340/3239]	Time 0.245 (0.795)	Data Time 0.001 (0.360)	Loss 2.6015 (2.5057)	Entropy 0.60158 (0.60220)	Top-1 acc 58.984 (63.437)	Top-5 acc 81.250 (83.755)	lr 0.00768
Train [76][350/3239]	Time 0.233 (0.784)	Data Time 0.001 (0.350)	Loss 2.4498 (2.5063)	Entropy 0.60129 (0.60218)	Top-1 acc 63.672 (63.421)	Top-5 acc 86.719 (83.757)	lr 0.00768
Train [76][360/3239]	Time 0.228 (0.817)	Data Time 0.001 (0.383)	Loss 2.6058 (2.5061)	Entropy 0.60123 (0.60215)	Top-1 acc 60.156 (63.421)	Top-5 acc 85.547 (83.777)	lr 0.00768
Train [76][370/3239]	Time 0.225 (0.807)	Data Time 0.001 (0.372)	Loss 2.6952 (2.5058)	Entropy 0.60100 (0.60213)	Top-1 acc 55.078 (63.414)	Top-5 acc 85.156 (83.807)	lr 0.00768
Train [76][380/3239]	Time 0.249 (0.798)	Data Time 0.001 (0.363)	Loss 2.5458 (2.5067)	Entropy 0.60087 (0.60209)	Top-1 acc 62.109 (63.401)	Top-5 acc 82.422 (83.807)	lr 0.00768
Train [76][390/3239]	Time 0.230 (0.824)	Data Time 0.001 (0.389)	Loss 2.6602 (2.5083)	Entropy 0.60066 (0.60206)	Top-1 acc 62.109 (63.376)	Top-5 acc 79.297 (83.755)	lr 0.00768
Train [76][400/3239]	Time 0.273 (0.815)	Data Time 0.002 (0.379)	Loss 2.6239 (2.5078)	Entropy 0.60084 (0.60203)	Top-1 acc 59.375 (63.386)	Top-5 acc 80.859 (83.766)	lr 0.00768
Train [76][410/3239]	Time 0.266 (0.806)	Data Time 0.001 (0.370)	Loss 2.5769 (2.5078)	Entropy 0.60093 (0.60200)	Top-1 acc 64.062 (63.398)	Top-5 acc 85.156 (83.789)	lr 0.00768
Train [76][420/3239]	Time 15.292 (0.832)	Data Time 15.026 (0.397)	Loss 2.6432 (2.5084)	Entropy 0.60098 (0.60197)	Top-1 acc 60.938 (63.404)	Top-5 acc 80.859 (83.771)	lr 0.00768
Train [76][430/3239]	Time 0.285 (0.823)	Data Time 0.002 (0.388)	Loss 2.7198 (2.5079)	Entropy 0.60124 (0.60195)	Top-1 acc 57.031 (63.396)	Top-5 acc 81.250 (83.793)	lr 0.00768
Train [76][440/3239]	Time 0.245 (0.815)	Data Time 0.001 (0.379)	Loss 2.4168 (2.5080)	Entropy 0.60110 (0.60194)	Top-1 acc 66.406 (63.416)	Top-5 acc 85.938 (83.788)	lr 0.00768
Train [76][450/3239]	Time 0.230 (0.807)	Data Time 0.001 (0.371)	Loss 2.6189 (2.5106)	Entropy 0.60112 (0.60192)	Top-1 acc 61.719 (63.357)	Top-5 acc 82.031 (83.738)	lr 0.00767
Train [76][460/3239]	Time 0.253 (0.844)	Data Time 0.001 (0.407)	Loss 2.6520 (2.5107)	Entropy 0.60122 (0.60190)	Top-1 acc 59.766 (63.391)	Top-5 acc 80.469 (83.720)	lr 0.00767
Train [76][470/3239]	Time 0.246 (0.835)	Data Time 0.001 (0.399)	Loss 2.6206 (2.5113)	Entropy 0.60067 (0.60189)	Top-1 acc 59.766 (63.368)	Top-5 acc 83.594 (83.712)	lr 0.00767
Train [76][480/3239]	Time 0.252 (0.827)	Data Time 0.001 (0.391)	Loss 2.4103 (2.5116)	Entropy 0.60068 (0.60186)	Top-1 acc 64.062 (63.368)	Top-5 acc 86.328 (83.711)	lr 0.00767
Train [76][490/3239]	Time 0.404 (0.861)	Data Time 0.001 (0.423)	Loss 2.3779 (2.5110)	Entropy 0.60080 (0.60184)	Top-1 acc 66.406 (63.358)	Top-5 acc 88.281 (83.742)	lr 0.00767
Train [76][500/3239]	Time 0.284 (0.852)	Data Time 0.003 (0.415)	Loss 2.6153 (2.5113)	Entropy 0.60081 (0.60182)	Top-1 acc 60.547 (63.337)	Top-5 acc 80.469 (83.729)	lr 0.00767
Train [76][510/3239]	Time 0.224 (0.844)	Data Time 0.001 (0.407)	Loss 2.4377 (2.5115)	Entropy 0.60047 (0.60180)	Top-1 acc 66.797 (63.339)	Top-5 acc 85.156 (83.727)	lr 0.00767
Train [76][520/3239]	Time 0.242 (0.860)	Data Time 0.001 (0.424)	Loss 2.4231 (2.5109)	Entropy 0.60019 (0.60177)	Top-1 acc 63.281 (63.343)	Top-5 acc 83.203 (83.741)	lr 0.00767
Train [76][530/3239]	Time 0.296 (0.854)	Data Time 0.002 (0.416)	Loss 2.7031 (2.5102)	Entropy 0.59990 (0.60174)	Top-1 acc 56.250 (63.329)	Top-5 acc 82.031 (83.762)	lr 0.00767
Train [76][540/3239]	Time 0.241 (0.846)	Data Time 0.001 (0.408)	Loss 2.5122 (2.5113)	Entropy 0.59976 (0.60170)	Top-1 acc 64.453 (63.307)	Top-5 acc 82.812 (83.742)	lr 0.00767
Train [76][550/3239]	Time 0.258 (0.860)	Data Time 0.001 (0.422)	Loss 2.6409 (2.5111)	Entropy 0.59946 (0.60167)	Top-1 acc 60.547 (63.318)	Top-5 acc 80.859 (83.750)	lr 0.00767
Train [76][560/3239]	Time 0.429 (0.853)	Data Time 0.001 (0.415)	Loss 2.4277 (2.5091)	Entropy 0.59957 (0.60163)	Top-1 acc 64.062 (63.368)	Top-5 acc 85.938 (83.780)	lr 0.00766
Train [76][570/3239]	Time 0.238 (0.846)	Data Time 0.001 (0.407)	Loss 2.2689 (2.5087)	Entropy 0.59956 (0.60159)	Top-1 acc 68.750 (63.387)	Top-5 acc 89.453 (83.796)	lr 0.00766
Train [76][580/3239]	Time 14.842 (0.864)	Data Time 14.574 (0.426)	Loss 2.3249 (2.5083)	Entropy 0.59939 (0.60156)	Top-1 acc 66.406 (63.394)	Top-5 acc 84.766 (83.801)	lr 0.00766
Train [76][590/3239]	Time 0.232 (0.856)	Data Time 0.002 (0.418)	Loss 2.4403 (2.5078)	Entropy 0.59929 (0.60152)	Top-1 acc 66.016 (63.398)	Top-5 acc 84.375 (83.799)	lr 0.00766
Train [76][600/3239]	Time 0.247 (0.849)	Data Time 0.002 (0.411)	Loss 2.1780 (2.5073)	Entropy 0.59963 (0.60148)	Top-1 acc 73.047 (63.418)	Top-5 acc 90.234 (83.800)	lr 0.00766
Train [76][610/3239]	Time 0.249 (0.843)	Data Time 0.001 (0.405)	Loss 2.3867 (2.5072)	Entropy 0.59970 (0.60145)	Top-1 acc 67.188 (63.420)	Top-5 acc 86.719 (83.794)	lr 0.00766
Train [76][620/3239]	Time 0.249 (0.876)	Data Time 0.001 (0.438)	Loss 2.3640 (2.5070)	Entropy 0.59934 (0.60142)	Top-1 acc 67.578 (63.449)	Top-5 acc 85.938 (83.784)	lr 0.00766
Train [76][630/3239]	Time 0.301 (0.955)	Data Time 0.005 (0.431)	Loss 2.5212 (2.5074)	Entropy 0.59959 (0.60139)	Top-1 acc 63.281 (63.443)	Top-5 acc 83.203 (83.776)	lr 0.00766
Train [76][640/3239]	Time 0.256 (0.947)	Data Time 0.003 (0.424)	Loss 2.5272 (2.5077)	Entropy 0.59937 (0.60136)	Top-1 acc 62.500 (63.435)	Top-5 acc 83.984 (83.774)	lr 0.00766
Train [76][650/3239]	Time 0.336 (0.939)	Data Time 0.001 (0.418)	Loss 2.6619 (2.5072)	Entropy 0.59952 (0.60133)	Top-1 acc 61.328 (63.448)	Top-5 acc 81.250 (83.797)	lr 0.00766
Train [76][660/3239]	Time 0.254 (0.931)	Data Time 0.002 (0.412)	Loss 2.5514 (2.5078)	Entropy 0.59956 (0.60130)	Top-1 acc 60.938 (63.436)	Top-5 acc 82.031 (83.778)	lr 0.00765
Train [76][670/3239]	Time 0.247 (0.924)	Data Time 0.001 (0.406)	Loss 2.4962 (2.5085)	Entropy 0.59963 (0.60128)	Top-1 acc 60.547 (63.429)	Top-5 acc 84.375 (83.761)	lr 0.00765
Train [76][680/3239]	Time 0.236 (0.917)	Data Time 0.001 (0.400)	Loss 2.4981 (2.5087)	Entropy 0.59940 (0.60125)	Top-1 acc 63.281 (63.425)	Top-5 acc 83.594 (83.765)	lr 0.00765
Train [76][690/3239]	Time 0.245 (0.909)	Data Time 0.002 (0.394)	Loss 2.5858 (2.5090)	Entropy 0.59938 (0.60122)	Top-1 acc 63.672 (63.422)	Top-5 acc 81.641 (83.754)	lr 0.00765
Train [76][700/3239]	Time 0.263 (0.918)	Data Time 0.001 (0.403)	Loss 2.5075 (2.5090)	Entropy 0.59934 (0.60120)	Top-1 acc 64.062 (63.427)	Top-5 acc 83.203 (83.752)	lr 0.00765
Train [76][710/3239]	Time 2.400 (0.916)	Data Time 2.102 (0.403)	Loss 2.8228 (2.5090)	Entropy 0.59920 (0.60117)	Top-1 acc 57.422 (63.421)	Top-5 acc 77.344 (83.757)	lr 0.00765
Train [76][720/3239]	Time 0.337 (0.910)	Data Time 0.002 (0.397)	Loss 2.3695 (2.5092)	Entropy 0.59939 (0.60114)	Top-1 acc 64.062 (63.433)	Top-5 acc 87.109 (83.748)	lr 0.00765
Train [76][730/3239]	Time 0.302 (0.927)	Data Time 0.001 (0.416)	Loss 2.4981 (2.5087)	Entropy 0.59930 (0.60112)	Top-1 acc 69.141 (63.458)	Top-5 acc 85.156 (83.757)	lr 0.00765
Train [76][740/3239]	Time 0.583 (0.927)	Data Time 0.294 (0.416)	Loss 2.6222 (2.5085)	Entropy 0.59946 (0.60110)	Top-1 acc 57.812 (63.458)	Top-5 acc 84.375 (83.756)	lr 0.00765
Train [76][750/3239]	Time 0.246 (0.921)	Data Time 0.001 (0.411)	Loss 2.5543 (2.5077)	Entropy 0.59933 (0.60107)	Top-1 acc 60.938 (63.480)	Top-5 acc 81.641 (83.764)	lr 0.00765
Train [76][760/3239]	Time 0.253 (0.938)	Data Time 0.001 (0.429)	Loss 2.6053 (2.5087)	Entropy 0.59947 (0.60105)	Top-1 acc 58.984 (63.458)	Top-5 acc 82.812 (83.755)	lr 0.00765
Train [76][770/3239]	Time 0.235 (0.936)	Data Time 0.001 (0.428)	Loss 2.6030 (2.5090)	Entropy 0.59939 (0.60103)	Top-1 acc 59.766 (63.455)	Top-5 acc 82.031 (83.746)	lr 0.00764
Train [76][780/3239]	Time 0.229 (0.930)	Data Time 0.001 (0.423)	Loss 2.5289 (2.5097)	Entropy 0.59956 (0.60101)	Top-1 acc 54.688 (63.416)	Top-5 acc 83.203 (83.741)	lr 0.00764
Train [76][790/3239]	Time 11.970 (0.940)	Data Time 11.729 (0.434)	Loss 2.4453 (2.5097)	Entropy 0.59962 (0.60100)	Top-1 acc 66.016 (63.422)	Top-5 acc 83.984 (83.746)	lr 0.00764
Train [76][800/3239]	Time 0.227 (0.937)	Data Time 0.001 (0.432)	Loss 2.3432 (2.5106)	Entropy 0.59946 (0.60098)	Top-1 acc 69.922 (63.410)	Top-5 acc 85.938 (83.731)	lr 0.00764
Train [76][810/3239]	Time 0.326 (0.932)	Data Time 0.001 (0.428)	Loss 2.4117 (2.5091)	Entropy 0.59954 (0.60096)	Top-1 acc 67.578 (63.449)	Top-5 acc 85.938 (83.763)	lr 0.00764
Train [76][820/3239]	Time 0.239 (0.926)	Data Time 0.001 (0.423)	Loss 2.3640 (2.5098)	Entropy 0.59969 (0.60094)	Top-1 acc 66.406 (63.433)	Top-5 acc 86.328 (83.743)	lr 0.00764
Train [76][830/3239]	Time 0.277 (0.936)	Data Time 0.001 (0.435)	Loss 2.6546 (2.5103)	Entropy 0.59954 (0.60093)	Top-1 acc 58.594 (63.415)	Top-5 acc 81.250 (83.744)	lr 0.00764
Train [76][840/3239]	Time 0.662 (0.932)	Data Time 0.433 (0.431)	Loss 2.1946 (2.5097)	Entropy 0.59964 (0.60091)	Top-1 acc 69.531 (63.422)	Top-5 acc 90.234 (83.760)	lr 0.00764
Train [76][850/3239]	Time 0.230 (0.929)	Data Time 0.001 (0.429)	Loss 2.5613 (2.5099)	Entropy 0.59951 (0.60089)	Top-1 acc 62.500 (63.417)	Top-5 acc 82.422 (83.758)	lr 0.00764
Train [76][860/3239]	Time 0.238 (0.938)	Data Time 0.001 (0.439)	Loss 2.5533 (2.5094)	Entropy 0.59938 (0.60088)	Top-1 acc 62.109 (63.424)	Top-5 acc 83.984 (83.768)	lr 0.00764
Train [76][870/3239]	Time 0.246 (0.937)	Data Time 0.002 (0.439)	Loss 2.7713 (2.5104)	Entropy 0.59940 (0.60086)	Top-1 acc 54.688 (63.395)	Top-5 acc 77.734 (83.753)	lr 0.00764
Train [76][880/3239]	Time 0.358 (0.933)	Data Time 0.001 (0.436)	Loss 2.5713 (2.5107)	Entropy 0.59961 (0.60084)	Top-1 acc 59.375 (63.398)	Top-5 acc 84.766 (83.744)	lr 0.00763
Train [76][890/3239]	Time 0.292 (0.943)	Data Time 0.001 (0.448)	Loss 2.5762 (2.5109)	Entropy 0.59941 (0.60083)	Top-1 acc 60.156 (63.378)	Top-5 acc 82.422 (83.738)	lr 0.00763
Train [76][900/3239]	Time 1.875 (0.939)	Data Time 1.586 (0.444)	Loss 2.6122 (2.5110)	Entropy 0.59942 (0.60081)	Top-1 acc 62.109 (63.376)	Top-5 acc 82.812 (83.733)	lr 0.00763
Train [76][910/3239]	Time 0.247 (0.938)	Data Time 0.001 (0.443)	Loss 2.3785 (2.5109)	Entropy 0.59959 (0.60080)	Top-1 acc 64.062 (63.374)	Top-5 acc 85.938 (83.737)	lr 0.00763
Train [76][920/3239]	Time 3.730 (0.948)	Data Time 3.471 (0.454)	Loss 2.5692 (2.5099)	Entropy 0.59984 (0.60079)	Top-1 acc 62.109 (63.408)	Top-5 acc 85.156 (83.764)	lr 0.00763
Train [76][930/3239]	Time 0.247 (0.942)	Data Time 0.001 (0.449)	Loss 2.6340 (2.5107)	Entropy 0.59982 (0.60078)	Top-1 acc 61.328 (63.382)	Top-5 acc 82.031 (83.753)	lr 0.00763
Train [76][940/3239]	Time 0.243 (0.944)	Data Time 0.001 (0.452)	Loss 2.6965 (2.5110)	Entropy 0.59981 (0.60077)	Top-1 acc 57.422 (63.372)	Top-5 acc 82.812 (83.750)	lr 0.00763
Train [76][950/3239]	Time 8.689 (0.947)	Data Time 8.444 (0.456)	Loss 2.9431 (2.5116)	Entropy 0.59958 (0.60075)	Top-1 acc 54.688 (63.367)	Top-5 acc 77.734 (83.738)	lr 0.00763
Train [76][960/3239]	Time 0.237 (0.946)	Data Time 0.001 (0.456)	Loss 2.5239 (2.5115)	Entropy 0.59977 (0.60074)	Top-1 acc 62.891 (63.364)	Top-5 acc 82.812 (83.738)	lr 0.00763
Train [76][970/3239]	Time 0.248 (0.949)	Data Time 0.001 (0.459)	Loss 2.4710 (2.5112)	Entropy 0.59996 (0.60073)	Top-1 acc 65.625 (63.373)	Top-5 acc 85.547 (83.736)	lr 0.00763
Train [76][980/3239]	Time 0.257 (0.943)	Data Time 0.002 (0.454)	Loss 2.4912 (2.5116)	Entropy 0.60011 (0.60073)	Top-1 acc 64.844 (63.359)	Top-5 acc 84.766 (83.725)	lr 0.00763
Train [76][990/3239]	Time 0.235 (0.949)	Data Time 0.001 (0.461)	Loss 2.5447 (2.5112)	Entropy 0.60048 (0.60072)	Top-1 acc 59.375 (63.368)	Top-5 acc 83.594 (83.729)	lr 0.00762
Train [76][1000/3239]	Time 4.436 (0.953)	Data Time 4.186 (0.466)	Loss 2.5139 (2.5110)	Entropy 0.60022 (0.60072)	Top-1 acc 62.891 (63.372)	Top-5 acc 84.375 (83.733)	lr 0.00762
Train [76][1010/3239]	Time 0.243 (0.948)	Data Time 0.001 (0.461)	Loss 2.3131 (2.5102)	Entropy 0.60027 (0.60071)	Top-1 acc 67.969 (63.395)	Top-5 acc 87.109 (83.751)	lr 0.00762
Train [76][1020/3239]	Time 3.097 (0.953)	Data Time 2.840 (0.467)	Loss 2.4667 (2.5097)	Entropy 0.60020 (0.60071)	Top-1 acc 65.234 (63.418)	Top-5 acc 85.547 (83.762)	lr 0.00762
Train [76][1030/3239]	Time 0.230 (0.953)	Data Time 0.001 (0.468)	Loss 2.6439 (2.5099)	Entropy 0.59968 (0.60070)	Top-1 acc 64.844 (63.419)	Top-5 acc 81.250 (83.758)	lr 0.00762
Train [76][1040/3239]	Time 0.319 (0.952)	Data Time 0.001 (0.467)	Loss 2.4489 (2.5097)	Entropy 0.59960 (0.60069)	Top-1 acc 62.500 (63.423)	Top-5 acc 84.375 (83.752)	lr 0.00762
Train [76][1050/3239]	Time 0.264 (0.957)	Data Time 0.001 (0.473)	Loss 2.4101 (2.5095)	Entropy 0.59964 (0.60068)	Top-1 acc 65.234 (63.428)	Top-5 acc 85.156 (83.754)	lr 0.00762
Train [76][1060/3239]	Time 0.232 (0.960)	Data Time 0.001 (0.477)	Loss 2.5975 (2.5100)	Entropy 0.59970 (0.60067)	Top-1 acc 62.109 (63.417)	Top-5 acc 83.594 (83.754)	lr 0.00762
Train [76][1070/3239]	Time 0.239 (0.959)	Data Time 0.001 (0.477)	Loss 2.4059 (2.5104)	Entropy 0.59989 (0.60066)	Top-1 acc 64.844 (63.408)	Top-5 acc 86.719 (83.748)	lr 0.00762
Train [76][1080/3239]	Time 0.237 (0.963)	Data Time 0.001 (0.482)	Loss 2.5328 (2.5105)	Entropy 0.59953 (0.60066)	Top-1 acc 61.328 (63.416)	Top-5 acc 82.812 (83.749)	lr 0.00762
Train [76][1090/3239]	Time 0.250 (0.964)	Data Time 0.001 (0.483)	Loss 2.7641 (2.5104)	Entropy 0.59914 (0.60065)	Top-1 acc 55.469 (63.429)	Top-5 acc 76.953 (83.751)	lr 0.00761
Train [76][1100/3239]	Time 0.291 (0.962)	Data Time 0.003 (0.482)	Loss 2.5374 (2.5103)	Entropy 0.59916 (0.60063)	Top-1 acc 62.109 (63.430)	Top-5 acc 82.422 (83.748)	lr 0.00761
Train [76][1110/3239]	Time 9.776 (0.967)	Data Time 9.435 (0.486)	Loss 2.6769 (2.5105)	Entropy 0.59915 (0.60062)	Top-1 acc 58.594 (63.435)	Top-5 acc 79.688 (83.737)	lr 0.00761
Train [76][1120/3239]	Time 0.235 (0.968)	Data Time 0.001 (0.488)	Loss 2.4198 (2.5106)	Entropy 0.59934 (0.60061)	Top-1 acc 67.578 (63.435)	Top-5 acc 84.375 (83.731)	lr 0.00761
Train [76][1130/3239]	Time 0.242 (0.968)	Data Time 0.001 (0.489)	Loss 2.3692 (2.5102)	Entropy 0.59933 (0.60060)	Top-1 acc 67.578 (63.453)	Top-5 acc 85.938 (83.737)	lr 0.00761
Train [76][1140/3239]	Time 0.230 (0.963)	Data Time 0.001 (0.484)	Loss 2.4196 (2.5102)	Entropy 0.59977 (0.60059)	Top-1 acc 66.406 (63.452)	Top-5 acc 84.766 (83.737)	lr 0.00761
Train [76][1150/3239]	Time 0.228 (0.977)	Data Time 0.001 (0.498)	Loss 2.5856 (2.5102)	Entropy 0.59965 (0.60058)	Top-1 acc 60.938 (63.458)	Top-5 acc 81.641 (83.733)	lr 0.00761
Train [76][1160/3239]	Time 3.216 (0.974)	Data Time 2.970 (0.497)	Loss 2.5576 (2.5106)	Entropy 0.59979 (0.60057)	Top-1 acc 64.844 (63.449)	Top-5 acc 80.469 (83.721)	lr 0.00761
Train [76][1170/3239]	Time 0.272 (0.970)	Data Time 0.001 (0.493)	Loss 2.5069 (2.5110)	Entropy 0.59990 (0.60057)	Top-1 acc 64.062 (63.437)	Top-5 acc 87.109 (83.712)	lr 0.00761
Train [76][1180/3239]	Time 16.120 (0.983)	Data Time 15.878 (0.507)	Loss 2.6782 (2.5118)	Entropy 0.59997 (0.60056)	Top-1 acc 62.109 (63.428)	Top-5 acc 79.688 (83.702)	lr 0.00761
Train [76][1190/3239]	Time 0.245 (0.978)	Data Time 0.002 (0.503)	Loss 2.4852 (2.5120)	Entropy 0.59975 (0.60056)	Top-1 acc 67.188 (63.432)	Top-5 acc 84.766 (83.697)	lr 0.00761
Train [76][1200/3239]	Time 0.322 (0.975)	Data Time 0.001 (0.500)	Loss 2.7023 (2.5112)	Entropy 0.59962 (0.60055)	Top-1 acc 60.547 (63.451)	Top-5 acc 79.688 (83.708)	lr 0.00760
Train [76][1210/3239]	Time 0.228 (0.978)	Data Time 0.001 (0.504)	Loss 2.4107 (2.5115)	Entropy 0.59983 (0.60054)	Top-1 acc 66.016 (63.438)	Top-5 acc 84.375 (83.708)	lr 0.00760
Train [76][1220/3239]	Time 0.285 (0.984)	Data Time 0.001 (0.510)	Loss 2.6044 (2.5119)	Entropy 0.59999 (0.60054)	Top-1 acc 63.281 (63.431)	Top-5 acc 83.203 (83.696)	lr 0.00760
Train [76][1230/3239]	Time 0.237 (0.980)	Data Time 0.002 (0.506)	Loss 2.3499 (2.5118)	Entropy 0.60019 (0.60053)	Top-1 acc 68.750 (63.433)	Top-5 acc 87.891 (83.700)	lr 0.00760
Train [76][1240/3239]	Time 9.745 (0.984)	Data Time 9.498 (0.511)	Loss 2.4884 (2.5115)	Entropy 0.60027 (0.60053)	Top-1 acc 64.062 (63.439)	Top-5 acc 82.422 (83.705)	lr 0.00760
Train [76][1250/3239]	Time 0.236 (0.992)	Data Time 0.001 (0.519)	Loss 2.5570 (2.5120)	Entropy 0.60034 (0.60053)	Top-1 acc 65.234 (63.432)	Top-5 acc 84.375 (83.701)	lr 0.00760
Train [76][1260/3239]	Time 0.230 (0.987)	Data Time 0.001 (0.515)	Loss 2.2685 (2.5121)	Entropy 0.59995 (0.60053)	Top-1 acc 69.141 (63.430)	Top-5 acc 87.500 (83.698)	lr 0.00760
Train [76][1270/3239]	Time 0.329 (0.983)	Data Time 0.001 (0.511)	Loss 2.6148 (2.5123)	Entropy 0.59962 (0.60052)	Top-1 acc 62.891 (63.432)	Top-5 acc 81.250 (83.690)	lr 0.00760
Train [76][1280/3239]	Time 0.285 (0.995)	Data Time 0.002 (0.523)	Loss 2.5367 (2.5122)	Entropy 0.59957 (0.60051)	Top-1 acc 62.109 (63.435)	Top-5 acc 83.984 (83.693)	lr 0.00760
Train [76][1290/3239]	Time 0.264 (1.034)	Data Time 0.002 (0.519)	Loss 2.4854 (2.5123)	Entropy 0.59930 (0.60051)	Top-1 acc 61.719 (63.431)	Top-5 acc 83.984 (83.696)	lr 0.00760
Train [76][1300/3239]	Time 0.247 (1.030)	Data Time 0.002 (0.515)	Loss 2.3819 (2.5129)	Entropy 0.59934 (0.60050)	Top-1 acc 66.797 (63.415)	Top-5 acc 84.766 (83.686)	lr 0.00760
Train [76][1310/3239]	Time 0.233 (1.025)	Data Time 0.001 (0.511)	Loss 2.5747 (2.5133)	Entropy 0.59926 (0.60049)	Top-1 acc 63.281 (63.405)	Top-5 acc 82.812 (83.684)	lr 0.00759
Train [76][1320/3239]	Time 0.240 (1.020)	Data Time 0.002 (0.507)	Loss 2.6988 (2.5133)	Entropy 0.59947 (0.60048)	Top-1 acc 56.641 (63.395)	Top-5 acc 81.641 (83.686)	lr 0.00759
Train [76][1330/3239]	Time 0.239 (1.015)	Data Time 0.001 (0.503)	Loss 2.4278 (2.5132)	Entropy 0.59927 (0.60047)	Top-1 acc 61.719 (63.395)	Top-5 acc 86.328 (83.689)	lr 0.00759
Train [76][1340/3239]	Time 0.247 (1.011)	Data Time 0.001 (0.499)	Loss 2.5436 (2.5138)	Entropy 0.59904 (0.60046)	Top-1 acc 65.625 (63.387)	Top-5 acc 84.766 (83.680)	lr 0.00759
Train [76][1350/3239]	Time 2.646 (1.017)	Data Time 2.397 (0.506)	Loss 2.3874 (2.5142)	Entropy 0.59932 (0.60045)	Top-1 acc 66.016 (63.369)	Top-5 acc 86.719 (83.676)	lr 0.00759
Train [76][1360/3239]	Time 0.370 (1.013)	Data Time 0.001 (0.503)	Loss 2.5082 (2.5143)	Entropy 0.59937 (0.60044)	Top-1 acc 64.062 (63.367)	Top-5 acc 83.594 (83.672)	lr 0.00759
Train [76][1370/3239]	Time 0.232 (1.010)	Data Time 0.001 (0.500)	Loss 2.7153 (2.5141)	Entropy 0.59916 (0.60043)	Top-1 acc 59.766 (63.368)	Top-5 acc 80.859 (83.676)	lr 0.00759
Train [76][1380/3239]	Time 0.245 (1.007)	Data Time 0.001 (0.498)	Loss 2.4934 (2.5149)	Entropy 0.59896 (0.60042)	Top-1 acc 61.328 (63.347)	Top-5 acc 86.719 (83.662)	lr 0.00759
Train [76][1390/3239]	Time 0.230 (1.024)	Data Time 0.001 (0.515)	Loss 2.3380 (2.5147)	Entropy 0.59920 (0.60041)	Top-1 acc 67.578 (63.343)	Top-5 acc 87.500 (83.667)	lr 0.00759
Train [76][1400/3239]	Time 0.246 (1.019)	Data Time 0.001 (0.512)	Loss 2.4864 (2.5150)	Entropy 0.59916 (0.60041)	Top-1 acc 62.891 (63.335)	Top-5 acc 84.766 (83.660)	lr 0.00759
Train [76][1410/3239]	Time 0.268 (1.015)	Data Time 0.002 (0.508)	Loss 2.4475 (2.5151)	Entropy 0.59914 (0.60040)	Top-1 acc 59.766 (63.335)	Top-5 acc 87.109 (83.654)	lr 0.00759
Train [76][1420/3239]	Time 0.229 (1.031)	Data Time 0.001 (0.525)	Loss 2.5205 (2.5153)	Entropy 0.59898 (0.60039)	Top-1 acc 63.672 (63.331)	Top-5 acc 85.156 (83.654)	lr 0.00758
Train [76][1430/3239]	Time 0.331 (1.027)	Data Time 0.001 (0.521)	Loss 2.4348 (2.5154)	Entropy 0.59899 (0.60038)	Top-1 acc 64.453 (63.326)	Top-5 acc 84.766 (83.653)	lr 0.00758
Train [76][1440/3239]	Time 0.233 (1.023)	Data Time 0.001 (0.518)	Loss 2.6642 (2.5153)	Entropy 0.59914 (0.60037)	Top-1 acc 61.328 (63.329)	Top-5 acc 79.297 (83.662)	lr 0.00758
Train [76][1450/3239]	Time 0.274 (1.031)	Data Time 0.001 (0.526)	Loss 2.4652 (2.5155)	Entropy 0.59952 (0.60036)	Top-1 acc 61.719 (63.329)	Top-5 acc 84.766 (83.651)	lr 0.00758
Train [76][1460/3239]	Time 0.236 (1.026)	Data Time 0.001 (0.523)	Loss 2.5439 (2.5153)	Entropy 0.59943 (0.60036)	Top-1 acc 66.016 (63.336)	Top-5 acc 80.469 (83.649)	lr 0.00758
Train [76][1470/3239]	Time 0.248 (1.022)	Data Time 0.003 (0.519)	Loss 2.3488 (2.5153)	Entropy 0.59915 (0.60035)	Top-1 acc 66.797 (63.339)	Top-5 acc 87.500 (83.651)	lr 0.00758
Train [76][1480/3239]	Time 0.246 (1.038)	Data Time 0.001 (0.535)	Loss 2.6901 (2.5156)	Entropy 0.59922 (0.60034)	Top-1 acc 57.812 (63.330)	Top-5 acc 80.469 (83.643)	lr 0.00758
Train [76][1490/3239]	Time 0.254 (1.034)	Data Time 0.001 (0.532)	Loss 2.4944 (2.5154)	Entropy 0.59899 (0.60033)	Top-1 acc 61.328 (63.332)	Top-5 acc 84.375 (83.653)	lr 0.00758
Train [76][1500/3239]	Time 0.236 (1.030)	Data Time 0.001 (0.528)	Loss 2.5151 (2.5158)	Entropy 0.59905 (0.60032)	Top-1 acc 63.281 (63.321)	Top-5 acc 82.031 (83.645)	lr 0.00758
Train [76][1510/3239]	Time 11.882 (1.044)	Data Time 11.622 (0.543)	Loss 2.5668 (2.5159)	Entropy 0.59918 (0.60032)	Top-1 acc 62.891 (63.317)	Top-5 acc 80.469 (83.645)	lr 0.00758
Train [76][1520/3239]	Time 1.808 (1.041)	Data Time 1.446 (0.541)	Loss 2.5110 (2.5159)	Entropy 0.59930 (0.60031)	Top-1 acc 64.062 (63.317)	Top-5 acc 79.297 (83.639)	lr 0.00757
Train [76][1530/3239]	Time 0.224 (1.037)	Data Time 0.001 (0.537)	Loss 2.4855 (2.5157)	Entropy 0.59916 (0.60030)	Top-1 acc 68.750 (63.325)	Top-5 acc 83.203 (83.641)	lr 0.00757
Train [76][1540/3239]	Time 0.251 (1.033)	Data Time 0.001 (0.534)	Loss 2.4246 (2.5162)	Entropy 0.59879 (0.60029)	Top-1 acc 68.750 (63.310)	Top-5 acc 84.375 (83.635)	lr 0.00757
Train [76][1550/3239]	Time 0.262 (1.046)	Data Time 0.002 (0.547)	Loss 2.4565 (2.5162)	Entropy 0.59905 (0.60028)	Top-1 acc 60.938 (63.305)	Top-5 acc 84.375 (83.636)	lr 0.00757
Train [76][1560/3239]	Time 0.227 (1.044)	Data Time 0.001 (0.546)	Loss 2.3517 (2.5158)	Entropy 0.59927 (0.60028)	Top-1 acc 66.797 (63.321)	Top-5 acc 87.500 (83.641)	lr 0.00757
Train [76][1570/3239]	Time 0.229 (1.042)	Data Time 0.001 (0.544)	Loss 2.6938 (2.5160)	Entropy 0.59955 (0.60027)	Top-1 acc 57.812 (63.314)	Top-5 acc 83.203 (83.640)	lr 0.00757
Train [76][1580/3239]	Time 0.231 (1.052)	Data Time 0.001 (0.555)	Loss 2.6336 (2.5160)	Entropy 0.59971 (0.60027)	Top-1 acc 59.766 (63.316)	Top-5 acc 82.031 (83.643)	lr 0.00757
Train [76][1590/3239]	Time 0.341 (1.049)	Data Time 0.002 (0.552)	Loss 2.4688 (2.5159)	Entropy 0.59955 (0.60026)	Top-1 acc 64.062 (63.323)	Top-5 acc 86.328 (83.642)	lr 0.00757
Train [76][1600/3239]	Time 0.234 (1.050)	Data Time 0.001 (0.553)	Loss 2.5475 (2.5160)	Entropy 0.59913 (0.60026)	Top-1 acc 57.812 (63.313)	Top-5 acc 82.422 (83.633)	lr 0.00757
Train [76][1610/3239]	Time 0.234 (1.057)	Data Time 0.001 (0.560)	Loss 2.3847 (2.5164)	Entropy 0.59887 (0.60025)	Top-1 acc 66.797 (63.306)	Top-5 acc 85.156 (83.625)	lr 0.00757
Train [76][1620/3239]	Time 0.236 (1.053)	Data Time 0.001 (0.557)	Loss 2.3432 (2.5163)	Entropy 0.59885 (0.60024)	Top-1 acc 70.312 (63.315)	Top-5 acc 85.547 (83.626)	lr 0.00757
Train [76][1630/3239]	Time 0.234 (1.053)	Data Time 0.001 (0.558)	Loss 2.4736 (2.5164)	Entropy 0.59900 (0.60023)	Top-1 acc 63.281 (63.313)	Top-5 acc 83.594 (83.621)	lr 0.00756
Train [76][1640/3239]	Time 0.294 (1.063)	Data Time 0.001 (0.568)	Loss 2.4426 (2.5163)	Entropy 0.59913 (0.60022)	Top-1 acc 66.016 (63.316)	Top-5 acc 84.766 (83.621)	lr 0.00756
Train [76][1650/3239]	Time 0.246 (1.059)	Data Time 0.001 (0.565)	Loss 2.5174 (2.5164)	Entropy 0.59892 (0.60022)	Top-1 acc 60.547 (63.318)	Top-5 acc 83.203 (83.616)	lr 0.00756
Train [76][1660/3239]	Time 3.315 (1.057)	Data Time 3.061 (0.563)	Loss 2.9025 (2.5165)	Entropy 0.59878 (0.60021)	Top-1 acc 51.562 (63.318)	Top-5 acc 75.391 (83.618)	lr 0.00756
Train [76][1670/3239]	Time 22.374 (1.070)	Data Time 22.119 (0.577)	Loss 2.5854 (2.5167)	Entropy 0.59864 (0.60020)	Top-1 acc 59.766 (63.307)	Top-5 acc 83.984 (83.614)	lr 0.00756
Train [76][1680/3239]	Time 0.289 (1.066)	Data Time 0.001 (0.573)	Loss 2.4924 (2.5173)	Entropy 0.59847 (0.60019)	Top-1 acc 66.406 (63.293)	Top-5 acc 83.203 (83.602)	lr 0.00756
Train [76][1690/3239]	Time 0.233 (1.062)	Data Time 0.001 (0.570)	Loss 2.5136 (2.5171)	Entropy 0.59848 (0.60018)	Top-1 acc 61.719 (63.292)	Top-5 acc 84.766 (83.607)	lr 0.00756
Train [76][1700/3239]	Time 0.233 (1.061)	Data Time 0.001 (0.570)	Loss 2.5866 (2.5171)	Entropy 0.59832 (0.60017)	Top-1 acc 60.547 (63.288)	Top-5 acc 82.031 (83.607)	lr 0.00756
Train [76][1710/3239]	Time 0.232 (1.072)	Data Time 0.001 (0.581)	Loss 2.5062 (2.5171)	Entropy 0.59859 (0.60016)	Top-1 acc 65.625 (63.288)	Top-5 acc 83.594 (83.604)	lr 0.00756
Train [76][1720/3239]	Time 0.267 (1.069)	Data Time 0.001 (0.578)	Loss 2.4433 (2.5168)	Entropy 0.59850 (0.60015)	Top-1 acc 63.672 (63.293)	Top-5 acc 85.156 (83.609)	lr 0.00756
Train [76][1730/3239]	Time 0.229 (1.069)	Data Time 0.001 (0.579)	Loss 2.3080 (2.5167)	Entropy 0.59849 (0.60014)	Top-1 acc 68.750 (63.294)	Top-5 acc 88.281 (83.608)	lr 0.00756
Train [76][1740/3239]	Time 0.231 (1.076)	Data Time 0.001 (0.587)	Loss 2.4539 (2.5168)	Entropy 0.59868 (0.60013)	Top-1 acc 63.672 (63.291)	Top-5 acc 83.594 (83.608)	lr 0.00755
Train [76][1750/3239]	Time 0.330 (1.072)	Data Time 0.001 (0.583)	Loss 2.4669 (2.5166)	Entropy 0.59854 (0.60012)	Top-1 acc 64.062 (63.290)	Top-5 acc 85.156 (83.609)	lr 0.00755
Train [76][1760/3239]	Time 0.239 (1.071)	Data Time 0.001 (0.582)	Loss 2.4198 (2.5167)	Entropy 0.59835 (0.60011)	Top-1 acc 64.453 (63.292)	Top-5 acc 85.156 (83.607)	lr 0.00755
Train [76][1770/3239]	Time 0.219 (1.075)	Data Time 0.002 (0.587)	Loss 2.5324 (2.5166)	Entropy 0.59843 (0.60010)	Top-1 acc 63.672 (63.293)	Top-5 acc 82.422 (83.610)	lr 0.00755
Train [76][1780/3239]	Time 0.223 (1.074)	Data Time 0.001 (0.586)	Loss 2.4015 (2.5165)	Entropy 0.59849 (0.60009)	Top-1 acc 64.062 (63.292)	Top-5 acc 86.719 (83.615)	lr 0.00755
Train [76][1790/3239]	Time 0.269 (1.071)	Data Time 0.001 (0.584)	Loss 2.4774 (2.5165)	Entropy 0.59865 (0.60009)	Top-1 acc 62.109 (63.286)	Top-5 acc 84.375 (83.612)	lr 0.00755
Train [76][1800/3239]	Time 0.223 (1.076)	Data Time 0.001 (0.589)	Loss 2.4778 (2.5168)	Entropy 0.59889 (0.60008)	Top-1 acc 66.016 (63.279)	Top-5 acc 81.250 (83.605)	lr 0.00755
Train [76][1810/3239]	Time 0.277 (1.075)	Data Time 0.001 (0.589)	Loss 2.4251 (2.5167)	Entropy 0.59901 (0.60007)	Top-1 acc 66.797 (63.282)	Top-5 acc 86.328 (83.606)	lr 0.00755
Train [76][1820/3239]	Time 0.425 (1.072)	Data Time 0.002 (0.586)	Loss 2.4976 (2.5168)	Entropy 0.59914 (0.60007)	Top-1 acc 67.188 (63.285)	Top-5 acc 81.641 (83.605)	lr 0.00755
Train [76][1830/3239]	Time 13.958 (1.076)	Data Time 13.719 (0.590)	Loss 2.4492 (2.5166)	Entropy 0.59919 (0.60006)	Top-1 acc 64.062 (63.285)	Top-5 acc 86.328 (83.607)	lr 0.00755
Train [76][1840/3239]	Time 0.233 (1.078)	Data Time 0.001 (0.592)	Loss 2.6305 (2.5166)	Entropy 0.59895 (0.60006)	Top-1 acc 62.500 (63.289)	Top-5 acc 78.906 (83.606)	lr 0.00755
Train [76][1850/3239]	Time 0.235 (1.074)	Data Time 0.001 (0.589)	Loss 2.6989 (2.5172)	Entropy 0.59882 (0.60005)	Top-1 acc 61.328 (63.276)	Top-5 acc 79.688 (83.594)	lr 0.00754
Train [76][1860/3239]	Time 0.286 (1.071)	Data Time 0.002 (0.586)	Loss 2.3720 (2.5169)	Entropy 0.59884 (0.60004)	Top-1 acc 67.578 (63.283)	Top-5 acc 84.375 (83.596)	lr 0.00754
Train [76][1870/3239]	Time 0.238 (1.077)	Data Time 0.001 (0.592)	Loss 2.4239 (2.5170)	Entropy 0.59891 (0.60004)	Top-1 acc 65.625 (63.277)	Top-5 acc 87.109 (83.594)	lr 0.00754
Train [76][1880/3239]	Time 0.252 (1.074)	Data Time 0.001 (0.589)	Loss 2.6311 (2.5171)	Entropy 0.59906 (0.60003)	Top-1 acc 63.672 (63.276)	Top-5 acc 81.641 (83.589)	lr 0.00754
Train [76][1890/3239]	Time 0.264 (1.070)	Data Time 0.001 (0.586)	Loss 2.2914 (2.5166)	Entropy 0.59950 (0.60003)	Top-1 acc 69.922 (63.285)	Top-5 acc 86.719 (83.598)	lr 0.00754
Train [76][1900/3239]	Time 0.250 (1.072)	Data Time 0.001 (0.588)	Loss 2.5677 (2.5166)	Entropy 0.59931 (0.60002)	Top-1 acc 60.156 (63.286)	Top-5 acc 82.812 (83.601)	lr 0.00754
Train [76][1910/3239]	Time 0.371 (1.074)	Data Time 0.001 (0.590)	Loss 2.4273 (2.5167)	Entropy 0.59921 (0.60002)	Top-1 acc 65.625 (63.285)	Top-5 acc 83.594 (83.596)	lr 0.00754
Train [76][1920/3239]	Time 0.246 (1.070)	Data Time 0.002 (0.587)	Loss 2.3983 (2.5167)	Entropy 0.59942 (0.60002)	Top-1 acc 69.141 (63.283)	Top-5 acc 85.156 (83.595)	lr 0.00754
Train [76][1930/3239]	Time 0.250 (1.072)	Data Time 0.002 (0.589)	Loss 2.6456 (2.5169)	Entropy 0.59978 (0.60001)	Top-1 acc 57.812 (63.284)	Top-5 acc 82.812 (83.593)	lr 0.00754
Train [76][1940/3239]	Time 0.395 (1.101)	Data Time 0.006 (0.591)	Loss 2.7516 (2.5172)	Entropy 0.59961 (0.60001)	Top-1 acc 57.422 (63.279)	Top-5 acc 77.734 (83.585)	lr 0.00754
Train [76][1950/3239]	Time 0.237 (1.098)	Data Time 0.002 (0.588)	Loss 2.6667 (2.5174)	Entropy 0.59969 (0.60001)	Top-1 acc 60.156 (63.276)	Top-5 acc 79.297 (83.580)	lr 0.00754
Train [76][1960/3239]	Time 0.242 (1.094)	Data Time 0.002 (0.585)	Loss 2.3698 (2.5172)	Entropy 0.59955 (0.60001)	Top-1 acc 69.141 (63.285)	Top-5 acc 87.891 (83.585)	lr 0.00753
Train [76][1970/3239]	Time 0.236 (1.091)	Data Time 0.001 (0.582)	Loss 2.5596 (2.5171)	Entropy 0.59938 (0.60001)	Top-1 acc 66.016 (63.287)	Top-5 acc 80.078 (83.587)	lr 0.00753
Train [76][1980/3239]	Time 0.368 (1.088)	Data Time 0.002 (0.579)	Loss 2.6272 (2.5171)	Entropy 0.59928 (0.60000)	Top-1 acc 63.672 (63.288)	Top-5 acc 81.641 (83.585)	lr 0.00753
Train [76][1990/3239]	Time 0.236 (1.084)	Data Time 0.001 (0.576)	Loss 2.6252 (2.5171)	Entropy 0.59940 (0.60000)	Top-1 acc 54.688 (63.280)	Top-5 acc 79.688 (83.584)	lr 0.00753
Train [76][2000/3239]	Time 0.225 (1.081)	Data Time 0.001 (0.574)	Loss 2.5004 (2.5171)	Entropy 0.59930 (0.60000)	Top-1 acc 65.625 (63.282)	Top-5 acc 83.203 (83.584)	lr 0.00753
Train [76][2010/3239]	Time 0.231 (1.082)	Data Time 0.002 (0.575)	Loss 2.3758 (2.5172)	Entropy 0.59949 (0.59999)	Top-1 acc 66.406 (63.279)	Top-5 acc 84.375 (83.581)	lr 0.00753
Train [76][2020/3239]	Time 0.243 (1.079)	Data Time 0.001 (0.572)	Loss 2.6335 (2.5171)	Entropy 0.59938 (0.59999)	Top-1 acc 61.719 (63.280)	Top-5 acc 80.469 (83.579)	lr 0.00753
Train [76][2030/3239]	Time 0.235 (1.076)	Data Time 0.001 (0.570)	Loss 2.5048 (2.5169)	Entropy 0.59945 (0.59999)	Top-1 acc 63.281 (63.286)	Top-5 acc 83.594 (83.583)	lr 0.00753
Train [76][2040/3239]	Time 0.277 (1.081)	Data Time 0.002 (0.576)	Loss 2.9105 (2.5173)	Entropy 0.59967 (0.59998)	Top-1 acc 51.953 (63.276)	Top-5 acc 78.125 (83.574)	lr 0.00753
Train [76][2050/3239]	Time 0.245 (1.079)	Data Time 0.001 (0.573)	Loss 2.4257 (2.5173)	Entropy 0.59956 (0.59998)	Top-1 acc 64.844 (63.275)	Top-5 acc 84.375 (83.575)	lr 0.00753
Train [76][2060/3239]	Time 0.530 (1.076)	Data Time 0.298 (0.570)	Loss 2.4955 (2.5175)	Entropy 0.59974 (0.59998)	Top-1 acc 62.500 (63.271)	Top-5 acc 83.984 (83.570)	lr 0.00752
Train [76][2070/3239]	Time 0.564 (1.080)	Data Time 0.173 (0.575)	Loss 2.5839 (2.5178)	Entropy 0.59974 (0.59998)	Top-1 acc 58.203 (63.263)	Top-5 acc 83.984 (83.565)	lr 0.00752
Train [76][2080/3239]	Time 0.227 (1.079)	Data Time 0.001 (0.574)	Loss 2.7927 (2.5178)	Entropy 0.59992 (0.59998)	Top-1 acc 59.375 (63.262)	Top-5 acc 78.516 (83.562)	lr 0.00752
Train [76][2090/3239]	Time 0.244 (1.077)	Data Time 0.001 (0.572)	Loss 2.5153 (2.5176)	Entropy 0.59979 (0.59998)	Top-1 acc 60.938 (63.270)	Top-5 acc 82.422 (83.564)	lr 0.00752
Train [76][2100/3239]	Time 8.250 (1.079)	Data Time 7.959 (0.575)	Loss 2.6950 (2.5178)	Entropy 0.59981 (0.59998)	Top-1 acc 60.938 (63.265)	Top-5 acc 81.250 (83.559)	lr 0.00752
Train [76][2110/3239]	Time 0.268 (1.080)	Data Time 0.003 (0.575)	Loss 2.6070 (2.5183)	Entropy 0.59908 (0.59998)	Top-1 acc 60.156 (63.256)	Top-5 acc 77.344 (83.549)	lr 0.00752
Train [76][2120/3239]	Time 0.239 (1.077)	Data Time 0.001 (0.573)	Loss 2.4083 (2.5184)	Entropy 0.59917 (0.59997)	Top-1 acc 64.453 (63.251)	Top-5 acc 86.719 (83.548)	lr 0.00752
Train [76][2130/3239]	Time 4.178 (1.078)	Data Time 3.945 (0.574)	Loss 2.5052 (2.5182)	Entropy 0.59914 (0.59997)	Top-1 acc 64.453 (63.258)	Top-5 acc 84.375 (83.554)	lr 0.00752
Train [76][2140/3239]	Time 0.500 (1.080)	Data Time 0.127 (0.577)	Loss 2.5426 (2.5183)	Entropy 0.59913 (0.59997)	Top-1 acc 62.500 (63.260)	Top-5 acc 84.375 (83.552)	lr 0.00752
Train [76][2150/3239]	Time 0.221 (1.078)	Data Time 0.001 (0.575)	Loss 2.4017 (2.5182)	Entropy 0.59909 (0.59996)	Top-1 acc 67.578 (63.263)	Top-5 acc 86.328 (83.553)	lr 0.00752
Train [76][2160/3239]	Time 1.194 (1.076)	Data Time 0.942 (0.574)	Loss 2.3041 (2.5178)	Entropy 0.59908 (0.59996)	Top-1 acc 71.094 (63.269)	Top-5 acc 89.844 (83.562)	lr 0.00752
Train [76][2170/3239]	Time 0.235 (1.081)	Data Time 0.001 (0.578)	Loss 2.3096 (2.5177)	Entropy 0.59909 (0.59995)	Top-1 acc 69.141 (63.269)	Top-5 acc 87.500 (83.562)	lr 0.00751
Train [76][2180/3239]	Time 0.261 (1.080)	Data Time 0.001 (0.578)	Loss 2.3622 (2.5176)	Entropy 0.59897 (0.59995)	Top-1 acc 66.797 (63.268)	Top-5 acc 89.062 (83.563)	lr 0.00751
Train [76][2190/3239]	Time 0.843 (1.077)	Data Time 0.609 (0.576)	Loss 2.3991 (2.5173)	Entropy 0.59903 (0.59995)	Top-1 acc 64.844 (63.274)	Top-5 acc 84.375 (83.566)	lr 0.00751
Train [76][2200/3239]	Time 0.286 (1.080)	Data Time 0.001 (0.579)	Loss 2.6462 (2.5174)	Entropy 0.59904 (0.59994)	Top-1 acc 58.203 (63.271)	Top-5 acc 82.812 (83.567)	lr 0.00751
Train [76][2210/3239]	Time 0.233 (1.077)	Data Time 0.001 (0.576)	Loss 2.5999 (2.5174)	Entropy 0.59895 (0.59994)	Top-1 acc 63.672 (63.271)	Top-5 acc 82.031 (83.570)	lr 0.00751
Train [76][2220/3239]	Time 0.243 (1.074)	Data Time 0.001 (0.574)	Loss 2.3942 (2.5173)	Entropy 0.59890 (0.59993)	Top-1 acc 67.188 (63.275)	Top-5 acc 84.375 (83.572)	lr 0.00751
Train [76][2230/3239]	Time 0.339 (1.074)	Data Time 0.001 (0.574)	Loss 2.5969 (2.5174)	Entropy 0.59871 (0.59993)	Top-1 acc 60.156 (63.272)	Top-5 acc 81.641 (83.569)	lr 0.00751
Train [76][2240/3239]	Time 0.274 (1.073)	Data Time 0.001 (0.573)	Loss 2.5126 (2.5173)	Entropy 0.59891 (0.59992)	Top-1 acc 64.844 (63.274)	Top-5 acc 84.375 (83.570)	lr 0.00751
Train [76][2250/3239]	Time 0.232 (1.070)	Data Time 0.001 (0.570)	Loss 2.4833 (2.5173)	Entropy 0.59909 (0.59992)	Top-1 acc 63.281 (63.270)	Top-5 acc 81.641 (83.569)	lr 0.00751
Train [76][2260/3239]	Time 0.229 (1.067)	Data Time 0.002 (0.568)	Loss 2.6766 (2.5172)	Entropy 0.59919 (0.59991)	Top-1 acc 60.156 (63.272)	Top-5 acc 81.250 (83.565)	lr 0.00751
Train [76][2270/3239]	Time 0.243 (1.069)	Data Time 0.001 (0.571)	Loss 2.5095 (2.5174)	Entropy 0.59941 (0.59991)	Top-1 acc 61.328 (63.265)	Top-5 acc 83.203 (83.559)	lr 0.00751
Train [76][2280/3239]	Time 0.274 (1.067)	Data Time 0.001 (0.568)	Loss 2.6540 (2.5172)	Entropy 0.59970 (0.59991)	Top-1 acc 58.984 (63.266)	Top-5 acc 82.422 (83.563)	lr 0.00750
Train [76][2290/3239]	Time 7.648 (1.067)	Data Time 7.368 (0.569)	Loss 2.7112 (2.5176)	Entropy 0.59990 (0.59991)	Top-1 acc 59.375 (63.258)	Top-5 acc 77.734 (83.557)	lr 0.00750
Train [76][2300/3239]	Time 0.322 (1.068)	Data Time 0.001 (0.571)	Loss 2.6312 (2.5176)	Entropy 0.59968 (0.59991)	Top-1 acc 61.719 (63.260)	Top-5 acc 82.812 (83.558)	lr 0.00750
Train [76][2310/3239]	Time 0.222 (1.066)	Data Time 0.001 (0.568)	Loss 2.7553 (2.5179)	Entropy 0.59988 (0.59991)	Top-1 acc 58.203 (63.254)	Top-5 acc 79.688 (83.552)	lr 0.00750
Train [76][2320/3239]	Time 0.236 (1.065)	Data Time 0.001 (0.568)	Loss 2.5265 (2.5179)	Entropy 0.59945 (0.59991)	Top-1 acc 62.500 (63.254)	Top-5 acc 83.203 (83.550)	lr 0.00750
Train [76][2330/3239]	Time 0.233 (1.069)	Data Time 0.001 (0.573)	Loss 2.5634 (2.5178)	Entropy 0.59923 (0.59991)	Top-1 acc 62.109 (63.257)	Top-5 acc 82.031 (83.551)	lr 0.00750
Train [76][2340/3239]	Time 1.728 (1.068)	Data Time 1.494 (0.572)	Loss 2.3825 (2.5177)	Entropy 0.59932 (0.59990)	Top-1 acc 65.234 (63.256)	Top-5 acc 83.594 (83.549)	lr 0.00750
Train [76][2350/3239]	Time 0.228 (1.067)	Data Time 0.001 (0.572)	Loss 2.6122 (2.5177)	Entropy 0.59921 (0.59990)	Top-1 acc 62.500 (63.257)	Top-5 acc 80.859 (83.548)	lr 0.00750
Train [76][2360/3239]	Time 0.231 (1.071)	Data Time 0.001 (0.575)	Loss 2.4907 (2.5179)	Entropy 0.59926 (0.59990)	Top-1 acc 62.109 (63.254)	Top-5 acc 84.375 (83.548)	lr 0.00750
Train [76][2370/3239]	Time 0.238 (1.068)	Data Time 0.001 (0.573)	Loss 2.3232 (2.5178)	Entropy 0.59927 (0.59990)	Top-1 acc 68.359 (63.257)	Top-5 acc 85.547 (83.548)	lr 0.00750
Train [76][2380/3239]	Time 5.356 (1.068)	Data Time 5.122 (0.573)	Loss 2.4690 (2.5177)	Entropy 0.59907 (0.59989)	Top-1 acc 66.406 (63.257)	Top-5 acc 82.031 (83.549)	lr 0.00750
Train [76][2390/3239]	Time 0.273 (1.068)	Data Time 0.001 (0.574)	Loss 2.5083 (2.5177)	Entropy 0.59878 (0.59989)	Top-1 acc 58.594 (63.254)	Top-5 acc 85.547 (83.550)	lr 0.00749
Train [76][2400/3239]	Time 0.233 (1.068)	Data Time 0.001 (0.574)	Loss 2.3765 (2.5177)	Entropy 0.59868 (0.59988)	Top-1 acc 65.234 (63.252)	Top-5 acc 84.375 (83.551)	lr 0.00749
Train [76][2410/3239]	Time 0.230 (1.066)	Data Time 0.001 (0.572)	Loss 2.5221 (2.5177)	Entropy 0.59871 (0.59988)	Top-1 acc 66.797 (63.252)	Top-5 acc 82.812 (83.550)	lr 0.00749
Train [76][2420/3239]	Time 0.473 (1.065)	Data Time 0.242 (0.572)	Loss 2.4862 (2.5178)	Entropy 0.59887 (0.59987)	Top-1 acc 64.844 (63.253)	Top-5 acc 84.766 (83.550)	lr 0.00749
Train [76][2430/3239]	Time 0.237 (1.063)	Data Time 0.001 (0.570)	Loss 2.5185 (2.5178)	Entropy 0.59905 (0.59987)	Top-1 acc 64.453 (63.248)	Top-5 acc 83.594 (83.553)	lr 0.00749
Train [76][2440/3239]	Time 0.233 (1.062)	Data Time 0.001 (0.569)	Loss 2.4518 (2.5177)	Entropy 0.59875 (0.59987)	Top-1 acc 69.141 (63.251)	Top-5 acc 83.594 (83.554)	lr 0.00749
Train [76][2450/3239]	Time 0.221 (1.060)	Data Time 0.001 (0.568)	Loss 2.5576 (2.5178)	Entropy 0.59883 (0.59986)	Top-1 acc 60.938 (63.248)	Top-5 acc 85.156 (83.553)	lr 0.00749
Train [76][2460/3239]	Time 0.359 (1.059)	Data Time 0.001 (0.567)	Loss 2.5832 (2.5179)	Entropy 0.59892 (0.59986)	Top-1 acc 58.594 (63.241)	Top-5 acc 81.250 (83.554)	lr 0.00749
Train [76][2470/3239]	Time 0.265 (1.057)	Data Time 0.002 (0.565)	Loss 2.6420 (2.5180)	Entropy 0.59885 (0.59985)	Top-1 acc 58.594 (63.239)	Top-5 acc 82.422 (83.550)	lr 0.00749
Train [76][2480/3239]	Time 0.226 (1.055)	Data Time 0.001 (0.564)	Loss 2.3426 (2.5179)	Entropy 0.59908 (0.59985)	Top-1 acc 68.750 (63.240)	Top-5 acc 86.328 (83.552)	lr 0.00749
Train [76][2490/3239]	Time 0.229 (1.054)	Data Time 0.001 (0.563)	Loss 2.4589 (2.5180)	Entropy 0.59936 (0.59985)	Top-1 acc 66.797 (63.241)	Top-5 acc 82.422 (83.554)	lr 0.00749
Train [76][2500/3239]	Time 0.337 (1.052)	Data Time 0.001 (0.561)	Loss 2.5184 (2.5179)	Entropy 0.59945 (0.59985)	Top-1 acc 66.406 (63.238)	Top-5 acc 81.641 (83.554)	lr 0.00748
Train [76][2510/3239]	Time 0.221 (1.050)	Data Time 0.001 (0.560)	Loss 2.7386 (2.5179)	Entropy 0.59936 (0.59984)	Top-1 acc 57.812 (63.242)	Top-5 acc 78.906 (83.553)	lr 0.00748
Train [76][2520/3239]	Time 0.225 (1.051)	Data Time 0.001 (0.561)	Loss 2.6730 (2.5183)	Entropy 0.59945 (0.59984)	Top-1 acc 60.156 (63.228)	Top-5 acc 82.422 (83.544)	lr 0.00748
Train [76][2530/3239]	Time 0.350 (1.048)	Data Time 0.002 (0.558)	Loss 2.6896 (2.5185)	Entropy 0.59967 (0.59984)	Top-1 acc 55.078 (63.224)	Top-5 acc 81.641 (83.540)	lr 0.00748
Train [76][2540/3239]	Time 0.237 (1.046)	Data Time 0.001 (0.556)	Loss 2.4963 (2.5184)	Entropy 0.59983 (0.59984)	Top-1 acc 67.969 (63.230)	Top-5 acc 83.594 (83.538)	lr 0.00748
Train [76][2550/3239]	Time 0.232 (1.046)	Data Time 0.001 (0.557)	Loss 2.5938 (2.5185)	Entropy 0.59971 (0.59984)	Top-1 acc 63.281 (63.229)	Top-5 acc 82.812 (83.537)	lr 0.00748
Train [76][2560/3239]	Time 0.240 (1.044)	Data Time 0.001 (0.555)	Loss 2.3967 (2.5184)	Entropy 0.59962 (0.59984)	Top-1 acc 70.703 (63.234)	Top-5 acc 83.594 (83.537)	lr 0.00748
Train [76][2570/3239]	Time 0.257 (1.042)	Data Time 0.001 (0.553)	Loss 2.5281 (2.5184)	Entropy 0.59950 (0.59984)	Top-1 acc 61.719 (63.236)	Top-5 acc 84.375 (83.535)	lr 0.00748
Train [76][2580/3239]	Time 0.252 (1.044)	Data Time 0.001 (0.555)	Loss 2.4334 (2.5181)	Entropy 0.59896 (0.59984)	Top-1 acc 64.062 (63.242)	Top-5 acc 82.812 (83.541)	lr 0.00748
Train [76][2590/3239]	Time 0.243 (1.044)	Data Time 0.001 (0.556)	Loss 2.6335 (2.5185)	Entropy 0.59893 (0.59983)	Top-1 acc 63.281 (63.234)	Top-5 acc 82.422 (83.538)	lr 0.00748
Train [76][2600/3239]	Time 0.343 (1.064)	Data Time 0.004 (0.554)	Loss 2.6133 (2.5184)	Entropy 0.59874 (0.59983)	Top-1 acc 62.109 (63.235)	Top-5 acc 82.812 (83.538)	lr 0.00747
Train [76][2610/3239]	Time 0.244 (1.061)	Data Time 0.002 (0.552)	Loss 2.6277 (2.5185)	Entropy 0.59862 (0.59982)	Top-1 acc 59.766 (63.237)	Top-5 acc 85.547 (83.537)	lr 0.00747
Train [76][2620/3239]	Time 0.336 (1.059)	Data Time 0.002 (0.550)	Loss 2.5809 (2.5183)	Entropy 0.59897 (0.59982)	Top-1 acc 60.156 (63.243)	Top-5 acc 82.031 (83.540)	lr 0.00747
Train [76][2630/3239]	Time 0.239 (1.056)	Data Time 0.001 (0.548)	Loss 2.4575 (2.5182)	Entropy 0.59907 (0.59982)	Top-1 acc 65.234 (63.246)	Top-5 acc 84.375 (83.539)	lr 0.00747
Train [76][2640/3239]	Time 0.238 (1.054)	Data Time 0.001 (0.546)	Loss 2.8012 (2.5183)	Entropy 0.59925 (0.59982)	Top-1 acc 58.203 (63.243)	Top-5 acc 76.953 (83.534)	lr 0.00747
Train [76][2650/3239]	Time 0.256 (1.052)	Data Time 0.002 (0.544)	Loss 2.4307 (2.5182)	Entropy 0.59927 (0.59981)	Top-1 acc 65.625 (63.247)	Top-5 acc 85.156 (83.536)	lr 0.00747
Train [76][2660/3239]	Time 1.447 (1.050)	Data Time 1.191 (0.543)	Loss 2.4916 (2.5180)	Entropy 0.59928 (0.59981)	Top-1 acc 65.234 (63.252)	Top-5 acc 82.812 (83.538)	lr 0.00747
Train [76][2670/3239]	Time 0.247 (1.050)	Data Time 0.001 (0.542)	Loss 2.6020 (2.5179)	Entropy 0.59959 (0.59981)	Top-1 acc 60.938 (63.252)	Top-5 acc 82.812 (83.541)	lr 0.00747
Train [76][2680/3239]	Time 0.253 (1.048)	Data Time 0.001 (0.541)	Loss 2.6472 (2.5180)	Entropy 0.59969 (0.59981)	Top-1 acc 62.500 (63.252)	Top-5 acc 79.688 (83.540)	lr 0.00747
Train [76][2690/3239]	Time 0.373 (1.047)	Data Time 0.001 (0.540)	Loss 2.4541 (2.5180)	Entropy 0.59986 (0.59981)	Top-1 acc 63.672 (63.255)	Top-5 acc 84.766 (83.540)	lr 0.00747
Train [76][2700/3239]	Time 0.238 (1.051)	Data Time 0.001 (0.545)	Loss 2.5981 (2.5177)	Entropy 0.59990 (0.59981)	Top-1 acc 62.500 (63.263)	Top-5 acc 82.031 (83.542)	lr 0.00747
Train [76][2710/3239]	Time 0.232 (1.050)	Data Time 0.001 (0.544)	Loss 2.6532 (2.5177)	Entropy 0.59990 (0.59981)	Top-1 acc 60.547 (63.267)	Top-5 acc 80.078 (83.540)	lr 0.00746
Train [76][2720/3239]	Time 0.230 (1.048)	Data Time 0.001 (0.542)	Loss 2.4584 (2.5177)	Entropy 0.59985 (0.59981)	Top-1 acc 65.234 (63.266)	Top-5 acc 84.766 (83.542)	lr 0.00746
Train [76][2730/3239]	Time 0.772 (1.051)	Data Time 0.503 (0.546)	Loss 2.4303 (2.5178)	Entropy 0.60006 (0.59981)	Top-1 acc 63.672 (63.261)	Top-5 acc 85.547 (83.540)	lr 0.00746
Train [76][2740/3239]	Time 0.237 (1.050)	Data Time 0.001 (0.545)	Loss 2.5220 (2.5178)	Entropy 0.59976 (0.59981)	Top-1 acc 62.891 (63.261)	Top-5 acc 82.422 (83.537)	lr 0.00746
Train [76][2750/3239]	Time 0.242 (1.050)	Data Time 0.001 (0.545)	Loss 2.6437 (2.5179)	Entropy 0.60005 (0.59981)	Top-1 acc 60.938 (63.258)	Top-5 acc 82.422 (83.534)	lr 0.00746
Train [76][2760/3239]	Time 0.261 (1.052)	Data Time 0.027 (0.547)	Loss 2.9960 (2.5179)	Entropy 0.60018 (0.59981)	Top-1 acc 54.297 (63.255)	Top-5 acc 75.000 (83.532)	lr 0.00746
Train [76][2770/3239]	Time 0.227 (1.051)	Data Time 0.001 (0.547)	Loss 2.6661 (2.5179)	Entropy 0.60015 (0.59981)	Top-1 acc 57.422 (63.253)	Top-5 acc 80.078 (83.530)	lr 0.00746
Train [76][2780/3239]	Time 5.353 (1.051)	Data Time 4.966 (0.547)	Loss 2.7074 (2.5181)	Entropy 0.60027 (0.59981)	Top-1 acc 58.984 (63.250)	Top-5 acc 80.078 (83.526)	lr 0.00746
Train [76][2790/3239]	Time 0.242 (1.053)	Data Time 0.001 (0.549)	Loss 2.5170 (2.5182)	Entropy 0.60042 (0.59981)	Top-1 acc 65.625 (63.247)	Top-5 acc 82.812 (83.525)	lr 0.00746
Train [76][2800/3239]	Time 0.232 (1.053)	Data Time 0.001 (0.550)	Loss 2.5973 (2.5185)	Entropy 0.60073 (0.59982)	Top-1 acc 61.328 (63.242)	Top-5 acc 82.031 (83.521)	lr 0.00746
Train [76][2810/3239]	Time 0.231 (1.051)	Data Time 0.001 (0.548)	Loss 2.5375 (2.5185)	Entropy 0.60067 (0.59982)	Top-1 acc 62.109 (63.240)	Top-5 acc 84.766 (83.520)	lr 0.00746
Train [76][2820/3239]	Time 0.247 (1.054)	Data Time 0.001 (0.551)	Loss 2.6316 (2.5187)	Entropy 0.60035 (0.59982)	Top-1 acc 62.500 (63.235)	Top-5 acc 82.422 (83.518)	lr 0.00745
Train [76][2830/3239]	Time 0.292 (1.054)	Data Time 0.042 (0.551)	Loss 2.4250 (2.5185)	Entropy 0.60058 (0.59982)	Top-1 acc 63.672 (63.239)	Top-5 acc 83.984 (83.521)	lr 0.00745
Train [76][2840/3239]	Time 0.239 (1.052)	Data Time 0.001 (0.550)	Loss 2.5735 (2.5183)	Entropy 0.60076 (0.59983)	Top-1 acc 60.156 (63.240)	Top-5 acc 81.641 (83.522)	lr 0.00745
Train [76][2850/3239]	Time 0.346 (1.050)	Data Time 0.001 (0.548)	Loss 2.3651 (2.5182)	Entropy 0.60048 (0.59983)	Top-1 acc 69.141 (63.246)	Top-5 acc 85.547 (83.523)	lr 0.00745
Train [76][2860/3239]	Time 0.233 (1.055)	Data Time 0.001 (0.553)	Loss 2.4781 (2.5182)	Entropy 0.60065 (0.59983)	Top-1 acc 64.453 (63.248)	Top-5 acc 85.547 (83.524)	lr 0.00745
Train [76][2870/3239]	Time 0.232 (1.053)	Data Time 0.001 (0.552)	Loss 2.6066 (2.5183)	Entropy 0.60058 (0.59984)	Top-1 acc 61.719 (63.248)	Top-5 acc 81.641 (83.520)	lr 0.00745
Train [76][2880/3239]	Time 0.226 (1.051)	Data Time 0.001 (0.550)	Loss 2.6345 (2.5183)	Entropy 0.60042 (0.59984)	Top-1 acc 64.062 (63.248)	Top-5 acc 80.469 (83.519)	lr 0.00745
Train [76][2890/3239]	Time 0.600 (1.055)	Data Time 0.361 (0.554)	Loss 2.6616 (2.5182)	Entropy 0.60037 (0.59984)	Top-1 acc 59.375 (63.249)	Top-5 acc 81.250 (83.520)	lr 0.00745
Train [76][2900/3239]	Time 0.235 (1.054)	Data Time 0.001 (0.553)	Loss 2.5097 (2.5185)	Entropy 0.60040 (0.59984)	Top-1 acc 64.062 (63.243)	Top-5 acc 83.984 (83.517)	lr 0.00745
Train [76][2910/3239]	Time 0.262 (1.053)	Data Time 0.001 (0.553)	Loss 2.3733 (2.5184)	Entropy 0.60049 (0.59984)	Top-1 acc 66.016 (63.247)	Top-5 acc 86.328 (83.518)	lr 0.00745
Train [76][2920/3239]	Time 0.238 (1.056)	Data Time 0.001 (0.556)	Loss 2.3832 (2.5184)	Entropy 0.60045 (0.59985)	Top-1 acc 68.359 (63.250)	Top-5 acc 88.281 (83.521)	lr 0.00745
Train [76][2930/3239]	Time 0.232 (1.055)	Data Time 0.001 (0.555)	Loss 2.4961 (2.5184)	Entropy 0.60041 (0.59985)	Top-1 acc 64.062 (63.247)	Top-5 acc 82.812 (83.517)	lr 0.00744
Train [76][2940/3239]	Time 3.424 (1.054)	Data Time 3.146 (0.554)	Loss 2.5136 (2.5185)	Entropy 0.60047 (0.59985)	Top-1 acc 61.719 (63.245)	Top-5 acc 84.766 (83.515)	lr 0.00744
Train [76][2950/3239]	Time 0.235 (1.055)	Data Time 0.001 (0.556)	Loss 2.3901 (2.5184)	Entropy 0.60075 (0.59985)	Top-1 acc 67.969 (63.247)	Top-5 acc 85.547 (83.517)	lr 0.00744
Train [76][2960/3239]	Time 0.250 (1.056)	Data Time 0.001 (0.557)	Loss 2.6392 (2.5184)	Entropy 0.60063 (0.59986)	Top-1 acc 60.547 (63.245)	Top-5 acc 80.078 (83.517)	lr 0.00744
Train [76][2970/3239]	Time 0.232 (1.054)	Data Time 0.001 (0.555)	Loss 2.5218 (2.5184)	Entropy 0.60035 (0.59986)	Top-1 acc 65.234 (63.243)	Top-5 acc 82.812 (83.518)	lr 0.00744
Train [76][2980/3239]	Time 0.245 (1.057)	Data Time 0.001 (0.558)	Loss 2.4651 (2.5184)	Entropy 0.60080 (0.59986)	Top-1 acc 64.844 (63.244)	Top-5 acc 82.812 (83.520)	lr 0.00744
Train [76][2990/3239]	Time 0.236 (1.056)	Data Time 0.001 (0.558)	Loss 2.4637 (2.5184)	Entropy 0.60096 (0.59986)	Top-1 acc 63.281 (63.247)	Top-5 acc 83.594 (83.520)	lr 0.00744
Train [76][3000/3239]	Time 0.224 (1.054)	Data Time 0.001 (0.556)	Loss 2.6515 (2.5186)	Entropy 0.60111 (0.59987)	Top-1 acc 56.641 (63.242)	Top-5 acc 80.469 (83.518)	lr 0.00744
Train [76][3010/3239]	Time 0.440 (1.052)	Data Time 0.001 (0.554)	Loss 2.4156 (2.5185)	Entropy 0.60134 (0.59987)	Top-1 acc 63.672 (63.247)	Top-5 acc 84.375 (83.518)	lr 0.00744
Train [76][3020/3239]	Time 0.234 (1.056)	Data Time 0.001 (0.558)	Loss 2.7428 (2.5188)	Entropy 0.60136 (0.59988)	Top-1 acc 61.328 (63.243)	Top-5 acc 79.297 (83.514)	lr 0.00744
Train [76][3030/3239]	Time 0.246 (1.055)	Data Time 0.001 (0.558)	Loss 2.2738 (2.5189)	Entropy 0.60133 (0.59988)	Top-1 acc 69.922 (63.240)	Top-5 acc 87.891 (83.515)	lr 0.00744
Train [76][3040/3239]	Time 0.266 (1.053)	Data Time 0.001 (0.556)	Loss 2.4768 (2.5189)	Entropy 0.60100 (0.59989)	Top-1 acc 64.453 (63.241)	Top-5 acc 84.766 (83.514)	lr 0.00743
Train [76][3050/3239]	Time 1.859 (1.058)	Data Time 1.604 (0.561)	Loss 2.5741 (2.5190)	Entropy 0.60081 (0.59989)	Top-1 acc 61.719 (63.239)	Top-5 acc 82.031 (83.512)	lr 0.00743
Train [76][3060/3239]	Time 1.418 (1.056)	Data Time 1.165 (0.560)	Loss 2.5456 (2.5190)	Entropy 0.60099 (0.59989)	Top-1 acc 62.891 (63.234)	Top-5 acc 82.031 (83.516)	lr 0.00743
Train [76][3070/3239]	Time 0.243 (1.054)	Data Time 0.002 (0.558)	Loss 2.3819 (2.5190)	Entropy 0.60124 (0.59990)	Top-1 acc 67.969 (63.233)	Top-5 acc 86.328 (83.518)	lr 0.00743
Train [76][3080/3239]	Time 0.341 (1.058)	Data Time 0.001 (0.562)	Loss 2.4508 (2.5190)	Entropy 0.60121 (0.59990)	Top-1 acc 64.453 (63.230)	Top-5 acc 80.078 (83.516)	lr 0.00743
Train [76][3090/3239]	Time 0.268 (1.057)	Data Time 0.001 (0.561)	Loss 2.4899 (2.5191)	Entropy 0.60148 (0.59991)	Top-1 acc 67.578 (63.227)	Top-5 acc 81.641 (83.512)	lr 0.00743
Train [76][3100/3239]	Time 0.263 (1.056)	Data Time 0.001 (0.560)	Loss 2.5288 (2.5193)	Entropy 0.60151 (0.59991)	Top-1 acc 63.672 (63.221)	Top-5 acc 81.641 (83.511)	lr 0.00743
Train [76][3110/3239]	Time 0.252 (1.058)	Data Time 0.002 (0.562)	Loss 2.4771 (2.5192)	Entropy 0.60155 (0.59992)	Top-1 acc 64.062 (63.224)	Top-5 acc 83.594 (83.512)	lr 0.00743
Train [76][3120/3239]	Time 0.238 (1.058)	Data Time 0.001 (0.563)	Loss 2.6099 (2.5193)	Entropy 0.60148 (0.59992)	Top-1 acc 61.328 (63.221)	Top-5 acc 82.031 (83.512)	lr 0.00743
Train [76][3130/3239]	Time 0.235 (1.058)	Data Time 0.001 (0.562)	Loss 2.5735 (2.5191)	Entropy 0.60168 (0.59993)	Top-1 acc 64.062 (63.224)	Top-5 acc 82.031 (83.517)	lr 0.00743
Train [76][3140/3239]	Time 0.234 (1.059)	Data Time 0.001 (0.564)	Loss 2.6987 (2.5194)	Entropy 0.60156 (0.59993)	Top-1 acc 57.031 (63.214)	Top-5 acc 79.688 (83.511)	lr 0.00743
Train [76][3150/3239]	Time 0.251 (1.059)	Data Time 0.001 (0.564)	Loss 2.5543 (2.5197)	Entropy 0.60112 (0.59994)	Top-1 acc 62.109 (63.209)	Top-5 acc 82.422 (83.508)	lr 0.00742
Train [76][3160/3239]	Time 0.228 (1.058)	Data Time 0.001 (0.564)	Loss 2.4753 (2.5200)	Entropy 0.60092 (0.59994)	Top-1 acc 61.328 (63.204)	Top-5 acc 84.766 (83.503)	lr 0.00742
Train [76][3170/3239]	Time 0.342 (1.057)	Data Time 0.001 (0.562)	Loss 2.5435 (2.5200)	Entropy 0.60074 (0.59994)	Top-1 acc 65.234 (63.205)	Top-5 acc 83.984 (83.502)	lr 0.00742
Train [76][3180/3239]	Time 0.233 (1.060)	Data Time 0.000 (0.566)	Loss 2.5686 (2.5199)	Entropy 0.60083 (0.59995)	Top-1 acc 62.109 (63.205)	Top-5 acc 82.812 (83.503)	lr 0.00742
Train [76][3190/3239]	Time 0.238 (1.059)	Data Time 0.000 (0.566)	Loss 2.4936 (2.5203)	Entropy 0.60107 (0.59995)	Top-1 acc 65.625 (63.196)	Top-5 acc 83.984 (83.496)	lr 0.00742
Train [76][3200/3239]	Time 0.234 (1.058)	Data Time 0.000 (0.565)	Loss 2.4644 (2.5202)	Entropy 0.60115 (0.59995)	Top-1 acc 64.453 (63.196)	Top-5 acc 83.594 (83.497)	lr 0.00742
Train [76][3210/3239]	Time 0.259 (1.060)	Data Time 0.000 (0.566)	Loss 2.4387 (2.5201)	Entropy 0.60117 (0.59996)	Top-1 acc 64.062 (63.200)	Top-5 acc 83.203 (83.497)	lr 0.00742
Train [76][3220/3239]	Time 0.256 (1.059)	Data Time 0.000 (0.565)	Loss 2.5150 (2.5202)	Entropy 0.60085 (0.59996)	Top-1 acc 64.844 (63.196)	Top-5 acc 83.203 (83.493)	lr 0.00742
Train [76][3230/3239]	Time 0.243 (1.058)	Data Time 0.000 (0.565)	Loss 2.4830 (2.5201)	Entropy 0.60085 (0.59996)	Top-1 acc 64.453 (63.196)	Top-5 acc 85.156 (83.495)	lr 0.00742
Train [76][3239/3239]	Time 0.824 (1.057)	Data Time 0.000 (0.564)	Loss 2.7079 (2.5200)	Entropy 0.60093 (0.59997)	Top-1 acc 60.494 (63.198)	Top-5 acc 76.543 (83.496)	lr 0.00742
==========Valid [76/120]	loss 1.324	top-1 acc 69.887 (69.887)	top-5 acc 88.792	Train top-1 63.198	top-5 83.496	Entropy 0.60093	Latency-None: 0.000ms	Flops: 539.00M
Train [77][0/3239]	Time 54.435 (54.435)	Data Time 52.917 (52.917)	Loss 2.3686 (2.3686)	Entropy 0.60113 (0.60113)	Top-1 acc 65.234 (65.234)	Top-5 acc 87.109 (87.109)	lr 0.00742
Train [77][10/3239]	Time 0.313 (10.701)	Data Time 0.004 (4.813)	Loss 2.3758 (2.4471)	Entropy 0.60110 (0.60114)	Top-1 acc 68.750 (66.016)	Top-5 acc 87.891 (84.908)	lr 0.00741
Train [77][20/3239]	Time 0.234 (5.813)	Data Time 0.002 (2.522)	Loss 2.4530 (2.4780)	Entropy 0.60093 (0.60107)	Top-1 acc 66.797 (64.937)	Top-5 acc 85.547 (84.561)	lr 0.00741
Train [77][30/3239]	Time 0.238 (4.074)	Data Time 0.002 (1.709)	Loss 2.2653 (2.4591)	Entropy 0.60112 (0.60102)	Top-1 acc 69.141 (65.171)	Top-5 acc 87.109 (84.677)	lr 0.00741
Train [77][40/3239]	Time 0.237 (3.181)	Data Time 0.002 (1.293)	Loss 2.4990 (2.4583)	Entropy 0.60161 (0.60109)	Top-1 acc 63.672 (65.196)	Top-5 acc 84.375 (84.642)	lr 0.00741
Train [77][50/3239]	Time 0.236 (2.638)	Data Time 0.001 (1.040)	Loss 2.2315 (2.4502)	Entropy 0.60183 (0.60119)	Top-1 acc 71.484 (65.288)	Top-5 acc 88.672 (84.766)	lr 0.00741
Train [77][60/3239]	Time 0.242 (2.275)	Data Time 0.001 (0.870)	Loss 2.5849 (2.4690)	Entropy 0.60175 (0.60128)	Top-1 acc 60.156 (64.568)	Top-5 acc 83.203 (84.471)	lr 0.00741
Train [77][70/3239]	Time 0.335 (2.015)	Data Time 0.001 (0.747)	Loss 2.6115 (2.4826)	Entropy 0.60185 (0.60134)	Top-1 acc 60.938 (64.129)	Top-5 acc 82.422 (84.270)	lr 0.00741
Train [77][80/3239]	Time 0.239 (1.819)	Data Time 0.001 (0.655)	Loss 2.5314 (2.4889)	Entropy 0.60152 (0.60139)	Top-1 acc 61.719 (63.874)	Top-5 acc 83.984 (84.129)	lr 0.00741
Train [77][90/3239]	Time 0.234 (1.667)	Data Time 0.001 (0.583)	Loss 2.6034 (2.4876)	Entropy 0.60129 (0.60140)	Top-1 acc 60.938 (63.895)	Top-5 acc 82.422 (84.195)	lr 0.00741
Train [77][100/3239]	Time 0.227 (1.544)	Data Time 0.001 (0.526)	Loss 2.3654 (2.4845)	Entropy 0.60006 (0.60134)	Top-1 acc 66.016 (63.811)	Top-5 acc 86.719 (84.259)	lr 0.00741
Train [77][110/3239]	Time 0.243 (1.469)	Data Time 0.001 (0.504)	Loss 2.3775 (2.4821)	Entropy 0.59995 (0.60121)	Top-1 acc 69.141 (63.865)	Top-5 acc 84.766 (84.273)	lr 0.00741
Train [77][120/3239]	Time 0.285 (1.395)	Data Time 0.003 (0.475)	Loss 2.4177 (2.4824)	Entropy 0.59984 (0.60111)	Top-1 acc 64.844 (63.866)	Top-5 acc 87.500 (84.252)	lr 0.00740
Train [77][130/3239]	Time 0.226 (1.324)	Data Time 0.001 (0.442)	Loss 2.6485 (2.4805)	Entropy 0.59984 (0.60101)	Top-1 acc 61.719 (63.919)	Top-5 acc 82.422 (84.300)	lr 0.00740
Train [77][140/3239]	Time 0.230 (1.311)	Data Time 0.001 (0.461)	Loss 2.5089 (2.4821)	Entropy 0.60012 (0.60093)	Top-1 acc 65.234 (63.921)	Top-5 acc 82.422 (84.253)	lr 0.00740
Train [77][150/3239]	Time 0.256 (1.259)	Data Time 0.001 (0.438)	Loss 2.7448 (2.4853)	Entropy 0.60011 (0.60088)	Top-1 acc 59.375 (63.900)	Top-5 acc 78.125 (84.215)	lr 0.00740
Train [77][160/3239]	Time 0.344 (1.213)	Data Time 0.001 (0.414)	Loss 2.4549 (2.4859)	Entropy 0.60008 (0.60083)	Top-1 acc 64.453 (63.876)	Top-5 acc 85.156 (84.217)	lr 0.00740
Train [77][170/3239]	Time 3.002 (1.202)	Data Time 2.752 (0.426)	Loss 2.4445 (2.4878)	Entropy 0.59975 (0.60078)	Top-1 acc 65.625 (63.829)	Top-5 acc 83.203 (84.183)	lr 0.00740
Train [77][180/3239]	Time 0.225 (1.169)	Data Time 0.001 (0.413)	Loss 2.5608 (2.4904)	Entropy 0.59989 (0.60073)	Top-1 acc 64.453 (63.834)	Top-5 acc 81.641 (84.118)	lr 0.00740
Train [77][190/3239]	Time 0.236 (1.145)	Data Time 0.001 (0.406)	Loss 2.4233 (2.4930)	Entropy 0.59999 (0.60068)	Top-1 acc 64.844 (63.750)	Top-5 acc 84.375 (84.080)	lr 0.00740
Train [77][200/3239]	Time 0.277 (1.126)	Data Time 0.001 (0.404)	Loss 2.7638 (2.4973)	Entropy 0.59980 (0.60065)	Top-1 acc 61.719 (63.647)	Top-5 acc 80.469 (83.998)	lr 0.00740
Train [77][210/3239]	Time 0.285 (1.111)	Data Time 0.002 (0.403)	Loss 2.4857 (2.4983)	Entropy 0.59965 (0.60061)	Top-1 acc 64.062 (63.613)	Top-5 acc 83.594 (83.964)	lr 0.00740
Train [77][220/3239]	Time 0.233 (1.106)	Data Time 0.001 (0.410)	Loss 2.5872 (2.4994)	Entropy 0.59906 (0.60056)	Top-1 acc 61.328 (63.591)	Top-5 acc 82.422 (83.956)	lr 0.00740
Train [77][230/3239]	Time 1.657 (1.082)	Data Time 1.255 (0.398)	Loss 2.3781 (2.4981)	Entropy 0.59909 (0.60049)	Top-1 acc 69.922 (63.643)	Top-5 acc 86.719 (83.996)	lr 0.00739
Train [77][240/3239]	Time 0.228 (1.057)	Data Time 0.001 (0.384)	Loss 2.7454 (2.4984)	Entropy 0.59906 (0.60043)	Top-1 acc 55.469 (63.605)	Top-5 acc 82.031 (83.994)	lr 0.00739
Train [77][250/3239]	Time 0.236 (1.052)	Data Time 0.002 (0.390)	Loss 2.5743 (2.4956)	Entropy 0.59875 (0.60037)	Top-1 acc 62.109 (63.719)	Top-5 acc 81.250 (84.030)	lr 0.00739
Train [77][260/3239]	Time 0.229 (1.037)	Data Time 0.001 (0.384)	Loss 2.4617 (2.4956)	Entropy 0.59874 (0.60031)	Top-1 acc 65.625 (63.721)	Top-5 acc 83.984 (84.026)	lr 0.00739
Train [77][270/3239]	Time 0.262 (1.024)	Data Time 0.001 (0.380)	Loss 2.5028 (2.4957)	Entropy 0.59864 (0.60025)	Top-1 acc 60.938 (63.698)	Top-5 acc 83.203 (84.010)	lr 0.00739
Train [77][280/3239]	Time 0.237 (1.024)	Data Time 0.001 (0.387)	Loss 2.6485 (2.4994)	Entropy 0.59829 (0.60019)	Top-1 acc 60.156 (63.593)	Top-5 acc 78.125 (83.936)	lr 0.00739
Train [77][290/3239]	Time 0.230 (1.007)	Data Time 0.001 (0.378)	Loss 2.4728 (2.5006)	Entropy 0.59823 (0.60012)	Top-1 acc 66.016 (63.602)	Top-5 acc 83.594 (83.916)	lr 0.00739
Train [77][300/3239]	Time 0.523 (1.002)	Data Time 0.295 (0.380)	Loss 2.4201 (2.5000)	Entropy 0.59843 (0.60006)	Top-1 acc 62.891 (63.643)	Top-5 acc 84.766 (83.904)	lr 0.00739
Train [77][310/3239]	Time 0.281 (1.000)	Data Time 0.001 (0.384)	Loss 2.4711 (2.4990)	Entropy 0.59867 (0.60001)	Top-1 acc 63.281 (63.700)	Top-5 acc 84.766 (83.905)	lr 0.00739
Train [77][320/3239]	Time 0.227 (0.987)	Data Time 0.001 (0.377)	Loss 2.6246 (2.4995)	Entropy 0.59886 (0.59997)	Top-1 acc 59.375 (63.693)	Top-5 acc 79.688 (83.874)	lr 0.00739
Train [77][330/3239]	Time 0.248 (0.979)	Data Time 0.001 (0.375)	Loss 2.3477 (2.5006)	Entropy 0.59926 (0.59994)	Top-1 acc 64.844 (63.682)	Top-5 acc 86.328 (83.842)	lr 0.00739
Train [77][340/3239]	Time 2.188 (0.981)	Data Time 1.931 (0.383)	Loss 2.3187 (2.5008)	Entropy 0.59923 (0.59992)	Top-1 acc 68.750 (63.682)	Top-5 acc 87.500 (83.841)	lr 0.00738
Train [77][350/3239]	Time 0.255 (0.973)	Data Time 0.001 (0.379)	Loss 2.5791 (2.5020)	Entropy 0.59910 (0.59990)	Top-1 acc 60.156 (63.669)	Top-5 acc 82.031 (83.803)	lr 0.00738
Train [77][360/3239]	Time 0.224 (0.968)	Data Time 0.001 (0.378)	Loss 2.5246 (2.5017)	Entropy 0.59916 (0.59988)	Top-1 acc 61.328 (63.661)	Top-5 acc 83.594 (83.816)	lr 0.00738
Train [77][370/3239]	Time 0.239 (0.964)	Data Time 0.002 (0.378)	Loss 2.4517 (2.5017)	Entropy 0.59905 (0.59987)	Top-1 acc 65.234 (63.683)	Top-5 acc 84.375 (83.801)	lr 0.00738
Train [77][380/3239]	Time 0.224 (0.967)	Data Time 0.001 (0.386)	Loss 2.4694 (2.5029)	Entropy 0.59902 (0.59984)	Top-1 acc 63.281 (63.642)	Top-5 acc 87.109 (83.794)	lr 0.00738
Train [77][390/3239]	Time 0.324 (0.952)	Data Time 0.001 (0.376)	Loss 2.4350 (2.5029)	Entropy 0.59904 (0.59982)	Top-1 acc 68.359 (63.644)	Top-5 acc 82.422 (83.775)	lr 0.00738
Train [77][400/3239]	Time 0.222 (0.953)	Data Time 0.001 (0.381)	Loss 2.7879 (2.5029)	Entropy 0.59890 (0.59980)	Top-1 acc 55.469 (63.628)	Top-5 acc 76.172 (83.773)	lr 0.00738
Train [77][410/3239]	Time 0.249 (0.962)	Data Time 0.001 (0.393)	Loss 2.3403 (2.5031)	Entropy 0.59920 (0.59978)	Top-1 acc 68.359 (63.634)	Top-5 acc 86.719 (83.756)	lr 0.00738
Train [77][420/3239]	Time 0.284 (0.949)	Data Time 0.001 (0.384)	Loss 2.3808 (2.5009)	Entropy 0.59925 (0.59977)	Top-1 acc 66.797 (63.673)	Top-5 acc 86.719 (83.802)	lr 0.00738
Train [77][430/3239]	Time 0.276 (0.949)	Data Time 0.001 (0.388)	Loss 2.3921 (2.4999)	Entropy 0.59923 (0.59976)	Top-1 acc 65.625 (63.688)	Top-5 acc 87.500 (83.822)	lr 0.00738
Train [77][440/3239]	Time 0.233 (0.957)	Data Time 0.002 (0.399)	Loss 2.5444 (2.5013)	Entropy 0.59908 (0.59975)	Top-1 acc 64.844 (63.672)	Top-5 acc 83.203 (83.792)	lr 0.00738
Train [77][450/3239]	Time 0.239 (0.948)	Data Time 0.001 (0.393)	Loss 2.6461 (2.5011)	Entropy 0.59902 (0.59973)	Top-1 acc 59.375 (63.679)	Top-5 acc 83.203 (83.804)	lr 0.00737
Train [77][460/3239]	Time 2.060 (0.947)	Data Time 1.732 (0.395)	Loss 2.4538 (2.5015)	Entropy 0.59889 (0.59972)	Top-1 acc 64.062 (63.665)	Top-5 acc 84.375 (83.809)	lr 0.00737
Train [77][470/3239]	Time 0.235 (0.954)	Data Time 0.001 (0.405)	Loss 2.3978 (2.5023)	Entropy 0.59859 (0.59970)	Top-1 acc 68.359 (63.668)	Top-5 acc 85.547 (83.794)	lr 0.00737
Train [77][480/3239]	Time 0.229 (0.951)	Data Time 0.001 (0.405)	Loss 2.7338 (2.5018)	Entropy 0.59866 (0.59967)	Top-1 acc 55.859 (63.678)	Top-5 acc 80.859 (83.812)	lr 0.00737
Train [77][490/3239]	Time 0.235 (0.942)	Data Time 0.001 (0.398)	Loss 2.5238 (2.5018)	Entropy 0.59902 (0.59966)	Top-1 acc 62.500 (63.654)	Top-5 acc 83.203 (83.820)	lr 0.00737
Train [77][500/3239]	Time 4.289 (0.951)	Data Time 4.043 (0.409)	Loss 2.5264 (2.5015)	Entropy 0.59891 (0.59964)	Top-1 acc 65.234 (63.658)	Top-5 acc 83.203 (83.818)	lr 0.00737
Train [77][510/3239]	Time 0.495 (0.953)	Data Time 0.260 (0.414)	Loss 2.5896 (2.5017)	Entropy 0.59935 (0.59963)	Top-1 acc 60.156 (63.659)	Top-5 acc 82.422 (83.818)	lr 0.00737
Train [77][520/3239]	Time 0.235 (0.943)	Data Time 0.001 (0.406)	Loss 2.4977 (2.5023)	Entropy 0.59941 (0.59963)	Top-1 acc 61.719 (63.631)	Top-5 acc 84.375 (83.803)	lr 0.00737
Train [77][530/3239]	Time 0.230 (0.949)	Data Time 0.001 (0.414)	Loss 2.3672 (2.5022)	Entropy 0.59916 (0.59962)	Top-1 acc 66.406 (63.637)	Top-5 acc 85.156 (83.800)	lr 0.00737
Train [77][540/3239]	Time 0.226 (0.957)	Data Time 0.001 (0.423)	Loss 2.6415 (2.5019)	Entropy 0.59915 (0.59961)	Top-1 acc 58.984 (63.636)	Top-5 acc 80.469 (83.805)	lr 0.00737
Train [77][550/3239]	Time 0.363 (0.947)	Data Time 0.001 (0.416)	Loss 2.5035 (2.5023)	Entropy 0.59901 (0.59961)	Top-1 acc 63.281 (63.631)	Top-5 acc 85.156 (83.809)	lr 0.00737
Train [77][560/3239]	Time 0.493 (0.950)	Data Time 0.218 (0.421)	Loss 2.6135 (2.5023)	Entropy 0.59902 (0.59959)	Top-1 acc 62.891 (63.627)	Top-5 acc 82.422 (83.813)	lr 0.00736
Train [77][570/3239]	Time 0.252 (0.950)	Data Time 0.002 (0.422)	Loss 2.5971 (2.5030)	Entropy 0.59879 (0.59958)	Top-1 acc 60.156 (63.590)	Top-5 acc 83.984 (83.798)	lr 0.00736
Train [77][580/3239]	Time 0.239 (0.947)	Data Time 0.001 (0.422)	Loss 2.8310 (2.5044)	Entropy 0.59859 (0.59957)	Top-1 acc 58.203 (63.555)	Top-5 acc 78.906 (83.768)	lr 0.00736
Train [77][590/3239]	Time 0.231 (0.954)	Data Time 0.001 (0.431)	Loss 2.4837 (2.5046)	Entropy 0.59875 (0.59955)	Top-1 acc 67.969 (63.551)	Top-5 acc 83.203 (83.763)	lr 0.00736
Train [77][600/3239]	Time 0.243 (0.949)	Data Time 0.001 (0.428)	Loss 2.3317 (2.5040)	Entropy 0.59844 (0.59954)	Top-1 acc 66.797 (63.559)	Top-5 acc 90.234 (83.785)	lr 0.00736
Train [77][610/3239]	Time 0.235 (0.951)	Data Time 0.001 (0.431)	Loss 2.5746 (2.5048)	Entropy 0.59833 (0.59952)	Top-1 acc 63.281 (63.533)	Top-5 acc 82.031 (83.766)	lr 0.00736
Train [77][620/3239]	Time 7.849 (0.959)	Data Time 7.461 (0.440)	Loss 2.5317 (2.5057)	Entropy 0.59823 (0.59950)	Top-1 acc 63.672 (63.505)	Top-5 acc 85.547 (83.745)	lr 0.00736
Train [77][630/3239]	Time 0.250 (0.956)	Data Time 0.003 (0.439)	Loss 2.5472 (2.5051)	Entropy 0.59844 (0.59948)	Top-1 acc 65.234 (63.528)	Top-5 acc 83.203 (83.749)	lr 0.00736
Train [77][640/3239]	Time 0.239 (0.951)	Data Time 0.001 (0.435)	Loss 2.5221 (2.5058)	Entropy 0.59853 (0.59946)	Top-1 acc 67.578 (63.514)	Top-5 acc 80.078 (83.727)	lr 0.00736
Train [77][650/3239]	Time 0.234 (0.954)	Data Time 0.001 (0.439)	Loss 2.5150 (2.5052)	Entropy 0.59875 (0.59945)	Top-1 acc 65.625 (63.535)	Top-5 acc 84.375 (83.740)	lr 0.00736
Train [77][660/3239]	Time 5.049 (0.969)	Data Time 4.787 (0.456)	Loss 2.4901 (2.5056)	Entropy 0.59869 (0.59944)	Top-1 acc 63.672 (63.525)	Top-5 acc 84.375 (83.736)	lr 0.00735
Train [77][670/3239]	Time 0.298 (1.042)	Data Time 0.002 (0.450)	Loss 2.5261 (2.5057)	Entropy 0.59874 (0.59943)	Top-1 acc 61.719 (63.519)	Top-5 acc 84.375 (83.742)	lr 0.00735
Train [77][680/3239]	Time 0.249 (1.033)	Data Time 0.002 (0.443)	Loss 2.4579 (2.5052)	Entropy 0.59853 (0.59942)	Top-1 acc 64.453 (63.533)	Top-5 acc 84.375 (83.756)	lr 0.00735
Train [77][690/3239]	Time 0.240 (1.025)	Data Time 0.001 (0.437)	Loss 2.5457 (2.5048)	Entropy 0.59864 (0.59940)	Top-1 acc 60.547 (63.548)	Top-5 acc 83.203 (83.752)	lr 0.00735
Train [77][700/3239]	Time 0.246 (1.016)	Data Time 0.001 (0.430)	Loss 2.3141 (2.5045)	Entropy 0.59860 (0.59939)	Top-1 acc 68.359 (63.558)	Top-5 acc 86.719 (83.756)	lr 0.00735
Train [77][710/3239]	Time 0.349 (1.008)	Data Time 0.002 (0.424)	Loss 2.7613 (2.5056)	Entropy 0.59881 (0.59938)	Top-1 acc 57.422 (63.547)	Top-5 acc 77.344 (83.728)	lr 0.00735
Train [77][720/3239]	Time 0.232 (0.999)	Data Time 0.001 (0.419)	Loss 2.4637 (2.5057)	Entropy 0.59861 (0.59938)	Top-1 acc 65.625 (63.550)	Top-5 acc 85.938 (83.725)	lr 0.00735
Train [77][730/3239]	Time 0.232 (0.995)	Data Time 0.001 (0.417)	Loss 2.6908 (2.5068)	Entropy 0.59857 (0.59937)	Top-1 acc 62.109 (63.526)	Top-5 acc 82.031 (83.709)	lr 0.00735
Train [77][740/3239]	Time 0.225 (0.991)	Data Time 0.001 (0.415)	Loss 2.5983 (2.5072)	Entropy 0.59832 (0.59935)	Top-1 acc 64.453 (63.535)	Top-5 acc 81.250 (83.698)	lr 0.00735
Train [77][750/3239]	Time 0.233 (0.986)	Data Time 0.001 (0.411)	Loss 2.3825 (2.5080)	Entropy 0.59818 (0.59934)	Top-1 acc 66.016 (63.513)	Top-5 acc 87.500 (83.680)	lr 0.00735
Train [77][760/3239]	Time 0.235 (0.978)	Data Time 0.001 (0.405)	Loss 2.2312 (2.5071)	Entropy 0.59784 (0.59932)	Top-1 acc 69.922 (63.534)	Top-5 acc 89.844 (83.696)	lr 0.00735
Train [77][770/3239]	Time 0.408 (0.992)	Data Time 0.003 (0.420)	Loss 2.6258 (2.5074)	Entropy 0.59763 (0.59930)	Top-1 acc 60.547 (63.544)	Top-5 acc 83.594 (83.691)	lr 0.00734
Train [77][780/3239]	Time 0.332 (0.986)	Data Time 0.001 (0.416)	Loss 2.5100 (2.5083)	Entropy 0.59775 (0.59928)	Top-1 acc 64.844 (63.524)	Top-5 acc 82.031 (83.671)	lr 0.00734
Train [77][790/3239]	Time 0.246 (0.979)	Data Time 0.001 (0.411)	Loss 2.4725 (2.5088)	Entropy 0.59739 (0.59926)	Top-1 acc 64.062 (63.515)	Top-5 acc 85.156 (83.659)	lr 0.00734
Train [77][800/3239]	Time 0.247 (0.991)	Data Time 0.001 (0.425)	Loss 2.5444 (2.5096)	Entropy 0.59752 (0.59924)	Top-1 acc 64.453 (63.502)	Top-5 acc 81.250 (83.643)	lr 0.00734
Train [77][810/3239]	Time 0.262 (0.988)	Data Time 0.001 (0.424)	Loss 2.4086 (2.5101)	Entropy 0.59780 (0.59922)	Top-1 acc 67.969 (63.496)	Top-5 acc 87.891 (83.631)	lr 0.00734
Train [77][820/3239]	Time 0.235 (0.981)	Data Time 0.001 (0.419)	Loss 2.3609 (2.5099)	Entropy 0.59790 (0.59920)	Top-1 acc 70.703 (63.500)	Top-5 acc 85.938 (83.632)	lr 0.00734
Train [77][830/3239]	Time 0.243 (0.992)	Data Time 0.002 (0.431)	Loss 2.4565 (2.5103)	Entropy 0.59793 (0.59919)	Top-1 acc 64.844 (63.489)	Top-5 acc 87.109 (83.627)	lr 0.00734
Train [77][840/3239]	Time 0.260 (0.988)	Data Time 0.001 (0.429)	Loss 2.4651 (2.5102)	Entropy 0.59806 (0.59917)	Top-1 acc 63.672 (63.491)	Top-5 acc 87.109 (83.630)	lr 0.00734
Train [77][850/3239]	Time 0.242 (0.982)	Data Time 0.002 (0.424)	Loss 2.4833 (2.5098)	Entropy 0.59810 (0.59916)	Top-1 acc 65.234 (63.494)	Top-5 acc 80.859 (83.635)	lr 0.00734
Train [77][860/3239]	Time 0.234 (0.993)	Data Time 0.001 (0.437)	Loss 2.5881 (2.5097)	Entropy 0.59821 (0.59915)	Top-1 acc 58.984 (63.490)	Top-5 acc 83.203 (83.636)	lr 0.00734
Train [77][870/3239]	Time 0.266 (0.990)	Data Time 0.001 (0.435)	Loss 2.4218 (2.5095)	Entropy 0.59831 (0.59914)	Top-1 acc 66.016 (63.487)	Top-5 acc 83.594 (83.638)	lr 0.00734
Train [77][880/3239]	Time 0.291 (0.990)	Data Time 0.002 (0.436)	Loss 2.4624 (2.5093)	Entropy 0.59805 (0.59913)	Top-1 acc 67.969 (63.490)	Top-5 acc 83.984 (83.646)	lr 0.00733
Train [77][890/3239]	Time 0.262 (0.996)	Data Time 0.001 (0.443)	Loss 2.3037 (2.5088)	Entropy 0.59810 (0.59911)	Top-1 acc 70.312 (63.504)	Top-5 acc 86.719 (83.659)	lr 0.00733
Train [77][900/3239]	Time 0.263 (0.993)	Data Time 0.001 (0.441)	Loss 2.4974 (2.5087)	Entropy 0.59828 (0.59910)	Top-1 acc 61.719 (63.509)	Top-5 acc 82.812 (83.648)	lr 0.00733
Train [77][910/3239]	Time 0.264 (0.992)	Data Time 0.001 (0.442)	Loss 2.5665 (2.5085)	Entropy 0.59832 (0.59909)	Top-1 acc 59.375 (63.512)	Top-5 acc 83.594 (83.658)	lr 0.00733
Train [77][920/3239]	Time 0.255 (0.987)	Data Time 0.001 (0.437)	Loss 2.6216 (2.5089)	Entropy 0.59834 (0.59909)	Top-1 acc 60.156 (63.502)	Top-5 acc 81.641 (83.646)	lr 0.00733
Train [77][930/3239]	Time 0.239 (1.001)	Data Time 0.001 (0.453)	Loss 2.5521 (2.5082)	Entropy 0.59849 (0.59908)	Top-1 acc 65.234 (63.514)	Top-5 acc 81.641 (83.663)	lr 0.00733
Train [77][940/3239]	Time 0.338 (0.995)	Data Time 0.001 (0.448)	Loss 2.4205 (2.5077)	Entropy 0.59846 (0.59907)	Top-1 acc 66.406 (63.525)	Top-5 acc 81.250 (83.668)	lr 0.00733
Train [77][950/3239]	Time 0.236 (0.989)	Data Time 0.001 (0.444)	Loss 2.5768 (2.5077)	Entropy 0.59829 (0.59906)	Top-1 acc 65.234 (63.521)	Top-5 acc 83.203 (83.675)	lr 0.00733
Train [77][960/3239]	Time 0.240 (1.010)	Data Time 0.001 (0.466)	Loss 2.3849 (2.5082)	Entropy 0.59819 (0.59905)	Top-1 acc 65.625 (63.497)	Top-5 acc 85.156 (83.668)	lr 0.00733
Train [77][970/3239]	Time 0.235 (1.004)	Data Time 0.001 (0.462)	Loss 2.5039 (2.5085)	Entropy 0.59778 (0.59904)	Top-1 acc 60.547 (63.491)	Top-5 acc 83.594 (83.659)	lr 0.00733
Train [77][980/3239]	Time 0.236 (0.998)	Data Time 0.002 (0.457)	Loss 2.3629 (2.5087)	Entropy 0.59779 (0.59903)	Top-1 acc 66.406 (63.480)	Top-5 acc 85.156 (83.652)	lr 0.00733
Train [77][990/3239]	Time 7.024 (1.015)	Data Time 6.772 (0.475)	Loss 2.7445 (2.5090)	Entropy 0.59787 (0.59902)	Top-1 acc 57.422 (63.472)	Top-5 acc 78.906 (83.650)	lr 0.00732
Train [77][1000/3239]	Time 0.231 (1.009)	Data Time 0.001 (0.470)	Loss 2.7477 (2.5095)	Entropy 0.59788 (0.59901)	Top-1 acc 59.766 (63.463)	Top-5 acc 78.516 (83.643)	lr 0.00732
Train [77][1010/3239]	Time 0.326 (1.003)	Data Time 0.001 (0.466)	Loss 2.5253 (2.5092)	Entropy 0.59788 (0.59900)	Top-1 acc 61.719 (63.468)	Top-5 acc 83.203 (83.654)	lr 0.00732
Train [77][1020/3239]	Time 0.240 (1.017)	Data Time 0.001 (0.481)	Loss 2.3944 (2.5095)	Entropy 0.59796 (0.59899)	Top-1 acc 65.625 (63.457)	Top-5 acc 85.938 (83.649)	lr 0.00732
Train [77][1030/3239]	Time 0.231 (1.013)	Data Time 0.001 (0.478)	Loss 2.8204 (2.5101)	Entropy 0.59827 (0.59898)	Top-1 acc 55.859 (63.444)	Top-5 acc 79.688 (83.641)	lr 0.00732
Train [77][1040/3239]	Time 0.244 (1.008)	Data Time 0.001 (0.475)	Loss 2.7439 (2.5104)	Entropy 0.59843 (0.59897)	Top-1 acc 58.594 (63.434)	Top-5 acc 78.125 (83.632)	lr 0.00732
Train [77][1050/3239]	Time 0.236 (1.023)	Data Time 0.002 (0.491)	Loss 2.6140 (2.5104)	Entropy 0.59850 (0.59897)	Top-1 acc 58.203 (63.441)	Top-5 acc 82.812 (83.634)	lr 0.00732
Train [77][1060/3239]	Time 0.269 (1.018)	Data Time 0.001 (0.487)	Loss 2.3672 (2.5101)	Entropy 0.59856 (0.59896)	Top-1 acc 64.844 (63.442)	Top-5 acc 86.328 (83.639)	lr 0.00732
Train [77][1070/3239]	Time 0.226 (1.015)	Data Time 0.001 (0.485)	Loss 2.5563 (2.5101)	Entropy 0.59885 (0.59896)	Top-1 acc 62.500 (63.445)	Top-5 acc 81.641 (83.643)	lr 0.00732
Train [77][1080/3239]	Time 0.238 (1.012)	Data Time 0.001 (0.483)	Loss 2.4646 (2.5100)	Entropy 0.59895 (0.59896)	Top-1 acc 64.453 (63.444)	Top-5 acc 82.031 (83.643)	lr 0.00732
Train [77][1090/3239]	Time 0.247 (1.024)	Data Time 0.001 (0.496)	Loss 2.3776 (2.5100)	Entropy 0.59868 (0.59896)	Top-1 acc 66.016 (63.438)	Top-5 acc 84.766 (83.644)	lr 0.00732
Train [77][1100/3239]	Time 4.781 (1.023)	Data Time 4.418 (0.496)	Loss 2.5333 (2.5098)	Entropy 0.59873 (0.59896)	Top-1 acc 60.547 (63.446)	Top-5 acc 84.375 (83.648)	lr 0.00731
Train [77][1110/3239]	Time 0.986 (1.018)	Data Time 0.734 (0.492)	Loss 2.4982 (2.5096)	Entropy 0.59851 (0.59895)	Top-1 acc 63.672 (63.450)	Top-5 acc 83.984 (83.650)	lr 0.00731
Train [77][1120/3239]	Time 0.238 (1.030)	Data Time 0.001 (0.505)	Loss 2.5452 (2.5094)	Entropy 0.59841 (0.59895)	Top-1 acc 60.547 (63.446)	Top-5 acc 81.641 (83.663)	lr 0.00731
Train [77][1130/3239]	Time 0.234 (1.025)	Data Time 0.001 (0.501)	Loss 2.3870 (2.5093)	Entropy 0.59819 (0.59895)	Top-1 acc 66.797 (63.450)	Top-5 acc 86.719 (83.667)	lr 0.00731
Train [77][1140/3239]	Time 0.244 (1.025)	Data Time 0.001 (0.502)	Loss 2.3621 (2.5092)	Entropy 0.59837 (0.59894)	Top-1 acc 65.625 (63.456)	Top-5 acc 87.891 (83.671)	lr 0.00731
Train [77][1150/3239]	Time 4.952 (1.038)	Data Time 4.698 (0.516)	Loss 2.3884 (2.5093)	Entropy 0.59849 (0.59893)	Top-1 acc 66.797 (63.444)	Top-5 acc 89.062 (83.672)	lr 0.00731
Train [77][1160/3239]	Time 0.238 (1.033)	Data Time 0.001 (0.512)	Loss 2.4561 (2.5091)	Entropy 0.59859 (0.59893)	Top-1 acc 65.625 (63.452)	Top-5 acc 87.109 (83.682)	lr 0.00731
Train [77][1170/3239]	Time 0.359 (1.031)	Data Time 0.002 (0.510)	Loss 2.8735 (2.5089)	Entropy 0.59881 (0.59893)	Top-1 acc 55.078 (63.469)	Top-5 acc 77.734 (83.686)	lr 0.00731
Train [77][1180/3239]	Time 0.230 (1.046)	Data Time 0.001 (0.527)	Loss 2.4043 (2.5091)	Entropy 0.59869 (0.59893)	Top-1 acc 65.234 (63.462)	Top-5 acc 85.547 (83.685)	lr 0.00731
Train [77][1190/3239]	Time 0.236 (1.043)	Data Time 0.001 (0.525)	Loss 2.3975 (2.5088)	Entropy 0.59860 (0.59893)	Top-1 acc 66.406 (63.475)	Top-5 acc 85.547 (83.691)	lr 0.00731
Train [77][1200/3239]	Time 0.236 (1.038)	Data Time 0.001 (0.521)	Loss 2.5926 (2.5088)	Entropy 0.59843 (0.59892)	Top-1 acc 61.328 (63.479)	Top-5 acc 82.031 (83.691)	lr 0.00731
Train [77][1210/3239]	Time 0.255 (1.055)	Data Time 0.001 (0.538)	Loss 2.4528 (2.5088)	Entropy 0.59864 (0.59892)	Top-1 acc 63.672 (63.480)	Top-5 acc 84.766 (83.686)	lr 0.00730
Train [77][1220/3239]	Time 0.308 (1.052)	Data Time 0.002 (0.535)	Loss 2.4332 (2.5085)	Entropy 0.59871 (0.59892)	Top-1 acc 64.453 (63.479)	Top-5 acc 82.422 (83.692)	lr 0.00730
Train [77][1230/3239]	Time 0.227 (1.046)	Data Time 0.001 (0.531)	Loss 2.3668 (2.5085)	Entropy 0.59875 (0.59892)	Top-1 acc 66.406 (63.478)	Top-5 acc 85.938 (83.693)	lr 0.00730
Train [77][1240/3239]	Time 0.237 (1.048)	Data Time 0.002 (0.534)	Loss 2.6699 (2.5088)	Entropy 0.59852 (0.59892)	Top-1 acc 61.328 (63.469)	Top-5 acc 79.297 (83.684)	lr 0.00730
Train [77][1250/3239]	Time 0.246 (1.058)	Data Time 0.001 (0.544)	Loss 2.5003 (2.5091)	Entropy 0.59813 (0.59891)	Top-1 acc 64.844 (63.477)	Top-5 acc 81.641 (83.678)	lr 0.00730
Train [77][1260/3239]	Time 0.396 (1.053)	Data Time 0.002 (0.539)	Loss 2.4518 (2.5095)	Entropy 0.59837 (0.59890)	Top-1 acc 65.234 (63.470)	Top-5 acc 80.469 (83.668)	lr 0.00730
Train [77][1270/3239]	Time 3.240 (1.050)	Data Time 2.998 (0.538)	Loss 2.6574 (2.5094)	Entropy 0.59837 (0.59890)	Top-1 acc 60.547 (63.472)	Top-5 acc 81.250 (83.665)	lr 0.00730
Train [77][1280/3239]	Time 0.238 (1.066)	Data Time 0.001 (0.554)	Loss 2.6028 (2.5098)	Entropy 0.59844 (0.59890)	Top-1 acc 61.719 (63.468)	Top-5 acc 82.422 (83.657)	lr 0.00730
Train [77][1290/3239]	Time 0.244 (1.061)	Data Time 0.001 (0.550)	Loss 2.5975 (2.5101)	Entropy 0.59852 (0.59889)	Top-1 acc 62.109 (63.456)	Top-5 acc 79.297 (83.652)	lr 0.00730
Train [77][1300/3239]	Time 0.250 (1.056)	Data Time 0.001 (0.546)	Loss 2.5909 (2.5104)	Entropy 0.59862 (0.59889)	Top-1 acc 59.375 (63.448)	Top-5 acc 83.984 (83.647)	lr 0.00730
Train [77][1310/3239]	Time 3.213 (1.075)	Data Time 2.933 (0.565)	Loss 2.3575 (2.5109)	Entropy 0.59867 (0.59889)	Top-1 acc 66.797 (63.443)	Top-5 acc 85.938 (83.639)	lr 0.00730
Train [77][1320/3239]	Time 0.354 (1.115)	Data Time 0.005 (0.564)	Loss 2.4121 (2.5107)	Entropy 0.59884 (0.59888)	Top-1 acc 65.234 (63.446)	Top-5 acc 85.156 (83.643)	lr 0.00729
Train [77][1330/3239]	Time 0.355 (1.111)	Data Time 0.002 (0.560)	Loss 2.4528 (2.5110)	Entropy 0.59888 (0.59888)	Top-1 acc 63.281 (63.437)	Top-5 acc 83.203 (83.635)	lr 0.00729
Train [77][1340/3239]	Time 0.245 (1.106)	Data Time 0.001 (0.556)	Loss 2.6382 (2.5109)	Entropy 0.59874 (0.59888)	Top-1 acc 63.672 (63.441)	Top-5 acc 79.297 (83.635)	lr 0.00729
Train [77][1350/3239]	Time 0.268 (1.101)	Data Time 0.002 (0.551)	Loss 2.3837 (2.5109)	Entropy 0.59834 (0.59888)	Top-1 acc 66.797 (63.446)	Top-5 acc 85.156 (83.635)	lr 0.00729
Train [77][1360/3239]	Time 0.253 (1.096)	Data Time 0.001 (0.547)	Loss 2.5255 (2.5114)	Entropy 0.59858 (0.59888)	Top-1 acc 60.547 (63.433)	Top-5 acc 83.594 (83.623)	lr 0.00729
Train [77][1370/3239]	Time 0.262 (1.091)	Data Time 0.001 (0.543)	Loss 2.5078 (2.5111)	Entropy 0.59876 (0.59888)	Top-1 acc 61.719 (63.441)	Top-5 acc 84.375 (83.625)	lr 0.00729
Train [77][1380/3239]	Time 0.256 (1.089)	Data Time 0.001 (0.542)	Loss 2.4893 (2.5110)	Entropy 0.59896 (0.59888)	Top-1 acc 63.672 (63.441)	Top-5 acc 85.547 (83.631)	lr 0.00729
Train [77][1390/3239]	Time 0.251 (1.096)	Data Time 0.001 (0.550)	Loss 2.6122 (2.5115)	Entropy 0.59940 (0.59888)	Top-1 acc 60.547 (63.428)	Top-5 acc 82.812 (83.625)	lr 0.00729
Train [77][1400/3239]	Time 0.259 (1.095)	Data Time 0.002 (0.549)	Loss 2.3722 (2.5118)	Entropy 0.59940 (0.59888)	Top-1 acc 63.672 (63.418)	Top-5 acc 85.938 (83.615)	lr 0.00729
Train [77][1410/3239]	Time 0.232 (1.101)	Data Time 0.001 (0.556)	Loss 2.7481 (2.5118)	Entropy 0.59921 (0.59888)	Top-1 acc 52.344 (63.417)	Top-5 acc 78.125 (83.616)	lr 0.00729
Train [77][1420/3239]	Time 0.347 (1.103)	Data Time 0.001 (0.559)	Loss 2.6648 (2.5123)	Entropy 0.59917 (0.59889)	Top-1 acc 58.203 (63.409)	Top-5 acc 83.203 (83.605)	lr 0.00729
Train [77][1430/3239]	Time 0.234 (1.098)	Data Time 0.001 (0.555)	Loss 2.3796 (2.5120)	Entropy 0.59936 (0.59889)	Top-1 acc 66.406 (63.423)	Top-5 acc 85.156 (83.608)	lr 0.00728
Train [77][1440/3239]	Time 0.243 (1.109)	Data Time 0.001 (0.567)	Loss 2.6897 (2.5118)	Entropy 0.59923 (0.59889)	Top-1 acc 58.594 (63.431)	Top-5 acc 78.906 (83.607)	lr 0.00728
Train [77][1450/3239]	Time 5.855 (1.116)	Data Time 5.604 (0.575)	Loss 2.5525 (2.5118)	Entropy 0.59900 (0.59889)	Top-1 acc 61.719 (63.420)	Top-5 acc 84.375 (83.609)	lr 0.00728
Train [77][1460/3239]	Time 0.250 (1.112)	Data Time 0.001 (0.571)	Loss 2.6021 (2.5118)	Entropy 0.59895 (0.59889)	Top-1 acc 61.328 (63.421)	Top-5 acc 79.688 (83.611)	lr 0.00728
Train [77][1470/3239]	Time 0.243 (1.107)	Data Time 0.001 (0.567)	Loss 2.3870 (2.5118)	Entropy 0.59915 (0.59889)	Top-1 acc 64.453 (63.416)	Top-5 acc 88.281 (83.617)	lr 0.00728
Train [77][1480/3239]	Time 5.308 (1.121)	Data Time 5.064 (0.581)	Loss 2.4629 (2.5119)	Entropy 0.59873 (0.59890)	Top-1 acc 65.625 (63.420)	Top-5 acc 85.156 (83.611)	lr 0.00728
Train [77][1490/3239]	Time 0.333 (1.122)	Data Time 0.001 (0.583)	Loss 2.5645 (2.5119)	Entropy 0.59875 (0.59889)	Top-1 acc 61.328 (63.421)	Top-5 acc 83.594 (83.611)	lr 0.00728
Train [77][1500/3239]	Time 0.251 (1.118)	Data Time 0.001 (0.580)	Loss 2.5220 (2.5120)	Entropy 0.59890 (0.59889)	Top-1 acc 66.016 (63.417)	Top-5 acc 82.422 (83.611)	lr 0.00728
Train [77][1510/3239]	Time 0.275 (1.129)	Data Time 0.001 (0.591)	Loss 2.6456 (2.5121)	Entropy 0.59855 (0.59889)	Top-1 acc 60.938 (63.412)	Top-5 acc 82.812 (83.610)	lr 0.00728
Train [77][1520/3239]	Time 0.260 (1.129)	Data Time 0.001 (0.592)	Loss 2.5205 (2.5121)	Entropy 0.59814 (0.59889)	Top-1 acc 64.453 (63.414)	Top-5 acc 82.422 (83.606)	lr 0.00728
Train [77][1530/3239]	Time 0.258 (1.127)	Data Time 0.001 (0.590)	Loss 2.6861 (2.5122)	Entropy 0.59847 (0.59889)	Top-1 acc 57.422 (63.409)	Top-5 acc 80.078 (83.605)	lr 0.00728
Train [77][1540/3239]	Time 0.269 (1.140)	Data Time 0.002 (0.604)	Loss 2.3902 (2.5123)	Entropy 0.59866 (0.59888)	Top-1 acc 67.578 (63.409)	Top-5 acc 86.719 (83.606)	lr 0.00727
Train [77][1550/3239]	Time 0.246 (1.137)	Data Time 0.001 (0.601)	Loss 2.5313 (2.5121)	Entropy 0.59874 (0.59888)	Top-1 acc 64.062 (63.417)	Top-5 acc 82.031 (83.608)	lr 0.00727
Train [77][1560/3239]	Time 0.249 (1.134)	Data Time 0.001 (0.599)	Loss 2.4114 (2.5121)	Entropy 0.59874 (0.59888)	Top-1 acc 65.625 (63.419)	Top-5 acc 86.328 (83.604)	lr 0.00727
Train [77][1570/3239]	Time 0.240 (1.148)	Data Time 0.001 (0.614)	Loss 2.4844 (2.5119)	Entropy 0.59881 (0.59888)	Top-1 acc 68.750 (63.428)	Top-5 acc 86.719 (83.608)	lr 0.00727
Train [77][1580/3239]	Time 0.270 (1.144)	Data Time 0.001 (0.611)	Loss 2.5438 (2.5121)	Entropy 0.59890 (0.59888)	Top-1 acc 65.234 (63.424)	Top-5 acc 83.594 (83.601)	lr 0.00727
Train [77][1590/3239]	Time 0.251 (1.140)	Data Time 0.001 (0.607)	Loss 2.3271 (2.5119)	Entropy 0.59893 (0.59888)	Top-1 acc 66.797 (63.427)	Top-5 acc 87.891 (83.603)	lr 0.00727
Train [77][1600/3239]	Time 0.246 (1.153)	Data Time 0.001 (0.621)	Loss 2.7290 (2.5118)	Entropy 0.59914 (0.59888)	Top-1 acc 58.203 (63.429)	Top-5 acc 80.469 (83.604)	lr 0.00727
Train [77][1610/3239]	Time 0.253 (1.149)	Data Time 0.001 (0.617)	Loss 2.4792 (2.5115)	Entropy 0.59921 (0.59888)	Top-1 acc 60.547 (63.434)	Top-5 acc 85.547 (83.611)	lr 0.00727
Train [77][1620/3239]	Time 0.240 (1.145)	Data Time 0.001 (0.614)	Loss 2.5117 (2.5113)	Entropy 0.59925 (0.59888)	Top-1 acc 63.672 (63.438)	Top-5 acc 83.984 (83.619)	lr 0.00727
Train [77][1630/3239]	Time 0.238 (1.145)	Data Time 0.001 (0.615)	Loss 2.4482 (2.5111)	Entropy 0.59898 (0.59889)	Top-1 acc 65.234 (63.435)	Top-5 acc 85.156 (83.621)	lr 0.00727
Train [77][1640/3239]	Time 0.268 (1.156)	Data Time 0.002 (0.626)	Loss 2.4659 (2.5109)	Entropy 0.59871 (0.59889)	Top-1 acc 65.234 (63.437)	Top-5 acc 84.766 (83.623)	lr 0.00726
Train [77][1650/3239]	Time 6.572 (1.157)	Data Time 6.166 (0.627)	Loss 2.3060 (2.5106)	Entropy 0.59875 (0.59888)	Top-1 acc 67.969 (63.443)	Top-5 acc 89.062 (83.632)	lr 0.00726
Train [77][1660/3239]	Time 0.239 (1.152)	Data Time 0.002 (0.623)	Loss 2.4990 (2.5108)	Entropy 0.59860 (0.59888)	Top-1 acc 63.281 (63.440)	Top-5 acc 83.594 (83.625)	lr 0.00726
Train [77][1670/3239]	Time 0.234 (1.164)	Data Time 0.001 (0.635)	Loss 2.5660 (2.5105)	Entropy 0.59859 (0.59888)	Top-1 acc 63.281 (63.452)	Top-5 acc 82.031 (83.631)	lr 0.00726
Train [77][1680/3239]	Time 0.233 (1.161)	Data Time 0.001 (0.633)	Loss 2.6967 (2.5104)	Entropy 0.59836 (0.59888)	Top-1 acc 60.156 (63.453)	Top-5 acc 79.297 (83.632)	lr 0.00726
Train [77][1690/3239]	Time 0.232 (1.162)	Data Time 0.001 (0.634)	Loss 2.5245 (2.5104)	Entropy 0.59801 (0.59888)	Top-1 acc 64.844 (63.457)	Top-5 acc 83.984 (83.635)	lr 0.00726
Train [77][1700/3239]	Time 0.244 (1.172)	Data Time 0.001 (0.645)	Loss 2.7976 (2.5104)	Entropy 0.59769 (0.59887)	Top-1 acc 57.422 (63.462)	Top-5 acc 76.172 (83.636)	lr 0.00726
Train [77][1710/3239]	Time 0.239 (1.168)	Data Time 0.001 (0.643)	Loss 2.4434 (2.5105)	Entropy 0.59746 (0.59886)	Top-1 acc 66.406 (63.465)	Top-5 acc 84.766 (83.634)	lr 0.00726
Train [77][1720/3239]	Time 0.337 (1.170)	Data Time 0.001 (0.644)	Loss 2.5463 (2.5105)	Entropy 0.59742 (0.59885)	Top-1 acc 58.594 (63.458)	Top-5 acc 83.984 (83.634)	lr 0.00726
Train [77][1730/3239]	Time 0.236 (1.181)	Data Time 0.001 (0.656)	Loss 2.4421 (2.5101)	Entropy 0.59776 (0.59885)	Top-1 acc 65.234 (63.461)	Top-5 acc 85.156 (83.644)	lr 0.00726
Train [77][1740/3239]	Time 0.229 (1.177)	Data Time 0.001 (0.653)	Loss 2.2864 (2.5103)	Entropy 0.59758 (0.59884)	Top-1 acc 70.703 (63.455)	Top-5 acc 88.672 (83.640)	lr 0.00726
Train [77][1750/3239]	Time 0.239 (1.179)	Data Time 0.001 (0.655)	Loss 2.4580 (2.5102)	Entropy 0.59790 (0.59883)	Top-1 acc 65.234 (63.456)	Top-5 acc 84.375 (83.638)	lr 0.00725
Train [77][1760/3239]	Time 0.229 (1.186)	Data Time 0.001 (0.662)	Loss 2.3884 (2.5101)	Entropy 0.59787 (0.59883)	Top-1 acc 62.500 (63.456)	Top-5 acc 86.719 (83.642)	lr 0.00725
Train [77][1770/3239]	Time 0.236 (1.181)	Data Time 0.001 (0.659)	Loss 2.2970 (2.5098)	Entropy 0.59776 (0.59882)	Top-1 acc 71.094 (63.464)	Top-5 acc 87.109 (83.644)	lr 0.00725
Train [77][1780/3239]	Time 0.232 (1.182)	Data Time 0.001 (0.661)	Loss 2.7298 (2.5099)	Entropy 0.59770 (0.59882)	Top-1 acc 57.422 (63.461)	Top-5 acc 76.953 (83.638)	lr 0.00725
Train [77][1790/3239]	Time 0.231 (1.178)	Data Time 0.001 (0.657)	Loss 2.4931 (2.5098)	Entropy 0.59758 (0.59881)	Top-1 acc 61.719 (63.466)	Top-5 acc 84.766 (83.642)	lr 0.00725
Train [77][1800/3239]	Time 0.246 (1.182)	Data Time 0.001 (0.662)	Loss 2.4827 (2.5097)	Entropy 0.59765 (0.59880)	Top-1 acc 63.281 (63.461)	Top-5 acc 83.594 (83.645)	lr 0.00725
Train [77][1810/3239]	Time 6.688 (1.182)	Data Time 6.342 (0.661)	Loss 2.5309 (2.5094)	Entropy 0.59741 (0.59880)	Top-1 acc 66.797 (63.468)	Top-5 acc 84.766 (83.650)	lr 0.00725
Train [77][1820/3239]	Time 0.234 (1.177)	Data Time 0.001 (0.658)	Loss 2.5319 (2.5094)	Entropy 0.59743 (0.59879)	Top-1 acc 62.500 (63.470)	Top-5 acc 82.422 (83.649)	lr 0.00725
Train [77][1830/3239]	Time 0.241 (1.183)	Data Time 0.001 (0.665)	Loss 2.3971 (2.5095)	Entropy 0.59749 (0.59878)	Top-1 acc 68.359 (63.471)	Top-5 acc 85.156 (83.650)	lr 0.00725
Train [77][1840/3239]	Time 0.230 (1.179)	Data Time 0.001 (0.661)	Loss 2.4649 (2.5093)	Entropy 0.59749 (0.59877)	Top-1 acc 64.453 (63.476)	Top-5 acc 84.375 (83.653)	lr 0.00725
Train [77][1850/3239]	Time 0.241 (1.178)	Data Time 0.001 (0.660)	Loss 2.7350 (2.5094)	Entropy 0.59757 (0.59877)	Top-1 acc 60.938 (63.476)	Top-5 acc 80.859 (83.653)	lr 0.00725
Train [77][1860/3239]	Time 0.230 (1.184)	Data Time 0.001 (0.667)	Loss 2.4583 (2.5094)	Entropy 0.59731 (0.59876)	Top-1 acc 64.453 (63.474)	Top-5 acc 83.594 (83.656)	lr 0.00724
Train [77][1870/3239]	Time 0.235 (1.180)	Data Time 0.001 (0.664)	Loss 2.5924 (2.5095)	Entropy 0.59733 (0.59875)	Top-1 acc 64.453 (63.474)	Top-5 acc 79.688 (83.650)	lr 0.00724
Train [77][1880/3239]	Time 0.355 (1.179)	Data Time 0.001 (0.663)	Loss 2.4971 (2.5094)	Entropy 0.59695 (0.59874)	Top-1 acc 62.500 (63.484)	Top-5 acc 83.594 (83.651)	lr 0.00724
Train [77][1890/3239]	Time 0.235 (1.185)	Data Time 0.001 (0.669)	Loss 2.6670 (2.5092)	Entropy 0.59696 (0.59873)	Top-1 acc 58.203 (63.484)	Top-5 acc 79.688 (83.658)	lr 0.00724
Train [77][1900/3239]	Time 0.238 (1.182)	Data Time 0.001 (0.667)	Loss 2.4891 (2.5091)	Entropy 0.59705 (0.59872)	Top-1 acc 62.891 (63.486)	Top-5 acc 83.203 (83.658)	lr 0.00724
Train [77][1910/3239]	Time 0.236 (1.181)	Data Time 0.001 (0.666)	Loss 2.4922 (2.5091)	Entropy 0.59703 (0.59872)	Top-1 acc 63.672 (63.484)	Top-5 acc 82.422 (83.658)	lr 0.00724
Train [77][1920/3239]	Time 0.273 (1.185)	Data Time 0.001 (0.670)	Loss 2.5564 (2.5094)	Entropy 0.59706 (0.59871)	Top-1 acc 64.062 (63.482)	Top-5 acc 82.422 (83.652)	lr 0.00724
Train [77][1930/3239]	Time 0.435 (1.182)	Data Time 0.161 (0.668)	Loss 2.5020 (2.5092)	Entropy 0.59715 (0.59870)	Top-1 acc 58.984 (63.483)	Top-5 acc 86.719 (83.657)	lr 0.00724
Train [77][1940/3239]	Time 0.256 (1.184)	Data Time 0.001 (0.671)	Loss 2.4022 (2.5093)	Entropy 0.59696 (0.59869)	Top-1 acc 66.406 (63.481)	Top-5 acc 86.328 (83.656)	lr 0.00724
Train [77][1950/3239]	Time 0.237 (1.180)	Data Time 0.001 (0.667)	Loss 3.2254 (2.5097)	Entropy 0.59676 (0.59868)	Top-1 acc 46.875 (63.471)	Top-5 acc 70.312 (83.648)	lr 0.00724
Train [77][1960/3239]	Time 2.722 (1.183)	Data Time 2.465 (0.671)	Loss 2.4330 (2.5098)	Entropy 0.59685 (0.59867)	Top-1 acc 62.891 (63.465)	Top-5 acc 86.719 (83.650)	lr 0.00724
Train [77][1970/3239]	Time 8.948 (1.186)	Data Time 8.660 (0.674)	Loss 2.3750 (2.5097)	Entropy 0.59690 (0.59866)	Top-1 acc 67.578 (63.463)	Top-5 acc 86.719 (83.650)	lr 0.00723
Train [77][1980/3239]	Time 0.292 (1.209)	Data Time 0.003 (0.670)	Loss 2.6123 (2.5096)	Entropy 0.59649 (0.59865)	Top-1 acc 61.719 (63.464)	Top-5 acc 82.031 (83.653)	lr 0.00723
Train [77][1990/3239]	Time 0.253 (1.206)	Data Time 0.002 (0.667)	Loss 2.5369 (2.5097)	Entropy 0.59663 (0.59864)	Top-1 acc 60.547 (63.460)	Top-5 acc 83.594 (83.651)	lr 0.00723
Train [77][2000/3239]	Time 0.251 (1.202)	Data Time 0.001 (0.664)	Loss 2.5062 (2.5097)	Entropy 0.59650 (0.59863)	Top-1 acc 64.453 (63.462)	Top-5 acc 83.984 (83.649)	lr 0.00723
Train [77][2010/3239]	Time 0.246 (1.198)	Data Time 0.001 (0.660)	Loss 2.2794 (2.5096)	Entropy 0.59636 (0.59862)	Top-1 acc 66.797 (63.457)	Top-5 acc 89.453 (83.655)	lr 0.00723
Train [77][2020/3239]	Time 0.238 (1.194)	Data Time 0.001 (0.657)	Loss 2.7085 (2.5096)	Entropy 0.59656 (0.59861)	Top-1 acc 56.641 (63.453)	Top-5 acc 79.688 (83.658)	lr 0.00723
Train [77][2030/3239]	Time 0.248 (1.190)	Data Time 0.002 (0.654)	Loss 2.5725 (2.5091)	Entropy 0.59629 (0.59860)	Top-1 acc 60.156 (63.462)	Top-5 acc 83.984 (83.668)	lr 0.00723
Train [77][2040/3239]	Time 1.382 (1.190)	Data Time 1.032 (0.655)	Loss 2.3887 (2.5092)	Entropy 0.59644 (0.59859)	Top-1 acc 66.406 (63.461)	Top-5 acc 85.156 (83.664)	lr 0.00723
Train [77][2050/3239]	Time 0.839 (1.189)	Data Time 0.602 (0.654)	Loss 2.3400 (2.5088)	Entropy 0.59599 (0.59858)	Top-1 acc 70.703 (63.477)	Top-5 acc 85.156 (83.671)	lr 0.00723
Train [77][2060/3239]	Time 0.238 (1.185)	Data Time 0.001 (0.651)	Loss 2.5681 (2.5088)	Entropy 0.59570 (0.59856)	Top-1 acc 58.984 (63.476)	Top-5 acc 81.641 (83.668)	lr 0.00723
Train [77][2070/3239]	Time 0.240 (1.183)	Data Time 0.001 (0.649)	Loss 2.3317 (2.5091)	Entropy 0.59569 (0.59855)	Top-1 acc 70.312 (63.472)	Top-5 acc 85.156 (83.664)	lr 0.00723
Train [77][2080/3239]	Time 0.240 (1.189)	Data Time 0.001 (0.655)	Loss 2.6120 (2.5090)	Entropy 0.59555 (0.59854)	Top-1 acc 58.203 (63.472)	Top-5 acc 84.766 (83.668)	lr 0.00722
Train [77][2090/3239]	Time 0.239 (1.188)	Data Time 0.001 (0.654)	Loss 2.4065 (2.5087)	Entropy 0.59549 (0.59852)	Top-1 acc 64.062 (63.477)	Top-5 acc 86.719 (83.673)	lr 0.00722
Train [77][2100/3239]	Time 0.234 (1.186)	Data Time 0.001 (0.653)	Loss 2.4153 (2.5091)	Entropy 0.59542 (0.59851)	Top-1 acc 62.891 (63.468)	Top-5 acc 85.938 (83.670)	lr 0.00722
Train [77][2110/3239]	Time 0.242 (1.192)	Data Time 0.001 (0.660)	Loss 2.4671 (2.5091)	Entropy 0.59568 (0.59849)	Top-1 acc 63.281 (63.466)	Top-5 acc 83.594 (83.670)	lr 0.00722
Train [77][2120/3239]	Time 0.237 (1.189)	Data Time 0.001 (0.657)	Loss 2.3956 (2.5088)	Entropy 0.59576 (0.59848)	Top-1 acc 65.234 (63.476)	Top-5 acc 85.938 (83.671)	lr 0.00722
Train [77][2130/3239]	Time 1.687 (1.187)	Data Time 1.395 (0.656)	Loss 2.4783 (2.5084)	Entropy 0.59574 (0.59847)	Top-1 acc 66.016 (63.485)	Top-5 acc 85.938 (83.680)	lr 0.00722
Train [77][2140/3239]	Time 0.227 (1.190)	Data Time 0.001 (0.659)	Loss 2.4210 (2.5085)	Entropy 0.59572 (0.59846)	Top-1 acc 66.016 (63.482)	Top-5 acc 85.156 (83.680)	lr 0.00722
Train [77][2150/3239]	Time 0.232 (1.187)	Data Time 0.001 (0.656)	Loss 2.4804 (2.5085)	Entropy 0.59571 (0.59844)	Top-1 acc 62.109 (63.480)	Top-5 acc 82.422 (83.680)	lr 0.00722
Train [77][2160/3239]	Time 0.256 (1.184)	Data Time 0.003 (0.654)	Loss 2.9898 (2.5086)	Entropy 0.59548 (0.59843)	Top-1 acc 51.172 (63.477)	Top-5 acc 75.000 (83.680)	lr 0.00722
Train [77][2170/3239]	Time 0.283 (1.186)	Data Time 0.001 (0.656)	Loss 2.5741 (2.5088)	Entropy 0.59518 (0.59842)	Top-1 acc 60.547 (63.472)	Top-5 acc 82.422 (83.679)	lr 0.00722
Train [77][2180/3239]	Time 0.247 (1.183)	Data Time 0.001 (0.654)	Loss 2.4684 (2.5089)	Entropy 0.59503 (0.59840)	Top-1 acc 64.453 (63.469)	Top-5 acc 84.766 (83.682)	lr 0.00722
Train [77][2190/3239]	Time 0.251 (1.179)	Data Time 0.001 (0.651)	Loss 2.5127 (2.5087)	Entropy 0.59497 (0.59839)	Top-1 acc 63.281 (63.475)	Top-5 acc 85.547 (83.682)	lr 0.00721
Train [77][2200/3239]	Time 0.346 (1.184)	Data Time 0.002 (0.656)	Loss 2.4636 (2.5085)	Entropy 0.59513 (0.59837)	Top-1 acc 61.719 (63.477)	Top-5 acc 83.984 (83.688)	lr 0.00721
Train [77][2210/3239]	Time 0.243 (1.182)	Data Time 0.002 (0.654)	Loss 2.3771 (2.5084)	Entropy 0.59513 (0.59836)	Top-1 acc 68.750 (63.481)	Top-5 acc 86.328 (83.689)	lr 0.00721
Train [77][2220/3239]	Time 0.229 (1.179)	Data Time 0.001 (0.652)	Loss 2.5577 (2.5085)	Entropy 0.59503 (0.59834)	Top-1 acc 59.766 (63.474)	Top-5 acc 82.422 (83.684)	lr 0.00721
Train [77][2230/3239]	Time 0.247 (1.176)	Data Time 0.001 (0.650)	Loss 2.5795 (2.5088)	Entropy 0.59507 (0.59833)	Top-1 acc 60.547 (63.467)	Top-5 acc 82.422 (83.678)	lr 0.00721
Train [77][2240/3239]	Time 0.236 (1.184)	Data Time 0.001 (0.658)	Loss 2.4811 (2.5087)	Entropy 0.59450 (0.59831)	Top-1 acc 63.672 (63.467)	Top-5 acc 83.984 (83.683)	lr 0.00721
Train [77][2250/3239]	Time 0.230 (1.182)	Data Time 0.001 (0.657)	Loss 2.6093 (2.5089)	Entropy 0.59414 (0.59829)	Top-1 acc 63.672 (63.463)	Top-5 acc 81.250 (83.680)	lr 0.00721
Train [77][2260/3239]	Time 0.235 (1.179)	Data Time 0.001 (0.654)	Loss 2.4565 (2.5092)	Entropy 0.59424 (0.59828)	Top-1 acc 64.844 (63.457)	Top-5 acc 83.594 (83.678)	lr 0.00721
Train [77][2270/3239]	Time 0.248 (1.186)	Data Time 0.002 (0.662)	Loss 2.3846 (2.5093)	Entropy 0.59426 (0.59826)	Top-1 acc 68.359 (63.456)	Top-5 acc 85.547 (83.677)	lr 0.00721
Train [77][2280/3239]	Time 0.259 (1.183)	Data Time 0.001 (0.659)	Loss 2.7993 (2.5094)	Entropy 0.59457 (0.59824)	Top-1 acc 50.000 (63.455)	Top-5 acc 75.781 (83.675)	lr 0.00721
Train [77][2290/3239]	Time 0.243 (1.180)	Data Time 0.001 (0.656)	Loss 2.4466 (2.5095)	Entropy 0.59458 (0.59822)	Top-1 acc 66.016 (63.456)	Top-5 acc 85.938 (83.673)	lr 0.00721
Train [77][2300/3239]	Time 0.237 (1.189)	Data Time 0.001 (0.666)	Loss 2.4516 (2.5096)	Entropy 0.59474 (0.59821)	Top-1 acc 66.797 (63.450)	Top-5 acc 83.984 (83.676)	lr 0.00720
Train [77][2310/3239]	Time 0.295 (1.186)	Data Time 0.001 (0.663)	Loss 2.4566 (2.5098)	Entropy 0.59467 (0.59819)	Top-1 acc 66.016 (63.447)	Top-5 acc 82.422 (83.670)	lr 0.00720
Train [77][2320/3239]	Time 0.253 (1.183)	Data Time 0.001 (0.661)	Loss 2.4887 (2.5098)	Entropy 0.59453 (0.59818)	Top-1 acc 66.797 (63.447)	Top-5 acc 83.203 (83.669)	lr 0.00720
Train [77][2330/3239]	Time 0.254 (1.185)	Data Time 0.001 (0.663)	Loss 2.3585 (2.5099)	Entropy 0.59462 (0.59816)	Top-1 acc 68.750 (63.444)	Top-5 acc 84.766 (83.666)	lr 0.00720
Train [77][2340/3239]	Time 0.229 (1.182)	Data Time 0.001 (0.660)	Loss 2.4519 (2.5099)	Entropy 0.59456 (0.59815)	Top-1 acc 60.938 (63.446)	Top-5 acc 85.547 (83.666)	lr 0.00720
Train [77][2350/3239]	Time 0.229 (1.179)	Data Time 0.001 (0.658)	Loss 2.8012 (2.5099)	Entropy 0.59455 (0.59813)	Top-1 acc 56.250 (63.447)	Top-5 acc 78.906 (83.669)	lr 0.00720
Train [77][2360/3239]	Time 0.425 (1.181)	Data Time 0.001 (0.660)	Loss 2.3944 (2.5098)	Entropy 0.59477 (0.59812)	Top-1 acc 67.188 (63.443)	Top-5 acc 85.938 (83.671)	lr 0.00720
Train [77][2370/3239]	Time 0.220 (1.178)	Data Time 0.001 (0.658)	Loss 2.4974 (2.5097)	Entropy 0.59483 (0.59810)	Top-1 acc 64.453 (63.448)	Top-5 acc 84.766 (83.671)	lr 0.00720
Train [77][2380/3239]	Time 0.236 (1.175)	Data Time 0.001 (0.655)	Loss 2.4177 (2.5098)	Entropy 0.59482 (0.59809)	Top-1 acc 64.453 (63.447)	Top-5 acc 85.938 (83.670)	lr 0.00720
Train [77][2390/3239]	Time 0.229 (1.172)	Data Time 0.001 (0.652)	Loss 2.8141 (2.5098)	Entropy 0.59475 (0.59808)	Top-1 acc 56.250 (63.445)	Top-5 acc 77.344 (83.672)	lr 0.00720
Train [77][2400/3239]	Time 0.251 (1.174)	Data Time 0.003 (0.655)	Loss 2.1298 (2.5095)	Entropy 0.59446 (0.59806)	Top-1 acc 72.266 (63.451)	Top-5 acc 89.062 (83.678)	lr 0.00720
Train [77][2410/3239]	Time 0.223 (1.171)	Data Time 0.001 (0.652)	Loss 2.6260 (2.5094)	Entropy 0.59470 (0.59805)	Top-1 acc 64.453 (63.458)	Top-5 acc 82.812 (83.680)	lr 0.00719
Train [77][2420/3239]	Time 0.244 (1.168)	Data Time 0.001 (0.650)	Loss 2.6321 (2.5092)	Entropy 0.59477 (0.59803)	Top-1 acc 60.547 (63.464)	Top-5 acc 81.250 (83.683)	lr 0.00719
Train [77][2430/3239]	Time 0.335 (1.171)	Data Time 0.001 (0.653)	Loss 2.4432 (2.5088)	Entropy 0.59478 (0.59802)	Top-1 acc 66.406 (63.471)	Top-5 acc 84.375 (83.689)	lr 0.00719
Train [77][2440/3239]	Time 0.255 (1.167)	Data Time 0.001 (0.650)	Loss 2.6174 (2.5092)	Entropy 0.59471 (0.59801)	Top-1 acc 58.984 (63.458)	Top-5 acc 78.906 (83.679)	lr 0.00719
Train [77][2450/3239]	Time 0.254 (1.164)	Data Time 0.001 (0.647)	Loss 2.2203 (2.5092)	Entropy 0.59460 (0.59799)	Top-1 acc 72.656 (63.457)	Top-5 acc 87.891 (83.677)	lr 0.00719
Train [77][2460/3239]	Time 0.233 (1.166)	Data Time 0.001 (0.650)	Loss 2.5391 (2.5092)	Entropy 0.59423 (0.59798)	Top-1 acc 60.547 (63.459)	Top-5 acc 80.469 (83.677)	lr 0.00719
Train [77][2470/3239]	Time 0.248 (1.163)	Data Time 0.001 (0.647)	Loss 2.2865 (2.5091)	Entropy 0.59428 (0.59796)	Top-1 acc 70.703 (63.462)	Top-5 acc 87.500 (83.679)	lr 0.00719
Train [77][2480/3239]	Time 0.236 (1.160)	Data Time 0.001 (0.644)	Loss 2.3527 (2.5089)	Entropy 0.59438 (0.59795)	Top-1 acc 63.672 (63.464)	Top-5 acc 89.453 (83.683)	lr 0.00719
Train [77][2490/3239]	Time 0.245 (1.168)	Data Time 0.002 (0.652)	Loss 2.3774 (2.5089)	Entropy 0.59430 (0.59793)	Top-1 acc 66.016 (63.464)	Top-5 acc 84.766 (83.683)	lr 0.00719
Train [77][2500/3239]	Time 0.243 (1.165)	Data Time 0.001 (0.649)	Loss 2.2404 (2.5089)	Entropy 0.59420 (0.59792)	Top-1 acc 71.484 (63.468)	Top-5 acc 88.672 (83.680)	lr 0.00719
Train [77][2510/3239]	Time 0.243 (1.162)	Data Time 0.001 (0.647)	Loss 2.3501 (2.5089)	Entropy 0.59409 (0.59790)	Top-1 acc 68.359 (63.469)	Top-5 acc 86.719 (83.680)	lr 0.00719
Train [77][2520/3239]	Time 0.362 (1.170)	Data Time 0.001 (0.655)	Loss 2.6699 (2.5091)	Entropy 0.59412 (0.59789)	Top-1 acc 60.156 (63.463)	Top-5 acc 80.859 (83.674)	lr 0.00718
Train [77][2530/3239]	Time 0.244 (1.167)	Data Time 0.001 (0.653)	Loss 2.5008 (2.5090)	Entropy 0.59388 (0.59787)	Top-1 acc 63.281 (63.467)	Top-5 acc 84.375 (83.677)	lr 0.00718
Train [77][2540/3239]	Time 0.241 (1.164)	Data Time 0.001 (0.650)	Loss 2.4347 (2.5092)	Entropy 0.59363 (0.59786)	Top-1 acc 66.016 (63.462)	Top-5 acc 82.812 (83.671)	lr 0.00718
Train [77][2550/3239]	Time 0.231 (1.161)	Data Time 0.001 (0.648)	Loss 2.5886 (2.5092)	Entropy 0.59357 (0.59784)	Top-1 acc 63.281 (63.468)	Top-5 acc 82.812 (83.671)	lr 0.00718
Train [77][2560/3239]	Time 0.233 (1.168)	Data Time 0.001 (0.655)	Loss 2.7235 (2.5094)	Entropy 0.59346 (0.59782)	Top-1 acc 56.641 (63.463)	Top-5 acc 81.641 (83.669)	lr 0.00718
Train [77][2570/3239]	Time 0.236 (1.165)	Data Time 0.001 (0.653)	Loss 2.5806 (2.5093)	Entropy 0.59329 (0.59781)	Top-1 acc 62.891 (63.464)	Top-5 acc 80.859 (83.671)	lr 0.00718
Train [77][2580/3239]	Time 0.231 (1.162)	Data Time 0.001 (0.651)	Loss 2.4307 (2.5093)	Entropy 0.59332 (0.59779)	Top-1 acc 64.844 (63.459)	Top-5 acc 84.375 (83.672)	lr 0.00718
Train [77][2590/3239]	Time 0.346 (1.169)	Data Time 0.001 (0.658)	Loss 2.6050 (2.5095)	Entropy 0.59326 (0.59777)	Top-1 acc 60.156 (63.458)	Top-5 acc 82.031 (83.669)	lr 0.00718
Train [77][2600/3239]	Time 0.260 (1.167)	Data Time 0.001 (0.656)	Loss 2.5253 (2.5096)	Entropy 0.59347 (0.59776)	Top-1 acc 62.109 (63.458)	Top-5 acc 83.594 (83.668)	lr 0.00718
Train [77][2610/3239]	Time 0.247 (1.165)	Data Time 0.001 (0.654)	Loss 2.4076 (2.5097)	Entropy 0.59347 (0.59774)	Top-1 acc 66.797 (63.453)	Top-5 acc 84.375 (83.664)	lr 0.00718
Train [77][2620/3239]	Time 0.252 (1.170)	Data Time 0.001 (0.660)	Loss 2.3910 (2.5094)	Entropy 0.59335 (0.59772)	Top-1 acc 64.844 (63.456)	Top-5 acc 87.891 (83.671)	lr 0.00718
Train [77][2630/3239]	Time 0.309 (1.191)	Data Time 0.005 (0.658)	Loss 2.4186 (2.5093)	Entropy 0.59324 (0.59771)	Top-1 acc 64.062 (63.458)	Top-5 acc 85.938 (83.674)	lr 0.00717
Train [77][2640/3239]	Time 0.233 (1.188)	Data Time 0.002 (0.655)	Loss 2.4307 (2.5094)	Entropy 0.59344 (0.59769)	Top-1 acc 63.672 (63.459)	Top-5 acc 85.938 (83.675)	lr 0.00717
Train [77][2650/3239]	Time 0.241 (1.185)	Data Time 0.002 (0.653)	Loss 2.7523 (2.5099)	Entropy 0.59359 (0.59767)	Top-1 acc 61.328 (63.448)	Top-5 acc 80.469 (83.667)	lr 0.00717
Train [77][2660/3239]	Time 0.235 (1.182)	Data Time 0.001 (0.650)	Loss 2.5998 (2.5098)	Entropy 0.59329 (0.59766)	Top-1 acc 60.547 (63.447)	Top-5 acc 82.031 (83.667)	lr 0.00717
Train [77][2670/3239]	Time 0.232 (1.179)	Data Time 0.001 (0.648)	Loss 2.4536 (2.5099)	Entropy 0.59310 (0.59764)	Top-1 acc 68.359 (63.446)	Top-5 acc 83.594 (83.666)	lr 0.00717
Train [77][2680/3239]	Time 0.354 (1.177)	Data Time 0.001 (0.645)	Loss 2.7186 (2.5098)	Entropy 0.59293 (0.59762)	Top-1 acc 58.984 (63.453)	Top-5 acc 82.031 (83.668)	lr 0.00717
Train [77][2690/3239]	Time 0.245 (1.174)	Data Time 0.001 (0.643)	Loss 2.5124 (2.5100)	Entropy 0.59258 (0.59761)	Top-1 acc 63.672 (63.449)	Top-5 acc 83.203 (83.665)	lr 0.00717
Train [77][2700/3239]	Time 0.238 (1.177)	Data Time 0.001 (0.647)	Loss 2.5049 (2.5099)	Entropy 0.59270 (0.59759)	Top-1 acc 64.453 (63.451)	Top-5 acc 84.375 (83.667)	lr 0.00717
Train [77][2710/3239]	Time 0.239 (1.174)	Data Time 0.001 (0.644)	Loss 2.3909 (2.5099)	Entropy 0.59267 (0.59757)	Top-1 acc 67.578 (63.453)	Top-5 acc 82.812 (83.665)	lr 0.00717
Train [77][2720/3239]	Time 0.256 (1.171)	Data Time 0.002 (0.642)	Loss 2.5262 (2.5100)	Entropy 0.59231 (0.59755)	Top-1 acc 65.625 (63.452)	Top-5 acc 83.984 (83.661)	lr 0.00717
Train [77][2730/3239]	Time 0.270 (1.179)	Data Time 0.001 (0.650)	Loss 2.4976 (2.5100)	Entropy 0.59262 (0.59753)	Top-1 acc 64.844 (63.452)	Top-5 acc 84.375 (83.662)	lr 0.00717
Train [77][2740/3239]	Time 0.259 (1.177)	Data Time 0.001 (0.648)	Loss 2.3854 (2.5097)	Entropy 0.59273 (0.59752)	Top-1 acc 67.578 (63.460)	Top-5 acc 85.938 (83.665)	lr 0.00716
Train [77][2750/3239]	Time 0.333 (1.174)	Data Time 0.002 (0.646)	Loss 2.5531 (2.5096)	Entropy 0.59288 (0.59750)	Top-1 acc 59.766 (63.464)	Top-5 acc 85.156 (83.667)	lr 0.00716
Train [77][2760/3239]	Time 0.232 (1.179)	Data Time 0.001 (0.651)	Loss 2.6367 (2.5097)	Entropy 0.59301 (0.59748)	Top-1 acc 59.766 (63.459)	Top-5 acc 80.859 (83.665)	lr 0.00716
Train [77][2770/3239]	Time 0.239 (1.178)	Data Time 0.002 (0.650)	Loss 2.4062 (2.5099)	Entropy 0.59319 (0.59747)	Top-1 acc 66.797 (63.456)	Top-5 acc 86.328 (83.664)	lr 0.00716
Train [77][2780/3239]	Time 0.234 (1.175)	Data Time 0.001 (0.648)	Loss 2.4801 (2.5099)	Entropy 0.59361 (0.59745)	Top-1 acc 63.281 (63.454)	Top-5 acc 83.984 (83.661)	lr 0.00716
Train [77][2790/3239]	Time 17.860 (1.178)	Data Time 17.615 (0.652)	Loss 2.4614 (2.5100)	Entropy 0.59391 (0.59744)	Top-1 acc 65.625 (63.450)	Top-5 acc 83.203 (83.660)	lr 0.00716
Train [77][2800/3239]	Time 0.232 (1.178)	Data Time 0.001 (0.652)	Loss 2.3223 (2.5099)	Entropy 0.59404 (0.59743)	Top-1 acc 69.141 (63.453)	Top-5 acc 85.547 (83.662)	lr 0.00716
Train [77][2810/3239]	Time 0.224 (1.176)	Data Time 0.001 (0.650)	Loss 2.6406 (2.5100)	Entropy 0.59401 (0.59741)	Top-1 acc 60.156 (63.455)	Top-5 acc 81.641 (83.660)	lr 0.00716
Train [77][2820/3239]	Time 0.251 (1.173)	Data Time 0.002 (0.647)	Loss 2.4941 (2.5098)	Entropy 0.59427 (0.59740)	Top-1 acc 66.016 (63.462)	Top-5 acc 83.203 (83.663)	lr 0.00716
Train [77][2830/3239]	Time 0.229 (1.179)	Data Time 0.001 (0.654)	Loss 2.7504 (2.5098)	Entropy 0.59456 (0.59739)	Top-1 acc 58.594 (63.463)	Top-5 acc 78.906 (83.664)	lr 0.00716
Train [77][2840/3239]	Time 0.329 (1.177)	Data Time 0.001 (0.651)	Loss 2.5578 (2.5098)	Entropy 0.59452 (0.59738)	Top-1 acc 64.062 (63.465)	Top-5 acc 84.375 (83.665)	lr 0.00716
Train [77][2850/3239]	Time 0.227 (1.174)	Data Time 0.001 (0.649)	Loss 2.5847 (2.5099)	Entropy 0.59468 (0.59737)	Top-1 acc 58.594 (63.462)	Top-5 acc 84.766 (83.664)	lr 0.00715
Train [77][2860/3239]	Time 0.238 (1.180)	Data Time 0.001 (0.655)	Loss 2.6012 (2.5101)	Entropy 0.59405 (0.59736)	Top-1 acc 61.719 (63.453)	Top-5 acc 82.031 (83.660)	lr 0.00715
Train [77][2870/3239]	Time 0.231 (1.177)	Data Time 0.001 (0.653)	Loss 2.6230 (2.5103)	Entropy 0.59390 (0.59735)	Top-1 acc 58.203 (63.453)	Top-5 acc 82.812 (83.655)	lr 0.00715
Train [77][2880/3239]	Time 0.234 (1.174)	Data Time 0.001 (0.651)	Loss 2.5716 (2.5104)	Entropy 0.59401 (0.59734)	Top-1 acc 66.016 (63.452)	Top-5 acc 81.641 (83.653)	lr 0.00715
Train [77][2890/3239]	Time 0.240 (1.180)	Data Time 0.001 (0.657)	Loss 2.6171 (2.5106)	Entropy 0.59381 (0.59732)	Top-1 acc 59.766 (63.447)	Top-5 acc 80.469 (83.647)	lr 0.00715
Train [77][2900/3239]	Time 0.224 (1.177)	Data Time 0.001 (0.654)	Loss 2.5273 (2.5107)	Entropy 0.59369 (0.59731)	Top-1 acc 64.453 (63.444)	Top-5 acc 81.641 (83.645)	lr 0.00715
Train [77][2910/3239]	Time 0.328 (1.175)	Data Time 0.001 (0.652)	Loss 2.6380 (2.5109)	Entropy 0.59364 (0.59730)	Top-1 acc 57.031 (63.439)	Top-5 acc 82.812 (83.644)	lr 0.00715
Train [77][2920/3239]	Time 0.238 (1.177)	Data Time 0.001 (0.655)	Loss 2.5463 (2.5110)	Entropy 0.59392 (0.59729)	Top-1 acc 61.328 (63.435)	Top-5 acc 84.375 (83.640)	lr 0.00715
Train [77][2930/3239]	Time 0.246 (1.177)	Data Time 0.001 (0.655)	Loss 2.3616 (2.5112)	Entropy 0.59362 (0.59728)	Top-1 acc 68.359 (63.430)	Top-5 acc 84.766 (83.637)	lr 0.00715
Train [77][2940/3239]	Time 0.235 (1.175)	Data Time 0.001 (0.653)	Loss 2.6356 (2.5114)	Entropy 0.59378 (0.59726)	Top-1 acc 59.375 (63.424)	Top-5 acc 81.250 (83.634)	lr 0.00715
Train [77][2950/3239]	Time 15.894 (1.177)	Data Time 15.641 (0.656)	Loss 2.4590 (2.5114)	Entropy 0.59386 (0.59725)	Top-1 acc 64.062 (63.420)	Top-5 acc 83.203 (83.635)	lr 0.00715
Train [77][2960/3239]	Time 0.232 (1.177)	Data Time 0.001 (0.657)	Loss 2.5808 (2.5116)	Entropy 0.59401 (0.59724)	Top-1 acc 60.938 (63.418)	Top-5 acc 81.250 (83.633)	lr 0.00714
Train [77][2970/3239]	Time 0.267 (1.175)	Data Time 0.001 (0.654)	Loss 2.4469 (2.5115)	Entropy 0.59397 (0.59723)	Top-1 acc 66.406 (63.417)	Top-5 acc 84.766 (83.634)	lr 0.00714
Train [77][2980/3239]	Time 0.234 (1.172)	Data Time 0.001 (0.652)	Loss 2.4319 (2.5115)	Entropy 0.59369 (0.59722)	Top-1 acc 66.797 (63.419)	Top-5 acc 83.984 (83.633)	lr 0.00714
Train [77][2990/3239]	Time 0.231 (1.178)	Data Time 0.002 (0.658)	Loss 2.8969 (2.5115)	Entropy 0.59335 (0.59721)	Top-1 acc 53.906 (63.419)	Top-5 acc 75.781 (83.633)	lr 0.00714
Train [77][3000/3239]	Time 0.235 (1.175)	Data Time 0.001 (0.656)	Loss 2.2729 (2.5115)	Entropy 0.59285 (0.59719)	Top-1 acc 71.094 (63.417)	Top-5 acc 88.281 (83.635)	lr 0.00714
Train [77][3010/3239]	Time 0.266 (1.173)	Data Time 0.002 (0.654)	Loss 2.5332 (2.5116)	Entropy 0.59250 (0.59718)	Top-1 acc 60.156 (63.414)	Top-5 acc 85.156 (83.634)	lr 0.00714
Train [77][3020/3239]	Time 0.283 (1.178)	Data Time 0.001 (0.659)	Loss 2.5107 (2.5117)	Entropy 0.59250 (0.59716)	Top-1 acc 61.328 (63.412)	Top-5 acc 83.984 (83.634)	lr 0.00714
Train [77][3030/3239]	Time 0.238 (1.175)	Data Time 0.001 (0.657)	Loss 2.5179 (2.5120)	Entropy 0.59271 (0.59715)	Top-1 acc 62.500 (63.406)	Top-5 acc 84.766 (83.630)	lr 0.00714
Train [77][3040/3239]	Time 0.231 (1.173)	Data Time 0.001 (0.655)	Loss 2.5820 (2.5120)	Entropy 0.59279 (0.59713)	Top-1 acc 64.062 (63.404)	Top-5 acc 83.203 (83.629)	lr 0.00714
Train [77][3050/3239]	Time 0.249 (1.177)	Data Time 0.001 (0.659)	Loss 2.4778 (2.5122)	Entropy 0.59272 (0.59712)	Top-1 acc 61.719 (63.403)	Top-5 acc 84.375 (83.624)	lr 0.00714
Train [77][3060/3239]	Time 0.265 (1.175)	Data Time 0.001 (0.657)	Loss 2.7126 (2.5121)	Entropy 0.59263 (0.59710)	Top-1 acc 60.156 (63.405)	Top-5 acc 79.688 (83.626)	lr 0.00714
Train [77][3070/3239]	Time 0.354 (1.172)	Data Time 0.001 (0.655)	Loss 2.5195 (2.5122)	Entropy 0.59284 (0.59709)	Top-1 acc 61.328 (63.403)	Top-5 acc 83.984 (83.624)	lr 0.00713
Train [77][3080/3239]	Time 0.281 (1.175)	Data Time 0.001 (0.658)	Loss 2.4483 (2.5123)	Entropy 0.59294 (0.59708)	Top-1 acc 67.578 (63.401)	Top-5 acc 85.156 (83.623)	lr 0.00713
Train [77][3090/3239]	Time 0.230 (1.176)	Data Time 0.001 (0.660)	Loss 2.5358 (2.5121)	Entropy 0.59322 (0.59706)	Top-1 acc 60.938 (63.403)	Top-5 acc 80.859 (83.623)	lr 0.00713
Train [77][3100/3239]	Time 0.215 (1.174)	Data Time 0.001 (0.658)	Loss 2.4696 (2.5122)	Entropy 0.59299 (0.59705)	Top-1 acc 66.016 (63.401)	Top-5 acc 85.938 (83.622)	lr 0.00713
Train [77][3110/3239]	Time 11.160 (1.175)	Data Time 10.892 (0.659)	Loss 2.5401 (2.5125)	Entropy 0.59293 (0.59704)	Top-1 acc 63.672 (63.394)	Top-5 acc 84.766 (83.619)	lr 0.00713
Train [77][3120/3239]	Time 0.253 (1.176)	Data Time 0.001 (0.661)	Loss 2.6446 (2.5123)	Entropy 0.59255 (0.59702)	Top-1 acc 63.672 (63.396)	Top-5 acc 79.688 (83.620)	lr 0.00713
Train [77][3130/3239]	Time 0.258 (1.174)	Data Time 0.001 (0.659)	Loss 2.4919 (2.5124)	Entropy 0.59265 (0.59701)	Top-1 acc 64.453 (63.395)	Top-5 acc 84.375 (83.620)	lr 0.00713
Train [77][3140/3239]	Time 0.340 (1.171)	Data Time 0.001 (0.657)	Loss 2.6237 (2.5123)	Entropy 0.59285 (0.59700)	Top-1 acc 61.328 (63.396)	Top-5 acc 82.031 (83.621)	lr 0.00713
Train [77][3150/3239]	Time 0.231 (1.177)	Data Time 0.001 (0.663)	Loss 2.3140 (2.5124)	Entropy 0.59290 (0.59698)	Top-1 acc 69.922 (63.395)	Top-5 acc 85.938 (83.622)	lr 0.00713
Train [77][3160/3239]	Time 0.238 (1.174)	Data Time 0.001 (0.660)	Loss 2.5683 (2.5124)	Entropy 0.59307 (0.59697)	Top-1 acc 62.500 (63.393)	Top-5 acc 84.375 (83.621)	lr 0.00713
Train [77][3170/3239]	Time 0.239 (1.172)	Data Time 0.001 (0.658)	Loss 2.4711 (2.5124)	Entropy 0.59269 (0.59696)	Top-1 acc 64.453 (63.394)	Top-5 acc 83.984 (83.621)	lr 0.00712
Train [77][3180/3239]	Time 6.344 (1.177)	Data Time 6.083 (0.664)	Loss 2.3955 (2.5124)	Entropy 0.59304 (0.59694)	Top-1 acc 66.016 (63.397)	Top-5 acc 85.547 (83.621)	lr 0.00712
Train [77][3190/3239]	Time 0.233 (1.175)	Data Time 0.000 (0.662)	Loss 2.3294 (2.5123)	Entropy 0.59267 (0.59693)	Top-1 acc 65.625 (63.395)	Top-5 acc 87.891 (83.623)	lr 0.00712
Train [77][3200/3239]	Time 0.235 (1.172)	Data Time 0.000 (0.659)	Loss 2.4904 (2.5124)	Entropy 0.59254 (0.59692)	Top-1 acc 65.234 (63.395)	Top-5 acc 83.594 (83.622)	lr 0.00712
Train [77][3210/3239]	Time 0.284 (1.175)	Data Time 0.000 (0.663)	Loss 2.3281 (2.5123)	Entropy 0.59236 (0.59690)	Top-1 acc 67.188 (63.399)	Top-5 acc 87.891 (83.624)	lr 0.00712
Train [77][3220/3239]	Time 0.234 (1.174)	Data Time 0.000 (0.662)	Loss 2.3436 (2.5123)	Entropy 0.59229 (0.59689)	Top-1 acc 65.625 (63.395)	Top-5 acc 84.766 (83.622)	lr 0.00712
Train [77][3230/3239]	Time 0.335 (1.171)	Data Time 0.000 (0.659)	Loss 2.4163 (2.5123)	Entropy 0.59228 (0.59688)	Top-1 acc 65.625 (63.393)	Top-5 acc 84.766 (83.619)	lr 0.00712
Train [77][3239/3239]	Time 1.040 (1.170)	Data Time 0.000 (0.658)	Loss 2.7468 (2.5124)	Entropy 0.59240 (0.59686)	Top-1 acc 61.728 (63.390)	Top-5 acc 76.543 (83.619)	lr 0.00712
==========Valid [77/120]	loss 1.301	top-1 acc 70.151 (70.151)	top-5 acc 88.890	Train top-1 63.390	top-5 83.619	Entropy 0.59240	Latency-None: 0.000ms	Flops: 539.00M
Train [78][0/3239]	Time 55.815 (55.815)	Data Time 52.455 (52.455)	Loss 2.6591 (2.6591)	Entropy 0.59248 (0.59248)	Top-1 acc 63.672 (63.672)	Top-5 acc 79.297 (79.297)	lr 0.00712
Train [78][10/3239]	Time 0.241 (5.574)	Data Time 0.001 (4.847)	Loss 2.4303 (2.4849)	Entropy 0.59280 (0.59256)	Top-1 acc 66.016 (64.631)	Top-5 acc 82.031 (84.126)	lr 0.00712
Train [78][20/3239]	Time 0.236 (3.121)	Data Time 0.001 (2.540)	Loss 2.4098 (2.4522)	Entropy 0.59276 (0.59265)	Top-1 acc 66.406 (65.290)	Top-5 acc 84.766 (84.580)	lr 0.00712
Train [78][30/3239]	Time 0.244 (2.248)	Data Time 0.001 (1.721)	Loss 2.4966 (2.4610)	Entropy 0.59238 (0.59261)	Top-1 acc 62.500 (64.919)	Top-5 acc 85.938 (84.388)	lr 0.00712
Train [78][40/3239]	Time 0.235 (1.969)	Data Time 0.001 (1.457)	Loss 2.4244 (2.4550)	Entropy 0.59246 (0.59255)	Top-1 acc 67.188 (64.996)	Top-5 acc 85.156 (84.585)	lr 0.00711
Train [78][50/3239]	Time 0.310 (2.702)	Data Time 0.004 (1.172)	Loss 2.4670 (2.4615)	Entropy 0.59261 (0.59254)	Top-1 acc 62.109 (64.775)	Top-5 acc 84.766 (84.367)	lr 0.00711
Train [78][60/3239]	Time 0.350 (2.331)	Data Time 0.002 (0.981)	Loss 2.4776 (2.4690)	Entropy 0.59281 (0.59256)	Top-1 acc 65.234 (64.652)	Top-5 acc 82.812 (84.298)	lr 0.00711
Train [78][70/3239]	Time 0.235 (2.062)	Data Time 0.001 (0.843)	Loss 2.5618 (2.4773)	Entropy 0.59294 (0.59260)	Top-1 acc 60.938 (64.393)	Top-5 acc 83.203 (84.182)	lr 0.00711
Train [78][80/3239]	Time 0.241 (1.859)	Data Time 0.001 (0.739)	Loss 2.4825 (2.4821)	Entropy 0.59321 (0.59266)	Top-1 acc 66.016 (64.231)	Top-5 acc 80.469 (84.004)	lr 0.00711
Train [78][90/3239]	Time 0.255 (1.705)	Data Time 0.003 (0.658)	Loss 2.2761 (2.4774)	Entropy 0.59325 (0.59273)	Top-1 acc 69.531 (64.487)	Top-5 acc 86.719 (84.010)	lr 0.00711
Train [78][100/3239]	Time 0.240 (1.580)	Data Time 0.001 (0.593)	Loss 2.5677 (2.4852)	Entropy 0.59323 (0.59278)	Top-1 acc 62.500 (64.213)	Top-5 acc 78.516 (83.868)	lr 0.00711
Train [78][110/3239]	Time 0.247 (1.479)	Data Time 0.001 (0.540)	Loss 2.4778 (2.4900)	Entropy 0.59328 (0.59282)	Top-1 acc 63.281 (64.101)	Top-5 acc 87.500 (83.865)	lr 0.00711
Train [78][120/3239]	Time 0.311 (1.393)	Data Time 0.001 (0.495)	Loss 2.5140 (2.4895)	Entropy 0.59345 (0.59287)	Top-1 acc 64.453 (64.104)	Top-5 acc 81.641 (83.878)	lr 0.00711
Train [78][130/3239]	Time 0.332 (1.319)	Data Time 0.001 (0.458)	Loss 2.4481 (2.4902)	Entropy 0.59367 (0.59291)	Top-1 acc 66.406 (64.131)	Top-5 acc 86.328 (83.856)	lr 0.00711
Train [78][140/3239]	Time 0.254 (1.256)	Data Time 0.001 (0.425)	Loss 2.3926 (2.4879)	Entropy 0.59384 (0.59298)	Top-1 acc 65.234 (64.148)	Top-5 acc 85.156 (83.921)	lr 0.00711
Train [78][150/3239]	Time 0.235 (1.211)	Data Time 0.002 (0.408)	Loss 2.4440 (2.4837)	Entropy 0.59392 (0.59303)	Top-1 acc 65.625 (64.210)	Top-5 acc 86.328 (83.990)	lr 0.00710
Train [78][160/3239]	Time 0.233 (1.170)	Data Time 0.001 (0.388)	Loss 2.4336 (2.4797)	Entropy 0.59387 (0.59309)	Top-1 acc 67.969 (64.303)	Top-5 acc 84.766 (84.098)	lr 0.00710
Train [78][170/3239]	Time 0.272 (1.139)	Data Time 0.001 (0.378)	Loss 2.5603 (2.4863)	Entropy 0.59360 (0.59313)	Top-1 acc 64.062 (64.115)	Top-5 acc 80.859 (84.019)	lr 0.00710
Train [78][180/3239]	Time 0.233 (1.126)	Data Time 0.001 (0.382)	Loss 2.6865 (2.4916)	Entropy 0.59311 (0.59315)	Top-1 acc 62.500 (64.000)	Top-5 acc 79.297 (83.930)	lr 0.00710
Train [78][190/3239]	Time 0.238 (1.096)	Data Time 0.002 (0.370)	Loss 2.4445 (2.4929)	Entropy 0.59334 (0.59315)	Top-1 acc 63.672 (64.005)	Top-5 acc 84.375 (83.927)	lr 0.00710
Train [78][200/3239]	Time 0.260 (1.068)	Data Time 0.001 (0.355)	Loss 2.6212 (2.4945)	Entropy 0.59351 (0.59316)	Top-1 acc 58.984 (63.926)	Top-5 acc 83.984 (83.907)	lr 0.00710
Train [78][210/3239]	Time 0.232 (1.052)	Data Time 0.001 (0.352)	Loss 2.4786 (2.4962)	Entropy 0.59387 (0.59319)	Top-1 acc 63.672 (63.890)	Top-5 acc 82.422 (83.834)	lr 0.00710
Train [78][220/3239]	Time 0.273 (1.043)	Data Time 0.002 (0.355)	Loss 2.3850 (2.4947)	Entropy 0.59391 (0.59322)	Top-1 acc 67.188 (63.918)	Top-5 acc 83.594 (83.871)	lr 0.00710
Train [78][230/3239]	Time 0.260 (1.016)	Data Time 0.001 (0.340)	Loss 2.5677 (2.4950)	Entropy 0.59354 (0.59324)	Top-1 acc 65.625 (63.934)	Top-5 acc 81.250 (83.874)	lr 0.00710
Train [78][240/3239]	Time 0.229 (1.004)	Data Time 0.001 (0.338)	Loss 2.5230 (2.4943)	Entropy 0.59341 (0.59325)	Top-1 acc 61.719 (63.960)	Top-5 acc 83.984 (83.856)	lr 0.00710
Train [78][250/3239]	Time 0.239 (1.009)	Data Time 0.001 (0.352)	Loss 2.6011 (2.4960)	Entropy 0.59343 (0.59326)	Top-1 acc 64.453 (63.933)	Top-5 acc 80.469 (83.826)	lr 0.00710
Train [78][260/3239]	Time 0.231 (0.987)	Data Time 0.001 (0.339)	Loss 2.4054 (2.4984)	Entropy 0.59316 (0.59326)	Top-1 acc 66.016 (63.869)	Top-5 acc 84.766 (83.800)	lr 0.00709
Train [78][270/3239]	Time 0.974 (0.970)	Data Time 0.696 (0.329)	Loss 2.4527 (2.5003)	Entropy 0.59310 (0.59325)	Top-1 acc 61.719 (63.781)	Top-5 acc 87.891 (83.771)	lr 0.00709
Train [78][280/3239]	Time 0.241 (0.968)	Data Time 0.001 (0.335)	Loss 2.4887 (2.4986)	Entropy 0.59309 (0.59324)	Top-1 acc 64.844 (63.803)	Top-5 acc 84.375 (83.795)	lr 0.00709
Train [78][290/3239]	Time 0.356 (0.953)	Data Time 0.001 (0.326)	Loss 2.3029 (2.4970)	Entropy 0.59298 (0.59324)	Top-1 acc 66.797 (63.825)	Top-5 acc 88.281 (83.827)	lr 0.00709
Train [78][300/3239]	Time 0.281 (0.936)	Data Time 0.001 (0.315)	Loss 2.5977 (2.4976)	Entropy 0.59291 (0.59323)	Top-1 acc 62.891 (63.835)	Top-5 acc 82.812 (83.812)	lr 0.00709
Train [78][310/3239]	Time 0.247 (0.924)	Data Time 0.001 (0.310)	Loss 2.3872 (2.4985)	Entropy 0.59264 (0.59322)	Top-1 acc 66.016 (63.820)	Top-5 acc 85.547 (83.788)	lr 0.00709
Train [78][320/3239]	Time 0.232 (0.927)	Data Time 0.001 (0.317)	Loss 2.4698 (2.4978)	Entropy 0.59229 (0.59319)	Top-1 acc 64.453 (63.839)	Top-5 acc 83.203 (83.762)	lr 0.00709
Train [78][330/3239]	Time 0.260 (0.912)	Data Time 0.001 (0.308)	Loss 2.4218 (2.4970)	Entropy 0.59224 (0.59317)	Top-1 acc 63.672 (63.862)	Top-5 acc 86.719 (83.763)	lr 0.00709
Train [78][340/3239]	Time 0.283 (0.913)	Data Time 0.001 (0.314)	Loss 2.5452 (2.4979)	Entropy 0.59229 (0.59314)	Top-1 acc 63.672 (63.829)	Top-5 acc 82.422 (83.762)	lr 0.00709
Train [78][350/3239]	Time 0.242 (0.910)	Data Time 0.002 (0.316)	Loss 2.3201 (2.4962)	Entropy 0.59239 (0.59312)	Top-1 acc 69.141 (63.892)	Top-5 acc 87.109 (83.792)	lr 0.00709
Train [78][360/3239]	Time 0.362 (0.897)	Data Time 0.001 (0.307)	Loss 2.3901 (2.4957)	Entropy 0.59227 (0.59310)	Top-1 acc 67.188 (63.882)	Top-5 acc 86.328 (83.804)	lr 0.00709
Train [78][370/3239]	Time 0.235 (0.888)	Data Time 0.001 (0.302)	Loss 2.3150 (2.4951)	Entropy 0.59227 (0.59308)	Top-1 acc 68.750 (63.887)	Top-5 acc 86.719 (83.834)	lr 0.00708
Train [78][380/3239]	Time 0.239 (0.890)	Data Time 0.001 (0.309)	Loss 2.2422 (2.4947)	Entropy 0.59225 (0.59305)	Top-1 acc 69.141 (63.890)	Top-5 acc 87.500 (83.834)	lr 0.00708
Train [78][390/3239]	Time 0.231 (0.878)	Data Time 0.001 (0.301)	Loss 2.5577 (2.4939)	Entropy 0.59241 (0.59303)	Top-1 acc 60.938 (63.892)	Top-5 acc 83.203 (83.872)	lr 0.00708
Train [78][400/3239]	Time 0.244 (0.876)	Data Time 0.001 (0.304)	Loss 2.7098 (2.4951)	Entropy 0.59239 (0.59301)	Top-1 acc 58.203 (63.864)	Top-5 acc 80.078 (83.849)	lr 0.00708
Train [78][410/3239]	Time 0.248 (0.881)	Data Time 0.001 (0.311)	Loss 2.5245 (2.4946)	Entropy 0.59239 (0.59300)	Top-1 acc 62.109 (63.877)	Top-5 acc 82.812 (83.850)	lr 0.00708
Train [78][420/3239]	Time 0.222 (0.870)	Data Time 0.001 (0.304)	Loss 2.6321 (2.4937)	Entropy 0.59251 (0.59298)	Top-1 acc 62.500 (63.898)	Top-5 acc 80.469 (83.871)	lr 0.00708
Train [78][430/3239]	Time 0.243 (0.864)	Data Time 0.002 (0.301)	Loss 2.6104 (2.4924)	Entropy 0.59231 (0.59297)	Top-1 acc 61.719 (63.939)	Top-5 acc 81.641 (83.892)	lr 0.00708
Train [78][440/3239]	Time 0.273 (0.867)	Data Time 0.002 (0.308)	Loss 2.4320 (2.4929)	Entropy 0.59216 (0.59296)	Top-1 acc 64.844 (63.936)	Top-5 acc 85.938 (83.891)	lr 0.00708
Train [78][450/3239]	Time 0.352 (0.858)	Data Time 0.001 (0.301)	Loss 2.4103 (2.4925)	Entropy 0.59182 (0.59293)	Top-1 acc 63.672 (63.948)	Top-5 acc 84.375 (83.887)	lr 0.00708
Train [78][460/3239]	Time 0.252 (0.848)	Data Time 0.001 (0.294)	Loss 2.5321 (2.4928)	Entropy 0.59175 (0.59291)	Top-1 acc 63.672 (63.941)	Top-5 acc 85.156 (83.892)	lr 0.00708
Train [78][470/3239]	Time 0.237 (0.852)	Data Time 0.001 (0.301)	Loss 2.5474 (2.4934)	Entropy 0.59161 (0.59288)	Top-1 acc 64.844 (63.928)	Top-5 acc 82.422 (83.882)	lr 0.00708
Train [78][480/3239]	Time 0.228 (0.849)	Data Time 0.001 (0.300)	Loss 2.3548 (2.4930)	Entropy 0.59156 (0.59286)	Top-1 acc 67.578 (63.925)	Top-5 acc 84.766 (83.878)	lr 0.00707
Train [78][490/3239]	Time 0.233 (0.840)	Data Time 0.001 (0.294)	Loss 2.3758 (2.4929)	Entropy 0.59132 (0.59283)	Top-1 acc 64.844 (63.916)	Top-5 acc 86.719 (83.878)	lr 0.00707
Train [78][500/3239]	Time 2.378 (0.840)	Data Time 2.140 (0.296)	Loss 2.5584 (2.4935)	Entropy 0.59157 (0.59280)	Top-1 acc 59.766 (63.898)	Top-5 acc 83.203 (83.874)	lr 0.00707
Train [78][510/3239]	Time 0.236 (0.843)	Data Time 0.001 (0.301)	Loss 2.3962 (2.4942)	Entropy 0.59138 (0.59278)	Top-1 acc 67.578 (63.887)	Top-5 acc 85.156 (83.870)	lr 0.00707
Train [78][520/3239]	Time 0.361 (0.834)	Data Time 0.001 (0.296)	Loss 2.5574 (2.4942)	Entropy 0.59134 (0.59275)	Top-1 acc 60.547 (63.882)	Top-5 acc 84.375 (83.867)	lr 0.00707
Train [78][530/3239]	Time 0.248 (0.831)	Data Time 0.001 (0.295)	Loss 2.3934 (2.4940)	Entropy 0.59172 (0.59273)	Top-1 acc 63.672 (63.890)	Top-5 acc 85.156 (83.884)	lr 0.00707
Train [78][540/3239]	Time 0.223 (0.838)	Data Time 0.001 (0.304)	Loss 2.4681 (2.4947)	Entropy 0.59173 (0.59271)	Top-1 acc 66.016 (63.876)	Top-5 acc 83.984 (83.869)	lr 0.00707
Train [78][550/3239]	Time 0.228 (0.830)	Data Time 0.001 (0.298)	Loss 2.3569 (2.4953)	Entropy 0.59196 (0.59269)	Top-1 acc 66.797 (63.872)	Top-5 acc 84.766 (83.860)	lr 0.00707
Train [78][560/3239]	Time 0.234 (0.825)	Data Time 0.001 (0.295)	Loss 2.7105 (2.4955)	Entropy 0.59192 (0.59268)	Top-1 acc 60.156 (63.870)	Top-5 acc 81.641 (83.858)	lr 0.00707
Train [78][570/3239]	Time 0.231 (0.833)	Data Time 0.001 (0.305)	Loss 2.5468 (2.4961)	Entropy 0.59221 (0.59267)	Top-1 acc 60.156 (63.859)	Top-5 acc 84.766 (83.841)	lr 0.00707
Train [78][580/3239]	Time 0.271 (0.826)	Data Time 0.001 (0.300)	Loss 2.6740 (2.4949)	Entropy 0.59236 (0.59266)	Top-1 acc 60.938 (63.881)	Top-5 acc 78.516 (83.863)	lr 0.00707
Train [78][590/3239]	Time 0.231 (0.820)	Data Time 0.001 (0.294)	Loss 2.5428 (2.4951)	Entropy 0.59196 (0.59265)	Top-1 acc 57.812 (63.853)	Top-5 acc 85.547 (83.870)	lr 0.00706
Train [78][600/3239]	Time 0.230 (0.836)	Data Time 0.001 (0.312)	Loss 2.6362 (2.4966)	Entropy 0.59190 (0.59264)	Top-1 acc 57.812 (63.819)	Top-5 acc 83.203 (83.852)	lr 0.00706
Train [78][610/3239]	Time 0.328 (0.830)	Data Time 0.001 (0.307)	Loss 2.5724 (2.4970)	Entropy 0.59167 (0.59263)	Top-1 acc 61.719 (63.825)	Top-5 acc 83.594 (83.833)	lr 0.00706
Train [78][620/3239]	Time 0.237 (0.823)	Data Time 0.001 (0.302)	Loss 2.2537 (2.4966)	Entropy 0.59163 (0.59261)	Top-1 acc 72.656 (63.851)	Top-5 acc 89.062 (83.847)	lr 0.00706
Train [78][630/3239]	Time 0.260 (0.817)	Data Time 0.001 (0.297)	Loss 2.5847 (2.4965)	Entropy 0.59143 (0.59260)	Top-1 acc 62.500 (63.845)	Top-5 acc 83.203 (83.845)	lr 0.00706
Train [78][640/3239]	Time 0.238 (0.820)	Data Time 0.001 (0.302)	Loss 2.5032 (2.4966)	Entropy 0.59163 (0.59258)	Top-1 acc 64.062 (63.840)	Top-5 acc 83.203 (83.849)	lr 0.00706
Train [78][650/3239]	Time 0.251 (0.815)	Data Time 0.001 (0.298)	Loss 2.2364 (2.4968)	Entropy 0.59158 (0.59257)	Top-1 acc 71.875 (63.826)	Top-5 acc 89.844 (83.854)	lr 0.00706
Train [78][660/3239]	Time 0.244 (0.809)	Data Time 0.001 (0.294)	Loss 2.5050 (2.4976)	Entropy 0.59176 (0.59255)	Top-1 acc 63.281 (63.809)	Top-5 acc 84.375 (83.841)	lr 0.00706
Train [78][670/3239]	Time 0.269 (0.820)	Data Time 0.001 (0.306)	Loss 2.5355 (2.4984)	Entropy 0.59193 (0.59254)	Top-1 acc 63.672 (63.785)	Top-5 acc 83.984 (83.836)	lr 0.00706
Train [78][680/3239]	Time 0.343 (0.815)	Data Time 0.001 (0.301)	Loss 2.4126 (2.4979)	Entropy 0.59231 (0.59254)	Top-1 acc 65.625 (63.804)	Top-5 acc 87.500 (83.848)	lr 0.00706
Train [78][690/3239]	Time 0.233 (0.809)	Data Time 0.001 (0.297)	Loss 2.5935 (2.4991)	Entropy 0.59210 (0.59253)	Top-1 acc 64.844 (63.780)	Top-5 acc 83.594 (83.825)	lr 0.00706
Train [78][700/3239]	Time 0.332 (0.889)	Data Time 0.005 (0.302)	Loss 2.5389 (2.4988)	Entropy 0.59188 (0.59252)	Top-1 acc 59.766 (63.768)	Top-5 acc 83.594 (83.838)	lr 0.00705
Train [78][710/3239]	Time 0.241 (0.884)	Data Time 0.002 (0.298)	Loss 2.6218 (2.4989)	Entropy 0.59199 (0.59252)	Top-1 acc 57.812 (63.744)	Top-5 acc 82.812 (83.831)	lr 0.00705
Train [78][720/3239]	Time 0.247 (0.877)	Data Time 0.002 (0.294)	Loss 2.5976 (2.4993)	Entropy 0.59177 (0.59251)	Top-1 acc 61.719 (63.734)	Top-5 acc 81.641 (83.826)	lr 0.00705
Train [78][730/3239]	Time 0.243 (0.871)	Data Time 0.002 (0.290)	Loss 2.4034 (2.4984)	Entropy 0.59211 (0.59250)	Top-1 acc 64.844 (63.758)	Top-5 acc 87.500 (83.847)	lr 0.00705
Train [78][740/3239]	Time 0.227 (0.865)	Data Time 0.001 (0.286)	Loss 2.5374 (2.4986)	Entropy 0.59237 (0.59249)	Top-1 acc 61.719 (63.753)	Top-5 acc 83.203 (83.845)	lr 0.00705
Train [78][750/3239]	Time 0.235 (0.859)	Data Time 0.001 (0.282)	Loss 2.4943 (2.4987)	Entropy 0.59232 (0.59249)	Top-1 acc 62.500 (63.750)	Top-5 acc 82.812 (83.842)	lr 0.00705
Train [78][760/3239]	Time 0.239 (0.854)	Data Time 0.001 (0.278)	Loss 2.5572 (2.4986)	Entropy 0.59214 (0.59249)	Top-1 acc 60.547 (63.755)	Top-5 acc 82.812 (83.837)	lr 0.00705
Train [78][770/3239]	Time 0.373 (0.848)	Data Time 0.003 (0.275)	Loss 2.6053 (2.4990)	Entropy 0.59235 (0.59249)	Top-1 acc 62.109 (63.741)	Top-5 acc 82.422 (83.833)	lr 0.00705
Train [78][780/3239]	Time 0.235 (0.843)	Data Time 0.001 (0.271)	Loss 2.6924 (2.5000)	Entropy 0.59231 (0.59248)	Top-1 acc 60.547 (63.713)	Top-5 acc 78.516 (83.813)	lr 0.00705
Train [78][790/3239]	Time 0.245 (0.838)	Data Time 0.001 (0.268)	Loss 2.5395 (2.5001)	Entropy 0.59251 (0.59248)	Top-1 acc 65.625 (63.719)	Top-5 acc 82.812 (83.806)	lr 0.00705
Train [78][800/3239]	Time 0.282 (0.845)	Data Time 0.001 (0.276)	Loss 2.5036 (2.5000)	Entropy 0.59248 (0.59248)	Top-1 acc 62.109 (63.715)	Top-5 acc 85.156 (83.807)	lr 0.00705
Train [78][810/3239]	Time 0.251 (0.843)	Data Time 0.001 (0.276)	Loss 2.6189 (2.4996)	Entropy 0.59258 (0.59248)	Top-1 acc 57.812 (63.703)	Top-5 acc 81.250 (83.813)	lr 0.00704
Train [78][820/3239]	Time 0.239 (0.842)	Data Time 0.001 (0.276)	Loss 2.4678 (2.4994)	Entropy 0.59264 (0.59248)	Top-1 acc 65.234 (63.699)	Top-5 acc 83.594 (83.815)	lr 0.00704
Train [78][830/3239]	Time 0.242 (0.848)	Data Time 0.001 (0.285)	Loss 2.2935 (2.4997)	Entropy 0.59257 (0.59249)	Top-1 acc 67.969 (63.695)	Top-5 acc 88.281 (83.821)	lr 0.00704
Train [78][840/3239]	Time 0.364 (0.845)	Data Time 0.003 (0.282)	Loss 2.5503 (2.5003)	Entropy 0.59271 (0.59249)	Top-1 acc 62.891 (63.692)	Top-5 acc 81.641 (83.815)	lr 0.00704
Train [78][850/3239]	Time 0.222 (0.842)	Data Time 0.001 (0.281)	Loss 2.5864 (2.4997)	Entropy 0.59256 (0.59249)	Top-1 acc 60.938 (63.710)	Top-5 acc 81.250 (83.820)	lr 0.00704
Train [78][860/3239]	Time 9.096 (0.847)	Data Time 8.839 (0.288)	Loss 2.4953 (2.4997)	Entropy 0.59277 (0.59249)	Top-1 acc 62.891 (63.708)	Top-5 acc 83.984 (83.821)	lr 0.00704
Train [78][870/3239]	Time 0.236 (0.846)	Data Time 0.001 (0.288)	Loss 2.4565 (2.4999)	Entropy 0.59302 (0.59250)	Top-1 acc 64.453 (63.698)	Top-5 acc 84.375 (83.823)	lr 0.00704
Train [78][880/3239]	Time 0.223 (0.841)	Data Time 0.001 (0.285)	Loss 2.8095 (2.5003)	Entropy 0.59235 (0.59250)	Top-1 acc 57.422 (63.693)	Top-5 acc 79.297 (83.812)	lr 0.00704
Train [78][890/3239]	Time 0.237 (0.840)	Data Time 0.001 (0.285)	Loss 2.3766 (2.5002)	Entropy 0.59258 (0.59250)	Top-1 acc 68.359 (63.698)	Top-5 acc 83.984 (83.806)	lr 0.00704
Train [78][900/3239]	Time 0.283 (0.847)	Data Time 0.002 (0.294)	Loss 2.4891 (2.5010)	Entropy 0.59259 (0.59250)	Top-1 acc 64.453 (63.673)	Top-5 acc 83.984 (83.790)	lr 0.00704
Train [78][910/3239]	Time 0.265 (0.843)	Data Time 0.003 (0.291)	Loss 2.3579 (2.5012)	Entropy 0.59264 (0.59250)	Top-1 acc 66.406 (63.672)	Top-5 acc 85.938 (83.783)	lr 0.00704
Train [78][920/3239]	Time 0.279 (0.848)	Data Time 0.003 (0.297)	Loss 2.5173 (2.5013)	Entropy 0.59269 (0.59250)	Top-1 acc 62.500 (63.661)	Top-5 acc 83.594 (83.787)	lr 0.00703
Train [78][930/3239]	Time 2.481 (0.848)	Data Time 2.194 (0.299)	Loss 2.6967 (2.5015)	Entropy 0.59252 (0.59251)	Top-1 acc 57.812 (63.656)	Top-5 acc 81.250 (83.786)	lr 0.00703
Train [78][940/3239]	Time 0.259 (0.843)	Data Time 0.001 (0.295)	Loss 2.6757 (2.5015)	Entropy 0.59200 (0.59250)	Top-1 acc 62.500 (63.660)	Top-5 acc 82.812 (83.791)	lr 0.00703
Train [78][950/3239]	Time 0.254 (0.849)	Data Time 0.002 (0.302)	Loss 2.5781 (2.5017)	Entropy 0.59213 (0.59250)	Top-1 acc 63.672 (63.656)	Top-5 acc 84.375 (83.790)	lr 0.00703
Train [78][960/3239]	Time 0.234 (0.846)	Data Time 0.001 (0.300)	Loss 2.4322 (2.5017)	Entropy 0.59217 (0.59250)	Top-1 acc 64.844 (63.652)	Top-5 acc 85.938 (83.794)	lr 0.00703
Train [78][970/3239]	Time 0.243 (0.845)	Data Time 0.001 (0.300)	Loss 2.4538 (2.5015)	Entropy 0.59213 (0.59249)	Top-1 acc 61.328 (63.653)	Top-5 acc 84.375 (83.803)	lr 0.00703
Train [78][980/3239]	Time 0.276 (0.848)	Data Time 0.001 (0.305)	Loss 2.4276 (2.5016)	Entropy 0.59203 (0.59249)	Top-1 acc 66.016 (63.661)	Top-5 acc 87.109 (83.803)	lr 0.00703
Train [78][990/3239]	Time 0.235 (0.844)	Data Time 0.001 (0.302)	Loss 2.6058 (2.5017)	Entropy 0.59216 (0.59248)	Top-1 acc 62.109 (63.653)	Top-5 acc 82.812 (83.801)	lr 0.00703
Train [78][1000/3239]	Time 0.356 (0.846)	Data Time 0.001 (0.304)	Loss 2.5137 (2.5012)	Entropy 0.59186 (0.59248)	Top-1 acc 61.719 (63.664)	Top-5 acc 83.594 (83.810)	lr 0.00703
Train [78][1010/3239]	Time 0.245 (0.847)	Data Time 0.001 (0.307)	Loss 2.3536 (2.5015)	Entropy 0.59228 (0.59248)	Top-1 acc 67.969 (63.661)	Top-5 acc 85.938 (83.804)	lr 0.00703
Train [78][1020/3239]	Time 1.395 (0.844)	Data Time 1.159 (0.305)	Loss 2.6974 (2.5020)	Entropy 0.59221 (0.59247)	Top-1 acc 59.766 (63.653)	Top-5 acc 80.859 (83.793)	lr 0.00703
Train [78][1030/3239]	Time 0.234 (0.848)	Data Time 0.001 (0.310)	Loss 2.4816 (2.5013)	Entropy 0.59217 (0.59247)	Top-1 acc 64.453 (63.669)	Top-5 acc 83.984 (83.806)	lr 0.00702
Train [78][1040/3239]	Time 0.236 (0.844)	Data Time 0.001 (0.307)	Loss 2.4220 (2.5013)	Entropy 0.59236 (0.59247)	Top-1 acc 66.016 (63.672)	Top-5 acc 85.547 (83.806)	lr 0.00702
Train [78][1050/3239]	Time 0.276 (0.848)	Data Time 0.001 (0.312)	Loss 2.4440 (2.5018)	Entropy 0.59251 (0.59247)	Top-1 acc 62.109 (63.655)	Top-5 acc 85.938 (83.806)	lr 0.00702
Train [78][1060/3239]	Time 0.222 (0.848)	Data Time 0.001 (0.313)	Loss 2.7610 (2.5021)	Entropy 0.59201 (0.59247)	Top-1 acc 57.422 (63.644)	Top-5 acc 77.734 (83.794)	lr 0.00702
Train [78][1070/3239]	Time 0.316 (0.844)	Data Time 0.001 (0.310)	Loss 2.6041 (2.5019)	Entropy 0.59192 (0.59246)	Top-1 acc 60.547 (63.647)	Top-5 acc 81.250 (83.802)	lr 0.00702
Train [78][1080/3239]	Time 0.295 (0.849)	Data Time 0.001 (0.316)	Loss 2.6288 (2.5018)	Entropy 0.59199 (0.59246)	Top-1 acc 61.328 (63.656)	Top-5 acc 79.688 (83.795)	lr 0.00702
Train [78][1090/3239]	Time 0.240 (0.851)	Data Time 0.001 (0.320)	Loss 2.3665 (2.5017)	Entropy 0.59208 (0.59245)	Top-1 acc 66.406 (63.656)	Top-5 acc 88.672 (83.806)	lr 0.00702
Train [78][1100/3239]	Time 0.229 (0.848)	Data Time 0.001 (0.317)	Loss 2.5128 (2.5015)	Entropy 0.59174 (0.59245)	Top-1 acc 61.328 (63.649)	Top-5 acc 82.422 (83.812)	lr 0.00702
Train [78][1110/3239]	Time 0.235 (0.853)	Data Time 0.001 (0.323)	Loss 2.4278 (2.5019)	Entropy 0.59151 (0.59244)	Top-1 acc 66.406 (63.640)	Top-5 acc 84.375 (83.810)	lr 0.00702
Train [78][1120/3239]	Time 0.244 (0.853)	Data Time 0.001 (0.324)	Loss 2.4067 (2.5020)	Entropy 0.59171 (0.59244)	Top-1 acc 65.234 (63.636)	Top-5 acc 83.984 (83.809)	lr 0.00702
Train [78][1130/3239]	Time 0.239 (0.849)	Data Time 0.001 (0.321)	Loss 2.4690 (2.5022)	Entropy 0.59205 (0.59243)	Top-1 acc 63.281 (63.629)	Top-5 acc 85.156 (83.802)	lr 0.00702
Train [78][1140/3239]	Time 0.224 (0.854)	Data Time 0.001 (0.327)	Loss 2.4676 (2.5020)	Entropy 0.59197 (0.59243)	Top-1 acc 66.406 (63.637)	Top-5 acc 85.938 (83.802)	lr 0.00701
Train [78][1150/3239]	Time 0.264 (0.850)	Data Time 0.002 (0.324)	Loss 2.4935 (2.5019)	Entropy 0.59181 (0.59242)	Top-1 acc 61.719 (63.636)	Top-5 acc 86.328 (83.806)	lr 0.00701
Train [78][1160/3239]	Time 1.097 (0.851)	Data Time 0.733 (0.326)	Loss 2.5861 (2.5018)	Entropy 0.59183 (0.59242)	Top-1 acc 58.203 (63.640)	Top-5 acc 83.203 (83.812)	lr 0.00701
Train [78][1170/3239]	Time 0.249 (0.856)	Data Time 0.001 (0.332)	Loss 2.3642 (2.5018)	Entropy 0.59179 (0.59241)	Top-1 acc 66.406 (63.638)	Top-5 acc 86.328 (83.814)	lr 0.00701
Train [78][1180/3239]	Time 0.230 (0.852)	Data Time 0.001 (0.329)	Loss 2.3565 (2.5015)	Entropy 0.59163 (0.59241)	Top-1 acc 69.141 (63.642)	Top-5 acc 84.766 (83.821)	lr 0.00701
Train [78][1190/3239]	Time 0.257 (0.852)	Data Time 0.001 (0.330)	Loss 2.6062 (2.5014)	Entropy 0.59166 (0.59240)	Top-1 acc 62.500 (63.644)	Top-5 acc 83.594 (83.825)	lr 0.00701
Train [78][1200/3239]	Time 2.500 (0.850)	Data Time 2.248 (0.329)	Loss 2.6076 (2.5016)	Entropy 0.59178 (0.59240)	Top-1 acc 58.594 (63.639)	Top-5 acc 81.641 (83.819)	lr 0.00701
Train [78][1210/3239]	Time 0.299 (0.857)	Data Time 0.001 (0.336)	Loss 2.4850 (2.5017)	Entropy 0.59147 (0.59239)	Top-1 acc 63.672 (63.633)	Top-5 acc 83.203 (83.821)	lr 0.00701
Train [78][1220/3239]	Time 0.251 (0.854)	Data Time 0.001 (0.333)	Loss 2.7007 (2.5018)	Entropy 0.59169 (0.59238)	Top-1 acc 57.422 (63.638)	Top-5 acc 80.859 (83.818)	lr 0.00701
Train [78][1230/3239]	Time 0.326 (0.851)	Data Time 0.001 (0.331)	Loss 2.3357 (2.5015)	Entropy 0.59147 (0.59238)	Top-1 acc 69.141 (63.642)	Top-5 acc 87.500 (83.822)	lr 0.00701
Train [78][1240/3239]	Time 0.228 (0.858)	Data Time 0.001 (0.339)	Loss 2.5132 (2.5017)	Entropy 0.59145 (0.59237)	Top-1 acc 66.797 (63.633)	Top-5 acc 81.250 (83.817)	lr 0.00701
Train [78][1250/3239]	Time 0.247 (0.854)	Data Time 0.001 (0.336)	Loss 2.3557 (2.5018)	Entropy 0.59117 (0.59236)	Top-1 acc 64.453 (63.628)	Top-5 acc 88.672 (83.822)	lr 0.00700
Train [78][1260/3239]	Time 0.685 (0.852)	Data Time 0.461 (0.335)	Loss 2.5089 (2.5020)	Entropy 0.59106 (0.59235)	Top-1 acc 65.625 (63.625)	Top-5 acc 83.203 (83.819)	lr 0.00700
Train [78][1270/3239]	Time 0.230 (0.860)	Data Time 0.001 (0.344)	Loss 2.4224 (2.5017)	Entropy 0.59083 (0.59234)	Top-1 acc 64.062 (63.632)	Top-5 acc 84.375 (83.828)	lr 0.00700
Train [78][1280/3239]	Time 0.233 (0.857)	Data Time 0.001 (0.341)	Loss 2.5205 (2.5014)	Entropy 0.59101 (0.59233)	Top-1 acc 64.453 (63.637)	Top-5 acc 83.203 (83.833)	lr 0.00700
Train [78][1290/3239]	Time 0.233 (0.853)	Data Time 0.001 (0.338)	Loss 2.5549 (2.5020)	Entropy 0.59026 (0.59232)	Top-1 acc 60.938 (63.629)	Top-5 acc 84.375 (83.819)	lr 0.00700
Train [78][1300/3239]	Time 0.239 (0.864)	Data Time 0.001 (0.350)	Loss 2.5235 (2.5018)	Entropy 0.59033 (0.59230)	Top-1 acc 64.453 (63.634)	Top-5 acc 84.375 (83.825)	lr 0.00700
Train [78][1310/3239]	Time 0.242 (0.861)	Data Time 0.001 (0.347)	Loss 2.6339 (2.5022)	Entropy 0.59023 (0.59229)	Top-1 acc 62.109 (63.629)	Top-5 acc 80.078 (83.818)	lr 0.00700
Train [78][1320/3239]	Time 0.288 (0.857)	Data Time 0.001 (0.344)	Loss 2.4930 (2.5023)	Entropy 0.59048 (0.59227)	Top-1 acc 63.281 (63.629)	Top-5 acc 83.984 (83.821)	lr 0.00700
Train [78][1330/3239]	Time 0.234 (0.868)	Data Time 0.001 (0.356)	Loss 2.6711 (2.5028)	Entropy 0.59052 (0.59226)	Top-1 acc 59.766 (63.616)	Top-5 acc 82.812 (83.818)	lr 0.00700
Train [78][1340/3239]	Time 0.267 (0.865)	Data Time 0.001 (0.353)	Loss 2.4013 (2.5029)	Entropy 0.59061 (0.59225)	Top-1 acc 65.625 (63.613)	Top-5 acc 85.547 (83.814)	lr 0.00700
Train [78][1350/3239]	Time 0.235 (0.861)	Data Time 0.001 (0.351)	Loss 2.6582 (2.5034)	Entropy 0.59072 (0.59223)	Top-1 acc 60.547 (63.605)	Top-5 acc 81.250 (83.799)	lr 0.00700
Train [78][1360/3239]	Time 0.278 (0.899)	Data Time 0.002 (0.348)	Loss 2.4659 (2.5037)	Entropy 0.59072 (0.59222)	Top-1 acc 63.281 (63.603)	Top-5 acc 87.109 (83.797)	lr 0.00699
Train [78][1370/3239]	Time 0.232 (0.895)	Data Time 0.002 (0.345)	Loss 2.4755 (2.5038)	Entropy 0.59079 (0.59221)	Top-1 acc 61.719 (63.600)	Top-5 acc 84.766 (83.784)	lr 0.00699
Train [78][1380/3239]	Time 0.254 (0.891)	Data Time 0.002 (0.343)	Loss 2.4317 (2.5034)	Entropy 0.59073 (0.59220)	Top-1 acc 64.453 (63.610)	Top-5 acc 83.984 (83.788)	lr 0.00699
Train [78][1390/3239]	Time 0.329 (0.888)	Data Time 0.001 (0.341)	Loss 2.5572 (2.5035)	Entropy 0.59078 (0.59219)	Top-1 acc 63.672 (63.615)	Top-5 acc 84.766 (83.786)	lr 0.00699
Train [78][1400/3239]	Time 0.252 (0.885)	Data Time 0.003 (0.338)	Loss 2.4114 (2.5040)	Entropy 0.59096 (0.59218)	Top-1 acc 64.062 (63.602)	Top-5 acc 84.375 (83.775)	lr 0.00699
Train [78][1410/3239]	Time 0.254 (0.881)	Data Time 0.001 (0.336)	Loss 2.5510 (2.5037)	Entropy 0.59111 (0.59217)	Top-1 acc 59.375 (63.612)	Top-5 acc 84.375 (83.776)	lr 0.00699
Train [78][1420/3239]	Time 0.258 (0.878)	Data Time 0.002 (0.333)	Loss 2.4114 (2.5036)	Entropy 0.59117 (0.59217)	Top-1 acc 66.797 (63.617)	Top-5 acc 85.156 (83.780)	lr 0.00699
Train [78][1430/3239]	Time 0.323 (0.876)	Data Time 0.094 (0.332)	Loss 2.4692 (2.5035)	Entropy 0.59141 (0.59216)	Top-1 acc 62.109 (63.620)	Top-5 acc 84.766 (83.779)	lr 0.00699
Train [78][1440/3239]	Time 2.017 (0.876)	Data Time 1.763 (0.333)	Loss 2.3132 (2.5035)	Entropy 0.59150 (0.59216)	Top-1 acc 67.188 (63.618)	Top-5 acc 87.109 (83.779)	lr 0.00699
Train [78][1450/3239]	Time 0.251 (0.873)	Data Time 0.001 (0.330)	Loss 2.4646 (2.5031)	Entropy 0.59112 (0.59215)	Top-1 acc 63.672 (63.626)	Top-5 acc 85.547 (83.784)	lr 0.00699
Train [78][1460/3239]	Time 0.287 (0.879)	Data Time 0.003 (0.337)	Loss 2.4838 (2.5029)	Entropy 0.59146 (0.59214)	Top-1 acc 62.109 (63.627)	Top-5 acc 83.594 (83.785)	lr 0.00699
Train [78][1470/3239]	Time 0.288 (0.876)	Data Time 0.001 (0.335)	Loss 2.4417 (2.5034)	Entropy 0.59143 (0.59214)	Top-1 acc 67.969 (63.620)	Top-5 acc 83.203 (83.772)	lr 0.00698
Train [78][1480/3239]	Time 0.350 (0.875)	Data Time 0.001 (0.335)	Loss 2.2823 (2.5032)	Entropy 0.59135 (0.59214)	Top-1 acc 72.656 (63.632)	Top-5 acc 87.891 (83.776)	lr 0.00698
Train [78][1490/3239]	Time 0.239 (0.880)	Data Time 0.001 (0.340)	Loss 2.5427 (2.5031)	Entropy 0.59175 (0.59213)	Top-1 acc 64.062 (63.633)	Top-5 acc 83.594 (83.778)	lr 0.00698
Train [78][1500/3239]	Time 0.249 (0.879)	Data Time 0.001 (0.340)	Loss 2.3528 (2.5036)	Entropy 0.59198 (0.59213)	Top-1 acc 64.453 (63.612)	Top-5 acc 89.062 (83.772)	lr 0.00698
Train [78][1510/3239]	Time 0.452 (0.876)	Data Time 0.217 (0.338)	Loss 2.6171 (2.5033)	Entropy 0.59145 (0.59213)	Top-1 acc 63.672 (63.620)	Top-5 acc 82.812 (83.777)	lr 0.00698
Train [78][1520/3239]	Time 0.240 (0.881)	Data Time 0.001 (0.343)	Loss 2.4470 (2.5033)	Entropy 0.59135 (0.59212)	Top-1 acc 62.891 (63.620)	Top-5 acc 85.156 (83.776)	lr 0.00698
Train [78][1530/3239]	Time 0.256 (0.881)	Data Time 0.001 (0.344)	Loss 2.7299 (2.5033)	Entropy 0.59126 (0.59212)	Top-1 acc 55.859 (63.616)	Top-5 acc 79.297 (83.777)	lr 0.00698
Train [78][1540/3239]	Time 1.759 (0.879)	Data Time 1.483 (0.343)	Loss 2.4349 (2.5030)	Entropy 0.59104 (0.59211)	Top-1 acc 62.891 (63.617)	Top-5 acc 83.203 (83.779)	lr 0.00698
Train [78][1550/3239]	Time 1.664 (0.882)	Data Time 1.309 (0.347)	Loss 2.5173 (2.5028)	Entropy 0.59121 (0.59211)	Top-1 acc 64.453 (63.626)	Top-5 acc 83.984 (83.779)	lr 0.00698
Train [78][1560/3239]	Time 0.244 (0.881)	Data Time 0.001 (0.346)	Loss 2.5140 (2.5029)	Entropy 0.59098 (0.59210)	Top-1 acc 61.328 (63.625)	Top-5 acc 83.594 (83.772)	lr 0.00698
Train [78][1570/3239]	Time 0.246 (0.881)	Data Time 0.001 (0.347)	Loss 2.5826 (2.5030)	Entropy 0.59085 (0.59209)	Top-1 acc 60.938 (63.617)	Top-5 acc 82.031 (83.773)	lr 0.00698
Train [78][1580/3239]	Time 0.275 (0.883)	Data Time 0.003 (0.349)	Loss 2.2448 (2.5025)	Entropy 0.59082 (0.59208)	Top-1 acc 69.141 (63.631)	Top-5 acc 89.453 (83.783)	lr 0.00698
Train [78][1590/3239]	Time 0.261 (0.884)	Data Time 0.001 (0.351)	Loss 2.6655 (2.5030)	Entropy 0.59094 (0.59208)	Top-1 acc 58.594 (63.614)	Top-5 acc 82.812 (83.775)	lr 0.00697
Train [78][1600/3239]	Time 0.259 (0.883)	Data Time 0.001 (0.351)	Loss 2.4369 (2.5030)	Entropy 0.59091 (0.59207)	Top-1 acc 64.453 (63.618)	Top-5 acc 85.938 (83.776)	lr 0.00697
Train [78][1610/3239]	Time 0.237 (0.880)	Data Time 0.001 (0.349)	Loss 2.3749 (2.5029)	Entropy 0.59117 (0.59206)	Top-1 acc 66.016 (63.620)	Top-5 acc 86.719 (83.781)	lr 0.00697
Train [78][1620/3239]	Time 1.793 (0.883)	Data Time 1.563 (0.352)	Loss 2.7161 (2.5032)	Entropy 0.59115 (0.59206)	Top-1 acc 57.422 (63.614)	Top-5 acc 79.297 (83.774)	lr 0.00697
Train [78][1630/3239]	Time 0.283 (0.886)	Data Time 0.001 (0.356)	Loss 2.5680 (2.5033)	Entropy 0.59116 (0.59205)	Top-1 acc 60.156 (63.614)	Top-5 acc 83.984 (83.776)	lr 0.00697
Train [78][1640/3239]	Time 0.238 (0.884)	Data Time 0.002 (0.355)	Loss 2.3702 (2.5033)	Entropy 0.59123 (0.59205)	Top-1 acc 66.797 (63.612)	Top-5 acc 86.328 (83.775)	lr 0.00697
Train [78][1650/3239]	Time 0.230 (0.885)	Data Time 0.001 (0.356)	Loss 2.5737 (2.5034)	Entropy 0.59130 (0.59204)	Top-1 acc 59.766 (63.602)	Top-5 acc 83.984 (83.777)	lr 0.00697
Train [78][1660/3239]	Time 0.240 (0.890)	Data Time 0.001 (0.362)	Loss 2.3792 (2.5033)	Entropy 0.59127 (0.59204)	Top-1 acc 70.312 (63.610)	Top-5 acc 84.375 (83.778)	lr 0.00697
Train [78][1670/3239]	Time 0.407 (0.887)	Data Time 0.172 (0.360)	Loss 2.6180 (2.5035)	Entropy 0.59133 (0.59203)	Top-1 acc 60.547 (63.607)	Top-5 acc 81.641 (83.776)	lr 0.00697
Train [78][1680/3239]	Time 0.229 (0.889)	Data Time 0.001 (0.361)	Loss 2.5081 (2.5034)	Entropy 0.59107 (0.59203)	Top-1 acc 64.453 (63.616)	Top-5 acc 83.594 (83.778)	lr 0.00697
Train [78][1690/3239]	Time 7.547 (0.893)	Data Time 7.294 (0.367)	Loss 2.4001 (2.5036)	Entropy 0.59121 (0.59202)	Top-1 acc 64.062 (63.613)	Top-5 acc 85.938 (83.773)	lr 0.00697
Train [78][1700/3239]	Time 0.238 (0.891)	Data Time 0.001 (0.365)	Loss 2.2614 (2.5036)	Entropy 0.59133 (0.59202)	Top-1 acc 69.141 (63.618)	Top-5 acc 86.328 (83.775)	lr 0.00696
Train [78][1710/3239]	Time 0.332 (0.894)	Data Time 0.001 (0.369)	Loss 2.5148 (2.5040)	Entropy 0.59150 (0.59201)	Top-1 acc 64.062 (63.605)	Top-5 acc 83.984 (83.771)	lr 0.00696
Train [78][1720/3239]	Time 0.238 (0.894)	Data Time 0.001 (0.369)	Loss 2.3937 (2.5039)	Entropy 0.59126 (0.59201)	Top-1 acc 67.188 (63.602)	Top-5 acc 85.938 (83.776)	lr 0.00696
Train [78][1730/3239]	Time 0.239 (0.894)	Data Time 0.001 (0.370)	Loss 2.3854 (2.5036)	Entropy 0.59131 (0.59201)	Top-1 acc 62.500 (63.605)	Top-5 acc 87.891 (83.781)	lr 0.00696
Train [78][1740/3239]	Time 0.232 (0.899)	Data Time 0.001 (0.375)	Loss 2.4336 (2.5033)	Entropy 0.59133 (0.59200)	Top-1 acc 66.406 (63.611)	Top-5 acc 84.375 (83.783)	lr 0.00696
Train [78][1750/3239]	Time 0.233 (0.899)	Data Time 0.001 (0.376)	Loss 2.4568 (2.5036)	Entropy 0.59098 (0.59200)	Top-1 acc 62.500 (63.603)	Top-5 acc 85.156 (83.778)	lr 0.00696
Train [78][1760/3239]	Time 0.243 (0.900)	Data Time 0.002 (0.378)	Loss 2.5166 (2.5036)	Entropy 0.59083 (0.59199)	Top-1 acc 63.281 (63.606)	Top-5 acc 82.422 (83.777)	lr 0.00696
Train [78][1770/3239]	Time 0.243 (0.898)	Data Time 0.001 (0.376)	Loss 2.5181 (2.5034)	Entropy 0.59035 (0.59198)	Top-1 acc 66.406 (63.612)	Top-5 acc 83.984 (83.780)	lr 0.00696
Train [78][1780/3239]	Time 0.332 (0.900)	Data Time 0.001 (0.379)	Loss 2.4823 (2.5036)	Entropy 0.59076 (0.59198)	Top-1 acc 64.062 (63.606)	Top-5 acc 82.031 (83.773)	lr 0.00696
Train [78][1790/3239]	Time 0.251 (0.905)	Data Time 0.002 (0.385)	Loss 2.3382 (2.5032)	Entropy 0.59097 (0.59197)	Top-1 acc 66.016 (63.608)	Top-5 acc 85.938 (83.777)	lr 0.00696
Train [78][1800/3239]	Time 0.274 (0.903)	Data Time 0.002 (0.383)	Loss 2.3833 (2.5034)	Entropy 0.59111 (0.59196)	Top-1 acc 67.578 (63.606)	Top-5 acc 87.109 (83.776)	lr 0.00696
Train [78][1810/3239]	Time 0.235 (0.904)	Data Time 0.001 (0.385)	Loss 2.6189 (2.5034)	Entropy 0.59119 (0.59196)	Top-1 acc 64.844 (63.606)	Top-5 acc 81.250 (83.778)	lr 0.00695
Train [78][1820/3239]	Time 0.230 (0.909)	Data Time 0.001 (0.390)	Loss 2.6891 (2.5038)	Entropy 0.59138 (0.59196)	Top-1 acc 58.203 (63.597)	Top-5 acc 81.641 (83.767)	lr 0.00695
Train [78][1830/3239]	Time 0.249 (0.906)	Data Time 0.001 (0.388)	Loss 2.4785 (2.5040)	Entropy 0.59134 (0.59195)	Top-1 acc 60.156 (63.579)	Top-5 acc 84.375 (83.769)	lr 0.00695
Train [78][1840/3239]	Time 0.235 (0.908)	Data Time 0.001 (0.390)	Loss 2.3911 (2.5037)	Entropy 0.59143 (0.59195)	Top-1 acc 67.969 (63.588)	Top-5 acc 85.156 (83.775)	lr 0.00695
Train [78][1850/3239]	Time 3.904 (0.912)	Data Time 3.655 (0.395)	Loss 2.3273 (2.5032)	Entropy 0.59177 (0.59195)	Top-1 acc 63.672 (63.600)	Top-5 acc 86.719 (83.784)	lr 0.00695
Train [78][1860/3239]	Time 0.229 (0.910)	Data Time 0.001 (0.393)	Loss 2.4596 (2.5030)	Entropy 0.59198 (0.59195)	Top-1 acc 66.406 (63.606)	Top-5 acc 82.422 (83.789)	lr 0.00695
Train [78][1870/3239]	Time 0.344 (0.911)	Data Time 0.002 (0.395)	Loss 2.5133 (2.5031)	Entropy 0.59197 (0.59195)	Top-1 acc 65.234 (63.601)	Top-5 acc 85.156 (83.787)	lr 0.00695
Train [78][1880/3239]	Time 0.239 (0.913)	Data Time 0.001 (0.397)	Loss 2.3894 (2.5033)	Entropy 0.59182 (0.59195)	Top-1 acc 64.062 (63.597)	Top-5 acc 85.547 (83.785)	lr 0.00695
Train [78][1890/3239]	Time 0.258 (0.915)	Data Time 0.001 (0.400)	Loss 2.3320 (2.5032)	Entropy 0.59156 (0.59195)	Top-1 acc 66.797 (63.601)	Top-5 acc 86.719 (83.788)	lr 0.00695
Train [78][1900/3239]	Time 0.233 (0.913)	Data Time 0.001 (0.398)	Loss 2.5867 (2.5031)	Entropy 0.59158 (0.59194)	Top-1 acc 61.328 (63.603)	Top-5 acc 82.812 (83.787)	lr 0.00695
Train [78][1910/3239]	Time 0.246 (0.917)	Data Time 0.001 (0.403)	Loss 2.4789 (2.5034)	Entropy 0.59186 (0.59194)	Top-1 acc 65.625 (63.600)	Top-5 acc 84.766 (83.785)	lr 0.00695
Train [78][1920/3239]	Time 0.231 (0.918)	Data Time 0.001 (0.404)	Loss 2.4606 (2.5031)	Entropy 0.59166 (0.59194)	Top-1 acc 65.234 (63.607)	Top-5 acc 84.375 (83.792)	lr 0.00694
Train [78][1930/3239]	Time 0.234 (0.916)	Data Time 0.001 (0.402)	Loss 2.6042 (2.5033)	Entropy 0.59154 (0.59194)	Top-1 acc 67.578 (63.610)	Top-5 acc 80.859 (83.790)	lr 0.00694
Train [78][1940/3239]	Time 0.374 (0.917)	Data Time 0.001 (0.405)	Loss 2.4868 (2.5033)	Entropy 0.59179 (0.59194)	Top-1 acc 63.281 (63.608)	Top-5 acc 83.203 (83.786)	lr 0.00694
Train [78][1950/3239]	Time 0.244 (0.922)	Data Time 0.001 (0.410)	Loss 2.5289 (2.5032)	Entropy 0.59208 (0.59194)	Top-1 acc 68.750 (63.610)	Top-5 acc 82.422 (83.784)	lr 0.00694
Train [78][1960/3239]	Time 0.238 (0.921)	Data Time 0.002 (0.409)	Loss 2.5216 (2.5035)	Entropy 0.59225 (0.59194)	Top-1 acc 63.281 (63.608)	Top-5 acc 83.203 (83.779)	lr 0.00694
Train [78][1970/3239]	Time 0.231 (0.922)	Data Time 0.001 (0.411)	Loss 2.5204 (2.5034)	Entropy 0.59211 (0.59194)	Top-1 acc 64.062 (63.606)	Top-5 acc 83.203 (83.780)	lr 0.00694
Train [78][1980/3239]	Time 0.242 (0.926)	Data Time 0.001 (0.415)	Loss 2.5003 (2.5034)	Entropy 0.59203 (0.59194)	Top-1 acc 60.156 (63.601)	Top-5 acc 83.203 (83.781)	lr 0.00694
Train [78][1990/3239]	Time 2.301 (0.925)	Data Time 2.011 (0.414)	Loss 2.4277 (2.5032)	Entropy 0.59219 (0.59194)	Top-1 acc 64.453 (63.605)	Top-5 acc 82.812 (83.784)	lr 0.00694
Train [78][2000/3239]	Time 0.244 (0.924)	Data Time 0.001 (0.415)	Loss 2.4289 (2.5034)	Entropy 0.59240 (0.59194)	Top-1 acc 64.453 (63.602)	Top-5 acc 87.109 (83.782)	lr 0.00694
Train [78][2010/3239]	Time 0.285 (0.955)	Data Time 0.004 (0.417)	Loss 2.6462 (2.5033)	Entropy 0.59248 (0.59194)	Top-1 acc 61.328 (63.604)	Top-5 acc 78.125 (83.780)	lr 0.00694
Train [78][2020/3239]	Time 0.243 (0.953)	Data Time 0.002 (0.415)	Loss 2.3593 (2.5031)	Entropy 0.59208 (0.59195)	Top-1 acc 66.016 (63.607)	Top-5 acc 88.672 (83.791)	lr 0.00694
Train [78][2030/3239]	Time 0.416 (0.950)	Data Time 0.002 (0.413)	Loss 2.5925 (2.5033)	Entropy 0.59205 (0.59195)	Top-1 acc 63.281 (63.605)	Top-5 acc 79.688 (83.786)	lr 0.00693
Train [78][2040/3239]	Time 0.289 (0.948)	Data Time 0.002 (0.411)	Loss 2.7838 (2.5036)	Entropy 0.59178 (0.59195)	Top-1 acc 56.250 (63.594)	Top-5 acc 77.344 (83.780)	lr 0.00693
Train [78][2050/3239]	Time 0.241 (0.946)	Data Time 0.001 (0.409)	Loss 2.2034 (2.5036)	Entropy 0.59196 (0.59195)	Top-1 acc 72.266 (63.594)	Top-5 acc 90.234 (83.782)	lr 0.00693
Train [78][2060/3239]	Time 0.243 (0.943)	Data Time 0.001 (0.407)	Loss 2.5723 (2.5037)	Entropy 0.59169 (0.59195)	Top-1 acc 65.234 (63.597)	Top-5 acc 81.250 (83.781)	lr 0.00693
Train [78][2070/3239]	Time 0.244 (0.941)	Data Time 0.001 (0.405)	Loss 2.3264 (2.5041)	Entropy 0.59174 (0.59194)	Top-1 acc 65.234 (63.590)	Top-5 acc 86.328 (83.775)	lr 0.00693
Train [78][2080/3239]	Time 0.255 (0.942)	Data Time 0.001 (0.407)	Loss 2.4417 (2.5040)	Entropy 0.59178 (0.59194)	Top-1 acc 64.844 (63.589)	Top-5 acc 85.938 (83.778)	lr 0.00693
Train [78][2090/3239]	Time 0.247 (0.940)	Data Time 0.001 (0.406)	Loss 2.4576 (2.5042)	Entropy 0.59203 (0.59194)	Top-1 acc 65.234 (63.587)	Top-5 acc 85.156 (83.774)	lr 0.00693
Train [78][2100/3239]	Time 0.399 (0.938)	Data Time 0.044 (0.404)	Loss 2.4928 (2.5040)	Entropy 0.59190 (0.59194)	Top-1 acc 63.672 (63.591)	Top-5 acc 85.547 (83.778)	lr 0.00693
Train [78][2110/3239]	Time 0.256 (0.945)	Data Time 0.002 (0.411)	Loss 2.2564 (2.5041)	Entropy 0.59214 (0.59194)	Top-1 acc 70.312 (63.586)	Top-5 acc 87.109 (83.776)	lr 0.00693
Train [78][2120/3239]	Time 0.671 (0.944)	Data Time 0.436 (0.410)	Loss 2.4627 (2.5038)	Entropy 0.59231 (0.59194)	Top-1 acc 63.672 (63.592)	Top-5 acc 85.156 (83.780)	lr 0.00693
Train [78][2130/3239]	Time 0.245 (0.941)	Data Time 0.001 (0.409)	Loss 2.3388 (2.5036)	Entropy 0.59253 (0.59195)	Top-1 acc 67.578 (63.596)	Top-5 acc 86.719 (83.783)	lr 0.00693
Train [78][2140/3239]	Time 0.287 (0.947)	Data Time 0.002 (0.415)	Loss 2.6264 (2.5035)	Entropy 0.59265 (0.59195)	Top-1 acc 62.891 (63.595)	Top-5 acc 78.125 (83.783)	lr 0.00692
Train [78][2150/3239]	Time 0.251 (0.947)	Data Time 0.002 (0.415)	Loss 2.4199 (2.5033)	Entropy 0.59278 (0.59195)	Top-1 acc 64.062 (63.602)	Top-5 acc 85.938 (83.786)	lr 0.00692
Train [78][2160/3239]	Time 0.233 (0.945)	Data Time 0.001 (0.414)	Loss 2.5016 (2.5033)	Entropy 0.59281 (0.59196)	Top-1 acc 60.547 (63.602)	Top-5 acc 83.203 (83.786)	lr 0.00692
Train [78][2170/3239]	Time 10.130 (0.949)	Data Time 9.867 (0.418)	Loss 2.5201 (2.5031)	Entropy 0.59301 (0.59196)	Top-1 acc 62.109 (63.606)	Top-5 acc 82.812 (83.787)	lr 0.00692
Train [78][2180/3239]	Time 0.255 (0.948)	Data Time 0.001 (0.418)	Loss 2.6515 (2.5032)	Entropy 0.59335 (0.59197)	Top-1 acc 58.984 (63.599)	Top-5 acc 80.469 (83.785)	lr 0.00692
Train [78][2190/3239]	Time 0.292 (0.946)	Data Time 0.002 (0.416)	Loss 2.4032 (2.5030)	Entropy 0.59332 (0.59197)	Top-1 acc 62.109 (63.599)	Top-5 acc 87.500 (83.788)	lr 0.00692
Train [78][2200/3239]	Time 0.233 (0.944)	Data Time 0.001 (0.414)	Loss 2.5342 (2.5031)	Entropy 0.59291 (0.59198)	Top-1 acc 66.016 (63.599)	Top-5 acc 83.594 (83.786)	lr 0.00692
Train [78][2210/3239]	Time 0.235 (0.946)	Data Time 0.001 (0.416)	Loss 2.8856 (2.5034)	Entropy 0.59278 (0.59198)	Top-1 acc 51.562 (63.596)	Top-5 acc 77.734 (83.779)	lr 0.00692
Train [78][2220/3239]	Time 0.267 (0.943)	Data Time 0.001 (0.414)	Loss 2.4383 (2.5032)	Entropy 0.59272 (0.59198)	Top-1 acc 66.797 (63.604)	Top-5 acc 86.328 (83.782)	lr 0.00692
Train [78][2230/3239]	Time 0.242 (0.941)	Data Time 0.001 (0.412)	Loss 2.4499 (2.5031)	Entropy 0.59257 (0.59199)	Top-1 acc 62.891 (63.607)	Top-5 acc 85.547 (83.781)	lr 0.00692
Train [78][2240/3239]	Time 0.242 (0.944)	Data Time 0.001 (0.416)	Loss 2.4779 (2.5030)	Entropy 0.59239 (0.59199)	Top-1 acc 64.453 (63.610)	Top-5 acc 85.156 (83.781)	lr 0.00692
Train [78][2250/3239]	Time 0.253 (0.943)	Data Time 0.001 (0.415)	Loss 2.6832 (2.5030)	Entropy 0.59245 (0.59199)	Top-1 acc 59.375 (63.616)	Top-5 acc 78.516 (83.778)	lr 0.00691
Train [78][2260/3239]	Time 0.940 (0.944)	Data Time 0.570 (0.417)	Loss 2.3675 (2.5031)	Entropy 0.59242 (0.59199)	Top-1 acc 67.969 (63.613)	Top-5 acc 84.766 (83.775)	lr 0.00691
Train [78][2270/3239]	Time 0.249 (0.947)	Data Time 0.001 (0.420)	Loss 2.6505 (2.5034)	Entropy 0.59263 (0.59200)	Top-1 acc 61.719 (63.607)	Top-5 acc 80.469 (83.770)	lr 0.00691
Train [78][2280/3239]	Time 0.268 (0.947)	Data Time 0.002 (0.420)	Loss 2.6184 (2.5035)	Entropy 0.59307 (0.59200)	Top-1 acc 64.062 (63.602)	Top-5 acc 83.203 (83.772)	lr 0.00691
Train [78][2290/3239]	Time 0.253 (0.948)	Data Time 0.001 (0.422)	Loss 2.4914 (2.5038)	Entropy 0.59320 (0.59200)	Top-1 acc 65.625 (63.595)	Top-5 acc 84.766 (83.772)	lr 0.00691
Train [78][2300/3239]	Time 0.238 (0.950)	Data Time 0.001 (0.425)	Loss 2.5926 (2.5038)	Entropy 0.59298 (0.59201)	Top-1 acc 61.328 (63.600)	Top-5 acc 82.031 (83.770)	lr 0.00691
Train [78][2310/3239]	Time 0.252 (0.950)	Data Time 0.001 (0.425)	Loss 2.6812 (2.5039)	Entropy 0.59303 (0.59201)	Top-1 acc 61.719 (63.603)	Top-5 acc 82.031 (83.767)	lr 0.00691
Train [78][2320/3239]	Time 0.241 (0.948)	Data Time 0.001 (0.424)	Loss 2.4605 (2.5037)	Entropy 0.59306 (0.59202)	Top-1 acc 63.281 (63.605)	Top-5 acc 83.984 (83.770)	lr 0.00691
Train [78][2330/3239]	Time 13.884 (0.955)	Data Time 13.535 (0.431)	Loss 2.4039 (2.5035)	Entropy 0.59317 (0.59202)	Top-1 acc 66.016 (63.610)	Top-5 acc 85.156 (83.774)	lr 0.00691
Train [78][2340/3239]	Time 0.227 (0.954)	Data Time 0.001 (0.430)	Loss 2.4713 (2.5035)	Entropy 0.59298 (0.59203)	Top-1 acc 63.672 (63.610)	Top-5 acc 84.375 (83.775)	lr 0.00691
Train [78][2350/3239]	Time 0.296 (0.952)	Data Time 0.001 (0.428)	Loss 2.5526 (2.5037)	Entropy 0.59304 (0.59203)	Top-1 acc 63.281 (63.610)	Top-5 acc 77.734 (83.771)	lr 0.00691
Train [78][2360/3239]	Time 0.237 (0.953)	Data Time 0.001 (0.429)	Loss 2.5949 (2.5036)	Entropy 0.59289 (0.59204)	Top-1 acc 59.766 (63.611)	Top-5 acc 82.031 (83.770)	lr 0.00690
Train [78][2370/3239]	Time 0.285 (0.954)	Data Time 0.002 (0.431)	Loss 2.4795 (2.5036)	Entropy 0.59299 (0.59204)	Top-1 acc 62.500 (63.609)	Top-5 acc 84.375 (83.772)	lr 0.00690
Train [78][2380/3239]	Time 0.241 (0.952)	Data Time 0.002 (0.429)	Loss 2.4494 (2.5034)	Entropy 0.59312 (0.59204)	Top-1 acc 62.500 (63.611)	Top-5 acc 83.984 (83.774)	lr 0.00690
Train [78][2390/3239]	Time 0.237 (0.950)	Data Time 0.001 (0.427)	Loss 2.2699 (2.5032)	Entropy 0.59333 (0.59205)	Top-1 acc 64.844 (63.615)	Top-5 acc 88.672 (83.778)	lr 0.00690
Train [78][2400/3239]	Time 0.229 (0.951)	Data Time 0.001 (0.429)	Loss 2.6593 (2.5033)	Entropy 0.59316 (0.59205)	Top-1 acc 63.672 (63.611)	Top-5 acc 80.859 (83.776)	lr 0.00690
Train [78][2410/3239]	Time 0.236 (0.949)	Data Time 0.001 (0.427)	Loss 2.5179 (2.5034)	Entropy 0.59326 (0.59206)	Top-1 acc 63.281 (63.611)	Top-5 acc 83.984 (83.775)	lr 0.00690
Train [78][2420/3239]	Time 0.341 (0.948)	Data Time 0.001 (0.426)	Loss 2.6489 (2.5036)	Entropy 0.59290 (0.59206)	Top-1 acc 60.938 (63.609)	Top-5 acc 82.812 (83.774)	lr 0.00690
Train [78][2430/3239]	Time 0.261 (0.948)	Data Time 0.001 (0.427)	Loss 2.4458 (2.5037)	Entropy 0.59294 (0.59207)	Top-1 acc 65.234 (63.608)	Top-5 acc 84.766 (83.767)	lr 0.00690
Train [78][2440/3239]	Time 0.256 (0.946)	Data Time 0.001 (0.425)	Loss 2.4129 (2.5035)	Entropy 0.59318 (0.59207)	Top-1 acc 67.969 (63.615)	Top-5 acc 85.156 (83.770)	lr 0.00690
Train [78][2450/3239]	Time 0.230 (0.945)	Data Time 0.001 (0.425)	Loss 2.3875 (2.5034)	Entropy 0.59352 (0.59208)	Top-1 acc 66.016 (63.621)	Top-5 acc 85.547 (83.769)	lr 0.00690
Train [78][2460/3239]	Time 0.234 (0.946)	Data Time 0.001 (0.426)	Loss 2.4964 (2.5033)	Entropy 0.59377 (0.59208)	Top-1 acc 63.281 (63.624)	Top-5 acc 83.203 (83.769)	lr 0.00690
Train [78][2470/3239]	Time 0.253 (0.944)	Data Time 0.001 (0.424)	Loss 2.5255 (2.5034)	Entropy 0.59363 (0.59209)	Top-1 acc 64.844 (63.624)	Top-5 acc 81.641 (83.769)	lr 0.00689
Train [78][2480/3239]	Time 0.240 (0.942)	Data Time 0.001 (0.422)	Loss 2.4789 (2.5035)	Entropy 0.59382 (0.59210)	Top-1 acc 64.453 (63.623)	Top-5 acc 85.547 (83.768)	lr 0.00689
Train [78][2490/3239]	Time 7.093 (0.943)	Data Time 6.720 (0.424)	Loss 2.3674 (2.5034)	Entropy 0.59374 (0.59210)	Top-1 acc 66.016 (63.626)	Top-5 acc 87.109 (83.768)	lr 0.00689
Train [78][2500/3239]	Time 0.247 (0.942)	Data Time 0.001 (0.423)	Loss 2.5436 (2.5033)	Entropy 0.59353 (0.59211)	Top-1 acc 59.375 (63.625)	Top-5 acc 84.766 (83.768)	lr 0.00689
Train [78][2510/3239]	Time 0.247 (0.940)	Data Time 0.001 (0.422)	Loss 2.6108 (2.5033)	Entropy 0.59360 (0.59211)	Top-1 acc 58.984 (63.624)	Top-5 acc 82.031 (83.772)	lr 0.00689
Train [78][2520/3239]	Time 0.263 (0.939)	Data Time 0.002 (0.421)	Loss 2.7145 (2.5035)	Entropy 0.59358 (0.59212)	Top-1 acc 58.984 (63.620)	Top-5 acc 79.297 (83.771)	lr 0.00689
Train [78][2530/3239]	Time 0.237 (0.943)	Data Time 0.002 (0.426)	Loss 2.4985 (2.5034)	Entropy 0.59348 (0.59213)	Top-1 acc 64.844 (63.621)	Top-5 acc 84.766 (83.771)	lr 0.00689
Train [78][2540/3239]	Time 0.227 (0.941)	Data Time 0.001 (0.424)	Loss 2.4547 (2.5033)	Entropy 0.59359 (0.59213)	Top-1 acc 67.969 (63.624)	Top-5 acc 83.984 (83.773)	lr 0.00689
Train [78][2550/3239]	Time 0.238 (0.941)	Data Time 0.001 (0.424)	Loss 2.3435 (2.5033)	Entropy 0.59353 (0.59214)	Top-1 acc 66.016 (63.623)	Top-5 acc 87.109 (83.770)	lr 0.00689
Train [78][2560/3239]	Time 0.235 (0.944)	Data Time 0.001 (0.428)	Loss 2.6341 (2.5035)	Entropy 0.59370 (0.59214)	Top-1 acc 63.672 (63.620)	Top-5 acc 79.688 (83.767)	lr 0.00689
Train [78][2570/3239]	Time 0.289 (0.943)	Data Time 0.001 (0.427)	Loss 2.4447 (2.5035)	Entropy 0.59343 (0.59215)	Top-1 acc 63.281 (63.624)	Top-5 acc 82.422 (83.765)	lr 0.00689
Train [78][2580/3239]	Time 3.597 (0.944)	Data Time 3.253 (0.428)	Loss 2.5494 (2.5036)	Entropy 0.59352 (0.59215)	Top-1 acc 64.062 (63.622)	Top-5 acc 82.422 (83.764)	lr 0.00688
Train [78][2590/3239]	Time 0.277 (0.948)	Data Time 0.001 (0.433)	Loss 2.6348 (2.5039)	Entropy 0.59392 (0.59216)	Top-1 acc 60.547 (63.612)	Top-5 acc 80.078 (83.760)	lr 0.00688
Train [78][2600/3239]	Time 0.249 (0.946)	Data Time 0.002 (0.431)	Loss 2.3086 (2.5036)	Entropy 0.59388 (0.59217)	Top-1 acc 68.750 (63.616)	Top-5 acc 87.500 (83.763)	lr 0.00688
Train [78][2610/3239]	Time 0.235 (0.945)	Data Time 0.001 (0.430)	Loss 2.5787 (2.5037)	Entropy 0.59387 (0.59217)	Top-1 acc 66.016 (63.612)	Top-5 acc 81.641 (83.763)	lr 0.00688
Train [78][2620/3239]	Time 1.437 (0.949)	Data Time 1.177 (0.434)	Loss 2.7411 (2.5037)	Entropy 0.59404 (0.59218)	Top-1 acc 54.688 (63.608)	Top-5 acc 82.031 (83.762)	lr 0.00688
Train [78][2630/3239]	Time 0.226 (0.950)	Data Time 0.001 (0.436)	Loss 2.4557 (2.5037)	Entropy 0.59379 (0.59218)	Top-1 acc 64.062 (63.608)	Top-5 acc 83.203 (83.760)	lr 0.00688
Train [78][2640/3239]	Time 0.223 (0.948)	Data Time 0.001 (0.434)	Loss 2.5382 (2.5037)	Entropy 0.59381 (0.59219)	Top-1 acc 60.547 (63.612)	Top-5 acc 82.422 (83.760)	lr 0.00688
Train [78][2650/3239]	Time 12.330 (0.951)	Data Time 11.959 (0.438)	Loss 2.6367 (2.5038)	Entropy 0.59396 (0.59220)	Top-1 acc 59.375 (63.606)	Top-5 acc 83.594 (83.757)	lr 0.00688
Train [78][2660/3239]	Time 0.233 (0.954)	Data Time 0.001 (0.441)	Loss 2.3648 (2.5037)	Entropy 0.59406 (0.59220)	Top-1 acc 68.750 (63.608)	Top-5 acc 85.547 (83.762)	lr 0.00688
Train [78][2670/3239]	Time 0.240 (0.973)	Data Time 0.002 (0.439)	Loss 2.3976 (2.5037)	Entropy 0.59423 (0.59221)	Top-1 acc 64.453 (63.608)	Top-5 acc 85.156 (83.762)	lr 0.00688
Train [78][2680/3239]	Time 0.236 (0.971)	Data Time 0.002 (0.438)	Loss 2.3571 (2.5036)	Entropy 0.59454 (0.59222)	Top-1 acc 66.016 (63.610)	Top-5 acc 84.766 (83.763)	lr 0.00688
Train [78][2690/3239]	Time 0.244 (0.969)	Data Time 0.001 (0.436)	Loss 2.6183 (2.5037)	Entropy 0.59437 (0.59223)	Top-1 acc 59.375 (63.609)	Top-5 acc 81.250 (83.760)	lr 0.00687
Train [78][2700/3239]	Time 0.242 (0.967)	Data Time 0.001 (0.435)	Loss 2.6159 (2.5039)	Entropy 0.59410 (0.59223)	Top-1 acc 65.234 (63.609)	Top-5 acc 82.031 (83.758)	lr 0.00687
Train [78][2710/3239]	Time 0.251 (0.965)	Data Time 0.001 (0.433)	Loss 2.5039 (2.5040)	Entropy 0.59438 (0.59224)	Top-1 acc 62.891 (63.605)	Top-5 acc 84.375 (83.757)	lr 0.00687
Train [78][2720/3239]	Time 0.251 (0.963)	Data Time 0.001 (0.431)	Loss 2.3174 (2.5037)	Entropy 0.59459 (0.59225)	Top-1 acc 67.578 (63.614)	Top-5 acc 87.891 (83.763)	lr 0.00687
Train [78][2730/3239]	Time 0.296 (0.965)	Data Time 0.001 (0.433)	Loss 2.5650 (2.5038)	Entropy 0.59465 (0.59226)	Top-1 acc 60.547 (63.613)	Top-5 acc 83.984 (83.761)	lr 0.00687
Train [78][2740/3239]	Time 0.391 (0.964)	Data Time 0.003 (0.433)	Loss 2.4908 (2.5037)	Entropy 0.59459 (0.59227)	Top-1 acc 62.891 (63.613)	Top-5 acc 83.984 (83.763)	lr 0.00687
Train [78][2750/3239]	Time 0.230 (0.963)	Data Time 0.001 (0.432)	Loss 2.4915 (2.5039)	Entropy 0.59460 (0.59228)	Top-1 acc 65.234 (63.607)	Top-5 acc 84.375 (83.761)	lr 0.00687
Train [78][2760/3239]	Time 0.242 (0.961)	Data Time 0.001 (0.431)	Loss 2.5403 (2.5039)	Entropy 0.59443 (0.59228)	Top-1 acc 59.766 (63.604)	Top-5 acc 85.156 (83.763)	lr 0.00687
Train [78][2770/3239]	Time 0.271 (0.967)	Data Time 0.001 (0.437)	Loss 2.4419 (2.5038)	Entropy 0.59442 (0.59229)	Top-1 acc 65.234 (63.608)	Top-5 acc 84.375 (83.763)	lr 0.00687
Train [78][2780/3239]	Time 0.294 (0.966)	Data Time 0.002 (0.436)	Loss 2.3129 (2.5036)	Entropy 0.59440 (0.59230)	Top-1 acc 67.188 (63.610)	Top-5 acc 85.938 (83.768)	lr 0.00687
Train [78][2790/3239]	Time 0.239 (0.964)	Data Time 0.001 (0.434)	Loss 2.4016 (2.5035)	Entropy 0.59452 (0.59231)	Top-1 acc 66.797 (63.613)	Top-5 acc 85.938 (83.771)	lr 0.00687
Train [78][2800/3239]	Time 0.259 (0.971)	Data Time 0.001 (0.441)	Loss 2.5303 (2.5035)	Entropy 0.59456 (0.59232)	Top-1 acc 63.281 (63.614)	Top-5 acc 84.766 (83.770)	lr 0.00686
Train [78][2810/3239]	Time 0.351 (0.971)	Data Time 0.001 (0.442)	Loss 2.2504 (2.5037)	Entropy 0.59491 (0.59232)	Top-1 acc 71.875 (63.615)	Top-5 acc 86.328 (83.766)	lr 0.00686
Train [78][2820/3239]	Time 0.228 (0.969)	Data Time 0.001 (0.440)	Loss 2.5858 (2.5036)	Entropy 0.59521 (0.59233)	Top-1 acc 60.547 (63.615)	Top-5 acc 81.641 (83.769)	lr 0.00686
Train [78][2830/3239]	Time 0.245 (0.974)	Data Time 0.001 (0.446)	Loss 2.6249 (2.5039)	Entropy 0.59508 (0.59234)	Top-1 acc 63.672 (63.609)	Top-5 acc 79.688 (83.764)	lr 0.00686
Train [78][2840/3239]	Time 0.246 (0.974)	Data Time 0.001 (0.446)	Loss 2.5413 (2.5039)	Entropy 0.59490 (0.59235)	Top-1 acc 64.062 (63.609)	Top-5 acc 83.594 (83.762)	lr 0.00686
Train [78][2850/3239]	Time 0.245 (0.974)	Data Time 0.001 (0.447)	Loss 2.6405 (2.5041)	Entropy 0.59493 (0.59236)	Top-1 acc 56.641 (63.601)	Top-5 acc 80.469 (83.757)	lr 0.00686
Train [78][2860/3239]	Time 2.974 (0.979)	Data Time 2.692 (0.451)	Loss 2.6296 (2.5045)	Entropy 0.59493 (0.59237)	Top-1 acc 56.250 (63.591)	Top-5 acc 82.031 (83.750)	lr 0.00686
Train [78][2870/3239]	Time 0.247 (0.979)	Data Time 0.001 (0.452)	Loss 2.2326 (2.5044)	Entropy 0.59525 (0.59238)	Top-1 acc 68.750 (63.594)	Top-5 acc 88.672 (83.751)	lr 0.00686
Train [78][2880/3239]	Time 0.229 (0.980)	Data Time 0.001 (0.454)	Loss 2.5635 (2.5042)	Entropy 0.59531 (0.59239)	Top-1 acc 62.891 (63.596)	Top-5 acc 81.250 (83.754)	lr 0.00686
Train [78][2890/3239]	Time 4.380 (0.983)	Data Time 4.127 (0.457)	Loss 2.5174 (2.5042)	Entropy 0.59545 (0.59240)	Top-1 acc 60.547 (63.591)	Top-5 acc 83.984 (83.756)	lr 0.00686
Train [78][2900/3239]	Time 5.238 (0.984)	Data Time 4.874 (0.458)	Loss 2.3772 (2.5041)	Entropy 0.59494 (0.59241)	Top-1 acc 63.672 (63.591)	Top-5 acc 85.156 (83.758)	lr 0.00686
Train [78][2910/3239]	Time 0.256 (0.984)	Data Time 0.001 (0.459)	Loss 2.4205 (2.5044)	Entropy 0.59520 (0.59242)	Top-1 acc 62.891 (63.583)	Top-5 acc 86.328 (83.754)	lr 0.00685
Train [78][2920/3239]	Time 0.253 (0.983)	Data Time 0.001 (0.457)	Loss 2.5308 (2.5043)	Entropy 0.59534 (0.59243)	Top-1 acc 60.938 (63.580)	Top-5 acc 87.500 (83.754)	lr 0.00685
Train [78][2930/3239]	Time 0.247 (0.988)	Data Time 0.001 (0.463)	Loss 2.4315 (2.5044)	Entropy 0.59554 (0.59244)	Top-1 acc 61.328 (63.578)	Top-5 acc 84.375 (83.754)	lr 0.00685
Train [78][2940/3239]	Time 0.238 (0.987)	Data Time 0.001 (0.463)	Loss 2.4481 (2.5043)	Entropy 0.59556 (0.59245)	Top-1 acc 65.625 (63.580)	Top-5 acc 83.594 (83.758)	lr 0.00685
Train [78][2950/3239]	Time 0.271 (0.985)	Data Time 0.001 (0.461)	Loss 2.5384 (2.5044)	Entropy 0.59570 (0.59246)	Top-1 acc 61.719 (63.574)	Top-5 acc 83.203 (83.757)	lr 0.00685
Train [78][2960/3239]	Time 0.235 (0.990)	Data Time 0.001 (0.466)	Loss 2.5765 (2.5046)	Entropy 0.59618 (0.59247)	Top-1 acc 61.719 (63.566)	Top-5 acc 83.594 (83.753)	lr 0.00685
Train [78][2970/3239]	Time 0.360 (0.990)	Data Time 0.001 (0.466)	Loss 2.6261 (2.5049)	Entropy 0.59584 (0.59248)	Top-1 acc 61.328 (63.561)	Top-5 acc 82.031 (83.749)	lr 0.00685
Train [78][2980/3239]	Time 4.719 (0.990)	Data Time 4.448 (0.466)	Loss 2.4343 (2.5047)	Entropy 0.59616 (0.59250)	Top-1 acc 64.844 (63.567)	Top-5 acc 84.766 (83.750)	lr 0.00685
Train [78][2990/3239]	Time 0.239 (0.996)	Data Time 0.001 (0.473)	Loss 2.5468 (2.5047)	Entropy 0.59631 (0.59251)	Top-1 acc 60.938 (63.563)	Top-5 acc 82.812 (83.751)	lr 0.00685
Train [78][3000/3239]	Time 0.243 (0.997)	Data Time 0.001 (0.474)	Loss 2.7297 (2.5047)	Entropy 0.59609 (0.59252)	Top-1 acc 58.984 (63.562)	Top-5 acc 80.859 (83.751)	lr 0.00685
Train [78][3010/3239]	Time 0.242 (0.995)	Data Time 0.001 (0.472)	Loss 2.4970 (2.5047)	Entropy 0.59595 (0.59253)	Top-1 acc 62.109 (63.561)	Top-5 acc 85.938 (83.751)	lr 0.00685
Train [78][3020/3239]	Time 2.881 (1.002)	Data Time 2.633 (0.480)	Loss 2.4625 (2.5045)	Entropy 0.59605 (0.59254)	Top-1 acc 64.844 (63.564)	Top-5 acc 88.281 (83.757)	lr 0.00684
Train [78][3030/3239]	Time 0.241 (1.003)	Data Time 0.001 (0.481)	Loss 2.5351 (2.5047)	Entropy 0.59617 (0.59255)	Top-1 acc 66.016 (63.557)	Top-5 acc 82.422 (83.754)	lr 0.00684
Train [78][3040/3239]	Time 0.228 (1.001)	Data Time 0.001 (0.479)	Loss 2.5784 (2.5047)	Entropy 0.59621 (0.59257)	Top-1 acc 62.500 (63.559)	Top-5 acc 81.641 (83.751)	lr 0.00684
Train [78][3050/3239]	Time 8.347 (1.005)	Data Time 8.084 (0.484)	Loss 2.3404 (2.5047)	Entropy 0.59607 (0.59258)	Top-1 acc 69.141 (63.561)	Top-5 acc 83.203 (83.751)	lr 0.00684
Train [78][3060/3239]	Time 3.793 (1.005)	Data Time 3.541 (0.484)	Loss 2.8327 (2.5047)	Entropy 0.59611 (0.59259)	Top-1 acc 53.125 (63.560)	Top-5 acc 79.297 (83.749)	lr 0.00684
Train [78][3070/3239]	Time 0.266 (1.003)	Data Time 0.001 (0.482)	Loss 2.5357 (2.5047)	Entropy 0.59577 (0.59260)	Top-1 acc 59.766 (63.561)	Top-5 acc 83.594 (83.751)	lr 0.00684
Train [78][3080/3239]	Time 0.244 (1.001)	Data Time 0.001 (0.481)	Loss 2.6466 (2.5048)	Entropy 0.59574 (0.59261)	Top-1 acc 57.812 (63.556)	Top-5 acc 80.859 (83.748)	lr 0.00684
Train [78][3090/3239]	Time 0.227 (1.005)	Data Time 0.001 (0.485)	Loss 2.5997 (2.5050)	Entropy 0.59561 (0.59262)	Top-1 acc 58.984 (63.555)	Top-5 acc 84.375 (83.745)	lr 0.00684
Train [78][3100/3239]	Time 0.234 (1.004)	Data Time 0.001 (0.485)	Loss 2.3023 (2.5048)	Entropy 0.59539 (0.59263)	Top-1 acc 69.141 (63.560)	Top-5 acc 84.766 (83.746)	lr 0.00684
Train [78][3110/3239]	Time 0.246 (1.003)	Data Time 0.001 (0.483)	Loss 2.5977 (2.5047)	Entropy 0.59563 (0.59264)	Top-1 acc 65.234 (63.562)	Top-5 acc 79.297 (83.746)	lr 0.00684
Train [78][3120/3239]	Time 0.235 (1.008)	Data Time 0.001 (0.489)	Loss 2.4528 (2.5046)	Entropy 0.59573 (0.59265)	Top-1 acc 68.359 (63.567)	Top-5 acc 82.031 (83.748)	lr 0.00684
Train [78][3130/3239]	Time 0.348 (1.006)	Data Time 0.001 (0.487)	Loss 2.6510 (2.5046)	Entropy 0.59573 (0.59266)	Top-1 acc 59.766 (63.568)	Top-5 acc 80.078 (83.748)	lr 0.00684
Train [78][3140/3239]	Time 3.401 (1.005)	Data Time 3.125 (0.487)	Loss 2.4104 (2.5044)	Entropy 0.59571 (0.59267)	Top-1 acc 66.016 (63.575)	Top-5 acc 87.891 (83.751)	lr 0.00683
Train [78][3150/3239]	Time 0.236 (1.009)	Data Time 0.001 (0.491)	Loss 2.3490 (2.5045)	Entropy 0.59544 (0.59268)	Top-1 acc 67.969 (63.572)	Top-5 acc 86.328 (83.748)	lr 0.00683
Train [78][3160/3239]	Time 0.249 (1.008)	Data Time 0.001 (0.490)	Loss 2.5348 (2.5043)	Entropy 0.59552 (0.59269)	Top-1 acc 65.625 (63.577)	Top-5 acc 80.859 (83.750)	lr 0.00683
Train [78][3170/3239]	Time 0.252 (1.007)	Data Time 0.001 (0.489)	Loss 2.6886 (2.5043)	Entropy 0.59572 (0.59270)	Top-1 acc 57.812 (63.580)	Top-5 acc 80.859 (83.752)	lr 0.00683
Train [78][3180/3239]	Time 0.460 (1.011)	Data Time 0.213 (0.494)	Loss 2.5226 (2.5043)	Entropy 0.59578 (0.59271)	Top-1 acc 63.672 (63.579)	Top-5 acc 83.984 (83.754)	lr 0.00683
Train [78][3190/3239]	Time 0.228 (1.010)	Data Time 0.000 (0.493)	Loss 2.3806 (2.5043)	Entropy 0.59534 (0.59272)	Top-1 acc 68.750 (63.580)	Top-5 acc 88.672 (83.753)	lr 0.00683
Train [78][3200/3239]	Time 0.348 (1.008)	Data Time 0.000 (0.492)	Loss 2.4425 (2.5044)	Entropy 0.59554 (0.59272)	Top-1 acc 64.453 (63.578)	Top-5 acc 85.547 (83.751)	lr 0.00683
Train [78][3210/3239]	Time 12.124 (1.012)	Data Time 11.858 (0.496)	Loss 2.3096 (2.5043)	Entropy 0.59545 (0.59273)	Top-1 acc 69.531 (63.576)	Top-5 acc 85.938 (83.755)	lr 0.00683
Train [78][3220/3239]	Time 0.286 (1.010)	Data Time 0.000 (0.494)	Loss 2.3687 (2.5044)	Entropy 0.59527 (0.59274)	Top-1 acc 69.922 (63.578)	Top-5 acc 85.547 (83.753)	lr 0.00683
Train [78][3230/3239]	Time 0.227 (1.009)	Data Time 0.000 (0.493)	Loss 2.5400 (2.5044)	Entropy 0.59497 (0.59275)	Top-1 acc 63.281 (63.579)	Top-5 acc 83.203 (83.755)	lr 0.00683
Train [78][3239/3239]	Time 0.932 (1.007)	Data Time 0.000 (0.492)	Loss 2.8610 (2.5042)	Entropy 0.59517 (0.59276)	Top-1 acc 55.556 (63.586)	Top-5 acc 74.074 (83.757)	lr 0.00683
==========Valid [78/120]	loss 1.306	top-1 acc 70.142 (70.151)	top-5 acc 88.917	Train top-1 63.586	top-5 83.757	Entropy 0.59517	Latency-None: 0.000ms	Flops: 539.00M
Train [79][0/3239]	Time 55.007 (55.007)	Data Time 53.966 (53.966)	Loss 2.5892 (2.5892)	Entropy 0.59507 (0.59507)	Top-1 acc 61.719 (61.719)	Top-5 acc 82.031 (82.031)	lr 0.00683
Train [79][10/3239]	Time 0.244 (5.427)	Data Time 0.001 (4.908)	Loss 2.5621 (2.4708)	Entropy 0.59479 (0.59501)	Top-1 acc 61.328 (64.240)	Top-5 acc 82.422 (84.624)	lr 0.00682
Train [79][20/3239]	Time 0.233 (3.038)	Data Time 0.001 (2.572)	Loss 2.4188 (2.5246)	Entropy 0.59500 (0.59497)	Top-1 acc 65.234 (62.742)	Top-5 acc 85.938 (83.650)	lr 0.00682
Train [79][30/3239]	Time 0.328 (2.190)	Data Time 0.001 (1.743)	Loss 2.6790 (2.5248)	Entropy 0.59483 (0.59496)	Top-1 acc 58.594 (62.702)	Top-5 acc 79.297 (83.619)	lr 0.00682
Train [79][40/3239]	Time 0.246 (1.977)	Data Time 0.002 (1.527)	Loss 2.6328 (2.5350)	Entropy 0.59506 (0.59497)	Top-1 acc 64.844 (62.795)	Top-5 acc 79.297 (83.203)	lr 0.00682
Train [79][50/3239]	Time 0.264 (1.674)	Data Time 0.001 (1.228)	Loss 2.3740 (2.5330)	Entropy 0.59465 (0.59498)	Top-1 acc 65.625 (62.791)	Top-5 acc 85.547 (83.119)	lr 0.00682
Train [79][60/3239]	Time 0.236 (1.468)	Data Time 0.001 (1.027)	Loss 2.4747 (2.5152)	Entropy 0.59463 (0.59492)	Top-1 acc 63.672 (63.096)	Top-5 acc 87.500 (83.555)	lr 0.00682
Train [79][70/3239]	Time 0.236 (1.454)	Data Time 0.001 (1.015)	Loss 2.5488 (2.5101)	Entropy 0.59447 (0.59487)	Top-1 acc 64.062 (63.105)	Top-5 acc 83.203 (83.726)	lr 0.00682
Train [79][80/3239]	Time 0.395 (2.003)	Data Time 0.005 (0.890)	Loss 2.5290 (2.5161)	Entropy 0.59463 (0.59484)	Top-1 acc 64.453 (63.103)	Top-5 acc 81.641 (83.560)	lr 0.00682
Train [79][90/3239]	Time 0.238 (1.836)	Data Time 0.002 (0.793)	Loss 2.4638 (2.5180)	Entropy 0.59461 (0.59482)	Top-1 acc 66.016 (63.165)	Top-5 acc 85.547 (83.577)	lr 0.00682
Train [79][100/3239]	Time 0.225 (1.695)	Data Time 0.003 (0.714)	Loss 2.2341 (2.5217)	Entropy 0.59468 (0.59481)	Top-1 acc 72.266 (63.084)	Top-5 acc 87.109 (83.567)	lr 0.00682
Train [79][110/3239]	Time 0.252 (1.580)	Data Time 0.002 (0.650)	Loss 2.7040 (2.5200)	Entropy 0.59455 (0.59480)	Top-1 acc 62.500 (63.211)	Top-5 acc 79.688 (83.534)	lr 0.00682
Train [79][120/3239]	Time 0.330 (1.485)	Data Time 0.001 (0.597)	Loss 2.5183 (2.5184)	Entropy 0.59455 (0.59478)	Top-1 acc 61.719 (63.207)	Top-5 acc 83.984 (83.578)	lr 0.00681
Train [79][130/3239]	Time 0.235 (1.405)	Data Time 0.001 (0.551)	Loss 2.4435 (2.5166)	Entropy 0.59482 (0.59477)	Top-1 acc 63.672 (63.225)	Top-5 acc 85.547 (83.588)	lr 0.00681
Train [79][140/3239]	Time 0.259 (1.337)	Data Time 0.001 (0.512)	Loss 2.3514 (2.5135)	Entropy 0.59475 (0.59478)	Top-1 acc 68.359 (63.337)	Top-5 acc 88.672 (83.619)	lr 0.00681
Train [79][150/3239]	Time 0.280 (1.279)	Data Time 0.003 (0.478)	Loss 2.6016 (2.5182)	Entropy 0.59492 (0.59479)	Top-1 acc 61.328 (63.248)	Top-5 acc 84.375 (83.583)	lr 0.00681
Train [79][160/3239]	Time 0.234 (1.226)	Data Time 0.001 (0.449)	Loss 2.7700 (2.5167)	Entropy 0.59442 (0.59478)	Top-1 acc 57.031 (63.318)	Top-5 acc 78.906 (83.555)	lr 0.00681
Train [79][170/3239]	Time 0.243 (1.179)	Data Time 0.001 (0.423)	Loss 2.8068 (2.5154)	Entropy 0.59426 (0.59475)	Top-1 acc 58.594 (63.434)	Top-5 acc 80.469 (83.598)	lr 0.00681
Train [79][180/3239]	Time 0.236 (1.138)	Data Time 0.001 (0.399)	Loss 2.3636 (2.5125)	Entropy 0.59399 (0.59472)	Top-1 acc 67.969 (63.471)	Top-5 acc 86.719 (83.667)	lr 0.00681
Train [79][190/3239]	Time 0.344 (1.116)	Data Time 0.001 (0.393)	Loss 2.6916 (2.5156)	Entropy 0.59406 (0.59469)	Top-1 acc 56.641 (63.388)	Top-5 acc 80.469 (83.633)	lr 0.00681
Train [79][200/3239]	Time 0.244 (1.089)	Data Time 0.002 (0.381)	Loss 2.5111 (2.5144)	Entropy 0.59404 (0.59466)	Top-1 acc 60.156 (63.404)	Top-5 acc 83.594 (83.648)	lr 0.00681
Train [79][210/3239]	Time 0.228 (1.085)	Data Time 0.001 (0.390)	Loss 2.5328 (2.5158)	Entropy 0.59370 (0.59462)	Top-1 acc 60.156 (63.370)	Top-5 acc 84.375 (83.599)	lr 0.00681
Train [79][220/3239]	Time 0.244 (1.071)	Data Time 0.001 (0.386)	Loss 2.4763 (2.5158)	Entropy 0.59354 (0.59458)	Top-1 acc 62.891 (63.322)	Top-5 acc 83.203 (83.580)	lr 0.00681
Train [79][230/3239]	Time 0.240 (1.044)	Data Time 0.003 (0.370)	Loss 2.5782 (2.5130)	Entropy 0.59344 (0.59453)	Top-1 acc 60.938 (63.359)	Top-5 acc 83.984 (83.655)	lr 0.00680
Train [79][240/3239]	Time 2.061 (1.026)	Data Time 1.825 (0.362)	Loss 2.4497 (2.5114)	Entropy 0.59356 (0.59449)	Top-1 acc 67.578 (63.346)	Top-5 acc 86.328 (83.712)	lr 0.00680
Train [79][250/3239]	Time 0.258 (1.024)	Data Time 0.001 (0.369)	Loss 2.5080 (2.5109)	Entropy 0.59355 (0.59445)	Top-1 acc 64.844 (63.373)	Top-5 acc 83.203 (83.723)	lr 0.00680
Train [79][260/3239]	Time 0.242 (1.010)	Data Time 0.001 (0.364)	Loss 2.4103 (2.5112)	Entropy 0.59350 (0.59442)	Top-1 acc 65.625 (63.325)	Top-5 acc 85.938 (83.713)	lr 0.00680
Train [79][270/3239]	Time 0.241 (0.993)	Data Time 0.001 (0.356)	Loss 2.5459 (2.5097)	Entropy 0.59370 (0.59438)	Top-1 acc 61.328 (63.418)	Top-5 acc 81.641 (83.729)	lr 0.00680
Train [79][280/3239]	Time 0.300 (0.994)	Data Time 0.001 (0.364)	Loss 2.6540 (2.5086)	Entropy 0.59362 (0.59435)	Top-1 acc 54.688 (63.424)	Top-5 acc 81.250 (83.763)	lr 0.00680
Train [79][290/3239]	Time 0.280 (0.984)	Data Time 0.001 (0.360)	Loss 2.6612 (2.5076)	Entropy 0.59354 (0.59433)	Top-1 acc 56.250 (63.437)	Top-5 acc 81.250 (83.758)	lr 0.00680
Train [79][300/3239]	Time 0.233 (0.970)	Data Time 0.001 (0.353)	Loss 2.5030 (2.5078)	Entropy 0.59384 (0.59430)	Top-1 acc 66.016 (63.451)	Top-5 acc 85.938 (83.742)	lr 0.00680
Train [79][310/3239]	Time 0.232 (0.978)	Data Time 0.001 (0.367)	Loss 2.3357 (2.5085)	Entropy 0.59347 (0.59428)	Top-1 acc 67.969 (63.434)	Top-5 acc 86.719 (83.717)	lr 0.00680
Train [79][320/3239]	Time 0.252 (0.965)	Data Time 0.001 (0.361)	Loss 2.4515 (2.5078)	Entropy 0.59341 (0.59425)	Top-1 acc 62.891 (63.439)	Top-5 acc 83.203 (83.692)	lr 0.00680
Train [79][330/3239]	Time 0.233 (0.950)	Data Time 0.001 (0.350)	Loss 2.5586 (2.5076)	Entropy 0.59351 (0.59423)	Top-1 acc 62.500 (63.433)	Top-5 acc 82.422 (83.693)	lr 0.00680
Train [79][340/3239]	Time 0.551 (0.963)	Data Time 0.309 (0.368)	Loss 2.4996 (2.5077)	Entropy 0.59367 (0.59421)	Top-1 acc 61.719 (63.406)	Top-5 acc 82.812 (83.690)	lr 0.00679
Train [79][350/3239]	Time 0.330 (0.965)	Data Time 0.001 (0.375)	Loss 2.5061 (2.5064)	Entropy 0.59319 (0.59419)	Top-1 acc 62.109 (63.462)	Top-5 acc 83.203 (83.701)	lr 0.00679
Train [79][360/3239]	Time 0.258 (0.950)	Data Time 0.001 (0.365)	Loss 2.4950 (2.5038)	Entropy 0.59316 (0.59416)	Top-1 acc 62.891 (63.545)	Top-5 acc 83.984 (83.740)	lr 0.00679
Train [79][370/3239]	Time 5.108 (0.951)	Data Time 4.852 (0.370)	Loss 2.5384 (2.5026)	Entropy 0.59332 (0.59413)	Top-1 acc 61.328 (63.574)	Top-5 acc 83.594 (83.761)	lr 0.00679
Train [79][380/3239]	Time 0.262 (0.957)	Data Time 0.001 (0.378)	Loss 2.5663 (2.5007)	Entropy 0.59357 (0.59411)	Top-1 acc 64.844 (63.635)	Top-5 acc 82.812 (83.781)	lr 0.00679
Train [79][390/3239]	Time 0.234 (0.943)	Data Time 0.001 (0.368)	Loss 2.3473 (2.5008)	Entropy 0.59376 (0.59410)	Top-1 acc 67.188 (63.605)	Top-5 acc 88.672 (83.780)	lr 0.00679
Train [79][400/3239]	Time 0.271 (0.930)	Data Time 0.001 (0.359)	Loss 2.4210 (2.5007)	Entropy 0.59361 (0.59409)	Top-1 acc 66.797 (63.630)	Top-5 acc 85.156 (83.788)	lr 0.00679
Train [79][410/3239]	Time 0.258 (0.932)	Data Time 0.002 (0.364)	Loss 2.3553 (2.4988)	Entropy 0.59370 (0.59408)	Top-1 acc 66.016 (63.697)	Top-5 acc 87.891 (83.815)	lr 0.00679
Train [79][420/3239]	Time 0.340 (0.926)	Data Time 0.001 (0.361)	Loss 2.3492 (2.4995)	Entropy 0.59353 (0.59407)	Top-1 acc 67.578 (63.680)	Top-5 acc 87.500 (83.811)	lr 0.00679
Train [79][430/3239]	Time 0.278 (0.922)	Data Time 0.001 (0.361)	Loss 2.6452 (2.4993)	Entropy 0.59387 (0.59406)	Top-1 acc 63.672 (63.707)	Top-5 acc 79.688 (83.800)	lr 0.00679
Train [79][440/3239]	Time 0.236 (0.928)	Data Time 0.001 (0.370)	Loss 2.5727 (2.5002)	Entropy 0.59383 (0.59405)	Top-1 acc 63.281 (63.667)	Top-5 acc 80.859 (83.808)	lr 0.00679
Train [79][450/3239]	Time 0.243 (0.926)	Data Time 0.001 (0.371)	Loss 2.4579 (2.5008)	Entropy 0.59391 (0.59405)	Top-1 acc 66.016 (63.661)	Top-5 acc 83.594 (83.812)	lr 0.00678
Train [79][460/3239]	Time 0.252 (0.916)	Data Time 0.001 (0.363)	Loss 2.5247 (2.5009)	Entropy 0.59371 (0.59404)	Top-1 acc 64.844 (63.661)	Top-5 acc 82.812 (83.804)	lr 0.00678
Train [79][470/3239]	Time 0.241 (0.927)	Data Time 0.001 (0.376)	Loss 2.6569 (2.5020)	Entropy 0.59360 (0.59404)	Top-1 acc 62.891 (63.635)	Top-5 acc 82.812 (83.776)	lr 0.00678
Train [79][480/3239]	Time 0.237 (0.925)	Data Time 0.001 (0.377)	Loss 2.4657 (2.5001)	Entropy 0.59367 (0.59403)	Top-1 acc 65.625 (63.679)	Top-5 acc 82.422 (83.804)	lr 0.00678
Train [79][490/3239]	Time 0.267 (0.915)	Data Time 0.001 (0.369)	Loss 2.4463 (2.5006)	Entropy 0.59336 (0.59402)	Top-1 acc 65.625 (63.688)	Top-5 acc 83.203 (83.797)	lr 0.00678
Train [79][500/3239]	Time 1.363 (0.923)	Data Time 1.114 (0.380)	Loss 2.7049 (2.5004)	Entropy 0.59321 (0.59401)	Top-1 acc 61.328 (63.694)	Top-5 acc 79.297 (83.782)	lr 0.00678
Train [79][510/3239]	Time 0.335 (0.927)	Data Time 0.001 (0.386)	Loss 2.3930 (2.5003)	Entropy 0.59338 (0.59399)	Top-1 acc 67.969 (63.699)	Top-5 acc 86.328 (83.783)	lr 0.00678
Train [79][520/3239]	Time 0.243 (0.920)	Data Time 0.001 (0.381)	Loss 2.3283 (2.4986)	Entropy 0.59337 (0.59398)	Top-1 acc 69.531 (63.729)	Top-5 acc 85.156 (83.811)	lr 0.00678
Train [79][530/3239]	Time 6.850 (0.923)	Data Time 6.605 (0.386)	Loss 2.4037 (2.4981)	Entropy 0.59282 (0.59397)	Top-1 acc 66.016 (63.755)	Top-5 acc 86.328 (83.817)	lr 0.00678
Train [79][540/3239]	Time 0.237 (0.934)	Data Time 0.001 (0.400)	Loss 2.4038 (2.4991)	Entropy 0.59312 (0.59395)	Top-1 acc 64.453 (63.721)	Top-5 acc 85.547 (83.808)	lr 0.00678
Train [79][550/3239]	Time 0.404 (0.925)	Data Time 0.144 (0.393)	Loss 2.3481 (2.4983)	Entropy 0.59328 (0.59394)	Top-1 acc 69.531 (63.752)	Top-5 acc 87.109 (83.828)	lr 0.00678
Train [79][560/3239]	Time 0.228 (0.916)	Data Time 0.001 (0.386)	Loss 2.5699 (2.4971)	Entropy 0.59316 (0.59392)	Top-1 acc 64.844 (63.793)	Top-5 acc 80.078 (83.850)	lr 0.00677
Train [79][570/3239]	Time 6.125 (0.936)	Data Time 5.843 (0.407)	Loss 2.3482 (2.4970)	Entropy 0.59286 (0.59391)	Top-1 acc 70.703 (63.817)	Top-5 acc 87.109 (83.860)	lr 0.00677
Train [79][580/3239]	Time 0.372 (0.930)	Data Time 0.001 (0.403)	Loss 2.5576 (2.4968)	Entropy 0.59273 (0.59389)	Top-1 acc 60.547 (63.816)	Top-5 acc 82.422 (83.853)	lr 0.00677
Train [79][590/3239]	Time 0.245 (0.926)	Data Time 0.001 (0.401)	Loss 2.4026 (2.4972)	Entropy 0.59270 (0.59387)	Top-1 acc 62.891 (63.799)	Top-5 acc 86.328 (83.840)	lr 0.00677
Train [79][600/3239]	Time 0.243 (0.932)	Data Time 0.001 (0.408)	Loss 2.4398 (2.4961)	Entropy 0.59296 (0.59385)	Top-1 acc 67.969 (63.827)	Top-5 acc 85.156 (83.856)	lr 0.00677
Train [79][610/3239]	Time 0.226 (0.933)	Data Time 0.001 (0.411)	Loss 2.7001 (2.4960)	Entropy 0.59289 (0.59384)	Top-1 acc 59.766 (63.835)	Top-5 acc 79.297 (83.857)	lr 0.00677
Train [79][620/3239]	Time 0.250 (0.929)	Data Time 0.002 (0.409)	Loss 2.4833 (2.4967)	Entropy 0.59276 (0.59382)	Top-1 acc 63.281 (63.809)	Top-5 acc 83.984 (83.838)	lr 0.00677
Train [79][630/3239]	Time 0.252 (0.932)	Data Time 0.001 (0.412)	Loss 2.3815 (2.4966)	Entropy 0.59267 (0.59381)	Top-1 acc 66.797 (63.821)	Top-5 acc 85.547 (83.831)	lr 0.00677
Train [79][640/3239]	Time 0.248 (0.933)	Data Time 0.001 (0.415)	Loss 2.5133 (2.4958)	Entropy 0.59251 (0.59379)	Top-1 acc 65.625 (63.844)	Top-5 acc 81.250 (83.855)	lr 0.00677
Train [79][650/3239]	Time 0.252 (0.929)	Data Time 0.002 (0.412)	Loss 2.4207 (2.4959)	Entropy 0.59255 (0.59377)	Top-1 acc 65.234 (63.831)	Top-5 acc 83.594 (83.846)	lr 0.00677
Train [79][660/3239]	Time 10.058 (0.937)	Data Time 9.763 (0.422)	Loss 2.5034 (2.4952)	Entropy 0.59220 (0.59375)	Top-1 acc 64.062 (63.854)	Top-5 acc 84.766 (83.864)	lr 0.00677
Train [79][670/3239]	Time 0.316 (0.943)	Data Time 0.001 (0.428)	Loss 2.5615 (2.4960)	Entropy 0.59235 (0.59373)	Top-1 acc 64.453 (63.826)	Top-5 acc 84.375 (83.842)	lr 0.00676
Train [79][680/3239]	Time 0.244 (0.935)	Data Time 0.001 (0.422)	Loss 2.6256 (2.4951)	Entropy 0.59242 (0.59371)	Top-1 acc 58.984 (63.834)	Top-5 acc 82.812 (83.857)	lr 0.00676
Train [79][690/3239]	Time 4.100 (0.937)	Data Time 3.822 (0.425)	Loss 2.4200 (2.4946)	Entropy 0.59228 (0.59369)	Top-1 acc 62.500 (63.842)	Top-5 acc 84.766 (83.864)	lr 0.00676
Train [79][700/3239]	Time 0.241 (0.950)	Data Time 0.001 (0.439)	Loss 2.5533 (2.4966)	Entropy 0.59233 (0.59367)	Top-1 acc 60.938 (63.785)	Top-5 acc 81.641 (83.820)	lr 0.00676
Train [79][710/3239]	Time 0.244 (0.943)	Data Time 0.002 (0.433)	Loss 2.3774 (2.4954)	Entropy 0.59224 (0.59365)	Top-1 acc 67.188 (63.827)	Top-5 acc 85.938 (83.853)	lr 0.00676
Train [79][720/3239]	Time 0.259 (0.936)	Data Time 0.002 (0.427)	Loss 2.5343 (2.4956)	Entropy 0.59205 (0.59363)	Top-1 acc 62.500 (63.822)	Top-5 acc 83.594 (83.848)	lr 0.00676
Train [79][730/3239]	Time 5.097 (0.952)	Data Time 4.825 (0.444)	Loss 2.4317 (2.4961)	Entropy 0.59197 (0.59361)	Top-1 acc 67.969 (63.814)	Top-5 acc 83.984 (83.841)	lr 0.00676
Train [79][740/3239]	Time 0.448 (1.026)	Data Time 0.004 (0.444)	Loss 2.4582 (2.4964)	Entropy 0.59211 (0.59359)	Top-1 acc 62.109 (63.796)	Top-5 acc 85.547 (83.835)	lr 0.00676
Train [79][750/3239]	Time 0.253 (1.018)	Data Time 0.002 (0.438)	Loss 2.4628 (2.4953)	Entropy 0.59219 (0.59357)	Top-1 acc 62.891 (63.816)	Top-5 acc 82.031 (83.852)	lr 0.00676
Train [79][760/3239]	Time 0.253 (1.010)	Data Time 0.002 (0.432)	Loss 2.4464 (2.4951)	Entropy 0.59219 (0.59355)	Top-1 acc 63.281 (63.814)	Top-5 acc 83.984 (83.859)	lr 0.00676
Train [79][770/3239]	Time 0.276 (1.003)	Data Time 0.002 (0.427)	Loss 2.4427 (2.4947)	Entropy 0.59209 (0.59354)	Top-1 acc 63.281 (63.825)	Top-5 acc 83.203 (83.861)	lr 0.00676
Train [79][780/3239]	Time 0.252 (0.995)	Data Time 0.001 (0.421)	Loss 2.5769 (2.4946)	Entropy 0.59211 (0.59352)	Top-1 acc 63.281 (63.829)	Top-5 acc 82.422 (83.858)	lr 0.00676
Train [79][790/3239]	Time 0.239 (0.988)	Data Time 0.001 (0.416)	Loss 2.4655 (2.4941)	Entropy 0.59202 (0.59350)	Top-1 acc 64.453 (63.836)	Top-5 acc 83.984 (83.867)	lr 0.00675
Train [79][800/3239]	Time 0.256 (0.988)	Data Time 0.001 (0.418)	Loss 2.4994 (2.4948)	Entropy 0.59209 (0.59348)	Top-1 acc 62.891 (63.827)	Top-5 acc 83.594 (83.848)	lr 0.00675
Train [79][810/3239]	Time 0.254 (0.985)	Data Time 0.001 (0.415)	Loss 2.4492 (2.4946)	Entropy 0.59214 (0.59346)	Top-1 acc 67.969 (63.821)	Top-5 acc 85.156 (83.853)	lr 0.00675
Train [79][820/3239]	Time 0.658 (0.980)	Data Time 0.400 (0.412)	Loss 2.4253 (2.4946)	Entropy 0.59225 (0.59345)	Top-1 acc 63.672 (63.827)	Top-5 acc 85.156 (83.854)	lr 0.00675
Train [79][830/3239]	Time 0.332 (0.973)	Data Time 0.001 (0.407)	Loss 2.6907 (2.4947)	Entropy 0.59238 (0.59344)	Top-1 acc 60.156 (63.820)	Top-5 acc 80.469 (83.860)	lr 0.00675
Train [79][840/3239]	Time 0.238 (0.991)	Data Time 0.001 (0.426)	Loss 2.6078 (2.4946)	Entropy 0.59222 (0.59342)	Top-1 acc 60.156 (63.818)	Top-5 acc 80.469 (83.859)	lr 0.00675
Train [79][850/3239]	Time 0.250 (0.987)	Data Time 0.001 (0.424)	Loss 2.4599 (2.4949)	Entropy 0.59251 (0.59341)	Top-1 acc 66.797 (63.819)	Top-5 acc 85.547 (83.849)	lr 0.00675
Train [79][860/3239]	Time 0.247 (0.984)	Data Time 0.001 (0.422)	Loss 2.7270 (2.4951)	Entropy 0.59274 (0.59340)	Top-1 acc 58.594 (63.815)	Top-5 acc 80.859 (83.853)	lr 0.00675
Train [79][870/3239]	Time 0.236 (1.001)	Data Time 0.001 (0.441)	Loss 2.3866 (2.4955)	Entropy 0.59264 (0.59339)	Top-1 acc 67.969 (63.812)	Top-5 acc 85.938 (83.850)	lr 0.00675
Train [79][880/3239]	Time 0.253 (0.995)	Data Time 0.001 (0.436)	Loss 2.4120 (2.4962)	Entropy 0.59277 (0.59338)	Top-1 acc 65.625 (63.797)	Top-5 acc 84.375 (83.838)	lr 0.00675
Train [79][890/3239]	Time 0.251 (0.994)	Data Time 0.001 (0.437)	Loss 2.5278 (2.4962)	Entropy 0.59287 (0.59338)	Top-1 acc 65.234 (63.802)	Top-5 acc 82.812 (83.848)	lr 0.00675
Train [79][900/3239]	Time 0.383 (1.012)	Data Time 0.001 (0.456)	Loss 2.4308 (2.4960)	Entropy 0.59271 (0.59337)	Top-1 acc 61.328 (63.802)	Top-5 acc 85.547 (83.846)	lr 0.00674
Train [79][910/3239]	Time 0.266 (1.006)	Data Time 0.001 (0.451)	Loss 2.4812 (2.4960)	Entropy 0.59260 (0.59336)	Top-1 acc 62.500 (63.803)	Top-5 acc 82.031 (83.845)	lr 0.00674
Train [79][920/3239]	Time 0.243 (1.005)	Data Time 0.001 (0.452)	Loss 2.5017 (2.4959)	Entropy 0.59272 (0.59335)	Top-1 acc 60.547 (63.797)	Top-5 acc 84.375 (83.842)	lr 0.00674
Train [79][930/3239]	Time 0.276 (1.018)	Data Time 0.001 (0.466)	Loss 2.4685 (2.4948)	Entropy 0.59282 (0.59335)	Top-1 acc 65.625 (63.828)	Top-5 acc 83.594 (83.859)	lr 0.00674
Train [79][940/3239]	Time 0.247 (1.012)	Data Time 0.001 (0.461)	Loss 2.2725 (2.4947)	Entropy 0.59236 (0.59334)	Top-1 acc 67.969 (63.823)	Top-5 acc 87.891 (83.857)	lr 0.00674
Train [79][950/3239]	Time 0.249 (1.007)	Data Time 0.002 (0.458)	Loss 2.5625 (2.4950)	Entropy 0.59251 (0.59333)	Top-1 acc 61.328 (63.811)	Top-5 acc 85.938 (83.853)	lr 0.00674
Train [79][960/3239]	Time 0.237 (1.009)	Data Time 0.001 (0.461)	Loss 2.4443 (2.4951)	Entropy 0.59196 (0.59332)	Top-1 acc 62.891 (63.813)	Top-5 acc 85.938 (83.847)	lr 0.00674
Train [79][970/3239]	Time 0.275 (1.012)	Data Time 0.001 (0.465)	Loss 2.3793 (2.4953)	Entropy 0.59181 (0.59331)	Top-1 acc 68.359 (63.806)	Top-5 acc 88.281 (83.844)	lr 0.00674
Train [79][980/3239]	Time 0.250 (1.012)	Data Time 0.001 (0.466)	Loss 2.4217 (2.4954)	Entropy 0.59195 (0.59329)	Top-1 acc 67.969 (63.811)	Top-5 acc 84.766 (83.847)	lr 0.00674
Train [79][990/3239]	Time 0.244 (1.006)	Data Time 0.001 (0.461)	Loss 2.2769 (2.4947)	Entropy 0.59201 (0.59328)	Top-1 acc 70.312 (63.825)	Top-5 acc 85.938 (83.857)	lr 0.00674
Train [79][1000/3239]	Time 0.226 (1.014)	Data Time 0.001 (0.470)	Loss 2.4600 (2.4947)	Entropy 0.59174 (0.59327)	Top-1 acc 66.406 (63.830)	Top-5 acc 84.766 (83.861)	lr 0.00674
Train [79][1010/3239]	Time 4.023 (1.011)	Data Time 3.795 (0.469)	Loss 2.6252 (2.4948)	Entropy 0.59212 (0.59325)	Top-1 acc 59.766 (63.824)	Top-5 acc 80.859 (83.859)	lr 0.00673
Train [79][1020/3239]	Time 0.258 (1.006)	Data Time 0.001 (0.465)	Loss 2.4964 (2.4944)	Entropy 0.59211 (0.59324)	Top-1 acc 59.766 (63.843)	Top-5 acc 84.375 (83.867)	lr 0.00673
Train [79][1030/3239]	Time 0.243 (1.020)	Data Time 0.001 (0.480)	Loss 2.5386 (2.4948)	Entropy 0.59174 (0.59323)	Top-1 acc 62.109 (63.831)	Top-5 acc 83.203 (83.860)	lr 0.00673
Train [79][1040/3239]	Time 0.233 (1.014)	Data Time 0.001 (0.475)	Loss 2.6114 (2.4942)	Entropy 0.59175 (0.59321)	Top-1 acc 60.938 (63.839)	Top-5 acc 79.688 (83.865)	lr 0.00673
Train [79][1050/3239]	Time 0.245 (1.008)	Data Time 0.001 (0.471)	Loss 2.3546 (2.4939)	Entropy 0.59171 (0.59320)	Top-1 acc 68.359 (63.838)	Top-5 acc 85.938 (83.870)	lr 0.00673
Train [79][1060/3239]	Time 1.318 (1.014)	Data Time 0.922 (0.477)	Loss 2.2976 (2.4936)	Entropy 0.59165 (0.59319)	Top-1 acc 67.969 (63.846)	Top-5 acc 86.719 (83.882)	lr 0.00673
Train [79][1070/3239]	Time 0.234 (1.017)	Data Time 0.001 (0.481)	Loss 2.4799 (2.4938)	Entropy 0.59156 (0.59317)	Top-1 acc 64.453 (63.845)	Top-5 acc 85.938 (83.887)	lr 0.00673
Train [79][1080/3239]	Time 0.228 (1.012)	Data Time 0.001 (0.478)	Loss 2.4556 (2.4941)	Entropy 0.59182 (0.59316)	Top-1 acc 64.844 (63.838)	Top-5 acc 85.547 (83.886)	lr 0.00673
Train [79][1090/3239]	Time 0.246 (1.016)	Data Time 0.001 (0.483)	Loss 2.3687 (2.4939)	Entropy 0.59146 (0.59314)	Top-1 acc 67.188 (63.843)	Top-5 acc 87.500 (83.898)	lr 0.00673
Train [79][1100/3239]	Time 0.231 (1.018)	Data Time 0.001 (0.486)	Loss 2.5873 (2.4942)	Entropy 0.59162 (0.59313)	Top-1 acc 60.547 (63.833)	Top-5 acc 81.250 (83.894)	lr 0.00673
Train [79][1110/3239]	Time 0.308 (1.013)	Data Time 0.002 (0.481)	Loss 2.6308 (2.4945)	Entropy 0.59130 (0.59311)	Top-1 acc 59.766 (63.832)	Top-5 acc 80.469 (83.886)	lr 0.00673
Train [79][1120/3239]	Time 0.236 (1.018)	Data Time 0.001 (0.487)	Loss 2.5721 (2.4943)	Entropy 0.59123 (0.59310)	Top-1 acc 60.938 (63.840)	Top-5 acc 80.859 (83.885)	lr 0.00672
Train [79][1130/3239]	Time 0.320 (1.020)	Data Time 0.001 (0.490)	Loss 2.4209 (2.4943)	Entropy 0.59103 (0.59308)	Top-1 acc 67.188 (63.840)	Top-5 acc 85.156 (83.886)	lr 0.00672
Train [79][1140/3239]	Time 0.237 (1.019)	Data Time 0.001 (0.490)	Loss 2.5247 (2.4939)	Entropy 0.59106 (0.59306)	Top-1 acc 62.109 (63.846)	Top-5 acc 82.031 (83.895)	lr 0.00672
Train [79][1150/3239]	Time 0.243 (1.014)	Data Time 0.002 (0.486)	Loss 2.5245 (2.4937)	Entropy 0.59094 (0.59305)	Top-1 acc 62.891 (63.852)	Top-5 acc 84.766 (83.896)	lr 0.00672
Train [79][1160/3239]	Time 0.229 (1.022)	Data Time 0.001 (0.495)	Loss 2.4232 (2.4938)	Entropy 0.59105 (0.59303)	Top-1 acc 65.234 (63.853)	Top-5 acc 84.766 (83.891)	lr 0.00672
Train [79][1170/3239]	Time 4.007 (1.021)	Data Time 3.754 (0.495)	Loss 2.4308 (2.4937)	Entropy 0.59122 (0.59301)	Top-1 acc 68.750 (63.853)	Top-5 acc 82.422 (83.894)	lr 0.00672
Train [79][1180/3239]	Time 0.243 (1.016)	Data Time 0.001 (0.490)	Loss 2.2785 (2.4937)	Entropy 0.59104 (0.59300)	Top-1 acc 70.312 (63.856)	Top-5 acc 88.281 (83.895)	lr 0.00672
Train [79][1190/3239]	Time 0.257 (1.027)	Data Time 0.003 (0.503)	Loss 2.7674 (2.4935)	Entropy 0.59143 (0.59298)	Top-1 acc 57.031 (63.859)	Top-5 acc 80.859 (83.903)	lr 0.00672
Train [79][1200/3239]	Time 0.240 (1.022)	Data Time 0.001 (0.498)	Loss 2.7869 (2.4942)	Entropy 0.59121 (0.59297)	Top-1 acc 58.594 (63.836)	Top-5 acc 76.562 (83.889)	lr 0.00672
Train [79][1210/3239]	Time 0.236 (1.019)	Data Time 0.003 (0.497)	Loss 2.6349 (2.4939)	Entropy 0.59073 (0.59295)	Top-1 acc 57.812 (63.841)	Top-5 acc 78.516 (83.893)	lr 0.00672
Train [79][1220/3239]	Time 3.249 (1.028)	Data Time 2.886 (0.506)	Loss 2.5619 (2.4939)	Entropy 0.59040 (0.59293)	Top-1 acc 62.500 (63.832)	Top-5 acc 81.641 (83.892)	lr 0.00672
Train [79][1230/3239]	Time 0.256 (1.023)	Data Time 0.001 (0.502)	Loss 2.5117 (2.4939)	Entropy 0.58986 (0.59291)	Top-1 acc 64.062 (63.832)	Top-5 acc 82.422 (83.891)	lr 0.00671
Train [79][1240/3239]	Time 0.258 (1.025)	Data Time 0.001 (0.505)	Loss 2.7314 (2.4937)	Entropy 0.58967 (0.59289)	Top-1 acc 58.594 (63.841)	Top-5 acc 81.250 (83.902)	lr 0.00671
Train [79][1250/3239]	Time 0.238 (1.030)	Data Time 0.001 (0.510)	Loss 2.4857 (2.4938)	Entropy 0.58971 (0.59286)	Top-1 acc 64.453 (63.835)	Top-5 acc 83.594 (83.900)	lr 0.00671
Train [79][1260/3239]	Time 0.241 (1.028)	Data Time 0.001 (0.509)	Loss 2.4119 (2.4933)	Entropy 0.58910 (0.59283)	Top-1 acc 66.406 (63.852)	Top-5 acc 84.375 (83.910)	lr 0.00671
Train [79][1270/3239]	Time 0.247 (1.029)	Data Time 0.001 (0.511)	Loss 2.4816 (2.4932)	Entropy 0.58897 (0.59280)	Top-1 acc 59.766 (63.858)	Top-5 acc 84.766 (83.911)	lr 0.00671
Train [79][1280/3239]	Time 0.241 (1.024)	Data Time 0.001 (0.507)	Loss 2.2840 (2.4928)	Entropy 0.58898 (0.59278)	Top-1 acc 69.141 (63.872)	Top-5 acc 88.672 (83.919)	lr 0.00671
Train [79][1290/3239]	Time 0.370 (1.032)	Data Time 0.001 (0.515)	Loss 2.4352 (2.4927)	Entropy 0.58885 (0.59274)	Top-1 acc 64.453 (63.875)	Top-5 acc 85.156 (83.924)	lr 0.00671
Train [79][1300/3239]	Time 0.251 (1.036)	Data Time 0.001 (0.519)	Loss 2.5657 (2.4927)	Entropy 0.58897 (0.59272)	Top-1 acc 64.062 (63.878)	Top-5 acc 82.031 (83.923)	lr 0.00671
Train [79][1310/3239]	Time 0.249 (1.031)	Data Time 0.001 (0.515)	Loss 2.4439 (2.4925)	Entropy 0.58925 (0.59269)	Top-1 acc 61.328 (63.882)	Top-5 acc 83.203 (83.932)	lr 0.00671
Train [79][1320/3239]	Time 0.232 (1.037)	Data Time 0.001 (0.522)	Loss 2.5350 (2.4922)	Entropy 0.58912 (0.59266)	Top-1 acc 63.281 (63.888)	Top-5 acc 80.469 (83.937)	lr 0.00671
Train [79][1330/3239]	Time 3.144 (1.037)	Data Time 2.893 (0.523)	Loss 2.5679 (2.4920)	Entropy 0.58882 (0.59263)	Top-1 acc 60.156 (63.892)	Top-5 acc 80.859 (83.943)	lr 0.00671
Train [79][1340/3239]	Time 0.254 (1.033)	Data Time 0.001 (0.519)	Loss 2.3302 (2.4922)	Entropy 0.58893 (0.59261)	Top-1 acc 67.578 (63.883)	Top-5 acc 87.109 (83.946)	lr 0.00670
Train [79][1350/3239]	Time 0.234 (1.040)	Data Time 0.001 (0.527)	Loss 2.4289 (2.4923)	Entropy 0.58879 (0.59258)	Top-1 acc 66.406 (63.884)	Top-5 acc 84.375 (83.936)	lr 0.00670
Train [79][1360/3239]	Time 0.238 (1.038)	Data Time 0.001 (0.525)	Loss 2.3873 (2.4925)	Entropy 0.58912 (0.59255)	Top-1 acc 64.844 (63.883)	Top-5 acc 85.547 (83.932)	lr 0.00670
Train [79][1370/3239]	Time 0.235 (1.035)	Data Time 0.001 (0.522)	Loss 2.3273 (2.4924)	Entropy 0.58924 (0.59253)	Top-1 acc 66.406 (63.885)	Top-5 acc 86.719 (83.938)	lr 0.00670
Train [79][1380/3239]	Time 0.287 (1.043)	Data Time 0.002 (0.531)	Loss 2.3160 (2.4920)	Entropy 0.58900 (0.59250)	Top-1 acc 67.188 (63.890)	Top-5 acc 88.281 (83.949)	lr 0.00670
Train [79][1390/3239]	Time 0.337 (1.078)	Data Time 0.004 (0.527)	Loss 2.5336 (2.4917)	Entropy 0.58965 (0.59248)	Top-1 acc 61.719 (63.895)	Top-5 acc 83.594 (83.956)	lr 0.00670
Train [79][1400/3239]	Time 0.246 (1.074)	Data Time 0.002 (0.523)	Loss 2.4493 (2.4916)	Entropy 0.58979 (0.59246)	Top-1 acc 67.578 (63.904)	Top-5 acc 84.375 (83.960)	lr 0.00670
Train [79][1410/3239]	Time 0.241 (1.069)	Data Time 0.002 (0.520)	Loss 2.2968 (2.4912)	Entropy 0.58997 (0.59244)	Top-1 acc 67.188 (63.914)	Top-5 acc 88.281 (83.971)	lr 0.00670
Train [79][1420/3239]	Time 0.240 (1.064)	Data Time 0.001 (0.516)	Loss 2.6789 (2.4913)	Entropy 0.59029 (0.59242)	Top-1 acc 58.984 (63.905)	Top-5 acc 79.688 (83.967)	lr 0.00670
Train [79][1430/3239]	Time 0.244 (1.060)	Data Time 0.001 (0.513)	Loss 2.4094 (2.4911)	Entropy 0.59001 (0.59241)	Top-1 acc 64.844 (63.912)	Top-5 acc 83.594 (83.970)	lr 0.00670
Train [79][1440/3239]	Time 0.221 (1.055)	Data Time 0.001 (0.509)	Loss 2.4353 (2.4910)	Entropy 0.59010 (0.59239)	Top-1 acc 64.062 (63.905)	Top-5 acc 84.375 (83.967)	lr 0.00670
Train [79][1450/3239]	Time 0.333 (1.051)	Data Time 0.001 (0.505)	Loss 2.3313 (2.4914)	Entropy 0.59028 (0.59238)	Top-1 acc 69.531 (63.904)	Top-5 acc 85.938 (83.959)	lr 0.00670
Train [79][1460/3239]	Time 0.682 (1.054)	Data Time 0.412 (0.509)	Loss 2.5679 (2.4913)	Entropy 0.59016 (0.59236)	Top-1 acc 61.328 (63.904)	Top-5 acc 80.469 (83.967)	lr 0.00669
Train [79][1470/3239]	Time 0.252 (1.052)	Data Time 0.001 (0.508)	Loss 2.6030 (2.4914)	Entropy 0.59047 (0.59235)	Top-1 acc 62.891 (63.898)	Top-5 acc 83.984 (83.968)	lr 0.00669
Train [79][1480/3239]	Time 0.243 (1.049)	Data Time 0.001 (0.505)	Loss 2.7968 (2.4916)	Entropy 0.59056 (0.59234)	Top-1 acc 57.422 (63.892)	Top-5 acc 78.906 (83.965)	lr 0.00669
Train [79][1490/3239]	Time 0.284 (1.056)	Data Time 0.001 (0.513)	Loss 2.5573 (2.4918)	Entropy 0.59028 (0.59232)	Top-1 acc 64.844 (63.889)	Top-5 acc 82.031 (83.963)	lr 0.00669
Train [79][1500/3239]	Time 0.239 (1.055)	Data Time 0.001 (0.513)	Loss 2.3857 (2.4919)	Entropy 0.59016 (0.59231)	Top-1 acc 67.969 (63.883)	Top-5 acc 85.156 (83.965)	lr 0.00669
Train [79][1510/3239]	Time 0.234 (1.051)	Data Time 0.001 (0.509)	Loss 2.5247 (2.4915)	Entropy 0.59006 (0.59230)	Top-1 acc 61.719 (63.887)	Top-5 acc 82.422 (83.967)	lr 0.00669
Train [79][1520/3239]	Time 0.263 (1.059)	Data Time 0.001 (0.518)	Loss 2.4686 (2.4917)	Entropy 0.59013 (0.59228)	Top-1 acc 66.406 (63.878)	Top-5 acc 82.812 (83.966)	lr 0.00669
Train [79][1530/3239]	Time 0.250 (1.059)	Data Time 0.001 (0.518)	Loss 2.3701 (2.4915)	Entropy 0.58995 (0.59227)	Top-1 acc 66.016 (63.876)	Top-5 acc 86.719 (83.969)	lr 0.00669
Train [79][1540/3239]	Time 0.264 (1.056)	Data Time 0.001 (0.516)	Loss 2.4551 (2.4916)	Entropy 0.58970 (0.59225)	Top-1 acc 64.453 (63.872)	Top-5 acc 82.812 (83.969)	lr 0.00669
Train [79][1550/3239]	Time 7.490 (1.057)	Data Time 7.235 (0.517)	Loss 2.5114 (2.4913)	Entropy 0.58959 (0.59223)	Top-1 acc 62.500 (63.877)	Top-5 acc 81.250 (83.977)	lr 0.00669
Train [79][1560/3239]	Time 0.299 (1.061)	Data Time 0.002 (0.523)	Loss 2.7042 (2.4918)	Entropy 0.58923 (0.59222)	Top-1 acc 58.203 (63.854)	Top-5 acc 80.859 (83.973)	lr 0.00669
Train [79][1570/3239]	Time 0.287 (1.058)	Data Time 0.001 (0.520)	Loss 2.4639 (2.4923)	Entropy 0.58920 (0.59220)	Top-1 acc 64.844 (63.840)	Top-5 acc 83.203 (83.968)	lr 0.00668
Train [79][1580/3239]	Time 0.249 (1.055)	Data Time 0.002 (0.518)	Loss 2.6698 (2.4920)	Entropy 0.58886 (0.59218)	Top-1 acc 63.281 (63.848)	Top-5 acc 80.078 (83.968)	lr 0.00668
Train [79][1590/3239]	Time 0.237 (1.063)	Data Time 0.001 (0.527)	Loss 2.6142 (2.4923)	Entropy 0.58892 (0.59216)	Top-1 acc 59.375 (63.841)	Top-5 acc 82.031 (83.959)	lr 0.00668
Train [79][1600/3239]	Time 0.242 (1.062)	Data Time 0.001 (0.526)	Loss 2.4430 (2.4919)	Entropy 0.58901 (0.59214)	Top-1 acc 63.672 (63.848)	Top-5 acc 86.328 (83.971)	lr 0.00668
Train [79][1610/3239]	Time 0.358 (1.058)	Data Time 0.002 (0.523)	Loss 2.4561 (2.4921)	Entropy 0.58905 (0.59212)	Top-1 acc 66.406 (63.840)	Top-5 acc 85.156 (83.972)	lr 0.00668
Train [79][1620/3239]	Time 0.278 (1.066)	Data Time 0.001 (0.532)	Loss 2.4733 (2.4925)	Entropy 0.58892 (0.59210)	Top-1 acc 66.016 (63.842)	Top-5 acc 85.547 (83.965)	lr 0.00668
Train [79][1630/3239]	Time 0.231 (1.062)	Data Time 0.001 (0.528)	Loss 2.5634 (2.4922)	Entropy 0.58911 (0.59208)	Top-1 acc 61.719 (63.851)	Top-5 acc 83.984 (83.969)	lr 0.00668
Train [79][1640/3239]	Time 0.244 (1.060)	Data Time 0.001 (0.527)	Loss 2.6029 (2.4923)	Entropy 0.58895 (0.59206)	Top-1 acc 59.766 (63.849)	Top-5 acc 80.469 (83.968)	lr 0.00668
Train [79][1650/3239]	Time 0.259 (1.069)	Data Time 0.001 (0.537)	Loss 2.6228 (2.4924)	Entropy 0.58912 (0.59204)	Top-1 acc 63.672 (63.850)	Top-5 acc 82.031 (83.968)	lr 0.00668
Train [79][1660/3239]	Time 0.237 (1.066)	Data Time 0.001 (0.534)	Loss 2.6538 (2.4928)	Entropy 0.58940 (0.59203)	Top-1 acc 60.156 (63.835)	Top-5 acc 82.422 (83.968)	lr 0.00668
Train [79][1670/3239]	Time 0.241 (1.063)	Data Time 0.001 (0.532)	Loss 2.5299 (2.4926)	Entropy 0.58965 (0.59201)	Top-1 acc 59.375 (63.838)	Top-5 acc 83.594 (83.970)	lr 0.00668
Train [79][1680/3239]	Time 1.729 (1.068)	Data Time 1.292 (0.537)	Loss 2.4650 (2.4927)	Entropy 0.58936 (0.59200)	Top-1 acc 66.797 (63.840)	Top-5 acc 85.156 (83.966)	lr 0.00667
Train [79][1690/3239]	Time 0.239 (1.069)	Data Time 0.001 (0.539)	Loss 2.5040 (2.4925)	Entropy 0.58925 (0.59198)	Top-1 acc 64.062 (63.845)	Top-5 acc 83.594 (83.969)	lr 0.00667
Train [79][1700/3239]	Time 0.251 (1.066)	Data Time 0.001 (0.537)	Loss 2.5735 (2.4927)	Entropy 0.58905 (0.59196)	Top-1 acc 61.328 (63.843)	Top-5 acc 81.250 (83.962)	lr 0.00667
Train [79][1710/3239]	Time 15.404 (1.072)	Data Time 15.142 (0.542)	Loss 2.3979 (2.4929)	Entropy 0.58912 (0.59195)	Top-1 acc 65.625 (63.834)	Top-5 acc 82.812 (83.958)	lr 0.00667
Train [79][1720/3239]	Time 0.244 (1.070)	Data Time 0.001 (0.541)	Loss 2.3419 (2.4929)	Entropy 0.58918 (0.59193)	Top-1 acc 66.406 (63.833)	Top-5 acc 87.500 (83.958)	lr 0.00667
Train [79][1730/3239]	Time 0.236 (1.071)	Data Time 0.001 (0.543)	Loss 2.7862 (2.4931)	Entropy 0.58937 (0.59191)	Top-1 acc 53.906 (63.822)	Top-5 acc 76.172 (83.950)	lr 0.00667
Train [79][1740/3239]	Time 0.235 (1.068)	Data Time 0.001 (0.541)	Loss 2.6623 (2.4932)	Entropy 0.58888 (0.59190)	Top-1 acc 60.547 (63.824)	Top-5 acc 82.031 (83.951)	lr 0.00667
Train [79][1750/3239]	Time 0.227 (1.075)	Data Time 0.001 (0.548)	Loss 2.6647 (2.4931)	Entropy 0.58892 (0.59188)	Top-1 acc 58.984 (63.825)	Top-5 acc 80.078 (83.950)	lr 0.00667
Train [79][1760/3239]	Time 0.237 (1.074)	Data Time 0.001 (0.548)	Loss 2.6097 (2.4934)	Entropy 0.58865 (0.59186)	Top-1 acc 58.984 (63.812)	Top-5 acc 80.469 (83.946)	lr 0.00667
Train [79][1770/3239]	Time 0.331 (1.072)	Data Time 0.001 (0.547)	Loss 2.3463 (2.4933)	Entropy 0.58875 (0.59185)	Top-1 acc 68.750 (63.818)	Top-5 acc 85.938 (83.948)	lr 0.00667
Train [79][1780/3239]	Time 0.247 (1.078)	Data Time 0.001 (0.553)	Loss 2.4088 (2.4930)	Entropy 0.58897 (0.59183)	Top-1 acc 67.969 (63.819)	Top-5 acc 86.328 (83.955)	lr 0.00667
Train [79][1790/3239]	Time 0.234 (1.080)	Data Time 0.001 (0.555)	Loss 2.4855 (2.4931)	Entropy 0.58927 (0.59181)	Top-1 acc 61.719 (63.818)	Top-5 acc 84.766 (83.953)	lr 0.00666
Train [79][1800/3239]	Time 0.224 (1.077)	Data Time 0.001 (0.553)	Loss 2.5574 (2.4932)	Entropy 0.58926 (0.59180)	Top-1 acc 60.547 (63.820)	Top-5 acc 82.812 (83.949)	lr 0.00666
Train [79][1810/3239]	Time 0.240 (1.082)	Data Time 0.001 (0.559)	Loss 2.2842 (2.4935)	Entropy 0.58916 (0.59179)	Top-1 acc 67.969 (63.806)	Top-5 acc 87.891 (83.945)	lr 0.00666
Train [79][1820/3239]	Time 0.282 (1.085)	Data Time 0.002 (0.563)	Loss 2.7032 (2.4936)	Entropy 0.58942 (0.59177)	Top-1 acc 59.375 (63.802)	Top-5 acc 81.641 (83.940)	lr 0.00666
Train [79][1830/3239]	Time 0.228 (1.083)	Data Time 0.001 (0.561)	Loss 2.4623 (2.4937)	Entropy 0.58943 (0.59176)	Top-1 acc 67.188 (63.800)	Top-5 acc 86.328 (83.940)	lr 0.00666
Train [79][1840/3239]	Time 0.329 (1.081)	Data Time 0.001 (0.560)	Loss 2.3709 (2.4940)	Entropy 0.58932 (0.59175)	Top-1 acc 66.406 (63.797)	Top-5 acc 85.938 (83.936)	lr 0.00666
Train [79][1850/3239]	Time 10.605 (1.088)	Data Time 10.320 (0.567)	Loss 2.4093 (2.4940)	Entropy 0.58936 (0.59173)	Top-1 acc 67.578 (63.798)	Top-5 acc 86.328 (83.935)	lr 0.00666
Train [79][1860/3239]	Time 0.231 (1.085)	Data Time 0.001 (0.565)	Loss 2.4187 (2.4939)	Entropy 0.58923 (0.59172)	Top-1 acc 64.062 (63.801)	Top-5 acc 88.281 (83.939)	lr 0.00666
Train [79][1870/3239]	Time 3.620 (1.083)	Data Time 3.332 (0.563)	Loss 2.4098 (2.4938)	Entropy 0.58920 (0.59171)	Top-1 acc 66.406 (63.802)	Top-5 acc 84.766 (83.941)	lr 0.00666
Train [79][1880/3239]	Time 0.240 (1.084)	Data Time 0.001 (0.565)	Loss 2.5152 (2.4937)	Entropy 0.58949 (0.59170)	Top-1 acc 59.766 (63.801)	Top-5 acc 86.328 (83.944)	lr 0.00666
Train [79][1890/3239]	Time 0.238 (1.089)	Data Time 0.001 (0.570)	Loss 2.5162 (2.4936)	Entropy 0.58936 (0.59168)	Top-1 acc 62.109 (63.793)	Top-5 acc 84.766 (83.948)	lr 0.00666
Train [79][1900/3239]	Time 0.254 (1.086)	Data Time 0.001 (0.567)	Loss 2.4276 (2.4936)	Entropy 0.58893 (0.59167)	Top-1 acc 67.188 (63.801)	Top-5 acc 84.766 (83.948)	lr 0.00665
Train [79][1910/3239]	Time 1.493 (1.091)	Data Time 1.248 (0.573)	Loss 2.3922 (2.4937)	Entropy 0.58905 (0.59166)	Top-1 acc 66.016 (63.801)	Top-5 acc 83.984 (83.945)	lr 0.00665
Train [79][1920/3239]	Time 0.246 (1.092)	Data Time 0.001 (0.575)	Loss 2.3278 (2.4933)	Entropy 0.58943 (0.59164)	Top-1 acc 67.969 (63.810)	Top-5 acc 87.891 (83.954)	lr 0.00665
Train [79][1930/3239]	Time 0.339 (1.091)	Data Time 0.001 (0.574)	Loss 2.1788 (2.4929)	Entropy 0.58923 (0.59163)	Top-1 acc 71.094 (63.820)	Top-5 acc 91.016 (83.964)	lr 0.00665
Train [79][1940/3239]	Time 0.648 (1.094)	Data Time 0.415 (0.578)	Loss 2.5892 (2.4929)	Entropy 0.58926 (0.59162)	Top-1 acc 60.547 (63.817)	Top-5 acc 82.812 (83.966)	lr 0.00665
Train [79][1950/3239]	Time 0.263 (1.097)	Data Time 0.001 (0.581)	Loss 2.6543 (2.4930)	Entropy 0.58936 (0.59161)	Top-1 acc 61.328 (63.809)	Top-5 acc 81.641 (83.966)	lr 0.00665
Train [79][1960/3239]	Time 0.236 (1.094)	Data Time 0.001 (0.578)	Loss 2.6517 (2.4931)	Entropy 0.58899 (0.59159)	Top-1 acc 59.766 (63.809)	Top-5 acc 80.078 (83.968)	lr 0.00665
Train [79][1970/3239]	Time 0.274 (1.096)	Data Time 0.002 (0.581)	Loss 2.4621 (2.4930)	Entropy 0.58913 (0.59158)	Top-1 acc 63.281 (63.808)	Top-5 acc 81.641 (83.972)	lr 0.00665
Train [79][1980/3239]	Time 0.228 (1.097)	Data Time 0.001 (0.583)	Loss 2.3400 (2.4926)	Entropy 0.58932 (0.59157)	Top-1 acc 67.188 (63.813)	Top-5 acc 89.062 (83.980)	lr 0.00665
Train [79][1990/3239]	Time 0.239 (1.095)	Data Time 0.001 (0.581)	Loss 2.3922 (2.4924)	Entropy 0.58945 (0.59156)	Top-1 acc 68.750 (63.825)	Top-5 acc 85.547 (83.982)	lr 0.00665
Train [79][2000/3239]	Time 0.355 (1.096)	Data Time 0.002 (0.582)	Loss 2.8410 (2.4927)	Entropy 0.58980 (0.59155)	Top-1 acc 53.906 (63.819)	Top-5 acc 78.906 (83.974)	lr 0.00665
Train [79][2010/3239]	Time 4.038 (1.100)	Data Time 3.758 (0.587)	Loss 2.5090 (2.4926)	Entropy 0.58984 (0.59154)	Top-1 acc 59.375 (63.817)	Top-5 acc 82.812 (83.975)	lr 0.00664
Train [79][2020/3239]	Time 0.463 (1.097)	Data Time 0.113 (0.584)	Loss 2.2977 (2.4922)	Entropy 0.58980 (0.59153)	Top-1 acc 65.625 (63.827)	Top-5 acc 87.109 (83.984)	lr 0.00664
Train [79][2030/3239]	Time 11.958 (1.099)	Data Time 11.697 (0.587)	Loss 2.4356 (2.4921)	Entropy 0.58977 (0.59152)	Top-1 acc 66.406 (63.831)	Top-5 acc 83.984 (83.989)	lr 0.00664
Train [79][2040/3239]	Time 0.250 (1.100)	Data Time 0.001 (0.588)	Loss 2.4398 (2.4922)	Entropy 0.58988 (0.59151)	Top-1 acc 62.500 (63.830)	Top-5 acc 85.547 (83.990)	lr 0.00664
Train [79][2050/3239]	Time 0.301 (1.126)	Data Time 0.002 (0.586)	Loss 2.4879 (2.4925)	Entropy 0.59020 (0.59151)	Top-1 acc 62.891 (63.822)	Top-5 acc 83.594 (83.983)	lr 0.00664
Train [79][2060/3239]	Time 0.234 (1.122)	Data Time 0.002 (0.584)	Loss 2.4356 (2.4927)	Entropy 0.59049 (0.59150)	Top-1 acc 65.625 (63.815)	Top-5 acc 85.156 (83.977)	lr 0.00664
Train [79][2070/3239]	Time 0.260 (1.119)	Data Time 0.002 (0.581)	Loss 2.4389 (2.4926)	Entropy 0.59054 (0.59150)	Top-1 acc 65.625 (63.815)	Top-5 acc 83.594 (83.976)	lr 0.00664
Train [79][2080/3239]	Time 0.287 (1.116)	Data Time 0.002 (0.578)	Loss 2.3650 (2.4925)	Entropy 0.59067 (0.59149)	Top-1 acc 66.016 (63.815)	Top-5 acc 87.109 (83.980)	lr 0.00664
Train [79][2090/3239]	Time 0.400 (1.113)	Data Time 0.001 (0.575)	Loss 2.3383 (2.4925)	Entropy 0.59056 (0.59149)	Top-1 acc 67.188 (63.810)	Top-5 acc 87.891 (83.984)	lr 0.00664
Train [79][2100/3239]	Time 0.242 (1.110)	Data Time 0.001 (0.573)	Loss 2.3753 (2.4925)	Entropy 0.59061 (0.59148)	Top-1 acc 67.188 (63.812)	Top-5 acc 85.547 (83.983)	lr 0.00664
Train [79][2110/3239]	Time 0.275 (1.107)	Data Time 0.001 (0.570)	Loss 2.3610 (2.4923)	Entropy 0.59023 (0.59148)	Top-1 acc 67.188 (63.818)	Top-5 acc 86.719 (83.983)	lr 0.00664
Train [79][2120/3239]	Time 0.240 (1.104)	Data Time 0.002 (0.567)	Loss 2.7222 (2.4926)	Entropy 0.59016 (0.59147)	Top-1 acc 58.594 (63.813)	Top-5 acc 81.250 (83.978)	lr 0.00664
Train [79][2130/3239]	Time 0.261 (1.100)	Data Time 0.001 (0.565)	Loss 2.3290 (2.4928)	Entropy 0.58991 (0.59147)	Top-1 acc 67.969 (63.810)	Top-5 acc 84.766 (83.973)	lr 0.00663
Train [79][2140/3239]	Time 0.253 (1.097)	Data Time 0.001 (0.562)	Loss 2.7198 (2.4929)	Entropy 0.59010 (0.59146)	Top-1 acc 62.500 (63.810)	Top-5 acc 80.469 (83.967)	lr 0.00663
Train [79][2150/3239]	Time 4.569 (1.098)	Data Time 4.296 (0.563)	Loss 2.5485 (2.4932)	Entropy 0.59021 (0.59145)	Top-1 acc 61.328 (63.804)	Top-5 acc 79.297 (83.959)	lr 0.00663
Train [79][2160/3239]	Time 0.859 (1.098)	Data Time 0.512 (0.563)	Loss 2.4833 (2.4931)	Entropy 0.59015 (0.59145)	Top-1 acc 64.453 (63.804)	Top-5 acc 83.203 (83.958)	lr 0.00663
Train [79][2170/3239]	Time 0.243 (1.097)	Data Time 0.001 (0.563)	Loss 2.5336 (2.4931)	Entropy 0.59015 (0.59144)	Top-1 acc 62.500 (63.804)	Top-5 acc 82.031 (83.959)	lr 0.00663
Train [79][2180/3239]	Time 1.499 (1.098)	Data Time 1.246 (0.565)	Loss 2.5719 (2.4931)	Entropy 0.59012 (0.59143)	Top-1 acc 61.719 (63.803)	Top-5 acc 82.422 (83.959)	lr 0.00663
Train [79][2190/3239]	Time 0.239 (1.100)	Data Time 0.001 (0.567)	Loss 2.5329 (2.4932)	Entropy 0.59011 (0.59143)	Top-1 acc 62.500 (63.802)	Top-5 acc 85.156 (83.958)	lr 0.00663
Train [79][2200/3239]	Time 0.235 (1.099)	Data Time 0.001 (0.566)	Loss 2.3475 (2.4931)	Entropy 0.58961 (0.59142)	Top-1 acc 68.359 (63.805)	Top-5 acc 85.938 (83.959)	lr 0.00663
Train [79][2210/3239]	Time 0.243 (1.098)	Data Time 0.001 (0.565)	Loss 2.7386 (2.4929)	Entropy 0.58918 (0.59141)	Top-1 acc 58.984 (63.807)	Top-5 acc 78.125 (83.964)	lr 0.00663
Train [79][2220/3239]	Time 1.305 (1.102)	Data Time 1.048 (0.570)	Loss 2.3494 (2.4930)	Entropy 0.58898 (0.59140)	Top-1 acc 64.844 (63.807)	Top-5 acc 87.109 (83.966)	lr 0.00663
Train [79][2230/3239]	Time 0.667 (1.099)	Data Time 0.371 (0.568)	Loss 2.5409 (2.4928)	Entropy 0.58905 (0.59139)	Top-1 acc 63.672 (63.812)	Top-5 acc 83.203 (83.969)	lr 0.00663
Train [79][2240/3239]	Time 3.057 (1.099)	Data Time 2.801 (0.568)	Loss 2.6631 (2.4933)	Entropy 0.58918 (0.59138)	Top-1 acc 60.156 (63.805)	Top-5 acc 78.906 (83.957)	lr 0.00662
Train [79][2250/3239]	Time 2.969 (1.103)	Data Time 2.601 (0.573)	Loss 2.4306 (2.4932)	Entropy 0.58928 (0.59137)	Top-1 acc 67.188 (63.810)	Top-5 acc 84.766 (83.956)	lr 0.00662
Train [79][2260/3239]	Time 0.241 (1.101)	Data Time 0.002 (0.571)	Loss 2.6043 (2.4935)	Entropy 0.58924 (0.59136)	Top-1 acc 58.594 (63.803)	Top-5 acc 81.641 (83.950)	lr 0.00662
Train [79][2270/3239]	Time 0.240 (1.098)	Data Time 0.001 (0.569)	Loss 2.5267 (2.4937)	Entropy 0.58933 (0.59135)	Top-1 acc 62.500 (63.799)	Top-5 acc 85.938 (83.947)	lr 0.00662
Train [79][2280/3239]	Time 0.240 (1.098)	Data Time 0.001 (0.569)	Loss 2.5328 (2.4938)	Entropy 0.58938 (0.59135)	Top-1 acc 63.672 (63.803)	Top-5 acc 82.422 (83.944)	lr 0.00662
Train [79][2290/3239]	Time 0.310 (1.097)	Data Time 0.001 (0.568)	Loss 2.5914 (2.4941)	Entropy 0.58958 (0.59134)	Top-1 acc 59.375 (63.794)	Top-5 acc 81.641 (83.939)	lr 0.00662
Train [79][2300/3239]	Time 0.263 (1.094)	Data Time 0.001 (0.565)	Loss 2.4623 (2.4943)	Entropy 0.58925 (0.59133)	Top-1 acc 65.234 (63.785)	Top-5 acc 82.812 (83.937)	lr 0.00662
Train [79][2310/3239]	Time 0.314 (1.092)	Data Time 0.084 (0.564)	Loss 2.4149 (2.4941)	Entropy 0.58931 (0.59132)	Top-1 acc 62.891 (63.784)	Top-5 acc 85.156 (83.938)	lr 0.00662
Train [79][2320/3239]	Time 0.351 (1.092)	Data Time 0.001 (0.564)	Loss 2.3192 (2.4942)	Entropy 0.58955 (0.59131)	Top-1 acc 65.234 (63.780)	Top-5 acc 87.500 (83.936)	lr 0.00662
Train [79][2330/3239]	Time 0.242 (1.090)	Data Time 0.001 (0.562)	Loss 2.3366 (2.4942)	Entropy 0.58934 (0.59130)	Top-1 acc 69.531 (63.782)	Top-5 acc 86.328 (83.939)	lr 0.00662
Train [79][2340/3239]	Time 0.651 (1.087)	Data Time 0.429 (0.560)	Loss 2.5882 (2.4943)	Entropy 0.58961 (0.59130)	Top-1 acc 64.062 (63.783)	Top-5 acc 82.812 (83.935)	lr 0.00662
Train [79][2350/3239]	Time 0.269 (1.087)	Data Time 0.001 (0.560)	Loss 2.5756 (2.4942)	Entropy 0.58962 (0.59129)	Top-1 acc 60.938 (63.785)	Top-5 acc 80.859 (83.938)	lr 0.00661
Train [79][2360/3239]	Time 0.258 (1.086)	Data Time 0.001 (0.559)	Loss 2.4130 (2.4943)	Entropy 0.58961 (0.59128)	Top-1 acc 67.578 (63.781)	Top-5 acc 86.328 (83.940)	lr 0.00661
Train [79][2370/3239]	Time 0.253 (1.083)	Data Time 0.001 (0.557)	Loss 2.7046 (2.4943)	Entropy 0.58957 (0.59127)	Top-1 acc 58.203 (63.780)	Top-5 acc 81.250 (83.938)	lr 0.00661
Train [79][2380/3239]	Time 0.260 (1.083)	Data Time 0.001 (0.557)	Loss 2.4700 (2.4942)	Entropy 0.58959 (0.59127)	Top-1 acc 63.672 (63.782)	Top-5 acc 84.766 (83.944)	lr 0.00661
Train [79][2390/3239]	Time 0.348 (1.081)	Data Time 0.001 (0.556)	Loss 2.6060 (2.4941)	Entropy 0.58960 (0.59126)	Top-1 acc 62.109 (63.780)	Top-5 acc 84.766 (83.943)	lr 0.00661
Train [79][2400/3239]	Time 0.256 (1.079)	Data Time 0.001 (0.554)	Loss 2.4294 (2.4943)	Entropy 0.58951 (0.59125)	Top-1 acc 64.453 (63.770)	Top-5 acc 83.984 (83.939)	lr 0.00661
Train [79][2410/3239]	Time 1.166 (1.079)	Data Time 0.910 (0.554)	Loss 2.4295 (2.4942)	Entropy 0.58927 (0.59125)	Top-1 acc 66.797 (63.775)	Top-5 acc 85.156 (83.942)	lr 0.00661
Train [79][2420/3239]	Time 0.231 (1.077)	Data Time 0.001 (0.553)	Loss 2.2948 (2.4942)	Entropy 0.58962 (0.59124)	Top-1 acc 71.875 (63.775)	Top-5 acc 86.328 (83.942)	lr 0.00661
Train [79][2430/3239]	Time 1.458 (1.076)	Data Time 1.209 (0.552)	Loss 2.7557 (2.4944)	Entropy 0.58952 (0.59123)	Top-1 acc 57.422 (63.769)	Top-5 acc 82.031 (83.937)	lr 0.00661
Train [79][2440/3239]	Time 0.275 (1.078)	Data Time 0.001 (0.554)	Loss 2.5260 (2.4945)	Entropy 0.58968 (0.59122)	Top-1 acc 60.547 (63.762)	Top-5 acc 82.812 (83.935)	lr 0.00661
Train [79][2450/3239]	Time 3.104 (1.079)	Data Time 2.864 (0.556)	Loss 2.6067 (2.4946)	Entropy 0.58937 (0.59122)	Top-1 acc 58.203 (63.761)	Top-5 acc 82.031 (83.932)	lr 0.00661
Train [79][2460/3239]	Time 0.248 (1.076)	Data Time 0.001 (0.554)	Loss 2.4634 (2.4948)	Entropy 0.58955 (0.59121)	Top-1 acc 64.062 (63.751)	Top-5 acc 84.375 (83.928)	lr 0.00660
Train [79][2470/3239]	Time 1.703 (1.078)	Data Time 1.422 (0.555)	Loss 2.3918 (2.4945)	Entropy 0.58994 (0.59120)	Top-1 acc 68.750 (63.756)	Top-5 acc 85.547 (83.935)	lr 0.00660
Train [79][2480/3239]	Time 0.326 (1.079)	Data Time 0.001 (0.557)	Loss 2.5101 (2.4945)	Entropy 0.58982 (0.59120)	Top-1 acc 63.281 (63.753)	Top-5 acc 84.766 (83.938)	lr 0.00660
Train [79][2490/3239]	Time 0.235 (1.079)	Data Time 0.001 (0.557)	Loss 2.5693 (2.4946)	Entropy 0.59025 (0.59119)	Top-1 acc 62.891 (63.752)	Top-5 acc 83.203 (83.936)	lr 0.00660
Train [79][2500/3239]	Time 6.635 (1.079)	Data Time 6.388 (0.558)	Loss 2.5545 (2.4944)	Entropy 0.59003 (0.59119)	Top-1 acc 62.109 (63.753)	Top-5 acc 83.203 (83.943)	lr 0.00660
Train [79][2510/3239]	Time 0.244 (1.080)	Data Time 0.001 (0.560)	Loss 2.4848 (2.4945)	Entropy 0.59014 (0.59119)	Top-1 acc 62.891 (63.750)	Top-5 acc 85.547 (83.940)	lr 0.00660
Train [79][2520/3239]	Time 0.237 (1.080)	Data Time 0.001 (0.560)	Loss 2.5937 (2.4949)	Entropy 0.59038 (0.59118)	Top-1 acc 63.672 (63.742)	Top-5 acc 82.812 (83.936)	lr 0.00660
Train [79][2530/3239]	Time 0.260 (1.077)	Data Time 0.001 (0.557)	Loss 2.5307 (2.4948)	Entropy 0.58993 (0.59118)	Top-1 acc 64.062 (63.743)	Top-5 acc 83.594 (83.935)	lr 0.00660
Train [79][2540/3239]	Time 0.239 (1.082)	Data Time 0.001 (0.562)	Loss 2.4838 (2.4948)	Entropy 0.58972 (0.59117)	Top-1 acc 64.062 (63.744)	Top-5 acc 83.984 (83.937)	lr 0.00660
Train [79][2550/3239]	Time 0.328 (1.082)	Data Time 0.001 (0.562)	Loss 2.5520 (2.4950)	Entropy 0.58988 (0.59117)	Top-1 acc 62.500 (63.739)	Top-5 acc 82.812 (83.933)	lr 0.00660
Train [79][2560/3239]	Time 0.235 (1.079)	Data Time 0.001 (0.560)	Loss 2.5931 (2.4951)	Entropy 0.59003 (0.59116)	Top-1 acc 61.328 (63.735)	Top-5 acc 82.422 (83.929)	lr 0.00660
Train [79][2570/3239]	Time 3.543 (1.083)	Data Time 3.291 (0.564)	Loss 2.4422 (2.4949)	Entropy 0.59034 (0.59116)	Top-1 acc 64.844 (63.744)	Top-5 acc 84.375 (83.934)	lr 0.00660
Train [79][2580/3239]	Time 0.238 (1.083)	Data Time 0.001 (0.565)	Loss 2.5452 (2.4948)	Entropy 0.58966 (0.59115)	Top-1 acc 60.547 (63.749)	Top-5 acc 85.156 (83.935)	lr 0.00659
Train [79][2590/3239]	Time 0.238 (1.080)	Data Time 0.001 (0.562)	Loss 2.5344 (2.4948)	Entropy 0.58985 (0.59115)	Top-1 acc 62.891 (63.753)	Top-5 acc 81.641 (83.936)	lr 0.00659
Train [79][2600/3239]	Time 0.222 (1.081)	Data Time 0.001 (0.564)	Loss 2.6032 (2.4949)	Entropy 0.59004 (0.59114)	Top-1 acc 58.203 (63.751)	Top-5 acc 82.422 (83.934)	lr 0.00659
Train [79][2610/3239]	Time 3.894 (1.085)	Data Time 3.640 (0.568)	Loss 2.8278 (2.4950)	Entropy 0.59022 (0.59114)	Top-1 acc 58.203 (63.751)	Top-5 acc 80.469 (83.932)	lr 0.00659
Train [79][2620/3239]	Time 0.246 (1.083)	Data Time 0.001 (0.566)	Loss 2.5041 (2.4950)	Entropy 0.59032 (0.59114)	Top-1 acc 65.234 (63.751)	Top-5 acc 84.766 (83.934)	lr 0.00659
Train [79][2630/3239]	Time 2.065 (1.081)	Data Time 1.825 (0.565)	Loss 2.3502 (2.4950)	Entropy 0.59042 (0.59113)	Top-1 acc 68.750 (63.753)	Top-5 acc 84.766 (83.936)	lr 0.00659
Train [79][2640/3239]	Time 0.266 (1.085)	Data Time 0.001 (0.569)	Loss 2.7072 (2.4951)	Entropy 0.59044 (0.59113)	Top-1 acc 58.984 (63.750)	Top-5 acc 78.906 (83.933)	lr 0.00659
Train [79][2650/3239]	Time 0.229 (1.085)	Data Time 0.001 (0.569)	Loss 2.3982 (2.4948)	Entropy 0.59059 (0.59113)	Top-1 acc 65.234 (63.756)	Top-5 acc 85.938 (83.938)	lr 0.00659
Train [79][2660/3239]	Time 0.247 (1.082)	Data Time 0.001 (0.567)	Loss 2.4196 (2.4948)	Entropy 0.59078 (0.59113)	Top-1 acc 64.453 (63.756)	Top-5 acc 85.547 (83.940)	lr 0.00659
Train [79][2670/3239]	Time 8.592 (1.087)	Data Time 8.344 (0.571)	Loss 2.2016 (2.4948)	Entropy 0.59056 (0.59113)	Top-1 acc 71.484 (63.753)	Top-5 acc 87.891 (83.936)	lr 0.00659
Train [79][2680/3239]	Time 0.227 (1.087)	Data Time 0.001 (0.572)	Loss 2.5959 (2.4949)	Entropy 0.59047 (0.59112)	Top-1 acc 59.766 (63.753)	Top-5 acc 81.641 (83.934)	lr 0.00659
Train [79][2690/3239]	Time 0.270 (1.084)	Data Time 0.001 (0.570)	Loss 2.6381 (2.4950)	Entropy 0.59034 (0.59112)	Top-1 acc 61.719 (63.752)	Top-5 acc 80.078 (83.932)	lr 0.00658
Train [79][2700/3239]	Time 0.435 (1.106)	Data Time 0.006 (0.571)	Loss 2.5894 (2.4950)	Entropy 0.59033 (0.59112)	Top-1 acc 60.547 (63.749)	Top-5 acc 80.469 (83.928)	lr 0.00658
Train [79][2710/3239]	Time 0.348 (1.104)	Data Time 0.002 (0.569)	Loss 2.4909 (2.4950)	Entropy 0.59006 (0.59111)	Top-1 acc 63.672 (63.756)	Top-5 acc 81.250 (83.929)	lr 0.00658
Train [79][2720/3239]	Time 0.240 (1.101)	Data Time 0.002 (0.567)	Loss 2.5017 (2.4952)	Entropy 0.59027 (0.59111)	Top-1 acc 61.719 (63.750)	Top-5 acc 84.375 (83.929)	lr 0.00658
Train [79][2730/3239]	Time 0.249 (1.099)	Data Time 0.001 (0.565)	Loss 2.4409 (2.4953)	Entropy 0.59015 (0.59111)	Top-1 acc 64.844 (63.751)	Top-5 acc 85.547 (83.929)	lr 0.00658
Train [79][2740/3239]	Time 0.281 (1.097)	Data Time 0.002 (0.563)	Loss 2.2588 (2.4949)	Entropy 0.59034 (0.59110)	Top-1 acc 64.453 (63.755)	Top-5 acc 89.062 (83.935)	lr 0.00658
Train [79][2750/3239]	Time 0.239 (1.094)	Data Time 0.001 (0.561)	Loss 2.6034 (2.4952)	Entropy 0.59047 (0.59110)	Top-1 acc 65.625 (63.750)	Top-5 acc 81.250 (83.932)	lr 0.00658
Train [79][2760/3239]	Time 0.266 (1.092)	Data Time 0.001 (0.559)	Loss 2.5577 (2.4949)	Entropy 0.59036 (0.59110)	Top-1 acc 64.062 (63.758)	Top-5 acc 79.688 (83.934)	lr 0.00658
Train [79][2770/3239]	Time 2.195 (1.093)	Data Time 1.949 (0.561)	Loss 2.6287 (2.4950)	Entropy 0.59043 (0.59110)	Top-1 acc 59.375 (63.754)	Top-5 acc 82.422 (83.934)	lr 0.00658
Train [79][2780/3239]	Time 0.267 (1.092)	Data Time 0.001 (0.560)	Loss 2.5722 (2.4950)	Entropy 0.59067 (0.59110)	Top-1 acc 62.109 (63.754)	Top-5 acc 82.031 (83.936)	lr 0.00658
Train [79][2790/3239]	Time 0.228 (1.090)	Data Time 0.001 (0.558)	Loss 2.4856 (2.4948)	Entropy 0.59092 (0.59109)	Top-1 acc 64.062 (63.762)	Top-5 acc 82.031 (83.936)	lr 0.00658
Train [79][2800/3239]	Time 0.377 (1.095)	Data Time 0.001 (0.563)	Loss 2.5960 (2.4950)	Entropy 0.59088 (0.59109)	Top-1 acc 58.203 (63.753)	Top-5 acc 83.594 (83.934)	lr 0.00657
Train [79][2810/3239]	Time 0.244 (1.095)	Data Time 0.001 (0.563)	Loss 2.5379 (2.4949)	Entropy 0.59049 (0.59109)	Top-1 acc 62.500 (63.757)	Top-5 acc 83.984 (83.937)	lr 0.00657
Train [79][2820/3239]	Time 0.247 (1.093)	Data Time 0.001 (0.561)	Loss 2.5710 (2.4949)	Entropy 0.59052 (0.59109)	Top-1 acc 60.156 (63.759)	Top-5 acc 83.594 (83.938)	lr 0.00657
Train [79][2830/3239]	Time 0.243 (1.097)	Data Time 0.001 (0.567)	Loss 2.5005 (2.4949)	Entropy 0.59055 (0.59109)	Top-1 acc 64.453 (63.760)	Top-5 acc 80.859 (83.937)	lr 0.00657
Train [79][2840/3239]	Time 0.253 (1.099)	Data Time 0.001 (0.568)	Loss 2.5636 (2.4946)	Entropy 0.59083 (0.59109)	Top-1 acc 61.328 (63.766)	Top-5 acc 83.984 (83.943)	lr 0.00657
Train [79][2850/3239]	Time 0.259 (1.096)	Data Time 0.001 (0.566)	Loss 2.4480 (2.4945)	Entropy 0.59088 (0.59109)	Top-1 acc 66.797 (63.771)	Top-5 acc 83.594 (83.944)	lr 0.00657
Train [79][2860/3239]	Time 18.391 (1.100)	Data Time 18.143 (0.571)	Loss 2.4133 (2.4945)	Entropy 0.59059 (0.59108)	Top-1 acc 65.234 (63.770)	Top-5 acc 85.156 (83.944)	lr 0.00657
Train [79][2870/3239]	Time 0.329 (1.102)	Data Time 0.001 (0.572)	Loss 2.5922 (2.4945)	Entropy 0.59068 (0.59108)	Top-1 acc 61.719 (63.773)	Top-5 acc 82.031 (83.944)	lr 0.00657
Train [79][2880/3239]	Time 0.235 (1.099)	Data Time 0.001 (0.570)	Loss 2.6322 (2.4944)	Entropy 0.59078 (0.59108)	Top-1 acc 61.719 (63.778)	Top-5 acc 79.297 (83.943)	lr 0.00657
Train [79][2890/3239]	Time 0.241 (1.097)	Data Time 0.001 (0.568)	Loss 2.4125 (2.4945)	Entropy 0.59044 (0.59108)	Top-1 acc 66.016 (63.772)	Top-5 acc 84.375 (83.939)	lr 0.00657
Train [79][2900/3239]	Time 0.250 (1.103)	Data Time 0.001 (0.574)	Loss 2.3788 (2.4945)	Entropy 0.59045 (0.59108)	Top-1 acc 66.016 (63.770)	Top-5 acc 86.719 (83.939)	lr 0.00657
Train [79][2910/3239]	Time 0.252 (1.102)	Data Time 0.001 (0.574)	Loss 2.5555 (2.4949)	Entropy 0.59068 (0.59108)	Top-1 acc 64.453 (63.759)	Top-5 acc 82.422 (83.934)	lr 0.00656
Train [79][2920/3239]	Time 0.253 (1.100)	Data Time 0.002 (0.572)	Loss 2.5329 (2.4951)	Entropy 0.59036 (0.59107)	Top-1 acc 61.719 (63.758)	Top-5 acc 83.984 (83.930)	lr 0.00656
Train [79][2930/3239]	Time 0.288 (1.107)	Data Time 0.001 (0.579)	Loss 2.3480 (2.4950)	Entropy 0.59005 (0.59107)	Top-1 acc 69.141 (63.759)	Top-5 acc 85.547 (83.928)	lr 0.00656
Train [79][2940/3239]	Time 0.238 (1.105)	Data Time 0.001 (0.578)	Loss 2.2875 (2.4951)	Entropy 0.58980 (0.59107)	Top-1 acc 67.969 (63.756)	Top-5 acc 85.938 (83.927)	lr 0.00656
Train [79][2950/3239]	Time 0.263 (1.103)	Data Time 0.001 (0.576)	Loss 2.6073 (2.4953)	Entropy 0.58983 (0.59106)	Top-1 acc 59.375 (63.754)	Top-5 acc 81.641 (83.925)	lr 0.00656
Train [79][2960/3239]	Time 0.272 (1.107)	Data Time 0.003 (0.581)	Loss 2.5547 (2.4954)	Entropy 0.58951 (0.59106)	Top-1 acc 62.891 (63.756)	Top-5 acc 81.641 (83.921)	lr 0.00656
Train [79][2970/3239]	Time 0.231 (1.106)	Data Time 0.001 (0.579)	Loss 2.7828 (2.4957)	Entropy 0.58941 (0.59105)	Top-1 acc 58.203 (63.745)	Top-5 acc 78.125 (83.916)	lr 0.00656
Train [79][2980/3239]	Time 0.261 (1.104)	Data Time 0.003 (0.577)	Loss 2.4806 (2.4957)	Entropy 0.58947 (0.59105)	Top-1 acc 64.844 (63.742)	Top-5 acc 85.938 (83.920)	lr 0.00656
Train [79][2990/3239]	Time 0.376 (1.107)	Data Time 0.130 (0.581)	Loss 2.3216 (2.4954)	Entropy 0.58949 (0.59104)	Top-1 acc 67.969 (63.751)	Top-5 acc 87.891 (83.928)	lr 0.00656
Train [79][3000/3239]	Time 0.282 (1.108)	Data Time 0.001 (0.583)	Loss 2.4857 (2.4954)	Entropy 0.58975 (0.59104)	Top-1 acc 60.938 (63.748)	Top-5 acc 82.422 (83.927)	lr 0.00656
Train [79][3010/3239]	Time 0.272 (1.106)	Data Time 0.001 (0.581)	Loss 2.4635 (2.4954)	Entropy 0.59003 (0.59103)	Top-1 acc 66.406 (63.747)	Top-5 acc 83.203 (83.929)	lr 0.00656
Train [79][3020/3239]	Time 14.766 (1.110)	Data Time 14.466 (0.585)	Loss 2.2207 (2.4952)	Entropy 0.58982 (0.59103)	Top-1 acc 70.312 (63.750)	Top-5 acc 88.281 (83.933)	lr 0.00656
Train [79][3030/3239]	Time 0.365 (1.112)	Data Time 0.001 (0.587)	Loss 2.5867 (2.4955)	Entropy 0.58973 (0.59103)	Top-1 acc 60.156 (63.743)	Top-5 acc 80.469 (83.929)	lr 0.00655
Train [79][3040/3239]	Time 0.254 (1.110)	Data Time 0.001 (0.585)	Loss 2.6016 (2.4955)	Entropy 0.58980 (0.59102)	Top-1 acc 59.375 (63.743)	Top-5 acc 82.812 (83.930)	lr 0.00655
Train [79][3050/3239]	Time 0.227 (1.108)	Data Time 0.001 (0.584)	Loss 2.2484 (2.4953)	Entropy 0.59013 (0.59102)	Top-1 acc 72.656 (63.748)	Top-5 acc 87.109 (83.932)	lr 0.00655
Train [79][3060/3239]	Time 0.236 (1.113)	Data Time 0.001 (0.589)	Loss 2.6714 (2.4953)	Entropy 0.58981 (0.59102)	Top-1 acc 58.984 (63.749)	Top-5 acc 78.906 (83.928)	lr 0.00655
Train [79][3070/3239]	Time 0.236 (1.110)	Data Time 0.001 (0.587)	Loss 2.3709 (2.4953)	Entropy 0.59000 (0.59101)	Top-1 acc 62.109 (63.747)	Top-5 acc 86.328 (83.930)	lr 0.00655
Train [79][3080/3239]	Time 0.248 (1.108)	Data Time 0.001 (0.585)	Loss 2.7229 (2.4954)	Entropy 0.58960 (0.59101)	Top-1 acc 60.938 (63.745)	Top-5 acc 77.734 (83.925)	lr 0.00655
Train [79][3090/3239]	Time 0.243 (1.112)	Data Time 0.001 (0.589)	Loss 2.6080 (2.4955)	Entropy 0.58988 (0.59100)	Top-1 acc 62.891 (63.741)	Top-5 acc 78.906 (83.928)	lr 0.00655
Train [79][3100/3239]	Time 0.360 (1.111)	Data Time 0.001 (0.588)	Loss 2.2963 (2.4954)	Entropy 0.58980 (0.59100)	Top-1 acc 67.969 (63.738)	Top-5 acc 88.672 (83.928)	lr 0.00655
Train [79][3110/3239]	Time 0.233 (1.109)	Data Time 0.001 (0.586)	Loss 2.4053 (2.4955)	Entropy 0.58975 (0.59100)	Top-1 acc 64.844 (63.733)	Top-5 acc 86.719 (83.930)	lr 0.00655
Train [79][3120/3239]	Time 0.239 (1.113)	Data Time 0.001 (0.591)	Loss 2.5323 (2.4956)	Entropy 0.58966 (0.59099)	Top-1 acc 66.016 (63.729)	Top-5 acc 82.422 (83.927)	lr 0.00655
Train [79][3130/3239]	Time 1.686 (1.112)	Data Time 1.388 (0.590)	Loss 2.6196 (2.4956)	Entropy 0.58966 (0.59099)	Top-1 acc 58.984 (63.731)	Top-5 acc 81.250 (83.927)	lr 0.00655
Train [79][3140/3239]	Time 0.245 (1.110)	Data Time 0.001 (0.588)	Loss 2.7477 (2.4957)	Entropy 0.58964 (0.59098)	Top-1 acc 59.375 (63.731)	Top-5 acc 78.516 (83.925)	lr 0.00654
Train [79][3150/3239]	Time 0.247 (1.111)	Data Time 0.002 (0.590)	Loss 2.3399 (2.4955)	Entropy 0.58958 (0.59098)	Top-1 acc 65.625 (63.735)	Top-5 acc 85.547 (83.925)	lr 0.00654
Train [79][3160/3239]	Time 0.277 (1.111)	Data Time 0.001 (0.590)	Loss 2.5586 (2.4955)	Entropy 0.58939 (0.59097)	Top-1 acc 66.797 (63.734)	Top-5 acc 83.203 (83.924)	lr 0.00654
Train [79][3170/3239]	Time 0.233 (1.110)	Data Time 0.001 (0.589)	Loss 2.4177 (2.4955)	Entropy 0.58931 (0.59097)	Top-1 acc 66.016 (63.735)	Top-5 acc 84.375 (83.924)	lr 0.00654
Train [79][3180/3239]	Time 8.144 (1.112)	Data Time 7.900 (0.591)	Loss 2.4014 (2.4955)	Entropy 0.58923 (0.59096)	Top-1 acc 69.141 (63.735)	Top-5 acc 87.109 (83.924)	lr 0.00654
Train [79][3190/3239]	Time 0.374 (1.112)	Data Time 0.000 (0.591)	Loss 2.7405 (2.4954)	Entropy 0.58942 (0.59096)	Top-1 acc 57.031 (63.739)	Top-5 acc 79.688 (83.925)	lr 0.00654
Train [79][3200/3239]	Time 0.237 (1.111)	Data Time 0.000 (0.591)	Loss 2.7210 (2.4954)	Entropy 0.58932 (0.59095)	Top-1 acc 59.375 (63.740)	Top-5 acc 78.125 (83.923)	lr 0.00654
Train [79][3210/3239]	Time 0.236 (1.109)	Data Time 0.000 (0.589)	Loss 2.3354 (2.4954)	Entropy 0.58967 (0.59095)	Top-1 acc 65.625 (63.738)	Top-5 acc 89.453 (83.925)	lr 0.00654
Train [79][3220/3239]	Time 0.270 (1.111)	Data Time 0.000 (0.592)	Loss 2.6249 (2.4954)	Entropy 0.58991 (0.59095)	Top-1 acc 60.938 (63.739)	Top-5 acc 83.594 (83.928)	lr 0.00654
Train [79][3230/3239]	Time 2.971 (1.110)	Data Time 2.725 (0.591)	Loss 2.5374 (2.4953)	Entropy 0.58984 (0.59094)	Top-1 acc 62.500 (63.741)	Top-5 acc 80.859 (83.929)	lr 0.00654
Train [79][3239/3239]	Time 0.931 (1.108)	Data Time 0.000 (0.589)	Loss 2.4901 (2.4952)	Entropy 0.58968 (0.59094)	Top-1 acc 59.259 (63.742)	Top-5 acc 81.481 (83.929)	lr 0.00654
==========Valid [79/120]	loss 1.292	top-1 acc 70.285 (70.285)	top-5 acc 89.175	Train top-1 63.742	top-5 83.929	Entropy 0.58968	Latency-None: 0.000ms	Flops: 539.00M
Train [80][0/3239]	Time 62.090 (62.090)	Data Time 60.280 (60.280)	Loss 2.4091 (2.4091)	Entropy 0.58955 (0.58955)	Top-1 acc 66.406 (66.406)	Top-5 acc 87.109 (87.109)	lr 0.00654
Train [80][10/3239]	Time 0.251 (6.040)	Data Time 0.001 (5.482)	Loss 2.4722 (2.5078)	Entropy 0.58967 (0.58957)	Top-1 acc 61.328 (63.033)	Top-5 acc 83.984 (84.411)	lr 0.00653
Train [80][20/3239]	Time 0.273 (3.364)	Data Time 0.001 (2.872)	Loss 2.4364 (2.4992)	Entropy 0.58945 (0.58957)	Top-1 acc 66.016 (63.151)	Top-5 acc 86.719 (84.022)	lr 0.00653
Train [80][30/3239]	Time 0.247 (2.418)	Data Time 0.001 (1.946)	Loss 2.4259 (2.5015)	Entropy 0.58933 (0.58950)	Top-1 acc 63.281 (63.117)	Top-5 acc 87.109 (83.909)	lr 0.00653
Train [80][40/3239]	Time 0.246 (2.182)	Data Time 0.001 (1.715)	Loss 2.5052 (2.5016)	Entropy 0.58884 (0.58941)	Top-1 acc 64.453 (63.014)	Top-5 acc 85.547 (83.937)	lr 0.00653
Train [80][50/3239]	Time 0.243 (1.838)	Data Time 0.001 (1.379)	Loss 2.2657 (2.5002)	Entropy 0.58879 (0.58930)	Top-1 acc 67.969 (63.197)	Top-5 acc 88.281 (83.992)	lr 0.00653
Train [80][60/3239]	Time 0.239 (1.604)	Data Time 0.001 (1.153)	Loss 2.6927 (2.5053)	Entropy 0.58878 (0.58920)	Top-1 acc 57.422 (63.224)	Top-5 acc 79.688 (83.831)	lr 0.00653
Train [80][70/3239]	Time 0.258 (1.592)	Data Time 0.002 (1.141)	Loss 2.6030 (2.5038)	Entropy 0.58903 (0.58915)	Top-1 acc 62.500 (63.419)	Top-5 acc 82.812 (83.885)	lr 0.00653
Train [80][80/3239]	Time 0.252 (1.450)	Data Time 0.001 (1.000)	Loss 2.4889 (2.5015)	Entropy 0.58875 (0.58912)	Top-1 acc 62.500 (63.368)	Top-5 acc 85.547 (83.907)	lr 0.00653
Train [80][90/3239]	Time 0.365 (1.338)	Data Time 0.001 (0.890)	Loss 2.6898 (2.5009)	Entropy 0.58873 (0.58908)	Top-1 acc 61.328 (63.423)	Top-5 acc 76.953 (83.929)	lr 0.00653
Train [80][100/3239]	Time 2.281 (1.365)	Data Time 2.017 (0.918)	Loss 2.4198 (2.4946)	Entropy 0.58882 (0.58905)	Top-1 acc 67.969 (63.718)	Top-5 acc 83.594 (84.054)	lr 0.00653
Train [80][110/3239]	Time 0.236 (1.280)	Data Time 0.001 (0.835)	Loss 2.3926 (2.4957)	Entropy 0.58843 (0.58902)	Top-1 acc 64.062 (63.682)	Top-5 acc 84.375 (84.002)	lr 0.00653
Train [80][120/3239]	Time 0.243 (1.679)	Data Time 0.002 (0.767)	Loss 2.4601 (2.4983)	Entropy 0.58831 (0.58897)	Top-1 acc 66.016 (63.569)	Top-5 acc 85.156 (84.007)	lr 0.00652
Train [80][130/3239]	Time 0.249 (1.582)	Data Time 0.002 (0.708)	Loss 2.3965 (2.4953)	Entropy 0.58811 (0.58891)	Top-1 acc 67.578 (63.684)	Top-5 acc 85.156 (84.062)	lr 0.00652
Train [80][140/3239]	Time 0.231 (1.501)	Data Time 0.001 (0.658)	Loss 2.5614 (2.4958)	Entropy 0.58810 (0.58886)	Top-1 acc 62.109 (63.578)	Top-5 acc 82.812 (84.012)	lr 0.00652
Train [80][150/3239]	Time 0.236 (1.429)	Data Time 0.002 (0.615)	Loss 2.5132 (2.4977)	Entropy 0.58789 (0.58880)	Top-1 acc 67.188 (63.592)	Top-5 acc 83.203 (83.946)	lr 0.00652
Train [80][160/3239]	Time 0.242 (1.367)	Data Time 0.001 (0.577)	Loss 2.4359 (2.4935)	Entropy 0.58789 (0.58875)	Top-1 acc 65.625 (63.708)	Top-5 acc 86.719 (84.040)	lr 0.00652
Train [80][170/3239]	Time 0.249 (1.312)	Data Time 0.001 (0.543)	Loss 2.7116 (2.4924)	Entropy 0.58785 (0.58870)	Top-1 acc 55.859 (63.720)	Top-5 acc 80.078 (84.078)	lr 0.00652
Train [80][180/3239]	Time 0.377 (1.263)	Data Time 0.001 (0.513)	Loss 2.6993 (2.4929)	Entropy 0.58759 (0.58865)	Top-1 acc 60.156 (63.696)	Top-5 acc 78.906 (84.075)	lr 0.00652
Train [80][190/3239]	Time 0.243 (1.220)	Data Time 0.001 (0.486)	Loss 2.4368 (2.4923)	Entropy 0.58770 (0.58860)	Top-1 acc 65.234 (63.688)	Top-5 acc 84.766 (84.054)	lr 0.00652
Train [80][200/3239]	Time 0.536 (1.184)	Data Time 0.294 (0.464)	Loss 2.4728 (2.4913)	Entropy 0.58767 (0.58855)	Top-1 acc 65.625 (63.779)	Top-5 acc 84.375 (84.054)	lr 0.00652
Train [80][210/3239]	Time 1.132 (1.159)	Data Time 0.886 (0.453)	Loss 2.5956 (2.4918)	Entropy 0.58795 (0.58851)	Top-1 acc 55.078 (63.753)	Top-5 acc 83.203 (84.058)	lr 0.00652
Train [80][220/3239]	Time 0.271 (1.161)	Data Time 0.002 (0.467)	Loss 2.3884 (2.4907)	Entropy 0.58775 (0.58849)	Top-1 acc 65.625 (63.794)	Top-5 acc 85.938 (84.069)	lr 0.00652
Train [80][230/3239]	Time 0.237 (1.144)	Data Time 0.001 (0.460)	Loss 2.4400 (2.4934)	Entropy 0.58820 (0.58846)	Top-1 acc 65.625 (63.731)	Top-5 acc 85.938 (84.006)	lr 0.00652
Train [80][240/3239]	Time 0.229 (1.120)	Data Time 0.001 (0.447)	Loss 2.6636 (2.4932)	Entropy 0.58819 (0.58845)	Top-1 acc 58.203 (63.782)	Top-5 acc 81.250 (84.007)	lr 0.00651
Train [80][250/3239]	Time 0.330 (1.134)	Data Time 0.001 (0.470)	Loss 2.3263 (2.4921)	Entropy 0.58832 (0.58844)	Top-1 acc 68.750 (63.838)	Top-5 acc 85.547 (83.997)	lr 0.00651
Train [80][260/3239]	Time 0.255 (1.119)	Data Time 0.001 (0.464)	Loss 2.3287 (2.4919)	Entropy 0.58831 (0.58844)	Top-1 acc 67.969 (63.847)	Top-5 acc 87.500 (83.993)	lr 0.00651
Train [80][270/3239]	Time 0.252 (1.094)	Data Time 0.001 (0.447)	Loss 2.2475 (2.4913)	Entropy 0.58823 (0.58843)	Top-1 acc 69.922 (63.903)	Top-5 acc 87.500 (84.000)	lr 0.00651
Train [80][280/3239]	Time 0.238 (1.103)	Data Time 0.002 (0.463)	Loss 2.4761 (2.4915)	Entropy 0.58833 (0.58842)	Top-1 acc 63.281 (63.883)	Top-5 acc 86.719 (84.009)	lr 0.00651
Train [80][290/3239]	Time 1.576 (1.088)	Data Time 1.262 (0.455)	Loss 2.3375 (2.4888)	Entropy 0.58828 (0.58842)	Top-1 acc 70.312 (63.994)	Top-5 acc 88.281 (84.074)	lr 0.00651
Train [80][300/3239]	Time 0.236 (1.070)	Data Time 0.001 (0.444)	Loss 2.5257 (2.4885)	Entropy 0.58840 (0.58842)	Top-1 acc 62.891 (64.011)	Top-5 acc 82.812 (84.062)	lr 0.00651
Train [80][310/3239]	Time 0.264 (1.083)	Data Time 0.002 (0.463)	Loss 2.4805 (2.4872)	Entropy 0.58873 (0.58842)	Top-1 acc 61.719 (64.054)	Top-5 acc 84.766 (84.091)	lr 0.00651
Train [80][320/3239]	Time 0.381 (1.067)	Data Time 0.001 (0.451)	Loss 2.3612 (2.4872)	Entropy 0.58847 (0.58843)	Top-1 acc 66.797 (64.043)	Top-5 acc 85.547 (84.066)	lr 0.00651
Train [80][330/3239]	Time 0.241 (1.058)	Data Time 0.001 (0.448)	Loss 2.3436 (2.4864)	Entropy 0.58857 (0.58843)	Top-1 acc 66.016 (64.032)	Top-5 acc 87.891 (84.079)	lr 0.00651
Train [80][340/3239]	Time 2.895 (1.051)	Data Time 2.632 (0.447)	Loss 2.5086 (2.4853)	Entropy 0.58829 (0.58843)	Top-1 acc 64.453 (64.054)	Top-5 acc 82.422 (84.083)	lr 0.00651
Train [80][350/3239]	Time 0.236 (1.061)	Data Time 0.001 (0.461)	Loss 2.3520 (2.4851)	Entropy 0.58807 (0.58843)	Top-1 acc 66.797 (64.074)	Top-5 acc 84.375 (84.076)	lr 0.00650
Train [80][360/3239]	Time 0.627 (1.043)	Data Time 0.366 (0.450)	Loss 2.4004 (2.4854)	Entropy 0.58830 (0.58842)	Top-1 acc 66.406 (64.045)	Top-5 acc 85.547 (84.067)	lr 0.00650
Train [80][370/3239]	Time 0.236 (1.037)	Data Time 0.002 (0.448)	Loss 2.7483 (2.4877)	Entropy 0.58804 (0.58841)	Top-1 acc 56.641 (63.972)	Top-5 acc 76.953 (84.041)	lr 0.00650
Train [80][380/3239]	Time 0.299 (1.047)	Data Time 0.001 (0.461)	Loss 2.3598 (2.4865)	Entropy 0.58804 (0.58840)	Top-1 acc 62.500 (63.968)	Top-5 acc 86.328 (84.044)	lr 0.00650
Train [80][390/3239]	Time 0.253 (1.032)	Data Time 0.002 (0.449)	Loss 2.3778 (2.4863)	Entropy 0.58736 (0.58839)	Top-1 acc 69.141 (63.992)	Top-5 acc 86.719 (84.031)	lr 0.00650
Train [80][400/3239]	Time 0.243 (1.023)	Data Time 0.001 (0.444)	Loss 2.4311 (2.4850)	Entropy 0.58705 (0.58836)	Top-1 acc 64.453 (64.025)	Top-5 acc 85.547 (84.055)	lr 0.00650
Train [80][410/3239]	Time 0.331 (1.040)	Data Time 0.001 (0.464)	Loss 2.5253 (2.4846)	Entropy 0.58733 (0.58833)	Top-1 acc 62.500 (64.024)	Top-5 acc 83.203 (84.072)	lr 0.00650
Train [80][420/3239]	Time 0.234 (1.026)	Data Time 0.001 (0.453)	Loss 2.4945 (2.4848)	Entropy 0.58716 (0.58831)	Top-1 acc 64.453 (64.021)	Top-5 acc 82.812 (84.076)	lr 0.00650
Train [80][430/3239]	Time 0.235 (1.018)	Data Time 0.001 (0.450)	Loss 2.8334 (2.4851)	Entropy 0.58715 (0.58828)	Top-1 acc 57.031 (64.009)	Top-5 acc 76.562 (84.072)	lr 0.00650
Train [80][440/3239]	Time 2.110 (1.034)	Data Time 1.877 (0.468)	Loss 2.4900 (2.4843)	Entropy 0.58709 (0.58825)	Top-1 acc 59.766 (64.025)	Top-5 acc 84.766 (84.086)	lr 0.00650
Train [80][450/3239]	Time 0.236 (1.021)	Data Time 0.001 (0.458)	Loss 2.2747 (2.4827)	Entropy 0.58743 (0.58823)	Top-1 acc 68.359 (64.080)	Top-5 acc 86.328 (84.119)	lr 0.00650
Train [80][460/3239]	Time 0.253 (1.007)	Data Time 0.001 (0.448)	Loss 2.5705 (2.4834)	Entropy 0.58754 (0.58821)	Top-1 acc 56.641 (64.051)	Top-5 acc 80.859 (84.096)	lr 0.00649
Train [80][470/3239]	Time 0.591 (1.020)	Data Time 0.355 (0.464)	Loss 2.4738 (2.4831)	Entropy 0.58742 (0.58820)	Top-1 acc 63.672 (64.038)	Top-5 acc 84.375 (84.099)	lr 0.00649
Train [80][480/3239]	Time 0.364 (1.017)	Data Time 0.001 (0.463)	Loss 2.5153 (2.4824)	Entropy 0.58724 (0.58818)	Top-1 acc 66.406 (64.065)	Top-5 acc 82.812 (84.108)	lr 0.00649
Train [80][490/3239]	Time 0.238 (1.007)	Data Time 0.001 (0.456)	Loss 2.4240 (2.4832)	Entropy 0.58745 (0.58816)	Top-1 acc 65.234 (64.050)	Top-5 acc 85.547 (84.097)	lr 0.00649
Train [80][500/3239]	Time 0.233 (1.006)	Data Time 0.001 (0.458)	Loss 2.3572 (2.4852)	Entropy 0.58745 (0.58815)	Top-1 acc 66.016 (63.995)	Top-5 acc 89.062 (84.069)	lr 0.00649
Train [80][510/3239]	Time 0.230 (1.018)	Data Time 0.001 (0.472)	Loss 2.3626 (2.4842)	Entropy 0.58743 (0.58813)	Top-1 acc 67.578 (64.035)	Top-5 acc 87.500 (84.081)	lr 0.00649
Train [80][520/3239]	Time 0.230 (1.006)	Data Time 0.001 (0.463)	Loss 2.5959 (2.4844)	Entropy 0.58712 (0.58812)	Top-1 acc 60.938 (64.027)	Top-5 acc 80.859 (84.063)	lr 0.00649
Train [80][530/3239]	Time 0.238 (1.005)	Data Time 0.002 (0.464)	Loss 2.3463 (2.4848)	Entropy 0.58720 (0.58810)	Top-1 acc 66.016 (63.994)	Top-5 acc 87.500 (84.056)	lr 0.00649
Train [80][540/3239]	Time 5.889 (1.020)	Data Time 5.648 (0.482)	Loss 2.4511 (2.4843)	Entropy 0.58728 (0.58808)	Top-1 acc 66.016 (64.012)	Top-5 acc 82.812 (84.051)	lr 0.00649
Train [80][550/3239]	Time 0.235 (1.009)	Data Time 0.001 (0.473)	Loss 2.6689 (2.4840)	Entropy 0.58677 (0.58806)	Top-1 acc 63.281 (64.028)	Top-5 acc 80.078 (84.054)	lr 0.00649
Train [80][560/3239]	Time 0.233 (1.014)	Data Time 0.001 (0.480)	Loss 2.4204 (2.4840)	Entropy 0.58675 (0.58804)	Top-1 acc 65.625 (64.044)	Top-5 acc 87.500 (84.062)	lr 0.00649
Train [80][570/3239]	Time 0.384 (1.022)	Data Time 0.002 (0.490)	Loss 2.5858 (2.4846)	Entropy 0.58676 (0.58801)	Top-1 acc 58.203 (64.003)	Top-5 acc 83.203 (84.055)	lr 0.00648
Train [80][580/3239]	Time 0.270 (1.025)	Data Time 0.001 (0.494)	Loss 2.3223 (2.4847)	Entropy 0.58693 (0.58799)	Top-1 acc 66.797 (63.995)	Top-5 acc 87.500 (84.052)	lr 0.00648
Train [80][590/3239]	Time 0.261 (1.021)	Data Time 0.001 (0.493)	Loss 2.2018 (2.4843)	Entropy 0.58691 (0.58798)	Top-1 acc 72.656 (64.020)	Top-5 acc 86.719 (84.043)	lr 0.00648
Train [80][600/3239]	Time 0.881 (1.026)	Data Time 0.633 (0.499)	Loss 2.4899 (2.4856)	Entropy 0.58690 (0.58796)	Top-1 acc 63.672 (63.986)	Top-5 acc 84.766 (84.025)	lr 0.00648
Train [80][610/3239]	Time 0.231 (1.026)	Data Time 0.001 (0.501)	Loss 2.5524 (2.4860)	Entropy 0.58658 (0.58794)	Top-1 acc 62.109 (63.990)	Top-5 acc 80.469 (84.011)	lr 0.00648
Train [80][620/3239]	Time 0.263 (1.017)	Data Time 0.001 (0.493)	Loss 2.5127 (2.4864)	Entropy 0.58646 (0.58792)	Top-1 acc 63.672 (63.993)	Top-5 acc 82.422 (83.996)	lr 0.00648
Train [80][630/3239]	Time 1.588 (1.030)	Data Time 1.352 (0.507)	Loss 2.3201 (2.4853)	Entropy 0.58657 (0.58790)	Top-1 acc 68.750 (64.022)	Top-5 acc 85.938 (84.014)	lr 0.00648
Train [80][640/3239]	Time 0.374 (1.029)	Data Time 0.001 (0.508)	Loss 2.6380 (2.4855)	Entropy 0.58677 (0.58787)	Top-1 acc 55.859 (64.021)	Top-5 acc 82.031 (84.008)	lr 0.00648
Train [80][650/3239]	Time 0.241 (1.021)	Data Time 0.001 (0.502)	Loss 2.5703 (2.4851)	Entropy 0.58668 (0.58786)	Top-1 acc 62.109 (64.021)	Top-5 acc 80.859 (84.019)	lr 0.00648
Train [80][660/3239]	Time 0.244 (1.020)	Data Time 0.001 (0.502)	Loss 2.5219 (2.4853)	Entropy 0.58687 (0.58784)	Top-1 acc 60.938 (64.031)	Top-5 acc 86.328 (84.022)	lr 0.00648
Train [80][670/3239]	Time 0.244 (1.037)	Data Time 0.001 (0.521)	Loss 2.5704 (2.4845)	Entropy 0.58670 (0.58783)	Top-1 acc 59.375 (64.041)	Top-5 acc 82.031 (84.039)	lr 0.00648
Train [80][680/3239]	Time 5.743 (1.037)	Data Time 5.500 (0.521)	Loss 2.5704 (2.4839)	Entropy 0.58656 (0.58781)	Top-1 acc 61.719 (64.054)	Top-5 acc 84.375 (84.049)	lr 0.00648
Train [80][690/3239]	Time 0.251 (1.030)	Data Time 0.001 (0.516)	Loss 2.5510 (2.4839)	Entropy 0.58648 (0.58779)	Top-1 acc 61.719 (64.057)	Top-5 acc 84.766 (84.057)	lr 0.00647
Train [80][700/3239]	Time 3.641 (1.051)	Data Time 3.396 (0.538)	Loss 2.6048 (2.4845)	Entropy 0.58677 (0.58777)	Top-1 acc 60.156 (64.040)	Top-5 acc 82.812 (84.056)	lr 0.00647
Train [80][710/3239]	Time 0.233 (1.042)	Data Time 0.001 (0.531)	Loss 2.5585 (2.4846)	Entropy 0.58695 (0.58776)	Top-1 acc 64.844 (64.021)	Top-5 acc 82.422 (84.051)	lr 0.00647
Train [80][720/3239]	Time 0.241 (1.036)	Data Time 0.001 (0.525)	Loss 2.5985 (2.4850)	Entropy 0.58715 (0.58775)	Top-1 acc 62.891 (64.016)	Top-5 acc 81.641 (84.050)	lr 0.00647
Train [80][730/3239]	Time 0.257 (1.050)	Data Time 0.001 (0.540)	Loss 2.5397 (2.4862)	Entropy 0.58721 (0.58774)	Top-1 acc 60.938 (63.982)	Top-5 acc 83.984 (84.034)	lr 0.00647
Train [80][740/3239]	Time 0.239 (1.053)	Data Time 0.001 (0.544)	Loss 2.2920 (2.4862)	Entropy 0.58713 (0.58773)	Top-1 acc 66.406 (63.976)	Top-5 acc 88.672 (84.034)	lr 0.00647
Train [80][750/3239]	Time 0.237 (1.045)	Data Time 0.001 (0.538)	Loss 2.2231 (2.4855)	Entropy 0.58717 (0.58773)	Top-1 acc 69.922 (63.986)	Top-5 acc 89.844 (84.049)	lr 0.00647
Train [80][760/3239]	Time 3.268 (1.059)	Data Time 3.015 (0.553)	Loss 2.5442 (2.4859)	Entropy 0.58719 (0.58772)	Top-1 acc 62.109 (63.972)	Top-5 acc 82.812 (84.035)	lr 0.00647
Train [80][770/3239]	Time 0.372 (1.140)	Data Time 0.008 (0.561)	Loss 2.4302 (2.4864)	Entropy 0.58747 (0.58771)	Top-1 acc 62.891 (63.962)	Top-5 acc 85.938 (84.036)	lr 0.00647
Train [80][780/3239]	Time 0.234 (1.131)	Data Time 0.002 (0.554)	Loss 2.3459 (2.4860)	Entropy 0.58762 (0.58771)	Top-1 acc 66.016 (63.965)	Top-5 acc 87.109 (84.048)	lr 0.00647
Train [80][790/3239]	Time 0.243 (1.122)	Data Time 0.002 (0.547)	Loss 2.5053 (2.4852)	Entropy 0.58755 (0.58771)	Top-1 acc 61.328 (63.979)	Top-5 acc 83.594 (84.063)	lr 0.00647
Train [80][800/3239]	Time 0.351 (1.114)	Data Time 0.002 (0.540)	Loss 2.4381 (2.4856)	Entropy 0.58754 (0.58771)	Top-1 acc 64.062 (63.969)	Top-5 acc 85.156 (84.062)	lr 0.00646
Train [80][810/3239]	Time 0.243 (1.105)	Data Time 0.001 (0.533)	Loss 2.5815 (2.4853)	Entropy 0.58719 (0.58770)	Top-1 acc 61.719 (63.983)	Top-5 acc 79.297 (84.057)	lr 0.00646
Train [80][820/3239]	Time 0.229 (1.097)	Data Time 0.001 (0.527)	Loss 2.4265 (2.4858)	Entropy 0.58734 (0.58770)	Top-1 acc 64.844 (63.972)	Top-5 acc 84.766 (84.050)	lr 0.00646
Train [80][830/3239]	Time 0.241 (1.089)	Data Time 0.002 (0.520)	Loss 2.4106 (2.4853)	Entropy 0.58723 (0.58769)	Top-1 acc 64.062 (63.979)	Top-5 acc 85.156 (84.051)	lr 0.00646
Train [80][840/3239]	Time 0.248 (1.098)	Data Time 0.001 (0.531)	Loss 2.5156 (2.4854)	Entropy 0.58726 (0.58769)	Top-1 acc 67.969 (63.990)	Top-5 acc 82.812 (84.053)	lr 0.00646
Train [80][850/3239]	Time 0.241 (1.093)	Data Time 0.001 (0.527)	Loss 2.5550 (2.4857)	Entropy 0.58735 (0.58768)	Top-1 acc 60.547 (63.973)	Top-5 acc 83.203 (84.047)	lr 0.00646
Train [80][860/3239]	Time 0.232 (1.087)	Data Time 0.001 (0.523)	Loss 2.5134 (2.4859)	Entropy 0.58739 (0.58768)	Top-1 acc 62.109 (63.967)	Top-5 acc 84.375 (84.045)	lr 0.00646
Train [80][870/3239]	Time 0.257 (1.110)	Data Time 0.001 (0.547)	Loss 2.2983 (2.4856)	Entropy 0.58758 (0.58768)	Top-1 acc 67.188 (63.975)	Top-5 acc 87.109 (84.045)	lr 0.00646
Train [80][880/3239]	Time 0.234 (1.103)	Data Time 0.001 (0.541)	Loss 2.5066 (2.4853)	Entropy 0.58742 (0.58767)	Top-1 acc 63.672 (63.987)	Top-5 acc 83.984 (84.053)	lr 0.00646
Train [80][890/3239]	Time 0.283 (1.095)	Data Time 0.001 (0.535)	Loss 2.3593 (2.4849)	Entropy 0.58745 (0.58767)	Top-1 acc 67.188 (64.001)	Top-5 acc 87.109 (84.064)	lr 0.00646
Train [80][900/3239]	Time 0.278 (1.107)	Data Time 0.001 (0.548)	Loss 2.4919 (2.4848)	Entropy 0.58751 (0.58767)	Top-1 acc 67.188 (63.992)	Top-5 acc 85.156 (84.070)	lr 0.00646
Train [80][910/3239]	Time 0.251 (1.101)	Data Time 0.001 (0.543)	Loss 2.3606 (2.4848)	Entropy 0.58716 (0.58767)	Top-1 acc 67.969 (64.001)	Top-5 acc 88.672 (84.074)	lr 0.00645
Train [80][920/3239]	Time 0.259 (1.094)	Data Time 0.001 (0.538)	Loss 2.7411 (2.4856)	Entropy 0.58689 (0.58766)	Top-1 acc 62.500 (63.989)	Top-5 acc 78.516 (84.062)	lr 0.00645
Train [80][930/3239]	Time 14.457 (1.102)	Data Time 14.164 (0.547)	Loss 2.4051 (2.4857)	Entropy 0.58678 (0.58765)	Top-1 acc 64.453 (63.996)	Top-5 acc 86.719 (84.060)	lr 0.00645
Train [80][940/3239]	Time 0.246 (1.103)	Data Time 0.002 (0.549)	Loss 2.5158 (2.4860)	Entropy 0.58717 (0.58764)	Top-1 acc 64.844 (63.999)	Top-5 acc 83.203 (84.057)	lr 0.00645
Train [80][950/3239]	Time 0.249 (1.096)	Data Time 0.001 (0.543)	Loss 2.3149 (2.4860)	Entropy 0.58702 (0.58764)	Top-1 acc 67.969 (63.996)	Top-5 acc 87.109 (84.057)	lr 0.00645
Train [80][960/3239]	Time 0.332 (1.089)	Data Time 0.001 (0.538)	Loss 2.3108 (2.4856)	Entropy 0.58702 (0.58763)	Top-1 acc 66.016 (64.002)	Top-5 acc 89.453 (84.071)	lr 0.00645
Train [80][970/3239]	Time 0.234 (1.105)	Data Time 0.001 (0.555)	Loss 2.3563 (2.4851)	Entropy 0.58719 (0.58763)	Top-1 acc 65.625 (64.016)	Top-5 acc 84.766 (84.075)	lr 0.00645
Train [80][980/3239]	Time 0.277 (1.098)	Data Time 0.001 (0.549)	Loss 2.2635 (2.4850)	Entropy 0.58726 (0.58762)	Top-1 acc 68.359 (64.025)	Top-5 acc 87.500 (84.078)	lr 0.00645
Train [80][990/3239]	Time 0.240 (1.091)	Data Time 0.001 (0.544)	Loss 2.3766 (2.4852)	Entropy 0.58724 (0.58762)	Top-1 acc 68.750 (64.022)	Top-5 acc 84.766 (84.073)	lr 0.00645
Train [80][1000/3239]	Time 0.240 (1.107)	Data Time 0.002 (0.560)	Loss 2.5234 (2.4849)	Entropy 0.58725 (0.58761)	Top-1 acc 62.500 (64.030)	Top-5 acc 82.812 (84.082)	lr 0.00645
Train [80][1010/3239]	Time 0.246 (1.100)	Data Time 0.001 (0.555)	Loss 2.4393 (2.4841)	Entropy 0.58732 (0.58761)	Top-1 acc 66.797 (64.068)	Top-5 acc 85.547 (84.100)	lr 0.00645
Train [80][1020/3239]	Time 0.244 (1.094)	Data Time 0.001 (0.549)	Loss 2.5604 (2.4837)	Entropy 0.58720 (0.58761)	Top-1 acc 62.891 (64.078)	Top-5 acc 83.984 (84.104)	lr 0.00645
Train [80][1030/3239]	Time 0.340 (1.108)	Data Time 0.001 (0.564)	Loss 2.3731 (2.4835)	Entropy 0.58745 (0.58760)	Top-1 acc 68.359 (64.085)	Top-5 acc 85.938 (84.113)	lr 0.00644
Train [80][1040/3239]	Time 0.249 (1.101)	Data Time 0.001 (0.559)	Loss 2.3317 (2.4837)	Entropy 0.58769 (0.58760)	Top-1 acc 70.312 (64.094)	Top-5 acc 86.719 (84.105)	lr 0.00644
Train [80][1050/3239]	Time 1.249 (1.096)	Data Time 1.003 (0.555)	Loss 2.5411 (2.4837)	Entropy 0.58733 (0.58760)	Top-1 acc 64.844 (64.101)	Top-5 acc 82.422 (84.101)	lr 0.00644
Train [80][1060/3239]	Time 6.219 (1.108)	Data Time 5.927 (0.568)	Loss 2.4407 (2.4839)	Entropy 0.58724 (0.58760)	Top-1 acc 64.062 (64.092)	Top-5 acc 82.812 (84.099)	lr 0.00644
Train [80][1070/3239]	Time 0.242 (1.103)	Data Time 0.001 (0.564)	Loss 2.4446 (2.4837)	Entropy 0.58736 (0.58760)	Top-1 acc 64.062 (64.108)	Top-5 acc 84.766 (84.097)	lr 0.00644
Train [80][1080/3239]	Time 0.243 (1.097)	Data Time 0.001 (0.559)	Loss 2.2467 (2.4836)	Entropy 0.58725 (0.58760)	Top-1 acc 67.969 (64.098)	Top-5 acc 89.453 (84.097)	lr 0.00644
Train [80][1090/3239]	Time 11.039 (1.104)	Data Time 10.773 (0.566)	Loss 2.6104 (2.4830)	Entropy 0.58742 (0.58759)	Top-1 acc 58.594 (64.102)	Top-5 acc 84.766 (84.110)	lr 0.00644
Train [80][1100/3239]	Time 1.956 (1.106)	Data Time 1.663 (0.569)	Loss 2.6109 (2.4834)	Entropy 0.58770 (0.58759)	Top-1 acc 61.328 (64.090)	Top-5 acc 83.594 (84.100)	lr 0.00644
Train [80][1110/3239]	Time 0.234 (1.100)	Data Time 0.001 (0.564)	Loss 2.5668 (2.4834)	Entropy 0.58807 (0.58759)	Top-1 acc 57.812 (64.089)	Top-5 acc 81.641 (84.103)	lr 0.00644
Train [80][1120/3239]	Time 1.143 (1.095)	Data Time 0.779 (0.560)	Loss 2.5904 (2.4841)	Entropy 0.58784 (0.58760)	Top-1 acc 60.938 (64.061)	Top-5 acc 82.422 (84.092)	lr 0.00644
Train [80][1130/3239]	Time 0.243 (1.109)	Data Time 0.001 (0.576)	Loss 2.2915 (2.4839)	Entropy 0.58766 (0.58760)	Top-1 acc 68.359 (64.073)	Top-5 acc 86.719 (84.094)	lr 0.00644
Train [80][1140/3239]	Time 0.248 (1.103)	Data Time 0.001 (0.571)	Loss 2.5013 (2.4839)	Entropy 0.58788 (0.58760)	Top-1 acc 60.547 (64.066)	Top-5 acc 83.594 (84.093)	lr 0.00643
Train [80][1150/3239]	Time 0.238 (1.098)	Data Time 0.001 (0.566)	Loss 2.3588 (2.4841)	Entropy 0.58793 (0.58760)	Top-1 acc 65.234 (64.057)	Top-5 acc 87.500 (84.090)	lr 0.00643
Train [80][1160/3239]	Time 0.253 (1.112)	Data Time 0.001 (0.581)	Loss 2.3835 (2.4841)	Entropy 0.58797 (0.58761)	Top-1 acc 65.625 (64.058)	Top-5 acc 84.766 (84.089)	lr 0.00643
Train [80][1170/3239]	Time 0.235 (1.106)	Data Time 0.001 (0.576)	Loss 2.2568 (2.4842)	Entropy 0.58791 (0.58761)	Top-1 acc 73.047 (64.055)	Top-5 acc 87.891 (84.084)	lr 0.00643
Train [80][1180/3239]	Time 0.247 (1.101)	Data Time 0.001 (0.571)	Loss 2.5268 (2.4840)	Entropy 0.58779 (0.58761)	Top-1 acc 61.328 (64.063)	Top-5 acc 84.375 (84.093)	lr 0.00643
Train [80][1190/3239]	Time 0.337 (1.112)	Data Time 0.002 (0.583)	Loss 2.3323 (2.4849)	Entropy 0.58768 (0.58761)	Top-1 acc 68.359 (64.040)	Top-5 acc 86.719 (84.076)	lr 0.00643
Train [80][1200/3239]	Time 0.245 (1.108)	Data Time 0.001 (0.580)	Loss 2.4260 (2.4853)	Entropy 0.58750 (0.58761)	Top-1 acc 67.578 (64.038)	Top-5 acc 85.156 (84.067)	lr 0.00643
Train [80][1210/3239]	Time 0.281 (1.104)	Data Time 0.002 (0.577)	Loss 2.6249 (2.4858)	Entropy 0.58753 (0.58761)	Top-1 acc 58.203 (64.030)	Top-5 acc 85.156 (84.060)	lr 0.00643
Train [80][1220/3239]	Time 9.133 (1.114)	Data Time 8.882 (0.588)	Loss 2.4467 (2.4854)	Entropy 0.58715 (0.58761)	Top-1 acc 63.281 (64.035)	Top-5 acc 83.203 (84.070)	lr 0.00643
Train [80][1230/3239]	Time 0.232 (1.113)	Data Time 0.001 (0.588)	Loss 2.4936 (2.4855)	Entropy 0.58717 (0.58761)	Top-1 acc 65.234 (64.031)	Top-5 acc 82.031 (84.070)	lr 0.00643
Train [80][1240/3239]	Time 0.225 (1.108)	Data Time 0.001 (0.583)	Loss 2.5100 (2.4860)	Entropy 0.58668 (0.58760)	Top-1 acc 61.719 (64.024)	Top-5 acc 82.422 (84.066)	lr 0.00643
Train [80][1250/3239]	Time 8.593 (1.113)	Data Time 8.333 (0.589)	Loss 2.6478 (2.4859)	Entropy 0.58690 (0.58759)	Top-1 acc 60.156 (64.023)	Top-5 acc 81.641 (84.072)	lr 0.00642
Train [80][1260/3239]	Time 0.297 (1.116)	Data Time 0.001 (0.593)	Loss 2.4665 (2.4862)	Entropy 0.58700 (0.58759)	Top-1 acc 60.938 (64.008)	Top-5 acc 84.766 (84.067)	lr 0.00642
Train [80][1270/3239]	Time 0.236 (1.110)	Data Time 0.001 (0.588)	Loss 2.6172 (2.4863)	Entropy 0.58665 (0.58758)	Top-1 acc 57.422 (64.008)	Top-5 acc 80.078 (84.066)	lr 0.00642
Train [80][1280/3239]	Time 0.257 (1.108)	Data Time 0.001 (0.587)	Loss 2.4782 (2.4862)	Entropy 0.58633 (0.58757)	Top-1 acc 67.578 (64.009)	Top-5 acc 86.328 (84.070)	lr 0.00642
Train [80][1290/3239]	Time 0.243 (1.118)	Data Time 0.001 (0.597)	Loss 2.3900 (2.4866)	Entropy 0.58632 (0.58756)	Top-1 acc 67.969 (63.997)	Top-5 acc 85.156 (84.063)	lr 0.00642
Train [80][1300/3239]	Time 0.255 (1.112)	Data Time 0.001 (0.592)	Loss 2.4094 (2.4866)	Entropy 0.58641 (0.58755)	Top-1 acc 61.719 (63.991)	Top-5 acc 86.719 (84.063)	lr 0.00642
Train [80][1310/3239]	Time 0.245 (1.115)	Data Time 0.001 (0.596)	Loss 2.8489 (2.4866)	Entropy 0.58652 (0.58754)	Top-1 acc 52.344 (63.996)	Top-5 acc 76.562 (84.059)	lr 0.00642
Train [80][1320/3239]	Time 0.232 (1.124)	Data Time 0.001 (0.605)	Loss 2.5960 (2.4864)	Entropy 0.58687 (0.58754)	Top-1 acc 62.109 (64.005)	Top-5 acc 83.203 (84.061)	lr 0.00642
Train [80][1330/3239]	Time 0.233 (1.119)	Data Time 0.001 (0.601)	Loss 2.4406 (2.4859)	Entropy 0.58659 (0.58753)	Top-1 acc 63.672 (64.013)	Top-5 acc 85.547 (84.073)	lr 0.00642
Train [80][1340/3239]	Time 0.260 (1.122)	Data Time 0.001 (0.605)	Loss 2.2941 (2.4860)	Entropy 0.58661 (0.58752)	Top-1 acc 69.531 (64.009)	Top-5 acc 87.891 (84.066)	lr 0.00642
Train [80][1350/3239]	Time 0.343 (1.128)	Data Time 0.002 (0.611)	Loss 2.4731 (2.4860)	Entropy 0.58671 (0.58752)	Top-1 acc 69.141 (64.011)	Top-5 acc 83.984 (84.067)	lr 0.00642
Train [80][1360/3239]	Time 0.240 (1.125)	Data Time 0.002 (0.609)	Loss 2.5343 (2.4866)	Entropy 0.58665 (0.58751)	Top-1 acc 60.938 (64.002)	Top-5 acc 82.812 (84.055)	lr 0.00642
Train [80][1370/3239]	Time 0.230 (1.120)	Data Time 0.001 (0.605)	Loss 2.4586 (2.4860)	Entropy 0.58634 (0.58750)	Top-1 acc 62.500 (64.014)	Top-5 acc 87.109 (84.067)	lr 0.00641
Train [80][1380/3239]	Time 9.845 (1.135)	Data Time 9.584 (0.620)	Loss 2.2596 (2.4857)	Entropy 0.58650 (0.58750)	Top-1 acc 68.359 (64.017)	Top-5 acc 87.109 (84.070)	lr 0.00641
Train [80][1390/3239]	Time 0.262 (1.130)	Data Time 0.001 (0.616)	Loss 2.5990 (2.4856)	Entropy 0.58661 (0.58749)	Top-1 acc 59.375 (64.018)	Top-5 acc 83.203 (84.077)	lr 0.00641
Train [80][1400/3239]	Time 0.238 (1.125)	Data Time 0.001 (0.611)	Loss 2.5945 (2.4857)	Entropy 0.58648 (0.58748)	Top-1 acc 59.375 (64.015)	Top-5 acc 81.641 (84.072)	lr 0.00641
Train [80][1410/3239]	Time 2.842 (1.129)	Data Time 2.583 (0.617)	Loss 2.4398 (2.4859)	Entropy 0.58665 (0.58748)	Top-1 acc 67.578 (64.012)	Top-5 acc 85.156 (84.074)	lr 0.00641
Train [80][1420/3239]	Time 0.374 (1.134)	Data Time 0.001 (0.621)	Loss 2.6675 (2.4863)	Entropy 0.58645 (0.58747)	Top-1 acc 60.547 (64.003)	Top-5 acc 78.516 (84.064)	lr 0.00641
Train [80][1430/3239]	Time 0.371 (1.167)	Data Time 0.026 (0.617)	Loss 2.4103 (2.4863)	Entropy 0.58663 (0.58746)	Top-1 acc 67.578 (64.009)	Top-5 acc 84.375 (84.061)	lr 0.00641
Train [80][1440/3239]	Time 0.359 (1.163)	Data Time 0.002 (0.613)	Loss 2.5759 (2.4863)	Entropy 0.58677 (0.58746)	Top-1 acc 61.719 (64.006)	Top-5 acc 83.203 (84.064)	lr 0.00641
Train [80][1450/3239]	Time 0.256 (1.157)	Data Time 0.002 (0.609)	Loss 2.4735 (2.4869)	Entropy 0.58674 (0.58745)	Top-1 acc 62.500 (63.995)	Top-5 acc 82.812 (84.052)	lr 0.00641
Train [80][1460/3239]	Time 0.251 (1.152)	Data Time 0.002 (0.605)	Loss 2.3946 (2.4870)	Entropy 0.58674 (0.58745)	Top-1 acc 68.750 (64.003)	Top-5 acc 85.156 (84.050)	lr 0.00641
Train [80][1470/3239]	Time 0.254 (1.148)	Data Time 0.001 (0.600)	Loss 2.4706 (2.4874)	Entropy 0.58696 (0.58744)	Top-1 acc 67.188 (63.992)	Top-5 acc 82.422 (84.038)	lr 0.00641
Train [80][1480/3239]	Time 0.245 (1.143)	Data Time 0.001 (0.596)	Loss 2.5391 (2.4876)	Entropy 0.58707 (0.58744)	Top-1 acc 65.625 (63.992)	Top-5 acc 83.594 (84.030)	lr 0.00640
Train [80][1490/3239]	Time 0.508 (1.144)	Data Time 0.254 (0.599)	Loss 2.3948 (2.4873)	Entropy 0.58712 (0.58744)	Top-1 acc 65.234 (64.002)	Top-5 acc 86.719 (84.035)	lr 0.00640
Train [80][1500/3239]	Time 0.253 (1.145)	Data Time 0.001 (0.600)	Loss 2.5423 (2.4870)	Entropy 0.58718 (0.58744)	Top-1 acc 64.844 (64.014)	Top-5 acc 85.938 (84.039)	lr 0.00640
Train [80][1510/3239]	Time 0.436 (1.141)	Data Time 0.001 (0.597)	Loss 2.3350 (2.4870)	Entropy 0.58738 (0.58744)	Top-1 acc 69.922 (64.020)	Top-5 acc 81.250 (84.035)	lr 0.00640
Train [80][1520/3239]	Time 0.266 (1.138)	Data Time 0.001 (0.594)	Loss 2.5872 (2.4870)	Entropy 0.58744 (0.58744)	Top-1 acc 61.719 (64.022)	Top-5 acc 84.375 (84.038)	lr 0.00640
Train [80][1530/3239]	Time 0.242 (1.153)	Data Time 0.001 (0.610)	Loss 2.8690 (2.4869)	Entropy 0.58754 (0.58744)	Top-1 acc 54.297 (64.022)	Top-5 acc 75.000 (84.039)	lr 0.00640
Train [80][1540/3239]	Time 0.271 (1.149)	Data Time 0.001 (0.606)	Loss 2.5910 (2.4869)	Entropy 0.58730 (0.58744)	Top-1 acc 58.594 (64.019)	Top-5 acc 82.422 (84.040)	lr 0.00640
Train [80][1550/3239]	Time 0.240 (1.146)	Data Time 0.001 (0.604)	Loss 2.3291 (2.4867)	Entropy 0.58742 (0.58744)	Top-1 acc 67.969 (64.021)	Top-5 acc 84.766 (84.041)	lr 0.00640
Train [80][1560/3239]	Time 3.295 (1.161)	Data Time 3.036 (0.619)	Loss 2.4281 (2.4869)	Entropy 0.58765 (0.58744)	Top-1 acc 66.016 (64.017)	Top-5 acc 84.766 (84.034)	lr 0.00640
Train [80][1570/3239]	Time 0.238 (1.156)	Data Time 0.001 (0.615)	Loss 2.4305 (2.4866)	Entropy 0.58753 (0.58744)	Top-1 acc 67.969 (64.023)	Top-5 acc 80.469 (84.039)	lr 0.00640
Train [80][1580/3239]	Time 0.235 (1.154)	Data Time 0.001 (0.614)	Loss 2.5434 (2.4867)	Entropy 0.58773 (0.58744)	Top-1 acc 64.062 (64.023)	Top-5 acc 80.078 (84.035)	lr 0.00640
Train [80][1590/3239]	Time 0.280 (1.161)	Data Time 0.001 (0.621)	Loss 2.7072 (2.4868)	Entropy 0.58756 (0.58744)	Top-1 acc 58.984 (64.018)	Top-5 acc 79.297 (84.032)	lr 0.00639
Train [80][1600/3239]	Time 0.242 (1.157)	Data Time 0.001 (0.618)	Loss 2.3839 (2.4866)	Entropy 0.58746 (0.58744)	Top-1 acc 66.797 (64.027)	Top-5 acc 87.891 (84.038)	lr 0.00639
Train [80][1610/3239]	Time 0.641 (1.152)	Data Time 0.365 (0.614)	Loss 2.4716 (2.4865)	Entropy 0.58722 (0.58744)	Top-1 acc 64.453 (64.022)	Top-5 acc 84.766 (84.042)	lr 0.00639
Train [80][1620/3239]	Time 0.253 (1.152)	Data Time 0.001 (0.615)	Loss 2.7630 (2.4868)	Entropy 0.58743 (0.58744)	Top-1 acc 58.984 (64.016)	Top-5 acc 77.734 (84.034)	lr 0.00639
Train [80][1630/3239]	Time 0.253 (1.152)	Data Time 0.001 (0.615)	Loss 2.4461 (2.4870)	Entropy 0.58729 (0.58744)	Top-1 acc 64.844 (64.008)	Top-5 acc 83.984 (84.028)	lr 0.00639
Train [80][1640/3239]	Time 0.251 (1.147)	Data Time 0.001 (0.611)	Loss 2.3350 (2.4868)	Entropy 0.58722 (0.58744)	Top-1 acc 67.578 (64.011)	Top-5 acc 85.938 (84.034)	lr 0.00639
Train [80][1650/3239]	Time 6.091 (1.148)	Data Time 5.839 (0.613)	Loss 2.7027 (2.4872)	Entropy 0.58694 (0.58744)	Top-1 acc 57.031 (63.996)	Top-5 acc 80.859 (84.024)	lr 0.00639
Train [80][1660/3239]	Time 0.231 (1.147)	Data Time 0.001 (0.612)	Loss 2.3952 (2.4872)	Entropy 0.58640 (0.58743)	Top-1 acc 66.797 (63.999)	Top-5 acc 85.547 (84.018)	lr 0.00639
Train [80][1670/3239]	Time 0.351 (1.143)	Data Time 0.001 (0.608)	Loss 2.5361 (2.4875)	Entropy 0.58639 (0.58743)	Top-1 acc 60.938 (63.992)	Top-5 acc 83.203 (84.017)	lr 0.00639
Train [80][1680/3239]	Time 0.249 (1.140)	Data Time 0.001 (0.606)	Loss 2.5348 (2.4875)	Entropy 0.58662 (0.58742)	Top-1 acc 62.891 (63.989)	Top-5 acc 82.812 (84.015)	lr 0.00639
Train [80][1690/3239]	Time 0.256 (1.143)	Data Time 0.001 (0.610)	Loss 2.2841 (2.4872)	Entropy 0.58665 (0.58742)	Top-1 acc 67.578 (63.993)	Top-5 acc 88.281 (84.021)	lr 0.00639
Train [80][1700/3239]	Time 0.223 (1.139)	Data Time 0.001 (0.606)	Loss 2.5242 (2.4868)	Entropy 0.58632 (0.58741)	Top-1 acc 62.500 (64.001)	Top-5 acc 85.156 (84.028)	lr 0.00639
Train [80][1710/3239]	Time 0.236 (1.136)	Data Time 0.001 (0.604)	Loss 2.3871 (2.4866)	Entropy 0.58585 (0.58740)	Top-1 acc 67.578 (64.007)	Top-5 acc 83.984 (84.030)	lr 0.00638
Train [80][1720/3239]	Time 3.475 (1.138)	Data Time 3.197 (0.606)	Loss 2.4012 (2.4867)	Entropy 0.58592 (0.58740)	Top-1 acc 66.406 (64.001)	Top-5 acc 85.938 (84.028)	lr 0.00638
Train [80][1730/3239]	Time 0.315 (1.134)	Data Time 0.001 (0.603)	Loss 2.5492 (2.4874)	Entropy 0.58586 (0.58739)	Top-1 acc 62.109 (63.990)	Top-5 acc 84.375 (84.018)	lr 0.00638
Train [80][1740/3239]	Time 0.368 (1.135)	Data Time 0.001 (0.604)	Loss 2.4940 (2.4874)	Entropy 0.58610 (0.58738)	Top-1 acc 61.719 (63.991)	Top-5 acc 82.031 (84.016)	lr 0.00638
Train [80][1750/3239]	Time 0.239 (1.138)	Data Time 0.001 (0.608)	Loss 2.4659 (2.4874)	Entropy 0.58622 (0.58737)	Top-1 acc 66.406 (63.993)	Top-5 acc 84.766 (84.016)	lr 0.00638
Train [80][1760/3239]	Time 0.291 (1.140)	Data Time 0.001 (0.610)	Loss 2.4328 (2.4873)	Entropy 0.58637 (0.58737)	Top-1 acc 64.062 (63.996)	Top-5 acc 85.156 (84.019)	lr 0.00638
Train [80][1770/3239]	Time 5.344 (1.139)	Data Time 5.092 (0.610)	Loss 2.3565 (2.4871)	Entropy 0.58688 (0.58736)	Top-1 acc 66.797 (63.997)	Top-5 acc 85.547 (84.021)	lr 0.00638
Train [80][1780/3239]	Time 0.242 (1.142)	Data Time 0.001 (0.614)	Loss 2.5095 (2.4871)	Entropy 0.58714 (0.58736)	Top-1 acc 66.016 (64.002)	Top-5 acc 82.812 (84.019)	lr 0.00638
Train [80][1790/3239]	Time 0.253 (1.144)	Data Time 0.002 (0.617)	Loss 2.4469 (2.4867)	Entropy 0.58700 (0.58736)	Top-1 acc 64.844 (64.010)	Top-5 acc 83.594 (84.022)	lr 0.00638
Train [80][1800/3239]	Time 0.248 (1.140)	Data Time 0.001 (0.613)	Loss 2.4640 (2.4871)	Entropy 0.58714 (0.58736)	Top-1 acc 60.938 (64.007)	Top-5 acc 83.203 (84.011)	lr 0.00638
Train [80][1810/3239]	Time 7.462 (1.148)	Data Time 7.216 (0.621)	Loss 2.3725 (2.4871)	Entropy 0.58717 (0.58735)	Top-1 acc 68.750 (64.011)	Top-5 acc 87.109 (84.012)	lr 0.00638
Train [80][1820/3239]	Time 0.250 (1.145)	Data Time 0.001 (0.619)	Loss 2.4822 (2.4870)	Entropy 0.58735 (0.58735)	Top-1 acc 62.109 (64.012)	Top-5 acc 84.375 (84.014)	lr 0.00637
Train [80][1830/3239]	Time 0.332 (1.144)	Data Time 0.001 (0.619)	Loss 2.4800 (2.4875)	Entropy 0.58749 (0.58735)	Top-1 acc 59.375 (63.997)	Top-5 acc 85.938 (84.004)	lr 0.00637
Train [80][1840/3239]	Time 0.254 (1.141)	Data Time 0.001 (0.616)	Loss 2.3590 (2.4874)	Entropy 0.58737 (0.58735)	Top-1 acc 66.797 (64.005)	Top-5 acc 85.938 (84.002)	lr 0.00637
Train [80][1850/3239]	Time 0.943 (1.150)	Data Time 0.688 (0.626)	Loss 2.5629 (2.4871)	Entropy 0.58741 (0.58735)	Top-1 acc 62.500 (64.004)	Top-5 acc 83.203 (84.004)	lr 0.00637
Train [80][1860/3239]	Time 0.236 (1.152)	Data Time 0.001 (0.627)	Loss 2.5840 (2.4869)	Entropy 0.58753 (0.58736)	Top-1 acc 60.156 (64.006)	Top-5 acc 83.984 (84.013)	lr 0.00637
Train [80][1870/3239]	Time 0.257 (1.148)	Data Time 0.001 (0.624)	Loss 2.3813 (2.4869)	Entropy 0.58725 (0.58736)	Top-1 acc 65.625 (64.004)	Top-5 acc 86.328 (84.016)	lr 0.00637
Train [80][1880/3239]	Time 0.244 (1.156)	Data Time 0.002 (0.632)	Loss 2.4738 (2.4870)	Entropy 0.58756 (0.58736)	Top-1 acc 61.328 (64.000)	Top-5 acc 82.812 (84.009)	lr 0.00637
Train [80][1890/3239]	Time 0.238 (1.159)	Data Time 0.001 (0.636)	Loss 2.4451 (2.4874)	Entropy 0.58740 (0.58736)	Top-1 acc 64.062 (63.993)	Top-5 acc 86.719 (84.002)	lr 0.00637
Train [80][1900/3239]	Time 0.347 (1.155)	Data Time 0.002 (0.632)	Loss 2.4081 (2.4873)	Entropy 0.58724 (0.58736)	Top-1 acc 66.016 (63.990)	Top-5 acc 87.500 (84.006)	lr 0.00637
Train [80][1910/3239]	Time 0.258 (1.155)	Data Time 0.002 (0.633)	Loss 2.5858 (2.4873)	Entropy 0.58728 (0.58736)	Top-1 acc 61.328 (63.994)	Top-5 acc 83.203 (84.006)	lr 0.00637
Train [80][1920/3239]	Time 0.240 (1.156)	Data Time 0.001 (0.634)	Loss 2.3556 (2.4876)	Entropy 0.58726 (0.58736)	Top-1 acc 68.359 (63.989)	Top-5 acc 87.109 (84.003)	lr 0.00637
Train [80][1930/3239]	Time 0.258 (1.155)	Data Time 0.001 (0.634)	Loss 2.3816 (2.4874)	Entropy 0.58698 (0.58736)	Top-1 acc 64.844 (63.991)	Top-5 acc 85.547 (84.005)	lr 0.00636
Train [80][1940/3239]	Time 0.250 (1.155)	Data Time 0.001 (0.635)	Loss 2.4891 (2.4875)	Entropy 0.58695 (0.58735)	Top-1 acc 60.547 (63.991)	Top-5 acc 82.812 (84.002)	lr 0.00636
Train [80][1950/3239]	Time 0.481 (1.156)	Data Time 0.253 (0.636)	Loss 2.4192 (2.4875)	Entropy 0.58701 (0.58735)	Top-1 acc 66.016 (63.987)	Top-5 acc 83.594 (84.003)	lr 0.00636
Train [80][1960/3239]	Time 0.253 (1.156)	Data Time 0.001 (0.637)	Loss 2.7852 (2.4877)	Entropy 0.58751 (0.58735)	Top-1 acc 58.203 (63.979)	Top-5 acc 79.297 (83.998)	lr 0.00636
Train [80][1970/3239]	Time 0.316 (1.156)	Data Time 0.002 (0.637)	Loss 2.4552 (2.4874)	Entropy 0.58755 (0.58735)	Top-1 acc 62.891 (63.981)	Top-5 acc 83.984 (84.008)	lr 0.00636
Train [80][1980/3239]	Time 0.245 (1.156)	Data Time 0.001 (0.637)	Loss 2.7148 (2.4874)	Entropy 0.58765 (0.58735)	Top-1 acc 57.422 (63.978)	Top-5 acc 79.688 (84.008)	lr 0.00636
Train [80][1990/3239]	Time 0.320 (1.157)	Data Time 0.002 (0.639)	Loss 2.6199 (2.4875)	Entropy 0.58766 (0.58735)	Top-1 acc 61.719 (63.976)	Top-5 acc 82.812 (84.003)	lr 0.00636
Train [80][2000/3239]	Time 0.239 (1.153)	Data Time 0.001 (0.636)	Loss 2.4215 (2.4873)	Entropy 0.58733 (0.58736)	Top-1 acc 67.578 (63.977)	Top-5 acc 86.328 (84.010)	lr 0.00636
Train [80][2010/3239]	Time 0.495 (1.156)	Data Time 0.230 (0.638)	Loss 2.5212 (2.4871)	Entropy 0.58731 (0.58735)	Top-1 acc 63.672 (63.983)	Top-5 acc 82.031 (84.014)	lr 0.00636
Train [80][2020/3239]	Time 0.243 (1.157)	Data Time 0.001 (0.640)	Loss 2.3683 (2.4872)	Entropy 0.58698 (0.58735)	Top-1 acc 66.797 (63.982)	Top-5 acc 84.766 (84.012)	lr 0.00636
Train [80][2030/3239]	Time 0.253 (1.153)	Data Time 0.002 (0.637)	Loss 2.6591 (2.4871)	Entropy 0.58713 (0.58735)	Top-1 acc 60.547 (63.982)	Top-5 acc 81.250 (84.018)	lr 0.00636
Train [80][2040/3239]	Time 2.819 (1.156)	Data Time 2.573 (0.640)	Loss 2.4959 (2.4870)	Entropy 0.58732 (0.58735)	Top-1 acc 63.281 (63.987)	Top-5 acc 84.766 (84.020)	lr 0.00636
Train [80][2050/3239]	Time 0.243 (1.160)	Data Time 0.001 (0.644)	Loss 2.5417 (2.4872)	Entropy 0.58762 (0.58735)	Top-1 acc 59.766 (63.979)	Top-5 acc 83.984 (84.019)	lr 0.00635
Train [80][2060/3239]	Time 0.349 (1.156)	Data Time 0.001 (0.641)	Loss 2.4188 (2.4872)	Entropy 0.58783 (0.58735)	Top-1 acc 67.188 (63.975)	Top-5 acc 84.766 (84.016)	lr 0.00635
Train [80][2070/3239]	Time 0.242 (1.154)	Data Time 0.001 (0.640)	Loss 2.4987 (2.4874)	Entropy 0.58797 (0.58736)	Top-1 acc 67.188 (63.972)	Top-5 acc 84.375 (84.016)	lr 0.00635
Train [80][2080/3239]	Time 0.449 (1.185)	Data Time 0.031 (0.644)	Loss 2.4265 (2.4875)	Entropy 0.58795 (0.58736)	Top-1 acc 66.016 (63.972)	Top-5 acc 84.766 (84.012)	lr 0.00635
Train [80][2090/3239]	Time 0.259 (1.182)	Data Time 0.002 (0.641)	Loss 2.4101 (2.4875)	Entropy 0.58811 (0.58736)	Top-1 acc 64.844 (63.974)	Top-5 acc 82.422 (84.011)	lr 0.00635
Train [80][2100/3239]	Time 0.246 (1.178)	Data Time 0.001 (0.637)	Loss 2.5956 (2.4873)	Entropy 0.58848 (0.58737)	Top-1 acc 63.281 (63.979)	Top-5 acc 80.078 (84.013)	lr 0.00635
Train [80][2110/3239]	Time 0.262 (1.175)	Data Time 0.002 (0.634)	Loss 2.4529 (2.4873)	Entropy 0.58857 (0.58737)	Top-1 acc 64.062 (63.975)	Top-5 acc 85.938 (84.015)	lr 0.00635
Train [80][2120/3239]	Time 0.240 (1.171)	Data Time 0.001 (0.631)	Loss 2.1869 (2.4871)	Entropy 0.58850 (0.58738)	Top-1 acc 70.703 (63.981)	Top-5 acc 87.891 (84.018)	lr 0.00635
Train [80][2130/3239]	Time 0.267 (1.168)	Data Time 0.001 (0.629)	Loss 2.3621 (2.4872)	Entropy 0.58857 (0.58738)	Top-1 acc 69.531 (63.980)	Top-5 acc 85.938 (84.016)	lr 0.00635
Train [80][2140/3239]	Time 0.250 (1.165)	Data Time 0.002 (0.626)	Loss 2.5489 (2.4872)	Entropy 0.58856 (0.58739)	Top-1 acc 62.500 (63.980)	Top-5 acc 82.422 (84.018)	lr 0.00635
Train [80][2150/3239]	Time 0.299 (1.166)	Data Time 0.002 (0.628)	Loss 2.4027 (2.4872)	Entropy 0.58879 (0.58740)	Top-1 acc 64.062 (63.982)	Top-5 acc 86.328 (84.018)	lr 0.00635
Train [80][2160/3239]	Time 0.281 (1.163)	Data Time 0.001 (0.625)	Loss 2.4344 (2.4872)	Entropy 0.58903 (0.58740)	Top-1 acc 62.891 (63.978)	Top-5 acc 86.719 (84.017)	lr 0.00634
Train [80][2170/3239]	Time 0.250 (1.161)	Data Time 0.001 (0.623)	Loss 2.4655 (2.4875)	Entropy 0.58908 (0.58741)	Top-1 acc 66.016 (63.966)	Top-5 acc 86.719 (84.013)	lr 0.00634
Train [80][2180/3239]	Time 0.270 (1.167)	Data Time 0.002 (0.630)	Loss 2.8594 (2.4877)	Entropy 0.58913 (0.58742)	Top-1 acc 54.297 (63.963)	Top-5 acc 75.781 (84.010)	lr 0.00634
Train [80][2190/3239]	Time 0.557 (1.164)	Data Time 0.297 (0.627)	Loss 2.1856 (2.4875)	Entropy 0.58915 (0.58743)	Top-1 acc 73.047 (63.965)	Top-5 acc 88.672 (84.011)	lr 0.00634
Train [80][2200/3239]	Time 0.246 (1.164)	Data Time 0.002 (0.627)	Loss 2.4557 (2.4873)	Entropy 0.58903 (0.58743)	Top-1 acc 62.500 (63.967)	Top-5 acc 84.375 (84.014)	lr 0.00634
Train [80][2210/3239]	Time 0.255 (1.167)	Data Time 0.001 (0.631)	Loss 2.7065 (2.4876)	Entropy 0.58914 (0.58744)	Top-1 acc 57.422 (63.967)	Top-5 acc 79.297 (84.008)	lr 0.00634
Train [80][2220/3239]	Time 0.382 (1.167)	Data Time 0.001 (0.631)	Loss 2.2792 (2.4872)	Entropy 0.58897 (0.58745)	Top-1 acc 67.578 (63.975)	Top-5 acc 88.281 (84.013)	lr 0.00634
Train [80][2230/3239]	Time 0.238 (1.165)	Data Time 0.001 (0.630)	Loss 2.4557 (2.4874)	Entropy 0.58878 (0.58745)	Top-1 acc 64.062 (63.970)	Top-5 acc 85.156 (84.012)	lr 0.00634
Train [80][2240/3239]	Time 15.586 (1.168)	Data Time 15.345 (0.634)	Loss 2.3924 (2.4875)	Entropy 0.58889 (0.58746)	Top-1 acc 64.844 (63.968)	Top-5 acc 86.328 (84.011)	lr 0.00634
Train [80][2250/3239]	Time 0.239 (1.170)	Data Time 0.001 (0.635)	Loss 2.5698 (2.4878)	Entropy 0.58846 (0.58747)	Top-1 acc 61.328 (63.957)	Top-5 acc 83.594 (84.004)	lr 0.00634
Train [80][2260/3239]	Time 0.254 (1.168)	Data Time 0.001 (0.634)	Loss 2.4054 (2.4876)	Entropy 0.58838 (0.58747)	Top-1 acc 66.797 (63.961)	Top-5 acc 84.766 (84.003)	lr 0.00634
Train [80][2270/3239]	Time 0.238 (1.165)	Data Time 0.001 (0.631)	Loss 2.6703 (2.4876)	Entropy 0.58868 (0.58748)	Top-1 acc 59.375 (63.960)	Top-5 acc 82.812 (84.003)	lr 0.00634
Train [80][2280/3239]	Time 0.232 (1.172)	Data Time 0.001 (0.639)	Loss 2.2444 (2.4878)	Entropy 0.58862 (0.58748)	Top-1 acc 69.531 (63.958)	Top-5 acc 87.891 (83.999)	lr 0.00633
Train [80][2290/3239]	Time 0.328 (1.170)	Data Time 0.001 (0.637)	Loss 2.7058 (2.4878)	Entropy 0.58886 (0.58749)	Top-1 acc 61.328 (63.963)	Top-5 acc 82.031 (83.998)	lr 0.00633
Train [80][2300/3239]	Time 0.242 (1.166)	Data Time 0.001 (0.634)	Loss 2.5473 (2.4878)	Entropy 0.58854 (0.58749)	Top-1 acc 62.109 (63.963)	Top-5 acc 83.984 (84.000)	lr 0.00633
Train [80][2310/3239]	Time 0.256 (1.172)	Data Time 0.002 (0.640)	Loss 2.5133 (2.4879)	Entropy 0.58868 (0.58750)	Top-1 acc 64.453 (63.964)	Top-5 acc 83.594 (83.997)	lr 0.00633
Train [80][2320/3239]	Time 0.247 (1.171)	Data Time 0.001 (0.640)	Loss 2.5469 (2.4879)	Entropy 0.58845 (0.58750)	Top-1 acc 65.234 (63.966)	Top-5 acc 82.812 (83.994)	lr 0.00633
Train [80][2330/3239]	Time 0.232 (1.168)	Data Time 0.001 (0.637)	Loss 2.5045 (2.4881)	Entropy 0.58847 (0.58751)	Top-1 acc 64.453 (63.968)	Top-5 acc 84.375 (83.992)	lr 0.00633
Train [80][2340/3239]	Time 0.603 (1.170)	Data Time 0.374 (0.640)	Loss 2.5008 (2.4878)	Entropy 0.58825 (0.58751)	Top-1 acc 62.891 (63.971)	Top-5 acc 83.984 (83.996)	lr 0.00633
Train [80][2350/3239]	Time 0.305 (1.171)	Data Time 0.001 (0.641)	Loss 2.4351 (2.4880)	Entropy 0.58795 (0.58751)	Top-1 acc 63.672 (63.966)	Top-5 acc 85.547 (83.997)	lr 0.00633
Train [80][2360/3239]	Time 0.242 (1.171)	Data Time 0.001 (0.641)	Loss 2.3366 (2.4879)	Entropy 0.58800 (0.58751)	Top-1 acc 66.406 (63.970)	Top-5 acc 85.156 (83.997)	lr 0.00633
Train [80][2370/3239]	Time 3.651 (1.172)	Data Time 3.363 (0.642)	Loss 2.4662 (2.4881)	Entropy 0.58764 (0.58752)	Top-1 acc 66.797 (63.963)	Top-5 acc 86.328 (83.999)	lr 0.00633
Train [80][2380/3239]	Time 0.375 (1.174)	Data Time 0.001 (0.645)	Loss 2.4255 (2.4878)	Entropy 0.58788 (0.58752)	Top-1 acc 64.453 (63.969)	Top-5 acc 84.766 (84.004)	lr 0.00633
Train [80][2390/3239]	Time 0.262 (1.173)	Data Time 0.003 (0.645)	Loss 2.5121 (2.4879)	Entropy 0.58793 (0.58752)	Top-1 acc 66.016 (63.967)	Top-5 acc 80.469 (84.001)	lr 0.00632
Train [80][2400/3239]	Time 0.245 (1.170)	Data Time 0.001 (0.642)	Loss 2.4009 (2.4880)	Entropy 0.58789 (0.58752)	Top-1 acc 68.750 (63.964)	Top-5 acc 82.812 (83.998)	lr 0.00632
Train [80][2410/3239]	Time 0.248 (1.176)	Data Time 0.001 (0.649)	Loss 2.5603 (2.4883)	Entropy 0.58755 (0.58752)	Top-1 acc 64.844 (63.965)	Top-5 acc 82.031 (83.992)	lr 0.00632
Train [80][2420/3239]	Time 0.357 (1.175)	Data Time 0.110 (0.648)	Loss 2.4915 (2.4881)	Entropy 0.58763 (0.58752)	Top-1 acc 64.453 (63.967)	Top-5 acc 82.422 (83.994)	lr 0.00632
Train [80][2430/3239]	Time 0.249 (1.172)	Data Time 0.001 (0.645)	Loss 2.5885 (2.4881)	Entropy 0.58768 (0.58752)	Top-1 acc 62.891 (63.969)	Top-5 acc 80.859 (83.991)	lr 0.00632
Train [80][2440/3239]	Time 0.253 (1.179)	Data Time 0.001 (0.653)	Loss 2.2777 (2.4876)	Entropy 0.58783 (0.58752)	Top-1 acc 72.266 (63.979)	Top-5 acc 88.672 (84.001)	lr 0.00632
Train [80][2450/3239]	Time 0.327 (1.177)	Data Time 0.001 (0.651)	Loss 2.5447 (2.4877)	Entropy 0.58793 (0.58752)	Top-1 acc 60.938 (63.973)	Top-5 acc 84.375 (84.000)	lr 0.00632
Train [80][2460/3239]	Time 0.271 (1.174)	Data Time 0.001 (0.649)	Loss 2.3403 (2.4877)	Entropy 0.58776 (0.58753)	Top-1 acc 66.016 (63.975)	Top-5 acc 87.109 (84.000)	lr 0.00632
Train [80][2470/3239]	Time 0.245 (1.180)	Data Time 0.001 (0.655)	Loss 2.3401 (2.4879)	Entropy 0.58784 (0.58753)	Top-1 acc 66.016 (63.970)	Top-5 acc 87.109 (83.994)	lr 0.00632
Train [80][2480/3239]	Time 0.243 (1.179)	Data Time 0.002 (0.654)	Loss 2.4807 (2.4879)	Entropy 0.58771 (0.58753)	Top-1 acc 64.453 (63.972)	Top-5 acc 83.984 (83.993)	lr 0.00632
Train [80][2490/3239]	Time 0.241 (1.176)	Data Time 0.002 (0.651)	Loss 2.6339 (2.4881)	Entropy 0.58769 (0.58753)	Top-1 acc 59.375 (63.966)	Top-5 acc 82.812 (83.992)	lr 0.00632
Train [80][2500/3239]	Time 0.255 (1.178)	Data Time 0.002 (0.653)	Loss 2.3943 (2.4881)	Entropy 0.58753 (0.58753)	Top-1 acc 66.797 (63.967)	Top-5 acc 83.984 (83.992)	lr 0.00631
Train [80][2510/3239]	Time 0.259 (1.178)	Data Time 0.002 (0.654)	Loss 2.2461 (2.4881)	Entropy 0.58751 (0.58753)	Top-1 acc 68.359 (63.964)	Top-5 acc 89.062 (83.994)	lr 0.00631
Train [80][2520/3239]	Time 0.255 (1.177)	Data Time 0.001 (0.654)	Loss 2.4297 (2.4881)	Entropy 0.58784 (0.58753)	Top-1 acc 66.797 (63.968)	Top-5 acc 83.594 (83.991)	lr 0.00631
Train [80][2530/3239]	Time 0.283 (1.177)	Data Time 0.001 (0.654)	Loss 2.4822 (2.4880)	Entropy 0.58779 (0.58753)	Top-1 acc 64.062 (63.970)	Top-5 acc 85.156 (83.993)	lr 0.00631
Train [80][2540/3239]	Time 0.359 (1.182)	Data Time 0.001 (0.659)	Loss 2.4608 (2.4880)	Entropy 0.58785 (0.58753)	Top-1 acc 64.844 (63.971)	Top-5 acc 85.156 (83.994)	lr 0.00631
Train [80][2550/3239]	Time 0.249 (1.181)	Data Time 0.001 (0.659)	Loss 2.4001 (2.4881)	Entropy 0.58782 (0.58753)	Top-1 acc 65.234 (63.964)	Top-5 acc 86.328 (83.993)	lr 0.00631
Train [80][2560/3239]	Time 0.241 (1.182)	Data Time 0.001 (0.660)	Loss 2.5771 (2.4880)	Entropy 0.58786 (0.58753)	Top-1 acc 61.719 (63.967)	Top-5 acc 82.422 (83.994)	lr 0.00631
Train [80][2570/3239]	Time 0.274 (1.185)	Data Time 0.001 (0.663)	Loss 2.4401 (2.4879)	Entropy 0.58777 (0.58754)	Top-1 acc 65.625 (63.970)	Top-5 acc 83.594 (83.994)	lr 0.00631
Train [80][2580/3239]	Time 0.243 (1.184)	Data Time 0.001 (0.663)	Loss 2.6053 (2.4878)	Entropy 0.58772 (0.58754)	Top-1 acc 56.641 (63.975)	Top-5 acc 82.422 (83.996)	lr 0.00631
Train [80][2590/3239]	Time 0.237 (1.181)	Data Time 0.001 (0.660)	Loss 2.3271 (2.4879)	Entropy 0.58765 (0.58754)	Top-1 acc 68.359 (63.972)	Top-5 acc 88.281 (83.996)	lr 0.00631
Train [80][2600/3239]	Time 0.256 (1.189)	Data Time 0.001 (0.669)	Loss 2.4189 (2.4880)	Entropy 0.58775 (0.58754)	Top-1 acc 65.625 (63.973)	Top-5 acc 85.547 (83.994)	lr 0.00631
Train [80][2610/3239]	Time 0.353 (1.189)	Data Time 0.002 (0.668)	Loss 2.7310 (2.4878)	Entropy 0.58793 (0.58754)	Top-1 acc 57.422 (63.977)	Top-5 acc 81.641 (84.001)	lr 0.00631
Train [80][2620/3239]	Time 0.260 (1.186)	Data Time 0.001 (0.666)	Loss 2.4352 (2.4874)	Entropy 0.58817 (0.58754)	Top-1 acc 62.891 (63.981)	Top-5 acc 85.938 (84.010)	lr 0.00630
Train [80][2630/3239]	Time 0.270 (1.194)	Data Time 0.001 (0.674)	Loss 2.7399 (2.4877)	Entropy 0.58788 (0.58754)	Top-1 acc 58.203 (63.980)	Top-5 acc 80.078 (84.009)	lr 0.00630
Train [80][2640/3239]	Time 0.231 (1.193)	Data Time 0.001 (0.673)	Loss 2.4286 (2.4878)	Entropy 0.58795 (0.58754)	Top-1 acc 67.578 (63.976)	Top-5 acc 83.984 (84.006)	lr 0.00630
Train [80][2650/3239]	Time 0.244 (1.190)	Data Time 0.001 (0.671)	Loss 2.5113 (2.4880)	Entropy 0.58797 (0.58754)	Top-1 acc 62.891 (63.973)	Top-5 acc 82.812 (84.002)	lr 0.00630
Train [80][2660/3239]	Time 2.149 (1.190)	Data Time 1.901 (0.671)	Loss 2.5530 (2.4879)	Entropy 0.58800 (0.58755)	Top-1 acc 64.844 (63.973)	Top-5 acc 83.594 (84.003)	lr 0.00630
Train [80][2670/3239]	Time 0.241 (1.192)	Data Time 0.001 (0.673)	Loss 2.4240 (2.4878)	Entropy 0.58821 (0.58755)	Top-1 acc 63.672 (63.975)	Top-5 acc 82.422 (84.004)	lr 0.00630
Train [80][2680/3239]	Time 0.231 (1.191)	Data Time 0.001 (0.672)	Loss 2.5089 (2.4880)	Entropy 0.58823 (0.58755)	Top-1 acc 62.109 (63.973)	Top-5 acc 82.031 (84.000)	lr 0.00630
Train [80][2690/3239]	Time 0.252 (1.191)	Data Time 0.001 (0.673)	Loss 2.2604 (2.4880)	Entropy 0.58813 (0.58755)	Top-1 acc 68.359 (63.970)	Top-5 acc 88.672 (83.999)	lr 0.00630
Train [80][2700/3239]	Time 0.294 (1.195)	Data Time 0.001 (0.678)	Loss 2.3731 (2.4880)	Entropy 0.58800 (0.58755)	Top-1 acc 68.750 (63.971)	Top-5 acc 85.547 (83.999)	lr 0.00630
Train [80][2710/3239]	Time 0.250 (1.195)	Data Time 0.001 (0.678)	Loss 2.5710 (2.4884)	Entropy 0.58790 (0.58756)	Top-1 acc 58.984 (63.959)	Top-5 acc 82.812 (83.997)	lr 0.00630
Train [80][2720/3239]	Time 0.244 (1.192)	Data Time 0.001 (0.675)	Loss 2.5908 (2.4884)	Entropy 0.58780 (0.58756)	Top-1 acc 60.938 (63.957)	Top-5 acc 82.031 (83.996)	lr 0.00630
Train [80][2730/3239]	Time 0.249 (1.200)	Data Time 0.001 (0.683)	Loss 2.5870 (2.4887)	Entropy 0.58770 (0.58756)	Top-1 acc 60.938 (63.953)	Top-5 acc 82.031 (83.994)	lr 0.00629
Train [80][2740/3239]	Time 0.333 (1.217)	Data Time 0.004 (0.681)	Loss 2.5190 (2.4886)	Entropy 0.58769 (0.58756)	Top-1 acc 61.719 (63.953)	Top-5 acc 84.766 (83.996)	lr 0.00629
Train [80][2750/3239]	Time 0.253 (1.214)	Data Time 0.002 (0.678)	Loss 2.5112 (2.4885)	Entropy 0.58806 (0.58756)	Top-1 acc 62.891 (63.958)	Top-5 acc 83.203 (83.997)	lr 0.00629
Train [80][2760/3239]	Time 0.268 (1.211)	Data Time 0.002 (0.676)	Loss 2.6550 (2.4886)	Entropy 0.58802 (0.58756)	Top-1 acc 57.422 (63.953)	Top-5 acc 80.859 (83.997)	lr 0.00629
Train [80][2770/3239]	Time 0.368 (1.209)	Data Time 0.001 (0.673)	Loss 2.8892 (2.4888)	Entropy 0.58808 (0.58756)	Top-1 acc 50.781 (63.948)	Top-5 acc 77.344 (83.992)	lr 0.00629
Train [80][2780/3239]	Time 0.259 (1.206)	Data Time 0.001 (0.671)	Loss 2.4007 (2.4889)	Entropy 0.58770 (0.58756)	Top-1 acc 63.281 (63.944)	Top-5 acc 85.547 (83.990)	lr 0.00629
Train [80][2790/3239]	Time 0.246 (1.207)	Data Time 0.001 (0.672)	Loss 2.6047 (2.4887)	Entropy 0.58792 (0.58757)	Top-1 acc 62.109 (63.949)	Top-5 acc 79.688 (83.996)	lr 0.00629
Train [80][2800/3239]	Time 1.155 (1.206)	Data Time 0.888 (0.672)	Loss 2.4859 (2.4886)	Entropy 0.58804 (0.58757)	Top-1 acc 64.453 (63.953)	Top-5 acc 83.594 (84.002)	lr 0.00629
Train [80][2810/3239]	Time 0.280 (1.206)	Data Time 0.001 (0.672)	Loss 2.4408 (2.4885)	Entropy 0.58770 (0.58757)	Top-1 acc 67.969 (63.958)	Top-5 acc 83.594 (83.999)	lr 0.00629
Train [80][2820/3239]	Time 2.408 (1.204)	Data Time 2.134 (0.670)	Loss 2.4710 (2.4885)	Entropy 0.58773 (0.58757)	Top-1 acc 60.156 (63.952)	Top-5 acc 85.547 (83.999)	lr 0.00629
Train [80][2830/3239]	Time 0.250 (1.207)	Data Time 0.001 (0.673)	Loss 2.5003 (2.4884)	Entropy 0.58800 (0.58757)	Top-1 acc 62.891 (63.958)	Top-5 acc 84.766 (84.003)	lr 0.00629
Train [80][2840/3239]	Time 3.544 (1.210)	Data Time 3.263 (0.677)	Loss 2.4655 (2.4883)	Entropy 0.58810 (0.58757)	Top-1 acc 63.281 (63.956)	Top-5 acc 82.812 (84.004)	lr 0.00629
Train [80][2850/3239]	Time 0.252 (1.208)	Data Time 0.001 (0.674)	Loss 2.5758 (2.4885)	Entropy 0.58813 (0.58757)	Top-1 acc 56.641 (63.949)	Top-5 acc 83.594 (84.000)	lr 0.00628
Train [80][2860/3239]	Time 0.336 (1.211)	Data Time 0.001 (0.678)	Loss 2.7327 (2.4886)	Entropy 0.58813 (0.58757)	Top-1 acc 57.031 (63.947)	Top-5 acc 79.688 (84.000)	lr 0.00628
Train [80][2870/3239]	Time 0.241 (1.211)	Data Time 0.001 (0.678)	Loss 2.3392 (2.4885)	Entropy 0.58843 (0.58758)	Top-1 acc 66.797 (63.949)	Top-5 acc 85.547 (83.996)	lr 0.00628
Train [80][2880/3239]	Time 0.499 (1.209)	Data Time 0.256 (0.676)	Loss 2.6788 (2.4887)	Entropy 0.58851 (0.58758)	Top-1 acc 60.156 (63.946)	Top-5 acc 81.641 (83.994)	lr 0.00628
Train [80][2890/3239]	Time 0.259 (1.213)	Data Time 0.001 (0.681)	Loss 2.5210 (2.4888)	Entropy 0.58852 (0.58758)	Top-1 acc 64.453 (63.941)	Top-5 acc 82.422 (83.992)	lr 0.00628
Train [80][2900/3239]	Time 0.256 (1.214)	Data Time 0.002 (0.682)	Loss 2.5755 (2.4887)	Entropy 0.58860 (0.58759)	Top-1 acc 61.328 (63.943)	Top-5 acc 84.766 (83.996)	lr 0.00628
Train [80][2910/3239]	Time 0.251 (1.213)	Data Time 0.001 (0.681)	Loss 2.5725 (2.4886)	Entropy 0.58793 (0.58759)	Top-1 acc 62.109 (63.947)	Top-5 acc 82.422 (83.998)	lr 0.00628
Train [80][2920/3239]	Time 0.251 (1.217)	Data Time 0.001 (0.685)	Loss 2.7075 (2.4887)	Entropy 0.58779 (0.58759)	Top-1 acc 57.031 (63.944)	Top-5 acc 81.641 (83.997)	lr 0.00628
Train [80][2930/3239]	Time 2.218 (1.217)	Data Time 1.797 (0.686)	Loss 2.5187 (2.4886)	Entropy 0.58794 (0.58759)	Top-1 acc 64.062 (63.948)	Top-5 acc 82.031 (83.999)	lr 0.00628
Train [80][2940/3239]	Time 0.226 (1.216)	Data Time 0.001 (0.685)	Loss 2.6066 (2.4884)	Entropy 0.58759 (0.58759)	Top-1 acc 62.109 (63.952)	Top-5 acc 80.859 (84.001)	lr 0.00628
Train [80][2950/3239]	Time 0.242 (1.217)	Data Time 0.001 (0.686)	Loss 2.4246 (2.4883)	Entropy 0.58757 (0.58759)	Top-1 acc 64.844 (63.953)	Top-5 acc 85.938 (84.002)	lr 0.00628
Train [80][2960/3239]	Time 0.232 (1.217)	Data Time 0.001 (0.687)	Loss 2.4183 (2.4883)	Entropy 0.58752 (0.58759)	Top-1 acc 62.891 (63.949)	Top-5 acc 85.547 (84.002)	lr 0.00627
Train [80][2970/3239]	Time 0.242 (1.217)	Data Time 0.001 (0.687)	Loss 2.5120 (2.4884)	Entropy 0.58772 (0.58759)	Top-1 acc 63.281 (63.946)	Top-5 acc 83.594 (84.000)	lr 0.00627
Train [80][2980/3239]	Time 0.252 (1.215)	Data Time 0.001 (0.685)	Loss 2.6113 (2.4886)	Entropy 0.58754 (0.58759)	Top-1 acc 59.766 (63.939)	Top-5 acc 83.203 (83.997)	lr 0.00627
Train [80][2990/3239]	Time 0.260 (1.214)	Data Time 0.001 (0.685)	Loss 2.4907 (2.4884)	Entropy 0.58746 (0.58759)	Top-1 acc 62.500 (63.943)	Top-5 acc 86.719 (84.002)	lr 0.00627
Train [80][3000/3239]	Time 0.329 (1.217)	Data Time 0.002 (0.688)	Loss 2.4272 (2.4887)	Entropy 0.58727 (0.58759)	Top-1 acc 65.625 (63.936)	Top-5 acc 83.594 (83.999)	lr 0.00627
Train [80][3010/3239]	Time 0.272 (1.215)	Data Time 0.001 (0.686)	Loss 2.4070 (2.4887)	Entropy 0.58719 (0.58759)	Top-1 acc 67.188 (63.936)	Top-5 acc 86.719 (83.999)	lr 0.00627
Train [80][3020/3239]	Time 2.266 (1.214)	Data Time 2.028 (0.686)	Loss 2.4881 (2.4888)	Entropy 0.58707 (0.58759)	Top-1 acc 64.062 (63.937)	Top-5 acc 83.203 (84.000)	lr 0.00627
Train [80][3030/3239]	Time 0.282 (1.217)	Data Time 0.001 (0.689)	Loss 2.4980 (2.4889)	Entropy 0.58702 (0.58759)	Top-1 acc 63.672 (63.934)	Top-5 acc 82.812 (83.997)	lr 0.00627
Train [80][3040/3239]	Time 0.238 (1.215)	Data Time 0.001 (0.687)	Loss 2.5470 (2.4889)	Entropy 0.58703 (0.58759)	Top-1 acc 60.938 (63.935)	Top-5 acc 82.422 (83.996)	lr 0.00627
Train [80][3050/3239]	Time 0.232 (1.213)	Data Time 0.002 (0.686)	Loss 2.6459 (2.4889)	Entropy 0.58716 (0.58758)	Top-1 acc 61.719 (63.934)	Top-5 acc 80.078 (83.995)	lr 0.00627
Train [80][3060/3239]	Time 6.806 (1.218)	Data Time 6.518 (0.691)	Loss 2.4824 (2.4890)	Entropy 0.58696 (0.58758)	Top-1 acc 66.016 (63.934)	Top-5 acc 84.375 (83.994)	lr 0.00627
Train [80][3070/3239]	Time 0.240 (1.215)	Data Time 0.001 (0.689)	Loss 2.4681 (2.4890)	Entropy 0.58746 (0.58758)	Top-1 acc 64.453 (63.937)	Top-5 acc 84.766 (83.995)	lr 0.00626
Train [80][3080/3239]	Time 0.965 (1.213)	Data Time 0.725 (0.687)	Loss 2.5376 (2.4889)	Entropy 0.58754 (0.58758)	Top-1 acc 64.453 (63.939)	Top-5 acc 82.812 (83.998)	lr 0.00626
Train [80][3090/3239]	Time 5.590 (1.215)	Data Time 5.227 (0.689)	Loss 2.4097 (2.4887)	Entropy 0.58750 (0.58758)	Top-1 acc 66.406 (63.945)	Top-5 acc 83.203 (83.999)	lr 0.00626
Train [80][3100/3239]	Time 0.231 (1.215)	Data Time 0.001 (0.689)	Loss 2.4901 (2.4888)	Entropy 0.58754 (0.58758)	Top-1 acc 62.500 (63.940)	Top-5 acc 83.594 (83.996)	lr 0.00626
Train [80][3110/3239]	Time 0.227 (1.213)	Data Time 0.001 (0.687)	Loss 2.3658 (2.4886)	Entropy 0.58739 (0.58758)	Top-1 acc 64.062 (63.943)	Top-5 acc 85.547 (84.000)	lr 0.00626
Train [80][3120/3239]	Time 4.041 (1.213)	Data Time 3.769 (0.688)	Loss 2.4909 (2.4885)	Entropy 0.58737 (0.58758)	Top-1 acc 61.719 (63.950)	Top-5 acc 83.984 (84.001)	lr 0.00626
Train [80][3130/3239]	Time 0.238 (1.215)	Data Time 0.001 (0.690)	Loss 2.3743 (2.4883)	Entropy 0.58726 (0.58758)	Top-1 acc 67.578 (63.954)	Top-5 acc 87.109 (84.006)	lr 0.00626
Train [80][3140/3239]	Time 0.261 (1.213)	Data Time 0.001 (0.689)	Loss 2.4344 (2.4882)	Entropy 0.58717 (0.58758)	Top-1 acc 66.016 (63.954)	Top-5 acc 85.156 (84.007)	lr 0.00626
Train [80][3150/3239]	Time 0.253 (1.210)	Data Time 0.001 (0.686)	Loss 2.4695 (2.4881)	Entropy 0.58711 (0.58758)	Top-1 acc 64.844 (63.957)	Top-5 acc 85.938 (84.006)	lr 0.00626
Train [80][3160/3239]	Time 0.333 (1.215)	Data Time 0.001 (0.692)	Loss 2.6128 (2.4882)	Entropy 0.58703 (0.58757)	Top-1 acc 62.500 (63.956)	Top-5 acc 83.984 (84.008)	lr 0.00626
Train [80][3170/3239]	Time 0.242 (1.213)	Data Time 0.002 (0.690)	Loss 2.5385 (2.4884)	Entropy 0.58693 (0.58757)	Top-1 acc 64.453 (63.951)	Top-5 acc 79.688 (84.005)	lr 0.00626
Train [80][3180/3239]	Time 0.243 (1.210)	Data Time 0.000 (0.687)	Loss 2.4544 (2.4883)	Entropy 0.58689 (0.58757)	Top-1 acc 64.453 (63.955)	Top-5 acc 85.156 (84.006)	lr 0.00626
Train [80][3190/3239]	Time 0.250 (1.216)	Data Time 0.000 (0.693)	Loss 2.5024 (2.4884)	Entropy 0.58678 (0.58757)	Top-1 acc 65.234 (63.953)	Top-5 acc 82.031 (84.006)	lr 0.00625
Train [80][3200/3239]	Time 0.237 (1.213)	Data Time 0.000 (0.691)	Loss 2.4989 (2.4886)	Entropy 0.58692 (0.58757)	Top-1 acc 64.453 (63.947)	Top-5 acc 82.812 (84.003)	lr 0.00625
Train [80][3210/3239]	Time 0.237 (1.211)	Data Time 0.000 (0.689)	Loss 2.3363 (2.4886)	Entropy 0.58719 (0.58756)	Top-1 acc 68.359 (63.945)	Top-5 acc 86.719 (84.003)	lr 0.00625
Train [80][3220/3239]	Time 5.895 (1.213)	Data Time 5.654 (0.692)	Loss 2.3191 (2.4884)	Entropy 0.58714 (0.58756)	Top-1 acc 67.969 (63.948)	Top-5 acc 85.156 (84.009)	lr 0.00625
Train [80][3230/3239]	Time 0.237 (1.211)	Data Time 0.000 (0.689)	Loss 2.4422 (2.4885)	Entropy 0.58713 (0.58756)	Top-1 acc 64.062 (63.945)	Top-5 acc 86.328 (84.007)	lr 0.00625
Train [80][3239/3239]	Time 0.915 (1.209)	Data Time 0.000 (0.687)	Loss 2.5072 (2.4886)	Entropy 0.58698 (0.58756)	Top-1 acc 64.198 (63.944)	Top-5 acc 86.420 (84.008)	lr 0.00625
==========Valid [80/120]	loss 1.289	top-1 acc 70.353 (70.353)	top-5 acc 89.220	Train top-1 63.944	top-5 84.008	Entropy 0.58698	Latency-None: 0.000ms	Flops: 539.00M
Train [81][0/3239]	Time 60.657 (60.657)	Data Time 59.324 (59.324)	Loss 2.4078 (2.4078)	Entropy 0.58679 (0.58679)	Top-1 acc 66.016 (66.016)	Top-5 acc 84.766 (84.766)	lr 0.00625
Train [81][10/3239]	Time 0.239 (6.040)	Data Time 0.001 (5.513)	Loss 2.4809 (2.4282)	Entropy 0.58676 (0.58681)	Top-1 acc 63.672 (65.057)	Top-5 acc 84.375 (84.659)	lr 0.00625
Train [81][20/3239]	Time 0.253 (3.378)	Data Time 0.001 (2.889)	Loss 2.5371 (2.4727)	Entropy 0.58662 (0.58674)	Top-1 acc 61.328 (63.281)	Top-5 acc 84.375 (84.580)	lr 0.00625
Train [81][30/3239]	Time 0.244 (2.425)	Data Time 0.001 (1.957)	Loss 2.5960 (2.4998)	Entropy 0.58666 (0.58671)	Top-1 acc 58.594 (62.903)	Top-5 acc 82.812 (84.136)	lr 0.00625
Train [81][40/3239]	Time 0.247 (2.264)	Data Time 0.001 (1.799)	Loss 2.6280 (2.4990)	Entropy 0.58698 (0.58671)	Top-1 acc 61.719 (63.176)	Top-5 acc 80.469 (84.042)	lr 0.00625
Train [81][50/3239]	Time 0.257 (1.904)	Data Time 0.002 (1.447)	Loss 2.3758 (2.4915)	Entropy 0.58693 (0.58676)	Top-1 acc 64.062 (63.350)	Top-5 acc 88.281 (84.176)	lr 0.00625
Train [81][60/3239]	Time 0.349 (1.663)	Data Time 0.001 (1.210)	Loss 2.5492 (2.4810)	Entropy 0.58693 (0.58680)	Top-1 acc 65.234 (63.730)	Top-5 acc 82.422 (84.324)	lr 0.00624
Train [81][70/3239]	Time 0.247 (1.654)	Data Time 0.001 (1.201)	Loss 2.3856 (2.4748)	Entropy 0.58678 (0.58681)	Top-1 acc 67.578 (63.980)	Top-5 acc 86.719 (84.502)	lr 0.00624
Train [81][80/3239]	Time 0.252 (1.502)	Data Time 0.001 (1.053)	Loss 2.4522 (2.4712)	Entropy 0.58660 (0.58679)	Top-1 acc 65.234 (64.120)	Top-5 acc 86.328 (84.597)	lr 0.00624
Train [81][90/3239]	Time 0.244 (1.383)	Data Time 0.001 (0.937)	Loss 2.5459 (2.4752)	Entropy 0.58696 (0.58678)	Top-1 acc 63.281 (63.968)	Top-5 acc 82.812 (84.499)	lr 0.00624
Train [81][100/3239]	Time 0.245 (1.437)	Data Time 0.001 (0.994)	Loss 2.5692 (2.4733)	Entropy 0.58683 (0.58680)	Top-1 acc 62.891 (64.113)	Top-5 acc 82.422 (84.514)	lr 0.00624
Train [81][110/3239]	Time 0.246 (1.345)	Data Time 0.001 (0.904)	Loss 2.5571 (2.4743)	Entropy 0.58675 (0.58680)	Top-1 acc 64.062 (64.073)	Top-5 acc 83.984 (84.474)	lr 0.00624
Train [81][120/3239]	Time 0.238 (1.268)	Data Time 0.001 (0.830)	Loss 2.5294 (2.4756)	Entropy 0.58669 (0.58680)	Top-1 acc 67.188 (64.108)	Top-5 acc 83.203 (84.449)	lr 0.00624
Train [81][130/3239]	Time 0.273 (1.290)	Data Time 0.002 (0.852)	Loss 2.4269 (2.4792)	Entropy 0.58668 (0.58680)	Top-1 acc 69.531 (64.024)	Top-5 acc 84.766 (84.405)	lr 0.00624
Train [81][140/3239]	Time 0.236 (1.249)	Data Time 0.001 (0.814)	Loss 2.4117 (2.4790)	Entropy 0.58635 (0.58678)	Top-1 acc 66.016 (64.096)	Top-5 acc 85.938 (84.381)	lr 0.00624
Train [81][150/3239]	Time 0.617 (1.547)	Data Time 0.034 (0.760)	Loss 2.5991 (2.4795)	Entropy 0.58642 (0.58676)	Top-1 acc 62.109 (64.127)	Top-5 acc 80.859 (84.365)	lr 0.00624
Train [81][160/3239]	Time 0.244 (1.485)	Data Time 0.002 (0.713)	Loss 2.9285 (2.4797)	Entropy 0.58621 (0.58674)	Top-1 acc 52.734 (64.126)	Top-5 acc 77.344 (84.346)	lr 0.00624
Train [81][170/3239]	Time 0.238 (1.423)	Data Time 0.001 (0.672)	Loss 2.4061 (2.4748)	Entropy 0.58596 (0.58670)	Top-1 acc 67.969 (64.252)	Top-5 acc 85.938 (84.423)	lr 0.00624
Train [81][180/3239]	Time 0.247 (1.367)	Data Time 0.002 (0.635)	Loss 2.4397 (2.4722)	Entropy 0.58623 (0.58667)	Top-1 acc 66.406 (64.332)	Top-5 acc 84.375 (84.451)	lr 0.00623
Train [81][190/3239]	Time 0.249 (1.317)	Data Time 0.002 (0.601)	Loss 2.5279 (2.4736)	Entropy 0.58621 (0.58665)	Top-1 acc 64.062 (64.275)	Top-5 acc 84.375 (84.404)	lr 0.00623
Train [81][200/3239]	Time 0.246 (1.273)	Data Time 0.001 (0.572)	Loss 2.3397 (2.4731)	Entropy 0.58600 (0.58662)	Top-1 acc 66.016 (64.282)	Top-5 acc 85.547 (84.369)	lr 0.00623
Train [81][210/3239]	Time 0.253 (1.233)	Data Time 0.002 (0.545)	Loss 2.6396 (2.4747)	Entropy 0.58591 (0.58659)	Top-1 acc 62.891 (64.246)	Top-5 acc 80.078 (84.321)	lr 0.00623
Train [81][220/3239]	Time 0.401 (1.199)	Data Time 0.003 (0.520)	Loss 2.5289 (2.4737)	Entropy 0.58608 (0.58656)	Top-1 acc 64.844 (64.275)	Top-5 acc 82.031 (84.333)	lr 0.00623
Train [81][230/3239]	Time 0.274 (1.170)	Data Time 0.002 (0.498)	Loss 2.5731 (2.4755)	Entropy 0.58614 (0.58654)	Top-1 acc 58.594 (64.171)	Top-5 acc 82.812 (84.304)	lr 0.00623
Train [81][240/3239]	Time 0.243 (1.140)	Data Time 0.001 (0.477)	Loss 2.3440 (2.4767)	Entropy 0.58561 (0.58652)	Top-1 acc 67.578 (64.139)	Top-5 acc 86.328 (84.297)	lr 0.00623
Train [81][250/3239]	Time 2.420 (1.129)	Data Time 2.130 (0.474)	Loss 2.9489 (2.4797)	Entropy 0.58567 (0.58649)	Top-1 acc 55.469 (64.081)	Top-5 acc 75.391 (84.244)	lr 0.00623
Train [81][260/3239]	Time 0.234 (1.103)	Data Time 0.002 (0.456)	Loss 2.3548 (2.4789)	Entropy 0.58540 (0.58645)	Top-1 acc 66.797 (64.068)	Top-5 acc 84.766 (84.257)	lr 0.00623
Train [81][270/3239]	Time 0.247 (1.080)	Data Time 0.001 (0.439)	Loss 2.1843 (2.4781)	Entropy 0.58521 (0.58641)	Top-1 acc 68.750 (64.050)	Top-5 acc 89.062 (84.283)	lr 0.00623
Train [81][280/3239]	Time 0.243 (1.064)	Data Time 0.001 (0.430)	Loss 2.5825 (2.4806)	Entropy 0.58498 (0.58636)	Top-1 acc 59.766 (63.999)	Top-5 acc 80.469 (84.221)	lr 0.00623
Train [81][290/3239]	Time 0.288 (1.047)	Data Time 0.001 (0.418)	Loss 2.5542 (2.4807)	Entropy 0.58491 (0.58631)	Top-1 acc 62.109 (64.020)	Top-5 acc 82.812 (84.214)	lr 0.00622
Train [81][300/3239]	Time 0.261 (1.028)	Data Time 0.001 (0.404)	Loss 2.4890 (2.4784)	Entropy 0.58504 (0.58627)	Top-1 acc 65.625 (64.074)	Top-5 acc 85.547 (84.263)	lr 0.00622
Train [81][310/3239]	Time 0.355 (1.011)	Data Time 0.001 (0.392)	Loss 2.5902 (2.4764)	Entropy 0.58487 (0.58622)	Top-1 acc 62.500 (64.147)	Top-5 acc 82.422 (84.286)	lr 0.00622
Train [81][320/3239]	Time 0.247 (0.999)	Data Time 0.002 (0.385)	Loss 2.5029 (2.4758)	Entropy 0.58486 (0.58618)	Top-1 acc 62.109 (64.176)	Top-5 acc 82.812 (84.287)	lr 0.00622
Train [81][330/3239]	Time 0.245 (0.982)	Data Time 0.001 (0.373)	Loss 2.6937 (2.4778)	Entropy 0.58524 (0.58614)	Top-1 acc 58.594 (64.111)	Top-5 acc 81.641 (84.248)	lr 0.00622
Train [81][340/3239]	Time 0.229 (0.967)	Data Time 0.001 (0.362)	Loss 2.5169 (2.4763)	Entropy 0.58556 (0.58612)	Top-1 acc 59.375 (64.120)	Top-5 acc 83.594 (84.271)	lr 0.00622
Train [81][350/3239]	Time 0.234 (0.976)	Data Time 0.001 (0.377)	Loss 2.6787 (2.4747)	Entropy 0.58555 (0.58611)	Top-1 acc 57.812 (64.160)	Top-5 acc 82.812 (84.292)	lr 0.00622
Train [81][360/3239]	Time 0.253 (0.962)	Data Time 0.001 (0.367)	Loss 2.4356 (2.4755)	Entropy 0.58567 (0.58609)	Top-1 acc 65.234 (64.162)	Top-5 acc 84.766 (84.309)	lr 0.00622
Train [81][370/3239]	Time 0.287 (0.959)	Data Time 0.001 (0.368)	Loss 2.4130 (2.4750)	Entropy 0.58563 (0.58608)	Top-1 acc 64.844 (64.186)	Top-5 acc 86.719 (84.324)	lr 0.00622
Train [81][380/3239]	Time 0.373 (0.970)	Data Time 0.002 (0.383)	Loss 2.2680 (2.4745)	Entropy 0.58549 (0.58607)	Top-1 acc 68.359 (64.192)	Top-5 acc 88.672 (84.332)	lr 0.00622
Train [81][390/3239]	Time 0.235 (0.955)	Data Time 0.001 (0.373)	Loss 2.3111 (2.4725)	Entropy 0.58544 (0.58605)	Top-1 acc 68.750 (64.238)	Top-5 acc 86.328 (84.362)	lr 0.00622
Train [81][400/3239]	Time 1.776 (0.947)	Data Time 1.518 (0.367)	Loss 2.3602 (2.4716)	Entropy 0.58541 (0.58604)	Top-1 acc 68.750 (64.282)	Top-5 acc 84.766 (84.377)	lr 0.00622
Train [81][410/3239]	Time 5.582 (0.957)	Data Time 5.338 (0.381)	Loss 2.6859 (2.4758)	Entropy 0.58548 (0.58602)	Top-1 acc 57.031 (64.197)	Top-5 acc 81.250 (84.306)	lr 0.00621
Train [81][420/3239]	Time 0.241 (0.951)	Data Time 0.001 (0.378)	Loss 2.4945 (2.4750)	Entropy 0.58567 (0.58601)	Top-1 acc 62.109 (64.218)	Top-5 acc 82.812 (84.315)	lr 0.00621
Train [81][430/3239]	Time 0.242 (0.939)	Data Time 0.001 (0.369)	Loss 2.6916 (2.4763)	Entropy 0.58586 (0.58600)	Top-1 acc 61.328 (64.183)	Top-5 acc 78.516 (84.286)	lr 0.00621
Train [81][440/3239]	Time 0.254 (0.932)	Data Time 0.001 (0.366)	Loss 2.5769 (2.4756)	Entropy 0.58577 (0.58600)	Top-1 acc 62.891 (64.195)	Top-5 acc 81.641 (84.303)	lr 0.00621
Train [81][450/3239]	Time 3.334 (0.946)	Data Time 3.078 (0.382)	Loss 2.5199 (2.4759)	Entropy 0.58611 (0.58600)	Top-1 acc 62.891 (64.186)	Top-5 acc 84.375 (84.318)	lr 0.00621
Train [81][460/3239]	Time 0.236 (0.935)	Data Time 0.001 (0.374)	Loss 2.6361 (2.4766)	Entropy 0.58617 (0.58600)	Top-1 acc 58.594 (64.151)	Top-5 acc 79.688 (84.310)	lr 0.00621
Train [81][470/3239]	Time 2.626 (0.929)	Data Time 2.233 (0.371)	Loss 2.4164 (2.4772)	Entropy 0.58611 (0.58601)	Top-1 acc 66.797 (64.159)	Top-5 acc 86.328 (84.307)	lr 0.00621
Train [81][480/3239]	Time 0.254 (0.932)	Data Time 0.001 (0.376)	Loss 2.5667 (2.4777)	Entropy 0.58624 (0.58601)	Top-1 acc 64.453 (64.176)	Top-5 acc 82.031 (84.291)	lr 0.00621
Train [81][490/3239]	Time 0.232 (0.926)	Data Time 0.001 (0.374)	Loss 2.6761 (2.4767)	Entropy 0.58652 (0.58602)	Top-1 acc 59.375 (64.200)	Top-5 acc 79.297 (84.306)	lr 0.00621
Train [81][500/3239]	Time 0.242 (0.918)	Data Time 0.001 (0.367)	Loss 2.6926 (2.4773)	Entropy 0.58667 (0.58602)	Top-1 acc 58.594 (64.186)	Top-5 acc 79.688 (84.278)	lr 0.00621
Train [81][510/3239]	Time 0.242 (0.918)	Data Time 0.001 (0.371)	Loss 2.6091 (2.4757)	Entropy 0.58660 (0.58603)	Top-1 acc 58.984 (64.234)	Top-5 acc 80.859 (84.301)	lr 0.00621
Train [81][520/3239]	Time 0.252 (0.909)	Data Time 0.001 (0.364)	Loss 2.4803 (2.4752)	Entropy 0.58653 (0.58604)	Top-1 acc 68.359 (64.239)	Top-5 acc 82.422 (84.307)	lr 0.00620
Train [81][530/3239]	Time 0.237 (0.900)	Data Time 0.001 (0.357)	Loss 2.4025 (2.4737)	Entropy 0.58673 (0.58606)	Top-1 acc 64.453 (64.280)	Top-5 acc 82.422 (84.321)	lr 0.00620
Train [81][540/3239]	Time 0.367 (0.897)	Data Time 0.001 (0.355)	Loss 2.3938 (2.4735)	Entropy 0.58646 (0.58606)	Top-1 acc 64.062 (64.291)	Top-5 acc 85.938 (84.320)	lr 0.00620
Train [81][550/3239]	Time 0.242 (0.889)	Data Time 0.001 (0.349)	Loss 2.4295 (2.4727)	Entropy 0.58618 (0.58607)	Top-1 acc 66.406 (64.303)	Top-5 acc 83.594 (84.326)	lr 0.00620
Train [81][560/3239]	Time 0.234 (0.881)	Data Time 0.001 (0.343)	Loss 2.4338 (2.4736)	Entropy 0.58613 (0.58607)	Top-1 acc 64.844 (64.276)	Top-5 acc 85.547 (84.321)	lr 0.00620
Train [81][570/3239]	Time 0.703 (0.875)	Data Time 0.460 (0.338)	Loss 2.3722 (2.4743)	Entropy 0.58628 (0.58607)	Top-1 acc 63.672 (64.253)	Top-5 acc 86.328 (84.302)	lr 0.00620
Train [81][580/3239]	Time 0.252 (0.870)	Data Time 0.001 (0.335)	Loss 2.3338 (2.4744)	Entropy 0.58619 (0.58608)	Top-1 acc 69.922 (64.247)	Top-5 acc 87.891 (84.313)	lr 0.00620
Train [81][590/3239]	Time 0.267 (0.863)	Data Time 0.002 (0.329)	Loss 2.4661 (2.4734)	Entropy 0.58622 (0.58608)	Top-1 acc 63.672 (64.271)	Top-5 acc 85.156 (84.336)	lr 0.00620
Train [81][600/3239]	Time 0.240 (0.857)	Data Time 0.001 (0.325)	Loss 2.3924 (2.4726)	Entropy 0.58631 (0.58608)	Top-1 acc 67.969 (64.293)	Top-5 acc 84.766 (84.347)	lr 0.00620
Train [81][610/3239]	Time 0.307 (0.852)	Data Time 0.054 (0.321)	Loss 2.4349 (2.4718)	Entropy 0.58667 (0.58609)	Top-1 acc 66.797 (64.314)	Top-5 acc 83.984 (84.367)	lr 0.00620
Train [81][620/3239]	Time 0.254 (0.846)	Data Time 0.001 (0.316)	Loss 2.2910 (2.4712)	Entropy 0.58650 (0.58609)	Top-1 acc 71.094 (64.348)	Top-5 acc 85.938 (84.383)	lr 0.00620
Train [81][630/3239]	Time 0.256 (0.840)	Data Time 0.001 (0.311)	Loss 2.3356 (2.4714)	Entropy 0.58626 (0.58610)	Top-1 acc 64.453 (64.316)	Top-5 acc 84.375 (84.376)	lr 0.00619
Train [81][640/3239]	Time 0.255 (0.838)	Data Time 0.002 (0.311)	Loss 2.4277 (2.4702)	Entropy 0.58601 (0.58610)	Top-1 acc 64.453 (64.337)	Top-5 acc 85.547 (84.389)	lr 0.00619
Train [81][650/3239]	Time 0.250 (0.832)	Data Time 0.001 (0.306)	Loss 2.4020 (2.4696)	Entropy 0.58543 (0.58610)	Top-1 acc 66.797 (64.337)	Top-5 acc 85.547 (84.407)	lr 0.00619
Train [81][660/3239]	Time 0.242 (0.827)	Data Time 0.001 (0.302)	Loss 2.4285 (2.4686)	Entropy 0.58580 (0.58609)	Top-1 acc 68.359 (64.367)	Top-5 acc 85.547 (84.419)	lr 0.00619
Train [81][670/3239]	Time 0.234 (0.821)	Data Time 0.001 (0.298)	Loss 2.5580 (2.4691)	Entropy 0.58583 (0.58608)	Top-1 acc 61.719 (64.352)	Top-5 acc 84.766 (84.421)	lr 0.00619
Train [81][680/3239]	Time 0.243 (0.816)	Data Time 0.001 (0.294)	Loss 2.4478 (2.4694)	Entropy 0.58604 (0.58608)	Top-1 acc 62.109 (64.324)	Top-5 acc 86.328 (84.427)	lr 0.00619
Train [81][690/3239]	Time 0.242 (0.813)	Data Time 0.001 (0.292)	Loss 2.6498 (2.4687)	Entropy 0.58616 (0.58608)	Top-1 acc 63.672 (64.355)	Top-5 acc 79.688 (84.421)	lr 0.00619
Train [81][700/3239]	Time 0.353 (0.809)	Data Time 0.001 (0.290)	Loss 2.5695 (2.4684)	Entropy 0.58629 (0.58608)	Top-1 acc 60.938 (64.366)	Top-5 acc 83.203 (84.425)	lr 0.00619
Train [81][710/3239]	Time 0.229 (0.804)	Data Time 0.001 (0.285)	Loss 2.6190 (2.4687)	Entropy 0.58619 (0.58608)	Top-1 acc 59.375 (64.367)	Top-5 acc 81.641 (84.420)	lr 0.00619
Train [81][720/3239]	Time 0.251 (0.804)	Data Time 0.001 (0.287)	Loss 2.3492 (2.4676)	Entropy 0.58634 (0.58609)	Top-1 acc 67.188 (64.406)	Top-5 acc 86.328 (84.449)	lr 0.00619
Train [81][730/3239]	Time 3.503 (0.805)	Data Time 3.222 (0.289)	Loss 2.4795 (2.4681)	Entropy 0.58654 (0.58609)	Top-1 acc 66.016 (64.402)	Top-5 acc 83.984 (84.437)	lr 0.00619
Train [81][740/3239]	Time 0.245 (0.806)	Data Time 0.001 (0.291)	Loss 2.3204 (2.4682)	Entropy 0.58662 (0.58610)	Top-1 acc 67.578 (64.408)	Top-5 acc 87.500 (84.440)	lr 0.00619
Train [81][750/3239]	Time 0.240 (0.802)	Data Time 0.001 (0.289)	Loss 2.5124 (2.4688)	Entropy 0.58661 (0.58610)	Top-1 acc 65.234 (64.394)	Top-5 acc 84.375 (84.419)	lr 0.00618
Train [81][760/3239]	Time 0.262 (0.801)	Data Time 0.001 (0.288)	Loss 2.3743 (2.4685)	Entropy 0.58678 (0.58611)	Top-1 acc 67.188 (64.409)	Top-5 acc 85.938 (84.429)	lr 0.00618
Train [81][770/3239]	Time 1.489 (0.806)	Data Time 1.135 (0.294)	Loss 2.7279 (2.4694)	Entropy 0.58716 (0.58612)	Top-1 acc 57.031 (64.390)	Top-5 acc 82.031 (84.420)	lr 0.00618
Train [81][780/3239]	Time 0.241 (0.801)	Data Time 0.001 (0.291)	Loss 2.5208 (2.4697)	Entropy 0.58705 (0.58614)	Top-1 acc 66.406 (64.396)	Top-5 acc 84.375 (84.404)	lr 0.00618
Train [81][790/3239]	Time 0.244 (0.799)	Data Time 0.001 (0.289)	Loss 2.4646 (2.4689)	Entropy 0.58704 (0.58615)	Top-1 acc 62.500 (64.411)	Top-5 acc 83.984 (84.423)	lr 0.00618
Train [81][800/3239]	Time 0.239 (0.808)	Data Time 0.001 (0.299)	Loss 2.4272 (2.4691)	Entropy 0.58744 (0.58616)	Top-1 acc 63.672 (64.405)	Top-5 acc 82.812 (84.418)	lr 0.00618
Train [81][810/3239]	Time 0.348 (0.872)	Data Time 0.003 (0.295)	Loss 2.6393 (2.4693)	Entropy 0.58726 (0.58618)	Top-1 acc 62.891 (64.391)	Top-5 acc 83.203 (84.421)	lr 0.00618
Train [81][820/3239]	Time 0.240 (0.867)	Data Time 0.002 (0.292)	Loss 2.6244 (2.4697)	Entropy 0.58703 (0.58619)	Top-1 acc 60.547 (64.377)	Top-5 acc 82.812 (84.421)	lr 0.00618
Train [81][830/3239]	Time 0.250 (0.861)	Data Time 0.002 (0.288)	Loss 2.5114 (2.4698)	Entropy 0.58714 (0.58620)	Top-1 acc 62.891 (64.374)	Top-5 acc 85.547 (84.417)	lr 0.00618
Train [81][840/3239]	Time 0.247 (0.856)	Data Time 0.001 (0.285)	Loss 2.3492 (2.4696)	Entropy 0.58706 (0.58621)	Top-1 acc 69.141 (64.373)	Top-5 acc 85.938 (84.418)	lr 0.00618
Train [81][850/3239]	Time 0.245 (0.851)	Data Time 0.001 (0.282)	Loss 2.4897 (2.4697)	Entropy 0.58720 (0.58622)	Top-1 acc 64.844 (64.373)	Top-5 acc 83.203 (84.414)	lr 0.00618
Train [81][860/3239]	Time 0.395 (0.847)	Data Time 0.001 (0.278)	Loss 2.3323 (2.4698)	Entropy 0.58714 (0.58623)	Top-1 acc 68.359 (64.364)	Top-5 acc 85.547 (84.415)	lr 0.00617
Train [81][870/3239]	Time 0.236 (0.843)	Data Time 0.001 (0.275)	Loss 2.5534 (2.4691)	Entropy 0.58702 (0.58624)	Top-1 acc 60.547 (64.378)	Top-5 acc 85.938 (84.431)	lr 0.00617
Train [81][880/3239]	Time 0.240 (0.839)	Data Time 0.001 (0.272)	Loss 2.6963 (2.4693)	Entropy 0.58707 (0.58625)	Top-1 acc 58.203 (64.378)	Top-5 acc 80.078 (84.418)	lr 0.00617
Train [81][890/3239]	Time 0.245 (0.834)	Data Time 0.002 (0.269)	Loss 2.3743 (2.4697)	Entropy 0.58703 (0.58626)	Top-1 acc 67.188 (64.372)	Top-5 acc 87.891 (84.423)	lr 0.00617
Train [81][900/3239]	Time 0.239 (0.830)	Data Time 0.001 (0.266)	Loss 2.3476 (2.4698)	Entropy 0.58718 (0.58627)	Top-1 acc 69.531 (64.377)	Top-5 acc 83.203 (84.414)	lr 0.00617
Train [81][910/3239]	Time 0.243 (0.835)	Data Time 0.001 (0.273)	Loss 2.3918 (2.4696)	Entropy 0.58675 (0.58628)	Top-1 acc 64.844 (64.384)	Top-5 acc 85.156 (84.419)	lr 0.00617
Train [81][920/3239]	Time 0.245 (0.831)	Data Time 0.002 (0.270)	Loss 2.3663 (2.4690)	Entropy 0.58671 (0.58628)	Top-1 acc 66.016 (64.402)	Top-5 acc 86.719 (84.430)	lr 0.00617
Train [81][930/3239]	Time 0.350 (0.829)	Data Time 0.001 (0.269)	Loss 2.4230 (2.4681)	Entropy 0.58698 (0.58629)	Top-1 acc 66.016 (64.427)	Top-5 acc 85.156 (84.448)	lr 0.00617
Train [81][940/3239]	Time 0.231 (0.841)	Data Time 0.001 (0.282)	Loss 2.5781 (2.4684)	Entropy 0.58703 (0.58629)	Top-1 acc 65.234 (64.425)	Top-5 acc 82.422 (84.436)	lr 0.00617
Train [81][950/3239]	Time 0.250 (0.836)	Data Time 0.003 (0.279)	Loss 2.3831 (2.4684)	Entropy 0.58723 (0.58630)	Top-1 acc 66.016 (64.417)	Top-5 acc 87.500 (84.437)	lr 0.00617
Train [81][960/3239]	Time 0.240 (0.834)	Data Time 0.001 (0.278)	Loss 2.4609 (2.4681)	Entropy 0.58674 (0.58631)	Top-1 acc 67.188 (64.436)	Top-5 acc 83.594 (84.443)	lr 0.00617
Train [81][970/3239]	Time 3.074 (0.839)	Data Time 2.827 (0.285)	Loss 2.4468 (2.4686)	Entropy 0.58686 (0.58631)	Top-1 acc 64.453 (64.431)	Top-5 acc 85.156 (84.433)	lr 0.00617
Train [81][980/3239]	Time 0.239 (0.837)	Data Time 0.001 (0.284)	Loss 2.5554 (2.4690)	Entropy 0.58660 (0.58632)	Top-1 acc 63.672 (64.414)	Top-5 acc 84.375 (84.420)	lr 0.00616
Train [81][990/3239]	Time 0.257 (0.835)	Data Time 0.001 (0.283)	Loss 2.4804 (2.4693)	Entropy 0.58619 (0.58632)	Top-1 acc 64.844 (64.405)	Top-5 acc 85.547 (84.412)	lr 0.00616
Train [81][1000/3239]	Time 9.955 (0.840)	Data Time 9.685 (0.290)	Loss 2.6577 (2.4694)	Entropy 0.58638 (0.58632)	Top-1 acc 60.938 (64.406)	Top-5 acc 81.250 (84.405)	lr 0.00616
Train [81][1010/3239]	Time 0.309 (0.837)	Data Time 0.001 (0.287)	Loss 2.6649 (2.4693)	Entropy 0.58616 (0.58632)	Top-1 acc 59.766 (64.408)	Top-5 acc 82.031 (84.407)	lr 0.00616
Train [81][1020/3239]	Time 0.340 (0.836)	Data Time 0.001 (0.288)	Loss 2.6068 (2.4694)	Entropy 0.58621 (0.58632)	Top-1 acc 58.984 (64.416)	Top-5 acc 80.859 (84.400)	lr 0.00616
Train [81][1030/3239]	Time 0.238 (0.833)	Data Time 0.001 (0.285)	Loss 2.3823 (2.4693)	Entropy 0.58632 (0.58632)	Top-1 acc 62.891 (64.415)	Top-5 acc 83.203 (84.397)	lr 0.00616
Train [81][1040/3239]	Time 4.999 (0.842)	Data Time 4.680 (0.295)	Loss 2.4528 (2.4690)	Entropy 0.58607 (0.58631)	Top-1 acc 66.406 (64.409)	Top-5 acc 82.812 (84.404)	lr 0.00616
Train [81][1050/3239]	Time 0.234 (0.838)	Data Time 0.001 (0.292)	Loss 2.3251 (2.4682)	Entropy 0.58640 (0.58631)	Top-1 acc 69.531 (64.431)	Top-5 acc 87.109 (84.419)	lr 0.00616
Train [81][1060/3239]	Time 0.251 (0.834)	Data Time 0.001 (0.289)	Loss 2.4372 (2.4685)	Entropy 0.58671 (0.58631)	Top-1 acc 66.016 (64.426)	Top-5 acc 85.938 (84.409)	lr 0.00616
Train [81][1070/3239]	Time 0.234 (0.839)	Data Time 0.001 (0.295)	Loss 2.2612 (2.4688)	Entropy 0.58667 (0.58632)	Top-1 acc 70.312 (64.423)	Top-5 acc 89.453 (84.400)	lr 0.00616
Train [81][1080/3239]	Time 0.256 (0.840)	Data Time 0.002 (0.296)	Loss 2.1830 (2.4684)	Entropy 0.58659 (0.58632)	Top-1 acc 74.609 (64.447)	Top-5 acc 89.453 (84.414)	lr 0.00616
Train [81][1090/3239]	Time 0.323 (0.836)	Data Time 0.001 (0.294)	Loss 2.6536 (2.4690)	Entropy 0.58629 (0.58632)	Top-1 acc 61.719 (64.443)	Top-5 acc 80.078 (84.396)	lr 0.00615
Train [81][1100/3239]	Time 0.302 (0.842)	Data Time 0.002 (0.300)	Loss 2.5934 (2.4699)	Entropy 0.58608 (0.58632)	Top-1 acc 57.422 (64.416)	Top-5 acc 82.812 (84.377)	lr 0.00615
Train [81][1110/3239]	Time 0.255 (0.844)	Data Time 0.001 (0.303)	Loss 2.3356 (2.4702)	Entropy 0.58615 (0.58632)	Top-1 acc 67.969 (64.410)	Top-5 acc 86.328 (84.373)	lr 0.00615
Train [81][1120/3239]	Time 0.245 (0.841)	Data Time 0.001 (0.301)	Loss 2.3666 (2.4704)	Entropy 0.58643 (0.58631)	Top-1 acc 66.016 (64.412)	Top-5 acc 85.547 (84.364)	lr 0.00615
Train [81][1130/3239]	Time 3.880 (0.843)	Data Time 3.620 (0.304)	Loss 2.6182 (2.4707)	Entropy 0.58623 (0.58632)	Top-1 acc 60.938 (64.407)	Top-5 acc 80.469 (84.356)	lr 0.00615
Train [81][1140/3239]	Time 0.237 (0.847)	Data Time 0.001 (0.309)	Loss 2.3811 (2.4716)	Entropy 0.58641 (0.58632)	Top-1 acc 64.453 (64.379)	Top-5 acc 85.547 (84.340)	lr 0.00615
Train [81][1150/3239]	Time 0.242 (0.844)	Data Time 0.001 (0.306)	Loss 2.5887 (2.4716)	Entropy 0.58634 (0.58632)	Top-1 acc 60.156 (64.373)	Top-5 acc 83.203 (84.335)	lr 0.00615
Train [81][1160/3239]	Time 1.021 (0.841)	Data Time 0.774 (0.304)	Loss 2.5282 (2.4715)	Entropy 0.58623 (0.58632)	Top-1 acc 63.672 (64.374)	Top-5 acc 83.203 (84.338)	lr 0.00615
Train [81][1170/3239]	Time 0.263 (0.847)	Data Time 0.001 (0.312)	Loss 2.2051 (2.4718)	Entropy 0.58588 (0.58631)	Top-1 acc 72.656 (64.361)	Top-5 acc 91.016 (84.329)	lr 0.00615
Train [81][1180/3239]	Time 0.302 (0.844)	Data Time 0.001 (0.309)	Loss 2.5389 (2.4720)	Entropy 0.58608 (0.58631)	Top-1 acc 61.719 (64.356)	Top-5 acc 84.766 (84.326)	lr 0.00615
Train [81][1190/3239]	Time 0.242 (0.840)	Data Time 0.001 (0.306)	Loss 2.5529 (2.4716)	Entropy 0.58612 (0.58631)	Top-1 acc 59.766 (64.358)	Top-5 acc 82.031 (84.338)	lr 0.00615
Train [81][1200/3239]	Time 6.179 (0.847)	Data Time 5.915 (0.314)	Loss 2.3508 (2.4716)	Entropy 0.58592 (0.58631)	Top-1 acc 68.359 (64.355)	Top-5 acc 87.500 (84.339)	lr 0.00615
Train [81][1210/3239]	Time 0.233 (0.844)	Data Time 0.001 (0.312)	Loss 2.5642 (2.4722)	Entropy 0.58574 (0.58630)	Top-1 acc 62.891 (64.336)	Top-5 acc 83.203 (84.336)	lr 0.00614
Train [81][1220/3239]	Time 0.266 (0.840)	Data Time 0.001 (0.309)	Loss 2.3935 (2.4716)	Entropy 0.58601 (0.58630)	Top-1 acc 68.359 (64.355)	Top-5 acc 86.719 (84.346)	lr 0.00614
Train [81][1230/3239]	Time 0.242 (0.843)	Data Time 0.001 (0.313)	Loss 2.5441 (2.4715)	Entropy 0.58603 (0.58630)	Top-1 acc 65.625 (64.362)	Top-5 acc 83.594 (84.348)	lr 0.00614
Train [81][1240/3239]	Time 0.231 (0.844)	Data Time 0.001 (0.314)	Loss 2.6409 (2.4718)	Entropy 0.58618 (0.58629)	Top-1 acc 61.328 (64.352)	Top-5 acc 80.078 (84.344)	lr 0.00614
Train [81][1250/3239]	Time 0.336 (0.841)	Data Time 0.001 (0.312)	Loss 2.4856 (2.4718)	Entropy 0.58583 (0.58629)	Top-1 acc 59.766 (64.348)	Top-5 acc 82.422 (84.338)	lr 0.00614
Train [81][1260/3239]	Time 0.241 (0.843)	Data Time 0.001 (0.314)	Loss 2.4981 (2.4716)	Entropy 0.58566 (0.58629)	Top-1 acc 63.672 (64.362)	Top-5 acc 84.375 (84.342)	lr 0.00614
Train [81][1270/3239]	Time 0.284 (0.843)	Data Time 0.002 (0.316)	Loss 2.4860 (2.4720)	Entropy 0.58555 (0.58628)	Top-1 acc 62.891 (64.351)	Top-5 acc 81.641 (84.332)	lr 0.00614
Train [81][1280/3239]	Time 0.241 (0.842)	Data Time 0.001 (0.315)	Loss 2.7844 (2.4722)	Entropy 0.58549 (0.58628)	Top-1 acc 55.469 (64.351)	Top-5 acc 79.688 (84.330)	lr 0.00614
Train [81][1290/3239]	Time 5.830 (0.845)	Data Time 5.581 (0.319)	Loss 2.3641 (2.4728)	Entropy 0.58529 (0.58627)	Top-1 acc 66.016 (64.338)	Top-5 acc 85.938 (84.321)	lr 0.00614
Train [81][1300/3239]	Time 0.277 (0.845)	Data Time 0.002 (0.320)	Loss 2.3147 (2.4724)	Entropy 0.58536 (0.58626)	Top-1 acc 68.750 (64.351)	Top-5 acc 87.109 (84.332)	lr 0.00614
Train [81][1310/3239]	Time 0.234 (0.846)	Data Time 0.001 (0.321)	Loss 2.4712 (2.4724)	Entropy 0.58547 (0.58626)	Top-1 acc 64.844 (64.354)	Top-5 acc 85.938 (84.331)	lr 0.00614
Train [81][1320/3239]	Time 0.366 (0.843)	Data Time 0.001 (0.319)	Loss 2.2573 (2.4724)	Entropy 0.58552 (0.58625)	Top-1 acc 69.531 (64.356)	Top-5 acc 86.719 (84.328)	lr 0.00613
Train [81][1330/3239]	Time 0.263 (0.848)	Data Time 0.002 (0.324)	Loss 2.2983 (2.4723)	Entropy 0.58540 (0.58625)	Top-1 acc 70.312 (64.358)	Top-5 acc 86.328 (84.329)	lr 0.00613
Train [81][1340/3239]	Time 0.249 (0.850)	Data Time 0.001 (0.327)	Loss 2.5342 (2.4726)	Entropy 0.58534 (0.58624)	Top-1 acc 64.844 (64.342)	Top-5 acc 82.422 (84.321)	lr 0.00613
Train [81][1350/3239]	Time 0.248 (0.847)	Data Time 0.001 (0.325)	Loss 2.5952 (2.4729)	Entropy 0.58518 (0.58623)	Top-1 acc 62.500 (64.338)	Top-5 acc 82.031 (84.311)	lr 0.00613
Train [81][1360/3239]	Time 5.150 (0.853)	Data Time 4.897 (0.331)	Loss 2.4224 (2.4728)	Entropy 0.58545 (0.58623)	Top-1 acc 67.578 (64.337)	Top-5 acc 84.766 (84.312)	lr 0.00613
Train [81][1370/3239]	Time 0.314 (0.852)	Data Time 0.071 (0.331)	Loss 2.4071 (2.4723)	Entropy 0.58548 (0.58622)	Top-1 acc 64.844 (64.343)	Top-5 acc 86.719 (84.328)	lr 0.00613
Train [81][1380/3239]	Time 0.238 (0.849)	Data Time 0.001 (0.329)	Loss 2.5145 (2.4724)	Entropy 0.58574 (0.58622)	Top-1 acc 64.062 (64.343)	Top-5 acc 85.156 (84.328)	lr 0.00613
Train [81][1390/3239]	Time 0.269 (0.853)	Data Time 0.002 (0.333)	Loss 2.7143 (2.4726)	Entropy 0.58590 (0.58621)	Top-1 acc 58.984 (64.337)	Top-5 acc 80.078 (84.329)	lr 0.00613
Train [81][1400/3239]	Time 2.540 (0.855)	Data Time 2.275 (0.336)	Loss 2.4624 (2.4727)	Entropy 0.58540 (0.58621)	Top-1 acc 65.234 (64.323)	Top-5 acc 84.375 (84.328)	lr 0.00613
Train [81][1410/3239]	Time 0.397 (0.856)	Data Time 0.001 (0.338)	Loss 2.4795 (2.4730)	Entropy 0.58541 (0.58620)	Top-1 acc 62.500 (64.314)	Top-5 acc 85.156 (84.325)	lr 0.00613
Train [81][1420/3239]	Time 0.233 (0.856)	Data Time 0.001 (0.338)	Loss 2.4117 (2.4731)	Entropy 0.58534 (0.58620)	Top-1 acc 69.141 (64.323)	Top-5 acc 83.203 (84.318)	lr 0.00613
Train [81][1430/3239]	Time 0.245 (0.857)	Data Time 0.001 (0.340)	Loss 2.7688 (2.4731)	Entropy 0.58558 (0.58619)	Top-1 acc 59.375 (64.333)	Top-5 acc 80.859 (84.323)	lr 0.00613
Train [81][1440/3239]	Time 0.233 (0.862)	Data Time 0.001 (0.346)	Loss 2.5257 (2.4732)	Entropy 0.58549 (0.58619)	Top-1 acc 62.500 (64.332)	Top-5 acc 85.156 (84.324)	lr 0.00612
Train [81][1450/3239]	Time 0.286 (0.859)	Data Time 0.001 (0.343)	Loss 2.4069 (2.4728)	Entropy 0.58538 (0.58618)	Top-1 acc 66.797 (64.340)	Top-5 acc 84.766 (84.335)	lr 0.00612
Train [81][1460/3239]	Time 0.311 (0.899)	Data Time 0.004 (0.345)	Loss 2.3551 (2.4725)	Entropy 0.58500 (0.58618)	Top-1 acc 67.188 (64.348)	Top-5 acc 83.984 (84.340)	lr 0.00612
Train [81][1470/3239]	Time 0.253 (0.896)	Data Time 0.003 (0.342)	Loss 2.1848 (2.4722)	Entropy 0.58510 (0.58617)	Top-1 acc 71.875 (64.347)	Top-5 acc 88.281 (84.344)	lr 0.00612
Train [81][1480/3239]	Time 0.350 (0.893)	Data Time 0.003 (0.340)	Loss 2.4129 (2.4720)	Entropy 0.58496 (0.58616)	Top-1 acc 65.625 (64.350)	Top-5 acc 83.203 (84.346)	lr 0.00612
Train [81][1490/3239]	Time 0.239 (0.890)	Data Time 0.001 (0.338)	Loss 2.7860 (2.4723)	Entropy 0.58489 (0.58615)	Top-1 acc 56.250 (64.345)	Top-5 acc 78.516 (84.338)	lr 0.00612
Train [81][1500/3239]	Time 0.247 (0.886)	Data Time 0.002 (0.336)	Loss 2.6118 (2.4721)	Entropy 0.58479 (0.58614)	Top-1 acc 59.766 (64.348)	Top-5 acc 83.203 (84.348)	lr 0.00612
Train [81][1510/3239]	Time 0.243 (0.883)	Data Time 0.002 (0.333)	Loss 2.5858 (2.4721)	Entropy 0.58497 (0.58613)	Top-1 acc 62.109 (64.348)	Top-5 acc 82.031 (84.343)	lr 0.00612
Train [81][1520/3239]	Time 0.256 (0.880)	Data Time 0.002 (0.331)	Loss 2.5184 (2.4723)	Entropy 0.58486 (0.58613)	Top-1 acc 63.672 (64.340)	Top-5 acc 85.156 (84.346)	lr 0.00612
Train [81][1530/3239]	Time 0.269 (0.881)	Data Time 0.001 (0.333)	Loss 2.5459 (2.4724)	Entropy 0.58497 (0.58612)	Top-1 acc 62.109 (64.334)	Top-5 acc 82.422 (84.343)	lr 0.00612
Train [81][1540/3239]	Time 0.434 (0.880)	Data Time 0.178 (0.332)	Loss 2.5063 (2.4725)	Entropy 0.58508 (0.58611)	Top-1 acc 61.719 (64.331)	Top-5 acc 82.422 (84.342)	lr 0.00612
Train [81][1550/3239]	Time 0.235 (0.878)	Data Time 0.001 (0.330)	Loss 2.5992 (2.4727)	Entropy 0.58498 (0.58610)	Top-1 acc 60.938 (64.322)	Top-5 acc 83.984 (84.338)	lr 0.00611
Train [81][1560/3239]	Time 0.241 (0.886)	Data Time 0.001 (0.340)	Loss 2.4931 (2.4728)	Entropy 0.58504 (0.58610)	Top-1 acc 63.281 (64.319)	Top-5 acc 82.031 (84.330)	lr 0.00611
Train [81][1570/3239]	Time 0.361 (0.887)	Data Time 0.001 (0.341)	Loss 2.5175 (2.4728)	Entropy 0.58501 (0.58609)	Top-1 acc 65.625 (64.321)	Top-5 acc 80.469 (84.327)	lr 0.00611
Train [81][1580/3239]	Time 0.234 (0.885)	Data Time 0.001 (0.340)	Loss 2.5334 (2.4730)	Entropy 0.58522 (0.58608)	Top-1 acc 64.453 (64.315)	Top-5 acc 82.031 (84.320)	lr 0.00611
Train [81][1590/3239]	Time 0.241 (0.892)	Data Time 0.001 (0.348)	Loss 2.4343 (2.4731)	Entropy 0.58505 (0.58608)	Top-1 acc 66.797 (64.314)	Top-5 acc 83.984 (84.317)	lr 0.00611
Train [81][1600/3239]	Time 0.240 (0.892)	Data Time 0.001 (0.349)	Loss 2.5139 (2.4732)	Entropy 0.58533 (0.58607)	Top-1 acc 63.672 (64.316)	Top-5 acc 83.203 (84.315)	lr 0.00611
Train [81][1610/3239]	Time 0.243 (0.892)	Data Time 0.001 (0.350)	Loss 2.2854 (2.4730)	Entropy 0.58547 (0.58607)	Top-1 acc 67.578 (64.316)	Top-5 acc 91.016 (84.324)	lr 0.00611
Train [81][1620/3239]	Time 6.729 (0.894)	Data Time 6.479 (0.351)	Loss 2.6079 (2.4730)	Entropy 0.58545 (0.58606)	Top-1 acc 61.719 (64.319)	Top-5 acc 85.547 (84.329)	lr 0.00611
Train [81][1630/3239]	Time 0.240 (0.899)	Data Time 0.001 (0.357)	Loss 2.4536 (2.4735)	Entropy 0.58543 (0.58606)	Top-1 acc 66.406 (64.311)	Top-5 acc 85.156 (84.325)	lr 0.00611
Train [81][1640/3239]	Time 0.353 (0.898)	Data Time 0.001 (0.357)	Loss 2.4838 (2.4738)	Entropy 0.58563 (0.58606)	Top-1 acc 66.016 (64.306)	Top-5 acc 84.375 (84.318)	lr 0.00611
Train [81][1650/3239]	Time 0.220 (0.895)	Data Time 0.001 (0.355)	Loss 2.4496 (2.4734)	Entropy 0.58553 (0.58605)	Top-1 acc 62.500 (64.316)	Top-5 acc 87.500 (84.326)	lr 0.00611
Train [81][1660/3239]	Time 1.059 (0.903)	Data Time 0.779 (0.364)	Loss 2.4047 (2.4733)	Entropy 0.58529 (0.58605)	Top-1 acc 62.109 (64.313)	Top-5 acc 86.328 (84.326)	lr 0.00611
Train [81][1670/3239]	Time 0.230 (0.905)	Data Time 0.001 (0.366)	Loss 2.6240 (2.4733)	Entropy 0.58515 (0.58605)	Top-1 acc 57.812 (64.309)	Top-5 acc 79.297 (84.325)	lr 0.00610
Train [81][1680/3239]	Time 0.240 (0.902)	Data Time 0.001 (0.364)	Loss 2.5381 (2.4730)	Entropy 0.58485 (0.58604)	Top-1 acc 59.766 (64.311)	Top-5 acc 82.031 (84.329)	lr 0.00610
Train [81][1690/3239]	Time 0.269 (0.909)	Data Time 0.001 (0.372)	Loss 2.5471 (2.4734)	Entropy 0.58503 (0.58603)	Top-1 acc 63.281 (64.303)	Top-5 acc 83.984 (84.321)	lr 0.00610
Train [81][1700/3239]	Time 0.236 (0.910)	Data Time 0.001 (0.374)	Loss 2.4192 (2.4734)	Entropy 0.58512 (0.58603)	Top-1 acc 66.016 (64.296)	Top-5 acc 85.938 (84.323)	lr 0.00610
Train [81][1710/3239]	Time 0.245 (0.908)	Data Time 0.001 (0.371)	Loss 2.4154 (2.4731)	Entropy 0.58510 (0.58602)	Top-1 acc 66.016 (64.304)	Top-5 acc 84.766 (84.328)	lr 0.00610
Train [81][1720/3239]	Time 0.268 (0.914)	Data Time 0.001 (0.379)	Loss 2.4486 (2.4732)	Entropy 0.58538 (0.58602)	Top-1 acc 64.844 (64.302)	Top-5 acc 82.031 (84.324)	lr 0.00610
Train [81][1730/3239]	Time 0.336 (0.913)	Data Time 0.001 (0.378)	Loss 2.5696 (2.4732)	Entropy 0.58513 (0.58601)	Top-1 acc 61.328 (64.303)	Top-5 acc 80.469 (84.321)	lr 0.00610
Train [81][1740/3239]	Time 0.245 (0.913)	Data Time 0.001 (0.378)	Loss 2.5142 (2.4734)	Entropy 0.58526 (0.58601)	Top-1 acc 62.891 (64.299)	Top-5 acc 82.812 (84.318)	lr 0.00610
Train [81][1750/3239]	Time 0.241 (0.919)	Data Time 0.001 (0.385)	Loss 2.5409 (2.4733)	Entropy 0.58530 (0.58600)	Top-1 acc 60.156 (64.299)	Top-5 acc 83.203 (84.323)	lr 0.00610
Train [81][1760/3239]	Time 0.237 (0.920)	Data Time 0.001 (0.387)	Loss 2.3522 (2.4733)	Entropy 0.58544 (0.58600)	Top-1 acc 67.969 (64.299)	Top-5 acc 85.156 (84.325)	lr 0.00610
Train [81][1770/3239]	Time 0.247 (0.919)	Data Time 0.001 (0.386)	Loss 2.6382 (2.4735)	Entropy 0.58560 (0.58600)	Top-1 acc 62.500 (64.291)	Top-5 acc 82.031 (84.326)	lr 0.00610
Train [81][1780/3239]	Time 4.256 (0.919)	Data Time 4.008 (0.387)	Loss 2.6049 (2.4734)	Entropy 0.58583 (0.58599)	Top-1 acc 60.156 (64.287)	Top-5 acc 80.078 (84.324)	lr 0.00609
Train [81][1790/3239]	Time 0.255 (0.925)	Data Time 0.001 (0.393)	Loss 2.6124 (2.4735)	Entropy 0.58563 (0.58599)	Top-1 acc 62.891 (64.285)	Top-5 acc 80.859 (84.319)	lr 0.00609
Train [81][1800/3239]	Time 0.333 (0.926)	Data Time 0.001 (0.395)	Loss 2.3810 (2.4735)	Entropy 0.58574 (0.58599)	Top-1 acc 62.891 (64.281)	Top-5 acc 88.281 (84.321)	lr 0.00609
Train [81][1810/3239]	Time 1.892 (0.924)	Data Time 1.649 (0.394)	Loss 2.3828 (2.4735)	Entropy 0.58582 (0.58599)	Top-1 acc 66.406 (64.281)	Top-5 acc 84.766 (84.322)	lr 0.00609
Train [81][1820/3239]	Time 0.255 (0.931)	Data Time 0.001 (0.402)	Loss 2.3743 (2.4730)	Entropy 0.58552 (0.58599)	Top-1 acc 67.188 (64.287)	Top-5 acc 84.766 (84.329)	lr 0.00609
Train [81][1830/3239]	Time 0.239 (0.935)	Data Time 0.001 (0.406)	Loss 2.3392 (2.4730)	Entropy 0.58547 (0.58598)	Top-1 acc 64.844 (64.285)	Top-5 acc 90.234 (84.330)	lr 0.00609
Train [81][1840/3239]	Time 0.280 (0.932)	Data Time 0.003 (0.404)	Loss 2.4842 (2.4731)	Entropy 0.58542 (0.58598)	Top-1 acc 62.500 (64.287)	Top-5 acc 86.328 (84.328)	lr 0.00609
Train [81][1850/3239]	Time 0.256 (0.937)	Data Time 0.001 (0.409)	Loss 2.4179 (2.4733)	Entropy 0.58554 (0.58598)	Top-1 acc 66.016 (64.284)	Top-5 acc 85.938 (84.328)	lr 0.00609
Train [81][1860/3239]	Time 0.227 (0.941)	Data Time 0.001 (0.414)	Loss 2.3927 (2.4732)	Entropy 0.58563 (0.58598)	Top-1 acc 67.969 (64.288)	Top-5 acc 83.594 (84.328)	lr 0.00609
Train [81][1870/3239]	Time 0.232 (0.939)	Data Time 0.001 (0.412)	Loss 2.5839 (2.4731)	Entropy 0.58557 (0.58597)	Top-1 acc 61.328 (64.294)	Top-5 acc 81.641 (84.328)	lr 0.00609
Train [81][1880/3239]	Time 0.243 (0.944)	Data Time 0.001 (0.417)	Loss 2.3921 (2.4733)	Entropy 0.58558 (0.58597)	Top-1 acc 64.453 (64.291)	Top-5 acc 85.547 (84.326)	lr 0.00609
Train [81][1890/3239]	Time 0.240 (0.941)	Data Time 0.001 (0.415)	Loss 2.5693 (2.4735)	Entropy 0.58531 (0.58597)	Top-1 acc 61.719 (64.284)	Top-5 acc 80.469 (84.321)	lr 0.00609
Train [81][1900/3239]	Time 0.228 (0.945)	Data Time 0.001 (0.420)	Loss 2.3537 (2.4737)	Entropy 0.58520 (0.58597)	Top-1 acc 67.188 (64.275)	Top-5 acc 87.500 (84.319)	lr 0.00608
Train [81][1910/3239]	Time 0.233 (0.943)	Data Time 0.001 (0.419)	Loss 2.3485 (2.4739)	Entropy 0.58529 (0.58596)	Top-1 acc 67.969 (64.271)	Top-5 acc 85.938 (84.315)	lr 0.00608
Train [81][1920/3239]	Time 0.232 (0.945)	Data Time 0.001 (0.421)	Loss 2.3324 (2.4739)	Entropy 0.58532 (0.58596)	Top-1 acc 68.359 (64.268)	Top-5 acc 89.453 (84.316)	lr 0.00608
Train [81][1930/3239]	Time 0.251 (0.950)	Data Time 0.001 (0.426)	Loss 2.5763 (2.4738)	Entropy 0.58538 (0.58596)	Top-1 acc 61.719 (64.269)	Top-5 acc 82.422 (84.316)	lr 0.00608
Train [81][1940/3239]	Time 0.239 (0.947)	Data Time 0.001 (0.424)	Loss 2.5311 (2.4741)	Entropy 0.58554 (0.58595)	Top-1 acc 63.672 (64.268)	Top-5 acc 84.375 (84.310)	lr 0.00608
Train [81][1950/3239]	Time 0.255 (0.950)	Data Time 0.002 (0.427)	Loss 2.4703 (2.4741)	Entropy 0.58550 (0.58595)	Top-1 acc 64.453 (64.268)	Top-5 acc 84.766 (84.309)	lr 0.00608
Train [81][1960/3239]	Time 0.352 (0.957)	Data Time 0.001 (0.435)	Loss 2.3751 (2.4741)	Entropy 0.58560 (0.58595)	Top-1 acc 65.625 (64.264)	Top-5 acc 85.156 (84.310)	lr 0.00608
Train [81][1970/3239]	Time 0.252 (0.955)	Data Time 0.001 (0.433)	Loss 2.7162 (2.4742)	Entropy 0.58576 (0.58595)	Top-1 acc 58.984 (64.258)	Top-5 acc 80.078 (84.303)	lr 0.00608
Train [81][1980/3239]	Time 0.237 (0.958)	Data Time 0.001 (0.436)	Loss 2.5374 (2.4744)	Entropy 0.58596 (0.58595)	Top-1 acc 61.719 (64.253)	Top-5 acc 83.203 (84.303)	lr 0.00608
Train [81][1990/3239]	Time 0.231 (0.965)	Data Time 0.001 (0.444)	Loss 2.6530 (2.4747)	Entropy 0.58632 (0.58595)	Top-1 acc 64.453 (64.249)	Top-5 acc 81.250 (84.300)	lr 0.00608
Train [81][2000/3239]	Time 0.236 (0.962)	Data Time 0.001 (0.441)	Loss 2.4649 (2.4747)	Entropy 0.58638 (0.58595)	Top-1 acc 63.281 (64.252)	Top-5 acc 85.938 (84.298)	lr 0.00608
Train [81][2010/3239]	Time 0.260 (0.965)	Data Time 0.001 (0.445)	Loss 2.2910 (2.4750)	Entropy 0.58606 (0.58595)	Top-1 acc 67.188 (64.246)	Top-5 acc 87.891 (84.295)	lr 0.00608
Train [81][2020/3239]	Time 0.268 (0.974)	Data Time 0.003 (0.455)	Loss 2.4796 (2.4755)	Entropy 0.58622 (0.58595)	Top-1 acc 63.281 (64.234)	Top-5 acc 83.984 (84.288)	lr 0.00607
Train [81][2030/3239]	Time 0.351 (0.971)	Data Time 0.001 (0.452)	Loss 2.3846 (2.4754)	Entropy 0.58627 (0.58595)	Top-1 acc 66.406 (64.236)	Top-5 acc 87.891 (84.292)	lr 0.00607
Train [81][2040/3239]	Time 0.238 (0.970)	Data Time 0.001 (0.452)	Loss 2.6278 (2.4755)	Entropy 0.58647 (0.58596)	Top-1 acc 58.594 (64.231)	Top-5 acc 83.984 (84.290)	lr 0.00607
Train [81][2050/3239]	Time 0.242 (0.971)	Data Time 0.001 (0.454)	Loss 2.4712 (2.4757)	Entropy 0.58639 (0.58596)	Top-1 acc 66.797 (64.225)	Top-5 acc 83.594 (84.288)	lr 0.00607
Train [81][2060/3239]	Time 0.267 (0.977)	Data Time 0.001 (0.460)	Loss 2.3352 (2.4759)	Entropy 0.58645 (0.58596)	Top-1 acc 67.188 (64.223)	Top-5 acc 85.938 (84.282)	lr 0.00607
Train [81][2070/3239]	Time 0.288 (0.974)	Data Time 0.001 (0.457)	Loss 2.2973 (2.4759)	Entropy 0.58670 (0.58596)	Top-1 acc 71.484 (64.222)	Top-5 acc 87.500 (84.278)	lr 0.00607
Train [81][2080/3239]	Time 0.248 (0.975)	Data Time 0.001 (0.459)	Loss 2.4618 (2.4758)	Entropy 0.58640 (0.58597)	Top-1 acc 60.156 (64.221)	Top-5 acc 87.891 (84.279)	lr 0.00607
Train [81][2090/3239]	Time 0.247 (0.980)	Data Time 0.001 (0.464)	Loss 2.4186 (2.4758)	Entropy 0.58644 (0.58597)	Top-1 acc 64.844 (64.225)	Top-5 acc 85.938 (84.280)	lr 0.00607
Train [81][2100/3239]	Time 0.245 (0.978)	Data Time 0.002 (0.462)	Loss 2.4605 (2.4760)	Entropy 0.58628 (0.58597)	Top-1 acc 62.500 (64.215)	Top-5 acc 83.594 (84.276)	lr 0.00607
Train [81][2110/3239]	Time 0.237 (0.980)	Data Time 0.002 (0.465)	Loss 2.4552 (2.4756)	Entropy 0.58625 (0.58597)	Top-1 acc 65.625 (64.224)	Top-5 acc 83.984 (84.282)	lr 0.00607
Train [81][2120/3239]	Time 0.343 (1.006)	Data Time 0.002 (0.464)	Loss 2.4086 (2.4754)	Entropy 0.58630 (0.58597)	Top-1 acc 65.234 (64.232)	Top-5 acc 85.547 (84.286)	lr 0.00607
Train [81][2130/3239]	Time 0.251 (1.003)	Data Time 0.001 (0.462)	Loss 2.3532 (2.4755)	Entropy 0.58628 (0.58597)	Top-1 acc 66.797 (64.232)	Top-5 acc 87.109 (84.284)	lr 0.00606
Train [81][2140/3239]	Time 0.243 (1.001)	Data Time 0.002 (0.459)	Loss 2.2178 (2.4754)	Entropy 0.58591 (0.58598)	Top-1 acc 72.656 (64.235)	Top-5 acc 88.281 (84.283)	lr 0.00606
Train [81][2150/3239]	Time 0.241 (0.998)	Data Time 0.001 (0.457)	Loss 2.7789 (2.4755)	Entropy 0.58576 (0.58597)	Top-1 acc 55.859 (64.233)	Top-5 acc 75.000 (84.280)	lr 0.00606
Train [81][2160/3239]	Time 0.227 (0.995)	Data Time 0.002 (0.455)	Loss 2.6249 (2.4758)	Entropy 0.58587 (0.58597)	Top-1 acc 62.109 (64.227)	Top-5 acc 78.125 (84.274)	lr 0.00606
Train [81][2170/3239]	Time 0.242 (0.993)	Data Time 0.002 (0.453)	Loss 2.5893 (2.4757)	Entropy 0.58562 (0.58597)	Top-1 acc 64.844 (64.231)	Top-5 acc 80.859 (84.272)	lr 0.00606
Train [81][2180/3239]	Time 0.231 (0.994)	Data Time 0.001 (0.455)	Loss 2.4707 (2.4756)	Entropy 0.58594 (0.58597)	Top-1 acc 62.109 (64.230)	Top-5 acc 82.812 (84.272)	lr 0.00606
Train [81][2190/3239]	Time 0.409 (0.993)	Data Time 0.001 (0.455)	Loss 2.4261 (2.4757)	Entropy 0.58610 (0.58597)	Top-1 acc 62.500 (64.227)	Top-5 acc 87.500 (84.265)	lr 0.00606
Train [81][2200/3239]	Time 0.285 (0.991)	Data Time 0.002 (0.453)	Loss 2.1651 (2.4756)	Entropy 0.58589 (0.58597)	Top-1 acc 73.438 (64.228)	Top-5 acc 89.453 (84.270)	lr 0.00606
Train [81][2210/3239]	Time 0.237 (0.989)	Data Time 0.001 (0.451)	Loss 2.5881 (2.4757)	Entropy 0.58610 (0.58597)	Top-1 acc 62.891 (64.225)	Top-5 acc 84.375 (84.268)	lr 0.00606
Train [81][2220/3239]	Time 0.248 (0.997)	Data Time 0.001 (0.459)	Loss 2.4438 (2.4755)	Entropy 0.58603 (0.58597)	Top-1 acc 63.281 (64.227)	Top-5 acc 85.547 (84.272)	lr 0.00606
Train [81][2230/3239]	Time 0.247 (0.994)	Data Time 0.001 (0.457)	Loss 2.5507 (2.4754)	Entropy 0.58592 (0.58597)	Top-1 acc 60.547 (64.227)	Top-5 acc 82.812 (84.271)	lr 0.00606
Train [81][2240/3239]	Time 0.250 (0.993)	Data Time 0.001 (0.456)	Loss 2.6212 (2.4757)	Entropy 0.58606 (0.58597)	Top-1 acc 64.844 (64.221)	Top-5 acc 79.297 (84.262)	lr 0.00606
Train [81][2250/3239]	Time 0.259 (0.998)	Data Time 0.001 (0.462)	Loss 2.4519 (2.4756)	Entropy 0.58608 (0.58597)	Top-1 acc 66.016 (64.222)	Top-5 acc 83.594 (84.262)	lr 0.00605
Train [81][2260/3239]	Time 0.269 (0.997)	Data Time 0.001 (0.461)	Loss 2.3841 (2.4758)	Entropy 0.58621 (0.58597)	Top-1 acc 67.969 (64.221)	Top-5 acc 86.328 (84.258)	lr 0.00605
Train [81][2270/3239]	Time 0.241 (0.995)	Data Time 0.001 (0.460)	Loss 2.4717 (2.4761)	Entropy 0.58604 (0.58598)	Top-1 acc 65.625 (64.219)	Top-5 acc 82.812 (84.253)	lr 0.00605
Train [81][2280/3239]	Time 0.330 (1.001)	Data Time 0.001 (0.466)	Loss 2.4706 (2.4762)	Entropy 0.58618 (0.58598)	Top-1 acc 67.188 (64.218)	Top-5 acc 83.984 (84.252)	lr 0.00605
Train [81][2290/3239]	Time 0.236 (1.000)	Data Time 0.001 (0.466)	Loss 2.5999 (2.4763)	Entropy 0.58615 (0.58598)	Top-1 acc 59.766 (64.213)	Top-5 acc 80.859 (84.252)	lr 0.00605
Train [81][2300/3239]	Time 0.253 (0.998)	Data Time 0.001 (0.464)	Loss 2.7223 (2.4762)	Entropy 0.58598 (0.58598)	Top-1 acc 58.984 (64.215)	Top-5 acc 80.469 (84.255)	lr 0.00605
Train [81][2310/3239]	Time 3.382 (1.004)	Data Time 3.120 (0.471)	Loss 2.5024 (2.4761)	Entropy 0.58577 (0.58598)	Top-1 acc 63.281 (64.223)	Top-5 acc 82.422 (84.253)	lr 0.00605
Train [81][2320/3239]	Time 0.289 (1.004)	Data Time 0.002 (0.470)	Loss 2.4359 (2.4760)	Entropy 0.58587 (0.58598)	Top-1 acc 64.453 (64.228)	Top-5 acc 85.938 (84.256)	lr 0.00605
Train [81][2330/3239]	Time 0.261 (1.001)	Data Time 0.002 (0.468)	Loss 2.4637 (2.4762)	Entropy 0.58566 (0.58597)	Top-1 acc 64.453 (64.224)	Top-5 acc 83.594 (84.250)	lr 0.00605
Train [81][2340/3239]	Time 10.873 (1.006)	Data Time 10.638 (0.473)	Loss 2.3575 (2.4761)	Entropy 0.58557 (0.58597)	Top-1 acc 68.750 (64.226)	Top-5 acc 85.938 (84.251)	lr 0.00605
Train [81][2350/3239]	Time 0.397 (1.006)	Data Time 0.001 (0.474)	Loss 2.5505 (2.4766)	Entropy 0.58565 (0.58597)	Top-1 acc 62.500 (64.216)	Top-5 acc 85.156 (84.246)	lr 0.00605
Train [81][2360/3239]	Time 0.253 (1.004)	Data Time 0.001 (0.472)	Loss 2.5097 (2.4763)	Entropy 0.58540 (0.58597)	Top-1 acc 62.891 (64.224)	Top-5 acc 82.812 (84.249)	lr 0.00604
Train [81][2370/3239]	Time 0.234 (1.001)	Data Time 0.001 (0.470)	Loss 2.1938 (2.4762)	Entropy 0.58555 (0.58597)	Top-1 acc 72.656 (64.229)	Top-5 acc 88.672 (84.250)	lr 0.00604
Train [81][2380/3239]	Time 0.260 (1.009)	Data Time 0.001 (0.477)	Loss 2.2555 (2.4761)	Entropy 0.58583 (0.58597)	Top-1 acc 69.141 (64.230)	Top-5 acc 88.672 (84.253)	lr 0.00604
Train [81][2390/3239]	Time 0.230 (1.007)	Data Time 0.001 (0.476)	Loss 2.7490 (2.4761)	Entropy 0.58580 (0.58597)	Top-1 acc 58.203 (64.227)	Top-5 acc 80.859 (84.255)	lr 0.00604
Train [81][2400/3239]	Time 0.248 (1.004)	Data Time 0.002 (0.474)	Loss 2.4579 (2.4762)	Entropy 0.58578 (0.58596)	Top-1 acc 65.625 (64.224)	Top-5 acc 84.766 (84.253)	lr 0.00604
Train [81][2410/3239]	Time 0.221 (1.011)	Data Time 0.001 (0.481)	Loss 2.5496 (2.4763)	Entropy 0.58574 (0.58596)	Top-1 acc 61.719 (64.224)	Top-5 acc 83.984 (84.252)	lr 0.00604
Train [81][2420/3239]	Time 0.242 (1.009)	Data Time 0.001 (0.480)	Loss 2.5701 (2.4767)	Entropy 0.58561 (0.58596)	Top-1 acc 62.500 (64.216)	Top-5 acc 81.250 (84.245)	lr 0.00604
Train [81][2430/3239]	Time 0.232 (1.007)	Data Time 0.001 (0.478)	Loss 2.3036 (2.4764)	Entropy 0.58594 (0.58596)	Top-1 acc 65.234 (64.218)	Top-5 acc 87.109 (84.251)	lr 0.00604
Train [81][2440/3239]	Time 0.318 (1.015)	Data Time 0.001 (0.486)	Loss 2.5306 (2.4765)	Entropy 0.58589 (0.58596)	Top-1 acc 64.062 (64.215)	Top-5 acc 84.375 (84.252)	lr 0.00604
Train [81][2450/3239]	Time 0.228 (1.012)	Data Time 0.001 (0.484)	Loss 2.4939 (2.4764)	Entropy 0.58579 (0.58596)	Top-1 acc 65.625 (64.217)	Top-5 acc 81.641 (84.254)	lr 0.00604
Train [81][2460/3239]	Time 0.252 (1.010)	Data Time 0.001 (0.482)	Loss 2.3085 (2.4762)	Entropy 0.58602 (0.58596)	Top-1 acc 69.531 (64.222)	Top-5 acc 85.938 (84.256)	lr 0.00604
Train [81][2470/3239]	Time 0.238 (1.016)	Data Time 0.001 (0.489)	Loss 2.2630 (2.4762)	Entropy 0.58609 (0.58596)	Top-1 acc 66.797 (64.220)	Top-5 acc 87.891 (84.256)	lr 0.00604
Train [81][2480/3239]	Time 0.268 (1.015)	Data Time 0.002 (0.488)	Loss 2.3101 (2.4763)	Entropy 0.58619 (0.58596)	Top-1 acc 67.188 (64.217)	Top-5 acc 89.062 (84.254)	lr 0.00603
Train [81][2490/3239]	Time 0.246 (1.013)	Data Time 0.001 (0.486)	Loss 2.4805 (2.4763)	Entropy 0.58652 (0.58596)	Top-1 acc 62.891 (64.216)	Top-5 acc 80.859 (84.250)	lr 0.00603
Train [81][2500/3239]	Time 5.179 (1.015)	Data Time 4.929 (0.489)	Loss 2.7061 (2.4763)	Entropy 0.58669 (0.58597)	Top-1 acc 57.812 (64.217)	Top-5 acc 79.688 (84.250)	lr 0.00603
Train [81][2510/3239]	Time 0.434 (1.018)	Data Time 0.001 (0.492)	Loss 2.5509 (2.4762)	Entropy 0.58676 (0.58597)	Top-1 acc 60.156 (64.216)	Top-5 acc 83.203 (84.252)	lr 0.00603
Train [81][2520/3239]	Time 0.236 (1.015)	Data Time 0.001 (0.490)	Loss 2.6606 (2.4761)	Entropy 0.58680 (0.58597)	Top-1 acc 57.812 (64.218)	Top-5 acc 79.688 (84.249)	lr 0.00603
Train [81][2530/3239]	Time 0.241 (1.013)	Data Time 0.001 (0.488)	Loss 2.4273 (2.4762)	Entropy 0.58675 (0.58598)	Top-1 acc 63.281 (64.216)	Top-5 acc 84.375 (84.248)	lr 0.00603
Train [81][2540/3239]	Time 0.243 (1.021)	Data Time 0.001 (0.496)	Loss 2.5136 (2.4763)	Entropy 0.58679 (0.58598)	Top-1 acc 63.672 (64.212)	Top-5 acc 81.641 (84.245)	lr 0.00603
Train [81][2550/3239]	Time 0.240 (1.018)	Data Time 0.001 (0.494)	Loss 2.4320 (2.4764)	Entropy 0.58694 (0.58598)	Top-1 acc 65.625 (64.208)	Top-5 acc 85.547 (84.245)	lr 0.00603
Train [81][2560/3239]	Time 0.241 (1.016)	Data Time 0.001 (0.492)	Loss 2.7784 (2.4764)	Entropy 0.58727 (0.58599)	Top-1 acc 59.766 (64.210)	Top-5 acc 78.125 (84.243)	lr 0.00603
Train [81][2570/3239]	Time 3.525 (1.022)	Data Time 3.273 (0.499)	Loss 2.7009 (2.4767)	Entropy 0.58755 (0.58599)	Top-1 acc 57.422 (64.200)	Top-5 acc 78.906 (84.241)	lr 0.00603
Train [81][2580/3239]	Time 3.765 (1.021)	Data Time 3.414 (0.498)	Loss 2.4757 (2.4768)	Entropy 0.58739 (0.58600)	Top-1 acc 62.109 (64.195)	Top-5 acc 84.375 (84.240)	lr 0.00603
Train [81][2590/3239]	Time 0.251 (1.019)	Data Time 0.001 (0.496)	Loss 2.3703 (2.4766)	Entropy 0.58763 (0.58600)	Top-1 acc 64.453 (64.196)	Top-5 acc 86.328 (84.240)	lr 0.00602
Train [81][2600/3239]	Time 0.255 (1.025)	Data Time 0.001 (0.502)	Loss 2.5690 (2.4769)	Entropy 0.58770 (0.58601)	Top-1 acc 59.766 (64.185)	Top-5 acc 83.594 (84.234)	lr 0.00602
Train [81][2610/3239]	Time 0.244 (1.022)	Data Time 0.001 (0.500)	Loss 2.4155 (2.4770)	Entropy 0.58756 (0.58602)	Top-1 acc 67.188 (64.186)	Top-5 acc 85.547 (84.233)	lr 0.00602
Train [81][2620/3239]	Time 0.236 (1.020)	Data Time 0.002 (0.499)	Loss 2.3089 (2.4768)	Entropy 0.58748 (0.58602)	Top-1 acc 66.016 (64.187)	Top-5 acc 88.281 (84.235)	lr 0.00602
Train [81][2630/3239]	Time 0.220 (1.023)	Data Time 0.001 (0.502)	Loss 2.6562 (2.4770)	Entropy 0.58754 (0.58603)	Top-1 acc 59.375 (64.182)	Top-5 acc 82.812 (84.231)	lr 0.00602
Train [81][2640/3239]	Time 0.238 (1.021)	Data Time 0.001 (0.500)	Loss 2.4131 (2.4771)	Entropy 0.58764 (0.58603)	Top-1 acc 65.625 (64.179)	Top-5 acc 84.375 (84.229)	lr 0.00602
Train [81][2650/3239]	Time 0.251 (1.019)	Data Time 0.002 (0.498)	Loss 2.7085 (2.4772)	Entropy 0.58780 (0.58604)	Top-1 acc 58.594 (64.179)	Top-5 acc 79.297 (84.226)	lr 0.00602
Train [81][2660/3239]	Time 0.249 (1.017)	Data Time 0.001 (0.497)	Loss 2.4105 (2.4771)	Entropy 0.58794 (0.58605)	Top-1 acc 68.750 (64.186)	Top-5 acc 85.938 (84.224)	lr 0.00602
Train [81][2670/3239]	Time 0.371 (1.019)	Data Time 0.002 (0.499)	Loss 2.5905 (2.4771)	Entropy 0.58832 (0.58606)	Top-1 acc 62.891 (64.187)	Top-5 acc 82.422 (84.223)	lr 0.00602
Train [81][2680/3239]	Time 0.233 (1.018)	Data Time 0.001 (0.498)	Loss 2.7834 (2.4772)	Entropy 0.58851 (0.58606)	Top-1 acc 59.375 (64.184)	Top-5 acc 78.125 (84.219)	lr 0.00602
Train [81][2690/3239]	Time 0.246 (1.015)	Data Time 0.001 (0.496)	Loss 2.4909 (2.4773)	Entropy 0.58847 (0.58607)	Top-1 acc 65.234 (64.184)	Top-5 acc 85.547 (84.220)	lr 0.00602
Train [81][2700/3239]	Time 0.240 (1.023)	Data Time 0.001 (0.504)	Loss 2.6642 (2.4774)	Entropy 0.58860 (0.58608)	Top-1 acc 61.328 (64.185)	Top-5 acc 82.031 (84.218)	lr 0.00602
Train [81][2710/3239]	Time 0.242 (1.021)	Data Time 0.001 (0.502)	Loss 2.5324 (2.4774)	Entropy 0.58880 (0.58609)	Top-1 acc 60.938 (64.182)	Top-5 acc 83.594 (84.216)	lr 0.00601
Train [81][2720/3239]	Time 0.243 (1.018)	Data Time 0.001 (0.501)	Loss 2.5512 (2.4775)	Entropy 0.58899 (0.58610)	Top-1 acc 62.500 (64.179)	Top-5 acc 82.812 (84.213)	lr 0.00601
Train [81][2730/3239]	Time 0.246 (1.025)	Data Time 0.001 (0.508)	Loss 2.4399 (2.4774)	Entropy 0.58919 (0.58611)	Top-1 acc 62.891 (64.183)	Top-5 acc 82.812 (84.213)	lr 0.00601
Train [81][2740/3239]	Time 0.361 (1.023)	Data Time 0.001 (0.506)	Loss 2.6190 (2.4776)	Entropy 0.58911 (0.58612)	Top-1 acc 59.766 (64.177)	Top-5 acc 83.594 (84.214)	lr 0.00601
Train [81][2750/3239]	Time 0.226 (1.021)	Data Time 0.001 (0.504)	Loss 2.4824 (2.4775)	Entropy 0.58917 (0.58613)	Top-1 acc 62.109 (64.179)	Top-5 acc 84.375 (84.214)	lr 0.00601
Train [81][2760/3239]	Time 0.248 (1.027)	Data Time 0.001 (0.510)	Loss 2.4056 (2.4776)	Entropy 0.58912 (0.58615)	Top-1 acc 64.062 (64.174)	Top-5 acc 85.547 (84.209)	lr 0.00601
Train [81][2770/3239]	Time 0.373 (1.044)	Data Time 0.042 (0.508)	Loss 2.4216 (2.4776)	Entropy 0.58934 (0.58616)	Top-1 acc 63.672 (64.173)	Top-5 acc 87.109 (84.211)	lr 0.00601
Train [81][2780/3239]	Time 0.239 (1.042)	Data Time 0.002 (0.507)	Loss 2.4146 (2.4776)	Entropy 0.58945 (0.58617)	Top-1 acc 66.016 (64.175)	Top-5 acc 84.766 (84.210)	lr 0.00601
Train [81][2790/3239]	Time 0.246 (1.040)	Data Time 0.002 (0.505)	Loss 2.2933 (2.4774)	Entropy 0.58972 (0.58618)	Top-1 acc 67.188 (64.177)	Top-5 acc 86.719 (84.213)	lr 0.00601
Train [81][2800/3239]	Time 0.264 (1.038)	Data Time 0.002 (0.503)	Loss 2.5403 (2.4775)	Entropy 0.58935 (0.58619)	Top-1 acc 62.500 (64.174)	Top-5 acc 83.984 (84.214)	lr 0.00601
Train [81][2810/3239]	Time 0.273 (1.036)	Data Time 0.002 (0.501)	Loss 2.4829 (2.4776)	Entropy 0.58955 (0.58621)	Top-1 acc 62.891 (64.174)	Top-5 acc 83.594 (84.214)	lr 0.00601
Train [81][2820/3239]	Time 0.237 (1.034)	Data Time 0.001 (0.499)	Loss 2.7334 (2.4777)	Entropy 0.58987 (0.58622)	Top-1 acc 55.859 (64.174)	Top-5 acc 81.250 (84.211)	lr 0.00600
Train [81][2830/3239]	Time 0.337 (1.031)	Data Time 0.001 (0.498)	Loss 2.6321 (2.4779)	Entropy 0.59004 (0.58623)	Top-1 acc 59.375 (64.166)	Top-5 acc 82.422 (84.208)	lr 0.00600
Train [81][2840/3239]	Time 0.239 (1.029)	Data Time 0.002 (0.496)	Loss 2.5135 (2.4781)	Entropy 0.58995 (0.58624)	Top-1 acc 61.719 (64.158)	Top-5 acc 85.156 (84.203)	lr 0.00600
Train [81][2850/3239]	Time 0.233 (1.027)	Data Time 0.001 (0.494)	Loss 2.4450 (2.4781)	Entropy 0.58995 (0.58626)	Top-1 acc 64.844 (64.156)	Top-5 acc 83.203 (84.202)	lr 0.00600
Train [81][2860/3239]	Time 0.257 (1.026)	Data Time 0.001 (0.494)	Loss 2.5605 (2.4783)	Entropy 0.58993 (0.58627)	Top-1 acc 62.891 (64.150)	Top-5 acc 82.812 (84.197)	lr 0.00600
Train [81][2870/3239]	Time 0.234 (1.025)	Data Time 0.001 (0.493)	Loss 2.4959 (2.4783)	Entropy 0.59009 (0.58628)	Top-1 acc 64.844 (64.149)	Top-5 acc 82.422 (84.198)	lr 0.00600
Train [81][2880/3239]	Time 2.830 (1.027)	Data Time 2.587 (0.495)	Loss 2.4804 (2.4785)	Entropy 0.59021 (0.58630)	Top-1 acc 63.672 (64.146)	Top-5 acc 83.203 (84.192)	lr 0.00600
Train [81][2890/3239]	Time 0.228 (1.027)	Data Time 0.001 (0.495)	Loss 2.6767 (2.4785)	Entropy 0.59035 (0.58631)	Top-1 acc 62.891 (64.146)	Top-5 acc 79.297 (84.192)	lr 0.00600
Train [81][2900/3239]	Time 0.329 (1.027)	Data Time 0.001 (0.495)	Loss 2.6887 (2.4788)	Entropy 0.58998 (0.58632)	Top-1 acc 58.203 (64.136)	Top-5 acc 79.688 (84.188)	lr 0.00600
Train [81][2910/3239]	Time 0.235 (1.027)	Data Time 0.001 (0.496)	Loss 2.5814 (2.4789)	Entropy 0.59016 (0.58634)	Top-1 acc 58.594 (64.134)	Top-5 acc 82.812 (84.188)	lr 0.00600
Train [81][2920/3239]	Time 0.281 (1.028)	Data Time 0.003 (0.498)	Loss 2.6483 (2.4790)	Entropy 0.59050 (0.58635)	Top-1 acc 58.594 (64.133)	Top-5 acc 79.688 (84.188)	lr 0.00600
Train [81][2930/3239]	Time 0.250 (1.028)	Data Time 0.001 (0.497)	Loss 2.5400 (2.4791)	Entropy 0.59073 (0.58636)	Top-1 acc 62.500 (64.129)	Top-5 acc 82.812 (84.186)	lr 0.00600
Train [81][2940/3239]	Time 0.242 (1.029)	Data Time 0.001 (0.499)	Loss 2.5250 (2.4792)	Entropy 0.59039 (0.58638)	Top-1 acc 60.547 (64.127)	Top-5 acc 82.422 (84.182)	lr 0.00599
Train [81][2950/3239]	Time 0.255 (1.030)	Data Time 0.002 (0.500)	Loss 2.4382 (2.4794)	Entropy 0.59045 (0.58639)	Top-1 acc 65.625 (64.122)	Top-5 acc 84.766 (84.181)	lr 0.00599
Train [81][2960/3239]	Time 1.209 (1.029)	Data Time 0.972 (0.499)	Loss 2.5962 (2.4794)	Entropy 0.59035 (0.58640)	Top-1 acc 62.109 (64.120)	Top-5 acc 80.469 (84.181)	lr 0.00599
Train [81][2970/3239]	Time 2.733 (1.030)	Data Time 2.464 (0.501)	Loss 2.3849 (2.4795)	Entropy 0.59030 (0.58642)	Top-1 acc 65.234 (64.116)	Top-5 acc 85.547 (84.176)	lr 0.00599
Train [81][2980/3239]	Time 0.248 (1.030)	Data Time 0.001 (0.501)	Loss 2.4827 (2.4794)	Entropy 0.59001 (0.58643)	Top-1 acc 66.797 (64.121)	Top-5 acc 85.547 (84.177)	lr 0.00599
Train [81][2990/3239]	Time 0.359 (1.030)	Data Time 0.001 (0.502)	Loss 2.6857 (2.4798)	Entropy 0.58982 (0.58644)	Top-1 acc 58.203 (64.111)	Top-5 acc 79.297 (84.170)	lr 0.00599
Train [81][3000/3239]	Time 0.268 (1.030)	Data Time 0.001 (0.502)	Loss 2.2863 (2.4796)	Entropy 0.58970 (0.58645)	Top-1 acc 69.922 (64.114)	Top-5 acc 86.328 (84.172)	lr 0.00599
Train [81][3010/3239]	Time 0.245 (1.031)	Data Time 0.001 (0.503)	Loss 3.0217 (2.4797)	Entropy 0.58969 (0.58646)	Top-1 acc 48.047 (64.111)	Top-5 acc 75.391 (84.168)	lr 0.00599
Train [81][3020/3239]	Time 0.249 (1.030)	Data Time 0.001 (0.502)	Loss 2.4486 (2.4797)	Entropy 0.58970 (0.58648)	Top-1 acc 63.672 (64.111)	Top-5 acc 84.375 (84.169)	lr 0.00599
Train [81][3030/3239]	Time 0.274 (1.031)	Data Time 0.001 (0.504)	Loss 2.5713 (2.4797)	Entropy 0.58996 (0.58649)	Top-1 acc 65.234 (64.111)	Top-5 acc 81.641 (84.169)	lr 0.00599
Train [81][3040/3239]	Time 3.355 (1.032)	Data Time 3.105 (0.505)	Loss 2.4453 (2.4798)	Entropy 0.59005 (0.58650)	Top-1 acc 64.062 (64.108)	Top-5 acc 86.328 (84.168)	lr 0.00599
Train [81][3050/3239]	Time 0.232 (1.031)	Data Time 0.001 (0.505)	Loss 2.5120 (2.4796)	Entropy 0.59019 (0.58651)	Top-1 acc 66.406 (64.113)	Top-5 acc 82.422 (84.170)	lr 0.00599
Train [81][3060/3239]	Time 0.351 (1.032)	Data Time 0.001 (0.506)	Loss 2.5697 (2.4798)	Entropy 0.59028 (0.58652)	Top-1 acc 60.547 (64.108)	Top-5 acc 84.766 (84.164)	lr 0.00598
Train [81][3070/3239]	Time 1.045 (1.032)	Data Time 0.793 (0.506)	Loss 2.3818 (2.4799)	Entropy 0.59049 (0.58653)	Top-1 acc 67.578 (64.102)	Top-5 acc 85.156 (84.164)	lr 0.00598
Train [81][3080/3239]	Time 0.249 (1.034)	Data Time 0.001 (0.508)	Loss 2.5233 (2.4800)	Entropy 0.59064 (0.58655)	Top-1 acc 61.328 (64.099)	Top-5 acc 84.766 (84.161)	lr 0.00598
Train [81][3090/3239]	Time 0.256 (1.034)	Data Time 0.001 (0.509)	Loss 2.5180 (2.4799)	Entropy 0.59087 (0.58656)	Top-1 acc 64.062 (64.100)	Top-5 acc 83.984 (84.164)	lr 0.00598
Train [81][3100/3239]	Time 4.044 (1.035)	Data Time 3.711 (0.509)	Loss 2.3876 (2.4799)	Entropy 0.59104 (0.58658)	Top-1 acc 66.016 (64.099)	Top-5 acc 85.547 (84.162)	lr 0.00598
Train [81][3110/3239]	Time 0.243 (1.035)	Data Time 0.001 (0.511)	Loss 2.4237 (2.4799)	Entropy 0.59142 (0.58659)	Top-1 acc 65.234 (64.094)	Top-5 acc 84.766 (84.162)	lr 0.00598
Train [81][3120/3239]	Time 0.228 (1.037)	Data Time 0.001 (0.512)	Loss 2.3479 (2.4798)	Entropy 0.59156 (0.58661)	Top-1 acc 69.922 (64.096)	Top-5 acc 85.938 (84.162)	lr 0.00598
Train [81][3130/3239]	Time 4.219 (1.036)	Data Time 3.994 (0.512)	Loss 2.4341 (2.4797)	Entropy 0.59157 (0.58662)	Top-1 acc 66.797 (64.098)	Top-5 acc 84.375 (84.161)	lr 0.00598
Train [81][3140/3239]	Time 0.279 (1.037)	Data Time 0.001 (0.513)	Loss 2.4780 (2.4798)	Entropy 0.59167 (0.58664)	Top-1 acc 66.406 (64.099)	Top-5 acc 83.984 (84.159)	lr 0.00598
Train [81][3150/3239]	Time 0.313 (1.038)	Data Time 0.003 (0.514)	Loss 2.3125 (2.4794)	Entropy 0.59082 (0.58665)	Top-1 acc 70.703 (64.108)	Top-5 acc 88.281 (84.166)	lr 0.00598
Train [81][3160/3239]	Time 0.236 (1.036)	Data Time 0.001 (0.513)	Loss 2.5304 (2.4794)	Entropy 0.59077 (0.58667)	Top-1 acc 64.062 (64.110)	Top-5 acc 83.203 (84.165)	lr 0.00598
Train [81][3170/3239]	Time 0.231 (1.038)	Data Time 0.001 (0.515)	Loss 2.4633 (2.4792)	Entropy 0.59079 (0.58668)	Top-1 acc 61.719 (64.114)	Top-5 acc 85.547 (84.168)	lr 0.00597
Train [81][3180/3239]	Time 0.237 (1.036)	Data Time 0.000 (0.513)	Loss 2.6409 (2.4794)	Entropy 0.59097 (0.58669)	Top-1 acc 60.938 (64.109)	Top-5 acc 81.250 (84.164)	lr 0.00597
Train [81][3190/3239]	Time 0.238 (1.037)	Data Time 0.000 (0.515)	Loss 2.4195 (2.4795)	Entropy 0.59076 (0.58670)	Top-1 acc 63.281 (64.108)	Top-5 acc 86.328 (84.164)	lr 0.00597
Train [81][3200/3239]	Time 3.684 (1.040)	Data Time 3.383 (0.518)	Loss 2.4492 (2.4794)	Entropy 0.59068 (0.58672)	Top-1 acc 64.062 (64.113)	Top-5 acc 84.766 (84.165)	lr 0.00597
Train [81][3210/3239]	Time 0.236 (1.039)	Data Time 0.000 (0.517)	Loss 2.5648 (2.4792)	Entropy 0.59059 (0.58673)	Top-1 acc 61.328 (64.115)	Top-5 acc 82.422 (84.168)	lr 0.00597
Train [81][3220/3239]	Time 0.337 (1.039)	Data Time 0.000 (0.518)	Loss 2.4284 (2.4792)	Entropy 0.59083 (0.58674)	Top-1 acc 60.547 (64.111)	Top-5 acc 87.109 (84.165)	lr 0.00597
Train [81][3230/3239]	Time 0.261 (1.038)	Data Time 0.000 (0.517)	Loss 2.7345 (2.4794)	Entropy 0.59061 (0.58676)	Top-1 acc 59.766 (64.105)	Top-5 acc 80.078 (84.164)	lr 0.00597
Train [81][3239/3239]	Time 0.806 (1.037)	Data Time 0.000 (0.516)	Loss 2.6016 (2.4795)	Entropy 0.59061 (0.58677)	Top-1 acc 62.963 (64.104)	Top-5 acc 88.889 (84.164)	lr 0.00597
==========Valid [81/120]	loss 1.277	top-1 acc 70.617 (70.617)	top-5 acc 89.365	Train top-1 64.104	top-5 84.164	Entropy 0.59061	Latency-None: 0.000ms	Flops: 539.00M
Train [82][0/3239]	Time 52.101 (52.101)	Data Time 50.462 (50.462)	Loss 2.5197 (2.5197)	Entropy 0.59045 (0.59045)	Top-1 acc 62.891 (62.891)	Top-5 acc 83.594 (83.594)	lr 0.00597
Train [82][10/3239]	Time 0.262 (5.169)	Data Time 0.002 (4.591)	Loss 2.3080 (2.4274)	Entropy 0.59058 (0.59056)	Top-1 acc 67.188 (64.560)	Top-5 acc 85.156 (85.405)	lr 0.00597
Train [82][20/3239]	Time 0.243 (2.908)	Data Time 0.001 (2.406)	Loss 2.6336 (2.4679)	Entropy 0.59015 (0.59049)	Top-1 acc 62.500 (64.044)	Top-5 acc 81.250 (84.505)	lr 0.00597
Train [82][30/3239]	Time 0.242 (2.111)	Data Time 0.001 (1.630)	Loss 2.3503 (2.4995)	Entropy 0.59018 (0.59038)	Top-1 acc 68.359 (63.697)	Top-5 acc 89.453 (83.858)	lr 0.00597
Train [82][40/3239]	Time 0.254 (1.722)	Data Time 0.002 (1.241)	Loss 2.4269 (2.4966)	Entropy 0.59038 (0.59036)	Top-1 acc 65.234 (63.939)	Top-5 acc 85.938 (83.899)	lr 0.00597
Train [82][50/3239]	Time 0.347 (1.470)	Data Time 0.001 (0.998)	Loss 2.6214 (2.4901)	Entropy 0.59001 (0.59033)	Top-1 acc 62.109 (64.085)	Top-5 acc 82.422 (83.992)	lr 0.00596
Train [82][60/3239]	Time 0.252 (1.299)	Data Time 0.001 (0.835)	Loss 2.3282 (2.4936)	Entropy 0.59020 (0.59029)	Top-1 acc 70.703 (64.056)	Top-5 acc 87.109 (83.837)	lr 0.00596
Train [82][70/3239]	Time 0.251 (1.212)	Data Time 0.002 (0.745)	Loss 2.3049 (2.4878)	Entropy 0.59065 (0.59030)	Top-1 acc 67.969 (64.101)	Top-5 acc 86.328 (83.847)	lr 0.00596
Train [82][80/3239]	Time 0.228 (1.116)	Data Time 0.001 (0.653)	Loss 2.6016 (2.4883)	Entropy 0.59012 (0.59031)	Top-1 acc 60.938 (64.034)	Top-5 acc 80.859 (83.811)	lr 0.00596
Train [82][90/3239]	Time 0.253 (1.039)	Data Time 0.001 (0.581)	Loss 2.5859 (2.4842)	Entropy 0.59014 (0.59029)	Top-1 acc 61.719 (64.140)	Top-5 acc 82.031 (83.817)	lr 0.00596
Train [82][100/3239]	Time 0.247 (1.003)	Data Time 0.001 (0.546)	Loss 2.3764 (2.4748)	Entropy 0.59034 (0.59028)	Top-1 acc 65.625 (64.345)	Top-5 acc 85.547 (83.965)	lr 0.00596
Train [82][110/3239]	Time 0.235 (0.957)	Data Time 0.001 (0.503)	Loss 2.5795 (2.4768)	Entropy 0.59058 (0.59029)	Top-1 acc 64.453 (64.312)	Top-5 acc 83.203 (83.967)	lr 0.00596
Train [82][120/3239]	Time 0.345 (0.914)	Data Time 0.001 (0.461)	Loss 2.4022 (2.4721)	Entropy 0.59054 (0.59032)	Top-1 acc 66.016 (64.431)	Top-5 acc 84.766 (84.084)	lr 0.00596
Train [82][130/3239]	Time 0.245 (0.895)	Data Time 0.001 (0.444)	Loss 2.5468 (2.4734)	Entropy 0.59071 (0.59034)	Top-1 acc 61.328 (64.352)	Top-5 acc 81.250 (84.002)	lr 0.00596
Train [82][140/3239]	Time 0.257 (0.887)	Data Time 0.001 (0.436)	Loss 2.5622 (2.4706)	Entropy 0.59095 (0.59038)	Top-1 acc 62.500 (64.442)	Top-5 acc 80.859 (84.065)	lr 0.00596
Train [82][150/3239]	Time 0.249 (0.856)	Data Time 0.001 (0.407)	Loss 2.3710 (2.4654)	Entropy 0.59086 (0.59041)	Top-1 acc 64.844 (64.557)	Top-5 acc 86.328 (84.150)	lr 0.00596
Train [82][160/3239]	Time 1.406 (0.837)	Data Time 1.165 (0.389)	Loss 2.4373 (2.4631)	Entropy 0.59116 (0.59045)	Top-1 acc 64.062 (64.638)	Top-5 acc 85.938 (84.181)	lr 0.00595
Train [82][170/3239]	Time 0.284 (0.839)	Data Time 0.001 (0.392)	Loss 2.3317 (2.4594)	Entropy 0.59113 (0.59048)	Top-1 acc 71.875 (64.771)	Top-5 acc 85.156 (84.290)	lr 0.00595
Train [82][180/3239]	Time 0.259 (0.816)	Data Time 0.002 (0.370)	Loss 2.4382 (2.4608)	Entropy 0.59090 (0.59051)	Top-1 acc 64.453 (64.719)	Top-5 acc 85.156 (84.254)	lr 0.00595
Train [82][190/3239]	Time 0.289 (1.109)	Data Time 0.005 (0.351)	Loss 2.7866 (2.4611)	Entropy 0.59063 (0.59052)	Top-1 acc 53.516 (64.729)	Top-5 acc 79.688 (84.252)	lr 0.00595
Train [82][200/3239]	Time 0.244 (1.075)	Data Time 0.002 (0.334)	Loss 2.3013 (2.4610)	Entropy 0.59048 (0.59052)	Top-1 acc 67.578 (64.745)	Top-5 acc 89.062 (84.245)	lr 0.00595
Train [82][210/3239]	Time 0.322 (1.044)	Data Time 0.001 (0.318)	Loss 2.6220 (2.4604)	Entropy 0.59038 (0.59052)	Top-1 acc 63.281 (64.727)	Top-5 acc 81.250 (84.240)	lr 0.00595
Train [82][220/3239]	Time 0.247 (1.015)	Data Time 0.001 (0.304)	Loss 2.4762 (2.4611)	Entropy 0.59048 (0.59052)	Top-1 acc 63.281 (64.732)	Top-5 acc 84.375 (84.262)	lr 0.00595
Train [82][230/3239]	Time 0.241 (0.990)	Data Time 0.002 (0.291)	Loss 2.5230 (2.4640)	Entropy 0.59055 (0.59052)	Top-1 acc 62.500 (64.681)	Top-5 acc 82.812 (84.216)	lr 0.00595
Train [82][240/3239]	Time 0.248 (0.967)	Data Time 0.001 (0.279)	Loss 2.1694 (2.4632)	Entropy 0.59054 (0.59052)	Top-1 acc 71.875 (64.687)	Top-5 acc 89.844 (84.260)	lr 0.00595
Train [82][250/3239]	Time 0.276 (0.947)	Data Time 0.001 (0.268)	Loss 2.6700 (2.4630)	Entropy 0.59067 (0.59052)	Top-1 acc 60.156 (64.747)	Top-5 acc 78.516 (84.271)	lr 0.00595
Train [82][260/3239]	Time 0.264 (0.928)	Data Time 0.001 (0.258)	Loss 2.3506 (2.4644)	Entropy 0.59095 (0.59053)	Top-1 acc 69.531 (64.743)	Top-5 acc 85.938 (84.209)	lr 0.00595
Train [82][270/3239]	Time 0.269 (0.910)	Data Time 0.002 (0.248)	Loss 2.3305 (2.4647)	Entropy 0.59090 (0.59055)	Top-1 acc 68.359 (64.714)	Top-5 acc 83.594 (84.216)	lr 0.00595
Train [82][280/3239]	Time 0.326 (0.894)	Data Time 0.001 (0.239)	Loss 2.7970 (2.4645)	Entropy 0.59078 (0.59056)	Top-1 acc 60.547 (64.712)	Top-5 acc 78.906 (84.250)	lr 0.00594
Train [82][290/3239]	Time 0.234 (0.914)	Data Time 0.001 (0.267)	Loss 2.4824 (2.4649)	Entropy 0.59061 (0.59057)	Top-1 acc 64.844 (64.692)	Top-5 acc 83.203 (84.249)	lr 0.00594
Train [82][300/3239]	Time 0.242 (0.903)	Data Time 0.002 (0.263)	Loss 2.4373 (2.4634)	Entropy 0.59044 (0.59056)	Top-1 acc 64.844 (64.684)	Top-5 acc 83.594 (84.280)	lr 0.00594
Train [82][310/3239]	Time 0.235 (0.889)	Data Time 0.001 (0.255)	Loss 2.4624 (2.4636)	Entropy 0.59035 (0.59056)	Top-1 acc 67.188 (64.713)	Top-5 acc 85.938 (84.300)	lr 0.00594
Train [82][320/3239]	Time 1.614 (0.904)	Data Time 1.332 (0.276)	Loss 2.5070 (2.4643)	Entropy 0.59061 (0.59056)	Top-1 acc 62.500 (64.687)	Top-5 acc 82.812 (84.287)	lr 0.00594
Train [82][330/3239]	Time 0.291 (0.893)	Data Time 0.001 (0.270)	Loss 2.4145 (2.4634)	Entropy 0.59054 (0.59056)	Top-1 acc 70.312 (64.704)	Top-5 acc 83.984 (84.322)	lr 0.00594
Train [82][340/3239]	Time 0.240 (0.894)	Data Time 0.001 (0.277)	Loss 2.6556 (2.4648)	Entropy 0.59033 (0.59056)	Top-1 acc 63.281 (64.679)	Top-5 acc 82.422 (84.297)	lr 0.00594
Train [82][350/3239]	Time 2.822 (0.904)	Data Time 2.550 (0.292)	Loss 2.4125 (2.4641)	Entropy 0.59044 (0.59055)	Top-1 acc 65.234 (64.699)	Top-5 acc 85.938 (84.302)	lr 0.00594
Train [82][360/3239]	Time 1.309 (0.895)	Data Time 1.062 (0.287)	Loss 2.6130 (2.4639)	Entropy 0.59031 (0.59055)	Top-1 acc 62.891 (64.711)	Top-5 acc 81.641 (84.323)	lr 0.00594
Train [82][370/3239]	Time 0.246 (0.895)	Data Time 0.001 (0.293)	Loss 2.4633 (2.4635)	Entropy 0.59015 (0.59054)	Top-1 acc 64.844 (64.695)	Top-5 acc 84.766 (84.340)	lr 0.00594
Train [82][380/3239]	Time 0.259 (0.908)	Data Time 0.001 (0.310)	Loss 2.3758 (2.4644)	Entropy 0.59011 (0.59053)	Top-1 acc 67.578 (64.684)	Top-5 acc 86.328 (84.305)	lr 0.00594
Train [82][390/3239]	Time 0.284 (0.895)	Data Time 0.001 (0.302)	Loss 2.5376 (2.4640)	Entropy 0.58996 (0.59052)	Top-1 acc 62.109 (64.690)	Top-5 acc 80.469 (84.300)	lr 0.00594
Train [82][400/3239]	Time 2.788 (0.901)	Data Time 2.534 (0.311)	Loss 2.2051 (2.4650)	Entropy 0.59024 (0.59051)	Top-1 acc 69.922 (64.671)	Top-5 acc 90.625 (84.284)	lr 0.00593
Train [82][410/3239]	Time 0.254 (0.891)	Data Time 0.001 (0.306)	Loss 2.6304 (2.4644)	Entropy 0.59049 (0.59050)	Top-1 acc 60.547 (64.690)	Top-5 acc 80.859 (84.302)	lr 0.00593
Train [82][420/3239]	Time 0.242 (0.904)	Data Time 0.001 (0.322)	Loss 2.3385 (2.4634)	Entropy 0.59073 (0.59050)	Top-1 acc 63.672 (64.679)	Top-5 acc 90.234 (84.332)	lr 0.00593
Train [82][430/3239]	Time 0.250 (0.898)	Data Time 0.001 (0.321)	Loss 2.3689 (2.4636)	Entropy 0.59106 (0.59051)	Top-1 acc 67.188 (64.676)	Top-5 acc 86.328 (84.310)	lr 0.00593
Train [82][440/3239]	Time 0.333 (0.896)	Data Time 0.001 (0.322)	Loss 2.4007 (2.4634)	Entropy 0.59129 (0.59052)	Top-1 acc 66.016 (64.658)	Top-5 acc 86.328 (84.324)	lr 0.00593
Train [82][450/3239]	Time 0.230 (0.911)	Data Time 0.001 (0.340)	Loss 2.6016 (2.4623)	Entropy 0.59143 (0.59054)	Top-1 acc 60.156 (64.695)	Top-5 acc 82.812 (84.364)	lr 0.00593
Train [82][460/3239]	Time 0.277 (0.901)	Data Time 0.002 (0.333)	Loss 2.5236 (2.4624)	Entropy 0.59173 (0.59056)	Top-1 acc 66.016 (64.675)	Top-5 acc 81.641 (84.361)	lr 0.00593
Train [82][470/3239]	Time 0.251 (0.899)	Data Time 0.001 (0.334)	Loss 2.4488 (2.4611)	Entropy 0.59173 (0.59059)	Top-1 acc 67.188 (64.723)	Top-5 acc 83.984 (84.392)	lr 0.00593
Train [82][480/3239]	Time 0.270 (0.909)	Data Time 0.001 (0.346)	Loss 2.3229 (2.4633)	Entropy 0.59210 (0.59061)	Top-1 acc 69.922 (64.680)	Top-5 acc 85.547 (84.355)	lr 0.00593
Train [82][490/3239]	Time 0.258 (0.902)	Data Time 0.002 (0.342)	Loss 2.5902 (2.4625)	Entropy 0.59223 (0.59064)	Top-1 acc 60.938 (64.697)	Top-5 acc 82.422 (84.368)	lr 0.00593
Train [82][500/3239]	Time 0.235 (0.898)	Data Time 0.001 (0.340)	Loss 2.2788 (2.4625)	Entropy 0.59255 (0.59068)	Top-1 acc 68.750 (64.688)	Top-5 acc 86.719 (84.372)	lr 0.00593
Train [82][510/3239]	Time 0.335 (0.911)	Data Time 0.001 (0.356)	Loss 2.4023 (2.4622)	Entropy 0.59274 (0.59071)	Top-1 acc 66.406 (64.708)	Top-5 acc 86.328 (84.375)	lr 0.00592
Train [82][520/3239]	Time 2.956 (0.907)	Data Time 2.713 (0.354)	Loss 2.7165 (2.4628)	Entropy 0.59238 (0.59075)	Top-1 acc 59.375 (64.668)	Top-5 acc 80.078 (84.370)	lr 0.00592
Train [82][530/3239]	Time 0.235 (0.901)	Data Time 0.001 (0.350)	Loss 2.4550 (2.4625)	Entropy 0.59251 (0.59078)	Top-1 acc 65.625 (64.674)	Top-5 acc 82.422 (84.374)	lr 0.00592
Train [82][540/3239]	Time 0.252 (0.915)	Data Time 0.001 (0.366)	Loss 2.6243 (2.4624)	Entropy 0.59242 (0.59082)	Top-1 acc 62.109 (64.671)	Top-5 acc 82.422 (84.366)	lr 0.00592
Train [82][550/3239]	Time 0.232 (0.906)	Data Time 0.001 (0.360)	Loss 2.5757 (2.4623)	Entropy 0.59229 (0.59084)	Top-1 acc 61.719 (64.674)	Top-5 acc 82.031 (84.366)	lr 0.00592
Train [82][560/3239]	Time 0.277 (0.909)	Data Time 0.001 (0.365)	Loss 2.6359 (2.4623)	Entropy 0.59208 (0.59087)	Top-1 acc 62.891 (64.681)	Top-5 acc 81.641 (84.385)	lr 0.00592
Train [82][570/3239]	Time 0.266 (0.902)	Data Time 0.001 (0.360)	Loss 2.4004 (2.4630)	Entropy 0.59216 (0.59089)	Top-1 acc 72.266 (64.677)	Top-5 acc 84.375 (84.384)	lr 0.00592
Train [82][580/3239]	Time 0.254 (0.910)	Data Time 0.001 (0.370)	Loss 2.3448 (2.4630)	Entropy 0.59197 (0.59091)	Top-1 acc 67.969 (64.686)	Top-5 acc 86.328 (84.384)	lr 0.00592
Train [82][590/3239]	Time 0.241 (0.916)	Data Time 0.001 (0.378)	Loss 2.4730 (2.4628)	Entropy 0.59171 (0.59093)	Top-1 acc 66.406 (64.692)	Top-5 acc 84.766 (84.403)	lr 0.00592
Train [82][600/3239]	Time 0.320 (0.908)	Data Time 0.001 (0.372)	Loss 2.5053 (2.4644)	Entropy 0.59173 (0.59094)	Top-1 acc 61.719 (64.641)	Top-5 acc 83.203 (84.374)	lr 0.00592
Train [82][610/3239]	Time 0.230 (0.918)	Data Time 0.001 (0.384)	Loss 2.3361 (2.4638)	Entropy 0.59189 (0.59096)	Top-1 acc 66.406 (64.648)	Top-5 acc 84.766 (84.382)	lr 0.00592
Train [82][620/3239]	Time 0.243 (0.910)	Data Time 0.001 (0.378)	Loss 2.5551 (2.4635)	Entropy 0.59175 (0.59097)	Top-1 acc 60.156 (64.649)	Top-5 acc 81.641 (84.381)	lr 0.00592
Train [82][630/3239]	Time 0.250 (0.910)	Data Time 0.001 (0.379)	Loss 2.4295 (2.4637)	Entropy 0.59188 (0.59098)	Top-1 acc 64.844 (64.639)	Top-5 acc 83.203 (84.368)	lr 0.00591
Train [82][640/3239]	Time 0.238 (0.925)	Data Time 0.001 (0.396)	Loss 2.7328 (2.4636)	Entropy 0.59197 (0.59100)	Top-1 acc 58.203 (64.638)	Top-5 acc 80.078 (84.374)	lr 0.00591
Train [82][650/3239]	Time 0.261 (0.918)	Data Time 0.001 (0.390)	Loss 2.4888 (2.4622)	Entropy 0.59228 (0.59101)	Top-1 acc 61.328 (64.679)	Top-5 acc 85.938 (84.406)	lr 0.00591
Train [82][660/3239]	Time 0.245 (0.912)	Data Time 0.001 (0.386)	Loss 2.4184 (2.4622)	Entropy 0.59220 (0.59103)	Top-1 acc 68.750 (64.694)	Top-5 acc 84.766 (84.403)	lr 0.00591
Train [82][670/3239]	Time 0.337 (0.927)	Data Time 0.002 (0.402)	Loss 2.5316 (2.4629)	Entropy 0.59230 (0.59105)	Top-1 acc 64.453 (64.678)	Top-5 acc 82.812 (84.402)	lr 0.00591
Train [82][680/3239]	Time 3.218 (0.924)	Data Time 2.965 (0.400)	Loss 2.5005 (2.4632)	Entropy 0.59270 (0.59107)	Top-1 acc 62.500 (64.665)	Top-5 acc 83.594 (84.409)	lr 0.00591
Train [82][690/3239]	Time 0.242 (0.917)	Data Time 0.001 (0.395)	Loss 2.4369 (2.4622)	Entropy 0.59254 (0.59109)	Top-1 acc 65.234 (64.688)	Top-5 acc 86.328 (84.435)	lr 0.00591
Train [82][700/3239]	Time 0.233 (0.931)	Data Time 0.001 (0.410)	Loss 2.5911 (2.4625)	Entropy 0.59256 (0.59111)	Top-1 acc 59.375 (64.672)	Top-5 acc 79.297 (84.424)	lr 0.00591
Train [82][710/3239]	Time 0.232 (0.925)	Data Time 0.001 (0.405)	Loss 2.5613 (2.4632)	Entropy 0.59252 (0.59113)	Top-1 acc 62.891 (64.658)	Top-5 acc 83.203 (84.420)	lr 0.00591
Train [82][720/3239]	Time 0.238 (0.924)	Data Time 0.001 (0.405)	Loss 2.3336 (2.4630)	Entropy 0.59259 (0.59115)	Top-1 acc 67.188 (64.673)	Top-5 acc 86.328 (84.415)	lr 0.00591
Train [82][730/3239]	Time 0.265 (0.917)	Data Time 0.001 (0.399)	Loss 2.5190 (2.4627)	Entropy 0.59280 (0.59117)	Top-1 acc 62.109 (64.676)	Top-5 acc 82.812 (84.411)	lr 0.00591
Train [82][740/3239]	Time 0.225 (0.928)	Data Time 0.001 (0.412)	Loss 2.4524 (2.4628)	Entropy 0.59271 (0.59119)	Top-1 acc 65.234 (64.675)	Top-5 acc 86.719 (84.407)	lr 0.00591
Train [82][750/3239]	Time 0.242 (0.930)	Data Time 0.001 (0.415)	Loss 2.4195 (2.4623)	Entropy 0.59246 (0.59121)	Top-1 acc 67.578 (64.700)	Top-5 acc 83.984 (84.409)	lr 0.00590
Train [82][760/3239]	Time 0.273 (0.924)	Data Time 0.001 (0.410)	Loss 2.4884 (2.4632)	Entropy 0.59224 (0.59123)	Top-1 acc 65.625 (64.685)	Top-5 acc 83.984 (84.403)	lr 0.00590
Train [82][770/3239]	Time 0.240 (0.934)	Data Time 0.001 (0.421)	Loss 2.3919 (2.4632)	Entropy 0.59249 (0.59124)	Top-1 acc 66.797 (64.700)	Top-5 acc 85.547 (84.397)	lr 0.00590
Train [82][780/3239]	Time 0.283 (0.934)	Data Time 0.001 (0.422)	Loss 2.4116 (2.4633)	Entropy 0.59281 (0.59126)	Top-1 acc 64.062 (64.698)	Top-5 acc 86.719 (84.396)	lr 0.00590
Train [82][790/3239]	Time 0.288 (0.929)	Data Time 0.002 (0.418)	Loss 2.3939 (2.4639)	Entropy 0.59288 (0.59128)	Top-1 acc 64.453 (64.678)	Top-5 acc 85.156 (84.388)	lr 0.00590
Train [82][800/3239]	Time 0.225 (0.943)	Data Time 0.001 (0.433)	Loss 2.6069 (2.4635)	Entropy 0.59281 (0.59130)	Top-1 acc 64.062 (64.701)	Top-5 acc 82.812 (84.398)	lr 0.00590
Train [82][810/3239]	Time 0.232 (0.941)	Data Time 0.001 (0.432)	Loss 2.4013 (2.4645)	Entropy 0.59265 (0.59132)	Top-1 acc 64.062 (64.664)	Top-5 acc 84.766 (84.375)	lr 0.00590
Train [82][820/3239]	Time 0.239 (0.937)	Data Time 0.003 (0.429)	Loss 2.5178 (2.4645)	Entropy 0.59256 (0.59134)	Top-1 acc 61.719 (64.656)	Top-5 acc 81.641 (84.373)	lr 0.00590
Train [82][830/3239]	Time 0.357 (0.953)	Data Time 0.001 (0.446)	Loss 2.9235 (2.4653)	Entropy 0.59281 (0.59135)	Top-1 acc 50.781 (64.639)	Top-5 acc 73.828 (84.352)	lr 0.00590
Train [82][840/3239]	Time 0.377 (1.012)	Data Time 0.004 (0.441)	Loss 2.4643 (2.4656)	Entropy 0.59273 (0.59137)	Top-1 acc 63.281 (64.611)	Top-5 acc 85.156 (84.361)	lr 0.00590
Train [82][850/3239]	Time 0.250 (1.006)	Data Time 0.002 (0.436)	Loss 2.5235 (2.4653)	Entropy 0.59252 (0.59138)	Top-1 acc 62.109 (64.618)	Top-5 acc 85.156 (84.369)	lr 0.00590
Train [82][860/3239]	Time 0.245 (0.999)	Data Time 0.002 (0.431)	Loss 2.4426 (2.4642)	Entropy 0.59229 (0.59140)	Top-1 acc 67.188 (64.641)	Top-5 acc 86.328 (84.387)	lr 0.00589
Train [82][870/3239]	Time 0.244 (0.993)	Data Time 0.001 (0.426)	Loss 2.3697 (2.4641)	Entropy 0.59278 (0.59141)	Top-1 acc 62.500 (64.624)	Top-5 acc 87.891 (84.392)	lr 0.00589
Train [82][880/3239]	Time 0.235 (0.986)	Data Time 0.001 (0.421)	Loss 2.5283 (2.4646)	Entropy 0.59246 (0.59142)	Top-1 acc 61.719 (64.596)	Top-5 acc 83.984 (84.376)	lr 0.00589
Train [82][890/3239]	Time 0.233 (0.980)	Data Time 0.001 (0.416)	Loss 2.4982 (2.4651)	Entropy 0.59271 (0.59144)	Top-1 acc 63.281 (64.580)	Top-5 acc 83.984 (84.376)	lr 0.00589
Train [82][900/3239]	Time 0.244 (0.974)	Data Time 0.001 (0.412)	Loss 2.4904 (2.4658)	Entropy 0.59289 (0.59145)	Top-1 acc 66.016 (64.552)	Top-5 acc 83.984 (84.371)	lr 0.00589
Train [82][910/3239]	Time 0.248 (0.973)	Data Time 0.001 (0.412)	Loss 2.3694 (2.4644)	Entropy 0.59242 (0.59146)	Top-1 acc 65.234 (64.587)	Top-5 acc 83.984 (84.395)	lr 0.00589
Train [82][920/3239]	Time 0.338 (0.973)	Data Time 0.001 (0.414)	Loss 2.3903 (2.4659)	Entropy 0.59266 (0.59148)	Top-1 acc 67.969 (64.559)	Top-5 acc 86.719 (84.377)	lr 0.00589
Train [82][930/3239]	Time 0.230 (0.967)	Data Time 0.001 (0.409)	Loss 2.4394 (2.4655)	Entropy 0.59293 (0.59149)	Top-1 acc 67.969 (64.569)	Top-5 acc 84.766 (84.391)	lr 0.00589
Train [82][940/3239]	Time 0.249 (0.980)	Data Time 0.001 (0.424)	Loss 2.5085 (2.4656)	Entropy 0.59298 (0.59151)	Top-1 acc 65.234 (64.575)	Top-5 acc 84.375 (84.393)	lr 0.00589
Train [82][950/3239]	Time 0.239 (0.979)	Data Time 0.001 (0.424)	Loss 2.4640 (2.4657)	Entropy 0.59334 (0.59152)	Top-1 acc 67.578 (64.587)	Top-5 acc 82.812 (84.393)	lr 0.00589
Train [82][960/3239]	Time 0.229 (0.980)	Data Time 0.001 (0.426)	Loss 2.6080 (2.4663)	Entropy 0.59324 (0.59154)	Top-1 acc 64.062 (64.569)	Top-5 acc 84.375 (84.390)	lr 0.00589
Train [82][970/3239]	Time 0.240 (0.991)	Data Time 0.001 (0.438)	Loss 2.6788 (2.4667)	Entropy 0.59315 (0.59156)	Top-1 acc 57.031 (64.568)	Top-5 acc 82.422 (84.383)	lr 0.00589
Train [82][980/3239]	Time 0.229 (0.988)	Data Time 0.001 (0.436)	Loss 2.6534 (2.4676)	Entropy 0.59294 (0.59157)	Top-1 acc 60.156 (64.551)	Top-5 acc 80.469 (84.369)	lr 0.00588
Train [82][990/3239]	Time 0.360 (0.989)	Data Time 0.001 (0.439)	Loss 2.3763 (2.4676)	Entropy 0.59339 (0.59159)	Top-1 acc 64.844 (64.547)	Top-5 acc 88.281 (84.369)	lr 0.00588
Train [82][1000/3239]	Time 12.072 (0.995)	Data Time 11.815 (0.447)	Loss 2.4982 (2.4677)	Entropy 0.59339 (0.59161)	Top-1 acc 65.625 (64.539)	Top-5 acc 83.594 (84.367)	lr 0.00588
Train [82][1010/3239]	Time 1.057 (0.995)	Data Time 0.783 (0.447)	Loss 2.4945 (2.4674)	Entropy 0.59386 (0.59163)	Top-1 acc 63.672 (64.532)	Top-5 acc 85.547 (84.370)	lr 0.00588
Train [82][1020/3239]	Time 0.246 (0.999)	Data Time 0.001 (0.453)	Loss 2.3887 (2.4672)	Entropy 0.59403 (0.59165)	Top-1 acc 67.969 (64.540)	Top-5 acc 87.891 (84.368)	lr 0.00588
Train [82][1030/3239]	Time 0.231 (0.994)	Data Time 0.001 (0.448)	Loss 2.3315 (2.4670)	Entropy 0.59381 (0.59167)	Top-1 acc 67.188 (64.533)	Top-5 acc 87.891 (84.374)	lr 0.00588
Train [82][1040/3239]	Time 0.279 (1.004)	Data Time 0.001 (0.459)	Loss 2.4378 (2.4670)	Entropy 0.59384 (0.59169)	Top-1 acc 70.312 (64.532)	Top-5 acc 83.594 (84.370)	lr 0.00588
Train [82][1050/3239]	Time 0.244 (1.009)	Data Time 0.001 (0.466)	Loss 2.4862 (2.4670)	Entropy 0.59373 (0.59171)	Top-1 acc 62.500 (64.533)	Top-5 acc 83.203 (84.372)	lr 0.00588
Train [82][1060/3239]	Time 0.333 (1.004)	Data Time 0.001 (0.462)	Loss 2.4524 (2.4671)	Entropy 0.59404 (0.59173)	Top-1 acc 63.281 (64.529)	Top-5 acc 85.547 (84.376)	lr 0.00588
Train [82][1070/3239]	Time 0.251 (1.016)	Data Time 0.001 (0.474)	Loss 2.4271 (2.4672)	Entropy 0.59383 (0.59175)	Top-1 acc 64.453 (64.526)	Top-5 acc 84.375 (84.375)	lr 0.00588
Train [82][1080/3239]	Time 0.252 (1.014)	Data Time 0.001 (0.474)	Loss 2.5068 (2.4675)	Entropy 0.59346 (0.59177)	Top-1 acc 61.328 (64.515)	Top-5 acc 86.328 (84.379)	lr 0.00588
Train [82][1090/3239]	Time 0.255 (1.009)	Data Time 0.001 (0.470)	Loss 2.5459 (2.4671)	Entropy 0.59335 (0.59179)	Top-1 acc 65.625 (64.528)	Top-5 acc 80.859 (84.385)	lr 0.00588
Train [82][1100/3239]	Time 0.253 (1.018)	Data Time 0.002 (0.480)	Loss 2.4898 (2.4676)	Entropy 0.59342 (0.59180)	Top-1 acc 61.719 (64.517)	Top-5 acc 82.812 (84.374)	lr 0.00587
Train [82][1110/3239]	Time 0.238 (1.022)	Data Time 0.001 (0.484)	Loss 2.6103 (2.4681)	Entropy 0.59332 (0.59181)	Top-1 acc 58.594 (64.504)	Top-5 acc 81.641 (84.368)	lr 0.00587
Train [82][1120/3239]	Time 0.240 (1.018)	Data Time 0.001 (0.482)	Loss 2.3380 (2.4679)	Entropy 0.59343 (0.59183)	Top-1 acc 67.969 (64.519)	Top-5 acc 85.938 (84.368)	lr 0.00587
Train [82][1130/3239]	Time 0.252 (1.026)	Data Time 0.001 (0.491)	Loss 2.3241 (2.4678)	Entropy 0.59350 (0.59184)	Top-1 acc 67.188 (64.517)	Top-5 acc 89.453 (84.375)	lr 0.00587
Train [82][1140/3239]	Time 0.246 (1.030)	Data Time 0.001 (0.496)	Loss 2.3885 (2.4680)	Entropy 0.59353 (0.59186)	Top-1 acc 69.141 (64.512)	Top-5 acc 84.766 (84.371)	lr 0.00587
Train [82][1150/3239]	Time 0.349 (1.025)	Data Time 0.001 (0.491)	Loss 2.4944 (2.4683)	Entropy 0.59338 (0.59187)	Top-1 acc 64.453 (64.500)	Top-5 acc 83.984 (84.368)	lr 0.00587
Train [82][1160/3239]	Time 3.892 (1.023)	Data Time 3.621 (0.490)	Loss 2.2738 (2.4681)	Entropy 0.59344 (0.59188)	Top-1 acc 68.359 (64.514)	Top-5 acc 87.109 (84.366)	lr 0.00587
Train [82][1170/3239]	Time 0.236 (1.033)	Data Time 0.001 (0.501)	Loss 2.4932 (2.4688)	Entropy 0.59334 (0.59190)	Top-1 acc 65.625 (64.507)	Top-5 acc 84.766 (84.349)	lr 0.00587
Train [82][1180/3239]	Time 0.233 (1.028)	Data Time 0.002 (0.497)	Loss 2.3912 (2.4685)	Entropy 0.59328 (0.59191)	Top-1 acc 67.969 (64.521)	Top-5 acc 87.109 (84.354)	lr 0.00587
Train [82][1190/3239]	Time 0.222 (1.025)	Data Time 0.001 (0.495)	Loss 2.3511 (2.4683)	Entropy 0.59312 (0.59192)	Top-1 acc 71.094 (64.518)	Top-5 acc 84.766 (84.356)	lr 0.00587
Train [82][1200/3239]	Time 0.260 (1.037)	Data Time 0.001 (0.507)	Loss 2.3672 (2.4681)	Entropy 0.59292 (0.59193)	Top-1 acc 66.797 (64.526)	Top-5 acc 85.547 (84.361)	lr 0.00587
Train [82][1210/3239]	Time 0.290 (1.032)	Data Time 0.001 (0.503)	Loss 2.4026 (2.4679)	Entropy 0.59313 (0.59194)	Top-1 acc 67.969 (64.529)	Top-5 acc 85.156 (84.364)	lr 0.00586
Train [82][1220/3239]	Time 0.364 (1.029)	Data Time 0.001 (0.501)	Loss 2.4451 (2.4682)	Entropy 0.59299 (0.59195)	Top-1 acc 64.062 (64.521)	Top-5 acc 84.766 (84.360)	lr 0.00586
Train [82][1230/3239]	Time 0.248 (1.040)	Data Time 0.002 (0.513)	Loss 2.6666 (2.4685)	Entropy 0.59317 (0.59195)	Top-1 acc 55.859 (64.511)	Top-5 acc 80.078 (84.348)	lr 0.00586
Train [82][1240/3239]	Time 0.242 (1.035)	Data Time 0.001 (0.509)	Loss 2.3299 (2.4684)	Entropy 0.59290 (0.59196)	Top-1 acc 69.531 (64.513)	Top-5 acc 85.547 (84.352)	lr 0.00586
Train [82][1250/3239]	Time 0.238 (1.031)	Data Time 0.001 (0.506)	Loss 2.3983 (2.4682)	Entropy 0.59244 (0.59197)	Top-1 acc 66.016 (64.529)	Top-5 acc 83.203 (84.349)	lr 0.00586
Train [82][1260/3239]	Time 0.234 (1.035)	Data Time 0.001 (0.510)	Loss 2.4441 (2.4685)	Entropy 0.59275 (0.59198)	Top-1 acc 63.672 (64.527)	Top-5 acc 83.984 (84.336)	lr 0.00586
Train [82][1270/3239]	Time 0.244 (1.038)	Data Time 0.001 (0.514)	Loss 2.4388 (2.4684)	Entropy 0.59281 (0.59198)	Top-1 acc 66.016 (64.534)	Top-5 acc 87.500 (84.343)	lr 0.00586
Train [82][1280/3239]	Time 0.241 (1.038)	Data Time 0.001 (0.515)	Loss 2.4585 (2.4685)	Entropy 0.59277 (0.59199)	Top-1 acc 62.891 (64.525)	Top-5 acc 85.938 (84.340)	lr 0.00586
Train [82][1290/3239]	Time 0.241 (1.039)	Data Time 0.001 (0.516)	Loss 2.5478 (2.4685)	Entropy 0.59268 (0.59199)	Top-1 acc 64.453 (64.524)	Top-5 acc 82.812 (84.338)	lr 0.00586
Train [82][1300/3239]	Time 0.272 (1.044)	Data Time 0.001 (0.522)	Loss 2.5461 (2.4686)	Entropy 0.59261 (0.59200)	Top-1 acc 65.234 (64.532)	Top-5 acc 82.812 (84.334)	lr 0.00586
Train [82][1310/3239]	Time 0.337 (1.043)	Data Time 0.001 (0.521)	Loss 2.4807 (2.4682)	Entropy 0.59282 (0.59200)	Top-1 acc 61.328 (64.536)	Top-5 acc 85.547 (84.344)	lr 0.00586
Train [82][1320/3239]	Time 4.909 (1.042)	Data Time 4.656 (0.521)	Loss 2.5372 (2.4684)	Entropy 0.59309 (0.59201)	Top-1 acc 62.500 (64.522)	Top-5 acc 84.766 (84.340)	lr 0.00586
Train [82][1330/3239]	Time 5.481 (1.048)	Data Time 5.228 (0.529)	Loss 2.3956 (2.4682)	Entropy 0.59327 (0.59202)	Top-1 acc 69.141 (64.528)	Top-5 acc 86.719 (84.347)	lr 0.00585
Train [82][1340/3239]	Time 0.252 (1.044)	Data Time 0.001 (0.525)	Loss 2.5382 (2.4685)	Entropy 0.59318 (0.59203)	Top-1 acc 63.281 (64.526)	Top-5 acc 82.812 (84.344)	lr 0.00585
Train [82][1350/3239]	Time 0.247 (1.041)	Data Time 0.001 (0.523)	Loss 2.6700 (2.4683)	Entropy 0.59345 (0.59204)	Top-1 acc 57.031 (64.524)	Top-5 acc 82.031 (84.349)	lr 0.00585
Train [82][1360/3239]	Time 0.238 (1.048)	Data Time 0.001 (0.530)	Loss 2.4160 (2.4686)	Entropy 0.59365 (0.59205)	Top-1 acc 67.188 (64.518)	Top-5 acc 87.109 (84.343)	lr 0.00585
Train [82][1370/3239]	Time 0.246 (1.047)	Data Time 0.001 (0.530)	Loss 2.2888 (2.4684)	Entropy 0.59367 (0.59206)	Top-1 acc 69.141 (64.525)	Top-5 acc 87.891 (84.344)	lr 0.00585
Train [82][1380/3239]	Time 0.337 (1.042)	Data Time 0.001 (0.526)	Loss 2.6210 (2.4681)	Entropy 0.59330 (0.59207)	Top-1 acc 59.375 (64.535)	Top-5 acc 80.078 (84.350)	lr 0.00585
Train [82][1390/3239]	Time 4.034 (1.050)	Data Time 3.795 (0.535)	Loss 2.5222 (2.4682)	Entropy 0.59309 (0.59208)	Top-1 acc 59.766 (64.533)	Top-5 acc 82.422 (84.349)	lr 0.00585
Train [82][1400/3239]	Time 0.251 (1.050)	Data Time 0.001 (0.535)	Loss 2.4682 (2.4688)	Entropy 0.59293 (0.59209)	Top-1 acc 62.109 (64.513)	Top-5 acc 83.984 (84.333)	lr 0.00585
Train [82][1410/3239]	Time 0.261 (1.047)	Data Time 0.001 (0.532)	Loss 2.2958 (2.4691)	Entropy 0.59287 (0.59209)	Top-1 acc 71.875 (64.511)	Top-5 acc 85.938 (84.327)	lr 0.00585
Train [82][1420/3239]	Time 0.237 (1.049)	Data Time 0.002 (0.535)	Loss 2.6878 (2.4695)	Entropy 0.59305 (0.59210)	Top-1 acc 56.250 (64.499)	Top-5 acc 80.078 (84.322)	lr 0.00585
Train [82][1430/3239]	Time 0.244 (1.052)	Data Time 0.002 (0.539)	Loss 2.3374 (2.4701)	Entropy 0.59307 (0.59211)	Top-1 acc 64.453 (64.483)	Top-5 acc 83.984 (84.305)	lr 0.00585
Train [82][1440/3239]	Time 0.257 (1.050)	Data Time 0.003 (0.538)	Loss 2.7038 (2.4701)	Entropy 0.59292 (0.59211)	Top-1 acc 59.375 (64.476)	Top-5 acc 80.859 (84.307)	lr 0.00585
Train [82][1450/3239]	Time 0.246 (1.050)	Data Time 0.001 (0.538)	Loss 2.3507 (2.4699)	Entropy 0.59293 (0.59212)	Top-1 acc 66.016 (64.478)	Top-5 acc 86.328 (84.310)	lr 0.00584
Train [82][1460/3239]	Time 0.231 (1.056)	Data Time 0.001 (0.545)	Loss 2.5673 (2.4696)	Entropy 0.59269 (0.59212)	Top-1 acc 64.453 (64.485)	Top-5 acc 81.250 (84.311)	lr 0.00584
Train [82][1470/3239]	Time 0.245 (1.055)	Data Time 0.001 (0.544)	Loss 2.7190 (2.4698)	Entropy 0.59251 (0.59213)	Top-1 acc 57.031 (64.479)	Top-5 acc 80.078 (84.310)	lr 0.00584
Train [82][1480/3239]	Time 4.274 (1.053)	Data Time 4.017 (0.543)	Loss 2.4355 (2.4698)	Entropy 0.59262 (0.59213)	Top-1 acc 64.453 (64.485)	Top-5 acc 87.109 (84.312)	lr 0.00584
Train [82][1490/3239]	Time 0.289 (1.059)	Data Time 0.003 (0.549)	Loss 2.6440 (2.4695)	Entropy 0.59263 (0.59213)	Top-1 acc 63.281 (64.492)	Top-5 acc 79.688 (84.314)	lr 0.00584
Train [82][1500/3239]	Time 0.279 (1.094)	Data Time 0.004 (0.546)	Loss 2.3763 (2.4694)	Entropy 0.59293 (0.59214)	Top-1 acc 64.453 (64.494)	Top-5 acc 87.109 (84.319)	lr 0.00584
Train [82][1510/3239]	Time 0.269 (1.090)	Data Time 0.003 (0.542)	Loss 2.3711 (2.4694)	Entropy 0.59306 (0.59214)	Top-1 acc 66.016 (64.493)	Top-5 acc 87.500 (84.321)	lr 0.00584
Train [82][1520/3239]	Time 0.241 (1.085)	Data Time 0.001 (0.538)	Loss 2.5156 (2.4698)	Entropy 0.59297 (0.59215)	Top-1 acc 63.672 (64.484)	Top-5 acc 84.766 (84.312)	lr 0.00584
Train [82][1530/3239]	Time 0.242 (1.081)	Data Time 0.001 (0.535)	Loss 2.3144 (2.4698)	Entropy 0.59307 (0.59215)	Top-1 acc 68.359 (64.481)	Top-5 acc 87.109 (84.311)	lr 0.00584
Train [82][1540/3239]	Time 0.369 (1.077)	Data Time 0.002 (0.532)	Loss 2.6904 (2.4704)	Entropy 0.59286 (0.59216)	Top-1 acc 58.984 (64.468)	Top-5 acc 80.078 (84.302)	lr 0.00584
Train [82][1550/3239]	Time 0.234 (1.073)	Data Time 0.001 (0.528)	Loss 2.5979 (2.4705)	Entropy 0.59293 (0.59216)	Top-1 acc 61.328 (64.464)	Top-5 acc 80.469 (84.298)	lr 0.00584
Train [82][1560/3239]	Time 0.269 (1.072)	Data Time 0.001 (0.528)	Loss 2.6189 (2.4706)	Entropy 0.59291 (0.59217)	Top-1 acc 62.109 (64.466)	Top-5 acc 81.641 (84.294)	lr 0.00583
Train [82][1570/3239]	Time 0.236 (1.072)	Data Time 0.001 (0.528)	Loss 2.5269 (2.4702)	Entropy 0.59299 (0.59217)	Top-1 acc 64.844 (64.477)	Top-5 acc 82.422 (84.298)	lr 0.00583
Train [82][1580/3239]	Time 0.249 (1.069)	Data Time 0.001 (0.526)	Loss 2.4839 (2.4702)	Entropy 0.59266 (0.59218)	Top-1 acc 63.672 (64.479)	Top-5 acc 83.594 (84.297)	lr 0.00583
Train [82][1590/3239]	Time 0.252 (1.065)	Data Time 0.002 (0.523)	Loss 2.6006 (2.4705)	Entropy 0.59267 (0.59218)	Top-1 acc 64.453 (64.472)	Top-5 acc 81.641 (84.289)	lr 0.00583
Train [82][1600/3239]	Time 0.258 (1.075)	Data Time 0.001 (0.533)	Loss 2.3251 (2.4707)	Entropy 0.59275 (0.59219)	Top-1 acc 67.969 (64.465)	Top-5 acc 84.766 (84.284)	lr 0.00583
Train [82][1610/3239]	Time 0.245 (1.072)	Data Time 0.001 (0.531)	Loss 2.4800 (2.4705)	Entropy 0.59275 (0.59219)	Top-1 acc 62.891 (64.465)	Top-5 acc 83.984 (84.286)	lr 0.00583
Train [82][1620/3239]	Time 0.232 (1.068)	Data Time 0.001 (0.528)	Loss 2.6288 (2.4705)	Entropy 0.59295 (0.59219)	Top-1 acc 58.984 (64.461)	Top-5 acc 83.203 (84.290)	lr 0.00583
Train [82][1630/3239]	Time 0.242 (1.079)	Data Time 0.001 (0.539)	Loss 2.4345 (2.4705)	Entropy 0.59286 (0.59220)	Top-1 acc 66.406 (64.460)	Top-5 acc 83.984 (84.287)	lr 0.00583
Train [82][1640/3239]	Time 0.270 (1.076)	Data Time 0.001 (0.537)	Loss 2.4014 (2.4705)	Entropy 0.59300 (0.59220)	Top-1 acc 64.844 (64.459)	Top-5 acc 85.547 (84.294)	lr 0.00583
Train [82][1650/3239]	Time 0.238 (1.073)	Data Time 0.001 (0.535)	Loss 2.4844 (2.4703)	Entropy 0.59341 (0.59221)	Top-1 acc 63.672 (64.464)	Top-5 acc 83.203 (84.294)	lr 0.00583
Train [82][1660/3239]	Time 1.500 (1.078)	Data Time 1.231 (0.541)	Loss 2.5246 (2.4705)	Entropy 0.59346 (0.59222)	Top-1 acc 67.578 (64.462)	Top-5 acc 81.250 (84.295)	lr 0.00583
Train [82][1670/3239]	Time 0.257 (1.075)	Data Time 0.001 (0.537)	Loss 2.3057 (2.4704)	Entropy 0.59333 (0.59222)	Top-1 acc 67.188 (64.464)	Top-5 acc 87.500 (84.299)	lr 0.00583
Train [82][1680/3239]	Time 0.249 (1.071)	Data Time 0.001 (0.534)	Loss 2.4964 (2.4705)	Entropy 0.59354 (0.59223)	Top-1 acc 63.672 (64.467)	Top-5 acc 83.984 (84.295)	lr 0.00582
Train [82][1690/3239]	Time 0.262 (1.073)	Data Time 0.001 (0.537)	Loss 2.4030 (2.4705)	Entropy 0.59358 (0.59224)	Top-1 acc 64.844 (64.464)	Top-5 acc 87.891 (84.298)	lr 0.00582
Train [82][1700/3239]	Time 0.357 (1.071)	Data Time 0.002 (0.535)	Loss 2.4433 (2.4704)	Entropy 0.59364 (0.59224)	Top-1 acc 64.062 (64.471)	Top-5 acc 83.594 (84.301)	lr 0.00582
Train [82][1710/3239]	Time 0.248 (1.067)	Data Time 0.001 (0.532)	Loss 2.4612 (2.4704)	Entropy 0.59347 (0.59225)	Top-1 acc 64.453 (64.473)	Top-5 acc 83.203 (84.299)	lr 0.00582
Train [82][1720/3239]	Time 0.240 (1.071)	Data Time 0.001 (0.536)	Loss 2.5985 (2.4705)	Entropy 0.59360 (0.59226)	Top-1 acc 62.891 (64.470)	Top-5 acc 81.250 (84.297)	lr 0.00582
Train [82][1730/3239]	Time 0.399 (1.072)	Data Time 0.131 (0.538)	Loss 2.5915 (2.4710)	Entropy 0.59371 (0.59227)	Top-1 acc 60.938 (64.454)	Top-5 acc 81.250 (84.288)	lr 0.00582
Train [82][1740/3239]	Time 0.226 (1.070)	Data Time 0.001 (0.537)	Loss 2.5040 (2.4712)	Entropy 0.59384 (0.59228)	Top-1 acc 62.500 (64.447)	Top-5 acc 84.375 (84.287)	lr 0.00582
Train [82][1750/3239]	Time 0.238 (1.066)	Data Time 0.001 (0.534)	Loss 2.2112 (2.4711)	Entropy 0.59350 (0.59228)	Top-1 acc 71.875 (64.449)	Top-5 acc 89.844 (84.290)	lr 0.00582
Train [82][1760/3239]	Time 0.231 (1.076)	Data Time 0.001 (0.544)	Loss 2.3784 (2.4714)	Entropy 0.59363 (0.59229)	Top-1 acc 67.969 (64.452)	Top-5 acc 83.594 (84.279)	lr 0.00582
Train [82][1770/3239]	Time 0.373 (1.074)	Data Time 0.001 (0.542)	Loss 2.4149 (2.4714)	Entropy 0.59368 (0.59230)	Top-1 acc 66.016 (64.452)	Top-5 acc 85.938 (84.282)	lr 0.00582
Train [82][1780/3239]	Time 0.235 (1.072)	Data Time 0.001 (0.541)	Loss 2.4679 (2.4716)	Entropy 0.59352 (0.59231)	Top-1 acc 65.625 (64.452)	Top-5 acc 82.812 (84.277)	lr 0.00582
Train [82][1790/3239]	Time 0.248 (1.082)	Data Time 0.001 (0.552)	Loss 2.7480 (2.4716)	Entropy 0.59329 (0.59231)	Top-1 acc 59.375 (64.449)	Top-5 acc 82.031 (84.278)	lr 0.00582
Train [82][1800/3239]	Time 0.242 (1.079)	Data Time 0.001 (0.549)	Loss 2.5157 (2.4712)	Entropy 0.59334 (0.59232)	Top-1 acc 66.797 (64.460)	Top-5 acc 82.812 (84.282)	lr 0.00581
Train [82][1810/3239]	Time 0.246 (1.076)	Data Time 0.001 (0.547)	Loss 2.6146 (2.4712)	Entropy 0.59336 (0.59232)	Top-1 acc 60.938 (64.462)	Top-5 acc 80.078 (84.281)	lr 0.00581
Train [82][1820/3239]	Time 11.524 (1.085)	Data Time 11.249 (0.557)	Loss 2.4884 (2.4713)	Entropy 0.59349 (0.59233)	Top-1 acc 64.844 (64.457)	Top-5 acc 82.422 (84.275)	lr 0.00581
Train [82][1830/3239]	Time 0.230 (1.082)	Data Time 0.001 (0.554)	Loss 2.4981 (2.4714)	Entropy 0.59328 (0.59234)	Top-1 acc 64.844 (64.455)	Top-5 acc 83.594 (84.277)	lr 0.00581
Train [82][1840/3239]	Time 0.242 (1.078)	Data Time 0.001 (0.551)	Loss 2.3053 (2.4715)	Entropy 0.59336 (0.59234)	Top-1 acc 68.359 (64.453)	Top-5 acc 86.328 (84.274)	lr 0.00581
Train [82][1850/3239]	Time 0.282 (1.076)	Data Time 0.002 (0.549)	Loss 2.4800 (2.4714)	Entropy 0.59352 (0.59235)	Top-1 acc 63.281 (64.452)	Top-5 acc 83.984 (84.278)	lr 0.00581
Train [82][1860/3239]	Time 0.353 (1.078)	Data Time 0.001 (0.552)	Loss 2.3778 (2.4716)	Entropy 0.59349 (0.59235)	Top-1 acc 67.578 (64.443)	Top-5 acc 87.500 (84.278)	lr 0.00581
Train [82][1870/3239]	Time 0.251 (1.075)	Data Time 0.001 (0.549)	Loss 2.3487 (2.4711)	Entropy 0.59334 (0.59236)	Top-1 acc 70.312 (64.452)	Top-5 acc 86.719 (84.291)	lr 0.00581
Train [82][1880/3239]	Time 0.238 (1.071)	Data Time 0.001 (0.546)	Loss 2.6656 (2.4713)	Entropy 0.59354 (0.59236)	Top-1 acc 60.938 (64.451)	Top-5 acc 81.641 (84.285)	lr 0.00581
Train [82][1890/3239]	Time 0.249 (1.074)	Data Time 0.001 (0.549)	Loss 2.2867 (2.4712)	Entropy 0.59348 (0.59237)	Top-1 acc 69.531 (64.455)	Top-5 acc 90.234 (84.288)	lr 0.00581
Train [82][1900/3239]	Time 0.270 (1.070)	Data Time 0.001 (0.546)	Loss 2.3682 (2.4715)	Entropy 0.59347 (0.59238)	Top-1 acc 64.453 (64.446)	Top-5 acc 87.891 (84.287)	lr 0.00581
Train [82][1910/3239]	Time 0.247 (1.067)	Data Time 0.001 (0.543)	Loss 2.3645 (2.4715)	Entropy 0.59312 (0.59238)	Top-1 acc 68.359 (64.439)	Top-5 acc 85.156 (84.293)	lr 0.00581
Train [82][1920/3239]	Time 0.284 (1.070)	Data Time 0.001 (0.546)	Loss 2.3310 (2.4716)	Entropy 0.59324 (0.59238)	Top-1 acc 66.797 (64.438)	Top-5 acc 86.719 (84.293)	lr 0.00580
Train [82][1930/3239]	Time 0.355 (1.067)	Data Time 0.001 (0.544)	Loss 2.5213 (2.4715)	Entropy 0.59321 (0.59239)	Top-1 acc 61.328 (64.434)	Top-5 acc 83.984 (84.294)	lr 0.00580
Train [82][1940/3239]	Time 0.228 (1.064)	Data Time 0.001 (0.541)	Loss 2.3494 (2.4717)	Entropy 0.59348 (0.59239)	Top-1 acc 64.062 (64.426)	Top-5 acc 88.672 (84.292)	lr 0.00580
Train [82][1950/3239]	Time 0.256 (1.064)	Data Time 0.001 (0.542)	Loss 2.3241 (2.4716)	Entropy 0.59357 (0.59240)	Top-1 acc 67.188 (64.425)	Top-5 acc 87.500 (84.295)	lr 0.00580
Train [82][1960/3239]	Time 0.259 (1.061)	Data Time 0.001 (0.540)	Loss 2.4331 (2.4713)	Entropy 0.59363 (0.59240)	Top-1 acc 64.844 (64.429)	Top-5 acc 84.375 (84.300)	lr 0.00580
Train [82][1970/3239]	Time 0.250 (1.058)	Data Time 0.002 (0.537)	Loss 2.4915 (2.4712)	Entropy 0.59373 (0.59241)	Top-1 acc 69.531 (64.431)	Top-5 acc 85.156 (84.299)	lr 0.00580
Train [82][1980/3239]	Time 11.561 (1.063)	Data Time 11.295 (0.542)	Loss 2.5421 (2.4711)	Entropy 0.59388 (0.59242)	Top-1 acc 61.719 (64.437)	Top-5 acc 83.984 (84.301)	lr 0.00580
Train [82][1990/3239]	Time 0.259 (1.061)	Data Time 0.001 (0.540)	Loss 2.5159 (2.4715)	Entropy 0.59384 (0.59243)	Top-1 acc 66.016 (64.430)	Top-5 acc 83.203 (84.295)	lr 0.00580
Train [82][2000/3239]	Time 0.248 (1.058)	Data Time 0.001 (0.538)	Loss 2.6536 (2.4718)	Entropy 0.59367 (0.59243)	Top-1 acc 58.203 (64.417)	Top-5 acc 79.297 (84.290)	lr 0.00580
Train [82][2010/3239]	Time 0.280 (1.060)	Data Time 0.001 (0.541)	Loss 2.4323 (2.4719)	Entropy 0.59344 (0.59244)	Top-1 acc 66.797 (64.415)	Top-5 acc 84.375 (84.286)	lr 0.00580
Train [82][2020/3239]	Time 0.294 (1.063)	Data Time 0.002 (0.543)	Loss 2.3821 (2.4718)	Entropy 0.59324 (0.59244)	Top-1 acc 62.891 (64.419)	Top-5 acc 87.500 (84.287)	lr 0.00580
Train [82][2030/3239]	Time 0.259 (1.060)	Data Time 0.001 (0.541)	Loss 2.3648 (2.4718)	Entropy 0.59305 (0.59245)	Top-1 acc 68.750 (64.427)	Top-5 acc 85.547 (84.287)	lr 0.00579
Train [82][2040/3239]	Time 7.748 (1.062)	Data Time 7.484 (0.544)	Loss 2.5638 (2.4720)	Entropy 0.59273 (0.59245)	Top-1 acc 63.281 (64.425)	Top-5 acc 82.031 (84.282)	lr 0.00579
Train [82][2050/3239]	Time 0.232 (1.065)	Data Time 0.001 (0.547)	Loss 2.5742 (2.4722)	Entropy 0.59255 (0.59245)	Top-1 acc 61.719 (64.417)	Top-5 acc 85.156 (84.281)	lr 0.00579
Train [82][2060/3239]	Time 0.262 (1.063)	Data Time 0.001 (0.545)	Loss 2.7516 (2.4721)	Entropy 0.59259 (0.59245)	Top-1 acc 56.641 (64.416)	Top-5 acc 76.172 (84.284)	lr 0.00579
Train [82][2070/3239]	Time 0.251 (1.060)	Data Time 0.001 (0.543)	Loss 2.5420 (2.4721)	Entropy 0.59281 (0.59245)	Top-1 acc 65.625 (64.419)	Top-5 acc 83.594 (84.284)	lr 0.00579
Train [82][2080/3239]	Time 0.247 (1.066)	Data Time 0.001 (0.550)	Loss 2.3625 (2.4722)	Entropy 0.59266 (0.59245)	Top-1 acc 66.406 (64.422)	Top-5 acc 85.938 (84.279)	lr 0.00579
Train [82][2090/3239]	Time 0.327 (1.065)	Data Time 0.001 (0.549)	Loss 2.6027 (2.4725)	Entropy 0.59264 (0.59245)	Top-1 acc 62.500 (64.416)	Top-5 acc 80.859 (84.274)	lr 0.00579
Train [82][2100/3239]	Time 0.247 (1.062)	Data Time 0.001 (0.547)	Loss 2.5108 (2.4724)	Entropy 0.59288 (0.59245)	Top-1 acc 62.500 (64.415)	Top-5 acc 83.594 (84.277)	lr 0.00579
Train [82][2110/3239]	Time 0.234 (1.070)	Data Time 0.001 (0.555)	Loss 2.4094 (2.4723)	Entropy 0.59227 (0.59246)	Top-1 acc 67.969 (64.416)	Top-5 acc 84.375 (84.277)	lr 0.00579
Train [82][2120/3239]	Time 0.234 (1.067)	Data Time 0.001 (0.552)	Loss 2.2495 (2.4721)	Entropy 0.59187 (0.59246)	Top-1 acc 71.484 (64.421)	Top-5 acc 87.500 (84.277)	lr 0.00579
Train [82][2130/3239]	Time 0.250 (1.064)	Data Time 0.001 (0.550)	Loss 2.5844 (2.4723)	Entropy 0.59188 (0.59245)	Top-1 acc 60.938 (64.417)	Top-5 acc 81.250 (84.273)	lr 0.00579
Train [82][2140/3239]	Time 13.026 (1.072)	Data Time 12.781 (0.557)	Loss 2.3131 (2.4724)	Entropy 0.59155 (0.59245)	Top-1 acc 66.016 (64.412)	Top-5 acc 86.328 (84.276)	lr 0.00579
Train [82][2150/3239]	Time 0.419 (1.095)	Data Time 0.005 (0.555)	Loss 2.2705 (2.4726)	Entropy 0.59174 (0.59245)	Top-1 acc 65.625 (64.406)	Top-5 acc 87.500 (84.272)	lr 0.00578
Train [82][2160/3239]	Time 0.244 (1.093)	Data Time 0.002 (0.553)	Loss 2.5981 (2.4728)	Entropy 0.59126 (0.59244)	Top-1 acc 63.672 (64.404)	Top-5 acc 81.250 (84.269)	lr 0.00578
Train [82][2170/3239]	Time 0.286 (1.090)	Data Time 0.002 (0.550)	Loss 2.6043 (2.4729)	Entropy 0.59131 (0.59244)	Top-1 acc 60.938 (64.399)	Top-5 acc 83.984 (84.266)	lr 0.00578
Train [82][2180/3239]	Time 0.288 (1.087)	Data Time 0.001 (0.547)	Loss 2.5496 (2.4731)	Entropy 0.59149 (0.59243)	Top-1 acc 61.719 (64.393)	Top-5 acc 83.594 (84.261)	lr 0.00578
Train [82][2190/3239]	Time 0.237 (1.084)	Data Time 0.001 (0.545)	Loss 2.6521 (2.4731)	Entropy 0.59149 (0.59243)	Top-1 acc 59.766 (64.393)	Top-5 acc 82.422 (84.262)	lr 0.00578
Train [82][2200/3239]	Time 0.247 (1.081)	Data Time 0.001 (0.543)	Loss 2.4915 (2.4735)	Entropy 0.59157 (0.59242)	Top-1 acc 63.281 (64.382)	Top-5 acc 87.109 (84.259)	lr 0.00578
Train [82][2210/3239]	Time 0.254 (1.078)	Data Time 0.001 (0.540)	Loss 2.4048 (2.4735)	Entropy 0.59129 (0.59242)	Top-1 acc 65.625 (64.383)	Top-5 acc 87.891 (84.260)	lr 0.00578
Train [82][2220/3239]	Time 0.568 (1.077)	Data Time 0.323 (0.539)	Loss 2.4175 (2.4735)	Entropy 0.59110 (0.59241)	Top-1 acc 67.578 (64.380)	Top-5 acc 85.547 (84.263)	lr 0.00578
Train [82][2230/3239]	Time 0.256 (1.077)	Data Time 0.001 (0.540)	Loss 2.3853 (2.4737)	Entropy 0.59092 (0.59241)	Top-1 acc 65.234 (64.372)	Top-5 acc 87.500 (84.262)	lr 0.00578
Train [82][2240/3239]	Time 0.261 (1.076)	Data Time 0.002 (0.539)	Loss 2.4742 (2.4739)	Entropy 0.59108 (0.59240)	Top-1 acc 63.672 (64.368)	Top-5 acc 82.422 (84.257)	lr 0.00578
Train [82][2250/3239]	Time 0.373 (1.079)	Data Time 0.001 (0.543)	Loss 2.6887 (2.4740)	Entropy 0.59120 (0.59240)	Top-1 acc 60.938 (64.367)	Top-5 acc 81.641 (84.259)	lr 0.00578
Train [82][2260/3239]	Time 0.268 (1.080)	Data Time 0.001 (0.544)	Loss 2.6105 (2.4740)	Entropy 0.59152 (0.59239)	Top-1 acc 61.719 (64.366)	Top-5 acc 83.594 (84.260)	lr 0.00578
Train [82][2270/3239]	Time 0.231 (1.077)	Data Time 0.001 (0.541)	Loss 2.6514 (2.4743)	Entropy 0.59160 (0.59239)	Top-1 acc 59.375 (64.359)	Top-5 acc 81.250 (84.255)	lr 0.00577
Train [82][2280/3239]	Time 0.242 (1.079)	Data Time 0.001 (0.544)	Loss 2.5164 (2.4741)	Entropy 0.59122 (0.59238)	Top-1 acc 61.328 (64.357)	Top-5 acc 85.547 (84.258)	lr 0.00577
Train [82][2290/3239]	Time 0.241 (1.079)	Data Time 0.001 (0.544)	Loss 2.3916 (2.4743)	Entropy 0.59142 (0.59238)	Top-1 acc 67.969 (64.356)	Top-5 acc 84.375 (84.253)	lr 0.00577
Train [82][2300/3239]	Time 0.244 (1.078)	Data Time 0.001 (0.543)	Loss 2.5893 (2.4744)	Entropy 0.59156 (0.59238)	Top-1 acc 64.453 (64.356)	Top-5 acc 82.031 (84.250)	lr 0.00577
Train [82][2310/3239]	Time 10.505 (1.079)	Data Time 10.242 (0.545)	Loss 2.3890 (2.4743)	Entropy 0.59142 (0.59237)	Top-1 acc 66.406 (64.358)	Top-5 acc 83.984 (84.251)	lr 0.00577
Train [82][2320/3239]	Time 2.440 (1.080)	Data Time 2.084 (0.546)	Loss 2.3665 (2.4744)	Entropy 0.59167 (0.59237)	Top-1 acc 65.234 (64.353)	Top-5 acc 86.328 (84.247)	lr 0.00577
Train [82][2330/3239]	Time 0.248 (1.078)	Data Time 0.001 (0.545)	Loss 2.5485 (2.4749)	Entropy 0.59156 (0.59236)	Top-1 acc 61.328 (64.345)	Top-5 acc 83.984 (84.239)	lr 0.00577
Train [82][2340/3239]	Time 0.252 (1.077)	Data Time 0.002 (0.544)	Loss 2.4891 (2.4749)	Entropy 0.59139 (0.59236)	Top-1 acc 63.672 (64.343)	Top-5 acc 83.594 (84.242)	lr 0.00577
Train [82][2350/3239]	Time 0.237 (1.079)	Data Time 0.001 (0.546)	Loss 2.4843 (2.4751)	Entropy 0.59139 (0.59236)	Top-1 acc 66.016 (64.340)	Top-5 acc 80.859 (84.237)	lr 0.00577
Train [82][2360/3239]	Time 4.338 (1.080)	Data Time 4.081 (0.547)	Loss 2.4986 (2.4751)	Entropy 0.59144 (0.59235)	Top-1 acc 65.625 (64.339)	Top-5 acc 85.156 (84.237)	lr 0.00577
Train [82][2370/3239]	Time 0.231 (1.077)	Data Time 0.001 (0.545)	Loss 2.8643 (2.4752)	Entropy 0.59126 (0.59235)	Top-1 acc 56.641 (64.335)	Top-5 acc 77.734 (84.233)	lr 0.00577
Train [82][2380/3239]	Time 0.253 (1.080)	Data Time 0.001 (0.549)	Loss 2.3957 (2.4752)	Entropy 0.59125 (0.59235)	Top-1 acc 62.500 (64.333)	Top-5 acc 88.672 (84.236)	lr 0.00577
Train [82][2390/3239]	Time 0.228 (1.080)	Data Time 0.001 (0.548)	Loss 2.5915 (2.4752)	Entropy 0.59138 (0.59234)	Top-1 acc 61.328 (64.335)	Top-5 acc 82.812 (84.235)	lr 0.00576
Train [82][2400/3239]	Time 1.381 (1.078)	Data Time 1.142 (0.547)	Loss 2.3372 (2.4750)	Entropy 0.59149 (0.59234)	Top-1 acc 67.969 (64.339)	Top-5 acc 87.109 (84.241)	lr 0.00576
Train [82][2410/3239]	Time 0.358 (1.080)	Data Time 0.001 (0.549)	Loss 2.5501 (2.4752)	Entropy 0.59124 (0.59233)	Top-1 acc 65.625 (64.334)	Top-5 acc 82.812 (84.237)	lr 0.00576
Train [82][2420/3239]	Time 0.237 (1.081)	Data Time 0.001 (0.551)	Loss 2.4033 (2.4752)	Entropy 0.59131 (0.59233)	Top-1 acc 68.750 (64.337)	Top-5 acc 86.328 (84.237)	lr 0.00576
Train [82][2430/3239]	Time 0.237 (1.079)	Data Time 0.001 (0.550)	Loss 2.6673 (2.4754)	Entropy 0.59157 (0.59232)	Top-1 acc 57.422 (64.330)	Top-5 acc 79.297 (84.232)	lr 0.00576
Train [82][2440/3239]	Time 0.256 (1.081)	Data Time 0.001 (0.551)	Loss 2.3899 (2.4754)	Entropy 0.59152 (0.59232)	Top-1 acc 66.406 (64.335)	Top-5 acc 84.375 (84.227)	lr 0.00576
Train [82][2450/3239]	Time 0.257 (1.080)	Data Time 0.001 (0.551)	Loss 2.5834 (2.4755)	Entropy 0.59169 (0.59232)	Top-1 acc 63.281 (64.335)	Top-5 acc 81.250 (84.224)	lr 0.00576
Train [82][2460/3239]	Time 0.235 (1.080)	Data Time 0.001 (0.551)	Loss 2.6033 (2.4756)	Entropy 0.59169 (0.59232)	Top-1 acc 62.500 (64.333)	Top-5 acc 82.812 (84.223)	lr 0.00576
Train [82][2470/3239]	Time 8.898 (1.080)	Data Time 8.610 (0.552)	Loss 2.2788 (2.4756)	Entropy 0.59199 (0.59231)	Top-1 acc 69.141 (64.333)	Top-5 acc 89.453 (84.224)	lr 0.00576
Train [82][2480/3239]	Time 3.517 (1.080)	Data Time 3.139 (0.552)	Loss 2.5099 (2.4754)	Entropy 0.59172 (0.59231)	Top-1 acc 62.500 (64.335)	Top-5 acc 84.766 (84.229)	lr 0.00576
Train [82][2490/3239]	Time 0.232 (1.080)	Data Time 0.001 (0.553)	Loss 2.3824 (2.4753)	Entropy 0.59191 (0.59231)	Top-1 acc 65.625 (64.334)	Top-5 acc 86.719 (84.231)	lr 0.00576
Train [82][2500/3239]	Time 0.246 (1.077)	Data Time 0.001 (0.551)	Loss 2.6247 (2.4753)	Entropy 0.59193 (0.59231)	Top-1 acc 63.672 (64.332)	Top-5 acc 84.375 (84.231)	lr 0.00575
Train [82][2510/3239]	Time 0.249 (1.080)	Data Time 0.001 (0.554)	Loss 2.4546 (2.4751)	Entropy 0.59205 (0.59231)	Top-1 acc 63.672 (64.335)	Top-5 acc 85.156 (84.232)	lr 0.00575
Train [82][2520/3239]	Time 0.329 (1.080)	Data Time 0.080 (0.554)	Loss 2.4944 (2.4751)	Entropy 0.59206 (0.59231)	Top-1 acc 61.328 (64.334)	Top-5 acc 83.984 (84.234)	lr 0.00575
Train [82][2530/3239]	Time 0.906 (1.078)	Data Time 0.622 (0.552)	Loss 2.4236 (2.4752)	Entropy 0.59218 (0.59230)	Top-1 acc 64.062 (64.328)	Top-5 acc 83.984 (84.232)	lr 0.00575
Train [82][2540/3239]	Time 0.236 (1.081)	Data Time 0.001 (0.556)	Loss 2.5330 (2.4752)	Entropy 0.59237 (0.59230)	Top-1 acc 61.719 (64.324)	Top-5 acc 84.766 (84.233)	lr 0.00575
Train [82][2550/3239]	Time 0.238 (1.082)	Data Time 0.001 (0.557)	Loss 2.5453 (2.4753)	Entropy 0.59248 (0.59230)	Top-1 acc 57.422 (64.319)	Top-5 acc 82.812 (84.237)	lr 0.00575
Train [82][2560/3239]	Time 0.271 (1.080)	Data Time 0.001 (0.555)	Loss 2.4779 (2.4752)	Entropy 0.59256 (0.59231)	Top-1 acc 66.016 (64.324)	Top-5 acc 83.984 (84.237)	lr 0.00575
Train [82][2570/3239]	Time 0.281 (1.081)	Data Time 0.002 (0.557)	Loss 2.4056 (2.4753)	Entropy 0.59216 (0.59231)	Top-1 acc 67.969 (64.323)	Top-5 acc 84.375 (84.234)	lr 0.00575
Train [82][2580/3239]	Time 2.816 (1.083)	Data Time 2.526 (0.559)	Loss 2.6277 (2.4754)	Entropy 0.59225 (0.59230)	Top-1 acc 59.766 (64.322)	Top-5 acc 82.812 (84.233)	lr 0.00575
Train [82][2590/3239]	Time 0.252 (1.081)	Data Time 0.001 (0.557)	Loss 2.3226 (2.4753)	Entropy 0.59232 (0.59230)	Top-1 acc 66.797 (64.320)	Top-5 acc 89.062 (84.235)	lr 0.00575
Train [82][2600/3239]	Time 0.245 (1.082)	Data Time 0.001 (0.559)	Loss 2.4659 (2.4756)	Entropy 0.59212 (0.59230)	Top-1 acc 60.938 (64.315)	Top-5 acc 83.594 (84.234)	lr 0.00575
Train [82][2610/3239]	Time 0.229 (1.083)	Data Time 0.001 (0.560)	Loss 2.4384 (2.4757)	Entropy 0.59209 (0.59230)	Top-1 acc 62.891 (64.311)	Top-5 acc 82.812 (84.231)	lr 0.00575
Train [82][2620/3239]	Time 0.226 (1.082)	Data Time 0.001 (0.560)	Loss 2.3942 (2.4758)	Entropy 0.59165 (0.59230)	Top-1 acc 65.625 (64.307)	Top-5 acc 85.547 (84.226)	lr 0.00574
Train [82][2630/3239]	Time 9.356 (1.083)	Data Time 9.110 (0.561)	Loss 2.4129 (2.4758)	Entropy 0.59189 (0.59230)	Top-1 acc 65.234 (64.303)	Top-5 acc 83.594 (84.226)	lr 0.00574
Train [82][2640/3239]	Time 7.720 (1.084)	Data Time 7.376 (0.563)	Loss 2.2984 (2.4759)	Entropy 0.59144 (0.59230)	Top-1 acc 68.359 (64.300)	Top-5 acc 88.281 (84.225)	lr 0.00574
Train [82][2650/3239]	Time 0.251 (1.083)	Data Time 0.001 (0.562)	Loss 2.4735 (2.4761)	Entropy 0.59122 (0.59229)	Top-1 acc 66.406 (64.300)	Top-5 acc 82.812 (84.220)	lr 0.00574
Train [82][2660/3239]	Time 1.626 (1.081)	Data Time 1.365 (0.560)	Loss 2.6261 (2.4761)	Entropy 0.59084 (0.59229)	Top-1 acc 58.984 (64.300)	Top-5 acc 82.031 (84.221)	lr 0.00574
Train [82][2670/3239]	Time 0.242 (1.083)	Data Time 0.001 (0.562)	Loss 2.4689 (2.4760)	Entropy 0.59075 (0.59228)	Top-1 acc 65.625 (64.302)	Top-5 acc 85.156 (84.222)	lr 0.00574
Train [82][2680/3239]	Time 0.239 (1.085)	Data Time 0.001 (0.564)	Loss 2.3195 (2.4761)	Entropy 0.59082 (0.59228)	Top-1 acc 67.578 (64.302)	Top-5 acc 85.547 (84.219)	lr 0.00574
Train [82][2690/3239]	Time 0.261 (1.082)	Data Time 0.001 (0.562)	Loss 2.3982 (2.4762)	Entropy 0.59088 (0.59227)	Top-1 acc 63.281 (64.295)	Top-5 acc 86.719 (84.216)	lr 0.00574
Train [82][2700/3239]	Time 2.466 (1.084)	Data Time 2.208 (0.565)	Loss 2.4040 (2.4762)	Entropy 0.59110 (0.59227)	Top-1 acc 66.406 (64.295)	Top-5 acc 84.766 (84.214)	lr 0.00574
Train [82][2710/3239]	Time 0.346 (1.087)	Data Time 0.001 (0.567)	Loss 2.5159 (2.4762)	Entropy 0.59104 (0.59226)	Top-1 acc 64.062 (64.296)	Top-5 acc 82.812 (84.214)	lr 0.00574
Train [82][2720/3239]	Time 0.240 (1.084)	Data Time 0.001 (0.565)	Loss 2.4551 (2.4762)	Entropy 0.59065 (0.59226)	Top-1 acc 66.406 (64.300)	Top-5 acc 83.984 (84.212)	lr 0.00574
Train [82][2730/3239]	Time 0.251 (1.084)	Data Time 0.001 (0.566)	Loss 2.3539 (2.4762)	Entropy 0.59074 (0.59225)	Top-1 acc 70.703 (64.301)	Top-5 acc 88.672 (84.215)	lr 0.00574
Train [82][2740/3239]	Time 0.244 (1.086)	Data Time 0.001 (0.568)	Loss 2.2940 (2.4763)	Entropy 0.59056 (0.59225)	Top-1 acc 67.969 (64.294)	Top-5 acc 86.328 (84.214)	lr 0.00573
Train [82][2750/3239]	Time 0.241 (1.085)	Data Time 0.001 (0.567)	Loss 2.6484 (2.4765)	Entropy 0.59048 (0.59224)	Top-1 acc 60.547 (64.292)	Top-5 acc 81.250 (84.210)	lr 0.00573
Train [82][2760/3239]	Time 0.229 (1.085)	Data Time 0.001 (0.568)	Loss 2.5975 (2.4766)	Entropy 0.59031 (0.59223)	Top-1 acc 60.156 (64.290)	Top-5 acc 82.422 (84.206)	lr 0.00573
Train [82][2770/3239]	Time 0.239 (1.088)	Data Time 0.001 (0.570)	Loss 2.5284 (2.4767)	Entropy 0.59042 (0.59223)	Top-1 acc 63.281 (64.286)	Top-5 acc 81.641 (84.206)	lr 0.00573
Train [82][2780/3239]	Time 0.234 (1.087)	Data Time 0.001 (0.570)	Loss 2.5857 (2.4767)	Entropy 0.59040 (0.59222)	Top-1 acc 64.062 (64.287)	Top-5 acc 82.422 (84.204)	lr 0.00573
Train [82][2790/3239]	Time 3.526 (1.086)	Data Time 3.266 (0.569)	Loss 2.3772 (2.4767)	Entropy 0.59068 (0.59221)	Top-1 acc 66.016 (64.287)	Top-5 acc 85.547 (84.203)	lr 0.00573
Train [82][2800/3239]	Time 5.074 (1.086)	Data Time 4.709 (0.570)	Loss 2.4507 (2.4770)	Entropy 0.59033 (0.59221)	Top-1 acc 64.844 (64.282)	Top-5 acc 83.203 (84.198)	lr 0.00573
Train [82][2810/3239]	Time 0.311 (1.106)	Data Time 0.002 (0.570)	Loss 2.4346 (2.4771)	Entropy 0.59028 (0.59220)	Top-1 acc 64.844 (64.279)	Top-5 acc 85.156 (84.196)	lr 0.00573
Train [82][2820/3239]	Time 0.245 (1.103)	Data Time 0.002 (0.568)	Loss 2.4696 (2.4772)	Entropy 0.58985 (0.59219)	Top-1 acc 66.016 (64.279)	Top-5 acc 86.719 (84.198)	lr 0.00573
Train [82][2830/3239]	Time 0.242 (1.101)	Data Time 0.001 (0.566)	Loss 2.4069 (2.4770)	Entropy 0.58967 (0.59219)	Top-1 acc 64.844 (64.278)	Top-5 acc 86.328 (84.201)	lr 0.00573
Train [82][2840/3239]	Time 0.259 (1.099)	Data Time 0.001 (0.564)	Loss 2.4377 (2.4773)	Entropy 0.58926 (0.59218)	Top-1 acc 64.062 (64.274)	Top-5 acc 85.156 (84.195)	lr 0.00573
Train [82][2850/3239]	Time 0.249 (1.096)	Data Time 0.001 (0.562)	Loss 2.5161 (2.4773)	Entropy 0.58939 (0.59217)	Top-1 acc 63.281 (64.277)	Top-5 acc 82.031 (84.193)	lr 0.00573
Train [82][2860/3239]	Time 0.236 (1.094)	Data Time 0.001 (0.560)	Loss 2.6038 (2.4772)	Entropy 0.58920 (0.59216)	Top-1 acc 59.375 (64.277)	Top-5 acc 82.812 (84.197)	lr 0.00572
Train [82][2870/3239]	Time 1.586 (1.095)	Data Time 1.318 (0.562)	Loss 2.4042 (2.4769)	Entropy 0.58929 (0.59215)	Top-1 acc 66.797 (64.283)	Top-5 acc 84.766 (84.200)	lr 0.00572
Train [82][2880/3239]	Time 0.255 (1.094)	Data Time 0.002 (0.561)	Loss 2.5215 (2.4771)	Entropy 0.58956 (0.59214)	Top-1 acc 59.375 (64.280)	Top-5 acc 83.984 (84.198)	lr 0.00572
Train [82][2890/3239]	Time 0.247 (1.092)	Data Time 0.001 (0.559)	Loss 2.5083 (2.4770)	Entropy 0.58945 (0.59213)	Top-1 acc 61.719 (64.284)	Top-5 acc 83.594 (84.200)	lr 0.00572
Train [82][2900/3239]	Time 0.243 (1.090)	Data Time 0.001 (0.557)	Loss 2.3890 (2.4769)	Entropy 0.58972 (0.59212)	Top-1 acc 67.969 (64.287)	Top-5 acc 85.547 (84.203)	lr 0.00572
Train [82][2910/3239]	Time 0.258 (1.095)	Data Time 0.001 (0.563)	Loss 2.3050 (2.4771)	Entropy 0.58974 (0.59211)	Top-1 acc 71.484 (64.282)	Top-5 acc 89.453 (84.200)	lr 0.00572
Train [82][2920/3239]	Time 0.778 (1.093)	Data Time 0.533 (0.562)	Loss 2.2311 (2.4769)	Entropy 0.58957 (0.59210)	Top-1 acc 70.312 (64.285)	Top-5 acc 87.891 (84.202)	lr 0.00572
Train [82][2930/3239]	Time 1.983 (1.092)	Data Time 1.732 (0.560)	Loss 2.4673 (2.4769)	Entropy 0.58969 (0.59209)	Top-1 acc 62.500 (64.286)	Top-5 acc 85.156 (84.203)	lr 0.00572
Train [82][2940/3239]	Time 0.243 (1.097)	Data Time 0.001 (0.566)	Loss 2.6152 (2.4768)	Entropy 0.58951 (0.59208)	Top-1 acc 61.719 (64.291)	Top-5 acc 81.250 (84.205)	lr 0.00572
Train [82][2950/3239]	Time 0.232 (1.095)	Data Time 0.001 (0.564)	Loss 2.3567 (2.4766)	Entropy 0.58963 (0.59208)	Top-1 acc 68.359 (64.297)	Top-5 acc 85.156 (84.208)	lr 0.00572
Train [82][2960/3239]	Time 0.340 (1.093)	Data Time 0.001 (0.562)	Loss 2.5604 (2.4766)	Entropy 0.58976 (0.59207)	Top-1 acc 62.891 (64.294)	Top-5 acc 83.984 (84.208)	lr 0.00572
Train [82][2970/3239]	Time 0.289 (1.099)	Data Time 0.001 (0.569)	Loss 2.4370 (2.4769)	Entropy 0.58989 (0.59206)	Top-1 acc 65.234 (64.286)	Top-5 acc 85.547 (84.205)	lr 0.00571
Train [82][2980/3239]	Time 0.247 (1.097)	Data Time 0.001 (0.567)	Loss 2.5901 (2.4771)	Entropy 0.59001 (0.59205)	Top-1 acc 62.109 (64.286)	Top-5 acc 81.250 (84.198)	lr 0.00571
Train [82][2990/3239]	Time 0.242 (1.095)	Data Time 0.001 (0.565)	Loss 2.4404 (2.4773)	Entropy 0.58983 (0.59205)	Top-1 acc 64.062 (64.280)	Top-5 acc 83.203 (84.195)	lr 0.00571
Train [82][3000/3239]	Time 0.253 (1.102)	Data Time 0.001 (0.573)	Loss 2.3246 (2.4773)	Entropy 0.59001 (0.59204)	Top-1 acc 66.406 (64.280)	Top-5 acc 87.109 (84.195)	lr 0.00571
Train [82][3010/3239]	Time 0.241 (1.100)	Data Time 0.001 (0.571)	Loss 2.3511 (2.4773)	Entropy 0.58966 (0.59203)	Top-1 acc 63.672 (64.279)	Top-5 acc 85.156 (84.195)	lr 0.00571
Train [82][3020/3239]	Time 0.234 (1.098)	Data Time 0.001 (0.569)	Loss 2.4491 (2.4774)	Entropy 0.58970 (0.59202)	Top-1 acc 62.891 (64.276)	Top-5 acc 85.156 (84.190)	lr 0.00571
Train [82][3030/3239]	Time 15.928 (1.104)	Data Time 15.512 (0.575)	Loss 2.5194 (2.4778)	Entropy 0.58961 (0.59202)	Top-1 acc 62.891 (64.265)	Top-5 acc 81.641 (84.183)	lr 0.00571
Train [82][3040/3239]	Time 0.252 (1.101)	Data Time 0.001 (0.574)	Loss 2.5333 (2.4778)	Entropy 0.58958 (0.59201)	Top-1 acc 62.891 (64.265)	Top-5 acc 83.594 (84.184)	lr 0.00571
Train [82][3050/3239]	Time 0.235 (1.099)	Data Time 0.001 (0.572)	Loss 2.7390 (2.4779)	Entropy 0.58919 (0.59200)	Top-1 acc 56.641 (64.261)	Top-5 acc 77.734 (84.181)	lr 0.00571
Train [82][3060/3239]	Time 0.228 (1.098)	Data Time 0.001 (0.571)	Loss 2.3670 (2.4778)	Entropy 0.58929 (0.59199)	Top-1 acc 66.406 (64.262)	Top-5 acc 87.500 (84.184)	lr 0.00571
Train [82][3070/3239]	Time 0.251 (1.104)	Data Time 0.001 (0.577)	Loss 2.6465 (2.4777)	Entropy 0.58915 (0.59198)	Top-1 acc 56.641 (64.264)	Top-5 acc 79.297 (84.187)	lr 0.00571
Train [82][3080/3239]	Time 0.258 (1.101)	Data Time 0.002 (0.575)	Loss 2.3490 (2.4777)	Entropy 0.58917 (0.59197)	Top-1 acc 66.016 (64.263)	Top-5 acc 89.453 (84.189)	lr 0.00571
Train [82][3090/3239]	Time 0.261 (1.100)	Data Time 0.001 (0.574)	Loss 2.5296 (2.4777)	Entropy 0.58885 (0.59196)	Top-1 acc 59.375 (64.263)	Top-5 acc 82.422 (84.189)	lr 0.00570
Train [82][3100/3239]	Time 0.243 (1.105)	Data Time 0.001 (0.579)	Loss 2.4265 (2.4777)	Entropy 0.58911 (0.59195)	Top-1 acc 64.453 (64.263)	Top-5 acc 85.547 (84.187)	lr 0.00570
Train [82][3110/3239]	Time 0.294 (1.103)	Data Time 0.002 (0.577)	Loss 2.4982 (2.4776)	Entropy 0.58928 (0.59195)	Top-1 acc 62.109 (64.267)	Top-5 acc 79.297 (84.190)	lr 0.00570
Train [82][3120/3239]	Time 0.335 (1.101)	Data Time 0.001 (0.575)	Loss 2.3416 (2.4774)	Entropy 0.58943 (0.59194)	Top-1 acc 67.578 (64.269)	Top-5 acc 86.328 (84.191)	lr 0.00570
Train [82][3130/3239]	Time 0.243 (1.105)	Data Time 0.001 (0.580)	Loss 2.4765 (2.4774)	Entropy 0.58963 (0.59193)	Top-1 acc 63.281 (64.270)	Top-5 acc 84.375 (84.192)	lr 0.00570
Train [82][3140/3239]	Time 0.251 (1.104)	Data Time 0.001 (0.579)	Loss 2.5441 (2.4773)	Entropy 0.58963 (0.59192)	Top-1 acc 64.062 (64.279)	Top-5 acc 80.469 (84.195)	lr 0.00570
Train [82][3150/3239]	Time 2.571 (1.102)	Data Time 2.305 (0.578)	Loss 2.4568 (2.4772)	Entropy 0.58980 (0.59192)	Top-1 acc 62.109 (64.276)	Top-5 acc 83.203 (84.194)	lr 0.00570
Train [82][3160/3239]	Time 0.249 (1.107)	Data Time 0.001 (0.583)	Loss 2.6320 (2.4773)	Entropy 0.58951 (0.59191)	Top-1 acc 62.500 (64.276)	Top-5 acc 80.859 (84.194)	lr 0.00570
Train [82][3170/3239]	Time 0.249 (1.106)	Data Time 0.001 (0.582)	Loss 2.4609 (2.4772)	Entropy 0.58981 (0.59190)	Top-1 acc 62.500 (64.279)	Top-5 acc 85.938 (84.196)	lr 0.00570
Train [82][3180/3239]	Time 0.233 (1.104)	Data Time 0.000 (0.580)	Loss 2.3155 (2.4771)	Entropy 0.58997 (0.59190)	Top-1 acc 69.531 (64.282)	Top-5 acc 85.938 (84.197)	lr 0.00570
Train [82][3190/3239]	Time 19.716 (1.109)	Data Time 19.337 (0.586)	Loss 2.3549 (2.4770)	Entropy 0.59020 (0.59189)	Top-1 acc 67.969 (64.284)	Top-5 acc 85.938 (84.200)	lr 0.00570
Train [82][3200/3239]	Time 0.239 (1.108)	Data Time 0.000 (0.585)	Loss 2.4481 (2.4770)	Entropy 0.59001 (0.59188)	Top-1 acc 63.281 (64.282)	Top-5 acc 87.500 (84.201)	lr 0.00570
Train [82][3210/3239]	Time 0.244 (1.106)	Data Time 0.000 (0.583)	Loss 2.3597 (2.4771)	Entropy 0.59012 (0.59188)	Top-1 acc 69.141 (64.282)	Top-5 acc 86.328 (84.199)	lr 0.00569
Train [82][3220/3239]	Time 0.228 (1.104)	Data Time 0.000 (0.582)	Loss 2.7637 (2.4771)	Entropy 0.59022 (0.59187)	Top-1 acc 57.422 (64.284)	Top-5 acc 80.078 (84.197)	lr 0.00569
Train [82][3230/3239]	Time 0.224 (1.108)	Data Time 0.000 (0.586)	Loss 2.5697 (2.4771)	Entropy 0.59017 (0.59187)	Top-1 acc 61.719 (64.284)	Top-5 acc 83.594 (84.199)	lr 0.00569
Train [82][3239/3239]	Time 0.917 (1.106)	Data Time 0.000 (0.584)	Loss 2.8574 (2.4771)	Entropy 0.59012 (0.59186)	Top-1 acc 56.790 (64.281)	Top-5 acc 81.481 (84.199)	lr 0.00569
==========Valid [82/120]	loss 1.273	top-1 acc 70.783 (70.783)	top-5 acc 89.409	Train top-1 64.281	top-5 84.199	Entropy 0.59012	Latency-None: 0.000ms	Flops: 539.00M
Train [83][0/3239]	Time 56.455 (56.455)	Data Time 54.651 (54.651)	Loss 2.4298 (2.4298)	Entropy 0.59007 (0.59007)	Top-1 acc 64.844 (64.844)	Top-5 acc 83.203 (83.203)	lr 0.00569
Train [83][10/3239]	Time 0.233 (5.615)	Data Time 0.001 (5.009)	Loss 2.4600 (2.5036)	Entropy 0.58986 (0.58997)	Top-1 acc 62.891 (62.749)	Top-5 acc 83.594 (83.594)	lr 0.00569
Train [83][20/3239]	Time 0.337 (3.141)	Data Time 0.001 (2.625)	Loss 2.4887 (2.4691)	Entropy 0.58940 (0.58979)	Top-1 acc 66.016 (64.044)	Top-5 acc 84.766 (84.505)	lr 0.00569
Train [83][30/3239]	Time 0.242 (2.261)	Data Time 0.001 (1.778)	Loss 2.6145 (2.4633)	Entropy 0.58896 (0.58960)	Top-1 acc 59.375 (64.529)	Top-5 acc 81.641 (84.627)	lr 0.00569
Train [83][40/3239]	Time 0.248 (2.039)	Data Time 0.002 (1.567)	Loss 2.4661 (2.4564)	Entropy 0.58889 (0.58943)	Top-1 acc 63.672 (64.901)	Top-5 acc 84.766 (84.546)	lr 0.00569
Train [83][50/3239]	Time 0.254 (1.762)	Data Time 0.001 (1.301)	Loss 2.4295 (2.4587)	Entropy 0.58866 (0.58931)	Top-1 acc 66.797 (64.920)	Top-5 acc 85.156 (84.444)	lr 0.00569
Train [83][60/3239]	Time 0.274 (1.542)	Data Time 0.002 (1.088)	Loss 2.4123 (2.4571)	Entropy 0.58891 (0.58922)	Top-1 acc 68.359 (65.183)	Top-5 acc 85.156 (84.439)	lr 0.00569
Train [83][70/3239]	Time 0.238 (1.501)	Data Time 0.001 (1.048)	Loss 2.3822 (2.4507)	Entropy 0.58887 (0.58917)	Top-1 acc 66.797 (65.278)	Top-5 acc 84.766 (84.590)	lr 0.00569
Train [83][80/3239]	Time 0.237 (1.432)	Data Time 0.001 (0.985)	Loss 2.5027 (2.4514)	Entropy 0.58863 (0.58911)	Top-1 acc 63.672 (65.283)	Top-5 acc 83.984 (84.582)	lr 0.00569
Train [83][90/3239]	Time 0.237 (1.321)	Data Time 0.002 (0.877)	Loss 2.4279 (2.4579)	Entropy 0.58863 (0.58906)	Top-1 acc 66.016 (65.093)	Top-5 acc 84.766 (84.469)	lr 0.00568
Train [83][100/3239]	Time 0.239 (1.297)	Data Time 0.001 (0.855)	Loss 2.4400 (2.4557)	Entropy 0.58844 (0.58901)	Top-1 acc 63.281 (65.142)	Top-5 acc 84.766 (84.495)	lr 0.00568
Train [83][110/3239]	Time 0.235 (1.246)	Data Time 0.001 (0.806)	Loss 2.4657 (2.4538)	Entropy 0.58840 (0.58896)	Top-1 acc 66.797 (65.136)	Top-5 acc 85.547 (84.583)	lr 0.00568
Train [83][120/3239]	Time 0.245 (1.177)	Data Time 0.001 (0.739)	Loss 2.5887 (2.4567)	Entropy 0.58854 (0.58892)	Top-1 acc 59.375 (65.037)	Top-5 acc 82.422 (84.533)	lr 0.00568
Train [83][130/3239]	Time 0.249 (1.185)	Data Time 0.001 (0.748)	Loss 2.5941 (2.4600)	Entropy 0.58846 (0.58889)	Top-1 acc 62.500 (64.915)	Top-5 acc 81.641 (84.518)	lr 0.00568
Train [83][140/3239]	Time 0.235 (1.151)	Data Time 0.001 (0.716)	Loss 2.5424 (2.4573)	Entropy 0.58863 (0.58886)	Top-1 acc 60.938 (64.979)	Top-5 acc 83.203 (84.552)	lr 0.00568
Train [83][150/3239]	Time 0.253 (1.101)	Data Time 0.001 (0.668)	Loss 2.5863 (2.4581)	Entropy 0.58874 (0.58885)	Top-1 acc 60.547 (64.921)	Top-5 acc 85.547 (84.595)	lr 0.00568
Train [83][160/3239]	Time 6.322 (1.098)	Data Time 6.031 (0.664)	Loss 2.6350 (2.4560)	Entropy 0.58851 (0.58884)	Top-1 acc 57.031 (64.931)	Top-5 acc 82.422 (84.654)	lr 0.00568
Train [83][170/3239]	Time 4.279 (1.081)	Data Time 4.026 (0.649)	Loss 2.5373 (2.4557)	Entropy 0.58841 (0.58882)	Top-1 acc 61.328 (64.921)	Top-5 acc 82.812 (84.663)	lr 0.00568
Train [83][180/3239]	Time 0.332 (1.045)	Data Time 0.001 (0.613)	Loss 2.5416 (2.4603)	Entropy 0.58850 (0.58879)	Top-1 acc 61.719 (64.809)	Top-5 acc 84.375 (84.595)	lr 0.00568
Train [83][190/3239]	Time 0.228 (1.012)	Data Time 0.001 (0.581)	Loss 2.6197 (2.4606)	Entropy 0.58811 (0.58877)	Top-1 acc 60.938 (64.795)	Top-5 acc 81.641 (84.582)	lr 0.00568
Train [83][200/3239]	Time 0.251 (1.021)	Data Time 0.001 (0.589)	Loss 2.4906 (2.4624)	Entropy 0.58822 (0.58874)	Top-1 acc 64.062 (64.787)	Top-5 acc 83.594 (84.554)	lr 0.00568
Train [83][210/3239]	Time 0.232 (1.006)	Data Time 0.001 (0.575)	Loss 2.6832 (2.4608)	Entropy 0.58806 (0.58871)	Top-1 acc 60.938 (64.816)	Top-5 acc 80.078 (84.571)	lr 0.00567
Train [83][220/3239]	Time 0.289 (1.229)	Data Time 0.004 (0.549)	Loss 2.4840 (2.4627)	Entropy 0.58797 (0.58868)	Top-1 acc 62.109 (64.782)	Top-5 acc 85.156 (84.575)	lr 0.00567
Train [83][230/3239]	Time 0.238 (1.195)	Data Time 0.002 (0.525)	Loss 2.4514 (2.4629)	Entropy 0.58818 (0.58865)	Top-1 acc 63.281 (64.756)	Top-5 acc 85.547 (84.568)	lr 0.00567
Train [83][240/3239]	Time 0.236 (1.162)	Data Time 0.001 (0.503)	Loss 2.4125 (2.4640)	Entropy 0.58822 (0.58863)	Top-1 acc 62.109 (64.716)	Top-5 acc 85.938 (84.553)	lr 0.00567
Train [83][250/3239]	Time 0.254 (1.133)	Data Time 0.002 (0.483)	Loss 2.3475 (2.4626)	Entropy 0.58834 (0.58862)	Top-1 acc 66.406 (64.707)	Top-5 acc 88.281 (84.601)	lr 0.00567
Train [83][260/3239]	Time 0.260 (1.106)	Data Time 0.001 (0.465)	Loss 2.4834 (2.4613)	Entropy 0.58805 (0.58860)	Top-1 acc 64.453 (64.714)	Top-5 acc 85.938 (84.638)	lr 0.00567
Train [83][270/3239]	Time 0.286 (1.080)	Data Time 0.001 (0.448)	Loss 2.4805 (2.4617)	Entropy 0.58821 (0.58858)	Top-1 acc 60.156 (64.681)	Top-5 acc 82.422 (84.634)	lr 0.00567
Train [83][280/3239]	Time 0.252 (1.058)	Data Time 0.002 (0.432)	Loss 2.4828 (2.4599)	Entropy 0.58792 (0.58857)	Top-1 acc 62.109 (64.706)	Top-5 acc 86.328 (84.679)	lr 0.00567
Train [83][290/3239]	Time 0.276 (1.038)	Data Time 0.001 (0.417)	Loss 2.2934 (2.4569)	Entropy 0.58794 (0.58855)	Top-1 acc 67.969 (64.817)	Top-5 acc 88.281 (84.732)	lr 0.00567
Train [83][300/3239]	Time 0.280 (1.019)	Data Time 0.001 (0.403)	Loss 2.5907 (2.4588)	Entropy 0.58778 (0.58853)	Top-1 acc 64.062 (64.772)	Top-5 acc 83.594 (84.689)	lr 0.00567
Train [83][310/3239]	Time 0.260 (1.000)	Data Time 0.002 (0.390)	Loss 2.3723 (2.4591)	Entropy 0.58784 (0.58851)	Top-1 acc 68.750 (64.772)	Top-5 acc 85.547 (84.678)	lr 0.00567
Train [83][320/3239]	Time 0.259 (1.003)	Data Time 0.001 (0.397)	Loss 2.5753 (2.4597)	Entropy 0.58793 (0.58849)	Top-1 acc 61.719 (64.744)	Top-5 acc 80.859 (84.665)	lr 0.00566
Train [83][330/3239]	Time 0.241 (0.986)	Data Time 0.001 (0.385)	Loss 2.3829 (2.4586)	Entropy 0.58809 (0.58847)	Top-1 acc 66.406 (64.773)	Top-5 acc 84.766 (84.666)	lr 0.00566
Train [83][340/3239]	Time 0.353 (0.977)	Data Time 0.001 (0.381)	Loss 2.3876 (2.4581)	Entropy 0.58785 (0.58845)	Top-1 acc 66.016 (64.811)	Top-5 acc 86.719 (84.656)	lr 0.00566
Train [83][350/3239]	Time 0.316 (0.977)	Data Time 0.003 (0.387)	Loss 2.4320 (2.4582)	Entropy 0.58757 (0.58843)	Top-1 acc 66.016 (64.799)	Top-5 acc 85.547 (84.659)	lr 0.00566
Train [83][360/3239]	Time 0.274 (0.966)	Data Time 0.001 (0.380)	Loss 2.4854 (2.4563)	Entropy 0.58747 (0.58841)	Top-1 acc 62.891 (64.836)	Top-5 acc 84.766 (84.686)	lr 0.00566
Train [83][370/3239]	Time 0.236 (0.963)	Data Time 0.001 (0.381)	Loss 2.4869 (2.4569)	Entropy 0.58751 (0.58838)	Top-1 acc 62.500 (64.800)	Top-5 acc 85.156 (84.687)	lr 0.00566
Train [83][380/3239]	Time 0.229 (0.949)	Data Time 0.001 (0.371)	Loss 2.7543 (2.4575)	Entropy 0.58730 (0.58836)	Top-1 acc 54.297 (64.770)	Top-5 acc 78.516 (84.655)	lr 0.00566
Train [83][390/3239]	Time 0.276 (0.957)	Data Time 0.001 (0.382)	Loss 2.4715 (2.4560)	Entropy 0.58737 (0.58833)	Top-1 acc 64.844 (64.800)	Top-5 acc 85.156 (84.675)	lr 0.00566
Train [83][400/3239]	Time 0.243 (0.949)	Data Time 0.001 (0.378)	Loss 2.3179 (2.4558)	Entropy 0.58735 (0.58830)	Top-1 acc 68.359 (64.826)	Top-5 acc 89.062 (84.676)	lr 0.00566
Train [83][410/3239]	Time 0.330 (0.939)	Data Time 0.001 (0.372)	Loss 2.5596 (2.4562)	Entropy 0.58736 (0.58828)	Top-1 acc 61.719 (64.788)	Top-5 acc 83.984 (84.676)	lr 0.00566
Train [83][420/3239]	Time 0.244 (0.941)	Data Time 0.001 (0.376)	Loss 2.3914 (2.4558)	Entropy 0.58738 (0.58826)	Top-1 acc 66.016 (64.812)	Top-5 acc 83.203 (84.665)	lr 0.00566
Train [83][430/3239]	Time 0.235 (0.946)	Data Time 0.001 (0.385)	Loss 2.4751 (2.4564)	Entropy 0.58736 (0.58824)	Top-1 acc 63.281 (64.789)	Top-5 acc 83.984 (84.655)	lr 0.00566
Train [83][440/3239]	Time 0.247 (0.935)	Data Time 0.001 (0.377)	Loss 2.2170 (2.4568)	Entropy 0.58725 (0.58821)	Top-1 acc 72.266 (64.811)	Top-5 acc 89.062 (84.655)	lr 0.00565
Train [83][450/3239]	Time 0.276 (0.929)	Data Time 0.001 (0.373)	Loss 2.4398 (2.4578)	Entropy 0.58733 (0.58819)	Top-1 acc 62.500 (64.768)	Top-5 acc 85.156 (84.627)	lr 0.00565
Train [83][460/3239]	Time 0.487 (0.924)	Data Time 0.236 (0.370)	Loss 2.4337 (2.4586)	Entropy 0.58720 (0.58817)	Top-1 acc 69.531 (64.752)	Top-5 acc 83.594 (84.622)	lr 0.00565
Train [83][470/3239]	Time 0.235 (0.913)	Data Time 0.001 (0.362)	Loss 2.8204 (2.4587)	Entropy 0.58712 (0.58815)	Top-1 acc 51.562 (64.747)	Top-5 acc 77.734 (84.629)	lr 0.00565
Train [83][480/3239]	Time 0.260 (0.904)	Data Time 0.001 (0.354)	Loss 2.5176 (2.4589)	Entropy 0.58698 (0.58813)	Top-1 acc 64.453 (64.744)	Top-5 acc 83.203 (84.625)	lr 0.00565
Train [83][490/3239]	Time 1.375 (0.898)	Data Time 1.077 (0.351)	Loss 2.4182 (2.4584)	Entropy 0.58714 (0.58811)	Top-1 acc 67.578 (64.753)	Top-5 acc 84.766 (84.629)	lr 0.00565
Train [83][500/3239]	Time 0.410 (0.892)	Data Time 0.003 (0.345)	Loss 2.7638 (2.4591)	Entropy 0.58733 (0.58809)	Top-1 acc 56.641 (64.740)	Top-5 acc 79.297 (84.620)	lr 0.00565
Train [83][510/3239]	Time 0.280 (0.883)	Data Time 0.001 (0.338)	Loss 2.3405 (2.4587)	Entropy 0.58711 (0.58807)	Top-1 acc 68.359 (64.743)	Top-5 acc 89.062 (84.633)	lr 0.00565
Train [83][520/3239]	Time 0.276 (0.877)	Data Time 0.003 (0.334)	Loss 2.2763 (2.4580)	Entropy 0.58741 (0.58806)	Top-1 acc 70.312 (64.752)	Top-5 acc 87.891 (84.638)	lr 0.00565
Train [83][530/3239]	Time 0.257 (0.870)	Data Time 0.001 (0.329)	Loss 2.5409 (2.4591)	Entropy 0.58718 (0.58804)	Top-1 acc 64.844 (64.739)	Top-5 acc 82.812 (84.621)	lr 0.00565
Train [83][540/3239]	Time 0.265 (0.863)	Data Time 0.001 (0.323)	Loss 2.3912 (2.4610)	Entropy 0.58729 (0.58803)	Top-1 acc 64.844 (64.694)	Top-5 acc 85.938 (84.577)	lr 0.00565
Train [83][550/3239]	Time 0.241 (0.860)	Data Time 0.001 (0.322)	Loss 2.3589 (2.4594)	Entropy 0.58728 (0.58802)	Top-1 acc 65.234 (64.744)	Top-5 acc 84.375 (84.603)	lr 0.00565
Train [83][560/3239]	Time 0.247 (0.864)	Data Time 0.001 (0.327)	Loss 2.2819 (2.4574)	Entropy 0.58729 (0.58800)	Top-1 acc 68.750 (64.792)	Top-5 acc 88.281 (84.635)	lr 0.00564
Train [83][570/3239]	Time 1.230 (0.857)	Data Time 0.811 (0.323)	Loss 2.7568 (2.4575)	Entropy 0.58716 (0.58799)	Top-1 acc 54.297 (64.795)	Top-5 acc 79.297 (84.623)	lr 0.00564
Train [83][580/3239]	Time 0.252 (0.859)	Data Time 0.001 (0.326)	Loss 2.2964 (2.4567)	Entropy 0.58715 (0.58797)	Top-1 acc 70.703 (64.830)	Top-5 acc 87.891 (84.635)	lr 0.00564
Train [83][590/3239]	Time 0.256 (0.861)	Data Time 0.001 (0.330)	Loss 2.5453 (2.4565)	Entropy 0.58717 (0.58796)	Top-1 acc 60.156 (64.829)	Top-5 acc 83.984 (84.639)	lr 0.00564
Train [83][600/3239]	Time 0.235 (0.854)	Data Time 0.001 (0.324)	Loss 2.4823 (2.4557)	Entropy 0.58721 (0.58795)	Top-1 acc 64.844 (64.857)	Top-5 acc 83.984 (84.651)	lr 0.00564
Train [83][610/3239]	Time 0.239 (0.860)	Data Time 0.001 (0.332)	Loss 2.4114 (2.4556)	Entropy 0.58733 (0.58794)	Top-1 acc 65.234 (64.860)	Top-5 acc 87.500 (84.654)	lr 0.00564
Train [83][620/3239]	Time 5.444 (0.865)	Data Time 5.181 (0.339)	Loss 2.4443 (2.4572)	Entropy 0.58749 (0.58793)	Top-1 acc 68.750 (64.809)	Top-5 acc 85.547 (84.630)	lr 0.00564
Train [83][630/3239]	Time 0.255 (0.858)	Data Time 0.001 (0.334)	Loss 2.4504 (2.4578)	Entropy 0.58686 (0.58792)	Top-1 acc 61.328 (64.781)	Top-5 acc 86.328 (84.615)	lr 0.00564
Train [83][640/3239]	Time 0.275 (0.863)	Data Time 0.002 (0.339)	Loss 2.5910 (2.4576)	Entropy 0.58691 (0.58790)	Top-1 acc 61.328 (64.781)	Top-5 acc 83.594 (84.613)	lr 0.00564
Train [83][650/3239]	Time 0.240 (0.857)	Data Time 0.001 (0.335)	Loss 2.5359 (2.4581)	Entropy 0.58701 (0.58789)	Top-1 acc 62.109 (64.766)	Top-5 acc 84.375 (84.610)	lr 0.00564
Train [83][660/3239]	Time 0.301 (0.857)	Data Time 0.001 (0.336)	Loss 2.4530 (2.4580)	Entropy 0.58690 (0.58787)	Top-1 acc 63.672 (64.772)	Top-5 acc 85.547 (84.610)	lr 0.00564
Train [83][670/3239]	Time 0.254 (0.851)	Data Time 0.001 (0.331)	Loss 2.6779 (2.4585)	Entropy 0.58697 (0.58786)	Top-1 acc 59.766 (64.742)	Top-5 acc 80.469 (84.583)	lr 0.00564
Train [83][680/3239]	Time 0.260 (0.848)	Data Time 0.001 (0.329)	Loss 2.4586 (2.4587)	Entropy 0.58680 (0.58785)	Top-1 acc 65.234 (64.750)	Top-5 acc 84.375 (84.575)	lr 0.00563
Train [83][690/3239]	Time 0.234 (0.850)	Data Time 0.001 (0.333)	Loss 2.6331 (2.4595)	Entropy 0.58656 (0.58783)	Top-1 acc 60.938 (64.741)	Top-5 acc 81.641 (84.553)	lr 0.00563
Train [83][700/3239]	Time 0.249 (0.844)	Data Time 0.001 (0.328)	Loss 2.2991 (2.4594)	Entropy 0.58641 (0.58781)	Top-1 acc 73.438 (64.756)	Top-5 acc 87.500 (84.553)	lr 0.00563
Train [83][710/3239]	Time 0.241 (0.839)	Data Time 0.001 (0.324)	Loss 2.3331 (2.4600)	Entropy 0.58644 (0.58779)	Top-1 acc 65.234 (64.733)	Top-5 acc 87.500 (84.549)	lr 0.00563
Train [83][720/3239]	Time 0.254 (0.841)	Data Time 0.001 (0.327)	Loss 2.6040 (2.4608)	Entropy 0.58651 (0.58777)	Top-1 acc 64.453 (64.721)	Top-5 acc 82.031 (84.538)	lr 0.00563
Train [83][730/3239]	Time 0.396 (0.836)	Data Time 0.001 (0.323)	Loss 2.3006 (2.4600)	Entropy 0.58665 (0.58776)	Top-1 acc 67.969 (64.726)	Top-5 acc 87.891 (84.556)	lr 0.00563
Train [83][740/3239]	Time 0.238 (0.830)	Data Time 0.001 (0.319)	Loss 2.3355 (2.4597)	Entropy 0.58671 (0.58774)	Top-1 acc 66.797 (64.735)	Top-5 acc 87.500 (84.556)	lr 0.00563
Train [83][750/3239]	Time 0.270 (0.834)	Data Time 0.001 (0.323)	Loss 2.3898 (2.4602)	Entropy 0.58695 (0.58773)	Top-1 acc 67.578 (64.723)	Top-5 acc 88.281 (84.546)	lr 0.00563
Train [83][760/3239]	Time 0.271 (0.829)	Data Time 0.001 (0.319)	Loss 2.3953 (2.4607)	Entropy 0.58708 (0.58772)	Top-1 acc 64.453 (64.701)	Top-5 acc 87.891 (84.539)	lr 0.00563
Train [83][770/3239]	Time 0.244 (0.824)	Data Time 0.001 (0.315)	Loss 2.5345 (2.4617)	Entropy 0.58663 (0.58771)	Top-1 acc 64.453 (64.685)	Top-5 acc 83.203 (84.521)	lr 0.00563
Train [83][780/3239]	Time 5.146 (0.825)	Data Time 4.875 (0.317)	Loss 2.4648 (2.4619)	Entropy 0.58695 (0.58770)	Top-1 acc 63.672 (64.682)	Top-5 acc 81.641 (84.515)	lr 0.00563
Train [83][790/3239]	Time 0.251 (0.821)	Data Time 0.001 (0.313)	Loss 2.4358 (2.4624)	Entropy 0.58706 (0.58769)	Top-1 acc 62.891 (64.669)	Top-5 acc 84.766 (84.511)	lr 0.00563
Train [83][800/3239]	Time 0.342 (0.816)	Data Time 0.001 (0.309)	Loss 2.5079 (2.4627)	Entropy 0.58665 (0.58768)	Top-1 acc 66.797 (64.674)	Top-5 acc 83.984 (84.500)	lr 0.00562
Train [83][810/3239]	Time 0.250 (0.811)	Data Time 0.002 (0.305)	Loss 2.2882 (2.4631)	Entropy 0.58675 (0.58767)	Top-1 acc 68.359 (64.665)	Top-5 acc 84.375 (84.489)	lr 0.00562
Train [83][820/3239]	Time 0.249 (0.815)	Data Time 0.001 (0.310)	Loss 2.6948 (2.4632)	Entropy 0.58662 (0.58766)	Top-1 acc 61.328 (64.662)	Top-5 acc 81.250 (84.492)	lr 0.00562
Train [83][830/3239]	Time 0.313 (0.811)	Data Time 0.003 (0.306)	Loss 2.6208 (2.4640)	Entropy 0.58669 (0.58764)	Top-1 acc 62.500 (64.641)	Top-5 acc 78.906 (84.469)	lr 0.00562
Train [83][840/3239]	Time 0.250 (0.806)	Data Time 0.001 (0.303)	Loss 2.3336 (2.4641)	Entropy 0.58621 (0.58763)	Top-1 acc 69.141 (64.646)	Top-5 acc 85.938 (84.466)	lr 0.00562
Train [83][850/3239]	Time 0.252 (0.813)	Data Time 0.001 (0.311)	Loss 2.3528 (2.4633)	Entropy 0.58614 (0.58761)	Top-1 acc 67.188 (64.656)	Top-5 acc 86.719 (84.480)	lr 0.00562
Train [83][860/3239]	Time 0.265 (0.809)	Data Time 0.001 (0.307)	Loss 2.5622 (2.4642)	Entropy 0.58652 (0.58760)	Top-1 acc 59.766 (64.631)	Top-5 acc 82.812 (84.462)	lr 0.00562
Train [83][870/3239]	Time 0.250 (0.805)	Data Time 0.001 (0.304)	Loss 2.5033 (2.4649)	Entropy 0.58654 (0.58759)	Top-1 acc 64.844 (64.607)	Top-5 acc 81.641 (84.445)	lr 0.00562
Train [83][880/3239]	Time 0.266 (0.863)	Data Time 0.002 (0.300)	Loss 2.3410 (2.4654)	Entropy 0.58670 (0.58757)	Top-1 acc 66.406 (64.603)	Top-5 acc 86.328 (84.436)	lr 0.00562
Train [83][890/3239]	Time 0.333 (0.859)	Data Time 0.002 (0.297)	Loss 2.4969 (2.4658)	Entropy 0.58682 (0.58757)	Top-1 acc 60.938 (64.591)	Top-5 acc 83.984 (84.429)	lr 0.00562
Train [83][900/3239]	Time 0.233 (0.854)	Data Time 0.001 (0.294)	Loss 2.7017 (2.4660)	Entropy 0.58690 (0.58756)	Top-1 acc 57.422 (64.573)	Top-5 acc 83.203 (84.426)	lr 0.00562
Train [83][910/3239]	Time 0.241 (0.849)	Data Time 0.001 (0.290)	Loss 2.3281 (2.4662)	Entropy 0.58711 (0.58755)	Top-1 acc 64.062 (64.569)	Top-5 acc 87.109 (84.423)	lr 0.00562
Train [83][920/3239]	Time 0.294 (0.845)	Data Time 0.002 (0.287)	Loss 2.4250 (2.4664)	Entropy 0.58741 (0.58755)	Top-1 acc 66.016 (64.562)	Top-5 acc 85.938 (84.422)	lr 0.00561
Train [83][930/3239]	Time 0.238 (0.840)	Data Time 0.002 (0.284)	Loss 2.5952 (2.4658)	Entropy 0.58731 (0.58755)	Top-1 acc 60.938 (64.583)	Top-5 acc 81.250 (84.431)	lr 0.00561
Train [83][940/3239]	Time 0.286 (0.836)	Data Time 0.001 (0.281)	Loss 2.5899 (2.4663)	Entropy 0.58758 (0.58754)	Top-1 acc 61.719 (64.569)	Top-5 acc 82.031 (84.416)	lr 0.00561
Train [83][950/3239]	Time 0.264 (0.833)	Data Time 0.001 (0.278)	Loss 2.5528 (2.4662)	Entropy 0.58730 (0.58754)	Top-1 acc 62.891 (64.564)	Top-5 acc 80.859 (84.423)	lr 0.00561
Train [83][960/3239]	Time 0.343 (0.829)	Data Time 0.001 (0.275)	Loss 2.4210 (2.4661)	Entropy 0.58766 (0.58754)	Top-1 acc 68.750 (64.562)	Top-5 acc 82.812 (84.424)	lr 0.00561
Train [83][970/3239]	Time 0.245 (0.825)	Data Time 0.001 (0.273)	Loss 2.3950 (2.4657)	Entropy 0.58786 (0.58754)	Top-1 acc 66.016 (64.564)	Top-5 acc 85.156 (84.432)	lr 0.00561
Train [83][980/3239]	Time 0.251 (0.822)	Data Time 0.001 (0.271)	Loss 2.4207 (2.4660)	Entropy 0.58788 (0.58755)	Top-1 acc 65.625 (64.552)	Top-5 acc 84.375 (84.435)	lr 0.00561
Train [83][990/3239]	Time 0.253 (0.823)	Data Time 0.001 (0.273)	Loss 2.4678 (2.4661)	Entropy 0.58773 (0.58755)	Top-1 acc 65.625 (64.546)	Top-5 acc 85.156 (84.432)	lr 0.00561
Train [83][1000/3239]	Time 0.257 (0.820)	Data Time 0.001 (0.271)	Loss 2.2834 (2.4664)	Entropy 0.58752 (0.58755)	Top-1 acc 68.750 (64.535)	Top-5 acc 88.281 (84.430)	lr 0.00561
Train [83][1010/3239]	Time 0.254 (0.819)	Data Time 0.001 (0.272)	Loss 2.4363 (2.4664)	Entropy 0.58748 (0.58755)	Top-1 acc 64.844 (64.532)	Top-5 acc 83.984 (84.431)	lr 0.00561
Train [83][1020/3239]	Time 0.283 (0.820)	Data Time 0.002 (0.273)	Loss 2.5304 (2.4664)	Entropy 0.58761 (0.58755)	Top-1 acc 58.594 (64.522)	Top-5 acc 84.375 (84.434)	lr 0.00561
Train [83][1030/3239]	Time 0.267 (0.817)	Data Time 0.001 (0.271)	Loss 2.4819 (2.4666)	Entropy 0.58745 (0.58755)	Top-1 acc 62.109 (64.519)	Top-5 acc 83.594 (84.424)	lr 0.00560
Train [83][1040/3239]	Time 0.236 (0.816)	Data Time 0.001 (0.271)	Loss 2.3760 (2.4666)	Entropy 0.58768 (0.58755)	Top-1 acc 67.578 (64.521)	Top-5 acc 85.938 (84.421)	lr 0.00560
Train [83][1050/3239]	Time 1.586 (0.816)	Data Time 1.218 (0.272)	Loss 2.4391 (2.4662)	Entropy 0.58768 (0.58755)	Top-1 acc 62.109 (64.529)	Top-5 acc 86.328 (84.431)	lr 0.00560
Train [83][1060/3239]	Time 0.251 (0.816)	Data Time 0.001 (0.273)	Loss 2.4897 (2.4658)	Entropy 0.58745 (0.58755)	Top-1 acc 64.453 (64.540)	Top-5 acc 85.156 (84.439)	lr 0.00560
Train [83][1070/3239]	Time 2.583 (0.814)	Data Time 2.288 (0.273)	Loss 2.4568 (2.4662)	Entropy 0.58758 (0.58755)	Top-1 acc 64.844 (64.519)	Top-5 acc 82.031 (84.425)	lr 0.00560
Train [83][1080/3239]	Time 0.258 (0.814)	Data Time 0.001 (0.273)	Loss 2.4654 (2.4672)	Entropy 0.58714 (0.58755)	Top-1 acc 63.281 (64.506)	Top-5 acc 83.984 (84.401)	lr 0.00560
Train [83][1090/3239]	Time 0.249 (0.814)	Data Time 0.001 (0.274)	Loss 2.4516 (2.4673)	Entropy 0.58683 (0.58754)	Top-1 acc 66.406 (64.506)	Top-5 acc 86.328 (84.396)	lr 0.00560
Train [83][1100/3239]	Time 0.241 (0.811)	Data Time 0.001 (0.272)	Loss 2.6782 (2.4677)	Entropy 0.58672 (0.58754)	Top-1 acc 55.078 (64.495)	Top-5 acc 80.078 (84.384)	lr 0.00560
Train [83][1110/3239]	Time 1.093 (0.811)	Data Time 0.828 (0.273)	Loss 2.3687 (2.4679)	Entropy 0.58648 (0.58753)	Top-1 acc 67.188 (64.487)	Top-5 acc 84.766 (84.378)	lr 0.00560
Train [83][1120/3239]	Time 0.347 (0.812)	Data Time 0.001 (0.274)	Loss 2.4686 (2.4685)	Entropy 0.58613 (0.58752)	Top-1 acc 62.109 (64.478)	Top-5 acc 83.594 (84.363)	lr 0.00560
Train [83][1130/3239]	Time 0.252 (0.812)	Data Time 0.001 (0.275)	Loss 2.5488 (2.4688)	Entropy 0.58631 (0.58751)	Top-1 acc 63.281 (64.480)	Top-5 acc 82.812 (84.358)	lr 0.00560
Train [83][1140/3239]	Time 0.232 (0.809)	Data Time 0.001 (0.274)	Loss 2.6604 (2.4687)	Entropy 0.58663 (0.58750)	Top-1 acc 60.156 (64.486)	Top-5 acc 78.906 (84.358)	lr 0.00560
Train [83][1150/3239]	Time 0.249 (0.811)	Data Time 0.001 (0.276)	Loss 2.5817 (2.4687)	Entropy 0.58672 (0.58749)	Top-1 acc 60.547 (64.482)	Top-5 acc 82.031 (84.358)	lr 0.00559
Train [83][1160/3239]	Time 0.246 (0.810)	Data Time 0.001 (0.276)	Loss 2.2002 (2.4682)	Entropy 0.58687 (0.58749)	Top-1 acc 72.656 (64.501)	Top-5 acc 90.234 (84.366)	lr 0.00559
Train [83][1170/3239]	Time 2.838 (0.809)	Data Time 2.584 (0.276)	Loss 2.6557 (2.4679)	Entropy 0.58675 (0.58748)	Top-1 acc 60.547 (64.507)	Top-5 acc 83.203 (84.379)	lr 0.00559
Train [83][1180/3239]	Time 0.240 (0.809)	Data Time 0.001 (0.277)	Loss 2.5663 (2.4680)	Entropy 0.58669 (0.58747)	Top-1 acc 59.375 (64.506)	Top-5 acc 83.203 (84.376)	lr 0.00559
Train [83][1190/3239]	Time 0.252 (0.810)	Data Time 0.002 (0.278)	Loss 2.4851 (2.4683)	Entropy 0.58628 (0.58747)	Top-1 acc 60.156 (64.504)	Top-5 acc 86.719 (84.372)	lr 0.00559
Train [83][1200/3239]	Time 0.296 (0.806)	Data Time 0.001 (0.276)	Loss 2.4715 (2.4689)	Entropy 0.58641 (0.58746)	Top-1 acc 65.234 (64.484)	Top-5 acc 81.250 (84.361)	lr 0.00559
Train [83][1210/3239]	Time 0.377 (0.809)	Data Time 0.001 (0.279)	Loss 2.4063 (2.4690)	Entropy 0.58610 (0.58745)	Top-1 acc 65.234 (64.489)	Top-5 acc 85.547 (84.346)	lr 0.00559
Train [83][1220/3239]	Time 2.596 (0.810)	Data Time 2.349 (0.280)	Loss 2.3748 (2.4691)	Entropy 0.58563 (0.58743)	Top-1 acc 64.062 (64.474)	Top-5 acc 85.547 (84.344)	lr 0.00559
Train [83][1230/3239]	Time 0.242 (0.807)	Data Time 0.001 (0.279)	Loss 2.3483 (2.4693)	Entropy 0.58555 (0.58742)	Top-1 acc 66.406 (64.469)	Top-5 acc 86.328 (84.333)	lr 0.00559
Train [83][1240/3239]	Time 0.294 (0.811)	Data Time 0.001 (0.283)	Loss 2.5959 (2.4696)	Entropy 0.58557 (0.58740)	Top-1 acc 63.281 (64.465)	Top-5 acc 82.422 (84.327)	lr 0.00559
Train [83][1250/3239]	Time 0.246 (0.809)	Data Time 0.001 (0.282)	Loss 2.4021 (2.4698)	Entropy 0.58557 (0.58739)	Top-1 acc 63.672 (64.461)	Top-5 acc 85.938 (84.323)	lr 0.00559
Train [83][1260/3239]	Time 0.226 (0.811)	Data Time 0.001 (0.285)	Loss 2.2706 (2.4698)	Entropy 0.58591 (0.58738)	Top-1 acc 67.578 (64.453)	Top-5 acc 89.062 (84.327)	lr 0.00559
Train [83][1270/3239]	Time 3.927 (0.814)	Data Time 3.674 (0.289)	Loss 2.5008 (2.4700)	Entropy 0.58578 (0.58736)	Top-1 acc 64.844 (64.454)	Top-5 acc 83.203 (84.322)	lr 0.00558
Train [83][1280/3239]	Time 0.345 (0.812)	Data Time 0.002 (0.287)	Loss 2.3635 (2.4699)	Entropy 0.58557 (0.58735)	Top-1 acc 67.578 (64.458)	Top-5 acc 83.984 (84.321)	lr 0.00558
Train [83][1290/3239]	Time 0.240 (0.813)	Data Time 0.001 (0.290)	Loss 2.3367 (2.4699)	Entropy 0.58540 (0.58734)	Top-1 acc 69.531 (64.455)	Top-5 acc 84.766 (84.321)	lr 0.00558
Train [83][1300/3239]	Time 0.244 (0.811)	Data Time 0.001 (0.288)	Loss 2.5613 (2.4700)	Entropy 0.58558 (0.58732)	Top-1 acc 62.891 (64.448)	Top-5 acc 82.031 (84.321)	lr 0.00558
Train [83][1310/3239]	Time 2.329 (0.818)	Data Time 2.073 (0.295)	Loss 2.4125 (2.4702)	Entropy 0.58577 (0.58731)	Top-1 acc 65.625 (64.450)	Top-5 acc 84.375 (84.312)	lr 0.00558
Train [83][1320/3239]	Time 0.278 (0.818)	Data Time 0.001 (0.296)	Loss 2.5364 (2.4701)	Entropy 0.58585 (0.58730)	Top-1 acc 62.109 (64.455)	Top-5 acc 82.031 (84.312)	lr 0.00558
Train [83][1330/3239]	Time 0.235 (0.815)	Data Time 0.001 (0.294)	Loss 2.4993 (2.4697)	Entropy 0.58605 (0.58729)	Top-1 acc 64.453 (64.467)	Top-5 acc 83.594 (84.322)	lr 0.00558
Train [83][1340/3239]	Time 0.285 (0.821)	Data Time 0.001 (0.301)	Loss 2.5565 (2.4694)	Entropy 0.58619 (0.58728)	Top-1 acc 62.109 (64.473)	Top-5 acc 81.641 (84.326)	lr 0.00558
Train [83][1350/3239]	Time 0.247 (0.826)	Data Time 0.001 (0.306)	Loss 2.5190 (2.4703)	Entropy 0.58572 (0.58727)	Top-1 acc 64.844 (64.452)	Top-5 acc 83.203 (84.314)	lr 0.00558
Train [83][1360/3239]	Time 0.243 (0.823)	Data Time 0.001 (0.304)	Loss 2.5071 (2.4701)	Entropy 0.58586 (0.58726)	Top-1 acc 62.500 (64.456)	Top-5 acc 83.594 (84.320)	lr 0.00558
Train [83][1370/3239]	Time 0.244 (0.829)	Data Time 0.002 (0.311)	Loss 2.5867 (2.4701)	Entropy 0.58593 (0.58725)	Top-1 acc 62.500 (64.458)	Top-5 acc 83.594 (84.321)	lr 0.00558
Train [83][1380/3239]	Time 6.786 (0.836)	Data Time 6.549 (0.318)	Loss 2.5666 (2.4702)	Entropy 0.58570 (0.58724)	Top-1 acc 60.547 (64.452)	Top-5 acc 80.859 (84.316)	lr 0.00558
Train [83][1390/3239]	Time 0.249 (0.832)	Data Time 0.001 (0.315)	Loss 2.1622 (2.4699)	Entropy 0.58570 (0.58723)	Top-1 acc 71.484 (64.453)	Top-5 acc 89.062 (84.321)	lr 0.00557
Train [83][1400/3239]	Time 0.235 (0.839)	Data Time 0.001 (0.322)	Loss 2.2300 (2.4698)	Entropy 0.58574 (0.58722)	Top-1 acc 69.531 (64.454)	Top-5 acc 87.891 (84.325)	lr 0.00557
Train [83][1410/3239]	Time 0.244 (0.837)	Data Time 0.001 (0.321)	Loss 2.5370 (2.4695)	Entropy 0.58599 (0.58721)	Top-1 acc 60.938 (64.463)	Top-5 acc 82.812 (84.328)	lr 0.00557
Train [83][1420/3239]	Time 0.254 (0.840)	Data Time 0.001 (0.325)	Loss 2.6108 (2.4698)	Entropy 0.58599 (0.58720)	Top-1 acc 59.766 (64.453)	Top-5 acc 81.250 (84.324)	lr 0.00557
Train [83][1430/3239]	Time 14.140 (0.847)	Data Time 13.858 (0.333)	Loss 2.4146 (2.4701)	Entropy 0.58591 (0.58719)	Top-1 acc 65.234 (64.448)	Top-5 acc 86.328 (84.313)	lr 0.00557
Train [83][1440/3239]	Time 0.827 (0.845)	Data Time 0.479 (0.331)	Loss 2.1901 (2.4699)	Entropy 0.58567 (0.58718)	Top-1 acc 73.047 (64.454)	Top-5 acc 89.844 (84.322)	lr 0.00557
Train [83][1450/3239]	Time 0.234 (0.847)	Data Time 0.001 (0.334)	Loss 2.4039 (2.4696)	Entropy 0.58548 (0.58717)	Top-1 acc 68.359 (64.462)	Top-5 acc 83.594 (84.327)	lr 0.00557
Train [83][1460/3239]	Time 0.243 (0.844)	Data Time 0.001 (0.332)	Loss 2.3980 (2.4698)	Entropy 0.58548 (0.58716)	Top-1 acc 61.719 (64.459)	Top-5 acc 86.719 (84.324)	lr 0.00557
Train [83][1470/3239]	Time 0.255 (0.853)	Data Time 0.001 (0.341)	Loss 2.3142 (2.4696)	Entropy 0.58541 (0.58715)	Top-1 acc 71.094 (64.472)	Top-5 acc 83.203 (84.328)	lr 0.00557
Train [83][1480/3239]	Time 0.312 (0.855)	Data Time 0.058 (0.344)	Loss 2.7016 (2.4694)	Entropy 0.58536 (0.58713)	Top-1 acc 60.938 (64.477)	Top-5 acc 79.297 (84.326)	lr 0.00557
Train [83][1490/3239]	Time 0.238 (0.853)	Data Time 0.001 (0.342)	Loss 2.3637 (2.4692)	Entropy 0.58512 (0.58712)	Top-1 acc 70.703 (64.486)	Top-5 acc 87.109 (84.330)	lr 0.00557
Train [83][1500/3239]	Time 0.239 (0.863)	Data Time 0.001 (0.353)	Loss 2.4646 (2.4694)	Entropy 0.58520 (0.58711)	Top-1 acc 66.406 (64.486)	Top-5 acc 82.031 (84.323)	lr 0.00557
Train [83][1510/3239]	Time 0.360 (0.862)	Data Time 0.001 (0.353)	Loss 2.4148 (2.4696)	Entropy 0.58506 (0.58710)	Top-1 acc 64.453 (64.485)	Top-5 acc 85.156 (84.317)	lr 0.00556
Train [83][1520/3239]	Time 0.246 (0.861)	Data Time 0.001 (0.352)	Loss 2.4715 (2.4695)	Entropy 0.58516 (0.58708)	Top-1 acc 62.891 (64.489)	Top-5 acc 83.594 (84.316)	lr 0.00556
Train [83][1530/3239]	Time 0.571 (0.909)	Data Time 0.039 (0.363)	Loss 2.6298 (2.4693)	Entropy 0.58533 (0.58707)	Top-1 acc 58.594 (64.492)	Top-5 acc 81.250 (84.318)	lr 0.00556
Train [83][1540/3239]	Time 0.245 (0.906)	Data Time 0.002 (0.361)	Loss 2.4780 (2.4695)	Entropy 0.58528 (0.58706)	Top-1 acc 61.328 (64.480)	Top-5 acc 84.375 (84.317)	lr 0.00556
Train [83][1550/3239]	Time 0.236 (0.903)	Data Time 0.001 (0.358)	Loss 2.4858 (2.4695)	Entropy 0.58554 (0.58705)	Top-1 acc 64.453 (64.480)	Top-5 acc 83.984 (84.316)	lr 0.00556
Train [83][1560/3239]	Time 0.234 (0.900)	Data Time 0.001 (0.356)	Loss 2.3757 (2.4695)	Entropy 0.58563 (0.58704)	Top-1 acc 66.016 (64.475)	Top-5 acc 86.719 (84.322)	lr 0.00556
Train [83][1570/3239]	Time 0.233 (0.897)	Data Time 0.002 (0.354)	Loss 2.4827 (2.4696)	Entropy 0.58572 (0.58703)	Top-1 acc 65.625 (64.473)	Top-5 acc 83.594 (84.323)	lr 0.00556
Train [83][1580/3239]	Time 0.234 (0.894)	Data Time 0.001 (0.351)	Loss 2.4459 (2.4694)	Entropy 0.58585 (0.58702)	Top-1 acc 63.281 (64.475)	Top-5 acc 83.203 (84.329)	lr 0.00556
Train [83][1590/3239]	Time 0.255 (0.891)	Data Time 0.001 (0.349)	Loss 2.5958 (2.4696)	Entropy 0.58550 (0.58702)	Top-1 acc 63.281 (64.467)	Top-5 acc 81.641 (84.326)	lr 0.00556
Train [83][1600/3239]	Time 0.557 (0.890)	Data Time 0.207 (0.350)	Loss 2.4932 (2.4691)	Entropy 0.58567 (0.58701)	Top-1 acc 62.109 (64.477)	Top-5 acc 86.328 (84.334)	lr 0.00556
Train [83][1610/3239]	Time 0.261 (0.891)	Data Time 0.001 (0.351)	Loss 2.4669 (2.4693)	Entropy 0.58564 (0.58700)	Top-1 acc 62.891 (64.474)	Top-5 acc 83.984 (84.332)	lr 0.00556
Train [83][1620/3239]	Time 0.229 (0.888)	Data Time 0.001 (0.348)	Loss 2.6037 (2.4695)	Entropy 0.58566 (0.58699)	Top-1 acc 62.891 (64.476)	Top-5 acc 82.812 (84.330)	lr 0.00556
Train [83][1630/3239]	Time 0.254 (0.897)	Data Time 0.001 (0.358)	Loss 2.6183 (2.4696)	Entropy 0.58575 (0.58698)	Top-1 acc 66.016 (64.473)	Top-5 acc 81.250 (84.325)	lr 0.00555
Train [83][1640/3239]	Time 0.235 (0.897)	Data Time 0.001 (0.358)	Loss 2.3506 (2.4692)	Entropy 0.58567 (0.58697)	Top-1 acc 69.531 (64.482)	Top-5 acc 88.281 (84.331)	lr 0.00555
Train [83][1650/3239]	Time 0.248 (0.894)	Data Time 0.001 (0.356)	Loss 2.5241 (2.4693)	Entropy 0.58588 (0.58697)	Top-1 acc 64.062 (64.483)	Top-5 acc 84.375 (84.325)	lr 0.00555
Train [83][1660/3239]	Time 6.012 (0.901)	Data Time 5.753 (0.364)	Loss 2.4990 (2.4691)	Entropy 0.58587 (0.58696)	Top-1 acc 61.719 (64.490)	Top-5 acc 85.938 (84.325)	lr 0.00555
Train [83][1670/3239]	Time 0.379 (0.901)	Data Time 0.001 (0.364)	Loss 2.2589 (2.4688)	Entropy 0.58609 (0.58695)	Top-1 acc 70.312 (64.502)	Top-5 acc 89.062 (84.331)	lr 0.00555
Train [83][1680/3239]	Time 0.236 (0.899)	Data Time 0.001 (0.363)	Loss 2.3681 (2.4688)	Entropy 0.58601 (0.58695)	Top-1 acc 68.750 (64.503)	Top-5 acc 87.109 (84.332)	lr 0.00555
Train [83][1690/3239]	Time 4.427 (0.899)	Data Time 4.170 (0.363)	Loss 2.5130 (2.4689)	Entropy 0.58591 (0.58694)	Top-1 acc 62.500 (64.497)	Top-5 acc 83.203 (84.329)	lr 0.00555
Train [83][1700/3239]	Time 0.262 (0.906)	Data Time 0.001 (0.370)	Loss 2.4866 (2.4689)	Entropy 0.58622 (0.58694)	Top-1 acc 64.844 (64.498)	Top-5 acc 83.984 (84.329)	lr 0.00555
Train [83][1710/3239]	Time 0.286 (0.903)	Data Time 0.001 (0.368)	Loss 2.5568 (2.4689)	Entropy 0.58622 (0.58693)	Top-1 acc 63.672 (64.492)	Top-5 acc 81.250 (84.328)	lr 0.00555
Train [83][1720/3239]	Time 0.240 (0.902)	Data Time 0.001 (0.367)	Loss 2.2589 (2.4685)	Entropy 0.58659 (0.58693)	Top-1 acc 69.531 (64.503)	Top-5 acc 86.328 (84.338)	lr 0.00555
Train [83][1730/3239]	Time 0.235 (0.912)	Data Time 0.001 (0.379)	Loss 2.6653 (2.4688)	Entropy 0.58659 (0.58693)	Top-1 acc 58.984 (64.493)	Top-5 acc 83.203 (84.341)	lr 0.00555
Train [83][1740/3239]	Time 0.266 (0.909)	Data Time 0.002 (0.376)	Loss 2.4689 (2.4689)	Entropy 0.58666 (0.58693)	Top-1 acc 64.844 (64.487)	Top-5 acc 81.641 (84.339)	lr 0.00555
Train [83][1750/3239]	Time 0.240 (0.906)	Data Time 0.001 (0.374)	Loss 2.5474 (2.4688)	Entropy 0.58655 (0.58692)	Top-1 acc 65.625 (64.488)	Top-5 acc 83.984 (84.340)	lr 0.00554
Train [83][1760/3239]	Time 0.366 (0.912)	Data Time 0.001 (0.380)	Loss 2.7896 (2.4692)	Entropy 0.58651 (0.58692)	Top-1 acc 58.594 (64.484)	Top-5 acc 75.000 (84.330)	lr 0.00554
Train [83][1770/3239]	Time 0.230 (0.914)	Data Time 0.001 (0.383)	Loss 2.4406 (2.4689)	Entropy 0.58684 (0.58692)	Top-1 acc 64.062 (64.492)	Top-5 acc 84.375 (84.338)	lr 0.00554
Train [83][1780/3239]	Time 0.242 (0.911)	Data Time 0.001 (0.381)	Loss 2.2586 (2.4690)	Entropy 0.58688 (0.58692)	Top-1 acc 71.875 (64.488)	Top-5 acc 88.281 (84.336)	lr 0.00554
Train [83][1790/3239]	Time 0.249 (0.913)	Data Time 0.001 (0.383)	Loss 2.3792 (2.4693)	Entropy 0.58681 (0.58692)	Top-1 acc 66.797 (64.481)	Top-5 acc 85.547 (84.331)	lr 0.00554
Train [83][1800/3239]	Time 0.250 (0.919)	Data Time 0.001 (0.390)	Loss 2.6471 (2.4696)	Entropy 0.58670 (0.58692)	Top-1 acc 57.422 (64.478)	Top-5 acc 82.031 (84.328)	lr 0.00554
Train [83][1810/3239]	Time 0.232 (0.917)	Data Time 0.001 (0.388)	Loss 2.3084 (2.4695)	Entropy 0.58658 (0.58692)	Top-1 acc 69.531 (64.482)	Top-5 acc 87.891 (84.330)	lr 0.00554
Train [83][1820/3239]	Time 4.998 (0.917)	Data Time 4.739 (0.388)	Loss 2.4800 (2.4693)	Entropy 0.58638 (0.58691)	Top-1 acc 64.844 (64.492)	Top-5 acc 83.594 (84.330)	lr 0.00554
Train [83][1830/3239]	Time 0.332 (0.924)	Data Time 0.001 (0.396)	Loss 2.8003 (2.4694)	Entropy 0.58614 (0.58691)	Top-1 acc 58.203 (64.489)	Top-5 acc 80.078 (84.327)	lr 0.00554
Train [83][1840/3239]	Time 0.242 (0.921)	Data Time 0.001 (0.394)	Loss 2.3973 (2.4694)	Entropy 0.58581 (0.58691)	Top-1 acc 67.578 (64.488)	Top-5 acc 88.281 (84.333)	lr 0.00554
Train [83][1850/3239]	Time 0.253 (0.919)	Data Time 0.002 (0.392)	Loss 2.4943 (2.4694)	Entropy 0.58578 (0.58690)	Top-1 acc 65.625 (64.489)	Top-5 acc 82.812 (84.332)	lr 0.00554
Train [83][1860/3239]	Time 0.252 (0.927)	Data Time 0.001 (0.401)	Loss 2.3543 (2.4694)	Entropy 0.58586 (0.58690)	Top-1 acc 66.406 (64.497)	Top-5 acc 85.938 (84.328)	lr 0.00554
Train [83][1870/3239]	Time 0.244 (0.924)	Data Time 0.001 (0.399)	Loss 2.4123 (2.4693)	Entropy 0.58600 (0.58689)	Top-1 acc 67.969 (64.500)	Top-5 acc 86.719 (84.332)	lr 0.00553
Train [83][1880/3239]	Time 0.236 (0.922)	Data Time 0.001 (0.397)	Loss 2.3901 (2.4695)	Entropy 0.58607 (0.58689)	Top-1 acc 65.234 (64.496)	Top-5 acc 85.156 (84.328)	lr 0.00553
Train [83][1890/3239]	Time 0.232 (0.931)	Data Time 0.001 (0.407)	Loss 2.3133 (2.4697)	Entropy 0.58641 (0.58688)	Top-1 acc 69.922 (64.496)	Top-5 acc 88.281 (84.324)	lr 0.00553
Train [83][1900/3239]	Time 0.243 (0.929)	Data Time 0.001 (0.405)	Loss 2.3767 (2.4699)	Entropy 0.58596 (0.58688)	Top-1 acc 65.234 (64.483)	Top-5 acc 83.594 (84.319)	lr 0.00553
Train [83][1910/3239]	Time 0.241 (0.926)	Data Time 0.001 (0.402)	Loss 2.5985 (2.4698)	Entropy 0.58608 (0.58687)	Top-1 acc 62.109 (64.484)	Top-5 acc 84.375 (84.323)	lr 0.00553
Train [83][1920/3239]	Time 0.256 (0.930)	Data Time 0.001 (0.407)	Loss 2.5625 (2.4698)	Entropy 0.58626 (0.58687)	Top-1 acc 61.719 (64.484)	Top-5 acc 83.594 (84.319)	lr 0.00553
Train [83][1930/3239]	Time 0.238 (0.933)	Data Time 0.001 (0.411)	Loss 2.5151 (2.4696)	Entropy 0.58622 (0.58687)	Top-1 acc 63.281 (64.488)	Top-5 acc 82.812 (84.319)	lr 0.00553
Train [83][1940/3239]	Time 0.240 (0.931)	Data Time 0.001 (0.409)	Loss 2.6161 (2.4697)	Entropy 0.58608 (0.58686)	Top-1 acc 59.375 (64.483)	Top-5 acc 81.250 (84.316)	lr 0.00553
Train [83][1950/3239]	Time 0.286 (0.930)	Data Time 0.001 (0.409)	Loss 2.5325 (2.4697)	Entropy 0.58599 (0.58686)	Top-1 acc 60.938 (64.482)	Top-5 acc 81.250 (84.316)	lr 0.00553
Train [83][1960/3239]	Time 0.252 (0.939)	Data Time 0.001 (0.418)	Loss 2.6333 (2.4700)	Entropy 0.58599 (0.58685)	Top-1 acc 60.156 (64.479)	Top-5 acc 81.641 (84.311)	lr 0.00553
Train [83][1970/3239]	Time 0.240 (0.936)	Data Time 0.001 (0.416)	Loss 2.5995 (2.4706)	Entropy 0.58587 (0.58685)	Top-1 acc 58.984 (64.462)	Top-5 acc 84.375 (84.303)	lr 0.00553
Train [83][1980/3239]	Time 1.469 (0.934)	Data Time 1.221 (0.414)	Loss 2.4535 (2.4707)	Entropy 0.58586 (0.58684)	Top-1 acc 67.969 (64.458)	Top-5 acc 83.203 (84.298)	lr 0.00553
Train [83][1990/3239]	Time 0.372 (0.944)	Data Time 0.001 (0.425)	Loss 2.6363 (2.4711)	Entropy 0.58605 (0.58684)	Top-1 acc 58.203 (64.448)	Top-5 acc 82.422 (84.289)	lr 0.00552
Train [83][2000/3239]	Time 0.225 (0.942)	Data Time 0.001 (0.423)	Loss 2.6444 (2.4709)	Entropy 0.58605 (0.58684)	Top-1 acc 55.859 (64.449)	Top-5 acc 81.641 (84.295)	lr 0.00552
Train [83][2010/3239]	Time 0.242 (0.939)	Data Time 0.001 (0.421)	Loss 2.5531 (2.4708)	Entropy 0.58621 (0.58683)	Top-1 acc 61.328 (64.449)	Top-5 acc 81.641 (84.298)	lr 0.00552
Train [83][2020/3239]	Time 0.244 (0.949)	Data Time 0.002 (0.431)	Loss 2.3567 (2.4707)	Entropy 0.58630 (0.58683)	Top-1 acc 65.625 (64.448)	Top-5 acc 86.719 (84.301)	lr 0.00552
Train [83][2030/3239]	Time 0.255 (0.947)	Data Time 0.002 (0.429)	Loss 2.3155 (2.4709)	Entropy 0.58613 (0.58683)	Top-1 acc 63.672 (64.441)	Top-5 acc 88.672 (84.300)	lr 0.00552
Train [83][2040/3239]	Time 0.245 (0.944)	Data Time 0.001 (0.427)	Loss 2.3046 (2.4705)	Entropy 0.58620 (0.58682)	Top-1 acc 67.578 (64.449)	Top-5 acc 88.672 (84.303)	lr 0.00552
Train [83][2050/3239]	Time 0.325 (0.954)	Data Time 0.003 (0.437)	Loss 2.4687 (2.4706)	Entropy 0.58622 (0.58682)	Top-1 acc 59.375 (64.446)	Top-5 acc 85.547 (84.299)	lr 0.00552
Train [83][2060/3239]	Time 0.388 (0.953)	Data Time 0.001 (0.436)	Loss 2.5781 (2.4705)	Entropy 0.58640 (0.58682)	Top-1 acc 57.812 (64.445)	Top-5 acc 82.422 (84.299)	lr 0.00552
Train [83][2070/3239]	Time 0.258 (0.950)	Data Time 0.001 (0.434)	Loss 2.5458 (2.4705)	Entropy 0.58608 (0.58682)	Top-1 acc 62.891 (64.444)	Top-5 acc 84.375 (84.302)	lr 0.00552
Train [83][2080/3239]	Time 0.252 (0.951)	Data Time 0.001 (0.435)	Loss 2.4116 (2.4707)	Entropy 0.58540 (0.58681)	Top-1 acc 66.797 (64.436)	Top-5 acc 83.203 (84.300)	lr 0.00552
Train [83][2090/3239]	Time 1.379 (0.956)	Data Time 1.113 (0.441)	Loss 2.4684 (2.4708)	Entropy 0.58543 (0.58680)	Top-1 acc 62.891 (64.433)	Top-5 acc 84.375 (84.300)	lr 0.00552
Train [83][2100/3239]	Time 0.257 (0.954)	Data Time 0.002 (0.439)	Loss 2.4420 (2.4707)	Entropy 0.58517 (0.58680)	Top-1 acc 62.109 (64.435)	Top-5 acc 85.156 (84.305)	lr 0.00552
Train [83][2110/3239]	Time 3.268 (0.955)	Data Time 3.006 (0.441)	Loss 2.4452 (2.4705)	Entropy 0.58463 (0.58679)	Top-1 acc 60.938 (64.440)	Top-5 acc 86.719 (84.310)	lr 0.00551
Train [83][2120/3239]	Time 0.232 (0.962)	Data Time 0.001 (0.448)	Loss 2.6046 (2.4706)	Entropy 0.58493 (0.58678)	Top-1 acc 61.328 (64.434)	Top-5 acc 78.125 (84.306)	lr 0.00551
Train [83][2130/3239]	Time 0.236 (0.960)	Data Time 0.001 (0.446)	Loss 2.4781 (2.4705)	Entropy 0.58518 (0.58677)	Top-1 acc 64.844 (64.437)	Top-5 acc 85.938 (84.307)	lr 0.00551
Train [83][2140/3239]	Time 0.221 (0.958)	Data Time 0.001 (0.445)	Loss 2.6133 (2.4703)	Entropy 0.58556 (0.58676)	Top-1 acc 60.938 (64.445)	Top-5 acc 82.812 (84.311)	lr 0.00551
Train [83][2150/3239]	Time 0.336 (0.968)	Data Time 0.001 (0.455)	Loss 2.6544 (2.4703)	Entropy 0.58544 (0.58676)	Top-1 acc 57.422 (64.446)	Top-5 acc 80.078 (84.313)	lr 0.00551
Train [83][2160/3239]	Time 0.229 (0.966)	Data Time 0.001 (0.454)	Loss 2.3888 (2.4706)	Entropy 0.58526 (0.58675)	Top-1 acc 66.016 (64.442)	Top-5 acc 83.594 (84.309)	lr 0.00551
Train [83][2170/3239]	Time 0.255 (0.963)	Data Time 0.001 (0.452)	Loss 2.6707 (2.4706)	Entropy 0.58511 (0.58674)	Top-1 acc 60.547 (64.443)	Top-5 acc 78.906 (84.308)	lr 0.00551
Train [83][2180/3239]	Time 0.240 (0.974)	Data Time 0.001 (0.463)	Loss 2.5843 (2.4703)	Entropy 0.58502 (0.58674)	Top-1 acc 64.062 (64.448)	Top-5 acc 82.812 (84.313)	lr 0.00551
Train [83][2190/3239]	Time 0.307 (0.998)	Data Time 0.003 (0.461)	Loss 2.5088 (2.4702)	Entropy 0.58517 (0.58673)	Top-1 acc 63.281 (64.448)	Top-5 acc 83.984 (84.315)	lr 0.00551
Train [83][2200/3239]	Time 0.260 (0.996)	Data Time 0.002 (0.459)	Loss 2.4767 (2.4700)	Entropy 0.58494 (0.58672)	Top-1 acc 64.062 (64.450)	Top-5 acc 85.547 (84.320)	lr 0.00551
Train [83][2210/3239]	Time 0.285 (0.993)	Data Time 0.003 (0.456)	Loss 2.3228 (2.4700)	Entropy 0.58509 (0.58671)	Top-1 acc 67.188 (64.449)	Top-5 acc 87.500 (84.317)	lr 0.00551
Train [83][2220/3239]	Time 0.229 (0.991)	Data Time 0.001 (0.454)	Loss 2.6294 (2.4702)	Entropy 0.58533 (0.58671)	Top-1 acc 59.766 (64.442)	Top-5 acc 82.422 (84.314)	lr 0.00551
Train [83][2230/3239]	Time 0.254 (0.988)	Data Time 0.001 (0.452)	Loss 2.5279 (2.4701)	Entropy 0.58521 (0.58670)	Top-1 acc 62.109 (64.441)	Top-5 acc 82.812 (84.315)	lr 0.00550
Train [83][2240/3239]	Time 0.310 (0.986)	Data Time 0.001 (0.450)	Loss 2.6210 (2.4699)	Entropy 0.58542 (0.58669)	Top-1 acc 63.672 (64.449)	Top-5 acc 80.859 (84.318)	lr 0.00550
Train [83][2250/3239]	Time 0.244 (0.983)	Data Time 0.001 (0.448)	Loss 2.4873 (2.4697)	Entropy 0.58542 (0.58669)	Top-1 acc 64.844 (64.451)	Top-5 acc 82.422 (84.318)	lr 0.00550
Train [83][2260/3239]	Time 0.253 (0.983)	Data Time 0.001 (0.448)	Loss 2.4450 (2.4697)	Entropy 0.58532 (0.58668)	Top-1 acc 69.141 (64.451)	Top-5 acc 83.984 (84.318)	lr 0.00550
Train [83][2270/3239]	Time 0.249 (0.984)	Data Time 0.001 (0.450)	Loss 2.4733 (2.4696)	Entropy 0.58534 (0.58668)	Top-1 acc 62.891 (64.452)	Top-5 acc 85.156 (84.322)	lr 0.00550
Train [83][2280/3239]	Time 0.334 (0.982)	Data Time 0.082 (0.449)	Loss 2.3596 (2.4695)	Entropy 0.58521 (0.58667)	Top-1 acc 66.797 (64.456)	Top-5 acc 85.938 (84.323)	lr 0.00550
Train [83][2290/3239]	Time 0.262 (0.986)	Data Time 0.001 (0.452)	Loss 2.3521 (2.4694)	Entropy 0.58526 (0.58666)	Top-1 acc 64.453 (64.460)	Top-5 acc 85.547 (84.325)	lr 0.00550
Train [83][2300/3239]	Time 0.336 (0.990)	Data Time 0.003 (0.457)	Loss 2.5021 (2.4695)	Entropy 0.58552 (0.58666)	Top-1 acc 64.062 (64.456)	Top-5 acc 83.984 (84.324)	lr 0.00550
Train [83][2310/3239]	Time 0.392 (0.989)	Data Time 0.001 (0.456)	Loss 2.3947 (2.4694)	Entropy 0.58536 (0.58665)	Top-1 acc 67.969 (64.458)	Top-5 acc 85.938 (84.326)	lr 0.00550
Train [83][2320/3239]	Time 0.249 (0.990)	Data Time 0.001 (0.458)	Loss 2.5551 (2.4694)	Entropy 0.58562 (0.58665)	Top-1 acc 61.328 (64.455)	Top-5 acc 82.812 (84.325)	lr 0.00550
Train [83][2330/3239]	Time 3.312 (0.994)	Data Time 3.031 (0.462)	Loss 2.4165 (2.4695)	Entropy 0.58555 (0.58664)	Top-1 acc 64.453 (64.448)	Top-5 acc 85.156 (84.323)	lr 0.00550
Train [83][2340/3239]	Time 0.252 (0.995)	Data Time 0.001 (0.463)	Loss 2.4683 (2.4694)	Entropy 0.58503 (0.58664)	Top-1 acc 65.234 (64.448)	Top-5 acc 83.984 (84.325)	lr 0.00550
Train [83][2350/3239]	Time 0.256 (0.994)	Data Time 0.001 (0.462)	Loss 2.3984 (2.4694)	Entropy 0.58516 (0.58663)	Top-1 acc 65.625 (64.447)	Top-5 acc 86.719 (84.323)	lr 0.00549
Train [83][2360/3239]	Time 0.257 (0.997)	Data Time 0.001 (0.466)	Loss 2.5422 (2.4695)	Entropy 0.58486 (0.58662)	Top-1 acc 63.281 (64.446)	Top-5 acc 82.812 (84.323)	lr 0.00549
Train [83][2370/3239]	Time 1.211 (0.996)	Data Time 0.932 (0.465)	Loss 2.3760 (2.4697)	Entropy 0.58505 (0.58662)	Top-1 acc 62.109 (64.440)	Top-5 acc 85.938 (84.320)	lr 0.00549
Train [83][2380/3239]	Time 0.399 (0.994)	Data Time 0.001 (0.464)	Loss 2.3283 (2.4694)	Entropy 0.58513 (0.58661)	Top-1 acc 66.797 (64.442)	Top-5 acc 89.062 (84.328)	lr 0.00549
Train [83][2390/3239]	Time 4.206 (0.995)	Data Time 3.940 (0.465)	Loss 2.2882 (2.4693)	Entropy 0.58495 (0.58660)	Top-1 acc 70.703 (64.446)	Top-5 acc 87.109 (84.332)	lr 0.00549
Train [83][2400/3239]	Time 0.250 (0.994)	Data Time 0.001 (0.464)	Loss 2.5893 (2.4693)	Entropy 0.58533 (0.58660)	Top-1 acc 65.625 (64.443)	Top-5 acc 84.766 (84.332)	lr 0.00549
Train [83][2410/3239]	Time 0.227 (0.992)	Data Time 0.001 (0.463)	Loss 2.5345 (2.4693)	Entropy 0.58509 (0.58659)	Top-1 acc 64.453 (64.441)	Top-5 acc 83.594 (84.334)	lr 0.00549
Train [83][2420/3239]	Time 0.234 (0.991)	Data Time 0.001 (0.462)	Loss 2.5653 (2.4694)	Entropy 0.58489 (0.58659)	Top-1 acc 60.156 (64.437)	Top-5 acc 83.203 (84.329)	lr 0.00549
Train [83][2430/3239]	Time 0.234 (0.991)	Data Time 0.001 (0.463)	Loss 2.5606 (2.4694)	Entropy 0.58465 (0.58658)	Top-1 acc 66.016 (64.439)	Top-5 acc 85.547 (84.328)	lr 0.00549
Train [83][2440/3239]	Time 0.289 (0.989)	Data Time 0.001 (0.461)	Loss 2.4858 (2.4695)	Entropy 0.58454 (0.58657)	Top-1 acc 64.062 (64.438)	Top-5 acc 86.328 (84.325)	lr 0.00549
Train [83][2450/3239]	Time 0.252 (0.990)	Data Time 0.001 (0.462)	Loss 2.4028 (2.4693)	Entropy 0.58459 (0.58656)	Top-1 acc 64.062 (64.438)	Top-5 acc 87.109 (84.330)	lr 0.00549
Train [83][2460/3239]	Time 0.241 (0.991)	Data Time 0.001 (0.463)	Loss 2.4358 (2.4695)	Entropy 0.58469 (0.58655)	Top-1 acc 64.062 (64.429)	Top-5 acc 86.328 (84.330)	lr 0.00548
Train [83][2470/3239]	Time 0.378 (0.989)	Data Time 0.002 (0.462)	Loss 2.5055 (2.4693)	Entropy 0.58459 (0.58655)	Top-1 acc 64.062 (64.437)	Top-5 acc 84.766 (84.337)	lr 0.00548
Train [83][2480/3239]	Time 0.255 (0.991)	Data Time 0.001 (0.463)	Loss 2.4127 (2.4692)	Entropy 0.58467 (0.58654)	Top-1 acc 64.062 (64.442)	Top-5 acc 85.156 (84.337)	lr 0.00548
Train [83][2490/3239]	Time 5.798 (0.994)	Data Time 5.525 (0.467)	Loss 2.4675 (2.4691)	Entropy 0.58456 (0.58653)	Top-1 acc 64.062 (64.441)	Top-5 acc 82.812 (84.336)	lr 0.00548
Train [83][2500/3239]	Time 0.245 (0.994)	Data Time 0.002 (0.467)	Loss 2.4222 (2.4688)	Entropy 0.58479 (0.58652)	Top-1 acc 65.234 (64.446)	Top-5 acc 85.938 (84.342)	lr 0.00548
Train [83][2510/3239]	Time 0.250 (0.995)	Data Time 0.001 (0.469)	Loss 2.4553 (2.4686)	Entropy 0.58472 (0.58652)	Top-1 acc 64.062 (64.447)	Top-5 acc 85.156 (84.344)	lr 0.00548
Train [83][2520/3239]	Time 0.263 (0.996)	Data Time 0.002 (0.470)	Loss 2.4884 (2.4687)	Entropy 0.58512 (0.58651)	Top-1 acc 64.453 (64.447)	Top-5 acc 83.203 (84.346)	lr 0.00548
Train [83][2530/3239]	Time 0.231 (0.998)	Data Time 0.001 (0.472)	Loss 2.4822 (2.4688)	Entropy 0.58493 (0.58650)	Top-1 acc 63.281 (64.443)	Top-5 acc 83.594 (84.344)	lr 0.00548
Train [83][2540/3239]	Time 0.363 (0.999)	Data Time 0.001 (0.474)	Loss 2.6099 (2.4689)	Entropy 0.58496 (0.58650)	Top-1 acc 62.109 (64.444)	Top-5 acc 80.078 (84.343)	lr 0.00548
Train [83][2550/3239]	Time 6.697 (1.000)	Data Time 6.426 (0.475)	Loss 2.7157 (2.4687)	Entropy 0.58482 (0.58649)	Top-1 acc 57.422 (64.447)	Top-5 acc 76.953 (84.347)	lr 0.00548
Train [83][2560/3239]	Time 0.238 (1.001)	Data Time 0.001 (0.476)	Loss 2.7389 (2.4690)	Entropy 0.58485 (0.58649)	Top-1 acc 57.812 (64.441)	Top-5 acc 81.250 (84.342)	lr 0.00548
Train [83][2570/3239]	Time 0.248 (1.001)	Data Time 0.001 (0.476)	Loss 2.4578 (2.4692)	Entropy 0.58442 (0.58648)	Top-1 acc 67.969 (64.442)	Top-5 acc 83.594 (84.338)	lr 0.00548
Train [83][2580/3239]	Time 0.259 (1.002)	Data Time 0.001 (0.478)	Loss 2.1542 (2.4691)	Entropy 0.58432 (0.58647)	Top-1 acc 71.484 (64.447)	Top-5 acc 88.672 (84.341)	lr 0.00547
Train [83][2590/3239]	Time 0.233 (1.007)	Data Time 0.001 (0.483)	Loss 2.4117 (2.4694)	Entropy 0.58408 (0.58646)	Top-1 acc 64.062 (64.437)	Top-5 acc 83.984 (84.334)	lr 0.00547
Train [83][2600/3239]	Time 4.020 (1.006)	Data Time 3.757 (0.483)	Loss 2.7208 (2.4693)	Entropy 0.58427 (0.58645)	Top-1 acc 58.984 (64.441)	Top-5 acc 77.734 (84.337)	lr 0.00547
Train [83][2610/3239]	Time 0.282 (1.009)	Data Time 0.002 (0.485)	Loss 2.4219 (2.4693)	Entropy 0.58466 (0.58645)	Top-1 acc 66.016 (64.440)	Top-5 acc 82.812 (84.336)	lr 0.00547
Train [83][2620/3239]	Time 0.241 (1.011)	Data Time 0.001 (0.489)	Loss 2.8484 (2.4696)	Entropy 0.58472 (0.58644)	Top-1 acc 57.422 (64.430)	Top-5 acc 78.125 (84.328)	lr 0.00547
Train [83][2630/3239]	Time 0.294 (1.009)	Data Time 0.002 (0.487)	Loss 2.4372 (2.4696)	Entropy 0.58469 (0.58643)	Top-1 acc 62.891 (64.431)	Top-5 acc 85.547 (84.328)	lr 0.00547
Train [83][2640/3239]	Time 0.229 (1.011)	Data Time 0.001 (0.489)	Loss 2.3873 (2.4697)	Entropy 0.58493 (0.58643)	Top-1 acc 65.234 (64.430)	Top-5 acc 86.719 (84.329)	lr 0.00547
Train [83][2650/3239]	Time 0.259 (1.012)	Data Time 0.001 (0.489)	Loss 2.3990 (2.4695)	Entropy 0.58487 (0.58642)	Top-1 acc 65.234 (64.434)	Top-5 acc 84.766 (84.334)	lr 0.00547
Train [83][2660/3239]	Time 0.272 (1.011)	Data Time 0.002 (0.490)	Loss 2.3956 (2.4694)	Entropy 0.58475 (0.58641)	Top-1 acc 66.016 (64.433)	Top-5 acc 87.500 (84.335)	lr 0.00547
Train [83][2670/3239]	Time 0.239 (1.013)	Data Time 0.001 (0.492)	Loss 2.3589 (2.4693)	Entropy 0.58500 (0.58641)	Top-1 acc 66.016 (64.435)	Top-5 acc 85.547 (84.336)	lr 0.00547
Train [83][2680/3239]	Time 0.229 (1.011)	Data Time 0.001 (0.490)	Loss 2.3167 (2.4692)	Entropy 0.58481 (0.58640)	Top-1 acc 70.703 (64.439)	Top-5 acc 86.328 (84.338)	lr 0.00547
Train [83][2690/3239]	Time 0.780 (1.011)	Data Time 0.542 (0.490)	Loss 2.4544 (2.4693)	Entropy 0.58478 (0.58640)	Top-1 acc 64.844 (64.434)	Top-5 acc 83.984 (84.337)	lr 0.00547
Train [83][2700/3239]	Time 0.355 (1.013)	Data Time 0.001 (0.493)	Loss 2.4120 (2.4692)	Entropy 0.58475 (0.58639)	Top-1 acc 66.016 (64.439)	Top-5 acc 83.594 (84.339)	lr 0.00546
Train [83][2710/3239]	Time 0.302 (1.011)	Data Time 0.002 (0.491)	Loss 2.4854 (2.4693)	Entropy 0.58464 (0.58638)	Top-1 acc 65.234 (64.436)	Top-5 acc 85.547 (84.337)	lr 0.00546
Train [83][2720/3239]	Time 0.241 (1.012)	Data Time 0.001 (0.492)	Loss 2.3904 (2.4692)	Entropy 0.58479 (0.58638)	Top-1 acc 64.844 (64.435)	Top-5 acc 85.938 (84.337)	lr 0.00546
Train [83][2730/3239]	Time 0.233 (1.011)	Data Time 0.001 (0.491)	Loss 2.4239 (2.4694)	Entropy 0.58512 (0.58637)	Top-1 acc 65.234 (64.432)	Top-5 acc 86.328 (84.331)	lr 0.00546
Train [83][2740/3239]	Time 0.241 (1.011)	Data Time 0.001 (0.492)	Loss 2.5435 (2.4693)	Entropy 0.58512 (0.58637)	Top-1 acc 61.328 (64.434)	Top-5 acc 82.812 (84.333)	lr 0.00546
Train [83][2750/3239]	Time 0.246 (1.012)	Data Time 0.001 (0.493)	Loss 2.3811 (2.4693)	Entropy 0.58501 (0.58636)	Top-1 acc 69.141 (64.435)	Top-5 acc 85.938 (84.331)	lr 0.00546
Train [83][2760/3239]	Time 0.299 (1.011)	Data Time 0.002 (0.492)	Loss 2.4072 (2.4691)	Entropy 0.58457 (0.58636)	Top-1 acc 66.797 (64.437)	Top-5 acc 85.156 (84.331)	lr 0.00546
Train [83][2770/3239]	Time 0.407 (1.012)	Data Time 0.001 (0.493)	Loss 2.1907 (2.4692)	Entropy 0.58467 (0.58635)	Top-1 acc 70.703 (64.437)	Top-5 acc 89.062 (84.331)	lr 0.00546
Train [83][2780/3239]	Time 0.226 (1.013)	Data Time 0.001 (0.495)	Loss 2.3712 (2.4693)	Entropy 0.58489 (0.58635)	Top-1 acc 65.234 (64.434)	Top-5 acc 87.891 (84.332)	lr 0.00546
Train [83][2790/3239]	Time 2.121 (1.012)	Data Time 1.868 (0.494)	Loss 2.4271 (2.4696)	Entropy 0.58459 (0.58634)	Top-1 acc 65.625 (64.429)	Top-5 acc 84.375 (84.324)	lr 0.00546
Train [83][2800/3239]	Time 0.269 (1.011)	Data Time 0.001 (0.493)	Loss 2.7637 (2.4695)	Entropy 0.58432 (0.58633)	Top-1 acc 58.594 (64.432)	Top-5 acc 80.859 (84.326)	lr 0.00546
Train [83][2810/3239]	Time 0.242 (1.014)	Data Time 0.001 (0.496)	Loss 2.5140 (2.4697)	Entropy 0.58445 (0.58633)	Top-1 acc 60.156 (64.429)	Top-5 acc 84.766 (84.324)	lr 0.00546
Train [83][2820/3239]	Time 0.237 (1.012)	Data Time 0.001 (0.495)	Loss 2.4332 (2.4697)	Entropy 0.58440 (0.58632)	Top-1 acc 65.625 (64.431)	Top-5 acc 86.328 (84.323)	lr 0.00545
Train [83][2830/3239]	Time 0.248 (1.012)	Data Time 0.001 (0.496)	Loss 2.5231 (2.4699)	Entropy 0.58427 (0.58631)	Top-1 acc 63.672 (64.429)	Top-5 acc 82.812 (84.323)	lr 0.00545
Train [83][2840/3239]	Time 0.270 (1.030)	Data Time 0.010 (0.494)	Loss 2.3853 (2.4698)	Entropy 0.58429 (0.58631)	Top-1 acc 67.188 (64.430)	Top-5 acc 87.500 (84.323)	lr 0.00545
Train [83][2850/3239]	Time 0.236 (1.029)	Data Time 0.002 (0.493)	Loss 2.3524 (2.4697)	Entropy 0.58432 (0.58630)	Top-1 acc 65.625 (64.435)	Top-5 acc 86.719 (84.323)	lr 0.00545
Train [83][2860/3239]	Time 0.360 (1.026)	Data Time 0.001 (0.491)	Loss 2.3436 (2.4696)	Entropy 0.58459 (0.58629)	Top-1 acc 66.016 (64.434)	Top-5 acc 87.500 (84.323)	lr 0.00545
Train [83][2870/3239]	Time 0.252 (1.024)	Data Time 0.001 (0.489)	Loss 2.4530 (2.4698)	Entropy 0.58460 (0.58629)	Top-1 acc 64.453 (64.428)	Top-5 acc 84.375 (84.318)	lr 0.00545
Train [83][2880/3239]	Time 0.252 (1.022)	Data Time 0.001 (0.488)	Loss 2.4273 (2.4698)	Entropy 0.58429 (0.58628)	Top-1 acc 67.188 (64.429)	Top-5 acc 85.547 (84.318)	lr 0.00545
Train [83][2890/3239]	Time 0.243 (1.020)	Data Time 0.001 (0.486)	Loss 2.3173 (2.4699)	Entropy 0.58434 (0.58627)	Top-1 acc 66.797 (64.422)	Top-5 acc 88.281 (84.320)	lr 0.00545
Train [83][2900/3239]	Time 0.247 (1.018)	Data Time 0.001 (0.484)	Loss 2.4675 (2.4702)	Entropy 0.58444 (0.58627)	Top-1 acc 64.844 (64.415)	Top-5 acc 82.031 (84.312)	lr 0.00545
Train [83][2910/3239]	Time 0.258 (1.016)	Data Time 0.001 (0.483)	Loss 2.5863 (2.4703)	Entropy 0.58462 (0.58626)	Top-1 acc 63.281 (64.415)	Top-5 acc 82.031 (84.311)	lr 0.00545
Train [83][2920/3239]	Time 0.259 (1.016)	Data Time 0.001 (0.483)	Loss 2.2551 (2.4699)	Entropy 0.58450 (0.58626)	Top-1 acc 69.531 (64.422)	Top-5 acc 87.891 (84.318)	lr 0.00545
Train [83][2930/3239]	Time 0.250 (1.015)	Data Time 0.001 (0.481)	Loss 2.5659 (2.4700)	Entropy 0.58460 (0.58625)	Top-1 acc 62.500 (64.422)	Top-5 acc 82.031 (84.316)	lr 0.00545
Train [83][2940/3239]	Time 0.258 (1.016)	Data Time 0.002 (0.483)	Loss 2.5602 (2.4699)	Entropy 0.58459 (0.58624)	Top-1 acc 58.594 (64.425)	Top-5 acc 82.812 (84.317)	lr 0.00544
Train [83][2950/3239]	Time 0.258 (1.017)	Data Time 0.001 (0.484)	Loss 2.4831 (2.4699)	Entropy 0.58456 (0.58624)	Top-1 acc 65.625 (64.427)	Top-5 acc 83.203 (84.318)	lr 0.00544
Train [83][2960/3239]	Time 0.244 (1.016)	Data Time 0.001 (0.483)	Loss 2.7084 (2.4700)	Entropy 0.58489 (0.58623)	Top-1 acc 60.547 (64.426)	Top-5 acc 82.422 (84.316)	lr 0.00544
Train [83][2970/3239]	Time 0.258 (1.015)	Data Time 0.001 (0.483)	Loss 2.5168 (2.4700)	Entropy 0.58502 (0.58623)	Top-1 acc 62.109 (64.428)	Top-5 acc 83.203 (84.316)	lr 0.00544
Train [83][2980/3239]	Time 0.247 (1.020)	Data Time 0.001 (0.488)	Loss 2.3284 (2.4701)	Entropy 0.58533 (0.58622)	Top-1 acc 66.406 (64.424)	Top-5 acc 87.891 (84.313)	lr 0.00544
Train [83][2990/3239]	Time 0.253 (1.018)	Data Time 0.001 (0.486)	Loss 2.4033 (2.4700)	Entropy 0.58559 (0.58622)	Top-1 acc 63.281 (64.426)	Top-5 acc 87.109 (84.315)	lr 0.00544
Train [83][3000/3239]	Time 0.252 (1.016)	Data Time 0.001 (0.484)	Loss 2.5506 (2.4700)	Entropy 0.58551 (0.58622)	Top-1 acc 64.062 (64.426)	Top-5 acc 82.422 (84.317)	lr 0.00544
Train [83][3010/3239]	Time 4.733 (1.019)	Data Time 4.477 (0.488)	Loss 2.6310 (2.4701)	Entropy 0.58561 (0.58622)	Top-1 acc 63.672 (64.427)	Top-5 acc 83.594 (84.316)	lr 0.00544
Train [83][3020/3239]	Time 0.360 (1.020)	Data Time 0.001 (0.489)	Loss 2.3028 (2.4698)	Entropy 0.58545 (0.58621)	Top-1 acc 67.578 (64.435)	Top-5 acc 85.156 (84.322)	lr 0.00544
Train [83][3030/3239]	Time 0.274 (1.018)	Data Time 0.001 (0.487)	Loss 2.4410 (2.4697)	Entropy 0.58548 (0.58621)	Top-1 acc 62.891 (64.434)	Top-5 acc 85.547 (84.326)	lr 0.00544
Train [83][3040/3239]	Time 2.341 (1.019)	Data Time 2.076 (0.489)	Loss 2.6320 (2.4698)	Entropy 0.58548 (0.58621)	Top-1 acc 61.328 (64.429)	Top-5 acc 78.906 (84.320)	lr 0.00544
Train [83][3050/3239]	Time 0.247 (1.023)	Data Time 0.001 (0.492)	Loss 2.6099 (2.4700)	Entropy 0.58514 (0.58621)	Top-1 acc 63.672 (64.431)	Top-5 acc 80.859 (84.316)	lr 0.00544
Train [83][3060/3239]	Time 0.239 (1.021)	Data Time 0.001 (0.491)	Loss 2.5540 (2.4700)	Entropy 0.58566 (0.58620)	Top-1 acc 58.594 (64.426)	Top-5 acc 83.594 (84.317)	lr 0.00543
Train [83][3070/3239]	Time 2.474 (1.019)	Data Time 2.220 (0.490)	Loss 2.6556 (2.4700)	Entropy 0.58579 (0.58620)	Top-1 acc 62.109 (64.429)	Top-5 acc 80.859 (84.315)	lr 0.00543
Train [83][3080/3239]	Time 0.235 (1.024)	Data Time 0.001 (0.495)	Loss 2.3199 (2.4699)	Entropy 0.58579 (0.58620)	Top-1 acc 67.578 (64.429)	Top-5 acc 85.938 (84.317)	lr 0.00543
Train [83][3090/3239]	Time 0.424 (1.022)	Data Time 0.001 (0.493)	Loss 2.3046 (2.4697)	Entropy 0.58578 (0.58620)	Top-1 acc 67.578 (64.433)	Top-5 acc 86.719 (84.320)	lr 0.00543
Train [83][3100/3239]	Time 0.249 (1.020)	Data Time 0.002 (0.491)	Loss 2.2294 (2.4698)	Entropy 0.58597 (0.58620)	Top-1 acc 69.922 (64.432)	Top-5 acc 87.109 (84.318)	lr 0.00543
Train [83][3110/3239]	Time 0.239 (1.025)	Data Time 0.001 (0.497)	Loss 2.2800 (2.4698)	Entropy 0.58568 (0.58620)	Top-1 acc 64.844 (64.427)	Top-5 acc 87.500 (84.317)	lr 0.00543
Train [83][3120/3239]	Time 0.269 (1.023)	Data Time 0.002 (0.496)	Loss 2.4565 (2.4696)	Entropy 0.58579 (0.58620)	Top-1 acc 66.016 (64.431)	Top-5 acc 84.375 (84.322)	lr 0.00543
Train [83][3130/3239]	Time 0.247 (1.022)	Data Time 0.001 (0.494)	Loss 2.5053 (2.4699)	Entropy 0.58579 (0.58620)	Top-1 acc 65.234 (64.428)	Top-5 acc 85.547 (84.318)	lr 0.00543
Train [83][3140/3239]	Time 0.261 (1.028)	Data Time 0.002 (0.500)	Loss 2.3472 (2.4698)	Entropy 0.58584 (0.58619)	Top-1 acc 68.359 (64.430)	Top-5 acc 88.281 (84.321)	lr 0.00543
Train [83][3150/3239]	Time 0.269 (1.026)	Data Time 0.001 (0.498)	Loss 2.4995 (2.4699)	Entropy 0.58564 (0.58619)	Top-1 acc 62.109 (64.425)	Top-5 acc 83.594 (84.320)	lr 0.00543
Train [83][3160/3239]	Time 0.241 (1.024)	Data Time 0.001 (0.497)	Loss 2.5533 (2.4700)	Entropy 0.58556 (0.58619)	Top-1 acc 62.109 (64.423)	Top-5 acc 84.375 (84.316)	lr 0.00543
Train [83][3170/3239]	Time 0.240 (1.026)	Data Time 0.001 (0.500)	Loss 2.5034 (2.4700)	Entropy 0.58547 (0.58619)	Top-1 acc 64.453 (64.424)	Top-5 acc 82.031 (84.316)	lr 0.00543
Train [83][3180/3239]	Time 0.400 (1.027)	Data Time 0.000 (0.500)	Loss 2.4581 (2.4698)	Entropy 0.58550 (0.58619)	Top-1 acc 64.453 (64.430)	Top-5 acc 83.203 (84.319)	lr 0.00542
Train [83][3190/3239]	Time 0.241 (1.025)	Data Time 0.000 (0.499)	Loss 2.3572 (2.4698)	Entropy 0.58493 (0.58618)	Top-1 acc 64.844 (64.430)	Top-5 acc 85.156 (84.317)	lr 0.00542
Train [83][3200/3239]	Time 0.289 (1.028)	Data Time 0.000 (0.502)	Loss 2.5841 (2.4698)	Entropy 0.58501 (0.58618)	Top-1 acc 63.672 (64.432)	Top-5 acc 81.641 (84.317)	lr 0.00542
Train [83][3210/3239]	Time 0.276 (1.028)	Data Time 0.000 (0.503)	Loss 2.5891 (2.4697)	Entropy 0.58515 (0.58618)	Top-1 acc 58.984 (64.433)	Top-5 acc 82.812 (84.318)	lr 0.00542
Train [83][3220/3239]	Time 0.230 (1.026)	Data Time 0.000 (0.501)	Loss 2.5591 (2.4698)	Entropy 0.58525 (0.58617)	Top-1 acc 62.891 (64.433)	Top-5 acc 80.469 (84.317)	lr 0.00542
Train [83][3230/3239]	Time 0.239 (1.025)	Data Time 0.000 (0.500)	Loss 2.2744 (2.4698)	Entropy 0.58526 (0.58617)	Top-1 acc 69.141 (64.435)	Top-5 acc 87.891 (84.317)	lr 0.00542
Train [83][3239/3239]	Time 0.960 (1.027)	Data Time 0.000 (0.502)	Loss 2.7578 (2.4699)	Entropy 0.58520 (0.58617)	Top-1 acc 54.321 (64.432)	Top-5 acc 83.951 (84.316)	lr 0.00542
==========Valid [83/120]	loss 1.263	top-1 acc 71.027 (71.027)	top-5 acc 89.457	Train top-1 64.432	top-5 84.316	Entropy 0.58520	Latency-None: 0.000ms	Flops: 539.00M
Train [84][0/3239]	Time 62.615 (62.615)	Data Time 61.676 (61.676)	Loss 2.4793 (2.4793)	Entropy 0.58502 (0.58502)	Top-1 acc 62.891 (62.891)	Top-5 acc 80.859 (80.859)	lr 0.00542
Train [84][10/3239]	Time 0.289 (6.339)	Data Time 0.001 (5.777)	Loss 2.3359 (2.4115)	Entropy 0.58519 (0.58503)	Top-1 acc 66.016 (64.702)	Top-5 acc 86.328 (85.014)	lr 0.00542
Train [84][20/3239]	Time 0.248 (3.581)	Data Time 0.001 (3.059)	Loss 2.4194 (2.4098)	Entropy 0.58516 (0.58512)	Top-1 acc 66.016 (65.346)	Top-5 acc 83.594 (85.082)	lr 0.00542
Train [84][30/3239]	Time 0.286 (2.560)	Data Time 0.001 (2.073)	Loss 2.5257 (2.4421)	Entropy 0.58515 (0.58516)	Top-1 acc 61.719 (64.856)	Top-5 acc 84.766 (84.539)	lr 0.00542
Train [84][40/3239]	Time 0.242 (2.358)	Data Time 0.001 (1.865)	Loss 2.4847 (2.4505)	Entropy 0.58503 (0.58517)	Top-1 acc 64.844 (64.663)	Top-5 acc 85.156 (84.470)	lr 0.00542
Train [84][50/3239]	Time 0.284 (2.016)	Data Time 0.002 (1.536)	Loss 2.2339 (2.4553)	Entropy 0.58518 (0.58514)	Top-1 acc 70.703 (64.591)	Top-5 acc 87.891 (84.360)	lr 0.00542
Train [84][60/3239]	Time 0.244 (1.764)	Data Time 0.001 (1.285)	Loss 2.4645 (2.4511)	Entropy 0.58519 (0.58515)	Top-1 acc 64.062 (64.549)	Top-5 acc 82.812 (84.458)	lr 0.00541
Train [84][70/3239]	Time 0.262 (1.755)	Data Time 0.003 (1.279)	Loss 2.5117 (2.4490)	Entropy 0.58528 (0.58515)	Top-1 acc 61.719 (64.596)	Top-5 acc 85.156 (84.601)	lr 0.00541
Train [84][80/3239]	Time 0.360 (1.625)	Data Time 0.001 (1.152)	Loss 2.4050 (2.4452)	Entropy 0.58481 (0.58515)	Top-1 acc 68.359 (64.723)	Top-5 acc 83.594 (84.684)	lr 0.00541
Train [84][90/3239]	Time 0.242 (1.493)	Data Time 0.001 (1.026)	Loss 2.4338 (2.4467)	Entropy 0.58468 (0.58510)	Top-1 acc 65.625 (64.848)	Top-5 acc 85.156 (84.551)	lr 0.00541
Train [84][100/3239]	Time 0.303 (1.538)	Data Time 0.001 (1.073)	Loss 2.4160 (2.4405)	Entropy 0.58476 (0.58507)	Top-1 acc 66.797 (65.064)	Top-5 acc 84.375 (84.684)	lr 0.00541
Train [84][110/3239]	Time 0.247 (1.473)	Data Time 0.001 (1.008)	Loss 2.2758 (2.4388)	Entropy 0.58474 (0.58504)	Top-1 acc 67.188 (65.094)	Top-5 acc 87.109 (84.730)	lr 0.00541
Train [84][120/3239]	Time 0.247 (1.387)	Data Time 0.001 (0.925)	Loss 2.4778 (2.4387)	Entropy 0.58445 (0.58501)	Top-1 acc 64.062 (65.050)	Top-5 acc 85.156 (84.782)	lr 0.00541
Train [84][130/3239]	Time 0.241 (1.433)	Data Time 0.001 (0.971)	Loss 2.4946 (2.4457)	Entropy 0.58451 (0.58497)	Top-1 acc 65.625 (64.915)	Top-5 acc 82.812 (84.706)	lr 0.00541
Train [84][140/3239]	Time 0.258 (1.401)	Data Time 0.001 (0.940)	Loss 2.5264 (2.4423)	Entropy 0.58453 (0.58493)	Top-1 acc 65.234 (65.101)	Top-5 acc 83.594 (84.724)	lr 0.00541
Train [84][150/3239]	Time 0.367 (1.338)	Data Time 0.001 (0.878)	Loss 2.7184 (2.4473)	Entropy 0.58447 (0.58491)	Top-1 acc 60.547 (64.976)	Top-5 acc 80.469 (84.641)	lr 0.00541
Train [84][160/3239]	Time 18.571 (1.395)	Data Time 18.313 (0.937)	Loss 2.3952 (2.4482)	Entropy 0.58445 (0.58488)	Top-1 acc 66.797 (64.999)	Top-5 acc 85.547 (84.603)	lr 0.00541
Train [84][170/3239]	Time 0.240 (1.356)	Data Time 0.001 (0.898)	Loss 2.3811 (2.4518)	Entropy 0.58443 (0.58485)	Top-1 acc 67.188 (64.917)	Top-5 acc 87.109 (84.546)	lr 0.00541
Train [84][180/3239]	Time 0.255 (1.305)	Data Time 0.001 (0.849)	Loss 2.2237 (2.4486)	Entropy 0.58459 (0.58483)	Top-1 acc 72.266 (64.986)	Top-5 acc 89.062 (84.628)	lr 0.00540
Train [84][190/3239]	Time 0.260 (1.260)	Data Time 0.001 (0.804)	Loss 2.3696 (2.4464)	Entropy 0.58471 (0.58482)	Top-1 acc 67.578 (65.030)	Top-5 acc 85.156 (84.682)	lr 0.00540
Train [84][200/3239]	Time 0.329 (1.335)	Data Time 0.001 (0.879)	Loss 2.2585 (2.4499)	Entropy 0.58454 (0.58481)	Top-1 acc 71.094 (64.943)	Top-5 acc 85.156 (84.618)	lr 0.00540
Train [84][210/3239]	Time 0.257 (1.292)	Data Time 0.001 (0.837)	Loss 2.4751 (2.4492)	Entropy 0.58474 (0.58480)	Top-1 acc 68.359 (64.920)	Top-5 acc 83.594 (84.666)	lr 0.00540
Train [84][220/3239]	Time 0.231 (1.253)	Data Time 0.001 (0.800)	Loss 2.3220 (2.4516)	Entropy 0.58477 (0.58480)	Top-1 acc 70.703 (64.833)	Top-5 acc 87.109 (84.605)	lr 0.00540
Train [84][230/3239]	Time 0.237 (1.324)	Data Time 0.001 (0.872)	Loss 2.4915 (2.4517)	Entropy 0.58464 (0.58480)	Top-1 acc 62.891 (64.830)	Top-5 acc 85.547 (84.605)	lr 0.00540
Train [84][240/3239]	Time 0.350 (1.294)	Data Time 0.001 (0.842)	Loss 2.4596 (2.4513)	Entropy 0.58479 (0.58480)	Top-1 acc 63.672 (64.834)	Top-5 acc 84.766 (84.612)	lr 0.00540
Train [84][250/3239]	Time 0.244 (1.260)	Data Time 0.001 (0.809)	Loss 2.3703 (2.4502)	Entropy 0.58469 (0.58480)	Top-1 acc 67.188 (64.872)	Top-5 acc 86.719 (84.647)	lr 0.00540
Train [84][260/3239]	Time 0.233 (1.452)	Data Time 0.002 (0.778)	Loss 2.4294 (2.4487)	Entropy 0.58482 (0.58479)	Top-1 acc 62.500 (64.920)	Top-5 acc 83.594 (84.656)	lr 0.00540
Train [84][270/3239]	Time 0.277 (1.415)	Data Time 0.002 (0.749)	Loss 2.3273 (2.4500)	Entropy 0.58432 (0.58479)	Top-1 acc 67.969 (64.868)	Top-5 acc 89.453 (84.633)	lr 0.00540
Train [84][280/3239]	Time 0.234 (1.381)	Data Time 0.001 (0.723)	Loss 2.4950 (2.4498)	Entropy 0.58449 (0.58477)	Top-1 acc 63.672 (64.841)	Top-5 acc 83.984 (84.639)	lr 0.00540
Train [84][290/3239]	Time 0.248 (1.349)	Data Time 0.002 (0.698)	Loss 2.2501 (2.4486)	Entropy 0.58456 (0.58477)	Top-1 acc 71.094 (64.891)	Top-5 acc 87.891 (84.664)	lr 0.00540
Train [84][300/3239]	Time 0.243 (1.318)	Data Time 0.002 (0.675)	Loss 2.4962 (2.4490)	Entropy 0.58426 (0.58476)	Top-1 acc 61.328 (64.835)	Top-5 acc 84.766 (84.689)	lr 0.00539
Train [84][310/3239]	Time 0.346 (1.290)	Data Time 0.002 (0.653)	Loss 2.4747 (2.4472)	Entropy 0.58431 (0.58474)	Top-1 acc 60.156 (64.874)	Top-5 acc 83.984 (84.714)	lr 0.00539
Train [84][320/3239]	Time 0.254 (1.263)	Data Time 0.002 (0.633)	Loss 2.3219 (2.4499)	Entropy 0.58457 (0.58473)	Top-1 acc 67.578 (64.817)	Top-5 acc 87.891 (84.662)	lr 0.00539
Train [84][330/3239]	Time 0.260 (1.257)	Data Time 0.002 (0.631)	Loss 2.6178 (2.4515)	Entropy 0.58449 (0.58473)	Top-1 acc 60.547 (64.771)	Top-5 acc 80.078 (84.649)	lr 0.00539
Train [84][340/3239]	Time 0.270 (1.255)	Data Time 0.003 (0.634)	Loss 2.6140 (2.4516)	Entropy 0.58459 (0.58472)	Top-1 acc 62.891 (64.769)	Top-5 acc 82.031 (84.661)	lr 0.00539
Train [84][350/3239]	Time 0.242 (1.232)	Data Time 0.001 (0.616)	Loss 2.2284 (2.4517)	Entropy 0.58462 (0.58472)	Top-1 acc 70.312 (64.759)	Top-5 acc 87.500 (84.648)	lr 0.00539
Train [84][360/3239]	Time 0.266 (1.267)	Data Time 0.002 (0.655)	Loss 2.4012 (2.4520)	Entropy 0.58423 (0.58471)	Top-1 acc 63.281 (64.755)	Top-5 acc 83.594 (84.629)	lr 0.00539
Train [84][370/3239]	Time 0.242 (1.244)	Data Time 0.001 (0.638)	Loss 2.5158 (2.4523)	Entropy 0.58436 (0.58470)	Top-1 acc 63.672 (64.784)	Top-5 acc 81.641 (84.615)	lr 0.00539
Train [84][380/3239]	Time 0.251 (1.237)	Data Time 0.001 (0.634)	Loss 2.4530 (2.4523)	Entropy 0.58449 (0.58469)	Top-1 acc 63.281 (64.776)	Top-5 acc 84.766 (84.620)	lr 0.00539
Train [84][390/3239]	Time 0.252 (1.273)	Data Time 0.001 (0.674)	Loss 2.4038 (2.4513)	Entropy 0.58432 (0.58468)	Top-1 acc 66.797 (64.780)	Top-5 acc 82.422 (84.639)	lr 0.00539
Train [84][400/3239]	Time 0.340 (1.256)	Data Time 0.001 (0.661)	Loss 2.4383 (2.4528)	Entropy 0.58417 (0.58467)	Top-1 acc 64.453 (64.730)	Top-5 acc 86.719 (84.611)	lr 0.00539
Train [84][410/3239]	Time 0.258 (1.256)	Data Time 0.001 (0.664)	Loss 2.3488 (2.4533)	Entropy 0.58399 (0.58466)	Top-1 acc 67.969 (64.731)	Top-5 acc 85.938 (84.590)	lr 0.00539
Train [84][420/3239]	Time 0.263 (1.275)	Data Time 0.001 (0.687)	Loss 2.5833 (2.4545)	Entropy 0.58381 (0.58464)	Top-1 acc 59.766 (64.714)	Top-5 acc 82.422 (84.560)	lr 0.00539
Train [84][430/3239]	Time 5.381 (1.277)	Data Time 5.112 (0.692)	Loss 2.4462 (2.4533)	Entropy 0.58368 (0.58462)	Top-1 acc 62.109 (64.711)	Top-5 acc 82.812 (84.566)	lr 0.00538
Train [84][440/3239]	Time 0.250 (1.261)	Data Time 0.001 (0.680)	Loss 2.5626 (2.4526)	Entropy 0.58340 (0.58460)	Top-1 acc 61.328 (64.747)	Top-5 acc 85.156 (84.575)	lr 0.00538
Train [84][450/3239]	Time 0.299 (1.269)	Data Time 0.002 (0.691)	Loss 2.3653 (2.4535)	Entropy 0.58355 (0.58457)	Top-1 acc 67.578 (64.733)	Top-5 acc 83.984 (84.556)	lr 0.00538
Train [84][460/3239]	Time 2.137 (1.273)	Data Time 1.893 (0.698)	Loss 2.5391 (2.4530)	Entropy 0.58324 (0.58455)	Top-1 acc 64.453 (64.743)	Top-5 acc 85.547 (84.578)	lr 0.00538
Train [84][470/3239]	Time 9.469 (1.282)	Data Time 9.122 (0.710)	Loss 3.0064 (2.4551)	Entropy 0.58350 (0.58453)	Top-1 acc 57.031 (64.703)	Top-5 acc 76.562 (84.543)	lr 0.00538
Train [84][480/3239]	Time 1.374 (1.273)	Data Time 1.135 (0.704)	Loss 2.4677 (2.4558)	Entropy 0.58353 (0.58450)	Top-1 acc 62.891 (64.684)	Top-5 acc 83.594 (84.527)	lr 0.00538
Train [84][490/3239]	Time 1.535 (1.283)	Data Time 1.282 (0.717)	Loss 2.5912 (2.4569)	Entropy 0.58359 (0.58448)	Top-1 acc 60.938 (64.654)	Top-5 acc 81.641 (84.511)	lr 0.00538
Train [84][500/3239]	Time 0.249 (1.280)	Data Time 0.001 (0.716)	Loss 2.4598 (2.4569)	Entropy 0.58369 (0.58446)	Top-1 acc 66.797 (64.650)	Top-5 acc 84.766 (84.511)	lr 0.00538
Train [84][510/3239]	Time 0.238 (1.263)	Data Time 0.001 (0.702)	Loss 2.4483 (2.4578)	Entropy 0.58370 (0.58445)	Top-1 acc 61.719 (64.612)	Top-5 acc 86.328 (84.501)	lr 0.00538
Train [84][520/3239]	Time 0.244 (1.301)	Data Time 0.002 (0.742)	Loss 2.4320 (2.4576)	Entropy 0.58346 (0.58443)	Top-1 acc 65.234 (64.624)	Top-5 acc 85.156 (84.499)	lr 0.00538
Train [84][530/3239]	Time 3.837 (1.292)	Data Time 3.572 (0.735)	Loss 2.4382 (2.4586)	Entropy 0.58378 (0.58442)	Top-1 acc 63.281 (64.602)	Top-5 acc 86.719 (84.494)	lr 0.00538
Train [84][540/3239]	Time 4.094 (1.283)	Data Time 3.848 (0.729)	Loss 2.3225 (2.4572)	Entropy 0.58362 (0.58440)	Top-1 acc 66.797 (64.629)	Top-5 acc 87.891 (84.526)	lr 0.00538
Train [84][550/3239]	Time 0.239 (1.308)	Data Time 0.001 (0.756)	Loss 2.4437 (2.4572)	Entropy 0.58367 (0.58439)	Top-1 acc 65.625 (64.627)	Top-5 acc 85.156 (84.517)	lr 0.00537
Train [84][560/3239]	Time 0.291 (1.297)	Data Time 0.001 (0.747)	Loss 2.2698 (2.4574)	Entropy 0.58357 (0.58437)	Top-1 acc 66.406 (64.622)	Top-5 acc 87.500 (84.513)	lr 0.00537
Train [84][570/3239]	Time 1.325 (1.291)	Data Time 1.046 (0.743)	Loss 2.2727 (2.4571)	Entropy 0.58388 (0.58436)	Top-1 acc 68.750 (64.628)	Top-5 acc 89.062 (84.517)	lr 0.00537
Train [84][580/3239]	Time 0.289 (1.313)	Data Time 0.002 (0.767)	Loss 2.4522 (2.4568)	Entropy 0.58369 (0.58435)	Top-1 acc 64.844 (64.634)	Top-5 acc 83.203 (84.526)	lr 0.00537
Train [84][590/3239]	Time 0.253 (1.316)	Data Time 0.002 (0.771)	Loss 2.2569 (2.4556)	Entropy 0.58363 (0.58434)	Top-1 acc 68.750 (64.663)	Top-5 acc 86.328 (84.551)	lr 0.00537
Train [84][600/3239]	Time 0.243 (1.306)	Data Time 0.001 (0.764)	Loss 2.6750 (2.4554)	Entropy 0.58338 (0.58433)	Top-1 acc 60.156 (64.673)	Top-5 acc 80.859 (84.552)	lr 0.00537
Train [84][610/3239]	Time 0.239 (1.317)	Data Time 0.001 (0.776)	Loss 2.3888 (2.4562)	Entropy 0.58338 (0.58431)	Top-1 acc 66.797 (64.642)	Top-5 acc 84.766 (84.539)	lr 0.00537
Train [84][620/3239]	Time 1.570 (1.323)	Data Time 1.323 (0.784)	Loss 2.3695 (2.4561)	Entropy 0.58322 (0.58430)	Top-1 acc 68.359 (64.644)	Top-5 acc 87.500 (84.547)	lr 0.00537
Train [84][630/3239]	Time 0.328 (1.317)	Data Time 0.001 (0.780)	Loss 2.6467 (2.4558)	Entropy 0.58322 (0.58428)	Top-1 acc 59.375 (64.648)	Top-5 acc 82.031 (84.545)	lr 0.00537
Train [84][640/3239]	Time 5.990 (1.327)	Data Time 5.701 (0.792)	Loss 2.3220 (2.4548)	Entropy 0.58324 (0.58426)	Top-1 acc 69.531 (64.673)	Top-5 acc 85.547 (84.561)	lr 0.00537
Train [84][650/3239]	Time 0.242 (1.330)	Data Time 0.001 (0.797)	Loss 2.2828 (2.4552)	Entropy 0.58312 (0.58425)	Top-1 acc 69.922 (64.676)	Top-5 acc 87.500 (84.563)	lr 0.00537
Train [84][660/3239]	Time 0.239 (1.319)	Data Time 0.001 (0.788)	Loss 2.3932 (2.4552)	Entropy 0.58302 (0.58423)	Top-1 acc 68.750 (64.688)	Top-5 acc 84.375 (84.558)	lr 0.00537
Train [84][670/3239]	Time 0.218 (1.312)	Data Time 0.001 (0.782)	Loss 2.7086 (2.4562)	Entropy 0.58284 (0.58421)	Top-1 acc 57.812 (64.663)	Top-5 acc 78.906 (84.530)	lr 0.00536
Train [84][680/3239]	Time 0.258 (1.324)	Data Time 0.002 (0.795)	Loss 2.2817 (2.4556)	Entropy 0.58287 (0.58419)	Top-1 acc 70.312 (64.678)	Top-5 acc 88.672 (84.544)	lr 0.00536
Train [84][690/3239]	Time 0.270 (1.314)	Data Time 0.001 (0.787)	Loss 2.3191 (2.4557)	Entropy 0.58260 (0.58417)	Top-1 acc 67.578 (64.680)	Top-5 acc 88.672 (84.542)	lr 0.00536
Train [84][700/3239]	Time 0.383 (1.309)	Data Time 0.002 (0.783)	Loss 2.5431 (2.4551)	Entropy 0.58262 (0.58415)	Top-1 acc 65.234 (64.712)	Top-5 acc 80.859 (84.554)	lr 0.00536
Train [84][710/3239]	Time 0.246 (1.320)	Data Time 0.001 (0.795)	Loss 2.4318 (2.4553)	Entropy 0.58259 (0.58413)	Top-1 acc 63.672 (64.717)	Top-5 acc 82.031 (84.549)	lr 0.00536
Train [84][720/3239]	Time 0.251 (1.308)	Data Time 0.001 (0.786)	Loss 2.4301 (2.4548)	Entropy 0.58266 (0.58411)	Top-1 acc 64.844 (64.748)	Top-5 acc 83.594 (84.556)	lr 0.00536
Train [84][730/3239]	Time 2.867 (1.310)	Data Time 2.626 (0.789)	Loss 2.5656 (2.4547)	Entropy 0.58237 (0.58408)	Top-1 acc 59.375 (64.743)	Top-5 acc 82.422 (84.562)	lr 0.00536
Train [84][740/3239]	Time 0.271 (1.314)	Data Time 0.001 (0.794)	Loss 2.3544 (2.4547)	Entropy 0.58244 (0.58406)	Top-1 acc 65.625 (64.745)	Top-5 acc 85.156 (84.555)	lr 0.00536
Train [84][750/3239]	Time 0.228 (1.308)	Data Time 0.001 (0.790)	Loss 2.4855 (2.4545)	Entropy 0.58210 (0.58404)	Top-1 acc 66.406 (64.762)	Top-5 acc 84.375 (84.557)	lr 0.00536
Train [84][760/3239]	Time 0.241 (1.309)	Data Time 0.002 (0.791)	Loss 2.3140 (2.4547)	Entropy 0.58196 (0.58401)	Top-1 acc 66.406 (64.756)	Top-5 acc 88.672 (84.555)	lr 0.00536
Train [84][770/3239]	Time 0.235 (1.303)	Data Time 0.001 (0.787)	Loss 2.7573 (2.4553)	Entropy 0.58179 (0.58398)	Top-1 acc 60.156 (64.749)	Top-5 acc 78.906 (84.545)	lr 0.00536
Train [84][780/3239]	Time 0.246 (1.307)	Data Time 0.002 (0.792)	Loss 2.5574 (2.4555)	Entropy 0.58187 (0.58395)	Top-1 acc 59.766 (64.737)	Top-5 acc 82.812 (84.537)	lr 0.00536
Train [84][790/3239]	Time 0.332 (1.314)	Data Time 0.001 (0.801)	Loss 2.2142 (2.4550)	Entropy 0.58194 (0.58393)	Top-1 acc 68.750 (64.747)	Top-5 acc 87.891 (84.541)	lr 0.00535
Train [84][800/3239]	Time 0.242 (1.303)	Data Time 0.001 (0.791)	Loss 2.4373 (2.4548)	Entropy 0.58196 (0.58390)	Top-1 acc 66.016 (64.758)	Top-5 acc 84.766 (84.540)	lr 0.00535
Train [84][810/3239]	Time 0.248 (1.301)	Data Time 0.001 (0.790)	Loss 2.3942 (2.4555)	Entropy 0.58203 (0.58388)	Top-1 acc 67.578 (64.731)	Top-5 acc 86.328 (84.531)	lr 0.00535
Train [84][820/3239]	Time 0.244 (1.291)	Data Time 0.001 (0.780)	Loss 2.4274 (2.4552)	Entropy 0.58183 (0.58385)	Top-1 acc 67.188 (64.731)	Top-5 acc 82.031 (84.530)	lr 0.00535
Train [84][830/3239]	Time 0.242 (1.295)	Data Time 0.001 (0.786)	Loss 2.5749 (2.4559)	Entropy 0.58198 (0.58383)	Top-1 acc 61.719 (64.722)	Top-5 acc 81.250 (84.511)	lr 0.00535
Train [84][840/3239]	Time 0.246 (1.285)	Data Time 0.001 (0.776)	Loss 2.5808 (2.4558)	Entropy 0.58200 (0.58381)	Top-1 acc 60.938 (64.724)	Top-5 acc 81.641 (84.516)	lr 0.00535
Train [84][850/3239]	Time 0.251 (1.275)	Data Time 0.001 (0.767)	Loss 2.4096 (2.4555)	Entropy 0.58183 (0.58378)	Top-1 acc 70.312 (64.743)	Top-5 acc 85.156 (84.524)	lr 0.00535
Train [84][860/3239]	Time 0.331 (1.287)	Data Time 0.001 (0.780)	Loss 2.3590 (2.4559)	Entropy 0.58186 (0.58376)	Top-1 acc 67.578 (64.728)	Top-5 acc 85.547 (84.516)	lr 0.00535
Train [84][870/3239]	Time 0.271 (1.277)	Data Time 0.001 (0.771)	Loss 2.4580 (2.4562)	Entropy 0.58201 (0.58374)	Top-1 acc 65.234 (64.722)	Top-5 acc 85.156 (84.500)	lr 0.00535
Train [84][880/3239]	Time 0.276 (1.267)	Data Time 0.001 (0.762)	Loss 2.6741 (2.4568)	Entropy 0.58198 (0.58372)	Top-1 acc 56.641 (64.692)	Top-5 acc 80.469 (84.496)	lr 0.00535
Train [84][890/3239]	Time 0.240 (1.291)	Data Time 0.001 (0.787)	Loss 2.5844 (2.4568)	Entropy 0.58219 (0.58370)	Top-1 acc 60.156 (64.692)	Top-5 acc 80.859 (84.498)	lr 0.00535
Train [84][900/3239]	Time 0.232 (1.281)	Data Time 0.001 (0.778)	Loss 2.5023 (2.4560)	Entropy 0.58238 (0.58369)	Top-1 acc 63.281 (64.721)	Top-5 acc 82.422 (84.503)	lr 0.00535
Train [84][910/3239]	Time 0.462 (1.332)	Data Time 0.049 (0.769)	Loss 2.4069 (2.4559)	Entropy 0.58240 (0.58367)	Top-1 acc 66.797 (64.725)	Top-5 acc 87.109 (84.504)	lr 0.00534
Train [84][920/3239]	Time 0.243 (1.323)	Data Time 0.002 (0.761)	Loss 2.6588 (2.4562)	Entropy 0.58240 (0.58366)	Top-1 acc 60.547 (64.719)	Top-5 acc 80.078 (84.498)	lr 0.00534
Train [84][930/3239]	Time 0.236 (1.313)	Data Time 0.001 (0.753)	Loss 2.5643 (2.4558)	Entropy 0.58218 (0.58365)	Top-1 acc 61.719 (64.729)	Top-5 acc 82.812 (84.508)	lr 0.00534
Train [84][940/3239]	Time 0.238 (1.303)	Data Time 0.001 (0.745)	Loss 2.4548 (2.4555)	Entropy 0.58194 (0.58363)	Top-1 acc 63.281 (64.739)	Top-5 acc 84.375 (84.511)	lr 0.00534
Train [84][950/3239]	Time 0.389 (1.294)	Data Time 0.002 (0.737)	Loss 2.2757 (2.4554)	Entropy 0.58224 (0.58361)	Top-1 acc 69.922 (64.730)	Top-5 acc 89.062 (84.519)	lr 0.00534
Train [84][960/3239]	Time 0.247 (1.285)	Data Time 0.001 (0.730)	Loss 2.5328 (2.4560)	Entropy 0.58248 (0.58360)	Top-1 acc 64.062 (64.719)	Top-5 acc 82.422 (84.508)	lr 0.00534
Train [84][970/3239]	Time 0.260 (1.276)	Data Time 0.002 (0.722)	Loss 2.3754 (2.4560)	Entropy 0.58255 (0.58359)	Top-1 acc 67.578 (64.717)	Top-5 acc 86.328 (84.513)	lr 0.00534
Train [84][980/3239]	Time 0.252 (1.276)	Data Time 0.001 (0.723)	Loss 2.3876 (2.4554)	Entropy 0.58253 (0.58358)	Top-1 acc 66.406 (64.723)	Top-5 acc 85.938 (84.532)	lr 0.00534
Train [84][990/3239]	Time 0.302 (1.268)	Data Time 0.003 (0.715)	Loss 2.2511 (2.4562)	Entropy 0.58251 (0.58357)	Top-1 acc 70.312 (64.714)	Top-5 acc 87.500 (84.519)	lr 0.00534
Train [84][1000/3239]	Time 0.230 (1.259)	Data Time 0.001 (0.708)	Loss 2.3811 (2.4564)	Entropy 0.58255 (0.58356)	Top-1 acc 70.312 (64.719)	Top-5 acc 85.156 (84.516)	lr 0.00534
Train [84][1010/3239]	Time 0.297 (1.264)	Data Time 0.003 (0.714)	Loss 2.5950 (2.4563)	Entropy 0.58270 (0.58355)	Top-1 acc 62.500 (64.727)	Top-5 acc 81.250 (84.519)	lr 0.00534
Train [84][1020/3239]	Time 0.421 (1.257)	Data Time 0.001 (0.708)	Loss 2.4436 (2.4558)	Entropy 0.58255 (0.58354)	Top-1 acc 63.672 (64.733)	Top-5 acc 83.203 (84.523)	lr 0.00534
Train [84][1030/3239]	Time 0.245 (1.249)	Data Time 0.001 (0.701)	Loss 2.3855 (2.4559)	Entropy 0.58254 (0.58353)	Top-1 acc 66.406 (64.726)	Top-5 acc 85.156 (84.526)	lr 0.00533
Train [84][1040/3239]	Time 0.253 (1.253)	Data Time 0.001 (0.706)	Loss 2.4480 (2.4553)	Entropy 0.58273 (0.58352)	Top-1 acc 65.234 (64.742)	Top-5 acc 85.547 (84.535)	lr 0.00533
Train [84][1050/3239]	Time 0.243 (1.245)	Data Time 0.001 (0.699)	Loss 2.5161 (2.4554)	Entropy 0.58292 (0.58351)	Top-1 acc 59.766 (64.731)	Top-5 acc 83.203 (84.531)	lr 0.00533
Train [84][1060/3239]	Time 0.233 (1.238)	Data Time 0.001 (0.693)	Loss 2.5778 (2.4548)	Entropy 0.58325 (0.58351)	Top-1 acc 60.547 (64.754)	Top-5 acc 82.031 (84.543)	lr 0.00533
Train [84][1070/3239]	Time 11.092 (1.240)	Data Time 10.852 (0.696)	Loss 2.6119 (2.4545)	Entropy 0.58303 (0.58350)	Top-1 acc 64.062 (64.766)	Top-5 acc 82.422 (84.542)	lr 0.00533
Train [84][1080/3239]	Time 0.286 (1.234)	Data Time 0.002 (0.691)	Loss 2.4139 (2.4547)	Entropy 0.58305 (0.58350)	Top-1 acc 64.453 (64.761)	Top-5 acc 86.328 (84.542)	lr 0.00533
Train [84][1090/3239]	Time 0.250 (1.227)	Data Time 0.001 (0.685)	Loss 2.6252 (2.4544)	Entropy 0.58302 (0.58350)	Top-1 acc 61.328 (64.776)	Top-5 acc 82.422 (84.547)	lr 0.00533
Train [84][1100/3239]	Time 0.260 (1.220)	Data Time 0.001 (0.679)	Loss 2.2540 (2.4548)	Entropy 0.58297 (0.58349)	Top-1 acc 71.094 (64.763)	Top-5 acc 87.500 (84.542)	lr 0.00533
Train [84][1110/3239]	Time 0.329 (1.225)	Data Time 0.001 (0.685)	Loss 2.3625 (2.4546)	Entropy 0.58309 (0.58349)	Top-1 acc 62.500 (64.766)	Top-5 acc 87.500 (84.544)	lr 0.00533
Train [84][1120/3239]	Time 0.234 (1.218)	Data Time 0.001 (0.679)	Loss 2.4234 (2.4547)	Entropy 0.58269 (0.58348)	Top-1 acc 66.797 (64.772)	Top-5 acc 86.328 (84.546)	lr 0.00533
Train [84][1130/3239]	Time 0.256 (1.212)	Data Time 0.001 (0.673)	Loss 2.4088 (2.4547)	Entropy 0.58245 (0.58347)	Top-1 acc 66.406 (64.775)	Top-5 acc 85.938 (84.544)	lr 0.00533
Train [84][1140/3239]	Time 0.248 (1.213)	Data Time 0.001 (0.675)	Loss 2.4236 (2.4544)	Entropy 0.58265 (0.58347)	Top-1 acc 66.016 (64.775)	Top-5 acc 85.156 (84.556)	lr 0.00533
Train [84][1150/3239]	Time 0.228 (1.207)	Data Time 0.001 (0.669)	Loss 2.4572 (2.4547)	Entropy 0.58278 (0.58346)	Top-1 acc 66.797 (64.777)	Top-5 acc 83.984 (84.547)	lr 0.00532
Train [84][1160/3239]	Time 0.237 (1.200)	Data Time 0.001 (0.664)	Loss 2.3599 (2.4544)	Entropy 0.58292 (0.58345)	Top-1 acc 67.188 (64.782)	Top-5 acc 85.938 (84.551)	lr 0.00532
Train [84][1170/3239]	Time 0.307 (1.200)	Data Time 0.002 (0.665)	Loss 2.4783 (2.4540)	Entropy 0.58302 (0.58345)	Top-1 acc 63.281 (64.798)	Top-5 acc 84.375 (84.556)	lr 0.00532
Train [84][1180/3239]	Time 0.342 (1.194)	Data Time 0.001 (0.659)	Loss 2.4293 (2.4539)	Entropy 0.58293 (0.58344)	Top-1 acc 65.625 (64.802)	Top-5 acc 85.547 (84.554)	lr 0.00532
Train [84][1190/3239]	Time 0.273 (1.188)	Data Time 0.001 (0.654)	Loss 2.3447 (2.4540)	Entropy 0.58281 (0.58344)	Top-1 acc 69.531 (64.805)	Top-5 acc 85.938 (84.554)	lr 0.00532
Train [84][1200/3239]	Time 0.250 (1.191)	Data Time 0.002 (0.658)	Loss 2.4621 (2.4541)	Entropy 0.58261 (0.58344)	Top-1 acc 60.938 (64.803)	Top-5 acc 85.938 (84.554)	lr 0.00532
Train [84][1210/3239]	Time 2.099 (1.187)	Data Time 1.847 (0.655)	Loss 2.4222 (2.4538)	Entropy 0.58264 (0.58343)	Top-1 acc 66.406 (64.811)	Top-5 acc 84.375 (84.560)	lr 0.00532
Train [84][1220/3239]	Time 0.253 (1.181)	Data Time 0.001 (0.649)	Loss 2.6243 (2.4542)	Entropy 0.58222 (0.58342)	Top-1 acc 60.156 (64.798)	Top-5 acc 83.984 (84.548)	lr 0.00532
Train [84][1230/3239]	Time 10.511 (1.183)	Data Time 10.241 (0.652)	Loss 2.4368 (2.4541)	Entropy 0.58191 (0.58341)	Top-1 acc 65.625 (64.803)	Top-5 acc 85.156 (84.551)	lr 0.00532
Train [84][1240/3239]	Time 0.284 (1.179)	Data Time 0.001 (0.649)	Loss 2.4360 (2.4543)	Entropy 0.58202 (0.58340)	Top-1 acc 62.891 (64.798)	Top-5 acc 85.156 (84.546)	lr 0.00532
Train [84][1250/3239]	Time 0.248 (1.175)	Data Time 0.002 (0.646)	Loss 2.5678 (2.4541)	Entropy 0.58216 (0.58339)	Top-1 acc 60.547 (64.790)	Top-5 acc 83.984 (84.551)	lr 0.00532
Train [84][1260/3239]	Time 0.255 (1.169)	Data Time 0.001 (0.641)	Loss 2.4088 (2.4545)	Entropy 0.58232 (0.58338)	Top-1 acc 64.453 (64.781)	Top-5 acc 83.984 (84.540)	lr 0.00532
Train [84][1270/3239]	Time 0.258 (1.173)	Data Time 0.001 (0.645)	Loss 2.3209 (2.4546)	Entropy 0.58213 (0.58337)	Top-1 acc 67.188 (64.773)	Top-5 acc 85.547 (84.543)	lr 0.00531
Train [84][1280/3239]	Time 0.263 (1.171)	Data Time 0.001 (0.643)	Loss 2.5124 (2.4546)	Entropy 0.58250 (0.58336)	Top-1 acc 62.891 (64.773)	Top-5 acc 84.766 (84.541)	lr 0.00531
Train [84][1290/3239]	Time 0.238 (1.165)	Data Time 0.001 (0.638)	Loss 2.3161 (2.4545)	Entropy 0.58232 (0.58335)	Top-1 acc 69.922 (64.782)	Top-5 acc 87.109 (84.543)	lr 0.00531
Train [84][1300/3239]	Time 0.234 (1.167)	Data Time 0.001 (0.641)	Loss 2.3982 (2.4544)	Entropy 0.58240 (0.58335)	Top-1 acc 66.797 (64.784)	Top-5 acc 83.984 (84.548)	lr 0.00531
Train [84][1310/3239]	Time 0.257 (1.164)	Data Time 0.002 (0.639)	Loss 2.4933 (2.4545)	Entropy 0.58269 (0.58334)	Top-1 acc 65.234 (64.780)	Top-5 acc 82.812 (84.545)	lr 0.00531
Train [84][1320/3239]	Time 0.238 (1.159)	Data Time 0.001 (0.634)	Loss 2.5443 (2.4547)	Entropy 0.58248 (0.58334)	Top-1 acc 62.891 (64.776)	Top-5 acc 83.984 (84.536)	lr 0.00531
Train [84][1330/3239]	Time 0.239 (1.162)	Data Time 0.001 (0.639)	Loss 2.5361 (2.4550)	Entropy 0.58236 (0.58333)	Top-1 acc 61.719 (64.768)	Top-5 acc 83.203 (84.541)	lr 0.00531
Train [84][1340/3239]	Time 0.926 (1.161)	Data Time 0.570 (0.638)	Loss 2.5545 (2.4552)	Entropy 0.58252 (0.58332)	Top-1 acc 62.891 (64.769)	Top-5 acc 82.422 (84.539)	lr 0.00531
Train [84][1350/3239]	Time 0.253 (1.156)	Data Time 0.001 (0.633)	Loss 2.3623 (2.4552)	Entropy 0.58252 (0.58332)	Top-1 acc 67.188 (64.774)	Top-5 acc 85.938 (84.540)	lr 0.00531
Train [84][1360/3239]	Time 0.251 (1.160)	Data Time 0.001 (0.638)	Loss 2.4226 (2.4552)	Entropy 0.58247 (0.58331)	Top-1 acc 67.188 (64.773)	Top-5 acc 84.375 (84.532)	lr 0.00531
Train [84][1370/3239]	Time 0.261 (1.155)	Data Time 0.001 (0.633)	Loss 2.3607 (2.4551)	Entropy 0.58213 (0.58330)	Top-1 acc 65.625 (64.776)	Top-5 acc 85.156 (84.531)	lr 0.00531
Train [84][1380/3239]	Time 0.251 (1.152)	Data Time 0.001 (0.631)	Loss 2.3323 (2.4554)	Entropy 0.58203 (0.58329)	Top-1 acc 69.531 (64.774)	Top-5 acc 85.938 (84.528)	lr 0.00531
Train [84][1390/3239]	Time 13.091 (1.156)	Data Time 12.804 (0.636)	Loss 2.5191 (2.4557)	Entropy 0.58220 (0.58328)	Top-1 acc 62.500 (64.768)	Top-5 acc 82.422 (84.525)	lr 0.00530
Train [84][1400/3239]	Time 0.276 (1.151)	Data Time 0.002 (0.632)	Loss 2.3887 (2.4558)	Entropy 0.58226 (0.58328)	Top-1 acc 67.969 (64.765)	Top-5 acc 85.156 (84.526)	lr 0.00530
Train [84][1410/3239]	Time 0.339 (1.149)	Data Time 0.001 (0.630)	Loss 2.4947 (2.4557)	Entropy 0.58222 (0.58327)	Top-1 acc 66.406 (64.777)	Top-5 acc 84.375 (84.531)	lr 0.00530
Train [84][1420/3239]	Time 0.237 (1.144)	Data Time 0.001 (0.626)	Loss 2.3900 (2.4561)	Entropy 0.58198 (0.58326)	Top-1 acc 65.234 (64.761)	Top-5 acc 84.766 (84.524)	lr 0.00530
Train [84][1430/3239]	Time 0.233 (1.147)	Data Time 0.001 (0.630)	Loss 2.5247 (2.4563)	Entropy 0.58187 (0.58325)	Top-1 acc 63.281 (64.757)	Top-5 acc 84.766 (84.525)	lr 0.00530
Train [84][1440/3239]	Time 0.239 (1.143)	Data Time 0.001 (0.626)	Loss 2.4970 (2.4568)	Entropy 0.58185 (0.58324)	Top-1 acc 66.797 (64.741)	Top-5 acc 83.984 (84.517)	lr 0.00530
Train [84][1450/3239]	Time 0.244 (1.138)	Data Time 0.002 (0.622)	Loss 2.3866 (2.4571)	Entropy 0.58168 (0.58323)	Top-1 acc 66.797 (64.736)	Top-5 acc 83.203 (84.513)	lr 0.00530
Train [84][1460/3239]	Time 0.270 (1.139)	Data Time 0.002 (0.623)	Loss 2.5426 (2.4573)	Entropy 0.58151 (0.58322)	Top-1 acc 63.281 (64.731)	Top-5 acc 83.203 (84.510)	lr 0.00530
Train [84][1470/3239]	Time 0.250 (1.134)	Data Time 0.001 (0.619)	Loss 2.3069 (2.4573)	Entropy 0.58187 (0.58321)	Top-1 acc 67.578 (64.727)	Top-5 acc 87.109 (84.512)	lr 0.00530
Train [84][1480/3239]	Time 0.241 (1.130)	Data Time 0.002 (0.615)	Loss 2.3732 (2.4569)	Entropy 0.58144 (0.58320)	Top-1 acc 66.797 (64.737)	Top-5 acc 85.547 (84.519)	lr 0.00530
Train [84][1490/3239]	Time 0.235 (1.133)	Data Time 0.001 (0.619)	Loss 2.2819 (2.4569)	Entropy 0.58132 (0.58319)	Top-1 acc 69.922 (64.735)	Top-5 acc 88.281 (84.519)	lr 0.00530
Train [84][1500/3239]	Time 0.357 (1.130)	Data Time 0.001 (0.616)	Loss 2.4737 (2.4571)	Entropy 0.58129 (0.58318)	Top-1 acc 64.453 (64.728)	Top-5 acc 85.547 (84.517)	lr 0.00530
Train [84][1510/3239]	Time 0.246 (1.126)	Data Time 0.001 (0.613)	Loss 2.4482 (2.4570)	Entropy 0.58131 (0.58316)	Top-1 acc 66.016 (64.731)	Top-5 acc 85.156 (84.516)	lr 0.00529
Train [84][1520/3239]	Time 0.274 (1.134)	Data Time 0.001 (0.622)	Loss 2.5575 (2.4569)	Entropy 0.58101 (0.58315)	Top-1 acc 59.375 (64.729)	Top-5 acc 83.594 (84.518)	lr 0.00529
Train [84][1530/3239]	Time 0.251 (1.130)	Data Time 0.001 (0.618)	Loss 2.1763 (2.4565)	Entropy 0.58115 (0.58314)	Top-1 acc 70.703 (64.731)	Top-5 acc 90.234 (84.528)	lr 0.00529
Train [84][1540/3239]	Time 0.252 (1.127)	Data Time 0.001 (0.615)	Loss 2.6964 (2.4567)	Entropy 0.58076 (0.58312)	Top-1 acc 58.984 (64.725)	Top-5 acc 82.031 (84.523)	lr 0.00529
Train [84][1550/3239]	Time 15.837 (1.132)	Data Time 15.570 (0.621)	Loss 2.1918 (2.4563)	Entropy 0.58058 (0.58311)	Top-1 acc 72.266 (64.731)	Top-5 acc 89.062 (84.534)	lr 0.00529
Train [84][1560/3239]	Time 0.232 (1.131)	Data Time 0.001 (0.621)	Loss 2.4568 (2.4562)	Entropy 0.58070 (0.58309)	Top-1 acc 66.016 (64.740)	Top-5 acc 84.375 (84.536)	lr 0.00529
Train [84][1570/3239]	Time 0.488 (1.162)	Data Time 0.004 (0.617)	Loss 2.3805 (2.4561)	Entropy 0.58061 (0.58308)	Top-1 acc 67.188 (64.745)	Top-5 acc 83.984 (84.539)	lr 0.00529
Train [84][1580/3239]	Time 0.258 (1.157)	Data Time 0.002 (0.613)	Loss 2.2408 (2.4560)	Entropy 0.58075 (0.58306)	Top-1 acc 69.531 (64.750)	Top-5 acc 89.062 (84.538)	lr 0.00529
Train [84][1590/3239]	Time 0.245 (1.153)	Data Time 0.002 (0.609)	Loss 2.3864 (2.4555)	Entropy 0.58093 (0.58305)	Top-1 acc 64.844 (64.761)	Top-5 acc 86.328 (84.545)	lr 0.00529
Train [84][1600/3239]	Time 0.257 (1.148)	Data Time 0.001 (0.605)	Loss 2.5483 (2.4557)	Entropy 0.58090 (0.58303)	Top-1 acc 62.891 (64.755)	Top-5 acc 81.641 (84.541)	lr 0.00529
Train [84][1610/3239]	Time 0.253 (1.144)	Data Time 0.002 (0.601)	Loss 2.9159 (2.4559)	Entropy 0.58086 (0.58302)	Top-1 acc 49.609 (64.750)	Top-5 acc 76.172 (84.537)	lr 0.00529
Train [84][1620/3239]	Time 0.254 (1.139)	Data Time 0.001 (0.598)	Loss 2.3652 (2.4563)	Entropy 0.58053 (0.58301)	Top-1 acc 68.359 (64.743)	Top-5 acc 86.719 (84.534)	lr 0.00529
Train [84][1630/3239]	Time 0.262 (1.135)	Data Time 0.001 (0.594)	Loss 2.3757 (2.4560)	Entropy 0.58052 (0.58299)	Top-1 acc 67.188 (64.747)	Top-5 acc 85.938 (84.541)	lr 0.00528
Train [84][1640/3239]	Time 0.252 (1.134)	Data Time 0.001 (0.593)	Loss 2.5752 (2.4560)	Entropy 0.58061 (0.58298)	Top-1 acc 58.594 (64.749)	Top-5 acc 83.984 (84.538)	lr 0.00528
Train [84][1650/3239]	Time 0.257 (1.132)	Data Time 0.001 (0.592)	Loss 2.3729 (2.4560)	Entropy 0.58068 (0.58296)	Top-1 acc 66.016 (64.751)	Top-5 acc 85.938 (84.538)	lr 0.00528
Train [84][1660/3239]	Time 0.362 (1.128)	Data Time 0.001 (0.588)	Loss 2.3699 (2.4558)	Entropy 0.58044 (0.58295)	Top-1 acc 66.406 (64.753)	Top-5 acc 86.328 (84.542)	lr 0.00528
Train [84][1670/3239]	Time 0.264 (1.134)	Data Time 0.002 (0.595)	Loss 2.5843 (2.4557)	Entropy 0.58081 (0.58293)	Top-1 acc 59.766 (64.749)	Top-5 acc 82.031 (84.545)	lr 0.00528
Train [84][1680/3239]	Time 0.239 (1.131)	Data Time 0.001 (0.593)	Loss 2.5406 (2.4559)	Entropy 0.58104 (0.58292)	Top-1 acc 60.938 (64.741)	Top-5 acc 85.547 (84.544)	lr 0.00528
Train [84][1690/3239]	Time 0.227 (1.129)	Data Time 0.001 (0.591)	Loss 2.5486 (2.4561)	Entropy 0.58104 (0.58291)	Top-1 acc 65.625 (64.744)	Top-5 acc 81.641 (84.539)	lr 0.00528
Train [84][1700/3239]	Time 0.243 (1.130)	Data Time 0.001 (0.593)	Loss 2.3279 (2.4560)	Entropy 0.58097 (0.58290)	Top-1 acc 70.312 (64.745)	Top-5 acc 87.109 (84.541)	lr 0.00528
Train [84][1710/3239]	Time 0.257 (1.128)	Data Time 0.001 (0.591)	Loss 2.7087 (2.4564)	Entropy 0.58096 (0.58289)	Top-1 acc 57.812 (64.742)	Top-5 acc 80.859 (84.533)	lr 0.00528
Train [84][1720/3239]	Time 0.243 (1.124)	Data Time 0.002 (0.587)	Loss 2.5503 (2.4567)	Entropy 0.58079 (0.58287)	Top-1 acc 66.016 (64.739)	Top-5 acc 80.469 (84.520)	lr 0.00528
Train [84][1730/3239]	Time 1.022 (1.126)	Data Time 0.639 (0.590)	Loss 2.2937 (2.4566)	Entropy 0.58044 (0.58286)	Top-1 acc 69.141 (64.740)	Top-5 acc 90.234 (84.527)	lr 0.00528
Train [84][1740/3239]	Time 0.233 (1.124)	Data Time 0.001 (0.589)	Loss 2.5455 (2.4570)	Entropy 0.58004 (0.58285)	Top-1 acc 66.016 (64.729)	Top-5 acc 81.641 (84.517)	lr 0.00528
Train [84][1750/3239]	Time 0.245 (1.122)	Data Time 0.001 (0.587)	Loss 2.4759 (2.4571)	Entropy 0.58017 (0.58283)	Top-1 acc 60.547 (64.724)	Top-5 acc 85.156 (84.517)	lr 0.00527
Train [84][1760/3239]	Time 5.766 (1.126)	Data Time 5.492 (0.592)	Loss 2.3868 (2.4571)	Entropy 0.58041 (0.58282)	Top-1 acc 67.188 (64.718)	Top-5 acc 86.328 (84.521)	lr 0.00527
Train [84][1770/3239]	Time 0.238 (1.125)	Data Time 0.001 (0.592)	Loss 2.4399 (2.4573)	Entropy 0.58036 (0.58280)	Top-1 acc 66.406 (64.711)	Top-5 acc 85.156 (84.516)	lr 0.00527
Train [84][1780/3239]	Time 0.229 (1.123)	Data Time 0.001 (0.590)	Loss 2.5330 (2.4577)	Entropy 0.58032 (0.58279)	Top-1 acc 62.109 (64.702)	Top-5 acc 83.203 (84.511)	lr 0.00527
Train [84][1790/3239]	Time 0.231 (1.124)	Data Time 0.001 (0.592)	Loss 2.4798 (2.4577)	Entropy 0.58050 (0.58278)	Top-1 acc 65.234 (64.706)	Top-5 acc 85.547 (84.508)	lr 0.00527
Train [84][1800/3239]	Time 0.248 (1.126)	Data Time 0.001 (0.594)	Loss 2.3133 (2.4574)	Entropy 0.58085 (0.58277)	Top-1 acc 69.141 (64.711)	Top-5 acc 87.109 (84.514)	lr 0.00527
Train [84][1810/3239]	Time 0.252 (1.124)	Data Time 0.001 (0.593)	Loss 2.5748 (2.4576)	Entropy 0.58082 (0.58275)	Top-1 acc 62.891 (64.700)	Top-5 acc 81.250 (84.513)	lr 0.00527
Train [84][1820/3239]	Time 0.358 (1.120)	Data Time 0.001 (0.590)	Loss 2.3842 (2.4573)	Entropy 0.58080 (0.58274)	Top-1 acc 66.016 (64.712)	Top-5 acc 86.719 (84.519)	lr 0.00527
Train [84][1830/3239]	Time 0.318 (1.127)	Data Time 0.001 (0.597)	Loss 2.4902 (2.4573)	Entropy 0.58086 (0.58273)	Top-1 acc 63.672 (64.711)	Top-5 acc 80.469 (84.517)	lr 0.00527
Train [84][1840/3239]	Time 0.250 (1.127)	Data Time 0.001 (0.597)	Loss 2.4265 (2.4574)	Entropy 0.58085 (0.58272)	Top-1 acc 65.234 (64.707)	Top-5 acc 84.375 (84.511)	lr 0.00527
Train [84][1850/3239]	Time 0.249 (1.123)	Data Time 0.001 (0.594)	Loss 2.3539 (2.4574)	Entropy 0.58104 (0.58271)	Top-1 acc 67.969 (64.713)	Top-5 acc 85.547 (84.514)	lr 0.00527
Train [84][1860/3239]	Time 1.903 (1.128)	Data Time 1.600 (0.599)	Loss 2.3327 (2.4574)	Entropy 0.58113 (0.58270)	Top-1 acc 65.625 (64.719)	Top-5 acc 86.719 (84.515)	lr 0.00527
Train [84][1870/3239]	Time 0.252 (1.126)	Data Time 0.001 (0.597)	Loss 2.3742 (2.4575)	Entropy 0.58120 (0.58270)	Top-1 acc 67.969 (64.719)	Top-5 acc 83.594 (84.511)	lr 0.00527
Train [84][1880/3239]	Time 3.235 (1.124)	Data Time 2.978 (0.596)	Loss 2.4339 (2.4578)	Entropy 0.58093 (0.58269)	Top-1 acc 65.234 (64.711)	Top-5 acc 86.328 (84.509)	lr 0.00526
Train [84][1890/3239]	Time 0.357 (1.127)	Data Time 0.001 (0.600)	Loss 2.4057 (2.4578)	Entropy 0.58073 (0.58268)	Top-1 acc 67.188 (64.713)	Top-5 acc 82.031 (84.506)	lr 0.00526
Train [84][1900/3239]	Time 0.237 (1.125)	Data Time 0.001 (0.598)	Loss 2.4376 (2.4578)	Entropy 0.58069 (0.58267)	Top-1 acc 66.797 (64.711)	Top-5 acc 83.203 (84.504)	lr 0.00526
Train [84][1910/3239]	Time 0.290 (1.125)	Data Time 0.002 (0.598)	Loss 2.4362 (2.4579)	Entropy 0.58064 (0.58266)	Top-1 acc 62.500 (64.706)	Top-5 acc 84.375 (84.500)	lr 0.00526
Train [84][1920/3239]	Time 6.646 (1.129)	Data Time 6.361 (0.602)	Loss 2.9220 (2.4583)	Entropy 0.58075 (0.58265)	Top-1 acc 57.031 (64.698)	Top-5 acc 77.344 (84.494)	lr 0.00526
Train [84][1930/3239]	Time 0.253 (1.127)	Data Time 0.001 (0.601)	Loss 2.3045 (2.4583)	Entropy 0.58108 (0.58264)	Top-1 acc 66.797 (64.694)	Top-5 acc 89.062 (84.496)	lr 0.00526
Train [84][1940/3239]	Time 0.235 (1.126)	Data Time 0.001 (0.601)	Loss 2.8045 (2.4584)	Entropy 0.58150 (0.58263)	Top-1 acc 57.422 (64.690)	Top-5 acc 77.344 (84.496)	lr 0.00526
Train [84][1950/3239]	Time 0.232 (1.126)	Data Time 0.001 (0.601)	Loss 2.3901 (2.4584)	Entropy 0.58123 (0.58262)	Top-1 acc 69.141 (64.696)	Top-5 acc 85.547 (84.499)	lr 0.00526
Train [84][1960/3239]	Time 0.242 (1.126)	Data Time 0.001 (0.602)	Loss 2.5569 (2.4584)	Entropy 0.58112 (0.58262)	Top-1 acc 65.234 (64.699)	Top-5 acc 84.766 (84.503)	lr 0.00526
Train [84][1970/3239]	Time 0.259 (1.128)	Data Time 0.001 (0.604)	Loss 2.4764 (2.4586)	Entropy 0.58138 (0.58261)	Top-1 acc 61.719 (64.692)	Top-5 acc 84.766 (84.499)	lr 0.00526
Train [84][1980/3239]	Time 0.241 (1.124)	Data Time 0.001 (0.601)	Loss 2.4276 (2.4585)	Entropy 0.58147 (0.58260)	Top-1 acc 66.016 (64.697)	Top-5 acc 85.156 (84.505)	lr 0.00526
Train [84][1990/3239]	Time 0.234 (1.126)	Data Time 0.001 (0.603)	Loss 2.3157 (2.4582)	Entropy 0.58129 (0.58260)	Top-1 acc 67.188 (64.700)	Top-5 acc 86.719 (84.513)	lr 0.00526
Train [84][2000/3239]	Time 0.274 (1.125)	Data Time 0.001 (0.603)	Loss 2.5364 (2.4583)	Entropy 0.58107 (0.58259)	Top-1 acc 67.578 (64.695)	Top-5 acc 83.203 (84.510)	lr 0.00525
Train [84][2010/3239]	Time 0.249 (1.122)	Data Time 0.001 (0.600)	Loss 2.4578 (2.4580)	Entropy 0.58091 (0.58258)	Top-1 acc 65.234 (64.699)	Top-5 acc 83.984 (84.518)	lr 0.00525
Train [84][2020/3239]	Time 0.238 (1.120)	Data Time 0.001 (0.599)	Loss 2.4352 (2.4582)	Entropy 0.58080 (0.58257)	Top-1 acc 64.453 (64.699)	Top-5 acc 85.156 (84.512)	lr 0.00525
Train [84][2030/3239]	Time 4.042 (1.119)	Data Time 3.793 (0.598)	Loss 2.3646 (2.4583)	Entropy 0.58082 (0.58256)	Top-1 acc 67.578 (64.699)	Top-5 acc 85.547 (84.512)	lr 0.00525
Train [84][2040/3239]	Time 0.302 (1.116)	Data Time 0.001 (0.595)	Loss 2.4084 (2.4582)	Entropy 0.58101 (0.58256)	Top-1 acc 62.891 (64.700)	Top-5 acc 85.156 (84.513)	lr 0.00525
Train [84][2050/3239]	Time 0.390 (1.114)	Data Time 0.002 (0.593)	Loss 2.2983 (2.4580)	Entropy 0.58100 (0.58255)	Top-1 acc 70.703 (64.705)	Top-5 acc 85.547 (84.516)	lr 0.00525
Train [84][2060/3239]	Time 0.229 (1.111)	Data Time 0.001 (0.590)	Loss 2.7175 (2.4580)	Entropy 0.58078 (0.58254)	Top-1 acc 58.594 (64.702)	Top-5 acc 78.906 (84.517)	lr 0.00525
Train [84][2070/3239]	Time 0.241 (1.110)	Data Time 0.002 (0.590)	Loss 2.1955 (2.4580)	Entropy 0.58075 (0.58253)	Top-1 acc 70.312 (64.703)	Top-5 acc 89.844 (84.516)	lr 0.00525
Train [84][2080/3239]	Time 1.684 (1.108)	Data Time 1.395 (0.588)	Loss 2.4104 (2.4582)	Entropy 0.58083 (0.58252)	Top-1 acc 64.453 (64.699)	Top-5 acc 85.156 (84.515)	lr 0.00525
Train [84][2090/3239]	Time 0.246 (1.105)	Data Time 0.001 (0.586)	Loss 2.4821 (2.4585)	Entropy 0.58112 (0.58251)	Top-1 acc 63.672 (64.688)	Top-5 acc 85.938 (84.511)	lr 0.00525
Train [84][2100/3239]	Time 0.228 (1.105)	Data Time 0.001 (0.586)	Loss 2.2733 (2.4583)	Entropy 0.58127 (0.58251)	Top-1 acc 67.188 (64.696)	Top-5 acc 88.672 (84.517)	lr 0.00525
Train [84][2110/3239]	Time 0.230 (1.102)	Data Time 0.001 (0.583)	Loss 2.4171 (2.4585)	Entropy 0.58119 (0.58250)	Top-1 acc 64.844 (64.692)	Top-5 acc 87.891 (84.514)	lr 0.00525
Train [84][2120/3239]	Time 0.315 (1.099)	Data Time 0.001 (0.581)	Loss 2.3864 (2.4583)	Entropy 0.58127 (0.58250)	Top-1 acc 65.625 (64.698)	Top-5 acc 84.375 (84.517)	lr 0.00524
Train [84][2130/3239]	Time 0.240 (1.099)	Data Time 0.001 (0.581)	Loss 2.3809 (2.4582)	Entropy 0.58149 (0.58249)	Top-1 acc 64.844 (64.706)	Top-5 acc 86.719 (84.521)	lr 0.00524
Train [84][2140/3239]	Time 0.230 (1.095)	Data Time 0.001 (0.578)	Loss 2.5719 (2.4581)	Entropy 0.58172 (0.58249)	Top-1 acc 62.109 (64.710)	Top-5 acc 82.812 (84.524)	lr 0.00524
Train [84][2150/3239]	Time 0.247 (1.094)	Data Time 0.001 (0.577)	Loss 2.5254 (2.4581)	Entropy 0.58178 (0.58248)	Top-1 acc 62.109 (64.713)	Top-5 acc 82.031 (84.526)	lr 0.00524
Train [84][2160/3239]	Time 0.246 (1.094)	Data Time 0.001 (0.577)	Loss 2.5508 (2.4580)	Entropy 0.58167 (0.58248)	Top-1 acc 61.719 (64.716)	Top-5 acc 82.031 (84.525)	lr 0.00524
Train [84][2170/3239]	Time 0.224 (1.091)	Data Time 0.001 (0.575)	Loss 2.6374 (2.4583)	Entropy 0.58164 (0.58248)	Top-1 acc 60.156 (64.710)	Top-5 acc 78.125 (84.522)	lr 0.00524
Train [84][2180/3239]	Time 0.242 (1.089)	Data Time 0.001 (0.574)	Loss 2.4541 (2.4581)	Entropy 0.58170 (0.58247)	Top-1 acc 66.406 (64.715)	Top-5 acc 85.547 (84.527)	lr 0.00524
Train [84][2190/3239]	Time 6.451 (1.089)	Data Time 6.196 (0.574)	Loss 2.4061 (2.4580)	Entropy 0.58173 (0.58247)	Top-1 acc 64.453 (64.712)	Top-5 acc 86.719 (84.532)	lr 0.00524
Train [84][2200/3239]	Time 0.238 (1.086)	Data Time 0.001 (0.572)	Loss 2.4712 (2.4580)	Entropy 0.58177 (0.58246)	Top-1 acc 62.891 (64.709)	Top-5 acc 84.766 (84.533)	lr 0.00524
Train [84][2210/3239]	Time 0.453 (1.085)	Data Time 0.002 (0.570)	Loss 2.7160 (2.4582)	Entropy 0.58168 (0.58246)	Top-1 acc 60.547 (64.708)	Top-5 acc 81.641 (84.529)	lr 0.00524
Train [84][2220/3239]	Time 0.274 (1.106)	Data Time 0.005 (0.568)	Loss 2.5570 (2.4584)	Entropy 0.58168 (0.58246)	Top-1 acc 58.984 (64.701)	Top-5 acc 82.422 (84.522)	lr 0.00524
Train [84][2230/3239]	Time 0.237 (1.103)	Data Time 0.002 (0.565)	Loss 2.5509 (2.4584)	Entropy 0.58199 (0.58245)	Top-1 acc 64.062 (64.705)	Top-5 acc 80.859 (84.519)	lr 0.00524
Train [84][2240/3239]	Time 0.254 (1.100)	Data Time 0.002 (0.563)	Loss 2.3911 (2.4586)	Entropy 0.58166 (0.58245)	Top-1 acc 66.797 (64.700)	Top-5 acc 87.500 (84.518)	lr 0.00523
Train [84][2250/3239]	Time 0.264 (1.097)	Data Time 0.002 (0.560)	Loss 2.4310 (2.4585)	Entropy 0.58126 (0.58245)	Top-1 acc 63.281 (64.701)	Top-5 acc 83.203 (84.519)	lr 0.00523
Train [84][2260/3239]	Time 0.253 (1.095)	Data Time 0.001 (0.558)	Loss 2.6397 (2.4586)	Entropy 0.58148 (0.58244)	Top-1 acc 59.766 (64.700)	Top-5 acc 81.641 (84.518)	lr 0.00523
Train [84][2270/3239]	Time 0.241 (1.092)	Data Time 0.001 (0.555)	Loss 2.3600 (2.4584)	Entropy 0.58142 (0.58244)	Top-1 acc 67.578 (64.706)	Top-5 acc 85.938 (84.521)	lr 0.00523
Train [84][2280/3239]	Time 0.342 (1.089)	Data Time 0.001 (0.553)	Loss 2.5589 (2.4586)	Entropy 0.58144 (0.58243)	Top-1 acc 64.453 (64.700)	Top-5 acc 84.375 (84.518)	lr 0.00523
Train [84][2290/3239]	Time 0.249 (1.086)	Data Time 0.002 (0.551)	Loss 2.4907 (2.4588)	Entropy 0.58141 (0.58243)	Top-1 acc 63.281 (64.696)	Top-5 acc 83.203 (84.509)	lr 0.00523
Train [84][2300/3239]	Time 0.248 (1.083)	Data Time 0.001 (0.548)	Loss 2.5876 (2.4587)	Entropy 0.58164 (0.58243)	Top-1 acc 59.766 (64.697)	Top-5 acc 81.641 (84.511)	lr 0.00523
Train [84][2310/3239]	Time 0.250 (1.080)	Data Time 0.001 (0.546)	Loss 2.6215 (2.4588)	Entropy 0.58165 (0.58242)	Top-1 acc 62.500 (64.693)	Top-5 acc 79.297 (84.508)	lr 0.00523
Train [84][2320/3239]	Time 0.283 (1.078)	Data Time 0.002 (0.544)	Loss 2.5296 (2.4587)	Entropy 0.58173 (0.58242)	Top-1 acc 61.328 (64.692)	Top-5 acc 82.422 (84.511)	lr 0.00523
Train [84][2330/3239]	Time 0.247 (1.076)	Data Time 0.001 (0.542)	Loss 2.6682 (2.4584)	Entropy 0.58191 (0.58242)	Top-1 acc 58.594 (64.700)	Top-5 acc 79.688 (84.516)	lr 0.00523
Train [84][2340/3239]	Time 0.240 (1.075)	Data Time 0.001 (0.541)	Loss 2.3982 (2.4582)	Entropy 0.58213 (0.58242)	Top-1 acc 64.453 (64.707)	Top-5 acc 85.938 (84.523)	lr 0.00523
Train [84][2350/3239]	Time 0.254 (1.073)	Data Time 0.001 (0.540)	Loss 2.3874 (2.4584)	Entropy 0.58200 (0.58241)	Top-1 acc 64.062 (64.705)	Top-5 acc 87.109 (84.520)	lr 0.00523
Train [84][2360/3239]	Time 0.239 (1.073)	Data Time 0.001 (0.540)	Loss 2.5972 (2.4581)	Entropy 0.58194 (0.58241)	Top-1 acc 65.625 (64.717)	Top-5 acc 81.250 (84.524)	lr 0.00522
Train [84][2370/3239]	Time 0.393 (1.072)	Data Time 0.001 (0.540)	Loss 2.5265 (2.4582)	Entropy 0.58206 (0.58241)	Top-1 acc 63.672 (64.717)	Top-5 acc 84.375 (84.521)	lr 0.00522
Train [84][2380/3239]	Time 0.244 (1.069)	Data Time 0.002 (0.537)	Loss 2.8489 (2.4583)	Entropy 0.58187 (0.58241)	Top-1 acc 58.984 (64.713)	Top-5 acc 78.906 (84.517)	lr 0.00522
Train [84][2390/3239]	Time 3.146 (1.068)	Data Time 2.899 (0.537)	Loss 2.4687 (2.4585)	Entropy 0.58189 (0.58241)	Top-1 acc 65.625 (64.710)	Top-5 acc 83.203 (84.514)	lr 0.00522
Train [84][2400/3239]	Time 0.254 (1.067)	Data Time 0.001 (0.536)	Loss 2.5395 (2.4587)	Entropy 0.58175 (0.58240)	Top-1 acc 62.500 (64.707)	Top-5 acc 82.812 (84.510)	lr 0.00522
Train [84][2410/3239]	Time 0.244 (1.064)	Data Time 0.001 (0.533)	Loss 2.6398 (2.4586)	Entropy 0.58177 (0.58240)	Top-1 acc 60.938 (64.712)	Top-5 acc 78.906 (84.511)	lr 0.00522
Train [84][2420/3239]	Time 0.243 (1.063)	Data Time 0.001 (0.533)	Loss 2.5801 (2.4588)	Entropy 0.58197 (0.58240)	Top-1 acc 61.719 (64.706)	Top-5 acc 81.250 (84.507)	lr 0.00522
Train [84][2430/3239]	Time 0.264 (1.062)	Data Time 0.001 (0.532)	Loss 2.4874 (2.4587)	Entropy 0.58194 (0.58240)	Top-1 acc 65.625 (64.707)	Top-5 acc 81.641 (84.507)	lr 0.00522
Train [84][2440/3239]	Time 0.363 (1.060)	Data Time 0.001 (0.530)	Loss 2.4056 (2.4589)	Entropy 0.58199 (0.58240)	Top-1 acc 66.016 (64.700)	Top-5 acc 85.156 (84.503)	lr 0.00522
Train [84][2450/3239]	Time 0.235 (1.060)	Data Time 0.001 (0.531)	Loss 2.5554 (2.4592)	Entropy 0.58210 (0.58239)	Top-1 acc 61.719 (64.697)	Top-5 acc 82.031 (84.498)	lr 0.00522
Train [84][2460/3239]	Time 0.225 (1.059)	Data Time 0.001 (0.530)	Loss 2.7704 (2.4591)	Entropy 0.58193 (0.58239)	Top-1 acc 60.156 (64.697)	Top-5 acc 78.516 (84.500)	lr 0.00522
Train [84][2470/3239]	Time 0.240 (1.056)	Data Time 0.001 (0.528)	Loss 2.2919 (2.4590)	Entropy 0.58176 (0.58239)	Top-1 acc 68.359 (64.704)	Top-5 acc 88.672 (84.502)	lr 0.00522
Train [84][2480/3239]	Time 0.257 (1.054)	Data Time 0.001 (0.526)	Loss 2.2473 (2.4588)	Entropy 0.58200 (0.58239)	Top-1 acc 69.531 (64.711)	Top-5 acc 90.234 (84.506)	lr 0.00521
Train [84][2490/3239]	Time 0.233 (1.055)	Data Time 0.001 (0.527)	Loss 2.7234 (2.4589)	Entropy 0.58237 (0.58239)	Top-1 acc 58.203 (64.709)	Top-5 acc 80.469 (84.502)	lr 0.00521
Train [84][2500/3239]	Time 0.249 (1.053)	Data Time 0.001 (0.526)	Loss 2.3643 (2.4591)	Entropy 0.58255 (0.58239)	Top-1 acc 67.578 (64.700)	Top-5 acc 85.156 (84.500)	lr 0.00521
Train [84][2510/3239]	Time 0.237 (1.051)	Data Time 0.001 (0.524)	Loss 2.3124 (2.4591)	Entropy 0.58235 (0.58239)	Top-1 acc 67.969 (64.701)	Top-5 acc 87.109 (84.498)	lr 0.00521
Train [84][2520/3239]	Time 0.217 (1.051)	Data Time 0.001 (0.524)	Loss 2.6344 (2.4591)	Entropy 0.58242 (0.58239)	Top-1 acc 59.766 (64.700)	Top-5 acc 82.812 (84.500)	lr 0.00521
Train [84][2530/3239]	Time 0.273 (1.050)	Data Time 0.001 (0.523)	Loss 2.4083 (2.4588)	Entropy 0.58213 (0.58239)	Top-1 acc 65.625 (64.705)	Top-5 acc 85.547 (84.502)	lr 0.00521
Train [84][2540/3239]	Time 0.234 (1.047)	Data Time 0.001 (0.521)	Loss 2.4770 (2.4591)	Entropy 0.58184 (0.58239)	Top-1 acc 65.625 (64.703)	Top-5 acc 82.422 (84.493)	lr 0.00521
Train [84][2550/3239]	Time 0.254 (1.046)	Data Time 0.001 (0.520)	Loss 2.5673 (2.4590)	Entropy 0.58148 (0.58238)	Top-1 acc 57.812 (64.704)	Top-5 acc 82.812 (84.495)	lr 0.00521
Train [84][2560/3239]	Time 0.282 (1.046)	Data Time 0.002 (0.521)	Loss 2.5109 (2.4590)	Entropy 0.58155 (0.58238)	Top-1 acc 62.109 (64.702)	Top-5 acc 84.766 (84.497)	lr 0.00521
Train [84][2570/3239]	Time 0.259 (1.043)	Data Time 0.001 (0.519)	Loss 2.4215 (2.4588)	Entropy 0.58166 (0.58238)	Top-1 acc 64.453 (64.704)	Top-5 acc 86.328 (84.504)	lr 0.00521
Train [84][2580/3239]	Time 0.245 (1.042)	Data Time 0.001 (0.518)	Loss 2.4625 (2.4586)	Entropy 0.58204 (0.58237)	Top-1 acc 66.797 (64.710)	Top-5 acc 82.812 (84.507)	lr 0.00521
Train [84][2590/3239]	Time 0.229 (1.042)	Data Time 0.001 (0.518)	Loss 2.4325 (2.4584)	Entropy 0.58228 (0.58237)	Top-1 acc 66.016 (64.714)	Top-5 acc 82.812 (84.509)	lr 0.00521
Train [84][2600/3239]	Time 0.356 (1.040)	Data Time 0.001 (0.516)	Loss 2.4879 (2.4584)	Entropy 0.58282 (0.58237)	Top-1 acc 64.453 (64.716)	Top-5 acc 85.938 (84.508)	lr 0.00521
Train [84][2610/3239]	Time 0.234 (1.039)	Data Time 0.001 (0.515)	Loss 2.5910 (2.4583)	Entropy 0.58288 (0.58237)	Top-1 acc 59.766 (64.718)	Top-5 acc 83.594 (84.508)	lr 0.00520
Train [84][2620/3239]	Time 0.231 (1.040)	Data Time 0.001 (0.516)	Loss 2.3751 (2.4582)	Entropy 0.58291 (0.58238)	Top-1 acc 64.062 (64.718)	Top-5 acc 85.938 (84.511)	lr 0.00520
Train [84][2630/3239]	Time 0.231 (1.037)	Data Time 0.001 (0.515)	Loss 2.5269 (2.4585)	Entropy 0.58280 (0.58238)	Top-1 acc 64.844 (64.711)	Top-5 acc 85.156 (84.506)	lr 0.00520
Train [84][2640/3239]	Time 0.234 (1.035)	Data Time 0.001 (0.513)	Loss 2.4446 (2.4586)	Entropy 0.58290 (0.58238)	Top-1 acc 62.500 (64.709)	Top-5 acc 84.375 (84.504)	lr 0.00520
Train [84][2650/3239]	Time 0.231 (1.034)	Data Time 0.001 (0.512)	Loss 2.5071 (2.4586)	Entropy 0.58287 (0.58238)	Top-1 acc 64.453 (64.710)	Top-5 acc 83.203 (84.504)	lr 0.00520
Train [84][2660/3239]	Time 0.225 (1.035)	Data Time 0.001 (0.513)	Loss 2.5205 (2.4590)	Entropy 0.58295 (0.58238)	Top-1 acc 64.453 (64.701)	Top-5 acc 83.203 (84.495)	lr 0.00520
Train [84][2670/3239]	Time 0.359 (1.032)	Data Time 0.001 (0.511)	Loss 2.5165 (2.4590)	Entropy 0.58315 (0.58239)	Top-1 acc 66.016 (64.699)	Top-5 acc 82.812 (84.493)	lr 0.00520
Train [84][2680/3239]	Time 0.239 (1.031)	Data Time 0.001 (0.511)	Loss 2.4022 (2.4587)	Entropy 0.58315 (0.58239)	Top-1 acc 62.109 (64.707)	Top-5 acc 86.719 (84.500)	lr 0.00520
Train [84][2690/3239]	Time 1.159 (1.031)	Data Time 0.919 (0.511)	Loss 2.3851 (2.4585)	Entropy 0.58322 (0.58239)	Top-1 acc 66.016 (64.712)	Top-5 acc 84.375 (84.502)	lr 0.00520
Train [84][2700/3239]	Time 0.263 (1.029)	Data Time 0.001 (0.509)	Loss 2.6136 (2.4587)	Entropy 0.58315 (0.58240)	Top-1 acc 60.156 (64.709)	Top-5 acc 83.203 (84.497)	lr 0.00520
Train [84][2710/3239]	Time 0.589 (1.027)	Data Time 0.348 (0.508)	Loss 2.4158 (2.4586)	Entropy 0.58326 (0.58240)	Top-1 acc 63.672 (64.711)	Top-5 acc 85.938 (84.500)	lr 0.00520
Train [84][2720/3239]	Time 0.250 (1.028)	Data Time 0.001 (0.509)	Loss 2.9116 (2.4586)	Entropy 0.58352 (0.58240)	Top-1 acc 53.516 (64.709)	Top-5 acc 75.391 (84.499)	lr 0.00520
Train [84][2730/3239]	Time 0.246 (1.026)	Data Time 0.001 (0.507)	Loss 2.3444 (2.4585)	Entropy 0.58389 (0.58241)	Top-1 acc 67.578 (64.711)	Top-5 acc 83.984 (84.500)	lr 0.00519
Train [84][2740/3239]	Time 0.307 (1.024)	Data Time 0.002 (0.505)	Loss 2.4788 (2.4585)	Entropy 0.58365 (0.58241)	Top-1 acc 64.844 (64.709)	Top-5 acc 85.156 (84.501)	lr 0.00519
Train [84][2750/3239]	Time 0.272 (1.025)	Data Time 0.001 (0.507)	Loss 2.5165 (2.4586)	Entropy 0.58390 (0.58242)	Top-1 acc 62.109 (64.705)	Top-5 acc 85.547 (84.500)	lr 0.00519
Train [84][2760/3239]	Time 0.341 (1.023)	Data Time 0.001 (0.505)	Loss 2.3316 (2.4587)	Entropy 0.58424 (0.58242)	Top-1 acc 67.578 (64.702)	Top-5 acc 87.891 (84.499)	lr 0.00519
Train [84][2770/3239]	Time 0.226 (1.022)	Data Time 0.001 (0.504)	Loss 2.5411 (2.4586)	Entropy 0.58443 (0.58243)	Top-1 acc 64.062 (64.707)	Top-5 acc 85.156 (84.501)	lr 0.00519
Train [84][2780/3239]	Time 0.231 (1.023)	Data Time 0.001 (0.505)	Loss 2.4594 (2.4586)	Entropy 0.58441 (0.58244)	Top-1 acc 67.578 (64.706)	Top-5 acc 83.984 (84.499)	lr 0.00519
Train [84][2790/3239]	Time 0.261 (1.021)	Data Time 0.001 (0.503)	Loss 2.4317 (2.4586)	Entropy 0.58463 (0.58244)	Top-1 acc 64.844 (64.703)	Top-5 acc 84.375 (84.499)	lr 0.00519
Train [84][2800/3239]	Time 0.274 (1.019)	Data Time 0.001 (0.501)	Loss 2.4456 (2.4588)	Entropy 0.58456 (0.58245)	Top-1 acc 62.891 (64.701)	Top-5 acc 85.547 (84.497)	lr 0.00519
Train [84][2810/3239]	Time 0.277 (1.018)	Data Time 0.001 (0.501)	Loss 2.2455 (2.4584)	Entropy 0.58478 (0.58246)	Top-1 acc 66.797 (64.708)	Top-5 acc 90.234 (84.502)	lr 0.00519
Train [84][2820/3239]	Time 0.253 (1.018)	Data Time 0.001 (0.501)	Loss 2.5890 (2.4586)	Entropy 0.58474 (0.58247)	Top-1 acc 61.719 (64.703)	Top-5 acc 82.812 (84.498)	lr 0.00519
Train [84][2830/3239]	Time 0.328 (1.015)	Data Time 0.001 (0.499)	Loss 2.6427 (2.4585)	Entropy 0.58492 (0.58248)	Top-1 acc 60.547 (64.707)	Top-5 acc 79.688 (84.501)	lr 0.00519
Train [84][2840/3239]	Time 0.238 (1.016)	Data Time 0.001 (0.500)	Loss 2.7197 (2.4586)	Entropy 0.58484 (0.58249)	Top-1 acc 56.641 (64.699)	Top-5 acc 82.812 (84.501)	lr 0.00519
Train [84][2850/3239]	Time 0.233 (1.016)	Data Time 0.001 (0.500)	Loss 2.4141 (2.4586)	Entropy 0.58487 (0.58249)	Top-1 acc 66.406 (64.700)	Top-5 acc 87.109 (84.504)	lr 0.00518
Train [84][2860/3239]	Time 0.235 (1.014)	Data Time 0.001 (0.498)	Loss 2.4279 (2.4586)	Entropy 0.58480 (0.58250)	Top-1 acc 64.844 (64.701)	Top-5 acc 85.547 (84.505)	lr 0.00518
Train [84][2870/3239]	Time 1.890 (1.013)	Data Time 1.629 (0.498)	Loss 2.5459 (2.4585)	Entropy 0.58481 (0.58251)	Top-1 acc 62.891 (64.704)	Top-5 acc 82.812 (84.507)	lr 0.00518
Train [84][2880/3239]	Time 0.298 (1.031)	Data Time 0.003 (0.497)	Loss 2.3701 (2.4587)	Entropy 0.58495 (0.58252)	Top-1 acc 64.453 (64.699)	Top-5 acc 86.328 (84.504)	lr 0.00518
Train [84][2890/3239]	Time 0.241 (1.029)	Data Time 0.002 (0.496)	Loss 2.5213 (2.4585)	Entropy 0.58524 (0.58253)	Top-1 acc 62.891 (64.700)	Top-5 acc 83.594 (84.508)	lr 0.00518
Train [84][2900/3239]	Time 0.242 (1.027)	Data Time 0.001 (0.494)	Loss 2.3597 (2.4585)	Entropy 0.58505 (0.58254)	Top-1 acc 69.531 (64.700)	Top-5 acc 83.984 (84.508)	lr 0.00518
Train [84][2910/3239]	Time 0.289 (1.025)	Data Time 0.003 (0.492)	Loss 2.3870 (2.4584)	Entropy 0.58474 (0.58254)	Top-1 acc 64.844 (64.698)	Top-5 acc 84.766 (84.507)	lr 0.00518
Train [84][2920/3239]	Time 0.334 (1.023)	Data Time 0.002 (0.491)	Loss 2.3476 (2.4583)	Entropy 0.58461 (0.58255)	Top-1 acc 66.797 (64.697)	Top-5 acc 86.719 (84.511)	lr 0.00518
Train [84][2930/3239]	Time 0.276 (1.021)	Data Time 0.002 (0.489)	Loss 2.3098 (2.4582)	Entropy 0.58466 (0.58256)	Top-1 acc 68.359 (64.697)	Top-5 acc 88.672 (84.511)	lr 0.00518
Train [84][2940/3239]	Time 0.246 (1.019)	Data Time 0.001 (0.487)	Loss 2.4943 (2.4583)	Entropy 0.58442 (0.58257)	Top-1 acc 62.891 (64.693)	Top-5 acc 84.766 (84.511)	lr 0.00518
Train [84][2950/3239]	Time 0.317 (1.017)	Data Time 0.003 (0.486)	Loss 2.5204 (2.4584)	Entropy 0.58427 (0.58257)	Top-1 acc 64.453 (64.690)	Top-5 acc 83.594 (84.508)	lr 0.00518
Train [84][2960/3239]	Time 0.246 (1.016)	Data Time 0.001 (0.484)	Loss 2.4019 (2.4584)	Entropy 0.58427 (0.58258)	Top-1 acc 64.844 (64.690)	Top-5 acc 84.766 (84.511)	lr 0.00518
Train [84][2970/3239]	Time 0.249 (1.014)	Data Time 0.001 (0.482)	Loss 2.2580 (2.4583)	Entropy 0.58423 (0.58258)	Top-1 acc 72.266 (64.691)	Top-5 acc 84.766 (84.513)	lr 0.00517
Train [84][2980/3239]	Time 0.266 (1.014)	Data Time 0.001 (0.483)	Loss 2.3070 (2.4581)	Entropy 0.58438 (0.58259)	Top-1 acc 67.578 (64.696)	Top-5 acc 88.281 (84.518)	lr 0.00517
Train [84][2990/3239]	Time 0.360 (1.013)	Data Time 0.001 (0.483)	Loss 2.4376 (2.4581)	Entropy 0.58432 (0.58260)	Top-1 acc 66.797 (64.696)	Top-5 acc 84.766 (84.520)	lr 0.00517
Train [84][3000/3239]	Time 0.240 (1.012)	Data Time 0.001 (0.481)	Loss 2.6463 (2.4583)	Entropy 0.58458 (0.58260)	Top-1 acc 62.109 (64.688)	Top-5 acc 81.641 (84.515)	lr 0.00517
Train [84][3010/3239]	Time 0.242 (1.012)	Data Time 0.001 (0.482)	Loss 2.7114 (2.4586)	Entropy 0.58452 (0.58261)	Top-1 acc 58.984 (64.685)	Top-5 acc 78.906 (84.511)	lr 0.00517
Train [84][3020/3239]	Time 0.306 (1.012)	Data Time 0.001 (0.482)	Loss 2.4287 (2.4585)	Entropy 0.58467 (0.58261)	Top-1 acc 63.672 (64.688)	Top-5 acc 83.594 (84.511)	lr 0.00517
Train [84][3030/3239]	Time 0.249 (1.010)	Data Time 0.001 (0.481)	Loss 2.4709 (2.4586)	Entropy 0.58469 (0.58262)	Top-1 acc 67.188 (64.684)	Top-5 acc 85.547 (84.509)	lr 0.00517
Train [84][3040/3239]	Time 0.243 (1.010)	Data Time 0.002 (0.481)	Loss 2.7038 (2.4589)	Entropy 0.58495 (0.58263)	Top-1 acc 54.688 (64.679)	Top-5 acc 82.812 (84.506)	lr 0.00517
Train [84][3050/3239]	Time 0.241 (1.010)	Data Time 0.001 (0.481)	Loss 2.4434 (2.4586)	Entropy 0.58510 (0.58264)	Top-1 acc 65.625 (64.685)	Top-5 acc 84.375 (84.509)	lr 0.00517
Train [84][3060/3239]	Time 0.265 (1.009)	Data Time 0.001 (0.480)	Loss 2.5767 (2.4586)	Entropy 0.58506 (0.58264)	Top-1 acc 62.891 (64.684)	Top-5 acc 80.859 (84.510)	lr 0.00517
Train [84][3070/3239]	Time 0.267 (1.007)	Data Time 0.001 (0.479)	Loss 2.4792 (2.4585)	Entropy 0.58526 (0.58265)	Top-1 acc 61.328 (64.685)	Top-5 acc 83.984 (84.514)	lr 0.00517
Train [84][3080/3239]	Time 2.472 (1.008)	Data Time 2.118 (0.480)	Loss 2.4137 (2.4584)	Entropy 0.58529 (0.58266)	Top-1 acc 67.188 (64.690)	Top-5 acc 85.938 (84.515)	lr 0.00517
Train [84][3090/3239]	Time 0.240 (1.007)	Data Time 0.001 (0.479)	Loss 2.4817 (2.4585)	Entropy 0.58518 (0.58267)	Top-1 acc 64.453 (64.688)	Top-5 acc 81.250 (84.514)	lr 0.00516
Train [84][3100/3239]	Time 0.252 (1.005)	Data Time 0.002 (0.478)	Loss 2.5692 (2.4584)	Entropy 0.58514 (0.58268)	Top-1 acc 62.891 (64.693)	Top-5 acc 82.031 (84.517)	lr 0.00516
Train [84][3110/3239]	Time 0.262 (1.005)	Data Time 0.001 (0.477)	Loss 2.4673 (2.4585)	Entropy 0.58531 (0.58269)	Top-1 acc 64.844 (64.691)	Top-5 acc 83.984 (84.515)	lr 0.00516
Train [84][3120/3239]	Time 0.238 (1.006)	Data Time 0.001 (0.478)	Loss 2.3465 (2.4584)	Entropy 0.58561 (0.58269)	Top-1 acc 65.625 (64.690)	Top-5 acc 85.156 (84.518)	lr 0.00516
Train [84][3130/3239]	Time 0.256 (1.004)	Data Time 0.001 (0.477)	Loss 2.4213 (2.4584)	Entropy 0.58567 (0.58270)	Top-1 acc 65.234 (64.688)	Top-5 acc 82.812 (84.517)	lr 0.00516
Train [84][3140/3239]	Time 0.268 (1.003)	Data Time 0.001 (0.476)	Loss 2.5806 (2.4586)	Entropy 0.58579 (0.58271)	Top-1 acc 61.328 (64.686)	Top-5 acc 84.766 (84.513)	lr 0.00516
Train [84][3150/3239]	Time 0.400 (1.003)	Data Time 0.002 (0.476)	Loss 2.8176 (2.4590)	Entropy 0.58606 (0.58272)	Top-1 acc 56.250 (64.676)	Top-5 acc 79.297 (84.506)	lr 0.00516
Train [84][3160/3239]	Time 0.245 (1.002)	Data Time 0.001 (0.476)	Loss 2.2705 (2.4589)	Entropy 0.58585 (0.58273)	Top-1 acc 68.359 (64.675)	Top-5 acc 88.281 (84.509)	lr 0.00516
Train [84][3170/3239]	Time 0.245 (1.001)	Data Time 0.001 (0.475)	Loss 2.3551 (2.4588)	Entropy 0.58586 (0.58274)	Top-1 acc 67.578 (64.680)	Top-5 acc 86.719 (84.510)	lr 0.00516
Train [84][3180/3239]	Time 0.239 (1.001)	Data Time 0.000 (0.475)	Loss 2.5195 (2.4588)	Entropy 0.58579 (0.58275)	Top-1 acc 64.844 (64.681)	Top-5 acc 84.375 (84.508)	lr 0.00516
Train [84][3190/3239]	Time 0.237 (1.001)	Data Time 0.000 (0.476)	Loss 2.5053 (2.4589)	Entropy 0.58567 (0.58276)	Top-1 acc 61.719 (64.676)	Top-5 acc 83.984 (84.506)	lr 0.00516
Train [84][3200/3239]	Time 0.239 (1.000)	Data Time 0.000 (0.475)	Loss 2.5428 (2.4589)	Entropy 0.58574 (0.58277)	Top-1 acc 62.109 (64.676)	Top-5 acc 84.375 (84.506)	lr 0.00516
Train [84][3210/3239]	Time 0.251 (1.000)	Data Time 0.000 (0.475)	Loss 2.4443 (2.4590)	Entropy 0.58586 (0.58278)	Top-1 acc 64.844 (64.676)	Top-5 acc 87.109 (84.505)	lr 0.00516
Train [84][3220/3239]	Time 0.235 (0.998)	Data Time 0.000 (0.474)	Loss 2.3911 (2.4588)	Entropy 0.58591 (0.58279)	Top-1 acc 62.891 (64.681)	Top-5 acc 86.719 (84.508)	lr 0.00515
Train [84][3230/3239]	Time 0.229 (0.996)	Data Time 0.000 (0.473)	Loss 2.7480 (2.4590)	Entropy 0.58595 (0.58280)	Top-1 acc 60.547 (64.675)	Top-5 acc 78.906 (84.502)	lr 0.00515
Train [84][3239/3239]	Time 0.828 (0.995)	Data Time 0.000 (0.471)	Loss 2.6200 (2.4591)	Entropy 0.58584 (0.58281)	Top-1 acc 64.198 (64.672)	Top-5 acc 81.481 (84.500)	lr 0.00515
==========Valid [84/120]	loss 1.266	top-1 acc 70.665 (71.027)	top-5 acc 89.344	Train top-1 64.672	top-5 84.500	Entropy 0.58584	Latency-None: 0.000ms	Flops: 539.00M
Train [85][0/3239]	Time 45.549 (45.549)	Data Time 44.331 (44.331)	Loss 2.3886 (2.3886)	Entropy 0.58587 (0.58587)	Top-1 acc 67.188 (67.188)	Top-5 acc 85.547 (85.547)	lr 0.00515
Train [85][10/3239]	Time 0.241 (4.633)	Data Time 0.001 (4.079)	Loss 2.3921 (2.4380)	Entropy 0.58573 (0.58592)	Top-1 acc 63.672 (65.021)	Top-5 acc 89.062 (84.730)	lr 0.00515
Train [85][20/3239]	Time 0.338 (2.660)	Data Time 0.003 (2.139)	Loss 2.4224 (2.4224)	Entropy 0.58584 (0.58583)	Top-1 acc 67.578 (66.276)	Top-5 acc 85.547 (85.193)	lr 0.00515
Train [85][30/3239]	Time 0.253 (1.953)	Data Time 0.001 (1.450)	Loss 2.4747 (2.4329)	Entropy 0.58599 (0.58587)	Top-1 acc 62.109 (65.411)	Top-5 acc 84.766 (84.917)	lr 0.00515
Train [85][40/3239]	Time 0.274 (1.614)	Data Time 0.003 (1.097)	Loss 2.2736 (2.4378)	Entropy 0.58577 (0.58586)	Top-1 acc 68.750 (65.358)	Top-5 acc 88.672 (84.470)	lr 0.00515
Train [85][50/3239]	Time 0.343 (1.384)	Data Time 0.001 (0.882)	Loss 2.4630 (2.4501)	Entropy 0.58527 (0.58584)	Top-1 acc 64.453 (64.813)	Top-5 acc 85.156 (84.406)	lr 0.00515
Train [85][60/3239]	Time 0.250 (1.231)	Data Time 0.001 (0.738)	Loss 2.3501 (2.4467)	Entropy 0.58556 (0.58577)	Top-1 acc 67.969 (64.908)	Top-5 acc 87.109 (84.503)	lr 0.00515
Train [85][70/3239]	Time 0.295 (1.122)	Data Time 0.001 (0.634)	Loss 2.4108 (2.4486)	Entropy 0.58539 (0.58573)	Top-1 acc 67.969 (65.119)	Top-5 acc 85.547 (84.452)	lr 0.00515
Train [85][80/3239]	Time 0.244 (1.043)	Data Time 0.001 (0.556)	Loss 2.4520 (2.4512)	Entropy 0.58545 (0.58569)	Top-1 acc 69.141 (65.152)	Top-5 acc 85.547 (84.496)	lr 0.00515
Train [85][90/3239]	Time 0.265 (0.984)	Data Time 0.002 (0.495)	Loss 2.3536 (2.4380)	Entropy 0.58509 (0.58565)	Top-1 acc 66.406 (65.462)	Top-5 acc 87.109 (84.736)	lr 0.00515
Train [85][100/3239]	Time 0.255 (0.935)	Data Time 0.001 (0.446)	Loss 2.4489 (2.4444)	Entropy 0.58506 (0.58559)	Top-1 acc 67.969 (65.370)	Top-5 acc 82.812 (84.619)	lr 0.00514
Train [85][110/3239]	Time 0.258 (0.891)	Data Time 0.001 (0.406)	Loss 2.5078 (2.4457)	Entropy 0.58496 (0.58554)	Top-1 acc 62.500 (65.326)	Top-5 acc 83.984 (84.505)	lr 0.00514
Train [85][120/3239]	Time 0.258 (0.856)	Data Time 0.002 (0.373)	Loss 2.6186 (2.4486)	Entropy 0.58492 (0.58550)	Top-1 acc 59.766 (65.205)	Top-5 acc 79.688 (84.511)	lr 0.00514
Train [85][130/3239]	Time 0.292 (0.826)	Data Time 0.002 (0.344)	Loss 2.3085 (2.4516)	Entropy 0.58463 (0.58545)	Top-1 acc 68.359 (65.079)	Top-5 acc 87.891 (84.500)	lr 0.00514
Train [85][140/3239]	Time 0.372 (0.799)	Data Time 0.001 (0.320)	Loss 2.5139 (2.4567)	Entropy 0.58470 (0.58539)	Top-1 acc 63.672 (64.927)	Top-5 acc 81.641 (84.403)	lr 0.00514
Train [85][150/3239]	Time 0.236 (0.776)	Data Time 0.001 (0.299)	Loss 2.4480 (2.4544)	Entropy 0.58500 (0.58536)	Top-1 acc 68.750 (65.020)	Top-5 acc 83.203 (84.447)	lr 0.00514
Train [85][160/3239]	Time 0.243 (0.756)	Data Time 0.001 (0.281)	Loss 2.4751 (2.4498)	Entropy 0.58482 (0.58534)	Top-1 acc 62.109 (65.132)	Top-5 acc 82.422 (84.504)	lr 0.00514
Train [85][170/3239]	Time 0.246 (0.740)	Data Time 0.001 (0.264)	Loss 2.5248 (2.4488)	Entropy 0.58490 (0.58531)	Top-1 acc 66.016 (65.132)	Top-5 acc 82.812 (84.551)	lr 0.00514
Train [85][180/3239]	Time 0.243 (0.724)	Data Time 0.001 (0.250)	Loss 2.4597 (2.4513)	Entropy 0.58469 (0.58528)	Top-1 acc 65.625 (65.038)	Top-5 acc 82.812 (84.574)	lr 0.00514
Train [85][190/3239]	Time 0.232 (0.710)	Data Time 0.001 (0.237)	Loss 2.2956 (2.4465)	Entropy 0.58451 (0.58525)	Top-1 acc 68.359 (65.155)	Top-5 acc 86.719 (84.657)	lr 0.00514
Train [85][200/3239]	Time 0.254 (0.698)	Data Time 0.001 (0.225)	Loss 2.2391 (2.4489)	Entropy 0.58434 (0.58521)	Top-1 acc 69.922 (65.102)	Top-5 acc 88.281 (84.606)	lr 0.00514
Train [85][210/3239]	Time 0.386 (0.687)	Data Time 0.001 (0.214)	Loss 2.3351 (2.4479)	Entropy 0.58426 (0.58516)	Top-1 acc 66.797 (65.160)	Top-5 acc 87.109 (84.623)	lr 0.00514
Train [85][220/3239]	Time 0.261 (0.677)	Data Time 0.001 (0.205)	Loss 2.4022 (2.4477)	Entropy 0.58420 (0.58512)	Top-1 acc 66.016 (65.116)	Top-5 acc 83.984 (84.681)	lr 0.00513
Train [85][230/3239]	Time 0.260 (0.668)	Data Time 0.001 (0.196)	Loss 2.3598 (2.4464)	Entropy 0.58424 (0.58508)	Top-1 acc 69.531 (65.162)	Top-5 acc 85.156 (84.705)	lr 0.00513
Train [85][240/3239]	Time 0.263 (0.660)	Data Time 0.002 (0.188)	Loss 2.6498 (2.4470)	Entropy 0.58441 (0.58505)	Top-1 acc 61.328 (65.111)	Top-5 acc 81.641 (84.717)	lr 0.00513
Train [85][250/3239]	Time 0.297 (0.652)	Data Time 0.003 (0.181)	Loss 2.3892 (2.4490)	Entropy 0.58454 (0.58503)	Top-1 acc 67.969 (65.023)	Top-5 acc 85.547 (84.700)	lr 0.00513
Train [85][260/3239]	Time 0.238 (0.645)	Data Time 0.002 (0.174)	Loss 2.3873 (2.4508)	Entropy 0.58435 (0.58501)	Top-1 acc 66.406 (65.020)	Top-5 acc 85.156 (84.667)	lr 0.00513
Train [85][270/3239]	Time 0.242 (0.638)	Data Time 0.001 (0.167)	Loss 2.4838 (2.4501)	Entropy 0.58461 (0.58499)	Top-1 acc 62.891 (65.084)	Top-5 acc 83.984 (84.659)	lr 0.00513
Train [85][280/3239]	Time 0.246 (0.632)	Data Time 0.002 (0.161)	Loss 2.3736 (2.4526)	Entropy 0.58435 (0.58497)	Top-1 acc 66.406 (65.027)	Top-5 acc 85.938 (84.614)	lr 0.00513
Train [85][290/3239]	Time 0.478 (0.823)	Data Time 0.005 (0.156)	Loss 2.3023 (2.4517)	Entropy 0.58395 (0.58494)	Top-1 acc 67.188 (65.013)	Top-5 acc 85.547 (84.614)	lr 0.00513
Train [85][300/3239]	Time 0.356 (0.814)	Data Time 0.002 (0.151)	Loss 2.4007 (2.4512)	Entropy 0.58413 (0.58490)	Top-1 acc 67.188 (65.028)	Top-5 acc 84.375 (84.624)	lr 0.00513
Train [85][310/3239]	Time 0.238 (0.801)	Data Time 0.002 (0.146)	Loss 2.6016 (2.4539)	Entropy 0.58402 (0.58488)	Top-1 acc 62.109 (64.968)	Top-5 acc 83.594 (84.596)	lr 0.00513
Train [85][320/3239]	Time 0.260 (0.790)	Data Time 0.002 (0.142)	Loss 2.5519 (2.4554)	Entropy 0.58383 (0.58485)	Top-1 acc 62.109 (64.912)	Top-5 acc 82.812 (84.571)	lr 0.00513
Train [85][330/3239]	Time 0.248 (0.780)	Data Time 0.001 (0.137)	Loss 2.2351 (2.4556)	Entropy 0.58383 (0.58482)	Top-1 acc 70.312 (64.877)	Top-5 acc 89.844 (84.567)	lr 0.00513
Train [85][340/3239]	Time 0.261 (0.771)	Data Time 0.001 (0.133)	Loss 2.4040 (2.4547)	Entropy 0.58413 (0.58479)	Top-1 acc 67.969 (64.922)	Top-5 acc 84.766 (84.571)	lr 0.00512
Train [85][350/3239]	Time 0.267 (0.762)	Data Time 0.002 (0.130)	Loss 2.3261 (2.4556)	Entropy 0.58420 (0.58477)	Top-1 acc 65.234 (64.907)	Top-5 acc 87.109 (84.560)	lr 0.00512
Train [85][360/3239]	Time 0.255 (0.754)	Data Time 0.001 (0.126)	Loss 2.3740 (2.4542)	Entropy 0.58447 (0.58476)	Top-1 acc 67.969 (64.947)	Top-5 acc 85.547 (84.568)	lr 0.00512
Train [85][370/3239]	Time 0.438 (0.747)	Data Time 0.002 (0.123)	Loss 2.5089 (2.4529)	Entropy 0.58444 (0.58475)	Top-1 acc 65.625 (64.962)	Top-5 acc 80.469 (84.575)	lr 0.00512
Train [85][380/3239]	Time 0.347 (0.741)	Data Time 0.003 (0.120)	Loss 2.5774 (2.4537)	Entropy 0.58444 (0.58475)	Top-1 acc 62.891 (64.928)	Top-5 acc 83.203 (84.567)	lr 0.00512
Train [85][390/3239]	Time 0.276 (0.734)	Data Time 0.001 (0.117)	Loss 2.2513 (2.4507)	Entropy 0.58443 (0.58474)	Top-1 acc 69.531 (64.984)	Top-5 acc 89.062 (84.630)	lr 0.00512
Train [85][400/3239]	Time 0.269 (0.728)	Data Time 0.002 (0.114)	Loss 2.4212 (2.4490)	Entropy 0.58428 (0.58473)	Top-1 acc 62.500 (65.039)	Top-5 acc 87.500 (84.662)	lr 0.00512
Train [85][410/3239]	Time 0.257 (0.722)	Data Time 0.002 (0.111)	Loss 2.5003 (2.4483)	Entropy 0.58444 (0.58472)	Top-1 acc 64.844 (65.072)	Top-5 acc 82.812 (84.668)	lr 0.00512
Train [85][420/3239]	Time 0.253 (0.716)	Data Time 0.002 (0.108)	Loss 2.5090 (2.4484)	Entropy 0.58438 (0.58471)	Top-1 acc 63.281 (65.078)	Top-5 acc 84.375 (84.676)	lr 0.00512
Train [85][430/3239]	Time 0.300 (0.710)	Data Time 0.001 (0.106)	Loss 2.6122 (2.4490)	Entropy 0.58437 (0.58470)	Top-1 acc 61.719 (65.083)	Top-5 acc 81.250 (84.653)	lr 0.00512
Train [85][440/3239]	Time 0.322 (0.705)	Data Time 0.001 (0.104)	Loss 3.0903 (2.4505)	Entropy 0.58429 (0.58470)	Top-1 acc 48.828 (65.026)	Top-5 acc 74.219 (84.631)	lr 0.00512
Train [85][450/3239]	Time 0.273 (0.701)	Data Time 0.001 (0.101)	Loss 2.4769 (2.4497)	Entropy 0.58451 (0.58469)	Top-1 acc 62.891 (65.043)	Top-5 acc 83.594 (84.665)	lr 0.00512
Train [85][460/3239]	Time 0.277 (0.696)	Data Time 0.001 (0.099)	Loss 2.5674 (2.4499)	Entropy 0.58439 (0.58469)	Top-1 acc 59.375 (65.045)	Top-5 acc 82.812 (84.653)	lr 0.00512
Train [85][470/3239]	Time 0.227 (0.690)	Data Time 0.001 (0.097)	Loss 2.5591 (2.4490)	Entropy 0.58460 (0.58468)	Top-1 acc 60.938 (65.054)	Top-5 acc 81.641 (84.669)	lr 0.00511
Train [85][480/3239]	Time 0.291 (0.686)	Data Time 0.003 (0.095)	Loss 2.3959 (2.4482)	Entropy 0.58487 (0.58468)	Top-1 acc 64.062 (65.078)	Top-5 acc 87.109 (84.695)	lr 0.00511
Train [85][490/3239]	Time 0.238 (0.681)	Data Time 0.001 (0.093)	Loss 2.4178 (2.4491)	Entropy 0.58495 (0.58469)	Top-1 acc 64.844 (65.053)	Top-5 acc 84.766 (84.668)	lr 0.00511
Train [85][500/3239]	Time 0.240 (0.676)	Data Time 0.001 (0.091)	Loss 2.6169 (2.4496)	Entropy 0.58516 (0.58470)	Top-1 acc 58.984 (65.051)	Top-5 acc 82.812 (84.669)	lr 0.00511
Train [85][510/3239]	Time 0.295 (0.673)	Data Time 0.001 (0.090)	Loss 2.5810 (2.4501)	Entropy 0.58533 (0.58470)	Top-1 acc 63.672 (65.036)	Top-5 acc 81.641 (84.646)	lr 0.00511
Train [85][520/3239]	Time 0.236 (0.669)	Data Time 0.001 (0.088)	Loss 2.4835 (2.4503)	Entropy 0.58524 (0.58472)	Top-1 acc 65.625 (65.024)	Top-5 acc 84.766 (84.659)	lr 0.00511
Train [85][530/3239]	Time 0.348 (0.665)	Data Time 0.001 (0.086)	Loss 2.3627 (2.4481)	Entropy 0.58537 (0.58473)	Top-1 acc 69.531 (65.059)	Top-5 acc 84.375 (84.691)	lr 0.00511
Train [85][540/3239]	Time 0.253 (0.661)	Data Time 0.001 (0.085)	Loss 2.5777 (2.4489)	Entropy 0.58536 (0.58474)	Top-1 acc 59.766 (65.033)	Top-5 acc 83.984 (84.680)	lr 0.00511
Train [85][550/3239]	Time 0.267 (0.657)	Data Time 0.003 (0.083)	Loss 2.4439 (2.4488)	Entropy 0.58527 (0.58475)	Top-1 acc 62.500 (65.041)	Top-5 acc 85.156 (84.673)	lr 0.00511
Train [85][560/3239]	Time 0.274 (0.653)	Data Time 0.001 (0.082)	Loss 2.4873 (2.4487)	Entropy 0.58513 (0.58476)	Top-1 acc 66.797 (65.045)	Top-5 acc 86.328 (84.679)	lr 0.00511
Train [85][570/3239]	Time 0.253 (0.650)	Data Time 0.002 (0.080)	Loss 2.4360 (2.4479)	Entropy 0.58527 (0.58477)	Top-1 acc 64.844 (65.058)	Top-5 acc 83.594 (84.687)	lr 0.00511
Train [85][580/3239]	Time 0.299 (0.647)	Data Time 0.002 (0.079)	Loss 2.5664 (2.4479)	Entropy 0.58516 (0.58477)	Top-1 acc 61.719 (65.057)	Top-5 acc 83.594 (84.692)	lr 0.00511
Train [85][590/3239]	Time 0.241 (0.644)	Data Time 0.002 (0.078)	Loss 2.2327 (2.4479)	Entropy 0.58479 (0.58478)	Top-1 acc 73.047 (65.051)	Top-5 acc 89.453 (84.690)	lr 0.00510
Train [85][600/3239]	Time 0.332 (0.641)	Data Time 0.002 (0.076)	Loss 2.8946 (2.4484)	Entropy 0.58489 (0.58478)	Top-1 acc 53.906 (65.034)	Top-5 acc 76.172 (84.675)	lr 0.00510
Train [85][610/3239]	Time 0.261 (0.638)	Data Time 0.001 (0.075)	Loss 2.4678 (2.4476)	Entropy 0.58474 (0.58478)	Top-1 acc 64.844 (65.046)	Top-5 acc 85.156 (84.697)	lr 0.00510
Train [85][620/3239]	Time 0.272 (0.635)	Data Time 0.002 (0.074)	Loss 2.4562 (2.4473)	Entropy 0.58475 (0.58478)	Top-1 acc 62.500 (65.048)	Top-5 acc 84.375 (84.708)	lr 0.00510
Train [85][630/3239]	Time 0.243 (0.632)	Data Time 0.001 (0.073)	Loss 2.6320 (2.4473)	Entropy 0.58435 (0.58478)	Top-1 acc 60.156 (65.045)	Top-5 acc 81.641 (84.719)	lr 0.00510
Train [85][640/3239]	Time 0.285 (0.629)	Data Time 0.001 (0.072)	Loss 2.5660 (2.4479)	Entropy 0.58458 (0.58477)	Top-1 acc 65.625 (65.045)	Top-5 acc 81.250 (84.707)	lr 0.00510
Train [85][650/3239]	Time 0.241 (0.626)	Data Time 0.001 (0.071)	Loss 2.3377 (2.4480)	Entropy 0.58445 (0.58477)	Top-1 acc 66.016 (65.038)	Top-5 acc 86.719 (84.702)	lr 0.00510
Train [85][660/3239]	Time 0.236 (0.623)	Data Time 0.001 (0.070)	Loss 2.2842 (2.4469)	Entropy 0.58425 (0.58476)	Top-1 acc 68.359 (65.067)	Top-5 acc 89.453 (84.714)	lr 0.00510
Train [85][670/3239]	Time 0.238 (0.621)	Data Time 0.001 (0.069)	Loss 2.2928 (2.4473)	Entropy 0.58436 (0.58476)	Top-1 acc 66.016 (65.052)	Top-5 acc 85.938 (84.706)	lr 0.00510
Train [85][680/3239]	Time 0.255 (0.618)	Data Time 0.002 (0.068)	Loss 2.3736 (2.4474)	Entropy 0.58432 (0.58475)	Top-1 acc 68.750 (65.061)	Top-5 acc 85.547 (84.702)	lr 0.00510
Train [85][690/3239]	Time 0.378 (0.616)	Data Time 0.001 (0.067)	Loss 2.7847 (2.4481)	Entropy 0.58455 (0.58475)	Top-1 acc 56.250 (65.050)	Top-5 acc 79.297 (84.685)	lr 0.00510
Train [85][700/3239]	Time 0.246 (0.614)	Data Time 0.001 (0.066)	Loss 2.2539 (2.4467)	Entropy 0.58428 (0.58474)	Top-1 acc 67.188 (65.088)	Top-5 acc 88.672 (84.715)	lr 0.00510
Train [85][710/3239]	Time 0.257 (0.611)	Data Time 0.002 (0.065)	Loss 2.4924 (2.4468)	Entropy 0.58386 (0.58473)	Top-1 acc 64.844 (65.072)	Top-5 acc 81.641 (84.705)	lr 0.00509
Train [85][720/3239]	Time 0.245 (0.609)	Data Time 0.001 (0.064)	Loss 2.6234 (2.4471)	Entropy 0.58396 (0.58472)	Top-1 acc 60.938 (65.070)	Top-5 acc 79.688 (84.703)	lr 0.00509
Train [85][730/3239]	Time 0.238 (0.606)	Data Time 0.001 (0.063)	Loss 2.3332 (2.4464)	Entropy 0.58399 (0.58471)	Top-1 acc 69.141 (65.083)	Top-5 acc 87.500 (84.723)	lr 0.00509
Train [85][740/3239]	Time 0.287 (0.605)	Data Time 0.001 (0.062)	Loss 2.5724 (2.4466)	Entropy 0.58381 (0.58470)	Top-1 acc 61.719 (65.071)	Top-5 acc 81.250 (84.727)	lr 0.00509
Train [85][750/3239]	Time 0.288 (0.602)	Data Time 0.003 (0.062)	Loss 2.5281 (2.4463)	Entropy 0.58388 (0.58469)	Top-1 acc 62.891 (65.085)	Top-5 acc 84.766 (84.728)	lr 0.00509
Train [85][760/3239]	Time 0.353 (0.600)	Data Time 0.001 (0.061)	Loss 2.5396 (2.4465)	Entropy 0.58365 (0.58468)	Top-1 acc 64.844 (65.085)	Top-5 acc 80.859 (84.725)	lr 0.00509
Train [85][770/3239]	Time 0.250 (0.598)	Data Time 0.001 (0.060)	Loss 2.3358 (2.4463)	Entropy 0.58348 (0.58466)	Top-1 acc 66.797 (65.086)	Top-5 acc 87.891 (84.723)	lr 0.00509
Train [85][780/3239]	Time 0.244 (0.596)	Data Time 0.001 (0.059)	Loss 2.4205 (2.4466)	Entropy 0.58356 (0.58465)	Top-1 acc 64.453 (65.072)	Top-5 acc 84.375 (84.706)	lr 0.00509
Train [85][790/3239]	Time 0.229 (0.594)	Data Time 0.001 (0.059)	Loss 2.4316 (2.4462)	Entropy 0.58360 (0.58463)	Top-1 acc 65.234 (65.080)	Top-5 acc 84.766 (84.707)	lr 0.00509
Train [85][800/3239]	Time 0.234 (0.593)	Data Time 0.001 (0.058)	Loss 2.3415 (2.4462)	Entropy 0.58360 (0.58462)	Top-1 acc 64.062 (65.077)	Top-5 acc 89.062 (84.710)	lr 0.00509
Train [85][810/3239]	Time 0.250 (0.591)	Data Time 0.001 (0.057)	Loss 2.5923 (2.4471)	Entropy 0.58366 (0.58461)	Top-1 acc 56.641 (65.040)	Top-5 acc 83.984 (84.696)	lr 0.00509
Train [85][820/3239]	Time 0.240 (0.589)	Data Time 0.001 (0.056)	Loss 2.3867 (2.4472)	Entropy 0.58359 (0.58460)	Top-1 acc 61.719 (65.035)	Top-5 acc 86.719 (84.701)	lr 0.00509
Train [85][830/3239]	Time 0.245 (0.587)	Data Time 0.001 (0.056)	Loss 2.4458 (2.4474)	Entropy 0.58373 (0.58458)	Top-1 acc 63.281 (65.024)	Top-5 acc 84.375 (84.701)	lr 0.00509
Train [85][840/3239]	Time 0.243 (0.585)	Data Time 0.001 (0.055)	Loss 2.4441 (2.4476)	Entropy 0.58360 (0.58457)	Top-1 acc 66.797 (65.027)	Top-5 acc 83.984 (84.698)	lr 0.00508
Train [85][850/3239]	Time 0.282 (0.583)	Data Time 0.001 (0.055)	Loss 2.4810 (2.4477)	Entropy 0.58298 (0.58456)	Top-1 acc 66.406 (65.034)	Top-5 acc 83.984 (84.698)	lr 0.00508
Train [85][860/3239]	Time 0.257 (0.582)	Data Time 0.001 (0.054)	Loss 2.4206 (2.4475)	Entropy 0.58299 (0.58454)	Top-1 acc 67.188 (65.042)	Top-5 acc 83.984 (84.700)	lr 0.00508
Train [85][870/3239]	Time 0.271 (0.580)	Data Time 0.001 (0.053)	Loss 2.3697 (2.4479)	Entropy 0.58305 (0.58452)	Top-1 acc 67.578 (65.031)	Top-5 acc 85.938 (84.682)	lr 0.00508
Train [85][880/3239]	Time 0.252 (0.579)	Data Time 0.002 (0.053)	Loss 2.3934 (2.4475)	Entropy 0.58351 (0.58451)	Top-1 acc 64.844 (65.037)	Top-5 acc 86.328 (84.696)	lr 0.00508
Train [85][890/3239]	Time 0.239 (0.577)	Data Time 0.001 (0.052)	Loss 2.4079 (2.4474)	Entropy 0.58380 (0.58450)	Top-1 acc 67.578 (65.031)	Top-5 acc 84.766 (84.699)	lr 0.00508
Train [85][900/3239]	Time 0.302 (0.576)	Data Time 0.001 (0.052)	Loss 2.5634 (2.4467)	Entropy 0.58376 (0.58449)	Top-1 acc 64.062 (65.050)	Top-5 acc 82.812 (84.708)	lr 0.00508
Train [85][910/3239]	Time 0.275 (0.574)	Data Time 0.002 (0.051)	Loss 2.4279 (2.4467)	Entropy 0.58388 (0.58449)	Top-1 acc 67.578 (65.057)	Top-5 acc 84.375 (84.710)	lr 0.00508
Train [85][920/3239]	Time 0.364 (0.573)	Data Time 0.001 (0.051)	Loss 2.5722 (2.4466)	Entropy 0.58399 (0.58448)	Top-1 acc 66.406 (65.058)	Top-5 acc 81.641 (84.714)	lr 0.00508
Train [85][930/3239]	Time 0.321 (0.572)	Data Time 0.003 (0.050)	Loss 2.5273 (2.4470)	Entropy 0.58407 (0.58447)	Top-1 acc 63.672 (65.054)	Top-5 acc 83.203 (84.704)	lr 0.00508
Train [85][940/3239]	Time 0.251 (0.570)	Data Time 0.003 (0.049)	Loss 2.4881 (2.4467)	Entropy 0.58388 (0.58447)	Top-1 acc 66.406 (65.070)	Top-5 acc 80.859 (84.708)	lr 0.00508
Train [85][950/3239]	Time 0.274 (0.624)	Data Time 0.002 (0.049)	Loss 2.4854 (2.4468)	Entropy 0.58346 (0.58446)	Top-1 acc 65.234 (65.066)	Top-5 acc 83.594 (84.703)	lr 0.00508
Train [85][960/3239]	Time 0.247 (0.622)	Data Time 0.002 (0.048)	Loss 2.3099 (2.4468)	Entropy 0.58345 (0.58445)	Top-1 acc 66.797 (65.060)	Top-5 acc 83.594 (84.701)	lr 0.00507
Train [85][970/3239]	Time 0.261 (0.620)	Data Time 0.001 (0.048)	Loss 2.4705 (2.4473)	Entropy 0.58327 (0.58444)	Top-1 acc 63.281 (65.048)	Top-5 acc 82.422 (84.685)	lr 0.00507
Train [85][980/3239]	Time 0.243 (0.618)	Data Time 0.001 (0.048)	Loss 2.5784 (2.4485)	Entropy 0.58332 (0.58443)	Top-1 acc 66.797 (65.029)	Top-5 acc 82.031 (84.668)	lr 0.00507
Train [85][990/3239]	Time 0.250 (0.616)	Data Time 0.001 (0.047)	Loss 2.5379 (2.4482)	Entropy 0.58295 (0.58441)	Top-1 acc 60.156 (65.029)	Top-5 acc 82.422 (84.667)	lr 0.00507
Train [85][1000/3239]	Time 0.258 (0.615)	Data Time 0.001 (0.047)	Loss 2.4201 (2.4483)	Entropy 0.58275 (0.58440)	Top-1 acc 66.016 (65.030)	Top-5 acc 82.812 (84.663)	lr 0.00507
Train [85][1010/3239]	Time 0.301 (0.613)	Data Time 0.001 (0.046)	Loss 2.5205 (2.4483)	Entropy 0.58277 (0.58438)	Top-1 acc 63.672 (65.041)	Top-5 acc 83.984 (84.660)	lr 0.00507
Train [85][1020/3239]	Time 0.245 (0.611)	Data Time 0.001 (0.046)	Loss 2.4843 (2.4487)	Entropy 0.58278 (0.58437)	Top-1 acc 62.891 (65.032)	Top-5 acc 84.766 (84.649)	lr 0.00507
Train [85][1030/3239]	Time 0.265 (0.610)	Data Time 0.002 (0.045)	Loss 2.4276 (2.4492)	Entropy 0.58305 (0.58435)	Top-1 acc 64.062 (65.018)	Top-5 acc 86.328 (84.640)	lr 0.00507
Train [85][1040/3239]	Time 0.239 (0.608)	Data Time 0.002 (0.045)	Loss 2.6080 (2.4494)	Entropy 0.58322 (0.58434)	Top-1 acc 59.766 (65.008)	Top-5 acc 82.422 (84.643)	lr 0.00507
Train [85][1050/3239]	Time 0.257 (0.607)	Data Time 0.001 (0.044)	Loss 2.4263 (2.4496)	Entropy 0.58366 (0.58433)	Top-1 acc 67.578 (64.998)	Top-5 acc 83.984 (84.637)	lr 0.00507
Train [85][1060/3239]	Time 0.243 (0.605)	Data Time 0.001 (0.044)	Loss 2.3672 (2.4496)	Entropy 0.58357 (0.58432)	Top-1 acc 67.188 (64.998)	Top-5 acc 85.938 (84.633)	lr 0.00507
Train [85][1070/3239]	Time 0.245 (0.604)	Data Time 0.001 (0.044)	Loss 2.7432 (2.4495)	Entropy 0.58377 (0.58432)	Top-1 acc 59.766 (65.006)	Top-5 acc 80.078 (84.637)	lr 0.00507
Train [85][1080/3239]	Time 0.355 (0.603)	Data Time 0.001 (0.043)	Loss 2.3832 (2.4497)	Entropy 0.58348 (0.58431)	Top-1 acc 69.531 (65.004)	Top-5 acc 84.766 (84.634)	lr 0.00506
Train [85][1090/3239]	Time 0.246 (0.601)	Data Time 0.001 (0.043)	Loss 2.6261 (2.4496)	Entropy 0.58367 (0.58430)	Top-1 acc 65.625 (65.011)	Top-5 acc 78.906 (84.633)	lr 0.00506
Train [85][1100/3239]	Time 0.245 (0.600)	Data Time 0.001 (0.043)	Loss 2.4243 (2.4500)	Entropy 0.58364 (0.58430)	Top-1 acc 66.016 (65.003)	Top-5 acc 87.109 (84.624)	lr 0.00506
Train [85][1110/3239]	Time 0.254 (0.599)	Data Time 0.002 (0.042)	Loss 2.3247 (2.4499)	Entropy 0.58338 (0.58429)	Top-1 acc 70.312 (64.999)	Top-5 acc 86.719 (84.623)	lr 0.00506
Train [85][1120/3239]	Time 0.249 (0.598)	Data Time 0.002 (0.042)	Loss 2.3531 (2.4493)	Entropy 0.58341 (0.58428)	Top-1 acc 67.188 (65.005)	Top-5 acc 84.766 (84.631)	lr 0.00506
Train [85][1130/3239]	Time 0.286 (0.597)	Data Time 0.002 (0.041)	Loss 2.4015 (2.4489)	Entropy 0.58350 (0.58428)	Top-1 acc 67.969 (65.017)	Top-5 acc 85.938 (84.642)	lr 0.00506
Train [85][1140/3239]	Time 0.239 (0.598)	Data Time 0.001 (0.041)	Loss 2.3182 (2.4496)	Entropy 0.58347 (0.58427)	Top-1 acc 69.922 (64.996)	Top-5 acc 85.547 (84.626)	lr 0.00506
Train [85][1150/3239]	Time 0.255 (0.597)	Data Time 0.001 (0.041)	Loss 2.4798 (2.4503)	Entropy 0.58370 (0.58426)	Top-1 acc 62.891 (64.974)	Top-5 acc 83.984 (84.616)	lr 0.00506
Train [85][1160/3239]	Time 0.241 (0.596)	Data Time 0.001 (0.040)	Loss 2.5113 (2.4506)	Entropy 0.58369 (0.58426)	Top-1 acc 60.938 (64.963)	Top-5 acc 85.547 (84.611)	lr 0.00506
Train [85][1170/3239]	Time 0.244 (0.595)	Data Time 0.001 (0.040)	Loss 2.3043 (2.4501)	Entropy 0.58401 (0.58426)	Top-1 acc 67.578 (64.974)	Top-5 acc 85.938 (84.615)	lr 0.00506
Train [85][1180/3239]	Time 0.272 (0.593)	Data Time 0.002 (0.040)	Loss 2.4725 (2.4505)	Entropy 0.58379 (0.58425)	Top-1 acc 64.453 (64.973)	Top-5 acc 85.547 (84.608)	lr 0.00506
Train [85][1190/3239]	Time 0.247 (0.592)	Data Time 0.001 (0.039)	Loss 2.6211 (2.4509)	Entropy 0.58377 (0.58425)	Top-1 acc 61.328 (64.966)	Top-5 acc 83.203 (84.600)	lr 0.00506
Train [85][1200/3239]	Time 0.301 (0.591)	Data Time 0.001 (0.039)	Loss 2.3984 (2.4504)	Entropy 0.58394 (0.58425)	Top-1 acc 65.625 (64.978)	Top-5 acc 84.766 (84.612)	lr 0.00505
Train [85][1210/3239]	Time 0.248 (0.590)	Data Time 0.001 (0.039)	Loss 2.4115 (2.4508)	Entropy 0.58368 (0.58424)	Top-1 acc 66.406 (64.971)	Top-5 acc 83.984 (84.600)	lr 0.00505
Train [85][1220/3239]	Time 0.272 (0.589)	Data Time 0.002 (0.039)	Loss 2.4172 (2.4506)	Entropy 0.58361 (0.58424)	Top-1 acc 68.750 (64.979)	Top-5 acc 84.766 (84.602)	lr 0.00505
Train [85][1230/3239]	Time 0.257 (0.588)	Data Time 0.001 (0.038)	Loss 2.4587 (2.4509)	Entropy 0.58363 (0.58423)	Top-1 acc 63.672 (64.970)	Top-5 acc 86.328 (84.597)	lr 0.00505
Train [85][1240/3239]	Time 0.335 (0.587)	Data Time 0.001 (0.038)	Loss 2.6224 (2.4519)	Entropy 0.58382 (0.58423)	Top-1 acc 60.938 (64.946)	Top-5 acc 80.859 (84.584)	lr 0.00505
Train [85][1250/3239]	Time 0.297 (0.586)	Data Time 0.001 (0.038)	Loss 2.3813 (2.4520)	Entropy 0.58339 (0.58422)	Top-1 acc 65.234 (64.938)	Top-5 acc 86.328 (84.579)	lr 0.00505
Train [85][1260/3239]	Time 0.285 (0.585)	Data Time 0.001 (0.037)	Loss 2.4276 (2.4522)	Entropy 0.58303 (0.58422)	Top-1 acc 66.406 (64.935)	Top-5 acc 82.812 (84.575)	lr 0.00505
Train [85][1270/3239]	Time 0.291 (0.584)	Data Time 0.001 (0.037)	Loss 2.5104 (2.4526)	Entropy 0.58308 (0.58421)	Top-1 acc 61.328 (64.929)	Top-5 acc 82.812 (84.568)	lr 0.00505
Train [85][1280/3239]	Time 0.277 (0.583)	Data Time 0.001 (0.037)	Loss 2.5082 (2.4522)	Entropy 0.58322 (0.58420)	Top-1 acc 64.062 (64.932)	Top-5 acc 85.156 (84.576)	lr 0.00505
Train [85][1290/3239]	Time 0.239 (0.582)	Data Time 0.001 (0.037)	Loss 2.2736 (2.4524)	Entropy 0.58272 (0.58419)	Top-1 acc 69.922 (64.922)	Top-5 acc 87.500 (84.571)	lr 0.00505
Train [85][1300/3239]	Time 0.252 (0.581)	Data Time 0.001 (0.036)	Loss 2.6345 (2.4522)	Entropy 0.58287 (0.58418)	Top-1 acc 62.109 (64.925)	Top-5 acc 79.688 (84.575)	lr 0.00505
Train [85][1310/3239]	Time 0.399 (0.580)	Data Time 0.003 (0.036)	Loss 2.4068 (2.4523)	Entropy 0.58286 (0.58417)	Top-1 acc 66.406 (64.927)	Top-5 acc 84.375 (84.575)	lr 0.00505
Train [85][1320/3239]	Time 0.249 (0.579)	Data Time 0.001 (0.036)	Loss 2.6503 (2.4528)	Entropy 0.58283 (0.58416)	Top-1 acc 59.375 (64.918)	Top-5 acc 80.078 (84.565)	lr 0.00505
Train [85][1330/3239]	Time 0.239 (0.578)	Data Time 0.002 (0.035)	Loss 2.6570 (2.4531)	Entropy 0.58272 (0.58415)	Top-1 acc 62.500 (64.918)	Top-5 acc 78.516 (84.563)	lr 0.00504
Train [85][1340/3239]	Time 0.238 (0.577)	Data Time 0.001 (0.035)	Loss 2.4509 (2.4532)	Entropy 0.58294 (0.58414)	Top-1 acc 63.281 (64.908)	Top-5 acc 85.938 (84.561)	lr 0.00504
Train [85][1350/3239]	Time 0.295 (0.576)	Data Time 0.001 (0.035)	Loss 2.2838 (2.4529)	Entropy 0.58284 (0.58413)	Top-1 acc 67.578 (64.917)	Top-5 acc 85.547 (84.565)	lr 0.00504
Train [85][1360/3239]	Time 0.281 (0.576)	Data Time 0.001 (0.035)	Loss 2.5907 (2.4530)	Entropy 0.58261 (0.58412)	Top-1 acc 63.281 (64.915)	Top-5 acc 82.422 (84.563)	lr 0.00504
Train [85][1370/3239]	Time 0.241 (0.575)	Data Time 0.001 (0.034)	Loss 2.3702 (2.4530)	Entropy 0.58289 (0.58411)	Top-1 acc 66.406 (64.914)	Top-5 acc 84.766 (84.566)	lr 0.00504
Train [85][1380/3239]	Time 0.258 (0.574)	Data Time 0.001 (0.034)	Loss 2.7019 (2.4531)	Entropy 0.58301 (0.58410)	Top-1 acc 61.328 (64.910)	Top-5 acc 79.688 (84.563)	lr 0.00504
Train [85][1390/3239]	Time 0.239 (0.573)	Data Time 0.001 (0.034)	Loss 2.5423 (2.4531)	Entropy 0.58314 (0.58409)	Top-1 acc 61.328 (64.905)	Top-5 acc 85.156 (84.566)	lr 0.00504
Train [85][1400/3239]	Time 0.488 (0.572)	Data Time 0.001 (0.034)	Loss 2.3784 (2.4535)	Entropy 0.58321 (0.58409)	Top-1 acc 67.969 (64.890)	Top-5 acc 85.938 (84.565)	lr 0.00504
Train [85][1410/3239]	Time 0.262 (0.571)	Data Time 0.002 (0.034)	Loss 2.4869 (2.4536)	Entropy 0.58315 (0.58408)	Top-1 acc 60.938 (64.896)	Top-5 acc 85.156 (84.562)	lr 0.00504
Train [85][1420/3239]	Time 0.258 (0.571)	Data Time 0.001 (0.033)	Loss 2.4568 (2.4535)	Entropy 0.58328 (0.58407)	Top-1 acc 68.359 (64.907)	Top-5 acc 83.594 (84.558)	lr 0.00504
Train [85][1430/3239]	Time 0.237 (0.570)	Data Time 0.002 (0.033)	Loss 2.5315 (2.4538)	Entropy 0.58306 (0.58407)	Top-1 acc 62.891 (64.902)	Top-5 acc 83.594 (84.552)	lr 0.00504
Train [85][1440/3239]	Time 0.249 (0.569)	Data Time 0.001 (0.033)	Loss 2.4857 (2.4536)	Entropy 0.58302 (0.58406)	Top-1 acc 63.281 (64.902)	Top-5 acc 85.156 (84.557)	lr 0.00504
Train [85][1450/3239]	Time 0.271 (0.569)	Data Time 0.001 (0.033)	Loss 2.4575 (2.4541)	Entropy 0.58297 (0.58405)	Top-1 acc 65.625 (64.889)	Top-5 acc 87.891 (84.551)	lr 0.00503
Train [85][1460/3239]	Time 0.251 (0.568)	Data Time 0.001 (0.032)	Loss 2.4831 (2.4541)	Entropy 0.58318 (0.58405)	Top-1 acc 59.766 (64.884)	Top-5 acc 87.109 (84.550)	lr 0.00503
Train [85][1470/3239]	Time 0.397 (0.567)	Data Time 0.001 (0.032)	Loss 2.4840 (2.4545)	Entropy 0.58358 (0.58404)	Top-1 acc 62.500 (64.871)	Top-5 acc 86.328 (84.546)	lr 0.00503
Train [85][1480/3239]	Time 0.270 (0.567)	Data Time 0.001 (0.032)	Loss 2.4708 (2.4546)	Entropy 0.58360 (0.58404)	Top-1 acc 64.062 (64.867)	Top-5 acc 83.203 (84.544)	lr 0.00503
Train [85][1490/3239]	Time 0.278 (0.566)	Data Time 0.001 (0.032)	Loss 2.4045 (2.4545)	Entropy 0.58375 (0.58404)	Top-1 acc 61.328 (64.867)	Top-5 acc 86.719 (84.548)	lr 0.00503
Train [85][1500/3239]	Time 0.262 (0.565)	Data Time 0.001 (0.032)	Loss 2.3709 (2.4543)	Entropy 0.58360 (0.58403)	Top-1 acc 67.188 (64.871)	Top-5 acc 88.672 (84.552)	lr 0.00503
Train [85][1510/3239]	Time 0.252 (0.565)	Data Time 0.001 (0.031)	Loss 2.3527 (2.4546)	Entropy 0.58355 (0.58403)	Top-1 acc 66.016 (64.860)	Top-5 acc 85.938 (84.548)	lr 0.00503
Train [85][1520/3239]	Time 0.242 (0.564)	Data Time 0.001 (0.031)	Loss 2.7171 (2.4546)	Entropy 0.58354 (0.58403)	Top-1 acc 57.812 (64.866)	Top-5 acc 81.641 (84.548)	lr 0.00503
Train [85][1530/3239]	Time 0.289 (0.563)	Data Time 0.001 (0.031)	Loss 2.5479 (2.4548)	Entropy 0.58344 (0.58402)	Top-1 acc 64.844 (64.863)	Top-5 acc 80.078 (84.546)	lr 0.00503
Train [85][1540/3239]	Time 0.293 (0.563)	Data Time 0.001 (0.031)	Loss 2.4946 (2.4546)	Entropy 0.58356 (0.58402)	Top-1 acc 64.062 (64.861)	Top-5 acc 84.375 (84.553)	lr 0.00503
Train [85][1550/3239]	Time 0.258 (0.562)	Data Time 0.001 (0.031)	Loss 2.3489 (2.4549)	Entropy 0.58376 (0.58402)	Top-1 acc 66.016 (64.847)	Top-5 acc 86.328 (84.549)	lr 0.00503
Train [85][1560/3239]	Time 0.254 (0.562)	Data Time 0.001 (0.031)	Loss 2.3332 (2.4546)	Entropy 0.58380 (0.58402)	Top-1 acc 69.141 (64.855)	Top-5 acc 85.547 (84.554)	lr 0.00503
Train [85][1570/3239]	Time 0.240 (0.561)	Data Time 0.001 (0.030)	Loss 2.4077 (2.4545)	Entropy 0.58422 (0.58402)	Top-1 acc 67.188 (64.862)	Top-5 acc 85.938 (84.557)	lr 0.00502
Train [85][1580/3239]	Time 0.254 (0.560)	Data Time 0.001 (0.030)	Loss 2.4856 (2.4541)	Entropy 0.58422 (0.58402)	Top-1 acc 63.281 (64.866)	Top-5 acc 83.594 (84.569)	lr 0.00502
Train [85][1590/3239]	Time 0.291 (0.560)	Data Time 0.001 (0.030)	Loss 2.2929 (2.4541)	Entropy 0.58403 (0.58402)	Top-1 acc 72.266 (64.865)	Top-5 acc 85.156 (84.566)	lr 0.00502
Train [85][1600/3239]	Time 0.348 (0.595)	Data Time 0.038 (0.030)	Loss 2.3021 (2.4540)	Entropy 0.58400 (0.58402)	Top-1 acc 69.531 (64.869)	Top-5 acc 86.719 (84.565)	lr 0.00502
Train [85][1610/3239]	Time 0.287 (0.595)	Data Time 0.003 (0.030)	Loss 2.4372 (2.4546)	Entropy 0.58377 (0.58402)	Top-1 acc 64.453 (64.856)	Top-5 acc 85.938 (84.558)	lr 0.00502
Train [85][1620/3239]	Time 0.235 (0.594)	Data Time 0.001 (0.029)	Loss 2.5008 (2.4549)	Entropy 0.58369 (0.58402)	Top-1 acc 64.062 (64.848)	Top-5 acc 86.719 (84.554)	lr 0.00502
Train [85][1630/3239]	Time 0.345 (0.593)	Data Time 0.001 (0.029)	Loss 2.5133 (2.4546)	Entropy 0.58362 (0.58401)	Top-1 acc 66.016 (64.852)	Top-5 acc 83.203 (84.561)	lr 0.00502
Train [85][1640/3239]	Time 0.254 (0.592)	Data Time 0.001 (0.029)	Loss 2.2950 (2.4543)	Entropy 0.58378 (0.58401)	Top-1 acc 69.141 (64.855)	Top-5 acc 87.500 (84.564)	lr 0.00502
Train [85][1650/3239]	Time 0.250 (0.591)	Data Time 0.001 (0.029)	Loss 2.4779 (2.4542)	Entropy 0.58367 (0.58401)	Top-1 acc 60.156 (64.855)	Top-5 acc 86.719 (84.564)	lr 0.00502
Train [85][1660/3239]	Time 0.241 (0.591)	Data Time 0.001 (0.029)	Loss 2.4745 (2.4541)	Entropy 0.58391 (0.58401)	Top-1 acc 62.891 (64.855)	Top-5 acc 82.422 (84.563)	lr 0.00502
Train [85][1670/3239]	Time 0.252 (0.590)	Data Time 0.002 (0.029)	Loss 2.7054 (2.4544)	Entropy 0.58403 (0.58401)	Top-1 acc 59.766 (64.847)	Top-5 acc 82.031 (84.560)	lr 0.00502
Train [85][1680/3239]	Time 0.299 (0.589)	Data Time 0.003 (0.028)	Loss 2.5553 (2.4545)	Entropy 0.58416 (0.58401)	Top-1 acc 62.891 (64.843)	Top-5 acc 84.375 (84.560)	lr 0.00502
Train [85][1690/3239]	Time 0.261 (0.588)	Data Time 0.001 (0.028)	Loss 2.4981 (2.4546)	Entropy 0.58345 (0.58401)	Top-1 acc 63.281 (64.833)	Top-5 acc 84.766 (84.556)	lr 0.00502
Train [85][1700/3239]	Time 0.253 (0.587)	Data Time 0.001 (0.028)	Loss 2.4971 (2.4549)	Entropy 0.58375 (0.58401)	Top-1 acc 63.281 (64.829)	Top-5 acc 84.375 (84.552)	lr 0.00501
Train [85][1710/3239]	Time 0.248 (0.588)	Data Time 0.001 (0.029)	Loss 2.4105 (2.4545)	Entropy 0.58389 (0.58400)	Top-1 acc 65.625 (64.833)	Top-5 acc 84.375 (84.559)	lr 0.00501
Train [85][1720/3239]	Time 0.258 (0.589)	Data Time 0.001 (0.032)	Loss 2.4903 (2.4545)	Entropy 0.58375 (0.58400)	Top-1 acc 66.406 (64.831)	Top-5 acc 82.422 (84.559)	lr 0.00501
Train [85][1730/3239]	Time 0.282 (0.590)	Data Time 0.002 (0.032)	Loss 2.3575 (2.4542)	Entropy 0.58373 (0.58400)	Top-1 acc 64.844 (64.834)	Top-5 acc 85.938 (84.563)	lr 0.00501
Train [85][1740/3239]	Time 0.276 (0.592)	Data Time 0.002 (0.035)	Loss 2.2934 (2.4538)	Entropy 0.58358 (0.58400)	Top-1 acc 68.359 (64.847)	Top-5 acc 86.328 (84.566)	lr 0.00501
Train [85][1750/3239]	Time 2.121 (0.593)	Data Time 1.874 (0.037)	Loss 2.5037 (2.4537)	Entropy 0.58344 (0.58400)	Top-1 acc 62.891 (64.844)	Top-5 acc 82.812 (84.567)	lr 0.00501
Train [85][1760/3239]	Time 0.226 (0.592)	Data Time 0.001 (0.037)	Loss 2.4411 (2.4536)	Entropy 0.58347 (0.58399)	Top-1 acc 63.281 (64.839)	Top-5 acc 87.109 (84.571)	lr 0.00501
Train [85][1770/3239]	Time 0.280 (0.595)	Data Time 0.003 (0.040)	Loss 2.7170 (2.4535)	Entropy 0.58348 (0.58399)	Top-1 acc 57.812 (64.838)	Top-5 acc 80.469 (84.573)	lr 0.00501
Train [85][1780/3239]	Time 0.248 (0.595)	Data Time 0.001 (0.040)	Loss 2.3702 (2.4536)	Entropy 0.58273 (0.58399)	Top-1 acc 66.797 (64.832)	Top-5 acc 87.891 (84.574)	lr 0.00501
Train [85][1790/3239]	Time 0.371 (0.597)	Data Time 0.001 (0.043)	Loss 2.4782 (2.4538)	Entropy 0.58297 (0.58398)	Top-1 acc 63.281 (64.827)	Top-5 acc 87.891 (84.577)	lr 0.00501
Train [85][1800/3239]	Time 2.509 (0.597)	Data Time 2.246 (0.044)	Loss 2.4503 (2.4535)	Entropy 0.58265 (0.58397)	Top-1 acc 64.453 (64.836)	Top-5 acc 82.422 (84.578)	lr 0.00501
Train [85][1810/3239]	Time 0.249 (0.598)	Data Time 0.001 (0.046)	Loss 2.4743 (2.4538)	Entropy 0.58250 (0.58396)	Top-1 acc 64.453 (64.830)	Top-5 acc 81.641 (84.569)	lr 0.00501
Train [85][1820/3239]	Time 0.253 (0.599)	Data Time 0.002 (0.047)	Loss 2.3087 (2.4534)	Entropy 0.58235 (0.58396)	Top-1 acc 70.312 (64.841)	Top-5 acc 87.500 (84.581)	lr 0.00500
Train [85][1830/3239]	Time 1.818 (0.599)	Data Time 1.565 (0.048)	Loss 2.7560 (2.4534)	Entropy 0.58230 (0.58395)	Top-1 acc 59.766 (64.842)	Top-5 acc 80.859 (84.582)	lr 0.00500
Train [85][1840/3239]	Time 0.243 (0.600)	Data Time 0.001 (0.050)	Loss 2.5303 (2.4536)	Entropy 0.58249 (0.58394)	Top-1 acc 64.062 (64.834)	Top-5 acc 81.641 (84.576)	lr 0.00500
Train [85][1850/3239]	Time 0.252 (0.602)	Data Time 0.001 (0.052)	Loss 2.3685 (2.4536)	Entropy 0.58260 (0.58393)	Top-1 acc 66.016 (64.833)	Top-5 acc 87.891 (84.581)	lr 0.00500
Train [85][1860/3239]	Time 0.348 (0.601)	Data Time 0.001 (0.051)	Loss 2.4979 (2.4535)	Entropy 0.58300 (0.58392)	Top-1 acc 62.109 (64.833)	Top-5 acc 82.812 (84.586)	lr 0.00500
Train [85][1870/3239]	Time 0.256 (0.604)	Data Time 0.002 (0.055)	Loss 2.3553 (2.4539)	Entropy 0.58284 (0.58392)	Top-1 acc 63.281 (64.825)	Top-5 acc 85.156 (84.576)	lr 0.00500
Train [85][1880/3239]	Time 0.274 (0.604)	Data Time 0.001 (0.055)	Loss 2.3657 (2.4538)	Entropy 0.58296 (0.58391)	Top-1 acc 66.797 (64.829)	Top-5 acc 86.719 (84.579)	lr 0.00500
Train [85][1890/3239]	Time 0.249 (0.605)	Data Time 0.001 (0.057)	Loss 2.2278 (2.4537)	Entropy 0.58315 (0.58391)	Top-1 acc 71.875 (64.829)	Top-5 acc 89.062 (84.582)	lr 0.00500
Train [85][1900/3239]	Time 0.276 (0.608)	Data Time 0.002 (0.061)	Loss 2.3427 (2.4532)	Entropy 0.58320 (0.58390)	Top-1 acc 66.797 (64.837)	Top-5 acc 85.547 (84.589)	lr 0.00500
Train [85][1910/3239]	Time 0.288 (0.608)	Data Time 0.001 (0.061)	Loss 2.5404 (2.4532)	Entropy 0.58347 (0.58390)	Top-1 acc 67.188 (64.839)	Top-5 acc 83.984 (84.588)	lr 0.00500
Train [85][1920/3239]	Time 0.232 (0.607)	Data Time 0.001 (0.061)	Loss 2.6343 (2.4535)	Entropy 0.58323 (0.58390)	Top-1 acc 58.203 (64.830)	Top-5 acc 81.250 (84.583)	lr 0.00500
Train [85][1930/3239]	Time 0.241 (0.611)	Data Time 0.001 (0.066)	Loss 2.3411 (2.4536)	Entropy 0.58265 (0.58389)	Top-1 acc 67.969 (64.829)	Top-5 acc 85.156 (84.580)	lr 0.00500
Train [85][1940/3239]	Time 0.239 (0.611)	Data Time 0.001 (0.065)	Loss 2.6277 (2.4537)	Entropy 0.58256 (0.58389)	Top-1 acc 59.375 (64.827)	Top-5 acc 80.469 (84.579)	lr 0.00500
Train [85][1950/3239]	Time 0.370 (0.610)	Data Time 0.001 (0.065)	Loss 2.7481 (2.4537)	Entropy 0.58269 (0.58388)	Top-1 acc 57.812 (64.824)	Top-5 acc 80.469 (84.581)	lr 0.00499
Train [85][1960/3239]	Time 6.135 (0.612)	Data Time 5.832 (0.068)	Loss 2.5850 (2.4540)	Entropy 0.58273 (0.58387)	Top-1 acc 63.672 (64.823)	Top-5 acc 80.859 (84.575)	lr 0.00499
Train [85][1970/3239]	Time 0.225 (0.611)	Data Time 0.001 (0.067)	Loss 2.6822 (2.4538)	Entropy 0.58269 (0.58387)	Top-1 acc 59.375 (64.828)	Top-5 acc 79.297 (84.577)	lr 0.00499
Train [85][1980/3239]	Time 0.240 (0.610)	Data Time 0.001 (0.067)	Loss 2.5742 (2.4541)	Entropy 0.58268 (0.58386)	Top-1 acc 64.062 (64.825)	Top-5 acc 83.203 (84.573)	lr 0.00499
Train [85][1990/3239]	Time 0.272 (0.609)	Data Time 0.001 (0.067)	Loss 2.4735 (2.4542)	Entropy 0.58248 (0.58385)	Top-1 acc 63.281 (64.823)	Top-5 acc 87.109 (84.572)	lr 0.00499
Train [85][2000/3239]	Time 0.241 (0.611)	Data Time 0.001 (0.069)	Loss 2.2985 (2.4540)	Entropy 0.58233 (0.58385)	Top-1 acc 67.578 (64.829)	Top-5 acc 86.328 (84.575)	lr 0.00499
Train [85][2010/3239]	Time 0.237 (0.610)	Data Time 0.001 (0.069)	Loss 2.4126 (2.4538)	Entropy 0.58195 (0.58384)	Top-1 acc 66.016 (64.830)	Top-5 acc 84.375 (84.582)	lr 0.00499
Train [85][2020/3239]	Time 0.359 (0.610)	Data Time 0.002 (0.069)	Loss 2.4467 (2.4538)	Entropy 0.58222 (0.58383)	Top-1 acc 62.109 (64.828)	Top-5 acc 87.109 (84.579)	lr 0.00499
Train [85][2030/3239]	Time 0.237 (0.613)	Data Time 0.001 (0.072)	Loss 2.3551 (2.4536)	Entropy 0.58222 (0.58382)	Top-1 acc 67.969 (64.839)	Top-5 acc 87.891 (84.584)	lr 0.00499
Train [85][2040/3239]	Time 0.238 (0.612)	Data Time 0.001 (0.072)	Loss 2.6678 (2.4539)	Entropy 0.58217 (0.58381)	Top-1 acc 60.547 (64.836)	Top-5 acc 80.469 (84.579)	lr 0.00499
Train [85][2050/3239]	Time 0.236 (0.612)	Data Time 0.001 (0.072)	Loss 2.1945 (2.4539)	Entropy 0.58186 (0.58381)	Top-1 acc 71.875 (64.840)	Top-5 acc 87.891 (84.580)	lr 0.00499
Train [85][2060/3239]	Time 0.239 (0.615)	Data Time 0.001 (0.076)	Loss 2.3645 (2.4540)	Entropy 0.58173 (0.58380)	Top-1 acc 64.453 (64.839)	Top-5 acc 88.672 (84.580)	lr 0.00499
Train [85][2070/3239]	Time 0.255 (0.614)	Data Time 0.001 (0.076)	Loss 2.4657 (2.4541)	Entropy 0.58188 (0.58379)	Top-1 acc 62.891 (64.830)	Top-5 acc 83.984 (84.581)	lr 0.00498
Train [85][2080/3239]	Time 0.236 (0.614)	Data Time 0.001 (0.076)	Loss 2.5459 (2.4541)	Entropy 0.58199 (0.58378)	Top-1 acc 62.500 (64.835)	Top-5 acc 82.812 (84.584)	lr 0.00498
Train [85][2090/3239]	Time 0.287 (0.618)	Data Time 0.002 (0.080)	Loss 2.3034 (2.4543)	Entropy 0.58218 (0.58377)	Top-1 acc 68.750 (64.828)	Top-5 acc 85.156 (84.577)	lr 0.00498
Train [85][2100/3239]	Time 0.237 (0.617)	Data Time 0.001 (0.080)	Loss 2.4355 (2.4545)	Entropy 0.58220 (0.58376)	Top-1 acc 67.188 (64.824)	Top-5 acc 84.766 (84.573)	lr 0.00498
Train [85][2110/3239]	Time 0.284 (0.617)	Data Time 0.001 (0.080)	Loss 2.5424 (2.4545)	Entropy 0.58248 (0.58376)	Top-1 acc 59.375 (64.825)	Top-5 acc 83.594 (84.573)	lr 0.00498
Train [85][2120/3239]	Time 6.891 (0.620)	Data Time 6.629 (0.083)	Loss 2.3424 (2.4544)	Entropy 0.58243 (0.58375)	Top-1 acc 64.062 (64.827)	Top-5 acc 86.328 (84.574)	lr 0.00498
Train [85][2130/3239]	Time 0.236 (0.620)	Data Time 0.001 (0.084)	Loss 2.4271 (2.4542)	Entropy 0.58247 (0.58374)	Top-1 acc 63.672 (64.832)	Top-5 acc 85.547 (84.578)	lr 0.00498
Train [85][2140/3239]	Time 0.247 (0.619)	Data Time 0.001 (0.083)	Loss 2.4667 (2.4542)	Entropy 0.58253 (0.58374)	Top-1 acc 64.844 (64.832)	Top-5 acc 83.594 (84.575)	lr 0.00498
Train [85][2150/3239]	Time 0.251 (0.618)	Data Time 0.001 (0.083)	Loss 2.4259 (2.4546)	Entropy 0.58281 (0.58373)	Top-1 acc 62.891 (64.822)	Top-5 acc 87.891 (84.571)	lr 0.00498
Train [85][2160/3239]	Time 0.335 (0.623)	Data Time 0.001 (0.089)	Loss 2.4299 (2.4545)	Entropy 0.58258 (0.58373)	Top-1 acc 63.281 (64.822)	Top-5 acc 87.109 (84.576)	lr 0.00498
Train [85][2170/3239]	Time 0.276 (0.622)	Data Time 0.001 (0.088)	Loss 2.4650 (2.4545)	Entropy 0.58243 (0.58372)	Top-1 acc 65.625 (64.823)	Top-5 acc 83.203 (84.577)	lr 0.00498
Train [85][2180/3239]	Time 0.365 (0.621)	Data Time 0.002 (0.088)	Loss 2.5424 (2.4547)	Entropy 0.58242 (0.58372)	Top-1 acc 61.719 (64.820)	Top-5 acc 82.812 (84.575)	lr 0.00498
Train [85][2190/3239]	Time 0.296 (0.626)	Data Time 0.001 (0.093)	Loss 2.6353 (2.4547)	Entropy 0.58214 (0.58371)	Top-1 acc 58.984 (64.824)	Top-5 acc 81.641 (84.573)	lr 0.00497
Train [85][2200/3239]	Time 0.235 (0.625)	Data Time 0.001 (0.093)	Loss 2.4835 (2.4546)	Entropy 0.58183 (0.58370)	Top-1 acc 64.062 (64.820)	Top-5 acc 82.422 (84.574)	lr 0.00497
Train [85][2210/3239]	Time 0.236 (0.624)	Data Time 0.001 (0.092)	Loss 2.6525 (2.4547)	Entropy 0.58171 (0.58369)	Top-1 acc 60.547 (64.815)	Top-5 acc 79.688 (84.570)	lr 0.00497
Train [85][2220/3239]	Time 0.288 (0.627)	Data Time 0.001 (0.095)	Loss 2.3895 (2.4546)	Entropy 0.58143 (0.58369)	Top-1 acc 64.844 (64.816)	Top-5 acc 87.109 (84.570)	lr 0.00497
Train [85][2230/3239]	Time 0.239 (0.627)	Data Time 0.001 (0.095)	Loss 2.5672 (2.4550)	Entropy 0.58130 (0.58367)	Top-1 acc 64.062 (64.813)	Top-5 acc 80.469 (84.560)	lr 0.00497
Train [85][2240/3239]	Time 0.268 (0.626)	Data Time 0.001 (0.095)	Loss 2.3509 (2.4550)	Entropy 0.58150 (0.58366)	Top-1 acc 66.406 (64.811)	Top-5 acc 86.328 (84.558)	lr 0.00497
Train [85][2250/3239]	Time 0.342 (0.629)	Data Time 0.001 (0.099)	Loss 2.2852 (2.4548)	Entropy 0.58148 (0.58365)	Top-1 acc 70.312 (64.820)	Top-5 acc 87.109 (84.565)	lr 0.00497
Train [85][2260/3239]	Time 0.321 (0.655)	Data Time 0.002 (0.099)	Loss 2.4620 (2.4552)	Entropy 0.58146 (0.58365)	Top-1 acc 61.328 (64.814)	Top-5 acc 85.156 (84.556)	lr 0.00497
Train [85][2270/3239]	Time 0.274 (0.654)	Data Time 0.002 (0.098)	Loss 2.4874 (2.4549)	Entropy 0.58158 (0.58364)	Top-1 acc 63.281 (64.823)	Top-5 acc 85.547 (84.561)	lr 0.00497
Train [85][2280/3239]	Time 0.247 (0.654)	Data Time 0.001 (0.098)	Loss 2.4877 (2.4551)	Entropy 0.58142 (0.58363)	Top-1 acc 64.844 (64.819)	Top-5 acc 82.812 (84.557)	lr 0.00497
Train [85][2290/3239]	Time 0.242 (0.653)	Data Time 0.001 (0.098)	Loss 2.4020 (2.4549)	Entropy 0.58138 (0.58362)	Top-1 acc 64.453 (64.825)	Top-5 acc 86.719 (84.562)	lr 0.00497
Train [85][2300/3239]	Time 0.249 (0.652)	Data Time 0.002 (0.097)	Loss 2.2626 (2.4548)	Entropy 0.58137 (0.58361)	Top-1 acc 65.625 (64.822)	Top-5 acc 87.500 (84.563)	lr 0.00497
Train [85][2310/3239]	Time 0.282 (0.651)	Data Time 0.001 (0.097)	Loss 2.4683 (2.4548)	Entropy 0.58140 (0.58360)	Top-1 acc 66.016 (64.822)	Top-5 acc 82.031 (84.561)	lr 0.00497
Train [85][2320/3239]	Time 0.255 (0.650)	Data Time 0.001 (0.096)	Loss 2.5368 (2.4545)	Entropy 0.58161 (0.58359)	Top-1 acc 61.719 (64.827)	Top-5 acc 83.984 (84.567)	lr 0.00496
Train [85][2330/3239]	Time 0.251 (0.649)	Data Time 0.001 (0.096)	Loss 2.6317 (2.4547)	Entropy 0.58175 (0.58358)	Top-1 acc 61.719 (64.828)	Top-5 acc 80.469 (84.564)	lr 0.00496
Train [85][2340/3239]	Time 0.385 (0.648)	Data Time 0.003 (0.096)	Loss 2.3549 (2.4546)	Entropy 0.58148 (0.58357)	Top-1 acc 65.625 (64.825)	Top-5 acc 87.891 (84.568)	lr 0.00496
Train [85][2350/3239]	Time 0.248 (0.647)	Data Time 0.002 (0.095)	Loss 2.4781 (2.4545)	Entropy 0.58143 (0.58356)	Top-1 acc 64.844 (64.829)	Top-5 acc 82.031 (84.569)	lr 0.00496
Train [85][2360/3239]	Time 2.260 (0.648)	Data Time 2.007 (0.096)	Loss 2.3894 (2.4547)	Entropy 0.58130 (0.58355)	Top-1 acc 63.281 (64.820)	Top-5 acc 85.547 (84.567)	lr 0.00496
Train [85][2370/3239]	Time 2.904 (0.650)	Data Time 2.643 (0.099)	Loss 2.3894 (2.4548)	Entropy 0.58115 (0.58354)	Top-1 acc 64.453 (64.816)	Top-5 acc 87.109 (84.566)	lr 0.00496
Train [85][2380/3239]	Time 0.250 (0.649)	Data Time 0.001 (0.099)	Loss 2.4078 (2.4548)	Entropy 0.58136 (0.58353)	Top-1 acc 66.016 (64.819)	Top-5 acc 85.938 (84.566)	lr 0.00496
Train [85][2390/3239]	Time 0.272 (0.651)	Data Time 0.003 (0.100)	Loss 2.2866 (2.4546)	Entropy 0.58109 (0.58352)	Top-1 acc 69.531 (64.827)	Top-5 acc 86.328 (84.569)	lr 0.00496
Train [85][2400/3239]	Time 0.278 (0.653)	Data Time 0.001 (0.103)	Loss 2.3285 (2.4544)	Entropy 0.58078 (0.58351)	Top-1 acc 68.359 (64.833)	Top-5 acc 86.719 (84.574)	lr 0.00496
Train [85][2410/3239]	Time 0.335 (0.652)	Data Time 0.001 (0.102)	Loss 2.5984 (2.4544)	Entropy 0.58056 (0.58350)	Top-1 acc 56.641 (64.834)	Top-5 acc 81.641 (84.574)	lr 0.00496
Train [85][2420/3239]	Time 2.340 (0.653)	Data Time 2.099 (0.104)	Loss 2.5565 (2.4541)	Entropy 0.58053 (0.58349)	Top-1 acc 62.891 (64.841)	Top-5 acc 82.422 (84.579)	lr 0.00496
Train [85][2430/3239]	Time 0.254 (0.654)	Data Time 0.001 (0.105)	Loss 2.4701 (2.4543)	Entropy 0.58038 (0.58348)	Top-1 acc 63.672 (64.838)	Top-5 acc 83.594 (84.580)	lr 0.00496
Train [85][2440/3239]	Time 0.242 (0.655)	Data Time 0.001 (0.106)	Loss 2.5222 (2.4544)	Entropy 0.58060 (0.58346)	Top-1 acc 62.891 (64.832)	Top-5 acc 84.766 (84.573)	lr 0.00495
Train [85][2450/3239]	Time 1.218 (0.655)	Data Time 0.965 (0.107)	Loss 2.4215 (2.4545)	Entropy 0.58031 (0.58345)	Top-1 acc 64.062 (64.830)	Top-5 acc 84.766 (84.574)	lr 0.00495
Train [85][2460/3239]	Time 0.235 (0.657)	Data Time 0.001 (0.109)	Loss 2.5102 (2.4547)	Entropy 0.58031 (0.58344)	Top-1 acc 62.109 (64.824)	Top-5 acc 83.594 (84.571)	lr 0.00495
Train [85][2470/3239]	Time 0.248 (0.657)	Data Time 0.001 (0.109)	Loss 2.6191 (2.4547)	Entropy 0.58028 (0.58343)	Top-1 acc 58.984 (64.823)	Top-5 acc 80.859 (84.568)	lr 0.00495
Train [85][2480/3239]	Time 0.254 (0.657)	Data Time 0.001 (0.110)	Loss 2.4829 (2.4548)	Entropy 0.58034 (0.58341)	Top-1 acc 66.406 (64.818)	Top-5 acc 82.031 (84.565)	lr 0.00495
Train [85][2490/3239]	Time 0.246 (0.659)	Data Time 0.001 (0.113)	Loss 2.5430 (2.4550)	Entropy 0.58006 (0.58340)	Top-1 acc 60.938 (64.809)	Top-5 acc 83.594 (84.563)	lr 0.00495
Train [85][2500/3239]	Time 0.366 (0.658)	Data Time 0.001 (0.112)	Loss 2.5011 (2.4549)	Entropy 0.57997 (0.58339)	Top-1 acc 67.188 (64.813)	Top-5 acc 83.594 (84.561)	lr 0.00495
Train [85][2510/3239]	Time 1.175 (0.659)	Data Time 0.924 (0.113)	Loss 2.7218 (2.4549)	Entropy 0.58016 (0.58337)	Top-1 acc 61.719 (64.811)	Top-5 acc 79.688 (84.559)	lr 0.00495
Train [85][2520/3239]	Time 0.236 (0.661)	Data Time 0.001 (0.116)	Loss 2.5425 (2.4548)	Entropy 0.58032 (0.58336)	Top-1 acc 64.453 (64.816)	Top-5 acc 83.203 (84.559)	lr 0.00495
Train [85][2530/3239]	Time 0.252 (0.661)	Data Time 0.002 (0.116)	Loss 2.4331 (2.4548)	Entropy 0.58050 (0.58335)	Top-1 acc 67.188 (64.814)	Top-5 acc 86.328 (84.562)	lr 0.00495
Train [85][2540/3239]	Time 0.247 (0.660)	Data Time 0.001 (0.116)	Loss 2.3599 (2.4549)	Entropy 0.58040 (0.58334)	Top-1 acc 66.797 (64.811)	Top-5 acc 86.719 (84.561)	lr 0.00495
Train [85][2550/3239]	Time 0.267 (0.664)	Data Time 0.001 (0.120)	Loss 2.4959 (2.4548)	Entropy 0.58051 (0.58333)	Top-1 acc 66.797 (64.817)	Top-5 acc 83.984 (84.561)	lr 0.00495
Train [85][2560/3239]	Time 0.246 (0.663)	Data Time 0.001 (0.119)	Loss 2.6016 (2.4550)	Entropy 0.58056 (0.58332)	Top-1 acc 60.156 (64.811)	Top-5 acc 82.812 (84.556)	lr 0.00495
Train [85][2570/3239]	Time 0.353 (0.662)	Data Time 0.001 (0.119)	Loss 2.2219 (2.4549)	Entropy 0.58048 (0.58331)	Top-1 acc 69.531 (64.813)	Top-5 acc 89.844 (84.561)	lr 0.00494
Train [85][2580/3239]	Time 0.228 (0.662)	Data Time 0.001 (0.119)	Loss 2.4629 (2.4548)	Entropy 0.58031 (0.58329)	Top-1 acc 60.547 (64.814)	Top-5 acc 86.328 (84.564)	lr 0.00494
Train [85][2590/3239]	Time 0.225 (0.663)	Data Time 0.001 (0.120)	Loss 2.6011 (2.4546)	Entropy 0.58022 (0.58328)	Top-1 acc 60.156 (64.817)	Top-5 acc 79.688 (84.568)	lr 0.00494
Train [85][2600/3239]	Time 0.239 (0.662)	Data Time 0.001 (0.120)	Loss 2.5101 (2.4546)	Entropy 0.58005 (0.58327)	Top-1 acc 63.281 (64.820)	Top-5 acc 83.594 (84.570)	lr 0.00494
Train [85][2610/3239]	Time 0.282 (0.662)	Data Time 0.001 (0.121)	Loss 2.7842 (2.4549)	Entropy 0.58011 (0.58326)	Top-1 acc 55.078 (64.813)	Top-5 acc 82.031 (84.564)	lr 0.00494
Train [85][2620/3239]	Time 0.247 (0.664)	Data Time 0.001 (0.123)	Loss 2.4031 (2.4550)	Entropy 0.58002 (0.58325)	Top-1 acc 64.844 (64.810)	Top-5 acc 86.719 (84.562)	lr 0.00494
Train [85][2630/3239]	Time 0.263 (0.663)	Data Time 0.001 (0.122)	Loss 2.4580 (2.4551)	Entropy 0.58000 (0.58323)	Top-1 acc 65.625 (64.810)	Top-5 acc 82.031 (84.557)	lr 0.00494
Train [85][2640/3239]	Time 0.222 (0.663)	Data Time 0.001 (0.122)	Loss 2.3910 (2.4551)	Entropy 0.58018 (0.58322)	Top-1 acc 70.312 (64.809)	Top-5 acc 86.719 (84.559)	lr 0.00494
Train [85][2650/3239]	Time 0.247 (0.664)	Data Time 0.001 (0.124)	Loss 2.4461 (2.4551)	Entropy 0.57944 (0.58321)	Top-1 acc 64.062 (64.808)	Top-5 acc 86.328 (84.561)	lr 0.00494
Train [85][2660/3239]	Time 0.342 (0.664)	Data Time 0.001 (0.124)	Loss 2.4261 (2.4549)	Entropy 0.57949 (0.58320)	Top-1 acc 65.625 (64.813)	Top-5 acc 83.203 (84.563)	lr 0.00494
Train [85][2670/3239]	Time 0.249 (0.664)	Data Time 0.001 (0.124)	Loss 2.5248 (2.4552)	Entropy 0.57956 (0.58318)	Top-1 acc 63.672 (64.808)	Top-5 acc 84.375 (84.559)	lr 0.00494
Train [85][2680/3239]	Time 0.266 (0.665)	Data Time 0.001 (0.126)	Loss 2.4558 (2.4553)	Entropy 0.57969 (0.58317)	Top-1 acc 63.672 (64.806)	Top-5 acc 85.156 (84.557)	lr 0.00494
Train [85][2690/3239]	Time 0.274 (0.665)	Data Time 0.001 (0.126)	Loss 2.3741 (2.4552)	Entropy 0.57979 (0.58316)	Top-1 acc 67.188 (64.810)	Top-5 acc 85.156 (84.559)	lr 0.00493
Train [85][2700/3239]	Time 0.247 (0.665)	Data Time 0.001 (0.126)	Loss 2.4089 (2.4550)	Entropy 0.57985 (0.58314)	Top-1 acc 63.672 (64.818)	Top-5 acc 83.984 (84.563)	lr 0.00493
Train [85][2710/3239]	Time 0.258 (0.665)	Data Time 0.001 (0.127)	Loss 2.2955 (2.4550)	Entropy 0.57983 (0.58313)	Top-1 acc 71.484 (64.821)	Top-5 acc 85.547 (84.562)	lr 0.00493
Train [85][2720/3239]	Time 0.249 (0.666)	Data Time 0.001 (0.128)	Loss 2.7288 (2.4552)	Entropy 0.57996 (0.58312)	Top-1 acc 56.641 (64.815)	Top-5 acc 80.469 (84.558)	lr 0.00493
Train [85][2730/3239]	Time 0.349 (0.665)	Data Time 0.001 (0.128)	Loss 2.7249 (2.4552)	Entropy 0.58003 (0.58311)	Top-1 acc 59.766 (64.818)	Top-5 acc 79.297 (84.558)	lr 0.00493
Train [85][2740/3239]	Time 0.246 (0.664)	Data Time 0.001 (0.127)	Loss 2.7646 (2.4555)	Entropy 0.58027 (0.58310)	Top-1 acc 57.812 (64.812)	Top-5 acc 78.516 (84.550)	lr 0.00493
Train [85][2750/3239]	Time 0.254 (0.667)	Data Time 0.001 (0.130)	Loss 2.6824 (2.4555)	Entropy 0.58046 (0.58309)	Top-1 acc 59.766 (64.812)	Top-5 acc 79.688 (84.549)	lr 0.00493
Train [85][2760/3239]	Time 0.230 (0.666)	Data Time 0.001 (0.130)	Loss 2.3918 (2.4555)	Entropy 0.58061 (0.58308)	Top-1 acc 63.281 (64.812)	Top-5 acc 86.328 (84.547)	lr 0.00493
Train [85][2770/3239]	Time 0.232 (0.666)	Data Time 0.001 (0.130)	Loss 2.3667 (2.4554)	Entropy 0.58084 (0.58307)	Top-1 acc 66.797 (64.817)	Top-5 acc 83.594 (84.550)	lr 0.00493
Train [85][2780/3239]	Time 0.256 (0.668)	Data Time 0.002 (0.133)	Loss 2.5236 (2.4555)	Entropy 0.58079 (0.58306)	Top-1 acc 62.109 (64.814)	Top-5 acc 86.719 (84.552)	lr 0.00493
Train [85][2790/3239]	Time 0.233 (0.667)	Data Time 0.001 (0.132)	Loss 2.4457 (2.4553)	Entropy 0.58086 (0.58305)	Top-1 acc 64.844 (64.821)	Top-5 acc 83.203 (84.555)	lr 0.00493
Train [85][2800/3239]	Time 0.346 (0.667)	Data Time 0.001 (0.132)	Loss 2.4664 (2.4555)	Entropy 0.58088 (0.58304)	Top-1 acc 63.672 (64.816)	Top-5 acc 85.547 (84.553)	lr 0.00493
Train [85][2810/3239]	Time 2.489 (0.667)	Data Time 2.255 (0.133)	Loss 2.6285 (2.4559)	Entropy 0.58088 (0.58304)	Top-1 acc 61.719 (64.807)	Top-5 acc 81.250 (84.547)	lr 0.00492
Train [85][2820/3239]	Time 0.268 (0.669)	Data Time 0.002 (0.135)	Loss 2.6333 (2.4560)	Entropy 0.58085 (0.58303)	Top-1 acc 58.984 (64.801)	Top-5 acc 82.031 (84.544)	lr 0.00492
Train [85][2830/3239]	Time 0.251 (0.668)	Data Time 0.001 (0.135)	Loss 2.4500 (2.4558)	Entropy 0.58075 (0.58302)	Top-1 acc 67.578 (64.810)	Top-5 acc 83.203 (84.546)	lr 0.00492
Train [85][2840/3239]	Time 0.282 (0.668)	Data Time 0.001 (0.134)	Loss 2.3625 (2.4559)	Entropy 0.58066 (0.58301)	Top-1 acc 65.625 (64.812)	Top-5 acc 84.766 (84.542)	lr 0.00492
Train [85][2850/3239]	Time 0.248 (0.670)	Data Time 0.002 (0.137)	Loss 2.5811 (2.4560)	Entropy 0.58043 (0.58300)	Top-1 acc 62.891 (64.810)	Top-5 acc 80.469 (84.538)	lr 0.00492
Train [85][2860/3239]	Time 0.247 (0.669)	Data Time 0.001 (0.137)	Loss 2.3347 (2.4561)	Entropy 0.58050 (0.58300)	Top-1 acc 71.094 (64.808)	Top-5 acc 86.328 (84.539)	lr 0.00492
Train [85][2870/3239]	Time 0.262 (0.668)	Data Time 0.002 (0.136)	Loss 2.4774 (2.4561)	Entropy 0.58032 (0.58299)	Top-1 acc 64.453 (64.806)	Top-5 acc 84.375 (84.536)	lr 0.00492
Train [85][2880/3239]	Time 0.231 (0.670)	Data Time 0.001 (0.138)	Loss 2.4305 (2.4560)	Entropy 0.58064 (0.58298)	Top-1 acc 65.625 (64.806)	Top-5 acc 83.594 (84.540)	lr 0.00492
Train [85][2890/3239]	Time 0.348 (0.670)	Data Time 0.001 (0.138)	Loss 2.3587 (2.4559)	Entropy 0.58075 (0.58297)	Top-1 acc 65.625 (64.807)	Top-5 acc 85.938 (84.540)	lr 0.00492
Train [85][2900/3239]	Time 0.237 (0.669)	Data Time 0.001 (0.137)	Loss 2.5181 (2.4558)	Entropy 0.58073 (0.58296)	Top-1 acc 62.109 (64.810)	Top-5 acc 85.156 (84.544)	lr 0.00492
Train [85][2910/3239]	Time 0.286 (0.690)	Data Time 0.006 (0.140)	Loss 2.3048 (2.4559)	Entropy 0.58073 (0.58295)	Top-1 acc 69.141 (64.806)	Top-5 acc 86.328 (84.544)	lr 0.00492
Train [85][2920/3239]	Time 0.241 (0.689)	Data Time 0.002 (0.140)	Loss 2.4080 (2.4558)	Entropy 0.58085 (0.58295)	Top-1 acc 67.188 (64.808)	Top-5 acc 85.156 (84.550)	lr 0.00492
Train [85][2930/3239]	Time 0.231 (0.688)	Data Time 0.001 (0.139)	Loss 2.3402 (2.4560)	Entropy 0.58128 (0.58294)	Top-1 acc 69.922 (64.806)	Top-5 acc 89.062 (84.548)	lr 0.00492
Train [85][2940/3239]	Time 0.269 (0.687)	Data Time 0.002 (0.139)	Loss 2.4381 (2.4560)	Entropy 0.58120 (0.58293)	Top-1 acc 64.844 (64.807)	Top-5 acc 85.938 (84.547)	lr 0.00491
Train [85][2950/3239]	Time 0.262 (0.687)	Data Time 0.001 (0.138)	Loss 2.3060 (2.4557)	Entropy 0.58101 (0.58293)	Top-1 acc 66.406 (64.810)	Top-5 acc 86.719 (84.551)	lr 0.00491
Train [85][2960/3239]	Time 0.304 (0.686)	Data Time 0.002 (0.138)	Loss 2.4502 (2.4556)	Entropy 0.58114 (0.58292)	Top-1 acc 64.844 (64.814)	Top-5 acc 84.766 (84.556)	lr 0.00491
Train [85][2970/3239]	Time 0.246 (0.685)	Data Time 0.002 (0.138)	Loss 2.4608 (2.4557)	Entropy 0.58099 (0.58292)	Top-1 acc 60.938 (64.806)	Top-5 acc 84.375 (84.552)	lr 0.00491
Train [85][2980/3239]	Time 0.253 (0.685)	Data Time 0.001 (0.137)	Loss 2.3750 (2.4556)	Entropy 0.58105 (0.58291)	Top-1 acc 68.359 (64.807)	Top-5 acc 87.109 (84.554)	lr 0.00491
Train [85][2990/3239]	Time 0.266 (0.684)	Data Time 0.001 (0.137)	Loss 2.5038 (2.4554)	Entropy 0.58077 (0.58290)	Top-1 acc 63.672 (64.810)	Top-5 acc 84.766 (84.556)	lr 0.00491
Train [85][3000/3239]	Time 0.275 (0.683)	Data Time 0.001 (0.136)	Loss 2.7223 (2.4555)	Entropy 0.58061 (0.58289)	Top-1 acc 57.031 (64.808)	Top-5 acc 82.031 (84.556)	lr 0.00491
Train [85][3010/3239]	Time 0.254 (0.682)	Data Time 0.002 (0.136)	Loss 2.5396 (2.4555)	Entropy 0.58056 (0.58289)	Top-1 acc 60.938 (64.806)	Top-5 acc 83.594 (84.557)	lr 0.00491
Train [85][3020/3239]	Time 0.253 (0.682)	Data Time 0.001 (0.135)	Loss 2.4784 (2.4556)	Entropy 0.58049 (0.58288)	Top-1 acc 65.234 (64.804)	Top-5 acc 85.938 (84.553)	lr 0.00491
Train [85][3030/3239]	Time 0.257 (0.682)	Data Time 0.001 (0.136)	Loss 2.3873 (2.4557)	Entropy 0.58056 (0.58287)	Top-1 acc 66.016 (64.802)	Top-5 acc 85.938 (84.552)	lr 0.00491
Train [85][3040/3239]	Time 0.253 (0.681)	Data Time 0.001 (0.136)	Loss 2.5090 (2.4557)	Entropy 0.58032 (0.58286)	Top-1 acc 62.109 (64.802)	Top-5 acc 83.594 (84.552)	lr 0.00491
Train [85][3050/3239]	Time 0.373 (0.682)	Data Time 0.001 (0.137)	Loss 2.5185 (2.4558)	Entropy 0.58047 (0.58286)	Top-1 acc 62.891 (64.803)	Top-5 acc 86.328 (84.553)	lr 0.00491
Train [85][3060/3239]	Time 0.278 (0.682)	Data Time 0.002 (0.137)	Loss 2.6175 (2.4559)	Entropy 0.58041 (0.58285)	Top-1 acc 62.109 (64.801)	Top-5 acc 81.641 (84.554)	lr 0.00490
Train [85][3070/3239]	Time 0.257 (0.682)	Data Time 0.001 (0.137)	Loss 2.5117 (2.4559)	Entropy 0.57979 (0.58284)	Top-1 acc 62.891 (64.798)	Top-5 acc 84.375 (84.556)	lr 0.00490
Train [85][3080/3239]	Time 2.879 (0.682)	Data Time 2.531 (0.138)	Loss 2.4879 (2.4559)	Entropy 0.58000 (0.58283)	Top-1 acc 62.891 (64.798)	Top-5 acc 84.375 (84.556)	lr 0.00490
Train [85][3090/3239]	Time 0.274 (0.683)	Data Time 0.001 (0.139)	Loss 2.3452 (2.4556)	Entropy 0.58015 (0.58282)	Top-1 acc 67.578 (64.805)	Top-5 acc 88.672 (84.560)	lr 0.00490
Train [85][3100/3239]	Time 0.242 (0.683)	Data Time 0.001 (0.139)	Loss 2.5596 (2.4556)	Entropy 0.57991 (0.58281)	Top-1 acc 61.328 (64.805)	Top-5 acc 83.203 (84.562)	lr 0.00490
Train [85][3110/3239]	Time 0.247 (0.682)	Data Time 0.001 (0.139)	Loss 2.4298 (2.4556)	Entropy 0.57999 (0.58280)	Top-1 acc 64.062 (64.808)	Top-5 acc 85.156 (84.563)	lr 0.00490
Train [85][3120/3239]	Time 0.366 (0.683)	Data Time 0.001 (0.139)	Loss 2.8135 (2.4555)	Entropy 0.58002 (0.58279)	Top-1 acc 57.812 (64.811)	Top-5 acc 80.469 (84.566)	lr 0.00490
Train [85][3130/3239]	Time 0.262 (0.684)	Data Time 0.001 (0.141)	Loss 2.6810 (2.4556)	Entropy 0.57994 (0.58278)	Top-1 acc 59.766 (64.808)	Top-5 acc 80.078 (84.563)	lr 0.00490
Train [85][3140/3239]	Time 0.237 (0.683)	Data Time 0.001 (0.140)	Loss 2.5712 (2.4557)	Entropy 0.57964 (0.58277)	Top-1 acc 67.188 (64.806)	Top-5 acc 81.250 (84.560)	lr 0.00490
Train [85][3150/3239]	Time 0.234 (0.683)	Data Time 0.001 (0.141)	Loss 2.2819 (2.4555)	Entropy 0.57912 (0.58276)	Top-1 acc 67.578 (64.807)	Top-5 acc 87.500 (84.562)	lr 0.00490
Train [85][3160/3239]	Time 0.244 (0.683)	Data Time 0.001 (0.142)	Loss 2.4077 (2.4555)	Entropy 0.57949 (0.58275)	Top-1 acc 60.156 (64.809)	Top-5 acc 87.109 (84.562)	lr 0.00490
Train [85][3170/3239]	Time 0.299 (0.684)	Data Time 0.001 (0.142)	Loss 2.4429 (2.4554)	Entropy 0.57972 (0.58274)	Top-1 acc 66.797 (64.812)	Top-5 acc 83.984 (84.564)	lr 0.00490
Train [85][3180/3239]	Time 0.242 (0.683)	Data Time 0.000 (0.142)	Loss 2.5311 (2.4553)	Entropy 0.57972 (0.58273)	Top-1 acc 62.891 (64.816)	Top-5 acc 84.375 (84.564)	lr 0.00490
Train [85][3190/3239]	Time 0.260 (0.684)	Data Time 0.000 (0.143)	Loss 2.6913 (2.4553)	Entropy 0.57991 (0.58272)	Top-1 acc 60.938 (64.821)	Top-5 acc 80.469 (84.566)	lr 0.00489
Train [85][3200/3239]	Time 0.251 (0.684)	Data Time 0.000 (0.143)	Loss 2.3904 (2.4553)	Entropy 0.58009 (0.58272)	Top-1 acc 62.891 (64.820)	Top-5 acc 86.719 (84.567)	lr 0.00489
Train [85][3210/3239]	Time 0.364 (0.685)	Data Time 0.000 (0.144)	Loss 2.3565 (2.4554)	Entropy 0.58011 (0.58271)	Top-1 acc 63.672 (64.816)	Top-5 acc 88.281 (84.565)	lr 0.00489
Train [85][3220/3239]	Time 0.255 (0.685)	Data Time 0.000 (0.144)	Loss 2.3155 (2.4554)	Entropy 0.58032 (0.58270)	Top-1 acc 68.750 (64.816)	Top-5 acc 85.547 (84.563)	lr 0.00489
Train [85][3230/3239]	Time 0.236 (0.684)	Data Time 0.000 (0.144)	Loss 2.3696 (2.4553)	Entropy 0.58054 (0.58269)	Top-1 acc 65.625 (64.819)	Top-5 acc 87.109 (84.567)	lr 0.00489
Train [85][3239/3239]	Time 0.955 (0.683)	Data Time 0.000 (0.144)	Loss 2.4127 (2.4552)	Entropy 0.58036 (0.58269)	Top-1 acc 69.136 (64.821)	Top-5 acc 83.951 (84.569)	lr 0.00489
==========Valid [85/120]	loss 1.257	top-1 acc 71.030 (71.030)	top-5 acc 89.742	Train top-1 64.821	top-5 84.569	Entropy 0.58036	Latency-None: 0.000ms	Flops: 539.00M
Train [86][0/3239]	Time 44.533 (44.533)	Data Time 41.906 (41.906)	Loss 2.3714 (2.3714)	Entropy 0.58049 (0.58049)	Top-1 acc 69.531 (69.531)	Top-5 acc 86.719 (86.719)	lr 0.00489
Train [86][10/3239]	Time 0.312 (4.573)	Data Time 0.002 (3.877)	Loss 2.4559 (2.4764)	Entropy 0.58043 (0.58053)	Top-1 acc 63.672 (64.098)	Top-5 acc 87.109 (84.659)	lr 0.00489
Train [86][20/3239]	Time 0.243 (2.611)	Data Time 0.001 (2.032)	Loss 2.5799 (2.4565)	Entropy 0.58044 (0.58049)	Top-1 acc 62.500 (64.639)	Top-5 acc 81.641 (84.896)	lr 0.00489
Train [86][30/3239]	Time 0.272 (1.909)	Data Time 0.001 (1.377)	Loss 2.2915 (2.4329)	Entropy 0.58077 (0.58050)	Top-1 acc 71.484 (65.323)	Top-5 acc 87.109 (85.207)	lr 0.00489
Train [86][40/3239]	Time 0.261 (1.545)	Data Time 0.001 (1.041)	Loss 2.3388 (2.4307)	Entropy 0.58074 (0.58059)	Top-1 acc 66.797 (65.406)	Top-5 acc 86.719 (85.204)	lr 0.00489
Train [86][50/3239]	Time 0.238 (1.324)	Data Time 0.001 (0.837)	Loss 2.5001 (2.4412)	Entropy 0.58049 (0.58063)	Top-1 acc 63.281 (65.089)	Top-5 acc 84.766 (84.888)	lr 0.00489
Train [86][60/3239]	Time 0.228 (1.173)	Data Time 0.001 (0.700)	Loss 2.5418 (2.4431)	Entropy 0.58029 (0.58059)	Top-1 acc 62.109 (64.946)	Top-5 acc 83.984 (84.926)	lr 0.00489
Train [86][70/3239]	Time 0.226 (1.064)	Data Time 0.001 (0.602)	Loss 2.5785 (2.4429)	Entropy 0.58022 (0.58054)	Top-1 acc 62.500 (64.899)	Top-5 acc 81.641 (84.931)	lr 0.00488
Train [86][80/3239]	Time 0.224 (0.983)	Data Time 0.001 (0.528)	Loss 2.5899 (2.4430)	Entropy 0.58031 (0.58051)	Top-1 acc 63.281 (64.935)	Top-5 acc 82.031 (84.939)	lr 0.00488
Train [86][90/3239]	Time 0.228 (0.922)	Data Time 0.001 (0.470)	Loss 2.5386 (2.4425)	Entropy 0.58005 (0.58047)	Top-1 acc 64.844 (65.106)	Top-5 acc 81.641 (84.907)	lr 0.00488
Train [86][100/3239]	Time 0.240 (0.872)	Data Time 0.001 (0.424)	Loss 2.3221 (2.4376)	Entropy 0.58009 (0.58043)	Top-1 acc 69.141 (65.300)	Top-5 acc 85.156 (84.944)	lr 0.00488
Train [86][110/3239]	Time 0.339 (0.831)	Data Time 0.001 (0.386)	Loss 2.5627 (2.4344)	Entropy 0.57973 (0.58039)	Top-1 acc 59.766 (65.358)	Top-5 acc 82.031 (84.991)	lr 0.00488
Train [86][120/3239]	Time 0.306 (0.800)	Data Time 0.040 (0.354)	Loss 2.3925 (2.4322)	Entropy 0.57990 (0.58034)	Top-1 acc 65.234 (65.438)	Top-5 acc 85.156 (84.998)	lr 0.00488
Train [86][130/3239]	Time 0.282 (0.776)	Data Time 0.002 (0.327)	Loss 2.6557 (2.4383)	Entropy 0.57998 (0.58030)	Top-1 acc 61.719 (65.330)	Top-5 acc 79.297 (84.813)	lr 0.00488
Train [86][140/3239]	Time 0.262 (0.760)	Data Time 0.001 (0.304)	Loss 2.3951 (2.4382)	Entropy 0.58002 (0.58029)	Top-1 acc 66.406 (65.304)	Top-5 acc 84.766 (84.824)	lr 0.00488
Train [86][150/3239]	Time 0.235 (0.736)	Data Time 0.001 (0.284)	Loss 2.3981 (2.4410)	Entropy 0.58008 (0.58028)	Top-1 acc 65.625 (65.221)	Top-5 acc 86.328 (84.760)	lr 0.00488
Train [86][160/3239]	Time 0.234 (0.717)	Data Time 0.001 (0.267)	Loss 2.3484 (2.4419)	Entropy 0.57983 (0.58027)	Top-1 acc 68.359 (65.205)	Top-5 acc 84.766 (84.753)	lr 0.00488
Train [86][170/3239]	Time 0.246 (0.700)	Data Time 0.001 (0.251)	Loss 2.6888 (2.4407)	Entropy 0.58010 (0.58025)	Top-1 acc 60.156 (65.216)	Top-5 acc 79.297 (84.779)	lr 0.00488
Train [86][180/3239]	Time 0.337 (0.686)	Data Time 0.001 (0.237)	Loss 2.4451 (2.4394)	Entropy 0.57979 (0.58023)	Top-1 acc 66.797 (65.278)	Top-5 acc 86.328 (84.837)	lr 0.00488
Train [86][190/3239]	Time 0.268 (0.672)	Data Time 0.001 (0.225)	Loss 2.4170 (2.4387)	Entropy 0.57986 (0.58021)	Top-1 acc 67.188 (65.292)	Top-5 acc 84.375 (84.860)	lr 0.00488
Train [86][200/3239]	Time 0.226 (0.659)	Data Time 0.001 (0.214)	Loss 2.3961 (2.4365)	Entropy 0.57863 (0.58017)	Top-1 acc 65.625 (65.337)	Top-5 acc 87.109 (84.915)	lr 0.00487
Train [86][210/3239]	Time 0.263 (0.649)	Data Time 0.001 (0.204)	Loss 2.2638 (2.4356)	Entropy 0.57849 (0.58010)	Top-1 acc 66.797 (65.388)	Top-5 acc 88.281 (84.930)	lr 0.00487
Train [86][220/3239]	Time 0.232 (0.637)	Data Time 0.001 (0.195)	Loss 2.4117 (2.4381)	Entropy 0.57860 (0.58002)	Top-1 acc 66.797 (65.321)	Top-5 acc 85.938 (84.889)	lr 0.00487
Train [86][230/3239]	Time 0.279 (0.628)	Data Time 0.001 (0.186)	Loss 2.1795 (2.4394)	Entropy 0.57873 (0.57996)	Top-1 acc 71.875 (65.273)	Top-5 acc 91.016 (84.899)	lr 0.00487
Train [86][240/3239]	Time 0.231 (0.620)	Data Time 0.001 (0.179)	Loss 2.5848 (2.4408)	Entropy 0.57857 (0.57991)	Top-1 acc 62.891 (65.225)	Top-5 acc 82.422 (84.897)	lr 0.00487
Train [86][250/3239]	Time 0.237 (0.612)	Data Time 0.001 (0.172)	Loss 2.4733 (2.4420)	Entropy 0.57853 (0.57985)	Top-1 acc 61.328 (65.197)	Top-5 acc 85.938 (84.876)	lr 0.00487
Train [86][260/3239]	Time 0.240 (0.605)	Data Time 0.001 (0.165)	Loss 2.4302 (2.4451)	Entropy 0.57901 (0.57981)	Top-1 acc 64.844 (65.079)	Top-5 acc 84.375 (84.799)	lr 0.00487
Train [86][270/3239]	Time 0.455 (0.599)	Data Time 0.001 (0.159)	Loss 2.4244 (2.4443)	Entropy 0.57850 (0.57977)	Top-1 acc 65.234 (65.076)	Top-5 acc 85.547 (84.820)	lr 0.00487
Train [86][280/3239]	Time 0.265 (0.593)	Data Time 0.001 (0.153)	Loss 2.3662 (2.4440)	Entropy 0.57855 (0.57973)	Top-1 acc 65.625 (65.090)	Top-5 acc 88.672 (84.838)	lr 0.00487
Train [86][290/3239]	Time 0.253 (0.587)	Data Time 0.001 (0.148)	Loss 2.1763 (2.4451)	Entropy 0.57842 (0.57969)	Top-1 acc 70.703 (65.057)	Top-5 acc 89.844 (84.809)	lr 0.00487
Train [86][300/3239]	Time 0.276 (0.582)	Data Time 0.001 (0.143)	Loss 2.5326 (2.4465)	Entropy 0.57834 (0.57965)	Top-1 acc 61.719 (65.022)	Top-5 acc 83.594 (84.801)	lr 0.00487
Train [86][310/3239]	Time 0.237 (0.577)	Data Time 0.001 (0.139)	Loss 2.2926 (2.4444)	Entropy 0.57781 (0.57960)	Top-1 acc 66.797 (65.060)	Top-5 acc 86.328 (84.833)	lr 0.00487
Train [86][320/3239]	Time 0.256 (0.572)	Data Time 0.001 (0.135)	Loss 2.5440 (2.4442)	Entropy 0.57798 (0.57955)	Top-1 acc 64.844 (65.076)	Top-5 acc 83.594 (84.822)	lr 0.00486
Train [86][330/3239]	Time 0.307 (0.726)	Data Time 0.002 (0.131)	Loss 2.8444 (2.4466)	Entropy 0.57796 (0.57950)	Top-1 acc 56.641 (65.025)	Top-5 acc 82.422 (84.788)	lr 0.00486
Train [86][340/3239]	Time 0.360 (0.718)	Data Time 0.002 (0.127)	Loss 2.5896 (2.4454)	Entropy 0.57805 (0.57945)	Top-1 acc 57.812 (65.055)	Top-5 acc 85.156 (84.795)	lr 0.00486
Train [86][350/3239]	Time 0.261 (0.709)	Data Time 0.001 (0.123)	Loss 2.5853 (2.4463)	Entropy 0.57779 (0.57941)	Top-1 acc 57.812 (65.002)	Top-5 acc 82.422 (84.773)	lr 0.00486
Train [86][360/3239]	Time 0.267 (0.701)	Data Time 0.002 (0.120)	Loss 2.4144 (2.4457)	Entropy 0.57783 (0.57937)	Top-1 acc 66.016 (65.013)	Top-5 acc 83.984 (84.769)	lr 0.00486
Train [86][370/3239]	Time 0.234 (0.694)	Data Time 0.002 (0.117)	Loss 2.3929 (2.4443)	Entropy 0.57732 (0.57932)	Top-1 acc 68.359 (65.067)	Top-5 acc 85.547 (84.787)	lr 0.00486
Train [86][380/3239]	Time 0.229 (0.687)	Data Time 0.001 (0.114)	Loss 2.5844 (2.4446)	Entropy 0.57683 (0.57926)	Top-1 acc 60.938 (65.069)	Top-5 acc 82.812 (84.781)	lr 0.00486
Train [86][390/3239]	Time 0.252 (0.681)	Data Time 0.002 (0.111)	Loss 2.4827 (2.4439)	Entropy 0.57698 (0.57920)	Top-1 acc 63.281 (65.088)	Top-5 acc 82.812 (84.793)	lr 0.00486
Train [86][400/3239]	Time 0.245 (0.675)	Data Time 0.001 (0.108)	Loss 2.4468 (2.4429)	Entropy 0.57706 (0.57914)	Top-1 acc 65.234 (65.098)	Top-5 acc 84.766 (84.810)	lr 0.00486
Train [86][410/3239]	Time 0.281 (0.670)	Data Time 0.001 (0.106)	Loss 2.3971 (2.4432)	Entropy 0.57720 (0.57909)	Top-1 acc 66.406 (65.107)	Top-5 acc 86.328 (84.798)	lr 0.00486
Train [86][420/3239]	Time 0.257 (0.664)	Data Time 0.001 (0.103)	Loss 2.3411 (2.4446)	Entropy 0.57684 (0.57904)	Top-1 acc 68.359 (65.097)	Top-5 acc 85.156 (84.767)	lr 0.00486
Train [86][430/3239]	Time 0.338 (0.659)	Data Time 0.002 (0.101)	Loss 2.4944 (2.4444)	Entropy 0.57692 (0.57899)	Top-1 acc 62.109 (65.109)	Top-5 acc 83.203 (84.743)	lr 0.00486
Train [86][440/3239]	Time 0.289 (0.655)	Data Time 0.002 (0.099)	Loss 2.4101 (2.4444)	Entropy 0.57703 (0.57895)	Top-1 acc 65.625 (65.108)	Top-5 acc 84.766 (84.728)	lr 0.00486
Train [86][450/3239]	Time 0.238 (0.650)	Data Time 0.001 (0.096)	Loss 2.5642 (2.4455)	Entropy 0.57681 (0.57890)	Top-1 acc 62.109 (65.073)	Top-5 acc 84.375 (84.725)	lr 0.00485
Train [86][460/3239]	Time 0.236 (0.646)	Data Time 0.001 (0.094)	Loss 2.4801 (2.4448)	Entropy 0.57693 (0.57886)	Top-1 acc 64.062 (65.085)	Top-5 acc 84.766 (84.743)	lr 0.00485
Train [86][470/3239]	Time 0.218 (0.641)	Data Time 0.001 (0.092)	Loss 2.3289 (2.4442)	Entropy 0.57673 (0.57881)	Top-1 acc 67.578 (65.093)	Top-5 acc 87.109 (84.750)	lr 0.00485
Train [86][480/3239]	Time 0.234 (0.637)	Data Time 0.002 (0.091)	Loss 2.4053 (2.4458)	Entropy 0.57692 (0.57877)	Top-1 acc 66.406 (65.058)	Top-5 acc 84.766 (84.727)	lr 0.00485
Train [86][490/3239]	Time 0.245 (0.633)	Data Time 0.001 (0.089)	Loss 2.4659 (2.4458)	Entropy 0.57690 (0.57874)	Top-1 acc 64.844 (65.080)	Top-5 acc 84.375 (84.737)	lr 0.00485
Train [86][500/3239]	Time 0.340 (0.629)	Data Time 0.001 (0.087)	Loss 2.5924 (2.4457)	Entropy 0.57706 (0.57870)	Top-1 acc 62.109 (65.095)	Top-5 acc 81.250 (84.725)	lr 0.00485
Train [86][510/3239]	Time 0.237 (0.625)	Data Time 0.001 (0.085)	Loss 2.4506 (2.4450)	Entropy 0.57704 (0.57867)	Top-1 acc 67.188 (65.117)	Top-5 acc 85.938 (84.738)	lr 0.00485
Train [86][520/3239]	Time 0.295 (0.623)	Data Time 0.002 (0.084)	Loss 2.5076 (2.4442)	Entropy 0.57682 (0.57863)	Top-1 acc 67.188 (65.140)	Top-5 acc 82.422 (84.753)	lr 0.00485
Train [86][530/3239]	Time 0.226 (0.620)	Data Time 0.001 (0.082)	Loss 2.4604 (2.4438)	Entropy 0.57688 (0.57860)	Top-1 acc 62.891 (65.144)	Top-5 acc 84.766 (84.749)	lr 0.00485
Train [86][540/3239]	Time 0.247 (0.616)	Data Time 0.001 (0.081)	Loss 2.4984 (2.4439)	Entropy 0.57700 (0.57857)	Top-1 acc 62.109 (65.140)	Top-5 acc 82.422 (84.737)	lr 0.00485
Train [86][550/3239]	Time 0.286 (0.613)	Data Time 0.002 (0.079)	Loss 2.3940 (2.4420)	Entropy 0.57705 (0.57854)	Top-1 acc 67.188 (65.178)	Top-5 acc 85.547 (84.761)	lr 0.00485
Train [86][560/3239]	Time 0.236 (0.610)	Data Time 0.001 (0.078)	Loss 2.5232 (2.4426)	Entropy 0.57704 (0.57851)	Top-1 acc 64.062 (65.167)	Top-5 acc 83.594 (84.757)	lr 0.00485
Train [86][570/3239]	Time 0.249 (0.607)	Data Time 0.001 (0.077)	Loss 2.3811 (2.4425)	Entropy 0.57699 (0.57848)	Top-1 acc 66.797 (65.180)	Top-5 acc 84.766 (84.757)	lr 0.00484
Train [86][580/3239]	Time 0.237 (0.603)	Data Time 0.001 (0.075)	Loss 2.4342 (2.4422)	Entropy 0.57685 (0.57846)	Top-1 acc 63.281 (65.187)	Top-5 acc 86.328 (84.763)	lr 0.00484
Train [86][590/3239]	Time 0.338 (0.600)	Data Time 0.001 (0.074)	Loss 2.3336 (2.4425)	Entropy 0.57700 (0.57843)	Top-1 acc 66.797 (65.181)	Top-5 acc 87.891 (84.763)	lr 0.00484
Train [86][600/3239]	Time 0.226 (0.598)	Data Time 0.001 (0.073)	Loss 2.4352 (2.4428)	Entropy 0.57713 (0.57841)	Top-1 acc 66.016 (65.162)	Top-5 acc 85.938 (84.752)	lr 0.00484
Train [86][610/3239]	Time 0.238 (0.595)	Data Time 0.001 (0.072)	Loss 2.3973 (2.4420)	Entropy 0.57709 (0.57839)	Top-1 acc 66.406 (65.185)	Top-5 acc 86.328 (84.766)	lr 0.00484
Train [86][620/3239]	Time 0.230 (0.592)	Data Time 0.001 (0.070)	Loss 2.3170 (2.4415)	Entropy 0.57760 (0.57837)	Top-1 acc 68.750 (65.196)	Top-5 acc 86.719 (84.779)	lr 0.00484
Train [86][630/3239]	Time 0.273 (0.590)	Data Time 0.001 (0.069)	Loss 2.5542 (2.4413)	Entropy 0.57770 (0.57836)	Top-1 acc 63.672 (65.207)	Top-5 acc 84.375 (84.787)	lr 0.00484
Train [86][640/3239]	Time 0.251 (0.587)	Data Time 0.001 (0.068)	Loss 2.2951 (2.4414)	Entropy 0.57806 (0.57835)	Top-1 acc 66.406 (65.205)	Top-5 acc 88.281 (84.792)	lr 0.00484
Train [86][650/3239]	Time 0.234 (0.585)	Data Time 0.001 (0.067)	Loss 2.3971 (2.4405)	Entropy 0.57784 (0.57834)	Top-1 acc 65.234 (65.223)	Top-5 acc 85.938 (84.806)	lr 0.00484
Train [86][660/3239]	Time 0.330 (0.582)	Data Time 0.001 (0.066)	Loss 2.2874 (2.4412)	Entropy 0.57780 (0.57833)	Top-1 acc 66.797 (65.197)	Top-5 acc 87.109 (84.790)	lr 0.00484
Train [86][670/3239]	Time 0.271 (0.580)	Data Time 0.003 (0.065)	Loss 2.2904 (2.4408)	Entropy 0.57766 (0.57832)	Top-1 acc 67.188 (65.213)	Top-5 acc 87.109 (84.801)	lr 0.00484
Train [86][680/3239]	Time 0.260 (0.577)	Data Time 0.001 (0.064)	Loss 2.2582 (2.4408)	Entropy 0.57786 (0.57832)	Top-1 acc 68.359 (65.214)	Top-5 acc 86.328 (84.802)	lr 0.00484
Train [86][690/3239]	Time 0.232 (0.575)	Data Time 0.001 (0.064)	Loss 2.3225 (2.4412)	Entropy 0.57793 (0.57831)	Top-1 acc 65.234 (65.193)	Top-5 acc 85.938 (84.792)	lr 0.00484
Train [86][700/3239]	Time 0.237 (0.573)	Data Time 0.001 (0.063)	Loss 2.3986 (2.4402)	Entropy 0.57751 (0.57830)	Top-1 acc 68.750 (65.209)	Top-5 acc 84.375 (84.815)	lr 0.00483
Train [86][710/3239]	Time 0.231 (0.571)	Data Time 0.001 (0.062)	Loss 2.2281 (2.4400)	Entropy 0.57707 (0.57829)	Top-1 acc 69.531 (65.204)	Top-5 acc 88.672 (84.815)	lr 0.00483
Train [86][720/3239]	Time 0.238 (0.568)	Data Time 0.001 (0.061)	Loss 2.5346 (2.4402)	Entropy 0.57715 (0.57827)	Top-1 acc 66.406 (65.203)	Top-5 acc 83.203 (84.815)	lr 0.00483
Train [86][730/3239]	Time 0.234 (0.566)	Data Time 0.001 (0.060)	Loss 2.4054 (2.4400)	Entropy 0.57746 (0.57826)	Top-1 acc 63.672 (65.204)	Top-5 acc 83.203 (84.809)	lr 0.00483
Train [86][740/3239]	Time 0.225 (0.564)	Data Time 0.001 (0.059)	Loss 2.5688 (2.4397)	Entropy 0.57725 (0.57824)	Top-1 acc 62.891 (65.222)	Top-5 acc 80.469 (84.804)	lr 0.00483
Train [86][750/3239]	Time 0.234 (0.562)	Data Time 0.001 (0.059)	Loss 2.2744 (2.4394)	Entropy 0.57765 (0.57823)	Top-1 acc 69.922 (65.212)	Top-5 acc 87.109 (84.812)	lr 0.00483
Train [86][760/3239]	Time 0.280 (0.560)	Data Time 0.001 (0.058)	Loss 2.4813 (2.4398)	Entropy 0.57771 (0.57822)	Top-1 acc 62.891 (65.190)	Top-5 acc 86.719 (84.809)	lr 0.00483
Train [86][770/3239]	Time 0.228 (0.558)	Data Time 0.001 (0.057)	Loss 2.1045 (2.4393)	Entropy 0.57705 (0.57821)	Top-1 acc 70.703 (65.193)	Top-5 acc 92.578 (84.826)	lr 0.00483
Train [86][780/3239]	Time 0.261 (0.557)	Data Time 0.002 (0.056)	Loss 2.3434 (2.4384)	Entropy 0.57699 (0.57820)	Top-1 acc 66.406 (65.201)	Top-5 acc 85.547 (84.834)	lr 0.00483
Train [86][790/3239]	Time 0.332 (0.555)	Data Time 0.002 (0.056)	Loss 2.3721 (2.4387)	Entropy 0.57700 (0.57818)	Top-1 acc 65.234 (65.204)	Top-5 acc 83.594 (84.825)	lr 0.00483
Train [86][800/3239]	Time 0.249 (0.554)	Data Time 0.001 (0.055)	Loss 2.6040 (2.4391)	Entropy 0.57691 (0.57817)	Top-1 acc 60.547 (65.193)	Top-5 acc 80.469 (84.808)	lr 0.00483
Train [86][810/3239]	Time 0.236 (0.552)	Data Time 0.001 (0.054)	Loss 2.3768 (2.4395)	Entropy 0.57698 (0.57815)	Top-1 acc 66.016 (65.179)	Top-5 acc 84.375 (84.804)	lr 0.00483
Train [86][820/3239]	Time 0.334 (0.550)	Data Time 0.001 (0.054)	Loss 2.4487 (2.4390)	Entropy 0.57718 (0.57814)	Top-1 acc 63.672 (65.186)	Top-5 acc 83.203 (84.809)	lr 0.00482
Train [86][830/3239]	Time 0.259 (0.549)	Data Time 0.002 (0.053)	Loss 2.2314 (2.4390)	Entropy 0.57677 (0.57813)	Top-1 acc 68.359 (65.199)	Top-5 acc 88.672 (84.807)	lr 0.00482
Train [86][840/3239]	Time 0.283 (0.548)	Data Time 0.002 (0.053)	Loss 2.3831 (2.4396)	Entropy 0.57684 (0.57811)	Top-1 acc 65.234 (65.180)	Top-5 acc 86.328 (84.797)	lr 0.00482
Train [86][850/3239]	Time 0.220 (0.547)	Data Time 0.001 (0.052)	Loss 2.4411 (2.4399)	Entropy 0.57674 (0.57810)	Top-1 acc 67.969 (65.169)	Top-5 acc 85.938 (84.795)	lr 0.00482
Train [86][860/3239]	Time 0.286 (0.545)	Data Time 0.002 (0.051)	Loss 2.5276 (2.4404)	Entropy 0.57677 (0.57808)	Top-1 acc 63.672 (65.149)	Top-5 acc 82.031 (84.786)	lr 0.00482
Train [86][870/3239]	Time 0.239 (0.544)	Data Time 0.001 (0.051)	Loss 2.3151 (2.4399)	Entropy 0.57698 (0.57807)	Top-1 acc 68.750 (65.167)	Top-5 acc 85.938 (84.792)	lr 0.00482
Train [86][880/3239]	Time 0.235 (0.542)	Data Time 0.001 (0.050)	Loss 2.4664 (2.4398)	Entropy 0.57691 (0.57805)	Top-1 acc 64.062 (65.169)	Top-5 acc 83.594 (84.799)	lr 0.00482
Train [86][890/3239]	Time 0.353 (0.541)	Data Time 0.001 (0.050)	Loss 2.4729 (2.4399)	Entropy 0.57706 (0.57804)	Top-1 acc 67.188 (65.169)	Top-5 acc 84.766 (84.793)	lr 0.00482
Train [86][900/3239]	Time 0.230 (0.539)	Data Time 0.001 (0.049)	Loss 2.4943 (2.4404)	Entropy 0.57716 (0.57803)	Top-1 acc 62.500 (65.145)	Top-5 acc 83.984 (84.780)	lr 0.00482
Train [86][910/3239]	Time 0.235 (0.538)	Data Time 0.001 (0.049)	Loss 2.6130 (2.4408)	Entropy 0.57737 (0.57802)	Top-1 acc 57.422 (65.143)	Top-5 acc 79.688 (84.766)	lr 0.00482
Train [86][920/3239]	Time 0.245 (0.537)	Data Time 0.001 (0.048)	Loss 2.3388 (2.4399)	Entropy 0.57755 (0.57802)	Top-1 acc 68.359 (65.171)	Top-5 acc 89.062 (84.782)	lr 0.00482
Train [86][930/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.048)	Loss 2.4013 (2.4395)	Entropy 0.57764 (0.57801)	Top-1 acc 65.625 (65.174)	Top-5 acc 85.938 (84.789)	lr 0.00482
Train [86][940/3239]	Time 0.239 (0.534)	Data Time 0.002 (0.047)	Loss 2.3818 (2.4398)	Entropy 0.57776 (0.57801)	Top-1 acc 69.141 (65.177)	Top-5 acc 84.375 (84.782)	lr 0.00482
Train [86][950/3239]	Time 0.240 (0.533)	Data Time 0.001 (0.047)	Loss 2.4413 (2.4401)	Entropy 0.57756 (0.57800)	Top-1 acc 65.234 (65.166)	Top-5 acc 86.328 (84.781)	lr 0.00481
Train [86][960/3239]	Time 0.225 (0.532)	Data Time 0.001 (0.046)	Loss 2.6817 (2.4404)	Entropy 0.57749 (0.57800)	Top-1 acc 63.672 (65.160)	Top-5 acc 81.641 (84.779)	lr 0.00481
Train [86][970/3239]	Time 0.238 (0.531)	Data Time 0.001 (0.046)	Loss 2.3504 (2.4399)	Entropy 0.57746 (0.57799)	Top-1 acc 67.969 (65.177)	Top-5 acc 85.156 (84.779)	lr 0.00481
Train [86][980/3239]	Time 0.407 (0.585)	Data Time 0.005 (0.045)	Loss 2.2381 (2.4398)	Entropy 0.57745 (0.57799)	Top-1 acc 66.797 (65.183)	Top-5 acc 88.672 (84.780)	lr 0.00481
Train [86][990/3239]	Time 0.245 (0.583)	Data Time 0.002 (0.045)	Loss 2.4823 (2.4398)	Entropy 0.57686 (0.57798)	Top-1 acc 63.281 (65.172)	Top-5 acc 84.375 (84.779)	lr 0.00481
Train [86][1000/3239]	Time 0.231 (0.582)	Data Time 0.001 (0.044)	Loss 2.4904 (2.4397)	Entropy 0.57666 (0.57797)	Top-1 acc 62.891 (65.171)	Top-5 acc 83.594 (84.784)	lr 0.00481
Train [86][1010/3239]	Time 0.239 (0.580)	Data Time 0.001 (0.044)	Loss 2.5692 (2.4401)	Entropy 0.57646 (0.57796)	Top-1 acc 64.844 (65.153)	Top-5 acc 83.984 (84.768)	lr 0.00481
Train [86][1020/3239]	Time 0.249 (0.579)	Data Time 0.001 (0.044)	Loss 2.1963 (2.4404)	Entropy 0.57602 (0.57794)	Top-1 acc 67.188 (65.143)	Top-5 acc 89.062 (84.755)	lr 0.00481
Train [86][1030/3239]	Time 0.357 (0.578)	Data Time 0.001 (0.043)	Loss 2.2754 (2.4403)	Entropy 0.57600 (0.57792)	Top-1 acc 70.312 (65.149)	Top-5 acc 87.891 (84.759)	lr 0.00481
Train [86][1040/3239]	Time 0.272 (0.577)	Data Time 0.002 (0.043)	Loss 2.2999 (2.4409)	Entropy 0.57573 (0.57790)	Top-1 acc 69.141 (65.129)	Top-5 acc 86.719 (84.746)	lr 0.00481
Train [86][1050/3239]	Time 0.378 (0.576)	Data Time 0.001 (0.042)	Loss 2.3958 (2.4410)	Entropy 0.57595 (0.57788)	Top-1 acc 64.844 (65.142)	Top-5 acc 84.375 (84.734)	lr 0.00481
Train [86][1060/3239]	Time 0.246 (0.574)	Data Time 0.001 (0.042)	Loss 2.4949 (2.4414)	Entropy 0.57598 (0.57787)	Top-1 acc 64.062 (65.132)	Top-5 acc 82.812 (84.726)	lr 0.00481
Train [86][1070/3239]	Time 0.245 (0.573)	Data Time 0.001 (0.042)	Loss 2.4221 (2.4407)	Entropy 0.57592 (0.57785)	Top-1 acc 65.625 (65.137)	Top-5 acc 85.547 (84.743)	lr 0.00481
Train [86][1080/3239]	Time 0.238 (0.572)	Data Time 0.001 (0.041)	Loss 2.5351 (2.4404)	Entropy 0.57594 (0.57783)	Top-1 acc 58.984 (65.138)	Top-5 acc 83.203 (84.743)	lr 0.00480
Train [86][1090/3239]	Time 0.233 (0.570)	Data Time 0.001 (0.041)	Loss 2.3938 (2.4409)	Entropy 0.57562 (0.57781)	Top-1 acc 64.453 (65.114)	Top-5 acc 84.766 (84.732)	lr 0.00480
Train [86][1100/3239]	Time 0.265 (0.569)	Data Time 0.001 (0.041)	Loss 2.4741 (2.4411)	Entropy 0.57568 (0.57779)	Top-1 acc 63.672 (65.113)	Top-5 acc 85.156 (84.729)	lr 0.00480
Train [86][1110/3239]	Time 0.236 (0.568)	Data Time 0.001 (0.040)	Loss 2.3816 (2.4409)	Entropy 0.57574 (0.57777)	Top-1 acc 69.531 (65.118)	Top-5 acc 86.328 (84.729)	lr 0.00480
Train [86][1120/3239]	Time 0.262 (0.567)	Data Time 0.001 (0.040)	Loss 2.4846 (2.4412)	Entropy 0.57592 (0.57776)	Top-1 acc 63.672 (65.126)	Top-5 acc 85.156 (84.725)	lr 0.00480
Train [86][1130/3239]	Time 0.237 (0.565)	Data Time 0.001 (0.040)	Loss 2.3048 (2.4414)	Entropy 0.57577 (0.57774)	Top-1 acc 67.188 (65.119)	Top-5 acc 88.672 (84.720)	lr 0.00480
Train [86][1140/3239]	Time 0.376 (0.564)	Data Time 0.001 (0.039)	Loss 2.4948 (2.4416)	Entropy 0.57583 (0.57772)	Top-1 acc 66.797 (65.113)	Top-5 acc 81.250 (84.715)	lr 0.00480
Train [86][1150/3239]	Time 0.235 (0.563)	Data Time 0.002 (0.039)	Loss 2.4354 (2.4412)	Entropy 0.57602 (0.57771)	Top-1 acc 67.578 (65.126)	Top-5 acc 84.375 (84.718)	lr 0.00480
Train [86][1160/3239]	Time 0.280 (0.562)	Data Time 0.002 (0.039)	Loss 2.6092 (2.4409)	Entropy 0.57596 (0.57769)	Top-1 acc 59.766 (65.131)	Top-5 acc 80.469 (84.726)	lr 0.00480
Train [86][1170/3239]	Time 0.222 (0.561)	Data Time 0.001 (0.038)	Loss 2.4771 (2.4412)	Entropy 0.57570 (0.57768)	Top-1 acc 65.625 (65.126)	Top-5 acc 83.203 (84.723)	lr 0.00480
Train [86][1180/3239]	Time 0.232 (0.560)	Data Time 0.001 (0.038)	Loss 2.5083 (2.4413)	Entropy 0.57588 (0.57766)	Top-1 acc 65.234 (65.125)	Top-5 acc 82.422 (84.722)	lr 0.00480
Train [86][1190/3239]	Time 0.278 (0.559)	Data Time 0.004 (0.038)	Loss 2.4332 (2.4417)	Entropy 0.57597 (0.57764)	Top-1 acc 70.312 (65.118)	Top-5 acc 86.328 (84.713)	lr 0.00480
Train [86][1200/3239]	Time 0.233 (0.558)	Data Time 0.001 (0.037)	Loss 2.4060 (2.4415)	Entropy 0.57587 (0.57763)	Top-1 acc 65.625 (65.129)	Top-5 acc 84.375 (84.719)	lr 0.00479
Train [86][1210/3239]	Time 0.332 (0.557)	Data Time 0.001 (0.037)	Loss 2.2461 (2.4421)	Entropy 0.57597 (0.57762)	Top-1 acc 67.578 (65.117)	Top-5 acc 87.891 (84.711)	lr 0.00479
Train [86][1220/3239]	Time 0.266 (0.555)	Data Time 0.001 (0.037)	Loss 2.3566 (2.4421)	Entropy 0.57569 (0.57760)	Top-1 acc 68.359 (65.115)	Top-5 acc 86.719 (84.715)	lr 0.00479
Train [86][1230/3239]	Time 0.244 (0.554)	Data Time 0.001 (0.036)	Loss 2.5293 (2.4416)	Entropy 0.57571 (0.57759)	Top-1 acc 63.281 (65.140)	Top-5 acc 83.203 (84.725)	lr 0.00479
Train [86][1240/3239]	Time 0.228 (0.553)	Data Time 0.001 (0.036)	Loss 2.3908 (2.4418)	Entropy 0.57594 (0.57757)	Top-1 acc 67.188 (65.130)	Top-5 acc 85.938 (84.727)	lr 0.00479
Train [86][1250/3239]	Time 0.237 (0.552)	Data Time 0.003 (0.036)	Loss 2.3865 (2.4416)	Entropy 0.57603 (0.57756)	Top-1 acc 66.797 (65.138)	Top-5 acc 88.281 (84.733)	lr 0.00479
Train [86][1260/3239]	Time 0.255 (0.552)	Data Time 0.004 (0.036)	Loss 2.5982 (2.4420)	Entropy 0.57608 (0.57755)	Top-1 acc 62.500 (65.141)	Top-5 acc 82.422 (84.728)	lr 0.00479
Train [86][1270/3239]	Time 0.260 (0.551)	Data Time 0.001 (0.035)	Loss 2.5809 (2.4425)	Entropy 0.57620 (0.57754)	Top-1 acc 64.062 (65.129)	Top-5 acc 81.641 (84.719)	lr 0.00479
Train [86][1280/3239]	Time 0.254 (0.550)	Data Time 0.001 (0.035)	Loss 2.2763 (2.4420)	Entropy 0.57645 (0.57753)	Top-1 acc 67.969 (65.141)	Top-5 acc 88.281 (84.728)	lr 0.00479
Train [86][1290/3239]	Time 0.225 (0.549)	Data Time 0.001 (0.035)	Loss 2.3723 (2.4415)	Entropy 0.57631 (0.57752)	Top-1 acc 66.016 (65.151)	Top-5 acc 87.109 (84.734)	lr 0.00479
Train [86][1300/3239]	Time 0.249 (0.548)	Data Time 0.001 (0.035)	Loss 2.3491 (2.4416)	Entropy 0.57603 (0.57751)	Top-1 acc 70.312 (65.147)	Top-5 acc 85.156 (84.732)	lr 0.00479
Train [86][1310/3239]	Time 0.294 (0.547)	Data Time 0.002 (0.034)	Loss 2.1557 (2.4414)	Entropy 0.57603 (0.57750)	Top-1 acc 74.219 (65.152)	Top-5 acc 89.453 (84.736)	lr 0.00479
Train [86][1320/3239]	Time 0.256 (0.546)	Data Time 0.001 (0.034)	Loss 2.6325 (2.4412)	Entropy 0.57614 (0.57749)	Top-1 acc 60.547 (65.159)	Top-5 acc 82.031 (84.739)	lr 0.00479
Train [86][1330/3239]	Time 0.240 (0.545)	Data Time 0.002 (0.034)	Loss 2.2991 (2.4411)	Entropy 0.57642 (0.57748)	Top-1 acc 68.750 (65.164)	Top-5 acc 87.500 (84.741)	lr 0.00478
Train [86][1340/3239]	Time 0.245 (0.544)	Data Time 0.001 (0.034)	Loss 2.3247 (2.4407)	Entropy 0.57630 (0.57747)	Top-1 acc 67.969 (65.172)	Top-5 acc 85.938 (84.748)	lr 0.00478
Train [86][1350/3239]	Time 0.246 (0.543)	Data Time 0.001 (0.033)	Loss 2.2451 (2.4409)	Entropy 0.57695 (0.57746)	Top-1 acc 71.094 (65.169)	Top-5 acc 89.453 (84.745)	lr 0.00478
Train [86][1360/3239]	Time 0.259 (0.543)	Data Time 0.002 (0.033)	Loss 2.3797 (2.4410)	Entropy 0.57741 (0.57746)	Top-1 acc 67.578 (65.170)	Top-5 acc 85.547 (84.748)	lr 0.00478
Train [86][1370/3239]	Time 0.362 (0.542)	Data Time 0.001 (0.033)	Loss 2.3962 (2.4409)	Entropy 0.57725 (0.57746)	Top-1 acc 67.188 (65.172)	Top-5 acc 84.766 (84.747)	lr 0.00478
Train [86][1380/3239]	Time 0.244 (0.541)	Data Time 0.001 (0.033)	Loss 2.3503 (2.4412)	Entropy 0.57701 (0.57746)	Top-1 acc 64.844 (65.157)	Top-5 acc 84.766 (84.742)	lr 0.00478
Train [86][1390/3239]	Time 0.285 (0.540)	Data Time 0.001 (0.032)	Loss 2.6443 (2.4418)	Entropy 0.57721 (0.57745)	Top-1 acc 58.594 (65.142)	Top-5 acc 81.641 (84.731)	lr 0.00478
Train [86][1400/3239]	Time 0.307 (0.539)	Data Time 0.002 (0.032)	Loss 2.2930 (2.4419)	Entropy 0.57712 (0.57745)	Top-1 acc 69.141 (65.141)	Top-5 acc 87.500 (84.730)	lr 0.00478
Train [86][1410/3239]	Time 0.234 (0.539)	Data Time 0.002 (0.032)	Loss 2.2835 (2.4420)	Entropy 0.57684 (0.57745)	Top-1 acc 69.531 (65.133)	Top-5 acc 87.109 (84.725)	lr 0.00478
Train [86][1420/3239]	Time 0.227 (0.538)	Data Time 0.002 (0.032)	Loss 2.5499 (2.4421)	Entropy 0.57663 (0.57744)	Top-1 acc 60.547 (65.131)	Top-5 acc 83.594 (84.722)	lr 0.00478
Train [86][1430/3239]	Time 0.273 (0.537)	Data Time 0.001 (0.032)	Loss 2.3790 (2.4420)	Entropy 0.57694 (0.57744)	Top-1 acc 65.234 (65.128)	Top-5 acc 85.938 (84.729)	lr 0.00478
Train [86][1440/3239]	Time 0.386 (0.536)	Data Time 0.001 (0.031)	Loss 2.5245 (2.4425)	Entropy 0.57727 (0.57743)	Top-1 acc 63.672 (65.116)	Top-5 acc 85.156 (84.723)	lr 0.00478
Train [86][1450/3239]	Time 0.278 (0.535)	Data Time 0.001 (0.031)	Loss 2.2529 (2.4424)	Entropy 0.57771 (0.57743)	Top-1 acc 67.969 (65.124)	Top-5 acc 89.062 (84.726)	lr 0.00477
Train [86][1460/3239]	Time 0.232 (0.535)	Data Time 0.001 (0.031)	Loss 2.5489 (2.4427)	Entropy 0.57781 (0.57744)	Top-1 acc 60.938 (65.112)	Top-5 acc 82.031 (84.712)	lr 0.00477
Train [86][1470/3239]	Time 0.275 (0.534)	Data Time 0.001 (0.031)	Loss 2.4670 (2.4427)	Entropy 0.57824 (0.57744)	Top-1 acc 65.625 (65.115)	Top-5 acc 83.984 (84.714)	lr 0.00477
Train [86][1480/3239]	Time 0.266 (0.533)	Data Time 0.001 (0.031)	Loss 2.4300 (2.4426)	Entropy 0.57818 (0.57745)	Top-1 acc 68.750 (65.120)	Top-5 acc 82.422 (84.717)	lr 0.00477
Train [86][1490/3239]	Time 0.234 (0.533)	Data Time 0.001 (0.030)	Loss 2.4004 (2.4429)	Entropy 0.57807 (0.57745)	Top-1 acc 69.922 (65.118)	Top-5 acc 85.547 (84.711)	lr 0.00477
Train [86][1500/3239]	Time 0.242 (0.532)	Data Time 0.001 (0.030)	Loss 2.4378 (2.4428)	Entropy 0.57809 (0.57745)	Top-1 acc 66.406 (65.119)	Top-5 acc 84.766 (84.709)	lr 0.00477
Train [86][1510/3239]	Time 0.288 (0.531)	Data Time 0.001 (0.030)	Loss 2.2725 (2.4426)	Entropy 0.57825 (0.57746)	Top-1 acc 70.703 (65.123)	Top-5 acc 86.719 (84.713)	lr 0.00477
Train [86][1520/3239]	Time 0.230 (0.531)	Data Time 0.001 (0.030)	Loss 2.3894 (2.4427)	Entropy 0.57808 (0.57746)	Top-1 acc 66.406 (65.119)	Top-5 acc 86.328 (84.712)	lr 0.00477
Train [86][1530/3239]	Time 0.423 (0.530)	Data Time 0.003 (0.030)	Loss 2.3435 (2.4428)	Entropy 0.57797 (0.57747)	Top-1 acc 63.672 (65.120)	Top-5 acc 88.672 (84.715)	lr 0.00477
Train [86][1540/3239]	Time 0.248 (0.530)	Data Time 0.001 (0.029)	Loss 2.3677 (2.4427)	Entropy 0.57785 (0.57747)	Top-1 acc 64.453 (65.119)	Top-5 acc 85.547 (84.713)	lr 0.00477
Train [86][1550/3239]	Time 0.238 (0.529)	Data Time 0.002 (0.029)	Loss 2.4591 (2.4427)	Entropy 0.57777 (0.57747)	Top-1 acc 66.016 (65.126)	Top-5 acc 82.422 (84.709)	lr 0.00477
Train [86][1560/3239]	Time 0.246 (0.528)	Data Time 0.001 (0.029)	Loss 2.4357 (2.4430)	Entropy 0.57781 (0.57747)	Top-1 acc 65.625 (65.118)	Top-5 acc 85.938 (84.705)	lr 0.00477
Train [86][1570/3239]	Time 0.398 (0.528)	Data Time 0.002 (0.029)	Loss 2.3999 (2.4431)	Entropy 0.57797 (0.57748)	Top-1 acc 62.891 (65.108)	Top-5 acc 85.547 (84.710)	lr 0.00477
Train [86][1580/3239]	Time 0.239 (0.528)	Data Time 0.001 (0.029)	Loss 2.3998 (2.4431)	Entropy 0.57779 (0.57748)	Top-1 acc 67.578 (65.108)	Top-5 acc 83.984 (84.711)	lr 0.00476
Train [86][1590/3239]	Time 0.308 (0.527)	Data Time 0.002 (0.029)	Loss 2.4419 (2.4431)	Entropy 0.57793 (0.57748)	Top-1 acc 62.891 (65.108)	Top-5 acc 82.812 (84.710)	lr 0.00476
Train [86][1600/3239]	Time 0.335 (0.526)	Data Time 0.001 (0.028)	Loss 2.6089 (2.4434)	Entropy 0.57784 (0.57749)	Top-1 acc 60.156 (65.100)	Top-5 acc 84.375 (84.706)	lr 0.00476
Train [86][1610/3239]	Time 0.242 (0.526)	Data Time 0.001 (0.028)	Loss 2.4924 (2.4437)	Entropy 0.57746 (0.57749)	Top-1 acc 62.891 (65.090)	Top-5 acc 82.812 (84.701)	lr 0.00476
Train [86][1620/3239]	Time 0.257 (0.525)	Data Time 0.001 (0.028)	Loss 2.3044 (2.4436)	Entropy 0.57748 (0.57749)	Top-1 acc 69.531 (65.092)	Top-5 acc 87.500 (84.701)	lr 0.00476
Train [86][1630/3239]	Time 0.257 (0.525)	Data Time 0.001 (0.028)	Loss 2.5434 (2.4438)	Entropy 0.57743 (0.57749)	Top-1 acc 60.938 (65.088)	Top-5 acc 83.594 (84.697)	lr 0.00476
Train [86][1640/3239]	Time 0.247 (0.560)	Data Time 0.002 (0.028)	Loss 2.4907 (2.4433)	Entropy 0.57691 (0.57749)	Top-1 acc 63.672 (65.103)	Top-5 acc 83.594 (84.704)	lr 0.00476
Train [86][1650/3239]	Time 0.253 (0.560)	Data Time 0.002 (0.028)	Loss 2.3545 (2.4433)	Entropy 0.57695 (0.57748)	Top-1 acc 68.750 (65.100)	Top-5 acc 86.328 (84.703)	lr 0.00476
Train [86][1660/3239]	Time 0.245 (0.559)	Data Time 0.002 (0.027)	Loss 2.3780 (2.4435)	Entropy 0.57688 (0.57748)	Top-1 acc 62.109 (65.092)	Top-5 acc 86.719 (84.701)	lr 0.00476
Train [86][1670/3239]	Time 0.237 (0.558)	Data Time 0.002 (0.027)	Loss 2.4923 (2.4434)	Entropy 0.57696 (0.57747)	Top-1 acc 61.719 (65.095)	Top-5 acc 85.156 (84.705)	lr 0.00476
Train [86][1680/3239]	Time 0.253 (0.558)	Data Time 0.003 (0.027)	Loss 2.6610 (2.4436)	Entropy 0.57731 (0.57747)	Top-1 acc 60.547 (65.090)	Top-5 acc 80.078 (84.702)	lr 0.00476
Train [86][1690/3239]	Time 0.341 (0.557)	Data Time 0.001 (0.027)	Loss 2.5569 (2.4432)	Entropy 0.57728 (0.57747)	Top-1 acc 62.109 (65.097)	Top-5 acc 82.812 (84.707)	lr 0.00476
Train [86][1700/3239]	Time 0.243 (0.556)	Data Time 0.001 (0.027)	Loss 2.4624 (2.4433)	Entropy 0.57695 (0.57747)	Top-1 acc 66.797 (65.095)	Top-5 acc 83.984 (84.706)	lr 0.00475
Train [86][1710/3239]	Time 0.234 (0.555)	Data Time 0.001 (0.027)	Loss 2.4385 (2.4432)	Entropy 0.57694 (0.57747)	Top-1 acc 65.625 (65.100)	Top-5 acc 84.766 (84.706)	lr 0.00475
Train [86][1720/3239]	Time 0.246 (0.555)	Data Time 0.002 (0.027)	Loss 2.5990 (2.4432)	Entropy 0.57700 (0.57746)	Top-1 acc 59.766 (65.101)	Top-5 acc 82.031 (84.704)	lr 0.00475
Train [86][1730/3239]	Time 0.243 (0.554)	Data Time 0.002 (0.026)	Loss 2.3168 (2.4427)	Entropy 0.57728 (0.57746)	Top-1 acc 67.578 (65.107)	Top-5 acc 86.719 (84.713)	lr 0.00475
Train [86][1740/3239]	Time 0.254 (0.553)	Data Time 0.001 (0.026)	Loss 2.3313 (2.4426)	Entropy 0.57737 (0.57746)	Top-1 acc 68.359 (65.108)	Top-5 acc 85.547 (84.716)	lr 0.00475
Train [86][1750/3239]	Time 0.264 (0.552)	Data Time 0.002 (0.026)	Loss 2.3223 (2.4427)	Entropy 0.57769 (0.57746)	Top-1 acc 67.969 (65.108)	Top-5 acc 86.328 (84.711)	lr 0.00475
Train [86][1760/3239]	Time 0.387 (0.552)	Data Time 0.001 (0.026)	Loss 2.4228 (2.4427)	Entropy 0.57768 (0.57746)	Top-1 acc 67.188 (65.109)	Top-5 acc 87.109 (84.710)	lr 0.00475
Train [86][1770/3239]	Time 0.294 (0.551)	Data Time 0.001 (0.026)	Loss 2.4312 (2.4430)	Entropy 0.57734 (0.57746)	Top-1 acc 66.406 (65.104)	Top-5 acc 85.547 (84.704)	lr 0.00475
Train [86][1780/3239]	Time 0.248 (0.550)	Data Time 0.001 (0.026)	Loss 2.3322 (2.4430)	Entropy 0.57720 (0.57746)	Top-1 acc 66.406 (65.100)	Top-5 acc 86.328 (84.703)	lr 0.00475
Train [86][1790/3239]	Time 0.257 (0.550)	Data Time 0.001 (0.026)	Loss 2.6742 (2.4431)	Entropy 0.57727 (0.57746)	Top-1 acc 64.062 (65.105)	Top-5 acc 79.297 (84.705)	lr 0.00475
Train [86][1800/3239]	Time 0.248 (0.549)	Data Time 0.002 (0.025)	Loss 2.2328 (2.4431)	Entropy 0.57749 (0.57746)	Top-1 acc 67.578 (65.107)	Top-5 acc 87.891 (84.707)	lr 0.00475
Train [86][1810/3239]	Time 0.231 (0.549)	Data Time 0.001 (0.025)	Loss 2.4707 (2.4432)	Entropy 0.57725 (0.57746)	Top-1 acc 64.453 (65.107)	Top-5 acc 83.203 (84.708)	lr 0.00475
Train [86][1820/3239]	Time 0.280 (0.548)	Data Time 0.001 (0.025)	Loss 2.4737 (2.4434)	Entropy 0.57736 (0.57746)	Top-1 acc 64.062 (65.102)	Top-5 acc 83.594 (84.706)	lr 0.00475
Train [86][1830/3239]	Time 0.227 (0.547)	Data Time 0.001 (0.025)	Loss 2.3445 (2.4432)	Entropy 0.57691 (0.57746)	Top-1 acc 68.359 (65.105)	Top-5 acc 86.719 (84.710)	lr 0.00474
Train [86][1840/3239]	Time 0.234 (0.547)	Data Time 0.001 (0.025)	Loss 2.4982 (2.4435)	Entropy 0.57659 (0.57746)	Top-1 acc 62.891 (65.099)	Top-5 acc 84.766 (84.707)	lr 0.00474
Train [86][1850/3239]	Time 0.335 (0.546)	Data Time 0.001 (0.025)	Loss 2.3659 (2.4437)	Entropy 0.57662 (0.57745)	Top-1 acc 65.625 (65.095)	Top-5 acc 86.328 (84.703)	lr 0.00474
Train [86][1860/3239]	Time 0.243 (0.545)	Data Time 0.001 (0.025)	Loss 2.2497 (2.4434)	Entropy 0.57676 (0.57745)	Top-1 acc 71.484 (65.102)	Top-5 acc 87.891 (84.706)	lr 0.00474
Train [86][1870/3239]	Time 0.223 (0.545)	Data Time 0.001 (0.025)	Loss 2.5882 (2.4436)	Entropy 0.57695 (0.57744)	Top-1 acc 63.672 (65.099)	Top-5 acc 82.031 (84.708)	lr 0.00474
Train [86][1880/3239]	Time 0.260 (0.544)	Data Time 0.001 (0.024)	Loss 2.5042 (2.4434)	Entropy 0.57698 (0.57744)	Top-1 acc 66.797 (65.101)	Top-5 acc 84.375 (84.712)	lr 0.00474
Train [86][1890/3239]	Time 0.300 (0.544)	Data Time 0.002 (0.024)	Loss 2.2546 (2.4432)	Entropy 0.57679 (0.57744)	Top-1 acc 71.484 (65.108)	Top-5 acc 89.844 (84.718)	lr 0.00474
Train [86][1900/3239]	Time 0.300 (0.543)	Data Time 0.002 (0.024)	Loss 2.3658 (2.4434)	Entropy 0.57635 (0.57743)	Top-1 acc 65.234 (65.100)	Top-5 acc 86.719 (84.719)	lr 0.00474
Train [86][1910/3239]	Time 0.262 (0.542)	Data Time 0.002 (0.024)	Loss 2.6613 (2.4435)	Entropy 0.57648 (0.57743)	Top-1 acc 63.281 (65.103)	Top-5 acc 79.688 (84.718)	lr 0.00474
Train [86][1920/3239]	Time 0.403 (0.542)	Data Time 0.002 (0.024)	Loss 2.4282 (2.4437)	Entropy 0.57665 (0.57742)	Top-1 acc 64.453 (65.098)	Top-5 acc 84.766 (84.716)	lr 0.00474
Train [86][1930/3239]	Time 0.236 (0.542)	Data Time 0.001 (0.024)	Loss 2.5957 (2.4435)	Entropy 0.57680 (0.57742)	Top-1 acc 64.453 (65.106)	Top-5 acc 82.422 (84.718)	lr 0.00474
Train [86][1940/3239]	Time 0.258 (0.541)	Data Time 0.025 (0.024)	Loss 2.3932 (2.4437)	Entropy 0.57693 (0.57742)	Top-1 acc 66.797 (65.108)	Top-5 acc 86.719 (84.718)	lr 0.00474
Train [86][1950/3239]	Time 0.278 (0.541)	Data Time 0.001 (0.024)	Loss 2.3894 (2.4440)	Entropy 0.57710 (0.57742)	Top-1 acc 69.141 (65.099)	Top-5 acc 84.766 (84.716)	lr 0.00474
Train [86][1960/3239]	Time 0.254 (0.540)	Data Time 0.001 (0.024)	Loss 2.3684 (2.4440)	Entropy 0.57691 (0.57741)	Top-1 acc 65.234 (65.101)	Top-5 acc 85.156 (84.716)	lr 0.00473
Train [86][1970/3239]	Time 0.233 (0.540)	Data Time 0.001 (0.023)	Loss 2.4309 (2.4438)	Entropy 0.57688 (0.57741)	Top-1 acc 66.016 (65.104)	Top-5 acc 85.156 (84.720)	lr 0.00473
Train [86][1980/3239]	Time 0.233 (0.539)	Data Time 0.001 (0.023)	Loss 2.5867 (2.4435)	Entropy 0.57699 (0.57741)	Top-1 acc 59.766 (65.111)	Top-5 acc 83.203 (84.726)	lr 0.00473
Train [86][1990/3239]	Time 0.234 (0.538)	Data Time 0.001 (0.023)	Loss 2.8065 (2.4436)	Entropy 0.57719 (0.57741)	Top-1 acc 56.250 (65.109)	Top-5 acc 76.172 (84.723)	lr 0.00473
Train [86][2000/3239]	Time 0.296 (0.538)	Data Time 0.001 (0.023)	Loss 2.4608 (2.4438)	Entropy 0.57751 (0.57741)	Top-1 acc 62.891 (65.105)	Top-5 acc 84.375 (84.720)	lr 0.00473
Train [86][2010/3239]	Time 0.295 (0.537)	Data Time 0.001 (0.023)	Loss 2.6403 (2.4439)	Entropy 0.57736 (0.57741)	Top-1 acc 55.859 (65.106)	Top-5 acc 82.031 (84.716)	lr 0.00473
Train [86][2020/3239]	Time 0.265 (0.537)	Data Time 0.002 (0.023)	Loss 2.5115 (2.4438)	Entropy 0.57748 (0.57741)	Top-1 acc 67.578 (65.110)	Top-5 acc 83.203 (84.716)	lr 0.00473
Train [86][2030/3239]	Time 0.259 (0.536)	Data Time 0.002 (0.023)	Loss 2.4634 (2.4438)	Entropy 0.57761 (0.57741)	Top-1 acc 66.406 (65.115)	Top-5 acc 85.547 (84.721)	lr 0.00473
Train [86][2040/3239]	Time 0.236 (0.536)	Data Time 0.001 (0.023)	Loss 2.4922 (2.4441)	Entropy 0.57736 (0.57741)	Top-1 acc 62.109 (65.101)	Top-5 acc 85.156 (84.719)	lr 0.00473
Train [86][2050/3239]	Time 0.266 (0.535)	Data Time 0.001 (0.023)	Loss 2.4865 (2.4438)	Entropy 0.57701 (0.57741)	Top-1 acc 65.234 (65.103)	Top-5 acc 83.203 (84.726)	lr 0.00473
Train [86][2060/3239]	Time 0.239 (0.535)	Data Time 0.001 (0.023)	Loss 2.3489 (2.4438)	Entropy 0.57696 (0.57740)	Top-1 acc 69.531 (65.105)	Top-5 acc 87.500 (84.728)	lr 0.00473
Train [86][2070/3239]	Time 0.259 (0.534)	Data Time 0.002 (0.022)	Loss 2.3818 (2.4437)	Entropy 0.57682 (0.57740)	Top-1 acc 67.188 (65.111)	Top-5 acc 88.281 (84.733)	lr 0.00473
Train [86][2080/3239]	Time 0.389 (0.534)	Data Time 0.001 (0.022)	Loss 2.4560 (2.4437)	Entropy 0.57675 (0.57740)	Top-1 acc 61.719 (65.108)	Top-5 acc 85.938 (84.732)	lr 0.00472
Train [86][2090/3239]	Time 0.267 (0.533)	Data Time 0.032 (0.022)	Loss 2.2386 (2.4437)	Entropy 0.57681 (0.57740)	Top-1 acc 70.703 (65.107)	Top-5 acc 88.281 (84.733)	lr 0.00472
Train [86][2100/3239]	Time 0.233 (0.532)	Data Time 0.001 (0.022)	Loss 2.2558 (2.4439)	Entropy 0.57733 (0.57739)	Top-1 acc 68.750 (65.102)	Top-5 acc 88.281 (84.733)	lr 0.00472
Train [86][2110/3239]	Time 0.233 (0.532)	Data Time 0.001 (0.022)	Loss 2.5480 (2.4443)	Entropy 0.57704 (0.57739)	Top-1 acc 66.016 (65.093)	Top-5 acc 83.594 (84.723)	lr 0.00472
Train [86][2120/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.022)	Loss 2.5011 (2.4444)	Entropy 0.57732 (0.57739)	Top-1 acc 63.281 (65.090)	Top-5 acc 83.594 (84.722)	lr 0.00472
Train [86][2130/3239]	Time 0.246 (0.531)	Data Time 0.001 (0.022)	Loss 2.5845 (2.4445)	Entropy 0.57727 (0.57739)	Top-1 acc 64.062 (65.087)	Top-5 acc 80.859 (84.719)	lr 0.00472
Train [86][2140/3239]	Time 0.226 (0.530)	Data Time 0.001 (0.022)	Loss 2.4032 (2.4446)	Entropy 0.57712 (0.57739)	Top-1 acc 67.969 (65.088)	Top-5 acc 84.375 (84.717)	lr 0.00472
Train [86][2150/3239]	Time 0.329 (0.530)	Data Time 0.001 (0.022)	Loss 2.3915 (2.4445)	Entropy 0.57726 (0.57739)	Top-1 acc 60.547 (65.089)	Top-5 acc 85.156 (84.718)	lr 0.00472
Train [86][2160/3239]	Time 0.238 (0.529)	Data Time 0.002 (0.022)	Loss 2.4410 (2.4445)	Entropy 0.57708 (0.57739)	Top-1 acc 66.016 (65.091)	Top-5 acc 82.422 (84.714)	lr 0.00472
Train [86][2170/3239]	Time 0.251 (0.529)	Data Time 0.001 (0.021)	Loss 2.7487 (2.4447)	Entropy 0.57731 (0.57739)	Top-1 acc 55.078 (65.085)	Top-5 acc 77.344 (84.709)	lr 0.00472
Train [86][2180/3239]	Time 0.243 (0.528)	Data Time 0.001 (0.021)	Loss 2.4865 (2.4445)	Entropy 0.57767 (0.57739)	Top-1 acc 61.719 (65.083)	Top-5 acc 86.328 (84.715)	lr 0.00472
Train [86][2190/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.021)	Loss 2.4692 (2.4447)	Entropy 0.57774 (0.57739)	Top-1 acc 66.406 (65.078)	Top-5 acc 85.156 (84.715)	lr 0.00472
Train [86][2200/3239]	Time 0.257 (0.528)	Data Time 0.001 (0.021)	Loss 2.5732 (2.4446)	Entropy 0.57785 (0.57739)	Top-1 acc 57.031 (65.076)	Top-5 acc 84.766 (84.720)	lr 0.00472
Train [86][2210/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.021)	Loss 2.5738 (2.4449)	Entropy 0.57794 (0.57739)	Top-1 acc 62.891 (65.070)	Top-5 acc 83.594 (84.716)	lr 0.00471
Train [86][2220/3239]	Time 0.261 (0.527)	Data Time 0.002 (0.021)	Loss 2.6773 (2.4450)	Entropy 0.57786 (0.57740)	Top-1 acc 57.422 (65.066)	Top-5 acc 80.859 (84.716)	lr 0.00471
Train [86][2230/3239]	Time 0.249 (0.527)	Data Time 0.001 (0.021)	Loss 2.4473 (2.4451)	Entropy 0.57818 (0.57740)	Top-1 acc 66.797 (65.065)	Top-5 acc 85.156 (84.712)	lr 0.00471
Train [86][2240/3239]	Time 0.467 (0.526)	Data Time 0.003 (0.021)	Loss 2.4579 (2.4452)	Entropy 0.57816 (0.57740)	Top-1 acc 62.109 (65.061)	Top-5 acc 87.109 (84.712)	lr 0.00471
Train [86][2250/3239]	Time 0.268 (0.526)	Data Time 0.002 (0.021)	Loss 2.5926 (2.4453)	Entropy 0.57814 (0.57740)	Top-1 acc 60.547 (65.057)	Top-5 acc 80.469 (84.713)	lr 0.00471
Train [86][2260/3239]	Time 0.305 (0.526)	Data Time 0.029 (0.021)	Loss 2.6401 (2.4453)	Entropy 0.57822 (0.57741)	Top-1 acc 60.938 (65.057)	Top-5 acc 80.078 (84.711)	lr 0.00471
Train [86][2270/3239]	Time 0.227 (0.525)	Data Time 0.001 (0.021)	Loss 2.3394 (2.4454)	Entropy 0.57832 (0.57741)	Top-1 acc 67.578 (65.051)	Top-5 acc 85.156 (84.707)	lr 0.00471
Train [86][2280/3239]	Time 0.248 (0.525)	Data Time 0.002 (0.021)	Loss 2.5670 (2.4458)	Entropy 0.57843 (0.57742)	Top-1 acc 64.453 (65.043)	Top-5 acc 83.203 (84.702)	lr 0.00471
Train [86][2290/3239]	Time 0.336 (0.548)	Data Time 0.004 (0.020)	Loss 2.6576 (2.4459)	Entropy 0.57822 (0.57742)	Top-1 acc 62.109 (65.047)	Top-5 acc 81.250 (84.697)	lr 0.00471
Train [86][2300/3239]	Time 0.244 (0.548)	Data Time 0.002 (0.020)	Loss 2.5881 (2.4460)	Entropy 0.57844 (0.57742)	Top-1 acc 62.109 (65.042)	Top-5 acc 80.078 (84.693)	lr 0.00471
Train [86][2310/3239]	Time 0.376 (0.547)	Data Time 0.002 (0.020)	Loss 2.3234 (2.4461)	Entropy 0.57865 (0.57743)	Top-1 acc 66.797 (65.039)	Top-5 acc 87.500 (84.698)	lr 0.00471
Train [86][2320/3239]	Time 0.247 (0.547)	Data Time 0.001 (0.020)	Loss 2.3830 (2.4463)	Entropy 0.57881 (0.57743)	Top-1 acc 66.406 (65.033)	Top-5 acc 86.719 (84.691)	lr 0.00471
Train [86][2330/3239]	Time 0.235 (0.546)	Data Time 0.001 (0.020)	Loss 2.4627 (2.4465)	Entropy 0.57887 (0.57744)	Top-1 acc 67.969 (65.031)	Top-5 acc 83.984 (84.692)	lr 0.00471
Train [86][2340/3239]	Time 0.251 (0.546)	Data Time 0.002 (0.020)	Loss 2.3985 (2.4462)	Entropy 0.57887 (0.57745)	Top-1 acc 63.672 (65.039)	Top-5 acc 88.281 (84.698)	lr 0.00470
Train [86][2350/3239]	Time 0.284 (0.545)	Data Time 0.002 (0.020)	Loss 2.4963 (2.4462)	Entropy 0.57881 (0.57745)	Top-1 acc 65.625 (65.039)	Top-5 acc 82.812 (84.699)	lr 0.00470
Train [86][2360/3239]	Time 0.240 (0.545)	Data Time 0.001 (0.020)	Loss 2.5539 (2.4463)	Entropy 0.57891 (0.57746)	Top-1 acc 63.672 (65.037)	Top-5 acc 81.250 (84.695)	lr 0.00470
Train [86][2370/3239]	Time 0.257 (0.544)	Data Time 0.001 (0.020)	Loss 2.3853 (2.4463)	Entropy 0.57866 (0.57746)	Top-1 acc 65.234 (65.034)	Top-5 acc 87.500 (84.697)	lr 0.00470
Train [86][2380/3239]	Time 0.229 (0.544)	Data Time 0.001 (0.020)	Loss 2.4426 (2.4464)	Entropy 0.57853 (0.57747)	Top-1 acc 66.406 (65.028)	Top-5 acc 83.984 (84.693)	lr 0.00470
Train [86][2390/3239]	Time 0.259 (0.544)	Data Time 0.002 (0.020)	Loss 2.4925 (2.4465)	Entropy 0.57872 (0.57747)	Top-1 acc 65.234 (65.025)	Top-5 acc 83.984 (84.693)	lr 0.00470
Train [86][2400/3239]	Time 0.381 (0.543)	Data Time 0.001 (0.020)	Loss 2.4035 (2.4463)	Entropy 0.57901 (0.57748)	Top-1 acc 64.844 (65.029)	Top-5 acc 85.156 (84.693)	lr 0.00470
Train [86][2410/3239]	Time 0.264 (0.543)	Data Time 0.001 (0.020)	Loss 2.4312 (2.4462)	Entropy 0.57902 (0.57749)	Top-1 acc 63.672 (65.026)	Top-5 acc 86.719 (84.695)	lr 0.00470
Train [86][2420/3239]	Time 0.285 (0.542)	Data Time 0.002 (0.019)	Loss 2.3802 (2.4461)	Entropy 0.57902 (0.57749)	Top-1 acc 68.359 (65.030)	Top-5 acc 86.328 (84.696)	lr 0.00470
Train [86][2430/3239]	Time 0.303 (0.542)	Data Time 0.003 (0.019)	Loss 2.4500 (2.4462)	Entropy 0.57901 (0.57750)	Top-1 acc 63.672 (65.026)	Top-5 acc 85.938 (84.698)	lr 0.00470
Train [86][2440/3239]	Time 0.247 (0.542)	Data Time 0.001 (0.019)	Loss 2.5901 (2.4464)	Entropy 0.57901 (0.57750)	Top-1 acc 61.719 (65.022)	Top-5 acc 80.078 (84.694)	lr 0.00470
Train [86][2450/3239]	Time 0.258 (0.541)	Data Time 0.001 (0.019)	Loss 2.4017 (2.4467)	Entropy 0.57912 (0.57751)	Top-1 acc 65.234 (65.017)	Top-5 acc 84.766 (84.687)	lr 0.00470
Train [86][2460/3239]	Time 0.250 (0.541)	Data Time 0.001 (0.019)	Loss 2.3507 (2.4466)	Entropy 0.57933 (0.57752)	Top-1 acc 66.406 (65.022)	Top-5 acc 83.984 (84.687)	lr 0.00469
Train [86][2470/3239]	Time 0.342 (0.541)	Data Time 0.001 (0.019)	Loss 2.2263 (2.4463)	Entropy 0.57899 (0.57752)	Top-1 acc 70.312 (65.028)	Top-5 acc 88.281 (84.693)	lr 0.00469
Train [86][2480/3239]	Time 0.236 (0.540)	Data Time 0.002 (0.019)	Loss 2.5699 (2.4463)	Entropy 0.57890 (0.57753)	Top-1 acc 63.281 (65.027)	Top-5 acc 83.594 (84.694)	lr 0.00469
Train [86][2490/3239]	Time 0.232 (0.540)	Data Time 0.001 (0.019)	Loss 2.7014 (2.4464)	Entropy 0.57919 (0.57754)	Top-1 acc 59.766 (65.023)	Top-5 acc 83.984 (84.692)	lr 0.00469
Train [86][2500/3239]	Time 0.273 (0.539)	Data Time 0.001 (0.019)	Loss 2.4811 (2.4463)	Entropy 0.57921 (0.57754)	Top-1 acc 64.453 (65.025)	Top-5 acc 85.156 (84.693)	lr 0.00469
Train [86][2510/3239]	Time 0.238 (0.539)	Data Time 0.001 (0.019)	Loss 2.5416 (2.4464)	Entropy 0.57937 (0.57755)	Top-1 acc 66.406 (65.025)	Top-5 acc 82.812 (84.693)	lr 0.00469
Train [86][2520/3239]	Time 0.260 (0.538)	Data Time 0.002 (0.019)	Loss 2.3264 (2.4463)	Entropy 0.57885 (0.57756)	Top-1 acc 66.406 (65.025)	Top-5 acc 87.891 (84.692)	lr 0.00469
Train [86][2530/3239]	Time 0.288 (0.538)	Data Time 0.002 (0.019)	Loss 2.6618 (2.4463)	Entropy 0.57869 (0.57756)	Top-1 acc 59.375 (65.024)	Top-5 acc 81.250 (84.694)	lr 0.00469
Train [86][2540/3239]	Time 0.252 (0.538)	Data Time 0.001 (0.019)	Loss 2.6317 (2.4466)	Entropy 0.57843 (0.57757)	Top-1 acc 58.594 (65.018)	Top-5 acc 81.641 (84.692)	lr 0.00469
Train [86][2550/3239]	Time 0.224 (0.537)	Data Time 0.001 (0.019)	Loss 2.7264 (2.4466)	Entropy 0.57861 (0.57757)	Top-1 acc 60.156 (65.016)	Top-5 acc 78.906 (84.690)	lr 0.00469
Train [86][2560/3239]	Time 0.332 (0.537)	Data Time 0.001 (0.018)	Loss 2.3823 (2.4469)	Entropy 0.57866 (0.57757)	Top-1 acc 62.500 (65.008)	Top-5 acc 83.594 (84.687)	lr 0.00469
Train [86][2570/3239]	Time 0.294 (0.536)	Data Time 0.001 (0.018)	Loss 2.3573 (2.4470)	Entropy 0.57868 (0.57758)	Top-1 acc 67.969 (65.005)	Top-5 acc 85.938 (84.683)	lr 0.00469
Train [86][2580/3239]	Time 0.230 (0.536)	Data Time 0.001 (0.018)	Loss 2.4530 (2.4470)	Entropy 0.57838 (0.57758)	Top-1 acc 62.500 (65.002)	Top-5 acc 86.328 (84.685)	lr 0.00469
Train [86][2590/3239]	Time 0.244 (0.536)	Data Time 0.001 (0.018)	Loss 2.5497 (2.4472)	Entropy 0.57800 (0.57758)	Top-1 acc 63.672 (64.999)	Top-5 acc 82.422 (84.682)	lr 0.00468
Train [86][2600/3239]	Time 0.238 (0.535)	Data Time 0.001 (0.018)	Loss 2.5337 (2.4472)	Entropy 0.57787 (0.57758)	Top-1 acc 58.203 (65.001)	Top-5 acc 85.938 (84.682)	lr 0.00468
Train [86][2610/3239]	Time 0.226 (0.535)	Data Time 0.001 (0.018)	Loss 2.1647 (2.4470)	Entropy 0.57816 (0.57759)	Top-1 acc 70.703 (65.005)	Top-5 acc 92.188 (84.687)	lr 0.00468
Train [86][2620/3239]	Time 0.290 (0.534)	Data Time 0.001 (0.018)	Loss 2.3675 (2.4469)	Entropy 0.57824 (0.57759)	Top-1 acc 64.062 (65.008)	Top-5 acc 87.500 (84.691)	lr 0.00468
Train [86][2630/3239]	Time 0.411 (0.534)	Data Time 0.001 (0.018)	Loss 2.3886 (2.4469)	Entropy 0.57822 (0.57759)	Top-1 acc 65.625 (65.011)	Top-5 acc 86.719 (84.689)	lr 0.00468
Train [86][2640/3239]	Time 0.269 (0.534)	Data Time 0.001 (0.018)	Loss 2.4563 (2.4469)	Entropy 0.57839 (0.57759)	Top-1 acc 67.578 (65.012)	Top-5 acc 83.984 (84.689)	lr 0.00468
Train [86][2650/3239]	Time 0.237 (0.533)	Data Time 0.001 (0.018)	Loss 2.5850 (2.4468)	Entropy 0.57830 (0.57760)	Top-1 acc 61.719 (65.014)	Top-5 acc 82.422 (84.691)	lr 0.00468
Train [86][2660/3239]	Time 0.221 (0.533)	Data Time 0.001 (0.018)	Loss 2.5084 (2.4469)	Entropy 0.57826 (0.57760)	Top-1 acc 60.156 (65.007)	Top-5 acc 84.766 (84.690)	lr 0.00468
Train [86][2670/3239]	Time 0.242 (0.532)	Data Time 0.001 (0.018)	Loss 2.5023 (2.4472)	Entropy 0.57776 (0.57760)	Top-1 acc 62.891 (65.000)	Top-5 acc 82.031 (84.684)	lr 0.00468
Train [86][2680/3239]	Time 0.265 (0.532)	Data Time 0.001 (0.018)	Loss 2.5048 (2.4474)	Entropy 0.57768 (0.57760)	Top-1 acc 62.109 (64.994)	Top-5 acc 85.938 (84.680)	lr 0.00468
Train [86][2690/3239]	Time 0.301 (0.532)	Data Time 0.001 (0.018)	Loss 2.3507 (2.4476)	Entropy 0.57774 (0.57760)	Top-1 acc 67.578 (64.990)	Top-5 acc 85.547 (84.678)	lr 0.00468
Train [86][2700/3239]	Time 0.268 (0.532)	Data Time 0.001 (0.018)	Loss 2.5763 (2.4476)	Entropy 0.57781 (0.57760)	Top-1 acc 60.156 (64.990)	Top-5 acc 83.203 (84.677)	lr 0.00468
Train [86][2710/3239]	Time 0.269 (0.531)	Data Time 0.001 (0.018)	Loss 2.2595 (2.4477)	Entropy 0.57784 (0.57760)	Top-1 acc 69.922 (64.989)	Top-5 acc 87.109 (84.677)	lr 0.00468
Train [86][2720/3239]	Time 0.283 (0.531)	Data Time 0.001 (0.018)	Loss 2.3609 (2.4475)	Entropy 0.57782 (0.57760)	Top-1 acc 66.406 (64.995)	Top-5 acc 87.891 (84.680)	lr 0.00467
Train [86][2730/3239]	Time 0.242 (0.531)	Data Time 0.001 (0.017)	Loss 2.5496 (2.4476)	Entropy 0.57788 (0.57760)	Top-1 acc 59.766 (64.996)	Top-5 acc 83.594 (84.678)	lr 0.00467
Train [86][2740/3239]	Time 0.295 (0.530)	Data Time 0.002 (0.017)	Loss 2.9776 (2.4477)	Entropy 0.57796 (0.57761)	Top-1 acc 55.469 (64.993)	Top-5 acc 79.297 (84.676)	lr 0.00467
Train [86][2750/3239]	Time 0.266 (0.530)	Data Time 0.001 (0.017)	Loss 2.5603 (2.4474)	Entropy 0.57824 (0.57761)	Top-1 acc 62.109 (65.002)	Top-5 acc 81.641 (84.684)	lr 0.00467
Train [86][2760/3239]	Time 0.240 (0.530)	Data Time 0.001 (0.017)	Loss 2.3314 (2.4474)	Entropy 0.57823 (0.57761)	Top-1 acc 68.359 (65.004)	Top-5 acc 85.156 (84.682)	lr 0.00467
Train [86][2770/3239]	Time 0.264 (0.529)	Data Time 0.001 (0.017)	Loss 2.3231 (2.4475)	Entropy 0.57844 (0.57761)	Top-1 acc 69.922 (65.002)	Top-5 acc 87.891 (84.677)	lr 0.00467
Train [86][2780/3239]	Time 0.259 (0.529)	Data Time 0.002 (0.017)	Loss 2.2887 (2.4474)	Entropy 0.57849 (0.57761)	Top-1 acc 69.531 (65.003)	Top-5 acc 86.719 (84.679)	lr 0.00467
Train [86][2790/3239]	Time 0.402 (0.529)	Data Time 0.002 (0.017)	Loss 2.2570 (2.4476)	Entropy 0.57840 (0.57762)	Top-1 acc 71.484 (65.003)	Top-5 acc 86.328 (84.675)	lr 0.00467
Train [86][2800/3239]	Time 0.279 (0.528)	Data Time 0.001 (0.017)	Loss 2.6808 (2.4477)	Entropy 0.57865 (0.57762)	Top-1 acc 58.984 (64.999)	Top-5 acc 81.250 (84.672)	lr 0.00467
Train [86][2810/3239]	Time 0.227 (0.528)	Data Time 0.001 (0.017)	Loss 2.3696 (2.4477)	Entropy 0.57917 (0.57762)	Top-1 acc 66.406 (64.999)	Top-5 acc 85.547 (84.673)	lr 0.00467
Train [86][2820/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.017)	Loss 2.3978 (2.4477)	Entropy 0.57896 (0.57763)	Top-1 acc 65.625 (65.001)	Top-5 acc 85.156 (84.672)	lr 0.00467
Train [86][2830/3239]	Time 0.224 (0.527)	Data Time 0.001 (0.017)	Loss 2.4777 (2.4475)	Entropy 0.57881 (0.57763)	Top-1 acc 66.016 (65.004)	Top-5 acc 84.375 (84.674)	lr 0.00467
Train [86][2840/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.017)	Loss 2.4100 (2.4476)	Entropy 0.57879 (0.57764)	Top-1 acc 66.016 (65.004)	Top-5 acc 85.547 (84.674)	lr 0.00466
Train [86][2850/3239]	Time 0.234 (0.526)	Data Time 0.001 (0.017)	Loss 2.6895 (2.4477)	Entropy 0.57850 (0.57764)	Top-1 acc 57.812 (64.999)	Top-5 acc 76.953 (84.670)	lr 0.00466
Train [86][2860/3239]	Time 0.369 (0.526)	Data Time 0.001 (0.017)	Loss 2.5445 (2.4479)	Entropy 0.57845 (0.57764)	Top-1 acc 63.672 (64.994)	Top-5 acc 82.422 (84.667)	lr 0.00466
Train [86][2870/3239]	Time 0.267 (0.526)	Data Time 0.001 (0.017)	Loss 2.2998 (2.4478)	Entropy 0.57870 (0.57765)	Top-1 acc 67.188 (64.997)	Top-5 acc 85.156 (84.670)	lr 0.00466
Train [86][2880/3239]	Time 0.268 (0.525)	Data Time 0.001 (0.017)	Loss 2.5285 (2.4478)	Entropy 0.57855 (0.57765)	Top-1 acc 64.062 (64.993)	Top-5 acc 83.594 (84.669)	lr 0.00466
Train [86][2890/3239]	Time 0.252 (0.525)	Data Time 0.001 (0.017)	Loss 2.1792 (2.4476)	Entropy 0.57872 (0.57765)	Top-1 acc 73.047 (64.998)	Top-5 acc 89.062 (84.673)	lr 0.00466
Train [86][2900/3239]	Time 0.249 (0.525)	Data Time 0.001 (0.017)	Loss 2.2259 (2.4476)	Entropy 0.57873 (0.57766)	Top-1 acc 69.141 (64.995)	Top-5 acc 88.281 (84.673)	lr 0.00466
Train [86][2910/3239]	Time 0.254 (0.524)	Data Time 0.001 (0.016)	Loss 2.4868 (2.4479)	Entropy 0.57896 (0.57766)	Top-1 acc 63.672 (64.991)	Top-5 acc 82.422 (84.668)	lr 0.00466
Train [86][2920/3239]	Time 0.258 (0.524)	Data Time 0.001 (0.016)	Loss 2.4751 (2.4478)	Entropy 0.57903 (0.57767)	Top-1 acc 68.750 (64.992)	Top-5 acc 82.812 (84.667)	lr 0.00466
Train [86][2930/3239]	Time 0.277 (0.524)	Data Time 0.001 (0.016)	Loss 2.4589 (2.4480)	Entropy 0.57917 (0.57767)	Top-1 acc 62.500 (64.988)	Top-5 acc 85.547 (84.663)	lr 0.00466
Train [86][2940/3239]	Time 0.269 (0.523)	Data Time 0.001 (0.016)	Loss 2.4928 (2.4482)	Entropy 0.57938 (0.57768)	Top-1 acc 63.672 (64.985)	Top-5 acc 82.422 (84.656)	lr 0.00466
Train [86][2950/3239]	Time 0.419 (0.541)	Data Time 0.003 (0.016)	Loss 2.2655 (2.4483)	Entropy 0.57942 (0.57768)	Top-1 acc 70.312 (64.980)	Top-5 acc 89.844 (84.655)	lr 0.00466
Train [86][2960/3239]	Time 0.249 (0.541)	Data Time 0.002 (0.016)	Loss 2.5565 (2.4485)	Entropy 0.57938 (0.57769)	Top-1 acc 59.375 (64.974)	Top-5 acc 83.594 (84.651)	lr 0.00466
Train [86][2970/3239]	Time 0.281 (0.540)	Data Time 0.002 (0.016)	Loss 2.4558 (2.4486)	Entropy 0.57964 (0.57770)	Top-1 acc 66.016 (64.973)	Top-5 acc 84.375 (84.648)	lr 0.00465
Train [86][2980/3239]	Time 0.245 (0.540)	Data Time 0.001 (0.016)	Loss 2.2883 (2.4486)	Entropy 0.58000 (0.57770)	Top-1 acc 70.703 (64.974)	Top-5 acc 86.719 (84.647)	lr 0.00465
Train [86][2990/3239]	Time 0.266 (0.540)	Data Time 0.003 (0.016)	Loss 2.5459 (2.4488)	Entropy 0.57998 (0.57771)	Top-1 acc 60.938 (64.968)	Top-5 acc 82.031 (84.645)	lr 0.00465
Train [86][3000/3239]	Time 0.246 (0.539)	Data Time 0.001 (0.016)	Loss 2.5144 (2.4488)	Entropy 0.57993 (0.57772)	Top-1 acc 64.453 (64.974)	Top-5 acc 82.812 (84.643)	lr 0.00465
Train [86][3010/3239]	Time 0.242 (0.539)	Data Time 0.001 (0.016)	Loss 2.3783 (2.4490)	Entropy 0.58012 (0.57772)	Top-1 acc 66.406 (64.974)	Top-5 acc 86.719 (84.643)	lr 0.00465
Train [86][3020/3239]	Time 0.422 (0.539)	Data Time 0.002 (0.016)	Loss 2.3669 (2.4490)	Entropy 0.58045 (0.57773)	Top-1 acc 65.234 (64.974)	Top-5 acc 87.500 (84.640)	lr 0.00465
Train [86][3030/3239]	Time 0.284 (0.539)	Data Time 0.001 (0.016)	Loss 2.3824 (2.4490)	Entropy 0.58055 (0.57774)	Top-1 acc 69.531 (64.976)	Top-5 acc 85.156 (84.642)	lr 0.00465
Train [86][3040/3239]	Time 0.294 (0.538)	Data Time 0.001 (0.016)	Loss 2.3823 (2.4488)	Entropy 0.58093 (0.57775)	Top-1 acc 67.188 (64.982)	Top-5 acc 87.500 (84.644)	lr 0.00465
Train [86][3050/3239]	Time 0.265 (0.538)	Data Time 0.001 (0.016)	Loss 2.6801 (2.4488)	Entropy 0.58114 (0.57776)	Top-1 acc 59.375 (64.980)	Top-5 acc 80.469 (84.646)	lr 0.00465
Train [86][3060/3239]	Time 0.246 (0.538)	Data Time 0.001 (0.016)	Loss 2.2552 (2.4489)	Entropy 0.58122 (0.57777)	Top-1 acc 66.797 (64.977)	Top-5 acc 89.453 (84.646)	lr 0.00465
Train [86][3070/3239]	Time 0.307 (0.538)	Data Time 0.001 (0.016)	Loss 2.5199 (2.4490)	Entropy 0.58108 (0.57779)	Top-1 acc 66.797 (64.977)	Top-5 acc 80.078 (84.643)	lr 0.00465
Train [86][3080/3239]	Time 0.233 (0.537)	Data Time 0.001 (0.016)	Loss 2.1927 (2.4490)	Entropy 0.58119 (0.57780)	Top-1 acc 70.312 (64.973)	Top-5 acc 88.281 (84.642)	lr 0.00465
Train [86][3090/3239]	Time 0.248 (0.537)	Data Time 0.001 (0.016)	Loss 2.3202 (2.4491)	Entropy 0.58145 (0.57781)	Top-1 acc 71.484 (64.970)	Top-5 acc 87.500 (84.639)	lr 0.00465
Train [86][3100/3239]	Time 0.265 (0.537)	Data Time 0.001 (0.016)	Loss 2.3468 (2.4490)	Entropy 0.58119 (0.57782)	Top-1 acc 69.922 (64.973)	Top-5 acc 85.156 (84.639)	lr 0.00464
Train [86][3110/3239]	Time 0.388 (0.536)	Data Time 0.001 (0.016)	Loss 2.5231 (2.4490)	Entropy 0.58109 (0.57783)	Top-1 acc 63.672 (64.974)	Top-5 acc 83.203 (84.639)	lr 0.00464
Train [86][3120/3239]	Time 0.252 (0.536)	Data Time 0.001 (0.016)	Loss 2.3483 (2.4491)	Entropy 0.58086 (0.57784)	Top-1 acc 64.062 (64.975)	Top-5 acc 85.547 (84.639)	lr 0.00464
Train [86][3130/3239]	Time 0.268 (0.536)	Data Time 0.004 (0.015)	Loss 2.3739 (2.4492)	Entropy 0.58112 (0.57785)	Top-1 acc 66.797 (64.970)	Top-5 acc 85.938 (84.638)	lr 0.00464
Train [86][3140/3239]	Time 0.249 (0.536)	Data Time 0.002 (0.015)	Loss 2.3397 (2.4491)	Entropy 0.58139 (0.57786)	Top-1 acc 64.844 (64.974)	Top-5 acc 88.281 (84.640)	lr 0.00464
Train [86][3150/3239]	Time 0.234 (0.535)	Data Time 0.001 (0.015)	Loss 2.4437 (2.4490)	Entropy 0.58156 (0.57787)	Top-1 acc 69.531 (64.977)	Top-5 acc 83.984 (84.640)	lr 0.00464
Train [86][3160/3239]	Time 0.281 (0.535)	Data Time 0.002 (0.015)	Loss 2.4545 (2.4490)	Entropy 0.58176 (0.57788)	Top-1 acc 65.625 (64.972)	Top-5 acc 84.766 (84.642)	lr 0.00464
Train [86][3170/3239]	Time 0.239 (0.535)	Data Time 0.001 (0.015)	Loss 2.1814 (2.4490)	Entropy 0.58182 (0.57790)	Top-1 acc 72.266 (64.974)	Top-5 acc 89.844 (84.642)	lr 0.00464
Train [86][3180/3239]	Time 0.402 (0.534)	Data Time 0.000 (0.015)	Loss 2.5049 (2.4491)	Entropy 0.58188 (0.57791)	Top-1 acc 64.453 (64.972)	Top-5 acc 83.594 (84.641)	lr 0.00464
Train [86][3190/3239]	Time 0.238 (0.534)	Data Time 0.000 (0.015)	Loss 2.5070 (2.4490)	Entropy 0.58201 (0.57792)	Top-1 acc 64.062 (64.973)	Top-5 acc 83.594 (84.641)	lr 0.00464
Train [86][3200/3239]	Time 0.236 (0.534)	Data Time 0.000 (0.015)	Loss 2.3902 (2.4491)	Entropy 0.58221 (0.57793)	Top-1 acc 67.578 (64.972)	Top-5 acc 82.422 (84.637)	lr 0.00464
Train [86][3210/3239]	Time 0.243 (0.533)	Data Time 0.000 (0.015)	Loss 2.3280 (2.4490)	Entropy 0.58278 (0.57795)	Top-1 acc 68.359 (64.975)	Top-5 acc 86.719 (84.639)	lr 0.00464
Train [86][3220/3239]	Time 0.239 (0.533)	Data Time 0.000 (0.015)	Loss 2.5005 (2.4492)	Entropy 0.58297 (0.57796)	Top-1 acc 66.016 (64.970)	Top-5 acc 84.375 (84.635)	lr 0.00464
Train [86][3230/3239]	Time 0.236 (0.532)	Data Time 0.000 (0.015)	Loss 2.4662 (2.4492)	Entropy 0.58320 (0.57798)	Top-1 acc 66.406 (64.972)	Top-5 acc 82.422 (84.635)	lr 0.00463
Train [86][3239/3239]	Time 0.962 (0.532)	Data Time 0.000 (0.015)	Loss 2.7069 (2.4493)	Entropy 0.58316 (0.57799)	Top-1 acc 60.494 (64.969)	Top-5 acc 83.951 (84.632)	lr 0.00463
==========Valid [86/120]	loss 1.252	top-1 acc 71.264 (71.264)	top-5 acc 89.602	Train top-1 64.969	top-5 84.632	Entropy 0.58316	Latency-None: 0.000ms	Flops: 539.00M
Train [87][0/3239]	Time 38.280 (38.280)	Data Time 37.158 (37.158)	Loss 2.4154 (2.4154)	Entropy 0.58321 (0.58321)	Top-1 acc 64.062 (64.062)	Top-5 acc 82.812 (82.812)	lr 0.00463
Train [87][10/3239]	Time 0.380 (4.179)	Data Time 0.001 (3.510)	Loss 2.5142 (2.4236)	Entropy 0.58338 (0.58327)	Top-1 acc 64.062 (64.986)	Top-5 acc 83.203 (84.624)	lr 0.00463
Train [87][20/3239]	Time 0.269 (2.393)	Data Time 0.004 (1.839)	Loss 2.3457 (2.4288)	Entropy 0.58325 (0.58329)	Top-1 acc 69.141 (65.179)	Top-5 acc 86.719 (84.952)	lr 0.00463
Train [87][30/3239]	Time 0.244 (1.767)	Data Time 0.001 (1.247)	Loss 2.5679 (2.4501)	Entropy 0.58291 (0.58322)	Top-1 acc 62.891 (64.970)	Top-5 acc 82.031 (84.589)	lr 0.00463
Train [87][40/3239]	Time 0.250 (1.447)	Data Time 0.001 (0.943)	Loss 2.5304 (2.4680)	Entropy 0.58329 (0.58315)	Top-1 acc 62.500 (64.577)	Top-5 acc 82.031 (84.261)	lr 0.00463
Train [87][50/3239]	Time 0.242 (1.248)	Data Time 0.001 (0.758)	Loss 2.3593 (2.4553)	Entropy 0.58309 (0.58318)	Top-1 acc 68.359 (64.874)	Top-5 acc 89.062 (84.651)	lr 0.00463
Train [87][60/3239]	Time 0.236 (1.114)	Data Time 0.001 (0.634)	Loss 2.5523 (2.4478)	Entropy 0.58313 (0.58318)	Top-1 acc 60.547 (64.978)	Top-5 acc 82.812 (84.810)	lr 0.00463
Train [87][70/3239]	Time 0.236 (1.015)	Data Time 0.001 (0.545)	Loss 2.4436 (2.4447)	Entropy 0.58334 (0.58318)	Top-1 acc 64.844 (65.075)	Top-5 acc 83.984 (84.832)	lr 0.00463
Train [87][80/3239]	Time 0.334 (0.943)	Data Time 0.002 (0.478)	Loss 2.5065 (2.4415)	Entropy 0.58343 (0.58320)	Top-1 acc 62.109 (65.167)	Top-5 acc 85.547 (84.934)	lr 0.00463
Train [87][90/3239]	Time 0.237 (0.887)	Data Time 0.001 (0.426)	Loss 2.4859 (2.4372)	Entropy 0.58332 (0.58323)	Top-1 acc 62.500 (65.282)	Top-5 acc 82.031 (85.075)	lr 0.00463
Train [87][100/3239]	Time 0.242 (0.840)	Data Time 0.001 (0.384)	Loss 2.7100 (2.4321)	Entropy 0.58320 (0.58322)	Top-1 acc 61.328 (65.509)	Top-5 acc 77.734 (85.164)	lr 0.00463
Train [87][110/3239]	Time 0.244 (0.806)	Data Time 0.002 (0.349)	Loss 2.6115 (2.4278)	Entropy 0.58302 (0.58322)	Top-1 acc 62.109 (65.657)	Top-5 acc 82.422 (85.244)	lr 0.00462
Train [87][120/3239]	Time 0.243 (0.783)	Data Time 0.001 (0.321)	Loss 2.4145 (2.4307)	Entropy 0.58283 (0.58321)	Top-1 acc 66.406 (65.544)	Top-5 acc 84.375 (85.127)	lr 0.00462
Train [87][130/3239]	Time 0.228 (0.756)	Data Time 0.001 (0.296)	Loss 2.1735 (2.4345)	Entropy 0.58301 (0.58319)	Top-1 acc 72.656 (65.437)	Top-5 acc 89.453 (85.046)	lr 0.00462
Train [87][140/3239]	Time 0.236 (0.732)	Data Time 0.001 (0.275)	Loss 2.3811 (2.4313)	Entropy 0.58306 (0.58318)	Top-1 acc 65.234 (65.464)	Top-5 acc 84.766 (85.040)	lr 0.00462
Train [87][150/3239]	Time 0.233 (0.711)	Data Time 0.001 (0.257)	Loss 2.5192 (2.4316)	Entropy 0.58278 (0.58316)	Top-1 acc 64.453 (65.444)	Top-5 acc 82.812 (85.006)	lr 0.00462
Train [87][160/3239]	Time 0.231 (0.692)	Data Time 0.001 (0.241)	Loss 2.4185 (2.4321)	Entropy 0.58295 (0.58314)	Top-1 acc 69.531 (65.455)	Top-5 acc 84.766 (85.011)	lr 0.00462
Train [87][170/3239]	Time 0.321 (0.676)	Data Time 0.001 (0.227)	Loss 2.4773 (2.4325)	Entropy 0.58309 (0.58313)	Top-1 acc 64.062 (65.417)	Top-5 acc 87.500 (85.072)	lr 0.00462
Train [87][180/3239]	Time 0.235 (0.661)	Data Time 0.001 (0.215)	Loss 2.3266 (2.4321)	Entropy 0.58331 (0.58313)	Top-1 acc 67.578 (65.455)	Top-5 acc 87.109 (85.038)	lr 0.00462
Train [87][190/3239]	Time 0.236 (0.651)	Data Time 0.001 (0.204)	Loss 2.3140 (2.4320)	Entropy 0.58329 (0.58314)	Top-1 acc 67.188 (65.412)	Top-5 acc 89.062 (85.085)	lr 0.00462
Train [87][200/3239]	Time 0.231 (0.640)	Data Time 0.001 (0.194)	Loss 2.2656 (2.4288)	Entropy 0.58309 (0.58314)	Top-1 acc 71.094 (65.495)	Top-5 acc 86.328 (85.121)	lr 0.00462
Train [87][210/3239]	Time 0.235 (0.629)	Data Time 0.001 (0.184)	Loss 2.6050 (2.4302)	Entropy 0.58325 (0.58314)	Top-1 acc 60.547 (65.482)	Top-5 acc 80.859 (85.110)	lr 0.00462
Train [87][220/3239]	Time 0.236 (0.620)	Data Time 0.001 (0.176)	Loss 2.3881 (2.4320)	Entropy 0.58343 (0.58315)	Top-1 acc 64.453 (65.469)	Top-5 acc 86.328 (85.093)	lr 0.00462
Train [87][230/3239]	Time 0.232 (0.611)	Data Time 0.001 (0.169)	Loss 2.3799 (2.4287)	Entropy 0.58374 (0.58317)	Top-1 acc 63.281 (65.510)	Top-5 acc 87.109 (85.134)	lr 0.00462
Train [87][240/3239]	Time 0.333 (0.603)	Data Time 0.001 (0.162)	Loss 2.3664 (2.4291)	Entropy 0.58407 (0.58320)	Top-1 acc 67.188 (65.461)	Top-5 acc 85.547 (85.132)	lr 0.00461
Train [87][250/3239]	Time 0.227 (0.595)	Data Time 0.001 (0.155)	Loss 2.3284 (2.4280)	Entropy 0.58452 (0.58324)	Top-1 acc 69.531 (65.504)	Top-5 acc 86.719 (85.127)	lr 0.00461
Train [87][260/3239]	Time 0.227 (0.588)	Data Time 0.002 (0.150)	Loss 2.4123 (2.4294)	Entropy 0.58470 (0.58330)	Top-1 acc 63.672 (65.466)	Top-5 acc 83.984 (85.077)	lr 0.00461
Train [87][270/3239]	Time 0.215 (0.582)	Data Time 0.001 (0.144)	Loss 2.2406 (2.4310)	Entropy 0.58460 (0.58334)	Top-1 acc 73.047 (65.416)	Top-5 acc 87.109 (85.044)	lr 0.00461
Train [87][280/3239]	Time 0.236 (0.576)	Data Time 0.001 (0.139)	Loss 2.3407 (2.4307)	Entropy 0.58432 (0.58339)	Top-1 acc 64.844 (65.415)	Top-5 acc 85.156 (85.021)	lr 0.00461
Train [87][290/3239]	Time 0.226 (0.571)	Data Time 0.001 (0.134)	Loss 2.2753 (2.4311)	Entropy 0.58440 (0.58342)	Top-1 acc 67.969 (65.383)	Top-5 acc 88.281 (85.026)	lr 0.00461
Train [87][300/3239]	Time 0.233 (0.566)	Data Time 0.001 (0.130)	Loss 2.4745 (2.4327)	Entropy 0.58440 (0.58345)	Top-1 acc 63.281 (65.349)	Top-5 acc 85.547 (85.006)	lr 0.00461
Train [87][310/3239]	Time 0.234 (0.561)	Data Time 0.001 (0.126)	Loss 2.3560 (2.4318)	Entropy 0.58435 (0.58347)	Top-1 acc 67.578 (65.408)	Top-5 acc 86.328 (85.051)	lr 0.00461
Train [87][320/3239]	Time 0.223 (0.556)	Data Time 0.001 (0.122)	Loss 2.3202 (2.4307)	Entropy 0.58402 (0.58350)	Top-1 acc 69.531 (65.432)	Top-5 acc 87.109 (85.059)	lr 0.00461
Train [87][330/3239]	Time 0.250 (0.552)	Data Time 0.001 (0.118)	Loss 2.4898 (2.4311)	Entropy 0.58404 (0.58351)	Top-1 acc 65.234 (65.426)	Top-5 acc 82.422 (85.054)	lr 0.00461
Train [87][340/3239]	Time 0.231 (0.548)	Data Time 0.001 (0.115)	Loss 2.4512 (2.4328)	Entropy 0.58390 (0.58353)	Top-1 acc 67.188 (65.379)	Top-5 acc 83.203 (85.018)	lr 0.00461
Train [87][350/3239]	Time 0.244 (0.544)	Data Time 0.001 (0.112)	Loss 2.6129 (2.4351)	Entropy 0.58370 (0.58354)	Top-1 acc 62.500 (65.337)	Top-5 acc 80.078 (84.949)	lr 0.00461
Train [87][360/3239]	Time 0.413 (0.687)	Data Time 0.032 (0.109)	Loss 2.5703 (2.4342)	Entropy 0.58383 (0.58354)	Top-1 acc 63.672 (65.361)	Top-5 acc 82.422 (84.958)	lr 0.00461
Train [87][370/3239]	Time 0.243 (0.683)	Data Time 0.002 (0.106)	Loss 2.2477 (2.4329)	Entropy 0.58386 (0.58355)	Top-1 acc 69.531 (65.408)	Top-5 acc 87.500 (84.980)	lr 0.00460
Train [87][380/3239]	Time 0.237 (0.676)	Data Time 0.001 (0.103)	Loss 2.3190 (2.4324)	Entropy 0.58408 (0.58356)	Top-1 acc 67.969 (65.412)	Top-5 acc 85.938 (84.987)	lr 0.00460
Train [87][390/3239]	Time 0.236 (0.670)	Data Time 0.001 (0.100)	Loss 2.5428 (2.4319)	Entropy 0.58393 (0.58357)	Top-1 acc 60.547 (65.412)	Top-5 acc 84.766 (85.008)	lr 0.00460
Train [87][400/3239]	Time 0.342 (0.664)	Data Time 0.001 (0.098)	Loss 2.4297 (2.4323)	Entropy 0.58408 (0.58358)	Top-1 acc 66.406 (65.373)	Top-5 acc 83.984 (85.003)	lr 0.00460
Train [87][410/3239]	Time 0.241 (0.658)	Data Time 0.001 (0.096)	Loss 2.2987 (2.4323)	Entropy 0.58388 (0.58359)	Top-1 acc 66.016 (65.352)	Top-5 acc 86.719 (85.006)	lr 0.00460
Train [87][420/3239]	Time 0.248 (0.653)	Data Time 0.002 (0.093)	Loss 2.4830 (2.4328)	Entropy 0.58380 (0.58360)	Top-1 acc 64.844 (65.331)	Top-5 acc 83.203 (84.983)	lr 0.00460
Train [87][430/3239]	Time 0.238 (0.649)	Data Time 0.001 (0.091)	Loss 2.3243 (2.4320)	Entropy 0.58384 (0.58360)	Top-1 acc 65.625 (65.357)	Top-5 acc 86.328 (84.993)	lr 0.00460
Train [87][440/3239]	Time 0.233 (0.644)	Data Time 0.001 (0.089)	Loss 2.4450 (2.4325)	Entropy 0.58373 (0.58361)	Top-1 acc 64.453 (65.344)	Top-5 acc 85.547 (84.975)	lr 0.00460
Train [87][450/3239]	Time 0.234 (0.639)	Data Time 0.001 (0.087)	Loss 2.5599 (2.4344)	Entropy 0.58386 (0.58361)	Top-1 acc 59.766 (65.305)	Top-5 acc 85.156 (84.952)	lr 0.00460
Train [87][460/3239]	Time 0.245 (0.634)	Data Time 0.001 (0.085)	Loss 2.2510 (2.4330)	Entropy 0.58371 (0.58362)	Top-1 acc 69.922 (65.346)	Top-5 acc 88.281 (84.978)	lr 0.00460
Train [87][470/3239]	Time 0.232 (0.630)	Data Time 0.001 (0.084)	Loss 2.5495 (2.4331)	Entropy 0.58363 (0.58362)	Top-1 acc 63.281 (65.354)	Top-5 acc 81.641 (84.962)	lr 0.00460
Train [87][480/3239]	Time 0.232 (0.626)	Data Time 0.001 (0.082)	Loss 2.3045 (2.4335)	Entropy 0.58339 (0.58362)	Top-1 acc 69.531 (65.334)	Top-5 acc 87.891 (84.960)	lr 0.00460
Train [87][490/3239]	Time 0.247 (0.622)	Data Time 0.001 (0.080)	Loss 2.4383 (2.4351)	Entropy 0.58328 (0.58361)	Top-1 acc 68.750 (65.303)	Top-5 acc 84.766 (84.926)	lr 0.00460
Train [87][500/3239]	Time 0.226 (0.618)	Data Time 0.001 (0.079)	Loss 2.7819 (2.4355)	Entropy 0.58315 (0.58360)	Top-1 acc 59.766 (65.277)	Top-5 acc 80.469 (84.910)	lr 0.00459
Train [87][510/3239]	Time 0.238 (0.614)	Data Time 0.001 (0.077)	Loss 2.3291 (2.4359)	Entropy 0.58344 (0.58360)	Top-1 acc 69.531 (65.279)	Top-5 acc 86.719 (84.892)	lr 0.00459
Train [87][520/3239]	Time 0.261 (0.611)	Data Time 0.001 (0.076)	Loss 2.3645 (2.4361)	Entropy 0.58361 (0.58359)	Top-1 acc 66.016 (65.265)	Top-5 acc 85.156 (84.883)	lr 0.00459
Train [87][530/3239]	Time 0.234 (0.607)	Data Time 0.001 (0.074)	Loss 2.3862 (2.4354)	Entropy 0.58305 (0.58359)	Top-1 acc 68.359 (65.283)	Top-5 acc 85.547 (84.898)	lr 0.00459
Train [87][540/3239]	Time 0.238 (0.604)	Data Time 0.001 (0.073)	Loss 2.4937 (2.4352)	Entropy 0.58295 (0.58358)	Top-1 acc 62.109 (65.301)	Top-5 acc 83.203 (84.904)	lr 0.00459
Train [87][550/3239]	Time 0.237 (0.601)	Data Time 0.001 (0.072)	Loss 2.2970 (2.4354)	Entropy 0.58289 (0.58357)	Top-1 acc 69.531 (65.297)	Top-5 acc 86.328 (84.889)	lr 0.00459
Train [87][560/3239]	Time 0.327 (0.598)	Data Time 0.001 (0.070)	Loss 2.4243 (2.4360)	Entropy 0.58311 (0.58356)	Top-1 acc 67.578 (65.282)	Top-5 acc 85.156 (84.891)	lr 0.00459
Train [87][570/3239]	Time 0.238 (0.595)	Data Time 0.001 (0.069)	Loss 2.4093 (2.4365)	Entropy 0.58302 (0.58355)	Top-1 acc 66.797 (65.290)	Top-5 acc 84.766 (84.884)	lr 0.00459
Train [87][580/3239]	Time 0.232 (0.592)	Data Time 0.001 (0.068)	Loss 2.3394 (2.4361)	Entropy 0.58308 (0.58354)	Top-1 acc 67.969 (65.296)	Top-5 acc 86.719 (84.892)	lr 0.00459
Train [87][590/3239]	Time 0.222 (0.589)	Data Time 0.001 (0.067)	Loss 2.5811 (2.4368)	Entropy 0.58276 (0.58353)	Top-1 acc 64.062 (65.268)	Top-5 acc 82.812 (84.898)	lr 0.00459
Train [87][600/3239]	Time 0.267 (0.587)	Data Time 0.002 (0.066)	Loss 2.3375 (2.4359)	Entropy 0.58289 (0.58352)	Top-1 acc 68.750 (65.283)	Top-5 acc 86.328 (84.908)	lr 0.00459
Train [87][610/3239]	Time 0.238 (0.585)	Data Time 0.002 (0.065)	Loss 2.4007 (2.4351)	Entropy 0.58307 (0.58351)	Top-1 acc 66.016 (65.296)	Top-5 acc 84.766 (84.925)	lr 0.00459
Train [87][620/3239]	Time 0.245 (0.582)	Data Time 0.001 (0.064)	Loss 2.4745 (2.4359)	Entropy 0.58273 (0.58350)	Top-1 acc 64.844 (65.277)	Top-5 acc 85.938 (84.917)	lr 0.00458
Train [87][630/3239]	Time 0.349 (0.580)	Data Time 0.001 (0.063)	Loss 2.4527 (2.4357)	Entropy 0.58270 (0.58349)	Top-1 acc 66.016 (65.294)	Top-5 acc 84.375 (84.907)	lr 0.00458
Train [87][640/3239]	Time 0.268 (0.578)	Data Time 0.002 (0.062)	Loss 2.5162 (2.4354)	Entropy 0.58280 (0.58348)	Top-1 acc 64.062 (65.302)	Top-5 acc 83.594 (84.922)	lr 0.00458
Train [87][650/3239]	Time 0.233 (0.576)	Data Time 0.001 (0.061)	Loss 2.5307 (2.4363)	Entropy 0.58301 (0.58347)	Top-1 acc 62.891 (65.290)	Top-5 acc 82.812 (84.913)	lr 0.00458
Train [87][660/3239]	Time 0.261 (0.574)	Data Time 0.001 (0.060)	Loss 2.3770 (2.4378)	Entropy 0.58319 (0.58346)	Top-1 acc 64.844 (65.260)	Top-5 acc 86.719 (84.884)	lr 0.00458
Train [87][670/3239]	Time 0.248 (0.572)	Data Time 0.001 (0.059)	Loss 2.2635 (2.4373)	Entropy 0.58332 (0.58346)	Top-1 acc 70.703 (65.286)	Top-5 acc 87.891 (84.891)	lr 0.00458
Train [87][680/3239]	Time 0.241 (0.570)	Data Time 0.001 (0.058)	Loss 2.4460 (2.4374)	Entropy 0.58343 (0.58346)	Top-1 acc 65.625 (65.280)	Top-5 acc 82.812 (84.878)	lr 0.00458
Train [87][690/3239]	Time 0.274 (0.568)	Data Time 0.001 (0.058)	Loss 2.5317 (2.4377)	Entropy 0.58329 (0.58346)	Top-1 acc 61.719 (65.261)	Top-5 acc 83.594 (84.865)	lr 0.00458
Train [87][700/3239]	Time 0.236 (0.566)	Data Time 0.001 (0.057)	Loss 2.3697 (2.4372)	Entropy 0.58339 (0.58345)	Top-1 acc 66.016 (65.261)	Top-5 acc 85.156 (84.871)	lr 0.00458
Train [87][710/3239]	Time 0.224 (0.564)	Data Time 0.001 (0.056)	Loss 2.4006 (2.4373)	Entropy 0.58351 (0.58345)	Top-1 acc 67.188 (65.265)	Top-5 acc 87.109 (84.865)	lr 0.00458
Train [87][720/3239]	Time 0.323 (0.563)	Data Time 0.001 (0.055)	Loss 2.4192 (2.4380)	Entropy 0.58381 (0.58346)	Top-1 acc 64.844 (65.249)	Top-5 acc 84.375 (84.863)	lr 0.00458
Train [87][730/3239]	Time 0.233 (0.561)	Data Time 0.001 (0.055)	Loss 2.4466 (2.4369)	Entropy 0.58345 (0.58346)	Top-1 acc 65.625 (65.283)	Top-5 acc 84.766 (84.887)	lr 0.00458
Train [87][740/3239]	Time 0.236 (0.559)	Data Time 0.001 (0.054)	Loss 2.4723 (2.4378)	Entropy 0.58366 (0.58346)	Top-1 acc 65.625 (65.264)	Top-5 acc 81.250 (84.866)	lr 0.00458
Train [87][750/3239]	Time 0.230 (0.557)	Data Time 0.001 (0.053)	Loss 2.2757 (2.4374)	Entropy 0.58378 (0.58346)	Top-1 acc 69.141 (65.281)	Top-5 acc 88.281 (84.871)	lr 0.00457
Train [87][760/3239]	Time 0.236 (0.555)	Data Time 0.001 (0.052)	Loss 2.5063 (2.4379)	Entropy 0.58368 (0.58347)	Top-1 acc 65.234 (65.273)	Top-5 acc 82.812 (84.858)	lr 0.00457
Train [87][770/3239]	Time 0.217 (0.554)	Data Time 0.001 (0.052)	Loss 2.4684 (2.4374)	Entropy 0.58393 (0.58347)	Top-1 acc 62.109 (65.286)	Top-5 acc 83.984 (84.856)	lr 0.00457
Train [87][780/3239]	Time 0.242 (0.552)	Data Time 0.001 (0.051)	Loss 2.3070 (2.4371)	Entropy 0.58424 (0.58348)	Top-1 acc 71.094 (65.287)	Top-5 acc 87.891 (84.860)	lr 0.00457
Train [87][790/3239]	Time 0.356 (0.551)	Data Time 0.001 (0.050)	Loss 2.3677 (2.4367)	Entropy 0.58416 (0.58349)	Top-1 acc 65.625 (65.303)	Top-5 acc 86.719 (84.873)	lr 0.00457
Train [87][800/3239]	Time 0.238 (0.549)	Data Time 0.001 (0.050)	Loss 2.5195 (2.4377)	Entropy 0.58412 (0.58350)	Top-1 acc 63.672 (65.282)	Top-5 acc 82.422 (84.855)	lr 0.00457
Train [87][810/3239]	Time 0.316 (0.548)	Data Time 0.002 (0.049)	Loss 2.4143 (2.4373)	Entropy 0.58392 (0.58350)	Top-1 acc 68.750 (65.289)	Top-5 acc 83.984 (84.855)	lr 0.00457
Train [87][820/3239]	Time 0.242 (0.548)	Data Time 0.001 (0.049)	Loss 2.5111 (2.4378)	Entropy 0.58350 (0.58351)	Top-1 acc 62.109 (65.276)	Top-5 acc 81.250 (84.842)	lr 0.00457
Train [87][830/3239]	Time 0.230 (0.547)	Data Time 0.001 (0.048)	Loss 2.6072 (2.4389)	Entropy 0.58365 (0.58351)	Top-1 acc 57.422 (65.250)	Top-5 acc 82.031 (84.822)	lr 0.00457
Train [87][840/3239]	Time 0.261 (0.546)	Data Time 0.001 (0.048)	Loss 2.3580 (2.4389)	Entropy 0.58375 (0.58351)	Top-1 acc 67.969 (65.236)	Top-5 acc 87.109 (84.815)	lr 0.00457
Train [87][850/3239]	Time 0.227 (0.545)	Data Time 0.001 (0.047)	Loss 2.4621 (2.4386)	Entropy 0.58373 (0.58351)	Top-1 acc 62.500 (65.244)	Top-5 acc 85.156 (84.826)	lr 0.00457
Train [87][860/3239]	Time 0.233 (0.543)	Data Time 0.001 (0.047)	Loss 2.6513 (2.4388)	Entropy 0.58342 (0.58352)	Top-1 acc 59.375 (65.238)	Top-5 acc 83.203 (84.823)	lr 0.00457
Train [87][870/3239]	Time 0.238 (0.542)	Data Time 0.001 (0.046)	Loss 2.4679 (2.4392)	Entropy 0.58368 (0.58351)	Top-1 acc 66.797 (65.228)	Top-5 acc 86.719 (84.824)	lr 0.00457
Train [87][880/3239]	Time 0.271 (0.541)	Data Time 0.001 (0.046)	Loss 2.2463 (2.4388)	Entropy 0.58333 (0.58352)	Top-1 acc 69.141 (65.246)	Top-5 acc 86.328 (84.826)	lr 0.00456
Train [87][890/3239]	Time 0.246 (0.540)	Data Time 0.001 (0.045)	Loss 2.4420 (2.4392)	Entropy 0.58282 (0.58351)	Top-1 acc 67.188 (65.241)	Top-5 acc 85.156 (84.818)	lr 0.00456
Train [87][900/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.045)	Loss 2.4008 (2.4401)	Entropy 0.58294 (0.58350)	Top-1 acc 67.578 (65.221)	Top-5 acc 84.766 (84.792)	lr 0.00456
Train [87][910/3239]	Time 0.233 (0.537)	Data Time 0.001 (0.044)	Loss 2.5102 (2.4399)	Entropy 0.58305 (0.58350)	Top-1 acc 64.453 (65.223)	Top-5 acc 82.812 (84.795)	lr 0.00456
Train [87][920/3239]	Time 0.251 (0.536)	Data Time 0.001 (0.044)	Loss 2.2775 (2.4399)	Entropy 0.58322 (0.58349)	Top-1 acc 68.750 (65.217)	Top-5 acc 88.672 (84.797)	lr 0.00456
Train [87][930/3239]	Time 0.235 (0.535)	Data Time 0.001 (0.043)	Loss 2.7520 (2.4402)	Entropy 0.58337 (0.58349)	Top-1 acc 57.422 (65.209)	Top-5 acc 78.125 (84.790)	lr 0.00456
Train [87][940/3239]	Time 0.225 (0.534)	Data Time 0.001 (0.043)	Loss 2.5828 (2.4412)	Entropy 0.58371 (0.58349)	Top-1 acc 61.719 (65.192)	Top-5 acc 79.297 (84.765)	lr 0.00456
Train [87][950/3239]	Time 0.329 (0.533)	Data Time 0.001 (0.042)	Loss 2.4090 (2.4410)	Entropy 0.58381 (0.58349)	Top-1 acc 63.672 (65.199)	Top-5 acc 84.375 (84.770)	lr 0.00456
Train [87][960/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.042)	Loss 2.3192 (2.4404)	Entropy 0.58362 (0.58350)	Top-1 acc 69.922 (65.215)	Top-5 acc 88.281 (84.790)	lr 0.00456
Train [87][970/3239]	Time 0.237 (0.530)	Data Time 0.001 (0.041)	Loss 2.3648 (2.4401)	Entropy 0.58388 (0.58350)	Top-1 acc 68.750 (65.219)	Top-5 acc 85.156 (84.792)	lr 0.00456
Train [87][980/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.041)	Loss 2.3515 (2.4393)	Entropy 0.58365 (0.58350)	Top-1 acc 70.312 (65.241)	Top-5 acc 86.719 (84.804)	lr 0.00456
Train [87][990/3239]	Time 0.221 (0.528)	Data Time 0.001 (0.041)	Loss 2.5799 (2.4397)	Entropy 0.58356 (0.58350)	Top-1 acc 62.500 (65.234)	Top-5 acc 82.031 (84.802)	lr 0.00456
Train [87][1000/3239]	Time 0.235 (0.527)	Data Time 0.001 (0.040)	Loss 2.2718 (2.4398)	Entropy 0.58360 (0.58350)	Top-1 acc 68.750 (65.226)	Top-5 acc 89.844 (84.796)	lr 0.00456
Train [87][1010/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.040)	Loss 2.7911 (2.4405)	Entropy 0.58384 (0.58350)	Top-1 acc 56.250 (65.199)	Top-5 acc 78.125 (84.790)	lr 0.00455
Train [87][1020/3239]	Time 0.285 (0.578)	Data Time 0.002 (0.040)	Loss 2.4168 (2.4405)	Entropy 0.58380 (0.58351)	Top-1 acc 66.797 (65.194)	Top-5 acc 85.156 (84.789)	lr 0.00455
Train [87][1030/3239]	Time 0.243 (0.576)	Data Time 0.002 (0.039)	Loss 2.3854 (2.4411)	Entropy 0.58425 (0.58351)	Top-1 acc 66.016 (65.182)	Top-5 acc 84.766 (84.779)	lr 0.00455
Train [87][1040/3239]	Time 0.353 (0.575)	Data Time 0.001 (0.039)	Loss 2.4346 (2.4409)	Entropy 0.58422 (0.58352)	Top-1 acc 66.797 (65.189)	Top-5 acc 85.938 (84.787)	lr 0.00455
Train [87][1050/3239]	Time 0.236 (0.574)	Data Time 0.001 (0.038)	Loss 2.3627 (2.4409)	Entropy 0.58445 (0.58352)	Top-1 acc 64.453 (65.193)	Top-5 acc 85.938 (84.792)	lr 0.00455
Train [87][1060/3239]	Time 0.237 (0.573)	Data Time 0.001 (0.038)	Loss 2.3606 (2.4410)	Entropy 0.58447 (0.58353)	Top-1 acc 64.453 (65.198)	Top-5 acc 84.766 (84.787)	lr 0.00455
Train [87][1070/3239]	Time 0.244 (0.571)	Data Time 0.002 (0.038)	Loss 2.6007 (2.4408)	Entropy 0.58461 (0.58354)	Top-1 acc 60.938 (65.205)	Top-5 acc 82.422 (84.790)	lr 0.00455
Train [87][1080/3239]	Time 0.234 (0.570)	Data Time 0.001 (0.037)	Loss 2.3986 (2.4413)	Entropy 0.58501 (0.58355)	Top-1 acc 67.578 (65.195)	Top-5 acc 83.594 (84.780)	lr 0.00455
Train [87][1090/3239]	Time 0.228 (0.569)	Data Time 0.001 (0.037)	Loss 2.5704 (2.4416)	Entropy 0.58492 (0.58357)	Top-1 acc 61.328 (65.182)	Top-5 acc 83.203 (84.774)	lr 0.00455
Train [87][1100/3239]	Time 0.239 (0.568)	Data Time 0.001 (0.037)	Loss 2.4612 (2.4420)	Entropy 0.58523 (0.58358)	Top-1 acc 62.891 (65.179)	Top-5 acc 83.203 (84.767)	lr 0.00455
Train [87][1110/3239]	Time 0.340 (0.566)	Data Time 0.001 (0.036)	Loss 2.3671 (2.4422)	Entropy 0.58520 (0.58360)	Top-1 acc 68.750 (65.165)	Top-5 acc 86.328 (84.771)	lr 0.00455
Train [87][1120/3239]	Time 0.231 (0.565)	Data Time 0.001 (0.036)	Loss 2.3771 (2.4416)	Entropy 0.58553 (0.58361)	Top-1 acc 63.281 (65.175)	Top-5 acc 87.109 (84.787)	lr 0.00455
Train [87][1130/3239]	Time 0.234 (0.564)	Data Time 0.001 (0.036)	Loss 2.3580 (2.4414)	Entropy 0.58536 (0.58363)	Top-1 acc 68.750 (65.182)	Top-5 acc 87.109 (84.793)	lr 0.00455
Train [87][1140/3239]	Time 0.238 (0.563)	Data Time 0.001 (0.036)	Loss 2.5139 (2.4415)	Entropy 0.58539 (0.58364)	Top-1 acc 64.453 (65.172)	Top-5 acc 82.422 (84.788)	lr 0.00454
Train [87][1150/3239]	Time 0.235 (0.562)	Data Time 0.001 (0.035)	Loss 2.4973 (2.4413)	Entropy 0.58546 (0.58366)	Top-1 acc 66.016 (65.185)	Top-5 acc 83.984 (84.795)	lr 0.00454
Train [87][1160/3239]	Time 0.242 (0.561)	Data Time 0.002 (0.035)	Loss 2.3751 (2.4413)	Entropy 0.58540 (0.58368)	Top-1 acc 64.844 (65.189)	Top-5 acc 87.109 (84.789)	lr 0.00454
Train [87][1170/3239]	Time 0.238 (0.560)	Data Time 0.001 (0.035)	Loss 2.8132 (2.4419)	Entropy 0.58534 (0.58369)	Top-1 acc 53.906 (65.170)	Top-5 acc 80.078 (84.778)	lr 0.00454
Train [87][1180/3239]	Time 0.239 (0.559)	Data Time 0.001 (0.034)	Loss 2.4226 (2.4419)	Entropy 0.58530 (0.58370)	Top-1 acc 66.016 (65.163)	Top-5 acc 83.984 (84.774)	lr 0.00454
Train [87][1190/3239]	Time 0.235 (0.558)	Data Time 0.001 (0.034)	Loss 2.3595 (2.4417)	Entropy 0.58497 (0.58372)	Top-1 acc 67.578 (65.172)	Top-5 acc 86.328 (84.773)	lr 0.00454
Train [87][1200/3239]	Time 0.224 (0.557)	Data Time 0.001 (0.034)	Loss 2.2769 (2.4413)	Entropy 0.58508 (0.58373)	Top-1 acc 67.578 (65.177)	Top-5 acc 87.109 (84.783)	lr 0.00454
Train [87][1210/3239]	Time 0.244 (0.556)	Data Time 0.002 (0.034)	Loss 2.4945 (2.4408)	Entropy 0.58495 (0.58374)	Top-1 acc 66.797 (65.187)	Top-5 acc 83.984 (84.793)	lr 0.00454
Train [87][1220/3239]	Time 0.249 (0.555)	Data Time 0.001 (0.033)	Loss 2.2936 (2.4414)	Entropy 0.58508 (0.58375)	Top-1 acc 68.750 (65.173)	Top-5 acc 88.281 (84.778)	lr 0.00454
Train [87][1230/3239]	Time 0.237 (0.554)	Data Time 0.001 (0.033)	Loss 2.7005 (2.4415)	Entropy 0.58528 (0.58376)	Top-1 acc 57.422 (65.170)	Top-5 acc 81.250 (84.776)	lr 0.00454
Train [87][1240/3239]	Time 0.240 (0.553)	Data Time 0.001 (0.033)	Loss 2.2680 (2.4414)	Entropy 0.58540 (0.58377)	Top-1 acc 71.094 (65.171)	Top-5 acc 89.062 (84.774)	lr 0.00454
Train [87][1250/3239]	Time 0.247 (0.553)	Data Time 0.002 (0.033)	Loss 2.6114 (2.4413)	Entropy 0.58550 (0.58379)	Top-1 acc 60.938 (65.172)	Top-5 acc 80.469 (84.775)	lr 0.00454
Train [87][1260/3239]	Time 0.232 (0.552)	Data Time 0.001 (0.032)	Loss 2.5461 (2.4412)	Entropy 0.58571 (0.58380)	Top-1 acc 62.891 (65.176)	Top-5 acc 85.938 (84.771)	lr 0.00454
Train [87][1270/3239]	Time 0.366 (0.551)	Data Time 0.001 (0.032)	Loss 2.3164 (2.4414)	Entropy 0.58588 (0.58382)	Top-1 acc 69.922 (65.173)	Top-5 acc 87.109 (84.770)	lr 0.00453
Train [87][1280/3239]	Time 0.252 (0.550)	Data Time 0.001 (0.032)	Loss 2.4479 (2.4416)	Entropy 0.58605 (0.58383)	Top-1 acc 66.016 (65.172)	Top-5 acc 84.766 (84.760)	lr 0.00453
Train [87][1290/3239]	Time 0.243 (0.550)	Data Time 0.002 (0.032)	Loss 2.4145 (2.4414)	Entropy 0.58562 (0.58385)	Top-1 acc 65.625 (65.176)	Top-5 acc 83.984 (84.764)	lr 0.00453
Train [87][1300/3239]	Time 0.269 (0.549)	Data Time 0.001 (0.031)	Loss 2.6280 (2.4416)	Entropy 0.58554 (0.58386)	Top-1 acc 62.891 (65.179)	Top-5 acc 80.469 (84.755)	lr 0.00453
Train [87][1310/3239]	Time 0.238 (0.548)	Data Time 0.002 (0.031)	Loss 2.4597 (2.4413)	Entropy 0.58527 (0.58388)	Top-1 acc 63.281 (65.180)	Top-5 acc 84.766 (84.764)	lr 0.00453
Train [87][1320/3239]	Time 0.231 (0.547)	Data Time 0.001 (0.031)	Loss 2.4784 (2.4411)	Entropy 0.58548 (0.58389)	Top-1 acc 66.797 (65.188)	Top-5 acc 83.984 (84.766)	lr 0.00453
Train [87][1330/3239]	Time 0.241 (0.546)	Data Time 0.001 (0.031)	Loss 2.3806 (2.4406)	Entropy 0.58577 (0.58390)	Top-1 acc 69.531 (65.202)	Top-5 acc 86.719 (84.779)	lr 0.00453
Train [87][1340/3239]	Time 0.343 (0.545)	Data Time 0.001 (0.030)	Loss 2.5103 (2.4408)	Entropy 0.58558 (0.58391)	Top-1 acc 65.234 (65.199)	Top-5 acc 84.375 (84.772)	lr 0.00453
Train [87][1350/3239]	Time 0.294 (0.545)	Data Time 0.003 (0.030)	Loss 2.4253 (2.4410)	Entropy 0.58537 (0.58393)	Top-1 acc 63.672 (65.193)	Top-5 acc 85.547 (84.766)	lr 0.00453
Train [87][1360/3239]	Time 0.246 (0.544)	Data Time 0.001 (0.030)	Loss 2.4918 (2.4412)	Entropy 0.58502 (0.58394)	Top-1 acc 63.672 (65.190)	Top-5 acc 83.984 (84.762)	lr 0.00453
Train [87][1370/3239]	Time 0.261 (0.543)	Data Time 0.002 (0.030)	Loss 2.2993 (2.4413)	Entropy 0.58496 (0.58394)	Top-1 acc 68.750 (65.187)	Top-5 acc 88.672 (84.762)	lr 0.00453
Train [87][1380/3239]	Time 0.236 (0.542)	Data Time 0.001 (0.030)	Loss 2.4972 (2.4417)	Entropy 0.58526 (0.58395)	Top-1 acc 60.156 (65.170)	Top-5 acc 83.203 (84.749)	lr 0.00453
Train [87][1390/3239]	Time 0.239 (0.542)	Data Time 0.001 (0.029)	Loss 2.2990 (2.4416)	Entropy 0.58500 (0.58396)	Top-1 acc 64.062 (65.169)	Top-5 acc 87.500 (84.752)	lr 0.00452
Train [87][1400/3239]	Time 0.263 (0.541)	Data Time 0.001 (0.029)	Loss 2.5633 (2.4424)	Entropy 0.58483 (0.58397)	Top-1 acc 61.328 (65.155)	Top-5 acc 82.812 (84.737)	lr 0.00452
Train [87][1410/3239]	Time 0.264 (0.540)	Data Time 0.001 (0.029)	Loss 2.6949 (2.4423)	Entropy 0.58445 (0.58397)	Top-1 acc 59.375 (65.147)	Top-5 acc 79.688 (84.742)	lr 0.00452
Train [87][1420/3239]	Time 0.233 (0.539)	Data Time 0.001 (0.029)	Loss 2.5191 (2.4424)	Entropy 0.58474 (0.58398)	Top-1 acc 62.500 (65.138)	Top-5 acc 83.203 (84.745)	lr 0.00452
Train [87][1430/3239]	Time 0.362 (0.539)	Data Time 0.001 (0.029)	Loss 2.4130 (2.4428)	Entropy 0.58505 (0.58398)	Top-1 acc 65.234 (65.125)	Top-5 acc 82.422 (84.733)	lr 0.00452
Train [87][1440/3239]	Time 0.228 (0.538)	Data Time 0.002 (0.028)	Loss 2.3287 (2.4429)	Entropy 0.58483 (0.58399)	Top-1 acc 66.016 (65.121)	Top-5 acc 85.938 (84.730)	lr 0.00452
Train [87][1450/3239]	Time 0.235 (0.537)	Data Time 0.001 (0.028)	Loss 2.4551 (2.4430)	Entropy 0.58487 (0.58400)	Top-1 acc 58.594 (65.115)	Top-5 acc 83.984 (84.728)	lr 0.00452
Train [87][1460/3239]	Time 0.232 (0.536)	Data Time 0.001 (0.028)	Loss 2.5361 (2.4432)	Entropy 0.58500 (0.58400)	Top-1 acc 64.844 (65.110)	Top-5 acc 81.641 (84.727)	lr 0.00452
Train [87][1470/3239]	Time 0.263 (0.535)	Data Time 0.001 (0.028)	Loss 2.3198 (2.4432)	Entropy 0.58533 (0.58401)	Top-1 acc 66.016 (65.116)	Top-5 acc 88.281 (84.726)	lr 0.00452
Train [87][1480/3239]	Time 0.236 (0.534)	Data Time 0.001 (0.028)	Loss 2.4438 (2.4433)	Entropy 0.58557 (0.58402)	Top-1 acc 63.281 (65.107)	Top-5 acc 85.156 (84.723)	lr 0.00452
Train [87][1490/3239]	Time 0.235 (0.534)	Data Time 0.001 (0.028)	Loss 2.3852 (2.4436)	Entropy 0.58533 (0.58403)	Top-1 acc 65.234 (65.098)	Top-5 acc 87.891 (84.721)	lr 0.00452
Train [87][1500/3239]	Time 0.364 (0.533)	Data Time 0.001 (0.027)	Loss 2.5858 (2.4439)	Entropy 0.58508 (0.58404)	Top-1 acc 62.500 (65.093)	Top-5 acc 80.859 (84.714)	lr 0.00452
Train [87][1510/3239]	Time 0.224 (0.532)	Data Time 0.001 (0.027)	Loss 2.8799 (2.4442)	Entropy 0.58482 (0.58404)	Top-1 acc 52.734 (65.083)	Top-5 acc 75.000 (84.712)	lr 0.00452
Train [87][1520/3239]	Time 0.243 (0.532)	Data Time 0.001 (0.027)	Loss 2.4030 (2.4444)	Entropy 0.58486 (0.58405)	Top-1 acc 62.891 (65.071)	Top-5 acc 83.984 (84.714)	lr 0.00451
Train [87][1530/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.027)	Loss 2.4835 (2.4446)	Entropy 0.58490 (0.58406)	Top-1 acc 66.016 (65.067)	Top-5 acc 85.156 (84.710)	lr 0.00451
Train [87][1540/3239]	Time 0.267 (0.530)	Data Time 0.001 (0.027)	Loss 2.3653 (2.4449)	Entropy 0.58484 (0.58406)	Top-1 acc 66.016 (65.059)	Top-5 acc 86.719 (84.706)	lr 0.00451
Train [87][1550/3239]	Time 0.310 (0.530)	Data Time 0.001 (0.027)	Loss 2.2742 (2.4447)	Entropy 0.58480 (0.58407)	Top-1 acc 68.359 (65.060)	Top-5 acc 88.672 (84.711)	lr 0.00451
Train [87][1560/3239]	Time 0.240 (0.530)	Data Time 0.002 (0.026)	Loss 2.4519 (2.4448)	Entropy 0.58497 (0.58407)	Top-1 acc 64.453 (65.052)	Top-5 acc 85.156 (84.708)	lr 0.00451
Train [87][1570/3239]	Time 0.254 (0.529)	Data Time 0.001 (0.026)	Loss 2.3248 (2.4447)	Entropy 0.58501 (0.58408)	Top-1 acc 65.234 (65.053)	Top-5 acc 87.500 (84.708)	lr 0.00451
Train [87][1580/3239]	Time 0.276 (0.528)	Data Time 0.001 (0.026)	Loss 2.3353 (2.4446)	Entropy 0.58516 (0.58408)	Top-1 acc 67.578 (65.060)	Top-5 acc 85.547 (84.709)	lr 0.00451
Train [87][1590/3239]	Time 0.288 (0.528)	Data Time 0.001 (0.026)	Loss 2.3996 (2.4448)	Entropy 0.58542 (0.58409)	Top-1 acc 65.234 (65.057)	Top-5 acc 85.938 (84.705)	lr 0.00451
Train [87][1600/3239]	Time 0.263 (0.527)	Data Time 0.001 (0.026)	Loss 2.3547 (2.4450)	Entropy 0.58558 (0.58410)	Top-1 acc 64.453 (65.052)	Top-5 acc 87.109 (84.702)	lr 0.00451
Train [87][1610/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.026)	Loss 2.4551 (2.4450)	Entropy 0.58560 (0.58411)	Top-1 acc 64.062 (65.056)	Top-5 acc 86.719 (84.707)	lr 0.00451
Train [87][1620/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.025)	Loss 2.1799 (2.4447)	Entropy 0.58578 (0.58412)	Top-1 acc 72.266 (65.068)	Top-5 acc 88.672 (84.710)	lr 0.00451
Train [87][1630/3239]	Time 0.271 (0.525)	Data Time 0.002 (0.025)	Loss 2.4645 (2.4447)	Entropy 0.58535 (0.58413)	Top-1 acc 63.672 (65.072)	Top-5 acc 86.719 (84.711)	lr 0.00451
Train [87][1640/3239]	Time 0.231 (0.524)	Data Time 0.002 (0.025)	Loss 2.5216 (2.4449)	Entropy 0.58533 (0.58413)	Top-1 acc 63.672 (65.067)	Top-5 acc 83.984 (84.706)	lr 0.00451
Train [87][1650/3239]	Time 0.241 (0.524)	Data Time 0.002 (0.025)	Loss 2.6283 (2.4447)	Entropy 0.58511 (0.58414)	Top-1 acc 61.719 (65.071)	Top-5 acc 84.766 (84.712)	lr 0.00450
Train [87][1660/3239]	Time 0.355 (0.523)	Data Time 0.002 (0.025)	Loss 2.6261 (2.4447)	Entropy 0.58442 (0.58414)	Top-1 acc 64.844 (65.078)	Top-5 acc 80.469 (84.706)	lr 0.00450
Train [87][1670/3239]	Time 0.323 (0.555)	Data Time 0.005 (0.025)	Loss 2.3383 (2.4448)	Entropy 0.58451 (0.58415)	Top-1 acc 69.141 (65.074)	Top-5 acc 84.766 (84.708)	lr 0.00450
Train [87][1680/3239]	Time 0.231 (0.554)	Data Time 0.002 (0.025)	Loss 2.6879 (2.4449)	Entropy 0.58434 (0.58415)	Top-1 acc 60.938 (65.077)	Top-5 acc 77.344 (84.706)	lr 0.00450
Train [87][1690/3239]	Time 0.278 (0.553)	Data Time 0.003 (0.024)	Loss 2.3781 (2.4448)	Entropy 0.58390 (0.58415)	Top-1 acc 64.453 (65.079)	Top-5 acc 85.547 (84.706)	lr 0.00450
Train [87][1700/3239]	Time 0.275 (0.553)	Data Time 0.002 (0.024)	Loss 2.4918 (2.4448)	Entropy 0.58388 (0.58415)	Top-1 acc 65.234 (65.078)	Top-5 acc 83.203 (84.703)	lr 0.00450
Train [87][1710/3239]	Time 0.264 (0.552)	Data Time 0.003 (0.024)	Loss 2.3456 (2.4446)	Entropy 0.58405 (0.58414)	Top-1 acc 65.625 (65.078)	Top-5 acc 87.500 (84.709)	lr 0.00450
Train [87][1720/3239]	Time 0.266 (0.552)	Data Time 0.001 (0.024)	Loss 2.1751 (2.4445)	Entropy 0.58406 (0.58414)	Top-1 acc 71.484 (65.077)	Top-5 acc 89.453 (84.713)	lr 0.00450
Train [87][1730/3239]	Time 0.245 (0.551)	Data Time 0.001 (0.024)	Loss 2.4438 (2.4444)	Entropy 0.58418 (0.58414)	Top-1 acc 67.578 (65.083)	Top-5 acc 84.375 (84.716)	lr 0.00450
Train [87][1740/3239]	Time 0.280 (0.550)	Data Time 0.001 (0.024)	Loss 2.3763 (2.4444)	Entropy 0.58395 (0.58414)	Top-1 acc 66.406 (65.089)	Top-5 acc 85.547 (84.716)	lr 0.00450
Train [87][1750/3239]	Time 0.517 (0.550)	Data Time 0.018 (0.024)	Loss 2.5479 (2.4446)	Entropy 0.58374 (0.58414)	Top-1 acc 61.719 (65.080)	Top-5 acc 83.203 (84.713)	lr 0.00450
Train [87][1760/3239]	Time 0.227 (0.550)	Data Time 0.001 (0.024)	Loss 2.3406 (2.4446)	Entropy 0.58366 (0.58414)	Top-1 acc 67.969 (65.081)	Top-5 acc 85.156 (84.708)	lr 0.00450
Train [87][1770/3239]	Time 0.240 (0.550)	Data Time 0.001 (0.023)	Loss 2.6541 (2.4448)	Entropy 0.58339 (0.58414)	Top-1 acc 58.594 (65.074)	Top-5 acc 81.250 (84.703)	lr 0.00450
Train [87][1780/3239]	Time 0.235 (0.549)	Data Time 0.001 (0.023)	Loss 2.3786 (2.4448)	Entropy 0.58338 (0.58413)	Top-1 acc 67.188 (65.074)	Top-5 acc 86.719 (84.700)	lr 0.00449
Train [87][1790/3239]	Time 0.236 (0.548)	Data Time 0.001 (0.023)	Loss 2.3683 (2.4449)	Entropy 0.58365 (0.58413)	Top-1 acc 69.531 (65.078)	Top-5 acc 85.156 (84.696)	lr 0.00449
Train [87][1800/3239]	Time 0.246 (0.548)	Data Time 0.001 (0.023)	Loss 2.7673 (2.4453)	Entropy 0.58361 (0.58413)	Top-1 acc 54.297 (65.064)	Top-5 acc 79.688 (84.689)	lr 0.00449
Train [87][1810/3239]	Time 0.282 (0.547)	Data Time 0.001 (0.023)	Loss 2.3600 (2.4454)	Entropy 0.58378 (0.58412)	Top-1 acc 68.359 (65.061)	Top-5 acc 87.500 (84.690)	lr 0.00449
Train [87][1820/3239]	Time 0.433 (0.547)	Data Time 0.001 (0.023)	Loss 2.4169 (2.4452)	Entropy 0.58383 (0.58412)	Top-1 acc 65.625 (65.064)	Top-5 acc 83.984 (84.690)	lr 0.00449
Train [87][1830/3239]	Time 0.235 (0.546)	Data Time 0.001 (0.023)	Loss 2.5159 (2.4450)	Entropy 0.58396 (0.58412)	Top-1 acc 61.719 (65.066)	Top-5 acc 84.766 (84.693)	lr 0.00449
Train [87][1840/3239]	Time 0.265 (0.546)	Data Time 0.001 (0.023)	Loss 2.6130 (2.4455)	Entropy 0.58392 (0.58412)	Top-1 acc 63.672 (65.054)	Top-5 acc 83.984 (84.690)	lr 0.00449
Train [87][1850/3239]	Time 0.236 (0.545)	Data Time 0.001 (0.023)	Loss 2.4582 (2.4458)	Entropy 0.58374 (0.58412)	Top-1 acc 66.797 (65.054)	Top-5 acc 83.984 (84.683)	lr 0.00449
Train [87][1860/3239]	Time 0.240 (0.544)	Data Time 0.002 (0.022)	Loss 2.2261 (2.4457)	Entropy 0.58391 (0.58412)	Top-1 acc 69.531 (65.050)	Top-5 acc 88.281 (84.684)	lr 0.00449
Train [87][1870/3239]	Time 0.226 (0.544)	Data Time 0.001 (0.022)	Loss 2.4479 (2.4454)	Entropy 0.58366 (0.58412)	Top-1 acc 64.844 (65.058)	Top-5 acc 84.375 (84.693)	lr 0.00449
Train [87][1880/3239]	Time 0.276 (0.543)	Data Time 0.001 (0.022)	Loss 2.5006 (2.4452)	Entropy 0.58375 (0.58411)	Top-1 acc 64.062 (65.061)	Top-5 acc 85.547 (84.700)	lr 0.00449
Train [87][1890/3239]	Time 0.340 (0.543)	Data Time 0.002 (0.022)	Loss 2.4133 (2.4450)	Entropy 0.58383 (0.58411)	Top-1 acc 64.062 (65.062)	Top-5 acc 86.328 (84.702)	lr 0.00449
Train [87][1900/3239]	Time 0.255 (0.542)	Data Time 0.001 (0.022)	Loss 2.4458 (2.4451)	Entropy 0.58369 (0.58411)	Top-1 acc 67.969 (65.060)	Top-5 acc 87.109 (84.697)	lr 0.00449
Train [87][1910/3239]	Time 0.241 (0.541)	Data Time 0.001 (0.022)	Loss 2.6121 (2.4450)	Entropy 0.58382 (0.58411)	Top-1 acc 60.156 (65.063)	Top-5 acc 82.031 (84.702)	lr 0.00448
Train [87][1920/3239]	Time 0.237 (0.541)	Data Time 0.001 (0.022)	Loss 2.3036 (2.4448)	Entropy 0.58350 (0.58411)	Top-1 acc 66.406 (65.067)	Top-5 acc 87.891 (84.707)	lr 0.00448
Train [87][1930/3239]	Time 0.273 (0.540)	Data Time 0.001 (0.022)	Loss 2.3990 (2.4446)	Entropy 0.58373 (0.58410)	Top-1 acc 66.406 (65.072)	Top-5 acc 85.156 (84.711)	lr 0.00448
Train [87][1940/3239]	Time 0.259 (0.540)	Data Time 0.002 (0.022)	Loss 2.2921 (2.4443)	Entropy 0.58380 (0.58410)	Top-1 acc 71.094 (65.078)	Top-5 acc 87.891 (84.716)	lr 0.00448
Train [87][1950/3239]	Time 0.280 (0.539)	Data Time 0.043 (0.021)	Loss 2.3574 (2.4442)	Entropy 0.58397 (0.58410)	Top-1 acc 67.969 (65.078)	Top-5 acc 87.109 (84.719)	lr 0.00448
Train [87][1960/3239]	Time 0.222 (0.539)	Data Time 0.002 (0.021)	Loss 2.7757 (2.4442)	Entropy 0.58424 (0.58410)	Top-1 acc 55.859 (65.081)	Top-5 acc 77.734 (84.720)	lr 0.00448
Train [87][1970/3239]	Time 0.249 (0.538)	Data Time 0.001 (0.021)	Loss 2.8421 (2.4443)	Entropy 0.58472 (0.58410)	Top-1 acc 55.469 (65.080)	Top-5 acc 79.297 (84.719)	lr 0.00448
Train [87][1980/3239]	Time 0.337 (0.538)	Data Time 0.001 (0.021)	Loss 2.3827 (2.4443)	Entropy 0.58484 (0.58410)	Top-1 acc 66.016 (65.081)	Top-5 acc 83.594 (84.720)	lr 0.00448
Train [87][1990/3239]	Time 0.258 (0.537)	Data Time 0.001 (0.021)	Loss 2.5475 (2.4445)	Entropy 0.58500 (0.58411)	Top-1 acc 61.719 (65.076)	Top-5 acc 82.422 (84.718)	lr 0.00448
Train [87][2000/3239]	Time 0.280 (0.537)	Data Time 0.001 (0.021)	Loss 2.3171 (2.4446)	Entropy 0.58465 (0.58411)	Top-1 acc 66.797 (65.073)	Top-5 acc 87.500 (84.721)	lr 0.00448
Train [87][2010/3239]	Time 0.245 (0.536)	Data Time 0.002 (0.021)	Loss 2.4007 (2.4446)	Entropy 0.58483 (0.58411)	Top-1 acc 69.141 (65.076)	Top-5 acc 85.547 (84.720)	lr 0.00448
Train [87][2020/3239]	Time 0.235 (0.536)	Data Time 0.002 (0.021)	Loss 2.4509 (2.4441)	Entropy 0.58466 (0.58412)	Top-1 acc 67.578 (65.087)	Top-5 acc 83.984 (84.729)	lr 0.00448
Train [87][2030/3239]	Time 0.261 (0.535)	Data Time 0.028 (0.021)	Loss 2.4146 (2.4440)	Entropy 0.58466 (0.58412)	Top-1 acc 66.406 (65.093)	Top-5 acc 84.375 (84.730)	lr 0.00448
Train [87][2040/3239]	Time 0.241 (0.535)	Data Time 0.001 (0.021)	Loss 2.3349 (2.4444)	Entropy 0.58483 (0.58412)	Top-1 acc 64.453 (65.086)	Top-5 acc 85.547 (84.725)	lr 0.00447
Train [87][2050/3239]	Time 0.331 (0.534)	Data Time 0.001 (0.021)	Loss 2.4980 (2.4442)	Entropy 0.58450 (0.58413)	Top-1 acc 63.672 (65.088)	Top-5 acc 82.812 (84.728)	lr 0.00447
Train [87][2060/3239]	Time 0.293 (0.534)	Data Time 0.001 (0.020)	Loss 2.3298 (2.4443)	Entropy 0.58427 (0.58413)	Top-1 acc 67.969 (65.084)	Top-5 acc 85.547 (84.729)	lr 0.00447
Train [87][2070/3239]	Time 0.248 (0.533)	Data Time 0.001 (0.020)	Loss 2.4754 (2.4443)	Entropy 0.58443 (0.58413)	Top-1 acc 62.500 (65.079)	Top-5 acc 85.938 (84.731)	lr 0.00447
Train [87][2080/3239]	Time 0.228 (0.533)	Data Time 0.001 (0.020)	Loss 2.4490 (2.4443)	Entropy 0.58418 (0.58413)	Top-1 acc 65.234 (65.079)	Top-5 acc 83.984 (84.730)	lr 0.00447
Train [87][2090/3239]	Time 0.237 (0.532)	Data Time 0.001 (0.020)	Loss 2.2783 (2.4444)	Entropy 0.58397 (0.58413)	Top-1 acc 67.969 (65.082)	Top-5 acc 88.672 (84.727)	lr 0.00447
Train [87][2100/3239]	Time 0.241 (0.532)	Data Time 0.001 (0.020)	Loss 2.5122 (2.4444)	Entropy 0.58420 (0.58413)	Top-1 acc 66.406 (65.084)	Top-5 acc 85.156 (84.728)	lr 0.00447
Train [87][2110/3239]	Time 0.286 (0.531)	Data Time 0.001 (0.020)	Loss 2.2286 (2.4440)	Entropy 0.58438 (0.58413)	Top-1 acc 73.438 (65.092)	Top-5 acc 89.062 (84.736)	lr 0.00447
Train [87][2120/3239]	Time 0.219 (0.531)	Data Time 0.001 (0.020)	Loss 2.4953 (2.4440)	Entropy 0.58405 (0.58413)	Top-1 acc 65.234 (65.092)	Top-5 acc 82.031 (84.734)	lr 0.00447
Train [87][2130/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.020)	Loss 2.2981 (2.4440)	Entropy 0.58344 (0.58413)	Top-1 acc 69.531 (65.093)	Top-5 acc 84.766 (84.733)	lr 0.00447
Train [87][2140/3239]	Time 0.250 (0.530)	Data Time 0.001 (0.020)	Loss 2.4747 (2.4441)	Entropy 0.58333 (0.58413)	Top-1 acc 62.891 (65.094)	Top-5 acc 83.984 (84.730)	lr 0.00447
Train [87][2150/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.020)	Loss 2.5403 (2.4440)	Entropy 0.58317 (0.58412)	Top-1 acc 64.062 (65.096)	Top-5 acc 81.250 (84.733)	lr 0.00447
Train [87][2160/3239]	Time 0.271 (0.529)	Data Time 0.001 (0.020)	Loss 2.2925 (2.4441)	Entropy 0.58325 (0.58412)	Top-1 acc 65.625 (65.091)	Top-5 acc 87.891 (84.732)	lr 0.00447
Train [87][2170/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.020)	Loss 2.6991 (2.4443)	Entropy 0.58343 (0.58412)	Top-1 acc 57.812 (65.084)	Top-5 acc 81.641 (84.731)	lr 0.00446
Train [87][2180/3239]	Time 0.266 (0.528)	Data Time 0.001 (0.019)	Loss 2.4111 (2.4445)	Entropy 0.58335 (0.58411)	Top-1 acc 66.406 (65.079)	Top-5 acc 85.156 (84.729)	lr 0.00446
Train [87][2190/3239]	Time 0.242 (0.527)	Data Time 0.001 (0.019)	Loss 2.3926 (2.4443)	Entropy 0.58329 (0.58411)	Top-1 acc 67.578 (65.081)	Top-5 acc 83.984 (84.729)	lr 0.00446
Train [87][2200/3239]	Time 0.257 (0.527)	Data Time 0.001 (0.019)	Loss 2.7138 (2.4445)	Entropy 0.58356 (0.58411)	Top-1 acc 57.031 (65.076)	Top-5 acc 82.031 (84.724)	lr 0.00446
Train [87][2210/3239]	Time 0.348 (0.526)	Data Time 0.001 (0.019)	Loss 2.6737 (2.4450)	Entropy 0.58355 (0.58410)	Top-1 acc 59.375 (65.065)	Top-5 acc 80.469 (84.717)	lr 0.00446
Train [87][2220/3239]	Time 0.257 (0.526)	Data Time 0.001 (0.019)	Loss 2.4285 (2.4448)	Entropy 0.58349 (0.58410)	Top-1 acc 65.625 (65.072)	Top-5 acc 83.984 (84.721)	lr 0.00446
Train [87][2230/3239]	Time 0.236 (0.525)	Data Time 0.001 (0.019)	Loss 2.4635 (2.4446)	Entropy 0.58322 (0.58410)	Top-1 acc 66.406 (65.078)	Top-5 acc 85.938 (84.725)	lr 0.00446
Train [87][2240/3239]	Time 0.293 (0.525)	Data Time 0.002 (0.019)	Loss 2.4290 (2.4444)	Entropy 0.58319 (0.58409)	Top-1 acc 64.844 (65.082)	Top-5 acc 86.719 (84.728)	lr 0.00446
Train [87][2250/3239]	Time 0.252 (0.525)	Data Time 0.001 (0.019)	Loss 2.3823 (2.4446)	Entropy 0.58332 (0.58409)	Top-1 acc 68.359 (65.082)	Top-5 acc 85.547 (84.724)	lr 0.00446
Train [87][2260/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.019)	Loss 2.3624 (2.4445)	Entropy 0.58333 (0.58409)	Top-1 acc 68.359 (65.079)	Top-5 acc 85.156 (84.725)	lr 0.00446
Train [87][2270/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.019)	Loss 2.5143 (2.4444)	Entropy 0.58332 (0.58408)	Top-1 acc 60.547 (65.083)	Top-5 acc 83.203 (84.726)	lr 0.00446
Train [87][2280/3239]	Time 0.365 (0.524)	Data Time 0.001 (0.019)	Loss 2.4717 (2.4445)	Entropy 0.58321 (0.58408)	Top-1 acc 64.453 (65.082)	Top-5 acc 83.984 (84.722)	lr 0.00446
Train [87][2290/3239]	Time 0.258 (0.523)	Data Time 0.001 (0.019)	Loss 2.5259 (2.4446)	Entropy 0.58314 (0.58408)	Top-1 acc 64.844 (65.079)	Top-5 acc 81.250 (84.720)	lr 0.00446
Train [87][2300/3239]	Time 0.239 (0.523)	Data Time 0.001 (0.018)	Loss 2.3952 (2.4445)	Entropy 0.58281 (0.58407)	Top-1 acc 65.234 (65.083)	Top-5 acc 83.594 (84.718)	lr 0.00445
Train [87][2310/3239]	Time 0.270 (0.522)	Data Time 0.001 (0.018)	Loss 2.6910 (2.4445)	Entropy 0.58260 (0.58407)	Top-1 acc 60.938 (65.079)	Top-5 acc 81.250 (84.720)	lr 0.00445
Train [87][2320/3239]	Time 0.294 (0.522)	Data Time 0.002 (0.018)	Loss 2.2906 (2.4445)	Entropy 0.58273 (0.58406)	Top-1 acc 67.578 (65.079)	Top-5 acc 89.062 (84.718)	lr 0.00445
Train [87][2330/3239]	Time 0.331 (0.546)	Data Time 0.002 (0.018)	Loss 2.4369 (2.4447)	Entropy 0.58293 (0.58405)	Top-1 acc 64.453 (65.073)	Top-5 acc 85.938 (84.716)	lr 0.00445
Train [87][2340/3239]	Time 0.246 (0.546)	Data Time 0.002 (0.018)	Loss 2.5527 (2.4449)	Entropy 0.58295 (0.58405)	Top-1 acc 62.891 (65.069)	Top-5 acc 80.859 (84.710)	lr 0.00445
Train [87][2350/3239]	Time 0.263 (0.545)	Data Time 0.002 (0.018)	Loss 2.3454 (2.4450)	Entropy 0.58278 (0.58404)	Top-1 acc 67.188 (65.070)	Top-5 acc 87.891 (84.711)	lr 0.00445
Train [87][2360/3239]	Time 0.260 (0.545)	Data Time 0.002 (0.018)	Loss 2.3347 (2.4451)	Entropy 0.58265 (0.58404)	Top-1 acc 64.062 (65.061)	Top-5 acc 87.109 (84.708)	lr 0.00445
Train [87][2370/3239]	Time 0.365 (0.545)	Data Time 0.001 (0.018)	Loss 2.4928 (2.4453)	Entropy 0.58284 (0.58403)	Top-1 acc 63.281 (65.056)	Top-5 acc 83.594 (84.706)	lr 0.00445
Train [87][2380/3239]	Time 0.251 (0.544)	Data Time 0.001 (0.018)	Loss 2.4802 (2.4454)	Entropy 0.58288 (0.58403)	Top-1 acc 65.625 (65.051)	Top-5 acc 83.203 (84.702)	lr 0.00445
Train [87][2390/3239]	Time 0.258 (0.544)	Data Time 0.001 (0.018)	Loss 2.4118 (2.4455)	Entropy 0.58263 (0.58402)	Top-1 acc 68.359 (65.050)	Top-5 acc 84.375 (84.698)	lr 0.00445
Train [87][2400/3239]	Time 0.241 (0.544)	Data Time 0.001 (0.018)	Loss 2.5521 (2.4455)	Entropy 0.58279 (0.58402)	Top-1 acc 60.547 (65.049)	Top-5 acc 83.984 (84.699)	lr 0.00445
Train [87][2410/3239]	Time 0.267 (0.543)	Data Time 0.001 (0.018)	Loss 2.4878 (2.4453)	Entropy 0.58275 (0.58401)	Top-1 acc 64.062 (65.049)	Top-5 acc 87.109 (84.705)	lr 0.00445
Train [87][2420/3239]	Time 0.263 (0.543)	Data Time 0.001 (0.018)	Loss 2.4461 (2.4454)	Entropy 0.58264 (0.58401)	Top-1 acc 64.453 (65.044)	Top-5 acc 85.156 (84.705)	lr 0.00445
Train [87][2430/3239]	Time 0.233 (0.543)	Data Time 0.001 (0.018)	Loss 2.2730 (2.4455)	Entropy 0.58242 (0.58400)	Top-1 acc 67.578 (65.045)	Top-5 acc 87.500 (84.702)	lr 0.00444
Train [87][2440/3239]	Time 0.360 (0.542)	Data Time 0.001 (0.018)	Loss 2.4091 (2.4455)	Entropy 0.58247 (0.58399)	Top-1 acc 64.062 (65.044)	Top-5 acc 83.203 (84.701)	lr 0.00444
Train [87][2450/3239]	Time 0.243 (0.542)	Data Time 0.002 (0.017)	Loss 2.5678 (2.4455)	Entropy 0.58263 (0.58399)	Top-1 acc 64.062 (65.046)	Top-5 acc 83.594 (84.703)	lr 0.00444
Train [87][2460/3239]	Time 0.269 (0.542)	Data Time 0.001 (0.017)	Loss 2.7076 (2.4456)	Entropy 0.58229 (0.58398)	Top-1 acc 58.203 (65.042)	Top-5 acc 78.516 (84.696)	lr 0.00444
Train [87][2470/3239]	Time 0.254 (0.541)	Data Time 0.001 (0.017)	Loss 2.3945 (2.4457)	Entropy 0.58235 (0.58397)	Top-1 acc 64.844 (65.039)	Top-5 acc 85.156 (84.695)	lr 0.00444
Train [87][2480/3239]	Time 0.289 (0.541)	Data Time 0.001 (0.017)	Loss 2.3456 (2.4459)	Entropy 0.58247 (0.58397)	Top-1 acc 66.406 (65.035)	Top-5 acc 85.547 (84.693)	lr 0.00444
Train [87][2490/3239]	Time 0.250 (0.541)	Data Time 0.001 (0.017)	Loss 2.2880 (2.4455)	Entropy 0.58239 (0.58396)	Top-1 acc 67.969 (65.038)	Top-5 acc 86.719 (84.699)	lr 0.00444
Train [87][2500/3239]	Time 0.231 (0.540)	Data Time 0.001 (0.017)	Loss 2.3237 (2.4454)	Entropy 0.58249 (0.58396)	Top-1 acc 67.969 (65.040)	Top-5 acc 85.547 (84.701)	lr 0.00444
Train [87][2510/3239]	Time 0.233 (0.540)	Data Time 0.001 (0.017)	Loss 2.6320 (2.4456)	Entropy 0.58243 (0.58395)	Top-1 acc 59.375 (65.032)	Top-5 acc 81.250 (84.698)	lr 0.00444
Train [87][2520/3239]	Time 0.290 (0.540)	Data Time 0.001 (0.017)	Loss 2.4571 (2.4458)	Entropy 0.58245 (0.58394)	Top-1 acc 67.188 (65.030)	Top-5 acc 82.422 (84.696)	lr 0.00444
Train [87][2530/3239]	Time 0.362 (0.540)	Data Time 0.001 (0.017)	Loss 2.6792 (2.4457)	Entropy 0.58295 (0.58394)	Top-1 acc 61.328 (65.027)	Top-5 acc 80.078 (84.698)	lr 0.00444
Train [87][2540/3239]	Time 0.245 (0.539)	Data Time 0.001 (0.017)	Loss 2.5181 (2.4456)	Entropy 0.58273 (0.58393)	Top-1 acc 62.891 (65.031)	Top-5 acc 83.594 (84.696)	lr 0.00444
Train [87][2550/3239]	Time 0.255 (0.539)	Data Time 0.001 (0.017)	Loss 2.2942 (2.4455)	Entropy 0.58292 (0.58393)	Top-1 acc 69.922 (65.035)	Top-5 acc 85.547 (84.697)	lr 0.00444
Train [87][2560/3239]	Time 0.226 (0.539)	Data Time 0.001 (0.017)	Loss 2.3923 (2.4457)	Entropy 0.58300 (0.58393)	Top-1 acc 67.188 (65.033)	Top-5 acc 85.156 (84.695)	lr 0.00443
Train [87][2570/3239]	Time 0.277 (0.539)	Data Time 0.002 (0.018)	Loss 2.2706 (2.4459)	Entropy 0.58298 (0.58392)	Top-1 acc 68.359 (65.026)	Top-5 acc 86.719 (84.691)	lr 0.00443
Train [87][2580/3239]	Time 0.259 (0.540)	Data Time 0.002 (0.018)	Loss 2.3697 (2.4458)	Entropy 0.58329 (0.58392)	Top-1 acc 65.625 (65.030)	Top-5 acc 84.766 (84.693)	lr 0.00443
Train [87][2590/3239]	Time 0.250 (0.539)	Data Time 0.001 (0.018)	Loss 2.4375 (2.4456)	Entropy 0.58339 (0.58392)	Top-1 acc 63.672 (65.033)	Top-5 acc 84.375 (84.697)	lr 0.00443
Train [87][2600/3239]	Time 0.402 (0.540)	Data Time 0.002 (0.019)	Loss 2.5235 (2.4455)	Entropy 0.58375 (0.58392)	Top-1 acc 61.719 (65.033)	Top-5 acc 84.766 (84.700)	lr 0.00443
Train [87][2610/3239]	Time 0.232 (0.540)	Data Time 0.001 (0.019)	Loss 2.3641 (2.4455)	Entropy 0.58368 (0.58391)	Top-1 acc 68.359 (65.038)	Top-5 acc 84.766 (84.702)	lr 0.00443
Train [87][2620/3239]	Time 0.246 (0.539)	Data Time 0.002 (0.019)	Loss 2.2535 (2.4455)	Entropy 0.58383 (0.58391)	Top-1 acc 70.703 (65.037)	Top-5 acc 89.453 (84.702)	lr 0.00443
Train [87][2630/3239]	Time 0.619 (0.539)	Data Time 0.379 (0.020)	Loss 2.5194 (2.4458)	Entropy 0.58386 (0.58391)	Top-1 acc 59.375 (65.028)	Top-5 acc 85.156 (84.696)	lr 0.00443
Train [87][2640/3239]	Time 0.285 (0.540)	Data Time 0.001 (0.020)	Loss 2.4441 (2.4457)	Entropy 0.58383 (0.58391)	Top-1 acc 64.844 (65.028)	Top-5 acc 84.766 (84.696)	lr 0.00443
Train [87][2650/3239]	Time 0.254 (0.540)	Data Time 0.001 (0.020)	Loss 2.4235 (2.4455)	Entropy 0.58391 (0.58391)	Top-1 acc 66.406 (65.036)	Top-5 acc 84.375 (84.699)	lr 0.00443
Train [87][2660/3239]	Time 0.256 (0.541)	Data Time 0.002 (0.021)	Loss 2.1964 (2.4456)	Entropy 0.58376 (0.58391)	Top-1 acc 67.969 (65.033)	Top-5 acc 88.672 (84.698)	lr 0.00443
Train [87][2670/3239]	Time 0.250 (0.541)	Data Time 0.001 (0.022)	Loss 2.4340 (2.4456)	Entropy 0.58381 (0.58391)	Top-1 acc 65.625 (65.036)	Top-5 acc 82.422 (84.696)	lr 0.00443
Train [87][2680/3239]	Time 0.239 (0.541)	Data Time 0.001 (0.022)	Loss 2.4897 (2.4456)	Entropy 0.58378 (0.58391)	Top-1 acc 65.234 (65.037)	Top-5 acc 84.766 (84.698)	lr 0.00442
Train [87][2690/3239]	Time 0.353 (0.540)	Data Time 0.001 (0.022)	Loss 2.4250 (2.4457)	Entropy 0.58416 (0.58391)	Top-1 acc 64.062 (65.035)	Top-5 acc 85.156 (84.699)	lr 0.00442
Train [87][2700/3239]	Time 0.272 (0.541)	Data Time 0.003 (0.022)	Loss 2.5029 (2.4458)	Entropy 0.58424 (0.58391)	Top-1 acc 64.453 (65.035)	Top-5 acc 83.203 (84.696)	lr 0.00442
Train [87][2710/3239]	Time 0.245 (0.540)	Data Time 0.001 (0.022)	Loss 2.3179 (2.4455)	Entropy 0.58419 (0.58391)	Top-1 acc 67.188 (65.045)	Top-5 acc 85.156 (84.702)	lr 0.00442
Train [87][2720/3239]	Time 0.285 (0.542)	Data Time 0.001 (0.024)	Loss 2.5269 (2.4456)	Entropy 0.58420 (0.58392)	Top-1 acc 61.719 (65.040)	Top-5 acc 82.031 (84.700)	lr 0.00442
Train [87][2730/3239]	Time 0.292 (0.541)	Data Time 0.002 (0.024)	Loss 2.3531 (2.4457)	Entropy 0.58406 (0.58392)	Top-1 acc 62.891 (65.036)	Top-5 acc 88.281 (84.702)	lr 0.00442
Train [87][2740/3239]	Time 0.257 (0.541)	Data Time 0.001 (0.023)	Loss 2.5505 (2.4456)	Entropy 0.58404 (0.58392)	Top-1 acc 62.891 (65.042)	Top-5 acc 82.031 (84.704)	lr 0.00442
Train [87][2750/3239]	Time 0.240 (0.541)	Data Time 0.001 (0.023)	Loss 2.5593 (2.4457)	Entropy 0.58359 (0.58392)	Top-1 acc 62.109 (65.041)	Top-5 acc 83.203 (84.703)	lr 0.00442
Train [87][2760/3239]	Time 0.362 (0.541)	Data Time 0.001 (0.024)	Loss 2.6244 (2.4460)	Entropy 0.58372 (0.58392)	Top-1 acc 59.766 (65.036)	Top-5 acc 78.516 (84.695)	lr 0.00442
Train [87][2770/3239]	Time 0.231 (0.541)	Data Time 0.001 (0.024)	Loss 2.5093 (2.4460)	Entropy 0.58410 (0.58392)	Top-1 acc 60.156 (65.032)	Top-5 acc 82.812 (84.695)	lr 0.00442
Train [87][2780/3239]	Time 0.257 (0.540)	Data Time 0.001 (0.024)	Loss 2.3964 (2.4459)	Entropy 0.58420 (0.58392)	Top-1 acc 63.672 (65.033)	Top-5 acc 87.109 (84.698)	lr 0.00442
Train [87][2790/3239]	Time 0.243 (0.540)	Data Time 0.001 (0.024)	Loss 2.3695 (2.4457)	Entropy 0.58458 (0.58392)	Top-1 acc 69.141 (65.038)	Top-5 acc 85.938 (84.700)	lr 0.00442
Train [87][2800/3239]	Time 0.235 (0.540)	Data Time 0.001 (0.024)	Loss 2.6130 (2.4458)	Entropy 0.58493 (0.58392)	Top-1 acc 60.547 (65.038)	Top-5 acc 82.812 (84.698)	lr 0.00442
Train [87][2810/3239]	Time 0.261 (0.540)	Data Time 0.002 (0.024)	Loss 2.3634 (2.4456)	Entropy 0.58480 (0.58392)	Top-1 acc 67.188 (65.041)	Top-5 acc 89.453 (84.702)	lr 0.00441
Train [87][2820/3239]	Time 0.234 (0.539)	Data Time 0.001 (0.024)	Loss 2.6530 (2.4459)	Entropy 0.58501 (0.58393)	Top-1 acc 61.719 (65.035)	Top-5 acc 79.688 (84.694)	lr 0.00441
Train [87][2830/3239]	Time 0.255 (0.539)	Data Time 0.001 (0.024)	Loss 2.4039 (2.4460)	Entropy 0.58510 (0.58393)	Top-1 acc 68.750 (65.034)	Top-5 acc 81.641 (84.690)	lr 0.00441
Train [87][2840/3239]	Time 0.248 (0.539)	Data Time 0.001 (0.024)	Loss 2.5134 (2.4460)	Entropy 0.58495 (0.58394)	Top-1 acc 65.234 (65.033)	Top-5 acc 81.641 (84.689)	lr 0.00441
Train [87][2850/3239]	Time 0.262 (0.539)	Data Time 0.001 (0.023)	Loss 2.2915 (2.4462)	Entropy 0.58456 (0.58394)	Top-1 acc 67.969 (65.028)	Top-5 acc 89.062 (84.688)	lr 0.00441
Train [87][2860/3239]	Time 0.238 (0.539)	Data Time 0.001 (0.024)	Loss 2.5510 (2.4464)	Entropy 0.58430 (0.58394)	Top-1 acc 63.281 (65.021)	Top-5 acc 83.203 (84.687)	lr 0.00441
Train [87][2870/3239]	Time 0.240 (0.538)	Data Time 0.001 (0.024)	Loss 2.2007 (2.4464)	Entropy 0.58407 (0.58394)	Top-1 acc 72.266 (65.016)	Top-5 acc 89.062 (84.687)	lr 0.00441
Train [87][2880/3239]	Time 0.244 (0.539)	Data Time 0.001 (0.024)	Loss 2.3455 (2.4463)	Entropy 0.58396 (0.58394)	Top-1 acc 66.797 (65.013)	Top-5 acc 87.891 (84.688)	lr 0.00441
Train [87][2890/3239]	Time 0.250 (0.539)	Data Time 0.001 (0.025)	Loss 2.5431 (2.4466)	Entropy 0.58423 (0.58394)	Top-1 acc 62.109 (65.006)	Top-5 acc 82.031 (84.682)	lr 0.00441
Train [87][2900/3239]	Time 0.244 (0.539)	Data Time 0.001 (0.025)	Loss 2.6077 (2.4465)	Entropy 0.58430 (0.58394)	Top-1 acc 61.719 (65.003)	Top-5 acc 81.250 (84.684)	lr 0.00441
Train [87][2910/3239]	Time 0.508 (0.539)	Data Time 0.270 (0.025)	Loss 2.3985 (2.4463)	Entropy 0.58424 (0.58394)	Top-1 acc 67.578 (65.009)	Top-5 acc 85.547 (84.685)	lr 0.00441
Train [87][2920/3239]	Time 0.392 (0.540)	Data Time 0.001 (0.026)	Loss 2.2323 (2.4463)	Entropy 0.58421 (0.58395)	Top-1 acc 69.922 (65.013)	Top-5 acc 89.844 (84.689)	lr 0.00441
Train [87][2930/3239]	Time 0.244 (0.539)	Data Time 0.001 (0.026)	Loss 2.4826 (2.4463)	Entropy 0.58408 (0.58395)	Top-1 acc 63.281 (65.012)	Top-5 acc 83.984 (84.687)	lr 0.00441
Train [87][2940/3239]	Time 0.248 (0.539)	Data Time 0.001 (0.026)	Loss 2.4854 (2.4463)	Entropy 0.58432 (0.58395)	Top-1 acc 61.719 (65.008)	Top-5 acc 84.766 (84.686)	lr 0.00440
Train [87][2950/3239]	Time 0.258 (0.540)	Data Time 0.002 (0.028)	Loss 2.4885 (2.4461)	Entropy 0.58406 (0.58395)	Top-1 acc 63.281 (65.013)	Top-5 acc 85.156 (84.691)	lr 0.00440
Train [87][2960/3239]	Time 0.240 (0.540)	Data Time 0.001 (0.028)	Loss 2.3597 (2.4462)	Entropy 0.58417 (0.58395)	Top-1 acc 66.406 (65.010)	Top-5 acc 84.766 (84.687)	lr 0.00440
Train [87][2970/3239]	Time 0.266 (0.540)	Data Time 0.003 (0.027)	Loss 2.2900 (2.4462)	Entropy 0.58391 (0.58395)	Top-1 acc 67.578 (65.011)	Top-5 acc 88.672 (84.686)	lr 0.00440
Train [87][2980/3239]	Time 0.458 (0.558)	Data Time 0.032 (0.029)	Loss 2.2701 (2.4461)	Entropy 0.58353 (0.58395)	Top-1 acc 69.922 (65.013)	Top-5 acc 87.891 (84.689)	lr 0.00440
Train [87][2990/3239]	Time 0.244 (0.558)	Data Time 0.002 (0.029)	Loss 2.4519 (2.4460)	Entropy 0.58371 (0.58395)	Top-1 acc 64.453 (65.016)	Top-5 acc 84.375 (84.689)	lr 0.00440
Train [87][3000/3239]	Time 0.265 (0.557)	Data Time 0.002 (0.028)	Loss 2.4802 (2.4461)	Entropy 0.58372 (0.58395)	Top-1 acc 64.844 (65.018)	Top-5 acc 83.984 (84.688)	lr 0.00440
Train [87][3010/3239]	Time 0.314 (0.557)	Data Time 0.001 (0.028)	Loss 2.5747 (2.4459)	Entropy 0.58356 (0.58395)	Top-1 acc 62.891 (65.023)	Top-5 acc 82.422 (84.691)	lr 0.00440
Train [87][3020/3239]	Time 0.246 (0.556)	Data Time 0.001 (0.028)	Loss 2.3411 (2.4460)	Entropy 0.58354 (0.58394)	Top-1 acc 65.625 (65.019)	Top-5 acc 85.938 (84.690)	lr 0.00440
Train [87][3030/3239]	Time 0.276 (0.556)	Data Time 0.001 (0.028)	Loss 2.4767 (2.4458)	Entropy 0.58339 (0.58394)	Top-1 acc 64.062 (65.020)	Top-5 acc 86.328 (84.694)	lr 0.00440
Train [87][3040/3239]	Time 0.249 (0.556)	Data Time 0.001 (0.028)	Loss 2.3406 (2.4459)	Entropy 0.58321 (0.58394)	Top-1 acc 64.062 (65.014)	Top-5 acc 86.719 (84.694)	lr 0.00440
Train [87][3050/3239]	Time 0.280 (0.555)	Data Time 0.001 (0.028)	Loss 2.2733 (2.4458)	Entropy 0.58306 (0.58394)	Top-1 acc 67.969 (65.019)	Top-5 acc 87.891 (84.697)	lr 0.00440
Train [87][3060/3239]	Time 0.275 (0.555)	Data Time 0.001 (0.028)	Loss 2.4700 (2.4458)	Entropy 0.58288 (0.58394)	Top-1 acc 63.281 (65.018)	Top-5 acc 84.375 (84.698)	lr 0.00440
Train [87][3070/3239]	Time 0.241 (0.555)	Data Time 0.001 (0.028)	Loss 2.4659 (2.4458)	Entropy 0.58273 (0.58393)	Top-1 acc 67.578 (65.019)	Top-5 acc 84.766 (84.697)	lr 0.00439
Train [87][3080/3239]	Time 0.366 (0.555)	Data Time 0.001 (0.028)	Loss 2.5179 (2.4459)	Entropy 0.58282 (0.58393)	Top-1 acc 60.938 (65.016)	Top-5 acc 84.766 (84.696)	lr 0.00439
Train [87][3090/3239]	Time 0.248 (0.554)	Data Time 0.001 (0.028)	Loss 2.2783 (2.4457)	Entropy 0.58247 (0.58392)	Top-1 acc 66.797 (65.020)	Top-5 acc 87.891 (84.698)	lr 0.00439
Train [87][3100/3239]	Time 0.279 (0.554)	Data Time 0.001 (0.028)	Loss 2.3967 (2.4456)	Entropy 0.58221 (0.58392)	Top-1 acc 66.797 (65.022)	Top-5 acc 87.500 (84.700)	lr 0.00439
Train [87][3110/3239]	Time 0.253 (0.554)	Data Time 0.001 (0.028)	Loss 2.3195 (2.4456)	Entropy 0.58201 (0.58391)	Top-1 acc 69.922 (65.022)	Top-5 acc 87.109 (84.700)	lr 0.00439
Train [87][3120/3239]	Time 0.240 (0.554)	Data Time 0.001 (0.027)	Loss 2.3641 (2.4457)	Entropy 0.58177 (0.58391)	Top-1 acc 65.234 (65.021)	Top-5 acc 85.938 (84.699)	lr 0.00439
Train [87][3130/3239]	Time 0.252 (0.553)	Data Time 0.002 (0.027)	Loss 2.3602 (2.4456)	Entropy 0.58161 (0.58390)	Top-1 acc 64.453 (65.019)	Top-5 acc 83.984 (84.699)	lr 0.00439
Train [87][3140/3239]	Time 0.253 (0.553)	Data Time 0.005 (0.027)	Loss 2.5541 (2.4454)	Entropy 0.58178 (0.58389)	Top-1 acc 65.625 (65.025)	Top-5 acc 83.203 (84.703)	lr 0.00439
Train [87][3150/3239]	Time 0.453 (0.553)	Data Time 0.001 (0.027)	Loss 2.2714 (2.4454)	Entropy 0.58149 (0.58389)	Top-1 acc 67.188 (65.025)	Top-5 acc 87.500 (84.702)	lr 0.00439
Train [87][3160/3239]	Time 0.251 (0.553)	Data Time 0.002 (0.027)	Loss 2.4512 (2.4456)	Entropy 0.58143 (0.58388)	Top-1 acc 63.281 (65.021)	Top-5 acc 83.594 (84.699)	lr 0.00439
Train [87][3170/3239]	Time 0.258 (0.552)	Data Time 0.001 (0.027)	Loss 2.4162 (2.4454)	Entropy 0.58151 (0.58387)	Top-1 acc 62.891 (65.024)	Top-5 acc 86.328 (84.703)	lr 0.00439
Train [87][3180/3239]	Time 0.224 (0.552)	Data Time 0.000 (0.027)	Loss 2.3321 (2.4455)	Entropy 0.58151 (0.58386)	Top-1 acc 69.531 (65.021)	Top-5 acc 87.500 (84.701)	lr 0.00439
Train [87][3190/3239]	Time 0.244 (0.552)	Data Time 0.000 (0.027)	Loss 2.4722 (2.4456)	Entropy 0.58090 (0.58386)	Top-1 acc 64.453 (65.019)	Top-5 acc 83.594 (84.699)	lr 0.00439
Train [87][3200/3239]	Time 0.236 (0.551)	Data Time 0.000 (0.027)	Loss 2.5089 (2.4456)	Entropy 0.58093 (0.58385)	Top-1 acc 60.547 (65.016)	Top-5 acc 81.641 (84.699)	lr 0.00438
Train [87][3210/3239]	Time 0.228 (0.551)	Data Time 0.000 (0.027)	Loss 2.3459 (2.4454)	Entropy 0.58116 (0.58384)	Top-1 acc 68.750 (65.022)	Top-5 acc 85.938 (84.702)	lr 0.00438
Train [87][3220/3239]	Time 0.234 (0.551)	Data Time 0.000 (0.027)	Loss 2.3339 (2.4453)	Entropy 0.58111 (0.58383)	Top-1 acc 65.625 (65.025)	Top-5 acc 85.547 (84.703)	lr 0.00438
Train [87][3230/3239]	Time 0.254 (0.550)	Data Time 0.000 (0.027)	Loss 2.3701 (2.4453)	Entropy 0.58146 (0.58382)	Top-1 acc 66.406 (65.026)	Top-5 acc 83.203 (84.703)	lr 0.00438
Train [87][3239/3239]	Time 0.845 (0.550)	Data Time 0.000 (0.026)	Loss 2.7135 (2.4456)	Entropy 0.58164 (0.58382)	Top-1 acc 58.025 (65.021)	Top-5 acc 81.481 (84.697)	lr 0.00438
==========Valid [87/120]	loss 1.256	top-1 acc 71.151 (71.264)	top-5 acc 89.650	Train top-1 65.021	top-5 84.697	Entropy 0.58164	Latency-None: 0.000ms	Flops: 539.00M
Train [88][0/3239]	Time 44.896 (44.896)	Data Time 42.012 (42.012)	Loss 2.2503 (2.2503)	Entropy 0.58181 (0.58181)	Top-1 acc 69.141 (69.141)	Top-5 acc 88.281 (88.281)	lr 0.00438
Train [88][10/3239]	Time 0.245 (4.636)	Data Time 0.001 (3.897)	Loss 2.4107 (2.3885)	Entropy 0.58161 (0.58169)	Top-1 acc 65.234 (66.513)	Top-5 acc 84.766 (85.938)	lr 0.00438
Train [88][20/3239]	Time 0.247 (2.640)	Data Time 0.001 (2.042)	Loss 2.4753 (2.4004)	Entropy 0.58169 (0.58166)	Top-1 acc 64.453 (65.904)	Top-5 acc 83.203 (85.510)	lr 0.00438
Train [88][30/3239]	Time 0.234 (1.935)	Data Time 0.001 (1.384)	Loss 2.4902 (2.4081)	Entropy 0.58136 (0.58165)	Top-1 acc 63.281 (65.247)	Top-5 acc 83.594 (85.358)	lr 0.00438
Train [88][40/3239]	Time 0.232 (1.568)	Data Time 0.001 (1.047)	Loss 2.3552 (2.4083)	Entropy 0.58151 (0.58159)	Top-1 acc 67.969 (65.558)	Top-5 acc 90.234 (85.423)	lr 0.00438
Train [88][50/3239]	Time 0.235 (1.347)	Data Time 0.001 (0.842)	Loss 2.3624 (2.4065)	Entropy 0.58152 (0.58157)	Top-1 acc 67.578 (65.587)	Top-5 acc 86.328 (85.355)	lr 0.00438
Train [88][60/3239]	Time 0.233 (1.203)	Data Time 0.002 (0.704)	Loss 2.3831 (2.4128)	Entropy 0.58168 (0.58157)	Top-1 acc 67.188 (65.503)	Top-5 acc 85.156 (85.297)	lr 0.00438
Train [88][70/3239]	Time 0.275 (1.097)	Data Time 0.001 (0.605)	Loss 2.3058 (2.4057)	Entropy 0.58173 (0.58159)	Top-1 acc 69.141 (65.812)	Top-5 acc 87.500 (85.409)	lr 0.00438
Train [88][80/3239]	Time 0.242 (1.014)	Data Time 0.001 (0.531)	Loss 2.2879 (2.4068)	Entropy 0.58186 (0.58162)	Top-1 acc 67.969 (65.900)	Top-5 acc 88.281 (85.354)	lr 0.00438
Train [88][90/3239]	Time 0.235 (0.948)	Data Time 0.001 (0.473)	Loss 2.3370 (2.4080)	Entropy 0.58194 (0.58165)	Top-1 acc 69.922 (65.930)	Top-5 acc 86.719 (85.367)	lr 0.00437
Train [88][100/3239]	Time 0.237 (0.897)	Data Time 0.001 (0.426)	Loss 2.5108 (2.4083)	Entropy 0.58181 (0.58168)	Top-1 acc 62.500 (65.985)	Top-5 acc 80.859 (85.319)	lr 0.00437
Train [88][110/3239]	Time 0.232 (0.853)	Data Time 0.001 (0.388)	Loss 2.5853 (2.4136)	Entropy 0.58188 (0.58168)	Top-1 acc 61.328 (65.878)	Top-5 acc 80.859 (85.227)	lr 0.00437
Train [88][120/3239]	Time 0.227 (0.817)	Data Time 0.001 (0.356)	Loss 2.6177 (2.4192)	Entropy 0.58195 (0.58170)	Top-1 acc 62.109 (65.754)	Top-5 acc 78.906 (85.108)	lr 0.00437
Train [88][130/3239]	Time 0.235 (0.787)	Data Time 0.001 (0.329)	Loss 2.3858 (2.4257)	Entropy 0.58230 (0.58173)	Top-1 acc 67.188 (65.506)	Top-5 acc 85.156 (84.968)	lr 0.00437
Train [88][140/3239]	Time 0.329 (0.762)	Data Time 0.001 (0.306)	Loss 2.4998 (2.4252)	Entropy 0.58246 (0.58177)	Top-1 acc 63.281 (65.517)	Top-5 acc 83.203 (85.007)	lr 0.00437
Train [88][150/3239]	Time 0.296 (0.739)	Data Time 0.001 (0.286)	Loss 2.6228 (2.4284)	Entropy 0.58242 (0.58181)	Top-1 acc 62.109 (65.423)	Top-5 acc 80.859 (84.957)	lr 0.00437
Train [88][160/3239]	Time 0.236 (0.719)	Data Time 0.001 (0.268)	Loss 2.2927 (2.4316)	Entropy 0.58248 (0.58185)	Top-1 acc 69.922 (65.385)	Top-5 acc 86.719 (84.909)	lr 0.00437
Train [88][170/3239]	Time 0.232 (0.704)	Data Time 0.001 (0.252)	Loss 2.4783 (2.4341)	Entropy 0.58238 (0.58189)	Top-1 acc 63.672 (65.310)	Top-5 acc 83.984 (84.868)	lr 0.00437
Train [88][180/3239]	Time 0.246 (0.688)	Data Time 0.009 (0.239)	Loss 2.3463 (2.4316)	Entropy 0.58198 (0.58191)	Top-1 acc 66.016 (65.308)	Top-5 acc 87.109 (84.910)	lr 0.00437
Train [88][190/3239]	Time 0.249 (0.677)	Data Time 0.001 (0.226)	Loss 2.4501 (2.4334)	Entropy 0.58185 (0.58191)	Top-1 acc 64.453 (65.269)	Top-5 acc 82.031 (84.868)	lr 0.00437
Train [88][200/3239]	Time 0.227 (0.667)	Data Time 0.001 (0.215)	Loss 2.4049 (2.4320)	Entropy 0.58188 (0.58191)	Top-1 acc 66.406 (65.287)	Top-5 acc 85.547 (84.902)	lr 0.00437
Train [88][210/3239]	Time 0.346 (0.655)	Data Time 0.001 (0.205)	Loss 2.3569 (2.4356)	Entropy 0.58174 (0.58190)	Top-1 acc 66.016 (65.253)	Top-5 acc 87.500 (84.893)	lr 0.00437
Train [88][220/3239]	Time 0.235 (0.646)	Data Time 0.001 (0.196)	Loss 2.3527 (2.4369)	Entropy 0.58173 (0.58190)	Top-1 acc 66.797 (65.185)	Top-5 acc 86.719 (84.893)	lr 0.00437
Train [88][230/3239]	Time 0.235 (0.636)	Data Time 0.001 (0.187)	Loss 2.5235 (2.4370)	Entropy 0.58199 (0.58190)	Top-1 acc 62.109 (65.229)	Top-5 acc 83.984 (84.879)	lr 0.00436
Train [88][240/3239]	Time 0.234 (0.628)	Data Time 0.001 (0.180)	Loss 2.5507 (2.4355)	Entropy 0.58162 (0.58189)	Top-1 acc 60.938 (65.272)	Top-5 acc 84.375 (84.877)	lr 0.00436
Train [88][250/3239]	Time 0.248 (0.621)	Data Time 0.001 (0.173)	Loss 2.4137 (2.4391)	Entropy 0.58154 (0.58188)	Top-1 acc 63.281 (65.185)	Top-5 acc 87.500 (84.805)	lr 0.00436
Train [88][260/3239]	Time 0.237 (0.614)	Data Time 0.001 (0.166)	Loss 2.5444 (2.4382)	Entropy 0.58123 (0.58187)	Top-1 acc 64.062 (65.218)	Top-5 acc 84.375 (84.818)	lr 0.00436
Train [88][270/3239]	Time 0.238 (0.607)	Data Time 0.001 (0.160)	Loss 2.7221 (2.4392)	Entropy 0.58101 (0.58184)	Top-1 acc 60.156 (65.223)	Top-5 acc 80.469 (84.796)	lr 0.00436
Train [88][280/3239]	Time 0.238 (0.601)	Data Time 0.001 (0.154)	Loss 2.3779 (2.4375)	Entropy 0.58092 (0.58181)	Top-1 acc 67.578 (65.294)	Top-5 acc 85.156 (84.810)	lr 0.00436
Train [88][290/3239]	Time 0.238 (0.595)	Data Time 0.001 (0.149)	Loss 2.3034 (2.4341)	Entropy 0.58049 (0.58177)	Top-1 acc 70.312 (65.421)	Top-5 acc 86.328 (84.874)	lr 0.00436
Train [88][300/3239]	Time 0.329 (0.589)	Data Time 0.001 (0.144)	Loss 2.6267 (2.4351)	Entropy 0.58046 (0.58173)	Top-1 acc 61.719 (65.398)	Top-5 acc 80.859 (84.855)	lr 0.00436
Train [88][310/3239]	Time 0.226 (0.584)	Data Time 0.001 (0.140)	Loss 2.5182 (2.4353)	Entropy 0.58038 (0.58168)	Top-1 acc 62.891 (65.419)	Top-5 acc 83.203 (84.835)	lr 0.00436
Train [88][320/3239]	Time 0.237 (0.579)	Data Time 0.002 (0.135)	Loss 2.3549 (2.4364)	Entropy 0.58013 (0.58164)	Top-1 acc 66.406 (65.400)	Top-5 acc 87.109 (84.797)	lr 0.00436
Train [88][330/3239]	Time 0.242 (0.575)	Data Time 0.001 (0.131)	Loss 2.5504 (2.4367)	Entropy 0.58021 (0.58160)	Top-1 acc 64.453 (65.401)	Top-5 acc 83.203 (84.792)	lr 0.00436
Train [88][340/3239]	Time 0.228 (0.570)	Data Time 0.001 (0.127)	Loss 2.6254 (2.4377)	Entropy 0.58019 (0.58155)	Top-1 acc 62.109 (65.347)	Top-5 acc 81.250 (84.778)	lr 0.00436
Train [88][350/3239]	Time 0.227 (0.566)	Data Time 0.001 (0.124)	Loss 2.2669 (2.4357)	Entropy 0.58048 (0.58152)	Top-1 acc 67.188 (65.386)	Top-5 acc 87.500 (84.807)	lr 0.00436
Train [88][360/3239]	Time 0.228 (0.562)	Data Time 0.001 (0.120)	Loss 2.6690 (2.4359)	Entropy 0.58062 (0.58149)	Top-1 acc 60.547 (65.378)	Top-5 acc 79.688 (84.789)	lr 0.00435
Train [88][370/3239]	Time 0.330 (0.558)	Data Time 0.001 (0.117)	Loss 2.4659 (2.4361)	Entropy 0.58044 (0.58147)	Top-1 acc 64.844 (65.373)	Top-5 acc 83.594 (84.777)	lr 0.00435
Train [88][380/3239]	Time 0.238 (0.555)	Data Time 0.001 (0.114)	Loss 2.4724 (2.4367)	Entropy 0.58033 (0.58144)	Top-1 acc 64.844 (65.368)	Top-5 acc 82.812 (84.753)	lr 0.00435
Train [88][390/3239]	Time 0.235 (0.551)	Data Time 0.001 (0.111)	Loss 2.4714 (2.4355)	Entropy 0.58012 (0.58141)	Top-1 acc 66.016 (65.382)	Top-5 acc 82.812 (84.786)	lr 0.00435
Train [88][400/3239]	Time 0.258 (0.696)	Data Time 0.002 (0.109)	Loss 2.3446 (2.4339)	Entropy 0.57989 (0.58138)	Top-1 acc 68.359 (65.417)	Top-5 acc 86.328 (84.811)	lr 0.00435
Train [88][410/3239]	Time 0.241 (0.690)	Data Time 0.002 (0.106)	Loss 2.5189 (2.4332)	Entropy 0.57989 (0.58134)	Top-1 acc 61.328 (65.443)	Top-5 acc 83.203 (84.812)	lr 0.00435
Train [88][420/3239]	Time 0.239 (0.684)	Data Time 0.001 (0.104)	Loss 2.5093 (2.4335)	Entropy 0.57962 (0.58131)	Top-1 acc 62.891 (65.433)	Top-5 acc 80.469 (84.795)	lr 0.00435
Train [88][430/3239]	Time 0.244 (0.678)	Data Time 0.001 (0.101)	Loss 2.3200 (2.4331)	Entropy 0.57972 (0.58127)	Top-1 acc 70.312 (65.445)	Top-5 acc 86.719 (84.805)	lr 0.00435
Train [88][440/3239]	Time 0.250 (0.673)	Data Time 0.001 (0.099)	Loss 2.4244 (2.4333)	Entropy 0.57980 (0.58124)	Top-1 acc 66.406 (65.442)	Top-5 acc 83.984 (84.786)	lr 0.00435
Train [88][450/3239]	Time 0.235 (0.668)	Data Time 0.001 (0.097)	Loss 2.3327 (2.4339)	Entropy 0.58000 (0.58121)	Top-1 acc 69.141 (65.414)	Top-5 acc 88.672 (84.790)	lr 0.00435
Train [88][460/3239]	Time 0.335 (0.663)	Data Time 0.001 (0.095)	Loss 2.4556 (2.4344)	Entropy 0.58001 (0.58118)	Top-1 acc 64.453 (65.433)	Top-5 acc 83.984 (84.783)	lr 0.00435
Train [88][470/3239]	Time 0.275 (0.658)	Data Time 0.001 (0.093)	Loss 2.2766 (2.4348)	Entropy 0.57996 (0.58115)	Top-1 acc 68.750 (65.389)	Top-5 acc 86.328 (84.777)	lr 0.00435
Train [88][480/3239]	Time 0.231 (0.653)	Data Time 0.001 (0.091)	Loss 2.5258 (2.4353)	Entropy 0.58006 (0.58113)	Top-1 acc 64.844 (65.386)	Top-5 acc 82.812 (84.774)	lr 0.00435
Train [88][490/3239]	Time 0.235 (0.648)	Data Time 0.001 (0.089)	Loss 2.4430 (2.4355)	Entropy 0.58006 (0.58110)	Top-1 acc 63.672 (65.377)	Top-5 acc 85.156 (84.775)	lr 0.00434
Train [88][500/3239]	Time 0.225 (0.644)	Data Time 0.001 (0.087)	Loss 2.4934 (2.4359)	Entropy 0.58021 (0.58108)	Top-1 acc 62.109 (65.337)	Top-5 acc 84.375 (84.786)	lr 0.00434
Train [88][510/3239]	Time 0.237 (0.640)	Data Time 0.001 (0.086)	Loss 2.3987 (2.4363)	Entropy 0.58010 (0.58107)	Top-1 acc 64.844 (65.311)	Top-5 acc 82.812 (84.769)	lr 0.00434
Train [88][520/3239]	Time 0.233 (0.636)	Data Time 0.001 (0.084)	Loss 2.3978 (2.4364)	Entropy 0.58006 (0.58105)	Top-1 acc 64.844 (65.287)	Top-5 acc 87.891 (84.772)	lr 0.00434
Train [88][530/3239]	Time 0.341 (0.633)	Data Time 0.001 (0.082)	Loss 2.5248 (2.4367)	Entropy 0.58020 (0.58103)	Top-1 acc 65.234 (65.277)	Top-5 acc 84.375 (84.758)	lr 0.00434
Train [88][540/3239]	Time 0.238 (0.629)	Data Time 0.001 (0.081)	Loss 2.5366 (2.4369)	Entropy 0.58033 (0.58102)	Top-1 acc 62.500 (65.289)	Top-5 acc 82.031 (84.748)	lr 0.00434
Train [88][550/3239]	Time 0.236 (0.626)	Data Time 0.001 (0.080)	Loss 2.4278 (2.4367)	Entropy 0.58036 (0.58100)	Top-1 acc 62.500 (65.287)	Top-5 acc 86.719 (84.751)	lr 0.00434
Train [88][560/3239]	Time 0.233 (0.622)	Data Time 0.001 (0.078)	Loss 2.6301 (2.4357)	Entropy 0.58059 (0.58099)	Top-1 acc 59.375 (65.312)	Top-5 acc 83.984 (84.773)	lr 0.00434
Train [88][570/3239]	Time 0.241 (0.619)	Data Time 0.001 (0.077)	Loss 2.4913 (2.4349)	Entropy 0.58028 (0.58098)	Top-1 acc 63.672 (65.339)	Top-5 acc 82.031 (84.797)	lr 0.00434
Train [88][580/3239]	Time 0.230 (0.616)	Data Time 0.001 (0.076)	Loss 3.0921 (2.4371)	Entropy 0.58041 (0.58097)	Top-1 acc 50.781 (65.283)	Top-5 acc 69.141 (84.751)	lr 0.00434
Train [88][590/3239]	Time 0.230 (0.613)	Data Time 0.001 (0.074)	Loss 2.6780 (2.4369)	Entropy 0.58009 (0.58096)	Top-1 acc 60.547 (65.293)	Top-5 acc 80.859 (84.762)	lr 0.00434
Train [88][600/3239]	Time 0.280 (0.610)	Data Time 0.001 (0.073)	Loss 2.3642 (2.4360)	Entropy 0.58025 (0.58095)	Top-1 acc 64.844 (65.318)	Top-5 acc 85.156 (84.784)	lr 0.00434
Train [88][610/3239]	Time 0.237 (0.607)	Data Time 0.001 (0.072)	Loss 2.4417 (2.4361)	Entropy 0.58037 (0.58094)	Top-1 acc 64.062 (65.310)	Top-5 acc 84.766 (84.784)	lr 0.00434
Train [88][620/3239]	Time 0.334 (0.604)	Data Time 0.001 (0.071)	Loss 2.4073 (2.4353)	Entropy 0.58056 (0.58093)	Top-1 acc 67.578 (65.341)	Top-5 acc 85.938 (84.790)	lr 0.00433
Train [88][630/3239]	Time 0.231 (0.602)	Data Time 0.001 (0.070)	Loss 2.2910 (2.4357)	Entropy 0.58048 (0.58093)	Top-1 acc 67.188 (65.324)	Top-5 acc 87.891 (84.777)	lr 0.00433
Train [88][640/3239]	Time 0.237 (0.599)	Data Time 0.001 (0.069)	Loss 2.3144 (2.4351)	Entropy 0.58075 (0.58092)	Top-1 acc 67.969 (65.350)	Top-5 acc 85.938 (84.789)	lr 0.00433
Train [88][650/3239]	Time 0.234 (0.596)	Data Time 0.002 (0.068)	Loss 2.5872 (2.4346)	Entropy 0.58058 (0.58092)	Top-1 acc 60.156 (65.360)	Top-5 acc 83.984 (84.792)	lr 0.00433
Train [88][660/3239]	Time 0.239 (0.594)	Data Time 0.001 (0.067)	Loss 2.3385 (2.4343)	Entropy 0.58042 (0.58091)	Top-1 acc 70.312 (65.384)	Top-5 acc 85.156 (84.785)	lr 0.00433
Train [88][670/3239]	Time 0.239 (0.592)	Data Time 0.001 (0.066)	Loss 2.4315 (2.4344)	Entropy 0.58002 (0.58090)	Top-1 acc 66.406 (65.383)	Top-5 acc 84.375 (84.784)	lr 0.00433
Train [88][680/3239]	Time 0.242 (0.589)	Data Time 0.001 (0.065)	Loss 2.2286 (2.4340)	Entropy 0.57990 (0.58089)	Top-1 acc 69.141 (65.410)	Top-5 acc 89.062 (84.791)	lr 0.00433
Train [88][690/3239]	Time 0.345 (0.587)	Data Time 0.001 (0.064)	Loss 2.3620 (2.4343)	Entropy 0.58014 (0.58088)	Top-1 acc 70.703 (65.404)	Top-5 acc 82.422 (84.781)	lr 0.00433
Train [88][700/3239]	Time 0.239 (0.586)	Data Time 0.001 (0.063)	Loss 2.5648 (2.4341)	Entropy 0.58006 (0.58086)	Top-1 acc 60.156 (65.407)	Top-5 acc 83.594 (84.782)	lr 0.00433
Train [88][710/3239]	Time 0.222 (0.584)	Data Time 0.001 (0.062)	Loss 2.3010 (2.4344)	Entropy 0.58010 (0.58085)	Top-1 acc 67.969 (65.404)	Top-5 acc 87.109 (84.777)	lr 0.00433
Train [88][720/3239]	Time 0.229 (0.582)	Data Time 0.001 (0.061)	Loss 2.4161 (2.4348)	Entropy 0.58021 (0.58084)	Top-1 acc 68.750 (65.402)	Top-5 acc 83.984 (84.766)	lr 0.00433
Train [88][730/3239]	Time 0.233 (0.580)	Data Time 0.001 (0.060)	Loss 2.3749 (2.4354)	Entropy 0.58034 (0.58083)	Top-1 acc 69.141 (65.380)	Top-5 acc 86.328 (84.758)	lr 0.00433
Train [88][740/3239]	Time 0.234 (0.578)	Data Time 0.001 (0.060)	Loss 2.3782 (2.4352)	Entropy 0.58014 (0.58083)	Top-1 acc 70.312 (65.380)	Top-5 acc 85.547 (84.765)	lr 0.00433
Train [88][750/3239]	Time 0.233 (0.576)	Data Time 0.001 (0.059)	Loss 2.5204 (2.4350)	Entropy 0.58027 (0.58082)	Top-1 acc 64.062 (65.373)	Top-5 acc 83.984 (84.766)	lr 0.00432
Train [88][760/3239]	Time 0.236 (0.574)	Data Time 0.001 (0.058)	Loss 2.5287 (2.4356)	Entropy 0.57987 (0.58081)	Top-1 acc 61.719 (65.366)	Top-5 acc 82.422 (84.752)	lr 0.00432
Train [88][770/3239]	Time 0.233 (0.572)	Data Time 0.001 (0.057)	Loss 2.5122 (2.4365)	Entropy 0.57972 (0.58079)	Top-1 acc 62.109 (65.352)	Top-5 acc 82.812 (84.738)	lr 0.00432
Train [88][780/3239]	Time 0.230 (0.570)	Data Time 0.001 (0.057)	Loss 2.4539 (2.4361)	Entropy 0.57976 (0.58078)	Top-1 acc 65.625 (65.359)	Top-5 acc 83.984 (84.751)	lr 0.00432
Train [88][790/3239]	Time 0.234 (0.568)	Data Time 0.001 (0.056)	Loss 2.4385 (2.4360)	Entropy 0.57967 (0.58077)	Top-1 acc 66.406 (65.349)	Top-5 acc 84.375 (84.749)	lr 0.00432
Train [88][800/3239]	Time 0.233 (0.566)	Data Time 0.001 (0.055)	Loss 2.4838 (2.4364)	Entropy 0.57965 (0.58075)	Top-1 acc 60.938 (65.347)	Top-5 acc 86.328 (84.746)	lr 0.00432
Train [88][810/3239]	Time 0.226 (0.564)	Data Time 0.001 (0.055)	Loss 2.4501 (2.4364)	Entropy 0.57973 (0.58074)	Top-1 acc 62.891 (65.330)	Top-5 acc 86.719 (84.745)	lr 0.00432
Train [88][820/3239]	Time 0.229 (0.562)	Data Time 0.001 (0.054)	Loss 2.2714 (2.4365)	Entropy 0.57992 (0.58073)	Top-1 acc 71.484 (65.330)	Top-5 acc 88.281 (84.751)	lr 0.00432
Train [88][830/3239]	Time 0.261 (0.560)	Data Time 0.001 (0.053)	Loss 2.3721 (2.4366)	Entropy 0.57985 (0.58072)	Top-1 acc 63.672 (65.314)	Top-5 acc 87.891 (84.757)	lr 0.00432
Train [88][840/3239]	Time 0.233 (0.559)	Data Time 0.001 (0.053)	Loss 2.4150 (2.4360)	Entropy 0.57961 (0.58071)	Top-1 acc 69.141 (65.338)	Top-5 acc 85.938 (84.764)	lr 0.00432
Train [88][850/3239]	Time 0.313 (0.557)	Data Time 0.001 (0.052)	Loss 2.4345 (2.4365)	Entropy 0.57938 (0.58069)	Top-1 acc 63.672 (65.334)	Top-5 acc 85.156 (84.749)	lr 0.00432
Train [88][860/3239]	Time 0.223 (0.555)	Data Time 0.001 (0.052)	Loss 2.6594 (2.4366)	Entropy 0.57944 (0.58068)	Top-1 acc 61.328 (65.332)	Top-5 acc 80.859 (84.749)	lr 0.00432
Train [88][870/3239]	Time 0.229 (0.553)	Data Time 0.001 (0.051)	Loss 2.5111 (2.4364)	Entropy 0.57939 (0.58066)	Top-1 acc 66.797 (65.336)	Top-5 acc 83.594 (84.750)	lr 0.00432
Train [88][880/3239]	Time 0.268 (0.552)	Data Time 0.002 (0.050)	Loss 2.5448 (2.4366)	Entropy 0.57930 (0.58065)	Top-1 acc 66.797 (65.333)	Top-5 acc 83.984 (84.740)	lr 0.00431
Train [88][890/3239]	Time 0.237 (0.550)	Data Time 0.001 (0.050)	Loss 2.6283 (2.4364)	Entropy 0.57941 (0.58064)	Top-1 acc 61.719 (65.325)	Top-5 acc 78.125 (84.737)	lr 0.00431
Train [88][900/3239]	Time 0.236 (0.549)	Data Time 0.001 (0.049)	Loss 2.4124 (2.4366)	Entropy 0.57914 (0.58062)	Top-1 acc 65.625 (65.323)	Top-5 acc 86.328 (84.732)	lr 0.00431
Train [88][910/3239]	Time 0.236 (0.547)	Data Time 0.001 (0.049)	Loss 2.3948 (2.4366)	Entropy 0.57924 (0.58060)	Top-1 acc 67.578 (65.324)	Top-5 acc 83.594 (84.733)	lr 0.00431
Train [88][920/3239]	Time 0.370 (0.546)	Data Time 0.001 (0.048)	Loss 2.2773 (2.4360)	Entropy 0.57922 (0.58059)	Top-1 acc 67.188 (65.336)	Top-5 acc 88.672 (84.748)	lr 0.00431
Train [88][930/3239]	Time 0.228 (0.545)	Data Time 0.001 (0.048)	Loss 2.3512 (2.4360)	Entropy 0.57957 (0.58058)	Top-1 acc 68.359 (65.337)	Top-5 acc 85.547 (84.747)	lr 0.00431
Train [88][940/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.047)	Loss 2.3327 (2.4367)	Entropy 0.57953 (0.58057)	Top-1 acc 66.797 (65.323)	Top-5 acc 84.766 (84.739)	lr 0.00431
Train [88][950/3239]	Time 0.243 (0.542)	Data Time 0.001 (0.047)	Loss 2.4030 (2.4358)	Entropy 0.57975 (0.58056)	Top-1 acc 62.500 (65.336)	Top-5 acc 87.109 (84.759)	lr 0.00431
Train [88][960/3239]	Time 0.239 (0.541)	Data Time 0.001 (0.046)	Loss 2.3719 (2.4356)	Entropy 0.57964 (0.58055)	Top-1 acc 64.062 (65.339)	Top-5 acc 86.328 (84.762)	lr 0.00431
Train [88][970/3239]	Time 0.233 (0.540)	Data Time 0.001 (0.046)	Loss 2.5635 (2.4355)	Entropy 0.57994 (0.58054)	Top-1 acc 62.109 (65.331)	Top-5 acc 82.812 (84.770)	lr 0.00431
Train [88][980/3239]	Time 0.239 (0.539)	Data Time 0.001 (0.045)	Loss 2.4146 (2.4357)	Entropy 0.57993 (0.58053)	Top-1 acc 62.500 (65.319)	Top-5 acc 85.156 (84.770)	lr 0.00431
Train [88][990/3239]	Time 0.230 (0.538)	Data Time 0.001 (0.045)	Loss 2.3705 (2.4357)	Entropy 0.58008 (0.58053)	Top-1 acc 65.625 (65.312)	Top-5 acc 86.328 (84.771)	lr 0.00431
Train [88][1000/3239]	Time 0.259 (0.537)	Data Time 0.002 (0.045)	Loss 2.4345 (2.4353)	Entropy 0.58022 (0.58052)	Top-1 acc 65.625 (65.317)	Top-5 acc 85.547 (84.782)	lr 0.00431
Train [88][1010/3239]	Time 0.360 (0.536)	Data Time 0.001 (0.044)	Loss 2.3144 (2.4349)	Entropy 0.57976 (0.58052)	Top-1 acc 69.922 (65.332)	Top-5 acc 87.109 (84.797)	lr 0.00430
Train [88][1020/3239]	Time 0.228 (0.535)	Data Time 0.001 (0.044)	Loss 2.2634 (2.4351)	Entropy 0.57986 (0.58051)	Top-1 acc 69.922 (65.330)	Top-5 acc 86.328 (84.789)	lr 0.00430
Train [88][1030/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.043)	Loss 2.4098 (2.4350)	Entropy 0.58014 (0.58051)	Top-1 acc 67.188 (65.326)	Top-5 acc 84.766 (84.790)	lr 0.00430
Train [88][1040/3239]	Time 0.227 (0.533)	Data Time 0.001 (0.043)	Loss 2.4668 (2.4354)	Entropy 0.58028 (0.58050)	Top-1 acc 66.406 (65.312)	Top-5 acc 83.594 (84.785)	lr 0.00430
Train [88][1050/3239]	Time 0.384 (0.580)	Data Time 0.006 (0.042)	Loss 2.3653 (2.4351)	Entropy 0.58045 (0.58050)	Top-1 acc 66.797 (65.317)	Top-5 acc 85.156 (84.791)	lr 0.00430
Train [88][1060/3239]	Time 0.240 (0.580)	Data Time 0.002 (0.042)	Loss 2.4382 (2.4350)	Entropy 0.58011 (0.58050)	Top-1 acc 61.719 (65.309)	Top-5 acc 83.984 (84.801)	lr 0.00430
Train [88][1070/3239]	Time 0.255 (0.579)	Data Time 0.001 (0.042)	Loss 2.5071 (2.4354)	Entropy 0.58026 (0.58050)	Top-1 acc 63.281 (65.306)	Top-5 acc 84.766 (84.794)	lr 0.00430
Train [88][1080/3239]	Time 0.327 (0.577)	Data Time 0.002 (0.041)	Loss 2.4646 (2.4350)	Entropy 0.58032 (0.58050)	Top-1 acc 62.500 (65.316)	Top-5 acc 82.422 (84.798)	lr 0.00430
Train [88][1090/3239]	Time 0.240 (0.576)	Data Time 0.001 (0.041)	Loss 2.5058 (2.4351)	Entropy 0.58028 (0.58049)	Top-1 acc 63.281 (65.319)	Top-5 acc 82.422 (84.797)	lr 0.00430
Train [88][1100/3239]	Time 0.246 (0.575)	Data Time 0.001 (0.041)	Loss 2.4805 (2.4348)	Entropy 0.57985 (0.58049)	Top-1 acc 66.016 (65.328)	Top-5 acc 84.766 (84.801)	lr 0.00430
Train [88][1110/3239]	Time 0.248 (0.574)	Data Time 0.001 (0.040)	Loss 2.3099 (2.4347)	Entropy 0.57988 (0.58049)	Top-1 acc 66.406 (65.340)	Top-5 acc 87.109 (84.803)	lr 0.00430
Train [88][1120/3239]	Time 0.255 (0.572)	Data Time 0.001 (0.040)	Loss 2.5752 (2.4344)	Entropy 0.57992 (0.58048)	Top-1 acc 61.719 (65.344)	Top-5 acc 79.297 (84.803)	lr 0.00430
Train [88][1130/3239]	Time 0.242 (0.571)	Data Time 0.001 (0.040)	Loss 2.5033 (2.4349)	Entropy 0.57970 (0.58048)	Top-1 acc 63.672 (65.327)	Top-5 acc 80.469 (84.790)	lr 0.00430
Train [88][1140/3239]	Time 0.253 (0.570)	Data Time 0.001 (0.039)	Loss 2.2457 (2.4347)	Entropy 0.57963 (0.58047)	Top-1 acc 73.438 (65.336)	Top-5 acc 87.500 (84.792)	lr 0.00429
Train [88][1150/3239]	Time 0.248 (0.569)	Data Time 0.001 (0.039)	Loss 2.4244 (2.4348)	Entropy 0.57946 (0.58046)	Top-1 acc 66.016 (65.331)	Top-5 acc 83.203 (84.788)	lr 0.00429
Train [88][1160/3239]	Time 0.232 (0.568)	Data Time 0.001 (0.039)	Loss 2.3447 (2.4350)	Entropy 0.57989 (0.58045)	Top-1 acc 64.844 (65.324)	Top-5 acc 84.375 (84.788)	lr 0.00429
Train [88][1170/3239]	Time 0.337 (0.567)	Data Time 0.001 (0.038)	Loss 2.3160 (2.4350)	Entropy 0.58018 (0.58045)	Top-1 acc 70.312 (65.325)	Top-5 acc 86.328 (84.788)	lr 0.00429
Train [88][1180/3239]	Time 0.242 (0.566)	Data Time 0.001 (0.038)	Loss 2.3660 (2.4350)	Entropy 0.58034 (0.58045)	Top-1 acc 68.750 (65.315)	Top-5 acc 84.375 (84.784)	lr 0.00429
Train [88][1190/3239]	Time 0.233 (0.565)	Data Time 0.002 (0.038)	Loss 2.3931 (2.4355)	Entropy 0.58041 (0.58045)	Top-1 acc 69.922 (65.301)	Top-5 acc 83.594 (84.776)	lr 0.00429
Train [88][1200/3239]	Time 0.246 (0.564)	Data Time 0.001 (0.037)	Loss 2.6532 (2.4356)	Entropy 0.58045 (0.58045)	Top-1 acc 59.766 (65.292)	Top-5 acc 82.422 (84.783)	lr 0.00429
Train [88][1210/3239]	Time 0.235 (0.563)	Data Time 0.001 (0.037)	Loss 2.9932 (2.4357)	Entropy 0.58085 (0.58045)	Top-1 acc 50.781 (65.280)	Top-5 acc 76.953 (84.784)	lr 0.00429
Train [88][1220/3239]	Time 0.231 (0.562)	Data Time 0.001 (0.037)	Loss 2.4288 (2.4353)	Entropy 0.58091 (0.58045)	Top-1 acc 66.016 (65.288)	Top-5 acc 87.109 (84.792)	lr 0.00429
Train [88][1230/3239]	Time 0.235 (0.561)	Data Time 0.001 (0.037)	Loss 2.4967 (2.4359)	Entropy 0.58068 (0.58045)	Top-1 acc 66.797 (65.280)	Top-5 acc 82.812 (84.784)	lr 0.00429
Train [88][1240/3239]	Time 0.333 (0.560)	Data Time 0.001 (0.036)	Loss 2.4306 (2.4359)	Entropy 0.58076 (0.58045)	Top-1 acc 67.188 (65.284)	Top-5 acc 83.203 (84.787)	lr 0.00429
Train [88][1250/3239]	Time 0.237 (0.559)	Data Time 0.001 (0.036)	Loss 2.4803 (2.4360)	Entropy 0.58062 (0.58046)	Top-1 acc 63.281 (65.284)	Top-5 acc 83.203 (84.780)	lr 0.00429
Train [88][1260/3239]	Time 0.239 (0.558)	Data Time 0.001 (0.036)	Loss 2.3604 (2.4360)	Entropy 0.58057 (0.58046)	Top-1 acc 67.578 (65.284)	Top-5 acc 85.938 (84.784)	lr 0.00429
Train [88][1270/3239]	Time 0.229 (0.557)	Data Time 0.001 (0.035)	Loss 2.5118 (2.4360)	Entropy 0.58086 (0.58046)	Top-1 acc 64.844 (65.288)	Top-5 acc 83.203 (84.782)	lr 0.00428
Train [88][1280/3239]	Time 0.232 (0.556)	Data Time 0.001 (0.035)	Loss 2.3987 (2.4360)	Entropy 0.58095 (0.58046)	Top-1 acc 64.453 (65.281)	Top-5 acc 86.719 (84.785)	lr 0.00428
Train [88][1290/3239]	Time 0.235 (0.555)	Data Time 0.001 (0.035)	Loss 2.4308 (2.4359)	Entropy 0.58099 (0.58047)	Top-1 acc 67.969 (65.282)	Top-5 acc 84.766 (84.787)	lr 0.00428
Train [88][1300/3239]	Time 0.247 (0.554)	Data Time 0.002 (0.035)	Loss 2.2536 (2.4361)	Entropy 0.58087 (0.58047)	Top-1 acc 66.406 (65.276)	Top-5 acc 90.234 (84.791)	lr 0.00428
Train [88][1310/3239]	Time 0.241 (0.553)	Data Time 0.001 (0.034)	Loss 2.4270 (2.4362)	Entropy 0.58113 (0.58047)	Top-1 acc 66.797 (65.273)	Top-5 acc 85.547 (84.794)	lr 0.00428
Train [88][1320/3239]	Time 0.221 (0.552)	Data Time 0.001 (0.034)	Loss 2.6658 (2.4359)	Entropy 0.58105 (0.58048)	Top-1 acc 60.938 (65.283)	Top-5 acc 82.422 (84.802)	lr 0.00428
Train [88][1330/3239]	Time 0.268 (0.551)	Data Time 0.001 (0.034)	Loss 2.6827 (2.4366)	Entropy 0.58090 (0.58048)	Top-1 acc 58.984 (65.265)	Top-5 acc 80.078 (84.794)	lr 0.00428
Train [88][1340/3239]	Time 0.234 (0.550)	Data Time 0.001 (0.034)	Loss 2.2713 (2.4368)	Entropy 0.58073 (0.58049)	Top-1 acc 70.312 (65.258)	Top-5 acc 88.672 (84.793)	lr 0.00428
Train [88][1350/3239]	Time 0.294 (0.550)	Data Time 0.001 (0.033)	Loss 2.4369 (2.4369)	Entropy 0.58032 (0.58049)	Top-1 acc 64.453 (65.253)	Top-5 acc 83.984 (84.790)	lr 0.00428
Train [88][1360/3239]	Time 0.250 (0.550)	Data Time 0.001 (0.033)	Loss 2.3252 (2.4368)	Entropy 0.58046 (0.58049)	Top-1 acc 71.094 (65.254)	Top-5 acc 84.766 (84.787)	lr 0.00428
Train [88][1370/3239]	Time 0.246 (0.549)	Data Time 0.001 (0.033)	Loss 2.2896 (2.4371)	Entropy 0.57989 (0.58048)	Top-1 acc 67.188 (65.239)	Top-5 acc 87.500 (84.784)	lr 0.00428
Train [88][1380/3239]	Time 0.221 (0.549)	Data Time 0.001 (0.033)	Loss 2.7162 (2.4376)	Entropy 0.57955 (0.58048)	Top-1 acc 56.250 (65.224)	Top-5 acc 82.031 (84.779)	lr 0.00428
Train [88][1390/3239]	Time 0.238 (0.548)	Data Time 0.001 (0.033)	Loss 2.3997 (2.4377)	Entropy 0.57956 (0.58047)	Top-1 acc 65.625 (65.222)	Top-5 acc 84.766 (84.773)	lr 0.00428
Train [88][1400/3239]	Time 0.349 (0.547)	Data Time 0.002 (0.032)	Loss 2.5395 (2.4377)	Entropy 0.57990 (0.58047)	Top-1 acc 63.281 (65.226)	Top-5 acc 82.422 (84.766)	lr 0.00427
Train [88][1410/3239]	Time 0.260 (0.546)	Data Time 0.001 (0.032)	Loss 2.5492 (2.4377)	Entropy 0.57985 (0.58046)	Top-1 acc 64.453 (65.231)	Top-5 acc 82.812 (84.767)	lr 0.00427
Train [88][1420/3239]	Time 0.226 (0.545)	Data Time 0.001 (0.032)	Loss 2.3272 (2.4378)	Entropy 0.57967 (0.58046)	Top-1 acc 64.844 (65.228)	Top-5 acc 87.500 (84.768)	lr 0.00427
Train [88][1430/3239]	Time 0.226 (0.544)	Data Time 0.001 (0.032)	Loss 2.6272 (2.4377)	Entropy 0.57970 (0.58045)	Top-1 acc 58.984 (65.228)	Top-5 acc 80.859 (84.769)	lr 0.00427
Train [88][1440/3239]	Time 0.278 (0.543)	Data Time 0.001 (0.031)	Loss 2.5533 (2.4376)	Entropy 0.57976 (0.58045)	Top-1 acc 64.453 (65.236)	Top-5 acc 81.250 (84.769)	lr 0.00427
Train [88][1450/3239]	Time 0.230 (0.543)	Data Time 0.001 (0.031)	Loss 2.3409 (2.4374)	Entropy 0.58003 (0.58044)	Top-1 acc 67.969 (65.238)	Top-5 acc 85.547 (84.773)	lr 0.00427
Train [88][1460/3239]	Time 0.244 (0.542)	Data Time 0.001 (0.031)	Loss 2.3598 (2.4377)	Entropy 0.57969 (0.58044)	Top-1 acc 67.578 (65.236)	Top-5 acc 86.328 (84.766)	lr 0.00427
Train [88][1470/3239]	Time 0.330 (0.541)	Data Time 0.001 (0.031)	Loss 2.2980 (2.4377)	Entropy 0.57997 (0.58043)	Top-1 acc 66.406 (65.241)	Top-5 acc 89.844 (84.769)	lr 0.00427
Train [88][1480/3239]	Time 0.235 (0.540)	Data Time 0.001 (0.031)	Loss 2.4958 (2.4379)	Entropy 0.58008 (0.58043)	Top-1 acc 62.891 (65.234)	Top-5 acc 80.469 (84.762)	lr 0.00427
Train [88][1490/3239]	Time 0.264 (0.539)	Data Time 0.002 (0.030)	Loss 2.3906 (2.4376)	Entropy 0.57991 (0.58043)	Top-1 acc 62.500 (65.239)	Top-5 acc 85.938 (84.764)	lr 0.00427
Train [88][1500/3239]	Time 0.234 (0.538)	Data Time 0.002 (0.030)	Loss 2.5319 (2.4378)	Entropy 0.58003 (0.58043)	Top-1 acc 65.234 (65.230)	Top-5 acc 80.078 (84.763)	lr 0.00427
Train [88][1510/3239]	Time 0.241 (0.538)	Data Time 0.002 (0.030)	Loss 2.4704 (2.4376)	Entropy 0.58015 (0.58042)	Top-1 acc 67.578 (65.237)	Top-5 acc 83.594 (84.772)	lr 0.00427
Train [88][1520/3239]	Time 0.237 (0.537)	Data Time 0.002 (0.030)	Loss 2.4741 (2.4379)	Entropy 0.58024 (0.58042)	Top-1 acc 63.281 (65.236)	Top-5 acc 84.766 (84.765)	lr 0.00427
Train [88][1530/3239]	Time 0.237 (0.536)	Data Time 0.001 (0.030)	Loss 2.6529 (2.4381)	Entropy 0.58019 (0.58042)	Top-1 acc 60.156 (65.227)	Top-5 acc 81.250 (84.759)	lr 0.00427
Train [88][1540/3239]	Time 0.235 (0.536)	Data Time 0.001 (0.030)	Loss 2.6616 (2.4382)	Entropy 0.58012 (0.58042)	Top-1 acc 58.203 (65.219)	Top-5 acc 82.812 (84.762)	lr 0.00426
Train [88][1550/3239]	Time 0.224 (0.535)	Data Time 0.001 (0.029)	Loss 2.4424 (2.4380)	Entropy 0.58000 (0.58042)	Top-1 acc 64.453 (65.228)	Top-5 acc 87.109 (84.770)	lr 0.00426
Train [88][1560/3239]	Time 0.325 (0.534)	Data Time 0.001 (0.029)	Loss 2.4206 (2.4385)	Entropy 0.58013 (0.58041)	Top-1 acc 62.891 (65.213)	Top-5 acc 84.375 (84.762)	lr 0.00426
Train [88][1570/3239]	Time 0.233 (0.533)	Data Time 0.001 (0.029)	Loss 2.4535 (2.4387)	Entropy 0.58002 (0.58041)	Top-1 acc 62.500 (65.210)	Top-5 acc 82.812 (84.756)	lr 0.00426
Train [88][1580/3239]	Time 0.237 (0.532)	Data Time 0.001 (0.029)	Loss 2.2571 (2.4383)	Entropy 0.57994 (0.58041)	Top-1 acc 71.094 (65.216)	Top-5 acc 86.328 (84.764)	lr 0.00426
Train [88][1590/3239]	Time 0.226 (0.532)	Data Time 0.001 (0.029)	Loss 2.2599 (2.4380)	Entropy 0.57977 (0.58041)	Top-1 acc 68.359 (65.220)	Top-5 acc 89.062 (84.771)	lr 0.00426
Train [88][1600/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.028)	Loss 2.4749 (2.4382)	Entropy 0.57980 (0.58040)	Top-1 acc 61.328 (65.216)	Top-5 acc 84.375 (84.768)	lr 0.00426
Train [88][1610/3239]	Time 0.272 (0.530)	Data Time 0.001 (0.028)	Loss 2.3031 (2.4377)	Entropy 0.57981 (0.58040)	Top-1 acc 68.750 (65.224)	Top-5 acc 87.891 (84.775)	lr 0.00426
Train [88][1620/3239]	Time 0.284 (0.530)	Data Time 0.002 (0.028)	Loss 2.4000 (2.4378)	Entropy 0.57973 (0.58039)	Top-1 acc 62.500 (65.223)	Top-5 acc 84.766 (84.773)	lr 0.00426
Train [88][1630/3239]	Time 0.324 (0.530)	Data Time 0.001 (0.028)	Loss 2.4663 (2.4373)	Entropy 0.57964 (0.58039)	Top-1 acc 60.938 (65.228)	Top-5 acc 86.328 (84.784)	lr 0.00426
Train [88][1640/3239]	Time 0.230 (0.529)	Data Time 0.001 (0.028)	Loss 2.4456 (2.4372)	Entropy 0.57975 (0.58039)	Top-1 acc 66.797 (65.242)	Top-5 acc 85.547 (84.782)	lr 0.00426
Train [88][1650/3239]	Time 0.233 (0.528)	Data Time 0.001 (0.028)	Loss 2.3505 (2.4373)	Entropy 0.57965 (0.58038)	Top-1 acc 68.359 (65.239)	Top-5 acc 86.719 (84.781)	lr 0.00426
Train [88][1660/3239]	Time 0.233 (0.528)	Data Time 0.001 (0.028)	Loss 2.3347 (2.4373)	Entropy 0.57908 (0.58038)	Top-1 acc 64.453 (65.238)	Top-5 acc 88.672 (84.780)	lr 0.00426
Train [88][1670/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.027)	Loss 2.4794 (2.4373)	Entropy 0.57893 (0.58037)	Top-1 acc 62.891 (65.234)	Top-5 acc 83.594 (84.779)	lr 0.00425
Train [88][1680/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.027)	Loss 2.2633 (2.4370)	Entropy 0.57890 (0.58036)	Top-1 acc 67.969 (65.237)	Top-5 acc 87.891 (84.786)	lr 0.00425
Train [88][1690/3239]	Time 0.230 (0.526)	Data Time 0.001 (0.027)	Loss 2.4270 (2.4371)	Entropy 0.57895 (0.58035)	Top-1 acc 67.188 (65.237)	Top-5 acc 82.422 (84.785)	lr 0.00425
Train [88][1700/3239]	Time 0.223 (0.525)	Data Time 0.001 (0.027)	Loss 2.4339 (2.4373)	Entropy 0.57900 (0.58034)	Top-1 acc 64.062 (65.228)	Top-5 acc 82.812 (84.779)	lr 0.00425
Train [88][1710/3239]	Time 0.245 (0.555)	Data Time 0.002 (0.027)	Loss 2.6274 (2.4374)	Entropy 0.57901 (0.58034)	Top-1 acc 60.938 (65.224)	Top-5 acc 85.547 (84.781)	lr 0.00425
Train [88][1720/3239]	Time 0.332 (0.554)	Data Time 0.002 (0.027)	Loss 2.3820 (2.4377)	Entropy 0.57880 (0.58033)	Top-1 acc 66.406 (65.216)	Top-5 acc 85.547 (84.773)	lr 0.00425
Train [88][1730/3239]	Time 0.232 (0.553)	Data Time 0.002 (0.026)	Loss 2.5449 (2.4379)	Entropy 0.57892 (0.58032)	Top-1 acc 62.500 (65.215)	Top-5 acc 82.812 (84.772)	lr 0.00425
Train [88][1740/3239]	Time 0.232 (0.553)	Data Time 0.001 (0.026)	Loss 2.3791 (2.4378)	Entropy 0.57878 (0.58031)	Top-1 acc 63.672 (65.221)	Top-5 acc 87.891 (84.770)	lr 0.00425
Train [88][1750/3239]	Time 0.232 (0.552)	Data Time 0.001 (0.026)	Loss 2.2586 (2.4377)	Entropy 0.57905 (0.58030)	Top-1 acc 70.312 (65.225)	Top-5 acc 87.500 (84.775)	lr 0.00425
Train [88][1760/3239]	Time 0.236 (0.551)	Data Time 0.001 (0.026)	Loss 2.4829 (2.4375)	Entropy 0.57884 (0.58030)	Top-1 acc 64.844 (65.228)	Top-5 acc 83.984 (84.780)	lr 0.00425
Train [88][1770/3239]	Time 0.243 (0.550)	Data Time 0.001 (0.026)	Loss 2.3843 (2.4372)	Entropy 0.57898 (0.58029)	Top-1 acc 66.016 (65.232)	Top-5 acc 86.328 (84.784)	lr 0.00425
Train [88][1780/3239]	Time 0.271 (0.550)	Data Time 0.003 (0.026)	Loss 2.3210 (2.4371)	Entropy 0.57898 (0.58028)	Top-1 acc 67.578 (65.234)	Top-5 acc 85.156 (84.786)	lr 0.00425
Train [88][1790/3239]	Time 0.338 (0.549)	Data Time 0.001 (0.026)	Loss 2.2389 (2.4376)	Entropy 0.57871 (0.58027)	Top-1 acc 69.922 (65.229)	Top-5 acc 90.234 (84.779)	lr 0.00425
Train [88][1800/3239]	Time 0.239 (0.549)	Data Time 0.001 (0.026)	Loss 2.5261 (2.4375)	Entropy 0.57865 (0.58027)	Top-1 acc 62.891 (65.231)	Top-5 acc 80.859 (84.777)	lr 0.00424
Train [88][1810/3239]	Time 0.247 (0.548)	Data Time 0.001 (0.025)	Loss 2.5099 (2.4372)	Entropy 0.57853 (0.58026)	Top-1 acc 63.672 (65.236)	Top-5 acc 80.859 (84.783)	lr 0.00424
Train [88][1820/3239]	Time 0.247 (0.548)	Data Time 0.001 (0.025)	Loss 2.4006 (2.4371)	Entropy 0.57878 (0.58025)	Top-1 acc 66.016 (65.237)	Top-5 acc 85.156 (84.786)	lr 0.00424
Train [88][1830/3239]	Time 0.240 (0.547)	Data Time 0.001 (0.025)	Loss 2.4763 (2.4372)	Entropy 0.57881 (0.58024)	Top-1 acc 64.844 (65.228)	Top-5 acc 85.156 (84.788)	lr 0.00424
Train [88][1840/3239]	Time 0.240 (0.547)	Data Time 0.001 (0.025)	Loss 2.2517 (2.4370)	Entropy 0.57889 (0.58023)	Top-1 acc 69.141 (65.234)	Top-5 acc 88.672 (84.790)	lr 0.00424
Train [88][1850/3239]	Time 0.292 (0.546)	Data Time 0.003 (0.025)	Loss 2.2108 (2.4370)	Entropy 0.57887 (0.58022)	Top-1 acc 73.828 (65.233)	Top-5 acc 90.234 (84.790)	lr 0.00424
Train [88][1860/3239]	Time 0.242 (0.545)	Data Time 0.001 (0.025)	Loss 2.4220 (2.4370)	Entropy 0.57918 (0.58022)	Top-1 acc 66.797 (65.232)	Top-5 acc 86.719 (84.793)	lr 0.00424
Train [88][1870/3239]	Time 0.238 (0.545)	Data Time 0.001 (0.025)	Loss 2.4061 (2.4367)	Entropy 0.57896 (0.58021)	Top-1 acc 69.141 (65.236)	Top-5 acc 83.984 (84.793)	lr 0.00424
Train [88][1880/3239]	Time 0.264 (0.544)	Data Time 0.001 (0.024)	Loss 2.5084 (2.4367)	Entropy 0.57886 (0.58021)	Top-1 acc 62.500 (65.233)	Top-5 acc 82.812 (84.793)	lr 0.00424
Train [88][1890/3239]	Time 0.242 (0.544)	Data Time 0.001 (0.024)	Loss 2.4164 (2.4367)	Entropy 0.57874 (0.58020)	Top-1 acc 64.844 (65.232)	Top-5 acc 83.984 (84.790)	lr 0.00424
Train [88][1900/3239]	Time 0.240 (0.543)	Data Time 0.001 (0.024)	Loss 2.4483 (2.4367)	Entropy 0.57871 (0.58019)	Top-1 acc 66.016 (65.228)	Top-5 acc 84.375 (84.790)	lr 0.00424
Train [88][1910/3239]	Time 0.228 (0.542)	Data Time 0.001 (0.024)	Loss 2.3834 (2.4368)	Entropy 0.57883 (0.58018)	Top-1 acc 67.188 (65.225)	Top-5 acc 86.328 (84.787)	lr 0.00424
Train [88][1920/3239]	Time 0.236 (0.542)	Data Time 0.001 (0.024)	Loss 2.4329 (2.4370)	Entropy 0.57866 (0.58018)	Top-1 acc 62.891 (65.219)	Top-5 acc 85.156 (84.787)	lr 0.00424
Train [88][1930/3239]	Time 0.236 (0.541)	Data Time 0.001 (0.024)	Loss 2.4922 (2.4368)	Entropy 0.57886 (0.58017)	Top-1 acc 61.719 (65.224)	Top-5 acc 83.203 (84.788)	lr 0.00423
Train [88][1940/3239]	Time 0.231 (0.541)	Data Time 0.001 (0.024)	Loss 2.4142 (2.4368)	Entropy 0.57838 (0.58016)	Top-1 acc 62.500 (65.216)	Top-5 acc 85.938 (84.793)	lr 0.00423
Train [88][1950/3239]	Time 0.332 (0.540)	Data Time 0.001 (0.024)	Loss 2.2924 (2.4368)	Entropy 0.57820 (0.58015)	Top-1 acc 69.141 (65.216)	Top-5 acc 86.719 (84.792)	lr 0.00423
Train [88][1960/3239]	Time 0.226 (0.540)	Data Time 0.001 (0.024)	Loss 2.4047 (2.4367)	Entropy 0.57837 (0.58014)	Top-1 acc 68.750 (65.219)	Top-5 acc 85.938 (84.798)	lr 0.00423
Train [88][1970/3239]	Time 0.246 (0.539)	Data Time 0.001 (0.023)	Loss 2.2805 (2.4367)	Entropy 0.57816 (0.58013)	Top-1 acc 71.484 (65.220)	Top-5 acc 87.109 (84.799)	lr 0.00423
Train [88][1980/3239]	Time 0.244 (0.539)	Data Time 0.001 (0.023)	Loss 2.3328 (2.4364)	Entropy 0.57819 (0.58012)	Top-1 acc 69.531 (65.225)	Top-5 acc 86.719 (84.806)	lr 0.00423
Train [88][1990/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.023)	Loss 2.6327 (2.4369)	Entropy 0.57796 (0.58011)	Top-1 acc 59.766 (65.214)	Top-5 acc 83.984 (84.798)	lr 0.00423
Train [88][2000/3239]	Time 0.237 (0.538)	Data Time 0.001 (0.023)	Loss 2.2826 (2.4367)	Entropy 0.57812 (0.58010)	Top-1 acc 70.703 (65.224)	Top-5 acc 89.062 (84.804)	lr 0.00423
Train [88][2010/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.023)	Loss 2.3994 (2.4366)	Entropy 0.57837 (0.58009)	Top-1 acc 67.969 (65.227)	Top-5 acc 85.547 (84.803)	lr 0.00423
Train [88][2020/3239]	Time 0.336 (0.536)	Data Time 0.001 (0.023)	Loss 2.6303 (2.4368)	Entropy 0.57872 (0.58008)	Top-1 acc 62.500 (65.222)	Top-5 acc 80.078 (84.802)	lr 0.00423
Train [88][2030/3239]	Time 0.236 (0.536)	Data Time 0.001 (0.023)	Loss 2.3503 (2.4369)	Entropy 0.57890 (0.58008)	Top-1 acc 69.141 (65.221)	Top-5 acc 84.375 (84.800)	lr 0.00423
Train [88][2040/3239]	Time 0.228 (0.535)	Data Time 0.001 (0.023)	Loss 2.5112 (2.4370)	Entropy 0.57864 (0.58007)	Top-1 acc 63.672 (65.215)	Top-5 acc 82.812 (84.795)	lr 0.00423
Train [88][2050/3239]	Time 0.240 (0.535)	Data Time 0.002 (0.023)	Loss 2.5515 (2.4371)	Entropy 0.57865 (0.58006)	Top-1 acc 60.938 (65.212)	Top-5 acc 82.812 (84.796)	lr 0.00423
Train [88][2060/3239]	Time 0.269 (0.534)	Data Time 0.001 (0.023)	Loss 2.4501 (2.4371)	Entropy 0.57905 (0.58006)	Top-1 acc 67.969 (65.210)	Top-5 acc 82.031 (84.797)	lr 0.00422
Train [88][2070/3239]	Time 0.234 (0.534)	Data Time 0.001 (0.022)	Loss 2.7194 (2.4373)	Entropy 0.57905 (0.58005)	Top-1 acc 57.812 (65.205)	Top-5 acc 78.516 (84.792)	lr 0.00422
Train [88][2080/3239]	Time 0.239 (0.533)	Data Time 0.001 (0.022)	Loss 2.5918 (2.4373)	Entropy 0.57871 (0.58005)	Top-1 acc 63.281 (65.208)	Top-5 acc 82.422 (84.795)	lr 0.00422
Train [88][2090/3239]	Time 0.231 (0.533)	Data Time 0.001 (0.022)	Loss 2.3604 (2.4374)	Entropy 0.57878 (0.58004)	Top-1 acc 67.578 (65.200)	Top-5 acc 86.719 (84.794)	lr 0.00422
Train [88][2100/3239]	Time 0.228 (0.532)	Data Time 0.001 (0.022)	Loss 2.9742 (2.4378)	Entropy 0.57884 (0.58003)	Top-1 acc 52.734 (65.188)	Top-5 acc 76.172 (84.788)	lr 0.00422
Train [88][2110/3239]	Time 0.330 (0.532)	Data Time 0.001 (0.022)	Loss 2.3628 (2.4377)	Entropy 0.57911 (0.58003)	Top-1 acc 65.625 (65.193)	Top-5 acc 86.719 (84.790)	lr 0.00422
Train [88][2120/3239]	Time 0.240 (0.531)	Data Time 0.001 (0.022)	Loss 2.5144 (2.4373)	Entropy 0.57891 (0.58002)	Top-1 acc 61.719 (65.203)	Top-5 acc 82.031 (84.798)	lr 0.00422
Train [88][2130/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.022)	Loss 2.2189 (2.4373)	Entropy 0.57918 (0.58002)	Top-1 acc 68.750 (65.199)	Top-5 acc 88.281 (84.799)	lr 0.00422
Train [88][2140/3239]	Time 0.234 (0.530)	Data Time 0.001 (0.022)	Loss 2.5730 (2.4372)	Entropy 0.57894 (0.58001)	Top-1 acc 64.453 (65.203)	Top-5 acc 80.859 (84.801)	lr 0.00422
Train [88][2150/3239]	Time 0.229 (0.530)	Data Time 0.001 (0.022)	Loss 2.5338 (2.4375)	Entropy 0.57889 (0.58001)	Top-1 acc 62.500 (65.196)	Top-5 acc 84.766 (84.794)	lr 0.00422
Train [88][2160/3239]	Time 0.250 (0.529)	Data Time 0.001 (0.022)	Loss 2.3474 (2.4374)	Entropy 0.57901 (0.58000)	Top-1 acc 68.359 (65.201)	Top-5 acc 86.328 (84.797)	lr 0.00422
Train [88][2170/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.021)	Loss 2.4931 (2.4373)	Entropy 0.57895 (0.58000)	Top-1 acc 64.453 (65.208)	Top-5 acc 82.812 (84.802)	lr 0.00422
Train [88][2180/3239]	Time 0.339 (0.529)	Data Time 0.001 (0.021)	Loss 2.4286 (2.4371)	Entropy 0.57876 (0.57999)	Top-1 acc 62.109 (65.213)	Top-5 acc 85.156 (84.803)	lr 0.00422
Train [88][2190/3239]	Time 0.231 (0.528)	Data Time 0.001 (0.021)	Loss 2.2932 (2.4369)	Entropy 0.57887 (0.57999)	Top-1 acc 71.484 (65.216)	Top-5 acc 85.938 (84.806)	lr 0.00421
Train [88][2200/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.021)	Loss 2.4243 (2.4370)	Entropy 0.57887 (0.57998)	Top-1 acc 67.969 (65.216)	Top-5 acc 82.812 (84.802)	lr 0.00421
Train [88][2210/3239]	Time 0.237 (0.527)	Data Time 0.002 (0.021)	Loss 2.3451 (2.4369)	Entropy 0.57903 (0.57998)	Top-1 acc 65.625 (65.221)	Top-5 acc 87.891 (84.806)	lr 0.00421
Train [88][2220/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.021)	Loss 2.3279 (2.4370)	Entropy 0.57915 (0.57997)	Top-1 acc 69.141 (65.223)	Top-5 acc 85.156 (84.800)	lr 0.00421
Train [88][2230/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.021)	Loss 2.4807 (2.4371)	Entropy 0.57898 (0.57997)	Top-1 acc 67.578 (65.225)	Top-5 acc 83.203 (84.801)	lr 0.00421
Train [88][2240/3239]	Time 0.234 (0.526)	Data Time 0.001 (0.021)	Loss 2.3722 (2.4370)	Entropy 0.57884 (0.57997)	Top-1 acc 67.188 (65.223)	Top-5 acc 83.984 (84.803)	lr 0.00421
Train [88][2250/3239]	Time 0.239 (0.525)	Data Time 0.001 (0.021)	Loss 2.4043 (2.4370)	Entropy 0.57904 (0.57996)	Top-1 acc 65.234 (65.223)	Top-5 acc 86.719 (84.806)	lr 0.00421
Train [88][2260/3239]	Time 0.229 (0.525)	Data Time 0.001 (0.021)	Loss 2.5906 (2.4373)	Entropy 0.57913 (0.57996)	Top-1 acc 64.844 (65.216)	Top-5 acc 80.078 (84.800)	lr 0.00421
Train [88][2270/3239]	Time 0.337 (0.524)	Data Time 0.001 (0.021)	Loss 2.4419 (2.4375)	Entropy 0.57895 (0.57995)	Top-1 acc 62.109 (65.206)	Top-5 acc 87.109 (84.799)	lr 0.00421
Train [88][2280/3239]	Time 0.235 (0.524)	Data Time 0.001 (0.020)	Loss 2.4033 (2.4377)	Entropy 0.57890 (0.57995)	Top-1 acc 70.703 (65.206)	Top-5 acc 86.719 (84.797)	lr 0.00421
Train [88][2290/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.020)	Loss 2.4439 (2.4375)	Entropy 0.57885 (0.57994)	Top-1 acc 65.234 (65.212)	Top-5 acc 84.766 (84.802)	lr 0.00421
Train [88][2300/3239]	Time 0.241 (0.523)	Data Time 0.002 (0.020)	Loss 2.2669 (2.4374)	Entropy 0.57860 (0.57994)	Top-1 acc 69.531 (65.214)	Top-5 acc 85.938 (84.801)	lr 0.00421
Train [88][2310/3239]	Time 0.239 (0.522)	Data Time 0.002 (0.020)	Loss 2.4685 (2.4372)	Entropy 0.57863 (0.57993)	Top-1 acc 64.453 (65.219)	Top-5 acc 84.766 (84.803)	lr 0.00421
Train [88][2320/3239]	Time 0.243 (0.522)	Data Time 0.002 (0.020)	Loss 2.5155 (2.4370)	Entropy 0.57851 (0.57993)	Top-1 acc 64.453 (65.221)	Top-5 acc 83.984 (84.807)	lr 0.00421
Train [88][2330/3239]	Time 0.240 (0.522)	Data Time 0.002 (0.020)	Loss 2.4568 (2.4369)	Entropy 0.57873 (0.57992)	Top-1 acc 63.672 (65.219)	Top-5 acc 88.281 (84.813)	lr 0.00420
Train [88][2340/3239]	Time 0.343 (0.521)	Data Time 0.001 (0.020)	Loss 2.3221 (2.4367)	Entropy 0.57886 (0.57992)	Top-1 acc 65.234 (65.225)	Top-5 acc 86.719 (84.816)	lr 0.00420
Train [88][2350/3239]	Time 0.242 (0.521)	Data Time 0.001 (0.020)	Loss 2.3384 (2.4367)	Entropy 0.57880 (0.57991)	Top-1 acc 66.797 (65.223)	Top-5 acc 86.328 (84.816)	lr 0.00420
Train [88][2360/3239]	Time 0.438 (0.544)	Data Time 0.005 (0.020)	Loss 2.3915 (2.4365)	Entropy 0.57927 (0.57991)	Top-1 acc 65.625 (65.230)	Top-5 acc 85.156 (84.821)	lr 0.00420
Train [88][2370/3239]	Time 0.225 (0.544)	Data Time 0.002 (0.020)	Loss 2.5157 (2.4367)	Entropy 0.57957 (0.57991)	Top-1 acc 64.844 (65.224)	Top-5 acc 82.812 (84.817)	lr 0.00420
Train [88][2380/3239]	Time 0.245 (0.544)	Data Time 0.002 (0.020)	Loss 2.5136 (2.4366)	Entropy 0.57975 (0.57991)	Top-1 acc 64.453 (65.229)	Top-5 acc 85.547 (84.821)	lr 0.00420
Train [88][2390/3239]	Time 0.235 (0.543)	Data Time 0.001 (0.020)	Loss 2.3619 (2.4367)	Entropy 0.57992 (0.57991)	Top-1 acc 66.797 (65.226)	Top-5 acc 87.891 (84.820)	lr 0.00420
Train [88][2400/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.020)	Loss 2.3757 (2.4368)	Entropy 0.57989 (0.57991)	Top-1 acc 67.969 (65.224)	Top-5 acc 86.328 (84.820)	lr 0.00420
Train [88][2410/3239]	Time 0.234 (0.542)	Data Time 0.002 (0.019)	Loss 2.3918 (2.4368)	Entropy 0.57995 (0.57991)	Top-1 acc 68.750 (65.221)	Top-5 acc 87.891 (84.823)	lr 0.00420
Train [88][2420/3239]	Time 0.228 (0.542)	Data Time 0.001 (0.019)	Loss 2.1788 (2.4365)	Entropy 0.57992 (0.57991)	Top-1 acc 68.750 (65.228)	Top-5 acc 89.062 (84.826)	lr 0.00420
Train [88][2430/3239]	Time 0.342 (0.541)	Data Time 0.001 (0.019)	Loss 2.3537 (2.4362)	Entropy 0.57971 (0.57991)	Top-1 acc 65.625 (65.236)	Top-5 acc 86.719 (84.832)	lr 0.00420
Train [88][2440/3239]	Time 0.245 (0.541)	Data Time 0.001 (0.019)	Loss 2.7608 (2.4366)	Entropy 0.57961 (0.57990)	Top-1 acc 56.250 (65.224)	Top-5 acc 76.953 (84.824)	lr 0.00420
Train [88][2450/3239]	Time 0.227 (0.540)	Data Time 0.001 (0.019)	Loss 2.4407 (2.4365)	Entropy 0.57932 (0.57990)	Top-1 acc 66.797 (65.230)	Top-5 acc 84.375 (84.824)	lr 0.00420
Train [88][2460/3239]	Time 0.226 (0.540)	Data Time 0.001 (0.019)	Loss 2.4378 (2.4366)	Entropy 0.57926 (0.57990)	Top-1 acc 64.844 (65.228)	Top-5 acc 82.812 (84.823)	lr 0.00419
Train [88][2470/3239]	Time 0.238 (0.540)	Data Time 0.001 (0.019)	Loss 2.3557 (2.4365)	Entropy 0.57900 (0.57990)	Top-1 acc 67.969 (65.229)	Top-5 acc 86.719 (84.823)	lr 0.00419
Train [88][2480/3239]	Time 0.237 (0.539)	Data Time 0.001 (0.019)	Loss 2.3661 (2.4366)	Entropy 0.57891 (0.57989)	Top-1 acc 63.672 (65.225)	Top-5 acc 85.938 (84.823)	lr 0.00419
Train [88][2490/3239]	Time 0.243 (0.539)	Data Time 0.001 (0.019)	Loss 2.2095 (2.4364)	Entropy 0.57894 (0.57989)	Top-1 acc 69.531 (65.231)	Top-5 acc 89.844 (84.825)	lr 0.00419
Train [88][2500/3239]	Time 0.336 (0.539)	Data Time 0.001 (0.019)	Loss 2.3088 (2.4363)	Entropy 0.57910 (0.57989)	Top-1 acc 69.531 (65.234)	Top-5 acc 89.062 (84.827)	lr 0.00419
Train [88][2510/3239]	Time 0.227 (0.538)	Data Time 0.001 (0.019)	Loss 2.4293 (2.4361)	Entropy 0.57919 (0.57988)	Top-1 acc 62.109 (65.240)	Top-5 acc 86.719 (84.831)	lr 0.00419
Train [88][2520/3239]	Time 0.240 (0.538)	Data Time 0.001 (0.019)	Loss 2.4554 (2.4362)	Entropy 0.57910 (0.57988)	Top-1 acc 65.625 (65.239)	Top-5 acc 83.594 (84.828)	lr 0.00419
Train [88][2530/3239]	Time 0.224 (0.537)	Data Time 0.001 (0.019)	Loss 2.5495 (2.4366)	Entropy 0.57888 (0.57988)	Top-1 acc 63.672 (65.230)	Top-5 acc 82.812 (84.822)	lr 0.00419
Train [88][2540/3239]	Time 0.234 (0.537)	Data Time 0.001 (0.019)	Loss 2.3585 (2.4365)	Entropy 0.57887 (0.57987)	Top-1 acc 66.016 (65.237)	Top-5 acc 86.719 (84.825)	lr 0.00419
Train [88][2550/3239]	Time 0.245 (0.536)	Data Time 0.001 (0.019)	Loss 2.3456 (2.4364)	Entropy 0.57863 (0.57987)	Top-1 acc 64.453 (65.236)	Top-5 acc 85.156 (84.825)	lr 0.00419
Train [88][2560/3239]	Time 0.243 (0.536)	Data Time 0.001 (0.018)	Loss 2.3978 (2.4365)	Entropy 0.57880 (0.57986)	Top-1 acc 67.578 (65.234)	Top-5 acc 82.812 (84.822)	lr 0.00419
Train [88][2570/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.018)	Loss 2.8555 (2.4369)	Entropy 0.57831 (0.57986)	Top-1 acc 55.859 (65.224)	Top-5 acc 75.391 (84.816)	lr 0.00419
Train [88][2580/3239]	Time 0.248 (0.535)	Data Time 0.001 (0.018)	Loss 2.2958 (2.4368)	Entropy 0.57810 (0.57985)	Top-1 acc 68.359 (65.224)	Top-5 acc 89.844 (84.817)	lr 0.00419
Train [88][2590/3239]	Time 0.232 (0.535)	Data Time 0.001 (0.018)	Loss 2.4527 (2.4368)	Entropy 0.57812 (0.57985)	Top-1 acc 64.062 (65.224)	Top-5 acc 83.203 (84.817)	lr 0.00418
Train [88][2600/3239]	Time 0.344 (0.535)	Data Time 0.002 (0.018)	Loss 2.5582 (2.4370)	Entropy 0.57790 (0.57984)	Top-1 acc 64.453 (65.224)	Top-5 acc 83.984 (84.815)	lr 0.00418
Train [88][2610/3239]	Time 0.235 (0.535)	Data Time 0.001 (0.018)	Loss 2.2709 (2.4370)	Entropy 0.57806 (0.57983)	Top-1 acc 66.797 (65.225)	Top-5 acc 89.844 (84.818)	lr 0.00418
Train [88][2620/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.018)	Loss 2.6575 (2.4371)	Entropy 0.57824 (0.57982)	Top-1 acc 61.328 (65.229)	Top-5 acc 78.906 (84.815)	lr 0.00418
Train [88][2630/3239]	Time 0.230 (0.534)	Data Time 0.001 (0.018)	Loss 2.8774 (2.4372)	Entropy 0.57806 (0.57982)	Top-1 acc 53.906 (65.225)	Top-5 acc 78.516 (84.812)	lr 0.00418
Train [88][2640/3239]	Time 0.232 (0.534)	Data Time 0.001 (0.018)	Loss 2.3305 (2.4373)	Entropy 0.57841 (0.57981)	Top-1 acc 66.406 (65.224)	Top-5 acc 84.766 (84.810)	lr 0.00418
Train [88][2650/3239]	Time 0.230 (0.534)	Data Time 0.001 (0.018)	Loss 2.4004 (2.4373)	Entropy 0.57823 (0.57981)	Top-1 acc 68.359 (65.222)	Top-5 acc 84.766 (84.807)	lr 0.00418
Train [88][2660/3239]	Time 0.338 (0.533)	Data Time 0.001 (0.018)	Loss 2.4413 (2.4374)	Entropy 0.57810 (0.57980)	Top-1 acc 66.797 (65.218)	Top-5 acc 85.938 (84.806)	lr 0.00418
Train [88][2670/3239]	Time 0.241 (0.533)	Data Time 0.001 (0.018)	Loss 2.3735 (2.4376)	Entropy 0.57805 (0.57979)	Top-1 acc 69.141 (65.218)	Top-5 acc 87.109 (84.805)	lr 0.00418
Train [88][2680/3239]	Time 0.229 (0.532)	Data Time 0.001 (0.018)	Loss 2.5193 (2.4377)	Entropy 0.57813 (0.57979)	Top-1 acc 61.328 (65.213)	Top-5 acc 83.984 (84.802)	lr 0.00418
Train [88][2690/3239]	Time 0.246 (0.532)	Data Time 0.001 (0.018)	Loss 2.4382 (2.4378)	Entropy 0.57815 (0.57978)	Top-1 acc 64.453 (65.212)	Top-5 acc 85.547 (84.802)	lr 0.00418
Train [88][2700/3239]	Time 0.270 (0.532)	Data Time 0.001 (0.018)	Loss 2.5615 (2.4376)	Entropy 0.57787 (0.57978)	Top-1 acc 62.109 (65.217)	Top-5 acc 83.984 (84.805)	lr 0.00418
Train [88][2710/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.018)	Loss 2.2282 (2.4374)	Entropy 0.57807 (0.57977)	Top-1 acc 69.922 (65.222)	Top-5 acc 87.891 (84.809)	lr 0.00418
Train [88][2720/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.017)	Loss 2.6381 (2.4375)	Entropy 0.57865 (0.57976)	Top-1 acc 60.547 (65.222)	Top-5 acc 80.859 (84.807)	lr 0.00417
Train [88][2730/3239]	Time 0.342 (0.530)	Data Time 0.001 (0.017)	Loss 2.5491 (2.4377)	Entropy 0.57846 (0.57976)	Top-1 acc 58.984 (65.218)	Top-5 acc 80.859 (84.805)	lr 0.00417
Train [88][2740/3239]	Time 0.239 (0.530)	Data Time 0.001 (0.017)	Loss 2.2277 (2.4375)	Entropy 0.57826 (0.57975)	Top-1 acc 71.484 (65.224)	Top-5 acc 89.062 (84.809)	lr 0.00417
Train [88][2750/3239]	Time 0.241 (0.530)	Data Time 0.001 (0.017)	Loss 2.4056 (2.4376)	Entropy 0.57843 (0.57975)	Top-1 acc 63.672 (65.223)	Top-5 acc 86.328 (84.808)	lr 0.00417
Train [88][2760/3239]	Time 0.226 (0.531)	Data Time 0.001 (0.017)	Loss 2.6211 (2.4376)	Entropy 0.57863 (0.57974)	Top-1 acc 58.984 (65.222)	Top-5 acc 84.766 (84.807)	lr 0.00417
Train [88][2770/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.017)	Loss 2.2800 (2.4374)	Entropy 0.57878 (0.57974)	Top-1 acc 67.188 (65.229)	Top-5 acc 87.500 (84.812)	lr 0.00417
Train [88][2780/3239]	Time 0.243 (0.530)	Data Time 0.001 (0.017)	Loss 2.3791 (2.4374)	Entropy 0.57873 (0.57974)	Top-1 acc 66.797 (65.227)	Top-5 acc 84.766 (84.815)	lr 0.00417
Train [88][2790/3239]	Time 0.259 (0.529)	Data Time 0.002 (0.017)	Loss 2.3718 (2.4373)	Entropy 0.57878 (0.57973)	Top-1 acc 66.016 (65.229)	Top-5 acc 86.719 (84.816)	lr 0.00417
Train [88][2800/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.017)	Loss 2.5811 (2.4374)	Entropy 0.57900 (0.57973)	Top-1 acc 61.719 (65.229)	Top-5 acc 84.766 (84.815)	lr 0.00417
Train [88][2810/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.017)	Loss 2.3985 (2.4375)	Entropy 0.57882 (0.57973)	Top-1 acc 65.625 (65.227)	Top-5 acc 86.328 (84.814)	lr 0.00417
Train [88][2820/3239]	Time 0.349 (0.529)	Data Time 0.001 (0.017)	Loss 2.3124 (2.4379)	Entropy 0.57878 (0.57972)	Top-1 acc 68.359 (65.214)	Top-5 acc 87.109 (84.809)	lr 0.00417
Train [88][2830/3239]	Time 0.240 (0.528)	Data Time 0.001 (0.017)	Loss 2.2110 (2.4380)	Entropy 0.57840 (0.57972)	Top-1 acc 72.266 (65.214)	Top-5 acc 88.281 (84.810)	lr 0.00417
Train [88][2840/3239]	Time 0.247 (0.528)	Data Time 0.001 (0.017)	Loss 2.4044 (2.4382)	Entropy 0.57834 (0.57971)	Top-1 acc 67.188 (65.211)	Top-5 acc 85.938 (84.807)	lr 0.00417
Train [88][2850/3239]	Time 0.254 (0.528)	Data Time 0.002 (0.017)	Loss 2.6851 (2.4383)	Entropy 0.57817 (0.57971)	Top-1 acc 58.984 (65.208)	Top-5 acc 78.906 (84.805)	lr 0.00417
Train [88][2860/3239]	Time 0.258 (0.527)	Data Time 0.001 (0.017)	Loss 2.4193 (2.4387)	Entropy 0.57823 (0.57970)	Top-1 acc 69.141 (65.198)	Top-5 acc 83.203 (84.799)	lr 0.00416
Train [88][2870/3239]	Time 0.259 (0.527)	Data Time 0.001 (0.017)	Loss 2.3307 (2.4386)	Entropy 0.57825 (0.57970)	Top-1 acc 68.750 (65.199)	Top-5 acc 85.547 (84.799)	lr 0.00416
Train [88][2880/3239]	Time 0.291 (0.527)	Data Time 0.001 (0.017)	Loss 2.3666 (2.4387)	Entropy 0.57817 (0.57969)	Top-1 acc 64.453 (65.197)	Top-5 acc 85.547 (84.800)	lr 0.00416
Train [88][2890/3239]	Time 0.364 (0.527)	Data Time 0.001 (0.017)	Loss 2.4526 (2.4386)	Entropy 0.57793 (0.57969)	Top-1 acc 67.578 (65.203)	Top-5 acc 83.203 (84.801)	lr 0.00416
Train [88][2900/3239]	Time 0.260 (0.526)	Data Time 0.001 (0.017)	Loss 2.6434 (2.4384)	Entropy 0.57784 (0.57968)	Top-1 acc 59.766 (65.206)	Top-5 acc 80.078 (84.804)	lr 0.00416
Train [88][2910/3239]	Time 0.263 (0.526)	Data Time 0.001 (0.016)	Loss 2.5039 (2.4388)	Entropy 0.57795 (0.57968)	Top-1 acc 66.797 (65.196)	Top-5 acc 83.984 (84.797)	lr 0.00416
Train [88][2920/3239]	Time 0.262 (0.526)	Data Time 0.002 (0.016)	Loss 2.4245 (2.4388)	Entropy 0.57796 (0.57967)	Top-1 acc 66.016 (65.196)	Top-5 acc 87.500 (84.800)	lr 0.00416
Train [88][2930/3239]	Time 0.242 (0.526)	Data Time 0.001 (0.016)	Loss 2.2684 (2.4385)	Entropy 0.57802 (0.57966)	Top-1 acc 69.922 (65.204)	Top-5 acc 86.328 (84.802)	lr 0.00416
Train [88][2940/3239]	Time 0.294 (0.526)	Data Time 0.002 (0.016)	Loss 2.2580 (2.4385)	Entropy 0.57822 (0.57966)	Top-1 acc 70.703 (65.206)	Top-5 acc 88.281 (84.802)	lr 0.00416
Train [88][2950/3239]	Time 0.244 (0.525)	Data Time 0.001 (0.016)	Loss 2.5632 (2.4385)	Entropy 0.57804 (0.57965)	Top-1 acc 64.844 (65.205)	Top-5 acc 80.859 (84.801)	lr 0.00416
Train [88][2960/3239]	Time 0.265 (0.525)	Data Time 0.002 (0.016)	Loss 2.2135 (2.4384)	Entropy 0.57780 (0.57965)	Top-1 acc 71.484 (65.208)	Top-5 acc 87.891 (84.802)	lr 0.00416
Train [88][2970/3239]	Time 0.265 (0.525)	Data Time 0.001 (0.016)	Loss 2.4397 (2.4383)	Entropy 0.57816 (0.57964)	Top-1 acc 65.234 (65.211)	Top-5 acc 84.375 (84.804)	lr 0.00416
Train [88][2980/3239]	Time 0.390 (0.525)	Data Time 0.003 (0.016)	Loss 2.3584 (2.4383)	Entropy 0.57812 (0.57964)	Top-1 acc 69.922 (65.208)	Top-5 acc 85.156 (84.804)	lr 0.00416
Train [88][2990/3239]	Time 0.251 (0.524)	Data Time 0.001 (0.016)	Loss 2.4554 (2.4384)	Entropy 0.57803 (0.57963)	Top-1 acc 65.234 (65.204)	Top-5 acc 85.156 (84.801)	lr 0.00415
Train [88][3000/3239]	Time 0.238 (0.524)	Data Time 0.001 (0.016)	Loss 2.4654 (2.4384)	Entropy 0.57796 (0.57963)	Top-1 acc 63.281 (65.200)	Top-5 acc 84.375 (84.801)	lr 0.00415
Train [88][3010/3239]	Time 0.296 (0.524)	Data Time 0.001 (0.016)	Loss 2.3206 (2.4385)	Entropy 0.57826 (0.57962)	Top-1 acc 66.797 (65.197)	Top-5 acc 87.891 (84.800)	lr 0.00415
Train [88][3020/3239]	Time 0.321 (0.543)	Data Time 0.002 (0.016)	Loss 2.5123 (2.4386)	Entropy 0.57840 (0.57962)	Top-1 acc 64.062 (65.196)	Top-5 acc 83.203 (84.795)	lr 0.00415
Train [88][3030/3239]	Time 0.278 (0.543)	Data Time 0.003 (0.016)	Loss 2.3875 (2.4386)	Entropy 0.57826 (0.57961)	Top-1 acc 69.531 (65.200)	Top-5 acc 85.156 (84.796)	lr 0.00415
Train [88][3040/3239]	Time 0.238 (0.542)	Data Time 0.001 (0.016)	Loss 2.5319 (2.4388)	Entropy 0.57855 (0.57961)	Top-1 acc 62.109 (65.195)	Top-5 acc 84.375 (84.790)	lr 0.00415
Train [88][3050/3239]	Time 0.377 (0.542)	Data Time 0.001 (0.016)	Loss 2.4981 (2.4388)	Entropy 0.57867 (0.57961)	Top-1 acc 66.797 (65.195)	Top-5 acc 83.203 (84.792)	lr 0.00415
Train [88][3060/3239]	Time 0.252 (0.542)	Data Time 0.001 (0.016)	Loss 2.4504 (2.4387)	Entropy 0.57871 (0.57960)	Top-1 acc 64.453 (65.199)	Top-5 acc 82.422 (84.795)	lr 0.00415
Train [88][3070/3239]	Time 0.240 (0.541)	Data Time 0.001 (0.016)	Loss 2.5043 (2.4388)	Entropy 0.57880 (0.57960)	Top-1 acc 62.109 (65.194)	Top-5 acc 81.641 (84.792)	lr 0.00415
Train [88][3080/3239]	Time 0.280 (0.541)	Data Time 0.032 (0.016)	Loss 2.3332 (2.4388)	Entropy 0.57885 (0.57960)	Top-1 acc 66.797 (65.193)	Top-5 acc 84.375 (84.792)	lr 0.00415
Train [88][3090/3239]	Time 0.245 (0.541)	Data Time 0.001 (0.016)	Loss 2.5009 (2.4387)	Entropy 0.57918 (0.57960)	Top-1 acc 63.281 (65.198)	Top-5 acc 84.375 (84.793)	lr 0.00415
Train [88][3100/3239]	Time 0.245 (0.541)	Data Time 0.001 (0.016)	Loss 2.4966 (2.4388)	Entropy 0.57917 (0.57959)	Top-1 acc 61.719 (65.193)	Top-5 acc 83.984 (84.791)	lr 0.00415
Train [88][3110/3239]	Time 0.335 (0.540)	Data Time 0.001 (0.016)	Loss 2.6144 (2.4389)	Entropy 0.57933 (0.57959)	Top-1 acc 63.281 (65.191)	Top-5 acc 83.594 (84.792)	lr 0.00415
Train [88][3120/3239]	Time 0.259 (0.540)	Data Time 0.001 (0.016)	Loss 2.4227 (2.4388)	Entropy 0.57932 (0.57959)	Top-1 acc 67.188 (65.193)	Top-5 acc 83.984 (84.795)	lr 0.00414
Train [88][3130/3239]	Time 0.254 (0.540)	Data Time 0.001 (0.016)	Loss 2.6917 (2.4387)	Entropy 0.57939 (0.57959)	Top-1 acc 55.078 (65.193)	Top-5 acc 80.078 (84.797)	lr 0.00414
Train [88][3140/3239]	Time 0.284 (0.540)	Data Time 0.001 (0.016)	Loss 2.2907 (2.4386)	Entropy 0.57945 (0.57959)	Top-1 acc 68.750 (65.194)	Top-5 acc 86.328 (84.798)	lr 0.00414
Train [88][3150/3239]	Time 0.257 (0.539)	Data Time 0.001 (0.016)	Loss 2.3347 (2.4385)	Entropy 0.57978 (0.57959)	Top-1 acc 67.578 (65.198)	Top-5 acc 86.719 (84.800)	lr 0.00414
Train [88][3160/3239]	Time 0.266 (0.539)	Data Time 0.001 (0.016)	Loss 2.4692 (2.4385)	Entropy 0.57966 (0.57959)	Top-1 acc 63.672 (65.199)	Top-5 acc 84.375 (84.800)	lr 0.00414
Train [88][3170/3239]	Time 0.271 (0.539)	Data Time 0.001 (0.016)	Loss 2.4792 (2.4386)	Entropy 0.57968 (0.57959)	Top-1 acc 60.547 (65.191)	Top-5 acc 84.766 (84.801)	lr 0.00414
Train [88][3180/3239]	Time 0.241 (0.539)	Data Time 0.000 (0.016)	Loss 2.5816 (2.4387)	Entropy 0.57948 (0.57959)	Top-1 acc 67.188 (65.189)	Top-5 acc 79.688 (84.801)	lr 0.00414
Train [88][3190/3239]	Time 0.238 (0.539)	Data Time 0.000 (0.016)	Loss 2.4654 (2.4387)	Entropy 0.57913 (0.57959)	Top-1 acc 66.797 (65.191)	Top-5 acc 82.812 (84.802)	lr 0.00414
Train [88][3200/3239]	Time 0.272 (0.538)	Data Time 0.000 (0.016)	Loss 2.3839 (2.4388)	Entropy 0.57946 (0.57959)	Top-1 acc 67.578 (65.189)	Top-5 acc 85.547 (84.799)	lr 0.00414
Train [88][3210/3239]	Time 0.344 (0.538)	Data Time 0.000 (0.015)	Loss 2.4603 (2.4389)	Entropy 0.57930 (0.57959)	Top-1 acc 63.281 (65.190)	Top-5 acc 82.422 (84.798)	lr 0.00414
Train [88][3220/3239]	Time 0.227 (0.538)	Data Time 0.000 (0.015)	Loss 2.4632 (2.4390)	Entropy 0.57908 (0.57959)	Top-1 acc 62.891 (65.184)	Top-5 acc 85.547 (84.797)	lr 0.00414
Train [88][3230/3239]	Time 0.239 (0.537)	Data Time 0.000 (0.015)	Loss 2.4239 (2.4392)	Entropy 0.57859 (0.57959)	Top-1 acc 65.234 (65.172)	Top-5 acc 83.594 (84.792)	lr 0.00414
Train [88][3239/3239]	Time 0.981 (0.537)	Data Time 0.000 (0.015)	Loss 2.3598 (2.4390)	Entropy 0.57878 (0.57958)	Top-1 acc 69.136 (65.179)	Top-5 acc 85.185 (84.796)	lr 0.00414
==========Valid [88/120]	loss 1.249	top-1 acc 71.312 (71.312)	top-5 acc 89.668	Train top-1 65.179	top-5 84.796	Entropy 0.57878	Latency-None: 0.000ms	Flops: 539.00M
Train [89][0/3239]	Time 38.481 (38.481)	Data Time 37.180 (37.180)	Loss 2.2464 (2.2464)	Entropy 0.57882 (0.57882)	Top-1 acc 72.656 (72.656)	Top-5 acc 86.328 (86.328)	lr 0.00414
Train [89][10/3239]	Time 0.231 (4.047)	Data Time 0.001 (3.382)	Loss 2.3015 (2.3194)	Entropy 0.57903 (0.57883)	Top-1 acc 70.312 (68.714)	Top-5 acc 86.328 (86.683)	lr 0.00414
Train [89][20/3239]	Time 0.233 (2.322)	Data Time 0.001 (1.772)	Loss 2.3452 (2.3572)	Entropy 0.57878 (0.57889)	Top-1 acc 69.531 (67.355)	Top-5 acc 85.938 (86.012)	lr 0.00413
Train [89][30/3239]	Time 0.229 (1.714)	Data Time 0.001 (1.201)	Loss 2.5705 (2.3977)	Entropy 0.57893 (0.57888)	Top-1 acc 60.156 (66.230)	Top-5 acc 82.422 (85.534)	lr 0.00413
Train [89][40/3239]	Time 0.328 (1.400)	Data Time 0.001 (0.909)	Loss 2.4614 (2.3958)	Entropy 0.57882 (0.57887)	Top-1 acc 62.109 (66.225)	Top-5 acc 85.938 (85.595)	lr 0.00413
Train [89][50/3239]	Time 0.231 (1.208)	Data Time 0.001 (0.731)	Loss 2.5676 (2.3959)	Entropy 0.57872 (0.57885)	Top-1 acc 63.281 (66.460)	Top-5 acc 82.812 (85.585)	lr 0.00413
Train [89][60/3239]	Time 0.246 (1.080)	Data Time 0.001 (0.611)	Loss 2.3523 (2.4002)	Entropy 0.57870 (0.57883)	Top-1 acc 66.797 (66.534)	Top-5 acc 86.719 (85.425)	lr 0.00413
Train [89][70/3239]	Time 0.286 (0.993)	Data Time 0.003 (0.525)	Loss 2.5353 (2.4068)	Entropy 0.57881 (0.57881)	Top-1 acc 62.500 (66.423)	Top-5 acc 83.203 (85.239)	lr 0.00413
Train [89][80/3239]	Time 0.220 (0.931)	Data Time 0.001 (0.461)	Loss 2.4986 (2.4116)	Entropy 0.57878 (0.57881)	Top-1 acc 63.281 (66.180)	Top-5 acc 84.766 (85.238)	lr 0.00413
Train [89][90/3239]	Time 0.252 (0.877)	Data Time 0.001 (0.410)	Loss 2.3038 (2.4178)	Entropy 0.57842 (0.57880)	Top-1 acc 69.141 (65.973)	Top-5 acc 87.500 (85.092)	lr 0.00413
Train [89][100/3239]	Time 0.233 (0.831)	Data Time 0.001 (0.370)	Loss 2.3375 (2.4204)	Entropy 0.57858 (0.57877)	Top-1 acc 66.797 (65.768)	Top-5 acc 85.547 (85.056)	lr 0.00413
Train [89][110/3239]	Time 0.330 (0.795)	Data Time 0.001 (0.337)	Loss 2.5137 (2.4161)	Entropy 0.57863 (0.57875)	Top-1 acc 64.453 (65.808)	Top-5 acc 85.156 (85.149)	lr 0.00413
Train [89][120/3239]	Time 0.234 (0.763)	Data Time 0.001 (0.309)	Loss 2.4070 (2.4150)	Entropy 0.57878 (0.57875)	Top-1 acc 68.750 (65.825)	Top-5 acc 85.938 (85.234)	lr 0.00413
Train [89][130/3239]	Time 0.239 (0.735)	Data Time 0.001 (0.285)	Loss 2.3914 (2.4149)	Entropy 0.57882 (0.57875)	Top-1 acc 69.531 (65.828)	Top-5 acc 85.156 (85.258)	lr 0.00413
Train [89][140/3239]	Time 0.241 (0.713)	Data Time 0.001 (0.265)	Loss 2.2526 (2.4128)	Entropy 0.57896 (0.57876)	Top-1 acc 71.094 (65.880)	Top-5 acc 89.062 (85.253)	lr 0.00413
Train [89][150/3239]	Time 0.235 (0.693)	Data Time 0.001 (0.248)	Loss 2.2597 (2.4115)	Entropy 0.57849 (0.57877)	Top-1 acc 68.750 (65.904)	Top-5 acc 87.891 (85.244)	lr 0.00412
Train [89][160/3239]	Time 0.231 (0.675)	Data Time 0.001 (0.233)	Loss 2.2348 (2.4119)	Entropy 0.57889 (0.57876)	Top-1 acc 68.359 (65.785)	Top-5 acc 90.625 (85.258)	lr 0.00412
Train [89][170/3239]	Time 0.233 (0.660)	Data Time 0.001 (0.219)	Loss 2.4783 (2.4122)	Entropy 0.57881 (0.57877)	Top-1 acc 64.062 (65.815)	Top-5 acc 83.594 (85.264)	lr 0.00412
Train [89][180/3239]	Time 0.236 (0.646)	Data Time 0.001 (0.207)	Loss 2.4773 (2.4123)	Entropy 0.57843 (0.57877)	Top-1 acc 63.281 (65.793)	Top-5 acc 82.812 (85.247)	lr 0.00412
Train [89][190/3239]	Time 0.237 (0.633)	Data Time 0.001 (0.196)	Loss 2.3563 (2.4165)	Entropy 0.57856 (0.57876)	Top-1 acc 67.969 (65.711)	Top-5 acc 85.938 (85.185)	lr 0.00412
Train [89][200/3239]	Time 0.332 (0.622)	Data Time 0.001 (0.187)	Loss 2.3486 (2.4161)	Entropy 0.57856 (0.57874)	Top-1 acc 66.797 (65.705)	Top-5 acc 87.891 (85.191)	lr 0.00412
Train [89][210/3239]	Time 0.234 (0.611)	Data Time 0.001 (0.178)	Loss 2.4811 (2.4162)	Entropy 0.57869 (0.57873)	Top-1 acc 64.844 (65.668)	Top-5 acc 82.422 (85.191)	lr 0.00412
Train [89][220/3239]	Time 0.246 (0.602)	Data Time 0.001 (0.170)	Loss 2.5040 (2.4146)	Entropy 0.57900 (0.57874)	Top-1 acc 62.500 (65.705)	Top-5 acc 86.719 (85.255)	lr 0.00412
Train [89][230/3239]	Time 0.234 (0.593)	Data Time 0.001 (0.163)	Loss 2.2937 (2.4136)	Entropy 0.57907 (0.57875)	Top-1 acc 73.828 (65.713)	Top-5 acc 86.719 (85.278)	lr 0.00412
Train [89][240/3239]	Time 0.227 (0.585)	Data Time 0.001 (0.156)	Loss 2.5112 (2.4166)	Entropy 0.57910 (0.57876)	Top-1 acc 60.547 (65.623)	Top-5 acc 83.984 (85.211)	lr 0.00412
Train [89][250/3239]	Time 0.230 (0.577)	Data Time 0.001 (0.150)	Loss 2.4641 (2.4173)	Entropy 0.57897 (0.57877)	Top-1 acc 63.281 (65.583)	Top-5 acc 86.328 (85.198)	lr 0.00412
Train [89][260/3239]	Time 0.228 (0.570)	Data Time 0.001 (0.144)	Loss 2.4250 (2.4180)	Entropy 0.57932 (0.57878)	Top-1 acc 62.500 (65.574)	Top-5 acc 87.109 (85.200)	lr 0.00412
Train [89][270/3239]	Time 0.322 (0.564)	Data Time 0.001 (0.139)	Loss 2.5098 (2.4161)	Entropy 0.57952 (0.57881)	Top-1 acc 60.156 (65.618)	Top-5 acc 84.375 (85.256)	lr 0.00412
Train [89][280/3239]	Time 0.233 (0.558)	Data Time 0.001 (0.134)	Loss 2.6904 (2.4169)	Entropy 0.57954 (0.57883)	Top-1 acc 61.328 (65.651)	Top-5 acc 81.250 (85.231)	lr 0.00411
Train [89][290/3239]	Time 0.226 (0.553)	Data Time 0.001 (0.129)	Loss 2.4071 (2.4170)	Entropy 0.57980 (0.57886)	Top-1 acc 69.531 (65.661)	Top-5 acc 85.156 (85.246)	lr 0.00411
Train [89][300/3239]	Time 0.234 (0.549)	Data Time 0.001 (0.125)	Loss 2.3582 (2.4178)	Entropy 0.57979 (0.57889)	Top-1 acc 68.750 (65.639)	Top-5 acc 86.328 (85.234)	lr 0.00411
Train [89][310/3239]	Time 0.235 (0.544)	Data Time 0.001 (0.121)	Loss 2.3972 (2.4161)	Entropy 0.57989 (0.57892)	Top-1 acc 68.359 (65.720)	Top-5 acc 82.812 (85.267)	lr 0.00411
Train [89][320/3239]	Time 0.232 (0.540)	Data Time 0.001 (0.117)	Loss 2.6572 (2.4161)	Entropy 0.57996 (0.57895)	Top-1 acc 59.766 (65.714)	Top-5 acc 80.859 (85.276)	lr 0.00411
Train [89][330/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.114)	Loss 2.4636 (2.4159)	Entropy 0.57995 (0.57898)	Top-1 acc 60.938 (65.722)	Top-5 acc 83.984 (85.278)	lr 0.00411
Train [89][340/3239]	Time 0.237 (0.532)	Data Time 0.001 (0.111)	Loss 2.5718 (2.4166)	Entropy 0.57988 (0.57901)	Top-1 acc 62.891 (65.729)	Top-5 acc 81.250 (85.239)	lr 0.00411
Train [89][350/3239]	Time 0.307 (0.530)	Data Time 0.002 (0.108)	Loss 2.2207 (2.4166)	Entropy 0.57997 (0.57903)	Top-1 acc 71.094 (65.735)	Top-5 acc 87.500 (85.222)	lr 0.00411
Train [89][360/3239]	Time 0.257 (0.529)	Data Time 0.001 (0.105)	Loss 2.3209 (2.4169)	Entropy 0.58010 (0.57906)	Top-1 acc 67.188 (65.715)	Top-5 acc 86.328 (85.219)	lr 0.00411
Train [89][370/3239]	Time 0.236 (0.526)	Data Time 0.001 (0.102)	Loss 2.5414 (2.4188)	Entropy 0.57975 (0.57909)	Top-1 acc 62.109 (65.673)	Top-5 acc 82.812 (85.175)	lr 0.00411
Train [89][380/3239]	Time 0.229 (0.523)	Data Time 0.001 (0.099)	Loss 2.2569 (2.4184)	Entropy 0.57992 (0.57911)	Top-1 acc 70.703 (65.669)	Top-5 acc 87.109 (85.175)	lr 0.00411
Train [89][390/3239]	Time 0.231 (0.520)	Data Time 0.001 (0.097)	Loss 2.4041 (2.4186)	Entropy 0.57964 (0.57913)	Top-1 acc 62.891 (65.641)	Top-5 acc 85.547 (85.170)	lr 0.00411
Train [89][400/3239]	Time 0.229 (0.517)	Data Time 0.001 (0.094)	Loss 2.4065 (2.4175)	Entropy 0.58009 (0.57914)	Top-1 acc 67.188 (65.658)	Top-5 acc 85.547 (85.201)	lr 0.00411
Train [89][410/3239]	Time 0.241 (0.514)	Data Time 0.001 (0.092)	Loss 2.6077 (2.4186)	Entropy 0.57969 (0.57916)	Top-1 acc 60.547 (65.631)	Top-5 acc 82.812 (85.197)	lr 0.00411
Train [89][420/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.090)	Loss 2.4862 (2.4202)	Entropy 0.57958 (0.57918)	Top-1 acc 66.016 (65.582)	Top-5 acc 85.547 (85.179)	lr 0.00410
Train [89][430/3239]	Time 0.466 (0.630)	Data Time 0.004 (0.088)	Loss 2.3731 (2.4193)	Entropy 0.57939 (0.57918)	Top-1 acc 66.797 (65.584)	Top-5 acc 84.375 (85.204)	lr 0.00410
Train [89][440/3239]	Time 0.237 (0.627)	Data Time 0.002 (0.086)	Loss 2.4690 (2.4193)	Entropy 0.57930 (0.57919)	Top-1 acc 60.938 (65.587)	Top-5 acc 83.984 (85.201)	lr 0.00410
Train [89][450/3239]	Time 0.240 (0.622)	Data Time 0.001 (0.084)	Loss 2.3702 (2.4193)	Entropy 0.57925 (0.57919)	Top-1 acc 67.188 (65.586)	Top-5 acc 84.375 (85.200)	lr 0.00410
Train [89][460/3239]	Time 0.294 (0.619)	Data Time 0.001 (0.082)	Loss 2.2728 (2.4187)	Entropy 0.57923 (0.57919)	Top-1 acc 71.875 (65.601)	Top-5 acc 85.938 (85.209)	lr 0.00410
Train [89][470/3239]	Time 0.236 (0.615)	Data Time 0.001 (0.081)	Loss 2.4876 (2.4189)	Entropy 0.57895 (0.57919)	Top-1 acc 69.141 (65.623)	Top-5 acc 82.031 (85.203)	lr 0.00410
Train [89][480/3239]	Time 0.237 (0.611)	Data Time 0.001 (0.079)	Loss 2.4467 (2.4187)	Entropy 0.57874 (0.57918)	Top-1 acc 65.234 (65.640)	Top-5 acc 83.984 (85.207)	lr 0.00410
Train [89][490/3239]	Time 0.234 (0.608)	Data Time 0.005 (0.077)	Loss 2.3471 (2.4177)	Entropy 0.57878 (0.57917)	Top-1 acc 64.844 (65.639)	Top-5 acc 87.891 (85.237)	lr 0.00410
Train [89][500/3239]	Time 0.262 (0.604)	Data Time 0.002 (0.076)	Loss 2.3764 (2.4184)	Entropy 0.57860 (0.57917)	Top-1 acc 66.797 (65.620)	Top-5 acc 85.547 (85.236)	lr 0.00410
Train [89][510/3239]	Time 0.231 (0.601)	Data Time 0.001 (0.074)	Loss 2.4659 (2.4187)	Entropy 0.57831 (0.57915)	Top-1 acc 61.719 (65.619)	Top-5 acc 85.547 (85.232)	lr 0.00410
Train [89][520/3239]	Time 0.284 (0.598)	Data Time 0.001 (0.073)	Loss 2.4276 (2.4194)	Entropy 0.57825 (0.57914)	Top-1 acc 66.406 (65.605)	Top-5 acc 85.547 (85.209)	lr 0.00410
Train [89][530/3239]	Time 0.267 (0.595)	Data Time 0.001 (0.072)	Loss 2.4682 (2.4194)	Entropy 0.57848 (0.57912)	Top-1 acc 65.625 (65.623)	Top-5 acc 84.375 (85.203)	lr 0.00410
Train [89][540/3239]	Time 0.247 (0.592)	Data Time 0.001 (0.070)	Loss 2.4951 (2.4205)	Entropy 0.57857 (0.57911)	Top-1 acc 64.844 (65.603)	Top-5 acc 82.812 (85.189)	lr 0.00410
Train [89][550/3239]	Time 0.240 (0.589)	Data Time 0.001 (0.069)	Loss 2.4497 (2.4209)	Entropy 0.57853 (0.57910)	Top-1 acc 65.625 (65.592)	Top-5 acc 84.766 (85.179)	lr 0.00409
Train [89][560/3239]	Time 0.243 (0.586)	Data Time 0.001 (0.068)	Loss 2.5047 (2.4214)	Entropy 0.57873 (0.57909)	Top-1 acc 64.844 (65.571)	Top-5 acc 80.078 (85.165)	lr 0.00409
Train [89][570/3239]	Time 0.303 (0.584)	Data Time 0.003 (0.067)	Loss 2.5215 (2.4220)	Entropy 0.57883 (0.57908)	Top-1 acc 60.156 (65.551)	Top-5 acc 84.766 (85.171)	lr 0.00409
Train [89][580/3239]	Time 0.242 (0.582)	Data Time 0.001 (0.066)	Loss 2.5195 (2.4215)	Entropy 0.57898 (0.57908)	Top-1 acc 66.797 (65.566)	Top-5 acc 83.984 (85.180)	lr 0.00409
Train [89][590/3239]	Time 0.362 (0.579)	Data Time 0.001 (0.065)	Loss 2.4516 (2.4219)	Entropy 0.57902 (0.57908)	Top-1 acc 66.406 (65.546)	Top-5 acc 83.984 (85.173)	lr 0.00409
Train [89][600/3239]	Time 0.264 (0.577)	Data Time 0.001 (0.064)	Loss 2.3917 (2.4218)	Entropy 0.57904 (0.57908)	Top-1 acc 63.281 (65.543)	Top-5 acc 85.938 (85.182)	lr 0.00409
Train [89][610/3239]	Time 0.233 (0.574)	Data Time 0.001 (0.063)	Loss 2.3568 (2.4220)	Entropy 0.57915 (0.57908)	Top-1 acc 65.234 (65.531)	Top-5 acc 85.938 (85.188)	lr 0.00409
Train [89][620/3239]	Time 0.234 (0.572)	Data Time 0.001 (0.062)	Loss 2.6330 (2.4230)	Entropy 0.57920 (0.57908)	Top-1 acc 55.078 (65.501)	Top-5 acc 80.859 (85.164)	lr 0.00409
Train [89][630/3239]	Time 0.231 (0.569)	Data Time 0.001 (0.061)	Loss 2.3858 (2.4231)	Entropy 0.57900 (0.57908)	Top-1 acc 65.625 (65.495)	Top-5 acc 84.766 (85.150)	lr 0.00409
Train [89][640/3239]	Time 0.232 (0.567)	Data Time 0.001 (0.060)	Loss 2.4587 (2.4237)	Entropy 0.57847 (0.57908)	Top-1 acc 62.109 (65.474)	Top-5 acc 84.375 (85.136)	lr 0.00409
Train [89][650/3239]	Time 0.221 (0.565)	Data Time 0.001 (0.059)	Loss 2.6394 (2.4240)	Entropy 0.57848 (0.57907)	Top-1 acc 58.984 (65.458)	Top-5 acc 83.984 (85.132)	lr 0.00409
Train [89][660/3239]	Time 0.332 (0.562)	Data Time 0.001 (0.058)	Loss 2.3022 (2.4240)	Entropy 0.57836 (0.57906)	Top-1 acc 71.094 (65.474)	Top-5 acc 87.109 (85.129)	lr 0.00409
Train [89][670/3239]	Time 0.322 (0.561)	Data Time 0.002 (0.057)	Loss 2.2746 (2.4237)	Entropy 0.57836 (0.57905)	Top-1 acc 69.141 (65.486)	Top-5 acc 88.672 (85.134)	lr 0.00409
Train [89][680/3239]	Time 0.281 (0.560)	Data Time 0.001 (0.056)	Loss 2.5484 (2.4238)	Entropy 0.57864 (0.57904)	Top-1 acc 63.281 (65.479)	Top-5 acc 82.422 (85.128)	lr 0.00408
Train [89][690/3239]	Time 0.223 (0.560)	Data Time 0.001 (0.055)	Loss 2.2499 (2.4226)	Entropy 0.57930 (0.57904)	Top-1 acc 70.703 (65.512)	Top-5 acc 88.281 (85.153)	lr 0.00408
Train [89][700/3239]	Time 0.231 (0.558)	Data Time 0.001 (0.055)	Loss 2.2440 (2.4217)	Entropy 0.57950 (0.57905)	Top-1 acc 71.094 (65.537)	Top-5 acc 89.844 (85.163)	lr 0.00408
Train [89][710/3239]	Time 0.234 (0.556)	Data Time 0.001 (0.054)	Loss 2.3973 (2.4219)	Entropy 0.57940 (0.57905)	Top-1 acc 64.453 (65.531)	Top-5 acc 85.547 (85.154)	lr 0.00408
Train [89][720/3239]	Time 0.274 (0.555)	Data Time 0.001 (0.053)	Loss 2.4534 (2.4222)	Entropy 0.57932 (0.57906)	Top-1 acc 64.844 (65.523)	Top-5 acc 83.594 (85.143)	lr 0.00408
Train [89][730/3239]	Time 0.237 (0.554)	Data Time 0.001 (0.053)	Loss 2.5344 (2.4231)	Entropy 0.57934 (0.57906)	Top-1 acc 63.672 (65.503)	Top-5 acc 83.594 (85.125)	lr 0.00408
Train [89][740/3239]	Time 0.236 (0.552)	Data Time 0.005 (0.052)	Loss 2.3784 (2.4228)	Entropy 0.57944 (0.57906)	Top-1 acc 65.234 (65.521)	Top-5 acc 84.766 (85.123)	lr 0.00408
Train [89][750/3239]	Time 0.373 (0.551)	Data Time 0.001 (0.051)	Loss 2.4822 (2.4222)	Entropy 0.57952 (0.57907)	Top-1 acc 64.453 (65.529)	Top-5 acc 85.938 (85.140)	lr 0.00408
Train [89][760/3239]	Time 0.229 (0.549)	Data Time 0.001 (0.051)	Loss 2.5239 (2.4226)	Entropy 0.57892 (0.57907)	Top-1 acc 62.891 (65.519)	Top-5 acc 82.812 (85.126)	lr 0.00408
Train [89][770/3239]	Time 0.223 (0.547)	Data Time 0.001 (0.050)	Loss 2.3643 (2.4232)	Entropy 0.57903 (0.57907)	Top-1 acc 66.797 (65.505)	Top-5 acc 84.766 (85.112)	lr 0.00408
Train [89][780/3239]	Time 0.223 (0.546)	Data Time 0.001 (0.049)	Loss 2.3806 (2.4227)	Entropy 0.57822 (0.57907)	Top-1 acc 66.406 (65.501)	Top-5 acc 83.594 (85.111)	lr 0.00408
Train [89][790/3239]	Time 0.238 (0.544)	Data Time 0.001 (0.049)	Loss 2.4900 (2.4238)	Entropy 0.57798 (0.57906)	Top-1 acc 64.062 (65.472)	Top-5 acc 85.938 (85.095)	lr 0.00408
Train [89][800/3239]	Time 0.259 (0.542)	Data Time 0.001 (0.048)	Loss 2.6440 (2.4238)	Entropy 0.57776 (0.57904)	Top-1 acc 61.719 (65.485)	Top-5 acc 81.250 (85.089)	lr 0.00408
Train [89][810/3239]	Time 0.228 (0.541)	Data Time 0.001 (0.048)	Loss 2.3751 (2.4234)	Entropy 0.57773 (0.57903)	Top-1 acc 62.109 (65.490)	Top-5 acc 86.719 (85.097)	lr 0.00408
Train [89][820/3239]	Time 0.388 (0.539)	Data Time 0.001 (0.047)	Loss 2.4770 (2.4238)	Entropy 0.57757 (0.57901)	Top-1 acc 63.281 (65.484)	Top-5 acc 84.375 (85.095)	lr 0.00407
Train [89][830/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.046)	Loss 2.3002 (2.4229)	Entropy 0.57742 (0.57899)	Top-1 acc 65.234 (65.504)	Top-5 acc 87.500 (85.106)	lr 0.00407
Train [89][840/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.046)	Loss 2.4990 (2.4233)	Entropy 0.57762 (0.57897)	Top-1 acc 66.797 (65.497)	Top-5 acc 80.078 (85.101)	lr 0.00407
Train [89][850/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.045)	Loss 2.4279 (2.4236)	Entropy 0.57763 (0.57896)	Top-1 acc 63.672 (65.482)	Top-5 acc 85.547 (85.091)	lr 0.00407
Train [89][860/3239]	Time 0.222 (0.533)	Data Time 0.001 (0.045)	Loss 2.2752 (2.4228)	Entropy 0.57783 (0.57894)	Top-1 acc 70.312 (65.510)	Top-5 acc 86.719 (85.102)	lr 0.00407
Train [89][870/3239]	Time 0.230 (0.532)	Data Time 0.001 (0.044)	Loss 2.4570 (2.4223)	Entropy 0.57773 (0.57893)	Top-1 acc 63.281 (65.527)	Top-5 acc 86.719 (85.115)	lr 0.00407
Train [89][880/3239]	Time 0.246 (0.531)	Data Time 0.001 (0.044)	Loss 2.4385 (2.4218)	Entropy 0.57792 (0.57891)	Top-1 acc 64.062 (65.537)	Top-5 acc 84.375 (85.115)	lr 0.00407
Train [89][890/3239]	Time 0.241 (0.529)	Data Time 0.001 (0.043)	Loss 2.4736 (2.4227)	Entropy 0.57768 (0.57890)	Top-1 acc 64.453 (65.516)	Top-5 acc 85.547 (85.103)	lr 0.00407
Train [89][900/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.043)	Loss 2.4496 (2.4230)	Entropy 0.57777 (0.57889)	Top-1 acc 61.719 (65.498)	Top-5 acc 87.109 (85.101)	lr 0.00407
Train [89][910/3239]	Time 0.244 (0.527)	Data Time 0.001 (0.042)	Loss 2.5155 (2.4229)	Entropy 0.57782 (0.57888)	Top-1 acc 64.453 (65.498)	Top-5 acc 81.250 (85.098)	lr 0.00407
Train [89][920/3239]	Time 0.255 (0.526)	Data Time 0.001 (0.042)	Loss 2.5725 (2.4228)	Entropy 0.57800 (0.57887)	Top-1 acc 58.984 (65.495)	Top-5 acc 81.250 (85.101)	lr 0.00407
Train [89][930/3239]	Time 0.221 (0.525)	Data Time 0.001 (0.042)	Loss 2.3624 (2.4224)	Entropy 0.57776 (0.57886)	Top-1 acc 66.797 (65.508)	Top-5 acc 85.938 (85.112)	lr 0.00407
Train [89][940/3239]	Time 0.265 (0.524)	Data Time 0.001 (0.041)	Loss 2.3913 (2.4221)	Entropy 0.57787 (0.57885)	Top-1 acc 66.016 (65.513)	Top-5 acc 87.500 (85.123)	lr 0.00407
Train [89][950/3239]	Time 0.286 (0.522)	Data Time 0.002 (0.041)	Loss 2.4739 (2.4225)	Entropy 0.57778 (0.57883)	Top-1 acc 64.453 (65.504)	Top-5 acc 83.594 (85.113)	lr 0.00406
Train [89][960/3239]	Time 0.239 (0.521)	Data Time 0.001 (0.040)	Loss 2.5367 (2.4229)	Entropy 0.57798 (0.57882)	Top-1 acc 62.891 (65.504)	Top-5 acc 83.594 (85.107)	lr 0.00406
Train [89][970/3239]	Time 0.263 (0.520)	Data Time 0.001 (0.040)	Loss 2.3244 (2.4224)	Entropy 0.57780 (0.57881)	Top-1 acc 69.922 (65.522)	Top-5 acc 87.109 (85.110)	lr 0.00406
Train [89][980/3239]	Time 0.374 (0.519)	Data Time 0.001 (0.040)	Loss 2.5676 (2.4224)	Entropy 0.57764 (0.57880)	Top-1 acc 58.984 (65.519)	Top-5 acc 82.422 (85.105)	lr 0.00406
Train [89][990/3239]	Time 0.250 (0.518)	Data Time 0.001 (0.039)	Loss 2.3178 (2.4229)	Entropy 0.57749 (0.57879)	Top-1 acc 68.359 (65.509)	Top-5 acc 84.375 (85.091)	lr 0.00406
Train [89][1000/3239]	Time 0.275 (0.518)	Data Time 0.001 (0.039)	Loss 2.5097 (2.4226)	Entropy 0.57746 (0.57878)	Top-1 acc 64.844 (65.509)	Top-5 acc 82.812 (85.095)	lr 0.00406
Train [89][1010/3239]	Time 0.221 (0.517)	Data Time 0.001 (0.038)	Loss 2.5755 (2.4227)	Entropy 0.57735 (0.57877)	Top-1 acc 63.672 (65.511)	Top-5 acc 80.859 (85.092)	lr 0.00406
Train [89][1020/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.038)	Loss 2.5462 (2.4232)	Entropy 0.57695 (0.57875)	Top-1 acc 57.422 (65.503)	Top-5 acc 83.594 (85.080)	lr 0.00406
Train [89][1030/3239]	Time 0.262 (0.515)	Data Time 0.003 (0.038)	Loss 2.3650 (2.4238)	Entropy 0.57716 (0.57873)	Top-1 acc 64.453 (65.484)	Top-5 acc 87.500 (85.072)	lr 0.00406
Train [89][1040/3239]	Time 0.274 (0.514)	Data Time 0.001 (0.037)	Loss 2.4301 (2.4242)	Entropy 0.57696 (0.57872)	Top-1 acc 59.766 (65.466)	Top-5 acc 85.938 (85.068)	lr 0.00406
Train [89][1050/3239]	Time 0.324 (0.513)	Data Time 0.001 (0.037)	Loss 2.4852 (2.4248)	Entropy 0.57695 (0.57870)	Top-1 acc 67.188 (65.449)	Top-5 acc 82.422 (85.062)	lr 0.00406
Train [89][1060/3239]	Time 0.265 (0.512)	Data Time 0.001 (0.037)	Loss 2.3652 (2.4247)	Entropy 0.57722 (0.57869)	Top-1 acc 67.578 (65.445)	Top-5 acc 84.375 (85.065)	lr 0.00406
Train [89][1070/3239]	Time 0.227 (0.511)	Data Time 0.001 (0.036)	Loss 2.4287 (2.4250)	Entropy 0.57727 (0.57867)	Top-1 acc 64.844 (65.443)	Top-5 acc 85.938 (85.059)	lr 0.00406
Train [89][1080/3239]	Time 0.236 (0.510)	Data Time 0.001 (0.036)	Loss 2.3114 (2.4248)	Entropy 0.57741 (0.57866)	Top-1 acc 71.484 (65.448)	Top-5 acc 87.500 (85.069)	lr 0.00406
Train [89][1090/3239]	Time 0.353 (0.561)	Data Time 0.004 (0.036)	Loss 2.2766 (2.4253)	Entropy 0.57740 (0.57865)	Top-1 acc 68.750 (65.438)	Top-5 acc 89.844 (85.071)	lr 0.00405
Train [89][1100/3239]	Time 0.242 (0.560)	Data Time 0.002 (0.035)	Loss 2.3717 (2.4253)	Entropy 0.57739 (0.57864)	Top-1 acc 67.578 (65.445)	Top-5 acc 85.156 (85.068)	lr 0.00405
Train [89][1110/3239]	Time 0.234 (0.559)	Data Time 0.001 (0.035)	Loss 2.4913 (2.4259)	Entropy 0.57752 (0.57863)	Top-1 acc 65.234 (65.437)	Top-5 acc 82.812 (85.059)	lr 0.00405
Train [89][1120/3239]	Time 0.258 (0.558)	Data Time 0.001 (0.035)	Loss 2.4016 (2.4258)	Entropy 0.57748 (0.57862)	Top-1 acc 68.750 (65.450)	Top-5 acc 83.203 (85.057)	lr 0.00405
Train [89][1130/3239]	Time 0.238 (0.557)	Data Time 0.001 (0.035)	Loss 2.3622 (2.4265)	Entropy 0.57729 (0.57861)	Top-1 acc 66.406 (65.433)	Top-5 acc 84.375 (85.043)	lr 0.00405
Train [89][1140/3239]	Time 0.323 (0.556)	Data Time 0.001 (0.034)	Loss 2.3308 (2.4265)	Entropy 0.57671 (0.57859)	Top-1 acc 64.844 (65.430)	Top-5 acc 84.766 (85.041)	lr 0.00405
Train [89][1150/3239]	Time 0.226 (0.555)	Data Time 0.001 (0.034)	Loss 2.4498 (2.4266)	Entropy 0.57676 (0.57858)	Top-1 acc 65.625 (65.425)	Top-5 acc 84.766 (85.038)	lr 0.00405
Train [89][1160/3239]	Time 0.234 (0.554)	Data Time 0.001 (0.034)	Loss 2.3864 (2.4266)	Entropy 0.57664 (0.57856)	Top-1 acc 69.531 (65.421)	Top-5 acc 85.156 (85.046)	lr 0.00405
Train [89][1170/3239]	Time 0.254 (0.553)	Data Time 0.002 (0.033)	Loss 2.3941 (2.4265)	Entropy 0.57707 (0.57855)	Top-1 acc 64.062 (65.425)	Top-5 acc 85.156 (85.040)	lr 0.00405
Train [89][1180/3239]	Time 0.276 (0.552)	Data Time 0.002 (0.033)	Loss 2.2265 (2.4265)	Entropy 0.57729 (0.57853)	Top-1 acc 70.703 (65.424)	Top-5 acc 89.844 (85.036)	lr 0.00405
Train [89][1190/3239]	Time 0.229 (0.551)	Data Time 0.001 (0.033)	Loss 2.3513 (2.4263)	Entropy 0.57662 (0.57852)	Top-1 acc 71.875 (65.432)	Top-5 acc 85.547 (85.035)	lr 0.00405
Train [89][1200/3239]	Time 0.232 (0.550)	Data Time 0.001 (0.033)	Loss 2.3017 (2.4261)	Entropy 0.57651 (0.57850)	Top-1 acc 66.016 (65.431)	Top-5 acc 87.500 (85.036)	lr 0.00405
Train [89][1210/3239]	Time 0.372 (0.549)	Data Time 0.001 (0.032)	Loss 2.4297 (2.4258)	Entropy 0.57665 (0.57849)	Top-1 acc 66.406 (65.435)	Top-5 acc 83.594 (85.038)	lr 0.00405
Train [89][1220/3239]	Time 0.225 (0.548)	Data Time 0.001 (0.032)	Loss 2.4360 (2.4265)	Entropy 0.57631 (0.57847)	Top-1 acc 66.797 (65.426)	Top-5 acc 85.938 (85.032)	lr 0.00404
Train [89][1230/3239]	Time 0.232 (0.547)	Data Time 0.001 (0.032)	Loss 2.2941 (2.4263)	Entropy 0.57658 (0.57845)	Top-1 acc 69.141 (65.435)	Top-5 acc 87.500 (85.036)	lr 0.00404
Train [89][1240/3239]	Time 0.250 (0.546)	Data Time 0.001 (0.032)	Loss 2.5062 (2.4268)	Entropy 0.57640 (0.57844)	Top-1 acc 63.281 (65.429)	Top-5 acc 82.422 (85.026)	lr 0.00404
Train [89][1250/3239]	Time 0.259 (0.545)	Data Time 0.002 (0.031)	Loss 2.3489 (2.4267)	Entropy 0.57634 (0.57842)	Top-1 acc 69.531 (65.436)	Top-5 acc 84.375 (85.026)	lr 0.00404
Train [89][1260/3239]	Time 0.236 (0.544)	Data Time 0.001 (0.031)	Loss 2.6637 (2.4269)	Entropy 0.57645 (0.57841)	Top-1 acc 58.984 (65.432)	Top-5 acc 81.641 (85.021)	lr 0.00404
Train [89][1270/3239]	Time 0.264 (0.544)	Data Time 0.001 (0.031)	Loss 2.2370 (2.4265)	Entropy 0.57631 (0.57839)	Top-1 acc 71.484 (65.447)	Top-5 acc 89.844 (85.032)	lr 0.00404
Train [89][1280/3239]	Time 0.238 (0.543)	Data Time 0.001 (0.031)	Loss 2.5009 (2.4273)	Entropy 0.57598 (0.57837)	Top-1 acc 60.938 (65.423)	Top-5 acc 85.938 (85.019)	lr 0.00404
Train [89][1290/3239]	Time 0.234 (0.542)	Data Time 0.001 (0.030)	Loss 2.4178 (2.4272)	Entropy 0.57609 (0.57835)	Top-1 acc 66.406 (65.427)	Top-5 acc 86.328 (85.021)	lr 0.00404
Train [89][1300/3239]	Time 0.332 (0.541)	Data Time 0.002 (0.030)	Loss 2.3487 (2.4271)	Entropy 0.57611 (0.57834)	Top-1 acc 68.359 (65.436)	Top-5 acc 83.594 (85.020)	lr 0.00404
Train [89][1310/3239]	Time 0.229 (0.540)	Data Time 0.001 (0.030)	Loss 2.4480 (2.4270)	Entropy 0.57611 (0.57832)	Top-1 acc 65.234 (65.441)	Top-5 acc 84.766 (85.015)	lr 0.00404
Train [89][1320/3239]	Time 0.260 (0.539)	Data Time 0.001 (0.030)	Loss 2.3882 (2.4266)	Entropy 0.57616 (0.57830)	Top-1 acc 66.406 (65.452)	Top-5 acc 86.719 (85.021)	lr 0.00404
Train [89][1330/3239]	Time 0.271 (0.538)	Data Time 0.001 (0.030)	Loss 2.4006 (2.4265)	Entropy 0.57588 (0.57829)	Top-1 acc 69.141 (65.448)	Top-5 acc 87.891 (85.026)	lr 0.00404
Train [89][1340/3239]	Time 0.228 (0.538)	Data Time 0.001 (0.029)	Loss 2.4250 (2.4264)	Entropy 0.57594 (0.57827)	Top-1 acc 66.406 (65.450)	Top-5 acc 84.766 (85.031)	lr 0.00404
Train [89][1350/3239]	Time 0.233 (0.537)	Data Time 0.001 (0.029)	Loss 2.3176 (2.4261)	Entropy 0.57603 (0.57825)	Top-1 acc 65.625 (65.456)	Top-5 acc 87.109 (85.032)	lr 0.00404
Train [89][1360/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.029)	Loss 2.4006 (2.4261)	Entropy 0.57649 (0.57824)	Top-1 acc 62.500 (65.450)	Top-5 acc 88.281 (85.033)	lr 0.00403
Train [89][1370/3239]	Time 0.360 (0.535)	Data Time 0.001 (0.029)	Loss 2.3504 (2.4265)	Entropy 0.57664 (0.57822)	Top-1 acc 66.016 (65.441)	Top-5 acc 86.328 (85.025)	lr 0.00403
Train [89][1380/3239]	Time 0.230 (0.534)	Data Time 0.001 (0.029)	Loss 2.1863 (2.4263)	Entropy 0.57669 (0.57821)	Top-1 acc 73.438 (65.441)	Top-5 acc 90.234 (85.026)	lr 0.00403
Train [89][1390/3239]	Time 0.260 (0.533)	Data Time 0.001 (0.028)	Loss 2.3732 (2.4261)	Entropy 0.57671 (0.57820)	Top-1 acc 68.750 (65.450)	Top-5 acc 88.281 (85.031)	lr 0.00403
Train [89][1400/3239]	Time 0.225 (0.533)	Data Time 0.001 (0.028)	Loss 2.4822 (2.4262)	Entropy 0.57683 (0.57819)	Top-1 acc 66.406 (65.442)	Top-5 acc 83.203 (85.030)	lr 0.00403
Train [89][1410/3239]	Time 0.247 (0.532)	Data Time 0.001 (0.028)	Loss 2.4382 (2.4262)	Entropy 0.57666 (0.57818)	Top-1 acc 64.453 (65.435)	Top-5 acc 85.156 (85.037)	lr 0.00403
Train [89][1420/3239]	Time 0.277 (0.531)	Data Time 0.001 (0.028)	Loss 2.5553 (2.4264)	Entropy 0.57620 (0.57817)	Top-1 acc 67.969 (65.438)	Top-5 acc 84.375 (85.033)	lr 0.00403
Train [89][1430/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.028)	Loss 2.3682 (2.4263)	Entropy 0.57633 (0.57816)	Top-1 acc 64.844 (65.438)	Top-5 acc 86.328 (85.037)	lr 0.00403
Train [89][1440/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.027)	Loss 2.6957 (2.4264)	Entropy 0.57637 (0.57814)	Top-1 acc 60.156 (65.431)	Top-5 acc 80.078 (85.037)	lr 0.00403
Train [89][1450/3239]	Time 0.234 (0.529)	Data Time 0.001 (0.027)	Loss 2.3649 (2.4264)	Entropy 0.57617 (0.57813)	Top-1 acc 67.188 (65.437)	Top-5 acc 85.938 (85.041)	lr 0.00403
Train [89][1460/3239]	Time 0.396 (0.528)	Data Time 0.001 (0.027)	Loss 2.9436 (2.4269)	Entropy 0.57632 (0.57812)	Top-1 acc 50.781 (65.424)	Top-5 acc 75.000 (85.032)	lr 0.00403
Train [89][1470/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.027)	Loss 2.6736 (2.4273)	Entropy 0.57622 (0.57810)	Top-1 acc 59.766 (65.409)	Top-5 acc 81.641 (85.027)	lr 0.00403
Train [89][1480/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.027)	Loss 2.4158 (2.4274)	Entropy 0.57591 (0.57809)	Top-1 acc 67.578 (65.408)	Top-5 acc 83.594 (85.021)	lr 0.00403
Train [89][1490/3239]	Time 0.237 (0.526)	Data Time 0.001 (0.027)	Loss 2.4158 (2.4273)	Entropy 0.57600 (0.57808)	Top-1 acc 67.969 (65.404)	Top-5 acc 83.984 (85.019)	lr 0.00402
Train [89][1500/3239]	Time 0.236 (0.525)	Data Time 0.001 (0.026)	Loss 2.5292 (2.4272)	Entropy 0.57582 (0.57806)	Top-1 acc 65.625 (65.411)	Top-5 acc 84.375 (85.016)	lr 0.00402
Train [89][1510/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.026)	Loss 2.4846 (2.4279)	Entropy 0.57583 (0.57805)	Top-1 acc 65.625 (65.394)	Top-5 acc 83.984 (85.009)	lr 0.00402
Train [89][1520/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.026)	Loss 2.5322 (2.4281)	Entropy 0.57568 (0.57803)	Top-1 acc 62.891 (65.395)	Top-5 acc 83.984 (85.003)	lr 0.00402
Train [89][1530/3239]	Time 0.330 (0.523)	Data Time 0.001 (0.026)	Loss 2.3357 (2.4279)	Entropy 0.57581 (0.57802)	Top-1 acc 67.578 (65.398)	Top-5 acc 87.891 (85.007)	lr 0.00402
Train [89][1540/3239]	Time 0.225 (0.522)	Data Time 0.001 (0.026)	Loss 2.2620 (2.4276)	Entropy 0.57596 (0.57800)	Top-1 acc 67.188 (65.405)	Top-5 acc 88.281 (85.007)	lr 0.00402
Train [89][1550/3239]	Time 0.236 (0.522)	Data Time 0.001 (0.026)	Loss 2.3591 (2.4276)	Entropy 0.57605 (0.57799)	Top-1 acc 70.703 (65.403)	Top-5 acc 87.109 (85.005)	lr 0.00402
Train [89][1560/3239]	Time 0.229 (0.521)	Data Time 0.001 (0.025)	Loss 2.4811 (2.4275)	Entropy 0.57606 (0.57798)	Top-1 acc 61.328 (65.404)	Top-5 acc 83.594 (85.006)	lr 0.00402
Train [89][1570/3239]	Time 0.243 (0.520)	Data Time 0.001 (0.025)	Loss 2.4051 (2.4277)	Entropy 0.57610 (0.57797)	Top-1 acc 62.891 (65.400)	Top-5 acc 87.500 (85.003)	lr 0.00402
Train [89][1580/3239]	Time 0.238 (0.520)	Data Time 0.001 (0.025)	Loss 2.3337 (2.4273)	Entropy 0.57611 (0.57795)	Top-1 acc 66.406 (65.410)	Top-5 acc 88.672 (85.014)	lr 0.00402
Train [89][1590/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.025)	Loss 2.2597 (2.4272)	Entropy 0.57599 (0.57794)	Top-1 acc 68.750 (65.411)	Top-5 acc 87.109 (85.014)	lr 0.00402
Train [89][1600/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.025)	Loss 2.4108 (2.4272)	Entropy 0.57591 (0.57793)	Top-1 acc 65.234 (65.407)	Top-5 acc 85.547 (85.017)	lr 0.00402
Train [89][1610/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.025)	Loss 2.4743 (2.4277)	Entropy 0.57623 (0.57792)	Top-1 acc 68.359 (65.401)	Top-5 acc 86.328 (85.006)	lr 0.00402
Train [89][1620/3239]	Time 0.225 (0.517)	Data Time 0.001 (0.025)	Loss 2.3945 (2.4278)	Entropy 0.57631 (0.57791)	Top-1 acc 67.969 (65.395)	Top-5 acc 87.109 (85.008)	lr 0.00401
Train [89][1630/3239]	Time 0.237 (0.517)	Data Time 0.001 (0.024)	Loss 2.3734 (2.4275)	Entropy 0.57608 (0.57790)	Top-1 acc 64.062 (65.410)	Top-5 acc 83.594 (85.013)	lr 0.00401
Train [89][1640/3239]	Time 0.230 (0.516)	Data Time 0.001 (0.024)	Loss 2.4071 (2.4278)	Entropy 0.57579 (0.57788)	Top-1 acc 68.359 (65.400)	Top-5 acc 85.938 (85.009)	lr 0.00401
Train [89][1650/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.024)	Loss 2.4292 (2.4278)	Entropy 0.57559 (0.57787)	Top-1 acc 67.188 (65.406)	Top-5 acc 83.984 (85.015)	lr 0.00401
Train [89][1660/3239]	Time 0.236 (0.515)	Data Time 0.001 (0.024)	Loss 2.4766 (2.4286)	Entropy 0.57544 (0.57786)	Top-1 acc 62.500 (65.383)	Top-5 acc 83.984 (85.000)	lr 0.00401
Train [89][1670/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.024)	Loss 2.6483 (2.4287)	Entropy 0.57526 (0.57784)	Top-1 acc 60.547 (65.381)	Top-5 acc 83.984 (84.998)	lr 0.00401
Train [89][1680/3239]	Time 0.244 (0.514)	Data Time 0.001 (0.024)	Loss 2.4083 (2.4289)	Entropy 0.57476 (0.57783)	Top-1 acc 64.844 (65.377)	Top-5 acc 83.984 (84.996)	lr 0.00401
Train [89][1690/3239]	Time 0.341 (0.513)	Data Time 0.001 (0.024)	Loss 2.4011 (2.4289)	Entropy 0.57469 (0.57781)	Top-1 acc 65.625 (65.370)	Top-5 acc 83.984 (84.995)	lr 0.00401
Train [89][1700/3239]	Time 0.217 (0.513)	Data Time 0.001 (0.023)	Loss 2.4708 (2.4288)	Entropy 0.57454 (0.57779)	Top-1 acc 67.578 (65.374)	Top-5 acc 84.375 (85.000)	lr 0.00401
Train [89][1710/3239]	Time 0.264 (0.512)	Data Time 0.001 (0.023)	Loss 2.3473 (2.4284)	Entropy 0.57422 (0.57777)	Top-1 acc 65.234 (65.381)	Top-5 acc 86.719 (85.004)	lr 0.00401
Train [89][1720/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.023)	Loss 2.4537 (2.4281)	Entropy 0.57423 (0.57775)	Top-1 acc 67.969 (65.391)	Top-5 acc 85.547 (85.005)	lr 0.00401
Train [89][1730/3239]	Time 0.231 (0.511)	Data Time 0.002 (0.023)	Loss 2.4051 (2.4281)	Entropy 0.57430 (0.57773)	Top-1 acc 68.359 (65.397)	Top-5 acc 87.109 (85.003)	lr 0.00401
Train [89][1740/3239]	Time 0.536 (0.543)	Data Time 0.005 (0.023)	Loss 2.3194 (2.4278)	Entropy 0.57434 (0.57771)	Top-1 acc 71.484 (65.410)	Top-5 acc 86.719 (85.012)	lr 0.00401
Train [89][1750/3239]	Time 0.244 (0.544)	Data Time 0.002 (0.023)	Loss 2.2828 (2.4277)	Entropy 0.57436 (0.57769)	Top-1 acc 69.922 (65.414)	Top-5 acc 85.156 (85.013)	lr 0.00401
Train [89][1760/3239]	Time 0.235 (0.543)	Data Time 0.001 (0.023)	Loss 2.4378 (2.4276)	Entropy 0.57421 (0.57767)	Top-1 acc 65.234 (65.418)	Top-5 acc 85.938 (85.013)	lr 0.00400
Train [89][1770/3239]	Time 0.241 (0.542)	Data Time 0.001 (0.023)	Loss 2.3400 (2.4281)	Entropy 0.57428 (0.57765)	Top-1 acc 66.016 (65.405)	Top-5 acc 87.891 (85.002)	lr 0.00400
Train [89][1780/3239]	Time 0.242 (0.542)	Data Time 0.002 (0.023)	Loss 2.6885 (2.4289)	Entropy 0.57418 (0.57763)	Top-1 acc 60.156 (65.396)	Top-5 acc 78.906 (84.987)	lr 0.00400
Train [89][1790/3239]	Time 0.231 (0.541)	Data Time 0.001 (0.022)	Loss 2.3579 (2.4290)	Entropy 0.57422 (0.57761)	Top-1 acc 64.453 (65.395)	Top-5 acc 85.156 (84.984)	lr 0.00400
Train [89][1800/3239]	Time 0.248 (0.540)	Data Time 0.001 (0.022)	Loss 2.4956 (2.4291)	Entropy 0.57404 (0.57759)	Top-1 acc 64.453 (65.389)	Top-5 acc 84.375 (84.983)	lr 0.00400
Train [89][1810/3239]	Time 0.231 (0.540)	Data Time 0.001 (0.022)	Loss 2.1879 (2.4293)	Entropy 0.57392 (0.57757)	Top-1 acc 70.703 (65.386)	Top-5 acc 90.625 (84.979)	lr 0.00400
Train [89][1820/3239]	Time 0.241 (0.539)	Data Time 0.001 (0.022)	Loss 2.2219 (2.4293)	Entropy 0.57407 (0.57755)	Top-1 acc 69.141 (65.384)	Top-5 acc 89.062 (84.982)	lr 0.00400
Train [89][1830/3239]	Time 0.228 (0.538)	Data Time 0.001 (0.022)	Loss 2.4148 (2.4289)	Entropy 0.57387 (0.57754)	Top-1 acc 66.797 (65.394)	Top-5 acc 85.547 (84.989)	lr 0.00400
Train [89][1840/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.022)	Loss 2.5019 (2.4291)	Entropy 0.57377 (0.57752)	Top-1 acc 63.281 (65.390)	Top-5 acc 82.422 (84.987)	lr 0.00400
Train [89][1850/3239]	Time 0.322 (0.537)	Data Time 0.001 (0.022)	Loss 2.5549 (2.4292)	Entropy 0.57332 (0.57749)	Top-1 acc 62.500 (65.388)	Top-5 acc 83.984 (84.984)	lr 0.00400
Train [89][1860/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.022)	Loss 2.3454 (2.4293)	Entropy 0.57338 (0.57747)	Top-1 acc 67.969 (65.387)	Top-5 acc 87.891 (84.985)	lr 0.00400
Train [89][1870/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.022)	Loss 2.3014 (2.4293)	Entropy 0.57322 (0.57745)	Top-1 acc 66.797 (65.386)	Top-5 acc 87.109 (84.985)	lr 0.00400
Train [89][1880/3239]	Time 0.237 (0.535)	Data Time 0.001 (0.021)	Loss 2.4409 (2.4293)	Entropy 0.57321 (0.57743)	Top-1 acc 64.062 (65.380)	Top-5 acc 85.547 (84.987)	lr 0.00400
Train [89][1890/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.021)	Loss 2.5783 (2.4294)	Entropy 0.57275 (0.57740)	Top-1 acc 60.547 (65.371)	Top-5 acc 84.766 (84.989)	lr 0.00399
Train [89][1900/3239]	Time 0.237 (0.534)	Data Time 0.001 (0.021)	Loss 2.2263 (2.4295)	Entropy 0.57288 (0.57738)	Top-1 acc 66.797 (65.367)	Top-5 acc 89.062 (84.985)	lr 0.00399
Train [89][1910/3239]	Time 0.234 (0.534)	Data Time 0.001 (0.021)	Loss 2.3954 (2.4294)	Entropy 0.57292 (0.57736)	Top-1 acc 65.625 (65.368)	Top-5 acc 83.203 (84.987)	lr 0.00399
Train [89][1920/3239]	Time 0.342 (0.533)	Data Time 0.001 (0.021)	Loss 2.3598 (2.4288)	Entropy 0.57317 (0.57733)	Top-1 acc 64.844 (65.383)	Top-5 acc 85.156 (84.995)	lr 0.00399
Train [89][1930/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.021)	Loss 2.4014 (2.4289)	Entropy 0.57351 (0.57731)	Top-1 acc 66.406 (65.383)	Top-5 acc 85.938 (84.994)	lr 0.00399
Train [89][1940/3239]	Time 0.233 (0.532)	Data Time 0.001 (0.021)	Loss 2.3118 (2.4289)	Entropy 0.57337 (0.57729)	Top-1 acc 71.094 (65.383)	Top-5 acc 87.500 (84.993)	lr 0.00399
Train [89][1950/3239]	Time 0.219 (0.531)	Data Time 0.001 (0.021)	Loss 2.3245 (2.4289)	Entropy 0.57323 (0.57727)	Top-1 acc 69.141 (65.384)	Top-5 acc 85.938 (84.995)	lr 0.00399
Train [89][1960/3239]	Time 0.270 (0.531)	Data Time 0.002 (0.021)	Loss 2.5030 (2.4287)	Entropy 0.57349 (0.57725)	Top-1 acc 63.281 (65.387)	Top-5 acc 81.641 (84.999)	lr 0.00399
Train [89][1970/3239]	Time 0.233 (0.531)	Data Time 0.001 (0.021)	Loss 2.4208 (2.4287)	Entropy 0.57372 (0.57723)	Top-1 acc 64.844 (65.383)	Top-5 acc 87.109 (85.001)	lr 0.00399
Train [89][1980/3239]	Time 0.244 (0.530)	Data Time 0.002 (0.020)	Loss 2.3342 (2.4287)	Entropy 0.57406 (0.57722)	Top-1 acc 67.188 (65.385)	Top-5 acc 87.109 (85.002)	lr 0.00399
Train [89][1990/3239]	Time 0.271 (0.530)	Data Time 0.001 (0.020)	Loss 2.0831 (2.4289)	Entropy 0.57395 (0.57720)	Top-1 acc 75.391 (65.382)	Top-5 acc 90.625 (84.996)	lr 0.00399
Train [89][2000/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.020)	Loss 2.2987 (2.4291)	Entropy 0.57424 (0.57718)	Top-1 acc 69.531 (65.382)	Top-5 acc 83.984 (84.993)	lr 0.00399
Train [89][2010/3239]	Time 0.326 (0.529)	Data Time 0.001 (0.020)	Loss 2.4387 (2.4288)	Entropy 0.57424 (0.57717)	Top-1 acc 63.672 (65.391)	Top-5 acc 87.109 (84.997)	lr 0.00399
Train [89][2020/3239]	Time 0.222 (0.528)	Data Time 0.001 (0.020)	Loss 2.5759 (2.4287)	Entropy 0.57428 (0.57716)	Top-1 acc 61.328 (65.392)	Top-5 acc 82.422 (85.002)	lr 0.00399
Train [89][2030/3239]	Time 0.238 (0.528)	Data Time 0.001 (0.020)	Loss 2.5579 (2.4287)	Entropy 0.57435 (0.57714)	Top-1 acc 59.766 (65.392)	Top-5 acc 82.422 (85.005)	lr 0.00398
Train [89][2040/3239]	Time 0.272 (0.527)	Data Time 0.001 (0.020)	Loss 2.5308 (2.4283)	Entropy 0.57447 (0.57713)	Top-1 acc 64.062 (65.400)	Top-5 acc 82.812 (85.010)	lr 0.00398
Train [89][2050/3239]	Time 0.237 (0.527)	Data Time 0.001 (0.020)	Loss 2.3932 (2.4284)	Entropy 0.57449 (0.57712)	Top-1 acc 64.453 (65.400)	Top-5 acc 84.375 (85.007)	lr 0.00398
Train [89][2060/3239]	Time 0.250 (0.526)	Data Time 0.001 (0.020)	Loss 2.3648 (2.4283)	Entropy 0.57459 (0.57710)	Top-1 acc 67.969 (65.403)	Top-5 acc 84.375 (85.009)	lr 0.00398
Train [89][2070/3239]	Time 0.279 (0.526)	Data Time 0.002 (0.020)	Loss 2.4660 (2.4283)	Entropy 0.57438 (0.57709)	Top-1 acc 64.844 (65.404)	Top-5 acc 83.984 (85.010)	lr 0.00398
Train [89][2080/3239]	Time 0.364 (0.526)	Data Time 0.001 (0.020)	Loss 2.4492 (2.4281)	Entropy 0.57423 (0.57708)	Top-1 acc 62.891 (65.404)	Top-5 acc 86.719 (85.016)	lr 0.00398
Train [89][2090/3239]	Time 0.225 (0.525)	Data Time 0.001 (0.019)	Loss 2.6390 (2.4282)	Entropy 0.57431 (0.57706)	Top-1 acc 58.594 (65.395)	Top-5 acc 81.250 (85.015)	lr 0.00398
Train [89][2100/3239]	Time 0.249 (0.525)	Data Time 0.001 (0.019)	Loss 2.5397 (2.4284)	Entropy 0.57419 (0.57705)	Top-1 acc 63.281 (65.394)	Top-5 acc 84.375 (85.009)	lr 0.00398
Train [89][2110/3239]	Time 0.262 (0.524)	Data Time 0.001 (0.019)	Loss 2.6341 (2.4286)	Entropy 0.57404 (0.57704)	Top-1 acc 60.156 (65.389)	Top-5 acc 83.203 (85.006)	lr 0.00398
Train [89][2120/3239]	Time 0.231 (0.524)	Data Time 0.001 (0.019)	Loss 2.5603 (2.4289)	Entropy 0.57435 (0.57702)	Top-1 acc 63.672 (65.389)	Top-5 acc 84.766 (85.002)	lr 0.00398
Train [89][2130/3239]	Time 0.264 (0.523)	Data Time 0.001 (0.019)	Loss 2.4255 (2.4290)	Entropy 0.57422 (0.57701)	Top-1 acc 63.672 (65.389)	Top-5 acc 85.938 (85.002)	lr 0.00398
Train [89][2140/3239]	Time 0.249 (0.523)	Data Time 0.001 (0.019)	Loss 2.2785 (2.4291)	Entropy 0.57401 (0.57700)	Top-1 acc 69.922 (65.390)	Top-5 acc 87.500 (85.000)	lr 0.00398
Train [89][2150/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.019)	Loss 2.5336 (2.4294)	Entropy 0.57379 (0.57698)	Top-1 acc 62.891 (65.380)	Top-5 acc 82.812 (84.996)	lr 0.00398
Train [89][2160/3239]	Time 0.245 (0.522)	Data Time 0.001 (0.019)	Loss 2.2723 (2.4293)	Entropy 0.57368 (0.57697)	Top-1 acc 69.531 (65.382)	Top-5 acc 86.719 (84.996)	lr 0.00398
Train [89][2170/3239]	Time 0.326 (0.522)	Data Time 0.001 (0.019)	Loss 2.2985 (2.4290)	Entropy 0.57344 (0.57695)	Top-1 acc 68.359 (65.393)	Top-5 acc 87.109 (85.002)	lr 0.00397
Train [89][2180/3239]	Time 0.249 (0.522)	Data Time 0.001 (0.020)	Loss 2.5081 (2.4291)	Entropy 0.57348 (0.57694)	Top-1 acc 62.891 (65.387)	Top-5 acc 84.766 (84.999)	lr 0.00397
Train [89][2190/3239]	Time 0.836 (0.522)	Data Time 0.575 (0.020)	Loss 2.6238 (2.4291)	Entropy 0.57355 (0.57692)	Top-1 acc 60.938 (65.389)	Top-5 acc 80.859 (85.002)	lr 0.00397
Train [89][2200/3239]	Time 0.282 (0.524)	Data Time 0.001 (0.022)	Loss 2.5161 (2.4291)	Entropy 0.57357 (0.57691)	Top-1 acc 63.281 (65.387)	Top-5 acc 83.594 (85.003)	lr 0.00397
Train [89][2210/3239]	Time 0.258 (0.525)	Data Time 0.002 (0.024)	Loss 2.3249 (2.4292)	Entropy 0.57397 (0.57689)	Top-1 acc 67.578 (65.384)	Top-5 acc 86.328 (85.003)	lr 0.00397
Train [89][2220/3239]	Time 0.275 (0.525)	Data Time 0.002 (0.023)	Loss 2.4694 (2.4293)	Entropy 0.57379 (0.57688)	Top-1 acc 64.062 (65.380)	Top-5 acc 83.594 (85.001)	lr 0.00397
Train [89][2230/3239]	Time 0.278 (0.526)	Data Time 0.001 (0.024)	Loss 2.5559 (2.4293)	Entropy 0.57362 (0.57686)	Top-1 acc 60.156 (65.378)	Top-5 acc 83.594 (85.003)	lr 0.00397
Train [89][2240/3239]	Time 2.908 (0.526)	Data Time 2.554 (0.025)	Loss 2.6327 (2.4294)	Entropy 0.57368 (0.57685)	Top-1 acc 62.500 (65.376)	Top-5 acc 80.078 (84.999)	lr 0.00397
Train [89][2250/3239]	Time 0.277 (0.526)	Data Time 0.001 (0.025)	Loss 2.4113 (2.4295)	Entropy 0.57357 (0.57683)	Top-1 acc 68.359 (65.375)	Top-5 acc 88.672 (84.999)	lr 0.00397
Train [89][2260/3239]	Time 0.263 (0.526)	Data Time 0.001 (0.026)	Loss 2.4571 (2.4295)	Entropy 0.57373 (0.57682)	Top-1 acc 65.234 (65.376)	Top-5 acc 83.594 (84.999)	lr 0.00397
Train [89][2270/3239]	Time 0.287 (0.526)	Data Time 0.001 (0.026)	Loss 2.4340 (2.4294)	Entropy 0.57367 (0.57681)	Top-1 acc 62.109 (65.372)	Top-5 acc 85.156 (85.000)	lr 0.00397
Train [89][2280/3239]	Time 0.246 (0.526)	Data Time 0.001 (0.026)	Loss 2.3672 (2.4294)	Entropy 0.57337 (0.57679)	Top-1 acc 66.016 (65.372)	Top-5 acc 85.547 (84.997)	lr 0.00397
Train [89][2290/3239]	Time 0.307 (0.526)	Data Time 0.001 (0.026)	Loss 2.4537 (2.4292)	Entropy 0.57315 (0.57678)	Top-1 acc 66.406 (65.380)	Top-5 acc 84.375 (85.002)	lr 0.00397
Train [89][2300/3239]	Time 0.251 (0.525)	Data Time 0.001 (0.026)	Loss 2.5510 (2.4292)	Entropy 0.57327 (0.57676)	Top-1 acc 63.281 (65.379)	Top-5 acc 82.422 (85.002)	lr 0.00396
Train [89][2310/3239]	Time 0.352 (0.525)	Data Time 0.001 (0.025)	Loss 2.3940 (2.4290)	Entropy 0.57341 (0.57675)	Top-1 acc 66.406 (65.382)	Top-5 acc 85.156 (85.001)	lr 0.00396
Train [89][2320/3239]	Time 0.248 (0.525)	Data Time 0.001 (0.025)	Loss 2.5589 (2.4291)	Entropy 0.57374 (0.57673)	Top-1 acc 63.281 (65.384)	Top-5 acc 80.859 (84.999)	lr 0.00396
Train [89][2330/3239]	Time 0.279 (0.526)	Data Time 0.002 (0.026)	Loss 2.3617 (2.4291)	Entropy 0.57377 (0.57672)	Top-1 acc 63.672 (65.384)	Top-5 acc 83.984 (84.999)	lr 0.00396
Train [89][2340/3239]	Time 0.247 (0.525)	Data Time 0.001 (0.026)	Loss 2.5966 (2.4291)	Entropy 0.57397 (0.57671)	Top-1 acc 60.547 (65.383)	Top-5 acc 83.203 (85.000)	lr 0.00396
Train [89][2350/3239]	Time 0.908 (0.525)	Data Time 0.655 (0.026)	Loss 2.3542 (2.4292)	Entropy 0.57393 (0.57670)	Top-1 acc 69.922 (65.383)	Top-5 acc 83.984 (84.997)	lr 0.00396
Train [89][2360/3239]	Time 0.257 (0.528)	Data Time 0.001 (0.030)	Loss 2.4849 (2.4291)	Entropy 0.57425 (0.57668)	Top-1 acc 59.766 (65.383)	Top-5 acc 83.203 (84.996)	lr 0.00396
Train [89][2370/3239]	Time 0.251 (0.528)	Data Time 0.001 (0.029)	Loss 2.3664 (2.4292)	Entropy 0.57426 (0.57667)	Top-1 acc 66.406 (65.381)	Top-5 acc 87.109 (84.995)	lr 0.00396
Train [89][2380/3239]	Time 0.240 (0.527)	Data Time 0.001 (0.029)	Loss 2.5476 (2.4294)	Entropy 0.57411 (0.57666)	Top-1 acc 62.109 (65.378)	Top-5 acc 79.297 (84.992)	lr 0.00396
Train [89][2390/3239]	Time 0.243 (0.529)	Data Time 0.001 (0.032)	Loss 2.4657 (2.4298)	Entropy 0.57396 (0.57665)	Top-1 acc 64.062 (65.370)	Top-5 acc 82.812 (84.985)	lr 0.00396
Train [89][2400/3239]	Time 0.395 (0.552)	Data Time 0.005 (0.032)	Loss 2.3798 (2.4297)	Entropy 0.57397 (0.57664)	Top-1 acc 65.625 (65.371)	Top-5 acc 85.547 (84.987)	lr 0.00396
Train [89][2410/3239]	Time 0.250 (0.551)	Data Time 0.001 (0.032)	Loss 2.3708 (2.4298)	Entropy 0.57391 (0.57663)	Top-1 acc 67.969 (65.367)	Top-5 acc 84.766 (84.985)	lr 0.00396
Train [89][2420/3239]	Time 0.252 (0.551)	Data Time 0.002 (0.031)	Loss 2.2946 (2.4296)	Entropy 0.57418 (0.57662)	Top-1 acc 72.266 (65.376)	Top-5 acc 86.328 (84.992)	lr 0.00396
Train [89][2430/3239]	Time 0.257 (0.550)	Data Time 0.002 (0.031)	Loss 2.3347 (2.4294)	Entropy 0.57380 (0.57661)	Top-1 acc 68.750 (65.381)	Top-5 acc 85.938 (84.994)	lr 0.00396
Train [89][2440/3239]	Time 0.244 (0.550)	Data Time 0.001 (0.031)	Loss 2.3522 (2.4293)	Entropy 0.57371 (0.57660)	Top-1 acc 67.578 (65.382)	Top-5 acc 87.891 (84.997)	lr 0.00395
Train [89][2450/3239]	Time 0.236 (0.549)	Data Time 0.001 (0.031)	Loss 2.3777 (2.4294)	Entropy 0.57356 (0.57659)	Top-1 acc 64.844 (65.378)	Top-5 acc 87.891 (84.993)	lr 0.00395
Train [89][2460/3239]	Time 0.268 (0.549)	Data Time 0.002 (0.031)	Loss 2.4397 (2.4293)	Entropy 0.57359 (0.57657)	Top-1 acc 65.234 (65.385)	Top-5 acc 85.938 (84.997)	lr 0.00395
Train [89][2470/3239]	Time 0.350 (0.549)	Data Time 0.001 (0.031)	Loss 2.4312 (2.4290)	Entropy 0.57386 (0.57656)	Top-1 acc 66.016 (65.391)	Top-5 acc 84.766 (85.001)	lr 0.00395
Train [89][2480/3239]	Time 0.244 (0.548)	Data Time 0.001 (0.031)	Loss 2.3591 (2.4291)	Entropy 0.57395 (0.57655)	Top-1 acc 66.406 (65.388)	Top-5 acc 86.719 (85.000)	lr 0.00395
Train [89][2490/3239]	Time 0.242 (0.548)	Data Time 0.001 (0.031)	Loss 2.4476 (2.4289)	Entropy 0.57398 (0.57654)	Top-1 acc 64.844 (65.394)	Top-5 acc 83.984 (85.002)	lr 0.00395
Train [89][2500/3239]	Time 0.274 (0.548)	Data Time 0.001 (0.030)	Loss 2.3343 (2.4290)	Entropy 0.57404 (0.57653)	Top-1 acc 64.453 (65.394)	Top-5 acc 85.156 (85.002)	lr 0.00395
Train [89][2510/3239]	Time 0.235 (0.548)	Data Time 0.001 (0.031)	Loss 2.5006 (2.4291)	Entropy 0.57411 (0.57652)	Top-1 acc 65.234 (65.390)	Top-5 acc 85.938 (85.001)	lr 0.00395
Train [89][2520/3239]	Time 0.244 (0.548)	Data Time 0.001 (0.031)	Loss 2.5152 (2.4292)	Entropy 0.57399 (0.57651)	Top-1 acc 60.547 (65.387)	Top-5 acc 83.984 (85.001)	lr 0.00395
Train [89][2530/3239]	Time 0.689 (0.548)	Data Time 0.438 (0.032)	Loss 2.3855 (2.4293)	Entropy 0.57391 (0.57650)	Top-1 acc 67.969 (65.381)	Top-5 acc 85.547 (85.001)	lr 0.00395
Train [89][2540/3239]	Time 0.244 (0.550)	Data Time 0.001 (0.034)	Loss 2.3759 (2.4294)	Entropy 0.57401 (0.57649)	Top-1 acc 68.359 (65.381)	Top-5 acc 87.109 (84.997)	lr 0.00395
Train [89][2550/3239]	Time 0.271 (0.549)	Data Time 0.001 (0.034)	Loss 2.4682 (2.4292)	Entropy 0.57402 (0.57648)	Top-1 acc 62.109 (65.384)	Top-5 acc 84.766 (85.003)	lr 0.00395
Train [89][2560/3239]	Time 0.358 (0.550)	Data Time 0.001 (0.035)	Loss 2.4295 (2.4292)	Entropy 0.57363 (0.57647)	Top-1 acc 65.625 (65.383)	Top-5 acc 85.156 (85.004)	lr 0.00395
Train [89][2570/3239]	Time 0.247 (0.552)	Data Time 0.001 (0.037)	Loss 2.5442 (2.4292)	Entropy 0.57338 (0.57646)	Top-1 acc 62.109 (65.382)	Top-5 acc 80.859 (85.003)	lr 0.00394
Train [89][2580/3239]	Time 0.259 (0.552)	Data Time 0.001 (0.037)	Loss 2.4823 (2.4293)	Entropy 0.57342 (0.57645)	Top-1 acc 63.672 (65.382)	Top-5 acc 85.156 (85.001)	lr 0.00394
Train [89][2590/3239]	Time 0.290 (0.553)	Data Time 0.002 (0.038)	Loss 2.3989 (2.4292)	Entropy 0.57352 (0.57644)	Top-1 acc 66.797 (65.386)	Top-5 acc 82.812 (85.002)	lr 0.00394
Train [89][2600/3239]	Time 0.304 (0.555)	Data Time 0.001 (0.041)	Loss 2.2242 (2.4293)	Entropy 0.57363 (0.57643)	Top-1 acc 70.312 (65.388)	Top-5 acc 87.891 (85.002)	lr 0.00394
Train [89][2610/3239]	Time 0.253 (0.555)	Data Time 0.001 (0.041)	Loss 2.2581 (2.4293)	Entropy 0.57352 (0.57641)	Top-1 acc 71.875 (65.386)	Top-5 acc 86.719 (85.000)	lr 0.00394
Train [89][2620/3239]	Time 0.259 (0.554)	Data Time 0.001 (0.040)	Loss 2.5654 (2.4293)	Entropy 0.57347 (0.57640)	Top-1 acc 63.281 (65.391)	Top-5 acc 83.203 (85.000)	lr 0.00394
Train [89][2630/3239]	Time 0.391 (0.554)	Data Time 0.001 (0.041)	Loss 2.4461 (2.4290)	Entropy 0.57350 (0.57639)	Top-1 acc 62.109 (65.394)	Top-5 acc 86.328 (85.008)	lr 0.00394
Train [89][2640/3239]	Time 0.263 (0.554)	Data Time 0.002 (0.041)	Loss 2.4059 (2.4292)	Entropy 0.57332 (0.57638)	Top-1 acc 66.406 (65.391)	Top-5 acc 85.156 (85.001)	lr 0.00394
Train [89][2650/3239]	Time 0.284 (0.554)	Data Time 0.001 (0.040)	Loss 2.4158 (2.4290)	Entropy 0.57310 (0.57637)	Top-1 acc 65.234 (65.394)	Top-5 acc 85.938 (85.003)	lr 0.00394
Train [89][2660/3239]	Time 0.268 (0.554)	Data Time 0.002 (0.040)	Loss 2.4304 (2.4287)	Entropy 0.57313 (0.57636)	Top-1 acc 63.672 (65.400)	Top-5 acc 86.719 (85.010)	lr 0.00394
Train [89][2670/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.040)	Loss 2.3626 (2.4289)	Entropy 0.57317 (0.57634)	Top-1 acc 66.406 (65.395)	Top-5 acc 88.672 (85.010)	lr 0.00394
Train [89][2680/3239]	Time 0.264 (0.553)	Data Time 0.002 (0.040)	Loss 2.5473 (2.4292)	Entropy 0.57318 (0.57633)	Top-1 acc 63.281 (65.387)	Top-5 acc 83.984 (85.009)	lr 0.00394
Train [89][2690/3239]	Time 0.273 (0.552)	Data Time 0.001 (0.040)	Loss 2.4690 (2.4294)	Entropy 0.57305 (0.57632)	Top-1 acc 66.797 (65.384)	Top-5 acc 84.375 (85.005)	lr 0.00394
Train [89][2700/3239]	Time 0.278 (0.553)	Data Time 0.001 (0.041)	Loss 2.4528 (2.4292)	Entropy 0.57314 (0.57631)	Top-1 acc 64.844 (65.389)	Top-5 acc 84.766 (85.009)	lr 0.00394
Train [89][2710/3239]	Time 0.251 (0.553)	Data Time 0.002 (0.041)	Loss 2.4757 (2.4291)	Entropy 0.57295 (0.57630)	Top-1 acc 62.109 (65.394)	Top-5 acc 84.375 (85.011)	lr 0.00393
Train [89][2720/3239]	Time 0.269 (0.553)	Data Time 0.001 (0.041)	Loss 2.4610 (2.4292)	Entropy 0.57295 (0.57628)	Top-1 acc 66.406 (65.394)	Top-5 acc 82.031 (85.006)	lr 0.00393
Train [89][2730/3239]	Time 0.249 (0.556)	Data Time 0.001 (0.044)	Loss 2.3494 (2.4295)	Entropy 0.57299 (0.57627)	Top-1 acc 70.312 (65.390)	Top-5 acc 85.156 (85.000)	lr 0.00393
Train [89][2740/3239]	Time 0.267 (0.555)	Data Time 0.001 (0.044)	Loss 2.3490 (2.4297)	Entropy 0.57317 (0.57626)	Top-1 acc 64.453 (65.384)	Top-5 acc 85.547 (84.995)	lr 0.00393
Train [89][2750/3239]	Time 0.227 (0.555)	Data Time 0.001 (0.044)	Loss 2.2953 (2.4294)	Entropy 0.57332 (0.57625)	Top-1 acc 68.750 (65.390)	Top-5 acc 87.109 (84.999)	lr 0.00393
Train [89][2760/3239]	Time 0.250 (0.557)	Data Time 0.001 (0.047)	Loss 2.5410 (2.4293)	Entropy 0.57376 (0.57624)	Top-1 acc 60.156 (65.391)	Top-5 acc 84.375 (85.000)	lr 0.00393
Train [89][2770/3239]	Time 0.241 (0.557)	Data Time 0.001 (0.047)	Loss 2.4791 (2.4294)	Entropy 0.57320 (0.57623)	Top-1 acc 63.281 (65.389)	Top-5 acc 86.328 (85.002)	lr 0.00393
Train [89][2780/3239]	Time 0.240 (0.556)	Data Time 0.001 (0.046)	Loss 2.2537 (2.4295)	Entropy 0.57319 (0.57622)	Top-1 acc 70.703 (65.386)	Top-5 acc 87.109 (85.002)	lr 0.00393
Train [89][2790/3239]	Time 0.353 (0.558)	Data Time 0.001 (0.048)	Loss 2.5442 (2.4295)	Entropy 0.57302 (0.57621)	Top-1 acc 66.016 (65.390)	Top-5 acc 82.031 (85.005)	lr 0.00393
Train [89][2800/3239]	Time 0.234 (0.558)	Data Time 0.001 (0.049)	Loss 2.5049 (2.4293)	Entropy 0.57289 (0.57620)	Top-1 acc 64.062 (65.395)	Top-5 acc 83.203 (85.010)	lr 0.00393
Train [89][2810/3239]	Time 0.253 (0.558)	Data Time 0.001 (0.048)	Loss 2.3423 (2.4291)	Entropy 0.57283 (0.57618)	Top-1 acc 70.312 (65.401)	Top-5 acc 86.328 (85.011)	lr 0.00393
Train [89][2820/3239]	Time 3.529 (0.559)	Data Time 3.278 (0.050)	Loss 2.3493 (2.4291)	Entropy 0.57267 (0.57617)	Top-1 acc 67.578 (65.401)	Top-5 acc 88.281 (85.009)	lr 0.00393
Train [89][2830/3239]	Time 0.233 (0.559)	Data Time 0.001 (0.050)	Loss 2.3096 (2.4293)	Entropy 0.57275 (0.57616)	Top-1 acc 67.578 (65.400)	Top-5 acc 88.672 (85.006)	lr 0.00393
Train [89][2840/3239]	Time 0.235 (0.559)	Data Time 0.001 (0.051)	Loss 2.3780 (2.4293)	Entropy 0.57294 (0.57615)	Top-1 acc 67.578 (65.400)	Top-5 acc 86.719 (85.007)	lr 0.00392
Train [89][2850/3239]	Time 0.290 (0.559)	Data Time 0.001 (0.051)	Loss 2.4509 (2.4295)	Entropy 0.57338 (0.57614)	Top-1 acc 67.188 (65.395)	Top-5 acc 83.594 (85.005)	lr 0.00392
Train [89][2860/3239]	Time 0.371 (0.559)	Data Time 0.001 (0.051)	Loss 2.8037 (2.4297)	Entropy 0.57322 (0.57613)	Top-1 acc 56.641 (65.390)	Top-5 acc 77.734 (85.000)	lr 0.00392
Train [89][2870/3239]	Time 0.253 (0.561)	Data Time 0.001 (0.053)	Loss 2.4142 (2.4296)	Entropy 0.57311 (0.57612)	Top-1 acc 68.359 (65.392)	Top-5 acc 83.203 (85.000)	lr 0.00392
Train [89][2880/3239]	Time 0.271 (0.560)	Data Time 0.003 (0.053)	Loss 2.4344 (2.4296)	Entropy 0.57282 (0.57611)	Top-1 acc 64.844 (65.392)	Top-5 acc 82.812 (84.997)	lr 0.00392
Train [89][2890/3239]	Time 0.239 (0.560)	Data Time 0.001 (0.053)	Loss 2.4847 (2.4298)	Entropy 0.57297 (0.57610)	Top-1 acc 64.062 (65.387)	Top-5 acc 82.422 (84.993)	lr 0.00392
Train [89][2900/3239]	Time 0.228 (0.562)	Data Time 0.001 (0.055)	Loss 2.4427 (2.4298)	Entropy 0.57314 (0.57609)	Top-1 acc 67.188 (65.389)	Top-5 acc 84.375 (84.996)	lr 0.00392
Train [89][2910/3239]	Time 0.235 (0.561)	Data Time 0.001 (0.054)	Loss 2.5578 (2.4300)	Entropy 0.57329 (0.57608)	Top-1 acc 64.453 (65.386)	Top-5 acc 84.375 (84.991)	lr 0.00392
Train [89][2920/3239]	Time 0.230 (0.561)	Data Time 0.001 (0.054)	Loss 2.1794 (2.4298)	Entropy 0.57318 (0.57607)	Top-1 acc 72.266 (65.394)	Top-5 acc 88.672 (84.995)	lr 0.00392
Train [89][2930/3239]	Time 0.267 (0.563)	Data Time 0.001 (0.057)	Loss 2.5286 (2.4298)	Entropy 0.57297 (0.57606)	Top-1 acc 61.719 (65.393)	Top-5 acc 83.594 (84.992)	lr 0.00392
Train [89][2940/3239]	Time 0.235 (0.563)	Data Time 0.001 (0.057)	Loss 2.4595 (2.4297)	Entropy 0.57281 (0.57604)	Top-1 acc 64.453 (65.395)	Top-5 acc 80.859 (84.992)	lr 0.00392
Train [89][2950/3239]	Time 0.401 (0.564)	Data Time 0.001 (0.058)	Loss 2.6364 (2.4296)	Entropy 0.57289 (0.57603)	Top-1 acc 62.500 (65.399)	Top-5 acc 79.688 (84.993)	lr 0.00392
Train [89][2960/3239]	Time 0.240 (0.565)	Data Time 0.001 (0.059)	Loss 2.6710 (2.4296)	Entropy 0.57286 (0.57602)	Top-1 acc 58.984 (65.399)	Top-5 acc 81.250 (84.993)	lr 0.00392
Train [89][2970/3239]	Time 0.285 (0.564)	Data Time 0.001 (0.059)	Loss 2.4761 (2.4298)	Entropy 0.57276 (0.57601)	Top-1 acc 64.453 (65.395)	Top-5 acc 83.203 (84.989)	lr 0.00392
Train [89][2980/3239]	Time 2.205 (0.564)	Data Time 1.963 (0.059)	Loss 2.6612 (2.4299)	Entropy 0.57294 (0.57600)	Top-1 acc 60.938 (65.390)	Top-5 acc 81.641 (84.987)	lr 0.00391
Train [89][2990/3239]	Time 0.294 (0.564)	Data Time 0.001 (0.059)	Loss 2.3596 (2.4299)	Entropy 0.57278 (0.57599)	Top-1 acc 66.797 (65.389)	Top-5 acc 85.547 (84.985)	lr 0.00391
Train [89][3000/3239]	Time 0.238 (0.565)	Data Time 0.001 (0.060)	Loss 2.3215 (2.4298)	Entropy 0.57294 (0.57598)	Top-1 acc 68.750 (65.391)	Top-5 acc 87.500 (84.987)	lr 0.00391
Train [89][3010/3239]	Time 0.246 (0.565)	Data Time 0.001 (0.060)	Loss 2.4708 (2.4297)	Entropy 0.57285 (0.57597)	Top-1 acc 64.453 (65.393)	Top-5 acc 83.203 (84.989)	lr 0.00391
Train [89][3020/3239]	Time 0.369 (0.565)	Data Time 0.001 (0.060)	Loss 2.4886 (2.4298)	Entropy 0.57241 (0.57596)	Top-1 acc 66.797 (65.391)	Top-5 acc 85.156 (84.985)	lr 0.00391
Train [89][3030/3239]	Time 0.244 (0.566)	Data Time 0.001 (0.062)	Loss 2.6700 (2.4299)	Entropy 0.57262 (0.57595)	Top-1 acc 58.984 (65.383)	Top-5 acc 80.469 (84.984)	lr 0.00391
Train [89][3040/3239]	Time 0.320 (0.566)	Data Time 0.001 (0.062)	Loss 2.8379 (2.4301)	Entropy 0.57237 (0.57594)	Top-1 acc 53.125 (65.375)	Top-5 acc 76.953 (84.981)	lr 0.00391
Train [89][3050/3239]	Time 0.680 (0.583)	Data Time 0.004 (0.061)	Loss 2.4484 (2.4301)	Entropy 0.57223 (0.57592)	Top-1 acc 64.453 (65.379)	Top-5 acc 85.156 (84.979)	lr 0.00391
Train [89][3060/3239]	Time 0.239 (0.583)	Data Time 0.002 (0.061)	Loss 2.3523 (2.4302)	Entropy 0.57252 (0.57591)	Top-1 acc 67.578 (65.379)	Top-5 acc 86.719 (84.979)	lr 0.00391
Train [89][3070/3239]	Time 0.242 (0.583)	Data Time 0.001 (0.061)	Loss 2.4480 (2.4303)	Entropy 0.57265 (0.57590)	Top-1 acc 64.062 (65.381)	Top-5 acc 83.594 (84.976)	lr 0.00391
Train [89][3080/3239]	Time 0.267 (0.582)	Data Time 0.002 (0.061)	Loss 2.3272 (2.4304)	Entropy 0.57276 (0.57589)	Top-1 acc 70.312 (65.379)	Top-5 acc 89.062 (84.974)	lr 0.00391
Train [89][3090/3239]	Time 0.255 (0.582)	Data Time 0.001 (0.061)	Loss 2.4869 (2.4304)	Entropy 0.57312 (0.57588)	Top-1 acc 65.234 (65.379)	Top-5 acc 84.375 (84.973)	lr 0.00391
Train [89][3100/3239]	Time 0.244 (0.581)	Data Time 0.001 (0.060)	Loss 2.4224 (2.4304)	Entropy 0.57288 (0.57587)	Top-1 acc 65.234 (65.378)	Top-5 acc 83.594 (84.974)	lr 0.00391
Train [89][3110/3239]	Time 0.346 (0.581)	Data Time 0.002 (0.060)	Loss 2.4042 (2.4304)	Entropy 0.57296 (0.57586)	Top-1 acc 70.312 (65.380)	Top-5 acc 85.156 (84.976)	lr 0.00391
Train [89][3120/3239]	Time 0.240 (0.580)	Data Time 0.001 (0.060)	Loss 2.4619 (2.4304)	Entropy 0.57283 (0.57585)	Top-1 acc 66.797 (65.378)	Top-5 acc 83.594 (84.974)	lr 0.00390
Train [89][3130/3239]	Time 0.285 (0.580)	Data Time 0.001 (0.060)	Loss 2.3259 (2.4304)	Entropy 0.57276 (0.57584)	Top-1 acc 66.797 (65.379)	Top-5 acc 87.109 (84.974)	lr 0.00390
Train [89][3140/3239]	Time 0.286 (0.580)	Data Time 0.002 (0.060)	Loss 2.4597 (2.4303)	Entropy 0.57283 (0.57583)	Top-1 acc 65.234 (65.380)	Top-5 acc 83.594 (84.976)	lr 0.00390
Train [89][3150/3239]	Time 0.242 (0.580)	Data Time 0.001 (0.060)	Loss 2.6015 (2.4305)	Entropy 0.57231 (0.57582)	Top-1 acc 59.375 (65.374)	Top-5 acc 80.859 (84.972)	lr 0.00390
Train [89][3160/3239]	Time 2.061 (0.581)	Data Time 1.768 (0.062)	Loss 2.2056 (2.4305)	Entropy 0.57231 (0.57581)	Top-1 acc 72.656 (65.374)	Top-5 acc 91.016 (84.972)	lr 0.00390
Train [89][3170/3239]	Time 0.244 (0.584)	Data Time 0.001 (0.064)	Loss 2.2689 (2.4302)	Entropy 0.57252 (0.57580)	Top-1 acc 69.531 (65.382)	Top-5 acc 88.672 (84.978)	lr 0.00390
Train [89][3180/3239]	Time 0.337 (0.583)	Data Time 0.000 (0.064)	Loss 2.2399 (2.4302)	Entropy 0.57219 (0.57579)	Top-1 acc 68.750 (65.381)	Top-5 acc 87.109 (84.979)	lr 0.00390
Train [89][3190/3239]	Time 0.230 (0.589)	Data Time 0.000 (0.070)	Loss 2.3422 (2.4301)	Entropy 0.57231 (0.57578)	Top-1 acc 70.703 (65.382)	Top-5 acc 85.938 (84.983)	lr 0.00390
Train [89][3200/3239]	Time 0.239 (0.588)	Data Time 0.000 (0.070)	Loss 2.2499 (2.4298)	Entropy 0.57162 (0.57577)	Top-1 acc 70.312 (65.388)	Top-5 acc 89.062 (84.989)	lr 0.00390
Train [89][3210/3239]	Time 0.237 (0.589)	Data Time 0.000 (0.071)	Loss 2.4031 (2.4299)	Entropy 0.57123 (0.57576)	Top-1 acc 67.578 (65.384)	Top-5 acc 85.156 (84.987)	lr 0.00390
Train [89][3220/3239]	Time 2.065 (0.591)	Data Time 1.809 (0.073)	Loss 2.4600 (2.4299)	Entropy 0.57125 (0.57574)	Top-1 acc 64.844 (65.383)	Top-5 acc 85.938 (84.988)	lr 0.00390
Train [89][3230/3239]	Time 0.272 (0.593)	Data Time 0.000 (0.075)	Loss 2.2420 (2.4298)	Entropy 0.57070 (0.57573)	Top-1 acc 67.188 (65.384)	Top-5 acc 89.453 (84.990)	lr 0.00390
Train [89][3239/3239]	Time 0.974 (0.593)	Data Time 0.000 (0.075)	Loss 3.0531 (2.4298)	Entropy 0.57058 (0.57571)	Top-1 acc 58.025 (65.389)	Top-5 acc 74.074 (84.989)	lr 0.00390
==========Valid [89/120]	loss 1.237	top-1 acc 71.623 (71.623)	top-5 acc 89.727	Train top-1 65.389	top-5 84.989	Entropy 0.57058	Latency-None: 0.000ms	Flops: 539.00M
Train [90][0/3239]	Time 47.550 (47.550)	Data Time 45.789 (45.789)	Loss 2.5924 (2.5924)	Entropy 0.57071 (0.57071)	Top-1 acc 59.766 (59.766)	Top-5 acc 83.203 (83.203)	lr 0.00390
Train [90][10/3239]	Time 0.343 (4.716)	Data Time 0.001 (4.164)	Loss 2.3172 (2.4725)	Entropy 0.57066 (0.57067)	Top-1 acc 67.578 (63.920)	Top-5 acc 87.109 (83.700)	lr 0.00389
Train [90][20/3239]	Time 0.235 (2.706)	Data Time 0.001 (2.182)	Loss 2.3836 (2.4313)	Entropy 0.57062 (0.57063)	Top-1 acc 65.625 (65.569)	Top-5 acc 85.547 (84.766)	lr 0.00389
Train [90][30/3239]	Time 0.238 (1.969)	Data Time 0.001 (1.479)	Loss 2.5886 (2.4538)	Entropy 0.57079 (0.57066)	Top-1 acc 62.891 (64.869)	Top-5 acc 79.297 (84.173)	lr 0.00389
Train [90][40/3239]	Time 0.248 (1.606)	Data Time 0.002 (1.119)	Loss 2.5643 (2.4658)	Entropy 0.57056 (0.57068)	Top-1 acc 64.844 (64.501)	Top-5 acc 80.469 (84.070)	lr 0.00389
Train [90][50/3239]	Time 0.329 (1.384)	Data Time 0.001 (0.900)	Loss 2.3654 (2.4377)	Entropy 0.57064 (0.57065)	Top-1 acc 67.578 (65.081)	Top-5 acc 86.328 (84.612)	lr 0.00389
Train [90][60/3239]	Time 0.243 (1.230)	Data Time 0.001 (0.752)	Loss 2.4430 (2.4381)	Entropy 0.57071 (0.57066)	Top-1 acc 63.672 (65.100)	Top-5 acc 85.156 (84.657)	lr 0.00389
Train [90][70/3239]	Time 0.262 (1.128)	Data Time 0.001 (0.647)	Loss 2.5180 (2.4356)	Entropy 0.57054 (0.57065)	Top-1 acc 64.453 (65.245)	Top-5 acc 82.031 (84.683)	lr 0.00389
Train [90][80/3239]	Time 0.406 (1.043)	Data Time 0.001 (0.567)	Loss 2.3834 (2.4337)	Entropy 0.57058 (0.57064)	Top-1 acc 69.531 (65.355)	Top-5 acc 83.984 (84.616)	lr 0.00389
Train [90][90/3239]	Time 0.253 (0.977)	Data Time 0.002 (0.505)	Loss 2.2707 (2.4269)	Entropy 0.57029 (0.57062)	Top-1 acc 69.922 (65.591)	Top-5 acc 88.281 (84.748)	lr 0.00389
Train [90][100/3239]	Time 0.257 (0.927)	Data Time 0.001 (0.455)	Loss 2.3716 (2.4288)	Entropy 0.57000 (0.57058)	Top-1 acc 69.141 (65.633)	Top-5 acc 85.547 (84.715)	lr 0.00389
Train [90][110/3239]	Time 0.249 (0.884)	Data Time 0.001 (0.414)	Loss 2.2979 (2.4262)	Entropy 0.56996 (0.57052)	Top-1 acc 70.312 (65.685)	Top-5 acc 85.547 (84.843)	lr 0.00389
Train [90][120/3239]	Time 0.265 (0.847)	Data Time 0.001 (0.380)	Loss 2.3101 (2.4211)	Entropy 0.56991 (0.57047)	Top-1 acc 65.625 (65.767)	Top-5 acc 87.500 (84.959)	lr 0.00389
Train [90][130/3239]	Time 0.244 (0.823)	Data Time 0.001 (0.351)	Loss 2.3410 (2.4179)	Entropy 0.56968 (0.57042)	Top-1 acc 66.016 (65.843)	Top-5 acc 85.156 (85.040)	lr 0.00389
Train [90][140/3239]	Time 0.281 (0.799)	Data Time 0.001 (0.327)	Loss 2.3946 (2.4149)	Entropy 0.56980 (0.57037)	Top-1 acc 64.453 (65.872)	Top-5 acc 85.156 (85.079)	lr 0.00389
Train [90][150/3239]	Time 0.236 (0.774)	Data Time 0.001 (0.305)	Loss 2.3300 (2.4093)	Entropy 0.57010 (0.57034)	Top-1 acc 67.188 (66.008)	Top-5 acc 85.156 (85.185)	lr 0.00388
Train [90][160/3239]	Time 0.318 (0.754)	Data Time 0.001 (0.286)	Loss 2.3362 (2.4094)	Entropy 0.57002 (0.57032)	Top-1 acc 67.969 (65.974)	Top-5 acc 86.719 (85.156)	lr 0.00388
Train [90][170/3239]	Time 0.390 (0.735)	Data Time 0.001 (0.270)	Loss 2.5304 (2.4083)	Entropy 0.57015 (0.57031)	Top-1 acc 61.719 (66.009)	Top-5 acc 87.109 (85.218)	lr 0.00388
Train [90][180/3239]	Time 0.287 (0.718)	Data Time 0.001 (0.255)	Loss 2.4112 (2.4093)	Entropy 0.57022 (0.57030)	Top-1 acc 66.016 (65.960)	Top-5 acc 85.938 (85.197)	lr 0.00388
Train [90][190/3239]	Time 0.231 (0.702)	Data Time 0.001 (0.242)	Loss 2.2931 (2.4081)	Entropy 0.57020 (0.57030)	Top-1 acc 70.703 (66.003)	Top-5 acc 85.938 (85.228)	lr 0.00388
Train [90][200/3239]	Time 0.235 (0.689)	Data Time 0.001 (0.230)	Loss 2.3795 (2.4088)	Entropy 0.57058 (0.57030)	Top-1 acc 69.531 (66.023)	Top-5 acc 85.547 (85.213)	lr 0.00388
Train [90][210/3239]	Time 0.231 (0.677)	Data Time 0.001 (0.219)	Loss 2.2913 (2.4070)	Entropy 0.57043 (0.57031)	Top-1 acc 68.359 (66.012)	Top-5 acc 87.891 (85.260)	lr 0.00388
Train [90][220/3239]	Time 0.289 (0.666)	Data Time 0.001 (0.209)	Loss 2.4226 (2.4081)	Entropy 0.57061 (0.57032)	Top-1 acc 66.406 (66.016)	Top-5 acc 85.938 (85.222)	lr 0.00388
Train [90][230/3239]	Time 0.272 (0.655)	Data Time 0.001 (0.200)	Loss 2.5376 (2.4069)	Entropy 0.57067 (0.57033)	Top-1 acc 64.453 (66.026)	Top-5 acc 82.031 (85.254)	lr 0.00388
Train [90][240/3239]	Time 0.319 (0.646)	Data Time 0.001 (0.192)	Loss 2.2522 (2.4069)	Entropy 0.57042 (0.57034)	Top-1 acc 66.797 (66.038)	Top-5 acc 88.672 (85.258)	lr 0.00388
Train [90][250/3239]	Time 0.249 (0.639)	Data Time 0.001 (0.184)	Loss 2.4279 (2.4083)	Entropy 0.57032 (0.57034)	Top-1 acc 66.797 (66.000)	Top-5 acc 82.031 (85.212)	lr 0.00388
Train [90][260/3239]	Time 0.287 (0.632)	Data Time 0.001 (0.177)	Loss 2.3167 (2.4067)	Entropy 0.57036 (0.57035)	Top-1 acc 66.797 (66.074)	Top-5 acc 86.328 (85.246)	lr 0.00388
Train [90][270/3239]	Time 0.246 (0.625)	Data Time 0.001 (0.171)	Loss 2.4551 (2.4063)	Entropy 0.57011 (0.57034)	Top-1 acc 62.891 (66.037)	Top-5 acc 83.984 (85.261)	lr 0.00388
Train [90][280/3239]	Time 0.238 (0.618)	Data Time 0.001 (0.165)	Loss 2.3190 (2.4072)	Entropy 0.57010 (0.57033)	Top-1 acc 69.922 (66.043)	Top-5 acc 87.500 (85.237)	lr 0.00388
Train [90][290/3239]	Time 0.275 (0.612)	Data Time 0.001 (0.159)	Loss 2.5965 (2.4096)	Entropy 0.57041 (0.57033)	Top-1 acc 61.328 (66.018)	Top-5 acc 80.859 (85.179)	lr 0.00387
Train [90][300/3239]	Time 0.237 (0.606)	Data Time 0.001 (0.154)	Loss 2.3810 (2.4090)	Entropy 0.57061 (0.57034)	Top-1 acc 67.188 (66.026)	Top-5 acc 85.938 (85.193)	lr 0.00387
Train [90][310/3239]	Time 0.234 (0.600)	Data Time 0.001 (0.149)	Loss 2.2415 (2.4052)	Entropy 0.57033 (0.57034)	Top-1 acc 68.750 (66.101)	Top-5 acc 88.672 (85.272)	lr 0.00387
Train [90][320/3239]	Time 0.236 (0.595)	Data Time 0.001 (0.145)	Loss 2.2918 (2.4029)	Entropy 0.57003 (0.57034)	Top-1 acc 68.750 (66.169)	Top-5 acc 86.719 (85.331)	lr 0.00387
Train [90][330/3239]	Time 0.353 (0.591)	Data Time 0.002 (0.140)	Loss 2.5302 (2.4032)	Entropy 0.56997 (0.57033)	Top-1 acc 64.844 (66.162)	Top-5 acc 83.594 (85.343)	lr 0.00387
Train [90][340/3239]	Time 0.233 (0.587)	Data Time 0.001 (0.136)	Loss 2.4307 (2.4037)	Entropy 0.56993 (0.57032)	Top-1 acc 65.234 (66.153)	Top-5 acc 82.031 (85.312)	lr 0.00387
Train [90][350/3239]	Time 0.276 (0.582)	Data Time 0.002 (0.132)	Loss 2.4272 (2.4038)	Entropy 0.56990 (0.57031)	Top-1 acc 66.406 (66.155)	Top-5 acc 83.594 (85.305)	lr 0.00387
Train [90][360/3239]	Time 0.273 (0.579)	Data Time 0.002 (0.129)	Loss 2.2306 (2.4056)	Entropy 0.56988 (0.57029)	Top-1 acc 67.969 (66.102)	Top-5 acc 87.500 (85.275)	lr 0.00387
Train [90][370/3239]	Time 0.245 (0.575)	Data Time 0.001 (0.125)	Loss 2.1320 (2.4050)	Entropy 0.56985 (0.57028)	Top-1 acc 74.219 (66.134)	Top-5 acc 90.625 (85.283)	lr 0.00387
Train [90][380/3239]	Time 0.230 (0.571)	Data Time 0.001 (0.122)	Loss 2.3240 (2.4052)	Entropy 0.56956 (0.57027)	Top-1 acc 68.359 (66.141)	Top-5 acc 87.500 (85.285)	lr 0.00387
Train [90][390/3239]	Time 0.239 (0.568)	Data Time 0.002 (0.119)	Loss 2.2672 (2.4059)	Entropy 0.56981 (0.57025)	Top-1 acc 66.016 (66.148)	Top-5 acc 88.281 (85.279)	lr 0.00387
Train [90][400/3239]	Time 0.362 (0.564)	Data Time 0.001 (0.116)	Loss 2.5559 (2.4067)	Entropy 0.56979 (0.57024)	Top-1 acc 61.719 (66.159)	Top-5 acc 83.203 (85.274)	lr 0.00387
Train [90][410/3239]	Time 0.234 (0.561)	Data Time 0.001 (0.113)	Loss 2.4973 (2.4072)	Entropy 0.56973 (0.57023)	Top-1 acc 62.500 (66.132)	Top-5 acc 83.203 (85.264)	lr 0.00387
Train [90][420/3239]	Time 0.250 (0.558)	Data Time 0.001 (0.111)	Loss 2.3949 (2.4068)	Entropy 0.56964 (0.57022)	Top-1 acc 65.234 (66.138)	Top-5 acc 86.328 (85.274)	lr 0.00386
Train [90][430/3239]	Time 0.288 (0.555)	Data Time 0.001 (0.108)	Loss 2.5144 (2.4067)	Entropy 0.56977 (0.57021)	Top-1 acc 62.891 (66.147)	Top-5 acc 83.594 (85.293)	lr 0.00386
Train [90][440/3239]	Time 0.268 (0.552)	Data Time 0.001 (0.106)	Loss 2.3015 (2.4073)	Entropy 0.56995 (0.57020)	Top-1 acc 69.531 (66.137)	Top-5 acc 87.109 (85.302)	lr 0.00386
Train [90][450/3239]	Time 0.264 (0.550)	Data Time 0.002 (0.103)	Loss 2.2564 (2.4065)	Entropy 0.56982 (0.57019)	Top-1 acc 63.281 (66.126)	Top-5 acc 89.844 (85.318)	lr 0.00386
Train [90][460/3239]	Time 0.225 (0.547)	Data Time 0.001 (0.101)	Loss 2.3031 (2.4063)	Entropy 0.57007 (0.57019)	Top-1 acc 67.969 (66.128)	Top-5 acc 89.062 (85.336)	lr 0.00386
Train [90][470/3239]	Time 0.283 (0.661)	Data Time 0.002 (0.099)	Loss 2.4692 (2.4068)	Entropy 0.56977 (0.57018)	Top-1 acc 64.453 (66.103)	Top-5 acc 85.156 (85.320)	lr 0.00386
Train [90][480/3239]	Time 0.270 (0.656)	Data Time 0.002 (0.097)	Loss 2.8170 (2.4079)	Entropy 0.57023 (0.57018)	Top-1 acc 55.469 (66.066)	Top-5 acc 79.688 (85.306)	lr 0.00386
Train [90][490/3239]	Time 0.330 (0.651)	Data Time 0.002 (0.095)	Loss 2.3633 (2.4076)	Entropy 0.57033 (0.57018)	Top-1 acc 67.188 (66.063)	Top-5 acc 87.109 (85.304)	lr 0.00386
Train [90][500/3239]	Time 0.249 (0.647)	Data Time 0.001 (0.093)	Loss 2.5164 (2.4084)	Entropy 0.57030 (0.57018)	Top-1 acc 64.062 (66.049)	Top-5 acc 84.766 (85.299)	lr 0.00386
Train [90][510/3239]	Time 0.244 (0.644)	Data Time 0.001 (0.092)	Loss 2.4146 (2.4081)	Entropy 0.57042 (0.57018)	Top-1 acc 67.969 (66.055)	Top-5 acc 83.984 (85.297)	lr 0.00386
Train [90][520/3239]	Time 0.270 (0.640)	Data Time 0.002 (0.090)	Loss 2.4762 (2.4075)	Entropy 0.57019 (0.57019)	Top-1 acc 66.016 (66.061)	Top-5 acc 82.812 (85.303)	lr 0.00386
Train [90][530/3239]	Time 0.280 (0.636)	Data Time 0.001 (0.088)	Loss 2.6004 (2.4063)	Entropy 0.56988 (0.57018)	Top-1 acc 63.281 (66.095)	Top-5 acc 82.031 (85.327)	lr 0.00386
Train [90][540/3239]	Time 0.345 (0.633)	Data Time 0.002 (0.087)	Loss 2.4694 (2.4083)	Entropy 0.56975 (0.57018)	Top-1 acc 66.797 (66.055)	Top-5 acc 84.766 (85.294)	lr 0.00386
Train [90][550/3239]	Time 0.229 (0.630)	Data Time 0.001 (0.085)	Loss 2.3284 (2.4081)	Entropy 0.56939 (0.57016)	Top-1 acc 72.266 (66.082)	Top-5 acc 84.766 (85.284)	lr 0.00386
Train [90][560/3239]	Time 0.367 (0.627)	Data Time 0.001 (0.084)	Loss 2.4379 (2.4084)	Entropy 0.56917 (0.57015)	Top-1 acc 69.141 (66.089)	Top-5 acc 86.328 (85.282)	lr 0.00385
Train [90][570/3239]	Time 0.277 (0.624)	Data Time 0.001 (0.082)	Loss 2.4091 (2.4089)	Entropy 0.56928 (0.57013)	Top-1 acc 64.453 (66.084)	Top-5 acc 87.109 (85.275)	lr 0.00385
Train [90][580/3239]	Time 0.238 (0.621)	Data Time 0.001 (0.081)	Loss 2.4724 (2.4085)	Entropy 0.56909 (0.57011)	Top-1 acc 63.672 (66.088)	Top-5 acc 83.984 (85.283)	lr 0.00385
Train [90][590/3239]	Time 0.324 (0.618)	Data Time 0.001 (0.079)	Loss 2.4428 (2.4099)	Entropy 0.56910 (0.57010)	Top-1 acc 66.016 (66.067)	Top-5 acc 85.156 (85.266)	lr 0.00385
Train [90][600/3239]	Time 0.381 (0.615)	Data Time 0.002 (0.078)	Loss 2.3921 (2.4108)	Entropy 0.56903 (0.57008)	Top-1 acc 68.359 (66.049)	Top-5 acc 83.984 (85.245)	lr 0.00385
Train [90][610/3239]	Time 0.246 (0.612)	Data Time 0.001 (0.077)	Loss 2.2308 (2.4113)	Entropy 0.56898 (0.57006)	Top-1 acc 72.266 (66.044)	Top-5 acc 88.672 (85.230)	lr 0.00385
Train [90][620/3239]	Time 0.228 (0.609)	Data Time 0.001 (0.076)	Loss 2.5462 (2.4111)	Entropy 0.56919 (0.57005)	Top-1 acc 62.891 (66.031)	Top-5 acc 81.641 (85.227)	lr 0.00385
Train [90][630/3239]	Time 0.268 (0.607)	Data Time 0.001 (0.074)	Loss 2.4476 (2.4120)	Entropy 0.56923 (0.57003)	Top-1 acc 66.016 (66.025)	Top-5 acc 86.328 (85.216)	lr 0.00385
Train [90][640/3239]	Time 0.294 (0.604)	Data Time 0.007 (0.073)	Loss 2.4321 (2.4119)	Entropy 0.56920 (0.57002)	Top-1 acc 64.844 (66.017)	Top-5 acc 84.766 (85.223)	lr 0.00385
Train [90][650/3239]	Time 0.242 (0.601)	Data Time 0.001 (0.072)	Loss 2.3110 (2.4133)	Entropy 0.56916 (0.57001)	Top-1 acc 66.406 (65.999)	Top-5 acc 84.375 (85.192)	lr 0.00385
Train [90][660/3239]	Time 0.241 (0.599)	Data Time 0.001 (0.071)	Loss 2.3264 (2.4144)	Entropy 0.56947 (0.57000)	Top-1 acc 68.359 (65.971)	Top-5 acc 87.109 (85.175)	lr 0.00385
Train [90][670/3239]	Time 0.245 (0.597)	Data Time 0.001 (0.070)	Loss 2.3679 (2.4153)	Entropy 0.56915 (0.56999)	Top-1 acc 64.844 (65.942)	Top-5 acc 85.547 (85.159)	lr 0.00385
Train [90][680/3239]	Time 0.233 (0.594)	Data Time 0.001 (0.069)	Loss 2.4459 (2.4161)	Entropy 0.56883 (0.56997)	Top-1 acc 64.844 (65.899)	Top-5 acc 85.156 (85.144)	lr 0.00385
Train [90][690/3239]	Time 0.230 (0.591)	Data Time 0.001 (0.068)	Loss 2.4374 (2.4167)	Entropy 0.56878 (0.56996)	Top-1 acc 62.500 (65.869)	Top-5 acc 86.719 (85.132)	lr 0.00385
Train [90][700/3239]	Time 0.248 (0.590)	Data Time 0.001 (0.067)	Loss 2.3907 (2.4164)	Entropy 0.56875 (0.56994)	Top-1 acc 64.844 (65.868)	Top-5 acc 83.594 (85.138)	lr 0.00384
Train [90][710/3239]	Time 0.233 (0.587)	Data Time 0.001 (0.066)	Loss 2.4223 (2.4170)	Entropy 0.56875 (0.56992)	Top-1 acc 67.188 (65.850)	Top-5 acc 83.203 (85.123)	lr 0.00384
Train [90][720/3239]	Time 0.339 (0.585)	Data Time 0.001 (0.065)	Loss 2.2325 (2.4168)	Entropy 0.56869 (0.56991)	Top-1 acc 72.266 (65.837)	Top-5 acc 87.891 (85.133)	lr 0.00384
Train [90][730/3239]	Time 0.274 (0.583)	Data Time 0.001 (0.065)	Loss 2.4373 (2.4161)	Entropy 0.56908 (0.56989)	Top-1 acc 69.141 (65.845)	Top-5 acc 83.203 (85.142)	lr 0.00384
Train [90][740/3239]	Time 0.229 (0.581)	Data Time 0.001 (0.064)	Loss 2.1778 (2.4172)	Entropy 0.56878 (0.56988)	Top-1 acc 71.875 (65.821)	Top-5 acc 89.453 (85.126)	lr 0.00384
Train [90][750/3239]	Time 0.236 (0.579)	Data Time 0.001 (0.063)	Loss 2.4779 (2.4170)	Entropy 0.56870 (0.56986)	Top-1 acc 62.891 (65.825)	Top-5 acc 85.156 (85.125)	lr 0.00384
Train [90][760/3239]	Time 0.290 (0.578)	Data Time 0.002 (0.062)	Loss 2.3017 (2.4175)	Entropy 0.56844 (0.56985)	Top-1 acc 67.969 (65.817)	Top-5 acc 87.891 (85.122)	lr 0.00384
Train [90][770/3239]	Time 0.234 (0.577)	Data Time 0.002 (0.061)	Loss 2.3725 (2.4175)	Entropy 0.56828 (0.56983)	Top-1 acc 69.141 (65.821)	Top-5 acc 84.375 (85.119)	lr 0.00384
Train [90][780/3239]	Time 0.244 (0.575)	Data Time 0.001 (0.061)	Loss 2.5121 (2.4174)	Entropy 0.56845 (0.56981)	Top-1 acc 63.672 (65.822)	Top-5 acc 81.641 (85.115)	lr 0.00384
Train [90][790/3239]	Time 0.400 (0.574)	Data Time 0.002 (0.060)	Loss 2.3399 (2.4171)	Entropy 0.56860 (0.56979)	Top-1 acc 69.922 (65.825)	Top-5 acc 84.375 (85.114)	lr 0.00384
Train [90][800/3239]	Time 0.268 (0.573)	Data Time 0.001 (0.059)	Loss 2.3933 (2.4171)	Entropy 0.56881 (0.56978)	Top-1 acc 63.281 (65.834)	Top-5 acc 86.328 (85.120)	lr 0.00384
Train [90][810/3239]	Time 0.239 (0.571)	Data Time 0.002 (0.058)	Loss 2.2020 (2.4169)	Entropy 0.56912 (0.56977)	Top-1 acc 69.141 (65.844)	Top-5 acc 89.844 (85.130)	lr 0.00384
Train [90][820/3239]	Time 0.297 (0.569)	Data Time 0.002 (0.058)	Loss 2.6517 (2.4171)	Entropy 0.56896 (0.56976)	Top-1 acc 60.156 (65.838)	Top-5 acc 78.516 (85.121)	lr 0.00384
Train [90][830/3239]	Time 0.261 (0.568)	Data Time 0.001 (0.057)	Loss 2.4796 (2.4173)	Entropy 0.56902 (0.56975)	Top-1 acc 68.750 (65.836)	Top-5 acc 82.812 (85.113)	lr 0.00383
Train [90][840/3239]	Time 0.237 (0.566)	Data Time 0.001 (0.056)	Loss 2.5050 (2.4187)	Entropy 0.56921 (0.56974)	Top-1 acc 63.672 (65.801)	Top-5 acc 81.641 (85.095)	lr 0.00383
Train [90][850/3239]	Time 0.245 (0.565)	Data Time 0.003 (0.056)	Loss 2.3692 (2.4192)	Entropy 0.56942 (0.56974)	Top-1 acc 67.969 (65.782)	Top-5 acc 84.375 (85.077)	lr 0.00383
Train [90][860/3239]	Time 0.335 (0.565)	Data Time 0.002 (0.055)	Loss 2.4169 (2.4192)	Entropy 0.56960 (0.56973)	Top-1 acc 64.844 (65.764)	Top-5 acc 83.594 (85.085)	lr 0.00383
Train [90][870/3239]	Time 0.239 (0.564)	Data Time 0.001 (0.055)	Loss 2.4007 (2.4192)	Entropy 0.56993 (0.56973)	Top-1 acc 65.625 (65.760)	Top-5 acc 84.375 (85.080)	lr 0.00383
Train [90][880/3239]	Time 0.342 (0.563)	Data Time 0.001 (0.054)	Loss 2.2624 (2.4191)	Entropy 0.56987 (0.56974)	Top-1 acc 67.578 (65.756)	Top-5 acc 87.500 (85.079)	lr 0.00383
Train [90][890/3239]	Time 0.274 (0.561)	Data Time 0.002 (0.053)	Loss 2.4192 (2.4196)	Entropy 0.56981 (0.56974)	Top-1 acc 64.453 (65.741)	Top-5 acc 84.375 (85.066)	lr 0.00383
Train [90][900/3239]	Time 0.274 (0.560)	Data Time 0.001 (0.053)	Loss 2.3602 (2.4194)	Entropy 0.56999 (0.56974)	Top-1 acc 66.016 (65.736)	Top-5 acc 87.500 (85.068)	lr 0.00383
Train [90][910/3239]	Time 0.293 (0.559)	Data Time 0.001 (0.052)	Loss 2.4717 (2.4196)	Entropy 0.56991 (0.56974)	Top-1 acc 62.500 (65.724)	Top-5 acc 83.203 (85.066)	lr 0.00383
Train [90][920/3239]	Time 0.269 (0.558)	Data Time 0.001 (0.052)	Loss 2.4468 (2.4193)	Entropy 0.56958 (0.56974)	Top-1 acc 62.500 (65.726)	Top-5 acc 82.812 (85.068)	lr 0.00383
Train [90][930/3239]	Time 0.228 (0.556)	Data Time 0.001 (0.051)	Loss 2.3294 (2.4192)	Entropy 0.56946 (0.56974)	Top-1 acc 69.141 (65.729)	Top-5 acc 86.719 (85.075)	lr 0.00383
Train [90][940/3239]	Time 0.252 (0.555)	Data Time 0.001 (0.051)	Loss 2.4426 (2.4194)	Entropy 0.56967 (0.56974)	Top-1 acc 66.016 (65.728)	Top-5 acc 85.156 (85.073)	lr 0.00383
Train [90][950/3239]	Time 0.373 (0.554)	Data Time 0.001 (0.050)	Loss 2.4780 (2.4194)	Entropy 0.56949 (0.56974)	Top-1 acc 64.453 (65.719)	Top-5 acc 83.984 (85.075)	lr 0.00383
Train [90][960/3239]	Time 0.241 (0.553)	Data Time 0.002 (0.050)	Loss 2.3105 (2.4201)	Entropy 0.56918 (0.56974)	Top-1 acc 66.406 (65.708)	Top-5 acc 87.109 (85.057)	lr 0.00383
Train [90][970/3239]	Time 0.229 (0.552)	Data Time 0.001 (0.049)	Loss 2.3652 (2.4203)	Entropy 0.56949 (0.56973)	Top-1 acc 68.359 (65.704)	Top-5 acc 84.766 (85.058)	lr 0.00382
Train [90][980/3239]	Time 0.265 (0.551)	Data Time 0.001 (0.049)	Loss 2.2974 (2.4195)	Entropy 0.56959 (0.56973)	Top-1 acc 67.969 (65.716)	Top-5 acc 87.109 (85.066)	lr 0.00382
Train [90][990/3239]	Time 0.256 (0.549)	Data Time 0.001 (0.048)	Loss 2.4527 (2.4194)	Entropy 0.56927 (0.56973)	Top-1 acc 61.719 (65.716)	Top-5 acc 85.156 (85.067)	lr 0.00382
Train [90][1000/3239]	Time 0.231 (0.548)	Data Time 0.001 (0.048)	Loss 2.4965 (2.4195)	Entropy 0.56916 (0.56972)	Top-1 acc 65.625 (65.713)	Top-5 acc 83.984 (85.063)	lr 0.00382
Train [90][1010/3239]	Time 0.236 (0.547)	Data Time 0.001 (0.047)	Loss 2.3989 (2.4202)	Entropy 0.56952 (0.56972)	Top-1 acc 63.672 (65.708)	Top-5 acc 86.328 (85.047)	lr 0.00382
Train [90][1020/3239]	Time 0.248 (0.546)	Data Time 0.001 (0.047)	Loss 2.3055 (2.4199)	Entropy 0.56936 (0.56971)	Top-1 acc 67.969 (65.713)	Top-5 acc 87.500 (85.056)	lr 0.00382
Train [90][1030/3239]	Time 0.316 (0.545)	Data Time 0.001 (0.046)	Loss 2.2347 (2.4197)	Entropy 0.56944 (0.56971)	Top-1 acc 70.703 (65.712)	Top-5 acc 87.500 (85.055)	lr 0.00382
Train [90][1040/3239]	Time 0.263 (0.544)	Data Time 0.001 (0.046)	Loss 2.2178 (2.4194)	Entropy 0.56967 (0.56971)	Top-1 acc 71.484 (65.726)	Top-5 acc 88.672 (85.059)	lr 0.00382
Train [90][1050/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.046)	Loss 2.4918 (2.4200)	Entropy 0.56977 (0.56971)	Top-1 acc 69.141 (65.713)	Top-5 acc 83.594 (85.049)	lr 0.00382
Train [90][1060/3239]	Time 0.260 (0.541)	Data Time 0.001 (0.045)	Loss 2.3247 (2.4198)	Entropy 0.56987 (0.56971)	Top-1 acc 67.969 (65.722)	Top-5 acc 87.891 (85.049)	lr 0.00382
Train [90][1070/3239]	Time 0.274 (0.541)	Data Time 0.001 (0.045)	Loss 2.4621 (2.4203)	Entropy 0.56960 (0.56971)	Top-1 acc 62.500 (65.699)	Top-5 acc 86.719 (85.047)	lr 0.00382
Train [90][1080/3239]	Time 0.258 (0.540)	Data Time 0.002 (0.044)	Loss 2.2873 (2.4209)	Entropy 0.56968 (0.56971)	Top-1 acc 73.047 (65.688)	Top-5 acc 88.672 (85.031)	lr 0.00382
Train [90][1090/3239]	Time 0.271 (0.539)	Data Time 0.003 (0.044)	Loss 2.3514 (2.4210)	Entropy 0.56994 (0.56971)	Top-1 acc 66.016 (65.683)	Top-5 acc 88.672 (85.032)	lr 0.00382
Train [90][1100/3239]	Time 0.243 (0.538)	Data Time 0.002 (0.044)	Loss 2.5850 (2.4221)	Entropy 0.57013 (0.56971)	Top-1 acc 62.891 (65.656)	Top-5 acc 81.641 (85.018)	lr 0.00382
Train [90][1110/3239]	Time 0.416 (0.537)	Data Time 0.001 (0.043)	Loss 2.5616 (2.4232)	Entropy 0.57004 (0.56972)	Top-1 acc 60.547 (65.625)	Top-5 acc 81.250 (85.006)	lr 0.00381
Train [90][1120/3239]	Time 0.386 (0.584)	Data Time 0.005 (0.043)	Loss 2.3119 (2.4228)	Entropy 0.57025 (0.56972)	Top-1 acc 68.750 (65.646)	Top-5 acc 87.891 (85.016)	lr 0.00381
Train [90][1130/3239]	Time 0.256 (0.583)	Data Time 0.002 (0.042)	Loss 2.4147 (2.4229)	Entropy 0.57022 (0.56973)	Top-1 acc 66.016 (65.641)	Top-5 acc 86.719 (85.016)	lr 0.00381
Train [90][1140/3239]	Time 0.273 (0.582)	Data Time 0.002 (0.042)	Loss 2.4896 (2.4236)	Entropy 0.56997 (0.56973)	Top-1 acc 62.109 (65.621)	Top-5 acc 83.203 (85.006)	lr 0.00381
Train [90][1150/3239]	Time 0.282 (0.581)	Data Time 0.001 (0.042)	Loss 2.3983 (2.4230)	Entropy 0.56992 (0.56973)	Top-1 acc 63.672 (65.629)	Top-5 acc 87.500 (85.015)	lr 0.00381
Train [90][1160/3239]	Time 0.282 (0.580)	Data Time 0.002 (0.041)	Loss 2.2367 (2.4227)	Entropy 0.56987 (0.56973)	Top-1 acc 69.141 (65.639)	Top-5 acc 89.062 (85.023)	lr 0.00381
Train [90][1170/3239]	Time 0.230 (0.579)	Data Time 0.002 (0.041)	Loss 2.5868 (2.4225)	Entropy 0.56994 (0.56973)	Top-1 acc 60.938 (65.651)	Top-5 acc 83.984 (85.031)	lr 0.00381
Train [90][1180/3239]	Time 0.302 (0.578)	Data Time 0.001 (0.041)	Loss 2.2543 (2.4225)	Entropy 0.56985 (0.56973)	Top-1 acc 69.141 (65.644)	Top-5 acc 88.672 (85.034)	lr 0.00381
Train [90][1190/3239]	Time 0.235 (0.576)	Data Time 0.001 (0.040)	Loss 2.3919 (2.4222)	Entropy 0.56972 (0.56974)	Top-1 acc 66.016 (65.652)	Top-5 acc 84.766 (85.038)	lr 0.00381
Train [90][1200/3239]	Time 0.295 (0.575)	Data Time 0.001 (0.040)	Loss 2.2519 (2.4221)	Entropy 0.56969 (0.56973)	Top-1 acc 71.484 (65.656)	Top-5 acc 87.500 (85.035)	lr 0.00381
Train [90][1210/3239]	Time 0.268 (0.574)	Data Time 0.002 (0.040)	Loss 2.3310 (2.4216)	Entropy 0.56980 (0.56974)	Top-1 acc 67.188 (65.658)	Top-5 acc 86.719 (85.047)	lr 0.00381
Train [90][1220/3239]	Time 0.267 (0.573)	Data Time 0.003 (0.039)	Loss 2.5002 (2.4215)	Entropy 0.56968 (0.56974)	Top-1 acc 66.406 (65.661)	Top-5 acc 85.156 (85.056)	lr 0.00381
Train [90][1230/3239]	Time 0.255 (0.572)	Data Time 0.001 (0.039)	Loss 2.4267 (2.4216)	Entropy 0.56979 (0.56974)	Top-1 acc 66.406 (65.658)	Top-5 acc 85.547 (85.054)	lr 0.00381
Train [90][1240/3239]	Time 0.246 (0.571)	Data Time 0.001 (0.039)	Loss 2.4765 (2.4217)	Entropy 0.56988 (0.56974)	Top-1 acc 64.062 (65.655)	Top-5 acc 83.594 (85.055)	lr 0.00381
Train [90][1250/3239]	Time 0.243 (0.570)	Data Time 0.001 (0.039)	Loss 2.3846 (2.4219)	Entropy 0.57001 (0.56974)	Top-1 acc 64.844 (65.653)	Top-5 acc 86.328 (85.051)	lr 0.00380
Train [90][1260/3239]	Time 0.270 (0.569)	Data Time 0.001 (0.038)	Loss 2.8263 (2.4221)	Entropy 0.57030 (0.56974)	Top-1 acc 57.812 (65.653)	Top-5 acc 79.297 (85.051)	lr 0.00380
Train [90][1270/3239]	Time 0.347 (0.568)	Data Time 0.001 (0.038)	Loss 2.2225 (2.4214)	Entropy 0.57063 (0.56975)	Top-1 acc 71.875 (65.673)	Top-5 acc 87.109 (85.060)	lr 0.00380
Train [90][1280/3239]	Time 0.243 (0.567)	Data Time 0.002 (0.038)	Loss 2.2732 (2.4210)	Entropy 0.57071 (0.56975)	Top-1 acc 70.703 (65.680)	Top-5 acc 88.672 (85.074)	lr 0.00380
Train [90][1290/3239]	Time 0.238 (0.566)	Data Time 0.001 (0.037)	Loss 2.4484 (2.4216)	Entropy 0.57062 (0.56976)	Top-1 acc 69.531 (65.665)	Top-5 acc 85.547 (85.065)	lr 0.00380
Train [90][1300/3239]	Time 0.242 (0.565)	Data Time 0.001 (0.037)	Loss 2.1893 (2.4214)	Entropy 0.57081 (0.56977)	Top-1 acc 76.172 (65.672)	Top-5 acc 89.453 (85.072)	lr 0.00380
Train [90][1310/3239]	Time 0.296 (0.564)	Data Time 0.002 (0.037)	Loss 2.5218 (2.4217)	Entropy 0.57098 (0.56978)	Top-1 acc 61.719 (65.657)	Top-5 acc 82.422 (85.074)	lr 0.00380
Train [90][1320/3239]	Time 0.254 (0.564)	Data Time 0.002 (0.037)	Loss 2.4892 (2.4219)	Entropy 0.57047 (0.56979)	Top-1 acc 63.281 (65.646)	Top-5 acc 85.547 (85.066)	lr 0.00380
Train [90][1330/3239]	Time 0.229 (0.563)	Data Time 0.001 (0.036)	Loss 2.4839 (2.4220)	Entropy 0.57059 (0.56979)	Top-1 acc 62.109 (65.648)	Top-5 acc 88.281 (85.068)	lr 0.00380
Train [90][1340/3239]	Time 0.385 (0.562)	Data Time 0.002 (0.036)	Loss 2.3061 (2.4223)	Entropy 0.57031 (0.56980)	Top-1 acc 70.703 (65.638)	Top-5 acc 85.547 (85.063)	lr 0.00380
Train [90][1350/3239]	Time 0.265 (0.561)	Data Time 0.001 (0.036)	Loss 2.3166 (2.4224)	Entropy 0.57016 (0.56980)	Top-1 acc 69.531 (65.634)	Top-5 acc 83.984 (85.056)	lr 0.00380
Train [90][1360/3239]	Time 0.254 (0.560)	Data Time 0.002 (0.036)	Loss 2.3768 (2.4225)	Entropy 0.57012 (0.56980)	Top-1 acc 66.406 (65.633)	Top-5 acc 87.109 (85.052)	lr 0.00380
Train [90][1370/3239]	Time 0.312 (0.559)	Data Time 0.002 (0.035)	Loss 2.3329 (2.4228)	Entropy 0.56989 (0.56980)	Top-1 acc 66.016 (65.629)	Top-5 acc 86.719 (85.044)	lr 0.00380
Train [90][1380/3239]	Time 0.300 (0.559)	Data Time 0.002 (0.035)	Loss 2.4896 (2.4235)	Entropy 0.56990 (0.56980)	Top-1 acc 64.062 (65.612)	Top-5 acc 83.203 (85.027)	lr 0.00379
Train [90][1390/3239]	Time 0.278 (0.559)	Data Time 0.001 (0.035)	Loss 2.3338 (2.4234)	Entropy 0.56988 (0.56980)	Top-1 acc 68.750 (65.617)	Top-5 acc 85.938 (85.033)	lr 0.00379
Train [90][1400/3239]	Time 0.247 (0.558)	Data Time 0.002 (0.035)	Loss 2.5637 (2.4233)	Entropy 0.57000 (0.56980)	Top-1 acc 59.766 (65.609)	Top-5 acc 82.031 (85.039)	lr 0.00379
Train [90][1410/3239]	Time 0.266 (0.557)	Data Time 0.001 (0.034)	Loss 2.4708 (2.4234)	Entropy 0.56977 (0.56981)	Top-1 acc 67.969 (65.609)	Top-5 acc 82.812 (85.036)	lr 0.00379
Train [90][1420/3239]	Time 0.264 (0.556)	Data Time 0.001 (0.034)	Loss 2.3206 (2.4236)	Entropy 0.56975 (0.56981)	Top-1 acc 69.531 (65.605)	Top-5 acc 86.719 (85.031)	lr 0.00379
Train [90][1430/3239]	Time 0.334 (0.555)	Data Time 0.001 (0.034)	Loss 2.3072 (2.4236)	Entropy 0.56969 (0.56981)	Top-1 acc 69.531 (65.610)	Top-5 acc 86.719 (85.034)	lr 0.00379
Train [90][1440/3239]	Time 0.253 (0.555)	Data Time 0.001 (0.034)	Loss 2.5034 (2.4239)	Entropy 0.56985 (0.56980)	Top-1 acc 65.625 (65.599)	Top-5 acc 81.641 (85.030)	lr 0.00379
Train [90][1450/3239]	Time 0.302 (0.554)	Data Time 0.001 (0.033)	Loss 2.4402 (2.4242)	Entropy 0.56977 (0.56981)	Top-1 acc 66.406 (65.592)	Top-5 acc 85.547 (85.024)	lr 0.00379
Train [90][1460/3239]	Time 0.279 (0.553)	Data Time 0.003 (0.033)	Loss 2.5192 (2.4239)	Entropy 0.56973 (0.56981)	Top-1 acc 60.547 (65.592)	Top-5 acc 83.984 (85.032)	lr 0.00379
Train [90][1470/3239]	Time 0.267 (0.552)	Data Time 0.001 (0.033)	Loss 2.4796 (2.4239)	Entropy 0.56943 (0.56980)	Top-1 acc 65.625 (65.606)	Top-5 acc 85.156 (85.033)	lr 0.00379
Train [90][1480/3239]	Time 0.276 (0.552)	Data Time 0.003 (0.033)	Loss 2.4456 (2.4242)	Entropy 0.56961 (0.56980)	Top-1 acc 66.016 (65.588)	Top-5 acc 83.984 (85.025)	lr 0.00379
Train [90][1490/3239]	Time 0.285 (0.551)	Data Time 0.001 (0.033)	Loss 2.5142 (2.4242)	Entropy 0.56956 (0.56980)	Top-1 acc 67.969 (65.586)	Top-5 acc 82.812 (85.024)	lr 0.00379
Train [90][1500/3239]	Time 0.337 (0.550)	Data Time 0.001 (0.032)	Loss 2.2727 (2.4237)	Entropy 0.57004 (0.56980)	Top-1 acc 71.094 (65.602)	Top-5 acc 88.281 (85.030)	lr 0.00379
Train [90][1510/3239]	Time 0.324 (0.549)	Data Time 0.003 (0.032)	Loss 2.4019 (2.4234)	Entropy 0.57025 (0.56980)	Top-1 acc 65.625 (65.607)	Top-5 acc 86.328 (85.034)	lr 0.00379
Train [90][1520/3239]	Time 0.230 (0.548)	Data Time 0.001 (0.032)	Loss 2.1875 (2.4231)	Entropy 0.57033 (0.56981)	Top-1 acc 70.703 (65.610)	Top-5 acc 89.062 (85.035)	lr 0.00378
Train [90][1530/3239]	Time 0.306 (0.548)	Data Time 0.001 (0.032)	Loss 2.3859 (2.4230)	Entropy 0.57091 (0.56981)	Top-1 acc 66.797 (65.619)	Top-5 acc 85.156 (85.034)	lr 0.00378
Train [90][1540/3239]	Time 0.287 (0.547)	Data Time 0.003 (0.032)	Loss 2.3239 (2.4231)	Entropy 0.57101 (0.56982)	Top-1 acc 68.750 (65.615)	Top-5 acc 88.281 (85.031)	lr 0.00378
Train [90][1550/3239]	Time 0.243 (0.546)	Data Time 0.001 (0.031)	Loss 2.4229 (2.4230)	Entropy 0.57116 (0.56983)	Top-1 acc 65.625 (65.618)	Top-5 acc 83.984 (85.032)	lr 0.00378
Train [90][1560/3239]	Time 0.260 (0.546)	Data Time 0.001 (0.031)	Loss 2.5723 (2.4227)	Entropy 0.57108 (0.56983)	Top-1 acc 64.453 (65.628)	Top-5 acc 81.250 (85.036)	lr 0.00378
Train [90][1570/3239]	Time 0.239 (0.545)	Data Time 0.001 (0.031)	Loss 2.3306 (2.4227)	Entropy 0.57044 (0.56984)	Top-1 acc 68.359 (65.629)	Top-5 acc 85.938 (85.033)	lr 0.00378
Train [90][1580/3239]	Time 0.277 (0.544)	Data Time 0.001 (0.031)	Loss 2.4274 (2.4234)	Entropy 0.57048 (0.56984)	Top-1 acc 69.141 (65.611)	Top-5 acc 83.984 (85.026)	lr 0.00378
Train [90][1590/3239]	Time 0.286 (0.544)	Data Time 0.002 (0.031)	Loss 2.1569 (2.4229)	Entropy 0.57034 (0.56985)	Top-1 acc 71.875 (65.621)	Top-5 acc 88.672 (85.033)	lr 0.00378
Train [90][1600/3239]	Time 0.279 (0.543)	Data Time 0.002 (0.030)	Loss 2.7717 (2.4231)	Entropy 0.56989 (0.56985)	Top-1 acc 58.594 (65.624)	Top-5 acc 79.688 (85.029)	lr 0.00378
Train [90][1610/3239]	Time 0.248 (0.542)	Data Time 0.001 (0.030)	Loss 2.3827 (2.4232)	Entropy 0.56998 (0.56985)	Top-1 acc 67.188 (65.627)	Top-5 acc 85.938 (85.027)	lr 0.00378
Train [90][1620/3239]	Time 0.279 (0.542)	Data Time 0.001 (0.030)	Loss 2.3143 (2.4233)	Entropy 0.57017 (0.56985)	Top-1 acc 70.312 (65.628)	Top-5 acc 86.719 (85.029)	lr 0.00378
Train [90][1630/3239]	Time 0.242 (0.541)	Data Time 0.001 (0.030)	Loss 2.3511 (2.4234)	Entropy 0.57046 (0.56985)	Top-1 acc 67.578 (65.629)	Top-5 acc 87.891 (85.031)	lr 0.00378
Train [90][1640/3239]	Time 0.227 (0.540)	Data Time 0.001 (0.030)	Loss 2.1836 (2.4234)	Entropy 0.57070 (0.56986)	Top-1 acc 71.094 (65.625)	Top-5 acc 89.453 (85.032)	lr 0.00378
Train [90][1650/3239]	Time 0.251 (0.540)	Data Time 0.001 (0.030)	Loss 2.2965 (2.4234)	Entropy 0.57078 (0.56986)	Top-1 acc 66.406 (65.621)	Top-5 acc 87.891 (85.031)	lr 0.00378
Train [90][1660/3239]	Time 0.364 (0.539)	Data Time 0.001 (0.029)	Loss 2.4857 (2.4233)	Entropy 0.57088 (0.56987)	Top-1 acc 64.062 (65.625)	Top-5 acc 85.547 (85.035)	lr 0.00377
Train [90][1670/3239]	Time 0.271 (0.539)	Data Time 0.002 (0.029)	Loss 2.5487 (2.4233)	Entropy 0.57071 (0.56987)	Top-1 acc 63.672 (65.623)	Top-5 acc 80.859 (85.036)	lr 0.00377
Train [90][1680/3239]	Time 0.286 (0.538)	Data Time 0.001 (0.029)	Loss 2.2507 (2.4235)	Entropy 0.57102 (0.56988)	Top-1 acc 72.266 (65.620)	Top-5 acc 88.672 (85.033)	lr 0.00377
Train [90][1690/3239]	Time 0.306 (0.538)	Data Time 0.032 (0.029)	Loss 2.3307 (2.4239)	Entropy 0.57100 (0.56989)	Top-1 acc 66.406 (65.602)	Top-5 acc 86.719 (85.030)	lr 0.00377
Train [90][1700/3239]	Time 0.219 (0.537)	Data Time 0.001 (0.029)	Loss 2.4054 (2.4242)	Entropy 0.57114 (0.56989)	Top-1 acc 66.797 (65.595)	Top-5 acc 86.328 (85.027)	lr 0.00377
Train [90][1710/3239]	Time 0.279 (0.537)	Data Time 0.001 (0.029)	Loss 2.5963 (2.4246)	Entropy 0.57132 (0.56990)	Top-1 acc 60.938 (65.589)	Top-5 acc 82.031 (85.021)	lr 0.00377
Train [90][1720/3239]	Time 0.258 (0.536)	Data Time 0.001 (0.028)	Loss 2.6682 (2.4246)	Entropy 0.57127 (0.56991)	Top-1 acc 60.547 (65.589)	Top-5 acc 79.688 (85.019)	lr 0.00377
Train [90][1730/3239]	Time 0.342 (0.535)	Data Time 0.001 (0.028)	Loss 2.5667 (2.4251)	Entropy 0.57126 (0.56992)	Top-1 acc 61.328 (65.576)	Top-5 acc 82.422 (85.009)	lr 0.00377
Train [90][1740/3239]	Time 0.228 (0.535)	Data Time 0.001 (0.028)	Loss 2.4609 (2.4255)	Entropy 0.57137 (0.56993)	Top-1 acc 65.625 (65.564)	Top-5 acc 84.375 (84.999)	lr 0.00377
Train [90][1750/3239]	Time 0.261 (0.534)	Data Time 0.001 (0.028)	Loss 2.3412 (2.4249)	Entropy 0.57182 (0.56993)	Top-1 acc 68.750 (65.576)	Top-5 acc 85.938 (85.009)	lr 0.00377
Train [90][1760/3239]	Time 0.280 (0.534)	Data Time 0.002 (0.028)	Loss 2.3922 (2.4253)	Entropy 0.57182 (0.56995)	Top-1 acc 65.234 (65.568)	Top-5 acc 87.109 (85.003)	lr 0.00377
Train [90][1770/3239]	Time 0.222 (0.533)	Data Time 0.001 (0.028)	Loss 2.5830 (2.4257)	Entropy 0.57210 (0.56996)	Top-1 acc 62.109 (65.564)	Top-5 acc 82.812 (84.995)	lr 0.00377
Train [90][1780/3239]	Time 0.337 (0.562)	Data Time 0.002 (0.028)	Loss 2.1716 (2.4254)	Entropy 0.57232 (0.56997)	Top-1 acc 68.750 (65.568)	Top-5 acc 89.844 (84.999)	lr 0.00377
Train [90][1790/3239]	Time 0.276 (0.561)	Data Time 0.003 (0.027)	Loss 2.3726 (2.4255)	Entropy 0.57234 (0.56998)	Top-1 acc 66.797 (65.558)	Top-5 acc 84.766 (84.995)	lr 0.00377
Train [90][1800/3239]	Time 0.245 (0.560)	Data Time 0.002 (0.027)	Loss 2.4406 (2.4257)	Entropy 0.57238 (0.56999)	Top-1 acc 66.016 (65.553)	Top-5 acc 83.594 (84.992)	lr 0.00376
Train [90][1810/3239]	Time 0.294 (0.560)	Data Time 0.002 (0.027)	Loss 2.4833 (2.4257)	Entropy 0.57259 (0.57001)	Top-1 acc 64.062 (65.551)	Top-5 acc 85.156 (84.989)	lr 0.00376
Train [90][1820/3239]	Time 0.413 (0.559)	Data Time 0.002 (0.027)	Loss 2.3133 (2.4255)	Entropy 0.57262 (0.57002)	Top-1 acc 66.406 (65.552)	Top-5 acc 87.109 (84.993)	lr 0.00376
Train [90][1830/3239]	Time 0.274 (0.559)	Data Time 0.001 (0.027)	Loss 2.3297 (2.4258)	Entropy 0.57264 (0.57004)	Top-1 acc 69.141 (65.549)	Top-5 acc 85.156 (84.989)	lr 0.00376
Train [90][1840/3239]	Time 0.248 (0.558)	Data Time 0.002 (0.027)	Loss 2.2696 (2.4257)	Entropy 0.57249 (0.57005)	Top-1 acc 68.359 (65.557)	Top-5 acc 89.062 (84.993)	lr 0.00376
Train [90][1850/3239]	Time 0.263 (0.557)	Data Time 0.001 (0.027)	Loss 2.3680 (2.4257)	Entropy 0.57230 (0.57006)	Top-1 acc 69.922 (65.561)	Top-5 acc 87.500 (84.991)	lr 0.00376
Train [90][1860/3239]	Time 0.338 (0.557)	Data Time 0.001 (0.027)	Loss 2.4643 (2.4258)	Entropy 0.57242 (0.57007)	Top-1 acc 60.938 (65.558)	Top-5 acc 83.203 (84.991)	lr 0.00376
Train [90][1870/3239]	Time 0.250 (0.557)	Data Time 0.001 (0.026)	Loss 2.3093 (2.4259)	Entropy 0.57266 (0.57009)	Top-1 acc 68.750 (65.552)	Top-5 acc 86.719 (84.991)	lr 0.00376
Train [90][1880/3239]	Time 0.248 (0.556)	Data Time 0.001 (0.026)	Loss 2.2909 (2.4259)	Entropy 0.57246 (0.57010)	Top-1 acc 70.703 (65.553)	Top-5 acc 87.109 (84.991)	lr 0.00376
Train [90][1890/3239]	Time 0.375 (0.556)	Data Time 0.002 (0.026)	Loss 2.4899 (2.4261)	Entropy 0.57239 (0.57011)	Top-1 acc 62.500 (65.550)	Top-5 acc 83.594 (84.985)	lr 0.00376
Train [90][1900/3239]	Time 0.242 (0.555)	Data Time 0.001 (0.026)	Loss 2.2710 (2.4260)	Entropy 0.57235 (0.57013)	Top-1 acc 70.312 (65.555)	Top-5 acc 85.938 (84.986)	lr 0.00376
Train [90][1910/3239]	Time 0.247 (0.554)	Data Time 0.002 (0.026)	Loss 2.5671 (2.4260)	Entropy 0.57232 (0.57014)	Top-1 acc 60.156 (65.546)	Top-5 acc 82.812 (84.984)	lr 0.00376
Train [90][1920/3239]	Time 0.240 (0.554)	Data Time 0.002 (0.026)	Loss 2.2890 (2.4258)	Entropy 0.57252 (0.57015)	Top-1 acc 70.312 (65.549)	Top-5 acc 84.766 (84.985)	lr 0.00376
Train [90][1930/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.026)	Loss 2.4526 (2.4259)	Entropy 0.57262 (0.57016)	Top-1 acc 65.625 (65.549)	Top-5 acc 82.812 (84.986)	lr 0.00376
Train [90][1940/3239]	Time 0.269 (0.553)	Data Time 0.001 (0.025)	Loss 2.2724 (2.4262)	Entropy 0.57268 (0.57017)	Top-1 acc 67.188 (65.537)	Top-5 acc 88.281 (84.986)	lr 0.00375
Train [90][1950/3239]	Time 0.274 (0.552)	Data Time 0.001 (0.025)	Loss 2.4911 (2.4262)	Entropy 0.57289 (0.57019)	Top-1 acc 64.062 (65.533)	Top-5 acc 86.328 (84.992)	lr 0.00375
Train [90][1960/3239]	Time 0.238 (0.551)	Data Time 0.001 (0.025)	Loss 2.5206 (2.4266)	Entropy 0.57286 (0.57020)	Top-1 acc 64.062 (65.519)	Top-5 acc 82.812 (84.985)	lr 0.00375
Train [90][1970/3239]	Time 0.274 (0.551)	Data Time 0.001 (0.025)	Loss 2.4491 (2.4269)	Entropy 0.57261 (0.57021)	Top-1 acc 63.672 (65.510)	Top-5 acc 85.156 (84.983)	lr 0.00375
Train [90][1980/3239]	Time 0.447 (0.550)	Data Time 0.008 (0.025)	Loss 2.5363 (2.4269)	Entropy 0.57278 (0.57023)	Top-1 acc 59.766 (65.507)	Top-5 acc 83.594 (84.985)	lr 0.00375
Train [90][1990/3239]	Time 0.230 (0.550)	Data Time 0.002 (0.025)	Loss 2.6262 (2.4270)	Entropy 0.57294 (0.57024)	Top-1 acc 60.938 (65.508)	Top-5 acc 80.469 (84.980)	lr 0.00375
Train [90][2000/3239]	Time 0.336 (0.549)	Data Time 0.001 (0.025)	Loss 2.6544 (2.4272)	Entropy 0.57298 (0.57025)	Top-1 acc 58.594 (65.501)	Top-5 acc 81.641 (84.976)	lr 0.00375
Train [90][2010/3239]	Time 0.233 (0.549)	Data Time 0.002 (0.025)	Loss 2.4178 (2.4270)	Entropy 0.57301 (0.57027)	Top-1 acc 67.188 (65.509)	Top-5 acc 85.938 (84.978)	lr 0.00375
Train [90][2020/3239]	Time 0.256 (0.548)	Data Time 0.002 (0.025)	Loss 2.3677 (2.4271)	Entropy 0.57310 (0.57028)	Top-1 acc 68.750 (65.508)	Top-5 acc 85.547 (84.975)	lr 0.00375
Train [90][2030/3239]	Time 0.237 (0.548)	Data Time 0.001 (0.024)	Loss 2.5709 (2.4272)	Entropy 0.57337 (0.57029)	Top-1 acc 63.672 (65.505)	Top-5 acc 80.859 (84.970)	lr 0.00375
Train [90][2040/3239]	Time 0.246 (0.547)	Data Time 0.001 (0.024)	Loss 2.4497 (2.4271)	Entropy 0.57316 (0.57031)	Top-1 acc 63.672 (65.502)	Top-5 acc 83.984 (84.971)	lr 0.00375
Train [90][2050/3239]	Time 0.390 (0.547)	Data Time 0.001 (0.024)	Loss 2.3675 (2.4269)	Entropy 0.57308 (0.57032)	Top-1 acc 68.750 (65.508)	Top-5 acc 85.156 (84.975)	lr 0.00375
Train [90][2060/3239]	Time 0.264 (0.546)	Data Time 0.001 (0.024)	Loss 2.6910 (2.4269)	Entropy 0.57297 (0.57034)	Top-1 acc 60.156 (65.504)	Top-5 acc 80.859 (84.977)	lr 0.00375
Train [90][2070/3239]	Time 0.240 (0.546)	Data Time 0.001 (0.024)	Loss 2.4263 (2.4268)	Entropy 0.57304 (0.57035)	Top-1 acc 65.234 (65.513)	Top-5 acc 86.719 (84.980)	lr 0.00375
Train [90][2080/3239]	Time 0.250 (0.545)	Data Time 0.001 (0.024)	Loss 2.3694 (2.4269)	Entropy 0.57313 (0.57036)	Top-1 acc 67.188 (65.512)	Top-5 acc 85.156 (84.975)	lr 0.00374
Train [90][2090/3239]	Time 0.284 (0.545)	Data Time 0.002 (0.024)	Loss 2.5392 (2.4270)	Entropy 0.57337 (0.57038)	Top-1 acc 60.547 (65.509)	Top-5 acc 83.203 (84.970)	lr 0.00374
Train [90][2100/3239]	Time 0.297 (0.545)	Data Time 0.001 (0.024)	Loss 2.4564 (2.4269)	Entropy 0.57363 (0.57039)	Top-1 acc 65.625 (65.513)	Top-5 acc 84.375 (84.975)	lr 0.00374
Train [90][2110/3239]	Time 0.287 (0.544)	Data Time 0.003 (0.024)	Loss 2.3636 (2.4269)	Entropy 0.57369 (0.57041)	Top-1 acc 69.141 (65.516)	Top-5 acc 87.500 (84.978)	lr 0.00374
Train [90][2120/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.023)	Loss 2.3635 (2.4268)	Entropy 0.57351 (0.57042)	Top-1 acc 68.750 (65.518)	Top-5 acc 85.156 (84.978)	lr 0.00374
Train [90][2130/3239]	Time 0.272 (0.543)	Data Time 0.001 (0.023)	Loss 2.3056 (2.4270)	Entropy 0.57382 (0.57044)	Top-1 acc 66.797 (65.511)	Top-5 acc 88.281 (84.976)	lr 0.00374
Train [90][2140/3239]	Time 0.518 (0.543)	Data Time 0.002 (0.023)	Loss 2.5977 (2.4271)	Entropy 0.57404 (0.57045)	Top-1 acc 61.719 (65.510)	Top-5 acc 82.031 (84.972)	lr 0.00374
Train [90][2150/3239]	Time 0.251 (0.543)	Data Time 0.002 (0.023)	Loss 2.5047 (2.4272)	Entropy 0.57408 (0.57047)	Top-1 acc 64.062 (65.510)	Top-5 acc 82.031 (84.970)	lr 0.00374
Train [90][2160/3239]	Time 0.271 (0.542)	Data Time 0.003 (0.023)	Loss 2.5931 (2.4275)	Entropy 0.57433 (0.57049)	Top-1 acc 62.500 (65.501)	Top-5 acc 78.516 (84.963)	lr 0.00374
Train [90][2170/3239]	Time 0.258 (0.542)	Data Time 0.001 (0.023)	Loss 2.5365 (2.4277)	Entropy 0.57433 (0.57050)	Top-1 acc 63.281 (65.498)	Top-5 acc 82.031 (84.962)	lr 0.00374
Train [90][2180/3239]	Time 0.348 (0.541)	Data Time 0.002 (0.023)	Loss 2.4166 (2.4275)	Entropy 0.57414 (0.57052)	Top-1 acc 65.625 (65.504)	Top-5 acc 87.891 (84.964)	lr 0.00374
Train [90][2190/3239]	Time 0.283 (0.541)	Data Time 0.002 (0.023)	Loss 2.4337 (2.4275)	Entropy 0.57402 (0.57054)	Top-1 acc 67.969 (65.507)	Top-5 acc 85.547 (84.966)	lr 0.00374
Train [90][2200/3239]	Time 0.297 (0.541)	Data Time 0.002 (0.023)	Loss 2.2882 (2.4275)	Entropy 0.57373 (0.57055)	Top-1 acc 67.578 (65.507)	Top-5 acc 87.500 (84.965)	lr 0.00374
Train [90][2210/3239]	Time 0.449 (0.540)	Data Time 0.002 (0.023)	Loss 2.5082 (2.4273)	Entropy 0.57364 (0.57057)	Top-1 acc 61.719 (65.513)	Top-5 acc 82.812 (84.966)	lr 0.00374
Train [90][2220/3239]	Time 0.230 (0.540)	Data Time 0.002 (0.022)	Loss 2.4475 (2.4275)	Entropy 0.57392 (0.57058)	Top-1 acc 63.281 (65.509)	Top-5 acc 85.938 (84.964)	lr 0.00373
Train [90][2230/3239]	Time 0.311 (0.540)	Data Time 0.001 (0.022)	Loss 2.5148 (2.4275)	Entropy 0.57420 (0.57060)	Top-1 acc 62.500 (65.507)	Top-5 acc 83.984 (84.962)	lr 0.00373
Train [90][2240/3239]	Time 0.259 (0.540)	Data Time 0.001 (0.022)	Loss 2.4052 (2.4274)	Entropy 0.57443 (0.57061)	Top-1 acc 66.406 (65.508)	Top-5 acc 84.375 (84.962)	lr 0.00373
Train [90][2250/3239]	Time 0.263 (0.539)	Data Time 0.001 (0.022)	Loss 2.4041 (2.4273)	Entropy 0.57456 (0.57063)	Top-1 acc 67.578 (65.516)	Top-5 acc 85.156 (84.962)	lr 0.00373
Train [90][2260/3239]	Time 0.307 (0.539)	Data Time 0.001 (0.022)	Loss 2.6655 (2.4276)	Entropy 0.57461 (0.57065)	Top-1 acc 56.641 (65.505)	Top-5 acc 81.250 (84.957)	lr 0.00373
Train [90][2270/3239]	Time 0.245 (0.538)	Data Time 0.001 (0.022)	Loss 2.4871 (2.4275)	Entropy 0.57452 (0.57066)	Top-1 acc 62.891 (65.507)	Top-5 acc 82.812 (84.958)	lr 0.00373
Train [90][2280/3239]	Time 0.237 (0.538)	Data Time 0.001 (0.022)	Loss 2.5268 (2.4274)	Entropy 0.57447 (0.57068)	Top-1 acc 65.625 (65.505)	Top-5 acc 81.641 (84.959)	lr 0.00373
Train [90][2290/3239]	Time 0.284 (0.537)	Data Time 0.024 (0.022)	Loss 2.5608 (2.4274)	Entropy 0.57453 (0.57070)	Top-1 acc 61.328 (65.502)	Top-5 acc 82.422 (84.963)	lr 0.00373
Train [90][2300/3239]	Time 0.238 (0.537)	Data Time 0.002 (0.022)	Loss 2.5405 (2.4275)	Entropy 0.57440 (0.57071)	Top-1 acc 63.281 (65.504)	Top-5 acc 82.422 (84.961)	lr 0.00373
Train [90][2310/3239]	Time 0.270 (0.536)	Data Time 0.001 (0.022)	Loss 2.3838 (2.4274)	Entropy 0.57442 (0.57073)	Top-1 acc 67.578 (65.499)	Top-5 acc 82.031 (84.961)	lr 0.00373
Train [90][2320/3239]	Time 0.236 (0.536)	Data Time 0.001 (0.022)	Loss 2.6064 (2.4275)	Entropy 0.57453 (0.57075)	Top-1 acc 60.938 (65.498)	Top-5 acc 82.422 (84.960)	lr 0.00373
Train [90][2330/3239]	Time 0.341 (0.536)	Data Time 0.003 (0.022)	Loss 2.3427 (2.4276)	Entropy 0.57465 (0.57076)	Top-1 acc 66.016 (65.494)	Top-5 acc 85.547 (84.956)	lr 0.00373
Train [90][2340/3239]	Time 0.284 (0.535)	Data Time 0.001 (0.021)	Loss 2.4328 (2.4276)	Entropy 0.57481 (0.57078)	Top-1 acc 67.969 (65.499)	Top-5 acc 82.031 (84.955)	lr 0.00373
Train [90][2350/3239]	Time 0.293 (0.535)	Data Time 0.002 (0.021)	Loss 2.3065 (2.4277)	Entropy 0.57509 (0.57080)	Top-1 acc 65.625 (65.494)	Top-5 acc 87.500 (84.953)	lr 0.00372
Train [90][2360/3239]	Time 0.239 (0.534)	Data Time 0.002 (0.021)	Loss 2.4665 (2.4274)	Entropy 0.57501 (0.57082)	Top-1 acc 65.625 (65.501)	Top-5 acc 82.812 (84.956)	lr 0.00372
Train [90][2370/3239]	Time 0.374 (0.534)	Data Time 0.002 (0.021)	Loss 2.3245 (2.4274)	Entropy 0.57496 (0.57083)	Top-1 acc 67.969 (65.503)	Top-5 acc 87.109 (84.953)	lr 0.00372
Train [90][2380/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.021)	Loss 2.4938 (2.4276)	Entropy 0.57493 (0.57085)	Top-1 acc 64.844 (65.499)	Top-5 acc 84.375 (84.953)	lr 0.00372
Train [90][2390/3239]	Time 0.237 (0.533)	Data Time 0.001 (0.021)	Loss 2.3552 (2.4272)	Entropy 0.57498 (0.57087)	Top-1 acc 66.016 (65.505)	Top-5 acc 85.547 (84.961)	lr 0.00372
Train [90][2400/3239]	Time 0.255 (0.533)	Data Time 0.001 (0.021)	Loss 2.6436 (2.4275)	Entropy 0.57491 (0.57088)	Top-1 acc 60.938 (65.499)	Top-5 acc 82.422 (84.957)	lr 0.00372
Train [90][2410/3239]	Time 0.264 (0.532)	Data Time 0.001 (0.021)	Loss 2.3376 (2.4276)	Entropy 0.57469 (0.57090)	Top-1 acc 70.703 (65.501)	Top-5 acc 86.719 (84.953)	lr 0.00372
Train [90][2420/3239]	Time 0.268 (0.532)	Data Time 0.002 (0.021)	Loss 2.2874 (2.4274)	Entropy 0.57435 (0.57092)	Top-1 acc 69.922 (65.507)	Top-5 acc 85.938 (84.954)	lr 0.00372
Train [90][2430/3239]	Time 0.292 (0.553)	Data Time 0.006 (0.021)	Loss 2.3321 (2.4274)	Entropy 0.57408 (0.57093)	Top-1 acc 72.266 (65.504)	Top-5 acc 86.328 (84.955)	lr 0.00372
Train [90][2440/3239]	Time 0.275 (0.553)	Data Time 0.004 (0.021)	Loss 2.4052 (2.4274)	Entropy 0.57408 (0.57094)	Top-1 acc 63.672 (65.504)	Top-5 acc 84.766 (84.957)	lr 0.00372
Train [90][2450/3239]	Time 0.281 (0.553)	Data Time 0.002 (0.021)	Loss 2.5190 (2.4274)	Entropy 0.57441 (0.57096)	Top-1 acc 63.672 (65.501)	Top-5 acc 82.031 (84.955)	lr 0.00372
Train [90][2460/3239]	Time 0.270 (0.553)	Data Time 0.003 (0.021)	Loss 2.4129 (2.4273)	Entropy 0.57469 (0.57097)	Top-1 acc 65.625 (65.503)	Top-5 acc 85.938 (84.956)	lr 0.00372
Train [90][2470/3239]	Time 0.282 (0.552)	Data Time 0.001 (0.020)	Loss 2.3325 (2.4273)	Entropy 0.57474 (0.57098)	Top-1 acc 70.312 (65.504)	Top-5 acc 83.594 (84.956)	lr 0.00372
Train [90][2480/3239]	Time 0.237 (0.552)	Data Time 0.001 (0.020)	Loss 2.6651 (2.4273)	Entropy 0.57465 (0.57100)	Top-1 acc 58.984 (65.506)	Top-5 acc 77.734 (84.954)	lr 0.00372
Train [90][2490/3239]	Time 0.285 (0.551)	Data Time 0.002 (0.020)	Loss 2.5835 (2.4272)	Entropy 0.57455 (0.57101)	Top-1 acc 59.375 (65.508)	Top-5 acc 80.469 (84.956)	lr 0.00371
Train [90][2500/3239]	Time 0.240 (0.551)	Data Time 0.001 (0.020)	Loss 2.3819 (2.4272)	Entropy 0.57459 (0.57103)	Top-1 acc 66.797 (65.504)	Top-5 acc 86.328 (84.956)	lr 0.00371
Train [90][2510/3239]	Time 0.373 (0.551)	Data Time 0.001 (0.020)	Loss 2.6001 (2.4274)	Entropy 0.57460 (0.57104)	Top-1 acc 62.891 (65.500)	Top-5 acc 80.078 (84.953)	lr 0.00371
Train [90][2520/3239]	Time 0.252 (0.550)	Data Time 0.001 (0.020)	Loss 2.5506 (2.4276)	Entropy 0.57462 (0.57106)	Top-1 acc 60.156 (65.499)	Top-5 acc 83.594 (84.951)	lr 0.00371
Train [90][2530/3239]	Time 0.391 (0.550)	Data Time 0.001 (0.020)	Loss 2.3606 (2.4275)	Entropy 0.57470 (0.57107)	Top-1 acc 65.234 (65.499)	Top-5 acc 87.891 (84.955)	lr 0.00371
Train [90][2540/3239]	Time 0.270 (0.550)	Data Time 0.001 (0.020)	Loss 2.2592 (2.4277)	Entropy 0.57459 (0.57109)	Top-1 acc 71.484 (65.492)	Top-5 acc 88.672 (84.953)	lr 0.00371
Train [90][2550/3239]	Time 0.253 (0.549)	Data Time 0.002 (0.020)	Loss 2.3739 (2.4279)	Entropy 0.57448 (0.57110)	Top-1 acc 64.453 (65.486)	Top-5 acc 85.156 (84.947)	lr 0.00371
Train [90][2560/3239]	Time 0.229 (0.549)	Data Time 0.001 (0.020)	Loss 2.4700 (2.4281)	Entropy 0.57444 (0.57111)	Top-1 acc 66.406 (65.481)	Top-5 acc 83.984 (84.942)	lr 0.00371
Train [90][2570/3239]	Time 0.257 (0.548)	Data Time 0.002 (0.020)	Loss 2.5215 (2.4281)	Entropy 0.57440 (0.57112)	Top-1 acc 63.281 (65.483)	Top-5 acc 83.594 (84.939)	lr 0.00371
Train [90][2580/3239]	Time 0.305 (0.548)	Data Time 0.001 (0.020)	Loss 2.5840 (2.4281)	Entropy 0.57458 (0.57114)	Top-1 acc 56.641 (65.478)	Top-5 acc 82.422 (84.938)	lr 0.00371
Train [90][2590/3239]	Time 0.250 (0.548)	Data Time 0.001 (0.020)	Loss 2.5880 (2.4280)	Entropy 0.57454 (0.57115)	Top-1 acc 64.453 (65.484)	Top-5 acc 82.812 (84.939)	lr 0.00371
Train [90][2600/3239]	Time 0.367 (0.547)	Data Time 0.001 (0.020)	Loss 2.4149 (2.4281)	Entropy 0.57443 (0.57116)	Top-1 acc 63.672 (65.485)	Top-5 acc 85.547 (84.936)	lr 0.00371
Train [90][2610/3239]	Time 0.243 (0.547)	Data Time 0.001 (0.019)	Loss 2.3543 (2.4284)	Entropy 0.57449 (0.57118)	Top-1 acc 68.359 (65.479)	Top-5 acc 87.109 (84.931)	lr 0.00371
Train [90][2620/3239]	Time 0.293 (0.547)	Data Time 0.001 (0.019)	Loss 2.2867 (2.4282)	Entropy 0.57419 (0.57119)	Top-1 acc 68.750 (65.483)	Top-5 acc 88.281 (84.934)	lr 0.00371
Train [90][2630/3239]	Time 0.264 (0.546)	Data Time 0.001 (0.019)	Loss 2.1597 (2.4281)	Entropy 0.57426 (0.57120)	Top-1 acc 72.656 (65.487)	Top-5 acc 89.062 (84.937)	lr 0.00370
Train [90][2640/3239]	Time 0.263 (0.546)	Data Time 0.001 (0.019)	Loss 2.4257 (2.4281)	Entropy 0.57425 (0.57121)	Top-1 acc 64.453 (65.483)	Top-5 acc 84.766 (84.935)	lr 0.00370
Train [90][2650/3239]	Time 0.233 (0.545)	Data Time 0.001 (0.019)	Loss 2.3247 (2.4281)	Entropy 0.57408 (0.57122)	Top-1 acc 70.312 (65.485)	Top-5 acc 83.984 (84.935)	lr 0.00370
Train [90][2660/3239]	Time 0.242 (0.545)	Data Time 0.002 (0.019)	Loss 2.4525 (2.4281)	Entropy 0.57416 (0.57123)	Top-1 acc 64.062 (65.486)	Top-5 acc 82.812 (84.932)	lr 0.00370
Train [90][2670/3239]	Time 0.257 (0.544)	Data Time 0.001 (0.019)	Loss 2.5447 (2.4282)	Entropy 0.57379 (0.57124)	Top-1 acc 62.109 (65.484)	Top-5 acc 83.984 (84.932)	lr 0.00370
Train [90][2680/3239]	Time 0.250 (0.544)	Data Time 0.001 (0.019)	Loss 2.4905 (2.4283)	Entropy 0.57357 (0.57125)	Top-1 acc 61.328 (65.484)	Top-5 acc 85.156 (84.931)	lr 0.00370
Train [90][2690/3239]	Time 0.367 (0.544)	Data Time 0.002 (0.019)	Loss 2.3758 (2.4283)	Entropy 0.57339 (0.57126)	Top-1 acc 67.188 (65.484)	Top-5 acc 84.766 (84.930)	lr 0.00370
Train [90][2700/3239]	Time 0.225 (0.544)	Data Time 0.001 (0.019)	Loss 2.6622 (2.4283)	Entropy 0.57360 (0.57127)	Top-1 acc 63.672 (65.481)	Top-5 acc 76.562 (84.929)	lr 0.00370
Train [90][2710/3239]	Time 0.308 (0.543)	Data Time 0.001 (0.019)	Loss 2.5921 (2.4283)	Entropy 0.57367 (0.57128)	Top-1 acc 62.500 (65.479)	Top-5 acc 79.688 (84.930)	lr 0.00370
Train [90][2720/3239]	Time 0.255 (0.543)	Data Time 0.001 (0.019)	Loss 2.2258 (2.4283)	Entropy 0.57340 (0.57129)	Top-1 acc 70.703 (65.479)	Top-5 acc 90.625 (84.931)	lr 0.00370
Train [90][2730/3239]	Time 0.243 (0.543)	Data Time 0.002 (0.019)	Loss 2.3126 (2.4282)	Entropy 0.57314 (0.57129)	Top-1 acc 68.750 (65.481)	Top-5 acc 85.938 (84.932)	lr 0.00370
Train [90][2740/3239]	Time 0.295 (0.543)	Data Time 0.001 (0.019)	Loss 2.3286 (2.4283)	Entropy 0.57310 (0.57130)	Top-1 acc 68.750 (65.477)	Top-5 acc 85.938 (84.929)	lr 0.00370
Train [90][2750/3239]	Time 0.246 (0.542)	Data Time 0.002 (0.019)	Loss 2.3564 (2.4282)	Entropy 0.57330 (0.57131)	Top-1 acc 67.578 (65.477)	Top-5 acc 86.328 (84.932)	lr 0.00370
Train [90][2760/3239]	Time 0.354 (0.542)	Data Time 0.001 (0.018)	Loss 2.4752 (2.4286)	Entropy 0.57324 (0.57131)	Top-1 acc 63.281 (65.471)	Top-5 acc 85.547 (84.928)	lr 0.00370
Train [90][2770/3239]	Time 0.260 (0.541)	Data Time 0.001 (0.018)	Loss 2.5281 (2.4287)	Entropy 0.57332 (0.57132)	Top-1 acc 62.500 (65.468)	Top-5 acc 82.422 (84.925)	lr 0.00369
Train [90][2780/3239]	Time 0.236 (0.541)	Data Time 0.001 (0.018)	Loss 2.6106 (2.4286)	Entropy 0.57339 (0.57133)	Top-1 acc 62.500 (65.474)	Top-5 acc 80.859 (84.927)	lr 0.00369
Train [90][2790/3239]	Time 0.238 (0.541)	Data Time 0.001 (0.018)	Loss 2.6165 (2.4288)	Entropy 0.57342 (0.57134)	Top-1 acc 63.672 (65.469)	Top-5 acc 82.031 (84.925)	lr 0.00369
Train [90][2800/3239]	Time 0.307 (0.540)	Data Time 0.001 (0.018)	Loss 2.3263 (2.4287)	Entropy 0.57326 (0.57134)	Top-1 acc 69.922 (65.470)	Top-5 acc 88.281 (84.928)	lr 0.00369
Train [90][2810/3239]	Time 0.294 (0.540)	Data Time 0.001 (0.018)	Loss 2.4110 (2.4289)	Entropy 0.57333 (0.57135)	Top-1 acc 67.188 (65.467)	Top-5 acc 84.766 (84.922)	lr 0.00369
Train [90][2820/3239]	Time 0.241 (0.540)	Data Time 0.002 (0.018)	Loss 2.3256 (2.4288)	Entropy 0.57330 (0.57136)	Top-1 acc 71.875 (65.472)	Top-5 acc 85.156 (84.922)	lr 0.00369
Train [90][2830/3239]	Time 0.297 (0.539)	Data Time 0.001 (0.018)	Loss 2.3508 (2.4290)	Entropy 0.57348 (0.57136)	Top-1 acc 69.922 (65.470)	Top-5 acc 87.891 (84.920)	lr 0.00369
Train [90][2840/3239]	Time 0.245 (0.539)	Data Time 0.001 (0.018)	Loss 2.2402 (2.4287)	Entropy 0.57388 (0.57137)	Top-1 acc 66.797 (65.476)	Top-5 acc 90.234 (84.926)	lr 0.00369
Train [90][2850/3239]	Time 0.307 (0.538)	Data Time 0.001 (0.018)	Loss 2.4022 (2.4287)	Entropy 0.57437 (0.57138)	Top-1 acc 62.500 (65.473)	Top-5 acc 86.719 (84.928)	lr 0.00369
Train [90][2860/3239]	Time 0.264 (0.538)	Data Time 0.001 (0.018)	Loss 2.5745 (2.4287)	Entropy 0.57431 (0.57139)	Top-1 acc 62.109 (65.474)	Top-5 acc 83.984 (84.929)	lr 0.00369
Train [90][2870/3239]	Time 0.288 (0.538)	Data Time 0.003 (0.018)	Loss 2.5511 (2.4287)	Entropy 0.57438 (0.57140)	Top-1 acc 62.500 (65.475)	Top-5 acc 83.203 (84.930)	lr 0.00369
Train [90][2880/3239]	Time 0.236 (0.537)	Data Time 0.002 (0.018)	Loss 2.3345 (2.4288)	Entropy 0.57389 (0.57141)	Top-1 acc 67.188 (65.472)	Top-5 acc 84.766 (84.930)	lr 0.00369
Train [90][2890/3239]	Time 0.241 (0.537)	Data Time 0.001 (0.018)	Loss 2.6378 (2.4288)	Entropy 0.57397 (0.57142)	Top-1 acc 64.844 (65.472)	Top-5 acc 80.859 (84.928)	lr 0.00369
Train [90][2900/3239]	Time 0.268 (0.537)	Data Time 0.001 (0.018)	Loss 2.2745 (2.4287)	Entropy 0.57394 (0.57143)	Top-1 acc 73.047 (65.478)	Top-5 acc 87.500 (84.932)	lr 0.00369
Train [90][2910/3239]	Time 0.252 (0.536)	Data Time 0.001 (0.018)	Loss 2.3154 (2.4286)	Entropy 0.57384 (0.57144)	Top-1 acc 71.094 (65.481)	Top-5 acc 87.500 (84.933)	lr 0.00368
Train [90][2920/3239]	Time 0.344 (0.536)	Data Time 0.001 (0.018)	Loss 2.4149 (2.4287)	Entropy 0.57385 (0.57145)	Top-1 acc 66.797 (65.477)	Top-5 acc 86.719 (84.933)	lr 0.00368
Train [90][2930/3239]	Time 0.248 (0.536)	Data Time 0.002 (0.018)	Loss 2.4501 (2.4290)	Entropy 0.57412 (0.57146)	Top-1 acc 64.453 (65.473)	Top-5 acc 84.766 (84.930)	lr 0.00368
Train [90][2940/3239]	Time 0.262 (0.535)	Data Time 0.002 (0.017)	Loss 2.5294 (2.4289)	Entropy 0.57405 (0.57146)	Top-1 acc 62.109 (65.473)	Top-5 acc 85.156 (84.931)	lr 0.00368
Train [90][2950/3239]	Time 0.269 (0.535)	Data Time 0.001 (0.017)	Loss 2.5461 (2.4291)	Entropy 0.57365 (0.57147)	Top-1 acc 64.844 (65.468)	Top-5 acc 83.203 (84.927)	lr 0.00368
Train [90][2960/3239]	Time 0.277 (0.535)	Data Time 0.001 (0.017)	Loss 2.3387 (2.4291)	Entropy 0.57384 (0.57148)	Top-1 acc 67.969 (65.470)	Top-5 acc 88.281 (84.926)	lr 0.00368
Train [90][2970/3239]	Time 0.245 (0.534)	Data Time 0.007 (0.017)	Loss 2.4769 (2.4292)	Entropy 0.57389 (0.57149)	Top-1 acc 65.625 (65.468)	Top-5 acc 83.203 (84.926)	lr 0.00368
Train [90][2980/3239]	Time 0.231 (0.534)	Data Time 0.001 (0.017)	Loss 2.4782 (2.4290)	Entropy 0.57394 (0.57150)	Top-1 acc 64.062 (65.472)	Top-5 acc 83.984 (84.929)	lr 0.00368
Train [90][2990/3239]	Time 0.376 (0.534)	Data Time 0.023 (0.017)	Loss 2.5008 (2.4290)	Entropy 0.57399 (0.57150)	Top-1 acc 64.453 (65.473)	Top-5 acc 82.031 (84.928)	lr 0.00368
Train [90][3000/3239]	Time 0.277 (0.533)	Data Time 0.001 (0.017)	Loss 2.6237 (2.4289)	Entropy 0.57406 (0.57151)	Top-1 acc 61.328 (65.471)	Top-5 acc 81.250 (84.928)	lr 0.00368
Train [90][3010/3239]	Time 0.271 (0.533)	Data Time 0.001 (0.017)	Loss 2.6485 (2.4290)	Entropy 0.57383 (0.57152)	Top-1 acc 58.984 (65.468)	Top-5 acc 82.031 (84.927)	lr 0.00368
Train [90][3020/3239]	Time 0.237 (0.533)	Data Time 0.001 (0.017)	Loss 2.7769 (2.4290)	Entropy 0.57386 (0.57153)	Top-1 acc 58.594 (65.468)	Top-5 acc 79.297 (84.926)	lr 0.00368
Train [90][3030/3239]	Time 0.292 (0.532)	Data Time 0.001 (0.017)	Loss 2.3873 (2.4290)	Entropy 0.57400 (0.57154)	Top-1 acc 67.578 (65.467)	Top-5 acc 85.938 (84.928)	lr 0.00368
Train [90][3040/3239]	Time 0.237 (0.532)	Data Time 0.001 (0.017)	Loss 2.5879 (2.4288)	Entropy 0.57376 (0.57154)	Top-1 acc 64.062 (65.473)	Top-5 acc 83.984 (84.931)	lr 0.00368
Train [90][3050/3239]	Time 0.262 (0.532)	Data Time 0.001 (0.017)	Loss 2.4465 (2.4288)	Entropy 0.57392 (0.57155)	Top-1 acc 66.406 (65.472)	Top-5 acc 83.594 (84.930)	lr 0.00367
Train [90][3060/3239]	Time 0.248 (0.532)	Data Time 0.001 (0.017)	Loss 2.3085 (2.4289)	Entropy 0.57392 (0.57156)	Top-1 acc 68.359 (65.470)	Top-5 acc 86.719 (84.931)	lr 0.00367
Train [90][3070/3239]	Time 0.275 (0.531)	Data Time 0.001 (0.017)	Loss 2.2683 (2.4290)	Entropy 0.57384 (0.57157)	Top-1 acc 67.188 (65.466)	Top-5 acc 89.062 (84.929)	lr 0.00367
Train [90][3080/3239]	Time 0.378 (0.531)	Data Time 0.001 (0.017)	Loss 2.2670 (2.4288)	Entropy 0.57377 (0.57157)	Top-1 acc 67.969 (65.470)	Top-5 acc 87.109 (84.933)	lr 0.00367
Train [90][3090/3239]	Time 0.350 (0.548)	Data Time 0.002 (0.017)	Loss 2.2453 (2.4288)	Entropy 0.57389 (0.57158)	Top-1 acc 68.359 (65.467)	Top-5 acc 88.672 (84.932)	lr 0.00367
Train [90][3100/3239]	Time 0.249 (0.548)	Data Time 0.002 (0.017)	Loss 2.2858 (2.4286)	Entropy 0.57379 (0.57159)	Top-1 acc 65.625 (65.467)	Top-5 acc 89.062 (84.935)	lr 0.00367
Train [90][3110/3239]	Time 0.242 (0.547)	Data Time 0.002 (0.017)	Loss 2.3669 (2.4284)	Entropy 0.57400 (0.57160)	Top-1 acc 69.531 (65.474)	Top-5 acc 85.547 (84.937)	lr 0.00367
Train [90][3120/3239]	Time 0.288 (0.547)	Data Time 0.003 (0.017)	Loss 2.4727 (2.4286)	Entropy 0.57387 (0.57160)	Top-1 acc 65.234 (65.468)	Top-5 acc 83.594 (84.933)	lr 0.00367
Train [90][3130/3239]	Time 0.236 (0.547)	Data Time 0.001 (0.017)	Loss 2.4718 (2.4287)	Entropy 0.57398 (0.57161)	Top-1 acc 64.453 (65.465)	Top-5 acc 83.594 (84.930)	lr 0.00367
Train [90][3140/3239]	Time 0.250 (0.546)	Data Time 0.002 (0.016)	Loss 2.3483 (2.4286)	Entropy 0.57398 (0.57162)	Top-1 acc 64.844 (65.465)	Top-5 acc 85.938 (84.933)	lr 0.00367
Train [90][3150/3239]	Time 0.341 (0.546)	Data Time 0.001 (0.016)	Loss 2.3229 (2.4286)	Entropy 0.57387 (0.57163)	Top-1 acc 67.969 (65.464)	Top-5 acc 86.328 (84.932)	lr 0.00367
Train [90][3160/3239]	Time 0.252 (0.546)	Data Time 0.001 (0.016)	Loss 2.5199 (2.4286)	Entropy 0.57355 (0.57163)	Top-1 acc 62.109 (65.460)	Top-5 acc 83.594 (84.932)	lr 0.00367
Train [90][3170/3239]	Time 0.344 (0.546)	Data Time 0.001 (0.016)	Loss 2.2792 (2.4287)	Entropy 0.57345 (0.57164)	Top-1 acc 71.484 (65.456)	Top-5 acc 87.109 (84.931)	lr 0.00367
Train [90][3180/3239]	Time 0.221 (0.545)	Data Time 0.000 (0.016)	Loss 2.5212 (2.4287)	Entropy 0.57343 (0.57164)	Top-1 acc 64.062 (65.458)	Top-5 acc 85.156 (84.931)	lr 0.00367
Train [90][3190/3239]	Time 0.240 (0.545)	Data Time 0.000 (0.016)	Loss 2.6950 (2.4290)	Entropy 0.57326 (0.57165)	Top-1 acc 58.984 (65.452)	Top-5 acc 78.516 (84.924)	lr 0.00366
Train [90][3200/3239]	Time 0.243 (0.545)	Data Time 0.000 (0.016)	Loss 2.5836 (2.4292)	Entropy 0.57332 (0.57165)	Top-1 acc 58.984 (65.446)	Top-5 acc 82.031 (84.922)	lr 0.00366
Train [90][3210/3239]	Time 0.244 (0.544)	Data Time 0.000 (0.016)	Loss 2.3683 (2.4294)	Entropy 0.57348 (0.57166)	Top-1 acc 66.797 (65.441)	Top-5 acc 85.156 (84.918)	lr 0.00366
Train [90][3220/3239]	Time 0.244 (0.544)	Data Time 0.000 (0.016)	Loss 2.5519 (2.4293)	Entropy 0.57352 (0.57167)	Top-1 acc 65.234 (65.442)	Top-5 acc 81.641 (84.922)	lr 0.00366
Train [90][3230/3239]	Time 0.216 (0.543)	Data Time 0.000 (0.016)	Loss 2.7946 (2.4295)	Entropy 0.57334 (0.57167)	Top-1 acc 58.203 (65.438)	Top-5 acc 80.469 (84.919)	lr 0.00366
Train [90][3239/3239]	Time 0.835 (0.543)	Data Time 0.000 (0.016)	Loss 2.4411 (2.4293)	Entropy 0.57326 (0.57168)	Top-1 acc 60.494 (65.442)	Top-5 acc 83.951 (84.923)	lr 0.00366
==========Valid [90/120]	loss 1.240	top-1 acc 71.368 (71.623)	top-5 acc 89.709	Train top-1 65.442	top-5 84.923	Entropy 0.57326	Latency-None: 0.000ms	Flops: 539.00M
Train [91][0/3239]	Time 43.353 (43.353)	Data Time 41.539 (41.539)	Loss 2.3772 (2.3772)	Entropy 0.57340 (0.57340)	Top-1 acc 66.406 (66.406)	Top-5 acc 85.156 (85.156)	lr 0.00366
Train [91][10/3239]	Time 0.236 (4.487)	Data Time 0.001 (3.778)	Loss 2.4779 (2.3797)	Entropy 0.57322 (0.57337)	Top-1 acc 62.109 (66.761)	Top-5 acc 85.156 (85.795)	lr 0.00366
Train [91][20/3239]	Time 0.244 (2.563)	Data Time 0.001 (1.980)	Loss 2.4319 (2.3924)	Entropy 0.57341 (0.57334)	Top-1 acc 61.328 (66.090)	Top-5 acc 86.328 (85.863)	lr 0.00366
Train [91][30/3239]	Time 0.245 (1.881)	Data Time 0.001 (1.342)	Loss 2.4614 (2.4304)	Entropy 0.57324 (0.57335)	Top-1 acc 63.672 (65.386)	Top-5 acc 85.547 (85.156)	lr 0.00366
Train [91][40/3239]	Time 0.236 (1.530)	Data Time 0.001 (1.015)	Loss 2.5156 (2.4195)	Entropy 0.57318 (0.57332)	Top-1 acc 62.500 (65.730)	Top-5 acc 83.984 (85.213)	lr 0.00366
Train [91][50/3239]	Time 0.256 (1.325)	Data Time 0.001 (0.816)	Loss 2.3603 (2.4290)	Entropy 0.57309 (0.57328)	Top-1 acc 67.969 (65.564)	Top-5 acc 86.719 (85.049)	lr 0.00366
Train [91][60/3239]	Time 0.278 (1.193)	Data Time 0.002 (0.683)	Loss 2.1673 (2.4201)	Entropy 0.57327 (0.57325)	Top-1 acc 70.703 (65.676)	Top-5 acc 91.797 (85.195)	lr 0.00366
Train [91][70/3239]	Time 0.293 (1.087)	Data Time 0.001 (0.587)	Loss 2.5254 (2.4225)	Entropy 0.57293 (0.57323)	Top-1 acc 63.281 (65.735)	Top-5 acc 81.641 (85.123)	lr 0.00366
Train [91][80/3239]	Time 0.242 (1.009)	Data Time 0.001 (0.515)	Loss 2.4381 (2.4146)	Entropy 0.57239 (0.57318)	Top-1 acc 65.625 (65.929)	Top-5 acc 86.719 (85.277)	lr 0.00366
Train [91][90/3239]	Time 0.235 (0.947)	Data Time 0.001 (0.458)	Loss 2.3180 (2.4119)	Entropy 0.57210 (0.57308)	Top-1 acc 66.406 (65.973)	Top-5 acc 87.500 (85.315)	lr 0.00365
Train [91][100/3239]	Time 0.231 (0.896)	Data Time 0.001 (0.413)	Loss 2.6621 (2.4101)	Entropy 0.57201 (0.57298)	Top-1 acc 59.766 (65.907)	Top-5 acc 80.078 (85.377)	lr 0.00365
Train [91][110/3239]	Time 0.232 (0.854)	Data Time 0.001 (0.376)	Loss 2.4204 (2.4085)	Entropy 0.57170 (0.57288)	Top-1 acc 66.016 (65.945)	Top-5 acc 84.766 (85.367)	lr 0.00365
Train [91][120/3239]	Time 0.235 (0.822)	Data Time 0.001 (0.345)	Loss 2.3635 (2.4139)	Entropy 0.57168 (0.57278)	Top-1 acc 68.359 (65.809)	Top-5 acc 85.547 (85.237)	lr 0.00365
Train [91][130/3239]	Time 0.237 (0.793)	Data Time 0.001 (0.319)	Loss 2.3905 (2.4101)	Entropy 0.57185 (0.57271)	Top-1 acc 62.891 (65.843)	Top-5 acc 86.719 (85.314)	lr 0.00365
Train [91][140/3239]	Time 0.348 (0.768)	Data Time 0.001 (0.296)	Loss 2.4605 (2.4122)	Entropy 0.57183 (0.57265)	Top-1 acc 65.234 (65.813)	Top-5 acc 85.156 (85.292)	lr 0.00365
Train [91][150/3239]	Time 0.233 (0.746)	Data Time 0.001 (0.277)	Loss 2.4231 (2.4105)	Entropy 0.57208 (0.57260)	Top-1 acc 67.188 (65.891)	Top-5 acc 85.547 (85.273)	lr 0.00365
Train [91][160/3239]	Time 0.244 (0.731)	Data Time 0.001 (0.260)	Loss 2.5645 (2.4151)	Entropy 0.57167 (0.57255)	Top-1 acc 62.109 (65.846)	Top-5 acc 81.250 (85.231)	lr 0.00365
Train [91][170/3239]	Time 0.241 (0.714)	Data Time 0.001 (0.245)	Loss 2.4004 (2.4169)	Entropy 0.57157 (0.57250)	Top-1 acc 66.797 (65.849)	Top-5 acc 85.938 (85.218)	lr 0.00365
Train [91][180/3239]	Time 0.284 (0.699)	Data Time 0.001 (0.231)	Loss 2.3473 (2.4156)	Entropy 0.57161 (0.57244)	Top-1 acc 65.625 (65.890)	Top-5 acc 83.984 (85.240)	lr 0.00365
Train [91][190/3239]	Time 0.236 (0.685)	Data Time 0.001 (0.219)	Loss 2.1629 (2.4150)	Entropy 0.57167 (0.57240)	Top-1 acc 71.484 (65.881)	Top-5 acc 89.453 (85.218)	lr 0.00365
Train [91][200/3239]	Time 0.231 (0.672)	Data Time 0.001 (0.209)	Loss 2.3475 (2.4127)	Entropy 0.57198 (0.57238)	Top-1 acc 69.531 (65.942)	Top-5 acc 86.719 (85.257)	lr 0.00365
Train [91][210/3239]	Time 0.362 (0.660)	Data Time 0.001 (0.199)	Loss 2.3041 (2.4119)	Entropy 0.57204 (0.57236)	Top-1 acc 64.844 (65.969)	Top-5 acc 85.938 (85.251)	lr 0.00365
Train [91][220/3239]	Time 0.234 (0.650)	Data Time 0.001 (0.190)	Loss 2.4013 (2.4108)	Entropy 0.57218 (0.57234)	Top-1 acc 66.406 (66.009)	Top-5 acc 83.984 (85.264)	lr 0.00365
Train [91][230/3239]	Time 0.231 (0.640)	Data Time 0.001 (0.182)	Loss 2.4768 (2.4101)	Entropy 0.57228 (0.57234)	Top-1 acc 67.188 (66.012)	Top-5 acc 82.031 (85.298)	lr 0.00364
Train [91][240/3239]	Time 0.244 (0.631)	Data Time 0.001 (0.174)	Loss 2.1441 (2.4100)	Entropy 0.57274 (0.57234)	Top-1 acc 70.312 (65.988)	Top-5 acc 91.016 (85.263)	lr 0.00364
Train [91][250/3239]	Time 0.261 (0.623)	Data Time 0.001 (0.167)	Loss 2.2611 (2.4110)	Entropy 0.57265 (0.57235)	Top-1 acc 71.875 (65.978)	Top-5 acc 89.453 (85.262)	lr 0.00364
Train [91][260/3239]	Time 0.239 (0.615)	Data Time 0.001 (0.161)	Loss 2.1896 (2.4087)	Entropy 0.57260 (0.57237)	Top-1 acc 71.094 (66.013)	Top-5 acc 89.062 (85.321)	lr 0.00364
Train [91][270/3239]	Time 0.234 (0.608)	Data Time 0.001 (0.155)	Loss 2.5501 (2.4112)	Entropy 0.57256 (0.57237)	Top-1 acc 61.328 (65.912)	Top-5 acc 84.375 (85.276)	lr 0.00364
Train [91][280/3239]	Time 0.269 (0.602)	Data Time 0.002 (0.150)	Loss 2.4821 (2.4127)	Entropy 0.57225 (0.57237)	Top-1 acc 66.797 (65.879)	Top-5 acc 84.766 (85.263)	lr 0.00364
Train [91][290/3239]	Time 0.244 (0.596)	Data Time 0.001 (0.145)	Loss 2.3419 (2.4136)	Entropy 0.57198 (0.57236)	Top-1 acc 64.062 (65.806)	Top-5 acc 88.281 (85.274)	lr 0.00364
Train [91][300/3239]	Time 0.355 (0.590)	Data Time 0.001 (0.140)	Loss 2.8033 (2.4167)	Entropy 0.57212 (0.57235)	Top-1 acc 56.250 (65.705)	Top-5 acc 78.906 (85.239)	lr 0.00364
Train [91][310/3239]	Time 0.241 (0.585)	Data Time 0.001 (0.135)	Loss 2.4599 (2.4179)	Entropy 0.57217 (0.57235)	Top-1 acc 63.281 (65.689)	Top-5 acc 83.203 (85.196)	lr 0.00364
Train [91][320/3239]	Time 0.234 (0.580)	Data Time 0.002 (0.131)	Loss 2.5660 (2.4174)	Entropy 0.57236 (0.57235)	Top-1 acc 65.625 (65.696)	Top-5 acc 82.031 (85.210)	lr 0.00364
Train [91][330/3239]	Time 0.229 (0.576)	Data Time 0.001 (0.127)	Loss 2.4375 (2.4183)	Entropy 0.57198 (0.57234)	Top-1 acc 63.672 (65.682)	Top-5 acc 86.719 (85.186)	lr 0.00364
Train [91][340/3239]	Time 0.234 (0.572)	Data Time 0.001 (0.124)	Loss 2.5461 (2.4177)	Entropy 0.57168 (0.57233)	Top-1 acc 60.938 (65.698)	Top-5 acc 83.594 (85.191)	lr 0.00364
Train [91][350/3239]	Time 0.297 (0.568)	Data Time 0.002 (0.120)	Loss 2.2106 (2.4161)	Entropy 0.57172 (0.57231)	Top-1 acc 71.875 (65.736)	Top-5 acc 90.234 (85.222)	lr 0.00364
Train [91][360/3239]	Time 0.241 (0.565)	Data Time 0.001 (0.117)	Loss 2.3980 (2.4149)	Entropy 0.57175 (0.57229)	Top-1 acc 66.016 (65.767)	Top-5 acc 85.547 (85.237)	lr 0.00364
Train [91][370/3239]	Time 0.338 (0.562)	Data Time 0.001 (0.114)	Loss 2.4212 (2.4157)	Entropy 0.57187 (0.57228)	Top-1 acc 64.062 (65.742)	Top-5 acc 85.156 (85.231)	lr 0.00363
Train [91][380/3239]	Time 0.240 (0.559)	Data Time 0.001 (0.111)	Loss 2.2793 (2.4133)	Entropy 0.57157 (0.57226)	Top-1 acc 69.922 (65.785)	Top-5 acc 86.328 (85.277)	lr 0.00363
Train [91][390/3239]	Time 0.242 (0.555)	Data Time 0.001 (0.108)	Loss 2.4094 (2.4122)	Entropy 0.57148 (0.57225)	Top-1 acc 66.797 (65.804)	Top-5 acc 84.766 (85.288)	lr 0.00363
Train [91][400/3239]	Time 0.231 (0.552)	Data Time 0.001 (0.105)	Loss 2.3886 (2.4132)	Entropy 0.57143 (0.57223)	Top-1 acc 65.625 (65.784)	Top-5 acc 87.109 (85.277)	lr 0.00363
Train [91][410/3239]	Time 0.235 (0.549)	Data Time 0.001 (0.103)	Loss 2.4679 (2.4134)	Entropy 0.57168 (0.57221)	Top-1 acc 67.188 (65.789)	Top-5 acc 83.203 (85.279)	lr 0.00363
Train [91][420/3239]	Time 0.241 (0.546)	Data Time 0.001 (0.101)	Loss 2.5879 (2.4138)	Entropy 0.57215 (0.57220)	Top-1 acc 62.109 (65.803)	Top-5 acc 80.469 (85.278)	lr 0.00363
Train [91][430/3239]	Time 0.229 (0.543)	Data Time 0.001 (0.098)	Loss 2.4043 (2.4141)	Entropy 0.57214 (0.57220)	Top-1 acc 67.578 (65.823)	Top-5 acc 84.766 (85.263)	lr 0.00363
Train [91][440/3239]	Time 0.234 (0.540)	Data Time 0.001 (0.096)	Loss 2.6263 (2.4142)	Entropy 0.57197 (0.57220)	Top-1 acc 60.156 (65.807)	Top-5 acc 81.641 (85.263)	lr 0.00363
Train [91][450/3239]	Time 0.234 (0.537)	Data Time 0.001 (0.094)	Loss 2.4340 (2.4149)	Entropy 0.57138 (0.57219)	Top-1 acc 67.578 (65.794)	Top-5 acc 85.938 (85.254)	lr 0.00363
Train [91][460/3239]	Time 0.257 (0.535)	Data Time 0.001 (0.092)	Loss 2.4383 (2.4155)	Entropy 0.57172 (0.57217)	Top-1 acc 67.188 (65.769)	Top-5 acc 83.984 (85.233)	lr 0.00363
Train [91][470/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.090)	Loss 2.3976 (2.4157)	Entropy 0.57200 (0.57216)	Top-1 acc 66.406 (65.754)	Top-5 acc 83.984 (85.238)	lr 0.00363
Train [91][480/3239]	Time 0.246 (0.529)	Data Time 0.001 (0.088)	Loss 2.4876 (2.4150)	Entropy 0.57219 (0.57216)	Top-1 acc 64.062 (65.762)	Top-5 acc 82.422 (85.239)	lr 0.00363
Train [91][490/3239]	Time 0.241 (0.527)	Data Time 0.001 (0.086)	Loss 2.4208 (2.4154)	Entropy 0.57210 (0.57216)	Top-1 acc 68.359 (65.757)	Top-5 acc 85.938 (85.237)	lr 0.00363
Train [91][500/3239]	Time 0.441 (0.627)	Data Time 0.030 (0.085)	Loss 2.3710 (2.4166)	Entropy 0.57211 (0.57216)	Top-1 acc 67.188 (65.736)	Top-5 acc 87.109 (85.202)	lr 0.00363
Train [91][510/3239]	Time 0.249 (0.627)	Data Time 0.002 (0.083)	Loss 2.2179 (2.4151)	Entropy 0.57182 (0.57215)	Top-1 acc 71.484 (65.779)	Top-5 acc 89.062 (85.233)	lr 0.00362
Train [91][520/3239]	Time 0.245 (0.623)	Data Time 0.001 (0.082)	Loss 2.2014 (2.4147)	Entropy 0.57197 (0.57215)	Top-1 acc 71.875 (65.791)	Top-5 acc 90.234 (85.234)	lr 0.00362
Train [91][530/3239]	Time 0.355 (0.620)	Data Time 0.001 (0.080)	Loss 2.5599 (2.4146)	Entropy 0.57197 (0.57215)	Top-1 acc 60.156 (65.790)	Top-5 acc 81.641 (85.233)	lr 0.00362
Train [91][540/3239]	Time 0.242 (0.617)	Data Time 0.001 (0.079)	Loss 2.3188 (2.4150)	Entropy 0.57198 (0.57215)	Top-1 acc 67.188 (65.785)	Top-5 acc 86.719 (85.217)	lr 0.00362
Train [91][550/3239]	Time 0.276 (0.615)	Data Time 0.002 (0.077)	Loss 2.2931 (2.4146)	Entropy 0.57212 (0.57214)	Top-1 acc 69.922 (65.785)	Top-5 acc 87.891 (85.226)	lr 0.00362
Train [91][560/3239]	Time 0.235 (0.612)	Data Time 0.001 (0.076)	Loss 2.3665 (2.4149)	Entropy 0.57216 (0.57214)	Top-1 acc 70.312 (65.778)	Top-5 acc 88.281 (85.231)	lr 0.00362
Train [91][570/3239]	Time 0.241 (0.609)	Data Time 0.001 (0.075)	Loss 2.3281 (2.4148)	Entropy 0.57246 (0.57215)	Top-1 acc 67.188 (65.780)	Top-5 acc 87.500 (85.236)	lr 0.00362
Train [91][580/3239]	Time 0.258 (0.607)	Data Time 0.001 (0.073)	Loss 2.5384 (2.4153)	Entropy 0.57234 (0.57215)	Top-1 acc 65.625 (65.761)	Top-5 acc 82.812 (85.230)	lr 0.00362
Train [91][590/3239]	Time 0.233 (0.604)	Data Time 0.001 (0.072)	Loss 2.3492 (2.4147)	Entropy 0.57225 (0.57215)	Top-1 acc 68.359 (65.771)	Top-5 acc 88.281 (85.239)	lr 0.00362
Train [91][600/3239]	Time 0.243 (0.602)	Data Time 0.001 (0.071)	Loss 2.3979 (2.4151)	Entropy 0.57219 (0.57215)	Top-1 acc 65.234 (65.763)	Top-5 acc 85.547 (85.237)	lr 0.00362
Train [91][610/3239]	Time 0.248 (0.599)	Data Time 0.001 (0.070)	Loss 2.5750 (2.4153)	Entropy 0.57220 (0.57215)	Top-1 acc 66.016 (65.761)	Top-5 acc 82.031 (85.234)	lr 0.00362
Train [91][620/3239]	Time 0.298 (0.597)	Data Time 0.001 (0.069)	Loss 2.5231 (2.4146)	Entropy 0.57206 (0.57215)	Top-1 acc 63.281 (65.761)	Top-5 acc 84.766 (85.240)	lr 0.00362
Train [91][630/3239]	Time 0.262 (0.594)	Data Time 0.001 (0.068)	Loss 2.3890 (2.4142)	Entropy 0.57199 (0.57215)	Top-1 acc 62.500 (65.758)	Top-5 acc 85.547 (85.232)	lr 0.00362
Train [91][640/3239]	Time 0.243 (0.592)	Data Time 0.001 (0.067)	Loss 2.4594 (2.4141)	Entropy 0.57188 (0.57215)	Top-1 acc 66.016 (65.757)	Top-5 acc 83.984 (85.234)	lr 0.00362
Train [91][650/3239]	Time 0.235 (0.590)	Data Time 0.001 (0.066)	Loss 2.6122 (2.4137)	Entropy 0.57238 (0.57215)	Top-1 acc 56.641 (65.753)	Top-5 acc 82.031 (85.235)	lr 0.00361
Train [91][660/3239]	Time 0.235 (0.587)	Data Time 0.001 (0.065)	Loss 2.5061 (2.4140)	Entropy 0.57248 (0.57215)	Top-1 acc 64.062 (65.736)	Top-5 acc 82.031 (85.226)	lr 0.00361
Train [91][670/3239]	Time 0.243 (0.585)	Data Time 0.001 (0.064)	Loss 2.2666 (2.4142)	Entropy 0.57240 (0.57215)	Top-1 acc 68.750 (65.733)	Top-5 acc 87.891 (85.231)	lr 0.00361
Train [91][680/3239]	Time 0.236 (0.583)	Data Time 0.001 (0.063)	Loss 2.5828 (2.4149)	Entropy 0.57246 (0.57216)	Top-1 acc 63.281 (65.725)	Top-5 acc 82.812 (85.223)	lr 0.00361
Train [91][690/3239]	Time 0.356 (0.581)	Data Time 0.001 (0.062)	Loss 2.4808 (2.4143)	Entropy 0.57247 (0.57216)	Top-1 acc 67.578 (65.744)	Top-5 acc 82.422 (85.231)	lr 0.00361
Train [91][700/3239]	Time 0.247 (0.579)	Data Time 0.001 (0.061)	Loss 2.3805 (2.4139)	Entropy 0.57240 (0.57216)	Top-1 acc 67.969 (65.751)	Top-5 acc 86.719 (85.241)	lr 0.00361
Train [91][710/3239]	Time 0.222 (0.577)	Data Time 0.001 (0.060)	Loss 2.5284 (2.4144)	Entropy 0.57235 (0.57217)	Top-1 acc 60.938 (65.733)	Top-5 acc 83.984 (85.238)	lr 0.00361
Train [91][720/3239]	Time 0.234 (0.575)	Data Time 0.001 (0.059)	Loss 2.6945 (2.4148)	Entropy 0.57253 (0.57217)	Top-1 acc 58.594 (65.721)	Top-5 acc 82.031 (85.235)	lr 0.00361
Train [91][730/3239]	Time 0.244 (0.573)	Data Time 0.001 (0.059)	Loss 2.6144 (2.4148)	Entropy 0.57274 (0.57218)	Top-1 acc 58.984 (65.731)	Top-5 acc 82.422 (85.231)	lr 0.00361
Train [91][740/3239]	Time 0.251 (0.572)	Data Time 0.001 (0.058)	Loss 2.3116 (2.4142)	Entropy 0.57232 (0.57218)	Top-1 acc 67.578 (65.753)	Top-5 acc 85.547 (85.240)	lr 0.00361
Train [91][750/3239]	Time 0.240 (0.570)	Data Time 0.001 (0.057)	Loss 2.3823 (2.4139)	Entropy 0.57247 (0.57218)	Top-1 acc 66.016 (65.760)	Top-5 acc 84.766 (85.244)	lr 0.00361
Train [91][760/3239]	Time 0.360 (0.568)	Data Time 0.001 (0.056)	Loss 2.4521 (2.4139)	Entropy 0.57199 (0.57219)	Top-1 acc 66.406 (65.759)	Top-5 acc 83.594 (85.242)	lr 0.00361
Train [91][770/3239]	Time 0.234 (0.567)	Data Time 0.001 (0.056)	Loss 2.5337 (2.4142)	Entropy 0.57224 (0.57218)	Top-1 acc 62.891 (65.753)	Top-5 acc 83.203 (85.228)	lr 0.00361
Train [91][780/3239]	Time 0.234 (0.565)	Data Time 0.001 (0.055)	Loss 2.2263 (2.4143)	Entropy 0.57198 (0.57219)	Top-1 acc 69.141 (65.741)	Top-5 acc 89.453 (85.227)	lr 0.00361
Train [91][790/3239]	Time 0.241 (0.563)	Data Time 0.001 (0.054)	Loss 2.5132 (2.4140)	Entropy 0.57217 (0.57218)	Top-1 acc 65.234 (65.745)	Top-5 acc 82.812 (85.234)	lr 0.00360
Train [91][800/3239]	Time 0.246 (0.562)	Data Time 0.001 (0.054)	Loss 2.4133 (2.4142)	Entropy 0.57223 (0.57218)	Top-1 acc 64.844 (65.734)	Top-5 acc 85.938 (85.224)	lr 0.00360
Train [91][810/3239]	Time 0.261 (0.561)	Data Time 0.004 (0.053)	Loss 2.4621 (2.4139)	Entropy 0.57214 (0.57218)	Top-1 acc 66.016 (65.747)	Top-5 acc 83.984 (85.240)	lr 0.00360
Train [91][820/3239]	Time 0.235 (0.559)	Data Time 0.001 (0.052)	Loss 2.4238 (2.4139)	Entropy 0.57232 (0.57218)	Top-1 acc 65.234 (65.753)	Top-5 acc 85.547 (85.241)	lr 0.00360
Train [91][830/3239]	Time 0.237 (0.558)	Data Time 0.002 (0.052)	Loss 2.3626 (2.4147)	Entropy 0.57238 (0.57219)	Top-1 acc 68.750 (65.732)	Top-5 acc 86.328 (85.223)	lr 0.00360
Train [91][840/3239]	Time 0.257 (0.557)	Data Time 0.002 (0.051)	Loss 2.3312 (2.4145)	Entropy 0.57245 (0.57219)	Top-1 acc 71.094 (65.760)	Top-5 acc 87.500 (85.224)	lr 0.00360
Train [91][850/3239]	Time 0.358 (0.556)	Data Time 0.001 (0.051)	Loss 2.3019 (2.4137)	Entropy 0.57257 (0.57219)	Top-1 acc 67.969 (65.791)	Top-5 acc 85.547 (85.241)	lr 0.00360
Train [91][860/3239]	Time 0.234 (0.555)	Data Time 0.001 (0.050)	Loss 2.4392 (2.4142)	Entropy 0.57285 (0.57220)	Top-1 acc 63.281 (65.777)	Top-5 acc 85.938 (85.227)	lr 0.00360
Train [91][870/3239]	Time 0.260 (0.554)	Data Time 0.001 (0.050)	Loss 2.4615 (2.4136)	Entropy 0.57255 (0.57220)	Top-1 acc 64.844 (65.794)	Top-5 acc 83.984 (85.237)	lr 0.00360
Train [91][880/3239]	Time 0.239 (0.552)	Data Time 0.001 (0.049)	Loss 2.3803 (2.4141)	Entropy 0.57243 (0.57221)	Top-1 acc 68.359 (65.784)	Top-5 acc 85.156 (85.230)	lr 0.00360
Train [91][890/3239]	Time 0.245 (0.551)	Data Time 0.001 (0.048)	Loss 2.2604 (2.4143)	Entropy 0.57261 (0.57221)	Top-1 acc 72.266 (65.787)	Top-5 acc 89.844 (85.228)	lr 0.00360
Train [91][900/3239]	Time 0.240 (0.550)	Data Time 0.001 (0.048)	Loss 2.3799 (2.4145)	Entropy 0.57200 (0.57221)	Top-1 acc 66.016 (65.779)	Top-5 acc 87.109 (85.226)	lr 0.00360
Train [91][910/3239]	Time 0.246 (0.548)	Data Time 0.002 (0.047)	Loss 2.5942 (2.4155)	Entropy 0.57241 (0.57221)	Top-1 acc 62.109 (65.754)	Top-5 acc 83.594 (85.215)	lr 0.00360
Train [91][920/3239]	Time 0.370 (0.547)	Data Time 0.001 (0.047)	Loss 2.5963 (2.4151)	Entropy 0.57230 (0.57221)	Top-1 acc 61.328 (65.758)	Top-5 acc 82.422 (85.226)	lr 0.00360
Train [91][930/3239]	Time 0.247 (0.546)	Data Time 0.001 (0.046)	Loss 2.3776 (2.4156)	Entropy 0.57230 (0.57221)	Top-1 acc 67.188 (65.761)	Top-5 acc 86.328 (85.226)	lr 0.00359
Train [91][940/3239]	Time 0.236 (0.545)	Data Time 0.001 (0.046)	Loss 2.4177 (2.4157)	Entropy 0.57256 (0.57221)	Top-1 acc 66.797 (65.755)	Top-5 acc 84.766 (85.221)	lr 0.00359
Train [91][950/3239]	Time 0.236 (0.544)	Data Time 0.001 (0.045)	Loss 2.3382 (2.4156)	Entropy 0.57271 (0.57222)	Top-1 acc 67.969 (65.755)	Top-5 acc 86.719 (85.231)	lr 0.00359
Train [91][960/3239]	Time 0.239 (0.542)	Data Time 0.001 (0.045)	Loss 2.3578 (2.4158)	Entropy 0.57241 (0.57222)	Top-1 acc 63.672 (65.736)	Top-5 acc 88.281 (85.231)	lr 0.00359
Train [91][970/3239]	Time 0.239 (0.541)	Data Time 0.002 (0.045)	Loss 2.4783 (2.4165)	Entropy 0.57233 (0.57222)	Top-1 acc 65.625 (65.730)	Top-5 acc 85.938 (85.226)	lr 0.00359
Train [91][980/3239]	Time 0.232 (0.540)	Data Time 0.001 (0.044)	Loss 2.4121 (2.4159)	Entropy 0.57243 (0.57223)	Top-1 acc 66.016 (65.752)	Top-5 acc 87.891 (85.233)	lr 0.00359
Train [91][990/3239]	Time 0.239 (0.539)	Data Time 0.001 (0.044)	Loss 2.3431 (2.4157)	Entropy 0.57239 (0.57223)	Top-1 acc 68.750 (65.760)	Top-5 acc 83.984 (85.236)	lr 0.00359
Train [91][1000/3239]	Time 0.247 (0.538)	Data Time 0.001 (0.043)	Loss 2.3082 (2.4153)	Entropy 0.57224 (0.57223)	Top-1 acc 69.141 (65.773)	Top-5 acc 85.156 (85.252)	lr 0.00359
Train [91][1010/3239]	Time 0.291 (0.537)	Data Time 0.001 (0.043)	Loss 2.4776 (2.4156)	Entropy 0.57218 (0.57223)	Top-1 acc 66.406 (65.764)	Top-5 acc 83.203 (85.247)	lr 0.00359
Train [91][1020/3239]	Time 0.240 (0.536)	Data Time 0.001 (0.042)	Loss 2.4714 (2.4155)	Entropy 0.57219 (0.57223)	Top-1 acc 64.062 (65.769)	Top-5 acc 86.719 (85.250)	lr 0.00359
Train [91][1030/3239]	Time 0.269 (0.535)	Data Time 0.002 (0.042)	Loss 2.2970 (2.4154)	Entropy 0.57247 (0.57223)	Top-1 acc 68.750 (65.763)	Top-5 acc 87.891 (85.253)	lr 0.00359
Train [91][1040/3239]	Time 0.243 (0.534)	Data Time 0.002 (0.042)	Loss 2.5531 (2.4152)	Entropy 0.57248 (0.57223)	Top-1 acc 61.719 (65.768)	Top-5 acc 84.766 (85.260)	lr 0.00359
Train [91][1050/3239]	Time 0.238 (0.533)	Data Time 0.001 (0.041)	Loss 2.2657 (2.4146)	Entropy 0.57247 (0.57223)	Top-1 acc 69.141 (65.780)	Top-5 acc 87.109 (85.270)	lr 0.00359
Train [91][1060/3239]	Time 0.227 (0.532)	Data Time 0.001 (0.041)	Loss 2.4653 (2.4146)	Entropy 0.57255 (0.57224)	Top-1 acc 63.281 (65.774)	Top-5 acc 83.594 (85.264)	lr 0.00359
Train [91][1070/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.041)	Loss 2.2132 (2.4145)	Entropy 0.57241 (0.57224)	Top-1 acc 68.359 (65.769)	Top-5 acc 88.281 (85.257)	lr 0.00359
Train [91][1080/3239]	Time 0.346 (0.530)	Data Time 0.001 (0.040)	Loss 2.5068 (2.4146)	Entropy 0.57225 (0.57224)	Top-1 acc 66.016 (65.776)	Top-5 acc 82.812 (85.257)	lr 0.00358
Train [91][1090/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.040)	Loss 2.3850 (2.4145)	Entropy 0.57222 (0.57224)	Top-1 acc 66.016 (65.774)	Top-5 acc 85.938 (85.263)	lr 0.00358
Train [91][1100/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.039)	Loss 2.4039 (2.4141)	Entropy 0.57231 (0.57224)	Top-1 acc 63.672 (65.778)	Top-5 acc 86.328 (85.269)	lr 0.00358
Train [91][1110/3239]	Time 0.246 (0.527)	Data Time 0.001 (0.039)	Loss 2.4631 (2.4140)	Entropy 0.57219 (0.57224)	Top-1 acc 59.375 (65.776)	Top-5 acc 84.375 (85.266)	lr 0.00358
Train [91][1120/3239]	Time 0.302 (0.527)	Data Time 0.002 (0.039)	Loss 2.3226 (2.4138)	Entropy 0.57222 (0.57224)	Top-1 acc 67.188 (65.776)	Top-5 acc 86.328 (85.269)	lr 0.00358
Train [91][1130/3239]	Time 0.240 (0.527)	Data Time 0.001 (0.038)	Loss 2.4948 (2.4138)	Entropy 0.57251 (0.57224)	Top-1 acc 62.500 (65.779)	Top-5 acc 83.984 (85.271)	lr 0.00358
Train [91][1140/3239]	Time 0.240 (0.526)	Data Time 0.001 (0.038)	Loss 2.3587 (2.4139)	Entropy 0.57224 (0.57224)	Top-1 acc 70.312 (65.781)	Top-5 acc 85.547 (85.270)	lr 0.00358
Train [91][1150/3239]	Time 0.346 (0.526)	Data Time 0.001 (0.038)	Loss 2.4569 (2.4138)	Entropy 0.57247 (0.57224)	Top-1 acc 66.797 (65.791)	Top-5 acc 83.203 (85.272)	lr 0.00358
Train [91][1160/3239]	Time 0.247 (0.572)	Data Time 0.002 (0.038)	Loss 2.1963 (2.4131)	Entropy 0.57256 (0.57225)	Top-1 acc 74.219 (65.815)	Top-5 acc 86.719 (85.279)	lr 0.00358
Train [91][1170/3239]	Time 0.357 (0.571)	Data Time 0.004 (0.037)	Loss 2.4049 (2.4129)	Entropy 0.57269 (0.57225)	Top-1 acc 65.234 (65.818)	Top-5 acc 83.203 (85.284)	lr 0.00358
Train [91][1180/3239]	Time 0.239 (0.569)	Data Time 0.002 (0.037)	Loss 2.3315 (2.4127)	Entropy 0.57262 (0.57225)	Top-1 acc 68.750 (65.816)	Top-5 acc 86.328 (85.288)	lr 0.00358
Train [91][1190/3239]	Time 0.253 (0.568)	Data Time 0.002 (0.037)	Loss 2.5119 (2.4123)	Entropy 0.57291 (0.57225)	Top-1 acc 64.062 (65.826)	Top-5 acc 83.594 (85.298)	lr 0.00358
Train [91][1200/3239]	Time 0.234 (0.567)	Data Time 0.001 (0.036)	Loss 2.4894 (2.4125)	Entropy 0.57327 (0.57226)	Top-1 acc 65.234 (65.824)	Top-5 acc 84.766 (85.291)	lr 0.00358
Train [91][1210/3239]	Time 0.266 (0.566)	Data Time 0.001 (0.036)	Loss 2.7285 (2.4130)	Entropy 0.57281 (0.57227)	Top-1 acc 59.766 (65.813)	Top-5 acc 78.125 (85.280)	lr 0.00358
Train [91][1220/3239]	Time 0.238 (0.565)	Data Time 0.001 (0.036)	Loss 2.5103 (2.4125)	Entropy 0.57260 (0.57227)	Top-1 acc 64.062 (65.828)	Top-5 acc 82.812 (85.285)	lr 0.00357
Train [91][1230/3239]	Time 0.283 (0.564)	Data Time 0.001 (0.036)	Loss 2.4712 (2.4135)	Entropy 0.57263 (0.57227)	Top-1 acc 61.328 (65.808)	Top-5 acc 82.812 (85.264)	lr 0.00357
Train [91][1240/3239]	Time 0.376 (0.563)	Data Time 0.001 (0.035)	Loss 2.3807 (2.4138)	Entropy 0.57256 (0.57228)	Top-1 acc 66.797 (65.806)	Top-5 acc 85.156 (85.263)	lr 0.00357
Train [91][1250/3239]	Time 0.244 (0.562)	Data Time 0.001 (0.035)	Loss 2.5366 (2.4140)	Entropy 0.57242 (0.57228)	Top-1 acc 62.500 (65.802)	Top-5 acc 83.984 (85.257)	lr 0.00357
Train [91][1260/3239]	Time 0.248 (0.561)	Data Time 0.001 (0.035)	Loss 2.6029 (2.4146)	Entropy 0.57221 (0.57228)	Top-1 acc 60.156 (65.789)	Top-5 acc 81.250 (85.245)	lr 0.00357
Train [91][1270/3239]	Time 0.232 (0.560)	Data Time 0.001 (0.034)	Loss 2.4186 (2.4150)	Entropy 0.57222 (0.57228)	Top-1 acc 65.234 (65.785)	Top-5 acc 87.109 (85.239)	lr 0.00357
Train [91][1280/3239]	Time 0.244 (0.559)	Data Time 0.002 (0.034)	Loss 2.3585 (2.4146)	Entropy 0.57235 (0.57228)	Top-1 acc 66.406 (65.797)	Top-5 acc 85.938 (85.244)	lr 0.00357
Train [91][1290/3239]	Time 0.235 (0.559)	Data Time 0.001 (0.034)	Loss 2.3516 (2.4148)	Entropy 0.57222 (0.57228)	Top-1 acc 66.016 (65.792)	Top-5 acc 87.109 (85.242)	lr 0.00357
Train [91][1300/3239]	Time 0.246 (0.558)	Data Time 0.001 (0.034)	Loss 2.7012 (2.4151)	Entropy 0.57258 (0.57228)	Top-1 acc 62.109 (65.784)	Top-5 acc 76.172 (85.237)	lr 0.00357
Train [91][1310/3239]	Time 0.288 (0.557)	Data Time 0.002 (0.033)	Loss 2.3824 (2.4149)	Entropy 0.57251 (0.57228)	Top-1 acc 65.625 (65.796)	Top-5 acc 85.547 (85.240)	lr 0.00357
Train [91][1320/3239]	Time 0.377 (0.557)	Data Time 0.002 (0.033)	Loss 2.3009 (2.4149)	Entropy 0.57285 (0.57229)	Top-1 acc 66.016 (65.794)	Top-5 acc 88.672 (85.240)	lr 0.00357
Train [91][1330/3239]	Time 0.242 (0.557)	Data Time 0.001 (0.033)	Loss 2.3374 (2.4151)	Entropy 0.57294 (0.57229)	Top-1 acc 68.750 (65.784)	Top-5 acc 85.156 (85.238)	lr 0.00357
Train [91][1340/3239]	Time 0.235 (0.556)	Data Time 0.001 (0.033)	Loss 2.3728 (2.4153)	Entropy 0.57306 (0.57230)	Top-1 acc 67.578 (65.775)	Top-5 acc 84.375 (85.230)	lr 0.00357
Train [91][1350/3239]	Time 0.230 (0.555)	Data Time 0.001 (0.033)	Loss 2.5353 (2.4157)	Entropy 0.57295 (0.57230)	Top-1 acc 64.453 (65.767)	Top-5 acc 84.766 (85.220)	lr 0.00357
Train [91][1360/3239]	Time 0.244 (0.554)	Data Time 0.002 (0.032)	Loss 2.4396 (2.4155)	Entropy 0.57287 (0.57231)	Top-1 acc 67.969 (65.777)	Top-5 acc 84.766 (85.221)	lr 0.00356
Train [91][1370/3239]	Time 0.239 (0.553)	Data Time 0.001 (0.032)	Loss 2.2691 (2.4157)	Entropy 0.57230 (0.57231)	Top-1 acc 67.578 (65.773)	Top-5 acc 86.719 (85.216)	lr 0.00356
Train [91][1380/3239]	Time 0.228 (0.552)	Data Time 0.001 (0.032)	Loss 2.5274 (2.4158)	Entropy 0.57234 (0.57231)	Top-1 acc 58.203 (65.766)	Top-5 acc 83.984 (85.217)	lr 0.00356
Train [91][1390/3239]	Time 0.235 (0.551)	Data Time 0.002 (0.032)	Loss 2.3120 (2.4156)	Entropy 0.57251 (0.57231)	Top-1 acc 69.531 (65.769)	Top-5 acc 87.891 (85.223)	lr 0.00356
Train [91][1400/3239]	Time 0.347 (0.551)	Data Time 0.001 (0.031)	Loss 2.5347 (2.4158)	Entropy 0.57272 (0.57231)	Top-1 acc 58.594 (65.761)	Top-5 acc 83.203 (85.220)	lr 0.00356
Train [91][1410/3239]	Time 0.228 (0.550)	Data Time 0.001 (0.031)	Loss 2.3353 (2.4158)	Entropy 0.57247 (0.57231)	Top-1 acc 71.484 (65.756)	Top-5 acc 86.719 (85.217)	lr 0.00356
Train [91][1420/3239]	Time 0.235 (0.549)	Data Time 0.001 (0.031)	Loss 2.4138 (2.4158)	Entropy 0.57262 (0.57232)	Top-1 acc 63.281 (65.759)	Top-5 acc 83.594 (85.216)	lr 0.00356
Train [91][1430/3239]	Time 0.251 (0.549)	Data Time 0.001 (0.031)	Loss 2.2088 (2.4156)	Entropy 0.57259 (0.57232)	Top-1 acc 72.656 (65.767)	Top-5 acc 87.500 (85.224)	lr 0.00356
Train [91][1440/3239]	Time 0.240 (0.548)	Data Time 0.001 (0.031)	Loss 2.1741 (2.4154)	Entropy 0.57263 (0.57232)	Top-1 acc 72.266 (65.772)	Top-5 acc 89.844 (85.231)	lr 0.00356
Train [91][1450/3239]	Time 0.235 (0.548)	Data Time 0.001 (0.030)	Loss 2.3734 (2.4154)	Entropy 0.57223 (0.57232)	Top-1 acc 66.797 (65.774)	Top-5 acc 83.594 (85.230)	lr 0.00356
Train [91][1460/3239]	Time 0.238 (0.547)	Data Time 0.001 (0.030)	Loss 2.4008 (2.4151)	Entropy 0.57223 (0.57232)	Top-1 acc 63.672 (65.781)	Top-5 acc 85.547 (85.235)	lr 0.00356
Train [91][1470/3239]	Time 0.328 (0.546)	Data Time 0.001 (0.030)	Loss 2.5904 (2.4156)	Entropy 0.57171 (0.57232)	Top-1 acc 62.109 (65.771)	Top-5 acc 82.031 (85.225)	lr 0.00356
Train [91][1480/3239]	Time 0.230 (0.545)	Data Time 0.001 (0.030)	Loss 2.4318 (2.4158)	Entropy 0.57149 (0.57232)	Top-1 acc 64.453 (65.765)	Top-5 acc 83.984 (85.220)	lr 0.00356
Train [91][1490/3239]	Time 0.243 (0.544)	Data Time 0.001 (0.030)	Loss 2.3415 (2.4155)	Entropy 0.57173 (0.57231)	Top-1 acc 67.969 (65.775)	Top-5 acc 87.500 (85.226)	lr 0.00356
Train [91][1500/3239]	Time 0.240 (0.544)	Data Time 0.001 (0.029)	Loss 2.4496 (2.4155)	Entropy 0.57151 (0.57231)	Top-1 acc 62.109 (65.775)	Top-5 acc 84.375 (85.226)	lr 0.00355
Train [91][1510/3239]	Time 0.224 (0.543)	Data Time 0.001 (0.029)	Loss 2.3481 (2.4154)	Entropy 0.57178 (0.57230)	Top-1 acc 69.922 (65.790)	Top-5 acc 87.109 (85.231)	lr 0.00355
Train [91][1520/3239]	Time 0.230 (0.542)	Data Time 0.001 (0.029)	Loss 2.4341 (2.4153)	Entropy 0.57188 (0.57230)	Top-1 acc 66.406 (65.793)	Top-5 acc 83.984 (85.231)	lr 0.00355
Train [91][1530/3239]	Time 0.243 (0.542)	Data Time 0.001 (0.029)	Loss 2.4933 (2.4149)	Entropy 0.57167 (0.57229)	Top-1 acc 63.281 (65.802)	Top-5 acc 85.938 (85.235)	lr 0.00355
Train [91][1540/3239]	Time 0.226 (0.541)	Data Time 0.001 (0.029)	Loss 2.4773 (2.4150)	Entropy 0.57158 (0.57229)	Top-1 acc 67.188 (65.807)	Top-5 acc 83.984 (85.230)	lr 0.00355
Train [91][1550/3239]	Time 0.237 (0.540)	Data Time 0.001 (0.029)	Loss 2.4583 (2.4156)	Entropy 0.57133 (0.57228)	Top-1 acc 65.625 (65.794)	Top-5 acc 84.766 (85.223)	lr 0.00355
Train [91][1560/3239]	Time 0.337 (0.539)	Data Time 0.001 (0.028)	Loss 2.3976 (2.4159)	Entropy 0.57111 (0.57228)	Top-1 acc 66.016 (65.782)	Top-5 acc 86.719 (85.220)	lr 0.00355
Train [91][1570/3239]	Time 0.230 (0.539)	Data Time 0.001 (0.028)	Loss 2.3807 (2.4160)	Entropy 0.57079 (0.57227)	Top-1 acc 67.188 (65.779)	Top-5 acc 88.672 (85.220)	lr 0.00355
Train [91][1580/3239]	Time 0.229 (0.538)	Data Time 0.003 (0.028)	Loss 2.4548 (2.4162)	Entropy 0.57083 (0.57226)	Top-1 acc 64.453 (65.772)	Top-5 acc 84.766 (85.218)	lr 0.00355
Train [91][1590/3239]	Time 0.233 (0.537)	Data Time 0.001 (0.028)	Loss 2.7758 (2.4166)	Entropy 0.57121 (0.57225)	Top-1 acc 58.203 (65.768)	Top-5 acc 80.078 (85.213)	lr 0.00355
Train [91][1600/3239]	Time 0.268 (0.537)	Data Time 0.001 (0.028)	Loss 2.5165 (2.4166)	Entropy 0.57127 (0.57225)	Top-1 acc 66.016 (65.772)	Top-5 acc 83.984 (85.213)	lr 0.00355
Train [91][1610/3239]	Time 0.231 (0.536)	Data Time 0.001 (0.028)	Loss 2.4560 (2.4167)	Entropy 0.57107 (0.57224)	Top-1 acc 66.406 (65.770)	Top-5 acc 83.594 (85.212)	lr 0.00355
Train [91][1620/3239]	Time 0.235 (0.535)	Data Time 0.001 (0.027)	Loss 2.5581 (2.4170)	Entropy 0.57061 (0.57223)	Top-1 acc 62.891 (65.759)	Top-5 acc 82.812 (85.207)	lr 0.00355
Train [91][1630/3239]	Time 0.358 (0.535)	Data Time 0.001 (0.027)	Loss 2.5165 (2.4168)	Entropy 0.57079 (0.57222)	Top-1 acc 61.328 (65.765)	Top-5 acc 83.594 (85.208)	lr 0.00355
Train [91][1640/3239]	Time 0.228 (0.534)	Data Time 0.001 (0.027)	Loss 2.3669 (2.4169)	Entropy 0.57076 (0.57221)	Top-1 acc 65.625 (65.760)	Top-5 acc 87.891 (85.208)	lr 0.00354
Train [91][1650/3239]	Time 0.234 (0.533)	Data Time 0.001 (0.027)	Loss 2.3610 (2.4174)	Entropy 0.57085 (0.57221)	Top-1 acc 66.797 (65.741)	Top-5 acc 86.719 (85.202)	lr 0.00354
Train [91][1660/3239]	Time 0.224 (0.533)	Data Time 0.001 (0.027)	Loss 2.5050 (2.4179)	Entropy 0.57125 (0.57220)	Top-1 acc 63.281 (65.731)	Top-5 acc 82.812 (85.194)	lr 0.00354
Train [91][1670/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.027)	Loss 2.2271 (2.4175)	Entropy 0.57139 (0.57219)	Top-1 acc 69.531 (65.734)	Top-5 acc 88.672 (85.199)	lr 0.00354
Train [91][1680/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.026)	Loss 2.2757 (2.4176)	Entropy 0.57126 (0.57219)	Top-1 acc 69.922 (65.737)	Top-5 acc 88.281 (85.196)	lr 0.00354
Train [91][1690/3239]	Time 0.228 (0.531)	Data Time 0.001 (0.026)	Loss 2.4156 (2.4176)	Entropy 0.57130 (0.57218)	Top-1 acc 66.797 (65.740)	Top-5 acc 86.328 (85.193)	lr 0.00354
Train [91][1700/3239]	Time 0.241 (0.530)	Data Time 0.001 (0.026)	Loss 2.3372 (2.4175)	Entropy 0.57157 (0.57218)	Top-1 acc 67.578 (65.742)	Top-5 acc 83.984 (85.195)	lr 0.00354
Train [91][1710/3239]	Time 0.268 (0.530)	Data Time 0.001 (0.026)	Loss 2.3890 (2.4175)	Entropy 0.57176 (0.57217)	Top-1 acc 66.406 (65.739)	Top-5 acc 84.766 (85.197)	lr 0.00354
Train [91][1720/3239]	Time 0.256 (0.529)	Data Time 0.001 (0.026)	Loss 2.3911 (2.4176)	Entropy 0.57189 (0.57217)	Top-1 acc 66.016 (65.736)	Top-5 acc 84.375 (85.198)	lr 0.00354
Train [91][1730/3239]	Time 0.277 (0.529)	Data Time 0.001 (0.026)	Loss 2.4896 (2.4181)	Entropy 0.57203 (0.57217)	Top-1 acc 64.453 (65.719)	Top-5 acc 83.203 (85.190)	lr 0.00354
Train [91][1740/3239]	Time 0.246 (0.529)	Data Time 0.001 (0.026)	Loss 2.4322 (2.4187)	Entropy 0.57216 (0.57217)	Top-1 acc 64.453 (65.702)	Top-5 acc 85.547 (85.185)	lr 0.00354
Train [91][1750/3239]	Time 0.228 (0.528)	Data Time 0.002 (0.025)	Loss 2.2298 (2.4187)	Entropy 0.57244 (0.57217)	Top-1 acc 69.922 (65.700)	Top-5 acc 89.062 (85.183)	lr 0.00354
Train [91][1760/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.025)	Loss 2.3762 (2.4190)	Entropy 0.57252 (0.57217)	Top-1 acc 64.062 (65.694)	Top-5 acc 87.109 (85.176)	lr 0.00354
Train [91][1770/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.025)	Loss 2.3499 (2.4191)	Entropy 0.57253 (0.57218)	Top-1 acc 68.750 (65.692)	Top-5 acc 86.719 (85.175)	lr 0.00354
Train [91][1780/3239]	Time 0.228 (0.526)	Data Time 0.001 (0.025)	Loss 2.4278 (2.4192)	Entropy 0.57265 (0.57218)	Top-1 acc 65.625 (65.685)	Top-5 acc 83.594 (85.171)	lr 0.00353
Train [91][1790/3239]	Time 0.336 (0.526)	Data Time 0.001 (0.025)	Loss 2.2512 (2.4194)	Entropy 0.57279 (0.57218)	Top-1 acc 69.531 (65.681)	Top-5 acc 88.281 (85.167)	lr 0.00353
Train [91][1800/3239]	Time 0.222 (0.525)	Data Time 0.001 (0.025)	Loss 2.3425 (2.4195)	Entropy 0.57280 (0.57218)	Top-1 acc 67.969 (65.676)	Top-5 acc 86.719 (85.168)	lr 0.00353
Train [91][1810/3239]	Time 0.330 (0.554)	Data Time 0.006 (0.025)	Loss 2.4462 (2.4197)	Entropy 0.57284 (0.57219)	Top-1 acc 64.453 (65.674)	Top-5 acc 85.938 (85.165)	lr 0.00353
Train [91][1820/3239]	Time 0.233 (0.553)	Data Time 0.002 (0.025)	Loss 2.5524 (2.4199)	Entropy 0.57245 (0.57219)	Top-1 acc 62.500 (65.668)	Top-5 acc 81.641 (85.160)	lr 0.00353
Train [91][1830/3239]	Time 0.255 (0.553)	Data Time 0.002 (0.024)	Loss 2.2785 (2.4200)	Entropy 0.57232 (0.57219)	Top-1 acc 70.312 (65.666)	Top-5 acc 86.328 (85.159)	lr 0.00353
Train [91][1840/3239]	Time 0.237 (0.552)	Data Time 0.002 (0.024)	Loss 2.6378 (2.4200)	Entropy 0.57221 (0.57219)	Top-1 acc 60.547 (65.659)	Top-5 acc 80.859 (85.159)	lr 0.00353
Train [91][1850/3239]	Time 0.235 (0.551)	Data Time 0.001 (0.024)	Loss 2.3498 (2.4198)	Entropy 0.57231 (0.57219)	Top-1 acc 65.625 (65.665)	Top-5 acc 86.328 (85.160)	lr 0.00353
Train [91][1860/3239]	Time 0.254 (0.551)	Data Time 0.002 (0.024)	Loss 2.3583 (2.4199)	Entropy 0.57222 (0.57219)	Top-1 acc 67.188 (65.666)	Top-5 acc 87.109 (85.160)	lr 0.00353
Train [91][1870/3239]	Time 0.230 (0.550)	Data Time 0.001 (0.024)	Loss 2.3720 (2.4197)	Entropy 0.57237 (0.57219)	Top-1 acc 65.625 (65.667)	Top-5 acc 87.109 (85.162)	lr 0.00353
Train [91][1880/3239]	Time 0.263 (0.550)	Data Time 0.001 (0.024)	Loss 2.4299 (2.4195)	Entropy 0.57253 (0.57220)	Top-1 acc 66.016 (65.674)	Top-5 acc 85.938 (85.167)	lr 0.00353
Train [91][1890/3239]	Time 0.233 (0.549)	Data Time 0.001 (0.024)	Loss 2.5210 (2.4197)	Entropy 0.57208 (0.57220)	Top-1 acc 65.625 (65.672)	Top-5 acc 81.641 (85.162)	lr 0.00353
Train [91][1900/3239]	Time 0.249 (0.548)	Data Time 0.001 (0.024)	Loss 2.4579 (2.4201)	Entropy 0.57218 (0.57220)	Top-1 acc 69.141 (65.658)	Top-5 acc 84.766 (85.155)	lr 0.00353
Train [91][1910/3239]	Time 0.271 (0.548)	Data Time 0.001 (0.023)	Loss 2.3278 (2.4203)	Entropy 0.57238 (0.57220)	Top-1 acc 66.016 (65.648)	Top-5 acc 88.281 (85.155)	lr 0.00353
Train [91][1920/3239]	Time 0.268 (0.548)	Data Time 0.002 (0.023)	Loss 2.5383 (2.4206)	Entropy 0.57203 (0.57220)	Top-1 acc 62.891 (65.638)	Top-5 acc 83.594 (85.153)	lr 0.00353
Train [91][1930/3239]	Time 0.236 (0.547)	Data Time 0.001 (0.023)	Loss 2.3320 (2.4203)	Entropy 0.57203 (0.57220)	Top-1 acc 67.188 (65.646)	Top-5 acc 85.938 (85.158)	lr 0.00352
Train [91][1940/3239]	Time 0.254 (0.547)	Data Time 0.001 (0.023)	Loss 2.2617 (2.4201)	Entropy 0.57208 (0.57219)	Top-1 acc 67.969 (65.651)	Top-5 acc 89.062 (85.162)	lr 0.00352
Train [91][1950/3239]	Time 0.327 (0.546)	Data Time 0.001 (0.023)	Loss 2.4140 (2.4202)	Entropy 0.57211 (0.57219)	Top-1 acc 66.016 (65.645)	Top-5 acc 85.547 (85.164)	lr 0.00352
Train [91][1960/3239]	Time 0.238 (0.546)	Data Time 0.002 (0.023)	Loss 2.3701 (2.4199)	Entropy 0.57214 (0.57219)	Top-1 acc 65.625 (65.653)	Top-5 acc 86.328 (85.170)	lr 0.00352
Train [91][1970/3239]	Time 0.250 (0.545)	Data Time 0.001 (0.023)	Loss 2.4597 (2.4197)	Entropy 0.57221 (0.57219)	Top-1 acc 66.016 (65.652)	Top-5 acc 83.203 (85.173)	lr 0.00352
Train [91][1980/3239]	Time 0.235 (0.545)	Data Time 0.002 (0.023)	Loss 2.4924 (2.4199)	Entropy 0.57227 (0.57219)	Top-1 acc 62.500 (65.649)	Top-5 acc 84.766 (85.172)	lr 0.00352
Train [91][1990/3239]	Time 0.252 (0.544)	Data Time 0.002 (0.023)	Loss 2.3580 (2.4201)	Entropy 0.57235 (0.57219)	Top-1 acc 65.234 (65.638)	Top-5 acc 87.109 (85.165)	lr 0.00352
Train [91][2000/3239]	Time 0.228 (0.544)	Data Time 0.001 (0.023)	Loss 2.4318 (2.4198)	Entropy 0.57259 (0.57220)	Top-1 acc 66.406 (65.641)	Top-5 acc 86.719 (85.170)	lr 0.00352
Train [91][2010/3239]	Time 0.236 (0.543)	Data Time 0.001 (0.022)	Loss 2.5165 (2.4203)	Entropy 0.57287 (0.57220)	Top-1 acc 62.891 (65.632)	Top-5 acc 83.594 (85.163)	lr 0.00352
Train [91][2020/3239]	Time 0.325 (0.542)	Data Time 0.001 (0.022)	Loss 2.4886 (2.4203)	Entropy 0.57281 (0.57220)	Top-1 acc 61.328 (65.630)	Top-5 acc 84.375 (85.160)	lr 0.00352
Train [91][2030/3239]	Time 0.233 (0.542)	Data Time 0.001 (0.022)	Loss 2.3677 (2.4204)	Entropy 0.57307 (0.57221)	Top-1 acc 64.453 (65.627)	Top-5 acc 86.328 (85.155)	lr 0.00352
Train [91][2040/3239]	Time 0.244 (0.541)	Data Time 0.001 (0.022)	Loss 2.4643 (2.4203)	Entropy 0.57359 (0.57221)	Top-1 acc 66.797 (65.637)	Top-5 acc 83.594 (85.155)	lr 0.00352
Train [91][2050/3239]	Time 0.234 (0.541)	Data Time 0.001 (0.022)	Loss 2.3447 (2.4204)	Entropy 0.57364 (0.57222)	Top-1 acc 69.141 (65.632)	Top-5 acc 87.891 (85.155)	lr 0.00352
Train [91][2060/3239]	Time 0.233 (0.540)	Data Time 0.001 (0.022)	Loss 2.4257 (2.4203)	Entropy 0.57340 (0.57222)	Top-1 acc 63.281 (65.631)	Top-5 acc 83.594 (85.156)	lr 0.00352
Train [91][2070/3239]	Time 0.228 (0.540)	Data Time 0.001 (0.022)	Loss 2.3443 (2.4202)	Entropy 0.57340 (0.57223)	Top-1 acc 69.141 (65.636)	Top-5 acc 88.672 (85.162)	lr 0.00351
Train [91][2080/3239]	Time 0.227 (0.539)	Data Time 0.001 (0.022)	Loss 2.5064 (2.4203)	Entropy 0.57355 (0.57224)	Top-1 acc 64.062 (65.634)	Top-5 acc 84.375 (85.162)	lr 0.00351
Train [91][2090/3239]	Time 0.247 (0.539)	Data Time 0.001 (0.022)	Loss 2.3787 (2.4203)	Entropy 0.57337 (0.57224)	Top-1 acc 67.969 (65.631)	Top-5 acc 86.719 (85.165)	lr 0.00351
Train [91][2100/3239]	Time 0.236 (0.538)	Data Time 0.001 (0.022)	Loss 2.2804 (2.4199)	Entropy 0.57313 (0.57225)	Top-1 acc 66.797 (65.644)	Top-5 acc 86.719 (85.170)	lr 0.00351
Train [91][2110/3239]	Time 0.331 (0.538)	Data Time 0.001 (0.021)	Loss 2.5015 (2.4200)	Entropy 0.57326 (0.57225)	Top-1 acc 62.891 (65.645)	Top-5 acc 83.984 (85.169)	lr 0.00351
Train [91][2120/3239]	Time 0.234 (0.537)	Data Time 0.001 (0.021)	Loss 2.4691 (2.4201)	Entropy 0.57348 (0.57226)	Top-1 acc 64.844 (65.644)	Top-5 acc 82.422 (85.166)	lr 0.00351
Train [91][2130/3239]	Time 0.229 (0.537)	Data Time 0.001 (0.021)	Loss 2.2840 (2.4200)	Entropy 0.57361 (0.57226)	Top-1 acc 70.312 (65.643)	Top-5 acc 88.281 (85.165)	lr 0.00351
Train [91][2140/3239]	Time 0.256 (0.537)	Data Time 0.001 (0.021)	Loss 2.3354 (2.4202)	Entropy 0.57347 (0.57227)	Top-1 acc 67.578 (65.639)	Top-5 acc 86.328 (85.165)	lr 0.00351
Train [91][2150/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.021)	Loss 2.3407 (2.4199)	Entropy 0.57347 (0.57227)	Top-1 acc 63.672 (65.640)	Top-5 acc 85.938 (85.171)	lr 0.00351
Train [91][2160/3239]	Time 0.257 (0.536)	Data Time 0.002 (0.021)	Loss 2.4801 (2.4198)	Entropy 0.57304 (0.57228)	Top-1 acc 62.109 (65.644)	Top-5 acc 84.766 (85.171)	lr 0.00351
Train [91][2170/3239]	Time 0.237 (0.535)	Data Time 0.001 (0.021)	Loss 2.3996 (2.4196)	Entropy 0.57298 (0.57228)	Top-1 acc 63.672 (65.645)	Top-5 acc 84.375 (85.175)	lr 0.00351
Train [91][2180/3239]	Time 0.332 (0.535)	Data Time 0.001 (0.021)	Loss 2.2878 (2.4196)	Entropy 0.57308 (0.57229)	Top-1 acc 65.625 (65.644)	Top-5 acc 87.500 (85.173)	lr 0.00351
Train [91][2190/3239]	Time 0.240 (0.534)	Data Time 0.001 (0.021)	Loss 2.2268 (2.4197)	Entropy 0.57328 (0.57229)	Top-1 acc 73.438 (65.646)	Top-5 acc 87.891 (85.171)	lr 0.00351
Train [91][2200/3239]	Time 0.243 (0.534)	Data Time 0.001 (0.021)	Loss 2.5393 (2.4197)	Entropy 0.57314 (0.57229)	Top-1 acc 66.016 (65.654)	Top-5 acc 81.641 (85.170)	lr 0.00351
Train [91][2210/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.021)	Loss 2.2362 (2.4197)	Entropy 0.57310 (0.57230)	Top-1 acc 68.359 (65.658)	Top-5 acc 90.234 (85.170)	lr 0.00350
Train [91][2220/3239]	Time 0.328 (0.533)	Data Time 0.002 (0.020)	Loss 2.4633 (2.4199)	Entropy 0.57335 (0.57230)	Top-1 acc 64.062 (65.652)	Top-5 acc 85.938 (85.169)	lr 0.00350
Train [91][2230/3239]	Time 0.233 (0.533)	Data Time 0.001 (0.020)	Loss 2.1634 (2.4197)	Entropy 0.57321 (0.57231)	Top-1 acc 70.703 (65.656)	Top-5 acc 88.672 (85.171)	lr 0.00350
Train [91][2240/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.020)	Loss 2.2967 (2.4195)	Entropy 0.57345 (0.57231)	Top-1 acc 68.750 (65.656)	Top-5 acc 87.500 (85.175)	lr 0.00350
Train [91][2250/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.020)	Loss 2.3328 (2.4196)	Entropy 0.57372 (0.57232)	Top-1 acc 69.531 (65.655)	Top-5 acc 86.328 (85.174)	lr 0.00350
Train [91][2260/3239]	Time 0.227 (0.531)	Data Time 0.001 (0.020)	Loss 2.4175 (2.4198)	Entropy 0.57406 (0.57232)	Top-1 acc 66.797 (65.650)	Top-5 acc 86.719 (85.167)	lr 0.00350
Train [91][2270/3239]	Time 0.358 (0.531)	Data Time 0.002 (0.020)	Loss 2.4501 (2.4200)	Entropy 0.57399 (0.57233)	Top-1 acc 65.625 (65.647)	Top-5 acc 84.766 (85.162)	lr 0.00350
Train [91][2280/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.020)	Loss 2.5256 (2.4200)	Entropy 0.57424 (0.57234)	Top-1 acc 62.500 (65.648)	Top-5 acc 82.031 (85.159)	lr 0.00350
Train [91][2290/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.020)	Loss 2.3011 (2.4200)	Entropy 0.57411 (0.57235)	Top-1 acc 69.531 (65.643)	Top-5 acc 86.719 (85.162)	lr 0.00350
Train [91][2300/3239]	Time 0.228 (0.530)	Data Time 0.001 (0.020)	Loss 2.1535 (2.4198)	Entropy 0.57407 (0.57235)	Top-1 acc 68.359 (65.647)	Top-5 acc 90.625 (85.167)	lr 0.00350
Train [91][2310/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.020)	Loss 2.4614 (2.4200)	Entropy 0.57405 (0.57236)	Top-1 acc 66.406 (65.642)	Top-5 acc 83.594 (85.163)	lr 0.00350
Train [91][2320/3239]	Time 0.236 (0.529)	Data Time 0.001 (0.020)	Loss 2.5875 (2.4201)	Entropy 0.57397 (0.57237)	Top-1 acc 63.281 (65.641)	Top-5 acc 82.812 (85.160)	lr 0.00350
Train [91][2330/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.020)	Loss 2.4407 (2.4201)	Entropy 0.57401 (0.57238)	Top-1 acc 68.750 (65.643)	Top-5 acc 83.984 (85.158)	lr 0.00350
Train [91][2340/3239]	Time 0.370 (0.528)	Data Time 0.001 (0.019)	Loss 2.3884 (2.4200)	Entropy 0.57408 (0.57238)	Top-1 acc 66.797 (65.647)	Top-5 acc 87.500 (85.158)	lr 0.00350
Train [91][2350/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.019)	Loss 2.3929 (2.4199)	Entropy 0.57393 (0.57239)	Top-1 acc 69.141 (65.649)	Top-5 acc 82.812 (85.158)	lr 0.00349
Train [91][2360/3239]	Time 0.260 (0.527)	Data Time 0.001 (0.019)	Loss 2.2986 (2.4198)	Entropy 0.57390 (0.57240)	Top-1 acc 64.453 (65.651)	Top-5 acc 89.453 (85.160)	lr 0.00349
Train [91][2370/3239]	Time 0.237 (0.527)	Data Time 0.001 (0.019)	Loss 2.3265 (2.4198)	Entropy 0.57409 (0.57240)	Top-1 acc 70.703 (65.647)	Top-5 acc 86.719 (85.164)	lr 0.00349
Train [91][2380/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.019)	Loss 2.3115 (2.4197)	Entropy 0.57429 (0.57241)	Top-1 acc 66.406 (65.649)	Top-5 acc 88.672 (85.166)	lr 0.00349
Train [91][2390/3239]	Time 0.274 (0.526)	Data Time 0.001 (0.019)	Loss 2.6043 (2.4197)	Entropy 0.57406 (0.57242)	Top-1 acc 61.719 (65.648)	Top-5 acc 81.250 (85.166)	lr 0.00349
Train [91][2400/3239]	Time 0.240 (0.525)	Data Time 0.001 (0.019)	Loss 2.5450 (2.4197)	Entropy 0.57408 (0.57243)	Top-1 acc 64.844 (65.646)	Top-5 acc 82.812 (85.167)	lr 0.00349
Train [91][2410/3239]	Time 0.222 (0.525)	Data Time 0.001 (0.019)	Loss 2.2325 (2.4195)	Entropy 0.57389 (0.57243)	Top-1 acc 68.359 (65.652)	Top-5 acc 89.844 (85.171)	lr 0.00349
Train [91][2420/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.019)	Loss 2.3903 (2.4196)	Entropy 0.57380 (0.57244)	Top-1 acc 66.406 (65.651)	Top-5 acc 85.156 (85.170)	lr 0.00349
Train [91][2430/3239]	Time 0.233 (0.524)	Data Time 0.001 (0.019)	Loss 2.5198 (2.4196)	Entropy 0.57328 (0.57244)	Top-1 acc 62.891 (65.651)	Top-5 acc 83.203 (85.171)	lr 0.00349
Train [91][2440/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.019)	Loss 2.4903 (2.4199)	Entropy 0.57311 (0.57245)	Top-1 acc 64.844 (65.646)	Top-5 acc 82.812 (85.166)	lr 0.00349
Train [91][2450/3239]	Time 0.239 (0.523)	Data Time 0.001 (0.019)	Loss 2.3148 (2.4200)	Entropy 0.57324 (0.57245)	Top-1 acc 67.578 (65.646)	Top-5 acc 86.719 (85.167)	lr 0.00349
Train [91][2460/3239]	Time 0.239 (0.523)	Data Time 0.001 (0.019)	Loss 2.3006 (2.4196)	Entropy 0.57317 (0.57245)	Top-1 acc 66.406 (65.658)	Top-5 acc 88.281 (85.167)	lr 0.00349
Train [91][2470/3239]	Time 0.264 (0.544)	Data Time 0.004 (0.019)	Loss 2.3223 (2.4195)	Entropy 0.57325 (0.57245)	Top-1 acc 68.750 (65.667)	Top-5 acc 87.500 (85.169)	lr 0.00349
Train [91][2480/3239]	Time 0.251 (0.544)	Data Time 0.002 (0.018)	Loss 2.5139 (2.4196)	Entropy 0.57356 (0.57246)	Top-1 acc 64.844 (65.664)	Top-5 acc 84.375 (85.168)	lr 0.00349
Train [91][2490/3239]	Time 0.250 (0.543)	Data Time 0.002 (0.018)	Loss 2.1722 (2.4194)	Entropy 0.57366 (0.57246)	Top-1 acc 70.703 (65.669)	Top-5 acc 88.672 (85.174)	lr 0.00349
Train [91][2500/3239]	Time 0.346 (0.543)	Data Time 0.002 (0.018)	Loss 2.3649 (2.4191)	Entropy 0.57373 (0.57247)	Top-1 acc 63.281 (65.676)	Top-5 acc 86.328 (85.178)	lr 0.00348
Train [91][2510/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.018)	Loss 2.5237 (2.4190)	Entropy 0.57397 (0.57247)	Top-1 acc 64.844 (65.681)	Top-5 acc 84.766 (85.181)	lr 0.00348
Train [91][2520/3239]	Time 0.235 (0.542)	Data Time 0.001 (0.018)	Loss 2.3606 (2.4187)	Entropy 0.57379 (0.57248)	Top-1 acc 63.281 (65.685)	Top-5 acc 87.109 (85.186)	lr 0.00348
Train [91][2530/3239]	Time 0.272 (0.542)	Data Time 0.001 (0.018)	Loss 2.5902 (2.4187)	Entropy 0.57369 (0.57248)	Top-1 acc 62.109 (65.685)	Top-5 acc 82.422 (85.185)	lr 0.00348
Train [91][2540/3239]	Time 0.241 (0.541)	Data Time 0.001 (0.018)	Loss 2.2452 (2.4186)	Entropy 0.57345 (0.57249)	Top-1 acc 71.094 (65.686)	Top-5 acc 87.500 (85.186)	lr 0.00348
Train [91][2550/3239]	Time 0.234 (0.541)	Data Time 0.001 (0.018)	Loss 2.4540 (2.4185)	Entropy 0.57363 (0.57249)	Top-1 acc 66.016 (65.687)	Top-5 acc 85.938 (85.185)	lr 0.00348
Train [91][2560/3239]	Time 0.241 (0.541)	Data Time 0.001 (0.018)	Loss 2.3780 (2.4185)	Entropy 0.57396 (0.57250)	Top-1 acc 65.625 (65.688)	Top-5 acc 84.375 (85.183)	lr 0.00348
Train [91][2570/3239]	Time 0.261 (0.540)	Data Time 0.001 (0.018)	Loss 2.3765 (2.4185)	Entropy 0.57434 (0.57250)	Top-1 acc 66.797 (65.685)	Top-5 acc 87.109 (85.182)	lr 0.00348
Train [91][2580/3239]	Time 0.242 (0.540)	Data Time 0.001 (0.018)	Loss 2.4168 (2.4187)	Entropy 0.57377 (0.57251)	Top-1 acc 65.234 (65.682)	Top-5 acc 85.938 (85.178)	lr 0.00348
Train [91][2590/3239]	Time 0.247 (0.539)	Data Time 0.002 (0.018)	Loss 2.5205 (2.4185)	Entropy 0.57293 (0.57251)	Top-1 acc 61.719 (65.686)	Top-5 acc 83.594 (85.181)	lr 0.00348
Train [91][2600/3239]	Time 0.240 (0.539)	Data Time 0.001 (0.018)	Loss 2.6507 (2.4188)	Entropy 0.57332 (0.57252)	Top-1 acc 58.203 (65.676)	Top-5 acc 79.688 (85.177)	lr 0.00348
Train [91][2610/3239]	Time 0.250 (0.539)	Data Time 0.001 (0.018)	Loss 2.6304 (2.4189)	Entropy 0.57268 (0.57252)	Top-1 acc 61.328 (65.673)	Top-5 acc 82.422 (85.174)	lr 0.00348
Train [91][2620/3239]	Time 0.236 (0.538)	Data Time 0.001 (0.018)	Loss 2.7444 (2.4194)	Entropy 0.57277 (0.57252)	Top-1 acc 57.031 (65.659)	Top-5 acc 79.688 (85.162)	lr 0.00348
Train [91][2630/3239]	Time 0.242 (0.538)	Data Time 0.001 (0.018)	Loss 2.3446 (2.4194)	Entropy 0.57266 (0.57252)	Top-1 acc 69.531 (65.660)	Top-5 acc 85.938 (85.163)	lr 0.00348
Train [91][2640/3239]	Time 0.263 (0.538)	Data Time 0.001 (0.017)	Loss 2.6660 (2.4193)	Entropy 0.57209 (0.57252)	Top-1 acc 64.062 (65.663)	Top-5 acc 78.125 (85.163)	lr 0.00347
Train [91][2650/3239]	Time 0.249 (0.537)	Data Time 0.001 (0.017)	Loss 2.4109 (2.4195)	Entropy 0.57192 (0.57252)	Top-1 acc 66.797 (65.660)	Top-5 acc 83.203 (85.160)	lr 0.00347
Train [91][2660/3239]	Time 0.388 (0.537)	Data Time 0.002 (0.017)	Loss 2.3680 (2.4197)	Entropy 0.57188 (0.57251)	Top-1 acc 64.844 (65.654)	Top-5 acc 89.844 (85.157)	lr 0.00347
Train [91][2670/3239]	Time 0.267 (0.537)	Data Time 0.002 (0.017)	Loss 2.2628 (2.4194)	Entropy 0.57201 (0.57251)	Top-1 acc 71.094 (65.659)	Top-5 acc 86.328 (85.160)	lr 0.00347
Train [91][2680/3239]	Time 0.331 (0.537)	Data Time 0.001 (0.017)	Loss 2.4769 (2.4195)	Entropy 0.57179 (0.57251)	Top-1 acc 63.672 (65.656)	Top-5 acc 84.375 (85.160)	lr 0.00347
Train [91][2690/3239]	Time 0.287 (0.537)	Data Time 0.004 (0.017)	Loss 2.3957 (2.4192)	Entropy 0.57169 (0.57251)	Top-1 acc 65.625 (65.665)	Top-5 acc 85.938 (85.166)	lr 0.00347
Train [91][2700/3239]	Time 0.252 (0.537)	Data Time 0.001 (0.017)	Loss 2.5236 (2.4194)	Entropy 0.57156 (0.57250)	Top-1 acc 62.891 (65.661)	Top-5 acc 82.812 (85.163)	lr 0.00347
Train [91][2710/3239]	Time 0.240 (0.537)	Data Time 0.001 (0.017)	Loss 2.3116 (2.4195)	Entropy 0.57164 (0.57250)	Top-1 acc 69.141 (65.658)	Top-5 acc 85.547 (85.163)	lr 0.00347
Train [91][2720/3239]	Time 0.232 (0.536)	Data Time 0.001 (0.017)	Loss 2.5599 (2.4193)	Entropy 0.57151 (0.57250)	Top-1 acc 60.938 (65.661)	Top-5 acc 82.422 (85.164)	lr 0.00347
Train [91][2730/3239]	Time 0.367 (0.536)	Data Time 0.002 (0.017)	Loss 2.3929 (2.4193)	Entropy 0.57142 (0.57249)	Top-1 acc 64.453 (65.661)	Top-5 acc 85.547 (85.167)	lr 0.00347
Train [91][2740/3239]	Time 0.253 (0.536)	Data Time 0.001 (0.017)	Loss 2.3590 (2.4192)	Entropy 0.57142 (0.57249)	Top-1 acc 66.797 (65.664)	Top-5 acc 85.547 (85.169)	lr 0.00347
Train [91][2750/3239]	Time 0.288 (0.535)	Data Time 0.001 (0.017)	Loss 2.3321 (2.4190)	Entropy 0.57148 (0.57249)	Top-1 acc 67.578 (65.664)	Top-5 acc 84.375 (85.171)	lr 0.00347
Train [91][2760/3239]	Time 0.274 (0.535)	Data Time 0.001 (0.017)	Loss 2.7217 (2.4191)	Entropy 0.57147 (0.57248)	Top-1 acc 58.203 (65.663)	Top-5 acc 80.859 (85.171)	lr 0.00347
Train [91][2770/3239]	Time 0.343 (0.535)	Data Time 0.003 (0.017)	Loss 2.5449 (2.4191)	Entropy 0.57155 (0.57248)	Top-1 acc 61.719 (65.665)	Top-5 acc 84.375 (85.172)	lr 0.00347
Train [91][2780/3239]	Time 0.247 (0.535)	Data Time 0.001 (0.017)	Loss 2.4632 (2.4191)	Entropy 0.57163 (0.57248)	Top-1 acc 64.453 (65.668)	Top-5 acc 84.375 (85.172)	lr 0.00346
Train [91][2790/3239]	Time 0.259 (0.534)	Data Time 0.001 (0.017)	Loss 2.3096 (2.4190)	Entropy 0.57169 (0.57247)	Top-1 acc 69.141 (65.672)	Top-5 acc 85.547 (85.174)	lr 0.00346
Train [91][2800/3239]	Time 0.300 (0.534)	Data Time 0.002 (0.017)	Loss 2.3978 (2.4190)	Entropy 0.57181 (0.57247)	Top-1 acc 65.234 (65.672)	Top-5 acc 82.422 (85.172)	lr 0.00346
Train [91][2810/3239]	Time 0.238 (0.534)	Data Time 0.001 (0.017)	Loss 2.4121 (2.4191)	Entropy 0.57207 (0.57247)	Top-1 acc 65.234 (65.669)	Top-5 acc 83.984 (85.168)	lr 0.00346
Train [91][2820/3239]	Time 0.380 (0.534)	Data Time 0.001 (0.016)	Loss 2.2830 (2.4191)	Entropy 0.57200 (0.57247)	Top-1 acc 70.312 (65.674)	Top-5 acc 87.891 (85.170)	lr 0.00346
Train [91][2830/3239]	Time 0.227 (0.533)	Data Time 0.001 (0.016)	Loss 2.2683 (2.4192)	Entropy 0.57170 (0.57246)	Top-1 acc 71.484 (65.673)	Top-5 acc 87.109 (85.166)	lr 0.00346
Train [91][2840/3239]	Time 0.240 (0.533)	Data Time 0.001 (0.016)	Loss 2.3209 (2.4193)	Entropy 0.57136 (0.57246)	Top-1 acc 67.578 (65.674)	Top-5 acc 88.672 (85.165)	lr 0.00346
Train [91][2850/3239]	Time 0.299 (0.533)	Data Time 0.001 (0.016)	Loss 2.4679 (2.4195)	Entropy 0.57143 (0.57246)	Top-1 acc 65.234 (65.666)	Top-5 acc 83.594 (85.161)	lr 0.00346
Train [91][2860/3239]	Time 0.249 (0.533)	Data Time 0.001 (0.016)	Loss 2.7107 (2.4197)	Entropy 0.57133 (0.57245)	Top-1 acc 56.641 (65.659)	Top-5 acc 82.031 (85.157)	lr 0.00346
Train [91][2870/3239]	Time 0.279 (0.532)	Data Time 0.001 (0.016)	Loss 2.3933 (2.4196)	Entropy 0.57143 (0.57245)	Top-1 acc 64.844 (65.661)	Top-5 acc 85.547 (85.160)	lr 0.00346
Train [91][2880/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.016)	Loss 2.5666 (2.4194)	Entropy 0.57131 (0.57245)	Top-1 acc 62.109 (65.667)	Top-5 acc 80.859 (85.163)	lr 0.00346
Train [91][2890/3239]	Time 0.370 (0.532)	Data Time 0.001 (0.016)	Loss 2.3980 (2.4195)	Entropy 0.57136 (0.57244)	Top-1 acc 64.844 (65.665)	Top-5 acc 85.938 (85.164)	lr 0.00346
Train [91][2900/3239]	Time 0.245 (0.531)	Data Time 0.001 (0.016)	Loss 2.2165 (2.4195)	Entropy 0.57135 (0.57244)	Top-1 acc 69.922 (65.664)	Top-5 acc 88.672 (85.161)	lr 0.00346
Train [91][2910/3239]	Time 0.251 (0.531)	Data Time 0.002 (0.016)	Loss 2.5514 (2.4196)	Entropy 0.57127 (0.57243)	Top-1 acc 57.812 (65.661)	Top-5 acc 84.766 (85.159)	lr 0.00346
Train [91][2920/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.016)	Loss 2.3436 (2.4196)	Entropy 0.57138 (0.57243)	Top-1 acc 66.016 (65.660)	Top-5 acc 87.109 (85.156)	lr 0.00346
Train [91][2930/3239]	Time 0.226 (0.530)	Data Time 0.001 (0.016)	Loss 2.4520 (2.4197)	Entropy 0.57119 (0.57243)	Top-1 acc 68.359 (65.660)	Top-5 acc 84.766 (85.153)	lr 0.00345
Train [91][2940/3239]	Time 0.235 (0.530)	Data Time 0.002 (0.016)	Loss 2.5744 (2.4197)	Entropy 0.57118 (0.57242)	Top-1 acc 59.375 (65.660)	Top-5 acc 83.203 (85.154)	lr 0.00345
Train [91][2950/3239]	Time 0.245 (0.530)	Data Time 0.001 (0.016)	Loss 2.6421 (2.4200)	Entropy 0.57122 (0.57242)	Top-1 acc 60.156 (65.654)	Top-5 acc 82.031 (85.144)	lr 0.00345
Train [91][2960/3239]	Time 0.247 (0.530)	Data Time 0.001 (0.016)	Loss 2.3227 (2.4199)	Entropy 0.57129 (0.57242)	Top-1 acc 67.578 (65.653)	Top-5 acc 86.719 (85.147)	lr 0.00345
Train [91][2970/3239]	Time 0.250 (0.529)	Data Time 0.001 (0.016)	Loss 2.7509 (2.4201)	Entropy 0.57149 (0.57241)	Top-1 acc 54.688 (65.647)	Top-5 acc 79.297 (85.141)	lr 0.00345
Train [91][2980/3239]	Time 0.320 (0.529)	Data Time 0.001 (0.016)	Loss 2.4994 (2.4201)	Entropy 0.57140 (0.57241)	Top-1 acc 63.281 (65.648)	Top-5 acc 82.812 (85.141)	lr 0.00345
Train [91][2990/3239]	Time 0.245 (0.529)	Data Time 0.001 (0.016)	Loss 2.2853 (2.4202)	Entropy 0.57115 (0.57240)	Top-1 acc 65.625 (65.644)	Top-5 acc 88.281 (85.138)	lr 0.00345
Train [91][3000/3239]	Time 0.245 (0.528)	Data Time 0.001 (0.016)	Loss 2.2626 (2.4203)	Entropy 0.57112 (0.57240)	Top-1 acc 67.969 (65.643)	Top-5 acc 87.891 (85.136)	lr 0.00345
Train [91][3010/3239]	Time 0.241 (0.528)	Data Time 0.001 (0.016)	Loss 2.4310 (2.4202)	Entropy 0.57150 (0.57240)	Top-1 acc 62.109 (65.646)	Top-5 acc 83.984 (85.137)	lr 0.00345
Train [91][3020/3239]	Time 0.255 (0.528)	Data Time 0.001 (0.015)	Loss 2.5645 (2.4201)	Entropy 0.57141 (0.57239)	Top-1 acc 61.328 (65.649)	Top-5 acc 83.203 (85.141)	lr 0.00345
Train [91][3030/3239]	Time 0.243 (0.528)	Data Time 0.001 (0.015)	Loss 2.4533 (2.4200)	Entropy 0.57156 (0.57239)	Top-1 acc 65.234 (65.653)	Top-5 acc 83.594 (85.143)	lr 0.00345
Train [91][3040/3239]	Time 0.229 (0.527)	Data Time 0.001 (0.015)	Loss 2.2639 (2.4199)	Entropy 0.57222 (0.57239)	Top-1 acc 67.969 (65.654)	Top-5 acc 87.500 (85.143)	lr 0.00345
Train [91][3050/3239]	Time 0.346 (0.527)	Data Time 0.001 (0.015)	Loss 2.2908 (2.4200)	Entropy 0.57248 (0.57239)	Top-1 acc 67.578 (65.653)	Top-5 acc 85.547 (85.141)	lr 0.00345
Train [91][3060/3239]	Time 0.240 (0.527)	Data Time 0.001 (0.015)	Loss 2.4737 (2.4200)	Entropy 0.57252 (0.57239)	Top-1 acc 66.797 (65.655)	Top-5 acc 83.984 (85.139)	lr 0.00345
Train [91][3070/3239]	Time 0.258 (0.527)	Data Time 0.001 (0.015)	Loss 2.4409 (2.4201)	Entropy 0.57259 (0.57239)	Top-1 acc 66.406 (65.655)	Top-5 acc 83.984 (85.136)	lr 0.00344
Train [91][3080/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.015)	Loss 2.5778 (2.4199)	Entropy 0.57278 (0.57239)	Top-1 acc 63.672 (65.660)	Top-5 acc 80.859 (85.136)	lr 0.00344
Train [91][3090/3239]	Time 0.275 (0.526)	Data Time 0.002 (0.015)	Loss 2.6579 (2.4199)	Entropy 0.57256 (0.57239)	Top-1 acc 60.938 (65.658)	Top-5 acc 82.031 (85.138)	lr 0.00344
Train [91][3100/3239]	Time 0.278 (0.526)	Data Time 0.002 (0.015)	Loss 2.2254 (2.4199)	Entropy 0.57249 (0.57239)	Top-1 acc 70.312 (65.659)	Top-5 acc 89.062 (85.139)	lr 0.00344
Train [91][3110/3239]	Time 0.234 (0.526)	Data Time 0.001 (0.015)	Loss 2.4118 (2.4201)	Entropy 0.57266 (0.57239)	Top-1 acc 66.406 (65.653)	Top-5 acc 82.031 (85.135)	lr 0.00344
Train [91][3120/3239]	Time 0.326 (0.542)	Data Time 0.036 (0.015)	Loss 2.4085 (2.4198)	Entropy 0.57249 (0.57239)	Top-1 acc 67.188 (65.658)	Top-5 acc 87.500 (85.139)	lr 0.00344
Train [91][3130/3239]	Time 0.245 (0.542)	Data Time 0.002 (0.015)	Loss 2.4167 (2.4199)	Entropy 0.57235 (0.57239)	Top-1 acc 63.672 (65.657)	Top-5 acc 86.719 (85.139)	lr 0.00344
Train [91][3140/3239]	Time 0.296 (0.542)	Data Time 0.001 (0.015)	Loss 2.2037 (2.4199)	Entropy 0.57253 (0.57239)	Top-1 acc 70.312 (65.657)	Top-5 acc 89.844 (85.139)	lr 0.00344
Train [91][3150/3239]	Time 0.301 (0.542)	Data Time 0.003 (0.015)	Loss 2.2639 (2.4197)	Entropy 0.57275 (0.57239)	Top-1 acc 68.359 (65.661)	Top-5 acc 88.672 (85.143)	lr 0.00344
Train [91][3160/3239]	Time 0.263 (0.541)	Data Time 0.002 (0.015)	Loss 2.3939 (2.4200)	Entropy 0.57320 (0.57240)	Top-1 acc 67.969 (65.652)	Top-5 acc 83.594 (85.138)	lr 0.00344
Train [91][3170/3239]	Time 0.270 (0.541)	Data Time 0.002 (0.015)	Loss 2.3976 (2.4200)	Entropy 0.57322 (0.57240)	Top-1 acc 65.625 (65.654)	Top-5 acc 87.109 (85.140)	lr 0.00344
Train [91][3180/3239]	Time 0.262 (0.541)	Data Time 0.000 (0.015)	Loss 2.3050 (2.4200)	Entropy 0.57287 (0.57240)	Top-1 acc 64.453 (65.653)	Top-5 acc 88.672 (85.139)	lr 0.00344
Train [91][3190/3239]	Time 0.246 (0.541)	Data Time 0.000 (0.015)	Loss 2.6544 (2.4201)	Entropy 0.57222 (0.57240)	Top-1 acc 62.500 (65.653)	Top-5 acc 78.906 (85.137)	lr 0.00344
Train [91][3200/3239]	Time 0.248 (0.540)	Data Time 0.000 (0.015)	Loss 2.4746 (2.4201)	Entropy 0.57250 (0.57240)	Top-1 acc 64.844 (65.652)	Top-5 acc 82.812 (85.136)	lr 0.00344
Train [91][3210/3239]	Time 0.348 (0.540)	Data Time 0.000 (0.015)	Loss 2.4119 (2.4200)	Entropy 0.57277 (0.57240)	Top-1 acc 66.797 (65.655)	Top-5 acc 83.594 (85.135)	lr 0.00343
Train [91][3220/3239]	Time 0.247 (0.539)	Data Time 0.000 (0.015)	Loss 2.4617 (2.4203)	Entropy 0.57285 (0.57240)	Top-1 acc 66.406 (65.649)	Top-5 acc 84.766 (85.131)	lr 0.00343
Train [91][3230/3239]	Time 0.229 (0.539)	Data Time 0.000 (0.015)	Loss 2.3887 (2.4203)	Entropy 0.57311 (0.57241)	Top-1 acc 67.969 (65.651)	Top-5 acc 83.984 (85.130)	lr 0.00343
Train [91][3239/3239]	Time 0.972 (0.539)	Data Time 0.000 (0.015)	Loss 2.7404 (2.4203)	Entropy 0.57309 (0.57241)	Top-1 acc 58.025 (65.654)	Top-5 acc 80.247 (85.129)	lr 0.00343
==========Valid [91/120]	loss 1.236	top-1 acc 71.377 (71.623)	top-5 acc 89.878	Train top-1 65.654	top-5 85.129	Entropy 0.57309	Latency-None: 0.000ms	Flops: 537.50M
Train [92][0/3239]	Time 37.555 (37.555)	Data Time 36.206 (36.206)	Loss 2.2330 (2.2330)	Entropy 0.57305 (0.57305)	Top-1 acc 71.875 (71.875)	Top-5 acc 85.938 (85.938)	lr 0.00343
Train [92][10/3239]	Time 0.234 (4.026)	Data Time 0.001 (3.432)	Loss 2.4731 (2.4149)	Entropy 0.57327 (0.57308)	Top-1 acc 66.797 (65.234)	Top-5 acc 84.375 (85.085)	lr 0.00343
Train [92][20/3239]	Time 0.252 (2.327)	Data Time 0.001 (1.799)	Loss 2.3132 (2.3991)	Entropy 0.57300 (0.57315)	Top-1 acc 68.359 (65.792)	Top-5 acc 86.719 (85.547)	lr 0.00343
Train [92][30/3239]	Time 0.239 (1.722)	Data Time 0.001 (1.219)	Loss 2.6063 (2.4374)	Entropy 0.57298 (0.57311)	Top-1 acc 59.766 (65.045)	Top-5 acc 83.203 (84.841)	lr 0.00343
Train [92][40/3239]	Time 0.502 (1.437)	Data Time 0.002 (0.922)	Loss 2.3553 (2.4245)	Entropy 0.57315 (0.57310)	Top-1 acc 69.531 (65.311)	Top-5 acc 85.938 (85.004)	lr 0.00343
Train [92][50/3239]	Time 0.232 (1.251)	Data Time 0.001 (0.743)	Loss 2.6495 (2.4265)	Entropy 0.57309 (0.57311)	Top-1 acc 60.547 (65.472)	Top-5 acc 80.469 (84.995)	lr 0.00343
Train [92][60/3239]	Time 0.231 (1.116)	Data Time 0.001 (0.621)	Loss 2.4244 (2.4199)	Entropy 0.57300 (0.57310)	Top-1 acc 69.531 (65.663)	Top-5 acc 83.203 (85.131)	lr 0.00343
Train [92][70/3239]	Time 0.234 (1.021)	Data Time 0.001 (0.534)	Loss 2.3035 (2.4143)	Entropy 0.57311 (0.57309)	Top-1 acc 69.922 (65.812)	Top-5 acc 87.109 (85.195)	lr 0.00343
Train [92][80/3239]	Time 0.224 (0.946)	Data Time 0.001 (0.468)	Loss 2.3702 (2.4138)	Entropy 0.57301 (0.57309)	Top-1 acc 64.844 (65.731)	Top-5 acc 84.375 (85.161)	lr 0.00343
Train [92][90/3239]	Time 0.226 (0.889)	Data Time 0.001 (0.417)	Loss 2.5233 (2.4182)	Entropy 0.57327 (0.57308)	Top-1 acc 61.328 (65.702)	Top-5 acc 83.984 (85.062)	lr 0.00343
Train [92][100/3239]	Time 0.235 (0.843)	Data Time 0.001 (0.376)	Loss 2.4088 (2.4157)	Entropy 0.57360 (0.57310)	Top-1 acc 60.547 (65.795)	Top-5 acc 84.375 (85.137)	lr 0.00343
Train [92][110/3239]	Time 0.330 (0.805)	Data Time 0.001 (0.342)	Loss 2.2952 (2.4182)	Entropy 0.57355 (0.57315)	Top-1 acc 72.656 (65.812)	Top-5 acc 87.500 (85.075)	lr 0.00343
Train [92][120/3239]	Time 0.226 (0.775)	Data Time 0.001 (0.314)	Loss 2.4529 (2.4124)	Entropy 0.57392 (0.57320)	Top-1 acc 66.016 (65.948)	Top-5 acc 82.812 (85.153)	lr 0.00342
Train [92][130/3239]	Time 0.241 (0.748)	Data Time 0.001 (0.290)	Loss 2.2717 (2.4128)	Entropy 0.57380 (0.57325)	Top-1 acc 69.531 (65.953)	Top-5 acc 86.719 (85.150)	lr 0.00342
Train [92][140/3239]	Time 0.227 (0.726)	Data Time 0.001 (0.270)	Loss 2.5818 (2.4139)	Entropy 0.57342 (0.57328)	Top-1 acc 64.062 (65.855)	Top-5 acc 80.078 (85.153)	lr 0.00342
Train [92][150/3239]	Time 0.237 (0.705)	Data Time 0.001 (0.252)	Loss 2.4553 (2.4147)	Entropy 0.57358 (0.57329)	Top-1 acc 65.625 (65.803)	Top-5 acc 83.594 (85.112)	lr 0.00342
Train [92][160/3239]	Time 0.228 (0.688)	Data Time 0.001 (0.237)	Loss 2.3731 (2.4141)	Entropy 0.57380 (0.57332)	Top-1 acc 68.750 (65.805)	Top-5 acc 82.422 (85.147)	lr 0.00342
Train [92][170/3239]	Time 0.230 (0.672)	Data Time 0.001 (0.223)	Loss 2.3266 (2.4127)	Entropy 0.57400 (0.57335)	Top-1 acc 69.141 (65.879)	Top-5 acc 85.156 (85.170)	lr 0.00342
Train [92][180/3239]	Time 0.236 (0.659)	Data Time 0.001 (0.211)	Loss 2.5504 (2.4150)	Entropy 0.57400 (0.57339)	Top-1 acc 62.109 (65.817)	Top-5 acc 82.031 (85.143)	lr 0.00342
Train [92][190/3239]	Time 0.251 (0.650)	Data Time 0.001 (0.200)	Loss 2.3744 (2.4194)	Entropy 0.57393 (0.57341)	Top-1 acc 66.016 (65.678)	Top-5 acc 84.766 (85.050)	lr 0.00342
Train [92][200/3239]	Time 0.341 (0.640)	Data Time 0.001 (0.190)	Loss 2.7343 (2.4198)	Entropy 0.57370 (0.57343)	Top-1 acc 57.422 (65.592)	Top-5 acc 80.859 (85.051)	lr 0.00342
Train [92][210/3239]	Time 0.231 (0.629)	Data Time 0.001 (0.181)	Loss 2.3458 (2.4187)	Entropy 0.57387 (0.57345)	Top-1 acc 67.578 (65.660)	Top-5 acc 85.938 (85.091)	lr 0.00342
Train [92][220/3239]	Time 0.236 (0.620)	Data Time 0.001 (0.173)	Loss 2.3122 (2.4173)	Entropy 0.57393 (0.57346)	Top-1 acc 68.359 (65.703)	Top-5 acc 87.500 (85.128)	lr 0.00342
Train [92][230/3239]	Time 0.236 (0.611)	Data Time 0.001 (0.165)	Loss 2.3510 (2.4143)	Entropy 0.57382 (0.57349)	Top-1 acc 69.141 (65.786)	Top-5 acc 86.719 (85.149)	lr 0.00342
Train [92][240/3239]	Time 0.250 (0.603)	Data Time 0.001 (0.159)	Loss 2.4525 (2.4141)	Entropy 0.57363 (0.57350)	Top-1 acc 63.281 (65.766)	Top-5 acc 82.031 (85.150)	lr 0.00342
Train [92][250/3239]	Time 0.250 (0.596)	Data Time 0.001 (0.152)	Loss 2.2610 (2.4160)	Entropy 0.57400 (0.57351)	Top-1 acc 69.141 (65.712)	Top-5 acc 87.891 (85.134)	lr 0.00342
Train [92][260/3239]	Time 0.235 (0.589)	Data Time 0.001 (0.147)	Loss 2.3799 (2.4184)	Entropy 0.57401 (0.57353)	Top-1 acc 66.016 (65.697)	Top-5 acc 83.594 (85.092)	lr 0.00341
Train [92][270/3239]	Time 0.334 (0.583)	Data Time 0.001 (0.141)	Loss 2.3987 (2.4153)	Entropy 0.57392 (0.57354)	Top-1 acc 66.016 (65.795)	Top-5 acc 83.984 (85.149)	lr 0.00341
Train [92][280/3239]	Time 0.240 (0.578)	Data Time 0.001 (0.136)	Loss 2.4256 (2.4168)	Entropy 0.57372 (0.57355)	Top-1 acc 66.016 (65.756)	Top-5 acc 85.938 (85.119)	lr 0.00341
Train [92][290/3239]	Time 0.238 (0.572)	Data Time 0.001 (0.132)	Loss 2.3291 (2.4162)	Entropy 0.57386 (0.57356)	Top-1 acc 67.188 (65.786)	Top-5 acc 86.328 (85.116)	lr 0.00341
Train [92][300/3239]	Time 0.236 (0.567)	Data Time 0.001 (0.127)	Loss 2.3142 (2.4185)	Entropy 0.57365 (0.57357)	Top-1 acc 69.922 (65.772)	Top-5 acc 86.328 (85.087)	lr 0.00341
Train [92][310/3239]	Time 0.229 (0.562)	Data Time 0.001 (0.123)	Loss 2.2638 (2.4177)	Entropy 0.57314 (0.57357)	Top-1 acc 69.141 (65.753)	Top-5 acc 88.672 (85.111)	lr 0.00341
Train [92][320/3239]	Time 0.232 (0.558)	Data Time 0.001 (0.120)	Loss 2.2363 (2.4176)	Entropy 0.57326 (0.57355)	Top-1 acc 71.875 (65.742)	Top-5 acc 87.891 (85.099)	lr 0.00341
Train [92][330/3239]	Time 0.275 (0.554)	Data Time 0.002 (0.116)	Loss 2.5010 (2.4155)	Entropy 0.57324 (0.57354)	Top-1 acc 66.016 (65.823)	Top-5 acc 83.203 (85.122)	lr 0.00341
Train [92][340/3239]	Time 0.271 (0.553)	Data Time 0.002 (0.113)	Loss 2.2776 (2.4155)	Entropy 0.57330 (0.57354)	Top-1 acc 69.922 (65.833)	Top-5 acc 88.281 (85.125)	lr 0.00341
Train [92][350/3239]	Time 0.239 (0.549)	Data Time 0.001 (0.109)	Loss 2.3010 (2.4139)	Entropy 0.57305 (0.57353)	Top-1 acc 66.797 (65.889)	Top-5 acc 88.281 (85.165)	lr 0.00341
Train [92][360/3239]	Time 0.258 (0.545)	Data Time 0.001 (0.106)	Loss 2.2755 (2.4121)	Entropy 0.57303 (0.57351)	Top-1 acc 71.484 (65.930)	Top-5 acc 86.719 (85.197)	lr 0.00341
Train [92][370/3239]	Time 0.237 (0.542)	Data Time 0.001 (0.104)	Loss 2.3898 (2.4124)	Entropy 0.57337 (0.57350)	Top-1 acc 66.797 (65.936)	Top-5 acc 85.938 (85.216)	lr 0.00341
Train [92][380/3239]	Time 0.239 (0.538)	Data Time 0.001 (0.101)	Loss 2.3806 (2.4121)	Entropy 0.57366 (0.57350)	Top-1 acc 67.969 (65.941)	Top-5 acc 85.156 (85.228)	lr 0.00341
Train [92][390/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.098)	Loss 2.2642 (2.4117)	Entropy 0.57379 (0.57350)	Top-1 acc 67.578 (65.946)	Top-5 acc 87.500 (85.231)	lr 0.00341
Train [92][400/3239]	Time 0.226 (0.533)	Data Time 0.001 (0.096)	Loss 2.9225 (2.4123)	Entropy 0.57350 (0.57351)	Top-1 acc 53.906 (65.935)	Top-5 acc 75.391 (85.217)	lr 0.00341
Train [92][410/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.094)	Loss 2.5022 (2.4116)	Entropy 0.57344 (0.57351)	Top-1 acc 65.234 (65.980)	Top-5 acc 84.375 (85.240)	lr 0.00340
Train [92][420/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.092)	Loss 2.3655 (2.4117)	Entropy 0.57365 (0.57351)	Top-1 acc 65.234 (65.984)	Top-5 acc 86.719 (85.245)	lr 0.00340
Train [92][430/3239]	Time 0.327 (0.525)	Data Time 0.001 (0.089)	Loss 2.3456 (2.4124)	Entropy 0.57372 (0.57351)	Top-1 acc 64.453 (65.960)	Top-5 acc 85.547 (85.231)	lr 0.00340
Train [92][440/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.087)	Loss 2.5459 (2.4131)	Entropy 0.57324 (0.57351)	Top-1 acc 62.891 (65.947)	Top-5 acc 82.812 (85.224)	lr 0.00340
Train [92][450/3239]	Time 0.242 (0.520)	Data Time 0.001 (0.086)	Loss 2.3601 (2.4125)	Entropy 0.57288 (0.57350)	Top-1 acc 68.359 (65.954)	Top-5 acc 85.547 (85.244)	lr 0.00340
Train [92][460/3239]	Time 0.246 (0.518)	Data Time 0.001 (0.084)	Loss 2.5719 (2.4133)	Entropy 0.57285 (0.57349)	Top-1 acc 60.156 (65.926)	Top-5 acc 84.375 (85.246)	lr 0.00340
Train [92][470/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.082)	Loss 2.5589 (2.4150)	Entropy 0.57258 (0.57347)	Top-1 acc 64.844 (65.901)	Top-5 acc 82.422 (85.202)	lr 0.00340
Train [92][480/3239]	Time 0.237 (0.514)	Data Time 0.002 (0.080)	Loss 2.5184 (2.4153)	Entropy 0.57284 (0.57345)	Top-1 acc 62.109 (65.891)	Top-5 acc 82.812 (85.200)	lr 0.00340
Train [92][490/3239]	Time 0.239 (0.512)	Data Time 0.001 (0.079)	Loss 2.3722 (2.4153)	Entropy 0.57254 (0.57344)	Top-1 acc 65.625 (65.884)	Top-5 acc 85.156 (85.197)	lr 0.00340
Train [92][500/3239]	Time 0.326 (0.511)	Data Time 0.001 (0.077)	Loss 2.4953 (2.4159)	Entropy 0.57272 (0.57342)	Top-1 acc 64.453 (65.878)	Top-5 acc 81.250 (85.192)	lr 0.00340
Train [92][510/3239]	Time 0.235 (0.509)	Data Time 0.001 (0.076)	Loss 2.4037 (2.4159)	Entropy 0.57255 (0.57341)	Top-1 acc 64.844 (65.860)	Top-5 acc 87.891 (85.200)	lr 0.00340
Train [92][520/3239]	Time 0.243 (0.507)	Data Time 0.001 (0.074)	Loss 2.2146 (2.4164)	Entropy 0.57246 (0.57339)	Top-1 acc 69.531 (65.839)	Top-5 acc 88.281 (85.183)	lr 0.00340
Train [92][530/3239]	Time 0.233 (0.505)	Data Time 0.001 (0.073)	Loss 2.6790 (2.4172)	Entropy 0.57166 (0.57337)	Top-1 acc 59.766 (65.834)	Top-5 acc 80.078 (85.175)	lr 0.00340
Train [92][540/3239]	Time 0.394 (0.606)	Data Time 0.009 (0.072)	Loss 2.2545 (2.4168)	Entropy 0.57179 (0.57334)	Top-1 acc 69.141 (65.827)	Top-5 acc 89.062 (85.205)	lr 0.00340
Train [92][550/3239]	Time 0.249 (0.603)	Data Time 0.002 (0.070)	Loss 2.5160 (2.4178)	Entropy 0.57171 (0.57331)	Top-1 acc 64.844 (65.807)	Top-5 acc 84.766 (85.185)	lr 0.00339
Train [92][560/3239]	Time 0.252 (0.600)	Data Time 0.002 (0.069)	Loss 2.4859 (2.4188)	Entropy 0.57176 (0.57328)	Top-1 acc 61.719 (65.777)	Top-5 acc 82.812 (85.157)	lr 0.00339
Train [92][570/3239]	Time 0.240 (0.597)	Data Time 0.001 (0.068)	Loss 2.3509 (2.4179)	Entropy 0.57193 (0.57325)	Top-1 acc 67.969 (65.811)	Top-5 acc 86.328 (85.169)	lr 0.00339
Train [92][580/3239]	Time 0.241 (0.594)	Data Time 0.001 (0.067)	Loss 2.1874 (2.4184)	Entropy 0.57186 (0.57323)	Top-1 acc 71.875 (65.805)	Top-5 acc 87.500 (85.157)	lr 0.00339
Train [92][590/3239]	Time 0.404 (0.592)	Data Time 0.002 (0.066)	Loss 2.5087 (2.4178)	Entropy 0.57180 (0.57321)	Top-1 acc 62.891 (65.816)	Top-5 acc 83.594 (85.156)	lr 0.00339
Train [92][600/3239]	Time 0.239 (0.589)	Data Time 0.001 (0.065)	Loss 2.6236 (2.4171)	Entropy 0.57156 (0.57318)	Top-1 acc 60.156 (65.837)	Top-5 acc 83.594 (85.172)	lr 0.00339
Train [92][610/3239]	Time 0.237 (0.587)	Data Time 0.002 (0.064)	Loss 2.4188 (2.4182)	Entropy 0.57151 (0.57316)	Top-1 acc 66.406 (65.804)	Top-5 acc 84.375 (85.141)	lr 0.00339
Train [92][620/3239]	Time 0.257 (0.585)	Data Time 0.002 (0.063)	Loss 2.4260 (2.4181)	Entropy 0.57136 (0.57313)	Top-1 acc 64.062 (65.802)	Top-5 acc 83.984 (85.139)	lr 0.00339
Train [92][630/3239]	Time 0.245 (0.584)	Data Time 0.001 (0.062)	Loss 2.7206 (2.4196)	Entropy 0.57161 (0.57310)	Top-1 acc 56.250 (65.769)	Top-5 acc 83.594 (85.122)	lr 0.00339
Train [92][640/3239]	Time 0.237 (0.582)	Data Time 0.001 (0.061)	Loss 2.3301 (2.4185)	Entropy 0.57156 (0.57308)	Top-1 acc 67.188 (65.791)	Top-5 acc 85.938 (85.151)	lr 0.00339
Train [92][650/3239]	Time 0.243 (0.580)	Data Time 0.001 (0.060)	Loss 2.2276 (2.4190)	Entropy 0.57161 (0.57305)	Top-1 acc 71.875 (65.774)	Top-5 acc 88.281 (85.144)	lr 0.00339
Train [92][660/3239]	Time 0.340 (0.578)	Data Time 0.001 (0.059)	Loss 2.5327 (2.4189)	Entropy 0.57162 (0.57303)	Top-1 acc 62.500 (65.772)	Top-5 acc 83.594 (85.148)	lr 0.00339
Train [92][670/3239]	Time 0.232 (0.576)	Data Time 0.001 (0.058)	Loss 2.5644 (2.4187)	Entropy 0.57168 (0.57301)	Top-1 acc 60.547 (65.785)	Top-5 acc 82.031 (85.154)	lr 0.00339
Train [92][680/3239]	Time 0.254 (0.574)	Data Time 0.001 (0.057)	Loss 2.5727 (2.4182)	Entropy 0.57179 (0.57299)	Top-1 acc 63.672 (65.794)	Top-5 acc 83.594 (85.157)	lr 0.00339
Train [92][690/3239]	Time 0.238 (0.572)	Data Time 0.001 (0.057)	Loss 2.3847 (2.4188)	Entropy 0.57200 (0.57297)	Top-1 acc 63.281 (65.765)	Top-5 acc 85.938 (85.142)	lr 0.00338
Train [92][700/3239]	Time 0.252 (0.570)	Data Time 0.002 (0.056)	Loss 2.3577 (2.4182)	Entropy 0.57216 (0.57296)	Top-1 acc 65.625 (65.773)	Top-5 acc 89.453 (85.160)	lr 0.00338
Train [92][710/3239]	Time 0.235 (0.568)	Data Time 0.001 (0.055)	Loss 2.3733 (2.4172)	Entropy 0.57236 (0.57295)	Top-1 acc 65.234 (65.806)	Top-5 acc 85.938 (85.178)	lr 0.00338
Train [92][720/3239]	Time 0.242 (0.566)	Data Time 0.001 (0.054)	Loss 2.5595 (2.4170)	Entropy 0.57236 (0.57294)	Top-1 acc 60.547 (65.801)	Top-5 acc 83.594 (85.183)	lr 0.00338
Train [92][730/3239]	Time 0.259 (0.564)	Data Time 0.001 (0.054)	Loss 2.3812 (2.4160)	Entropy 0.57224 (0.57293)	Top-1 acc 66.406 (65.818)	Top-5 acc 83.203 (85.200)	lr 0.00338
Train [92][740/3239]	Time 0.244 (0.562)	Data Time 0.001 (0.053)	Loss 2.3009 (2.4163)	Entropy 0.57174 (0.57292)	Top-1 acc 70.312 (65.817)	Top-5 acc 86.328 (85.189)	lr 0.00338
Train [92][750/3239]	Time 0.371 (0.561)	Data Time 0.001 (0.052)	Loss 2.4995 (2.4154)	Entropy 0.57172 (0.57291)	Top-1 acc 64.844 (65.833)	Top-5 acc 82.422 (85.215)	lr 0.00338
Train [92][760/3239]	Time 0.228 (0.559)	Data Time 0.001 (0.052)	Loss 2.2748 (2.4149)	Entropy 0.57169 (0.57289)	Top-1 acc 68.359 (65.848)	Top-5 acc 88.281 (85.227)	lr 0.00338
Train [92][770/3239]	Time 0.245 (0.557)	Data Time 0.001 (0.051)	Loss 2.5189 (2.4138)	Entropy 0.57173 (0.57288)	Top-1 acc 63.672 (65.878)	Top-5 acc 81.250 (85.244)	lr 0.00338
Train [92][780/3239]	Time 0.272 (0.556)	Data Time 0.001 (0.050)	Loss 2.3254 (2.4140)	Entropy 0.57188 (0.57286)	Top-1 acc 72.656 (65.881)	Top-5 acc 87.109 (85.240)	lr 0.00338
Train [92][790/3239]	Time 0.240 (0.554)	Data Time 0.001 (0.050)	Loss 2.2534 (2.4138)	Entropy 0.57189 (0.57285)	Top-1 acc 70.703 (65.893)	Top-5 acc 87.891 (85.243)	lr 0.00338
Train [92][800/3239]	Time 0.232 (0.553)	Data Time 0.001 (0.049)	Loss 2.4384 (2.4129)	Entropy 0.57197 (0.57284)	Top-1 acc 66.797 (65.911)	Top-5 acc 84.375 (85.256)	lr 0.00338
Train [92][810/3239]	Time 0.246 (0.551)	Data Time 0.001 (0.049)	Loss 2.2805 (2.4128)	Entropy 0.57185 (0.57283)	Top-1 acc 68.359 (65.915)	Top-5 acc 88.281 (85.259)	lr 0.00338
Train [92][820/3239]	Time 0.387 (0.550)	Data Time 0.002 (0.048)	Loss 2.3997 (2.4126)	Entropy 0.57178 (0.57282)	Top-1 acc 66.016 (65.923)	Top-5 acc 84.766 (85.259)	lr 0.00338
Train [92][830/3239]	Time 0.236 (0.549)	Data Time 0.001 (0.047)	Loss 2.3701 (2.4119)	Entropy 0.57197 (0.57281)	Top-1 acc 65.625 (65.941)	Top-5 acc 84.375 (85.262)	lr 0.00338
Train [92][840/3239]	Time 0.239 (0.547)	Data Time 0.001 (0.047)	Loss 2.4032 (2.4121)	Entropy 0.57160 (0.57279)	Top-1 acc 69.922 (65.939)	Top-5 acc 83.984 (85.254)	lr 0.00337
Train [92][850/3239]	Time 0.248 (0.546)	Data Time 0.001 (0.046)	Loss 2.4757 (2.4117)	Entropy 0.57175 (0.57278)	Top-1 acc 63.281 (65.957)	Top-5 acc 84.375 (85.255)	lr 0.00337
Train [92][860/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.046)	Loss 2.3214 (2.4112)	Entropy 0.57144 (0.57277)	Top-1 acc 69.141 (65.970)	Top-5 acc 85.547 (85.262)	lr 0.00337
Train [92][870/3239]	Time 0.231 (0.544)	Data Time 0.001 (0.045)	Loss 2.2134 (2.4111)	Entropy 0.57165 (0.57275)	Top-1 acc 71.875 (65.971)	Top-5 acc 88.672 (85.268)	lr 0.00337
Train [92][880/3239]	Time 0.242 (0.542)	Data Time 0.001 (0.045)	Loss 2.3977 (2.4107)	Entropy 0.57171 (0.57274)	Top-1 acc 65.625 (65.990)	Top-5 acc 87.109 (85.275)	lr 0.00337
Train [92][890/3239]	Time 0.281 (0.541)	Data Time 0.002 (0.044)	Loss 2.3436 (2.4100)	Entropy 0.57209 (0.57273)	Top-1 acc 69.922 (65.997)	Top-5 acc 87.109 (85.288)	lr 0.00337
Train [92][900/3239]	Time 0.229 (0.540)	Data Time 0.001 (0.044)	Loss 2.4153 (2.4101)	Entropy 0.57126 (0.57272)	Top-1 acc 66.406 (65.996)	Top-5 acc 84.766 (85.291)	lr 0.00337
Train [92][910/3239]	Time 0.282 (0.539)	Data Time 0.001 (0.043)	Loss 2.0921 (2.4101)	Entropy 0.57121 (0.57270)	Top-1 acc 76.562 (65.995)	Top-5 acc 89.844 (85.289)	lr 0.00337
Train [92][920/3239]	Time 0.223 (0.537)	Data Time 0.001 (0.043)	Loss 2.5543 (2.4097)	Entropy 0.57102 (0.57269)	Top-1 acc 61.719 (66.015)	Top-5 acc 83.203 (85.296)	lr 0.00337
Train [92][930/3239]	Time 0.290 (0.537)	Data Time 0.001 (0.043)	Loss 2.3207 (2.4090)	Entropy 0.57079 (0.57267)	Top-1 acc 69.141 (66.035)	Top-5 acc 87.109 (85.308)	lr 0.00337
Train [92][940/3239]	Time 0.234 (0.536)	Data Time 0.001 (0.042)	Loss 2.2314 (2.4097)	Entropy 0.57104 (0.57265)	Top-1 acc 68.359 (66.016)	Top-5 acc 89.453 (85.295)	lr 0.00337
Train [92][950/3239]	Time 0.237 (0.535)	Data Time 0.001 (0.042)	Loss 2.3251 (2.4095)	Entropy 0.57100 (0.57263)	Top-1 acc 66.406 (66.009)	Top-5 acc 87.109 (85.302)	lr 0.00337
Train [92][960/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.041)	Loss 2.2584 (2.4093)	Entropy 0.57056 (0.57262)	Top-1 acc 66.797 (66.014)	Top-5 acc 88.281 (85.301)	lr 0.00337
Train [92][970/3239]	Time 0.255 (0.532)	Data Time 0.001 (0.041)	Loss 2.3205 (2.4089)	Entropy 0.57048 (0.57259)	Top-1 acc 68.359 (66.020)	Top-5 acc 87.109 (85.310)	lr 0.00337
Train [92][980/3239]	Time 0.340 (0.531)	Data Time 0.001 (0.040)	Loss 2.2744 (2.4089)	Entropy 0.57051 (0.57257)	Top-1 acc 67.578 (66.019)	Top-5 acc 87.500 (85.303)	lr 0.00336
Train [92][990/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.040)	Loss 2.3132 (2.4091)	Entropy 0.57053 (0.57255)	Top-1 acc 69.141 (66.011)	Top-5 acc 85.938 (85.298)	lr 0.00336
Train [92][1000/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.040)	Loss 2.3262 (2.4092)	Entropy 0.57069 (0.57253)	Top-1 acc 67.188 (66.009)	Top-5 acc 86.719 (85.293)	lr 0.00336
Train [92][1010/3239]	Time 0.234 (0.528)	Data Time 0.001 (0.039)	Loss 2.6173 (2.4095)	Entropy 0.57053 (0.57251)	Top-1 acc 60.156 (66.004)	Top-5 acc 82.031 (85.289)	lr 0.00336
Train [92][1020/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.039)	Loss 2.3041 (2.4093)	Entropy 0.57079 (0.57249)	Top-1 acc 64.062 (66.013)	Top-5 acc 90.234 (85.293)	lr 0.00336
Train [92][1030/3239]	Time 0.233 (0.526)	Data Time 0.002 (0.039)	Loss 2.6203 (2.4096)	Entropy 0.57087 (0.57248)	Top-1 acc 58.984 (66.004)	Top-5 acc 83.203 (85.290)	lr 0.00336
Train [92][1040/3239]	Time 0.248 (0.525)	Data Time 0.002 (0.038)	Loss 2.3818 (2.4096)	Entropy 0.57061 (0.57246)	Top-1 acc 67.969 (66.004)	Top-5 acc 85.547 (85.291)	lr 0.00336
Train [92][1050/3239]	Time 0.330 (0.524)	Data Time 0.002 (0.038)	Loss 2.3951 (2.4091)	Entropy 0.57069 (0.57244)	Top-1 acc 65.625 (66.020)	Top-5 acc 86.328 (85.295)	lr 0.00336
Train [92][1060/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.038)	Loss 2.4362 (2.4097)	Entropy 0.57075 (0.57243)	Top-1 acc 63.281 (66.005)	Top-5 acc 84.766 (85.286)	lr 0.00336
Train [92][1070/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.037)	Loss 2.3574 (2.4101)	Entropy 0.57080 (0.57241)	Top-1 acc 65.234 (65.987)	Top-5 acc 87.109 (85.288)	lr 0.00336
Train [92][1080/3239]	Time 0.242 (0.521)	Data Time 0.001 (0.037)	Loss 2.2948 (2.4102)	Entropy 0.57054 (0.57240)	Top-1 acc 71.484 (65.985)	Top-5 acc 87.500 (85.287)	lr 0.00336
Train [92][1090/3239]	Time 0.228 (0.520)	Data Time 0.001 (0.037)	Loss 2.5210 (2.4107)	Entropy 0.57047 (0.57238)	Top-1 acc 63.672 (65.976)	Top-5 acc 82.422 (85.277)	lr 0.00336
Train [92][1100/3239]	Time 0.234 (0.519)	Data Time 0.002 (0.036)	Loss 2.3755 (2.4108)	Entropy 0.57069 (0.57236)	Top-1 acc 67.578 (65.976)	Top-5 acc 85.547 (85.276)	lr 0.00336
Train [92][1110/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.036)	Loss 2.6127 (2.4107)	Entropy 0.57052 (0.57235)	Top-1 acc 59.375 (65.979)	Top-5 acc 81.641 (85.268)	lr 0.00336
Train [92][1120/3239]	Time 0.254 (0.517)	Data Time 0.001 (0.036)	Loss 2.5692 (2.4107)	Entropy 0.57069 (0.57233)	Top-1 acc 60.547 (65.983)	Top-5 acc 83.203 (85.270)	lr 0.00336
Train [92][1130/3239]	Time 0.227 (0.517)	Data Time 0.001 (0.035)	Loss 2.3602 (2.4103)	Entropy 0.57104 (0.57232)	Top-1 acc 68.750 (65.996)	Top-5 acc 86.719 (85.287)	lr 0.00335
Train [92][1140/3239]	Time 0.315 (0.516)	Data Time 0.001 (0.035)	Loss 2.6537 (2.4109)	Entropy 0.57121 (0.57231)	Top-1 acc 59.375 (65.973)	Top-5 acc 82.812 (85.290)	lr 0.00335
Train [92][1150/3239]	Time 0.226 (0.515)	Data Time 0.002 (0.035)	Loss 2.5697 (2.4114)	Entropy 0.57129 (0.57230)	Top-1 acc 63.672 (65.961)	Top-5 acc 83.594 (85.284)	lr 0.00335
Train [92][1160/3239]	Time 0.226 (0.514)	Data Time 0.001 (0.034)	Loss 2.4114 (2.4116)	Entropy 0.57074 (0.57229)	Top-1 acc 68.359 (65.956)	Top-5 acc 84.375 (85.285)	lr 0.00335
Train [92][1170/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.034)	Loss 2.6842 (2.4120)	Entropy 0.57074 (0.57227)	Top-1 acc 57.031 (65.936)	Top-5 acc 83.203 (85.276)	lr 0.00335
Train [92][1180/3239]	Time 0.249 (0.512)	Data Time 0.001 (0.034)	Loss 2.5718 (2.4122)	Entropy 0.57079 (0.57226)	Top-1 acc 59.766 (65.928)	Top-5 acc 82.422 (85.271)	lr 0.00335
Train [92][1190/3239]	Time 0.306 (0.556)	Data Time 0.006 (0.034)	Loss 2.6272 (2.4124)	Entropy 0.57072 (0.57225)	Top-1 acc 61.719 (65.924)	Top-5 acc 80.078 (85.269)	lr 0.00335
Train [92][1200/3239]	Time 0.239 (0.555)	Data Time 0.002 (0.033)	Loss 2.3265 (2.4120)	Entropy 0.57054 (0.57223)	Top-1 acc 68.359 (65.938)	Top-5 acc 88.281 (85.281)	lr 0.00335
Train [92][1210/3239]	Time 0.224 (0.554)	Data Time 0.001 (0.033)	Loss 2.6238 (2.4118)	Entropy 0.57073 (0.57222)	Top-1 acc 58.594 (65.939)	Top-5 acc 78.906 (85.286)	lr 0.00335
Train [92][1220/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.033)	Loss 2.4587 (2.4118)	Entropy 0.57073 (0.57221)	Top-1 acc 65.625 (65.945)	Top-5 acc 83.203 (85.291)	lr 0.00335
Train [92][1230/3239]	Time 0.237 (0.552)	Data Time 0.001 (0.033)	Loss 2.6122 (2.4125)	Entropy 0.57046 (0.57220)	Top-1 acc 59.375 (65.922)	Top-5 acc 82.031 (85.279)	lr 0.00335
Train [92][1240/3239]	Time 0.240 (0.551)	Data Time 0.001 (0.032)	Loss 2.3010 (2.4127)	Entropy 0.57075 (0.57218)	Top-1 acc 68.750 (65.915)	Top-5 acc 86.328 (85.275)	lr 0.00335
Train [92][1250/3239]	Time 0.240 (0.550)	Data Time 0.001 (0.032)	Loss 2.4123 (2.4128)	Entropy 0.57065 (0.57217)	Top-1 acc 62.891 (65.910)	Top-5 acc 85.547 (85.268)	lr 0.00335
Train [92][1260/3239]	Time 0.224 (0.549)	Data Time 0.001 (0.032)	Loss 2.2917 (2.4129)	Entropy 0.57028 (0.57216)	Top-1 acc 68.359 (65.909)	Top-5 acc 89.062 (85.264)	lr 0.00335
Train [92][1270/3239]	Time 0.249 (0.548)	Data Time 0.001 (0.032)	Loss 2.3218 (2.4131)	Entropy 0.57010 (0.57214)	Top-1 acc 67.188 (65.911)	Top-5 acc 87.891 (85.258)	lr 0.00335
Train [92][1280/3239]	Time 0.229 (0.547)	Data Time 0.001 (0.031)	Loss 2.2998 (2.4131)	Entropy 0.57023 (0.57213)	Top-1 acc 70.703 (65.910)	Top-5 acc 85.156 (85.258)	lr 0.00334
Train [92][1290/3239]	Time 0.244 (0.546)	Data Time 0.002 (0.031)	Loss 2.3633 (2.4129)	Entropy 0.57037 (0.57211)	Top-1 acc 66.016 (65.915)	Top-5 acc 87.891 (85.265)	lr 0.00334
Train [92][1300/3239]	Time 0.330 (0.545)	Data Time 0.001 (0.031)	Loss 2.2798 (2.4126)	Entropy 0.57068 (0.57210)	Top-1 acc 65.234 (65.920)	Top-5 acc 88.281 (85.269)	lr 0.00334
Train [92][1310/3239]	Time 0.248 (0.545)	Data Time 0.001 (0.031)	Loss 2.2825 (2.4123)	Entropy 0.57079 (0.57209)	Top-1 acc 69.141 (65.924)	Top-5 acc 87.500 (85.277)	lr 0.00334
Train [92][1320/3239]	Time 0.251 (0.544)	Data Time 0.001 (0.031)	Loss 2.8387 (2.4126)	Entropy 0.57044 (0.57208)	Top-1 acc 55.469 (65.917)	Top-5 acc 76.953 (85.272)	lr 0.00334
Train [92][1330/3239]	Time 0.288 (0.543)	Data Time 0.001 (0.030)	Loss 2.3720 (2.4131)	Entropy 0.57072 (0.57207)	Top-1 acc 62.891 (65.899)	Top-5 acc 86.328 (85.263)	lr 0.00334
Train [92][1340/3239]	Time 0.232 (0.543)	Data Time 0.001 (0.030)	Loss 2.3933 (2.4128)	Entropy 0.57035 (0.57206)	Top-1 acc 70.703 (65.912)	Top-5 acc 86.328 (85.267)	lr 0.00334
Train [92][1350/3239]	Time 0.235 (0.542)	Data Time 0.001 (0.030)	Loss 2.3329 (2.4126)	Entropy 0.57006 (0.57204)	Top-1 acc 67.578 (65.918)	Top-5 acc 87.891 (85.271)	lr 0.00334
Train [92][1360/3239]	Time 0.239 (0.541)	Data Time 0.001 (0.030)	Loss 2.2606 (2.4127)	Entropy 0.57012 (0.57203)	Top-1 acc 69.141 (65.916)	Top-5 acc 91.016 (85.274)	lr 0.00334
Train [92][1370/3239]	Time 0.327 (0.540)	Data Time 0.001 (0.029)	Loss 2.4062 (2.4127)	Entropy 0.57031 (0.57201)	Top-1 acc 65.625 (65.912)	Top-5 acc 84.766 (85.274)	lr 0.00334
Train [92][1380/3239]	Time 0.241 (0.539)	Data Time 0.001 (0.029)	Loss 2.3286 (2.4124)	Entropy 0.57049 (0.57200)	Top-1 acc 67.578 (65.923)	Top-5 acc 86.719 (85.279)	lr 0.00334
Train [92][1390/3239]	Time 0.236 (0.538)	Data Time 0.001 (0.029)	Loss 2.3539 (2.4121)	Entropy 0.57046 (0.57199)	Top-1 acc 66.016 (65.927)	Top-5 acc 85.547 (85.284)	lr 0.00334
Train [92][1400/3239]	Time 0.269 (0.538)	Data Time 0.001 (0.029)	Loss 2.3774 (2.4124)	Entropy 0.57068 (0.57198)	Top-1 acc 69.141 (65.921)	Top-5 acc 85.547 (85.282)	lr 0.00334
Train [92][1410/3239]	Time 0.230 (0.537)	Data Time 0.001 (0.029)	Loss 2.2670 (2.4129)	Entropy 0.57067 (0.57197)	Top-1 acc 66.797 (65.914)	Top-5 acc 87.891 (85.276)	lr 0.00334
Train [92][1420/3239]	Time 0.279 (0.536)	Data Time 0.002 (0.028)	Loss 2.5036 (2.4132)	Entropy 0.57072 (0.57196)	Top-1 acc 64.844 (65.900)	Top-5 acc 83.203 (85.271)	lr 0.00333
Train [92][1430/3239]	Time 0.279 (0.536)	Data Time 0.002 (0.028)	Loss 2.2532 (2.4129)	Entropy 0.57044 (0.57195)	Top-1 acc 70.312 (65.914)	Top-5 acc 89.844 (85.274)	lr 0.00333
Train [92][1440/3239]	Time 0.253 (0.536)	Data Time 0.001 (0.028)	Loss 2.2921 (2.4128)	Entropy 0.57051 (0.57194)	Top-1 acc 67.188 (65.920)	Top-5 acc 85.156 (85.274)	lr 0.00333
Train [92][1450/3239]	Time 0.235 (0.535)	Data Time 0.001 (0.028)	Loss 2.4658 (2.4136)	Entropy 0.57063 (0.57193)	Top-1 acc 64.453 (65.901)	Top-5 acc 84.766 (85.259)	lr 0.00333
Train [92][1460/3239]	Time 0.336 (0.534)	Data Time 0.001 (0.028)	Loss 2.3656 (2.4136)	Entropy 0.57063 (0.57192)	Top-1 acc 69.141 (65.898)	Top-5 acc 83.984 (85.258)	lr 0.00333
Train [92][1470/3239]	Time 0.230 (0.534)	Data Time 0.001 (0.028)	Loss 2.5207 (2.4141)	Entropy 0.57051 (0.57191)	Top-1 acc 62.500 (65.880)	Top-5 acc 83.984 (85.256)	lr 0.00333
Train [92][1480/3239]	Time 0.239 (0.533)	Data Time 0.001 (0.027)	Loss 2.1842 (2.4138)	Entropy 0.57032 (0.57190)	Top-1 acc 70.312 (65.880)	Top-5 acc 90.234 (85.268)	lr 0.00333
Train [92][1490/3239]	Time 0.238 (0.532)	Data Time 0.001 (0.027)	Loss 2.2196 (2.4137)	Entropy 0.57041 (0.57189)	Top-1 acc 73.438 (65.886)	Top-5 acc 89.062 (85.270)	lr 0.00333
Train [92][1500/3239]	Time 0.241 (0.532)	Data Time 0.001 (0.027)	Loss 2.3734 (2.4136)	Entropy 0.57056 (0.57188)	Top-1 acc 67.578 (65.890)	Top-5 acc 85.547 (85.273)	lr 0.00333
Train [92][1510/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.027)	Loss 2.5917 (2.4138)	Entropy 0.57042 (0.57187)	Top-1 acc 60.156 (65.885)	Top-5 acc 83.594 (85.272)	lr 0.00333
Train [92][1520/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.027)	Loss 2.4167 (2.4136)	Entropy 0.57046 (0.57187)	Top-1 acc 66.797 (65.892)	Top-5 acc 86.328 (85.273)	lr 0.00333
Train [92][1530/3239]	Time 0.332 (0.530)	Data Time 0.001 (0.027)	Loss 2.3721 (2.4135)	Entropy 0.57009 (0.57186)	Top-1 acc 65.625 (65.889)	Top-5 acc 85.547 (85.276)	lr 0.00333
Train [92][1540/3239]	Time 0.229 (0.529)	Data Time 0.001 (0.026)	Loss 2.4059 (2.4136)	Entropy 0.57012 (0.57184)	Top-1 acc 66.016 (65.877)	Top-5 acc 84.766 (85.275)	lr 0.00333
Train [92][1550/3239]	Time 0.221 (0.528)	Data Time 0.001 (0.026)	Loss 2.5051 (2.4144)	Entropy 0.57007 (0.57183)	Top-1 acc 65.625 (65.869)	Top-5 acc 82.031 (85.258)	lr 0.00333
Train [92][1560/3239]	Time 0.236 (0.528)	Data Time 0.001 (0.026)	Loss 2.3875 (2.4146)	Entropy 0.56967 (0.57182)	Top-1 acc 66.406 (65.870)	Top-5 acc 84.766 (85.251)	lr 0.00333
Train [92][1570/3239]	Time 0.238 (0.527)	Data Time 0.001 (0.026)	Loss 2.1484 (2.4141)	Entropy 0.56981 (0.57181)	Top-1 acc 72.656 (65.886)	Top-5 acc 89.453 (85.255)	lr 0.00332
Train [92][1580/3239]	Time 0.266 (0.526)	Data Time 0.001 (0.026)	Loss 2.3273 (2.4138)	Entropy 0.56958 (0.57179)	Top-1 acc 67.188 (65.890)	Top-5 acc 87.500 (85.260)	lr 0.00332
Train [92][1590/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.026)	Loss 2.5817 (2.4141)	Entropy 0.56956 (0.57178)	Top-1 acc 63.281 (65.882)	Top-5 acc 83.203 (85.259)	lr 0.00332
Train [92][1600/3239]	Time 0.227 (0.525)	Data Time 0.001 (0.026)	Loss 2.2477 (2.4138)	Entropy 0.56985 (0.57177)	Top-1 acc 68.750 (65.889)	Top-5 acc 89.844 (85.264)	lr 0.00332
Train [92][1610/3239]	Time 0.235 (0.524)	Data Time 0.001 (0.025)	Loss 2.3573 (2.4136)	Entropy 0.57005 (0.57176)	Top-1 acc 66.797 (65.895)	Top-5 acc 84.766 (85.266)	lr 0.00332
Train [92][1620/3239]	Time 0.262 (0.524)	Data Time 0.001 (0.025)	Loss 2.6375 (2.4135)	Entropy 0.56979 (0.57175)	Top-1 acc 56.641 (65.887)	Top-5 acc 83.203 (85.270)	lr 0.00332
Train [92][1630/3239]	Time 0.239 (0.523)	Data Time 0.001 (0.025)	Loss 2.4431 (2.4137)	Entropy 0.56948 (0.57173)	Top-1 acc 65.234 (65.881)	Top-5 acc 85.547 (85.265)	lr 0.00332
Train [92][1640/3239]	Time 0.240 (0.522)	Data Time 0.001 (0.025)	Loss 2.4884 (2.4137)	Entropy 0.56913 (0.57172)	Top-1 acc 64.844 (65.880)	Top-5 acc 83.594 (85.265)	lr 0.00332
Train [92][1650/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.025)	Loss 2.4151 (2.4135)	Entropy 0.56902 (0.57170)	Top-1 acc 66.797 (65.881)	Top-5 acc 85.938 (85.274)	lr 0.00332
Train [92][1660/3239]	Time 0.256 (0.521)	Data Time 0.001 (0.025)	Loss 2.2610 (2.4134)	Entropy 0.56897 (0.57169)	Top-1 acc 67.969 (65.886)	Top-5 acc 89.062 (85.271)	lr 0.00332
Train [92][1670/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.025)	Loss 2.4400 (2.4131)	Entropy 0.56912 (0.57167)	Top-1 acc 63.281 (65.891)	Top-5 acc 85.547 (85.277)	lr 0.00332
Train [92][1680/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.024)	Loss 2.5380 (2.4132)	Entropy 0.56902 (0.57166)	Top-1 acc 63.672 (65.891)	Top-5 acc 83.203 (85.275)	lr 0.00332
Train [92][1690/3239]	Time 0.407 (0.519)	Data Time 0.001 (0.024)	Loss 2.5608 (2.4134)	Entropy 0.56881 (0.57164)	Top-1 acc 60.547 (65.888)	Top-5 acc 82.422 (85.268)	lr 0.00332
Train [92][1700/3239]	Time 0.231 (0.519)	Data Time 0.001 (0.024)	Loss 2.4521 (2.4133)	Entropy 0.56877 (0.57162)	Top-1 acc 64.453 (65.893)	Top-5 acc 84.375 (85.267)	lr 0.00332
Train [92][1710/3239]	Time 0.239 (0.518)	Data Time 0.001 (0.024)	Loss 2.6556 (2.4132)	Entropy 0.56835 (0.57160)	Top-1 acc 59.766 (65.903)	Top-5 acc 81.641 (85.266)	lr 0.00331
Train [92][1720/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.024)	Loss 2.4182 (2.4130)	Entropy 0.56824 (0.57159)	Top-1 acc 60.547 (65.897)	Top-5 acc 87.891 (85.270)	lr 0.00331
Train [92][1730/3239]	Time 0.280 (0.517)	Data Time 0.002 (0.024)	Loss 2.2692 (2.4129)	Entropy 0.56756 (0.57156)	Top-1 acc 71.484 (65.900)	Top-5 acc 86.719 (85.268)	lr 0.00331
Train [92][1740/3239]	Time 0.258 (0.517)	Data Time 0.001 (0.024)	Loss 2.3968 (2.4126)	Entropy 0.56772 (0.57154)	Top-1 acc 64.453 (65.901)	Top-5 acc 87.500 (85.274)	lr 0.00331
Train [92][1750/3239]	Time 0.231 (0.517)	Data Time 0.001 (0.023)	Loss 2.3534 (2.4130)	Entropy 0.56748 (0.57152)	Top-1 acc 67.969 (65.894)	Top-5 acc 85.938 (85.269)	lr 0.00331
Train [92][1760/3239]	Time 0.319 (0.516)	Data Time 0.001 (0.023)	Loss 2.5198 (2.4130)	Entropy 0.56760 (0.57150)	Top-1 acc 62.500 (65.893)	Top-5 acc 83.203 (85.267)	lr 0.00331
Train [92][1770/3239]	Time 0.228 (0.515)	Data Time 0.001 (0.023)	Loss 2.3189 (2.4130)	Entropy 0.56744 (0.57148)	Top-1 acc 69.141 (65.893)	Top-5 acc 85.156 (85.263)	lr 0.00331
Train [92][1780/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.023)	Loss 2.6302 (2.4129)	Entropy 0.56744 (0.57145)	Top-1 acc 56.641 (65.893)	Top-5 acc 82.812 (85.265)	lr 0.00331
Train [92][1790/3239]	Time 0.233 (0.514)	Data Time 0.001 (0.023)	Loss 2.4193 (2.4129)	Entropy 0.56737 (0.57143)	Top-1 acc 66.797 (65.897)	Top-5 acc 83.203 (85.260)	lr 0.00331
Train [92][1800/3239]	Time 0.235 (0.514)	Data Time 0.001 (0.023)	Loss 2.3453 (2.4127)	Entropy 0.56735 (0.57141)	Top-1 acc 67.578 (65.896)	Top-5 acc 86.328 (85.265)	lr 0.00331
Train [92][1810/3239]	Time 0.229 (0.513)	Data Time 0.001 (0.023)	Loss 2.5701 (2.4127)	Entropy 0.56717 (0.57139)	Top-1 acc 61.719 (65.898)	Top-5 acc 82.812 (85.267)	lr 0.00331
Train [92][1820/3239]	Time 0.251 (0.513)	Data Time 0.001 (0.023)	Loss 2.3298 (2.4132)	Entropy 0.56711 (0.57136)	Top-1 acc 67.969 (65.887)	Top-5 acc 84.766 (85.254)	lr 0.00331
Train [92][1830/3239]	Time 0.229 (0.512)	Data Time 0.001 (0.023)	Loss 2.6357 (2.4132)	Entropy 0.56751 (0.57134)	Top-1 acc 61.719 (65.886)	Top-5 acc 80.469 (85.258)	lr 0.00331
Train [92][1840/3239]	Time 0.234 (0.512)	Data Time 0.001 (0.022)	Loss 2.5770 (2.4135)	Entropy 0.56762 (0.57132)	Top-1 acc 62.500 (65.869)	Top-5 acc 85.156 (85.253)	lr 0.00331
Train [92][1850/3239]	Time 0.472 (0.539)	Data Time 0.003 (0.022)	Loss 2.3671 (2.4137)	Entropy 0.56781 (0.57130)	Top-1 acc 66.406 (65.865)	Top-5 acc 86.719 (85.250)	lr 0.00331
Train [92][1860/3239]	Time 0.284 (0.539)	Data Time 0.002 (0.022)	Loss 2.3760 (2.4138)	Entropy 0.56789 (0.57128)	Top-1 acc 67.578 (65.863)	Top-5 acc 85.156 (85.248)	lr 0.00330
Train [92][1870/3239]	Time 0.291 (0.539)	Data Time 0.002 (0.022)	Loss 2.5163 (2.4139)	Entropy 0.56753 (0.57126)	Top-1 acc 62.891 (65.866)	Top-5 acc 83.594 (85.245)	lr 0.00330
Train [92][1880/3239]	Time 0.279 (0.539)	Data Time 0.002 (0.022)	Loss 2.4829 (2.4137)	Entropy 0.56739 (0.57124)	Top-1 acc 62.109 (65.871)	Top-5 acc 83.594 (85.246)	lr 0.00330
Train [92][1890/3239]	Time 0.224 (0.538)	Data Time 0.001 (0.022)	Loss 2.7423 (2.4140)	Entropy 0.56737 (0.57122)	Top-1 acc 58.984 (65.858)	Top-5 acc 77.734 (85.239)	lr 0.00330
Train [92][1900/3239]	Time 0.279 (0.538)	Data Time 0.002 (0.022)	Loss 2.3599 (2.4141)	Entropy 0.56737 (0.57120)	Top-1 acc 66.016 (65.855)	Top-5 acc 86.719 (85.237)	lr 0.00330
Train [92][1910/3239]	Time 0.238 (0.537)	Data Time 0.001 (0.022)	Loss 2.3695 (2.4140)	Entropy 0.56754 (0.57118)	Top-1 acc 64.453 (65.861)	Top-5 acc 84.375 (85.236)	lr 0.00330
Train [92][1920/3239]	Time 0.358 (0.537)	Data Time 0.002 (0.022)	Loss 2.4913 (2.4143)	Entropy 0.56750 (0.57116)	Top-1 acc 63.281 (65.851)	Top-5 acc 83.203 (85.230)	lr 0.00330
Train [92][1930/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.022)	Loss 2.5431 (2.4143)	Entropy 0.56735 (0.57114)	Top-1 acc 62.891 (65.854)	Top-5 acc 83.203 (85.227)	lr 0.00330
Train [92][1940/3239]	Time 0.250 (0.536)	Data Time 0.002 (0.021)	Loss 2.3443 (2.4147)	Entropy 0.56754 (0.57112)	Top-1 acc 68.750 (65.847)	Top-5 acc 85.156 (85.221)	lr 0.00330
Train [92][1950/3239]	Time 0.271 (0.535)	Data Time 0.002 (0.021)	Loss 2.2767 (2.4147)	Entropy 0.56765 (0.57111)	Top-1 acc 71.484 (65.847)	Top-5 acc 87.500 (85.222)	lr 0.00330
Train [92][1960/3239]	Time 0.239 (0.535)	Data Time 0.001 (0.021)	Loss 2.5754 (2.4147)	Entropy 0.56777 (0.57109)	Top-1 acc 59.766 (65.843)	Top-5 acc 80.859 (85.224)	lr 0.00330
Train [92][1970/3239]	Time 0.231 (0.534)	Data Time 0.002 (0.021)	Loss 2.3889 (2.4148)	Entropy 0.56787 (0.57107)	Top-1 acc 65.625 (65.837)	Top-5 acc 86.328 (85.218)	lr 0.00330
Train [92][1980/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.021)	Loss 2.5118 (2.4147)	Entropy 0.56765 (0.57105)	Top-1 acc 64.453 (65.840)	Top-5 acc 83.594 (85.219)	lr 0.00330
Train [92][1990/3239]	Time 0.247 (0.533)	Data Time 0.001 (0.021)	Loss 2.3726 (2.4145)	Entropy 0.56749 (0.57104)	Top-1 acc 65.625 (65.848)	Top-5 acc 86.328 (85.224)	lr 0.00330
Train [92][2000/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.021)	Loss 2.4347 (2.4149)	Entropy 0.56712 (0.57102)	Top-1 acc 64.844 (65.833)	Top-5 acc 85.938 (85.215)	lr 0.00329
Train [92][2010/3239]	Time 0.366 (0.532)	Data Time 0.001 (0.021)	Loss 2.2100 (2.4148)	Entropy 0.56706 (0.57100)	Top-1 acc 70.312 (65.831)	Top-5 acc 83.984 (85.214)	lr 0.00329
Train [92][2020/3239]	Time 0.252 (0.532)	Data Time 0.001 (0.021)	Loss 2.5245 (2.4150)	Entropy 0.56694 (0.57098)	Top-1 acc 61.328 (65.823)	Top-5 acc 85.938 (85.214)	lr 0.00329
Train [92][2030/3239]	Time 0.284 (0.531)	Data Time 0.002 (0.021)	Loss 2.5677 (2.4154)	Entropy 0.56673 (0.57096)	Top-1 acc 60.547 (65.810)	Top-5 acc 84.766 (85.210)	lr 0.00329
Train [92][2040/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.020)	Loss 2.3495 (2.4150)	Entropy 0.56721 (0.57094)	Top-1 acc 70.312 (65.821)	Top-5 acc 87.109 (85.214)	lr 0.00329
Train [92][2050/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.020)	Loss 2.4679 (2.4152)	Entropy 0.56739 (0.57092)	Top-1 acc 64.453 (65.818)	Top-5 acc 83.203 (85.209)	lr 0.00329
Train [92][2060/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.020)	Loss 2.4698 (2.4154)	Entropy 0.56699 (0.57090)	Top-1 acc 65.625 (65.806)	Top-5 acc 83.594 (85.208)	lr 0.00329
Train [92][2070/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.020)	Loss 2.2374 (2.4156)	Entropy 0.56691 (0.57088)	Top-1 acc 67.578 (65.797)	Top-5 acc 88.672 (85.205)	lr 0.00329
Train [92][2080/3239]	Time 0.369 (0.529)	Data Time 0.002 (0.020)	Loss 2.4205 (2.4156)	Entropy 0.56676 (0.57086)	Top-1 acc 66.016 (65.796)	Top-5 acc 86.328 (85.205)	lr 0.00329
Train [92][2090/3239]	Time 0.228 (0.529)	Data Time 0.001 (0.020)	Loss 2.3546 (2.4154)	Entropy 0.56686 (0.57085)	Top-1 acc 69.531 (65.803)	Top-5 acc 86.328 (85.211)	lr 0.00329
Train [92][2100/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.020)	Loss 2.4195 (2.4154)	Entropy 0.56680 (0.57083)	Top-1 acc 65.625 (65.802)	Top-5 acc 82.812 (85.206)	lr 0.00329
Train [92][2110/3239]	Time 0.277 (0.528)	Data Time 0.001 (0.020)	Loss 2.4663 (2.4155)	Entropy 0.56734 (0.57081)	Top-1 acc 66.406 (65.802)	Top-5 acc 84.766 (85.204)	lr 0.00329
Train [92][2120/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.020)	Loss 2.2066 (2.4152)	Entropy 0.56725 (0.57079)	Top-1 acc 67.969 (65.807)	Top-5 acc 92.188 (85.213)	lr 0.00329
Train [92][2130/3239]	Time 0.240 (0.527)	Data Time 0.001 (0.020)	Loss 2.3802 (2.4154)	Entropy 0.56742 (0.57077)	Top-1 acc 65.625 (65.802)	Top-5 acc 85.938 (85.211)	lr 0.00329
Train [92][2140/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.020)	Loss 2.6702 (2.4155)	Entropy 0.56768 (0.57076)	Top-1 acc 60.547 (65.799)	Top-5 acc 80.859 (85.207)	lr 0.00329
Train [92][2150/3239]	Time 0.237 (0.526)	Data Time 0.001 (0.019)	Loss 2.3960 (2.4155)	Entropy 0.56762 (0.57075)	Top-1 acc 67.578 (65.804)	Top-5 acc 85.156 (85.210)	lr 0.00328
Train [92][2160/3239]	Time 0.232 (0.525)	Data Time 0.001 (0.019)	Loss 2.6049 (2.4157)	Entropy 0.56777 (0.57073)	Top-1 acc 61.719 (65.806)	Top-5 acc 82.812 (85.203)	lr 0.00328
Train [92][2170/3239]	Time 0.289 (0.525)	Data Time 0.002 (0.019)	Loss 2.5848 (2.4158)	Entropy 0.56818 (0.57072)	Top-1 acc 62.891 (65.805)	Top-5 acc 82.031 (85.200)	lr 0.00328
Train [92][2180/3239]	Time 0.225 (0.524)	Data Time 0.001 (0.019)	Loss 2.5969 (2.4164)	Entropy 0.56835 (0.57071)	Top-1 acc 57.422 (65.795)	Top-5 acc 84.375 (85.189)	lr 0.00328
Train [92][2190/3239]	Time 0.231 (0.524)	Data Time 0.001 (0.019)	Loss 2.6233 (2.4163)	Entropy 0.56814 (0.57069)	Top-1 acc 62.109 (65.801)	Top-5 acc 81.250 (85.189)	lr 0.00328
Train [92][2200/3239]	Time 0.237 (0.523)	Data Time 0.001 (0.019)	Loss 2.4980 (2.4162)	Entropy 0.56864 (0.57068)	Top-1 acc 64.453 (65.807)	Top-5 acc 84.766 (85.192)	lr 0.00328
Train [92][2210/3239]	Time 0.232 (0.523)	Data Time 0.001 (0.019)	Loss 2.5944 (2.4163)	Entropy 0.56848 (0.57067)	Top-1 acc 57.422 (65.804)	Top-5 acc 84.766 (85.191)	lr 0.00328
Train [92][2220/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.019)	Loss 2.4227 (2.4162)	Entropy 0.56846 (0.57066)	Top-1 acc 67.969 (65.803)	Top-5 acc 83.203 (85.191)	lr 0.00328
Train [92][2230/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.019)	Loss 2.4156 (2.4162)	Entropy 0.56875 (0.57065)	Top-1 acc 66.797 (65.804)	Top-5 acc 85.156 (85.193)	lr 0.00328
Train [92][2240/3239]	Time 0.349 (0.521)	Data Time 0.001 (0.019)	Loss 2.4009 (2.4160)	Entropy 0.56885 (0.57065)	Top-1 acc 65.234 (65.807)	Top-5 acc 83.984 (85.195)	lr 0.00328
Train [92][2250/3239]	Time 0.235 (0.521)	Data Time 0.001 (0.019)	Loss 2.2043 (2.4158)	Entropy 0.56897 (0.57064)	Top-1 acc 69.531 (65.813)	Top-5 acc 91.797 (85.199)	lr 0.00328
Train [92][2260/3239]	Time 0.224 (0.520)	Data Time 0.001 (0.019)	Loss 2.3340 (2.4158)	Entropy 0.56896 (0.57063)	Top-1 acc 66.406 (65.816)	Top-5 acc 88.672 (85.199)	lr 0.00328
Train [92][2270/3239]	Time 0.236 (0.520)	Data Time 0.001 (0.019)	Loss 2.5740 (2.4161)	Entropy 0.56905 (0.57062)	Top-1 acc 61.719 (65.810)	Top-5 acc 82.812 (85.193)	lr 0.00328
Train [92][2280/3239]	Time 0.231 (0.520)	Data Time 0.001 (0.018)	Loss 2.4298 (2.4158)	Entropy 0.56916 (0.57062)	Top-1 acc 63.281 (65.815)	Top-5 acc 84.766 (85.197)	lr 0.00328
Train [92][2290/3239]	Time 0.241 (0.519)	Data Time 0.002 (0.018)	Loss 2.3356 (2.4156)	Entropy 0.56905 (0.57061)	Top-1 acc 66.016 (65.825)	Top-5 acc 86.328 (85.202)	lr 0.00328
Train [92][2300/3239]	Time 0.241 (0.519)	Data Time 0.001 (0.018)	Loss 2.4158 (2.4157)	Entropy 0.56889 (0.57060)	Top-1 acc 66.406 (65.824)	Top-5 acc 83.984 (85.200)	lr 0.00327
Train [92][2310/3239]	Time 0.336 (0.518)	Data Time 0.001 (0.018)	Loss 2.5265 (2.4154)	Entropy 0.56866 (0.57060)	Top-1 acc 63.281 (65.831)	Top-5 acc 83.594 (85.206)	lr 0.00327
Train [92][2320/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.018)	Loss 2.4944 (2.4152)	Entropy 0.56856 (0.57059)	Top-1 acc 59.375 (65.837)	Top-5 acc 85.938 (85.205)	lr 0.00327
Train [92][2330/3239]	Time 0.245 (0.517)	Data Time 0.001 (0.018)	Loss 2.4093 (2.4152)	Entropy 0.56825 (0.57058)	Top-1 acc 64.844 (65.836)	Top-5 acc 85.156 (85.203)	lr 0.00327
Train [92][2340/3239]	Time 0.291 (0.518)	Data Time 0.002 (0.018)	Loss 2.4631 (2.4152)	Entropy 0.56848 (0.57057)	Top-1 acc 65.234 (65.838)	Top-5 acc 82.422 (85.200)	lr 0.00327
Train [92][2350/3239]	Time 0.244 (0.517)	Data Time 0.001 (0.018)	Loss 2.4708 (2.4152)	Entropy 0.56816 (0.57056)	Top-1 acc 66.406 (65.836)	Top-5 acc 85.156 (85.202)	lr 0.00327
Train [92][2360/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.018)	Loss 2.4488 (2.4152)	Entropy 0.56804 (0.57055)	Top-1 acc 64.453 (65.833)	Top-5 acc 84.766 (85.202)	lr 0.00327
Train [92][2370/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.018)	Loss 2.3600 (2.4155)	Entropy 0.56785 (0.57054)	Top-1 acc 68.359 (65.830)	Top-5 acc 86.719 (85.196)	lr 0.00327
Train [92][2380/3239]	Time 0.237 (0.516)	Data Time 0.001 (0.018)	Loss 2.4655 (2.4155)	Entropy 0.56794 (0.57053)	Top-1 acc 63.281 (65.833)	Top-5 acc 84.766 (85.195)	lr 0.00327
Train [92][2390/3239]	Time 0.237 (0.516)	Data Time 0.001 (0.018)	Loss 2.3041 (2.4152)	Entropy 0.56797 (0.57052)	Top-1 acc 67.578 (65.835)	Top-5 acc 85.547 (85.199)	lr 0.00327
Train [92][2400/3239]	Time 0.345 (0.515)	Data Time 0.001 (0.018)	Loss 2.2760 (2.4149)	Entropy 0.56805 (0.57051)	Top-1 acc 68.359 (65.842)	Top-5 acc 87.891 (85.204)	lr 0.00327
Train [92][2410/3239]	Time 0.236 (0.515)	Data Time 0.001 (0.018)	Loss 2.4707 (2.4149)	Entropy 0.56789 (0.57050)	Top-1 acc 66.016 (65.840)	Top-5 acc 82.422 (85.202)	lr 0.00327
Train [92][2420/3239]	Time 0.237 (0.515)	Data Time 0.001 (0.018)	Loss 2.3937 (2.4148)	Entropy 0.56800 (0.57048)	Top-1 acc 66.406 (65.845)	Top-5 acc 84.766 (85.202)	lr 0.00327
Train [92][2430/3239]	Time 0.231 (0.514)	Data Time 0.003 (0.017)	Loss 2.3960 (2.4146)	Entropy 0.56808 (0.57047)	Top-1 acc 69.531 (65.849)	Top-5 acc 87.109 (85.207)	lr 0.00327
Train [92][2440/3239]	Time 0.254 (0.514)	Data Time 0.001 (0.017)	Loss 2.2845 (2.4145)	Entropy 0.56840 (0.57047)	Top-1 acc 67.969 (65.850)	Top-5 acc 86.328 (85.207)	lr 0.00326
Train [92][2450/3239]	Time 0.234 (0.513)	Data Time 0.001 (0.017)	Loss 2.4489 (2.4146)	Entropy 0.56862 (0.57046)	Top-1 acc 63.281 (65.851)	Top-5 acc 83.203 (85.201)	lr 0.00326
Train [92][2460/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.017)	Loss 2.2995 (2.4142)	Entropy 0.56885 (0.57045)	Top-1 acc 68.750 (65.863)	Top-5 acc 87.891 (85.204)	lr 0.00326
Train [92][2470/3239]	Time 0.336 (0.513)	Data Time 0.001 (0.017)	Loss 2.5648 (2.4141)	Entropy 0.56895 (0.57044)	Top-1 acc 61.328 (65.865)	Top-5 acc 82.031 (85.206)	lr 0.00326
Train [92][2480/3239]	Time 0.237 (0.512)	Data Time 0.002 (0.017)	Loss 2.4927 (2.4140)	Entropy 0.56916 (0.57044)	Top-1 acc 67.188 (65.871)	Top-5 acc 82.031 (85.205)	lr 0.00326
Train [92][2490/3239]	Time 0.225 (0.512)	Data Time 0.001 (0.017)	Loss 2.4729 (2.4142)	Entropy 0.56887 (0.57043)	Top-1 acc 62.500 (65.866)	Top-5 acc 85.547 (85.203)	lr 0.00326
Train [92][2500/3239]	Time 0.341 (0.532)	Data Time 0.004 (0.017)	Loss 2.3274 (2.4143)	Entropy 0.56873 (0.57043)	Top-1 acc 65.625 (65.862)	Top-5 acc 88.672 (85.201)	lr 0.00326
Train [92][2510/3239]	Time 0.240 (0.532)	Data Time 0.002 (0.017)	Loss 2.5453 (2.4143)	Entropy 0.56867 (0.57042)	Top-1 acc 62.500 (65.863)	Top-5 acc 83.984 (85.205)	lr 0.00326
Train [92][2520/3239]	Time 0.241 (0.532)	Data Time 0.001 (0.017)	Loss 2.4976 (2.4141)	Entropy 0.56871 (0.57041)	Top-1 acc 63.281 (65.867)	Top-5 acc 83.594 (85.206)	lr 0.00326
Train [92][2530/3239]	Time 0.294 (0.531)	Data Time 0.002 (0.017)	Loss 2.1247 (2.4140)	Entropy 0.56846 (0.57040)	Top-1 acc 73.828 (65.873)	Top-5 acc 90.234 (85.206)	lr 0.00326
Train [92][2540/3239]	Time 0.221 (0.531)	Data Time 0.001 (0.017)	Loss 2.8600 (2.4143)	Entropy 0.56869 (0.57040)	Top-1 acc 56.250 (65.868)	Top-5 acc 76.562 (85.200)	lr 0.00326
Train [92][2550/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.017)	Loss 2.4452 (2.4144)	Entropy 0.56865 (0.57039)	Top-1 acc 64.844 (65.865)	Top-5 acc 82.812 (85.194)	lr 0.00326
Train [92][2560/3239]	Time 0.333 (0.531)	Data Time 0.001 (0.017)	Loss 2.3834 (2.4148)	Entropy 0.56880 (0.57038)	Top-1 acc 66.406 (65.856)	Top-5 acc 85.547 (85.188)	lr 0.00326
Train [92][2570/3239]	Time 0.260 (0.530)	Data Time 0.001 (0.017)	Loss 2.4877 (2.4150)	Entropy 0.56818 (0.57038)	Top-1 acc 65.234 (65.852)	Top-5 acc 83.984 (85.185)	lr 0.00326
Train [92][2580/3239]	Time 0.273 (0.530)	Data Time 0.001 (0.017)	Loss 2.2963 (2.4152)	Entropy 0.56753 (0.57037)	Top-1 acc 67.188 (65.844)	Top-5 acc 87.109 (85.182)	lr 0.00326
Train [92][2590/3239]	Time 0.241 (0.529)	Data Time 0.001 (0.017)	Loss 2.4591 (2.4150)	Entropy 0.56755 (0.57036)	Top-1 acc 63.672 (65.850)	Top-5 acc 85.156 (85.182)	lr 0.00325
Train [92][2600/3239]	Time 0.251 (0.529)	Data Time 0.002 (0.016)	Loss 2.3039 (2.4147)	Entropy 0.56721 (0.57035)	Top-1 acc 67.969 (65.854)	Top-5 acc 87.500 (85.186)	lr 0.00325
Train [92][2610/3239]	Time 0.222 (0.529)	Data Time 0.001 (0.016)	Loss 2.7259 (2.4147)	Entropy 0.56730 (0.57033)	Top-1 acc 57.031 (65.854)	Top-5 acc 78.906 (85.184)	lr 0.00325
Train [92][2620/3239]	Time 0.227 (0.528)	Data Time 0.001 (0.016)	Loss 2.3792 (2.4146)	Entropy 0.56730 (0.57032)	Top-1 acc 69.531 (65.858)	Top-5 acc 87.500 (85.187)	lr 0.00325
Train [92][2630/3239]	Time 0.336 (0.528)	Data Time 0.001 (0.016)	Loss 2.2403 (2.4149)	Entropy 0.56701 (0.57031)	Top-1 acc 66.797 (65.852)	Top-5 acc 87.500 (85.180)	lr 0.00325
Train [92][2640/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.016)	Loss 2.5983 (2.4151)	Entropy 0.56705 (0.57030)	Top-1 acc 61.719 (65.850)	Top-5 acc 81.641 (85.178)	lr 0.00325
Train [92][2650/3239]	Time 0.245 (0.527)	Data Time 0.001 (0.016)	Loss 2.2167 (2.4151)	Entropy 0.56741 (0.57029)	Top-1 acc 69.531 (65.851)	Top-5 acc 88.672 (85.177)	lr 0.00325
Train [92][2660/3239]	Time 0.234 (0.527)	Data Time 0.002 (0.016)	Loss 2.5892 (2.4155)	Entropy 0.56775 (0.57028)	Top-1 acc 60.938 (65.840)	Top-5 acc 81.250 (85.172)	lr 0.00325
Train [92][2670/3239]	Time 0.258 (0.527)	Data Time 0.001 (0.016)	Loss 2.4835 (2.4154)	Entropy 0.56796 (0.57027)	Top-1 acc 67.969 (65.839)	Top-5 acc 83.203 (85.173)	lr 0.00325
Train [92][2680/3239]	Time 0.235 (0.526)	Data Time 0.001 (0.016)	Loss 2.6335 (2.4155)	Entropy 0.56805 (0.57026)	Top-1 acc 58.984 (65.838)	Top-5 acc 79.297 (85.168)	lr 0.00325
Train [92][2690/3239]	Time 0.238 (0.526)	Data Time 0.001 (0.016)	Loss 2.2093 (2.4153)	Entropy 0.56838 (0.57025)	Top-1 acc 70.312 (65.841)	Top-5 acc 89.062 (85.171)	lr 0.00325
Train [92][2700/3239]	Time 0.250 (0.526)	Data Time 0.001 (0.016)	Loss 2.3543 (2.4151)	Entropy 0.56838 (0.57024)	Top-1 acc 67.188 (65.844)	Top-5 acc 88.672 (85.173)	lr 0.00325
Train [92][2710/3239]	Time 0.245 (0.525)	Data Time 0.001 (0.016)	Loss 2.2308 (2.4151)	Entropy 0.56841 (0.57024)	Top-1 acc 70.703 (65.848)	Top-5 acc 90.625 (85.175)	lr 0.00325
Train [92][2720/3239]	Time 0.359 (0.525)	Data Time 0.001 (0.016)	Loss 2.4929 (2.4150)	Entropy 0.56841 (0.57023)	Top-1 acc 63.281 (65.850)	Top-5 acc 84.375 (85.178)	lr 0.00325
Train [92][2730/3239]	Time 0.285 (0.525)	Data Time 0.001 (0.016)	Loss 2.4489 (2.4150)	Entropy 0.56828 (0.57022)	Top-1 acc 66.406 (65.852)	Top-5 acc 85.547 (85.176)	lr 0.00325
Train [92][2740/3239]	Time 0.244 (0.524)	Data Time 0.001 (0.016)	Loss 2.1500 (2.4149)	Entropy 0.56858 (0.57022)	Top-1 acc 72.266 (65.853)	Top-5 acc 89.062 (85.176)	lr 0.00324
Train [92][2750/3239]	Time 0.264 (0.524)	Data Time 0.001 (0.016)	Loss 2.6549 (2.4149)	Entropy 0.56844 (0.57021)	Top-1 acc 61.719 (65.852)	Top-5 acc 80.859 (85.175)	lr 0.00324
Train [92][2760/3239]	Time 0.231 (0.524)	Data Time 0.001 (0.016)	Loss 2.1558 (2.4149)	Entropy 0.56849 (0.57021)	Top-1 acc 73.047 (65.851)	Top-5 acc 89.062 (85.173)	lr 0.00324
Train [92][2770/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.016)	Loss 2.2481 (2.4153)	Entropy 0.56845 (0.57020)	Top-1 acc 69.141 (65.839)	Top-5 acc 89.453 (85.165)	lr 0.00324
Train [92][2780/3239]	Time 0.228 (0.523)	Data Time 0.001 (0.016)	Loss 2.4048 (2.4154)	Entropy 0.56868 (0.57019)	Top-1 acc 67.969 (65.838)	Top-5 acc 85.547 (85.164)	lr 0.00324
Train [92][2790/3239]	Time 0.355 (0.523)	Data Time 0.001 (0.015)	Loss 2.4306 (2.4154)	Entropy 0.56880 (0.57019)	Top-1 acc 66.406 (65.837)	Top-5 acc 86.328 (85.164)	lr 0.00324
Train [92][2800/3239]	Time 0.257 (0.522)	Data Time 0.001 (0.015)	Loss 2.3937 (2.4156)	Entropy 0.56854 (0.57018)	Top-1 acc 68.750 (65.833)	Top-5 acc 86.719 (85.163)	lr 0.00324
Train [92][2810/3239]	Time 0.259 (0.522)	Data Time 0.001 (0.015)	Loss 2.3234 (2.4155)	Entropy 0.56835 (0.57018)	Top-1 acc 70.312 (65.837)	Top-5 acc 85.156 (85.165)	lr 0.00324
Train [92][2820/3239]	Time 0.244 (0.522)	Data Time 0.001 (0.015)	Loss 2.3657 (2.4155)	Entropy 0.56816 (0.57017)	Top-1 acc 68.359 (65.837)	Top-5 acc 84.766 (85.162)	lr 0.00324
Train [92][2830/3239]	Time 0.279 (0.522)	Data Time 0.001 (0.015)	Loss 2.4596 (2.4154)	Entropy 0.56821 (0.57016)	Top-1 acc 69.141 (65.837)	Top-5 acc 84.766 (85.166)	lr 0.00324
Train [92][2840/3239]	Time 0.231 (0.522)	Data Time 0.002 (0.015)	Loss 2.4507 (2.4151)	Entropy 0.56824 (0.57016)	Top-1 acc 64.844 (65.841)	Top-5 acc 85.156 (85.170)	lr 0.00324
Train [92][2850/3239]	Time 0.242 (0.522)	Data Time 0.002 (0.015)	Loss 2.5170 (2.4151)	Entropy 0.56797 (0.57015)	Top-1 acc 64.062 (65.843)	Top-5 acc 83.594 (85.169)	lr 0.00324
Train [92][2860/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.015)	Loss 2.1382 (2.4151)	Entropy 0.56838 (0.57014)	Top-1 acc 69.922 (65.839)	Top-5 acc 89.844 (85.170)	lr 0.00324
Train [92][2870/3239]	Time 0.224 (0.521)	Data Time 0.001 (0.015)	Loss 2.3759 (2.4151)	Entropy 0.56838 (0.57014)	Top-1 acc 64.844 (65.838)	Top-5 acc 87.500 (85.172)	lr 0.00324
Train [92][2880/3239]	Time 0.236 (0.521)	Data Time 0.001 (0.015)	Loss 2.3664 (2.4152)	Entropy 0.56841 (0.57013)	Top-1 acc 65.234 (65.835)	Top-5 acc 85.547 (85.171)	lr 0.00324
Train [92][2890/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.015)	Loss 2.4262 (2.4154)	Entropy 0.56846 (0.57012)	Top-1 acc 66.406 (65.833)	Top-5 acc 83.203 (85.168)	lr 0.00323
Train [92][2900/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.015)	Loss 2.3612 (2.4153)	Entropy 0.56858 (0.57012)	Top-1 acc 68.359 (65.837)	Top-5 acc 85.938 (85.172)	lr 0.00323
Train [92][2910/3239]	Time 0.244 (0.520)	Data Time 0.001 (0.015)	Loss 2.4616 (2.4152)	Entropy 0.56838 (0.57011)	Top-1 acc 63.281 (65.839)	Top-5 acc 83.203 (85.173)	lr 0.00323
Train [92][2920/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.015)	Loss 2.4167 (2.4152)	Entropy 0.56853 (0.57011)	Top-1 acc 67.188 (65.839)	Top-5 acc 82.812 (85.173)	lr 0.00323
Train [92][2930/3239]	Time 0.237 (0.519)	Data Time 0.001 (0.015)	Loss 2.4395 (2.4149)	Entropy 0.56837 (0.57010)	Top-1 acc 65.625 (65.843)	Top-5 acc 84.766 (85.178)	lr 0.00323
Train [92][2940/3239]	Time 0.246 (0.519)	Data Time 0.001 (0.015)	Loss 2.5271 (2.4150)	Entropy 0.56847 (0.57010)	Top-1 acc 65.625 (65.842)	Top-5 acc 82.031 (85.177)	lr 0.00323
Train [92][2950/3239]	Time 0.332 (0.518)	Data Time 0.001 (0.015)	Loss 2.4206 (2.4150)	Entropy 0.56858 (0.57009)	Top-1 acc 64.844 (65.843)	Top-5 acc 87.500 (85.178)	lr 0.00323
Train [92][2960/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.015)	Loss 2.3944 (2.4151)	Entropy 0.56862 (0.57009)	Top-1 acc 60.938 (65.839)	Top-5 acc 85.156 (85.176)	lr 0.00323
Train [92][2970/3239]	Time 0.230 (0.518)	Data Time 0.002 (0.015)	Loss 2.4436 (2.4150)	Entropy 0.56849 (0.57008)	Top-1 acc 64.062 (65.841)	Top-5 acc 84.375 (85.177)	lr 0.00323
Train [92][2980/3239]	Time 0.232 (0.517)	Data Time 0.001 (0.015)	Loss 2.5817 (2.4149)	Entropy 0.56910 (0.57008)	Top-1 acc 62.109 (65.846)	Top-5 acc 83.984 (85.180)	lr 0.00323
Train [92][2990/3239]	Time 0.221 (0.517)	Data Time 0.001 (0.015)	Loss 2.7912 (2.4151)	Entropy 0.56875 (0.57007)	Top-1 acc 55.859 (65.842)	Top-5 acc 79.297 (85.175)	lr 0.00323
Train [92][3000/3239]	Time 0.239 (0.517)	Data Time 0.001 (0.015)	Loss 2.2518 (2.4150)	Entropy 0.56888 (0.57007)	Top-1 acc 71.094 (65.846)	Top-5 acc 89.844 (85.176)	lr 0.00323
Train [92][3010/3239]	Time 0.228 (0.516)	Data Time 0.001 (0.014)	Loss 2.7708 (2.4154)	Entropy 0.56865 (0.57006)	Top-1 acc 59.375 (65.836)	Top-5 acc 76.562 (85.169)	lr 0.00323
Train [92][3020/3239]	Time 0.365 (0.516)	Data Time 0.001 (0.014)	Loss 2.4321 (2.4156)	Entropy 0.56845 (0.57006)	Top-1 acc 64.844 (65.830)	Top-5 acc 85.156 (85.163)	lr 0.00323
Train [92][3030/3239]	Time 0.233 (0.516)	Data Time 0.001 (0.014)	Loss 2.7537 (2.4159)	Entropy 0.56818 (0.57005)	Top-1 acc 60.547 (65.826)	Top-5 acc 78.906 (85.160)	lr 0.00322
Train [92][3040/3239]	Time 0.240 (0.516)	Data Time 0.001 (0.014)	Loss 2.4475 (2.4160)	Entropy 0.56832 (0.57005)	Top-1 acc 62.109 (65.824)	Top-5 acc 83.984 (85.160)	lr 0.00322
Train [92][3050/3239]	Time 0.227 (0.515)	Data Time 0.001 (0.014)	Loss 2.4312 (2.4162)	Entropy 0.56856 (0.57004)	Top-1 acc 63.672 (65.817)	Top-5 acc 87.109 (85.157)	lr 0.00322
Train [92][3060/3239]	Time 0.231 (0.515)	Data Time 0.001 (0.014)	Loss 2.4782 (2.4164)	Entropy 0.56866 (0.57004)	Top-1 acc 62.891 (65.811)	Top-5 acc 85.547 (85.153)	lr 0.00322
Train [92][3070/3239]	Time 0.244 (0.515)	Data Time 0.001 (0.014)	Loss 2.4963 (2.4165)	Entropy 0.56855 (0.57003)	Top-1 acc 61.719 (65.805)	Top-5 acc 83.594 (85.151)	lr 0.00322
Train [92][3080/3239]	Time 0.232 (0.514)	Data Time 0.001 (0.014)	Loss 2.3591 (2.4166)	Entropy 0.56877 (0.57003)	Top-1 acc 64.844 (65.804)	Top-5 acc 85.547 (85.152)	lr 0.00322
Train [92][3090/3239]	Time 0.243 (0.514)	Data Time 0.001 (0.014)	Loss 2.5111 (2.4166)	Entropy 0.56866 (0.57002)	Top-1 acc 63.672 (65.802)	Top-5 acc 81.641 (85.149)	lr 0.00322
Train [92][3100/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.014)	Loss 2.7181 (2.4169)	Entropy 0.56873 (0.57002)	Top-1 acc 59.766 (65.794)	Top-5 acc 81.641 (85.146)	lr 0.00322
Train [92][3110/3239]	Time 0.349 (0.514)	Data Time 0.002 (0.014)	Loss 2.6036 (2.4170)	Entropy 0.56886 (0.57001)	Top-1 acc 62.891 (65.794)	Top-5 acc 83.984 (85.146)	lr 0.00322
Train [92][3120/3239]	Time 0.283 (0.513)	Data Time 0.001 (0.014)	Loss 2.4003 (2.4169)	Entropy 0.56870 (0.57001)	Top-1 acc 65.625 (65.796)	Top-5 acc 84.766 (85.146)	lr 0.00322
Train [92][3130/3239]	Time 0.243 (0.513)	Data Time 0.001 (0.014)	Loss 2.3710 (2.4167)	Entropy 0.56851 (0.57001)	Top-1 acc 64.062 (65.801)	Top-5 acc 85.547 (85.146)	lr 0.00322
Train [92][3140/3239]	Time 0.292 (0.513)	Data Time 0.001 (0.014)	Loss 2.4941 (2.4169)	Entropy 0.56858 (0.57000)	Top-1 acc 66.797 (65.797)	Top-5 acc 83.203 (85.142)	lr 0.00322
Train [92][3150/3239]	Time 0.241 (0.513)	Data Time 0.002 (0.014)	Loss 2.6233 (2.4169)	Entropy 0.56867 (0.57000)	Top-1 acc 57.812 (65.798)	Top-5 acc 81.641 (85.140)	lr 0.00322
Train [92][3160/3239]	Time 0.401 (0.529)	Data Time 0.025 (0.014)	Loss 2.5177 (2.4170)	Entropy 0.56877 (0.56999)	Top-1 acc 65.625 (65.795)	Top-5 acc 82.031 (85.139)	lr 0.00322
Train [92][3170/3239]	Time 0.241 (0.529)	Data Time 0.002 (0.014)	Loss 2.4083 (2.4167)	Entropy 0.56893 (0.56999)	Top-1 acc 67.969 (65.803)	Top-5 acc 82.812 (85.141)	lr 0.00322
Train [92][3180/3239]	Time 0.331 (0.528)	Data Time 0.000 (0.014)	Loss 2.4314 (2.4169)	Entropy 0.56858 (0.56998)	Top-1 acc 64.453 (65.797)	Top-5 acc 84.766 (85.140)	lr 0.00321
Train [92][3190/3239]	Time 0.239 (0.528)	Data Time 0.000 (0.014)	Loss 2.2368 (2.4169)	Entropy 0.56866 (0.56998)	Top-1 acc 67.188 (65.790)	Top-5 acc 88.281 (85.138)	lr 0.00321
Train [92][3200/3239]	Time 0.235 (0.528)	Data Time 0.000 (0.014)	Loss 2.2694 (2.4170)	Entropy 0.56836 (0.56998)	Top-1 acc 70.312 (65.791)	Top-5 acc 86.328 (85.136)	lr 0.00321
Train [92][3210/3239]	Time 0.226 (0.527)	Data Time 0.000 (0.014)	Loss 2.3259 (2.4172)	Entropy 0.56884 (0.56997)	Top-1 acc 69.531 (65.783)	Top-5 acc 85.938 (85.133)	lr 0.00321
Train [92][3220/3239]	Time 0.241 (0.527)	Data Time 0.000 (0.014)	Loss 2.1716 (2.4169)	Entropy 0.56903 (0.56997)	Top-1 acc 69.922 (65.787)	Top-5 acc 89.844 (85.136)	lr 0.00321
Train [92][3230/3239]	Time 0.231 (0.526)	Data Time 0.000 (0.014)	Loss 2.3951 (2.4170)	Entropy 0.56893 (0.56997)	Top-1 acc 67.188 (65.786)	Top-5 acc 84.766 (85.135)	lr 0.00321
Train [92][3239/3239]	Time 1.024 (0.526)	Data Time 0.000 (0.014)	Loss 2.4077 (2.4171)	Entropy 0.56896 (0.56996)	Top-1 acc 67.901 (65.785)	Top-5 acc 85.185 (85.135)	lr 0.00321
==========Valid [92/120]	loss 1.228	top-1 acc 71.739 (71.739)	top-5 acc 89.899	Train top-1 65.785	top-5 85.135	Entropy 0.56896	Latency-None: 0.000ms	Flops: 539.00M
Train [93][0/3239]	Time 37.739 (37.739)	Data Time 36.130 (36.130)	Loss 2.4317 (2.4317)	Entropy 0.56906 (0.56906)	Top-1 acc 64.062 (64.062)	Top-5 acc 85.938 (85.938)	lr 0.00321
Train [93][10/3239]	Time 0.335 (4.012)	Data Time 0.001 (3.360)	Loss 2.2512 (2.4009)	Entropy 0.56912 (0.56909)	Top-1 acc 68.750 (65.874)	Top-5 acc 87.109 (86.044)	lr 0.00321
Train [93][20/3239]	Time 0.233 (2.299)	Data Time 0.001 (1.762)	Loss 2.3094 (2.3977)	Entropy 0.56902 (0.56910)	Top-1 acc 70.312 (66.536)	Top-5 acc 85.156 (85.305)	lr 0.00321
Train [93][30/3239]	Time 0.236 (1.697)	Data Time 0.001 (1.195)	Loss 2.4803 (2.3929)	Entropy 0.56906 (0.56907)	Top-1 acc 64.453 (66.784)	Top-5 acc 83.203 (85.383)	lr 0.00321
Train [93][40/3239]	Time 0.255 (1.390)	Data Time 0.001 (0.904)	Loss 2.3265 (2.4005)	Entropy 0.56922 (0.56910)	Top-1 acc 67.188 (66.378)	Top-5 acc 85.547 (85.480)	lr 0.00321
Train [93][50/3239]	Time 0.264 (1.200)	Data Time 0.001 (0.727)	Loss 2.4050 (2.4146)	Entropy 0.56928 (0.56912)	Top-1 acc 67.188 (65.939)	Top-5 acc 85.547 (85.156)	lr 0.00321
Train [93][60/3239]	Time 0.252 (1.073)	Data Time 0.001 (0.608)	Loss 2.3759 (2.4155)	Entropy 0.56898 (0.56913)	Top-1 acc 67.578 (65.856)	Top-5 acc 85.156 (84.996)	lr 0.00321
Train [93][70/3239]	Time 0.236 (0.979)	Data Time 0.001 (0.523)	Loss 2.3957 (2.4066)	Entropy 0.56892 (0.56909)	Top-1 acc 66.016 (66.159)	Top-5 acc 83.594 (85.140)	lr 0.00321
Train [93][80/3239]	Time 0.238 (0.919)	Data Time 0.001 (0.458)	Loss 2.4250 (2.4108)	Entropy 0.56894 (0.56908)	Top-1 acc 64.844 (66.112)	Top-5 acc 87.109 (85.151)	lr 0.00321
Train [93][90/3239]	Time 0.238 (0.864)	Data Time 0.001 (0.408)	Loss 2.6546 (2.4100)	Entropy 0.56924 (0.56908)	Top-1 acc 59.375 (66.162)	Top-5 acc 81.250 (85.165)	lr 0.00320
Train [93][100/3239]	Time 0.240 (0.820)	Data Time 0.001 (0.368)	Loss 2.4156 (2.4106)	Entropy 0.56934 (0.56910)	Top-1 acc 66.797 (66.221)	Top-5 acc 84.375 (85.222)	lr 0.00320
Train [93][110/3239]	Time 0.233 (0.784)	Data Time 0.001 (0.335)	Loss 2.4303 (2.4080)	Entropy 0.56948 (0.56912)	Top-1 acc 64.844 (66.287)	Top-5 acc 83.984 (85.255)	lr 0.00320
Train [93][120/3239]	Time 0.257 (0.754)	Data Time 0.003 (0.307)	Loss 2.5489 (2.4037)	Entropy 0.56950 (0.56915)	Top-1 acc 60.938 (66.296)	Top-5 acc 84.766 (85.347)	lr 0.00320
Train [93][130/3239]	Time 0.232 (0.729)	Data Time 0.001 (0.284)	Loss 2.4189 (2.4071)	Entropy 0.56971 (0.56918)	Top-1 acc 64.453 (66.201)	Top-5 acc 84.766 (85.305)	lr 0.00320
Train [93][140/3239]	Time 0.242 (0.707)	Data Time 0.002 (0.264)	Loss 2.3385 (2.4113)	Entropy 0.56969 (0.56921)	Top-1 acc 68.359 (66.135)	Top-5 acc 87.500 (85.209)	lr 0.00320
Train [93][150/3239]	Time 0.233 (0.688)	Data Time 0.001 (0.247)	Loss 2.2876 (2.4086)	Entropy 0.56993 (0.56925)	Top-1 acc 67.969 (66.230)	Top-5 acc 88.672 (85.231)	lr 0.00320
Train [93][160/3239]	Time 0.268 (0.673)	Data Time 0.001 (0.232)	Loss 2.3887 (2.4103)	Entropy 0.57003 (0.56929)	Top-1 acc 67.578 (66.224)	Top-5 acc 84.375 (85.132)	lr 0.00320
Train [93][170/3239]	Time 0.428 (0.661)	Data Time 0.001 (0.218)	Loss 2.3838 (2.4145)	Entropy 0.57015 (0.56934)	Top-1 acc 66.016 (66.128)	Top-5 acc 86.719 (85.088)	lr 0.00320
Train [93][180/3239]	Time 0.238 (0.647)	Data Time 0.001 (0.206)	Loss 2.3548 (2.4131)	Entropy 0.56990 (0.56938)	Top-1 acc 65.625 (66.173)	Top-5 acc 88.672 (85.128)	lr 0.00320
Train [93][190/3239]	Time 0.246 (0.636)	Data Time 0.001 (0.195)	Loss 2.4152 (2.4129)	Entropy 0.56986 (0.56940)	Top-1 acc 64.844 (66.138)	Top-5 acc 84.375 (85.128)	lr 0.00320
Train [93][200/3239]	Time 0.256 (0.628)	Data Time 0.001 (0.186)	Loss 2.3685 (2.4117)	Entropy 0.56952 (0.56943)	Top-1 acc 67.578 (66.171)	Top-5 acc 83.203 (85.119)	lr 0.00320
Train [93][210/3239]	Time 0.262 (0.620)	Data Time 0.001 (0.177)	Loss 2.4475 (2.4131)	Entropy 0.56946 (0.56943)	Top-1 acc 68.359 (66.191)	Top-5 acc 83.984 (85.101)	lr 0.00320
Train [93][220/3239]	Time 0.276 (0.611)	Data Time 0.001 (0.169)	Loss 2.3518 (2.4139)	Entropy 0.56960 (0.56943)	Top-1 acc 66.797 (66.093)	Top-5 acc 85.156 (85.135)	lr 0.00320
Train [93][230/3239]	Time 0.268 (0.603)	Data Time 0.001 (0.162)	Loss 2.2188 (2.4148)	Entropy 0.56970 (0.56944)	Top-1 acc 66.797 (66.076)	Top-5 acc 88.281 (85.131)	lr 0.00320
Train [93][240/3239]	Time 0.366 (0.596)	Data Time 0.002 (0.155)	Loss 2.5171 (2.4126)	Entropy 0.56948 (0.56944)	Top-1 acc 63.281 (66.082)	Top-5 acc 81.250 (85.179)	lr 0.00319
Train [93][250/3239]	Time 0.231 (0.589)	Data Time 0.001 (0.149)	Loss 2.4131 (2.4128)	Entropy 0.56964 (0.56945)	Top-1 acc 64.844 (66.070)	Top-5 acc 86.328 (85.173)	lr 0.00319
Train [93][260/3239]	Time 0.236 (0.582)	Data Time 0.001 (0.143)	Loss 2.3829 (2.4104)	Entropy 0.56997 (0.56946)	Top-1 acc 66.016 (66.129)	Top-5 acc 84.766 (85.209)	lr 0.00319
Train [93][270/3239]	Time 0.232 (0.576)	Data Time 0.001 (0.138)	Loss 2.5437 (2.4107)	Entropy 0.56980 (0.56948)	Top-1 acc 60.938 (66.134)	Top-5 acc 82.812 (85.214)	lr 0.00319
Train [93][280/3239]	Time 0.229 (0.570)	Data Time 0.001 (0.133)	Loss 2.5806 (2.4131)	Entropy 0.56967 (0.56948)	Top-1 acc 64.062 (66.096)	Top-5 acc 82.812 (85.191)	lr 0.00319
Train [93][290/3239]	Time 0.229 (0.565)	Data Time 0.001 (0.129)	Loss 2.5048 (2.4149)	Entropy 0.56974 (0.56949)	Top-1 acc 62.891 (66.034)	Top-5 acc 82.031 (85.158)	lr 0.00319
Train [93][300/3239]	Time 0.231 (0.560)	Data Time 0.001 (0.125)	Loss 2.3724 (2.4142)	Entropy 0.56922 (0.56949)	Top-1 acc 64.844 (66.044)	Top-5 acc 86.328 (85.180)	lr 0.00319
Train [93][310/3239]	Time 0.258 (0.556)	Data Time 0.001 (0.121)	Loss 2.2255 (2.4138)	Entropy 0.56917 (0.56949)	Top-1 acc 66.406 (66.032)	Top-5 acc 89.062 (85.191)	lr 0.00319
Train [93][320/3239]	Time 0.236 (0.551)	Data Time 0.001 (0.117)	Loss 2.3876 (2.4150)	Entropy 0.56939 (0.56948)	Top-1 acc 67.188 (66.010)	Top-5 acc 84.766 (85.156)	lr 0.00319
Train [93][330/3239]	Time 0.328 (0.547)	Data Time 0.001 (0.113)	Loss 2.4848 (2.4156)	Entropy 0.56868 (0.56947)	Top-1 acc 65.234 (66.007)	Top-5 acc 85.547 (85.144)	lr 0.00319
Train [93][340/3239]	Time 0.232 (0.543)	Data Time 0.001 (0.110)	Loss 2.5186 (2.4173)	Entropy 0.56792 (0.56944)	Top-1 acc 63.281 (65.938)	Top-5 acc 83.203 (85.113)	lr 0.00319
Train [93][350/3239]	Time 0.237 (0.540)	Data Time 0.001 (0.107)	Loss 2.2593 (2.4134)	Entropy 0.56776 (0.56940)	Top-1 acc 68.750 (66.015)	Top-5 acc 87.891 (85.194)	lr 0.00319
Train [93][360/3239]	Time 0.238 (0.537)	Data Time 0.001 (0.104)	Loss 2.3961 (2.4119)	Entropy 0.56741 (0.56935)	Top-1 acc 69.531 (66.051)	Top-5 acc 84.375 (85.215)	lr 0.00319
Train [93][370/3239]	Time 0.226 (0.533)	Data Time 0.001 (0.101)	Loss 2.5791 (2.4122)	Entropy 0.56736 (0.56930)	Top-1 acc 62.109 (66.044)	Top-5 acc 81.250 (85.198)	lr 0.00319
Train [93][380/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.099)	Loss 2.2585 (2.4134)	Entropy 0.56694 (0.56924)	Top-1 acc 70.312 (66.017)	Top-5 acc 89.062 (85.167)	lr 0.00319
Train [93][390/3239]	Time 0.271 (0.528)	Data Time 0.001 (0.096)	Loss 2.2504 (2.4122)	Entropy 0.56685 (0.56918)	Top-1 acc 67.188 (66.018)	Top-5 acc 89.844 (85.194)	lr 0.00318
Train [93][400/3239]	Time 0.379 (0.525)	Data Time 0.001 (0.094)	Loss 2.3287 (2.4124)	Entropy 0.56677 (0.56913)	Top-1 acc 69.531 (66.002)	Top-5 acc 87.500 (85.193)	lr 0.00318
Train [93][410/3239]	Time 0.239 (0.522)	Data Time 0.001 (0.092)	Loss 2.2952 (2.4117)	Entropy 0.56688 (0.56907)	Top-1 acc 67.969 (66.018)	Top-5 acc 86.719 (85.208)	lr 0.00318
Train [93][420/3239]	Time 0.279 (0.520)	Data Time 0.001 (0.090)	Loss 2.5313 (2.4117)	Entropy 0.56674 (0.56902)	Top-1 acc 61.328 (66.020)	Top-5 acc 86.328 (85.226)	lr 0.00318
Train [93][430/3239]	Time 0.226 (0.518)	Data Time 0.001 (0.088)	Loss 2.3718 (2.4117)	Entropy 0.56691 (0.56897)	Top-1 acc 68.359 (66.009)	Top-5 acc 85.938 (85.222)	lr 0.00318
Train [93][440/3239]	Time 0.229 (0.515)	Data Time 0.001 (0.086)	Loss 2.3682 (2.4130)	Entropy 0.56688 (0.56892)	Top-1 acc 65.625 (65.964)	Top-5 acc 86.328 (85.198)	lr 0.00318
Train [93][450/3239]	Time 0.241 (0.513)	Data Time 0.001 (0.084)	Loss 2.3311 (2.4123)	Entropy 0.56707 (0.56888)	Top-1 acc 69.531 (65.979)	Top-5 acc 85.547 (85.216)	lr 0.00318
Train [93][460/3239]	Time 0.245 (0.511)	Data Time 0.001 (0.082)	Loss 2.5449 (2.4133)	Entropy 0.56698 (0.56884)	Top-1 acc 64.844 (65.964)	Top-5 acc 82.031 (85.216)	lr 0.00318
Train [93][470/3239]	Time 0.239 (0.509)	Data Time 0.001 (0.080)	Loss 2.4891 (2.4153)	Entropy 0.56699 (0.56880)	Top-1 acc 65.234 (65.924)	Top-5 acc 85.547 (85.201)	lr 0.00318
Train [93][480/3239]	Time 0.274 (0.508)	Data Time 0.002 (0.079)	Loss 2.3364 (2.4143)	Entropy 0.56688 (0.56876)	Top-1 acc 68.359 (65.938)	Top-5 acc 85.938 (85.226)	lr 0.00318
Train [93][490/3239]	Time 0.309 (0.506)	Data Time 0.001 (0.077)	Loss 2.2210 (2.4132)	Entropy 0.56669 (0.56873)	Top-1 acc 67.969 (65.954)	Top-5 acc 89.844 (85.241)	lr 0.00318
Train [93][500/3239]	Time 0.233 (0.504)	Data Time 0.001 (0.076)	Loss 2.2964 (2.4123)	Entropy 0.56712 (0.56869)	Top-1 acc 64.062 (65.961)	Top-5 acc 88.672 (85.260)	lr 0.00318
Train [93][510/3239]	Time 0.237 (0.503)	Data Time 0.001 (0.074)	Loss 2.3077 (2.4119)	Entropy 0.56718 (0.56866)	Top-1 acc 64.453 (65.971)	Top-5 acc 88.281 (85.265)	lr 0.00318
Train [93][520/3239]	Time 0.282 (0.502)	Data Time 0.002 (0.073)	Loss 2.3111 (2.4129)	Entropy 0.56715 (0.56863)	Top-1 acc 67.578 (65.927)	Top-5 acc 88.672 (85.256)	lr 0.00318
Train [93][530/3239]	Time 0.228 (0.501)	Data Time 0.001 (0.071)	Loss 2.3402 (2.4135)	Entropy 0.56706 (0.56860)	Top-1 acc 67.188 (65.904)	Top-5 acc 87.109 (85.263)	lr 0.00317
Train [93][540/3239]	Time 0.248 (0.500)	Data Time 0.001 (0.070)	Loss 2.3502 (2.4119)	Entropy 0.56716 (0.56857)	Top-1 acc 63.281 (65.926)	Top-5 acc 86.719 (85.275)	lr 0.00317
Train [93][550/3239]	Time 0.259 (0.499)	Data Time 0.001 (0.069)	Loss 2.3542 (2.4125)	Entropy 0.56726 (0.56855)	Top-1 acc 68.750 (65.907)	Top-5 acc 86.719 (85.282)	lr 0.00317
Train [93][560/3239]	Time 0.364 (0.498)	Data Time 0.001 (0.068)	Loss 2.2708 (2.4122)	Entropy 0.56751 (0.56853)	Top-1 acc 68.750 (65.922)	Top-5 acc 87.109 (85.284)	lr 0.00317
Train [93][570/3239]	Time 0.376 (0.584)	Data Time 0.011 (0.067)	Loss 2.2292 (2.4106)	Entropy 0.56782 (0.56851)	Top-1 acc 68.750 (65.955)	Top-5 acc 86.328 (85.304)	lr 0.00317
Train [93][580/3239]	Time 0.241 (0.584)	Data Time 0.002 (0.065)	Loss 2.3510 (2.4106)	Entropy 0.56742 (0.56850)	Top-1 acc 65.625 (65.952)	Top-5 acc 87.109 (85.306)	lr 0.00317
Train [93][590/3239]	Time 0.264 (0.582)	Data Time 0.002 (0.064)	Loss 2.3528 (2.4119)	Entropy 0.56710 (0.56848)	Top-1 acc 69.922 (65.934)	Top-5 acc 88.672 (85.289)	lr 0.00317
Train [93][600/3239]	Time 0.243 (0.579)	Data Time 0.001 (0.063)	Loss 2.3715 (2.4107)	Entropy 0.56733 (0.56846)	Top-1 acc 66.406 (65.962)	Top-5 acc 87.891 (85.300)	lr 0.00317
Train [93][610/3239]	Time 0.240 (0.577)	Data Time 0.001 (0.062)	Loss 2.3235 (2.4105)	Entropy 0.56755 (0.56844)	Top-1 acc 67.578 (65.978)	Top-5 acc 85.938 (85.300)	lr 0.00317
Train [93][620/3239]	Time 0.234 (0.575)	Data Time 0.001 (0.061)	Loss 2.3710 (2.4101)	Entropy 0.56747 (0.56843)	Top-1 acc 65.234 (65.977)	Top-5 acc 86.328 (85.306)	lr 0.00317
Train [93][630/3239]	Time 0.235 (0.572)	Data Time 0.001 (0.060)	Loss 2.4090 (2.4086)	Entropy 0.56762 (0.56841)	Top-1 acc 67.578 (66.015)	Top-5 acc 83.203 (85.325)	lr 0.00317
Train [93][640/3239]	Time 0.272 (0.570)	Data Time 0.001 (0.060)	Loss 2.5019 (2.4085)	Entropy 0.56757 (0.56840)	Top-1 acc 65.234 (66.021)	Top-5 acc 85.156 (85.331)	lr 0.00317
Train [93][650/3239]	Time 0.257 (0.567)	Data Time 0.001 (0.059)	Loss 2.6137 (2.4088)	Entropy 0.56751 (0.56839)	Top-1 acc 63.672 (66.019)	Top-5 acc 81.641 (85.318)	lr 0.00317
Train [93][660/3239]	Time 0.316 (0.565)	Data Time 0.002 (0.058)	Loss 2.3840 (2.4085)	Entropy 0.56726 (0.56837)	Top-1 acc 67.969 (66.019)	Top-5 acc 85.156 (85.314)	lr 0.00317
Train [93][670/3239]	Time 0.278 (0.563)	Data Time 0.001 (0.057)	Loss 2.3084 (2.4082)	Entropy 0.56677 (0.56835)	Top-1 acc 70.703 (66.038)	Top-5 acc 86.328 (85.321)	lr 0.00317
Train [93][680/3239]	Time 0.270 (0.562)	Data Time 0.001 (0.056)	Loss 2.2843 (2.4072)	Entropy 0.56653 (0.56833)	Top-1 acc 69.141 (66.071)	Top-5 acc 85.547 (85.333)	lr 0.00316
Train [93][690/3239]	Time 0.248 (0.560)	Data Time 0.002 (0.055)	Loss 2.2707 (2.4067)	Entropy 0.56684 (0.56830)	Top-1 acc 71.484 (66.081)	Top-5 acc 86.328 (85.343)	lr 0.00316
Train [93][700/3239]	Time 0.328 (0.558)	Data Time 0.002 (0.055)	Loss 2.5027 (2.4069)	Entropy 0.56647 (0.56828)	Top-1 acc 61.719 (66.055)	Top-5 acc 83.984 (85.344)	lr 0.00316
Train [93][710/3239]	Time 0.253 (0.558)	Data Time 0.002 (0.054)	Loss 2.2637 (2.4072)	Entropy 0.56637 (0.56825)	Top-1 acc 71.875 (66.056)	Top-5 acc 85.938 (85.338)	lr 0.00316
Train [93][720/3239]	Time 0.340 (0.556)	Data Time 0.001 (0.053)	Loss 2.2541 (2.4071)	Entropy 0.56670 (0.56823)	Top-1 acc 71.875 (66.044)	Top-5 acc 89.453 (85.337)	lr 0.00316
Train [93][730/3239]	Time 0.236 (0.554)	Data Time 0.001 (0.052)	Loss 2.3254 (2.4072)	Entropy 0.56687 (0.56821)	Top-1 acc 67.188 (66.045)	Top-5 acc 86.328 (85.330)	lr 0.00316
Train [93][740/3239]	Time 0.230 (0.552)	Data Time 0.001 (0.052)	Loss 2.4364 (2.4070)	Entropy 0.56645 (0.56819)	Top-1 acc 65.234 (66.060)	Top-5 acc 85.938 (85.336)	lr 0.00316
Train [93][750/3239]	Time 0.235 (0.550)	Data Time 0.001 (0.051)	Loss 2.4830 (2.4079)	Entropy 0.56615 (0.56817)	Top-1 acc 65.234 (66.034)	Top-5 acc 83.984 (85.320)	lr 0.00316
Train [93][760/3239]	Time 0.232 (0.549)	Data Time 0.001 (0.050)	Loss 2.4588 (2.4075)	Entropy 0.56618 (0.56814)	Top-1 acc 66.016 (66.061)	Top-5 acc 82.812 (85.317)	lr 0.00316
Train [93][770/3239]	Time 0.232 (0.547)	Data Time 0.001 (0.050)	Loss 2.3940 (2.4080)	Entropy 0.56617 (0.56811)	Top-1 acc 66.406 (66.043)	Top-5 acc 83.984 (85.315)	lr 0.00316
Train [93][780/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.049)	Loss 2.4662 (2.4086)	Entropy 0.56635 (0.56809)	Top-1 acc 63.672 (66.030)	Top-5 acc 84.375 (85.299)	lr 0.00316
Train [93][790/3239]	Time 0.335 (0.544)	Data Time 0.001 (0.049)	Loss 2.3903 (2.4079)	Entropy 0.56632 (0.56807)	Top-1 acc 66.797 (66.036)	Top-5 acc 85.938 (85.315)	lr 0.00316
Train [93][800/3239]	Time 0.233 (0.542)	Data Time 0.001 (0.048)	Loss 2.5934 (2.4080)	Entropy 0.56654 (0.56805)	Top-1 acc 62.891 (66.029)	Top-5 acc 83.203 (85.321)	lr 0.00316
Train [93][810/3239]	Time 0.233 (0.541)	Data Time 0.003 (0.047)	Loss 2.6039 (2.4081)	Entropy 0.56626 (0.56803)	Top-1 acc 61.719 (66.019)	Top-5 acc 84.375 (85.324)	lr 0.00316
Train [93][820/3239]	Time 0.234 (0.539)	Data Time 0.001 (0.047)	Loss 2.3642 (2.4080)	Entropy 0.56636 (0.56801)	Top-1 acc 68.359 (66.026)	Top-5 acc 86.719 (85.329)	lr 0.00316
Train [93][830/3239]	Time 0.259 (0.538)	Data Time 0.001 (0.046)	Loss 2.3386 (2.4086)	Entropy 0.56626 (0.56799)	Top-1 acc 70.312 (66.022)	Top-5 acc 87.500 (85.323)	lr 0.00315
Train [93][840/3239]	Time 0.257 (0.537)	Data Time 0.001 (0.046)	Loss 2.5152 (2.4092)	Entropy 0.56632 (0.56797)	Top-1 acc 60.156 (65.998)	Top-5 acc 85.156 (85.310)	lr 0.00315
Train [93][850/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.045)	Loss 2.6976 (2.4107)	Entropy 0.56619 (0.56795)	Top-1 acc 61.719 (65.963)	Top-5 acc 78.516 (85.282)	lr 0.00315
Train [93][860/3239]	Time 0.229 (0.534)	Data Time 0.001 (0.045)	Loss 2.2598 (2.4099)	Entropy 0.56615 (0.56793)	Top-1 acc 70.703 (65.974)	Top-5 acc 87.500 (85.297)	lr 0.00315
Train [93][870/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.044)	Loss 2.3443 (2.4099)	Entropy 0.56614 (0.56791)	Top-1 acc 65.625 (65.971)	Top-5 acc 87.109 (85.305)	lr 0.00315
Train [93][880/3239]	Time 0.332 (0.532)	Data Time 0.001 (0.044)	Loss 2.3418 (2.4096)	Entropy 0.56623 (0.56789)	Top-1 acc 67.188 (65.984)	Top-5 acc 86.719 (85.303)	lr 0.00315
Train [93][890/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.043)	Loss 2.4962 (2.4102)	Entropy 0.56622 (0.56787)	Top-1 acc 66.797 (65.979)	Top-5 acc 82.812 (85.294)	lr 0.00315
Train [93][900/3239]	Time 0.223 (0.529)	Data Time 0.001 (0.043)	Loss 2.4656 (2.4103)	Entropy 0.56637 (0.56785)	Top-1 acc 64.453 (65.980)	Top-5 acc 87.109 (85.296)	lr 0.00315
Train [93][910/3239]	Time 0.269 (0.528)	Data Time 0.001 (0.042)	Loss 2.4563 (2.4103)	Entropy 0.56638 (0.56783)	Top-1 acc 64.844 (65.989)	Top-5 acc 83.984 (85.298)	lr 0.00315
Train [93][920/3239]	Time 0.229 (0.527)	Data Time 0.001 (0.042)	Loss 2.3236 (2.4102)	Entropy 0.56626 (0.56782)	Top-1 acc 66.406 (65.989)	Top-5 acc 88.672 (85.310)	lr 0.00315
Train [93][930/3239]	Time 0.235 (0.526)	Data Time 0.001 (0.041)	Loss 2.3329 (2.4103)	Entropy 0.56632 (0.56780)	Top-1 acc 71.875 (65.994)	Top-5 acc 88.281 (85.311)	lr 0.00315
Train [93][940/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.041)	Loss 2.4209 (2.4095)	Entropy 0.56601 (0.56778)	Top-1 acc 68.359 (66.015)	Top-5 acc 84.766 (85.318)	lr 0.00315
Train [93][950/3239]	Time 0.373 (0.523)	Data Time 0.001 (0.041)	Loss 2.4046 (2.4098)	Entropy 0.56601 (0.56777)	Top-1 acc 67.578 (66.012)	Top-5 acc 86.719 (85.316)	lr 0.00315
Train [93][960/3239]	Time 0.231 (0.522)	Data Time 0.001 (0.040)	Loss 2.2894 (2.4098)	Entropy 0.56585 (0.56775)	Top-1 acc 69.922 (66.007)	Top-5 acc 86.719 (85.314)	lr 0.00315
Train [93][970/3239]	Time 0.237 (0.521)	Data Time 0.001 (0.040)	Loss 2.3790 (2.4094)	Entropy 0.56593 (0.56773)	Top-1 acc 67.969 (66.002)	Top-5 acc 88.672 (85.326)	lr 0.00315
Train [93][980/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.039)	Loss 2.8145 (2.4089)	Entropy 0.56623 (0.56771)	Top-1 acc 59.766 (66.018)	Top-5 acc 80.078 (85.344)	lr 0.00314
Train [93][990/3239]	Time 0.261 (0.519)	Data Time 0.002 (0.039)	Loss 2.2918 (2.4088)	Entropy 0.56576 (0.56769)	Top-1 acc 68.750 (66.015)	Top-5 acc 86.719 (85.341)	lr 0.00314
Train [93][1000/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.039)	Loss 2.2870 (2.4089)	Entropy 0.56580 (0.56767)	Top-1 acc 67.578 (66.007)	Top-5 acc 87.500 (85.341)	lr 0.00314
Train [93][1010/3239]	Time 0.269 (0.518)	Data Time 0.001 (0.038)	Loss 2.7824 (2.4096)	Entropy 0.56578 (0.56765)	Top-1 acc 58.203 (65.985)	Top-5 acc 76.953 (85.323)	lr 0.00314
Train [93][1020/3239]	Time 0.234 (0.517)	Data Time 0.002 (0.038)	Loss 2.1958 (2.4094)	Entropy 0.56566 (0.56763)	Top-1 acc 72.656 (65.987)	Top-5 acc 89.062 (85.329)	lr 0.00314
Train [93][1030/3239]	Time 0.237 (0.516)	Data Time 0.001 (0.038)	Loss 2.3752 (2.4099)	Entropy 0.56543 (0.56762)	Top-1 acc 69.531 (65.974)	Top-5 acc 87.500 (85.327)	lr 0.00314
Train [93][1040/3239]	Time 0.245 (0.515)	Data Time 0.001 (0.037)	Loss 2.5915 (2.4099)	Entropy 0.56534 (0.56759)	Top-1 acc 63.672 (65.960)	Top-5 acc 80.469 (85.328)	lr 0.00314
Train [93][1050/3239]	Time 0.226 (0.514)	Data Time 0.001 (0.037)	Loss 2.4528 (2.4101)	Entropy 0.56545 (0.56757)	Top-1 acc 68.359 (65.969)	Top-5 acc 82.812 (85.321)	lr 0.00314
Train [93][1060/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.037)	Loss 2.4104 (2.4102)	Entropy 0.56563 (0.56755)	Top-1 acc 65.625 (65.966)	Top-5 acc 83.984 (85.318)	lr 0.00314
Train [93][1070/3239]	Time 0.237 (0.512)	Data Time 0.001 (0.036)	Loss 2.2563 (2.4108)	Entropy 0.56554 (0.56753)	Top-1 acc 72.266 (65.955)	Top-5 acc 88.672 (85.312)	lr 0.00314
Train [93][1080/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.036)	Loss 2.3871 (2.4101)	Entropy 0.56538 (0.56751)	Top-1 acc 68.750 (65.980)	Top-5 acc 86.328 (85.330)	lr 0.00314
Train [93][1090/3239]	Time 0.234 (0.511)	Data Time 0.001 (0.036)	Loss 2.3548 (2.4100)	Entropy 0.56537 (0.56749)	Top-1 acc 66.016 (65.987)	Top-5 acc 85.547 (85.335)	lr 0.00314
Train [93][1100/3239]	Time 0.235 (0.510)	Data Time 0.001 (0.035)	Loss 2.2203 (2.4093)	Entropy 0.56537 (0.56748)	Top-1 acc 71.094 (66.002)	Top-5 acc 86.719 (85.341)	lr 0.00314
Train [93][1110/3239]	Time 0.337 (0.509)	Data Time 0.001 (0.035)	Loss 2.2832 (2.4097)	Entropy 0.56552 (0.56746)	Top-1 acc 70.312 (65.993)	Top-5 acc 87.891 (85.336)	lr 0.00314
Train [93][1120/3239]	Time 0.229 (0.508)	Data Time 0.001 (0.035)	Loss 2.3534 (2.4094)	Entropy 0.56540 (0.56744)	Top-1 acc 67.578 (66.001)	Top-5 acc 85.938 (85.342)	lr 0.00314
Train [93][1130/3239]	Time 0.232 (0.507)	Data Time 0.001 (0.034)	Loss 2.4671 (2.4095)	Entropy 0.56553 (0.56742)	Top-1 acc 62.500 (65.987)	Top-5 acc 84.375 (85.342)	lr 0.00313
Train [93][1140/3239]	Time 0.268 (0.507)	Data Time 0.001 (0.034)	Loss 2.3102 (2.4098)	Entropy 0.56549 (0.56740)	Top-1 acc 71.875 (65.980)	Top-5 acc 85.156 (85.336)	lr 0.00313
Train [93][1150/3239]	Time 0.227 (0.506)	Data Time 0.001 (0.034)	Loss 2.4511 (2.4096)	Entropy 0.56530 (0.56739)	Top-1 acc 62.500 (65.983)	Top-5 acc 82.422 (85.344)	lr 0.00313
Train [93][1160/3239]	Time 0.233 (0.505)	Data Time 0.001 (0.034)	Loss 2.5304 (2.4095)	Entropy 0.56550 (0.56737)	Top-1 acc 59.766 (65.983)	Top-5 acc 83.203 (85.343)	lr 0.00313
Train [93][1170/3239]	Time 0.230 (0.504)	Data Time 0.001 (0.033)	Loss 2.4354 (2.4090)	Entropy 0.56519 (0.56735)	Top-1 acc 64.453 (65.988)	Top-5 acc 83.594 (85.346)	lr 0.00313
Train [93][1180/3239]	Time 0.350 (0.504)	Data Time 0.001 (0.033)	Loss 2.4171 (2.4088)	Entropy 0.56527 (0.56733)	Top-1 acc 65.234 (65.993)	Top-5 acc 86.719 (85.353)	lr 0.00313
Train [93][1190/3239]	Time 0.250 (0.503)	Data Time 0.001 (0.033)	Loss 2.4806 (2.4082)	Entropy 0.56507 (0.56732)	Top-1 acc 64.453 (66.015)	Top-5 acc 85.938 (85.364)	lr 0.00313
Train [93][1200/3239]	Time 0.228 (0.502)	Data Time 0.001 (0.033)	Loss 2.3596 (2.4084)	Entropy 0.56483 (0.56730)	Top-1 acc 62.109 (66.006)	Top-5 acc 87.500 (85.356)	lr 0.00313
Train [93][1210/3239]	Time 0.234 (0.501)	Data Time 0.001 (0.032)	Loss 2.2119 (2.4084)	Entropy 0.56467 (0.56728)	Top-1 acc 69.922 (66.000)	Top-5 acc 91.406 (85.361)	lr 0.00313
Train [93][1220/3239]	Time 0.245 (0.500)	Data Time 0.001 (0.032)	Loss 2.4274 (2.4086)	Entropy 0.56471 (0.56726)	Top-1 acc 65.625 (65.993)	Top-5 acc 85.938 (85.357)	lr 0.00313
Train [93][1230/3239]	Time 0.326 (0.543)	Data Time 0.002 (0.032)	Loss 2.3276 (2.4094)	Entropy 0.56460 (0.56723)	Top-1 acc 65.234 (65.971)	Top-5 acc 88.672 (85.348)	lr 0.00313
Train [93][1240/3239]	Time 0.237 (0.542)	Data Time 0.002 (0.032)	Loss 2.6176 (2.4094)	Entropy 0.56437 (0.56721)	Top-1 acc 62.500 (65.969)	Top-5 acc 80.078 (85.348)	lr 0.00313
Train [93][1250/3239]	Time 0.224 (0.542)	Data Time 0.002 (0.031)	Loss 2.4054 (2.4088)	Entropy 0.56434 (0.56719)	Top-1 acc 66.016 (65.981)	Top-5 acc 85.156 (85.352)	lr 0.00313
Train [93][1260/3239]	Time 0.237 (0.541)	Data Time 0.001 (0.031)	Loss 2.5261 (2.4089)	Entropy 0.56439 (0.56717)	Top-1 acc 66.016 (65.984)	Top-5 acc 83.203 (85.352)	lr 0.00313
Train [93][1270/3239]	Time 0.328 (0.540)	Data Time 0.001 (0.031)	Loss 2.3663 (2.4088)	Entropy 0.56438 (0.56714)	Top-1 acc 69.531 (65.994)	Top-5 acc 85.156 (85.353)	lr 0.00313
Train [93][1280/3239]	Time 0.236 (0.539)	Data Time 0.001 (0.031)	Loss 2.2186 (2.4086)	Entropy 0.56422 (0.56712)	Top-1 acc 69.922 (65.993)	Top-5 acc 87.500 (85.354)	lr 0.00312
Train [93][1290/3239]	Time 0.235 (0.538)	Data Time 0.001 (0.030)	Loss 2.3535 (2.4083)	Entropy 0.56436 (0.56710)	Top-1 acc 65.234 (66.005)	Top-5 acc 85.938 (85.355)	lr 0.00312
Train [93][1300/3239]	Time 0.228 (0.537)	Data Time 0.001 (0.030)	Loss 2.3486 (2.4082)	Entropy 0.56421 (0.56708)	Top-1 acc 66.406 (66.002)	Top-5 acc 87.109 (85.356)	lr 0.00312
Train [93][1310/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.030)	Loss 2.2760 (2.4079)	Entropy 0.56421 (0.56706)	Top-1 acc 66.797 (66.010)	Top-5 acc 88.672 (85.356)	lr 0.00312
Train [93][1320/3239]	Time 0.239 (0.536)	Data Time 0.001 (0.030)	Loss 2.4133 (2.4076)	Entropy 0.56386 (0.56703)	Top-1 acc 66.016 (66.017)	Top-5 acc 84.766 (85.362)	lr 0.00312
Train [93][1330/3239]	Time 0.224 (0.535)	Data Time 0.001 (0.030)	Loss 2.4222 (2.4074)	Entropy 0.56373 (0.56701)	Top-1 acc 65.234 (66.018)	Top-5 acc 83.984 (85.368)	lr 0.00312
Train [93][1340/3239]	Time 0.362 (0.535)	Data Time 0.001 (0.029)	Loss 2.4877 (2.4072)	Entropy 0.56373 (0.56699)	Top-1 acc 62.109 (66.027)	Top-5 acc 83.594 (85.365)	lr 0.00312
Train [93][1350/3239]	Time 0.256 (0.534)	Data Time 0.001 (0.029)	Loss 2.2658 (2.4075)	Entropy 0.56364 (0.56696)	Top-1 acc 68.359 (66.020)	Top-5 acc 87.891 (85.362)	lr 0.00312
Train [93][1360/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.029)	Loss 2.5567 (2.4076)	Entropy 0.56355 (0.56694)	Top-1 acc 59.375 (66.016)	Top-5 acc 85.156 (85.363)	lr 0.00312
Train [93][1370/3239]	Time 0.250 (0.532)	Data Time 0.001 (0.029)	Loss 2.3574 (2.4077)	Entropy 0.56333 (0.56691)	Top-1 acc 67.969 (66.010)	Top-5 acc 87.891 (85.358)	lr 0.00312
Train [93][1380/3239]	Time 0.239 (0.532)	Data Time 0.001 (0.029)	Loss 2.4261 (2.4080)	Entropy 0.56313 (0.56689)	Top-1 acc 66.406 (66.009)	Top-5 acc 85.156 (85.351)	lr 0.00312
Train [93][1390/3239]	Time 0.276 (0.531)	Data Time 0.002 (0.028)	Loss 2.1887 (2.4082)	Entropy 0.56316 (0.56686)	Top-1 acc 69.141 (66.002)	Top-5 acc 91.016 (85.349)	lr 0.00312
Train [93][1400/3239]	Time 0.242 (0.530)	Data Time 0.002 (0.028)	Loss 2.3712 (2.4081)	Entropy 0.56332 (0.56683)	Top-1 acc 65.234 (66.007)	Top-5 acc 86.719 (85.353)	lr 0.00312
Train [93][1410/3239]	Time 0.243 (0.529)	Data Time 0.002 (0.028)	Loss 2.3261 (2.4080)	Entropy 0.56339 (0.56681)	Top-1 acc 65.234 (66.006)	Top-5 acc 87.500 (85.354)	lr 0.00312
Train [93][1420/3239]	Time 0.243 (0.529)	Data Time 0.001 (0.028)	Loss 2.7285 (2.4080)	Entropy 0.56351 (0.56678)	Top-1 acc 56.641 (66.004)	Top-5 acc 79.297 (85.352)	lr 0.00312
Train [93][1430/3239]	Time 0.368 (0.528)	Data Time 0.001 (0.028)	Loss 2.4314 (2.4082)	Entropy 0.56337 (0.56676)	Top-1 acc 66.016 (66.001)	Top-5 acc 86.328 (85.350)	lr 0.00311
Train [93][1440/3239]	Time 0.225 (0.527)	Data Time 0.001 (0.027)	Loss 2.2464 (2.4083)	Entropy 0.56312 (0.56674)	Top-1 acc 68.750 (66.000)	Top-5 acc 87.500 (85.350)	lr 0.00311
Train [93][1450/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.027)	Loss 2.2706 (2.4082)	Entropy 0.56304 (0.56671)	Top-1 acc 69.922 (66.005)	Top-5 acc 86.328 (85.357)	lr 0.00311
Train [93][1460/3239]	Time 0.230 (0.526)	Data Time 0.001 (0.027)	Loss 2.3386 (2.4083)	Entropy 0.56249 (0.56669)	Top-1 acc 68.750 (66.005)	Top-5 acc 85.547 (85.356)	lr 0.00311
Train [93][1470/3239]	Time 0.222 (0.525)	Data Time 0.001 (0.027)	Loss 2.4799 (2.4084)	Entropy 0.56206 (0.56666)	Top-1 acc 64.844 (66.011)	Top-5 acc 81.641 (85.355)	lr 0.00311
Train [93][1480/3239]	Time 0.225 (0.524)	Data Time 0.001 (0.027)	Loss 2.7085 (2.4087)	Entropy 0.56186 (0.56663)	Top-1 acc 57.812 (66.005)	Top-5 acc 81.250 (85.351)	lr 0.00311
Train [93][1490/3239]	Time 0.246 (0.524)	Data Time 0.002 (0.027)	Loss 2.1512 (2.4086)	Entropy 0.56211 (0.56659)	Top-1 acc 72.656 (66.007)	Top-5 acc 89.453 (85.351)	lr 0.00311
Train [93][1500/3239]	Time 0.326 (0.523)	Data Time 0.001 (0.026)	Loss 2.6029 (2.4087)	Entropy 0.56237 (0.56656)	Top-1 acc 60.547 (66.007)	Top-5 acc 83.203 (85.351)	lr 0.00311
Train [93][1510/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.026)	Loss 2.2970 (2.4084)	Entropy 0.56252 (0.56654)	Top-1 acc 69.531 (66.017)	Top-5 acc 88.672 (85.360)	lr 0.00311
Train [93][1520/3239]	Time 0.249 (0.522)	Data Time 0.001 (0.026)	Loss 2.2980 (2.4082)	Entropy 0.56257 (0.56651)	Top-1 acc 69.531 (66.020)	Top-5 acc 90.234 (85.365)	lr 0.00311
Train [93][1530/3239]	Time 0.237 (0.521)	Data Time 0.001 (0.026)	Loss 2.3491 (2.4083)	Entropy 0.56245 (0.56649)	Top-1 acc 67.188 (66.013)	Top-5 acc 88.672 (85.367)	lr 0.00311
Train [93][1540/3239]	Time 0.225 (0.520)	Data Time 0.001 (0.026)	Loss 2.5382 (2.4078)	Entropy 0.56196 (0.56646)	Top-1 acc 66.406 (66.025)	Top-5 acc 84.375 (85.377)	lr 0.00311
Train [93][1550/3239]	Time 0.222 (0.519)	Data Time 0.001 (0.026)	Loss 2.4570 (2.4081)	Entropy 0.56183 (0.56643)	Top-1 acc 64.453 (66.014)	Top-5 acc 84.766 (85.372)	lr 0.00311
Train [93][1560/3239]	Time 0.228 (0.519)	Data Time 0.001 (0.025)	Loss 2.4703 (2.4083)	Entropy 0.56190 (0.56640)	Top-1 acc 65.625 (66.005)	Top-5 acc 85.547 (85.368)	lr 0.00311
Train [93][1570/3239]	Time 0.267 (0.518)	Data Time 0.001 (0.025)	Loss 2.3736 (2.4084)	Entropy 0.56172 (0.56637)	Top-1 acc 64.062 (66.001)	Top-5 acc 85.156 (85.368)	lr 0.00311
Train [93][1580/3239]	Time 0.269 (0.517)	Data Time 0.001 (0.025)	Loss 2.2696 (2.4084)	Entropy 0.56165 (0.56634)	Top-1 acc 69.531 (66.001)	Top-5 acc 86.719 (85.364)	lr 0.00310
Train [93][1590/3239]	Time 0.336 (0.517)	Data Time 0.001 (0.025)	Loss 2.4329 (2.4085)	Entropy 0.56201 (0.56631)	Top-1 acc 65.625 (66.003)	Top-5 acc 85.156 (85.360)	lr 0.00310
Train [93][1600/3239]	Time 0.238 (0.516)	Data Time 0.001 (0.025)	Loss 2.3980 (2.4084)	Entropy 0.56180 (0.56628)	Top-1 acc 66.016 (66.008)	Top-5 acc 86.719 (85.364)	lr 0.00310
Train [93][1610/3239]	Time 0.235 (0.516)	Data Time 0.002 (0.025)	Loss 2.6688 (2.4084)	Entropy 0.56175 (0.56625)	Top-1 acc 60.547 (66.008)	Top-5 acc 79.688 (85.363)	lr 0.00310
Train [93][1620/3239]	Time 0.224 (0.515)	Data Time 0.001 (0.025)	Loss 2.6072 (2.4084)	Entropy 0.56160 (0.56623)	Top-1 acc 57.812 (66.001)	Top-5 acc 81.641 (85.360)	lr 0.00310
Train [93][1630/3239]	Time 0.285 (0.515)	Data Time 0.002 (0.024)	Loss 2.2714 (2.4083)	Entropy 0.56181 (0.56620)	Top-1 acc 68.359 (65.998)	Top-5 acc 88.281 (85.362)	lr 0.00310
Train [93][1640/3239]	Time 0.238 (0.514)	Data Time 0.001 (0.024)	Loss 2.1611 (2.4080)	Entropy 0.56144 (0.56617)	Top-1 acc 70.703 (66.002)	Top-5 acc 89.453 (85.369)	lr 0.00310
Train [93][1650/3239]	Time 0.235 (0.514)	Data Time 0.001 (0.024)	Loss 2.3612 (2.4081)	Entropy 0.56132 (0.56614)	Top-1 acc 66.797 (65.997)	Top-5 acc 87.500 (85.374)	lr 0.00310
Train [93][1660/3239]	Time 0.335 (0.513)	Data Time 0.001 (0.024)	Loss 2.4278 (2.4081)	Entropy 0.56151 (0.56611)	Top-1 acc 64.062 (65.997)	Top-5 acc 85.156 (85.374)	lr 0.00310
Train [93][1670/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.024)	Loss 2.1365 (2.4077)	Entropy 0.56162 (0.56609)	Top-1 acc 75.000 (66.011)	Top-5 acc 89.453 (85.378)	lr 0.00310
Train [93][1680/3239]	Time 0.237 (0.512)	Data Time 0.001 (0.024)	Loss 2.3302 (2.4077)	Entropy 0.56171 (0.56606)	Top-1 acc 67.578 (66.009)	Top-5 acc 84.375 (85.376)	lr 0.00310
Train [93][1690/3239]	Time 0.226 (0.511)	Data Time 0.001 (0.024)	Loss 2.4215 (2.4080)	Entropy 0.56171 (0.56603)	Top-1 acc 65.625 (65.999)	Top-5 acc 84.766 (85.366)	lr 0.00310
Train [93][1700/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.023)	Loss 2.4444 (2.4081)	Entropy 0.56169 (0.56601)	Top-1 acc 64.062 (65.996)	Top-5 acc 86.328 (85.368)	lr 0.00310
Train [93][1710/3239]	Time 0.231 (0.510)	Data Time 0.001 (0.023)	Loss 2.3075 (2.4082)	Entropy 0.56159 (0.56598)	Top-1 acc 67.188 (65.996)	Top-5 acc 88.672 (85.368)	lr 0.00310
Train [93][1720/3239]	Time 0.235 (0.510)	Data Time 0.001 (0.023)	Loss 2.3295 (2.4081)	Entropy 0.56170 (0.56596)	Top-1 acc 67.188 (65.990)	Top-5 acc 90.234 (85.372)	lr 0.00310
Train [93][1730/3239]	Time 0.238 (0.509)	Data Time 0.002 (0.023)	Loss 2.6672 (2.4083)	Entropy 0.56159 (0.56593)	Top-1 acc 62.109 (65.984)	Top-5 acc 82.812 (85.365)	lr 0.00309
Train [93][1740/3239]	Time 0.234 (0.509)	Data Time 0.001 (0.023)	Loss 2.4244 (2.4083)	Entropy 0.56142 (0.56591)	Top-1 acc 65.625 (65.990)	Top-5 acc 85.156 (85.365)	lr 0.00309
Train [93][1750/3239]	Time 0.235 (0.508)	Data Time 0.002 (0.023)	Loss 2.6528 (2.4084)	Entropy 0.56129 (0.56588)	Top-1 acc 58.984 (65.994)	Top-5 acc 79.688 (85.363)	lr 0.00309
Train [93][1760/3239]	Time 0.228 (0.508)	Data Time 0.001 (0.023)	Loss 2.3795 (2.4085)	Entropy 0.56142 (0.56586)	Top-1 acc 66.016 (65.990)	Top-5 acc 86.328 (85.361)	lr 0.00309
Train [93][1770/3239]	Time 0.241 (0.507)	Data Time 0.002 (0.023)	Loss 2.3340 (2.4080)	Entropy 0.56140 (0.56583)	Top-1 acc 69.922 (66.003)	Top-5 acc 85.547 (85.368)	lr 0.00309
Train [93][1780/3239]	Time 0.260 (0.507)	Data Time 0.002 (0.023)	Loss 2.2839 (2.4083)	Entropy 0.56163 (0.56581)	Top-1 acc 73.828 (66.002)	Top-5 acc 88.672 (85.366)	lr 0.00309
Train [93][1790/3239]	Time 0.231 (0.506)	Data Time 0.001 (0.022)	Loss 2.3622 (2.4079)	Entropy 0.56189 (0.56578)	Top-1 acc 67.578 (66.014)	Top-5 acc 86.328 (85.377)	lr 0.00309
Train [93][1800/3239]	Time 0.236 (0.506)	Data Time 0.001 (0.022)	Loss 2.3262 (2.4079)	Entropy 0.56211 (0.56576)	Top-1 acc 69.922 (66.010)	Top-5 acc 84.766 (85.376)	lr 0.00309
Train [93][1810/3239]	Time 0.235 (0.505)	Data Time 0.001 (0.022)	Loss 2.3653 (2.4080)	Entropy 0.56233 (0.56574)	Top-1 acc 66.016 (66.009)	Top-5 acc 84.375 (85.372)	lr 0.00309
Train [93][1820/3239]	Time 0.332 (0.505)	Data Time 0.001 (0.022)	Loss 2.3358 (2.4081)	Entropy 0.56257 (0.56572)	Top-1 acc 69.922 (66.001)	Top-5 acc 83.984 (85.372)	lr 0.00309
Train [93][1830/3239]	Time 0.234 (0.504)	Data Time 0.001 (0.022)	Loss 2.4008 (2.4083)	Entropy 0.56270 (0.56571)	Top-1 acc 62.891 (65.994)	Top-5 acc 83.984 (85.370)	lr 0.00309
Train [93][1840/3239]	Time 0.236 (0.504)	Data Time 0.001 (0.022)	Loss 2.3274 (2.4083)	Entropy 0.56272 (0.56569)	Top-1 acc 69.531 (65.993)	Top-5 acc 89.453 (85.371)	lr 0.00309
Train [93][1850/3239]	Time 0.228 (0.503)	Data Time 0.001 (0.022)	Loss 2.6208 (2.4085)	Entropy 0.56265 (0.56568)	Top-1 acc 59.375 (65.987)	Top-5 acc 80.859 (85.365)	lr 0.00309
Train [93][1860/3239]	Time 0.230 (0.503)	Data Time 0.001 (0.022)	Loss 2.4335 (2.4085)	Entropy 0.56245 (0.56566)	Top-1 acc 65.625 (65.988)	Top-5 acc 84.766 (85.363)	lr 0.00309
Train [93][1870/3239]	Time 0.260 (0.502)	Data Time 0.002 (0.022)	Loss 2.4601 (2.4085)	Entropy 0.56236 (0.56564)	Top-1 acc 61.328 (65.987)	Top-5 acc 86.328 (85.364)	lr 0.00309
Train [93][1880/3239]	Time 0.391 (0.530)	Data Time 0.029 (0.021)	Loss 2.3591 (2.4085)	Entropy 0.56249 (0.56562)	Top-1 acc 67.188 (65.990)	Top-5 acc 85.156 (85.361)	lr 0.00308
Train [93][1890/3239]	Time 0.234 (0.529)	Data Time 0.002 (0.021)	Loss 2.2934 (2.4090)	Entropy 0.56230 (0.56561)	Top-1 acc 71.094 (65.984)	Top-5 acc 88.281 (85.355)	lr 0.00308
Train [93][1900/3239]	Time 0.242 (0.529)	Data Time 0.002 (0.021)	Loss 2.3710 (2.4087)	Entropy 0.56266 (0.56559)	Top-1 acc 64.453 (65.988)	Top-5 acc 86.328 (85.359)	lr 0.00308
Train [93][1910/3239]	Time 0.237 (0.528)	Data Time 0.001 (0.021)	Loss 2.5054 (2.4089)	Entropy 0.56250 (0.56557)	Top-1 acc 63.281 (65.983)	Top-5 acc 83.984 (85.352)	lr 0.00308
Train [93][1920/3239]	Time 0.314 (0.528)	Data Time 0.003 (0.021)	Loss 2.3433 (2.4087)	Entropy 0.56263 (0.56556)	Top-1 acc 67.578 (65.987)	Top-5 acc 85.938 (85.353)	lr 0.00308
Train [93][1930/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.021)	Loss 2.4944 (2.4088)	Entropy 0.56252 (0.56554)	Top-1 acc 61.328 (65.980)	Top-5 acc 82.812 (85.349)	lr 0.00308
Train [93][1940/3239]	Time 0.231 (0.528)	Data Time 0.001 (0.021)	Loss 2.2987 (2.4087)	Entropy 0.56247 (0.56553)	Top-1 acc 63.672 (65.979)	Top-5 acc 86.719 (85.349)	lr 0.00308
Train [93][1950/3239]	Time 0.254 (0.527)	Data Time 0.002 (0.021)	Loss 2.3448 (2.4085)	Entropy 0.56232 (0.56551)	Top-1 acc 66.016 (65.985)	Top-5 acc 87.891 (85.353)	lr 0.00308
Train [93][1960/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.021)	Loss 2.3176 (2.4088)	Entropy 0.56198 (0.56550)	Top-1 acc 67.969 (65.977)	Top-5 acc 86.328 (85.346)	lr 0.00308
Train [93][1970/3239]	Time 0.223 (0.526)	Data Time 0.001 (0.021)	Loss 2.7057 (2.4092)	Entropy 0.56179 (0.56548)	Top-1 acc 57.031 (65.964)	Top-5 acc 80.859 (85.342)	lr 0.00308
Train [93][1980/3239]	Time 0.373 (0.526)	Data Time 0.001 (0.020)	Loss 2.3752 (2.4091)	Entropy 0.56203 (0.56546)	Top-1 acc 64.844 (65.969)	Top-5 acc 84.766 (85.345)	lr 0.00308
Train [93][1990/3239]	Time 0.227 (0.525)	Data Time 0.001 (0.020)	Loss 2.5201 (2.4091)	Entropy 0.56208 (0.56544)	Top-1 acc 62.500 (65.968)	Top-5 acc 82.812 (85.340)	lr 0.00308
Train [93][2000/3239]	Time 0.220 (0.525)	Data Time 0.001 (0.020)	Loss 2.3638 (2.4090)	Entropy 0.56229 (0.56543)	Top-1 acc 67.578 (65.969)	Top-5 acc 82.422 (85.343)	lr 0.00308
Train [93][2010/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.020)	Loss 2.4244 (2.4091)	Entropy 0.56230 (0.56541)	Top-1 acc 66.797 (65.971)	Top-5 acc 87.500 (85.344)	lr 0.00308
Train [93][2020/3239]	Time 0.236 (0.524)	Data Time 0.002 (0.020)	Loss 2.3923 (2.4089)	Entropy 0.56247 (0.56540)	Top-1 acc 65.625 (65.979)	Top-5 acc 86.328 (85.348)	lr 0.00308
Train [93][2030/3239]	Time 0.244 (0.523)	Data Time 0.001 (0.020)	Loss 2.8382 (2.4087)	Entropy 0.56269 (0.56538)	Top-1 acc 56.641 (65.984)	Top-5 acc 80.469 (85.354)	lr 0.00307
Train [93][2040/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.020)	Loss 2.2681 (2.4091)	Entropy 0.56267 (0.56537)	Top-1 acc 69.922 (65.971)	Top-5 acc 87.500 (85.345)	lr 0.00307
Train [93][2050/3239]	Time 0.340 (0.522)	Data Time 0.001 (0.020)	Loss 2.2298 (2.4092)	Entropy 0.56282 (0.56536)	Top-1 acc 70.312 (65.970)	Top-5 acc 90.234 (85.342)	lr 0.00307
Train [93][2060/3239]	Time 0.232 (0.522)	Data Time 0.002 (0.020)	Loss 2.4278 (2.4092)	Entropy 0.56284 (0.56534)	Top-1 acc 67.188 (65.971)	Top-5 acc 82.031 (85.339)	lr 0.00307
Train [93][2070/3239]	Time 0.240 (0.522)	Data Time 0.001 (0.020)	Loss 2.4049 (2.4091)	Entropy 0.56309 (0.56533)	Top-1 acc 66.406 (65.974)	Top-5 acc 87.500 (85.339)	lr 0.00307
Train [93][2080/3239]	Time 0.239 (0.521)	Data Time 0.002 (0.020)	Loss 2.3702 (2.4092)	Entropy 0.56298 (0.56532)	Top-1 acc 69.531 (65.972)	Top-5 acc 84.375 (85.333)	lr 0.00307
Train [93][2090/3239]	Time 0.243 (0.521)	Data Time 0.001 (0.019)	Loss 2.6916 (2.4094)	Entropy 0.56264 (0.56531)	Top-1 acc 60.938 (65.972)	Top-5 acc 80.469 (85.328)	lr 0.00307
Train [93][2100/3239]	Time 0.278 (0.520)	Data Time 0.001 (0.019)	Loss 2.5939 (2.4098)	Entropy 0.56239 (0.56529)	Top-1 acc 61.719 (65.961)	Top-5 acc 82.422 (85.322)	lr 0.00307
Train [93][2110/3239]	Time 0.236 (0.520)	Data Time 0.001 (0.019)	Loss 2.3132 (2.4098)	Entropy 0.56262 (0.56528)	Top-1 acc 71.094 (65.960)	Top-5 acc 87.500 (85.323)	lr 0.00307
Train [93][2120/3239]	Time 0.318 (0.520)	Data Time 0.003 (0.019)	Loss 2.3164 (2.4101)	Entropy 0.56228 (0.56527)	Top-1 acc 66.406 (65.955)	Top-5 acc 88.281 (85.319)	lr 0.00307
Train [93][2130/3239]	Time 0.243 (0.520)	Data Time 0.001 (0.019)	Loss 2.3492 (2.4100)	Entropy 0.56256 (0.56525)	Top-1 acc 66.016 (65.956)	Top-5 acc 85.547 (85.316)	lr 0.00307
Train [93][2140/3239]	Time 0.314 (0.519)	Data Time 0.001 (0.019)	Loss 2.6431 (2.4102)	Entropy 0.56275 (0.56524)	Top-1 acc 62.500 (65.950)	Top-5 acc 82.422 (85.315)	lr 0.00307
Train [93][2150/3239]	Time 0.237 (0.519)	Data Time 0.001 (0.019)	Loss 2.3149 (2.4100)	Entropy 0.56303 (0.56523)	Top-1 acc 67.188 (65.951)	Top-5 acc 87.500 (85.318)	lr 0.00307
Train [93][2160/3239]	Time 0.232 (0.519)	Data Time 0.001 (0.019)	Loss 2.3578 (2.4099)	Entropy 0.56318 (0.56522)	Top-1 acc 65.625 (65.957)	Top-5 acc 85.547 (85.322)	lr 0.00307
Train [93][2170/3239]	Time 0.240 (0.518)	Data Time 0.001 (0.019)	Loss 2.5298 (2.4097)	Entropy 0.56267 (0.56521)	Top-1 acc 60.547 (65.960)	Top-5 acc 83.984 (85.325)	lr 0.00307
Train [93][2180/3239]	Time 0.226 (0.518)	Data Time 0.001 (0.019)	Loss 2.3761 (2.4096)	Entropy 0.56277 (0.56520)	Top-1 acc 71.875 (65.960)	Top-5 acc 87.500 (85.327)	lr 0.00306
Train [93][2190/3239]	Time 0.232 (0.517)	Data Time 0.001 (0.019)	Loss 2.4326 (2.4095)	Entropy 0.56302 (0.56519)	Top-1 acc 66.797 (65.958)	Top-5 acc 85.547 (85.331)	lr 0.00306
Train [93][2200/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.019)	Loss 2.5907 (2.4098)	Entropy 0.56316 (0.56518)	Top-1 acc 59.375 (65.953)	Top-5 acc 83.594 (85.325)	lr 0.00306
Train [93][2210/3239]	Time 0.369 (0.517)	Data Time 0.002 (0.019)	Loss 2.5680 (2.4099)	Entropy 0.56334 (0.56517)	Top-1 acc 61.328 (65.948)	Top-5 acc 80.078 (85.321)	lr 0.00306
Train [93][2220/3239]	Time 0.254 (0.516)	Data Time 0.001 (0.018)	Loss 2.2406 (2.4095)	Entropy 0.56332 (0.56516)	Top-1 acc 69.922 (65.957)	Top-5 acc 88.672 (85.328)	lr 0.00306
Train [93][2230/3239]	Time 0.230 (0.516)	Data Time 0.001 (0.018)	Loss 2.3909 (2.4095)	Entropy 0.56328 (0.56515)	Top-1 acc 66.016 (65.958)	Top-5 acc 85.938 (85.329)	lr 0.00306
Train [93][2240/3239]	Time 0.240 (0.515)	Data Time 0.001 (0.018)	Loss 2.4077 (2.4095)	Entropy 0.56336 (0.56515)	Top-1 acc 65.234 (65.960)	Top-5 acc 85.156 (85.326)	lr 0.00306
Train [93][2250/3239]	Time 0.240 (0.515)	Data Time 0.001 (0.018)	Loss 2.3049 (2.4094)	Entropy 0.56344 (0.56514)	Top-1 acc 69.141 (65.958)	Top-5 acc 87.891 (85.332)	lr 0.00306
Train [93][2260/3239]	Time 0.250 (0.515)	Data Time 0.001 (0.018)	Loss 2.5729 (2.4092)	Entropy 0.56341 (0.56513)	Top-1 acc 64.062 (65.967)	Top-5 acc 82.031 (85.336)	lr 0.00306
Train [93][2270/3239]	Time 0.237 (0.514)	Data Time 0.001 (0.018)	Loss 2.5103 (2.4093)	Entropy 0.56353 (0.56512)	Top-1 acc 62.500 (65.964)	Top-5 acc 83.203 (85.335)	lr 0.00306
Train [93][2280/3239]	Time 0.341 (0.514)	Data Time 0.001 (0.018)	Loss 2.4433 (2.4091)	Entropy 0.56337 (0.56512)	Top-1 acc 59.766 (65.967)	Top-5 acc 85.938 (85.337)	lr 0.00306
Train [93][2290/3239]	Time 0.266 (0.513)	Data Time 0.001 (0.018)	Loss 2.4855 (2.4092)	Entropy 0.56356 (0.56511)	Top-1 acc 67.578 (65.973)	Top-5 acc 82.031 (85.332)	lr 0.00306
Train [93][2300/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.018)	Loss 2.2645 (2.4094)	Entropy 0.56330 (0.56510)	Top-1 acc 68.750 (65.967)	Top-5 acc 86.719 (85.326)	lr 0.00306
Train [93][2310/3239]	Time 0.236 (0.513)	Data Time 0.001 (0.018)	Loss 2.4195 (2.4091)	Entropy 0.56325 (0.56509)	Top-1 acc 63.281 (65.973)	Top-5 acc 86.328 (85.328)	lr 0.00306
Train [93][2320/3239]	Time 0.232 (0.512)	Data Time 0.002 (0.018)	Loss 2.3251 (2.4092)	Entropy 0.56324 (0.56509)	Top-1 acc 70.703 (65.974)	Top-5 acc 84.766 (85.322)	lr 0.00306
Train [93][2330/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.018)	Loss 2.3438 (2.4090)	Entropy 0.56325 (0.56508)	Top-1 acc 69.922 (65.976)	Top-5 acc 85.938 (85.328)	lr 0.00305
Train [93][2340/3239]	Time 0.245 (0.511)	Data Time 0.001 (0.018)	Loss 2.1738 (2.4090)	Entropy 0.56356 (0.56507)	Top-1 acc 74.609 (65.977)	Top-5 acc 88.672 (85.329)	lr 0.00305
Train [93][2350/3239]	Time 0.283 (0.511)	Data Time 0.001 (0.018)	Loss 2.4144 (2.4090)	Entropy 0.56376 (0.56506)	Top-1 acc 66.797 (65.980)	Top-5 acc 83.984 (85.326)	lr 0.00305
Train [93][2360/3239]	Time 0.228 (0.511)	Data Time 0.001 (0.017)	Loss 2.4015 (2.4086)	Entropy 0.56401 (0.56506)	Top-1 acc 65.625 (65.990)	Top-5 acc 83.984 (85.332)	lr 0.00305
Train [93][2370/3239]	Time 0.340 (0.510)	Data Time 0.001 (0.017)	Loss 2.4845 (2.4087)	Entropy 0.56399 (0.56505)	Top-1 acc 64.062 (65.991)	Top-5 acc 84.375 (85.332)	lr 0.00305
Train [93][2380/3239]	Time 0.233 (0.510)	Data Time 0.001 (0.017)	Loss 2.4902 (2.4087)	Entropy 0.56379 (0.56505)	Top-1 acc 62.500 (65.990)	Top-5 acc 82.422 (85.331)	lr 0.00305
Train [93][2390/3239]	Time 0.270 (0.510)	Data Time 0.001 (0.017)	Loss 2.2921 (2.4085)	Entropy 0.56392 (0.56504)	Top-1 acc 69.922 (65.991)	Top-5 acc 85.156 (85.333)	lr 0.00305
Train [93][2400/3239]	Time 0.234 (0.509)	Data Time 0.001 (0.017)	Loss 2.3829 (2.4084)	Entropy 0.56417 (0.56504)	Top-1 acc 68.359 (65.995)	Top-5 acc 87.500 (85.337)	lr 0.00305
Train [93][2410/3239]	Time 0.238 (0.509)	Data Time 0.001 (0.017)	Loss 2.3508 (2.4085)	Entropy 0.56423 (0.56504)	Top-1 acc 67.188 (65.994)	Top-5 acc 85.938 (85.336)	lr 0.00305
Train [93][2420/3239]	Time 0.240 (0.509)	Data Time 0.002 (0.017)	Loss 2.3937 (2.4084)	Entropy 0.56444 (0.56503)	Top-1 acc 64.844 (65.998)	Top-5 acc 85.156 (85.338)	lr 0.00305
Train [93][2430/3239]	Time 0.276 (0.509)	Data Time 0.002 (0.017)	Loss 2.5587 (2.4085)	Entropy 0.56441 (0.56503)	Top-1 acc 64.844 (65.998)	Top-5 acc 81.641 (85.335)	lr 0.00305
Train [93][2440/3239]	Time 0.347 (0.509)	Data Time 0.001 (0.017)	Loss 2.3999 (2.4086)	Entropy 0.56435 (0.56503)	Top-1 acc 67.578 (65.995)	Top-5 acc 82.812 (85.333)	lr 0.00305
Train [93][2450/3239]	Time 0.225 (0.508)	Data Time 0.001 (0.017)	Loss 2.3522 (2.4085)	Entropy 0.56415 (0.56503)	Top-1 acc 67.188 (66.000)	Top-5 acc 86.719 (85.335)	lr 0.00305
Train [93][2460/3239]	Time 0.239 (0.508)	Data Time 0.001 (0.017)	Loss 2.4353 (2.4082)	Entropy 0.56396 (0.56502)	Top-1 acc 63.672 (66.006)	Top-5 acc 84.766 (85.341)	lr 0.00305
Train [93][2470/3239]	Time 0.220 (0.507)	Data Time 0.001 (0.017)	Loss 2.4564 (2.4083)	Entropy 0.56410 (0.56502)	Top-1 acc 67.578 (66.004)	Top-5 acc 82.812 (85.340)	lr 0.00305
Train [93][2480/3239]	Time 0.235 (0.507)	Data Time 0.001 (0.017)	Loss 2.3314 (2.4081)	Entropy 0.56420 (0.56502)	Top-1 acc 65.234 (66.008)	Top-5 acc 86.719 (85.341)	lr 0.00304
Train [93][2490/3239]	Time 0.221 (0.507)	Data Time 0.001 (0.017)	Loss 2.3506 (2.4080)	Entropy 0.56451 (0.56501)	Top-1 acc 66.406 (66.011)	Top-5 acc 85.938 (85.339)	lr 0.00304
Train [93][2500/3239]	Time 0.228 (0.506)	Data Time 0.001 (0.017)	Loss 2.6300 (2.4082)	Entropy 0.56438 (0.56501)	Top-1 acc 61.328 (66.005)	Top-5 acc 79.297 (85.336)	lr 0.00304
Train [93][2510/3239]	Time 0.237 (0.506)	Data Time 0.001 (0.017)	Loss 2.6477 (2.4084)	Entropy 0.56411 (0.56501)	Top-1 acc 59.766 (65.999)	Top-5 acc 82.422 (85.332)	lr 0.00304
Train [93][2520/3239]	Time 0.227 (0.506)	Data Time 0.001 (0.016)	Loss 2.5600 (2.4087)	Entropy 0.56424 (0.56500)	Top-1 acc 61.328 (65.993)	Top-5 acc 80.859 (85.326)	lr 0.00304
Train [93][2530/3239]	Time 0.338 (0.505)	Data Time 0.001 (0.016)	Loss 2.3910 (2.4088)	Entropy 0.56421 (0.56500)	Top-1 acc 64.062 (65.992)	Top-5 acc 85.156 (85.324)	lr 0.00304
Train [93][2540/3239]	Time 0.391 (0.527)	Data Time 0.002 (0.016)	Loss 2.2600 (2.4088)	Entropy 0.56420 (0.56500)	Top-1 acc 67.969 (65.992)	Top-5 acc 89.844 (85.325)	lr 0.00304
Train [93][2550/3239]	Time 0.239 (0.527)	Data Time 0.002 (0.016)	Loss 2.1576 (2.4088)	Entropy 0.56444 (0.56500)	Top-1 acc 70.703 (65.991)	Top-5 acc 90.625 (85.325)	lr 0.00304
Train [93][2560/3239]	Time 0.238 (0.526)	Data Time 0.001 (0.016)	Loss 2.6012 (2.4091)	Entropy 0.56459 (0.56499)	Top-1 acc 62.500 (65.984)	Top-5 acc 81.641 (85.319)	lr 0.00304
Train [93][2570/3239]	Time 0.237 (0.526)	Data Time 0.001 (0.016)	Loss 2.5180 (2.4089)	Entropy 0.56420 (0.56499)	Top-1 acc 63.672 (65.990)	Top-5 acc 83.203 (85.323)	lr 0.00304
Train [93][2580/3239]	Time 0.239 (0.526)	Data Time 0.001 (0.016)	Loss 2.4888 (2.4089)	Entropy 0.56386 (0.56499)	Top-1 acc 63.672 (65.989)	Top-5 acc 84.766 (85.322)	lr 0.00304
Train [93][2590/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.016)	Loss 2.5850 (2.4090)	Entropy 0.56384 (0.56498)	Top-1 acc 61.328 (65.987)	Top-5 acc 81.641 (85.321)	lr 0.00304
Train [93][2600/3239]	Time 0.335 (0.525)	Data Time 0.001 (0.016)	Loss 2.3101 (2.4091)	Entropy 0.56384 (0.56498)	Top-1 acc 69.531 (65.976)	Top-5 acc 85.547 (85.318)	lr 0.00304
Train [93][2610/3239]	Time 0.240 (0.525)	Data Time 0.001 (0.016)	Loss 2.4111 (2.4092)	Entropy 0.56381 (0.56498)	Top-1 acc 68.750 (65.977)	Top-5 acc 85.156 (85.316)	lr 0.00304
Train [93][2620/3239]	Time 0.247 (0.524)	Data Time 0.001 (0.016)	Loss 2.5308 (2.4092)	Entropy 0.56422 (0.56497)	Top-1 acc 61.719 (65.975)	Top-5 acc 82.031 (85.315)	lr 0.00304
Train [93][2630/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.016)	Loss 2.3207 (2.4091)	Entropy 0.56423 (0.56497)	Top-1 acc 67.578 (65.981)	Top-5 acc 85.547 (85.318)	lr 0.00304
Train [93][2640/3239]	Time 0.251 (0.524)	Data Time 0.001 (0.016)	Loss 2.6099 (2.4090)	Entropy 0.56430 (0.56497)	Top-1 acc 61.719 (65.984)	Top-5 acc 82.422 (85.322)	lr 0.00303
Train [93][2650/3239]	Time 0.237 (0.523)	Data Time 0.001 (0.016)	Loss 2.3696 (2.4090)	Entropy 0.56432 (0.56496)	Top-1 acc 66.797 (65.984)	Top-5 acc 85.938 (85.322)	lr 0.00303
Train [93][2660/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.016)	Loss 2.3392 (2.4089)	Entropy 0.56451 (0.56496)	Top-1 acc 67.969 (65.987)	Top-5 acc 86.719 (85.326)	lr 0.00303
Train [93][2670/3239]	Time 0.231 (0.523)	Data Time 0.001 (0.016)	Loss 2.2670 (2.4089)	Entropy 0.56447 (0.56496)	Top-1 acc 69.531 (65.984)	Top-5 acc 87.891 (85.326)	lr 0.00303
Train [93][2680/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.016)	Loss 2.4609 (2.4087)	Entropy 0.56448 (0.56496)	Top-1 acc 65.234 (65.986)	Top-5 acc 86.328 (85.333)	lr 0.00303
Train [93][2690/3239]	Time 0.352 (0.522)	Data Time 0.001 (0.016)	Loss 2.3295 (2.4090)	Entropy 0.56444 (0.56496)	Top-1 acc 67.188 (65.980)	Top-5 acc 85.156 (85.327)	lr 0.00303
Train [93][2700/3239]	Time 0.248 (0.522)	Data Time 0.001 (0.015)	Loss 2.3786 (2.4090)	Entropy 0.56452 (0.56495)	Top-1 acc 66.016 (65.980)	Top-5 acc 85.938 (85.328)	lr 0.00303
Train [93][2710/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.015)	Loss 2.3005 (2.4089)	Entropy 0.56482 (0.56495)	Top-1 acc 68.359 (65.986)	Top-5 acc 87.109 (85.329)	lr 0.00303
Train [93][2720/3239]	Time 0.273 (0.521)	Data Time 0.002 (0.015)	Loss 2.3874 (2.4090)	Entropy 0.56469 (0.56495)	Top-1 acc 66.797 (65.983)	Top-5 acc 83.594 (85.329)	lr 0.00303
Train [93][2730/3239]	Time 0.284 (0.521)	Data Time 0.002 (0.015)	Loss 2.4860 (2.4092)	Entropy 0.56480 (0.56495)	Top-1 acc 64.844 (65.976)	Top-5 acc 83.203 (85.326)	lr 0.00303
Train [93][2740/3239]	Time 0.225 (0.521)	Data Time 0.001 (0.015)	Loss 2.3895 (2.4092)	Entropy 0.56466 (0.56495)	Top-1 acc 65.625 (65.975)	Top-5 acc 87.109 (85.325)	lr 0.00303
Train [93][2750/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.015)	Loss 2.3652 (2.4089)	Entropy 0.56430 (0.56495)	Top-1 acc 67.578 (65.980)	Top-5 acc 84.375 (85.329)	lr 0.00303
Train [93][2760/3239]	Time 0.350 (0.520)	Data Time 0.001 (0.015)	Loss 2.5523 (2.4088)	Entropy 0.56434 (0.56495)	Top-1 acc 65.234 (65.984)	Top-5 acc 82.422 (85.331)	lr 0.00303
Train [93][2770/3239]	Time 0.229 (0.520)	Data Time 0.001 (0.015)	Loss 2.5331 (2.4087)	Entropy 0.56443 (0.56495)	Top-1 acc 62.500 (65.984)	Top-5 acc 83.984 (85.333)	lr 0.00303
Train [93][2780/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.015)	Loss 2.4201 (2.4088)	Entropy 0.56419 (0.56494)	Top-1 acc 67.578 (65.980)	Top-5 acc 83.203 (85.328)	lr 0.00303
Train [93][2790/3239]	Time 0.240 (0.519)	Data Time 0.001 (0.015)	Loss 2.3266 (2.4087)	Entropy 0.56417 (0.56494)	Top-1 acc 67.578 (65.980)	Top-5 acc 85.938 (85.330)	lr 0.00302
Train [93][2800/3239]	Time 0.223 (0.519)	Data Time 0.001 (0.015)	Loss 2.4961 (2.4085)	Entropy 0.56393 (0.56494)	Top-1 acc 64.453 (65.986)	Top-5 acc 82.812 (85.333)	lr 0.00302
Train [93][2810/3239]	Time 0.253 (0.519)	Data Time 0.001 (0.015)	Loss 2.4685 (2.4084)	Entropy 0.56372 (0.56493)	Top-1 acc 65.625 (65.989)	Top-5 acc 82.031 (85.334)	lr 0.00302
Train [93][2820/3239]	Time 0.241 (0.519)	Data Time 0.001 (0.015)	Loss 2.3490 (2.4083)	Entropy 0.56399 (0.56493)	Top-1 acc 67.188 (65.993)	Top-5 acc 85.547 (85.333)	lr 0.00302
Train [93][2830/3239]	Time 0.341 (0.518)	Data Time 0.001 (0.015)	Loss 2.4705 (2.4083)	Entropy 0.56401 (0.56493)	Top-1 acc 64.062 (65.994)	Top-5 acc 83.594 (85.332)	lr 0.00302
Train [93][2840/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.015)	Loss 2.3856 (2.4082)	Entropy 0.56408 (0.56492)	Top-1 acc 67.969 (65.997)	Top-5 acc 85.547 (85.334)	lr 0.00302
Train [93][2850/3239]	Time 0.272 (0.518)	Data Time 0.001 (0.015)	Loss 2.4118 (2.4084)	Entropy 0.56405 (0.56492)	Top-1 acc 65.234 (65.994)	Top-5 acc 85.156 (85.329)	lr 0.00302
Train [93][2860/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.015)	Loss 2.4559 (2.4085)	Entropy 0.56447 (0.56492)	Top-1 acc 65.234 (65.990)	Top-5 acc 86.328 (85.328)	lr 0.00302
Train [93][2870/3239]	Time 0.260 (0.517)	Data Time 0.003 (0.015)	Loss 2.5477 (2.4086)	Entropy 0.56425 (0.56492)	Top-1 acc 64.844 (65.993)	Top-5 acc 84.375 (85.325)	lr 0.00302
Train [93][2880/3239]	Time 0.220 (0.517)	Data Time 0.001 (0.015)	Loss 2.4765 (2.4085)	Entropy 0.56440 (0.56491)	Top-1 acc 64.453 (65.994)	Top-5 acc 84.766 (85.325)	lr 0.00302
Train [93][2890/3239]	Time 0.242 (0.517)	Data Time 0.001 (0.015)	Loss 2.4029 (2.4087)	Entropy 0.56441 (0.56491)	Top-1 acc 65.234 (65.988)	Top-5 acc 86.328 (85.320)	lr 0.00302
Train [93][2900/3239]	Time 0.236 (0.516)	Data Time 0.001 (0.015)	Loss 2.1190 (2.4088)	Entropy 0.56388 (0.56491)	Top-1 acc 75.781 (65.989)	Top-5 acc 88.672 (85.321)	lr 0.00302
Train [93][2910/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.014)	Loss 2.2568 (2.4089)	Entropy 0.56351 (0.56491)	Top-1 acc 70.703 (65.984)	Top-5 acc 89.062 (85.322)	lr 0.00302
Train [93][2920/3239]	Time 0.335 (0.516)	Data Time 0.001 (0.014)	Loss 2.5986 (2.4090)	Entropy 0.56346 (0.56490)	Top-1 acc 59.766 (65.983)	Top-5 acc 83.203 (85.322)	lr 0.00302
Train [93][2930/3239]	Time 0.230 (0.515)	Data Time 0.001 (0.014)	Loss 2.3471 (2.4090)	Entropy 0.56335 (0.56490)	Top-1 acc 66.797 (65.980)	Top-5 acc 85.547 (85.320)	lr 0.00302
Train [93][2940/3239]	Time 0.231 (0.515)	Data Time 0.001 (0.014)	Loss 2.3547 (2.4092)	Entropy 0.56297 (0.56489)	Top-1 acc 69.922 (65.978)	Top-5 acc 87.109 (85.317)	lr 0.00301
Train [93][2950/3239]	Time 0.228 (0.515)	Data Time 0.001 (0.014)	Loss 2.3360 (2.4091)	Entropy 0.56282 (0.56488)	Top-1 acc 69.531 (65.976)	Top-5 acc 85.547 (85.318)	lr 0.00301
Train [93][2960/3239]	Time 0.243 (0.514)	Data Time 0.001 (0.014)	Loss 2.5315 (2.4090)	Entropy 0.56257 (0.56487)	Top-1 acc 62.500 (65.977)	Top-5 acc 82.812 (85.321)	lr 0.00301
Train [93][2970/3239]	Time 0.238 (0.514)	Data Time 0.002 (0.014)	Loss 2.4486 (2.4093)	Entropy 0.56244 (0.56487)	Top-1 acc 64.062 (65.973)	Top-5 acc 83.594 (85.316)	lr 0.00301
Train [93][2980/3239]	Time 0.227 (0.514)	Data Time 0.001 (0.014)	Loss 2.4875 (2.4093)	Entropy 0.56258 (0.56486)	Top-1 acc 63.281 (65.972)	Top-5 acc 84.766 (85.317)	lr 0.00301
Train [93][2990/3239]	Time 0.401 (0.514)	Data Time 0.002 (0.014)	Loss 2.8714 (2.4094)	Entropy 0.56277 (0.56485)	Top-1 acc 55.859 (65.968)	Top-5 acc 80.078 (85.317)	lr 0.00301
Train [93][3000/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.014)	Loss 2.3993 (2.4097)	Entropy 0.56265 (0.56484)	Top-1 acc 67.188 (65.963)	Top-5 acc 85.938 (85.312)	lr 0.00301
Train [93][3010/3239]	Time 0.240 (0.513)	Data Time 0.001 (0.014)	Loss 2.2120 (2.4097)	Entropy 0.56244 (0.56484)	Top-1 acc 72.656 (65.964)	Top-5 acc 88.281 (85.313)	lr 0.00301
Train [93][3020/3239]	Time 0.272 (0.513)	Data Time 0.001 (0.014)	Loss 2.4366 (2.4098)	Entropy 0.56221 (0.56483)	Top-1 acc 66.797 (65.963)	Top-5 acc 84.766 (85.310)	lr 0.00301
Train [93][3030/3239]	Time 0.247 (0.513)	Data Time 0.001 (0.014)	Loss 2.5097 (2.4097)	Entropy 0.56219 (0.56482)	Top-1 acc 62.891 (65.963)	Top-5 acc 83.984 (85.311)	lr 0.00301
Train [93][3040/3239]	Time 0.245 (0.513)	Data Time 0.001 (0.014)	Loss 2.5686 (2.4096)	Entropy 0.56230 (0.56481)	Top-1 acc 62.109 (65.966)	Top-5 acc 83.594 (85.311)	lr 0.00301
Train [93][3050/3239]	Time 0.229 (0.512)	Data Time 0.001 (0.014)	Loss 2.3699 (2.4095)	Entropy 0.56263 (0.56480)	Top-1 acc 66.797 (65.968)	Top-5 acc 85.938 (85.312)	lr 0.00301
Train [93][3060/3239]	Time 0.244 (0.512)	Data Time 0.001 (0.014)	Loss 2.4201 (2.4096)	Entropy 0.56257 (0.56480)	Top-1 acc 67.578 (65.967)	Top-5 acc 83.984 (85.309)	lr 0.00301
Train [93][3070/3239]	Time 0.234 (0.512)	Data Time 0.001 (0.014)	Loss 2.2429 (2.4096)	Entropy 0.56275 (0.56479)	Top-1 acc 65.625 (65.968)	Top-5 acc 93.750 (85.310)	lr 0.00301
Train [93][3080/3239]	Time 0.343 (0.511)	Data Time 0.001 (0.014)	Loss 2.3328 (2.4095)	Entropy 0.56271 (0.56478)	Top-1 acc 66.797 (65.970)	Top-5 acc 87.500 (85.311)	lr 0.00301
Train [93][3090/3239]	Time 0.237 (0.511)	Data Time 0.001 (0.014)	Loss 2.4196 (2.4097)	Entropy 0.56275 (0.56478)	Top-1 acc 64.453 (65.962)	Top-5 acc 85.156 (85.308)	lr 0.00300
Train [93][3100/3239]	Time 0.235 (0.511)	Data Time 0.001 (0.014)	Loss 2.3885 (2.4099)	Entropy 0.56257 (0.56477)	Top-1 acc 64.453 (65.955)	Top-5 acc 83.984 (85.302)	lr 0.00300
Train [93][3110/3239]	Time 0.236 (0.511)	Data Time 0.001 (0.014)	Loss 2.2259 (2.4097)	Entropy 0.56290 (0.56476)	Top-1 acc 67.969 (65.960)	Top-5 acc 88.672 (85.306)	lr 0.00300
Train [93][3120/3239]	Time 0.233 (0.510)	Data Time 0.001 (0.014)	Loss 2.3221 (2.4097)	Entropy 0.56275 (0.56476)	Top-1 acc 69.531 (65.962)	Top-5 acc 87.891 (85.304)	lr 0.00300
Train [93][3130/3239]	Time 0.224 (0.510)	Data Time 0.001 (0.014)	Loss 2.2660 (2.4095)	Entropy 0.56270 (0.56475)	Top-1 acc 71.094 (65.969)	Top-5 acc 84.766 (85.307)	lr 0.00300
Train [93][3140/3239]	Time 0.235 (0.510)	Data Time 0.001 (0.014)	Loss 2.3680 (2.4095)	Entropy 0.56250 (0.56474)	Top-1 acc 65.625 (65.970)	Top-5 acc 85.156 (85.306)	lr 0.00300
Train [93][3150/3239]	Time 0.333 (0.510)	Data Time 0.001 (0.013)	Loss 2.3857 (2.4093)	Entropy 0.56269 (0.56474)	Top-1 acc 65.234 (65.974)	Top-5 acc 87.109 (85.308)	lr 0.00300
Train [93][3160/3239]	Time 0.239 (0.509)	Data Time 0.001 (0.013)	Loss 2.2753 (2.4092)	Entropy 0.56296 (0.56473)	Top-1 acc 69.922 (65.977)	Top-5 acc 85.938 (85.310)	lr 0.00300
Train [93][3170/3239]	Time 0.240 (0.509)	Data Time 0.001 (0.013)	Loss 2.3464 (2.4091)	Entropy 0.56307 (0.56473)	Top-1 acc 69.141 (65.984)	Top-5 acc 86.328 (85.312)	lr 0.00300
Train [93][3180/3239]	Time 0.226 (0.509)	Data Time 0.000 (0.013)	Loss 2.4162 (2.4090)	Entropy 0.56272 (0.56472)	Top-1 acc 66.406 (65.989)	Top-5 acc 84.375 (85.310)	lr 0.00300
Train [93][3190/3239]	Time 0.352 (0.524)	Data Time 0.000 (0.013)	Loss 2.3717 (2.4091)	Entropy 0.56281 (0.56471)	Top-1 acc 66.016 (65.989)	Top-5 acc 85.156 (85.309)	lr 0.00300
Train [93][3200/3239]	Time 0.236 (0.524)	Data Time 0.000 (0.013)	Loss 2.3737 (2.4091)	Entropy 0.56323 (0.56471)	Top-1 acc 66.406 (65.991)	Top-5 acc 84.375 (85.310)	lr 0.00300
Train [93][3210/3239]	Time 0.230 (0.524)	Data Time 0.000 (0.013)	Loss 2.4181 (2.4090)	Entropy 0.56300 (0.56470)	Top-1 acc 69.531 (65.994)	Top-5 acc 85.156 (85.312)	lr 0.00300
Train [93][3220/3239]	Time 0.333 (0.524)	Data Time 0.000 (0.013)	Loss 2.5292 (2.4090)	Entropy 0.56297 (0.56470)	Top-1 acc 63.672 (65.995)	Top-5 acc 82.031 (85.311)	lr 0.00300
Train [93][3230/3239]	Time 0.297 (0.524)	Data Time 0.000 (0.013)	Loss 2.2820 (2.4089)	Entropy 0.56300 (0.56469)	Top-1 acc 69.531 (65.999)	Top-5 acc 89.844 (85.314)	lr 0.00300
Train [93][3239/3239]	Time 0.964 (0.523)	Data Time 0.000 (0.013)	Loss 2.8218 (2.4090)	Entropy 0.56279 (0.56469)	Top-1 acc 54.321 (65.996)	Top-5 acc 75.309 (85.310)	lr 0.00299
==========Valid [93/120]	loss 1.219	top-1 acc 71.947 (71.947)	top-5 acc 89.938	Train top-1 65.996	top-5 85.310	Entropy 0.56279	Latency-None: 0.000ms	Flops: 539.00M
Train [94][0/3239]	Time 45.789 (45.789)	Data Time 44.359 (44.359)	Loss 2.3248 (2.3248)	Entropy 0.56285 (0.56285)	Top-1 acc 67.969 (67.969)	Top-5 acc 87.891 (87.891)	lr 0.00299
Train [94][10/3239]	Time 0.226 (4.772)	Data Time 0.001 (4.136)	Loss 2.4547 (2.4356)	Entropy 0.56300 (0.56293)	Top-1 acc 63.672 (65.270)	Top-5 acc 83.203 (85.050)	lr 0.00299
Train [94][20/3239]	Time 0.233 (2.707)	Data Time 0.002 (2.167)	Loss 2.3423 (2.4324)	Entropy 0.56271 (0.56292)	Top-1 acc 70.703 (65.644)	Top-5 acc 86.719 (85.547)	lr 0.00299
Train [94][30/3239]	Time 0.240 (1.982)	Data Time 0.001 (1.469)	Loss 2.2285 (2.4149)	Entropy 0.56295 (0.56289)	Top-1 acc 69.531 (65.814)	Top-5 acc 87.891 (85.496)	lr 0.00299
Train [94][40/3239]	Time 0.240 (1.617)	Data Time 0.001 (1.111)	Loss 2.5030 (2.4301)	Entropy 0.56273 (0.56290)	Top-1 acc 62.500 (65.558)	Top-5 acc 83.203 (85.042)	lr 0.00299
Train [94][50/3239]	Time 0.237 (1.388)	Data Time 0.001 (0.893)	Loss 2.3096 (2.4254)	Entropy 0.56254 (0.56286)	Top-1 acc 68.750 (65.740)	Top-5 acc 87.891 (84.949)	lr 0.00299
Train [94][60/3239]	Time 0.232 (1.231)	Data Time 0.001 (0.747)	Loss 2.4276 (2.4237)	Entropy 0.56260 (0.56281)	Top-1 acc 63.672 (65.753)	Top-5 acc 85.156 (84.964)	lr 0.00299
Train [94][70/3239]	Time 0.245 (1.121)	Data Time 0.001 (0.642)	Loss 2.3521 (2.4187)	Entropy 0.56258 (0.56277)	Top-1 acc 67.578 (65.961)	Top-5 acc 87.109 (85.019)	lr 0.00299
Train [94][80/3239]	Time 0.238 (1.038)	Data Time 0.002 (0.563)	Loss 2.4308 (2.4179)	Entropy 0.56261 (0.56275)	Top-1 acc 67.188 (65.996)	Top-5 acc 84.375 (85.089)	lr 0.00299
Train [94][90/3239]	Time 0.243 (0.974)	Data Time 0.001 (0.501)	Loss 2.5193 (2.4170)	Entropy 0.56290 (0.56276)	Top-1 acc 63.672 (66.037)	Top-5 acc 80.859 (85.109)	lr 0.00299
Train [94][100/3239]	Time 0.259 (0.929)	Data Time 0.002 (0.452)	Loss 2.6664 (2.4152)	Entropy 0.56246 (0.56274)	Top-1 acc 59.375 (66.105)	Top-5 acc 80.859 (85.203)	lr 0.00299
Train [94][110/3239]	Time 0.235 (0.894)	Data Time 0.002 (0.411)	Loss 2.2445 (2.4101)	Entropy 0.56226 (0.56271)	Top-1 acc 71.094 (66.223)	Top-5 acc 89.453 (85.265)	lr 0.00299
Train [94][120/3239]	Time 0.236 (0.856)	Data Time 0.001 (0.378)	Loss 2.4972 (2.4064)	Entropy 0.56239 (0.56267)	Top-1 acc 61.328 (66.300)	Top-5 acc 83.984 (85.366)	lr 0.00299
Train [94][130/3239]	Time 0.221 (0.822)	Data Time 0.001 (0.349)	Loss 2.3177 (2.4043)	Entropy 0.56237 (0.56264)	Top-1 acc 67.188 (66.239)	Top-5 acc 86.328 (85.395)	lr 0.00299
Train [94][140/3239]	Time 0.350 (0.793)	Data Time 0.002 (0.324)	Loss 2.2395 (2.4022)	Entropy 0.56209 (0.56261)	Top-1 acc 73.047 (66.290)	Top-5 acc 88.672 (85.444)	lr 0.00299
Train [94][150/3239]	Time 0.218 (0.767)	Data Time 0.001 (0.303)	Loss 2.5208 (2.4009)	Entropy 0.56213 (0.56258)	Top-1 acc 61.719 (66.313)	Top-5 acc 81.250 (85.464)	lr 0.00299
Train [94][160/3239]	Time 0.239 (0.745)	Data Time 0.002 (0.284)	Loss 2.6767 (2.3996)	Entropy 0.56213 (0.56255)	Top-1 acc 59.375 (66.331)	Top-5 acc 80.078 (85.455)	lr 0.00298
Train [94][170/3239]	Time 0.233 (0.726)	Data Time 0.001 (0.268)	Loss 2.1081 (2.3977)	Entropy 0.56238 (0.56253)	Top-1 acc 70.703 (66.342)	Top-5 acc 90.625 (85.469)	lr 0.00298
Train [94][180/3239]	Time 0.231 (0.709)	Data Time 0.001 (0.253)	Loss 2.2859 (2.3976)	Entropy 0.56230 (0.56253)	Top-1 acc 68.750 (66.285)	Top-5 acc 87.109 (85.448)	lr 0.00298
Train [94][190/3239]	Time 0.241 (0.693)	Data Time 0.001 (0.240)	Loss 2.3857 (2.3984)	Entropy 0.56222 (0.56251)	Top-1 acc 66.797 (66.234)	Top-5 acc 86.328 (85.449)	lr 0.00298
Train [94][200/3239]	Time 0.231 (0.679)	Data Time 0.001 (0.228)	Loss 2.6104 (2.3972)	Entropy 0.56213 (0.56249)	Top-1 acc 61.719 (66.247)	Top-5 acc 81.641 (85.465)	lr 0.00298
Train [94][210/3239]	Time 0.439 (0.667)	Data Time 0.002 (0.217)	Loss 2.2098 (2.3969)	Entropy 0.56211 (0.56247)	Top-1 acc 71.875 (66.269)	Top-5 acc 88.281 (85.482)	lr 0.00298
Train [94][220/3239]	Time 0.230 (0.657)	Data Time 0.002 (0.207)	Loss 2.4791 (2.3941)	Entropy 0.56210 (0.56246)	Top-1 acc 63.281 (66.284)	Top-5 acc 84.766 (85.572)	lr 0.00298
Train [94][230/3239]	Time 0.273 (0.647)	Data Time 0.001 (0.198)	Loss 2.5312 (2.3948)	Entropy 0.56199 (0.56244)	Top-1 acc 65.234 (66.320)	Top-5 acc 82.812 (85.581)	lr 0.00298
Train [94][240/3239]	Time 0.230 (0.638)	Data Time 0.001 (0.190)	Loss 2.4116 (2.3968)	Entropy 0.56207 (0.56242)	Top-1 acc 68.750 (66.294)	Top-5 acc 84.375 (85.549)	lr 0.00298
Train [94][250/3239]	Time 0.295 (0.631)	Data Time 0.002 (0.183)	Loss 2.4788 (2.3952)	Entropy 0.56236 (0.56241)	Top-1 acc 64.844 (66.374)	Top-5 acc 84.766 (85.580)	lr 0.00298
Train [94][260/3239]	Time 0.230 (0.627)	Data Time 0.001 (0.176)	Loss 2.1652 (2.3940)	Entropy 0.56239 (0.56241)	Top-1 acc 74.609 (66.433)	Top-5 acc 89.453 (85.598)	lr 0.00298
Train [94][270/3239]	Time 0.217 (0.619)	Data Time 0.001 (0.169)	Loss 2.4751 (2.3940)	Entropy 0.56254 (0.56241)	Top-1 acc 60.547 (66.389)	Top-5 acc 85.156 (85.594)	lr 0.00298
Train [94][280/3239]	Time 0.221 (0.613)	Data Time 0.001 (0.163)	Loss 2.5345 (2.3941)	Entropy 0.56262 (0.56242)	Top-1 acc 62.500 (66.397)	Top-5 acc 83.203 (85.590)	lr 0.00298
Train [94][290/3239]	Time 0.218 (0.607)	Data Time 0.001 (0.158)	Loss 2.1869 (2.3929)	Entropy 0.56280 (0.56243)	Top-1 acc 69.531 (66.448)	Top-5 acc 89.453 (85.627)	lr 0.00298
Train [94][300/3239]	Time 0.366 (0.601)	Data Time 0.001 (0.153)	Loss 2.4591 (2.3932)	Entropy 0.56236 (0.56243)	Top-1 acc 62.500 (66.441)	Top-5 acc 84.375 (85.625)	lr 0.00298
Train [94][310/3239]	Time 0.233 (0.595)	Data Time 0.001 (0.148)	Loss 2.4107 (2.3943)	Entropy 0.56250 (0.56243)	Top-1 acc 66.406 (66.410)	Top-5 acc 87.109 (85.598)	lr 0.00297
Train [94][320/3239]	Time 0.257 (0.589)	Data Time 0.001 (0.143)	Loss 2.4036 (2.3957)	Entropy 0.56281 (0.56244)	Top-1 acc 66.797 (66.371)	Top-5 acc 86.719 (85.587)	lr 0.00297
Train [94][330/3239]	Time 0.226 (0.584)	Data Time 0.001 (0.139)	Loss 2.4534 (2.3956)	Entropy 0.56267 (0.56245)	Top-1 acc 62.109 (66.360)	Top-5 acc 85.547 (85.576)	lr 0.00297
Train [94][340/3239]	Time 0.247 (0.579)	Data Time 0.002 (0.135)	Loss 2.1564 (2.3955)	Entropy 0.56283 (0.56246)	Top-1 acc 72.266 (66.339)	Top-5 acc 89.062 (85.553)	lr 0.00297
Train [94][350/3239]	Time 0.235 (0.574)	Data Time 0.001 (0.131)	Loss 2.3888 (2.3940)	Entropy 0.56258 (0.56246)	Top-1 acc 66.016 (66.384)	Top-5 acc 85.938 (85.580)	lr 0.00297
Train [94][360/3239]	Time 0.228 (0.570)	Data Time 0.001 (0.128)	Loss 2.3516 (2.3930)	Entropy 0.56253 (0.56246)	Top-1 acc 69.141 (66.392)	Top-5 acc 83.203 (85.601)	lr 0.00297
Train [94][370/3239]	Time 0.345 (0.565)	Data Time 0.001 (0.124)	Loss 2.2632 (2.3926)	Entropy 0.56252 (0.56247)	Top-1 acc 70.703 (66.399)	Top-5 acc 88.672 (85.606)	lr 0.00297
Train [94][380/3239]	Time 0.219 (0.562)	Data Time 0.001 (0.121)	Loss 2.5835 (2.3941)	Entropy 0.56250 (0.56247)	Top-1 acc 61.719 (66.374)	Top-5 acc 84.375 (85.589)	lr 0.00297
Train [94][390/3239]	Time 0.228 (0.558)	Data Time 0.001 (0.118)	Loss 2.3661 (2.3935)	Entropy 0.56238 (0.56246)	Top-1 acc 66.797 (66.379)	Top-5 acc 85.547 (85.606)	lr 0.00297
Train [94][400/3239]	Time 0.259 (0.554)	Data Time 0.001 (0.115)	Loss 2.3241 (2.3933)	Entropy 0.56252 (0.56246)	Top-1 acc 71.094 (66.390)	Top-5 acc 85.938 (85.592)	lr 0.00297
Train [94][410/3239]	Time 0.208 (0.551)	Data Time 0.001 (0.112)	Loss 2.3330 (2.3928)	Entropy 0.56265 (0.56247)	Top-1 acc 67.969 (66.410)	Top-5 acc 85.547 (85.598)	lr 0.00297
Train [94][420/3239]	Time 0.245 (0.548)	Data Time 0.001 (0.110)	Loss 2.2373 (2.3937)	Entropy 0.56251 (0.56247)	Top-1 acc 73.047 (66.429)	Top-5 acc 86.328 (85.579)	lr 0.00297
Train [94][430/3239]	Time 0.229 (0.544)	Data Time 0.001 (0.107)	Loss 2.3927 (2.3940)	Entropy 0.56263 (0.56247)	Top-1 acc 64.844 (66.410)	Top-5 acc 85.938 (85.584)	lr 0.00297
Train [94][440/3239]	Time 0.232 (0.542)	Data Time 0.001 (0.105)	Loss 2.4615 (2.3956)	Entropy 0.56266 (0.56247)	Top-1 acc 64.453 (66.378)	Top-5 acc 83.594 (85.550)	lr 0.00297
Train [94][450/3239]	Time 0.286 (0.540)	Data Time 0.002 (0.102)	Loss 2.3889 (2.3955)	Entropy 0.56251 (0.56247)	Top-1 acc 68.359 (66.378)	Top-5 acc 87.891 (85.565)	lr 0.00297
Train [94][460/3239]	Time 0.281 (0.540)	Data Time 0.001 (0.100)	Loss 2.4215 (2.3959)	Entropy 0.56241 (0.56248)	Top-1 acc 64.062 (66.350)	Top-5 acc 83.984 (85.556)	lr 0.00296
Train [94][470/3239]	Time 0.355 (0.541)	Data Time 0.002 (0.098)	Loss 2.3613 (2.3958)	Entropy 0.56266 (0.56248)	Top-1 acc 68.750 (66.347)	Top-5 acc 88.672 (85.552)	lr 0.00296
Train [94][480/3239]	Time 0.238 (0.539)	Data Time 0.001 (0.096)	Loss 2.6837 (2.3961)	Entropy 0.56288 (0.56248)	Top-1 acc 59.375 (66.317)	Top-5 acc 81.250 (85.542)	lr 0.00296
Train [94][490/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.094)	Loss 2.3616 (2.3964)	Entropy 0.56309 (0.56249)	Top-1 acc 66.016 (66.321)	Top-5 acc 87.500 (85.545)	lr 0.00296
Train [94][500/3239]	Time 0.231 (0.534)	Data Time 0.001 (0.092)	Loss 2.1209 (2.3952)	Entropy 0.56309 (0.56250)	Top-1 acc 76.172 (66.356)	Top-5 acc 91.016 (85.568)	lr 0.00296
Train [94][510/3239]	Time 0.238 (0.532)	Data Time 0.001 (0.091)	Loss 2.3538 (2.3948)	Entropy 0.56266 (0.56251)	Top-1 acc 65.234 (66.358)	Top-5 acc 88.281 (85.571)	lr 0.00296
Train [94][520/3239]	Time 0.231 (0.531)	Data Time 0.001 (0.089)	Loss 2.4358 (2.3956)	Entropy 0.56248 (0.56251)	Top-1 acc 63.672 (66.334)	Top-5 acc 85.156 (85.560)	lr 0.00296
Train [94][530/3239]	Time 0.352 (0.528)	Data Time 0.001 (0.087)	Loss 2.3234 (2.3963)	Entropy 0.56257 (0.56252)	Top-1 acc 67.969 (66.313)	Top-5 acc 85.156 (85.541)	lr 0.00296
Train [94][540/3239]	Time 0.238 (0.527)	Data Time 0.001 (0.086)	Loss 2.3536 (2.3969)	Entropy 0.56241 (0.56252)	Top-1 acc 68.750 (66.296)	Top-5 acc 86.719 (85.534)	lr 0.00296
Train [94][550/3239]	Time 0.226 (0.525)	Data Time 0.001 (0.084)	Loss 2.4700 (2.3968)	Entropy 0.56243 (0.56251)	Top-1 acc 67.578 (66.296)	Top-5 acc 85.547 (85.539)	lr 0.00296
Train [94][560/3239]	Time 0.280 (0.524)	Data Time 0.001 (0.083)	Loss 2.4174 (2.3965)	Entropy 0.56247 (0.56251)	Top-1 acc 66.016 (66.304)	Top-5 acc 83.594 (85.534)	lr 0.00296
Train [94][570/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.081)	Loss 2.2206 (2.3956)	Entropy 0.56265 (0.56251)	Top-1 acc 70.312 (66.326)	Top-5 acc 88.672 (85.549)	lr 0.00296
Train [94][580/3239]	Time 0.231 (0.520)	Data Time 0.001 (0.080)	Loss 2.3322 (2.3960)	Entropy 0.56261 (0.56251)	Top-1 acc 71.875 (66.312)	Top-5 acc 85.547 (85.534)	lr 0.00296
Train [94][590/3239]	Time 0.223 (0.518)	Data Time 0.001 (0.079)	Loss 2.3064 (2.3963)	Entropy 0.56237 (0.56251)	Top-1 acc 70.703 (66.303)	Top-5 acc 86.719 (85.531)	lr 0.00296
Train [94][600/3239]	Time 0.311 (0.516)	Data Time 0.001 (0.077)	Loss 2.2859 (2.3953)	Entropy 0.56254 (0.56251)	Top-1 acc 67.969 (66.330)	Top-5 acc 89.062 (85.553)	lr 0.00296
Train [94][610/3239]	Time 0.268 (0.603)	Data Time 0.002 (0.076)	Loss 2.2371 (2.3942)	Entropy 0.56267 (0.56251)	Top-1 acc 73.047 (66.349)	Top-5 acc 86.719 (85.572)	lr 0.00296
Train [94][620/3239]	Time 0.306 (0.601)	Data Time 0.002 (0.075)	Loss 2.3013 (2.3941)	Entropy 0.56289 (0.56252)	Top-1 acc 67.188 (66.353)	Top-5 acc 87.500 (85.569)	lr 0.00295
Train [94][630/3239]	Time 0.261 (0.598)	Data Time 0.002 (0.074)	Loss 2.2662 (2.3943)	Entropy 0.56279 (0.56252)	Top-1 acc 69.531 (66.351)	Top-5 acc 88.672 (85.562)	lr 0.00295
Train [94][640/3239]	Time 0.234 (0.596)	Data Time 0.002 (0.073)	Loss 2.2422 (2.3943)	Entropy 0.56240 (0.56252)	Top-1 acc 72.266 (66.356)	Top-5 acc 87.891 (85.565)	lr 0.00295
Train [94][650/3239]	Time 0.262 (0.594)	Data Time 0.001 (0.072)	Loss 2.2641 (2.3935)	Entropy 0.56256 (0.56252)	Top-1 acc 69.141 (66.374)	Top-5 acc 88.281 (85.597)	lr 0.00295
Train [94][660/3239]	Time 0.232 (0.591)	Data Time 0.001 (0.070)	Loss 2.3946 (2.3934)	Entropy 0.56276 (0.56252)	Top-1 acc 67.578 (66.381)	Top-5 acc 88.281 (85.597)	lr 0.00295
Train [94][670/3239]	Time 0.230 (0.589)	Data Time 0.001 (0.069)	Loss 2.2397 (2.3939)	Entropy 0.56262 (0.56253)	Top-1 acc 73.828 (66.361)	Top-5 acc 89.062 (85.586)	lr 0.00295
Train [94][680/3239]	Time 0.250 (0.587)	Data Time 0.001 (0.068)	Loss 2.3581 (2.3940)	Entropy 0.56237 (0.56253)	Top-1 acc 63.672 (66.348)	Top-5 acc 87.891 (85.591)	lr 0.00295
Train [94][690/3239]	Time 0.363 (0.585)	Data Time 0.001 (0.068)	Loss 2.4149 (2.3942)	Entropy 0.56205 (0.56252)	Top-1 acc 67.578 (66.335)	Top-5 acc 82.031 (85.589)	lr 0.00295
Train [94][700/3239]	Time 0.237 (0.583)	Data Time 0.001 (0.067)	Loss 2.3650 (2.3937)	Entropy 0.56188 (0.56251)	Top-1 acc 67.578 (66.332)	Top-5 acc 88.281 (85.609)	lr 0.00295
Train [94][710/3239]	Time 0.226 (0.580)	Data Time 0.001 (0.066)	Loss 2.2130 (2.3934)	Entropy 0.56181 (0.56250)	Top-1 acc 68.359 (66.341)	Top-5 acc 89.844 (85.608)	lr 0.00295
Train [94][720/3239]	Time 0.237 (0.578)	Data Time 0.001 (0.065)	Loss 2.5897 (2.3920)	Entropy 0.56137 (0.56249)	Top-1 acc 62.891 (66.376)	Top-5 acc 82.812 (85.629)	lr 0.00295
Train [94][730/3239]	Time 0.233 (0.576)	Data Time 0.001 (0.064)	Loss 2.4738 (2.3921)	Entropy 0.56116 (0.56248)	Top-1 acc 63.281 (66.359)	Top-5 acc 85.547 (85.628)	lr 0.00295
Train [94][740/3239]	Time 0.233 (0.574)	Data Time 0.001 (0.063)	Loss 2.3762 (2.3930)	Entropy 0.56129 (0.56246)	Top-1 acc 67.188 (66.346)	Top-5 acc 87.109 (85.606)	lr 0.00295
Train [94][750/3239]	Time 0.229 (0.572)	Data Time 0.001 (0.062)	Loss 2.3826 (2.3934)	Entropy 0.56147 (0.56244)	Top-1 acc 67.969 (66.341)	Top-5 acc 84.375 (85.609)	lr 0.00295
Train [94][760/3239]	Time 0.339 (0.570)	Data Time 0.001 (0.061)	Loss 2.3179 (2.3948)	Entropy 0.56147 (0.56243)	Top-1 acc 69.141 (66.326)	Top-5 acc 88.281 (85.581)	lr 0.00295
Train [94][770/3239]	Time 0.242 (0.568)	Data Time 0.001 (0.061)	Loss 2.6808 (2.3949)	Entropy 0.56170 (0.56242)	Top-1 acc 57.422 (66.318)	Top-5 acc 81.641 (85.576)	lr 0.00294
Train [94][780/3239]	Time 0.252 (0.567)	Data Time 0.001 (0.060)	Loss 2.0527 (2.3942)	Entropy 0.56166 (0.56241)	Top-1 acc 73.047 (66.338)	Top-5 acc 90.625 (85.585)	lr 0.00294
Train [94][790/3239]	Time 0.251 (0.565)	Data Time 0.003 (0.059)	Loss 2.4621 (2.3954)	Entropy 0.56155 (0.56240)	Top-1 acc 66.406 (66.308)	Top-5 acc 85.156 (85.569)	lr 0.00294
Train [94][800/3239]	Time 0.228 (0.563)	Data Time 0.002 (0.058)	Loss 2.4492 (2.3956)	Entropy 0.56103 (0.56239)	Top-1 acc 63.672 (66.301)	Top-5 acc 85.547 (85.564)	lr 0.00294
Train [94][810/3239]	Time 0.229 (0.562)	Data Time 0.001 (0.058)	Loss 2.5008 (2.3956)	Entropy 0.56075 (0.56237)	Top-1 acc 63.672 (66.306)	Top-5 acc 84.766 (85.572)	lr 0.00294
Train [94][820/3239]	Time 0.234 (0.561)	Data Time 0.001 (0.057)	Loss 2.5340 (2.3956)	Entropy 0.56065 (0.56235)	Top-1 acc 62.891 (66.298)	Top-5 acc 82.031 (85.567)	lr 0.00294
Train [94][830/3239]	Time 0.235 (0.559)	Data Time 0.002 (0.056)	Loss 2.3999 (2.3957)	Entropy 0.56040 (0.56232)	Top-1 acc 66.016 (66.294)	Top-5 acc 83.594 (85.563)	lr 0.00294
Train [94][840/3239]	Time 0.227 (0.558)	Data Time 0.001 (0.056)	Loss 2.2988 (2.3955)	Entropy 0.56043 (0.56230)	Top-1 acc 71.875 (66.300)	Top-5 acc 85.938 (85.569)	lr 0.00294
Train [94][850/3239]	Time 0.349 (0.556)	Data Time 0.001 (0.055)	Loss 2.4334 (2.3960)	Entropy 0.56043 (0.56228)	Top-1 acc 61.719 (66.284)	Top-5 acc 85.547 (85.559)	lr 0.00294
Train [94][860/3239]	Time 0.237 (0.555)	Data Time 0.002 (0.054)	Loss 2.3124 (2.3953)	Entropy 0.56048 (0.56226)	Top-1 acc 70.312 (66.306)	Top-5 acc 87.109 (85.574)	lr 0.00294
Train [94][870/3239]	Time 0.286 (0.554)	Data Time 0.002 (0.054)	Loss 2.3481 (2.3962)	Entropy 0.56046 (0.56224)	Top-1 acc 65.234 (66.275)	Top-5 acc 88.672 (85.558)	lr 0.00294
Train [94][880/3239]	Time 0.247 (0.554)	Data Time 0.001 (0.053)	Loss 2.4143 (2.3960)	Entropy 0.56054 (0.56222)	Top-1 acc 63.672 (66.276)	Top-5 acc 86.719 (85.566)	lr 0.00294
Train [94][890/3239]	Time 0.229 (0.552)	Data Time 0.001 (0.053)	Loss 2.5789 (2.3963)	Entropy 0.56068 (0.56220)	Top-1 acc 61.719 (66.263)	Top-5 acc 80.859 (85.565)	lr 0.00294
Train [94][900/3239]	Time 0.221 (0.551)	Data Time 0.001 (0.052)	Loss 2.2224 (2.3963)	Entropy 0.56068 (0.56218)	Top-1 acc 71.875 (66.270)	Top-5 acc 87.891 (85.564)	lr 0.00294
Train [94][910/3239]	Time 0.236 (0.550)	Data Time 0.002 (0.052)	Loss 2.4126 (2.3964)	Entropy 0.56088 (0.56217)	Top-1 acc 65.625 (66.257)	Top-5 acc 85.547 (85.565)	lr 0.00294
Train [94][920/3239]	Time 0.360 (0.548)	Data Time 0.001 (0.051)	Loss 2.5382 (2.3969)	Entropy 0.56097 (0.56216)	Top-1 acc 61.719 (66.251)	Top-5 acc 82.031 (85.559)	lr 0.00293
Train [94][930/3239]	Time 0.243 (0.547)	Data Time 0.001 (0.051)	Loss 2.3402 (2.3971)	Entropy 0.56098 (0.56214)	Top-1 acc 67.969 (66.244)	Top-5 acc 85.938 (85.547)	lr 0.00293
Train [94][940/3239]	Time 0.267 (0.546)	Data Time 0.001 (0.050)	Loss 2.2928 (2.3963)	Entropy 0.56057 (0.56213)	Top-1 acc 70.703 (66.268)	Top-5 acc 87.891 (85.563)	lr 0.00293
Train [94][950/3239]	Time 0.244 (0.545)	Data Time 0.001 (0.049)	Loss 2.1938 (2.3957)	Entropy 0.56060 (0.56211)	Top-1 acc 71.875 (66.285)	Top-5 acc 87.891 (85.569)	lr 0.00293
Train [94][960/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.049)	Loss 2.3661 (2.3954)	Entropy 0.56070 (0.56210)	Top-1 acc 69.531 (66.289)	Top-5 acc 86.328 (85.574)	lr 0.00293
Train [94][970/3239]	Time 0.238 (0.543)	Data Time 0.001 (0.049)	Loss 2.4858 (2.3958)	Entropy 0.56057 (0.56208)	Top-1 acc 64.844 (66.276)	Top-5 acc 82.422 (85.561)	lr 0.00293
Train [94][980/3239]	Time 0.261 (0.542)	Data Time 0.001 (0.048)	Loss 2.3885 (2.3951)	Entropy 0.56077 (0.56207)	Top-1 acc 66.016 (66.282)	Top-5 acc 86.328 (85.576)	lr 0.00293
Train [94][990/3239]	Time 0.242 (0.541)	Data Time 0.001 (0.048)	Loss 2.1562 (2.3949)	Entropy 0.56061 (0.56206)	Top-1 acc 71.094 (66.282)	Top-5 acc 90.625 (85.580)	lr 0.00293
Train [94][1000/3239]	Time 0.238 (0.540)	Data Time 0.001 (0.047)	Loss 2.3649 (2.3949)	Entropy 0.56049 (0.56204)	Top-1 acc 67.578 (66.283)	Top-5 acc 85.547 (85.581)	lr 0.00293
Train [94][1010/3239]	Time 0.261 (0.539)	Data Time 0.001 (0.047)	Loss 2.5054 (2.3951)	Entropy 0.56079 (0.56203)	Top-1 acc 66.016 (66.271)	Top-5 acc 85.156 (85.582)	lr 0.00293
Train [94][1020/3239]	Time 0.237 (0.538)	Data Time 0.001 (0.046)	Loss 2.4118 (2.3952)	Entropy 0.56128 (0.56202)	Top-1 acc 63.281 (66.266)	Top-5 acc 84.375 (85.580)	lr 0.00293
Train [94][1030/3239]	Time 0.235 (0.537)	Data Time 0.001 (0.046)	Loss 2.5224 (2.3951)	Entropy 0.56136 (0.56201)	Top-1 acc 61.719 (66.262)	Top-5 acc 83.984 (85.579)	lr 0.00293
Train [94][1040/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.045)	Loss 2.4329 (2.3957)	Entropy 0.56162 (0.56200)	Top-1 acc 65.625 (66.255)	Top-5 acc 82.812 (85.565)	lr 0.00293
Train [94][1050/3239]	Time 0.236 (0.535)	Data Time 0.001 (0.045)	Loss 2.3213 (2.3959)	Entropy 0.56147 (0.56200)	Top-1 acc 66.797 (66.245)	Top-5 acc 85.938 (85.565)	lr 0.00293
Train [94][1060/3239]	Time 0.247 (0.534)	Data Time 0.001 (0.045)	Loss 2.5409 (2.3957)	Entropy 0.56173 (0.56199)	Top-1 acc 62.109 (66.247)	Top-5 acc 80.859 (85.566)	lr 0.00293
Train [94][1070/3239]	Time 0.227 (0.533)	Data Time 0.001 (0.044)	Loss 2.4149 (2.3958)	Entropy 0.56170 (0.56199)	Top-1 acc 67.969 (66.245)	Top-5 acc 84.766 (85.571)	lr 0.00293
Train [94][1080/3239]	Time 0.352 (0.532)	Data Time 0.001 (0.044)	Loss 2.2781 (2.3959)	Entropy 0.56153 (0.56199)	Top-1 acc 72.656 (66.250)	Top-5 acc 87.891 (85.575)	lr 0.00292
Train [94][1090/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.043)	Loss 2.5416 (2.3960)	Entropy 0.56115 (0.56199)	Top-1 acc 66.016 (66.250)	Top-5 acc 84.375 (85.572)	lr 0.00292
Train [94][1100/3239]	Time 0.229 (0.530)	Data Time 0.001 (0.043)	Loss 2.2721 (2.3959)	Entropy 0.56147 (0.56198)	Top-1 acc 67.188 (66.257)	Top-5 acc 87.891 (85.565)	lr 0.00292
Train [94][1110/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.043)	Loss 2.4897 (2.3952)	Entropy 0.56156 (0.56197)	Top-1 acc 66.406 (66.280)	Top-5 acc 84.375 (85.581)	lr 0.00292
Train [94][1120/3239]	Time 0.234 (0.529)	Data Time 0.001 (0.042)	Loss 2.4146 (2.3949)	Entropy 0.56178 (0.56197)	Top-1 acc 66.406 (66.299)	Top-5 acc 84.375 (85.582)	lr 0.00292
Train [94][1130/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.042)	Loss 2.3292 (2.3949)	Entropy 0.56170 (0.56197)	Top-1 acc 67.578 (66.304)	Top-5 acc 87.891 (85.579)	lr 0.00292
Train [94][1140/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.042)	Loss 2.5447 (2.3950)	Entropy 0.56141 (0.56197)	Top-1 acc 63.672 (66.307)	Top-5 acc 81.250 (85.571)	lr 0.00292
Train [94][1150/3239]	Time 0.338 (0.526)	Data Time 0.001 (0.041)	Loss 2.3581 (2.3953)	Entropy 0.56143 (0.56196)	Top-1 acc 63.281 (66.294)	Top-5 acc 84.375 (85.568)	lr 0.00292
Train [94][1160/3239]	Time 0.285 (0.526)	Data Time 0.002 (0.041)	Loss 2.2632 (2.3955)	Entropy 0.56124 (0.56195)	Top-1 acc 70.703 (66.290)	Top-5 acc 87.109 (85.563)	lr 0.00292
Train [94][1170/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.041)	Loss 2.4780 (2.3956)	Entropy 0.56139 (0.56195)	Top-1 acc 67.578 (66.280)	Top-5 acc 83.594 (85.561)	lr 0.00292
Train [94][1180/3239]	Time 0.280 (0.524)	Data Time 0.003 (0.040)	Loss 2.2150 (2.3961)	Entropy 0.56160 (0.56194)	Top-1 acc 72.266 (66.259)	Top-5 acc 89.062 (85.554)	lr 0.00292
Train [94][1190/3239]	Time 0.244 (0.524)	Data Time 0.001 (0.040)	Loss 2.3244 (2.3959)	Entropy 0.56154 (0.56194)	Top-1 acc 67.969 (66.263)	Top-5 acc 88.281 (85.554)	lr 0.00292
Train [94][1200/3239]	Time 0.234 (0.523)	Data Time 0.001 (0.040)	Loss 2.5042 (2.3967)	Entropy 0.56123 (0.56194)	Top-1 acc 64.453 (66.240)	Top-5 acc 80.859 (85.543)	lr 0.00292
Train [94][1210/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.039)	Loss 2.6627 (2.3966)	Entropy 0.56146 (0.56193)	Top-1 acc 63.672 (66.249)	Top-5 acc 81.641 (85.539)	lr 0.00292
Train [94][1220/3239]	Time 0.235 (0.521)	Data Time 0.001 (0.039)	Loss 2.2952 (2.3965)	Entropy 0.56138 (0.56193)	Top-1 acc 70.703 (66.261)	Top-5 acc 85.156 (85.541)	lr 0.00292
Train [94][1230/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.039)	Loss 2.3111 (2.3971)	Entropy 0.56157 (0.56192)	Top-1 acc 67.969 (66.242)	Top-5 acc 85.547 (85.528)	lr 0.00291
Train [94][1240/3239]	Time 0.343 (0.520)	Data Time 0.001 (0.038)	Loss 2.2721 (2.3968)	Entropy 0.56138 (0.56192)	Top-1 acc 70.312 (66.253)	Top-5 acc 86.328 (85.535)	lr 0.00291
Train [94][1250/3239]	Time 0.237 (0.519)	Data Time 0.001 (0.038)	Loss 2.4303 (2.3965)	Entropy 0.56129 (0.56192)	Top-1 acc 63.281 (66.263)	Top-5 acc 85.547 (85.542)	lr 0.00291
Train [94][1260/3239]	Time 0.368 (0.558)	Data Time 0.005 (0.038)	Loss 2.5299 (2.3964)	Entropy 0.56068 (0.56191)	Top-1 acc 64.844 (66.260)	Top-5 acc 82.422 (85.544)	lr 0.00291
Train [94][1270/3239]	Time 0.238 (0.558)	Data Time 0.002 (0.037)	Loss 2.4459 (2.3963)	Entropy 0.56087 (0.56190)	Top-1 acc 66.016 (66.253)	Top-5 acc 82.422 (85.544)	lr 0.00291
Train [94][1280/3239]	Time 0.251 (0.557)	Data Time 0.002 (0.037)	Loss 2.2209 (2.3963)	Entropy 0.56100 (0.56189)	Top-1 acc 71.875 (66.251)	Top-5 acc 88.281 (85.546)	lr 0.00291
Train [94][1290/3239]	Time 0.240 (0.556)	Data Time 0.002 (0.037)	Loss 2.3629 (2.3967)	Entropy 0.56105 (0.56189)	Top-1 acc 64.062 (66.245)	Top-5 acc 88.672 (85.541)	lr 0.00291
Train [94][1300/3239]	Time 0.258 (0.555)	Data Time 0.002 (0.037)	Loss 2.4114 (2.3965)	Entropy 0.56109 (0.56188)	Top-1 acc 64.062 (66.255)	Top-5 acc 86.328 (85.542)	lr 0.00291
Train [94][1310/3239]	Time 0.340 (0.555)	Data Time 0.002 (0.036)	Loss 2.4892 (2.3966)	Entropy 0.56115 (0.56187)	Top-1 acc 64.062 (66.253)	Top-5 acc 82.422 (85.534)	lr 0.00291
Train [94][1320/3239]	Time 0.230 (0.554)	Data Time 0.001 (0.036)	Loss 2.4913 (2.3963)	Entropy 0.56123 (0.56187)	Top-1 acc 64.844 (66.253)	Top-5 acc 84.375 (85.532)	lr 0.00291
Train [94][1330/3239]	Time 0.234 (0.553)	Data Time 0.001 (0.036)	Loss 2.3565 (2.3966)	Entropy 0.56084 (0.56186)	Top-1 acc 65.234 (66.245)	Top-5 acc 83.594 (85.522)	lr 0.00291
Train [94][1340/3239]	Time 0.245 (0.552)	Data Time 0.001 (0.036)	Loss 2.2858 (2.3961)	Entropy 0.56068 (0.56186)	Top-1 acc 70.703 (66.257)	Top-5 acc 87.500 (85.524)	lr 0.00291
Train [94][1350/3239]	Time 0.302 (0.552)	Data Time 0.002 (0.035)	Loss 2.4464 (2.3965)	Entropy 0.56079 (0.56185)	Top-1 acc 66.406 (66.248)	Top-5 acc 81.641 (85.511)	lr 0.00291
Train [94][1360/3239]	Time 0.236 (0.551)	Data Time 0.001 (0.035)	Loss 2.4082 (2.3966)	Entropy 0.56059 (0.56184)	Top-1 acc 63.672 (66.246)	Top-5 acc 85.547 (85.513)	lr 0.00291
Train [94][1370/3239]	Time 0.266 (0.550)	Data Time 0.001 (0.035)	Loss 2.6462 (2.3967)	Entropy 0.55995 (0.56183)	Top-1 acc 58.984 (66.241)	Top-5 acc 82.031 (85.503)	lr 0.00291
Train [94][1380/3239]	Time 0.255 (0.550)	Data Time 0.001 (0.035)	Loss 2.3264 (2.3967)	Entropy 0.56000 (0.56181)	Top-1 acc 67.969 (66.239)	Top-5 acc 84.375 (85.502)	lr 0.00290
Train [94][1390/3239]	Time 0.227 (0.549)	Data Time 0.001 (0.034)	Loss 2.5106 (2.3971)	Entropy 0.56000 (0.56180)	Top-1 acc 59.766 (66.231)	Top-5 acc 82.031 (85.497)	lr 0.00290
Train [94][1400/3239]	Time 0.355 (0.548)	Data Time 0.001 (0.034)	Loss 2.2781 (2.3967)	Entropy 0.55997 (0.56179)	Top-1 acc 70.312 (66.230)	Top-5 acc 86.719 (85.507)	lr 0.00290
Train [94][1410/3239]	Time 0.245 (0.547)	Data Time 0.001 (0.034)	Loss 2.3412 (2.3972)	Entropy 0.56022 (0.56178)	Top-1 acc 66.406 (66.218)	Top-5 acc 85.547 (85.496)	lr 0.00290
Train [94][1420/3239]	Time 0.247 (0.546)	Data Time 0.001 (0.034)	Loss 2.4495 (2.3972)	Entropy 0.55997 (0.56176)	Top-1 acc 62.109 (66.221)	Top-5 acc 82.031 (85.500)	lr 0.00290
Train [94][1430/3239]	Time 0.238 (0.546)	Data Time 0.001 (0.034)	Loss 2.3232 (2.3970)	Entropy 0.55989 (0.56175)	Top-1 acc 66.016 (66.227)	Top-5 acc 87.500 (85.504)	lr 0.00290
Train [94][1440/3239]	Time 0.240 (0.545)	Data Time 0.002 (0.033)	Loss 2.5663 (2.3970)	Entropy 0.55964 (0.56174)	Top-1 acc 61.328 (66.228)	Top-5 acc 87.109 (85.501)	lr 0.00290
Train [94][1450/3239]	Time 0.246 (0.544)	Data Time 0.001 (0.033)	Loss 2.3661 (2.3966)	Entropy 0.55983 (0.56172)	Top-1 acc 65.234 (66.239)	Top-5 acc 87.109 (85.509)	lr 0.00290
Train [94][1460/3239]	Time 0.253 (0.544)	Data Time 0.001 (0.033)	Loss 2.3774 (2.3965)	Entropy 0.56005 (0.56171)	Top-1 acc 65.234 (66.233)	Top-5 acc 85.156 (85.512)	lr 0.00290
Train [94][1470/3239]	Time 0.346 (0.543)	Data Time 0.001 (0.033)	Loss 2.3278 (2.3962)	Entropy 0.56012 (0.56170)	Top-1 acc 68.359 (66.241)	Top-5 acc 86.328 (85.520)	lr 0.00290
Train [94][1480/3239]	Time 0.247 (0.542)	Data Time 0.001 (0.032)	Loss 2.4799 (2.3964)	Entropy 0.56040 (0.56169)	Top-1 acc 61.328 (66.225)	Top-5 acc 85.938 (85.519)	lr 0.00290
Train [94][1490/3239]	Time 0.238 (0.542)	Data Time 0.001 (0.032)	Loss 2.3115 (2.3963)	Entropy 0.56034 (0.56168)	Top-1 acc 68.359 (66.228)	Top-5 acc 86.719 (85.523)	lr 0.00290
Train [94][1500/3239]	Time 0.234 (0.541)	Data Time 0.001 (0.032)	Loss 2.3847 (2.3965)	Entropy 0.56035 (0.56167)	Top-1 acc 67.188 (66.221)	Top-5 acc 85.156 (85.520)	lr 0.00290
Train [94][1510/3239]	Time 0.256 (0.540)	Data Time 0.001 (0.032)	Loss 2.3845 (2.3965)	Entropy 0.56021 (0.56166)	Top-1 acc 67.188 (66.220)	Top-5 acc 85.156 (85.518)	lr 0.00290
Train [94][1520/3239]	Time 0.255 (0.539)	Data Time 0.001 (0.032)	Loss 2.2339 (2.3962)	Entropy 0.56038 (0.56165)	Top-1 acc 67.969 (66.229)	Top-5 acc 87.891 (85.522)	lr 0.00290
Train [94][1530/3239]	Time 0.237 (0.539)	Data Time 0.001 (0.031)	Loss 2.3073 (2.3959)	Entropy 0.56010 (0.56164)	Top-1 acc 68.750 (66.236)	Top-5 acc 89.062 (85.533)	lr 0.00290
Train [94][1540/3239]	Time 0.243 (0.538)	Data Time 0.001 (0.031)	Loss 2.1392 (2.3964)	Entropy 0.55977 (0.56163)	Top-1 acc 72.656 (66.227)	Top-5 acc 89.062 (85.523)	lr 0.00289
Train [94][1550/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.031)	Loss 2.6275 (2.3964)	Entropy 0.56006 (0.56162)	Top-1 acc 56.250 (66.222)	Top-5 acc 80.859 (85.525)	lr 0.00289
Train [94][1560/3239]	Time 0.377 (0.537)	Data Time 0.001 (0.031)	Loss 2.2313 (2.3967)	Entropy 0.56019 (0.56161)	Top-1 acc 73.047 (66.224)	Top-5 acc 87.891 (85.515)	lr 0.00289
Train [94][1570/3239]	Time 0.222 (0.536)	Data Time 0.001 (0.031)	Loss 2.4512 (2.3972)	Entropy 0.56032 (0.56160)	Top-1 acc 62.500 (66.205)	Top-5 acc 84.375 (85.513)	lr 0.00289
Train [94][1580/3239]	Time 0.231 (0.535)	Data Time 0.001 (0.030)	Loss 2.4628 (2.3972)	Entropy 0.56059 (0.56160)	Top-1 acc 63.672 (66.210)	Top-5 acc 85.156 (85.516)	lr 0.00289
Train [94][1590/3239]	Time 0.225 (0.535)	Data Time 0.001 (0.030)	Loss 2.8683 (2.3976)	Entropy 0.56087 (0.56159)	Top-1 acc 57.031 (66.204)	Top-5 acc 78.516 (85.506)	lr 0.00289
Train [94][1600/3239]	Time 0.248 (0.534)	Data Time 0.020 (0.030)	Loss 2.3975 (2.3977)	Entropy 0.56116 (0.56159)	Top-1 acc 65.625 (66.203)	Top-5 acc 84.766 (85.502)	lr 0.00289
Train [94][1610/3239]	Time 0.247 (0.533)	Data Time 0.001 (0.030)	Loss 2.4642 (2.3978)	Entropy 0.56142 (0.56158)	Top-1 acc 67.578 (66.202)	Top-5 acc 83.594 (85.501)	lr 0.00289
Train [94][1620/3239]	Time 0.258 (0.533)	Data Time 0.002 (0.030)	Loss 2.4447 (2.3982)	Entropy 0.56155 (0.56158)	Top-1 acc 62.891 (66.195)	Top-5 acc 83.984 (85.497)	lr 0.00289
Train [94][1630/3239]	Time 0.348 (0.532)	Data Time 0.001 (0.030)	Loss 2.4241 (2.3982)	Entropy 0.56174 (0.56158)	Top-1 acc 63.672 (66.193)	Top-5 acc 84.375 (85.500)	lr 0.00289
Train [94][1640/3239]	Time 0.220 (0.531)	Data Time 0.001 (0.029)	Loss 2.3908 (2.3984)	Entropy 0.56212 (0.56159)	Top-1 acc 69.141 (66.193)	Top-5 acc 87.109 (85.494)	lr 0.00289
Train [94][1650/3239]	Time 0.276 (0.531)	Data Time 0.001 (0.029)	Loss 2.2489 (2.3981)	Entropy 0.56178 (0.56159)	Top-1 acc 67.969 (66.199)	Top-5 acc 88.281 (85.501)	lr 0.00289
Train [94][1660/3239]	Time 0.233 (0.531)	Data Time 0.001 (0.029)	Loss 2.8294 (2.3986)	Entropy 0.56170 (0.56159)	Top-1 acc 56.250 (66.187)	Top-5 acc 76.953 (85.493)	lr 0.00289
Train [94][1670/3239]	Time 0.245 (0.530)	Data Time 0.001 (0.029)	Loss 2.4289 (2.3987)	Entropy 0.56134 (0.56159)	Top-1 acc 64.453 (66.188)	Top-5 acc 85.156 (85.488)	lr 0.00289
Train [94][1680/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.029)	Loss 2.6132 (2.3992)	Entropy 0.56177 (0.56159)	Top-1 acc 60.156 (66.177)	Top-5 acc 81.641 (85.480)	lr 0.00289
Train [94][1690/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.029)	Loss 2.3145 (2.3991)	Entropy 0.56147 (0.56159)	Top-1 acc 67.969 (66.179)	Top-5 acc 87.109 (85.478)	lr 0.00288
Train [94][1700/3239]	Time 0.229 (0.529)	Data Time 0.001 (0.028)	Loss 2.5437 (2.3993)	Entropy 0.56153 (0.56159)	Top-1 acc 66.016 (66.178)	Top-5 acc 82.031 (85.475)	lr 0.00288
Train [94][1710/3239]	Time 0.236 (0.528)	Data Time 0.001 (0.028)	Loss 2.5991 (2.3996)	Entropy 0.56182 (0.56159)	Top-1 acc 62.500 (66.170)	Top-5 acc 82.422 (85.469)	lr 0.00288
Train [94][1720/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.028)	Loss 2.6359 (2.4004)	Entropy 0.56163 (0.56159)	Top-1 acc 58.594 (66.155)	Top-5 acc 81.250 (85.454)	lr 0.00288
Train [94][1730/3239]	Time 0.241 (0.527)	Data Time 0.001 (0.028)	Loss 2.1679 (2.4003)	Entropy 0.56167 (0.56159)	Top-1 acc 71.484 (66.156)	Top-5 acc 89.062 (85.456)	lr 0.00288
Train [94][1740/3239]	Time 0.237 (0.526)	Data Time 0.001 (0.028)	Loss 2.5249 (2.4007)	Entropy 0.56163 (0.56159)	Top-1 acc 60.547 (66.150)	Top-5 acc 82.422 (85.454)	lr 0.00288
Train [94][1750/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.028)	Loss 2.3786 (2.4006)	Entropy 0.56173 (0.56159)	Top-1 acc 65.234 (66.146)	Top-5 acc 88.281 (85.458)	lr 0.00288
Train [94][1760/3239]	Time 0.252 (0.525)	Data Time 0.001 (0.028)	Loss 2.5855 (2.4008)	Entropy 0.56191 (0.56159)	Top-1 acc 61.328 (66.141)	Top-5 acc 82.422 (85.460)	lr 0.00288
Train [94][1770/3239]	Time 0.240 (0.525)	Data Time 0.001 (0.027)	Loss 2.4152 (2.4008)	Entropy 0.56196 (0.56159)	Top-1 acc 63.281 (66.140)	Top-5 acc 86.328 (85.459)	lr 0.00288
Train [94][1780/3239]	Time 0.238 (0.524)	Data Time 0.001 (0.027)	Loss 2.2811 (2.4007)	Entropy 0.56203 (0.56159)	Top-1 acc 67.969 (66.146)	Top-5 acc 87.109 (85.460)	lr 0.00288
Train [94][1790/3239]	Time 0.360 (0.524)	Data Time 0.001 (0.027)	Loss 2.1678 (2.4007)	Entropy 0.56214 (0.56160)	Top-1 acc 68.359 (66.143)	Top-5 acc 89.062 (85.458)	lr 0.00288
Train [94][1800/3239]	Time 0.280 (0.523)	Data Time 0.001 (0.027)	Loss 2.2981 (2.4008)	Entropy 0.56204 (0.56160)	Top-1 acc 67.969 (66.147)	Top-5 acc 88.281 (85.456)	lr 0.00288
Train [94][1810/3239]	Time 0.257 (0.523)	Data Time 0.001 (0.027)	Loss 2.2951 (2.4006)	Entropy 0.56231 (0.56160)	Top-1 acc 69.531 (66.149)	Top-5 acc 87.500 (85.461)	lr 0.00288
Train [94][1820/3239]	Time 0.264 (0.523)	Data Time 0.001 (0.027)	Loss 2.4435 (2.4006)	Entropy 0.56240 (0.56161)	Top-1 acc 64.062 (66.152)	Top-5 acc 86.719 (85.465)	lr 0.00288
Train [94][1830/3239]	Time 0.347 (0.523)	Data Time 0.004 (0.027)	Loss 2.3428 (2.4006)	Entropy 0.56266 (0.56161)	Top-1 acc 66.797 (66.152)	Top-5 acc 87.109 (85.463)	lr 0.00288
Train [94][1840/3239]	Time 0.321 (0.523)	Data Time 0.001 (0.026)	Loss 2.4286 (2.4004)	Entropy 0.56270 (0.56162)	Top-1 acc 66.797 (66.155)	Top-5 acc 83.594 (85.463)	lr 0.00288
Train [94][1850/3239]	Time 0.312 (0.523)	Data Time 0.002 (0.026)	Loss 2.2703 (2.4002)	Entropy 0.56283 (0.56162)	Top-1 acc 66.016 (66.158)	Top-5 acc 87.891 (85.463)	lr 0.00287
Train [94][1860/3239]	Time 0.367 (0.523)	Data Time 0.001 (0.026)	Loss 2.2943 (2.4002)	Entropy 0.56272 (0.56163)	Top-1 acc 69.141 (66.160)	Top-5 acc 88.281 (85.465)	lr 0.00287
Train [94][1870/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.026)	Loss 2.4610 (2.4001)	Entropy 0.56309 (0.56164)	Top-1 acc 66.016 (66.162)	Top-5 acc 87.500 (85.470)	lr 0.00287
Train [94][1880/3239]	Time 0.238 (0.522)	Data Time 0.001 (0.026)	Loss 2.3708 (2.3996)	Entropy 0.56286 (0.56164)	Top-1 acc 67.578 (66.173)	Top-5 acc 87.500 (85.476)	lr 0.00287
Train [94][1890/3239]	Time 0.242 (0.521)	Data Time 0.001 (0.026)	Loss 2.4843 (2.3994)	Entropy 0.56248 (0.56165)	Top-1 acc 67.578 (66.179)	Top-5 acc 82.812 (85.475)	lr 0.00287
Train [94][1900/3239]	Time 0.242 (0.521)	Data Time 0.002 (0.026)	Loss 2.2547 (2.3996)	Entropy 0.56245 (0.56165)	Top-1 acc 68.359 (66.171)	Top-5 acc 88.281 (85.471)	lr 0.00287
Train [94][1910/3239]	Time 0.239 (0.521)	Data Time 0.001 (0.026)	Loss 2.2775 (2.3995)	Entropy 0.56242 (0.56166)	Top-1 acc 68.359 (66.177)	Top-5 acc 87.891 (85.473)	lr 0.00287
Train [94][1920/3239]	Time 0.256 (0.548)	Data Time 0.003 (0.025)	Loss 2.5611 (2.3995)	Entropy 0.56237 (0.56166)	Top-1 acc 64.062 (66.183)	Top-5 acc 82.031 (85.473)	lr 0.00287
Train [94][1930/3239]	Time 0.246 (0.548)	Data Time 0.002 (0.025)	Loss 2.3234 (2.3996)	Entropy 0.56240 (0.56167)	Top-1 acc 71.484 (66.183)	Top-5 acc 87.891 (85.473)	lr 0.00287
Train [94][1940/3239]	Time 0.248 (0.547)	Data Time 0.002 (0.025)	Loss 2.3004 (2.3997)	Entropy 0.56258 (0.56167)	Top-1 acc 66.016 (66.178)	Top-5 acc 88.672 (85.471)	lr 0.00287
Train [94][1950/3239]	Time 0.473 (0.547)	Data Time 0.002 (0.025)	Loss 2.5194 (2.4001)	Entropy 0.56225 (0.56168)	Top-1 acc 64.844 (66.169)	Top-5 acc 84.375 (85.466)	lr 0.00287
Train [94][1960/3239]	Time 0.250 (0.547)	Data Time 0.001 (0.025)	Loss 2.5586 (2.4001)	Entropy 0.56227 (0.56168)	Top-1 acc 61.719 (66.165)	Top-5 acc 81.250 (85.466)	lr 0.00287
Train [94][1970/3239]	Time 0.240 (0.547)	Data Time 0.001 (0.025)	Loss 2.1483 (2.3999)	Entropy 0.56252 (0.56168)	Top-1 acc 68.750 (66.172)	Top-5 acc 87.891 (85.469)	lr 0.00287
Train [94][1980/3239]	Time 0.243 (0.546)	Data Time 0.002 (0.025)	Loss 2.4308 (2.3996)	Entropy 0.56213 (0.56168)	Top-1 acc 65.234 (66.181)	Top-5 acc 86.328 (85.474)	lr 0.00287
Train [94][1990/3239]	Time 0.237 (0.546)	Data Time 0.001 (0.025)	Loss 2.3206 (2.3996)	Entropy 0.56250 (0.56169)	Top-1 acc 67.969 (66.177)	Top-5 acc 86.719 (85.475)	lr 0.00287
Train [94][2000/3239]	Time 0.247 (0.545)	Data Time 0.002 (0.024)	Loss 2.2807 (2.3995)	Entropy 0.56259 (0.56169)	Top-1 acc 69.922 (66.178)	Top-5 acc 85.547 (85.475)	lr 0.00286
Train [94][2010/3239]	Time 0.242 (0.545)	Data Time 0.001 (0.024)	Loss 2.4683 (2.3999)	Entropy 0.56230 (0.56170)	Top-1 acc 66.016 (66.173)	Top-5 acc 83.594 (85.467)	lr 0.00286
Train [94][2020/3239]	Time 0.364 (0.544)	Data Time 0.001 (0.024)	Loss 2.4357 (2.3999)	Entropy 0.56236 (0.56170)	Top-1 acc 67.578 (66.170)	Top-5 acc 85.938 (85.470)	lr 0.00286
Train [94][2030/3239]	Time 0.235 (0.543)	Data Time 0.001 (0.024)	Loss 2.3185 (2.3996)	Entropy 0.56236 (0.56170)	Top-1 acc 68.359 (66.174)	Top-5 acc 85.156 (85.474)	lr 0.00286
Train [94][2040/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.024)	Loss 2.2614 (2.3997)	Entropy 0.56231 (0.56170)	Top-1 acc 70.312 (66.173)	Top-5 acc 87.500 (85.473)	lr 0.00286
Train [94][2050/3239]	Time 0.252 (0.543)	Data Time 0.003 (0.024)	Loss 2.5049 (2.3997)	Entropy 0.56238 (0.56171)	Top-1 acc 65.234 (66.174)	Top-5 acc 85.547 (85.474)	lr 0.00286
Train [94][2060/3239]	Time 0.243 (0.542)	Data Time 0.002 (0.024)	Loss 2.2793 (2.3996)	Entropy 0.56239 (0.56171)	Top-1 acc 68.359 (66.175)	Top-5 acc 87.891 (85.474)	lr 0.00286
Train [94][2070/3239]	Time 0.245 (0.542)	Data Time 0.001 (0.024)	Loss 2.2276 (2.3997)	Entropy 0.56227 (0.56171)	Top-1 acc 73.047 (66.172)	Top-5 acc 89.062 (85.472)	lr 0.00286
Train [94][2080/3239]	Time 0.243 (0.541)	Data Time 0.001 (0.024)	Loss 2.4609 (2.3997)	Entropy 0.56220 (0.56172)	Top-1 acc 62.109 (66.173)	Top-5 acc 85.156 (85.472)	lr 0.00286
Train [94][2090/3239]	Time 0.251 (0.541)	Data Time 0.001 (0.023)	Loss 2.4335 (2.3996)	Entropy 0.56204 (0.56172)	Top-1 acc 64.844 (66.174)	Top-5 acc 83.594 (85.471)	lr 0.00286
Train [94][2100/3239]	Time 0.249 (0.540)	Data Time 0.001 (0.023)	Loss 2.5589 (2.3998)	Entropy 0.56190 (0.56172)	Top-1 acc 60.547 (66.165)	Top-5 acc 83.594 (85.470)	lr 0.00286
Train [94][2110/3239]	Time 0.374 (0.540)	Data Time 0.001 (0.023)	Loss 2.3012 (2.3999)	Entropy 0.56206 (0.56172)	Top-1 acc 70.703 (66.161)	Top-5 acc 85.938 (85.470)	lr 0.00286
Train [94][2120/3239]	Time 0.259 (0.539)	Data Time 0.001 (0.023)	Loss 2.2669 (2.3999)	Entropy 0.56221 (0.56172)	Top-1 acc 68.359 (66.163)	Top-5 acc 87.500 (85.469)	lr 0.00286
Train [94][2130/3239]	Time 0.251 (0.539)	Data Time 0.002 (0.023)	Loss 2.4879 (2.4000)	Entropy 0.56214 (0.56172)	Top-1 acc 65.625 (66.162)	Top-5 acc 84.375 (85.466)	lr 0.00286
Train [94][2140/3239]	Time 0.270 (0.538)	Data Time 0.001 (0.023)	Loss 2.2875 (2.4001)	Entropy 0.56191 (0.56173)	Top-1 acc 67.578 (66.155)	Top-5 acc 85.938 (85.464)	lr 0.00286
Train [94][2150/3239]	Time 0.226 (0.538)	Data Time 0.001 (0.023)	Loss 2.3599 (2.4000)	Entropy 0.56208 (0.56173)	Top-1 acc 70.312 (66.161)	Top-5 acc 83.984 (85.466)	lr 0.00286
Train [94][2160/3239]	Time 0.242 (0.537)	Data Time 0.001 (0.023)	Loss 2.3311 (2.4002)	Entropy 0.56232 (0.56173)	Top-1 acc 73.047 (66.157)	Top-5 acc 83.594 (85.461)	lr 0.00285
Train [94][2170/3239]	Time 0.248 (0.537)	Data Time 0.001 (0.023)	Loss 2.4562 (2.3998)	Entropy 0.56228 (0.56173)	Top-1 acc 64.453 (66.164)	Top-5 acc 87.500 (85.469)	lr 0.00285
Train [94][2180/3239]	Time 0.337 (0.536)	Data Time 0.001 (0.023)	Loss 2.4639 (2.4000)	Entropy 0.56209 (0.56174)	Top-1 acc 65.234 (66.163)	Top-5 acc 83.594 (85.465)	lr 0.00285
Train [94][2190/3239]	Time 0.228 (0.536)	Data Time 0.001 (0.022)	Loss 2.2994 (2.4005)	Entropy 0.56207 (0.56174)	Top-1 acc 64.453 (66.147)	Top-5 acc 88.281 (85.457)	lr 0.00285
Train [94][2200/3239]	Time 0.227 (0.535)	Data Time 0.001 (0.022)	Loss 2.4257 (2.4008)	Entropy 0.56225 (0.56174)	Top-1 acc 66.016 (66.139)	Top-5 acc 83.594 (85.457)	lr 0.00285
Train [94][2210/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.022)	Loss 2.8356 (2.4011)	Entropy 0.56201 (0.56174)	Top-1 acc 57.031 (66.129)	Top-5 acc 77.344 (85.450)	lr 0.00285
Train [94][2220/3239]	Time 0.232 (0.534)	Data Time 0.001 (0.022)	Loss 2.3289 (2.4011)	Entropy 0.56206 (0.56174)	Top-1 acc 67.969 (66.126)	Top-5 acc 87.891 (85.451)	lr 0.00285
Train [94][2230/3239]	Time 0.258 (0.534)	Data Time 0.002 (0.022)	Loss 2.3426 (2.4014)	Entropy 0.56208 (0.56174)	Top-1 acc 68.750 (66.123)	Top-5 acc 85.547 (85.446)	lr 0.00285
Train [94][2240/3239]	Time 0.234 (0.534)	Data Time 0.001 (0.022)	Loss 2.3743 (2.4014)	Entropy 0.56228 (0.56174)	Top-1 acc 66.797 (66.124)	Top-5 acc 85.547 (85.446)	lr 0.00285
Train [94][2250/3239]	Time 0.308 (0.534)	Data Time 0.002 (0.022)	Loss 2.4147 (2.4016)	Entropy 0.56234 (0.56175)	Top-1 acc 66.406 (66.124)	Top-5 acc 83.203 (85.442)	lr 0.00285
Train [94][2260/3239]	Time 0.283 (0.534)	Data Time 0.003 (0.022)	Loss 2.2934 (2.4017)	Entropy 0.56216 (0.56175)	Top-1 acc 70.312 (66.124)	Top-5 acc 90.625 (85.440)	lr 0.00285
Train [94][2270/3239]	Time 0.295 (0.533)	Data Time 0.001 (0.022)	Loss 2.2772 (2.4016)	Entropy 0.56229 (0.56175)	Top-1 acc 69.141 (66.124)	Top-5 acc 87.500 (85.439)	lr 0.00285
Train [94][2280/3239]	Time 0.240 (0.533)	Data Time 0.001 (0.022)	Loss 2.3184 (2.4017)	Entropy 0.56177 (0.56175)	Top-1 acc 69.531 (66.128)	Top-5 acc 90.234 (85.439)	lr 0.00285
Train [94][2290/3239]	Time 0.238 (0.532)	Data Time 0.001 (0.022)	Loss 2.4029 (2.4016)	Entropy 0.56188 (0.56175)	Top-1 acc 66.016 (66.130)	Top-5 acc 83.594 (85.439)	lr 0.00285
Train [94][2300/3239]	Time 0.270 (0.532)	Data Time 0.034 (0.022)	Loss 2.6000 (2.4015)	Entropy 0.56181 (0.56175)	Top-1 acc 60.938 (66.135)	Top-5 acc 82.812 (85.442)	lr 0.00285
Train [94][2310/3239]	Time 0.220 (0.531)	Data Time 0.001 (0.021)	Loss 2.3053 (2.4016)	Entropy 0.56170 (0.56175)	Top-1 acc 71.875 (66.138)	Top-5 acc 87.891 (85.440)	lr 0.00285
Train [94][2320/3239]	Time 0.306 (0.531)	Data Time 0.002 (0.021)	Loss 2.3291 (2.4014)	Entropy 0.56201 (0.56175)	Top-1 acc 67.578 (66.140)	Top-5 acc 86.328 (85.443)	lr 0.00284
Train [94][2330/3239]	Time 0.228 (0.531)	Data Time 0.001 (0.021)	Loss 2.5416 (2.4016)	Entropy 0.56196 (0.56175)	Top-1 acc 63.672 (66.131)	Top-5 acc 80.859 (85.440)	lr 0.00284
Train [94][2340/3239]	Time 0.334 (0.530)	Data Time 0.001 (0.021)	Loss 2.2665 (2.4016)	Entropy 0.56210 (0.56175)	Top-1 acc 71.094 (66.131)	Top-5 acc 86.328 (85.440)	lr 0.00284
Train [94][2350/3239]	Time 0.268 (0.530)	Data Time 0.002 (0.021)	Loss 2.5985 (2.4020)	Entropy 0.56226 (0.56176)	Top-1 acc 62.891 (66.126)	Top-5 acc 80.469 (85.428)	lr 0.00284
Train [94][2360/3239]	Time 0.233 (0.529)	Data Time 0.001 (0.021)	Loss 2.3429 (2.4018)	Entropy 0.56208 (0.56176)	Top-1 acc 67.188 (66.128)	Top-5 acc 84.375 (85.434)	lr 0.00284
Train [94][2370/3239]	Time 0.234 (0.529)	Data Time 0.001 (0.021)	Loss 2.5920 (2.4020)	Entropy 0.56205 (0.56176)	Top-1 acc 61.719 (66.128)	Top-5 acc 81.641 (85.430)	lr 0.00284
Train [94][2380/3239]	Time 0.230 (0.528)	Data Time 0.001 (0.021)	Loss 2.5471 (2.4021)	Entropy 0.56185 (0.56176)	Top-1 acc 62.109 (66.122)	Top-5 acc 81.641 (85.428)	lr 0.00284
Train [94][2390/3239]	Time 0.224 (0.528)	Data Time 0.001 (0.021)	Loss 2.3762 (2.4021)	Entropy 0.56228 (0.56176)	Top-1 acc 70.312 (66.120)	Top-5 acc 83.984 (85.428)	lr 0.00284
Train [94][2400/3239]	Time 0.236 (0.528)	Data Time 0.001 (0.021)	Loss 2.2254 (2.4023)	Entropy 0.56242 (0.56176)	Top-1 acc 67.188 (66.115)	Top-5 acc 89.453 (85.423)	lr 0.00284
Train [94][2410/3239]	Time 0.344 (0.527)	Data Time 0.001 (0.021)	Loss 2.3737 (2.4024)	Entropy 0.56268 (0.56177)	Top-1 acc 68.359 (66.109)	Top-5 acc 85.938 (85.419)	lr 0.00284
Train [94][2420/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.021)	Loss 2.3261 (2.4025)	Entropy 0.56295 (0.56177)	Top-1 acc 69.141 (66.104)	Top-5 acc 85.547 (85.418)	lr 0.00284
Train [94][2430/3239]	Time 0.239 (0.526)	Data Time 0.001 (0.020)	Loss 2.2583 (2.4023)	Entropy 0.56262 (0.56177)	Top-1 acc 68.359 (66.111)	Top-5 acc 88.672 (85.423)	lr 0.00284
Train [94][2440/3239]	Time 0.230 (0.526)	Data Time 0.001 (0.020)	Loss 2.3385 (2.4023)	Entropy 0.56250 (0.56178)	Top-1 acc 69.141 (66.111)	Top-5 acc 85.156 (85.422)	lr 0.00284
Train [94][2450/3239]	Time 0.230 (0.525)	Data Time 0.001 (0.020)	Loss 2.3751 (2.4024)	Entropy 0.56197 (0.56178)	Top-1 acc 67.969 (66.109)	Top-5 acc 86.328 (85.419)	lr 0.00284
Train [94][2460/3239]	Time 0.236 (0.525)	Data Time 0.001 (0.020)	Loss 2.3942 (2.4026)	Entropy 0.56199 (0.56178)	Top-1 acc 64.062 (66.099)	Top-5 acc 83.984 (85.415)	lr 0.00284
Train [94][2470/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.020)	Loss 2.3068 (2.4027)	Entropy 0.56226 (0.56178)	Top-1 acc 67.969 (66.091)	Top-5 acc 85.938 (85.412)	lr 0.00283
Train [94][2480/3239]	Time 0.221 (0.524)	Data Time 0.001 (0.020)	Loss 2.3491 (2.4026)	Entropy 0.56236 (0.56178)	Top-1 acc 66.797 (66.091)	Top-5 acc 85.938 (85.414)	lr 0.00283
Train [94][2490/3239]	Time 0.229 (0.524)	Data Time 0.001 (0.020)	Loss 2.3267 (2.4027)	Entropy 0.56224 (0.56179)	Top-1 acc 65.625 (66.084)	Top-5 acc 89.062 (85.414)	lr 0.00283
Train [94][2500/3239]	Time 0.339 (0.523)	Data Time 0.001 (0.020)	Loss 2.6360 (2.4028)	Entropy 0.56249 (0.56179)	Top-1 acc 58.203 (66.080)	Top-5 acc 81.250 (85.413)	lr 0.00283
Train [94][2510/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.020)	Loss 2.3877 (2.4028)	Entropy 0.56233 (0.56179)	Top-1 acc 68.359 (66.082)	Top-5 acc 85.547 (85.413)	lr 0.00283
Train [94][2520/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.020)	Loss 2.4441 (2.4030)	Entropy 0.56242 (0.56179)	Top-1 acc 61.719 (66.075)	Top-5 acc 85.547 (85.409)	lr 0.00283
Train [94][2530/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.020)	Loss 2.3471 (2.4035)	Entropy 0.56272 (0.56180)	Top-1 acc 68.359 (66.064)	Top-5 acc 85.156 (85.403)	lr 0.00283
Train [94][2540/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.020)	Loss 2.4877 (2.4037)	Entropy 0.56298 (0.56180)	Top-1 acc 61.328 (66.061)	Top-5 acc 83.984 (85.400)	lr 0.00283
Train [94][2550/3239]	Time 0.280 (0.521)	Data Time 0.001 (0.020)	Loss 2.3126 (2.4035)	Entropy 0.56303 (0.56181)	Top-1 acc 69.922 (66.068)	Top-5 acc 85.156 (85.405)	lr 0.00283
Train [94][2560/3239]	Time 0.299 (0.521)	Data Time 0.003 (0.020)	Loss 2.2778 (2.4036)	Entropy 0.56324 (0.56181)	Top-1 acc 67.578 (66.066)	Top-5 acc 90.234 (85.405)	lr 0.00283
Train [94][2570/3239]	Time 0.505 (0.542)	Data Time 0.006 (0.019)	Loss 2.2357 (2.4035)	Entropy 0.56332 (0.56182)	Top-1 acc 71.875 (66.069)	Top-5 acc 87.500 (85.408)	lr 0.00283
Train [94][2580/3239]	Time 0.251 (0.542)	Data Time 0.002 (0.019)	Loss 2.5126 (2.4033)	Entropy 0.56312 (0.56182)	Top-1 acc 62.500 (66.070)	Top-5 acc 84.375 (85.411)	lr 0.00283
Train [94][2590/3239]	Time 0.231 (0.541)	Data Time 0.002 (0.019)	Loss 2.3639 (2.4032)	Entropy 0.56313 (0.56183)	Top-1 acc 67.969 (66.072)	Top-5 acc 87.891 (85.412)	lr 0.00283
Train [94][2600/3239]	Time 0.238 (0.541)	Data Time 0.001 (0.019)	Loss 2.3607 (2.4030)	Entropy 0.56313 (0.56183)	Top-1 acc 68.359 (66.079)	Top-5 acc 85.938 (85.413)	lr 0.00283
Train [94][2610/3239]	Time 0.238 (0.540)	Data Time 0.001 (0.019)	Loss 2.3870 (2.4030)	Entropy 0.56295 (0.56184)	Top-1 acc 66.016 (66.080)	Top-5 acc 85.547 (85.411)	lr 0.00283
Train [94][2620/3239]	Time 0.234 (0.540)	Data Time 0.001 (0.019)	Loss 2.5335 (2.4033)	Entropy 0.56280 (0.56184)	Top-1 acc 63.672 (66.069)	Top-5 acc 83.984 (85.407)	lr 0.00283
Train [94][2630/3239]	Time 0.240 (0.540)	Data Time 0.001 (0.019)	Loss 2.4529 (2.4031)	Entropy 0.56299 (0.56185)	Top-1 acc 67.969 (66.073)	Top-5 acc 86.328 (85.410)	lr 0.00282
Train [94][2640/3239]	Time 0.229 (0.539)	Data Time 0.001 (0.019)	Loss 2.5235 (2.4033)	Entropy 0.56289 (0.56185)	Top-1 acc 63.281 (66.068)	Top-5 acc 82.422 (85.405)	lr 0.00282
Train [94][2650/3239]	Time 0.219 (0.539)	Data Time 0.001 (0.019)	Loss 2.3794 (2.4033)	Entropy 0.56274 (0.56185)	Top-1 acc 67.578 (66.071)	Top-5 acc 85.938 (85.407)	lr 0.00282
Train [94][2660/3239]	Time 0.439 (0.539)	Data Time 0.001 (0.019)	Loss 2.6098 (2.4035)	Entropy 0.56293 (0.56186)	Top-1 acc 60.547 (66.065)	Top-5 acc 82.812 (85.403)	lr 0.00282
Train [94][2670/3239]	Time 0.248 (0.538)	Data Time 0.001 (0.019)	Loss 2.4675 (2.4036)	Entropy 0.56259 (0.56186)	Top-1 acc 64.844 (66.062)	Top-5 acc 86.328 (85.404)	lr 0.00282
Train [94][2680/3239]	Time 0.251 (0.538)	Data Time 0.001 (0.019)	Loss 2.4177 (2.4037)	Entropy 0.56252 (0.56186)	Top-1 acc 67.188 (66.059)	Top-5 acc 85.156 (85.404)	lr 0.00282
Train [94][2690/3239]	Time 0.255 (0.538)	Data Time 0.001 (0.019)	Loss 2.3738 (2.4035)	Entropy 0.56217 (0.56187)	Top-1 acc 67.969 (66.065)	Top-5 acc 83.984 (85.407)	lr 0.00282
Train [94][2700/3239]	Time 0.221 (0.537)	Data Time 0.001 (0.019)	Loss 2.5204 (2.4035)	Entropy 0.56204 (0.56187)	Top-1 acc 62.109 (66.060)	Top-5 acc 82.812 (85.406)	lr 0.00282
Train [94][2710/3239]	Time 0.236 (0.537)	Data Time 0.001 (0.019)	Loss 2.3833 (2.4037)	Entropy 0.56213 (0.56187)	Top-1 acc 68.750 (66.059)	Top-5 acc 85.547 (85.405)	lr 0.00282
Train [94][2720/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.018)	Loss 2.3460 (2.4038)	Entropy 0.56222 (0.56187)	Top-1 acc 67.578 (66.060)	Top-5 acc 85.938 (85.400)	lr 0.00282
Train [94][2730/3239]	Time 0.351 (0.536)	Data Time 0.001 (0.018)	Loss 2.6648 (2.4038)	Entropy 0.56225 (0.56187)	Top-1 acc 60.547 (66.062)	Top-5 acc 82.031 (85.399)	lr 0.00282
Train [94][2740/3239]	Time 0.294 (0.536)	Data Time 0.001 (0.018)	Loss 2.5946 (2.4037)	Entropy 0.56205 (0.56187)	Top-1 acc 62.109 (66.061)	Top-5 acc 83.203 (85.399)	lr 0.00282
Train [94][2750/3239]	Time 0.228 (0.536)	Data Time 0.001 (0.018)	Loss 2.3347 (2.4036)	Entropy 0.56221 (0.56187)	Top-1 acc 66.016 (66.060)	Top-5 acc 87.109 (85.404)	lr 0.00282
Train [94][2760/3239]	Time 0.243 (0.535)	Data Time 0.002 (0.018)	Loss 2.4548 (2.4035)	Entropy 0.56225 (0.56187)	Top-1 acc 65.234 (66.061)	Top-5 acc 83.984 (85.404)	lr 0.00282
Train [94][2770/3239]	Time 0.238 (0.535)	Data Time 0.001 (0.018)	Loss 2.1673 (2.4034)	Entropy 0.56210 (0.56187)	Top-1 acc 74.219 (66.067)	Top-5 acc 91.016 (85.408)	lr 0.00282
Train [94][2780/3239]	Time 0.237 (0.535)	Data Time 0.001 (0.018)	Loss 2.4190 (2.4037)	Entropy 0.56233 (0.56187)	Top-1 acc 65.625 (66.060)	Top-5 acc 85.547 (85.404)	lr 0.00281
Train [94][2790/3239]	Time 0.229 (0.534)	Data Time 0.001 (0.018)	Loss 2.5678 (2.4037)	Entropy 0.56177 (0.56188)	Top-1 acc 60.938 (66.061)	Top-5 acc 83.984 (85.408)	lr 0.00281
Train [94][2800/3239]	Time 0.233 (0.534)	Data Time 0.001 (0.018)	Loss 2.4055 (2.4036)	Entropy 0.56176 (0.56188)	Top-1 acc 65.234 (66.062)	Top-5 acc 87.109 (85.410)	lr 0.00281
Train [94][2810/3239]	Time 0.246 (0.534)	Data Time 0.001 (0.018)	Loss 2.3442 (2.4036)	Entropy 0.56172 (0.56188)	Top-1 acc 62.109 (66.061)	Top-5 acc 87.891 (85.409)	lr 0.00281
Train [94][2820/3239]	Time 0.334 (0.533)	Data Time 0.001 (0.018)	Loss 2.4602 (2.4037)	Entropy 0.56168 (0.56188)	Top-1 acc 64.844 (66.061)	Top-5 acc 81.250 (85.405)	lr 0.00281
Train [94][2830/3239]	Time 0.225 (0.533)	Data Time 0.001 (0.018)	Loss 2.4210 (2.4037)	Entropy 0.56179 (0.56187)	Top-1 acc 64.453 (66.061)	Top-5 acc 86.328 (85.408)	lr 0.00281
Train [94][2840/3239]	Time 0.229 (0.533)	Data Time 0.001 (0.018)	Loss 2.2581 (2.4036)	Entropy 0.56185 (0.56187)	Top-1 acc 69.531 (66.064)	Top-5 acc 86.328 (85.407)	lr 0.00281
Train [94][2850/3239]	Time 0.248 (0.532)	Data Time 0.001 (0.018)	Loss 2.2749 (2.4035)	Entropy 0.56198 (0.56187)	Top-1 acc 70.312 (66.068)	Top-5 acc 88.672 (85.410)	lr 0.00281
Train [94][2860/3239]	Time 0.220 (0.532)	Data Time 0.001 (0.018)	Loss 2.5503 (2.4037)	Entropy 0.56191 (0.56187)	Top-1 acc 62.891 (66.064)	Top-5 acc 84.375 (85.407)	lr 0.00281
Train [94][2870/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.018)	Loss 2.3409 (2.4037)	Entropy 0.56209 (0.56188)	Top-1 acc 69.531 (66.063)	Top-5 acc 88.672 (85.407)	lr 0.00281
Train [94][2880/3239]	Time 0.221 (0.531)	Data Time 0.001 (0.018)	Loss 2.3205 (2.4039)	Entropy 0.56194 (0.56188)	Top-1 acc 69.141 (66.059)	Top-5 acc 87.891 (85.404)	lr 0.00281
Train [94][2890/3239]	Time 0.372 (0.531)	Data Time 0.002 (0.017)	Loss 2.3571 (2.4040)	Entropy 0.56185 (0.56188)	Top-1 acc 67.188 (66.058)	Top-5 acc 85.156 (85.403)	lr 0.00281
Train [94][2900/3239]	Time 0.220 (0.530)	Data Time 0.001 (0.017)	Loss 2.5390 (2.4040)	Entropy 0.56220 (0.56188)	Top-1 acc 62.109 (66.055)	Top-5 acc 82.422 (85.402)	lr 0.00281
Train [94][2910/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.017)	Loss 2.4279 (2.4038)	Entropy 0.56204 (0.56188)	Top-1 acc 65.234 (66.062)	Top-5 acc 85.156 (85.406)	lr 0.00281
Train [94][2920/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.017)	Loss 2.2897 (2.4038)	Entropy 0.56201 (0.56188)	Top-1 acc 69.531 (66.066)	Top-5 acc 85.938 (85.406)	lr 0.00281
Train [94][2930/3239]	Time 0.237 (0.529)	Data Time 0.001 (0.017)	Loss 2.5321 (2.4039)	Entropy 0.56170 (0.56188)	Top-1 acc 59.375 (66.062)	Top-5 acc 83.984 (85.403)	lr 0.00281
Train [94][2940/3239]	Time 0.226 (0.529)	Data Time 0.001 (0.017)	Loss 2.7158 (2.4041)	Entropy 0.56136 (0.56188)	Top-1 acc 60.156 (66.060)	Top-5 acc 79.688 (85.399)	lr 0.00280
Train [94][2950/3239]	Time 0.244 (0.528)	Data Time 0.001 (0.017)	Loss 2.4771 (2.4042)	Entropy 0.56105 (0.56187)	Top-1 acc 62.500 (66.056)	Top-5 acc 85.156 (85.396)	lr 0.00280
Train [94][2960/3239]	Time 0.241 (0.528)	Data Time 0.001 (0.017)	Loss 2.3959 (2.4042)	Entropy 0.56126 (0.56187)	Top-1 acc 63.672 (66.055)	Top-5 acc 83.984 (85.396)	lr 0.00280
Train [94][2970/3239]	Time 0.237 (0.528)	Data Time 0.001 (0.017)	Loss 2.3104 (2.4041)	Entropy 0.56114 (0.56187)	Top-1 acc 66.406 (66.057)	Top-5 acc 86.328 (85.398)	lr 0.00280
Train [94][2980/3239]	Time 0.267 (0.527)	Data Time 0.001 (0.017)	Loss 2.4921 (2.4039)	Entropy 0.56134 (0.56187)	Top-1 acc 66.406 (66.062)	Top-5 acc 84.375 (85.401)	lr 0.00280
Train [94][2990/3239]	Time 0.237 (0.527)	Data Time 0.001 (0.017)	Loss 2.2443 (2.4042)	Entropy 0.56141 (0.56186)	Top-1 acc 71.484 (66.059)	Top-5 acc 88.672 (85.398)	lr 0.00280
Train [94][3000/3239]	Time 0.255 (0.527)	Data Time 0.001 (0.017)	Loss 2.4190 (2.4042)	Entropy 0.56109 (0.56186)	Top-1 acc 64.453 (66.058)	Top-5 acc 84.375 (85.396)	lr 0.00280
Train [94][3010/3239]	Time 0.227 (0.526)	Data Time 0.001 (0.017)	Loss 2.4259 (2.4042)	Entropy 0.56119 (0.56186)	Top-1 acc 67.578 (66.061)	Top-5 acc 84.375 (85.395)	lr 0.00280
Train [94][3020/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.017)	Loss 2.6250 (2.4041)	Entropy 0.56112 (0.56186)	Top-1 acc 58.594 (66.064)	Top-5 acc 81.250 (85.395)	lr 0.00280
Train [94][3030/3239]	Time 0.264 (0.526)	Data Time 0.001 (0.017)	Loss 2.4333 (2.4040)	Entropy 0.56116 (0.56186)	Top-1 acc 65.625 (66.070)	Top-5 acc 85.547 (85.396)	lr 0.00280
Train [94][3040/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.017)	Loss 2.2793 (2.4038)	Entropy 0.56078 (0.56185)	Top-1 acc 75.391 (66.077)	Top-5 acc 86.328 (85.401)	lr 0.00280
Train [94][3050/3239]	Time 0.432 (0.525)	Data Time 0.002 (0.017)	Loss 2.4339 (2.4038)	Entropy 0.56068 (0.56185)	Top-1 acc 67.578 (66.077)	Top-5 acc 86.719 (85.401)	lr 0.00280
Train [94][3060/3239]	Time 0.225 (0.525)	Data Time 0.001 (0.017)	Loss 2.4317 (2.4038)	Entropy 0.56090 (0.56185)	Top-1 acc 64.844 (66.078)	Top-5 acc 85.547 (85.402)	lr 0.00280
Train [94][3070/3239]	Time 0.224 (0.525)	Data Time 0.001 (0.017)	Loss 2.3293 (2.4039)	Entropy 0.56096 (0.56184)	Top-1 acc 69.531 (66.073)	Top-5 acc 86.719 (85.398)	lr 0.00280
Train [94][3080/3239]	Time 0.225 (0.524)	Data Time 0.001 (0.017)	Loss 2.6028 (2.4041)	Entropy 0.56099 (0.56184)	Top-1 acc 61.328 (66.067)	Top-5 acc 82.422 (85.392)	lr 0.00280
Train [94][3090/3239]	Time 0.231 (0.524)	Data Time 0.001 (0.016)	Loss 2.3337 (2.4041)	Entropy 0.56136 (0.56184)	Top-1 acc 67.578 (66.072)	Top-5 acc 86.719 (85.392)	lr 0.00280
Train [94][3100/3239]	Time 0.224 (0.524)	Data Time 0.001 (0.016)	Loss 2.5797 (2.4041)	Entropy 0.56126 (0.56184)	Top-1 acc 61.719 (66.071)	Top-5 acc 82.812 (85.393)	lr 0.00279
Train [94][3110/3239]	Time 0.226 (0.523)	Data Time 0.001 (0.016)	Loss 2.4413 (2.4039)	Entropy 0.56156 (0.56183)	Top-1 acc 64.844 (66.078)	Top-5 acc 86.328 (85.397)	lr 0.00279
Train [94][3120/3239]	Time 0.345 (0.523)	Data Time 0.001 (0.016)	Loss 2.3697 (2.4039)	Entropy 0.56125 (0.56183)	Top-1 acc 64.062 (66.076)	Top-5 acc 85.547 (85.398)	lr 0.00279
Train [94][3130/3239]	Time 0.224 (0.523)	Data Time 0.001 (0.016)	Loss 2.2657 (2.4039)	Entropy 0.56118 (0.56183)	Top-1 acc 72.266 (66.076)	Top-5 acc 89.062 (85.398)	lr 0.00279
Train [94][3140/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.016)	Loss 2.5243 (2.4038)	Entropy 0.56135 (0.56183)	Top-1 acc 63.672 (66.080)	Top-5 acc 84.375 (85.401)	lr 0.00279
Train [94][3150/3239]	Time 0.270 (0.522)	Data Time 0.003 (0.016)	Loss 2.3437 (2.4037)	Entropy 0.56115 (0.56183)	Top-1 acc 69.922 (66.083)	Top-5 acc 84.375 (85.404)	lr 0.00279
Train [94][3160/3239]	Time 0.226 (0.522)	Data Time 0.001 (0.016)	Loss 2.2621 (2.4036)	Entropy 0.56093 (0.56182)	Top-1 acc 73.828 (66.086)	Top-5 acc 89.062 (85.406)	lr 0.00279
Train [94][3170/3239]	Time 0.267 (0.521)	Data Time 0.001 (0.016)	Loss 2.5343 (2.4037)	Entropy 0.56024 (0.56182)	Top-1 acc 62.109 (66.082)	Top-5 acc 82.422 (85.403)	lr 0.00279
Train [94][3180/3239]	Time 0.259 (0.521)	Data Time 0.000 (0.016)	Loss 2.3175 (2.4035)	Entropy 0.55997 (0.56182)	Top-1 acc 66.797 (66.085)	Top-5 acc 88.281 (85.406)	lr 0.00279
Train [94][3190/3239]	Time 0.227 (0.521)	Data Time 0.000 (0.016)	Loss 2.4031 (2.4036)	Entropy 0.55963 (0.56181)	Top-1 acc 66.406 (66.085)	Top-5 acc 85.547 (85.405)	lr 0.00279
Train [94][3200/3239]	Time 0.235 (0.520)	Data Time 0.000 (0.016)	Loss 2.4258 (2.4036)	Entropy 0.55960 (0.56180)	Top-1 acc 65.625 (66.086)	Top-5 acc 83.594 (85.405)	lr 0.00279
Train [94][3210/3239]	Time 0.313 (0.520)	Data Time 0.000 (0.016)	Loss 2.5716 (2.4038)	Entropy 0.55964 (0.56180)	Top-1 acc 61.328 (66.083)	Top-5 acc 82.031 (85.403)	lr 0.00279
Train [94][3220/3239]	Time 0.308 (0.520)	Data Time 0.000 (0.016)	Loss 2.3626 (2.4038)	Entropy 0.55979 (0.56179)	Top-1 acc 62.500 (66.080)	Top-5 acc 87.891 (85.402)	lr 0.00279
Train [94][3230/3239]	Time 0.276 (0.537)	Data Time 0.000 (0.016)	Loss 2.4617 (2.4038)	Entropy 0.55951 (0.56178)	Top-1 acc 64.062 (66.079)	Top-5 acc 86.328 (85.402)	lr 0.00279
Train [94][3239/3239]	Time 0.974 (0.536)	Data Time 0.000 (0.016)	Loss 2.6620 (2.4038)	Entropy 0.55955 (0.56178)	Top-1 acc 59.259 (66.080)	Top-5 acc 85.185 (85.403)	lr 0.00279
==========Valid [94/120]	loss 1.221	top-1 acc 71.920 (71.947)	top-5 acc 89.896	Train top-1 66.080	top-5 85.403	Entropy 0.55955	Latency-None: 0.000ms	Flops: 539.00M
Train [95][0/3239]	Time 38.633 (38.633)	Data Time 36.057 (36.057)	Loss 2.5103 (2.5103)	Entropy 0.55966 (0.55966)	Top-1 acc 58.594 (58.594)	Top-5 acc 85.156 (85.156)	lr 0.00279
Train [95][10/3239]	Time 0.232 (3.944)	Data Time 0.001 (3.280)	Loss 2.4034 (2.3995)	Entropy 0.55986 (0.55971)	Top-1 acc 67.188 (66.335)	Top-5 acc 86.328 (85.653)	lr 0.00279
Train [95][20/3239]	Time 0.226 (2.271)	Data Time 0.001 (1.719)	Loss 2.4146 (2.4482)	Entropy 0.55989 (0.55977)	Top-1 acc 66.406 (65.290)	Top-5 acc 85.938 (84.617)	lr 0.00278
Train [95][30/3239]	Time 0.261 (1.673)	Data Time 0.001 (1.165)	Loss 2.3988 (2.4198)	Entropy 0.56010 (0.55982)	Top-1 acc 66.797 (65.965)	Top-5 acc 84.375 (85.005)	lr 0.00278
Train [95][40/3239]	Time 0.313 (1.371)	Data Time 0.001 (0.881)	Loss 2.4545 (2.4080)	Entropy 0.55988 (0.55989)	Top-1 acc 64.844 (66.311)	Top-5 acc 83.984 (85.309)	lr 0.00278
Train [95][50/3239]	Time 0.231 (1.183)	Data Time 0.001 (0.709)	Loss 2.4146 (2.3988)	Entropy 0.56013 (0.55989)	Top-1 acc 67.969 (66.452)	Top-5 acc 85.156 (85.470)	lr 0.00278
Train [95][60/3239]	Time 0.277 (1.064)	Data Time 0.002 (0.593)	Loss 2.2158 (2.4020)	Entropy 0.55982 (0.55991)	Top-1 acc 71.094 (66.419)	Top-5 acc 89.844 (85.406)	lr 0.00278
Train [95][70/3239]	Time 0.233 (0.978)	Data Time 0.001 (0.511)	Loss 2.4768 (2.4014)	Entropy 0.55980 (0.55990)	Top-1 acc 60.938 (66.412)	Top-5 acc 83.594 (85.437)	lr 0.00278
Train [95][80/3239]	Time 0.233 (0.909)	Data Time 0.001 (0.448)	Loss 2.2975 (2.4012)	Entropy 0.55996 (0.55990)	Top-1 acc 68.359 (66.411)	Top-5 acc 87.891 (85.489)	lr 0.00278
Train [95][90/3239]	Time 0.282 (0.859)	Data Time 0.001 (0.399)	Loss 2.3480 (2.3990)	Entropy 0.56015 (0.55992)	Top-1 acc 64.844 (66.346)	Top-5 acc 86.719 (85.547)	lr 0.00278
Train [95][100/3239]	Time 0.254 (0.830)	Data Time 0.002 (0.359)	Loss 2.5519 (2.4002)	Entropy 0.56002 (0.55993)	Top-1 acc 64.062 (66.286)	Top-5 acc 80.469 (85.562)	lr 0.00278
Train [95][110/3239]	Time 0.334 (0.795)	Data Time 0.001 (0.327)	Loss 2.3648 (2.3969)	Entropy 0.55982 (0.55994)	Top-1 acc 61.719 (66.276)	Top-5 acc 87.109 (85.610)	lr 0.00278
Train [95][120/3239]	Time 0.235 (0.763)	Data Time 0.002 (0.300)	Loss 2.3092 (2.3966)	Entropy 0.56009 (0.55994)	Top-1 acc 68.750 (66.284)	Top-5 acc 84.766 (85.618)	lr 0.00278
Train [95][130/3239]	Time 0.236 (0.736)	Data Time 0.002 (0.277)	Loss 2.4026 (2.3962)	Entropy 0.56020 (0.55996)	Top-1 acc 64.062 (66.299)	Top-5 acc 85.547 (85.598)	lr 0.00278
Train [95][140/3239]	Time 0.256 (0.721)	Data Time 0.003 (0.258)	Loss 2.3765 (2.3973)	Entropy 0.56040 (0.55998)	Top-1 acc 65.234 (66.284)	Top-5 acc 86.328 (85.547)	lr 0.00278
Train [95][150/3239]	Time 0.227 (0.705)	Data Time 0.001 (0.241)	Loss 2.4688 (2.3960)	Entropy 0.56048 (0.56001)	Top-1 acc 61.719 (66.220)	Top-5 acc 82.422 (85.555)	lr 0.00278
Train [95][160/3239]	Time 0.219 (0.688)	Data Time 0.001 (0.226)	Loss 2.3407 (2.3953)	Entropy 0.56063 (0.56004)	Top-1 acc 65.234 (66.251)	Top-5 acc 87.891 (85.535)	lr 0.00278
Train [95][170/3239]	Time 0.252 (0.672)	Data Time 0.001 (0.213)	Loss 2.4098 (2.3965)	Entropy 0.56066 (0.56007)	Top-1 acc 65.234 (66.274)	Top-5 acc 84.766 (85.499)	lr 0.00277
Train [95][180/3239]	Time 0.249 (0.660)	Data Time 0.001 (0.201)	Loss 2.4903 (2.3972)	Entropy 0.56055 (0.56010)	Top-1 acc 61.719 (66.236)	Top-5 acc 84.375 (85.489)	lr 0.00277
Train [95][190/3239]	Time 0.245 (0.649)	Data Time 0.001 (0.191)	Loss 2.2947 (2.3934)	Entropy 0.56052 (0.56012)	Top-1 acc 69.531 (66.355)	Top-5 acc 86.719 (85.535)	lr 0.00277
Train [95][200/3239]	Time 0.264 (0.638)	Data Time 0.001 (0.181)	Loss 2.4951 (2.3948)	Entropy 0.56034 (0.56014)	Top-1 acc 62.500 (66.383)	Top-5 acc 85.156 (85.518)	lr 0.00277
Train [95][210/3239]	Time 0.240 (0.629)	Data Time 0.001 (0.173)	Loss 2.2663 (2.3929)	Entropy 0.56043 (0.56015)	Top-1 acc 71.094 (66.414)	Top-5 acc 87.109 (85.554)	lr 0.00277
Train [95][220/3239]	Time 0.250 (0.619)	Data Time 0.001 (0.165)	Loss 2.2900 (2.3915)	Entropy 0.56037 (0.56016)	Top-1 acc 71.484 (66.452)	Top-5 acc 87.109 (85.589)	lr 0.00277
Train [95][230/3239]	Time 0.239 (0.610)	Data Time 0.002 (0.158)	Loss 2.2662 (2.3918)	Entropy 0.56013 (0.56016)	Top-1 acc 67.188 (66.494)	Top-5 acc 88.281 (85.593)	lr 0.00277
Train [95][240/3239]	Time 0.233 (0.602)	Data Time 0.001 (0.152)	Loss 2.3588 (2.3940)	Entropy 0.55990 (0.56016)	Top-1 acc 66.406 (66.453)	Top-5 acc 85.938 (85.527)	lr 0.00277
Train [95][250/3239]	Time 0.226 (0.594)	Data Time 0.001 (0.146)	Loss 2.6657 (2.3958)	Entropy 0.55998 (0.56015)	Top-1 acc 60.156 (66.392)	Top-5 acc 80.859 (85.505)	lr 0.00277
Train [95][260/3239]	Time 0.238 (0.587)	Data Time 0.001 (0.140)	Loss 2.5478 (2.3955)	Entropy 0.55989 (0.56014)	Top-1 acc 61.719 (66.327)	Top-5 acc 83.594 (85.512)	lr 0.00277
Train [95][270/3239]	Time 0.312 (0.581)	Data Time 0.001 (0.135)	Loss 2.5271 (2.3953)	Entropy 0.55974 (0.56013)	Top-1 acc 63.281 (66.307)	Top-5 acc 84.375 (85.515)	lr 0.00277
Train [95][280/3239]	Time 0.230 (0.575)	Data Time 0.001 (0.130)	Loss 2.4211 (2.3939)	Entropy 0.55983 (0.56012)	Top-1 acc 65.625 (66.327)	Top-5 acc 84.766 (85.547)	lr 0.00277
Train [95][290/3239]	Time 0.215 (0.570)	Data Time 0.001 (0.126)	Loss 2.5713 (2.3949)	Entropy 0.55959 (0.56011)	Top-1 acc 65.234 (66.327)	Top-5 acc 83.984 (85.527)	lr 0.00277
Train [95][300/3239]	Time 0.227 (0.565)	Data Time 0.001 (0.122)	Loss 2.4217 (2.3948)	Entropy 0.55959 (0.56009)	Top-1 acc 67.188 (66.310)	Top-5 acc 84.766 (85.531)	lr 0.00277
Train [95][310/3239]	Time 0.242 (0.561)	Data Time 0.001 (0.118)	Loss 2.2085 (2.3941)	Entropy 0.55965 (0.56008)	Top-1 acc 70.703 (66.316)	Top-5 acc 88.672 (85.532)	lr 0.00277
Train [95][320/3239]	Time 0.225 (0.556)	Data Time 0.001 (0.114)	Loss 2.4577 (2.3928)	Entropy 0.55930 (0.56006)	Top-1 acc 62.109 (66.354)	Top-5 acc 85.156 (85.553)	lr 0.00277
Train [95][330/3239]	Time 0.230 (0.551)	Data Time 0.001 (0.111)	Loss 2.3691 (2.3955)	Entropy 0.55922 (0.56004)	Top-1 acc 67.969 (66.287)	Top-5 acc 88.281 (85.532)	lr 0.00276
Train [95][340/3239]	Time 0.315 (0.547)	Data Time 0.001 (0.108)	Loss 2.2599 (2.3952)	Entropy 0.55914 (0.56001)	Top-1 acc 68.359 (66.303)	Top-5 acc 87.891 (85.539)	lr 0.00276
Train [95][350/3239]	Time 0.229 (0.543)	Data Time 0.001 (0.105)	Loss 2.2017 (2.3945)	Entropy 0.55922 (0.55999)	Top-1 acc 70.312 (66.307)	Top-5 acc 87.891 (85.557)	lr 0.00276
Train [95][360/3239]	Time 0.227 (0.539)	Data Time 0.001 (0.102)	Loss 2.3155 (2.3934)	Entropy 0.55906 (0.55996)	Top-1 acc 66.406 (66.342)	Top-5 acc 86.719 (85.569)	lr 0.00276
Train [95][370/3239]	Time 0.223 (0.535)	Data Time 0.001 (0.099)	Loss 2.4038 (2.3935)	Entropy 0.55889 (0.55994)	Top-1 acc 64.844 (66.329)	Top-5 acc 84.375 (85.574)	lr 0.00276
Train [95][380/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.097)	Loss 2.3501 (2.3931)	Entropy 0.55897 (0.55991)	Top-1 acc 67.969 (66.333)	Top-5 acc 87.891 (85.590)	lr 0.00276
Train [95][390/3239]	Time 0.250 (0.529)	Data Time 0.001 (0.094)	Loss 2.4956 (2.3921)	Entropy 0.55923 (0.55989)	Top-1 acc 66.406 (66.376)	Top-5 acc 85.156 (85.599)	lr 0.00276
Train [95][400/3239]	Time 0.228 (0.526)	Data Time 0.001 (0.092)	Loss 2.3767 (2.3922)	Entropy 0.55925 (0.55987)	Top-1 acc 67.188 (66.394)	Top-5 acc 86.328 (85.589)	lr 0.00276
Train [95][410/3239]	Time 0.300 (0.526)	Data Time 0.002 (0.090)	Loss 2.4195 (2.3922)	Entropy 0.55908 (0.55986)	Top-1 acc 66.016 (66.374)	Top-5 acc 85.938 (85.610)	lr 0.00276
Train [95][420/3239]	Time 0.235 (0.525)	Data Time 0.001 (0.087)	Loss 2.5962 (2.3951)	Entropy 0.55902 (0.55984)	Top-1 acc 63.672 (66.309)	Top-5 acc 83.203 (85.557)	lr 0.00276
Train [95][430/3239]	Time 0.327 (0.522)	Data Time 0.001 (0.085)	Loss 2.2567 (2.3957)	Entropy 0.55928 (0.55982)	Top-1 acc 70.312 (66.303)	Top-5 acc 88.281 (85.539)	lr 0.00276
Train [95][440/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.084)	Loss 2.3464 (2.3955)	Entropy 0.55956 (0.55981)	Top-1 acc 67.578 (66.313)	Top-5 acc 85.938 (85.552)	lr 0.00276
Train [95][450/3239]	Time 0.232 (0.517)	Data Time 0.001 (0.082)	Loss 2.3315 (2.3953)	Entropy 0.55966 (0.55980)	Top-1 acc 67.578 (66.310)	Top-5 acc 85.547 (85.550)	lr 0.00276
Train [95][460/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.080)	Loss 2.3183 (2.3938)	Entropy 0.55962 (0.55980)	Top-1 acc 67.578 (66.346)	Top-5 acc 87.891 (85.571)	lr 0.00276
Train [95][470/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.078)	Loss 2.3340 (2.3926)	Entropy 0.55964 (0.55980)	Top-1 acc 66.016 (66.352)	Top-5 acc 83.203 (85.592)	lr 0.00276
Train [95][480/3239]	Time 0.223 (0.510)	Data Time 0.001 (0.077)	Loss 2.3374 (2.3913)	Entropy 0.55989 (0.55979)	Top-1 acc 67.969 (66.376)	Top-5 acc 86.719 (85.613)	lr 0.00276
Train [95][490/3239]	Time 0.228 (0.508)	Data Time 0.001 (0.075)	Loss 2.1029 (2.3905)	Entropy 0.55989 (0.55980)	Top-1 acc 74.609 (66.392)	Top-5 acc 90.625 (85.624)	lr 0.00275
Train [95][500/3239]	Time 0.321 (0.506)	Data Time 0.001 (0.074)	Loss 2.3962 (2.3910)	Entropy 0.55972 (0.55980)	Top-1 acc 65.625 (66.381)	Top-5 acc 86.719 (85.619)	lr 0.00275
Train [95][510/3239]	Time 0.236 (0.504)	Data Time 0.001 (0.072)	Loss 2.2553 (2.3907)	Entropy 0.55979 (0.55979)	Top-1 acc 70.312 (66.383)	Top-5 acc 86.328 (85.621)	lr 0.00275
Train [95][520/3239]	Time 0.247 (0.502)	Data Time 0.001 (0.071)	Loss 2.5028 (2.3912)	Entropy 0.56013 (0.55980)	Top-1 acc 64.062 (66.378)	Top-5 acc 81.641 (85.613)	lr 0.00275
Train [95][530/3239]	Time 0.224 (0.501)	Data Time 0.001 (0.070)	Loss 2.4743 (2.3907)	Entropy 0.55988 (0.55980)	Top-1 acc 65.234 (66.377)	Top-5 acc 83.594 (85.620)	lr 0.00275
Train [95][540/3239]	Time 0.225 (0.499)	Data Time 0.001 (0.068)	Loss 2.5454 (2.3910)	Entropy 0.55981 (0.55980)	Top-1 acc 62.109 (66.367)	Top-5 acc 83.594 (85.611)	lr 0.00275
Train [95][550/3239]	Time 0.232 (0.498)	Data Time 0.001 (0.067)	Loss 2.4046 (2.3914)	Entropy 0.55968 (0.55980)	Top-1 acc 67.188 (66.363)	Top-5 acc 85.938 (85.606)	lr 0.00275
Train [95][560/3239]	Time 0.222 (0.496)	Data Time 0.001 (0.066)	Loss 2.3949 (2.3918)	Entropy 0.55932 (0.55980)	Top-1 acc 63.281 (66.350)	Top-5 acc 83.203 (85.587)	lr 0.00275
Train [95][570/3239]	Time 0.231 (0.495)	Data Time 0.001 (0.065)	Loss 2.2722 (2.3918)	Entropy 0.55918 (0.55979)	Top-1 acc 67.188 (66.343)	Top-5 acc 89.062 (85.589)	lr 0.00275
Train [95][580/3239]	Time 0.231 (0.493)	Data Time 0.001 (0.064)	Loss 2.0887 (2.3905)	Entropy 0.55932 (0.55978)	Top-1 acc 75.391 (66.388)	Top-5 acc 91.016 (85.594)	lr 0.00275
Train [95][590/3239]	Time 0.316 (0.492)	Data Time 0.001 (0.063)	Loss 2.4891 (2.3905)	Entropy 0.55888 (0.55977)	Top-1 acc 64.453 (66.399)	Top-5 acc 82.422 (85.598)	lr 0.00275
Train [95][600/3239]	Time 0.227 (0.490)	Data Time 0.001 (0.062)	Loss 2.2253 (2.3907)	Entropy 0.55876 (0.55976)	Top-1 acc 70.312 (66.398)	Top-5 acc 87.891 (85.607)	lr 0.00275
Train [95][610/3239]	Time 0.244 (0.489)	Data Time 0.001 (0.061)	Loss 2.2560 (2.3907)	Entropy 0.55839 (0.55974)	Top-1 acc 71.875 (66.404)	Top-5 acc 87.500 (85.609)	lr 0.00275
Train [95][620/3239]	Time 0.256 (0.487)	Data Time 0.001 (0.060)	Loss 2.5035 (2.3919)	Entropy 0.55798 (0.55971)	Top-1 acc 67.188 (66.366)	Top-5 acc 84.375 (85.584)	lr 0.00275
Train [95][630/3239]	Time 0.229 (0.486)	Data Time 0.001 (0.059)	Loss 2.2918 (2.3926)	Entropy 0.55800 (0.55969)	Top-1 acc 69.922 (66.349)	Top-5 acc 86.328 (85.575)	lr 0.00275
Train [95][640/3239]	Time 0.358 (0.572)	Data Time 0.006 (0.058)	Loss 2.5661 (2.3928)	Entropy 0.55798 (0.55966)	Top-1 acc 62.891 (66.351)	Top-5 acc 81.641 (85.569)	lr 0.00275
Train [95][650/3239]	Time 0.249 (0.570)	Data Time 0.002 (0.057)	Loss 2.4080 (2.3932)	Entropy 0.55814 (0.55964)	Top-1 acc 67.188 (66.362)	Top-5 acc 88.281 (85.557)	lr 0.00274
Train [95][660/3239]	Time 0.357 (0.568)	Data Time 0.002 (0.056)	Loss 2.3153 (2.3935)	Entropy 0.55793 (0.55961)	Top-1 acc 69.141 (66.348)	Top-5 acc 86.719 (85.553)	lr 0.00274
Train [95][670/3239]	Time 0.236 (0.566)	Data Time 0.002 (0.055)	Loss 2.5156 (2.3933)	Entropy 0.55796 (0.55959)	Top-1 acc 60.156 (66.359)	Top-5 acc 83.594 (85.551)	lr 0.00274
Train [95][680/3239]	Time 0.233 (0.564)	Data Time 0.001 (0.055)	Loss 2.2854 (2.3936)	Entropy 0.55754 (0.55956)	Top-1 acc 67.969 (66.359)	Top-5 acc 89.062 (85.546)	lr 0.00274
Train [95][690/3239]	Time 0.237 (0.562)	Data Time 0.001 (0.054)	Loss 2.5198 (2.3943)	Entropy 0.55730 (0.55953)	Top-1 acc 60.156 (66.329)	Top-5 acc 85.547 (85.536)	lr 0.00274
Train [95][700/3239]	Time 0.234 (0.560)	Data Time 0.001 (0.053)	Loss 2.2323 (2.3935)	Entropy 0.55734 (0.55950)	Top-1 acc 71.094 (66.358)	Top-5 acc 85.938 (85.554)	lr 0.00274
Train [95][710/3239]	Time 0.229 (0.558)	Data Time 0.001 (0.052)	Loss 2.3112 (2.3938)	Entropy 0.55693 (0.55947)	Top-1 acc 67.188 (66.328)	Top-5 acc 87.500 (85.543)	lr 0.00274
Train [95][720/3239]	Time 0.228 (0.556)	Data Time 0.001 (0.052)	Loss 2.4209 (2.3947)	Entropy 0.55684 (0.55943)	Top-1 acc 63.281 (66.292)	Top-5 acc 84.375 (85.529)	lr 0.00274
Train [95][730/3239]	Time 0.229 (0.554)	Data Time 0.001 (0.051)	Loss 2.4686 (2.3959)	Entropy 0.55672 (0.55940)	Top-1 acc 63.672 (66.282)	Top-5 acc 85.547 (85.510)	lr 0.00274
Train [95][740/3239]	Time 0.239 (0.552)	Data Time 0.001 (0.050)	Loss 2.4212 (2.3963)	Entropy 0.55638 (0.55936)	Top-1 acc 65.625 (66.277)	Top-5 acc 84.375 (85.514)	lr 0.00274
Train [95][750/3239]	Time 0.325 (0.551)	Data Time 0.001 (0.050)	Loss 2.5386 (2.3972)	Entropy 0.55665 (0.55932)	Top-1 acc 60.547 (66.240)	Top-5 acc 85.156 (85.501)	lr 0.00274
Train [95][760/3239]	Time 0.228 (0.549)	Data Time 0.001 (0.049)	Loss 2.7231 (2.3982)	Entropy 0.55675 (0.55929)	Top-1 acc 57.812 (66.230)	Top-5 acc 81.250 (85.483)	lr 0.00274
Train [95][770/3239]	Time 0.231 (0.547)	Data Time 0.001 (0.049)	Loss 2.3701 (2.3984)	Entropy 0.55692 (0.55925)	Top-1 acc 68.359 (66.234)	Top-5 acc 86.328 (85.477)	lr 0.00274
Train [95][780/3239]	Time 0.233 (0.546)	Data Time 0.001 (0.048)	Loss 2.2153 (2.3974)	Entropy 0.55728 (0.55923)	Top-1 acc 70.703 (66.270)	Top-5 acc 88.672 (85.488)	lr 0.00274
Train [95][790/3239]	Time 0.238 (0.544)	Data Time 0.001 (0.047)	Loss 2.2303 (2.3970)	Entropy 0.55730 (0.55920)	Top-1 acc 70.312 (66.276)	Top-5 acc 90.625 (85.496)	lr 0.00274
Train [95][800/3239]	Time 0.231 (0.542)	Data Time 0.001 (0.047)	Loss 2.1262 (2.3969)	Entropy 0.55711 (0.55918)	Top-1 acc 73.828 (66.276)	Top-5 acc 90.234 (85.498)	lr 0.00274
Train [95][810/3239]	Time 0.225 (0.541)	Data Time 0.001 (0.046)	Loss 2.4090 (2.3987)	Entropy 0.55679 (0.55915)	Top-1 acc 65.234 (66.229)	Top-5 acc 83.984 (85.460)	lr 0.00273
Train [95][820/3239]	Time 0.325 (0.539)	Data Time 0.001 (0.046)	Loss 2.3664 (2.3986)	Entropy 0.55674 (0.55912)	Top-1 acc 68.750 (66.230)	Top-5 acc 83.984 (85.458)	lr 0.00273
Train [95][830/3239]	Time 0.242 (0.537)	Data Time 0.001 (0.045)	Loss 2.4407 (2.3991)	Entropy 0.55684 (0.55909)	Top-1 acc 65.625 (66.230)	Top-5 acc 83.984 (85.439)	lr 0.00273
Train [95][840/3239]	Time 0.229 (0.536)	Data Time 0.001 (0.045)	Loss 2.2810 (2.3983)	Entropy 0.55664 (0.55906)	Top-1 acc 67.969 (66.246)	Top-5 acc 87.500 (85.453)	lr 0.00273
Train [95][850/3239]	Time 0.227 (0.535)	Data Time 0.001 (0.044)	Loss 2.2743 (2.3984)	Entropy 0.55644 (0.55903)	Top-1 acc 68.359 (66.250)	Top-5 acc 89.062 (85.457)	lr 0.00273
Train [95][860/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.044)	Loss 2.5726 (2.3996)	Entropy 0.55647 (0.55900)	Top-1 acc 65.625 (66.242)	Top-5 acc 83.203 (85.431)	lr 0.00273
Train [95][870/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.043)	Loss 2.3609 (2.3999)	Entropy 0.55628 (0.55897)	Top-1 acc 69.531 (66.254)	Top-5 acc 89.453 (85.433)	lr 0.00273
Train [95][880/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.043)	Loss 2.4728 (2.4001)	Entropy 0.55641 (0.55894)	Top-1 acc 64.453 (66.254)	Top-5 acc 84.375 (85.427)	lr 0.00273
Train [95][890/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.042)	Loss 2.2901 (2.4001)	Entropy 0.55627 (0.55892)	Top-1 acc 67.188 (66.249)	Top-5 acc 85.938 (85.419)	lr 0.00273
Train [95][900/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.042)	Loss 2.5043 (2.4002)	Entropy 0.55625 (0.55889)	Top-1 acc 62.891 (66.238)	Top-5 acc 82.812 (85.412)	lr 0.00273
Train [95][910/3239]	Time 0.243 (0.527)	Data Time 0.001 (0.041)	Loss 2.3002 (2.3992)	Entropy 0.55588 (0.55886)	Top-1 acc 70.703 (66.257)	Top-5 acc 87.500 (85.430)	lr 0.00273
Train [95][920/3239]	Time 0.304 (0.527)	Data Time 0.002 (0.041)	Loss 2.3435 (2.3985)	Entropy 0.55597 (0.55882)	Top-1 acc 68.750 (66.263)	Top-5 acc 86.328 (85.438)	lr 0.00273
Train [95][930/3239]	Time 0.224 (0.527)	Data Time 0.001 (0.040)	Loss 2.4080 (2.3983)	Entropy 0.55583 (0.55879)	Top-1 acc 69.141 (66.268)	Top-5 acc 85.938 (85.450)	lr 0.00273
Train [95][940/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.040)	Loss 2.3697 (2.3989)	Entropy 0.55573 (0.55876)	Top-1 acc 68.750 (66.265)	Top-5 acc 86.719 (85.437)	lr 0.00273
Train [95][950/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.040)	Loss 2.1319 (2.3982)	Entropy 0.55540 (0.55873)	Top-1 acc 73.047 (66.285)	Top-5 acc 89.844 (85.447)	lr 0.00273
Train [95][960/3239]	Time 0.243 (0.523)	Data Time 0.001 (0.039)	Loss 2.1744 (2.3974)	Entropy 0.55574 (0.55869)	Top-1 acc 73.438 (66.308)	Top-5 acc 87.500 (85.466)	lr 0.00272
Train [95][970/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.039)	Loss 2.4420 (2.3972)	Entropy 0.55610 (0.55866)	Top-1 acc 66.016 (66.311)	Top-5 acc 84.766 (85.464)	lr 0.00272
Train [95][980/3239]	Time 0.329 (0.521)	Data Time 0.001 (0.038)	Loss 2.4064 (2.3973)	Entropy 0.55606 (0.55864)	Top-1 acc 67.969 (66.318)	Top-5 acc 87.500 (85.456)	lr 0.00272
Train [95][990/3239]	Time 0.228 (0.520)	Data Time 0.001 (0.038)	Loss 2.3493 (2.3975)	Entropy 0.55609 (0.55861)	Top-1 acc 63.281 (66.305)	Top-5 acc 86.328 (85.448)	lr 0.00272
Train [95][1000/3239]	Time 0.235 (0.519)	Data Time 0.001 (0.038)	Loss 2.5498 (2.3977)	Entropy 0.55583 (0.55859)	Top-1 acc 59.766 (66.295)	Top-5 acc 83.203 (85.449)	lr 0.00272
Train [95][1010/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.037)	Loss 2.3639 (2.3984)	Entropy 0.55602 (0.55856)	Top-1 acc 67.969 (66.269)	Top-5 acc 87.109 (85.447)	lr 0.00272
Train [95][1020/3239]	Time 0.217 (0.517)	Data Time 0.001 (0.037)	Loss 2.4022 (2.3985)	Entropy 0.55587 (0.55854)	Top-1 acc 62.109 (66.265)	Top-5 acc 86.719 (85.445)	lr 0.00272
Train [95][1030/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.037)	Loss 2.3313 (2.3985)	Entropy 0.55546 (0.55851)	Top-1 acc 68.359 (66.261)	Top-5 acc 85.156 (85.451)	lr 0.00272
Train [95][1040/3239]	Time 0.231 (0.515)	Data Time 0.001 (0.036)	Loss 2.2814 (2.3986)	Entropy 0.55556 (0.55848)	Top-1 acc 67.969 (66.251)	Top-5 acc 89.844 (85.456)	lr 0.00272
Train [95][1050/3239]	Time 0.319 (0.514)	Data Time 0.001 (0.036)	Loss 2.6373 (2.3992)	Entropy 0.55537 (0.55845)	Top-1 acc 59.766 (66.235)	Top-5 acc 81.250 (85.443)	lr 0.00272
Train [95][1060/3239]	Time 0.232 (0.513)	Data Time 0.001 (0.036)	Loss 2.3525 (2.3992)	Entropy 0.55486 (0.55842)	Top-1 acc 67.578 (66.239)	Top-5 acc 87.109 (85.450)	lr 0.00272
Train [95][1070/3239]	Time 0.283 (0.512)	Data Time 0.001 (0.035)	Loss 2.2194 (2.3992)	Entropy 0.55513 (0.55839)	Top-1 acc 66.406 (66.226)	Top-5 acc 89.844 (85.452)	lr 0.00272
Train [95][1080/3239]	Time 0.290 (0.512)	Data Time 0.001 (0.035)	Loss 2.4017 (2.3999)	Entropy 0.55532 (0.55836)	Top-1 acc 66.797 (66.207)	Top-5 acc 86.719 (85.442)	lr 0.00272
Train [95][1090/3239]	Time 0.285 (0.513)	Data Time 0.002 (0.035)	Loss 2.3744 (2.3997)	Entropy 0.55538 (0.55833)	Top-1 acc 67.969 (66.219)	Top-5 acc 85.156 (85.442)	lr 0.00272
Train [95][1100/3239]	Time 0.232 (0.512)	Data Time 0.001 (0.034)	Loss 2.4501 (2.3994)	Entropy 0.55518 (0.55830)	Top-1 acc 64.844 (66.224)	Top-5 acc 84.766 (85.453)	lr 0.00272
Train [95][1110/3239]	Time 0.228 (0.511)	Data Time 0.001 (0.034)	Loss 2.4173 (2.3997)	Entropy 0.55540 (0.55828)	Top-1 acc 63.672 (66.210)	Top-5 acc 86.328 (85.451)	lr 0.00272
Train [95][1120/3239]	Time 0.231 (0.511)	Data Time 0.001 (0.034)	Loss 2.3440 (2.3999)	Entropy 0.55534 (0.55825)	Top-1 acc 71.484 (66.212)	Top-5 acc 83.984 (85.441)	lr 0.00271
Train [95][1130/3239]	Time 0.221 (0.510)	Data Time 0.001 (0.034)	Loss 2.5469 (2.4000)	Entropy 0.55535 (0.55823)	Top-1 acc 62.109 (66.211)	Top-5 acc 81.250 (85.441)	lr 0.00271
Train [95][1140/3239]	Time 0.412 (0.509)	Data Time 0.001 (0.033)	Loss 2.2913 (2.3998)	Entropy 0.55542 (0.55820)	Top-1 acc 65.625 (66.217)	Top-5 acc 87.109 (85.449)	lr 0.00271
Train [95][1150/3239]	Time 0.223 (0.508)	Data Time 0.001 (0.033)	Loss 2.6139 (2.4006)	Entropy 0.55563 (0.55818)	Top-1 acc 61.328 (66.197)	Top-5 acc 82.812 (85.439)	lr 0.00271
Train [95][1160/3239]	Time 0.256 (0.507)	Data Time 0.001 (0.033)	Loss 2.3487 (2.3999)	Entropy 0.55566 (0.55816)	Top-1 acc 69.141 (66.211)	Top-5 acc 86.719 (85.451)	lr 0.00271
Train [95][1170/3239]	Time 0.234 (0.507)	Data Time 0.001 (0.032)	Loss 2.3339 (2.3999)	Entropy 0.55577 (0.55813)	Top-1 acc 67.188 (66.215)	Top-5 acc 87.500 (85.454)	lr 0.00271
Train [95][1180/3239]	Time 0.234 (0.506)	Data Time 0.001 (0.032)	Loss 2.4268 (2.3998)	Entropy 0.55595 (0.55811)	Top-1 acc 66.406 (66.223)	Top-5 acc 84.766 (85.454)	lr 0.00271
Train [95][1190/3239]	Time 0.230 (0.505)	Data Time 0.001 (0.032)	Loss 2.7958 (2.4004)	Entropy 0.55520 (0.55809)	Top-1 acc 57.031 (66.204)	Top-5 acc 76.562 (85.440)	lr 0.00271
Train [95][1200/3239]	Time 0.232 (0.504)	Data Time 0.001 (0.032)	Loss 2.2122 (2.4005)	Entropy 0.55505 (0.55807)	Top-1 acc 71.094 (66.204)	Top-5 acc 89.062 (85.438)	lr 0.00271
Train [95][1210/3239]	Time 0.321 (0.503)	Data Time 0.001 (0.031)	Loss 2.3830 (2.4008)	Entropy 0.55508 (0.55804)	Top-1 acc 64.062 (66.196)	Top-5 acc 87.500 (85.427)	lr 0.00271
Train [95][1220/3239]	Time 0.227 (0.502)	Data Time 0.001 (0.031)	Loss 2.5211 (2.4009)	Entropy 0.55533 (0.55802)	Top-1 acc 62.109 (66.195)	Top-5 acc 83.203 (85.422)	lr 0.00271
Train [95][1230/3239]	Time 0.238 (0.502)	Data Time 0.001 (0.031)	Loss 2.2447 (2.4009)	Entropy 0.55562 (0.55800)	Top-1 acc 71.094 (66.201)	Top-5 acc 88.281 (85.424)	lr 0.00271
Train [95][1240/3239]	Time 0.220 (0.501)	Data Time 0.001 (0.031)	Loss 2.5985 (2.4012)	Entropy 0.55559 (0.55798)	Top-1 acc 58.594 (66.195)	Top-5 acc 80.859 (85.419)	lr 0.00271
Train [95][1250/3239]	Time 0.230 (0.500)	Data Time 0.001 (0.030)	Loss 2.2635 (2.4008)	Entropy 0.55606 (0.55796)	Top-1 acc 67.578 (66.203)	Top-5 acc 87.891 (85.426)	lr 0.00271
Train [95][1260/3239]	Time 0.218 (0.499)	Data Time 0.001 (0.030)	Loss 2.2359 (2.4004)	Entropy 0.55585 (0.55795)	Top-1 acc 70.703 (66.209)	Top-5 acc 88.281 (85.433)	lr 0.00271
Train [95][1270/3239]	Time 0.250 (0.499)	Data Time 0.001 (0.030)	Loss 2.3946 (2.4005)	Entropy 0.55556 (0.55793)	Top-1 acc 67.969 (66.211)	Top-5 acc 85.938 (85.429)	lr 0.00271
Train [95][1280/3239]	Time 0.232 (0.498)	Data Time 0.001 (0.030)	Loss 2.5267 (2.4006)	Entropy 0.55546 (0.55791)	Top-1 acc 62.109 (66.217)	Top-5 acc 81.250 (85.425)	lr 0.00270
Train [95][1290/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.030)	Loss 2.3816 (2.4001)	Entropy 0.55535 (0.55789)	Top-1 acc 66.797 (66.232)	Top-5 acc 84.375 (85.430)	lr 0.00270
Train [95][1300/3239]	Time 0.497 (0.538)	Data Time 0.006 (0.029)	Loss 2.2658 (2.3997)	Entropy 0.55535 (0.55787)	Top-1 acc 69.141 (66.247)	Top-5 acc 87.891 (85.440)	lr 0.00270
Train [95][1310/3239]	Time 0.243 (0.538)	Data Time 0.002 (0.029)	Loss 2.3413 (2.3998)	Entropy 0.55550 (0.55785)	Top-1 acc 70.312 (66.245)	Top-5 acc 86.328 (85.438)	lr 0.00270
Train [95][1320/3239]	Time 0.275 (0.537)	Data Time 0.002 (0.029)	Loss 2.5942 (2.3997)	Entropy 0.55546 (0.55783)	Top-1 acc 61.719 (66.249)	Top-5 acc 81.250 (85.444)	lr 0.00270
Train [95][1330/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.029)	Loss 2.5753 (2.3996)	Entropy 0.55580 (0.55782)	Top-1 acc 61.719 (66.245)	Top-5 acc 81.641 (85.450)	lr 0.00270
Train [95][1340/3239]	Time 0.245 (0.536)	Data Time 0.001 (0.029)	Loss 2.2465 (2.3993)	Entropy 0.55573 (0.55780)	Top-1 acc 70.312 (66.253)	Top-5 acc 88.672 (85.459)	lr 0.00270
Train [95][1350/3239]	Time 0.245 (0.535)	Data Time 0.002 (0.028)	Loss 2.4248 (2.3992)	Entropy 0.55562 (0.55779)	Top-1 acc 66.406 (66.257)	Top-5 acc 86.719 (85.464)	lr 0.00270
Train [95][1360/3239]	Time 0.243 (0.535)	Data Time 0.001 (0.028)	Loss 2.1950 (2.3996)	Entropy 0.55560 (0.55777)	Top-1 acc 71.875 (66.250)	Top-5 acc 88.281 (85.454)	lr 0.00270
Train [95][1370/3239]	Time 0.371 (0.534)	Data Time 0.001 (0.028)	Loss 2.3263 (2.3996)	Entropy 0.55573 (0.55775)	Top-1 acc 62.891 (66.250)	Top-5 acc 88.281 (85.452)	lr 0.00270
Train [95][1380/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.028)	Loss 2.5105 (2.3998)	Entropy 0.55559 (0.55774)	Top-1 acc 65.625 (66.247)	Top-5 acc 85.156 (85.447)	lr 0.00270
Train [95][1390/3239]	Time 0.235 (0.533)	Data Time 0.001 (0.028)	Loss 2.3111 (2.3996)	Entropy 0.55561 (0.55772)	Top-1 acc 70.312 (66.248)	Top-5 acc 86.719 (85.449)	lr 0.00270
Train [95][1400/3239]	Time 0.241 (0.532)	Data Time 0.001 (0.027)	Loss 2.3128 (2.3992)	Entropy 0.55581 (0.55771)	Top-1 acc 70.312 (66.260)	Top-5 acc 87.500 (85.454)	lr 0.00270
Train [95][1410/3239]	Time 0.237 (0.531)	Data Time 0.001 (0.027)	Loss 2.5491 (2.3986)	Entropy 0.55553 (0.55770)	Top-1 acc 62.109 (66.274)	Top-5 acc 83.203 (85.461)	lr 0.00270
Train [95][1420/3239]	Time 0.225 (0.531)	Data Time 0.001 (0.027)	Loss 2.5356 (2.3988)	Entropy 0.55537 (0.55768)	Top-1 acc 60.547 (66.273)	Top-5 acc 83.984 (85.458)	lr 0.00270
Train [95][1430/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.027)	Loss 2.2959 (2.3989)	Entropy 0.55521 (0.55766)	Top-1 acc 67.188 (66.267)	Top-5 acc 87.500 (85.457)	lr 0.00270
Train [95][1440/3239]	Time 0.233 (0.529)	Data Time 0.001 (0.027)	Loss 2.5242 (2.3989)	Entropy 0.55498 (0.55765)	Top-1 acc 64.844 (66.270)	Top-5 acc 81.250 (85.451)	lr 0.00269
Train [95][1450/3239]	Time 0.229 (0.529)	Data Time 0.001 (0.027)	Loss 2.3911 (2.3987)	Entropy 0.55516 (0.55763)	Top-1 acc 66.016 (66.278)	Top-5 acc 87.109 (85.452)	lr 0.00269
Train [95][1460/3239]	Time 0.270 (0.528)	Data Time 0.001 (0.026)	Loss 2.3579 (2.3986)	Entropy 0.55525 (0.55761)	Top-1 acc 67.578 (66.276)	Top-5 acc 86.719 (85.456)	lr 0.00269
Train [95][1470/3239]	Time 0.230 (0.527)	Data Time 0.001 (0.026)	Loss 2.2526 (2.3985)	Entropy 0.55510 (0.55759)	Top-1 acc 67.188 (66.275)	Top-5 acc 88.672 (85.459)	lr 0.00269
Train [95][1480/3239]	Time 0.237 (0.527)	Data Time 0.001 (0.026)	Loss 2.1809 (2.3980)	Entropy 0.55495 (0.55758)	Top-1 acc 70.312 (66.279)	Top-5 acc 87.109 (85.464)	lr 0.00269
Train [95][1490/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.026)	Loss 2.4122 (2.3976)	Entropy 0.55504 (0.55756)	Top-1 acc 66.406 (66.287)	Top-5 acc 84.375 (85.467)	lr 0.00269
Train [95][1500/3239]	Time 0.245 (0.525)	Data Time 0.001 (0.026)	Loss 2.1845 (2.3970)	Entropy 0.55513 (0.55754)	Top-1 acc 68.359 (66.304)	Top-5 acc 89.844 (85.475)	lr 0.00269
Train [95][1510/3239]	Time 0.252 (0.525)	Data Time 0.001 (0.026)	Loss 2.3834 (2.3970)	Entropy 0.55562 (0.55753)	Top-1 acc 65.234 (66.307)	Top-5 acc 84.766 (85.472)	lr 0.00269
Train [95][1520/3239]	Time 0.290 (0.525)	Data Time 0.002 (0.025)	Loss 2.4849 (2.3969)	Entropy 0.55572 (0.55752)	Top-1 acc 62.109 (66.314)	Top-5 acc 85.547 (85.475)	lr 0.00269
Train [95][1530/3239]	Time 0.352 (0.525)	Data Time 0.001 (0.025)	Loss 2.5183 (2.3970)	Entropy 0.55580 (0.55750)	Top-1 acc 65.625 (66.315)	Top-5 acc 80.859 (85.470)	lr 0.00269
Train [95][1540/3239]	Time 0.244 (0.524)	Data Time 0.001 (0.025)	Loss 2.3535 (2.3974)	Entropy 0.55587 (0.55749)	Top-1 acc 67.578 (66.313)	Top-5 acc 85.156 (85.466)	lr 0.00269
Train [95][1550/3239]	Time 0.250 (0.523)	Data Time 0.002 (0.025)	Loss 2.5907 (2.3976)	Entropy 0.55558 (0.55748)	Top-1 acc 57.031 (66.301)	Top-5 acc 81.250 (85.464)	lr 0.00269
Train [95][1560/3239]	Time 0.232 (0.523)	Data Time 0.001 (0.025)	Loss 2.4288 (2.3978)	Entropy 0.55533 (0.55747)	Top-1 acc 65.234 (66.296)	Top-5 acc 85.547 (85.462)	lr 0.00269
Train [95][1570/3239]	Time 0.225 (0.522)	Data Time 0.001 (0.025)	Loss 2.6343 (2.3979)	Entropy 0.55533 (0.55746)	Top-1 acc 61.328 (66.295)	Top-5 acc 79.297 (85.456)	lr 0.00269
Train [95][1580/3239]	Time 0.256 (0.522)	Data Time 0.001 (0.024)	Loss 2.4690 (2.3979)	Entropy 0.55523 (0.55744)	Top-1 acc 65.625 (66.284)	Top-5 acc 86.719 (85.459)	lr 0.00269
Train [95][1590/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.024)	Loss 2.2746 (2.3974)	Entropy 0.55546 (0.55743)	Top-1 acc 68.750 (66.294)	Top-5 acc 83.984 (85.464)	lr 0.00269
Train [95][1600/3239]	Time 0.340 (0.520)	Data Time 0.001 (0.024)	Loss 2.2982 (2.3976)	Entropy 0.55524 (0.55742)	Top-1 acc 66.406 (66.283)	Top-5 acc 87.500 (85.460)	lr 0.00268
Train [95][1610/3239]	Time 0.228 (0.520)	Data Time 0.001 (0.024)	Loss 2.4813 (2.3981)	Entropy 0.55512 (0.55740)	Top-1 acc 69.922 (66.276)	Top-5 acc 85.156 (85.454)	lr 0.00268
Train [95][1620/3239]	Time 0.229 (0.519)	Data Time 0.001 (0.024)	Loss 2.2928 (2.3981)	Entropy 0.55513 (0.55739)	Top-1 acc 66.797 (66.276)	Top-5 acc 88.672 (85.455)	lr 0.00268
Train [95][1630/3239]	Time 0.228 (0.519)	Data Time 0.001 (0.024)	Loss 2.4786 (2.3982)	Entropy 0.55501 (0.55737)	Top-1 acc 60.156 (66.266)	Top-5 acc 82.812 (85.453)	lr 0.00268
Train [95][1640/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.024)	Loss 2.3726 (2.3982)	Entropy 0.55514 (0.55736)	Top-1 acc 69.922 (66.262)	Top-5 acc 83.203 (85.452)	lr 0.00268
Train [95][1650/3239]	Time 0.226 (0.517)	Data Time 0.001 (0.024)	Loss 2.1634 (2.3982)	Entropy 0.55527 (0.55735)	Top-1 acc 69.922 (66.261)	Top-5 acc 87.891 (85.452)	lr 0.00268
Train [95][1660/3239]	Time 0.244 (0.517)	Data Time 0.002 (0.023)	Loss 2.1881 (2.3978)	Entropy 0.55538 (0.55733)	Top-1 acc 70.312 (66.271)	Top-5 acc 89.844 (85.458)	lr 0.00268
Train [95][1670/3239]	Time 0.221 (0.516)	Data Time 0.001 (0.023)	Loss 2.2542 (2.3978)	Entropy 0.55549 (0.55732)	Top-1 acc 71.875 (66.272)	Top-5 acc 87.500 (85.461)	lr 0.00268
Train [95][1680/3239]	Time 0.238 (0.515)	Data Time 0.001 (0.023)	Loss 2.2374 (2.3979)	Entropy 0.55566 (0.55731)	Top-1 acc 67.578 (66.270)	Top-5 acc 87.500 (85.461)	lr 0.00268
Train [95][1690/3239]	Time 0.342 (0.515)	Data Time 0.001 (0.023)	Loss 2.4445 (2.3982)	Entropy 0.55555 (0.55730)	Top-1 acc 66.406 (66.259)	Top-5 acc 86.719 (85.457)	lr 0.00268
Train [95][1700/3239]	Time 0.233 (0.514)	Data Time 0.001 (0.023)	Loss 2.3156 (2.3979)	Entropy 0.55561 (0.55729)	Top-1 acc 68.750 (66.260)	Top-5 acc 86.328 (85.464)	lr 0.00268
Train [95][1710/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.023)	Loss 2.2929 (2.3979)	Entropy 0.55576 (0.55728)	Top-1 acc 69.531 (66.260)	Top-5 acc 88.672 (85.468)	lr 0.00268
Train [95][1720/3239]	Time 0.224 (0.513)	Data Time 0.001 (0.023)	Loss 2.6339 (2.3980)	Entropy 0.55563 (0.55727)	Top-1 acc 57.031 (66.254)	Top-5 acc 81.641 (85.464)	lr 0.00268
Train [95][1730/3239]	Time 0.250 (0.512)	Data Time 0.001 (0.023)	Loss 2.5519 (2.3987)	Entropy 0.55572 (0.55726)	Top-1 acc 57.422 (66.232)	Top-5 acc 83.984 (85.451)	lr 0.00268
Train [95][1740/3239]	Time 0.222 (0.512)	Data Time 0.001 (0.022)	Loss 2.5424 (2.3984)	Entropy 0.55565 (0.55725)	Top-1 acc 62.891 (66.239)	Top-5 acc 80.859 (85.456)	lr 0.00268
Train [95][1750/3239]	Time 0.230 (0.511)	Data Time 0.001 (0.022)	Loss 2.5558 (2.3987)	Entropy 0.55554 (0.55725)	Top-1 acc 60.938 (66.233)	Top-5 acc 85.547 (85.454)	lr 0.00268
Train [95][1760/3239]	Time 0.319 (0.511)	Data Time 0.001 (0.022)	Loss 2.3784 (2.3988)	Entropy 0.55556 (0.55724)	Top-1 acc 67.969 (66.227)	Top-5 acc 84.375 (85.455)	lr 0.00267
Train [95][1770/3239]	Time 0.229 (0.510)	Data Time 0.001 (0.022)	Loss 2.4763 (2.3985)	Entropy 0.55570 (0.55723)	Top-1 acc 63.672 (66.232)	Top-5 acc 83.203 (85.458)	lr 0.00267
Train [95][1780/3239]	Time 0.220 (0.509)	Data Time 0.001 (0.022)	Loss 2.2028 (2.3982)	Entropy 0.55553 (0.55722)	Top-1 acc 71.875 (66.240)	Top-5 acc 87.500 (85.464)	lr 0.00267
Train [95][1790/3239]	Time 0.248 (0.509)	Data Time 0.001 (0.022)	Loss 2.2501 (2.3980)	Entropy 0.55559 (0.55721)	Top-1 acc 69.531 (66.245)	Top-5 acc 89.062 (85.466)	lr 0.00267
Train [95][1800/3239]	Time 0.230 (0.508)	Data Time 0.001 (0.022)	Loss 2.3606 (2.3982)	Entropy 0.55520 (0.55720)	Top-1 acc 67.188 (66.240)	Top-5 acc 85.156 (85.462)	lr 0.00267
Train [95][1810/3239]	Time 0.236 (0.508)	Data Time 0.001 (0.022)	Loss 2.2477 (2.3978)	Entropy 0.55536 (0.55719)	Top-1 acc 69.141 (66.250)	Top-5 acc 88.672 (85.468)	lr 0.00267
Train [95][1820/3239]	Time 0.225 (0.507)	Data Time 0.001 (0.021)	Loss 2.3617 (2.3979)	Entropy 0.55545 (0.55718)	Top-1 acc 69.922 (66.256)	Top-5 acc 84.375 (85.464)	lr 0.00267
Train [95][1830/3239]	Time 0.294 (0.507)	Data Time 0.001 (0.021)	Loss 2.3659 (2.3977)	Entropy 0.55529 (0.55717)	Top-1 acc 68.359 (66.262)	Top-5 acc 85.547 (85.469)	lr 0.00267
Train [95][1840/3239]	Time 0.249 (0.507)	Data Time 0.001 (0.021)	Loss 2.3254 (2.3979)	Entropy 0.55524 (0.55716)	Top-1 acc 66.797 (66.262)	Top-5 acc 85.547 (85.459)	lr 0.00267
Train [95][1850/3239]	Time 0.366 (0.506)	Data Time 0.001 (0.021)	Loss 2.3553 (2.3982)	Entropy 0.55534 (0.55715)	Top-1 acc 64.062 (66.252)	Top-5 acc 88.672 (85.451)	lr 0.00267
Train [95][1860/3239]	Time 0.228 (0.506)	Data Time 0.001 (0.021)	Loss 2.3429 (2.3982)	Entropy 0.55506 (0.55714)	Top-1 acc 68.359 (66.251)	Top-5 acc 87.109 (85.454)	lr 0.00267
Train [95][1870/3239]	Time 0.216 (0.506)	Data Time 0.001 (0.021)	Loss 2.3647 (2.3982)	Entropy 0.55506 (0.55713)	Top-1 acc 69.141 (66.247)	Top-5 acc 85.156 (85.454)	lr 0.00267
Train [95][1880/3239]	Time 0.236 (0.505)	Data Time 0.001 (0.021)	Loss 2.5507 (2.3984)	Entropy 0.55493 (0.55712)	Top-1 acc 59.375 (66.242)	Top-5 acc 81.641 (85.449)	lr 0.00267
Train [95][1890/3239]	Time 0.223 (0.505)	Data Time 0.001 (0.021)	Loss 2.5191 (2.3983)	Entropy 0.55523 (0.55711)	Top-1 acc 63.281 (66.245)	Top-5 acc 83.594 (85.452)	lr 0.00267
Train [95][1900/3239]	Time 0.234 (0.504)	Data Time 0.001 (0.021)	Loss 2.4475 (2.3983)	Entropy 0.55506 (0.55710)	Top-1 acc 65.234 (66.246)	Top-5 acc 85.156 (85.452)	lr 0.00267
Train [95][1910/3239]	Time 0.228 (0.504)	Data Time 0.001 (0.021)	Loss 2.4878 (2.3982)	Entropy 0.55472 (0.55708)	Top-1 acc 66.016 (66.251)	Top-5 acc 82.812 (85.453)	lr 0.00267
Train [95][1920/3239]	Time 0.333 (0.503)	Data Time 0.002 (0.020)	Loss 2.4123 (2.3983)	Entropy 0.55501 (0.55707)	Top-1 acc 67.188 (66.249)	Top-5 acc 86.719 (85.452)	lr 0.00266
Train [95][1930/3239]	Time 0.227 (0.503)	Data Time 0.001 (0.020)	Loss 2.3338 (2.3981)	Entropy 0.55487 (0.55706)	Top-1 acc 69.141 (66.256)	Top-5 acc 86.719 (85.452)	lr 0.00266
Train [95][1940/3239]	Time 0.233 (0.503)	Data Time 0.001 (0.020)	Loss 2.2978 (2.3977)	Entropy 0.55464 (0.55705)	Top-1 acc 67.578 (66.266)	Top-5 acc 85.938 (85.457)	lr 0.00266
Train [95][1950/3239]	Time 0.368 (0.529)	Data Time 0.004 (0.020)	Loss 2.2785 (2.3975)	Entropy 0.55463 (0.55704)	Top-1 acc 67.578 (66.271)	Top-5 acc 86.719 (85.464)	lr 0.00266
Train [95][1960/3239]	Time 0.235 (0.529)	Data Time 0.002 (0.020)	Loss 2.5727 (2.3976)	Entropy 0.55425 (0.55702)	Top-1 acc 63.281 (66.269)	Top-5 acc 82.422 (85.462)	lr 0.00266
Train [95][1970/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.020)	Loss 2.3913 (2.3975)	Entropy 0.55450 (0.55701)	Top-1 acc 62.891 (66.270)	Top-5 acc 85.156 (85.460)	lr 0.00266
Train [95][1980/3239]	Time 0.258 (0.528)	Data Time 0.001 (0.020)	Loss 2.4044 (2.3977)	Entropy 0.55470 (0.55700)	Top-1 acc 64.844 (66.263)	Top-5 acc 85.547 (85.458)	lr 0.00266
Train [95][1990/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.020)	Loss 2.3817 (2.3981)	Entropy 0.55471 (0.55699)	Top-1 acc 66.797 (66.254)	Top-5 acc 87.891 (85.453)	lr 0.00266
Train [95][2000/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.020)	Loss 2.2783 (2.3978)	Entropy 0.55488 (0.55698)	Top-1 acc 70.703 (66.267)	Top-5 acc 88.281 (85.457)	lr 0.00266
Train [95][2010/3239]	Time 0.333 (0.527)	Data Time 0.001 (0.020)	Loss 2.3555 (2.3977)	Entropy 0.55498 (0.55697)	Top-1 acc 68.750 (66.266)	Top-5 acc 87.891 (85.458)	lr 0.00266
Train [95][2020/3239]	Time 0.292 (0.526)	Data Time 0.002 (0.020)	Loss 2.2846 (2.3977)	Entropy 0.55493 (0.55696)	Top-1 acc 68.750 (66.271)	Top-5 acc 87.891 (85.459)	lr 0.00266
Train [95][2030/3239]	Time 0.262 (0.526)	Data Time 0.001 (0.019)	Loss 2.4831 (2.3976)	Entropy 0.55446 (0.55694)	Top-1 acc 66.016 (66.273)	Top-5 acc 86.719 (85.462)	lr 0.00266
Train [95][2040/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.019)	Loss 2.3835 (2.3972)	Entropy 0.55482 (0.55693)	Top-1 acc 68.750 (66.287)	Top-5 acc 85.156 (85.472)	lr 0.00266
Train [95][2050/3239]	Time 0.229 (0.525)	Data Time 0.001 (0.019)	Loss 2.5333 (2.3975)	Entropy 0.55482 (0.55692)	Top-1 acc 64.062 (66.286)	Top-5 acc 82.812 (85.467)	lr 0.00266
Train [95][2060/3239]	Time 0.245 (0.525)	Data Time 0.001 (0.019)	Loss 2.2778 (2.3973)	Entropy 0.55424 (0.55691)	Top-1 acc 64.844 (66.286)	Top-5 acc 89.453 (85.470)	lr 0.00266
Train [95][2070/3239]	Time 0.238 (0.524)	Data Time 0.001 (0.019)	Loss 2.4003 (2.3971)	Entropy 0.55437 (0.55690)	Top-1 acc 65.234 (66.294)	Top-5 acc 84.375 (85.476)	lr 0.00266
Train [95][2080/3239]	Time 0.344 (0.524)	Data Time 0.001 (0.019)	Loss 2.1196 (2.3968)	Entropy 0.55464 (0.55689)	Top-1 acc 71.094 (66.303)	Top-5 acc 89.453 (85.478)	lr 0.00265
Train [95][2090/3239]	Time 0.284 (0.524)	Data Time 0.002 (0.019)	Loss 2.1497 (2.3969)	Entropy 0.55466 (0.55688)	Top-1 acc 71.094 (66.294)	Top-5 acc 88.281 (85.473)	lr 0.00265
Train [95][2100/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.019)	Loss 2.3804 (2.3967)	Entropy 0.55442 (0.55687)	Top-1 acc 66.797 (66.300)	Top-5 acc 84.766 (85.480)	lr 0.00265
Train [95][2110/3239]	Time 0.238 (0.523)	Data Time 0.001 (0.019)	Loss 2.3887 (2.3968)	Entropy 0.55422 (0.55685)	Top-1 acc 66.016 (66.299)	Top-5 acc 86.328 (85.479)	lr 0.00265
Train [95][2120/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.019)	Loss 2.3127 (2.3965)	Entropy 0.55405 (0.55684)	Top-1 acc 67.578 (66.303)	Top-5 acc 86.719 (85.484)	lr 0.00265
Train [95][2130/3239]	Time 0.221 (0.522)	Data Time 0.001 (0.019)	Loss 2.1790 (2.3962)	Entropy 0.55403 (0.55683)	Top-1 acc 71.875 (66.315)	Top-5 acc 89.844 (85.486)	lr 0.00265
Train [95][2140/3239]	Time 0.236 (0.522)	Data Time 0.001 (0.019)	Loss 2.3412 (2.3962)	Entropy 0.55422 (0.55682)	Top-1 acc 66.016 (66.314)	Top-5 acc 86.328 (85.489)	lr 0.00265
Train [95][2150/3239]	Time 0.235 (0.521)	Data Time 0.001 (0.018)	Loss 2.4407 (2.3963)	Entropy 0.55424 (0.55680)	Top-1 acc 63.281 (66.309)	Top-5 acc 84.766 (85.487)	lr 0.00265
Train [95][2160/3239]	Time 0.224 (0.521)	Data Time 0.001 (0.018)	Loss 2.4783 (2.3963)	Entropy 0.55418 (0.55679)	Top-1 acc 64.844 (66.310)	Top-5 acc 82.812 (85.488)	lr 0.00265
Train [95][2170/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.018)	Loss 2.2684 (2.3962)	Entropy 0.55407 (0.55678)	Top-1 acc 66.797 (66.308)	Top-5 acc 88.281 (85.489)	lr 0.00265
Train [95][2180/3239]	Time 0.227 (0.520)	Data Time 0.001 (0.018)	Loss 2.4684 (2.3963)	Entropy 0.55429 (0.55677)	Top-1 acc 64.453 (66.305)	Top-5 acc 83.594 (85.486)	lr 0.00265
Train [95][2190/3239]	Time 0.239 (0.519)	Data Time 0.001 (0.018)	Loss 2.3668 (2.3964)	Entropy 0.55436 (0.55676)	Top-1 acc 64.453 (66.301)	Top-5 acc 84.766 (85.482)	lr 0.00265
Train [95][2200/3239]	Time 0.244 (0.519)	Data Time 0.001 (0.018)	Loss 2.4114 (2.3964)	Entropy 0.55440 (0.55675)	Top-1 acc 66.797 (66.300)	Top-5 acc 84.766 (85.482)	lr 0.00265
Train [95][2210/3239]	Time 0.238 (0.518)	Data Time 0.001 (0.018)	Loss 2.2731 (2.3962)	Entropy 0.55446 (0.55673)	Top-1 acc 67.578 (66.307)	Top-5 acc 86.328 (85.484)	lr 0.00265
Train [95][2220/3239]	Time 0.239 (0.518)	Data Time 0.001 (0.018)	Loss 2.3728 (2.3959)	Entropy 0.55438 (0.55672)	Top-1 acc 69.922 (66.315)	Top-5 acc 85.938 (85.490)	lr 0.00265
Train [95][2230/3239]	Time 0.224 (0.517)	Data Time 0.001 (0.018)	Loss 2.4828 (2.3962)	Entropy 0.55441 (0.55671)	Top-1 acc 61.328 (66.309)	Top-5 acc 82.812 (85.484)	lr 0.00265
Train [95][2240/3239]	Time 0.323 (0.517)	Data Time 0.001 (0.018)	Loss 2.5784 (2.3964)	Entropy 0.55440 (0.55670)	Top-1 acc 64.844 (66.305)	Top-5 acc 83.203 (85.485)	lr 0.00264
Train [95][2250/3239]	Time 0.218 (0.517)	Data Time 0.001 (0.018)	Loss 2.4669 (2.3965)	Entropy 0.55451 (0.55669)	Top-1 acc 67.969 (66.307)	Top-5 acc 83.203 (85.483)	lr 0.00264
Train [95][2260/3239]	Time 0.218 (0.516)	Data Time 0.001 (0.018)	Loss 2.4337 (2.3965)	Entropy 0.55438 (0.55668)	Top-1 acc 63.281 (66.301)	Top-5 acc 82.422 (85.483)	lr 0.00264
Train [95][2270/3239]	Time 0.221 (0.516)	Data Time 0.001 (0.018)	Loss 2.6162 (2.3966)	Entropy 0.55453 (0.55667)	Top-1 acc 58.984 (66.297)	Top-5 acc 80.469 (85.479)	lr 0.00264
Train [95][2280/3239]	Time 0.223 (0.515)	Data Time 0.001 (0.017)	Loss 2.4639 (2.3967)	Entropy 0.55466 (0.55667)	Top-1 acc 63.281 (66.297)	Top-5 acc 83.203 (85.472)	lr 0.00264
Train [95][2290/3239]	Time 0.228 (0.515)	Data Time 0.001 (0.017)	Loss 2.4693 (2.3966)	Entropy 0.55491 (0.55666)	Top-1 acc 62.500 (66.303)	Top-5 acc 84.375 (85.476)	lr 0.00264
Train [95][2300/3239]	Time 0.218 (0.514)	Data Time 0.001 (0.017)	Loss 2.2408 (2.3966)	Entropy 0.55450 (0.55665)	Top-1 acc 66.016 (66.304)	Top-5 acc 91.016 (85.475)	lr 0.00264
Train [95][2310/3239]	Time 0.333 (0.514)	Data Time 0.001 (0.017)	Loss 2.6113 (2.3966)	Entropy 0.55479 (0.55664)	Top-1 acc 61.719 (66.303)	Top-5 acc 79.688 (85.475)	lr 0.00264
Train [95][2320/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.017)	Loss 2.3978 (2.3968)	Entropy 0.55490 (0.55663)	Top-1 acc 65.625 (66.297)	Top-5 acc 84.766 (85.473)	lr 0.00264
Train [95][2330/3239]	Time 0.291 (0.513)	Data Time 0.001 (0.017)	Loss 2.3120 (2.3970)	Entropy 0.55521 (0.55663)	Top-1 acc 68.359 (66.291)	Top-5 acc 89.844 (85.471)	lr 0.00264
Train [95][2340/3239]	Time 0.282 (0.513)	Data Time 0.002 (0.017)	Loss 2.5962 (2.3972)	Entropy 0.55475 (0.55662)	Top-1 acc 62.500 (66.285)	Top-5 acc 82.422 (85.467)	lr 0.00264
Train [95][2350/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.017)	Loss 2.4078 (2.3974)	Entropy 0.55499 (0.55661)	Top-1 acc 64.844 (66.279)	Top-5 acc 83.594 (85.461)	lr 0.00264
Train [95][2360/3239]	Time 0.227 (0.513)	Data Time 0.001 (0.017)	Loss 2.3455 (2.3974)	Entropy 0.55472 (0.55660)	Top-1 acc 68.359 (66.282)	Top-5 acc 87.500 (85.462)	lr 0.00264
Train [95][2370/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.017)	Loss 2.5504 (2.3976)	Entropy 0.55462 (0.55660)	Top-1 acc 64.453 (66.278)	Top-5 acc 82.031 (85.458)	lr 0.00264
Train [95][2380/3239]	Time 0.234 (0.512)	Data Time 0.001 (0.017)	Loss 2.4753 (2.3976)	Entropy 0.55443 (0.55659)	Top-1 acc 62.891 (66.277)	Top-5 acc 82.812 (85.460)	lr 0.00264
Train [95][2390/3239]	Time 0.230 (0.511)	Data Time 0.001 (0.017)	Loss 2.3928 (2.3975)	Entropy 0.55453 (0.55658)	Top-1 acc 70.703 (66.280)	Top-5 acc 85.938 (85.461)	lr 0.00264
Train [95][2400/3239]	Time 0.322 (0.511)	Data Time 0.001 (0.017)	Loss 2.3680 (2.3976)	Entropy 0.55456 (0.55657)	Top-1 acc 63.672 (66.274)	Top-5 acc 85.547 (85.459)	lr 0.00263
Train [95][2410/3239]	Time 0.232 (0.510)	Data Time 0.001 (0.017)	Loss 2.5335 (2.3976)	Entropy 0.55462 (0.55656)	Top-1 acc 63.281 (66.275)	Top-5 acc 83.984 (85.459)	lr 0.00263
Train [95][2420/3239]	Time 0.222 (0.510)	Data Time 0.001 (0.017)	Loss 2.5726 (2.3977)	Entropy 0.55448 (0.55655)	Top-1 acc 60.156 (66.266)	Top-5 acc 81.641 (85.455)	lr 0.00263
Train [95][2430/3239]	Time 0.233 (0.510)	Data Time 0.001 (0.016)	Loss 2.3786 (2.3983)	Entropy 0.55458 (0.55654)	Top-1 acc 66.016 (66.254)	Top-5 acc 85.938 (85.442)	lr 0.00263
Train [95][2440/3239]	Time 0.222 (0.509)	Data Time 0.001 (0.016)	Loss 2.4095 (2.3983)	Entropy 0.55465 (0.55654)	Top-1 acc 66.016 (66.257)	Top-5 acc 84.375 (85.442)	lr 0.00263
Train [95][2450/3239]	Time 0.226 (0.509)	Data Time 0.001 (0.016)	Loss 2.3151 (2.3982)	Entropy 0.55436 (0.55653)	Top-1 acc 67.969 (66.262)	Top-5 acc 87.109 (85.443)	lr 0.00263
Train [95][2460/3239]	Time 0.226 (0.508)	Data Time 0.001 (0.016)	Loss 2.4628 (2.3981)	Entropy 0.55419 (0.55652)	Top-1 acc 64.844 (66.265)	Top-5 acc 86.719 (85.444)	lr 0.00263
Train [95][2470/3239]	Time 0.390 (0.508)	Data Time 0.001 (0.016)	Loss 2.2941 (2.3982)	Entropy 0.55431 (0.55651)	Top-1 acc 67.188 (66.262)	Top-5 acc 84.766 (85.442)	lr 0.00263
Train [95][2480/3239]	Time 0.283 (0.508)	Data Time 0.001 (0.016)	Loss 2.3199 (2.3982)	Entropy 0.55445 (0.55650)	Top-1 acc 66.016 (66.258)	Top-5 acc 86.719 (85.440)	lr 0.00263
Train [95][2490/3239]	Time 0.285 (0.508)	Data Time 0.002 (0.016)	Loss 2.3554 (2.3982)	Entropy 0.55426 (0.55649)	Top-1 acc 71.484 (66.261)	Top-5 acc 87.500 (85.444)	lr 0.00263
Train [95][2500/3239]	Time 0.228 (0.508)	Data Time 0.001 (0.016)	Loss 2.2469 (2.3982)	Entropy 0.55438 (0.55648)	Top-1 acc 71.484 (66.260)	Top-5 acc 87.891 (85.442)	lr 0.00263
Train [95][2510/3239]	Time 0.227 (0.508)	Data Time 0.001 (0.016)	Loss 2.2630 (2.3981)	Entropy 0.55448 (0.55648)	Top-1 acc 68.750 (66.262)	Top-5 acc 87.109 (85.443)	lr 0.00263
Train [95][2520/3239]	Time 0.231 (0.507)	Data Time 0.001 (0.016)	Loss 2.3488 (2.3982)	Entropy 0.55472 (0.55647)	Top-1 acc 64.844 (66.259)	Top-5 acc 84.766 (85.442)	lr 0.00263
Train [95][2530/3239]	Time 0.225 (0.507)	Data Time 0.001 (0.016)	Loss 2.2332 (2.3981)	Entropy 0.55478 (0.55646)	Top-1 acc 69.531 (66.261)	Top-5 acc 89.453 (85.447)	lr 0.00263
Train [95][2540/3239]	Time 0.233 (0.507)	Data Time 0.001 (0.016)	Loss 2.2933 (2.3976)	Entropy 0.55462 (0.55646)	Top-1 acc 67.969 (66.275)	Top-5 acc 88.281 (85.457)	lr 0.00263
Train [95][2550/3239]	Time 0.269 (0.506)	Data Time 0.001 (0.016)	Loss 2.4852 (2.3977)	Entropy 0.55471 (0.55645)	Top-1 acc 62.500 (66.272)	Top-5 acc 83.203 (85.454)	lr 0.00263
Train [95][2560/3239]	Time 0.247 (0.506)	Data Time 0.001 (0.016)	Loss 2.3629 (2.3977)	Entropy 0.55485 (0.55644)	Top-1 acc 64.844 (66.271)	Top-5 acc 86.719 (85.456)	lr 0.00263
Train [95][2570/3239]	Time 0.228 (0.506)	Data Time 0.001 (0.016)	Loss 2.4596 (2.3978)	Entropy 0.55485 (0.55644)	Top-1 acc 67.188 (66.269)	Top-5 acc 82.812 (85.451)	lr 0.00262
Train [95][2580/3239]	Time 0.235 (0.505)	Data Time 0.001 (0.016)	Loss 2.3233 (2.3980)	Entropy 0.55491 (0.55643)	Top-1 acc 67.578 (66.268)	Top-5 acc 87.500 (85.450)	lr 0.00262
Train [95][2590/3239]	Time 0.232 (0.505)	Data Time 0.001 (0.016)	Loss 2.3141 (2.3977)	Entropy 0.55530 (0.55642)	Top-1 acc 67.188 (66.273)	Top-5 acc 87.109 (85.458)	lr 0.00262
Train [95][2600/3239]	Time 0.220 (0.504)	Data Time 0.001 (0.016)	Loss 2.3768 (2.3978)	Entropy 0.55531 (0.55642)	Top-1 acc 66.797 (66.271)	Top-5 acc 88.281 (85.457)	lr 0.00262
Train [95][2610/3239]	Time 0.268 (0.525)	Data Time 0.002 (0.015)	Loss 2.4339 (2.3978)	Entropy 0.55505 (0.55642)	Top-1 acc 64.062 (66.270)	Top-5 acc 87.109 (85.459)	lr 0.00262
Train [95][2620/3239]	Time 0.237 (0.524)	Data Time 0.002 (0.015)	Loss 2.3828 (2.3978)	Entropy 0.55518 (0.55641)	Top-1 acc 63.672 (66.267)	Top-5 acc 86.328 (85.459)	lr 0.00262
Train [95][2630/3239]	Time 0.463 (0.524)	Data Time 0.002 (0.015)	Loss 2.2169 (2.3977)	Entropy 0.55548 (0.55641)	Top-1 acc 70.312 (66.271)	Top-5 acc 88.281 (85.462)	lr 0.00262
Train [95][2640/3239]	Time 0.307 (0.524)	Data Time 0.002 (0.015)	Loss 2.3029 (2.3980)	Entropy 0.55551 (0.55640)	Top-1 acc 70.703 (66.268)	Top-5 acc 87.500 (85.456)	lr 0.00262
Train [95][2650/3239]	Time 0.225 (0.524)	Data Time 0.001 (0.015)	Loss 2.3659 (2.3978)	Entropy 0.55551 (0.55640)	Top-1 acc 64.844 (66.270)	Top-5 acc 85.156 (85.459)	lr 0.00262
Train [95][2660/3239]	Time 0.237 (0.524)	Data Time 0.001 (0.015)	Loss 2.5146 (2.3976)	Entropy 0.55516 (0.55640)	Top-1 acc 63.672 (66.276)	Top-5 acc 83.984 (85.461)	lr 0.00262
Train [95][2670/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.015)	Loss 2.3169 (2.3977)	Entropy 0.55543 (0.55639)	Top-1 acc 67.969 (66.273)	Top-5 acc 88.281 (85.459)	lr 0.00262
Train [95][2680/3239]	Time 0.237 (0.523)	Data Time 0.001 (0.015)	Loss 2.4184 (2.3977)	Entropy 0.55537 (0.55639)	Top-1 acc 66.016 (66.278)	Top-5 acc 84.766 (85.461)	lr 0.00262
Train [95][2690/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.015)	Loss 2.1169 (2.3975)	Entropy 0.55529 (0.55638)	Top-1 acc 73.438 (66.281)	Top-5 acc 90.625 (85.465)	lr 0.00262
Train [95][2700/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.015)	Loss 2.3333 (2.3975)	Entropy 0.55507 (0.55638)	Top-1 acc 67.188 (66.284)	Top-5 acc 87.891 (85.466)	lr 0.00262
Train [95][2710/3239]	Time 0.218 (0.522)	Data Time 0.001 (0.015)	Loss 2.3279 (2.3975)	Entropy 0.55508 (0.55637)	Top-1 acc 66.406 (66.284)	Top-5 acc 87.109 (85.467)	lr 0.00262
Train [95][2720/3239]	Time 0.259 (0.522)	Data Time 0.001 (0.015)	Loss 2.4862 (2.3973)	Entropy 0.55503 (0.55637)	Top-1 acc 62.891 (66.289)	Top-5 acc 83.984 (85.469)	lr 0.00262
Train [95][2730/3239]	Time 0.220 (0.521)	Data Time 0.001 (0.015)	Loss 2.3795 (2.3973)	Entropy 0.55472 (0.55636)	Top-1 acc 67.578 (66.291)	Top-5 acc 85.938 (85.469)	lr 0.00261
Train [95][2740/3239]	Time 0.238 (0.521)	Data Time 0.001 (0.015)	Loss 2.4186 (2.3975)	Entropy 0.55463 (0.55636)	Top-1 acc 67.188 (66.290)	Top-5 acc 83.203 (85.463)	lr 0.00261
Train [95][2750/3239]	Time 0.242 (0.521)	Data Time 0.001 (0.015)	Loss 2.2550 (2.3974)	Entropy 0.55489 (0.55635)	Top-1 acc 67.969 (66.288)	Top-5 acc 89.062 (85.468)	lr 0.00261
Train [95][2760/3239]	Time 0.226 (0.520)	Data Time 0.001 (0.015)	Loss 2.1706 (2.3974)	Entropy 0.55454 (0.55635)	Top-1 acc 73.438 (66.287)	Top-5 acc 91.406 (85.468)	lr 0.00261
Train [95][2770/3239]	Time 0.223 (0.520)	Data Time 0.001 (0.015)	Loss 2.7246 (2.3974)	Entropy 0.55450 (0.55634)	Top-1 acc 63.281 (66.291)	Top-5 acc 78.906 (85.469)	lr 0.00261
Train [95][2780/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.015)	Loss 2.4410 (2.3977)	Entropy 0.55466 (0.55633)	Top-1 acc 64.453 (66.285)	Top-5 acc 84.375 (85.465)	lr 0.00261
Train [95][2790/3239]	Time 0.320 (0.519)	Data Time 0.001 (0.015)	Loss 2.3453 (2.3976)	Entropy 0.55460 (0.55633)	Top-1 acc 68.359 (66.283)	Top-5 acc 85.938 (85.465)	lr 0.00261
Train [95][2800/3239]	Time 0.237 (0.519)	Data Time 0.001 (0.015)	Loss 2.2658 (2.3979)	Entropy 0.55427 (0.55632)	Top-1 acc 68.750 (66.276)	Top-5 acc 85.938 (85.460)	lr 0.00261
Train [95][2810/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.014)	Loss 2.5171 (2.3979)	Entropy 0.55427 (0.55632)	Top-1 acc 64.844 (66.276)	Top-5 acc 84.375 (85.458)	lr 0.00261
Train [95][2820/3239]	Time 0.237 (0.518)	Data Time 0.002 (0.014)	Loss 2.3225 (2.3979)	Entropy 0.55423 (0.55631)	Top-1 acc 67.578 (66.277)	Top-5 acc 87.109 (85.460)	lr 0.00261
Train [95][2830/3239]	Time 0.230 (0.518)	Data Time 0.001 (0.014)	Loss 2.1455 (2.3977)	Entropy 0.55400 (0.55630)	Top-1 acc 71.094 (66.278)	Top-5 acc 89.453 (85.463)	lr 0.00261
Train [95][2840/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.014)	Loss 2.3792 (2.3977)	Entropy 0.55413 (0.55629)	Top-1 acc 67.969 (66.276)	Top-5 acc 83.984 (85.462)	lr 0.00261
Train [95][2850/3239]	Time 0.230 (0.517)	Data Time 0.001 (0.014)	Loss 2.4815 (2.3980)	Entropy 0.55403 (0.55628)	Top-1 acc 63.281 (66.272)	Top-5 acc 83.594 (85.456)	lr 0.00261
Train [95][2860/3239]	Time 0.329 (0.517)	Data Time 0.001 (0.014)	Loss 2.5760 (2.3981)	Entropy 0.55432 (0.55628)	Top-1 acc 63.281 (66.271)	Top-5 acc 82.812 (85.454)	lr 0.00261
Train [95][2870/3239]	Time 0.225 (0.516)	Data Time 0.001 (0.014)	Loss 2.3397 (2.3977)	Entropy 0.55435 (0.55627)	Top-1 acc 67.969 (66.279)	Top-5 acc 85.156 (85.460)	lr 0.00261
Train [95][2880/3239]	Time 0.240 (0.516)	Data Time 0.001 (0.014)	Loss 2.4668 (2.3976)	Entropy 0.55434 (0.55626)	Top-1 acc 61.719 (66.278)	Top-5 acc 86.719 (85.460)	lr 0.00261
Train [95][2890/3239]	Time 0.226 (0.516)	Data Time 0.001 (0.014)	Loss 2.4268 (2.3975)	Entropy 0.55443 (0.55626)	Top-1 acc 62.891 (66.276)	Top-5 acc 83.594 (85.463)	lr 0.00260
Train [95][2900/3239]	Time 0.224 (0.515)	Data Time 0.001 (0.014)	Loss 2.5477 (2.3975)	Entropy 0.55430 (0.55625)	Top-1 acc 59.375 (66.272)	Top-5 acc 86.328 (85.464)	lr 0.00260
Train [95][2910/3239]	Time 0.271 (0.515)	Data Time 0.001 (0.014)	Loss 2.2136 (2.3973)	Entropy 0.55412 (0.55624)	Top-1 acc 72.266 (66.278)	Top-5 acc 89.062 (85.469)	lr 0.00260
Train [95][2920/3239]	Time 0.225 (0.515)	Data Time 0.001 (0.014)	Loss 2.4649 (2.3975)	Entropy 0.55464 (0.55624)	Top-1 acc 61.719 (66.271)	Top-5 acc 85.547 (85.466)	lr 0.00260
Train [95][2930/3239]	Time 0.230 (0.514)	Data Time 0.001 (0.014)	Loss 2.3110 (2.3974)	Entropy 0.55460 (0.55623)	Top-1 acc 68.359 (66.272)	Top-5 acc 88.672 (85.467)	lr 0.00260
Train [95][2940/3239]	Time 0.219 (0.514)	Data Time 0.001 (0.014)	Loss 2.6988 (2.3976)	Entropy 0.55411 (0.55623)	Top-1 acc 58.203 (66.269)	Top-5 acc 80.859 (85.465)	lr 0.00260
Train [95][2950/3239]	Time 0.465 (0.514)	Data Time 0.003 (0.014)	Loss 2.2651 (2.3976)	Entropy 0.55434 (0.55622)	Top-1 acc 69.141 (66.266)	Top-5 acc 89.062 (85.464)	lr 0.00260
Train [95][2960/3239]	Time 0.220 (0.514)	Data Time 0.001 (0.014)	Loss 2.2136 (2.3976)	Entropy 0.55438 (0.55621)	Top-1 acc 71.094 (66.261)	Top-5 acc 89.453 (85.463)	lr 0.00260
Train [95][2970/3239]	Time 0.223 (0.513)	Data Time 0.001 (0.014)	Loss 2.3065 (2.3976)	Entropy 0.55432 (0.55621)	Top-1 acc 66.797 (66.259)	Top-5 acc 85.938 (85.462)	lr 0.00260
Train [95][2980/3239]	Time 0.220 (0.513)	Data Time 0.001 (0.014)	Loss 2.3907 (2.3976)	Entropy 0.55406 (0.55620)	Top-1 acc 65.625 (66.259)	Top-5 acc 85.938 (85.461)	lr 0.00260
Train [95][2990/3239]	Time 0.230 (0.513)	Data Time 0.002 (0.014)	Loss 2.3642 (2.3977)	Entropy 0.55417 (0.55619)	Top-1 acc 67.188 (66.256)	Top-5 acc 85.547 (85.459)	lr 0.00260
Train [95][3000/3239]	Time 0.234 (0.512)	Data Time 0.002 (0.014)	Loss 2.2973 (2.3976)	Entropy 0.55381 (0.55619)	Top-1 acc 66.406 (66.258)	Top-5 acc 86.328 (85.461)	lr 0.00260
Train [95][3010/3239]	Time 0.225 (0.512)	Data Time 0.001 (0.014)	Loss 2.4098 (2.3978)	Entropy 0.55381 (0.55618)	Top-1 acc 64.844 (66.252)	Top-5 acc 85.938 (85.461)	lr 0.00260
Train [95][3020/3239]	Time 0.340 (0.512)	Data Time 0.001 (0.014)	Loss 2.3684 (2.3977)	Entropy 0.55401 (0.55617)	Top-1 acc 66.797 (66.251)	Top-5 acc 84.766 (85.459)	lr 0.00260
Train [95][3030/3239]	Time 0.236 (0.511)	Data Time 0.001 (0.014)	Loss 2.4329 (2.3979)	Entropy 0.55393 (0.55616)	Top-1 acc 66.406 (66.250)	Top-5 acc 85.547 (85.457)	lr 0.00260
Train [95][3040/3239]	Time 0.228 (0.511)	Data Time 0.001 (0.014)	Loss 2.2524 (2.3976)	Entropy 0.55419 (0.55616)	Top-1 acc 71.094 (66.259)	Top-5 acc 88.672 (85.461)	lr 0.00260
Train [95][3050/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.013)	Loss 2.2753 (2.3979)	Entropy 0.55401 (0.55615)	Top-1 acc 69.922 (66.252)	Top-5 acc 87.891 (85.458)	lr 0.00259
Train [95][3060/3239]	Time 0.217 (0.511)	Data Time 0.001 (0.013)	Loss 2.4675 (2.3979)	Entropy 0.55426 (0.55614)	Top-1 acc 65.625 (66.252)	Top-5 acc 86.328 (85.457)	lr 0.00259
Train [95][3070/3239]	Time 0.227 (0.510)	Data Time 0.001 (0.013)	Loss 2.0949 (2.3978)	Entropy 0.55424 (0.55614)	Top-1 acc 71.484 (66.255)	Top-5 acc 91.797 (85.460)	lr 0.00259
Train [95][3080/3239]	Time 0.228 (0.510)	Data Time 0.001 (0.013)	Loss 2.3641 (2.3976)	Entropy 0.55404 (0.55613)	Top-1 acc 65.625 (66.262)	Top-5 acc 84.766 (85.461)	lr 0.00259
Train [95][3090/3239]	Time 0.254 (0.510)	Data Time 0.001 (0.013)	Loss 2.8027 (2.3979)	Entropy 0.55390 (0.55612)	Top-1 acc 54.297 (66.254)	Top-5 acc 78.125 (85.457)	lr 0.00259
Train [95][3100/3239]	Time 0.233 (0.509)	Data Time 0.001 (0.013)	Loss 2.4507 (2.3980)	Entropy 0.55346 (0.55612)	Top-1 acc 67.578 (66.254)	Top-5 acc 84.766 (85.455)	lr 0.00259
Train [95][3110/3239]	Time 0.325 (0.509)	Data Time 0.001 (0.013)	Loss 2.3174 (2.3980)	Entropy 0.55371 (0.55611)	Top-1 acc 67.969 (66.254)	Top-5 acc 87.109 (85.454)	lr 0.00259
Train [95][3120/3239]	Time 0.223 (0.509)	Data Time 0.001 (0.013)	Loss 2.3997 (2.3982)	Entropy 0.55396 (0.55610)	Top-1 acc 64.062 (66.250)	Top-5 acc 86.328 (85.451)	lr 0.00259
Train [95][3130/3239]	Time 0.233 (0.508)	Data Time 0.001 (0.013)	Loss 2.5291 (2.3981)	Entropy 0.55398 (0.55609)	Top-1 acc 64.844 (66.251)	Top-5 acc 81.641 (85.452)	lr 0.00259
Train [95][3140/3239]	Time 0.243 (0.508)	Data Time 0.001 (0.013)	Loss 2.4046 (2.3981)	Entropy 0.55411 (0.55609)	Top-1 acc 64.453 (66.251)	Top-5 acc 85.156 (85.455)	lr 0.00259
Train [95][3150/3239]	Time 0.234 (0.508)	Data Time 0.001 (0.013)	Loss 2.4282 (2.3981)	Entropy 0.55426 (0.55608)	Top-1 acc 64.844 (66.251)	Top-5 acc 85.938 (85.454)	lr 0.00259
Train [95][3160/3239]	Time 0.226 (0.507)	Data Time 0.001 (0.013)	Loss 2.4945 (2.3981)	Entropy 0.55441 (0.55607)	Top-1 acc 64.062 (66.251)	Top-5 acc 83.594 (85.452)	lr 0.00259
Train [95][3170/3239]	Time 0.233 (0.507)	Data Time 0.001 (0.013)	Loss 2.6796 (2.3983)	Entropy 0.55462 (0.55607)	Top-1 acc 57.031 (66.247)	Top-5 acc 83.984 (85.449)	lr 0.00259
Train [95][3180/3239]	Time 0.318 (0.507)	Data Time 0.000 (0.013)	Loss 2.6079 (2.3983)	Entropy 0.55412 (0.55606)	Top-1 acc 61.719 (66.246)	Top-5 acc 82.031 (85.450)	lr 0.00259
Train [95][3190/3239]	Time 0.219 (0.506)	Data Time 0.000 (0.013)	Loss 2.3172 (2.3984)	Entropy 0.55378 (0.55606)	Top-1 acc 67.578 (66.245)	Top-5 acc 87.109 (85.448)	lr 0.00259
Train [95][3200/3239]	Time 0.237 (0.506)	Data Time 0.000 (0.013)	Loss 2.5992 (2.3985)	Entropy 0.55377 (0.55605)	Top-1 acc 59.375 (66.241)	Top-5 acc 83.984 (85.445)	lr 0.00259
Train [95][3210/3239]	Time 0.226 (0.505)	Data Time 0.000 (0.013)	Loss 2.3025 (2.3985)	Entropy 0.55388 (0.55604)	Top-1 acc 67.188 (66.238)	Top-5 acc 88.281 (85.446)	lr 0.00258
Train [95][3220/3239]	Time 0.230 (0.505)	Data Time 0.000 (0.013)	Loss 2.1311 (2.3984)	Entropy 0.55391 (0.55604)	Top-1 acc 75.000 (66.246)	Top-5 acc 90.234 (85.448)	lr 0.00258
Train [95][3230/3239]	Time 0.224 (0.505)	Data Time 0.000 (0.013)	Loss 2.4156 (2.3984)	Entropy 0.55422 (0.55603)	Top-1 acc 64.062 (66.245)	Top-5 acc 83.594 (85.448)	lr 0.00258
Train [95][3239/3239]	Time 0.896 (0.504)	Data Time 0.000 (0.013)	Loss 2.7440 (2.3985)	Entropy 0.55441 (0.55603)	Top-1 acc 59.259 (66.243)	Top-5 acc 76.543 (85.447)	lr 0.00258
==========Valid [95/120]	loss 1.214	top-1 acc 71.970 (71.970)	top-5 acc 90.122	Train top-1 66.243	top-5 85.447	Entropy 0.55441	Latency-None: 0.000ms	Flops: 539.00M
Train [96][0/3239]	Time 37.521 (37.521)	Data Time 36.635 (36.635)	Loss 2.3129 (2.3129)	Entropy 0.55451 (0.55451)	Top-1 acc 67.969 (67.969)	Top-5 acc 87.500 (87.500)	lr 0.00258
Train [96][10/3239]	Time 0.324 (3.927)	Data Time 0.001 (3.385)	Loss 2.7146 (2.3237)	Entropy 0.55470 (0.55455)	Top-1 acc 58.203 (67.685)	Top-5 acc 80.859 (86.399)	lr 0.00258
Train [96][20/3239]	Time 0.300 (4.836)	Data Time 0.004 (1.774)	Loss 2.4250 (2.3397)	Entropy 0.55483 (0.55465)	Top-1 acc 66.797 (67.336)	Top-5 acc 86.328 (86.235)	lr 0.00258
Train [96][30/3239]	Time 0.228 (3.420)	Data Time 0.002 (1.202)	Loss 2.4284 (2.3702)	Entropy 0.55510 (0.55475)	Top-1 acc 64.062 (66.646)	Top-5 acc 86.328 (85.824)	lr 0.00258
Train [96][40/3239]	Time 0.220 (2.690)	Data Time 0.001 (0.910)	Loss 2.2869 (2.3619)	Entropy 0.55508 (0.55483)	Top-1 acc 69.531 (66.740)	Top-5 acc 87.109 (85.918)	lr 0.00258
Train [96][50/3239]	Time 0.223 (2.242)	Data Time 0.001 (0.732)	Loss 2.1339 (2.3634)	Entropy 0.55512 (0.55489)	Top-1 acc 74.219 (66.628)	Top-5 acc 91.016 (85.983)	lr 0.00258
Train [96][60/3239]	Time 0.227 (1.942)	Data Time 0.001 (0.613)	Loss 2.4140 (2.3793)	Entropy 0.55484 (0.55492)	Top-1 acc 64.062 (66.099)	Top-5 acc 86.328 (85.739)	lr 0.00258
Train [96][70/3239]	Time 0.228 (1.727)	Data Time 0.001 (0.526)	Loss 2.4079 (2.3785)	Entropy 0.55444 (0.55489)	Top-1 acc 63.281 (66.346)	Top-5 acc 86.719 (85.706)	lr 0.00258
Train [96][80/3239]	Time 0.312 (1.565)	Data Time 0.001 (0.462)	Loss 2.3676 (2.3814)	Entropy 0.55483 (0.55485)	Top-1 acc 69.141 (66.353)	Top-5 acc 83.203 (85.552)	lr 0.00258
Train [96][90/3239]	Time 0.230 (1.438)	Data Time 0.001 (0.411)	Loss 2.2728 (2.3803)	Entropy 0.55491 (0.55485)	Top-1 acc 70.703 (66.531)	Top-5 acc 87.891 (85.543)	lr 0.00258
Train [96][100/3239]	Time 0.226 (1.336)	Data Time 0.001 (0.371)	Loss 2.3322 (2.3769)	Entropy 0.55520 (0.55487)	Top-1 acc 71.875 (66.681)	Top-5 acc 85.156 (85.632)	lr 0.00258
Train [96][110/3239]	Time 0.229 (1.254)	Data Time 0.001 (0.337)	Loss 2.3872 (2.3803)	Entropy 0.55501 (0.55490)	Top-1 acc 67.578 (66.526)	Top-5 acc 85.156 (85.564)	lr 0.00258
Train [96][120/3239]	Time 0.225 (1.183)	Data Time 0.001 (0.310)	Loss 2.5230 (2.3834)	Entropy 0.55524 (0.55491)	Top-1 acc 60.938 (66.442)	Top-5 acc 82.812 (85.589)	lr 0.00258
Train [96][130/3239]	Time 0.235 (1.125)	Data Time 0.001 (0.286)	Loss 2.2998 (2.3848)	Entropy 0.55533 (0.55494)	Top-1 acc 67.969 (66.505)	Top-5 acc 88.281 (85.580)	lr 0.00258
Train [96][140/3239]	Time 0.225 (1.073)	Data Time 0.001 (0.266)	Loss 2.5688 (2.3891)	Entropy 0.55527 (0.55496)	Top-1 acc 60.156 (66.426)	Top-5 acc 83.203 (85.478)	lr 0.00257
Train [96][150/3239]	Time 0.215 (1.030)	Data Time 0.001 (0.248)	Loss 2.5884 (2.3882)	Entropy 0.55547 (0.55498)	Top-1 acc 62.109 (66.497)	Top-5 acc 81.641 (85.462)	lr 0.00257
Train [96][160/3239]	Time 0.226 (0.991)	Data Time 0.001 (0.233)	Loss 2.4287 (2.3841)	Entropy 0.55540 (0.55501)	Top-1 acc 64.844 (66.615)	Top-5 acc 85.156 (85.578)	lr 0.00257
Train [96][170/3239]	Time 0.317 (0.957)	Data Time 0.001 (0.220)	Loss 2.3926 (2.3820)	Entropy 0.55526 (0.55503)	Top-1 acc 69.922 (66.690)	Top-5 acc 86.328 (85.622)	lr 0.00257
Train [96][180/3239]	Time 0.221 (0.927)	Data Time 0.001 (0.208)	Loss 2.4500 (2.3828)	Entropy 0.55533 (0.55504)	Top-1 acc 59.766 (66.676)	Top-5 acc 86.328 (85.659)	lr 0.00257
Train [96][190/3239]	Time 0.252 (0.899)	Data Time 0.001 (0.197)	Loss 2.2474 (2.3849)	Entropy 0.55548 (0.55506)	Top-1 acc 70.312 (66.615)	Top-5 acc 88.672 (85.623)	lr 0.00257
Train [96][200/3239]	Time 0.227 (0.875)	Data Time 0.001 (0.187)	Loss 2.2910 (2.3834)	Entropy 0.55524 (0.55508)	Top-1 acc 68.359 (66.608)	Top-5 acc 87.109 (85.654)	lr 0.00257
Train [96][210/3239]	Time 0.257 (0.854)	Data Time 0.001 (0.178)	Loss 2.2954 (2.3816)	Entropy 0.55513 (0.55508)	Top-1 acc 69.531 (66.665)	Top-5 acc 87.891 (85.675)	lr 0.00257
Train [96][220/3239]	Time 0.226 (0.834)	Data Time 0.001 (0.170)	Loss 2.4353 (2.3812)	Entropy 0.55495 (0.55508)	Top-1 acc 66.406 (66.691)	Top-5 acc 86.719 (85.702)	lr 0.00257
Train [96][230/3239]	Time 0.226 (0.815)	Data Time 0.001 (0.163)	Loss 2.2174 (2.3834)	Entropy 0.55499 (0.55508)	Top-1 acc 67.578 (66.662)	Top-5 acc 89.453 (85.657)	lr 0.00257
Train [96][240/3239]	Time 0.323 (0.799)	Data Time 0.001 (0.156)	Loss 2.2030 (2.3821)	Entropy 0.55465 (0.55507)	Top-1 acc 73.047 (66.692)	Top-5 acc 85.938 (85.678)	lr 0.00257
Train [96][250/3239]	Time 0.289 (0.788)	Data Time 0.002 (0.150)	Loss 2.3875 (2.3829)	Entropy 0.55447 (0.55505)	Top-1 acc 63.672 (66.683)	Top-5 acc 85.156 (85.656)	lr 0.00257
Train [96][260/3239]	Time 0.230 (0.774)	Data Time 0.001 (0.144)	Loss 2.4656 (2.3822)	Entropy 0.55444 (0.55502)	Top-1 acc 63.281 (66.716)	Top-5 acc 85.547 (85.691)	lr 0.00257
Train [96][270/3239]	Time 0.229 (0.762)	Data Time 0.001 (0.139)	Loss 2.2584 (2.3825)	Entropy 0.55458 (0.55500)	Top-1 acc 71.875 (66.728)	Top-5 acc 85.547 (85.671)	lr 0.00257
Train [96][280/3239]	Time 0.233 (0.749)	Data Time 0.001 (0.134)	Loss 2.4009 (2.3819)	Entropy 0.55479 (0.55499)	Top-1 acc 65.234 (66.750)	Top-5 acc 85.156 (85.662)	lr 0.00257
Train [96][290/3239]	Time 0.229 (0.738)	Data Time 0.001 (0.130)	Loss 2.2970 (2.3830)	Entropy 0.55491 (0.55499)	Top-1 acc 70.312 (66.734)	Top-5 acc 87.891 (85.642)	lr 0.00257
Train [96][300/3239]	Time 0.224 (0.727)	Data Time 0.001 (0.125)	Loss 2.3364 (2.3831)	Entropy 0.55515 (0.55499)	Top-1 acc 69.141 (66.702)	Top-5 acc 88.281 (85.657)	lr 0.00256
Train [96][310/3239]	Time 0.231 (0.717)	Data Time 0.001 (0.121)	Loss 2.4249 (2.3831)	Entropy 0.55527 (0.55499)	Top-1 acc 64.062 (66.711)	Top-5 acc 85.938 (85.672)	lr 0.00256
Train [96][320/3239]	Time 0.226 (0.707)	Data Time 0.001 (0.118)	Loss 2.2717 (2.3815)	Entropy 0.55551 (0.55501)	Top-1 acc 69.922 (66.759)	Top-5 acc 87.891 (85.704)	lr 0.00256
Train [96][330/3239]	Time 0.323 (0.698)	Data Time 0.001 (0.114)	Loss 2.2848 (2.3810)	Entropy 0.55562 (0.55502)	Top-1 acc 69.922 (66.759)	Top-5 acc 87.500 (85.735)	lr 0.00256
Train [96][340/3239]	Time 0.224 (0.690)	Data Time 0.001 (0.111)	Loss 2.3746 (2.3814)	Entropy 0.55566 (0.55504)	Top-1 acc 67.188 (66.761)	Top-5 acc 86.328 (85.735)	lr 0.00256
Train [96][350/3239]	Time 0.230 (0.682)	Data Time 0.001 (0.108)	Loss 2.3829 (2.3825)	Entropy 0.55571 (0.55506)	Top-1 acc 60.156 (66.738)	Top-5 acc 86.328 (85.727)	lr 0.00256
Train [96][360/3239]	Time 0.230 (0.675)	Data Time 0.001 (0.105)	Loss 2.3819 (2.3818)	Entropy 0.55556 (0.55507)	Top-1 acc 66.016 (66.773)	Top-5 acc 86.328 (85.738)	lr 0.00256
Train [96][370/3239]	Time 0.241 (0.667)	Data Time 0.001 (0.102)	Loss 2.2913 (2.3825)	Entropy 0.55551 (0.55508)	Top-1 acc 66.406 (66.744)	Top-5 acc 87.109 (85.743)	lr 0.00256
Train [96][380/3239]	Time 0.284 (0.663)	Data Time 0.002 (0.099)	Loss 2.3915 (2.3843)	Entropy 0.55579 (0.55510)	Top-1 acc 66.016 (66.698)	Top-5 acc 85.547 (85.707)	lr 0.00256
Train [96][390/3239]	Time 0.272 (0.661)	Data Time 0.002 (0.097)	Loss 2.4173 (2.3845)	Entropy 0.55572 (0.55512)	Top-1 acc 64.062 (66.690)	Top-5 acc 87.500 (85.701)	lr 0.00256
Train [96][400/3239]	Time 0.308 (0.657)	Data Time 0.001 (0.095)	Loss 2.4044 (2.3847)	Entropy 0.55573 (0.55513)	Top-1 acc 66.797 (66.676)	Top-5 acc 88.281 (85.700)	lr 0.00256
Train [96][410/3239]	Time 0.228 (0.651)	Data Time 0.001 (0.092)	Loss 2.3807 (2.3853)	Entropy 0.55599 (0.55515)	Top-1 acc 67.969 (66.644)	Top-5 acc 86.328 (85.694)	lr 0.00256
Train [96][420/3239]	Time 0.228 (0.645)	Data Time 0.001 (0.090)	Loss 2.4345 (2.3866)	Entropy 0.55586 (0.55517)	Top-1 acc 63.281 (66.619)	Top-5 acc 87.500 (85.673)	lr 0.00256
Train [96][430/3239]	Time 0.233 (0.640)	Data Time 0.001 (0.088)	Loss 2.1845 (2.3874)	Entropy 0.55561 (0.55518)	Top-1 acc 72.266 (66.603)	Top-5 acc 88.672 (85.665)	lr 0.00256
Train [96][440/3239]	Time 0.234 (0.635)	Data Time 0.002 (0.086)	Loss 2.2561 (2.3877)	Entropy 0.55554 (0.55519)	Top-1 acc 71.094 (66.597)	Top-5 acc 88.281 (85.666)	lr 0.00256
Train [96][450/3239]	Time 0.226 (0.630)	Data Time 0.001 (0.084)	Loss 2.4251 (2.3889)	Entropy 0.55582 (0.55520)	Top-1 acc 65.625 (66.577)	Top-5 acc 85.547 (85.654)	lr 0.00256
Train [96][460/3239]	Time 0.212 (0.625)	Data Time 0.001 (0.082)	Loss 2.6590 (2.3910)	Entropy 0.55594 (0.55521)	Top-1 acc 57.812 (66.537)	Top-5 acc 82.422 (85.615)	lr 0.00255
Train [96][470/3239]	Time 0.237 (0.621)	Data Time 0.001 (0.081)	Loss 2.4901 (2.3900)	Entropy 0.55605 (0.55523)	Top-1 acc 63.672 (66.571)	Top-5 acc 86.719 (85.638)	lr 0.00255
Train [96][480/3239]	Time 0.231 (0.616)	Data Time 0.001 (0.079)	Loss 2.2814 (2.3899)	Entropy 0.55615 (0.55525)	Top-1 acc 66.016 (66.571)	Top-5 acc 89.062 (85.641)	lr 0.00255
Train [96][490/3239]	Time 0.232 (0.612)	Data Time 0.001 (0.077)	Loss 2.2619 (2.3912)	Entropy 0.55627 (0.55527)	Top-1 acc 68.750 (66.510)	Top-5 acc 89.453 (85.623)	lr 0.00255
Train [96][500/3239]	Time 0.225 (0.608)	Data Time 0.001 (0.076)	Loss 2.4710 (2.3932)	Entropy 0.55636 (0.55529)	Top-1 acc 64.844 (66.462)	Top-5 acc 84.375 (85.594)	lr 0.00255
Train [96][510/3239]	Time 0.223 (0.603)	Data Time 0.001 (0.074)	Loss 2.4111 (2.3938)	Entropy 0.55661 (0.55531)	Top-1 acc 67.188 (66.444)	Top-5 acc 85.547 (85.586)	lr 0.00255
Train [96][520/3239]	Time 0.223 (0.600)	Data Time 0.001 (0.073)	Loss 2.4552 (2.3951)	Entropy 0.55692 (0.55534)	Top-1 acc 67.578 (66.418)	Top-5 acc 83.984 (85.556)	lr 0.00255
Train [96][530/3239]	Time 0.228 (0.596)	Data Time 0.001 (0.072)	Loss 2.2093 (2.3943)	Entropy 0.55683 (0.55537)	Top-1 acc 71.875 (66.430)	Top-5 acc 89.453 (85.565)	lr 0.00255
Train [96][540/3239]	Time 0.228 (0.593)	Data Time 0.001 (0.070)	Loss 2.5568 (2.3952)	Entropy 0.55673 (0.55540)	Top-1 acc 60.547 (66.401)	Top-5 acc 82.031 (85.543)	lr 0.00255
Train [96][550/3239]	Time 0.225 (0.589)	Data Time 0.001 (0.069)	Loss 2.4066 (2.3946)	Entropy 0.55695 (0.55542)	Top-1 acc 65.625 (66.423)	Top-5 acc 85.156 (85.550)	lr 0.00255
Train [96][560/3239]	Time 0.317 (0.586)	Data Time 0.001 (0.068)	Loss 2.4052 (2.3956)	Entropy 0.55719 (0.55545)	Top-1 acc 67.969 (66.399)	Top-5 acc 83.984 (85.520)	lr 0.00255
Train [96][570/3239]	Time 0.229 (0.583)	Data Time 0.001 (0.067)	Loss 2.2277 (2.3952)	Entropy 0.55727 (0.55548)	Top-1 acc 67.969 (66.412)	Top-5 acc 90.625 (85.538)	lr 0.00255
Train [96][580/3239]	Time 0.232 (0.580)	Data Time 0.001 (0.066)	Loss 2.4357 (2.3961)	Entropy 0.55724 (0.55551)	Top-1 acc 63.281 (66.377)	Top-5 acc 86.328 (85.527)	lr 0.00255
Train [96][590/3239]	Time 0.257 (0.577)	Data Time 0.002 (0.065)	Loss 2.3467 (2.3950)	Entropy 0.55698 (0.55554)	Top-1 acc 68.359 (66.402)	Top-5 acc 82.812 (85.540)	lr 0.00255
Train [96][600/3239]	Time 0.241 (0.574)	Data Time 0.001 (0.064)	Loss 2.3731 (2.3948)	Entropy 0.55658 (0.55556)	Top-1 acc 62.500 (66.388)	Top-5 acc 86.328 (85.548)	lr 0.00255
Train [96][610/3239]	Time 0.226 (0.571)	Data Time 0.001 (0.063)	Loss 2.3616 (2.3954)	Entropy 0.55664 (0.55558)	Top-1 acc 66.016 (66.375)	Top-5 acc 85.547 (85.527)	lr 0.00255
Train [96][620/3239]	Time 0.235 (0.569)	Data Time 0.001 (0.062)	Loss 2.4728 (2.3950)	Entropy 0.55667 (0.55560)	Top-1 acc 62.500 (66.382)	Top-5 acc 83.203 (85.532)	lr 0.00255
Train [96][630/3239]	Time 0.320 (0.566)	Data Time 0.001 (0.061)	Loss 2.4882 (2.3969)	Entropy 0.55685 (0.55561)	Top-1 acc 66.406 (66.339)	Top-5 acc 81.641 (85.490)	lr 0.00254
Train [96][640/3239]	Time 0.237 (0.564)	Data Time 0.001 (0.060)	Loss 2.2433 (2.3963)	Entropy 0.55699 (0.55564)	Top-1 acc 69.922 (66.360)	Top-5 acc 88.281 (85.493)	lr 0.00254
Train [96][650/3239]	Time 0.223 (0.561)	Data Time 0.002 (0.059)	Loss 2.2325 (2.3956)	Entropy 0.55707 (0.55566)	Top-1 acc 70.312 (66.375)	Top-5 acc 86.719 (85.510)	lr 0.00254
Train [96][660/3239]	Time 0.237 (0.559)	Data Time 0.001 (0.058)	Loss 2.3568 (2.3950)	Entropy 0.55684 (0.55568)	Top-1 acc 70.312 (66.389)	Top-5 acc 87.109 (85.525)	lr 0.00254
Train [96][670/3239]	Time 0.283 (0.559)	Data Time 0.001 (0.057)	Loss 2.4625 (2.3948)	Entropy 0.55657 (0.55569)	Top-1 acc 65.625 (66.396)	Top-5 acc 82.812 (85.524)	lr 0.00254
Train [96][680/3239]	Time 0.320 (0.636)	Data Time 0.002 (0.056)	Loss 2.2379 (2.3951)	Entropy 0.55651 (0.55571)	Top-1 acc 71.094 (66.395)	Top-5 acc 87.891 (85.523)	lr 0.00254
Train [96][690/3239]	Time 0.243 (0.633)	Data Time 0.002 (0.056)	Loss 2.6688 (2.3949)	Entropy 0.55662 (0.55572)	Top-1 acc 57.812 (66.412)	Top-5 acc 81.641 (85.529)	lr 0.00254
Train [96][700/3239]	Time 0.237 (0.630)	Data Time 0.001 (0.055)	Loss 2.1984 (2.3951)	Entropy 0.55650 (0.55573)	Top-1 acc 71.875 (66.406)	Top-5 acc 90.625 (85.536)	lr 0.00254
Train [96][710/3239]	Time 0.232 (0.627)	Data Time 0.001 (0.054)	Loss 2.6221 (2.3952)	Entropy 0.55663 (0.55574)	Top-1 acc 64.062 (66.411)	Top-5 acc 79.297 (85.527)	lr 0.00254
Train [96][720/3239]	Time 0.326 (0.624)	Data Time 0.001 (0.053)	Loss 2.5193 (2.3965)	Entropy 0.55670 (0.55575)	Top-1 acc 65.234 (66.372)	Top-5 acc 82.812 (85.499)	lr 0.00254
Train [96][730/3239]	Time 0.225 (0.621)	Data Time 0.001 (0.053)	Loss 2.6521 (2.3969)	Entropy 0.55692 (0.55577)	Top-1 acc 59.766 (66.371)	Top-5 acc 81.250 (85.491)	lr 0.00254
Train [96][740/3239]	Time 0.230 (0.619)	Data Time 0.001 (0.052)	Loss 2.3702 (2.3970)	Entropy 0.55680 (0.55578)	Top-1 acc 69.922 (66.368)	Top-5 acc 82.812 (85.495)	lr 0.00254
Train [96][750/3239]	Time 0.236 (0.616)	Data Time 0.001 (0.051)	Loss 2.1601 (2.3966)	Entropy 0.55686 (0.55580)	Top-1 acc 75.391 (66.372)	Top-5 acc 87.891 (85.497)	lr 0.00254
Train [96][760/3239]	Time 0.236 (0.613)	Data Time 0.001 (0.051)	Loss 2.6080 (2.3970)	Entropy 0.55664 (0.55581)	Top-1 acc 62.109 (66.361)	Top-5 acc 82.422 (85.497)	lr 0.00254
Train [96][770/3239]	Time 0.225 (0.611)	Data Time 0.001 (0.050)	Loss 2.5417 (2.3974)	Entropy 0.55659 (0.55582)	Top-1 acc 62.109 (66.352)	Top-5 acc 83.984 (85.501)	lr 0.00254
Train [96][780/3239]	Time 0.229 (0.608)	Data Time 0.001 (0.049)	Loss 2.2864 (2.3969)	Entropy 0.55659 (0.55583)	Top-1 acc 69.141 (66.356)	Top-5 acc 89.062 (85.501)	lr 0.00254
Train [96][790/3239]	Time 0.324 (0.606)	Data Time 0.001 (0.049)	Loss 2.3048 (2.3964)	Entropy 0.55635 (0.55584)	Top-1 acc 65.625 (66.356)	Top-5 acc 87.500 (85.516)	lr 0.00253
Train [96][800/3239]	Time 0.223 (0.603)	Data Time 0.001 (0.048)	Loss 2.3808 (2.3968)	Entropy 0.55599 (0.55584)	Top-1 acc 66.406 (66.341)	Top-5 acc 85.156 (85.508)	lr 0.00253
Train [96][810/3239]	Time 0.242 (0.601)	Data Time 0.001 (0.048)	Loss 2.2735 (2.3966)	Entropy 0.55591 (0.55585)	Top-1 acc 69.141 (66.352)	Top-5 acc 88.281 (85.510)	lr 0.00253
Train [96][820/3239]	Time 0.230 (0.599)	Data Time 0.001 (0.047)	Loss 2.3466 (2.3967)	Entropy 0.55574 (0.55585)	Top-1 acc 68.750 (66.360)	Top-5 acc 88.281 (85.510)	lr 0.00253
Train [96][830/3239]	Time 0.225 (0.597)	Data Time 0.001 (0.046)	Loss 2.1696 (2.3976)	Entropy 0.55599 (0.55584)	Top-1 acc 74.219 (66.348)	Top-5 acc 89.453 (85.497)	lr 0.00253
Train [96][840/3239]	Time 0.235 (0.595)	Data Time 0.001 (0.046)	Loss 2.3838 (2.3979)	Entropy 0.55625 (0.55585)	Top-1 acc 66.406 (66.333)	Top-5 acc 85.547 (85.494)	lr 0.00253
Train [96][850/3239]	Time 0.224 (0.593)	Data Time 0.001 (0.045)	Loss 2.2855 (2.3973)	Entropy 0.55614 (0.55585)	Top-1 acc 68.359 (66.350)	Top-5 acc 87.109 (85.503)	lr 0.00253
Train [96][860/3239]	Time 0.295 (0.592)	Data Time 0.001 (0.045)	Loss 2.2559 (2.3970)	Entropy 0.55627 (0.55586)	Top-1 acc 70.312 (66.364)	Top-5 acc 87.891 (85.506)	lr 0.00253
Train [96][870/3239]	Time 0.230 (0.591)	Data Time 0.001 (0.044)	Loss 2.3987 (2.3972)	Entropy 0.55614 (0.55586)	Top-1 acc 66.016 (66.361)	Top-5 acc 86.328 (85.501)	lr 0.00253
Train [96][880/3239]	Time 0.341 (0.589)	Data Time 0.001 (0.044)	Loss 2.2302 (2.3966)	Entropy 0.55636 (0.55586)	Top-1 acc 67.578 (66.373)	Top-5 acc 87.109 (85.507)	lr 0.00253
Train [96][890/3239]	Time 0.227 (0.587)	Data Time 0.001 (0.043)	Loss 2.5113 (2.3961)	Entropy 0.55604 (0.55587)	Top-1 acc 62.109 (66.383)	Top-5 acc 85.547 (85.513)	lr 0.00253
Train [96][900/3239]	Time 0.229 (0.585)	Data Time 0.001 (0.043)	Loss 2.3704 (2.3958)	Entropy 0.55609 (0.55587)	Top-1 acc 61.719 (66.378)	Top-5 acc 85.156 (85.517)	lr 0.00253
Train [96][910/3239]	Time 0.233 (0.583)	Data Time 0.001 (0.042)	Loss 2.3764 (2.3951)	Entropy 0.55621 (0.55587)	Top-1 acc 64.453 (66.385)	Top-5 acc 85.938 (85.531)	lr 0.00253
Train [96][920/3239]	Time 0.238 (0.581)	Data Time 0.001 (0.042)	Loss 2.3820 (2.3950)	Entropy 0.55620 (0.55588)	Top-1 acc 65.234 (66.375)	Top-5 acc 83.984 (85.530)	lr 0.00253
Train [96][930/3239]	Time 0.221 (0.580)	Data Time 0.001 (0.042)	Loss 2.7373 (2.3953)	Entropy 0.55604 (0.55588)	Top-1 acc 55.469 (66.363)	Top-5 acc 81.641 (85.533)	lr 0.00253
Train [96][940/3239]	Time 0.234 (0.578)	Data Time 0.001 (0.041)	Loss 2.4701 (2.3954)	Entropy 0.55632 (0.55588)	Top-1 acc 69.141 (66.371)	Top-5 acc 80.469 (85.529)	lr 0.00253
Train [96][950/3239]	Time 0.367 (0.577)	Data Time 0.001 (0.041)	Loss 2.4348 (2.3953)	Entropy 0.55652 (0.55589)	Top-1 acc 64.453 (66.366)	Top-5 acc 85.156 (85.533)	lr 0.00252
Train [96][960/3239]	Time 0.230 (0.575)	Data Time 0.001 (0.040)	Loss 2.3558 (2.3954)	Entropy 0.55652 (0.55589)	Top-1 acc 69.141 (66.372)	Top-5 acc 87.109 (85.531)	lr 0.00252
Train [96][970/3239]	Time 0.236 (0.573)	Data Time 0.001 (0.040)	Loss 2.3084 (2.3954)	Entropy 0.55649 (0.55590)	Top-1 acc 67.969 (66.376)	Top-5 acc 88.281 (85.530)	lr 0.00252
Train [96][980/3239]	Time 0.229 (0.572)	Data Time 0.001 (0.040)	Loss 2.4615 (2.3962)	Entropy 0.55650 (0.55591)	Top-1 acc 65.625 (66.353)	Top-5 acc 82.812 (85.515)	lr 0.00252
Train [96][990/3239]	Time 0.237 (0.570)	Data Time 0.001 (0.039)	Loss 2.1709 (2.3956)	Entropy 0.55641 (0.55591)	Top-1 acc 69.922 (66.366)	Top-5 acc 88.281 (85.528)	lr 0.00252
Train [96][1000/3239]	Time 0.237 (0.569)	Data Time 0.001 (0.039)	Loss 2.3206 (2.3951)	Entropy 0.55627 (0.55592)	Top-1 acc 67.578 (66.375)	Top-5 acc 88.672 (85.541)	lr 0.00252
Train [96][1010/3239]	Time 0.236 (0.567)	Data Time 0.001 (0.038)	Loss 2.2261 (2.3952)	Entropy 0.55625 (0.55592)	Top-1 acc 72.266 (66.370)	Top-5 acc 85.938 (85.532)	lr 0.00252
Train [96][1020/3239]	Time 0.235 (0.566)	Data Time 0.001 (0.038)	Loss 2.3579 (2.3956)	Entropy 0.55636 (0.55592)	Top-1 acc 68.359 (66.369)	Top-5 acc 85.156 (85.525)	lr 0.00252
Train [96][1030/3239]	Time 0.225 (0.564)	Data Time 0.001 (0.038)	Loss 2.3824 (2.3951)	Entropy 0.55668 (0.55593)	Top-1 acc 70.703 (66.380)	Top-5 acc 85.938 (85.528)	lr 0.00252
Train [96][1040/3239]	Time 0.243 (0.563)	Data Time 0.001 (0.037)	Loss 2.4302 (2.3949)	Entropy 0.55671 (0.55594)	Top-1 acc 64.844 (66.380)	Top-5 acc 84.766 (85.530)	lr 0.00252
Train [96][1050/3239]	Time 0.241 (0.561)	Data Time 0.001 (0.037)	Loss 2.5463 (2.3948)	Entropy 0.55654 (0.55594)	Top-1 acc 62.109 (66.389)	Top-5 acc 83.594 (85.531)	lr 0.00252
Train [96][1060/3239]	Time 0.234 (0.560)	Data Time 0.001 (0.037)	Loss 2.2638 (2.3949)	Entropy 0.55677 (0.55595)	Top-1 acc 70.703 (66.390)	Top-5 acc 86.328 (85.527)	lr 0.00252
Train [96][1070/3239]	Time 0.228 (0.558)	Data Time 0.001 (0.036)	Loss 2.3863 (2.3948)	Entropy 0.55652 (0.55596)	Top-1 acc 67.188 (66.387)	Top-5 acc 84.375 (85.528)	lr 0.00252
Train [96][1080/3239]	Time 0.232 (0.557)	Data Time 0.001 (0.036)	Loss 2.2448 (2.3948)	Entropy 0.55675 (0.55596)	Top-1 acc 71.484 (66.394)	Top-5 acc 86.719 (85.524)	lr 0.00252
Train [96][1090/3239]	Time 0.227 (0.555)	Data Time 0.001 (0.036)	Loss 2.6064 (2.3952)	Entropy 0.55665 (0.55597)	Top-1 acc 61.328 (66.387)	Top-5 acc 82.422 (85.514)	lr 0.00252
Train [96][1100/3239]	Time 0.221 (0.554)	Data Time 0.001 (0.035)	Loss 2.4643 (2.3952)	Entropy 0.55680 (0.55598)	Top-1 acc 64.453 (66.377)	Top-5 acc 84.766 (85.517)	lr 0.00252
Train [96][1110/3239]	Time 0.314 (0.553)	Data Time 0.001 (0.035)	Loss 2.2504 (2.3950)	Entropy 0.55696 (0.55598)	Top-1 acc 69.922 (66.378)	Top-5 acc 87.500 (85.519)	lr 0.00252
Train [96][1120/3239]	Time 0.247 (0.551)	Data Time 0.001 (0.035)	Loss 2.4554 (2.3949)	Entropy 0.55664 (0.55599)	Top-1 acc 65.234 (66.384)	Top-5 acc 84.766 (85.520)	lr 0.00251
Train [96][1130/3239]	Time 0.229 (0.550)	Data Time 0.001 (0.035)	Loss 2.3706 (2.3950)	Entropy 0.55665 (0.55600)	Top-1 acc 65.234 (66.380)	Top-5 acc 85.547 (85.518)	lr 0.00251
Train [96][1140/3239]	Time 0.224 (0.549)	Data Time 0.001 (0.034)	Loss 2.2695 (2.3949)	Entropy 0.55689 (0.55600)	Top-1 acc 69.531 (66.377)	Top-5 acc 88.281 (85.516)	lr 0.00251
Train [96][1150/3239]	Time 0.249 (0.548)	Data Time 0.001 (0.034)	Loss 2.2455 (2.3948)	Entropy 0.55700 (0.55601)	Top-1 acc 66.797 (66.379)	Top-5 acc 87.500 (85.522)	lr 0.00251
Train [96][1160/3239]	Time 0.219 (0.547)	Data Time 0.001 (0.034)	Loss 2.4945 (2.3949)	Entropy 0.55678 (0.55602)	Top-1 acc 60.938 (66.370)	Top-5 acc 87.500 (85.522)	lr 0.00251
Train [96][1170/3239]	Time 0.238 (0.545)	Data Time 0.001 (0.033)	Loss 2.5384 (2.3951)	Entropy 0.55663 (0.55603)	Top-1 acc 64.453 (66.356)	Top-5 acc 83.984 (85.521)	lr 0.00251
Train [96][1180/3239]	Time 0.421 (0.545)	Data Time 0.001 (0.033)	Loss 2.2904 (2.3950)	Entropy 0.55663 (0.55603)	Top-1 acc 70.312 (66.355)	Top-5 acc 89.062 (85.529)	lr 0.00251
Train [96][1190/3239]	Time 0.235 (0.544)	Data Time 0.001 (0.033)	Loss 2.3469 (2.3951)	Entropy 0.55692 (0.55604)	Top-1 acc 68.359 (66.349)	Top-5 acc 85.938 (85.533)	lr 0.00251
Train [96][1200/3239]	Time 0.228 (0.543)	Data Time 0.001 (0.033)	Loss 2.1502 (2.3946)	Entropy 0.55704 (0.55605)	Top-1 acc 72.656 (66.362)	Top-5 acc 90.625 (85.545)	lr 0.00251
Train [96][1210/3239]	Time 0.225 (0.542)	Data Time 0.001 (0.032)	Loss 2.4435 (2.3947)	Entropy 0.55694 (0.55605)	Top-1 acc 67.969 (66.359)	Top-5 acc 87.500 (85.546)	lr 0.00251
Train [96][1220/3239]	Time 0.226 (0.541)	Data Time 0.001 (0.032)	Loss 2.5031 (2.3953)	Entropy 0.55718 (0.55606)	Top-1 acc 63.672 (66.342)	Top-5 acc 82.812 (85.534)	lr 0.00251
Train [96][1230/3239]	Time 0.233 (0.540)	Data Time 0.001 (0.032)	Loss 2.1700 (2.3953)	Entropy 0.55726 (0.55607)	Top-1 acc 70.703 (66.347)	Top-5 acc 90.625 (85.532)	lr 0.00251
Train [96][1240/3239]	Time 0.229 (0.539)	Data Time 0.001 (0.032)	Loss 2.3337 (2.3948)	Entropy 0.55711 (0.55608)	Top-1 acc 68.359 (66.361)	Top-5 acc 87.500 (85.540)	lr 0.00251
Train [96][1250/3239]	Time 0.250 (0.538)	Data Time 0.001 (0.031)	Loss 2.3815 (2.3942)	Entropy 0.55733 (0.55609)	Top-1 acc 66.797 (66.373)	Top-5 acc 86.719 (85.549)	lr 0.00251
Train [96][1260/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.031)	Loss 2.3030 (2.3944)	Entropy 0.55723 (0.55610)	Top-1 acc 69.141 (66.368)	Top-5 acc 86.719 (85.550)	lr 0.00251
Train [96][1270/3239]	Time 0.318 (0.535)	Data Time 0.001 (0.031)	Loss 2.2994 (2.3944)	Entropy 0.55750 (0.55611)	Top-1 acc 66.797 (66.364)	Top-5 acc 89.062 (85.551)	lr 0.00251
Train [96][1280/3239]	Time 0.235 (0.535)	Data Time 0.002 (0.031)	Loss 2.4463 (2.3948)	Entropy 0.55778 (0.55612)	Top-1 acc 65.625 (66.353)	Top-5 acc 83.594 (85.546)	lr 0.00250
Train [96][1290/3239]	Time 0.229 (0.534)	Data Time 0.001 (0.030)	Loss 2.4637 (2.3949)	Entropy 0.55813 (0.55613)	Top-1 acc 62.500 (66.351)	Top-5 acc 83.984 (85.543)	lr 0.00250
Train [96][1300/3239]	Time 0.222 (0.533)	Data Time 0.001 (0.030)	Loss 2.4936 (2.3952)	Entropy 0.55800 (0.55615)	Top-1 acc 63.281 (66.340)	Top-5 acc 85.156 (85.538)	lr 0.00250
Train [96][1310/3239]	Time 0.229 (0.532)	Data Time 0.001 (0.030)	Loss 2.4167 (2.3954)	Entropy 0.55815 (0.55616)	Top-1 acc 68.359 (66.337)	Top-5 acc 82.812 (85.537)	lr 0.00250
Train [96][1320/3239]	Time 0.256 (0.531)	Data Time 0.001 (0.030)	Loss 2.2412 (2.3957)	Entropy 0.55821 (0.55618)	Top-1 acc 67.188 (66.329)	Top-5 acc 88.281 (85.531)	lr 0.00250
Train [96][1330/3239]	Time 0.304 (0.571)	Data Time 0.028 (0.030)	Loss 2.7601 (2.3955)	Entropy 0.55797 (0.55619)	Top-1 acc 59.766 (66.335)	Top-5 acc 77.344 (85.534)	lr 0.00250
Train [96][1340/3239]	Time 0.325 (0.570)	Data Time 0.002 (0.029)	Loss 2.2846 (2.3953)	Entropy 0.55808 (0.55620)	Top-1 acc 69.531 (66.339)	Top-5 acc 87.109 (85.539)	lr 0.00250
Train [96][1350/3239]	Time 0.265 (0.569)	Data Time 0.001 (0.029)	Loss 2.2197 (2.3952)	Entropy 0.55810 (0.55622)	Top-1 acc 69.922 (66.343)	Top-5 acc 87.500 (85.536)	lr 0.00250
Train [96][1360/3239]	Time 0.234 (0.568)	Data Time 0.001 (0.029)	Loss 2.1950 (2.3951)	Entropy 0.55776 (0.55623)	Top-1 acc 71.094 (66.347)	Top-5 acc 89.453 (85.542)	lr 0.00250
Train [96][1370/3239]	Time 0.283 (0.567)	Data Time 0.002 (0.029)	Loss 2.2823 (2.3943)	Entropy 0.55793 (0.55624)	Top-1 acc 69.141 (66.364)	Top-5 acc 88.672 (85.560)	lr 0.00250
Train [96][1380/3239]	Time 0.241 (0.567)	Data Time 0.002 (0.029)	Loss 2.3880 (2.3940)	Entropy 0.55804 (0.55626)	Top-1 acc 62.891 (66.376)	Top-5 acc 87.109 (85.569)	lr 0.00250
Train [96][1390/3239]	Time 0.241 (0.566)	Data Time 0.001 (0.028)	Loss 2.3641 (2.3941)	Entropy 0.55794 (0.55627)	Top-1 acc 64.453 (66.373)	Top-5 acc 85.938 (85.565)	lr 0.00250
Train [96][1400/3239]	Time 0.239 (0.565)	Data Time 0.001 (0.028)	Loss 2.4149 (2.3941)	Entropy 0.55797 (0.55628)	Top-1 acc 66.797 (66.374)	Top-5 acc 84.375 (85.565)	lr 0.00250
Train [96][1410/3239]	Time 0.238 (0.564)	Data Time 0.001 (0.028)	Loss 2.3939 (2.3941)	Entropy 0.55797 (0.55629)	Top-1 acc 62.109 (66.373)	Top-5 acc 85.547 (85.566)	lr 0.00250
Train [96][1420/3239]	Time 0.230 (0.563)	Data Time 0.001 (0.028)	Loss 2.4322 (2.3937)	Entropy 0.55778 (0.55630)	Top-1 acc 66.797 (66.379)	Top-5 acc 85.938 (85.572)	lr 0.00250
Train [96][1430/3239]	Time 0.320 (0.562)	Data Time 0.001 (0.028)	Loss 2.4120 (2.3940)	Entropy 0.55814 (0.55632)	Top-1 acc 69.141 (66.376)	Top-5 acc 85.156 (85.568)	lr 0.00250
Train [96][1440/3239]	Time 0.222 (0.561)	Data Time 0.001 (0.028)	Loss 2.5227 (2.3936)	Entropy 0.55796 (0.55633)	Top-1 acc 62.891 (66.388)	Top-5 acc 84.766 (85.572)	lr 0.00250
Train [96][1450/3239]	Time 0.229 (0.560)	Data Time 0.001 (0.027)	Loss 2.3651 (2.3937)	Entropy 0.55777 (0.55634)	Top-1 acc 67.188 (66.387)	Top-5 acc 84.766 (85.571)	lr 0.00249
Train [96][1460/3239]	Time 0.232 (0.559)	Data Time 0.001 (0.027)	Loss 2.2759 (2.3939)	Entropy 0.55756 (0.55635)	Top-1 acc 70.703 (66.382)	Top-5 acc 86.719 (85.563)	lr 0.00249
Train [96][1470/3239]	Time 0.238 (0.558)	Data Time 0.001 (0.027)	Loss 2.5004 (2.3943)	Entropy 0.55796 (0.55636)	Top-1 acc 66.406 (66.371)	Top-5 acc 82.422 (85.554)	lr 0.00249
Train [96][1480/3239]	Time 0.218 (0.557)	Data Time 0.001 (0.027)	Loss 3.0307 (2.3950)	Entropy 0.55777 (0.55637)	Top-1 acc 54.297 (66.351)	Top-5 acc 73.438 (85.540)	lr 0.00249
Train [96][1490/3239]	Time 0.235 (0.556)	Data Time 0.001 (0.027)	Loss 2.3499 (2.3949)	Entropy 0.55817 (0.55638)	Top-1 acc 69.141 (66.358)	Top-5 acc 85.547 (85.547)	lr 0.00249
Train [96][1500/3239]	Time 0.330 (0.555)	Data Time 0.001 (0.026)	Loss 2.4182 (2.3947)	Entropy 0.55827 (0.55639)	Top-1 acc 63.672 (66.358)	Top-5 acc 83.984 (85.550)	lr 0.00249
Train [96][1510/3239]	Time 0.243 (0.554)	Data Time 0.002 (0.026)	Loss 2.3290 (2.3950)	Entropy 0.55820 (0.55640)	Top-1 acc 68.359 (66.358)	Top-5 acc 84.375 (85.545)	lr 0.00249
Train [96][1520/3239]	Time 0.226 (0.553)	Data Time 0.001 (0.026)	Loss 2.3533 (2.3951)	Entropy 0.55789 (0.55641)	Top-1 acc 67.969 (66.357)	Top-5 acc 84.766 (85.547)	lr 0.00249
Train [96][1530/3239]	Time 0.255 (0.552)	Data Time 0.001 (0.026)	Loss 2.4883 (2.3950)	Entropy 0.55816 (0.55642)	Top-1 acc 62.891 (66.359)	Top-5 acc 84.766 (85.552)	lr 0.00249
Train [96][1540/3239]	Time 0.221 (0.551)	Data Time 0.001 (0.026)	Loss 2.3812 (2.3950)	Entropy 0.55831 (0.55644)	Top-1 acc 65.625 (66.357)	Top-5 acc 85.547 (85.551)	lr 0.00249
Train [96][1550/3239]	Time 0.234 (0.551)	Data Time 0.001 (0.026)	Loss 2.2910 (2.3949)	Entropy 0.55840 (0.55645)	Top-1 acc 67.969 (66.356)	Top-5 acc 87.891 (85.554)	lr 0.00249
Train [96][1560/3239]	Time 0.218 (0.550)	Data Time 0.001 (0.026)	Loss 2.4905 (2.3953)	Entropy 0.55865 (0.55646)	Top-1 acc 64.062 (66.348)	Top-5 acc 81.641 (85.545)	lr 0.00249
Train [96][1570/3239]	Time 0.228 (0.549)	Data Time 0.001 (0.025)	Loss 2.3444 (2.3953)	Entropy 0.55882 (0.55647)	Top-1 acc 67.188 (66.349)	Top-5 acc 87.109 (85.544)	lr 0.00249
Train [96][1580/3239]	Time 0.225 (0.548)	Data Time 0.001 (0.025)	Loss 2.3536 (2.3954)	Entropy 0.55886 (0.55649)	Top-1 acc 69.141 (66.350)	Top-5 acc 85.938 (85.544)	lr 0.00249
Train [96][1590/3239]	Time 0.265 (0.547)	Data Time 0.001 (0.025)	Loss 2.1882 (2.3959)	Entropy 0.55894 (0.55651)	Top-1 acc 67.969 (66.335)	Top-5 acc 90.234 (85.531)	lr 0.00249
Train [96][1600/3239]	Time 0.221 (0.546)	Data Time 0.001 (0.025)	Loss 2.4697 (2.3960)	Entropy 0.55909 (0.55652)	Top-1 acc 60.547 (66.325)	Top-5 acc 85.547 (85.532)	lr 0.00249
Train [96][1610/3239]	Time 0.235 (0.546)	Data Time 0.001 (0.025)	Loss 2.3108 (2.3960)	Entropy 0.55848 (0.55654)	Top-1 acc 68.359 (66.327)	Top-5 acc 87.500 (85.529)	lr 0.00248
Train [96][1620/3239]	Time 0.272 (0.545)	Data Time 0.001 (0.025)	Loss 2.6815 (2.3963)	Entropy 0.55834 (0.55655)	Top-1 acc 59.375 (66.314)	Top-5 acc 80.078 (85.525)	lr 0.00248
Train [96][1630/3239]	Time 0.238 (0.544)	Data Time 0.001 (0.024)	Loss 2.2318 (2.3963)	Entropy 0.55828 (0.55656)	Top-1 acc 71.484 (66.314)	Top-5 acc 85.156 (85.527)	lr 0.00248
Train [96][1640/3239]	Time 0.248 (0.543)	Data Time 0.001 (0.024)	Loss 2.5465 (2.3964)	Entropy 0.55825 (0.55657)	Top-1 acc 62.500 (66.305)	Top-5 acc 81.641 (85.526)	lr 0.00248
Train [96][1650/3239]	Time 0.269 (0.543)	Data Time 0.001 (0.024)	Loss 2.3741 (2.3960)	Entropy 0.55856 (0.55658)	Top-1 acc 66.016 (66.313)	Top-5 acc 84.375 (85.527)	lr 0.00248
Train [96][1660/3239]	Time 0.329 (0.542)	Data Time 0.001 (0.024)	Loss 2.3669 (2.3960)	Entropy 0.55904 (0.55659)	Top-1 acc 64.844 (66.312)	Top-5 acc 86.328 (85.529)	lr 0.00248
Train [96][1670/3239]	Time 0.221 (0.541)	Data Time 0.001 (0.024)	Loss 2.5474 (2.3961)	Entropy 0.55889 (0.55661)	Top-1 acc 64.844 (66.310)	Top-5 acc 80.078 (85.522)	lr 0.00248
Train [96][1680/3239]	Time 0.228 (0.540)	Data Time 0.001 (0.024)	Loss 2.4369 (2.3959)	Entropy 0.55878 (0.55662)	Top-1 acc 66.406 (66.312)	Top-5 acc 84.766 (85.522)	lr 0.00248
Train [96][1690/3239]	Time 0.271 (0.540)	Data Time 0.001 (0.024)	Loss 2.5391 (2.3956)	Entropy 0.55857 (0.55663)	Top-1 acc 61.719 (66.321)	Top-5 acc 80.469 (85.530)	lr 0.00248
Train [96][1700/3239]	Time 0.224 (0.540)	Data Time 0.001 (0.024)	Loss 2.4617 (2.3960)	Entropy 0.55836 (0.55664)	Top-1 acc 63.281 (66.309)	Top-5 acc 82.031 (85.523)	lr 0.00248
Train [96][1710/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.023)	Loss 2.3837 (2.3963)	Entropy 0.55825 (0.55665)	Top-1 acc 64.062 (66.297)	Top-5 acc 83.203 (85.516)	lr 0.00248
Train [96][1720/3239]	Time 0.223 (0.538)	Data Time 0.001 (0.023)	Loss 2.2203 (2.3962)	Entropy 0.55867 (0.55666)	Top-1 acc 71.484 (66.298)	Top-5 acc 87.500 (85.518)	lr 0.00248
Train [96][1730/3239]	Time 0.324 (0.538)	Data Time 0.001 (0.023)	Loss 2.3287 (2.3960)	Entropy 0.55899 (0.55668)	Top-1 acc 69.922 (66.303)	Top-5 acc 87.500 (85.521)	lr 0.00248
Train [96][1740/3239]	Time 0.218 (0.537)	Data Time 0.001 (0.023)	Loss 2.6751 (2.3961)	Entropy 0.55924 (0.55669)	Top-1 acc 57.031 (66.301)	Top-5 acc 82.031 (85.520)	lr 0.00248
Train [96][1750/3239]	Time 0.220 (0.536)	Data Time 0.001 (0.023)	Loss 2.2950 (2.3959)	Entropy 0.55935 (0.55670)	Top-1 acc 64.844 (66.305)	Top-5 acc 88.672 (85.525)	lr 0.00248
Train [96][1760/3239]	Time 0.226 (0.535)	Data Time 0.001 (0.023)	Loss 2.4529 (2.3962)	Entropy 0.55971 (0.55672)	Top-1 acc 62.109 (66.299)	Top-5 acc 84.766 (85.522)	lr 0.00248
Train [96][1770/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.023)	Loss 2.4039 (2.3964)	Entropy 0.55929 (0.55674)	Top-1 acc 66.016 (66.292)	Top-5 acc 86.328 (85.518)	lr 0.00248
Train [96][1780/3239]	Time 0.225 (0.534)	Data Time 0.001 (0.023)	Loss 2.3839 (2.3965)	Entropy 0.55902 (0.55675)	Top-1 acc 66.016 (66.291)	Top-5 acc 85.547 (85.517)	lr 0.00247
Train [96][1790/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.022)	Loss 2.3024 (2.3962)	Entropy 0.55903 (0.55676)	Top-1 acc 66.406 (66.296)	Top-5 acc 88.672 (85.521)	lr 0.00247
Train [96][1800/3239]	Time 0.284 (0.533)	Data Time 0.001 (0.022)	Loss 2.2904 (2.3966)	Entropy 0.55911 (0.55678)	Top-1 acc 69.141 (66.282)	Top-5 acc 87.891 (85.513)	lr 0.00247
Train [96][1810/3239]	Time 0.279 (0.533)	Data Time 0.001 (0.022)	Loss 2.2286 (2.3966)	Entropy 0.55941 (0.55679)	Top-1 acc 70.703 (66.285)	Top-5 acc 90.234 (85.513)	lr 0.00247
Train [96][1820/3239]	Time 0.327 (0.532)	Data Time 0.001 (0.022)	Loss 2.4970 (2.3965)	Entropy 0.55939 (0.55680)	Top-1 acc 62.500 (66.290)	Top-5 acc 83.203 (85.513)	lr 0.00247
Train [96][1830/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.022)	Loss 2.3259 (2.3963)	Entropy 0.55907 (0.55682)	Top-1 acc 69.141 (66.294)	Top-5 acc 85.938 (85.517)	lr 0.00247
Train [96][1840/3239]	Time 0.230 (0.531)	Data Time 0.001 (0.022)	Loss 2.4931 (2.3963)	Entropy 0.55857 (0.55683)	Top-1 acc 62.109 (66.294)	Top-5 acc 83.984 (85.519)	lr 0.00247
Train [96][1850/3239]	Time 0.234 (0.530)	Data Time 0.001 (0.022)	Loss 2.3160 (2.3964)	Entropy 0.55857 (0.55684)	Top-1 acc 69.922 (66.295)	Top-5 acc 85.938 (85.518)	lr 0.00247
Train [96][1860/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.022)	Loss 2.3741 (2.3961)	Entropy 0.55839 (0.55685)	Top-1 acc 70.312 (66.304)	Top-5 acc 84.766 (85.517)	lr 0.00247
Train [96][1870/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.022)	Loss 2.5991 (2.3962)	Entropy 0.55814 (0.55685)	Top-1 acc 62.500 (66.300)	Top-5 acc 82.812 (85.515)	lr 0.00247
Train [96][1880/3239]	Time 0.226 (0.529)	Data Time 0.001 (0.021)	Loss 2.4740 (2.3965)	Entropy 0.55829 (0.55686)	Top-1 acc 65.625 (66.296)	Top-5 acc 82.812 (85.509)	lr 0.00247
Train [96][1890/3239]	Time 0.320 (0.528)	Data Time 0.001 (0.021)	Loss 2.5132 (2.3967)	Entropy 0.55813 (0.55687)	Top-1 acc 64.453 (66.296)	Top-5 acc 85.938 (85.507)	lr 0.00247
Train [96][1900/3239]	Time 0.236 (0.528)	Data Time 0.001 (0.021)	Loss 2.3430 (2.3970)	Entropy 0.55833 (0.55687)	Top-1 acc 68.359 (66.283)	Top-5 acc 85.156 (85.505)	lr 0.00247
Train [96][1910/3239]	Time 0.239 (0.527)	Data Time 0.001 (0.021)	Loss 2.4852 (2.3970)	Entropy 0.55849 (0.55688)	Top-1 acc 66.797 (66.285)	Top-5 acc 83.594 (85.507)	lr 0.00247
Train [96][1920/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.021)	Loss 2.4969 (2.3971)	Entropy 0.55813 (0.55689)	Top-1 acc 65.625 (66.287)	Top-5 acc 81.641 (85.503)	lr 0.00247
Train [96][1930/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.021)	Loss 2.3748 (2.3970)	Entropy 0.55805 (0.55690)	Top-1 acc 64.844 (66.293)	Top-5 acc 85.547 (85.508)	lr 0.00247
Train [96][1940/3239]	Time 0.224 (0.525)	Data Time 0.001 (0.021)	Loss 2.4396 (2.3967)	Entropy 0.55841 (0.55690)	Top-1 acc 66.016 (66.301)	Top-5 acc 85.547 (85.512)	lr 0.00247
Train [96][1950/3239]	Time 0.254 (0.525)	Data Time 0.001 (0.021)	Loss 2.2433 (2.3965)	Entropy 0.55826 (0.55691)	Top-1 acc 71.094 (66.308)	Top-5 acc 87.891 (85.517)	lr 0.00246
Train [96][1960/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.021)	Loss 2.3356 (2.3967)	Entropy 0.55842 (0.55692)	Top-1 acc 69.531 (66.304)	Top-5 acc 85.938 (85.512)	lr 0.00246
Train [96][1970/3239]	Time 0.224 (0.524)	Data Time 0.001 (0.021)	Loss 2.5957 (2.3970)	Entropy 0.55849 (0.55692)	Top-1 acc 64.453 (66.300)	Top-5 acc 81.641 (85.506)	lr 0.00246
Train [96][1980/3239]	Time 0.308 (0.523)	Data Time 0.001 (0.020)	Loss 2.4614 (2.3971)	Entropy 0.55829 (0.55693)	Top-1 acc 64.453 (66.299)	Top-5 acc 84.375 (85.503)	lr 0.00246
Train [96][1990/3239]	Time 0.345 (0.551)	Data Time 0.002 (0.020)	Loss 2.5328 (2.3970)	Entropy 0.55846 (0.55694)	Top-1 acc 65.234 (66.295)	Top-5 acc 81.641 (85.504)	lr 0.00246
Train [96][2000/3239]	Time 0.240 (0.551)	Data Time 0.002 (0.020)	Loss 2.2924 (2.3969)	Entropy 0.55870 (0.55695)	Top-1 acc 70.703 (66.290)	Top-5 acc 88.281 (85.509)	lr 0.00246
Train [96][2010/3239]	Time 0.236 (0.550)	Data Time 0.001 (0.020)	Loss 2.4372 (2.3970)	Entropy 0.55892 (0.55696)	Top-1 acc 68.359 (66.292)	Top-5 acc 85.156 (85.504)	lr 0.00246
Train [96][2020/3239]	Time 0.244 (0.549)	Data Time 0.001 (0.020)	Loss 2.3155 (2.3972)	Entropy 0.55886 (0.55697)	Top-1 acc 69.141 (66.287)	Top-5 acc 87.500 (85.501)	lr 0.00246
Train [96][2030/3239]	Time 0.246 (0.549)	Data Time 0.001 (0.020)	Loss 2.5909 (2.3976)	Entropy 0.55872 (0.55698)	Top-1 acc 62.891 (66.276)	Top-5 acc 82.031 (85.494)	lr 0.00246
Train [96][2040/3239]	Time 0.228 (0.548)	Data Time 0.001 (0.020)	Loss 2.3556 (2.3973)	Entropy 0.55881 (0.55698)	Top-1 acc 69.141 (66.286)	Top-5 acc 86.719 (85.498)	lr 0.00246
Train [96][2050/3239]	Time 0.323 (0.547)	Data Time 0.001 (0.020)	Loss 2.3743 (2.3971)	Entropy 0.55858 (0.55699)	Top-1 acc 67.188 (66.294)	Top-5 acc 85.156 (85.500)	lr 0.00246
Train [96][2060/3239]	Time 0.257 (0.547)	Data Time 0.001 (0.020)	Loss 2.3065 (2.3972)	Entropy 0.55857 (0.55700)	Top-1 acc 69.922 (66.288)	Top-5 acc 84.766 (85.496)	lr 0.00246
Train [96][2070/3239]	Time 0.233 (0.546)	Data Time 0.004 (0.020)	Loss 2.4143 (2.3973)	Entropy 0.55841 (0.55701)	Top-1 acc 63.281 (66.286)	Top-5 acc 84.766 (85.494)	lr 0.00246
Train [96][2080/3239]	Time 0.237 (0.546)	Data Time 0.001 (0.020)	Loss 2.7283 (2.3977)	Entropy 0.55832 (0.55701)	Top-1 acc 57.812 (66.278)	Top-5 acc 79.688 (85.490)	lr 0.00246
Train [96][2090/3239]	Time 0.230 (0.545)	Data Time 0.001 (0.019)	Loss 2.4004 (2.3976)	Entropy 0.55887 (0.55702)	Top-1 acc 63.672 (66.284)	Top-5 acc 83.984 (85.489)	lr 0.00246
Train [96][2100/3239]	Time 0.238 (0.544)	Data Time 0.001 (0.019)	Loss 2.2994 (2.3977)	Entropy 0.55896 (0.55703)	Top-1 acc 65.625 (66.276)	Top-5 acc 87.109 (85.493)	lr 0.00246
Train [96][2110/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.019)	Loss 2.3136 (2.3977)	Entropy 0.55897 (0.55704)	Top-1 acc 65.625 (66.271)	Top-5 acc 86.719 (85.495)	lr 0.00245
Train [96][2120/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.019)	Loss 2.3630 (2.3978)	Entropy 0.55853 (0.55705)	Top-1 acc 64.453 (66.268)	Top-5 acc 88.281 (85.494)	lr 0.00245
Train [96][2130/3239]	Time 0.233 (0.543)	Data Time 0.001 (0.019)	Loss 2.3937 (2.3979)	Entropy 0.55861 (0.55706)	Top-1 acc 64.453 (66.267)	Top-5 acc 86.719 (85.494)	lr 0.00245
Train [96][2140/3239]	Time 0.307 (0.542)	Data Time 0.001 (0.019)	Loss 2.7095 (2.3978)	Entropy 0.55852 (0.55706)	Top-1 acc 57.031 (66.269)	Top-5 acc 81.250 (85.493)	lr 0.00245
Train [96][2150/3239]	Time 0.224 (0.541)	Data Time 0.001 (0.019)	Loss 2.1709 (2.3976)	Entropy 0.55865 (0.55707)	Top-1 acc 73.828 (66.276)	Top-5 acc 91.406 (85.495)	lr 0.00245
Train [96][2160/3239]	Time 0.219 (0.541)	Data Time 0.001 (0.019)	Loss 2.4735 (2.3977)	Entropy 0.55861 (0.55708)	Top-1 acc 61.719 (66.269)	Top-5 acc 85.547 (85.497)	lr 0.00245
Train [96][2170/3239]	Time 0.229 (0.540)	Data Time 0.001 (0.019)	Loss 2.2497 (2.3976)	Entropy 0.55873 (0.55708)	Top-1 acc 71.094 (66.270)	Top-5 acc 87.500 (85.498)	lr 0.00245
Train [96][2180/3239]	Time 0.233 (0.540)	Data Time 0.001 (0.019)	Loss 2.6526 (2.3976)	Entropy 0.55854 (0.55709)	Top-1 acc 64.844 (66.272)	Top-5 acc 80.469 (85.501)	lr 0.00245
Train [96][2190/3239]	Time 0.237 (0.539)	Data Time 0.001 (0.019)	Loss 2.4361 (2.3978)	Entropy 0.55843 (0.55710)	Top-1 acc 66.406 (66.267)	Top-5 acc 85.156 (85.497)	lr 0.00245
Train [96][2200/3239]	Time 0.235 (0.538)	Data Time 0.001 (0.019)	Loss 2.4252 (2.3980)	Entropy 0.55820 (0.55710)	Top-1 acc 67.188 (66.262)	Top-5 acc 83.203 (85.492)	lr 0.00245
Train [96][2210/3239]	Time 0.329 (0.538)	Data Time 0.001 (0.018)	Loss 2.2758 (2.3980)	Entropy 0.55813 (0.55711)	Top-1 acc 68.750 (66.261)	Top-5 acc 88.281 (85.493)	lr 0.00245
Train [96][2220/3239]	Time 0.226 (0.537)	Data Time 0.001 (0.018)	Loss 2.3508 (2.3979)	Entropy 0.55795 (0.55711)	Top-1 acc 67.969 (66.265)	Top-5 acc 85.547 (85.492)	lr 0.00245
Train [96][2230/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.018)	Loss 2.3601 (2.3978)	Entropy 0.55821 (0.55712)	Top-1 acc 67.188 (66.268)	Top-5 acc 84.375 (85.497)	lr 0.00245
Train [96][2240/3239]	Time 0.224 (0.536)	Data Time 0.001 (0.018)	Loss 2.3418 (2.3976)	Entropy 0.55793 (0.55712)	Top-1 acc 66.016 (66.271)	Top-5 acc 85.938 (85.498)	lr 0.00245
Train [96][2250/3239]	Time 0.231 (0.536)	Data Time 0.002 (0.018)	Loss 2.2017 (2.3973)	Entropy 0.55765 (0.55713)	Top-1 acc 71.094 (66.275)	Top-5 acc 88.672 (85.502)	lr 0.00245
Train [96][2260/3239]	Time 0.249 (0.535)	Data Time 0.001 (0.018)	Loss 2.1182 (2.3971)	Entropy 0.55801 (0.55713)	Top-1 acc 72.656 (66.285)	Top-5 acc 89.844 (85.508)	lr 0.00245
Train [96][2270/3239]	Time 0.242 (0.535)	Data Time 0.001 (0.018)	Loss 2.5949 (2.3973)	Entropy 0.55806 (0.55713)	Top-1 acc 60.156 (66.282)	Top-5 acc 83.594 (85.506)	lr 0.00245
Train [96][2280/3239]	Time 0.232 (0.534)	Data Time 0.001 (0.018)	Loss 2.3492 (2.3973)	Entropy 0.55828 (0.55714)	Top-1 acc 66.406 (66.282)	Top-5 acc 86.328 (85.505)	lr 0.00244
Train [96][2290/3239]	Time 0.239 (0.534)	Data Time 0.001 (0.018)	Loss 2.1483 (2.3973)	Entropy 0.55861 (0.55714)	Top-1 acc 74.609 (66.282)	Top-5 acc 89.844 (85.509)	lr 0.00244
Train [96][2300/3239]	Time 0.279 (0.533)	Data Time 0.001 (0.018)	Loss 2.2362 (2.3972)	Entropy 0.55863 (0.55715)	Top-1 acc 67.578 (66.284)	Top-5 acc 89.453 (85.507)	lr 0.00244
Train [96][2310/3239]	Time 0.248 (0.533)	Data Time 0.001 (0.018)	Loss 2.2338 (2.3970)	Entropy 0.55853 (0.55716)	Top-1 acc 69.531 (66.287)	Top-5 acc 88.672 (85.513)	lr 0.00244
Train [96][2320/3239]	Time 0.226 (0.533)	Data Time 0.001 (0.018)	Loss 2.3409 (2.3969)	Entropy 0.55876 (0.55716)	Top-1 acc 66.016 (66.291)	Top-5 acc 85.547 (85.514)	lr 0.00244
Train [96][2330/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.018)	Loss 2.5772 (2.3968)	Entropy 0.55889 (0.55717)	Top-1 acc 59.375 (66.296)	Top-5 acc 83.594 (85.516)	lr 0.00244
Train [96][2340/3239]	Time 0.230 (0.532)	Data Time 0.001 (0.018)	Loss 2.4040 (2.3969)	Entropy 0.55884 (0.55718)	Top-1 acc 65.625 (66.291)	Top-5 acc 83.203 (85.517)	lr 0.00244
Train [96][2350/3239]	Time 0.227 (0.531)	Data Time 0.001 (0.017)	Loss 2.3301 (2.3968)	Entropy 0.55861 (0.55718)	Top-1 acc 68.750 (66.295)	Top-5 acc 87.109 (85.520)	lr 0.00244
Train [96][2360/3239]	Time 0.240 (0.531)	Data Time 0.001 (0.017)	Loss 2.3857 (2.3966)	Entropy 0.55872 (0.55719)	Top-1 acc 69.141 (66.303)	Top-5 acc 84.766 (85.521)	lr 0.00244
Train [96][2370/3239]	Time 0.370 (0.530)	Data Time 0.001 (0.017)	Loss 2.2854 (2.3965)	Entropy 0.55874 (0.55720)	Top-1 acc 67.969 (66.305)	Top-5 acc 87.500 (85.522)	lr 0.00244
Train [96][2380/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.017)	Loss 2.6245 (2.3968)	Entropy 0.55870 (0.55720)	Top-1 acc 58.203 (66.297)	Top-5 acc 81.250 (85.518)	lr 0.00244
Train [96][2390/3239]	Time 0.229 (0.529)	Data Time 0.001 (0.017)	Loss 2.4424 (2.3971)	Entropy 0.55863 (0.55721)	Top-1 acc 63.672 (66.296)	Top-5 acc 83.984 (85.514)	lr 0.00244
Train [96][2400/3239]	Time 0.226 (0.529)	Data Time 0.001 (0.017)	Loss 2.3991 (2.3970)	Entropy 0.55864 (0.55721)	Top-1 acc 67.969 (66.295)	Top-5 acc 86.328 (85.517)	lr 0.00244
Train [96][2410/3239]	Time 0.224 (0.528)	Data Time 0.001 (0.017)	Loss 2.3262 (2.3969)	Entropy 0.55857 (0.55722)	Top-1 acc 67.578 (66.297)	Top-5 acc 85.547 (85.520)	lr 0.00244
Train [96][2420/3239]	Time 0.227 (0.528)	Data Time 0.001 (0.017)	Loss 2.4093 (2.3970)	Entropy 0.55840 (0.55723)	Top-1 acc 64.453 (66.294)	Top-5 acc 85.547 (85.517)	lr 0.00244
Train [96][2430/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.017)	Loss 2.4538 (2.3968)	Entropy 0.55837 (0.55723)	Top-1 acc 62.109 (66.295)	Top-5 acc 85.938 (85.520)	lr 0.00244
Train [96][2440/3239]	Time 0.326 (0.527)	Data Time 0.001 (0.017)	Loss 2.3496 (2.3967)	Entropy 0.55835 (0.55724)	Top-1 acc 65.234 (66.299)	Top-5 acc 85.938 (85.522)	lr 0.00243
Train [96][2450/3239]	Time 0.222 (0.526)	Data Time 0.001 (0.017)	Loss 2.4141 (2.3968)	Entropy 0.55842 (0.55724)	Top-1 acc 67.578 (66.299)	Top-5 acc 85.547 (85.522)	lr 0.00243
Train [96][2460/3239]	Time 0.220 (0.526)	Data Time 0.001 (0.017)	Loss 2.3507 (2.3969)	Entropy 0.55804 (0.55724)	Top-1 acc 66.016 (66.295)	Top-5 acc 87.500 (85.519)	lr 0.00243
Train [96][2470/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.017)	Loss 2.4198 (2.3969)	Entropy 0.55769 (0.55725)	Top-1 acc 66.406 (66.292)	Top-5 acc 85.938 (85.521)	lr 0.00243
Train [96][2480/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.017)	Loss 2.3206 (2.3969)	Entropy 0.55766 (0.55725)	Top-1 acc 64.453 (66.292)	Top-5 acc 88.281 (85.522)	lr 0.00243
Train [96][2490/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.017)	Loss 2.6695 (2.3969)	Entropy 0.55785 (0.55725)	Top-1 acc 62.500 (66.291)	Top-5 acc 79.688 (85.522)	lr 0.00243
Train [96][2500/3239]	Time 0.219 (0.524)	Data Time 0.001 (0.016)	Loss 2.5979 (2.3968)	Entropy 0.55794 (0.55725)	Top-1 acc 60.156 (66.291)	Top-5 acc 79.688 (85.523)	lr 0.00243
Train [96][2510/3239]	Time 0.225 (0.523)	Data Time 0.001 (0.016)	Loss 2.3197 (2.3966)	Entropy 0.55770 (0.55726)	Top-1 acc 66.016 (66.294)	Top-5 acc 86.719 (85.526)	lr 0.00243
Train [96][2520/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.016)	Loss 2.4616 (2.3965)	Entropy 0.55784 (0.55726)	Top-1 acc 64.453 (66.295)	Top-5 acc 82.812 (85.526)	lr 0.00243
Train [96][2530/3239]	Time 0.333 (0.522)	Data Time 0.001 (0.016)	Loss 2.4662 (2.3965)	Entropy 0.55771 (0.55726)	Top-1 acc 64.453 (66.293)	Top-5 acc 85.547 (85.526)	lr 0.00243
Train [96][2540/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.016)	Loss 2.3107 (2.3964)	Entropy 0.55789 (0.55726)	Top-1 acc 69.141 (66.298)	Top-5 acc 88.672 (85.527)	lr 0.00243
Train [96][2550/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.016)	Loss 2.3337 (2.3963)	Entropy 0.55819 (0.55726)	Top-1 acc 67.969 (66.297)	Top-5 acc 87.500 (85.530)	lr 0.00243
Train [96][2560/3239]	Time 0.219 (0.521)	Data Time 0.001 (0.016)	Loss 2.5921 (2.3964)	Entropy 0.55807 (0.55727)	Top-1 acc 62.500 (66.296)	Top-5 acc 81.250 (85.531)	lr 0.00243
Train [96][2570/3239]	Time 0.263 (0.521)	Data Time 0.001 (0.016)	Loss 2.4591 (2.3964)	Entropy 0.55797 (0.55727)	Top-1 acc 64.453 (66.297)	Top-5 acc 83.594 (85.529)	lr 0.00243
Train [96][2580/3239]	Time 0.220 (0.520)	Data Time 0.001 (0.016)	Loss 2.6025 (2.3966)	Entropy 0.55780 (0.55727)	Top-1 acc 58.984 (66.290)	Top-5 acc 81.641 (85.527)	lr 0.00243
Train [96][2590/3239]	Time 0.225 (0.520)	Data Time 0.001 (0.016)	Loss 2.4793 (2.3965)	Entropy 0.55788 (0.55728)	Top-1 acc 66.406 (66.290)	Top-5 acc 83.984 (85.529)	lr 0.00243
Train [96][2600/3239]	Time 0.327 (0.519)	Data Time 0.001 (0.016)	Loss 2.3845 (2.3966)	Entropy 0.55777 (0.55728)	Top-1 acc 69.141 (66.290)	Top-5 acc 84.766 (85.528)	lr 0.00243
Train [96][2610/3239]	Time 0.230 (0.519)	Data Time 0.001 (0.016)	Loss 2.4859 (2.3967)	Entropy 0.55782 (0.55728)	Top-1 acc 65.234 (66.286)	Top-5 acc 83.203 (85.529)	lr 0.00242
Train [96][2620/3239]	Time 0.239 (0.519)	Data Time 0.001 (0.016)	Loss 2.4710 (2.3969)	Entropy 0.55810 (0.55728)	Top-1 acc 62.109 (66.279)	Top-5 acc 85.547 (85.525)	lr 0.00242
Train [96][2630/3239]	Time 0.288 (0.519)	Data Time 0.002 (0.016)	Loss 2.3418 (2.3968)	Entropy 0.55772 (0.55728)	Top-1 acc 69.531 (66.282)	Top-5 acc 85.547 (85.524)	lr 0.00242
Train [96][2640/3239]	Time 0.331 (0.538)	Data Time 0.005 (0.016)	Loss 2.9633 (2.3968)	Entropy 0.55772 (0.55729)	Top-1 acc 50.000 (66.278)	Top-5 acc 76.562 (85.526)	lr 0.00242
Train [96][2650/3239]	Time 0.230 (0.538)	Data Time 0.002 (0.016)	Loss 2.3812 (2.3968)	Entropy 0.55751 (0.55729)	Top-1 acc 66.406 (66.284)	Top-5 acc 87.109 (85.525)	lr 0.00242
Train [96][2660/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.016)	Loss 2.3202 (2.3967)	Entropy 0.55757 (0.55729)	Top-1 acc 68.359 (66.285)	Top-5 acc 88.281 (85.527)	lr 0.00242
Train [96][2670/3239]	Time 0.228 (0.537)	Data Time 0.001 (0.016)	Loss 2.4005 (2.3969)	Entropy 0.55778 (0.55729)	Top-1 acc 65.234 (66.282)	Top-5 acc 85.156 (85.524)	lr 0.00242
Train [96][2680/3239]	Time 0.259 (0.537)	Data Time 0.002 (0.015)	Loss 2.4091 (2.3969)	Entropy 0.55785 (0.55729)	Top-1 acc 65.625 (66.283)	Top-5 acc 87.109 (85.523)	lr 0.00242
Train [96][2690/3239]	Time 0.339 (0.537)	Data Time 0.001 (0.015)	Loss 2.3720 (2.3967)	Entropy 0.55791 (0.55729)	Top-1 acc 67.969 (66.288)	Top-5 acc 87.109 (85.529)	lr 0.00242
Train [96][2700/3239]	Time 0.234 (0.536)	Data Time 0.001 (0.015)	Loss 2.3530 (2.3967)	Entropy 0.55782 (0.55730)	Top-1 acc 66.016 (66.290)	Top-5 acc 88.281 (85.530)	lr 0.00242
Train [96][2710/3239]	Time 0.232 (0.536)	Data Time 0.001 (0.015)	Loss 2.3683 (2.3967)	Entropy 0.55791 (0.55730)	Top-1 acc 66.016 (66.296)	Top-5 acc 86.328 (85.528)	lr 0.00242
Train [96][2720/3239]	Time 0.239 (0.535)	Data Time 0.001 (0.015)	Loss 2.3785 (2.3965)	Entropy 0.55804 (0.55730)	Top-1 acc 68.750 (66.300)	Top-5 acc 83.594 (85.531)	lr 0.00242
Train [96][2730/3239]	Time 0.241 (0.535)	Data Time 0.001 (0.015)	Loss 2.3642 (2.3966)	Entropy 0.55816 (0.55730)	Top-1 acc 65.625 (66.296)	Top-5 acc 87.109 (85.528)	lr 0.00242
Train [96][2740/3239]	Time 0.234 (0.535)	Data Time 0.001 (0.015)	Loss 2.4857 (2.3965)	Entropy 0.55832 (0.55731)	Top-1 acc 64.844 (66.297)	Top-5 acc 80.859 (85.529)	lr 0.00242
Train [96][2750/3239]	Time 0.234 (0.534)	Data Time 0.001 (0.015)	Loss 2.3068 (2.3965)	Entropy 0.55819 (0.55731)	Top-1 acc 68.750 (66.295)	Top-5 acc 86.328 (85.530)	lr 0.00242
Train [96][2760/3239]	Time 0.335 (0.534)	Data Time 0.001 (0.015)	Loss 2.4848 (2.3963)	Entropy 0.55820 (0.55731)	Top-1 acc 64.453 (66.298)	Top-5 acc 83.594 (85.532)	lr 0.00242
Train [96][2770/3239]	Time 0.229 (0.533)	Data Time 0.001 (0.015)	Loss 2.2395 (2.3963)	Entropy 0.55866 (0.55732)	Top-1 acc 70.312 (66.302)	Top-5 acc 88.281 (85.531)	lr 0.00242
Train [96][2780/3239]	Time 0.235 (0.533)	Data Time 0.001 (0.015)	Loss 2.4593 (2.3962)	Entropy 0.55841 (0.55732)	Top-1 acc 65.234 (66.307)	Top-5 acc 83.984 (85.531)	lr 0.00241
Train [96][2790/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.015)	Loss 2.4171 (2.3962)	Entropy 0.55827 (0.55733)	Top-1 acc 65.625 (66.302)	Top-5 acc 86.328 (85.531)	lr 0.00241
Train [96][2800/3239]	Time 0.225 (0.532)	Data Time 0.001 (0.015)	Loss 2.4503 (2.3961)	Entropy 0.55799 (0.55733)	Top-1 acc 62.109 (66.304)	Top-5 acc 85.156 (85.532)	lr 0.00241
Train [96][2810/3239]	Time 0.287 (0.532)	Data Time 0.001 (0.015)	Loss 2.2531 (2.3960)	Entropy 0.55831 (0.55733)	Top-1 acc 73.438 (66.310)	Top-5 acc 86.328 (85.535)	lr 0.00241
Train [96][2820/3239]	Time 0.264 (0.532)	Data Time 0.001 (0.015)	Loss 2.1737 (2.3960)	Entropy 0.55836 (0.55733)	Top-1 acc 71.094 (66.306)	Top-5 acc 90.625 (85.534)	lr 0.00241
Train [96][2830/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.015)	Loss 2.3153 (2.3961)	Entropy 0.55826 (0.55734)	Top-1 acc 68.359 (66.297)	Top-5 acc 87.109 (85.531)	lr 0.00241
Train [96][2840/3239]	Time 0.230 (0.531)	Data Time 0.001 (0.015)	Loss 2.6220 (2.3963)	Entropy 0.55853 (0.55734)	Top-1 acc 60.938 (66.290)	Top-5 acc 78.906 (85.525)	lr 0.00241
Train [96][2850/3239]	Time 0.256 (0.531)	Data Time 0.001 (0.015)	Loss 2.3576 (2.3962)	Entropy 0.55861 (0.55735)	Top-1 acc 66.797 (66.290)	Top-5 acc 86.719 (85.527)	lr 0.00241
Train [96][2860/3239]	Time 0.227 (0.531)	Data Time 0.001 (0.015)	Loss 2.3521 (2.3962)	Entropy 0.55827 (0.55735)	Top-1 acc 65.625 (66.289)	Top-5 acc 86.328 (85.528)	lr 0.00241
Train [96][2870/3239]	Time 0.224 (0.530)	Data Time 0.001 (0.015)	Loss 2.2449 (2.3961)	Entropy 0.55813 (0.55735)	Top-1 acc 71.094 (66.292)	Top-5 acc 85.547 (85.530)	lr 0.00241
Train [96][2880/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.015)	Loss 2.0118 (2.3962)	Entropy 0.55822 (0.55736)	Top-1 acc 76.172 (66.289)	Top-5 acc 92.969 (85.529)	lr 0.00241
Train [96][2890/3239]	Time 0.236 (0.529)	Data Time 0.001 (0.014)	Loss 2.2246 (2.3963)	Entropy 0.55823 (0.55736)	Top-1 acc 69.141 (66.290)	Top-5 acc 87.891 (85.529)	lr 0.00241
Train [96][2900/3239]	Time 0.245 (0.529)	Data Time 0.001 (0.014)	Loss 2.6186 (2.3964)	Entropy 0.55826 (0.55736)	Top-1 acc 58.594 (66.286)	Top-5 acc 82.031 (85.528)	lr 0.00241
Train [96][2910/3239]	Time 0.237 (0.529)	Data Time 0.001 (0.014)	Loss 2.3840 (2.3962)	Entropy 0.55792 (0.55736)	Top-1 acc 68.359 (66.289)	Top-5 acc 85.547 (85.530)	lr 0.00241
Train [96][2920/3239]	Time 0.327 (0.528)	Data Time 0.001 (0.014)	Loss 2.3771 (2.3963)	Entropy 0.55805 (0.55737)	Top-1 acc 66.406 (66.290)	Top-5 acc 87.109 (85.528)	lr 0.00241
Train [96][2930/3239]	Time 0.220 (0.528)	Data Time 0.001 (0.014)	Loss 2.5088 (2.3963)	Entropy 0.55797 (0.55737)	Top-1 acc 66.406 (66.294)	Top-5 acc 84.766 (85.529)	lr 0.00241
Train [96][2940/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.014)	Loss 2.4430 (2.3965)	Entropy 0.55813 (0.55737)	Top-1 acc 64.844 (66.288)	Top-5 acc 83.203 (85.523)	lr 0.00241
Train [96][2950/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.014)	Loss 2.4016 (2.3966)	Entropy 0.55788 (0.55737)	Top-1 acc 68.750 (66.290)	Top-5 acc 84.375 (85.521)	lr 0.00240
Train [96][2960/3239]	Time 0.219 (0.527)	Data Time 0.001 (0.014)	Loss 2.3868 (2.3966)	Entropy 0.55763 (0.55737)	Top-1 acc 69.141 (66.289)	Top-5 acc 87.109 (85.521)	lr 0.00240
Train [96][2970/3239]	Time 0.220 (0.526)	Data Time 0.001 (0.014)	Loss 2.7367 (2.3968)	Entropy 0.55749 (0.55738)	Top-1 acc 59.766 (66.283)	Top-5 acc 80.859 (85.519)	lr 0.00240
Train [96][2980/3239]	Time 0.225 (0.526)	Data Time 0.001 (0.014)	Loss 2.2866 (2.3968)	Entropy 0.55746 (0.55738)	Top-1 acc 68.359 (66.284)	Top-5 acc 86.328 (85.520)	lr 0.00240
Train [96][2990/3239]	Time 0.338 (0.526)	Data Time 0.001 (0.014)	Loss 2.0930 (2.3966)	Entropy 0.55717 (0.55737)	Top-1 acc 72.656 (66.289)	Top-5 acc 89.844 (85.525)	lr 0.00240
Train [96][3000/3239]	Time 0.229 (0.525)	Data Time 0.001 (0.014)	Loss 2.2410 (2.3966)	Entropy 0.55734 (0.55737)	Top-1 acc 69.141 (66.289)	Top-5 acc 88.672 (85.523)	lr 0.00240
Train [96][3010/3239]	Time 0.230 (0.525)	Data Time 0.001 (0.014)	Loss 2.2860 (2.3965)	Entropy 0.55700 (0.55737)	Top-1 acc 67.969 (66.291)	Top-5 acc 87.891 (85.525)	lr 0.00240
Train [96][3020/3239]	Time 0.233 (0.524)	Data Time 0.001 (0.014)	Loss 2.3472 (2.3967)	Entropy 0.55686 (0.55737)	Top-1 acc 69.141 (66.285)	Top-5 acc 84.766 (85.519)	lr 0.00240
Train [96][3030/3239]	Time 0.225 (0.524)	Data Time 0.001 (0.014)	Loss 2.4698 (2.3969)	Entropy 0.55677 (0.55737)	Top-1 acc 64.062 (66.283)	Top-5 acc 85.156 (85.517)	lr 0.00240
Train [96][3040/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.014)	Loss 2.3195 (2.3969)	Entropy 0.55684 (0.55737)	Top-1 acc 68.359 (66.283)	Top-5 acc 87.500 (85.516)	lr 0.00240
Train [96][3050/3239]	Time 0.222 (0.523)	Data Time 0.001 (0.014)	Loss 2.3486 (2.3970)	Entropy 0.55680 (0.55737)	Top-1 acc 67.188 (66.278)	Top-5 acc 85.938 (85.513)	lr 0.00240
Train [96][3060/3239]	Time 0.232 (0.523)	Data Time 0.001 (0.014)	Loss 2.4424 (2.3971)	Entropy 0.55688 (0.55736)	Top-1 acc 66.016 (66.276)	Top-5 acc 82.812 (85.512)	lr 0.00240
Train [96][3070/3239]	Time 0.234 (0.523)	Data Time 0.001 (0.014)	Loss 2.2362 (2.3972)	Entropy 0.55704 (0.55736)	Top-1 acc 70.312 (66.273)	Top-5 acc 89.062 (85.511)	lr 0.00240
Train [96][3080/3239]	Time 0.318 (0.522)	Data Time 0.001 (0.014)	Loss 2.3214 (2.3971)	Entropy 0.55681 (0.55736)	Top-1 acc 70.312 (66.275)	Top-5 acc 87.500 (85.513)	lr 0.00240
Train [96][3090/3239]	Time 0.225 (0.522)	Data Time 0.001 (0.014)	Loss 2.3408 (2.3973)	Entropy 0.55674 (0.55736)	Top-1 acc 69.531 (66.274)	Top-5 acc 85.156 (85.508)	lr 0.00240
Train [96][3100/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.014)	Loss 2.2576 (2.3971)	Entropy 0.55703 (0.55736)	Top-1 acc 69.922 (66.273)	Top-5 acc 86.328 (85.510)	lr 0.00240
Train [96][3110/3239]	Time 0.235 (0.521)	Data Time 0.001 (0.014)	Loss 2.4103 (2.3974)	Entropy 0.55731 (0.55736)	Top-1 acc 65.625 (66.270)	Top-5 acc 86.719 (85.507)	lr 0.00240
Train [96][3120/3239]	Time 0.235 (0.521)	Data Time 0.001 (0.014)	Loss 2.4357 (2.3975)	Entropy 0.55725 (0.55736)	Top-1 acc 66.016 (66.264)	Top-5 acc 83.984 (85.505)	lr 0.00239
Train [96][3130/3239]	Time 0.295 (0.521)	Data Time 0.001 (0.013)	Loss 2.5438 (2.3977)	Entropy 0.55743 (0.55736)	Top-1 acc 65.625 (66.260)	Top-5 acc 82.031 (85.503)	lr 0.00239
Train [96][3140/3239]	Time 0.245 (0.521)	Data Time 0.001 (0.013)	Loss 2.2550 (2.3975)	Entropy 0.55724 (0.55736)	Top-1 acc 71.094 (66.267)	Top-5 acc 88.672 (85.506)	lr 0.00239
Train [96][3150/3239]	Time 0.333 (0.520)	Data Time 0.001 (0.013)	Loss 2.4896 (2.3974)	Entropy 0.55726 (0.55736)	Top-1 acc 63.672 (66.268)	Top-5 acc 83.594 (85.511)	lr 0.00239
Train [96][3160/3239]	Time 0.229 (0.520)	Data Time 0.001 (0.013)	Loss 2.4640 (2.3974)	Entropy 0.55716 (0.55736)	Top-1 acc 64.062 (66.265)	Top-5 acc 83.984 (85.510)	lr 0.00239
Train [96][3170/3239]	Time 0.234 (0.520)	Data Time 0.002 (0.013)	Loss 2.4333 (2.3974)	Entropy 0.55728 (0.55736)	Top-1 acc 69.922 (66.265)	Top-5 acc 83.203 (85.513)	lr 0.00239
Train [96][3180/3239]	Time 0.229 (0.519)	Data Time 0.000 (0.013)	Loss 2.3411 (2.3975)	Entropy 0.55725 (0.55736)	Top-1 acc 68.750 (66.263)	Top-5 acc 85.547 (85.512)	lr 0.00239
Train [96][3190/3239]	Time 0.226 (0.519)	Data Time 0.000 (0.013)	Loss 2.3629 (2.3976)	Entropy 0.55728 (0.55736)	Top-1 acc 65.234 (66.257)	Top-5 acc 87.500 (85.511)	lr 0.00239
Train [96][3200/3239]	Time 0.222 (0.518)	Data Time 0.000 (0.013)	Loss 2.3972 (2.3975)	Entropy 0.55741 (0.55735)	Top-1 acc 65.234 (66.259)	Top-5 acc 85.156 (85.514)	lr 0.00239
Train [96][3210/3239]	Time 0.226 (0.518)	Data Time 0.000 (0.013)	Loss 2.5192 (2.3974)	Entropy 0.55740 (0.55736)	Top-1 acc 65.234 (66.261)	Top-5 acc 80.469 (85.516)	lr 0.00239
Train [96][3220/3239]	Time 0.233 (0.518)	Data Time 0.000 (0.013)	Loss 2.3107 (2.3973)	Entropy 0.55689 (0.55735)	Top-1 acc 66.797 (66.264)	Top-5 acc 87.109 (85.519)	lr 0.00239
Train [96][3230/3239]	Time 0.245 (0.517)	Data Time 0.000 (0.013)	Loss 2.2911 (2.3971)	Entropy 0.55683 (0.55735)	Top-1 acc 65.625 (66.266)	Top-5 acc 89.844 (85.522)	lr 0.00239
Train [96][3239/3239]	Time 1.112 (0.517)	Data Time 0.000 (0.013)	Loss 2.4275 (2.3971)	Entropy 0.55688 (0.55735)	Top-1 acc 65.432 (66.267)	Top-5 acc 91.358 (85.522)	lr 0.00239
==========Valid [96/120]	loss 1.212	top-1 acc 72.012 (72.012)	top-5 acc 90.080	Train top-1 66.267	top-5 85.522	Entropy 0.55688	Latency-None: 0.000ms	Flops: 539.00M
Train [97][0/3239]	Time 41.470 (41.470)	Data Time 39.478 (39.478)	Loss 2.2260 (2.2260)	Entropy 0.55685 (0.55685)	Top-1 acc 72.266 (72.266)	Top-5 acc 87.891 (87.891)	lr 0.00239
Train [97][10/3239]	Time 0.228 (4.374)	Data Time 0.001 (3.707)	Loss 2.6157 (2.3443)	Entropy 0.55671 (0.55676)	Top-1 acc 60.156 (68.324)	Top-5 acc 82.422 (86.364)	lr 0.00239
Train [97][20/3239]	Time 0.228 (2.485)	Data Time 0.001 (1.942)	Loss 2.2725 (2.3678)	Entropy 0.55629 (0.55669)	Top-1 acc 70.703 (67.467)	Top-5 acc 85.156 (86.049)	lr 0.00239
Train [97][30/3239]	Time 0.233 (1.818)	Data Time 0.001 (1.316)	Loss 2.2403 (2.3564)	Entropy 0.55627 (0.55657)	Top-1 acc 70.312 (67.603)	Top-5 acc 87.891 (86.366)	lr 0.00239
Train [97][40/3239]	Time 0.235 (1.477)	Data Time 0.001 (0.996)	Loss 2.3242 (2.3580)	Entropy 0.55630 (0.55652)	Top-1 acc 65.234 (67.178)	Top-5 acc 88.672 (86.195)	lr 0.00238
Train [97][50/3239]	Time 0.351 (1.269)	Data Time 0.001 (0.801)	Loss 2.4359 (2.3544)	Entropy 0.55616 (0.55646)	Top-1 acc 65.625 (67.387)	Top-5 acc 83.984 (86.236)	lr 0.00238
Train [97][60/3239]	Time 0.314 (2.024)	Data Time 0.002 (0.671)	Loss 2.3973 (2.3643)	Entropy 0.55628 (0.55643)	Top-1 acc 68.359 (67.188)	Top-5 acc 83.984 (86.021)	lr 0.00238
Train [97][70/3239]	Time 0.273 (1.800)	Data Time 0.002 (0.577)	Loss 2.3884 (2.3672)	Entropy 0.55635 (0.55640)	Top-1 acc 62.891 (67.077)	Top-5 acc 87.109 (86.059)	lr 0.00238
Train [97][80/3239]	Time 0.268 (1.630)	Data Time 0.002 (0.506)	Loss 2.2289 (2.3658)	Entropy 0.55665 (0.55640)	Top-1 acc 70.703 (67.125)	Top-5 acc 87.109 (86.024)	lr 0.00238
Train [97][90/3239]	Time 0.233 (1.496)	Data Time 0.001 (0.450)	Loss 2.4197 (2.3691)	Entropy 0.55607 (0.55640)	Top-1 acc 66.797 (66.990)	Top-5 acc 85.156 (86.079)	lr 0.00238
Train [97][100/3239]	Time 0.218 (1.389)	Data Time 0.001 (0.406)	Loss 2.2881 (2.3690)	Entropy 0.55615 (0.55638)	Top-1 acc 69.922 (67.044)	Top-5 acc 87.109 (86.061)	lr 0.00238
Train [97][110/3239]	Time 0.227 (1.300)	Data Time 0.001 (0.369)	Loss 2.3366 (2.3744)	Entropy 0.55619 (0.55635)	Top-1 acc 67.969 (66.867)	Top-5 acc 85.547 (85.916)	lr 0.00238
Train [97][120/3239]	Time 0.226 (1.227)	Data Time 0.001 (0.339)	Loss 2.3315 (2.3739)	Entropy 0.55619 (0.55634)	Top-1 acc 67.578 (66.923)	Top-5 acc 87.891 (85.967)	lr 0.00238
Train [97][130/3239]	Time 0.229 (1.165)	Data Time 0.001 (0.313)	Loss 2.4157 (2.3742)	Entropy 0.55619 (0.55633)	Top-1 acc 66.406 (66.827)	Top-5 acc 85.938 (85.955)	lr 0.00238
Train [97][140/3239]	Time 0.334 (1.114)	Data Time 0.001 (0.291)	Loss 2.4824 (2.3769)	Entropy 0.55595 (0.55631)	Top-1 acc 62.891 (66.717)	Top-5 acc 83.984 (85.899)	lr 0.00238
Train [97][150/3239]	Time 0.234 (1.068)	Data Time 0.001 (0.272)	Loss 2.4508 (2.3801)	Entropy 0.55602 (0.55629)	Top-1 acc 66.406 (66.629)	Top-5 acc 85.156 (85.875)	lr 0.00238
Train [97][160/3239]	Time 0.237 (1.028)	Data Time 0.001 (0.255)	Loss 2.3998 (2.3804)	Entropy 0.55603 (0.55627)	Top-1 acc 68.750 (66.637)	Top-5 acc 84.766 (85.843)	lr 0.00238
Train [97][170/3239]	Time 0.227 (0.992)	Data Time 0.001 (0.240)	Loss 2.3887 (2.3838)	Entropy 0.55621 (0.55627)	Top-1 acc 66.406 (66.555)	Top-5 acc 83.984 (85.746)	lr 0.00238
Train [97][180/3239]	Time 0.277 (0.965)	Data Time 0.002 (0.227)	Loss 2.5608 (2.3823)	Entropy 0.55645 (0.55627)	Top-1 acc 62.109 (66.613)	Top-5 acc 83.594 (85.741)	lr 0.00238
Train [97][190/3239]	Time 0.248 (0.941)	Data Time 0.002 (0.215)	Loss 2.7003 (2.3803)	Entropy 0.55651 (0.55628)	Top-1 acc 61.328 (66.682)	Top-5 acc 79.688 (85.764)	lr 0.00238
Train [97][200/3239]	Time 0.245 (0.916)	Data Time 0.001 (0.205)	Loss 2.4912 (2.3816)	Entropy 0.55656 (0.55630)	Top-1 acc 61.328 (66.636)	Top-5 acc 83.203 (85.720)	lr 0.00238
Train [97][210/3239]	Time 0.324 (0.892)	Data Time 0.001 (0.195)	Loss 2.4390 (2.3837)	Entropy 0.55641 (0.55631)	Top-1 acc 64.062 (66.590)	Top-5 acc 87.500 (85.702)	lr 0.00237
Train [97][220/3239]	Time 0.233 (0.870)	Data Time 0.001 (0.186)	Loss 2.4392 (2.3854)	Entropy 0.55652 (0.55631)	Top-1 acc 63.281 (66.556)	Top-5 acc 85.156 (85.655)	lr 0.00237
Train [97][230/3239]	Time 0.228 (0.850)	Data Time 0.001 (0.178)	Loss 2.2612 (2.3855)	Entropy 0.55674 (0.55633)	Top-1 acc 64.062 (66.514)	Top-5 acc 87.500 (85.665)	lr 0.00237
Train [97][240/3239]	Time 0.234 (0.832)	Data Time 0.001 (0.171)	Loss 2.2343 (2.3862)	Entropy 0.55705 (0.55635)	Top-1 acc 71.094 (66.531)	Top-5 acc 89.453 (85.654)	lr 0.00237
Train [97][250/3239]	Time 0.230 (0.816)	Data Time 0.001 (0.164)	Loss 2.3923 (2.3827)	Entropy 0.55668 (0.55637)	Top-1 acc 65.625 (66.651)	Top-5 acc 82.812 (85.699)	lr 0.00237
Train [97][260/3239]	Time 0.228 (0.801)	Data Time 0.001 (0.158)	Loss 2.2899 (2.3840)	Entropy 0.55672 (0.55639)	Top-1 acc 70.312 (66.625)	Top-5 acc 87.500 (85.683)	lr 0.00237
Train [97][270/3239]	Time 0.253 (0.787)	Data Time 0.001 (0.152)	Loss 2.3300 (2.3835)	Entropy 0.55660 (0.55640)	Top-1 acc 67.969 (66.625)	Top-5 acc 88.672 (85.703)	lr 0.00237
Train [97][280/3239]	Time 0.235 (0.773)	Data Time 0.001 (0.147)	Loss 2.3597 (2.3829)	Entropy 0.55648 (0.55640)	Top-1 acc 67.188 (66.627)	Top-5 acc 84.375 (85.714)	lr 0.00237
Train [97][290/3239]	Time 0.230 (0.761)	Data Time 0.001 (0.142)	Loss 2.4022 (2.3858)	Entropy 0.55655 (0.55641)	Top-1 acc 65.625 (66.550)	Top-5 acc 87.891 (85.661)	lr 0.00237
Train [97][300/3239]	Time 0.315 (0.750)	Data Time 0.001 (0.137)	Loss 2.3603 (2.3832)	Entropy 0.55672 (0.55641)	Top-1 acc 68.750 (66.623)	Top-5 acc 84.375 (85.697)	lr 0.00237
Train [97][310/3239]	Time 0.227 (0.740)	Data Time 0.001 (0.133)	Loss 2.2419 (2.3820)	Entropy 0.55680 (0.55643)	Top-1 acc 71.484 (66.661)	Top-5 acc 88.672 (85.700)	lr 0.00237
Train [97][320/3239]	Time 0.272 (0.730)	Data Time 0.002 (0.129)	Loss 2.4111 (2.3828)	Entropy 0.55692 (0.55644)	Top-1 acc 66.406 (66.642)	Top-5 acc 85.156 (85.692)	lr 0.00237
Train [97][330/3239]	Time 0.226 (0.720)	Data Time 0.001 (0.125)	Loss 2.4116 (2.3836)	Entropy 0.55689 (0.55645)	Top-1 acc 64.844 (66.621)	Top-5 acc 84.766 (85.648)	lr 0.00237
Train [97][340/3239]	Time 0.235 (0.711)	Data Time 0.001 (0.121)	Loss 2.3104 (2.3832)	Entropy 0.55667 (0.55647)	Top-1 acc 66.797 (66.599)	Top-5 acc 86.719 (85.657)	lr 0.00237
Train [97][350/3239]	Time 0.221 (0.703)	Data Time 0.001 (0.118)	Loss 2.4412 (2.3831)	Entropy 0.55673 (0.55647)	Top-1 acc 62.891 (66.578)	Top-5 acc 85.156 (85.672)	lr 0.00237
Train [97][360/3239]	Time 0.222 (0.695)	Data Time 0.001 (0.115)	Loss 2.6654 (2.3835)	Entropy 0.55651 (0.55648)	Top-1 acc 60.547 (66.547)	Top-5 acc 80.859 (85.672)	lr 0.00237
Train [97][370/3239]	Time 0.342 (0.688)	Data Time 0.001 (0.112)	Loss 2.3654 (2.3834)	Entropy 0.55643 (0.55648)	Top-1 acc 68.359 (66.575)	Top-5 acc 87.500 (85.680)	lr 0.00237
Train [97][380/3239]	Time 0.223 (0.681)	Data Time 0.001 (0.109)	Loss 2.4692 (2.3832)	Entropy 0.55637 (0.55648)	Top-1 acc 66.406 (66.577)	Top-5 acc 85.547 (85.672)	lr 0.00236
Train [97][390/3239]	Time 0.220 (0.674)	Data Time 0.001 (0.106)	Loss 2.2748 (2.3836)	Entropy 0.55662 (0.55647)	Top-1 acc 71.094 (66.582)	Top-5 acc 85.156 (85.656)	lr 0.00236
Train [97][400/3239]	Time 0.232 (0.667)	Data Time 0.001 (0.103)	Loss 2.2245 (2.3814)	Entropy 0.55673 (0.55648)	Top-1 acc 69.141 (66.629)	Top-5 acc 89.062 (85.696)	lr 0.00236
Train [97][410/3239]	Time 0.250 (0.661)	Data Time 0.001 (0.101)	Loss 2.3919 (2.3823)	Entropy 0.55701 (0.55649)	Top-1 acc 64.062 (66.593)	Top-5 acc 87.500 (85.680)	lr 0.00236
Train [97][420/3239]	Time 0.226 (0.655)	Data Time 0.001 (0.098)	Loss 2.4546 (2.3836)	Entropy 0.55700 (0.55650)	Top-1 acc 64.062 (66.569)	Top-5 acc 83.203 (85.656)	lr 0.00236
Train [97][430/3239]	Time 0.228 (0.649)	Data Time 0.001 (0.096)	Loss 2.4138 (2.3849)	Entropy 0.55706 (0.55651)	Top-1 acc 65.234 (66.536)	Top-5 acc 84.375 (85.630)	lr 0.00236
Train [97][440/3239]	Time 0.232 (0.644)	Data Time 0.001 (0.094)	Loss 2.2575 (2.3849)	Entropy 0.55727 (0.55653)	Top-1 acc 69.141 (66.530)	Top-5 acc 88.281 (85.629)	lr 0.00236
Train [97][450/3239]	Time 0.264 (0.639)	Data Time 0.001 (0.092)	Loss 2.6132 (2.3848)	Entropy 0.55739 (0.55654)	Top-1 acc 63.281 (66.554)	Top-5 acc 81.641 (85.640)	lr 0.00236
Train [97][460/3239]	Time 0.303 (0.634)	Data Time 0.001 (0.090)	Loss 2.1402 (2.3847)	Entropy 0.55735 (0.55656)	Top-1 acc 75.000 (66.577)	Top-5 acc 87.109 (85.628)	lr 0.00236
Train [97][470/3239]	Time 0.227 (0.629)	Data Time 0.001 (0.088)	Loss 2.4360 (2.3860)	Entropy 0.55741 (0.55658)	Top-1 acc 64.844 (66.536)	Top-5 acc 87.891 (85.602)	lr 0.00236
Train [97][480/3239]	Time 0.230 (0.624)	Data Time 0.001 (0.086)	Loss 2.4343 (2.3861)	Entropy 0.55728 (0.55660)	Top-1 acc 64.062 (66.535)	Top-5 acc 85.547 (85.596)	lr 0.00236
Train [97][490/3239]	Time 0.225 (0.620)	Data Time 0.001 (0.085)	Loss 2.4295 (2.3861)	Entropy 0.55738 (0.55661)	Top-1 acc 66.406 (66.539)	Top-5 acc 84.375 (85.604)	lr 0.00236
Train [97][500/3239]	Time 0.281 (0.617)	Data Time 0.001 (0.083)	Loss 2.5867 (2.3868)	Entropy 0.55745 (0.55663)	Top-1 acc 60.547 (66.539)	Top-5 acc 84.375 (85.607)	lr 0.00236
Train [97][510/3239]	Time 0.247 (0.615)	Data Time 0.001 (0.081)	Loss 2.4211 (2.3865)	Entropy 0.55734 (0.55665)	Top-1 acc 64.453 (66.541)	Top-5 acc 87.109 (85.601)	lr 0.00236
Train [97][520/3239]	Time 0.240 (0.611)	Data Time 0.001 (0.080)	Loss 2.5037 (2.3860)	Entropy 0.55754 (0.55666)	Top-1 acc 63.672 (66.546)	Top-5 acc 83.203 (85.611)	lr 0.00236
Train [97][530/3239]	Time 0.342 (0.608)	Data Time 0.001 (0.078)	Loss 2.2477 (2.3850)	Entropy 0.55717 (0.55668)	Top-1 acc 69.922 (66.570)	Top-5 acc 86.719 (85.621)	lr 0.00236
Train [97][540/3239]	Time 0.227 (0.605)	Data Time 0.001 (0.077)	Loss 2.3612 (2.3846)	Entropy 0.55717 (0.55669)	Top-1 acc 67.188 (66.579)	Top-5 acc 88.672 (85.618)	lr 0.00236
Train [97][550/3239]	Time 0.225 (0.601)	Data Time 0.001 (0.076)	Loss 2.2752 (2.3852)	Entropy 0.55721 (0.55669)	Top-1 acc 71.484 (66.568)	Top-5 acc 85.156 (85.591)	lr 0.00235
Train [97][560/3239]	Time 0.232 (0.598)	Data Time 0.001 (0.074)	Loss 2.3678 (2.3867)	Entropy 0.55737 (0.55670)	Top-1 acc 69.531 (66.549)	Top-5 acc 85.938 (85.577)	lr 0.00235
Train [97][570/3239]	Time 0.267 (0.595)	Data Time 0.001 (0.073)	Loss 2.3528 (2.3865)	Entropy 0.55746 (0.55672)	Top-1 acc 67.188 (66.562)	Top-5 acc 85.156 (85.572)	lr 0.00235
Train [97][580/3239]	Time 0.226 (0.592)	Data Time 0.001 (0.072)	Loss 2.6140 (2.3865)	Entropy 0.55771 (0.55673)	Top-1 acc 62.500 (66.556)	Top-5 acc 81.641 (85.568)	lr 0.00235
Train [97][590/3239]	Time 0.252 (0.589)	Data Time 0.001 (0.071)	Loss 2.5912 (2.3862)	Entropy 0.55762 (0.55675)	Top-1 acc 62.109 (66.570)	Top-5 acc 81.641 (85.573)	lr 0.00235
Train [97][600/3239]	Time 0.321 (0.586)	Data Time 0.001 (0.069)	Loss 2.5154 (2.3858)	Entropy 0.55730 (0.55676)	Top-1 acc 65.625 (66.574)	Top-5 acc 82.031 (85.594)	lr 0.00235
Train [97][610/3239]	Time 0.274 (0.583)	Data Time 0.001 (0.068)	Loss 2.2396 (2.3848)	Entropy 0.55721 (0.55677)	Top-1 acc 72.266 (66.585)	Top-5 acc 88.281 (85.628)	lr 0.00235
Train [97][620/3239]	Time 0.240 (0.580)	Data Time 0.001 (0.067)	Loss 2.4198 (2.3853)	Entropy 0.55704 (0.55677)	Top-1 acc 64.844 (66.556)	Top-5 acc 83.984 (85.618)	lr 0.00235
Train [97][630/3239]	Time 0.225 (0.578)	Data Time 0.001 (0.066)	Loss 2.1373 (2.3847)	Entropy 0.55687 (0.55678)	Top-1 acc 72.656 (66.575)	Top-5 acc 89.453 (85.619)	lr 0.00235
Train [97][640/3239]	Time 0.226 (0.575)	Data Time 0.001 (0.065)	Loss 2.3641 (2.3848)	Entropy 0.55682 (0.55678)	Top-1 acc 67.188 (66.579)	Top-5 acc 85.547 (85.616)	lr 0.00235
Train [97][650/3239]	Time 0.242 (0.573)	Data Time 0.001 (0.064)	Loss 2.1848 (2.3841)	Entropy 0.55700 (0.55678)	Top-1 acc 71.094 (66.593)	Top-5 acc 90.625 (85.627)	lr 0.00235
Train [97][660/3239]	Time 0.238 (0.570)	Data Time 0.001 (0.063)	Loss 2.4430 (2.3845)	Entropy 0.55639 (0.55678)	Top-1 acc 63.672 (66.578)	Top-5 acc 84.375 (85.621)	lr 0.00235
Train [97][670/3239]	Time 0.237 (0.568)	Data Time 0.002 (0.062)	Loss 2.5446 (2.3848)	Entropy 0.55660 (0.55678)	Top-1 acc 62.891 (66.583)	Top-5 acc 85.156 (85.626)	lr 0.00235
Train [97][680/3239]	Time 0.230 (0.566)	Data Time 0.001 (0.061)	Loss 2.3172 (2.3855)	Entropy 0.55645 (0.55678)	Top-1 acc 65.625 (66.559)	Top-5 acc 87.891 (85.626)	lr 0.00235
Train [97][690/3239]	Time 0.319 (0.564)	Data Time 0.001 (0.061)	Loss 2.4882 (2.3856)	Entropy 0.55656 (0.55677)	Top-1 acc 66.797 (66.561)	Top-5 acc 85.156 (85.618)	lr 0.00235
Train [97][700/3239]	Time 0.230 (0.562)	Data Time 0.001 (0.060)	Loss 2.3777 (2.3861)	Entropy 0.55677 (0.55677)	Top-1 acc 69.141 (66.538)	Top-5 acc 84.766 (85.606)	lr 0.00235
Train [97][710/3239]	Time 0.446 (0.638)	Data Time 0.006 (0.059)	Loss 2.5277 (2.3865)	Entropy 0.55625 (0.55677)	Top-1 acc 61.719 (66.530)	Top-5 acc 81.641 (85.605)	lr 0.00235
Train [97][720/3239]	Time 0.231 (0.636)	Data Time 0.002 (0.058)	Loss 2.4808 (2.3866)	Entropy 0.55622 (0.55676)	Top-1 acc 64.844 (66.531)	Top-5 acc 84.375 (85.603)	lr 0.00234
Train [97][730/3239]	Time 0.276 (0.634)	Data Time 0.002 (0.057)	Loss 2.2672 (2.3869)	Entropy 0.55610 (0.55675)	Top-1 acc 70.312 (66.540)	Top-5 acc 89.453 (85.596)	lr 0.00234
Train [97][740/3239]	Time 0.286 (0.631)	Data Time 0.003 (0.057)	Loss 2.3713 (2.3868)	Entropy 0.55638 (0.55674)	Top-1 acc 65.234 (66.543)	Top-5 acc 83.984 (85.597)	lr 0.00234
Train [97][750/3239]	Time 0.234 (0.629)	Data Time 0.001 (0.056)	Loss 2.3456 (2.3867)	Entropy 0.55636 (0.55674)	Top-1 acc 69.141 (66.558)	Top-5 acc 85.938 (85.593)	lr 0.00234
Train [97][760/3239]	Time 0.232 (0.626)	Data Time 0.002 (0.055)	Loss 2.3209 (2.3863)	Entropy 0.55595 (0.55673)	Top-1 acc 69.531 (66.565)	Top-5 acc 84.766 (85.600)	lr 0.00234
Train [97][770/3239]	Time 0.234 (0.623)	Data Time 0.001 (0.055)	Loss 2.4388 (2.3866)	Entropy 0.55575 (0.55672)	Top-1 acc 64.844 (66.553)	Top-5 acc 82.812 (85.588)	lr 0.00234
Train [97][780/3239]	Time 0.273 (0.621)	Data Time 0.001 (0.054)	Loss 2.3586 (2.3873)	Entropy 0.55566 (0.55671)	Top-1 acc 67.969 (66.530)	Top-5 acc 85.547 (85.582)	lr 0.00234
Train [97][790/3239]	Time 0.240 (0.619)	Data Time 0.001 (0.053)	Loss 2.0943 (2.3870)	Entropy 0.55562 (0.55669)	Top-1 acc 72.266 (66.533)	Top-5 acc 92.969 (85.591)	lr 0.00234
Train [97][800/3239]	Time 0.233 (0.616)	Data Time 0.001 (0.053)	Loss 2.2786 (2.3868)	Entropy 0.55552 (0.55668)	Top-1 acc 68.359 (66.536)	Top-5 acc 86.719 (85.595)	lr 0.00234
Train [97][810/3239]	Time 0.236 (0.614)	Data Time 0.001 (0.052)	Loss 2.3907 (2.3867)	Entropy 0.55575 (0.55666)	Top-1 acc 67.969 (66.538)	Top-5 acc 85.938 (85.602)	lr 0.00234
Train [97][820/3239]	Time 0.251 (0.612)	Data Time 0.001 (0.051)	Loss 2.4941 (2.3877)	Entropy 0.55588 (0.55665)	Top-1 acc 64.062 (66.512)	Top-5 acc 85.547 (85.594)	lr 0.00234
Train [97][830/3239]	Time 0.266 (0.610)	Data Time 0.001 (0.051)	Loss 2.3134 (2.3876)	Entropy 0.55607 (0.55665)	Top-1 acc 68.359 (66.515)	Top-5 acc 87.891 (85.599)	lr 0.00234
Train [97][840/3239]	Time 0.268 (0.608)	Data Time 0.001 (0.050)	Loss 2.0396 (2.3865)	Entropy 0.55629 (0.55664)	Top-1 acc 76.172 (66.539)	Top-5 acc 93.359 (85.611)	lr 0.00234
Train [97][850/3239]	Time 0.320 (0.605)	Data Time 0.001 (0.050)	Loss 2.4090 (2.3861)	Entropy 0.55639 (0.55663)	Top-1 acc 67.188 (66.536)	Top-5 acc 85.156 (85.614)	lr 0.00234
Train [97][860/3239]	Time 0.292 (0.603)	Data Time 0.007 (0.049)	Loss 2.2929 (2.3857)	Entropy 0.55619 (0.55663)	Top-1 acc 71.484 (66.541)	Top-5 acc 87.109 (85.623)	lr 0.00234
Train [97][870/3239]	Time 0.269 (0.601)	Data Time 0.037 (0.048)	Loss 2.3406 (2.3851)	Entropy 0.55638 (0.55663)	Top-1 acc 68.750 (66.554)	Top-5 acc 85.547 (85.636)	lr 0.00234
Train [97][880/3239]	Time 0.230 (0.599)	Data Time 0.001 (0.048)	Loss 2.3963 (2.3855)	Entropy 0.55612 (0.55662)	Top-1 acc 65.625 (66.538)	Top-5 acc 85.547 (85.626)	lr 0.00234
Train [97][890/3239]	Time 0.235 (0.597)	Data Time 0.001 (0.047)	Loss 2.4425 (2.3851)	Entropy 0.55623 (0.55662)	Top-1 acc 63.672 (66.543)	Top-5 acc 83.203 (85.636)	lr 0.00233
Train [97][900/3239]	Time 0.274 (0.595)	Data Time 0.001 (0.047)	Loss 2.3345 (2.3854)	Entropy 0.55620 (0.55661)	Top-1 acc 69.141 (66.543)	Top-5 acc 85.547 (85.633)	lr 0.00233
Train [97][910/3239]	Time 0.246 (0.594)	Data Time 0.001 (0.046)	Loss 2.4278 (2.3854)	Entropy 0.55554 (0.55661)	Top-1 acc 67.188 (66.537)	Top-5 acc 83.203 (85.634)	lr 0.00233
Train [97][920/3239]	Time 0.380 (0.592)	Data Time 0.001 (0.046)	Loss 2.3598 (2.3857)	Entropy 0.55553 (0.55660)	Top-1 acc 63.672 (66.529)	Top-5 acc 85.938 (85.630)	lr 0.00233
Train [97][930/3239]	Time 0.247 (0.590)	Data Time 0.001 (0.045)	Loss 2.3211 (2.3854)	Entropy 0.55533 (0.55658)	Top-1 acc 67.578 (66.534)	Top-5 acc 86.719 (85.634)	lr 0.00233
Train [97][940/3239]	Time 0.233 (0.588)	Data Time 0.001 (0.045)	Loss 2.4446 (2.3862)	Entropy 0.55533 (0.55657)	Top-1 acc 68.359 (66.524)	Top-5 acc 82.422 (85.625)	lr 0.00233
Train [97][950/3239]	Time 0.236 (0.587)	Data Time 0.001 (0.045)	Loss 2.3281 (2.3862)	Entropy 0.55492 (0.55656)	Top-1 acc 66.797 (66.520)	Top-5 acc 87.891 (85.628)	lr 0.00233
Train [97][960/3239]	Time 0.246 (0.585)	Data Time 0.001 (0.044)	Loss 2.4918 (2.3866)	Entropy 0.55526 (0.55654)	Top-1 acc 64.062 (66.508)	Top-5 acc 82.422 (85.629)	lr 0.00233
Train [97][970/3239]	Time 0.255 (0.584)	Data Time 0.002 (0.044)	Loss 2.2782 (2.3866)	Entropy 0.55539 (0.55653)	Top-1 acc 72.266 (66.499)	Top-5 acc 85.938 (85.635)	lr 0.00233
Train [97][980/3239]	Time 0.276 (0.582)	Data Time 0.002 (0.043)	Loss 2.3113 (2.3862)	Entropy 0.55539 (0.55652)	Top-1 acc 64.844 (66.514)	Top-5 acc 87.891 (85.637)	lr 0.00233
Train [97][990/3239]	Time 0.250 (0.581)	Data Time 0.001 (0.043)	Loss 2.5048 (2.3865)	Entropy 0.55537 (0.55651)	Top-1 acc 63.281 (66.500)	Top-5 acc 87.891 (85.636)	lr 0.00233
Train [97][1000/3239]	Time 0.288 (0.580)	Data Time 0.002 (0.042)	Loss 2.3721 (2.3864)	Entropy 0.55554 (0.55649)	Top-1 acc 67.969 (66.500)	Top-5 acc 85.938 (85.639)	lr 0.00233
Train [97][1010/3239]	Time 0.440 (0.579)	Data Time 0.003 (0.042)	Loss 2.6238 (2.3864)	Entropy 0.55549 (0.55649)	Top-1 acc 61.719 (66.497)	Top-5 acc 80.859 (85.643)	lr 0.00233
Train [97][1020/3239]	Time 0.240 (0.578)	Data Time 0.001 (0.042)	Loss 2.3089 (2.3864)	Entropy 0.55558 (0.55648)	Top-1 acc 69.531 (66.508)	Top-5 acc 86.719 (85.639)	lr 0.00233
Train [97][1030/3239]	Time 0.234 (0.577)	Data Time 0.001 (0.041)	Loss 2.2145 (2.3860)	Entropy 0.55571 (0.55647)	Top-1 acc 73.047 (66.520)	Top-5 acc 89.844 (85.650)	lr 0.00233
Train [97][1040/3239]	Time 0.226 (0.575)	Data Time 0.001 (0.041)	Loss 2.4243 (2.3860)	Entropy 0.55567 (0.55646)	Top-1 acc 65.625 (66.523)	Top-5 acc 88.672 (85.654)	lr 0.00233
Train [97][1050/3239]	Time 0.227 (0.574)	Data Time 0.001 (0.040)	Loss 2.6532 (2.3863)	Entropy 0.55546 (0.55645)	Top-1 acc 60.547 (66.517)	Top-5 acc 82.812 (85.644)	lr 0.00233
Train [97][1060/3239]	Time 0.232 (0.572)	Data Time 0.001 (0.040)	Loss 2.5878 (2.3862)	Entropy 0.55567 (0.55644)	Top-1 acc 61.719 (66.521)	Top-5 acc 82.422 (85.647)	lr 0.00232
Train [97][1070/3239]	Time 0.229 (0.571)	Data Time 0.001 (0.040)	Loss 2.4760 (2.3869)	Entropy 0.55608 (0.55644)	Top-1 acc 65.625 (66.508)	Top-5 acc 84.766 (85.634)	lr 0.00232
Train [97][1080/3239]	Time 0.465 (0.571)	Data Time 0.002 (0.039)	Loss 2.3199 (2.3865)	Entropy 0.55641 (0.55643)	Top-1 acc 64.062 (66.512)	Top-5 acc 85.156 (85.646)	lr 0.00232
Train [97][1090/3239]	Time 0.255 (0.571)	Data Time 0.001 (0.039)	Loss 2.4798 (2.3878)	Entropy 0.55672 (0.55643)	Top-1 acc 66.016 (66.485)	Top-5 acc 84.766 (85.627)	lr 0.00232
Train [97][1100/3239]	Time 0.314 (0.571)	Data Time 0.001 (0.039)	Loss 2.3069 (2.3878)	Entropy 0.55685 (0.55644)	Top-1 acc 68.750 (66.493)	Top-5 acc 87.109 (85.628)	lr 0.00232
Train [97][1110/3239]	Time 0.225 (0.570)	Data Time 0.001 (0.038)	Loss 2.5683 (2.3882)	Entropy 0.55711 (0.55644)	Top-1 acc 62.500 (66.485)	Top-5 acc 81.250 (85.624)	lr 0.00232
Train [97][1120/3239]	Time 0.228 (0.569)	Data Time 0.001 (0.038)	Loss 2.4644 (2.3889)	Entropy 0.55713 (0.55645)	Top-1 acc 63.672 (66.475)	Top-5 acc 83.984 (85.612)	lr 0.00232
Train [97][1130/3239]	Time 0.258 (0.568)	Data Time 0.001 (0.038)	Loss 2.3430 (2.3894)	Entropy 0.55736 (0.55645)	Top-1 acc 68.750 (66.462)	Top-5 acc 85.938 (85.605)	lr 0.00232
Train [97][1140/3239]	Time 0.238 (0.566)	Data Time 0.001 (0.037)	Loss 2.3849 (2.3894)	Entropy 0.55724 (0.55646)	Top-1 acc 67.969 (66.460)	Top-5 acc 83.594 (85.605)	lr 0.00232
Train [97][1150/3239]	Time 0.233 (0.565)	Data Time 0.001 (0.037)	Loss 2.3399 (2.3892)	Entropy 0.55739 (0.55647)	Top-1 acc 66.406 (66.462)	Top-5 acc 87.500 (85.617)	lr 0.00232
Train [97][1160/3239]	Time 0.240 (0.564)	Data Time 0.001 (0.037)	Loss 2.2907 (2.3894)	Entropy 0.55720 (0.55648)	Top-1 acc 66.016 (66.454)	Top-5 acc 86.719 (85.613)	lr 0.00232
Train [97][1170/3239]	Time 0.269 (0.563)	Data Time 0.001 (0.037)	Loss 2.6088 (2.3895)	Entropy 0.55735 (0.55648)	Top-1 acc 60.547 (66.454)	Top-5 acc 81.641 (85.609)	lr 0.00232
Train [97][1180/3239]	Time 0.224 (0.561)	Data Time 0.001 (0.036)	Loss 2.5489 (2.3896)	Entropy 0.55727 (0.55649)	Top-1 acc 62.500 (66.457)	Top-5 acc 80.859 (85.603)	lr 0.00232
Train [97][1190/3239]	Time 0.234 (0.560)	Data Time 0.001 (0.036)	Loss 2.1946 (2.3893)	Entropy 0.55695 (0.55650)	Top-1 acc 75.391 (66.465)	Top-5 acc 87.891 (85.605)	lr 0.00232
Train [97][1200/3239]	Time 0.226 (0.559)	Data Time 0.001 (0.036)	Loss 2.3202 (2.3892)	Entropy 0.55701 (0.55650)	Top-1 acc 69.922 (66.464)	Top-5 acc 88.672 (85.610)	lr 0.00232
Train [97][1210/3239]	Time 0.231 (0.558)	Data Time 0.001 (0.035)	Loss 2.3539 (2.3890)	Entropy 0.55719 (0.55651)	Top-1 acc 64.844 (66.466)	Top-5 acc 85.547 (85.615)	lr 0.00232
Train [97][1220/3239]	Time 0.229 (0.556)	Data Time 0.001 (0.035)	Loss 2.4602 (2.3888)	Entropy 0.55725 (0.55651)	Top-1 acc 65.234 (66.470)	Top-5 acc 84.375 (85.622)	lr 0.00232
Train [97][1230/3239]	Time 0.230 (0.555)	Data Time 0.001 (0.035)	Loss 2.2329 (2.3892)	Entropy 0.55724 (0.55652)	Top-1 acc 67.578 (66.462)	Top-5 acc 87.500 (85.609)	lr 0.00231
Train [97][1240/3239]	Time 0.322 (0.554)	Data Time 0.001 (0.035)	Loss 2.4670 (2.3897)	Entropy 0.55684 (0.55652)	Top-1 acc 66.016 (66.445)	Top-5 acc 82.031 (85.599)	lr 0.00231
Train [97][1250/3239]	Time 0.253 (0.553)	Data Time 0.001 (0.034)	Loss 2.3856 (2.3895)	Entropy 0.55660 (0.55653)	Top-1 acc 65.234 (66.449)	Top-5 acc 87.500 (85.609)	lr 0.00231
Train [97][1260/3239]	Time 0.247 (0.552)	Data Time 0.002 (0.034)	Loss 2.3537 (2.3897)	Entropy 0.55666 (0.55653)	Top-1 acc 67.578 (66.447)	Top-5 acc 87.500 (85.612)	lr 0.00231
Train [97][1270/3239]	Time 0.241 (0.551)	Data Time 0.001 (0.034)	Loss 2.4203 (2.3896)	Entropy 0.55675 (0.55653)	Top-1 acc 64.453 (66.442)	Top-5 acc 85.547 (85.616)	lr 0.00231
Train [97][1280/3239]	Time 0.228 (0.550)	Data Time 0.001 (0.034)	Loss 2.2299 (2.3893)	Entropy 0.55674 (0.55653)	Top-1 acc 73.047 (66.453)	Top-5 acc 88.281 (85.619)	lr 0.00231
Train [97][1290/3239]	Time 0.252 (0.549)	Data Time 0.001 (0.033)	Loss 2.3091 (2.3888)	Entropy 0.55696 (0.55653)	Top-1 acc 66.406 (66.463)	Top-5 acc 85.938 (85.631)	lr 0.00231
Train [97][1300/3239]	Time 0.269 (0.548)	Data Time 0.001 (0.033)	Loss 2.3995 (2.3892)	Entropy 0.55734 (0.55654)	Top-1 acc 66.797 (66.455)	Top-5 acc 85.156 (85.621)	lr 0.00231
Train [97][1310/3239]	Time 0.369 (0.547)	Data Time 0.001 (0.033)	Loss 2.3451 (2.3894)	Entropy 0.55747 (0.55654)	Top-1 acc 66.797 (66.451)	Top-5 acc 84.766 (85.614)	lr 0.00231
Train [97][1320/3239]	Time 0.228 (0.546)	Data Time 0.001 (0.033)	Loss 2.2382 (2.3894)	Entropy 0.55766 (0.55655)	Top-1 acc 71.875 (66.454)	Top-5 acc 85.156 (85.612)	lr 0.00231
Train [97][1330/3239]	Time 0.220 (0.544)	Data Time 0.001 (0.032)	Loss 2.3676 (2.3894)	Entropy 0.55771 (0.55656)	Top-1 acc 64.453 (66.459)	Top-5 acc 86.328 (85.608)	lr 0.00231
Train [97][1340/3239]	Time 0.224 (0.544)	Data Time 0.001 (0.032)	Loss 2.5207 (2.3898)	Entropy 0.55770 (0.55657)	Top-1 acc 60.547 (66.441)	Top-5 acc 83.203 (85.603)	lr 0.00231
Train [97][1350/3239]	Time 0.252 (0.543)	Data Time 0.001 (0.032)	Loss 2.3686 (2.3904)	Entropy 0.55783 (0.55658)	Top-1 acc 64.453 (66.431)	Top-5 acc 85.547 (85.598)	lr 0.00231
Train [97][1360/3239]	Time 0.220 (0.542)	Data Time 0.001 (0.032)	Loss 2.4840 (2.3909)	Entropy 0.55746 (0.55659)	Top-1 acc 65.625 (66.420)	Top-5 acc 84.766 (85.592)	lr 0.00231
Train [97][1370/3239]	Time 0.326 (0.581)	Data Time 0.002 (0.031)	Loss 2.1796 (2.3911)	Entropy 0.55737 (0.55659)	Top-1 acc 69.922 (66.416)	Top-5 acc 89.453 (85.588)	lr 0.00231
Train [97][1380/3239]	Time 0.264 (0.580)	Data Time 0.002 (0.031)	Loss 2.6378 (2.3910)	Entropy 0.55745 (0.55660)	Top-1 acc 62.109 (66.425)	Top-5 acc 80.469 (85.592)	lr 0.00231
Train [97][1390/3239]	Time 0.233 (0.579)	Data Time 0.001 (0.031)	Loss 2.4843 (2.3909)	Entropy 0.55740 (0.55660)	Top-1 acc 63.281 (66.430)	Top-5 acc 84.375 (85.597)	lr 0.00231
Train [97][1400/3239]	Time 0.377 (0.578)	Data Time 0.029 (0.031)	Loss 2.4298 (2.3907)	Entropy 0.55753 (0.55661)	Top-1 acc 67.969 (66.434)	Top-5 acc 84.375 (85.595)	lr 0.00230
Train [97][1410/3239]	Time 0.239 (0.577)	Data Time 0.001 (0.031)	Loss 2.1597 (2.3909)	Entropy 0.55765 (0.55662)	Top-1 acc 74.219 (66.432)	Top-5 acc 89.453 (85.591)	lr 0.00230
Train [97][1420/3239]	Time 0.234 (0.576)	Data Time 0.001 (0.030)	Loss 2.3096 (2.3908)	Entropy 0.55809 (0.55662)	Top-1 acc 69.922 (66.440)	Top-5 acc 83.984 (85.586)	lr 0.00230
Train [97][1430/3239]	Time 0.255 (0.575)	Data Time 0.001 (0.030)	Loss 2.3906 (2.3909)	Entropy 0.55818 (0.55663)	Top-1 acc 66.406 (66.441)	Top-5 acc 87.500 (85.587)	lr 0.00230
Train [97][1440/3239]	Time 0.230 (0.574)	Data Time 0.001 (0.030)	Loss 2.4324 (2.3907)	Entropy 0.55828 (0.55665)	Top-1 acc 67.578 (66.447)	Top-5 acc 83.203 (85.584)	lr 0.00230
Train [97][1450/3239]	Time 0.241 (0.573)	Data Time 0.001 (0.030)	Loss 2.4345 (2.3911)	Entropy 0.55819 (0.55666)	Top-1 acc 62.109 (66.438)	Top-5 acc 85.547 (85.579)	lr 0.00230
Train [97][1460/3239]	Time 0.222 (0.572)	Data Time 0.001 (0.030)	Loss 2.4869 (2.3913)	Entropy 0.55845 (0.55667)	Top-1 acc 61.719 (66.428)	Top-5 acc 84.375 (85.576)	lr 0.00230
Train [97][1470/3239]	Time 0.320 (0.571)	Data Time 0.001 (0.029)	Loss 2.1660 (2.3909)	Entropy 0.55810 (0.55668)	Top-1 acc 74.609 (66.443)	Top-5 acc 88.281 (85.582)	lr 0.00230
Train [97][1480/3239]	Time 0.233 (0.570)	Data Time 0.001 (0.029)	Loss 2.3077 (2.3906)	Entropy 0.55814 (0.55669)	Top-1 acc 67.188 (66.451)	Top-5 acc 87.500 (85.584)	lr 0.00230
Train [97][1490/3239]	Time 0.226 (0.569)	Data Time 0.001 (0.029)	Loss 2.3952 (2.3908)	Entropy 0.55813 (0.55670)	Top-1 acc 66.406 (66.447)	Top-5 acc 86.328 (85.582)	lr 0.00230
Train [97][1500/3239]	Time 0.233 (0.568)	Data Time 0.002 (0.029)	Loss 2.2844 (2.3905)	Entropy 0.55818 (0.55671)	Top-1 acc 71.094 (66.455)	Top-5 acc 86.328 (85.587)	lr 0.00230
Train [97][1510/3239]	Time 0.234 (0.567)	Data Time 0.001 (0.029)	Loss 2.2343 (2.3905)	Entropy 0.55815 (0.55672)	Top-1 acc 69.141 (66.454)	Top-5 acc 88.672 (85.586)	lr 0.00230
Train [97][1520/3239]	Time 0.263 (0.566)	Data Time 0.001 (0.029)	Loss 2.2977 (2.3905)	Entropy 0.55847 (0.55673)	Top-1 acc 68.750 (66.462)	Top-5 acc 86.328 (85.584)	lr 0.00230
Train [97][1530/3239]	Time 0.227 (0.565)	Data Time 0.002 (0.028)	Loss 2.3057 (2.3904)	Entropy 0.55809 (0.55674)	Top-1 acc 72.266 (66.462)	Top-5 acc 86.328 (85.583)	lr 0.00230
Train [97][1540/3239]	Time 0.227 (0.564)	Data Time 0.001 (0.028)	Loss 2.1977 (2.3903)	Entropy 0.55796 (0.55675)	Top-1 acc 71.094 (66.460)	Top-5 acc 90.234 (85.583)	lr 0.00230
Train [97][1550/3239]	Time 0.222 (0.563)	Data Time 0.001 (0.028)	Loss 2.3054 (2.3908)	Entropy 0.55784 (0.55675)	Top-1 acc 69.141 (66.448)	Top-5 acc 87.891 (85.582)	lr 0.00230
Train [97][1560/3239]	Time 0.325 (0.563)	Data Time 0.001 (0.028)	Loss 2.5481 (2.3907)	Entropy 0.55755 (0.55676)	Top-1 acc 62.109 (66.450)	Top-5 acc 83.594 (85.584)	lr 0.00230
Train [97][1570/3239]	Time 0.222 (0.562)	Data Time 0.001 (0.028)	Loss 2.2372 (2.3910)	Entropy 0.55732 (0.55676)	Top-1 acc 71.875 (66.444)	Top-5 acc 88.281 (85.579)	lr 0.00229
Train [97][1580/3239]	Time 0.231 (0.561)	Data Time 0.001 (0.028)	Loss 2.2770 (2.3908)	Entropy 0.55735 (0.55677)	Top-1 acc 69.531 (66.452)	Top-5 acc 87.500 (85.581)	lr 0.00229
Train [97][1590/3239]	Time 0.234 (0.560)	Data Time 0.001 (0.027)	Loss 2.5427 (2.3905)	Entropy 0.55707 (0.55677)	Top-1 acc 61.719 (66.460)	Top-5 acc 83.203 (85.580)	lr 0.00229
Train [97][1600/3239]	Time 0.278 (0.559)	Data Time 0.001 (0.027)	Loss 2.4629 (2.3904)	Entropy 0.55743 (0.55677)	Top-1 acc 62.500 (66.455)	Top-5 acc 84.375 (85.586)	lr 0.00229
Train [97][1610/3239]	Time 0.270 (0.558)	Data Time 0.001 (0.027)	Loss 2.5691 (2.3906)	Entropy 0.55693 (0.55678)	Top-1 acc 62.109 (66.446)	Top-5 acc 81.641 (85.582)	lr 0.00229
Train [97][1620/3239]	Time 0.340 (0.558)	Data Time 0.002 (0.027)	Loss 2.4761 (2.3907)	Entropy 0.55684 (0.55678)	Top-1 acc 65.234 (66.453)	Top-5 acc 85.938 (85.582)	lr 0.00229
Train [97][1630/3239]	Time 0.356 (0.558)	Data Time 0.001 (0.027)	Loss 2.4888 (2.3908)	Entropy 0.55667 (0.55678)	Top-1 acc 64.062 (66.450)	Top-5 acc 83.203 (85.578)	lr 0.00229
Train [97][1640/3239]	Time 0.235 (0.557)	Data Time 0.001 (0.027)	Loss 2.3819 (2.3907)	Entropy 0.55616 (0.55678)	Top-1 acc 65.625 (66.451)	Top-5 acc 86.328 (85.582)	lr 0.00229
Train [97][1650/3239]	Time 0.247 (0.556)	Data Time 0.001 (0.026)	Loss 2.3451 (2.3906)	Entropy 0.55586 (0.55677)	Top-1 acc 67.578 (66.446)	Top-5 acc 82.812 (85.587)	lr 0.00229
Train [97][1660/3239]	Time 0.233 (0.556)	Data Time 0.001 (0.026)	Loss 2.2827 (2.3904)	Entropy 0.55582 (0.55676)	Top-1 acc 74.219 (66.457)	Top-5 acc 87.500 (85.591)	lr 0.00229
Train [97][1670/3239]	Time 0.240 (0.555)	Data Time 0.002 (0.026)	Loss 2.3672 (2.3901)	Entropy 0.55580 (0.55676)	Top-1 acc 67.969 (66.470)	Top-5 acc 87.109 (85.595)	lr 0.00229
Train [97][1680/3239]	Time 0.234 (0.554)	Data Time 0.001 (0.026)	Loss 2.2879 (2.3901)	Entropy 0.55556 (0.55675)	Top-1 acc 65.625 (66.463)	Top-5 acc 87.891 (85.592)	lr 0.00229
Train [97][1690/3239]	Time 0.259 (0.553)	Data Time 0.001 (0.026)	Loss 2.4408 (2.3901)	Entropy 0.55556 (0.55675)	Top-1 acc 65.234 (66.471)	Top-5 acc 84.375 (85.594)	lr 0.00229
Train [97][1700/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.026)	Loss 2.4024 (2.3901)	Entropy 0.55580 (0.55674)	Top-1 acc 66.406 (66.466)	Top-5 acc 85.547 (85.598)	lr 0.00229
Train [97][1710/3239]	Time 0.235 (0.552)	Data Time 0.001 (0.026)	Loss 2.0464 (2.3896)	Entropy 0.55573 (0.55673)	Top-1 acc 75.781 (66.483)	Top-5 acc 91.016 (85.609)	lr 0.00229
Train [97][1720/3239]	Time 0.242 (0.551)	Data Time 0.001 (0.025)	Loss 2.2949 (2.3895)	Entropy 0.55546 (0.55673)	Top-1 acc 70.312 (66.489)	Top-5 acc 87.891 (85.606)	lr 0.00229
Train [97][1730/3239]	Time 0.238 (0.551)	Data Time 0.002 (0.025)	Loss 2.3916 (2.3894)	Entropy 0.55546 (0.55672)	Top-1 acc 64.062 (66.493)	Top-5 acc 84.766 (85.608)	lr 0.00229
Train [97][1740/3239]	Time 0.244 (0.550)	Data Time 0.001 (0.025)	Loss 2.3059 (2.3893)	Entropy 0.55567 (0.55671)	Top-1 acc 69.141 (66.491)	Top-5 acc 87.500 (85.606)	lr 0.00228
Train [97][1750/3239]	Time 0.223 (0.549)	Data Time 0.001 (0.025)	Loss 2.3992 (2.3897)	Entropy 0.55613 (0.55671)	Top-1 acc 69.141 (66.486)	Top-5 acc 86.719 (85.600)	lr 0.00228
Train [97][1760/3239]	Time 0.234 (0.548)	Data Time 0.002 (0.025)	Loss 2.2452 (2.3898)	Entropy 0.55628 (0.55670)	Top-1 acc 71.094 (66.484)	Top-5 acc 88.281 (85.598)	lr 0.00228
Train [97][1770/3239]	Time 0.223 (0.548)	Data Time 0.001 (0.025)	Loss 2.3655 (2.3896)	Entropy 0.55622 (0.55670)	Top-1 acc 69.922 (66.494)	Top-5 acc 84.766 (85.599)	lr 0.00228
Train [97][1780/3239]	Time 0.236 (0.547)	Data Time 0.001 (0.025)	Loss 2.1895 (2.3894)	Entropy 0.55574 (0.55670)	Top-1 acc 72.266 (66.503)	Top-5 acc 90.625 (85.597)	lr 0.00228
Train [97][1790/3239]	Time 0.386 (0.546)	Data Time 0.001 (0.024)	Loss 2.1754 (2.3891)	Entropy 0.55542 (0.55669)	Top-1 acc 72.266 (66.513)	Top-5 acc 89.844 (85.604)	lr 0.00228
Train [97][1800/3239]	Time 0.272 (0.546)	Data Time 0.003 (0.024)	Loss 2.3080 (2.3889)	Entropy 0.55548 (0.55669)	Top-1 acc 69.531 (66.521)	Top-5 acc 89.453 (85.605)	lr 0.00228
Train [97][1810/3239]	Time 0.264 (0.545)	Data Time 0.002 (0.024)	Loss 2.4857 (2.3889)	Entropy 0.55560 (0.55668)	Top-1 acc 61.719 (66.518)	Top-5 acc 83.594 (85.608)	lr 0.00228
Train [97][1820/3239]	Time 0.233 (0.544)	Data Time 0.001 (0.024)	Loss 2.5274 (2.3894)	Entropy 0.55581 (0.55667)	Top-1 acc 59.375 (66.508)	Top-5 acc 84.766 (85.603)	lr 0.00228
Train [97][1830/3239]	Time 0.272 (0.543)	Data Time 0.002 (0.024)	Loss 2.3815 (2.3898)	Entropy 0.55603 (0.55667)	Top-1 acc 65.234 (66.500)	Top-5 acc 83.594 (85.594)	lr 0.00228
Train [97][1840/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.024)	Loss 2.4563 (2.3903)	Entropy 0.55609 (0.55667)	Top-1 acc 64.453 (66.495)	Top-5 acc 82.812 (85.584)	lr 0.00228
Train [97][1850/3239]	Time 0.237 (0.542)	Data Time 0.001 (0.024)	Loss 2.3214 (2.3902)	Entropy 0.55606 (0.55666)	Top-1 acc 67.969 (66.497)	Top-5 acc 87.891 (85.584)	lr 0.00228
Train [97][1860/3239]	Time 0.345 (0.541)	Data Time 0.001 (0.024)	Loss 2.4071 (2.3908)	Entropy 0.55611 (0.55666)	Top-1 acc 63.281 (66.482)	Top-5 acc 87.500 (85.580)	lr 0.00228
Train [97][1870/3239]	Time 0.234 (0.541)	Data Time 0.001 (0.023)	Loss 2.2653 (2.3910)	Entropy 0.55648 (0.55666)	Top-1 acc 70.312 (66.478)	Top-5 acc 88.672 (85.580)	lr 0.00228
Train [97][1880/3239]	Time 0.254 (0.540)	Data Time 0.002 (0.023)	Loss 2.3972 (2.3910)	Entropy 0.55671 (0.55666)	Top-1 acc 66.797 (66.476)	Top-5 acc 84.766 (85.579)	lr 0.00228
Train [97][1890/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.023)	Loss 2.4699 (2.3914)	Entropy 0.55685 (0.55666)	Top-1 acc 66.016 (66.469)	Top-5 acc 86.328 (85.573)	lr 0.00228
Train [97][1900/3239]	Time 0.254 (0.539)	Data Time 0.001 (0.023)	Loss 2.6643 (2.3914)	Entropy 0.55676 (0.55666)	Top-1 acc 60.938 (66.469)	Top-5 acc 81.641 (85.574)	lr 0.00228
Train [97][1910/3239]	Time 0.236 (0.538)	Data Time 0.001 (0.023)	Loss 2.3016 (2.3912)	Entropy 0.55695 (0.55666)	Top-1 acc 69.141 (66.471)	Top-5 acc 87.891 (85.581)	lr 0.00228
Train [97][1920/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.023)	Loss 2.3498 (2.3910)	Entropy 0.55716 (0.55666)	Top-1 acc 66.016 (66.480)	Top-5 acc 85.938 (85.587)	lr 0.00227
Train [97][1930/3239]	Time 0.259 (0.537)	Data Time 0.001 (0.023)	Loss 2.4391 (2.3909)	Entropy 0.55728 (0.55666)	Top-1 acc 64.062 (66.481)	Top-5 acc 84.375 (85.594)	lr 0.00227
Train [97][1940/3239]	Time 0.259 (0.537)	Data Time 0.001 (0.023)	Loss 2.3129 (2.3910)	Entropy 0.55722 (0.55667)	Top-1 acc 67.969 (66.481)	Top-5 acc 86.328 (85.592)	lr 0.00227
Train [97][1950/3239]	Time 0.330 (0.536)	Data Time 0.001 (0.023)	Loss 2.5766 (2.3911)	Entropy 0.55744 (0.55667)	Top-1 acc 61.719 (66.477)	Top-5 acc 82.812 (85.591)	lr 0.00227
Train [97][1960/3239]	Time 0.232 (0.536)	Data Time 0.001 (0.022)	Loss 2.4600 (2.3914)	Entropy 0.55761 (0.55667)	Top-1 acc 65.625 (66.475)	Top-5 acc 83.203 (85.584)	lr 0.00227
Train [97][1970/3239]	Time 0.231 (0.535)	Data Time 0.001 (0.022)	Loss 2.4146 (2.3914)	Entropy 0.55785 (0.55668)	Top-1 acc 67.188 (66.474)	Top-5 acc 83.203 (85.582)	lr 0.00227
Train [97][1980/3239]	Time 0.244 (0.534)	Data Time 0.001 (0.022)	Loss 2.4172 (2.3915)	Entropy 0.55820 (0.55668)	Top-1 acc 63.672 (66.477)	Top-5 acc 84.375 (85.582)	lr 0.00227
Train [97][1990/3239]	Time 0.225 (0.534)	Data Time 0.001 (0.022)	Loss 2.4120 (2.3919)	Entropy 0.55808 (0.55669)	Top-1 acc 67.578 (66.470)	Top-5 acc 84.766 (85.575)	lr 0.00227
Train [97][2000/3239]	Time 0.236 (0.533)	Data Time 0.001 (0.022)	Loss 2.2711 (2.3917)	Entropy 0.55804 (0.55670)	Top-1 acc 70.312 (66.473)	Top-5 acc 88.281 (85.580)	lr 0.00227
Train [97][2010/3239]	Time 0.269 (0.533)	Data Time 0.001 (0.022)	Loss 2.3451 (2.3921)	Entropy 0.55811 (0.55671)	Top-1 acc 69.531 (66.466)	Top-5 acc 87.891 (85.575)	lr 0.00227
Train [97][2020/3239]	Time 0.559 (0.558)	Data Time 0.005 (0.022)	Loss 2.4858 (2.3919)	Entropy 0.55844 (0.55671)	Top-1 acc 62.109 (66.473)	Top-5 acc 84.375 (85.576)	lr 0.00227
Train [97][2030/3239]	Time 0.234 (0.558)	Data Time 0.002 (0.022)	Loss 2.2735 (2.3915)	Entropy 0.55874 (0.55672)	Top-1 acc 64.844 (66.484)	Top-5 acc 87.109 (85.582)	lr 0.00227
Train [97][2040/3239]	Time 0.237 (0.557)	Data Time 0.001 (0.022)	Loss 2.5516 (2.3917)	Entropy 0.55853 (0.55673)	Top-1 acc 61.328 (66.481)	Top-5 acc 85.938 (85.581)	lr 0.00227
Train [97][2050/3239]	Time 0.227 (0.556)	Data Time 0.001 (0.022)	Loss 2.5072 (2.3918)	Entropy 0.55869 (0.55674)	Top-1 acc 64.062 (66.481)	Top-5 acc 83.203 (85.576)	lr 0.00227
Train [97][2060/3239]	Time 0.234 (0.556)	Data Time 0.001 (0.021)	Loss 2.5268 (2.3917)	Entropy 0.55873 (0.55675)	Top-1 acc 63.281 (66.482)	Top-5 acc 83.594 (85.579)	lr 0.00227
Train [97][2070/3239]	Time 0.236 (0.555)	Data Time 0.001 (0.021)	Loss 2.5139 (2.3919)	Entropy 0.55881 (0.55676)	Top-1 acc 60.938 (66.482)	Top-5 acc 82.422 (85.575)	lr 0.00227
Train [97][2080/3239]	Time 0.268 (0.554)	Data Time 0.001 (0.021)	Loss 2.3707 (2.3920)	Entropy 0.55913 (0.55677)	Top-1 acc 66.016 (66.478)	Top-5 acc 85.938 (85.577)	lr 0.00227
Train [97][2090/3239]	Time 0.261 (0.554)	Data Time 0.001 (0.021)	Loss 2.5762 (2.3922)	Entropy 0.55903 (0.55678)	Top-1 acc 60.938 (66.471)	Top-5 acc 82.812 (85.577)	lr 0.00226
Train [97][2100/3239]	Time 0.277 (0.553)	Data Time 0.001 (0.021)	Loss 2.3104 (2.3922)	Entropy 0.55901 (0.55679)	Top-1 acc 66.797 (66.468)	Top-5 acc 87.891 (85.575)	lr 0.00226
Train [97][2110/3239]	Time 0.328 (0.553)	Data Time 0.001 (0.021)	Loss 2.3961 (2.3920)	Entropy 0.55939 (0.55680)	Top-1 acc 64.453 (66.468)	Top-5 acc 83.594 (85.576)	lr 0.00226
Train [97][2120/3239]	Time 0.233 (0.552)	Data Time 0.001 (0.021)	Loss 2.3751 (2.3915)	Entropy 0.55938 (0.55682)	Top-1 acc 64.844 (66.483)	Top-5 acc 87.500 (85.585)	lr 0.00226
Train [97][2130/3239]	Time 0.347 (0.552)	Data Time 0.002 (0.021)	Loss 2.5411 (2.3918)	Entropy 0.55934 (0.55683)	Top-1 acc 63.672 (66.478)	Top-5 acc 82.422 (85.579)	lr 0.00226
Train [97][2140/3239]	Time 0.254 (0.552)	Data Time 0.001 (0.021)	Loss 2.5045 (2.3921)	Entropy 0.55953 (0.55684)	Top-1 acc 66.016 (66.473)	Top-5 acc 84.375 (85.575)	lr 0.00226
Train [97][2150/3239]	Time 0.230 (0.551)	Data Time 0.001 (0.021)	Loss 2.4837 (2.3920)	Entropy 0.55927 (0.55685)	Top-1 acc 64.453 (66.474)	Top-5 acc 85.938 (85.576)	lr 0.00226
Train [97][2160/3239]	Time 0.258 (0.551)	Data Time 0.002 (0.021)	Loss 2.2626 (2.3921)	Entropy 0.55895 (0.55686)	Top-1 acc 69.141 (66.478)	Top-5 acc 85.547 (85.576)	lr 0.00226
Train [97][2170/3239]	Time 0.258 (0.550)	Data Time 0.001 (0.020)	Loss 2.4199 (2.3920)	Entropy 0.55895 (0.55687)	Top-1 acc 67.578 (66.482)	Top-5 acc 83.203 (85.577)	lr 0.00226
Train [97][2180/3239]	Time 0.328 (0.549)	Data Time 0.001 (0.020)	Loss 2.2585 (2.3918)	Entropy 0.55921 (0.55688)	Top-1 acc 71.875 (66.489)	Top-5 acc 88.672 (85.577)	lr 0.00226
Train [97][2190/3239]	Time 0.248 (0.549)	Data Time 0.001 (0.020)	Loss 2.3806 (2.3917)	Entropy 0.55908 (0.55689)	Top-1 acc 66.406 (66.492)	Top-5 acc 85.547 (85.576)	lr 0.00226
Train [97][2200/3239]	Time 0.266 (0.548)	Data Time 0.001 (0.020)	Loss 2.3836 (2.3917)	Entropy 0.55897 (0.55690)	Top-1 acc 67.188 (66.488)	Top-5 acc 85.938 (85.575)	lr 0.00226
Train [97][2210/3239]	Time 0.232 (0.548)	Data Time 0.001 (0.020)	Loss 2.1062 (2.3917)	Entropy 0.55862 (0.55691)	Top-1 acc 76.172 (66.493)	Top-5 acc 90.625 (85.573)	lr 0.00226
Train [97][2220/3239]	Time 0.241 (0.547)	Data Time 0.001 (0.020)	Loss 2.6014 (2.3918)	Entropy 0.55867 (0.55692)	Top-1 acc 62.891 (66.486)	Top-5 acc 80.469 (85.570)	lr 0.00226
Train [97][2230/3239]	Time 0.227 (0.547)	Data Time 0.001 (0.020)	Loss 2.3970 (2.3918)	Entropy 0.55881 (0.55693)	Top-1 acc 64.844 (66.488)	Top-5 acc 87.109 (85.571)	lr 0.00226
Train [97][2240/3239]	Time 0.256 (0.546)	Data Time 0.001 (0.020)	Loss 2.3747 (2.3922)	Entropy 0.55881 (0.55694)	Top-1 acc 64.453 (66.475)	Top-5 acc 85.547 (85.564)	lr 0.00226
Train [97][2250/3239]	Time 0.265 (0.546)	Data Time 0.001 (0.020)	Loss 2.3052 (2.3923)	Entropy 0.55882 (0.55694)	Top-1 acc 69.141 (66.471)	Top-5 acc 85.938 (85.566)	lr 0.00226
Train [97][2260/3239]	Time 0.255 (0.546)	Data Time 0.001 (0.020)	Loss 2.6308 (2.3924)	Entropy 0.55837 (0.55695)	Top-1 acc 58.984 (66.464)	Top-5 acc 80.469 (85.564)	lr 0.00225
Train [97][2270/3239]	Time 0.364 (0.545)	Data Time 0.003 (0.020)	Loss 2.4712 (2.3926)	Entropy 0.55820 (0.55696)	Top-1 acc 65.234 (66.459)	Top-5 acc 84.375 (85.563)	lr 0.00225
Train [97][2280/3239]	Time 0.236 (0.545)	Data Time 0.001 (0.020)	Loss 2.1856 (2.3925)	Entropy 0.55826 (0.55696)	Top-1 acc 70.703 (66.463)	Top-5 acc 87.891 (85.561)	lr 0.00225
Train [97][2290/3239]	Time 0.238 (0.545)	Data Time 0.001 (0.019)	Loss 2.0990 (2.3926)	Entropy 0.55835 (0.55697)	Top-1 acc 75.391 (66.458)	Top-5 acc 90.625 (85.561)	lr 0.00225
Train [97][2300/3239]	Time 0.261 (0.544)	Data Time 0.001 (0.019)	Loss 2.4222 (2.3927)	Entropy 0.55848 (0.55697)	Top-1 acc 67.969 (66.454)	Top-5 acc 84.766 (85.561)	lr 0.00225
Train [97][2310/3239]	Time 0.227 (0.544)	Data Time 0.001 (0.019)	Loss 2.5487 (2.3927)	Entropy 0.55806 (0.55698)	Top-1 acc 64.844 (66.454)	Top-5 acc 82.422 (85.559)	lr 0.00225
Train [97][2320/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.019)	Loss 2.3099 (2.3926)	Entropy 0.55801 (0.55698)	Top-1 acc 67.969 (66.464)	Top-5 acc 85.156 (85.559)	lr 0.00225
Train [97][2330/3239]	Time 0.244 (0.543)	Data Time 0.001 (0.019)	Loss 2.3873 (2.3929)	Entropy 0.55751 (0.55699)	Top-1 acc 66.797 (66.462)	Top-5 acc 87.109 (85.554)	lr 0.00225
Train [97][2340/3239]	Time 0.400 (0.542)	Data Time 0.001 (0.019)	Loss 2.4037 (2.3931)	Entropy 0.55731 (0.55699)	Top-1 acc 64.453 (66.458)	Top-5 acc 85.156 (85.548)	lr 0.00225
Train [97][2350/3239]	Time 0.261 (0.542)	Data Time 0.002 (0.019)	Loss 2.3249 (2.3930)	Entropy 0.55726 (0.55699)	Top-1 acc 67.578 (66.465)	Top-5 acc 87.109 (85.549)	lr 0.00225
Train [97][2360/3239]	Time 0.254 (0.542)	Data Time 0.001 (0.019)	Loss 2.3345 (2.3929)	Entropy 0.55706 (0.55699)	Top-1 acc 66.406 (66.465)	Top-5 acc 86.328 (85.552)	lr 0.00225
Train [97][2370/3239]	Time 0.242 (0.541)	Data Time 0.001 (0.019)	Loss 2.5069 (2.3928)	Entropy 0.55689 (0.55699)	Top-1 acc 60.938 (66.469)	Top-5 acc 83.594 (85.553)	lr 0.00225
Train [97][2380/3239]	Time 0.266 (0.541)	Data Time 0.002 (0.019)	Loss 2.4938 (2.3926)	Entropy 0.55712 (0.55699)	Top-1 acc 64.453 (66.474)	Top-5 acc 83.594 (85.554)	lr 0.00225
Train [97][2390/3239]	Time 0.267 (0.540)	Data Time 0.001 (0.019)	Loss 2.4384 (2.3925)	Entropy 0.55715 (0.55699)	Top-1 acc 66.797 (66.477)	Top-5 acc 83.203 (85.554)	lr 0.00225
Train [97][2400/3239]	Time 0.289 (0.540)	Data Time 0.002 (0.019)	Loss 2.3489 (2.3928)	Entropy 0.55672 (0.55699)	Top-1 acc 65.234 (66.474)	Top-5 acc 87.891 (85.548)	lr 0.00225
Train [97][2410/3239]	Time 0.380 (0.540)	Data Time 0.001 (0.019)	Loss 2.4055 (2.3929)	Entropy 0.55687 (0.55699)	Top-1 acc 65.625 (66.471)	Top-5 acc 84.375 (85.543)	lr 0.00225
Train [97][2420/3239]	Time 0.325 (0.540)	Data Time 0.002 (0.019)	Loss 2.2614 (2.3927)	Entropy 0.55701 (0.55699)	Top-1 acc 67.969 (66.476)	Top-5 acc 89.062 (85.544)	lr 0.00225
Train [97][2430/3239]	Time 0.277 (0.540)	Data Time 0.001 (0.018)	Loss 2.5470 (2.3927)	Entropy 0.55690 (0.55699)	Top-1 acc 64.453 (66.478)	Top-5 acc 83.203 (85.542)	lr 0.00224
Train [97][2440/3239]	Time 0.269 (0.539)	Data Time 0.001 (0.018)	Loss 2.4237 (2.3927)	Entropy 0.55665 (0.55699)	Top-1 acc 66.797 (66.475)	Top-5 acc 83.594 (85.542)	lr 0.00224
Train [97][2450/3239]	Time 0.226 (0.539)	Data Time 0.001 (0.018)	Loss 2.5479 (2.3925)	Entropy 0.55666 (0.55699)	Top-1 acc 60.938 (66.479)	Top-5 acc 82.422 (85.545)	lr 0.00224
Train [97][2460/3239]	Time 0.230 (0.539)	Data Time 0.001 (0.018)	Loss 2.5348 (2.3927)	Entropy 0.55666 (0.55699)	Top-1 acc 59.375 (66.476)	Top-5 acc 85.156 (85.541)	lr 0.00224
Train [97][2470/3239]	Time 0.240 (0.538)	Data Time 0.001 (0.018)	Loss 2.4455 (2.3928)	Entropy 0.55650 (0.55699)	Top-1 acc 67.969 (66.471)	Top-5 acc 85.156 (85.539)	lr 0.00224
Train [97][2480/3239]	Time 0.257 (0.538)	Data Time 0.001 (0.018)	Loss 2.3277 (2.3929)	Entropy 0.55668 (0.55699)	Top-1 acc 68.750 (66.470)	Top-5 acc 87.500 (85.539)	lr 0.00224
Train [97][2490/3239]	Time 0.351 (0.538)	Data Time 0.003 (0.018)	Loss 2.3670 (2.3930)	Entropy 0.55674 (0.55698)	Top-1 acc 64.844 (66.467)	Top-5 acc 86.719 (85.541)	lr 0.00224
Train [97][2500/3239]	Time 0.475 (0.538)	Data Time 0.002 (0.018)	Loss 2.4517 (2.3933)	Entropy 0.55648 (0.55698)	Top-1 acc 64.062 (66.459)	Top-5 acc 86.328 (85.538)	lr 0.00224
Train [97][2510/3239]	Time 0.236 (0.538)	Data Time 0.001 (0.018)	Loss 2.3463 (2.3933)	Entropy 0.55650 (0.55698)	Top-1 acc 69.531 (66.459)	Top-5 acc 86.328 (85.537)	lr 0.00224
Train [97][2520/3239]	Time 0.251 (0.538)	Data Time 0.002 (0.018)	Loss 2.3803 (2.3933)	Entropy 0.55642 (0.55698)	Top-1 acc 67.188 (66.457)	Top-5 acc 87.109 (85.538)	lr 0.00224
Train [97][2530/3239]	Time 0.256 (0.537)	Data Time 0.001 (0.018)	Loss 2.2930 (2.3934)	Entropy 0.55595 (0.55698)	Top-1 acc 71.875 (66.456)	Top-5 acc 86.719 (85.537)	lr 0.00224
Train [97][2540/3239]	Time 0.240 (0.537)	Data Time 0.001 (0.018)	Loss 2.5356 (2.3936)	Entropy 0.55603 (0.55697)	Top-1 acc 63.281 (66.451)	Top-5 acc 83.203 (85.531)	lr 0.00224
Train [97][2550/3239]	Time 0.261 (0.537)	Data Time 0.024 (0.018)	Loss 2.3815 (2.3937)	Entropy 0.55600 (0.55697)	Top-1 acc 66.797 (66.452)	Top-5 acc 84.766 (85.527)	lr 0.00224
Train [97][2560/3239]	Time 0.236 (0.536)	Data Time 0.002 (0.018)	Loss 2.3675 (2.3936)	Entropy 0.55567 (0.55696)	Top-1 acc 66.797 (66.453)	Top-5 acc 87.109 (85.531)	lr 0.00224
Train [97][2570/3239]	Time 0.393 (0.536)	Data Time 0.001 (0.018)	Loss 2.1864 (2.3936)	Entropy 0.55558 (0.55696)	Top-1 acc 69.922 (66.453)	Top-5 acc 88.281 (85.532)	lr 0.00224
Train [97][2580/3239]	Time 0.227 (0.535)	Data Time 0.001 (0.017)	Loss 2.9007 (2.3939)	Entropy 0.55578 (0.55695)	Top-1 acc 52.734 (66.445)	Top-5 acc 75.391 (85.526)	lr 0.00224
Train [97][2590/3239]	Time 0.283 (0.535)	Data Time 0.001 (0.017)	Loss 2.3566 (2.3939)	Entropy 0.55602 (0.55695)	Top-1 acc 69.141 (66.446)	Top-5 acc 86.328 (85.526)	lr 0.00224
Train [97][2600/3239]	Time 0.226 (0.535)	Data Time 0.001 (0.017)	Loss 2.4366 (2.3940)	Entropy 0.55567 (0.55695)	Top-1 acc 63.672 (66.442)	Top-5 acc 84.766 (85.524)	lr 0.00224
Train [97][2610/3239]	Time 0.230 (0.534)	Data Time 0.001 (0.017)	Loss 2.5592 (2.3940)	Entropy 0.55551 (0.55694)	Top-1 acc 58.984 (66.433)	Top-5 acc 82.031 (85.523)	lr 0.00223
Train [97][2620/3239]	Time 0.236 (0.534)	Data Time 0.001 (0.017)	Loss 2.3336 (2.3942)	Entropy 0.55547 (0.55694)	Top-1 acc 68.359 (66.431)	Top-5 acc 88.281 (85.522)	lr 0.00223
Train [97][2630/3239]	Time 0.259 (0.533)	Data Time 0.001 (0.017)	Loss 2.4413 (2.3943)	Entropy 0.55578 (0.55693)	Top-1 acc 66.406 (66.427)	Top-5 acc 86.719 (85.522)	lr 0.00223
Train [97][2640/3239]	Time 0.228 (0.533)	Data Time 0.001 (0.017)	Loss 2.1641 (2.3941)	Entropy 0.55608 (0.55693)	Top-1 acc 71.875 (66.430)	Top-5 acc 89.453 (85.525)	lr 0.00223
Train [97][2650/3239]	Time 0.228 (0.532)	Data Time 0.001 (0.017)	Loss 2.3156 (2.3941)	Entropy 0.55640 (0.55692)	Top-1 acc 65.234 (66.429)	Top-5 acc 87.500 (85.525)	lr 0.00223
Train [97][2660/3239]	Time 0.293 (0.532)	Data Time 0.001 (0.017)	Loss 2.3987 (2.3939)	Entropy 0.55656 (0.55692)	Top-1 acc 68.359 (66.432)	Top-5 acc 84.375 (85.527)	lr 0.00223
Train [97][2670/3239]	Time 0.274 (0.532)	Data Time 0.001 (0.017)	Loss 2.3413 (2.3940)	Entropy 0.55629 (0.55692)	Top-1 acc 66.016 (66.433)	Top-5 acc 87.109 (85.527)	lr 0.00223
Train [97][2680/3239]	Time 0.332 (0.551)	Data Time 0.004 (0.017)	Loss 2.5193 (2.3942)	Entropy 0.55609 (0.55692)	Top-1 acc 63.672 (66.429)	Top-5 acc 83.203 (85.522)	lr 0.00223
Train [97][2690/3239]	Time 0.228 (0.550)	Data Time 0.001 (0.017)	Loss 2.6971 (2.3942)	Entropy 0.55621 (0.55692)	Top-1 acc 58.203 (66.429)	Top-5 acc 80.469 (85.524)	lr 0.00223
Train [97][2700/3239]	Time 0.272 (0.550)	Data Time 0.001 (0.017)	Loss 2.2283 (2.3939)	Entropy 0.55627 (0.55691)	Top-1 acc 71.484 (66.433)	Top-5 acc 88.281 (85.530)	lr 0.00223
Train [97][2710/3239]	Time 0.259 (0.550)	Data Time 0.002 (0.017)	Loss 2.3387 (2.3939)	Entropy 0.55632 (0.55691)	Top-1 acc 66.016 (66.430)	Top-5 acc 85.938 (85.532)	lr 0.00223
Train [97][2720/3239]	Time 0.311 (0.550)	Data Time 0.002 (0.017)	Loss 2.4469 (2.3942)	Entropy 0.55601 (0.55691)	Top-1 acc 66.797 (66.425)	Top-5 acc 84.766 (85.529)	lr 0.00223
Train [97][2730/3239]	Time 0.336 (0.549)	Data Time 0.001 (0.017)	Loss 2.3147 (2.3940)	Entropy 0.55597 (0.55690)	Top-1 acc 66.797 (66.428)	Top-5 acc 87.891 (85.531)	lr 0.00223
Train [97][2740/3239]	Time 0.240 (0.549)	Data Time 0.001 (0.017)	Loss 2.3954 (2.3940)	Entropy 0.55575 (0.55690)	Top-1 acc 67.578 (66.429)	Top-5 acc 83.594 (85.530)	lr 0.00223
Train [97][2750/3239]	Time 0.310 (0.548)	Data Time 0.001 (0.017)	Loss 2.5026 (2.3942)	Entropy 0.55602 (0.55690)	Top-1 acc 67.188 (66.425)	Top-5 acc 81.641 (85.525)	lr 0.00223
Train [97][2760/3239]	Time 0.264 (0.548)	Data Time 0.002 (0.016)	Loss 2.3802 (2.3942)	Entropy 0.55643 (0.55689)	Top-1 acc 67.188 (66.425)	Top-5 acc 84.375 (85.524)	lr 0.00223
Train [97][2770/3239]	Time 0.277 (0.548)	Data Time 0.001 (0.016)	Loss 2.2053 (2.3941)	Entropy 0.55639 (0.55689)	Top-1 acc 73.438 (66.432)	Top-5 acc 87.891 (85.527)	lr 0.00223
Train [97][2780/3239]	Time 0.235 (0.547)	Data Time 0.001 (0.016)	Loss 2.6603 (2.3940)	Entropy 0.55622 (0.55689)	Top-1 acc 61.328 (66.433)	Top-5 acc 82.031 (85.530)	lr 0.00222
Train [97][2790/3239]	Time 0.257 (0.547)	Data Time 0.003 (0.016)	Loss 2.5124 (2.3941)	Entropy 0.55634 (0.55689)	Top-1 acc 64.062 (66.429)	Top-5 acc 84.375 (85.530)	lr 0.00222
Train [97][2800/3239]	Time 0.238 (0.547)	Data Time 0.001 (0.016)	Loss 2.2843 (2.3938)	Entropy 0.55626 (0.55689)	Top-1 acc 69.922 (66.434)	Top-5 acc 88.672 (85.536)	lr 0.00222
Train [97][2810/3239]	Time 0.238 (0.546)	Data Time 0.001 (0.016)	Loss 2.2445 (2.3937)	Entropy 0.55630 (0.55688)	Top-1 acc 69.141 (66.436)	Top-5 acc 89.844 (85.538)	lr 0.00222
Train [97][2820/3239]	Time 0.258 (0.546)	Data Time 0.002 (0.016)	Loss 2.4634 (2.3939)	Entropy 0.55665 (0.55688)	Top-1 acc 65.234 (66.435)	Top-5 acc 84.375 (85.538)	lr 0.00222
Train [97][2830/3239]	Time 0.230 (0.545)	Data Time 0.001 (0.016)	Loss 2.3391 (2.3939)	Entropy 0.55674 (0.55688)	Top-1 acc 66.406 (66.434)	Top-5 acc 86.328 (85.538)	lr 0.00222
Train [97][2840/3239]	Time 0.270 (0.545)	Data Time 0.001 (0.016)	Loss 2.3869 (2.3937)	Entropy 0.55666 (0.55688)	Top-1 acc 66.797 (66.440)	Top-5 acc 84.375 (85.542)	lr 0.00222
Train [97][2850/3239]	Time 0.221 (0.544)	Data Time 0.001 (0.016)	Loss 2.6044 (2.3939)	Entropy 0.55668 (0.55688)	Top-1 acc 62.109 (66.433)	Top-5 acc 82.031 (85.537)	lr 0.00222
Train [97][2860/3239]	Time 0.278 (0.544)	Data Time 0.001 (0.016)	Loss 2.5005 (2.3941)	Entropy 0.55645 (0.55688)	Top-1 acc 62.109 (66.426)	Top-5 acc 83.203 (85.536)	lr 0.00222
Train [97][2870/3239]	Time 0.230 (0.544)	Data Time 0.001 (0.016)	Loss 2.4033 (2.3940)	Entropy 0.55627 (0.55688)	Top-1 acc 66.406 (66.427)	Top-5 acc 85.547 (85.539)	lr 0.00222
Train [97][2880/3239]	Time 0.290 (0.543)	Data Time 0.001 (0.016)	Loss 2.5459 (2.3941)	Entropy 0.55623 (0.55688)	Top-1 acc 63.281 (66.421)	Top-5 acc 84.766 (85.536)	lr 0.00222
Train [97][2890/3239]	Time 0.329 (0.543)	Data Time 0.001 (0.016)	Loss 2.4820 (2.3941)	Entropy 0.55649 (0.55687)	Top-1 acc 62.109 (66.417)	Top-5 acc 83.203 (85.535)	lr 0.00222
Train [97][2900/3239]	Time 0.261 (0.542)	Data Time 0.002 (0.016)	Loss 2.7728 (2.3942)	Entropy 0.55656 (0.55687)	Top-1 acc 58.984 (66.413)	Top-5 acc 78.906 (85.534)	lr 0.00222
Train [97][2910/3239]	Time 0.230 (0.542)	Data Time 0.001 (0.016)	Loss 2.3603 (2.3945)	Entropy 0.55647 (0.55687)	Top-1 acc 64.844 (66.409)	Top-5 acc 88.672 (85.530)	lr 0.00222
Train [97][2920/3239]	Time 0.233 (0.542)	Data Time 0.001 (0.016)	Loss 2.2787 (2.3944)	Entropy 0.55609 (0.55687)	Top-1 acc 69.141 (66.411)	Top-5 acc 87.500 (85.530)	lr 0.00222
Train [97][2930/3239]	Time 0.231 (0.541)	Data Time 0.001 (0.016)	Loss 2.5099 (2.3944)	Entropy 0.55594 (0.55687)	Top-1 acc 64.062 (66.413)	Top-5 acc 83.203 (85.532)	lr 0.00222
Train [97][2940/3239]	Time 0.252 (0.541)	Data Time 0.002 (0.016)	Loss 2.3151 (2.3944)	Entropy 0.55608 (0.55686)	Top-1 acc 66.797 (66.414)	Top-5 acc 87.891 (85.528)	lr 0.00222
Train [97][2950/3239]	Time 0.261 (0.541)	Data Time 0.004 (0.016)	Loss 2.1880 (2.3946)	Entropy 0.55642 (0.55686)	Top-1 acc 70.312 (66.408)	Top-5 acc 88.281 (85.525)	lr 0.00222
Train [97][2960/3239]	Time 0.334 (0.540)	Data Time 0.001 (0.015)	Loss 2.4944 (2.3946)	Entropy 0.55647 (0.55686)	Top-1 acc 66.797 (66.411)	Top-5 acc 81.250 (85.523)	lr 0.00221
Train [97][2970/3239]	Time 0.275 (0.540)	Data Time 0.004 (0.015)	Loss 2.5154 (2.3945)	Entropy 0.55617 (0.55686)	Top-1 acc 62.891 (66.413)	Top-5 acc 84.375 (85.527)	lr 0.00221
Train [97][2980/3239]	Time 0.256 (0.540)	Data Time 0.001 (0.015)	Loss 2.4360 (2.3944)	Entropy 0.55640 (0.55686)	Top-1 acc 68.359 (66.418)	Top-5 acc 84.766 (85.526)	lr 0.00221
Train [97][2990/3239]	Time 0.236 (0.539)	Data Time 0.001 (0.015)	Loss 2.1736 (2.3945)	Entropy 0.55655 (0.55686)	Top-1 acc 69.531 (66.415)	Top-5 acc 91.016 (85.524)	lr 0.00221
Train [97][3000/3239]	Time 0.240 (0.539)	Data Time 0.001 (0.015)	Loss 2.3934 (2.3945)	Entropy 0.55680 (0.55686)	Top-1 acc 66.016 (66.413)	Top-5 acc 86.719 (85.521)	lr 0.00221
Train [97][3010/3239]	Time 0.222 (0.539)	Data Time 0.001 (0.015)	Loss 2.5182 (2.3947)	Entropy 0.55696 (0.55685)	Top-1 acc 60.938 (66.408)	Top-5 acc 84.766 (85.518)	lr 0.00221
Train [97][3020/3239]	Time 0.276 (0.538)	Data Time 0.002 (0.015)	Loss 2.3209 (2.3945)	Entropy 0.55673 (0.55686)	Top-1 acc 67.188 (66.411)	Top-5 acc 87.500 (85.521)	lr 0.00221
Train [97][3030/3239]	Time 0.263 (0.538)	Data Time 0.001 (0.015)	Loss 2.6222 (2.3946)	Entropy 0.55695 (0.55686)	Top-1 acc 59.375 (66.406)	Top-5 acc 80.078 (85.522)	lr 0.00221
Train [97][3040/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.015)	Loss 2.3445 (2.3945)	Entropy 0.55701 (0.55686)	Top-1 acc 67.188 (66.409)	Top-5 acc 86.719 (85.522)	lr 0.00221
Train [97][3050/3239]	Time 0.410 (0.537)	Data Time 0.005 (0.015)	Loss 2.2565 (2.3944)	Entropy 0.55713 (0.55686)	Top-1 acc 70.312 (66.414)	Top-5 acc 88.281 (85.526)	lr 0.00221
Train [97][3060/3239]	Time 0.238 (0.537)	Data Time 0.001 (0.015)	Loss 2.2696 (2.3942)	Entropy 0.55683 (0.55686)	Top-1 acc 71.094 (66.417)	Top-5 acc 87.500 (85.530)	lr 0.00221
Train [97][3070/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.015)	Loss 2.4597 (2.3942)	Entropy 0.55691 (0.55686)	Top-1 acc 64.844 (66.413)	Top-5 acc 85.156 (85.534)	lr 0.00221
Train [97][3080/3239]	Time 0.256 (0.536)	Data Time 0.002 (0.015)	Loss 2.4381 (2.3941)	Entropy 0.55701 (0.55686)	Top-1 acc 64.453 (66.417)	Top-5 acc 84.766 (85.536)	lr 0.00221
Train [97][3090/3239]	Time 0.244 (0.536)	Data Time 0.001 (0.015)	Loss 2.3982 (2.3940)	Entropy 0.55687 (0.55686)	Top-1 acc 68.359 (66.413)	Top-5 acc 85.938 (85.539)	lr 0.00221
Train [97][3100/3239]	Time 0.291 (0.535)	Data Time 0.001 (0.015)	Loss 2.5808 (2.3940)	Entropy 0.55696 (0.55686)	Top-1 acc 60.938 (66.410)	Top-5 acc 84.375 (85.541)	lr 0.00221
Train [97][3110/3239]	Time 0.276 (0.535)	Data Time 0.001 (0.015)	Loss 2.5123 (2.3939)	Entropy 0.55705 (0.55686)	Top-1 acc 65.625 (66.413)	Top-5 acc 84.766 (85.543)	lr 0.00221
Train [97][3120/3239]	Time 0.407 (0.535)	Data Time 0.002 (0.015)	Loss 2.2340 (2.3939)	Entropy 0.55717 (0.55686)	Top-1 acc 71.094 (66.412)	Top-5 acc 88.281 (85.544)	lr 0.00221
Train [97][3130/3239]	Time 0.234 (0.534)	Data Time 0.001 (0.015)	Loss 2.3456 (2.3938)	Entropy 0.55686 (0.55686)	Top-1 acc 64.844 (66.412)	Top-5 acc 89.844 (85.545)	lr 0.00220
Train [97][3140/3239]	Time 0.241 (0.534)	Data Time 0.001 (0.015)	Loss 2.3390 (2.3942)	Entropy 0.55633 (0.55686)	Top-1 acc 69.141 (66.407)	Top-5 acc 84.375 (85.537)	lr 0.00220
Train [97][3150/3239]	Time 0.244 (0.534)	Data Time 0.001 (0.015)	Loss 2.2109 (2.3941)	Entropy 0.55632 (0.55686)	Top-1 acc 67.969 (66.406)	Top-5 acc 89.453 (85.539)	lr 0.00220
Train [97][3160/3239]	Time 0.233 (0.533)	Data Time 0.001 (0.015)	Loss 2.5455 (2.3942)	Entropy 0.55631 (0.55686)	Top-1 acc 61.719 (66.403)	Top-5 acc 82.031 (85.537)	lr 0.00220
Train [97][3170/3239]	Time 0.258 (0.533)	Data Time 0.001 (0.015)	Loss 2.3913 (2.3943)	Entropy 0.55632 (0.55685)	Top-1 acc 67.578 (66.399)	Top-5 acc 85.547 (85.534)	lr 0.00220
Train [97][3180/3239]	Time 0.228 (0.532)	Data Time 0.000 (0.015)	Loss 2.5332 (2.3943)	Entropy 0.55560 (0.55685)	Top-1 acc 67.188 (66.400)	Top-5 acc 82.812 (85.533)	lr 0.00220
Train [97][3190/3239]	Time 0.226 (0.532)	Data Time 0.000 (0.014)	Loss 2.4294 (2.3941)	Entropy 0.55528 (0.55685)	Top-1 acc 66.016 (66.402)	Top-5 acc 85.156 (85.535)	lr 0.00220
Train [97][3200/3239]	Time 0.225 (0.532)	Data Time 0.000 (0.014)	Loss 2.6173 (2.3943)	Entropy 0.55519 (0.55684)	Top-1 acc 65.625 (66.400)	Top-5 acc 80.859 (85.532)	lr 0.00220
Train [97][3210/3239]	Time 0.317 (0.531)	Data Time 0.000 (0.014)	Loss 2.4325 (2.3943)	Entropy 0.55518 (0.55684)	Top-1 acc 65.234 (66.403)	Top-5 acc 83.594 (85.531)	lr 0.00220
Train [97][3220/3239]	Time 0.221 (0.531)	Data Time 0.000 (0.014)	Loss 2.3219 (2.3944)	Entropy 0.55553 (0.55683)	Top-1 acc 67.969 (66.403)	Top-5 acc 85.156 (85.528)	lr 0.00220
Train [97][3230/3239]	Time 0.220 (0.530)	Data Time 0.000 (0.014)	Loss 2.5245 (2.3944)	Entropy 0.55544 (0.55683)	Top-1 acc 60.547 (66.401)	Top-5 acc 85.938 (85.530)	lr 0.00220
Train [97][3239/3239]	Time 0.918 (0.530)	Data Time 0.000 (0.014)	Loss 3.0393 (2.3946)	Entropy 0.55527 (0.55682)	Top-1 acc 56.790 (66.397)	Top-5 acc 79.012 (85.527)	lr 0.00220
==========Valid [97/120]	loss 1.216	top-1 acc 72.110 (72.110)	top-5 acc 90.110	Train top-1 66.397	top-5 85.527	Entropy 0.55527	Latency-None: 0.000ms	Flops: 539.00M
Train [98][0/3239]	Time 37.727 (37.727)	Data Time 37.004 (37.004)	Loss 2.2235 (2.2235)	Entropy 0.55527 (0.55527)	Top-1 acc 67.969 (67.969)	Top-5 acc 88.672 (88.672)	lr 0.00220
Train [98][10/3239]	Time 0.347 (3.957)	Data Time 0.034 (3.376)	Loss 2.3323 (2.3649)	Entropy 0.55484 (0.55514)	Top-1 acc 70.703 (67.578)	Top-5 acc 86.719 (86.470)	lr 0.00220
Train [98][20/3239]	Time 0.260 (2.274)	Data Time 0.001 (1.769)	Loss 2.3176 (2.3545)	Entropy 0.55500 (0.55502)	Top-1 acc 64.844 (67.485)	Top-5 acc 85.156 (86.421)	lr 0.00220
Train [98][30/3239]	Time 0.233 (1.673)	Data Time 0.001 (1.199)	Loss 2.1891 (2.3679)	Entropy 0.55521 (0.55505)	Top-1 acc 71.484 (67.465)	Top-5 acc 90.234 (86.164)	lr 0.00220
Train [98][40/3239]	Time 0.243 (1.367)	Data Time 0.001 (0.907)	Loss 2.2566 (2.3696)	Entropy 0.55524 (0.55510)	Top-1 acc 67.188 (67.064)	Top-5 acc 90.234 (86.109)	lr 0.00220
Train [98][50/3239]	Time 0.232 (1.181)	Data Time 0.001 (0.729)	Loss 2.4549 (2.3763)	Entropy 0.55517 (0.55512)	Top-1 acc 67.188 (66.896)	Top-5 acc 84.766 (85.991)	lr 0.00220
Train [98][60/3239]	Time 0.228 (1.056)	Data Time 0.001 (0.610)	Loss 2.2894 (2.3677)	Entropy 0.55498 (0.55511)	Top-1 acc 69.531 (67.117)	Top-5 acc 88.281 (86.168)	lr 0.00219
Train [98][70/3239]	Time 0.269 (0.967)	Data Time 0.001 (0.524)	Loss 2.2825 (2.3583)	Entropy 0.55515 (0.55511)	Top-1 acc 66.406 (67.320)	Top-5 acc 86.328 (86.334)	lr 0.00219
Train [98][80/3239]	Time 0.236 (0.899)	Data Time 0.001 (0.460)	Loss 2.4686 (2.3671)	Entropy 0.55475 (0.55511)	Top-1 acc 64.062 (67.062)	Top-5 acc 83.984 (86.087)	lr 0.00219
Train [98][90/3239]	Time 0.406 (1.446)	Data Time 0.006 (0.410)	Loss 2.7305 (2.3766)	Entropy 0.55508 (0.55508)	Top-1 acc 56.641 (66.814)	Top-5 acc 81.250 (85.938)	lr 0.00219
Train [98][100/3239]	Time 0.223 (1.355)	Data Time 0.002 (0.370)	Loss 2.4284 (2.3775)	Entropy 0.55516 (0.55507)	Top-1 acc 64.453 (66.716)	Top-5 acc 84.375 (85.968)	lr 0.00219
Train [98][110/3239]	Time 0.336 (1.272)	Data Time 0.001 (0.337)	Loss 2.2889 (2.3766)	Entropy 0.55487 (0.55507)	Top-1 acc 70.312 (66.663)	Top-5 acc 87.500 (86.001)	lr 0.00219
Train [98][120/3239]	Time 0.239 (1.203)	Data Time 0.002 (0.309)	Loss 2.3178 (2.3741)	Entropy 0.55508 (0.55506)	Top-1 acc 68.359 (66.752)	Top-5 acc 87.891 (86.057)	lr 0.00219
Train [98][130/3239]	Time 0.221 (1.144)	Data Time 0.001 (0.286)	Loss 2.3631 (2.3732)	Entropy 0.55523 (0.55506)	Top-1 acc 69.141 (66.871)	Top-5 acc 86.328 (86.036)	lr 0.00219
Train [98][140/3239]	Time 0.234 (1.093)	Data Time 0.002 (0.266)	Loss 2.4252 (2.3711)	Entropy 0.55520 (0.55507)	Top-1 acc 65.625 (66.913)	Top-5 acc 82.422 (86.010)	lr 0.00219
Train [98][150/3239]	Time 0.232 (1.048)	Data Time 0.001 (0.248)	Loss 2.2852 (2.3730)	Entropy 0.55522 (0.55508)	Top-1 acc 69.531 (66.869)	Top-5 acc 89.453 (85.948)	lr 0.00219
Train [98][160/3239]	Time 0.265 (1.013)	Data Time 0.001 (0.233)	Loss 2.1579 (2.3709)	Entropy 0.55520 (0.55509)	Top-1 acc 75.391 (66.969)	Top-5 acc 90.234 (85.996)	lr 0.00219
Train [98][170/3239]	Time 0.241 (0.982)	Data Time 0.001 (0.219)	Loss 2.2443 (2.3699)	Entropy 0.55512 (0.55510)	Top-1 acc 68.750 (66.932)	Top-5 acc 86.328 (85.981)	lr 0.00219
Train [98][180/3239]	Time 0.236 (0.952)	Data Time 0.001 (0.207)	Loss 2.3567 (2.3730)	Entropy 0.55472 (0.55509)	Top-1 acc 67.969 (66.797)	Top-5 acc 83.203 (85.920)	lr 0.00219
Train [98][190/3239]	Time 0.233 (0.924)	Data Time 0.001 (0.196)	Loss 2.4183 (2.3703)	Entropy 0.55486 (0.55508)	Top-1 acc 65.234 (66.854)	Top-5 acc 84.375 (85.995)	lr 0.00219
Train [98][200/3239]	Time 0.262 (0.899)	Data Time 0.001 (0.187)	Loss 2.4053 (2.3708)	Entropy 0.55458 (0.55506)	Top-1 acc 66.406 (66.855)	Top-5 acc 83.594 (85.998)	lr 0.00219
Train [98][210/3239]	Time 0.237 (0.876)	Data Time 0.001 (0.178)	Loss 2.4088 (2.3718)	Entropy 0.55465 (0.55504)	Top-1 acc 64.062 (66.828)	Top-5 acc 83.594 (85.971)	lr 0.00219
Train [98][220/3239]	Time 0.226 (0.855)	Data Time 0.001 (0.170)	Loss 2.2678 (2.3699)	Entropy 0.55440 (0.55502)	Top-1 acc 67.969 (66.871)	Top-5 acc 88.672 (85.991)	lr 0.00219
Train [98][230/3239]	Time 0.258 (0.836)	Data Time 0.001 (0.163)	Loss 2.3756 (2.3698)	Entropy 0.55438 (0.55499)	Top-1 acc 64.062 (66.863)	Top-5 acc 85.156 (86.003)	lr 0.00219
Train [98][240/3239]	Time 0.236 (0.819)	Data Time 0.001 (0.156)	Loss 2.3747 (2.3688)	Entropy 0.55403 (0.55496)	Top-1 acc 65.234 (66.878)	Top-5 acc 87.500 (86.017)	lr 0.00218
Train [98][250/3239]	Time 0.248 (0.804)	Data Time 0.001 (0.150)	Loss 2.5943 (2.3695)	Entropy 0.55404 (0.55492)	Top-1 acc 62.109 (66.861)	Top-5 acc 83.203 (86.009)	lr 0.00218
Train [98][260/3239]	Time 0.255 (0.789)	Data Time 0.001 (0.144)	Loss 2.2625 (2.3670)	Entropy 0.55412 (0.55489)	Top-1 acc 71.094 (66.930)	Top-5 acc 86.328 (86.014)	lr 0.00218
Train [98][270/3239]	Time 0.325 (0.776)	Data Time 0.002 (0.139)	Loss 2.2649 (2.3686)	Entropy 0.55430 (0.55486)	Top-1 acc 67.188 (66.882)	Top-5 acc 85.938 (85.992)	lr 0.00218
Train [98][280/3239]	Time 0.274 (0.765)	Data Time 0.002 (0.134)	Loss 2.2912 (2.3695)	Entropy 0.55441 (0.55484)	Top-1 acc 67.578 (66.876)	Top-5 acc 87.109 (85.976)	lr 0.00218
Train [98][290/3239]	Time 0.218 (0.758)	Data Time 0.001 (0.130)	Loss 2.3463 (2.3697)	Entropy 0.55440 (0.55483)	Top-1 acc 63.281 (66.879)	Top-5 acc 86.719 (85.966)	lr 0.00218
Train [98][300/3239]	Time 0.260 (0.747)	Data Time 0.001 (0.125)	Loss 2.5089 (2.3699)	Entropy 0.55445 (0.55481)	Top-1 acc 66.797 (66.870)	Top-5 acc 82.031 (85.948)	lr 0.00218
Train [98][310/3239]	Time 0.231 (0.736)	Data Time 0.001 (0.121)	Loss 2.3312 (2.3696)	Entropy 0.55442 (0.55480)	Top-1 acc 67.578 (66.882)	Top-5 acc 85.156 (85.925)	lr 0.00218
Train [98][320/3239]	Time 0.238 (0.726)	Data Time 0.001 (0.118)	Loss 2.5007 (2.3715)	Entropy 0.55414 (0.55479)	Top-1 acc 63.281 (66.874)	Top-5 acc 84.375 (85.892)	lr 0.00218
Train [98][330/3239]	Time 0.300 (0.717)	Data Time 0.002 (0.114)	Loss 2.5739 (2.3718)	Entropy 0.55429 (0.55477)	Top-1 acc 61.719 (66.871)	Top-5 acc 80.859 (85.891)	lr 0.00218
Train [98][340/3239]	Time 0.454 (0.713)	Data Time 0.002 (0.111)	Loss 2.4369 (2.3700)	Entropy 0.55415 (0.55475)	Top-1 acc 66.016 (66.895)	Top-5 acc 85.156 (85.913)	lr 0.00218
Train [98][350/3239]	Time 0.326 (0.707)	Data Time 0.002 (0.108)	Loss 2.3163 (2.3711)	Entropy 0.55430 (0.55474)	Top-1 acc 67.969 (66.874)	Top-5 acc 88.281 (85.884)	lr 0.00218
Train [98][360/3239]	Time 0.227 (0.701)	Data Time 0.001 (0.105)	Loss 2.4637 (2.3720)	Entropy 0.55433 (0.55473)	Top-1 acc 63.672 (66.844)	Top-5 acc 81.641 (85.859)	lr 0.00218
Train [98][370/3239]	Time 0.235 (0.694)	Data Time 0.001 (0.102)	Loss 2.2614 (2.3703)	Entropy 0.55415 (0.55472)	Top-1 acc 73.438 (66.919)	Top-5 acc 90.234 (85.897)	lr 0.00218
Train [98][380/3239]	Time 0.232 (0.687)	Data Time 0.001 (0.099)	Loss 2.8398 (2.3714)	Entropy 0.55401 (0.55470)	Top-1 acc 58.203 (66.904)	Top-5 acc 75.781 (85.882)	lr 0.00218
Train [98][390/3239]	Time 0.225 (0.680)	Data Time 0.001 (0.097)	Loss 2.3385 (2.3707)	Entropy 0.55402 (0.55468)	Top-1 acc 64.844 (66.900)	Top-5 acc 87.109 (85.899)	lr 0.00218
Train [98][400/3239]	Time 0.232 (0.673)	Data Time 0.001 (0.094)	Loss 2.3094 (2.3704)	Entropy 0.55417 (0.55467)	Top-1 acc 69.141 (66.931)	Top-5 acc 88.672 (85.895)	lr 0.00218
Train [98][410/3239]	Time 0.235 (0.668)	Data Time 0.001 (0.092)	Loss 2.3751 (2.3715)	Entropy 0.55400 (0.55465)	Top-1 acc 66.406 (66.902)	Top-5 acc 84.375 (85.856)	lr 0.00218
Train [98][420/3239]	Time 0.255 (0.662)	Data Time 0.002 (0.090)	Loss 2.3491 (2.3716)	Entropy 0.55446 (0.55464)	Top-1 acc 67.188 (66.904)	Top-5 acc 84.766 (85.865)	lr 0.00217
Train [98][430/3239]	Time 0.336 (0.657)	Data Time 0.001 (0.088)	Loss 2.1642 (2.3721)	Entropy 0.55458 (0.55464)	Top-1 acc 71.484 (66.936)	Top-5 acc 91.016 (85.860)	lr 0.00217
Train [98][440/3239]	Time 0.227 (0.651)	Data Time 0.001 (0.086)	Loss 2.3488 (2.3726)	Entropy 0.55447 (0.55464)	Top-1 acc 65.234 (66.923)	Top-5 acc 87.109 (85.857)	lr 0.00217
Train [98][450/3239]	Time 0.229 (0.645)	Data Time 0.001 (0.084)	Loss 2.5759 (2.3723)	Entropy 0.55433 (0.55463)	Top-1 acc 64.453 (66.961)	Top-5 acc 81.641 (85.861)	lr 0.00217
Train [98][460/3239]	Time 0.256 (0.640)	Data Time 0.001 (0.082)	Loss 2.3375 (2.3717)	Entropy 0.55436 (0.55463)	Top-1 acc 67.188 (66.954)	Top-5 acc 86.719 (85.882)	lr 0.00217
Train [98][470/3239]	Time 0.221 (0.635)	Data Time 0.001 (0.081)	Loss 2.4253 (2.3711)	Entropy 0.55451 (0.55462)	Top-1 acc 68.359 (66.961)	Top-5 acc 84.375 (85.894)	lr 0.00217
Train [98][480/3239]	Time 0.232 (0.631)	Data Time 0.002 (0.079)	Loss 2.5190 (2.3711)	Entropy 0.55445 (0.55462)	Top-1 acc 65.234 (66.954)	Top-5 acc 82.812 (85.907)	lr 0.00217
Train [98][490/3239]	Time 0.228 (0.626)	Data Time 0.001 (0.077)	Loss 2.4247 (2.3702)	Entropy 0.55438 (0.55461)	Top-1 acc 65.234 (66.992)	Top-5 acc 85.547 (85.935)	lr 0.00217
Train [98][500/3239]	Time 0.333 (0.622)	Data Time 0.001 (0.076)	Loss 2.3000 (2.3708)	Entropy 0.55446 (0.55461)	Top-1 acc 69.531 (66.990)	Top-5 acc 86.719 (85.922)	lr 0.00217
Train [98][510/3239]	Time 0.223 (0.618)	Data Time 0.001 (0.074)	Loss 2.3977 (2.3717)	Entropy 0.55462 (0.55461)	Top-1 acc 66.016 (66.956)	Top-5 acc 83.984 (85.903)	lr 0.00217
Train [98][520/3239]	Time 0.239 (0.613)	Data Time 0.002 (0.073)	Loss 2.3349 (2.3714)	Entropy 0.55429 (0.55461)	Top-1 acc 69.141 (66.960)	Top-5 acc 84.375 (85.912)	lr 0.00217
Train [98][530/3239]	Time 0.220 (0.610)	Data Time 0.001 (0.072)	Loss 2.1236 (2.3713)	Entropy 0.55426 (0.55460)	Top-1 acc 71.484 (66.974)	Top-5 acc 91.797 (85.905)	lr 0.00217
Train [98][540/3239]	Time 0.254 (0.606)	Data Time 0.001 (0.070)	Loss 2.2338 (2.3709)	Entropy 0.55422 (0.55460)	Top-1 acc 71.484 (66.962)	Top-5 acc 87.891 (85.899)	lr 0.00217
Train [98][550/3239]	Time 0.227 (0.603)	Data Time 0.001 (0.069)	Loss 2.4651 (2.3730)	Entropy 0.55423 (0.55459)	Top-1 acc 67.969 (66.911)	Top-5 acc 83.984 (85.868)	lr 0.00217
Train [98][560/3239]	Time 0.225 (0.599)	Data Time 0.001 (0.068)	Loss 2.2684 (2.3720)	Entropy 0.55437 (0.55458)	Top-1 acc 70.312 (66.939)	Top-5 acc 86.719 (85.884)	lr 0.00217
Train [98][570/3239]	Time 0.216 (0.596)	Data Time 0.001 (0.067)	Loss 2.4564 (2.3730)	Entropy 0.55409 (0.55458)	Top-1 acc 61.719 (66.915)	Top-5 acc 84.375 (85.864)	lr 0.00217
Train [98][580/3239]	Time 0.231 (0.593)	Data Time 0.001 (0.066)	Loss 2.1995 (2.3724)	Entropy 0.55388 (0.55457)	Top-1 acc 72.266 (66.927)	Top-5 acc 89.453 (85.868)	lr 0.00217
Train [98][590/3239]	Time 0.250 (0.590)	Data Time 0.001 (0.065)	Loss 2.2546 (2.3732)	Entropy 0.55383 (0.55456)	Top-1 acc 71.484 (66.897)	Top-5 acc 87.891 (85.866)	lr 0.00216
Train [98][600/3239]	Time 0.217 (0.587)	Data Time 0.001 (0.063)	Loss 2.4787 (2.3738)	Entropy 0.55356 (0.55454)	Top-1 acc 64.062 (66.881)	Top-5 acc 82.422 (85.863)	lr 0.00216
Train [98][610/3239]	Time 0.261 (0.584)	Data Time 0.028 (0.063)	Loss 2.5881 (2.3752)	Entropy 0.55360 (0.55453)	Top-1 acc 63.281 (66.838)	Top-5 acc 82.422 (85.844)	lr 0.00216
Train [98][620/3239]	Time 0.243 (0.581)	Data Time 0.001 (0.062)	Loss 2.3553 (2.3757)	Entropy 0.55373 (0.55451)	Top-1 acc 66.406 (66.811)	Top-5 acc 86.328 (85.827)	lr 0.00216
Train [98][630/3239]	Time 0.255 (0.578)	Data Time 0.001 (0.061)	Loss 2.4234 (2.3751)	Entropy 0.55372 (0.55450)	Top-1 acc 62.891 (66.814)	Top-5 acc 82.031 (85.839)	lr 0.00216
Train [98][640/3239]	Time 0.225 (0.576)	Data Time 0.001 (0.060)	Loss 2.4441 (2.3762)	Entropy 0.55374 (0.55449)	Top-1 acc 67.578 (66.794)	Top-5 acc 85.156 (85.828)	lr 0.00216
Train [98][650/3239]	Time 0.220 (0.573)	Data Time 0.001 (0.059)	Loss 2.5095 (2.3766)	Entropy 0.55360 (0.55447)	Top-1 acc 63.281 (66.787)	Top-5 acc 82.422 (85.809)	lr 0.00216
Train [98][660/3239]	Time 0.307 (0.571)	Data Time 0.001 (0.058)	Loss 2.4500 (2.3772)	Entropy 0.55381 (0.55446)	Top-1 acc 66.016 (66.773)	Top-5 acc 85.938 (85.793)	lr 0.00216
Train [98][670/3239]	Time 0.220 (0.568)	Data Time 0.001 (0.057)	Loss 2.5242 (2.3776)	Entropy 0.55410 (0.55445)	Top-1 acc 62.109 (66.761)	Top-5 acc 83.984 (85.788)	lr 0.00216
Train [98][680/3239]	Time 0.237 (0.566)	Data Time 0.001 (0.056)	Loss 2.5222 (2.3776)	Entropy 0.55399 (0.55445)	Top-1 acc 60.938 (66.753)	Top-5 acc 81.250 (85.791)	lr 0.00216
Train [98][690/3239]	Time 0.245 (0.564)	Data Time 0.001 (0.055)	Loss 2.3253 (2.3770)	Entropy 0.55393 (0.55444)	Top-1 acc 65.625 (66.765)	Top-5 acc 88.672 (85.806)	lr 0.00216
Train [98][700/3239]	Time 0.230 (0.562)	Data Time 0.001 (0.055)	Loss 2.4771 (2.3777)	Entropy 0.55393 (0.55443)	Top-1 acc 62.109 (66.743)	Top-5 acc 85.156 (85.803)	lr 0.00216
Train [98][710/3239]	Time 0.238 (0.560)	Data Time 0.001 (0.054)	Loss 2.3323 (2.3789)	Entropy 0.55330 (0.55442)	Top-1 acc 69.141 (66.737)	Top-5 acc 87.500 (85.779)	lr 0.00216
Train [98][720/3239]	Time 0.318 (0.559)	Data Time 0.002 (0.053)	Loss 2.3848 (2.3803)	Entropy 0.55313 (0.55441)	Top-1 acc 66.797 (66.690)	Top-5 acc 86.719 (85.762)	lr 0.00216
Train [98][730/3239]	Time 0.321 (0.558)	Data Time 0.001 (0.053)	Loss 2.3329 (2.3806)	Entropy 0.55300 (0.55439)	Top-1 acc 66.797 (66.679)	Top-5 acc 86.719 (85.762)	lr 0.00216
Train [98][740/3239]	Time 0.232 (0.556)	Data Time 0.001 (0.052)	Loss 2.4482 (2.3802)	Entropy 0.55350 (0.55437)	Top-1 acc 64.453 (66.700)	Top-5 acc 82.812 (85.770)	lr 0.00216
Train [98][750/3239]	Time 0.248 (0.628)	Data Time 0.002 (0.051)	Loss 2.3403 (2.3804)	Entropy 0.55337 (0.55436)	Top-1 acc 67.969 (66.713)	Top-5 acc 86.719 (85.767)	lr 0.00216
Train [98][760/3239]	Time 0.233 (0.625)	Data Time 0.001 (0.051)	Loss 2.2452 (2.3801)	Entropy 0.55332 (0.55435)	Top-1 acc 69.141 (66.728)	Top-5 acc 87.109 (85.761)	lr 0.00216
Train [98][770/3239]	Time 0.239 (0.623)	Data Time 0.002 (0.050)	Loss 2.4853 (2.3807)	Entropy 0.55344 (0.55433)	Top-1 acc 64.844 (66.708)	Top-5 acc 86.328 (85.750)	lr 0.00215
Train [98][780/3239]	Time 0.256 (0.620)	Data Time 0.001 (0.049)	Loss 2.3187 (2.3805)	Entropy 0.55344 (0.55432)	Top-1 acc 65.234 (66.721)	Top-5 acc 87.891 (85.753)	lr 0.00215
Train [98][790/3239]	Time 0.223 (0.618)	Data Time 0.001 (0.049)	Loss 2.3252 (2.3808)	Entropy 0.55291 (0.55431)	Top-1 acc 69.531 (66.716)	Top-5 acc 88.281 (85.755)	lr 0.00215
Train [98][800/3239]	Time 0.232 (0.615)	Data Time 0.001 (0.048)	Loss 2.3675 (2.3808)	Entropy 0.55310 (0.55429)	Top-1 acc 66.797 (66.724)	Top-5 acc 85.156 (85.748)	lr 0.00215
Train [98][810/3239]	Time 0.227 (0.613)	Data Time 0.001 (0.048)	Loss 2.3997 (2.3813)	Entropy 0.55312 (0.55428)	Top-1 acc 66.797 (66.708)	Top-5 acc 85.547 (85.737)	lr 0.00215
Train [98][820/3239]	Time 0.351 (0.610)	Data Time 0.001 (0.047)	Loss 2.2845 (2.3805)	Entropy 0.55329 (0.55427)	Top-1 acc 67.578 (66.726)	Top-5 acc 86.328 (85.742)	lr 0.00215
Train [98][830/3239]	Time 0.226 (0.608)	Data Time 0.001 (0.046)	Loss 2.4740 (2.3813)	Entropy 0.55340 (0.55425)	Top-1 acc 63.672 (66.700)	Top-5 acc 85.938 (85.727)	lr 0.00215
Train [98][840/3239]	Time 0.234 (0.606)	Data Time 0.001 (0.046)	Loss 2.2487 (2.3809)	Entropy 0.55325 (0.55424)	Top-1 acc 68.359 (66.710)	Top-5 acc 86.328 (85.723)	lr 0.00215
Train [98][850/3239]	Time 0.235 (0.603)	Data Time 0.001 (0.045)	Loss 2.2490 (2.3808)	Entropy 0.55285 (0.55423)	Top-1 acc 72.656 (66.716)	Top-5 acc 88.281 (85.730)	lr 0.00215
Train [98][860/3239]	Time 0.244 (0.601)	Data Time 0.001 (0.045)	Loss 2.1526 (2.3805)	Entropy 0.55285 (0.55422)	Top-1 acc 72.656 (66.721)	Top-5 acc 89.844 (85.737)	lr 0.00215
Train [98][870/3239]	Time 0.232 (0.599)	Data Time 0.001 (0.044)	Loss 2.4072 (2.3808)	Entropy 0.55285 (0.55420)	Top-1 acc 66.797 (66.717)	Top-5 acc 86.719 (85.729)	lr 0.00215
Train [98][880/3239]	Time 0.228 (0.597)	Data Time 0.001 (0.044)	Loss 2.2839 (2.3809)	Entropy 0.55262 (0.55418)	Top-1 acc 68.359 (66.712)	Top-5 acc 89.453 (85.729)	lr 0.00215
Train [98][890/3239]	Time 0.325 (0.595)	Data Time 0.001 (0.043)	Loss 2.5316 (2.3804)	Entropy 0.55256 (0.55417)	Top-1 acc 65.625 (66.722)	Top-5 acc 81.250 (85.731)	lr 0.00215
Train [98][900/3239]	Time 0.314 (0.593)	Data Time 0.003 (0.043)	Loss 2.5472 (2.3807)	Entropy 0.55233 (0.55415)	Top-1 acc 65.625 (66.717)	Top-5 acc 83.984 (85.729)	lr 0.00215
Train [98][910/3239]	Time 0.268 (0.593)	Data Time 0.001 (0.042)	Loss 2.3129 (2.3803)	Entropy 0.55253 (0.55413)	Top-1 acc 72.266 (66.728)	Top-5 acc 87.500 (85.745)	lr 0.00215
Train [98][920/3239]	Time 0.227 (0.591)	Data Time 0.001 (0.042)	Loss 2.2483 (2.3799)	Entropy 0.55251 (0.55411)	Top-1 acc 68.359 (66.731)	Top-5 acc 89.062 (85.752)	lr 0.00215
Train [98][930/3239]	Time 0.223 (0.589)	Data Time 0.001 (0.042)	Loss 2.6854 (2.3804)	Entropy 0.55267 (0.55409)	Top-1 acc 61.328 (66.730)	Top-5 acc 79.688 (85.737)	lr 0.00215
Train [98][940/3239]	Time 0.228 (0.588)	Data Time 0.001 (0.041)	Loss 2.3507 (2.3817)	Entropy 0.55283 (0.55408)	Top-1 acc 70.312 (66.704)	Top-5 acc 85.547 (85.724)	lr 0.00214
Train [98][950/3239]	Time 0.226 (0.586)	Data Time 0.001 (0.041)	Loss 2.3786 (2.3824)	Entropy 0.55272 (0.55407)	Top-1 acc 67.969 (66.687)	Top-5 acc 84.375 (85.708)	lr 0.00214
Train [98][960/3239]	Time 0.220 (0.584)	Data Time 0.001 (0.040)	Loss 2.5225 (2.3819)	Entropy 0.55271 (0.55405)	Top-1 acc 60.547 (66.689)	Top-5 acc 86.719 (85.722)	lr 0.00214
Train [98][970/3239]	Time 0.228 (0.583)	Data Time 0.001 (0.040)	Loss 2.2808 (2.3818)	Entropy 0.55226 (0.55404)	Top-1 acc 72.266 (66.698)	Top-5 acc 88.672 (85.722)	lr 0.00214
Train [98][980/3239]	Time 0.324 (0.581)	Data Time 0.001 (0.040)	Loss 2.5643 (2.3818)	Entropy 0.55205 (0.55402)	Top-1 acc 60.547 (66.699)	Top-5 acc 82.812 (85.719)	lr 0.00214
Train [98][990/3239]	Time 0.226 (0.579)	Data Time 0.001 (0.039)	Loss 2.5550 (2.3821)	Entropy 0.55198 (0.55400)	Top-1 acc 62.500 (66.696)	Top-5 acc 83.203 (85.716)	lr 0.00214
Train [98][1000/3239]	Time 0.259 (0.578)	Data Time 0.001 (0.039)	Loss 2.3322 (2.3815)	Entropy 0.55198 (0.55398)	Top-1 acc 67.969 (66.708)	Top-5 acc 89.453 (85.728)	lr 0.00214
Train [98][1010/3239]	Time 0.226 (0.576)	Data Time 0.001 (0.038)	Loss 2.3202 (2.3808)	Entropy 0.55171 (0.55396)	Top-1 acc 69.922 (66.727)	Top-5 acc 89.844 (85.747)	lr 0.00214
Train [98][1020/3239]	Time 0.228 (0.575)	Data Time 0.001 (0.038)	Loss 2.8250 (2.3816)	Entropy 0.55191 (0.55393)	Top-1 acc 55.469 (66.708)	Top-5 acc 81.250 (85.738)	lr 0.00214
Train [98][1030/3239]	Time 0.237 (0.573)	Data Time 0.001 (0.038)	Loss 2.4676 (2.3818)	Entropy 0.55179 (0.55392)	Top-1 acc 62.500 (66.693)	Top-5 acc 84.375 (85.732)	lr 0.00214
Train [98][1040/3239]	Time 0.238 (0.572)	Data Time 0.001 (0.037)	Loss 2.5146 (2.3817)	Entropy 0.55198 (0.55390)	Top-1 acc 65.625 (66.699)	Top-5 acc 83.203 (85.734)	lr 0.00214
Train [98][1050/3239]	Time 0.360 (0.571)	Data Time 0.001 (0.037)	Loss 2.3528 (2.3825)	Entropy 0.55241 (0.55388)	Top-1 acc 69.531 (66.686)	Top-5 acc 86.719 (85.719)	lr 0.00214
Train [98][1060/3239]	Time 0.231 (0.569)	Data Time 0.001 (0.037)	Loss 2.4809 (2.3832)	Entropy 0.55246 (0.55387)	Top-1 acc 65.234 (66.672)	Top-5 acc 83.984 (85.704)	lr 0.00214
Train [98][1070/3239]	Time 0.233 (0.568)	Data Time 0.002 (0.036)	Loss 2.3140 (2.3831)	Entropy 0.55257 (0.55385)	Top-1 acc 68.359 (66.677)	Top-5 acc 86.328 (85.705)	lr 0.00214
Train [98][1080/3239]	Time 0.230 (0.567)	Data Time 0.001 (0.036)	Loss 2.1968 (2.3835)	Entropy 0.55264 (0.55384)	Top-1 acc 69.141 (66.662)	Top-5 acc 89.062 (85.704)	lr 0.00214
Train [98][1090/3239]	Time 0.258 (0.565)	Data Time 0.001 (0.036)	Loss 2.5020 (2.3842)	Entropy 0.55280 (0.55383)	Top-1 acc 62.891 (66.638)	Top-5 acc 82.812 (85.690)	lr 0.00214
Train [98][1100/3239]	Time 0.222 (0.564)	Data Time 0.001 (0.035)	Loss 2.3259 (2.3839)	Entropy 0.55253 (0.55382)	Top-1 acc 67.188 (66.640)	Top-5 acc 88.281 (85.698)	lr 0.00214
Train [98][1110/3239]	Time 0.231 (0.562)	Data Time 0.001 (0.035)	Loss 2.3333 (2.3838)	Entropy 0.55253 (0.55381)	Top-1 acc 66.016 (66.642)	Top-5 acc 88.281 (85.705)	lr 0.00214
Train [98][1120/3239]	Time 0.219 (0.561)	Data Time 0.001 (0.035)	Loss 2.3059 (2.3839)	Entropy 0.55290 (0.55380)	Top-1 acc 67.578 (66.643)	Top-5 acc 85.547 (85.694)	lr 0.00213
Train [98][1130/3239]	Time 0.239 (0.560)	Data Time 0.001 (0.034)	Loss 2.5564 (2.3841)	Entropy 0.55282 (0.55379)	Top-1 acc 63.281 (66.639)	Top-5 acc 81.250 (85.693)	lr 0.00213
Train [98][1140/3239]	Time 0.323 (0.559)	Data Time 0.001 (0.034)	Loss 2.3501 (2.3841)	Entropy 0.55286 (0.55378)	Top-1 acc 67.578 (66.642)	Top-5 acc 87.109 (85.692)	lr 0.00213
Train [98][1150/3239]	Time 0.228 (0.557)	Data Time 0.001 (0.034)	Loss 2.2606 (2.3841)	Entropy 0.55316 (0.55377)	Top-1 acc 68.750 (66.634)	Top-5 acc 87.891 (85.698)	lr 0.00213
Train [98][1160/3239]	Time 0.223 (0.556)	Data Time 0.001 (0.034)	Loss 2.3527 (2.3842)	Entropy 0.55322 (0.55377)	Top-1 acc 67.188 (66.626)	Top-5 acc 85.547 (85.691)	lr 0.00213
Train [98][1170/3239]	Time 0.221 (0.555)	Data Time 0.001 (0.033)	Loss 2.4197 (2.3843)	Entropy 0.55329 (0.55376)	Top-1 acc 66.016 (66.624)	Top-5 acc 85.938 (85.689)	lr 0.00213
Train [98][1180/3239]	Time 0.256 (0.553)	Data Time 0.001 (0.033)	Loss 2.4877 (2.3843)	Entropy 0.55367 (0.55376)	Top-1 acc 62.891 (66.627)	Top-5 acc 84.766 (85.691)	lr 0.00213
Train [98][1190/3239]	Time 0.232 (0.552)	Data Time 0.001 (0.033)	Loss 2.2691 (2.3834)	Entropy 0.55344 (0.55376)	Top-1 acc 68.359 (66.644)	Top-5 acc 88.672 (85.709)	lr 0.00213
Train [98][1200/3239]	Time 0.224 (0.551)	Data Time 0.001 (0.033)	Loss 2.6558 (2.3838)	Entropy 0.55307 (0.55376)	Top-1 acc 58.984 (66.630)	Top-5 acc 80.078 (85.702)	lr 0.00213
Train [98][1210/3239]	Time 0.319 (0.550)	Data Time 0.001 (0.032)	Loss 2.3074 (2.3837)	Entropy 0.55307 (0.55375)	Top-1 acc 68.359 (66.631)	Top-5 acc 85.547 (85.699)	lr 0.00213
Train [98][1220/3239]	Time 0.323 (0.549)	Data Time 0.001 (0.032)	Loss 2.3879 (2.3837)	Entropy 0.55294 (0.55374)	Top-1 acc 64.453 (66.631)	Top-5 acc 85.547 (85.699)	lr 0.00213
Train [98][1230/3239]	Time 0.246 (0.549)	Data Time 0.027 (0.032)	Loss 2.3248 (2.3836)	Entropy 0.55314 (0.55374)	Top-1 acc 65.234 (66.633)	Top-5 acc 85.547 (85.697)	lr 0.00213
Train [98][1240/3239]	Time 0.223 (0.548)	Data Time 0.001 (0.032)	Loss 2.4311 (2.3841)	Entropy 0.55313 (0.55373)	Top-1 acc 67.188 (66.628)	Top-5 acc 85.938 (85.688)	lr 0.00213
Train [98][1250/3239]	Time 0.227 (0.547)	Data Time 0.001 (0.031)	Loss 2.3157 (2.3844)	Entropy 0.55334 (0.55373)	Top-1 acc 67.969 (66.617)	Top-5 acc 85.156 (85.676)	lr 0.00213
Train [98][1260/3239]	Time 0.217 (0.546)	Data Time 0.001 (0.031)	Loss 2.4812 (2.3841)	Entropy 0.55374 (0.55373)	Top-1 acc 60.547 (66.618)	Top-5 acc 82.031 (85.679)	lr 0.00213
Train [98][1270/3239]	Time 0.247 (0.545)	Data Time 0.002 (0.031)	Loss 2.3744 (2.3840)	Entropy 0.55339 (0.55373)	Top-1 acc 65.234 (66.620)	Top-5 acc 86.328 (85.686)	lr 0.00213
Train [98][1280/3239]	Time 0.228 (0.544)	Data Time 0.001 (0.031)	Loss 2.3637 (2.3843)	Entropy 0.55319 (0.55372)	Top-1 acc 65.625 (66.608)	Top-5 acc 85.547 (85.681)	lr 0.00213
Train [98][1290/3239]	Time 0.223 (0.543)	Data Time 0.001 (0.030)	Loss 2.6279 (2.3847)	Entropy 0.55236 (0.55372)	Top-1 acc 59.375 (66.596)	Top-5 acc 80.078 (85.672)	lr 0.00213
Train [98][1300/3239]	Time 0.219 (0.542)	Data Time 0.001 (0.030)	Loss 2.3122 (2.3843)	Entropy 0.55251 (0.55371)	Top-1 acc 71.484 (66.609)	Top-5 acc 87.109 (85.684)	lr 0.00212
Train [98][1310/3239]	Time 0.221 (0.541)	Data Time 0.001 (0.030)	Loss 2.4002 (2.3842)	Entropy 0.55252 (0.55370)	Top-1 acc 64.844 (66.609)	Top-5 acc 85.156 (85.682)	lr 0.00212
Train [98][1320/3239]	Time 0.231 (0.540)	Data Time 0.001 (0.030)	Loss 2.5198 (2.3851)	Entropy 0.55230 (0.55369)	Top-1 acc 65.234 (66.587)	Top-5 acc 83.203 (85.669)	lr 0.00212
Train [98][1330/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.030)	Loss 2.7086 (2.3850)	Entropy 0.55267 (0.55368)	Top-1 acc 62.109 (66.591)	Top-5 acc 80.078 (85.673)	lr 0.00212
Train [98][1340/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.029)	Loss 2.3295 (2.3851)	Entropy 0.55278 (0.55367)	Top-1 acc 66.016 (66.587)	Top-5 acc 87.109 (85.676)	lr 0.00212
Train [98][1350/3239]	Time 0.228 (0.537)	Data Time 0.001 (0.029)	Loss 2.2694 (2.3848)	Entropy 0.55266 (0.55367)	Top-1 acc 69.141 (66.592)	Top-5 acc 88.281 (85.684)	lr 0.00212
Train [98][1360/3239]	Time 0.228 (0.536)	Data Time 0.001 (0.029)	Loss 2.1955 (2.3845)	Entropy 0.55257 (0.55366)	Top-1 acc 67.969 (66.605)	Top-5 acc 90.625 (85.689)	lr 0.00212
Train [98][1370/3239]	Time 0.322 (0.535)	Data Time 0.001 (0.029)	Loss 2.5221 (2.3853)	Entropy 0.55228 (0.55365)	Top-1 acc 66.016 (66.591)	Top-5 acc 83.203 (85.678)	lr 0.00212
Train [98][1380/3239]	Time 0.231 (0.534)	Data Time 0.001 (0.029)	Loss 2.3605 (2.3853)	Entropy 0.55214 (0.55364)	Top-1 acc 68.750 (66.592)	Top-5 acc 85.938 (85.677)	lr 0.00212
Train [98][1390/3239]	Time 0.217 (0.533)	Data Time 0.001 (0.028)	Loss 2.7012 (2.3851)	Entropy 0.55210 (0.55363)	Top-1 acc 57.812 (66.601)	Top-5 acc 80.859 (85.683)	lr 0.00212
Train [98][1400/3239]	Time 0.322 (0.571)	Data Time 0.038 (0.028)	Loss 2.3677 (2.3848)	Entropy 0.55183 (0.55362)	Top-1 acc 67.578 (66.604)	Top-5 acc 87.500 (85.687)	lr 0.00212
Train [98][1410/3239]	Time 0.294 (0.571)	Data Time 0.002 (0.028)	Loss 2.4394 (2.3849)	Entropy 0.55174 (0.55360)	Top-1 acc 65.234 (66.605)	Top-5 acc 84.375 (85.683)	lr 0.00212
Train [98][1420/3239]	Time 0.246 (0.571)	Data Time 0.001 (0.028)	Loss 2.2189 (2.3848)	Entropy 0.55176 (0.55359)	Top-1 acc 69.531 (66.600)	Top-5 acc 88.672 (85.685)	lr 0.00212
Train [98][1430/3239]	Time 0.236 (0.570)	Data Time 0.001 (0.028)	Loss 2.3570 (2.3850)	Entropy 0.55186 (0.55358)	Top-1 acc 66.016 (66.592)	Top-5 acc 85.547 (85.681)	lr 0.00212
Train [98][1440/3239]	Time 0.232 (0.569)	Data Time 0.001 (0.028)	Loss 2.3883 (2.3853)	Entropy 0.55192 (0.55357)	Top-1 acc 65.234 (66.584)	Top-5 acc 85.547 (85.672)	lr 0.00212
Train [98][1450/3239]	Time 0.240 (0.568)	Data Time 0.002 (0.027)	Loss 2.5185 (2.3853)	Entropy 0.55123 (0.55355)	Top-1 acc 61.328 (66.585)	Top-5 acc 83.594 (85.674)	lr 0.00212
Train [98][1460/3239]	Time 0.227 (0.567)	Data Time 0.001 (0.027)	Loss 2.6750 (2.3851)	Entropy 0.55107 (0.55354)	Top-1 acc 60.547 (66.588)	Top-5 acc 80.078 (85.681)	lr 0.00212
Train [98][1470/3239]	Time 0.232 (0.566)	Data Time 0.001 (0.027)	Loss 2.3084 (2.3850)	Entropy 0.55096 (0.55352)	Top-1 acc 67.578 (66.595)	Top-5 acc 85.938 (85.683)	lr 0.00212
Train [98][1480/3239]	Time 0.228 (0.565)	Data Time 0.001 (0.027)	Loss 2.4456 (2.3851)	Entropy 0.55093 (0.55350)	Top-1 acc 66.016 (66.591)	Top-5 acc 83.594 (85.687)	lr 0.00211
Train [98][1490/3239]	Time 0.255 (0.564)	Data Time 0.024 (0.027)	Loss 2.7129 (2.3854)	Entropy 0.55065 (0.55348)	Top-1 acc 56.641 (66.583)	Top-5 acc 78.125 (85.681)	lr 0.00211
Train [98][1500/3239]	Time 0.230 (0.563)	Data Time 0.001 (0.026)	Loss 2.6960 (2.3860)	Entropy 0.55102 (0.55347)	Top-1 acc 60.938 (66.567)	Top-5 acc 82.031 (85.671)	lr 0.00211
Train [98][1510/3239]	Time 0.236 (0.563)	Data Time 0.001 (0.026)	Loss 2.4331 (2.3862)	Entropy 0.55050 (0.55345)	Top-1 acc 66.406 (66.566)	Top-5 acc 84.375 (85.668)	lr 0.00211
Train [98][1520/3239]	Time 0.228 (0.562)	Data Time 0.001 (0.026)	Loss 2.2367 (2.3858)	Entropy 0.55050 (0.55343)	Top-1 acc 67.969 (66.569)	Top-5 acc 87.891 (85.677)	lr 0.00211
Train [98][1530/3239]	Time 0.345 (0.561)	Data Time 0.002 (0.026)	Loss 2.3697 (2.3859)	Entropy 0.55066 (0.55341)	Top-1 acc 67.578 (66.573)	Top-5 acc 85.938 (85.682)	lr 0.00211
Train [98][1540/3239]	Time 0.267 (0.560)	Data Time 0.001 (0.026)	Loss 2.2667 (2.3856)	Entropy 0.55035 (0.55339)	Top-1 acc 65.625 (66.579)	Top-5 acc 86.719 (85.686)	lr 0.00211
Train [98][1550/3239]	Time 0.230 (0.559)	Data Time 0.001 (0.026)	Loss 2.3416 (2.3854)	Entropy 0.55047 (0.55337)	Top-1 acc 67.969 (66.587)	Top-5 acc 86.719 (85.692)	lr 0.00211
Train [98][1560/3239]	Time 0.223 (0.558)	Data Time 0.001 (0.026)	Loss 2.4182 (2.3856)	Entropy 0.55047 (0.55336)	Top-1 acc 63.672 (66.579)	Top-5 acc 87.500 (85.690)	lr 0.00211
Train [98][1570/3239]	Time 0.234 (0.557)	Data Time 0.001 (0.025)	Loss 2.2237 (2.3853)	Entropy 0.55075 (0.55334)	Top-1 acc 69.531 (66.577)	Top-5 acc 89.844 (85.699)	lr 0.00211
Train [98][1580/3239]	Time 0.229 (0.556)	Data Time 0.001 (0.025)	Loss 2.2806 (2.3855)	Entropy 0.55085 (0.55332)	Top-1 acc 70.703 (66.581)	Top-5 acc 87.109 (85.696)	lr 0.00211
Train [98][1590/3239]	Time 0.266 (0.555)	Data Time 0.001 (0.025)	Loss 2.3303 (2.3856)	Entropy 0.55094 (0.55331)	Top-1 acc 66.016 (66.579)	Top-5 acc 88.281 (85.700)	lr 0.00211
Train [98][1600/3239]	Time 0.351 (0.555)	Data Time 0.001 (0.025)	Loss 2.3389 (2.3856)	Entropy 0.55066 (0.55329)	Top-1 acc 69.922 (66.584)	Top-5 acc 85.547 (85.696)	lr 0.00211
Train [98][1610/3239]	Time 0.233 (0.554)	Data Time 0.001 (0.025)	Loss 2.4423 (2.3854)	Entropy 0.55090 (0.55327)	Top-1 acc 65.234 (66.591)	Top-5 acc 84.766 (85.700)	lr 0.00211
Train [98][1620/3239]	Time 0.232 (0.553)	Data Time 0.001 (0.025)	Loss 2.3780 (2.3853)	Entropy 0.55092 (0.55326)	Top-1 acc 66.016 (66.596)	Top-5 acc 84.375 (85.706)	lr 0.00211
Train [98][1630/3239]	Time 0.231 (0.552)	Data Time 0.001 (0.025)	Loss 2.4855 (2.3857)	Entropy 0.55076 (0.55325)	Top-1 acc 66.797 (66.592)	Top-5 acc 80.469 (85.699)	lr 0.00211
Train [98][1640/3239]	Time 0.237 (0.551)	Data Time 0.001 (0.024)	Loss 2.3591 (2.3860)	Entropy 0.55083 (0.55323)	Top-1 acc 69.531 (66.589)	Top-5 acc 83.203 (85.693)	lr 0.00211
Train [98][1650/3239]	Time 0.227 (0.551)	Data Time 0.001 (0.024)	Loss 2.6370 (2.3860)	Entropy 0.55113 (0.55322)	Top-1 acc 60.156 (66.590)	Top-5 acc 83.594 (85.695)	lr 0.00210
Train [98][1660/3239]	Time 0.227 (0.550)	Data Time 0.001 (0.024)	Loss 2.4501 (2.3859)	Entropy 0.55136 (0.55320)	Top-1 acc 66.016 (66.597)	Top-5 acc 83.594 (85.699)	lr 0.00210
Train [98][1670/3239]	Time 0.225 (0.549)	Data Time 0.001 (0.024)	Loss 2.3736 (2.3862)	Entropy 0.55157 (0.55319)	Top-1 acc 66.797 (66.586)	Top-5 acc 86.719 (85.697)	lr 0.00210
Train [98][1680/3239]	Time 0.227 (0.548)	Data Time 0.001 (0.024)	Loss 2.4231 (2.3862)	Entropy 0.55185 (0.55318)	Top-1 acc 65.625 (66.582)	Top-5 acc 83.984 (85.697)	lr 0.00210
Train [98][1690/3239]	Time 0.341 (0.548)	Data Time 0.001 (0.024)	Loss 2.3693 (2.3861)	Entropy 0.55171 (0.55318)	Top-1 acc 66.016 (66.591)	Top-5 acc 83.984 (85.697)	lr 0.00210
Train [98][1700/3239]	Time 0.227 (0.547)	Data Time 0.001 (0.024)	Loss 2.4147 (2.3861)	Entropy 0.55190 (0.55317)	Top-1 acc 69.141 (66.596)	Top-5 acc 87.891 (85.698)	lr 0.00210
Train [98][1710/3239]	Time 0.252 (0.546)	Data Time 0.002 (0.023)	Loss 2.5287 (2.3863)	Entropy 0.55172 (0.55316)	Top-1 acc 61.328 (66.591)	Top-5 acc 82.031 (85.691)	lr 0.00210
Train [98][1720/3239]	Time 0.286 (0.546)	Data Time 0.001 (0.023)	Loss 2.3792 (2.3863)	Entropy 0.55156 (0.55315)	Top-1 acc 66.797 (66.593)	Top-5 acc 87.109 (85.687)	lr 0.00210
Train [98][1730/3239]	Time 0.340 (0.546)	Data Time 0.003 (0.023)	Loss 2.3893 (2.3867)	Entropy 0.55180 (0.55314)	Top-1 acc 69.922 (66.586)	Top-5 acc 85.547 (85.680)	lr 0.00210
Train [98][1740/3239]	Time 0.232 (0.545)	Data Time 0.001 (0.023)	Loss 2.4110 (2.3873)	Entropy 0.55193 (0.55313)	Top-1 acc 64.844 (66.569)	Top-5 acc 84.766 (85.669)	lr 0.00210
Train [98][1750/3239]	Time 0.241 (0.545)	Data Time 0.001 (0.023)	Loss 2.2922 (2.3874)	Entropy 0.55208 (0.55313)	Top-1 acc 70.312 (66.570)	Top-5 acc 85.547 (85.666)	lr 0.00210
Train [98][1760/3239]	Time 0.323 (0.544)	Data Time 0.001 (0.023)	Loss 2.2024 (2.3872)	Entropy 0.55235 (0.55312)	Top-1 acc 71.484 (66.575)	Top-5 acc 90.234 (85.670)	lr 0.00210
Train [98][1770/3239]	Time 0.258 (0.543)	Data Time 0.001 (0.023)	Loss 2.5010 (2.3873)	Entropy 0.55237 (0.55312)	Top-1 acc 64.062 (66.570)	Top-5 acc 84.375 (85.670)	lr 0.00210
Train [98][1780/3239]	Time 0.222 (0.543)	Data Time 0.001 (0.023)	Loss 2.6553 (2.3877)	Entropy 0.55237 (0.55311)	Top-1 acc 60.156 (66.556)	Top-5 acc 82.031 (85.663)	lr 0.00210
Train [98][1790/3239]	Time 0.232 (0.542)	Data Time 0.001 (0.022)	Loss 2.1872 (2.3875)	Entropy 0.55217 (0.55311)	Top-1 acc 69.141 (66.559)	Top-5 acc 90.625 (85.666)	lr 0.00210
Train [98][1800/3239]	Time 0.232 (0.541)	Data Time 0.001 (0.022)	Loss 2.4718 (2.3874)	Entropy 0.55216 (0.55311)	Top-1 acc 66.406 (66.559)	Top-5 acc 82.422 (85.664)	lr 0.00210
Train [98][1810/3239]	Time 0.262 (0.541)	Data Time 0.001 (0.022)	Loss 2.3234 (2.3873)	Entropy 0.55213 (0.55310)	Top-1 acc 64.453 (66.560)	Top-5 acc 85.156 (85.664)	lr 0.00210
Train [98][1820/3239]	Time 0.225 (0.540)	Data Time 0.001 (0.022)	Loss 2.2156 (2.3870)	Entropy 0.55162 (0.55309)	Top-1 acc 69.531 (66.565)	Top-5 acc 89.453 (85.668)	lr 0.00210
Train [98][1830/3239]	Time 0.259 (0.540)	Data Time 0.001 (0.022)	Loss 2.5830 (2.3871)	Entropy 0.55169 (0.55309)	Top-1 acc 62.500 (66.559)	Top-5 acc 80.469 (85.670)	lr 0.00209
Train [98][1840/3239]	Time 0.262 (0.539)	Data Time 0.001 (0.022)	Loss 2.5269 (2.3875)	Entropy 0.55129 (0.55308)	Top-1 acc 62.891 (66.555)	Top-5 acc 85.156 (85.667)	lr 0.00209
Train [98][1850/3239]	Time 0.293 (0.539)	Data Time 0.001 (0.022)	Loss 2.5837 (2.3876)	Entropy 0.55084 (0.55307)	Top-1 acc 63.281 (66.559)	Top-5 acc 80.469 (85.660)	lr 0.00209
Train [98][1860/3239]	Time 0.244 (0.538)	Data Time 0.001 (0.022)	Loss 2.4254 (2.3876)	Entropy 0.55089 (0.55306)	Top-1 acc 67.969 (66.561)	Top-5 acc 83.594 (85.656)	lr 0.00209
Train [98][1870/3239]	Time 0.242 (0.538)	Data Time 0.001 (0.022)	Loss 2.3158 (2.3877)	Entropy 0.55097 (0.55304)	Top-1 acc 69.141 (66.555)	Top-5 acc 85.547 (85.655)	lr 0.00209
Train [98][1880/3239]	Time 0.223 (0.537)	Data Time 0.001 (0.021)	Loss 2.5200 (2.3880)	Entropy 0.55071 (0.55303)	Top-1 acc 63.672 (66.548)	Top-5 acc 81.641 (85.646)	lr 0.00209
Train [98][1890/3239]	Time 0.223 (0.536)	Data Time 0.001 (0.021)	Loss 2.2058 (2.3880)	Entropy 0.55063 (0.55302)	Top-1 acc 72.266 (66.547)	Top-5 acc 87.891 (85.644)	lr 0.00209
Train [98][1900/3239]	Time 0.218 (0.536)	Data Time 0.001 (0.021)	Loss 2.4141 (2.3878)	Entropy 0.55038 (0.55301)	Top-1 acc 59.375 (66.548)	Top-5 acc 86.328 (85.646)	lr 0.00209
Train [98][1910/3239]	Time 0.227 (0.535)	Data Time 0.001 (0.021)	Loss 2.3699 (2.3879)	Entropy 0.55009 (0.55299)	Top-1 acc 64.844 (66.550)	Top-5 acc 86.328 (85.642)	lr 0.00209
Train [98][1920/3239]	Time 0.330 (0.534)	Data Time 0.001 (0.021)	Loss 2.2961 (2.3877)	Entropy 0.55018 (0.55298)	Top-1 acc 70.703 (66.557)	Top-5 acc 85.547 (85.641)	lr 0.00209
Train [98][1930/3239]	Time 0.225 (0.534)	Data Time 0.001 (0.021)	Loss 2.4751 (2.3880)	Entropy 0.54999 (0.55296)	Top-1 acc 64.453 (66.554)	Top-5 acc 83.203 (85.634)	lr 0.00209
Train [98][1940/3239]	Time 0.229 (0.533)	Data Time 0.001 (0.021)	Loss 2.3480 (2.3881)	Entropy 0.54980 (0.55295)	Top-1 acc 68.750 (66.549)	Top-5 acc 86.328 (85.635)	lr 0.00209
Train [98][1950/3239]	Time 0.224 (0.532)	Data Time 0.001 (0.021)	Loss 2.4857 (2.3882)	Entropy 0.55023 (0.55293)	Top-1 acc 62.109 (66.545)	Top-5 acc 85.547 (85.631)	lr 0.00209
Train [98][1960/3239]	Time 0.225 (0.532)	Data Time 0.001 (0.021)	Loss 2.5277 (2.3880)	Entropy 0.55046 (0.55292)	Top-1 acc 66.016 (66.553)	Top-5 acc 82.812 (85.633)	lr 0.00209
Train [98][1970/3239]	Time 0.226 (0.531)	Data Time 0.001 (0.021)	Loss 2.5923 (2.3885)	Entropy 0.55042 (0.55291)	Top-1 acc 62.109 (66.541)	Top-5 acc 82.812 (85.629)	lr 0.00209
Train [98][1980/3239]	Time 0.223 (0.531)	Data Time 0.001 (0.020)	Loss 2.5983 (2.3885)	Entropy 0.55045 (0.55290)	Top-1 acc 62.500 (66.541)	Top-5 acc 82.031 (85.630)	lr 0.00209
Train [98][1990/3239]	Time 0.313 (0.530)	Data Time 0.001 (0.020)	Loss 2.1813 (2.3886)	Entropy 0.55046 (0.55288)	Top-1 acc 72.656 (66.541)	Top-5 acc 89.453 (85.628)	lr 0.00209
Train [98][2000/3239]	Time 0.283 (0.529)	Data Time 0.024 (0.020)	Loss 2.3149 (2.3888)	Entropy 0.55061 (0.55287)	Top-1 acc 69.141 (66.538)	Top-5 acc 87.109 (85.624)	lr 0.00209
Train [98][2010/3239]	Time 0.261 (0.529)	Data Time 0.001 (0.020)	Loss 2.5859 (2.3885)	Entropy 0.55091 (0.55286)	Top-1 acc 61.719 (66.542)	Top-5 acc 82.031 (85.630)	lr 0.00208
Train [98][2020/3239]	Time 0.220 (0.528)	Data Time 0.001 (0.020)	Loss 2.4891 (2.3884)	Entropy 0.55085 (0.55285)	Top-1 acc 60.547 (66.539)	Top-5 acc 83.203 (85.634)	lr 0.00208
Train [98][2030/3239]	Time 0.227 (0.528)	Data Time 0.001 (0.020)	Loss 2.1911 (2.3883)	Entropy 0.55094 (0.55284)	Top-1 acc 74.219 (66.540)	Top-5 acc 87.500 (85.633)	lr 0.00208
Train [98][2040/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.020)	Loss 2.2612 (2.3887)	Entropy 0.55083 (0.55283)	Top-1 acc 66.406 (66.531)	Top-5 acc 87.891 (85.630)	lr 0.00208
Train [98][2050/3239]	Time 0.225 (0.527)	Data Time 0.001 (0.020)	Loss 2.4092 (2.3887)	Entropy 0.55096 (0.55282)	Top-1 acc 66.797 (66.530)	Top-5 acc 86.328 (85.630)	lr 0.00208
Train [98][2060/3239]	Time 0.384 (0.553)	Data Time 0.002 (0.020)	Loss 2.3100 (2.3888)	Entropy 0.55054 (0.55281)	Top-1 acc 67.969 (66.528)	Top-5 acc 87.109 (85.628)	lr 0.00208
Train [98][2070/3239]	Time 0.225 (0.553)	Data Time 0.002 (0.020)	Loss 2.6686 (2.3886)	Entropy 0.55060 (0.55280)	Top-1 acc 59.375 (66.529)	Top-5 acc 80.469 (85.632)	lr 0.00208
Train [98][2080/3239]	Time 0.329 (0.552)	Data Time 0.001 (0.020)	Loss 2.3077 (2.3885)	Entropy 0.55051 (0.55279)	Top-1 acc 69.922 (66.533)	Top-5 acc 85.938 (85.633)	lr 0.00208
Train [98][2090/3239]	Time 0.235 (0.552)	Data Time 0.001 (0.019)	Loss 2.4902 (2.3885)	Entropy 0.55051 (0.55278)	Top-1 acc 60.156 (66.533)	Top-5 acc 83.984 (85.633)	lr 0.00208
Train [98][2100/3239]	Time 0.258 (0.551)	Data Time 0.001 (0.019)	Loss 2.2844 (2.3887)	Entropy 0.55083 (0.55277)	Top-1 acc 70.312 (66.530)	Top-5 acc 86.719 (85.630)	lr 0.00208
Train [98][2110/3239]	Time 0.254 (0.551)	Data Time 0.001 (0.019)	Loss 2.4784 (2.3888)	Entropy 0.55114 (0.55276)	Top-1 acc 66.797 (66.531)	Top-5 acc 84.375 (85.631)	lr 0.00208
Train [98][2120/3239]	Time 0.228 (0.550)	Data Time 0.001 (0.019)	Loss 2.4424 (2.3890)	Entropy 0.55107 (0.55275)	Top-1 acc 64.844 (66.523)	Top-5 acc 86.719 (85.632)	lr 0.00208
Train [98][2130/3239]	Time 0.229 (0.549)	Data Time 0.001 (0.019)	Loss 2.2565 (2.3890)	Entropy 0.55102 (0.55274)	Top-1 acc 68.750 (66.523)	Top-5 acc 89.453 (85.631)	lr 0.00208
Train [98][2140/3239]	Time 0.249 (0.549)	Data Time 0.001 (0.019)	Loss 2.4832 (2.3893)	Entropy 0.55084 (0.55274)	Top-1 acc 63.281 (66.512)	Top-5 acc 83.594 (85.629)	lr 0.00208
Train [98][2150/3239]	Time 0.338 (0.548)	Data Time 0.001 (0.019)	Loss 2.5694 (2.3897)	Entropy 0.55091 (0.55273)	Top-1 acc 58.984 (66.501)	Top-5 acc 85.156 (85.624)	lr 0.00208
Train [98][2160/3239]	Time 0.226 (0.548)	Data Time 0.001 (0.019)	Loss 2.4498 (2.3896)	Entropy 0.55068 (0.55272)	Top-1 acc 65.625 (66.505)	Top-5 acc 85.547 (85.625)	lr 0.00208
Train [98][2170/3239]	Time 0.258 (0.547)	Data Time 0.001 (0.019)	Loss 2.2502 (2.3899)	Entropy 0.55052 (0.55271)	Top-1 acc 69.141 (66.501)	Top-5 acc 87.500 (85.621)	lr 0.00208
Train [98][2180/3239]	Time 0.255 (0.546)	Data Time 0.001 (0.019)	Loss 2.3137 (2.3899)	Entropy 0.55041 (0.55270)	Top-1 acc 69.922 (66.506)	Top-5 acc 85.938 (85.621)	lr 0.00208
Train [98][2190/3239]	Time 0.257 (0.546)	Data Time 0.001 (0.019)	Loss 2.4738 (2.3897)	Entropy 0.55055 (0.55269)	Top-1 acc 62.500 (66.506)	Top-5 acc 85.156 (85.625)	lr 0.00207
Train [98][2200/3239]	Time 0.232 (0.545)	Data Time 0.001 (0.019)	Loss 2.2495 (2.3894)	Entropy 0.55062 (0.55268)	Top-1 acc 68.750 (66.513)	Top-5 acc 87.109 (85.629)	lr 0.00207
Train [98][2210/3239]	Time 0.233 (0.545)	Data Time 0.001 (0.019)	Loss 2.5576 (2.3897)	Entropy 0.55056 (0.55267)	Top-1 acc 61.328 (66.506)	Top-5 acc 83.594 (85.626)	lr 0.00207
Train [98][2220/3239]	Time 0.262 (0.544)	Data Time 0.001 (0.018)	Loss 2.3673 (2.3900)	Entropy 0.55069 (0.55266)	Top-1 acc 66.016 (66.500)	Top-5 acc 86.328 (85.620)	lr 0.00207
Train [98][2230/3239]	Time 0.232 (0.544)	Data Time 0.001 (0.018)	Loss 2.4213 (2.3902)	Entropy 0.55046 (0.55265)	Top-1 acc 66.406 (66.497)	Top-5 acc 85.156 (85.619)	lr 0.00207
Train [98][2240/3239]	Time 0.326 (0.543)	Data Time 0.001 (0.018)	Loss 2.4673 (2.3904)	Entropy 0.55069 (0.55264)	Top-1 acc 65.234 (66.493)	Top-5 acc 84.375 (85.616)	lr 0.00207
Train [98][2250/3239]	Time 0.227 (0.543)	Data Time 0.001 (0.018)	Loss 2.2762 (2.3904)	Entropy 0.55065 (0.55263)	Top-1 acc 69.531 (66.492)	Top-5 acc 86.719 (85.615)	lr 0.00207
Train [98][2260/3239]	Time 0.231 (0.542)	Data Time 0.001 (0.018)	Loss 2.4178 (2.3905)	Entropy 0.55082 (0.55262)	Top-1 acc 69.531 (66.495)	Top-5 acc 87.500 (85.612)	lr 0.00207
Train [98][2270/3239]	Time 0.229 (0.542)	Data Time 0.001 (0.018)	Loss 2.3039 (2.3905)	Entropy 0.55100 (0.55262)	Top-1 acc 67.578 (66.497)	Top-5 acc 88.281 (85.612)	lr 0.00207
Train [98][2280/3239]	Time 0.253 (0.541)	Data Time 0.001 (0.018)	Loss 2.3738 (2.3908)	Entropy 0.55099 (0.55261)	Top-1 acc 65.234 (66.492)	Top-5 acc 86.328 (85.605)	lr 0.00207
Train [98][2290/3239]	Time 0.220 (0.541)	Data Time 0.001 (0.018)	Loss 2.4717 (2.3908)	Entropy 0.55086 (0.55260)	Top-1 acc 63.281 (66.489)	Top-5 acc 83.594 (85.603)	lr 0.00207
Train [98][2300/3239]	Time 0.223 (0.540)	Data Time 0.001 (0.018)	Loss 2.2760 (2.3910)	Entropy 0.55117 (0.55259)	Top-1 acc 70.703 (66.482)	Top-5 acc 87.109 (85.601)	lr 0.00207
Train [98][2310/3239]	Time 0.390 (0.540)	Data Time 0.001 (0.018)	Loss 2.5557 (2.3910)	Entropy 0.55102 (0.55259)	Top-1 acc 64.062 (66.482)	Top-5 acc 82.031 (85.599)	lr 0.00207
Train [98][2320/3239]	Time 0.230 (0.539)	Data Time 0.001 (0.018)	Loss 2.3269 (2.3907)	Entropy 0.55107 (0.55258)	Top-1 acc 66.406 (66.485)	Top-5 acc 84.766 (85.606)	lr 0.00207
Train [98][2330/3239]	Time 0.304 (0.539)	Data Time 0.001 (0.018)	Loss 2.2984 (2.3907)	Entropy 0.55073 (0.55257)	Top-1 acc 66.406 (66.484)	Top-5 acc 86.719 (85.605)	lr 0.00207
Train [98][2340/3239]	Time 0.232 (0.539)	Data Time 0.001 (0.018)	Loss 2.3322 (2.3909)	Entropy 0.55105 (0.55257)	Top-1 acc 69.531 (66.481)	Top-5 acc 87.500 (85.600)	lr 0.00207
Train [98][2350/3239]	Time 0.228 (0.538)	Data Time 0.001 (0.017)	Loss 2.4247 (2.3909)	Entropy 0.55136 (0.55256)	Top-1 acc 67.578 (66.479)	Top-5 acc 82.031 (85.596)	lr 0.00207
Train [98][2360/3239]	Time 0.227 (0.538)	Data Time 0.001 (0.017)	Loss 2.3289 (2.3913)	Entropy 0.55135 (0.55256)	Top-1 acc 66.406 (66.470)	Top-5 acc 88.672 (85.591)	lr 0.00207
Train [98][2370/3239]	Time 0.230 (0.537)	Data Time 0.001 (0.017)	Loss 2.3088 (2.3915)	Entropy 0.55160 (0.55255)	Top-1 acc 66.016 (66.465)	Top-5 acc 85.156 (85.587)	lr 0.00206
Train [98][2380/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.017)	Loss 2.6672 (2.3915)	Entropy 0.55132 (0.55255)	Top-1 acc 58.594 (66.464)	Top-5 acc 78.906 (85.588)	lr 0.00206
Train [98][2390/3239]	Time 0.231 (0.536)	Data Time 0.001 (0.017)	Loss 2.5591 (2.3915)	Entropy 0.55149 (0.55254)	Top-1 acc 62.500 (66.461)	Top-5 acc 81.641 (85.592)	lr 0.00206
Train [98][2400/3239]	Time 0.242 (0.536)	Data Time 0.001 (0.017)	Loss 2.3300 (2.3913)	Entropy 0.55112 (0.55254)	Top-1 acc 66.016 (66.464)	Top-5 acc 86.719 (85.594)	lr 0.00206
Train [98][2410/3239]	Time 0.243 (0.535)	Data Time 0.001 (0.017)	Loss 2.2507 (2.3912)	Entropy 0.55134 (0.55253)	Top-1 acc 71.094 (66.463)	Top-5 acc 86.719 (85.594)	lr 0.00206
Train [98][2420/3239]	Time 0.226 (0.535)	Data Time 0.001 (0.017)	Loss 2.5057 (2.3912)	Entropy 0.55101 (0.55253)	Top-1 acc 66.016 (66.464)	Top-5 acc 79.688 (85.592)	lr 0.00206
Train [98][2430/3239]	Time 0.240 (0.534)	Data Time 0.001 (0.017)	Loss 2.1503 (2.3910)	Entropy 0.55119 (0.55252)	Top-1 acc 69.141 (66.471)	Top-5 acc 89.844 (85.594)	lr 0.00206
Train [98][2440/3239]	Time 0.233 (0.534)	Data Time 0.001 (0.017)	Loss 2.3457 (2.3908)	Entropy 0.55117 (0.55252)	Top-1 acc 67.969 (66.476)	Top-5 acc 85.938 (85.595)	lr 0.00206
Train [98][2450/3239]	Time 0.227 (0.533)	Data Time 0.001 (0.017)	Loss 2.2142 (2.3905)	Entropy 0.55112 (0.55251)	Top-1 acc 69.531 (66.483)	Top-5 acc 87.109 (85.600)	lr 0.00206
Train [98][2460/3239]	Time 0.240 (0.533)	Data Time 0.002 (0.017)	Loss 2.2765 (2.3906)	Entropy 0.55117 (0.55250)	Top-1 acc 68.359 (66.479)	Top-5 acc 87.109 (85.598)	lr 0.00206
Train [98][2470/3239]	Time 0.325 (0.532)	Data Time 0.001 (0.017)	Loss 2.4710 (2.3906)	Entropy 0.55126 (0.55250)	Top-1 acc 62.500 (66.479)	Top-5 acc 84.766 (85.599)	lr 0.00206
Train [98][2480/3239]	Time 0.222 (0.532)	Data Time 0.001 (0.017)	Loss 2.4324 (2.3909)	Entropy 0.55149 (0.55249)	Top-1 acc 67.188 (66.469)	Top-5 acc 85.547 (85.594)	lr 0.00206
Train [98][2490/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.017)	Loss 2.3549 (2.3911)	Entropy 0.55154 (0.55249)	Top-1 acc 68.750 (66.467)	Top-5 acc 85.547 (85.592)	lr 0.00206
Train [98][2500/3239]	Time 0.222 (0.531)	Data Time 0.001 (0.017)	Loss 2.4024 (2.3912)	Entropy 0.55140 (0.55249)	Top-1 acc 66.797 (66.463)	Top-5 acc 84.766 (85.589)	lr 0.00206
Train [98][2510/3239]	Time 0.231 (0.530)	Data Time 0.002 (0.016)	Loss 2.4439 (2.3909)	Entropy 0.55125 (0.55248)	Top-1 acc 65.625 (66.471)	Top-5 acc 84.375 (85.594)	lr 0.00206
Train [98][2520/3239]	Time 0.224 (0.530)	Data Time 0.001 (0.016)	Loss 2.2559 (2.3908)	Entropy 0.55144 (0.55248)	Top-1 acc 67.578 (66.476)	Top-5 acc 87.109 (85.596)	lr 0.00206
Train [98][2530/3239]	Time 0.229 (0.530)	Data Time 0.001 (0.016)	Loss 2.4279 (2.3910)	Entropy 0.55176 (0.55247)	Top-1 acc 66.016 (66.470)	Top-5 acc 84.375 (85.590)	lr 0.00206
Train [98][2540/3239]	Time 0.333 (0.529)	Data Time 0.001 (0.016)	Loss 2.1929 (2.3906)	Entropy 0.55213 (0.55247)	Top-1 acc 71.094 (66.481)	Top-5 acc 88.281 (85.597)	lr 0.00206
Train [98][2550/3239]	Time 0.255 (0.529)	Data Time 0.001 (0.016)	Loss 2.3613 (2.3908)	Entropy 0.55225 (0.55247)	Top-1 acc 65.625 (66.472)	Top-5 acc 85.938 (85.592)	lr 0.00205
Train [98][2560/3239]	Time 0.226 (0.528)	Data Time 0.001 (0.016)	Loss 2.2473 (2.3908)	Entropy 0.55216 (0.55247)	Top-1 acc 67.578 (66.467)	Top-5 acc 88.672 (85.591)	lr 0.00205
Train [98][2570/3239]	Time 0.255 (0.528)	Data Time 0.001 (0.016)	Loss 2.3088 (2.3907)	Entropy 0.55176 (0.55247)	Top-1 acc 69.531 (66.467)	Top-5 acc 87.500 (85.593)	lr 0.00205
Train [98][2580/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.016)	Loss 2.3046 (2.3905)	Entropy 0.55189 (0.55246)	Top-1 acc 67.969 (66.472)	Top-5 acc 88.281 (85.595)	lr 0.00205
Train [98][2590/3239]	Time 0.228 (0.527)	Data Time 0.001 (0.016)	Loss 2.5979 (2.3905)	Entropy 0.55168 (0.55246)	Top-1 acc 62.109 (66.470)	Top-5 acc 81.641 (85.595)	lr 0.00205
Train [98][2600/3239]	Time 0.236 (0.526)	Data Time 0.002 (0.016)	Loss 2.4233 (2.3907)	Entropy 0.55157 (0.55246)	Top-1 acc 68.750 (66.466)	Top-5 acc 87.500 (85.594)	lr 0.00205
Train [98][2610/3239]	Time 0.242 (0.526)	Data Time 0.001 (0.016)	Loss 2.4513 (2.3905)	Entropy 0.55140 (0.55246)	Top-1 acc 64.062 (66.470)	Top-5 acc 85.938 (85.598)	lr 0.00205
Train [98][2620/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.016)	Loss 2.4212 (2.3905)	Entropy 0.55139 (0.55245)	Top-1 acc 60.156 (66.467)	Top-5 acc 86.719 (85.600)	lr 0.00205
Train [98][2630/3239]	Time 0.336 (0.525)	Data Time 0.001 (0.016)	Loss 2.5682 (2.3904)	Entropy 0.55153 (0.55245)	Top-1 acc 63.672 (66.469)	Top-5 acc 82.422 (85.603)	lr 0.00205
Train [98][2640/3239]	Time 0.268 (0.525)	Data Time 0.001 (0.016)	Loss 2.4246 (2.3901)	Entropy 0.55146 (0.55244)	Top-1 acc 68.359 (66.478)	Top-5 acc 84.766 (85.608)	lr 0.00205
Train [98][2650/3239]	Time 0.278 (0.525)	Data Time 0.002 (0.016)	Loss 2.2299 (2.3900)	Entropy 0.55136 (0.55244)	Top-1 acc 74.609 (66.479)	Top-5 acc 86.719 (85.611)	lr 0.00205
Train [98][2660/3239]	Time 0.225 (0.525)	Data Time 0.001 (0.016)	Loss 2.3574 (2.3899)	Entropy 0.55130 (0.55244)	Top-1 acc 68.359 (66.480)	Top-5 acc 85.156 (85.610)	lr 0.00205
Train [98][2670/3239]	Time 0.237 (0.524)	Data Time 0.002 (0.016)	Loss 2.4244 (2.3899)	Entropy 0.55166 (0.55243)	Top-1 acc 64.844 (66.478)	Top-5 acc 84.766 (85.611)	lr 0.00205
Train [98][2680/3239]	Time 0.230 (0.524)	Data Time 0.001 (0.016)	Loss 2.3264 (2.3899)	Entropy 0.55171 (0.55243)	Top-1 acc 68.750 (66.479)	Top-5 acc 85.938 (85.612)	lr 0.00205
Train [98][2690/3239]	Time 0.225 (0.523)	Data Time 0.001 (0.015)	Loss 2.4118 (2.3898)	Entropy 0.55133 (0.55243)	Top-1 acc 70.703 (66.486)	Top-5 acc 83.984 (85.613)	lr 0.00205
Train [98][2700/3239]	Time 0.335 (0.523)	Data Time 0.001 (0.015)	Loss 2.1651 (2.3894)	Entropy 0.55123 (0.55242)	Top-1 acc 71.484 (66.490)	Top-5 acc 89.453 (85.617)	lr 0.00205
Train [98][2710/3239]	Time 0.325 (0.542)	Data Time 0.004 (0.015)	Loss 2.5507 (2.3896)	Entropy 0.55098 (0.55242)	Top-1 acc 62.109 (66.488)	Top-5 acc 82.812 (85.614)	lr 0.00205
Train [98][2720/3239]	Time 0.241 (0.542)	Data Time 0.002 (0.015)	Loss 2.4714 (2.3898)	Entropy 0.55067 (0.55241)	Top-1 acc 64.844 (66.484)	Top-5 acc 85.938 (85.609)	lr 0.00205
Train [98][2730/3239]	Time 0.232 (0.542)	Data Time 0.001 (0.015)	Loss 2.4181 (2.3900)	Entropy 0.55096 (0.55241)	Top-1 acc 62.109 (66.480)	Top-5 acc 84.375 (85.601)	lr 0.00204
Train [98][2740/3239]	Time 0.238 (0.541)	Data Time 0.001 (0.015)	Loss 2.2350 (2.3902)	Entropy 0.55040 (0.55240)	Top-1 acc 67.969 (66.473)	Top-5 acc 85.938 (85.597)	lr 0.00204
Train [98][2750/3239]	Time 0.252 (0.541)	Data Time 0.001 (0.015)	Loss 2.6536 (2.3903)	Entropy 0.55031 (0.55239)	Top-1 acc 63.672 (66.470)	Top-5 acc 79.688 (85.594)	lr 0.00204
Train [98][2760/3239]	Time 0.229 (0.541)	Data Time 0.001 (0.015)	Loss 2.2827 (2.3900)	Entropy 0.55017 (0.55239)	Top-1 acc 70.312 (66.479)	Top-5 acc 86.719 (85.600)	lr 0.00204
Train [98][2770/3239]	Time 0.229 (0.540)	Data Time 0.001 (0.015)	Loss 2.4646 (2.3900)	Entropy 0.54998 (0.55238)	Top-1 acc 63.672 (66.476)	Top-5 acc 87.109 (85.599)	lr 0.00204
Train [98][2780/3239]	Time 0.240 (0.540)	Data Time 0.001 (0.015)	Loss 2.4016 (2.3900)	Entropy 0.55010 (0.55237)	Top-1 acc 66.016 (66.477)	Top-5 acc 85.938 (85.602)	lr 0.00204
Train [98][2790/3239]	Time 0.336 (0.539)	Data Time 0.001 (0.015)	Loss 2.3884 (2.3900)	Entropy 0.55005 (0.55236)	Top-1 acc 67.578 (66.478)	Top-5 acc 85.938 (85.605)	lr 0.00204
Train [98][2800/3239]	Time 0.248 (0.539)	Data Time 0.001 (0.015)	Loss 2.4332 (2.3899)	Entropy 0.54979 (0.55235)	Top-1 acc 67.578 (66.479)	Top-5 acc 83.594 (85.604)	lr 0.00204
Train [98][2810/3239]	Time 0.233 (0.539)	Data Time 0.001 (0.015)	Loss 2.4665 (2.3898)	Entropy 0.54978 (0.55234)	Top-1 acc 64.453 (66.482)	Top-5 acc 83.203 (85.606)	lr 0.00204
Train [98][2820/3239]	Time 0.253 (0.538)	Data Time 0.001 (0.015)	Loss 2.3201 (2.3897)	Entropy 0.54938 (0.55233)	Top-1 acc 66.406 (66.478)	Top-5 acc 86.719 (85.605)	lr 0.00204
Train [98][2830/3239]	Time 0.291 (0.538)	Data Time 0.001 (0.015)	Loss 2.5251 (2.3896)	Entropy 0.54945 (0.55232)	Top-1 acc 64.062 (66.481)	Top-5 acc 84.766 (85.606)	lr 0.00204
Train [98][2840/3239]	Time 0.236 (0.538)	Data Time 0.001 (0.015)	Loss 2.4095 (2.3899)	Entropy 0.54955 (0.55231)	Top-1 acc 67.578 (66.476)	Top-5 acc 83.984 (85.601)	lr 0.00204
Train [98][2850/3239]	Time 0.224 (0.538)	Data Time 0.001 (0.015)	Loss 2.4044 (2.3899)	Entropy 0.54966 (0.55230)	Top-1 acc 66.406 (66.475)	Top-5 acc 85.938 (85.601)	lr 0.00204
Train [98][2860/3239]	Time 0.350 (0.537)	Data Time 0.001 (0.015)	Loss 2.2842 (2.3897)	Entropy 0.54965 (0.55229)	Top-1 acc 67.188 (66.483)	Top-5 acc 86.328 (85.605)	lr 0.00204
Train [98][2870/3239]	Time 0.264 (0.537)	Data Time 0.001 (0.015)	Loss 2.4234 (2.3896)	Entropy 0.54994 (0.55229)	Top-1 acc 64.844 (66.481)	Top-5 acc 83.984 (85.606)	lr 0.00204
Train [98][2880/3239]	Time 0.228 (0.536)	Data Time 0.001 (0.015)	Loss 2.6369 (2.3897)	Entropy 0.55008 (0.55228)	Top-1 acc 59.766 (66.475)	Top-5 acc 80.469 (85.604)	lr 0.00204
Train [98][2890/3239]	Time 0.228 (0.536)	Data Time 0.001 (0.015)	Loss 2.5591 (2.3897)	Entropy 0.54981 (0.55227)	Top-1 acc 62.891 (66.476)	Top-5 acc 80.859 (85.597)	lr 0.00204
Train [98][2900/3239]	Time 0.232 (0.536)	Data Time 0.001 (0.014)	Loss 2.4389 (2.3896)	Entropy 0.54989 (0.55226)	Top-1 acc 65.234 (66.478)	Top-5 acc 83.984 (85.600)	lr 0.00204
Train [98][2910/3239]	Time 0.260 (0.535)	Data Time 0.001 (0.014)	Loss 2.4502 (2.3896)	Entropy 0.54981 (0.55225)	Top-1 acc 64.453 (66.475)	Top-5 acc 83.984 (85.600)	lr 0.00203
Train [98][2920/3239]	Time 0.226 (0.535)	Data Time 0.001 (0.014)	Loss 2.3744 (2.3896)	Entropy 0.54985 (0.55224)	Top-1 acc 67.188 (66.472)	Top-5 acc 85.156 (85.602)	lr 0.00203
Train [98][2930/3239]	Time 0.223 (0.534)	Data Time 0.001 (0.014)	Loss 2.2747 (2.3895)	Entropy 0.55006 (0.55224)	Top-1 acc 68.750 (66.474)	Top-5 acc 87.891 (85.602)	lr 0.00203
Train [98][2940/3239]	Time 0.223 (0.534)	Data Time 0.001 (0.014)	Loss 2.3181 (2.3894)	Entropy 0.55013 (0.55223)	Top-1 acc 69.141 (66.477)	Top-5 acc 87.109 (85.601)	lr 0.00203
Train [98][2950/3239]	Time 0.264 (0.534)	Data Time 0.001 (0.014)	Loss 2.5670 (2.3895)	Entropy 0.54974 (0.55222)	Top-1 acc 62.891 (66.474)	Top-5 acc 78.125 (85.600)	lr 0.00203
Train [98][2960/3239]	Time 0.239 (0.533)	Data Time 0.001 (0.014)	Loss 2.5907 (2.3896)	Entropy 0.54982 (0.55221)	Top-1 acc 63.672 (66.470)	Top-5 acc 80.859 (85.597)	lr 0.00203
Train [98][2970/3239]	Time 0.215 (0.533)	Data Time 0.001 (0.014)	Loss 2.4135 (2.3897)	Entropy 0.54957 (0.55221)	Top-1 acc 69.141 (66.468)	Top-5 acc 84.766 (85.596)	lr 0.00203
Train [98][2980/3239]	Time 0.220 (0.532)	Data Time 0.001 (0.014)	Loss 2.6893 (2.3895)	Entropy 0.54963 (0.55220)	Top-1 acc 57.812 (66.470)	Top-5 acc 80.859 (85.599)	lr 0.00203
Train [98][2990/3239]	Time 0.246 (0.532)	Data Time 0.001 (0.014)	Loss 2.3221 (2.3894)	Entropy 0.54952 (0.55219)	Top-1 acc 66.016 (66.477)	Top-5 acc 86.719 (85.601)	lr 0.00203
Train [98][3000/3239]	Time 0.241 (0.532)	Data Time 0.001 (0.014)	Loss 2.3685 (2.3894)	Entropy 0.54981 (0.55218)	Top-1 acc 67.578 (66.474)	Top-5 acc 84.766 (85.599)	lr 0.00203
Train [98][3010/3239]	Time 0.226 (0.531)	Data Time 0.001 (0.014)	Loss 2.1953 (2.3892)	Entropy 0.54997 (0.55217)	Top-1 acc 72.656 (66.478)	Top-5 acc 89.844 (85.606)	lr 0.00203
Train [98][3020/3239]	Time 0.329 (0.531)	Data Time 0.001 (0.014)	Loss 2.5325 (2.3893)	Entropy 0.54994 (0.55216)	Top-1 acc 63.281 (66.475)	Top-5 acc 82.422 (85.604)	lr 0.00203
Train [98][3030/3239]	Time 0.229 (0.531)	Data Time 0.001 (0.014)	Loss 2.4717 (2.3892)	Entropy 0.55030 (0.55216)	Top-1 acc 62.891 (66.478)	Top-5 acc 82.422 (85.606)	lr 0.00203
Train [98][3040/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.014)	Loss 2.4349 (2.3891)	Entropy 0.55021 (0.55215)	Top-1 acc 66.797 (66.478)	Top-5 acc 83.594 (85.607)	lr 0.00203
Train [98][3050/3239]	Time 0.228 (0.530)	Data Time 0.001 (0.014)	Loss 2.5920 (2.3891)	Entropy 0.55027 (0.55215)	Top-1 acc 60.938 (66.477)	Top-5 acc 83.594 (85.608)	lr 0.00203
Train [98][3060/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.014)	Loss 2.3213 (2.3890)	Entropy 0.55030 (0.55214)	Top-1 acc 66.016 (66.475)	Top-5 acc 88.281 (85.610)	lr 0.00203
Train [98][3070/3239]	Time 0.230 (0.529)	Data Time 0.001 (0.014)	Loss 2.4042 (2.3890)	Entropy 0.55040 (0.55213)	Top-1 acc 67.578 (66.473)	Top-5 acc 87.109 (85.612)	lr 0.00203
Train [98][3080/3239]	Time 0.230 (0.529)	Data Time 0.001 (0.014)	Loss 2.2390 (2.3891)	Entropy 0.55043 (0.55213)	Top-1 acc 69.922 (66.471)	Top-5 acc 87.109 (85.610)	lr 0.00203
Train [98][3090/3239]	Time 0.336 (0.528)	Data Time 0.001 (0.014)	Loss 2.5648 (2.3892)	Entropy 0.55055 (0.55212)	Top-1 acc 58.984 (66.468)	Top-5 acc 82.031 (85.610)	lr 0.00202
Train [98][3100/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.014)	Loss 2.2883 (2.3893)	Entropy 0.55041 (0.55212)	Top-1 acc 70.703 (66.468)	Top-5 acc 84.766 (85.606)	lr 0.00202
Train [98][3110/3239]	Time 0.238 (0.528)	Data Time 0.001 (0.014)	Loss 2.5096 (2.3893)	Entropy 0.55049 (0.55211)	Top-1 acc 66.016 (66.465)	Top-5 acc 82.812 (85.607)	lr 0.00202
Train [98][3120/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.014)	Loss 2.3154 (2.3891)	Entropy 0.55044 (0.55211)	Top-1 acc 70.703 (66.472)	Top-5 acc 86.328 (85.612)	lr 0.00202
Train [98][3130/3239]	Time 0.289 (0.527)	Data Time 0.002 (0.014)	Loss 2.2487 (2.3890)	Entropy 0.55061 (0.55210)	Top-1 acc 69.922 (66.476)	Top-5 acc 89.844 (85.616)	lr 0.00202
Train [98][3140/3239]	Time 0.338 (0.527)	Data Time 0.050 (0.013)	Loss 2.4202 (2.3890)	Entropy 0.55066 (0.55210)	Top-1 acc 63.281 (66.476)	Top-5 acc 83.594 (85.614)	lr 0.00202
Train [98][3150/3239]	Time 0.230 (0.527)	Data Time 0.001 (0.013)	Loss 2.3753 (2.3889)	Entropy 0.55059 (0.55209)	Top-1 acc 66.016 (66.476)	Top-5 acc 85.547 (85.616)	lr 0.00202
Train [98][3160/3239]	Time 0.262 (0.527)	Data Time 0.001 (0.013)	Loss 2.3655 (2.3889)	Entropy 0.55056 (0.55209)	Top-1 acc 67.969 (66.481)	Top-5 acc 84.766 (85.617)	lr 0.00202
Train [98][3170/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.013)	Loss 2.5269 (2.3890)	Entropy 0.55043 (0.55208)	Top-1 acc 65.625 (66.478)	Top-5 acc 85.547 (85.617)	lr 0.00202
Train [98][3180/3239]	Time 0.357 (0.526)	Data Time 0.000 (0.013)	Loss 2.4224 (2.3889)	Entropy 0.54978 (0.55208)	Top-1 acc 67.969 (66.481)	Top-5 acc 83.203 (85.618)	lr 0.00202
Train [98][3190/3239]	Time 0.261 (0.526)	Data Time 0.000 (0.013)	Loss 2.3177 (2.3888)	Entropy 0.54951 (0.55207)	Top-1 acc 66.016 (66.482)	Top-5 acc 89.844 (85.623)	lr 0.00202
Train [98][3200/3239]	Time 0.231 (0.525)	Data Time 0.000 (0.013)	Loss 2.5605 (2.3887)	Entropy 0.54928 (0.55206)	Top-1 acc 62.500 (66.483)	Top-5 acc 82.812 (85.625)	lr 0.00202
Train [98][3210/3239]	Time 0.214 (0.525)	Data Time 0.000 (0.013)	Loss 2.5878 (2.3887)	Entropy 0.54961 (0.55205)	Top-1 acc 57.812 (66.480)	Top-5 acc 84.375 (85.626)	lr 0.00202
Train [98][3220/3239]	Time 0.223 (0.524)	Data Time 0.000 (0.013)	Loss 2.3571 (2.3888)	Entropy 0.54954 (0.55204)	Top-1 acc 66.016 (66.477)	Top-5 acc 86.719 (85.625)	lr 0.00202
Train [98][3230/3239]	Time 0.227 (0.524)	Data Time 0.000 (0.013)	Loss 2.5818 (2.3890)	Entropy 0.54952 (0.55204)	Top-1 acc 61.328 (66.472)	Top-5 acc 83.203 (85.621)	lr 0.00202
Train [98][3239/3239]	Time 0.886 (0.524)	Data Time 0.000 (0.013)	Loss 2.9265 (2.3891)	Entropy 0.54945 (0.55203)	Top-1 acc 55.556 (66.472)	Top-5 acc 70.370 (85.620)	lr 0.00202
==========Valid [98/120]	loss 1.201	top-1 acc 72.234 (72.234)	top-5 acc 90.205	Train top-1 66.472	top-5 85.620	Entropy 0.54945	Latency-None: 0.000ms	Flops: 539.00M
Train [99][0/3239]	Time 37.350 (37.350)	Data Time 35.597 (35.597)	Loss 2.1670 (2.1670)	Entropy 0.54957 (0.54957)	Top-1 acc 71.875 (71.875)	Top-5 acc 89.844 (89.844)	lr 0.00202
Train [99][10/3239]	Time 0.251 (3.950)	Data Time 0.001 (3.241)	Loss 2.4405 (2.3403)	Entropy 0.54971 (0.54962)	Top-1 acc 67.578 (67.756)	Top-5 acc 82.812 (86.506)	lr 0.00202
Train [99][20/3239]	Time 0.232 (2.267)	Data Time 0.001 (1.699)	Loss 2.4018 (2.3478)	Entropy 0.54954 (0.54962)	Top-1 acc 64.844 (67.541)	Top-5 acc 85.547 (86.235)	lr 0.00202
Train [99][30/3239]	Time 0.259 (1.708)	Data Time 0.001 (1.151)	Loss 2.2905 (2.3447)	Entropy 0.54949 (0.54961)	Top-1 acc 70.312 (67.729)	Top-5 acc 86.719 (86.379)	lr 0.00201
Train [99][40/3239]	Time 0.231 (1.401)	Data Time 0.001 (0.871)	Loss 2.5522 (2.3726)	Entropy 0.54928 (0.54958)	Top-1 acc 62.109 (66.930)	Top-5 acc 80.859 (85.718)	lr 0.00201
Train [99][50/3239]	Time 0.232 (1.204)	Data Time 0.001 (0.700)	Loss 2.2040 (2.3837)	Entropy 0.54917 (0.54951)	Top-1 acc 71.875 (66.452)	Top-5 acc 89.453 (85.623)	lr 0.00201
Train [99][60/3239]	Time 0.226 (1.079)	Data Time 0.001 (0.586)	Loss 2.3853 (2.3862)	Entropy 0.54923 (0.54945)	Top-1 acc 65.234 (66.381)	Top-5 acc 82.812 (85.489)	lr 0.00201
Train [99][70/3239]	Time 0.228 (0.985)	Data Time 0.001 (0.504)	Loss 2.4496 (2.4003)	Entropy 0.54915 (0.54942)	Top-1 acc 64.062 (66.065)	Top-5 acc 85.156 (85.261)	lr 0.00201
Train [99][80/3239]	Time 0.322 (0.914)	Data Time 0.001 (0.442)	Loss 2.2794 (2.3895)	Entropy 0.54925 (0.54940)	Top-1 acc 67.969 (66.291)	Top-5 acc 87.500 (85.436)	lr 0.00201
Train [99][90/3239]	Time 0.234 (0.858)	Data Time 0.001 (0.393)	Loss 2.3602 (2.3822)	Entropy 0.54935 (0.54938)	Top-1 acc 67.578 (66.488)	Top-5 acc 87.109 (85.538)	lr 0.00201
Train [99][100/3239]	Time 0.226 (0.813)	Data Time 0.001 (0.354)	Loss 2.9191 (2.3930)	Entropy 0.54939 (0.54939)	Top-1 acc 53.125 (66.116)	Top-5 acc 78.125 (85.365)	lr 0.00201
Train [99][110/3239]	Time 0.224 (0.778)	Data Time 0.001 (0.323)	Loss 2.4862 (2.3947)	Entropy 0.54947 (0.54939)	Top-1 acc 63.672 (66.107)	Top-5 acc 82.031 (85.360)	lr 0.00201
Train [99][120/3239]	Time 0.225 (0.746)	Data Time 0.003 (0.296)	Loss 2.3812 (2.3930)	Entropy 0.54946 (0.54940)	Top-1 acc 65.625 (66.154)	Top-5 acc 87.109 (85.421)	lr 0.00201
Train [99][130/3239]	Time 0.262 (1.132)	Data Time 0.003 (0.274)	Loss 2.3793 (2.3873)	Entropy 0.54959 (0.54941)	Top-1 acc 68.750 (66.326)	Top-5 acc 86.719 (85.565)	lr 0.00201
Train [99][140/3239]	Time 0.231 (1.081)	Data Time 0.002 (0.254)	Loss 2.2286 (2.3878)	Entropy 0.54953 (0.54942)	Top-1 acc 69.922 (66.254)	Top-5 acc 87.891 (85.586)	lr 0.00201
Train [99][150/3239]	Time 0.226 (1.037)	Data Time 0.001 (0.238)	Loss 2.5496 (2.3889)	Entropy 0.54956 (0.54943)	Top-1 acc 62.109 (66.318)	Top-5 acc 83.594 (85.547)	lr 0.00201
Train [99][160/3239]	Time 0.233 (0.997)	Data Time 0.001 (0.223)	Loss 2.4015 (2.3871)	Entropy 0.54970 (0.54944)	Top-1 acc 67.188 (66.331)	Top-5 acc 83.984 (85.642)	lr 0.00201
Train [99][170/3239]	Time 0.237 (0.962)	Data Time 0.001 (0.210)	Loss 2.3328 (2.3839)	Entropy 0.55002 (0.54946)	Top-1 acc 71.094 (66.418)	Top-5 acc 85.547 (85.682)	lr 0.00201
Train [99][180/3239]	Time 0.224 (0.932)	Data Time 0.001 (0.199)	Loss 2.6245 (2.3831)	Entropy 0.55019 (0.54949)	Top-1 acc 64.844 (66.426)	Top-5 acc 83.203 (85.696)	lr 0.00201
Train [99][190/3239]	Time 0.223 (0.905)	Data Time 0.001 (0.188)	Loss 2.2551 (2.3843)	Entropy 0.55024 (0.54953)	Top-1 acc 67.969 (66.392)	Top-5 acc 87.500 (85.610)	lr 0.00201
Train [99][200/3239]	Time 0.234 (0.881)	Data Time 0.001 (0.179)	Loss 2.4842 (2.3865)	Entropy 0.54990 (0.54956)	Top-1 acc 61.719 (66.354)	Top-5 acc 83.594 (85.590)	lr 0.00201
Train [99][210/3239]	Time 0.235 (0.858)	Data Time 0.001 (0.171)	Loss 2.3014 (2.3837)	Entropy 0.55012 (0.54958)	Top-1 acc 67.188 (66.456)	Top-5 acc 86.328 (85.638)	lr 0.00201
Train [99][220/3239]	Time 0.273 (0.840)	Data Time 0.001 (0.163)	Loss 2.1454 (2.3828)	Entropy 0.55045 (0.54960)	Top-1 acc 74.219 (66.532)	Top-5 acc 91.016 (85.671)	lr 0.00200
Train [99][230/3239]	Time 0.302 (0.827)	Data Time 0.001 (0.156)	Loss 2.6887 (2.3844)	Entropy 0.55044 (0.54964)	Top-1 acc 61.719 (66.545)	Top-5 acc 79.688 (85.640)	lr 0.00200
Train [99][240/3239]	Time 0.315 (0.810)	Data Time 0.001 (0.150)	Loss 2.4186 (2.3835)	Entropy 0.55040 (0.54967)	Top-1 acc 65.234 (66.599)	Top-5 acc 85.547 (85.667)	lr 0.00200
Train [99][250/3239]	Time 0.227 (0.794)	Data Time 0.001 (0.144)	Loss 2.4591 (2.3802)	Entropy 0.55056 (0.54970)	Top-1 acc 65.234 (66.708)	Top-5 acc 83.594 (85.707)	lr 0.00200
Train [99][260/3239]	Time 0.232 (0.780)	Data Time 0.001 (0.138)	Loss 2.5592 (2.3794)	Entropy 0.55088 (0.54973)	Top-1 acc 60.938 (66.706)	Top-5 acc 80.469 (85.723)	lr 0.00200
Train [99][270/3239]	Time 0.261 (0.767)	Data Time 0.002 (0.133)	Loss 2.3297 (2.3814)	Entropy 0.55081 (0.54978)	Top-1 acc 67.578 (66.667)	Top-5 acc 85.156 (85.688)	lr 0.00200
Train [99][280/3239]	Time 0.256 (0.756)	Data Time 0.001 (0.129)	Loss 2.7446 (2.3829)	Entropy 0.55084 (0.54981)	Top-1 acc 60.156 (66.643)	Top-5 acc 81.250 (85.689)	lr 0.00200
Train [99][290/3239]	Time 0.233 (0.745)	Data Time 0.001 (0.124)	Loss 2.3213 (2.3791)	Entropy 0.55080 (0.54985)	Top-1 acc 67.188 (66.734)	Top-5 acc 85.938 (85.742)	lr 0.00200
Train [99][300/3239]	Time 0.230 (0.734)	Data Time 0.001 (0.120)	Loss 2.3779 (2.3777)	Entropy 0.55008 (0.54987)	Top-1 acc 64.844 (66.779)	Top-5 acc 84.766 (85.784)	lr 0.00200
Train [99][310/3239]	Time 0.321 (0.723)	Data Time 0.001 (0.116)	Loss 2.3892 (2.3778)	Entropy 0.54996 (0.54988)	Top-1 acc 66.797 (66.765)	Top-5 acc 86.719 (85.789)	lr 0.00200
Train [99][320/3239]	Time 0.228 (0.714)	Data Time 0.001 (0.113)	Loss 2.3015 (2.3750)	Entropy 0.54984 (0.54988)	Top-1 acc 69.531 (66.846)	Top-5 acc 86.719 (85.819)	lr 0.00200
Train [99][330/3239]	Time 0.227 (0.704)	Data Time 0.001 (0.109)	Loss 2.4260 (2.3756)	Entropy 0.54984 (0.54988)	Top-1 acc 67.578 (66.819)	Top-5 acc 85.156 (85.802)	lr 0.00200
Train [99][340/3239]	Time 0.232 (0.696)	Data Time 0.001 (0.106)	Loss 2.4489 (2.3754)	Entropy 0.54976 (0.54988)	Top-1 acc 66.797 (66.827)	Top-5 acc 85.547 (85.803)	lr 0.00200
Train [99][350/3239]	Time 0.230 (0.687)	Data Time 0.001 (0.103)	Loss 2.4816 (2.3752)	Entropy 0.54960 (0.54988)	Top-1 acc 66.016 (66.848)	Top-5 acc 85.156 (85.812)	lr 0.00200
Train [99][360/3239]	Time 0.225 (0.680)	Data Time 0.001 (0.100)	Loss 2.1287 (2.3758)	Entropy 0.54982 (0.54987)	Top-1 acc 73.828 (66.843)	Top-5 acc 89.844 (85.820)	lr 0.00200
Train [99][370/3239]	Time 0.225 (0.673)	Data Time 0.001 (0.098)	Loss 2.4161 (2.3748)	Entropy 0.54975 (0.54987)	Top-1 acc 65.625 (66.852)	Top-5 acc 86.328 (85.850)	lr 0.00200
Train [99][380/3239]	Time 0.224 (0.666)	Data Time 0.001 (0.095)	Loss 2.5105 (2.3755)	Entropy 0.54954 (0.54986)	Top-1 acc 65.234 (66.850)	Top-5 acc 82.422 (85.829)	lr 0.00200
Train [99][390/3239]	Time 0.221 (0.660)	Data Time 0.001 (0.093)	Loss 2.3094 (2.3753)	Entropy 0.54979 (0.54986)	Top-1 acc 66.797 (66.812)	Top-5 acc 86.328 (85.843)	lr 0.00200
Train [99][400/3239]	Time 0.356 (0.654)	Data Time 0.001 (0.090)	Loss 2.2493 (2.3755)	Entropy 0.54996 (0.54986)	Top-1 acc 71.094 (66.801)	Top-5 acc 89.453 (85.842)	lr 0.00199
Train [99][410/3239]	Time 0.226 (0.648)	Data Time 0.001 (0.088)	Loss 2.4447 (2.3761)	Entropy 0.55036 (0.54986)	Top-1 acc 65.234 (66.805)	Top-5 acc 82.812 (85.807)	lr 0.00199
Train [99][420/3239]	Time 0.230 (0.642)	Data Time 0.001 (0.086)	Loss 2.2553 (2.3743)	Entropy 0.55043 (0.54988)	Top-1 acc 73.438 (66.854)	Top-5 acc 87.500 (85.845)	lr 0.00199
Train [99][430/3239]	Time 0.225 (0.637)	Data Time 0.001 (0.084)	Loss 2.2140 (2.3737)	Entropy 0.55050 (0.54989)	Top-1 acc 69.531 (66.884)	Top-5 acc 87.891 (85.852)	lr 0.00199
Train [99][440/3239]	Time 0.218 (0.632)	Data Time 0.001 (0.082)	Loss 2.8198 (2.3740)	Entropy 0.55046 (0.54990)	Top-1 acc 54.688 (66.874)	Top-5 acc 78.906 (85.846)	lr 0.00199
Train [99][450/3239]	Time 0.225 (0.627)	Data Time 0.001 (0.081)	Loss 2.4073 (2.3740)	Entropy 0.55054 (0.54992)	Top-1 acc 67.188 (66.884)	Top-5 acc 86.719 (85.839)	lr 0.00199
Train [99][460/3239]	Time 0.224 (0.622)	Data Time 0.001 (0.079)	Loss 2.2278 (2.3757)	Entropy 0.55066 (0.54993)	Top-1 acc 70.312 (66.843)	Top-5 acc 87.109 (85.812)	lr 0.00199
Train [99][470/3239]	Time 0.322 (0.618)	Data Time 0.001 (0.077)	Loss 2.5812 (2.3755)	Entropy 0.55055 (0.54994)	Top-1 acc 60.156 (66.824)	Top-5 acc 82.422 (85.821)	lr 0.00199
Train [99][480/3239]	Time 0.231 (0.613)	Data Time 0.001 (0.076)	Loss 2.2344 (2.3751)	Entropy 0.55063 (0.54996)	Top-1 acc 68.750 (66.849)	Top-5 acc 89.062 (85.825)	lr 0.00199
Train [99][490/3239]	Time 0.225 (0.609)	Data Time 0.001 (0.074)	Loss 2.5527 (2.3761)	Entropy 0.55081 (0.54997)	Top-1 acc 62.891 (66.814)	Top-5 acc 83.594 (85.823)	lr 0.00199
Train [99][500/3239]	Time 0.231 (0.605)	Data Time 0.001 (0.073)	Loss 2.2806 (2.3771)	Entropy 0.55026 (0.54998)	Top-1 acc 70.312 (66.799)	Top-5 acc 88.672 (85.804)	lr 0.00199
Train [99][510/3239]	Time 0.227 (0.601)	Data Time 0.001 (0.071)	Loss 2.2258 (2.3773)	Entropy 0.54992 (0.54998)	Top-1 acc 68.750 (66.797)	Top-5 acc 85.938 (85.794)	lr 0.00199
Train [99][520/3239]	Time 0.233 (0.598)	Data Time 0.001 (0.070)	Loss 2.4056 (2.3767)	Entropy 0.54969 (0.54998)	Top-1 acc 66.797 (66.810)	Top-5 acc 85.547 (85.801)	lr 0.00199
Train [99][530/3239]	Time 0.216 (0.594)	Data Time 0.001 (0.069)	Loss 2.5284 (2.3769)	Entropy 0.54953 (0.54997)	Top-1 acc 63.672 (66.806)	Top-5 acc 84.766 (85.813)	lr 0.00199
Train [99][540/3239]	Time 0.290 (0.592)	Data Time 0.002 (0.068)	Loss 2.2994 (2.3773)	Entropy 0.54923 (0.54996)	Top-1 acc 68.359 (66.805)	Top-5 acc 87.109 (85.802)	lr 0.00199
Train [99][550/3239]	Time 0.229 (0.590)	Data Time 0.001 (0.066)	Loss 2.3357 (2.3779)	Entropy 0.54945 (0.54995)	Top-1 acc 67.188 (66.798)	Top-5 acc 87.891 (85.791)	lr 0.00199
Train [99][560/3239]	Time 0.306 (0.587)	Data Time 0.001 (0.065)	Loss 2.2466 (2.3765)	Entropy 0.54952 (0.54994)	Top-1 acc 71.875 (66.837)	Top-5 acc 88.672 (85.793)	lr 0.00199
Train [99][570/3239]	Time 0.239 (0.584)	Data Time 0.001 (0.064)	Loss 2.2803 (2.3751)	Entropy 0.54935 (0.54993)	Top-1 acc 68.750 (66.873)	Top-5 acc 87.109 (85.819)	lr 0.00199
Train [99][580/3239]	Time 0.228 (0.581)	Data Time 0.001 (0.063)	Loss 2.4938 (2.3760)	Entropy 0.54888 (0.54992)	Top-1 acc 66.016 (66.857)	Top-5 acc 85.547 (85.808)	lr 0.00198
Train [99][590/3239]	Time 0.227 (0.578)	Data Time 0.001 (0.062)	Loss 2.4224 (2.3771)	Entropy 0.54941 (0.54990)	Top-1 acc 66.406 (66.830)	Top-5 acc 83.984 (85.789)	lr 0.00198
Train [99][600/3239]	Time 0.230 (0.575)	Data Time 0.001 (0.061)	Loss 2.2693 (2.3764)	Entropy 0.54931 (0.54989)	Top-1 acc 70.703 (66.854)	Top-5 acc 88.281 (85.802)	lr 0.00198
Train [99][610/3239]	Time 0.239 (0.573)	Data Time 0.001 (0.060)	Loss 2.2713 (2.3762)	Entropy 0.54932 (0.54988)	Top-1 acc 71.094 (66.875)	Top-5 acc 86.328 (85.799)	lr 0.00198
Train [99][620/3239]	Time 0.236 (0.571)	Data Time 0.001 (0.059)	Loss 2.3166 (2.3767)	Entropy 0.54943 (0.54988)	Top-1 acc 67.969 (66.850)	Top-5 acc 85.547 (85.780)	lr 0.00198
Train [99][630/3239]	Time 0.326 (0.568)	Data Time 0.001 (0.058)	Loss 2.2946 (2.3766)	Entropy 0.54851 (0.54986)	Top-1 acc 68.750 (66.836)	Top-5 acc 88.281 (85.792)	lr 0.00198
Train [99][640/3239]	Time 0.228 (0.566)	Data Time 0.001 (0.057)	Loss 2.7750 (2.3779)	Entropy 0.54863 (0.54984)	Top-1 acc 55.078 (66.789)	Top-5 acc 79.297 (85.771)	lr 0.00198
Train [99][650/3239]	Time 0.260 (0.564)	Data Time 0.001 (0.056)	Loss 2.2953 (2.3782)	Entropy 0.54854 (0.54982)	Top-1 acc 70.312 (66.790)	Top-5 acc 87.500 (85.763)	lr 0.00198
Train [99][660/3239]	Time 0.233 (0.562)	Data Time 0.001 (0.056)	Loss 2.2540 (2.3774)	Entropy 0.54841 (0.54980)	Top-1 acc 70.703 (66.803)	Top-5 acc 89.062 (85.773)	lr 0.00198
Train [99][670/3239]	Time 0.239 (0.559)	Data Time 0.001 (0.055)	Loss 2.2879 (2.3770)	Entropy 0.54821 (0.54978)	Top-1 acc 69.531 (66.807)	Top-5 acc 88.281 (85.778)	lr 0.00198
Train [99][680/3239]	Time 0.234 (0.557)	Data Time 0.001 (0.054)	Loss 2.3041 (2.3773)	Entropy 0.54808 (0.54976)	Top-1 acc 68.359 (66.813)	Top-5 acc 85.938 (85.767)	lr 0.00198
Train [99][690/3239]	Time 0.248 (0.555)	Data Time 0.001 (0.053)	Loss 2.2241 (2.3772)	Entropy 0.54786 (0.54973)	Top-1 acc 71.094 (66.812)	Top-5 acc 89.844 (85.782)	lr 0.00198
Train [99][700/3239]	Time 0.245 (0.553)	Data Time 0.001 (0.052)	Loss 2.2538 (2.3768)	Entropy 0.54768 (0.54971)	Top-1 acc 72.266 (66.829)	Top-5 acc 86.719 (85.783)	lr 0.00198
Train [99][710/3239]	Time 0.235 (0.552)	Data Time 0.001 (0.052)	Loss 2.3198 (2.3772)	Entropy 0.54761 (0.54968)	Top-1 acc 67.969 (66.806)	Top-5 acc 87.109 (85.789)	lr 0.00198
Train [99][720/3239]	Time 0.226 (0.550)	Data Time 0.001 (0.051)	Loss 2.5364 (2.3766)	Entropy 0.54756 (0.54965)	Top-1 acc 62.891 (66.821)	Top-5 acc 83.984 (85.812)	lr 0.00198
Train [99][730/3239]	Time 0.225 (0.548)	Data Time 0.001 (0.050)	Loss 2.4897 (2.3769)	Entropy 0.54705 (0.54962)	Top-1 acc 63.281 (66.800)	Top-5 acc 81.641 (85.803)	lr 0.00198
Train [99][740/3239]	Time 0.246 (0.546)	Data Time 0.001 (0.050)	Loss 2.3154 (2.3766)	Entropy 0.54670 (0.54958)	Top-1 acc 68.359 (66.793)	Top-5 acc 88.281 (85.815)	lr 0.00198
Train [99][750/3239]	Time 0.227 (0.544)	Data Time 0.001 (0.049)	Loss 2.3922 (2.3772)	Entropy 0.54671 (0.54954)	Top-1 acc 67.578 (66.782)	Top-5 acc 86.719 (85.803)	lr 0.00198
Train [99][760/3239]	Time 0.228 (0.543)	Data Time 0.001 (0.048)	Loss 2.5799 (2.3777)	Entropy 0.54673 (0.54951)	Top-1 acc 64.062 (66.777)	Top-5 acc 82.422 (85.791)	lr 0.00198
Train [99][770/3239]	Time 0.231 (0.541)	Data Time 0.001 (0.048)	Loss 2.3285 (2.3776)	Entropy 0.54702 (0.54947)	Top-1 acc 69.141 (66.792)	Top-5 acc 86.328 (85.782)	lr 0.00197
Train [99][780/3239]	Time 0.374 (0.611)	Data Time 0.004 (0.047)	Loss 2.4303 (2.3774)	Entropy 0.54672 (0.54944)	Top-1 acc 65.625 (66.812)	Top-5 acc 85.547 (85.780)	lr 0.00197
Train [99][790/3239]	Time 0.325 (0.609)	Data Time 0.002 (0.047)	Loss 2.5504 (2.3775)	Entropy 0.54642 (0.54941)	Top-1 acc 62.109 (66.811)	Top-5 acc 82.422 (85.787)	lr 0.00197
Train [99][800/3239]	Time 0.230 (0.607)	Data Time 0.002 (0.046)	Loss 2.3843 (2.3780)	Entropy 0.54649 (0.54937)	Top-1 acc 62.891 (66.788)	Top-5 acc 87.891 (85.786)	lr 0.00197
Train [99][810/3239]	Time 0.230 (0.605)	Data Time 0.001 (0.046)	Loss 2.4633 (2.3777)	Entropy 0.54639 (0.54933)	Top-1 acc 64.453 (66.798)	Top-5 acc 83.203 (85.786)	lr 0.00197
Train [99][820/3239]	Time 0.236 (0.602)	Data Time 0.001 (0.045)	Loss 2.3405 (2.3774)	Entropy 0.54617 (0.54929)	Top-1 acc 66.406 (66.812)	Top-5 acc 87.500 (85.797)	lr 0.00197
Train [99][830/3239]	Time 0.244 (0.600)	Data Time 0.001 (0.045)	Loss 2.4131 (2.3773)	Entropy 0.54636 (0.54926)	Top-1 acc 65.625 (66.818)	Top-5 acc 85.547 (85.798)	lr 0.00197
Train [99][840/3239]	Time 0.260 (0.598)	Data Time 0.002 (0.044)	Loss 2.5166 (2.3773)	Entropy 0.54652 (0.54922)	Top-1 acc 60.938 (66.817)	Top-5 acc 83.203 (85.790)	lr 0.00197
Train [99][850/3239]	Time 0.228 (0.596)	Data Time 0.001 (0.044)	Loss 2.4069 (2.3779)	Entropy 0.54659 (0.54919)	Top-1 acc 66.016 (66.798)	Top-5 acc 85.547 (85.779)	lr 0.00197
Train [99][860/3239]	Time 0.238 (0.594)	Data Time 0.001 (0.043)	Loss 2.2487 (2.3784)	Entropy 0.54649 (0.54916)	Top-1 acc 70.312 (66.801)	Top-5 acc 90.234 (85.761)	lr 0.00197
Train [99][870/3239]	Time 0.228 (0.592)	Data Time 0.001 (0.043)	Loss 2.1645 (2.3791)	Entropy 0.54604 (0.54913)	Top-1 acc 71.875 (66.783)	Top-5 acc 90.234 (85.753)	lr 0.00197
Train [99][880/3239]	Time 0.230 (0.590)	Data Time 0.001 (0.042)	Loss 2.2817 (2.3788)	Entropy 0.54617 (0.54909)	Top-1 acc 71.094 (66.782)	Top-5 acc 88.281 (85.758)	lr 0.00197
Train [99][890/3239]	Time 0.222 (0.588)	Data Time 0.001 (0.042)	Loss 2.5566 (2.3794)	Entropy 0.54605 (0.54906)	Top-1 acc 63.672 (66.761)	Top-5 acc 84.375 (85.750)	lr 0.00197
Train [99][900/3239]	Time 0.225 (0.586)	Data Time 0.001 (0.041)	Loss 2.6434 (2.3797)	Entropy 0.54618 (0.54903)	Top-1 acc 59.766 (66.754)	Top-5 acc 82.422 (85.758)	lr 0.00197
Train [99][910/3239]	Time 0.234 (0.584)	Data Time 0.001 (0.041)	Loss 2.2310 (2.3789)	Entropy 0.54588 (0.54900)	Top-1 acc 71.094 (66.785)	Top-5 acc 87.500 (85.766)	lr 0.00197
Train [99][920/3239]	Time 0.236 (0.582)	Data Time 0.001 (0.040)	Loss 2.3333 (2.3790)	Entropy 0.54576 (0.54896)	Top-1 acc 69.922 (66.793)	Top-5 acc 85.547 (85.772)	lr 0.00197
Train [99][930/3239]	Time 0.239 (0.581)	Data Time 0.001 (0.040)	Loss 2.4497 (2.3790)	Entropy 0.54570 (0.54893)	Top-1 acc 68.359 (66.796)	Top-5 acc 84.766 (85.773)	lr 0.00197
Train [99][940/3239]	Time 0.230 (0.579)	Data Time 0.001 (0.040)	Loss 2.4971 (2.3800)	Entropy 0.54552 (0.54889)	Top-1 acc 66.797 (66.782)	Top-5 acc 83.984 (85.756)	lr 0.00197
Train [99][950/3239]	Time 0.320 (0.577)	Data Time 0.001 (0.039)	Loss 2.3231 (2.3797)	Entropy 0.54498 (0.54885)	Top-1 acc 64.844 (66.776)	Top-5 acc 89.844 (85.765)	lr 0.00196
Train [99][960/3239]	Time 0.225 (0.576)	Data Time 0.001 (0.039)	Loss 2.4164 (2.3795)	Entropy 0.54518 (0.54881)	Top-1 acc 60.938 (66.777)	Top-5 acc 85.938 (85.766)	lr 0.00196
Train [99][970/3239]	Time 0.230 (0.574)	Data Time 0.001 (0.038)	Loss 2.3936 (2.3797)	Entropy 0.54519 (0.54877)	Top-1 acc 66.406 (66.774)	Top-5 acc 85.547 (85.761)	lr 0.00196
Train [99][980/3239]	Time 0.226 (0.573)	Data Time 0.001 (0.038)	Loss 2.0777 (2.3793)	Entropy 0.54543 (0.54874)	Top-1 acc 68.750 (66.782)	Top-5 acc 91.016 (85.761)	lr 0.00196
Train [99][990/3239]	Time 0.237 (0.571)	Data Time 0.001 (0.038)	Loss 2.8606 (2.3801)	Entropy 0.54554 (0.54871)	Top-1 acc 57.812 (66.761)	Top-5 acc 76.953 (85.751)	lr 0.00196
Train [99][1000/3239]	Time 0.223 (0.569)	Data Time 0.001 (0.037)	Loss 2.5274 (2.3801)	Entropy 0.54574 (0.54868)	Top-1 acc 61.719 (66.756)	Top-5 acc 85.547 (85.754)	lr 0.00196
Train [99][1010/3239]	Time 0.288 (0.569)	Data Time 0.002 (0.037)	Loss 2.3162 (2.3802)	Entropy 0.54554 (0.54865)	Top-1 acc 64.844 (66.749)	Top-5 acc 87.500 (85.756)	lr 0.00196
Train [99][1020/3239]	Time 0.423 (0.569)	Data Time 0.002 (0.037)	Loss 2.4084 (2.3808)	Entropy 0.54536 (0.54861)	Top-1 acc 65.625 (66.741)	Top-5 acc 84.375 (85.743)	lr 0.00196
Train [99][1030/3239]	Time 0.234 (0.568)	Data Time 0.001 (0.036)	Loss 2.2921 (2.3809)	Entropy 0.54536 (0.54858)	Top-1 acc 69.922 (66.740)	Top-5 acc 86.328 (85.739)	lr 0.00196
Train [99][1040/3239]	Time 0.232 (0.567)	Data Time 0.001 (0.036)	Loss 2.2442 (2.3816)	Entropy 0.54537 (0.54855)	Top-1 acc 68.750 (66.723)	Top-5 acc 89.844 (85.730)	lr 0.00196
Train [99][1050/3239]	Time 0.221 (0.566)	Data Time 0.001 (0.036)	Loss 2.5383 (2.3812)	Entropy 0.54534 (0.54852)	Top-1 acc 62.500 (66.734)	Top-5 acc 85.156 (85.738)	lr 0.00196
Train [99][1060/3239]	Time 0.233 (0.564)	Data Time 0.001 (0.035)	Loss 2.2222 (2.3804)	Entropy 0.54507 (0.54849)	Top-1 acc 73.438 (66.754)	Top-5 acc 89.062 (85.743)	lr 0.00196
Train [99][1070/3239]	Time 0.239 (0.563)	Data Time 0.001 (0.035)	Loss 2.3485 (2.3802)	Entropy 0.54532 (0.54846)	Top-1 acc 68.359 (66.759)	Top-5 acc 89.062 (85.748)	lr 0.00196
Train [99][1080/3239]	Time 0.228 (0.562)	Data Time 0.001 (0.035)	Loss 2.2827 (2.3802)	Entropy 0.54536 (0.54843)	Top-1 acc 67.188 (66.760)	Top-5 acc 89.062 (85.747)	lr 0.00196
Train [99][1090/3239]	Time 0.229 (0.560)	Data Time 0.001 (0.034)	Loss 2.2887 (2.3798)	Entropy 0.54504 (0.54840)	Top-1 acc 69.531 (66.771)	Top-5 acc 89.062 (85.755)	lr 0.00196
Train [99][1100/3239]	Time 0.225 (0.559)	Data Time 0.001 (0.034)	Loss 2.3493 (2.3800)	Entropy 0.54488 (0.54837)	Top-1 acc 68.359 (66.767)	Top-5 acc 85.547 (85.749)	lr 0.00196
Train [99][1110/3239]	Time 0.325 (0.558)	Data Time 0.001 (0.034)	Loss 2.3154 (2.3801)	Entropy 0.54477 (0.54834)	Top-1 acc 70.312 (66.770)	Top-5 acc 85.156 (85.748)	lr 0.00196
Train [99][1120/3239]	Time 0.233 (0.557)	Data Time 0.001 (0.033)	Loss 2.3910 (2.3805)	Entropy 0.54483 (0.54831)	Top-1 acc 68.359 (66.757)	Top-5 acc 84.375 (85.745)	lr 0.00196
Train [99][1130/3239]	Time 0.222 (0.555)	Data Time 0.001 (0.033)	Loss 2.4112 (2.3807)	Entropy 0.54451 (0.54828)	Top-1 acc 66.797 (66.756)	Top-5 acc 84.766 (85.742)	lr 0.00195
Train [99][1140/3239]	Time 0.234 (0.554)	Data Time 0.001 (0.033)	Loss 2.3859 (2.3810)	Entropy 0.54456 (0.54825)	Top-1 acc 66.797 (66.751)	Top-5 acc 82.812 (85.739)	lr 0.00195
Train [99][1150/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.033)	Loss 2.3019 (2.3805)	Entropy 0.54463 (0.54821)	Top-1 acc 67.578 (66.766)	Top-5 acc 85.547 (85.743)	lr 0.00195
Train [99][1160/3239]	Time 0.359 (0.552)	Data Time 0.002 (0.032)	Loss 2.2635 (2.3810)	Entropy 0.54484 (0.54818)	Top-1 acc 69.531 (66.748)	Top-5 acc 89.062 (85.737)	lr 0.00195
Train [99][1170/3239]	Time 0.242 (0.551)	Data Time 0.001 (0.032)	Loss 2.3320 (2.3818)	Entropy 0.54491 (0.54816)	Top-1 acc 67.969 (66.732)	Top-5 acc 88.281 (85.735)	lr 0.00195
Train [99][1180/3239]	Time 0.317 (0.550)	Data Time 0.001 (0.032)	Loss 2.3170 (2.3816)	Entropy 0.54476 (0.54813)	Top-1 acc 67.969 (66.734)	Top-5 acc 85.547 (85.739)	lr 0.00195
Train [99][1190/3239]	Time 0.242 (0.549)	Data Time 0.001 (0.032)	Loss 2.5108 (2.3817)	Entropy 0.54458 (0.54810)	Top-1 acc 62.500 (66.723)	Top-5 acc 83.594 (85.735)	lr 0.00195
Train [99][1200/3239]	Time 0.225 (0.548)	Data Time 0.001 (0.031)	Loss 2.3291 (2.3815)	Entropy 0.54421 (0.54807)	Top-1 acc 66.016 (66.728)	Top-5 acc 87.891 (85.736)	lr 0.00195
Train [99][1210/3239]	Time 0.230 (0.547)	Data Time 0.001 (0.031)	Loss 2.2232 (2.3816)	Entropy 0.54426 (0.54804)	Top-1 acc 71.484 (66.725)	Top-5 acc 88.672 (85.734)	lr 0.00195
Train [99][1220/3239]	Time 0.229 (0.546)	Data Time 0.001 (0.031)	Loss 2.4439 (2.3818)	Entropy 0.54437 (0.54800)	Top-1 acc 66.406 (66.725)	Top-5 acc 82.422 (85.729)	lr 0.00195
Train [99][1230/3239]	Time 0.224 (0.545)	Data Time 0.001 (0.031)	Loss 2.3615 (2.3816)	Entropy 0.54428 (0.54797)	Top-1 acc 67.188 (66.732)	Top-5 acc 87.891 (85.735)	lr 0.00195
Train [99][1240/3239]	Time 0.231 (0.543)	Data Time 0.001 (0.030)	Loss 2.1966 (2.3818)	Entropy 0.54443 (0.54794)	Top-1 acc 72.266 (66.729)	Top-5 acc 89.453 (85.736)	lr 0.00195
Train [99][1250/3239]	Time 0.234 (0.542)	Data Time 0.001 (0.030)	Loss 2.2409 (2.3818)	Entropy 0.54458 (0.54792)	Top-1 acc 69.531 (66.728)	Top-5 acc 88.672 (85.737)	lr 0.00195
Train [99][1260/3239]	Time 0.223 (0.541)	Data Time 0.001 (0.030)	Loss 2.4119 (2.3819)	Entropy 0.54475 (0.54789)	Top-1 acc 67.578 (66.727)	Top-5 acc 82.422 (85.731)	lr 0.00195
Train [99][1270/3239]	Time 0.243 (0.540)	Data Time 0.001 (0.030)	Loss 2.4596 (2.3816)	Entropy 0.54466 (0.54787)	Top-1 acc 64.844 (66.722)	Top-5 acc 84.375 (85.741)	lr 0.00195
Train [99][1280/3239]	Time 0.229 (0.539)	Data Time 0.001 (0.029)	Loss 2.3059 (2.3816)	Entropy 0.54462 (0.54784)	Top-1 acc 68.750 (66.722)	Top-5 acc 85.938 (85.741)	lr 0.00195
Train [99][1290/3239]	Time 0.231 (0.538)	Data Time 0.001 (0.029)	Loss 2.4204 (2.3813)	Entropy 0.54490 (0.54782)	Top-1 acc 65.625 (66.726)	Top-5 acc 87.891 (85.747)	lr 0.00195
Train [99][1300/3239]	Time 0.226 (0.537)	Data Time 0.001 (0.029)	Loss 2.2965 (2.3811)	Entropy 0.54507 (0.54779)	Top-1 acc 73.047 (66.734)	Top-5 acc 87.891 (85.754)	lr 0.00195
Train [99][1310/3239]	Time 0.223 (0.536)	Data Time 0.001 (0.029)	Loss 2.2222 (2.3811)	Entropy 0.54534 (0.54777)	Top-1 acc 70.703 (66.741)	Top-5 acc 88.672 (85.760)	lr 0.00195
Train [99][1320/3239]	Time 0.227 (0.535)	Data Time 0.001 (0.029)	Loss 2.4564 (2.3814)	Entropy 0.54539 (0.54775)	Top-1 acc 64.844 (66.728)	Top-5 acc 83.594 (85.758)	lr 0.00194
Train [99][1330/3239]	Time 0.235 (0.535)	Data Time 0.001 (0.028)	Loss 2.4509 (2.3812)	Entropy 0.54520 (0.54774)	Top-1 acc 62.891 (66.731)	Top-5 acc 84.375 (85.758)	lr 0.00194
Train [99][1340/3239]	Time 0.320 (0.534)	Data Time 0.001 (0.028)	Loss 2.3430 (2.3810)	Entropy 0.54502 (0.54772)	Top-1 acc 71.875 (66.739)	Top-5 acc 87.109 (85.764)	lr 0.00194
Train [99][1350/3239]	Time 0.231 (0.533)	Data Time 0.001 (0.028)	Loss 2.3247 (2.3808)	Entropy 0.54512 (0.54770)	Top-1 acc 68.359 (66.738)	Top-5 acc 85.156 (85.767)	lr 0.00194
Train [99][1360/3239]	Time 0.221 (0.532)	Data Time 0.001 (0.028)	Loss 2.5398 (2.3809)	Entropy 0.54505 (0.54768)	Top-1 acc 62.891 (66.738)	Top-5 acc 82.031 (85.764)	lr 0.00194
Train [99][1370/3239]	Time 0.225 (0.531)	Data Time 0.001 (0.028)	Loss 2.5840 (2.3808)	Entropy 0.54503 (0.54766)	Top-1 acc 61.328 (66.737)	Top-5 acc 83.203 (85.768)	lr 0.00194
Train [99][1380/3239]	Time 0.228 (0.530)	Data Time 0.001 (0.027)	Loss 2.7936 (2.3808)	Entropy 0.54487 (0.54764)	Top-1 acc 54.297 (66.730)	Top-5 acc 78.125 (85.768)	lr 0.00194
Train [99][1390/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.027)	Loss 2.2742 (2.3807)	Entropy 0.54491 (0.54762)	Top-1 acc 70.703 (66.728)	Top-5 acc 87.500 (85.775)	lr 0.00194
Train [99][1400/3239]	Time 0.226 (0.528)	Data Time 0.001 (0.027)	Loss 2.3002 (2.3809)	Entropy 0.54487 (0.54760)	Top-1 acc 65.234 (66.714)	Top-5 acc 88.672 (85.776)	lr 0.00194
Train [99][1410/3239]	Time 0.350 (0.528)	Data Time 0.002 (0.027)	Loss 2.6615 (2.3815)	Entropy 0.54496 (0.54758)	Top-1 acc 59.375 (66.705)	Top-5 acc 81.250 (85.771)	lr 0.00194
Train [99][1420/3239]	Time 0.257 (0.527)	Data Time 0.024 (0.027)	Loss 2.3405 (2.3813)	Entropy 0.54503 (0.54756)	Top-1 acc 66.406 (66.706)	Top-5 acc 84.766 (85.774)	lr 0.00194
Train [99][1430/3239]	Time 0.226 (0.526)	Data Time 0.001 (0.027)	Loss 2.5517 (2.3819)	Entropy 0.54493 (0.54755)	Top-1 acc 59.766 (66.686)	Top-5 acc 82.812 (85.769)	lr 0.00194
Train [99][1440/3239]	Time 0.266 (0.564)	Data Time 0.003 (0.026)	Loss 2.5667 (2.3820)	Entropy 0.54471 (0.54753)	Top-1 acc 59.766 (66.683)	Top-5 acc 82.422 (85.771)	lr 0.00194
Train [99][1450/3239]	Time 0.241 (0.563)	Data Time 0.002 (0.026)	Loss 2.3033 (2.3821)	Entropy 0.54499 (0.54751)	Top-1 acc 69.141 (66.682)	Top-5 acc 87.500 (85.766)	lr 0.00194
Train [99][1460/3239]	Time 0.230 (0.562)	Data Time 0.001 (0.026)	Loss 2.3219 (2.3821)	Entropy 0.54502 (0.54749)	Top-1 acc 66.797 (66.678)	Top-5 acc 85.938 (85.766)	lr 0.00194
Train [99][1470/3239]	Time 0.245 (0.561)	Data Time 0.002 (0.026)	Loss 2.3335 (2.3820)	Entropy 0.54488 (0.54747)	Top-1 acc 66.016 (66.685)	Top-5 acc 86.719 (85.770)	lr 0.00194
Train [99][1480/3239]	Time 0.231 (0.560)	Data Time 0.001 (0.026)	Loss 2.3129 (2.3817)	Entropy 0.54494 (0.54746)	Top-1 acc 69.531 (66.694)	Top-5 acc 87.109 (85.774)	lr 0.00194
Train [99][1490/3239]	Time 0.230 (0.559)	Data Time 0.001 (0.026)	Loss 2.2162 (2.3814)	Entropy 0.54509 (0.54744)	Top-1 acc 70.312 (66.701)	Top-5 acc 87.891 (85.782)	lr 0.00194
Train [99][1500/3239]	Time 0.333 (0.558)	Data Time 0.001 (0.025)	Loss 2.4413 (2.3813)	Entropy 0.54525 (0.54743)	Top-1 acc 65.625 (66.713)	Top-5 acc 83.984 (85.782)	lr 0.00193
Train [99][1510/3239]	Time 0.238 (0.557)	Data Time 0.002 (0.025)	Loss 2.3784 (2.3811)	Entropy 0.54554 (0.54741)	Top-1 acc 67.578 (66.716)	Top-5 acc 88.281 (85.787)	lr 0.00193
Train [99][1520/3239]	Time 0.276 (0.556)	Data Time 0.001 (0.025)	Loss 2.2312 (2.3812)	Entropy 0.54559 (0.54740)	Top-1 acc 71.094 (66.714)	Top-5 acc 85.547 (85.783)	lr 0.00193
Train [99][1530/3239]	Time 0.235 (0.555)	Data Time 0.001 (0.025)	Loss 2.4098 (2.3813)	Entropy 0.54539 (0.54739)	Top-1 acc 62.891 (66.715)	Top-5 acc 82.422 (85.779)	lr 0.00193
Train [99][1540/3239]	Time 0.230 (0.555)	Data Time 0.001 (0.025)	Loss 2.2978 (2.3811)	Entropy 0.54520 (0.54737)	Top-1 acc 67.188 (66.714)	Top-5 acc 88.281 (85.785)	lr 0.00193
Train [99][1550/3239]	Time 0.230 (0.554)	Data Time 0.001 (0.025)	Loss 2.3792 (2.3807)	Entropy 0.54525 (0.54736)	Top-1 acc 64.062 (66.721)	Top-5 acc 87.500 (85.793)	lr 0.00193
Train [99][1560/3239]	Time 0.234 (0.553)	Data Time 0.001 (0.024)	Loss 2.2461 (2.3807)	Entropy 0.54489 (0.54735)	Top-1 acc 67.969 (66.725)	Top-5 acc 88.281 (85.799)	lr 0.00193
Train [99][1570/3239]	Time 0.328 (0.552)	Data Time 0.001 (0.024)	Loss 2.5486 (2.3810)	Entropy 0.54491 (0.54733)	Top-1 acc 62.891 (66.718)	Top-5 acc 84.766 (85.795)	lr 0.00193
Train [99][1580/3239]	Time 0.231 (0.551)	Data Time 0.001 (0.024)	Loss 2.3908 (2.3813)	Entropy 0.54468 (0.54731)	Top-1 acc 67.188 (66.706)	Top-5 acc 86.328 (85.791)	lr 0.00193
Train [99][1590/3239]	Time 0.257 (0.550)	Data Time 0.001 (0.024)	Loss 2.4791 (2.3818)	Entropy 0.54485 (0.54730)	Top-1 acc 63.672 (66.696)	Top-5 acc 83.984 (85.781)	lr 0.00193
Train [99][1600/3239]	Time 0.226 (0.550)	Data Time 0.001 (0.024)	Loss 2.4195 (2.3818)	Entropy 0.54476 (0.54728)	Top-1 acc 67.578 (66.698)	Top-5 acc 85.547 (85.777)	lr 0.00193
Train [99][1610/3239]	Time 0.220 (0.549)	Data Time 0.001 (0.024)	Loss 2.2686 (2.3816)	Entropy 0.54478 (0.54727)	Top-1 acc 71.484 (66.706)	Top-5 acc 85.938 (85.779)	lr 0.00193
Train [99][1620/3239]	Time 0.217 (0.548)	Data Time 0.001 (0.024)	Loss 2.7347 (2.3818)	Entropy 0.54485 (0.54725)	Top-1 acc 59.375 (66.697)	Top-5 acc 80.859 (85.780)	lr 0.00193
Train [99][1630/3239]	Time 0.232 (0.547)	Data Time 0.001 (0.023)	Loss 2.3805 (2.3814)	Entropy 0.54487 (0.54724)	Top-1 acc 66.406 (66.705)	Top-5 acc 87.500 (85.787)	lr 0.00193
Train [99][1640/3239]	Time 0.229 (0.546)	Data Time 0.001 (0.023)	Loss 2.5765 (2.3817)	Entropy 0.54449 (0.54722)	Top-1 acc 65.625 (66.694)	Top-5 acc 82.812 (85.779)	lr 0.00193
Train [99][1650/3239]	Time 0.234 (0.546)	Data Time 0.001 (0.023)	Loss 2.2807 (2.3818)	Entropy 0.54466 (0.54720)	Top-1 acc 68.750 (66.694)	Top-5 acc 86.719 (85.778)	lr 0.00193
Train [99][1660/3239]	Time 0.327 (0.545)	Data Time 0.001 (0.023)	Loss 2.3650 (2.3817)	Entropy 0.54448 (0.54719)	Top-1 acc 67.188 (66.701)	Top-5 acc 87.109 (85.779)	lr 0.00193
Train [99][1670/3239]	Time 0.232 (0.544)	Data Time 0.001 (0.023)	Loss 2.3524 (2.3816)	Entropy 0.54457 (0.54717)	Top-1 acc 67.188 (66.703)	Top-5 acc 86.328 (85.776)	lr 0.00193
Train [99][1680/3239]	Time 0.277 (0.544)	Data Time 0.001 (0.023)	Loss 2.2987 (2.3812)	Entropy 0.54484 (0.54716)	Top-1 acc 66.797 (66.708)	Top-5 acc 84.375 (85.779)	lr 0.00193
Train [99][1690/3239]	Time 0.268 (0.544)	Data Time 0.001 (0.023)	Loss 2.5816 (2.3820)	Entropy 0.54459 (0.54714)	Top-1 acc 64.062 (66.686)	Top-5 acc 81.641 (85.769)	lr 0.00192
Train [99][1700/3239]	Time 0.233 (0.543)	Data Time 0.001 (0.023)	Loss 2.3018 (2.3823)	Entropy 0.54466 (0.54713)	Top-1 acc 67.188 (66.678)	Top-5 acc 86.328 (85.763)	lr 0.00192
Train [99][1710/3239]	Time 0.226 (0.542)	Data Time 0.001 (0.022)	Loss 2.3138 (2.3823)	Entropy 0.54445 (0.54711)	Top-1 acc 69.141 (66.684)	Top-5 acc 87.500 (85.759)	lr 0.00192
Train [99][1720/3239]	Time 0.225 (0.542)	Data Time 0.001 (0.022)	Loss 2.4759 (2.3829)	Entropy 0.54456 (0.54710)	Top-1 acc 67.188 (66.664)	Top-5 acc 83.203 (85.752)	lr 0.00192
Train [99][1730/3239]	Time 0.323 (0.541)	Data Time 0.001 (0.022)	Loss 2.2645 (2.3830)	Entropy 0.54433 (0.54708)	Top-1 acc 69.531 (66.664)	Top-5 acc 87.109 (85.749)	lr 0.00192
Train [99][1740/3239]	Time 0.216 (0.540)	Data Time 0.001 (0.022)	Loss 2.6452 (2.3834)	Entropy 0.54429 (0.54707)	Top-1 acc 60.156 (66.651)	Top-5 acc 81.250 (85.743)	lr 0.00192
Train [99][1750/3239]	Time 0.222 (0.539)	Data Time 0.001 (0.022)	Loss 2.4092 (2.3833)	Entropy 0.54421 (0.54705)	Top-1 acc 67.188 (66.656)	Top-5 acc 86.328 (85.743)	lr 0.00192
Train [99][1760/3239]	Time 0.230 (0.539)	Data Time 0.001 (0.022)	Loss 2.5826 (2.3835)	Entropy 0.54439 (0.54704)	Top-1 acc 62.500 (66.656)	Top-5 acc 81.250 (85.737)	lr 0.00192
Train [99][1770/3239]	Time 0.252 (0.538)	Data Time 0.001 (0.022)	Loss 2.4503 (2.3833)	Entropy 0.54463 (0.54702)	Top-1 acc 66.406 (66.662)	Top-5 acc 85.547 (85.742)	lr 0.00192
Train [99][1780/3239]	Time 0.219 (0.537)	Data Time 0.001 (0.022)	Loss 2.4327 (2.3833)	Entropy 0.54474 (0.54701)	Top-1 acc 65.234 (66.669)	Top-5 acc 83.594 (85.738)	lr 0.00192
Train [99][1790/3239]	Time 0.231 (0.537)	Data Time 0.001 (0.022)	Loss 2.3160 (2.3830)	Entropy 0.54476 (0.54700)	Top-1 acc 69.141 (66.678)	Top-5 acc 86.719 (85.743)	lr 0.00192
Train [99][1800/3239]	Time 0.230 (0.536)	Data Time 0.001 (0.021)	Loss 2.6612 (2.3830)	Entropy 0.54500 (0.54698)	Top-1 acc 57.812 (66.676)	Top-5 acc 78.906 (85.735)	lr 0.00192
Train [99][1810/3239]	Time 0.230 (0.535)	Data Time 0.001 (0.021)	Loss 2.5466 (2.3828)	Entropy 0.54524 (0.54697)	Top-1 acc 62.500 (66.678)	Top-5 acc 82.031 (85.737)	lr 0.00192
Train [99][1820/3239]	Time 0.321 (0.535)	Data Time 0.001 (0.021)	Loss 2.3770 (2.3829)	Entropy 0.54518 (0.54696)	Top-1 acc 67.188 (66.675)	Top-5 acc 84.375 (85.738)	lr 0.00192
Train [99][1830/3239]	Time 0.234 (0.534)	Data Time 0.001 (0.021)	Loss 2.3673 (2.3828)	Entropy 0.54511 (0.54695)	Top-1 acc 65.625 (66.676)	Top-5 acc 86.719 (85.741)	lr 0.00192
Train [99][1840/3239]	Time 0.221 (0.533)	Data Time 0.001 (0.021)	Loss 2.5335 (2.3826)	Entropy 0.54542 (0.54694)	Top-1 acc 63.281 (66.678)	Top-5 acc 83.594 (85.743)	lr 0.00192
Train [99][1850/3239]	Time 0.211 (0.533)	Data Time 0.001 (0.021)	Loss 2.4534 (2.3826)	Entropy 0.54567 (0.54694)	Top-1 acc 64.844 (66.672)	Top-5 acc 83.594 (85.743)	lr 0.00192
Train [99][1860/3239]	Time 0.233 (0.532)	Data Time 0.001 (0.021)	Loss 2.1309 (2.3824)	Entropy 0.54574 (0.54693)	Top-1 acc 73.438 (66.672)	Top-5 acc 88.672 (85.746)	lr 0.00192
Train [99][1870/3239]	Time 0.248 (0.531)	Data Time 0.001 (0.021)	Loss 2.3236 (2.3824)	Entropy 0.54566 (0.54692)	Top-1 acc 70.312 (66.681)	Top-5 acc 86.719 (85.741)	lr 0.00191
Train [99][1880/3239]	Time 0.228 (0.531)	Data Time 0.001 (0.021)	Loss 2.3394 (2.3824)	Entropy 0.54587 (0.54692)	Top-1 acc 66.406 (66.679)	Top-5 acc 83.203 (85.737)	lr 0.00191
Train [99][1890/3239]	Time 0.348 (0.530)	Data Time 0.001 (0.020)	Loss 2.6102 (2.3822)	Entropy 0.54597 (0.54691)	Top-1 acc 57.422 (66.687)	Top-5 acc 82.812 (85.739)	lr 0.00191
Train [99][1900/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.020)	Loss 2.3833 (2.3823)	Entropy 0.54585 (0.54691)	Top-1 acc 66.797 (66.683)	Top-5 acc 85.156 (85.737)	lr 0.00191
Train [99][1910/3239]	Time 0.240 (0.529)	Data Time 0.001 (0.020)	Loss 2.2288 (2.3824)	Entropy 0.54582 (0.54690)	Top-1 acc 71.484 (66.683)	Top-5 acc 87.500 (85.734)	lr 0.00191
Train [99][1920/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.020)	Loss 2.4762 (2.3823)	Entropy 0.54584 (0.54690)	Top-1 acc 64.062 (66.687)	Top-5 acc 84.375 (85.739)	lr 0.00191
Train [99][1930/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.020)	Loss 2.1349 (2.3823)	Entropy 0.54582 (0.54689)	Top-1 acc 74.609 (66.689)	Top-5 acc 88.672 (85.736)	lr 0.00191
Train [99][1940/3239]	Time 0.236 (0.528)	Data Time 0.001 (0.020)	Loss 2.4490 (2.3822)	Entropy 0.54579 (0.54689)	Top-1 acc 64.844 (66.698)	Top-5 acc 85.938 (85.735)	lr 0.00191
Train [99][1950/3239]	Time 0.229 (0.527)	Data Time 0.001 (0.020)	Loss 2.5387 (2.3824)	Entropy 0.54596 (0.54688)	Top-1 acc 60.156 (66.685)	Top-5 acc 83.594 (85.727)	lr 0.00191
Train [99][1960/3239]	Time 0.226 (0.526)	Data Time 0.001 (0.020)	Loss 2.5123 (2.3825)	Entropy 0.54614 (0.54688)	Top-1 acc 63.281 (66.684)	Top-5 acc 82.422 (85.726)	lr 0.00191
Train [99][1970/3239]	Time 0.230 (0.526)	Data Time 0.001 (0.020)	Loss 2.4388 (2.3824)	Entropy 0.54639 (0.54687)	Top-1 acc 62.891 (66.687)	Top-5 acc 85.547 (85.733)	lr 0.00191
Train [99][1980/3239]	Time 0.265 (0.525)	Data Time 0.001 (0.020)	Loss 2.4865 (2.3826)	Entropy 0.54660 (0.54687)	Top-1 acc 64.453 (66.679)	Top-5 acc 83.984 (85.731)	lr 0.00191
Train [99][1990/3239]	Time 0.225 (0.525)	Data Time 0.001 (0.020)	Loss 2.4335 (2.3828)	Entropy 0.54611 (0.54687)	Top-1 acc 67.188 (66.681)	Top-5 acc 85.156 (85.727)	lr 0.00191
Train [99][2000/3239]	Time 0.242 (0.524)	Data Time 0.001 (0.019)	Loss 2.4230 (2.3828)	Entropy 0.54604 (0.54686)	Top-1 acc 62.891 (66.675)	Top-5 acc 86.719 (85.724)	lr 0.00191
Train [99][2010/3239]	Time 0.319 (0.524)	Data Time 0.009 (0.019)	Loss 2.1586 (2.3826)	Entropy 0.54590 (0.54686)	Top-1 acc 75.000 (66.682)	Top-5 acc 88.672 (85.726)	lr 0.00191
Train [99][2020/3239]	Time 0.219 (0.524)	Data Time 0.001 (0.019)	Loss 2.5416 (2.3823)	Entropy 0.54607 (0.54686)	Top-1 acc 61.719 (66.691)	Top-5 acc 82.422 (85.732)	lr 0.00191
Train [99][2030/3239]	Time 0.237 (0.523)	Data Time 0.001 (0.019)	Loss 2.3520 (2.3823)	Entropy 0.54597 (0.54685)	Top-1 acc 68.750 (66.691)	Top-5 acc 85.938 (85.733)	lr 0.00191
Train [99][2040/3239]	Time 0.228 (0.523)	Data Time 0.001 (0.019)	Loss 2.4211 (2.3822)	Entropy 0.54631 (0.54685)	Top-1 acc 69.141 (66.697)	Top-5 acc 84.375 (85.734)	lr 0.00191
Train [99][2050/3239]	Time 0.322 (0.522)	Data Time 0.001 (0.019)	Loss 2.4024 (2.3820)	Entropy 0.54621 (0.54684)	Top-1 acc 67.969 (66.701)	Top-5 acc 84.766 (85.735)	lr 0.00191
Train [99][2060/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.019)	Loss 2.2414 (2.3817)	Entropy 0.54600 (0.54684)	Top-1 acc 70.703 (66.707)	Top-5 acc 88.672 (85.740)	lr 0.00190
Train [99][2070/3239]	Time 0.231 (0.521)	Data Time 0.001 (0.019)	Loss 2.5073 (2.3818)	Entropy 0.54569 (0.54684)	Top-1 acc 64.844 (66.706)	Top-5 acc 84.766 (85.738)	lr 0.00190
Train [99][2080/3239]	Time 0.233 (0.521)	Data Time 0.001 (0.019)	Loss 2.4863 (2.3818)	Entropy 0.54585 (0.54683)	Top-1 acc 64.453 (66.704)	Top-5 acc 84.766 (85.738)	lr 0.00190
Train [99][2090/3239]	Time 0.360 (0.546)	Data Time 0.004 (0.019)	Loss 2.2500 (2.3818)	Entropy 0.54571 (0.54683)	Top-1 acc 69.922 (66.705)	Top-5 acc 87.500 (85.738)	lr 0.00190
Train [99][2100/3239]	Time 0.245 (0.546)	Data Time 0.002 (0.019)	Loss 2.4289 (2.3819)	Entropy 0.54561 (0.54682)	Top-1 acc 67.578 (66.704)	Top-5 acc 85.547 (85.738)	lr 0.00190
Train [99][2110/3239]	Time 0.238 (0.545)	Data Time 0.001 (0.019)	Loss 2.3291 (2.3826)	Entropy 0.54556 (0.54682)	Top-1 acc 67.578 (66.689)	Top-5 acc 84.766 (85.730)	lr 0.00190
Train [99][2120/3239]	Time 0.233 (0.545)	Data Time 0.001 (0.018)	Loss 2.2285 (2.3825)	Entropy 0.54548 (0.54681)	Top-1 acc 69.531 (66.682)	Top-5 acc 89.062 (85.734)	lr 0.00190
Train [99][2130/3239]	Time 0.239 (0.544)	Data Time 0.001 (0.018)	Loss 2.3168 (2.3826)	Entropy 0.54563 (0.54680)	Top-1 acc 66.797 (66.675)	Top-5 acc 85.547 (85.733)	lr 0.00190
Train [99][2140/3239]	Time 0.259 (0.544)	Data Time 0.001 (0.018)	Loss 2.2725 (2.3827)	Entropy 0.54538 (0.54680)	Top-1 acc 68.750 (66.672)	Top-5 acc 89.062 (85.731)	lr 0.00190
Train [99][2150/3239]	Time 0.228 (0.543)	Data Time 0.001 (0.018)	Loss 2.3690 (2.3828)	Entropy 0.54502 (0.54679)	Top-1 acc 66.016 (66.665)	Top-5 acc 85.938 (85.728)	lr 0.00190
Train [99][2160/3239]	Time 0.231 (0.543)	Data Time 0.001 (0.018)	Loss 2.2666 (2.3830)	Entropy 0.54486 (0.54678)	Top-1 acc 64.453 (66.661)	Top-5 acc 88.281 (85.725)	lr 0.00190
Train [99][2170/3239]	Time 0.234 (0.542)	Data Time 0.001 (0.018)	Loss 2.2670 (2.3829)	Entropy 0.54481 (0.54677)	Top-1 acc 69.141 (66.663)	Top-5 acc 88.672 (85.726)	lr 0.00190
Train [99][2180/3239]	Time 0.215 (0.541)	Data Time 0.001 (0.018)	Loss 2.4279 (2.3827)	Entropy 0.54504 (0.54676)	Top-1 acc 65.234 (66.668)	Top-5 acc 83.984 (85.732)	lr 0.00190
Train [99][2190/3239]	Time 0.416 (0.541)	Data Time 0.002 (0.018)	Loss 2.3790 (2.3827)	Entropy 0.54519 (0.54676)	Top-1 acc 66.406 (66.664)	Top-5 acc 86.328 (85.729)	lr 0.00190
Train [99][2200/3239]	Time 0.240 (0.541)	Data Time 0.001 (0.018)	Loss 2.2302 (2.3826)	Entropy 0.54547 (0.54675)	Top-1 acc 71.875 (66.669)	Top-5 acc 87.891 (85.732)	lr 0.00190
Train [99][2210/3239]	Time 0.327 (0.540)	Data Time 0.001 (0.018)	Loss 2.3465 (2.3826)	Entropy 0.54548 (0.54674)	Top-1 acc 64.844 (66.665)	Top-5 acc 86.328 (85.729)	lr 0.00190
Train [99][2220/3239]	Time 0.232 (0.540)	Data Time 0.001 (0.018)	Loss 2.3689 (2.3825)	Entropy 0.54568 (0.54674)	Top-1 acc 68.359 (66.666)	Top-5 acc 85.156 (85.725)	lr 0.00190
Train [99][2230/3239]	Time 0.238 (0.539)	Data Time 0.001 (0.018)	Loss 2.4266 (2.3825)	Entropy 0.54539 (0.54673)	Top-1 acc 64.844 (66.668)	Top-5 acc 87.500 (85.726)	lr 0.00190
Train [99][2240/3239]	Time 0.239 (0.539)	Data Time 0.001 (0.018)	Loss 2.5284 (2.3825)	Entropy 0.54538 (0.54673)	Top-1 acc 62.891 (66.668)	Top-5 acc 80.859 (85.725)	lr 0.00190
Train [99][2250/3239]	Time 0.226 (0.538)	Data Time 0.001 (0.017)	Loss 2.3421 (2.3822)	Entropy 0.54557 (0.54672)	Top-1 acc 72.266 (66.677)	Top-5 acc 87.891 (85.732)	lr 0.00189
Train [99][2260/3239]	Time 0.235 (0.538)	Data Time 0.001 (0.017)	Loss 2.2305 (2.3822)	Entropy 0.54544 (0.54672)	Top-1 acc 72.266 (66.680)	Top-5 acc 86.328 (85.731)	lr 0.00189
Train [99][2270/3239]	Time 0.234 (0.537)	Data Time 0.001 (0.017)	Loss 2.6093 (2.3825)	Entropy 0.54587 (0.54671)	Top-1 acc 64.062 (66.676)	Top-5 acc 80.078 (85.727)	lr 0.00189
Train [99][2280/3239]	Time 0.367 (0.537)	Data Time 0.001 (0.017)	Loss 2.4680 (2.3823)	Entropy 0.54609 (0.54671)	Top-1 acc 64.844 (66.678)	Top-5 acc 80.859 (85.727)	lr 0.00189
Train [99][2290/3239]	Time 0.223 (0.537)	Data Time 0.001 (0.017)	Loss 2.3329 (2.3822)	Entropy 0.54574 (0.54670)	Top-1 acc 68.750 (66.684)	Top-5 acc 84.375 (85.727)	lr 0.00189
Train [99][2300/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.017)	Loss 2.4047 (2.3824)	Entropy 0.54559 (0.54670)	Top-1 acc 67.578 (66.678)	Top-5 acc 83.984 (85.721)	lr 0.00189
Train [99][2310/3239]	Time 0.264 (0.536)	Data Time 0.001 (0.017)	Loss 2.2802 (2.3823)	Entropy 0.54577 (0.54670)	Top-1 acc 69.922 (66.674)	Top-5 acc 87.109 (85.722)	lr 0.00189
Train [99][2320/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.017)	Loss 2.4441 (2.3823)	Entropy 0.54599 (0.54669)	Top-1 acc 63.672 (66.675)	Top-5 acc 84.375 (85.718)	lr 0.00189
Train [99][2330/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.017)	Loss 2.2029 (2.3826)	Entropy 0.54565 (0.54669)	Top-1 acc 72.266 (66.672)	Top-5 acc 88.672 (85.711)	lr 0.00189
Train [99][2340/3239]	Time 0.243 (0.534)	Data Time 0.002 (0.017)	Loss 2.2230 (2.3825)	Entropy 0.54583 (0.54668)	Top-1 acc 72.266 (66.673)	Top-5 acc 90.625 (85.714)	lr 0.00189
Train [99][2350/3239]	Time 0.231 (0.534)	Data Time 0.001 (0.017)	Loss 2.2267 (2.3822)	Entropy 0.54621 (0.54668)	Top-1 acc 67.578 (66.680)	Top-5 acc 88.672 (85.722)	lr 0.00189
Train [99][2360/3239]	Time 0.227 (0.533)	Data Time 0.001 (0.017)	Loss 2.3393 (2.3823)	Entropy 0.54629 (0.54668)	Top-1 acc 69.141 (66.676)	Top-5 acc 86.328 (85.719)	lr 0.00189
Train [99][2370/3239]	Time 0.322 (0.533)	Data Time 0.001 (0.017)	Loss 2.3917 (2.3822)	Entropy 0.54609 (0.54668)	Top-1 acc 67.578 (66.679)	Top-5 acc 83.594 (85.721)	lr 0.00189
Train [99][2380/3239]	Time 0.229 (0.532)	Data Time 0.001 (0.017)	Loss 2.3828 (2.3822)	Entropy 0.54596 (0.54667)	Top-1 acc 65.625 (66.679)	Top-5 acc 83.984 (85.719)	lr 0.00189
Train [99][2390/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.017)	Loss 2.4175 (2.3820)	Entropy 0.54591 (0.54667)	Top-1 acc 66.016 (66.681)	Top-5 acc 87.109 (85.723)	lr 0.00189
Train [99][2400/3239]	Time 0.237 (0.531)	Data Time 0.001 (0.016)	Loss 2.5751 (2.3818)	Entropy 0.54554 (0.54667)	Top-1 acc 64.844 (66.690)	Top-5 acc 82.812 (85.726)	lr 0.00189
Train [99][2410/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.016)	Loss 2.2754 (2.3818)	Entropy 0.54555 (0.54666)	Top-1 acc 67.188 (66.691)	Top-5 acc 87.109 (85.727)	lr 0.00189
Train [99][2420/3239]	Time 0.248 (0.530)	Data Time 0.001 (0.016)	Loss 2.2730 (2.3817)	Entropy 0.54531 (0.54666)	Top-1 acc 71.094 (66.693)	Top-5 acc 89.062 (85.729)	lr 0.00189
Train [99][2430/3239]	Time 0.234 (0.530)	Data Time 0.001 (0.016)	Loss 2.2845 (2.3818)	Entropy 0.54562 (0.54665)	Top-1 acc 70.312 (66.691)	Top-5 acc 85.547 (85.726)	lr 0.00188
Train [99][2440/3239]	Time 0.363 (0.530)	Data Time 0.039 (0.016)	Loss 2.4139 (2.3816)	Entropy 0.54576 (0.54665)	Top-1 acc 66.406 (66.689)	Top-5 acc 85.156 (85.730)	lr 0.00188
Train [99][2450/3239]	Time 0.230 (0.529)	Data Time 0.001 (0.016)	Loss 2.2609 (2.3818)	Entropy 0.54560 (0.54665)	Top-1 acc 69.141 (66.681)	Top-5 acc 85.547 (85.729)	lr 0.00188
Train [99][2460/3239]	Time 0.286 (0.529)	Data Time 0.001 (0.016)	Loss 2.3426 (2.3816)	Entropy 0.54545 (0.54664)	Top-1 acc 68.750 (66.686)	Top-5 acc 87.109 (85.735)	lr 0.00188
Train [99][2470/3239]	Time 0.312 (0.529)	Data Time 0.001 (0.016)	Loss 2.5077 (2.3818)	Entropy 0.54522 (0.54664)	Top-1 acc 64.844 (66.683)	Top-5 acc 86.328 (85.733)	lr 0.00188
Train [99][2480/3239]	Time 0.238 (0.529)	Data Time 0.001 (0.016)	Loss 2.1850 (2.3818)	Entropy 0.54505 (0.54663)	Top-1 acc 75.391 (66.677)	Top-5 acc 87.500 (85.731)	lr 0.00188
Train [99][2490/3239]	Time 0.229 (0.528)	Data Time 0.001 (0.016)	Loss 2.3060 (2.3818)	Entropy 0.54488 (0.54662)	Top-1 acc 68.750 (66.676)	Top-5 acc 87.500 (85.730)	lr 0.00188
Train [99][2500/3239]	Time 0.227 (0.528)	Data Time 0.001 (0.016)	Loss 2.3728 (2.3818)	Entropy 0.54491 (0.54662)	Top-1 acc 64.062 (66.678)	Top-5 acc 85.156 (85.731)	lr 0.00188
Train [99][2510/3239]	Time 0.235 (0.527)	Data Time 0.001 (0.016)	Loss 2.1259 (2.3817)	Entropy 0.54478 (0.54661)	Top-1 acc 72.656 (66.676)	Top-5 acc 92.188 (85.734)	lr 0.00188
Train [99][2520/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.016)	Loss 2.3769 (2.3819)	Entropy 0.54501 (0.54660)	Top-1 acc 70.703 (66.672)	Top-5 acc 83.984 (85.729)	lr 0.00188
Train [99][2530/3239]	Time 0.244 (0.527)	Data Time 0.001 (0.016)	Loss 2.2619 (2.3818)	Entropy 0.54510 (0.54660)	Top-1 acc 68.750 (66.673)	Top-5 acc 87.891 (85.731)	lr 0.00188
Train [99][2540/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.016)	Loss 2.4446 (2.3816)	Entropy 0.54471 (0.54659)	Top-1 acc 64.453 (66.676)	Top-5 acc 85.547 (85.734)	lr 0.00188
Train [99][2550/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.016)	Loss 2.3160 (2.3815)	Entropy 0.54425 (0.54658)	Top-1 acc 68.359 (66.679)	Top-5 acc 86.719 (85.738)	lr 0.00188
Train [99][2560/3239]	Time 0.220 (0.525)	Data Time 0.001 (0.016)	Loss 2.2740 (2.3815)	Entropy 0.54439 (0.54657)	Top-1 acc 69.922 (66.677)	Top-5 acc 85.938 (85.737)	lr 0.00188
Train [99][2570/3239]	Time 0.224 (0.525)	Data Time 0.001 (0.016)	Loss 2.3629 (2.3816)	Entropy 0.54439 (0.54657)	Top-1 acc 65.234 (66.674)	Top-5 acc 84.766 (85.735)	lr 0.00188
Train [99][2580/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.015)	Loss 2.1845 (2.3816)	Entropy 0.54433 (0.54656)	Top-1 acc 70.703 (66.672)	Top-5 acc 90.625 (85.736)	lr 0.00188
Train [99][2590/3239]	Time 0.258 (0.524)	Data Time 0.001 (0.015)	Loss 2.3404 (2.3817)	Entropy 0.54447 (0.54655)	Top-1 acc 67.188 (66.667)	Top-5 acc 87.891 (85.737)	lr 0.00188
Train [99][2600/3239]	Time 0.321 (0.524)	Data Time 0.001 (0.015)	Loss 2.4549 (2.3817)	Entropy 0.54444 (0.54654)	Top-1 acc 65.234 (66.669)	Top-5 acc 84.375 (85.739)	lr 0.00188
Train [99][2610/3239]	Time 0.278 (0.523)	Data Time 0.002 (0.015)	Loss 2.2292 (2.3813)	Entropy 0.54409 (0.54653)	Top-1 acc 70.312 (66.676)	Top-5 acc 87.891 (85.749)	lr 0.00188
Train [99][2620/3239]	Time 0.241 (0.523)	Data Time 0.002 (0.015)	Loss 2.5833 (2.3813)	Entropy 0.54390 (0.54652)	Top-1 acc 60.547 (66.676)	Top-5 acc 80.469 (85.748)	lr 0.00187
Train [99][2630/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.015)	Loss 2.0687 (2.3811)	Entropy 0.54364 (0.54651)	Top-1 acc 74.219 (66.681)	Top-5 acc 90.625 (85.750)	lr 0.00187
Train [99][2640/3239]	Time 0.214 (0.523)	Data Time 0.001 (0.015)	Loss 2.6981 (2.3811)	Entropy 0.54358 (0.54650)	Top-1 acc 57.031 (66.677)	Top-5 acc 80.859 (85.748)	lr 0.00187
Train [99][2650/3239]	Time 0.248 (0.522)	Data Time 0.001 (0.015)	Loss 2.2756 (2.3809)	Entropy 0.54331 (0.54649)	Top-1 acc 70.312 (66.686)	Top-5 acc 87.109 (85.750)	lr 0.00187
Train [99][2660/3239]	Time 0.265 (0.522)	Data Time 0.001 (0.015)	Loss 2.2935 (2.3810)	Entropy 0.54336 (0.54648)	Top-1 acc 69.141 (66.681)	Top-5 acc 87.500 (85.749)	lr 0.00187
Train [99][2670/3239]	Time 0.359 (0.521)	Data Time 0.001 (0.015)	Loss 2.3222 (2.3808)	Entropy 0.54320 (0.54647)	Top-1 acc 67.578 (66.687)	Top-5 acc 85.156 (85.753)	lr 0.00187
Train [99][2680/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.015)	Loss 2.4298 (2.3810)	Entropy 0.54316 (0.54645)	Top-1 acc 65.625 (66.683)	Top-5 acc 85.547 (85.748)	lr 0.00187
Train [99][2690/3239]	Time 0.222 (0.521)	Data Time 0.001 (0.015)	Loss 2.2499 (2.3808)	Entropy 0.54294 (0.54644)	Top-1 acc 68.750 (66.683)	Top-5 acc 87.500 (85.749)	lr 0.00187
Train [99][2700/3239]	Time 0.226 (0.520)	Data Time 0.001 (0.015)	Loss 2.4997 (2.3808)	Entropy 0.54278 (0.54643)	Top-1 acc 63.281 (66.686)	Top-5 acc 83.984 (85.750)	lr 0.00187
Train [99][2710/3239]	Time 0.223 (0.520)	Data Time 0.002 (0.015)	Loss 2.3797 (2.3807)	Entropy 0.54286 (0.54642)	Top-1 acc 67.578 (66.684)	Top-5 acc 88.281 (85.752)	lr 0.00187
Train [99][2720/3239]	Time 0.219 (0.520)	Data Time 0.001 (0.015)	Loss 2.5174 (2.3806)	Entropy 0.54240 (0.54640)	Top-1 acc 63.672 (66.687)	Top-5 acc 85.938 (85.754)	lr 0.00187
Train [99][2730/3239]	Time 0.229 (0.519)	Data Time 0.001 (0.015)	Loss 2.4168 (2.3807)	Entropy 0.54235 (0.54639)	Top-1 acc 61.328 (66.683)	Top-5 acc 84.766 (85.754)	lr 0.00187
Train [99][2740/3239]	Time 0.234 (0.519)	Data Time 0.001 (0.015)	Loss 2.1891 (2.3808)	Entropy 0.54200 (0.54637)	Top-1 acc 69.922 (66.679)	Top-5 acc 90.234 (85.754)	lr 0.00187
Train [99][2750/3239]	Time 0.339 (0.538)	Data Time 0.025 (0.015)	Loss 2.3285 (2.3806)	Entropy 0.54194 (0.54636)	Top-1 acc 69.141 (66.688)	Top-5 acc 83.984 (85.756)	lr 0.00187
Train [99][2760/3239]	Time 0.336 (0.537)	Data Time 0.002 (0.015)	Loss 2.2972 (2.3804)	Entropy 0.54175 (0.54634)	Top-1 acc 68.750 (66.693)	Top-5 acc 87.891 (85.758)	lr 0.00187
Train [99][2770/3239]	Time 0.271 (0.537)	Data Time 0.002 (0.015)	Loss 2.2284 (2.3801)	Entropy 0.54200 (0.54632)	Top-1 acc 67.578 (66.698)	Top-5 acc 88.672 (85.760)	lr 0.00187
Train [99][2780/3239]	Time 0.246 (0.537)	Data Time 0.001 (0.014)	Loss 2.3007 (2.3800)	Entropy 0.54220 (0.54631)	Top-1 acc 67.188 (66.699)	Top-5 acc 88.281 (85.762)	lr 0.00187
Train [99][2790/3239]	Time 0.229 (0.536)	Data Time 0.001 (0.014)	Loss 2.4821 (2.3800)	Entropy 0.54249 (0.54629)	Top-1 acc 62.891 (66.699)	Top-5 acc 85.547 (85.762)	lr 0.00187
Train [99][2800/3239]	Time 0.284 (0.536)	Data Time 0.002 (0.014)	Loss 2.4171 (2.3804)	Entropy 0.54276 (0.54628)	Top-1 acc 64.453 (66.689)	Top-5 acc 85.547 (85.754)	lr 0.00187
Train [99][2810/3239]	Time 0.250 (0.536)	Data Time 0.001 (0.014)	Loss 2.6091 (2.3804)	Entropy 0.54299 (0.54627)	Top-1 acc 63.672 (66.688)	Top-5 acc 81.641 (85.755)	lr 0.00186
Train [99][2820/3239]	Time 0.231 (0.536)	Data Time 0.001 (0.014)	Loss 2.3977 (2.3803)	Entropy 0.54290 (0.54626)	Top-1 acc 60.938 (66.687)	Top-5 acc 83.984 (85.754)	lr 0.00186
Train [99][2830/3239]	Time 0.346 (0.535)	Data Time 0.001 (0.014)	Loss 2.2402 (2.3806)	Entropy 0.54257 (0.54624)	Top-1 acc 71.875 (66.681)	Top-5 acc 86.328 (85.751)	lr 0.00186
Train [99][2840/3239]	Time 0.236 (0.535)	Data Time 0.001 (0.014)	Loss 2.2453 (2.3806)	Entropy 0.54294 (0.54623)	Top-1 acc 69.141 (66.682)	Top-5 acc 89.844 (85.752)	lr 0.00186
Train [99][2850/3239]	Time 0.245 (0.535)	Data Time 0.001 (0.014)	Loss 2.2450 (2.3805)	Entropy 0.54318 (0.54622)	Top-1 acc 67.969 (66.684)	Top-5 acc 88.672 (85.754)	lr 0.00186
Train [99][2860/3239]	Time 0.239 (0.534)	Data Time 0.001 (0.014)	Loss 2.6417 (2.3803)	Entropy 0.54325 (0.54621)	Top-1 acc 62.109 (66.687)	Top-5 acc 83.203 (85.758)	lr 0.00186
Train [99][2870/3239]	Time 0.236 (0.534)	Data Time 0.001 (0.014)	Loss 2.2722 (2.3807)	Entropy 0.54358 (0.54620)	Top-1 acc 69.922 (66.681)	Top-5 acc 88.281 (85.751)	lr 0.00186
Train [99][2880/3239]	Time 0.228 (0.533)	Data Time 0.001 (0.014)	Loss 2.3803 (2.3805)	Entropy 0.54316 (0.54619)	Top-1 acc 64.453 (66.685)	Top-5 acc 86.719 (85.751)	lr 0.00186
Train [99][2890/3239]	Time 0.233 (0.533)	Data Time 0.001 (0.014)	Loss 2.5694 (2.3806)	Entropy 0.54321 (0.54618)	Top-1 acc 61.719 (66.679)	Top-5 acc 82.031 (85.747)	lr 0.00186
Train [99][2900/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.014)	Loss 2.3389 (2.3806)	Entropy 0.54314 (0.54617)	Top-1 acc 66.406 (66.680)	Top-5 acc 86.719 (85.749)	lr 0.00186
Train [99][2910/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.014)	Loss 2.2714 (2.3806)	Entropy 0.54335 (0.54616)	Top-1 acc 68.359 (66.681)	Top-5 acc 89.453 (85.751)	lr 0.00186
Train [99][2920/3239]	Time 0.340 (0.532)	Data Time 0.001 (0.014)	Loss 2.3636 (2.3804)	Entropy 0.54325 (0.54615)	Top-1 acc 68.750 (66.684)	Top-5 acc 88.672 (85.755)	lr 0.00186
Train [99][2930/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.014)	Loss 2.4602 (2.3803)	Entropy 0.54310 (0.54614)	Top-1 acc 65.234 (66.684)	Top-5 acc 83.984 (85.755)	lr 0.00186
Train [99][2940/3239]	Time 0.222 (0.531)	Data Time 0.001 (0.014)	Loss 2.4012 (2.3802)	Entropy 0.54336 (0.54613)	Top-1 acc 65.234 (66.687)	Top-5 acc 85.156 (85.755)	lr 0.00186
Train [99][2950/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.014)	Loss 2.3936 (2.3802)	Entropy 0.54349 (0.54612)	Top-1 acc 66.797 (66.684)	Top-5 acc 86.328 (85.754)	lr 0.00186
Train [99][2960/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.014)	Loss 2.4098 (2.3800)	Entropy 0.54394 (0.54611)	Top-1 acc 64.062 (66.688)	Top-5 acc 86.328 (85.759)	lr 0.00186
Train [99][2970/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.014)	Loss 2.2185 (2.3797)	Entropy 0.54407 (0.54611)	Top-1 acc 71.094 (66.695)	Top-5 acc 89.844 (85.764)	lr 0.00186
Train [99][2980/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.014)	Loss 2.2713 (2.3794)	Entropy 0.54412 (0.54610)	Top-1 acc 71.094 (66.703)	Top-5 acc 85.547 (85.771)	lr 0.00186
Train [99][2990/3239]	Time 0.333 (0.529)	Data Time 0.001 (0.014)	Loss 2.5813 (2.3792)	Entropy 0.54411 (0.54609)	Top-1 acc 62.500 (66.705)	Top-5 acc 83.594 (85.775)	lr 0.00186
Train [99][3000/3239]	Time 0.226 (0.529)	Data Time 0.001 (0.014)	Loss 2.5144 (2.3791)	Entropy 0.54426 (0.54609)	Top-1 acc 64.844 (66.706)	Top-5 acc 83.984 (85.779)	lr 0.00185
Train [99][3010/3239]	Time 0.256 (0.529)	Data Time 0.001 (0.014)	Loss 2.1608 (2.3789)	Entropy 0.54449 (0.54608)	Top-1 acc 69.922 (66.711)	Top-5 acc 91.797 (85.782)	lr 0.00185
Train [99][3020/3239]	Time 0.245 (0.528)	Data Time 0.001 (0.013)	Loss 2.2193 (2.3789)	Entropy 0.54480 (0.54607)	Top-1 acc 72.656 (66.712)	Top-5 acc 89.062 (85.781)	lr 0.00185
Train [99][3030/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.013)	Loss 2.4989 (2.3791)	Entropy 0.54434 (0.54607)	Top-1 acc 65.234 (66.708)	Top-5 acc 83.203 (85.777)	lr 0.00185
Train [99][3040/3239]	Time 0.226 (0.528)	Data Time 0.001 (0.013)	Loss 2.5975 (2.3796)	Entropy 0.54453 (0.54606)	Top-1 acc 60.156 (66.695)	Top-5 acc 84.375 (85.768)	lr 0.00185
Train [99][3050/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.013)	Loss 2.1808 (2.3797)	Entropy 0.54489 (0.54606)	Top-1 acc 71.094 (66.690)	Top-5 acc 89.062 (85.766)	lr 0.00185
Train [99][3060/3239]	Time 0.223 (0.527)	Data Time 0.001 (0.013)	Loss 2.2853 (2.3794)	Entropy 0.54496 (0.54606)	Top-1 acc 68.359 (66.699)	Top-5 acc 87.109 (85.770)	lr 0.00185
Train [99][3070/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.013)	Loss 2.4821 (2.3796)	Entropy 0.54496 (0.54605)	Top-1 acc 65.234 (66.691)	Top-5 acc 83.984 (85.767)	lr 0.00185
Train [99][3080/3239]	Time 0.327 (0.526)	Data Time 0.001 (0.013)	Loss 2.3951 (2.3795)	Entropy 0.54514 (0.54605)	Top-1 acc 64.453 (66.695)	Top-5 acc 84.766 (85.770)	lr 0.00185
Train [99][3090/3239]	Time 0.246 (0.526)	Data Time 0.001 (0.013)	Loss 2.5260 (2.3796)	Entropy 0.54532 (0.54605)	Top-1 acc 65.625 (66.695)	Top-5 acc 84.766 (85.770)	lr 0.00185
Train [99][3100/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.013)	Loss 2.3959 (2.3796)	Entropy 0.54582 (0.54604)	Top-1 acc 65.234 (66.694)	Top-5 acc 83.984 (85.768)	lr 0.00185
Train [99][3110/3239]	Time 0.264 (0.525)	Data Time 0.002 (0.013)	Loss 2.5185 (2.3796)	Entropy 0.54564 (0.54604)	Top-1 acc 66.406 (66.693)	Top-5 acc 83.203 (85.769)	lr 0.00185
Train [99][3120/3239]	Time 0.264 (0.525)	Data Time 0.001 (0.013)	Loss 2.5258 (2.3794)	Entropy 0.54571 (0.54604)	Top-1 acc 63.672 (66.700)	Top-5 acc 82.812 (85.770)	lr 0.00185
Train [99][3130/3239]	Time 0.241 (0.525)	Data Time 0.001 (0.013)	Loss 2.3498 (2.3794)	Entropy 0.54563 (0.54604)	Top-1 acc 66.406 (66.700)	Top-5 acc 85.156 (85.769)	lr 0.00185
Train [99][3140/3239]	Time 0.255 (0.525)	Data Time 0.001 (0.013)	Loss 2.3988 (2.3795)	Entropy 0.54535 (0.54604)	Top-1 acc 67.969 (66.700)	Top-5 acc 85.156 (85.767)	lr 0.00185
Train [99][3150/3239]	Time 0.332 (0.524)	Data Time 0.001 (0.013)	Loss 2.5176 (2.3796)	Entropy 0.54504 (0.54604)	Top-1 acc 65.234 (66.696)	Top-5 acc 85.938 (85.768)	lr 0.00185
Train [99][3160/3239]	Time 0.229 (0.524)	Data Time 0.001 (0.013)	Loss 2.4007 (2.3794)	Entropy 0.54523 (0.54603)	Top-1 acc 66.797 (66.701)	Top-5 acc 85.547 (85.771)	lr 0.00185
Train [99][3170/3239]	Time 0.232 (0.524)	Data Time 0.002 (0.013)	Loss 2.2450 (2.3792)	Entropy 0.54542 (0.54603)	Top-1 acc 73.828 (66.708)	Top-5 acc 86.719 (85.774)	lr 0.00185
Train [99][3180/3239]	Time 0.267 (0.523)	Data Time 0.000 (0.013)	Loss 2.3712 (2.3793)	Entropy 0.54523 (0.54603)	Top-1 acc 63.281 (66.706)	Top-5 acc 84.766 (85.773)	lr 0.00185
Train [99][3190/3239]	Time 0.217 (0.523)	Data Time 0.000 (0.013)	Loss 2.5563 (2.3794)	Entropy 0.54497 (0.54603)	Top-1 acc 64.844 (66.706)	Top-5 acc 82.812 (85.771)	lr 0.00184
Train [99][3200/3239]	Time 0.224 (0.522)	Data Time 0.000 (0.013)	Loss 2.2240 (2.3794)	Entropy 0.54497 (0.54602)	Top-1 acc 70.703 (66.704)	Top-5 acc 89.453 (85.771)	lr 0.00184
Train [99][3210/3239]	Time 0.221 (0.522)	Data Time 0.000 (0.013)	Loss 2.3326 (2.3794)	Entropy 0.54520 (0.54602)	Top-1 acc 65.234 (66.702)	Top-5 acc 87.500 (85.770)	lr 0.00184
Train [99][3220/3239]	Time 0.218 (0.522)	Data Time 0.000 (0.013)	Loss 2.4534 (2.3795)	Entropy 0.54534 (0.54602)	Top-1 acc 62.891 (66.697)	Top-5 acc 84.375 (85.766)	lr 0.00184
Train [99][3230/3239]	Time 0.221 (0.521)	Data Time 0.000 (0.013)	Loss 2.4355 (2.3796)	Entropy 0.54549 (0.54601)	Top-1 acc 67.578 (66.697)	Top-5 acc 86.328 (85.764)	lr 0.00184
Train [99][3239/3239]	Time 0.782 (0.521)	Data Time 0.000 (0.013)	Loss 2.4543 (2.3796)	Entropy 0.54529 (0.54601)	Top-1 acc 65.432 (66.694)	Top-5 acc 85.185 (85.767)	lr 0.00184
==========Valid [99/120]	loss 1.196	top-1 acc 72.460 (72.460)	top-5 acc 90.252	Train top-1 66.694	top-5 85.767	Entropy 0.54529	Latency-None: 0.000ms	Flops: 539.00M
Train [100][0/3239]	Time 38.719 (38.719)	Data Time 36.736 (36.736)	Loss 2.5731 (2.5731)	Entropy 0.54541 (0.54541)	Top-1 acc 65.234 (65.234)	Top-5 acc 80.859 (80.859)	lr 0.00184
Train [100][10/3239]	Time 0.235 (4.058)	Data Time 0.001 (3.392)	Loss 2.3158 (2.3729)	Entropy 0.54533 (0.54537)	Top-1 acc 66.797 (65.945)	Top-5 acc 86.328 (86.577)	lr 0.00184
Train [100][20/3239]	Time 0.231 (2.321)	Data Time 0.001 (1.778)	Loss 2.3009 (2.3788)	Entropy 0.54531 (0.54536)	Top-1 acc 70.703 (66.704)	Top-5 acc 87.500 (86.031)	lr 0.00184
Train [100][30/3239]	Time 0.223 (1.701)	Data Time 0.001 (1.205)	Loss 2.2723 (2.3649)	Entropy 0.54536 (0.54538)	Top-1 acc 69.141 (67.074)	Top-5 acc 87.891 (86.278)	lr 0.00184
Train [100][40/3239]	Time 0.227 (1.383)	Data Time 0.001 (0.911)	Loss 2.4567 (2.3913)	Entropy 0.54537 (0.54538)	Top-1 acc 66.016 (66.463)	Top-5 acc 85.547 (85.985)	lr 0.00184
Train [100][50/3239]	Time 0.314 (1.191)	Data Time 0.001 (0.733)	Loss 2.3533 (2.3968)	Entropy 0.54567 (0.54541)	Top-1 acc 69.141 (66.498)	Top-5 acc 85.938 (85.846)	lr 0.00184
Train [100][60/3239]	Time 0.231 (1.062)	Data Time 0.001 (0.613)	Loss 2.3932 (2.3927)	Entropy 0.54544 (0.54544)	Top-1 acc 66.406 (66.560)	Top-5 acc 85.547 (85.912)	lr 0.00184
Train [100][70/3239]	Time 0.238 (0.970)	Data Time 0.001 (0.527)	Loss 2.2538 (2.3809)	Entropy 0.54544 (0.54544)	Top-1 acc 69.531 (66.912)	Top-5 acc 89.453 (85.965)	lr 0.00184
Train [100][80/3239]	Time 0.231 (0.901)	Data Time 0.001 (0.462)	Loss 2.2885 (2.3786)	Entropy 0.54532 (0.54543)	Top-1 acc 67.578 (66.898)	Top-5 acc 85.547 (85.918)	lr 0.00184
Train [100][90/3239]	Time 0.255 (0.848)	Data Time 0.002 (0.412)	Loss 2.4608 (2.3835)	Entropy 0.54538 (0.54543)	Top-1 acc 64.453 (66.883)	Top-5 acc 83.594 (85.852)	lr 0.00184
Train [100][100/3239]	Time 0.228 (0.806)	Data Time 0.001 (0.371)	Loss 2.2072 (2.3812)	Entropy 0.54517 (0.54541)	Top-1 acc 68.750 (66.986)	Top-5 acc 88.281 (85.872)	lr 0.00184
Train [100][110/3239]	Time 0.234 (0.769)	Data Time 0.001 (0.338)	Loss 2.4831 (2.3860)	Entropy 0.54513 (0.54538)	Top-1 acc 65.625 (66.952)	Top-5 acc 82.031 (85.807)	lr 0.00184
Train [100][120/3239]	Time 0.236 (0.739)	Data Time 0.001 (0.310)	Loss 2.4877 (2.3872)	Entropy 0.54479 (0.54534)	Top-1 acc 65.625 (66.884)	Top-5 acc 83.203 (85.805)	lr 0.00184
Train [100][130/3239]	Time 0.237 (0.713)	Data Time 0.001 (0.286)	Loss 2.2723 (2.3834)	Entropy 0.54448 (0.54529)	Top-1 acc 70.703 (66.994)	Top-5 acc 87.891 (85.827)	lr 0.00184
Train [100][140/3239]	Time 0.308 (0.691)	Data Time 0.001 (0.266)	Loss 2.3091 (2.3887)	Entropy 0.54438 (0.54523)	Top-1 acc 66.406 (66.794)	Top-5 acc 88.281 (85.721)	lr 0.00183
Train [100][150/3239]	Time 0.258 (0.673)	Data Time 0.002 (0.249)	Loss 2.1738 (2.3846)	Entropy 0.54446 (0.54517)	Top-1 acc 71.875 (66.908)	Top-5 acc 88.672 (85.775)	lr 0.00183
Train [100][160/3239]	Time 0.375 (0.990)	Data Time 0.006 (0.234)	Loss 2.2791 (2.3822)	Entropy 0.54431 (0.54513)	Top-1 acc 66.406 (66.957)	Top-5 acc 89.062 (85.855)	lr 0.00183
Train [100][170/3239]	Time 0.233 (0.963)	Data Time 0.002 (0.220)	Loss 2.5199 (2.3798)	Entropy 0.54431 (0.54508)	Top-1 acc 62.500 (66.991)	Top-5 acc 82.031 (85.894)	lr 0.00183
Train [100][180/3239]	Time 0.235 (0.933)	Data Time 0.001 (0.208)	Loss 2.3274 (2.3796)	Entropy 0.54415 (0.54504)	Top-1 acc 65.625 (66.924)	Top-5 acc 85.938 (85.905)	lr 0.00183
Train [100][190/3239]	Time 0.236 (0.905)	Data Time 0.001 (0.198)	Loss 2.3488 (2.3785)	Entropy 0.54427 (0.54500)	Top-1 acc 68.359 (67.010)	Top-5 acc 86.719 (85.880)	lr 0.00183
Train [100][200/3239]	Time 0.230 (0.881)	Data Time 0.001 (0.188)	Loss 2.3663 (2.3798)	Entropy 0.54435 (0.54496)	Top-1 acc 67.188 (67.028)	Top-5 acc 86.719 (85.819)	lr 0.00183
Train [100][210/3239]	Time 0.315 (0.858)	Data Time 0.001 (0.179)	Loss 2.7639 (2.3830)	Entropy 0.54433 (0.54493)	Top-1 acc 62.500 (66.986)	Top-5 acc 78.516 (85.756)	lr 0.00183
Train [100][220/3239]	Time 0.247 (0.838)	Data Time 0.001 (0.171)	Loss 2.6219 (2.3837)	Entropy 0.54409 (0.54490)	Top-1 acc 61.719 (66.982)	Top-5 acc 81.641 (85.708)	lr 0.00183
Train [100][230/3239]	Time 0.230 (0.820)	Data Time 0.001 (0.164)	Loss 2.2533 (2.3811)	Entropy 0.54408 (0.54487)	Top-1 acc 71.875 (67.042)	Top-5 acc 86.719 (85.770)	lr 0.00183
Train [100][240/3239]	Time 0.225 (0.803)	Data Time 0.001 (0.157)	Loss 2.3865 (2.3793)	Entropy 0.54419 (0.54484)	Top-1 acc 66.016 (67.095)	Top-5 acc 83.984 (85.771)	lr 0.00183
Train [100][250/3239]	Time 0.235 (0.787)	Data Time 0.001 (0.151)	Loss 2.3069 (2.3789)	Entropy 0.54416 (0.54481)	Top-1 acc 69.922 (67.128)	Top-5 acc 87.500 (85.774)	lr 0.00183
Train [100][260/3239]	Time 0.229 (0.772)	Data Time 0.001 (0.145)	Loss 2.2963 (2.3793)	Entropy 0.54397 (0.54478)	Top-1 acc 67.969 (67.063)	Top-5 acc 88.281 (85.782)	lr 0.00183
Train [100][270/3239]	Time 0.230 (0.759)	Data Time 0.001 (0.140)	Loss 2.2256 (2.3795)	Entropy 0.54409 (0.54476)	Top-1 acc 73.438 (67.077)	Top-5 acc 86.719 (85.795)	lr 0.00183
Train [100][280/3239]	Time 0.270 (0.747)	Data Time 0.001 (0.135)	Loss 2.4761 (2.3790)	Entropy 0.54442 (0.54474)	Top-1 acc 66.797 (67.100)	Top-5 acc 85.156 (85.796)	lr 0.00183
Train [100][290/3239]	Time 0.223 (0.735)	Data Time 0.001 (0.130)	Loss 2.4093 (2.3801)	Entropy 0.54446 (0.54473)	Top-1 acc 63.281 (67.063)	Top-5 acc 86.328 (85.786)	lr 0.00183
Train [100][300/3239]	Time 0.328 (0.725)	Data Time 0.001 (0.126)	Loss 2.4280 (2.3793)	Entropy 0.54453 (0.54472)	Top-1 acc 66.406 (67.056)	Top-5 acc 84.375 (85.784)	lr 0.00183
Train [100][310/3239]	Time 0.224 (0.715)	Data Time 0.001 (0.122)	Loss 2.2203 (2.3783)	Entropy 0.54463 (0.54471)	Top-1 acc 67.969 (67.047)	Top-5 acc 90.234 (85.811)	lr 0.00183
Train [100][320/3239]	Time 0.286 (0.708)	Data Time 0.001 (0.118)	Loss 2.2380 (2.3777)	Entropy 0.54464 (0.54471)	Top-1 acc 69.141 (67.079)	Top-5 acc 87.891 (85.794)	lr 0.00183
Train [100][330/3239]	Time 0.280 (0.704)	Data Time 0.001 (0.115)	Loss 2.2021 (2.3756)	Entropy 0.54423 (0.54470)	Top-1 acc 70.703 (67.111)	Top-5 acc 88.281 (85.836)	lr 0.00182
Train [100][340/3239]	Time 0.226 (0.697)	Data Time 0.001 (0.111)	Loss 2.4362 (2.3727)	Entropy 0.54425 (0.54468)	Top-1 acc 63.672 (67.158)	Top-5 acc 83.203 (85.889)	lr 0.00182
Train [100][350/3239]	Time 0.226 (0.689)	Data Time 0.001 (0.108)	Loss 2.3054 (2.3695)	Entropy 0.54413 (0.54467)	Top-1 acc 64.844 (67.230)	Top-5 acc 87.500 (85.942)	lr 0.00182
Train [100][360/3239]	Time 0.222 (0.681)	Data Time 0.001 (0.105)	Loss 2.3247 (2.3712)	Entropy 0.54403 (0.54465)	Top-1 acc 70.312 (67.167)	Top-5 acc 84.375 (85.894)	lr 0.00182
Train [100][370/3239]	Time 0.316 (0.674)	Data Time 0.001 (0.102)	Loss 2.4034 (2.3708)	Entropy 0.54431 (0.54464)	Top-1 acc 66.016 (67.162)	Top-5 acc 84.766 (85.902)	lr 0.00182
Train [100][380/3239]	Time 0.222 (0.667)	Data Time 0.001 (0.100)	Loss 2.3962 (2.3704)	Entropy 0.54430 (0.54463)	Top-1 acc 66.797 (67.169)	Top-5 acc 84.375 (85.914)	lr 0.00182
Train [100][390/3239]	Time 0.228 (0.660)	Data Time 0.001 (0.097)	Loss 2.0975 (2.3675)	Entropy 0.54426 (0.54462)	Top-1 acc 73.828 (67.257)	Top-5 acc 91.406 (85.967)	lr 0.00182
Train [100][400/3239]	Time 0.262 (0.655)	Data Time 0.001 (0.095)	Loss 2.3238 (2.3670)	Entropy 0.54409 (0.54461)	Top-1 acc 68.359 (67.286)	Top-5 acc 87.109 (85.992)	lr 0.00182
Train [100][410/3239]	Time 0.262 (0.649)	Data Time 0.001 (0.093)	Loss 2.3747 (2.3682)	Entropy 0.54417 (0.54460)	Top-1 acc 70.312 (67.308)	Top-5 acc 85.547 (85.979)	lr 0.00182
Train [100][420/3239]	Time 0.235 (0.643)	Data Time 0.001 (0.090)	Loss 2.2157 (2.3678)	Entropy 0.54418 (0.54459)	Top-1 acc 73.828 (67.321)	Top-5 acc 88.281 (85.987)	lr 0.00182
Train [100][430/3239]	Time 0.222 (0.638)	Data Time 0.001 (0.088)	Loss 2.5427 (2.3679)	Entropy 0.54398 (0.54458)	Top-1 acc 64.453 (67.315)	Top-5 acc 82.031 (85.985)	lr 0.00182
Train [100][440/3239]	Time 0.254 (0.633)	Data Time 0.001 (0.086)	Loss 2.2736 (2.3660)	Entropy 0.54359 (0.54456)	Top-1 acc 68.750 (67.377)	Top-5 acc 87.109 (86.029)	lr 0.00182
Train [100][450/3239]	Time 0.234 (0.628)	Data Time 0.001 (0.085)	Loss 2.3199 (2.3670)	Entropy 0.54352 (0.54454)	Top-1 acc 71.094 (67.355)	Top-5 acc 85.938 (86.006)	lr 0.00182
Train [100][460/3239]	Time 0.244 (0.623)	Data Time 0.001 (0.083)	Loss 2.3924 (2.3665)	Entropy 0.54357 (0.54452)	Top-1 acc 67.578 (67.370)	Top-5 acc 86.328 (86.019)	lr 0.00182
Train [100][470/3239]	Time 0.227 (0.619)	Data Time 0.001 (0.081)	Loss 2.5020 (2.3655)	Entropy 0.54386 (0.54450)	Top-1 acc 62.109 (67.398)	Top-5 acc 83.203 (86.028)	lr 0.00182
Train [100][480/3239]	Time 0.226 (0.614)	Data Time 0.001 (0.079)	Loss 2.5396 (2.3669)	Entropy 0.54406 (0.54449)	Top-1 acc 62.891 (67.360)	Top-5 acc 81.250 (85.998)	lr 0.00182
Train [100][490/3239]	Time 0.232 (0.610)	Data Time 0.001 (0.078)	Loss 2.3611 (2.3655)	Entropy 0.54379 (0.54447)	Top-1 acc 69.531 (67.382)	Top-5 acc 85.156 (86.030)	lr 0.00182
Train [100][500/3239]	Time 0.276 (0.608)	Data Time 0.001 (0.076)	Loss 2.3551 (2.3662)	Entropy 0.54394 (0.54446)	Top-1 acc 69.531 (67.364)	Top-5 acc 84.375 (86.014)	lr 0.00182
Train [100][510/3239]	Time 0.233 (0.605)	Data Time 0.001 (0.075)	Loss 2.2963 (2.3663)	Entropy 0.54340 (0.54445)	Top-1 acc 68.750 (67.338)	Top-5 acc 87.500 (86.022)	lr 0.00182
Train [100][520/3239]	Time 0.229 (0.601)	Data Time 0.001 (0.073)	Loss 2.6387 (2.3678)	Entropy 0.54346 (0.54443)	Top-1 acc 59.766 (67.310)	Top-5 acc 79.297 (85.993)	lr 0.00181
Train [100][530/3239]	Time 0.326 (0.597)	Data Time 0.001 (0.072)	Loss 2.5862 (2.3679)	Entropy 0.54337 (0.54441)	Top-1 acc 63.281 (67.310)	Top-5 acc 80.469 (85.993)	lr 0.00181
Train [100][540/3239]	Time 0.229 (0.594)	Data Time 0.001 (0.071)	Loss 2.5415 (2.3673)	Entropy 0.54347 (0.54439)	Top-1 acc 60.938 (67.328)	Top-5 acc 83.984 (86.004)	lr 0.00181
Train [100][550/3239]	Time 0.229 (0.590)	Data Time 0.001 (0.069)	Loss 2.4882 (2.3662)	Entropy 0.54333 (0.54437)	Top-1 acc 64.844 (67.363)	Top-5 acc 84.766 (86.035)	lr 0.00181
Train [100][560/3239]	Time 0.227 (0.587)	Data Time 0.001 (0.068)	Loss 2.2134 (2.3661)	Entropy 0.54342 (0.54436)	Top-1 acc 68.359 (67.371)	Top-5 acc 88.672 (86.031)	lr 0.00181
Train [100][570/3239]	Time 0.231 (0.583)	Data Time 0.001 (0.067)	Loss 2.4287 (2.3659)	Entropy 0.54358 (0.54434)	Top-1 acc 65.234 (67.376)	Top-5 acc 85.156 (86.039)	lr 0.00181
Train [100][580/3239]	Time 0.226 (0.580)	Data Time 0.001 (0.066)	Loss 2.2720 (2.3668)	Entropy 0.54395 (0.54433)	Top-1 acc 67.969 (67.352)	Top-5 acc 86.328 (86.017)	lr 0.00181
Train [100][590/3239]	Time 0.227 (0.577)	Data Time 0.001 (0.065)	Loss 2.3272 (2.3671)	Entropy 0.54405 (0.54432)	Top-1 acc 68.359 (67.357)	Top-5 acc 85.547 (86.009)	lr 0.00181
Train [100][600/3239]	Time 0.317 (0.574)	Data Time 0.001 (0.064)	Loss 2.4549 (2.3674)	Entropy 0.54411 (0.54432)	Top-1 acc 64.453 (67.340)	Top-5 acc 83.594 (85.996)	lr 0.00181
Train [100][610/3239]	Time 0.233 (0.572)	Data Time 0.001 (0.063)	Loss 2.3377 (2.3680)	Entropy 0.54391 (0.54432)	Top-1 acc 67.188 (67.326)	Top-5 acc 88.672 (86.002)	lr 0.00181
Train [100][620/3239]	Time 0.239 (0.569)	Data Time 0.001 (0.062)	Loss 2.5740 (2.3674)	Entropy 0.54398 (0.54431)	Top-1 acc 61.328 (67.336)	Top-5 acc 83.984 (86.017)	lr 0.00181
Train [100][630/3239]	Time 0.231 (0.567)	Data Time 0.001 (0.061)	Loss 2.3653 (2.3677)	Entropy 0.54421 (0.54431)	Top-1 acc 66.406 (67.309)	Top-5 acc 86.328 (86.010)	lr 0.00181
Train [100][640/3239]	Time 0.238 (0.565)	Data Time 0.001 (0.060)	Loss 2.2369 (2.3689)	Entropy 0.54432 (0.54430)	Top-1 acc 69.531 (67.286)	Top-5 acc 89.453 (85.997)	lr 0.00181
Train [100][650/3239]	Time 0.268 (0.562)	Data Time 0.001 (0.059)	Loss 2.4732 (2.3684)	Entropy 0.54412 (0.54430)	Top-1 acc 62.500 (67.276)	Top-5 acc 83.203 (86.001)	lr 0.00181
Train [100][660/3239]	Time 0.242 (0.560)	Data Time 0.001 (0.058)	Loss 2.6161 (2.3690)	Entropy 0.54442 (0.54430)	Top-1 acc 58.984 (67.262)	Top-5 acc 82.031 (85.989)	lr 0.00181
Train [100][670/3239]	Time 0.227 (0.558)	Data Time 0.001 (0.057)	Loss 2.4686 (2.3696)	Entropy 0.54422 (0.54430)	Top-1 acc 62.109 (67.236)	Top-5 acc 84.766 (85.980)	lr 0.00181
Train [100][680/3239]	Time 0.232 (0.555)	Data Time 0.001 (0.056)	Loss 2.4803 (2.3704)	Entropy 0.54416 (0.54430)	Top-1 acc 60.938 (67.208)	Top-5 acc 83.594 (85.970)	lr 0.00181
Train [100][690/3239]	Time 0.324 (0.553)	Data Time 0.001 (0.056)	Loss 2.4765 (2.3702)	Entropy 0.54411 (0.54430)	Top-1 acc 66.016 (67.216)	Top-5 acc 83.984 (85.967)	lr 0.00181
Train [100][700/3239]	Time 0.232 (0.551)	Data Time 0.001 (0.055)	Loss 2.2913 (2.3700)	Entropy 0.54430 (0.54430)	Top-1 acc 69.531 (67.214)	Top-5 acc 88.672 (85.973)	lr 0.00181
Train [100][710/3239]	Time 0.231 (0.549)	Data Time 0.001 (0.054)	Loss 2.3402 (2.3695)	Entropy 0.54447 (0.54430)	Top-1 acc 66.797 (67.216)	Top-5 acc 88.281 (85.991)	lr 0.00180
Train [100][720/3239]	Time 0.232 (0.547)	Data Time 0.001 (0.053)	Loss 2.3861 (2.3704)	Entropy 0.54448 (0.54430)	Top-1 acc 68.359 (67.197)	Top-5 acc 87.109 (85.977)	lr 0.00180
Train [100][730/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.053)	Loss 2.4093 (2.3699)	Entropy 0.54462 (0.54430)	Top-1 acc 66.016 (67.214)	Top-5 acc 85.938 (85.989)	lr 0.00180
Train [100][740/3239]	Time 0.235 (0.543)	Data Time 0.001 (0.052)	Loss 2.3258 (2.3701)	Entropy 0.54465 (0.54431)	Top-1 acc 71.094 (67.212)	Top-5 acc 84.375 (85.989)	lr 0.00180
Train [100][750/3239]	Time 0.231 (0.541)	Data Time 0.001 (0.051)	Loss 2.2317 (2.3696)	Entropy 0.54447 (0.54431)	Top-1 acc 72.656 (67.228)	Top-5 acc 88.281 (85.999)	lr 0.00180
Train [100][760/3239]	Time 0.333 (0.540)	Data Time 0.001 (0.051)	Loss 2.6403 (2.3701)	Entropy 0.54486 (0.54432)	Top-1 acc 61.719 (67.203)	Top-5 acc 81.250 (85.994)	lr 0.00180
Train [100][770/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.050)	Loss 2.1109 (2.3703)	Entropy 0.54433 (0.54432)	Top-1 acc 71.094 (67.184)	Top-5 acc 91.016 (85.994)	lr 0.00180
Train [100][780/3239]	Time 0.234 (0.536)	Data Time 0.001 (0.049)	Loss 2.0676 (2.3704)	Entropy 0.54390 (0.54432)	Top-1 acc 73.047 (67.181)	Top-5 acc 91.016 (85.999)	lr 0.00180
Train [100][790/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.049)	Loss 2.4210 (2.3704)	Entropy 0.54390 (0.54431)	Top-1 acc 68.750 (67.177)	Top-5 acc 83.594 (86.004)	lr 0.00180
Train [100][800/3239]	Time 0.237 (0.533)	Data Time 0.001 (0.048)	Loss 2.5041 (2.3715)	Entropy 0.54398 (0.54431)	Top-1 acc 65.234 (67.158)	Top-5 acc 82.031 (85.982)	lr 0.00180
Train [100][810/3239]	Time 0.227 (0.532)	Data Time 0.001 (0.048)	Loss 2.5926 (2.3725)	Entropy 0.54386 (0.54430)	Top-1 acc 57.422 (67.126)	Top-5 acc 82.422 (85.970)	lr 0.00180
Train [100][820/3239]	Time 0.253 (0.597)	Data Time 0.002 (0.047)	Loss 2.4296 (2.3725)	Entropy 0.54364 (0.54430)	Top-1 acc 63.672 (67.107)	Top-5 acc 85.156 (85.971)	lr 0.00180
Train [100][830/3239]	Time 0.226 (0.595)	Data Time 0.002 (0.047)	Loss 2.3131 (2.3736)	Entropy 0.54366 (0.54429)	Top-1 acc 66.406 (67.077)	Top-5 acc 88.281 (85.951)	lr 0.00180
Train [100][840/3239]	Time 0.261 (0.593)	Data Time 0.001 (0.046)	Loss 2.3481 (2.3736)	Entropy 0.54351 (0.54428)	Top-1 acc 65.234 (67.064)	Top-5 acc 88.281 (85.945)	lr 0.00180
Train [100][850/3239]	Time 0.328 (0.591)	Data Time 0.001 (0.046)	Loss 2.1837 (2.3739)	Entropy 0.54379 (0.54427)	Top-1 acc 70.312 (67.059)	Top-5 acc 89.844 (85.949)	lr 0.00180
Train [100][860/3239]	Time 0.262 (0.589)	Data Time 0.001 (0.045)	Loss 2.5124 (2.3737)	Entropy 0.54359 (0.54427)	Top-1 acc 66.016 (67.068)	Top-5 acc 84.766 (85.962)	lr 0.00180
Train [100][870/3239]	Time 0.286 (0.587)	Data Time 0.001 (0.045)	Loss 2.4214 (2.3735)	Entropy 0.54349 (0.54426)	Top-1 acc 66.797 (67.066)	Top-5 acc 83.984 (85.964)	lr 0.00180
Train [100][880/3239]	Time 0.231 (0.586)	Data Time 0.001 (0.044)	Loss 2.2415 (2.3731)	Entropy 0.54349 (0.54425)	Top-1 acc 69.531 (67.073)	Top-5 acc 87.109 (85.969)	lr 0.00180
Train [100][890/3239]	Time 0.252 (0.584)	Data Time 0.001 (0.044)	Loss 2.4031 (2.3731)	Entropy 0.54368 (0.54424)	Top-1 acc 63.672 (67.091)	Top-5 acc 85.156 (85.968)	lr 0.00180
Train [100][900/3239]	Time 0.235 (0.582)	Data Time 0.001 (0.043)	Loss 2.3622 (2.3728)	Entropy 0.54402 (0.54424)	Top-1 acc 65.234 (67.101)	Top-5 acc 86.719 (85.972)	lr 0.00179
Train [100][910/3239]	Time 0.231 (0.580)	Data Time 0.001 (0.043)	Loss 2.1456 (2.3732)	Entropy 0.54388 (0.54424)	Top-1 acc 69.922 (67.090)	Top-5 acc 90.625 (85.965)	lr 0.00179
Train [100][920/3239]	Time 0.319 (0.578)	Data Time 0.001 (0.042)	Loss 2.4782 (2.3732)	Entropy 0.54399 (0.54423)	Top-1 acc 64.844 (67.090)	Top-5 acc 83.594 (85.969)	lr 0.00179
Train [100][930/3239]	Time 0.226 (0.576)	Data Time 0.001 (0.042)	Loss 2.2768 (2.3732)	Entropy 0.54393 (0.54423)	Top-1 acc 67.188 (67.088)	Top-5 acc 87.891 (85.966)	lr 0.00179
Train [100][940/3239]	Time 0.257 (0.575)	Data Time 0.001 (0.041)	Loss 2.4394 (2.3738)	Entropy 0.54408 (0.54423)	Top-1 acc 65.234 (67.066)	Top-5 acc 85.547 (85.952)	lr 0.00179
Train [100][950/3239]	Time 0.232 (0.573)	Data Time 0.001 (0.041)	Loss 2.4085 (2.3732)	Entropy 0.54412 (0.54422)	Top-1 acc 64.453 (67.078)	Top-5 acc 83.984 (85.960)	lr 0.00179
Train [100][960/3239]	Time 0.230 (0.571)	Data Time 0.001 (0.041)	Loss 2.3139 (2.3733)	Entropy 0.54441 (0.54422)	Top-1 acc 69.141 (67.074)	Top-5 acc 87.109 (85.956)	lr 0.00179
Train [100][970/3239]	Time 0.223 (0.570)	Data Time 0.001 (0.040)	Loss 2.2197 (2.3734)	Entropy 0.54433 (0.54423)	Top-1 acc 71.875 (67.070)	Top-5 acc 88.281 (85.953)	lr 0.00179
Train [100][980/3239]	Time 0.228 (0.568)	Data Time 0.001 (0.040)	Loss 2.2682 (2.3740)	Entropy 0.54441 (0.54423)	Top-1 acc 71.484 (67.049)	Top-5 acc 88.672 (85.949)	lr 0.00179
Train [100][990/3239]	Time 0.222 (0.567)	Data Time 0.001 (0.039)	Loss 2.3516 (2.3746)	Entropy 0.54432 (0.54423)	Top-1 acc 65.625 (67.029)	Top-5 acc 85.547 (85.938)	lr 0.00179
Train [100][1000/3239]	Time 0.264 (0.565)	Data Time 0.001 (0.039)	Loss 2.4650 (2.3746)	Entropy 0.54356 (0.54423)	Top-1 acc 66.016 (67.019)	Top-5 acc 83.203 (85.935)	lr 0.00179
Train [100][1010/3239]	Time 0.235 (0.564)	Data Time 0.001 (0.039)	Loss 2.3405 (2.3744)	Entropy 0.54349 (0.54422)	Top-1 acc 65.234 (67.014)	Top-5 acc 86.719 (85.941)	lr 0.00179
Train [100][1020/3239]	Time 0.224 (0.562)	Data Time 0.001 (0.038)	Loss 2.2834 (2.3742)	Entropy 0.54358 (0.54421)	Top-1 acc 69.531 (67.025)	Top-5 acc 86.719 (85.944)	lr 0.00179
Train [100][1030/3239]	Time 0.231 (0.561)	Data Time 0.001 (0.038)	Loss 2.5425 (2.3746)	Entropy 0.54365 (0.54421)	Top-1 acc 63.672 (67.015)	Top-5 acc 83.203 (85.939)	lr 0.00179
Train [100][1040/3239]	Time 0.314 (0.560)	Data Time 0.001 (0.038)	Loss 2.6708 (2.3746)	Entropy 0.54387 (0.54420)	Top-1 acc 58.203 (67.006)	Top-5 acc 80.469 (85.937)	lr 0.00179
Train [100][1050/3239]	Time 0.233 (0.558)	Data Time 0.001 (0.037)	Loss 2.2294 (2.3743)	Entropy 0.54387 (0.54420)	Top-1 acc 69.922 (67.013)	Top-5 acc 87.891 (85.945)	lr 0.00179
Train [100][1060/3239]	Time 0.234 (0.557)	Data Time 0.001 (0.037)	Loss 2.2470 (2.3741)	Entropy 0.54412 (0.54420)	Top-1 acc 69.922 (67.007)	Top-5 acc 88.281 (85.944)	lr 0.00179
Train [100][1070/3239]	Time 0.232 (0.556)	Data Time 0.001 (0.037)	Loss 2.4014 (2.3740)	Entropy 0.54417 (0.54420)	Top-1 acc 65.625 (67.018)	Top-5 acc 86.328 (85.952)	lr 0.00179
Train [100][1080/3239]	Time 0.323 (0.555)	Data Time 0.001 (0.036)	Loss 2.1288 (2.3741)	Entropy 0.54444 (0.54420)	Top-1 acc 72.266 (67.016)	Top-5 acc 89.453 (85.948)	lr 0.00179
Train [100][1090/3239]	Time 0.223 (0.553)	Data Time 0.001 (0.036)	Loss 2.5501 (2.3739)	Entropy 0.54473 (0.54420)	Top-1 acc 60.156 (67.009)	Top-5 acc 85.156 (85.956)	lr 0.00178
Train [100][1100/3239]	Time 0.225 (0.552)	Data Time 0.001 (0.036)	Loss 2.5241 (2.3736)	Entropy 0.54493 (0.54421)	Top-1 acc 61.719 (67.018)	Top-5 acc 84.375 (85.966)	lr 0.00178
Train [100][1110/3239]	Time 0.239 (0.551)	Data Time 0.001 (0.035)	Loss 2.3098 (2.3738)	Entropy 0.54493 (0.54421)	Top-1 acc 67.969 (67.020)	Top-5 acc 86.719 (85.962)	lr 0.00178
Train [100][1120/3239]	Time 0.234 (0.550)	Data Time 0.001 (0.035)	Loss 2.3381 (2.3734)	Entropy 0.54475 (0.54422)	Top-1 acc 65.234 (67.025)	Top-5 acc 85.938 (85.969)	lr 0.00178
Train [100][1130/3239]	Time 0.221 (0.548)	Data Time 0.001 (0.035)	Loss 2.2714 (2.3732)	Entropy 0.54432 (0.54422)	Top-1 acc 71.875 (67.036)	Top-5 acc 88.281 (85.976)	lr 0.00178
Train [100][1140/3239]	Time 0.235 (0.547)	Data Time 0.001 (0.034)	Loss 2.5182 (2.3738)	Entropy 0.54423 (0.54422)	Top-1 acc 60.938 (67.015)	Top-5 acc 80.859 (85.963)	lr 0.00178
Train [100][1150/3239]	Time 0.328 (0.546)	Data Time 0.001 (0.034)	Loss 2.3450 (2.3732)	Entropy 0.54410 (0.54422)	Top-1 acc 67.188 (67.029)	Top-5 acc 86.328 (85.968)	lr 0.00178
Train [100][1160/3239]	Time 0.233 (0.545)	Data Time 0.001 (0.034)	Loss 2.0939 (2.3732)	Entropy 0.54407 (0.54422)	Top-1 acc 71.875 (67.025)	Top-5 acc 92.188 (85.969)	lr 0.00178
Train [100][1170/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.034)	Loss 2.3701 (2.3731)	Entropy 0.54389 (0.54422)	Top-1 acc 66.016 (67.025)	Top-5 acc 83.203 (85.967)	lr 0.00178
Train [100][1180/3239]	Time 0.232 (0.543)	Data Time 0.001 (0.033)	Loss 2.4438 (2.3731)	Entropy 0.54370 (0.54422)	Top-1 acc 63.672 (67.032)	Top-5 acc 83.594 (85.959)	lr 0.00178
Train [100][1190/3239]	Time 0.232 (0.541)	Data Time 0.001 (0.033)	Loss 2.4544 (2.3734)	Entropy 0.54359 (0.54421)	Top-1 acc 64.844 (67.027)	Top-5 acc 85.547 (85.955)	lr 0.00178
Train [100][1200/3239]	Time 0.239 (0.540)	Data Time 0.001 (0.033)	Loss 2.3352 (2.3739)	Entropy 0.54374 (0.54421)	Top-1 acc 66.406 (67.014)	Top-5 acc 86.328 (85.942)	lr 0.00178
Train [100][1210/3239]	Time 0.245 (0.539)	Data Time 0.001 (0.033)	Loss 2.2164 (2.3737)	Entropy 0.54316 (0.54420)	Top-1 acc 73.047 (67.014)	Top-5 acc 85.156 (85.943)	lr 0.00178
Train [100][1220/3239]	Time 0.234 (0.538)	Data Time 0.001 (0.032)	Loss 2.3494 (2.3736)	Entropy 0.54301 (0.54419)	Top-1 acc 71.484 (67.021)	Top-5 acc 82.422 (85.945)	lr 0.00178
Train [100][1230/3239]	Time 0.235 (0.537)	Data Time 0.001 (0.032)	Loss 2.2798 (2.3737)	Entropy 0.54300 (0.54418)	Top-1 acc 68.359 (67.019)	Top-5 acc 89.062 (85.942)	lr 0.00178
Train [100][1240/3239]	Time 0.317 (0.536)	Data Time 0.001 (0.032)	Loss 2.7876 (2.3738)	Entropy 0.54331 (0.54417)	Top-1 acc 57.422 (67.012)	Top-5 acc 78.516 (85.944)	lr 0.00178
Train [100][1250/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.032)	Loss 2.3447 (2.3734)	Entropy 0.54318 (0.54417)	Top-1 acc 67.578 (67.012)	Top-5 acc 85.156 (85.951)	lr 0.00178
Train [100][1260/3239]	Time 0.231 (0.534)	Data Time 0.001 (0.031)	Loss 2.2571 (2.3734)	Entropy 0.54322 (0.54416)	Top-1 acc 71.875 (67.014)	Top-5 acc 85.938 (85.953)	lr 0.00178
Train [100][1270/3239]	Time 0.231 (0.533)	Data Time 0.001 (0.031)	Loss 2.2624 (2.3732)	Entropy 0.54320 (0.54415)	Top-1 acc 69.922 (67.024)	Top-5 acc 85.938 (85.950)	lr 0.00178
Train [100][1280/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.031)	Loss 2.3622 (2.3732)	Entropy 0.54319 (0.54414)	Top-1 acc 64.062 (67.020)	Top-5 acc 85.156 (85.946)	lr 0.00178
Train [100][1290/3239]	Time 0.230 (0.531)	Data Time 0.001 (0.031)	Loss 2.2526 (2.3733)	Entropy 0.54321 (0.54414)	Top-1 acc 71.484 (67.014)	Top-5 acc 87.891 (85.945)	lr 0.00177
Train [100][1300/3239]	Time 0.224 (0.530)	Data Time 0.001 (0.030)	Loss 2.3249 (2.3732)	Entropy 0.54289 (0.54413)	Top-1 acc 72.266 (67.024)	Top-5 acc 87.109 (85.946)	lr 0.00177
Train [100][1310/3239]	Time 0.325 (0.529)	Data Time 0.001 (0.030)	Loss 2.4383 (2.3734)	Entropy 0.54304 (0.54412)	Top-1 acc 66.406 (67.023)	Top-5 acc 83.594 (85.942)	lr 0.00177
Train [100][1320/3239]	Time 0.234 (0.528)	Data Time 0.001 (0.030)	Loss 2.4451 (2.3734)	Entropy 0.54319 (0.54411)	Top-1 acc 63.281 (67.015)	Top-5 acc 88.281 (85.942)	lr 0.00177
Train [100][1330/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.030)	Loss 2.3905 (2.3734)	Entropy 0.54292 (0.54410)	Top-1 acc 66.406 (67.007)	Top-5 acc 84.766 (85.944)	lr 0.00177
Train [100][1340/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.030)	Loss 2.3253 (2.3733)	Entropy 0.54280 (0.54410)	Top-1 acc 67.188 (67.010)	Top-5 acc 87.500 (85.948)	lr 0.00177
Train [100][1350/3239]	Time 0.230 (0.525)	Data Time 0.001 (0.029)	Loss 2.6317 (2.3741)	Entropy 0.54308 (0.54409)	Top-1 acc 60.156 (66.980)	Top-5 acc 81.250 (85.931)	lr 0.00177
Train [100][1360/3239]	Time 0.303 (0.525)	Data Time 0.001 (0.029)	Loss 2.4512 (2.3741)	Entropy 0.54278 (0.54408)	Top-1 acc 64.844 (66.986)	Top-5 acc 84.375 (85.927)	lr 0.00177
Train [100][1370/3239]	Time 0.258 (0.525)	Data Time 0.001 (0.029)	Loss 2.4992 (2.3742)	Entropy 0.54281 (0.54407)	Top-1 acc 62.500 (66.985)	Top-5 acc 85.547 (85.927)	lr 0.00177
Train [100][1380/3239]	Time 0.230 (0.524)	Data Time 0.001 (0.029)	Loss 2.2010 (2.3736)	Entropy 0.54254 (0.54406)	Top-1 acc 68.359 (66.995)	Top-5 acc 88.281 (85.936)	lr 0.00177
Train [100][1390/3239]	Time 0.224 (0.523)	Data Time 0.001 (0.029)	Loss 2.4183 (2.3739)	Entropy 0.54232 (0.54405)	Top-1 acc 66.016 (66.984)	Top-5 acc 83.984 (85.928)	lr 0.00177
Train [100][1400/3239]	Time 0.246 (0.522)	Data Time 0.001 (0.028)	Loss 2.3890 (2.3736)	Entropy 0.54202 (0.54403)	Top-1 acc 66.406 (66.991)	Top-5 acc 89.844 (85.937)	lr 0.00177
Train [100][1410/3239]	Time 0.231 (0.521)	Data Time 0.001 (0.028)	Loss 2.3647 (2.3737)	Entropy 0.54187 (0.54402)	Top-1 acc 66.797 (66.985)	Top-5 acc 85.156 (85.932)	lr 0.00177
Train [100][1420/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.028)	Loss 2.2864 (2.3737)	Entropy 0.54191 (0.54400)	Top-1 acc 70.312 (66.984)	Top-5 acc 87.500 (85.932)	lr 0.00177
Train [100][1430/3239]	Time 0.238 (0.520)	Data Time 0.001 (0.028)	Loss 2.3291 (2.3738)	Entropy 0.54187 (0.54399)	Top-1 acc 67.969 (66.982)	Top-5 acc 86.719 (85.928)	lr 0.00177
Train [100][1440/3239]	Time 0.239 (0.519)	Data Time 0.001 (0.028)	Loss 2.3631 (2.3738)	Entropy 0.54204 (0.54397)	Top-1 acc 67.578 (66.979)	Top-5 acc 87.109 (85.932)	lr 0.00177
Train [100][1450/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.027)	Loss 2.3662 (2.3736)	Entropy 0.54190 (0.54396)	Top-1 acc 68.359 (66.983)	Top-5 acc 87.500 (85.936)	lr 0.00177
Train [100][1460/3239]	Time 0.225 (0.517)	Data Time 0.001 (0.027)	Loss 2.2653 (2.3735)	Entropy 0.54203 (0.54395)	Top-1 acc 69.531 (66.982)	Top-5 acc 86.719 (85.941)	lr 0.00177
Train [100][1470/3239]	Time 0.506 (0.552)	Data Time 0.006 (0.027)	Loss 2.2728 (2.3733)	Entropy 0.54222 (0.54394)	Top-1 acc 68.750 (66.984)	Top-5 acc 85.156 (85.945)	lr 0.00177
Train [100][1480/3239]	Time 0.239 (0.552)	Data Time 0.002 (0.027)	Loss 2.4400 (2.3737)	Entropy 0.54233 (0.54392)	Top-1 acc 66.016 (66.979)	Top-5 acc 82.812 (85.934)	lr 0.00176
Train [100][1490/3239]	Time 0.232 (0.551)	Data Time 0.001 (0.027)	Loss 2.1980 (2.3732)	Entropy 0.54243 (0.54391)	Top-1 acc 74.609 (66.989)	Top-5 acc 86.719 (85.944)	lr 0.00176
Train [100][1500/3239]	Time 0.240 (0.550)	Data Time 0.001 (0.027)	Loss 2.3892 (2.3736)	Entropy 0.54255 (0.54390)	Top-1 acc 66.406 (66.976)	Top-5 acc 85.547 (85.936)	lr 0.00176
Train [100][1510/3239]	Time 0.238 (0.549)	Data Time 0.001 (0.026)	Loss 2.3235 (2.3735)	Entropy 0.54242 (0.54390)	Top-1 acc 69.922 (66.980)	Top-5 acc 87.500 (85.940)	lr 0.00176
Train [100][1520/3239]	Time 0.229 (0.548)	Data Time 0.001 (0.026)	Loss 2.6643 (2.3737)	Entropy 0.54220 (0.54389)	Top-1 acc 61.328 (66.977)	Top-5 acc 77.344 (85.941)	lr 0.00176
Train [100][1530/3239]	Time 0.236 (0.548)	Data Time 0.001 (0.026)	Loss 2.4624 (2.3735)	Entropy 0.54197 (0.54387)	Top-1 acc 66.016 (66.990)	Top-5 acc 80.469 (85.940)	lr 0.00176
Train [100][1540/3239]	Time 0.240 (0.547)	Data Time 0.001 (0.026)	Loss 2.3862 (2.3738)	Entropy 0.54175 (0.54386)	Top-1 acc 65.625 (66.977)	Top-5 acc 85.156 (85.937)	lr 0.00176
Train [100][1550/3239]	Time 0.234 (0.546)	Data Time 0.001 (0.026)	Loss 2.3501 (2.3739)	Entropy 0.54191 (0.54385)	Top-1 acc 66.797 (66.972)	Top-5 acc 86.719 (85.933)	lr 0.00176
Train [100][1560/3239]	Time 0.283 (0.545)	Data Time 0.002 (0.026)	Loss 2.2508 (2.3735)	Entropy 0.54200 (0.54384)	Top-1 acc 68.750 (66.982)	Top-5 acc 89.844 (85.944)	lr 0.00176
Train [100][1570/3239]	Time 0.238 (0.545)	Data Time 0.001 (0.025)	Loss 2.4295 (2.3737)	Entropy 0.54175 (0.54382)	Top-1 acc 64.453 (66.982)	Top-5 acc 85.547 (85.936)	lr 0.00176
Train [100][1580/3239]	Time 0.233 (0.544)	Data Time 0.001 (0.025)	Loss 2.3072 (2.3738)	Entropy 0.54174 (0.54381)	Top-1 acc 66.797 (66.980)	Top-5 acc 86.328 (85.934)	lr 0.00176
Train [100][1590/3239]	Time 0.229 (0.543)	Data Time 0.001 (0.025)	Loss 2.2831 (2.3738)	Entropy 0.54183 (0.54380)	Top-1 acc 68.750 (66.973)	Top-5 acc 86.328 (85.937)	lr 0.00176
Train [100][1600/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.025)	Loss 2.3235 (2.3737)	Entropy 0.54188 (0.54379)	Top-1 acc 66.406 (66.970)	Top-5 acc 86.719 (85.937)	lr 0.00176
Train [100][1610/3239]	Time 0.232 (0.542)	Data Time 0.001 (0.025)	Loss 2.3790 (2.3734)	Entropy 0.54179 (0.54377)	Top-1 acc 65.625 (66.980)	Top-5 acc 86.328 (85.946)	lr 0.00176
Train [100][1620/3239]	Time 0.244 (0.541)	Data Time 0.001 (0.025)	Loss 2.4133 (2.3738)	Entropy 0.54167 (0.54376)	Top-1 acc 69.141 (66.965)	Top-5 acc 83.984 (85.940)	lr 0.00176
Train [100][1630/3239]	Time 0.336 (0.540)	Data Time 0.001 (0.025)	Loss 2.1633 (2.3740)	Entropy 0.54154 (0.54375)	Top-1 acc 70.703 (66.956)	Top-5 acc 89.844 (85.940)	lr 0.00176
Train [100][1640/3239]	Time 0.224 (0.539)	Data Time 0.001 (0.024)	Loss 2.6570 (2.3741)	Entropy 0.54169 (0.54373)	Top-1 acc 59.766 (66.952)	Top-5 acc 80.859 (85.937)	lr 0.00176
Train [100][1650/3239]	Time 0.244 (0.539)	Data Time 0.001 (0.024)	Loss 2.4378 (2.3742)	Entropy 0.54190 (0.54372)	Top-1 acc 64.062 (66.952)	Top-5 acc 84.375 (85.932)	lr 0.00176
Train [100][1660/3239]	Time 0.227 (0.538)	Data Time 0.001 (0.024)	Loss 2.5429 (2.3738)	Entropy 0.54207 (0.54371)	Top-1 acc 61.719 (66.960)	Top-5 acc 82.812 (85.938)	lr 0.00176
Train [100][1670/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.024)	Loss 2.3969 (2.3736)	Entropy 0.54231 (0.54370)	Top-1 acc 66.406 (66.963)	Top-5 acc 86.719 (85.940)	lr 0.00175
Train [100][1680/3239]	Time 0.265 (0.536)	Data Time 0.002 (0.024)	Loss 2.5566 (2.3736)	Entropy 0.54247 (0.54369)	Top-1 acc 63.672 (66.969)	Top-5 acc 81.250 (85.939)	lr 0.00175
Train [100][1690/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.024)	Loss 2.4432 (2.3737)	Entropy 0.54264 (0.54369)	Top-1 acc 62.500 (66.952)	Top-5 acc 85.938 (85.942)	lr 0.00175
Train [100][1700/3239]	Time 0.325 (0.535)	Data Time 0.001 (0.024)	Loss 2.4528 (2.3736)	Entropy 0.54236 (0.54368)	Top-1 acc 65.625 (66.962)	Top-5 acc 83.594 (85.943)	lr 0.00175
Train [100][1710/3239]	Time 0.226 (0.534)	Data Time 0.001 (0.023)	Loss 2.7041 (2.3736)	Entropy 0.54245 (0.54367)	Top-1 acc 62.500 (66.959)	Top-5 acc 80.078 (85.946)	lr 0.00175
Train [100][1720/3239]	Time 0.235 (0.534)	Data Time 0.001 (0.023)	Loss 2.2781 (2.3741)	Entropy 0.54231 (0.54367)	Top-1 acc 66.797 (66.947)	Top-5 acc 87.891 (85.940)	lr 0.00175
Train [100][1730/3239]	Time 0.224 (0.533)	Data Time 0.001 (0.023)	Loss 2.4324 (2.3745)	Entropy 0.54187 (0.54366)	Top-1 acc 67.188 (66.941)	Top-5 acc 85.547 (85.936)	lr 0.00175
Train [100][1740/3239]	Time 0.229 (0.532)	Data Time 0.001 (0.023)	Loss 2.3769 (2.3747)	Entropy 0.54209 (0.54365)	Top-1 acc 67.578 (66.932)	Top-5 acc 83.984 (85.931)	lr 0.00175
Train [100][1750/3239]	Time 0.228 (0.531)	Data Time 0.001 (0.023)	Loss 2.2564 (2.3749)	Entropy 0.54206 (0.54364)	Top-1 acc 67.188 (66.926)	Top-5 acc 87.500 (85.927)	lr 0.00175
Train [100][1760/3239]	Time 0.228 (0.531)	Data Time 0.001 (0.023)	Loss 2.3881 (2.3747)	Entropy 0.54228 (0.54363)	Top-1 acc 64.844 (66.927)	Top-5 acc 85.938 (85.930)	lr 0.00175
Train [100][1770/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.023)	Loss 2.1617 (2.3744)	Entropy 0.54229 (0.54362)	Top-1 acc 70.703 (66.927)	Top-5 acc 90.234 (85.935)	lr 0.00175
Train [100][1780/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.023)	Loss 2.4194 (2.3746)	Entropy 0.54181 (0.54361)	Top-1 acc 64.062 (66.915)	Top-5 acc 87.500 (85.935)	lr 0.00175
Train [100][1790/3239]	Time 0.333 (0.529)	Data Time 0.001 (0.022)	Loss 2.4458 (2.3750)	Entropy 0.54194 (0.54360)	Top-1 acc 65.234 (66.903)	Top-5 acc 83.594 (85.929)	lr 0.00175
Train [100][1800/3239]	Time 0.277 (0.528)	Data Time 0.002 (0.022)	Loss 2.2223 (2.3748)	Entropy 0.54177 (0.54359)	Top-1 acc 72.656 (66.911)	Top-5 acc 87.109 (85.931)	lr 0.00175
Train [100][1810/3239]	Time 0.281 (0.528)	Data Time 0.002 (0.022)	Loss 2.4056 (2.3746)	Entropy 0.54130 (0.54358)	Top-1 acc 64.062 (66.913)	Top-5 acc 85.156 (85.933)	lr 0.00175
Train [100][1820/3239]	Time 0.278 (0.528)	Data Time 0.002 (0.022)	Loss 2.2672 (2.3745)	Entropy 0.54129 (0.54357)	Top-1 acc 67.188 (66.911)	Top-5 acc 85.547 (85.935)	lr 0.00175
Train [100][1830/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.022)	Loss 2.3920 (2.3743)	Entropy 0.54142 (0.54356)	Top-1 acc 65.234 (66.918)	Top-5 acc 84.766 (85.937)	lr 0.00175
Train [100][1840/3239]	Time 0.256 (0.527)	Data Time 0.001 (0.022)	Loss 2.4654 (2.3744)	Entropy 0.54156 (0.54355)	Top-1 acc 62.891 (66.913)	Top-5 acc 83.984 (85.936)	lr 0.00175
Train [100][1850/3239]	Time 0.224 (0.526)	Data Time 0.001 (0.022)	Loss 2.4550 (2.3744)	Entropy 0.54185 (0.54354)	Top-1 acc 62.500 (66.909)	Top-5 acc 82.422 (85.933)	lr 0.00175
Train [100][1860/3239]	Time 0.322 (0.526)	Data Time 0.001 (0.022)	Loss 2.4359 (2.3749)	Entropy 0.54155 (0.54353)	Top-1 acc 66.797 (66.897)	Top-5 acc 82.422 (85.926)	lr 0.00175
Train [100][1870/3239]	Time 0.267 (0.525)	Data Time 0.002 (0.022)	Loss 2.2512 (2.3747)	Entropy 0.54174 (0.54352)	Top-1 acc 71.484 (66.898)	Top-5 acc 87.109 (85.929)	lr 0.00174
Train [100][1880/3239]	Time 0.225 (0.525)	Data Time 0.001 (0.021)	Loss 2.4176 (2.3749)	Entropy 0.54186 (0.54351)	Top-1 acc 66.406 (66.895)	Top-5 acc 82.031 (85.925)	lr 0.00174
Train [100][1890/3239]	Time 0.230 (0.524)	Data Time 0.001 (0.021)	Loss 2.2680 (2.3750)	Entropy 0.54218 (0.54350)	Top-1 acc 69.922 (66.899)	Top-5 acc 86.328 (85.923)	lr 0.00174
Train [100][1900/3239]	Time 0.231 (0.523)	Data Time 0.001 (0.021)	Loss 2.3634 (2.3752)	Entropy 0.54227 (0.54349)	Top-1 acc 69.141 (66.898)	Top-5 acc 84.766 (85.922)	lr 0.00174
Train [100][1910/3239]	Time 0.279 (0.523)	Data Time 0.001 (0.021)	Loss 2.4575 (2.3755)	Entropy 0.54239 (0.54349)	Top-1 acc 64.453 (66.888)	Top-5 acc 83.984 (85.917)	lr 0.00174
Train [100][1920/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.021)	Loss 2.4876 (2.3759)	Entropy 0.54246 (0.54348)	Top-1 acc 62.891 (66.880)	Top-5 acc 83.594 (85.912)	lr 0.00174
Train [100][1930/3239]	Time 0.234 (0.522)	Data Time 0.001 (0.021)	Loss 2.4765 (2.3757)	Entropy 0.54256 (0.54348)	Top-1 acc 62.891 (66.885)	Top-5 acc 82.812 (85.917)	lr 0.00174
Train [100][1940/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.021)	Loss 2.4566 (2.3757)	Entropy 0.54244 (0.54347)	Top-1 acc 66.016 (66.886)	Top-5 acc 83.594 (85.915)	lr 0.00174
Train [100][1950/3239]	Time 0.248 (0.521)	Data Time 0.001 (0.021)	Loss 2.3771 (2.3755)	Entropy 0.54253 (0.54347)	Top-1 acc 65.625 (66.890)	Top-5 acc 84.766 (85.917)	lr 0.00174
Train [100][1960/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.021)	Loss 2.3569 (2.3758)	Entropy 0.54249 (0.54346)	Top-1 acc 68.359 (66.884)	Top-5 acc 86.328 (85.911)	lr 0.00174
Train [100][1970/3239]	Time 0.248 (0.520)	Data Time 0.001 (0.021)	Loss 2.3089 (2.3758)	Entropy 0.54276 (0.54346)	Top-1 acc 69.141 (66.886)	Top-5 acc 85.156 (85.911)	lr 0.00174
Train [100][1980/3239]	Time 0.279 (0.519)	Data Time 0.001 (0.020)	Loss 2.5601 (2.3756)	Entropy 0.54265 (0.54345)	Top-1 acc 62.891 (66.889)	Top-5 acc 86.719 (85.916)	lr 0.00174
Train [100][1990/3239]	Time 0.242 (0.518)	Data Time 0.001 (0.020)	Loss 2.3555 (2.3756)	Entropy 0.54275 (0.54345)	Top-1 acc 70.312 (66.890)	Top-5 acc 86.719 (85.915)	lr 0.00174
Train [100][2000/3239]	Time 0.271 (0.519)	Data Time 0.001 (0.020)	Loss 2.2241 (2.3757)	Entropy 0.54271 (0.54344)	Top-1 acc 74.609 (66.890)	Top-5 acc 87.891 (85.912)	lr 0.00174
Train [100][2010/3239]	Time 0.230 (0.518)	Data Time 0.001 (0.020)	Loss 2.2507 (2.3756)	Entropy 0.54282 (0.54344)	Top-1 acc 69.141 (66.892)	Top-5 acc 90.234 (85.914)	lr 0.00174
Train [100][2020/3239]	Time 0.325 (0.517)	Data Time 0.001 (0.020)	Loss 2.3760 (2.3755)	Entropy 0.54244 (0.54344)	Top-1 acc 66.016 (66.893)	Top-5 acc 83.984 (85.913)	lr 0.00174
Train [100][2030/3239]	Time 0.231 (0.517)	Data Time 0.001 (0.020)	Loss 2.6353 (2.3754)	Entropy 0.54258 (0.54343)	Top-1 acc 58.594 (66.889)	Top-5 acc 80.859 (85.914)	lr 0.00174
Train [100][2040/3239]	Time 0.226 (0.516)	Data Time 0.001 (0.020)	Loss 2.3672 (2.3757)	Entropy 0.54286 (0.54343)	Top-1 acc 67.188 (66.886)	Top-5 acc 86.328 (85.906)	lr 0.00174
Train [100][2050/3239]	Time 0.219 (0.516)	Data Time 0.001 (0.020)	Loss 2.5137 (2.3759)	Entropy 0.54302 (0.54343)	Top-1 acc 64.453 (66.883)	Top-5 acc 82.812 (85.902)	lr 0.00174
Train [100][2060/3239]	Time 0.229 (0.515)	Data Time 0.001 (0.020)	Loss 2.3302 (2.3763)	Entropy 0.54303 (0.54342)	Top-1 acc 69.531 (66.873)	Top-5 acc 85.156 (85.895)	lr 0.00173
Train [100][2070/3239]	Time 0.230 (0.515)	Data Time 0.001 (0.020)	Loss 2.3806 (2.3761)	Entropy 0.54292 (0.54342)	Top-1 acc 65.625 (66.878)	Top-5 acc 84.766 (85.894)	lr 0.00173
Train [100][2080/3239]	Time 0.227 (0.514)	Data Time 0.001 (0.020)	Loss 2.2481 (2.3765)	Entropy 0.54282 (0.54342)	Top-1 acc 67.188 (66.866)	Top-5 acc 87.500 (85.883)	lr 0.00173
Train [100][2090/3239]	Time 0.324 (0.514)	Data Time 0.001 (0.019)	Loss 2.2229 (2.3764)	Entropy 0.54290 (0.54342)	Top-1 acc 68.359 (66.868)	Top-5 acc 89.453 (85.887)	lr 0.00173
Train [100][2100/3239]	Time 0.258 (0.513)	Data Time 0.001 (0.019)	Loss 2.4306 (2.3762)	Entropy 0.54295 (0.54341)	Top-1 acc 72.656 (66.873)	Top-5 acc 85.547 (85.890)	lr 0.00173
Train [100][2110/3239]	Time 0.225 (0.513)	Data Time 0.001 (0.019)	Loss 2.4245 (2.3760)	Entropy 0.54295 (0.54341)	Top-1 acc 66.406 (66.880)	Top-5 acc 85.547 (85.891)	lr 0.00173
Train [100][2120/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.019)	Loss 2.4220 (2.3759)	Entropy 0.54323 (0.54341)	Top-1 acc 65.234 (66.883)	Top-5 acc 83.984 (85.894)	lr 0.00173
Train [100][2130/3239]	Time 0.318 (0.537)	Data Time 0.002 (0.019)	Loss 2.4691 (2.3759)	Entropy 0.54342 (0.54341)	Top-1 acc 62.891 (66.881)	Top-5 acc 85.156 (85.892)	lr 0.00173
Train [100][2140/3239]	Time 0.236 (0.536)	Data Time 0.002 (0.019)	Loss 2.3412 (2.3756)	Entropy 0.54343 (0.54341)	Top-1 acc 67.578 (66.883)	Top-5 acc 86.328 (85.900)	lr 0.00173
Train [100][2150/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.019)	Loss 2.3074 (2.3758)	Entropy 0.54369 (0.54341)	Top-1 acc 68.359 (66.881)	Top-5 acc 85.938 (85.897)	lr 0.00173
Train [100][2160/3239]	Time 0.239 (0.535)	Data Time 0.001 (0.019)	Loss 2.2404 (2.3756)	Entropy 0.54395 (0.54341)	Top-1 acc 71.875 (66.882)	Top-5 acc 87.109 (85.898)	lr 0.00173
Train [100][2170/3239]	Time 0.263 (0.535)	Data Time 0.001 (0.019)	Loss 2.3596 (2.3759)	Entropy 0.54412 (0.54342)	Top-1 acc 66.406 (66.874)	Top-5 acc 84.766 (85.894)	lr 0.00173
Train [100][2180/3239]	Time 0.328 (0.534)	Data Time 0.001 (0.019)	Loss 2.5431 (2.3763)	Entropy 0.54419 (0.54342)	Top-1 acc 64.062 (66.867)	Top-5 acc 82.422 (85.885)	lr 0.00173
Train [100][2190/3239]	Time 0.298 (0.534)	Data Time 0.002 (0.019)	Loss 2.1884 (2.3768)	Entropy 0.54395 (0.54342)	Top-1 acc 72.656 (66.855)	Top-5 acc 89.062 (85.878)	lr 0.00173
Train [100][2200/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.019)	Loss 2.5814 (2.3765)	Entropy 0.54404 (0.54342)	Top-1 acc 62.891 (66.860)	Top-5 acc 82.031 (85.882)	lr 0.00173
Train [100][2210/3239]	Time 0.236 (0.533)	Data Time 0.001 (0.019)	Loss 2.2907 (2.3764)	Entropy 0.54420 (0.54343)	Top-1 acc 68.359 (66.868)	Top-5 acc 85.938 (85.882)	lr 0.00173
Train [100][2220/3239]	Time 0.234 (0.533)	Data Time 0.001 (0.018)	Loss 2.3599 (2.3762)	Entropy 0.54418 (0.54343)	Top-1 acc 67.578 (66.871)	Top-5 acc 85.547 (85.883)	lr 0.00173
Train [100][2230/3239]	Time 0.227 (0.532)	Data Time 0.001 (0.018)	Loss 2.2224 (2.3759)	Entropy 0.54367 (0.54343)	Top-1 acc 68.359 (66.876)	Top-5 acc 89.062 (85.889)	lr 0.00173
Train [100][2240/3239]	Time 0.238 (0.532)	Data Time 0.001 (0.018)	Loss 2.3685 (2.3763)	Entropy 0.54381 (0.54344)	Top-1 acc 67.578 (66.870)	Top-5 acc 86.328 (85.882)	lr 0.00173
Train [100][2250/3239]	Time 0.338 (0.531)	Data Time 0.001 (0.018)	Loss 2.4088 (2.3767)	Entropy 0.54384 (0.54344)	Top-1 acc 63.672 (66.859)	Top-5 acc 84.766 (85.873)	lr 0.00173
Train [100][2260/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.018)	Loss 2.3330 (2.3769)	Entropy 0.54373 (0.54344)	Top-1 acc 69.141 (66.858)	Top-5 acc 85.938 (85.865)	lr 0.00172
Train [100][2270/3239]	Time 0.227 (0.530)	Data Time 0.001 (0.018)	Loss 2.3188 (2.3770)	Entropy 0.54375 (0.54344)	Top-1 acc 64.453 (66.854)	Top-5 acc 88.672 (85.863)	lr 0.00172
Train [100][2280/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.018)	Loss 2.3480 (2.3769)	Entropy 0.54388 (0.54344)	Top-1 acc 66.016 (66.861)	Top-5 acc 88.672 (85.867)	lr 0.00172
Train [100][2290/3239]	Time 0.223 (0.529)	Data Time 0.001 (0.018)	Loss 2.6492 (2.3771)	Entropy 0.54432 (0.54344)	Top-1 acc 62.500 (66.857)	Top-5 acc 82.812 (85.862)	lr 0.00172
Train [100][2300/3239]	Time 0.230 (0.529)	Data Time 0.001 (0.018)	Loss 2.2326 (2.3768)	Entropy 0.54403 (0.54345)	Top-1 acc 72.266 (66.865)	Top-5 acc 88.672 (85.869)	lr 0.00172
Train [100][2310/3239]	Time 0.240 (0.528)	Data Time 0.001 (0.018)	Loss 2.4039 (2.3769)	Entropy 0.54416 (0.54345)	Top-1 acc 64.453 (66.864)	Top-5 acc 85.156 (85.867)	lr 0.00172
Train [100][2320/3239]	Time 0.247 (0.528)	Data Time 0.001 (0.018)	Loss 2.3107 (2.3771)	Entropy 0.54413 (0.54345)	Top-1 acc 69.922 (66.857)	Top-5 acc 86.328 (85.861)	lr 0.00172
Train [100][2330/3239]	Time 0.263 (0.527)	Data Time 0.001 (0.018)	Loss 2.2066 (2.3772)	Entropy 0.54397 (0.54346)	Top-1 acc 71.094 (66.859)	Top-5 acc 87.500 (85.860)	lr 0.00172
Train [100][2340/3239]	Time 0.319 (0.527)	Data Time 0.001 (0.018)	Loss 2.5212 (2.3771)	Entropy 0.54411 (0.54346)	Top-1 acc 60.547 (66.862)	Top-5 acc 82.031 (85.859)	lr 0.00172
Train [100][2350/3239]	Time 0.240 (0.526)	Data Time 0.001 (0.018)	Loss 2.3616 (2.3769)	Entropy 0.54442 (0.54346)	Top-1 acc 67.969 (66.866)	Top-5 acc 87.500 (85.861)	lr 0.00172
Train [100][2360/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.017)	Loss 2.5339 (2.3766)	Entropy 0.54412 (0.54346)	Top-1 acc 61.719 (66.875)	Top-5 acc 83.594 (85.867)	lr 0.00172
Train [100][2370/3239]	Time 0.221 (0.525)	Data Time 0.001 (0.017)	Loss 2.3941 (2.3766)	Entropy 0.54446 (0.54347)	Top-1 acc 71.484 (66.877)	Top-5 acc 85.938 (85.867)	lr 0.00172
Train [100][2380/3239]	Time 0.229 (0.525)	Data Time 0.001 (0.017)	Loss 2.4165 (2.3765)	Entropy 0.54469 (0.54347)	Top-1 acc 68.359 (66.879)	Top-5 acc 85.547 (85.870)	lr 0.00172
Train [100][2390/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.017)	Loss 2.3509 (2.3765)	Entropy 0.54439 (0.54348)	Top-1 acc 65.234 (66.876)	Top-5 acc 84.766 (85.869)	lr 0.00172
Train [100][2400/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.017)	Loss 2.2638 (2.3766)	Entropy 0.54431 (0.54348)	Top-1 acc 69.922 (66.870)	Top-5 acc 85.938 (85.867)	lr 0.00172
Train [100][2410/3239]	Time 0.333 (0.523)	Data Time 0.001 (0.017)	Loss 2.2666 (2.3763)	Entropy 0.54458 (0.54348)	Top-1 acc 71.875 (66.878)	Top-5 acc 86.719 (85.873)	lr 0.00172
Train [100][2420/3239]	Time 0.237 (0.523)	Data Time 0.001 (0.017)	Loss 2.5702 (2.3764)	Entropy 0.54463 (0.54349)	Top-1 acc 64.453 (66.878)	Top-5 acc 82.812 (85.874)	lr 0.00172
Train [100][2430/3239]	Time 0.262 (0.523)	Data Time 0.001 (0.017)	Loss 2.3990 (2.3766)	Entropy 0.54452 (0.54349)	Top-1 acc 67.969 (66.873)	Top-5 acc 85.547 (85.869)	lr 0.00172
Train [100][2440/3239]	Time 0.290 (0.522)	Data Time 0.001 (0.017)	Loss 2.4369 (2.3767)	Entropy 0.54454 (0.54350)	Top-1 acc 65.234 (66.872)	Top-5 acc 83.203 (85.868)	lr 0.00172
Train [100][2450/3239]	Time 0.226 (0.522)	Data Time 0.001 (0.017)	Loss 2.3619 (2.3766)	Entropy 0.54457 (0.54350)	Top-1 acc 67.188 (66.872)	Top-5 acc 85.156 (85.869)	lr 0.00171
Train [100][2460/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.017)	Loss 2.5681 (2.3765)	Entropy 0.54411 (0.54351)	Top-1 acc 61.328 (66.877)	Top-5 acc 81.250 (85.868)	lr 0.00171
Train [100][2470/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.017)	Loss 2.4799 (2.3768)	Entropy 0.54398 (0.54351)	Top-1 acc 62.891 (66.868)	Top-5 acc 83.594 (85.862)	lr 0.00171
Train [100][2480/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.017)	Loss 2.3693 (2.3766)	Entropy 0.54387 (0.54351)	Top-1 acc 70.703 (66.877)	Top-5 acc 82.422 (85.861)	lr 0.00171
Train [100][2490/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.017)	Loss 2.3385 (2.3764)	Entropy 0.54403 (0.54351)	Top-1 acc 65.625 (66.879)	Top-5 acc 88.281 (85.869)	lr 0.00171
Train [100][2500/3239]	Time 0.260 (0.520)	Data Time 0.001 (0.017)	Loss 2.6341 (2.3766)	Entropy 0.54414 (0.54351)	Top-1 acc 59.375 (66.871)	Top-5 acc 82.031 (85.868)	lr 0.00171
Train [100][2510/3239]	Time 0.236 (0.519)	Data Time 0.001 (0.016)	Loss 2.2597 (2.3764)	Entropy 0.54442 (0.54352)	Top-1 acc 67.578 (66.874)	Top-5 acc 88.281 (85.870)	lr 0.00171
Train [100][2520/3239]	Time 0.243 (0.519)	Data Time 0.001 (0.016)	Loss 2.2831 (2.3764)	Entropy 0.54442 (0.54352)	Top-1 acc 71.094 (66.870)	Top-5 acc 85.547 (85.868)	lr 0.00171
Train [100][2530/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.016)	Loss 2.5507 (2.3764)	Entropy 0.54453 (0.54353)	Top-1 acc 63.672 (66.872)	Top-5 acc 81.641 (85.870)	lr 0.00171
Train [100][2540/3239]	Time 0.228 (0.518)	Data Time 0.001 (0.016)	Loss 2.3446 (2.3762)	Entropy 0.54421 (0.54353)	Top-1 acc 67.969 (66.876)	Top-5 acc 86.328 (85.875)	lr 0.00171
Train [100][2550/3239]	Time 0.229 (0.518)	Data Time 0.001 (0.016)	Loss 2.3200 (2.3761)	Entropy 0.54417 (0.54353)	Top-1 acc 67.969 (66.879)	Top-5 acc 87.109 (85.876)	lr 0.00171
Train [100][2560/3239]	Time 0.241 (0.517)	Data Time 0.001 (0.016)	Loss 2.3307 (2.3762)	Entropy 0.54406 (0.54353)	Top-1 acc 64.062 (66.878)	Top-5 acc 87.500 (85.878)	lr 0.00171
Train [100][2570/3239]	Time 0.329 (0.517)	Data Time 0.001 (0.016)	Loss 2.4727 (2.3760)	Entropy 0.54415 (0.54354)	Top-1 acc 67.188 (66.880)	Top-5 acc 83.203 (85.881)	lr 0.00171
Train [100][2580/3239]	Time 0.259 (0.516)	Data Time 0.002 (0.016)	Loss 2.2368 (2.3762)	Entropy 0.54447 (0.54354)	Top-1 acc 69.922 (66.876)	Top-5 acc 85.938 (85.876)	lr 0.00171
Train [100][2590/3239]	Time 0.288 (0.516)	Data Time 0.001 (0.016)	Loss 2.2957 (2.3759)	Entropy 0.54446 (0.54354)	Top-1 acc 69.531 (66.883)	Top-5 acc 88.281 (85.879)	lr 0.00171
Train [100][2600/3239]	Time 0.222 (0.516)	Data Time 0.001 (0.016)	Loss 2.3207 (2.3757)	Entropy 0.54456 (0.54355)	Top-1 acc 68.359 (66.885)	Top-5 acc 87.891 (85.885)	lr 0.00171
Train [100][2610/3239]	Time 0.235 (0.515)	Data Time 0.001 (0.016)	Loss 2.1665 (2.3754)	Entropy 0.54469 (0.54355)	Top-1 acc 71.094 (66.894)	Top-5 acc 91.016 (85.888)	lr 0.00171
Train [100][2620/3239]	Time 0.224 (0.515)	Data Time 0.001 (0.016)	Loss 2.5862 (2.3756)	Entropy 0.54458 (0.54355)	Top-1 acc 60.938 (66.890)	Top-5 acc 82.422 (85.885)	lr 0.00171
Train [100][2630/3239]	Time 0.232 (0.514)	Data Time 0.001 (0.016)	Loss 2.3221 (2.3756)	Entropy 0.54445 (0.54356)	Top-1 acc 67.969 (66.891)	Top-5 acc 85.547 (85.884)	lr 0.00171
Train [100][2640/3239]	Time 0.368 (0.514)	Data Time 0.001 (0.016)	Loss 2.2922 (2.3755)	Entropy 0.54440 (0.54356)	Top-1 acc 67.969 (66.892)	Top-5 acc 85.156 (85.884)	lr 0.00171
Train [100][2650/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.016)	Loss 2.2454 (2.3758)	Entropy 0.54413 (0.54356)	Top-1 acc 73.047 (66.887)	Top-5 acc 85.547 (85.880)	lr 0.00170
Train [100][2660/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.016)	Loss 2.4180 (2.3758)	Entropy 0.54386 (0.54357)	Top-1 acc 66.797 (66.886)	Top-5 acc 87.891 (85.881)	lr 0.00170
Train [100][2670/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.016)	Loss 2.4985 (2.3759)	Entropy 0.54352 (0.54357)	Top-1 acc 58.594 (66.883)	Top-5 acc 83.984 (85.882)	lr 0.00170
Train [100][2680/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.016)	Loss 2.2184 (2.3761)	Entropy 0.54343 (0.54357)	Top-1 acc 71.094 (66.881)	Top-5 acc 88.672 (85.879)	lr 0.00170
Train [100][2690/3239]	Time 0.255 (0.512)	Data Time 0.001 (0.015)	Loss 2.4541 (2.3762)	Entropy 0.54359 (0.54357)	Top-1 acc 65.625 (66.876)	Top-5 acc 84.375 (85.878)	lr 0.00170
Train [100][2700/3239]	Time 0.234 (0.512)	Data Time 0.001 (0.015)	Loss 2.3453 (2.3761)	Entropy 0.54335 (0.54357)	Top-1 acc 68.359 (66.877)	Top-5 acc 86.719 (85.881)	lr 0.00170
Train [100][2710/3239]	Time 0.229 (0.511)	Data Time 0.001 (0.015)	Loss 2.3490 (2.3762)	Entropy 0.54351 (0.54356)	Top-1 acc 69.922 (66.875)	Top-5 acc 85.938 (85.881)	lr 0.00170
Train [100][2720/3239]	Time 0.236 (0.511)	Data Time 0.001 (0.015)	Loss 2.3942 (2.3763)	Entropy 0.54305 (0.54356)	Top-1 acc 67.578 (66.876)	Top-5 acc 85.156 (85.875)	lr 0.00170
Train [100][2730/3239]	Time 0.325 (0.511)	Data Time 0.001 (0.015)	Loss 2.3028 (2.3763)	Entropy 0.54325 (0.54356)	Top-1 acc 68.750 (66.875)	Top-5 acc 89.062 (85.873)	lr 0.00170
Train [100][2740/3239]	Time 0.232 (0.510)	Data Time 0.001 (0.015)	Loss 2.2139 (2.3761)	Entropy 0.54331 (0.54356)	Top-1 acc 73.047 (66.879)	Top-5 acc 87.891 (85.877)	lr 0.00170
Train [100][2750/3239]	Time 0.229 (0.510)	Data Time 0.001 (0.015)	Loss 2.3551 (2.3766)	Entropy 0.54326 (0.54356)	Top-1 acc 66.016 (66.867)	Top-5 acc 86.719 (85.869)	lr 0.00170
Train [100][2760/3239]	Time 0.231 (0.509)	Data Time 0.001 (0.015)	Loss 2.3539 (2.3767)	Entropy 0.54320 (0.54356)	Top-1 acc 67.969 (66.866)	Top-5 acc 85.156 (85.866)	lr 0.00170
Train [100][2770/3239]	Time 0.237 (0.509)	Data Time 0.001 (0.015)	Loss 2.2998 (2.3767)	Entropy 0.54326 (0.54356)	Top-1 acc 66.406 (66.867)	Top-5 acc 86.719 (85.865)	lr 0.00170
Train [100][2780/3239]	Time 0.331 (0.528)	Data Time 0.004 (0.015)	Loss 2.2784 (2.3768)	Entropy 0.54317 (0.54356)	Top-1 acc 67.578 (66.861)	Top-5 acc 88.672 (85.862)	lr 0.00170
Train [100][2790/3239]	Time 0.258 (0.528)	Data Time 0.002 (0.015)	Loss 2.2401 (2.3771)	Entropy 0.54298 (0.54355)	Top-1 acc 69.141 (66.853)	Top-5 acc 91.016 (85.856)	lr 0.00170
Train [100][2800/3239]	Time 0.272 (0.528)	Data Time 0.001 (0.015)	Loss 2.4938 (2.3773)	Entropy 0.54340 (0.54355)	Top-1 acc 65.234 (66.852)	Top-5 acc 83.203 (85.851)	lr 0.00170
Train [100][2810/3239]	Time 0.250 (0.527)	Data Time 0.001 (0.015)	Loss 2.4602 (2.3773)	Entropy 0.54367 (0.54355)	Top-1 acc 60.547 (66.851)	Top-5 acc 86.719 (85.853)	lr 0.00170
Train [100][2820/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.015)	Loss 2.4652 (2.3772)	Entropy 0.54302 (0.54355)	Top-1 acc 64.453 (66.850)	Top-5 acc 83.984 (85.854)	lr 0.00170
Train [100][2830/3239]	Time 0.224 (0.526)	Data Time 0.001 (0.015)	Loss 2.2760 (2.3771)	Entropy 0.54268 (0.54355)	Top-1 acc 70.703 (66.854)	Top-5 acc 87.500 (85.855)	lr 0.00170
Train [100][2840/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.015)	Loss 2.4243 (2.3773)	Entropy 0.54295 (0.54355)	Top-1 acc 65.234 (66.847)	Top-5 acc 84.766 (85.852)	lr 0.00169
Train [100][2850/3239]	Time 0.235 (0.526)	Data Time 0.001 (0.015)	Loss 2.2099 (2.3771)	Entropy 0.54318 (0.54355)	Top-1 acc 69.922 (66.852)	Top-5 acc 89.062 (85.855)	lr 0.00169
Train [100][2860/3239]	Time 0.268 (0.525)	Data Time 0.001 (0.015)	Loss 2.3338 (2.3772)	Entropy 0.54326 (0.54354)	Top-1 acc 67.188 (66.846)	Top-5 acc 88.281 (85.853)	lr 0.00169
Train [100][2870/3239]	Time 0.278 (0.525)	Data Time 0.002 (0.015)	Loss 2.3517 (2.3770)	Entropy 0.54313 (0.54354)	Top-1 acc 68.359 (66.849)	Top-5 acc 84.766 (85.855)	lr 0.00169
Train [100][2880/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.015)	Loss 2.3781 (2.3771)	Entropy 0.54316 (0.54354)	Top-1 acc 67.188 (66.847)	Top-5 acc 83.984 (85.852)	lr 0.00169
Train [100][2890/3239]	Time 0.333 (0.524)	Data Time 0.001 (0.015)	Loss 2.3564 (2.3772)	Entropy 0.54314 (0.54354)	Top-1 acc 69.531 (66.847)	Top-5 acc 84.766 (85.849)	lr 0.00169
Train [100][2900/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.015)	Loss 2.2796 (2.3771)	Entropy 0.54305 (0.54354)	Top-1 acc 69.141 (66.848)	Top-5 acc 86.328 (85.851)	lr 0.00169
Train [100][2910/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.014)	Loss 2.5628 (2.3773)	Entropy 0.54328 (0.54354)	Top-1 acc 61.328 (66.848)	Top-5 acc 83.203 (85.848)	lr 0.00169
Train [100][2920/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.014)	Loss 2.3591 (2.3773)	Entropy 0.54337 (0.54354)	Top-1 acc 69.141 (66.845)	Top-5 acc 86.328 (85.849)	lr 0.00169
Train [100][2930/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.014)	Loss 2.3266 (2.3775)	Entropy 0.54309 (0.54354)	Top-1 acc 69.922 (66.842)	Top-5 acc 86.328 (85.845)	lr 0.00169
Train [100][2940/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.014)	Loss 2.1660 (2.3772)	Entropy 0.54316 (0.54353)	Top-1 acc 74.609 (66.849)	Top-5 acc 88.281 (85.851)	lr 0.00169
Train [100][2950/3239]	Time 0.247 (0.522)	Data Time 0.001 (0.014)	Loss 2.2567 (2.3772)	Entropy 0.54306 (0.54353)	Top-1 acc 70.312 (66.849)	Top-5 acc 88.281 (85.851)	lr 0.00169
Train [100][2960/3239]	Time 0.329 (0.522)	Data Time 0.001 (0.014)	Loss 2.3538 (2.3772)	Entropy 0.54310 (0.54353)	Top-1 acc 68.750 (66.850)	Top-5 acc 87.109 (85.851)	lr 0.00169
Train [100][2970/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.014)	Loss 2.4285 (2.3771)	Entropy 0.54307 (0.54353)	Top-1 acc 66.797 (66.852)	Top-5 acc 85.156 (85.852)	lr 0.00169
Train [100][2980/3239]	Time 0.226 (0.521)	Data Time 0.001 (0.014)	Loss 2.1150 (2.3770)	Entropy 0.54317 (0.54353)	Top-1 acc 71.875 (66.855)	Top-5 acc 93.359 (85.854)	lr 0.00169
Train [100][2990/3239]	Time 0.235 (0.521)	Data Time 0.001 (0.014)	Loss 2.1955 (2.3769)	Entropy 0.54325 (0.54353)	Top-1 acc 73.047 (66.858)	Top-5 acc 87.891 (85.856)	lr 0.00169
Train [100][3000/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.014)	Loss 2.4520 (2.3766)	Entropy 0.54302 (0.54353)	Top-1 acc 68.359 (66.864)	Top-5 acc 85.938 (85.861)	lr 0.00169
Train [100][3010/3239]	Time 0.228 (0.520)	Data Time 0.001 (0.014)	Loss 2.5113 (2.3765)	Entropy 0.54295 (0.54352)	Top-1 acc 65.234 (66.865)	Top-5 acc 82.031 (85.862)	lr 0.00169
Train [100][3020/3239]	Time 0.290 (0.520)	Data Time 0.001 (0.014)	Loss 2.4948 (2.3765)	Entropy 0.54309 (0.54352)	Top-1 acc 62.500 (66.863)	Top-5 acc 82.422 (85.863)	lr 0.00169
Train [100][3030/3239]	Time 0.229 (0.520)	Data Time 0.001 (0.014)	Loss 2.3417 (2.3765)	Entropy 0.54322 (0.54352)	Top-1 acc 69.141 (66.863)	Top-5 acc 86.328 (85.864)	lr 0.00169
Train [100][3040/3239]	Time 0.230 (0.519)	Data Time 0.001 (0.014)	Loss 2.2328 (2.3763)	Entropy 0.54317 (0.54352)	Top-1 acc 69.531 (66.869)	Top-5 acc 86.328 (85.868)	lr 0.00168
Train [100][3050/3239]	Time 0.346 (0.519)	Data Time 0.001 (0.014)	Loss 2.2188 (2.3761)	Entropy 0.54346 (0.54352)	Top-1 acc 69.141 (66.876)	Top-5 acc 89.062 (85.872)	lr 0.00168
Train [100][3060/3239]	Time 0.234 (0.519)	Data Time 0.001 (0.014)	Loss 2.2135 (2.3761)	Entropy 0.54382 (0.54352)	Top-1 acc 72.656 (66.875)	Top-5 acc 88.281 (85.872)	lr 0.00168
Train [100][3070/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.014)	Loss 2.4043 (2.3760)	Entropy 0.54365 (0.54352)	Top-1 acc 66.797 (66.877)	Top-5 acc 86.719 (85.875)	lr 0.00168
Train [100][3080/3239]	Time 0.249 (0.518)	Data Time 0.001 (0.014)	Loss 2.3730 (2.3760)	Entropy 0.54361 (0.54352)	Top-1 acc 67.578 (66.875)	Top-5 acc 85.547 (85.874)	lr 0.00168
Train [100][3090/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.014)	Loss 2.3502 (2.3759)	Entropy 0.54381 (0.54352)	Top-1 acc 69.922 (66.876)	Top-5 acc 86.719 (85.875)	lr 0.00168
Train [100][3100/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.014)	Loss 2.3483 (2.3758)	Entropy 0.54393 (0.54352)	Top-1 acc 68.359 (66.882)	Top-5 acc 87.109 (85.877)	lr 0.00168
Train [100][3110/3239]	Time 0.224 (0.517)	Data Time 0.001 (0.014)	Loss 2.3910 (2.3756)	Entropy 0.54418 (0.54352)	Top-1 acc 65.625 (66.884)	Top-5 acc 85.547 (85.881)	lr 0.00168
Train [100][3120/3239]	Time 0.354 (0.517)	Data Time 0.001 (0.014)	Loss 2.2231 (2.3754)	Entropy 0.54417 (0.54353)	Top-1 acc 69.531 (66.887)	Top-5 acc 89.844 (85.885)	lr 0.00168
Train [100][3130/3239]	Time 0.231 (0.517)	Data Time 0.001 (0.014)	Loss 2.1359 (2.3754)	Entropy 0.54426 (0.54353)	Top-1 acc 71.094 (66.890)	Top-5 acc 89.844 (85.885)	lr 0.00168
Train [100][3140/3239]	Time 0.285 (0.516)	Data Time 0.001 (0.014)	Loss 2.3481 (2.3754)	Entropy 0.54399 (0.54353)	Top-1 acc 68.750 (66.891)	Top-5 acc 85.547 (85.885)	lr 0.00168
Train [100][3150/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.014)	Loss 2.5426 (2.3753)	Entropy 0.54408 (0.54353)	Top-1 acc 61.719 (66.893)	Top-5 acc 83.203 (85.888)	lr 0.00168
Train [100][3160/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.013)	Loss 2.3916 (2.3755)	Entropy 0.54427 (0.54353)	Top-1 acc 65.625 (66.885)	Top-5 acc 83.203 (85.884)	lr 0.00168
Train [100][3170/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.013)	Loss 2.4912 (2.3755)	Entropy 0.54422 (0.54354)	Top-1 acc 63.672 (66.882)	Top-5 acc 84.766 (85.883)	lr 0.00168
Train [100][3180/3239]	Time 0.231 (0.515)	Data Time 0.000 (0.013)	Loss 2.3262 (2.3757)	Entropy 0.54410 (0.54354)	Top-1 acc 67.578 (66.879)	Top-5 acc 86.328 (85.879)	lr 0.00168
Train [100][3190/3239]	Time 0.237 (0.515)	Data Time 0.000 (0.013)	Loss 2.3354 (2.3758)	Entropy 0.54414 (0.54354)	Top-1 acc 68.359 (66.876)	Top-5 acc 86.328 (85.875)	lr 0.00168
Train [100][3200/3239]	Time 0.226 (0.514)	Data Time 0.000 (0.013)	Loss 2.3003 (2.3759)	Entropy 0.54376 (0.54354)	Top-1 acc 66.797 (66.873)	Top-5 acc 86.719 (85.871)	lr 0.00168
Train [100][3210/3239]	Time 0.247 (0.514)	Data Time 0.000 (0.013)	Loss 2.3158 (2.3760)	Entropy 0.54368 (0.54354)	Top-1 acc 65.234 (66.870)	Top-5 acc 88.672 (85.867)	lr 0.00168
Train [100][3220/3239]	Time 0.222 (0.513)	Data Time 0.000 (0.013)	Loss 2.3522 (2.3761)	Entropy 0.54377 (0.54354)	Top-1 acc 67.188 (66.870)	Top-5 acc 86.719 (85.867)	lr 0.00168
Train [100][3230/3239]	Time 0.236 (0.513)	Data Time 0.000 (0.013)	Loss 2.4027 (2.3761)	Entropy 0.54406 (0.54354)	Top-1 acc 62.109 (66.873)	Top-5 acc 86.328 (85.866)	lr 0.00168
Train [100][3239/3239]	Time 0.944 (0.513)	Data Time 0.000 (0.013)	Loss 2.8882 (2.3762)	Entropy 0.54399 (0.54354)	Top-1 acc 56.790 (66.870)	Top-5 acc 76.543 (85.863)	lr 0.00167
==========Valid [100/120]	loss 1.196	top-1 acc 72.522 (72.522)	top-5 acc 90.315	Train top-1 66.870	top-5 85.863	Entropy 0.54399	Latency-None: 0.000ms	Flops: 539.00M
Train [101][0/3239]	Time 40.139 (40.139)	Data Time 38.283 (38.283)	Loss 2.2082 (2.2082)	Entropy 0.54415 (0.54415)	Top-1 acc 73.828 (73.828)	Top-5 acc 87.109 (87.109)	lr 0.00167
Train [101][10/3239]	Time 0.227 (4.114)	Data Time 0.001 (3.482)	Loss 2.3891 (2.3458)	Entropy 0.54413 (0.54404)	Top-1 acc 64.062 (68.004)	Top-5 acc 86.719 (86.009)	lr 0.00167
Train [101][20/3239]	Time 0.321 (2.356)	Data Time 0.002 (1.825)	Loss 2.1949 (2.3144)	Entropy 0.54390 (0.54404)	Top-1 acc 67.578 (68.843)	Top-5 acc 88.672 (86.830)	lr 0.00167
Train [101][30/3239]	Time 0.232 (1.727)	Data Time 0.001 (1.237)	Loss 2.4013 (2.3517)	Entropy 0.54402 (0.54399)	Top-1 acc 69.141 (68.271)	Top-5 acc 86.328 (86.001)	lr 0.00167
Train [101][40/3239]	Time 0.230 (1.403)	Data Time 0.001 (0.935)	Loss 2.5769 (2.3522)	Entropy 0.54394 (0.54399)	Top-1 acc 62.109 (68.016)	Top-5 acc 82.812 (86.023)	lr 0.00167
Train [101][50/3239]	Time 0.224 (1.209)	Data Time 0.001 (0.752)	Loss 2.5116 (2.3635)	Entropy 0.54317 (0.54392)	Top-1 acc 61.328 (67.601)	Top-5 acc 83.984 (85.938)	lr 0.00167
Train [101][60/3239]	Time 0.228 (1.076)	Data Time 0.001 (0.630)	Loss 2.4957 (2.3687)	Entropy 0.54321 (0.54381)	Top-1 acc 63.281 (67.309)	Top-5 acc 85.547 (86.014)	lr 0.00167
Train [101][70/3239]	Time 0.235 (0.982)	Data Time 0.001 (0.541)	Loss 2.2779 (2.3617)	Entropy 0.54334 (0.54373)	Top-1 acc 70.312 (67.413)	Top-5 acc 87.109 (86.152)	lr 0.00167
Train [101][80/3239]	Time 0.230 (0.910)	Data Time 0.001 (0.475)	Loss 2.5404 (2.3657)	Entropy 0.54330 (0.54367)	Top-1 acc 59.375 (67.168)	Top-5 acc 82.422 (86.150)	lr 0.00167
Train [101][90/3239]	Time 0.236 (0.856)	Data Time 0.001 (0.423)	Loss 2.3850 (2.3677)	Entropy 0.54346 (0.54364)	Top-1 acc 67.969 (67.179)	Top-5 acc 85.547 (86.036)	lr 0.00167
Train [101][100/3239]	Time 0.224 (0.811)	Data Time 0.001 (0.381)	Loss 2.5392 (2.3687)	Entropy 0.54375 (0.54363)	Top-1 acc 61.719 (67.203)	Top-5 acc 81.641 (85.972)	lr 0.00167
Train [101][110/3239]	Time 0.349 (0.776)	Data Time 0.001 (0.347)	Loss 2.2604 (2.3686)	Entropy 0.54368 (0.54364)	Top-1 acc 70.703 (67.226)	Top-5 acc 87.500 (85.980)	lr 0.00167
Train [101][120/3239]	Time 0.230 (0.745)	Data Time 0.001 (0.318)	Loss 2.2804 (2.3715)	Entropy 0.54400 (0.54365)	Top-1 acc 70.703 (67.149)	Top-5 acc 89.062 (85.957)	lr 0.00167
Train [101][130/3239]	Time 0.215 (0.719)	Data Time 0.001 (0.294)	Loss 2.4363 (2.3674)	Entropy 0.54400 (0.54368)	Top-1 acc 67.188 (67.173)	Top-5 acc 86.328 (86.027)	lr 0.00167
Train [101][140/3239]	Time 0.228 (0.697)	Data Time 0.001 (0.273)	Loss 2.4033 (2.3708)	Entropy 0.54418 (0.54371)	Top-1 acc 66.406 (67.099)	Top-5 acc 86.719 (85.993)	lr 0.00167
Train [101][150/3239]	Time 0.234 (0.677)	Data Time 0.001 (0.255)	Loss 2.4165 (2.3728)	Entropy 0.54411 (0.54374)	Top-1 acc 66.016 (67.012)	Top-5 acc 83.594 (85.927)	lr 0.00167
Train [101][160/3239]	Time 0.229 (0.660)	Data Time 0.001 (0.239)	Loss 2.5045 (2.3717)	Entropy 0.54426 (0.54377)	Top-1 acc 63.281 (67.035)	Top-5 acc 83.594 (85.933)	lr 0.00167
Train [101][170/3239]	Time 0.228 (0.645)	Data Time 0.001 (0.226)	Loss 2.3673 (2.3681)	Entropy 0.54415 (0.54379)	Top-1 acc 66.016 (67.119)	Top-5 acc 87.109 (85.942)	lr 0.00167
Train [101][180/3239]	Time 0.319 (0.631)	Data Time 0.001 (0.213)	Loss 2.2339 (2.3669)	Entropy 0.54428 (0.54381)	Top-1 acc 69.141 (67.168)	Top-5 acc 87.500 (85.955)	lr 0.00167
Train [101][190/3239]	Time 0.224 (0.620)	Data Time 0.001 (0.202)	Loss 2.2603 (2.3654)	Entropy 0.54423 (0.54383)	Top-1 acc 74.609 (67.177)	Top-5 acc 85.938 (85.985)	lr 0.00167
Train [101][200/3239]	Time 0.313 (0.876)	Data Time 0.003 (0.192)	Loss 2.4041 (2.3649)	Entropy 0.54439 (0.54385)	Top-1 acc 67.969 (67.201)	Top-5 acc 84.375 (85.978)	lr 0.00166
Train [101][210/3239]	Time 0.260 (0.855)	Data Time 0.001 (0.183)	Loss 2.3510 (2.3642)	Entropy 0.54449 (0.54388)	Top-1 acc 68.359 (67.215)	Top-5 acc 86.328 (85.971)	lr 0.00166
Train [101][220/3239]	Time 0.239 (0.835)	Data Time 0.001 (0.175)	Loss 2.2423 (2.3622)	Entropy 0.54406 (0.54390)	Top-1 acc 71.484 (67.256)	Top-5 acc 87.891 (86.022)	lr 0.00166
Train [101][230/3239]	Time 0.225 (0.817)	Data Time 0.001 (0.168)	Loss 2.2932 (2.3634)	Entropy 0.54411 (0.54390)	Top-1 acc 69.531 (67.220)	Top-5 acc 87.109 (85.971)	lr 0.00166
Train [101][240/3239]	Time 0.223 (0.801)	Data Time 0.001 (0.161)	Loss 2.3866 (2.3657)	Entropy 0.54447 (0.54392)	Top-1 acc 67.188 (67.186)	Top-5 acc 87.891 (85.962)	lr 0.00166
Train [101][250/3239]	Time 0.269 (0.787)	Data Time 0.002 (0.154)	Loss 2.4222 (2.3657)	Entropy 0.54410 (0.54393)	Top-1 acc 64.453 (67.183)	Top-5 acc 86.719 (85.975)	lr 0.00166
Train [101][260/3239]	Time 0.231 (0.772)	Data Time 0.001 (0.148)	Loss 2.2392 (2.3641)	Entropy 0.54421 (0.54394)	Top-1 acc 71.094 (67.159)	Top-5 acc 89.062 (86.039)	lr 0.00166
Train [101][270/3239]	Time 0.425 (0.762)	Data Time 0.003 (0.143)	Loss 2.4638 (2.3663)	Entropy 0.54432 (0.54396)	Top-1 acc 62.891 (67.117)	Top-5 acc 85.938 (86.021)	lr 0.00166
Train [101][280/3239]	Time 0.226 (0.750)	Data Time 0.001 (0.138)	Loss 2.5192 (2.3668)	Entropy 0.54447 (0.54397)	Top-1 acc 62.500 (67.071)	Top-5 acc 87.109 (86.001)	lr 0.00166
Train [101][290/3239]	Time 0.231 (0.738)	Data Time 0.001 (0.133)	Loss 2.3162 (2.3665)	Entropy 0.54443 (0.54399)	Top-1 acc 68.359 (67.063)	Top-5 acc 85.938 (86.007)	lr 0.00166
Train [101][300/3239]	Time 0.231 (0.727)	Data Time 0.001 (0.129)	Loss 2.2270 (2.3681)	Entropy 0.54433 (0.54401)	Top-1 acc 69.531 (66.985)	Top-5 acc 87.109 (86.006)	lr 0.00166
Train [101][310/3239]	Time 0.232 (0.717)	Data Time 0.001 (0.125)	Loss 2.3573 (2.3689)	Entropy 0.54439 (0.54402)	Top-1 acc 67.578 (66.982)	Top-5 acc 86.328 (85.983)	lr 0.00166
Train [101][320/3239]	Time 0.265 (0.708)	Data Time 0.001 (0.121)	Loss 2.5113 (2.3710)	Entropy 0.54445 (0.54403)	Top-1 acc 61.719 (66.944)	Top-5 acc 82.812 (85.929)	lr 0.00166
Train [101][330/3239]	Time 0.225 (0.698)	Data Time 0.001 (0.117)	Loss 2.4643 (2.3712)	Entropy 0.54450 (0.54404)	Top-1 acc 65.625 (66.944)	Top-5 acc 84.375 (85.919)	lr 0.00166
Train [101][340/3239]	Time 0.315 (0.690)	Data Time 0.001 (0.114)	Loss 2.1836 (2.3702)	Entropy 0.54430 (0.54405)	Top-1 acc 71.484 (66.944)	Top-5 acc 88.281 (85.924)	lr 0.00166
Train [101][350/3239]	Time 0.239 (0.682)	Data Time 0.001 (0.111)	Loss 2.4866 (2.3703)	Entropy 0.54411 (0.54405)	Top-1 acc 65.234 (66.942)	Top-5 acc 84.766 (85.932)	lr 0.00166
Train [101][360/3239]	Time 0.229 (0.675)	Data Time 0.001 (0.108)	Loss 2.2626 (2.3705)	Entropy 0.54439 (0.54406)	Top-1 acc 69.141 (66.936)	Top-5 acc 88.672 (85.943)	lr 0.00166
Train [101][370/3239]	Time 0.229 (0.669)	Data Time 0.001 (0.105)	Loss 2.4179 (2.3700)	Entropy 0.54493 (0.54407)	Top-1 acc 63.672 (66.965)	Top-5 acc 85.156 (85.926)	lr 0.00166
Train [101][380/3239]	Time 0.231 (0.662)	Data Time 0.001 (0.102)	Loss 2.4926 (2.3712)	Entropy 0.54502 (0.54409)	Top-1 acc 63.672 (66.940)	Top-5 acc 81.641 (85.896)	lr 0.00166
Train [101][390/3239]	Time 0.254 (0.656)	Data Time 0.001 (0.100)	Loss 2.2646 (2.3710)	Entropy 0.54517 (0.54412)	Top-1 acc 67.188 (66.944)	Top-5 acc 88.281 (85.901)	lr 0.00166
Train [101][400/3239]	Time 0.274 (0.650)	Data Time 0.001 (0.097)	Loss 2.2385 (2.3709)	Entropy 0.54527 (0.54415)	Top-1 acc 73.047 (66.970)	Top-5 acc 87.891 (85.897)	lr 0.00165
Train [101][410/3239]	Time 0.238 (0.648)	Data Time 0.002 (0.095)	Loss 2.2855 (2.3708)	Entropy 0.54525 (0.54417)	Top-1 acc 69.531 (66.995)	Top-5 acc 87.891 (85.890)	lr 0.00165
Train [101][420/3239]	Time 0.229 (0.642)	Data Time 0.001 (0.093)	Loss 2.2655 (2.3710)	Entropy 0.54511 (0.54420)	Top-1 acc 70.312 (66.984)	Top-5 acc 88.672 (85.899)	lr 0.00165
Train [101][430/3239]	Time 0.324 (0.637)	Data Time 0.001 (0.091)	Loss 2.2658 (2.3723)	Entropy 0.54508 (0.54422)	Top-1 acc 70.703 (66.963)	Top-5 acc 87.891 (85.886)	lr 0.00165
Train [101][440/3239]	Time 0.233 (0.632)	Data Time 0.001 (0.089)	Loss 2.3374 (2.3711)	Entropy 0.54497 (0.54424)	Top-1 acc 69.141 (66.997)	Top-5 acc 82.812 (85.889)	lr 0.00165
Train [101][450/3239]	Time 0.229 (0.627)	Data Time 0.001 (0.087)	Loss 2.2847 (2.3705)	Entropy 0.54494 (0.54425)	Top-1 acc 70.312 (67.008)	Top-5 acc 87.109 (85.885)	lr 0.00165
Train [101][460/3239]	Time 0.247 (0.623)	Data Time 0.001 (0.085)	Loss 2.6120 (2.3708)	Entropy 0.54478 (0.54427)	Top-1 acc 62.109 (67.016)	Top-5 acc 82.031 (85.882)	lr 0.00165
Train [101][470/3239]	Time 0.233 (0.618)	Data Time 0.002 (0.083)	Loss 2.3152 (2.3707)	Entropy 0.54483 (0.54428)	Top-1 acc 66.797 (67.015)	Top-5 acc 87.109 (85.887)	lr 0.00165
Train [101][480/3239]	Time 0.234 (0.614)	Data Time 0.001 (0.081)	Loss 2.2148 (2.3701)	Entropy 0.54439 (0.54429)	Top-1 acc 71.094 (67.038)	Top-5 acc 87.500 (85.893)	lr 0.00165
Train [101][490/3239]	Time 0.230 (0.610)	Data Time 0.001 (0.080)	Loss 2.5085 (2.3712)	Entropy 0.54420 (0.54429)	Top-1 acc 63.281 (67.024)	Top-5 acc 85.547 (85.881)	lr 0.00165
Train [101][500/3239]	Time 0.329 (0.606)	Data Time 0.001 (0.078)	Loss 2.3612 (2.3725)	Entropy 0.54411 (0.54428)	Top-1 acc 66.016 (66.978)	Top-5 acc 87.500 (85.871)	lr 0.00165
Train [101][510/3239]	Time 0.225 (0.602)	Data Time 0.001 (0.077)	Loss 2.4585 (2.3739)	Entropy 0.54407 (0.54428)	Top-1 acc 62.109 (66.948)	Top-5 acc 85.938 (85.863)	lr 0.00165
Train [101][520/3239]	Time 0.229 (0.598)	Data Time 0.001 (0.075)	Loss 2.1944 (2.3738)	Entropy 0.54425 (0.54428)	Top-1 acc 69.141 (66.942)	Top-5 acc 88.672 (85.874)	lr 0.00165
Train [101][530/3239]	Time 0.237 (0.595)	Data Time 0.001 (0.074)	Loss 2.3512 (2.3731)	Entropy 0.54460 (0.54428)	Top-1 acc 63.672 (66.947)	Top-5 acc 87.109 (85.875)	lr 0.00165
Train [101][540/3239]	Time 0.227 (0.592)	Data Time 0.001 (0.072)	Loss 2.3411 (2.3727)	Entropy 0.54440 (0.54428)	Top-1 acc 65.234 (66.956)	Top-5 acc 86.719 (85.880)	lr 0.00165
Train [101][550/3239]	Time 0.245 (0.588)	Data Time 0.001 (0.071)	Loss 2.2214 (2.3719)	Entropy 0.54401 (0.54428)	Top-1 acc 71.094 (66.986)	Top-5 acc 86.719 (85.888)	lr 0.00165
Train [101][560/3239]	Time 0.233 (0.585)	Data Time 0.001 (0.070)	Loss 2.3684 (2.3715)	Entropy 0.54398 (0.54428)	Top-1 acc 69.922 (67.002)	Top-5 acc 85.938 (85.889)	lr 0.00165
Train [101][570/3239]	Time 0.232 (0.582)	Data Time 0.001 (0.069)	Loss 2.4495 (2.3715)	Entropy 0.54409 (0.54427)	Top-1 acc 66.797 (67.023)	Top-5 acc 85.938 (85.899)	lr 0.00165
Train [101][580/3239]	Time 0.219 (0.579)	Data Time 0.001 (0.068)	Loss 2.4641 (2.3702)	Entropy 0.54397 (0.54427)	Top-1 acc 60.547 (67.046)	Top-5 acc 85.938 (85.928)	lr 0.00165
Train [101][590/3239]	Time 0.246 (0.576)	Data Time 0.001 (0.066)	Loss 2.5058 (2.3710)	Entropy 0.54379 (0.54426)	Top-1 acc 62.891 (67.026)	Top-5 acc 81.641 (85.916)	lr 0.00165
Train [101][600/3239]	Time 0.226 (0.573)	Data Time 0.001 (0.065)	Loss 2.3560 (2.3707)	Entropy 0.54392 (0.54426)	Top-1 acc 66.406 (67.033)	Top-5 acc 87.891 (85.922)	lr 0.00164
Train [101][610/3239]	Time 0.228 (0.570)	Data Time 0.001 (0.064)	Loss 2.2091 (2.3696)	Entropy 0.54386 (0.54425)	Top-1 acc 67.578 (67.056)	Top-5 acc 88.672 (85.942)	lr 0.00164
Train [101][620/3239]	Time 0.258 (0.567)	Data Time 0.001 (0.063)	Loss 2.3913 (2.3700)	Entropy 0.54366 (0.54424)	Top-1 acc 67.188 (67.044)	Top-5 acc 85.547 (85.938)	lr 0.00164
Train [101][630/3239]	Time 0.222 (0.565)	Data Time 0.001 (0.062)	Loss 2.3146 (2.3696)	Entropy 0.54391 (0.54423)	Top-1 acc 69.141 (67.054)	Top-5 acc 87.500 (85.946)	lr 0.00164
Train [101][640/3239]	Time 0.227 (0.562)	Data Time 0.001 (0.061)	Loss 2.4096 (2.3696)	Entropy 0.54421 (0.54423)	Top-1 acc 67.188 (67.053)	Top-5 acc 84.766 (85.951)	lr 0.00164
Train [101][650/3239]	Time 0.232 (0.560)	Data Time 0.001 (0.060)	Loss 2.3818 (2.3700)	Entropy 0.54398 (0.54423)	Top-1 acc 66.406 (67.037)	Top-5 acc 85.156 (85.946)	lr 0.00164
Train [101][660/3239]	Time 0.320 (0.557)	Data Time 0.001 (0.060)	Loss 2.5135 (2.3704)	Entropy 0.54409 (0.54423)	Top-1 acc 59.766 (67.020)	Top-5 acc 82.422 (85.941)	lr 0.00164
Train [101][670/3239]	Time 0.223 (0.555)	Data Time 0.001 (0.059)	Loss 2.3796 (2.3701)	Entropy 0.54429 (0.54422)	Top-1 acc 66.406 (67.024)	Top-5 acc 84.375 (85.941)	lr 0.00164
Train [101][680/3239]	Time 0.230 (0.553)	Data Time 0.001 (0.058)	Loss 2.4981 (2.3710)	Entropy 0.54435 (0.54423)	Top-1 acc 62.891 (66.992)	Top-5 acc 82.031 (85.928)	lr 0.00164
Train [101][690/3239]	Time 0.265 (0.551)	Data Time 0.001 (0.057)	Loss 2.3759 (2.3713)	Entropy 0.54452 (0.54423)	Top-1 acc 65.625 (66.978)	Top-5 acc 86.719 (85.919)	lr 0.00164
Train [101][700/3239]	Time 0.233 (0.549)	Data Time 0.001 (0.056)	Loss 2.1979 (2.3705)	Entropy 0.54487 (0.54423)	Top-1 acc 71.094 (67.004)	Top-5 acc 89.844 (85.933)	lr 0.00164
Train [101][710/3239]	Time 0.237 (0.547)	Data Time 0.001 (0.055)	Loss 2.3324 (2.3694)	Entropy 0.54481 (0.54424)	Top-1 acc 67.188 (67.035)	Top-5 acc 87.109 (85.947)	lr 0.00164
Train [101][720/3239]	Time 0.230 (0.545)	Data Time 0.001 (0.055)	Loss 2.5826 (2.3702)	Entropy 0.54466 (0.54425)	Top-1 acc 64.062 (67.032)	Top-5 acc 81.250 (85.935)	lr 0.00164
Train [101][730/3239]	Time 0.406 (0.543)	Data Time 0.001 (0.054)	Loss 2.2080 (2.3698)	Entropy 0.54461 (0.54425)	Top-1 acc 71.094 (67.053)	Top-5 acc 89.453 (85.943)	lr 0.00164
Train [101][740/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.053)	Loss 2.1736 (2.3698)	Entropy 0.54476 (0.54426)	Top-1 acc 69.922 (67.047)	Top-5 acc 89.453 (85.939)	lr 0.00164
Train [101][750/3239]	Time 0.229 (0.541)	Data Time 0.001 (0.053)	Loss 2.4891 (2.3702)	Entropy 0.54450 (0.54427)	Top-1 acc 67.188 (67.048)	Top-5 acc 84.375 (85.939)	lr 0.00164
Train [101][760/3239]	Time 0.224 (0.539)	Data Time 0.001 (0.052)	Loss 2.3143 (2.3700)	Entropy 0.54469 (0.54427)	Top-1 acc 68.359 (67.052)	Top-5 acc 86.328 (85.942)	lr 0.00164
Train [101][770/3239]	Time 0.221 (0.537)	Data Time 0.001 (0.051)	Loss 2.3677 (2.3696)	Entropy 0.54451 (0.54427)	Top-1 acc 67.969 (67.072)	Top-5 acc 85.547 (85.946)	lr 0.00164
Train [101][780/3239]	Time 0.228 (0.536)	Data Time 0.001 (0.051)	Loss 2.3955 (2.3688)	Entropy 0.54424 (0.54428)	Top-1 acc 66.016 (67.088)	Top-5 acc 84.766 (85.962)	lr 0.00164
Train [101][790/3239]	Time 0.234 (0.534)	Data Time 0.001 (0.050)	Loss 2.1906 (2.3679)	Entropy 0.54434 (0.54428)	Top-1 acc 70.312 (67.107)	Top-5 acc 89.453 (85.976)	lr 0.00164
Train [101][800/3239]	Time 0.225 (0.533)	Data Time 0.001 (0.049)	Loss 2.7175 (2.3695)	Entropy 0.54431 (0.54428)	Top-1 acc 56.250 (67.059)	Top-5 acc 79.297 (85.950)	lr 0.00163
Train [101][810/3239]	Time 0.227 (0.531)	Data Time 0.001 (0.049)	Loss 2.3993 (2.3695)	Entropy 0.54463 (0.54428)	Top-1 acc 66.016 (67.041)	Top-5 acc 86.719 (85.952)	lr 0.00163
Train [101][820/3239]	Time 0.330 (0.530)	Data Time 0.002 (0.048)	Loss 2.5871 (2.3698)	Entropy 0.54463 (0.54428)	Top-1 acc 62.500 (67.035)	Top-5 acc 79.297 (85.937)	lr 0.00163
Train [101][830/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.048)	Loss 2.3590 (2.3700)	Entropy 0.54455 (0.54429)	Top-1 acc 67.578 (67.034)	Top-5 acc 85.547 (85.930)	lr 0.00163
Train [101][840/3239]	Time 0.221 (0.527)	Data Time 0.001 (0.047)	Loss 2.2609 (2.3704)	Entropy 0.54452 (0.54429)	Top-1 acc 71.875 (67.037)	Top-5 acc 87.891 (85.922)	lr 0.00163
Train [101][850/3239]	Time 0.322 (0.588)	Data Time 0.034 (0.047)	Loss 2.4422 (2.3717)	Entropy 0.54437 (0.54429)	Top-1 acc 64.453 (67.019)	Top-5 acc 83.984 (85.902)	lr 0.00163
Train [101][860/3239]	Time 0.258 (0.587)	Data Time 0.002 (0.046)	Loss 2.2259 (2.3712)	Entropy 0.54447 (0.54429)	Top-1 acc 69.531 (67.037)	Top-5 acc 90.234 (85.915)	lr 0.00163
Train [101][870/3239]	Time 0.260 (0.585)	Data Time 0.001 (0.046)	Loss 2.4234 (2.3712)	Entropy 0.54404 (0.54429)	Top-1 acc 64.062 (67.036)	Top-5 acc 87.109 (85.915)	lr 0.00163
Train [101][880/3239]	Time 0.262 (0.583)	Data Time 0.001 (0.045)	Loss 2.2555 (2.3708)	Entropy 0.54409 (0.54429)	Top-1 acc 69.922 (67.041)	Top-5 acc 87.109 (85.921)	lr 0.00163
Train [101][890/3239]	Time 0.340 (0.581)	Data Time 0.001 (0.045)	Loss 2.3022 (2.3706)	Entropy 0.54400 (0.54429)	Top-1 acc 71.094 (67.046)	Top-5 acc 87.500 (85.931)	lr 0.00163
Train [101][900/3239]	Time 0.233 (0.580)	Data Time 0.001 (0.044)	Loss 2.5529 (2.3712)	Entropy 0.54390 (0.54429)	Top-1 acc 60.938 (67.026)	Top-5 acc 84.766 (85.920)	lr 0.00163
Train [101][910/3239]	Time 0.223 (0.578)	Data Time 0.001 (0.044)	Loss 2.3220 (2.3710)	Entropy 0.54379 (0.54428)	Top-1 acc 66.406 (67.039)	Top-5 acc 87.109 (85.921)	lr 0.00163
Train [101][920/3239]	Time 0.255 (0.576)	Data Time 0.001 (0.043)	Loss 2.2996 (2.3707)	Entropy 0.54400 (0.54428)	Top-1 acc 71.875 (67.048)	Top-5 acc 86.719 (85.921)	lr 0.00163
Train [101][930/3239]	Time 0.328 (0.574)	Data Time 0.001 (0.043)	Loss 2.3588 (2.3708)	Entropy 0.54394 (0.54427)	Top-1 acc 67.578 (67.044)	Top-5 acc 85.156 (85.912)	lr 0.00163
Train [101][940/3239]	Time 0.261 (0.574)	Data Time 0.002 (0.042)	Loss 2.2639 (2.3714)	Entropy 0.54369 (0.54427)	Top-1 acc 71.094 (67.034)	Top-5 acc 87.891 (85.903)	lr 0.00163
Train [101][950/3239]	Time 0.249 (0.572)	Data Time 0.001 (0.042)	Loss 2.8931 (2.3722)	Entropy 0.54371 (0.54427)	Top-1 acc 53.516 (67.026)	Top-5 acc 76.562 (85.885)	lr 0.00163
Train [101][960/3239]	Time 0.234 (0.571)	Data Time 0.001 (0.041)	Loss 2.4861 (2.3723)	Entropy 0.54389 (0.54426)	Top-1 acc 63.281 (67.017)	Top-5 acc 83.203 (85.883)	lr 0.00163
Train [101][970/3239]	Time 0.229 (0.569)	Data Time 0.001 (0.041)	Loss 2.6007 (2.3721)	Entropy 0.54384 (0.54426)	Top-1 acc 60.938 (67.026)	Top-5 acc 80.859 (85.883)	lr 0.00163
Train [101][980/3239]	Time 0.331 (0.568)	Data Time 0.001 (0.041)	Loss 2.2631 (2.3719)	Entropy 0.54383 (0.54425)	Top-1 acc 70.312 (67.029)	Top-5 acc 87.891 (85.885)	lr 0.00163
Train [101][990/3239]	Time 0.243 (0.566)	Data Time 0.001 (0.040)	Loss 2.6535 (2.3722)	Entropy 0.54365 (0.54425)	Top-1 acc 59.375 (67.020)	Top-5 acc 82.031 (85.883)	lr 0.00163
Train [101][1000/3239]	Time 0.228 (0.565)	Data Time 0.001 (0.040)	Loss 2.2799 (2.3718)	Entropy 0.54372 (0.54424)	Top-1 acc 69.141 (67.027)	Top-5 acc 88.281 (85.897)	lr 0.00162
Train [101][1010/3239]	Time 0.231 (0.563)	Data Time 0.001 (0.039)	Loss 2.4063 (2.3722)	Entropy 0.54362 (0.54424)	Top-1 acc 64.062 (67.011)	Top-5 acc 84.766 (85.894)	lr 0.00162
Train [101][1020/3239]	Time 0.237 (0.562)	Data Time 0.001 (0.039)	Loss 2.3629 (2.3724)	Entropy 0.54336 (0.54423)	Top-1 acc 68.359 (67.004)	Top-5 acc 87.109 (85.897)	lr 0.00162
Train [101][1030/3239]	Time 0.238 (0.560)	Data Time 0.001 (0.039)	Loss 2.3301 (2.3728)	Entropy 0.54302 (0.54422)	Top-1 acc 67.188 (66.983)	Top-5 acc 86.328 (85.892)	lr 0.00162
Train [101][1040/3239]	Time 0.240 (0.559)	Data Time 0.001 (0.038)	Loss 2.4698 (2.3731)	Entropy 0.54309 (0.54421)	Top-1 acc 65.234 (66.983)	Top-5 acc 83.984 (85.889)	lr 0.00162
Train [101][1050/3239]	Time 0.321 (0.558)	Data Time 0.001 (0.038)	Loss 2.3931 (2.3728)	Entropy 0.54294 (0.54420)	Top-1 acc 66.406 (66.986)	Top-5 acc 85.547 (85.895)	lr 0.00162
Train [101][1060/3239]	Time 0.228 (0.556)	Data Time 0.001 (0.038)	Loss 2.3708 (2.3723)	Entropy 0.54268 (0.54419)	Top-1 acc 69.141 (67.006)	Top-5 acc 84.766 (85.898)	lr 0.00162
Train [101][1070/3239]	Time 0.231 (0.555)	Data Time 0.001 (0.037)	Loss 2.4677 (2.3729)	Entropy 0.54263 (0.54417)	Top-1 acc 64.453 (66.992)	Top-5 acc 84.375 (85.897)	lr 0.00162
Train [101][1080/3239]	Time 0.237 (0.554)	Data Time 0.001 (0.037)	Loss 2.2096 (2.3732)	Entropy 0.54266 (0.54416)	Top-1 acc 71.094 (66.977)	Top-5 acc 85.938 (85.884)	lr 0.00162
Train [101][1090/3239]	Time 0.224 (0.552)	Data Time 0.001 (0.037)	Loss 2.3310 (2.3727)	Entropy 0.54211 (0.54414)	Top-1 acc 66.797 (66.986)	Top-5 acc 85.156 (85.891)	lr 0.00162
Train [101][1100/3239]	Time 0.228 (0.551)	Data Time 0.001 (0.036)	Loss 2.2120 (2.3723)	Entropy 0.54240 (0.54412)	Top-1 acc 70.703 (67.001)	Top-5 acc 87.891 (85.902)	lr 0.00162
Train [101][1110/3239]	Time 0.228 (0.550)	Data Time 0.001 (0.036)	Loss 2.4019 (2.3719)	Entropy 0.54234 (0.54411)	Top-1 acc 63.672 (67.006)	Top-5 acc 85.938 (85.910)	lr 0.00162
Train [101][1120/3239]	Time 0.229 (0.549)	Data Time 0.001 (0.036)	Loss 2.4040 (2.3724)	Entropy 0.54233 (0.54409)	Top-1 acc 67.188 (66.994)	Top-5 acc 84.766 (85.901)	lr 0.00162
Train [101][1130/3239]	Time 0.240 (0.547)	Data Time 0.001 (0.035)	Loss 2.4424 (2.3722)	Entropy 0.54220 (0.54408)	Top-1 acc 66.797 (66.999)	Top-5 acc 85.156 (85.904)	lr 0.00162
Train [101][1140/3239]	Time 0.335 (0.546)	Data Time 0.001 (0.035)	Loss 2.2427 (2.3725)	Entropy 0.54228 (0.54406)	Top-1 acc 71.484 (66.978)	Top-5 acc 87.109 (85.902)	lr 0.00162
Train [101][1150/3239]	Time 0.279 (0.546)	Data Time 0.001 (0.035)	Loss 2.2627 (2.3727)	Entropy 0.54226 (0.54404)	Top-1 acc 69.141 (66.977)	Top-5 acc 85.938 (85.895)	lr 0.00162
Train [101][1160/3239]	Time 0.284 (0.546)	Data Time 0.001 (0.035)	Loss 2.3866 (2.3729)	Entropy 0.54204 (0.54403)	Top-1 acc 68.359 (66.976)	Top-5 acc 83.203 (85.889)	lr 0.00162
Train [101][1170/3239]	Time 0.256 (0.545)	Data Time 0.001 (0.034)	Loss 2.3242 (2.3729)	Entropy 0.54186 (0.54401)	Top-1 acc 67.188 (66.975)	Top-5 acc 85.156 (85.890)	lr 0.00162
Train [101][1180/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.034)	Loss 2.2614 (2.3729)	Entropy 0.54194 (0.54399)	Top-1 acc 68.750 (66.977)	Top-5 acc 88.672 (85.893)	lr 0.00162
Train [101][1190/3239]	Time 0.225 (0.543)	Data Time 0.001 (0.034)	Loss 2.3473 (2.3731)	Entropy 0.54214 (0.54398)	Top-1 acc 67.969 (66.978)	Top-5 acc 85.938 (85.892)	lr 0.00162
Train [101][1200/3239]	Time 0.231 (0.542)	Data Time 0.001 (0.033)	Loss 2.5546 (2.3734)	Entropy 0.54216 (0.54396)	Top-1 acc 58.984 (66.969)	Top-5 acc 83.594 (85.887)	lr 0.00161
Train [101][1210/3239]	Time 0.318 (0.541)	Data Time 0.001 (0.033)	Loss 2.1311 (2.3730)	Entropy 0.54209 (0.54394)	Top-1 acc 71.094 (66.975)	Top-5 acc 91.016 (85.898)	lr 0.00161
Train [101][1220/3239]	Time 0.225 (0.540)	Data Time 0.001 (0.033)	Loss 2.2725 (2.3730)	Entropy 0.54199 (0.54393)	Top-1 acc 69.531 (66.975)	Top-5 acc 87.109 (85.897)	lr 0.00161
Train [101][1230/3239]	Time 0.237 (0.539)	Data Time 0.001 (0.033)	Loss 2.4005 (2.3729)	Entropy 0.54207 (0.54391)	Top-1 acc 68.750 (66.981)	Top-5 acc 84.375 (85.901)	lr 0.00161
Train [101][1240/3239]	Time 0.234 (0.538)	Data Time 0.001 (0.032)	Loss 2.2570 (2.3730)	Entropy 0.54198 (0.54390)	Top-1 acc 69.141 (66.978)	Top-5 acc 87.500 (85.900)	lr 0.00161
Train [101][1250/3239]	Time 0.228 (0.537)	Data Time 0.001 (0.032)	Loss 2.3942 (2.3732)	Entropy 0.54244 (0.54388)	Top-1 acc 65.234 (66.968)	Top-5 acc 84.766 (85.893)	lr 0.00161
Train [101][1260/3239]	Time 0.241 (0.536)	Data Time 0.001 (0.032)	Loss 2.3578 (2.3730)	Entropy 0.54224 (0.54387)	Top-1 acc 66.406 (66.973)	Top-5 acc 85.938 (85.900)	lr 0.00161
Train [101][1270/3239]	Time 0.219 (0.535)	Data Time 0.001 (0.032)	Loss 2.2565 (2.3729)	Entropy 0.54203 (0.54386)	Top-1 acc 70.703 (66.964)	Top-5 acc 90.625 (85.904)	lr 0.00161
Train [101][1280/3239]	Time 0.327 (0.534)	Data Time 0.002 (0.032)	Loss 2.7400 (2.3738)	Entropy 0.54244 (0.54385)	Top-1 acc 54.688 (66.937)	Top-5 acc 79.297 (85.888)	lr 0.00161
Train [101][1290/3239]	Time 0.231 (0.533)	Data Time 0.001 (0.031)	Loss 2.3910 (2.3737)	Entropy 0.54265 (0.54384)	Top-1 acc 64.844 (66.936)	Top-5 acc 84.375 (85.892)	lr 0.00161
Train [101][1300/3239]	Time 0.228 (0.531)	Data Time 0.001 (0.031)	Loss 2.4299 (2.3732)	Entropy 0.54235 (0.54383)	Top-1 acc 66.797 (66.946)	Top-5 acc 86.328 (85.901)	lr 0.00161
Train [101][1310/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.031)	Loss 2.7418 (2.3732)	Entropy 0.54234 (0.54382)	Top-1 acc 58.594 (66.938)	Top-5 acc 82.031 (85.904)	lr 0.00161
Train [101][1320/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.031)	Loss 2.3484 (2.3725)	Entropy 0.54250 (0.54380)	Top-1 acc 69.531 (66.960)	Top-5 acc 86.719 (85.917)	lr 0.00161
Train [101][1330/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.030)	Loss 2.2623 (2.3726)	Entropy 0.54231 (0.54379)	Top-1 acc 69.141 (66.954)	Top-5 acc 89.453 (85.915)	lr 0.00161
Train [101][1340/3239]	Time 0.233 (0.528)	Data Time 0.001 (0.030)	Loss 2.4943 (2.3724)	Entropy 0.54202 (0.54378)	Top-1 acc 62.500 (66.958)	Top-5 acc 84.766 (85.920)	lr 0.00161
Train [101][1350/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.030)	Loss 2.3409 (2.3720)	Entropy 0.54206 (0.54377)	Top-1 acc 67.969 (66.975)	Top-5 acc 87.891 (85.930)	lr 0.00161
Train [101][1360/3239]	Time 0.223 (0.526)	Data Time 0.001 (0.030)	Loss 2.4100 (2.3720)	Entropy 0.54196 (0.54376)	Top-1 acc 66.016 (66.970)	Top-5 acc 86.719 (85.929)	lr 0.00161
Train [101][1370/3239]	Time 0.374 (0.526)	Data Time 0.001 (0.030)	Loss 2.2367 (2.3715)	Entropy 0.54202 (0.54374)	Top-1 acc 68.750 (66.977)	Top-5 acc 89.453 (85.941)	lr 0.00161
Train [101][1380/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.029)	Loss 2.4192 (2.3713)	Entropy 0.54172 (0.54373)	Top-1 acc 66.406 (66.982)	Top-5 acc 84.375 (85.943)	lr 0.00161
Train [101][1390/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.029)	Loss 2.3122 (2.3710)	Entropy 0.54207 (0.54372)	Top-1 acc 67.969 (66.986)	Top-5 acc 86.328 (85.949)	lr 0.00161
Train [101][1400/3239]	Time 0.282 (0.524)	Data Time 0.001 (0.029)	Loss 2.1380 (2.3708)	Entropy 0.54228 (0.54370)	Top-1 acc 72.656 (66.995)	Top-5 acc 91.406 (85.953)	lr 0.00160
Train [101][1410/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.029)	Loss 2.2794 (2.3708)	Entropy 0.54239 (0.54369)	Top-1 acc 68.750 (66.989)	Top-5 acc 85.547 (85.948)	lr 0.00160
Train [101][1420/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.029)	Loss 2.4394 (2.3712)	Entropy 0.54243 (0.54369)	Top-1 acc 60.156 (66.968)	Top-5 acc 84.766 (85.943)	lr 0.00160
Train [101][1430/3239]	Time 0.247 (0.522)	Data Time 0.001 (0.028)	Loss 2.5778 (2.3716)	Entropy 0.54246 (0.54368)	Top-1 acc 60.156 (66.960)	Top-5 acc 80.469 (85.933)	lr 0.00160
Train [101][1440/3239]	Time 0.340 (0.521)	Data Time 0.001 (0.028)	Loss 2.2616 (2.3715)	Entropy 0.54240 (0.54367)	Top-1 acc 69.531 (66.958)	Top-5 acc 85.938 (85.931)	lr 0.00160
Train [101][1450/3239]	Time 0.239 (0.520)	Data Time 0.001 (0.028)	Loss 2.2252 (2.3713)	Entropy 0.54247 (0.54366)	Top-1 acc 67.188 (66.961)	Top-5 acc 88.281 (85.941)	lr 0.00160
Train [101][1460/3239]	Time 0.225 (0.519)	Data Time 0.001 (0.028)	Loss 2.6027 (2.3715)	Entropy 0.54245 (0.54365)	Top-1 acc 59.766 (66.954)	Top-5 acc 81.641 (85.934)	lr 0.00160
Train [101][1470/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.028)	Loss 2.3623 (2.3712)	Entropy 0.54219 (0.54364)	Top-1 acc 65.234 (66.961)	Top-5 acc 84.766 (85.936)	lr 0.00160
Train [101][1480/3239]	Time 0.222 (0.518)	Data Time 0.001 (0.027)	Loss 2.3740 (2.3708)	Entropy 0.54196 (0.54363)	Top-1 acc 66.016 (66.970)	Top-5 acc 87.109 (85.941)	lr 0.00160
Train [101][1490/3239]	Time 0.229 (0.517)	Data Time 0.001 (0.027)	Loss 2.4086 (2.3711)	Entropy 0.54215 (0.54362)	Top-1 acc 68.359 (66.965)	Top-5 acc 85.547 (85.935)	lr 0.00160
Train [101][1500/3239]	Time 0.219 (0.516)	Data Time 0.001 (0.027)	Loss 2.4109 (2.3715)	Entropy 0.54210 (0.54361)	Top-1 acc 68.750 (66.958)	Top-5 acc 84.375 (85.932)	lr 0.00160
Train [101][1510/3239]	Time 0.278 (0.550)	Data Time 0.002 (0.027)	Loss 2.2664 (2.3715)	Entropy 0.54233 (0.54360)	Top-1 acc 68.750 (66.953)	Top-5 acc 88.672 (85.933)	lr 0.00160
Train [101][1520/3239]	Time 0.243 (0.549)	Data Time 0.002 (0.027)	Loss 2.1583 (2.3718)	Entropy 0.54218 (0.54359)	Top-1 acc 66.797 (66.940)	Top-5 acc 90.234 (85.933)	lr 0.00160
Train [101][1530/3239]	Time 0.327 (0.549)	Data Time 0.001 (0.027)	Loss 2.3427 (2.3717)	Entropy 0.54235 (0.54359)	Top-1 acc 67.188 (66.939)	Top-5 acc 83.984 (85.931)	lr 0.00160
Train [101][1540/3239]	Time 0.229 (0.548)	Data Time 0.001 (0.027)	Loss 2.3182 (2.3716)	Entropy 0.54252 (0.54358)	Top-1 acc 69.922 (66.939)	Top-5 acc 86.328 (85.928)	lr 0.00160
Train [101][1550/3239]	Time 0.237 (0.547)	Data Time 0.001 (0.026)	Loss 2.5727 (2.3717)	Entropy 0.54277 (0.54357)	Top-1 acc 62.109 (66.937)	Top-5 acc 83.984 (85.936)	lr 0.00160
Train [101][1560/3239]	Time 0.226 (0.546)	Data Time 0.001 (0.026)	Loss 2.4241 (2.3714)	Entropy 0.54306 (0.54357)	Top-1 acc 68.750 (66.947)	Top-5 acc 84.766 (85.933)	lr 0.00160
Train [101][1570/3239]	Time 0.240 (0.545)	Data Time 0.001 (0.026)	Loss 2.2969 (2.3714)	Entropy 0.54276 (0.54356)	Top-1 acc 69.141 (66.950)	Top-5 acc 89.062 (85.930)	lr 0.00160
Train [101][1580/3239]	Time 0.235 (0.545)	Data Time 0.001 (0.026)	Loss 2.3608 (2.3717)	Entropy 0.54251 (0.54356)	Top-1 acc 67.578 (66.946)	Top-5 acc 87.891 (85.928)	lr 0.00160
Train [101][1590/3239]	Time 0.244 (0.544)	Data Time 0.001 (0.026)	Loss 2.2987 (2.3718)	Entropy 0.54268 (0.54355)	Top-1 acc 66.797 (66.945)	Top-5 acc 87.891 (85.921)	lr 0.00160
Train [101][1600/3239]	Time 0.369 (0.543)	Data Time 0.001 (0.026)	Loss 2.0851 (2.3716)	Entropy 0.54252 (0.54355)	Top-1 acc 70.312 (66.941)	Top-5 acc 92.188 (85.925)	lr 0.00159
Train [101][1610/3239]	Time 0.272 (0.543)	Data Time 0.001 (0.025)	Loss 2.3168 (2.3718)	Entropy 0.54285 (0.54354)	Top-1 acc 66.797 (66.936)	Top-5 acc 85.938 (85.921)	lr 0.00159
Train [101][1620/3239]	Time 0.232 (0.542)	Data Time 0.001 (0.025)	Loss 2.3142 (2.3715)	Entropy 0.54250 (0.54354)	Top-1 acc 66.406 (66.940)	Top-5 acc 87.891 (85.931)	lr 0.00159
Train [101][1630/3239]	Time 0.234 (0.541)	Data Time 0.001 (0.025)	Loss 2.4264 (2.3713)	Entropy 0.54272 (0.54353)	Top-1 acc 63.672 (66.945)	Top-5 acc 84.766 (85.929)	lr 0.00159
Train [101][1640/3239]	Time 0.235 (0.541)	Data Time 0.001 (0.025)	Loss 2.3884 (2.3713)	Entropy 0.54306 (0.54353)	Top-1 acc 67.578 (66.947)	Top-5 acc 84.766 (85.927)	lr 0.00159
Train [101][1650/3239]	Time 0.230 (0.540)	Data Time 0.001 (0.025)	Loss 2.3525 (2.3712)	Entropy 0.54307 (0.54352)	Top-1 acc 68.359 (66.947)	Top-5 acc 84.375 (85.929)	lr 0.00159
Train [101][1660/3239]	Time 0.238 (0.539)	Data Time 0.001 (0.025)	Loss 2.3449 (2.3714)	Entropy 0.54302 (0.54352)	Top-1 acc 67.188 (66.943)	Top-5 acc 85.938 (85.926)	lr 0.00159
Train [101][1670/3239]	Time 0.244 (0.538)	Data Time 0.001 (0.025)	Loss 2.4187 (2.3716)	Entropy 0.54286 (0.54352)	Top-1 acc 66.797 (66.935)	Top-5 acc 82.812 (85.920)	lr 0.00159
Train [101][1680/3239]	Time 0.234 (0.538)	Data Time 0.001 (0.025)	Loss 2.4010 (2.3717)	Entropy 0.54270 (0.54351)	Top-1 acc 67.578 (66.932)	Top-5 acc 83.594 (85.918)	lr 0.00159
Train [101][1690/3239]	Time 0.368 (0.537)	Data Time 0.001 (0.024)	Loss 2.3502 (2.3716)	Entropy 0.54284 (0.54351)	Top-1 acc 65.625 (66.932)	Top-5 acc 88.281 (85.921)	lr 0.00159
Train [101][1700/3239]	Time 0.275 (0.537)	Data Time 0.002 (0.024)	Loss 2.4978 (2.3720)	Entropy 0.54304 (0.54351)	Top-1 acc 63.281 (66.925)	Top-5 acc 81.250 (85.911)	lr 0.00159
Train [101][1710/3239]	Time 0.235 (0.536)	Data Time 0.001 (0.024)	Loss 2.2477 (2.3718)	Entropy 0.54335 (0.54350)	Top-1 acc 67.188 (66.930)	Top-5 acc 90.234 (85.911)	lr 0.00159
Train [101][1720/3239]	Time 0.226 (0.535)	Data Time 0.001 (0.024)	Loss 2.3148 (2.3716)	Entropy 0.54337 (0.54350)	Top-1 acc 67.188 (66.932)	Top-5 acc 87.500 (85.916)	lr 0.00159
Train [101][1730/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.024)	Loss 2.3274 (2.3718)	Entropy 0.54341 (0.54350)	Top-1 acc 64.062 (66.929)	Top-5 acc 89.062 (85.913)	lr 0.00159
Train [101][1740/3239]	Time 0.228 (0.534)	Data Time 0.001 (0.024)	Loss 2.6226 (2.3719)	Entropy 0.54354 (0.54350)	Top-1 acc 60.156 (66.926)	Top-5 acc 81.641 (85.911)	lr 0.00159
Train [101][1750/3239]	Time 0.235 (0.533)	Data Time 0.001 (0.024)	Loss 2.5574 (2.3726)	Entropy 0.54370 (0.54350)	Top-1 acc 60.938 (66.909)	Top-5 acc 82.812 (85.894)	lr 0.00159
Train [101][1760/3239]	Time 0.359 (0.533)	Data Time 0.001 (0.023)	Loss 2.3942 (2.3730)	Entropy 0.54367 (0.54350)	Top-1 acc 68.359 (66.902)	Top-5 acc 83.594 (85.884)	lr 0.00159
Train [101][1770/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.023)	Loss 2.3494 (2.3734)	Entropy 0.54364 (0.54350)	Top-1 acc 67.578 (66.887)	Top-5 acc 86.328 (85.878)	lr 0.00159
Train [101][1780/3239]	Time 0.240 (0.531)	Data Time 0.001 (0.023)	Loss 2.2526 (2.3733)	Entropy 0.54355 (0.54350)	Top-1 acc 69.141 (66.889)	Top-5 acc 88.672 (85.884)	lr 0.00159
Train [101][1790/3239]	Time 0.227 (0.530)	Data Time 0.001 (0.023)	Loss 2.3989 (2.3733)	Entropy 0.54354 (0.54350)	Top-1 acc 65.625 (66.888)	Top-5 acc 84.375 (85.882)	lr 0.00159
Train [101][1800/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.023)	Loss 2.4307 (2.3735)	Entropy 0.54365 (0.54351)	Top-1 acc 65.625 (66.879)	Top-5 acc 85.547 (85.877)	lr 0.00158
Train [101][1810/3239]	Time 0.237 (0.529)	Data Time 0.002 (0.023)	Loss 2.2821 (2.3734)	Entropy 0.54380 (0.54351)	Top-1 acc 69.922 (66.887)	Top-5 acc 86.719 (85.879)	lr 0.00158
Train [101][1820/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.023)	Loss 2.3997 (2.3736)	Entropy 0.54364 (0.54351)	Top-1 acc 64.062 (66.878)	Top-5 acc 83.984 (85.873)	lr 0.00158
Train [101][1830/3239]	Time 0.264 (0.528)	Data Time 0.002 (0.023)	Loss 2.3374 (2.3739)	Entropy 0.54379 (0.54351)	Top-1 acc 67.969 (66.872)	Top-5 acc 86.328 (85.871)	lr 0.00158
Train [101][1840/3239]	Time 0.250 (0.527)	Data Time 0.001 (0.023)	Loss 2.4544 (2.3736)	Entropy 0.54366 (0.54351)	Top-1 acc 62.500 (66.875)	Top-5 acc 85.547 (85.875)	lr 0.00158
Train [101][1850/3239]	Time 0.242 (0.527)	Data Time 0.001 (0.022)	Loss 2.3393 (2.3732)	Entropy 0.54400 (0.54351)	Top-1 acc 66.016 (66.886)	Top-5 acc 86.719 (85.882)	lr 0.00158
Train [101][1860/3239]	Time 0.261 (0.526)	Data Time 0.001 (0.022)	Loss 2.6374 (2.3734)	Entropy 0.54417 (0.54352)	Top-1 acc 58.203 (66.881)	Top-5 acc 79.688 (85.876)	lr 0.00158
Train [101][1870/3239]	Time 0.286 (0.526)	Data Time 0.002 (0.022)	Loss 2.4480 (2.3736)	Entropy 0.54440 (0.54352)	Top-1 acc 67.188 (66.877)	Top-5 acc 86.328 (85.872)	lr 0.00158
Train [101][1880/3239]	Time 0.221 (0.525)	Data Time 0.001 (0.022)	Loss 2.2449 (2.3738)	Entropy 0.54455 (0.54352)	Top-1 acc 70.312 (66.873)	Top-5 acc 86.328 (85.866)	lr 0.00158
Train [101][1890/3239]	Time 0.242 (0.525)	Data Time 0.001 (0.022)	Loss 2.4893 (2.3736)	Entropy 0.54431 (0.54353)	Top-1 acc 63.672 (66.872)	Top-5 acc 82.031 (85.870)	lr 0.00158
Train [101][1900/3239]	Time 0.261 (0.524)	Data Time 0.001 (0.022)	Loss 2.4810 (2.3739)	Entropy 0.54413 (0.54353)	Top-1 acc 64.062 (66.867)	Top-5 acc 82.422 (85.864)	lr 0.00158
Train [101][1910/3239]	Time 0.233 (0.524)	Data Time 0.001 (0.022)	Loss 2.3190 (2.3739)	Entropy 0.54393 (0.54354)	Top-1 acc 67.188 (66.871)	Top-5 acc 86.328 (85.864)	lr 0.00158
Train [101][1920/3239]	Time 0.321 (0.523)	Data Time 0.001 (0.022)	Loss 2.4578 (2.3740)	Entropy 0.54425 (0.54354)	Top-1 acc 64.844 (66.869)	Top-5 acc 81.250 (85.860)	lr 0.00158
Train [101][1930/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.022)	Loss 2.4880 (2.3744)	Entropy 0.54443 (0.54354)	Top-1 acc 64.453 (66.862)	Top-5 acc 81.641 (85.851)	lr 0.00158
Train [101][1940/3239]	Time 0.253 (0.522)	Data Time 0.001 (0.021)	Loss 2.2148 (2.3743)	Entropy 0.54480 (0.54355)	Top-1 acc 70.703 (66.866)	Top-5 acc 87.891 (85.849)	lr 0.00158
Train [101][1950/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.021)	Loss 2.3299 (2.3742)	Entropy 0.54459 (0.54355)	Top-1 acc 68.750 (66.877)	Top-5 acc 88.281 (85.851)	lr 0.00158
Train [101][1960/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.021)	Loss 2.4394 (2.3741)	Entropy 0.54490 (0.54356)	Top-1 acc 66.406 (66.881)	Top-5 acc 85.938 (85.853)	lr 0.00158
Train [101][1970/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.021)	Loss 2.2430 (2.3745)	Entropy 0.54485 (0.54357)	Top-1 acc 69.141 (66.872)	Top-5 acc 87.109 (85.843)	lr 0.00158
Train [101][1980/3239]	Time 0.239 (0.520)	Data Time 0.001 (0.021)	Loss 2.3089 (2.3743)	Entropy 0.54472 (0.54357)	Top-1 acc 67.969 (66.875)	Top-5 acc 87.891 (85.846)	lr 0.00158
Train [101][1990/3239]	Time 0.328 (0.519)	Data Time 0.001 (0.021)	Loss 2.3080 (2.3745)	Entropy 0.54477 (0.54358)	Top-1 acc 66.406 (66.866)	Top-5 acc 89.062 (85.844)	lr 0.00158
Train [101][2000/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.021)	Loss 2.3963 (2.3743)	Entropy 0.54489 (0.54358)	Top-1 acc 64.844 (66.873)	Top-5 acc 85.547 (85.848)	lr 0.00158
Train [101][2010/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.021)	Loss 2.4526 (2.3743)	Entropy 0.54504 (0.54359)	Top-1 acc 66.797 (66.874)	Top-5 acc 86.328 (85.848)	lr 0.00157
Train [101][2020/3239]	Time 0.226 (0.517)	Data Time 0.001 (0.021)	Loss 2.3034 (2.3740)	Entropy 0.54515 (0.54360)	Top-1 acc 68.750 (66.883)	Top-5 acc 86.719 (85.854)	lr 0.00157
Train [101][2030/3239]	Time 0.254 (0.517)	Data Time 0.001 (0.021)	Loss 2.6374 (2.3739)	Entropy 0.54521 (0.54361)	Top-1 acc 61.328 (66.884)	Top-5 acc 83.203 (85.855)	lr 0.00157
Train [101][2040/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.020)	Loss 2.4738 (2.3740)	Entropy 0.54474 (0.54361)	Top-1 acc 64.844 (66.884)	Top-5 acc 83.594 (85.856)	lr 0.00157
Train [101][2050/3239]	Time 0.218 (0.516)	Data Time 0.001 (0.020)	Loss 2.5516 (2.3739)	Entropy 0.54477 (0.54362)	Top-1 acc 65.625 (66.882)	Top-5 acc 82.031 (85.858)	lr 0.00157
Train [101][2060/3239]	Time 0.237 (0.515)	Data Time 0.001 (0.020)	Loss 2.5253 (2.3739)	Entropy 0.54461 (0.54362)	Top-1 acc 60.156 (66.882)	Top-5 acc 81.641 (85.854)	lr 0.00157
Train [101][2070/3239]	Time 0.264 (0.514)	Data Time 0.001 (0.020)	Loss 2.1688 (2.3738)	Entropy 0.54446 (0.54363)	Top-1 acc 69.531 (66.878)	Top-5 acc 89.062 (85.855)	lr 0.00157
Train [101][2080/3239]	Time 0.319 (0.514)	Data Time 0.001 (0.020)	Loss 2.3525 (2.3737)	Entropy 0.54443 (0.54363)	Top-1 acc 64.844 (66.875)	Top-5 acc 87.500 (85.857)	lr 0.00157
Train [101][2090/3239]	Time 0.258 (0.514)	Data Time 0.001 (0.020)	Loss 2.3539 (2.3738)	Entropy 0.54447 (0.54364)	Top-1 acc 65.625 (66.872)	Top-5 acc 86.328 (85.856)	lr 0.00157
Train [101][2100/3239]	Time 0.233 (0.513)	Data Time 0.001 (0.020)	Loss 2.3214 (2.3738)	Entropy 0.54420 (0.54364)	Top-1 acc 67.969 (66.875)	Top-5 acc 88.281 (85.854)	lr 0.00157
Train [101][2110/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.020)	Loss 2.1890 (2.3736)	Entropy 0.54415 (0.54364)	Top-1 acc 67.969 (66.874)	Top-5 acc 90.234 (85.856)	lr 0.00157
Train [101][2120/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.020)	Loss 2.4337 (2.3736)	Entropy 0.54443 (0.54365)	Top-1 acc 64.453 (66.877)	Top-5 acc 82.422 (85.856)	lr 0.00157
Train [101][2130/3239]	Time 0.234 (0.512)	Data Time 0.001 (0.020)	Loss 2.1410 (2.3732)	Entropy 0.54411 (0.54365)	Top-1 acc 70.703 (66.880)	Top-5 acc 89.453 (85.864)	lr 0.00157
Train [101][2140/3239]	Time 0.226 (0.511)	Data Time 0.001 (0.020)	Loss 2.3747 (2.3733)	Entropy 0.54375 (0.54365)	Top-1 acc 69.531 (66.881)	Top-5 acc 83.984 (85.860)	lr 0.00157
Train [101][2150/3239]	Time 0.328 (0.511)	Data Time 0.001 (0.019)	Loss 2.3721 (2.3735)	Entropy 0.54368 (0.54365)	Top-1 acc 65.625 (66.876)	Top-5 acc 87.109 (85.859)	lr 0.00157
Train [101][2160/3239]	Time 0.485 (0.535)	Data Time 0.039 (0.019)	Loss 2.2551 (2.3737)	Entropy 0.54334 (0.54365)	Top-1 acc 71.484 (66.876)	Top-5 acc 87.109 (85.855)	lr 0.00157
Train [101][2170/3239]	Time 0.265 (0.534)	Data Time 0.002 (0.019)	Loss 2.5199 (2.3738)	Entropy 0.54336 (0.54365)	Top-1 acc 63.281 (66.874)	Top-5 acc 83.984 (85.852)	lr 0.00157
Train [101][2180/3239]	Time 0.239 (0.534)	Data Time 0.001 (0.019)	Loss 2.4669 (2.3739)	Entropy 0.54379 (0.54365)	Top-1 acc 64.062 (66.870)	Top-5 acc 83.984 (85.852)	lr 0.00157
Train [101][2190/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.019)	Loss 2.2828 (2.3736)	Entropy 0.54336 (0.54365)	Top-1 acc 70.312 (66.872)	Top-5 acc 89.062 (85.859)	lr 0.00157
Train [101][2200/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.019)	Loss 2.4833 (2.3739)	Entropy 0.54321 (0.54365)	Top-1 acc 64.844 (66.860)	Top-5 acc 82.812 (85.853)	lr 0.00157
Train [101][2210/3239]	Time 0.222 (0.532)	Data Time 0.001 (0.019)	Loss 2.2465 (2.3738)	Entropy 0.54308 (0.54365)	Top-1 acc 68.750 (66.859)	Top-5 acc 88.281 (85.858)	lr 0.00156
Train [101][2220/3239]	Time 0.284 (0.532)	Data Time 0.001 (0.019)	Loss 2.4018 (2.3739)	Entropy 0.54279 (0.54364)	Top-1 acc 67.188 (66.860)	Top-5 acc 83.984 (85.857)	lr 0.00156
Train [101][2230/3239]	Time 0.246 (0.531)	Data Time 0.001 (0.019)	Loss 2.4863 (2.3738)	Entropy 0.54280 (0.54364)	Top-1 acc 65.234 (66.859)	Top-5 acc 81.641 (85.856)	lr 0.00156
Train [101][2240/3239]	Time 0.326 (0.531)	Data Time 0.001 (0.019)	Loss 2.4963 (2.3738)	Entropy 0.54270 (0.54363)	Top-1 acc 61.328 (66.859)	Top-5 acc 84.375 (85.858)	lr 0.00156
Train [101][2250/3239]	Time 0.221 (0.530)	Data Time 0.001 (0.019)	Loss 2.4311 (2.3736)	Entropy 0.54284 (0.54363)	Top-1 acc 63.281 (66.863)	Top-5 acc 86.719 (85.866)	lr 0.00156
Train [101][2260/3239]	Time 0.226 (0.530)	Data Time 0.001 (0.019)	Loss 2.3623 (2.3735)	Entropy 0.54287 (0.54363)	Top-1 acc 64.453 (66.859)	Top-5 acc 87.109 (85.866)	lr 0.00156
Train [101][2270/3239]	Time 0.223 (0.529)	Data Time 0.001 (0.019)	Loss 2.5144 (2.3736)	Entropy 0.54275 (0.54362)	Top-1 acc 63.672 (66.855)	Top-5 acc 85.547 (85.867)	lr 0.00156
Train [101][2280/3239]	Time 0.230 (0.529)	Data Time 0.001 (0.018)	Loss 2.4099 (2.3735)	Entropy 0.54268 (0.54362)	Top-1 acc 64.453 (66.856)	Top-5 acc 83.984 (85.869)	lr 0.00156
Train [101][2290/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.018)	Loss 2.2215 (2.3732)	Entropy 0.54281 (0.54362)	Top-1 acc 70.312 (66.863)	Top-5 acc 87.109 (85.872)	lr 0.00156
Train [101][2300/3239]	Time 0.265 (0.528)	Data Time 0.001 (0.018)	Loss 2.2761 (2.3731)	Entropy 0.54275 (0.54361)	Top-1 acc 69.531 (66.862)	Top-5 acc 87.500 (85.872)	lr 0.00156
Train [101][2310/3239]	Time 0.344 (0.527)	Data Time 0.001 (0.018)	Loss 2.3981 (2.3730)	Entropy 0.54254 (0.54361)	Top-1 acc 70.703 (66.868)	Top-5 acc 84.375 (85.872)	lr 0.00156
Train [101][2320/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.018)	Loss 2.4431 (2.3731)	Entropy 0.54260 (0.54360)	Top-1 acc 66.406 (66.867)	Top-5 acc 84.375 (85.872)	lr 0.00156
Train [101][2330/3239]	Time 0.225 (0.526)	Data Time 0.001 (0.018)	Loss 2.4371 (2.3729)	Entropy 0.54233 (0.54360)	Top-1 acc 62.891 (66.863)	Top-5 acc 85.156 (85.877)	lr 0.00156
Train [101][2340/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.018)	Loss 2.2974 (2.3730)	Entropy 0.54222 (0.54359)	Top-1 acc 70.703 (66.860)	Top-5 acc 87.500 (85.876)	lr 0.00156
Train [101][2350/3239]	Time 0.250 (0.525)	Data Time 0.001 (0.018)	Loss 2.6409 (2.3733)	Entropy 0.54203 (0.54359)	Top-1 acc 59.375 (66.847)	Top-5 acc 81.641 (85.872)	lr 0.00156
Train [101][2360/3239]	Time 0.222 (0.525)	Data Time 0.001 (0.018)	Loss 2.1290 (2.3729)	Entropy 0.54202 (0.54358)	Top-1 acc 72.656 (66.854)	Top-5 acc 89.844 (85.878)	lr 0.00156
Train [101][2370/3239]	Time 0.232 (0.525)	Data Time 0.001 (0.018)	Loss 2.4606 (2.3728)	Entropy 0.54213 (0.54357)	Top-1 acc 66.797 (66.856)	Top-5 acc 85.156 (85.882)	lr 0.00156
Train [101][2380/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.018)	Loss 2.4302 (2.3729)	Entropy 0.54241 (0.54357)	Top-1 acc 69.141 (66.857)	Top-5 acc 83.984 (85.885)	lr 0.00156
Train [101][2390/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.018)	Loss 2.4634 (2.3730)	Entropy 0.54223 (0.54356)	Top-1 acc 62.891 (66.855)	Top-5 acc 85.156 (85.884)	lr 0.00156
Train [101][2400/3239]	Time 0.361 (0.524)	Data Time 0.002 (0.018)	Loss 2.2698 (2.3726)	Entropy 0.54210 (0.54356)	Top-1 acc 66.797 (66.865)	Top-5 acc 90.234 (85.891)	lr 0.00156
Train [101][2410/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.018)	Loss 2.2348 (2.3724)	Entropy 0.54201 (0.54355)	Top-1 acc 70.703 (66.872)	Top-5 acc 88.281 (85.894)	lr 0.00156
Train [101][2420/3239]	Time 0.222 (0.523)	Data Time 0.001 (0.018)	Loss 2.3820 (2.3723)	Entropy 0.54226 (0.54354)	Top-1 acc 65.625 (66.875)	Top-5 acc 88.281 (85.901)	lr 0.00155
Train [101][2430/3239]	Time 0.236 (0.522)	Data Time 0.001 (0.017)	Loss 2.4585 (2.3723)	Entropy 0.54227 (0.54354)	Top-1 acc 65.234 (66.875)	Top-5 acc 85.156 (85.902)	lr 0.00155
Train [101][2440/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.017)	Loss 2.4112 (2.3724)	Entropy 0.54249 (0.54353)	Top-1 acc 66.797 (66.875)	Top-5 acc 85.547 (85.902)	lr 0.00155
Train [101][2450/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.017)	Loss 2.4101 (2.3725)	Entropy 0.54279 (0.54353)	Top-1 acc 66.406 (66.875)	Top-5 acc 84.375 (85.896)	lr 0.00155
Train [101][2460/3239]	Time 0.267 (0.521)	Data Time 0.001 (0.017)	Loss 2.4854 (2.3727)	Entropy 0.54260 (0.54353)	Top-1 acc 62.109 (66.868)	Top-5 acc 82.812 (85.895)	lr 0.00155
Train [101][2470/3239]	Time 0.332 (0.521)	Data Time 0.001 (0.017)	Loss 2.2809 (2.3726)	Entropy 0.54267 (0.54352)	Top-1 acc 68.750 (66.868)	Top-5 acc 89.844 (85.896)	lr 0.00155
Train [101][2480/3239]	Time 0.223 (0.520)	Data Time 0.001 (0.017)	Loss 2.2295 (2.3725)	Entropy 0.54269 (0.54352)	Top-1 acc 69.531 (66.872)	Top-5 acc 86.328 (85.899)	lr 0.00155
Train [101][2490/3239]	Time 0.225 (0.520)	Data Time 0.005 (0.017)	Loss 2.2947 (2.3729)	Entropy 0.54285 (0.54352)	Top-1 acc 66.406 (66.860)	Top-5 acc 87.891 (85.892)	lr 0.00155
Train [101][2500/3239]	Time 0.229 (0.519)	Data Time 0.001 (0.017)	Loss 2.6054 (2.3730)	Entropy 0.54328 (0.54351)	Top-1 acc 58.594 (66.854)	Top-5 acc 83.203 (85.891)	lr 0.00155
Train [101][2510/3239]	Time 0.224 (0.519)	Data Time 0.001 (0.017)	Loss 2.4808 (2.3730)	Entropy 0.54308 (0.54351)	Top-1 acc 59.766 (66.849)	Top-5 acc 84.766 (85.891)	lr 0.00155
Train [101][2520/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.017)	Loss 2.5309 (2.3729)	Entropy 0.54312 (0.54351)	Top-1 acc 64.844 (66.855)	Top-5 acc 82.031 (85.890)	lr 0.00155
Train [101][2530/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.017)	Loss 2.5071 (2.3729)	Entropy 0.54275 (0.54351)	Top-1 acc 63.281 (66.856)	Top-5 acc 82.031 (85.888)	lr 0.00155
Train [101][2540/3239]	Time 0.328 (0.518)	Data Time 0.001 (0.017)	Loss 2.2194 (2.3727)	Entropy 0.54272 (0.54351)	Top-1 acc 69.141 (66.858)	Top-5 acc 89.844 (85.890)	lr 0.00155
Train [101][2550/3239]	Time 0.223 (0.517)	Data Time 0.001 (0.017)	Loss 2.2306 (2.3728)	Entropy 0.54248 (0.54350)	Top-1 acc 67.578 (66.856)	Top-5 acc 89.844 (85.888)	lr 0.00155
Train [101][2560/3239]	Time 0.245 (0.517)	Data Time 0.001 (0.017)	Loss 2.3297 (2.3728)	Entropy 0.54240 (0.54350)	Top-1 acc 65.625 (66.855)	Top-5 acc 87.891 (85.887)	lr 0.00155
Train [101][2570/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.017)	Loss 2.2863 (2.3727)	Entropy 0.54261 (0.54349)	Top-1 acc 67.188 (66.859)	Top-5 acc 88.281 (85.890)	lr 0.00155
Train [101][2580/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.017)	Loss 2.2180 (2.3725)	Entropy 0.54233 (0.54349)	Top-1 acc 70.312 (66.863)	Top-5 acc 89.062 (85.892)	lr 0.00155
Train [101][2590/3239]	Time 0.242 (0.516)	Data Time 0.001 (0.016)	Loss 2.4495 (2.3723)	Entropy 0.54230 (0.54349)	Top-1 acc 63.281 (66.870)	Top-5 acc 85.547 (85.896)	lr 0.00155
Train [101][2600/3239]	Time 0.285 (0.515)	Data Time 0.001 (0.016)	Loss 2.4468 (2.3728)	Entropy 0.54216 (0.54348)	Top-1 acc 62.500 (66.858)	Top-5 acc 87.109 (85.888)	lr 0.00155
Train [101][2610/3239]	Time 0.292 (0.516)	Data Time 0.001 (0.016)	Loss 2.3598 (2.3727)	Entropy 0.54222 (0.54348)	Top-1 acc 66.797 (66.857)	Top-5 acc 86.328 (85.889)	lr 0.00155
Train [101][2620/3239]	Time 0.230 (0.515)	Data Time 0.001 (0.016)	Loss 2.3916 (2.3727)	Entropy 0.54260 (0.54347)	Top-1 acc 67.188 (66.858)	Top-5 acc 84.375 (85.890)	lr 0.00154
Train [101][2630/3239]	Time 0.324 (0.515)	Data Time 0.001 (0.016)	Loss 2.5010 (2.3726)	Entropy 0.54236 (0.54347)	Top-1 acc 66.016 (66.862)	Top-5 acc 84.766 (85.893)	lr 0.00154
Train [101][2640/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.016)	Loss 2.3208 (2.3726)	Entropy 0.54234 (0.54346)	Top-1 acc 69.531 (66.863)	Top-5 acc 89.062 (85.894)	lr 0.00154
Train [101][2650/3239]	Time 0.225 (0.514)	Data Time 0.001 (0.016)	Loss 2.2478 (2.3727)	Entropy 0.54191 (0.54346)	Top-1 acc 71.484 (66.864)	Top-5 acc 87.109 (85.888)	lr 0.00154
Train [101][2660/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.016)	Loss 2.3750 (2.3727)	Entropy 0.54199 (0.54345)	Top-1 acc 67.188 (66.862)	Top-5 acc 85.938 (85.892)	lr 0.00154
Train [101][2670/3239]	Time 0.222 (0.513)	Data Time 0.001 (0.016)	Loss 2.5169 (2.3727)	Entropy 0.54208 (0.54345)	Top-1 acc 61.328 (66.861)	Top-5 acc 83.203 (85.891)	lr 0.00154
Train [101][2680/3239]	Time 0.227 (0.513)	Data Time 0.001 (0.016)	Loss 2.2992 (2.3726)	Entropy 0.54205 (0.54344)	Top-1 acc 70.703 (66.865)	Top-5 acc 87.109 (85.894)	lr 0.00154
Train [101][2690/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.016)	Loss 2.3367 (2.3724)	Entropy 0.54187 (0.54344)	Top-1 acc 70.703 (66.874)	Top-5 acc 85.156 (85.901)	lr 0.00154
Train [101][2700/3239]	Time 0.374 (0.512)	Data Time 0.001 (0.016)	Loss 2.3770 (2.3724)	Entropy 0.54174 (0.54343)	Top-1 acc 67.969 (66.868)	Top-5 acc 84.766 (85.900)	lr 0.00154
Train [101][2710/3239]	Time 0.235 (0.512)	Data Time 0.002 (0.016)	Loss 2.4065 (2.3723)	Entropy 0.54175 (0.54343)	Top-1 acc 62.500 (66.868)	Top-5 acc 86.328 (85.905)	lr 0.00154
Train [101][2720/3239]	Time 0.248 (0.512)	Data Time 0.001 (0.016)	Loss 2.2564 (2.3722)	Entropy 0.54162 (0.54342)	Top-1 acc 70.312 (66.872)	Top-5 acc 89.453 (85.906)	lr 0.00154
Train [101][2730/3239]	Time 0.232 (0.511)	Data Time 0.001 (0.016)	Loss 2.2446 (2.3722)	Entropy 0.54145 (0.54341)	Top-1 acc 72.266 (66.874)	Top-5 acc 85.938 (85.907)	lr 0.00154
Train [101][2740/3239]	Time 0.220 (0.511)	Data Time 0.001 (0.016)	Loss 2.2985 (2.3722)	Entropy 0.54129 (0.54341)	Top-1 acc 69.922 (66.877)	Top-5 acc 87.109 (85.905)	lr 0.00154
Train [101][2750/3239]	Time 0.249 (0.510)	Data Time 0.001 (0.016)	Loss 2.3568 (2.3723)	Entropy 0.54098 (0.54340)	Top-1 acc 65.625 (66.875)	Top-5 acc 85.547 (85.905)	lr 0.00154
Train [101][2760/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.016)	Loss 2.5443 (2.3722)	Entropy 0.54063 (0.54339)	Top-1 acc 64.453 (66.880)	Top-5 acc 80.469 (85.905)	lr 0.00154
Train [101][2770/3239]	Time 0.226 (0.510)	Data Time 0.001 (0.016)	Loss 2.4128 (2.3723)	Entropy 0.54053 (0.54338)	Top-1 acc 64.844 (66.879)	Top-5 acc 83.984 (85.903)	lr 0.00154
Train [101][2780/3239]	Time 0.231 (0.509)	Data Time 0.001 (0.015)	Loss 2.3975 (2.3724)	Entropy 0.54042 (0.54337)	Top-1 acc 66.016 (66.874)	Top-5 acc 84.375 (85.902)	lr 0.00154
Train [101][2790/3239]	Time 0.282 (0.509)	Data Time 0.001 (0.015)	Loss 2.2667 (2.3724)	Entropy 0.54033 (0.54336)	Top-1 acc 64.844 (66.875)	Top-5 acc 89.062 (85.902)	lr 0.00154
Train [101][2800/3239]	Time 0.226 (0.509)	Data Time 0.001 (0.015)	Loss 2.3987 (2.3725)	Entropy 0.54023 (0.54335)	Top-1 acc 66.016 (66.873)	Top-5 acc 84.375 (85.899)	lr 0.00154
Train [101][2810/3239]	Time 0.232 (0.508)	Data Time 0.001 (0.015)	Loss 2.2639 (2.3722)	Entropy 0.54034 (0.54333)	Top-1 acc 67.969 (66.878)	Top-5 acc 90.234 (85.905)	lr 0.00154
Train [101][2820/3239]	Time 0.239 (0.528)	Data Time 0.002 (0.015)	Loss 2.4591 (2.3721)	Entropy 0.54053 (0.54332)	Top-1 acc 66.406 (66.881)	Top-5 acc 83.984 (85.906)	lr 0.00154
Train [101][2830/3239]	Time 0.289 (0.528)	Data Time 0.002 (0.015)	Loss 2.4080 (2.3722)	Entropy 0.54053 (0.54331)	Top-1 acc 65.234 (66.878)	Top-5 acc 85.156 (85.902)	lr 0.00153
Train [101][2840/3239]	Time 0.308 (0.528)	Data Time 0.001 (0.015)	Loss 2.3659 (2.3720)	Entropy 0.54034 (0.54330)	Top-1 acc 65.625 (66.884)	Top-5 acc 85.938 (85.905)	lr 0.00153
Train [101][2850/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.015)	Loss 2.3300 (2.3720)	Entropy 0.54041 (0.54329)	Top-1 acc 70.312 (66.887)	Top-5 acc 86.719 (85.907)	lr 0.00153
Train [101][2860/3239]	Time 0.337 (0.527)	Data Time 0.001 (0.015)	Loss 2.2462 (2.3719)	Entropy 0.54033 (0.54328)	Top-1 acc 69.922 (66.889)	Top-5 acc 88.672 (85.909)	lr 0.00153
Train [101][2870/3239]	Time 0.260 (0.527)	Data Time 0.001 (0.015)	Loss 2.3210 (2.3717)	Entropy 0.54054 (0.54327)	Top-1 acc 66.797 (66.890)	Top-5 acc 89.453 (85.915)	lr 0.00153
Train [101][2880/3239]	Time 0.239 (0.526)	Data Time 0.001 (0.015)	Loss 2.5527 (2.3717)	Entropy 0.54048 (0.54326)	Top-1 acc 60.938 (66.888)	Top-5 acc 81.250 (85.914)	lr 0.00153
Train [101][2890/3239]	Time 0.239 (0.526)	Data Time 0.001 (0.015)	Loss 2.3302 (2.3718)	Entropy 0.54044 (0.54325)	Top-1 acc 69.922 (66.887)	Top-5 acc 85.156 (85.913)	lr 0.00153
Train [101][2900/3239]	Time 0.232 (0.525)	Data Time 0.001 (0.015)	Loss 2.3586 (2.3718)	Entropy 0.54049 (0.54324)	Top-1 acc 64.453 (66.885)	Top-5 acc 85.938 (85.912)	lr 0.00153
Train [101][2910/3239]	Time 0.229 (0.525)	Data Time 0.001 (0.015)	Loss 2.1538 (2.3717)	Entropy 0.54010 (0.54323)	Top-1 acc 73.047 (66.887)	Top-5 acc 89.844 (85.914)	lr 0.00153
Train [101][2920/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.015)	Loss 2.3665 (2.3715)	Entropy 0.53988 (0.54322)	Top-1 acc 66.406 (66.894)	Top-5 acc 84.766 (85.918)	lr 0.00153
Train [101][2930/3239]	Time 0.309 (0.524)	Data Time 0.001 (0.015)	Loss 2.3441 (2.3715)	Entropy 0.53985 (0.54321)	Top-1 acc 67.578 (66.893)	Top-5 acc 85.547 (85.919)	lr 0.00153
Train [101][2940/3239]	Time 0.299 (0.524)	Data Time 0.001 (0.015)	Loss 2.4015 (2.3716)	Entropy 0.54003 (0.54320)	Top-1 acc 63.281 (66.891)	Top-5 acc 85.938 (85.920)	lr 0.00153
Train [101][2950/3239]	Time 0.438 (0.524)	Data Time 0.002 (0.015)	Loss 2.2800 (2.3715)	Entropy 0.54019 (0.54319)	Top-1 acc 68.750 (66.892)	Top-5 acc 86.328 (85.921)	lr 0.00153
Train [101][2960/3239]	Time 0.251 (0.524)	Data Time 0.001 (0.015)	Loss 2.4624 (2.3715)	Entropy 0.54036 (0.54318)	Top-1 acc 63.672 (66.893)	Top-5 acc 85.547 (85.921)	lr 0.00153
Train [101][2970/3239]	Time 0.305 (0.523)	Data Time 0.001 (0.015)	Loss 2.2640 (2.3716)	Entropy 0.54052 (0.54317)	Top-1 acc 72.266 (66.892)	Top-5 acc 85.938 (85.921)	lr 0.00153
Train [101][2980/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.015)	Loss 2.3939 (2.3714)	Entropy 0.54034 (0.54316)	Top-1 acc 70.703 (66.900)	Top-5 acc 86.719 (85.925)	lr 0.00153
Train [101][2990/3239]	Time 0.245 (0.523)	Data Time 0.001 (0.015)	Loss 2.4519 (2.3714)	Entropy 0.54057 (0.54315)	Top-1 acc 62.500 (66.897)	Top-5 acc 84.375 (85.926)	lr 0.00153
Train [101][3000/3239]	Time 0.335 (0.523)	Data Time 0.001 (0.014)	Loss 2.3777 (2.3715)	Entropy 0.54105 (0.54315)	Top-1 acc 68.359 (66.895)	Top-5 acc 85.156 (85.924)	lr 0.00153
Train [101][3010/3239]	Time 0.384 (0.523)	Data Time 0.003 (0.014)	Loss 2.3569 (2.3716)	Entropy 0.54131 (0.54314)	Top-1 acc 66.406 (66.894)	Top-5 acc 85.156 (85.925)	lr 0.00153
Train [101][3020/3239]	Time 0.318 (0.523)	Data Time 0.001 (0.014)	Loss 2.5387 (2.3716)	Entropy 0.54124 (0.54313)	Top-1 acc 59.375 (66.891)	Top-5 acc 83.203 (85.925)	lr 0.00153
Train [101][3030/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.014)	Loss 2.4852 (2.3716)	Entropy 0.54130 (0.54313)	Top-1 acc 64.453 (66.889)	Top-5 acc 85.156 (85.925)	lr 0.00152
Train [101][3040/3239]	Time 0.238 (0.522)	Data Time 0.002 (0.014)	Loss 2.2022 (2.3714)	Entropy 0.54106 (0.54312)	Top-1 acc 70.703 (66.895)	Top-5 acc 88.281 (85.927)	lr 0.00152
Train [101][3050/3239]	Time 0.244 (0.522)	Data Time 0.001 (0.014)	Loss 2.4210 (2.3715)	Entropy 0.54093 (0.54311)	Top-1 acc 66.406 (66.891)	Top-5 acc 84.766 (85.926)	lr 0.00152
Train [101][3060/3239]	Time 0.225 (0.521)	Data Time 0.001 (0.014)	Loss 2.5268 (2.3714)	Entropy 0.54072 (0.54311)	Top-1 acc 63.672 (66.897)	Top-5 acc 84.375 (85.929)	lr 0.00152
Train [101][3070/3239]	Time 0.263 (0.521)	Data Time 0.001 (0.014)	Loss 2.3464 (2.3714)	Entropy 0.54075 (0.54310)	Top-1 acc 67.969 (66.899)	Top-5 acc 83.984 (85.930)	lr 0.00152
Train [101][3080/3239]	Time 0.244 (0.521)	Data Time 0.001 (0.014)	Loss 2.4840 (2.3714)	Entropy 0.54077 (0.54309)	Top-1 acc 65.625 (66.900)	Top-5 acc 85.547 (85.929)	lr 0.00152
Train [101][3090/3239]	Time 0.228 (0.520)	Data Time 0.001 (0.014)	Loss 2.2307 (2.3714)	Entropy 0.54084 (0.54308)	Top-1 acc 71.484 (66.902)	Top-5 acc 85.547 (85.930)	lr 0.00152
Train [101][3100/3239]	Time 0.225 (0.520)	Data Time 0.001 (0.014)	Loss 2.4190 (2.3714)	Entropy 0.54086 (0.54308)	Top-1 acc 65.234 (66.904)	Top-5 acc 84.766 (85.931)	lr 0.00152
Train [101][3110/3239]	Time 0.229 (0.520)	Data Time 0.001 (0.014)	Loss 2.4155 (2.3710)	Entropy 0.54091 (0.54307)	Top-1 acc 67.578 (66.911)	Top-5 acc 84.766 (85.937)	lr 0.00152
Train [101][3120/3239]	Time 0.264 (0.519)	Data Time 0.001 (0.014)	Loss 2.2467 (2.3711)	Entropy 0.54071 (0.54306)	Top-1 acc 68.359 (66.907)	Top-5 acc 87.109 (85.936)	lr 0.00152
Train [101][3130/3239]	Time 0.241 (0.519)	Data Time 0.001 (0.014)	Loss 2.3822 (2.3711)	Entropy 0.54059 (0.54305)	Top-1 acc 68.359 (66.907)	Top-5 acc 86.328 (85.937)	lr 0.00152
Train [101][3140/3239]	Time 0.235 (0.519)	Data Time 0.001 (0.014)	Loss 2.3383 (2.3711)	Entropy 0.54027 (0.54305)	Top-1 acc 65.625 (66.906)	Top-5 acc 86.719 (85.937)	lr 0.00152
Train [101][3150/3239]	Time 0.252 (0.518)	Data Time 0.001 (0.014)	Loss 2.2029 (2.3711)	Entropy 0.53993 (0.54304)	Top-1 acc 65.625 (66.902)	Top-5 acc 87.891 (85.936)	lr 0.00152
Train [101][3160/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.014)	Loss 2.3696 (2.3711)	Entropy 0.54001 (0.54303)	Top-1 acc 67.188 (66.899)	Top-5 acc 87.500 (85.937)	lr 0.00152
Train [101][3170/3239]	Time 0.224 (0.518)	Data Time 0.001 (0.014)	Loss 2.3282 (2.3710)	Entropy 0.54002 (0.54302)	Top-1 acc 69.922 (66.903)	Top-5 acc 87.109 (85.938)	lr 0.00152
Train [101][3180/3239]	Time 0.318 (0.517)	Data Time 0.000 (0.014)	Loss 2.4604 (2.3711)	Entropy 0.53972 (0.54301)	Top-1 acc 62.109 (66.900)	Top-5 acc 85.156 (85.934)	lr 0.00152
Train [101][3190/3239]	Time 0.237 (0.517)	Data Time 0.000 (0.014)	Loss 2.3268 (2.3710)	Entropy 0.53990 (0.54300)	Top-1 acc 68.750 (66.902)	Top-5 acc 87.891 (85.936)	lr 0.00152
Train [101][3200/3239]	Time 0.227 (0.516)	Data Time 0.000 (0.014)	Loss 2.2964 (2.3709)	Entropy 0.53986 (0.54299)	Top-1 acc 67.578 (66.903)	Top-5 acc 87.500 (85.938)	lr 0.00152
Train [101][3210/3239]	Time 0.230 (0.516)	Data Time 0.000 (0.014)	Loss 2.3020 (2.3711)	Entropy 0.53991 (0.54298)	Top-1 acc 68.359 (66.899)	Top-5 acc 89.062 (85.936)	lr 0.00152
Train [101][3220/3239]	Time 0.233 (0.516)	Data Time 0.000 (0.014)	Loss 2.4308 (2.3710)	Entropy 0.53997 (0.54297)	Top-1 acc 64.453 (66.900)	Top-5 acc 85.938 (85.939)	lr 0.00152
Train [101][3230/3239]	Time 0.219 (0.515)	Data Time 0.000 (0.014)	Loss 2.5397 (2.3710)	Entropy 0.54010 (0.54296)	Top-1 acc 60.156 (66.900)	Top-5 acc 85.156 (85.941)	lr 0.00152
Train [101][3239/3239]	Time 0.895 (0.515)	Data Time 0.000 (0.013)	Loss 2.4682 (2.3711)	Entropy 0.54026 (0.54295)	Top-1 acc 65.432 (66.897)	Top-5 acc 86.420 (85.940)	lr 0.00151
==========Valid [101/120]	loss 1.190	top-1 acc 72.644 (72.644)	top-5 acc 90.297	Train top-1 66.897	top-5 85.940	Entropy 0.54026	Latency-None: 0.000ms	Flops: 539.00M
Train [102][0/3239]	Time 38.836 (38.836)	Data Time 37.231 (37.231)	Loss 2.2925 (2.2925)	Entropy 0.54018 (0.54018)	Top-1 acc 67.188 (67.188)	Top-5 acc 87.500 (87.500)	lr 0.00151
Train [102][10/3239]	Time 0.361 (3.984)	Data Time 0.001 (3.395)	Loss 2.3582 (2.3683)	Entropy 0.54027 (0.54026)	Top-1 acc 69.531 (66.619)	Top-5 acc 85.156 (86.435)	lr 0.00151
Train [102][20/3239]	Time 0.230 (2.281)	Data Time 0.001 (1.779)	Loss 2.3640 (2.3599)	Entropy 0.54016 (0.54023)	Top-1 acc 69.141 (67.448)	Top-5 acc 87.500 (86.347)	lr 0.00151
Train [102][30/3239]	Time 0.226 (1.673)	Data Time 0.001 (1.206)	Loss 2.5581 (2.3864)	Entropy 0.54047 (0.54024)	Top-1 acc 63.281 (66.961)	Top-5 acc 82.812 (85.736)	lr 0.00151
Train [102][40/3239]	Time 0.225 (1.364)	Data Time 0.001 (0.912)	Loss 2.3793 (2.3910)	Entropy 0.54031 (0.54028)	Top-1 acc 67.578 (66.749)	Top-5 acc 85.547 (85.623)	lr 0.00151
Train [102][50/3239]	Time 0.229 (1.177)	Data Time 0.001 (0.734)	Loss 2.2532 (2.3877)	Entropy 0.54040 (0.54030)	Top-1 acc 69.922 (66.896)	Top-5 acc 89.062 (85.593)	lr 0.00151
Train [102][60/3239]	Time 0.234 (1.054)	Data Time 0.001 (0.614)	Loss 2.3128 (2.3718)	Entropy 0.54037 (0.54030)	Top-1 acc 67.578 (67.290)	Top-5 acc 88.281 (85.963)	lr 0.00151
Train [102][70/3239]	Time 0.246 (0.965)	Data Time 0.001 (0.527)	Loss 2.4073 (2.3667)	Entropy 0.54045 (0.54030)	Top-1 acc 66.016 (67.518)	Top-5 acc 85.156 (86.081)	lr 0.00151
Train [102][80/3239]	Time 0.321 (0.899)	Data Time 0.001 (0.462)	Loss 2.3643 (2.3738)	Entropy 0.54048 (0.54031)	Top-1 acc 69.922 (67.356)	Top-5 acc 85.547 (85.904)	lr 0.00151
Train [102][90/3239]	Time 0.275 (0.848)	Data Time 0.002 (0.412)	Loss 2.3683 (2.3708)	Entropy 0.54012 (0.54032)	Top-1 acc 68.359 (67.419)	Top-5 acc 84.375 (85.903)	lr 0.00151
Train [102][100/3239]	Time 0.228 (0.812)	Data Time 0.001 (0.371)	Loss 2.3439 (2.3713)	Entropy 0.54019 (0.54030)	Top-1 acc 70.703 (67.276)	Top-5 acc 85.938 (85.938)	lr 0.00151
Train [102][110/3239]	Time 0.243 (0.777)	Data Time 0.001 (0.338)	Loss 2.2195 (2.3709)	Entropy 0.54022 (0.54029)	Top-1 acc 73.438 (67.318)	Top-5 acc 88.672 (85.948)	lr 0.00151
Train [102][120/3239]	Time 0.234 (0.745)	Data Time 0.001 (0.310)	Loss 2.2959 (2.3730)	Entropy 0.54030 (0.54029)	Top-1 acc 71.094 (67.271)	Top-5 acc 85.938 (85.857)	lr 0.00151
Train [102][130/3239]	Time 0.250 (0.720)	Data Time 0.001 (0.287)	Loss 2.4768 (2.3694)	Entropy 0.54023 (0.54029)	Top-1 acc 63.672 (67.286)	Top-5 acc 83.594 (85.929)	lr 0.00151
Train [102][140/3239]	Time 0.227 (0.698)	Data Time 0.001 (0.266)	Loss 2.4491 (2.3707)	Entropy 0.54006 (0.54028)	Top-1 acc 67.578 (67.185)	Top-5 acc 83.203 (85.874)	lr 0.00151
Train [102][150/3239]	Time 0.227 (0.679)	Data Time 0.001 (0.249)	Loss 2.3408 (2.3711)	Entropy 0.54006 (0.54026)	Top-1 acc 67.969 (67.172)	Top-5 acc 85.156 (85.862)	lr 0.00151
Train [102][160/3239]	Time 0.229 (0.663)	Data Time 0.001 (0.233)	Loss 2.5446 (2.3725)	Entropy 0.53988 (0.54025)	Top-1 acc 64.062 (67.161)	Top-5 acc 83.984 (85.843)	lr 0.00151
Train [102][170/3239]	Time 0.232 (0.647)	Data Time 0.001 (0.220)	Loss 2.4004 (2.3733)	Entropy 0.54008 (0.54023)	Top-1 acc 64.062 (67.112)	Top-5 acc 85.938 (85.860)	lr 0.00151
Train [102][180/3239]	Time 0.233 (0.634)	Data Time 0.001 (0.208)	Loss 2.2679 (2.3721)	Entropy 0.54011 (0.54023)	Top-1 acc 69.922 (67.125)	Top-5 acc 88.281 (85.875)	lr 0.00151
Train [102][190/3239]	Time 0.231 (0.622)	Data Time 0.001 (0.197)	Loss 2.4754 (2.3713)	Entropy 0.53995 (0.54021)	Top-1 acc 66.797 (67.122)	Top-5 acc 83.594 (85.868)	lr 0.00151
Train [102][200/3239]	Time 0.230 (0.611)	Data Time 0.001 (0.187)	Loss 2.3772 (2.3717)	Entropy 0.54003 (0.54020)	Top-1 acc 64.453 (67.168)	Top-5 acc 85.156 (85.834)	lr 0.00151
Train [102][210/3239]	Time 0.227 (0.601)	Data Time 0.001 (0.178)	Loss 2.1736 (2.3719)	Entropy 0.54031 (0.54019)	Top-1 acc 73.438 (67.167)	Top-5 acc 87.891 (85.801)	lr 0.00150
Train [102][220/3239]	Time 0.234 (0.592)	Data Time 0.001 (0.170)	Loss 2.5587 (2.3700)	Entropy 0.54066 (0.54020)	Top-1 acc 59.375 (67.175)	Top-5 acc 85.938 (85.867)	lr 0.00150
Train [102][230/3239]	Time 0.408 (0.813)	Data Time 0.005 (0.163)	Loss 2.3519 (2.3672)	Entropy 0.54046 (0.54022)	Top-1 acc 67.188 (67.255)	Top-5 acc 85.156 (85.916)	lr 0.00150
Train [102][240/3239]	Time 0.321 (0.799)	Data Time 0.002 (0.156)	Loss 2.4656 (2.3689)	Entropy 0.54033 (0.54023)	Top-1 acc 67.188 (67.168)	Top-5 acc 83.594 (85.861)	lr 0.00150
Train [102][250/3239]	Time 0.255 (0.784)	Data Time 0.002 (0.150)	Loss 2.7316 (2.3697)	Entropy 0.54013 (0.54023)	Top-1 acc 58.203 (67.186)	Top-5 acc 79.688 (85.847)	lr 0.00150
Train [102][260/3239]	Time 0.229 (0.770)	Data Time 0.001 (0.145)	Loss 2.4041 (2.3735)	Entropy 0.54004 (0.54023)	Top-1 acc 65.234 (67.083)	Top-5 acc 87.109 (85.816)	lr 0.00150
Train [102][270/3239]	Time 0.257 (0.757)	Data Time 0.001 (0.139)	Loss 2.4040 (2.3720)	Entropy 0.54004 (0.54022)	Top-1 acc 67.969 (67.110)	Top-5 acc 82.422 (85.829)	lr 0.00150
Train [102][280/3239]	Time 0.267 (0.744)	Data Time 0.001 (0.134)	Loss 2.1560 (2.3724)	Entropy 0.54027 (0.54022)	Top-1 acc 72.266 (67.096)	Top-5 acc 88.281 (85.825)	lr 0.00150
Train [102][290/3239]	Time 0.313 (0.737)	Data Time 0.002 (0.130)	Loss 2.2742 (2.3712)	Entropy 0.54007 (0.54022)	Top-1 acc 69.922 (67.108)	Top-5 acc 86.328 (85.848)	lr 0.00150
Train [102][300/3239]	Time 0.260 (0.728)	Data Time 0.001 (0.126)	Loss 2.3018 (2.3687)	Entropy 0.54000 (0.54021)	Top-1 acc 69.531 (67.133)	Top-5 acc 86.719 (85.871)	lr 0.00150
Train [102][310/3239]	Time 0.233 (0.718)	Data Time 0.001 (0.122)	Loss 2.2857 (2.3666)	Entropy 0.53977 (0.54021)	Top-1 acc 67.578 (67.188)	Top-5 acc 87.891 (85.904)	lr 0.00150
Train [102][320/3239]	Time 0.242 (0.709)	Data Time 0.001 (0.118)	Loss 2.5291 (2.3690)	Entropy 0.53995 (0.54020)	Top-1 acc 61.328 (67.130)	Top-5 acc 80.078 (85.863)	lr 0.00150
Train [102][330/3239]	Time 0.228 (0.700)	Data Time 0.001 (0.114)	Loss 2.6666 (2.3710)	Entropy 0.54002 (0.54019)	Top-1 acc 58.203 (67.100)	Top-5 acc 82.812 (85.842)	lr 0.00150
Train [102][340/3239]	Time 0.225 (0.692)	Data Time 0.001 (0.111)	Loss 2.4604 (2.3727)	Entropy 0.54012 (0.54019)	Top-1 acc 65.625 (67.032)	Top-5 acc 85.156 (85.838)	lr 0.00150
Train [102][350/3239]	Time 0.238 (0.683)	Data Time 0.001 (0.108)	Loss 2.3822 (2.3730)	Entropy 0.54040 (0.54019)	Top-1 acc 67.578 (67.028)	Top-5 acc 85.938 (85.841)	lr 0.00150
Train [102][360/3239]	Time 0.230 (0.676)	Data Time 0.001 (0.105)	Loss 2.2888 (2.3745)	Entropy 0.54043 (0.54019)	Top-1 acc 68.750 (66.972)	Top-5 acc 85.156 (85.825)	lr 0.00150
Train [102][370/3239]	Time 0.234 (0.669)	Data Time 0.001 (0.102)	Loss 2.3815 (2.3727)	Entropy 0.54049 (0.54020)	Top-1 acc 67.969 (67.033)	Top-5 acc 87.891 (85.869)	lr 0.00150
Train [102][380/3239]	Time 0.235 (0.662)	Data Time 0.001 (0.100)	Loss 2.3484 (2.3739)	Entropy 0.54072 (0.54021)	Top-1 acc 69.922 (67.000)	Top-5 acc 85.547 (85.852)	lr 0.00150
Train [102][390/3239]	Time 0.272 (0.656)	Data Time 0.001 (0.097)	Loss 2.5796 (2.3742)	Entropy 0.54024 (0.54022)	Top-1 acc 61.328 (66.989)	Top-5 acc 81.641 (85.837)	lr 0.00150
Train [102][400/3239]	Time 0.320 (0.651)	Data Time 0.001 (0.095)	Loss 2.3367 (2.3736)	Entropy 0.54013 (0.54022)	Top-1 acc 64.844 (66.994)	Top-5 acc 89.453 (85.854)	lr 0.00150
Train [102][410/3239]	Time 0.253 (0.645)	Data Time 0.001 (0.092)	Loss 2.6579 (2.3739)	Entropy 0.54039 (0.54022)	Top-1 acc 60.156 (66.982)	Top-5 acc 79.688 (85.845)	lr 0.00150
Train [102][420/3239]	Time 0.241 (0.639)	Data Time 0.001 (0.090)	Loss 2.2265 (2.3737)	Entropy 0.54040 (0.54022)	Top-1 acc 68.750 (66.977)	Top-5 acc 88.672 (85.851)	lr 0.00149
Train [102][430/3239]	Time 0.223 (0.634)	Data Time 0.001 (0.088)	Loss 2.5484 (2.3732)	Entropy 0.54043 (0.54023)	Top-1 acc 65.625 (66.967)	Top-5 acc 81.250 (85.856)	lr 0.00149
Train [102][440/3239]	Time 0.226 (0.629)	Data Time 0.001 (0.086)	Loss 2.4268 (2.3723)	Entropy 0.54032 (0.54023)	Top-1 acc 65.625 (66.969)	Top-5 acc 87.109 (85.875)	lr 0.00149
Train [102][450/3239]	Time 0.234 (0.624)	Data Time 0.001 (0.084)	Loss 2.4114 (2.3721)	Entropy 0.54021 (0.54023)	Top-1 acc 64.844 (66.967)	Top-5 acc 84.375 (85.864)	lr 0.00149
Train [102][460/3239]	Time 0.232 (0.619)	Data Time 0.001 (0.083)	Loss 2.3432 (2.3708)	Entropy 0.54035 (0.54023)	Top-1 acc 67.188 (66.996)	Top-5 acc 88.281 (85.901)	lr 0.00149
Train [102][470/3239]	Time 0.380 (0.615)	Data Time 0.002 (0.081)	Loss 2.5161 (2.3697)	Entropy 0.54032 (0.54023)	Top-1 acc 64.062 (67.026)	Top-5 acc 80.469 (85.906)	lr 0.00149
Train [102][480/3239]	Time 0.282 (0.613)	Data Time 0.002 (0.079)	Loss 2.4117 (2.3697)	Entropy 0.54040 (0.54023)	Top-1 acc 69.141 (67.031)	Top-5 acc 85.938 (85.907)	lr 0.00149
Train [102][490/3239]	Time 0.292 (0.611)	Data Time 0.002 (0.078)	Loss 2.3754 (2.3690)	Entropy 0.54032 (0.54024)	Top-1 acc 66.016 (67.058)	Top-5 acc 84.375 (85.908)	lr 0.00149
Train [102][500/3239]	Time 0.224 (0.608)	Data Time 0.001 (0.076)	Loss 2.5399 (2.3697)	Entropy 0.54049 (0.54024)	Top-1 acc 59.766 (67.042)	Top-5 acc 84.766 (85.915)	lr 0.00149
Train [102][510/3239]	Time 0.235 (0.605)	Data Time 0.001 (0.075)	Loss 2.2696 (2.3721)	Entropy 0.54051 (0.54025)	Top-1 acc 71.484 (67.000)	Top-5 acc 87.109 (85.868)	lr 0.00149
Train [102][520/3239]	Time 0.270 (0.601)	Data Time 0.002 (0.073)	Loss 2.4940 (2.3730)	Entropy 0.54078 (0.54026)	Top-1 acc 67.578 (66.984)	Top-5 acc 85.156 (85.867)	lr 0.00149
Train [102][530/3239]	Time 0.229 (0.598)	Data Time 0.001 (0.072)	Loss 2.3442 (2.3736)	Entropy 0.54066 (0.54027)	Top-1 acc 67.969 (66.972)	Top-5 acc 87.891 (85.848)	lr 0.00149
Train [102][540/3239]	Time 0.226 (0.595)	Data Time 0.001 (0.071)	Loss 2.3882 (2.3735)	Entropy 0.54048 (0.54027)	Top-1 acc 65.625 (66.968)	Top-5 acc 87.500 (85.847)	lr 0.00149
Train [102][550/3239]	Time 0.228 (0.591)	Data Time 0.001 (0.069)	Loss 2.2775 (2.3725)	Entropy 0.54033 (0.54027)	Top-1 acc 68.750 (66.977)	Top-5 acc 86.719 (85.860)	lr 0.00149
Train [102][560/3239]	Time 0.324 (0.588)	Data Time 0.001 (0.068)	Loss 2.2261 (2.3719)	Entropy 0.54057 (0.54028)	Top-1 acc 73.828 (67.009)	Top-5 acc 88.281 (85.864)	lr 0.00149
Train [102][570/3239]	Time 0.225 (0.585)	Data Time 0.001 (0.067)	Loss 2.1743 (2.3716)	Entropy 0.54046 (0.54028)	Top-1 acc 71.094 (67.013)	Top-5 acc 87.500 (85.868)	lr 0.00149
Train [102][580/3239]	Time 0.231 (0.581)	Data Time 0.001 (0.066)	Loss 2.4282 (2.3726)	Entropy 0.54077 (0.54029)	Top-1 acc 67.969 (66.988)	Top-5 acc 84.766 (85.853)	lr 0.00149
Train [102][590/3239]	Time 0.237 (0.579)	Data Time 0.001 (0.065)	Loss 2.3316 (2.3726)	Entropy 0.54061 (0.54030)	Top-1 acc 67.969 (66.978)	Top-5 acc 85.547 (85.846)	lr 0.00149
Train [102][600/3239]	Time 0.220 (0.576)	Data Time 0.001 (0.064)	Loss 2.3815 (2.3720)	Entropy 0.54055 (0.54030)	Top-1 acc 65.234 (66.993)	Top-5 acc 85.156 (85.862)	lr 0.00149
Train [102][610/3239]	Time 0.226 (0.573)	Data Time 0.001 (0.063)	Loss 2.3207 (2.3707)	Entropy 0.54040 (0.54030)	Top-1 acc 66.406 (67.021)	Top-5 acc 86.328 (85.890)	lr 0.00149
Train [102][620/3239]	Time 0.246 (0.570)	Data Time 0.001 (0.062)	Loss 2.5581 (2.3717)	Entropy 0.54048 (0.54030)	Top-1 acc 64.062 (66.993)	Top-5 acc 80.859 (85.870)	lr 0.00149
Train [102][630/3239]	Time 0.322 (0.568)	Data Time 0.001 (0.061)	Loss 2.4447 (2.3709)	Entropy 0.54056 (0.54031)	Top-1 acc 62.891 (67.016)	Top-5 acc 83.203 (85.881)	lr 0.00148
Train [102][640/3239]	Time 0.225 (0.565)	Data Time 0.001 (0.060)	Loss 2.2450 (2.3704)	Entropy 0.54040 (0.54031)	Top-1 acc 71.484 (67.022)	Top-5 acc 86.719 (85.885)	lr 0.00148
Train [102][650/3239]	Time 0.227 (0.563)	Data Time 0.001 (0.059)	Loss 2.5106 (2.3697)	Entropy 0.54063 (0.54031)	Top-1 acc 62.109 (67.047)	Top-5 acc 85.156 (85.909)	lr 0.00148
Train [102][660/3239]	Time 0.221 (0.560)	Data Time 0.001 (0.058)	Loss 2.4354 (2.3702)	Entropy 0.54094 (0.54032)	Top-1 acc 62.891 (67.031)	Top-5 acc 83.984 (85.894)	lr 0.00148
Train [102][670/3239]	Time 0.239 (0.558)	Data Time 0.001 (0.057)	Loss 2.2313 (2.3700)	Entropy 0.54113 (0.54033)	Top-1 acc 73.047 (67.040)	Top-5 acc 87.109 (85.896)	lr 0.00148
Train [102][680/3239]	Time 0.235 (0.556)	Data Time 0.001 (0.056)	Loss 2.3962 (2.3692)	Entropy 0.54110 (0.54034)	Top-1 acc 62.109 (67.050)	Top-5 acc 83.984 (85.911)	lr 0.00148
Train [102][690/3239]	Time 0.234 (0.554)	Data Time 0.001 (0.056)	Loss 2.3381 (2.3686)	Entropy 0.54098 (0.54035)	Top-1 acc 67.188 (67.065)	Top-5 acc 87.109 (85.919)	lr 0.00148
Train [102][700/3239]	Time 0.260 (0.552)	Data Time 0.001 (0.055)	Loss 2.6382 (2.3698)	Entropy 0.54121 (0.54036)	Top-1 acc 60.547 (67.038)	Top-5 acc 82.812 (85.904)	lr 0.00148
Train [102][710/3239]	Time 0.232 (0.550)	Data Time 0.001 (0.054)	Loss 2.3530 (2.3694)	Entropy 0.54121 (0.54037)	Top-1 acc 69.141 (67.061)	Top-5 acc 86.719 (85.916)	lr 0.00148
Train [102][720/3239]	Time 0.379 (0.548)	Data Time 0.002 (0.053)	Loss 2.2256 (2.3684)	Entropy 0.54143 (0.54039)	Top-1 acc 71.875 (67.087)	Top-5 acc 87.891 (85.933)	lr 0.00148
Train [102][730/3239]	Time 0.224 (0.547)	Data Time 0.001 (0.053)	Loss 2.3725 (2.3686)	Entropy 0.54173 (0.54040)	Top-1 acc 66.406 (67.072)	Top-5 acc 85.547 (85.931)	lr 0.00148
Train [102][740/3239]	Time 0.236 (0.545)	Data Time 0.001 (0.052)	Loss 2.2368 (2.3681)	Entropy 0.54156 (0.54042)	Top-1 acc 71.875 (67.075)	Top-5 acc 89.453 (85.951)	lr 0.00148
Train [102][750/3239]	Time 0.227 (0.544)	Data Time 0.001 (0.051)	Loss 2.3892 (2.3683)	Entropy 0.54141 (0.54043)	Top-1 acc 66.406 (67.062)	Top-5 acc 85.156 (85.955)	lr 0.00148
Train [102][760/3239]	Time 0.221 (0.542)	Data Time 0.001 (0.051)	Loss 2.6906 (2.3689)	Entropy 0.54136 (0.54045)	Top-1 acc 56.641 (67.058)	Top-5 acc 78.516 (85.943)	lr 0.00148
Train [102][770/3239]	Time 0.218 (0.540)	Data Time 0.001 (0.050)	Loss 2.3479 (2.3685)	Entropy 0.54137 (0.54046)	Top-1 acc 70.312 (67.062)	Top-5 acc 86.328 (85.949)	lr 0.00148
Train [102][780/3239]	Time 0.231 (0.538)	Data Time 0.001 (0.049)	Loss 2.4013 (2.3695)	Entropy 0.54130 (0.54047)	Top-1 acc 64.844 (67.033)	Top-5 acc 86.719 (85.933)	lr 0.00148
Train [102][790/3239]	Time 0.319 (0.537)	Data Time 0.001 (0.049)	Loss 2.3390 (2.3704)	Entropy 0.54129 (0.54048)	Top-1 acc 63.281 (67.006)	Top-5 acc 87.891 (85.923)	lr 0.00148
Train [102][800/3239]	Time 0.223 (0.535)	Data Time 0.001 (0.048)	Loss 2.3958 (2.3701)	Entropy 0.54102 (0.54049)	Top-1 acc 65.625 (66.996)	Top-5 acc 85.156 (85.926)	lr 0.00148
Train [102][810/3239]	Time 0.218 (0.533)	Data Time 0.001 (0.048)	Loss 2.7871 (2.3711)	Entropy 0.54093 (0.54050)	Top-1 acc 57.812 (66.990)	Top-5 acc 78.906 (85.907)	lr 0.00148
Train [102][820/3239]	Time 0.226 (0.532)	Data Time 0.001 (0.047)	Loss 2.4307 (2.3708)	Entropy 0.54073 (0.54050)	Top-1 acc 66.406 (67.010)	Top-5 acc 82.812 (85.910)	lr 0.00148
Train [102][830/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.046)	Loss 2.5183 (2.3717)	Entropy 0.54086 (0.54050)	Top-1 acc 64.844 (66.999)	Top-5 acc 83.203 (85.892)	lr 0.00148
Train [102][840/3239]	Time 0.228 (0.529)	Data Time 0.001 (0.046)	Loss 2.5937 (2.3722)	Entropy 0.54089 (0.54051)	Top-1 acc 61.328 (66.987)	Top-5 acc 80.859 (85.884)	lr 0.00147
Train [102][850/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.045)	Loss 2.4140 (2.3726)	Entropy 0.54107 (0.54051)	Top-1 acc 66.406 (66.973)	Top-5 acc 84.766 (85.878)	lr 0.00147
Train [102][860/3239]	Time 0.322 (0.526)	Data Time 0.001 (0.045)	Loss 2.3760 (2.3730)	Entropy 0.54099 (0.54052)	Top-1 acc 64.453 (66.957)	Top-5 acc 84.375 (85.869)	lr 0.00147
Train [102][870/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.044)	Loss 2.5843 (2.3731)	Entropy 0.54065 (0.54052)	Top-1 acc 60.156 (66.953)	Top-5 acc 82.812 (85.869)	lr 0.00147
Train [102][880/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.044)	Loss 2.4305 (2.3727)	Entropy 0.54080 (0.54053)	Top-1 acc 66.016 (66.967)	Top-5 acc 84.375 (85.877)	lr 0.00147
Train [102][890/3239]	Time 0.269 (0.583)	Data Time 0.002 (0.043)	Loss 2.3708 (2.3727)	Entropy 0.54069 (0.54053)	Top-1 acc 68.359 (66.971)	Top-5 acc 83.594 (85.876)	lr 0.00147
Train [102][900/3239]	Time 0.299 (0.581)	Data Time 0.002 (0.043)	Loss 2.6103 (2.3726)	Entropy 0.54047 (0.54053)	Top-1 acc 58.594 (66.968)	Top-5 acc 82.031 (85.879)	lr 0.00147
Train [102][910/3239]	Time 0.232 (0.581)	Data Time 0.001 (0.043)	Loss 2.2390 (2.3726)	Entropy 0.54023 (0.54053)	Top-1 acc 74.609 (66.971)	Top-5 acc 86.719 (85.875)	lr 0.00147
Train [102][920/3239]	Time 0.225 (0.579)	Data Time 0.001 (0.042)	Loss 2.5884 (2.3731)	Entropy 0.54018 (0.54052)	Top-1 acc 60.547 (66.964)	Top-5 acc 82.422 (85.873)	lr 0.00147
Train [102][930/3239]	Time 0.236 (0.577)	Data Time 0.001 (0.042)	Loss 2.2980 (2.3726)	Entropy 0.54033 (0.54052)	Top-1 acc 69.141 (66.981)	Top-5 acc 87.109 (85.880)	lr 0.00147
Train [102][940/3239]	Time 0.236 (0.576)	Data Time 0.001 (0.041)	Loss 2.1015 (2.3722)	Entropy 0.54038 (0.54052)	Top-1 acc 73.438 (66.982)	Top-5 acc 89.844 (85.887)	lr 0.00147
Train [102][950/3239]	Time 0.364 (0.574)	Data Time 0.001 (0.041)	Loss 2.2725 (2.3722)	Entropy 0.54042 (0.54052)	Top-1 acc 68.750 (66.985)	Top-5 acc 87.109 (85.889)	lr 0.00147
Train [102][960/3239]	Time 0.239 (0.573)	Data Time 0.001 (0.040)	Loss 2.3325 (2.3722)	Entropy 0.54033 (0.54052)	Top-1 acc 67.188 (66.992)	Top-5 acc 86.719 (85.885)	lr 0.00147
Train [102][970/3239]	Time 0.226 (0.571)	Data Time 0.001 (0.040)	Loss 2.4066 (2.3722)	Entropy 0.54043 (0.54052)	Top-1 acc 65.234 (66.998)	Top-5 acc 85.156 (85.887)	lr 0.00147
Train [102][980/3239]	Time 0.228 (0.569)	Data Time 0.001 (0.040)	Loss 2.3247 (2.3727)	Entropy 0.54040 (0.54051)	Top-1 acc 66.797 (66.980)	Top-5 acc 87.500 (85.880)	lr 0.00147
Train [102][990/3239]	Time 0.226 (0.568)	Data Time 0.001 (0.039)	Loss 2.1804 (2.3726)	Entropy 0.54058 (0.54051)	Top-1 acc 70.703 (66.979)	Top-5 acc 89.062 (85.886)	lr 0.00147
Train [102][1000/3239]	Time 0.228 (0.566)	Data Time 0.001 (0.039)	Loss 2.4360 (2.3725)	Entropy 0.54058 (0.54051)	Top-1 acc 67.578 (66.988)	Top-5 acc 85.156 (85.889)	lr 0.00147
Train [102][1010/3239]	Time 0.233 (0.565)	Data Time 0.001 (0.039)	Loss 2.3018 (2.3726)	Entropy 0.54049 (0.54051)	Top-1 acc 69.141 (67.000)	Top-5 acc 88.281 (85.888)	lr 0.00147
Train [102][1020/3239]	Time 0.359 (0.563)	Data Time 0.001 (0.038)	Loss 2.5392 (2.3734)	Entropy 0.54000 (0.54051)	Top-1 acc 62.891 (66.970)	Top-5 acc 85.156 (85.876)	lr 0.00147
Train [102][1030/3239]	Time 0.245 (0.562)	Data Time 0.001 (0.038)	Loss 2.2565 (2.3732)	Entropy 0.53987 (0.54051)	Top-1 acc 70.312 (66.975)	Top-5 acc 88.281 (85.881)	lr 0.00147
Train [102][1040/3239]	Time 0.233 (0.560)	Data Time 0.001 (0.037)	Loss 2.5000 (2.3735)	Entropy 0.53961 (0.54050)	Top-1 acc 63.672 (66.974)	Top-5 acc 85.547 (85.879)	lr 0.00147
Train [102][1050/3239]	Time 0.268 (0.559)	Data Time 0.001 (0.037)	Loss 2.3715 (2.3739)	Entropy 0.53966 (0.54049)	Top-1 acc 69.141 (66.975)	Top-5 acc 87.109 (85.863)	lr 0.00146
Train [102][1060/3239]	Time 0.235 (0.558)	Data Time 0.001 (0.037)	Loss 2.3486 (2.3736)	Entropy 0.53948 (0.54048)	Top-1 acc 70.312 (66.988)	Top-5 acc 86.719 (85.866)	lr 0.00146
Train [102][1070/3239]	Time 0.230 (0.557)	Data Time 0.001 (0.036)	Loss 2.4214 (2.3735)	Entropy 0.53945 (0.54047)	Top-1 acc 62.500 (66.992)	Top-5 acc 87.109 (85.865)	lr 0.00146
Train [102][1080/3239]	Time 0.239 (0.555)	Data Time 0.001 (0.036)	Loss 2.4202 (2.3736)	Entropy 0.53978 (0.54046)	Top-1 acc 64.062 (66.992)	Top-5 acc 85.547 (85.859)	lr 0.00146
Train [102][1090/3239]	Time 0.247 (0.554)	Data Time 0.001 (0.036)	Loss 2.3338 (2.3741)	Entropy 0.54027 (0.54046)	Top-1 acc 68.359 (66.974)	Top-5 acc 87.891 (85.854)	lr 0.00146
Train [102][1100/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.036)	Loss 2.1917 (2.3745)	Entropy 0.54015 (0.54045)	Top-1 acc 70.312 (66.965)	Top-5 acc 89.844 (85.842)	lr 0.00146
Train [102][1110/3239]	Time 0.351 (0.552)	Data Time 0.001 (0.035)	Loss 2.2322 (2.3744)	Entropy 0.53988 (0.54045)	Top-1 acc 66.797 (66.973)	Top-5 acc 88.672 (85.848)	lr 0.00146
Train [102][1120/3239]	Time 0.235 (0.551)	Data Time 0.001 (0.035)	Loss 2.4433 (2.3745)	Entropy 0.54000 (0.54045)	Top-1 acc 62.500 (66.966)	Top-5 acc 83.984 (85.845)	lr 0.00146
Train [102][1130/3239]	Time 0.236 (0.549)	Data Time 0.001 (0.035)	Loss 2.4077 (2.3748)	Entropy 0.54005 (0.54044)	Top-1 acc 67.578 (66.954)	Top-5 acc 86.719 (85.842)	lr 0.00146
Train [102][1140/3239]	Time 0.230 (0.548)	Data Time 0.001 (0.034)	Loss 2.3744 (2.3747)	Entropy 0.54020 (0.54044)	Top-1 acc 66.797 (66.950)	Top-5 acc 85.547 (85.848)	lr 0.00146
Train [102][1150/3239]	Time 0.228 (0.547)	Data Time 0.001 (0.034)	Loss 2.4111 (2.3749)	Entropy 0.54022 (0.54044)	Top-1 acc 67.969 (66.946)	Top-5 acc 85.156 (85.840)	lr 0.00146
Train [102][1160/3239]	Time 0.246 (0.546)	Data Time 0.001 (0.034)	Loss 2.5395 (2.3745)	Entropy 0.54013 (0.54044)	Top-1 acc 61.328 (66.954)	Top-5 acc 83.203 (85.850)	lr 0.00146
Train [102][1170/3239]	Time 0.229 (0.545)	Data Time 0.001 (0.033)	Loss 2.5263 (2.3744)	Entropy 0.53989 (0.54043)	Top-1 acc 62.500 (66.959)	Top-5 acc 82.812 (85.853)	lr 0.00146
Train [102][1180/3239]	Time 0.426 (0.544)	Data Time 0.001 (0.033)	Loss 2.5692 (2.3739)	Entropy 0.53978 (0.54043)	Top-1 acc 63.281 (66.971)	Top-5 acc 84.375 (85.860)	lr 0.00146
Train [102][1190/3239]	Time 0.275 (0.543)	Data Time 0.001 (0.033)	Loss 2.2714 (2.3741)	Entropy 0.53993 (0.54042)	Top-1 acc 70.703 (66.970)	Top-5 acc 87.891 (85.860)	lr 0.00146
Train [102][1200/3239]	Time 0.229 (0.541)	Data Time 0.001 (0.033)	Loss 2.2588 (2.3738)	Entropy 0.53993 (0.54042)	Top-1 acc 70.312 (66.984)	Top-5 acc 87.500 (85.866)	lr 0.00146
Train [102][1210/3239]	Time 0.249 (0.541)	Data Time 0.001 (0.032)	Loss 2.6158 (2.3737)	Entropy 0.54017 (0.54041)	Top-1 acc 62.500 (66.990)	Top-5 acc 81.641 (85.868)	lr 0.00146
Train [102][1220/3239]	Time 0.234 (0.540)	Data Time 0.001 (0.032)	Loss 2.4438 (2.3735)	Entropy 0.53999 (0.54041)	Top-1 acc 64.453 (66.991)	Top-5 acc 83.594 (85.868)	lr 0.00146
Train [102][1230/3239]	Time 0.236 (0.539)	Data Time 0.001 (0.032)	Loss 2.4294 (2.3738)	Entropy 0.54015 (0.54041)	Top-1 acc 67.188 (66.982)	Top-5 acc 84.375 (85.867)	lr 0.00146
Train [102][1240/3239]	Time 0.238 (0.538)	Data Time 0.001 (0.032)	Loss 2.3444 (2.3737)	Entropy 0.54029 (0.54040)	Top-1 acc 70.312 (66.980)	Top-5 acc 86.328 (85.869)	lr 0.00146
Train [102][1250/3239]	Time 0.233 (0.537)	Data Time 0.001 (0.031)	Loss 2.1420 (2.3739)	Entropy 0.54019 (0.54040)	Top-1 acc 73.047 (66.980)	Top-5 acc 91.016 (85.868)	lr 0.00146
Train [102][1260/3239]	Time 0.219 (0.536)	Data Time 0.001 (0.031)	Loss 2.4317 (2.3741)	Entropy 0.53998 (0.54040)	Top-1 acc 62.891 (66.972)	Top-5 acc 85.547 (85.867)	lr 0.00145
Train [102][1270/3239]	Time 0.318 (0.535)	Data Time 0.001 (0.031)	Loss 2.3914 (2.3744)	Entropy 0.54019 (0.54040)	Top-1 acc 67.188 (66.959)	Top-5 acc 84.766 (85.859)	lr 0.00145
Train [102][1280/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.031)	Loss 2.4312 (2.3751)	Entropy 0.54009 (0.54040)	Top-1 acc 64.453 (66.937)	Top-5 acc 85.156 (85.847)	lr 0.00145
Train [102][1290/3239]	Time 0.239 (0.533)	Data Time 0.001 (0.031)	Loss 2.3112 (2.3746)	Entropy 0.53988 (0.54039)	Top-1 acc 65.625 (66.948)	Top-5 acc 85.938 (85.853)	lr 0.00145
Train [102][1300/3239]	Time 0.243 (0.532)	Data Time 0.001 (0.030)	Loss 2.4353 (2.3748)	Entropy 0.53998 (0.54039)	Top-1 acc 64.453 (66.940)	Top-5 acc 86.328 (85.856)	lr 0.00145
Train [102][1310/3239]	Time 0.238 (0.531)	Data Time 0.001 (0.030)	Loss 2.3158 (2.3747)	Entropy 0.54022 (0.54039)	Top-1 acc 69.922 (66.947)	Top-5 acc 88.281 (85.863)	lr 0.00145
Train [102][1320/3239]	Time 0.254 (0.530)	Data Time 0.001 (0.030)	Loss 2.3015 (2.3746)	Entropy 0.53999 (0.54038)	Top-1 acc 65.625 (66.940)	Top-5 acc 88.281 (85.868)	lr 0.00145
Train [102][1330/3239]	Time 0.236 (0.529)	Data Time 0.001 (0.030)	Loss 2.2977 (2.3747)	Entropy 0.53998 (0.54038)	Top-1 acc 71.875 (66.943)	Top-5 acc 86.719 (85.867)	lr 0.00145
Train [102][1340/3239]	Time 0.321 (0.528)	Data Time 0.001 (0.029)	Loss 2.3468 (2.3745)	Entropy 0.53978 (0.54038)	Top-1 acc 66.016 (66.948)	Top-5 acc 86.719 (85.874)	lr 0.00145
Train [102][1350/3239]	Time 0.229 (0.527)	Data Time 0.001 (0.029)	Loss 2.4345 (2.3748)	Entropy 0.53977 (0.54037)	Top-1 acc 66.797 (66.939)	Top-5 acc 83.594 (85.865)	lr 0.00145
Train [102][1360/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.029)	Loss 2.3361 (2.3746)	Entropy 0.53970 (0.54037)	Top-1 acc 68.750 (66.935)	Top-5 acc 87.109 (85.869)	lr 0.00145
Train [102][1370/3239]	Time 0.224 (0.526)	Data Time 0.001 (0.029)	Loss 2.4358 (2.3748)	Entropy 0.53961 (0.54036)	Top-1 acc 67.969 (66.927)	Top-5 acc 83.594 (85.863)	lr 0.00145
Train [102][1380/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.029)	Loss 2.4413 (2.3754)	Entropy 0.53965 (0.54036)	Top-1 acc 63.281 (66.911)	Top-5 acc 85.156 (85.851)	lr 0.00145
Train [102][1390/3239]	Time 0.225 (0.524)	Data Time 0.001 (0.028)	Loss 2.2653 (2.3748)	Entropy 0.53966 (0.54035)	Top-1 acc 67.188 (66.914)	Top-5 acc 89.453 (85.861)	lr 0.00145
Train [102][1400/3239]	Time 0.220 (0.523)	Data Time 0.001 (0.028)	Loss 2.3858 (2.3752)	Entropy 0.53970 (0.54035)	Top-1 acc 68.359 (66.910)	Top-5 acc 83.984 (85.853)	lr 0.00145
Train [102][1410/3239]	Time 0.222 (0.523)	Data Time 0.001 (0.028)	Loss 2.6467 (2.3754)	Entropy 0.53959 (0.54034)	Top-1 acc 59.375 (66.906)	Top-5 acc 78.906 (85.845)	lr 0.00145
Train [102][1420/3239]	Time 0.216 (0.522)	Data Time 0.001 (0.028)	Loss 2.3545 (2.3750)	Entropy 0.53955 (0.54034)	Top-1 acc 67.969 (66.914)	Top-5 acc 85.156 (85.851)	lr 0.00145
Train [102][1430/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.028)	Loss 2.4687 (2.3751)	Entropy 0.53992 (0.54033)	Top-1 acc 65.234 (66.910)	Top-5 acc 84.375 (85.852)	lr 0.00145
Train [102][1440/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.028)	Loss 2.3470 (2.3750)	Entropy 0.54004 (0.54033)	Top-1 acc 70.312 (66.913)	Top-5 acc 84.766 (85.859)	lr 0.00145
Train [102][1450/3239]	Time 0.232 (0.519)	Data Time 0.001 (0.027)	Loss 2.2361 (2.3748)	Entropy 0.53973 (0.54033)	Top-1 acc 69.922 (66.919)	Top-5 acc 89.062 (85.868)	lr 0.00145
Train [102][1460/3239]	Time 0.220 (0.518)	Data Time 0.001 (0.027)	Loss 2.9445 (2.3749)	Entropy 0.53974 (0.54032)	Top-1 acc 51.953 (66.917)	Top-5 acc 76.953 (85.870)	lr 0.00145
Train [102][1470/3239]	Time 0.228 (0.517)	Data Time 0.001 (0.027)	Loss 2.2913 (2.3750)	Entropy 0.53961 (0.54032)	Top-1 acc 71.094 (66.913)	Top-5 acc 89.062 (85.867)	lr 0.00144
Train [102][1480/3239]	Time 0.232 (0.517)	Data Time 0.001 (0.027)	Loss 2.4687 (2.3752)	Entropy 0.53971 (0.54032)	Top-1 acc 64.453 (66.907)	Top-5 acc 85.156 (85.863)	lr 0.00144
Train [102][1490/3239]	Time 0.228 (0.516)	Data Time 0.002 (0.027)	Loss 2.3897 (2.3757)	Entropy 0.53956 (0.54031)	Top-1 acc 66.797 (66.894)	Top-5 acc 85.938 (85.855)	lr 0.00144
Train [102][1500/3239]	Time 0.323 (0.515)	Data Time 0.001 (0.027)	Loss 2.4986 (2.3757)	Entropy 0.53941 (0.54031)	Top-1 acc 62.500 (66.892)	Top-5 acc 82.422 (85.855)	lr 0.00144
Train [102][1510/3239]	Time 0.275 (0.515)	Data Time 0.001 (0.026)	Loss 2.3171 (2.3758)	Entropy 0.53971 (0.54030)	Top-1 acc 68.750 (66.885)	Top-5 acc 85.156 (85.854)	lr 0.00144
Train [102][1520/3239]	Time 0.224 (0.514)	Data Time 0.001 (0.026)	Loss 2.1875 (2.3756)	Entropy 0.53994 (0.54030)	Top-1 acc 75.391 (66.888)	Top-5 acc 86.719 (85.856)	lr 0.00144
Train [102][1530/3239]	Time 0.258 (0.514)	Data Time 0.001 (0.026)	Loss 2.2482 (2.3754)	Entropy 0.54019 (0.54030)	Top-1 acc 67.578 (66.889)	Top-5 acc 88.672 (85.858)	lr 0.00144
Train [102][1540/3239]	Time 0.441 (0.547)	Data Time 0.005 (0.026)	Loss 2.5567 (2.3755)	Entropy 0.54023 (0.54029)	Top-1 acc 64.453 (66.886)	Top-5 acc 80.859 (85.855)	lr 0.00144
Train [102][1550/3239]	Time 0.235 (0.546)	Data Time 0.002 (0.026)	Loss 2.2153 (2.3755)	Entropy 0.54048 (0.54029)	Top-1 acc 70.312 (66.891)	Top-5 acc 87.891 (85.856)	lr 0.00144
Train [102][1560/3239]	Time 0.238 (0.546)	Data Time 0.002 (0.026)	Loss 2.2458 (2.3755)	Entropy 0.54057 (0.54030)	Top-1 acc 70.312 (66.889)	Top-5 acc 88.672 (85.859)	lr 0.00144
Train [102][1570/3239]	Time 0.230 (0.545)	Data Time 0.001 (0.025)	Loss 2.3797 (2.3754)	Entropy 0.54070 (0.54030)	Top-1 acc 64.844 (66.896)	Top-5 acc 86.719 (85.862)	lr 0.00144
Train [102][1580/3239]	Time 0.235 (0.544)	Data Time 0.001 (0.025)	Loss 2.2785 (2.3756)	Entropy 0.54032 (0.54030)	Top-1 acc 69.141 (66.889)	Top-5 acc 89.062 (85.856)	lr 0.00144
Train [102][1590/3239]	Time 0.288 (0.543)	Data Time 0.001 (0.025)	Loss 2.3145 (2.3757)	Entropy 0.54046 (0.54030)	Top-1 acc 68.359 (66.887)	Top-5 acc 85.156 (85.856)	lr 0.00144
Train [102][1600/3239]	Time 0.231 (0.542)	Data Time 0.001 (0.025)	Loss 2.5114 (2.3758)	Entropy 0.54057 (0.54030)	Top-1 acc 62.500 (66.881)	Top-5 acc 85.156 (85.855)	lr 0.00144
Train [102][1610/3239]	Time 0.230 (0.542)	Data Time 0.001 (0.025)	Loss 2.3901 (2.3761)	Entropy 0.54069 (0.54030)	Top-1 acc 68.750 (66.878)	Top-5 acc 83.594 (85.847)	lr 0.00144
Train [102][1620/3239]	Time 0.229 (0.541)	Data Time 0.001 (0.025)	Loss 2.5206 (2.3761)	Entropy 0.54071 (0.54031)	Top-1 acc 62.500 (66.880)	Top-5 acc 86.719 (85.847)	lr 0.00144
Train [102][1630/3239]	Time 0.246 (0.540)	Data Time 0.001 (0.025)	Loss 2.5161 (2.3761)	Entropy 0.54074 (0.54031)	Top-1 acc 63.672 (66.884)	Top-5 acc 84.375 (85.849)	lr 0.00144
Train [102][1640/3239]	Time 0.242 (0.539)	Data Time 0.001 (0.024)	Loss 2.5633 (2.3761)	Entropy 0.54072 (0.54031)	Top-1 acc 59.375 (66.879)	Top-5 acc 84.375 (85.848)	lr 0.00144
Train [102][1650/3239]	Time 0.232 (0.539)	Data Time 0.001 (0.024)	Loss 2.3202 (2.3762)	Entropy 0.54068 (0.54031)	Top-1 acc 70.312 (66.874)	Top-5 acc 85.156 (85.846)	lr 0.00144
Train [102][1660/3239]	Time 0.322 (0.538)	Data Time 0.001 (0.024)	Loss 2.4883 (2.3762)	Entropy 0.54044 (0.54032)	Top-1 acc 63.281 (66.868)	Top-5 acc 85.938 (85.845)	lr 0.00144
Train [102][1670/3239]	Time 0.231 (0.537)	Data Time 0.001 (0.024)	Loss 2.3014 (2.3759)	Entropy 0.54043 (0.54032)	Top-1 acc 68.750 (66.875)	Top-5 acc 86.719 (85.851)	lr 0.00144
Train [102][1680/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.024)	Loss 2.3233 (2.3759)	Entropy 0.54041 (0.54032)	Top-1 acc 63.672 (66.867)	Top-5 acc 87.500 (85.850)	lr 0.00143
Train [102][1690/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.024)	Loss 2.2151 (2.3757)	Entropy 0.54072 (0.54032)	Top-1 acc 68.750 (66.874)	Top-5 acc 89.844 (85.857)	lr 0.00143
Train [102][1700/3239]	Time 0.226 (0.535)	Data Time 0.001 (0.024)	Loss 2.3998 (2.3755)	Entropy 0.54043 (0.54032)	Top-1 acc 68.750 (66.882)	Top-5 acc 85.547 (85.857)	lr 0.00143
Train [102][1710/3239]	Time 0.233 (0.534)	Data Time 0.001 (0.024)	Loss 2.7011 (2.3758)	Entropy 0.54006 (0.54032)	Top-1 acc 57.031 (66.872)	Top-5 acc 78.906 (85.851)	lr 0.00143
Train [102][1720/3239]	Time 0.257 (0.534)	Data Time 0.001 (0.023)	Loss 2.4234 (2.3757)	Entropy 0.54011 (0.54032)	Top-1 acc 66.016 (66.869)	Top-5 acc 82.812 (85.852)	lr 0.00143
Train [102][1730/3239]	Time 0.327 (0.533)	Data Time 0.001 (0.023)	Loss 2.3169 (2.3754)	Entropy 0.54027 (0.54032)	Top-1 acc 72.266 (66.876)	Top-5 acc 85.547 (85.855)	lr 0.00143
Train [102][1740/3239]	Time 0.258 (0.532)	Data Time 0.001 (0.023)	Loss 2.6744 (2.3755)	Entropy 0.54025 (0.54032)	Top-1 acc 58.984 (66.873)	Top-5 acc 80.469 (85.849)	lr 0.00143
Train [102][1750/3239]	Time 0.230 (0.532)	Data Time 0.001 (0.023)	Loss 2.1708 (2.3753)	Entropy 0.54030 (0.54032)	Top-1 acc 71.484 (66.881)	Top-5 acc 88.281 (85.851)	lr 0.00143
Train [102][1760/3239]	Time 0.281 (0.532)	Data Time 0.001 (0.023)	Loss 2.0997 (2.3752)	Entropy 0.54045 (0.54032)	Top-1 acc 73.828 (66.886)	Top-5 acc 90.625 (85.851)	lr 0.00143
Train [102][1770/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.023)	Loss 2.3940 (2.3751)	Entropy 0.54040 (0.54032)	Top-1 acc 66.406 (66.888)	Top-5 acc 82.812 (85.854)	lr 0.00143
Train [102][1780/3239]	Time 0.231 (0.531)	Data Time 0.001 (0.023)	Loss 2.5240 (2.3752)	Entropy 0.54037 (0.54032)	Top-1 acc 61.328 (66.883)	Top-5 acc 82.031 (85.849)	lr 0.00143
Train [102][1790/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.023)	Loss 2.6806 (2.3754)	Entropy 0.54024 (0.54032)	Top-1 acc 62.109 (66.881)	Top-5 acc 80.469 (85.844)	lr 0.00143
Train [102][1800/3239]	Time 0.234 (0.530)	Data Time 0.001 (0.022)	Loss 2.5184 (2.3753)	Entropy 0.54039 (0.54032)	Top-1 acc 60.938 (66.881)	Top-5 acc 83.984 (85.847)	lr 0.00143
Train [102][1810/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.022)	Loss 2.2872 (2.3747)	Entropy 0.54018 (0.54032)	Top-1 acc 69.141 (66.900)	Top-5 acc 87.500 (85.858)	lr 0.00143
Train [102][1820/3239]	Time 0.317 (0.528)	Data Time 0.001 (0.022)	Loss 2.2583 (2.3748)	Entropy 0.54056 (0.54032)	Top-1 acc 69.922 (66.896)	Top-5 acc 86.719 (85.855)	lr 0.00143
Train [102][1830/3239]	Time 0.231 (0.528)	Data Time 0.001 (0.022)	Loss 2.1266 (2.3744)	Entropy 0.54053 (0.54032)	Top-1 acc 71.875 (66.906)	Top-5 acc 89.453 (85.859)	lr 0.00143
Train [102][1840/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.022)	Loss 2.4311 (2.3745)	Entropy 0.54071 (0.54032)	Top-1 acc 66.797 (66.897)	Top-5 acc 83.984 (85.855)	lr 0.00143
Train [102][1850/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.022)	Loss 2.3395 (2.3745)	Entropy 0.54057 (0.54032)	Top-1 acc 66.406 (66.896)	Top-5 acc 87.500 (85.854)	lr 0.00143
Train [102][1860/3239]	Time 0.222 (0.526)	Data Time 0.001 (0.022)	Loss 2.5370 (2.3747)	Entropy 0.54061 (0.54032)	Top-1 acc 61.719 (66.882)	Top-5 acc 83.594 (85.855)	lr 0.00143
Train [102][1870/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.022)	Loss 2.4966 (2.3745)	Entropy 0.54066 (0.54033)	Top-1 acc 64.453 (66.888)	Top-5 acc 83.594 (85.859)	lr 0.00143
Train [102][1880/3239]	Time 0.260 (0.525)	Data Time 0.001 (0.022)	Loss 2.3491 (2.3745)	Entropy 0.54033 (0.54033)	Top-1 acc 66.797 (66.883)	Top-5 acc 86.328 (85.862)	lr 0.00143
Train [102][1890/3239]	Time 0.341 (0.524)	Data Time 0.001 (0.021)	Loss 2.1479 (2.3740)	Entropy 0.54053 (0.54033)	Top-1 acc 72.656 (66.896)	Top-5 acc 89.062 (85.872)	lr 0.00142
Train [102][1900/3239]	Time 0.227 (0.524)	Data Time 0.001 (0.021)	Loss 2.2710 (2.3741)	Entropy 0.54082 (0.54033)	Top-1 acc 68.750 (66.890)	Top-5 acc 86.328 (85.872)	lr 0.00142
Train [102][1910/3239]	Time 0.229 (0.523)	Data Time 0.001 (0.021)	Loss 2.2458 (2.3739)	Entropy 0.54096 (0.54033)	Top-1 acc 71.094 (66.894)	Top-5 acc 87.109 (85.873)	lr 0.00142
Train [102][1920/3239]	Time 0.276 (0.523)	Data Time 0.002 (0.021)	Loss 2.6608 (2.3740)	Entropy 0.54079 (0.54034)	Top-1 acc 58.984 (66.897)	Top-5 acc 82.031 (85.869)	lr 0.00142
Train [102][1930/3239]	Time 0.349 (0.523)	Data Time 0.001 (0.021)	Loss 2.2658 (2.3740)	Entropy 0.54094 (0.54034)	Top-1 acc 71.094 (66.897)	Top-5 acc 85.547 (85.867)	lr 0.00142
Train [102][1940/3239]	Time 0.240 (0.523)	Data Time 0.001 (0.021)	Loss 2.2414 (2.3739)	Entropy 0.54083 (0.54034)	Top-1 acc 70.703 (66.899)	Top-5 acc 89.062 (85.870)	lr 0.00142
Train [102][1950/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.021)	Loss 2.2776 (2.3737)	Entropy 0.54073 (0.54034)	Top-1 acc 67.969 (66.905)	Top-5 acc 85.938 (85.872)	lr 0.00142
Train [102][1960/3239]	Time 0.234 (0.522)	Data Time 0.001 (0.021)	Loss 2.1686 (2.3734)	Entropy 0.54066 (0.54035)	Top-1 acc 71.875 (66.911)	Top-5 acc 90.234 (85.876)	lr 0.00142
Train [102][1970/3239]	Time 0.239 (0.521)	Data Time 0.001 (0.021)	Loss 2.2679 (2.3730)	Entropy 0.54053 (0.54035)	Top-1 acc 70.703 (66.920)	Top-5 acc 87.500 (85.879)	lr 0.00142
Train [102][1980/3239]	Time 0.258 (0.521)	Data Time 0.001 (0.021)	Loss 2.4985 (2.3732)	Entropy 0.54042 (0.54035)	Top-1 acc 67.578 (66.914)	Top-5 acc 82.812 (85.874)	lr 0.00142
Train [102][1990/3239]	Time 0.249 (0.520)	Data Time 0.001 (0.020)	Loss 2.3455 (2.3733)	Entropy 0.54063 (0.54035)	Top-1 acc 65.625 (66.906)	Top-5 acc 86.328 (85.874)	lr 0.00142
Train [102][2000/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.020)	Loss 2.1664 (2.3732)	Entropy 0.54052 (0.54035)	Top-1 acc 72.266 (66.907)	Top-5 acc 91.016 (85.879)	lr 0.00142
Train [102][2010/3239]	Time 0.245 (0.519)	Data Time 0.001 (0.020)	Loss 2.3214 (2.3731)	Entropy 0.54062 (0.54035)	Top-1 acc 68.750 (66.910)	Top-5 acc 86.328 (85.880)	lr 0.00142
Train [102][2020/3239]	Time 0.230 (0.518)	Data Time 0.001 (0.020)	Loss 2.4217 (2.3732)	Entropy 0.54056 (0.54035)	Top-1 acc 63.672 (66.905)	Top-5 acc 83.594 (85.879)	lr 0.00142
Train [102][2030/3239]	Time 0.224 (0.518)	Data Time 0.001 (0.020)	Loss 2.2652 (2.3732)	Entropy 0.54083 (0.54035)	Top-1 acc 68.359 (66.900)	Top-5 acc 86.719 (85.877)	lr 0.00142
Train [102][2040/3239]	Time 0.224 (0.517)	Data Time 0.001 (0.020)	Loss 2.6195 (2.3736)	Entropy 0.54079 (0.54036)	Top-1 acc 59.766 (66.890)	Top-5 acc 80.859 (85.867)	lr 0.00142
Train [102][2050/3239]	Time 0.320 (0.517)	Data Time 0.001 (0.020)	Loss 2.4059 (2.3737)	Entropy 0.54081 (0.54036)	Top-1 acc 67.969 (66.890)	Top-5 acc 84.766 (85.864)	lr 0.00142
Train [102][2060/3239]	Time 0.228 (0.516)	Data Time 0.001 (0.020)	Loss 2.3418 (2.3737)	Entropy 0.54043 (0.54036)	Top-1 acc 66.406 (66.896)	Top-5 acc 85.547 (85.858)	lr 0.00142
Train [102][2070/3239]	Time 0.225 (0.516)	Data Time 0.001 (0.020)	Loss 2.2319 (2.3735)	Entropy 0.54027 (0.54036)	Top-1 acc 70.312 (66.901)	Top-5 acc 89.062 (85.858)	lr 0.00142
Train [102][2080/3239]	Time 0.250 (0.515)	Data Time 0.001 (0.020)	Loss 2.3582 (2.3734)	Entropy 0.54005 (0.54036)	Top-1 acc 70.312 (66.903)	Top-5 acc 84.766 (85.859)	lr 0.00142
Train [102][2090/3239]	Time 0.234 (0.515)	Data Time 0.001 (0.020)	Loss 2.3639 (2.3737)	Entropy 0.54018 (0.54036)	Top-1 acc 67.969 (66.900)	Top-5 acc 85.156 (85.852)	lr 0.00142
Train [102][2100/3239]	Time 0.229 (0.514)	Data Time 0.001 (0.019)	Loss 2.4324 (2.3739)	Entropy 0.54017 (0.54036)	Top-1 acc 64.453 (66.896)	Top-5 acc 85.547 (85.849)	lr 0.00142
Train [102][2110/3239]	Time 0.236 (0.514)	Data Time 0.001 (0.019)	Loss 2.5303 (2.3742)	Entropy 0.54030 (0.54036)	Top-1 acc 63.672 (66.889)	Top-5 acc 84.375 (85.846)	lr 0.00141
Train [102][2120/3239]	Time 0.319 (0.513)	Data Time 0.001 (0.019)	Loss 2.6074 (2.3741)	Entropy 0.54049 (0.54036)	Top-1 acc 59.766 (66.889)	Top-5 acc 81.250 (85.844)	lr 0.00141
Train [102][2130/3239]	Time 0.229 (0.513)	Data Time 0.001 (0.019)	Loss 2.4923 (2.3742)	Entropy 0.54061 (0.54036)	Top-1 acc 62.891 (66.884)	Top-5 acc 85.938 (85.842)	lr 0.00141
Train [102][2140/3239]	Time 0.260 (0.512)	Data Time 0.001 (0.019)	Loss 2.5498 (2.3742)	Entropy 0.54096 (0.54036)	Top-1 acc 63.672 (66.888)	Top-5 acc 83.594 (85.842)	lr 0.00141
Train [102][2150/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.019)	Loss 2.4217 (2.3742)	Entropy 0.54116 (0.54036)	Top-1 acc 67.969 (66.882)	Top-5 acc 85.938 (85.843)	lr 0.00141
Train [102][2160/3239]	Time 0.234 (0.511)	Data Time 0.001 (0.019)	Loss 2.2367 (2.3742)	Entropy 0.54095 (0.54037)	Top-1 acc 70.312 (66.884)	Top-5 acc 87.891 (85.843)	lr 0.00141
Train [102][2170/3239]	Time 0.238 (0.511)	Data Time 0.001 (0.019)	Loss 2.3524 (2.3741)	Entropy 0.54088 (0.54037)	Top-1 acc 69.141 (66.888)	Top-5 acc 87.109 (85.846)	lr 0.00141
Train [102][2180/3239]	Time 0.280 (0.511)	Data Time 0.002 (0.019)	Loss 2.1601 (2.3739)	Entropy 0.54086 (0.54037)	Top-1 acc 70.312 (66.892)	Top-5 acc 89.062 (85.847)	lr 0.00141
Train [102][2190/3239]	Time 0.220 (0.511)	Data Time 0.001 (0.019)	Loss 2.6713 (2.3742)	Entropy 0.54109 (0.54037)	Top-1 acc 60.156 (66.884)	Top-5 acc 79.688 (85.843)	lr 0.00141
Train [102][2200/3239]	Time 0.302 (0.534)	Data Time 0.002 (0.019)	Loss 2.5194 (2.3741)	Entropy 0.54085 (0.54038)	Top-1 acc 63.281 (66.889)	Top-5 acc 83.203 (85.843)	lr 0.00141
Train [102][2210/3239]	Time 0.335 (0.534)	Data Time 0.002 (0.019)	Loss 2.2002 (2.3744)	Entropy 0.54091 (0.54038)	Top-1 acc 71.875 (66.883)	Top-5 acc 88.672 (85.840)	lr 0.00141
Train [102][2220/3239]	Time 0.239 (0.533)	Data Time 0.001 (0.019)	Loss 2.2724 (2.3742)	Entropy 0.54083 (0.54038)	Top-1 acc 71.875 (66.888)	Top-5 acc 89.453 (85.842)	lr 0.00141
Train [102][2230/3239]	Time 0.235 (0.533)	Data Time 0.001 (0.018)	Loss 2.2167 (2.3745)	Entropy 0.54098 (0.54038)	Top-1 acc 73.438 (66.889)	Top-5 acc 88.281 (85.836)	lr 0.00141
Train [102][2240/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.018)	Loss 2.1808 (2.3744)	Entropy 0.54111 (0.54039)	Top-1 acc 72.266 (66.889)	Top-5 acc 87.500 (85.839)	lr 0.00141
Train [102][2250/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.018)	Loss 2.4694 (2.3745)	Entropy 0.54094 (0.54039)	Top-1 acc 63.672 (66.889)	Top-5 acc 83.203 (85.837)	lr 0.00141
Train [102][2260/3239]	Time 0.228 (0.531)	Data Time 0.001 (0.018)	Loss 2.4195 (2.3744)	Entropy 0.54111 (0.54039)	Top-1 acc 64.453 (66.894)	Top-5 acc 87.109 (85.839)	lr 0.00141
Train [102][2270/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.018)	Loss 2.3856 (2.3744)	Entropy 0.54115 (0.54039)	Top-1 acc 68.750 (66.898)	Top-5 acc 83.594 (85.837)	lr 0.00141
Train [102][2280/3239]	Time 0.331 (0.530)	Data Time 0.001 (0.018)	Loss 2.3620 (2.3749)	Entropy 0.54121 (0.54040)	Top-1 acc 68.359 (66.891)	Top-5 acc 84.375 (85.827)	lr 0.00141
Train [102][2290/3239]	Time 0.229 (0.530)	Data Time 0.001 (0.018)	Loss 2.2735 (2.3753)	Entropy 0.54125 (0.54040)	Top-1 acc 70.703 (66.884)	Top-5 acc 89.062 (85.822)	lr 0.00141
Train [102][2300/3239]	Time 0.228 (0.529)	Data Time 0.001 (0.018)	Loss 2.3932 (2.3753)	Entropy 0.54080 (0.54040)	Top-1 acc 65.234 (66.885)	Top-5 acc 86.328 (85.820)	lr 0.00141
Train [102][2310/3239]	Time 0.234 (0.529)	Data Time 0.001 (0.018)	Loss 2.3712 (2.3753)	Entropy 0.54069 (0.54041)	Top-1 acc 67.188 (66.882)	Top-5 acc 82.812 (85.818)	lr 0.00141
Train [102][2320/3239]	Time 0.234 (0.528)	Data Time 0.001 (0.018)	Loss 2.4537 (2.3753)	Entropy 0.54053 (0.54041)	Top-1 acc 66.016 (66.880)	Top-5 acc 85.938 (85.823)	lr 0.00140
Train [102][2330/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.018)	Loss 2.5328 (2.3752)	Entropy 0.54051 (0.54041)	Top-1 acc 66.406 (66.884)	Top-5 acc 81.250 (85.823)	lr 0.00140
Train [102][2340/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.018)	Loss 2.3145 (2.3750)	Entropy 0.54033 (0.54041)	Top-1 acc 68.359 (66.886)	Top-5 acc 86.719 (85.827)	lr 0.00140
Train [102][2350/3239]	Time 0.228 (0.527)	Data Time 0.001 (0.018)	Loss 2.2109 (2.3750)	Entropy 0.54038 (0.54041)	Top-1 acc 70.703 (66.888)	Top-5 acc 86.328 (85.823)	lr 0.00140
Train [102][2360/3239]	Time 0.282 (0.527)	Data Time 0.001 (0.018)	Loss 2.2244 (2.3750)	Entropy 0.54041 (0.54041)	Top-1 acc 70.312 (66.886)	Top-5 acc 86.328 (85.821)	lr 0.00140
Train [102][2370/3239]	Time 0.326 (0.527)	Data Time 0.001 (0.017)	Loss 2.2313 (2.3749)	Entropy 0.54030 (0.54041)	Top-1 acc 67.188 (66.884)	Top-5 acc 88.281 (85.824)	lr 0.00140
Train [102][2380/3239]	Time 0.219 (0.526)	Data Time 0.001 (0.017)	Loss 2.5862 (2.3752)	Entropy 0.54013 (0.54041)	Top-1 acc 64.062 (66.875)	Top-5 acc 82.031 (85.819)	lr 0.00140
Train [102][2390/3239]	Time 0.236 (0.526)	Data Time 0.001 (0.017)	Loss 2.3639 (2.3753)	Entropy 0.54002 (0.54041)	Top-1 acc 66.016 (66.870)	Top-5 acc 83.984 (85.819)	lr 0.00140
Train [102][2400/3239]	Time 0.227 (0.525)	Data Time 0.001 (0.017)	Loss 2.3231 (2.3753)	Entropy 0.53991 (0.54040)	Top-1 acc 70.703 (66.873)	Top-5 acc 86.328 (85.818)	lr 0.00140
Train [102][2410/3239]	Time 0.223 (0.525)	Data Time 0.001 (0.017)	Loss 2.4786 (2.3755)	Entropy 0.53986 (0.54040)	Top-1 acc 65.234 (66.862)	Top-5 acc 83.984 (85.813)	lr 0.00140
Train [102][2420/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.017)	Loss 2.4423 (2.3756)	Entropy 0.53989 (0.54040)	Top-1 acc 67.578 (66.862)	Top-5 acc 82.812 (85.811)	lr 0.00140
Train [102][2430/3239]	Time 0.268 (0.524)	Data Time 0.001 (0.017)	Loss 2.3384 (2.3755)	Entropy 0.53994 (0.54040)	Top-1 acc 64.844 (66.863)	Top-5 acc 86.719 (85.814)	lr 0.00140
Train [102][2440/3239]	Time 0.321 (0.524)	Data Time 0.001 (0.017)	Loss 2.4015 (2.3754)	Entropy 0.54005 (0.54040)	Top-1 acc 64.844 (66.867)	Top-5 acc 85.156 (85.817)	lr 0.00140
Train [102][2450/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.017)	Loss 2.3829 (2.3753)	Entropy 0.54007 (0.54039)	Top-1 acc 60.156 (66.866)	Top-5 acc 85.156 (85.820)	lr 0.00140
Train [102][2460/3239]	Time 0.226 (0.523)	Data Time 0.001 (0.017)	Loss 2.4205 (2.3754)	Entropy 0.54043 (0.54039)	Top-1 acc 67.188 (66.868)	Top-5 acc 81.250 (85.816)	lr 0.00140
Train [102][2470/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.017)	Loss 2.5321 (2.3752)	Entropy 0.54027 (0.54039)	Top-1 acc 62.500 (66.870)	Top-5 acc 83.594 (85.818)	lr 0.00140
Train [102][2480/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.017)	Loss 2.3284 (2.3751)	Entropy 0.54011 (0.54039)	Top-1 acc 69.531 (66.874)	Top-5 acc 87.109 (85.820)	lr 0.00140
Train [102][2490/3239]	Time 0.223 (0.522)	Data Time 0.001 (0.017)	Loss 2.4275 (2.3751)	Entropy 0.54023 (0.54039)	Top-1 acc 64.844 (66.871)	Top-5 acc 84.375 (85.820)	lr 0.00140
Train [102][2500/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.017)	Loss 2.1738 (2.3749)	Entropy 0.54018 (0.54039)	Top-1 acc 71.484 (66.877)	Top-5 acc 87.891 (85.823)	lr 0.00140
Train [102][2510/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.017)	Loss 2.4700 (2.3751)	Entropy 0.54057 (0.54039)	Top-1 acc 66.016 (66.872)	Top-5 acc 85.156 (85.820)	lr 0.00140
Train [102][2520/3239]	Time 0.228 (0.520)	Data Time 0.001 (0.016)	Loss 2.4046 (2.3750)	Entropy 0.54036 (0.54039)	Top-1 acc 66.016 (66.875)	Top-5 acc 87.109 (85.823)	lr 0.00140
Train [102][2530/3239]	Time 0.327 (0.520)	Data Time 0.001 (0.016)	Loss 2.3428 (2.3751)	Entropy 0.54026 (0.54039)	Top-1 acc 69.922 (66.878)	Top-5 acc 83.984 (85.820)	lr 0.00140
Train [102][2540/3239]	Time 0.233 (0.519)	Data Time 0.001 (0.016)	Loss 2.2389 (2.3748)	Entropy 0.54046 (0.54039)	Top-1 acc 69.531 (66.887)	Top-5 acc 86.719 (85.823)	lr 0.00139
Train [102][2550/3239]	Time 0.231 (0.519)	Data Time 0.001 (0.016)	Loss 2.3820 (2.3745)	Entropy 0.54062 (0.54039)	Top-1 acc 67.188 (66.896)	Top-5 acc 86.719 (85.832)	lr 0.00139
Train [102][2560/3239]	Time 0.225 (0.518)	Data Time 0.001 (0.016)	Loss 2.3803 (2.3745)	Entropy 0.54025 (0.54039)	Top-1 acc 67.969 (66.897)	Top-5 acc 86.719 (85.831)	lr 0.00139
Train [102][2570/3239]	Time 0.235 (0.518)	Data Time 0.001 (0.016)	Loss 2.4148 (2.3745)	Entropy 0.54011 (0.54039)	Top-1 acc 66.406 (66.898)	Top-5 acc 86.328 (85.833)	lr 0.00139
Train [102][2580/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.016)	Loss 2.3260 (2.3744)	Entropy 0.54006 (0.54039)	Top-1 acc 70.703 (66.904)	Top-5 acc 84.766 (85.834)	lr 0.00139
Train [102][2590/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.016)	Loss 2.1986 (2.3741)	Entropy 0.53985 (0.54039)	Top-1 acc 71.484 (66.909)	Top-5 acc 86.719 (85.838)	lr 0.00139
Train [102][2600/3239]	Time 0.333 (0.517)	Data Time 0.001 (0.016)	Loss 2.3646 (2.3740)	Entropy 0.53991 (0.54039)	Top-1 acc 65.625 (66.914)	Top-5 acc 86.328 (85.839)	lr 0.00139
Train [102][2610/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.016)	Loss 2.2549 (2.3739)	Entropy 0.53967 (0.54038)	Top-1 acc 68.359 (66.911)	Top-5 acc 89.062 (85.841)	lr 0.00139
Train [102][2620/3239]	Time 0.232 (0.516)	Data Time 0.001 (0.016)	Loss 2.4589 (2.3740)	Entropy 0.53980 (0.54038)	Top-1 acc 66.797 (66.911)	Top-5 acc 82.812 (85.841)	lr 0.00139
Train [102][2630/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.016)	Loss 2.3660 (2.3739)	Entropy 0.53998 (0.54038)	Top-1 acc 67.578 (66.914)	Top-5 acc 85.938 (85.844)	lr 0.00139
Train [102][2640/3239]	Time 0.250 (0.515)	Data Time 0.001 (0.016)	Loss 2.4679 (2.3738)	Entropy 0.53945 (0.54038)	Top-1 acc 66.797 (66.919)	Top-5 acc 83.203 (85.846)	lr 0.00139
Train [102][2650/3239]	Time 0.230 (0.515)	Data Time 0.001 (0.016)	Loss 2.4231 (2.3737)	Entropy 0.53944 (0.54037)	Top-1 acc 66.016 (66.920)	Top-5 acc 85.547 (85.847)	lr 0.00139
Train [102][2660/3239]	Time 0.234 (0.514)	Data Time 0.001 (0.016)	Loss 2.3552 (2.3738)	Entropy 0.53931 (0.54037)	Top-1 acc 65.625 (66.917)	Top-5 acc 86.719 (85.846)	lr 0.00139
Train [102][2670/3239]	Time 0.217 (0.514)	Data Time 0.001 (0.016)	Loss 2.4649 (2.3736)	Entropy 0.53939 (0.54037)	Top-1 acc 60.156 (66.915)	Top-5 acc 85.938 (85.851)	lr 0.00139
Train [102][2680/3239]	Time 0.279 (0.514)	Data Time 0.002 (0.016)	Loss 2.2474 (2.3734)	Entropy 0.53915 (0.54036)	Top-1 acc 70.703 (66.918)	Top-5 acc 89.844 (85.857)	lr 0.00139
Train [102][2690/3239]	Time 0.226 (0.514)	Data Time 0.001 (0.016)	Loss 2.2580 (2.3735)	Entropy 0.53924 (0.54036)	Top-1 acc 69.531 (66.917)	Top-5 acc 89.453 (85.856)	lr 0.00139
Train [102][2700/3239]	Time 0.234 (0.513)	Data Time 0.001 (0.016)	Loss 2.3698 (2.3737)	Entropy 0.53916 (0.54035)	Top-1 acc 66.406 (66.913)	Top-5 acc 86.328 (85.854)	lr 0.00139
Train [102][2710/3239]	Time 0.225 (0.513)	Data Time 0.001 (0.015)	Loss 2.4863 (2.3734)	Entropy 0.53923 (0.54035)	Top-1 acc 60.547 (66.922)	Top-5 acc 84.375 (85.859)	lr 0.00139
Train [102][2720/3239]	Time 0.236 (0.513)	Data Time 0.001 (0.015)	Loss 2.3369 (2.3732)	Entropy 0.53940 (0.54035)	Top-1 acc 65.625 (66.922)	Top-5 acc 85.547 (85.860)	lr 0.00139
Train [102][2730/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.015)	Loss 2.1927 (2.3730)	Entropy 0.53936 (0.54034)	Top-1 acc 75.391 (66.928)	Top-5 acc 91.016 (85.865)	lr 0.00139
Train [102][2740/3239]	Time 0.226 (0.512)	Data Time 0.001 (0.015)	Loss 2.4116 (2.3731)	Entropy 0.53966 (0.54034)	Top-1 acc 65.234 (66.926)	Top-5 acc 86.328 (85.864)	lr 0.00139
Train [102][2750/3239]	Time 0.230 (0.511)	Data Time 0.001 (0.015)	Loss 2.3166 (2.3731)	Entropy 0.53961 (0.54034)	Top-1 acc 71.094 (66.928)	Top-5 acc 85.938 (85.864)	lr 0.00138
Train [102][2760/3239]	Time 0.332 (0.511)	Data Time 0.001 (0.015)	Loss 2.2988 (2.3728)	Entropy 0.53963 (0.54033)	Top-1 acc 69.922 (66.935)	Top-5 acc 86.328 (85.870)	lr 0.00138
Train [102][2770/3239]	Time 0.235 (0.511)	Data Time 0.001 (0.015)	Loss 2.2064 (2.3727)	Entropy 0.53967 (0.54033)	Top-1 acc 70.703 (66.938)	Top-5 acc 88.281 (85.874)	lr 0.00138
Train [102][2780/3239]	Time 0.235 (0.510)	Data Time 0.001 (0.015)	Loss 2.1438 (2.3724)	Entropy 0.53961 (0.54033)	Top-1 acc 75.781 (66.946)	Top-5 acc 89.453 (85.880)	lr 0.00138
Train [102][2790/3239]	Time 0.226 (0.510)	Data Time 0.001 (0.015)	Loss 2.4789 (2.3726)	Entropy 0.53974 (0.54033)	Top-1 acc 71.094 (66.943)	Top-5 acc 84.375 (85.876)	lr 0.00138
Train [102][2800/3239]	Time 0.226 (0.510)	Data Time 0.001 (0.015)	Loss 2.5782 (2.3724)	Entropy 0.53998 (0.54032)	Top-1 acc 61.719 (66.949)	Top-5 acc 81.250 (85.878)	lr 0.00138
Train [102][2810/3239]	Time 0.225 (0.509)	Data Time 0.001 (0.015)	Loss 2.4736 (2.3724)	Entropy 0.54015 (0.54032)	Top-1 acc 63.281 (66.947)	Top-5 acc 83.984 (85.878)	lr 0.00138
Train [102][2820/3239]	Time 0.226 (0.509)	Data Time 0.001 (0.015)	Loss 2.4428 (2.3723)	Entropy 0.54010 (0.54032)	Top-1 acc 64.844 (66.947)	Top-5 acc 85.156 (85.880)	lr 0.00138
Train [102][2830/3239]	Time 0.329 (0.509)	Data Time 0.001 (0.015)	Loss 2.3827 (2.3723)	Entropy 0.54014 (0.54032)	Top-1 acc 63.281 (66.947)	Top-5 acc 87.891 (85.880)	lr 0.00138
Train [102][2840/3239]	Time 0.217 (0.508)	Data Time 0.001 (0.015)	Loss 2.4925 (2.3724)	Entropy 0.53977 (0.54032)	Top-1 acc 61.719 (66.940)	Top-5 acc 84.375 (85.878)	lr 0.00138
Train [102][2850/3239]	Time 0.358 (0.527)	Data Time 0.005 (0.015)	Loss 2.4018 (2.3724)	Entropy 0.53978 (0.54032)	Top-1 acc 63.672 (66.938)	Top-5 acc 85.938 (85.880)	lr 0.00138
Train [102][2860/3239]	Time 0.251 (0.526)	Data Time 0.002 (0.015)	Loss 2.3468 (2.3725)	Entropy 0.53931 (0.54032)	Top-1 acc 68.750 (66.935)	Top-5 acc 85.938 (85.877)	lr 0.00138
Train [102][2870/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.015)	Loss 2.4045 (2.3725)	Entropy 0.53882 (0.54031)	Top-1 acc 66.016 (66.935)	Top-5 acc 86.328 (85.878)	lr 0.00138
Train [102][2880/3239]	Time 0.267 (0.526)	Data Time 0.002 (0.015)	Loss 2.1414 (2.3724)	Entropy 0.53883 (0.54031)	Top-1 acc 72.266 (66.936)	Top-5 acc 89.453 (85.881)	lr 0.00138
Train [102][2890/3239]	Time 0.301 (0.526)	Data Time 0.002 (0.015)	Loss 2.8214 (2.3726)	Entropy 0.53880 (0.54030)	Top-1 acc 54.688 (66.931)	Top-5 acc 80.469 (85.880)	lr 0.00138
Train [102][2900/3239]	Time 0.234 (0.526)	Data Time 0.001 (0.015)	Loss 2.3598 (2.3726)	Entropy 0.53887 (0.54030)	Top-1 acc 67.578 (66.930)	Top-5 acc 84.375 (85.880)	lr 0.00138
Train [102][2910/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.015)	Loss 2.3934 (2.3728)	Entropy 0.53890 (0.54029)	Top-1 acc 68.750 (66.926)	Top-5 acc 85.156 (85.878)	lr 0.00138
Train [102][2920/3239]	Time 0.342 (0.525)	Data Time 0.001 (0.014)	Loss 2.3533 (2.3730)	Entropy 0.53888 (0.54029)	Top-1 acc 66.797 (66.920)	Top-5 acc 86.719 (85.876)	lr 0.00138
Train [102][2930/3239]	Time 0.226 (0.525)	Data Time 0.001 (0.014)	Loss 2.2806 (2.3730)	Entropy 0.53903 (0.54028)	Top-1 acc 69.141 (66.919)	Top-5 acc 84.766 (85.877)	lr 0.00138
Train [102][2940/3239]	Time 0.235 (0.524)	Data Time 0.001 (0.014)	Loss 2.2942 (2.3733)	Entropy 0.53899 (0.54028)	Top-1 acc 69.922 (66.914)	Top-5 acc 85.156 (85.872)	lr 0.00138
Train [102][2950/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.014)	Loss 2.3773 (2.3731)	Entropy 0.53906 (0.54027)	Top-1 acc 69.531 (66.919)	Top-5 acc 83.594 (85.877)	lr 0.00138
Train [102][2960/3239]	Time 0.231 (0.523)	Data Time 0.001 (0.014)	Loss 2.4885 (2.3731)	Entropy 0.53899 (0.54027)	Top-1 acc 67.188 (66.919)	Top-5 acc 82.812 (85.878)	lr 0.00138
Train [102][2970/3239]	Time 0.229 (0.523)	Data Time 0.001 (0.014)	Loss 2.3828 (2.3730)	Entropy 0.53908 (0.54027)	Top-1 acc 67.188 (66.918)	Top-5 acc 85.156 (85.878)	lr 0.00137
Train [102][2980/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.014)	Loss 2.1897 (2.3729)	Entropy 0.53948 (0.54026)	Top-1 acc 71.484 (66.920)	Top-5 acc 87.891 (85.877)	lr 0.00137
Train [102][2990/3239]	Time 0.326 (0.522)	Data Time 0.001 (0.014)	Loss 2.4900 (2.3729)	Entropy 0.53945 (0.54026)	Top-1 acc 65.234 (66.921)	Top-5 acc 85.547 (85.876)	lr 0.00137
Train [102][3000/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.014)	Loss 2.5809 (2.3730)	Entropy 0.53964 (0.54026)	Top-1 acc 63.672 (66.917)	Top-5 acc 82.031 (85.872)	lr 0.00137
Train [102][3010/3239]	Time 0.223 (0.522)	Data Time 0.001 (0.014)	Loss 2.2713 (2.3730)	Entropy 0.53974 (0.54025)	Top-1 acc 67.969 (66.917)	Top-5 acc 86.719 (85.874)	lr 0.00137
Train [102][3020/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.014)	Loss 2.5541 (2.3731)	Entropy 0.53971 (0.54025)	Top-1 acc 64.062 (66.914)	Top-5 acc 83.203 (85.874)	lr 0.00137
Train [102][3030/3239]	Time 0.240 (0.521)	Data Time 0.001 (0.014)	Loss 2.4000 (2.3730)	Entropy 0.53969 (0.54025)	Top-1 acc 68.359 (66.918)	Top-5 acc 83.984 (85.876)	lr 0.00137
Train [102][3040/3239]	Time 0.235 (0.521)	Data Time 0.001 (0.014)	Loss 2.3253 (2.3733)	Entropy 0.53984 (0.54025)	Top-1 acc 67.969 (66.912)	Top-5 acc 86.719 (85.873)	lr 0.00137
Train [102][3050/3239]	Time 0.240 (0.520)	Data Time 0.001 (0.014)	Loss 2.3877 (2.3733)	Entropy 0.53976 (0.54025)	Top-1 acc 64.062 (66.911)	Top-5 acc 85.156 (85.872)	lr 0.00137
Train [102][3060/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.014)	Loss 2.5699 (2.3735)	Entropy 0.53984 (0.54025)	Top-1 acc 64.844 (66.906)	Top-5 acc 83.203 (85.869)	lr 0.00137
Train [102][3070/3239]	Time 0.237 (0.520)	Data Time 0.001 (0.014)	Loss 2.2762 (2.3734)	Entropy 0.53954 (0.54025)	Top-1 acc 70.703 (66.907)	Top-5 acc 87.109 (85.870)	lr 0.00137
Train [102][3080/3239]	Time 0.247 (0.519)	Data Time 0.001 (0.014)	Loss 2.6569 (2.3734)	Entropy 0.53971 (0.54024)	Top-1 acc 61.719 (66.907)	Top-5 acc 80.078 (85.873)	lr 0.00137
Train [102][3090/3239]	Time 0.223 (0.519)	Data Time 0.001 (0.014)	Loss 2.2974 (2.3735)	Entropy 0.53969 (0.54024)	Top-1 acc 69.531 (66.906)	Top-5 acc 87.500 (85.872)	lr 0.00137
Train [102][3100/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.014)	Loss 2.4254 (2.3733)	Entropy 0.53972 (0.54024)	Top-1 acc 63.672 (66.907)	Top-5 acc 86.328 (85.875)	lr 0.00137
Train [102][3110/3239]	Time 0.224 (0.518)	Data Time 0.001 (0.014)	Loss 2.5906 (2.3734)	Entropy 0.53974 (0.54024)	Top-1 acc 61.328 (66.907)	Top-5 acc 83.594 (85.875)	lr 0.00137
Train [102][3120/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.014)	Loss 2.3054 (2.3734)	Entropy 0.53984 (0.54024)	Top-1 acc 66.797 (66.905)	Top-5 acc 87.891 (85.875)	lr 0.00137
Train [102][3130/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.014)	Loss 2.2532 (2.3733)	Entropy 0.53971 (0.54023)	Top-1 acc 70.703 (66.907)	Top-5 acc 84.766 (85.875)	lr 0.00137
Train [102][3140/3239]	Time 0.225 (0.517)	Data Time 0.001 (0.014)	Loss 2.5925 (2.3733)	Entropy 0.53979 (0.54023)	Top-1 acc 61.328 (66.907)	Top-5 acc 84.375 (85.875)	lr 0.00137
Train [102][3150/3239]	Time 0.328 (0.517)	Data Time 0.001 (0.014)	Loss 2.2689 (2.3734)	Entropy 0.53967 (0.54023)	Top-1 acc 70.312 (66.906)	Top-5 acc 89.844 (85.873)	lr 0.00137
Train [102][3160/3239]	Time 0.235 (0.517)	Data Time 0.001 (0.013)	Loss 2.4150 (2.3735)	Entropy 0.53986 (0.54023)	Top-1 acc 66.406 (66.905)	Top-5 acc 84.766 (85.872)	lr 0.00137
Train [102][3170/3239]	Time 0.247 (0.516)	Data Time 0.001 (0.013)	Loss 2.3275 (2.3735)	Entropy 0.54006 (0.54023)	Top-1 acc 69.922 (66.908)	Top-5 acc 86.328 (85.872)	lr 0.00137
Train [102][3180/3239]	Time 0.237 (0.516)	Data Time 0.000 (0.013)	Loss 2.4246 (2.3734)	Entropy 0.54000 (0.54023)	Top-1 acc 68.359 (66.912)	Top-5 acc 84.766 (85.873)	lr 0.00137
Train [102][3190/3239]	Time 0.234 (0.516)	Data Time 0.000 (0.013)	Loss 2.3792 (2.3735)	Entropy 0.54030 (0.54023)	Top-1 acc 66.016 (66.904)	Top-5 acc 85.938 (85.872)	lr 0.00136
Train [102][3200/3239]	Time 0.266 (0.516)	Data Time 0.000 (0.013)	Loss 2.3612 (2.3735)	Entropy 0.54034 (0.54023)	Top-1 acc 68.359 (66.905)	Top-5 acc 85.156 (85.871)	lr 0.00136
Train [102][3210/3239]	Time 0.248 (0.515)	Data Time 0.000 (0.013)	Loss 2.4295 (2.3736)	Entropy 0.54037 (0.54023)	Top-1 acc 66.797 (66.902)	Top-5 acc 82.812 (85.869)	lr 0.00136
Train [102][3220/3239]	Time 0.322 (0.515)	Data Time 0.000 (0.013)	Loss 2.2558 (2.3737)	Entropy 0.54053 (0.54023)	Top-1 acc 72.266 (66.899)	Top-5 acc 87.109 (85.868)	lr 0.00136
Train [102][3230/3239]	Time 0.226 (0.514)	Data Time 0.000 (0.013)	Loss 2.3918 (2.3737)	Entropy 0.54053 (0.54023)	Top-1 acc 66.406 (66.903)	Top-5 acc 86.328 (85.869)	lr 0.00136
Train [102][3239/3239]	Time 0.847 (0.514)	Data Time 0.000 (0.013)	Loss 2.6042 (2.3738)	Entropy 0.54043 (0.54023)	Top-1 acc 60.494 (66.901)	Top-5 acc 83.951 (85.869)	lr 0.00136
==========Valid [102/120]	loss 1.189	top-1 acc 72.786 (72.786)	top-5 acc 90.445	Train top-1 66.901	top-5 85.869	Entropy 0.54043	Latency-None: 0.000ms	Flops: 539.00M
Train [103][0/3239]	Time 39.349 (39.349)	Data Time 38.202 (38.202)	Loss 2.3453 (2.3453)	Entropy 0.54051 (0.54051)	Top-1 acc 67.578 (67.578)	Top-5 acc 87.109 (87.109)	lr 0.00136
Train [103][10/3239]	Time 0.228 (4.014)	Data Time 0.001 (3.475)	Loss 2.3378 (2.3256)	Entropy 0.54037 (0.54055)	Top-1 acc 68.750 (69.212)	Top-5 acc 85.156 (86.222)	lr 0.00136
Train [103][20/3239]	Time 0.231 (2.295)	Data Time 0.001 (1.821)	Loss 2.4712 (2.3894)	Entropy 0.54048 (0.54049)	Top-1 acc 65.234 (67.448)	Top-5 acc 85.938 (85.584)	lr 0.00136
Train [103][30/3239]	Time 0.221 (1.680)	Data Time 0.001 (1.234)	Loss 2.3958 (2.4014)	Entropy 0.54033 (0.54046)	Top-1 acc 67.969 (66.746)	Top-5 acc 83.984 (85.446)	lr 0.00136
Train [103][40/3239]	Time 0.231 (1.368)	Data Time 0.002 (0.933)	Loss 2.4034 (2.3895)	Entropy 0.53967 (0.54035)	Top-1 acc 68.359 (66.978)	Top-5 acc 84.766 (85.490)	lr 0.00136
Train [103][50/3239]	Time 0.319 (1.180)	Data Time 0.001 (0.751)	Loss 2.1466 (2.3755)	Entropy 0.53963 (0.54020)	Top-1 acc 73.438 (67.080)	Top-5 acc 89.844 (85.807)	lr 0.00136
Train [103][60/3239]	Time 0.234 (1.052)	Data Time 0.001 (0.628)	Loss 2.1835 (2.3628)	Entropy 0.53960 (0.54011)	Top-1 acc 72.656 (67.412)	Top-5 acc 87.891 (86.034)	lr 0.00136
Train [103][70/3239]	Time 0.235 (0.958)	Data Time 0.001 (0.540)	Loss 2.2874 (2.3567)	Entropy 0.53953 (0.54004)	Top-1 acc 67.578 (67.617)	Top-5 acc 85.938 (86.042)	lr 0.00136
Train [103][80/3239]	Time 0.275 (0.907)	Data Time 0.001 (0.473)	Loss 2.4854 (2.3525)	Entropy 0.53993 (0.54000)	Top-1 acc 64.844 (67.631)	Top-5 acc 81.641 (86.212)	lr 0.00136
Train [103][90/3239]	Time 0.223 (0.859)	Data Time 0.001 (0.421)	Loss 2.2464 (2.3653)	Entropy 0.54009 (0.53999)	Top-1 acc 71.875 (67.153)	Top-5 acc 87.891 (86.041)	lr 0.00136
Train [103][100/3239]	Time 0.233 (0.814)	Data Time 0.001 (0.380)	Loss 2.3437 (2.3662)	Entropy 0.54023 (0.54000)	Top-1 acc 64.844 (67.021)	Top-5 acc 86.719 (86.046)	lr 0.00136
Train [103][110/3239]	Time 0.235 (0.777)	Data Time 0.001 (0.346)	Loss 2.5035 (2.3634)	Entropy 0.54013 (0.54002)	Top-1 acc 61.719 (67.163)	Top-5 acc 83.594 (86.120)	lr 0.00136
Train [103][120/3239]	Time 0.226 (0.746)	Data Time 0.001 (0.317)	Loss 2.3329 (2.3679)	Entropy 0.53999 (0.54003)	Top-1 acc 67.578 (67.107)	Top-5 acc 88.281 (86.025)	lr 0.00136
Train [103][130/3239]	Time 0.218 (0.720)	Data Time 0.001 (0.293)	Loss 2.5452 (2.3690)	Entropy 0.54018 (0.54003)	Top-1 acc 66.797 (67.152)	Top-5 acc 85.156 (85.994)	lr 0.00136
Train [103][140/3239]	Time 0.244 (0.698)	Data Time 0.001 (0.273)	Loss 2.7096 (2.3753)	Entropy 0.54034 (0.54004)	Top-1 acc 58.203 (66.955)	Top-5 acc 78.516 (85.838)	lr 0.00136
Train [103][150/3239]	Time 0.238 (0.678)	Data Time 0.001 (0.255)	Loss 2.3692 (2.3733)	Entropy 0.54011 (0.54005)	Top-1 acc 68.359 (67.032)	Top-5 acc 86.719 (85.881)	lr 0.00136
Train [103][160/3239]	Time 0.230 (0.661)	Data Time 0.001 (0.239)	Loss 2.4617 (2.3692)	Entropy 0.54023 (0.54006)	Top-1 acc 60.547 (67.112)	Top-5 acc 85.156 (85.938)	lr 0.00136
Train [103][170/3239]	Time 0.233 (0.648)	Data Time 0.001 (0.225)	Loss 2.3877 (2.3678)	Entropy 0.54037 (0.54007)	Top-1 acc 67.578 (67.126)	Top-5 acc 82.812 (85.969)	lr 0.00135
Train [103][180/3239]	Time 0.234 (0.634)	Data Time 0.001 (0.213)	Loss 2.3287 (2.3670)	Entropy 0.54012 (0.54008)	Top-1 acc 68.359 (67.149)	Top-5 acc 85.938 (85.970)	lr 0.00135
Train [103][190/3239]	Time 0.255 (0.623)	Data Time 0.001 (0.202)	Loss 2.3605 (2.3661)	Entropy 0.54009 (0.54009)	Top-1 acc 65.625 (67.112)	Top-5 acc 84.375 (85.964)	lr 0.00135
Train [103][200/3239]	Time 0.228 (0.612)	Data Time 0.001 (0.192)	Loss 2.3709 (2.3634)	Entropy 0.54036 (0.54009)	Top-1 acc 66.797 (67.184)	Top-5 acc 85.547 (86.000)	lr 0.00135
Train [103][210/3239]	Time 0.328 (0.602)	Data Time 0.001 (0.183)	Loss 2.2150 (2.3632)	Entropy 0.54043 (0.54010)	Top-1 acc 73.047 (67.176)	Top-5 acc 89.844 (86.030)	lr 0.00135
Train [103][220/3239]	Time 0.277 (0.594)	Data Time 0.001 (0.174)	Loss 2.2584 (2.3629)	Entropy 0.54047 (0.54012)	Top-1 acc 69.922 (67.168)	Top-5 acc 87.109 (86.042)	lr 0.00135
Train [103][230/3239]	Time 0.225 (0.586)	Data Time 0.001 (0.167)	Loss 2.1432 (2.3596)	Entropy 0.54052 (0.54013)	Top-1 acc 73.438 (67.301)	Top-5 acc 91.797 (86.105)	lr 0.00135
Train [103][240/3239]	Time 0.217 (0.579)	Data Time 0.001 (0.160)	Loss 2.3532 (2.3580)	Entropy 0.54016 (0.54014)	Top-1 acc 65.625 (67.327)	Top-5 acc 86.719 (86.114)	lr 0.00135
Train [103][250/3239]	Time 0.219 (0.571)	Data Time 0.001 (0.154)	Loss 2.2566 (2.3570)	Entropy 0.54033 (0.54014)	Top-1 acc 68.750 (67.385)	Top-5 acc 90.625 (86.160)	lr 0.00135
Train [103][260/3239]	Time 0.229 (0.564)	Data Time 0.001 (0.148)	Loss 2.3728 (2.3565)	Entropy 0.54041 (0.54015)	Top-1 acc 66.797 (67.413)	Top-5 acc 85.156 (86.152)	lr 0.00135
Train [103][270/3239]	Time 0.573 (0.766)	Data Time 0.005 (0.143)	Loss 2.6048 (2.3581)	Entropy 0.54064 (0.54016)	Top-1 acc 58.984 (67.350)	Top-5 acc 82.422 (86.097)	lr 0.00135
Train [103][280/3239]	Time 0.226 (0.755)	Data Time 0.002 (0.138)	Loss 2.1525 (2.3584)	Entropy 0.54120 (0.54019)	Top-1 acc 68.750 (67.313)	Top-5 acc 89.844 (86.100)	lr 0.00135
Train [103][290/3239]	Time 0.235 (0.743)	Data Time 0.001 (0.133)	Loss 2.3155 (2.3566)	Entropy 0.54128 (0.54022)	Top-1 acc 68.359 (67.335)	Top-5 acc 88.281 (86.131)	lr 0.00135
Train [103][300/3239]	Time 0.247 (0.732)	Data Time 0.001 (0.129)	Loss 2.2738 (2.3572)	Entropy 0.54101 (0.54025)	Top-1 acc 74.219 (67.356)	Top-5 acc 85.938 (86.122)	lr 0.00135
Train [103][310/3239]	Time 0.237 (0.722)	Data Time 0.001 (0.125)	Loss 2.1800 (2.3556)	Entropy 0.54121 (0.54028)	Top-1 acc 73.828 (67.375)	Top-5 acc 91.016 (86.170)	lr 0.00135
Train [103][320/3239]	Time 0.233 (0.712)	Data Time 0.001 (0.121)	Loss 2.2935 (2.3550)	Entropy 0.54143 (0.54031)	Top-1 acc 69.922 (67.413)	Top-5 acc 88.672 (86.167)	lr 0.00135
Train [103][330/3239]	Time 0.227 (0.703)	Data Time 0.001 (0.117)	Loss 2.2520 (2.3548)	Entropy 0.54165 (0.54035)	Top-1 acc 70.703 (67.414)	Top-5 acc 88.281 (86.161)	lr 0.00135
Train [103][340/3239]	Time 0.228 (0.694)	Data Time 0.001 (0.114)	Loss 2.4007 (2.3566)	Entropy 0.54173 (0.54038)	Top-1 acc 65.234 (67.377)	Top-5 acc 84.766 (86.131)	lr 0.00135
Train [103][350/3239]	Time 0.261 (0.686)	Data Time 0.001 (0.111)	Loss 2.3473 (2.3558)	Entropy 0.54185 (0.54042)	Top-1 acc 68.750 (67.392)	Top-5 acc 87.500 (86.147)	lr 0.00135
Train [103][360/3239]	Time 0.224 (0.678)	Data Time 0.001 (0.108)	Loss 2.3803 (2.3558)	Entropy 0.54173 (0.54046)	Top-1 acc 68.359 (67.376)	Top-5 acc 86.328 (86.145)	lr 0.00135
Train [103][370/3239]	Time 0.326 (0.672)	Data Time 0.001 (0.105)	Loss 2.1054 (2.3559)	Entropy 0.54179 (0.54049)	Top-1 acc 71.875 (67.368)	Top-5 acc 92.188 (86.143)	lr 0.00135
Train [103][380/3239]	Time 0.226 (0.665)	Data Time 0.001 (0.102)	Loss 2.8327 (2.3576)	Entropy 0.54163 (0.54053)	Top-1 acc 56.641 (67.320)	Top-5 acc 76.562 (86.116)	lr 0.00135
Train [103][390/3239]	Time 0.232 (0.658)	Data Time 0.001 (0.099)	Loss 2.3203 (2.3577)	Entropy 0.54184 (0.54056)	Top-1 acc 65.625 (67.328)	Top-5 acc 85.156 (86.100)	lr 0.00134
Train [103][400/3239]	Time 0.222 (0.652)	Data Time 0.001 (0.097)	Loss 2.7591 (2.3592)	Entropy 0.54163 (0.54059)	Top-1 acc 58.594 (67.293)	Top-5 acc 80.078 (86.080)	lr 0.00134
Train [103][410/3239]	Time 0.230 (0.646)	Data Time 0.001 (0.095)	Loss 2.4116 (2.3583)	Entropy 0.54171 (0.54061)	Top-1 acc 63.281 (67.302)	Top-5 acc 83.594 (86.091)	lr 0.00134
Train [103][420/3239]	Time 0.228 (0.641)	Data Time 0.001 (0.092)	Loss 2.8211 (2.3599)	Entropy 0.54166 (0.54064)	Top-1 acc 53.906 (67.241)	Top-5 acc 79.688 (86.063)	lr 0.00134
Train [103][430/3239]	Time 0.221 (0.636)	Data Time 0.001 (0.090)	Loss 2.3241 (2.3597)	Entropy 0.54177 (0.54067)	Top-1 acc 66.406 (67.243)	Top-5 acc 85.547 (86.058)	lr 0.00134
Train [103][440/3239]	Time 0.354 (0.631)	Data Time 0.001 (0.088)	Loss 2.4978 (2.3615)	Entropy 0.54134 (0.54069)	Top-1 acc 64.062 (67.197)	Top-5 acc 83.203 (86.027)	lr 0.00134
Train [103][450/3239]	Time 0.231 (0.626)	Data Time 0.001 (0.086)	Loss 2.2075 (2.3621)	Entropy 0.54147 (0.54070)	Top-1 acc 71.875 (67.188)	Top-5 acc 89.453 (86.009)	lr 0.00134
Train [103][460/3239]	Time 0.234 (0.622)	Data Time 0.001 (0.085)	Loss 2.3051 (2.3609)	Entropy 0.54137 (0.54072)	Top-1 acc 68.750 (67.207)	Top-5 acc 85.938 (86.030)	lr 0.00134
Train [103][470/3239]	Time 0.237 (0.617)	Data Time 0.001 (0.083)	Loss 2.4591 (2.3602)	Entropy 0.54141 (0.54073)	Top-1 acc 66.016 (67.227)	Top-5 acc 84.766 (86.045)	lr 0.00134
Train [103][480/3239]	Time 0.243 (0.613)	Data Time 0.001 (0.081)	Loss 2.2290 (2.3598)	Entropy 0.54142 (0.54074)	Top-1 acc 69.531 (67.248)	Top-5 acc 88.281 (86.041)	lr 0.00134
Train [103][490/3239]	Time 0.231 (0.609)	Data Time 0.001 (0.080)	Loss 2.3772 (2.3604)	Entropy 0.54142 (0.54076)	Top-1 acc 64.844 (67.214)	Top-5 acc 87.109 (86.034)	lr 0.00134
Train [103][500/3239]	Time 0.230 (0.605)	Data Time 0.001 (0.078)	Loss 2.4057 (2.3599)	Entropy 0.54145 (0.54077)	Top-1 acc 65.625 (67.219)	Top-5 acc 83.984 (86.046)	lr 0.00134
Train [103][510/3239]	Time 0.228 (0.602)	Data Time 0.001 (0.076)	Loss 2.3570 (2.3607)	Entropy 0.54133 (0.54078)	Top-1 acc 68.750 (67.212)	Top-5 acc 85.156 (86.027)	lr 0.00134
Train [103][520/3239]	Time 0.228 (0.598)	Data Time 0.001 (0.075)	Loss 2.2922 (2.3613)	Entropy 0.54130 (0.54079)	Top-1 acc 68.359 (67.204)	Top-5 acc 86.328 (86.010)	lr 0.00134
Train [103][530/3239]	Time 0.335 (0.595)	Data Time 0.001 (0.074)	Loss 2.1329 (2.3615)	Entropy 0.54128 (0.54080)	Top-1 acc 73.047 (67.188)	Top-5 acc 89.062 (86.005)	lr 0.00134
Train [103][540/3239]	Time 0.233 (0.591)	Data Time 0.001 (0.072)	Loss 2.2909 (2.3618)	Entropy 0.54085 (0.54081)	Top-1 acc 68.750 (67.194)	Top-5 acc 87.500 (86.003)	lr 0.00134
Train [103][550/3239]	Time 0.218 (0.588)	Data Time 0.001 (0.071)	Loss 2.6466 (2.3606)	Entropy 0.54105 (0.54081)	Top-1 acc 59.375 (67.227)	Top-5 acc 78.516 (86.012)	lr 0.00134
Train [103][560/3239]	Time 0.237 (0.585)	Data Time 0.001 (0.070)	Loss 2.1987 (2.3600)	Entropy 0.54117 (0.54082)	Top-1 acc 70.703 (67.231)	Top-5 acc 88.281 (86.029)	lr 0.00134
Train [103][570/3239]	Time 0.227 (0.582)	Data Time 0.001 (0.069)	Loss 2.3533 (2.3597)	Entropy 0.54135 (0.54083)	Top-1 acc 69.531 (67.229)	Top-5 acc 87.891 (86.035)	lr 0.00134
Train [103][580/3239]	Time 0.310 (0.580)	Data Time 0.002 (0.067)	Loss 2.4088 (2.3612)	Entropy 0.54138 (0.54084)	Top-1 acc 65.234 (67.200)	Top-5 acc 85.547 (86.008)	lr 0.00134
Train [103][590/3239]	Time 0.280 (0.579)	Data Time 0.001 (0.066)	Loss 2.3751 (2.3622)	Entropy 0.54137 (0.54085)	Top-1 acc 73.047 (67.191)	Top-5 acc 86.328 (85.988)	lr 0.00134
Train [103][600/3239]	Time 0.323 (0.576)	Data Time 0.001 (0.065)	Loss 2.6059 (2.3628)	Entropy 0.54153 (0.54086)	Top-1 acc 64.453 (67.182)	Top-5 acc 81.250 (85.981)	lr 0.00134
Train [103][610/3239]	Time 0.228 (0.574)	Data Time 0.001 (0.064)	Loss 2.3513 (2.3626)	Entropy 0.54138 (0.54087)	Top-1 acc 67.578 (67.186)	Top-5 acc 85.547 (85.996)	lr 0.00133
Train [103][620/3239]	Time 0.269 (0.571)	Data Time 0.001 (0.063)	Loss 2.2875 (2.3629)	Entropy 0.54160 (0.54088)	Top-1 acc 70.312 (67.195)	Top-5 acc 85.547 (85.999)	lr 0.00133
Train [103][630/3239]	Time 0.221 (0.568)	Data Time 0.001 (0.062)	Loss 2.3795 (2.3630)	Entropy 0.54101 (0.54089)	Top-1 acc 67.188 (67.188)	Top-5 acc 88.281 (85.995)	lr 0.00133
Train [103][640/3239]	Time 0.226 (0.566)	Data Time 0.002 (0.061)	Loss 2.4130 (2.3636)	Entropy 0.54126 (0.54089)	Top-1 acc 63.672 (67.166)	Top-5 acc 87.891 (85.991)	lr 0.00133
Train [103][650/3239]	Time 0.233 (0.564)	Data Time 0.001 (0.060)	Loss 2.2934 (2.3631)	Entropy 0.54154 (0.54090)	Top-1 acc 67.969 (67.172)	Top-5 acc 87.109 (86.004)	lr 0.00133
Train [103][660/3239]	Time 0.228 (0.561)	Data Time 0.001 (0.059)	Loss 2.2192 (2.3627)	Entropy 0.54169 (0.54091)	Top-1 acc 70.312 (67.183)	Top-5 acc 89.062 (86.005)	lr 0.00133
Train [103][670/3239]	Time 0.234 (0.559)	Data Time 0.001 (0.059)	Loss 2.2843 (2.3621)	Entropy 0.54123 (0.54092)	Top-1 acc 70.312 (67.193)	Top-5 acc 87.891 (86.018)	lr 0.00133
Train [103][680/3239]	Time 0.226 (0.557)	Data Time 0.001 (0.058)	Loss 2.5048 (2.3623)	Entropy 0.54107 (0.54092)	Top-1 acc 66.406 (67.188)	Top-5 acc 83.203 (86.010)	lr 0.00133
Train [103][690/3239]	Time 0.330 (0.555)	Data Time 0.001 (0.057)	Loss 2.6087 (2.3627)	Entropy 0.54125 (0.54092)	Top-1 acc 57.422 (67.182)	Top-5 acc 84.375 (86.002)	lr 0.00133
Train [103][700/3239]	Time 0.240 (0.553)	Data Time 0.001 (0.056)	Loss 2.3277 (2.3632)	Entropy 0.54153 (0.54093)	Top-1 acc 66.016 (67.156)	Top-5 acc 85.547 (85.994)	lr 0.00133
Train [103][710/3239]	Time 0.240 (0.551)	Data Time 0.001 (0.055)	Loss 2.3304 (2.3646)	Entropy 0.54163 (0.54094)	Top-1 acc 67.188 (67.120)	Top-5 acc 83.594 (85.971)	lr 0.00133
Train [103][720/3239]	Time 0.237 (0.549)	Data Time 0.001 (0.055)	Loss 2.3858 (2.3646)	Entropy 0.54181 (0.54095)	Top-1 acc 67.188 (67.116)	Top-5 acc 87.500 (85.971)	lr 0.00133
Train [103][730/3239]	Time 0.226 (0.547)	Data Time 0.001 (0.054)	Loss 2.3938 (2.3649)	Entropy 0.54189 (0.54096)	Top-1 acc 66.016 (67.112)	Top-5 acc 83.984 (85.963)	lr 0.00133
Train [103][740/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.053)	Loss 2.2183 (2.3656)	Entropy 0.54179 (0.54097)	Top-1 acc 71.094 (67.089)	Top-5 acc 89.062 (85.950)	lr 0.00133
Train [103][750/3239]	Time 0.232 (0.543)	Data Time 0.001 (0.053)	Loss 2.3784 (2.3660)	Entropy 0.54207 (0.54098)	Top-1 acc 65.234 (67.076)	Top-5 acc 85.547 (85.957)	lr 0.00133
Train [103][760/3239]	Time 0.328 (0.541)	Data Time 0.001 (0.052)	Loss 2.7189 (2.3665)	Entropy 0.54217 (0.54100)	Top-1 acc 61.719 (67.075)	Top-5 acc 80.859 (85.945)	lr 0.00133
Train [103][770/3239]	Time 0.226 (0.539)	Data Time 0.001 (0.051)	Loss 2.5442 (2.3672)	Entropy 0.54250 (0.54102)	Top-1 acc 62.109 (67.053)	Top-5 acc 83.594 (85.932)	lr 0.00133
Train [103][780/3239]	Time 0.231 (0.538)	Data Time 0.001 (0.051)	Loss 2.6323 (2.3667)	Entropy 0.54227 (0.54103)	Top-1 acc 62.109 (67.066)	Top-5 acc 80.078 (85.938)	lr 0.00133
Train [103][790/3239]	Time 0.229 (0.536)	Data Time 0.001 (0.050)	Loss 2.3659 (2.3666)	Entropy 0.54260 (0.54105)	Top-1 acc 67.969 (67.066)	Top-5 acc 87.109 (85.938)	lr 0.00133
Train [103][800/3239]	Time 0.235 (0.535)	Data Time 0.001 (0.049)	Loss 2.2324 (2.3666)	Entropy 0.54278 (0.54107)	Top-1 acc 72.656 (67.064)	Top-5 acc 87.500 (85.939)	lr 0.00133
Train [103][810/3239]	Time 0.237 (0.533)	Data Time 0.001 (0.049)	Loss 2.3142 (2.3670)	Entropy 0.54257 (0.54109)	Top-1 acc 68.359 (67.055)	Top-5 acc 86.719 (85.929)	lr 0.00133
Train [103][820/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.048)	Loss 2.4074 (2.3667)	Entropy 0.54221 (0.54111)	Top-1 acc 64.453 (67.065)	Top-5 acc 83.984 (85.937)	lr 0.00133
Train [103][830/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.048)	Loss 2.3593 (2.3667)	Entropy 0.54180 (0.54112)	Top-1 acc 68.750 (67.063)	Top-5 acc 85.156 (85.941)	lr 0.00132
Train [103][840/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.047)	Loss 2.3105 (2.3667)	Entropy 0.54177 (0.54112)	Top-1 acc 65.625 (67.072)	Top-5 acc 87.891 (85.940)	lr 0.00132
Train [103][850/3239]	Time 0.229 (0.527)	Data Time 0.001 (0.047)	Loss 2.2498 (2.3661)	Entropy 0.54189 (0.54113)	Top-1 acc 69.922 (67.090)	Top-5 acc 87.500 (85.949)	lr 0.00132
Train [103][860/3239]	Time 0.237 (0.526)	Data Time 0.001 (0.046)	Loss 2.4035 (2.3665)	Entropy 0.54172 (0.54114)	Top-1 acc 64.453 (67.080)	Top-5 acc 83.594 (85.945)	lr 0.00132
Train [103][870/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.045)	Loss 2.6078 (2.3668)	Entropy 0.54184 (0.54115)	Top-1 acc 64.062 (67.084)	Top-5 acc 82.031 (85.938)	lr 0.00132
Train [103][880/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.045)	Loss 2.6007 (2.3666)	Entropy 0.54195 (0.54116)	Top-1 acc 60.547 (67.089)	Top-5 acc 83.594 (85.945)	lr 0.00132
Train [103][890/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.044)	Loss 2.2432 (2.3665)	Entropy 0.54213 (0.54117)	Top-1 acc 69.922 (67.095)	Top-5 acc 87.500 (85.945)	lr 0.00132
Train [103][900/3239]	Time 0.333 (0.521)	Data Time 0.003 (0.044)	Loss 2.7737 (2.3674)	Entropy 0.54209 (0.54118)	Top-1 acc 57.812 (67.083)	Top-5 acc 79.688 (85.927)	lr 0.00132
Train [103][910/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.044)	Loss 2.2303 (2.3668)	Entropy 0.54226 (0.54119)	Top-1 acc 69.922 (67.107)	Top-5 acc 89.062 (85.937)	lr 0.00132
Train [103][920/3239]	Time 0.565 (0.577)	Data Time 0.037 (0.043)	Loss 2.4988 (2.3677)	Entropy 0.54262 (0.54120)	Top-1 acc 62.500 (67.084)	Top-5 acc 84.375 (85.924)	lr 0.00132
Train [103][930/3239]	Time 0.239 (0.577)	Data Time 0.002 (0.043)	Loss 2.2569 (2.3669)	Entropy 0.54294 (0.54122)	Top-1 acc 68.750 (67.101)	Top-5 acc 89.844 (85.939)	lr 0.00132
Train [103][940/3239]	Time 0.231 (0.575)	Data Time 0.001 (0.042)	Loss 2.3631 (2.3673)	Entropy 0.54296 (0.54123)	Top-1 acc 68.750 (67.078)	Top-5 acc 84.375 (85.938)	lr 0.00132
Train [103][950/3239]	Time 0.236 (0.573)	Data Time 0.001 (0.042)	Loss 2.5029 (2.3681)	Entropy 0.54274 (0.54125)	Top-1 acc 65.625 (67.060)	Top-5 acc 83.594 (85.929)	lr 0.00132
Train [103][960/3239]	Time 0.233 (0.572)	Data Time 0.001 (0.041)	Loss 2.1441 (2.3679)	Entropy 0.54295 (0.54127)	Top-1 acc 70.312 (67.067)	Top-5 acc 90.234 (85.934)	lr 0.00132
Train [103][970/3239]	Time 0.235 (0.570)	Data Time 0.001 (0.041)	Loss 2.3688 (2.3674)	Entropy 0.54287 (0.54128)	Top-1 acc 68.750 (67.078)	Top-5 acc 85.547 (85.942)	lr 0.00132
Train [103][980/3239]	Time 0.243 (0.568)	Data Time 0.001 (0.041)	Loss 2.4147 (2.3677)	Entropy 0.54257 (0.54130)	Top-1 acc 64.844 (67.070)	Top-5 acc 87.500 (85.950)	lr 0.00132
Train [103][990/3239]	Time 0.226 (0.567)	Data Time 0.001 (0.040)	Loss 2.4429 (2.3678)	Entropy 0.54267 (0.54131)	Top-1 acc 64.453 (67.057)	Top-5 acc 85.156 (85.956)	lr 0.00132
Train [103][1000/3239]	Time 0.228 (0.566)	Data Time 0.001 (0.040)	Loss 2.2549 (2.3668)	Entropy 0.54271 (0.54133)	Top-1 acc 69.922 (67.080)	Top-5 acc 87.500 (85.968)	lr 0.00132
Train [103][1010/3239]	Time 0.234 (0.564)	Data Time 0.001 (0.039)	Loss 2.3741 (2.3669)	Entropy 0.54286 (0.54134)	Top-1 acc 64.844 (67.074)	Top-5 acc 83.984 (85.961)	lr 0.00132
Train [103][1020/3239]	Time 0.235 (0.563)	Data Time 0.001 (0.039)	Loss 2.3537 (2.3671)	Entropy 0.54306 (0.54136)	Top-1 acc 67.578 (67.072)	Top-5 acc 84.375 (85.958)	lr 0.00132
Train [103][1030/3239]	Time 0.228 (0.561)	Data Time 0.001 (0.039)	Loss 2.3075 (2.3667)	Entropy 0.54252 (0.54137)	Top-1 acc 70.312 (67.089)	Top-5 acc 87.500 (85.964)	lr 0.00132
Train [103][1040/3239]	Time 0.260 (0.560)	Data Time 0.001 (0.038)	Loss 2.4397 (2.3671)	Entropy 0.54264 (0.54138)	Top-1 acc 63.281 (67.076)	Top-5 acc 82.422 (85.961)	lr 0.00132
Train [103][1050/3239]	Time 0.224 (0.559)	Data Time 0.001 (0.038)	Loss 2.4260 (2.3666)	Entropy 0.54258 (0.54139)	Top-1 acc 68.750 (67.090)	Top-5 acc 84.766 (85.970)	lr 0.00131
Train [103][1060/3239]	Time 0.223 (0.557)	Data Time 0.001 (0.038)	Loss 2.1890 (2.3672)	Entropy 0.54214 (0.54140)	Top-1 acc 71.484 (67.078)	Top-5 acc 87.109 (85.958)	lr 0.00131
Train [103][1070/3239]	Time 0.227 (0.556)	Data Time 0.001 (0.037)	Loss 2.3684 (2.3671)	Entropy 0.54208 (0.54141)	Top-1 acc 68.750 (67.080)	Top-5 acc 87.109 (85.959)	lr 0.00131
Train [103][1080/3239]	Time 0.354 (0.555)	Data Time 0.001 (0.037)	Loss 2.2407 (2.3666)	Entropy 0.54241 (0.54142)	Top-1 acc 70.703 (67.091)	Top-5 acc 89.062 (85.966)	lr 0.00131
Train [103][1090/3239]	Time 0.227 (0.554)	Data Time 0.001 (0.037)	Loss 2.3599 (2.3671)	Entropy 0.54237 (0.54143)	Top-1 acc 66.016 (67.079)	Top-5 acc 86.719 (85.958)	lr 0.00131
Train [103][1100/3239]	Time 0.274 (0.553)	Data Time 0.001 (0.036)	Loss 2.3570 (2.3667)	Entropy 0.54238 (0.54144)	Top-1 acc 69.922 (67.091)	Top-5 acc 87.891 (85.972)	lr 0.00131
Train [103][1110/3239]	Time 0.264 (0.552)	Data Time 0.001 (0.036)	Loss 2.5065 (2.3670)	Entropy 0.54219 (0.54144)	Top-1 acc 65.625 (67.077)	Top-5 acc 82.031 (85.962)	lr 0.00131
Train [103][1120/3239]	Time 0.232 (0.551)	Data Time 0.001 (0.036)	Loss 2.2653 (2.3666)	Entropy 0.54212 (0.54145)	Top-1 acc 69.531 (67.091)	Top-5 acc 89.453 (85.973)	lr 0.00131
Train [103][1130/3239]	Time 0.223 (0.550)	Data Time 0.001 (0.035)	Loss 2.3667 (2.3667)	Entropy 0.54245 (0.54146)	Top-1 acc 69.141 (67.096)	Top-5 acc 85.938 (85.973)	lr 0.00131
Train [103][1140/3239]	Time 0.234 (0.549)	Data Time 0.001 (0.035)	Loss 2.0664 (2.3661)	Entropy 0.54243 (0.54146)	Top-1 acc 74.219 (67.111)	Top-5 acc 92.578 (85.991)	lr 0.00131
Train [103][1150/3239]	Time 0.366 (0.548)	Data Time 0.001 (0.035)	Loss 2.2808 (2.3660)	Entropy 0.54257 (0.54147)	Top-1 acc 65.625 (67.112)	Top-5 acc 87.891 (85.992)	lr 0.00131
Train [103][1160/3239]	Time 0.228 (0.547)	Data Time 0.001 (0.035)	Loss 2.5724 (2.3658)	Entropy 0.54195 (0.54148)	Top-1 acc 62.500 (67.113)	Top-5 acc 83.203 (86.000)	lr 0.00131
Train [103][1170/3239]	Time 0.227 (0.546)	Data Time 0.001 (0.034)	Loss 2.6671 (2.3660)	Entropy 0.54206 (0.54149)	Top-1 acc 61.328 (67.107)	Top-5 acc 81.641 (86.002)	lr 0.00131
Train [103][1180/3239]	Time 0.221 (0.545)	Data Time 0.001 (0.034)	Loss 2.5279 (2.3668)	Entropy 0.54190 (0.54149)	Top-1 acc 60.547 (67.087)	Top-5 acc 84.766 (85.994)	lr 0.00131
Train [103][1190/3239]	Time 0.261 (0.543)	Data Time 0.001 (0.034)	Loss 2.3022 (2.3667)	Entropy 0.54207 (0.54149)	Top-1 acc 65.234 (67.081)	Top-5 acc 89.062 (85.997)	lr 0.00131
Train [103][1200/3239]	Time 0.232 (0.542)	Data Time 0.001 (0.034)	Loss 2.7262 (2.3671)	Entropy 0.54192 (0.54150)	Top-1 acc 58.203 (67.067)	Top-5 acc 79.297 (85.989)	lr 0.00131
Train [103][1210/3239]	Time 0.219 (0.541)	Data Time 0.001 (0.033)	Loss 2.2024 (2.3671)	Entropy 0.54228 (0.54150)	Top-1 acc 69.531 (67.068)	Top-5 acc 90.625 (85.993)	lr 0.00131
Train [103][1220/3239]	Time 0.230 (0.540)	Data Time 0.001 (0.033)	Loss 2.1504 (2.3676)	Entropy 0.54235 (0.54151)	Top-1 acc 73.828 (67.052)	Top-5 acc 89.062 (85.980)	lr 0.00131
Train [103][1230/3239]	Time 0.283 (0.540)	Data Time 0.001 (0.033)	Loss 2.2300 (2.3669)	Entropy 0.54223 (0.54152)	Top-1 acc 68.359 (67.067)	Top-5 acc 88.672 (85.991)	lr 0.00131
Train [103][1240/3239]	Time 0.455 (0.540)	Data Time 0.002 (0.033)	Loss 2.3944 (2.3665)	Entropy 0.54221 (0.54152)	Top-1 acc 63.281 (67.072)	Top-5 acc 87.109 (85.997)	lr 0.00131
Train [103][1250/3239]	Time 0.244 (0.540)	Data Time 0.002 (0.032)	Loss 2.2671 (2.3660)	Entropy 0.54178 (0.54152)	Top-1 acc 73.828 (67.089)	Top-5 acc 83.984 (86.001)	lr 0.00131
Train [103][1260/3239]	Time 0.228 (0.539)	Data Time 0.001 (0.032)	Loss 2.3509 (2.3658)	Entropy 0.54187 (0.54153)	Top-1 acc 64.453 (67.084)	Top-5 acc 89.453 (86.009)	lr 0.00131
Train [103][1270/3239]	Time 0.228 (0.538)	Data Time 0.001 (0.032)	Loss 2.3862 (2.3660)	Entropy 0.54188 (0.54153)	Top-1 acc 65.625 (67.080)	Top-5 acc 86.719 (86.005)	lr 0.00130
Train [103][1280/3239]	Time 0.226 (0.537)	Data Time 0.001 (0.032)	Loss 2.3039 (2.3658)	Entropy 0.54185 (0.54153)	Top-1 acc 69.141 (67.087)	Top-5 acc 86.328 (86.000)	lr 0.00130
Train [103][1290/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.031)	Loss 2.6475 (2.3668)	Entropy 0.54203 (0.54154)	Top-1 acc 59.375 (67.060)	Top-5 acc 80.469 (85.979)	lr 0.00130
Train [103][1300/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.031)	Loss 2.2286 (2.3672)	Entropy 0.54203 (0.54154)	Top-1 acc 71.875 (67.058)	Top-5 acc 89.062 (85.974)	lr 0.00130
Train [103][1310/3239]	Time 0.326 (0.534)	Data Time 0.001 (0.031)	Loss 2.5640 (2.3674)	Entropy 0.54208 (0.54154)	Top-1 acc 62.500 (67.053)	Top-5 acc 80.859 (85.965)	lr 0.00130
Train [103][1320/3239]	Time 0.222 (0.533)	Data Time 0.001 (0.031)	Loss 2.2304 (2.3679)	Entropy 0.54183 (0.54154)	Top-1 acc 68.359 (67.034)	Top-5 acc 86.328 (85.957)	lr 0.00130
Train [103][1330/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.030)	Loss 2.2248 (2.3683)	Entropy 0.54224 (0.54155)	Top-1 acc 71.875 (67.028)	Top-5 acc 88.672 (85.953)	lr 0.00130
Train [103][1340/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.030)	Loss 2.3976 (2.3680)	Entropy 0.54232 (0.54155)	Top-1 acc 66.406 (67.039)	Top-5 acc 85.547 (85.962)	lr 0.00130
Train [103][1350/3239]	Time 0.220 (0.530)	Data Time 0.001 (0.030)	Loss 2.4008 (2.3681)	Entropy 0.54206 (0.54156)	Top-1 acc 66.406 (67.045)	Top-5 acc 85.938 (85.963)	lr 0.00130
Train [103][1360/3239]	Time 0.223 (0.529)	Data Time 0.001 (0.030)	Loss 2.5877 (2.3683)	Entropy 0.54195 (0.54156)	Top-1 acc 62.891 (67.045)	Top-5 acc 80.859 (85.952)	lr 0.00130
Train [103][1370/3239]	Time 0.223 (0.528)	Data Time 0.001 (0.030)	Loss 2.3364 (2.3683)	Entropy 0.54230 (0.54156)	Top-1 acc 66.797 (67.046)	Top-5 acc 88.672 (85.952)	lr 0.00130
Train [103][1380/3239]	Time 0.220 (0.528)	Data Time 0.001 (0.029)	Loss 2.0784 (2.3679)	Entropy 0.54195 (0.54157)	Top-1 acc 72.656 (67.058)	Top-5 acc 89.844 (85.959)	lr 0.00130
Train [103][1390/3239]	Time 0.247 (0.527)	Data Time 0.002 (0.029)	Loss 2.3592 (2.3682)	Entropy 0.54187 (0.54157)	Top-1 acc 66.016 (67.048)	Top-5 acc 85.156 (85.952)	lr 0.00130
Train [103][1400/3239]	Time 0.265 (0.526)	Data Time 0.001 (0.029)	Loss 2.2375 (2.3688)	Entropy 0.54202 (0.54157)	Top-1 acc 67.578 (67.034)	Top-5 acc 87.500 (85.939)	lr 0.00130
Train [103][1410/3239]	Time 0.226 (0.525)	Data Time 0.001 (0.029)	Loss 2.4178 (2.3694)	Entropy 0.54216 (0.54158)	Top-1 acc 66.797 (67.015)	Top-5 acc 83.984 (85.929)	lr 0.00130
Train [103][1420/3239]	Time 0.215 (0.524)	Data Time 0.001 (0.029)	Loss 2.4818 (2.3692)	Entropy 0.54221 (0.54158)	Top-1 acc 64.062 (67.028)	Top-5 acc 82.812 (85.931)	lr 0.00130
Train [103][1430/3239]	Time 0.230 (0.524)	Data Time 0.001 (0.028)	Loss 2.3150 (2.3690)	Entropy 0.54233 (0.54159)	Top-1 acc 66.797 (67.031)	Top-5 acc 87.891 (85.941)	lr 0.00130
Train [103][1440/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.028)	Loss 2.3967 (2.3691)	Entropy 0.54225 (0.54159)	Top-1 acc 69.141 (67.032)	Top-5 acc 86.328 (85.941)	lr 0.00130
Train [103][1450/3239]	Time 0.234 (0.522)	Data Time 0.001 (0.028)	Loss 2.3112 (2.3689)	Entropy 0.54217 (0.54160)	Top-1 acc 68.359 (67.037)	Top-5 acc 87.891 (85.945)	lr 0.00130
Train [103][1460/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.028)	Loss 2.3699 (2.3689)	Entropy 0.54152 (0.54160)	Top-1 acc 68.359 (67.038)	Top-5 acc 85.547 (85.945)	lr 0.00130
Train [103][1470/3239]	Time 0.338 (0.520)	Data Time 0.001 (0.028)	Loss 2.2769 (2.3690)	Entropy 0.54160 (0.54160)	Top-1 acc 71.875 (67.035)	Top-5 acc 88.281 (85.948)	lr 0.00130
Train [103][1480/3239]	Time 0.223 (0.520)	Data Time 0.001 (0.027)	Loss 2.2193 (2.3689)	Entropy 0.54131 (0.54160)	Top-1 acc 68.750 (67.040)	Top-5 acc 89.062 (85.951)	lr 0.00130
Train [103][1490/3239]	Time 0.229 (0.519)	Data Time 0.001 (0.027)	Loss 2.4141 (2.3688)	Entropy 0.54096 (0.54159)	Top-1 acc 67.578 (67.043)	Top-5 acc 84.375 (85.949)	lr 0.00129
Train [103][1500/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.027)	Loss 2.4755 (2.3691)	Entropy 0.54081 (0.54159)	Top-1 acc 64.844 (67.040)	Top-5 acc 84.375 (85.945)	lr 0.00129
Train [103][1510/3239]	Time 0.229 (0.518)	Data Time 0.001 (0.027)	Loss 2.3204 (2.3694)	Entropy 0.54051 (0.54158)	Top-1 acc 66.406 (67.030)	Top-5 acc 85.938 (85.938)	lr 0.00129
Train [103][1520/3239]	Time 0.227 (0.517)	Data Time 0.001 (0.027)	Loss 2.2751 (2.3693)	Entropy 0.54061 (0.54158)	Top-1 acc 70.312 (67.039)	Top-5 acc 85.547 (85.940)	lr 0.00129
Train [103][1530/3239]	Time 0.222 (0.516)	Data Time 0.001 (0.027)	Loss 2.4056 (2.3695)	Entropy 0.54073 (0.54157)	Top-1 acc 62.891 (67.031)	Top-5 acc 85.156 (85.933)	lr 0.00129
Train [103][1540/3239]	Time 0.407 (0.516)	Data Time 0.001 (0.026)	Loss 2.1859 (2.3695)	Entropy 0.54079 (0.54156)	Top-1 acc 73.828 (67.035)	Top-5 acc 88.672 (85.931)	lr 0.00129
Train [103][1550/3239]	Time 0.229 (0.515)	Data Time 0.001 (0.026)	Loss 2.2721 (2.3692)	Entropy 0.54101 (0.54156)	Top-1 acc 69.922 (67.042)	Top-5 acc 86.719 (85.935)	lr 0.00129
Train [103][1560/3239]	Time 0.234 (0.514)	Data Time 0.001 (0.026)	Loss 2.2749 (2.3689)	Entropy 0.54077 (0.54156)	Top-1 acc 67.969 (67.046)	Top-5 acc 87.500 (85.942)	lr 0.00129
Train [103][1570/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.026)	Loss 2.2221 (2.3693)	Entropy 0.54080 (0.54155)	Top-1 acc 71.094 (67.041)	Top-5 acc 90.234 (85.937)	lr 0.00129
Train [103][1580/3239]	Time 0.330 (0.547)	Data Time 0.002 (0.026)	Loss 2.2875 (2.3689)	Entropy 0.54082 (0.54155)	Top-1 acc 70.703 (67.051)	Top-5 acc 87.891 (85.941)	lr 0.00129
Train [103][1590/3239]	Time 0.236 (0.546)	Data Time 0.002 (0.026)	Loss 2.2885 (2.3688)	Entropy 0.54095 (0.54154)	Top-1 acc 70.703 (67.058)	Top-5 acc 89.453 (85.940)	lr 0.00129
Train [103][1600/3239]	Time 0.240 (0.545)	Data Time 0.001 (0.026)	Loss 2.3062 (2.3691)	Entropy 0.54106 (0.54154)	Top-1 acc 69.141 (67.051)	Top-5 acc 84.766 (85.938)	lr 0.00129
Train [103][1610/3239]	Time 0.237 (0.544)	Data Time 0.001 (0.025)	Loss 2.5230 (2.3687)	Entropy 0.54126 (0.54154)	Top-1 acc 63.281 (67.064)	Top-5 acc 82.812 (85.946)	lr 0.00129
Train [103][1620/3239]	Time 0.226 (0.544)	Data Time 0.001 (0.025)	Loss 2.4610 (2.3686)	Entropy 0.54102 (0.54153)	Top-1 acc 63.281 (67.062)	Top-5 acc 83.984 (85.948)	lr 0.00129
Train [103][1630/3239]	Time 0.318 (0.543)	Data Time 0.001 (0.025)	Loss 2.4163 (2.3688)	Entropy 0.54148 (0.54153)	Top-1 acc 65.234 (67.056)	Top-5 acc 85.938 (85.945)	lr 0.00129
Train [103][1640/3239]	Time 0.236 (0.542)	Data Time 0.001 (0.025)	Loss 2.3374 (2.3684)	Entropy 0.54171 (0.54153)	Top-1 acc 67.188 (67.067)	Top-5 acc 87.109 (85.953)	lr 0.00129
Train [103][1650/3239]	Time 0.234 (0.542)	Data Time 0.001 (0.025)	Loss 2.4565 (2.3682)	Entropy 0.54168 (0.54153)	Top-1 acc 63.281 (67.071)	Top-5 acc 83.203 (85.956)	lr 0.00129
Train [103][1660/3239]	Time 0.228 (0.541)	Data Time 0.001 (0.025)	Loss 2.2740 (2.3681)	Entropy 0.54134 (0.54153)	Top-1 acc 70.703 (67.073)	Top-5 acc 85.547 (85.957)	lr 0.00129
Train [103][1670/3239]	Time 0.277 (0.540)	Data Time 0.002 (0.025)	Loss 2.2367 (2.3681)	Entropy 0.54164 (0.54153)	Top-1 acc 70.703 (67.075)	Top-5 acc 88.672 (85.958)	lr 0.00129
Train [103][1680/3239]	Time 0.235 (0.539)	Data Time 0.001 (0.024)	Loss 2.3384 (2.3681)	Entropy 0.54162 (0.54153)	Top-1 acc 65.234 (67.071)	Top-5 acc 88.281 (85.957)	lr 0.00129
Train [103][1690/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.024)	Loss 2.3578 (2.3680)	Entropy 0.54192 (0.54153)	Top-1 acc 67.188 (67.079)	Top-5 acc 85.938 (85.953)	lr 0.00129
Train [103][1700/3239]	Time 0.326 (0.538)	Data Time 0.001 (0.024)	Loss 2.3081 (2.3680)	Entropy 0.54172 (0.54154)	Top-1 acc 67.969 (67.083)	Top-5 acc 88.672 (85.956)	lr 0.00129
Train [103][1710/3239]	Time 0.281 (0.538)	Data Time 0.002 (0.024)	Loss 2.2255 (2.3679)	Entropy 0.54163 (0.54154)	Top-1 acc 70.703 (67.084)	Top-5 acc 87.500 (85.954)	lr 0.00129
Train [103][1720/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.024)	Loss 2.3405 (2.3678)	Entropy 0.54167 (0.54154)	Top-1 acc 67.578 (67.086)	Top-5 acc 86.328 (85.953)	lr 0.00128
Train [103][1730/3239]	Time 0.249 (0.537)	Data Time 0.001 (0.024)	Loss 2.2607 (2.3677)	Entropy 0.54144 (0.54154)	Top-1 acc 68.750 (67.077)	Top-5 acc 87.109 (85.953)	lr 0.00128
Train [103][1740/3239]	Time 0.218 (0.536)	Data Time 0.001 (0.024)	Loss 2.5597 (2.3675)	Entropy 0.54125 (0.54154)	Top-1 acc 59.766 (67.075)	Top-5 acc 82.422 (85.954)	lr 0.00128
Train [103][1750/3239]	Time 0.261 (0.535)	Data Time 0.001 (0.023)	Loss 2.3112 (2.3674)	Entropy 0.54086 (0.54154)	Top-1 acc 66.797 (67.079)	Top-5 acc 88.672 (85.958)	lr 0.00128
Train [103][1760/3239]	Time 0.228 (0.535)	Data Time 0.001 (0.023)	Loss 2.2279 (2.3672)	Entropy 0.54097 (0.54153)	Top-1 acc 71.094 (67.086)	Top-5 acc 90.625 (85.959)	lr 0.00128
Train [103][1770/3239]	Time 0.235 (0.534)	Data Time 0.001 (0.023)	Loss 2.4523 (2.3672)	Entropy 0.54067 (0.54153)	Top-1 acc 66.797 (67.084)	Top-5 acc 85.938 (85.956)	lr 0.00128
Train [103][1780/3239]	Time 0.222 (0.533)	Data Time 0.001 (0.023)	Loss 2.3907 (2.3673)	Entropy 0.54073 (0.54152)	Top-1 acc 67.188 (67.084)	Top-5 acc 85.156 (85.954)	lr 0.00128
Train [103][1790/3239]	Time 0.343 (0.533)	Data Time 0.001 (0.023)	Loss 2.3032 (2.3673)	Entropy 0.54082 (0.54152)	Top-1 acc 67.188 (67.085)	Top-5 acc 86.328 (85.958)	lr 0.00128
Train [103][1800/3239]	Time 0.226 (0.532)	Data Time 0.001 (0.023)	Loss 2.3202 (2.3679)	Entropy 0.54077 (0.54152)	Top-1 acc 67.969 (67.071)	Top-5 acc 86.719 (85.947)	lr 0.00128
Train [103][1810/3239]	Time 0.224 (0.532)	Data Time 0.001 (0.023)	Loss 2.2648 (2.3679)	Entropy 0.54102 (0.54151)	Top-1 acc 70.703 (67.067)	Top-5 acc 90.625 (85.947)	lr 0.00128
Train [103][1820/3239]	Time 0.233 (0.531)	Data Time 0.001 (0.023)	Loss 2.4246 (2.3678)	Entropy 0.54086 (0.54151)	Top-1 acc 64.062 (67.064)	Top-5 acc 86.328 (85.951)	lr 0.00128
Train [103][1830/3239]	Time 0.224 (0.530)	Data Time 0.001 (0.023)	Loss 2.4084 (2.3677)	Entropy 0.54096 (0.54150)	Top-1 acc 67.578 (67.068)	Top-5 acc 83.984 (85.954)	lr 0.00128
Train [103][1840/3239]	Time 0.226 (0.530)	Data Time 0.001 (0.022)	Loss 2.2952 (2.3677)	Entropy 0.54063 (0.54150)	Top-1 acc 71.484 (67.072)	Top-5 acc 86.328 (85.957)	lr 0.00128
Train [103][1850/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.022)	Loss 2.3318 (2.3672)	Entropy 0.54040 (0.54150)	Top-1 acc 68.359 (67.088)	Top-5 acc 87.891 (85.965)	lr 0.00128
Train [103][1860/3239]	Time 0.383 (0.529)	Data Time 0.001 (0.022)	Loss 2.2243 (2.3674)	Entropy 0.54043 (0.54149)	Top-1 acc 67.188 (67.082)	Top-5 acc 89.844 (85.962)	lr 0.00128
Train [103][1870/3239]	Time 0.225 (0.528)	Data Time 0.001 (0.022)	Loss 2.2484 (2.3674)	Entropy 0.54013 (0.54148)	Top-1 acc 71.875 (67.085)	Top-5 acc 86.328 (85.959)	lr 0.00128
Train [103][1880/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.022)	Loss 2.4810 (2.3672)	Entropy 0.54012 (0.54148)	Top-1 acc 63.672 (67.088)	Top-5 acc 84.766 (85.961)	lr 0.00128
Train [103][1890/3239]	Time 0.222 (0.527)	Data Time 0.001 (0.022)	Loss 2.6231 (2.3673)	Entropy 0.54013 (0.54147)	Top-1 acc 60.156 (67.088)	Top-5 acc 79.688 (85.959)	lr 0.00128
Train [103][1900/3239]	Time 0.228 (0.526)	Data Time 0.001 (0.022)	Loss 2.2911 (2.3672)	Entropy 0.54007 (0.54146)	Top-1 acc 67.969 (67.089)	Top-5 acc 86.328 (85.962)	lr 0.00128
Train [103][1910/3239]	Time 0.226 (0.525)	Data Time 0.001 (0.022)	Loss 2.4944 (2.3672)	Entropy 0.54020 (0.54145)	Top-1 acc 64.453 (67.088)	Top-5 acc 82.422 (85.963)	lr 0.00128
Train [103][1920/3239]	Time 0.223 (0.525)	Data Time 0.001 (0.022)	Loss 2.6093 (2.3675)	Entropy 0.54015 (0.54145)	Top-1 acc 63.281 (67.077)	Top-5 acc 82.422 (85.955)	lr 0.00128
Train [103][1930/3239]	Time 0.231 (0.524)	Data Time 0.001 (0.021)	Loss 2.2154 (2.3672)	Entropy 0.54008 (0.54144)	Top-1 acc 71.484 (67.085)	Top-5 acc 87.891 (85.960)	lr 0.00128
Train [103][1940/3239]	Time 0.222 (0.524)	Data Time 0.001 (0.021)	Loss 2.5342 (2.3672)	Entropy 0.54009 (0.54143)	Top-1 acc 62.891 (67.085)	Top-5 acc 83.203 (85.959)	lr 0.00127
Train [103][1950/3239]	Time 0.252 (0.523)	Data Time 0.001 (0.021)	Loss 2.3702 (2.3668)	Entropy 0.53977 (0.54143)	Top-1 acc 67.578 (67.095)	Top-5 acc 87.891 (85.967)	lr 0.00127
Train [103][1960/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.021)	Loss 2.3626 (2.3669)	Entropy 0.53983 (0.54142)	Top-1 acc 65.234 (67.096)	Top-5 acc 86.719 (85.965)	lr 0.00127
Train [103][1970/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.021)	Loss 2.3137 (2.3671)	Entropy 0.54000 (0.54141)	Top-1 acc 68.359 (67.091)	Top-5 acc 86.719 (85.962)	lr 0.00127
Train [103][1980/3239]	Time 0.242 (0.521)	Data Time 0.001 (0.021)	Loss 2.4086 (2.3671)	Entropy 0.53983 (0.54140)	Top-1 acc 64.062 (67.088)	Top-5 acc 83.203 (85.965)	lr 0.00127
Train [103][1990/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.021)	Loss 2.5484 (2.3669)	Entropy 0.53984 (0.54140)	Top-1 acc 64.062 (67.090)	Top-5 acc 82.422 (85.971)	lr 0.00127
Train [103][2000/3239]	Time 0.245 (0.520)	Data Time 0.001 (0.021)	Loss 2.1178 (2.3667)	Entropy 0.54005 (0.54139)	Top-1 acc 75.000 (67.098)	Top-5 acc 89.844 (85.970)	lr 0.00127
Train [103][2010/3239]	Time 0.228 (0.520)	Data Time 0.001 (0.021)	Loss 2.4931 (2.3669)	Entropy 0.53963 (0.54138)	Top-1 acc 63.672 (67.095)	Top-5 acc 83.594 (85.966)	lr 0.00127
Train [103][2020/3239]	Time 0.365 (0.519)	Data Time 0.001 (0.021)	Loss 2.2135 (2.3668)	Entropy 0.53936 (0.54137)	Top-1 acc 69.531 (67.100)	Top-5 acc 87.500 (85.967)	lr 0.00127
Train [103][2030/3239]	Time 0.314 (0.519)	Data Time 0.002 (0.020)	Loss 2.3458 (2.3670)	Entropy 0.53943 (0.54136)	Top-1 acc 68.359 (67.095)	Top-5 acc 83.984 (85.962)	lr 0.00127
Train [103][2040/3239]	Time 0.232 (0.519)	Data Time 0.001 (0.020)	Loss 2.4163 (2.3670)	Entropy 0.53926 (0.54135)	Top-1 acc 67.188 (67.097)	Top-5 acc 83.594 (85.959)	lr 0.00127
Train [103][2050/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.020)	Loss 2.3237 (2.3668)	Entropy 0.53941 (0.54134)	Top-1 acc 67.188 (67.104)	Top-5 acc 87.891 (85.960)	lr 0.00127
Train [103][2060/3239]	Time 0.217 (0.518)	Data Time 0.001 (0.020)	Loss 2.3501 (2.3668)	Entropy 0.53967 (0.54133)	Top-1 acc 64.453 (67.103)	Top-5 acc 85.156 (85.963)	lr 0.00127
Train [103][2070/3239]	Time 0.219 (0.517)	Data Time 0.001 (0.020)	Loss 2.3135 (2.3666)	Entropy 0.53971 (0.54132)	Top-1 acc 68.750 (67.105)	Top-5 acc 85.938 (85.966)	lr 0.00127
Train [103][2080/3239]	Time 0.227 (0.517)	Data Time 0.001 (0.020)	Loss 2.3136 (2.3662)	Entropy 0.53962 (0.54132)	Top-1 acc 71.875 (67.117)	Top-5 acc 86.328 (85.970)	lr 0.00127
Train [103][2090/3239]	Time 0.319 (0.516)	Data Time 0.001 (0.020)	Loss 2.5787 (2.3664)	Entropy 0.53949 (0.54131)	Top-1 acc 63.281 (67.116)	Top-5 acc 82.422 (85.966)	lr 0.00127
Train [103][2100/3239]	Time 0.228 (0.516)	Data Time 0.001 (0.020)	Loss 2.3937 (2.3663)	Entropy 0.53939 (0.54130)	Top-1 acc 65.625 (67.114)	Top-5 acc 86.719 (85.964)	lr 0.00127
Train [103][2110/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.020)	Loss 2.4883 (2.3662)	Entropy 0.53930 (0.54129)	Top-1 acc 66.406 (67.111)	Top-5 acc 83.594 (85.969)	lr 0.00127
Train [103][2120/3239]	Time 0.231 (0.515)	Data Time 0.001 (0.020)	Loss 2.2310 (2.3663)	Entropy 0.53891 (0.54128)	Top-1 acc 71.484 (67.105)	Top-5 acc 88.672 (85.968)	lr 0.00127
Train [103][2130/3239]	Time 0.238 (0.514)	Data Time 0.001 (0.020)	Loss 2.1784 (2.3664)	Entropy 0.53921 (0.54127)	Top-1 acc 72.266 (67.106)	Top-5 acc 92.188 (85.966)	lr 0.00127
Train [103][2140/3239]	Time 0.245 (0.514)	Data Time 0.001 (0.019)	Loss 2.6060 (2.3668)	Entropy 0.53927 (0.54126)	Top-1 acc 62.109 (67.098)	Top-5 acc 82.422 (85.959)	lr 0.00127
Train [103][2150/3239]	Time 0.222 (0.513)	Data Time 0.001 (0.019)	Loss 2.7819 (2.3674)	Entropy 0.53942 (0.54125)	Top-1 acc 53.906 (67.079)	Top-5 acc 78.906 (85.949)	lr 0.00127
Train [103][2160/3239]	Time 0.251 (0.513)	Data Time 0.002 (0.019)	Loss 2.6344 (2.3673)	Entropy 0.53963 (0.54124)	Top-1 acc 62.109 (67.084)	Top-5 acc 82.031 (85.950)	lr 0.00127
Train [103][2170/3239]	Time 0.229 (0.512)	Data Time 0.001 (0.019)	Loss 2.4537 (2.3673)	Entropy 0.53973 (0.54124)	Top-1 acc 63.672 (67.079)	Top-5 acc 85.547 (85.950)	lr 0.00126
Train [103][2180/3239]	Time 0.320 (0.512)	Data Time 0.001 (0.019)	Loss 2.5720 (2.3676)	Entropy 0.53975 (0.54123)	Top-1 acc 59.766 (67.077)	Top-5 acc 85.938 (85.947)	lr 0.00126
Train [103][2190/3239]	Time 0.216 (0.511)	Data Time 0.001 (0.019)	Loss 2.4440 (2.3679)	Entropy 0.53960 (0.54122)	Top-1 acc 66.797 (67.069)	Top-5 acc 83.594 (85.942)	lr 0.00126
Train [103][2200/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.019)	Loss 2.1249 (2.3678)	Entropy 0.53971 (0.54121)	Top-1 acc 74.219 (67.073)	Top-5 acc 91.016 (85.944)	lr 0.00126
Train [103][2210/3239]	Time 0.235 (0.510)	Data Time 0.001 (0.019)	Loss 2.3892 (2.3679)	Entropy 0.53970 (0.54121)	Top-1 acc 67.578 (67.072)	Top-5 acc 85.547 (85.942)	lr 0.00126
Train [103][2220/3239]	Time 0.234 (0.510)	Data Time 0.001 (0.019)	Loss 2.2498 (2.3678)	Entropy 0.53931 (0.54120)	Top-1 acc 70.312 (67.074)	Top-5 acc 87.500 (85.942)	lr 0.00126
Train [103][2230/3239]	Time 0.464 (0.534)	Data Time 0.006 (0.019)	Loss 2.2246 (2.3679)	Entropy 0.53956 (0.54119)	Top-1 acc 69.531 (67.073)	Top-5 acc 87.500 (85.941)	lr 0.00126
Train [103][2240/3239]	Time 0.237 (0.534)	Data Time 0.002 (0.019)	Loss 2.4062 (2.3679)	Entropy 0.53992 (0.54119)	Top-1 acc 69.531 (67.070)	Top-5 acc 86.719 (85.940)	lr 0.00126
Train [103][2250/3239]	Time 0.374 (0.534)	Data Time 0.002 (0.019)	Loss 2.4502 (2.3680)	Entropy 0.53979 (0.54118)	Top-1 acc 63.281 (67.069)	Top-5 acc 82.422 (85.938)	lr 0.00126
Train [103][2260/3239]	Time 0.235 (0.533)	Data Time 0.001 (0.019)	Loss 2.4178 (2.3678)	Entropy 0.54007 (0.54117)	Top-1 acc 62.109 (67.071)	Top-5 acc 87.891 (85.944)	lr 0.00126
Train [103][2270/3239]	Time 0.238 (0.533)	Data Time 0.001 (0.018)	Loss 2.5689 (2.3681)	Entropy 0.53994 (0.54117)	Top-1 acc 63.672 (67.061)	Top-5 acc 80.469 (85.939)	lr 0.00126
Train [103][2280/3239]	Time 0.227 (0.532)	Data Time 0.001 (0.018)	Loss 2.2705 (2.3682)	Entropy 0.53998 (0.54116)	Top-1 acc 69.922 (67.055)	Top-5 acc 89.062 (85.940)	lr 0.00126
Train [103][2290/3239]	Time 0.228 (0.532)	Data Time 0.001 (0.018)	Loss 2.4499 (2.3682)	Entropy 0.54009 (0.54116)	Top-1 acc 66.016 (67.057)	Top-5 acc 84.766 (85.939)	lr 0.00126
Train [103][2300/3239]	Time 0.228 (0.531)	Data Time 0.001 (0.018)	Loss 2.3975 (2.3684)	Entropy 0.54036 (0.54115)	Top-1 acc 66.406 (67.051)	Top-5 acc 85.156 (85.938)	lr 0.00126
Train [103][2310/3239]	Time 0.233 (0.531)	Data Time 0.001 (0.018)	Loss 2.3515 (2.3685)	Entropy 0.54031 (0.54115)	Top-1 acc 65.625 (67.049)	Top-5 acc 84.766 (85.935)	lr 0.00126
Train [103][2320/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.018)	Loss 2.4876 (2.3689)	Entropy 0.54047 (0.54115)	Top-1 acc 64.844 (67.042)	Top-5 acc 85.547 (85.927)	lr 0.00126
Train [103][2330/3239]	Time 0.247 (0.530)	Data Time 0.001 (0.018)	Loss 2.2975 (2.3687)	Entropy 0.54057 (0.54114)	Top-1 acc 68.750 (67.044)	Top-5 acc 86.719 (85.930)	lr 0.00126
Train [103][2340/3239]	Time 0.336 (0.529)	Data Time 0.001 (0.018)	Loss 2.3702 (2.3688)	Entropy 0.54039 (0.54114)	Top-1 acc 66.016 (67.039)	Top-5 acc 87.500 (85.929)	lr 0.00126
Train [103][2350/3239]	Time 0.228 (0.529)	Data Time 0.001 (0.018)	Loss 2.2722 (2.3686)	Entropy 0.54021 (0.54114)	Top-1 acc 69.531 (67.040)	Top-5 acc 87.891 (85.930)	lr 0.00126
Train [103][2360/3239]	Time 0.239 (0.528)	Data Time 0.001 (0.018)	Loss 2.6103 (2.3688)	Entropy 0.53993 (0.54113)	Top-1 acc 60.938 (67.034)	Top-5 acc 82.422 (85.926)	lr 0.00126
Train [103][2370/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.018)	Loss 2.1267 (2.3688)	Entropy 0.53997 (0.54113)	Top-1 acc 74.609 (67.038)	Top-5 acc 90.625 (85.927)	lr 0.00126
Train [103][2380/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.018)	Loss 2.2945 (2.3689)	Entropy 0.53962 (0.54112)	Top-1 acc 66.406 (67.035)	Top-5 acc 88.672 (85.926)	lr 0.00126
Train [103][2390/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.018)	Loss 2.3215 (2.3689)	Entropy 0.53945 (0.54112)	Top-1 acc 71.484 (67.036)	Top-5 acc 87.891 (85.930)	lr 0.00125
Train [103][2400/3239]	Time 0.244 (0.526)	Data Time 0.001 (0.018)	Loss 2.4864 (2.3690)	Entropy 0.53951 (0.54111)	Top-1 acc 64.062 (67.031)	Top-5 acc 84.766 (85.930)	lr 0.00125
Train [103][2410/3239]	Time 0.333 (0.526)	Data Time 0.001 (0.017)	Loss 2.2575 (2.3691)	Entropy 0.53953 (0.54110)	Top-1 acc 69.141 (67.031)	Top-5 acc 87.500 (85.926)	lr 0.00125
Train [103][2420/3239]	Time 0.240 (0.526)	Data Time 0.001 (0.017)	Loss 2.2851 (2.3695)	Entropy 0.53948 (0.54110)	Top-1 acc 68.359 (67.023)	Top-5 acc 87.500 (85.918)	lr 0.00125
Train [103][2430/3239]	Time 0.225 (0.525)	Data Time 0.001 (0.017)	Loss 2.1923 (2.3694)	Entropy 0.53965 (0.54109)	Top-1 acc 72.266 (67.024)	Top-5 acc 89.062 (85.920)	lr 0.00125
Train [103][2440/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.017)	Loss 2.2269 (2.3691)	Entropy 0.53949 (0.54108)	Top-1 acc 69.141 (67.029)	Top-5 acc 89.062 (85.925)	lr 0.00125
Train [103][2450/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.017)	Loss 2.4373 (2.3689)	Entropy 0.53969 (0.54108)	Top-1 acc 64.453 (67.033)	Top-5 acc 83.594 (85.926)	lr 0.00125
Train [103][2460/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.017)	Loss 2.3728 (2.3688)	Entropy 0.53919 (0.54107)	Top-1 acc 64.453 (67.031)	Top-5 acc 86.328 (85.927)	lr 0.00125
Train [103][2470/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.017)	Loss 2.4726 (2.3690)	Entropy 0.53873 (0.54106)	Top-1 acc 66.016 (67.029)	Top-5 acc 84.766 (85.926)	lr 0.00125
Train [103][2480/3239]	Time 0.225 (0.523)	Data Time 0.001 (0.017)	Loss 2.1261 (2.3689)	Entropy 0.53817 (0.54105)	Top-1 acc 72.266 (67.030)	Top-5 acc 89.844 (85.925)	lr 0.00125
Train [103][2490/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.017)	Loss 2.3133 (2.3689)	Entropy 0.53827 (0.54104)	Top-1 acc 67.188 (67.025)	Top-5 acc 84.766 (85.923)	lr 0.00125
Train [103][2500/3239]	Time 0.327 (0.522)	Data Time 0.001 (0.017)	Loss 2.1968 (2.3687)	Entropy 0.53832 (0.54103)	Top-1 acc 70.312 (67.032)	Top-5 acc 89.844 (85.923)	lr 0.00125
Train [103][2510/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.017)	Loss 2.2719 (2.3687)	Entropy 0.53848 (0.54102)	Top-1 acc 70.312 (67.034)	Top-5 acc 85.938 (85.924)	lr 0.00125
Train [103][2520/3239]	Time 0.231 (0.521)	Data Time 0.001 (0.017)	Loss 2.5060 (2.3687)	Entropy 0.53839 (0.54101)	Top-1 acc 63.281 (67.037)	Top-5 acc 81.250 (85.924)	lr 0.00125
Train [103][2530/3239]	Time 0.218 (0.521)	Data Time 0.001 (0.017)	Loss 2.3259 (2.3685)	Entropy 0.53878 (0.54100)	Top-1 acc 67.578 (67.044)	Top-5 acc 86.719 (85.927)	lr 0.00125
Train [103][2540/3239]	Time 0.268 (0.521)	Data Time 0.001 (0.017)	Loss 2.3127 (2.3687)	Entropy 0.53878 (0.54099)	Top-1 acc 67.188 (67.037)	Top-5 acc 85.156 (85.925)	lr 0.00125
Train [103][2550/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.017)	Loss 2.3064 (2.3685)	Entropy 0.53904 (0.54098)	Top-1 acc 68.750 (67.040)	Top-5 acc 87.109 (85.928)	lr 0.00125
Train [103][2560/3239]	Time 0.223 (0.520)	Data Time 0.001 (0.017)	Loss 2.2493 (2.3684)	Entropy 0.53921 (0.54098)	Top-1 acc 70.703 (67.039)	Top-5 acc 87.891 (85.928)	lr 0.00125
Train [103][2570/3239]	Time 0.320 (0.520)	Data Time 0.001 (0.017)	Loss 2.1397 (2.3685)	Entropy 0.53908 (0.54097)	Top-1 acc 74.219 (67.035)	Top-5 acc 89.062 (85.927)	lr 0.00125
Train [103][2580/3239]	Time 0.228 (0.519)	Data Time 0.001 (0.016)	Loss 2.4676 (2.3684)	Entropy 0.53926 (0.54096)	Top-1 acc 64.453 (67.038)	Top-5 acc 84.766 (85.931)	lr 0.00125
Train [103][2590/3239]	Time 0.224 (0.519)	Data Time 0.001 (0.016)	Loss 2.2140 (2.3684)	Entropy 0.53929 (0.54095)	Top-1 acc 70.703 (67.038)	Top-5 acc 90.234 (85.931)	lr 0.00125
Train [103][2600/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.016)	Loss 2.3566 (2.3684)	Entropy 0.53927 (0.54095)	Top-1 acc 69.531 (67.039)	Top-5 acc 84.375 (85.933)	lr 0.00125
Train [103][2610/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.016)	Loss 2.1147 (2.3680)	Entropy 0.53904 (0.54094)	Top-1 acc 74.609 (67.047)	Top-5 acc 90.625 (85.940)	lr 0.00125
Train [103][2620/3239]	Time 0.245 (0.518)	Data Time 0.001 (0.016)	Loss 2.5174 (2.3682)	Entropy 0.53872 (0.54093)	Top-1 acc 62.109 (67.046)	Top-5 acc 83.594 (85.936)	lr 0.00124
Train [103][2630/3239]	Time 0.229 (0.517)	Data Time 0.001 (0.016)	Loss 2.5218 (2.3682)	Entropy 0.53869 (0.54093)	Top-1 acc 64.062 (67.043)	Top-5 acc 83.594 (85.933)	lr 0.00124
Train [103][2640/3239]	Time 0.237 (0.517)	Data Time 0.001 (0.016)	Loss 2.4550 (2.3682)	Entropy 0.53856 (0.54092)	Top-1 acc 62.500 (67.040)	Top-5 acc 82.422 (85.935)	lr 0.00124
Train [103][2650/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.016)	Loss 2.4908 (2.3683)	Entropy 0.53898 (0.54091)	Top-1 acc 64.453 (67.038)	Top-5 acc 81.250 (85.935)	lr 0.00124
Train [103][2660/3239]	Time 0.224 (0.516)	Data Time 0.001 (0.016)	Loss 2.3180 (2.3685)	Entropy 0.53893 (0.54090)	Top-1 acc 67.578 (67.035)	Top-5 acc 85.156 (85.933)	lr 0.00124
Train [103][2670/3239]	Time 0.307 (0.516)	Data Time 0.003 (0.016)	Loss 2.5291 (2.3687)	Entropy 0.53913 (0.54089)	Top-1 acc 62.891 (67.026)	Top-5 acc 82.031 (85.928)	lr 0.00124
Train [103][2680/3239]	Time 0.278 (0.516)	Data Time 0.001 (0.016)	Loss 2.1630 (2.3686)	Entropy 0.53889 (0.54089)	Top-1 acc 72.656 (67.028)	Top-5 acc 89.062 (85.932)	lr 0.00124
Train [103][2690/3239]	Time 0.227 (0.516)	Data Time 0.001 (0.016)	Loss 2.2223 (2.3685)	Entropy 0.53899 (0.54088)	Top-1 acc 73.047 (67.038)	Top-5 acc 89.453 (85.933)	lr 0.00124
Train [103][2700/3239]	Time 0.251 (0.515)	Data Time 0.001 (0.016)	Loss 2.3041 (2.3686)	Entropy 0.53928 (0.54087)	Top-1 acc 66.406 (67.035)	Top-5 acc 87.109 (85.931)	lr 0.00124
Train [103][2710/3239]	Time 0.249 (0.515)	Data Time 0.001 (0.016)	Loss 2.3156 (2.3687)	Entropy 0.53936 (0.54087)	Top-1 acc 69.922 (67.034)	Top-5 acc 85.547 (85.930)	lr 0.00124
Train [103][2720/3239]	Time 0.322 (0.515)	Data Time 0.001 (0.016)	Loss 2.3712 (2.3688)	Entropy 0.53956 (0.54086)	Top-1 acc 65.625 (67.031)	Top-5 acc 83.203 (85.926)	lr 0.00124
Train [103][2730/3239]	Time 0.361 (0.514)	Data Time 0.002 (0.016)	Loss 2.4307 (2.3687)	Entropy 0.53938 (0.54086)	Top-1 acc 66.016 (67.033)	Top-5 acc 84.766 (85.927)	lr 0.00124
Train [103][2740/3239]	Time 0.262 (0.514)	Data Time 0.001 (0.016)	Loss 2.3021 (2.3687)	Entropy 0.53935 (0.54085)	Top-1 acc 67.578 (67.034)	Top-5 acc 87.891 (85.928)	lr 0.00124
Train [103][2750/3239]	Time 0.233 (0.514)	Data Time 0.001 (0.016)	Loss 2.4522 (2.3687)	Entropy 0.53940 (0.54085)	Top-1 acc 67.578 (67.041)	Top-5 acc 81.641 (85.926)	lr 0.00124
Train [103][2760/3239]	Time 0.233 (0.513)	Data Time 0.001 (0.015)	Loss 2.2774 (2.3688)	Entropy 0.53904 (0.54084)	Top-1 acc 69.141 (67.035)	Top-5 acc 87.500 (85.924)	lr 0.00124
Train [103][2770/3239]	Time 0.288 (0.513)	Data Time 0.002 (0.015)	Loss 2.5025 (2.3690)	Entropy 0.53907 (0.54084)	Top-1 acc 64.844 (67.032)	Top-5 acc 85.156 (85.921)	lr 0.00124
Train [103][2780/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.015)	Loss 2.2652 (2.3689)	Entropy 0.53936 (0.54083)	Top-1 acc 67.578 (67.032)	Top-5 acc 89.844 (85.924)	lr 0.00124
Train [103][2790/3239]	Time 0.223 (0.513)	Data Time 0.001 (0.015)	Loss 2.3162 (2.3687)	Entropy 0.53920 (0.54082)	Top-1 acc 68.359 (67.038)	Top-5 acc 85.547 (85.927)	lr 0.00124
Train [103][2800/3239]	Time 0.326 (0.512)	Data Time 0.001 (0.015)	Loss 2.3769 (2.3687)	Entropy 0.53920 (0.54082)	Top-1 acc 67.188 (67.043)	Top-5 acc 86.328 (85.926)	lr 0.00124
Train [103][2810/3239]	Time 0.238 (0.512)	Data Time 0.001 (0.015)	Loss 2.3171 (2.3684)	Entropy 0.53934 (0.54081)	Top-1 acc 66.016 (67.047)	Top-5 acc 86.719 (85.932)	lr 0.00124
Train [103][2820/3239]	Time 0.247 (0.511)	Data Time 0.001 (0.015)	Loss 2.4317 (2.3682)	Entropy 0.53910 (0.54081)	Top-1 acc 69.141 (67.052)	Top-5 acc 82.812 (85.933)	lr 0.00124
Train [103][2830/3239]	Time 0.225 (0.511)	Data Time 0.001 (0.015)	Loss 2.3554 (2.3683)	Entropy 0.53916 (0.54080)	Top-1 acc 66.016 (67.051)	Top-5 acc 87.500 (85.931)	lr 0.00124
Train [103][2840/3239]	Time 0.236 (0.511)	Data Time 0.001 (0.015)	Loss 2.1936 (2.3682)	Entropy 0.53923 (0.54079)	Top-1 acc 71.875 (67.055)	Top-5 acc 87.500 (85.933)	lr 0.00124
Train [103][2850/3239]	Time 0.225 (0.511)	Data Time 0.001 (0.015)	Loss 2.2511 (2.3685)	Entropy 0.53931 (0.54079)	Top-1 acc 67.188 (67.042)	Top-5 acc 89.062 (85.932)	lr 0.00123
Train [103][2860/3239]	Time 0.258 (0.510)	Data Time 0.002 (0.015)	Loss 2.4728 (2.3686)	Entropy 0.53848 (0.54078)	Top-1 acc 62.109 (67.042)	Top-5 acc 87.109 (85.932)	lr 0.00123
Train [103][2870/3239]	Time 0.298 (0.510)	Data Time 0.033 (0.015)	Loss 2.3095 (2.3685)	Entropy 0.53863 (0.54078)	Top-1 acc 67.969 (67.044)	Top-5 acc 85.156 (85.933)	lr 0.00123
Train [103][2880/3239]	Time 0.228 (0.510)	Data Time 0.001 (0.015)	Loss 2.2674 (2.3685)	Entropy 0.53864 (0.54077)	Top-1 acc 67.578 (67.043)	Top-5 acc 88.672 (85.932)	lr 0.00123
Train [103][2890/3239]	Time 0.337 (0.529)	Data Time 0.002 (0.015)	Loss 2.1327 (2.3684)	Entropy 0.53848 (0.54076)	Top-1 acc 72.266 (67.044)	Top-5 acc 91.016 (85.933)	lr 0.00123
Train [103][2900/3239]	Time 0.249 (0.528)	Data Time 0.002 (0.015)	Loss 2.4495 (2.3682)	Entropy 0.53849 (0.54075)	Top-1 acc 67.578 (67.053)	Top-5 acc 86.328 (85.937)	lr 0.00123
Train [103][2910/3239]	Time 0.237 (0.528)	Data Time 0.001 (0.015)	Loss 2.4780 (2.3684)	Entropy 0.53848 (0.54074)	Top-1 acc 60.156 (67.044)	Top-5 acc 87.500 (85.935)	lr 0.00123
Train [103][2920/3239]	Time 0.240 (0.528)	Data Time 0.002 (0.015)	Loss 2.3697 (2.3683)	Entropy 0.53819 (0.54074)	Top-1 acc 67.969 (67.048)	Top-5 acc 82.031 (85.935)	lr 0.00123
Train [103][2930/3239]	Time 0.260 (0.527)	Data Time 0.001 (0.015)	Loss 2.3072 (2.3684)	Entropy 0.53855 (0.54073)	Top-1 acc 66.406 (67.046)	Top-5 acc 85.156 (85.928)	lr 0.00123
Train [103][2940/3239]	Time 0.270 (0.527)	Data Time 0.002 (0.015)	Loss 2.5112 (2.3683)	Entropy 0.53892 (0.54072)	Top-1 acc 64.844 (67.051)	Top-5 acc 82.422 (85.930)	lr 0.00123
Train [103][2950/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.015)	Loss 2.5417 (2.3683)	Entropy 0.53905 (0.54071)	Top-1 acc 62.891 (67.049)	Top-5 acc 82.422 (85.929)	lr 0.00123
Train [103][2960/3239]	Time 0.328 (0.526)	Data Time 0.001 (0.015)	Loss 2.4258 (2.3685)	Entropy 0.53828 (0.54071)	Top-1 acc 65.625 (67.040)	Top-5 acc 85.938 (85.927)	lr 0.00123
Train [103][2970/3239]	Time 0.286 (0.526)	Data Time 0.003 (0.015)	Loss 2.0791 (2.3683)	Entropy 0.53800 (0.54070)	Top-1 acc 71.094 (67.043)	Top-5 acc 92.188 (85.932)	lr 0.00123
Train [103][2980/3239]	Time 0.271 (0.526)	Data Time 0.001 (0.015)	Loss 2.2363 (2.3681)	Entropy 0.53808 (0.54069)	Top-1 acc 69.531 (67.049)	Top-5 acc 88.281 (85.935)	lr 0.00123
Train [103][2990/3239]	Time 0.262 (0.525)	Data Time 0.001 (0.014)	Loss 2.3543 (2.3681)	Entropy 0.53813 (0.54068)	Top-1 acc 64.453 (67.050)	Top-5 acc 85.547 (85.936)	lr 0.00123
Train [103][3000/3239]	Time 0.225 (0.525)	Data Time 0.001 (0.014)	Loss 2.3768 (2.3681)	Entropy 0.53796 (0.54067)	Top-1 acc 65.234 (67.049)	Top-5 acc 87.891 (85.936)	lr 0.00123
Train [103][3010/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.014)	Loss 2.4451 (2.3682)	Entropy 0.53785 (0.54066)	Top-1 acc 63.281 (67.046)	Top-5 acc 85.938 (85.935)	lr 0.00123
Train [103][3020/3239]	Time 0.247 (0.524)	Data Time 0.001 (0.014)	Loss 2.2473 (2.3684)	Entropy 0.53767 (0.54066)	Top-1 acc 69.531 (67.044)	Top-5 acc 87.500 (85.932)	lr 0.00123
Train [103][3030/3239]	Time 0.233 (0.524)	Data Time 0.001 (0.014)	Loss 2.3686 (2.3684)	Entropy 0.53749 (0.54065)	Top-1 acc 67.578 (67.044)	Top-5 acc 85.547 (85.930)	lr 0.00123
Train [103][3040/3239]	Time 0.273 (0.524)	Data Time 0.001 (0.014)	Loss 2.4867 (2.3685)	Entropy 0.53763 (0.54064)	Top-1 acc 65.625 (67.042)	Top-5 acc 81.641 (85.926)	lr 0.00123
Train [103][3050/3239]	Time 0.346 (0.523)	Data Time 0.001 (0.014)	Loss 2.3210 (2.3683)	Entropy 0.53761 (0.54063)	Top-1 acc 69.531 (67.047)	Top-5 acc 85.156 (85.929)	lr 0.00123
Train [103][3060/3239]	Time 0.254 (0.523)	Data Time 0.001 (0.014)	Loss 2.3845 (2.3683)	Entropy 0.53751 (0.54062)	Top-1 acc 69.531 (67.047)	Top-5 acc 85.547 (85.927)	lr 0.00123
Train [103][3070/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.014)	Loss 2.5122 (2.3685)	Entropy 0.53743 (0.54061)	Top-1 acc 66.406 (67.042)	Top-5 acc 84.766 (85.924)	lr 0.00123
Train [103][3080/3239]	Time 0.277 (0.522)	Data Time 0.001 (0.014)	Loss 2.2858 (2.3686)	Entropy 0.53759 (0.54060)	Top-1 acc 71.875 (67.038)	Top-5 acc 88.281 (85.923)	lr 0.00122
Train [103][3090/3239]	Time 0.271 (0.522)	Data Time 0.001 (0.014)	Loss 2.5699 (2.3689)	Entropy 0.53750 (0.54059)	Top-1 acc 59.766 (67.030)	Top-5 acc 81.641 (85.918)	lr 0.00122
Train [103][3100/3239]	Time 0.236 (0.522)	Data Time 0.001 (0.014)	Loss 2.3454 (2.3689)	Entropy 0.53770 (0.54058)	Top-1 acc 66.016 (67.027)	Top-5 acc 84.766 (85.917)	lr 0.00122
Train [103][3110/3239]	Time 0.247 (0.521)	Data Time 0.001 (0.014)	Loss 2.3495 (2.3688)	Entropy 0.53757 (0.54057)	Top-1 acc 67.969 (67.029)	Top-5 acc 87.109 (85.921)	lr 0.00122
Train [103][3120/3239]	Time 0.327 (0.521)	Data Time 0.001 (0.014)	Loss 2.3760 (2.3690)	Entropy 0.53761 (0.54056)	Top-1 acc 68.359 (67.030)	Top-5 acc 86.719 (85.918)	lr 0.00122
Train [103][3130/3239]	Time 0.242 (0.521)	Data Time 0.001 (0.014)	Loss 2.4439 (2.3691)	Entropy 0.53719 (0.54055)	Top-1 acc 64.453 (67.027)	Top-5 acc 83.203 (85.916)	lr 0.00122
Train [103][3140/3239]	Time 0.278 (0.521)	Data Time 0.002 (0.014)	Loss 2.5874 (2.3694)	Entropy 0.53741 (0.54054)	Top-1 acc 58.594 (67.019)	Top-5 acc 82.031 (85.911)	lr 0.00122
Train [103][3150/3239]	Time 0.273 (0.521)	Data Time 0.001 (0.014)	Loss 2.3343 (2.3694)	Entropy 0.53714 (0.54053)	Top-1 acc 66.016 (67.018)	Top-5 acc 89.844 (85.913)	lr 0.00122
Train [103][3160/3239]	Time 0.257 (0.520)	Data Time 0.001 (0.014)	Loss 2.2642 (2.3694)	Entropy 0.53748 (0.54052)	Top-1 acc 68.750 (67.018)	Top-5 acc 90.234 (85.913)	lr 0.00122
Train [103][3170/3239]	Time 0.243 (0.520)	Data Time 0.002 (0.014)	Loss 2.3681 (2.3691)	Entropy 0.53757 (0.54051)	Top-1 acc 65.625 (67.024)	Top-5 acc 85.938 (85.918)	lr 0.00122
Train [103][3180/3239]	Time 0.225 (0.520)	Data Time 0.000 (0.014)	Loss 2.4558 (2.3693)	Entropy 0.53768 (0.54050)	Top-1 acc 62.500 (67.016)	Top-5 acc 82.812 (85.913)	lr 0.00122
Train [103][3190/3239]	Time 0.228 (0.519)	Data Time 0.000 (0.014)	Loss 2.7786 (2.3694)	Entropy 0.53779 (0.54049)	Top-1 acc 56.641 (67.014)	Top-5 acc 77.734 (85.912)	lr 0.00122
Train [103][3200/3239]	Time 0.227 (0.519)	Data Time 0.000 (0.014)	Loss 2.5468 (2.3695)	Entropy 0.53780 (0.54048)	Top-1 acc 60.547 (67.010)	Top-5 acc 83.594 (85.912)	lr 0.00122
Train [103][3210/3239]	Time 0.248 (0.519)	Data Time 0.000 (0.014)	Loss 2.3638 (2.3696)	Entropy 0.53797 (0.54047)	Top-1 acc 64.062 (67.006)	Top-5 acc 85.547 (85.908)	lr 0.00122
Train [103][3220/3239]	Time 0.228 (0.518)	Data Time 0.000 (0.014)	Loss 2.3149 (2.3697)	Entropy 0.53807 (0.54046)	Top-1 acc 67.969 (67.003)	Top-5 acc 87.500 (85.908)	lr 0.00122
Train [103][3230/3239]	Time 0.231 (0.518)	Data Time 0.000 (0.014)	Loss 2.2996 (2.3699)	Entropy 0.53827 (0.54046)	Top-1 acc 68.750 (67.002)	Top-5 acc 86.719 (85.905)	lr 0.00122
Train [103][3239/3239]	Time 0.900 (0.517)	Data Time 0.000 (0.013)	Loss 2.4063 (2.3698)	Entropy 0.53845 (0.54045)	Top-1 acc 67.901 (67.005)	Top-5 acc 87.654 (85.906)	lr 0.00122
==========Valid [103/120]	loss 1.187	top-1 acc 72.727 (72.786)	top-5 acc 90.484	Train top-1 67.005	top-5 85.906	Entropy 0.53845	Latency-None: 0.000ms	Flops: 539.00M
Train [104][0/3239]	Time 39.812 (39.812)	Data Time 37.670 (37.670)	Loss 2.4493 (2.4493)	Entropy 0.53856 (0.53856)	Top-1 acc 65.234 (65.234)	Top-5 acc 83.203 (83.203)	lr 0.00122
Train [104][10/3239]	Time 0.233 (4.102)	Data Time 0.001 (3.427)	Loss 2.5414 (2.3670)	Entropy 0.53832 (0.53838)	Top-1 acc 63.281 (67.578)	Top-5 acc 80.469 (86.257)	lr 0.00122
Train [104][20/3239]	Time 0.228 (2.355)	Data Time 0.001 (1.796)	Loss 2.7671 (2.3441)	Entropy 0.53841 (0.53834)	Top-1 acc 61.719 (68.155)	Top-5 acc 78.516 (86.272)	lr 0.00122
Train [104][30/3239]	Time 0.244 (1.732)	Data Time 0.001 (1.217)	Loss 2.4337 (2.3453)	Entropy 0.53880 (0.53841)	Top-1 acc 64.062 (67.893)	Top-5 acc 86.719 (86.366)	lr 0.00122
Train [104][40/3239]	Time 0.235 (1.411)	Data Time 0.001 (0.920)	Loss 2.2182 (2.3474)	Entropy 0.53861 (0.53847)	Top-1 acc 70.703 (68.102)	Top-5 acc 87.500 (86.338)	lr 0.00122
Train [104][50/3239]	Time 0.224 (1.214)	Data Time 0.001 (0.740)	Loss 2.3787 (2.3479)	Entropy 0.53847 (0.53848)	Top-1 acc 69.531 (68.038)	Top-5 acc 83.984 (86.297)	lr 0.00122
Train [104][60/3239]	Time 0.257 (1.082)	Data Time 0.001 (0.619)	Loss 2.3031 (2.3414)	Entropy 0.53866 (0.53849)	Top-1 acc 65.234 (68.142)	Top-5 acc 88.281 (86.514)	lr 0.00122
Train [104][70/3239]	Time 0.231 (0.990)	Data Time 0.001 (0.532)	Loss 2.2182 (2.3447)	Entropy 0.53857 (0.53849)	Top-1 acc 67.578 (67.886)	Top-5 acc 86.719 (86.449)	lr 0.00121
Train [104][80/3239]	Time 0.230 (0.917)	Data Time 0.001 (0.467)	Loss 2.4018 (2.3471)	Entropy 0.53847 (0.53850)	Top-1 acc 67.969 (67.742)	Top-5 acc 86.719 (86.381)	lr 0.00121
Train [104][90/3239]	Time 0.233 (0.862)	Data Time 0.001 (0.416)	Loss 2.3914 (2.3474)	Entropy 0.53846 (0.53849)	Top-1 acc 65.234 (67.703)	Top-5 acc 85.156 (86.320)	lr 0.00121
Train [104][100/3239]	Time 0.234 (0.817)	Data Time 0.001 (0.375)	Loss 2.2640 (2.3484)	Entropy 0.53848 (0.53849)	Top-1 acc 68.750 (67.551)	Top-5 acc 87.891 (86.405)	lr 0.00121
Train [104][110/3239]	Time 0.323 (0.781)	Data Time 0.001 (0.341)	Loss 2.2890 (2.3477)	Entropy 0.53876 (0.53850)	Top-1 acc 68.750 (67.585)	Top-5 acc 87.109 (86.430)	lr 0.00121
Train [104][120/3239]	Time 0.235 (0.751)	Data Time 0.001 (0.313)	Loss 2.1908 (2.3438)	Entropy 0.53867 (0.53852)	Top-1 acc 71.875 (67.723)	Top-5 acc 85.547 (86.460)	lr 0.00121
Train [104][130/3239]	Time 0.218 (0.724)	Data Time 0.001 (0.289)	Loss 2.3468 (2.3478)	Entropy 0.53900 (0.53854)	Top-1 acc 63.281 (67.554)	Top-5 acc 87.891 (86.382)	lr 0.00121
Train [104][140/3239]	Time 0.234 (0.703)	Data Time 0.001 (0.269)	Loss 2.1332 (2.3459)	Entropy 0.53907 (0.53857)	Top-1 acc 76.172 (67.636)	Top-5 acc 89.062 (86.384)	lr 0.00121
Train [104][150/3239]	Time 0.228 (0.683)	Data Time 0.001 (0.251)	Loss 2.3630 (2.3465)	Entropy 0.53904 (0.53861)	Top-1 acc 66.797 (67.607)	Top-5 acc 85.156 (86.367)	lr 0.00121
Train [104][160/3239]	Time 0.230 (0.667)	Data Time 0.001 (0.236)	Loss 2.2143 (2.3480)	Entropy 0.53864 (0.53863)	Top-1 acc 69.531 (67.542)	Top-5 acc 87.891 (86.318)	lr 0.00121
Train [104][170/3239]	Time 0.229 (0.652)	Data Time 0.001 (0.222)	Loss 2.3790 (2.3462)	Entropy 0.53842 (0.53863)	Top-1 acc 61.328 (67.487)	Top-5 acc 87.500 (86.333)	lr 0.00121
Train [104][180/3239]	Time 0.321 (0.638)	Data Time 0.001 (0.210)	Loss 2.5658 (2.3475)	Entropy 0.53827 (0.53862)	Top-1 acc 58.203 (67.494)	Top-5 acc 82.422 (86.326)	lr 0.00121
Train [104][190/3239]	Time 0.221 (0.625)	Data Time 0.001 (0.199)	Loss 2.2702 (2.3499)	Entropy 0.53793 (0.53860)	Top-1 acc 67.969 (67.384)	Top-5 acc 89.844 (86.293)	lr 0.00121
Train [104][200/3239]	Time 0.264 (0.615)	Data Time 0.001 (0.189)	Loss 2.4932 (2.3510)	Entropy 0.53822 (0.53857)	Top-1 acc 64.453 (67.331)	Top-5 acc 81.250 (86.246)	lr 0.00121
Train [104][210/3239]	Time 0.227 (0.606)	Data Time 0.001 (0.180)	Loss 2.7058 (2.3537)	Entropy 0.53831 (0.53855)	Top-1 acc 59.375 (67.275)	Top-5 acc 80.469 (86.210)	lr 0.00121
Train [104][220/3239]	Time 0.229 (0.597)	Data Time 0.001 (0.172)	Loss 2.2461 (2.3539)	Entropy 0.53823 (0.53854)	Top-1 acc 70.703 (67.317)	Top-5 acc 86.328 (86.178)	lr 0.00121
Train [104][230/3239]	Time 0.239 (0.589)	Data Time 0.001 (0.165)	Loss 2.2658 (2.3548)	Entropy 0.53850 (0.53853)	Top-1 acc 67.969 (67.309)	Top-5 acc 89.062 (86.178)	lr 0.00121
Train [104][240/3239]	Time 0.282 (0.585)	Data Time 0.002 (0.158)	Loss 2.2554 (2.3544)	Entropy 0.53831 (0.53852)	Top-1 acc 71.875 (67.311)	Top-5 acc 87.109 (86.185)	lr 0.00121
Train [104][250/3239]	Time 0.227 (0.581)	Data Time 0.001 (0.152)	Loss 2.3447 (2.3548)	Entropy 0.53812 (0.53851)	Top-1 acc 65.234 (67.286)	Top-5 acc 87.109 (86.182)	lr 0.00121
Train [104][260/3239]	Time 0.240 (0.574)	Data Time 0.001 (0.146)	Loss 2.3524 (2.3540)	Entropy 0.53797 (0.53849)	Top-1 acc 67.578 (67.303)	Top-5 acc 85.938 (86.202)	lr 0.00121
Train [104][270/3239]	Time 0.326 (0.569)	Data Time 0.001 (0.141)	Loss 2.3139 (2.3524)	Entropy 0.53786 (0.53847)	Top-1 acc 69.922 (67.316)	Top-5 acc 87.500 (86.237)	lr 0.00121
Train [104][280/3239]	Time 0.221 (0.562)	Data Time 0.001 (0.136)	Loss 2.5228 (2.3549)	Entropy 0.53802 (0.53845)	Top-1 acc 64.453 (67.296)	Top-5 acc 82.422 (86.184)	lr 0.00121
Train [104][290/3239]	Time 0.232 (0.557)	Data Time 0.001 (0.131)	Loss 2.1858 (2.3553)	Entropy 0.53764 (0.53842)	Top-1 acc 72.266 (67.271)	Top-5 acc 88.672 (86.187)	lr 0.00121
Train [104][300/3239]	Time 0.379 (0.724)	Data Time 0.005 (0.127)	Loss 2.3599 (2.3556)	Entropy 0.53771 (0.53840)	Top-1 acc 65.625 (67.264)	Top-5 acc 83.984 (86.180)	lr 0.00120
Train [104][310/3239]	Time 0.282 (0.719)	Data Time 0.002 (0.123)	Loss 2.1498 (2.3523)	Entropy 0.53758 (0.53838)	Top-1 acc 75.000 (67.381)	Top-5 acc 89.453 (86.233)	lr 0.00120
Train [104][320/3239]	Time 0.217 (0.710)	Data Time 0.001 (0.119)	Loss 2.7130 (2.3532)	Entropy 0.53753 (0.53835)	Top-1 acc 57.812 (67.364)	Top-5 acc 79.688 (86.221)	lr 0.00120
Train [104][330/3239]	Time 0.234 (0.701)	Data Time 0.001 (0.116)	Loss 2.3636 (2.3539)	Entropy 0.53756 (0.53832)	Top-1 acc 63.672 (67.354)	Top-5 acc 86.719 (86.221)	lr 0.00120
Train [104][340/3239]	Time 0.320 (0.692)	Data Time 0.001 (0.112)	Loss 2.2090 (2.3544)	Entropy 0.53744 (0.53830)	Top-1 acc 70.312 (67.326)	Top-5 acc 89.062 (86.220)	lr 0.00120
Train [104][350/3239]	Time 0.261 (0.685)	Data Time 0.001 (0.109)	Loss 2.2846 (2.3540)	Entropy 0.53759 (0.53828)	Top-1 acc 66.406 (67.338)	Top-5 acc 88.672 (86.230)	lr 0.00120
Train [104][360/3239]	Time 0.237 (0.677)	Data Time 0.001 (0.106)	Loss 2.4126 (2.3536)	Entropy 0.53743 (0.53826)	Top-1 acc 66.406 (67.368)	Top-5 acc 85.938 (86.234)	lr 0.00120
Train [104][370/3239]	Time 0.230 (0.670)	Data Time 0.001 (0.103)	Loss 2.3826 (2.3540)	Entropy 0.53779 (0.53824)	Top-1 acc 65.234 (67.334)	Top-5 acc 84.375 (86.218)	lr 0.00120
Train [104][380/3239]	Time 0.232 (0.664)	Data Time 0.001 (0.101)	Loss 2.3338 (2.3562)	Entropy 0.53789 (0.53823)	Top-1 acc 67.578 (67.292)	Top-5 acc 86.328 (86.175)	lr 0.00120
Train [104][390/3239]	Time 0.226 (0.658)	Data Time 0.001 (0.098)	Loss 2.3481 (2.3567)	Entropy 0.53756 (0.53822)	Top-1 acc 66.406 (67.276)	Top-5 acc 87.500 (86.176)	lr 0.00120
Train [104][400/3239]	Time 0.248 (0.652)	Data Time 0.001 (0.096)	Loss 2.4612 (2.3580)	Entropy 0.53741 (0.53820)	Top-1 acc 64.844 (67.250)	Top-5 acc 85.547 (86.154)	lr 0.00120
Train [104][410/3239]	Time 0.227 (0.646)	Data Time 0.001 (0.093)	Loss 2.4413 (2.3584)	Entropy 0.53749 (0.53818)	Top-1 acc 63.672 (67.245)	Top-5 acc 85.547 (86.150)	lr 0.00120
Train [104][420/3239]	Time 0.222 (0.641)	Data Time 0.001 (0.091)	Loss 2.4170 (2.3587)	Entropy 0.53733 (0.53816)	Top-1 acc 62.109 (67.242)	Top-5 acc 85.547 (86.130)	lr 0.00120
Train [104][430/3239]	Time 0.398 (0.638)	Data Time 0.001 (0.089)	Loss 2.3005 (2.3588)	Entropy 0.53738 (0.53814)	Top-1 acc 69.141 (67.247)	Top-5 acc 87.109 (86.153)	lr 0.00120
Train [104][440/3239]	Time 0.214 (0.634)	Data Time 0.001 (0.087)	Loss 2.7001 (2.3596)	Entropy 0.53734 (0.53812)	Top-1 acc 58.594 (67.202)	Top-5 acc 81.641 (86.148)	lr 0.00120
Train [104][450/3239]	Time 0.230 (0.629)	Data Time 0.001 (0.085)	Loss 2.3196 (2.3595)	Entropy 0.53755 (0.53811)	Top-1 acc 69.922 (67.200)	Top-5 acc 87.109 (86.155)	lr 0.00120
Train [104][460/3239]	Time 0.232 (0.624)	Data Time 0.001 (0.083)	Loss 2.2776 (2.3601)	Entropy 0.53772 (0.53810)	Top-1 acc 71.094 (67.176)	Top-5 acc 88.672 (86.155)	lr 0.00120
Train [104][470/3239]	Time 0.226 (0.620)	Data Time 0.001 (0.082)	Loss 2.4547 (2.3612)	Entropy 0.53767 (0.53809)	Top-1 acc 60.938 (67.139)	Top-5 acc 84.375 (86.127)	lr 0.00120
Train [104][480/3239]	Time 0.229 (0.616)	Data Time 0.002 (0.080)	Loss 2.3461 (2.3613)	Entropy 0.53773 (0.53808)	Top-1 acc 68.359 (67.151)	Top-5 acc 86.719 (86.134)	lr 0.00120
Train [104][490/3239]	Time 0.232 (0.612)	Data Time 0.001 (0.078)	Loss 2.4247 (2.3610)	Entropy 0.53785 (0.53807)	Top-1 acc 70.312 (67.164)	Top-5 acc 84.375 (86.134)	lr 0.00120
Train [104][500/3239]	Time 0.340 (0.608)	Data Time 0.001 (0.077)	Loss 2.2293 (2.3595)	Entropy 0.53768 (0.53807)	Top-1 acc 66.406 (67.212)	Top-5 acc 87.500 (86.166)	lr 0.00120
Train [104][510/3239]	Time 0.236 (0.604)	Data Time 0.001 (0.075)	Loss 2.3447 (2.3583)	Entropy 0.53760 (0.53806)	Top-1 acc 68.750 (67.239)	Top-5 acc 85.938 (86.195)	lr 0.00120
Train [104][520/3239]	Time 0.233 (0.601)	Data Time 0.001 (0.074)	Loss 2.2975 (2.3576)	Entropy 0.53730 (0.53805)	Top-1 acc 68.359 (67.242)	Top-5 acc 87.500 (86.195)	lr 0.00120
Train [104][530/3239]	Time 0.300 (0.598)	Data Time 0.002 (0.073)	Loss 2.1674 (2.3578)	Entropy 0.53728 (0.53803)	Top-1 acc 69.531 (67.234)	Top-5 acc 91.406 (86.199)	lr 0.00119
Train [104][540/3239]	Time 0.280 (0.597)	Data Time 0.002 (0.071)	Loss 2.3093 (2.3586)	Entropy 0.53724 (0.53802)	Top-1 acc 69.922 (67.224)	Top-5 acc 85.938 (86.188)	lr 0.00119
Train [104][550/3239]	Time 0.221 (0.595)	Data Time 0.001 (0.070)	Loss 2.2525 (2.3572)	Entropy 0.53727 (0.53801)	Top-1 acc 70.312 (67.255)	Top-5 acc 87.891 (86.203)	lr 0.00119
Train [104][560/3239]	Time 0.231 (0.592)	Data Time 0.001 (0.069)	Loss 2.5460 (2.3580)	Entropy 0.53726 (0.53799)	Top-1 acc 62.891 (67.234)	Top-5 acc 83.203 (86.179)	lr 0.00119
Train [104][570/3239]	Time 0.227 (0.589)	Data Time 0.001 (0.068)	Loss 2.4114 (2.3573)	Entropy 0.53696 (0.53798)	Top-1 acc 66.016 (67.254)	Top-5 acc 86.719 (86.201)	lr 0.00119
Train [104][580/3239]	Time 0.226 (0.586)	Data Time 0.001 (0.067)	Loss 2.3540 (2.3574)	Entropy 0.53712 (0.53797)	Top-1 acc 69.141 (67.263)	Top-5 acc 86.719 (86.199)	lr 0.00119
Train [104][590/3239]	Time 0.247 (0.583)	Data Time 0.001 (0.065)	Loss 2.2004 (2.3576)	Entropy 0.53720 (0.53795)	Top-1 acc 70.703 (67.259)	Top-5 acc 89.844 (86.197)	lr 0.00119
Train [104][600/3239]	Time 0.233 (0.581)	Data Time 0.001 (0.064)	Loss 2.5524 (2.3577)	Entropy 0.53718 (0.53794)	Top-1 acc 60.938 (67.258)	Top-5 acc 82.031 (86.183)	lr 0.00119
Train [104][610/3239]	Time 0.231 (0.578)	Data Time 0.001 (0.063)	Loss 2.2722 (2.3568)	Entropy 0.53730 (0.53793)	Top-1 acc 67.578 (67.282)	Top-5 acc 87.891 (86.208)	lr 0.00119
Train [104][620/3239]	Time 0.223 (0.576)	Data Time 0.001 (0.062)	Loss 2.4793 (2.3574)	Entropy 0.53724 (0.53792)	Top-1 acc 63.672 (67.250)	Top-5 acc 84.766 (86.207)	lr 0.00119
Train [104][630/3239]	Time 0.239 (0.573)	Data Time 0.001 (0.061)	Loss 2.4558 (2.3575)	Entropy 0.53709 (0.53790)	Top-1 acc 63.672 (67.253)	Top-5 acc 84.766 (86.214)	lr 0.00119
Train [104][640/3239]	Time 0.222 (0.570)	Data Time 0.001 (0.060)	Loss 2.3578 (2.3579)	Entropy 0.53737 (0.53789)	Top-1 acc 67.578 (67.237)	Top-5 acc 86.328 (86.209)	lr 0.00119
Train [104][650/3239]	Time 0.236 (0.568)	Data Time 0.001 (0.060)	Loss 2.3710 (2.3575)	Entropy 0.53761 (0.53789)	Top-1 acc 67.578 (67.251)	Top-5 acc 86.719 (86.207)	lr 0.00119
Train [104][660/3239]	Time 0.317 (0.565)	Data Time 0.001 (0.059)	Loss 2.3461 (2.3570)	Entropy 0.53756 (0.53788)	Top-1 acc 67.578 (67.259)	Top-5 acc 87.500 (86.216)	lr 0.00119
Train [104][670/3239]	Time 0.262 (0.563)	Data Time 0.001 (0.058)	Loss 2.3465 (2.3581)	Entropy 0.53778 (0.53788)	Top-1 acc 69.141 (67.247)	Top-5 acc 86.328 (86.194)	lr 0.00119
Train [104][680/3239]	Time 0.240 (0.561)	Data Time 0.001 (0.057)	Loss 2.3040 (2.3591)	Entropy 0.53780 (0.53788)	Top-1 acc 67.969 (67.217)	Top-5 acc 89.062 (86.182)	lr 0.00119
Train [104][690/3239]	Time 0.268 (0.559)	Data Time 0.001 (0.056)	Loss 2.3272 (2.3603)	Entropy 0.53739 (0.53787)	Top-1 acc 65.625 (67.202)	Top-5 acc 87.500 (86.156)	lr 0.00119
Train [104][700/3239]	Time 0.229 (0.557)	Data Time 0.001 (0.055)	Loss 2.3715 (2.3615)	Entropy 0.53729 (0.53787)	Top-1 acc 67.578 (67.180)	Top-5 acc 84.375 (86.141)	lr 0.00119
Train [104][710/3239]	Time 0.235 (0.555)	Data Time 0.001 (0.055)	Loss 2.4038 (2.3609)	Entropy 0.53677 (0.53785)	Top-1 acc 68.359 (67.196)	Top-5 acc 84.766 (86.153)	lr 0.00119
Train [104][720/3239]	Time 0.232 (0.553)	Data Time 0.001 (0.054)	Loss 2.4729 (2.3602)	Entropy 0.53678 (0.53784)	Top-1 acc 60.938 (67.195)	Top-5 acc 86.328 (86.167)	lr 0.00119
Train [104][730/3239]	Time 0.321 (0.551)	Data Time 0.001 (0.053)	Loss 2.3029 (2.3601)	Entropy 0.53713 (0.53783)	Top-1 acc 68.750 (67.198)	Top-5 acc 88.281 (86.169)	lr 0.00119
Train [104][740/3239]	Time 0.231 (0.549)	Data Time 0.001 (0.052)	Loss 2.1006 (2.3604)	Entropy 0.53706 (0.53782)	Top-1 acc 73.438 (67.186)	Top-5 acc 89.453 (86.166)	lr 0.00119
Train [104][750/3239]	Time 0.228 (0.547)	Data Time 0.001 (0.052)	Loss 2.5369 (2.3621)	Entropy 0.53665 (0.53781)	Top-1 acc 64.453 (67.150)	Top-5 acc 81.250 (86.133)	lr 0.00119
Train [104][760/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.051)	Loss 2.3525 (2.3616)	Entropy 0.53666 (0.53779)	Top-1 acc 69.141 (67.159)	Top-5 acc 87.109 (86.144)	lr 0.00118
Train [104][770/3239]	Time 0.230 (0.543)	Data Time 0.001 (0.051)	Loss 2.3781 (2.3628)	Entropy 0.53672 (0.53778)	Top-1 acc 65.625 (67.135)	Top-5 acc 86.719 (86.120)	lr 0.00118
Train [104][780/3239]	Time 0.226 (0.542)	Data Time 0.001 (0.050)	Loss 2.4057 (2.3630)	Entropy 0.53674 (0.53776)	Top-1 acc 67.188 (67.125)	Top-5 acc 85.156 (86.129)	lr 0.00118
Train [104][790/3239]	Time 0.252 (0.540)	Data Time 0.001 (0.049)	Loss 2.5947 (2.3628)	Entropy 0.53660 (0.53775)	Top-1 acc 59.375 (67.126)	Top-5 acc 83.984 (86.131)	lr 0.00118
Train [104][800/3239]	Time 0.235 (0.538)	Data Time 0.001 (0.049)	Loss 2.4618 (2.3616)	Entropy 0.53673 (0.53774)	Top-1 acc 64.453 (67.167)	Top-5 acc 85.156 (86.149)	lr 0.00118
Train [104][810/3239]	Time 0.234 (0.537)	Data Time 0.001 (0.048)	Loss 2.3950 (2.3612)	Entropy 0.53659 (0.53772)	Top-1 acc 67.969 (67.184)	Top-5 acc 86.328 (86.153)	lr 0.00118
Train [104][820/3239]	Time 0.326 (0.535)	Data Time 0.001 (0.048)	Loss 2.0739 (2.3619)	Entropy 0.53647 (0.53771)	Top-1 acc 75.391 (67.168)	Top-5 acc 92.188 (86.147)	lr 0.00118
Train [104][830/3239]	Time 0.251 (0.534)	Data Time 0.001 (0.047)	Loss 2.4095 (2.3621)	Entropy 0.53641 (0.53769)	Top-1 acc 63.281 (67.164)	Top-5 acc 82.812 (86.135)	lr 0.00118
Train [104][840/3239]	Time 0.227 (0.533)	Data Time 0.001 (0.046)	Loss 2.3291 (2.3621)	Entropy 0.53637 (0.53768)	Top-1 acc 65.625 (67.163)	Top-5 acc 87.109 (86.141)	lr 0.00118
Train [104][850/3239]	Time 0.238 (0.532)	Data Time 0.001 (0.046)	Loss 2.4727 (2.3624)	Entropy 0.53657 (0.53766)	Top-1 acc 65.234 (67.145)	Top-5 acc 82.031 (86.128)	lr 0.00118
Train [104][860/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.045)	Loss 2.3862 (2.3624)	Entropy 0.53681 (0.53765)	Top-1 acc 66.797 (67.142)	Top-5 acc 85.938 (86.129)	lr 0.00118
Train [104][870/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.045)	Loss 2.3945 (2.3627)	Entropy 0.53667 (0.53764)	Top-1 acc 64.453 (67.119)	Top-5 acc 84.766 (86.116)	lr 0.00118
Train [104][880/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.044)	Loss 2.1506 (2.3629)	Entropy 0.53663 (0.53763)	Top-1 acc 73.438 (67.109)	Top-5 acc 88.672 (86.112)	lr 0.00118
Train [104][890/3239]	Time 0.314 (0.526)	Data Time 0.001 (0.044)	Loss 2.3880 (2.3632)	Entropy 0.53642 (0.53762)	Top-1 acc 69.531 (67.111)	Top-5 acc 88.672 (86.116)	lr 0.00118
Train [104][900/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.043)	Loss 2.3368 (2.3635)	Entropy 0.53657 (0.53761)	Top-1 acc 64.844 (67.090)	Top-5 acc 85.938 (86.108)	lr 0.00118
Train [104][910/3239]	Time 0.231 (0.524)	Data Time 0.001 (0.043)	Loss 2.3989 (2.3641)	Entropy 0.53654 (0.53759)	Top-1 acc 67.578 (67.090)	Top-5 acc 87.109 (86.092)	lr 0.00118
Train [104][920/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.043)	Loss 2.3753 (2.3643)	Entropy 0.53660 (0.53758)	Top-1 acc 64.062 (67.087)	Top-5 acc 84.766 (86.097)	lr 0.00118
Train [104][930/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.042)	Loss 2.7124 (2.3654)	Entropy 0.53666 (0.53757)	Top-1 acc 58.594 (67.065)	Top-5 acc 83.594 (86.086)	lr 0.00118
Train [104][940/3239]	Time 0.226 (0.521)	Data Time 0.001 (0.042)	Loss 2.1570 (2.3646)	Entropy 0.53667 (0.53756)	Top-1 acc 71.875 (67.089)	Top-5 acc 90.234 (86.103)	lr 0.00118
Train [104][950/3239]	Time 0.225 (0.519)	Data Time 0.001 (0.041)	Loss 2.2340 (2.3651)	Entropy 0.53639 (0.53755)	Top-1 acc 68.750 (67.081)	Top-5 acc 88.672 (86.093)	lr 0.00118
Train [104][960/3239]	Time 0.405 (0.573)	Data Time 0.002 (0.041)	Loss 2.4610 (2.3656)	Entropy 0.53640 (0.53754)	Top-1 acc 63.281 (67.070)	Top-5 acc 82.812 (86.077)	lr 0.00118
Train [104][970/3239]	Time 0.236 (0.572)	Data Time 0.002 (0.041)	Loss 2.5313 (2.3662)	Entropy 0.53591 (0.53753)	Top-1 acc 60.156 (67.054)	Top-5 acc 83.203 (86.070)	lr 0.00118
Train [104][980/3239]	Time 0.323 (0.571)	Data Time 0.001 (0.040)	Loss 2.3772 (2.3662)	Entropy 0.53582 (0.53751)	Top-1 acc 66.406 (67.059)	Top-5 acc 85.547 (86.061)	lr 0.00118
Train [104][990/3239]	Time 0.238 (0.569)	Data Time 0.001 (0.040)	Loss 2.4485 (2.3665)	Entropy 0.53575 (0.53749)	Top-1 acc 66.797 (67.049)	Top-5 acc 83.984 (86.062)	lr 0.00117
Train [104][1000/3239]	Time 0.229 (0.568)	Data Time 0.001 (0.039)	Loss 2.2580 (2.3664)	Entropy 0.53605 (0.53748)	Top-1 acc 73.828 (67.051)	Top-5 acc 87.891 (86.063)	lr 0.00117
Train [104][1010/3239]	Time 0.235 (0.567)	Data Time 0.001 (0.039)	Loss 2.4456 (2.3667)	Entropy 0.53603 (0.53747)	Top-1 acc 64.844 (67.046)	Top-5 acc 83.984 (86.057)	lr 0.00117
Train [104][1020/3239]	Time 0.277 (0.565)	Data Time 0.002 (0.039)	Loss 2.4344 (2.3668)	Entropy 0.53635 (0.53745)	Top-1 acc 64.062 (67.044)	Top-5 acc 87.109 (86.060)	lr 0.00117
Train [104][1030/3239]	Time 0.239 (0.565)	Data Time 0.001 (0.038)	Loss 2.2042 (2.3662)	Entropy 0.53668 (0.53744)	Top-1 acc 67.969 (67.065)	Top-5 acc 87.891 (86.069)	lr 0.00117
Train [104][1040/3239]	Time 0.256 (0.564)	Data Time 0.001 (0.038)	Loss 2.2542 (2.3662)	Entropy 0.53661 (0.53744)	Top-1 acc 69.531 (67.071)	Top-5 acc 88.281 (86.064)	lr 0.00117
Train [104][1050/3239]	Time 0.319 (0.562)	Data Time 0.001 (0.038)	Loss 2.2815 (2.3664)	Entropy 0.53633 (0.53743)	Top-1 acc 66.797 (67.063)	Top-5 acc 88.281 (86.063)	lr 0.00117
Train [104][1060/3239]	Time 0.222 (0.561)	Data Time 0.001 (0.037)	Loss 2.5311 (2.3664)	Entropy 0.53631 (0.53742)	Top-1 acc 62.109 (67.064)	Top-5 acc 84.375 (86.061)	lr 0.00117
Train [104][1070/3239]	Time 0.232 (0.560)	Data Time 0.001 (0.037)	Loss 2.3446 (2.3659)	Entropy 0.53596 (0.53741)	Top-1 acc 67.578 (67.069)	Top-5 acc 86.328 (86.071)	lr 0.00117
Train [104][1080/3239]	Time 0.232 (0.558)	Data Time 0.001 (0.037)	Loss 2.4347 (2.3660)	Entropy 0.53594 (0.53739)	Top-1 acc 67.969 (67.076)	Top-5 acc 84.766 (86.071)	lr 0.00117
Train [104][1090/3239]	Time 0.228 (0.557)	Data Time 0.001 (0.036)	Loss 2.2666 (2.3661)	Entropy 0.53638 (0.53738)	Top-1 acc 67.578 (67.075)	Top-5 acc 89.453 (86.064)	lr 0.00117
Train [104][1100/3239]	Time 0.226 (0.556)	Data Time 0.001 (0.036)	Loss 2.3056 (2.3659)	Entropy 0.53624 (0.53737)	Top-1 acc 64.844 (67.081)	Top-5 acc 88.281 (86.062)	lr 0.00117
Train [104][1110/3239]	Time 0.229 (0.554)	Data Time 0.001 (0.036)	Loss 2.3204 (2.3658)	Entropy 0.53611 (0.53736)	Top-1 acc 70.312 (67.079)	Top-5 acc 87.500 (86.067)	lr 0.00117
Train [104][1120/3239]	Time 0.229 (0.553)	Data Time 0.001 (0.035)	Loss 2.3906 (2.3659)	Entropy 0.53608 (0.53735)	Top-1 acc 63.281 (67.071)	Top-5 acc 85.547 (86.067)	lr 0.00117
Train [104][1130/3239]	Time 0.228 (0.552)	Data Time 0.001 (0.035)	Loss 2.3496 (2.3662)	Entropy 0.53623 (0.53734)	Top-1 acc 68.750 (67.058)	Top-5 acc 86.328 (86.067)	lr 0.00117
Train [104][1140/3239]	Time 0.245 (0.551)	Data Time 0.001 (0.035)	Loss 2.4012 (2.3660)	Entropy 0.53620 (0.53733)	Top-1 acc 66.406 (67.065)	Top-5 acc 85.938 (86.065)	lr 0.00117
Train [104][1150/3239]	Time 0.251 (0.550)	Data Time 0.001 (0.034)	Loss 2.4760 (2.3658)	Entropy 0.53648 (0.53732)	Top-1 acc 66.016 (67.067)	Top-5 acc 84.375 (86.065)	lr 0.00117
Train [104][1160/3239]	Time 0.229 (0.549)	Data Time 0.001 (0.034)	Loss 2.2225 (2.3659)	Entropy 0.53668 (0.53731)	Top-1 acc 70.312 (67.066)	Top-5 acc 88.281 (86.062)	lr 0.00117
Train [104][1170/3239]	Time 0.233 (0.548)	Data Time 0.001 (0.034)	Loss 2.2680 (2.3653)	Entropy 0.53671 (0.53731)	Top-1 acc 67.188 (67.081)	Top-5 acc 87.500 (86.067)	lr 0.00117
Train [104][1180/3239]	Time 0.254 (0.547)	Data Time 0.002 (0.034)	Loss 2.1597 (2.3648)	Entropy 0.53671 (0.53730)	Top-1 acc 69.922 (67.091)	Top-5 acc 89.453 (86.077)	lr 0.00117
Train [104][1190/3239]	Time 0.264 (0.546)	Data Time 0.001 (0.033)	Loss 2.2378 (2.3645)	Entropy 0.53701 (0.53730)	Top-1 acc 71.875 (67.103)	Top-5 acc 87.891 (86.079)	lr 0.00117
Train [104][1200/3239]	Time 0.233 (0.545)	Data Time 0.001 (0.033)	Loss 2.2353 (2.3642)	Entropy 0.53693 (0.53730)	Top-1 acc 68.750 (67.109)	Top-5 acc 89.062 (86.082)	lr 0.00117
Train [104][1210/3239]	Time 0.348 (0.544)	Data Time 0.001 (0.033)	Loss 2.3026 (2.3640)	Entropy 0.53663 (0.53729)	Top-1 acc 65.234 (67.114)	Top-5 acc 86.328 (86.090)	lr 0.00117
Train [104][1220/3239]	Time 0.241 (0.543)	Data Time 0.001 (0.033)	Loss 2.3139 (2.3641)	Entropy 0.53688 (0.53729)	Top-1 acc 68.750 (67.110)	Top-5 acc 87.891 (86.084)	lr 0.00117
Train [104][1230/3239]	Time 0.236 (0.542)	Data Time 0.001 (0.032)	Loss 2.4949 (2.3639)	Entropy 0.53655 (0.53729)	Top-1 acc 67.969 (67.118)	Top-5 acc 83.594 (86.088)	lr 0.00116
Train [104][1240/3239]	Time 0.252 (0.541)	Data Time 0.001 (0.032)	Loss 2.2023 (2.3636)	Entropy 0.53652 (0.53728)	Top-1 acc 71.875 (67.127)	Top-5 acc 89.062 (86.096)	lr 0.00116
Train [104][1250/3239]	Time 0.247 (0.540)	Data Time 0.001 (0.032)	Loss 2.2548 (2.3632)	Entropy 0.53663 (0.53727)	Top-1 acc 67.969 (67.139)	Top-5 acc 86.719 (86.104)	lr 0.00116
Train [104][1260/3239]	Time 0.233 (0.540)	Data Time 0.001 (0.032)	Loss 2.3343 (2.3634)	Entropy 0.53649 (0.53727)	Top-1 acc 70.312 (67.139)	Top-5 acc 85.938 (86.093)	lr 0.00116
Train [104][1270/3239]	Time 0.237 (0.539)	Data Time 0.001 (0.031)	Loss 2.2214 (2.3633)	Entropy 0.53629 (0.53726)	Top-1 acc 71.094 (67.138)	Top-5 acc 88.281 (86.094)	lr 0.00116
Train [104][1280/3239]	Time 0.337 (0.538)	Data Time 0.001 (0.031)	Loss 2.4307 (2.3631)	Entropy 0.53654 (0.53725)	Top-1 acc 66.797 (67.147)	Top-5 acc 85.156 (86.093)	lr 0.00116
Train [104][1290/3239]	Time 0.231 (0.537)	Data Time 0.001 (0.031)	Loss 2.3116 (2.3632)	Entropy 0.53623 (0.53725)	Top-1 acc 66.016 (67.142)	Top-5 acc 87.109 (86.091)	lr 0.00116
Train [104][1300/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.031)	Loss 2.2911 (2.3633)	Entropy 0.53613 (0.53724)	Top-1 acc 68.359 (67.144)	Top-5 acc 86.328 (86.096)	lr 0.00116
Train [104][1310/3239]	Time 0.227 (0.535)	Data Time 0.001 (0.030)	Loss 2.3333 (2.3629)	Entropy 0.53645 (0.53723)	Top-1 acc 69.141 (67.161)	Top-5 acc 84.766 (86.098)	lr 0.00116
Train [104][1320/3239]	Time 0.228 (0.534)	Data Time 0.001 (0.030)	Loss 2.1953 (2.3626)	Entropy 0.53600 (0.53722)	Top-1 acc 71.875 (67.176)	Top-5 acc 88.281 (86.099)	lr 0.00116
Train [104][1330/3239]	Time 0.234 (0.533)	Data Time 0.001 (0.030)	Loss 2.5156 (2.3628)	Entropy 0.53539 (0.53721)	Top-1 acc 64.453 (67.165)	Top-5 acc 83.594 (86.100)	lr 0.00116
Train [104][1340/3239]	Time 0.253 (0.533)	Data Time 0.001 (0.030)	Loss 2.2397 (2.3628)	Entropy 0.53563 (0.53720)	Top-1 acc 68.750 (67.167)	Top-5 acc 88.672 (86.101)	lr 0.00116
Train [104][1350/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.030)	Loss 2.4406 (2.3626)	Entropy 0.53570 (0.53719)	Top-1 acc 63.672 (67.169)	Top-5 acc 84.375 (86.101)	lr 0.00116
Train [104][1360/3239]	Time 0.254 (0.532)	Data Time 0.001 (0.029)	Loss 2.3396 (2.3626)	Entropy 0.53608 (0.53718)	Top-1 acc 67.969 (67.174)	Top-5 acc 87.500 (86.104)	lr 0.00116
Train [104][1370/3239]	Time 0.332 (0.531)	Data Time 0.001 (0.029)	Loss 2.5107 (2.3629)	Entropy 0.53612 (0.53717)	Top-1 acc 62.891 (67.164)	Top-5 acc 84.766 (86.100)	lr 0.00116
Train [104][1380/3239]	Time 0.258 (0.530)	Data Time 0.001 (0.029)	Loss 2.2797 (2.3627)	Entropy 0.53615 (0.53717)	Top-1 acc 71.094 (67.165)	Top-5 acc 87.500 (86.102)	lr 0.00116
Train [104][1390/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.029)	Loss 2.4451 (2.3627)	Entropy 0.53628 (0.53716)	Top-1 acc 63.672 (67.160)	Top-5 acc 83.984 (86.101)	lr 0.00116
Train [104][1400/3239]	Time 0.243 (0.529)	Data Time 0.001 (0.029)	Loss 2.4633 (2.3628)	Entropy 0.53599 (0.53715)	Top-1 acc 66.797 (67.158)	Top-5 acc 83.203 (86.095)	lr 0.00116
Train [104][1410/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.028)	Loss 2.2977 (2.3628)	Entropy 0.53640 (0.53714)	Top-1 acc 71.484 (67.157)	Top-5 acc 85.938 (86.090)	lr 0.00116
Train [104][1420/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.028)	Loss 2.4099 (2.3631)	Entropy 0.53635 (0.53714)	Top-1 acc 67.578 (67.151)	Top-5 acc 86.719 (86.087)	lr 0.00116
Train [104][1430/3239]	Time 0.241 (0.526)	Data Time 0.001 (0.028)	Loss 2.3817 (2.3633)	Entropy 0.53642 (0.53713)	Top-1 acc 69.141 (67.150)	Top-5 acc 85.547 (86.088)	lr 0.00116
Train [104][1440/3239]	Time 0.337 (0.526)	Data Time 0.001 (0.028)	Loss 2.4642 (2.3631)	Entropy 0.53668 (0.53713)	Top-1 acc 66.016 (67.152)	Top-5 acc 85.547 (86.091)	lr 0.00116
Train [104][1450/3239]	Time 0.227 (0.525)	Data Time 0.001 (0.028)	Loss 2.4306 (2.3634)	Entropy 0.53700 (0.53713)	Top-1 acc 66.797 (67.140)	Top-5 acc 85.156 (86.084)	lr 0.00116
Train [104][1460/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.027)	Loss 2.1882 (2.3632)	Entropy 0.53684 (0.53713)	Top-1 acc 73.047 (67.142)	Top-5 acc 89.062 (86.087)	lr 0.00115
Train [104][1470/3239]	Time 0.222 (0.523)	Data Time 0.001 (0.027)	Loss 2.4614 (2.3635)	Entropy 0.53696 (0.53712)	Top-1 acc 65.625 (67.135)	Top-5 acc 83.984 (86.080)	lr 0.00115
Train [104][1480/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.027)	Loss 2.2921 (2.3634)	Entropy 0.53700 (0.53712)	Top-1 acc 66.406 (67.135)	Top-5 acc 88.281 (86.081)	lr 0.00115
Train [104][1490/3239]	Time 0.222 (0.522)	Data Time 0.001 (0.027)	Loss 2.4985 (2.3637)	Entropy 0.53691 (0.53712)	Top-1 acc 64.062 (67.124)	Top-5 acc 84.766 (86.079)	lr 0.00115
Train [104][1500/3239]	Time 0.250 (0.522)	Data Time 0.001 (0.027)	Loss 2.5485 (2.3641)	Entropy 0.53689 (0.53712)	Top-1 acc 62.891 (67.121)	Top-5 acc 82.812 (86.072)	lr 0.00115
Train [104][1510/3239]	Time 0.238 (0.521)	Data Time 0.001 (0.027)	Loss 2.1904 (2.3639)	Entropy 0.53693 (0.53712)	Top-1 acc 68.750 (67.120)	Top-5 acc 89.453 (86.075)	lr 0.00115
Train [104][1520/3239]	Time 0.222 (0.520)	Data Time 0.001 (0.026)	Loss 2.4388 (2.3641)	Entropy 0.53735 (0.53712)	Top-1 acc 66.016 (67.115)	Top-5 acc 84.766 (86.073)	lr 0.00115
Train [104][1530/3239]	Time 0.337 (0.520)	Data Time 0.001 (0.026)	Loss 2.4653 (2.3648)	Entropy 0.53734 (0.53712)	Top-1 acc 63.672 (67.097)	Top-5 acc 83.594 (86.060)	lr 0.00115
Train [104][1540/3239]	Time 0.223 (0.519)	Data Time 0.001 (0.026)	Loss 2.4314 (2.3648)	Entropy 0.53757 (0.53712)	Top-1 acc 65.625 (67.105)	Top-5 acc 84.375 (86.060)	lr 0.00115
Train [104][1550/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.026)	Loss 2.4091 (2.3650)	Entropy 0.53769 (0.53712)	Top-1 acc 67.969 (67.102)	Top-5 acc 86.328 (86.053)	lr 0.00115
Train [104][1560/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.026)	Loss 2.3566 (2.3648)	Entropy 0.53749 (0.53713)	Top-1 acc 70.703 (67.110)	Top-5 acc 83.594 (86.060)	lr 0.00115
Train [104][1570/3239]	Time 0.239 (0.517)	Data Time 0.001 (0.026)	Loss 2.3411 (2.3651)	Entropy 0.53779 (0.53713)	Top-1 acc 64.844 (67.104)	Top-5 acc 87.500 (86.056)	lr 0.00115
Train [104][1580/3239]	Time 0.236 (0.516)	Data Time 0.001 (0.025)	Loss 2.4114 (2.3653)	Entropy 0.53779 (0.53713)	Top-1 acc 64.453 (67.097)	Top-5 acc 84.766 (86.051)	lr 0.00115
Train [104][1590/3239]	Time 0.233 (0.516)	Data Time 0.001 (0.025)	Loss 2.5108 (2.3651)	Entropy 0.53763 (0.53714)	Top-1 acc 62.891 (67.106)	Top-5 acc 84.375 (86.053)	lr 0.00115
Train [104][1600/3239]	Time 0.339 (0.515)	Data Time 0.001 (0.025)	Loss 2.3770 (2.3655)	Entropy 0.53743 (0.53714)	Top-1 acc 68.359 (67.097)	Top-5 acc 87.109 (86.044)	lr 0.00115
Train [104][1610/3239]	Time 0.379 (0.548)	Data Time 0.007 (0.025)	Loss 2.4090 (2.3657)	Entropy 0.53691 (0.53714)	Top-1 acc 64.844 (67.087)	Top-5 acc 83.203 (86.035)	lr 0.00115
Train [104][1620/3239]	Time 0.243 (0.547)	Data Time 0.002 (0.025)	Loss 2.0982 (2.3656)	Entropy 0.53707 (0.53714)	Top-1 acc 75.000 (67.088)	Top-5 acc 91.016 (86.039)	lr 0.00115
Train [104][1630/3239]	Time 0.231 (0.547)	Data Time 0.001 (0.025)	Loss 2.5600 (2.3662)	Entropy 0.53712 (0.53714)	Top-1 acc 65.234 (67.073)	Top-5 acc 81.250 (86.026)	lr 0.00115
Train [104][1640/3239]	Time 0.245 (0.546)	Data Time 0.001 (0.025)	Loss 2.7825 (2.3669)	Entropy 0.53716 (0.53714)	Top-1 acc 56.641 (67.055)	Top-5 acc 76.562 (86.011)	lr 0.00115
Train [104][1650/3239]	Time 0.311 (0.545)	Data Time 0.001 (0.025)	Loss 2.4050 (2.3669)	Entropy 0.53692 (0.53714)	Top-1 acc 64.062 (67.055)	Top-5 acc 87.109 (86.010)	lr 0.00115
Train [104][1660/3239]	Time 0.233 (0.545)	Data Time 0.001 (0.024)	Loss 2.6464 (2.3670)	Entropy 0.53695 (0.53714)	Top-1 acc 56.641 (67.050)	Top-5 acc 83.594 (86.006)	lr 0.00115
Train [104][1670/3239]	Time 0.247 (0.544)	Data Time 0.002 (0.024)	Loss 2.2476 (2.3670)	Entropy 0.53658 (0.53714)	Top-1 acc 71.875 (67.053)	Top-5 acc 87.891 (86.008)	lr 0.00115
Train [104][1680/3239]	Time 0.238 (0.543)	Data Time 0.001 (0.024)	Loss 2.5857 (2.3674)	Entropy 0.53659 (0.53713)	Top-1 acc 62.109 (67.042)	Top-5 acc 82.422 (86.002)	lr 0.00115
Train [104][1690/3239]	Time 0.331 (0.542)	Data Time 0.001 (0.024)	Loss 2.6141 (2.3671)	Entropy 0.53654 (0.53713)	Top-1 acc 60.547 (67.051)	Top-5 acc 80.078 (86.005)	lr 0.00115
Train [104][1700/3239]	Time 0.223 (0.542)	Data Time 0.001 (0.024)	Loss 2.4219 (2.3672)	Entropy 0.53651 (0.53713)	Top-1 acc 64.844 (67.049)	Top-5 acc 81.641 (86.002)	lr 0.00114
Train [104][1710/3239]	Time 0.236 (0.541)	Data Time 0.001 (0.024)	Loss 2.1243 (2.3668)	Entropy 0.53663 (0.53712)	Top-1 acc 71.094 (67.062)	Top-5 acc 92.578 (86.009)	lr 0.00114
Train [104][1720/3239]	Time 0.232 (0.540)	Data Time 0.001 (0.024)	Loss 3.0663 (2.3676)	Entropy 0.53665 (0.53712)	Top-1 acc 52.344 (67.049)	Top-5 acc 75.391 (85.995)	lr 0.00114
Train [104][1730/3239]	Time 0.273 (0.540)	Data Time 0.001 (0.023)	Loss 2.4289 (2.3675)	Entropy 0.53654 (0.53712)	Top-1 acc 63.281 (67.051)	Top-5 acc 85.938 (85.996)	lr 0.00114
Train [104][1740/3239]	Time 0.243 (0.539)	Data Time 0.002 (0.023)	Loss 2.4522 (2.3673)	Entropy 0.53603 (0.53711)	Top-1 acc 65.234 (67.063)	Top-5 acc 84.375 (86.000)	lr 0.00114
Train [104][1750/3239]	Time 0.236 (0.538)	Data Time 0.001 (0.023)	Loss 2.4736 (2.3673)	Entropy 0.53596 (0.53711)	Top-1 acc 67.578 (67.063)	Top-5 acc 82.422 (85.999)	lr 0.00114
Train [104][1760/3239]	Time 0.331 (0.537)	Data Time 0.001 (0.023)	Loss 2.3096 (2.3673)	Entropy 0.53593 (0.53710)	Top-1 acc 69.141 (67.059)	Top-5 acc 85.156 (85.995)	lr 0.00114
Train [104][1770/3239]	Time 0.235 (0.537)	Data Time 0.001 (0.023)	Loss 2.2589 (2.3669)	Entropy 0.53620 (0.53709)	Top-1 acc 73.828 (67.070)	Top-5 acc 87.891 (86.001)	lr 0.00114
Train [104][1780/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.023)	Loss 2.4939 (2.3671)	Entropy 0.53611 (0.53709)	Top-1 acc 67.188 (67.066)	Top-5 acc 83.203 (86.000)	lr 0.00114
Train [104][1790/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.023)	Loss 2.3799 (2.3670)	Entropy 0.53645 (0.53708)	Top-1 acc 65.625 (67.071)	Top-5 acc 85.547 (86.004)	lr 0.00114
Train [104][1800/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.023)	Loss 2.2227 (2.3670)	Entropy 0.53662 (0.53708)	Top-1 acc 73.047 (67.072)	Top-5 acc 89.844 (86.006)	lr 0.00114
Train [104][1810/3239]	Time 0.220 (0.534)	Data Time 0.001 (0.022)	Loss 2.8181 (2.3671)	Entropy 0.53641 (0.53708)	Top-1 acc 56.250 (67.069)	Top-5 acc 81.250 (86.007)	lr 0.00114
Train [104][1820/3239]	Time 0.223 (0.534)	Data Time 0.001 (0.022)	Loss 2.3173 (2.3672)	Entropy 0.53629 (0.53707)	Top-1 acc 69.141 (67.065)	Top-5 acc 85.938 (86.001)	lr 0.00114
Train [104][1830/3239]	Time 0.234 (0.533)	Data Time 0.001 (0.022)	Loss 2.3824 (2.3669)	Entropy 0.53618 (0.53707)	Top-1 acc 67.969 (67.075)	Top-5 acc 85.938 (86.009)	lr 0.00114
Train [104][1840/3239]	Time 0.221 (0.532)	Data Time 0.001 (0.022)	Loss 2.3361 (2.3668)	Entropy 0.53601 (0.53706)	Top-1 acc 66.797 (67.079)	Top-5 acc 86.719 (86.006)	lr 0.00114
Train [104][1850/3239]	Time 0.283 (0.532)	Data Time 0.001 (0.022)	Loss 2.4954 (2.3667)	Entropy 0.53603 (0.53706)	Top-1 acc 68.359 (67.082)	Top-5 acc 84.766 (86.009)	lr 0.00114
Train [104][1860/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.022)	Loss 2.4227 (2.3661)	Entropy 0.53606 (0.53705)	Top-1 acc 66.016 (67.097)	Top-5 acc 84.766 (86.019)	lr 0.00114
Train [104][1870/3239]	Time 0.226 (0.531)	Data Time 0.001 (0.022)	Loss 2.6096 (2.3663)	Entropy 0.53576 (0.53705)	Top-1 acc 63.281 (67.092)	Top-5 acc 80.469 (86.018)	lr 0.00114
Train [104][1880/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.022)	Loss 2.3849 (2.3663)	Entropy 0.53563 (0.53704)	Top-1 acc 67.969 (67.089)	Top-5 acc 86.719 (86.020)	lr 0.00114
Train [104][1890/3239]	Time 0.228 (0.530)	Data Time 0.001 (0.022)	Loss 2.1228 (2.3664)	Entropy 0.53572 (0.53703)	Top-1 acc 72.266 (67.084)	Top-5 acc 89.453 (86.019)	lr 0.00114
Train [104][1900/3239]	Time 0.225 (0.529)	Data Time 0.001 (0.021)	Loss 2.1332 (2.3667)	Entropy 0.53584 (0.53703)	Top-1 acc 71.484 (67.078)	Top-5 acc 90.234 (86.014)	lr 0.00114
Train [104][1910/3239]	Time 0.225 (0.529)	Data Time 0.001 (0.021)	Loss 2.2019 (2.3665)	Entropy 0.53599 (0.53702)	Top-1 acc 71.875 (67.082)	Top-5 acc 86.719 (86.020)	lr 0.00114
Train [104][1920/3239]	Time 0.327 (0.528)	Data Time 0.001 (0.021)	Loss 2.4753 (2.3664)	Entropy 0.53615 (0.53701)	Top-1 acc 63.281 (67.080)	Top-5 acc 83.984 (86.021)	lr 0.00114
Train [104][1930/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.021)	Loss 2.3285 (2.3663)	Entropy 0.53621 (0.53701)	Top-1 acc 65.625 (67.082)	Top-5 acc 87.109 (86.027)	lr 0.00114
Train [104][1940/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.021)	Loss 2.2933 (2.3659)	Entropy 0.53625 (0.53701)	Top-1 acc 70.312 (67.093)	Top-5 acc 87.500 (86.033)	lr 0.00113
Train [104][1950/3239]	Time 0.287 (0.527)	Data Time 0.001 (0.021)	Loss 2.8581 (2.3662)	Entropy 0.53618 (0.53700)	Top-1 acc 56.641 (67.089)	Top-5 acc 76.172 (86.030)	lr 0.00113
Train [104][1960/3239]	Time 0.283 (0.527)	Data Time 0.001 (0.021)	Loss 2.4901 (2.3667)	Entropy 0.53609 (0.53700)	Top-1 acc 65.625 (67.077)	Top-5 acc 83.594 (86.021)	lr 0.00113
Train [104][1970/3239]	Time 0.235 (0.526)	Data Time 0.001 (0.021)	Loss 2.2636 (2.3670)	Entropy 0.53563 (0.53699)	Top-1 acc 70.703 (67.067)	Top-5 acc 87.109 (86.015)	lr 0.00113
Train [104][1980/3239]	Time 0.227 (0.526)	Data Time 0.001 (0.021)	Loss 2.3394 (2.3669)	Entropy 0.53601 (0.53699)	Top-1 acc 70.312 (67.073)	Top-5 acc 85.156 (86.017)	lr 0.00113
Train [104][1990/3239]	Time 0.352 (0.525)	Data Time 0.001 (0.021)	Loss 2.5430 (2.3669)	Entropy 0.53626 (0.53698)	Top-1 acc 68.359 (67.075)	Top-5 acc 82.031 (86.017)	lr 0.00113
Train [104][2000/3239]	Time 0.265 (0.525)	Data Time 0.001 (0.020)	Loss 2.2451 (2.3668)	Entropy 0.53628 (0.53698)	Top-1 acc 68.359 (67.074)	Top-5 acc 89.062 (86.017)	lr 0.00113
Train [104][2010/3239]	Time 0.243 (0.525)	Data Time 0.001 (0.020)	Loss 2.3115 (2.3671)	Entropy 0.53638 (0.53697)	Top-1 acc 69.922 (67.068)	Top-5 acc 85.547 (86.012)	lr 0.00113
Train [104][2020/3239]	Time 0.224 (0.524)	Data Time 0.001 (0.020)	Loss 2.6012 (2.3672)	Entropy 0.53652 (0.53697)	Top-1 acc 60.156 (67.060)	Top-5 acc 80.859 (86.007)	lr 0.00113
Train [104][2030/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.020)	Loss 2.2247 (2.3669)	Entropy 0.53621 (0.53697)	Top-1 acc 69.922 (67.069)	Top-5 acc 87.891 (86.010)	lr 0.00113
Train [104][2040/3239]	Time 0.243 (0.523)	Data Time 0.001 (0.020)	Loss 2.5944 (2.3672)	Entropy 0.53633 (0.53697)	Top-1 acc 62.500 (67.064)	Top-5 acc 81.641 (86.003)	lr 0.00113
Train [104][2050/3239]	Time 0.245 (0.523)	Data Time 0.001 (0.020)	Loss 2.3966 (2.3669)	Entropy 0.53637 (0.53696)	Top-1 acc 65.625 (67.071)	Top-5 acc 87.109 (86.008)	lr 0.00113
Train [104][2060/3239]	Time 0.240 (0.522)	Data Time 0.001 (0.020)	Loss 2.2214 (2.3669)	Entropy 0.53562 (0.53696)	Top-1 acc 70.703 (67.072)	Top-5 acc 87.891 (86.008)	lr 0.00113
Train [104][2070/3239]	Time 0.234 (0.522)	Data Time 0.001 (0.020)	Loss 2.3554 (2.3671)	Entropy 0.53554 (0.53695)	Top-1 acc 66.016 (67.067)	Top-5 acc 87.891 (86.003)	lr 0.00113
Train [104][2080/3239]	Time 0.356 (0.521)	Data Time 0.001 (0.020)	Loss 2.2911 (2.3671)	Entropy 0.53534 (0.53695)	Top-1 acc 68.750 (67.067)	Top-5 acc 87.109 (86.000)	lr 0.00113
Train [104][2090/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.020)	Loss 2.3426 (2.3671)	Entropy 0.53568 (0.53694)	Top-1 acc 67.578 (67.070)	Top-5 acc 82.812 (85.999)	lr 0.00113
Train [104][2100/3239]	Time 0.263 (0.520)	Data Time 0.001 (0.020)	Loss 2.3336 (2.3671)	Entropy 0.53561 (0.53693)	Top-1 acc 65.625 (67.069)	Top-5 acc 85.547 (85.996)	lr 0.00113
Train [104][2110/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.020)	Loss 2.3518 (2.3671)	Entropy 0.53585 (0.53693)	Top-1 acc 69.141 (67.070)	Top-5 acc 85.547 (85.991)	lr 0.00113
Train [104][2120/3239]	Time 0.229 (0.519)	Data Time 0.001 (0.019)	Loss 2.3324 (2.3674)	Entropy 0.53556 (0.53692)	Top-1 acc 67.578 (67.066)	Top-5 acc 86.719 (85.986)	lr 0.00113
Train [104][2130/3239]	Time 0.226 (0.518)	Data Time 0.001 (0.019)	Loss 2.3325 (2.3672)	Entropy 0.53597 (0.53692)	Top-1 acc 68.359 (67.078)	Top-5 acc 87.500 (85.989)	lr 0.00113
Train [104][2140/3239]	Time 0.220 (0.518)	Data Time 0.001 (0.019)	Loss 2.5675 (2.3673)	Entropy 0.53558 (0.53691)	Top-1 acc 58.984 (67.069)	Top-5 acc 80.859 (85.981)	lr 0.00113
Train [104][2150/3239]	Time 0.323 (0.517)	Data Time 0.001 (0.019)	Loss 2.2208 (2.3673)	Entropy 0.53566 (0.53690)	Top-1 acc 71.875 (67.070)	Top-5 acc 87.891 (85.981)	lr 0.00113
Train [104][2160/3239]	Time 0.232 (0.517)	Data Time 0.001 (0.019)	Loss 2.2822 (2.3673)	Entropy 0.53526 (0.53690)	Top-1 acc 70.312 (67.065)	Top-5 acc 86.719 (85.981)	lr 0.00113
Train [104][2170/3239]	Time 0.240 (0.516)	Data Time 0.001 (0.019)	Loss 2.5138 (2.3677)	Entropy 0.53538 (0.53689)	Top-1 acc 62.891 (67.055)	Top-5 acc 81.250 (85.969)	lr 0.00113
Train [104][2180/3239]	Time 0.230 (0.516)	Data Time 0.001 (0.019)	Loss 2.1032 (2.3675)	Entropy 0.53550 (0.53688)	Top-1 acc 70.312 (67.057)	Top-5 acc 92.188 (85.974)	lr 0.00112
Train [104][2190/3239]	Time 0.222 (0.515)	Data Time 0.001 (0.019)	Loss 2.2568 (2.3674)	Entropy 0.53554 (0.53688)	Top-1 acc 72.656 (67.062)	Top-5 acc 86.719 (85.973)	lr 0.00112
Train [104][2200/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.019)	Loss 2.3770 (2.3673)	Entropy 0.53557 (0.53687)	Top-1 acc 66.797 (67.067)	Top-5 acc 86.719 (85.978)	lr 0.00112
Train [104][2210/3239]	Time 0.233 (0.514)	Data Time 0.001 (0.019)	Loss 2.4539 (2.3678)	Entropy 0.53588 (0.53687)	Top-1 acc 66.797 (67.057)	Top-5 acc 83.984 (85.968)	lr 0.00112
Train [104][2220/3239]	Time 0.234 (0.514)	Data Time 0.001 (0.019)	Loss 2.3110 (2.3683)	Entropy 0.53558 (0.53686)	Top-1 acc 67.578 (67.046)	Top-5 acc 85.156 (85.959)	lr 0.00112
Train [104][2230/3239]	Time 0.225 (0.513)	Data Time 0.001 (0.019)	Loss 2.2111 (2.3683)	Entropy 0.53542 (0.53686)	Top-1 acc 71.094 (67.044)	Top-5 acc 89.844 (85.959)	lr 0.00112
Train [104][2240/3239]	Time 0.255 (0.513)	Data Time 0.001 (0.018)	Loss 2.4701 (2.3683)	Entropy 0.53540 (0.53685)	Top-1 acc 62.109 (67.041)	Top-5 acc 85.156 (85.960)	lr 0.00112
Train [104][2250/3239]	Time 0.234 (0.513)	Data Time 0.001 (0.018)	Loss 2.1845 (2.3683)	Entropy 0.53525 (0.53684)	Top-1 acc 70.703 (67.040)	Top-5 acc 88.672 (85.961)	lr 0.00112
Train [104][2260/3239]	Time 0.224 (0.512)	Data Time 0.001 (0.018)	Loss 2.3618 (2.3684)	Entropy 0.53493 (0.53684)	Top-1 acc 67.578 (67.038)	Top-5 acc 85.547 (85.958)	lr 0.00112
Train [104][2270/3239]	Time 0.336 (0.535)	Data Time 0.029 (0.018)	Loss 2.4480 (2.3686)	Entropy 0.53525 (0.53683)	Top-1 acc 64.453 (67.037)	Top-5 acc 83.984 (85.954)	lr 0.00112
Train [104][2280/3239]	Time 0.239 (0.535)	Data Time 0.002 (0.018)	Loss 2.4983 (2.3688)	Entropy 0.53504 (0.53682)	Top-1 acc 63.281 (67.028)	Top-5 acc 80.859 (85.948)	lr 0.00112
Train [104][2290/3239]	Time 0.231 (0.534)	Data Time 0.001 (0.018)	Loss 2.2874 (2.3689)	Entropy 0.53512 (0.53681)	Top-1 acc 67.188 (67.023)	Top-5 acc 88.672 (85.944)	lr 0.00112
Train [104][2300/3239]	Time 0.228 (0.534)	Data Time 0.001 (0.018)	Loss 2.2895 (2.3686)	Entropy 0.53537 (0.53681)	Top-1 acc 67.188 (67.032)	Top-5 acc 89.453 (85.950)	lr 0.00112
Train [104][2310/3239]	Time 0.334 (0.533)	Data Time 0.001 (0.018)	Loss 2.3486 (2.3685)	Entropy 0.53568 (0.53680)	Top-1 acc 67.969 (67.031)	Top-5 acc 88.281 (85.954)	lr 0.00112
Train [104][2320/3239]	Time 0.228 (0.533)	Data Time 0.001 (0.018)	Loss 2.3695 (2.3685)	Entropy 0.53548 (0.53680)	Top-1 acc 64.453 (67.029)	Top-5 acc 85.156 (85.956)	lr 0.00112
Train [104][2330/3239]	Time 0.228 (0.532)	Data Time 0.001 (0.018)	Loss 2.2291 (2.3684)	Entropy 0.53541 (0.53679)	Top-1 acc 71.094 (67.027)	Top-5 acc 87.109 (85.956)	lr 0.00112
Train [104][2340/3239]	Time 0.223 (0.532)	Data Time 0.001 (0.018)	Loss 2.3257 (2.3685)	Entropy 0.53527 (0.53678)	Top-1 acc 70.312 (67.026)	Top-5 acc 87.891 (85.959)	lr 0.00112
Train [104][2350/3239]	Time 0.233 (0.531)	Data Time 0.001 (0.018)	Loss 2.4506 (2.3684)	Entropy 0.53538 (0.53678)	Top-1 acc 64.062 (67.026)	Top-5 acc 83.203 (85.960)	lr 0.00112
Train [104][2360/3239]	Time 0.247 (0.531)	Data Time 0.001 (0.018)	Loss 2.3392 (2.3684)	Entropy 0.53553 (0.53677)	Top-1 acc 64.453 (67.025)	Top-5 acc 86.719 (85.965)	lr 0.00112
Train [104][2370/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.018)	Loss 2.4424 (2.3681)	Entropy 0.53514 (0.53677)	Top-1 acc 64.062 (67.028)	Top-5 acc 85.938 (85.969)	lr 0.00112
Train [104][2380/3239]	Time 0.253 (0.530)	Data Time 0.001 (0.017)	Loss 2.2363 (2.3681)	Entropy 0.53529 (0.53676)	Top-1 acc 74.219 (67.028)	Top-5 acc 89.062 (85.971)	lr 0.00112
Train [104][2390/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.017)	Loss 2.4266 (2.3680)	Entropy 0.53502 (0.53675)	Top-1 acc 65.625 (67.033)	Top-5 acc 84.766 (85.974)	lr 0.00112
Train [104][2400/3239]	Time 0.250 (0.529)	Data Time 0.001 (0.017)	Loss 2.4537 (2.3684)	Entropy 0.53456 (0.53674)	Top-1 acc 62.500 (67.023)	Top-5 acc 83.594 (85.967)	lr 0.00112
Train [104][2410/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.017)	Loss 2.3994 (2.3683)	Entropy 0.53470 (0.53673)	Top-1 acc 65.625 (67.028)	Top-5 acc 83.203 (85.967)	lr 0.00112
Train [104][2420/3239]	Time 0.234 (0.528)	Data Time 0.001 (0.017)	Loss 2.2552 (2.3684)	Entropy 0.53466 (0.53673)	Top-1 acc 69.141 (67.026)	Top-5 acc 90.625 (85.967)	lr 0.00111
Train [104][2430/3239]	Time 0.225 (0.527)	Data Time 0.001 (0.017)	Loss 2.4353 (2.3682)	Entropy 0.53450 (0.53672)	Top-1 acc 65.234 (67.030)	Top-5 acc 86.719 (85.970)	lr 0.00111
Train [104][2440/3239]	Time 0.230 (0.527)	Data Time 0.001 (0.017)	Loss 2.4140 (2.3680)	Entropy 0.53464 (0.53671)	Top-1 acc 69.922 (67.041)	Top-5 acc 85.938 (85.973)	lr 0.00111
Train [104][2450/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.017)	Loss 2.3159 (2.3678)	Entropy 0.53496 (0.53670)	Top-1 acc 68.359 (67.044)	Top-5 acc 85.938 (85.976)	lr 0.00111
Train [104][2460/3239]	Time 0.225 (0.526)	Data Time 0.001 (0.017)	Loss 2.3681 (2.3679)	Entropy 0.53511 (0.53669)	Top-1 acc 65.625 (67.041)	Top-5 acc 87.500 (85.977)	lr 0.00111
Train [104][2470/3239]	Time 0.406 (0.526)	Data Time 0.001 (0.017)	Loss 2.4435 (2.3679)	Entropy 0.53528 (0.53669)	Top-1 acc 65.625 (67.041)	Top-5 acc 86.328 (85.976)	lr 0.00111
Train [104][2480/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.017)	Loss 2.4193 (2.3680)	Entropy 0.53493 (0.53668)	Top-1 acc 67.969 (67.043)	Top-5 acc 84.766 (85.974)	lr 0.00111
Train [104][2490/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.017)	Loss 2.3027 (2.3679)	Entropy 0.53504 (0.53667)	Top-1 acc 71.875 (67.050)	Top-5 acc 86.328 (85.976)	lr 0.00111
Train [104][2500/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.017)	Loss 2.1864 (2.3678)	Entropy 0.53513 (0.53667)	Top-1 acc 71.875 (67.053)	Top-5 acc 90.234 (85.978)	lr 0.00111
Train [104][2510/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.017)	Loss 2.4431 (2.3677)	Entropy 0.53524 (0.53666)	Top-1 acc 64.453 (67.059)	Top-5 acc 83.594 (85.978)	lr 0.00111
Train [104][2520/3239]	Time 0.278 (0.524)	Data Time 0.001 (0.017)	Loss 2.3068 (2.3677)	Entropy 0.53523 (0.53666)	Top-1 acc 68.750 (67.055)	Top-5 acc 87.891 (85.977)	lr 0.00111
Train [104][2530/3239]	Time 0.229 (0.524)	Data Time 0.001 (0.017)	Loss 2.5238 (2.3679)	Entropy 0.53497 (0.53665)	Top-1 acc 64.844 (67.054)	Top-5 acc 85.156 (85.975)	lr 0.00111
Train [104][2540/3239]	Time 0.333 (0.523)	Data Time 0.001 (0.016)	Loss 2.2651 (2.3680)	Entropy 0.53498 (0.53664)	Top-1 acc 70.312 (67.051)	Top-5 acc 86.328 (85.972)	lr 0.00111
Train [104][2550/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.016)	Loss 2.3383 (2.3681)	Entropy 0.53464 (0.53664)	Top-1 acc 69.531 (67.050)	Top-5 acc 86.719 (85.970)	lr 0.00111
Train [104][2560/3239]	Time 0.244 (0.522)	Data Time 0.001 (0.016)	Loss 2.2784 (2.3683)	Entropy 0.53507 (0.53663)	Top-1 acc 69.531 (67.042)	Top-5 acc 89.062 (85.968)	lr 0.00111
Train [104][2570/3239]	Time 0.231 (0.522)	Data Time 0.001 (0.016)	Loss 2.3096 (2.3683)	Entropy 0.53527 (0.53662)	Top-1 acc 67.578 (67.042)	Top-5 acc 90.625 (85.972)	lr 0.00111
Train [104][2580/3239]	Time 0.226 (0.522)	Data Time 0.001 (0.016)	Loss 2.3935 (2.3683)	Entropy 0.53511 (0.53662)	Top-1 acc 63.672 (67.041)	Top-5 acc 85.547 (85.972)	lr 0.00111
Train [104][2590/3239]	Time 0.226 (0.521)	Data Time 0.001 (0.016)	Loss 2.4141 (2.3684)	Entropy 0.53531 (0.53661)	Top-1 acc 65.625 (67.038)	Top-5 acc 85.156 (85.972)	lr 0.00111
Train [104][2600/3239]	Time 0.221 (0.521)	Data Time 0.001 (0.016)	Loss 2.4829 (2.3684)	Entropy 0.53515 (0.53661)	Top-1 acc 61.328 (67.041)	Top-5 acc 83.203 (85.973)	lr 0.00111
Train [104][2610/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.016)	Loss 2.4478 (2.3685)	Entropy 0.53530 (0.53660)	Top-1 acc 65.625 (67.038)	Top-5 acc 83.203 (85.972)	lr 0.00111
Train [104][2620/3239]	Time 0.246 (0.520)	Data Time 0.001 (0.016)	Loss 2.3274 (2.3685)	Entropy 0.53537 (0.53660)	Top-1 acc 69.531 (67.035)	Top-5 acc 85.547 (85.971)	lr 0.00111
Train [104][2630/3239]	Time 0.334 (0.520)	Data Time 0.001 (0.016)	Loss 2.2192 (2.3685)	Entropy 0.53568 (0.53659)	Top-1 acc 68.359 (67.033)	Top-5 acc 88.672 (85.972)	lr 0.00111
Train [104][2640/3239]	Time 0.233 (0.519)	Data Time 0.001 (0.016)	Loss 2.3637 (2.3687)	Entropy 0.53560 (0.53659)	Top-1 acc 67.578 (67.028)	Top-5 acc 85.938 (85.966)	lr 0.00111
Train [104][2650/3239]	Time 0.234 (0.519)	Data Time 0.001 (0.016)	Loss 2.3382 (2.3686)	Entropy 0.53559 (0.53659)	Top-1 acc 66.406 (67.032)	Top-5 acc 87.109 (85.967)	lr 0.00111
Train [104][2660/3239]	Time 0.224 (0.518)	Data Time 0.001 (0.016)	Loss 2.4595 (2.3686)	Entropy 0.53567 (0.53658)	Top-1 acc 67.578 (67.037)	Top-5 acc 85.547 (85.969)	lr 0.00110
Train [104][2670/3239]	Time 0.228 (0.518)	Data Time 0.001 (0.016)	Loss 2.2276 (2.3686)	Entropy 0.53571 (0.53658)	Top-1 acc 69.531 (67.035)	Top-5 acc 86.719 (85.967)	lr 0.00110
Train [104][2680/3239]	Time 0.216 (0.517)	Data Time 0.001 (0.016)	Loss 2.2568 (2.3685)	Entropy 0.53573 (0.53657)	Top-1 acc 69.141 (67.038)	Top-5 acc 87.500 (85.970)	lr 0.00110
Train [104][2690/3239]	Time 0.223 (0.517)	Data Time 0.001 (0.016)	Loss 2.4246 (2.3685)	Entropy 0.53553 (0.53657)	Top-1 acc 66.406 (67.039)	Top-5 acc 85.938 (85.969)	lr 0.00110
Train [104][2700/3239]	Time 0.325 (0.517)	Data Time 0.001 (0.016)	Loss 2.3516 (2.3685)	Entropy 0.53552 (0.53657)	Top-1 acc 68.750 (67.044)	Top-5 acc 86.328 (85.968)	lr 0.00110
Train [104][2710/3239]	Time 0.276 (0.516)	Data Time 0.001 (0.016)	Loss 2.2707 (2.3684)	Entropy 0.53562 (0.53656)	Top-1 acc 71.484 (67.047)	Top-5 acc 87.500 (85.969)	lr 0.00110
Train [104][2720/3239]	Time 0.225 (0.516)	Data Time 0.001 (0.015)	Loss 2.3237 (2.3684)	Entropy 0.53559 (0.53656)	Top-1 acc 71.094 (67.054)	Top-5 acc 86.719 (85.971)	lr 0.00110
Train [104][2730/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.015)	Loss 2.2426 (2.3683)	Entropy 0.53577 (0.53656)	Top-1 acc 69.531 (67.056)	Top-5 acc 87.109 (85.971)	lr 0.00110
Train [104][2740/3239]	Time 0.225 (0.515)	Data Time 0.001 (0.015)	Loss 2.5763 (2.3681)	Entropy 0.53560 (0.53655)	Top-1 acc 62.500 (67.064)	Top-5 acc 83.203 (85.975)	lr 0.00110
Train [104][2750/3239]	Time 0.226 (0.515)	Data Time 0.001 (0.015)	Loss 2.3310 (2.3680)	Entropy 0.53546 (0.53655)	Top-1 acc 66.406 (67.067)	Top-5 acc 85.938 (85.978)	lr 0.00110
Train [104][2760/3239]	Time 0.220 (0.514)	Data Time 0.001 (0.015)	Loss 2.3864 (2.3681)	Entropy 0.53557 (0.53655)	Top-1 acc 64.844 (67.060)	Top-5 acc 86.719 (85.977)	lr 0.00110
Train [104][2770/3239]	Time 0.236 (0.514)	Data Time 0.001 (0.015)	Loss 2.3453 (2.3678)	Entropy 0.53579 (0.53654)	Top-1 acc 68.750 (67.067)	Top-5 acc 86.328 (85.985)	lr 0.00110
Train [104][2780/3239]	Time 0.239 (0.513)	Data Time 0.001 (0.015)	Loss 2.3931 (2.3681)	Entropy 0.53561 (0.53654)	Top-1 acc 66.406 (67.063)	Top-5 acc 83.203 (85.980)	lr 0.00110
Train [104][2790/3239]	Time 0.333 (0.513)	Data Time 0.001 (0.015)	Loss 2.1113 (2.3680)	Entropy 0.53589 (0.53654)	Top-1 acc 71.094 (67.068)	Top-5 acc 91.797 (85.986)	lr 0.00110
Train [104][2800/3239]	Time 0.275 (0.513)	Data Time 0.001 (0.015)	Loss 2.4979 (2.3682)	Entropy 0.53603 (0.53654)	Top-1 acc 63.281 (67.062)	Top-5 acc 82.812 (85.981)	lr 0.00110
Train [104][2810/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.015)	Loss 2.3358 (2.3682)	Entropy 0.53627 (0.53653)	Top-1 acc 68.359 (67.065)	Top-5 acc 86.328 (85.982)	lr 0.00110
Train [104][2820/3239]	Time 0.237 (0.512)	Data Time 0.001 (0.015)	Loss 2.2469 (2.3682)	Entropy 0.53604 (0.53653)	Top-1 acc 69.922 (67.066)	Top-5 acc 89.062 (85.982)	lr 0.00110
Train [104][2830/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.015)	Loss 2.3212 (2.3680)	Entropy 0.53578 (0.53653)	Top-1 acc 69.531 (67.071)	Top-5 acc 86.719 (85.987)	lr 0.00110
Train [104][2840/3239]	Time 0.234 (0.512)	Data Time 0.001 (0.015)	Loss 2.2459 (2.3679)	Entropy 0.53604 (0.53653)	Top-1 acc 67.188 (67.075)	Top-5 acc 87.891 (85.987)	lr 0.00110
Train [104][2850/3239]	Time 0.227 (0.511)	Data Time 0.001 (0.015)	Loss 2.4616 (2.3680)	Entropy 0.53602 (0.53653)	Top-1 acc 63.281 (67.073)	Top-5 acc 84.766 (85.985)	lr 0.00110
Train [104][2860/3239]	Time 0.330 (0.511)	Data Time 0.001 (0.015)	Loss 2.2880 (2.3680)	Entropy 0.53639 (0.53653)	Top-1 acc 67.578 (67.073)	Top-5 acc 88.281 (85.987)	lr 0.00110
Train [104][2870/3239]	Time 0.219 (0.511)	Data Time 0.001 (0.015)	Loss 2.4127 (2.3684)	Entropy 0.53652 (0.53653)	Top-1 acc 69.141 (67.065)	Top-5 acc 84.375 (85.979)	lr 0.00110
Train [104][2880/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.015)	Loss 2.3337 (2.3685)	Entropy 0.53676 (0.53653)	Top-1 acc 68.750 (67.064)	Top-5 acc 85.156 (85.975)	lr 0.00110
Train [104][2890/3239]	Time 0.234 (0.510)	Data Time 0.002 (0.015)	Loss 2.2418 (2.3684)	Entropy 0.53674 (0.53653)	Top-1 acc 71.094 (67.067)	Top-5 acc 88.672 (85.976)	lr 0.00110
Train [104][2900/3239]	Time 0.225 (0.510)	Data Time 0.001 (0.015)	Loss 2.3748 (2.3683)	Entropy 0.53655 (0.53653)	Top-1 acc 65.234 (67.070)	Top-5 acc 85.156 (85.976)	lr 0.00109
Train [104][2910/3239]	Time 0.230 (0.509)	Data Time 0.001 (0.015)	Loss 2.4892 (2.3684)	Entropy 0.53656 (0.53653)	Top-1 acc 66.406 (67.068)	Top-5 acc 84.375 (85.974)	lr 0.00109
Train [104][2920/3239]	Time 0.382 (0.527)	Data Time 0.005 (0.015)	Loss 2.6763 (2.3683)	Entropy 0.53648 (0.53653)	Top-1 acc 58.984 (67.069)	Top-5 acc 78.906 (85.974)	lr 0.00109
Train [104][2930/3239]	Time 0.236 (0.527)	Data Time 0.002 (0.015)	Loss 2.3878 (2.3682)	Entropy 0.53682 (0.53653)	Top-1 acc 65.625 (67.065)	Top-5 acc 84.375 (85.975)	lr 0.00109
Train [104][2940/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.014)	Loss 2.3118 (2.3679)	Entropy 0.53694 (0.53653)	Top-1 acc 67.578 (67.073)	Top-5 acc 88.281 (85.979)	lr 0.00109
Train [104][2950/3239]	Time 0.326 (0.526)	Data Time 0.001 (0.014)	Loss 2.4752 (2.3680)	Entropy 0.53692 (0.53653)	Top-1 acc 64.844 (67.072)	Top-5 acc 84.766 (85.979)	lr 0.00109
Train [104][2960/3239]	Time 0.266 (0.526)	Data Time 0.001 (0.014)	Loss 2.1907 (2.3679)	Entropy 0.53710 (0.53653)	Top-1 acc 72.656 (67.075)	Top-5 acc 91.016 (85.980)	lr 0.00109
Train [104][2970/3239]	Time 0.281 (0.525)	Data Time 0.001 (0.014)	Loss 2.2523 (2.3678)	Entropy 0.53728 (0.53653)	Top-1 acc 69.141 (67.077)	Top-5 acc 89.062 (85.983)	lr 0.00109
Train [104][2980/3239]	Time 0.224 (0.525)	Data Time 0.001 (0.014)	Loss 2.5630 (2.3678)	Entropy 0.53738 (0.53654)	Top-1 acc 60.938 (67.074)	Top-5 acc 83.203 (85.985)	lr 0.00109
Train [104][2990/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.014)	Loss 2.2958 (2.3677)	Entropy 0.53754 (0.53654)	Top-1 acc 69.531 (67.078)	Top-5 acc 87.500 (85.989)	lr 0.00109
Train [104][3000/3239]	Time 0.290 (0.525)	Data Time 0.002 (0.014)	Loss 2.3340 (2.3678)	Entropy 0.53775 (0.53654)	Top-1 acc 69.922 (67.075)	Top-5 acc 89.062 (85.987)	lr 0.00109
Train [104][3010/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.014)	Loss 2.3403 (2.3679)	Entropy 0.53764 (0.53655)	Top-1 acc 66.016 (67.068)	Top-5 acc 87.500 (85.987)	lr 0.00109
Train [104][3020/3239]	Time 0.335 (0.524)	Data Time 0.001 (0.014)	Loss 2.4835 (2.3680)	Entropy 0.53762 (0.53655)	Top-1 acc 61.328 (67.063)	Top-5 acc 83.203 (85.989)	lr 0.00109
Train [104][3030/3239]	Time 0.229 (0.524)	Data Time 0.001 (0.014)	Loss 2.3886 (2.3679)	Entropy 0.53774 (0.53655)	Top-1 acc 68.750 (67.067)	Top-5 acc 87.500 (85.992)	lr 0.00109
Train [104][3040/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.014)	Loss 2.1877 (2.3677)	Entropy 0.53779 (0.53656)	Top-1 acc 71.094 (67.073)	Top-5 acc 90.234 (85.994)	lr 0.00109
Train [104][3050/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.014)	Loss 2.4569 (2.3676)	Entropy 0.53783 (0.53656)	Top-1 acc 65.234 (67.074)	Top-5 acc 85.156 (85.998)	lr 0.00109
Train [104][3060/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.014)	Loss 2.3678 (2.3675)	Entropy 0.53804 (0.53657)	Top-1 acc 66.797 (67.075)	Top-5 acc 86.719 (86.000)	lr 0.00109
Train [104][3070/3239]	Time 0.222 (0.522)	Data Time 0.001 (0.014)	Loss 2.3365 (2.3674)	Entropy 0.53789 (0.53657)	Top-1 acc 68.359 (67.078)	Top-5 acc 84.766 (86.002)	lr 0.00109
Train [104][3080/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.014)	Loss 2.3571 (2.3676)	Entropy 0.53769 (0.53658)	Top-1 acc 68.359 (67.073)	Top-5 acc 86.719 (85.998)	lr 0.00109
Train [104][3090/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.014)	Loss 2.4182 (2.3679)	Entropy 0.53762 (0.53658)	Top-1 acc 65.234 (67.065)	Top-5 acc 83.984 (85.994)	lr 0.00109
Train [104][3100/3239]	Time 0.226 (0.522)	Data Time 0.001 (0.014)	Loss 2.4887 (2.3678)	Entropy 0.53773 (0.53658)	Top-1 acc 63.672 (67.067)	Top-5 acc 84.766 (85.997)	lr 0.00109
Train [104][3110/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.014)	Loss 2.2031 (2.3676)	Entropy 0.53794 (0.53659)	Top-1 acc 71.875 (67.069)	Top-5 acc 89.062 (86.001)	lr 0.00109
Train [104][3120/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.014)	Loss 2.4167 (2.3676)	Entropy 0.53782 (0.53659)	Top-1 acc 71.094 (67.072)	Top-5 acc 87.500 (86.001)	lr 0.00109
Train [104][3130/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.014)	Loss 2.3472 (2.3676)	Entropy 0.53767 (0.53659)	Top-1 acc 65.625 (67.070)	Top-5 acc 87.500 (86.001)	lr 0.00109
Train [104][3140/3239]	Time 0.234 (0.520)	Data Time 0.001 (0.014)	Loss 2.3129 (2.3678)	Entropy 0.53768 (0.53660)	Top-1 acc 66.406 (67.063)	Top-5 acc 85.547 (85.997)	lr 0.00108
Train [104][3150/3239]	Time 0.227 (0.520)	Data Time 0.001 (0.014)	Loss 2.4444 (2.3677)	Entropy 0.53757 (0.53660)	Top-1 acc 64.062 (67.063)	Top-5 acc 84.766 (86.000)	lr 0.00108
Train [104][3160/3239]	Time 0.245 (0.520)	Data Time 0.001 (0.014)	Loss 2.2710 (2.3677)	Entropy 0.53784 (0.53660)	Top-1 acc 67.188 (67.061)	Top-5 acc 89.062 (86.002)	lr 0.00108
Train [104][3170/3239]	Time 0.259 (0.519)	Data Time 0.001 (0.014)	Loss 2.3913 (2.3677)	Entropy 0.53783 (0.53661)	Top-1 acc 64.844 (67.061)	Top-5 acc 86.719 (86.001)	lr 0.00108
Train [104][3180/3239]	Time 0.314 (0.519)	Data Time 0.000 (0.014)	Loss 2.2668 (2.3675)	Entropy 0.53771 (0.53661)	Top-1 acc 68.750 (67.066)	Top-5 acc 87.500 (86.005)	lr 0.00108
Train [104][3190/3239]	Time 0.221 (0.519)	Data Time 0.000 (0.013)	Loss 2.2662 (2.3676)	Entropy 0.53757 (0.53662)	Top-1 acc 69.141 (67.063)	Top-5 acc 87.500 (86.003)	lr 0.00108
Train [104][3200/3239]	Time 0.228 (0.518)	Data Time 0.000 (0.013)	Loss 2.3900 (2.3676)	Entropy 0.53754 (0.53662)	Top-1 acc 66.016 (67.063)	Top-5 acc 87.109 (86.004)	lr 0.00108
Train [104][3210/3239]	Time 0.242 (0.518)	Data Time 0.000 (0.013)	Loss 2.4982 (2.3677)	Entropy 0.53747 (0.53662)	Top-1 acc 64.062 (67.061)	Top-5 acc 83.203 (86.001)	lr 0.00108
Train [104][3220/3239]	Time 0.224 (0.517)	Data Time 0.000 (0.013)	Loss 2.2378 (2.3675)	Entropy 0.53775 (0.53663)	Top-1 acc 71.875 (67.068)	Top-5 acc 87.891 (86.005)	lr 0.00108
Train [104][3230/3239]	Time 0.224 (0.517)	Data Time 0.000 (0.013)	Loss 2.2747 (2.3674)	Entropy 0.53776 (0.53663)	Top-1 acc 67.578 (67.068)	Top-5 acc 87.891 (86.009)	lr 0.00108
Train [104][3239/3239]	Time 0.990 (0.517)	Data Time 0.000 (0.013)	Loss 2.1447 (2.3674)	Entropy 0.53781 (0.53663)	Top-1 acc 74.074 (67.068)	Top-5 acc 88.889 (86.009)	lr 0.00108
==========Valid [104/120]	loss 1.184	top-1 acc 72.561 (72.786)	top-5 acc 90.525	Train top-1 67.068	top-5 86.009	Entropy 0.53781	Latency-None: 0.000ms	Flops: 539.00M
Train [105][0/3239]	Time 36.015 (36.015)	Data Time 33.807 (33.807)	Loss 2.2860 (2.2860)	Entropy 0.53770 (0.53770)	Top-1 acc 68.750 (68.750)	Top-5 acc 89.062 (89.062)	lr 0.00108
Train [105][10/3239]	Time 0.347 (3.945)	Data Time 0.001 (3.229)	Loss 2.4139 (2.3471)	Entropy 0.53784 (0.53777)	Top-1 acc 66.406 (68.182)	Top-5 acc 83.984 (86.399)	lr 0.00108
Train [105][20/3239]	Time 0.235 (2.257)	Data Time 0.002 (1.692)	Loss 2.4031 (2.3855)	Entropy 0.53792 (0.53781)	Top-1 acc 64.062 (66.815)	Top-5 acc 83.594 (85.900)	lr 0.00108
Train [105][30/3239]	Time 0.226 (1.659)	Data Time 0.001 (1.147)	Loss 2.2946 (2.3956)	Entropy 0.53771 (0.53780)	Top-1 acc 70.703 (66.658)	Top-5 acc 86.328 (85.660)	lr 0.00108
Train [105][40/3239]	Time 0.226 (1.353)	Data Time 0.001 (0.867)	Loss 2.2997 (2.3924)	Entropy 0.53800 (0.53780)	Top-1 acc 66.797 (66.502)	Top-5 acc 86.719 (85.528)	lr 0.00108
Train [105][50/3239]	Time 0.224 (1.166)	Data Time 0.001 (0.698)	Loss 2.4333 (2.3948)	Entropy 0.53825 (0.53785)	Top-1 acc 67.188 (66.567)	Top-5 acc 86.719 (85.555)	lr 0.00108
Train [105][60/3239]	Time 0.233 (1.044)	Data Time 0.001 (0.583)	Loss 2.3103 (2.3838)	Entropy 0.53855 (0.53794)	Top-1 acc 68.750 (66.810)	Top-5 acc 87.891 (85.726)	lr 0.00108
Train [105][70/3239]	Time 0.227 (0.953)	Data Time 0.001 (0.501)	Loss 2.2610 (2.3861)	Entropy 0.53875 (0.53803)	Top-1 acc 68.359 (66.621)	Top-5 acc 90.234 (85.695)	lr 0.00108
Train [105][80/3239]	Time 0.313 (0.886)	Data Time 0.001 (0.440)	Loss 2.5892 (2.4005)	Entropy 0.53881 (0.53812)	Top-1 acc 64.453 (66.276)	Top-5 acc 80.859 (85.344)	lr 0.00108
Train [105][90/3239]	Time 0.232 (0.832)	Data Time 0.001 (0.392)	Loss 2.2111 (2.3911)	Entropy 0.53899 (0.53820)	Top-1 acc 75.000 (66.647)	Top-5 acc 88.672 (85.521)	lr 0.00108
Train [105][100/3239]	Time 0.228 (0.789)	Data Time 0.001 (0.353)	Loss 2.6254 (2.3907)	Entropy 0.53908 (0.53828)	Top-1 acc 61.719 (66.600)	Top-5 acc 79.688 (85.508)	lr 0.00108
Train [105][110/3239]	Time 0.236 (0.755)	Data Time 0.001 (0.321)	Loss 2.1126 (2.3912)	Entropy 0.53916 (0.53836)	Top-1 acc 70.312 (66.719)	Top-5 acc 90.625 (85.494)	lr 0.00108
Train [105][120/3239]	Time 0.238 (0.726)	Data Time 0.001 (0.295)	Loss 2.3902 (2.3922)	Entropy 0.53910 (0.53843)	Top-1 acc 66.016 (66.658)	Top-5 acc 84.766 (85.476)	lr 0.00108
Train [105][130/3239]	Time 0.223 (0.700)	Data Time 0.001 (0.272)	Loss 2.2229 (2.3926)	Entropy 0.53900 (0.53848)	Top-1 acc 72.656 (66.630)	Top-5 acc 87.891 (85.437)	lr 0.00108
Train [105][140/3239]	Time 0.235 (0.680)	Data Time 0.001 (0.253)	Loss 2.3617 (2.3900)	Entropy 0.53914 (0.53852)	Top-1 acc 67.188 (66.658)	Top-5 acc 86.719 (85.525)	lr 0.00107
Train [105][150/3239]	Time 0.232 (0.662)	Data Time 0.001 (0.237)	Loss 2.3024 (2.3878)	Entropy 0.53943 (0.53856)	Top-1 acc 70.312 (66.699)	Top-5 acc 87.891 (85.583)	lr 0.00107
Train [105][160/3239]	Time 0.225 (0.646)	Data Time 0.001 (0.222)	Loss 2.1691 (2.3847)	Entropy 0.53938 (0.53862)	Top-1 acc 73.047 (66.833)	Top-5 acc 90.625 (85.629)	lr 0.00107
Train [105][170/3239]	Time 0.231 (0.631)	Data Time 0.001 (0.209)	Loss 2.2212 (2.3794)	Entropy 0.53936 (0.53866)	Top-1 acc 69.531 (66.929)	Top-5 acc 88.672 (85.732)	lr 0.00107
Train [105][180/3239]	Time 0.248 (0.619)	Data Time 0.001 (0.198)	Loss 2.0779 (2.3790)	Entropy 0.53936 (0.53870)	Top-1 acc 74.609 (66.933)	Top-5 acc 93.359 (85.748)	lr 0.00107
Train [105][190/3239]	Time 0.227 (0.608)	Data Time 0.001 (0.187)	Loss 2.5456 (2.3787)	Entropy 0.53948 (0.53874)	Top-1 acc 63.672 (66.915)	Top-5 acc 80.469 (85.772)	lr 0.00107
Train [105][200/3239]	Time 0.285 (0.605)	Data Time 0.001 (0.178)	Loss 2.3973 (2.3753)	Entropy 0.53944 (0.53877)	Top-1 acc 66.406 (66.976)	Top-5 acc 83.203 (85.784)	lr 0.00107
Train [105][210/3239]	Time 0.231 (0.597)	Data Time 0.001 (0.170)	Loss 2.2338 (2.3719)	Entropy 0.53972 (0.53881)	Top-1 acc 69.922 (67.071)	Top-5 acc 88.281 (85.852)	lr 0.00107
Train [105][220/3239]	Time 0.265 (0.588)	Data Time 0.001 (0.162)	Loss 2.2863 (2.3738)	Entropy 0.53937 (0.53884)	Top-1 acc 66.797 (67.009)	Top-5 acc 88.672 (85.837)	lr 0.00107
Train [105][230/3239]	Time 0.240 (0.581)	Data Time 0.001 (0.155)	Loss 2.3267 (2.3764)	Entropy 0.53995 (0.53887)	Top-1 acc 67.188 (66.961)	Top-5 acc 86.328 (85.797)	lr 0.00107
Train [105][240/3239]	Time 0.331 (0.574)	Data Time 0.001 (0.149)	Loss 2.3540 (2.3782)	Entropy 0.53987 (0.53892)	Top-1 acc 68.750 (66.909)	Top-5 acc 86.328 (85.764)	lr 0.00107
Train [105][250/3239]	Time 0.256 (0.567)	Data Time 0.002 (0.143)	Loss 2.3379 (2.3800)	Entropy 0.54006 (0.53896)	Top-1 acc 68.359 (66.853)	Top-5 acc 86.719 (85.709)	lr 0.00107
Train [105][260/3239]	Time 0.226 (0.561)	Data Time 0.001 (0.138)	Loss 2.3539 (2.3833)	Entropy 0.53969 (0.53899)	Top-1 acc 66.406 (66.767)	Top-5 acc 88.281 (85.650)	lr 0.00107
Train [105][270/3239]	Time 0.216 (0.555)	Data Time 0.001 (0.132)	Loss 2.5401 (2.3834)	Entropy 0.53990 (0.53902)	Top-1 acc 63.281 (66.784)	Top-5 acc 81.641 (85.651)	lr 0.00107
Train [105][280/3239]	Time 0.239 (0.550)	Data Time 0.001 (0.128)	Loss 2.4891 (2.3841)	Entropy 0.53991 (0.53905)	Top-1 acc 64.062 (66.783)	Top-5 acc 83.203 (85.647)	lr 0.00107
Train [105][290/3239]	Time 0.226 (0.545)	Data Time 0.001 (0.123)	Loss 2.1216 (2.3799)	Entropy 0.53997 (0.53907)	Top-1 acc 73.828 (66.863)	Top-5 acc 91.016 (85.725)	lr 0.00107
Train [105][300/3239]	Time 0.224 (0.541)	Data Time 0.001 (0.119)	Loss 2.2174 (2.3768)	Entropy 0.53985 (0.53910)	Top-1 acc 72.656 (66.959)	Top-5 acc 88.672 (85.774)	lr 0.00107
Train [105][310/3239]	Time 0.326 (0.536)	Data Time 0.001 (0.116)	Loss 2.2311 (2.3753)	Entropy 0.54025 (0.53913)	Top-1 acc 67.578 (67.008)	Top-5 acc 87.109 (85.782)	lr 0.00107
Train [105][320/3239]	Time 0.230 (0.532)	Data Time 0.001 (0.112)	Loss 2.4938 (2.3767)	Entropy 0.54014 (0.53916)	Top-1 acc 64.844 (66.992)	Top-5 acc 84.766 (85.738)	lr 0.00107
Train [105][330/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.109)	Loss 2.5949 (2.3768)	Entropy 0.54001 (0.53919)	Top-1 acc 59.766 (66.983)	Top-5 acc 82.422 (85.759)	lr 0.00107
Train [105][340/3239]	Time 0.285 (0.681)	Data Time 0.003 (0.106)	Loss 2.3931 (2.3778)	Entropy 0.53990 (0.53921)	Top-1 acc 67.578 (66.982)	Top-5 acc 86.719 (85.742)	lr 0.00107
Train [105][350/3239]	Time 0.228 (0.674)	Data Time 0.002 (0.103)	Loss 2.1686 (2.3786)	Entropy 0.54013 (0.53923)	Top-1 acc 72.266 (66.954)	Top-5 acc 87.891 (85.716)	lr 0.00107
Train [105][360/3239]	Time 0.229 (0.667)	Data Time 0.001 (0.100)	Loss 2.2110 (2.3757)	Entropy 0.53996 (0.53926)	Top-1 acc 71.094 (67.005)	Top-5 acc 87.109 (85.764)	lr 0.00107
Train [105][370/3239]	Time 0.242 (0.660)	Data Time 0.001 (0.097)	Loss 2.4435 (2.3758)	Entropy 0.54015 (0.53928)	Top-1 acc 65.234 (67.014)	Top-5 acc 81.250 (85.737)	lr 0.00107
Train [105][380/3239]	Time 0.236 (0.654)	Data Time 0.001 (0.095)	Loss 2.5412 (2.3771)	Entropy 0.54014 (0.53930)	Top-1 acc 62.500 (66.975)	Top-5 acc 84.766 (85.726)	lr 0.00107
Train [105][390/3239]	Time 0.232 (0.647)	Data Time 0.001 (0.092)	Loss 2.2308 (2.3768)	Entropy 0.54069 (0.53933)	Top-1 acc 67.969 (66.950)	Top-5 acc 88.672 (85.743)	lr 0.00106
Train [105][400/3239]	Time 0.479 (0.642)	Data Time 0.003 (0.090)	Loss 2.4554 (2.3768)	Entropy 0.54071 (0.53936)	Top-1 acc 66.797 (66.961)	Top-5 acc 84.375 (85.751)	lr 0.00106
Train [105][410/3239]	Time 0.235 (0.639)	Data Time 0.001 (0.088)	Loss 2.2461 (2.3758)	Entropy 0.54065 (0.53939)	Top-1 acc 69.922 (66.979)	Top-5 acc 87.500 (85.754)	lr 0.00106
Train [105][420/3239]	Time 0.215 (0.634)	Data Time 0.001 (0.086)	Loss 2.9519 (2.3761)	Entropy 0.54077 (0.53942)	Top-1 acc 53.516 (66.973)	Top-5 acc 77.734 (85.762)	lr 0.00106
Train [105][430/3239]	Time 0.242 (0.629)	Data Time 0.001 (0.084)	Loss 2.3574 (2.3764)	Entropy 0.54074 (0.53945)	Top-1 acc 66.797 (66.978)	Top-5 acc 83.594 (85.747)	lr 0.00106
Train [105][440/3239]	Time 0.247 (0.624)	Data Time 0.001 (0.082)	Loss 2.2479 (2.3759)	Entropy 0.54089 (0.53948)	Top-1 acc 74.219 (66.994)	Top-5 acc 88.672 (85.757)	lr 0.00106
Train [105][450/3239]	Time 0.238 (0.619)	Data Time 0.001 (0.080)	Loss 2.3945 (2.3765)	Entropy 0.54081 (0.53952)	Top-1 acc 64.453 (66.980)	Top-5 acc 84.766 (85.743)	lr 0.00106
Train [105][460/3239]	Time 0.276 (0.615)	Data Time 0.001 (0.079)	Loss 2.4235 (2.3765)	Entropy 0.54118 (0.53954)	Top-1 acc 67.578 (66.968)	Top-5 acc 87.109 (85.749)	lr 0.00106
Train [105][470/3239]	Time 0.315 (0.611)	Data Time 0.001 (0.077)	Loss 2.1366 (2.3759)	Entropy 0.54137 (0.53958)	Top-1 acc 69.531 (66.980)	Top-5 acc 89.844 (85.765)	lr 0.00106
Train [105][480/3239]	Time 0.225 (0.607)	Data Time 0.001 (0.075)	Loss 2.5173 (2.3753)	Entropy 0.54149 (0.53962)	Top-1 acc 67.188 (67.007)	Top-5 acc 83.203 (85.766)	lr 0.00106
Train [105][490/3239]	Time 0.220 (0.603)	Data Time 0.001 (0.074)	Loss 2.3477 (2.3746)	Entropy 0.54158 (0.53966)	Top-1 acc 66.797 (67.013)	Top-5 acc 86.719 (85.769)	lr 0.00106
Train [105][500/3239]	Time 0.283 (0.599)	Data Time 0.001 (0.073)	Loss 2.2075 (2.3744)	Entropy 0.54122 (0.53969)	Top-1 acc 69.141 (67.025)	Top-5 acc 88.672 (85.785)	lr 0.00106
Train [105][510/3239]	Time 0.272 (0.596)	Data Time 0.001 (0.071)	Loss 2.3042 (2.3740)	Entropy 0.54099 (0.53972)	Top-1 acc 67.969 (67.024)	Top-5 acc 85.938 (85.798)	lr 0.00106
Train [105][520/3239]	Time 0.226 (0.592)	Data Time 0.001 (0.070)	Loss 2.2871 (2.3746)	Entropy 0.54103 (0.53975)	Top-1 acc 68.750 (67.014)	Top-5 acc 86.328 (85.791)	lr 0.00106
Train [105][530/3239]	Time 0.223 (0.589)	Data Time 0.001 (0.069)	Loss 2.3758 (2.3745)	Entropy 0.54081 (0.53977)	Top-1 acc 67.188 (67.011)	Top-5 acc 86.328 (85.796)	lr 0.00106
Train [105][540/3239]	Time 0.243 (0.586)	Data Time 0.001 (0.067)	Loss 2.3822 (2.3751)	Entropy 0.54075 (0.53979)	Top-1 acc 69.141 (67.015)	Top-5 acc 85.547 (85.792)	lr 0.00106
Train [105][550/3239]	Time 0.234 (0.583)	Data Time 0.001 (0.066)	Loss 2.2920 (2.3745)	Entropy 0.54076 (0.53980)	Top-1 acc 69.531 (67.041)	Top-5 acc 83.984 (85.795)	lr 0.00106
Train [105][560/3239]	Time 0.329 (0.579)	Data Time 0.001 (0.065)	Loss 2.3296 (2.3743)	Entropy 0.54038 (0.53982)	Top-1 acc 68.750 (67.036)	Top-5 acc 87.891 (85.797)	lr 0.00106
Train [105][570/3239]	Time 0.230 (0.576)	Data Time 0.001 (0.064)	Loss 2.2846 (2.3724)	Entropy 0.53969 (0.53982)	Top-1 acc 69.531 (67.083)	Top-5 acc 86.328 (85.828)	lr 0.00106
Train [105][580/3239]	Time 0.230 (0.573)	Data Time 0.001 (0.063)	Loss 2.4499 (2.3721)	Entropy 0.53991 (0.53982)	Top-1 acc 62.891 (67.097)	Top-5 acc 85.156 (85.843)	lr 0.00106
Train [105][590/3239]	Time 0.227 (0.571)	Data Time 0.001 (0.062)	Loss 2.4084 (2.3710)	Entropy 0.53995 (0.53982)	Top-1 acc 66.016 (67.135)	Top-5 acc 85.547 (85.872)	lr 0.00106
Train [105][600/3239]	Time 0.233 (0.568)	Data Time 0.001 (0.061)	Loss 2.2588 (2.3709)	Entropy 0.54008 (0.53983)	Top-1 acc 66.797 (67.136)	Top-5 acc 89.844 (85.869)	lr 0.00106
Train [105][610/3239]	Time 0.229 (0.565)	Data Time 0.001 (0.060)	Loss 2.2705 (2.3723)	Entropy 0.53996 (0.53983)	Top-1 acc 67.188 (67.081)	Top-5 acc 87.500 (85.849)	lr 0.00106
Train [105][620/3239]	Time 0.241 (0.563)	Data Time 0.001 (0.059)	Loss 2.1626 (2.3717)	Entropy 0.54033 (0.53983)	Top-1 acc 72.266 (67.094)	Top-5 acc 90.234 (85.861)	lr 0.00106
Train [105][630/3239]	Time 0.357 (0.561)	Data Time 0.001 (0.058)	Loss 2.3612 (2.3705)	Entropy 0.54040 (0.53984)	Top-1 acc 67.969 (67.122)	Top-5 acc 86.328 (85.881)	lr 0.00105
Train [105][640/3239]	Time 0.223 (0.559)	Data Time 0.001 (0.057)	Loss 2.4053 (2.3703)	Entropy 0.54037 (0.53985)	Top-1 acc 69.141 (67.131)	Top-5 acc 83.203 (85.892)	lr 0.00105
Train [105][650/3239]	Time 0.235 (0.556)	Data Time 0.001 (0.056)	Loss 2.2649 (2.3698)	Entropy 0.54054 (0.53986)	Top-1 acc 69.141 (67.146)	Top-5 acc 86.719 (85.891)	lr 0.00105
Train [105][660/3239]	Time 0.229 (0.554)	Data Time 0.001 (0.055)	Loss 3.1064 (2.3709)	Entropy 0.54047 (0.53987)	Top-1 acc 50.000 (67.096)	Top-5 acc 71.875 (85.863)	lr 0.00105
Train [105][670/3239]	Time 0.234 (0.552)	Data Time 0.001 (0.055)	Loss 2.3822 (2.3704)	Entropy 0.54023 (0.53988)	Top-1 acc 67.188 (67.114)	Top-5 acc 83.594 (85.866)	lr 0.00105
Train [105][680/3239]	Time 0.232 (0.550)	Data Time 0.001 (0.054)	Loss 2.3815 (2.3692)	Entropy 0.54001 (0.53988)	Top-1 acc 68.359 (67.141)	Top-5 acc 84.375 (85.879)	lr 0.00105
Train [105][690/3239]	Time 0.235 (0.548)	Data Time 0.001 (0.053)	Loss 2.3757 (2.3684)	Entropy 0.54026 (0.53989)	Top-1 acc 64.453 (67.152)	Top-5 acc 86.328 (85.896)	lr 0.00105
Train [105][700/3239]	Time 0.245 (0.546)	Data Time 0.001 (0.052)	Loss 2.4681 (2.3683)	Entropy 0.53995 (0.53989)	Top-1 acc 65.234 (67.145)	Top-5 acc 85.156 (85.899)	lr 0.00105
Train [105][710/3239]	Time 0.224 (0.544)	Data Time 0.001 (0.052)	Loss 2.6282 (2.3699)	Entropy 0.54016 (0.53989)	Top-1 acc 60.938 (67.107)	Top-5 acc 80.859 (85.874)	lr 0.00105
Train [105][720/3239]	Time 0.359 (0.543)	Data Time 0.001 (0.051)	Loss 2.5196 (2.3688)	Entropy 0.54008 (0.53989)	Top-1 acc 63.672 (67.145)	Top-5 acc 83.984 (85.894)	lr 0.00105
Train [105][730/3239]	Time 0.279 (0.543)	Data Time 0.001 (0.050)	Loss 2.2522 (2.3681)	Entropy 0.54012 (0.53990)	Top-1 acc 69.531 (67.163)	Top-5 acc 91.406 (85.901)	lr 0.00105
Train [105][740/3239]	Time 0.222 (0.541)	Data Time 0.001 (0.050)	Loss 2.3431 (2.3678)	Entropy 0.54070 (0.53990)	Top-1 acc 71.875 (67.173)	Top-5 acc 85.547 (85.901)	lr 0.00105
Train [105][750/3239]	Time 0.236 (0.539)	Data Time 0.001 (0.049)	Loss 2.2760 (2.3679)	Entropy 0.54104 (0.53991)	Top-1 acc 66.016 (67.167)	Top-5 acc 86.328 (85.897)	lr 0.00105
Train [105][760/3239]	Time 0.230 (0.538)	Data Time 0.001 (0.048)	Loss 2.5170 (2.3700)	Entropy 0.54110 (0.53993)	Top-1 acc 64.453 (67.120)	Top-5 acc 82.031 (85.863)	lr 0.00105
Train [105][770/3239]	Time 0.236 (0.536)	Data Time 0.001 (0.048)	Loss 2.3832 (2.3698)	Entropy 0.54104 (0.53994)	Top-1 acc 67.578 (67.123)	Top-5 acc 87.109 (85.867)	lr 0.00105
Train [105][780/3239]	Time 0.235 (0.534)	Data Time 0.001 (0.047)	Loss 2.3624 (2.3700)	Entropy 0.54108 (0.53996)	Top-1 acc 67.969 (67.121)	Top-5 acc 83.984 (85.852)	lr 0.00105
Train [105][790/3239]	Time 0.325 (0.533)	Data Time 0.002 (0.047)	Loss 2.1833 (2.3708)	Entropy 0.54152 (0.53997)	Top-1 acc 70.703 (67.101)	Top-5 acc 89.844 (85.841)	lr 0.00105
Train [105][800/3239]	Time 0.225 (0.531)	Data Time 0.001 (0.046)	Loss 2.2554 (2.3706)	Entropy 0.54147 (0.53999)	Top-1 acc 68.359 (67.102)	Top-5 acc 88.672 (85.855)	lr 0.00105
Train [105][810/3239]	Time 0.220 (0.529)	Data Time 0.001 (0.045)	Loss 2.3748 (2.3702)	Entropy 0.54119 (0.54001)	Top-1 acc 65.625 (67.112)	Top-5 acc 86.328 (85.869)	lr 0.00105
Train [105][820/3239]	Time 0.222 (0.528)	Data Time 0.001 (0.045)	Loss 2.5651 (2.3699)	Entropy 0.54118 (0.54002)	Top-1 acc 59.766 (67.126)	Top-5 acc 81.641 (85.870)	lr 0.00105
Train [105][830/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.044)	Loss 2.2508 (2.3695)	Entropy 0.54094 (0.54004)	Top-1 acc 72.656 (67.138)	Top-5 acc 88.672 (85.886)	lr 0.00105
Train [105][840/3239]	Time 0.226 (0.525)	Data Time 0.001 (0.044)	Loss 2.4232 (2.3698)	Entropy 0.54115 (0.54005)	Top-1 acc 64.062 (67.131)	Top-5 acc 86.328 (85.880)	lr 0.00105
Train [105][850/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.043)	Loss 2.3467 (2.3699)	Entropy 0.54112 (0.54006)	Top-1 acc 67.578 (67.137)	Top-5 acc 86.719 (85.879)	lr 0.00105
Train [105][860/3239]	Time 0.323 (0.522)	Data Time 0.001 (0.043)	Loss 2.4764 (2.3697)	Entropy 0.54117 (0.54007)	Top-1 acc 67.578 (67.146)	Top-5 acc 83.594 (85.880)	lr 0.00105
Train [105][870/3239]	Time 0.231 (0.521)	Data Time 0.001 (0.042)	Loss 2.3585 (2.3699)	Entropy 0.54083 (0.54009)	Top-1 acc 64.844 (67.144)	Top-5 acc 87.891 (85.886)	lr 0.00105
Train [105][880/3239]	Time 0.231 (0.519)	Data Time 0.001 (0.042)	Loss 2.2389 (2.3693)	Entropy 0.54066 (0.54009)	Top-1 acc 71.484 (67.166)	Top-5 acc 87.109 (85.894)	lr 0.00104
Train [105][890/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.042)	Loss 2.4019 (2.3689)	Entropy 0.54105 (0.54010)	Top-1 acc 66.406 (67.172)	Top-5 acc 83.594 (85.896)	lr 0.00104
Train [105][900/3239]	Time 0.236 (0.517)	Data Time 0.001 (0.041)	Loss 2.3724 (2.3694)	Entropy 0.54101 (0.54011)	Top-1 acc 63.672 (67.154)	Top-5 acc 85.547 (85.884)	lr 0.00104
Train [105][910/3239]	Time 0.246 (0.516)	Data Time 0.017 (0.041)	Loss 2.3078 (2.3689)	Entropy 0.54107 (0.54012)	Top-1 acc 67.578 (67.170)	Top-5 acc 87.109 (85.890)	lr 0.00104
Train [105][920/3239]	Time 0.227 (0.514)	Data Time 0.001 (0.040)	Loss 2.4079 (2.3686)	Entropy 0.54105 (0.54013)	Top-1 acc 71.484 (67.181)	Top-5 acc 87.109 (85.896)	lr 0.00104
Train [105][930/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.040)	Loss 2.3867 (2.3676)	Entropy 0.54056 (0.54014)	Top-1 acc 66.797 (67.206)	Top-5 acc 84.766 (85.911)	lr 0.00104
Train [105][940/3239]	Time 0.233 (0.512)	Data Time 0.001 (0.039)	Loss 2.2961 (2.3675)	Entropy 0.54074 (0.54014)	Top-1 acc 63.672 (67.198)	Top-5 acc 86.719 (85.916)	lr 0.00104
Train [105][950/3239]	Time 0.328 (0.511)	Data Time 0.002 (0.039)	Loss 2.2968 (2.3663)	Entropy 0.54099 (0.54015)	Top-1 acc 67.188 (67.225)	Top-5 acc 86.328 (85.932)	lr 0.00104
Train [105][960/3239]	Time 0.232 (0.510)	Data Time 0.001 (0.039)	Loss 2.2676 (2.3657)	Entropy 0.54082 (0.54016)	Top-1 acc 71.484 (67.233)	Top-5 acc 86.328 (85.946)	lr 0.00104
Train [105][970/3239]	Time 0.230 (0.509)	Data Time 0.001 (0.038)	Loss 2.2733 (2.3660)	Entropy 0.54065 (0.54016)	Top-1 acc 70.703 (67.224)	Top-5 acc 87.891 (85.933)	lr 0.00104
Train [105][980/3239]	Time 0.224 (0.508)	Data Time 0.001 (0.038)	Loss 2.4772 (2.3655)	Entropy 0.54078 (0.54017)	Top-1 acc 66.797 (67.246)	Top-5 acc 85.156 (85.942)	lr 0.00104
Train [105][990/3239]	Time 0.404 (0.561)	Data Time 0.006 (0.037)	Loss 2.3611 (2.3657)	Entropy 0.54072 (0.54017)	Top-1 acc 67.969 (67.245)	Top-5 acc 85.547 (85.942)	lr 0.00104
Train [105][1000/3239]	Time 0.270 (0.561)	Data Time 0.003 (0.037)	Loss 2.1899 (2.3651)	Entropy 0.54095 (0.54018)	Top-1 acc 72.266 (67.264)	Top-5 acc 90.625 (85.947)	lr 0.00104
Train [105][1010/3239]	Time 0.224 (0.559)	Data Time 0.002 (0.037)	Loss 2.4337 (2.3655)	Entropy 0.54089 (0.54019)	Top-1 acc 67.188 (67.248)	Top-5 acc 85.547 (85.942)	lr 0.00104
Train [105][1020/3239]	Time 0.326 (0.558)	Data Time 0.001 (0.036)	Loss 2.1842 (2.3653)	Entropy 0.54075 (0.54019)	Top-1 acc 69.531 (67.240)	Top-5 acc 90.234 (85.949)	lr 0.00104
Train [105][1030/3239]	Time 0.227 (0.556)	Data Time 0.001 (0.036)	Loss 2.5153 (2.3654)	Entropy 0.54107 (0.54020)	Top-1 acc 64.062 (67.239)	Top-5 acc 83.203 (85.950)	lr 0.00104
Train [105][1040/3239]	Time 0.223 (0.555)	Data Time 0.001 (0.036)	Loss 2.3977 (2.3654)	Entropy 0.54113 (0.54021)	Top-1 acc 64.453 (67.231)	Top-5 acc 84.766 (85.945)	lr 0.00104
Train [105][1050/3239]	Time 0.227 (0.554)	Data Time 0.001 (0.035)	Loss 2.4729 (2.3653)	Entropy 0.54076 (0.54022)	Top-1 acc 64.844 (67.232)	Top-5 acc 83.594 (85.949)	lr 0.00104
Train [105][1060/3239]	Time 0.231 (0.552)	Data Time 0.001 (0.035)	Loss 2.2924 (2.3659)	Entropy 0.54092 (0.54022)	Top-1 acc 65.625 (67.215)	Top-5 acc 86.719 (85.937)	lr 0.00104
Train [105][1070/3239]	Time 0.235 (0.551)	Data Time 0.002 (0.035)	Loss 2.1079 (2.3661)	Entropy 0.54071 (0.54023)	Top-1 acc 74.219 (67.215)	Top-5 acc 91.406 (85.933)	lr 0.00104
Train [105][1080/3239]	Time 0.259 (0.550)	Data Time 0.001 (0.035)	Loss 2.4797 (2.3666)	Entropy 0.54082 (0.54023)	Top-1 acc 66.406 (67.209)	Top-5 acc 84.375 (85.923)	lr 0.00104
Train [105][1090/3239]	Time 0.253 (0.549)	Data Time 0.001 (0.034)	Loss 2.2156 (2.3671)	Entropy 0.54078 (0.54024)	Top-1 acc 69.922 (67.198)	Top-5 acc 87.109 (85.909)	lr 0.00104
Train [105][1100/3239]	Time 0.245 (0.548)	Data Time 0.001 (0.034)	Loss 2.7763 (2.3674)	Entropy 0.54104 (0.54024)	Top-1 acc 55.859 (67.193)	Top-5 acc 79.297 (85.906)	lr 0.00104
Train [105][1110/3239]	Time 0.368 (0.546)	Data Time 0.001 (0.034)	Loss 2.2645 (2.3671)	Entropy 0.54099 (0.54025)	Top-1 acc 68.750 (67.200)	Top-5 acc 89.453 (85.915)	lr 0.00104
Train [105][1120/3239]	Time 0.240 (0.545)	Data Time 0.001 (0.033)	Loss 2.4427 (2.3663)	Entropy 0.54066 (0.54026)	Top-1 acc 66.406 (67.228)	Top-5 acc 84.766 (85.929)	lr 0.00104
Train [105][1130/3239]	Time 0.281 (0.545)	Data Time 0.001 (0.033)	Loss 2.2233 (2.3656)	Entropy 0.54089 (0.54026)	Top-1 acc 71.094 (67.246)	Top-5 acc 89.453 (85.941)	lr 0.00103
Train [105][1140/3239]	Time 0.268 (0.544)	Data Time 0.002 (0.033)	Loss 2.4873 (2.3656)	Entropy 0.54035 (0.54026)	Top-1 acc 65.625 (67.237)	Top-5 acc 85.938 (85.946)	lr 0.00103
Train [105][1150/3239]	Time 0.251 (0.543)	Data Time 0.001 (0.033)	Loss 2.0540 (2.3656)	Entropy 0.54026 (0.54026)	Top-1 acc 71.484 (67.234)	Top-5 acc 93.750 (85.946)	lr 0.00103
Train [105][1160/3239]	Time 0.295 (0.542)	Data Time 0.001 (0.032)	Loss 2.4755 (2.3655)	Entropy 0.54049 (0.54026)	Top-1 acc 65.234 (67.240)	Top-5 acc 82.031 (85.950)	lr 0.00103
Train [105][1170/3239]	Time 0.230 (0.541)	Data Time 0.001 (0.032)	Loss 2.4401 (2.3656)	Entropy 0.54017 (0.54027)	Top-1 acc 64.453 (67.236)	Top-5 acc 86.719 (85.947)	lr 0.00103
Train [105][1180/3239]	Time 0.339 (0.540)	Data Time 0.001 (0.032)	Loss 2.2140 (2.3657)	Entropy 0.54044 (0.54026)	Top-1 acc 69.141 (67.237)	Top-5 acc 87.500 (85.948)	lr 0.00103
Train [105][1190/3239]	Time 0.247 (0.539)	Data Time 0.001 (0.032)	Loss 2.4799 (2.3662)	Entropy 0.54011 (0.54027)	Top-1 acc 64.062 (67.218)	Top-5 acc 83.203 (85.937)	lr 0.00103
Train [105][1200/3239]	Time 0.229 (0.538)	Data Time 0.003 (0.031)	Loss 2.6837 (2.3664)	Entropy 0.53988 (0.54026)	Top-1 acc 60.938 (67.215)	Top-5 acc 79.297 (85.933)	lr 0.00103
Train [105][1210/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.031)	Loss 2.1143 (2.3665)	Entropy 0.54011 (0.54026)	Top-1 acc 73.828 (67.211)	Top-5 acc 91.797 (85.941)	lr 0.00103
Train [105][1220/3239]	Time 0.224 (0.536)	Data Time 0.001 (0.031)	Loss 2.5191 (2.3666)	Entropy 0.54019 (0.54026)	Top-1 acc 65.625 (67.201)	Top-5 acc 82.031 (85.938)	lr 0.00103
Train [105][1230/3239]	Time 0.258 (0.535)	Data Time 0.001 (0.031)	Loss 2.4837 (2.3671)	Entropy 0.54032 (0.54026)	Top-1 acc 64.453 (67.191)	Top-5 acc 84.375 (85.934)	lr 0.00103
Train [105][1240/3239]	Time 0.252 (0.534)	Data Time 0.002 (0.030)	Loss 2.1584 (2.3665)	Entropy 0.54016 (0.54026)	Top-1 acc 75.391 (67.204)	Top-5 acc 87.500 (85.942)	lr 0.00103
Train [105][1250/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.030)	Loss 2.3937 (2.3667)	Entropy 0.54003 (0.54026)	Top-1 acc 68.750 (67.196)	Top-5 acc 88.281 (85.943)	lr 0.00103
Train [105][1260/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.030)	Loss 2.3795 (2.3666)	Entropy 0.54011 (0.54026)	Top-1 acc 67.188 (67.195)	Top-5 acc 84.375 (85.942)	lr 0.00103
Train [105][1270/3239]	Time 0.384 (0.532)	Data Time 0.001 (0.030)	Loss 2.2993 (2.3661)	Entropy 0.54023 (0.54026)	Top-1 acc 68.750 (67.204)	Top-5 acc 84.766 (85.957)	lr 0.00103
Train [105][1280/3239]	Time 0.243 (0.531)	Data Time 0.001 (0.029)	Loss 2.1065 (2.3660)	Entropy 0.54000 (0.54025)	Top-1 acc 74.219 (67.214)	Top-5 acc 89.844 (85.956)	lr 0.00103
Train [105][1290/3239]	Time 0.266 (0.530)	Data Time 0.001 (0.029)	Loss 2.4743 (2.3660)	Entropy 0.54017 (0.54025)	Top-1 acc 61.328 (67.204)	Top-5 acc 85.547 (85.961)	lr 0.00103
Train [105][1300/3239]	Time 0.287 (0.530)	Data Time 0.003 (0.029)	Loss 2.3592 (2.3658)	Entropy 0.54036 (0.54025)	Top-1 acc 67.578 (67.218)	Top-5 acc 85.938 (85.962)	lr 0.00103
Train [105][1310/3239]	Time 0.239 (0.530)	Data Time 0.001 (0.029)	Loss 2.3150 (2.3655)	Entropy 0.54033 (0.54025)	Top-1 acc 69.922 (67.227)	Top-5 acc 85.156 (85.966)	lr 0.00103
Train [105][1320/3239]	Time 0.258 (0.529)	Data Time 0.001 (0.029)	Loss 2.4904 (2.3654)	Entropy 0.54061 (0.54025)	Top-1 acc 64.062 (67.228)	Top-5 acc 84.766 (85.970)	lr 0.00103
Train [105][1330/3239]	Time 0.238 (0.528)	Data Time 0.001 (0.028)	Loss 2.3387 (2.3651)	Entropy 0.54070 (0.54026)	Top-1 acc 68.750 (67.237)	Top-5 acc 87.109 (85.972)	lr 0.00103
Train [105][1340/3239]	Time 0.378 (0.528)	Data Time 0.001 (0.028)	Loss 2.2510 (2.3650)	Entropy 0.54089 (0.54026)	Top-1 acc 71.094 (67.245)	Top-5 acc 88.281 (85.973)	lr 0.00103
Train [105][1350/3239]	Time 0.244 (0.527)	Data Time 0.001 (0.028)	Loss 2.3933 (2.3650)	Entropy 0.54050 (0.54027)	Top-1 acc 67.969 (67.246)	Top-5 acc 85.547 (85.972)	lr 0.00103
Train [105][1360/3239]	Time 0.235 (0.526)	Data Time 0.001 (0.028)	Loss 2.1524 (2.3647)	Entropy 0.54045 (0.54027)	Top-1 acc 69.531 (67.249)	Top-5 acc 90.625 (85.974)	lr 0.00103
Train [105][1370/3239]	Time 0.238 (0.526)	Data Time 0.001 (0.028)	Loss 2.3543 (2.3653)	Entropy 0.54031 (0.54027)	Top-1 acc 64.844 (67.239)	Top-5 acc 84.766 (85.959)	lr 0.00103
Train [105][1380/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.027)	Loss 2.4469 (2.3649)	Entropy 0.54038 (0.54027)	Top-1 acc 64.844 (67.246)	Top-5 acc 85.156 (85.966)	lr 0.00102
Train [105][1390/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.027)	Loss 2.3269 (2.3653)	Entropy 0.54060 (0.54027)	Top-1 acc 68.750 (67.241)	Top-5 acc 85.547 (85.961)	lr 0.00102
Train [105][1400/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.027)	Loss 2.3356 (2.3652)	Entropy 0.54074 (0.54027)	Top-1 acc 71.094 (67.248)	Top-5 acc 87.891 (85.964)	lr 0.00102
Train [105][1410/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.027)	Loss 2.2749 (2.3651)	Entropy 0.54075 (0.54027)	Top-1 acc 70.312 (67.246)	Top-5 acc 87.109 (85.971)	lr 0.00102
Train [105][1420/3239]	Time 0.235 (0.522)	Data Time 0.001 (0.027)	Loss 2.3926 (2.3648)	Entropy 0.54053 (0.54028)	Top-1 acc 68.359 (67.255)	Top-5 acc 85.938 (85.974)	lr 0.00102
Train [105][1430/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.027)	Loss 2.3594 (2.3644)	Entropy 0.54046 (0.54028)	Top-1 acc 74.609 (67.265)	Top-5 acc 85.156 (85.980)	lr 0.00102
Train [105][1440/3239]	Time 0.225 (0.520)	Data Time 0.001 (0.026)	Loss 2.1797 (2.3640)	Entropy 0.54075 (0.54028)	Top-1 acc 67.578 (67.267)	Top-5 acc 91.797 (85.988)	lr 0.00102
Train [105][1450/3239]	Time 0.243 (0.520)	Data Time 0.001 (0.026)	Loss 2.3260 (2.3635)	Entropy 0.54081 (0.54028)	Top-1 acc 66.797 (67.278)	Top-5 acc 87.891 (85.999)	lr 0.00102
Train [105][1460/3239]	Time 0.230 (0.519)	Data Time 0.001 (0.026)	Loss 2.3732 (2.3633)	Entropy 0.54067 (0.54029)	Top-1 acc 66.406 (67.276)	Top-5 acc 85.156 (86.001)	lr 0.00102
Train [105][1470/3239]	Time 0.248 (0.518)	Data Time 0.002 (0.026)	Loss 2.4504 (2.3632)	Entropy 0.54082 (0.54029)	Top-1 acc 65.234 (67.276)	Top-5 acc 83.594 (86.000)	lr 0.00102
Train [105][1480/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.026)	Loss 2.2183 (2.3632)	Entropy 0.54057 (0.54029)	Top-1 acc 69.141 (67.277)	Top-5 acc 89.062 (86.003)	lr 0.00102
Train [105][1490/3239]	Time 0.227 (0.517)	Data Time 0.001 (0.026)	Loss 2.2523 (2.3633)	Entropy 0.54069 (0.54030)	Top-1 acc 72.656 (67.274)	Top-5 acc 87.109 (86.003)	lr 0.00102
Train [105][1500/3239]	Time 0.353 (0.516)	Data Time 0.001 (0.025)	Loss 2.2752 (2.3631)	Entropy 0.54069 (0.54030)	Top-1 acc 68.750 (67.282)	Top-5 acc 87.891 (86.007)	lr 0.00102
Train [105][1510/3239]	Time 0.263 (0.515)	Data Time 0.002 (0.025)	Loss 2.6343 (2.3632)	Entropy 0.54032 (0.54030)	Top-1 acc 63.672 (67.278)	Top-5 acc 82.422 (86.009)	lr 0.00102
Train [105][1520/3239]	Time 0.226 (0.514)	Data Time 0.001 (0.025)	Loss 2.2902 (2.3629)	Entropy 0.54018 (0.54030)	Top-1 acc 71.875 (67.290)	Top-5 acc 87.891 (86.008)	lr 0.00102
Train [105][1530/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.025)	Loss 2.4214 (2.3635)	Entropy 0.54018 (0.54030)	Top-1 acc 67.969 (67.280)	Top-5 acc 85.547 (85.995)	lr 0.00102
Train [105][1540/3239]	Time 0.240 (0.513)	Data Time 0.001 (0.025)	Loss 2.3671 (2.3635)	Entropy 0.54023 (0.54030)	Top-1 acc 67.188 (67.281)	Top-5 acc 85.547 (85.996)	lr 0.00102
Train [105][1550/3239]	Time 0.265 (0.513)	Data Time 0.001 (0.025)	Loss 2.3711 (2.3640)	Entropy 0.54044 (0.54030)	Top-1 acc 64.844 (67.262)	Top-5 acc 87.891 (85.995)	lr 0.00102
Train [105][1560/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.024)	Loss 2.2405 (2.3644)	Entropy 0.54063 (0.54030)	Top-1 acc 69.141 (67.252)	Top-5 acc 87.500 (85.988)	lr 0.00102
Train [105][1570/3239]	Time 0.335 (0.511)	Data Time 0.001 (0.024)	Loss 2.4235 (2.3642)	Entropy 0.54029 (0.54030)	Top-1 acc 64.453 (67.260)	Top-5 acc 84.766 (85.988)	lr 0.00102
Train [105][1580/3239]	Time 0.226 (0.511)	Data Time 0.001 (0.024)	Loss 2.3981 (2.3641)	Entropy 0.53992 (0.54030)	Top-1 acc 67.578 (67.261)	Top-5 acc 84.375 (85.989)	lr 0.00102
Train [105][1590/3239]	Time 0.253 (0.510)	Data Time 0.001 (0.024)	Loss 2.3363 (2.3639)	Entropy 0.54006 (0.54030)	Top-1 acc 69.141 (67.267)	Top-5 acc 85.547 (85.992)	lr 0.00102
Train [105][1600/3239]	Time 0.228 (0.510)	Data Time 0.001 (0.024)	Loss 2.3629 (2.3639)	Entropy 0.54008 (0.54030)	Top-1 acc 68.359 (67.267)	Top-5 acc 87.500 (85.998)	lr 0.00102
Train [105][1610/3239]	Time 0.274 (0.509)	Data Time 0.001 (0.024)	Loss 2.5087 (2.3643)	Entropy 0.53999 (0.54029)	Top-1 acc 62.500 (67.253)	Top-5 acc 84.375 (85.991)	lr 0.00102
Train [105][1620/3239]	Time 0.229 (0.508)	Data Time 0.001 (0.024)	Loss 2.5163 (2.3644)	Entropy 0.53986 (0.54029)	Top-1 acc 64.062 (67.247)	Top-5 acc 82.031 (85.986)	lr 0.00102
Train [105][1630/3239]	Time 0.234 (0.508)	Data Time 0.001 (0.023)	Loss 2.6992 (2.3644)	Entropy 0.53987 (0.54029)	Top-1 acc 58.984 (67.253)	Top-5 acc 80.469 (85.985)	lr 0.00101
Train [105][1640/3239]	Time 0.288 (0.507)	Data Time 0.001 (0.023)	Loss 2.2011 (2.3645)	Entropy 0.53953 (0.54029)	Top-1 acc 73.828 (67.252)	Top-5 acc 89.062 (85.981)	lr 0.00101
Train [105][1650/3239]	Time 0.383 (0.540)	Data Time 0.003 (0.023)	Loss 2.4612 (2.3648)	Entropy 0.53963 (0.54028)	Top-1 acc 65.234 (67.241)	Top-5 acc 86.719 (85.979)	lr 0.00101
Train [105][1660/3239]	Time 0.328 (0.539)	Data Time 0.002 (0.023)	Loss 2.3575 (2.3643)	Entropy 0.53972 (0.54028)	Top-1 acc 67.969 (67.254)	Top-5 acc 85.938 (85.991)	lr 0.00101
Train [105][1670/3239]	Time 0.253 (0.539)	Data Time 0.002 (0.023)	Loss 2.3887 (2.3637)	Entropy 0.53989 (0.54028)	Top-1 acc 67.188 (67.267)	Top-5 acc 83.594 (86.002)	lr 0.00101
Train [105][1680/3239]	Time 0.250 (0.538)	Data Time 0.001 (0.023)	Loss 2.2961 (2.3639)	Entropy 0.53998 (0.54027)	Top-1 acc 72.266 (67.261)	Top-5 acc 86.719 (85.993)	lr 0.00101
Train [105][1690/3239]	Time 0.241 (0.538)	Data Time 0.001 (0.023)	Loss 2.2980 (2.3637)	Entropy 0.54007 (0.54027)	Top-1 acc 67.188 (67.262)	Top-5 acc 87.891 (85.997)	lr 0.00101
Train [105][1700/3239]	Time 0.253 (0.537)	Data Time 0.001 (0.023)	Loss 2.3705 (2.3640)	Entropy 0.54018 (0.54027)	Top-1 acc 67.969 (67.260)	Top-5 acc 85.547 (85.991)	lr 0.00101
Train [105][1710/3239]	Time 0.296 (0.536)	Data Time 0.001 (0.022)	Loss 2.3015 (2.3639)	Entropy 0.54029 (0.54027)	Top-1 acc 67.188 (67.263)	Top-5 acc 86.719 (85.993)	lr 0.00101
Train [105][1720/3239]	Time 0.277 (0.536)	Data Time 0.001 (0.022)	Loss 2.3592 (2.3637)	Entropy 0.54036 (0.54027)	Top-1 acc 65.625 (67.266)	Top-5 acc 85.156 (85.992)	lr 0.00101
Train [105][1730/3239]	Time 0.355 (0.535)	Data Time 0.001 (0.022)	Loss 2.3356 (2.3639)	Entropy 0.54056 (0.54027)	Top-1 acc 65.234 (67.262)	Top-5 acc 88.281 (85.991)	lr 0.00101
Train [105][1740/3239]	Time 0.237 (0.534)	Data Time 0.001 (0.022)	Loss 2.1738 (2.3636)	Entropy 0.54064 (0.54027)	Top-1 acc 73.438 (67.266)	Top-5 acc 90.234 (85.996)	lr 0.00101
Train [105][1750/3239]	Time 0.237 (0.534)	Data Time 0.001 (0.022)	Loss 2.3143 (2.3636)	Entropy 0.54030 (0.54028)	Top-1 acc 71.094 (67.267)	Top-5 acc 86.328 (85.996)	lr 0.00101
Train [105][1760/3239]	Time 0.229 (0.533)	Data Time 0.001 (0.022)	Loss 2.6235 (2.3641)	Entropy 0.54048 (0.54028)	Top-1 acc 60.547 (67.256)	Top-5 acc 81.641 (85.985)	lr 0.00101
Train [105][1770/3239]	Time 0.242 (0.533)	Data Time 0.001 (0.022)	Loss 2.3514 (2.3643)	Entropy 0.54037 (0.54028)	Top-1 acc 68.359 (67.251)	Top-5 acc 85.938 (85.984)	lr 0.00101
Train [105][1780/3239]	Time 0.266 (0.532)	Data Time 0.002 (0.022)	Loss 2.4021 (2.3643)	Entropy 0.54026 (0.54028)	Top-1 acc 64.062 (67.248)	Top-5 acc 85.938 (85.981)	lr 0.00101
Train [105][1790/3239]	Time 0.237 (0.531)	Data Time 0.001 (0.022)	Loss 2.3363 (2.3646)	Entropy 0.54013 (0.54028)	Top-1 acc 68.750 (67.244)	Top-5 acc 86.328 (85.976)	lr 0.00101
Train [105][1800/3239]	Time 0.253 (0.531)	Data Time 0.001 (0.021)	Loss 2.3201 (2.3644)	Entropy 0.54039 (0.54028)	Top-1 acc 66.016 (67.247)	Top-5 acc 87.109 (85.979)	lr 0.00101
Train [105][1810/3239]	Time 0.244 (0.530)	Data Time 0.001 (0.021)	Loss 2.3447 (2.3643)	Entropy 0.54040 (0.54028)	Top-1 acc 67.578 (67.245)	Top-5 acc 85.547 (85.984)	lr 0.00101
Train [105][1820/3239]	Time 0.362 (0.530)	Data Time 0.001 (0.021)	Loss 2.3452 (2.3641)	Entropy 0.54033 (0.54028)	Top-1 acc 67.188 (67.246)	Top-5 acc 85.938 (85.988)	lr 0.00101
Train [105][1830/3239]	Time 0.245 (0.529)	Data Time 0.001 (0.021)	Loss 2.7156 (2.3646)	Entropy 0.54033 (0.54028)	Top-1 acc 57.031 (67.235)	Top-5 acc 80.859 (85.979)	lr 0.00101
Train [105][1840/3239]	Time 0.242 (0.529)	Data Time 0.001 (0.021)	Loss 2.3339 (2.3652)	Entropy 0.54010 (0.54028)	Top-1 acc 73.438 (67.225)	Top-5 acc 85.156 (85.971)	lr 0.00101
Train [105][1850/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.021)	Loss 2.2524 (2.3655)	Entropy 0.53999 (0.54028)	Top-1 acc 70.703 (67.218)	Top-5 acc 87.891 (85.969)	lr 0.00101
Train [105][1860/3239]	Time 0.280 (0.528)	Data Time 0.002 (0.021)	Loss 2.2401 (2.3651)	Entropy 0.54016 (0.54028)	Top-1 acc 68.359 (67.227)	Top-5 acc 89.844 (85.972)	lr 0.00101
Train [105][1870/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.021)	Loss 2.3387 (2.3650)	Entropy 0.54039 (0.54028)	Top-1 acc 64.062 (67.226)	Top-5 acc 89.844 (85.976)	lr 0.00101
Train [105][1880/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.021)	Loss 2.3118 (2.3649)	Entropy 0.54065 (0.54028)	Top-1 acc 66.797 (67.226)	Top-5 acc 87.500 (85.975)	lr 0.00100
Train [105][1890/3239]	Time 0.345 (0.526)	Data Time 0.001 (0.021)	Loss 2.4181 (2.3648)	Entropy 0.54079 (0.54028)	Top-1 acc 66.016 (67.227)	Top-5 acc 84.766 (85.980)	lr 0.00100
Train [105][1900/3239]	Time 0.226 (0.526)	Data Time 0.001 (0.020)	Loss 2.4802 (2.3647)	Entropy 0.54058 (0.54028)	Top-1 acc 66.406 (67.232)	Top-5 acc 85.156 (85.983)	lr 0.00100
Train [105][1910/3239]	Time 0.226 (0.525)	Data Time 0.001 (0.020)	Loss 2.4670 (2.3650)	Entropy 0.54066 (0.54028)	Top-1 acc 62.500 (67.223)	Top-5 acc 83.594 (85.981)	lr 0.00100
Train [105][1920/3239]	Time 0.263 (0.524)	Data Time 0.001 (0.020)	Loss 2.3581 (2.3647)	Entropy 0.54066 (0.54029)	Top-1 acc 66.406 (67.230)	Top-5 acc 87.109 (85.983)	lr 0.00100
Train [105][1930/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.020)	Loss 2.3201 (2.3649)	Entropy 0.54062 (0.54029)	Top-1 acc 63.672 (67.220)	Top-5 acc 87.500 (85.984)	lr 0.00100
Train [105][1940/3239]	Time 0.228 (0.523)	Data Time 0.001 (0.020)	Loss 2.4363 (2.3650)	Entropy 0.54071 (0.54029)	Top-1 acc 66.016 (67.218)	Top-5 acc 83.203 (85.978)	lr 0.00100
Train [105][1950/3239]	Time 0.250 (0.523)	Data Time 0.001 (0.020)	Loss 2.4650 (2.3651)	Entropy 0.54139 (0.54029)	Top-1 acc 64.844 (67.213)	Top-5 acc 85.547 (85.976)	lr 0.00100
Train [105][1960/3239]	Time 0.299 (0.522)	Data Time 0.002 (0.020)	Loss 2.2671 (2.3650)	Entropy 0.54149 (0.54030)	Top-1 acc 69.922 (67.214)	Top-5 acc 87.109 (85.978)	lr 0.00100
Train [105][1970/3239]	Time 0.260 (0.522)	Data Time 0.001 (0.020)	Loss 2.3043 (2.3651)	Entropy 0.54156 (0.54030)	Top-1 acc 67.578 (67.208)	Top-5 acc 87.109 (85.975)	lr 0.00100
Train [105][1980/3239]	Time 0.255 (0.521)	Data Time 0.001 (0.020)	Loss 2.4118 (2.3654)	Entropy 0.54159 (0.54031)	Top-1 acc 65.234 (67.203)	Top-5 acc 85.156 (85.970)	lr 0.00100
Train [105][1990/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.020)	Loss 2.3922 (2.3655)	Entropy 0.54168 (0.54032)	Top-1 acc 67.578 (67.201)	Top-5 acc 85.547 (85.968)	lr 0.00100
Train [105][2000/3239]	Time 0.227 (0.520)	Data Time 0.001 (0.019)	Loss 2.2657 (2.3655)	Entropy 0.54155 (0.54032)	Top-1 acc 72.266 (67.209)	Top-5 acc 87.500 (85.970)	lr 0.00100
Train [105][2010/3239]	Time 0.274 (0.520)	Data Time 0.001 (0.019)	Loss 2.3644 (2.3655)	Entropy 0.54172 (0.54033)	Top-1 acc 68.750 (67.214)	Top-5 acc 85.938 (85.967)	lr 0.00100
Train [105][2020/3239]	Time 0.230 (0.519)	Data Time 0.001 (0.019)	Loss 2.6930 (2.3655)	Entropy 0.54165 (0.54034)	Top-1 acc 64.844 (67.210)	Top-5 acc 80.469 (85.970)	lr 0.00100
Train [105][2030/3239]	Time 0.242 (0.519)	Data Time 0.001 (0.019)	Loss 2.1759 (2.3656)	Entropy 0.54181 (0.54034)	Top-1 acc 75.000 (67.206)	Top-5 acc 87.891 (85.970)	lr 0.00100
Train [105][2040/3239]	Time 0.239 (0.518)	Data Time 0.001 (0.019)	Loss 2.4775 (2.3653)	Entropy 0.54161 (0.54035)	Top-1 acc 62.500 (67.210)	Top-5 acc 83.203 (85.975)	lr 0.00100
Train [105][2050/3239]	Time 0.384 (0.518)	Data Time 0.001 (0.019)	Loss 2.2182 (2.3651)	Entropy 0.54119 (0.54036)	Top-1 acc 71.875 (67.216)	Top-5 acc 87.500 (85.980)	lr 0.00100
Train [105][2060/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.019)	Loss 2.3822 (2.3652)	Entropy 0.54156 (0.54036)	Top-1 acc 65.234 (67.211)	Top-5 acc 85.547 (85.975)	lr 0.00100
Train [105][2070/3239]	Time 0.241 (0.517)	Data Time 0.001 (0.019)	Loss 2.5339 (2.3651)	Entropy 0.54137 (0.54037)	Top-1 acc 63.672 (67.217)	Top-5 acc 81.250 (85.975)	lr 0.00100
Train [105][2080/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.019)	Loss 2.3607 (2.3650)	Entropy 0.54151 (0.54037)	Top-1 acc 64.062 (67.214)	Top-5 acc 85.547 (85.976)	lr 0.00100
Train [105][2090/3239]	Time 0.235 (0.516)	Data Time 0.001 (0.019)	Loss 2.2845 (2.3650)	Entropy 0.54134 (0.54038)	Top-1 acc 71.094 (67.217)	Top-5 acc 86.328 (85.975)	lr 0.00100
Train [105][2100/3239]	Time 0.273 (0.516)	Data Time 0.001 (0.019)	Loss 2.2110 (2.3647)	Entropy 0.54077 (0.54038)	Top-1 acc 68.750 (67.218)	Top-5 acc 89.062 (85.983)	lr 0.00100
Train [105][2110/3239]	Time 0.235 (0.515)	Data Time 0.001 (0.019)	Loss 2.4101 (2.3645)	Entropy 0.54098 (0.54038)	Top-1 acc 67.188 (67.227)	Top-5 acc 83.203 (85.990)	lr 0.00100
Train [105][2120/3239]	Time 0.332 (0.515)	Data Time 0.001 (0.018)	Loss 2.2167 (2.3645)	Entropy 0.54110 (0.54038)	Top-1 acc 67.969 (67.232)	Top-5 acc 89.062 (85.991)	lr 0.00100
Train [105][2130/3239]	Time 0.225 (0.514)	Data Time 0.001 (0.018)	Loss 2.2892 (2.3642)	Entropy 0.54127 (0.54039)	Top-1 acc 70.703 (67.238)	Top-5 acc 85.938 (85.999)	lr 0.00099
Train [105][2140/3239]	Time 0.238 (0.514)	Data Time 0.001 (0.018)	Loss 2.3486 (2.3643)	Entropy 0.54102 (0.54039)	Top-1 acc 67.188 (67.233)	Top-5 acc 88.281 (85.996)	lr 0.00099
Train [105][2150/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.018)	Loss 2.6079 (2.3643)	Entropy 0.54116 (0.54039)	Top-1 acc 62.500 (67.229)	Top-5 acc 83.203 (85.992)	lr 0.00099
Train [105][2160/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.018)	Loss 2.4270 (2.3643)	Entropy 0.54107 (0.54040)	Top-1 acc 66.406 (67.231)	Top-5 acc 84.375 (85.993)	lr 0.00099
Train [105][2170/3239]	Time 0.222 (0.512)	Data Time 0.001 (0.018)	Loss 2.3521 (2.3644)	Entropy 0.54133 (0.54040)	Top-1 acc 65.625 (67.225)	Top-5 acc 86.719 (85.991)	lr 0.00099
Train [105][2180/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.018)	Loss 2.4072 (2.3645)	Entropy 0.54140 (0.54041)	Top-1 acc 67.578 (67.230)	Top-5 acc 83.984 (85.986)	lr 0.00099
Train [105][2190/3239]	Time 0.224 (0.511)	Data Time 0.001 (0.018)	Loss 2.2842 (2.3644)	Entropy 0.54106 (0.54041)	Top-1 acc 65.625 (67.229)	Top-5 acc 86.328 (85.987)	lr 0.00099
Train [105][2200/3239]	Time 0.232 (0.511)	Data Time 0.001 (0.018)	Loss 2.4400 (2.3646)	Entropy 0.54069 (0.54041)	Top-1 acc 64.453 (67.222)	Top-5 acc 84.766 (85.989)	lr 0.00099
Train [105][2210/3239]	Time 0.324 (0.510)	Data Time 0.001 (0.018)	Loss 2.2596 (2.3643)	Entropy 0.54068 (0.54041)	Top-1 acc 71.875 (67.232)	Top-5 acc 86.328 (85.995)	lr 0.00099
Train [105][2220/3239]	Time 0.233 (0.510)	Data Time 0.001 (0.018)	Loss 2.5937 (2.3644)	Entropy 0.54029 (0.54041)	Top-1 acc 59.766 (67.227)	Top-5 acc 84.375 (85.996)	lr 0.00099
Train [105][2230/3239]	Time 0.227 (0.509)	Data Time 0.001 (0.018)	Loss 2.4020 (2.3644)	Entropy 0.54043 (0.54041)	Top-1 acc 66.797 (67.232)	Top-5 acc 85.156 (85.995)	lr 0.00099
Train [105][2240/3239]	Time 0.284 (0.509)	Data Time 0.002 (0.018)	Loss 2.2911 (2.3642)	Entropy 0.54016 (0.54041)	Top-1 acc 68.750 (67.238)	Top-5 acc 88.672 (86.003)	lr 0.00099
Train [105][2250/3239]	Time 0.247 (0.509)	Data Time 0.001 (0.017)	Loss 2.4277 (2.3640)	Entropy 0.54031 (0.54041)	Top-1 acc 67.188 (67.248)	Top-5 acc 85.547 (86.008)	lr 0.00099
Train [105][2260/3239]	Time 0.226 (0.508)	Data Time 0.001 (0.017)	Loss 2.2249 (2.3637)	Entropy 0.54042 (0.54041)	Top-1 acc 72.656 (67.254)	Top-5 acc 87.500 (86.010)	lr 0.00099
Train [105][2270/3239]	Time 0.222 (0.508)	Data Time 0.001 (0.017)	Loss 2.3587 (2.3639)	Entropy 0.54060 (0.54041)	Top-1 acc 67.188 (67.244)	Top-5 acc 87.109 (86.009)	lr 0.00099
Train [105][2280/3239]	Time 0.331 (0.507)	Data Time 0.001 (0.017)	Loss 2.3972 (2.3640)	Entropy 0.54094 (0.54041)	Top-1 acc 66.797 (67.243)	Top-5 acc 84.766 (86.007)	lr 0.00099
Train [105][2290/3239]	Time 0.227 (0.507)	Data Time 0.001 (0.017)	Loss 2.1703 (2.3638)	Entropy 0.54094 (0.54042)	Top-1 acc 71.875 (67.248)	Top-5 acc 90.625 (86.014)	lr 0.00099
Train [105][2300/3239]	Time 0.307 (0.530)	Data Time 0.005 (0.017)	Loss 2.6108 (2.3638)	Entropy 0.54123 (0.54042)	Top-1 acc 60.938 (67.248)	Top-5 acc 81.641 (86.016)	lr 0.00099
Train [105][2310/3239]	Time 0.277 (0.530)	Data Time 0.002 (0.017)	Loss 2.2956 (2.3640)	Entropy 0.54162 (0.54042)	Top-1 acc 68.750 (67.243)	Top-5 acc 86.328 (86.015)	lr 0.00099
Train [105][2320/3239]	Time 0.237 (0.529)	Data Time 0.001 (0.017)	Loss 2.4543 (2.3643)	Entropy 0.54135 (0.54043)	Top-1 acc 65.234 (67.235)	Top-5 acc 83.594 (86.009)	lr 0.00099
Train [105][2330/3239]	Time 0.243 (0.529)	Data Time 0.001 (0.017)	Loss 2.2792 (2.3642)	Entropy 0.54128 (0.54043)	Top-1 acc 70.312 (67.238)	Top-5 acc 87.500 (86.009)	lr 0.00099
Train [105][2340/3239]	Time 0.282 (0.528)	Data Time 0.002 (0.017)	Loss 2.2647 (2.3640)	Entropy 0.54159 (0.54044)	Top-1 acc 69.922 (67.239)	Top-5 acc 89.062 (86.011)	lr 0.00099
Train [105][2350/3239]	Time 0.250 (0.528)	Data Time 0.001 (0.017)	Loss 2.4013 (2.3641)	Entropy 0.54182 (0.54044)	Top-1 acc 67.578 (67.238)	Top-5 acc 82.812 (86.008)	lr 0.00099
Train [105][2360/3239]	Time 0.263 (0.528)	Data Time 0.001 (0.017)	Loss 2.2887 (2.3640)	Entropy 0.54179 (0.54045)	Top-1 acc 70.703 (67.240)	Top-5 acc 87.500 (86.011)	lr 0.00099
Train [105][2370/3239]	Time 0.375 (0.528)	Data Time 0.001 (0.017)	Loss 2.2947 (2.3642)	Entropy 0.54091 (0.54045)	Top-1 acc 68.359 (67.238)	Top-5 acc 86.719 (86.009)	lr 0.00099
Train [105][2380/3239]	Time 0.276 (0.527)	Data Time 0.001 (0.017)	Loss 2.2075 (2.3642)	Entropy 0.54082 (0.54045)	Top-1 acc 72.656 (67.238)	Top-5 acc 89.453 (86.010)	lr 0.00099
Train [105][2390/3239]	Time 0.270 (0.527)	Data Time 0.003 (0.017)	Loss 2.4156 (2.3641)	Entropy 0.54095 (0.54046)	Top-1 acc 66.797 (67.239)	Top-5 acc 83.203 (86.009)	lr 0.00098
Train [105][2400/3239]	Time 0.255 (0.527)	Data Time 0.001 (0.016)	Loss 2.7073 (2.3641)	Entropy 0.54080 (0.54046)	Top-1 acc 60.547 (67.239)	Top-5 acc 78.906 (86.009)	lr 0.00098
Train [105][2410/3239]	Time 0.252 (0.526)	Data Time 0.001 (0.016)	Loss 2.3474 (2.3640)	Entropy 0.54097 (0.54046)	Top-1 acc 66.406 (67.242)	Top-5 acc 86.328 (86.011)	lr 0.00098
Train [105][2420/3239]	Time 0.324 (0.526)	Data Time 0.003 (0.016)	Loss 2.3635 (2.3642)	Entropy 0.54113 (0.54046)	Top-1 acc 67.578 (67.235)	Top-5 acc 85.938 (86.009)	lr 0.00098
Train [105][2430/3239]	Time 0.323 (0.526)	Data Time 0.002 (0.016)	Loss 2.2485 (2.3644)	Entropy 0.54094 (0.54046)	Top-1 acc 69.141 (67.230)	Top-5 acc 87.891 (86.007)	lr 0.00098
Train [105][2440/3239]	Time 0.345 (0.526)	Data Time 0.002 (0.016)	Loss 2.2962 (2.3643)	Entropy 0.54068 (0.54047)	Top-1 acc 69.922 (67.233)	Top-5 acc 85.938 (86.008)	lr 0.00098
Train [105][2450/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.016)	Loss 2.3136 (2.3645)	Entropy 0.54086 (0.54047)	Top-1 acc 67.578 (67.223)	Top-5 acc 84.375 (86.002)	lr 0.00098
Train [105][2460/3239]	Time 0.239 (0.525)	Data Time 0.001 (0.016)	Loss 2.2201 (2.3647)	Entropy 0.54092 (0.54047)	Top-1 acc 73.047 (67.217)	Top-5 acc 89.062 (85.999)	lr 0.00098
Train [105][2470/3239]	Time 0.230 (0.525)	Data Time 0.001 (0.016)	Loss 2.4247 (2.3649)	Entropy 0.54104 (0.54047)	Top-1 acc 64.453 (67.215)	Top-5 acc 85.156 (85.997)	lr 0.00098
Train [105][2480/3239]	Time 0.222 (0.524)	Data Time 0.001 (0.016)	Loss 2.4715 (2.3647)	Entropy 0.54088 (0.54047)	Top-1 acc 64.062 (67.219)	Top-5 acc 83.594 (85.999)	lr 0.00098
Train [105][2490/3239]	Time 0.253 (0.524)	Data Time 0.001 (0.016)	Loss 2.2136 (2.3649)	Entropy 0.54089 (0.54047)	Top-1 acc 72.266 (67.216)	Top-5 acc 87.109 (85.994)	lr 0.00098
Train [105][2500/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.016)	Loss 2.3895 (2.3650)	Entropy 0.54046 (0.54048)	Top-1 acc 69.141 (67.213)	Top-5 acc 86.328 (85.992)	lr 0.00098
Train [105][2510/3239]	Time 0.270 (0.523)	Data Time 0.002 (0.016)	Loss 2.5090 (2.3649)	Entropy 0.54036 (0.54048)	Top-1 acc 65.234 (67.214)	Top-5 acc 82.422 (85.993)	lr 0.00098
Train [105][2520/3239]	Time 0.254 (0.523)	Data Time 0.001 (0.016)	Loss 2.3769 (2.3648)	Entropy 0.54005 (0.54047)	Top-1 acc 63.281 (67.217)	Top-5 acc 86.719 (85.996)	lr 0.00098
Train [105][2530/3239]	Time 0.357 (0.522)	Data Time 0.001 (0.016)	Loss 2.3386 (2.3647)	Entropy 0.54016 (0.54047)	Top-1 acc 67.188 (67.222)	Top-5 acc 84.766 (85.997)	lr 0.00098
Train [105][2540/3239]	Time 0.246 (0.522)	Data Time 0.001 (0.016)	Loss 2.4358 (2.3648)	Entropy 0.54020 (0.54047)	Top-1 acc 64.453 (67.222)	Top-5 acc 84.766 (85.996)	lr 0.00098
Train [105][2550/3239]	Time 0.264 (0.522)	Data Time 0.001 (0.016)	Loss 2.2751 (2.3651)	Entropy 0.54036 (0.54047)	Top-1 acc 67.578 (67.214)	Top-5 acc 87.891 (85.987)	lr 0.00098
Train [105][2560/3239]	Time 0.230 (0.521)	Data Time 0.002 (0.016)	Loss 2.3470 (2.3650)	Entropy 0.54017 (0.54047)	Top-1 acc 66.016 (67.221)	Top-5 acc 87.109 (85.989)	lr 0.00098
Train [105][2570/3239]	Time 0.236 (0.521)	Data Time 0.001 (0.016)	Loss 2.4122 (2.3649)	Entropy 0.53995 (0.54047)	Top-1 acc 64.844 (67.222)	Top-5 acc 82.031 (85.990)	lr 0.00098
Train [105][2580/3239]	Time 0.270 (0.521)	Data Time 0.003 (0.015)	Loss 2.3828 (2.3648)	Entropy 0.53995 (0.54047)	Top-1 acc 66.016 (67.224)	Top-5 acc 84.375 (85.989)	lr 0.00098
Train [105][2590/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.015)	Loss 2.2964 (2.3648)	Entropy 0.54007 (0.54046)	Top-1 acc 69.531 (67.220)	Top-5 acc 87.500 (85.992)	lr 0.00098
Train [105][2600/3239]	Time 0.445 (0.520)	Data Time 0.002 (0.015)	Loss 2.4845 (2.3652)	Entropy 0.54013 (0.54046)	Top-1 acc 63.672 (67.212)	Top-5 acc 82.812 (85.983)	lr 0.00098
Train [105][2610/3239]	Time 0.244 (0.520)	Data Time 0.001 (0.015)	Loss 2.3578 (2.3650)	Entropy 0.54013 (0.54046)	Top-1 acc 67.188 (67.220)	Top-5 acc 87.109 (85.985)	lr 0.00098
Train [105][2620/3239]	Time 0.240 (0.519)	Data Time 0.001 (0.015)	Loss 2.3229 (2.3650)	Entropy 0.53980 (0.54046)	Top-1 acc 68.750 (67.220)	Top-5 acc 85.156 (85.985)	lr 0.00098
Train [105][2630/3239]	Time 0.224 (0.519)	Data Time 0.001 (0.015)	Loss 2.9578 (2.3652)	Entropy 0.53977 (0.54046)	Top-1 acc 51.562 (67.216)	Top-5 acc 76.172 (85.982)	lr 0.00098
Train [105][2640/3239]	Time 0.229 (0.519)	Data Time 0.001 (0.015)	Loss 2.4360 (2.3650)	Entropy 0.53998 (0.54046)	Top-1 acc 66.406 (67.221)	Top-5 acc 83.594 (85.985)	lr 0.00097
Train [105][2650/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.015)	Loss 2.2361 (2.3647)	Entropy 0.53985 (0.54045)	Top-1 acc 70.312 (67.226)	Top-5 acc 87.109 (85.989)	lr 0.00097
Train [105][2660/3239]	Time 0.253 (0.518)	Data Time 0.001 (0.015)	Loss 2.2633 (2.3647)	Entropy 0.53974 (0.54045)	Top-1 acc 67.188 (67.223)	Top-5 acc 86.719 (85.988)	lr 0.00097
Train [105][2670/3239]	Time 0.240 (0.518)	Data Time 0.001 (0.015)	Loss 2.1808 (2.3645)	Entropy 0.53977 (0.54045)	Top-1 acc 69.141 (67.228)	Top-5 acc 88.672 (85.990)	lr 0.00097
Train [105][2680/3239]	Time 0.235 (0.517)	Data Time 0.001 (0.015)	Loss 2.3286 (2.3646)	Entropy 0.53993 (0.54045)	Top-1 acc 68.750 (67.229)	Top-5 acc 85.938 (85.990)	lr 0.00097
Train [105][2690/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.015)	Loss 2.3060 (2.3644)	Entropy 0.53961 (0.54044)	Top-1 acc 68.750 (67.234)	Top-5 acc 87.500 (85.995)	lr 0.00097
Train [105][2700/3239]	Time 0.233 (0.516)	Data Time 0.001 (0.015)	Loss 2.5111 (2.3649)	Entropy 0.53971 (0.54044)	Top-1 acc 66.016 (67.221)	Top-5 acc 83.203 (85.984)	lr 0.00097
Train [105][2710/3239]	Time 0.243 (0.516)	Data Time 0.001 (0.015)	Loss 2.2611 (2.3651)	Entropy 0.53991 (0.54044)	Top-1 acc 69.531 (67.214)	Top-5 acc 87.891 (85.981)	lr 0.00097
Train [105][2720/3239]	Time 0.222 (0.516)	Data Time 0.001 (0.015)	Loss 2.3586 (2.3650)	Entropy 0.53992 (0.54044)	Top-1 acc 69.141 (67.219)	Top-5 acc 86.328 (85.983)	lr 0.00097
Train [105][2730/3239]	Time 0.240 (0.515)	Data Time 0.001 (0.015)	Loss 2.2513 (2.3648)	Entropy 0.53990 (0.54044)	Top-1 acc 69.922 (67.227)	Top-5 acc 89.453 (85.988)	lr 0.00097
Train [105][2740/3239]	Time 0.253 (0.515)	Data Time 0.002 (0.015)	Loss 2.3148 (2.3648)	Entropy 0.54029 (0.54043)	Top-1 acc 69.922 (67.226)	Top-5 acc 87.109 (85.988)	lr 0.00097
Train [105][2750/3239]	Time 0.243 (0.515)	Data Time 0.001 (0.015)	Loss 2.5180 (2.3649)	Entropy 0.54039 (0.54043)	Top-1 acc 61.719 (67.225)	Top-5 acc 83.203 (85.986)	lr 0.00097
Train [105][2760/3239]	Time 0.395 (0.515)	Data Time 0.001 (0.015)	Loss 2.2406 (2.3649)	Entropy 0.54057 (0.54043)	Top-1 acc 67.188 (67.225)	Top-5 acc 89.453 (85.987)	lr 0.00097
Train [105][2770/3239]	Time 0.237 (0.514)	Data Time 0.001 (0.015)	Loss 2.4108 (2.3650)	Entropy 0.54052 (0.54043)	Top-1 acc 65.625 (67.221)	Top-5 acc 85.156 (85.987)	lr 0.00097
Train [105][2780/3239]	Time 0.246 (0.514)	Data Time 0.001 (0.014)	Loss 2.3274 (2.3650)	Entropy 0.54064 (0.54043)	Top-1 acc 68.750 (67.221)	Top-5 acc 84.766 (85.985)	lr 0.00097
Train [105][2790/3239]	Time 0.251 (0.514)	Data Time 0.001 (0.014)	Loss 2.3994 (2.3651)	Entropy 0.54017 (0.54043)	Top-1 acc 66.406 (67.221)	Top-5 acc 86.328 (85.983)	lr 0.00097
Train [105][2800/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.014)	Loss 2.4726 (2.3650)	Entropy 0.54021 (0.54043)	Top-1 acc 68.359 (67.225)	Top-5 acc 86.328 (85.986)	lr 0.00097
Train [105][2810/3239]	Time 0.267 (0.513)	Data Time 0.001 (0.014)	Loss 2.2493 (2.3649)	Entropy 0.54006 (0.54043)	Top-1 acc 71.094 (67.228)	Top-5 acc 89.844 (85.987)	lr 0.00097
Train [105][2820/3239]	Time 0.234 (0.513)	Data Time 0.001 (0.014)	Loss 2.7078 (2.3648)	Entropy 0.54027 (0.54043)	Top-1 acc 57.422 (67.230)	Top-5 acc 79.688 (85.988)	lr 0.00097
Train [105][2830/3239]	Time 0.339 (0.512)	Data Time 0.001 (0.014)	Loss 2.4078 (2.3648)	Entropy 0.53999 (0.54043)	Top-1 acc 66.406 (67.231)	Top-5 acc 86.328 (85.987)	lr 0.00097
Train [105][2840/3239]	Time 0.255 (0.512)	Data Time 0.001 (0.014)	Loss 2.3873 (2.3646)	Entropy 0.54000 (0.54043)	Top-1 acc 66.797 (67.232)	Top-5 acc 85.938 (85.992)	lr 0.00097
Train [105][2850/3239]	Time 0.236 (0.512)	Data Time 0.001 (0.014)	Loss 2.2842 (2.3647)	Entropy 0.53981 (0.54043)	Top-1 acc 69.141 (67.229)	Top-5 acc 89.453 (85.994)	lr 0.00097
Train [105][2860/3239]	Time 0.223 (0.511)	Data Time 0.001 (0.014)	Loss 2.3602 (2.3646)	Entropy 0.53996 (0.54042)	Top-1 acc 64.453 (67.230)	Top-5 acc 85.938 (85.996)	lr 0.00097
Train [105][2870/3239]	Time 0.235 (0.511)	Data Time 0.001 (0.014)	Loss 2.4443 (2.3649)	Entropy 0.54010 (0.54042)	Top-1 acc 62.109 (67.222)	Top-5 acc 84.375 (85.991)	lr 0.00097
Train [105][2880/3239]	Time 0.226 (0.511)	Data Time 0.001 (0.014)	Loss 2.3120 (2.3648)	Entropy 0.54012 (0.54042)	Top-1 acc 67.188 (67.225)	Top-5 acc 84.766 (85.993)	lr 0.00097
Train [105][2890/3239]	Time 0.222 (0.510)	Data Time 0.001 (0.014)	Loss 2.3407 (2.3648)	Entropy 0.54017 (0.54042)	Top-1 acc 67.969 (67.225)	Top-5 acc 87.500 (85.991)	lr 0.00097
Train [105][2900/3239]	Time 0.234 (0.510)	Data Time 0.001 (0.014)	Loss 2.6354 (2.3649)	Entropy 0.53991 (0.54042)	Top-1 acc 60.156 (67.223)	Top-5 acc 82.422 (85.990)	lr 0.00096
Train [105][2910/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.014)	Loss 2.3852 (2.3652)	Entropy 0.53988 (0.54042)	Top-1 acc 67.188 (67.216)	Top-5 acc 85.156 (85.985)	lr 0.00096
Train [105][2920/3239]	Time 0.381 (0.509)	Data Time 0.001 (0.014)	Loss 2.1038 (2.3650)	Entropy 0.53985 (0.54042)	Top-1 acc 69.922 (67.222)	Top-5 acc 89.844 (85.987)	lr 0.00096
Train [105][2930/3239]	Time 0.236 (0.509)	Data Time 0.001 (0.014)	Loss 2.3208 (2.3646)	Entropy 0.53981 (0.54041)	Top-1 acc 67.969 (67.233)	Top-5 acc 85.938 (85.993)	lr 0.00096
Train [105][2940/3239]	Time 0.245 (0.509)	Data Time 0.001 (0.014)	Loss 2.1313 (2.3645)	Entropy 0.54019 (0.54041)	Top-1 acc 75.000 (67.237)	Top-5 acc 89.062 (85.995)	lr 0.00096
Train [105][2950/3239]	Time 0.240 (0.509)	Data Time 0.001 (0.014)	Loss 2.1378 (2.3644)	Entropy 0.54025 (0.54041)	Top-1 acc 72.656 (67.241)	Top-5 acc 90.234 (85.996)	lr 0.00096
Train [105][2960/3239]	Time 0.268 (0.527)	Data Time 0.002 (0.014)	Loss 2.3552 (2.3646)	Entropy 0.53998 (0.54041)	Top-1 acc 66.797 (67.235)	Top-5 acc 86.719 (85.994)	lr 0.00096
Train [105][2970/3239]	Time 0.241 (0.527)	Data Time 0.002 (0.014)	Loss 2.3619 (2.3645)	Entropy 0.53999 (0.54041)	Top-1 acc 68.359 (67.236)	Top-5 acc 86.719 (85.996)	lr 0.00096
Train [105][2980/3239]	Time 0.260 (0.526)	Data Time 0.001 (0.014)	Loss 2.3093 (2.3646)	Entropy 0.54011 (0.54041)	Top-1 acc 65.625 (67.229)	Top-5 acc 86.328 (85.994)	lr 0.00096
Train [105][2990/3239]	Time 0.353 (0.526)	Data Time 0.001 (0.014)	Loss 2.1689 (2.3646)	Entropy 0.54020 (0.54041)	Top-1 acc 73.438 (67.230)	Top-5 acc 88.672 (85.994)	lr 0.00096
Train [105][3000/3239]	Time 0.248 (0.526)	Data Time 0.001 (0.014)	Loss 2.1533 (2.3645)	Entropy 0.54026 (0.54041)	Top-1 acc 69.531 (67.232)	Top-5 acc 89.844 (85.998)	lr 0.00096
Train [105][3010/3239]	Time 0.266 (0.525)	Data Time 0.028 (0.014)	Loss 2.3242 (2.3643)	Entropy 0.54057 (0.54041)	Top-1 acc 66.797 (67.235)	Top-5 acc 87.500 (86.002)	lr 0.00096
Train [105][3020/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.013)	Loss 2.3349 (2.3642)	Entropy 0.54090 (0.54041)	Top-1 acc 69.922 (67.241)	Top-5 acc 86.719 (86.004)	lr 0.00096
Train [105][3030/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.013)	Loss 2.3289 (2.3640)	Entropy 0.54118 (0.54041)	Top-1 acc 70.312 (67.252)	Top-5 acc 83.984 (86.004)	lr 0.00096
Train [105][3040/3239]	Time 0.260 (0.524)	Data Time 0.001 (0.013)	Loss 2.2294 (2.3640)	Entropy 0.54126 (0.54041)	Top-1 acc 69.922 (67.253)	Top-5 acc 85.938 (86.001)	lr 0.00096
Train [105][3050/3239]	Time 0.243 (0.524)	Data Time 0.001 (0.013)	Loss 2.2954 (2.3641)	Entropy 0.54056 (0.54041)	Top-1 acc 70.703 (67.250)	Top-5 acc 87.891 (86.000)	lr 0.00096
Train [105][3060/3239]	Time 0.242 (0.524)	Data Time 0.001 (0.013)	Loss 2.2840 (2.3640)	Entropy 0.54077 (0.54041)	Top-1 acc 73.828 (67.258)	Top-5 acc 87.109 (86.000)	lr 0.00096
Train [105][3070/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.013)	Loss 2.2910 (2.3638)	Entropy 0.54056 (0.54042)	Top-1 acc 68.750 (67.262)	Top-5 acc 87.109 (86.005)	lr 0.00096
Train [105][3080/3239]	Time 0.321 (0.523)	Data Time 0.005 (0.013)	Loss 2.4647 (2.3638)	Entropy 0.54030 (0.54042)	Top-1 acc 64.453 (67.260)	Top-5 acc 85.547 (86.004)	lr 0.00096
Train [105][3090/3239]	Time 0.263 (0.523)	Data Time 0.001 (0.013)	Loss 2.4217 (2.3640)	Entropy 0.54055 (0.54042)	Top-1 acc 64.844 (67.252)	Top-5 acc 85.156 (86.001)	lr 0.00096
Train [105][3100/3239]	Time 0.241 (0.522)	Data Time 0.001 (0.013)	Loss 2.3376 (2.3640)	Entropy 0.54069 (0.54042)	Top-1 acc 69.531 (67.254)	Top-5 acc 85.547 (86.000)	lr 0.00096
Train [105][3110/3239]	Time 0.290 (0.522)	Data Time 0.001 (0.013)	Loss 2.2947 (2.3640)	Entropy 0.54083 (0.54042)	Top-1 acc 68.750 (67.255)	Top-5 acc 87.109 (86.003)	lr 0.00096
Train [105][3120/3239]	Time 0.234 (0.522)	Data Time 0.001 (0.013)	Loss 2.4825 (2.3641)	Entropy 0.54091 (0.54042)	Top-1 acc 64.453 (67.256)	Top-5 acc 83.594 (86.003)	lr 0.00096
Train [105][3130/3239]	Time 0.244 (0.522)	Data Time 0.001 (0.013)	Loss 2.2984 (2.3640)	Entropy 0.54106 (0.54042)	Top-1 acc 67.578 (67.255)	Top-5 acc 86.328 (86.007)	lr 0.00096
Train [105][3140/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.013)	Loss 2.2677 (2.3641)	Entropy 0.54113 (0.54042)	Top-1 acc 70.703 (67.254)	Top-5 acc 89.062 (86.006)	lr 0.00096
Train [105][3150/3239]	Time 0.377 (0.521)	Data Time 0.002 (0.013)	Loss 2.4697 (2.3641)	Entropy 0.54089 (0.54042)	Top-1 acc 64.062 (67.252)	Top-5 acc 84.766 (86.008)	lr 0.00095
Train [105][3160/3239]	Time 0.277 (0.521)	Data Time 0.002 (0.013)	Loss 2.4022 (2.3640)	Entropy 0.54110 (0.54043)	Top-1 acc 67.969 (67.254)	Top-5 acc 83.984 (86.010)	lr 0.00095
Train [105][3170/3239]	Time 0.277 (0.520)	Data Time 0.001 (0.013)	Loss 2.3625 (2.3640)	Entropy 0.54098 (0.54043)	Top-1 acc 64.453 (67.251)	Top-5 acc 88.281 (86.009)	lr 0.00095
Train [105][3180/3239]	Time 0.303 (0.520)	Data Time 0.000 (0.013)	Loss 2.4560 (2.3641)	Entropy 0.54070 (0.54043)	Top-1 acc 64.453 (67.250)	Top-5 acc 84.766 (86.008)	lr 0.00095
Train [105][3190/3239]	Time 0.237 (0.520)	Data Time 0.000 (0.013)	Loss 2.5544 (2.3640)	Entropy 0.54042 (0.54043)	Top-1 acc 60.938 (67.250)	Top-5 acc 81.641 (86.008)	lr 0.00095
Train [105][3200/3239]	Time 0.232 (0.520)	Data Time 0.000 (0.013)	Loss 2.1664 (2.3637)	Entropy 0.54042 (0.54043)	Top-1 acc 71.484 (67.259)	Top-5 acc 87.500 (86.013)	lr 0.00095
Train [105][3210/3239]	Time 0.249 (0.519)	Data Time 0.000 (0.013)	Loss 2.5568 (2.3637)	Entropy 0.54005 (0.54043)	Top-1 acc 60.547 (67.257)	Top-5 acc 80.469 (86.014)	lr 0.00095
Train [105][3220/3239]	Time 0.322 (0.519)	Data Time 0.000 (0.013)	Loss 2.5689 (2.3639)	Entropy 0.54001 (0.54043)	Top-1 acc 61.719 (67.253)	Top-5 acc 82.812 (86.012)	lr 0.00095
Train [105][3230/3239]	Time 0.233 (0.519)	Data Time 0.000 (0.013)	Loss 2.3270 (2.3638)	Entropy 0.53972 (0.54043)	Top-1 acc 67.969 (67.256)	Top-5 acc 88.281 (86.014)	lr 0.00095
Train [105][3239/3239]	Time 0.813 (0.518)	Data Time 0.000 (0.013)	Loss 2.9545 (2.3638)	Entropy 0.53953 (0.54042)	Top-1 acc 51.852 (67.255)	Top-5 acc 79.012 (86.016)	lr 0.00095
==========Valid [105/120]	loss 1.181	top-1 acc 72.774 (72.786)	top-5 acc 90.427	Train top-1 67.255	top-5 86.016	Entropy 0.53953	Latency-None: 0.000ms	Flops: 539.00M
Train [106][0/3239]	Time 41.812 (41.812)	Data Time 37.818 (37.818)	Loss 2.4526 (2.4526)	Entropy 0.53985 (0.53985)	Top-1 acc 65.234 (65.234)	Top-5 acc 84.375 (84.375)	lr 0.00095
Train [106][10/3239]	Time 0.231 (4.317)	Data Time 0.001 (3.440)	Loss 2.8286 (2.3821)	Entropy 0.53981 (0.53986)	Top-1 acc 54.297 (66.229)	Top-5 acc 78.516 (86.328)	lr 0.00095
Train [106][20/3239]	Time 0.261 (2.458)	Data Time 0.002 (1.803)	Loss 2.1780 (2.3430)	Entropy 0.53969 (0.53984)	Top-1 acc 74.219 (67.504)	Top-5 acc 87.500 (86.551)	lr 0.00095
Train [106][30/3239]	Time 0.249 (1.821)	Data Time 0.001 (1.222)	Loss 2.1673 (2.3382)	Entropy 0.53960 (0.53977)	Top-1 acc 72.656 (67.629)	Top-5 acc 89.844 (86.542)	lr 0.00095
Train [106][40/3239]	Time 0.252 (1.490)	Data Time 0.001 (0.925)	Loss 2.2658 (2.3422)	Entropy 0.53961 (0.53972)	Top-1 acc 68.750 (67.340)	Top-5 acc 85.156 (86.471)	lr 0.00095
Train [106][50/3239]	Time 0.345 (1.280)	Data Time 0.001 (0.744)	Loss 2.2700 (2.3336)	Entropy 0.53954 (0.53969)	Top-1 acc 72.656 (67.616)	Top-5 acc 86.719 (86.680)	lr 0.00095
Train [106][60/3239]	Time 0.250 (1.143)	Data Time 0.001 (0.622)	Loss 2.3526 (2.3270)	Entropy 0.53972 (0.53969)	Top-1 acc 67.188 (67.796)	Top-5 acc 83.594 (86.744)	lr 0.00095
Train [106][70/3239]	Time 0.227 (1.040)	Data Time 0.001 (0.535)	Loss 2.3142 (2.3318)	Entropy 0.53950 (0.53969)	Top-1 acc 63.281 (67.595)	Top-5 acc 87.109 (86.686)	lr 0.00095
Train [106][80/3239]	Time 0.247 (0.961)	Data Time 0.002 (0.469)	Loss 2.5492 (2.3366)	Entropy 0.53942 (0.53965)	Top-1 acc 63.281 (67.612)	Top-5 acc 81.641 (86.613)	lr 0.00095
Train [106][90/3239]	Time 0.230 (0.900)	Data Time 0.001 (0.417)	Loss 2.3505 (2.3326)	Entropy 0.53902 (0.53961)	Top-1 acc 69.531 (67.634)	Top-5 acc 86.328 (86.697)	lr 0.00095
Train [106][100/3239]	Time 0.226 (0.853)	Data Time 0.001 (0.377)	Loss 2.4898 (2.3326)	Entropy 0.53887 (0.53954)	Top-1 acc 62.109 (67.632)	Top-5 acc 85.547 (86.634)	lr 0.00095
Train [106][110/3239]	Time 0.234 (0.811)	Data Time 0.001 (0.343)	Loss 2.3068 (2.3262)	Entropy 0.53886 (0.53948)	Top-1 acc 67.969 (67.832)	Top-5 acc 85.938 (86.733)	lr 0.00095
Train [106][120/3239]	Time 0.267 (0.779)	Data Time 0.001 (0.315)	Loss 2.4876 (2.3280)	Entropy 0.53861 (0.53942)	Top-1 acc 67.969 (67.782)	Top-5 acc 84.766 (86.725)	lr 0.00095
Train [106][130/3239]	Time 0.234 (0.751)	Data Time 0.001 (0.291)	Loss 2.3502 (2.3347)	Entropy 0.53847 (0.53936)	Top-1 acc 69.141 (67.563)	Top-5 acc 85.938 (86.611)	lr 0.00095
Train [106][140/3239]	Time 0.233 (0.726)	Data Time 0.001 (0.270)	Loss 2.4501 (2.3333)	Entropy 0.53868 (0.53930)	Top-1 acc 61.719 (67.595)	Top-5 acc 83.594 (86.597)	lr 0.00095
Train [106][150/3239]	Time 0.236 (0.704)	Data Time 0.001 (0.252)	Loss 2.4594 (2.3352)	Entropy 0.53845 (0.53926)	Top-1 acc 64.062 (67.539)	Top-5 acc 85.547 (86.587)	lr 0.00095
Train [106][160/3239]	Time 0.245 (0.687)	Data Time 0.001 (0.237)	Loss 2.1738 (2.3337)	Entropy 0.53846 (0.53920)	Top-1 acc 70.703 (67.612)	Top-5 acc 89.844 (86.656)	lr 0.00095
Train [106][170/3239]	Time 0.228 (0.670)	Data Time 0.001 (0.223)	Loss 2.2319 (2.3344)	Entropy 0.53872 (0.53916)	Top-1 acc 70.312 (67.569)	Top-5 acc 87.891 (86.611)	lr 0.00094
Train [106][180/3239]	Time 0.234 (0.655)	Data Time 0.001 (0.211)	Loss 2.3163 (2.3360)	Entropy 0.53853 (0.53914)	Top-1 acc 64.844 (67.550)	Top-5 acc 89.062 (86.626)	lr 0.00094
Train [106][190/3239]	Time 0.229 (0.643)	Data Time 0.001 (0.200)	Loss 2.4907 (2.3392)	Entropy 0.53850 (0.53910)	Top-1 acc 63.672 (67.502)	Top-5 acc 85.547 (86.565)	lr 0.00094
Train [106][200/3239]	Time 0.232 (0.632)	Data Time 0.001 (0.190)	Loss 2.2191 (2.3404)	Entropy 0.53834 (0.53907)	Top-1 acc 70.312 (67.475)	Top-5 acc 89.844 (86.540)	lr 0.00094
Train [106][210/3239]	Time 0.326 (0.622)	Data Time 0.001 (0.181)	Loss 2.3021 (2.3404)	Entropy 0.53858 (0.53904)	Top-1 acc 69.922 (67.504)	Top-5 acc 87.109 (86.537)	lr 0.00094
Train [106][220/3239]	Time 0.241 (0.612)	Data Time 0.002 (0.173)	Loss 2.2799 (2.3419)	Entropy 0.53884 (0.53902)	Top-1 acc 68.750 (67.483)	Top-5 acc 89.453 (86.510)	lr 0.00094
Train [106][230/3239]	Time 0.230 (0.604)	Data Time 0.001 (0.166)	Loss 2.1704 (2.3417)	Entropy 0.53917 (0.53902)	Top-1 acc 72.656 (67.507)	Top-5 acc 88.281 (86.524)	lr 0.00094
Train [106][240/3239]	Time 0.236 (0.596)	Data Time 0.001 (0.159)	Loss 2.4481 (2.3404)	Entropy 0.53898 (0.53903)	Top-1 acc 66.406 (67.557)	Top-5 acc 85.547 (86.560)	lr 0.00094
Train [106][250/3239]	Time 0.237 (0.590)	Data Time 0.001 (0.152)	Loss 2.1684 (2.3373)	Entropy 0.53889 (0.53902)	Top-1 acc 68.359 (67.620)	Top-5 acc 88.281 (86.608)	lr 0.00094
Train [106][260/3239]	Time 0.236 (0.583)	Data Time 0.001 (0.147)	Loss 2.3872 (2.3378)	Entropy 0.53868 (0.53902)	Top-1 acc 68.750 (67.607)	Top-5 acc 83.594 (86.590)	lr 0.00094
Train [106][270/3239]	Time 0.276 (0.578)	Data Time 0.001 (0.141)	Loss 2.0219 (2.3363)	Entropy 0.53850 (0.53900)	Top-1 acc 77.734 (67.659)	Top-5 acc 91.406 (86.603)	lr 0.00094
Train [106][280/3239]	Time 0.311 (0.572)	Data Time 0.001 (0.136)	Loss 2.3776 (2.3350)	Entropy 0.53841 (0.53898)	Top-1 acc 66.406 (67.696)	Top-5 acc 87.500 (86.627)	lr 0.00094
Train [106][290/3239]	Time 0.227 (0.567)	Data Time 0.001 (0.132)	Loss 2.4666 (2.3358)	Entropy 0.53814 (0.53895)	Top-1 acc 64.453 (67.711)	Top-5 acc 82.812 (86.609)	lr 0.00094
Train [106][300/3239]	Time 0.238 (0.561)	Data Time 0.001 (0.127)	Loss 2.7184 (2.3381)	Entropy 0.53788 (0.53892)	Top-1 acc 57.422 (67.640)	Top-5 acc 80.469 (86.567)	lr 0.00094
Train [106][310/3239]	Time 0.229 (0.556)	Data Time 0.001 (0.123)	Loss 2.2594 (2.3398)	Entropy 0.53820 (0.53889)	Top-1 acc 67.188 (67.626)	Top-5 acc 88.281 (86.527)	lr 0.00094
Train [106][320/3239]	Time 0.220 (0.551)	Data Time 0.001 (0.120)	Loss 2.5468 (2.3397)	Entropy 0.53799 (0.53887)	Top-1 acc 62.891 (67.639)	Top-5 acc 82.812 (86.528)	lr 0.00094
Train [106][330/3239]	Time 0.215 (0.546)	Data Time 0.001 (0.116)	Loss 2.3540 (2.3397)	Entropy 0.53822 (0.53885)	Top-1 acc 66.406 (67.638)	Top-5 acc 85.547 (86.520)	lr 0.00094
Train [106][340/3239]	Time 0.227 (0.542)	Data Time 0.001 (0.113)	Loss 2.3271 (2.3403)	Entropy 0.53855 (0.53884)	Top-1 acc 68.750 (67.630)	Top-5 acc 87.891 (86.514)	lr 0.00094
Train [106][350/3239]	Time 0.235 (0.538)	Data Time 0.001 (0.109)	Loss 2.2459 (2.3415)	Entropy 0.53882 (0.53883)	Top-1 acc 68.359 (67.601)	Top-5 acc 87.109 (86.482)	lr 0.00094
Train [106][360/3239]	Time 0.232 (0.535)	Data Time 0.001 (0.106)	Loss 2.1648 (2.3409)	Entropy 0.53904 (0.53883)	Top-1 acc 73.438 (67.621)	Top-5 acc 87.891 (86.497)	lr 0.00094
Train [106][370/3239]	Time 0.635 (0.674)	Data Time 0.045 (0.104)	Loss 2.4089 (2.3418)	Entropy 0.53932 (0.53884)	Top-1 acc 66.016 (67.602)	Top-5 acc 85.156 (86.483)	lr 0.00094
Train [106][380/3239]	Time 0.275 (0.671)	Data Time 0.002 (0.101)	Loss 2.3295 (2.3403)	Entropy 0.53963 (0.53885)	Top-1 acc 68.750 (67.652)	Top-5 acc 86.719 (86.511)	lr 0.00094
Train [106][390/3239]	Time 0.247 (0.664)	Data Time 0.002 (0.099)	Loss 2.1699 (2.3427)	Entropy 0.53951 (0.53887)	Top-1 acc 69.531 (67.594)	Top-5 acc 89.844 (86.450)	lr 0.00094
Train [106][400/3239]	Time 0.227 (0.659)	Data Time 0.001 (0.096)	Loss 2.3756 (2.3436)	Entropy 0.53971 (0.53889)	Top-1 acc 65.625 (67.582)	Top-5 acc 85.156 (86.428)	lr 0.00094
Train [106][410/3239]	Time 0.225 (0.652)	Data Time 0.001 (0.094)	Loss 2.2970 (2.3438)	Entropy 0.53959 (0.53891)	Top-1 acc 68.359 (67.568)	Top-5 acc 85.938 (86.415)	lr 0.00094
Train [106][420/3239]	Time 0.242 (0.648)	Data Time 0.002 (0.092)	Loss 2.4425 (2.3434)	Entropy 0.53988 (0.53893)	Top-1 acc 69.141 (67.573)	Top-5 acc 86.328 (86.433)	lr 0.00094
Train [106][430/3239]	Time 0.241 (0.645)	Data Time 0.001 (0.090)	Loss 2.3308 (2.3441)	Entropy 0.53996 (0.53895)	Top-1 acc 71.875 (67.565)	Top-5 acc 85.156 (86.433)	lr 0.00093
Train [106][440/3239]	Time 0.314 (0.640)	Data Time 0.001 (0.088)	Loss 2.1473 (2.3437)	Entropy 0.53983 (0.53897)	Top-1 acc 75.781 (67.591)	Top-5 acc 88.672 (86.440)	lr 0.00093
Train [106][450/3239]	Time 0.240 (0.635)	Data Time 0.001 (0.086)	Loss 2.3897 (2.3426)	Entropy 0.53989 (0.53899)	Top-1 acc 67.578 (67.615)	Top-5 acc 85.547 (86.452)	lr 0.00093
Train [106][460/3239]	Time 0.244 (0.630)	Data Time 0.001 (0.084)	Loss 2.3391 (2.3424)	Entropy 0.53946 (0.53901)	Top-1 acc 66.406 (67.604)	Top-5 acc 87.109 (86.453)	lr 0.00093
Train [106][470/3239]	Time 0.271 (0.626)	Data Time 0.001 (0.082)	Loss 2.3031 (2.3416)	Entropy 0.53932 (0.53902)	Top-1 acc 69.531 (67.609)	Top-5 acc 88.281 (86.474)	lr 0.00093
Train [106][480/3239]	Time 0.273 (0.622)	Data Time 0.004 (0.081)	Loss 2.1357 (2.3406)	Entropy 0.53937 (0.53903)	Top-1 acc 70.703 (67.620)	Top-5 acc 90.625 (86.490)	lr 0.00093
Train [106][490/3239]	Time 0.228 (0.619)	Data Time 0.001 (0.079)	Loss 2.3453 (2.3393)	Entropy 0.53963 (0.53904)	Top-1 acc 68.750 (67.658)	Top-5 acc 84.766 (86.502)	lr 0.00093
Train [106][500/3239]	Time 0.234 (0.615)	Data Time 0.001 (0.078)	Loss 2.2648 (2.3381)	Entropy 0.53991 (0.53905)	Top-1 acc 68.359 (67.676)	Top-5 acc 86.328 (86.520)	lr 0.00093
Train [106][510/3239]	Time 0.235 (0.611)	Data Time 0.001 (0.076)	Loss 2.2109 (2.3384)	Entropy 0.53962 (0.53906)	Top-1 acc 71.094 (67.673)	Top-5 acc 87.109 (86.509)	lr 0.00093
Train [106][520/3239]	Time 0.270 (0.608)	Data Time 0.001 (0.075)	Loss 2.4059 (2.3399)	Entropy 0.53983 (0.53907)	Top-1 acc 66.016 (67.639)	Top-5 acc 83.594 (86.484)	lr 0.00093
Train [106][530/3239]	Time 0.393 (0.606)	Data Time 0.001 (0.073)	Loss 2.6177 (2.3402)	Entropy 0.53957 (0.53908)	Top-1 acc 58.984 (67.640)	Top-5 acc 82.812 (86.466)	lr 0.00093
Train [106][540/3239]	Time 0.243 (0.603)	Data Time 0.001 (0.072)	Loss 2.2913 (2.3405)	Entropy 0.53936 (0.53909)	Top-1 acc 69.141 (67.640)	Top-5 acc 87.109 (86.455)	lr 0.00093
Train [106][550/3239]	Time 0.230 (0.600)	Data Time 0.001 (0.071)	Loss 2.4276 (2.3404)	Entropy 0.53933 (0.53910)	Top-1 acc 64.844 (67.641)	Top-5 acc 83.984 (86.454)	lr 0.00093
Train [106][560/3239]	Time 0.245 (0.597)	Data Time 0.001 (0.069)	Loss 2.5230 (2.3416)	Entropy 0.53933 (0.53910)	Top-1 acc 66.016 (67.623)	Top-5 acc 83.594 (86.432)	lr 0.00093
Train [106][570/3239]	Time 0.277 (0.594)	Data Time 0.001 (0.068)	Loss 2.3479 (2.3424)	Entropy 0.53901 (0.53911)	Top-1 acc 69.922 (67.608)	Top-5 acc 85.156 (86.416)	lr 0.00093
Train [106][580/3239]	Time 0.236 (0.591)	Data Time 0.001 (0.067)	Loss 2.2959 (2.3425)	Entropy 0.53916 (0.53910)	Top-1 acc 69.141 (67.612)	Top-5 acc 87.891 (86.426)	lr 0.00093
Train [106][590/3239]	Time 0.247 (0.589)	Data Time 0.001 (0.066)	Loss 2.4562 (2.3425)	Entropy 0.53900 (0.53910)	Top-1 acc 69.141 (67.630)	Top-5 acc 85.156 (86.415)	lr 0.00093
Train [106][600/3239]	Time 0.378 (0.586)	Data Time 0.002 (0.065)	Loss 2.3561 (2.3428)	Entropy 0.53886 (0.53910)	Top-1 acc 66.016 (67.615)	Top-5 acc 84.766 (86.404)	lr 0.00093
Train [106][610/3239]	Time 0.248 (0.584)	Data Time 0.001 (0.064)	Loss 2.5046 (2.3441)	Entropy 0.53860 (0.53910)	Top-1 acc 65.625 (67.591)	Top-5 acc 83.203 (86.380)	lr 0.00093
Train [106][620/3239]	Time 0.243 (0.581)	Data Time 0.001 (0.063)	Loss 2.1976 (2.3429)	Entropy 0.53847 (0.53909)	Top-1 acc 69.531 (67.635)	Top-5 acc 90.234 (86.397)	lr 0.00093
Train [106][630/3239]	Time 0.235 (0.579)	Data Time 0.001 (0.062)	Loss 2.3308 (2.3424)	Entropy 0.53833 (0.53908)	Top-1 acc 71.484 (67.654)	Top-5 acc 86.328 (86.406)	lr 0.00093
Train [106][640/3239]	Time 0.289 (0.577)	Data Time 0.001 (0.061)	Loss 2.2276 (2.3429)	Entropy 0.53820 (0.53907)	Top-1 acc 73.047 (67.633)	Top-5 acc 88.281 (86.405)	lr 0.00093
Train [106][650/3239]	Time 0.248 (0.575)	Data Time 0.001 (0.060)	Loss 2.2409 (2.3426)	Entropy 0.53826 (0.53905)	Top-1 acc 69.531 (67.625)	Top-5 acc 89.062 (86.416)	lr 0.00093
Train [106][660/3239]	Time 0.246 (0.573)	Data Time 0.001 (0.059)	Loss 2.2403 (2.3428)	Entropy 0.53817 (0.53904)	Top-1 acc 69.141 (67.610)	Top-5 acc 87.109 (86.407)	lr 0.00093
Train [106][670/3239]	Time 0.238 (0.571)	Data Time 0.001 (0.058)	Loss 2.4337 (2.3444)	Entropy 0.53824 (0.53903)	Top-1 acc 61.719 (67.573)	Top-5 acc 83.594 (86.376)	lr 0.00093
Train [106][680/3239]	Time 0.255 (0.569)	Data Time 0.001 (0.057)	Loss 2.2220 (2.3456)	Entropy 0.53819 (0.53901)	Top-1 acc 68.750 (67.541)	Top-5 acc 85.938 (86.353)	lr 0.00093
Train [106][690/3239]	Time 0.376 (0.567)	Data Time 0.001 (0.057)	Loss 2.3349 (2.3452)	Entropy 0.53797 (0.53900)	Top-1 acc 69.922 (67.550)	Top-5 acc 85.547 (86.352)	lr 0.00093
Train [106][700/3239]	Time 0.222 (0.565)	Data Time 0.001 (0.056)	Loss 2.6379 (2.3459)	Entropy 0.53787 (0.53898)	Top-1 acc 57.422 (67.529)	Top-5 acc 81.641 (86.345)	lr 0.00092
Train [106][710/3239]	Time 0.278 (0.563)	Data Time 0.027 (0.055)	Loss 2.3543 (2.3464)	Entropy 0.53767 (0.53897)	Top-1 acc 64.453 (67.524)	Top-5 acc 85.938 (86.337)	lr 0.00092
Train [106][720/3239]	Time 0.231 (0.561)	Data Time 0.001 (0.054)	Loss 2.3694 (2.3470)	Entropy 0.53752 (0.53895)	Top-1 acc 69.922 (67.525)	Top-5 acc 85.547 (86.324)	lr 0.00092
Train [106][730/3239]	Time 0.234 (0.559)	Data Time 0.001 (0.054)	Loss 2.3782 (2.3470)	Entropy 0.53705 (0.53893)	Top-1 acc 67.188 (67.521)	Top-5 acc 84.766 (86.322)	lr 0.00092
Train [106][740/3239]	Time 0.239 (0.557)	Data Time 0.001 (0.053)	Loss 2.3443 (2.3471)	Entropy 0.53746 (0.53890)	Top-1 acc 68.750 (67.511)	Top-5 acc 85.938 (86.324)	lr 0.00092
Train [106][750/3239]	Time 0.239 (0.555)	Data Time 0.001 (0.052)	Loss 2.1773 (2.3471)	Entropy 0.53723 (0.53888)	Top-1 acc 73.828 (67.525)	Top-5 acc 90.625 (86.320)	lr 0.00092
Train [106][760/3239]	Time 0.344 (0.554)	Data Time 0.001 (0.052)	Loss 2.4169 (2.3477)	Entropy 0.53728 (0.53886)	Top-1 acc 62.109 (67.492)	Top-5 acc 86.719 (86.312)	lr 0.00092
Train [106][770/3239]	Time 0.241 (0.552)	Data Time 0.001 (0.051)	Loss 2.3763 (2.3485)	Entropy 0.53722 (0.53884)	Top-1 acc 67.578 (67.475)	Top-5 acc 86.719 (86.295)	lr 0.00092
Train [106][780/3239]	Time 0.235 (0.550)	Data Time 0.001 (0.050)	Loss 2.4689 (2.3489)	Entropy 0.53744 (0.53882)	Top-1 acc 67.969 (67.470)	Top-5 acc 83.594 (86.292)	lr 0.00092
Train [106][790/3239]	Time 0.254 (0.549)	Data Time 0.001 (0.050)	Loss 2.6511 (2.3488)	Entropy 0.53753 (0.53881)	Top-1 acc 58.203 (67.477)	Top-5 acc 83.984 (86.296)	lr 0.00092
Train [106][800/3239]	Time 0.235 (0.547)	Data Time 0.001 (0.049)	Loss 2.2730 (2.3482)	Entropy 0.53768 (0.53879)	Top-1 acc 71.484 (67.498)	Top-5 acc 87.891 (86.298)	lr 0.00092
Train [106][810/3239]	Time 0.261 (0.546)	Data Time 0.001 (0.049)	Loss 2.2659 (2.3482)	Entropy 0.53779 (0.53878)	Top-1 acc 70.312 (67.489)	Top-5 acc 88.281 (86.302)	lr 0.00092
Train [106][820/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.048)	Loss 2.2250 (2.3478)	Entropy 0.53756 (0.53876)	Top-1 acc 69.531 (67.494)	Top-5 acc 86.719 (86.308)	lr 0.00092
Train [106][830/3239]	Time 0.274 (0.543)	Data Time 0.003 (0.047)	Loss 2.2990 (2.3471)	Entropy 0.53780 (0.53875)	Top-1 acc 72.266 (67.524)	Top-5 acc 86.719 (86.317)	lr 0.00092
Train [106][840/3239]	Time 0.232 (0.542)	Data Time 0.001 (0.047)	Loss 2.4720 (2.3474)	Entropy 0.53780 (0.53874)	Top-1 acc 64.844 (67.515)	Top-5 acc 84.766 (86.311)	lr 0.00092
Train [106][850/3239]	Time 0.275 (0.541)	Data Time 0.002 (0.046)	Loss 2.6496 (2.3483)	Entropy 0.53788 (0.53873)	Top-1 acc 57.812 (67.487)	Top-5 acc 78.516 (86.294)	lr 0.00092
Train [106][860/3239]	Time 0.221 (0.540)	Data Time 0.001 (0.046)	Loss 2.3980 (2.3481)	Entropy 0.53747 (0.53871)	Top-1 acc 66.797 (67.493)	Top-5 acc 86.328 (86.300)	lr 0.00092
Train [106][870/3239]	Time 0.225 (0.538)	Data Time 0.001 (0.045)	Loss 2.3168 (2.3477)	Entropy 0.53785 (0.53870)	Top-1 acc 71.875 (67.512)	Top-5 acc 85.938 (86.311)	lr 0.00092
Train [106][880/3239]	Time 0.249 (0.537)	Data Time 0.001 (0.045)	Loss 2.2355 (2.3475)	Entropy 0.53803 (0.53869)	Top-1 acc 70.703 (67.527)	Top-5 acc 89.453 (86.313)	lr 0.00092
Train [106][890/3239]	Time 0.231 (0.535)	Data Time 0.001 (0.044)	Loss 2.2882 (2.3470)	Entropy 0.53789 (0.53869)	Top-1 acc 68.750 (67.545)	Top-5 acc 87.891 (86.324)	lr 0.00092
Train [106][900/3239]	Time 0.233 (0.534)	Data Time 0.001 (0.044)	Loss 2.5851 (2.3474)	Entropy 0.53813 (0.53868)	Top-1 acc 62.891 (67.534)	Top-5 acc 83.594 (86.320)	lr 0.00092
Train [106][910/3239]	Time 0.238 (0.533)	Data Time 0.001 (0.043)	Loss 2.3220 (2.3477)	Entropy 0.53800 (0.53867)	Top-1 acc 67.578 (67.525)	Top-5 acc 86.328 (86.314)	lr 0.00092
Train [106][920/3239]	Time 0.346 (0.531)	Data Time 0.001 (0.043)	Loss 2.3310 (2.3473)	Entropy 0.53821 (0.53866)	Top-1 acc 63.672 (67.533)	Top-5 acc 88.281 (86.327)	lr 0.00092
Train [106][930/3239]	Time 0.224 (0.530)	Data Time 0.001 (0.043)	Loss 2.2891 (2.3471)	Entropy 0.53774 (0.53866)	Top-1 acc 71.875 (67.538)	Top-5 acc 85.547 (86.327)	lr 0.00092
Train [106][940/3239]	Time 0.230 (0.528)	Data Time 0.001 (0.042)	Loss 2.3810 (2.3474)	Entropy 0.53782 (0.53865)	Top-1 acc 66.016 (67.522)	Top-5 acc 85.938 (86.327)	lr 0.00092
Train [106][950/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.042)	Loss 2.3696 (2.3475)	Entropy 0.53811 (0.53864)	Top-1 acc 66.406 (67.530)	Top-5 acc 85.547 (86.323)	lr 0.00092
Train [106][960/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.041)	Loss 2.1714 (2.3469)	Entropy 0.53815 (0.53864)	Top-1 acc 68.750 (67.535)	Top-5 acc 90.625 (86.336)	lr 0.00091
Train [106][970/3239]	Time 0.268 (0.524)	Data Time 0.001 (0.041)	Loss 2.5237 (2.3467)	Entropy 0.53828 (0.53863)	Top-1 acc 63.281 (67.546)	Top-5 acc 83.984 (86.339)	lr 0.00091
Train [106][980/3239]	Time 0.225 (0.523)	Data Time 0.001 (0.040)	Loss 2.2225 (2.3465)	Entropy 0.53797 (0.53863)	Top-1 acc 65.625 (67.548)	Top-5 acc 89.844 (86.336)	lr 0.00091
Train [106][990/3239]	Time 0.315 (0.522)	Data Time 0.001 (0.040)	Loss 2.3974 (2.3469)	Entropy 0.53788 (0.53862)	Top-1 acc 64.844 (67.526)	Top-5 acc 82.812 (86.330)	lr 0.00091
Train [106][1000/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.040)	Loss 2.1580 (2.3470)	Entropy 0.53770 (0.53861)	Top-1 acc 73.438 (67.526)	Top-5 acc 89.062 (86.321)	lr 0.00091
Train [106][1010/3239]	Time 0.266 (0.519)	Data Time 0.001 (0.039)	Loss 2.6060 (2.3471)	Entropy 0.53782 (0.53860)	Top-1 acc 58.594 (67.514)	Top-5 acc 81.641 (86.316)	lr 0.00091
Train [106][1020/3239]	Time 0.224 (0.519)	Data Time 0.001 (0.039)	Loss 2.3926 (2.3477)	Entropy 0.53787 (0.53859)	Top-1 acc 64.062 (67.505)	Top-5 acc 86.719 (86.307)	lr 0.00091
Train [106][1030/3239]	Time 0.345 (0.570)	Data Time 0.003 (0.039)	Loss 2.2842 (2.3479)	Entropy 0.53801 (0.53859)	Top-1 acc 67.578 (67.493)	Top-5 acc 87.109 (86.311)	lr 0.00091
Train [106][1040/3239]	Time 0.234 (0.569)	Data Time 0.002 (0.038)	Loss 2.4506 (2.3492)	Entropy 0.53822 (0.53858)	Top-1 acc 65.234 (67.461)	Top-5 acc 83.984 (86.280)	lr 0.00091
Train [106][1050/3239]	Time 0.239 (0.568)	Data Time 0.001 (0.038)	Loss 2.2675 (2.3486)	Entropy 0.53837 (0.53858)	Top-1 acc 71.484 (67.474)	Top-5 acc 88.281 (86.290)	lr 0.00091
Train [106][1060/3239]	Time 0.233 (0.566)	Data Time 0.001 (0.038)	Loss 2.4252 (2.3482)	Entropy 0.53852 (0.53858)	Top-1 acc 65.625 (67.484)	Top-5 acc 86.328 (86.300)	lr 0.00091
Train [106][1070/3239]	Time 0.228 (0.565)	Data Time 0.001 (0.037)	Loss 2.2688 (2.3484)	Entropy 0.53860 (0.53858)	Top-1 acc 70.703 (67.472)	Top-5 acc 87.891 (86.304)	lr 0.00091
Train [106][1080/3239]	Time 0.324 (0.563)	Data Time 0.001 (0.037)	Loss 2.3327 (2.3484)	Entropy 0.53873 (0.53858)	Top-1 acc 64.844 (67.473)	Top-5 acc 84.766 (86.306)	lr 0.00091
Train [106][1090/3239]	Time 0.222 (0.562)	Data Time 0.001 (0.037)	Loss 2.2912 (2.3487)	Entropy 0.53895 (0.53858)	Top-1 acc 71.484 (67.462)	Top-5 acc 88.672 (86.300)	lr 0.00091
Train [106][1100/3239]	Time 0.251 (0.561)	Data Time 0.001 (0.036)	Loss 2.3482 (2.3485)	Entropy 0.53867 (0.53859)	Top-1 acc 66.797 (67.468)	Top-5 acc 86.719 (86.305)	lr 0.00091
Train [106][1110/3239]	Time 0.240 (0.560)	Data Time 0.001 (0.036)	Loss 2.2627 (2.3482)	Entropy 0.53864 (0.53859)	Top-1 acc 73.047 (67.483)	Top-5 acc 88.672 (86.307)	lr 0.00091
Train [106][1120/3239]	Time 0.237 (0.558)	Data Time 0.001 (0.036)	Loss 2.2537 (2.3478)	Entropy 0.53823 (0.53858)	Top-1 acc 69.531 (67.493)	Top-5 acc 89.844 (86.315)	lr 0.00091
Train [106][1130/3239]	Time 0.237 (0.557)	Data Time 0.001 (0.035)	Loss 2.3935 (2.3482)	Entropy 0.53764 (0.53858)	Top-1 acc 65.234 (67.479)	Top-5 acc 87.109 (86.312)	lr 0.00091
Train [106][1140/3239]	Time 0.267 (0.556)	Data Time 0.001 (0.035)	Loss 2.4041 (2.3491)	Entropy 0.53789 (0.53857)	Top-1 acc 67.969 (67.457)	Top-5 acc 84.766 (86.291)	lr 0.00091
Train [106][1150/3239]	Time 0.338 (0.556)	Data Time 0.001 (0.035)	Loss 2.5477 (2.3488)	Entropy 0.53800 (0.53857)	Top-1 acc 63.672 (67.465)	Top-5 acc 83.984 (86.299)	lr 0.00091
Train [106][1160/3239]	Time 0.229 (0.554)	Data Time 0.001 (0.034)	Loss 2.2448 (2.3489)	Entropy 0.53809 (0.53856)	Top-1 acc 67.969 (67.462)	Top-5 acc 89.062 (86.296)	lr 0.00091
Train [106][1170/3239]	Time 0.236 (0.553)	Data Time 0.001 (0.034)	Loss 2.3756 (2.3487)	Entropy 0.53811 (0.53856)	Top-1 acc 69.141 (67.469)	Top-5 acc 85.156 (86.298)	lr 0.00091
Train [106][1180/3239]	Time 0.225 (0.552)	Data Time 0.001 (0.034)	Loss 2.5536 (2.3491)	Entropy 0.53784 (0.53855)	Top-1 acc 65.234 (67.460)	Top-5 acc 83.594 (86.292)	lr 0.00091
Train [106][1190/3239]	Time 0.240 (0.551)	Data Time 0.001 (0.034)	Loss 2.3203 (2.3491)	Entropy 0.53778 (0.53855)	Top-1 acc 68.359 (67.458)	Top-5 acc 85.547 (86.293)	lr 0.00091
Train [106][1200/3239]	Time 0.234 (0.550)	Data Time 0.001 (0.033)	Loss 2.4730 (2.3492)	Entropy 0.53791 (0.53854)	Top-1 acc 59.375 (67.450)	Top-5 acc 85.938 (86.285)	lr 0.00091
Train [106][1210/3239]	Time 0.232 (0.549)	Data Time 0.001 (0.033)	Loss 2.2357 (2.3490)	Entropy 0.53770 (0.53854)	Top-1 acc 67.578 (67.459)	Top-5 acc 89.844 (86.290)	lr 0.00091
Train [106][1220/3239]	Time 0.234 (0.548)	Data Time 0.001 (0.033)	Loss 2.4238 (2.3496)	Entropy 0.53762 (0.53853)	Top-1 acc 64.453 (67.446)	Top-5 acc 84.766 (86.283)	lr 0.00090
Train [106][1230/3239]	Time 0.231 (0.546)	Data Time 0.001 (0.033)	Loss 2.2267 (2.3493)	Entropy 0.53744 (0.53852)	Top-1 acc 68.359 (67.454)	Top-5 acc 88.281 (86.288)	lr 0.00090
Train [106][1240/3239]	Time 0.328 (0.545)	Data Time 0.001 (0.032)	Loss 2.2285 (2.3492)	Entropy 0.53762 (0.53851)	Top-1 acc 68.750 (67.454)	Top-5 acc 87.500 (86.292)	lr 0.00090
Train [106][1250/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.032)	Loss 2.4271 (2.3492)	Entropy 0.53740 (0.53851)	Top-1 acc 69.922 (67.462)	Top-5 acc 86.328 (86.293)	lr 0.00090
Train [106][1260/3239]	Time 0.230 (0.543)	Data Time 0.001 (0.032)	Loss 2.2697 (2.3493)	Entropy 0.53715 (0.53850)	Top-1 acc 66.016 (67.452)	Top-5 acc 90.625 (86.291)	lr 0.00090
Train [106][1270/3239]	Time 0.225 (0.542)	Data Time 0.001 (0.032)	Loss 2.2611 (2.3494)	Entropy 0.53728 (0.53849)	Top-1 acc 69.531 (67.442)	Top-5 acc 90.234 (86.292)	lr 0.00090
Train [106][1280/3239]	Time 0.215 (0.541)	Data Time 0.001 (0.031)	Loss 2.5022 (2.3495)	Entropy 0.53717 (0.53848)	Top-1 acc 62.500 (67.435)	Top-5 acc 85.156 (86.290)	lr 0.00090
Train [106][1290/3239]	Time 0.251 (0.540)	Data Time 0.001 (0.031)	Loss 2.2415 (2.3497)	Entropy 0.53727 (0.53847)	Top-1 acc 70.703 (67.426)	Top-5 acc 87.500 (86.282)	lr 0.00090
Train [106][1300/3239]	Time 0.221 (0.539)	Data Time 0.001 (0.031)	Loss 2.5356 (2.3496)	Entropy 0.53748 (0.53846)	Top-1 acc 61.719 (67.434)	Top-5 acc 80.859 (86.282)	lr 0.00090
Train [106][1310/3239]	Time 0.310 (0.538)	Data Time 0.001 (0.031)	Loss 2.1998 (2.3497)	Entropy 0.53735 (0.53845)	Top-1 acc 71.875 (67.430)	Top-5 acc 89.062 (86.283)	lr 0.00090
Train [106][1320/3239]	Time 0.235 (0.537)	Data Time 0.001 (0.031)	Loss 2.4404 (2.3497)	Entropy 0.53729 (0.53844)	Top-1 acc 61.328 (67.428)	Top-5 acc 85.156 (86.283)	lr 0.00090
Train [106][1330/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.030)	Loss 2.3437 (2.3492)	Entropy 0.53748 (0.53844)	Top-1 acc 67.969 (67.440)	Top-5 acc 83.984 (86.292)	lr 0.00090
Train [106][1340/3239]	Time 0.236 (0.536)	Data Time 0.001 (0.030)	Loss 2.1788 (2.3489)	Entropy 0.53756 (0.53843)	Top-1 acc 70.312 (67.443)	Top-5 acc 89.453 (86.293)	lr 0.00090
Train [106][1350/3239]	Time 0.236 (0.535)	Data Time 0.001 (0.030)	Loss 2.2175 (2.3485)	Entropy 0.53737 (0.53842)	Top-1 acc 73.828 (67.458)	Top-5 acc 87.109 (86.302)	lr 0.00090
Train [106][1360/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.030)	Loss 2.3272 (2.3487)	Entropy 0.53750 (0.53841)	Top-1 acc 68.359 (67.456)	Top-5 acc 87.109 (86.298)	lr 0.00090
Train [106][1370/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.029)	Loss 2.2681 (2.3481)	Entropy 0.53748 (0.53841)	Top-1 acc 69.922 (67.470)	Top-5 acc 86.719 (86.311)	lr 0.00090
Train [106][1380/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.029)	Loss 2.5533 (2.3482)	Entropy 0.53793 (0.53840)	Top-1 acc 64.062 (67.467)	Top-5 acc 82.422 (86.313)	lr 0.00090
Train [106][1390/3239]	Time 0.238 (0.531)	Data Time 0.001 (0.029)	Loss 2.3203 (2.3481)	Entropy 0.53756 (0.53840)	Top-1 acc 67.188 (67.466)	Top-5 acc 85.938 (86.314)	lr 0.00090
Train [106][1400/3239]	Time 0.243 (0.530)	Data Time 0.001 (0.029)	Loss 2.1863 (2.3480)	Entropy 0.53712 (0.53839)	Top-1 acc 76.562 (67.477)	Top-5 acc 87.891 (86.315)	lr 0.00090
Train [106][1410/3239]	Time 0.237 (0.530)	Data Time 0.001 (0.029)	Loss 2.2079 (2.3478)	Entropy 0.53709 (0.53838)	Top-1 acc 67.578 (67.486)	Top-5 acc 89.062 (86.314)	lr 0.00090
Train [106][1420/3239]	Time 0.233 (0.529)	Data Time 0.001 (0.028)	Loss 2.3688 (2.3477)	Entropy 0.53735 (0.53837)	Top-1 acc 66.016 (67.488)	Top-5 acc 85.938 (86.320)	lr 0.00090
Train [106][1430/3239]	Time 0.230 (0.528)	Data Time 0.001 (0.028)	Loss 2.4307 (2.3478)	Entropy 0.53746 (0.53837)	Top-1 acc 66.406 (67.491)	Top-5 acc 85.156 (86.322)	lr 0.00090
Train [106][1440/3239]	Time 0.237 (0.527)	Data Time 0.001 (0.028)	Loss 2.2994 (2.3480)	Entropy 0.53699 (0.53836)	Top-1 acc 68.750 (67.484)	Top-5 acc 87.109 (86.323)	lr 0.00090
Train [106][1450/3239]	Time 0.261 (0.526)	Data Time 0.001 (0.028)	Loss 2.4347 (2.3482)	Entropy 0.53677 (0.53835)	Top-1 acc 68.750 (67.484)	Top-5 acc 85.156 (86.317)	lr 0.00090
Train [106][1460/3239]	Time 0.221 (0.525)	Data Time 0.001 (0.028)	Loss 2.4265 (2.3485)	Entropy 0.53691 (0.53834)	Top-1 acc 63.281 (67.474)	Top-5 acc 87.109 (86.313)	lr 0.00090
Train [106][1470/3239]	Time 0.321 (0.524)	Data Time 0.001 (0.028)	Loss 2.4610 (2.3484)	Entropy 0.53679 (0.53833)	Top-1 acc 66.016 (67.478)	Top-5 acc 84.375 (86.316)	lr 0.00090
Train [106][1480/3239]	Time 0.225 (0.523)	Data Time 0.001 (0.027)	Loss 2.3825 (2.3484)	Entropy 0.53718 (0.53832)	Top-1 acc 67.969 (67.481)	Top-5 acc 85.156 (86.315)	lr 0.00090
Train [106][1490/3239]	Time 0.228 (0.523)	Data Time 0.002 (0.027)	Loss 2.4125 (2.3485)	Entropy 0.53716 (0.53831)	Top-1 acc 66.406 (67.483)	Top-5 acc 85.547 (86.313)	lr 0.00089
Train [106][1500/3239]	Time 0.225 (0.522)	Data Time 0.001 (0.027)	Loss 2.2562 (2.3486)	Entropy 0.53752 (0.53830)	Top-1 acc 68.359 (67.482)	Top-5 acc 89.453 (86.311)	lr 0.00089
Train [106][1510/3239]	Time 0.215 (0.521)	Data Time 0.001 (0.027)	Loss 2.5478 (2.3485)	Entropy 0.53738 (0.53830)	Top-1 acc 62.109 (67.488)	Top-5 acc 82.812 (86.311)	lr 0.00089
Train [106][1520/3239]	Time 0.228 (0.520)	Data Time 0.001 (0.027)	Loss 2.4313 (2.3485)	Entropy 0.53747 (0.53829)	Top-1 acc 66.797 (67.492)	Top-5 acc 84.375 (86.315)	lr 0.00089
Train [106][1530/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.027)	Loss 2.3062 (2.3487)	Entropy 0.53719 (0.53829)	Top-1 acc 69.141 (67.491)	Top-5 acc 87.500 (86.314)	lr 0.00089
Train [106][1540/3239]	Time 0.318 (0.518)	Data Time 0.001 (0.026)	Loss 2.3150 (2.3491)	Entropy 0.53709 (0.53828)	Top-1 acc 68.750 (67.487)	Top-5 acc 86.328 (86.310)	lr 0.00089
Train [106][1550/3239]	Time 0.224 (0.518)	Data Time 0.001 (0.026)	Loss 2.4079 (2.3495)	Entropy 0.53727 (0.53827)	Top-1 acc 67.969 (67.481)	Top-5 acc 84.766 (86.302)	lr 0.00089
Train [106][1560/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.026)	Loss 2.4573 (2.3496)	Entropy 0.53756 (0.53827)	Top-1 acc 68.359 (67.482)	Top-5 acc 85.938 (86.305)	lr 0.00089
Train [106][1570/3239]	Time 0.224 (0.516)	Data Time 0.001 (0.026)	Loss 2.5166 (2.3498)	Entropy 0.53773 (0.53826)	Top-1 acc 62.109 (67.473)	Top-5 acc 83.203 (86.298)	lr 0.00089
Train [106][1580/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.026)	Loss 2.3133 (2.3497)	Entropy 0.53766 (0.53826)	Top-1 acc 66.797 (67.469)	Top-5 acc 85.938 (86.301)	lr 0.00089
Train [106][1590/3239]	Time 0.224 (0.515)	Data Time 0.001 (0.026)	Loss 2.1486 (2.3495)	Entropy 0.53775 (0.53826)	Top-1 acc 72.656 (67.476)	Top-5 acc 90.625 (86.307)	lr 0.00089
Train [106][1600/3239]	Time 0.252 (0.514)	Data Time 0.001 (0.025)	Loss 2.2964 (2.3495)	Entropy 0.53786 (0.53825)	Top-1 acc 67.969 (67.477)	Top-5 acc 85.938 (86.308)	lr 0.00089
Train [106][1610/3239]	Time 0.246 (0.514)	Data Time 0.001 (0.025)	Loss 2.3100 (2.3497)	Entropy 0.53769 (0.53825)	Top-1 acc 70.703 (67.473)	Top-5 acc 85.938 (86.303)	lr 0.00089
Train [106][1620/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.025)	Loss 2.3896 (2.3496)	Entropy 0.53783 (0.53825)	Top-1 acc 65.625 (67.474)	Top-5 acc 87.109 (86.304)	lr 0.00089
Train [106][1630/3239]	Time 0.320 (0.512)	Data Time 0.001 (0.025)	Loss 2.5355 (2.3500)	Entropy 0.53831 (0.53825)	Top-1 acc 66.797 (67.464)	Top-5 acc 82.031 (86.296)	lr 0.00089
Train [106][1640/3239]	Time 0.232 (0.512)	Data Time 0.001 (0.025)	Loss 2.4415 (2.3501)	Entropy 0.53838 (0.53825)	Top-1 acc 65.625 (67.462)	Top-5 acc 83.594 (86.295)	lr 0.00089
Train [106][1650/3239]	Time 0.251 (0.511)	Data Time 0.001 (0.025)	Loss 2.4312 (2.3499)	Entropy 0.53796 (0.53825)	Top-1 acc 61.719 (67.470)	Top-5 acc 84.375 (86.301)	lr 0.00089
Train [106][1660/3239]	Time 0.288 (0.512)	Data Time 0.002 (0.025)	Loss 2.1552 (2.3499)	Entropy 0.53793 (0.53824)	Top-1 acc 74.219 (67.474)	Top-5 acc 89.062 (86.300)	lr 0.00089
Train [106][1670/3239]	Time 0.233 (0.511)	Data Time 0.002 (0.024)	Loss 2.2889 (2.3502)	Entropy 0.53792 (0.53824)	Top-1 acc 71.484 (67.468)	Top-5 acc 84.766 (86.290)	lr 0.00089
Train [106][1680/3239]	Time 0.292 (0.543)	Data Time 0.004 (0.024)	Loss 2.3372 (2.3503)	Entropy 0.53777 (0.53824)	Top-1 acc 65.234 (67.462)	Top-5 acc 88.672 (86.291)	lr 0.00089
Train [106][1690/3239]	Time 0.231 (0.542)	Data Time 0.002 (0.024)	Loss 2.3962 (2.3504)	Entropy 0.53768 (0.53824)	Top-1 acc 66.797 (67.458)	Top-5 acc 86.328 (86.289)	lr 0.00089
Train [106][1700/3239]	Time 0.324 (0.541)	Data Time 0.001 (0.024)	Loss 2.3892 (2.3508)	Entropy 0.53745 (0.53823)	Top-1 acc 66.797 (67.446)	Top-5 acc 87.109 (86.285)	lr 0.00089
Train [106][1710/3239]	Time 0.235 (0.540)	Data Time 0.001 (0.024)	Loss 2.2383 (2.3509)	Entropy 0.53737 (0.53823)	Top-1 acc 70.703 (67.443)	Top-5 acc 87.891 (86.283)	lr 0.00089
Train [106][1720/3239]	Time 0.236 (0.540)	Data Time 0.001 (0.024)	Loss 2.2338 (2.3511)	Entropy 0.53754 (0.53822)	Top-1 acc 68.750 (67.436)	Top-5 acc 86.719 (86.282)	lr 0.00089
Train [106][1730/3239]	Time 0.234 (0.539)	Data Time 0.001 (0.024)	Loss 2.5630 (2.3515)	Entropy 0.53763 (0.53822)	Top-1 acc 59.375 (67.421)	Top-5 acc 83.594 (86.282)	lr 0.00089
Train [106][1740/3239]	Time 0.230 (0.538)	Data Time 0.001 (0.024)	Loss 2.7555 (2.3519)	Entropy 0.53780 (0.53822)	Top-1 acc 55.859 (67.414)	Top-5 acc 78.906 (86.271)	lr 0.00089
Train [106][1750/3239]	Time 0.245 (0.538)	Data Time 0.001 (0.023)	Loss 2.5179 (2.3520)	Entropy 0.53792 (0.53822)	Top-1 acc 66.016 (67.418)	Top-5 acc 83.594 (86.269)	lr 0.00089
Train [106][1760/3239]	Time 0.236 (0.537)	Data Time 0.001 (0.023)	Loss 2.2636 (2.3520)	Entropy 0.53760 (0.53821)	Top-1 acc 67.578 (67.414)	Top-5 acc 85.547 (86.264)	lr 0.00088
Train [106][1770/3239]	Time 0.229 (0.536)	Data Time 0.001 (0.023)	Loss 2.9257 (2.3522)	Entropy 0.53747 (0.53821)	Top-1 acc 51.953 (67.410)	Top-5 acc 76.562 (86.257)	lr 0.00088
Train [106][1780/3239]	Time 0.234 (0.536)	Data Time 0.001 (0.023)	Loss 2.2188 (2.3523)	Entropy 0.53761 (0.53821)	Top-1 acc 68.750 (67.404)	Top-5 acc 89.062 (86.252)	lr 0.00088
Train [106][1790/3239]	Time 0.329 (0.535)	Data Time 0.001 (0.023)	Loss 2.3532 (2.3522)	Entropy 0.53751 (0.53820)	Top-1 acc 67.969 (67.407)	Top-5 acc 86.719 (86.252)	lr 0.00088
Train [106][1800/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.023)	Loss 2.2461 (2.3523)	Entropy 0.53751 (0.53820)	Top-1 acc 67.969 (67.405)	Top-5 acc 86.719 (86.253)	lr 0.00088
Train [106][1810/3239]	Time 0.292 (0.534)	Data Time 0.003 (0.023)	Loss 2.3714 (2.3522)	Entropy 0.53745 (0.53819)	Top-1 acc 66.016 (67.401)	Top-5 acc 87.891 (86.255)	lr 0.00088
Train [106][1820/3239]	Time 0.275 (0.534)	Data Time 0.001 (0.023)	Loss 2.2710 (2.3519)	Entropy 0.53753 (0.53819)	Top-1 acc 67.969 (67.410)	Top-5 acc 87.109 (86.258)	lr 0.00088
Train [106][1830/3239]	Time 0.226 (0.533)	Data Time 0.001 (0.022)	Loss 2.3742 (2.3522)	Entropy 0.53766 (0.53819)	Top-1 acc 63.672 (67.398)	Top-5 acc 85.938 (86.249)	lr 0.00088
Train [106][1840/3239]	Time 0.264 (0.533)	Data Time 0.001 (0.022)	Loss 2.2275 (2.3526)	Entropy 0.53775 (0.53819)	Top-1 acc 69.531 (67.389)	Top-5 acc 87.500 (86.244)	lr 0.00088
Train [106][1850/3239]	Time 0.228 (0.532)	Data Time 0.001 (0.022)	Loss 2.3120 (2.3527)	Entropy 0.53788 (0.53818)	Top-1 acc 72.656 (67.393)	Top-5 acc 88.281 (86.245)	lr 0.00088
Train [106][1860/3239]	Time 0.326 (0.531)	Data Time 0.001 (0.022)	Loss 2.3082 (2.3528)	Entropy 0.53807 (0.53818)	Top-1 acc 70.703 (67.391)	Top-5 acc 88.281 (86.241)	lr 0.00088
Train [106][1870/3239]	Time 0.229 (0.531)	Data Time 0.001 (0.022)	Loss 2.3572 (2.3528)	Entropy 0.53810 (0.53818)	Top-1 acc 67.188 (67.390)	Top-5 acc 86.719 (86.243)	lr 0.00088
Train [106][1880/3239]	Time 0.236 (0.530)	Data Time 0.001 (0.022)	Loss 2.3447 (2.3528)	Entropy 0.53826 (0.53818)	Top-1 acc 63.281 (67.388)	Top-5 acc 85.547 (86.243)	lr 0.00088
Train [106][1890/3239]	Time 0.224 (0.529)	Data Time 0.001 (0.022)	Loss 2.6544 (2.3529)	Entropy 0.53830 (0.53818)	Top-1 acc 58.203 (67.388)	Top-5 acc 82.422 (86.242)	lr 0.00088
Train [106][1900/3239]	Time 0.255 (0.529)	Data Time 0.001 (0.022)	Loss 2.5116 (2.3529)	Entropy 0.53835 (0.53818)	Top-1 acc 62.500 (67.390)	Top-5 acc 83.984 (86.242)	lr 0.00088
Train [106][1910/3239]	Time 0.224 (0.528)	Data Time 0.001 (0.022)	Loss 2.5242 (2.3530)	Entropy 0.53852 (0.53818)	Top-1 acc 63.672 (67.392)	Top-5 acc 81.250 (86.242)	lr 0.00088
Train [106][1920/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.021)	Loss 2.1085 (2.3528)	Entropy 0.53853 (0.53818)	Top-1 acc 69.922 (67.399)	Top-5 acc 91.797 (86.249)	lr 0.00088
Train [106][1930/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.021)	Loss 2.5377 (2.3528)	Entropy 0.53826 (0.53819)	Top-1 acc 65.234 (67.401)	Top-5 acc 82.422 (86.252)	lr 0.00088
Train [106][1940/3239]	Time 0.298 (0.527)	Data Time 0.001 (0.021)	Loss 2.3688 (2.3527)	Entropy 0.53838 (0.53819)	Top-1 acc 65.625 (67.405)	Top-5 acc 85.938 (86.253)	lr 0.00088
Train [106][1950/3239]	Time 0.460 (0.526)	Data Time 0.001 (0.021)	Loss 2.4634 (2.3530)	Entropy 0.53836 (0.53819)	Top-1 acc 66.406 (67.400)	Top-5 acc 85.938 (86.249)	lr 0.00088
Train [106][1960/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.021)	Loss 2.2906 (2.3526)	Entropy 0.53790 (0.53819)	Top-1 acc 71.484 (67.407)	Top-5 acc 87.500 (86.255)	lr 0.00088
Train [106][1970/3239]	Time 0.227 (0.526)	Data Time 0.001 (0.021)	Loss 2.3174 (2.3530)	Entropy 0.53801 (0.53819)	Top-1 acc 69.141 (67.402)	Top-5 acc 87.500 (86.248)	lr 0.00088
Train [106][1980/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.021)	Loss 2.4660 (2.3533)	Entropy 0.53760 (0.53819)	Top-1 acc 62.500 (67.397)	Top-5 acc 83.984 (86.238)	lr 0.00088
Train [106][1990/3239]	Time 0.247 (0.524)	Data Time 0.001 (0.021)	Loss 2.2413 (2.3532)	Entropy 0.53743 (0.53818)	Top-1 acc 70.703 (67.396)	Top-5 acc 88.672 (86.241)	lr 0.00088
Train [106][2000/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.021)	Loss 2.4423 (2.3533)	Entropy 0.53705 (0.53818)	Top-1 acc 64.062 (67.394)	Top-5 acc 84.766 (86.237)	lr 0.00088
Train [106][2010/3239]	Time 0.234 (0.523)	Data Time 0.001 (0.021)	Loss 2.2771 (2.3535)	Entropy 0.53697 (0.53817)	Top-1 acc 71.094 (67.389)	Top-5 acc 88.281 (86.235)	lr 0.00088
Train [106][2020/3239]	Time 0.324 (0.523)	Data Time 0.001 (0.020)	Loss 2.0787 (2.3538)	Entropy 0.53719 (0.53817)	Top-1 acc 74.219 (67.380)	Top-5 acc 90.625 (86.230)	lr 0.00087
Train [106][2030/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.020)	Loss 2.5172 (2.3541)	Entropy 0.53700 (0.53816)	Top-1 acc 61.719 (67.368)	Top-5 acc 84.766 (86.229)	lr 0.00087
Train [106][2040/3239]	Time 0.221 (0.521)	Data Time 0.001 (0.020)	Loss 2.5380 (2.3541)	Entropy 0.53728 (0.53816)	Top-1 acc 64.453 (67.368)	Top-5 acc 84.375 (86.227)	lr 0.00087
Train [106][2050/3239]	Time 0.226 (0.521)	Data Time 0.001 (0.020)	Loss 2.3021 (2.3542)	Entropy 0.53738 (0.53815)	Top-1 acc 67.188 (67.370)	Top-5 acc 88.672 (86.225)	lr 0.00087
Train [106][2060/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.020)	Loss 2.3225 (2.3540)	Entropy 0.53747 (0.53815)	Top-1 acc 68.750 (67.371)	Top-5 acc 86.719 (86.228)	lr 0.00087
Train [106][2070/3239]	Time 0.234 (0.520)	Data Time 0.001 (0.020)	Loss 2.2250 (2.3537)	Entropy 0.53742 (0.53815)	Top-1 acc 69.531 (67.379)	Top-5 acc 87.891 (86.234)	lr 0.00087
Train [106][2080/3239]	Time 0.222 (0.519)	Data Time 0.001 (0.020)	Loss 2.2984 (2.3535)	Entropy 0.53742 (0.53814)	Top-1 acc 64.844 (67.386)	Top-5 acc 87.891 (86.235)	lr 0.00087
Train [106][2090/3239]	Time 0.314 (0.519)	Data Time 0.001 (0.020)	Loss 2.4046 (2.3536)	Entropy 0.53760 (0.53814)	Top-1 acc 65.234 (67.385)	Top-5 acc 86.328 (86.234)	lr 0.00087
Train [106][2100/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.020)	Loss 2.2643 (2.3533)	Entropy 0.53779 (0.53814)	Top-1 acc 69.922 (67.393)	Top-5 acc 87.891 (86.239)	lr 0.00087
Train [106][2110/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.020)	Loss 2.2492 (2.3530)	Entropy 0.53788 (0.53814)	Top-1 acc 70.703 (67.398)	Top-5 acc 86.719 (86.246)	lr 0.00087
Train [106][2120/3239]	Time 0.224 (0.517)	Data Time 0.001 (0.020)	Loss 2.3370 (2.3532)	Entropy 0.53776 (0.53813)	Top-1 acc 67.578 (67.390)	Top-5 acc 86.719 (86.243)	lr 0.00087
Train [106][2130/3239]	Time 0.226 (0.516)	Data Time 0.001 (0.019)	Loss 2.3494 (2.3532)	Entropy 0.53756 (0.53813)	Top-1 acc 65.234 (67.388)	Top-5 acc 87.500 (86.240)	lr 0.00087
Train [106][2140/3239]	Time 0.226 (0.516)	Data Time 0.001 (0.019)	Loss 2.3429 (2.3532)	Entropy 0.53764 (0.53813)	Top-1 acc 66.797 (67.391)	Top-5 acc 85.156 (86.236)	lr 0.00087
Train [106][2150/3239]	Time 0.239 (0.515)	Data Time 0.001 (0.019)	Loss 2.1903 (2.3535)	Entropy 0.53713 (0.53813)	Top-1 acc 70.703 (67.389)	Top-5 acc 88.281 (86.233)	lr 0.00087
Train [106][2160/3239]	Time 0.270 (0.515)	Data Time 0.001 (0.019)	Loss 2.5379 (2.3535)	Entropy 0.53693 (0.53812)	Top-1 acc 60.547 (67.384)	Top-5 acc 82.422 (86.231)	lr 0.00087
Train [106][2170/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.019)	Loss 2.3324 (2.3536)	Entropy 0.53707 (0.53812)	Top-1 acc 66.406 (67.382)	Top-5 acc 85.156 (86.229)	lr 0.00087
Train [106][2180/3239]	Time 0.333 (0.514)	Data Time 0.001 (0.019)	Loss 2.7426 (2.3536)	Entropy 0.53721 (0.53811)	Top-1 acc 54.688 (67.381)	Top-5 acc 76.953 (86.228)	lr 0.00087
Train [106][2190/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.019)	Loss 2.3221 (2.3537)	Entropy 0.53723 (0.53811)	Top-1 acc 66.797 (67.375)	Top-5 acc 87.500 (86.227)	lr 0.00087
Train [106][2200/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.019)	Loss 2.4688 (2.3538)	Entropy 0.53748 (0.53810)	Top-1 acc 65.625 (67.378)	Top-5 acc 85.156 (86.226)	lr 0.00087
Train [106][2210/3239]	Time 0.224 (0.513)	Data Time 0.001 (0.019)	Loss 2.1976 (2.3535)	Entropy 0.53738 (0.53810)	Top-1 acc 72.656 (67.387)	Top-5 acc 88.672 (86.231)	lr 0.00087
Train [106][2220/3239]	Time 0.272 (0.512)	Data Time 0.001 (0.019)	Loss 2.3392 (2.3536)	Entropy 0.53753 (0.53810)	Top-1 acc 68.750 (67.383)	Top-5 acc 87.891 (86.232)	lr 0.00087
Train [106][2230/3239]	Time 0.225 (0.512)	Data Time 0.001 (0.019)	Loss 2.4306 (2.3537)	Entropy 0.53761 (0.53810)	Top-1 acc 67.969 (67.384)	Top-5 acc 83.594 (86.232)	lr 0.00087
Train [106][2240/3239]	Time 0.224 (0.511)	Data Time 0.001 (0.019)	Loss 2.4518 (2.3538)	Entropy 0.53764 (0.53809)	Top-1 acc 63.672 (67.382)	Top-5 acc 83.203 (86.231)	lr 0.00087
Train [106][2250/3239]	Time 0.323 (0.511)	Data Time 0.001 (0.019)	Loss 2.3949 (2.3540)	Entropy 0.53742 (0.53809)	Top-1 acc 66.797 (67.376)	Top-5 acc 83.203 (86.225)	lr 0.00087
Train [106][2260/3239]	Time 0.243 (0.510)	Data Time 0.001 (0.018)	Loss 2.2637 (2.3542)	Entropy 0.53724 (0.53809)	Top-1 acc 71.875 (67.372)	Top-5 acc 87.500 (86.223)	lr 0.00087
Train [106][2270/3239]	Time 0.232 (0.510)	Data Time 0.001 (0.018)	Loss 2.2575 (2.3540)	Entropy 0.53729 (0.53808)	Top-1 acc 71.094 (67.380)	Top-5 acc 87.109 (86.229)	lr 0.00087
Train [106][2280/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.018)	Loss 2.3167 (2.3541)	Entropy 0.53757 (0.53808)	Top-1 acc 69.922 (67.377)	Top-5 acc 86.719 (86.228)	lr 0.00087
Train [106][2290/3239]	Time 0.235 (0.509)	Data Time 0.001 (0.018)	Loss 2.2269 (2.3539)	Entropy 0.53777 (0.53808)	Top-1 acc 70.312 (67.381)	Top-5 acc 87.891 (86.233)	lr 0.00086
Train [106][2300/3239]	Time 0.229 (0.509)	Data Time 0.001 (0.018)	Loss 2.3756 (2.3539)	Entropy 0.53790 (0.53808)	Top-1 acc 65.625 (67.376)	Top-5 acc 83.203 (86.229)	lr 0.00086
Train [106][2310/3239]	Time 0.227 (0.508)	Data Time 0.001 (0.018)	Loss 2.3844 (2.3538)	Entropy 0.53793 (0.53808)	Top-1 acc 66.406 (67.379)	Top-5 acc 88.281 (86.232)	lr 0.00086
Train [106][2320/3239]	Time 0.277 (0.508)	Data Time 0.001 (0.018)	Loss 2.5663 (2.3539)	Entropy 0.53787 (0.53808)	Top-1 acc 65.625 (67.373)	Top-5 acc 83.594 (86.230)	lr 0.00086
Train [106][2330/3239]	Time 0.224 (0.507)	Data Time 0.001 (0.018)	Loss 2.3251 (2.3539)	Entropy 0.53783 (0.53808)	Top-1 acc 66.797 (67.374)	Top-5 acc 86.719 (86.231)	lr 0.00086
Train [106][2340/3239]	Time 0.447 (0.530)	Data Time 0.029 (0.018)	Loss 2.5775 (2.3540)	Entropy 0.53789 (0.53807)	Top-1 acc 62.891 (67.371)	Top-5 acc 83.594 (86.232)	lr 0.00086
Train [106][2350/3239]	Time 0.267 (0.530)	Data Time 0.002 (0.018)	Loss 2.2710 (2.3537)	Entropy 0.53791 (0.53807)	Top-1 acc 69.531 (67.378)	Top-5 acc 86.328 (86.239)	lr 0.00086
Train [106][2360/3239]	Time 0.246 (0.529)	Data Time 0.002 (0.018)	Loss 2.3522 (2.3536)	Entropy 0.53781 (0.53807)	Top-1 acc 67.188 (67.381)	Top-5 acc 84.375 (86.236)	lr 0.00086
Train [106][2370/3239]	Time 0.247 (0.529)	Data Time 0.001 (0.018)	Loss 2.3538 (2.3537)	Entropy 0.53782 (0.53807)	Top-1 acc 70.312 (67.383)	Top-5 acc 85.156 (86.232)	lr 0.00086
Train [106][2380/3239]	Time 0.252 (0.528)	Data Time 0.002 (0.018)	Loss 2.4687 (2.3539)	Entropy 0.53794 (0.53807)	Top-1 acc 63.281 (67.377)	Top-5 acc 83.594 (86.225)	lr 0.00086
Train [106][2390/3239]	Time 0.246 (0.528)	Data Time 0.001 (0.018)	Loss 2.4160 (2.3539)	Entropy 0.53816 (0.53807)	Top-1 acc 66.016 (67.373)	Top-5 acc 85.547 (86.226)	lr 0.00086
Train [106][2400/3239]	Time 0.244 (0.527)	Data Time 0.001 (0.018)	Loss 2.2934 (2.3542)	Entropy 0.53853 (0.53807)	Top-1 acc 67.578 (67.364)	Top-5 acc 87.891 (86.223)	lr 0.00086
Train [106][2410/3239]	Time 0.347 (0.527)	Data Time 0.001 (0.017)	Loss 2.7242 (2.3544)	Entropy 0.53868 (0.53807)	Top-1 acc 56.250 (67.362)	Top-5 acc 80.859 (86.223)	lr 0.00086
Train [106][2420/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.017)	Loss 2.6486 (2.3547)	Entropy 0.53890 (0.53808)	Top-1 acc 62.109 (67.356)	Top-5 acc 80.859 (86.216)	lr 0.00086
Train [106][2430/3239]	Time 0.227 (0.526)	Data Time 0.001 (0.017)	Loss 2.4051 (2.3545)	Entropy 0.53873 (0.53808)	Top-1 acc 67.578 (67.357)	Top-5 acc 84.375 (86.217)	lr 0.00086
Train [106][2440/3239]	Time 0.255 (0.526)	Data Time 0.001 (0.017)	Loss 2.4177 (2.3550)	Entropy 0.53849 (0.53808)	Top-1 acc 64.453 (67.348)	Top-5 acc 85.156 (86.212)	lr 0.00086
Train [106][2450/3239]	Time 0.287 (0.526)	Data Time 0.002 (0.017)	Loss 2.3969 (2.3549)	Entropy 0.53869 (0.53808)	Top-1 acc 66.406 (67.352)	Top-5 acc 88.672 (86.216)	lr 0.00086
Train [106][2460/3239]	Time 0.238 (0.526)	Data Time 0.001 (0.017)	Loss 2.3219 (2.3550)	Entropy 0.53831 (0.53809)	Top-1 acc 67.188 (67.351)	Top-5 acc 87.891 (86.216)	lr 0.00086
Train [106][2470/3239]	Time 0.263 (0.525)	Data Time 0.001 (0.017)	Loss 2.2961 (2.3549)	Entropy 0.53832 (0.53809)	Top-1 acc 67.578 (67.349)	Top-5 acc 89.453 (86.216)	lr 0.00086
Train [106][2480/3239]	Time 0.242 (0.525)	Data Time 0.001 (0.017)	Loss 2.4397 (2.3549)	Entropy 0.53858 (0.53809)	Top-1 acc 65.234 (67.346)	Top-5 acc 84.766 (86.219)	lr 0.00086
Train [106][2490/3239]	Time 0.228 (0.525)	Data Time 0.001 (0.017)	Loss 2.6169 (2.3550)	Entropy 0.53877 (0.53809)	Top-1 acc 62.500 (67.349)	Top-5 acc 81.641 (86.215)	lr 0.00086
Train [106][2500/3239]	Time 0.274 (0.524)	Data Time 0.001 (0.017)	Loss 2.2933 (2.3549)	Entropy 0.53875 (0.53809)	Top-1 acc 68.359 (67.349)	Top-5 acc 89.844 (86.216)	lr 0.00086
Train [106][2510/3239]	Time 0.259 (0.524)	Data Time 0.001 (0.017)	Loss 2.3481 (2.3548)	Entropy 0.53874 (0.53810)	Top-1 acc 68.359 (67.349)	Top-5 acc 88.281 (86.221)	lr 0.00086
Train [106][2520/3239]	Time 0.244 (0.523)	Data Time 0.001 (0.017)	Loss 2.2225 (2.3545)	Entropy 0.53881 (0.53810)	Top-1 acc 68.750 (67.353)	Top-5 acc 89.844 (86.224)	lr 0.00086
Train [106][2530/3239]	Time 0.237 (0.523)	Data Time 0.001 (0.017)	Loss 2.3101 (2.3545)	Entropy 0.53878 (0.53810)	Top-1 acc 66.797 (67.355)	Top-5 acc 88.281 (86.224)	lr 0.00086
Train [106][2540/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.017)	Loss 2.5389 (2.3545)	Entropy 0.53894 (0.53810)	Top-1 acc 65.625 (67.356)	Top-5 acc 82.422 (86.226)	lr 0.00086
Train [106][2550/3239]	Time 0.277 (0.522)	Data Time 0.002 (0.017)	Loss 2.4496 (2.3547)	Entropy 0.53880 (0.53811)	Top-1 acc 65.625 (67.352)	Top-5 acc 85.156 (86.223)	lr 0.00086
Train [106][2560/3239]	Time 0.250 (0.522)	Data Time 0.001 (0.017)	Loss 2.2905 (2.3546)	Entropy 0.53881 (0.53811)	Top-1 acc 69.141 (67.355)	Top-5 acc 86.328 (86.223)	lr 0.00086
Train [106][2570/3239]	Time 0.316 (0.521)	Data Time 0.001 (0.016)	Loss 2.4567 (2.3545)	Entropy 0.53888 (0.53811)	Top-1 acc 63.281 (67.355)	Top-5 acc 85.547 (86.226)	lr 0.00085
Train [106][2580/3239]	Time 0.236 (0.521)	Data Time 0.001 (0.016)	Loss 2.0937 (2.3541)	Entropy 0.53866 (0.53812)	Top-1 acc 77.734 (67.367)	Top-5 acc 91.406 (86.232)	lr 0.00085
Train [106][2590/3239]	Time 0.229 (0.520)	Data Time 0.001 (0.016)	Loss 2.4194 (2.3542)	Entropy 0.53899 (0.53812)	Top-1 acc 68.750 (67.369)	Top-5 acc 86.328 (86.234)	lr 0.00085
Train [106][2600/3239]	Time 0.231 (0.520)	Data Time 0.001 (0.016)	Loss 2.5554 (2.3542)	Entropy 0.53932 (0.53812)	Top-1 acc 60.938 (67.368)	Top-5 acc 83.984 (86.233)	lr 0.00085
Train [106][2610/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.016)	Loss 2.3225 (2.3540)	Entropy 0.53929 (0.53813)	Top-1 acc 67.969 (67.375)	Top-5 acc 86.328 (86.234)	lr 0.00085
Train [106][2620/3239]	Time 0.240 (0.519)	Data Time 0.001 (0.016)	Loss 2.4226 (2.3542)	Entropy 0.53933 (0.53813)	Top-1 acc 66.797 (67.367)	Top-5 acc 83.594 (86.231)	lr 0.00085
Train [106][2630/3239]	Time 0.236 (0.519)	Data Time 0.001 (0.016)	Loss 2.2543 (2.3543)	Entropy 0.53875 (0.53814)	Top-1 acc 66.797 (67.367)	Top-5 acc 88.672 (86.229)	lr 0.00085
Train [106][2640/3239]	Time 0.358 (0.519)	Data Time 0.001 (0.016)	Loss 2.1943 (2.3545)	Entropy 0.53841 (0.53814)	Top-1 acc 72.266 (67.362)	Top-5 acc 90.234 (86.226)	lr 0.00085
Train [106][2650/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.016)	Loss 2.3509 (2.3548)	Entropy 0.53827 (0.53814)	Top-1 acc 70.703 (67.356)	Top-5 acc 83.203 (86.218)	lr 0.00085
Train [106][2660/3239]	Time 0.237 (0.518)	Data Time 0.001 (0.016)	Loss 2.3062 (2.3546)	Entropy 0.53851 (0.53814)	Top-1 acc 67.578 (67.361)	Top-5 acc 86.328 (86.219)	lr 0.00085
Train [106][2670/3239]	Time 0.230 (0.518)	Data Time 0.001 (0.016)	Loss 2.4378 (2.3546)	Entropy 0.53813 (0.53814)	Top-1 acc 65.625 (67.364)	Top-5 acc 84.766 (86.220)	lr 0.00085
Train [106][2680/3239]	Time 0.229 (0.517)	Data Time 0.001 (0.016)	Loss 2.1748 (2.3544)	Entropy 0.53780 (0.53814)	Top-1 acc 73.047 (67.368)	Top-5 acc 87.891 (86.224)	lr 0.00085
Train [106][2690/3239]	Time 0.218 (0.517)	Data Time 0.001 (0.016)	Loss 2.4465 (2.3544)	Entropy 0.53798 (0.53814)	Top-1 acc 64.844 (67.369)	Top-5 acc 84.375 (86.221)	lr 0.00085
Train [106][2700/3239]	Time 0.217 (0.516)	Data Time 0.001 (0.016)	Loss 2.4322 (2.3543)	Entropy 0.53780 (0.53814)	Top-1 acc 67.188 (67.373)	Top-5 acc 85.547 (86.223)	lr 0.00085
Train [106][2710/3239]	Time 0.254 (0.516)	Data Time 0.024 (0.016)	Loss 2.3286 (2.3544)	Entropy 0.53797 (0.53814)	Top-1 acc 69.922 (67.372)	Top-5 acc 85.156 (86.218)	lr 0.00085
Train [106][2720/3239]	Time 0.254 (0.516)	Data Time 0.001 (0.016)	Loss 2.2108 (2.3546)	Entropy 0.53818 (0.53814)	Top-1 acc 70.312 (67.366)	Top-5 acc 88.672 (86.215)	lr 0.00085
Train [106][2730/3239]	Time 0.330 (0.515)	Data Time 0.001 (0.016)	Loss 2.4026 (2.3546)	Entropy 0.53789 (0.53814)	Top-1 acc 65.234 (67.365)	Top-5 acc 83.203 (86.217)	lr 0.00085
Train [106][2740/3239]	Time 0.257 (0.515)	Data Time 0.001 (0.016)	Loss 2.3079 (2.3543)	Entropy 0.53780 (0.53814)	Top-1 acc 68.750 (67.372)	Top-5 acc 87.109 (86.219)	lr 0.00085
Train [106][2750/3239]	Time 0.227 (0.515)	Data Time 0.001 (0.015)	Loss 2.3946 (2.3545)	Entropy 0.53778 (0.53813)	Top-1 acc 66.406 (67.370)	Top-5 acc 86.328 (86.214)	lr 0.00085
Train [106][2760/3239]	Time 0.226 (0.514)	Data Time 0.001 (0.015)	Loss 2.7212 (2.3546)	Entropy 0.53790 (0.53813)	Top-1 acc 59.375 (67.371)	Top-5 acc 78.906 (86.209)	lr 0.00085
Train [106][2770/3239]	Time 0.345 (0.515)	Data Time 0.002 (0.015)	Loss 2.3577 (2.3546)	Entropy 0.53797 (0.53813)	Top-1 acc 66.797 (67.370)	Top-5 acc 84.766 (86.207)	lr 0.00085
Train [106][2780/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.015)	Loss 2.4197 (2.3544)	Entropy 0.53788 (0.53813)	Top-1 acc 65.234 (67.376)	Top-5 acc 83.984 (86.212)	lr 0.00085
Train [106][2790/3239]	Time 0.232 (0.514)	Data Time 0.001 (0.015)	Loss 2.6230 (2.3544)	Entropy 0.53806 (0.53813)	Top-1 acc 60.156 (67.379)	Top-5 acc 83.203 (86.213)	lr 0.00085
Train [106][2800/3239]	Time 0.324 (0.514)	Data Time 0.001 (0.015)	Loss 2.2473 (2.3547)	Entropy 0.53813 (0.53813)	Top-1 acc 70.312 (67.373)	Top-5 acc 87.109 (86.210)	lr 0.00085
Train [106][2810/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.015)	Loss 2.5022 (2.3547)	Entropy 0.53803 (0.53813)	Top-1 acc 60.547 (67.373)	Top-5 acc 84.375 (86.210)	lr 0.00085
Train [106][2820/3239]	Time 0.232 (0.513)	Data Time 0.001 (0.015)	Loss 2.3214 (2.3548)	Entropy 0.53819 (0.53813)	Top-1 acc 66.797 (67.371)	Top-5 acc 87.109 (86.209)	lr 0.00085
Train [106][2830/3239]	Time 0.246 (0.513)	Data Time 0.001 (0.015)	Loss 2.3851 (2.3547)	Entropy 0.53802 (0.53813)	Top-1 acc 66.016 (67.370)	Top-5 acc 85.156 (86.209)	lr 0.00085
Train [106][2840/3239]	Time 0.242 (0.512)	Data Time 0.001 (0.015)	Loss 2.4644 (2.3547)	Entropy 0.53788 (0.53813)	Top-1 acc 64.453 (67.371)	Top-5 acc 83.984 (86.209)	lr 0.00084
Train [106][2850/3239]	Time 0.282 (0.512)	Data Time 0.001 (0.015)	Loss 2.3480 (2.3550)	Entropy 0.53755 (0.53813)	Top-1 acc 69.141 (67.369)	Top-5 acc 85.547 (86.202)	lr 0.00084
Train [106][2860/3239]	Time 0.229 (0.512)	Data Time 0.001 (0.015)	Loss 2.4411 (2.3550)	Entropy 0.53766 (0.53813)	Top-1 acc 67.188 (67.372)	Top-5 acc 83.203 (86.201)	lr 0.00084
Train [106][2870/3239]	Time 0.235 (0.511)	Data Time 0.001 (0.015)	Loss 2.3728 (2.3552)	Entropy 0.53728 (0.53813)	Top-1 acc 67.578 (67.362)	Top-5 acc 85.938 (86.197)	lr 0.00084
Train [106][2880/3239]	Time 0.226 (0.511)	Data Time 0.001 (0.015)	Loss 2.2906 (2.3549)	Entropy 0.53729 (0.53812)	Top-1 acc 66.406 (67.369)	Top-5 acc 87.891 (86.202)	lr 0.00084
Train [106][2890/3239]	Time 0.315 (0.511)	Data Time 0.001 (0.015)	Loss 2.3889 (2.3547)	Entropy 0.53748 (0.53812)	Top-1 acc 67.578 (67.373)	Top-5 acc 84.375 (86.205)	lr 0.00084
Train [106][2900/3239]	Time 0.234 (0.510)	Data Time 0.001 (0.015)	Loss 2.2182 (2.3546)	Entropy 0.53761 (0.53812)	Top-1 acc 69.922 (67.371)	Top-5 acc 89.062 (86.208)	lr 0.00084
Train [106][2910/3239]	Time 0.262 (0.510)	Data Time 0.001 (0.015)	Loss 2.2683 (2.3547)	Entropy 0.53751 (0.53812)	Top-1 acc 69.141 (67.373)	Top-5 acc 86.328 (86.207)	lr 0.00084
Train [106][2920/3239]	Time 0.249 (0.510)	Data Time 0.001 (0.015)	Loss 2.3541 (2.3549)	Entropy 0.53786 (0.53811)	Top-1 acc 65.234 (67.366)	Top-5 acc 87.109 (86.201)	lr 0.00084
Train [106][2930/3239]	Time 0.230 (0.509)	Data Time 0.001 (0.015)	Loss 2.4153 (2.3550)	Entropy 0.53783 (0.53811)	Top-1 acc 67.969 (67.367)	Top-5 acc 84.766 (86.197)	lr 0.00084
Train [106][2940/3239]	Time 0.255 (0.509)	Data Time 0.001 (0.015)	Loss 2.3363 (2.3551)	Entropy 0.53794 (0.53811)	Top-1 acc 66.797 (67.362)	Top-5 acc 87.109 (86.194)	lr 0.00084
Train [106][2950/3239]	Time 0.242 (0.509)	Data Time 0.001 (0.015)	Loss 2.2496 (2.3552)	Entropy 0.53821 (0.53811)	Top-1 acc 69.922 (67.361)	Top-5 acc 88.672 (86.191)	lr 0.00084
Train [106][2960/3239]	Time 0.385 (0.508)	Data Time 0.001 (0.015)	Loss 2.2822 (2.3552)	Entropy 0.53834 (0.53811)	Top-1 acc 66.797 (67.358)	Top-5 acc 88.672 (86.193)	lr 0.00084
Train [106][2970/3239]	Time 0.243 (0.508)	Data Time 0.001 (0.014)	Loss 2.2342 (2.3552)	Entropy 0.53852 (0.53811)	Top-1 acc 71.875 (67.355)	Top-5 acc 89.453 (86.195)	lr 0.00084
Train [106][2980/3239]	Time 0.225 (0.508)	Data Time 0.001 (0.014)	Loss 2.5358 (2.3552)	Entropy 0.53845 (0.53812)	Top-1 acc 62.109 (67.354)	Top-5 acc 83.203 (86.196)	lr 0.00084
Train [106][2990/3239]	Time 0.297 (0.525)	Data Time 0.029 (0.014)	Loss 2.4005 (2.3554)	Entropy 0.53861 (0.53812)	Top-1 acc 64.844 (67.350)	Top-5 acc 87.500 (86.192)	lr 0.00084
Train [106][3000/3239]	Time 0.246 (0.525)	Data Time 0.002 (0.014)	Loss 2.1596 (2.3551)	Entropy 0.53870 (0.53812)	Top-1 acc 71.875 (67.357)	Top-5 acc 90.234 (86.199)	lr 0.00084
Train [106][3010/3239]	Time 0.263 (0.524)	Data Time 0.002 (0.014)	Loss 2.5857 (2.3555)	Entropy 0.53840 (0.53812)	Top-1 acc 64.453 (67.347)	Top-5 acc 82.031 (86.190)	lr 0.00084
Train [106][3020/3239]	Time 0.235 (0.524)	Data Time 0.001 (0.014)	Loss 2.3785 (2.3556)	Entropy 0.53832 (0.53812)	Top-1 acc 62.891 (67.346)	Top-5 acc 84.766 (86.187)	lr 0.00084
Train [106][3030/3239]	Time 0.260 (0.524)	Data Time 0.001 (0.014)	Loss 2.5674 (2.3556)	Entropy 0.53808 (0.53812)	Top-1 acc 60.156 (67.345)	Top-5 acc 83.984 (86.188)	lr 0.00084
Train [106][3040/3239]	Time 0.258 (0.523)	Data Time 0.003 (0.014)	Loss 2.3522 (2.3558)	Entropy 0.53782 (0.53812)	Top-1 acc 67.969 (67.341)	Top-5 acc 83.984 (86.185)	lr 0.00084
Train [106][3050/3239]	Time 0.334 (0.523)	Data Time 0.001 (0.014)	Loss 2.3123 (2.3557)	Entropy 0.53780 (0.53812)	Top-1 acc 67.188 (67.338)	Top-5 acc 85.938 (86.186)	lr 0.00084
Train [106][3060/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.014)	Loss 2.2912 (2.3558)	Entropy 0.53775 (0.53812)	Top-1 acc 67.578 (67.336)	Top-5 acc 87.109 (86.184)	lr 0.00084
Train [106][3070/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.014)	Loss 2.3106 (2.3558)	Entropy 0.53792 (0.53812)	Top-1 acc 70.312 (67.338)	Top-5 acc 86.328 (86.183)	lr 0.00084
Train [106][3080/3239]	Time 0.289 (0.522)	Data Time 0.001 (0.014)	Loss 2.5106 (2.3560)	Entropy 0.53807 (0.53812)	Top-1 acc 68.750 (67.333)	Top-5 acc 82.812 (86.178)	lr 0.00084
Train [106][3090/3239]	Time 0.270 (0.522)	Data Time 0.001 (0.014)	Loss 2.2258 (2.3562)	Entropy 0.53793 (0.53812)	Top-1 acc 67.969 (67.326)	Top-5 acc 89.844 (86.175)	lr 0.00084
Train [106][3100/3239]	Time 0.242 (0.522)	Data Time 0.001 (0.014)	Loss 2.3987 (2.3562)	Entropy 0.53785 (0.53812)	Top-1 acc 67.578 (67.326)	Top-5 acc 82.422 (86.173)	lr 0.00084
Train [106][3110/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.014)	Loss 2.3413 (2.3562)	Entropy 0.53782 (0.53812)	Top-1 acc 68.750 (67.326)	Top-5 acc 85.156 (86.173)	lr 0.00083
Train [106][3120/3239]	Time 0.357 (0.521)	Data Time 0.001 (0.014)	Loss 2.3538 (2.3564)	Entropy 0.53782 (0.53812)	Top-1 acc 66.797 (67.322)	Top-5 acc 87.500 (86.173)	lr 0.00083
Train [106][3130/3239]	Time 0.236 (0.521)	Data Time 0.001 (0.014)	Loss 2.2585 (2.3564)	Entropy 0.53787 (0.53811)	Top-1 acc 70.703 (67.321)	Top-5 acc 88.672 (86.171)	lr 0.00083
Train [106][3140/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.014)	Loss 2.5239 (2.3565)	Entropy 0.53772 (0.53811)	Top-1 acc 62.891 (67.323)	Top-5 acc 82.812 (86.170)	lr 0.00083
Train [106][3150/3239]	Time 0.238 (0.520)	Data Time 0.001 (0.014)	Loss 2.3785 (2.3567)	Entropy 0.53803 (0.53811)	Top-1 acc 67.188 (67.316)	Top-5 acc 86.719 (86.169)	lr 0.00083
Train [106][3160/3239]	Time 0.240 (0.520)	Data Time 0.001 (0.014)	Loss 2.2613 (2.3567)	Entropy 0.53798 (0.53811)	Top-1 acc 68.359 (67.315)	Top-5 acc 87.500 (86.171)	lr 0.00083
Train [106][3170/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.014)	Loss 2.4246 (2.3569)	Entropy 0.53805 (0.53811)	Top-1 acc 67.578 (67.310)	Top-5 acc 85.938 (86.167)	lr 0.00083
Train [106][3180/3239]	Time 0.230 (0.519)	Data Time 0.000 (0.014)	Loss 2.2755 (2.3568)	Entropy 0.53803 (0.53811)	Top-1 acc 67.188 (67.310)	Top-5 acc 87.891 (86.169)	lr 0.00083
Train [106][3190/3239]	Time 0.231 (0.519)	Data Time 0.000 (0.014)	Loss 2.5456 (2.3567)	Entropy 0.53802 (0.53811)	Top-1 acc 65.625 (67.313)	Top-5 acc 80.469 (86.171)	lr 0.00083
Train [106][3200/3239]	Time 0.222 (0.518)	Data Time 0.000 (0.014)	Loss 2.4274 (2.3565)	Entropy 0.53804 (0.53811)	Top-1 acc 67.578 (67.314)	Top-5 acc 83.984 (86.174)	lr 0.00083
Train [106][3210/3239]	Time 0.228 (0.518)	Data Time 0.000 (0.014)	Loss 2.4177 (2.3566)	Entropy 0.53763 (0.53811)	Top-1 acc 66.016 (67.311)	Top-5 acc 84.375 (86.173)	lr 0.00083
Train [106][3220/3239]	Time 0.224 (0.517)	Data Time 0.000 (0.013)	Loss 2.5748 (2.3567)	Entropy 0.53745 (0.53811)	Top-1 acc 65.234 (67.309)	Top-5 acc 81.641 (86.173)	lr 0.00083
Train [106][3230/3239]	Time 0.231 (0.517)	Data Time 0.000 (0.013)	Loss 2.2326 (2.3568)	Entropy 0.53743 (0.53811)	Top-1 acc 71.875 (67.306)	Top-5 acc 89.453 (86.170)	lr 0.00083
Train [106][3239/3239]	Time 0.955 (0.517)	Data Time 0.000 (0.013)	Loss 2.6614 (2.3569)	Entropy 0.53778 (0.53810)	Top-1 acc 56.790 (67.304)	Top-5 acc 80.247 (86.169)	lr 0.00083
==========Valid [106/120]	loss 1.181	top-1 acc 72.893 (72.893)	top-5 acc 90.501	Train top-1 67.304	top-5 86.169	Entropy 0.53778	Latency-None: 0.000ms	Flops: 539.00M
Train [107][0/3239]	Time 39.127 (39.127)	Data Time 37.889 (37.889)	Loss 2.3921 (2.3921)	Entropy 0.53785 (0.53785)	Top-1 acc 66.797 (66.797)	Top-5 acc 85.156 (85.156)	lr 0.00083
Train [107][10/3239]	Time 0.246 (4.032)	Data Time 0.002 (3.446)	Loss 2.2644 (2.3674)	Entropy 0.53795 (0.53797)	Top-1 acc 72.266 (67.472)	Top-5 acc 86.719 (86.044)	lr 0.00083
Train [107][20/3239]	Time 0.345 (2.319)	Data Time 0.001 (1.806)	Loss 2.4310 (2.3703)	Entropy 0.53817 (0.53800)	Top-1 acc 64.844 (66.704)	Top-5 acc 83.984 (86.012)	lr 0.00083
Train [107][30/3239]	Time 0.368 (1.727)	Data Time 0.002 (1.224)	Loss 2.2914 (2.3572)	Entropy 0.53825 (0.53806)	Top-1 acc 72.656 (66.948)	Top-5 acc 87.500 (86.303)	lr 0.00083
Train [107][40/3239]	Time 0.225 (1.414)	Data Time 0.001 (0.926)	Loss 2.3961 (2.3697)	Entropy 0.53837 (0.53812)	Top-1 acc 64.453 (66.702)	Top-5 acc 87.109 (86.119)	lr 0.00083
Train [107][50/3239]	Time 0.224 (1.219)	Data Time 0.001 (0.745)	Loss 2.3135 (2.3701)	Entropy 0.53843 (0.53818)	Top-1 acc 69.531 (66.674)	Top-5 acc 86.719 (86.160)	lr 0.00083
Train [107][60/3239]	Time 0.254 (1.091)	Data Time 0.001 (0.623)	Loss 2.2589 (2.3656)	Entropy 0.53847 (0.53822)	Top-1 acc 69.141 (66.733)	Top-5 acc 85.938 (86.181)	lr 0.00083
Train [107][70/3239]	Time 0.243 (1.014)	Data Time 0.001 (0.535)	Loss 2.3532 (2.3578)	Entropy 0.53833 (0.53825)	Top-1 acc 66.016 (66.885)	Top-5 acc 85.938 (86.361)	lr 0.00083
Train [107][80/3239]	Time 0.244 (0.942)	Data Time 0.001 (0.470)	Loss 2.4412 (2.3543)	Entropy 0.53846 (0.53827)	Top-1 acc 65.625 (67.009)	Top-5 acc 85.547 (86.425)	lr 0.00083
Train [107][90/3239]	Time 0.263 (0.887)	Data Time 0.001 (0.418)	Loss 2.4908 (2.3533)	Entropy 0.53869 (0.53830)	Top-1 acc 66.016 (67.200)	Top-5 acc 85.156 (86.414)	lr 0.00083
Train [107][100/3239]	Time 0.266 (0.841)	Data Time 0.001 (0.377)	Loss 2.4348 (2.3574)	Entropy 0.53896 (0.53834)	Top-1 acc 66.016 (67.122)	Top-5 acc 83.984 (86.317)	lr 0.00083
Train [107][110/3239]	Time 0.330 (0.804)	Data Time 0.001 (0.343)	Loss 2.3456 (2.3569)	Entropy 0.53895 (0.53840)	Top-1 acc 71.094 (67.114)	Top-5 acc 84.375 (86.314)	lr 0.00083
Train [107][120/3239]	Time 0.248 (0.772)	Data Time 0.001 (0.315)	Loss 2.3464 (2.3556)	Entropy 0.53848 (0.53843)	Top-1 acc 66.406 (67.194)	Top-5 acc 86.719 (86.335)	lr 0.00083
Train [107][130/3239]	Time 0.231 (0.744)	Data Time 0.001 (0.291)	Loss 2.5335 (2.3531)	Entropy 0.53832 (0.53844)	Top-1 acc 59.766 (67.161)	Top-5 acc 85.547 (86.388)	lr 0.00083
Train [107][140/3239]	Time 0.249 (0.721)	Data Time 0.001 (0.270)	Loss 2.4042 (2.3531)	Entropy 0.53825 (0.53843)	Top-1 acc 66.797 (67.201)	Top-5 acc 83.203 (86.370)	lr 0.00083
Train [107][150/3239]	Time 0.226 (0.701)	Data Time 0.001 (0.253)	Loss 2.4554 (2.3518)	Entropy 0.53865 (0.53843)	Top-1 acc 64.844 (67.185)	Top-5 acc 83.984 (86.357)	lr 0.00082
Train [107][160/3239]	Time 0.227 (0.682)	Data Time 0.001 (0.237)	Loss 2.3930 (2.3545)	Entropy 0.53818 (0.53843)	Top-1 acc 69.531 (67.107)	Top-5 acc 86.719 (86.323)	lr 0.00082
Train [107][170/3239]	Time 0.243 (0.666)	Data Time 0.001 (0.223)	Loss 2.2299 (2.3513)	Entropy 0.53831 (0.53842)	Top-1 acc 71.484 (67.201)	Top-5 acc 86.328 (86.365)	lr 0.00082
Train [107][180/3239]	Time 0.317 (0.651)	Data Time 0.001 (0.211)	Loss 2.4791 (2.3499)	Entropy 0.53843 (0.53842)	Top-1 acc 64.062 (67.233)	Top-5 acc 84.375 (86.354)	lr 0.00082
Train [107][190/3239]	Time 0.230 (0.637)	Data Time 0.001 (0.200)	Loss 2.1779 (2.3527)	Entropy 0.53802 (0.53841)	Top-1 acc 71.875 (67.165)	Top-5 acc 88.281 (86.299)	lr 0.00082
Train [107][200/3239]	Time 0.228 (0.625)	Data Time 0.001 (0.190)	Loss 2.3090 (2.3524)	Entropy 0.53815 (0.53839)	Top-1 acc 68.359 (67.189)	Top-5 acc 87.500 (86.289)	lr 0.00082
Train [107][210/3239]	Time 0.234 (0.615)	Data Time 0.001 (0.181)	Loss 2.1927 (2.3516)	Entropy 0.53839 (0.53839)	Top-1 acc 70.703 (67.252)	Top-5 acc 90.234 (86.332)	lr 0.00082
Train [107][220/3239]	Time 0.229 (0.606)	Data Time 0.001 (0.173)	Loss 2.3705 (2.3511)	Entropy 0.53804 (0.53838)	Top-1 acc 61.719 (67.242)	Top-5 acc 85.547 (86.353)	lr 0.00082
Train [107][230/3239]	Time 0.228 (0.597)	Data Time 0.001 (0.166)	Loss 2.2712 (2.3483)	Entropy 0.53789 (0.53836)	Top-1 acc 69.141 (67.291)	Top-5 acc 86.328 (86.418)	lr 0.00082
Train [107][240/3239]	Time 0.238 (0.590)	Data Time 0.001 (0.159)	Loss 2.3369 (2.3493)	Entropy 0.53793 (0.53834)	Top-1 acc 72.656 (67.293)	Top-5 acc 86.328 (86.383)	lr 0.00082
Train [107][250/3239]	Time 0.222 (0.583)	Data Time 0.001 (0.153)	Loss 2.2857 (2.3488)	Entropy 0.53800 (0.53833)	Top-1 acc 66.797 (67.298)	Top-5 acc 87.891 (86.381)	lr 0.00082
Train [107][260/3239]	Time 0.264 (0.576)	Data Time 0.001 (0.147)	Loss 2.3629 (2.3473)	Entropy 0.53787 (0.53831)	Top-1 acc 65.234 (67.363)	Top-5 acc 86.719 (86.389)	lr 0.00082
Train [107][270/3239]	Time 0.270 (0.570)	Data Time 0.001 (0.142)	Loss 2.2922 (2.3494)	Entropy 0.53746 (0.53829)	Top-1 acc 67.969 (67.329)	Top-5 acc 85.156 (86.354)	lr 0.00082
Train [107][280/3239]	Time 0.231 (0.565)	Data Time 0.001 (0.137)	Loss 2.4692 (2.3481)	Entropy 0.53740 (0.53825)	Top-1 acc 66.406 (67.358)	Top-5 acc 85.547 (86.382)	lr 0.00082
Train [107][290/3239]	Time 0.261 (0.561)	Data Time 0.001 (0.132)	Loss 2.4301 (2.3479)	Entropy 0.53743 (0.53822)	Top-1 acc 65.625 (67.351)	Top-5 acc 85.938 (86.378)	lr 0.00082
Train [107][300/3239]	Time 0.230 (0.556)	Data Time 0.001 (0.128)	Loss 2.3869 (2.3466)	Entropy 0.53730 (0.53819)	Top-1 acc 68.359 (67.382)	Top-5 acc 86.719 (86.431)	lr 0.00082
Train [107][310/3239]	Time 0.227 (0.551)	Data Time 0.001 (0.123)	Loss 2.3363 (2.3482)	Entropy 0.53743 (0.53817)	Top-1 acc 68.750 (67.353)	Top-5 acc 87.891 (86.381)	lr 0.00082
Train [107][320/3239]	Time 0.258 (0.547)	Data Time 0.002 (0.120)	Loss 2.1639 (2.3478)	Entropy 0.53755 (0.53814)	Top-1 acc 71.094 (67.388)	Top-5 acc 88.672 (86.384)	lr 0.00082
Train [107][330/3239]	Time 0.236 (0.543)	Data Time 0.001 (0.116)	Loss 2.3614 (2.3497)	Entropy 0.53762 (0.53813)	Top-1 acc 70.703 (67.385)	Top-5 acc 85.938 (86.343)	lr 0.00082
Train [107][340/3239]	Time 0.353 (0.540)	Data Time 0.001 (0.113)	Loss 2.2628 (2.3506)	Entropy 0.53735 (0.53811)	Top-1 acc 68.750 (67.362)	Top-5 acc 87.500 (86.344)	lr 0.00082
Train [107][350/3239]	Time 0.244 (0.536)	Data Time 0.004 (0.110)	Loss 2.3122 (2.3521)	Entropy 0.53717 (0.53809)	Top-1 acc 68.750 (67.334)	Top-5 acc 86.719 (86.321)	lr 0.00082
Train [107][360/3239]	Time 0.228 (0.533)	Data Time 0.001 (0.107)	Loss 2.1318 (2.3522)	Entropy 0.53730 (0.53806)	Top-1 acc 74.609 (67.360)	Top-5 acc 91.016 (86.325)	lr 0.00082
Train [107][370/3239]	Time 0.258 (0.530)	Data Time 0.002 (0.104)	Loss 2.3453 (2.3524)	Entropy 0.53732 (0.53804)	Top-1 acc 66.016 (67.372)	Top-5 acc 87.500 (86.345)	lr 0.00082
Train [107][380/3239]	Time 0.263 (0.527)	Data Time 0.001 (0.101)	Loss 2.4285 (2.3514)	Entropy 0.53717 (0.53802)	Top-1 acc 66.797 (67.404)	Top-5 acc 85.156 (86.361)	lr 0.00082
Train [107][390/3239]	Time 0.229 (0.525)	Data Time 0.001 (0.099)	Loss 2.2264 (2.3531)	Entropy 0.53690 (0.53800)	Top-1 acc 71.484 (67.369)	Top-5 acc 85.156 (86.314)	lr 0.00082
Train [107][400/3239]	Time 0.249 (0.522)	Data Time 0.001 (0.096)	Loss 2.3642 (2.3545)	Entropy 0.53695 (0.53797)	Top-1 acc 66.406 (67.327)	Top-5 acc 86.328 (86.286)	lr 0.00082
Train [107][410/3239]	Time 0.334 (0.650)	Data Time 0.002 (0.094)	Loss 2.4703 (2.3532)	Entropy 0.53684 (0.53794)	Top-1 acc 64.453 (67.362)	Top-5 acc 80.859 (86.292)	lr 0.00082
Train [107][420/3239]	Time 0.236 (0.645)	Data Time 0.002 (0.092)	Loss 2.2839 (2.3532)	Entropy 0.53690 (0.53792)	Top-1 acc 66.797 (67.371)	Top-5 acc 86.328 (86.307)	lr 0.00082
Train [107][430/3239]	Time 0.235 (0.639)	Data Time 0.001 (0.090)	Loss 2.2754 (2.3525)	Entropy 0.53697 (0.53790)	Top-1 acc 66.016 (67.383)	Top-5 acc 88.281 (86.305)	lr 0.00081
Train [107][440/3239]	Time 0.245 (0.634)	Data Time 0.002 (0.088)	Loss 2.3387 (2.3530)	Entropy 0.53688 (0.53788)	Top-1 acc 67.969 (67.375)	Top-5 acc 84.766 (86.279)	lr 0.00081
Train [107][450/3239]	Time 0.232 (0.629)	Data Time 0.002 (0.086)	Loss 2.4340 (2.3531)	Entropy 0.53686 (0.53785)	Top-1 acc 66.406 (67.396)	Top-5 acc 85.938 (86.278)	lr 0.00081
Train [107][460/3239]	Time 0.258 (0.625)	Data Time 0.001 (0.084)	Loss 2.3564 (2.3529)	Entropy 0.53692 (0.53783)	Top-1 acc 69.141 (67.400)	Top-5 acc 85.938 (86.285)	lr 0.00081
Train [107][470/3239]	Time 0.242 (0.621)	Data Time 0.001 (0.082)	Loss 2.2233 (2.3544)	Entropy 0.53695 (0.53781)	Top-1 acc 71.484 (67.374)	Top-5 acc 86.719 (86.263)	lr 0.00081
Train [107][480/3239]	Time 0.285 (0.617)	Data Time 0.001 (0.081)	Loss 2.2886 (2.3532)	Entropy 0.53691 (0.53779)	Top-1 acc 71.484 (67.412)	Top-5 acc 86.719 (86.274)	lr 0.00081
Train [107][490/3239]	Time 0.274 (0.613)	Data Time 0.001 (0.079)	Loss 2.4073 (2.3539)	Entropy 0.53702 (0.53778)	Top-1 acc 70.312 (67.390)	Top-5 acc 87.500 (86.267)	lr 0.00081
Train [107][500/3239]	Time 0.340 (0.610)	Data Time 0.001 (0.078)	Loss 2.3236 (2.3554)	Entropy 0.53753 (0.53777)	Top-1 acc 69.531 (67.347)	Top-5 acc 88.281 (86.238)	lr 0.00081
Train [107][510/3239]	Time 0.284 (0.606)	Data Time 0.009 (0.076)	Loss 2.1808 (2.3561)	Entropy 0.53719 (0.53776)	Top-1 acc 74.609 (67.352)	Top-5 acc 90.625 (86.230)	lr 0.00081
Train [107][520/3239]	Time 0.228 (0.603)	Data Time 0.001 (0.075)	Loss 2.1287 (2.3567)	Entropy 0.53743 (0.53775)	Top-1 acc 72.656 (67.334)	Top-5 acc 89.453 (86.213)	lr 0.00081
Train [107][530/3239]	Time 0.242 (0.600)	Data Time 0.001 (0.073)	Loss 2.2201 (2.3562)	Entropy 0.53752 (0.53774)	Top-1 acc 72.656 (67.350)	Top-5 acc 87.891 (86.225)	lr 0.00081
Train [107][540/3239]	Time 0.231 (0.596)	Data Time 0.001 (0.072)	Loss 2.1730 (2.3556)	Entropy 0.53752 (0.53774)	Top-1 acc 73.828 (67.371)	Top-5 acc 89.844 (86.236)	lr 0.00081
Train [107][550/3239]	Time 0.313 (0.595)	Data Time 0.002 (0.071)	Loss 2.3163 (2.3550)	Entropy 0.53709 (0.53773)	Top-1 acc 68.359 (67.378)	Top-5 acc 87.891 (86.247)	lr 0.00081
Train [107][560/3239]	Time 0.239 (0.592)	Data Time 0.001 (0.070)	Loss 2.3049 (2.3554)	Entropy 0.53702 (0.53772)	Top-1 acc 68.359 (67.387)	Top-5 acc 87.109 (86.229)	lr 0.00081
Train [107][570/3239]	Time 0.400 (0.590)	Data Time 0.001 (0.068)	Loss 2.2234 (2.3550)	Entropy 0.53734 (0.53771)	Top-1 acc 70.312 (67.385)	Top-5 acc 87.500 (86.229)	lr 0.00081
Train [107][580/3239]	Time 0.240 (0.587)	Data Time 0.001 (0.067)	Loss 2.2435 (2.3552)	Entropy 0.53703 (0.53770)	Top-1 acc 73.047 (67.395)	Top-5 acc 88.672 (86.231)	lr 0.00081
Train [107][590/3239]	Time 0.232 (0.584)	Data Time 0.001 (0.066)	Loss 2.5916 (2.3558)	Entropy 0.53686 (0.53769)	Top-1 acc 62.109 (67.402)	Top-5 acc 80.078 (86.232)	lr 0.00081
Train [107][600/3239]	Time 0.230 (0.582)	Data Time 0.001 (0.065)	Loss 2.5860 (2.3548)	Entropy 0.53694 (0.53767)	Top-1 acc 59.766 (67.426)	Top-5 acc 84.766 (86.249)	lr 0.00081
Train [107][610/3239]	Time 0.223 (0.579)	Data Time 0.001 (0.064)	Loss 2.2809 (2.3554)	Entropy 0.53698 (0.53766)	Top-1 acc 70.312 (67.406)	Top-5 acc 87.109 (86.242)	lr 0.00081
Train [107][620/3239]	Time 0.290 (0.578)	Data Time 0.001 (0.063)	Loss 2.4142 (2.3553)	Entropy 0.53704 (0.53765)	Top-1 acc 67.578 (67.413)	Top-5 acc 85.938 (86.246)	lr 0.00081
Train [107][630/3239]	Time 0.230 (0.575)	Data Time 0.001 (0.062)	Loss 2.3098 (2.3555)	Entropy 0.53716 (0.53764)	Top-1 acc 69.531 (67.394)	Top-5 acc 86.719 (86.240)	lr 0.00081
Train [107][640/3239]	Time 0.277 (0.573)	Data Time 0.001 (0.061)	Loss 2.3454 (2.3559)	Entropy 0.53742 (0.53763)	Top-1 acc 64.844 (67.377)	Top-5 acc 87.891 (86.228)	lr 0.00081
Train [107][650/3239]	Time 0.232 (0.571)	Data Time 0.001 (0.060)	Loss 2.2688 (2.3566)	Entropy 0.53737 (0.53763)	Top-1 acc 69.141 (67.380)	Top-5 acc 87.109 (86.213)	lr 0.00081
Train [107][660/3239]	Time 0.318 (0.569)	Data Time 0.001 (0.059)	Loss 2.5330 (2.3568)	Entropy 0.53745 (0.53763)	Top-1 acc 65.234 (67.394)	Top-5 acc 83.594 (86.216)	lr 0.00081
Train [107][670/3239]	Time 0.238 (0.566)	Data Time 0.001 (0.058)	Loss 2.5170 (2.3567)	Entropy 0.53717 (0.53762)	Top-1 acc 62.891 (67.382)	Top-5 acc 82.031 (86.225)	lr 0.00081
Train [107][680/3239]	Time 0.234 (0.564)	Data Time 0.001 (0.058)	Loss 2.2567 (2.3566)	Entropy 0.53712 (0.53762)	Top-1 acc 71.875 (67.381)	Top-5 acc 87.891 (86.229)	lr 0.00081
Train [107][690/3239]	Time 0.234 (0.562)	Data Time 0.001 (0.057)	Loss 2.2370 (2.3568)	Entropy 0.53735 (0.53761)	Top-1 acc 71.484 (67.372)	Top-5 acc 87.500 (86.224)	lr 0.00081
Train [107][700/3239]	Time 0.240 (0.560)	Data Time 0.001 (0.056)	Loss 2.4078 (2.3571)	Entropy 0.53747 (0.53761)	Top-1 acc 67.578 (67.355)	Top-5 acc 85.156 (86.212)	lr 0.00081
Train [107][710/3239]	Time 0.234 (0.558)	Data Time 0.001 (0.055)	Loss 2.2691 (2.3574)	Entropy 0.53728 (0.53760)	Top-1 acc 68.750 (67.344)	Top-5 acc 89.062 (86.211)	lr 0.00080
Train [107][720/3239]	Time 0.237 (0.556)	Data Time 0.001 (0.055)	Loss 2.3283 (2.3573)	Entropy 0.53735 (0.53760)	Top-1 acc 64.844 (67.346)	Top-5 acc 85.547 (86.209)	lr 0.00080
Train [107][730/3239]	Time 0.343 (0.554)	Data Time 0.001 (0.054)	Loss 2.2896 (2.3575)	Entropy 0.53726 (0.53759)	Top-1 acc 67.969 (67.337)	Top-5 acc 86.719 (86.203)	lr 0.00080
Train [107][740/3239]	Time 0.231 (0.552)	Data Time 0.001 (0.053)	Loss 2.3490 (2.3582)	Entropy 0.53709 (0.53759)	Top-1 acc 69.531 (67.317)	Top-5 acc 85.938 (86.192)	lr 0.00080
Train [107][750/3239]	Time 0.285 (0.551)	Data Time 0.002 (0.052)	Loss 2.3706 (2.3590)	Entropy 0.53713 (0.53758)	Top-1 acc 67.188 (67.309)	Top-5 acc 86.719 (86.179)	lr 0.00080
Train [107][760/3239]	Time 0.272 (0.550)	Data Time 0.003 (0.052)	Loss 2.5579 (2.3588)	Entropy 0.53723 (0.53758)	Top-1 acc 62.109 (67.309)	Top-5 acc 83.203 (86.173)	lr 0.00080
Train [107][770/3239]	Time 0.233 (0.549)	Data Time 0.001 (0.051)	Loss 2.2355 (2.3585)	Entropy 0.53718 (0.53757)	Top-1 acc 71.094 (67.323)	Top-5 acc 85.938 (86.177)	lr 0.00080
Train [107][780/3239]	Time 0.258 (0.547)	Data Time 0.001 (0.050)	Loss 2.2269 (2.3590)	Entropy 0.53754 (0.53757)	Top-1 acc 71.094 (67.309)	Top-5 acc 86.719 (86.168)	lr 0.00080
Train [107][790/3239]	Time 0.238 (0.545)	Data Time 0.001 (0.050)	Loss 2.2973 (2.3590)	Entropy 0.53764 (0.53757)	Top-1 acc 69.141 (67.313)	Top-5 acc 85.938 (86.170)	lr 0.00080
Train [107][800/3239]	Time 0.256 (0.544)	Data Time 0.001 (0.049)	Loss 2.4451 (2.3586)	Entropy 0.53756 (0.53757)	Top-1 acc 62.500 (67.314)	Top-5 acc 84.375 (86.184)	lr 0.00080
Train [107][810/3239]	Time 0.263 (0.542)	Data Time 0.001 (0.049)	Loss 2.2356 (2.3589)	Entropy 0.53775 (0.53757)	Top-1 acc 68.359 (67.303)	Top-5 acc 90.625 (86.179)	lr 0.00080
Train [107][820/3239]	Time 0.328 (0.541)	Data Time 0.001 (0.048)	Loss 2.3445 (2.3598)	Entropy 0.53748 (0.53757)	Top-1 acc 65.625 (67.274)	Top-5 acc 88.672 (86.166)	lr 0.00080
Train [107][830/3239]	Time 0.230 (0.539)	Data Time 0.001 (0.047)	Loss 2.3390 (2.3591)	Entropy 0.53775 (0.53757)	Top-1 acc 67.188 (67.283)	Top-5 acc 89.062 (86.188)	lr 0.00080
Train [107][840/3239]	Time 0.228 (0.538)	Data Time 0.001 (0.047)	Loss 2.4476 (2.3590)	Entropy 0.53784 (0.53758)	Top-1 acc 62.891 (67.282)	Top-5 acc 85.547 (86.188)	lr 0.00080
Train [107][850/3239]	Time 0.231 (0.536)	Data Time 0.001 (0.046)	Loss 2.7956 (2.3598)	Entropy 0.53754 (0.53758)	Top-1 acc 57.422 (67.255)	Top-5 acc 78.516 (86.173)	lr 0.00080
Train [107][860/3239]	Time 0.236 (0.535)	Data Time 0.001 (0.046)	Loss 2.2434 (2.3589)	Entropy 0.53763 (0.53758)	Top-1 acc 68.359 (67.270)	Top-5 acc 87.500 (86.183)	lr 0.00080
Train [107][870/3239]	Time 0.258 (0.533)	Data Time 0.001 (0.045)	Loss 2.6362 (2.3588)	Entropy 0.53740 (0.53758)	Top-1 acc 58.203 (67.271)	Top-5 acc 81.641 (86.172)	lr 0.00080
Train [107][880/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.045)	Loss 2.3767 (2.3593)	Entropy 0.53773 (0.53758)	Top-1 acc 68.359 (67.258)	Top-5 acc 83.594 (86.169)	lr 0.00080
Train [107][890/3239]	Time 0.348 (0.531)	Data Time 0.001 (0.044)	Loss 2.2860 (2.3587)	Entropy 0.53803 (0.53758)	Top-1 acc 65.625 (67.259)	Top-5 acc 90.625 (86.188)	lr 0.00080
Train [107][900/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.044)	Loss 2.3812 (2.3585)	Entropy 0.53783 (0.53758)	Top-1 acc 69.141 (67.265)	Top-5 acc 86.328 (86.192)	lr 0.00080
Train [107][910/3239]	Time 0.233 (0.528)	Data Time 0.001 (0.043)	Loss 2.3479 (2.3583)	Entropy 0.53753 (0.53759)	Top-1 acc 66.406 (67.277)	Top-5 acc 84.375 (86.198)	lr 0.00080
Train [107][920/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.043)	Loss 2.2391 (2.3581)	Entropy 0.53792 (0.53759)	Top-1 acc 70.312 (67.287)	Top-5 acc 87.891 (86.199)	lr 0.00080
Train [107][930/3239]	Time 0.343 (0.527)	Data Time 0.001 (0.043)	Loss 2.2085 (2.3578)	Entropy 0.53795 (0.53759)	Top-1 acc 72.656 (67.296)	Top-5 acc 87.109 (86.207)	lr 0.00080
Train [107][940/3239]	Time 0.258 (0.528)	Data Time 0.001 (0.042)	Loss 2.3935 (2.3579)	Entropy 0.53790 (0.53759)	Top-1 acc 66.406 (67.297)	Top-5 acc 85.938 (86.214)	lr 0.00080
Train [107][950/3239]	Time 0.239 (0.527)	Data Time 0.001 (0.042)	Loss 2.2976 (2.3576)	Entropy 0.53775 (0.53760)	Top-1 acc 71.094 (67.310)	Top-5 acc 87.500 (86.214)	lr 0.00080
Train [107][960/3239]	Time 0.241 (0.526)	Data Time 0.001 (0.041)	Loss 2.4413 (2.3574)	Entropy 0.53778 (0.53760)	Top-1 acc 62.891 (67.310)	Top-5 acc 85.547 (86.216)	lr 0.00080
Train [107][970/3239]	Time 0.264 (0.525)	Data Time 0.002 (0.041)	Loss 2.3263 (2.3581)	Entropy 0.53771 (0.53760)	Top-1 acc 67.188 (67.297)	Top-5 acc 87.500 (86.204)	lr 0.00080
Train [107][980/3239]	Time 0.228 (0.523)	Data Time 0.001 (0.040)	Loss 2.2100 (2.3574)	Entropy 0.53771 (0.53760)	Top-1 acc 70.312 (67.305)	Top-5 acc 89.844 (86.210)	lr 0.00080
Train [107][990/3239]	Time 0.234 (0.522)	Data Time 0.001 (0.040)	Loss 2.4037 (2.3571)	Entropy 0.53715 (0.53760)	Top-1 acc 65.625 (67.314)	Top-5 acc 84.766 (86.213)	lr 0.00079
Train [107][1000/3239]	Time 0.237 (0.521)	Data Time 0.001 (0.040)	Loss 2.5512 (2.3572)	Entropy 0.53731 (0.53760)	Top-1 acc 62.500 (67.314)	Top-5 acc 81.641 (86.213)	lr 0.00079
Train [107][1010/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.039)	Loss 2.2962 (2.3570)	Entropy 0.53753 (0.53760)	Top-1 acc 69.922 (67.321)	Top-5 acc 86.719 (86.221)	lr 0.00079
Train [107][1020/3239]	Time 0.228 (0.519)	Data Time 0.001 (0.039)	Loss 2.4754 (2.3566)	Entropy 0.53725 (0.53759)	Top-1 acc 64.062 (67.332)	Top-5 acc 83.203 (86.226)	lr 0.00079
Train [107][1030/3239]	Time 0.260 (0.519)	Data Time 0.001 (0.039)	Loss 2.2695 (2.3560)	Entropy 0.53735 (0.53759)	Top-1 acc 74.219 (67.354)	Top-5 acc 83.594 (86.227)	lr 0.00079
Train [107][1040/3239]	Time 0.231 (0.517)	Data Time 0.001 (0.038)	Loss 2.3072 (2.3555)	Entropy 0.53701 (0.53759)	Top-1 acc 69.531 (67.369)	Top-5 acc 85.547 (86.238)	lr 0.00079
Train [107][1050/3239]	Time 0.365 (0.517)	Data Time 0.001 (0.038)	Loss 2.4475 (2.3559)	Entropy 0.53653 (0.53758)	Top-1 acc 66.406 (67.354)	Top-5 acc 83.594 (86.229)	lr 0.00079
Train [107][1060/3239]	Time 0.369 (0.566)	Data Time 0.004 (0.038)	Loss 2.2873 (2.3555)	Entropy 0.53653 (0.53757)	Top-1 acc 68.750 (67.366)	Top-5 acc 87.891 (86.234)	lr 0.00079
Train [107][1070/3239]	Time 0.304 (0.566)	Data Time 0.002 (0.037)	Loss 2.2362 (2.3555)	Entropy 0.53669 (0.53756)	Top-1 acc 69.531 (67.368)	Top-5 acc 89.062 (86.234)	lr 0.00079
Train [107][1080/3239]	Time 0.237 (0.565)	Data Time 0.001 (0.037)	Loss 2.3601 (2.3554)	Entropy 0.53692 (0.53755)	Top-1 acc 68.750 (67.371)	Top-5 acc 87.500 (86.235)	lr 0.00079
Train [107][1090/3239]	Time 0.250 (0.564)	Data Time 0.001 (0.037)	Loss 2.4383 (2.3553)	Entropy 0.53693 (0.53755)	Top-1 acc 64.453 (67.375)	Top-5 acc 84.766 (86.233)	lr 0.00079
Train [107][1100/3239]	Time 0.256 (0.563)	Data Time 0.002 (0.036)	Loss 2.2532 (2.3548)	Entropy 0.53683 (0.53754)	Top-1 acc 68.359 (67.388)	Top-5 acc 87.500 (86.245)	lr 0.00079
Train [107][1110/3239]	Time 0.229 (0.561)	Data Time 0.001 (0.036)	Loss 2.3666 (2.3547)	Entropy 0.53712 (0.53753)	Top-1 acc 67.578 (67.389)	Top-5 acc 87.109 (86.247)	lr 0.00079
Train [107][1120/3239]	Time 0.291 (0.561)	Data Time 0.002 (0.036)	Loss 2.4856 (2.3549)	Entropy 0.53722 (0.53753)	Top-1 acc 66.406 (67.385)	Top-5 acc 83.594 (86.248)	lr 0.00079
Train [107][1130/3239]	Time 0.233 (0.560)	Data Time 0.001 (0.035)	Loss 2.4674 (2.3548)	Entropy 0.53709 (0.53753)	Top-1 acc 65.234 (67.382)	Top-5 acc 84.375 (86.251)	lr 0.00079
Train [107][1140/3239]	Time 0.268 (0.559)	Data Time 0.001 (0.035)	Loss 2.2504 (2.3551)	Entropy 0.53728 (0.53752)	Top-1 acc 74.219 (67.383)	Top-5 acc 89.062 (86.251)	lr 0.00079
Train [107][1150/3239]	Time 0.230 (0.558)	Data Time 0.001 (0.035)	Loss 2.2013 (2.3551)	Entropy 0.53755 (0.53752)	Top-1 acc 71.094 (67.387)	Top-5 acc 88.281 (86.247)	lr 0.00079
Train [107][1160/3239]	Time 0.244 (0.557)	Data Time 0.001 (0.035)	Loss 2.4665 (2.3548)	Entropy 0.53733 (0.53752)	Top-1 acc 63.281 (67.396)	Top-5 acc 85.156 (86.251)	lr 0.00079
Train [107][1170/3239]	Time 0.316 (0.556)	Data Time 0.002 (0.034)	Loss 2.2461 (2.3546)	Entropy 0.53744 (0.53752)	Top-1 acc 68.750 (67.399)	Top-5 acc 89.062 (86.261)	lr 0.00079
Train [107][1180/3239]	Time 0.300 (0.555)	Data Time 0.002 (0.034)	Loss 2.7275 (2.3553)	Entropy 0.53756 (0.53752)	Top-1 acc 57.031 (67.387)	Top-5 acc 77.734 (86.238)	lr 0.00079
Train [107][1190/3239]	Time 0.238 (0.554)	Data Time 0.001 (0.034)	Loss 2.4078 (2.3558)	Entropy 0.53772 (0.53752)	Top-1 acc 67.188 (67.383)	Top-5 acc 83.203 (86.223)	lr 0.00079
Train [107][1200/3239]	Time 0.225 (0.553)	Data Time 0.001 (0.033)	Loss 2.2030 (2.3555)	Entropy 0.53749 (0.53752)	Top-1 acc 69.922 (67.389)	Top-5 acc 89.453 (86.227)	lr 0.00079
Train [107][1210/3239]	Time 0.376 (0.552)	Data Time 0.001 (0.033)	Loss 2.4328 (2.3552)	Entropy 0.53737 (0.53752)	Top-1 acc 66.016 (67.408)	Top-5 acc 86.719 (86.236)	lr 0.00079
Train [107][1220/3239]	Time 0.226 (0.551)	Data Time 0.001 (0.033)	Loss 2.2846 (2.3553)	Entropy 0.53731 (0.53752)	Top-1 acc 70.703 (67.411)	Top-5 acc 87.891 (86.232)	lr 0.00079
Train [107][1230/3239]	Time 0.251 (0.550)	Data Time 0.001 (0.033)	Loss 2.3251 (2.3558)	Entropy 0.53726 (0.53752)	Top-1 acc 67.969 (67.406)	Top-5 acc 86.328 (86.221)	lr 0.00079
Train [107][1240/3239]	Time 0.225 (0.549)	Data Time 0.001 (0.032)	Loss 2.2272 (2.3557)	Entropy 0.53739 (0.53751)	Top-1 acc 71.094 (67.406)	Top-5 acc 88.672 (86.221)	lr 0.00079
Train [107][1250/3239]	Time 0.228 (0.548)	Data Time 0.001 (0.032)	Loss 2.4991 (2.3561)	Entropy 0.53762 (0.53751)	Top-1 acc 65.234 (67.399)	Top-5 acc 85.938 (86.217)	lr 0.00079
Train [107][1260/3239]	Time 0.238 (0.547)	Data Time 0.001 (0.032)	Loss 2.3524 (2.3569)	Entropy 0.53775 (0.53752)	Top-1 acc 66.016 (67.374)	Top-5 acc 87.500 (86.208)	lr 0.00079
Train [107][1270/3239]	Time 0.234 (0.546)	Data Time 0.001 (0.032)	Loss 2.2913 (2.3568)	Entropy 0.53772 (0.53752)	Top-1 acc 68.750 (67.374)	Top-5 acc 87.891 (86.211)	lr 0.00078
Train [107][1280/3239]	Time 0.330 (0.545)	Data Time 0.001 (0.031)	Loss 2.4082 (2.3577)	Entropy 0.53781 (0.53752)	Top-1 acc 65.234 (67.350)	Top-5 acc 86.328 (86.198)	lr 0.00078
Train [107][1290/3239]	Time 0.224 (0.544)	Data Time 0.001 (0.031)	Loss 2.6201 (2.3586)	Entropy 0.53769 (0.53752)	Top-1 acc 62.891 (67.334)	Top-5 acc 81.250 (86.186)	lr 0.00078
Train [107][1300/3239]	Time 0.227 (0.543)	Data Time 0.001 (0.031)	Loss 2.5346 (2.3591)	Entropy 0.53808 (0.53752)	Top-1 acc 62.500 (67.317)	Top-5 acc 82.031 (86.179)	lr 0.00078
Train [107][1310/3239]	Time 0.234 (0.542)	Data Time 0.001 (0.031)	Loss 2.3203 (2.3598)	Entropy 0.53816 (0.53753)	Top-1 acc 65.625 (67.295)	Top-5 acc 85.156 (86.168)	lr 0.00078
Train [107][1320/3239]	Time 0.322 (0.542)	Data Time 0.001 (0.031)	Loss 2.3928 (2.3601)	Entropy 0.53836 (0.53753)	Top-1 acc 67.188 (67.286)	Top-5 acc 86.719 (86.162)	lr 0.00078
Train [107][1330/3239]	Time 0.244 (0.542)	Data Time 0.001 (0.030)	Loss 2.2264 (2.3597)	Entropy 0.53839 (0.53754)	Top-1 acc 71.094 (67.296)	Top-5 acc 87.500 (86.166)	lr 0.00078
Train [107][1340/3239]	Time 0.241 (0.541)	Data Time 0.002 (0.030)	Loss 2.2490 (2.3596)	Entropy 0.53843 (0.53755)	Top-1 acc 67.969 (67.301)	Top-5 acc 89.453 (86.165)	lr 0.00078
Train [107][1350/3239]	Time 0.234 (0.540)	Data Time 0.001 (0.030)	Loss 2.8287 (2.3597)	Entropy 0.53872 (0.53755)	Top-1 acc 56.641 (67.303)	Top-5 acc 76.953 (86.163)	lr 0.00078
Train [107][1360/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.030)	Loss 2.5221 (2.3600)	Entropy 0.53839 (0.53756)	Top-1 acc 61.328 (67.293)	Top-5 acc 83.984 (86.158)	lr 0.00078
Train [107][1370/3239]	Time 0.326 (0.538)	Data Time 0.001 (0.029)	Loss 2.5124 (2.3607)	Entropy 0.53846 (0.53757)	Top-1 acc 64.844 (67.269)	Top-5 acc 82.422 (86.149)	lr 0.00078
Train [107][1380/3239]	Time 0.223 (0.537)	Data Time 0.001 (0.029)	Loss 2.3542 (2.3611)	Entropy 0.53815 (0.53757)	Top-1 acc 66.797 (67.258)	Top-5 acc 87.500 (86.145)	lr 0.00078
Train [107][1390/3239]	Time 0.221 (0.536)	Data Time 0.001 (0.029)	Loss 2.2738 (2.3607)	Entropy 0.53819 (0.53758)	Top-1 acc 68.750 (67.267)	Top-5 acc 88.281 (86.150)	lr 0.00078
Train [107][1400/3239]	Time 0.223 (0.535)	Data Time 0.001 (0.029)	Loss 2.3807 (2.3613)	Entropy 0.53816 (0.53758)	Top-1 acc 69.531 (67.258)	Top-5 acc 83.984 (86.137)	lr 0.00078
Train [107][1410/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.029)	Loss 2.1877 (2.3610)	Entropy 0.53842 (0.53758)	Top-1 acc 70.703 (67.265)	Top-5 acc 87.109 (86.137)	lr 0.00078
Train [107][1420/3239]	Time 0.238 (0.533)	Data Time 0.001 (0.028)	Loss 2.4194 (2.3609)	Entropy 0.53852 (0.53759)	Top-1 acc 66.406 (67.275)	Top-5 acc 86.328 (86.137)	lr 0.00078
Train [107][1430/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.028)	Loss 2.4580 (2.3607)	Entropy 0.53862 (0.53760)	Top-1 acc 65.234 (67.284)	Top-5 acc 84.766 (86.144)	lr 0.00078
Train [107][1440/3239]	Time 0.323 (0.532)	Data Time 0.001 (0.028)	Loss 2.3202 (2.3604)	Entropy 0.53880 (0.53761)	Top-1 acc 70.312 (67.292)	Top-5 acc 83.984 (86.151)	lr 0.00078
Train [107][1450/3239]	Time 0.260 (0.531)	Data Time 0.001 (0.028)	Loss 2.1742 (2.3607)	Entropy 0.53895 (0.53761)	Top-1 acc 71.094 (67.282)	Top-5 acc 86.719 (86.146)	lr 0.00078
Train [107][1460/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.028)	Loss 2.1604 (2.3602)	Entropy 0.53916 (0.53762)	Top-1 acc 69.531 (67.291)	Top-5 acc 90.234 (86.154)	lr 0.00078
Train [107][1470/3239]	Time 0.230 (0.529)	Data Time 0.001 (0.028)	Loss 2.6078 (2.3600)	Entropy 0.53834 (0.53763)	Top-1 acc 59.766 (67.297)	Top-5 acc 80.859 (86.154)	lr 0.00078
Train [107][1480/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.027)	Loss 2.0711 (2.3601)	Entropy 0.53803 (0.53764)	Top-1 acc 72.656 (67.291)	Top-5 acc 90.234 (86.150)	lr 0.00078
Train [107][1490/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.027)	Loss 2.3693 (2.3599)	Entropy 0.53795 (0.53764)	Top-1 acc 67.188 (67.302)	Top-5 acc 86.328 (86.154)	lr 0.00078
Train [107][1500/3239]	Time 0.236 (0.526)	Data Time 0.002 (0.027)	Loss 2.4105 (2.3602)	Entropy 0.53789 (0.53764)	Top-1 acc 64.453 (67.295)	Top-5 acc 85.156 (86.151)	lr 0.00078
Train [107][1510/3239]	Time 0.243 (0.526)	Data Time 0.001 (0.027)	Loss 2.2128 (2.3600)	Entropy 0.53785 (0.53764)	Top-1 acc 73.828 (67.299)	Top-5 acc 89.062 (86.158)	lr 0.00078
Train [107][1520/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.027)	Loss 2.4671 (2.3598)	Entropy 0.53773 (0.53764)	Top-1 acc 65.625 (67.302)	Top-5 acc 85.938 (86.161)	lr 0.00078
Train [107][1530/3239]	Time 0.425 (0.525)	Data Time 0.002 (0.027)	Loss 2.3766 (2.3594)	Entropy 0.53775 (0.53764)	Top-1 acc 66.797 (67.314)	Top-5 acc 84.766 (86.167)	lr 0.00078
Train [107][1540/3239]	Time 0.283 (0.525)	Data Time 0.001 (0.026)	Loss 2.3345 (2.3590)	Entropy 0.53765 (0.53764)	Top-1 acc 69.141 (67.326)	Top-5 acc 87.109 (86.174)	lr 0.00078
Train [107][1550/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.026)	Loss 2.1700 (2.3590)	Entropy 0.53779 (0.53764)	Top-1 acc 72.656 (67.328)	Top-5 acc 89.844 (86.172)	lr 0.00078
Train [107][1560/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.026)	Loss 2.1623 (2.3586)	Entropy 0.53754 (0.53764)	Top-1 acc 69.922 (67.330)	Top-5 acc 88.281 (86.179)	lr 0.00077
Train [107][1570/3239]	Time 0.277 (0.523)	Data Time 0.001 (0.026)	Loss 2.4674 (2.3590)	Entropy 0.53750 (0.53764)	Top-1 acc 63.672 (67.313)	Top-5 acc 85.156 (86.171)	lr 0.00077
Train [107][1580/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.026)	Loss 2.3071 (2.3590)	Entropy 0.53760 (0.53764)	Top-1 acc 67.578 (67.304)	Top-5 acc 86.328 (86.173)	lr 0.00077
Train [107][1590/3239]	Time 0.239 (0.522)	Data Time 0.001 (0.026)	Loss 2.4912 (2.3591)	Entropy 0.53770 (0.53764)	Top-1 acc 61.719 (67.306)	Top-5 acc 84.766 (86.170)	lr 0.00077
Train [107][1600/3239]	Time 0.340 (0.521)	Data Time 0.001 (0.025)	Loss 2.3581 (2.3590)	Entropy 0.53735 (0.53764)	Top-1 acc 69.531 (67.314)	Top-5 acc 83.984 (86.169)	lr 0.00077
Train [107][1610/3239]	Time 0.225 (0.520)	Data Time 0.001 (0.025)	Loss 2.4394 (2.3590)	Entropy 0.53712 (0.53764)	Top-1 acc 67.578 (67.314)	Top-5 acc 84.766 (86.167)	lr 0.00077
Train [107][1620/3239]	Time 0.214 (0.519)	Data Time 0.001 (0.025)	Loss 2.2753 (2.3592)	Entropy 0.53689 (0.53764)	Top-1 acc 69.922 (67.307)	Top-5 acc 89.844 (86.166)	lr 0.00077
Train [107][1630/3239]	Time 0.232 (0.519)	Data Time 0.001 (0.025)	Loss 2.2664 (2.3591)	Entropy 0.53661 (0.53763)	Top-1 acc 68.750 (67.310)	Top-5 acc 85.547 (86.168)	lr 0.00077
Train [107][1640/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.025)	Loss 2.2395 (2.3590)	Entropy 0.53665 (0.53763)	Top-1 acc 69.141 (67.313)	Top-5 acc 89.062 (86.166)	lr 0.00077
Train [107][1650/3239]	Time 0.262 (0.517)	Data Time 0.001 (0.025)	Loss 2.2636 (2.3590)	Entropy 0.53676 (0.53762)	Top-1 acc 66.797 (67.314)	Top-5 acc 87.500 (86.164)	lr 0.00077
Train [107][1660/3239]	Time 0.230 (0.517)	Data Time 0.001 (0.025)	Loss 2.4015 (2.3593)	Entropy 0.53702 (0.53761)	Top-1 acc 66.797 (67.304)	Top-5 acc 82.812 (86.156)	lr 0.00077
Train [107][1670/3239]	Time 0.340 (0.516)	Data Time 0.001 (0.024)	Loss 2.3891 (2.3590)	Entropy 0.53703 (0.53761)	Top-1 acc 68.359 (67.311)	Top-5 acc 85.547 (86.159)	lr 0.00077
Train [107][1680/3239]	Time 0.220 (0.516)	Data Time 0.001 (0.024)	Loss 2.3247 (2.3591)	Entropy 0.53707 (0.53761)	Top-1 acc 67.578 (67.307)	Top-5 acc 84.766 (86.152)	lr 0.00077
Train [107][1690/3239]	Time 0.223 (0.515)	Data Time 0.001 (0.024)	Loss 2.6616 (2.3594)	Entropy 0.53685 (0.53760)	Top-1 acc 58.594 (67.303)	Top-5 acc 81.641 (86.150)	lr 0.00077
Train [107][1700/3239]	Time 0.225 (0.514)	Data Time 0.001 (0.024)	Loss 2.4140 (2.3593)	Entropy 0.53675 (0.53760)	Top-1 acc 68.359 (67.310)	Top-5 acc 84.375 (86.150)	lr 0.00077
Train [107][1710/3239]	Time 0.256 (0.514)	Data Time 0.001 (0.024)	Loss 2.3523 (2.3591)	Entropy 0.53683 (0.53759)	Top-1 acc 67.578 (67.315)	Top-5 acc 85.547 (86.152)	lr 0.00077
Train [107][1720/3239]	Time 0.301 (0.545)	Data Time 0.026 (0.024)	Loss 2.6066 (2.3593)	Entropy 0.53672 (0.53759)	Top-1 acc 60.938 (67.306)	Top-5 acc 82.031 (86.150)	lr 0.00077
Train [107][1730/3239]	Time 0.219 (0.544)	Data Time 0.002 (0.024)	Loss 2.2213 (2.3591)	Entropy 0.53678 (0.53758)	Top-1 acc 69.141 (67.308)	Top-5 acc 88.672 (86.155)	lr 0.00077
Train [107][1740/3239]	Time 0.245 (0.544)	Data Time 0.001 (0.024)	Loss 2.4008 (2.3591)	Entropy 0.53644 (0.53758)	Top-1 acc 70.703 (67.309)	Top-5 acc 85.938 (86.153)	lr 0.00077
Train [107][1750/3239]	Time 0.252 (0.543)	Data Time 0.001 (0.023)	Loss 2.4124 (2.3591)	Entropy 0.53669 (0.53757)	Top-1 acc 67.578 (67.314)	Top-5 acc 84.766 (86.153)	lr 0.00077
Train [107][1760/3239]	Time 0.375 (0.543)	Data Time 0.002 (0.023)	Loss 2.4070 (2.3591)	Entropy 0.53660 (0.53757)	Top-1 acc 67.969 (67.317)	Top-5 acc 83.594 (86.152)	lr 0.00077
Train [107][1770/3239]	Time 0.242 (0.542)	Data Time 0.001 (0.023)	Loss 2.3755 (2.3594)	Entropy 0.53663 (0.53756)	Top-1 acc 67.578 (67.311)	Top-5 acc 86.328 (86.148)	lr 0.00077
Train [107][1780/3239]	Time 0.289 (0.541)	Data Time 0.002 (0.023)	Loss 2.2759 (2.3591)	Entropy 0.53659 (0.53756)	Top-1 acc 66.016 (67.314)	Top-5 acc 88.672 (86.153)	lr 0.00077
Train [107][1790/3239]	Time 0.266 (0.541)	Data Time 0.001 (0.023)	Loss 2.1579 (2.3593)	Entropy 0.53630 (0.53755)	Top-1 acc 71.094 (67.308)	Top-5 acc 88.281 (86.148)	lr 0.00077
Train [107][1800/3239]	Time 0.235 (0.541)	Data Time 0.001 (0.023)	Loss 2.4865 (2.3594)	Entropy 0.53602 (0.53754)	Top-1 acc 65.234 (67.299)	Top-5 acc 82.812 (86.144)	lr 0.00077
Train [107][1810/3239]	Time 0.248 (0.540)	Data Time 0.001 (0.023)	Loss 2.6313 (2.3598)	Entropy 0.53651 (0.53754)	Top-1 acc 63.672 (67.290)	Top-5 acc 81.641 (86.142)	lr 0.00077
Train [107][1820/3239]	Time 0.320 (0.540)	Data Time 0.004 (0.023)	Loss 2.2182 (2.3592)	Entropy 0.53616 (0.53753)	Top-1 acc 71.094 (67.307)	Top-5 acc 89.062 (86.153)	lr 0.00077
Train [107][1830/3239]	Time 0.393 (0.539)	Data Time 0.001 (0.023)	Loss 2.5913 (2.3592)	Entropy 0.53618 (0.53752)	Top-1 acc 60.547 (67.306)	Top-5 acc 82.031 (86.153)	lr 0.00077
Train [107][1840/3239]	Time 0.228 (0.539)	Data Time 0.001 (0.022)	Loss 2.4433 (2.3592)	Entropy 0.53661 (0.53752)	Top-1 acc 62.500 (67.305)	Top-5 acc 87.109 (86.154)	lr 0.00076
Train [107][1850/3239]	Time 0.245 (0.538)	Data Time 0.002 (0.022)	Loss 2.5142 (2.3594)	Entropy 0.53668 (0.53751)	Top-1 acc 63.281 (67.300)	Top-5 acc 82.812 (86.153)	lr 0.00076
Train [107][1860/3239]	Time 0.261 (0.538)	Data Time 0.002 (0.022)	Loss 2.6030 (2.3592)	Entropy 0.53657 (0.53751)	Top-1 acc 61.719 (67.301)	Top-5 acc 81.250 (86.156)	lr 0.00076
Train [107][1870/3239]	Time 0.241 (0.537)	Data Time 0.001 (0.022)	Loss 2.5153 (2.3593)	Entropy 0.53657 (0.53750)	Top-1 acc 62.891 (67.300)	Top-5 acc 82.422 (86.158)	lr 0.00076
Train [107][1880/3239]	Time 0.237 (0.536)	Data Time 0.001 (0.022)	Loss 2.3994 (2.3594)	Entropy 0.53653 (0.53750)	Top-1 acc 64.062 (67.291)	Top-5 acc 85.547 (86.158)	lr 0.00076
Train [107][1890/3239]	Time 0.240 (0.536)	Data Time 0.001 (0.022)	Loss 2.1947 (2.3593)	Entropy 0.53654 (0.53749)	Top-1 acc 67.969 (67.287)	Top-5 acc 89.453 (86.157)	lr 0.00076
Train [107][1900/3239]	Time 0.264 (0.535)	Data Time 0.002 (0.022)	Loss 2.2259 (2.3589)	Entropy 0.53630 (0.53749)	Top-1 acc 73.828 (67.297)	Top-5 acc 88.281 (86.161)	lr 0.00076
Train [107][1910/3239]	Time 0.238 (0.535)	Data Time 0.001 (0.022)	Loss 2.3783 (2.3590)	Entropy 0.53655 (0.53748)	Top-1 acc 64.062 (67.297)	Top-5 acc 87.109 (86.161)	lr 0.00076
Train [107][1920/3239]	Time 0.354 (0.535)	Data Time 0.002 (0.022)	Loss 2.2315 (2.3586)	Entropy 0.53627 (0.53747)	Top-1 acc 71.484 (67.306)	Top-5 acc 87.500 (86.164)	lr 0.00076
Train [107][1930/3239]	Time 0.246 (0.535)	Data Time 0.001 (0.021)	Loss 2.3080 (2.3588)	Entropy 0.53632 (0.53747)	Top-1 acc 67.969 (67.306)	Top-5 acc 87.891 (86.156)	lr 0.00076
Train [107][1940/3239]	Time 0.248 (0.534)	Data Time 0.001 (0.021)	Loss 2.1634 (2.3588)	Entropy 0.53647 (0.53746)	Top-1 acc 71.094 (67.301)	Top-5 acc 88.672 (86.158)	lr 0.00076
Train [107][1950/3239]	Time 0.268 (0.534)	Data Time 0.001 (0.021)	Loss 2.3369 (2.3592)	Entropy 0.53647 (0.53746)	Top-1 acc 65.234 (67.289)	Top-5 acc 86.719 (86.152)	lr 0.00076
Train [107][1960/3239]	Time 0.249 (0.533)	Data Time 0.001 (0.021)	Loss 2.1597 (2.3586)	Entropy 0.53675 (0.53745)	Top-1 acc 73.438 (67.303)	Top-5 acc 89.062 (86.162)	lr 0.00076
Train [107][1970/3239]	Time 0.235 (0.533)	Data Time 0.001 (0.021)	Loss 2.2903 (2.3586)	Entropy 0.53637 (0.53745)	Top-1 acc 68.359 (67.302)	Top-5 acc 88.672 (86.163)	lr 0.00076
Train [107][1980/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.021)	Loss 2.5280 (2.3582)	Entropy 0.53623 (0.53744)	Top-1 acc 65.625 (67.309)	Top-5 acc 84.375 (86.169)	lr 0.00076
Train [107][1990/3239]	Time 0.337 (0.531)	Data Time 0.001 (0.021)	Loss 2.2833 (2.3582)	Entropy 0.53626 (0.53744)	Top-1 acc 69.531 (67.313)	Top-5 acc 87.500 (86.166)	lr 0.00076
Train [107][2000/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.021)	Loss 2.3818 (2.3583)	Entropy 0.53618 (0.53743)	Top-1 acc 64.062 (67.312)	Top-5 acc 85.156 (86.166)	lr 0.00076
Train [107][2010/3239]	Time 0.290 (0.531)	Data Time 0.002 (0.021)	Loss 2.2991 (2.3583)	Entropy 0.53605 (0.53742)	Top-1 acc 70.703 (67.315)	Top-5 acc 84.766 (86.166)	lr 0.00076
Train [107][2020/3239]	Time 0.272 (0.531)	Data Time 0.002 (0.021)	Loss 2.2382 (2.3580)	Entropy 0.53600 (0.53742)	Top-1 acc 68.750 (67.321)	Top-5 acc 87.500 (86.171)	lr 0.00076
Train [107][2030/3239]	Time 0.237 (0.530)	Data Time 0.001 (0.021)	Loss 2.4913 (2.3583)	Entropy 0.53606 (0.53741)	Top-1 acc 62.500 (67.313)	Top-5 acc 84.375 (86.170)	lr 0.00076
Train [107][2040/3239]	Time 0.258 (0.529)	Data Time 0.001 (0.020)	Loss 2.3715 (2.3583)	Entropy 0.53633 (0.53740)	Top-1 acc 67.969 (67.318)	Top-5 acc 84.766 (86.170)	lr 0.00076
Train [107][2050/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.020)	Loss 2.3589 (2.3581)	Entropy 0.53600 (0.53740)	Top-1 acc 64.844 (67.320)	Top-5 acc 89.453 (86.173)	lr 0.00076
Train [107][2060/3239]	Time 0.233 (0.528)	Data Time 0.001 (0.020)	Loss 2.3832 (2.3580)	Entropy 0.53647 (0.53739)	Top-1 acc 67.188 (67.323)	Top-5 acc 84.375 (86.176)	lr 0.00076
Train [107][2070/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.020)	Loss 2.3961 (2.3583)	Entropy 0.53644 (0.53739)	Top-1 acc 66.016 (67.315)	Top-5 acc 87.109 (86.171)	lr 0.00076
Train [107][2080/3239]	Time 0.228 (0.527)	Data Time 0.001 (0.020)	Loss 2.5731 (2.3582)	Entropy 0.53654 (0.53738)	Top-1 acc 60.938 (67.316)	Top-5 acc 83.594 (86.172)	lr 0.00076
Train [107][2090/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.020)	Loss 2.4291 (2.3581)	Entropy 0.53671 (0.53738)	Top-1 acc 67.188 (67.319)	Top-5 acc 82.812 (86.172)	lr 0.00076
Train [107][2100/3239]	Time 0.245 (0.526)	Data Time 0.001 (0.020)	Loss 2.2334 (2.3581)	Entropy 0.53651 (0.53738)	Top-1 acc 71.094 (67.321)	Top-5 acc 88.672 (86.173)	lr 0.00076
Train [107][2110/3239]	Time 0.276 (0.526)	Data Time 0.002 (0.020)	Loss 2.0558 (2.3577)	Entropy 0.53647 (0.53737)	Top-1 acc 75.391 (67.329)	Top-5 acc 90.625 (86.178)	lr 0.00076
Train [107][2120/3239]	Time 0.290 (0.526)	Data Time 0.002 (0.020)	Loss 2.2596 (2.3579)	Entropy 0.53636 (0.53737)	Top-1 acc 71.484 (67.328)	Top-5 acc 86.719 (86.172)	lr 0.00076
Train [107][2130/3239]	Time 0.230 (0.525)	Data Time 0.001 (0.020)	Loss 2.3176 (2.3584)	Entropy 0.53650 (0.53736)	Top-1 acc 66.797 (67.317)	Top-5 acc 85.938 (86.161)	lr 0.00075
Train [107][2140/3239]	Time 0.230 (0.524)	Data Time 0.001 (0.020)	Loss 2.2899 (2.3584)	Entropy 0.53645 (0.53736)	Top-1 acc 70.312 (67.315)	Top-5 acc 85.938 (86.164)	lr 0.00075
Train [107][2150/3239]	Time 0.322 (0.524)	Data Time 0.001 (0.019)	Loss 2.2206 (2.3583)	Entropy 0.53666 (0.53735)	Top-1 acc 73.438 (67.318)	Top-5 acc 88.672 (86.166)	lr 0.00075
Train [107][2160/3239]	Time 0.225 (0.523)	Data Time 0.001 (0.019)	Loss 2.5378 (2.3586)	Entropy 0.53674 (0.53735)	Top-1 acc 63.672 (67.312)	Top-5 acc 82.812 (86.159)	lr 0.00075
Train [107][2170/3239]	Time 0.231 (0.523)	Data Time 0.002 (0.019)	Loss 2.2475 (2.3585)	Entropy 0.53670 (0.53735)	Top-1 acc 68.359 (67.313)	Top-5 acc 86.328 (86.161)	lr 0.00075
Train [107][2180/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.019)	Loss 2.4116 (2.3580)	Entropy 0.53652 (0.53735)	Top-1 acc 64.844 (67.326)	Top-5 acc 86.328 (86.170)	lr 0.00075
Train [107][2190/3239]	Time 0.226 (0.522)	Data Time 0.001 (0.019)	Loss 2.3092 (2.3580)	Entropy 0.53643 (0.53734)	Top-1 acc 68.750 (67.326)	Top-5 acc 87.500 (86.169)	lr 0.00075
Train [107][2200/3239]	Time 0.231 (0.521)	Data Time 0.001 (0.019)	Loss 2.2603 (2.3582)	Entropy 0.53658 (0.53734)	Top-1 acc 71.094 (67.320)	Top-5 acc 88.672 (86.166)	lr 0.00075
Train [107][2210/3239]	Time 0.225 (0.521)	Data Time 0.001 (0.019)	Loss 2.2780 (2.3580)	Entropy 0.53614 (0.53733)	Top-1 acc 67.188 (67.322)	Top-5 acc 88.281 (86.170)	lr 0.00075
Train [107][2220/3239]	Time 0.335 (0.520)	Data Time 0.002 (0.019)	Loss 2.2858 (2.3579)	Entropy 0.53609 (0.53733)	Top-1 acc 71.094 (67.329)	Top-5 acc 87.500 (86.172)	lr 0.00075
Train [107][2230/3239]	Time 0.231 (0.520)	Data Time 0.001 (0.019)	Loss 2.2277 (2.3581)	Entropy 0.53629 (0.53732)	Top-1 acc 69.922 (67.326)	Top-5 acc 88.672 (86.168)	lr 0.00075
Train [107][2240/3239]	Time 0.224 (0.519)	Data Time 0.001 (0.019)	Loss 2.4469 (2.3584)	Entropy 0.53622 (0.53732)	Top-1 acc 66.406 (67.319)	Top-5 acc 84.375 (86.166)	lr 0.00075
Train [107][2250/3239]	Time 0.236 (0.519)	Data Time 0.001 (0.019)	Loss 2.4753 (2.3585)	Entropy 0.53612 (0.53731)	Top-1 acc 64.844 (67.316)	Top-5 acc 82.812 (86.159)	lr 0.00075
Train [107][2260/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.019)	Loss 2.2579 (2.3587)	Entropy 0.53618 (0.53731)	Top-1 acc 68.359 (67.310)	Top-5 acc 87.109 (86.155)	lr 0.00075
Train [107][2270/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.019)	Loss 2.5802 (2.3590)	Entropy 0.53615 (0.53730)	Top-1 acc 61.328 (67.305)	Top-5 acc 82.812 (86.148)	lr 0.00075
Train [107][2280/3239]	Time 0.223 (0.517)	Data Time 0.001 (0.018)	Loss 2.2144 (2.3590)	Entropy 0.53594 (0.53730)	Top-1 acc 71.484 (67.309)	Top-5 acc 87.109 (86.148)	lr 0.00075
Train [107][2290/3239]	Time 0.256 (0.517)	Data Time 0.001 (0.018)	Loss 2.4222 (2.3589)	Entropy 0.53564 (0.53729)	Top-1 acc 66.406 (67.312)	Top-5 acc 85.156 (86.152)	lr 0.00075
Train [107][2300/3239]	Time 0.237 (0.516)	Data Time 0.001 (0.018)	Loss 2.2468 (2.3590)	Entropy 0.53538 (0.53728)	Top-1 acc 69.531 (67.309)	Top-5 acc 86.328 (86.150)	lr 0.00075
Train [107][2310/3239]	Time 0.324 (0.516)	Data Time 0.001 (0.018)	Loss 2.6765 (2.3592)	Entropy 0.53556 (0.53728)	Top-1 acc 62.109 (67.305)	Top-5 acc 82.031 (86.146)	lr 0.00075
Train [107][2320/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.018)	Loss 2.6879 (2.3592)	Entropy 0.53567 (0.53727)	Top-1 acc 57.031 (67.302)	Top-5 acc 82.031 (86.150)	lr 0.00075
Train [107][2330/3239]	Time 0.332 (0.515)	Data Time 0.002 (0.018)	Loss 2.2548 (2.3593)	Entropy 0.53574 (0.53726)	Top-1 acc 67.188 (67.302)	Top-5 acc 90.234 (86.152)	lr 0.00075
Train [107][2340/3239]	Time 0.247 (0.516)	Data Time 0.001 (0.018)	Loss 2.2143 (2.3592)	Entropy 0.53590 (0.53726)	Top-1 acc 68.750 (67.304)	Top-5 acc 88.672 (86.155)	lr 0.00075
Train [107][2350/3239]	Time 0.242 (0.515)	Data Time 0.001 (0.018)	Loss 2.5938 (2.3594)	Entropy 0.53607 (0.53725)	Top-1 acc 62.109 (67.300)	Top-5 acc 84.766 (86.153)	lr 0.00075
Train [107][2360/3239]	Time 0.230 (0.515)	Data Time 0.001 (0.018)	Loss 2.3098 (2.3592)	Entropy 0.53597 (0.53725)	Top-1 acc 66.016 (67.304)	Top-5 acc 86.328 (86.154)	lr 0.00075
Train [107][2370/3239]	Time 0.340 (0.537)	Data Time 0.033 (0.018)	Loss 2.3399 (2.3592)	Entropy 0.53621 (0.53724)	Top-1 acc 67.188 (67.308)	Top-5 acc 88.281 (86.153)	lr 0.00075
Train [107][2380/3239]	Time 0.352 (0.537)	Data Time 0.002 (0.018)	Loss 2.3231 (2.3592)	Entropy 0.53628 (0.53724)	Top-1 acc 64.062 (67.306)	Top-5 acc 84.766 (86.155)	lr 0.00075
Train [107][2390/3239]	Time 0.236 (0.537)	Data Time 0.001 (0.018)	Loss 2.1551 (2.3593)	Entropy 0.53644 (0.53723)	Top-1 acc 72.656 (67.301)	Top-5 acc 87.891 (86.154)	lr 0.00075
Train [107][2400/3239]	Time 0.268 (0.536)	Data Time 0.001 (0.018)	Loss 2.8190 (2.3592)	Entropy 0.53647 (0.53723)	Top-1 acc 57.812 (67.305)	Top-5 acc 81.250 (86.156)	lr 0.00075
Train [107][2410/3239]	Time 0.247 (0.536)	Data Time 0.001 (0.018)	Loss 2.2657 (2.3591)	Entropy 0.53634 (0.53723)	Top-1 acc 72.266 (67.309)	Top-5 acc 87.500 (86.158)	lr 0.00075
Train [107][2420/3239]	Time 0.302 (0.536)	Data Time 0.003 (0.018)	Loss 2.2933 (2.3591)	Entropy 0.53576 (0.53722)	Top-1 acc 67.188 (67.304)	Top-5 acc 84.766 (86.159)	lr 0.00074
Train [107][2430/3239]	Time 0.262 (0.536)	Data Time 0.002 (0.018)	Loss 2.3347 (2.3589)	Entropy 0.53626 (0.53722)	Top-1 acc 66.797 (67.307)	Top-5 acc 87.109 (86.163)	lr 0.00074
Train [107][2440/3239]	Time 0.292 (0.535)	Data Time 0.002 (0.017)	Loss 2.1899 (2.3590)	Entropy 0.53615 (0.53721)	Top-1 acc 72.266 (67.307)	Top-5 acc 89.453 (86.163)	lr 0.00074
Train [107][2450/3239]	Time 0.300 (0.536)	Data Time 0.002 (0.017)	Loss 2.5039 (2.3591)	Entropy 0.53611 (0.53721)	Top-1 acc 64.844 (67.303)	Top-5 acc 83.594 (86.159)	lr 0.00074
Train [107][2460/3239]	Time 0.240 (0.535)	Data Time 0.001 (0.017)	Loss 2.2770 (2.3591)	Entropy 0.53603 (0.53720)	Top-1 acc 69.531 (67.299)	Top-5 acc 85.938 (86.157)	lr 0.00074
Train [107][2470/3239]	Time 0.346 (0.535)	Data Time 0.001 (0.017)	Loss 2.2728 (2.3593)	Entropy 0.53587 (0.53720)	Top-1 acc 70.312 (67.295)	Top-5 acc 87.109 (86.158)	lr 0.00074
Train [107][2480/3239]	Time 0.232 (0.534)	Data Time 0.001 (0.017)	Loss 2.2404 (2.3594)	Entropy 0.53599 (0.53719)	Top-1 acc 70.703 (67.287)	Top-5 acc 89.453 (86.157)	lr 0.00074
Train [107][2490/3239]	Time 0.237 (0.534)	Data Time 0.001 (0.017)	Loss 2.4421 (2.3593)	Entropy 0.53623 (0.53719)	Top-1 acc 64.844 (67.286)	Top-5 acc 84.766 (86.157)	lr 0.00074
Train [107][2500/3239]	Time 0.225 (0.533)	Data Time 0.001 (0.017)	Loss 2.2459 (2.3591)	Entropy 0.53626 (0.53719)	Top-1 acc 70.312 (67.293)	Top-5 acc 89.844 (86.160)	lr 0.00074
Train [107][2510/3239]	Time 0.263 (0.533)	Data Time 0.003 (0.017)	Loss 2.4532 (2.3591)	Entropy 0.53653 (0.53718)	Top-1 acc 64.453 (67.295)	Top-5 acc 83.984 (86.159)	lr 0.00074
Train [107][2520/3239]	Time 0.226 (0.532)	Data Time 0.001 (0.017)	Loss 2.7430 (2.3593)	Entropy 0.53679 (0.53718)	Top-1 acc 54.688 (67.288)	Top-5 acc 80.078 (86.156)	lr 0.00074
Train [107][2530/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.017)	Loss 2.1458 (2.3593)	Entropy 0.53698 (0.53718)	Top-1 acc 72.656 (67.288)	Top-5 acc 89.062 (86.158)	lr 0.00074
Train [107][2540/3239]	Time 0.322 (0.531)	Data Time 0.001 (0.017)	Loss 2.4774 (2.3593)	Entropy 0.53730 (0.53718)	Top-1 acc 66.016 (67.288)	Top-5 acc 85.547 (86.158)	lr 0.00074
Train [107][2550/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.017)	Loss 2.1878 (2.3594)	Entropy 0.53693 (0.53718)	Top-1 acc 71.094 (67.289)	Top-5 acc 89.453 (86.158)	lr 0.00074
Train [107][2560/3239]	Time 0.268 (0.531)	Data Time 0.001 (0.017)	Loss 2.4216 (2.3590)	Entropy 0.53696 (0.53718)	Top-1 acc 67.188 (67.293)	Top-5 acc 82.812 (86.163)	lr 0.00074
Train [107][2570/3239]	Time 0.226 (0.530)	Data Time 0.001 (0.017)	Loss 2.5191 (2.3590)	Entropy 0.53692 (0.53718)	Top-1 acc 65.234 (67.296)	Top-5 acc 83.203 (86.161)	lr 0.00074
Train [107][2580/3239]	Time 0.238 (0.530)	Data Time 0.001 (0.017)	Loss 2.3811 (2.3591)	Entropy 0.53729 (0.53718)	Top-1 acc 62.891 (67.293)	Top-5 acc 88.281 (86.163)	lr 0.00074
Train [107][2590/3239]	Time 0.246 (0.529)	Data Time 0.001 (0.017)	Loss 2.2151 (2.3592)	Entropy 0.53725 (0.53718)	Top-1 acc 69.531 (67.290)	Top-5 acc 88.281 (86.161)	lr 0.00074
Train [107][2600/3239]	Time 0.230 (0.529)	Data Time 0.001 (0.016)	Loss 2.3240 (2.3592)	Entropy 0.53702 (0.53718)	Top-1 acc 67.578 (67.289)	Top-5 acc 87.891 (86.163)	lr 0.00074
Train [107][2610/3239]	Time 0.298 (0.529)	Data Time 0.002 (0.016)	Loss 2.3303 (2.3591)	Entropy 0.53717 (0.53718)	Top-1 acc 66.016 (67.285)	Top-5 acc 86.719 (86.164)	lr 0.00074
Train [107][2620/3239]	Time 0.286 (0.529)	Data Time 0.001 (0.016)	Loss 2.5134 (2.3592)	Entropy 0.53707 (0.53718)	Top-1 acc 60.156 (67.280)	Top-5 acc 81.250 (86.161)	lr 0.00074
Train [107][2630/3239]	Time 0.285 (0.529)	Data Time 0.001 (0.016)	Loss 2.0789 (2.3590)	Entropy 0.53678 (0.53718)	Top-1 acc 74.219 (67.284)	Top-5 acc 91.016 (86.165)	lr 0.00074
Train [107][2640/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.016)	Loss 2.2465 (2.3588)	Entropy 0.53657 (0.53717)	Top-1 acc 74.219 (67.287)	Top-5 acc 88.281 (86.166)	lr 0.00074
Train [107][2650/3239]	Time 0.226 (0.528)	Data Time 0.004 (0.016)	Loss 2.6690 (2.3588)	Entropy 0.53681 (0.53717)	Top-1 acc 58.984 (67.288)	Top-5 acc 81.250 (86.167)	lr 0.00074
Train [107][2660/3239]	Time 0.228 (0.527)	Data Time 0.001 (0.016)	Loss 2.3111 (2.3588)	Entropy 0.53674 (0.53717)	Top-1 acc 67.578 (67.290)	Top-5 acc 87.109 (86.164)	lr 0.00074
Train [107][2670/3239]	Time 0.235 (0.527)	Data Time 0.001 (0.016)	Loss 2.1929 (2.3586)	Entropy 0.53682 (0.53717)	Top-1 acc 69.922 (67.295)	Top-5 acc 90.234 (86.165)	lr 0.00074
Train [107][2680/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.016)	Loss 2.4435 (2.3588)	Entropy 0.53717 (0.53717)	Top-1 acc 67.188 (67.296)	Top-5 acc 84.375 (86.161)	lr 0.00074
Train [107][2690/3239]	Time 0.232 (0.526)	Data Time 0.005 (0.016)	Loss 2.3969 (2.3590)	Entropy 0.53698 (0.53717)	Top-1 acc 66.797 (67.293)	Top-5 acc 87.500 (86.157)	lr 0.00074
Train [107][2700/3239]	Time 0.318 (0.526)	Data Time 0.001 (0.016)	Loss 2.3536 (2.3587)	Entropy 0.53691 (0.53717)	Top-1 acc 66.797 (67.297)	Top-5 acc 86.328 (86.159)	lr 0.00074
Train [107][2710/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.016)	Loss 2.2958 (2.3585)	Entropy 0.53706 (0.53717)	Top-1 acc 69.922 (67.303)	Top-5 acc 85.938 (86.162)	lr 0.00073
Train [107][2720/3239]	Time 0.269 (0.525)	Data Time 0.001 (0.016)	Loss 2.3509 (2.3584)	Entropy 0.53684 (0.53717)	Top-1 acc 66.406 (67.302)	Top-5 acc 86.328 (86.163)	lr 0.00073
Train [107][2730/3239]	Time 0.227 (0.524)	Data Time 0.001 (0.016)	Loss 2.4616 (2.3585)	Entropy 0.53679 (0.53716)	Top-1 acc 62.891 (67.300)	Top-5 acc 84.375 (86.163)	lr 0.00073
Train [107][2740/3239]	Time 0.246 (0.524)	Data Time 0.002 (0.016)	Loss 2.3162 (2.3583)	Entropy 0.53662 (0.53716)	Top-1 acc 69.531 (67.308)	Top-5 acc 86.719 (86.166)	lr 0.00073
Train [107][2750/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.016)	Loss 2.6198 (2.3582)	Entropy 0.53664 (0.53716)	Top-1 acc 58.203 (67.312)	Top-5 acc 82.031 (86.168)	lr 0.00073
Train [107][2760/3239]	Time 0.248 (0.523)	Data Time 0.001 (0.016)	Loss 2.4475 (2.3580)	Entropy 0.53661 (0.53716)	Top-1 acc 64.844 (67.314)	Top-5 acc 84.375 (86.174)	lr 0.00073
Train [107][2770/3239]	Time 0.327 (0.523)	Data Time 0.001 (0.016)	Loss 2.3915 (2.3581)	Entropy 0.53673 (0.53716)	Top-1 acc 67.969 (67.317)	Top-5 acc 85.547 (86.171)	lr 0.00073
Train [107][2780/3239]	Time 0.226 (0.522)	Data Time 0.001 (0.016)	Loss 2.4035 (2.3582)	Entropy 0.53644 (0.53715)	Top-1 acc 70.312 (67.316)	Top-5 acc 84.375 (86.169)	lr 0.00073
Train [107][2790/3239]	Time 0.275 (0.522)	Data Time 0.001 (0.015)	Loss 2.3383 (2.3580)	Entropy 0.53629 (0.53715)	Top-1 acc 64.062 (67.323)	Top-5 acc 86.719 (86.172)	lr 0.00073
Train [107][2800/3239]	Time 0.223 (0.522)	Data Time 0.001 (0.015)	Loss 2.6560 (2.3579)	Entropy 0.53608 (0.53715)	Top-1 acc 59.766 (67.323)	Top-5 acc 82.422 (86.174)	lr 0.00073
Train [107][2810/3239]	Time 0.222 (0.522)	Data Time 0.001 (0.015)	Loss 2.3432 (2.3579)	Entropy 0.53582 (0.53714)	Top-1 acc 71.484 (67.331)	Top-5 acc 87.109 (86.173)	lr 0.00073
Train [107][2820/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.015)	Loss 2.1533 (2.3578)	Entropy 0.53570 (0.53714)	Top-1 acc 73.828 (67.331)	Top-5 acc 89.844 (86.175)	lr 0.00073
Train [107][2830/3239]	Time 0.229 (0.521)	Data Time 0.001 (0.015)	Loss 2.4104 (2.3576)	Entropy 0.53551 (0.53713)	Top-1 acc 67.188 (67.333)	Top-5 acc 86.328 (86.176)	lr 0.00073
Train [107][2840/3239]	Time 0.244 (0.520)	Data Time 0.001 (0.015)	Loss 2.5171 (2.3577)	Entropy 0.53577 (0.53713)	Top-1 acc 62.891 (67.328)	Top-5 acc 82.422 (86.172)	lr 0.00073
Train [107][2850/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.015)	Loss 2.3177 (2.3576)	Entropy 0.53590 (0.53712)	Top-1 acc 70.703 (67.331)	Top-5 acc 86.719 (86.173)	lr 0.00073
Train [107][2860/3239]	Time 0.348 (0.520)	Data Time 0.001 (0.015)	Loss 2.3427 (2.3577)	Entropy 0.53630 (0.53712)	Top-1 acc 67.969 (67.331)	Top-5 acc 85.938 (86.171)	lr 0.00073
Train [107][2870/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.015)	Loss 2.5414 (2.3580)	Entropy 0.53635 (0.53712)	Top-1 acc 63.281 (67.321)	Top-5 acc 81.250 (86.165)	lr 0.00073
Train [107][2880/3239]	Time 0.234 (0.519)	Data Time 0.002 (0.015)	Loss 2.4811 (2.3583)	Entropy 0.53598 (0.53711)	Top-1 acc 64.844 (67.318)	Top-5 acc 82.812 (86.161)	lr 0.00073
Train [107][2890/3239]	Time 0.225 (0.519)	Data Time 0.001 (0.015)	Loss 2.2058 (2.3582)	Entropy 0.53597 (0.53711)	Top-1 acc 67.969 (67.318)	Top-5 acc 89.062 (86.161)	lr 0.00073
Train [107][2900/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.015)	Loss 2.3090 (2.3583)	Entropy 0.53619 (0.53711)	Top-1 acc 66.016 (67.312)	Top-5 acc 86.719 (86.160)	lr 0.00073
Train [107][2910/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.015)	Loss 2.2369 (2.3582)	Entropy 0.53629 (0.53710)	Top-1 acc 70.312 (67.312)	Top-5 acc 87.109 (86.162)	lr 0.00073
Train [107][2920/3239]	Time 0.350 (0.518)	Data Time 0.003 (0.015)	Loss 2.4202 (2.3582)	Entropy 0.53639 (0.53710)	Top-1 acc 67.578 (67.314)	Top-5 acc 83.984 (86.162)	lr 0.00073
Train [107][2930/3239]	Time 0.346 (0.518)	Data Time 0.002 (0.015)	Loss 2.4652 (2.3581)	Entropy 0.53642 (0.53710)	Top-1 acc 61.719 (67.312)	Top-5 acc 85.547 (86.163)	lr 0.00073
Train [107][2940/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.015)	Loss 2.2272 (2.3580)	Entropy 0.53599 (0.53709)	Top-1 acc 72.656 (67.314)	Top-5 acc 88.281 (86.166)	lr 0.00073
Train [107][2950/3239]	Time 0.242 (0.517)	Data Time 0.001 (0.015)	Loss 2.2830 (2.3580)	Entropy 0.53630 (0.53709)	Top-1 acc 69.922 (67.317)	Top-5 acc 87.500 (86.166)	lr 0.00073
Train [107][2960/3239]	Time 0.240 (0.517)	Data Time 0.001 (0.015)	Loss 2.3154 (2.3580)	Entropy 0.53669 (0.53709)	Top-1 acc 66.406 (67.316)	Top-5 acc 87.891 (86.166)	lr 0.00073
Train [107][2970/3239]	Time 0.236 (0.517)	Data Time 0.001 (0.015)	Loss 2.1546 (2.3578)	Entropy 0.53655 (0.53709)	Top-1 acc 73.438 (67.320)	Top-5 acc 88.281 (86.169)	lr 0.00073
Train [107][2980/3239]	Time 0.228 (0.516)	Data Time 0.001 (0.015)	Loss 2.3788 (2.3581)	Entropy 0.53669 (0.53709)	Top-1 acc 65.234 (67.311)	Top-5 acc 85.938 (86.164)	lr 0.00073
Train [107][2990/3239]	Time 0.223 (0.516)	Data Time 0.001 (0.015)	Loss 2.3610 (2.3581)	Entropy 0.53645 (0.53708)	Top-1 acc 67.969 (67.311)	Top-5 acc 85.938 (86.163)	lr 0.00073
Train [107][3000/3239]	Time 0.263 (0.516)	Data Time 0.001 (0.015)	Loss 2.4490 (2.3580)	Entropy 0.53645 (0.53708)	Top-1 acc 65.234 (67.309)	Top-5 acc 83.594 (86.163)	lr 0.00073
Train [107][3010/3239]	Time 0.227 (0.515)	Data Time 0.001 (0.014)	Loss 2.5478 (2.3583)	Entropy 0.53641 (0.53708)	Top-1 acc 58.984 (67.300)	Top-5 acc 80.469 (86.158)	lr 0.00072
Train [107][3020/3239]	Time 0.230 (0.515)	Data Time 0.001 (0.014)	Loss 2.5555 (2.3585)	Entropy 0.53660 (0.53708)	Top-1 acc 63.672 (67.296)	Top-5 acc 82.422 (86.156)	lr 0.00072
Train [107][3030/3239]	Time 0.308 (0.532)	Data Time 0.002 (0.014)	Loss 2.4327 (2.3584)	Entropy 0.53686 (0.53708)	Top-1 acc 66.016 (67.300)	Top-5 acc 83.203 (86.157)	lr 0.00072
Train [107][3040/3239]	Time 0.252 (0.532)	Data Time 0.002 (0.014)	Loss 2.3466 (2.3585)	Entropy 0.53713 (0.53708)	Top-1 acc 67.188 (67.298)	Top-5 acc 86.719 (86.158)	lr 0.00072
Train [107][3050/3239]	Time 0.237 (0.532)	Data Time 0.001 (0.014)	Loss 2.2408 (2.3586)	Entropy 0.53713 (0.53708)	Top-1 acc 67.578 (67.294)	Top-5 acc 86.328 (86.155)	lr 0.00072
Train [107][3060/3239]	Time 0.239 (0.532)	Data Time 0.001 (0.014)	Loss 2.3482 (2.3587)	Entropy 0.53721 (0.53708)	Top-1 acc 66.406 (67.291)	Top-5 acc 87.500 (86.156)	lr 0.00072
Train [107][3070/3239]	Time 0.249 (0.531)	Data Time 0.002 (0.014)	Loss 2.3451 (2.3587)	Entropy 0.53739 (0.53708)	Top-1 acc 66.797 (67.294)	Top-5 acc 86.719 (86.153)	lr 0.00072
Train [107][3080/3239]	Time 0.233 (0.531)	Data Time 0.001 (0.014)	Loss 2.6189 (2.3589)	Entropy 0.53735 (0.53708)	Top-1 acc 62.500 (67.286)	Top-5 acc 84.375 (86.152)	lr 0.00072
Train [107][3090/3239]	Time 0.395 (0.531)	Data Time 0.001 (0.014)	Loss 2.1313 (2.3588)	Entropy 0.53748 (0.53708)	Top-1 acc 71.875 (67.290)	Top-5 acc 89.453 (86.154)	lr 0.00072
Train [107][3100/3239]	Time 0.229 (0.530)	Data Time 0.001 (0.014)	Loss 2.5260 (2.3589)	Entropy 0.53738 (0.53708)	Top-1 acc 62.891 (67.288)	Top-5 acc 83.984 (86.154)	lr 0.00072
Train [107][3110/3239]	Time 0.286 (0.530)	Data Time 0.002 (0.014)	Loss 2.3102 (2.3588)	Entropy 0.53707 (0.53708)	Top-1 acc 67.188 (67.287)	Top-5 acc 85.156 (86.155)	lr 0.00072
Train [107][3120/3239]	Time 0.240 (0.530)	Data Time 0.001 (0.014)	Loss 2.1553 (2.3589)	Entropy 0.53727 (0.53708)	Top-1 acc 67.969 (67.284)	Top-5 acc 90.625 (86.152)	lr 0.00072
Train [107][3130/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.014)	Loss 2.3209 (2.3588)	Entropy 0.53746 (0.53708)	Top-1 acc 64.844 (67.285)	Top-5 acc 88.672 (86.154)	lr 0.00072
Train [107][3140/3239]	Time 0.264 (0.529)	Data Time 0.001 (0.014)	Loss 2.1842 (2.3589)	Entropy 0.53745 (0.53708)	Top-1 acc 71.094 (67.284)	Top-5 acc 89.062 (86.154)	lr 0.00072
Train [107][3150/3239]	Time 0.226 (0.529)	Data Time 0.001 (0.014)	Loss 2.3308 (2.3591)	Entropy 0.53733 (0.53708)	Top-1 acc 66.797 (67.277)	Top-5 acc 87.500 (86.150)	lr 0.00072
Train [107][3160/3239]	Time 0.278 (0.529)	Data Time 0.001 (0.014)	Loss 2.2628 (2.3590)	Entropy 0.53705 (0.53708)	Top-1 acc 69.141 (67.280)	Top-5 acc 88.281 (86.152)	lr 0.00072
Train [107][3170/3239]	Time 0.227 (0.528)	Data Time 0.001 (0.014)	Loss 2.1598 (2.3588)	Entropy 0.53716 (0.53708)	Top-1 acc 70.703 (67.280)	Top-5 acc 89.062 (86.153)	lr 0.00072
Train [107][3180/3239]	Time 0.252 (0.528)	Data Time 0.000 (0.014)	Loss 2.4192 (2.3590)	Entropy 0.53739 (0.53709)	Top-1 acc 67.578 (67.279)	Top-5 acc 85.156 (86.152)	lr 0.00072
Train [107][3190/3239]	Time 0.258 (0.528)	Data Time 0.000 (0.014)	Loss 2.4342 (2.3589)	Entropy 0.53670 (0.53709)	Top-1 acc 66.406 (67.281)	Top-5 acc 85.938 (86.154)	lr 0.00072
Train [107][3200/3239]	Time 0.246 (0.527)	Data Time 0.000 (0.014)	Loss 2.1804 (2.3591)	Entropy 0.53658 (0.53708)	Top-1 acc 70.703 (67.275)	Top-5 acc 88.672 (86.150)	lr 0.00072
Train [107][3210/3239]	Time 0.281 (0.527)	Data Time 0.000 (0.014)	Loss 2.1835 (2.3590)	Entropy 0.53650 (0.53708)	Top-1 acc 72.266 (67.277)	Top-5 acc 90.625 (86.151)	lr 0.00072
Train [107][3220/3239]	Time 0.251 (0.527)	Data Time 0.000 (0.014)	Loss 2.2872 (2.3589)	Entropy 0.53643 (0.53708)	Top-1 acc 67.969 (67.281)	Top-5 acc 86.719 (86.153)	lr 0.00072
Train [107][3230/3239]	Time 0.239 (0.527)	Data Time 0.000 (0.014)	Loss 2.3039 (2.3591)	Entropy 0.53674 (0.53708)	Top-1 acc 69.531 (67.279)	Top-5 acc 86.719 (86.148)	lr 0.00072
Train [107][3239/3239]	Time 1.020 (0.526)	Data Time 0.000 (0.014)	Loss 2.9083 (2.3590)	Entropy 0.53686 (0.53708)	Top-1 acc 49.383 (67.281)	Top-5 acc 74.074 (86.149)	lr 0.00072
==========Valid [107/120]	loss 1.179	top-1 acc 72.688 (72.893)	top-5 acc 90.573	Train top-1 67.281	top-5 86.149	Entropy 0.53686	Latency-None: 0.000ms	Flops: 539.00M
Train [108][0/3239]	Time 36.714 (36.714)	Data Time 34.299 (34.299)	Loss 2.3603 (2.3603)	Entropy 0.53701 (0.53701)	Top-1 acc 71.484 (71.484)	Top-5 acc 85.938 (85.938)	lr 0.00072
Train [108][10/3239]	Time 0.246 (3.955)	Data Time 0.001 (3.266)	Loss 2.5797 (2.3442)	Entropy 0.53650 (0.53678)	Top-1 acc 64.453 (68.999)	Top-5 acc 83.594 (86.399)	lr 0.00072
Train [108][20/3239]	Time 0.236 (2.271)	Data Time 0.002 (1.712)	Loss 2.2580 (2.3563)	Entropy 0.53604 (0.53661)	Top-1 acc 71.484 (68.173)	Top-5 acc 87.109 (85.993)	lr 0.00072
Train [108][30/3239]	Time 0.235 (1.669)	Data Time 0.001 (1.160)	Loss 2.1544 (2.3360)	Entropy 0.53639 (0.53648)	Top-1 acc 71.484 (68.246)	Top-5 acc 89.453 (86.391)	lr 0.00072
Train [108][40/3239]	Time 0.227 (1.366)	Data Time 0.001 (0.878)	Loss 2.5013 (2.3428)	Entropy 0.53650 (0.53649)	Top-1 acc 67.969 (68.245)	Top-5 acc 84.766 (86.471)	lr 0.00072
Train [108][50/3239]	Time 0.232 (1.178)	Data Time 0.001 (0.706)	Loss 2.8199 (2.3442)	Entropy 0.53648 (0.53650)	Top-1 acc 58.203 (68.183)	Top-5 acc 76.562 (86.343)	lr 0.00072
Train [108][60/3239]	Time 0.226 (1.052)	Data Time 0.001 (0.590)	Loss 2.2840 (2.3522)	Entropy 0.53649 (0.53652)	Top-1 acc 70.703 (67.879)	Top-5 acc 86.328 (86.194)	lr 0.00071
Train [108][70/3239]	Time 0.233 (0.964)	Data Time 0.001 (0.507)	Loss 2.2421 (2.3557)	Entropy 0.53713 (0.53654)	Top-1 acc 66.406 (67.837)	Top-5 acc 89.844 (86.141)	lr 0.00071
Train [108][80/3239]	Time 0.346 (0.897)	Data Time 0.001 (0.445)	Loss 2.3618 (2.3495)	Entropy 0.53732 (0.53662)	Top-1 acc 69.531 (67.843)	Top-5 acc 86.328 (86.236)	lr 0.00071
Train [108][90/3239]	Time 0.258 (0.845)	Data Time 0.001 (0.396)	Loss 2.2524 (2.3434)	Entropy 0.53737 (0.53670)	Top-1 acc 73.438 (67.977)	Top-5 acc 87.500 (86.328)	lr 0.00071
Train [108][100/3239]	Time 0.221 (0.817)	Data Time 0.001 (0.357)	Loss 2.2501 (2.3428)	Entropy 0.53737 (0.53677)	Top-1 acc 69.531 (68.019)	Top-5 acc 89.062 (86.336)	lr 0.00071
Train [108][110/3239]	Time 0.221 (0.787)	Data Time 0.001 (0.325)	Loss 2.4335 (2.3476)	Entropy 0.53749 (0.53683)	Top-1 acc 66.016 (67.832)	Top-5 acc 84.766 (86.303)	lr 0.00071
Train [108][120/3239]	Time 0.234 (0.755)	Data Time 0.002 (0.298)	Loss 2.3335 (2.3525)	Entropy 0.53770 (0.53690)	Top-1 acc 68.359 (67.688)	Top-5 acc 85.156 (86.251)	lr 0.00071
Train [108][130/3239]	Time 0.228 (0.728)	Data Time 0.001 (0.276)	Loss 2.3543 (2.3522)	Entropy 0.53772 (0.53696)	Top-1 acc 68.359 (67.697)	Top-5 acc 84.375 (86.215)	lr 0.00071
Train [108][140/3239]	Time 0.225 (0.705)	Data Time 0.001 (0.256)	Loss 2.1385 (2.3492)	Entropy 0.53766 (0.53701)	Top-1 acc 71.484 (67.711)	Top-5 acc 89.453 (86.242)	lr 0.00071
Train [108][150/3239]	Time 0.351 (0.687)	Data Time 0.001 (0.239)	Loss 2.4476 (2.3500)	Entropy 0.53793 (0.53706)	Top-1 acc 63.672 (67.669)	Top-5 acc 84.766 (86.245)	lr 0.00071
Train [108][160/3239]	Time 0.235 (0.670)	Data Time 0.001 (0.225)	Loss 2.2326 (2.3469)	Entropy 0.53791 (0.53712)	Top-1 acc 67.188 (67.729)	Top-5 acc 89.453 (86.314)	lr 0.00071
Train [108][170/3239]	Time 0.257 (0.659)	Data Time 0.001 (0.212)	Loss 2.4055 (2.3472)	Entropy 0.53754 (0.53715)	Top-1 acc 67.578 (67.749)	Top-5 acc 83.594 (86.246)	lr 0.00071
Train [108][180/3239]	Time 0.228 (0.646)	Data Time 0.001 (0.200)	Loss 2.2853 (2.3492)	Entropy 0.53732 (0.53717)	Top-1 acc 71.875 (67.716)	Top-5 acc 86.719 (86.179)	lr 0.00071
Train [108][190/3239]	Time 0.223 (0.633)	Data Time 0.001 (0.190)	Loss 2.4013 (2.3474)	Entropy 0.53729 (0.53718)	Top-1 acc 63.281 (67.725)	Top-5 acc 84.766 (86.205)	lr 0.00071
Train [108][200/3239]	Time 0.234 (0.621)	Data Time 0.001 (0.180)	Loss 2.2963 (2.3453)	Entropy 0.53759 (0.53719)	Top-1 acc 68.750 (67.743)	Top-5 acc 86.328 (86.235)	lr 0.00071
Train [108][210/3239]	Time 0.226 (0.611)	Data Time 0.001 (0.172)	Loss 2.1962 (2.3463)	Entropy 0.53736 (0.53720)	Top-1 acc 69.531 (67.673)	Top-5 acc 90.625 (86.234)	lr 0.00071
Train [108][220/3239]	Time 0.234 (0.602)	Data Time 0.001 (0.164)	Loss 2.3034 (2.3429)	Entropy 0.53735 (0.53721)	Top-1 acc 69.141 (67.780)	Top-5 acc 87.891 (86.314)	lr 0.00071
Train [108][230/3239]	Time 0.225 (0.594)	Data Time 0.001 (0.157)	Loss 2.3333 (2.3440)	Entropy 0.53761 (0.53722)	Top-1 acc 67.969 (67.757)	Top-5 acc 84.766 (86.277)	lr 0.00071
Train [108][240/3239]	Time 0.231 (0.586)	Data Time 0.001 (0.151)	Loss 2.1629 (2.3440)	Entropy 0.53799 (0.53724)	Top-1 acc 68.750 (67.719)	Top-5 acc 91.016 (86.291)	lr 0.00071
Train [108][250/3239]	Time 0.230 (0.579)	Data Time 0.001 (0.145)	Loss 2.5460 (2.3441)	Entropy 0.53802 (0.53727)	Top-1 acc 62.891 (67.738)	Top-5 acc 83.594 (86.316)	lr 0.00071
Train [108][260/3239]	Time 0.240 (0.572)	Data Time 0.001 (0.139)	Loss 2.2451 (2.3447)	Entropy 0.53763 (0.53729)	Top-1 acc 64.453 (67.702)	Top-5 acc 91.016 (86.318)	lr 0.00071
Train [108][270/3239]	Time 0.228 (0.567)	Data Time 0.001 (0.134)	Loss 2.1576 (2.3437)	Entropy 0.53789 (0.53731)	Top-1 acc 72.656 (67.755)	Top-5 acc 89.062 (86.338)	lr 0.00071
Train [108][280/3239]	Time 0.225 (0.561)	Data Time 0.001 (0.129)	Loss 2.3416 (2.3444)	Entropy 0.53758 (0.53733)	Top-1 acc 66.016 (67.734)	Top-5 acc 86.328 (86.318)	lr 0.00071
Train [108][290/3239]	Time 0.262 (0.556)	Data Time 0.003 (0.125)	Loss 2.2672 (2.3429)	Entropy 0.53717 (0.53734)	Top-1 acc 70.703 (67.773)	Top-5 acc 89.062 (86.346)	lr 0.00071
Train [108][300/3239]	Time 0.234 (0.551)	Data Time 0.001 (0.121)	Loss 2.2430 (2.3414)	Entropy 0.53738 (0.53733)	Top-1 acc 68.750 (67.810)	Top-5 acc 87.500 (86.357)	lr 0.00071
Train [108][310/3239]	Time 0.361 (0.546)	Data Time 0.001 (0.117)	Loss 2.1997 (2.3427)	Entropy 0.53766 (0.53734)	Top-1 acc 69.531 (67.789)	Top-5 acc 91.406 (86.343)	lr 0.00071
Train [108][320/3239]	Time 0.238 (0.543)	Data Time 0.001 (0.113)	Loss 2.4178 (2.3425)	Entropy 0.53748 (0.53734)	Top-1 acc 62.891 (67.789)	Top-5 acc 86.328 (86.366)	lr 0.00071
Train [108][330/3239]	Time 0.242 (0.539)	Data Time 0.001 (0.110)	Loss 2.4734 (2.3410)	Entropy 0.53769 (0.53735)	Top-1 acc 64.453 (67.792)	Top-5 acc 85.156 (86.394)	lr 0.00071
Train [108][340/3239]	Time 0.239 (0.536)	Data Time 0.001 (0.107)	Loss 2.1061 (2.3395)	Entropy 0.53773 (0.53736)	Top-1 acc 74.609 (67.828)	Top-5 acc 90.234 (86.435)	lr 0.00071
Train [108][350/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.104)	Loss 2.3110 (2.3385)	Entropy 0.53796 (0.53737)	Top-1 acc 68.750 (67.843)	Top-5 acc 86.328 (86.448)	lr 0.00071
Train [108][360/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.101)	Loss 2.4543 (2.3389)	Entropy 0.53819 (0.53739)	Top-1 acc 64.453 (67.825)	Top-5 acc 83.984 (86.438)	lr 0.00070
Train [108][370/3239]	Time 0.257 (0.526)	Data Time 0.001 (0.098)	Loss 2.3393 (2.3397)	Entropy 0.53836 (0.53741)	Top-1 acc 65.625 (67.832)	Top-5 acc 87.500 (86.440)	lr 0.00070
Train [108][380/3239]	Time 0.368 (0.524)	Data Time 0.001 (0.096)	Loss 2.2361 (2.3391)	Entropy 0.53795 (0.53743)	Top-1 acc 70.312 (67.852)	Top-5 acc 87.109 (86.443)	lr 0.00070
Train [108][390/3239]	Time 0.236 (0.521)	Data Time 0.001 (0.093)	Loss 2.4454 (2.3397)	Entropy 0.53777 (0.53744)	Top-1 acc 64.453 (67.810)	Top-5 acc 84.766 (86.449)	lr 0.00070
Train [108][400/3239]	Time 0.237 (0.518)	Data Time 0.001 (0.091)	Loss 2.7600 (2.3419)	Entropy 0.53775 (0.53745)	Top-1 acc 58.984 (67.754)	Top-5 acc 78.125 (86.404)	lr 0.00070
Train [108][410/3239]	Time 0.308 (0.518)	Data Time 0.001 (0.089)	Loss 2.4984 (2.3431)	Entropy 0.53754 (0.53746)	Top-1 acc 58.984 (67.684)	Top-5 acc 85.547 (86.391)	lr 0.00070
Train [108][420/3239]	Time 0.222 (0.516)	Data Time 0.001 (0.087)	Loss 2.4994 (2.3430)	Entropy 0.53726 (0.53746)	Top-1 acc 65.234 (67.670)	Top-5 acc 85.547 (86.396)	lr 0.00070
Train [108][430/3239]	Time 0.222 (0.514)	Data Time 0.001 (0.085)	Loss 2.1934 (2.3441)	Entropy 0.53697 (0.53745)	Top-1 acc 72.656 (67.643)	Top-5 acc 89.453 (86.392)	lr 0.00070
Train [108][440/3239]	Time 0.410 (0.628)	Data Time 0.007 (0.083)	Loss 2.2574 (2.3439)	Entropy 0.53710 (0.53744)	Top-1 acc 65.234 (67.645)	Top-5 acc 88.281 (86.387)	lr 0.00070
Train [108][450/3239]	Time 0.238 (0.625)	Data Time 0.002 (0.081)	Loss 2.4832 (2.3440)	Entropy 0.53701 (0.53743)	Top-1 acc 63.672 (67.638)	Top-5 acc 85.156 (86.379)	lr 0.00070
Train [108][460/3239]	Time 0.252 (0.622)	Data Time 0.001 (0.080)	Loss 2.2916 (2.3434)	Entropy 0.53695 (0.53743)	Top-1 acc 69.922 (67.646)	Top-5 acc 86.719 (86.389)	lr 0.00070
Train [108][470/3239]	Time 0.478 (0.620)	Data Time 0.002 (0.078)	Loss 2.3420 (2.3432)	Entropy 0.53670 (0.53741)	Top-1 acc 63.281 (67.623)	Top-5 acc 87.109 (86.396)	lr 0.00070
Train [108][480/3239]	Time 0.234 (0.617)	Data Time 0.001 (0.076)	Loss 2.4456 (2.3450)	Entropy 0.53630 (0.53739)	Top-1 acc 65.625 (67.585)	Top-5 acc 82.812 (86.347)	lr 0.00070
Train [108][490/3239]	Time 0.246 (0.613)	Data Time 0.001 (0.075)	Loss 2.2154 (2.3455)	Entropy 0.53640 (0.53737)	Top-1 acc 73.438 (67.572)	Top-5 acc 89.453 (86.327)	lr 0.00070
Train [108][500/3239]	Time 0.228 (0.609)	Data Time 0.001 (0.073)	Loss 2.3891 (2.3456)	Entropy 0.53653 (0.53736)	Top-1 acc 68.359 (67.583)	Top-5 acc 87.109 (86.323)	lr 0.00070
Train [108][510/3239]	Time 0.231 (0.606)	Data Time 0.001 (0.072)	Loss 2.3134 (2.3460)	Entropy 0.53685 (0.53734)	Top-1 acc 65.625 (67.567)	Top-5 acc 86.719 (86.320)	lr 0.00070
Train [108][520/3239]	Time 0.249 (0.602)	Data Time 0.001 (0.071)	Loss 2.2413 (2.3454)	Entropy 0.53716 (0.53733)	Top-1 acc 69.922 (67.566)	Top-5 acc 89.062 (86.336)	lr 0.00070
Train [108][530/3239]	Time 0.292 (0.599)	Data Time 0.002 (0.069)	Loss 2.1854 (2.3454)	Entropy 0.53745 (0.53733)	Top-1 acc 72.656 (67.573)	Top-5 acc 88.281 (86.339)	lr 0.00070
Train [108][540/3239]	Time 0.364 (0.596)	Data Time 0.002 (0.068)	Loss 2.5205 (2.3451)	Entropy 0.53786 (0.53734)	Top-1 acc 63.281 (67.582)	Top-5 acc 84.375 (86.349)	lr 0.00070
Train [108][550/3239]	Time 0.276 (0.593)	Data Time 0.002 (0.067)	Loss 2.4064 (2.3463)	Entropy 0.53802 (0.53735)	Top-1 acc 67.578 (67.572)	Top-5 acc 85.547 (86.323)	lr 0.00070
Train [108][560/3239]	Time 0.225 (0.590)	Data Time 0.001 (0.066)	Loss 2.4426 (2.3460)	Entropy 0.53809 (0.53736)	Top-1 acc 64.844 (67.581)	Top-5 acc 87.109 (86.334)	lr 0.00070
Train [108][570/3239]	Time 0.232 (0.588)	Data Time 0.001 (0.065)	Loss 2.2801 (2.3463)	Entropy 0.53818 (0.53737)	Top-1 acc 67.188 (67.572)	Top-5 acc 87.500 (86.321)	lr 0.00070
Train [108][580/3239]	Time 0.236 (0.585)	Data Time 0.002 (0.064)	Loss 2.4103 (2.3458)	Entropy 0.53794 (0.53738)	Top-1 acc 66.406 (67.578)	Top-5 acc 87.500 (86.334)	lr 0.00070
Train [108][590/3239]	Time 0.271 (0.583)	Data Time 0.002 (0.062)	Loss 2.1821 (2.3460)	Entropy 0.53800 (0.53739)	Top-1 acc 70.703 (67.567)	Top-5 acc 88.672 (86.325)	lr 0.00070
Train [108][600/3239]	Time 0.265 (0.580)	Data Time 0.001 (0.061)	Loss 2.3992 (2.3458)	Entropy 0.53762 (0.53740)	Top-1 acc 66.406 (67.587)	Top-5 acc 82.812 (86.326)	lr 0.00070
Train [108][610/3239]	Time 0.263 (0.578)	Data Time 0.001 (0.060)	Loss 2.4617 (2.3457)	Entropy 0.53744 (0.53740)	Top-1 acc 66.016 (67.592)	Top-5 acc 83.984 (86.327)	lr 0.00070
Train [108][620/3239]	Time 0.232 (0.575)	Data Time 0.001 (0.060)	Loss 2.3814 (2.3456)	Entropy 0.53771 (0.53740)	Top-1 acc 66.797 (67.605)	Top-5 acc 85.156 (86.327)	lr 0.00070
Train [108][630/3239]	Time 0.345 (0.573)	Data Time 0.001 (0.059)	Loss 2.3882 (2.3456)	Entropy 0.53763 (0.53741)	Top-1 acc 67.578 (67.597)	Top-5 acc 84.375 (86.329)	lr 0.00070
Train [108][640/3239]	Time 0.238 (0.570)	Data Time 0.001 (0.058)	Loss 2.3454 (2.3462)	Entropy 0.53815 (0.53741)	Top-1 acc 69.531 (67.596)	Top-5 acc 85.156 (86.320)	lr 0.00070
Train [108][650/3239]	Time 0.272 (0.568)	Data Time 0.001 (0.057)	Loss 2.3565 (2.3469)	Entropy 0.53801 (0.53742)	Top-1 acc 68.359 (67.578)	Top-5 acc 84.375 (86.299)	lr 0.00070
Train [108][660/3239]	Time 0.240 (0.566)	Data Time 0.001 (0.056)	Loss 2.2505 (2.3473)	Entropy 0.53791 (0.53743)	Top-1 acc 70.312 (67.561)	Top-5 acc 85.156 (86.285)	lr 0.00069
Train [108][670/3239]	Time 0.231 (0.564)	Data Time 0.001 (0.055)	Loss 2.3506 (2.3485)	Entropy 0.53818 (0.53744)	Top-1 acc 66.797 (67.523)	Top-5 acc 86.719 (86.266)	lr 0.00069
Train [108][680/3239]	Time 0.240 (0.562)	Data Time 0.001 (0.054)	Loss 2.2662 (2.3480)	Entropy 0.53818 (0.53745)	Top-1 acc 69.531 (67.547)	Top-5 acc 88.672 (86.274)	lr 0.00069
Train [108][690/3239]	Time 0.227 (0.561)	Data Time 0.001 (0.054)	Loss 2.2523 (2.3469)	Entropy 0.53827 (0.53746)	Top-1 acc 71.094 (67.576)	Top-5 acc 87.500 (86.292)	lr 0.00069
Train [108][700/3239]	Time 0.341 (0.558)	Data Time 0.001 (0.053)	Loss 2.1625 (2.3481)	Entropy 0.53805 (0.53747)	Top-1 acc 73.828 (67.551)	Top-5 acc 90.234 (86.269)	lr 0.00069
Train [108][710/3239]	Time 0.241 (0.556)	Data Time 0.001 (0.052)	Loss 2.4019 (2.3481)	Entropy 0.53778 (0.53748)	Top-1 acc 66.016 (67.553)	Top-5 acc 86.328 (86.266)	lr 0.00069
Train [108][720/3239]	Time 0.235 (0.555)	Data Time 0.001 (0.052)	Loss 2.1875 (2.3476)	Entropy 0.53785 (0.53748)	Top-1 acc 66.797 (67.570)	Top-5 acc 91.016 (86.271)	lr 0.00069
Train [108][730/3239]	Time 0.235 (0.553)	Data Time 0.001 (0.051)	Loss 2.4005 (2.3491)	Entropy 0.53793 (0.53749)	Top-1 acc 66.016 (67.549)	Top-5 acc 85.547 (86.243)	lr 0.00069
Train [108][740/3239]	Time 0.232 (0.551)	Data Time 0.001 (0.050)	Loss 2.4280 (2.3492)	Entropy 0.53724 (0.53749)	Top-1 acc 64.062 (67.546)	Top-5 acc 83.594 (86.242)	lr 0.00069
Train [108][750/3239]	Time 0.228 (0.549)	Data Time 0.001 (0.050)	Loss 2.3674 (2.3499)	Entropy 0.53719 (0.53749)	Top-1 acc 66.797 (67.526)	Top-5 acc 86.328 (86.235)	lr 0.00069
Train [108][760/3239]	Time 0.234 (0.548)	Data Time 0.001 (0.049)	Loss 2.1228 (2.3510)	Entropy 0.53747 (0.53748)	Top-1 acc 71.094 (67.489)	Top-5 acc 90.625 (86.224)	lr 0.00069
Train [108][770/3239]	Time 0.263 (0.547)	Data Time 0.002 (0.048)	Loss 2.3530 (2.3523)	Entropy 0.53716 (0.53748)	Top-1 acc 64.453 (67.440)	Top-5 acc 83.203 (86.203)	lr 0.00069
Train [108][780/3239]	Time 0.269 (0.545)	Data Time 0.002 (0.048)	Loss 2.5032 (2.3527)	Entropy 0.53730 (0.53748)	Top-1 acc 65.234 (67.429)	Top-5 acc 84.766 (86.198)	lr 0.00069
Train [108][790/3239]	Time 0.295 (0.544)	Data Time 0.001 (0.047)	Loss 2.1692 (2.3526)	Entropy 0.53697 (0.53748)	Top-1 acc 71.484 (67.430)	Top-5 acc 87.500 (86.198)	lr 0.00069
Train [108][800/3239]	Time 0.233 (0.542)	Data Time 0.001 (0.047)	Loss 2.3233 (2.3530)	Entropy 0.53716 (0.53747)	Top-1 acc 67.578 (67.425)	Top-5 acc 86.719 (86.190)	lr 0.00069
Train [108][810/3239]	Time 0.238 (0.541)	Data Time 0.001 (0.046)	Loss 2.3986 (2.3526)	Entropy 0.53710 (0.53747)	Top-1 acc 65.234 (67.432)	Top-5 acc 86.328 (86.202)	lr 0.00069
Train [108][820/3239]	Time 0.226 (0.539)	Data Time 0.001 (0.045)	Loss 2.4316 (2.3533)	Entropy 0.53737 (0.53746)	Top-1 acc 66.797 (67.424)	Top-5 acc 87.500 (86.198)	lr 0.00069
Train [108][830/3239]	Time 0.239 (0.538)	Data Time 0.001 (0.045)	Loss 2.2750 (2.3531)	Entropy 0.53782 (0.53746)	Top-1 acc 68.750 (67.425)	Top-5 acc 87.891 (86.202)	lr 0.00069
Train [108][840/3239]	Time 0.302 (0.537)	Data Time 0.001 (0.044)	Loss 2.4210 (2.3540)	Entropy 0.53763 (0.53747)	Top-1 acc 64.062 (67.416)	Top-5 acc 83.594 (86.182)	lr 0.00069
Train [108][850/3239]	Time 0.236 (0.535)	Data Time 0.001 (0.044)	Loss 2.3125 (2.3541)	Entropy 0.53756 (0.53747)	Top-1 acc 69.922 (67.409)	Top-5 acc 87.891 (86.183)	lr 0.00069
Train [108][860/3239]	Time 0.335 (0.534)	Data Time 0.001 (0.043)	Loss 2.1740 (2.3545)	Entropy 0.53745 (0.53747)	Top-1 acc 72.656 (67.404)	Top-5 acc 89.844 (86.176)	lr 0.00069
Train [108][870/3239]	Time 0.239 (0.533)	Data Time 0.001 (0.043)	Loss 2.4766 (2.3540)	Entropy 0.53763 (0.53747)	Top-1 acc 63.672 (67.408)	Top-5 acc 84.375 (86.180)	lr 0.00069
Train [108][880/3239]	Time 0.307 (0.532)	Data Time 0.002 (0.042)	Loss 2.3753 (2.3547)	Entropy 0.53758 (0.53747)	Top-1 acc 68.359 (67.407)	Top-5 acc 84.766 (86.164)	lr 0.00069
Train [108][890/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.042)	Loss 2.4628 (2.3541)	Entropy 0.53788 (0.53747)	Top-1 acc 61.719 (67.403)	Top-5 acc 84.375 (86.173)	lr 0.00069
Train [108][900/3239]	Time 0.224 (0.530)	Data Time 0.001 (0.042)	Loss 2.4870 (2.3545)	Entropy 0.53819 (0.53748)	Top-1 acc 64.062 (67.386)	Top-5 acc 83.984 (86.166)	lr 0.00069
Train [108][910/3239]	Time 0.226 (0.529)	Data Time 0.001 (0.041)	Loss 2.6599 (2.3549)	Entropy 0.53840 (0.53749)	Top-1 acc 60.156 (67.388)	Top-5 acc 80.859 (86.158)	lr 0.00069
Train [108][920/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.041)	Loss 2.4327 (2.3547)	Entropy 0.53805 (0.53750)	Top-1 acc 66.797 (67.397)	Top-5 acc 84.766 (86.156)	lr 0.00069
Train [108][930/3239]	Time 0.413 (0.526)	Data Time 0.001 (0.040)	Loss 2.5823 (2.3557)	Entropy 0.53791 (0.53750)	Top-1 acc 59.766 (67.378)	Top-5 acc 81.641 (86.138)	lr 0.00069
Train [108][940/3239]	Time 0.239 (0.525)	Data Time 0.001 (0.040)	Loss 2.2689 (2.3555)	Entropy 0.53813 (0.53751)	Top-1 acc 69.531 (67.381)	Top-5 acc 85.938 (86.137)	lr 0.00069
Train [108][950/3239]	Time 0.239 (0.524)	Data Time 0.001 (0.039)	Loss 2.2701 (2.3556)	Entropy 0.53844 (0.53751)	Top-1 acc 71.875 (67.385)	Top-5 acc 85.547 (86.135)	lr 0.00069
Train [108][960/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.039)	Loss 2.4676 (2.3553)	Entropy 0.53822 (0.53752)	Top-1 acc 69.922 (67.398)	Top-5 acc 82.812 (86.138)	lr 0.00068
Train [108][970/3239]	Time 0.253 (0.522)	Data Time 0.001 (0.039)	Loss 2.5286 (2.3556)	Entropy 0.53811 (0.53753)	Top-1 acc 64.844 (67.392)	Top-5 acc 83.984 (86.133)	lr 0.00068
Train [108][980/3239]	Time 0.263 (0.521)	Data Time 0.001 (0.038)	Loss 2.5813 (2.3559)	Entropy 0.53841 (0.53754)	Top-1 acc 63.281 (67.375)	Top-5 acc 81.641 (86.123)	lr 0.00068
Train [108][990/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.038)	Loss 2.2232 (2.3562)	Entropy 0.53827 (0.53754)	Top-1 acc 70.703 (67.372)	Top-5 acc 87.500 (86.123)	lr 0.00068
Train [108][1000/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.038)	Loss 2.3250 (2.3563)	Entropy 0.53819 (0.53755)	Top-1 acc 66.406 (67.374)	Top-5 acc 86.719 (86.119)	lr 0.00068
Train [108][1010/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.037)	Loss 2.3194 (2.3562)	Entropy 0.53751 (0.53755)	Top-1 acc 69.141 (67.384)	Top-5 acc 85.938 (86.117)	lr 0.00068
Train [108][1020/3239]	Time 0.353 (0.516)	Data Time 0.001 (0.037)	Loss 2.2935 (2.3564)	Entropy 0.53719 (0.53755)	Top-1 acc 69.922 (67.381)	Top-5 acc 87.109 (86.118)	lr 0.00068
Train [108][1030/3239]	Time 0.244 (0.515)	Data Time 0.001 (0.037)	Loss 2.0060 (2.3562)	Entropy 0.53727 (0.53755)	Top-1 acc 75.781 (67.388)	Top-5 acc 90.234 (86.124)	lr 0.00068
Train [108][1040/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.036)	Loss 2.0639 (2.3561)	Entropy 0.53719 (0.53755)	Top-1 acc 73.438 (67.395)	Top-5 acc 90.234 (86.124)	lr 0.00068
Train [108][1050/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.036)	Loss 2.2388 (2.3568)	Entropy 0.53720 (0.53754)	Top-1 acc 69.141 (67.361)	Top-5 acc 85.938 (86.113)	lr 0.00068
Train [108][1060/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.036)	Loss 2.3750 (2.3567)	Entropy 0.53667 (0.53754)	Top-1 acc 68.750 (67.369)	Top-5 acc 86.328 (86.118)	lr 0.00068
Train [108][1070/3239]	Time 0.248 (0.512)	Data Time 0.001 (0.035)	Loss 2.3910 (2.3569)	Entropy 0.53684 (0.53753)	Top-1 acc 64.453 (67.359)	Top-5 acc 87.500 (86.122)	lr 0.00068
Train [108][1080/3239]	Time 0.254 (0.511)	Data Time 0.001 (0.035)	Loss 2.6135 (2.3570)	Entropy 0.53699 (0.53753)	Top-1 acc 59.766 (67.351)	Top-5 acc 80.078 (86.117)	lr 0.00068
Train [108][1090/3239]	Time 0.385 (0.510)	Data Time 0.025 (0.035)	Loss 2.1018 (2.3561)	Entropy 0.53685 (0.53752)	Top-1 acc 71.484 (67.369)	Top-5 acc 89.844 (86.131)	lr 0.00068
Train [108][1100/3239]	Time 0.252 (0.559)	Data Time 0.002 (0.034)	Loss 2.4293 (2.3558)	Entropy 0.53677 (0.53751)	Top-1 acc 65.234 (67.372)	Top-5 acc 82.812 (86.140)	lr 0.00068
Train [108][1110/3239]	Time 0.247 (0.558)	Data Time 0.002 (0.034)	Loss 2.3970 (2.3560)	Entropy 0.53704 (0.53751)	Top-1 acc 66.797 (67.361)	Top-5 acc 84.766 (86.134)	lr 0.00068
Train [108][1120/3239]	Time 0.243 (0.557)	Data Time 0.001 (0.034)	Loss 2.3181 (2.3555)	Entropy 0.53724 (0.53750)	Top-1 acc 68.359 (67.372)	Top-5 acc 87.109 (86.143)	lr 0.00068
Train [108][1130/3239]	Time 0.245 (0.556)	Data Time 0.001 (0.033)	Loss 2.3221 (2.3549)	Entropy 0.53744 (0.53750)	Top-1 acc 71.094 (67.393)	Top-5 acc 87.500 (86.147)	lr 0.00068
Train [108][1140/3239]	Time 0.239 (0.555)	Data Time 0.001 (0.033)	Loss 2.3597 (2.3546)	Entropy 0.53721 (0.53750)	Top-1 acc 70.312 (67.405)	Top-5 acc 84.766 (86.151)	lr 0.00068
Train [108][1150/3239]	Time 0.237 (0.554)	Data Time 0.001 (0.033)	Loss 2.3703 (2.3541)	Entropy 0.53729 (0.53750)	Top-1 acc 66.016 (67.416)	Top-5 acc 84.375 (86.156)	lr 0.00068
Train [108][1160/3239]	Time 0.252 (0.553)	Data Time 0.001 (0.033)	Loss 2.1948 (2.3544)	Entropy 0.53772 (0.53750)	Top-1 acc 72.266 (67.406)	Top-5 acc 90.625 (86.152)	lr 0.00068
Train [108][1170/3239]	Time 0.233 (0.551)	Data Time 0.002 (0.032)	Loss 2.6995 (2.3546)	Entropy 0.53793 (0.53750)	Top-1 acc 57.031 (67.401)	Top-5 acc 80.078 (86.147)	lr 0.00068
Train [108][1180/3239]	Time 0.390 (0.551)	Data Time 0.001 (0.032)	Loss 2.3609 (2.3550)	Entropy 0.53808 (0.53751)	Top-1 acc 69.141 (67.398)	Top-5 acc 84.766 (86.137)	lr 0.00068
Train [108][1190/3239]	Time 0.257 (0.550)	Data Time 0.001 (0.032)	Loss 2.1789 (2.3551)	Entropy 0.53813 (0.53751)	Top-1 acc 69.922 (67.398)	Top-5 acc 89.453 (86.134)	lr 0.00068
Train [108][1200/3239]	Time 0.232 (0.548)	Data Time 0.001 (0.032)	Loss 2.3881 (2.3550)	Entropy 0.53829 (0.53752)	Top-1 acc 66.797 (67.402)	Top-5 acc 87.891 (86.139)	lr 0.00068
Train [108][1210/3239]	Time 0.231 (0.547)	Data Time 0.001 (0.031)	Loss 2.2712 (2.3549)	Entropy 0.53830 (0.53753)	Top-1 acc 69.531 (67.401)	Top-5 acc 87.891 (86.143)	lr 0.00068
Train [108][1220/3239]	Time 0.241 (0.546)	Data Time 0.001 (0.031)	Loss 2.4636 (2.3548)	Entropy 0.53867 (0.53753)	Top-1 acc 68.359 (67.409)	Top-5 acc 84.766 (86.143)	lr 0.00068
Train [108][1230/3239]	Time 0.242 (0.546)	Data Time 0.001 (0.031)	Loss 2.3086 (2.3540)	Entropy 0.53847 (0.53754)	Top-1 acc 73.047 (67.435)	Top-5 acc 83.594 (86.155)	lr 0.00068
Train [108][1240/3239]	Time 0.240 (0.545)	Data Time 0.002 (0.031)	Loss 2.3633 (2.3538)	Entropy 0.53823 (0.53755)	Top-1 acc 66.797 (67.441)	Top-5 acc 85.156 (86.162)	lr 0.00068
Train [108][1250/3239]	Time 0.331 (0.544)	Data Time 0.002 (0.030)	Loss 2.2259 (2.3538)	Entropy 0.53831 (0.53755)	Top-1 acc 71.875 (67.444)	Top-5 acc 87.891 (86.157)	lr 0.00068
Train [108][1260/3239]	Time 0.242 (0.543)	Data Time 0.001 (0.030)	Loss 2.4385 (2.3538)	Entropy 0.53885 (0.53756)	Top-1 acc 64.062 (67.447)	Top-5 acc 85.547 (86.161)	lr 0.00068
Train [108][1270/3239]	Time 0.307 (0.543)	Data Time 0.002 (0.030)	Loss 2.8369 (2.3541)	Entropy 0.53866 (0.53757)	Top-1 acc 54.297 (67.430)	Top-5 acc 78.516 (86.158)	lr 0.00067
Train [108][1280/3239]	Time 0.244 (0.543)	Data Time 0.001 (0.030)	Loss 2.3857 (2.3542)	Entropy 0.53891 (0.53758)	Top-1 acc 64.844 (67.422)	Top-5 acc 85.156 (86.153)	lr 0.00067
Train [108][1290/3239]	Time 0.237 (0.542)	Data Time 0.001 (0.030)	Loss 2.5672 (2.3552)	Entropy 0.53874 (0.53759)	Top-1 acc 60.938 (67.401)	Top-5 acc 83.203 (86.140)	lr 0.00067
Train [108][1300/3239]	Time 0.239 (0.541)	Data Time 0.002 (0.029)	Loss 2.5772 (2.3561)	Entropy 0.53889 (0.53760)	Top-1 acc 62.500 (67.377)	Top-5 acc 84.375 (86.129)	lr 0.00067
Train [108][1310/3239]	Time 0.256 (0.541)	Data Time 0.001 (0.029)	Loss 2.4536 (2.3559)	Entropy 0.53896 (0.53761)	Top-1 acc 66.797 (67.381)	Top-5 acc 83.594 (86.126)	lr 0.00067
Train [108][1320/3239]	Time 0.237 (0.540)	Data Time 0.001 (0.029)	Loss 2.1954 (2.3557)	Entropy 0.53898 (0.53762)	Top-1 acc 71.484 (67.394)	Top-5 acc 87.891 (86.126)	lr 0.00067
Train [108][1330/3239]	Time 0.241 (0.539)	Data Time 0.001 (0.029)	Loss 2.5257 (2.3565)	Entropy 0.53907 (0.53763)	Top-1 acc 59.766 (67.368)	Top-5 acc 84.375 (86.116)	lr 0.00067
Train [108][1340/3239]	Time 0.270 (0.538)	Data Time 0.001 (0.029)	Loss 2.3520 (2.3567)	Entropy 0.53902 (0.53764)	Top-1 acc 66.016 (67.361)	Top-5 acc 87.500 (86.115)	lr 0.00067
Train [108][1350/3239]	Time 0.233 (0.537)	Data Time 0.001 (0.028)	Loss 2.4767 (2.3565)	Entropy 0.53874 (0.53765)	Top-1 acc 64.844 (67.367)	Top-5 acc 83.984 (86.121)	lr 0.00067
Train [108][1360/3239]	Time 0.239 (0.537)	Data Time 0.001 (0.028)	Loss 2.2637 (2.3568)	Entropy 0.53885 (0.53766)	Top-1 acc 68.359 (67.356)	Top-5 acc 85.547 (86.117)	lr 0.00067
Train [108][1370/3239]	Time 0.261 (0.536)	Data Time 0.001 (0.028)	Loss 2.2564 (2.3568)	Entropy 0.53893 (0.53767)	Top-1 acc 67.969 (67.362)	Top-5 acc 88.281 (86.119)	lr 0.00067
Train [108][1380/3239]	Time 0.250 (0.535)	Data Time 0.001 (0.028)	Loss 2.4297 (2.3567)	Entropy 0.53915 (0.53768)	Top-1 acc 63.672 (67.363)	Top-5 acc 84.375 (86.121)	lr 0.00067
Train [108][1390/3239]	Time 0.248 (0.534)	Data Time 0.001 (0.028)	Loss 2.4253 (2.3574)	Entropy 0.53904 (0.53769)	Top-1 acc 64.062 (67.348)	Top-5 acc 85.547 (86.110)	lr 0.00067
Train [108][1400/3239]	Time 0.224 (0.533)	Data Time 0.001 (0.027)	Loss 2.2961 (2.3571)	Entropy 0.53874 (0.53770)	Top-1 acc 67.188 (67.357)	Top-5 acc 87.891 (86.116)	lr 0.00067
Train [108][1410/3239]	Time 0.335 (0.533)	Data Time 0.001 (0.027)	Loss 2.4250 (2.3570)	Entropy 0.53898 (0.53771)	Top-1 acc 65.234 (67.356)	Top-5 acc 85.938 (86.121)	lr 0.00067
Train [108][1420/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.027)	Loss 2.3232 (2.3570)	Entropy 0.53920 (0.53772)	Top-1 acc 67.578 (67.358)	Top-5 acc 84.375 (86.121)	lr 0.00067
Train [108][1430/3239]	Time 0.226 (0.531)	Data Time 0.001 (0.027)	Loss 2.2211 (2.3568)	Entropy 0.53921 (0.53773)	Top-1 acc 71.094 (67.360)	Top-5 acc 89.844 (86.127)	lr 0.00067
Train [108][1440/3239]	Time 0.240 (0.530)	Data Time 0.001 (0.027)	Loss 2.2784 (2.3564)	Entropy 0.53929 (0.53774)	Top-1 acc 68.750 (67.371)	Top-5 acc 87.109 (86.133)	lr 0.00067
Train [108][1450/3239]	Time 0.234 (0.530)	Data Time 0.001 (0.027)	Loss 2.8725 (2.3566)	Entropy 0.53930 (0.53775)	Top-1 acc 57.031 (67.366)	Top-5 acc 77.344 (86.134)	lr 0.00067
Train [108][1460/3239]	Time 0.271 (0.529)	Data Time 0.001 (0.026)	Loss 2.3470 (2.3570)	Entropy 0.53907 (0.53776)	Top-1 acc 65.625 (67.358)	Top-5 acc 84.766 (86.123)	lr 0.00067
Train [108][1470/3239]	Time 0.240 (0.528)	Data Time 0.001 (0.026)	Loss 2.1705 (2.3572)	Entropy 0.53908 (0.53777)	Top-1 acc 71.875 (67.352)	Top-5 acc 89.062 (86.122)	lr 0.00067
Train [108][1480/3239]	Time 0.472 (0.528)	Data Time 0.002 (0.026)	Loss 2.3893 (2.3574)	Entropy 0.53910 (0.53778)	Top-1 acc 66.016 (67.346)	Top-5 acc 85.156 (86.119)	lr 0.00067
Train [108][1490/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.026)	Loss 2.2773 (2.3570)	Entropy 0.53917 (0.53779)	Top-1 acc 66.797 (67.359)	Top-5 acc 88.281 (86.123)	lr 0.00067
Train [108][1500/3239]	Time 0.234 (0.526)	Data Time 0.001 (0.026)	Loss 2.3323 (2.3569)	Entropy 0.53907 (0.53779)	Top-1 acc 67.578 (67.362)	Top-5 acc 89.062 (86.125)	lr 0.00067
Train [108][1510/3239]	Time 0.225 (0.526)	Data Time 0.001 (0.026)	Loss 2.2114 (2.3572)	Entropy 0.53892 (0.53780)	Top-1 acc 68.359 (67.354)	Top-5 acc 89.062 (86.124)	lr 0.00067
Train [108][1520/3239]	Time 0.261 (0.525)	Data Time 0.001 (0.025)	Loss 2.4588 (2.3574)	Entropy 0.53862 (0.53781)	Top-1 acc 65.625 (67.348)	Top-5 acc 85.547 (86.118)	lr 0.00067
Train [108][1530/3239]	Time 0.266 (0.524)	Data Time 0.001 (0.025)	Loss 2.2677 (2.3571)	Entropy 0.53864 (0.53781)	Top-1 acc 69.531 (67.357)	Top-5 acc 88.281 (86.122)	lr 0.00067
Train [108][1540/3239]	Time 0.240 (0.524)	Data Time 0.001 (0.025)	Loss 2.2967 (2.3572)	Entropy 0.53880 (0.53782)	Top-1 acc 68.750 (67.355)	Top-5 acc 87.500 (86.123)	lr 0.00067
Train [108][1550/3239]	Time 0.243 (0.523)	Data Time 0.001 (0.025)	Loss 2.4186 (2.3572)	Entropy 0.53856 (0.53783)	Top-1 acc 67.578 (67.363)	Top-5 acc 85.938 (86.124)	lr 0.00067
Train [108][1560/3239]	Time 0.247 (0.522)	Data Time 0.001 (0.025)	Loss 2.4657 (2.3574)	Entropy 0.53848 (0.53783)	Top-1 acc 63.672 (67.355)	Top-5 acc 85.938 (86.121)	lr 0.00067
Train [108][1570/3239]	Time 0.375 (0.522)	Data Time 0.001 (0.025)	Loss 2.5317 (2.3575)	Entropy 0.53831 (0.53783)	Top-1 acc 62.109 (67.356)	Top-5 acc 80.469 (86.117)	lr 0.00066
Train [108][1580/3239]	Time 0.291 (0.521)	Data Time 0.001 (0.024)	Loss 2.4162 (2.3576)	Entropy 0.53814 (0.53784)	Top-1 acc 63.281 (67.355)	Top-5 acc 84.375 (86.111)	lr 0.00066
Train [108][1590/3239]	Time 0.239 (0.520)	Data Time 0.001 (0.024)	Loss 2.4661 (2.3578)	Entropy 0.53845 (0.53784)	Top-1 acc 67.188 (67.353)	Top-5 acc 83.203 (86.110)	lr 0.00066
Train [108][1600/3239]	Time 0.234 (0.520)	Data Time 0.001 (0.024)	Loss 2.2406 (2.3579)	Entropy 0.53877 (0.53784)	Top-1 acc 66.406 (67.349)	Top-5 acc 90.234 (86.110)	lr 0.00066
Train [108][1610/3239]	Time 0.234 (0.519)	Data Time 0.001 (0.024)	Loss 2.4134 (2.3578)	Entropy 0.53871 (0.53785)	Top-1 acc 64.453 (67.348)	Top-5 acc 84.375 (86.113)	lr 0.00066
Train [108][1620/3239]	Time 0.271 (0.519)	Data Time 0.001 (0.024)	Loss 2.4077 (2.3574)	Entropy 0.53900 (0.53786)	Top-1 acc 64.453 (67.352)	Top-5 acc 86.719 (86.123)	lr 0.00066
Train [108][1630/3239]	Time 0.261 (0.518)	Data Time 0.001 (0.024)	Loss 2.3768 (2.3572)	Entropy 0.53921 (0.53786)	Top-1 acc 67.188 (67.354)	Top-5 acc 85.156 (86.123)	lr 0.00066
Train [108][1640/3239]	Time 0.352 (0.518)	Data Time 0.001 (0.024)	Loss 2.3272 (2.3577)	Entropy 0.53890 (0.53787)	Top-1 acc 70.703 (67.339)	Top-5 acc 87.109 (86.117)	lr 0.00066
Train [108][1650/3239]	Time 0.230 (0.517)	Data Time 0.001 (0.023)	Loss 2.4188 (2.3581)	Entropy 0.53909 (0.53788)	Top-1 acc 65.625 (67.328)	Top-5 acc 83.594 (86.109)	lr 0.00066
Train [108][1660/3239]	Time 0.235 (0.517)	Data Time 0.001 (0.023)	Loss 2.4782 (2.3579)	Entropy 0.53919 (0.53789)	Top-1 acc 65.625 (67.334)	Top-5 acc 83.203 (86.111)	lr 0.00066
Train [108][1670/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.023)	Loss 2.4938 (2.3581)	Entropy 0.53926 (0.53789)	Top-1 acc 63.672 (67.321)	Top-5 acc 84.766 (86.116)	lr 0.00066
Train [108][1680/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.023)	Loss 2.4512 (2.3581)	Entropy 0.53930 (0.53790)	Top-1 acc 66.797 (67.321)	Top-5 acc 83.594 (86.113)	lr 0.00066
Train [108][1690/3239]	Time 0.238 (0.515)	Data Time 0.001 (0.023)	Loss 2.3049 (2.3586)	Entropy 0.53941 (0.53791)	Top-1 acc 71.094 (67.308)	Top-5 acc 86.719 (86.107)	lr 0.00066
Train [108][1700/3239]	Time 0.226 (0.514)	Data Time 0.001 (0.023)	Loss 3.0070 (2.3587)	Entropy 0.53904 (0.53792)	Top-1 acc 48.047 (67.306)	Top-5 acc 77.734 (86.110)	lr 0.00066
Train [108][1710/3239]	Time 0.242 (0.514)	Data Time 0.002 (0.023)	Loss 2.1640 (2.3583)	Entropy 0.53890 (0.53793)	Top-1 acc 70.703 (67.315)	Top-5 acc 90.625 (86.118)	lr 0.00066
Train [108][1720/3239]	Time 0.222 (0.513)	Data Time 0.001 (0.023)	Loss 2.1434 (2.3581)	Entropy 0.53909 (0.53793)	Top-1 acc 72.266 (67.320)	Top-5 acc 90.625 (86.125)	lr 0.00066
Train [108][1730/3239]	Time 0.399 (0.513)	Data Time 0.001 (0.023)	Loss 2.3133 (2.3581)	Entropy 0.53911 (0.53794)	Top-1 acc 68.359 (67.320)	Top-5 acc 86.719 (86.125)	lr 0.00066
Train [108][1740/3239]	Time 0.249 (0.512)	Data Time 0.001 (0.022)	Loss 2.4257 (2.3585)	Entropy 0.53908 (0.53795)	Top-1 acc 65.625 (67.315)	Top-5 acc 83.984 (86.118)	lr 0.00066
Train [108][1750/3239]	Time 0.401 (0.542)	Data Time 0.032 (0.022)	Loss 2.2519 (2.3583)	Entropy 0.53916 (0.53795)	Top-1 acc 73.047 (67.322)	Top-5 acc 86.719 (86.119)	lr 0.00066
Train [108][1760/3239]	Time 0.312 (0.542)	Data Time 0.002 (0.022)	Loss 2.4747 (2.3584)	Entropy 0.53919 (0.53796)	Top-1 acc 63.281 (67.321)	Top-5 acc 83.594 (86.116)	lr 0.00066
Train [108][1770/3239]	Time 0.250 (0.541)	Data Time 0.001 (0.022)	Loss 2.3804 (2.3584)	Entropy 0.53946 (0.53797)	Top-1 acc 65.625 (67.321)	Top-5 acc 85.938 (86.116)	lr 0.00066
Train [108][1780/3239]	Time 0.241 (0.541)	Data Time 0.001 (0.022)	Loss 2.4067 (2.3582)	Entropy 0.53944 (0.53797)	Top-1 acc 67.188 (67.324)	Top-5 acc 85.938 (86.123)	lr 0.00066
Train [108][1790/3239]	Time 0.244 (0.540)	Data Time 0.001 (0.022)	Loss 2.4635 (2.3579)	Entropy 0.53935 (0.53798)	Top-1 acc 62.891 (67.329)	Top-5 acc 83.594 (86.127)	lr 0.00066
Train [108][1800/3239]	Time 0.350 (0.539)	Data Time 0.001 (0.022)	Loss 2.3678 (2.3582)	Entropy 0.53924 (0.53799)	Top-1 acc 68.359 (67.327)	Top-5 acc 86.719 (86.121)	lr 0.00066
Train [108][1810/3239]	Time 0.298 (0.539)	Data Time 0.001 (0.022)	Loss 2.4020 (2.3583)	Entropy 0.53893 (0.53800)	Top-1 acc 64.062 (67.327)	Top-5 acc 84.766 (86.118)	lr 0.00066
Train [108][1820/3239]	Time 0.231 (0.538)	Data Time 0.001 (0.022)	Loss 2.4644 (2.3586)	Entropy 0.53888 (0.53800)	Top-1 acc 66.797 (67.318)	Top-5 acc 83.203 (86.117)	lr 0.00066
Train [108][1830/3239]	Time 0.230 (0.538)	Data Time 0.001 (0.021)	Loss 2.1375 (2.3585)	Entropy 0.53876 (0.53801)	Top-1 acc 72.656 (67.325)	Top-5 acc 90.625 (86.118)	lr 0.00066
Train [108][1840/3239]	Time 0.227 (0.537)	Data Time 0.001 (0.021)	Loss 2.1993 (2.3582)	Entropy 0.53899 (0.53801)	Top-1 acc 70.312 (67.336)	Top-5 acc 88.672 (86.123)	lr 0.00066
Train [108][1850/3239]	Time 0.236 (0.536)	Data Time 0.001 (0.021)	Loss 2.2427 (2.3579)	Entropy 0.53903 (0.53801)	Top-1 acc 69.531 (67.337)	Top-5 acc 85.547 (86.128)	lr 0.00066
Train [108][1860/3239]	Time 0.228 (0.536)	Data Time 0.001 (0.021)	Loss 2.6231 (2.3582)	Entropy 0.53916 (0.53802)	Top-1 acc 64.453 (67.336)	Top-5 acc 79.688 (86.123)	lr 0.00066
Train [108][1870/3239]	Time 0.269 (0.535)	Data Time 0.001 (0.021)	Loss 2.2171 (2.3582)	Entropy 0.53932 (0.53803)	Top-1 acc 68.359 (67.333)	Top-5 acc 89.453 (86.122)	lr 0.00066
Train [108][1880/3239]	Time 0.223 (0.535)	Data Time 0.001 (0.021)	Loss 2.2850 (2.3583)	Entropy 0.53969 (0.53803)	Top-1 acc 67.578 (67.324)	Top-5 acc 87.500 (86.122)	lr 0.00065
Train [108][1890/3239]	Time 0.316 (0.534)	Data Time 0.001 (0.021)	Loss 2.3957 (2.3582)	Entropy 0.53963 (0.53804)	Top-1 acc 64.062 (67.324)	Top-5 acc 86.328 (86.122)	lr 0.00065
Train [108][1900/3239]	Time 0.237 (0.533)	Data Time 0.001 (0.021)	Loss 2.3197 (2.3579)	Entropy 0.53985 (0.53805)	Top-1 acc 66.797 (67.329)	Top-5 acc 87.891 (86.128)	lr 0.00065
Train [108][1910/3239]	Time 0.251 (0.533)	Data Time 0.002 (0.021)	Loss 2.3624 (2.3580)	Entropy 0.53985 (0.53806)	Top-1 acc 63.672 (67.326)	Top-5 acc 86.719 (86.129)	lr 0.00065
Train [108][1920/3239]	Time 0.245 (0.532)	Data Time 0.001 (0.020)	Loss 2.3388 (2.3580)	Entropy 0.53961 (0.53807)	Top-1 acc 69.531 (67.319)	Top-5 acc 85.938 (86.129)	lr 0.00065
Train [108][1930/3239]	Time 0.243 (0.532)	Data Time 0.001 (0.020)	Loss 2.4806 (2.3583)	Entropy 0.53975 (0.53808)	Top-1 acc 64.062 (67.319)	Top-5 acc 83.203 (86.124)	lr 0.00065
Train [108][1940/3239]	Time 0.244 (0.531)	Data Time 0.001 (0.020)	Loss 2.4745 (2.3588)	Entropy 0.53949 (0.53809)	Top-1 acc 64.844 (67.313)	Top-5 acc 81.641 (86.115)	lr 0.00065
Train [108][1950/3239]	Time 0.243 (0.531)	Data Time 0.001 (0.020)	Loss 2.2315 (2.3584)	Entropy 0.53965 (0.53809)	Top-1 acc 69.531 (67.323)	Top-5 acc 87.891 (86.125)	lr 0.00065
Train [108][1960/3239]	Time 0.336 (0.530)	Data Time 0.001 (0.020)	Loss 2.3297 (2.3584)	Entropy 0.53927 (0.53810)	Top-1 acc 67.188 (67.319)	Top-5 acc 83.984 (86.123)	lr 0.00065
Train [108][1970/3239]	Time 0.274 (0.530)	Data Time 0.002 (0.020)	Loss 2.3353 (2.3584)	Entropy 0.53946 (0.53811)	Top-1 acc 67.969 (67.319)	Top-5 acc 87.500 (86.127)	lr 0.00065
Train [108][1980/3239]	Time 0.228 (0.529)	Data Time 0.001 (0.020)	Loss 2.3198 (2.3580)	Entropy 0.53919 (0.53811)	Top-1 acc 67.578 (67.327)	Top-5 acc 86.719 (86.132)	lr 0.00065
Train [108][1990/3239]	Time 0.245 (0.529)	Data Time 0.001 (0.020)	Loss 2.2979 (2.3582)	Entropy 0.53896 (0.53812)	Top-1 acc 70.703 (67.323)	Top-5 acc 87.500 (86.128)	lr 0.00065
Train [108][2000/3239]	Time 0.229 (0.528)	Data Time 0.002 (0.020)	Loss 2.2144 (2.3578)	Entropy 0.53867 (0.53812)	Top-1 acc 73.828 (67.334)	Top-5 acc 89.062 (86.132)	lr 0.00065
Train [108][2010/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.020)	Loss 2.4427 (2.3578)	Entropy 0.53855 (0.53813)	Top-1 acc 63.672 (67.333)	Top-5 acc 84.375 (86.131)	lr 0.00065
Train [108][2020/3239]	Time 0.225 (0.527)	Data Time 0.001 (0.020)	Loss 2.4618 (2.3575)	Entropy 0.53844 (0.53813)	Top-1 acc 64.062 (67.340)	Top-5 acc 82.422 (86.136)	lr 0.00065
Train [108][2030/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.019)	Loss 2.4387 (2.3577)	Entropy 0.53835 (0.53813)	Top-1 acc 63.672 (67.335)	Top-5 acc 87.109 (86.135)	lr 0.00065
Train [108][2040/3239]	Time 0.243 (0.526)	Data Time 0.001 (0.019)	Loss 2.4314 (2.3579)	Entropy 0.53855 (0.53813)	Top-1 acc 67.578 (67.335)	Top-5 acc 82.422 (86.129)	lr 0.00065
Train [108][2050/3239]	Time 0.292 (0.525)	Data Time 0.001 (0.019)	Loss 2.3313 (2.3580)	Entropy 0.53849 (0.53813)	Top-1 acc 70.703 (67.333)	Top-5 acc 89.062 (86.127)	lr 0.00065
Train [108][2060/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.019)	Loss 2.5336 (2.3581)	Entropy 0.53836 (0.53813)	Top-1 acc 64.453 (67.337)	Top-5 acc 83.594 (86.125)	lr 0.00065
Train [108][2070/3239]	Time 0.238 (0.524)	Data Time 0.001 (0.019)	Loss 2.2358 (2.3579)	Entropy 0.53826 (0.53813)	Top-1 acc 72.656 (67.349)	Top-5 acc 86.719 (86.126)	lr 0.00065
Train [108][2080/3239]	Time 0.239 (0.524)	Data Time 0.001 (0.019)	Loss 2.4262 (2.3579)	Entropy 0.53821 (0.53814)	Top-1 acc 63.281 (67.349)	Top-5 acc 85.938 (86.125)	lr 0.00065
Train [108][2090/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.019)	Loss 2.3138 (2.3579)	Entropy 0.53833 (0.53814)	Top-1 acc 67.969 (67.352)	Top-5 acc 87.109 (86.122)	lr 0.00065
Train [108][2100/3239]	Time 0.266 (0.523)	Data Time 0.001 (0.019)	Loss 2.3532 (2.3580)	Entropy 0.53826 (0.53814)	Top-1 acc 69.922 (67.354)	Top-5 acc 85.547 (86.118)	lr 0.00065
Train [108][2110/3239]	Time 0.257 (0.523)	Data Time 0.028 (0.019)	Loss 2.3823 (2.3579)	Entropy 0.53808 (0.53814)	Top-1 acc 66.797 (67.352)	Top-5 acc 85.938 (86.121)	lr 0.00065
Train [108][2120/3239]	Time 0.346 (0.522)	Data Time 0.002 (0.019)	Loss 2.1867 (2.3579)	Entropy 0.53830 (0.53814)	Top-1 acc 72.656 (67.350)	Top-5 acc 89.453 (86.122)	lr 0.00065
Train [108][2130/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.019)	Loss 2.5363 (2.3580)	Entropy 0.53832 (0.53814)	Top-1 acc 63.281 (67.344)	Top-5 acc 82.812 (86.120)	lr 0.00065
Train [108][2140/3239]	Time 0.233 (0.521)	Data Time 0.001 (0.019)	Loss 2.2630 (2.3579)	Entropy 0.53834 (0.53814)	Top-1 acc 70.312 (67.352)	Top-5 acc 87.500 (86.116)	lr 0.00065
Train [108][2150/3239]	Time 0.253 (0.521)	Data Time 0.001 (0.018)	Loss 2.4404 (2.3579)	Entropy 0.53840 (0.53814)	Top-1 acc 65.234 (67.356)	Top-5 acc 85.156 (86.115)	lr 0.00065
Train [108][2160/3239]	Time 0.231 (0.521)	Data Time 0.001 (0.018)	Loss 2.4320 (2.3580)	Entropy 0.53839 (0.53814)	Top-1 acc 67.578 (67.355)	Top-5 acc 83.594 (86.112)	lr 0.00065
Train [108][2170/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.018)	Loss 2.3972 (2.3579)	Entropy 0.53832 (0.53814)	Top-1 acc 68.359 (67.358)	Top-5 acc 83.594 (86.111)	lr 0.00065
Train [108][2180/3239]	Time 0.227 (0.520)	Data Time 0.001 (0.018)	Loss 2.5460 (2.3579)	Entropy 0.53857 (0.53814)	Top-1 acc 61.719 (67.356)	Top-5 acc 82.031 (86.109)	lr 0.00065
Train [108][2190/3239]	Time 0.322 (0.519)	Data Time 0.001 (0.018)	Loss 2.3325 (2.3579)	Entropy 0.53826 (0.53814)	Top-1 acc 67.578 (67.359)	Top-5 acc 87.109 (86.107)	lr 0.00064
Train [108][2200/3239]	Time 0.229 (0.518)	Data Time 0.001 (0.018)	Loss 2.2695 (2.3580)	Entropy 0.53820 (0.53815)	Top-1 acc 68.359 (67.357)	Top-5 acc 86.719 (86.104)	lr 0.00064
Train [108][2210/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.018)	Loss 2.2981 (2.3578)	Entropy 0.53842 (0.53815)	Top-1 acc 69.922 (67.358)	Top-5 acc 89.844 (86.108)	lr 0.00064
Train [108][2220/3239]	Time 0.221 (0.517)	Data Time 0.001 (0.018)	Loss 2.1724 (2.3578)	Entropy 0.53856 (0.53815)	Top-1 acc 71.484 (67.362)	Top-5 acc 89.062 (86.109)	lr 0.00064
Train [108][2230/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.018)	Loss 2.3313 (2.3577)	Entropy 0.53881 (0.53815)	Top-1 acc 66.797 (67.362)	Top-5 acc 87.891 (86.110)	lr 0.00064
Train [108][2240/3239]	Time 0.225 (0.516)	Data Time 0.001 (0.018)	Loss 2.2885 (2.3577)	Entropy 0.53830 (0.53815)	Top-1 acc 69.141 (67.363)	Top-5 acc 88.672 (86.113)	lr 0.00064
Train [108][2250/3239]	Time 0.223 (0.516)	Data Time 0.001 (0.018)	Loss 2.5867 (2.3577)	Entropy 0.53854 (0.53815)	Top-1 acc 62.891 (67.364)	Top-5 acc 82.031 (86.112)	lr 0.00064
Train [108][2260/3239]	Time 0.237 (0.515)	Data Time 0.001 (0.018)	Loss 2.3262 (2.3578)	Entropy 0.53845 (0.53815)	Top-1 acc 69.531 (67.363)	Top-5 acc 86.719 (86.111)	lr 0.00064
Train [108][2270/3239]	Time 0.238 (0.515)	Data Time 0.001 (0.018)	Loss 2.3147 (2.3577)	Entropy 0.53847 (0.53816)	Top-1 acc 68.359 (67.369)	Top-5 acc 85.547 (86.111)	lr 0.00064
Train [108][2280/3239]	Time 0.361 (0.514)	Data Time 0.001 (0.018)	Loss 2.4677 (2.3580)	Entropy 0.53845 (0.53816)	Top-1 acc 66.406 (67.365)	Top-5 acc 85.938 (86.106)	lr 0.00064
Train [108][2290/3239]	Time 0.229 (0.514)	Data Time 0.001 (0.017)	Loss 2.2189 (2.3578)	Entropy 0.53843 (0.53816)	Top-1 acc 70.703 (67.373)	Top-5 acc 87.109 (86.107)	lr 0.00064
Train [108][2300/3239]	Time 0.235 (0.514)	Data Time 0.001 (0.017)	Loss 2.3899 (2.3583)	Entropy 0.53864 (0.53816)	Top-1 acc 65.234 (67.361)	Top-5 acc 86.328 (86.101)	lr 0.00064
Train [108][2310/3239]	Time 0.233 (0.513)	Data Time 0.001 (0.017)	Loss 2.4286 (2.3581)	Entropy 0.53868 (0.53816)	Top-1 acc 64.844 (67.366)	Top-5 acc 86.328 (86.104)	lr 0.00064
Train [108][2320/3239]	Time 0.232 (0.513)	Data Time 0.001 (0.017)	Loss 2.3194 (2.3581)	Entropy 0.53852 (0.53816)	Top-1 acc 68.359 (67.368)	Top-5 acc 87.500 (86.106)	lr 0.00064
Train [108][2330/3239]	Time 0.222 (0.512)	Data Time 0.001 (0.017)	Loss 2.4394 (2.3580)	Entropy 0.53845 (0.53817)	Top-1 acc 65.625 (67.368)	Top-5 acc 87.109 (86.105)	lr 0.00064
Train [108][2340/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.017)	Loss 2.2059 (2.3576)	Entropy 0.53854 (0.53817)	Top-1 acc 73.828 (67.377)	Top-5 acc 88.672 (86.112)	lr 0.00064
Train [108][2350/3239]	Time 0.319 (0.511)	Data Time 0.001 (0.017)	Loss 2.6292 (2.3579)	Entropy 0.53838 (0.53817)	Top-1 acc 60.547 (67.370)	Top-5 acc 82.031 (86.106)	lr 0.00064
Train [108][2360/3239]	Time 0.222 (0.511)	Data Time 0.001 (0.017)	Loss 2.3877 (2.3578)	Entropy 0.53822 (0.53817)	Top-1 acc 67.578 (67.375)	Top-5 acc 84.766 (86.110)	lr 0.00064
Train [108][2370/3239]	Time 0.248 (0.510)	Data Time 0.001 (0.017)	Loss 2.2171 (2.3579)	Entropy 0.53835 (0.53817)	Top-1 acc 73.047 (67.373)	Top-5 acc 88.281 (86.110)	lr 0.00064
Train [108][2380/3239]	Time 0.234 (0.510)	Data Time 0.001 (0.017)	Loss 2.2186 (2.3580)	Entropy 0.53886 (0.53817)	Top-1 acc 71.094 (67.367)	Top-5 acc 89.453 (86.112)	lr 0.00064
Train [108][2390/3239]	Time 0.231 (0.509)	Data Time 0.001 (0.017)	Loss 2.4112 (2.3580)	Entropy 0.53881 (0.53817)	Top-1 acc 64.844 (67.362)	Top-5 acc 83.594 (86.112)	lr 0.00064
Train [108][2400/3239]	Time 0.264 (0.509)	Data Time 0.001 (0.017)	Loss 2.2876 (2.3583)	Entropy 0.53888 (0.53818)	Top-1 acc 71.875 (67.355)	Top-5 acc 87.891 (86.106)	lr 0.00064
Train [108][2410/3239]	Time 0.306 (0.532)	Data Time 0.004 (0.017)	Loss 2.4887 (2.3585)	Entropy 0.53891 (0.53818)	Top-1 acc 65.234 (67.344)	Top-5 acc 83.203 (86.104)	lr 0.00064
Train [108][2420/3239]	Time 0.236 (0.532)	Data Time 0.002 (0.017)	Loss 2.6875 (2.3585)	Entropy 0.53930 (0.53818)	Top-1 acc 58.984 (67.340)	Top-5 acc 81.641 (86.106)	lr 0.00064
Train [108][2430/3239]	Time 0.244 (0.531)	Data Time 0.001 (0.017)	Loss 2.3332 (2.3586)	Entropy 0.53918 (0.53819)	Top-1 acc 65.625 (67.337)	Top-5 acc 86.328 (86.104)	lr 0.00064
Train [108][2440/3239]	Time 0.340 (0.531)	Data Time 0.001 (0.016)	Loss 2.3096 (2.3585)	Entropy 0.53940 (0.53819)	Top-1 acc 69.141 (67.340)	Top-5 acc 86.719 (86.104)	lr 0.00064
Train [108][2450/3239]	Time 0.285 (0.531)	Data Time 0.002 (0.016)	Loss 2.1483 (2.3587)	Entropy 0.53962 (0.53820)	Top-1 acc 73.047 (67.338)	Top-5 acc 89.453 (86.103)	lr 0.00064
Train [108][2460/3239]	Time 0.238 (0.530)	Data Time 0.001 (0.016)	Loss 2.4517 (2.3585)	Entropy 0.53960 (0.53820)	Top-1 acc 66.016 (67.343)	Top-5 acc 85.156 (86.104)	lr 0.00064
Train [108][2470/3239]	Time 0.230 (0.530)	Data Time 0.001 (0.016)	Loss 2.1958 (2.3584)	Entropy 0.53995 (0.53821)	Top-1 acc 70.703 (67.346)	Top-5 acc 88.672 (86.108)	lr 0.00064
Train [108][2480/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.016)	Loss 2.1710 (2.3584)	Entropy 0.53998 (0.53822)	Top-1 acc 71.484 (67.346)	Top-5 acc 89.844 (86.106)	lr 0.00064
Train [108][2490/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.016)	Loss 2.1878 (2.3585)	Entropy 0.54021 (0.53822)	Top-1 acc 67.578 (67.343)	Top-5 acc 90.234 (86.103)	lr 0.00064
Train [108][2500/3239]	Time 0.222 (0.528)	Data Time 0.001 (0.016)	Loss 2.4279 (2.3581)	Entropy 0.54036 (0.53823)	Top-1 acc 67.578 (67.351)	Top-5 acc 85.156 (86.110)	lr 0.00064
Train [108][2510/3239]	Time 0.318 (0.528)	Data Time 0.001 (0.016)	Loss 2.3635 (2.3579)	Entropy 0.54001 (0.53824)	Top-1 acc 66.016 (67.353)	Top-5 acc 85.547 (86.113)	lr 0.00063
Train [108][2520/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.016)	Loss 2.4605 (2.3581)	Entropy 0.54009 (0.53825)	Top-1 acc 64.062 (67.346)	Top-5 acc 84.375 (86.108)	lr 0.00063
Train [108][2530/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.016)	Loss 2.5482 (2.3582)	Entropy 0.54021 (0.53825)	Top-1 acc 64.844 (67.343)	Top-5 acc 80.859 (86.108)	lr 0.00063
Train [108][2540/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.016)	Loss 2.2590 (2.3581)	Entropy 0.54050 (0.53826)	Top-1 acc 69.531 (67.348)	Top-5 acc 88.672 (86.111)	lr 0.00063
Train [108][2550/3239]	Time 0.230 (0.526)	Data Time 0.001 (0.016)	Loss 2.2475 (2.3582)	Entropy 0.54073 (0.53827)	Top-1 acc 69.922 (67.346)	Top-5 acc 87.500 (86.110)	lr 0.00063
Train [108][2560/3239]	Time 0.265 (0.526)	Data Time 0.001 (0.016)	Loss 2.3063 (2.3578)	Entropy 0.54108 (0.53828)	Top-1 acc 64.844 (67.353)	Top-5 acc 86.719 (86.117)	lr 0.00063
Train [108][2570/3239]	Time 0.223 (0.525)	Data Time 0.001 (0.016)	Loss 2.3530 (2.3582)	Entropy 0.54134 (0.53829)	Top-1 acc 69.141 (67.346)	Top-5 acc 87.109 (86.113)	lr 0.00063
Train [108][2580/3239]	Time 0.267 (0.525)	Data Time 0.001 (0.016)	Loss 2.3305 (2.3579)	Entropy 0.54145 (0.53830)	Top-1 acc 69.141 (67.349)	Top-5 acc 85.156 (86.114)	lr 0.00063
Train [108][2590/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.016)	Loss 2.3941 (2.3580)	Entropy 0.54085 (0.53831)	Top-1 acc 65.234 (67.352)	Top-5 acc 86.719 (86.114)	lr 0.00063
Train [108][2600/3239]	Time 0.252 (0.524)	Data Time 0.001 (0.016)	Loss 2.3160 (2.3577)	Entropy 0.54086 (0.53832)	Top-1 acc 68.359 (67.360)	Top-5 acc 89.453 (86.121)	lr 0.00063
Train [108][2610/3239]	Time 0.225 (0.524)	Data Time 0.001 (0.016)	Loss 2.3241 (2.3575)	Entropy 0.54090 (0.53833)	Top-1 acc 69.141 (67.362)	Top-5 acc 86.328 (86.122)	lr 0.00063
Train [108][2620/3239]	Time 0.296 (0.523)	Data Time 0.001 (0.015)	Loss 2.2462 (2.3576)	Entropy 0.54100 (0.53834)	Top-1 acc 67.188 (67.359)	Top-5 acc 88.281 (86.124)	lr 0.00063
Train [108][2630/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.015)	Loss 2.2657 (2.3577)	Entropy 0.54116 (0.53835)	Top-1 acc 69.531 (67.356)	Top-5 acc 88.281 (86.122)	lr 0.00063
Train [108][2640/3239]	Time 0.231 (0.522)	Data Time 0.001 (0.015)	Loss 2.4813 (2.3576)	Entropy 0.54099 (0.53836)	Top-1 acc 64.453 (67.361)	Top-5 acc 84.375 (86.123)	lr 0.00063
Train [108][2650/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.015)	Loss 2.1663 (2.3577)	Entropy 0.54110 (0.53838)	Top-1 acc 75.000 (67.363)	Top-5 acc 90.625 (86.122)	lr 0.00063
Train [108][2660/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.015)	Loss 2.3764 (2.3577)	Entropy 0.54091 (0.53839)	Top-1 acc 64.453 (67.358)	Top-5 acc 89.844 (86.124)	lr 0.00063
Train [108][2670/3239]	Time 0.320 (0.521)	Data Time 0.001 (0.015)	Loss 2.2837 (2.3576)	Entropy 0.54092 (0.53840)	Top-1 acc 69.922 (67.361)	Top-5 acc 88.281 (86.127)	lr 0.00063
Train [108][2680/3239]	Time 0.226 (0.521)	Data Time 0.001 (0.015)	Loss 2.3742 (2.3576)	Entropy 0.54085 (0.53840)	Top-1 acc 67.578 (67.366)	Top-5 acc 86.719 (86.127)	lr 0.00063
Train [108][2690/3239]	Time 0.254 (0.521)	Data Time 0.001 (0.015)	Loss 2.3041 (2.3574)	Entropy 0.54097 (0.53841)	Top-1 acc 68.359 (67.371)	Top-5 acc 86.328 (86.130)	lr 0.00063
Train [108][2700/3239]	Time 0.219 (0.520)	Data Time 0.001 (0.015)	Loss 2.4749 (2.3574)	Entropy 0.54117 (0.53842)	Top-1 acc 67.188 (67.370)	Top-5 acc 84.375 (86.130)	lr 0.00063
Train [108][2710/3239]	Time 0.231 (0.520)	Data Time 0.001 (0.015)	Loss 2.3803 (2.3575)	Entropy 0.54147 (0.53843)	Top-1 acc 61.719 (67.367)	Top-5 acc 88.281 (86.129)	lr 0.00063
Train [108][2720/3239]	Time 0.236 (0.519)	Data Time 0.001 (0.015)	Loss 2.4151 (2.3573)	Entropy 0.54158 (0.53845)	Top-1 acc 64.453 (67.370)	Top-5 acc 86.328 (86.133)	lr 0.00063
Train [108][2730/3239]	Time 0.231 (0.519)	Data Time 0.001 (0.015)	Loss 2.2613 (2.3573)	Entropy 0.54189 (0.53846)	Top-1 acc 69.922 (67.369)	Top-5 acc 89.453 (86.135)	lr 0.00063
Train [108][2740/3239]	Time 0.320 (0.519)	Data Time 0.001 (0.015)	Loss 2.3953 (2.3573)	Entropy 0.54120 (0.53847)	Top-1 acc 64.062 (67.362)	Top-5 acc 85.156 (86.134)	lr 0.00063
Train [108][2750/3239]	Time 0.239 (0.518)	Data Time 0.001 (0.015)	Loss 2.3992 (2.3574)	Entropy 0.54131 (0.53848)	Top-1 acc 67.578 (67.361)	Top-5 acc 87.109 (86.135)	lr 0.00063
Train [108][2760/3239]	Time 0.235 (0.518)	Data Time 0.001 (0.015)	Loss 2.1978 (2.3574)	Entropy 0.54120 (0.53849)	Top-1 acc 71.484 (67.359)	Top-5 acc 89.453 (86.132)	lr 0.00063
Train [108][2770/3239]	Time 0.230 (0.517)	Data Time 0.001 (0.015)	Loss 2.6231 (2.3576)	Entropy 0.54066 (0.53850)	Top-1 acc 62.109 (67.356)	Top-5 acc 80.078 (86.129)	lr 0.00063
Train [108][2780/3239]	Time 0.251 (0.517)	Data Time 0.001 (0.015)	Loss 2.2649 (2.3575)	Entropy 0.54075 (0.53851)	Top-1 acc 68.359 (67.357)	Top-5 acc 87.891 (86.129)	lr 0.00063
Train [108][2790/3239]	Time 0.230 (0.517)	Data Time 0.001 (0.015)	Loss 2.3444 (2.3576)	Entropy 0.54082 (0.53851)	Top-1 acc 69.922 (67.355)	Top-5 acc 86.328 (86.128)	lr 0.00063
Train [108][2800/3239]	Time 0.233 (0.516)	Data Time 0.001 (0.015)	Loss 2.1717 (2.3575)	Entropy 0.54100 (0.53852)	Top-1 acc 73.438 (67.357)	Top-5 acc 89.062 (86.128)	lr 0.00063
Train [108][2810/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.015)	Loss 2.5895 (2.3575)	Entropy 0.54121 (0.53853)	Top-1 acc 62.500 (67.353)	Top-5 acc 84.766 (86.130)	lr 0.00063
Train [108][2820/3239]	Time 0.230 (0.516)	Data Time 0.001 (0.014)	Loss 2.2563 (2.3575)	Entropy 0.54115 (0.53854)	Top-1 acc 70.703 (67.350)	Top-5 acc 86.328 (86.132)	lr 0.00062
Train [108][2830/3239]	Time 0.320 (0.515)	Data Time 0.001 (0.014)	Loss 2.4136 (2.3576)	Entropy 0.54121 (0.53855)	Top-1 acc 64.062 (67.344)	Top-5 acc 84.375 (86.130)	lr 0.00062
Train [108][2840/3239]	Time 0.237 (0.515)	Data Time 0.001 (0.014)	Loss 2.4702 (2.3581)	Entropy 0.54130 (0.53856)	Top-1 acc 65.234 (67.332)	Top-5 acc 83.594 (86.120)	lr 0.00062
Train [108][2850/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.014)	Loss 2.2857 (2.3580)	Entropy 0.54096 (0.53857)	Top-1 acc 64.453 (67.332)	Top-5 acc 89.453 (86.123)	lr 0.00062
Train [108][2860/3239]	Time 0.252 (0.514)	Data Time 0.001 (0.014)	Loss 2.2678 (2.3580)	Entropy 0.54117 (0.53858)	Top-1 acc 70.703 (67.329)	Top-5 acc 85.547 (86.121)	lr 0.00062
Train [108][2870/3239]	Time 0.230 (0.514)	Data Time 0.001 (0.014)	Loss 2.1929 (2.3581)	Entropy 0.54119 (0.53859)	Top-1 acc 71.484 (67.327)	Top-5 acc 89.453 (86.120)	lr 0.00062
Train [108][2880/3239]	Time 0.259 (0.513)	Data Time 0.001 (0.014)	Loss 2.3503 (2.3581)	Entropy 0.54133 (0.53860)	Top-1 acc 67.578 (67.329)	Top-5 acc 85.547 (86.120)	lr 0.00062
Train [108][2890/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.014)	Loss 2.2534 (2.3581)	Entropy 0.54175 (0.53861)	Top-1 acc 69.922 (67.328)	Top-5 acc 87.109 (86.117)	lr 0.00062
Train [108][2900/3239]	Time 0.315 (0.513)	Data Time 0.001 (0.014)	Loss 2.6740 (2.3582)	Entropy 0.54158 (0.53862)	Top-1 acc 59.375 (67.327)	Top-5 acc 81.641 (86.117)	lr 0.00062
Train [108][2910/3239]	Time 0.232 (0.512)	Data Time 0.001 (0.014)	Loss 2.3271 (2.3582)	Entropy 0.54211 (0.53863)	Top-1 acc 70.312 (67.330)	Top-5 acc 87.891 (86.116)	lr 0.00062
Train [108][2920/3239]	Time 0.245 (0.512)	Data Time 0.001 (0.014)	Loss 2.3935 (2.3582)	Entropy 0.54186 (0.53864)	Top-1 acc 63.672 (67.328)	Top-5 acc 86.719 (86.117)	lr 0.00062
Train [108][2930/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.014)	Loss 2.2698 (2.3581)	Entropy 0.54178 (0.53865)	Top-1 acc 67.969 (67.332)	Top-5 acc 87.109 (86.118)	lr 0.00062
Train [108][2940/3239]	Time 0.283 (0.511)	Data Time 0.001 (0.014)	Loss 2.2513 (2.3582)	Entropy 0.54143 (0.53866)	Top-1 acc 71.484 (67.330)	Top-5 acc 87.109 (86.115)	lr 0.00062
Train [108][2950/3239]	Time 0.242 (0.511)	Data Time 0.001 (0.014)	Loss 2.2268 (2.3580)	Entropy 0.54148 (0.53867)	Top-1 acc 69.922 (67.332)	Top-5 acc 88.281 (86.118)	lr 0.00062
Train [108][2960/3239]	Time 0.240 (0.511)	Data Time 0.001 (0.014)	Loss 2.4387 (2.3580)	Entropy 0.54196 (0.53868)	Top-1 acc 64.453 (67.333)	Top-5 acc 82.812 (86.115)	lr 0.00062
Train [108][2970/3239]	Time 0.244 (0.511)	Data Time 0.001 (0.014)	Loss 2.5626 (2.3581)	Entropy 0.54208 (0.53869)	Top-1 acc 61.328 (67.333)	Top-5 acc 83.203 (86.114)	lr 0.00062
Train [108][2980/3239]	Time 0.234 (0.510)	Data Time 0.001 (0.014)	Loss 2.0617 (2.3579)	Entropy 0.54234 (0.53870)	Top-1 acc 75.000 (67.337)	Top-5 acc 91.406 (86.120)	lr 0.00062
Train [108][2990/3239]	Time 0.455 (0.510)	Data Time 0.001 (0.014)	Loss 2.4680 (2.3579)	Entropy 0.54266 (0.53872)	Top-1 acc 67.578 (67.337)	Top-5 acc 84.766 (86.120)	lr 0.00062
Train [108][3000/3239]	Time 0.229 (0.510)	Data Time 0.001 (0.014)	Loss 2.1661 (2.3579)	Entropy 0.54251 (0.53873)	Top-1 acc 69.531 (67.335)	Top-5 acc 91.406 (86.122)	lr 0.00062
Train [108][3010/3239]	Time 0.233 (0.509)	Data Time 0.001 (0.014)	Loss 2.4178 (2.3584)	Entropy 0.54248 (0.53874)	Top-1 acc 62.500 (67.322)	Top-5 acc 85.938 (86.115)	lr 0.00062
Train [108][3020/3239]	Time 0.228 (0.509)	Data Time 0.001 (0.014)	Loss 2.2678 (2.3584)	Entropy 0.54228 (0.53875)	Top-1 acc 70.703 (67.324)	Top-5 acc 87.109 (86.115)	lr 0.00062
Train [108][3030/3239]	Time 0.230 (0.509)	Data Time 0.001 (0.014)	Loss 2.1625 (2.3583)	Entropy 0.54229 (0.53876)	Top-1 acc 69.531 (67.323)	Top-5 acc 88.281 (86.116)	lr 0.00062
Train [108][3040/3239]	Time 0.277 (0.508)	Data Time 0.001 (0.014)	Loss 2.3495 (2.3582)	Entropy 0.54267 (0.53878)	Top-1 acc 68.359 (67.325)	Top-5 acc 85.547 (86.119)	lr 0.00062
Train [108][3050/3239]	Time 0.260 (0.508)	Data Time 0.001 (0.013)	Loss 2.4109 (2.3581)	Entropy 0.54261 (0.53879)	Top-1 acc 68.359 (67.331)	Top-5 acc 83.984 (86.122)	lr 0.00062
Train [108][3060/3239]	Time 0.564 (0.526)	Data Time 0.005 (0.013)	Loss 2.5340 (2.3582)	Entropy 0.54250 (0.53880)	Top-1 acc 60.156 (67.327)	Top-5 acc 81.641 (86.120)	lr 0.00062
Train [108][3070/3239]	Time 0.296 (0.525)	Data Time 0.002 (0.013)	Loss 2.2826 (2.3583)	Entropy 0.54245 (0.53881)	Top-1 acc 67.578 (67.324)	Top-5 acc 86.328 (86.116)	lr 0.00062
Train [108][3080/3239]	Time 0.256 (0.525)	Data Time 0.002 (0.013)	Loss 2.3144 (2.3582)	Entropy 0.54276 (0.53883)	Top-1 acc 67.969 (67.327)	Top-5 acc 87.891 (86.118)	lr 0.00062
Train [108][3090/3239]	Time 0.236 (0.525)	Data Time 0.001 (0.013)	Loss 2.3891 (2.3582)	Entropy 0.54293 (0.53884)	Top-1 acc 66.797 (67.329)	Top-5 acc 83.203 (86.118)	lr 0.00062
Train [108][3100/3239]	Time 0.235 (0.524)	Data Time 0.001 (0.013)	Loss 2.5183 (2.3582)	Entropy 0.54291 (0.53885)	Top-1 acc 64.062 (67.331)	Top-5 acc 79.297 (86.117)	lr 0.00062
Train [108][3110/3239]	Time 0.271 (0.524)	Data Time 0.001 (0.013)	Loss 2.2325 (2.3580)	Entropy 0.54325 (0.53887)	Top-1 acc 70.312 (67.336)	Top-5 acc 88.672 (86.122)	lr 0.00062
Train [108][3120/3239]	Time 0.225 (0.524)	Data Time 0.001 (0.013)	Loss 2.4118 (2.3579)	Entropy 0.54306 (0.53888)	Top-1 acc 65.234 (67.337)	Top-5 acc 84.375 (86.122)	lr 0.00062
Train [108][3130/3239]	Time 0.260 (0.523)	Data Time 0.001 (0.013)	Loss 2.4249 (2.3578)	Entropy 0.54322 (0.53889)	Top-1 acc 65.625 (67.339)	Top-5 acc 84.375 (86.125)	lr 0.00062
Train [108][3140/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.013)	Loss 2.0000 (2.3576)	Entropy 0.54348 (0.53891)	Top-1 acc 76.172 (67.344)	Top-5 acc 91.797 (86.130)	lr 0.00061
Train [108][3150/3239]	Time 0.321 (0.523)	Data Time 0.001 (0.013)	Loss 2.3158 (2.3577)	Entropy 0.54344 (0.53892)	Top-1 acc 66.406 (67.341)	Top-5 acc 87.500 (86.128)	lr 0.00061
Train [108][3160/3239]	Time 0.261 (0.522)	Data Time 0.001 (0.013)	Loss 2.4569 (2.3577)	Entropy 0.54372 (0.53894)	Top-1 acc 63.672 (67.345)	Top-5 acc 86.719 (86.129)	lr 0.00061
Train [108][3170/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.013)	Loss 2.3542 (2.3576)	Entropy 0.54354 (0.53895)	Top-1 acc 68.359 (67.350)	Top-5 acc 86.328 (86.131)	lr 0.00061
Train [108][3180/3239]	Time 0.259 (0.522)	Data Time 0.000 (0.013)	Loss 2.2801 (2.3577)	Entropy 0.54354 (0.53896)	Top-1 acc 68.750 (67.345)	Top-5 acc 86.328 (86.128)	lr 0.00061
Train [108][3190/3239]	Time 0.231 (0.521)	Data Time 0.000 (0.013)	Loss 2.3324 (2.3577)	Entropy 0.54359 (0.53898)	Top-1 acc 67.188 (67.344)	Top-5 acc 85.156 (86.124)	lr 0.00061
Train [108][3200/3239]	Time 0.236 (0.521)	Data Time 0.000 (0.013)	Loss 2.3000 (2.3577)	Entropy 0.54378 (0.53899)	Top-1 acc 66.797 (67.342)	Top-5 acc 88.281 (86.125)	lr 0.00061
Train [108][3210/3239]	Time 0.228 (0.521)	Data Time 0.000 (0.013)	Loss 2.1191 (2.3576)	Entropy 0.54360 (0.53901)	Top-1 acc 75.391 (67.346)	Top-5 acc 91.406 (86.127)	lr 0.00061
Train [108][3220/3239]	Time 0.308 (0.520)	Data Time 0.000 (0.013)	Loss 2.3284 (2.3578)	Entropy 0.54362 (0.53902)	Top-1 acc 66.406 (67.340)	Top-5 acc 85.938 (86.126)	lr 0.00061
Train [108][3230/3239]	Time 0.237 (0.520)	Data Time 0.000 (0.013)	Loss 2.2848 (2.3578)	Entropy 0.54350 (0.53904)	Top-1 acc 70.703 (67.342)	Top-5 acc 87.109 (86.126)	lr 0.00061
Train [108][3239/3239]	Time 0.835 (0.519)	Data Time 0.000 (0.013)	Loss 2.5972 (2.3577)	Entropy 0.54364 (0.53905)	Top-1 acc 60.494 (67.345)	Top-5 acc 80.247 (86.129)	lr 0.00061
==========Valid [108/120]	loss 1.178	top-1 acc 72.772 (72.893)	top-5 acc 90.558	Train top-1 67.345	top-5 86.129	Entropy 0.54364	Latency-None: 0.000ms	Flops: 539.00M
Train [109][0/3239]	Time 39.297 (39.297)	Data Time 37.185 (37.185)	Loss 2.5088 (2.5088)	Entropy 0.54367 (0.54367)	Top-1 acc 61.719 (61.719)	Top-5 acc 83.594 (83.594)	lr 0.00061
Train [109][10/3239]	Time 0.235 (4.062)	Data Time 0.001 (3.382)	Loss 2.4533 (2.3613)	Entropy 0.54362 (0.54362)	Top-1 acc 58.984 (66.335)	Top-5 acc 85.938 (86.328)	lr 0.00061
Train [109][20/3239]	Time 0.242 (2.322)	Data Time 0.001 (1.772)	Loss 2.3096 (2.3269)	Entropy 0.54339 (0.54362)	Top-1 acc 68.359 (67.374)	Top-5 acc 87.891 (86.626)	lr 0.00061
Train [109][30/3239]	Time 0.274 (1.723)	Data Time 0.001 (1.201)	Loss 2.3101 (2.3341)	Entropy 0.54350 (0.54358)	Top-1 acc 68.750 (67.616)	Top-5 acc 86.719 (86.353)	lr 0.00061
Train [109][40/3239]	Time 0.304 (1.457)	Data Time 0.002 (0.909)	Loss 2.4294 (2.3366)	Entropy 0.54312 (0.54353)	Top-1 acc 65.625 (67.397)	Top-5 acc 83.984 (86.433)	lr 0.00061
Train [109][50/3239]	Time 0.360 (1.269)	Data Time 0.001 (0.731)	Loss 2.3230 (2.3330)	Entropy 0.54341 (0.54348)	Top-1 acc 70.312 (67.394)	Top-5 acc 87.109 (86.665)	lr 0.00061
Train [109][60/3239]	Time 0.232 (1.133)	Data Time 0.001 (0.611)	Loss 2.2625 (2.3282)	Entropy 0.54367 (0.54349)	Top-1 acc 69.141 (67.565)	Top-5 acc 88.672 (86.648)	lr 0.00061
Train [109][70/3239]	Time 0.236 (1.033)	Data Time 0.001 (0.525)	Loss 2.3577 (2.3309)	Entropy 0.54351 (0.54350)	Top-1 acc 66.797 (67.485)	Top-5 acc 85.938 (86.625)	lr 0.00061
Train [109][80/3239]	Time 0.245 (0.960)	Data Time 0.001 (0.461)	Loss 2.1859 (2.3352)	Entropy 0.54324 (0.54350)	Top-1 acc 69.141 (67.578)	Top-5 acc 91.016 (86.569)	lr 0.00061
Train [109][90/3239]	Time 0.238 (0.901)	Data Time 0.001 (0.410)	Loss 2.3835 (2.3372)	Entropy 0.54322 (0.54347)	Top-1 acc 67.578 (67.621)	Top-5 acc 84.766 (86.538)	lr 0.00061
Train [109][100/3239]	Time 0.241 (0.854)	Data Time 0.001 (0.370)	Loss 2.3849 (2.3496)	Entropy 0.54311 (0.54344)	Top-1 acc 63.672 (67.365)	Top-5 acc 87.500 (86.378)	lr 0.00061
Train [109][110/3239]	Time 0.228 (0.816)	Data Time 0.001 (0.337)	Loss 2.4096 (2.3548)	Entropy 0.54255 (0.54341)	Top-1 acc 65.234 (67.173)	Top-5 acc 85.938 (86.307)	lr 0.00061
Train [109][120/3239]	Time 0.316 (0.782)	Data Time 0.001 (0.309)	Loss 2.2571 (2.3542)	Entropy 0.54270 (0.54334)	Top-1 acc 73.047 (67.204)	Top-5 acc 89.062 (86.364)	lr 0.00061
Train [109][130/3239]	Time 0.238 (0.752)	Data Time 0.002 (0.286)	Loss 2.5010 (2.3634)	Entropy 0.54268 (0.54329)	Top-1 acc 64.844 (67.012)	Top-5 acc 83.594 (86.230)	lr 0.00061
Train [109][140/3239]	Time 0.232 (0.731)	Data Time 0.001 (0.265)	Loss 2.3364 (2.3584)	Entropy 0.54251 (0.54325)	Top-1 acc 70.312 (67.168)	Top-5 acc 85.547 (86.256)	lr 0.00061
Train [109][150/3239]	Time 0.245 (0.712)	Data Time 0.002 (0.248)	Loss 2.5844 (2.3542)	Entropy 0.54234 (0.54319)	Top-1 acc 58.984 (67.224)	Top-5 acc 82.031 (86.300)	lr 0.00061
Train [109][160/3239]	Time 0.242 (0.694)	Data Time 0.001 (0.233)	Loss 2.4455 (2.3575)	Entropy 0.54243 (0.54314)	Top-1 acc 67.188 (67.226)	Top-5 acc 84.766 (86.265)	lr 0.00061
Train [109][170/3239]	Time 0.270 (0.679)	Data Time 0.001 (0.219)	Loss 2.4767 (2.3565)	Entropy 0.54237 (0.54310)	Top-1 acc 60.547 (67.270)	Top-5 acc 83.984 (86.280)	lr 0.00061
Train [109][180/3239]	Time 0.247 (0.664)	Data Time 0.002 (0.207)	Loss 2.7150 (2.3572)	Entropy 0.54240 (0.54306)	Top-1 acc 64.453 (67.267)	Top-5 acc 79.297 (86.253)	lr 0.00061
Train [109][190/3239]	Time 0.240 (0.653)	Data Time 0.001 (0.196)	Loss 2.6192 (2.3557)	Entropy 0.54230 (0.54302)	Top-1 acc 62.500 (67.310)	Top-5 acc 83.594 (86.302)	lr 0.00061
Train [109][200/3239]	Time 0.238 (0.641)	Data Time 0.001 (0.187)	Loss 2.1497 (2.3569)	Entropy 0.54217 (0.54298)	Top-1 acc 72.266 (67.308)	Top-5 acc 91.406 (86.276)	lr 0.00061
Train [109][210/3239]	Time 0.360 (0.631)	Data Time 0.001 (0.178)	Loss 2.3855 (2.3568)	Entropy 0.54204 (0.54294)	Top-1 acc 65.234 (67.323)	Top-5 acc 86.328 (86.265)	lr 0.00061
Train [109][220/3239]	Time 0.229 (0.620)	Data Time 0.001 (0.170)	Loss 2.3612 (2.3543)	Entropy 0.54225 (0.54291)	Top-1 acc 65.234 (67.366)	Top-5 acc 85.938 (86.291)	lr 0.00060
Train [109][230/3239]	Time 0.227 (0.612)	Data Time 0.001 (0.163)	Loss 2.2566 (2.3518)	Entropy 0.54222 (0.54287)	Top-1 acc 66.016 (67.411)	Top-5 acc 90.234 (86.352)	lr 0.00060
Train [109][240/3239]	Time 0.259 (0.604)	Data Time 0.002 (0.156)	Loss 2.4636 (2.3523)	Entropy 0.54210 (0.54285)	Top-1 acc 62.109 (67.408)	Top-5 acc 82.422 (86.343)	lr 0.00060
Train [109][250/3239]	Time 0.253 (0.597)	Data Time 0.001 (0.150)	Loss 2.3028 (2.3520)	Entropy 0.54217 (0.54282)	Top-1 acc 69.531 (67.465)	Top-5 acc 85.547 (86.317)	lr 0.00060
Train [109][260/3239]	Time 0.224 (0.591)	Data Time 0.001 (0.144)	Loss 2.3901 (2.3536)	Entropy 0.54229 (0.54280)	Top-1 acc 67.188 (67.409)	Top-5 acc 84.375 (86.301)	lr 0.00060
Train [109][270/3239]	Time 0.224 (0.584)	Data Time 0.001 (0.139)	Loss 2.3935 (2.3548)	Entropy 0.54234 (0.54278)	Top-1 acc 65.234 (67.404)	Top-5 acc 84.766 (86.298)	lr 0.00060
Train [109][280/3239]	Time 0.317 (0.578)	Data Time 0.001 (0.134)	Loss 2.3513 (2.3556)	Entropy 0.54277 (0.54277)	Top-1 acc 67.969 (67.360)	Top-5 acc 87.500 (86.271)	lr 0.00060
Train [109][290/3239]	Time 0.236 (0.571)	Data Time 0.001 (0.129)	Loss 2.3038 (2.3562)	Entropy 0.54282 (0.54277)	Top-1 acc 67.578 (67.292)	Top-5 acc 87.500 (86.257)	lr 0.00060
Train [109][300/3239]	Time 0.232 (0.565)	Data Time 0.001 (0.125)	Loss 2.2322 (2.3538)	Entropy 0.54256 (0.54277)	Top-1 acc 67.188 (67.334)	Top-5 acc 88.672 (86.293)	lr 0.00060
Train [109][310/3239]	Time 0.231 (0.560)	Data Time 0.001 (0.121)	Loss 2.2262 (2.3537)	Entropy 0.54282 (0.54277)	Top-1 acc 71.094 (67.336)	Top-5 acc 87.500 (86.279)	lr 0.00060
Train [109][320/3239]	Time 0.248 (0.555)	Data Time 0.001 (0.117)	Loss 2.3218 (2.3539)	Entropy 0.54268 (0.54277)	Top-1 acc 66.797 (67.329)	Top-5 acc 87.500 (86.284)	lr 0.00060
Train [109][330/3239]	Time 0.265 (0.551)	Data Time 0.001 (0.114)	Loss 2.2688 (2.3531)	Entropy 0.54298 (0.54277)	Top-1 acc 72.266 (67.347)	Top-5 acc 87.500 (86.318)	lr 0.00060
Train [109][340/3239]	Time 0.237 (0.548)	Data Time 0.001 (0.111)	Loss 2.1509 (2.3526)	Entropy 0.54314 (0.54278)	Top-1 acc 71.875 (67.368)	Top-5 acc 88.672 (86.326)	lr 0.00060
Train [109][350/3239]	Time 0.232 (0.545)	Data Time 0.001 (0.108)	Loss 2.3690 (2.3534)	Entropy 0.54276 (0.54278)	Top-1 acc 70.312 (67.344)	Top-5 acc 83.594 (86.290)	lr 0.00060
Train [109][360/3239]	Time 0.269 (0.541)	Data Time 0.001 (0.105)	Loss 2.2963 (2.3538)	Entropy 0.54269 (0.54278)	Top-1 acc 68.359 (67.339)	Top-5 acc 87.109 (86.270)	lr 0.00060
Train [109][370/3239]	Time 0.244 (0.537)	Data Time 0.001 (0.102)	Loss 2.4089 (2.3551)	Entropy 0.54248 (0.54278)	Top-1 acc 64.844 (67.277)	Top-5 acc 83.984 (86.255)	lr 0.00060
Train [109][380/3239]	Time 0.225 (0.534)	Data Time 0.001 (0.099)	Loss 2.3677 (2.3561)	Entropy 0.54221 (0.54277)	Top-1 acc 67.188 (67.259)	Top-5 acc 83.594 (86.207)	lr 0.00060
Train [109][390/3239]	Time 0.248 (0.530)	Data Time 0.009 (0.097)	Loss 2.3756 (2.3560)	Entropy 0.54220 (0.54275)	Top-1 acc 67.969 (67.261)	Top-5 acc 84.766 (86.205)	lr 0.00060
Train [109][400/3239]	Time 0.262 (0.527)	Data Time 0.001 (0.094)	Loss 2.3359 (2.3572)	Entropy 0.54226 (0.54274)	Top-1 acc 67.188 (67.234)	Top-5 acc 85.938 (86.193)	lr 0.00060
Train [109][410/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.092)	Loss 2.5439 (2.3559)	Entropy 0.54201 (0.54272)	Top-1 acc 62.109 (67.256)	Top-5 acc 81.250 (86.210)	lr 0.00060
Train [109][420/3239]	Time 0.231 (0.522)	Data Time 0.001 (0.090)	Loss 2.4660 (2.3583)	Entropy 0.54158 (0.54270)	Top-1 acc 66.797 (67.200)	Top-5 acc 85.547 (86.175)	lr 0.00060
Train [109][430/3239]	Time 0.228 (0.519)	Data Time 0.001 (0.088)	Loss 2.3156 (2.3572)	Entropy 0.54159 (0.54268)	Top-1 acc 68.750 (67.231)	Top-5 acc 85.547 (86.187)	lr 0.00060
Train [109][440/3239]	Time 0.336 (0.517)	Data Time 0.001 (0.086)	Loss 2.1616 (2.3555)	Entropy 0.54149 (0.54265)	Top-1 acc 73.828 (67.267)	Top-5 acc 87.500 (86.204)	lr 0.00060
Train [109][450/3239]	Time 0.237 (0.514)	Data Time 0.001 (0.084)	Loss 2.2552 (2.3555)	Entropy 0.54174 (0.54262)	Top-1 acc 70.312 (67.262)	Top-5 acc 85.938 (86.202)	lr 0.00060
Train [109][460/3239]	Time 0.243 (0.512)	Data Time 0.001 (0.082)	Loss 2.3843 (2.3565)	Entropy 0.54176 (0.54261)	Top-1 acc 66.797 (67.232)	Top-5 acc 84.766 (86.187)	lr 0.00060
Train [109][470/3239]	Time 0.250 (0.511)	Data Time 0.001 (0.081)	Loss 2.3213 (2.3569)	Entropy 0.54170 (0.54259)	Top-1 acc 66.797 (67.222)	Top-5 acc 89.844 (86.194)	lr 0.00060
Train [109][480/3239]	Time 0.238 (0.617)	Data Time 0.002 (0.079)	Loss 2.2539 (2.3561)	Entropy 0.54187 (0.54257)	Top-1 acc 72.656 (67.238)	Top-5 acc 86.328 (86.195)	lr 0.00060
Train [109][490/3239]	Time 0.220 (0.613)	Data Time 0.002 (0.077)	Loss 2.2427 (2.3569)	Entropy 0.54174 (0.54256)	Top-1 acc 70.703 (67.238)	Top-5 acc 88.672 (86.164)	lr 0.00060
Train [109][500/3239]	Time 0.236 (0.609)	Data Time 0.001 (0.076)	Loss 2.4480 (2.3581)	Entropy 0.54165 (0.54254)	Top-1 acc 66.797 (67.215)	Top-5 acc 83.984 (86.144)	lr 0.00060
Train [109][510/3239]	Time 0.235 (0.605)	Data Time 0.001 (0.074)	Loss 2.3151 (2.3573)	Entropy 0.54188 (0.54252)	Top-1 acc 69.531 (67.256)	Top-5 acc 89.453 (86.162)	lr 0.00060
Train [109][520/3239]	Time 0.268 (0.602)	Data Time 0.001 (0.073)	Loss 2.5081 (2.3571)	Entropy 0.54190 (0.54251)	Top-1 acc 66.406 (67.274)	Top-5 acc 82.422 (86.166)	lr 0.00060
Train [109][530/3239]	Time 0.342 (0.599)	Data Time 0.002 (0.072)	Loss 2.2821 (2.3570)	Entropy 0.54153 (0.54250)	Top-1 acc 70.703 (67.282)	Top-5 acc 85.156 (86.169)	lr 0.00060
Train [109][540/3239]	Time 0.269 (0.596)	Data Time 0.001 (0.070)	Loss 2.3871 (2.3568)	Entropy 0.54129 (0.54248)	Top-1 acc 67.969 (67.299)	Top-5 acc 84.766 (86.173)	lr 0.00060
Train [109][550/3239]	Time 0.245 (0.593)	Data Time 0.001 (0.069)	Loss 2.1661 (2.3563)	Entropy 0.54117 (0.54245)	Top-1 acc 70.312 (67.316)	Top-5 acc 91.406 (86.177)	lr 0.00059
Train [109][560/3239]	Time 0.275 (0.590)	Data Time 0.001 (0.068)	Loss 2.4007 (2.3585)	Entropy 0.54120 (0.54243)	Top-1 acc 64.844 (67.261)	Top-5 acc 85.156 (86.134)	lr 0.00059
Train [109][570/3239]	Time 0.243 (0.587)	Data Time 0.001 (0.067)	Loss 2.4457 (2.3584)	Entropy 0.54071 (0.54241)	Top-1 acc 62.109 (67.265)	Top-5 acc 84.375 (86.131)	lr 0.00059
Train [109][580/3239]	Time 0.236 (0.584)	Data Time 0.001 (0.066)	Loss 2.5301 (2.3586)	Entropy 0.54074 (0.54238)	Top-1 acc 64.062 (67.268)	Top-5 acc 83.203 (86.134)	lr 0.00059
Train [109][590/3239]	Time 0.237 (0.582)	Data Time 0.001 (0.065)	Loss 2.2732 (2.3588)	Entropy 0.54079 (0.54235)	Top-1 acc 70.703 (67.279)	Top-5 acc 87.109 (86.125)	lr 0.00059
Train [109][600/3239]	Time 0.344 (0.579)	Data Time 0.001 (0.064)	Loss 2.3573 (2.3579)	Entropy 0.54073 (0.54232)	Top-1 acc 66.406 (67.288)	Top-5 acc 88.281 (86.152)	lr 0.00059
Train [109][610/3239]	Time 0.247 (0.577)	Data Time 0.001 (0.063)	Loss 2.3038 (2.3572)	Entropy 0.54062 (0.54230)	Top-1 acc 69.531 (67.290)	Top-5 acc 86.719 (86.166)	lr 0.00059
Train [109][620/3239]	Time 0.253 (0.575)	Data Time 0.001 (0.062)	Loss 2.1812 (2.3570)	Entropy 0.54040 (0.54227)	Top-1 acc 73.047 (67.294)	Top-5 acc 88.672 (86.168)	lr 0.00059
Train [109][630/3239]	Time 0.235 (0.573)	Data Time 0.001 (0.061)	Loss 2.4753 (2.3573)	Entropy 0.54063 (0.54224)	Top-1 acc 66.797 (67.284)	Top-5 acc 83.203 (86.152)	lr 0.00059
Train [109][640/3239]	Time 0.226 (0.571)	Data Time 0.001 (0.060)	Loss 2.4282 (2.3574)	Entropy 0.54055 (0.54221)	Top-1 acc 64.844 (67.275)	Top-5 acc 86.719 (86.156)	lr 0.00059
Train [109][650/3239]	Time 0.244 (0.569)	Data Time 0.001 (0.059)	Loss 2.2411 (2.3569)	Entropy 0.54010 (0.54219)	Top-1 acc 69.141 (67.287)	Top-5 acc 87.109 (86.163)	lr 0.00059
Train [109][660/3239]	Time 0.249 (0.566)	Data Time 0.001 (0.058)	Loss 2.3458 (2.3584)	Entropy 0.54018 (0.54215)	Top-1 acc 68.359 (67.272)	Top-5 acc 87.109 (86.131)	lr 0.00059
Train [109][670/3239]	Time 0.350 (0.564)	Data Time 0.002 (0.057)	Loss 2.5786 (2.3589)	Entropy 0.54033 (0.54213)	Top-1 acc 60.938 (67.257)	Top-5 acc 83.203 (86.121)	lr 0.00059
Train [109][680/3239]	Time 0.243 (0.562)	Data Time 0.001 (0.056)	Loss 2.1677 (2.3606)	Entropy 0.54037 (0.54210)	Top-1 acc 71.094 (67.222)	Top-5 acc 89.844 (86.098)	lr 0.00059
Train [109][690/3239]	Time 0.225 (0.560)	Data Time 0.001 (0.055)	Loss 2.1934 (2.3600)	Entropy 0.54039 (0.54208)	Top-1 acc 73.438 (67.236)	Top-5 acc 89.453 (86.113)	lr 0.00059
Train [109][700/3239]	Time 0.241 (0.558)	Data Time 0.001 (0.055)	Loss 2.4859 (2.3593)	Entropy 0.54039 (0.54205)	Top-1 acc 64.453 (67.244)	Top-5 acc 86.328 (86.137)	lr 0.00059
Train [109][710/3239]	Time 0.231 (0.555)	Data Time 0.001 (0.054)	Loss 2.3790 (2.3595)	Entropy 0.54036 (0.54203)	Top-1 acc 63.281 (67.241)	Top-5 acc 87.891 (86.124)	lr 0.00059
Train [109][720/3239]	Time 0.225 (0.554)	Data Time 0.001 (0.053)	Loss 2.5427 (2.3600)	Entropy 0.54051 (0.54200)	Top-1 acc 64.453 (67.234)	Top-5 acc 83.594 (86.120)	lr 0.00059
Train [109][730/3239]	Time 0.228 (0.551)	Data Time 0.001 (0.053)	Loss 2.3561 (2.3599)	Entropy 0.54011 (0.54198)	Top-1 acc 66.797 (67.230)	Top-5 acc 83.594 (86.122)	lr 0.00059
Train [109][740/3239]	Time 0.235 (0.550)	Data Time 0.001 (0.052)	Loss 2.3448 (2.3593)	Entropy 0.54010 (0.54196)	Top-1 acc 65.234 (67.232)	Top-5 acc 87.891 (86.133)	lr 0.00059
Train [109][750/3239]	Time 0.223 (0.548)	Data Time 0.001 (0.051)	Loss 2.5981 (2.3602)	Entropy 0.53983 (0.54193)	Top-1 acc 66.016 (67.216)	Top-5 acc 82.031 (86.105)	lr 0.00059
Train [109][760/3239]	Time 0.318 (0.546)	Data Time 0.001 (0.051)	Loss 2.2182 (2.3596)	Entropy 0.53964 (0.54190)	Top-1 acc 71.094 (67.250)	Top-5 acc 88.672 (86.115)	lr 0.00059
Train [109][770/3239]	Time 0.232 (0.544)	Data Time 0.001 (0.050)	Loss 2.1898 (2.3596)	Entropy 0.53960 (0.54187)	Top-1 acc 72.266 (67.259)	Top-5 acc 88.672 (86.111)	lr 0.00059
Train [109][780/3239]	Time 0.226 (0.542)	Data Time 0.001 (0.049)	Loss 2.2448 (2.3587)	Entropy 0.53982 (0.54185)	Top-1 acc 68.750 (67.268)	Top-5 acc 87.500 (86.132)	lr 0.00059
Train [109][790/3239]	Time 0.232 (0.541)	Data Time 0.001 (0.049)	Loss 2.3744 (2.3592)	Entropy 0.54003 (0.54182)	Top-1 acc 64.844 (67.255)	Top-5 acc 87.500 (86.128)	lr 0.00059
Train [109][800/3239]	Time 0.230 (0.539)	Data Time 0.001 (0.048)	Loss 2.4465 (2.3596)	Entropy 0.53973 (0.54180)	Top-1 acc 64.453 (67.244)	Top-5 acc 81.641 (86.114)	lr 0.00059
Train [109][810/3239]	Time 0.256 (0.538)	Data Time 0.001 (0.048)	Loss 2.6771 (2.3604)	Entropy 0.54003 (0.54178)	Top-1 acc 62.109 (67.224)	Top-5 acc 83.594 (86.104)	lr 0.00059
Train [109][820/3239]	Time 0.226 (0.536)	Data Time 0.001 (0.047)	Loss 2.2595 (2.3592)	Entropy 0.54023 (0.54176)	Top-1 acc 68.750 (67.252)	Top-5 acc 88.672 (86.117)	lr 0.00059
Train [109][830/3239]	Time 0.336 (0.535)	Data Time 0.004 (0.046)	Loss 2.3583 (2.3587)	Entropy 0.54048 (0.54174)	Top-1 acc 65.625 (67.266)	Top-5 acc 87.891 (86.132)	lr 0.00059
Train [109][840/3239]	Time 0.268 (0.533)	Data Time 0.001 (0.046)	Loss 2.2445 (2.3584)	Entropy 0.54038 (0.54172)	Top-1 acc 69.922 (67.268)	Top-5 acc 89.844 (86.139)	lr 0.00059
Train [109][850/3239]	Time 0.284 (0.532)	Data Time 0.002 (0.045)	Loss 2.6277 (2.3582)	Entropy 0.54025 (0.54170)	Top-1 acc 60.156 (67.268)	Top-5 acc 80.859 (86.141)	lr 0.00059
Train [109][860/3239]	Time 0.237 (0.532)	Data Time 0.001 (0.045)	Loss 2.3722 (2.3580)	Entropy 0.54034 (0.54169)	Top-1 acc 67.969 (67.279)	Top-5 acc 86.328 (86.138)	lr 0.00059
Train [109][870/3239]	Time 0.225 (0.531)	Data Time 0.001 (0.044)	Loss 2.4017 (2.3573)	Entropy 0.53998 (0.54167)	Top-1 acc 71.484 (67.308)	Top-5 acc 83.594 (86.143)	lr 0.00058
Train [109][880/3239]	Time 0.229 (0.529)	Data Time 0.001 (0.044)	Loss 2.5496 (2.3579)	Entropy 0.54022 (0.54165)	Top-1 acc 63.672 (67.298)	Top-5 acc 81.641 (86.133)	lr 0.00058
Train [109][890/3239]	Time 0.230 (0.528)	Data Time 0.001 (0.043)	Loss 2.2997 (2.3582)	Entropy 0.54004 (0.54163)	Top-1 acc 70.703 (67.291)	Top-5 acc 84.766 (86.122)	lr 0.00058
Train [109][900/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.043)	Loss 2.1842 (2.3584)	Entropy 0.53970 (0.54162)	Top-1 acc 71.875 (67.287)	Top-5 acc 88.672 (86.122)	lr 0.00058
Train [109][910/3239]	Time 0.231 (0.525)	Data Time 0.001 (0.042)	Loss 2.4220 (2.3585)	Entropy 0.53955 (0.54159)	Top-1 acc 66.797 (67.288)	Top-5 acc 85.547 (86.119)	lr 0.00058
Train [109][920/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.042)	Loss 2.5193 (2.3577)	Entropy 0.54005 (0.54157)	Top-1 acc 62.891 (67.311)	Top-5 acc 82.031 (86.129)	lr 0.00058
Train [109][930/3239]	Time 0.219 (0.522)	Data Time 0.001 (0.042)	Loss 2.4742 (2.3577)	Entropy 0.53988 (0.54156)	Top-1 acc 68.750 (67.314)	Top-5 acc 84.766 (86.129)	lr 0.00058
Train [109][940/3239]	Time 0.218 (0.521)	Data Time 0.001 (0.041)	Loss 2.6450 (2.3577)	Entropy 0.54008 (0.54154)	Top-1 acc 58.203 (67.305)	Top-5 acc 81.250 (86.131)	lr 0.00058
Train [109][950/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.041)	Loss 2.2252 (2.3578)	Entropy 0.53984 (0.54152)	Top-1 acc 69.922 (67.295)	Top-5 acc 87.891 (86.127)	lr 0.00058
Train [109][960/3239]	Time 0.235 (0.518)	Data Time 0.001 (0.040)	Loss 2.3914 (2.3576)	Entropy 0.53975 (0.54151)	Top-1 acc 65.625 (67.297)	Top-5 acc 86.328 (86.126)	lr 0.00058
Train [109][970/3239]	Time 0.275 (0.518)	Data Time 0.001 (0.040)	Loss 2.1359 (2.3570)	Entropy 0.53955 (0.54149)	Top-1 acc 75.391 (67.313)	Top-5 acc 89.062 (86.132)	lr 0.00058
Train [109][980/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.040)	Loss 2.2077 (2.3574)	Entropy 0.53981 (0.54147)	Top-1 acc 73.047 (67.308)	Top-5 acc 87.891 (86.117)	lr 0.00058
Train [109][990/3239]	Time 0.360 (0.515)	Data Time 0.001 (0.039)	Loss 2.1223 (2.3567)	Entropy 0.53940 (0.54145)	Top-1 acc 70.312 (67.325)	Top-5 acc 91.016 (86.131)	lr 0.00058
Train [109][1000/3239]	Time 0.244 (0.514)	Data Time 0.001 (0.039)	Loss 2.3474 (2.3567)	Entropy 0.53973 (0.54143)	Top-1 acc 68.359 (67.324)	Top-5 acc 87.500 (86.132)	lr 0.00058
Train [109][1010/3239]	Time 0.236 (0.513)	Data Time 0.001 (0.038)	Loss 2.4451 (2.3569)	Entropy 0.53936 (0.54141)	Top-1 acc 62.891 (67.307)	Top-5 acc 85.156 (86.131)	lr 0.00058
Train [109][1020/3239]	Time 0.240 (0.513)	Data Time 0.001 (0.038)	Loss 2.5388 (2.3571)	Entropy 0.53941 (0.54139)	Top-1 acc 62.500 (67.309)	Top-5 acc 83.203 (86.126)	lr 0.00058
Train [109][1030/3239]	Time 0.248 (0.512)	Data Time 0.002 (0.038)	Loss 2.1559 (2.3567)	Entropy 0.53954 (0.54137)	Top-1 acc 71.094 (67.319)	Top-5 acc 91.016 (86.131)	lr 0.00058
Train [109][1040/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.037)	Loss 2.2491 (2.3567)	Entropy 0.53919 (0.54135)	Top-1 acc 70.312 (67.321)	Top-5 acc 88.281 (86.129)	lr 0.00058
Train [109][1050/3239]	Time 0.247 (0.511)	Data Time 0.001 (0.037)	Loss 2.7037 (2.3572)	Entropy 0.53907 (0.54133)	Top-1 acc 59.375 (67.317)	Top-5 acc 79.297 (86.118)	lr 0.00058
Train [109][1060/3239]	Time 0.324 (0.510)	Data Time 0.001 (0.037)	Loss 2.2069 (2.3569)	Entropy 0.53911 (0.54131)	Top-1 acc 69.531 (67.319)	Top-5 acc 87.500 (86.124)	lr 0.00058
Train [109][1070/3239]	Time 0.278 (0.509)	Data Time 0.001 (0.036)	Loss 2.3582 (2.3568)	Entropy 0.53913 (0.54129)	Top-1 acc 69.922 (67.321)	Top-5 acc 85.547 (86.124)	lr 0.00058
Train [109][1080/3239]	Time 0.230 (0.508)	Data Time 0.001 (0.036)	Loss 2.5031 (2.3566)	Entropy 0.53902 (0.54127)	Top-1 acc 60.938 (67.327)	Top-5 acc 82.812 (86.120)	lr 0.00058
Train [109][1090/3239]	Time 0.230 (0.507)	Data Time 0.001 (0.036)	Loss 2.1725 (2.3566)	Entropy 0.53939 (0.54125)	Top-1 acc 71.875 (67.332)	Top-5 acc 89.062 (86.117)	lr 0.00058
Train [109][1100/3239]	Time 0.244 (0.506)	Data Time 0.001 (0.035)	Loss 2.2592 (2.3564)	Entropy 0.53964 (0.54123)	Top-1 acc 69.531 (67.330)	Top-5 acc 87.109 (86.120)	lr 0.00058
Train [109][1110/3239]	Time 0.217 (0.506)	Data Time 0.001 (0.035)	Loss 2.7108 (2.3568)	Entropy 0.53942 (0.54122)	Top-1 acc 60.156 (67.320)	Top-5 acc 82.031 (86.118)	lr 0.00058
Train [109][1120/3239]	Time 0.239 (0.505)	Data Time 0.001 (0.035)	Loss 2.1962 (2.3560)	Entropy 0.53956 (0.54120)	Top-1 acc 71.094 (67.345)	Top-5 acc 87.500 (86.128)	lr 0.00058
Train [109][1130/3239]	Time 0.399 (0.548)	Data Time 0.005 (0.035)	Loss 2.0525 (2.3559)	Entropy 0.53944 (0.54119)	Top-1 acc 76.562 (67.345)	Top-5 acc 92.188 (86.127)	lr 0.00058
Train [109][1140/3239]	Time 0.239 (0.548)	Data Time 0.002 (0.034)	Loss 2.5104 (2.3563)	Entropy 0.53947 (0.54117)	Top-1 acc 58.594 (67.336)	Top-5 acc 85.547 (86.127)	lr 0.00058
Train [109][1150/3239]	Time 0.339 (0.547)	Data Time 0.001 (0.034)	Loss 2.4155 (2.3562)	Entropy 0.53966 (0.54116)	Top-1 acc 66.016 (67.343)	Top-5 acc 86.328 (86.134)	lr 0.00058
Train [109][1160/3239]	Time 0.294 (0.547)	Data Time 0.002 (0.034)	Loss 2.2581 (2.3564)	Entropy 0.53970 (0.54115)	Top-1 acc 69.531 (67.339)	Top-5 acc 87.109 (86.129)	lr 0.00058
Train [109][1170/3239]	Time 0.234 (0.546)	Data Time 0.001 (0.033)	Loss 2.3346 (2.3566)	Entropy 0.53976 (0.54113)	Top-1 acc 67.969 (67.336)	Top-5 acc 87.500 (86.128)	lr 0.00058
Train [109][1180/3239]	Time 0.234 (0.545)	Data Time 0.001 (0.033)	Loss 2.3665 (2.3563)	Entropy 0.54003 (0.54112)	Top-1 acc 67.969 (67.344)	Top-5 acc 86.328 (86.131)	lr 0.00058
Train [109][1190/3239]	Time 0.233 (0.544)	Data Time 0.001 (0.033)	Loss 2.2351 (2.3568)	Entropy 0.54000 (0.54112)	Top-1 acc 69.141 (67.335)	Top-5 acc 89.453 (86.118)	lr 0.00058
Train [109][1200/3239]	Time 0.227 (0.543)	Data Time 0.001 (0.033)	Loss 2.2630 (2.3569)	Entropy 0.53985 (0.54111)	Top-1 acc 70.312 (67.329)	Top-5 acc 87.891 (86.114)	lr 0.00057
Train [109][1210/3239]	Time 0.224 (0.542)	Data Time 0.001 (0.032)	Loss 2.4090 (2.3566)	Entropy 0.53976 (0.54109)	Top-1 acc 66.016 (67.336)	Top-5 acc 85.156 (86.121)	lr 0.00057
Train [109][1220/3239]	Time 0.357 (0.541)	Data Time 0.001 (0.032)	Loss 2.5721 (2.3564)	Entropy 0.53921 (0.54108)	Top-1 acc 62.109 (67.338)	Top-5 acc 83.594 (86.127)	lr 0.00057
Train [109][1230/3239]	Time 0.234 (0.540)	Data Time 0.001 (0.032)	Loss 2.3380 (2.3559)	Entropy 0.53904 (0.54107)	Top-1 acc 69.531 (67.348)	Top-5 acc 86.328 (86.136)	lr 0.00057
Train [109][1240/3239]	Time 0.226 (0.539)	Data Time 0.001 (0.032)	Loss 2.5172 (2.3561)	Entropy 0.53920 (0.54105)	Top-1 acc 60.547 (67.342)	Top-5 acc 85.547 (86.130)	lr 0.00057
Train [109][1250/3239]	Time 0.221 (0.538)	Data Time 0.001 (0.031)	Loss 2.2678 (2.3563)	Entropy 0.53956 (0.54104)	Top-1 acc 69.922 (67.336)	Top-5 acc 87.500 (86.127)	lr 0.00057
Train [109][1260/3239]	Time 0.225 (0.537)	Data Time 0.001 (0.031)	Loss 2.3342 (2.3562)	Entropy 0.53980 (0.54103)	Top-1 acc 68.359 (67.336)	Top-5 acc 87.500 (86.129)	lr 0.00057
Train [109][1270/3239]	Time 0.218 (0.536)	Data Time 0.001 (0.031)	Loss 2.5833 (2.3565)	Entropy 0.53969 (0.54102)	Top-1 acc 62.891 (67.331)	Top-5 acc 81.250 (86.126)	lr 0.00057
Train [109][1280/3239]	Time 0.227 (0.534)	Data Time 0.001 (0.031)	Loss 2.3288 (2.3567)	Entropy 0.53983 (0.54101)	Top-1 acc 68.359 (67.327)	Top-5 acc 86.328 (86.123)	lr 0.00057
Train [109][1290/3239]	Time 0.256 (0.534)	Data Time 0.001 (0.030)	Loss 2.5353 (2.3565)	Entropy 0.53996 (0.54100)	Top-1 acc 64.062 (67.334)	Top-5 acc 83.203 (86.139)	lr 0.00057
Train [109][1300/3239]	Time 0.226 (0.533)	Data Time 0.001 (0.030)	Loss 2.3346 (2.3562)	Entropy 0.53984 (0.54099)	Top-1 acc 64.453 (67.340)	Top-5 acc 87.891 (86.141)	lr 0.00057
Train [109][1310/3239]	Time 0.401 (0.532)	Data Time 0.001 (0.030)	Loss 2.2098 (2.3561)	Entropy 0.53982 (0.54098)	Top-1 acc 72.656 (67.338)	Top-5 acc 87.891 (86.142)	lr 0.00057
Train [109][1320/3239]	Time 0.270 (0.531)	Data Time 0.001 (0.030)	Loss 2.3380 (2.3558)	Entropy 0.53969 (0.54097)	Top-1 acc 66.797 (67.357)	Top-5 acc 85.156 (86.144)	lr 0.00057
Train [109][1330/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.030)	Loss 2.5934 (2.3568)	Entropy 0.53973 (0.54096)	Top-1 acc 58.594 (67.329)	Top-5 acc 82.812 (86.132)	lr 0.00057
Train [109][1340/3239]	Time 0.275 (0.530)	Data Time 0.001 (0.029)	Loss 2.3174 (2.3570)	Entropy 0.53940 (0.54095)	Top-1 acc 69.922 (67.328)	Top-5 acc 87.891 (86.132)	lr 0.00057
Train [109][1350/3239]	Time 0.245 (0.529)	Data Time 0.001 (0.029)	Loss 2.4965 (2.3565)	Entropy 0.53948 (0.54094)	Top-1 acc 65.234 (67.339)	Top-5 acc 83.203 (86.138)	lr 0.00057
Train [109][1360/3239]	Time 0.248 (0.528)	Data Time 0.001 (0.029)	Loss 2.1574 (2.3563)	Entropy 0.53914 (0.54093)	Top-1 acc 74.609 (67.341)	Top-5 acc 90.625 (86.144)	lr 0.00057
Train [109][1370/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.029)	Loss 2.4336 (2.3562)	Entropy 0.53894 (0.54091)	Top-1 acc 67.188 (67.346)	Top-5 acc 86.719 (86.147)	lr 0.00057
Train [109][1380/3239]	Time 0.332 (0.527)	Data Time 0.001 (0.029)	Loss 2.1370 (2.3561)	Entropy 0.53871 (0.54090)	Top-1 acc 73.047 (67.353)	Top-5 acc 87.500 (86.146)	lr 0.00057
Train [109][1390/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.028)	Loss 2.8292 (2.3566)	Entropy 0.53856 (0.54088)	Top-1 acc 54.688 (67.342)	Top-5 acc 76.953 (86.140)	lr 0.00057
Train [109][1400/3239]	Time 0.254 (0.525)	Data Time 0.001 (0.028)	Loss 2.3626 (2.3569)	Entropy 0.53858 (0.54087)	Top-1 acc 67.578 (67.337)	Top-5 acc 84.375 (86.131)	lr 0.00057
Train [109][1410/3239]	Time 0.222 (0.525)	Data Time 0.001 (0.028)	Loss 2.2753 (2.3568)	Entropy 0.53854 (0.54085)	Top-1 acc 71.484 (67.338)	Top-5 acc 88.672 (86.137)	lr 0.00057
Train [109][1420/3239]	Time 0.238 (0.524)	Data Time 0.001 (0.028)	Loss 2.3474 (2.3567)	Entropy 0.53867 (0.54083)	Top-1 acc 64.844 (67.343)	Top-5 acc 87.500 (86.140)	lr 0.00057
Train [109][1430/3239]	Time 0.243 (0.523)	Data Time 0.001 (0.028)	Loss 2.7460 (2.3567)	Entropy 0.53863 (0.54082)	Top-1 acc 57.812 (67.339)	Top-5 acc 79.688 (86.141)	lr 0.00057
Train [109][1440/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.027)	Loss 2.3782 (2.3564)	Entropy 0.53869 (0.54080)	Top-1 acc 69.531 (67.350)	Top-5 acc 87.891 (86.151)	lr 0.00057
Train [109][1450/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.027)	Loss 2.3007 (2.3563)	Entropy 0.53849 (0.54079)	Top-1 acc 66.797 (67.344)	Top-5 acc 88.281 (86.152)	lr 0.00057
Train [109][1460/3239]	Time 0.239 (0.521)	Data Time 0.001 (0.027)	Loss 2.2835 (2.3560)	Entropy 0.53848 (0.54077)	Top-1 acc 70.703 (67.348)	Top-5 acc 88.672 (86.155)	lr 0.00057
Train [109][1470/3239]	Time 0.316 (0.520)	Data Time 0.001 (0.027)	Loss 2.3463 (2.3559)	Entropy 0.53867 (0.54076)	Top-1 acc 67.578 (67.350)	Top-5 acc 85.938 (86.156)	lr 0.00057
Train [109][1480/3239]	Time 0.236 (0.520)	Data Time 0.001 (0.027)	Loss 2.2140 (2.3559)	Entropy 0.53854 (0.54074)	Top-1 acc 71.875 (67.352)	Top-5 acc 89.453 (86.153)	lr 0.00057
Train [109][1490/3239]	Time 0.230 (0.519)	Data Time 0.001 (0.027)	Loss 2.3173 (2.3559)	Entropy 0.53832 (0.54073)	Top-1 acc 71.094 (67.351)	Top-5 acc 85.547 (86.147)	lr 0.00057
Train [109][1500/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.026)	Loss 2.1827 (2.3556)	Entropy 0.53850 (0.54071)	Top-1 acc 72.266 (67.357)	Top-5 acc 87.500 (86.145)	lr 0.00057
Train [109][1510/3239]	Time 0.226 (0.517)	Data Time 0.001 (0.026)	Loss 2.3399 (2.3553)	Entropy 0.53864 (0.54070)	Top-1 acc 67.188 (67.358)	Top-5 acc 83.984 (86.148)	lr 0.00057
Train [109][1520/3239]	Time 0.263 (0.517)	Data Time 0.001 (0.026)	Loss 2.2329 (2.3555)	Entropy 0.53879 (0.54068)	Top-1 acc 71.484 (67.356)	Top-5 acc 88.672 (86.150)	lr 0.00057
Train [109][1530/3239]	Time 0.232 (0.516)	Data Time 0.001 (0.026)	Loss 2.3071 (2.3557)	Entropy 0.53839 (0.54067)	Top-1 acc 68.750 (67.347)	Top-5 acc 86.719 (86.148)	lr 0.00056
Train [109][1540/3239]	Time 0.317 (0.515)	Data Time 0.001 (0.026)	Loss 2.5421 (2.3562)	Entropy 0.53839 (0.54066)	Top-1 acc 61.719 (67.336)	Top-5 acc 83.203 (86.139)	lr 0.00056
Train [109][1550/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.026)	Loss 2.2525 (2.3565)	Entropy 0.53826 (0.54064)	Top-1 acc 69.141 (67.326)	Top-5 acc 87.500 (86.134)	lr 0.00056
Train [109][1560/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.025)	Loss 2.3768 (2.3565)	Entropy 0.53812 (0.54062)	Top-1 acc 67.188 (67.325)	Top-5 acc 85.156 (86.131)	lr 0.00056
Train [109][1570/3239]	Time 0.229 (0.513)	Data Time 0.001 (0.025)	Loss 2.3234 (2.3566)	Entropy 0.53815 (0.54061)	Top-1 acc 65.625 (67.324)	Top-5 acc 86.719 (86.131)	lr 0.00056
Train [109][1580/3239]	Time 0.229 (0.512)	Data Time 0.001 (0.025)	Loss 2.4091 (2.3566)	Entropy 0.53851 (0.54059)	Top-1 acc 65.234 (67.320)	Top-5 acc 83.594 (86.130)	lr 0.00056
Train [109][1590/3239]	Time 0.255 (0.512)	Data Time 0.001 (0.025)	Loss 2.2408 (2.3561)	Entropy 0.53857 (0.54058)	Top-1 acc 71.094 (67.332)	Top-5 acc 85.938 (86.132)	lr 0.00056
Train [109][1600/3239]	Time 0.256 (0.511)	Data Time 0.001 (0.025)	Loss 2.2962 (2.3560)	Entropy 0.53844 (0.54057)	Top-1 acc 69.922 (67.338)	Top-5 acc 89.453 (86.134)	lr 0.00056
Train [109][1610/3239]	Time 0.256 (0.511)	Data Time 0.001 (0.025)	Loss 2.2353 (2.3559)	Entropy 0.53871 (0.54056)	Top-1 acc 72.266 (67.335)	Top-5 acc 87.891 (86.137)	lr 0.00056
Train [109][1620/3239]	Time 0.219 (0.510)	Data Time 0.001 (0.025)	Loss 2.1329 (2.3559)	Entropy 0.53874 (0.54055)	Top-1 acc 73.438 (67.334)	Top-5 acc 90.625 (86.138)	lr 0.00056
Train [109][1630/3239]	Time 0.228 (0.509)	Data Time 0.001 (0.024)	Loss 2.3941 (2.3563)	Entropy 0.53856 (0.54053)	Top-1 acc 68.750 (67.322)	Top-5 acc 83.984 (86.130)	lr 0.00056
Train [109][1640/3239]	Time 0.228 (0.509)	Data Time 0.001 (0.024)	Loss 2.3538 (2.3562)	Entropy 0.53875 (0.54052)	Top-1 acc 66.797 (67.322)	Top-5 acc 86.328 (86.127)	lr 0.00056
Train [109][1650/3239]	Time 0.228 (0.508)	Data Time 0.001 (0.024)	Loss 2.4262 (2.3561)	Entropy 0.53853 (0.54051)	Top-1 acc 65.234 (67.325)	Top-5 acc 84.766 (86.126)	lr 0.00056
Train [109][1660/3239]	Time 0.249 (0.507)	Data Time 0.001 (0.024)	Loss 2.3195 (2.3563)	Entropy 0.53889 (0.54050)	Top-1 acc 66.797 (67.321)	Top-5 acc 85.547 (86.122)	lr 0.00056
Train [109][1670/3239]	Time 0.236 (0.507)	Data Time 0.001 (0.024)	Loss 2.2132 (2.3561)	Entropy 0.53880 (0.54049)	Top-1 acc 69.922 (67.326)	Top-5 acc 88.281 (86.127)	lr 0.00056
Train [109][1680/3239]	Time 0.220 (0.506)	Data Time 0.001 (0.024)	Loss 2.3051 (2.3559)	Entropy 0.53878 (0.54048)	Top-1 acc 64.844 (67.326)	Top-5 acc 87.891 (86.127)	lr 0.00056
Train [109][1690/3239]	Time 0.230 (0.505)	Data Time 0.001 (0.024)	Loss 2.3931 (2.3557)	Entropy 0.53904 (0.54047)	Top-1 acc 67.969 (67.331)	Top-5 acc 84.375 (86.133)	lr 0.00056
Train [109][1700/3239]	Time 0.321 (0.505)	Data Time 0.001 (0.024)	Loss 2.2796 (2.3554)	Entropy 0.53947 (0.54046)	Top-1 acc 69.141 (67.339)	Top-5 acc 86.719 (86.141)	lr 0.00056
Train [109][1710/3239]	Time 0.225 (0.504)	Data Time 0.001 (0.023)	Loss 2.2718 (2.3554)	Entropy 0.53957 (0.54046)	Top-1 acc 69.922 (67.334)	Top-5 acc 87.500 (86.139)	lr 0.00056
Train [109][1720/3239]	Time 0.234 (0.504)	Data Time 0.001 (0.023)	Loss 2.4765 (2.3554)	Entropy 0.53930 (0.54045)	Top-1 acc 66.016 (67.335)	Top-5 acc 83.984 (86.143)	lr 0.00056
Train [109][1730/3239]	Time 0.227 (0.503)	Data Time 0.001 (0.023)	Loss 2.2500 (2.3553)	Entropy 0.53956 (0.54045)	Top-1 acc 68.750 (67.338)	Top-5 acc 86.328 (86.141)	lr 0.00056
Train [109][1740/3239]	Time 0.232 (0.503)	Data Time 0.001 (0.023)	Loss 2.2878 (2.3552)	Entropy 0.53937 (0.54044)	Top-1 acc 70.312 (67.338)	Top-5 acc 87.109 (86.144)	lr 0.00056
Train [109][1750/3239]	Time 0.228 (0.502)	Data Time 0.001 (0.023)	Loss 2.2852 (2.3553)	Entropy 0.53896 (0.54043)	Top-1 acc 66.797 (67.332)	Top-5 acc 88.281 (86.143)	lr 0.00056
Train [109][1760/3239]	Time 0.233 (0.502)	Data Time 0.001 (0.023)	Loss 2.4483 (2.3559)	Entropy 0.53897 (0.54042)	Top-1 acc 68.750 (67.317)	Top-5 acc 83.594 (86.134)	lr 0.00056
Train [109][1770/3239]	Time 0.325 (0.501)	Data Time 0.001 (0.023)	Loss 2.3182 (2.3558)	Entropy 0.53861 (0.54042)	Top-1 acc 71.484 (67.317)	Top-5 acc 85.547 (86.133)	lr 0.00056
Train [109][1780/3239]	Time 0.231 (0.501)	Data Time 0.001 (0.023)	Loss 2.2210 (2.3558)	Entropy 0.53868 (0.54041)	Top-1 acc 69.531 (67.316)	Top-5 acc 88.672 (86.133)	lr 0.00056
Train [109][1790/3239]	Time 0.295 (0.529)	Data Time 0.002 (0.022)	Loss 2.2813 (2.3560)	Entropy 0.53894 (0.54040)	Top-1 acc 71.094 (67.317)	Top-5 acc 85.938 (86.129)	lr 0.00056
Train [109][1800/3239]	Time 0.242 (0.529)	Data Time 0.002 (0.022)	Loss 2.2524 (2.3558)	Entropy 0.53925 (0.54039)	Top-1 acc 65.234 (67.320)	Top-5 acc 88.281 (86.129)	lr 0.00056
Train [109][1810/3239]	Time 0.237 (0.528)	Data Time 0.001 (0.022)	Loss 2.3173 (2.3558)	Entropy 0.53913 (0.54038)	Top-1 acc 72.656 (67.324)	Top-5 acc 85.938 (86.129)	lr 0.00056
Train [109][1820/3239]	Time 0.252 (0.527)	Data Time 0.001 (0.022)	Loss 2.1587 (2.3554)	Entropy 0.53949 (0.54038)	Top-1 acc 73.047 (67.334)	Top-5 acc 87.109 (86.139)	lr 0.00056
Train [109][1830/3239]	Time 0.255 (0.527)	Data Time 0.001 (0.022)	Loss 2.2828 (2.3550)	Entropy 0.53918 (0.54037)	Top-1 acc 68.359 (67.342)	Top-5 acc 88.672 (86.147)	lr 0.00056
Train [109][1840/3239]	Time 0.235 (0.526)	Data Time 0.001 (0.022)	Loss 2.4471 (2.3549)	Entropy 0.53921 (0.54036)	Top-1 acc 65.625 (67.338)	Top-5 acc 83.594 (86.148)	lr 0.00056
Train [109][1850/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.022)	Loss 2.4436 (2.3551)	Entropy 0.53957 (0.54036)	Top-1 acc 66.797 (67.330)	Top-5 acc 85.156 (86.150)	lr 0.00056
Train [109][1860/3239]	Time 0.352 (0.525)	Data Time 0.001 (0.022)	Loss 2.2964 (2.3551)	Entropy 0.53954 (0.54035)	Top-1 acc 68.359 (67.325)	Top-5 acc 85.156 (86.151)	lr 0.00056
Train [109][1870/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.022)	Loss 2.4353 (2.3556)	Entropy 0.53950 (0.54035)	Top-1 acc 67.969 (67.318)	Top-5 acc 84.375 (86.146)	lr 0.00055
Train [109][1880/3239]	Time 0.227 (0.524)	Data Time 0.001 (0.021)	Loss 2.1326 (2.3552)	Entropy 0.53965 (0.54035)	Top-1 acc 71.484 (67.325)	Top-5 acc 88.672 (86.152)	lr 0.00055
Train [109][1890/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.021)	Loss 2.2474 (2.3549)	Entropy 0.53973 (0.54034)	Top-1 acc 69.922 (67.334)	Top-5 acc 89.062 (86.159)	lr 0.00055
Train [109][1900/3239]	Time 0.231 (0.523)	Data Time 0.001 (0.021)	Loss 2.2579 (2.3548)	Entropy 0.53978 (0.54034)	Top-1 acc 71.875 (67.335)	Top-5 acc 89.062 (86.160)	lr 0.00055
Train [109][1910/3239]	Time 0.245 (0.522)	Data Time 0.002 (0.021)	Loss 2.4796 (2.3548)	Entropy 0.53997 (0.54034)	Top-1 acc 65.234 (67.340)	Top-5 acc 83.594 (86.163)	lr 0.00055
Train [109][1920/3239]	Time 0.233 (0.521)	Data Time 0.001 (0.021)	Loss 2.3921 (2.3548)	Entropy 0.53999 (0.54033)	Top-1 acc 62.891 (67.336)	Top-5 acc 85.156 (86.160)	lr 0.00055
Train [109][1930/3239]	Time 0.311 (0.521)	Data Time 0.001 (0.021)	Loss 2.0752 (2.3547)	Entropy 0.53929 (0.54033)	Top-1 acc 77.344 (67.338)	Top-5 acc 91.016 (86.161)	lr 0.00055
Train [109][1940/3239]	Time 0.225 (0.520)	Data Time 0.001 (0.021)	Loss 2.3532 (2.3549)	Entropy 0.53879 (0.54032)	Top-1 acc 67.578 (67.332)	Top-5 acc 86.719 (86.158)	lr 0.00055
Train [109][1950/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.021)	Loss 2.3140 (2.3551)	Entropy 0.53879 (0.54032)	Top-1 acc 67.969 (67.330)	Top-5 acc 87.891 (86.155)	lr 0.00055
Train [109][1960/3239]	Time 0.266 (0.519)	Data Time 0.001 (0.021)	Loss 2.2442 (2.3553)	Entropy 0.53884 (0.54031)	Top-1 acc 67.578 (67.326)	Top-5 acc 89.062 (86.152)	lr 0.00055
Train [109][1970/3239]	Time 0.342 (0.519)	Data Time 0.002 (0.021)	Loss 2.5724 (2.3555)	Entropy 0.53851 (0.54030)	Top-1 acc 64.844 (67.321)	Top-5 acc 83.203 (86.155)	lr 0.00055
Train [109][1980/3239]	Time 0.315 (0.520)	Data Time 0.002 (0.020)	Loss 2.2746 (2.3559)	Entropy 0.53866 (0.54029)	Top-1 acc 65.625 (67.313)	Top-5 acc 90.625 (86.150)	lr 0.00055
Train [109][1990/3239]	Time 0.246 (0.519)	Data Time 0.001 (0.020)	Loss 2.2975 (2.3556)	Entropy 0.53850 (0.54028)	Top-1 acc 68.750 (67.318)	Top-5 acc 87.891 (86.155)	lr 0.00055
Train [109][2000/3239]	Time 0.233 (0.519)	Data Time 0.001 (0.020)	Loss 2.4660 (2.3559)	Entropy 0.53852 (0.54027)	Top-1 acc 62.500 (67.312)	Top-5 acc 85.938 (86.156)	lr 0.00055
Train [109][2010/3239]	Time 0.238 (0.518)	Data Time 0.001 (0.020)	Loss 2.4262 (2.3562)	Entropy 0.53844 (0.54026)	Top-1 acc 63.281 (67.302)	Top-5 acc 85.547 (86.150)	lr 0.00055
Train [109][2020/3239]	Time 0.245 (0.518)	Data Time 0.001 (0.020)	Loss 2.4990 (2.3566)	Entropy 0.53793 (0.54025)	Top-1 acc 62.891 (67.291)	Top-5 acc 84.375 (86.142)	lr 0.00055
Train [109][2030/3239]	Time 0.236 (0.517)	Data Time 0.001 (0.020)	Loss 2.5384 (2.3567)	Entropy 0.53794 (0.54024)	Top-1 acc 62.500 (67.291)	Top-5 acc 82.812 (86.141)	lr 0.00055
Train [109][2040/3239]	Time 0.229 (0.517)	Data Time 0.001 (0.020)	Loss 2.3938 (2.3569)	Entropy 0.53810 (0.54023)	Top-1 acc 61.328 (67.285)	Top-5 acc 85.156 (86.136)	lr 0.00055
Train [109][2050/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.020)	Loss 2.3903 (2.3567)	Entropy 0.53830 (0.54022)	Top-1 acc 67.188 (67.287)	Top-5 acc 83.203 (86.135)	lr 0.00055
Train [109][2060/3239]	Time 0.243 (0.516)	Data Time 0.001 (0.020)	Loss 2.6540 (2.3570)	Entropy 0.53803 (0.54021)	Top-1 acc 62.891 (67.277)	Top-5 acc 83.984 (86.136)	lr 0.00055
Train [109][2070/3239]	Time 0.226 (0.515)	Data Time 0.001 (0.020)	Loss 2.7337 (2.3571)	Entropy 0.53774 (0.54020)	Top-1 acc 56.641 (67.274)	Top-5 acc 77.344 (86.134)	lr 0.00055
Train [109][2080/3239]	Time 0.235 (0.515)	Data Time 0.001 (0.020)	Loss 2.1995 (2.3570)	Entropy 0.53736 (0.54019)	Top-1 acc 71.484 (67.276)	Top-5 acc 86.328 (86.135)	lr 0.00055
Train [109][2090/3239]	Time 0.345 (0.514)	Data Time 0.001 (0.019)	Loss 2.4783 (2.3569)	Entropy 0.53745 (0.54017)	Top-1 acc 67.578 (67.282)	Top-5 acc 83.594 (86.136)	lr 0.00055
Train [109][2100/3239]	Time 0.228 (0.514)	Data Time 0.001 (0.019)	Loss 2.4375 (2.3570)	Entropy 0.53722 (0.54016)	Top-1 acc 65.625 (67.284)	Top-5 acc 83.594 (86.134)	lr 0.00055
Train [109][2110/3239]	Time 0.234 (0.513)	Data Time 0.001 (0.019)	Loss 2.3340 (2.3569)	Entropy 0.53706 (0.54015)	Top-1 acc 66.016 (67.283)	Top-5 acc 86.719 (86.137)	lr 0.00055
Train [109][2120/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.019)	Loss 2.1121 (2.3569)	Entropy 0.53678 (0.54013)	Top-1 acc 72.266 (67.280)	Top-5 acc 91.016 (86.138)	lr 0.00055
Train [109][2130/3239]	Time 0.232 (0.512)	Data Time 0.001 (0.019)	Loss 2.2017 (2.3567)	Entropy 0.53704 (0.54012)	Top-1 acc 76.172 (67.290)	Top-5 acc 89.453 (86.138)	lr 0.00055
Train [109][2140/3239]	Time 0.241 (0.512)	Data Time 0.001 (0.019)	Loss 2.2821 (2.3568)	Entropy 0.53680 (0.54010)	Top-1 acc 65.234 (67.287)	Top-5 acc 87.109 (86.138)	lr 0.00055
Train [109][2150/3239]	Time 0.270 (0.511)	Data Time 0.001 (0.019)	Loss 2.3570 (2.3568)	Entropy 0.53709 (0.54009)	Top-1 acc 63.672 (67.283)	Top-5 acc 85.547 (86.137)	lr 0.00055
Train [109][2160/3239]	Time 0.355 (0.511)	Data Time 0.001 (0.019)	Loss 2.3209 (2.3567)	Entropy 0.53699 (0.54007)	Top-1 acc 70.703 (67.289)	Top-5 acc 86.328 (86.138)	lr 0.00055
Train [109][2170/3239]	Time 0.231 (0.511)	Data Time 0.001 (0.019)	Loss 2.4674 (2.3568)	Entropy 0.53690 (0.54006)	Top-1 acc 66.406 (67.290)	Top-5 acc 82.812 (86.136)	lr 0.00055
Train [109][2180/3239]	Time 0.237 (0.510)	Data Time 0.001 (0.019)	Loss 2.3301 (2.3568)	Entropy 0.53681 (0.54004)	Top-1 acc 69.141 (67.288)	Top-5 acc 84.766 (86.135)	lr 0.00055
Train [109][2190/3239]	Time 0.261 (0.510)	Data Time 0.001 (0.019)	Loss 3.0834 (2.3574)	Entropy 0.53694 (0.54003)	Top-1 acc 52.734 (67.276)	Top-5 acc 73.828 (86.126)	lr 0.00055
Train [109][2200/3239]	Time 0.236 (0.509)	Data Time 0.001 (0.019)	Loss 2.2856 (2.3574)	Entropy 0.53700 (0.54002)	Top-1 acc 70.703 (67.278)	Top-5 acc 86.719 (86.124)	lr 0.00055
Train [109][2210/3239]	Time 0.225 (0.509)	Data Time 0.001 (0.019)	Loss 2.1520 (2.3573)	Entropy 0.53715 (0.54000)	Top-1 acc 73.047 (67.284)	Top-5 acc 91.406 (86.124)	lr 0.00054
Train [109][2220/3239]	Time 0.248 (0.509)	Data Time 0.001 (0.018)	Loss 2.2910 (2.3574)	Entropy 0.53690 (0.53999)	Top-1 acc 69.531 (67.277)	Top-5 acc 87.500 (86.123)	lr 0.00054
Train [109][2230/3239]	Time 0.227 (0.508)	Data Time 0.001 (0.018)	Loss 2.1841 (2.3571)	Entropy 0.53658 (0.53997)	Top-1 acc 67.969 (67.282)	Top-5 acc 90.625 (86.130)	lr 0.00054
Train [109][2240/3239]	Time 0.298 (0.508)	Data Time 0.001 (0.018)	Loss 2.2277 (2.3573)	Entropy 0.53680 (0.53996)	Top-1 acc 71.484 (67.281)	Top-5 acc 88.672 (86.128)	lr 0.00054
Train [109][2250/3239]	Time 0.321 (0.507)	Data Time 0.001 (0.018)	Loss 2.3443 (2.3571)	Entropy 0.53684 (0.53995)	Top-1 acc 67.969 (67.286)	Top-5 acc 84.766 (86.132)	lr 0.00054
Train [109][2260/3239]	Time 0.232 (0.507)	Data Time 0.001 (0.018)	Loss 2.2078 (2.3571)	Entropy 0.53661 (0.53993)	Top-1 acc 71.094 (67.285)	Top-5 acc 85.938 (86.131)	lr 0.00054
Train [109][2270/3239]	Time 0.228 (0.506)	Data Time 0.001 (0.018)	Loss 2.2635 (2.3571)	Entropy 0.53621 (0.53992)	Top-1 acc 71.875 (67.289)	Top-5 acc 84.766 (86.128)	lr 0.00054
Train [109][2280/3239]	Time 0.230 (0.506)	Data Time 0.001 (0.018)	Loss 2.4235 (2.3571)	Entropy 0.53599 (0.53990)	Top-1 acc 64.844 (67.289)	Top-5 acc 83.594 (86.126)	lr 0.00054
Train [109][2290/3239]	Time 0.237 (0.506)	Data Time 0.001 (0.018)	Loss 2.2285 (2.3571)	Entropy 0.53593 (0.53988)	Top-1 acc 72.656 (67.286)	Top-5 acc 87.109 (86.128)	lr 0.00054
Train [109][2300/3239]	Time 0.235 (0.505)	Data Time 0.001 (0.018)	Loss 2.1034 (2.3570)	Entropy 0.53564 (0.53987)	Top-1 acc 73.828 (67.290)	Top-5 acc 89.062 (86.129)	lr 0.00054
Train [109][2310/3239]	Time 0.236 (0.505)	Data Time 0.001 (0.018)	Loss 2.2321 (2.3570)	Entropy 0.53588 (0.53985)	Top-1 acc 70.703 (67.292)	Top-5 acc 89.453 (86.128)	lr 0.00054
Train [109][2320/3239]	Time 0.321 (0.505)	Data Time 0.001 (0.018)	Loss 2.4121 (2.3571)	Entropy 0.53562 (0.53983)	Top-1 acc 69.141 (67.294)	Top-5 acc 85.547 (86.127)	lr 0.00054
Train [109][2330/3239]	Time 0.233 (0.504)	Data Time 0.001 (0.018)	Loss 2.2554 (2.3569)	Entropy 0.53575 (0.53981)	Top-1 acc 69.531 (67.293)	Top-5 acc 88.281 (86.131)	lr 0.00054
Train [109][2340/3239]	Time 0.225 (0.504)	Data Time 0.001 (0.018)	Loss 2.4155 (2.3572)	Entropy 0.53576 (0.53979)	Top-1 acc 66.016 (67.282)	Top-5 acc 85.547 (86.125)	lr 0.00054
Train [109][2350/3239]	Time 0.233 (0.503)	Data Time 0.001 (0.018)	Loss 2.3728 (2.3572)	Entropy 0.53569 (0.53978)	Top-1 acc 65.625 (67.281)	Top-5 acc 86.719 (86.125)	lr 0.00054
Train [109][2360/3239]	Time 0.233 (0.503)	Data Time 0.001 (0.017)	Loss 2.6278 (2.3574)	Entropy 0.53563 (0.53976)	Top-1 acc 62.109 (67.274)	Top-5 acc 82.031 (86.123)	lr 0.00054
Train [109][2370/3239]	Time 0.228 (0.502)	Data Time 0.001 (0.017)	Loss 2.3555 (2.3573)	Entropy 0.53544 (0.53974)	Top-1 acc 63.672 (67.274)	Top-5 acc 87.109 (86.124)	lr 0.00054
Train [109][2380/3239]	Time 0.228 (0.502)	Data Time 0.001 (0.017)	Loss 2.4077 (2.3571)	Entropy 0.53562 (0.53972)	Top-1 acc 66.406 (67.281)	Top-5 acc 85.938 (86.127)	lr 0.00054
Train [109][2390/3239]	Time 0.222 (0.502)	Data Time 0.001 (0.017)	Loss 2.4438 (2.3570)	Entropy 0.53588 (0.53971)	Top-1 acc 67.578 (67.286)	Top-5 acc 84.375 (86.124)	lr 0.00054
Train [109][2400/3239]	Time 0.270 (0.501)	Data Time 0.001 (0.017)	Loss 2.2962 (2.3567)	Entropy 0.53609 (0.53969)	Top-1 acc 67.578 (67.294)	Top-5 acc 87.891 (86.130)	lr 0.00054
Train [109][2410/3239]	Time 0.248 (0.501)	Data Time 0.001 (0.017)	Loss 2.1982 (2.3564)	Entropy 0.53613 (0.53968)	Top-1 acc 69.141 (67.302)	Top-5 acc 89.844 (86.137)	lr 0.00054
Train [109][2420/3239]	Time 0.233 (0.500)	Data Time 0.001 (0.017)	Loss 2.3943 (2.3565)	Entropy 0.53584 (0.53966)	Top-1 acc 66.016 (67.302)	Top-5 acc 85.938 (86.138)	lr 0.00054
Train [109][2430/3239]	Time 0.231 (0.500)	Data Time 0.001 (0.017)	Loss 2.2721 (2.3564)	Entropy 0.53542 (0.53965)	Top-1 acc 68.750 (67.304)	Top-5 acc 85.547 (86.136)	lr 0.00054
Train [109][2440/3239]	Time 0.422 (0.522)	Data Time 0.004 (0.017)	Loss 2.4164 (2.3564)	Entropy 0.53526 (0.53963)	Top-1 acc 67.969 (67.306)	Top-5 acc 83.594 (86.134)	lr 0.00054
Train [109][2450/3239]	Time 0.229 (0.521)	Data Time 0.002 (0.017)	Loss 2.8796 (2.3566)	Entropy 0.53492 (0.53961)	Top-1 acc 50.781 (67.305)	Top-5 acc 78.125 (86.131)	lr 0.00054
Train [109][2460/3239]	Time 0.231 (0.521)	Data Time 0.001 (0.017)	Loss 2.4983 (2.3566)	Entropy 0.53480 (0.53959)	Top-1 acc 63.281 (67.305)	Top-5 acc 84.766 (86.131)	lr 0.00054
Train [109][2470/3239]	Time 0.236 (0.520)	Data Time 0.001 (0.017)	Loss 2.3380 (2.3563)	Entropy 0.53480 (0.53957)	Top-1 acc 69.531 (67.311)	Top-5 acc 85.938 (86.139)	lr 0.00054
Train [109][2480/3239]	Time 0.346 (0.520)	Data Time 0.001 (0.017)	Loss 2.4316 (2.3564)	Entropy 0.53473 (0.53955)	Top-1 acc 68.750 (67.313)	Top-5 acc 85.938 (86.137)	lr 0.00054
Train [109][2490/3239]	Time 0.240 (0.519)	Data Time 0.001 (0.017)	Loss 2.4160 (2.3569)	Entropy 0.53487 (0.53953)	Top-1 acc 65.234 (67.300)	Top-5 acc 85.938 (86.129)	lr 0.00054
Train [109][2500/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.017)	Loss 2.2686 (2.3570)	Entropy 0.53505 (0.53952)	Top-1 acc 66.406 (67.295)	Top-5 acc 86.328 (86.125)	lr 0.00054
Train [109][2510/3239]	Time 0.221 (0.519)	Data Time 0.001 (0.016)	Loss 2.4304 (2.3567)	Entropy 0.53505 (0.53950)	Top-1 acc 64.453 (67.300)	Top-5 acc 85.938 (86.131)	lr 0.00054
Train [109][2520/3239]	Time 0.219 (0.518)	Data Time 0.001 (0.016)	Loss 2.2105 (2.3565)	Entropy 0.53459 (0.53948)	Top-1 acc 70.703 (67.308)	Top-5 acc 89.453 (86.135)	lr 0.00054
Train [109][2530/3239]	Time 0.265 (0.518)	Data Time 0.002 (0.016)	Loss 2.2944 (2.3564)	Entropy 0.53431 (0.53946)	Top-1 acc 70.703 (67.317)	Top-5 acc 86.719 (86.139)	lr 0.00054
Train [109][2540/3239]	Time 0.235 (0.517)	Data Time 0.001 (0.016)	Loss 2.4260 (2.3562)	Entropy 0.53407 (0.53944)	Top-1 acc 65.234 (67.317)	Top-5 acc 85.938 (86.142)	lr 0.00054
Train [109][2550/3239]	Time 0.229 (0.517)	Data Time 0.001 (0.016)	Loss 2.4145 (2.3563)	Entropy 0.53411 (0.53942)	Top-1 acc 65.234 (67.315)	Top-5 acc 85.156 (86.140)	lr 0.00053
Train [109][2560/3239]	Time 0.237 (0.517)	Data Time 0.001 (0.016)	Loss 2.4406 (2.3560)	Entropy 0.53404 (0.53940)	Top-1 acc 62.891 (67.324)	Top-5 acc 85.156 (86.147)	lr 0.00053
Train [109][2570/3239]	Time 0.248 (0.516)	Data Time 0.001 (0.016)	Loss 2.3096 (2.3559)	Entropy 0.53341 (0.53938)	Top-1 acc 67.188 (67.327)	Top-5 acc 88.672 (86.145)	lr 0.00053
Train [109][2580/3239]	Time 0.253 (0.516)	Data Time 0.001 (0.016)	Loss 2.1669 (2.3557)	Entropy 0.53316 (0.53935)	Top-1 acc 69.141 (67.331)	Top-5 acc 91.016 (86.148)	lr 0.00053
Train [109][2590/3239]	Time 0.301 (0.516)	Data Time 0.002 (0.016)	Loss 2.3784 (2.3556)	Entropy 0.53316 (0.53933)	Top-1 acc 64.062 (67.332)	Top-5 acc 84.375 (86.148)	lr 0.00053
Train [109][2600/3239]	Time 0.235 (0.516)	Data Time 0.001 (0.016)	Loss 2.2980 (2.3556)	Entropy 0.53338 (0.53931)	Top-1 acc 66.797 (67.331)	Top-5 acc 86.328 (86.148)	lr 0.00053
Train [109][2610/3239]	Time 0.225 (0.516)	Data Time 0.001 (0.016)	Loss 2.6003 (2.3560)	Entropy 0.53339 (0.53928)	Top-1 acc 61.328 (67.324)	Top-5 acc 83.203 (86.140)	lr 0.00053
Train [109][2620/3239]	Time 0.227 (0.515)	Data Time 0.001 (0.016)	Loss 2.3182 (2.3559)	Entropy 0.53347 (0.53926)	Top-1 acc 67.188 (67.327)	Top-5 acc 85.938 (86.143)	lr 0.00053
Train [109][2630/3239]	Time 0.229 (0.515)	Data Time 0.001 (0.016)	Loss 2.3463 (2.3559)	Entropy 0.53367 (0.53924)	Top-1 acc 67.188 (67.321)	Top-5 acc 85.156 (86.144)	lr 0.00053
Train [109][2640/3239]	Time 0.399 (0.515)	Data Time 0.002 (0.016)	Loss 2.5159 (2.3560)	Entropy 0.53345 (0.53922)	Top-1 acc 62.500 (67.319)	Top-5 acc 83.594 (86.144)	lr 0.00053
Train [109][2650/3239]	Time 0.226 (0.514)	Data Time 0.001 (0.016)	Loss 2.2531 (2.3560)	Entropy 0.53325 (0.53919)	Top-1 acc 71.875 (67.318)	Top-5 acc 86.719 (86.146)	lr 0.00053
Train [109][2660/3239]	Time 0.256 (0.514)	Data Time 0.001 (0.016)	Loss 2.1756 (2.3559)	Entropy 0.53334 (0.53917)	Top-1 acc 67.969 (67.322)	Top-5 acc 90.234 (86.150)	lr 0.00053
Train [109][2670/3239]	Time 0.223 (0.514)	Data Time 0.001 (0.016)	Loss 2.1689 (2.3559)	Entropy 0.53332 (0.53915)	Top-1 acc 72.656 (67.327)	Top-5 acc 91.797 (86.152)	lr 0.00053
Train [109][2680/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.016)	Loss 2.2431 (2.3557)	Entropy 0.53350 (0.53913)	Top-1 acc 68.750 (67.332)	Top-5 acc 88.281 (86.156)	lr 0.00053
Train [109][2690/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.016)	Loss 2.4405 (2.3559)	Entropy 0.53358 (0.53911)	Top-1 acc 63.672 (67.328)	Top-5 acc 85.547 (86.153)	lr 0.00053
Train [109][2700/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.015)	Loss 2.3707 (2.3558)	Entropy 0.53365 (0.53909)	Top-1 acc 65.625 (67.327)	Top-5 acc 85.547 (86.154)	lr 0.00053
Train [109][2710/3239]	Time 0.328 (0.512)	Data Time 0.001 (0.015)	Loss 2.2367 (2.3558)	Entropy 0.53403 (0.53907)	Top-1 acc 69.531 (67.328)	Top-5 acc 89.844 (86.152)	lr 0.00053
Train [109][2720/3239]	Time 0.239 (0.512)	Data Time 0.001 (0.015)	Loss 2.7753 (2.3558)	Entropy 0.53413 (0.53905)	Top-1 acc 57.812 (67.326)	Top-5 acc 80.078 (86.153)	lr 0.00053
Train [109][2730/3239]	Time 0.232 (0.511)	Data Time 0.001 (0.015)	Loss 2.3093 (2.3557)	Entropy 0.53422 (0.53903)	Top-1 acc 68.750 (67.327)	Top-5 acc 85.156 (86.153)	lr 0.00053
Train [109][2740/3239]	Time 0.236 (0.511)	Data Time 0.001 (0.015)	Loss 2.5710 (2.3558)	Entropy 0.53420 (0.53901)	Top-1 acc 63.281 (67.328)	Top-5 acc 81.641 (86.153)	lr 0.00053
Train [109][2750/3239]	Time 0.222 (0.511)	Data Time 0.001 (0.015)	Loss 2.3812 (2.3556)	Entropy 0.53441 (0.53900)	Top-1 acc 67.969 (67.334)	Top-5 acc 84.375 (86.156)	lr 0.00053
Train [109][2760/3239]	Time 0.239 (0.510)	Data Time 0.001 (0.015)	Loss 2.2291 (2.3556)	Entropy 0.53437 (0.53898)	Top-1 acc 69.531 (67.336)	Top-5 acc 89.062 (86.155)	lr 0.00053
Train [109][2770/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.015)	Loss 2.2651 (2.3556)	Entropy 0.53441 (0.53896)	Top-1 acc 67.188 (67.339)	Top-5 acc 90.234 (86.155)	lr 0.00053
Train [109][2780/3239]	Time 0.229 (0.509)	Data Time 0.001 (0.015)	Loss 2.2691 (2.3557)	Entropy 0.53447 (0.53895)	Top-1 acc 69.531 (67.338)	Top-5 acc 87.500 (86.153)	lr 0.00053
Train [109][2790/3239]	Time 0.228 (0.509)	Data Time 0.001 (0.015)	Loss 2.4739 (2.3560)	Entropy 0.53440 (0.53893)	Top-1 acc 66.797 (67.333)	Top-5 acc 83.984 (86.147)	lr 0.00053
Train [109][2800/3239]	Time 0.338 (0.509)	Data Time 0.001 (0.015)	Loss 2.2540 (2.3560)	Entropy 0.53415 (0.53891)	Top-1 acc 66.406 (67.330)	Top-5 acc 89.062 (86.145)	lr 0.00053
Train [109][2810/3239]	Time 0.231 (0.508)	Data Time 0.001 (0.015)	Loss 2.3020 (2.3561)	Entropy 0.53421 (0.53890)	Top-1 acc 69.922 (67.331)	Top-5 acc 86.719 (86.144)	lr 0.00053
Train [109][2820/3239]	Time 0.233 (0.508)	Data Time 0.001 (0.015)	Loss 2.3664 (2.3560)	Entropy 0.53421 (0.53888)	Top-1 acc 65.625 (67.333)	Top-5 acc 86.328 (86.145)	lr 0.00053
Train [109][2830/3239]	Time 0.234 (0.508)	Data Time 0.001 (0.015)	Loss 2.3890 (2.3560)	Entropy 0.53448 (0.53886)	Top-1 acc 66.406 (67.334)	Top-5 acc 87.891 (86.145)	lr 0.00053
Train [109][2840/3239]	Time 0.259 (0.507)	Data Time 0.001 (0.015)	Loss 2.5209 (2.3561)	Entropy 0.53457 (0.53885)	Top-1 acc 63.281 (67.329)	Top-5 acc 85.156 (86.143)	lr 0.00053
Train [109][2850/3239]	Time 0.227 (0.507)	Data Time 0.001 (0.015)	Loss 2.4204 (2.3561)	Entropy 0.53477 (0.53883)	Top-1 acc 67.578 (67.331)	Top-5 acc 87.109 (86.145)	lr 0.00053
Train [109][2860/3239]	Time 0.231 (0.507)	Data Time 0.001 (0.015)	Loss 2.3511 (2.3561)	Entropy 0.53470 (0.53882)	Top-1 acc 66.406 (67.329)	Top-5 acc 86.328 (86.145)	lr 0.00053
Train [109][2870/3239]	Time 0.336 (0.506)	Data Time 0.001 (0.015)	Loss 2.2839 (2.3561)	Entropy 0.53459 (0.53881)	Top-1 acc 72.656 (67.331)	Top-5 acc 86.719 (86.147)	lr 0.00053
Train [109][2880/3239]	Time 0.223 (0.506)	Data Time 0.001 (0.015)	Loss 2.4007 (2.3561)	Entropy 0.53417 (0.53879)	Top-1 acc 66.016 (67.331)	Top-5 acc 83.594 (86.148)	lr 0.00053
Train [109][2890/3239]	Time 0.230 (0.506)	Data Time 0.001 (0.015)	Loss 2.4049 (2.3562)	Entropy 0.53429 (0.53878)	Top-1 acc 68.359 (67.325)	Top-5 acc 85.547 (86.145)	lr 0.00052
Train [109][2900/3239]	Time 0.290 (0.505)	Data Time 0.002 (0.015)	Loss 2.2392 (2.3563)	Entropy 0.53437 (0.53876)	Top-1 acc 71.094 (67.324)	Top-5 acc 86.719 (86.145)	lr 0.00052
Train [109][2910/3239]	Time 0.221 (0.505)	Data Time 0.001 (0.014)	Loss 2.4492 (2.3561)	Entropy 0.53431 (0.53874)	Top-1 acc 65.625 (67.331)	Top-5 acc 83.984 (86.151)	lr 0.00052
Train [109][2920/3239]	Time 0.259 (0.505)	Data Time 0.001 (0.014)	Loss 2.4001 (2.3559)	Entropy 0.53463 (0.53873)	Top-1 acc 69.922 (67.339)	Top-5 acc 83.984 (86.154)	lr 0.00052
Train [109][2930/3239]	Time 0.239 (0.504)	Data Time 0.001 (0.014)	Loss 2.3658 (2.3561)	Entropy 0.53462 (0.53872)	Top-1 acc 63.281 (67.331)	Top-5 acc 85.938 (86.152)	lr 0.00052
Train [109][2940/3239]	Time 0.227 (0.504)	Data Time 0.001 (0.014)	Loss 2.2887 (2.3559)	Entropy 0.53412 (0.53870)	Top-1 acc 72.266 (67.339)	Top-5 acc 86.328 (86.159)	lr 0.00052
Train [109][2950/3239]	Time 0.229 (0.504)	Data Time 0.001 (0.014)	Loss 2.3558 (2.3561)	Entropy 0.53440 (0.53869)	Top-1 acc 67.578 (67.331)	Top-5 acc 85.156 (86.155)	lr 0.00052
Train [109][2960/3239]	Time 0.328 (0.503)	Data Time 0.001 (0.014)	Loss 2.6001 (2.3561)	Entropy 0.53451 (0.53867)	Top-1 acc 62.109 (67.332)	Top-5 acc 82.031 (86.156)	lr 0.00052
Train [109][2970/3239]	Time 0.227 (0.503)	Data Time 0.001 (0.014)	Loss 2.3885 (2.3561)	Entropy 0.53453 (0.53866)	Top-1 acc 69.531 (67.333)	Top-5 acc 87.109 (86.155)	lr 0.00052
Train [109][2980/3239]	Time 0.234 (0.503)	Data Time 0.001 (0.014)	Loss 2.6959 (2.3564)	Entropy 0.53442 (0.53864)	Top-1 acc 61.328 (67.327)	Top-5 acc 82.812 (86.152)	lr 0.00052
Train [109][2990/3239]	Time 0.233 (0.503)	Data Time 0.001 (0.014)	Loss 2.4805 (2.3564)	Entropy 0.53431 (0.53863)	Top-1 acc 60.938 (67.329)	Top-5 acc 84.766 (86.152)	lr 0.00052
Train [109][3000/3239]	Time 0.227 (0.502)	Data Time 0.001 (0.014)	Loss 2.4669 (2.3565)	Entropy 0.53410 (0.53861)	Top-1 acc 66.406 (67.323)	Top-5 acc 84.766 (86.149)	lr 0.00052
Train [109][3010/3239]	Time 0.222 (0.502)	Data Time 0.001 (0.014)	Loss 2.3712 (2.3565)	Entropy 0.53368 (0.53860)	Top-1 acc 67.969 (67.323)	Top-5 acc 83.203 (86.148)	lr 0.00052
Train [109][3020/3239]	Time 0.241 (0.502)	Data Time 0.001 (0.014)	Loss 2.1520 (2.3564)	Entropy 0.53347 (0.53858)	Top-1 acc 75.000 (67.327)	Top-5 acc 90.234 (86.149)	lr 0.00052
Train [109][3030/3239]	Time 0.323 (0.501)	Data Time 0.001 (0.014)	Loss 2.3414 (2.3566)	Entropy 0.53290 (0.53856)	Top-1 acc 66.797 (67.322)	Top-5 acc 85.547 (86.146)	lr 0.00052
Train [109][3040/3239]	Time 0.231 (0.501)	Data Time 0.001 (0.014)	Loss 2.1683 (2.3564)	Entropy 0.53278 (0.53855)	Top-1 acc 67.188 (67.324)	Top-5 acc 89.453 (86.146)	lr 0.00052
Train [109][3050/3239]	Time 0.225 (0.501)	Data Time 0.001 (0.014)	Loss 2.3124 (2.3565)	Entropy 0.53232 (0.53853)	Top-1 acc 66.406 (67.323)	Top-5 acc 87.500 (86.143)	lr 0.00052
Train [109][3060/3239]	Time 0.228 (0.500)	Data Time 0.001 (0.014)	Loss 2.2691 (2.3565)	Entropy 0.53238 (0.53851)	Top-1 acc 67.969 (67.325)	Top-5 acc 88.281 (86.145)	lr 0.00052
Train [109][3070/3239]	Time 0.226 (0.500)	Data Time 0.001 (0.014)	Loss 2.2519 (2.3564)	Entropy 0.53247 (0.53849)	Top-1 acc 70.312 (67.329)	Top-5 acc 87.500 (86.144)	lr 0.00052
Train [109][3080/3239]	Time 0.238 (0.500)	Data Time 0.001 (0.014)	Loss 2.1721 (2.3566)	Entropy 0.53242 (0.53847)	Top-1 acc 69.531 (67.327)	Top-5 acc 90.625 (86.143)	lr 0.00052
Train [109][3090/3239]	Time 0.221 (0.500)	Data Time 0.001 (0.014)	Loss 2.4877 (2.3571)	Entropy 0.53250 (0.53845)	Top-1 acc 66.406 (67.317)	Top-5 acc 82.422 (86.134)	lr 0.00052
Train [109][3100/3239]	Time 0.285 (0.517)	Data Time 0.002 (0.014)	Loss 2.3471 (2.3570)	Entropy 0.53277 (0.53843)	Top-1 acc 66.016 (67.314)	Top-5 acc 85.547 (86.136)	lr 0.00052
Train [109][3110/3239]	Time 0.233 (0.517)	Data Time 0.002 (0.014)	Loss 2.4119 (2.3570)	Entropy 0.53294 (0.53841)	Top-1 acc 65.234 (67.314)	Top-5 acc 84.375 (86.134)	lr 0.00052
Train [109][3120/3239]	Time 0.327 (0.517)	Data Time 0.001 (0.014)	Loss 2.0662 (2.3567)	Entropy 0.53320 (0.53839)	Top-1 acc 74.219 (67.316)	Top-5 acc 89.844 (86.139)	lr 0.00052
Train [109][3130/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.014)	Loss 2.0787 (2.3567)	Entropy 0.53327 (0.53838)	Top-1 acc 75.391 (67.316)	Top-5 acc 91.406 (86.140)	lr 0.00052
Train [109][3140/3239]	Time 0.232 (0.516)	Data Time 0.001 (0.014)	Loss 2.3285 (2.3566)	Entropy 0.53343 (0.53836)	Top-1 acc 70.703 (67.320)	Top-5 acc 85.156 (86.140)	lr 0.00052
Train [109][3150/3239]	Time 0.258 (0.516)	Data Time 0.001 (0.014)	Loss 2.2455 (2.3564)	Entropy 0.53328 (0.53834)	Top-1 acc 69.922 (67.327)	Top-5 acc 88.281 (86.142)	lr 0.00052
Train [109][3160/3239]	Time 0.257 (0.515)	Data Time 0.001 (0.013)	Loss 2.3740 (2.3563)	Entropy 0.53293 (0.53833)	Top-1 acc 66.406 (67.324)	Top-5 acc 87.109 (86.145)	lr 0.00052
Train [109][3170/3239]	Time 0.236 (0.515)	Data Time 0.001 (0.013)	Loss 2.3811 (2.3563)	Entropy 0.53287 (0.53831)	Top-1 acc 65.234 (67.323)	Top-5 acc 84.375 (86.143)	lr 0.00052
Train [109][3180/3239]	Time 0.231 (0.515)	Data Time 0.000 (0.013)	Loss 2.1339 (2.3561)	Entropy 0.53309 (0.53829)	Top-1 acc 71.094 (67.328)	Top-5 acc 89.844 (86.146)	lr 0.00052
Train [109][3190/3239]	Time 0.326 (0.514)	Data Time 0.000 (0.013)	Loss 2.4108 (2.3561)	Entropy 0.53285 (0.53828)	Top-1 acc 67.188 (67.329)	Top-5 acc 84.375 (86.146)	lr 0.00052
Train [109][3200/3239]	Time 0.233 (0.514)	Data Time 0.000 (0.013)	Loss 2.4289 (2.3559)	Entropy 0.53269 (0.53826)	Top-1 acc 66.797 (67.337)	Top-5 acc 85.156 (86.149)	lr 0.00052
Train [109][3210/3239]	Time 0.231 (0.514)	Data Time 0.000 (0.013)	Loss 2.2135 (2.3557)	Entropy 0.53240 (0.53824)	Top-1 acc 70.703 (67.344)	Top-5 acc 87.891 (86.152)	lr 0.00052
Train [109][3220/3239]	Time 0.234 (0.513)	Data Time 0.000 (0.013)	Loss 2.2684 (2.3556)	Entropy 0.53243 (0.53822)	Top-1 acc 68.359 (67.345)	Top-5 acc 86.328 (86.153)	lr 0.00052
Train [109][3230/3239]	Time 0.226 (0.513)	Data Time 0.000 (0.013)	Loss 2.5330 (2.3555)	Entropy 0.53254 (0.53821)	Top-1 acc 62.891 (67.349)	Top-5 acc 83.594 (86.156)	lr 0.00052
Train [109][3239/3239]	Time 0.923 (0.513)	Data Time 0.000 (0.013)	Loss 2.7207 (2.3555)	Entropy 0.53274 (0.53819)	Top-1 acc 58.025 (67.351)	Top-5 acc 75.309 (86.156)	lr 0.00051
==========Valid [109/120]	loss 1.175	top-1 acc 72.923 (72.923)	top-5 acc 90.540	Train top-1 67.351	top-5 86.156	Entropy 0.53274	Latency-None: 0.000ms	Flops: 539.00M
Train [110][0/3239]	Time 36.809 (36.809)	Data Time 34.059 (34.059)	Loss 2.3250 (2.3250)	Entropy 0.53292 (0.53292)	Top-1 acc 70.312 (70.312)	Top-5 acc 88.281 (88.281)	lr 0.00051
Train [110][10/3239]	Time 0.232 (4.014)	Data Time 0.001 (3.225)	Loss 2.3349 (2.2340)	Entropy 0.53290 (0.53287)	Top-1 acc 68.750 (70.881)	Top-5 acc 86.328 (88.281)	lr 0.00051
Train [110][20/3239]	Time 0.396 (2.311)	Data Time 0.001 (1.690)	Loss 2.2745 (2.2840)	Entropy 0.53322 (0.53295)	Top-1 acc 72.266 (69.308)	Top-5 acc 85.547 (87.165)	lr 0.00051
Train [110][30/3239]	Time 0.229 (1.698)	Data Time 0.001 (1.145)	Loss 2.2836 (2.3064)	Entropy 0.53320 (0.53305)	Top-1 acc 69.141 (68.561)	Top-5 acc 85.547 (86.643)	lr 0.00051
Train [110][40/3239]	Time 0.227 (1.385)	Data Time 0.001 (0.866)	Loss 2.5495 (2.3215)	Entropy 0.53301 (0.53306)	Top-1 acc 62.891 (67.940)	Top-5 acc 83.984 (86.595)	lr 0.00051
Train [110][50/3239]	Time 0.226 (1.194)	Data Time 0.001 (0.697)	Loss 2.7890 (2.3296)	Entropy 0.53288 (0.53304)	Top-1 acc 60.547 (68.015)	Top-5 acc 76.562 (86.382)	lr 0.00051
Train [110][60/3239]	Time 0.238 (1.066)	Data Time 0.001 (0.583)	Loss 2.3666 (2.3311)	Entropy 0.53300 (0.53302)	Top-1 acc 66.016 (67.937)	Top-5 acc 85.156 (86.418)	lr 0.00051
Train [110][70/3239]	Time 0.228 (0.974)	Data Time 0.001 (0.501)	Loss 2.3588 (2.3302)	Entropy 0.53308 (0.53302)	Top-1 acc 63.672 (68.013)	Top-5 acc 85.547 (86.422)	lr 0.00051
Train [110][80/3239]	Time 0.227 (0.904)	Data Time 0.001 (0.439)	Loss 2.3485 (2.3299)	Entropy 0.53305 (0.53302)	Top-1 acc 68.359 (67.959)	Top-5 acc 85.156 (86.420)	lr 0.00051
Train [110][90/3239]	Time 0.315 (0.850)	Data Time 0.001 (0.391)	Loss 2.4887 (2.3289)	Entropy 0.53275 (0.53301)	Top-1 acc 64.844 (67.943)	Top-5 acc 80.859 (86.448)	lr 0.00051
Train [110][100/3239]	Time 0.228 (0.806)	Data Time 0.001 (0.353)	Loss 2.3120 (2.3301)	Entropy 0.53277 (0.53299)	Top-1 acc 69.922 (67.918)	Top-5 acc 87.109 (86.467)	lr 0.00051
Train [110][110/3239]	Time 0.259 (0.770)	Data Time 0.001 (0.321)	Loss 2.2812 (2.3265)	Entropy 0.53293 (0.53298)	Top-1 acc 67.578 (67.979)	Top-5 acc 86.328 (86.458)	lr 0.00051
Train [110][120/3239]	Time 0.230 (0.740)	Data Time 0.001 (0.294)	Loss 2.4200 (2.3260)	Entropy 0.53276 (0.53297)	Top-1 acc 66.797 (67.966)	Top-5 acc 86.719 (86.519)	lr 0.00051
Train [110][130/3239]	Time 0.227 (0.714)	Data Time 0.001 (0.272)	Loss 2.2859 (2.3280)	Entropy 0.53293 (0.53296)	Top-1 acc 67.578 (67.981)	Top-5 acc 86.328 (86.453)	lr 0.00051
Train [110][140/3239]	Time 0.220 (0.693)	Data Time 0.001 (0.253)	Loss 2.2625 (2.3358)	Entropy 0.53292 (0.53296)	Top-1 acc 68.359 (67.761)	Top-5 acc 87.109 (86.325)	lr 0.00051
Train [110][150/3239]	Time 0.236 (0.675)	Data Time 0.001 (0.236)	Loss 2.5098 (2.3413)	Entropy 0.53302 (0.53296)	Top-1 acc 62.891 (67.674)	Top-5 acc 86.328 (86.289)	lr 0.00051
Train [110][160/3239]	Time 0.291 (0.660)	Data Time 0.030 (0.222)	Loss 2.3822 (2.3419)	Entropy 0.53245 (0.53296)	Top-1 acc 67.578 (67.707)	Top-5 acc 85.938 (86.289)	lr 0.00051
Train [110][170/3239]	Time 0.250 (0.647)	Data Time 0.001 (0.209)	Loss 2.1133 (2.3440)	Entropy 0.53282 (0.53293)	Top-1 acc 72.266 (67.644)	Top-5 acc 89.844 (86.273)	lr 0.00051
Train [110][180/3239]	Time 0.317 (0.635)	Data Time 0.001 (0.198)	Loss 2.5593 (2.3479)	Entropy 0.53244 (0.53292)	Top-1 acc 61.719 (67.537)	Top-5 acc 82.031 (86.227)	lr 0.00051
Train [110][190/3239]	Time 0.233 (0.624)	Data Time 0.001 (0.187)	Loss 2.2017 (2.3501)	Entropy 0.53283 (0.53290)	Top-1 acc 71.875 (67.498)	Top-5 acc 88.281 (86.191)	lr 0.00051
Train [110][200/3239]	Time 0.226 (0.612)	Data Time 0.001 (0.178)	Loss 2.2961 (2.3475)	Entropy 0.53317 (0.53291)	Top-1 acc 69.531 (67.559)	Top-5 acc 86.719 (86.256)	lr 0.00051
Train [110][210/3239]	Time 0.234 (0.603)	Data Time 0.001 (0.170)	Loss 2.3362 (2.3471)	Entropy 0.53331 (0.53292)	Top-1 acc 67.578 (67.543)	Top-5 acc 85.547 (86.269)	lr 0.00051
Train [110][220/3239]	Time 0.229 (0.594)	Data Time 0.001 (0.162)	Loss 2.4418 (2.3461)	Entropy 0.53361 (0.53294)	Top-1 acc 65.625 (67.552)	Top-5 acc 83.984 (86.305)	lr 0.00051
Train [110][230/3239]	Time 0.280 (0.587)	Data Time 0.001 (0.155)	Loss 2.4468 (2.3443)	Entropy 0.53396 (0.53297)	Top-1 acc 61.719 (67.544)	Top-5 acc 84.766 (86.332)	lr 0.00051
Train [110][240/3239]	Time 0.230 (0.580)	Data Time 0.001 (0.149)	Loss 2.2559 (2.3459)	Entropy 0.53384 (0.53301)	Top-1 acc 69.141 (67.481)	Top-5 acc 86.328 (86.301)	lr 0.00051
Train [110][250/3239]	Time 0.331 (0.574)	Data Time 0.001 (0.143)	Loss 2.4919 (2.3460)	Entropy 0.53399 (0.53305)	Top-1 acc 63.672 (67.458)	Top-5 acc 85.547 (86.333)	lr 0.00051
Train [110][260/3239]	Time 0.231 (0.567)	Data Time 0.001 (0.137)	Loss 2.5789 (2.3477)	Entropy 0.53372 (0.53307)	Top-1 acc 62.891 (67.419)	Top-5 acc 82.422 (86.316)	lr 0.00051
Train [110][270/3239]	Time 0.273 (0.563)	Data Time 0.001 (0.132)	Loss 2.5833 (2.3521)	Entropy 0.53349 (0.53309)	Top-1 acc 62.109 (67.316)	Top-5 acc 83.203 (86.266)	lr 0.00051
Train [110][280/3239]	Time 0.234 (0.559)	Data Time 0.001 (0.128)	Loss 2.2725 (2.3518)	Entropy 0.53372 (0.53311)	Top-1 acc 68.750 (67.288)	Top-5 acc 85.938 (86.273)	lr 0.00051
Train [110][290/3239]	Time 0.229 (0.553)	Data Time 0.001 (0.123)	Loss 2.6506 (2.3514)	Entropy 0.53386 (0.53314)	Top-1 acc 63.281 (67.307)	Top-5 acc 80.469 (86.277)	lr 0.00051
Train [110][300/3239]	Time 0.225 (0.548)	Data Time 0.001 (0.119)	Loss 2.3152 (2.3501)	Entropy 0.53390 (0.53316)	Top-1 acc 69.531 (67.346)	Top-5 acc 85.156 (86.255)	lr 0.00051
Train [110][310/3239]	Time 0.228 (0.544)	Data Time 0.001 (0.116)	Loss 2.4932 (2.3497)	Entropy 0.53393 (0.53318)	Top-1 acc 62.109 (67.370)	Top-5 acc 83.984 (86.234)	lr 0.00051
Train [110][320/3239]	Time 0.227 (0.539)	Data Time 0.001 (0.112)	Loss 2.1641 (2.3510)	Entropy 0.53422 (0.53321)	Top-1 acc 72.266 (67.331)	Top-5 acc 89.844 (86.223)	lr 0.00051
Train [110][330/3239]	Time 0.304 (0.536)	Data Time 0.001 (0.109)	Loss 2.4579 (2.3517)	Entropy 0.53411 (0.53325)	Top-1 acc 68.750 (67.313)	Top-5 acc 83.203 (86.215)	lr 0.00051
Train [110][340/3239]	Time 0.380 (0.534)	Data Time 0.001 (0.106)	Loss 2.2760 (2.3518)	Entropy 0.53382 (0.53327)	Top-1 acc 71.875 (67.348)	Top-5 acc 85.938 (86.212)	lr 0.00051
Train [110][350/3239]	Time 0.222 (0.531)	Data Time 0.001 (0.103)	Loss 2.3575 (2.3503)	Entropy 0.53360 (0.53329)	Top-1 acc 67.188 (67.392)	Top-5 acc 85.938 (86.234)	lr 0.00050
Train [110][360/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.100)	Loss 2.3980 (2.3520)	Entropy 0.53383 (0.53330)	Top-1 acc 69.922 (67.374)	Top-5 acc 85.156 (86.215)	lr 0.00050
Train [110][370/3239]	Time 0.283 (0.524)	Data Time 0.001 (0.097)	Loss 2.2633 (2.3503)	Entropy 0.53356 (0.53331)	Top-1 acc 71.875 (67.410)	Top-5 acc 86.719 (86.243)	lr 0.00050
Train [110][380/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.095)	Loss 2.1596 (2.3491)	Entropy 0.53361 (0.53332)	Top-1 acc 73.438 (67.436)	Top-5 acc 88.281 (86.258)	lr 0.00050
Train [110][390/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.092)	Loss 2.5337 (2.3499)	Entropy 0.53340 (0.53333)	Top-1 acc 64.453 (67.419)	Top-5 acc 82.422 (86.230)	lr 0.00050
Train [110][400/3239]	Time 0.231 (0.515)	Data Time 0.001 (0.090)	Loss 2.3396 (2.3491)	Entropy 0.53335 (0.53333)	Top-1 acc 69.922 (67.473)	Top-5 acc 85.938 (86.241)	lr 0.00050
Train [110][410/3239]	Time 0.321 (0.513)	Data Time 0.001 (0.088)	Loss 2.4199 (2.3493)	Entropy 0.53358 (0.53333)	Top-1 acc 65.625 (67.468)	Top-5 acc 83.203 (86.225)	lr 0.00050
Train [110][420/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.086)	Loss 2.3945 (2.3492)	Entropy 0.53364 (0.53334)	Top-1 acc 67.969 (67.470)	Top-5 acc 84.375 (86.226)	lr 0.00050
Train [110][430/3239]	Time 0.243 (0.507)	Data Time 0.001 (0.084)	Loss 2.2694 (2.3491)	Entropy 0.53378 (0.53335)	Top-1 acc 71.094 (67.468)	Top-5 acc 85.547 (86.225)	lr 0.00050
Train [110][440/3239]	Time 0.233 (0.506)	Data Time 0.001 (0.082)	Loss 2.1386 (2.3485)	Entropy 0.53376 (0.53336)	Top-1 acc 73.438 (67.476)	Top-5 acc 91.016 (86.246)	lr 0.00050
Train [110][450/3239]	Time 0.241 (0.504)	Data Time 0.001 (0.080)	Loss 2.1978 (2.3477)	Entropy 0.53323 (0.53336)	Top-1 acc 73.047 (67.494)	Top-5 acc 90.625 (86.269)	lr 0.00050
Train [110][460/3239]	Time 0.234 (0.502)	Data Time 0.001 (0.078)	Loss 2.2299 (2.3472)	Entropy 0.53343 (0.53336)	Top-1 acc 68.750 (67.514)	Top-5 acc 90.234 (86.275)	lr 0.00050
Train [110][470/3239]	Time 0.247 (0.500)	Data Time 0.001 (0.077)	Loss 2.3930 (2.3457)	Entropy 0.53352 (0.53336)	Top-1 acc 65.234 (67.545)	Top-5 acc 87.109 (86.286)	lr 0.00050
Train [110][480/3239]	Time 0.274 (0.499)	Data Time 0.001 (0.075)	Loss 2.7460 (2.3462)	Entropy 0.53336 (0.53336)	Top-1 acc 57.422 (67.529)	Top-5 acc 80.078 (86.282)	lr 0.00050
Train [110][490/3239]	Time 0.247 (0.497)	Data Time 0.001 (0.074)	Loss 2.4569 (2.3464)	Entropy 0.53343 (0.53337)	Top-1 acc 62.500 (67.511)	Top-5 acc 85.156 (86.298)	lr 0.00050
Train [110][500/3239]	Time 0.236 (0.496)	Data Time 0.001 (0.072)	Loss 2.5118 (2.3459)	Entropy 0.53362 (0.53337)	Top-1 acc 62.109 (67.508)	Top-5 acc 82.422 (86.295)	lr 0.00050
Train [110][510/3239]	Time 0.318 (0.595)	Data Time 0.006 (0.071)	Loss 2.3438 (2.3478)	Entropy 0.53385 (0.53337)	Top-1 acc 66.797 (67.457)	Top-5 acc 87.109 (86.265)	lr 0.00050
Train [110][520/3239]	Time 0.244 (0.593)	Data Time 0.002 (0.070)	Loss 2.4813 (2.3482)	Entropy 0.53381 (0.53338)	Top-1 acc 63.672 (67.445)	Top-5 acc 85.547 (86.260)	lr 0.00050
Train [110][530/3239]	Time 0.240 (0.590)	Data Time 0.002 (0.068)	Loss 2.1981 (2.3466)	Entropy 0.53362 (0.53339)	Top-1 acc 70.312 (67.489)	Top-5 acc 88.672 (86.280)	lr 0.00050
Train [110][540/3239]	Time 0.244 (0.587)	Data Time 0.002 (0.067)	Loss 2.3760 (2.3475)	Entropy 0.53373 (0.53339)	Top-1 acc 67.578 (67.479)	Top-5 acc 84.766 (86.264)	lr 0.00050
Train [110][550/3239]	Time 0.240 (0.585)	Data Time 0.001 (0.066)	Loss 2.3142 (2.3477)	Entropy 0.53370 (0.53340)	Top-1 acc 67.969 (67.470)	Top-5 acc 86.719 (86.276)	lr 0.00050
Train [110][560/3239]	Time 0.291 (0.583)	Data Time 0.002 (0.065)	Loss 2.2989 (2.3471)	Entropy 0.53334 (0.53340)	Top-1 acc 69.531 (67.482)	Top-5 acc 85.156 (86.291)	lr 0.00050
Train [110][570/3239]	Time 0.339 (0.580)	Data Time 0.001 (0.064)	Loss 2.2950 (2.3468)	Entropy 0.53354 (0.53340)	Top-1 acc 67.578 (67.473)	Top-5 acc 86.328 (86.309)	lr 0.00050
Train [110][580/3239]	Time 0.250 (0.578)	Data Time 0.001 (0.063)	Loss 2.3627 (2.3462)	Entropy 0.53373 (0.53341)	Top-1 acc 67.969 (67.505)	Top-5 acc 86.328 (86.323)	lr 0.00050
Train [110][590/3239]	Time 0.237 (0.575)	Data Time 0.002 (0.062)	Loss 2.2219 (2.3462)	Entropy 0.53412 (0.53341)	Top-1 acc 67.578 (67.518)	Top-5 acc 86.328 (86.318)	lr 0.00050
Train [110][600/3239]	Time 0.241 (0.573)	Data Time 0.001 (0.061)	Loss 2.3786 (2.3456)	Entropy 0.53404 (0.53342)	Top-1 acc 67.188 (67.540)	Top-5 acc 83.984 (86.327)	lr 0.00050
Train [110][610/3239]	Time 0.240 (0.570)	Data Time 0.002 (0.060)	Loss 2.3267 (2.3455)	Entropy 0.53438 (0.53344)	Top-1 acc 69.141 (67.552)	Top-5 acc 85.156 (86.324)	lr 0.00050
Train [110][620/3239]	Time 0.279 (0.568)	Data Time 0.002 (0.059)	Loss 2.6108 (2.3477)	Entropy 0.53434 (0.53345)	Top-1 acc 63.281 (67.502)	Top-5 acc 80.859 (86.283)	lr 0.00050
Train [110][630/3239]	Time 0.236 (0.566)	Data Time 0.001 (0.058)	Loss 2.3732 (2.3481)	Entropy 0.53437 (0.53347)	Top-1 acc 66.797 (67.493)	Top-5 acc 88.281 (86.267)	lr 0.00050
Train [110][640/3239]	Time 0.239 (0.564)	Data Time 0.001 (0.057)	Loss 2.2340 (2.3484)	Entropy 0.53469 (0.53348)	Top-1 acc 68.750 (67.477)	Top-5 acc 88.672 (86.270)	lr 0.00050
Train [110][650/3239]	Time 0.264 (0.562)	Data Time 0.001 (0.056)	Loss 2.3395 (2.3478)	Entropy 0.53495 (0.53350)	Top-1 acc 65.234 (67.486)	Top-5 acc 83.984 (86.274)	lr 0.00050
Train [110][660/3239]	Time 0.252 (0.559)	Data Time 0.001 (0.055)	Loss 2.3654 (2.3474)	Entropy 0.53514 (0.53353)	Top-1 acc 64.844 (67.498)	Top-5 acc 87.109 (86.284)	lr 0.00050
Train [110][670/3239]	Time 0.241 (0.557)	Data Time 0.001 (0.055)	Loss 2.2896 (2.3465)	Entropy 0.53493 (0.53355)	Top-1 acc 69.141 (67.525)	Top-5 acc 89.453 (86.300)	lr 0.00050
Train [110][680/3239]	Time 0.246 (0.555)	Data Time 0.001 (0.054)	Loss 2.2695 (2.3469)	Entropy 0.53471 (0.53357)	Top-1 acc 69.922 (67.516)	Top-5 acc 86.719 (86.289)	lr 0.00050
Train [110][690/3239]	Time 0.234 (0.554)	Data Time 0.004 (0.053)	Loss 2.3703 (2.3471)	Entropy 0.53476 (0.53358)	Top-1 acc 66.406 (67.519)	Top-5 acc 83.203 (86.277)	lr 0.00050
Train [110][700/3239]	Time 0.231 (0.551)	Data Time 0.001 (0.052)	Loss 2.2998 (2.3478)	Entropy 0.53476 (0.53360)	Top-1 acc 66.797 (67.506)	Top-5 acc 87.891 (86.265)	lr 0.00049
Train [110][710/3239]	Time 0.250 (0.550)	Data Time 0.001 (0.052)	Loss 2.2419 (2.3478)	Entropy 0.53495 (0.53362)	Top-1 acc 69.531 (67.512)	Top-5 acc 86.328 (86.274)	lr 0.00049
Train [110][720/3239]	Time 0.233 (0.548)	Data Time 0.001 (0.051)	Loss 2.5830 (2.3486)	Entropy 0.53436 (0.53364)	Top-1 acc 62.500 (67.500)	Top-5 acc 84.375 (86.261)	lr 0.00049
Train [110][730/3239]	Time 0.349 (0.547)	Data Time 0.001 (0.050)	Loss 2.2047 (2.3481)	Entropy 0.53409 (0.53365)	Top-1 acc 71.094 (67.507)	Top-5 acc 87.500 (86.263)	lr 0.00049
Train [110][740/3239]	Time 0.240 (0.545)	Data Time 0.001 (0.050)	Loss 2.2685 (2.3476)	Entropy 0.53438 (0.53365)	Top-1 acc 72.266 (67.525)	Top-5 acc 87.109 (86.271)	lr 0.00049
Train [110][750/3239]	Time 0.238 (0.543)	Data Time 0.001 (0.049)	Loss 2.2749 (2.3474)	Entropy 0.53452 (0.53367)	Top-1 acc 68.750 (67.525)	Top-5 acc 85.938 (86.275)	lr 0.00049
Train [110][760/3239]	Time 0.367 (0.543)	Data Time 0.002 (0.048)	Loss 2.2855 (2.3481)	Entropy 0.53453 (0.53368)	Top-1 acc 66.406 (67.506)	Top-5 acc 87.500 (86.265)	lr 0.00049
Train [110][770/3239]	Time 0.298 (0.545)	Data Time 0.002 (0.048)	Loss 2.2481 (2.3479)	Entropy 0.53477 (0.53369)	Top-1 acc 69.922 (67.505)	Top-5 acc 85.547 (86.262)	lr 0.00049
Train [110][780/3239]	Time 0.245 (0.543)	Data Time 0.001 (0.047)	Loss 2.5845 (2.3479)	Entropy 0.53494 (0.53370)	Top-1 acc 64.453 (67.503)	Top-5 acc 80.859 (86.265)	lr 0.00049
Train [110][790/3239]	Time 0.239 (0.542)	Data Time 0.001 (0.047)	Loss 2.4409 (2.3496)	Entropy 0.53511 (0.53372)	Top-1 acc 64.062 (67.470)	Top-5 acc 86.719 (86.243)	lr 0.00049
Train [110][800/3239]	Time 0.359 (0.540)	Data Time 0.001 (0.046)	Loss 2.2203 (2.3496)	Entropy 0.53471 (0.53374)	Top-1 acc 70.312 (67.470)	Top-5 acc 88.281 (86.245)	lr 0.00049
Train [110][810/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.045)	Loss 2.2377 (2.3486)	Entropy 0.53479 (0.53375)	Top-1 acc 72.656 (67.493)	Top-5 acc 88.281 (86.259)	lr 0.00049
Train [110][820/3239]	Time 0.231 (0.537)	Data Time 0.001 (0.045)	Loss 2.3614 (2.3485)	Entropy 0.53479 (0.53376)	Top-1 acc 67.578 (67.496)	Top-5 acc 87.500 (86.265)	lr 0.00049
Train [110][830/3239]	Time 0.237 (0.536)	Data Time 0.001 (0.044)	Loss 2.2130 (2.3484)	Entropy 0.53456 (0.53377)	Top-1 acc 71.484 (67.499)	Top-5 acc 86.719 (86.261)	lr 0.00049
Train [110][840/3239]	Time 0.223 (0.534)	Data Time 0.001 (0.044)	Loss 2.2489 (2.3478)	Entropy 0.53453 (0.53378)	Top-1 acc 69.141 (67.517)	Top-5 acc 87.891 (86.262)	lr 0.00049
Train [110][850/3239]	Time 0.231 (0.533)	Data Time 0.001 (0.043)	Loss 2.3561 (2.3480)	Entropy 0.53449 (0.53379)	Top-1 acc 69.531 (67.518)	Top-5 acc 85.938 (86.257)	lr 0.00049
Train [110][860/3239]	Time 0.225 (0.532)	Data Time 0.001 (0.043)	Loss 2.3840 (2.3485)	Entropy 0.53481 (0.53380)	Top-1 acc 66.406 (67.509)	Top-5 acc 83.203 (86.237)	lr 0.00049
Train [110][870/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.042)	Loss 2.4166 (2.3482)	Entropy 0.53474 (0.53381)	Top-1 acc 66.016 (67.525)	Top-5 acc 84.375 (86.246)	lr 0.00049
Train [110][880/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.042)	Loss 2.4801 (2.3476)	Entropy 0.53476 (0.53382)	Top-1 acc 63.672 (67.539)	Top-5 acc 82.812 (86.259)	lr 0.00049
Train [110][890/3239]	Time 0.318 (0.528)	Data Time 0.001 (0.042)	Loss 2.4732 (2.3473)	Entropy 0.53441 (0.53383)	Top-1 acc 64.844 (67.536)	Top-5 acc 85.156 (86.270)	lr 0.00049
Train [110][900/3239]	Time 0.230 (0.527)	Data Time 0.001 (0.041)	Loss 2.5023 (2.3486)	Entropy 0.53432 (0.53383)	Top-1 acc 61.328 (67.506)	Top-5 acc 84.375 (86.244)	lr 0.00049
Train [110][910/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.041)	Loss 2.2592 (2.3481)	Entropy 0.53443 (0.53384)	Top-1 acc 71.094 (67.523)	Top-5 acc 87.891 (86.256)	lr 0.00049
Train [110][920/3239]	Time 0.229 (0.524)	Data Time 0.002 (0.040)	Loss 2.4304 (2.3478)	Entropy 0.53481 (0.53385)	Top-1 acc 65.625 (67.526)	Top-5 acc 85.156 (86.256)	lr 0.00049
Train [110][930/3239]	Time 0.225 (0.523)	Data Time 0.001 (0.040)	Loss 2.0664 (2.3471)	Entropy 0.53497 (0.53386)	Top-1 acc 73.438 (67.542)	Top-5 acc 93.359 (86.274)	lr 0.00049
Train [110][940/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.039)	Loss 2.1701 (2.3466)	Entropy 0.53472 (0.53387)	Top-1 acc 71.094 (67.560)	Top-5 acc 90.234 (86.287)	lr 0.00049
Train [110][950/3239]	Time 0.250 (0.521)	Data Time 0.002 (0.039)	Loss 2.4378 (2.3468)	Entropy 0.53464 (0.53388)	Top-1 acc 65.234 (67.553)	Top-5 acc 86.719 (86.288)	lr 0.00049
Train [110][960/3239]	Time 0.382 (0.520)	Data Time 0.001 (0.039)	Loss 2.4295 (2.3468)	Entropy 0.53474 (0.53389)	Top-1 acc 66.797 (67.554)	Top-5 acc 86.328 (86.291)	lr 0.00049
Train [110][970/3239]	Time 0.235 (0.519)	Data Time 0.001 (0.038)	Loss 2.4639 (2.3463)	Entropy 0.53463 (0.53390)	Top-1 acc 61.328 (67.562)	Top-5 acc 83.203 (86.300)	lr 0.00049
Train [110][980/3239]	Time 0.258 (0.518)	Data Time 0.001 (0.038)	Loss 2.1957 (2.3466)	Entropy 0.53477 (0.53390)	Top-1 acc 69.922 (67.557)	Top-5 acc 89.844 (86.301)	lr 0.00049
Train [110][990/3239]	Time 0.232 (0.517)	Data Time 0.001 (0.038)	Loss 2.3794 (2.3460)	Entropy 0.53437 (0.53391)	Top-1 acc 67.578 (67.567)	Top-5 acc 85.547 (86.310)	lr 0.00049
Train [110][1000/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.037)	Loss 2.3912 (2.3456)	Entropy 0.53415 (0.53392)	Top-1 acc 62.500 (67.575)	Top-5 acc 84.375 (86.318)	lr 0.00049
Train [110][1010/3239]	Time 0.243 (0.515)	Data Time 0.001 (0.037)	Loss 2.3572 (2.3456)	Entropy 0.53423 (0.53392)	Top-1 acc 67.578 (67.569)	Top-5 acc 85.547 (86.317)	lr 0.00049
Train [110][1020/3239]	Time 0.237 (0.514)	Data Time 0.001 (0.036)	Loss 2.4102 (2.3457)	Entropy 0.53437 (0.53392)	Top-1 acc 66.016 (67.565)	Top-5 acc 84.375 (86.313)	lr 0.00049
Train [110][1030/3239]	Time 0.279 (0.513)	Data Time 0.002 (0.036)	Loss 2.3853 (2.3447)	Entropy 0.53426 (0.53393)	Top-1 acc 64.844 (67.591)	Top-5 acc 82.422 (86.320)	lr 0.00049
Train [110][1040/3239]	Time 0.218 (0.512)	Data Time 0.001 (0.036)	Loss 2.8419 (2.3456)	Entropy 0.53420 (0.53393)	Top-1 acc 56.641 (67.574)	Top-5 acc 77.344 (86.306)	lr 0.00049
Train [110][1050/3239]	Time 0.256 (0.512)	Data Time 0.001 (0.035)	Loss 2.3589 (2.3453)	Entropy 0.53411 (0.53393)	Top-1 acc 68.359 (67.587)	Top-5 acc 84.375 (86.309)	lr 0.00049
Train [110][1060/3239]	Time 0.228 (0.511)	Data Time 0.001 (0.035)	Loss 2.4682 (2.3453)	Entropy 0.53359 (0.53393)	Top-1 acc 66.797 (67.592)	Top-5 acc 83.984 (86.306)	lr 0.00048
Train [110][1070/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.035)	Loss 2.1687 (2.3452)	Entropy 0.53355 (0.53393)	Top-1 acc 72.266 (67.596)	Top-5 acc 88.672 (86.311)	lr 0.00048
Train [110][1080/3239]	Time 0.244 (0.509)	Data Time 0.001 (0.035)	Loss 2.3683 (2.3452)	Entropy 0.53341 (0.53392)	Top-1 acc 66.406 (67.598)	Top-5 acc 84.375 (86.306)	lr 0.00048
Train [110][1090/3239]	Time 0.223 (0.508)	Data Time 0.001 (0.034)	Loss 2.4208 (2.3453)	Entropy 0.53317 (0.53392)	Top-1 acc 65.234 (67.592)	Top-5 acc 83.594 (86.300)	lr 0.00048
Train [110][1100/3239]	Time 0.250 (0.507)	Data Time 0.001 (0.034)	Loss 2.1361 (2.3453)	Entropy 0.53335 (0.53391)	Top-1 acc 74.219 (67.587)	Top-5 acc 89.453 (86.304)	lr 0.00048
Train [110][1110/3239]	Time 0.243 (0.506)	Data Time 0.001 (0.034)	Loss 2.1039 (2.3454)	Entropy 0.53397 (0.53391)	Top-1 acc 76.172 (67.590)	Top-5 acc 90.234 (86.302)	lr 0.00048
Train [110][1120/3239]	Time 0.325 (0.506)	Data Time 0.001 (0.033)	Loss 2.4467 (2.3456)	Entropy 0.53380 (0.53391)	Top-1 acc 64.453 (67.580)	Top-5 acc 85.156 (86.306)	lr 0.00048
Train [110][1130/3239]	Time 0.229 (0.505)	Data Time 0.001 (0.033)	Loss 2.5511 (2.3465)	Entropy 0.53378 (0.53391)	Top-1 acc 65.234 (67.561)	Top-5 acc 83.203 (86.289)	lr 0.00048
Train [110][1140/3239]	Time 0.223 (0.504)	Data Time 0.001 (0.033)	Loss 2.2991 (2.3468)	Entropy 0.53352 (0.53391)	Top-1 acc 66.406 (67.547)	Top-5 acc 85.938 (86.283)	lr 0.00048
Train [110][1150/3239]	Time 0.237 (0.503)	Data Time 0.001 (0.033)	Loss 2.0931 (2.3465)	Entropy 0.53388 (0.53391)	Top-1 acc 72.266 (67.548)	Top-5 acc 92.188 (86.290)	lr 0.00048
Train [110][1160/3239]	Time 0.239 (0.502)	Data Time 0.001 (0.032)	Loss 2.3831 (2.3467)	Entropy 0.53402 (0.53391)	Top-1 acc 66.797 (67.545)	Top-5 acc 87.891 (86.288)	lr 0.00048
Train [110][1170/3239]	Time 0.324 (0.547)	Data Time 0.030 (0.032)	Loss 2.3699 (2.3474)	Entropy 0.53415 (0.53391)	Top-1 acc 68.750 (67.535)	Top-5 acc 85.547 (86.278)	lr 0.00048
Train [110][1180/3239]	Time 0.239 (0.546)	Data Time 0.002 (0.032)	Loss 2.4038 (2.3471)	Entropy 0.53418 (0.53391)	Top-1 acc 64.453 (67.538)	Top-5 acc 85.156 (86.283)	lr 0.00048
Train [110][1190/3239]	Time 0.233 (0.544)	Data Time 0.001 (0.032)	Loss 2.5176 (2.3471)	Entropy 0.53413 (0.53391)	Top-1 acc 64.062 (67.534)	Top-5 acc 82.812 (86.282)	lr 0.00048
Train [110][1200/3239]	Time 0.251 (0.543)	Data Time 0.002 (0.031)	Loss 2.2105 (2.3474)	Entropy 0.53410 (0.53391)	Top-1 acc 73.047 (67.536)	Top-5 acc 87.891 (86.283)	lr 0.00048
Train [110][1210/3239]	Time 0.225 (0.542)	Data Time 0.001 (0.031)	Loss 2.3626 (2.3479)	Entropy 0.53381 (0.53391)	Top-1 acc 66.406 (67.526)	Top-5 acc 85.938 (86.270)	lr 0.00048
Train [110][1220/3239]	Time 0.227 (0.541)	Data Time 0.001 (0.031)	Loss 2.4424 (2.3475)	Entropy 0.53357 (0.53391)	Top-1 acc 65.234 (67.537)	Top-5 acc 85.156 (86.278)	lr 0.00048
Train [110][1230/3239]	Time 0.232 (0.540)	Data Time 0.001 (0.031)	Loss 2.3920 (2.3473)	Entropy 0.53382 (0.53391)	Top-1 acc 66.797 (67.543)	Top-5 acc 85.547 (86.280)	lr 0.00048
Train [110][1240/3239]	Time 0.234 (0.539)	Data Time 0.001 (0.030)	Loss 2.3320 (2.3471)	Entropy 0.53382 (0.53391)	Top-1 acc 66.016 (67.538)	Top-5 acc 86.328 (86.284)	lr 0.00048
Train [110][1250/3239]	Time 0.230 (0.538)	Data Time 0.001 (0.030)	Loss 2.2915 (2.3471)	Entropy 0.53390 (0.53391)	Top-1 acc 69.922 (67.549)	Top-5 acc 86.719 (86.283)	lr 0.00048
Train [110][1260/3239]	Time 0.284 (0.537)	Data Time 0.001 (0.030)	Loss 2.1276 (2.3479)	Entropy 0.53439 (0.53391)	Top-1 acc 74.219 (67.529)	Top-5 acc 89.844 (86.268)	lr 0.00048
Train [110][1270/3239]	Time 0.240 (0.537)	Data Time 0.001 (0.030)	Loss 2.3882 (2.3480)	Entropy 0.53463 (0.53392)	Top-1 acc 69.531 (67.536)	Top-5 acc 85.547 (86.264)	lr 0.00048
Train [110][1280/3239]	Time 0.370 (0.536)	Data Time 0.001 (0.029)	Loss 2.2105 (2.3481)	Entropy 0.53446 (0.53392)	Top-1 acc 68.750 (67.524)	Top-5 acc 87.109 (86.261)	lr 0.00048
Train [110][1290/3239]	Time 0.242 (0.535)	Data Time 0.002 (0.029)	Loss 2.5287 (2.3486)	Entropy 0.53437 (0.53393)	Top-1 acc 62.891 (67.506)	Top-5 acc 82.031 (86.256)	lr 0.00048
Train [110][1300/3239]	Time 0.242 (0.534)	Data Time 0.001 (0.029)	Loss 2.3331 (2.3484)	Entropy 0.53460 (0.53393)	Top-1 acc 67.969 (67.509)	Top-5 acc 87.891 (86.259)	lr 0.00048
Train [110][1310/3239]	Time 0.243 (0.533)	Data Time 0.001 (0.029)	Loss 2.3630 (2.3483)	Entropy 0.53466 (0.53394)	Top-1 acc 66.016 (67.507)	Top-5 acc 87.500 (86.261)	lr 0.00048
Train [110][1320/3239]	Time 0.268 (0.533)	Data Time 0.002 (0.029)	Loss 2.3771 (2.3481)	Entropy 0.53434 (0.53394)	Top-1 acc 65.234 (67.512)	Top-5 acc 86.328 (86.264)	lr 0.00048
Train [110][1330/3239]	Time 0.255 (0.532)	Data Time 0.001 (0.028)	Loss 2.4911 (2.3484)	Entropy 0.53440 (0.53394)	Top-1 acc 64.844 (67.504)	Top-5 acc 82.422 (86.261)	lr 0.00048
Train [110][1340/3239]	Time 0.261 (0.532)	Data Time 0.002 (0.028)	Loss 2.3727 (2.3490)	Entropy 0.53420 (0.53395)	Top-1 acc 67.188 (67.483)	Top-5 acc 85.156 (86.254)	lr 0.00048
Train [110][1350/3239]	Time 0.338 (0.531)	Data Time 0.001 (0.028)	Loss 2.4386 (2.3494)	Entropy 0.53370 (0.53395)	Top-1 acc 62.109 (67.474)	Top-5 acc 85.156 (86.244)	lr 0.00048
Train [110][1360/3239]	Time 0.279 (0.530)	Data Time 0.001 (0.028)	Loss 2.3787 (2.3499)	Entropy 0.53381 (0.53395)	Top-1 acc 67.969 (67.464)	Top-5 acc 85.547 (86.235)	lr 0.00048
Train [110][1370/3239]	Time 0.245 (0.529)	Data Time 0.001 (0.028)	Loss 2.3922 (2.3500)	Entropy 0.53393 (0.53395)	Top-1 acc 66.406 (67.458)	Top-5 acc 85.547 (86.234)	lr 0.00048
Train [110][1380/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.027)	Loss 2.2153 (2.3500)	Entropy 0.53391 (0.53394)	Top-1 acc 71.875 (67.455)	Top-5 acc 87.500 (86.237)	lr 0.00048
Train [110][1390/3239]	Time 0.225 (0.528)	Data Time 0.001 (0.027)	Loss 2.3103 (2.3498)	Entropy 0.53382 (0.53394)	Top-1 acc 68.359 (67.466)	Top-5 acc 88.281 (86.236)	lr 0.00048
Train [110][1400/3239]	Time 0.265 (0.527)	Data Time 0.003 (0.027)	Loss 2.2951 (2.3503)	Entropy 0.53359 (0.53394)	Top-1 acc 68.750 (67.459)	Top-5 acc 84.375 (86.221)	lr 0.00048
Train [110][1410/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.027)	Loss 2.6311 (2.3501)	Entropy 0.53371 (0.53394)	Top-1 acc 60.547 (67.460)	Top-5 acc 81.250 (86.227)	lr 0.00048
Train [110][1420/3239]	Time 0.282 (0.526)	Data Time 0.002 (0.027)	Loss 2.2280 (2.3499)	Entropy 0.53385 (0.53394)	Top-1 acc 69.922 (67.463)	Top-5 acc 87.891 (86.229)	lr 0.00047
Train [110][1430/3239]	Time 0.243 (0.525)	Data Time 0.002 (0.027)	Loss 2.2528 (2.3498)	Entropy 0.53385 (0.53394)	Top-1 acc 72.266 (67.468)	Top-5 acc 88.672 (86.230)	lr 0.00047
Train [110][1440/3239]	Time 0.346 (0.524)	Data Time 0.001 (0.026)	Loss 2.5037 (2.3499)	Entropy 0.53327 (0.53394)	Top-1 acc 62.891 (67.468)	Top-5 acc 84.766 (86.227)	lr 0.00047
Train [110][1450/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.026)	Loss 2.3228 (2.3500)	Entropy 0.53325 (0.53393)	Top-1 acc 66.406 (67.462)	Top-5 acc 85.938 (86.229)	lr 0.00047
Train [110][1460/3239]	Time 0.244 (0.523)	Data Time 0.001 (0.026)	Loss 2.3312 (2.3499)	Entropy 0.53308 (0.53393)	Top-1 acc 69.531 (67.466)	Top-5 acc 85.156 (86.227)	lr 0.00047
Train [110][1470/3239]	Time 0.242 (0.522)	Data Time 0.001 (0.026)	Loss 2.2865 (2.3500)	Entropy 0.53296 (0.53392)	Top-1 acc 69.922 (67.465)	Top-5 acc 85.938 (86.227)	lr 0.00047
Train [110][1480/3239]	Time 0.238 (0.522)	Data Time 0.001 (0.026)	Loss 2.1707 (2.3500)	Entropy 0.53270 (0.53391)	Top-1 acc 73.828 (67.473)	Top-5 acc 89.453 (86.224)	lr 0.00047
Train [110][1490/3239]	Time 0.274 (0.521)	Data Time 0.002 (0.026)	Loss 2.2310 (2.3500)	Entropy 0.53271 (0.53391)	Top-1 acc 71.094 (67.474)	Top-5 acc 89.062 (86.228)	lr 0.00047
Train [110][1500/3239]	Time 0.220 (0.520)	Data Time 0.001 (0.025)	Loss 2.4592 (2.3503)	Entropy 0.53278 (0.53390)	Top-1 acc 65.625 (67.464)	Top-5 acc 85.156 (86.227)	lr 0.00047
Train [110][1510/3239]	Time 0.364 (0.520)	Data Time 0.001 (0.025)	Loss 2.4095 (2.3501)	Entropy 0.53288 (0.53389)	Top-1 acc 66.406 (67.466)	Top-5 acc 83.594 (86.228)	lr 0.00047
Train [110][1520/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.025)	Loss 2.2267 (2.3500)	Entropy 0.53246 (0.53388)	Top-1 acc 69.531 (67.471)	Top-5 acc 89.844 (86.229)	lr 0.00047
Train [110][1530/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.025)	Loss 2.3741 (2.3500)	Entropy 0.53244 (0.53387)	Top-1 acc 67.578 (67.466)	Top-5 acc 87.500 (86.232)	lr 0.00047
Train [110][1540/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.025)	Loss 2.2867 (2.3496)	Entropy 0.53264 (0.53387)	Top-1 acc 69.922 (67.484)	Top-5 acc 85.156 (86.238)	lr 0.00047
Train [110][1550/3239]	Time 0.233 (0.517)	Data Time 0.001 (0.025)	Loss 2.3895 (2.3496)	Entropy 0.53261 (0.53386)	Top-1 acc 67.578 (67.492)	Top-5 acc 84.766 (86.237)	lr 0.00047
Train [110][1560/3239]	Time 0.264 (0.516)	Data Time 0.001 (0.024)	Loss 2.3728 (2.3491)	Entropy 0.53293 (0.53385)	Top-1 acc 65.625 (67.502)	Top-5 acc 85.938 (86.246)	lr 0.00047
Train [110][1570/3239]	Time 0.238 (0.516)	Data Time 0.001 (0.024)	Loss 2.1781 (2.3492)	Entropy 0.53295 (0.53384)	Top-1 acc 69.922 (67.492)	Top-5 acc 89.062 (86.243)	lr 0.00047
Train [110][1580/3239]	Time 0.267 (0.515)	Data Time 0.001 (0.024)	Loss 2.3221 (2.3495)	Entropy 0.53332 (0.53384)	Top-1 acc 66.016 (67.482)	Top-5 acc 85.938 (86.232)	lr 0.00047
Train [110][1590/3239]	Time 0.329 (0.515)	Data Time 0.002 (0.024)	Loss 2.5992 (2.3499)	Entropy 0.53298 (0.53384)	Top-1 acc 65.234 (67.476)	Top-5 acc 82.031 (86.224)	lr 0.00047
Train [110][1600/3239]	Time 0.257 (0.515)	Data Time 0.001 (0.024)	Loss 2.4534 (2.3500)	Entropy 0.53311 (0.53383)	Top-1 acc 64.062 (67.468)	Top-5 acc 83.984 (86.221)	lr 0.00047
Train [110][1610/3239]	Time 0.235 (0.514)	Data Time 0.001 (0.024)	Loss 2.4133 (2.3497)	Entropy 0.53300 (0.53383)	Top-1 acc 66.016 (67.478)	Top-5 acc 87.109 (86.221)	lr 0.00047
Train [110][1620/3239]	Time 0.233 (0.513)	Data Time 0.001 (0.024)	Loss 2.3487 (2.3493)	Entropy 0.53323 (0.53382)	Top-1 acc 68.750 (67.486)	Top-5 acc 83.594 (86.221)	lr 0.00047
Train [110][1630/3239]	Time 0.248 (0.513)	Data Time 0.001 (0.023)	Loss 2.1022 (2.3494)	Entropy 0.53304 (0.53382)	Top-1 acc 74.219 (67.485)	Top-5 acc 89.844 (86.224)	lr 0.00047
Train [110][1640/3239]	Time 0.237 (0.512)	Data Time 0.001 (0.023)	Loss 2.3069 (2.3495)	Entropy 0.53293 (0.53381)	Top-1 acc 71.875 (67.479)	Top-5 acc 85.156 (86.222)	lr 0.00047
Train [110][1650/3239]	Time 0.237 (0.512)	Data Time 0.001 (0.023)	Loss 2.5521 (2.3499)	Entropy 0.53303 (0.53381)	Top-1 acc 62.500 (67.468)	Top-5 acc 82.422 (86.212)	lr 0.00047
Train [110][1660/3239]	Time 0.271 (0.511)	Data Time 0.001 (0.023)	Loss 2.3707 (2.3499)	Entropy 0.53311 (0.53380)	Top-1 acc 67.578 (67.463)	Top-5 acc 84.375 (86.213)	lr 0.00047
Train [110][1670/3239]	Time 0.348 (0.511)	Data Time 0.001 (0.023)	Loss 2.4507 (2.3500)	Entropy 0.53320 (0.53380)	Top-1 acc 65.625 (67.460)	Top-5 acc 85.938 (86.211)	lr 0.00047
Train [110][1680/3239]	Time 0.269 (0.510)	Data Time 0.001 (0.023)	Loss 2.3357 (2.3500)	Entropy 0.53276 (0.53379)	Top-1 acc 69.531 (67.461)	Top-5 acc 86.328 (86.208)	lr 0.00047
Train [110][1690/3239]	Time 0.266 (0.510)	Data Time 0.001 (0.023)	Loss 2.3709 (2.3498)	Entropy 0.53272 (0.53379)	Top-1 acc 66.797 (67.465)	Top-5 acc 85.938 (86.211)	lr 0.00047
Train [110][1700/3239]	Time 0.233 (0.509)	Data Time 0.001 (0.023)	Loss 2.2772 (2.3500)	Entropy 0.53256 (0.53378)	Top-1 acc 63.672 (67.454)	Top-5 acc 86.719 (86.205)	lr 0.00047
Train [110][1710/3239]	Time 0.235 (0.509)	Data Time 0.001 (0.022)	Loss 2.2917 (2.3500)	Entropy 0.53285 (0.53378)	Top-1 acc 69.922 (67.457)	Top-5 acc 85.547 (86.203)	lr 0.00047
Train [110][1720/3239]	Time 0.232 (0.508)	Data Time 0.001 (0.022)	Loss 2.6857 (2.3500)	Entropy 0.53300 (0.53377)	Top-1 acc 58.984 (67.452)	Top-5 acc 81.250 (86.204)	lr 0.00047
Train [110][1730/3239]	Time 0.222 (0.507)	Data Time 0.001 (0.022)	Loss 2.3418 (2.3499)	Entropy 0.53312 (0.53377)	Top-1 acc 66.797 (67.457)	Top-5 acc 86.719 (86.203)	lr 0.00047
Train [110][1740/3239]	Time 0.343 (0.507)	Data Time 0.001 (0.022)	Loss 2.3758 (2.3504)	Entropy 0.53283 (0.53376)	Top-1 acc 67.188 (67.449)	Top-5 acc 87.500 (86.195)	lr 0.00047
Train [110][1750/3239]	Time 0.283 (0.507)	Data Time 0.002 (0.022)	Loss 2.5944 (2.3503)	Entropy 0.53297 (0.53376)	Top-1 acc 60.156 (67.456)	Top-5 acc 81.250 (86.197)	lr 0.00047
Train [110][1760/3239]	Time 0.232 (0.506)	Data Time 0.001 (0.022)	Loss 2.3608 (2.3504)	Entropy 0.53265 (0.53375)	Top-1 acc 67.969 (67.457)	Top-5 acc 86.328 (86.193)	lr 0.00047
Train [110][1770/3239]	Time 0.225 (0.506)	Data Time 0.001 (0.022)	Loss 2.2068 (2.3498)	Entropy 0.53288 (0.53374)	Top-1 acc 72.656 (67.473)	Top-5 acc 86.719 (86.202)	lr 0.00047
Train [110][1780/3239]	Time 0.234 (0.505)	Data Time 0.001 (0.022)	Loss 2.1689 (2.3498)	Entropy 0.53286 (0.53374)	Top-1 acc 71.094 (67.471)	Top-5 acc 89.453 (86.202)	lr 0.00046
Train [110][1790/3239]	Time 0.233 (0.505)	Data Time 0.001 (0.022)	Loss 2.2810 (2.3494)	Entropy 0.53295 (0.53374)	Top-1 acc 67.969 (67.484)	Top-5 acc 85.547 (86.209)	lr 0.00046
Train [110][1800/3239]	Time 0.235 (0.505)	Data Time 0.001 (0.021)	Loss 2.2402 (2.3495)	Entropy 0.53306 (0.53373)	Top-1 acc 70.312 (67.484)	Top-5 acc 87.891 (86.210)	lr 0.00046
Train [110][1810/3239]	Time 0.271 (0.504)	Data Time 0.001 (0.021)	Loss 2.5103 (2.3498)	Entropy 0.53288 (0.53373)	Top-1 acc 62.500 (67.477)	Top-5 acc 83.203 (86.209)	lr 0.00046
Train [110][1820/3239]	Time 0.450 (0.532)	Data Time 0.006 (0.021)	Loss 2.3697 (2.3497)	Entropy 0.53308 (0.53372)	Top-1 acc 67.188 (67.479)	Top-5 acc 84.766 (86.211)	lr 0.00046
Train [110][1830/3239]	Time 0.376 (0.532)	Data Time 0.002 (0.021)	Loss 2.2708 (2.3494)	Entropy 0.53285 (0.53372)	Top-1 acc 67.578 (67.485)	Top-5 acc 87.500 (86.216)	lr 0.00046
Train [110][1840/3239]	Time 0.278 (0.531)	Data Time 0.004 (0.021)	Loss 2.4873 (2.3492)	Entropy 0.53285 (0.53371)	Top-1 acc 64.844 (67.487)	Top-5 acc 82.422 (86.216)	lr 0.00046
Train [110][1850/3239]	Time 0.275 (0.531)	Data Time 0.003 (0.021)	Loss 2.4549 (2.3496)	Entropy 0.53270 (0.53371)	Top-1 acc 64.062 (67.475)	Top-5 acc 85.938 (86.212)	lr 0.00046
Train [110][1860/3239]	Time 0.274 (0.530)	Data Time 0.002 (0.021)	Loss 2.5763 (2.3501)	Entropy 0.53262 (0.53370)	Top-1 acc 59.766 (67.463)	Top-5 acc 82.031 (86.205)	lr 0.00046
Train [110][1870/3239]	Time 0.237 (0.530)	Data Time 0.001 (0.021)	Loss 2.2635 (2.3500)	Entropy 0.53317 (0.53370)	Top-1 acc 67.578 (67.466)	Top-5 acc 85.938 (86.201)	lr 0.00046
Train [110][1880/3239]	Time 0.251 (0.529)	Data Time 0.001 (0.021)	Loss 2.2949 (2.3499)	Entropy 0.53338 (0.53370)	Top-1 acc 71.484 (67.467)	Top-5 acc 86.719 (86.200)	lr 0.00046
Train [110][1890/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.021)	Loss 2.4645 (2.3496)	Entropy 0.53341 (0.53370)	Top-1 acc 66.016 (67.474)	Top-5 acc 82.031 (86.202)	lr 0.00046
Train [110][1900/3239]	Time 0.362 (0.528)	Data Time 0.001 (0.020)	Loss 2.3161 (2.3495)	Entropy 0.53292 (0.53369)	Top-1 acc 69.922 (67.479)	Top-5 acc 87.891 (86.203)	lr 0.00046
Train [110][1910/3239]	Time 0.250 (0.528)	Data Time 0.002 (0.020)	Loss 2.4488 (2.3496)	Entropy 0.53304 (0.53369)	Top-1 acc 65.234 (67.484)	Top-5 acc 83.594 (86.203)	lr 0.00046
Train [110][1920/3239]	Time 0.245 (0.527)	Data Time 0.001 (0.020)	Loss 2.2882 (2.3493)	Entropy 0.53312 (0.53369)	Top-1 acc 70.703 (67.488)	Top-5 acc 85.547 (86.207)	lr 0.00046
Train [110][1930/3239]	Time 0.238 (0.527)	Data Time 0.001 (0.020)	Loss 2.2281 (2.3493)	Entropy 0.53297 (0.53368)	Top-1 acc 71.875 (67.484)	Top-5 acc 89.844 (86.210)	lr 0.00046
Train [110][1940/3239]	Time 0.238 (0.526)	Data Time 0.001 (0.020)	Loss 2.4224 (2.3494)	Entropy 0.53317 (0.53368)	Top-1 acc 67.188 (67.481)	Top-5 acc 83.203 (86.207)	lr 0.00046
Train [110][1950/3239]	Time 0.239 (0.526)	Data Time 0.001 (0.020)	Loss 2.3248 (2.3493)	Entropy 0.53296 (0.53368)	Top-1 acc 69.922 (67.485)	Top-5 acc 87.500 (86.214)	lr 0.00046
Train [110][1960/3239]	Time 0.235 (0.525)	Data Time 0.001 (0.020)	Loss 2.4484 (2.3493)	Entropy 0.53297 (0.53367)	Top-1 acc 63.672 (67.488)	Top-5 acc 87.109 (86.217)	lr 0.00046
Train [110][1970/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.020)	Loss 2.3339 (2.3493)	Entropy 0.53289 (0.53367)	Top-1 acc 67.188 (67.490)	Top-5 acc 87.109 (86.215)	lr 0.00046
Train [110][1980/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.020)	Loss 2.3673 (2.3494)	Entropy 0.53292 (0.53367)	Top-1 acc 65.234 (67.486)	Top-5 acc 85.547 (86.209)	lr 0.00046
Train [110][1990/3239]	Time 0.366 (0.524)	Data Time 0.003 (0.020)	Loss 2.3283 (2.3495)	Entropy 0.53285 (0.53366)	Top-1 acc 68.750 (67.486)	Top-5 acc 85.547 (86.207)	lr 0.00046
Train [110][2000/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.019)	Loss 2.1321 (2.3495)	Entropy 0.53273 (0.53366)	Top-1 acc 72.656 (67.481)	Top-5 acc 90.625 (86.210)	lr 0.00046
Train [110][2010/3239]	Time 0.218 (0.523)	Data Time 0.001 (0.019)	Loss 2.5824 (2.3496)	Entropy 0.53279 (0.53365)	Top-1 acc 60.938 (67.479)	Top-5 acc 82.422 (86.212)	lr 0.00046
Train [110][2020/3239]	Time 0.266 (0.522)	Data Time 0.003 (0.019)	Loss 2.4687 (2.3498)	Entropy 0.53235 (0.53365)	Top-1 acc 65.625 (67.475)	Top-5 acc 85.938 (86.208)	lr 0.00046
Train [110][2030/3239]	Time 0.236 (0.522)	Data Time 0.001 (0.019)	Loss 2.2966 (2.3498)	Entropy 0.53201 (0.53364)	Top-1 acc 72.656 (67.483)	Top-5 acc 85.938 (86.205)	lr 0.00046
Train [110][2040/3239]	Time 0.251 (0.522)	Data Time 0.001 (0.019)	Loss 2.2575 (2.3499)	Entropy 0.53207 (0.53363)	Top-1 acc 69.531 (67.480)	Top-5 acc 88.281 (86.206)	lr 0.00046
Train [110][2050/3239]	Time 0.250 (0.521)	Data Time 0.001 (0.019)	Loss 2.4677 (2.3500)	Entropy 0.53173 (0.53362)	Top-1 acc 62.891 (67.475)	Top-5 acc 83.984 (86.200)	lr 0.00046
Train [110][2060/3239]	Time 0.373 (0.521)	Data Time 0.001 (0.019)	Loss 2.5308 (2.3502)	Entropy 0.53179 (0.53362)	Top-1 acc 65.234 (67.477)	Top-5 acc 83.203 (86.196)	lr 0.00046
Train [110][2070/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.019)	Loss 2.2061 (2.3501)	Entropy 0.53171 (0.53361)	Top-1 acc 69.141 (67.477)	Top-5 acc 86.328 (86.197)	lr 0.00046
Train [110][2080/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.019)	Loss 2.4257 (2.3502)	Entropy 0.53138 (0.53360)	Top-1 acc 66.406 (67.473)	Top-5 acc 82.422 (86.189)	lr 0.00046
Train [110][2090/3239]	Time 0.232 (0.519)	Data Time 0.001 (0.019)	Loss 2.4012 (2.3504)	Entropy 0.53131 (0.53359)	Top-1 acc 68.359 (67.474)	Top-5 acc 85.547 (86.190)	lr 0.00046
Train [110][2100/3239]	Time 0.236 (0.519)	Data Time 0.001 (0.019)	Loss 2.4476 (2.3507)	Entropy 0.53128 (0.53357)	Top-1 acc 64.844 (67.470)	Top-5 acc 83.594 (86.182)	lr 0.00046
Train [110][2110/3239]	Time 0.261 (0.518)	Data Time 0.001 (0.019)	Loss 2.4096 (2.3507)	Entropy 0.53125 (0.53356)	Top-1 acc 62.891 (67.473)	Top-5 acc 85.547 (86.184)	lr 0.00046
Train [110][2120/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.018)	Loss 2.5305 (2.3506)	Entropy 0.53132 (0.53355)	Top-1 acc 63.672 (67.475)	Top-5 acc 83.594 (86.186)	lr 0.00046
Train [110][2130/3239]	Time 0.238 (0.518)	Data Time 0.001 (0.018)	Loss 2.2764 (2.3506)	Entropy 0.53124 (0.53354)	Top-1 acc 70.312 (67.473)	Top-5 acc 86.719 (86.186)	lr 0.00046
Train [110][2140/3239]	Time 0.238 (0.517)	Data Time 0.001 (0.018)	Loss 2.3552 (2.3506)	Entropy 0.53092 (0.53353)	Top-1 acc 69.922 (67.473)	Top-5 acc 85.938 (86.189)	lr 0.00046
Train [110][2150/3239]	Time 0.317 (0.517)	Data Time 0.001 (0.018)	Loss 2.1473 (2.3505)	Entropy 0.53085 (0.53352)	Top-1 acc 76.172 (67.477)	Top-5 acc 90.234 (86.190)	lr 0.00045
Train [110][2160/3239]	Time 0.232 (0.516)	Data Time 0.001 (0.018)	Loss 2.2236 (2.3506)	Entropy 0.53049 (0.53351)	Top-1 acc 70.703 (67.479)	Top-5 acc 89.453 (86.190)	lr 0.00045
Train [110][2170/3239]	Time 0.304 (0.516)	Data Time 0.002 (0.018)	Loss 2.2946 (2.3507)	Entropy 0.53049 (0.53349)	Top-1 acc 67.969 (67.476)	Top-5 acc 88.281 (86.192)	lr 0.00045
Train [110][2180/3239]	Time 0.256 (0.516)	Data Time 0.001 (0.018)	Loss 2.6057 (2.3510)	Entropy 0.53052 (0.53348)	Top-1 acc 63.281 (67.472)	Top-5 acc 82.031 (86.185)	lr 0.00045
Train [110][2190/3239]	Time 0.235 (0.515)	Data Time 0.001 (0.018)	Loss 2.3906 (2.3512)	Entropy 0.53058 (0.53347)	Top-1 acc 66.016 (67.465)	Top-5 acc 87.500 (86.180)	lr 0.00045
Train [110][2200/3239]	Time 0.231 (0.515)	Data Time 0.001 (0.018)	Loss 2.1296 (2.3514)	Entropy 0.53049 (0.53345)	Top-1 acc 73.047 (67.459)	Top-5 acc 90.625 (86.178)	lr 0.00045
Train [110][2210/3239]	Time 0.232 (0.514)	Data Time 0.001 (0.018)	Loss 2.4899 (2.3514)	Entropy 0.53045 (0.53344)	Top-1 acc 62.891 (67.456)	Top-5 acc 83.984 (86.178)	lr 0.00045
Train [110][2220/3239]	Time 0.331 (0.514)	Data Time 0.001 (0.018)	Loss 2.5487 (2.3517)	Entropy 0.53036 (0.53342)	Top-1 acc 64.453 (67.446)	Top-5 acc 81.250 (86.174)	lr 0.00045
Train [110][2230/3239]	Time 0.225 (0.513)	Data Time 0.001 (0.018)	Loss 2.3594 (2.3519)	Entropy 0.53045 (0.53341)	Top-1 acc 68.750 (67.443)	Top-5 acc 85.938 (86.173)	lr 0.00045
Train [110][2240/3239]	Time 0.244 (0.513)	Data Time 0.001 (0.018)	Loss 2.2027 (2.3518)	Entropy 0.53067 (0.53340)	Top-1 acc 69.141 (67.444)	Top-5 acc 86.719 (86.171)	lr 0.00045
Train [110][2250/3239]	Time 0.230 (0.512)	Data Time 0.002 (0.017)	Loss 2.3766 (2.3519)	Entropy 0.53075 (0.53339)	Top-1 acc 70.312 (67.442)	Top-5 acc 86.719 (86.170)	lr 0.00045
Train [110][2260/3239]	Time 0.228 (0.512)	Data Time 0.001 (0.017)	Loss 2.5080 (2.3520)	Entropy 0.53071 (0.53338)	Top-1 acc 61.719 (67.442)	Top-5 acc 85.156 (86.169)	lr 0.00045
Train [110][2270/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.017)	Loss 2.2373 (2.3521)	Entropy 0.53077 (0.53336)	Top-1 acc 68.750 (67.438)	Top-5 acc 89.062 (86.168)	lr 0.00045
Train [110][2280/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.017)	Loss 2.4666 (2.3521)	Entropy 0.53049 (0.53335)	Top-1 acc 64.453 (67.434)	Top-5 acc 84.766 (86.169)	lr 0.00045
Train [110][2290/3239]	Time 0.334 (0.511)	Data Time 0.001 (0.017)	Loss 2.2734 (2.3518)	Entropy 0.53057 (0.53334)	Top-1 acc 69.922 (67.445)	Top-5 acc 87.500 (86.172)	lr 0.00045
Train [110][2300/3239]	Time 0.241 (0.510)	Data Time 0.001 (0.017)	Loss 2.0527 (2.3517)	Entropy 0.53055 (0.53333)	Top-1 acc 75.391 (67.449)	Top-5 acc 91.016 (86.176)	lr 0.00045
Train [110][2310/3239]	Time 0.235 (0.510)	Data Time 0.001 (0.017)	Loss 2.2778 (2.3516)	Entropy 0.53058 (0.53332)	Top-1 acc 73.047 (67.455)	Top-5 acc 87.891 (86.176)	lr 0.00045
Train [110][2320/3239]	Time 0.248 (0.509)	Data Time 0.001 (0.017)	Loss 2.4617 (2.3517)	Entropy 0.53046 (0.53330)	Top-1 acc 62.109 (67.454)	Top-5 acc 84.375 (86.175)	lr 0.00045
Train [110][2330/3239]	Time 0.235 (0.509)	Data Time 0.001 (0.017)	Loss 2.4353 (2.3516)	Entropy 0.53025 (0.53329)	Top-1 acc 64.062 (67.457)	Top-5 acc 88.281 (86.179)	lr 0.00045
Train [110][2340/3239]	Time 0.260 (0.509)	Data Time 0.001 (0.017)	Loss 2.1861 (2.3513)	Entropy 0.53041 (0.53328)	Top-1 acc 68.359 (67.461)	Top-5 acc 89.453 (86.185)	lr 0.00045
Train [110][2350/3239]	Time 0.252 (0.508)	Data Time 0.001 (0.017)	Loss 2.2931 (2.3516)	Entropy 0.53033 (0.53327)	Top-1 acc 67.188 (67.456)	Top-5 acc 87.891 (86.181)	lr 0.00045
Train [110][2360/3239]	Time 0.249 (0.508)	Data Time 0.001 (0.017)	Loss 2.2130 (2.3513)	Entropy 0.53055 (0.53325)	Top-1 acc 71.484 (67.463)	Top-5 acc 89.844 (86.187)	lr 0.00045
Train [110][2370/3239]	Time 0.231 (0.507)	Data Time 0.001 (0.017)	Loss 2.3167 (2.3515)	Entropy 0.53029 (0.53324)	Top-1 acc 65.234 (67.457)	Top-5 acc 84.766 (86.183)	lr 0.00045
Train [110][2380/3239]	Time 0.325 (0.507)	Data Time 0.001 (0.017)	Loss 2.1342 (2.3514)	Entropy 0.53036 (0.53323)	Top-1 acc 70.703 (67.457)	Top-5 acc 90.625 (86.186)	lr 0.00045
Train [110][2390/3239]	Time 0.255 (0.507)	Data Time 0.001 (0.017)	Loss 2.3397 (2.3515)	Entropy 0.53036 (0.53322)	Top-1 acc 69.531 (67.458)	Top-5 acc 86.719 (86.187)	lr 0.00045
Train [110][2400/3239]	Time 0.244 (0.506)	Data Time 0.002 (0.016)	Loss 2.3052 (2.3513)	Entropy 0.53023 (0.53321)	Top-1 acc 64.844 (67.461)	Top-5 acc 88.672 (86.191)	lr 0.00045
Train [110][2410/3239]	Time 0.237 (0.506)	Data Time 0.001 (0.016)	Loss 2.2051 (2.3514)	Entropy 0.52993 (0.53319)	Top-1 acc 72.656 (67.457)	Top-5 acc 89.062 (86.191)	lr 0.00045
Train [110][2420/3239]	Time 0.234 (0.506)	Data Time 0.001 (0.016)	Loss 2.1814 (2.3513)	Entropy 0.53013 (0.53318)	Top-1 acc 75.000 (67.460)	Top-5 acc 87.109 (86.192)	lr 0.00045
Train [110][2430/3239]	Time 0.230 (0.505)	Data Time 0.001 (0.016)	Loss 2.4767 (2.3514)	Entropy 0.53045 (0.53317)	Top-1 acc 65.234 (67.457)	Top-5 acc 83.984 (86.190)	lr 0.00045
Train [110][2440/3239]	Time 0.242 (0.505)	Data Time 0.001 (0.016)	Loss 2.2052 (2.3513)	Entropy 0.53036 (0.53316)	Top-1 acc 71.094 (67.461)	Top-5 acc 89.844 (86.191)	lr 0.00045
Train [110][2450/3239]	Time 0.326 (0.505)	Data Time 0.001 (0.016)	Loss 2.8163 (2.3515)	Entropy 0.53075 (0.53315)	Top-1 acc 55.469 (67.459)	Top-5 acc 79.297 (86.189)	lr 0.00045
Train [110][2460/3239]	Time 0.223 (0.504)	Data Time 0.001 (0.016)	Loss 2.2710 (2.3514)	Entropy 0.53076 (0.53314)	Top-1 acc 67.188 (67.464)	Top-5 acc 88.672 (86.190)	lr 0.00045
Train [110][2470/3239]	Time 0.248 (0.504)	Data Time 0.001 (0.016)	Loss 2.2097 (2.3513)	Entropy 0.53074 (0.53313)	Top-1 acc 71.875 (67.468)	Top-5 acc 87.109 (86.192)	lr 0.00045
Train [110][2480/3239]	Time 0.242 (0.525)	Data Time 0.002 (0.016)	Loss 2.8297 (2.3515)	Entropy 0.53047 (0.53312)	Top-1 acc 53.906 (67.461)	Top-5 acc 80.469 (86.189)	lr 0.00045
Train [110][2490/3239]	Time 0.246 (0.525)	Data Time 0.002 (0.016)	Loss 2.3030 (2.3515)	Entropy 0.53026 (0.53311)	Top-1 acc 68.359 (67.462)	Top-5 acc 88.672 (86.189)	lr 0.00045
Train [110][2500/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.016)	Loss 2.5218 (2.3511)	Entropy 0.53031 (0.53309)	Top-1 acc 60.156 (67.467)	Top-5 acc 83.203 (86.196)	lr 0.00045
Train [110][2510/3239]	Time 0.223 (0.524)	Data Time 0.001 (0.016)	Loss 2.2416 (2.3512)	Entropy 0.53010 (0.53308)	Top-1 acc 70.312 (67.467)	Top-5 acc 87.500 (86.194)	lr 0.00045
Train [110][2520/3239]	Time 0.244 (0.523)	Data Time 0.002 (0.016)	Loss 2.4565 (2.3510)	Entropy 0.52978 (0.53307)	Top-1 acc 64.844 (67.470)	Top-5 acc 85.547 (86.198)	lr 0.00044
Train [110][2530/3239]	Time 0.253 (0.523)	Data Time 0.001 (0.016)	Loss 2.3133 (2.3511)	Entropy 0.52928 (0.53306)	Top-1 acc 67.969 (67.467)	Top-5 acc 87.500 (86.196)	lr 0.00044
Train [110][2540/3239]	Time 0.380 (0.523)	Data Time 0.001 (0.016)	Loss 2.2115 (2.3508)	Entropy 0.52932 (0.53304)	Top-1 acc 71.484 (67.476)	Top-5 acc 89.453 (86.201)	lr 0.00044
Train [110][2550/3239]	Time 0.245 (0.522)	Data Time 0.001 (0.016)	Loss 2.3069 (2.3508)	Entropy 0.52901 (0.53303)	Top-1 acc 68.359 (67.482)	Top-5 acc 86.328 (86.202)	lr 0.00044
Train [110][2560/3239]	Time 0.235 (0.522)	Data Time 0.001 (0.016)	Loss 2.3359 (2.3508)	Entropy 0.52894 (0.53301)	Top-1 acc 66.406 (67.483)	Top-5 acc 85.156 (86.200)	lr 0.00044
Train [110][2570/3239]	Time 0.269 (0.521)	Data Time 0.001 (0.016)	Loss 2.6016 (2.3508)	Entropy 0.52879 (0.53300)	Top-1 acc 63.281 (67.489)	Top-5 acc 80.469 (86.200)	lr 0.00044
Train [110][2580/3239]	Time 0.251 (0.521)	Data Time 0.001 (0.015)	Loss 2.4270 (2.3510)	Entropy 0.52868 (0.53298)	Top-1 acc 68.359 (67.486)	Top-5 acc 85.156 (86.200)	lr 0.00044
Train [110][2590/3239]	Time 0.241 (0.521)	Data Time 0.001 (0.015)	Loss 2.6837 (2.3511)	Entropy 0.52880 (0.53296)	Top-1 acc 60.938 (67.483)	Top-5 acc 82.812 (86.197)	lr 0.00044
Train [110][2600/3239]	Time 0.243 (0.520)	Data Time 0.001 (0.015)	Loss 2.3131 (2.3509)	Entropy 0.52898 (0.53295)	Top-1 acc 69.922 (67.491)	Top-5 acc 85.547 (86.201)	lr 0.00044
Train [110][2610/3239]	Time 0.380 (0.520)	Data Time 0.001 (0.015)	Loss 2.1916 (2.3509)	Entropy 0.52893 (0.53293)	Top-1 acc 73.047 (67.493)	Top-5 acc 89.453 (86.202)	lr 0.00044
Train [110][2620/3239]	Time 0.244 (0.520)	Data Time 0.001 (0.015)	Loss 2.1196 (2.3508)	Entropy 0.52885 (0.53292)	Top-1 acc 71.875 (67.496)	Top-5 acc 91.406 (86.204)	lr 0.00044
Train [110][2630/3239]	Time 0.233 (0.519)	Data Time 0.001 (0.015)	Loss 2.1598 (2.3511)	Entropy 0.52907 (0.53290)	Top-1 acc 73.047 (67.493)	Top-5 acc 90.625 (86.201)	lr 0.00044
Train [110][2640/3239]	Time 0.239 (0.519)	Data Time 0.001 (0.015)	Loss 2.3069 (2.3510)	Entropy 0.52869 (0.53289)	Top-1 acc 66.797 (67.490)	Top-5 acc 85.156 (86.200)	lr 0.00044
Train [110][2650/3239]	Time 0.243 (0.519)	Data Time 0.001 (0.015)	Loss 2.4219 (2.3509)	Entropy 0.52902 (0.53287)	Top-1 acc 65.625 (67.491)	Top-5 acc 85.938 (86.200)	lr 0.00044
Train [110][2660/3239]	Time 0.267 (0.518)	Data Time 0.001 (0.015)	Loss 2.9486 (2.3512)	Entropy 0.52900 (0.53286)	Top-1 acc 54.297 (67.484)	Top-5 acc 75.781 (86.194)	lr 0.00044
Train [110][2670/3239]	Time 0.246 (0.518)	Data Time 0.001 (0.015)	Loss 2.3502 (2.3513)	Entropy 0.52903 (0.53284)	Top-1 acc 69.922 (67.481)	Top-5 acc 85.938 (86.194)	lr 0.00044
Train [110][2680/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.015)	Loss 2.3058 (2.3513)	Entropy 0.52905 (0.53283)	Top-1 acc 67.188 (67.479)	Top-5 acc 85.938 (86.197)	lr 0.00044
Train [110][2690/3239]	Time 0.259 (0.517)	Data Time 0.002 (0.015)	Loss 2.0960 (2.3514)	Entropy 0.52894 (0.53281)	Top-1 acc 77.344 (67.477)	Top-5 acc 87.891 (86.193)	lr 0.00044
Train [110][2700/3239]	Time 0.503 (0.517)	Data Time 0.002 (0.015)	Loss 2.3640 (2.3517)	Entropy 0.52895 (0.53280)	Top-1 acc 67.969 (67.473)	Top-5 acc 85.156 (86.188)	lr 0.00044
Train [110][2710/3239]	Time 0.248 (0.518)	Data Time 0.002 (0.015)	Loss 2.2324 (2.3516)	Entropy 0.52922 (0.53279)	Top-1 acc 71.484 (67.474)	Top-5 acc 86.328 (86.190)	lr 0.00044
Train [110][2720/3239]	Time 0.232 (0.517)	Data Time 0.001 (0.015)	Loss 2.4022 (2.3516)	Entropy 0.52930 (0.53277)	Top-1 acc 64.062 (67.473)	Top-5 acc 85.547 (86.192)	lr 0.00044
Train [110][2730/3239]	Time 0.263 (0.517)	Data Time 0.002 (0.015)	Loss 2.2615 (2.3516)	Entropy 0.52922 (0.53276)	Top-1 acc 70.312 (67.473)	Top-5 acc 87.109 (86.192)	lr 0.00044
Train [110][2740/3239]	Time 0.232 (0.516)	Data Time 0.001 (0.015)	Loss 2.3059 (2.3516)	Entropy 0.52928 (0.53275)	Top-1 acc 66.016 (67.473)	Top-5 acc 88.281 (86.193)	lr 0.00044
Train [110][2750/3239]	Time 0.279 (0.516)	Data Time 0.001 (0.015)	Loss 2.3508 (2.3515)	Entropy 0.52891 (0.53273)	Top-1 acc 66.406 (67.473)	Top-5 acc 86.328 (86.192)	lr 0.00044
Train [110][2760/3239]	Time 0.232 (0.516)	Data Time 0.001 (0.015)	Loss 2.2843 (2.3514)	Entropy 0.52928 (0.53272)	Top-1 acc 66.406 (67.475)	Top-5 acc 88.672 (86.192)	lr 0.00044
Train [110][2770/3239]	Time 0.330 (0.515)	Data Time 0.001 (0.015)	Loss 2.3887 (2.3516)	Entropy 0.52928 (0.53271)	Top-1 acc 62.500 (67.466)	Top-5 acc 86.719 (86.191)	lr 0.00044
Train [110][2780/3239]	Time 0.229 (0.515)	Data Time 0.001 (0.014)	Loss 2.5143 (2.3515)	Entropy 0.52897 (0.53269)	Top-1 acc 63.281 (67.466)	Top-5 acc 82.031 (86.190)	lr 0.00044
Train [110][2790/3239]	Time 0.265 (0.515)	Data Time 0.001 (0.014)	Loss 2.2547 (2.3515)	Entropy 0.52885 (0.53268)	Top-1 acc 71.484 (67.465)	Top-5 acc 87.500 (86.192)	lr 0.00044
Train [110][2800/3239]	Time 0.234 (0.515)	Data Time 0.001 (0.014)	Loss 2.3340 (2.3514)	Entropy 0.52864 (0.53267)	Top-1 acc 64.844 (67.467)	Top-5 acc 86.328 (86.194)	lr 0.00044
Train [110][2810/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.014)	Loss 2.3166 (2.3515)	Entropy 0.52870 (0.53265)	Top-1 acc 69.922 (67.458)	Top-5 acc 85.547 (86.194)	lr 0.00044
Train [110][2820/3239]	Time 0.229 (0.514)	Data Time 0.001 (0.014)	Loss 2.3466 (2.3516)	Entropy 0.52881 (0.53264)	Top-1 acc 68.359 (67.454)	Top-5 acc 82.422 (86.191)	lr 0.00044
Train [110][2830/3239]	Time 0.227 (0.514)	Data Time 0.001 (0.014)	Loss 2.3757 (2.3516)	Entropy 0.52883 (0.53263)	Top-1 acc 66.797 (67.455)	Top-5 acc 88.281 (86.192)	lr 0.00044
Train [110][2840/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.014)	Loss 2.1284 (2.3516)	Entropy 0.52875 (0.53261)	Top-1 acc 73.438 (67.454)	Top-5 acc 87.500 (86.191)	lr 0.00044
Train [110][2850/3239]	Time 0.226 (0.513)	Data Time 0.001 (0.014)	Loss 2.2104 (2.3515)	Entropy 0.52863 (0.53260)	Top-1 acc 71.484 (67.456)	Top-5 acc 87.500 (86.192)	lr 0.00044
Train [110][2860/3239]	Time 0.261 (0.512)	Data Time 0.001 (0.014)	Loss 2.3750 (2.3515)	Entropy 0.52861 (0.53258)	Top-1 acc 67.578 (67.456)	Top-5 acc 84.766 (86.192)	lr 0.00044
Train [110][2870/3239]	Time 0.236 (0.512)	Data Time 0.001 (0.014)	Loss 2.2672 (2.3515)	Entropy 0.52864 (0.53257)	Top-1 acc 70.312 (67.458)	Top-5 acc 89.062 (86.195)	lr 0.00044
Train [110][2880/3239]	Time 0.250 (0.512)	Data Time 0.001 (0.014)	Loss 2.5156 (2.3515)	Entropy 0.52880 (0.53256)	Top-1 acc 65.625 (67.462)	Top-5 acc 84.766 (86.195)	lr 0.00044
Train [110][2890/3239]	Time 0.232 (0.511)	Data Time 0.001 (0.014)	Loss 2.2611 (2.3515)	Entropy 0.52899 (0.53254)	Top-1 acc 66.016 (67.464)	Top-5 acc 86.328 (86.191)	lr 0.00044
Train [110][2900/3239]	Time 0.236 (0.511)	Data Time 0.001 (0.014)	Loss 2.2369 (2.3514)	Entropy 0.52926 (0.53253)	Top-1 acc 73.047 (67.468)	Top-5 acc 88.281 (86.196)	lr 0.00043
Train [110][2910/3239]	Time 0.247 (0.511)	Data Time 0.001 (0.014)	Loss 2.3148 (2.3515)	Entropy 0.52932 (0.53252)	Top-1 acc 67.969 (67.462)	Top-5 acc 86.328 (86.192)	lr 0.00043
Train [110][2920/3239]	Time 0.233 (0.510)	Data Time 0.001 (0.014)	Loss 2.4738 (2.3515)	Entropy 0.52931 (0.53251)	Top-1 acc 65.234 (67.464)	Top-5 acc 84.766 (86.194)	lr 0.00043
Train [110][2930/3239]	Time 0.335 (0.510)	Data Time 0.001 (0.014)	Loss 2.1072 (2.3512)	Entropy 0.52928 (0.53250)	Top-1 acc 72.656 (67.471)	Top-5 acc 90.234 (86.199)	lr 0.00043
Train [110][2940/3239]	Time 0.236 (0.510)	Data Time 0.001 (0.014)	Loss 2.5328 (2.3513)	Entropy 0.52959 (0.53249)	Top-1 acc 64.062 (67.470)	Top-5 acc 80.859 (86.197)	lr 0.00043
Train [110][2950/3239]	Time 0.233 (0.509)	Data Time 0.001 (0.014)	Loss 2.5719 (2.3513)	Entropy 0.52929 (0.53248)	Top-1 acc 64.453 (67.475)	Top-5 acc 82.031 (86.197)	lr 0.00043
Train [110][2960/3239]	Time 0.248 (0.509)	Data Time 0.001 (0.014)	Loss 2.5731 (2.3513)	Entropy 0.52924 (0.53247)	Top-1 acc 63.672 (67.475)	Top-5 acc 82.422 (86.195)	lr 0.00043
Train [110][2970/3239]	Time 0.270 (0.509)	Data Time 0.001 (0.014)	Loss 2.1747 (2.3513)	Entropy 0.52964 (0.53246)	Top-1 acc 71.875 (67.475)	Top-5 acc 87.891 (86.197)	lr 0.00043
Train [110][2980/3239]	Time 0.271 (0.508)	Data Time 0.001 (0.014)	Loss 2.4431 (2.3515)	Entropy 0.52954 (0.53245)	Top-1 acc 64.062 (67.469)	Top-5 acc 84.766 (86.194)	lr 0.00043
Train [110][2990/3239]	Time 0.234 (0.508)	Data Time 0.001 (0.014)	Loss 2.5515 (2.3517)	Entropy 0.52983 (0.53244)	Top-1 acc 63.281 (67.466)	Top-5 acc 82.031 (86.190)	lr 0.00043
Train [110][3000/3239]	Time 0.341 (0.508)	Data Time 0.002 (0.014)	Loss 2.2953 (2.3515)	Entropy 0.52994 (0.53243)	Top-1 acc 71.094 (67.471)	Top-5 acc 86.719 (86.191)	lr 0.00043
Train [110][3010/3239]	Time 0.318 (0.508)	Data Time 0.001 (0.014)	Loss 2.3661 (2.3517)	Entropy 0.52992 (0.53242)	Top-1 acc 66.016 (67.467)	Top-5 acc 84.375 (86.187)	lr 0.00043
Train [110][3020/3239]	Time 0.224 (0.507)	Data Time 0.001 (0.014)	Loss 2.5040 (2.3517)	Entropy 0.53020 (0.53241)	Top-1 acc 66.016 (67.471)	Top-5 acc 83.203 (86.188)	lr 0.00043
Train [110][3030/3239]	Time 0.229 (0.507)	Data Time 0.001 (0.013)	Loss 2.4790 (2.3517)	Entropy 0.53015 (0.53241)	Top-1 acc 62.891 (67.471)	Top-5 acc 84.375 (86.186)	lr 0.00043
Train [110][3040/3239]	Time 0.246 (0.507)	Data Time 0.001 (0.013)	Loss 2.3046 (2.3516)	Entropy 0.53004 (0.53240)	Top-1 acc 69.922 (67.477)	Top-5 acc 87.109 (86.188)	lr 0.00043
Train [110][3050/3239]	Time 0.235 (0.506)	Data Time 0.001 (0.013)	Loss 2.3088 (2.3517)	Entropy 0.52996 (0.53239)	Top-1 acc 71.484 (67.475)	Top-5 acc 86.719 (86.184)	lr 0.00043
Train [110][3060/3239]	Time 0.231 (0.506)	Data Time 0.002 (0.013)	Loss 2.4176 (2.3516)	Entropy 0.53016 (0.53238)	Top-1 acc 64.453 (67.479)	Top-5 acc 86.328 (86.185)	lr 0.00043
Train [110][3070/3239]	Time 0.232 (0.506)	Data Time 0.001 (0.013)	Loss 2.7184 (2.3517)	Entropy 0.53028 (0.53238)	Top-1 acc 57.812 (67.475)	Top-5 acc 79.297 (86.185)	lr 0.00043
Train [110][3080/3239]	Time 0.259 (0.505)	Data Time 0.001 (0.013)	Loss 2.3977 (2.3517)	Entropy 0.53033 (0.53237)	Top-1 acc 66.016 (67.481)	Top-5 acc 85.547 (86.185)	lr 0.00043
Train [110][3090/3239]	Time 0.331 (0.505)	Data Time 0.001 (0.013)	Loss 2.4285 (2.3516)	Entropy 0.53045 (0.53236)	Top-1 acc 66.406 (67.482)	Top-5 acc 85.547 (86.183)	lr 0.00043
Train [110][3100/3239]	Time 0.231 (0.505)	Data Time 0.001 (0.013)	Loss 2.3974 (2.3516)	Entropy 0.53069 (0.53236)	Top-1 acc 67.578 (67.482)	Top-5 acc 84.375 (86.184)	lr 0.00043
Train [110][3110/3239]	Time 0.234 (0.505)	Data Time 0.001 (0.013)	Loss 2.3356 (2.3517)	Entropy 0.53024 (0.53235)	Top-1 acc 67.969 (67.480)	Top-5 acc 88.281 (86.184)	lr 0.00043
Train [110][3120/3239]	Time 0.236 (0.504)	Data Time 0.001 (0.013)	Loss 2.3338 (2.3518)	Entropy 0.52991 (0.53234)	Top-1 acc 66.797 (67.482)	Top-5 acc 87.109 (86.182)	lr 0.00043
Train [110][3130/3239]	Time 0.436 (0.520)	Data Time 0.006 (0.013)	Loss 2.3721 (2.3520)	Entropy 0.52996 (0.53234)	Top-1 acc 66.406 (67.475)	Top-5 acc 86.719 (86.180)	lr 0.00043
Train [110][3140/3239]	Time 0.276 (0.521)	Data Time 0.002 (0.013)	Loss 2.3665 (2.3518)	Entropy 0.52986 (0.53233)	Top-1 acc 64.062 (67.478)	Top-5 acc 85.156 (86.182)	lr 0.00043
Train [110][3150/3239]	Time 0.238 (0.520)	Data Time 0.002 (0.013)	Loss 2.3589 (2.3519)	Entropy 0.52989 (0.53232)	Top-1 acc 66.406 (67.473)	Top-5 acc 85.156 (86.180)	lr 0.00043
Train [110][3160/3239]	Time 0.330 (0.520)	Data Time 0.001 (0.013)	Loss 2.3297 (2.3521)	Entropy 0.52993 (0.53231)	Top-1 acc 70.703 (67.469)	Top-5 acc 83.203 (86.178)	lr 0.00043
Train [110][3170/3239]	Time 0.251 (0.520)	Data Time 0.001 (0.013)	Loss 2.3286 (2.3520)	Entropy 0.53022 (0.53231)	Top-1 acc 66.016 (67.472)	Top-5 acc 86.328 (86.178)	lr 0.00043
Train [110][3180/3239]	Time 0.241 (0.519)	Data Time 0.000 (0.013)	Loss 2.1482 (2.3519)	Entropy 0.53029 (0.53230)	Top-1 acc 71.875 (67.473)	Top-5 acc 87.500 (86.181)	lr 0.00043
Train [110][3190/3239]	Time 0.227 (0.519)	Data Time 0.000 (0.013)	Loss 2.4875 (2.3520)	Entropy 0.53051 (0.53229)	Top-1 acc 64.453 (67.467)	Top-5 acc 84.375 (86.180)	lr 0.00043
Train [110][3200/3239]	Time 0.222 (0.519)	Data Time 0.000 (0.013)	Loss 2.3000 (2.3520)	Entropy 0.53055 (0.53229)	Top-1 acc 68.750 (67.465)	Top-5 acc 85.938 (86.179)	lr 0.00043
Train [110][3210/3239]	Time 0.242 (0.518)	Data Time 0.000 (0.013)	Loss 2.4053 (2.3522)	Entropy 0.53044 (0.53228)	Top-1 acc 66.797 (67.461)	Top-5 acc 83.203 (86.179)	lr 0.00043
Train [110][3220/3239]	Time 0.235 (0.518)	Data Time 0.000 (0.013)	Loss 2.4415 (2.3521)	Entropy 0.53029 (0.53228)	Top-1 acc 64.844 (67.462)	Top-5 acc 83.984 (86.181)	lr 0.00043
Train [110][3230/3239]	Time 0.235 (0.517)	Data Time 0.000 (0.013)	Loss 2.3564 (2.3522)	Entropy 0.53018 (0.53227)	Top-1 acc 69.531 (67.462)	Top-5 acc 86.719 (86.178)	lr 0.00043
Train [110][3239/3239]	Time 0.918 (0.517)	Data Time 0.000 (0.013)	Loss 2.5087 (2.3523)	Entropy 0.53014 (0.53226)	Top-1 acc 66.667 (67.461)	Top-5 acc 82.716 (86.176)	lr 0.00043
==========Valid [110/120]	loss 1.174	top-1 acc 73.154 (73.154)	top-5 acc 90.507	Train top-1 67.461	top-5 86.176	Entropy 0.53014	Latency-None: 0.000ms	Flops: 539.00M
Train [111][0/3239]	Time 37.194 (37.194)	Data Time 35.056 (35.056)	Loss 2.3071 (2.3071)	Entropy 0.53010 (0.53010)	Top-1 acc 66.406 (66.406)	Top-5 acc 85.938 (85.938)	lr 0.00043
Train [111][10/3239]	Time 0.295 (3.973)	Data Time 0.001 (3.303)	Loss 2.2005 (2.2919)	Entropy 0.53006 (0.53008)	Top-1 acc 74.219 (68.892)	Top-5 acc 90.625 (87.571)	lr 0.00043
Train [111][20/3239]	Time 0.241 (2.284)	Data Time 0.001 (1.731)	Loss 2.3554 (2.2979)	Entropy 0.53022 (0.53012)	Top-1 acc 67.969 (69.159)	Top-5 acc 87.891 (87.444)	lr 0.00043
Train [111][30/3239]	Time 0.237 (1.688)	Data Time 0.001 (1.173)	Loss 2.2249 (2.3064)	Entropy 0.52993 (0.53011)	Top-1 acc 71.484 (68.599)	Top-5 acc 90.625 (87.261)	lr 0.00043
Train [111][40/3239]	Time 0.249 (1.386)	Data Time 0.002 (0.887)	Loss 2.3702 (2.3099)	Entropy 0.53010 (0.53007)	Top-1 acc 65.625 (68.474)	Top-5 acc 85.156 (87.071)	lr 0.00042
Train [111][50/3239]	Time 0.232 (1.209)	Data Time 0.001 (0.714)	Loss 2.4785 (2.3147)	Entropy 0.53014 (0.53007)	Top-1 acc 66.016 (68.390)	Top-5 acc 82.812 (86.887)	lr 0.00042
Train [111][60/3239]	Time 0.239 (1.083)	Data Time 0.001 (0.597)	Loss 2.2472 (2.3103)	Entropy 0.53012 (0.53008)	Top-1 acc 71.484 (68.539)	Top-5 acc 87.891 (86.962)	lr 0.00042
Train [111][70/3239]	Time 0.234 (0.991)	Data Time 0.001 (0.513)	Loss 2.4393 (2.3151)	Entropy 0.52988 (0.53008)	Top-1 acc 67.578 (68.409)	Top-5 acc 85.156 (86.939)	lr 0.00042
Train [111][80/3239]	Time 0.229 (0.920)	Data Time 0.001 (0.450)	Loss 2.2757 (2.3204)	Entropy 0.52962 (0.53003)	Top-1 acc 69.141 (68.292)	Top-5 acc 86.328 (86.849)	lr 0.00042
Train [111][90/3239]	Time 0.272 (0.866)	Data Time 0.001 (0.401)	Loss 2.1669 (2.3222)	Entropy 0.52947 (0.52999)	Top-1 acc 72.656 (68.209)	Top-5 acc 92.188 (86.817)	lr 0.00042
Train [111][100/3239]	Time 0.235 (0.820)	Data Time 0.001 (0.361)	Loss 2.0878 (2.3169)	Entropy 0.52956 (0.52995)	Top-1 acc 73.828 (68.367)	Top-5 acc 91.406 (86.881)	lr 0.00042
Train [111][110/3239]	Time 0.238 (0.784)	Data Time 0.001 (0.329)	Loss 2.1295 (2.3164)	Entropy 0.52955 (0.52991)	Top-1 acc 69.141 (68.373)	Top-5 acc 89.453 (86.870)	lr 0.00042
Train [111][120/3239]	Time 0.230 (0.752)	Data Time 0.001 (0.302)	Loss 2.2952 (2.3161)	Entropy 0.52971 (0.52989)	Top-1 acc 69.922 (68.443)	Top-5 acc 85.938 (86.822)	lr 0.00042
Train [111][130/3239]	Time 0.237 (0.727)	Data Time 0.001 (0.279)	Loss 2.2117 (2.3147)	Entropy 0.52949 (0.52986)	Top-1 acc 69.531 (68.443)	Top-5 acc 90.625 (86.877)	lr 0.00042
Train [111][140/3239]	Time 0.230 (0.704)	Data Time 0.001 (0.259)	Loss 2.4665 (2.3172)	Entropy 0.52950 (0.52984)	Top-1 acc 65.234 (68.329)	Top-5 acc 85.156 (86.838)	lr 0.00042
Train [111][150/3239]	Time 0.376 (0.688)	Data Time 0.002 (0.242)	Loss 2.3914 (2.3200)	Entropy 0.52962 (0.52982)	Top-1 acc 66.016 (68.269)	Top-5 acc 83.984 (86.781)	lr 0.00042
Train [111][160/3239]	Time 0.260 (0.670)	Data Time 0.001 (0.227)	Loss 2.5719 (2.3184)	Entropy 0.52951 (0.52980)	Top-1 acc 60.156 (68.289)	Top-5 acc 80.469 (86.799)	lr 0.00042
Train [111][170/3239]	Time 0.219 (0.655)	Data Time 0.001 (0.214)	Loss 2.3249 (2.3225)	Entropy 0.52935 (0.52978)	Top-1 acc 65.234 (68.167)	Top-5 acc 89.062 (86.780)	lr 0.00042
Train [111][180/3239]	Time 0.229 (0.641)	Data Time 0.001 (0.202)	Loss 2.4399 (2.3232)	Entropy 0.52932 (0.52976)	Top-1 acc 64.453 (68.139)	Top-5 acc 85.938 (86.779)	lr 0.00042
Train [111][190/3239]	Time 0.259 (0.629)	Data Time 0.001 (0.192)	Loss 2.3225 (2.3239)	Entropy 0.52956 (0.52975)	Top-1 acc 69.922 (68.122)	Top-5 acc 88.672 (86.792)	lr 0.00042
Train [111][200/3239]	Time 0.232 (0.618)	Data Time 0.001 (0.182)	Loss 2.3823 (2.3255)	Entropy 0.52899 (0.52972)	Top-1 acc 65.234 (68.027)	Top-5 acc 86.328 (86.762)	lr 0.00042
Train [111][210/3239]	Time 0.232 (0.608)	Data Time 0.001 (0.174)	Loss 2.4020 (2.3285)	Entropy 0.52884 (0.52968)	Top-1 acc 66.797 (67.974)	Top-5 acc 87.109 (86.691)	lr 0.00042
Train [111][220/3239]	Time 0.334 (0.599)	Data Time 0.001 (0.166)	Loss 2.1523 (2.3258)	Entropy 0.52890 (0.52964)	Top-1 acc 71.094 (68.002)	Top-5 acc 90.625 (86.758)	lr 0.00042
Train [111][230/3239]	Time 0.249 (0.592)	Data Time 0.002 (0.159)	Loss 2.5973 (2.3287)	Entropy 0.52896 (0.52961)	Top-1 acc 60.156 (67.935)	Top-5 acc 79.297 (86.676)	lr 0.00042
Train [111][240/3239]	Time 0.234 (0.585)	Data Time 0.001 (0.152)	Loss 2.3319 (2.3283)	Entropy 0.52906 (0.52959)	Top-1 acc 67.969 (67.948)	Top-5 acc 85.547 (86.649)	lr 0.00042
Train [111][250/3239]	Time 0.234 (0.579)	Data Time 0.001 (0.146)	Loss 2.2373 (2.3266)	Entropy 0.52919 (0.52957)	Top-1 acc 69.922 (67.959)	Top-5 acc 87.109 (86.669)	lr 0.00042
Train [111][260/3239]	Time 0.227 (0.571)	Data Time 0.001 (0.141)	Loss 2.4407 (2.3290)	Entropy 0.52915 (0.52955)	Top-1 acc 67.578 (67.957)	Top-5 acc 85.156 (86.620)	lr 0.00042
Train [111][270/3239]	Time 0.234 (0.565)	Data Time 0.001 (0.135)	Loss 2.2348 (2.3278)	Entropy 0.52961 (0.52954)	Top-1 acc 68.359 (67.944)	Top-5 acc 88.281 (86.635)	lr 0.00042
Train [111][280/3239]	Time 0.234 (0.559)	Data Time 0.001 (0.131)	Loss 2.2778 (2.3279)	Entropy 0.52981 (0.52955)	Top-1 acc 70.312 (67.959)	Top-5 acc 87.891 (86.633)	lr 0.00042
Train [111][290/3239]	Time 0.252 (0.555)	Data Time 0.002 (0.126)	Loss 2.2773 (2.3284)	Entropy 0.52981 (0.52956)	Top-1 acc 66.016 (67.939)	Top-5 acc 85.547 (86.611)	lr 0.00042
Train [111][300/3239]	Time 0.235 (0.550)	Data Time 0.001 (0.122)	Loss 2.2075 (2.3280)	Entropy 0.52981 (0.52956)	Top-1 acc 72.266 (67.964)	Top-5 acc 89.844 (86.632)	lr 0.00042
Train [111][310/3239]	Time 0.357 (0.546)	Data Time 0.001 (0.118)	Loss 2.1571 (2.3286)	Entropy 0.52978 (0.52957)	Top-1 acc 73.828 (67.964)	Top-5 acc 90.234 (86.621)	lr 0.00042
Train [111][320/3239]	Time 0.239 (0.542)	Data Time 0.001 (0.115)	Loss 2.7878 (2.3307)	Entropy 0.52951 (0.52958)	Top-1 acc 55.078 (67.912)	Top-5 acc 81.250 (86.587)	lr 0.00042
Train [111][330/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.111)	Loss 2.4221 (2.3325)	Entropy 0.52967 (0.52958)	Top-1 acc 66.797 (67.876)	Top-5 acc 85.547 (86.545)	lr 0.00042
Train [111][340/3239]	Time 0.229 (0.535)	Data Time 0.002 (0.108)	Loss 2.2751 (2.3306)	Entropy 0.52909 (0.52957)	Top-1 acc 67.188 (67.917)	Top-5 acc 89.453 (86.588)	lr 0.00042
Train [111][350/3239]	Time 0.234 (0.532)	Data Time 0.002 (0.105)	Loss 2.3982 (2.3308)	Entropy 0.52871 (0.52956)	Top-1 acc 64.453 (67.926)	Top-5 acc 86.719 (86.583)	lr 0.00042
Train [111][360/3239]	Time 0.245 (0.529)	Data Time 0.001 (0.102)	Loss 2.2635 (2.3313)	Entropy 0.52863 (0.52953)	Top-1 acc 68.750 (67.908)	Top-5 acc 87.500 (86.579)	lr 0.00042
Train [111][370/3239]	Time 0.238 (0.526)	Data Time 0.001 (0.100)	Loss 2.4410 (2.3342)	Entropy 0.52894 (0.52951)	Top-1 acc 63.672 (67.818)	Top-5 acc 85.547 (86.536)	lr 0.00042
Train [111][380/3239]	Time 0.301 (0.523)	Data Time 0.001 (0.097)	Loss 2.2620 (2.3342)	Entropy 0.52902 (0.52950)	Top-1 acc 66.406 (67.816)	Top-5 acc 89.062 (86.532)	lr 0.00042
Train [111][390/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.095)	Loss 2.3637 (2.3337)	Entropy 0.52931 (0.52949)	Top-1 acc 68.359 (67.828)	Top-5 acc 85.547 (86.527)	lr 0.00042
Train [111][400/3239]	Time 0.228 (0.517)	Data Time 0.001 (0.092)	Loss 2.3254 (2.3337)	Entropy 0.52916 (0.52948)	Top-1 acc 68.750 (67.844)	Top-5 acc 89.062 (86.535)	lr 0.00042
Train [111][410/3239]	Time 0.227 (0.514)	Data Time 0.001 (0.090)	Loss 2.2360 (2.3347)	Entropy 0.52931 (0.52947)	Top-1 acc 71.875 (67.821)	Top-5 acc 87.891 (86.534)	lr 0.00042
Train [111][420/3239]	Time 0.238 (0.512)	Data Time 0.001 (0.088)	Loss 2.5433 (2.3365)	Entropy 0.52965 (0.52947)	Top-1 acc 64.062 (67.795)	Top-5 acc 83.594 (86.520)	lr 0.00042
Train [111][430/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.086)	Loss 2.3339 (2.3377)	Entropy 0.52963 (0.52948)	Top-1 acc 69.531 (67.753)	Top-5 acc 87.109 (86.514)	lr 0.00041
Train [111][440/3239]	Time 0.231 (0.508)	Data Time 0.001 (0.084)	Loss 2.2116 (2.3365)	Entropy 0.52934 (0.52948)	Top-1 acc 69.531 (67.783)	Top-5 acc 88.672 (86.534)	lr 0.00041
Train [111][450/3239]	Time 0.234 (0.507)	Data Time 0.001 (0.082)	Loss 2.4628 (2.3369)	Entropy 0.52928 (0.52947)	Top-1 acc 64.453 (67.780)	Top-5 acc 86.328 (86.533)	lr 0.00041
Train [111][460/3239]	Time 0.231 (0.505)	Data Time 0.001 (0.081)	Loss 2.3309 (2.3376)	Entropy 0.52930 (0.52947)	Top-1 acc 64.062 (67.764)	Top-5 acc 87.500 (86.521)	lr 0.00041
Train [111][470/3239]	Time 0.232 (0.503)	Data Time 0.001 (0.079)	Loss 2.3434 (2.3375)	Entropy 0.52934 (0.52947)	Top-1 acc 68.750 (67.783)	Top-5 acc 86.719 (86.535)	lr 0.00041
Train [111][480/3239]	Time 0.227 (0.501)	Data Time 0.001 (0.077)	Loss 2.2833 (2.3374)	Entropy 0.52962 (0.52947)	Top-1 acc 67.969 (67.770)	Top-5 acc 88.281 (86.539)	lr 0.00041
Train [111][490/3239]	Time 0.222 (0.499)	Data Time 0.001 (0.076)	Loss 2.5054 (2.3389)	Entropy 0.52954 (0.52947)	Top-1 acc 66.797 (67.747)	Top-5 acc 85.156 (86.510)	lr 0.00041
Train [111][500/3239]	Time 0.228 (0.497)	Data Time 0.001 (0.074)	Loss 2.4346 (2.3388)	Entropy 0.52962 (0.52947)	Top-1 acc 67.969 (67.757)	Top-5 acc 84.375 (86.506)	lr 0.00041
Train [111][510/3239]	Time 0.232 (0.495)	Data Time 0.001 (0.073)	Loss 2.2143 (2.3383)	Entropy 0.52965 (0.52947)	Top-1 acc 69.531 (67.771)	Top-5 acc 87.891 (86.512)	lr 0.00041
Train [111][520/3239]	Time 0.220 (0.493)	Data Time 0.001 (0.072)	Loss 2.5318 (2.3391)	Entropy 0.52994 (0.52948)	Top-1 acc 64.453 (67.747)	Top-5 acc 83.203 (86.513)	lr 0.00041
Train [111][530/3239]	Time 0.226 (0.491)	Data Time 0.001 (0.070)	Loss 2.6892 (2.3404)	Entropy 0.53005 (0.52949)	Top-1 acc 60.156 (67.734)	Top-5 acc 81.641 (86.490)	lr 0.00041
Train [111][540/3239]	Time 0.312 (0.490)	Data Time 0.001 (0.069)	Loss 2.3600 (2.3420)	Entropy 0.52958 (0.52950)	Top-1 acc 67.188 (67.706)	Top-5 acc 85.938 (86.462)	lr 0.00041
Train [111][550/3239]	Time 0.301 (0.584)	Data Time 0.002 (0.068)	Loss 2.4733 (2.3427)	Entropy 0.52938 (0.52950)	Top-1 acc 66.406 (67.684)	Top-5 acc 84.766 (86.452)	lr 0.00041
Train [111][560/3239]	Time 0.242 (0.581)	Data Time 0.002 (0.067)	Loss 2.1103 (2.3420)	Entropy 0.52923 (0.52949)	Top-1 acc 76.172 (67.720)	Top-5 acc 89.844 (86.465)	lr 0.00041
Train [111][570/3239]	Time 0.238 (0.579)	Data Time 0.001 (0.065)	Loss 2.3855 (2.3410)	Entropy 0.52921 (0.52949)	Top-1 acc 64.844 (67.756)	Top-5 acc 85.156 (86.480)	lr 0.00041
Train [111][580/3239]	Time 0.235 (0.576)	Data Time 0.001 (0.064)	Loss 2.4326 (2.3418)	Entropy 0.52926 (0.52948)	Top-1 acc 64.453 (67.753)	Top-5 acc 84.375 (86.461)	lr 0.00041
Train [111][590/3239]	Time 0.231 (0.573)	Data Time 0.001 (0.063)	Loss 2.3694 (2.3419)	Entropy 0.52892 (0.52948)	Top-1 acc 67.969 (67.739)	Top-5 acc 83.984 (86.458)	lr 0.00041
Train [111][600/3239]	Time 0.225 (0.570)	Data Time 0.001 (0.062)	Loss 2.2904 (2.3423)	Entropy 0.52907 (0.52947)	Top-1 acc 69.922 (67.725)	Top-5 acc 86.719 (86.443)	lr 0.00041
Train [111][610/3239]	Time 0.226 (0.568)	Data Time 0.001 (0.061)	Loss 2.2882 (2.3417)	Entropy 0.52872 (0.52946)	Top-1 acc 69.141 (67.742)	Top-5 acc 85.938 (86.450)	lr 0.00041
Train [111][620/3239]	Time 0.226 (0.565)	Data Time 0.001 (0.060)	Loss 2.4884 (2.3423)	Entropy 0.52838 (0.52945)	Top-1 acc 65.625 (67.733)	Top-5 acc 84.766 (86.444)	lr 0.00041
Train [111][630/3239]	Time 0.230 (0.563)	Data Time 0.001 (0.059)	Loss 2.1809 (2.3413)	Entropy 0.52835 (0.52943)	Top-1 acc 66.797 (67.750)	Top-5 acc 88.281 (86.454)	lr 0.00041
Train [111][640/3239]	Time 0.216 (0.560)	Data Time 0.001 (0.059)	Loss 2.4096 (2.3404)	Entropy 0.52840 (0.52941)	Top-1 acc 65.625 (67.767)	Top-5 acc 85.547 (86.471)	lr 0.00041
Train [111][650/3239]	Time 0.246 (0.558)	Data Time 0.001 (0.058)	Loss 2.2735 (2.3406)	Entropy 0.52881 (0.52940)	Top-1 acc 67.969 (67.762)	Top-5 acc 87.891 (86.465)	lr 0.00041
Train [111][660/3239]	Time 0.257 (0.555)	Data Time 0.002 (0.057)	Loss 2.2989 (2.3410)	Entropy 0.52880 (0.52939)	Top-1 acc 67.969 (67.750)	Top-5 acc 87.500 (86.465)	lr 0.00041
Train [111][670/3239]	Time 0.233 (0.553)	Data Time 0.001 (0.056)	Loss 2.3982 (2.3405)	Entropy 0.52857 (0.52938)	Top-1 acc 67.969 (67.762)	Top-5 acc 87.109 (86.469)	lr 0.00041
Train [111][680/3239]	Time 0.225 (0.552)	Data Time 0.001 (0.055)	Loss 2.4440 (2.3404)	Entropy 0.52858 (0.52937)	Top-1 acc 64.844 (67.770)	Top-5 acc 86.328 (86.478)	lr 0.00041
Train [111][690/3239]	Time 0.216 (0.550)	Data Time 0.001 (0.054)	Loss 2.5343 (2.3412)	Entropy 0.52815 (0.52935)	Top-1 acc 60.938 (67.752)	Top-5 acc 85.547 (86.468)	lr 0.00041
Train [111][700/3239]	Time 0.364 (0.548)	Data Time 0.001 (0.054)	Loss 2.3235 (2.3416)	Entropy 0.52792 (0.52934)	Top-1 acc 68.359 (67.747)	Top-5 acc 87.109 (86.456)	lr 0.00041
Train [111][710/3239]	Time 0.227 (0.546)	Data Time 0.001 (0.053)	Loss 2.3904 (2.3421)	Entropy 0.52793 (0.52932)	Top-1 acc 65.625 (67.734)	Top-5 acc 87.891 (86.446)	lr 0.00041
Train [111][720/3239]	Time 0.230 (0.544)	Data Time 0.001 (0.052)	Loss 2.3879 (2.3413)	Entropy 0.52783 (0.52930)	Top-1 acc 70.703 (67.742)	Top-5 acc 85.156 (86.466)	lr 0.00041
Train [111][730/3239]	Time 0.234 (0.542)	Data Time 0.001 (0.052)	Loss 2.2872 (2.3413)	Entropy 0.52735 (0.52928)	Top-1 acc 68.359 (67.742)	Top-5 acc 88.281 (86.470)	lr 0.00041
Train [111][740/3239]	Time 0.251 (0.541)	Data Time 0.001 (0.051)	Loss 2.3569 (2.3411)	Entropy 0.52735 (0.52925)	Top-1 acc 67.578 (67.753)	Top-5 acc 85.938 (86.469)	lr 0.00041
Train [111][750/3239]	Time 0.280 (0.540)	Data Time 0.001 (0.050)	Loss 2.3292 (2.3410)	Entropy 0.52697 (0.52922)	Top-1 acc 67.969 (67.750)	Top-5 acc 85.156 (86.476)	lr 0.00041
Train [111][760/3239]	Time 0.296 (0.539)	Data Time 0.002 (0.050)	Loss 2.3563 (2.3407)	Entropy 0.52706 (0.52919)	Top-1 acc 66.016 (67.759)	Top-5 acc 85.547 (86.473)	lr 0.00041
Train [111][770/3239]	Time 0.326 (0.538)	Data Time 0.001 (0.049)	Loss 2.3285 (2.3417)	Entropy 0.52723 (0.52917)	Top-1 acc 69.141 (67.734)	Top-5 acc 85.938 (86.461)	lr 0.00041
Train [111][780/3239]	Time 0.265 (0.536)	Data Time 0.001 (0.048)	Loss 2.3696 (2.3424)	Entropy 0.52700 (0.52914)	Top-1 acc 71.484 (67.719)	Top-5 acc 85.547 (86.448)	lr 0.00041
Train [111][790/3239]	Time 0.228 (0.534)	Data Time 0.001 (0.048)	Loss 2.6170 (2.3424)	Entropy 0.52731 (0.52912)	Top-1 acc 58.984 (67.712)	Top-5 acc 82.812 (86.453)	lr 0.00041
Train [111][800/3239]	Time 0.228 (0.533)	Data Time 0.001 (0.047)	Loss 2.5174 (2.3430)	Entropy 0.52727 (0.52909)	Top-1 acc 63.672 (67.689)	Top-5 acc 84.375 (86.436)	lr 0.00041
Train [111][810/3239]	Time 0.271 (0.531)	Data Time 0.001 (0.047)	Loss 2.7828 (2.3434)	Entropy 0.52715 (0.52907)	Top-1 acc 57.422 (67.663)	Top-5 acc 78.906 (86.423)	lr 0.00041
Train [111][820/3239]	Time 0.266 (0.530)	Data Time 0.003 (0.046)	Loss 2.2567 (2.3433)	Entropy 0.52751 (0.52905)	Top-1 acc 69.922 (67.657)	Top-5 acc 88.281 (86.423)	lr 0.00040
Train [111][830/3239]	Time 0.233 (0.529)	Data Time 0.001 (0.046)	Loss 2.4649 (2.3434)	Entropy 0.52760 (0.52903)	Top-1 acc 65.625 (67.658)	Top-5 acc 83.984 (86.421)	lr 0.00040
Train [111][840/3239]	Time 0.273 (0.528)	Data Time 0.002 (0.045)	Loss 2.4471 (2.3439)	Entropy 0.52757 (0.52901)	Top-1 acc 66.797 (67.635)	Top-5 acc 83.594 (86.415)	lr 0.00040
Train [111][850/3239]	Time 0.266 (0.527)	Data Time 0.002 (0.044)	Loss 2.2822 (2.3441)	Entropy 0.52758 (0.52900)	Top-1 acc 66.797 (67.631)	Top-5 acc 87.891 (86.416)	lr 0.00040
Train [111][860/3239]	Time 0.383 (0.526)	Data Time 0.001 (0.044)	Loss 2.2971 (2.3438)	Entropy 0.52771 (0.52898)	Top-1 acc 69.141 (67.632)	Top-5 acc 87.500 (86.424)	lr 0.00040
Train [111][870/3239]	Time 0.249 (0.525)	Data Time 0.001 (0.044)	Loss 2.3863 (2.3447)	Entropy 0.52817 (0.52897)	Top-1 acc 67.188 (67.613)	Top-5 acc 84.766 (86.408)	lr 0.00040
Train [111][880/3239]	Time 0.239 (0.524)	Data Time 0.001 (0.043)	Loss 2.2351 (2.3446)	Entropy 0.52827 (0.52896)	Top-1 acc 72.266 (67.624)	Top-5 acc 89.062 (86.413)	lr 0.00040
Train [111][890/3239]	Time 0.238 (0.522)	Data Time 0.001 (0.043)	Loss 2.3258 (2.3451)	Entropy 0.52835 (0.52895)	Top-1 acc 70.312 (67.612)	Top-5 acc 87.891 (86.401)	lr 0.00040
Train [111][900/3239]	Time 0.229 (0.521)	Data Time 0.001 (0.042)	Loss 2.3498 (2.3449)	Entropy 0.52828 (0.52895)	Top-1 acc 67.969 (67.621)	Top-5 acc 85.156 (86.405)	lr 0.00040
Train [111][910/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.042)	Loss 2.1015 (2.3454)	Entropy 0.52855 (0.52894)	Top-1 acc 75.781 (67.612)	Top-5 acc 92.969 (86.411)	lr 0.00040
Train [111][920/3239]	Time 0.229 (0.518)	Data Time 0.001 (0.041)	Loss 2.3182 (2.3460)	Entropy 0.52860 (0.52893)	Top-1 acc 69.141 (67.599)	Top-5 acc 85.156 (86.407)	lr 0.00040
Train [111][930/3239]	Time 0.302 (0.517)	Data Time 0.001 (0.041)	Loss 2.4303 (2.3455)	Entropy 0.52818 (0.52893)	Top-1 acc 67.969 (67.615)	Top-5 acc 86.328 (86.424)	lr 0.00040
Train [111][940/3239]	Time 0.233 (0.516)	Data Time 0.001 (0.040)	Loss 2.7324 (2.3458)	Entropy 0.52814 (0.52892)	Top-1 acc 58.594 (67.608)	Top-5 acc 81.250 (86.416)	lr 0.00040
Train [111][950/3239]	Time 0.228 (0.515)	Data Time 0.001 (0.040)	Loss 2.5004 (2.3462)	Entropy 0.52841 (0.52891)	Top-1 acc 60.156 (67.590)	Top-5 acc 83.594 (86.407)	lr 0.00040
Train [111][960/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.040)	Loss 2.6555 (2.3465)	Entropy 0.52839 (0.52891)	Top-1 acc 60.547 (67.581)	Top-5 acc 82.812 (86.394)	lr 0.00040
Train [111][970/3239]	Time 0.261 (0.512)	Data Time 0.002 (0.039)	Loss 2.4700 (2.3465)	Entropy 0.52800 (0.52890)	Top-1 acc 66.406 (67.585)	Top-5 acc 85.938 (86.396)	lr 0.00040
Train [111][980/3239]	Time 0.226 (0.512)	Data Time 0.001 (0.039)	Loss 2.1621 (2.3463)	Entropy 0.52813 (0.52889)	Top-1 acc 72.656 (67.586)	Top-5 acc 88.672 (86.401)	lr 0.00040
Train [111][990/3239]	Time 0.228 (0.511)	Data Time 0.001 (0.039)	Loss 2.3241 (2.3464)	Entropy 0.52784 (0.52888)	Top-1 acc 67.578 (67.577)	Top-5 acc 87.500 (86.405)	lr 0.00040
Train [111][1000/3239]	Time 0.275 (0.510)	Data Time 0.002 (0.038)	Loss 2.1536 (2.3461)	Entropy 0.52783 (0.52887)	Top-1 acc 71.094 (67.588)	Top-5 acc 88.672 (86.409)	lr 0.00040
Train [111][1010/3239]	Time 0.278 (0.510)	Data Time 0.002 (0.038)	Loss 2.2133 (2.3459)	Entropy 0.52802 (0.52886)	Top-1 acc 68.750 (67.593)	Top-5 acc 89.453 (86.416)	lr 0.00040
Train [111][1020/3239]	Time 0.312 (0.509)	Data Time 0.001 (0.037)	Loss 2.2775 (2.3461)	Entropy 0.52839 (0.52886)	Top-1 acc 68.750 (67.588)	Top-5 acc 87.500 (86.408)	lr 0.00040
Train [111][1030/3239]	Time 0.222 (0.508)	Data Time 0.001 (0.037)	Loss 2.5904 (2.3465)	Entropy 0.52767 (0.52885)	Top-1 acc 63.281 (67.575)	Top-5 acc 82.812 (86.402)	lr 0.00040
Train [111][1040/3239]	Time 0.233 (0.507)	Data Time 0.001 (0.037)	Loss 2.3386 (2.3468)	Entropy 0.52747 (0.52884)	Top-1 acc 65.625 (67.571)	Top-5 acc 86.719 (86.402)	lr 0.00040
Train [111][1050/3239]	Time 0.229 (0.506)	Data Time 0.001 (0.036)	Loss 2.2559 (2.3466)	Entropy 0.52746 (0.52883)	Top-1 acc 70.703 (67.574)	Top-5 acc 88.281 (86.407)	lr 0.00040
Train [111][1060/3239]	Time 0.219 (0.505)	Data Time 0.001 (0.036)	Loss 2.3598 (2.3463)	Entropy 0.52782 (0.52881)	Top-1 acc 65.625 (67.570)	Top-5 acc 85.938 (86.409)	lr 0.00040
Train [111][1070/3239]	Time 0.224 (0.504)	Data Time 0.001 (0.036)	Loss 2.2758 (2.3463)	Entropy 0.52771 (0.52880)	Top-1 acc 70.703 (67.576)	Top-5 acc 86.719 (86.406)	lr 0.00040
Train [111][1080/3239]	Time 0.229 (0.503)	Data Time 0.001 (0.035)	Loss 2.2337 (2.3461)	Entropy 0.52723 (0.52879)	Top-1 acc 73.828 (67.589)	Top-5 acc 88.281 (86.405)	lr 0.00040
Train [111][1090/3239]	Time 0.311 (0.502)	Data Time 0.001 (0.035)	Loss 2.2729 (2.3457)	Entropy 0.52729 (0.52878)	Top-1 acc 67.969 (67.599)	Top-5 acc 88.672 (86.414)	lr 0.00040
Train [111][1100/3239]	Time 0.235 (0.501)	Data Time 0.001 (0.035)	Loss 2.2597 (2.3456)	Entropy 0.52733 (0.52876)	Top-1 acc 68.750 (67.608)	Top-5 acc 87.500 (86.421)	lr 0.00040
Train [111][1110/3239]	Time 0.226 (0.500)	Data Time 0.001 (0.035)	Loss 2.5972 (2.3458)	Entropy 0.52756 (0.52875)	Top-1 acc 62.109 (67.606)	Top-5 acc 82.812 (86.420)	lr 0.00040
Train [111][1120/3239]	Time 0.233 (0.500)	Data Time 0.001 (0.034)	Loss 2.3977 (2.3458)	Entropy 0.52751 (0.52874)	Top-1 acc 64.453 (67.603)	Top-5 acc 85.938 (86.426)	lr 0.00040
Train [111][1130/3239]	Time 0.232 (0.499)	Data Time 0.001 (0.034)	Loss 2.3344 (2.3459)	Entropy 0.52773 (0.52873)	Top-1 acc 66.406 (67.605)	Top-5 acc 86.719 (86.427)	lr 0.00040
Train [111][1140/3239]	Time 0.231 (0.498)	Data Time 0.001 (0.034)	Loss 2.2751 (2.3457)	Entropy 0.52781 (0.52872)	Top-1 acc 69.141 (67.602)	Top-5 acc 86.719 (86.439)	lr 0.00040
Train [111][1150/3239]	Time 0.238 (0.497)	Data Time 0.001 (0.033)	Loss 2.4420 (2.3460)	Entropy 0.52790 (0.52872)	Top-1 acc 65.625 (67.601)	Top-5 acc 85.938 (86.433)	lr 0.00040
Train [111][1160/3239]	Time 0.317 (0.496)	Data Time 0.001 (0.033)	Loss 2.3559 (2.3458)	Entropy 0.52789 (0.52871)	Top-1 acc 69.141 (67.603)	Top-5 acc 86.328 (86.428)	lr 0.00040
Train [111][1170/3239]	Time 0.260 (0.495)	Data Time 0.001 (0.033)	Loss 2.2821 (2.3461)	Entropy 0.52744 (0.52870)	Top-1 acc 67.969 (67.603)	Top-5 acc 88.281 (86.417)	lr 0.00040
Train [111][1180/3239]	Time 0.252 (0.495)	Data Time 0.001 (0.033)	Loss 2.3778 (2.3467)	Entropy 0.52746 (0.52869)	Top-1 acc 66.016 (67.584)	Top-5 acc 86.328 (86.403)	lr 0.00040
Train [111][1190/3239]	Time 0.236 (0.494)	Data Time 0.001 (0.032)	Loss 2.1999 (2.3461)	Entropy 0.52748 (0.52868)	Top-1 acc 71.094 (67.598)	Top-5 acc 90.234 (86.412)	lr 0.00040
Train [111][1200/3239]	Time 0.382 (0.537)	Data Time 0.005 (0.032)	Loss 2.1435 (2.3457)	Entropy 0.52761 (0.52867)	Top-1 acc 71.875 (67.612)	Top-5 acc 92.969 (86.420)	lr 0.00040
Train [111][1210/3239]	Time 0.222 (0.536)	Data Time 0.002 (0.032)	Loss 2.3505 (2.3451)	Entropy 0.52768 (0.52866)	Top-1 acc 69.922 (67.628)	Top-5 acc 85.938 (86.428)	lr 0.00039
Train [111][1220/3239]	Time 0.234 (0.535)	Data Time 0.002 (0.032)	Loss 2.4027 (2.3462)	Entropy 0.52778 (0.52865)	Top-1 acc 63.672 (67.604)	Top-5 acc 85.547 (86.410)	lr 0.00039
Train [111][1230/3239]	Time 0.273 (0.534)	Data Time 0.001 (0.031)	Loss 2.2887 (2.3461)	Entropy 0.52763 (0.52864)	Top-1 acc 67.188 (67.600)	Top-5 acc 85.938 (86.408)	lr 0.00039
Train [111][1240/3239]	Time 0.222 (0.533)	Data Time 0.001 (0.031)	Loss 2.6865 (2.3464)	Entropy 0.52756 (0.52863)	Top-1 acc 61.719 (67.595)	Top-5 acc 79.688 (86.407)	lr 0.00039
Train [111][1250/3239]	Time 0.328 (0.532)	Data Time 0.001 (0.031)	Loss 2.3428 (2.3464)	Entropy 0.52715 (0.52862)	Top-1 acc 70.312 (67.598)	Top-5 acc 83.984 (86.406)	lr 0.00039
Train [111][1260/3239]	Time 0.231 (0.531)	Data Time 0.001 (0.031)	Loss 2.4066 (2.3468)	Entropy 0.52721 (0.52861)	Top-1 acc 64.844 (67.590)	Top-5 acc 85.938 (86.400)	lr 0.00039
Train [111][1270/3239]	Time 0.229 (0.530)	Data Time 0.001 (0.030)	Loss 2.2266 (2.3465)	Entropy 0.52716 (0.52860)	Top-1 acc 73.438 (67.588)	Top-5 acc 86.719 (86.404)	lr 0.00039
Train [111][1280/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.030)	Loss 2.2035 (2.3462)	Entropy 0.52717 (0.52859)	Top-1 acc 70.703 (67.595)	Top-5 acc 87.500 (86.406)	lr 0.00039
Train [111][1290/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.030)	Loss 2.2122 (2.3461)	Entropy 0.52718 (0.52858)	Top-1 acc 71.094 (67.597)	Top-5 acc 88.672 (86.403)	lr 0.00039
Train [111][1300/3239]	Time 0.234 (0.528)	Data Time 0.001 (0.030)	Loss 2.3560 (2.3463)	Entropy 0.52740 (0.52857)	Top-1 acc 67.969 (67.585)	Top-5 acc 86.328 (86.397)	lr 0.00039
Train [111][1310/3239]	Time 0.226 (0.527)	Data Time 0.001 (0.030)	Loss 2.2391 (2.3457)	Entropy 0.52714 (0.52856)	Top-1 acc 70.703 (67.610)	Top-5 acc 89.062 (86.408)	lr 0.00039
Train [111][1320/3239]	Time 0.327 (0.526)	Data Time 0.001 (0.029)	Loss 2.3556 (2.3461)	Entropy 0.52724 (0.52855)	Top-1 acc 67.578 (67.601)	Top-5 acc 84.766 (86.396)	lr 0.00039
Train [111][1330/3239]	Time 0.221 (0.525)	Data Time 0.001 (0.029)	Loss 2.3421 (2.3459)	Entropy 0.52722 (0.52854)	Top-1 acc 66.797 (67.603)	Top-5 acc 86.328 (86.402)	lr 0.00039
Train [111][1340/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.029)	Loss 2.1547 (2.3456)	Entropy 0.52722 (0.52853)	Top-1 acc 73.047 (67.606)	Top-5 acc 91.016 (86.410)	lr 0.00039
Train [111][1350/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.029)	Loss 2.3389 (2.3452)	Entropy 0.52724 (0.52852)	Top-1 acc 69.922 (67.618)	Top-5 acc 86.719 (86.413)	lr 0.00039
Train [111][1360/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.029)	Loss 2.1986 (2.3457)	Entropy 0.52730 (0.52851)	Top-1 acc 72.266 (67.606)	Top-5 acc 90.234 (86.406)	lr 0.00039
Train [111][1370/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.028)	Loss 2.1580 (2.3450)	Entropy 0.52743 (0.52850)	Top-1 acc 70.703 (67.619)	Top-5 acc 88.281 (86.415)	lr 0.00039
Train [111][1380/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.028)	Loss 2.2658 (2.3445)	Entropy 0.52721 (0.52849)	Top-1 acc 71.484 (67.628)	Top-5 acc 87.500 (86.421)	lr 0.00039
Train [111][1390/3239]	Time 0.263 (0.521)	Data Time 0.001 (0.028)	Loss 2.2487 (2.3441)	Entropy 0.52752 (0.52848)	Top-1 acc 72.266 (67.636)	Top-5 acc 86.328 (86.428)	lr 0.00039
Train [111][1400/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.028)	Loss 2.3018 (2.3443)	Entropy 0.52758 (0.52848)	Top-1 acc 67.578 (67.629)	Top-5 acc 87.500 (86.429)	lr 0.00039
Train [111][1410/3239]	Time 0.346 (0.520)	Data Time 0.002 (0.028)	Loss 2.2427 (2.3445)	Entropy 0.52748 (0.52847)	Top-1 acc 69.922 (67.627)	Top-5 acc 89.062 (86.432)	lr 0.00039
Train [111][1420/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.027)	Loss 2.3922 (2.3448)	Entropy 0.52734 (0.52846)	Top-1 acc 64.453 (67.623)	Top-5 acc 85.938 (86.425)	lr 0.00039
Train [111][1430/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.027)	Loss 2.3367 (2.3452)	Entropy 0.52765 (0.52846)	Top-1 acc 71.094 (67.620)	Top-5 acc 86.719 (86.417)	lr 0.00039
Train [111][1440/3239]	Time 0.248 (0.517)	Data Time 0.001 (0.027)	Loss 2.2688 (2.3450)	Entropy 0.52750 (0.52845)	Top-1 acc 71.484 (67.624)	Top-5 acc 86.719 (86.415)	lr 0.00039
Train [111][1450/3239]	Time 0.227 (0.517)	Data Time 0.001 (0.027)	Loss 2.3341 (2.3453)	Entropy 0.52772 (0.52844)	Top-1 acc 66.797 (67.610)	Top-5 acc 86.719 (86.409)	lr 0.00039
Train [111][1460/3239]	Time 0.269 (0.516)	Data Time 0.001 (0.027)	Loss 2.3028 (2.3456)	Entropy 0.52792 (0.52844)	Top-1 acc 66.406 (67.605)	Top-5 acc 87.500 (86.400)	lr 0.00039
Train [111][1470/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.026)	Loss 2.6038 (2.3458)	Entropy 0.52772 (0.52844)	Top-1 acc 64.844 (67.609)	Top-5 acc 83.984 (86.396)	lr 0.00039
Train [111][1480/3239]	Time 0.385 (0.515)	Data Time 0.002 (0.026)	Loss 2.4522 (2.3458)	Entropy 0.52732 (0.52843)	Top-1 acc 64.844 (67.615)	Top-5 acc 84.766 (86.395)	lr 0.00039
Train [111][1490/3239]	Time 0.220 (0.514)	Data Time 0.001 (0.026)	Loss 2.3483 (2.3458)	Entropy 0.52744 (0.52842)	Top-1 acc 67.578 (67.614)	Top-5 acc 86.328 (86.396)	lr 0.00039
Train [111][1500/3239]	Time 0.239 (0.514)	Data Time 0.001 (0.026)	Loss 2.1397 (2.3456)	Entropy 0.52757 (0.52842)	Top-1 acc 74.219 (67.621)	Top-5 acc 88.672 (86.397)	lr 0.00039
Train [111][1510/3239]	Time 0.223 (0.513)	Data Time 0.001 (0.026)	Loss 2.2780 (2.3460)	Entropy 0.52735 (0.52841)	Top-1 acc 68.750 (67.606)	Top-5 acc 88.281 (86.395)	lr 0.00039
Train [111][1520/3239]	Time 0.225 (0.512)	Data Time 0.001 (0.026)	Loss 2.3028 (2.3461)	Entropy 0.52738 (0.52840)	Top-1 acc 66.016 (67.602)	Top-5 acc 89.453 (86.392)	lr 0.00039
Train [111][1530/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.025)	Loss 2.3218 (2.3460)	Entropy 0.52746 (0.52840)	Top-1 acc 68.750 (67.606)	Top-5 acc 84.766 (86.391)	lr 0.00039
Train [111][1540/3239]	Time 0.222 (0.511)	Data Time 0.001 (0.025)	Loss 2.2718 (2.3459)	Entropy 0.52729 (0.52839)	Top-1 acc 64.062 (67.599)	Top-5 acc 88.672 (86.397)	lr 0.00039
Train [111][1550/3239]	Time 0.259 (0.511)	Data Time 0.001 (0.025)	Loss 2.3309 (2.3457)	Entropy 0.52745 (0.52839)	Top-1 acc 64.844 (67.606)	Top-5 acc 86.719 (86.394)	lr 0.00039
Train [111][1560/3239]	Time 0.255 (0.510)	Data Time 0.001 (0.025)	Loss 2.2928 (2.3461)	Entropy 0.52697 (0.52838)	Top-1 acc 67.188 (67.600)	Top-5 acc 88.281 (86.385)	lr 0.00039
Train [111][1570/3239]	Time 0.365 (0.509)	Data Time 0.001 (0.025)	Loss 2.5760 (2.3466)	Entropy 0.52697 (0.52837)	Top-1 acc 63.281 (67.596)	Top-5 acc 83.984 (86.378)	lr 0.00039
Train [111][1580/3239]	Time 0.224 (0.509)	Data Time 0.001 (0.025)	Loss 2.3224 (2.3466)	Entropy 0.52705 (0.52836)	Top-1 acc 66.406 (67.596)	Top-5 acc 87.500 (86.380)	lr 0.00039
Train [111][1590/3239]	Time 0.224 (0.508)	Data Time 0.001 (0.025)	Loss 2.4455 (2.3466)	Entropy 0.52689 (0.52835)	Top-1 acc 64.062 (67.599)	Top-5 acc 85.547 (86.379)	lr 0.00039
Train [111][1600/3239]	Time 0.224 (0.507)	Data Time 0.001 (0.024)	Loss 2.3738 (2.3467)	Entropy 0.52641 (0.52834)	Top-1 acc 67.188 (67.597)	Top-5 acc 85.938 (86.374)	lr 0.00039
Train [111][1610/3239]	Time 0.233 (0.507)	Data Time 0.001 (0.024)	Loss 2.2805 (2.3467)	Entropy 0.52631 (0.52833)	Top-1 acc 70.312 (67.594)	Top-5 acc 85.547 (86.374)	lr 0.00038
Train [111][1620/3239]	Time 0.233 (0.506)	Data Time 0.001 (0.024)	Loss 2.3000 (2.3465)	Entropy 0.52576 (0.52831)	Top-1 acc 70.703 (67.603)	Top-5 acc 86.719 (86.376)	lr 0.00038
Train [111][1630/3239]	Time 0.250 (0.505)	Data Time 0.001 (0.024)	Loss 2.6059 (2.3473)	Entropy 0.52590 (0.52830)	Top-1 acc 62.109 (67.584)	Top-5 acc 81.641 (86.369)	lr 0.00038
Train [111][1640/3239]	Time 0.327 (0.505)	Data Time 0.001 (0.024)	Loss 2.4459 (2.3475)	Entropy 0.52605 (0.52829)	Top-1 acc 69.141 (67.580)	Top-5 acc 85.547 (86.367)	lr 0.00038
Train [111][1650/3239]	Time 0.232 (0.504)	Data Time 0.001 (0.024)	Loss 2.1644 (2.3474)	Entropy 0.52564 (0.52827)	Top-1 acc 71.875 (67.588)	Top-5 acc 89.453 (86.370)	lr 0.00038
Train [111][1660/3239]	Time 0.234 (0.504)	Data Time 0.001 (0.024)	Loss 2.3022 (2.3476)	Entropy 0.52568 (0.52826)	Top-1 acc 71.484 (67.588)	Top-5 acc 88.281 (86.366)	lr 0.00038
Train [111][1670/3239]	Time 0.276 (0.503)	Data Time 0.001 (0.023)	Loss 2.2964 (2.3478)	Entropy 0.52585 (0.52824)	Top-1 acc 65.625 (67.584)	Top-5 acc 86.328 (86.359)	lr 0.00038
Train [111][1680/3239]	Time 0.241 (0.503)	Data Time 0.001 (0.023)	Loss 2.5850 (2.3486)	Entropy 0.52560 (0.52823)	Top-1 acc 61.719 (67.563)	Top-5 acc 81.250 (86.344)	lr 0.00038
Train [111][1690/3239]	Time 0.234 (0.502)	Data Time 0.001 (0.023)	Loss 2.3762 (2.3486)	Entropy 0.52554 (0.52821)	Top-1 acc 62.891 (67.558)	Top-5 acc 85.938 (86.341)	lr 0.00038
Train [111][1700/3239]	Time 0.268 (0.502)	Data Time 0.001 (0.023)	Loss 2.4813 (2.3488)	Entropy 0.52536 (0.52819)	Top-1 acc 64.453 (67.551)	Top-5 acc 86.328 (86.341)	lr 0.00038
Train [111][1710/3239]	Time 0.241 (0.501)	Data Time 0.001 (0.023)	Loss 2.2346 (2.3483)	Entropy 0.52577 (0.52818)	Top-1 acc 69.141 (67.565)	Top-5 acc 88.672 (86.347)	lr 0.00038
Train [111][1720/3239]	Time 0.234 (0.501)	Data Time 0.001 (0.023)	Loss 2.3003 (2.3485)	Entropy 0.52600 (0.52817)	Top-1 acc 71.875 (67.563)	Top-5 acc 86.719 (86.346)	lr 0.00038
Train [111][1730/3239]	Time 0.232 (0.500)	Data Time 0.001 (0.023)	Loss 2.5696 (2.3484)	Entropy 0.52629 (0.52815)	Top-1 acc 60.156 (67.563)	Top-5 acc 82.812 (86.342)	lr 0.00038
Train [111][1740/3239]	Time 0.229 (0.500)	Data Time 0.001 (0.023)	Loss 2.2176 (2.3486)	Entropy 0.52648 (0.52814)	Top-1 acc 68.359 (67.557)	Top-5 acc 88.281 (86.338)	lr 0.00038
Train [111][1750/3239]	Time 0.274 (0.499)	Data Time 0.001 (0.022)	Loss 2.5032 (2.3487)	Entropy 0.52650 (0.52813)	Top-1 acc 62.500 (67.556)	Top-5 acc 82.812 (86.336)	lr 0.00038
Train [111][1760/3239]	Time 0.282 (0.499)	Data Time 0.002 (0.022)	Loss 2.1693 (2.3485)	Entropy 0.52686 (0.52813)	Top-1 acc 73.438 (67.560)	Top-5 acc 89.453 (86.339)	lr 0.00038
Train [111][1770/3239]	Time 0.224 (0.498)	Data Time 0.001 (0.022)	Loss 2.4853 (2.3485)	Entropy 0.52677 (0.52812)	Top-1 acc 65.625 (67.561)	Top-5 acc 82.422 (86.333)	lr 0.00038
Train [111][1780/3239]	Time 0.225 (0.498)	Data Time 0.001 (0.022)	Loss 2.2407 (2.3486)	Entropy 0.52675 (0.52811)	Top-1 acc 69.922 (67.559)	Top-5 acc 90.234 (86.337)	lr 0.00038
Train [111][1790/3239]	Time 0.240 (0.497)	Data Time 0.001 (0.022)	Loss 2.1383 (2.3484)	Entropy 0.52637 (0.52810)	Top-1 acc 73.438 (67.564)	Top-5 acc 89.844 (86.336)	lr 0.00038
Train [111][1800/3239]	Time 0.355 (0.497)	Data Time 0.001 (0.022)	Loss 2.4275 (2.3484)	Entropy 0.52618 (0.52809)	Top-1 acc 61.328 (67.558)	Top-5 acc 85.938 (86.331)	lr 0.00038
Train [111][1810/3239]	Time 0.257 (0.497)	Data Time 0.001 (0.022)	Loss 2.3172 (2.3479)	Entropy 0.52599 (0.52808)	Top-1 acc 68.750 (67.569)	Top-5 acc 87.109 (86.341)	lr 0.00038
Train [111][1820/3239]	Time 0.244 (0.496)	Data Time 0.001 (0.022)	Loss 2.1561 (2.3478)	Entropy 0.52584 (0.52807)	Top-1 acc 73.047 (67.570)	Top-5 acc 89.453 (86.345)	lr 0.00038
Train [111][1830/3239]	Time 0.223 (0.496)	Data Time 0.001 (0.022)	Loss 2.3705 (2.3479)	Entropy 0.52598 (0.52806)	Top-1 acc 65.234 (67.565)	Top-5 acc 86.719 (86.341)	lr 0.00038
Train [111][1840/3239]	Time 0.236 (0.495)	Data Time 0.001 (0.021)	Loss 2.3986 (2.3477)	Entropy 0.52595 (0.52805)	Top-1 acc 64.844 (67.570)	Top-5 acc 85.547 (86.346)	lr 0.00038
Train [111][1850/3239]	Time 0.258 (0.495)	Data Time 0.001 (0.021)	Loss 2.4736 (2.3475)	Entropy 0.52601 (0.52804)	Top-1 acc 64.453 (67.573)	Top-5 acc 83.203 (86.349)	lr 0.00038
Train [111][1860/3239]	Time 0.322 (0.522)	Data Time 0.026 (0.021)	Loss 2.5277 (2.3477)	Entropy 0.52633 (0.52802)	Top-1 acc 63.281 (67.563)	Top-5 acc 83.203 (86.346)	lr 0.00038
Train [111][1870/3239]	Time 0.232 (0.522)	Data Time 0.002 (0.021)	Loss 2.3444 (2.3480)	Entropy 0.52643 (0.52802)	Top-1 acc 66.797 (67.557)	Top-5 acc 86.719 (86.343)	lr 0.00038
Train [111][1880/3239]	Time 0.240 (0.521)	Data Time 0.001 (0.021)	Loss 2.1737 (2.3478)	Entropy 0.52614 (0.52801)	Top-1 acc 73.438 (67.564)	Top-5 acc 89.062 (86.348)	lr 0.00038
Train [111][1890/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.021)	Loss 2.3195 (2.3475)	Entropy 0.52638 (0.52800)	Top-1 acc 68.359 (67.568)	Top-5 acc 87.500 (86.352)	lr 0.00038
Train [111][1900/3239]	Time 0.226 (0.520)	Data Time 0.001 (0.021)	Loss 2.4577 (2.3477)	Entropy 0.52648 (0.52799)	Top-1 acc 62.109 (67.561)	Top-5 acc 84.375 (86.350)	lr 0.00038
Train [111][1910/3239]	Time 0.228 (0.519)	Data Time 0.001 (0.021)	Loss 2.2700 (2.3477)	Entropy 0.52659 (0.52798)	Top-1 acc 71.484 (67.560)	Top-5 acc 87.500 (86.353)	lr 0.00038
Train [111][1920/3239]	Time 0.236 (0.519)	Data Time 0.001 (0.021)	Loss 2.2204 (2.3477)	Entropy 0.52656 (0.52797)	Top-1 acc 73.438 (67.562)	Top-5 acc 88.281 (86.352)	lr 0.00038
Train [111][1930/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.021)	Loss 2.3264 (2.3474)	Entropy 0.52707 (0.52797)	Top-1 acc 69.922 (67.569)	Top-5 acc 86.328 (86.357)	lr 0.00038
Train [111][1940/3239]	Time 0.245 (0.518)	Data Time 0.001 (0.020)	Loss 2.4177 (2.3474)	Entropy 0.52705 (0.52796)	Top-1 acc 66.406 (67.568)	Top-5 acc 86.328 (86.354)	lr 0.00038
Train [111][1950/3239]	Time 0.236 (0.517)	Data Time 0.001 (0.020)	Loss 2.2935 (2.3476)	Entropy 0.52688 (0.52796)	Top-1 acc 63.672 (67.563)	Top-5 acc 87.500 (86.353)	lr 0.00038
Train [111][1960/3239]	Time 0.332 (0.517)	Data Time 0.001 (0.020)	Loss 2.3768 (2.3477)	Entropy 0.52704 (0.52795)	Top-1 acc 67.578 (67.557)	Top-5 acc 83.984 (86.351)	lr 0.00038
Train [111][1970/3239]	Time 0.294 (0.516)	Data Time 0.001 (0.020)	Loss 2.2343 (2.3477)	Entropy 0.52716 (0.52795)	Top-1 acc 72.266 (67.558)	Top-5 acc 87.500 (86.349)	lr 0.00038
Train [111][1980/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.020)	Loss 2.2653 (2.3475)	Entropy 0.52721 (0.52794)	Top-1 acc 69.922 (67.559)	Top-5 acc 87.500 (86.349)	lr 0.00038
Train [111][1990/3239]	Time 0.275 (0.516)	Data Time 0.001 (0.020)	Loss 2.1975 (2.3473)	Entropy 0.52746 (0.52794)	Top-1 acc 73.828 (67.563)	Top-5 acc 87.500 (86.350)	lr 0.00038
Train [111][2000/3239]	Time 0.253 (0.515)	Data Time 0.001 (0.020)	Loss 2.0930 (2.3473)	Entropy 0.52727 (0.52794)	Top-1 acc 71.094 (67.561)	Top-5 acc 91.406 (86.348)	lr 0.00038
Train [111][2010/3239]	Time 0.254 (0.515)	Data Time 0.001 (0.020)	Loss 2.6039 (2.3476)	Entropy 0.52727 (0.52794)	Top-1 acc 66.406 (67.561)	Top-5 acc 81.641 (86.343)	lr 0.00037
Train [111][2020/3239]	Time 0.225 (0.514)	Data Time 0.001 (0.020)	Loss 2.3263 (2.3473)	Entropy 0.52750 (0.52793)	Top-1 acc 65.625 (67.567)	Top-5 acc 89.062 (86.348)	lr 0.00037
Train [111][2030/3239]	Time 0.322 (0.514)	Data Time 0.001 (0.020)	Loss 2.2797 (2.3471)	Entropy 0.52752 (0.52793)	Top-1 acc 69.922 (67.566)	Top-5 acc 87.891 (86.351)	lr 0.00037
Train [111][2040/3239]	Time 0.224 (0.513)	Data Time 0.001 (0.020)	Loss 2.3953 (2.3471)	Entropy 0.52781 (0.52793)	Top-1 acc 66.016 (67.565)	Top-5 acc 85.547 (86.352)	lr 0.00037
Train [111][2050/3239]	Time 0.232 (0.513)	Data Time 0.002 (0.019)	Loss 2.3215 (2.3475)	Entropy 0.52808 (0.52793)	Top-1 acc 66.406 (67.558)	Top-5 acc 88.672 (86.341)	lr 0.00037
Train [111][2060/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.019)	Loss 2.3559 (2.3479)	Entropy 0.52780 (0.52793)	Top-1 acc 69.531 (67.545)	Top-5 acc 84.375 (86.329)	lr 0.00037
Train [111][2070/3239]	Time 0.223 (0.512)	Data Time 0.001 (0.019)	Loss 2.1576 (2.3479)	Entropy 0.52799 (0.52793)	Top-1 acc 71.875 (67.545)	Top-5 acc 87.891 (86.329)	lr 0.00037
Train [111][2080/3239]	Time 0.228 (0.511)	Data Time 0.001 (0.019)	Loss 2.5629 (2.3481)	Entropy 0.52793 (0.52793)	Top-1 acc 64.453 (67.539)	Top-5 acc 82.422 (86.326)	lr 0.00037
Train [111][2090/3239]	Time 0.234 (0.511)	Data Time 0.001 (0.019)	Loss 2.4628 (2.3482)	Entropy 0.52809 (0.52793)	Top-1 acc 64.062 (67.536)	Top-5 acc 85.547 (86.322)	lr 0.00037
Train [111][2100/3239]	Time 0.291 (0.511)	Data Time 0.001 (0.019)	Loss 2.2670 (2.3482)	Entropy 0.52796 (0.52793)	Top-1 acc 67.188 (67.535)	Top-5 acc 89.453 (86.323)	lr 0.00037
Train [111][2110/3239]	Time 0.215 (0.510)	Data Time 0.001 (0.019)	Loss 3.0126 (2.3487)	Entropy 0.52810 (0.52793)	Top-1 acc 51.562 (67.521)	Top-5 acc 75.391 (86.315)	lr 0.00037
Train [111][2120/3239]	Time 0.365 (0.510)	Data Time 0.001 (0.019)	Loss 2.2900 (2.3486)	Entropy 0.52826 (0.52793)	Top-1 acc 68.359 (67.520)	Top-5 acc 88.281 (86.313)	lr 0.00037
Train [111][2130/3239]	Time 0.227 (0.509)	Data Time 0.001 (0.019)	Loss 2.4577 (2.3487)	Entropy 0.52827 (0.52793)	Top-1 acc 68.359 (67.519)	Top-5 acc 83.984 (86.311)	lr 0.00037
Train [111][2140/3239]	Time 0.234 (0.509)	Data Time 0.001 (0.019)	Loss 2.3136 (2.3485)	Entropy 0.52804 (0.52793)	Top-1 acc 69.922 (67.523)	Top-5 acc 86.719 (86.315)	lr 0.00037
Train [111][2150/3239]	Time 0.236 (0.508)	Data Time 0.001 (0.019)	Loss 2.2907 (2.3484)	Entropy 0.52805 (0.52793)	Top-1 acc 68.359 (67.531)	Top-5 acc 86.328 (86.313)	lr 0.00037
Train [111][2160/3239]	Time 0.234 (0.508)	Data Time 0.001 (0.019)	Loss 2.3579 (2.3487)	Entropy 0.52777 (0.52793)	Top-1 acc 67.188 (67.522)	Top-5 acc 85.547 (86.308)	lr 0.00037
Train [111][2170/3239]	Time 0.231 (0.507)	Data Time 0.001 (0.018)	Loss 2.2716 (2.3486)	Entropy 0.52777 (0.52793)	Top-1 acc 71.094 (67.524)	Top-5 acc 90.234 (86.310)	lr 0.00037
Train [111][2180/3239]	Time 0.227 (0.507)	Data Time 0.001 (0.018)	Loss 2.3408 (2.3484)	Entropy 0.52817 (0.52793)	Top-1 acc 68.750 (67.535)	Top-5 acc 85.547 (86.312)	lr 0.00037
Train [111][2190/3239]	Time 0.316 (0.507)	Data Time 0.001 (0.018)	Loss 2.3790 (2.3486)	Entropy 0.52795 (0.52793)	Top-1 acc 67.969 (67.533)	Top-5 acc 85.156 (86.305)	lr 0.00037
Train [111][2200/3239]	Time 0.219 (0.506)	Data Time 0.001 (0.018)	Loss 2.6580 (2.3490)	Entropy 0.52785 (0.52793)	Top-1 acc 62.109 (67.524)	Top-5 acc 79.297 (86.297)	lr 0.00037
Train [111][2210/3239]	Time 0.233 (0.506)	Data Time 0.001 (0.018)	Loss 2.3572 (2.3489)	Entropy 0.52775 (0.52793)	Top-1 acc 64.844 (67.526)	Top-5 acc 86.719 (86.298)	lr 0.00037
Train [111][2220/3239]	Time 0.219 (0.505)	Data Time 0.001 (0.018)	Loss 2.7042 (2.3492)	Entropy 0.52795 (0.52793)	Top-1 acc 60.547 (67.516)	Top-5 acc 78.516 (86.294)	lr 0.00037
Train [111][2230/3239]	Time 0.239 (0.505)	Data Time 0.002 (0.018)	Loss 2.2044 (2.3492)	Entropy 0.52798 (0.52793)	Top-1 acc 69.141 (67.515)	Top-5 acc 89.844 (86.293)	lr 0.00037
Train [111][2240/3239]	Time 0.237 (0.504)	Data Time 0.001 (0.018)	Loss 2.3315 (2.3496)	Entropy 0.52788 (0.52793)	Top-1 acc 67.969 (67.507)	Top-5 acc 85.156 (86.283)	lr 0.00037
Train [111][2250/3239]	Time 0.232 (0.504)	Data Time 0.001 (0.018)	Loss 2.3800 (2.3493)	Entropy 0.52751 (0.52793)	Top-1 acc 67.969 (67.514)	Top-5 acc 86.719 (86.287)	lr 0.00037
Train [111][2260/3239]	Time 0.271 (0.504)	Data Time 0.003 (0.018)	Loss 2.5504 (2.3493)	Entropy 0.52750 (0.52793)	Top-1 acc 64.844 (67.516)	Top-5 acc 83.984 (86.289)	lr 0.00037
Train [111][2270/3239]	Time 0.229 (0.503)	Data Time 0.001 (0.018)	Loss 2.5565 (2.3495)	Entropy 0.52729 (0.52793)	Top-1 acc 61.328 (67.511)	Top-5 acc 79.688 (86.286)	lr 0.00037
Train [111][2280/3239]	Time 0.251 (0.503)	Data Time 0.001 (0.018)	Loss 2.2806 (2.3491)	Entropy 0.52754 (0.52792)	Top-1 acc 70.312 (67.524)	Top-5 acc 87.500 (86.291)	lr 0.00037
Train [111][2290/3239]	Time 0.236 (0.502)	Data Time 0.001 (0.018)	Loss 2.5836 (2.3493)	Entropy 0.52769 (0.52792)	Top-1 acc 60.156 (67.519)	Top-5 acc 82.812 (86.287)	lr 0.00037
Train [111][2300/3239]	Time 0.239 (0.502)	Data Time 0.001 (0.018)	Loss 2.1771 (2.3495)	Entropy 0.52749 (0.52792)	Top-1 acc 71.484 (67.513)	Top-5 acc 91.406 (86.287)	lr 0.00037
Train [111][2310/3239]	Time 0.295 (0.502)	Data Time 0.001 (0.017)	Loss 2.3468 (2.3493)	Entropy 0.52766 (0.52792)	Top-1 acc 67.578 (67.514)	Top-5 acc 85.547 (86.288)	lr 0.00037
Train [111][2320/3239]	Time 0.233 (0.501)	Data Time 0.001 (0.017)	Loss 2.1114 (2.3491)	Entropy 0.52756 (0.52792)	Top-1 acc 74.219 (67.512)	Top-5 acc 89.844 (86.290)	lr 0.00037
Train [111][2330/3239]	Time 0.247 (0.501)	Data Time 0.001 (0.017)	Loss 2.3760 (2.3492)	Entropy 0.52776 (0.52792)	Top-1 acc 67.578 (67.515)	Top-5 acc 86.328 (86.290)	lr 0.00037
Train [111][2340/3239]	Time 0.232 (0.500)	Data Time 0.001 (0.017)	Loss 2.3449 (2.3492)	Entropy 0.52768 (0.52792)	Top-1 acc 66.797 (67.515)	Top-5 acc 85.547 (86.288)	lr 0.00037
Train [111][2350/3239]	Time 0.329 (0.500)	Data Time 0.001 (0.017)	Loss 2.3718 (2.3494)	Entropy 0.52780 (0.52792)	Top-1 acc 66.797 (67.508)	Top-5 acc 85.938 (86.284)	lr 0.00037
Train [111][2360/3239]	Time 0.233 (0.499)	Data Time 0.001 (0.017)	Loss 2.3703 (2.3496)	Entropy 0.52798 (0.52792)	Top-1 acc 66.016 (67.507)	Top-5 acc 84.375 (86.280)	lr 0.00037
Train [111][2370/3239]	Time 0.228 (0.499)	Data Time 0.001 (0.017)	Loss 2.2820 (2.3494)	Entropy 0.52826 (0.52792)	Top-1 acc 66.016 (67.510)	Top-5 acc 89.453 (86.280)	lr 0.00037
Train [111][2380/3239]	Time 0.234 (0.499)	Data Time 0.001 (0.017)	Loss 2.4779 (2.3494)	Entropy 0.52814 (0.52792)	Top-1 acc 67.188 (67.514)	Top-5 acc 85.547 (86.283)	lr 0.00037
Train [111][2390/3239]	Time 0.242 (0.498)	Data Time 0.001 (0.017)	Loss 2.1509 (2.3496)	Entropy 0.52788 (0.52792)	Top-1 acc 70.703 (67.505)	Top-5 acc 90.625 (86.280)	lr 0.00037
Train [111][2400/3239]	Time 0.224 (0.498)	Data Time 0.001 (0.017)	Loss 2.3744 (2.3500)	Entropy 0.52795 (0.52792)	Top-1 acc 67.578 (67.491)	Top-5 acc 86.719 (86.275)	lr 0.00037
Train [111][2410/3239]	Time 0.229 (0.498)	Data Time 0.001 (0.017)	Loss 2.1473 (2.3498)	Entropy 0.52793 (0.52792)	Top-1 acc 74.219 (67.494)	Top-5 acc 89.844 (86.279)	lr 0.00037
Train [111][2420/3239]	Time 0.342 (0.497)	Data Time 0.001 (0.017)	Loss 2.4570 (2.3496)	Entropy 0.52774 (0.52792)	Top-1 acc 63.672 (67.496)	Top-5 acc 84.375 (86.284)	lr 0.00036
Train [111][2430/3239]	Time 0.328 (0.497)	Data Time 0.002 (0.017)	Loss 2.3688 (2.3494)	Entropy 0.52741 (0.52792)	Top-1 acc 64.844 (67.497)	Top-5 acc 84.375 (86.287)	lr 0.00036
Train [111][2440/3239]	Time 0.225 (0.497)	Data Time 0.001 (0.017)	Loss 2.1662 (2.3496)	Entropy 0.52721 (0.52791)	Top-1 acc 73.438 (67.490)	Top-5 acc 88.281 (86.282)	lr 0.00036
Train [111][2450/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.017)	Loss 2.1749 (2.3495)	Entropy 0.52746 (0.52791)	Top-1 acc 69.141 (67.485)	Top-5 acc 88.281 (86.284)	lr 0.00036
Train [111][2460/3239]	Time 0.228 (0.497)	Data Time 0.001 (0.016)	Loss 2.3178 (2.3492)	Entropy 0.52775 (0.52791)	Top-1 acc 64.844 (67.489)	Top-5 acc 85.938 (86.288)	lr 0.00036
Train [111][2470/3239]	Time 0.227 (0.496)	Data Time 0.001 (0.016)	Loss 2.4075 (2.3493)	Entropy 0.52821 (0.52791)	Top-1 acc 66.016 (67.489)	Top-5 acc 87.109 (86.286)	lr 0.00036
Train [111][2480/3239]	Time 0.228 (0.496)	Data Time 0.001 (0.016)	Loss 2.5445 (2.3492)	Entropy 0.52813 (0.52791)	Top-1 acc 64.844 (67.487)	Top-5 acc 84.375 (86.289)	lr 0.00036
Train [111][2490/3239]	Time 0.245 (0.496)	Data Time 0.001 (0.016)	Loss 2.3771 (2.3492)	Entropy 0.52789 (0.52791)	Top-1 acc 71.094 (67.490)	Top-5 acc 87.891 (86.289)	lr 0.00036
Train [111][2500/3239]	Time 0.251 (0.495)	Data Time 0.001 (0.016)	Loss 2.1772 (2.3489)	Entropy 0.52791 (0.52791)	Top-1 acc 71.875 (67.496)	Top-5 acc 88.281 (86.294)	lr 0.00036
Train [111][2510/3239]	Time 0.451 (0.515)	Data Time 0.006 (0.016)	Loss 2.2243 (2.3489)	Entropy 0.52761 (0.52791)	Top-1 acc 70.703 (67.494)	Top-5 acc 88.281 (86.295)	lr 0.00036
Train [111][2520/3239]	Time 0.238 (0.515)	Data Time 0.002 (0.016)	Loss 2.3641 (2.3487)	Entropy 0.52781 (0.52791)	Top-1 acc 68.359 (67.498)	Top-5 acc 83.594 (86.297)	lr 0.00036
Train [111][2530/3239]	Time 0.231 (0.515)	Data Time 0.001 (0.016)	Loss 2.2785 (2.3487)	Entropy 0.52792 (0.52791)	Top-1 acc 71.484 (67.501)	Top-5 acc 87.109 (86.296)	lr 0.00036
Train [111][2540/3239]	Time 0.234 (0.514)	Data Time 0.001 (0.016)	Loss 2.3118 (2.3487)	Entropy 0.52802 (0.52791)	Top-1 acc 67.969 (67.496)	Top-5 acc 86.719 (86.294)	lr 0.00036
Train [111][2550/3239]	Time 0.259 (0.514)	Data Time 0.001 (0.016)	Loss 2.3259 (2.3489)	Entropy 0.52809 (0.52791)	Top-1 acc 71.094 (67.492)	Top-5 acc 86.719 (86.290)	lr 0.00036
Train [111][2560/3239]	Time 0.255 (0.514)	Data Time 0.002 (0.016)	Loss 2.3414 (2.3490)	Entropy 0.52807 (0.52791)	Top-1 acc 69.531 (67.493)	Top-5 acc 84.375 (86.289)	lr 0.00036
Train [111][2570/3239]	Time 0.251 (0.513)	Data Time 0.002 (0.016)	Loss 2.2894 (2.3489)	Entropy 0.52810 (0.52791)	Top-1 acc 65.625 (67.495)	Top-5 acc 86.328 (86.290)	lr 0.00036
Train [111][2580/3239]	Time 0.333 (0.513)	Data Time 0.001 (0.016)	Loss 2.4888 (2.3487)	Entropy 0.52797 (0.52791)	Top-1 acc 63.281 (67.499)	Top-5 acc 85.547 (86.295)	lr 0.00036
Train [111][2590/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.016)	Loss 2.4104 (2.3490)	Entropy 0.52825 (0.52791)	Top-1 acc 64.453 (67.488)	Top-5 acc 85.547 (86.285)	lr 0.00036
Train [111][2600/3239]	Time 0.226 (0.512)	Data Time 0.001 (0.016)	Loss 2.4280 (2.3492)	Entropy 0.52811 (0.52791)	Top-1 acc 65.625 (67.482)	Top-5 acc 85.156 (86.284)	lr 0.00036
Train [111][2610/3239]	Time 0.235 (0.512)	Data Time 0.002 (0.016)	Loss 2.2889 (2.3492)	Entropy 0.52824 (0.52792)	Top-1 acc 69.922 (67.481)	Top-5 acc 84.375 (86.280)	lr 0.00036
Train [111][2620/3239]	Time 0.236 (0.512)	Data Time 0.001 (0.016)	Loss 2.4670 (2.3496)	Entropy 0.52803 (0.52792)	Top-1 acc 64.844 (67.467)	Top-5 acc 82.812 (86.270)	lr 0.00036
Train [111][2630/3239]	Time 0.230 (0.511)	Data Time 0.001 (0.016)	Loss 2.1727 (2.3495)	Entropy 0.52811 (0.52792)	Top-1 acc 72.656 (67.473)	Top-5 acc 88.672 (86.274)	lr 0.00036
Train [111][2640/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.015)	Loss 2.5430 (2.3497)	Entropy 0.52835 (0.52792)	Top-1 acc 64.062 (67.470)	Top-5 acc 82.422 (86.269)	lr 0.00036
Train [111][2650/3239]	Time 0.244 (0.511)	Data Time 0.002 (0.015)	Loss 2.4623 (2.3496)	Entropy 0.52825 (0.52792)	Top-1 acc 62.109 (67.468)	Top-5 acc 83.594 (86.272)	lr 0.00036
Train [111][2660/3239]	Time 0.281 (0.510)	Data Time 0.001 (0.015)	Loss 2.1733 (2.3495)	Entropy 0.52831 (0.52792)	Top-1 acc 70.703 (67.474)	Top-5 acc 89.453 (86.273)	lr 0.00036
Train [111][2670/3239]	Time 0.366 (0.510)	Data Time 0.001 (0.015)	Loss 2.1469 (2.3494)	Entropy 0.52849 (0.52792)	Top-1 acc 70.703 (67.478)	Top-5 acc 89.844 (86.272)	lr 0.00036
Train [111][2680/3239]	Time 0.231 (0.510)	Data Time 0.001 (0.015)	Loss 2.4351 (2.3496)	Entropy 0.52833 (0.52792)	Top-1 acc 63.672 (67.470)	Top-5 acc 85.547 (86.268)	lr 0.00036
Train [111][2690/3239]	Time 0.246 (0.510)	Data Time 0.001 (0.015)	Loss 2.4730 (2.3499)	Entropy 0.52839 (0.52793)	Top-1 acc 64.844 (67.459)	Top-5 acc 83.984 (86.263)	lr 0.00036
Train [111][2700/3239]	Time 0.233 (0.509)	Data Time 0.001 (0.015)	Loss 2.2248 (2.3500)	Entropy 0.52887 (0.52793)	Top-1 acc 69.141 (67.457)	Top-5 acc 87.891 (86.261)	lr 0.00036
Train [111][2710/3239]	Time 0.238 (0.509)	Data Time 0.001 (0.015)	Loss 2.4454 (2.3498)	Entropy 0.52886 (0.52793)	Top-1 acc 67.578 (67.463)	Top-5 acc 85.156 (86.264)	lr 0.00036
Train [111][2720/3239]	Time 0.229 (0.509)	Data Time 0.001 (0.015)	Loss 2.1677 (2.3496)	Entropy 0.52875 (0.52794)	Top-1 acc 73.828 (67.468)	Top-5 acc 89.453 (86.267)	lr 0.00036
Train [111][2730/3239]	Time 0.239 (0.508)	Data Time 0.001 (0.015)	Loss 2.4898 (2.3497)	Entropy 0.52910 (0.52794)	Top-1 acc 64.453 (67.468)	Top-5 acc 82.422 (86.265)	lr 0.00036
Train [111][2740/3239]	Time 0.326 (0.508)	Data Time 0.001 (0.015)	Loss 2.5870 (2.3499)	Entropy 0.52872 (0.52794)	Top-1 acc 62.109 (67.461)	Top-5 acc 81.250 (86.264)	lr 0.00036
Train [111][2750/3239]	Time 0.231 (0.508)	Data Time 0.001 (0.015)	Loss 2.3035 (2.3501)	Entropy 0.52867 (0.52794)	Top-1 acc 71.094 (67.457)	Top-5 acc 88.672 (86.261)	lr 0.00036
Train [111][2760/3239]	Time 0.233 (0.507)	Data Time 0.001 (0.015)	Loss 2.1747 (2.3498)	Entropy 0.52876 (0.52795)	Top-1 acc 71.094 (67.464)	Top-5 acc 89.453 (86.267)	lr 0.00036
Train [111][2770/3239]	Time 0.224 (0.507)	Data Time 0.001 (0.015)	Loss 2.2367 (2.3497)	Entropy 0.52868 (0.52795)	Top-1 acc 70.703 (67.464)	Top-5 acc 89.062 (86.268)	lr 0.00036
Train [111][2780/3239]	Time 0.230 (0.506)	Data Time 0.001 (0.015)	Loss 2.2570 (2.3498)	Entropy 0.52862 (0.52795)	Top-1 acc 66.406 (67.461)	Top-5 acc 88.281 (86.267)	lr 0.00036
Train [111][2790/3239]	Time 0.231 (0.506)	Data Time 0.001 (0.015)	Loss 2.2908 (2.3498)	Entropy 0.52864 (0.52795)	Top-1 acc 69.922 (67.457)	Top-5 acc 89.844 (86.267)	lr 0.00036
Train [111][2800/3239]	Time 0.227 (0.506)	Data Time 0.001 (0.015)	Loss 2.3910 (2.3498)	Entropy 0.52871 (0.52796)	Top-1 acc 68.750 (67.460)	Top-5 acc 85.156 (86.268)	lr 0.00036
Train [111][2810/3239]	Time 0.239 (0.505)	Data Time 0.001 (0.015)	Loss 2.2460 (2.3497)	Entropy 0.52849 (0.52796)	Top-1 acc 73.438 (67.464)	Top-5 acc 89.453 (86.270)	lr 0.00036
Train [111][2820/3239]	Time 0.241 (0.505)	Data Time 0.001 (0.015)	Loss 2.2047 (2.3495)	Entropy 0.52887 (0.52796)	Top-1 acc 68.750 (67.468)	Top-5 acc 90.625 (86.273)	lr 0.00036
Train [111][2830/3239]	Time 0.379 (0.505)	Data Time 0.001 (0.015)	Loss 2.3035 (2.3494)	Entropy 0.52911 (0.52797)	Top-1 acc 66.406 (67.470)	Top-5 acc 90.234 (86.275)	lr 0.00036
Train [111][2840/3239]	Time 0.236 (0.505)	Data Time 0.001 (0.015)	Loss 2.3103 (2.3498)	Entropy 0.52926 (0.52797)	Top-1 acc 68.359 (67.463)	Top-5 acc 86.719 (86.266)	lr 0.00035
Train [111][2850/3239]	Time 0.234 (0.504)	Data Time 0.001 (0.014)	Loss 2.3770 (2.3499)	Entropy 0.52907 (0.52797)	Top-1 acc 67.188 (67.460)	Top-5 acc 85.547 (86.264)	lr 0.00035
Train [111][2860/3239]	Time 0.235 (0.504)	Data Time 0.001 (0.014)	Loss 2.2623 (2.3497)	Entropy 0.52925 (0.52798)	Top-1 acc 68.359 (67.462)	Top-5 acc 87.109 (86.268)	lr 0.00035
Train [111][2870/3239]	Time 0.233 (0.504)	Data Time 0.001 (0.014)	Loss 2.3679 (2.3497)	Entropy 0.52922 (0.52798)	Top-1 acc 63.281 (67.462)	Top-5 acc 88.281 (86.267)	lr 0.00035
Train [111][2880/3239]	Time 0.223 (0.503)	Data Time 0.001 (0.014)	Loss 2.4546 (2.3496)	Entropy 0.52925 (0.52799)	Top-1 acc 65.625 (67.469)	Top-5 acc 85.156 (86.268)	lr 0.00035
Train [111][2890/3239]	Time 0.258 (0.503)	Data Time 0.001 (0.014)	Loss 2.6433 (2.3497)	Entropy 0.52893 (0.52799)	Top-1 acc 61.719 (67.466)	Top-5 acc 82.422 (86.268)	lr 0.00035
Train [111][2900/3239]	Time 0.343 (0.503)	Data Time 0.001 (0.014)	Loss 2.2368 (2.3501)	Entropy 0.52898 (0.52799)	Top-1 acc 69.141 (67.454)	Top-5 acc 89.844 (86.260)	lr 0.00035
Train [111][2910/3239]	Time 0.268 (0.502)	Data Time 0.001 (0.014)	Loss 2.2992 (2.3504)	Entropy 0.52921 (0.52800)	Top-1 acc 69.531 (67.450)	Top-5 acc 87.109 (86.257)	lr 0.00035
Train [111][2920/3239]	Time 0.233 (0.502)	Data Time 0.001 (0.014)	Loss 2.1556 (2.3504)	Entropy 0.52934 (0.52800)	Top-1 acc 72.656 (67.449)	Top-5 acc 90.234 (86.257)	lr 0.00035
Train [111][2930/3239]	Time 0.237 (0.502)	Data Time 0.001 (0.014)	Loss 2.2393 (2.3503)	Entropy 0.52920 (0.52801)	Top-1 acc 67.969 (67.453)	Top-5 acc 87.109 (86.258)	lr 0.00035
Train [111][2940/3239]	Time 0.228 (0.502)	Data Time 0.001 (0.014)	Loss 2.3384 (2.3500)	Entropy 0.52942 (0.52801)	Top-1 acc 68.359 (67.463)	Top-5 acc 85.938 (86.259)	lr 0.00035
Train [111][2950/3239]	Time 0.241 (0.501)	Data Time 0.001 (0.014)	Loss 2.4493 (2.3502)	Entropy 0.52950 (0.52802)	Top-1 acc 64.062 (67.456)	Top-5 acc 83.203 (86.258)	lr 0.00035
Train [111][2960/3239]	Time 0.231 (0.501)	Data Time 0.001 (0.014)	Loss 2.3051 (2.3502)	Entropy 0.52958 (0.52802)	Top-1 acc 70.703 (67.456)	Top-5 acc 86.719 (86.257)	lr 0.00035
Train [111][2970/3239]	Time 0.262 (0.501)	Data Time 0.001 (0.014)	Loss 2.4326 (2.3504)	Entropy 0.52950 (0.52803)	Top-1 acc 60.156 (67.450)	Top-5 acc 86.328 (86.254)	lr 0.00035
Train [111][2980/3239]	Time 0.243 (0.500)	Data Time 0.001 (0.014)	Loss 2.2414 (2.3504)	Entropy 0.52941 (0.52803)	Top-1 acc 66.406 (67.449)	Top-5 acc 88.281 (86.253)	lr 0.00035
Train [111][2990/3239]	Time 0.233 (0.500)	Data Time 0.001 (0.014)	Loss 2.4420 (2.3505)	Entropy 0.52927 (0.52804)	Top-1 acc 66.797 (67.448)	Top-5 acc 85.547 (86.253)	lr 0.00035
Train [111][3000/3239]	Time 0.228 (0.500)	Data Time 0.001 (0.014)	Loss 2.2255 (2.3503)	Entropy 0.52917 (0.52804)	Top-1 acc 70.312 (67.452)	Top-5 acc 89.062 (86.257)	lr 0.00035
Train [111][3010/3239]	Time 0.236 (0.499)	Data Time 0.001 (0.014)	Loss 2.2384 (2.3504)	Entropy 0.52909 (0.52804)	Top-1 acc 69.922 (67.449)	Top-5 acc 87.891 (86.255)	lr 0.00035
Train [111][3020/3239]	Time 0.229 (0.499)	Data Time 0.001 (0.014)	Loss 2.3021 (2.3503)	Entropy 0.52888 (0.52805)	Top-1 acc 69.141 (67.452)	Top-5 acc 87.109 (86.253)	lr 0.00035
Train [111][3030/3239]	Time 0.238 (0.499)	Data Time 0.001 (0.014)	Loss 2.2749 (2.3502)	Entropy 0.52882 (0.52805)	Top-1 acc 69.141 (67.453)	Top-5 acc 87.500 (86.256)	lr 0.00035
Train [111][3040/3239]	Time 0.237 (0.498)	Data Time 0.001 (0.014)	Loss 2.1260 (2.3502)	Entropy 0.52865 (0.52805)	Top-1 acc 73.828 (67.454)	Top-5 acc 89.453 (86.257)	lr 0.00035
Train [111][3050/3239]	Time 0.235 (0.498)	Data Time 0.001 (0.014)	Loss 2.4132 (2.3501)	Entropy 0.52879 (0.52805)	Top-1 acc 64.844 (67.455)	Top-5 acc 87.109 (86.259)	lr 0.00035
Train [111][3060/3239]	Time 0.325 (0.498)	Data Time 0.001 (0.014)	Loss 2.3902 (2.3500)	Entropy 0.52858 (0.52806)	Top-1 acc 66.406 (67.456)	Top-5 acc 85.938 (86.259)	lr 0.00035
Train [111][3070/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.014)	Loss 2.7771 (2.3500)	Entropy 0.52879 (0.52806)	Top-1 acc 56.641 (67.455)	Top-5 acc 80.469 (86.259)	lr 0.00035
Train [111][3080/3239]	Time 0.236 (0.497)	Data Time 0.001 (0.014)	Loss 2.4521 (2.3503)	Entropy 0.52891 (0.52806)	Top-1 acc 65.234 (67.446)	Top-5 acc 85.156 (86.255)	lr 0.00035
Train [111][3090/3239]	Time 0.229 (0.497)	Data Time 0.001 (0.013)	Loss 2.2674 (2.3504)	Entropy 0.52886 (0.52806)	Top-1 acc 70.312 (67.446)	Top-5 acc 87.109 (86.251)	lr 0.00035
Train [111][3100/3239]	Time 0.232 (0.497)	Data Time 0.001 (0.013)	Loss 2.6342 (2.3504)	Entropy 0.52872 (0.52807)	Top-1 acc 63.672 (67.447)	Top-5 acc 82.812 (86.250)	lr 0.00035
Train [111][3110/3239]	Time 0.248 (0.496)	Data Time 0.001 (0.013)	Loss 2.2907 (2.3504)	Entropy 0.52859 (0.52807)	Top-1 acc 70.703 (67.448)	Top-5 acc 87.109 (86.252)	lr 0.00035
Train [111][3120/3239]	Time 0.266 (0.496)	Data Time 0.001 (0.013)	Loss 2.2897 (2.3503)	Entropy 0.52838 (0.52807)	Top-1 acc 71.094 (67.450)	Top-5 acc 87.109 (86.253)	lr 0.00035
Train [111][3130/3239]	Time 0.492 (0.496)	Data Time 0.002 (0.013)	Loss 2.3930 (2.3503)	Entropy 0.52872 (0.52807)	Top-1 acc 67.969 (67.452)	Top-5 acc 83.984 (86.251)	lr 0.00035
Train [111][3140/3239]	Time 0.229 (0.496)	Data Time 0.001 (0.013)	Loss 2.4031 (2.3502)	Entropy 0.52825 (0.52807)	Top-1 acc 66.016 (67.453)	Top-5 acc 84.766 (86.253)	lr 0.00035
Train [111][3150/3239]	Time 0.247 (0.496)	Data Time 0.001 (0.013)	Loss 2.4454 (2.3502)	Entropy 0.52837 (0.52807)	Top-1 acc 64.844 (67.454)	Top-5 acc 85.156 (86.253)	lr 0.00035
Train [111][3160/3239]	Time 0.238 (0.495)	Data Time 0.001 (0.013)	Loss 2.3588 (2.3501)	Entropy 0.52824 (0.52807)	Top-1 acc 66.797 (67.454)	Top-5 acc 85.156 (86.254)	lr 0.00035
Train [111][3170/3239]	Time 0.309 (0.511)	Data Time 0.002 (0.013)	Loss 2.7878 (2.3503)	Entropy 0.52851 (0.52807)	Top-1 acc 55.859 (67.452)	Top-5 acc 80.469 (86.252)	lr 0.00035
Train [111][3180/3239]	Time 0.236 (0.511)	Data Time 0.000 (0.013)	Loss 2.3469 (2.3502)	Entropy 0.52832 (0.52807)	Top-1 acc 66.406 (67.452)	Top-5 acc 85.938 (86.254)	lr 0.00035
Train [111][3190/3239]	Time 0.234 (0.511)	Data Time 0.000 (0.013)	Loss 2.3771 (2.3503)	Entropy 0.52813 (0.52808)	Top-1 acc 68.359 (67.450)	Top-5 acc 85.938 (86.253)	lr 0.00035
Train [111][3200/3239]	Time 0.233 (0.510)	Data Time 0.000 (0.013)	Loss 2.6169 (2.3505)	Entropy 0.52776 (0.52808)	Top-1 acc 63.672 (67.445)	Top-5 acc 82.031 (86.251)	lr 0.00035
Train [111][3210/3239]	Time 0.220 (0.510)	Data Time 0.000 (0.013)	Loss 2.3499 (2.3507)	Entropy 0.52756 (0.52807)	Top-1 acc 69.531 (67.437)	Top-5 acc 85.156 (86.244)	lr 0.00035
Train [111][3220/3239]	Time 0.324 (0.510)	Data Time 0.000 (0.013)	Loss 2.2599 (2.3507)	Entropy 0.52771 (0.52807)	Top-1 acc 68.750 (67.439)	Top-5 acc 87.891 (86.243)	lr 0.00035
Train [111][3230/3239]	Time 0.230 (0.509)	Data Time 0.000 (0.013)	Loss 2.3518 (2.3506)	Entropy 0.52791 (0.52807)	Top-1 acc 69.531 (67.443)	Top-5 acc 87.500 (86.244)	lr 0.00035
Train [111][3239/3239]	Time 0.846 (0.509)	Data Time 0.000 (0.013)	Loss 2.6801 (2.3509)	Entropy 0.52816 (0.52807)	Top-1 acc 62.963 (67.437)	Top-5 acc 83.951 (86.240)	lr 0.00035
==========Valid [111/120]	loss 1.172	top-1 acc 72.861 (73.154)	top-5 acc 90.549	Train top-1 67.437	top-5 86.240	Entropy 0.52816	Latency-None: 0.000ms	Flops: 539.00M
Train [112][0/3239]	Time 36.057 (36.057)	Data Time 34.328 (34.328)	Loss 2.3806 (2.3806)	Entropy 0.52816 (0.52816)	Top-1 acc 70.312 (70.312)	Top-5 acc 83.984 (83.984)	lr 0.00035
Train [112][10/3239]	Time 0.234 (3.985)	Data Time 0.001 (3.266)	Loss 2.4295 (2.3600)	Entropy 0.52800 (0.52816)	Top-1 acc 67.188 (68.111)	Top-5 acc 85.938 (86.151)	lr 0.00035
Train [112][20/3239]	Time 0.254 (2.284)	Data Time 0.001 (1.711)	Loss 2.3445 (2.3796)	Entropy 0.52791 (0.52810)	Top-1 acc 68.359 (67.615)	Top-5 acc 86.719 (86.105)	lr 0.00034
Train [112][30/3239]	Time 0.249 (1.684)	Data Time 0.001 (1.160)	Loss 2.4413 (2.3591)	Entropy 0.52789 (0.52804)	Top-1 acc 66.406 (67.528)	Top-5 acc 85.156 (86.555)	lr 0.00034
Train [112][40/3239]	Time 0.229 (1.371)	Data Time 0.001 (0.878)	Loss 2.4301 (2.3859)	Entropy 0.52809 (0.52804)	Top-1 acc 67.188 (66.816)	Top-5 acc 83.984 (85.918)	lr 0.00034
Train [112][50/3239]	Time 0.322 (1.183)	Data Time 0.001 (0.706)	Loss 2.1244 (2.3751)	Entropy 0.52828 (0.52806)	Top-1 acc 73.047 (67.272)	Top-5 acc 88.672 (85.945)	lr 0.00034
Train [112][60/3239]	Time 0.226 (1.058)	Data Time 0.001 (0.591)	Loss 2.1215 (2.3808)	Entropy 0.52841 (0.52809)	Top-1 acc 71.484 (67.111)	Top-5 acc 90.234 (85.880)	lr 0.00034
Train [112][70/3239]	Time 0.252 (0.987)	Data Time 0.001 (0.508)	Loss 2.3978 (2.3719)	Entropy 0.52837 (0.52813)	Top-1 acc 66.797 (67.320)	Top-5 acc 84.375 (85.844)	lr 0.00034
Train [112][80/3239]	Time 0.243 (0.916)	Data Time 0.001 (0.445)	Loss 2.1521 (2.3749)	Entropy 0.52857 (0.52816)	Top-1 acc 74.219 (67.149)	Top-5 acc 86.719 (85.812)	lr 0.00034
Train [112][90/3239]	Time 0.233 (0.861)	Data Time 0.001 (0.396)	Loss 2.3553 (2.3703)	Entropy 0.52884 (0.52822)	Top-1 acc 68.359 (67.273)	Top-5 acc 86.328 (85.890)	lr 0.00034
Train [112][100/3239]	Time 0.229 (0.816)	Data Time 0.001 (0.357)	Loss 2.2776 (2.3642)	Entropy 0.52873 (0.52828)	Top-1 acc 68.359 (67.450)	Top-5 acc 86.719 (85.941)	lr 0.00034
Train [112][110/3239]	Time 0.236 (0.781)	Data Time 0.001 (0.325)	Loss 2.3000 (2.3596)	Entropy 0.52913 (0.52833)	Top-1 acc 68.359 (67.525)	Top-5 acc 86.328 (85.969)	lr 0.00034
Train [112][120/3239]	Time 0.354 (0.752)	Data Time 0.001 (0.298)	Loss 2.4009 (2.3558)	Entropy 0.52916 (0.52840)	Top-1 acc 66.406 (67.652)	Top-5 acc 85.938 (86.041)	lr 0.00034
Train [112][130/3239]	Time 0.259 (0.727)	Data Time 0.001 (0.276)	Loss 2.3070 (2.3513)	Entropy 0.52876 (0.52844)	Top-1 acc 68.750 (67.718)	Top-5 acc 86.719 (86.093)	lr 0.00034
Train [112][140/3239]	Time 0.231 (0.705)	Data Time 0.001 (0.256)	Loss 2.1921 (2.3452)	Entropy 0.52871 (0.52845)	Top-1 acc 68.750 (67.866)	Top-5 acc 89.844 (86.187)	lr 0.00034
Train [112][150/3239]	Time 0.223 (0.687)	Data Time 0.001 (0.239)	Loss 2.2001 (2.3391)	Entropy 0.52875 (0.52847)	Top-1 acc 71.484 (68.002)	Top-5 acc 87.500 (86.310)	lr 0.00034
Train [112][160/3239]	Time 0.278 (0.672)	Data Time 0.001 (0.225)	Loss 2.0972 (2.3390)	Entropy 0.52837 (0.52849)	Top-1 acc 72.656 (68.012)	Top-5 acc 91.016 (86.348)	lr 0.00034
Train [112][170/3239]	Time 0.235 (0.658)	Data Time 0.001 (0.212)	Loss 2.1061 (2.3394)	Entropy 0.52851 (0.52848)	Top-1 acc 75.391 (67.939)	Top-5 acc 91.016 (86.353)	lr 0.00034
Train [112][180/3239]	Time 0.254 (0.645)	Data Time 0.001 (0.200)	Loss 2.1440 (2.3405)	Entropy 0.52877 (0.52849)	Top-1 acc 72.656 (67.891)	Top-5 acc 90.625 (86.369)	lr 0.00034
Train [112][190/3239]	Time 0.234 (0.636)	Data Time 0.001 (0.190)	Loss 2.3302 (2.3391)	Entropy 0.52880 (0.52851)	Top-1 acc 66.797 (67.954)	Top-5 acc 86.328 (86.381)	lr 0.00034
Train [112][200/3239]	Time 0.286 (0.629)	Data Time 0.001 (0.180)	Loss 2.4694 (2.3379)	Entropy 0.52905 (0.52853)	Top-1 acc 65.625 (67.990)	Top-5 acc 85.156 (86.419)	lr 0.00034
Train [112][210/3239]	Time 0.224 (0.619)	Data Time 0.001 (0.172)	Loss 2.2767 (2.3383)	Entropy 0.52906 (0.52856)	Top-1 acc 69.531 (67.959)	Top-5 acc 88.281 (86.413)	lr 0.00034
Train [112][220/3239]	Time 0.224 (0.610)	Data Time 0.001 (0.164)	Loss 2.2644 (2.3357)	Entropy 0.52904 (0.52858)	Top-1 acc 67.188 (68.011)	Top-5 acc 87.500 (86.459)	lr 0.00034
Train [112][230/3239]	Time 0.218 (0.601)	Data Time 0.001 (0.157)	Loss 2.4154 (2.3365)	Entropy 0.52889 (0.52859)	Top-1 acc 68.750 (68.014)	Top-5 acc 86.719 (86.468)	lr 0.00034
Train [112][240/3239]	Time 0.236 (0.594)	Data Time 0.001 (0.151)	Loss 2.5475 (2.3389)	Entropy 0.52912 (0.52861)	Top-1 acc 63.281 (67.946)	Top-5 acc 80.469 (86.422)	lr 0.00034
Train [112][250/3239]	Time 0.234 (0.586)	Data Time 0.001 (0.145)	Loss 2.2302 (2.3430)	Entropy 0.52911 (0.52863)	Top-1 acc 70.312 (67.824)	Top-5 acc 89.062 (86.361)	lr 0.00034
Train [112][260/3239]	Time 0.229 (0.579)	Data Time 0.001 (0.139)	Loss 2.5191 (2.3450)	Entropy 0.52936 (0.52865)	Top-1 acc 66.797 (67.794)	Top-5 acc 83.984 (86.312)	lr 0.00034
Train [112][270/3239]	Time 0.273 (0.573)	Data Time 0.002 (0.134)	Loss 2.2879 (2.3428)	Entropy 0.52925 (0.52868)	Top-1 acc 68.359 (67.852)	Top-5 acc 85.547 (86.325)	lr 0.00034
Train [112][280/3239]	Time 0.323 (0.568)	Data Time 0.001 (0.129)	Loss 2.5209 (2.3443)	Entropy 0.52923 (0.52870)	Top-1 acc 64.844 (67.841)	Top-5 acc 82.031 (86.298)	lr 0.00034
Train [112][290/3239]	Time 0.246 (0.563)	Data Time 0.001 (0.125)	Loss 2.3574 (2.3435)	Entropy 0.52929 (0.52872)	Top-1 acc 71.484 (67.864)	Top-5 acc 85.156 (86.315)	lr 0.00034
Train [112][300/3239]	Time 0.236 (0.559)	Data Time 0.001 (0.121)	Loss 2.3495 (2.3418)	Entropy 0.52944 (0.52874)	Top-1 acc 69.531 (67.891)	Top-5 acc 87.500 (86.350)	lr 0.00034
Train [112][310/3239]	Time 0.225 (0.554)	Data Time 0.001 (0.117)	Loss 2.3410 (2.3436)	Entropy 0.52916 (0.52876)	Top-1 acc 67.969 (67.819)	Top-5 acc 88.281 (86.346)	lr 0.00034
Train [112][320/3239]	Time 0.244 (0.550)	Data Time 0.002 (0.113)	Loss 2.4361 (2.3457)	Entropy 0.52900 (0.52877)	Top-1 acc 63.281 (67.742)	Top-5 acc 83.203 (86.300)	lr 0.00034
Train [112][330/3239]	Time 0.239 (0.546)	Data Time 0.001 (0.110)	Loss 2.1341 (2.3429)	Entropy 0.52878 (0.52878)	Top-1 acc 71.875 (67.818)	Top-5 acc 91.797 (86.341)	lr 0.00034
Train [112][340/3239]	Time 0.250 (0.542)	Data Time 0.001 (0.107)	Loss 2.3001 (2.3408)	Entropy 0.52886 (0.52878)	Top-1 acc 68.359 (67.850)	Top-5 acc 86.719 (86.375)	lr 0.00034
Train [112][350/3239]	Time 0.350 (0.539)	Data Time 0.001 (0.104)	Loss 2.4039 (2.3412)	Entropy 0.52884 (0.52878)	Top-1 acc 64.062 (67.847)	Top-5 acc 84.375 (86.346)	lr 0.00034
Train [112][360/3239]	Time 0.225 (0.536)	Data Time 0.001 (0.101)	Loss 2.6127 (2.3435)	Entropy 0.52879 (0.52878)	Top-1 acc 60.938 (67.782)	Top-5 acc 81.641 (86.300)	lr 0.00034
Train [112][370/3239]	Time 0.229 (0.533)	Data Time 0.001 (0.098)	Loss 2.3611 (2.3422)	Entropy 0.52871 (0.52878)	Top-1 acc 66.406 (67.784)	Top-5 acc 88.672 (86.333)	lr 0.00034
Train [112][380/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.096)	Loss 2.2937 (2.3420)	Entropy 0.52815 (0.52878)	Top-1 acc 70.312 (67.787)	Top-5 acc 87.891 (86.344)	lr 0.00034
Train [112][390/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.093)	Loss 2.3517 (2.3414)	Entropy 0.52829 (0.52876)	Top-1 acc 64.844 (67.812)	Top-5 acc 86.719 (86.363)	lr 0.00034
Train [112][400/3239]	Time 0.235 (0.525)	Data Time 0.001 (0.091)	Loss 2.2657 (2.3423)	Entropy 0.52862 (0.52875)	Top-1 acc 68.750 (67.784)	Top-5 acc 89.062 (86.352)	lr 0.00034
Train [112][410/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.089)	Loss 2.2015 (2.3410)	Entropy 0.52863 (0.52875)	Top-1 acc 72.266 (67.813)	Top-5 acc 86.328 (86.373)	lr 0.00034
Train [112][420/3239]	Time 0.229 (0.519)	Data Time 0.001 (0.087)	Loss 2.5417 (2.3418)	Entropy 0.52863 (0.52875)	Top-1 acc 64.844 (67.788)	Top-5 acc 81.250 (86.359)	lr 0.00034
Train [112][430/3239]	Time 0.229 (0.516)	Data Time 0.001 (0.085)	Loss 2.4037 (2.3426)	Entropy 0.52876 (0.52875)	Top-1 acc 67.578 (67.752)	Top-5 acc 85.547 (86.340)	lr 0.00034
Train [112][440/3239]	Time 0.330 (0.514)	Data Time 0.001 (0.083)	Loss 2.3155 (2.3427)	Entropy 0.52890 (0.52875)	Top-1 acc 68.359 (67.744)	Top-5 acc 88.281 (86.342)	lr 0.00034
Train [112][450/3239]	Time 0.223 (0.511)	Data Time 0.001 (0.081)	Loss 2.6052 (2.3440)	Entropy 0.52906 (0.52876)	Top-1 acc 64.453 (67.748)	Top-5 acc 81.250 (86.312)	lr 0.00033
Train [112][460/3239]	Time 0.220 (0.509)	Data Time 0.001 (0.079)	Loss 2.3253 (2.3462)	Entropy 0.52922 (0.52876)	Top-1 acc 66.797 (67.693)	Top-5 acc 87.891 (86.271)	lr 0.00033
Train [112][470/3239]	Time 0.258 (0.507)	Data Time 0.001 (0.078)	Loss 2.2109 (2.3448)	Entropy 0.52958 (0.52878)	Top-1 acc 71.875 (67.719)	Top-5 acc 89.844 (86.294)	lr 0.00033
Train [112][480/3239]	Time 0.230 (0.505)	Data Time 0.001 (0.076)	Loss 2.2941 (2.3448)	Entropy 0.52956 (0.52879)	Top-1 acc 67.578 (67.731)	Top-5 acc 87.891 (86.305)	lr 0.00033
Train [112][490/3239]	Time 0.223 (0.503)	Data Time 0.001 (0.075)	Loss 2.2478 (2.3455)	Entropy 0.52943 (0.52881)	Top-1 acc 72.266 (67.731)	Top-5 acc 87.500 (86.273)	lr 0.00033
Train [112][500/3239]	Time 0.232 (0.502)	Data Time 0.002 (0.073)	Loss 2.2588 (2.3452)	Entropy 0.52946 (0.52882)	Top-1 acc 70.703 (67.744)	Top-5 acc 89.844 (86.288)	lr 0.00033
Train [112][510/3239]	Time 0.318 (0.500)	Data Time 0.001 (0.072)	Loss 2.2124 (2.3446)	Entropy 0.52963 (0.52883)	Top-1 acc 69.141 (67.755)	Top-5 acc 87.500 (86.291)	lr 0.00033
Train [112][520/3239]	Time 0.241 (0.498)	Data Time 0.002 (0.071)	Loss 2.2898 (2.3445)	Entropy 0.52973 (0.52885)	Top-1 acc 68.750 (67.772)	Top-5 acc 86.328 (86.294)	lr 0.00033
Train [112][530/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.069)	Loss 2.2835 (2.3440)	Entropy 0.52944 (0.52886)	Top-1 acc 70.312 (67.789)	Top-5 acc 87.109 (86.299)	lr 0.00033
Train [112][540/3239]	Time 0.259 (0.496)	Data Time 0.002 (0.068)	Loss 2.1830 (2.3441)	Entropy 0.52928 (0.52887)	Top-1 acc 70.703 (67.772)	Top-5 acc 89.844 (86.304)	lr 0.00033
Train [112][550/3239]	Time 0.265 (0.494)	Data Time 0.002 (0.067)	Loss 2.4131 (2.3443)	Entropy 0.52906 (0.52888)	Top-1 acc 63.281 (67.763)	Top-5 acc 86.328 (86.301)	lr 0.00033
Train [112][560/3239]	Time 0.269 (0.493)	Data Time 0.002 (0.066)	Loss 2.1764 (2.3430)	Entropy 0.52922 (0.52888)	Top-1 acc 71.875 (67.772)	Top-5 acc 88.672 (86.319)	lr 0.00033
Train [112][570/3239]	Time 0.232 (0.492)	Data Time 0.001 (0.064)	Loss 2.3624 (2.3434)	Entropy 0.52907 (0.52888)	Top-1 acc 66.016 (67.757)	Top-5 acc 86.719 (86.313)	lr 0.00033
Train [112][580/3239]	Time 0.353 (0.585)	Data Time 0.006 (0.063)	Loss 2.4113 (2.3436)	Entropy 0.52915 (0.52889)	Top-1 acc 66.016 (67.746)	Top-5 acc 83.984 (86.305)	lr 0.00033
Train [112][590/3239]	Time 0.231 (0.583)	Data Time 0.002 (0.063)	Loss 2.5553 (2.3449)	Entropy 0.52921 (0.52889)	Top-1 acc 64.062 (67.718)	Top-5 acc 84.375 (86.282)	lr 0.00033
Train [112][600/3239]	Time 0.347 (0.581)	Data Time 0.001 (0.062)	Loss 2.6781 (2.3460)	Entropy 0.52920 (0.52890)	Top-1 acc 61.328 (67.715)	Top-5 acc 81.250 (86.267)	lr 0.00033
Train [112][610/3239]	Time 0.233 (0.578)	Data Time 0.001 (0.061)	Loss 2.2359 (2.3457)	Entropy 0.52940 (0.52891)	Top-1 acc 72.656 (67.729)	Top-5 acc 86.328 (86.269)	lr 0.00033
Train [112][620/3239]	Time 0.233 (0.575)	Data Time 0.001 (0.060)	Loss 2.3911 (2.3465)	Entropy 0.52976 (0.52892)	Top-1 acc 67.188 (67.709)	Top-5 acc 83.594 (86.258)	lr 0.00033
Train [112][630/3239]	Time 0.232 (0.573)	Data Time 0.001 (0.059)	Loss 2.2136 (2.3456)	Entropy 0.52994 (0.52893)	Top-1 acc 70.312 (67.723)	Top-5 acc 87.109 (86.261)	lr 0.00033
Train [112][640/3239]	Time 0.234 (0.570)	Data Time 0.001 (0.058)	Loss 2.3774 (2.3455)	Entropy 0.52981 (0.52895)	Top-1 acc 65.625 (67.729)	Top-5 acc 85.547 (86.260)	lr 0.00033
Train [112][650/3239]	Time 0.254 (0.568)	Data Time 0.001 (0.057)	Loss 2.3487 (2.3457)	Entropy 0.52995 (0.52896)	Top-1 acc 65.625 (67.714)	Top-5 acc 88.281 (86.262)	lr 0.00033
Train [112][660/3239]	Time 0.231 (0.565)	Data Time 0.001 (0.056)	Loss 2.3576 (2.3446)	Entropy 0.52965 (0.52897)	Top-1 acc 69.922 (67.753)	Top-5 acc 84.375 (86.286)	lr 0.00033
Train [112][670/3239]	Time 0.316 (0.563)	Data Time 0.001 (0.055)	Loss 2.2272 (2.3437)	Entropy 0.52921 (0.52898)	Top-1 acc 69.922 (67.776)	Top-5 acc 88.672 (86.305)	lr 0.00033
Train [112][680/3239]	Time 0.235 (0.561)	Data Time 0.001 (0.055)	Loss 2.1595 (2.3435)	Entropy 0.52876 (0.52898)	Top-1 acc 73.438 (67.793)	Top-5 acc 88.672 (86.297)	lr 0.00033
Train [112][690/3239]	Time 0.228 (0.559)	Data Time 0.002 (0.054)	Loss 2.1554 (2.3429)	Entropy 0.52882 (0.52898)	Top-1 acc 70.703 (67.792)	Top-5 acc 88.281 (86.309)	lr 0.00033
Train [112][700/3239]	Time 0.235 (0.557)	Data Time 0.001 (0.053)	Loss 2.4712 (2.3423)	Entropy 0.52871 (0.52898)	Top-1 acc 65.234 (67.803)	Top-5 acc 85.156 (86.324)	lr 0.00033
Train [112][710/3239]	Time 0.230 (0.555)	Data Time 0.001 (0.052)	Loss 2.8031 (2.3436)	Entropy 0.52884 (0.52897)	Top-1 acc 54.297 (67.764)	Top-5 acc 80.859 (86.307)	lr 0.00033
Train [112][720/3239]	Time 0.227 (0.553)	Data Time 0.001 (0.052)	Loss 2.4029 (2.3440)	Entropy 0.52850 (0.52897)	Top-1 acc 64.062 (67.747)	Top-5 acc 88.281 (86.299)	lr 0.00033
Train [112][730/3239]	Time 0.238 (0.551)	Data Time 0.001 (0.051)	Loss 2.3517 (2.3446)	Entropy 0.52877 (0.52897)	Top-1 acc 68.750 (67.731)	Top-5 acc 86.719 (86.293)	lr 0.00033
Train [112][740/3239]	Time 0.232 (0.549)	Data Time 0.001 (0.050)	Loss 2.3655 (2.3453)	Entropy 0.52898 (0.52896)	Top-1 acc 69.531 (67.707)	Top-5 acc 87.109 (86.282)	lr 0.00033
Train [112][750/3239]	Time 0.236 (0.547)	Data Time 0.001 (0.050)	Loss 2.2419 (2.3457)	Entropy 0.52904 (0.52897)	Top-1 acc 69.531 (67.713)	Top-5 acc 88.281 (86.268)	lr 0.00033
Train [112][760/3239]	Time 0.239 (0.546)	Data Time 0.002 (0.049)	Loss 2.0719 (2.3453)	Entropy 0.52884 (0.52896)	Top-1 acc 72.266 (67.717)	Top-5 acc 91.406 (86.273)	lr 0.00033
Train [112][770/3239]	Time 0.237 (0.544)	Data Time 0.001 (0.048)	Loss 2.4214 (2.3453)	Entropy 0.52884 (0.52896)	Top-1 acc 66.016 (67.716)	Top-5 acc 84.375 (86.269)	lr 0.00033
Train [112][780/3239]	Time 0.233 (0.542)	Data Time 0.001 (0.048)	Loss 2.1359 (2.3445)	Entropy 0.52839 (0.52896)	Top-1 acc 72.656 (67.738)	Top-5 acc 90.234 (86.281)	lr 0.00033
Train [112][790/3239]	Time 0.225 (0.541)	Data Time 0.001 (0.047)	Loss 2.1595 (2.3442)	Entropy 0.52853 (0.52895)	Top-1 acc 72.656 (67.755)	Top-5 acc 88.672 (86.286)	lr 0.00033
Train [112][800/3239]	Time 0.223 (0.539)	Data Time 0.001 (0.047)	Loss 2.3877 (2.3440)	Entropy 0.52846 (0.52895)	Top-1 acc 66.016 (67.766)	Top-5 acc 85.547 (86.294)	lr 0.00033
Train [112][810/3239]	Time 0.295 (0.539)	Data Time 0.001 (0.046)	Loss 2.4200 (2.3435)	Entropy 0.52856 (0.52894)	Top-1 acc 67.188 (67.770)	Top-5 acc 83.203 (86.307)	lr 0.00033
Train [112][820/3239]	Time 0.243 (0.537)	Data Time 0.001 (0.046)	Loss 2.5139 (2.3434)	Entropy 0.52848 (0.52893)	Top-1 acc 61.719 (67.774)	Top-5 acc 84.375 (86.307)	lr 0.00033
Train [112][830/3239]	Time 0.328 (0.536)	Data Time 0.001 (0.045)	Loss 2.2832 (2.3436)	Entropy 0.52866 (0.52893)	Top-1 acc 72.266 (67.772)	Top-5 acc 86.328 (86.304)	lr 0.00033
Train [112][840/3239]	Time 0.233 (0.534)	Data Time 0.001 (0.044)	Loss 2.3194 (2.3439)	Entropy 0.52851 (0.52893)	Top-1 acc 67.969 (67.758)	Top-5 acc 85.938 (86.295)	lr 0.00033
Train [112][850/3239]	Time 0.226 (0.533)	Data Time 0.001 (0.044)	Loss 2.4505 (2.3441)	Entropy 0.52861 (0.52892)	Top-1 acc 66.406 (67.764)	Top-5 acc 85.547 (86.298)	lr 0.00033
Train [112][860/3239]	Time 0.227 (0.532)	Data Time 0.001 (0.043)	Loss 2.5182 (2.3451)	Entropy 0.52891 (0.52892)	Top-1 acc 65.625 (67.739)	Top-5 acc 82.422 (86.278)	lr 0.00033
Train [112][870/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.043)	Loss 2.3157 (2.3452)	Entropy 0.52916 (0.52892)	Top-1 acc 66.016 (67.734)	Top-5 acc 85.547 (86.267)	lr 0.00033
Train [112][880/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.043)	Loss 2.5152 (2.3455)	Entropy 0.52896 (0.52892)	Top-1 acc 65.625 (67.727)	Top-5 acc 81.641 (86.262)	lr 0.00032
Train [112][890/3239]	Time 0.221 (0.527)	Data Time 0.001 (0.042)	Loss 2.2381 (2.3458)	Entropy 0.52921 (0.52892)	Top-1 acc 69.141 (67.720)	Top-5 acc 89.062 (86.261)	lr 0.00032
Train [112][900/3239]	Time 0.332 (0.526)	Data Time 0.001 (0.042)	Loss 2.1454 (2.3455)	Entropy 0.52928 (0.52893)	Top-1 acc 75.000 (67.719)	Top-5 acc 91.016 (86.261)	lr 0.00032
Train [112][910/3239]	Time 0.222 (0.525)	Data Time 0.001 (0.041)	Loss 2.2818 (2.3454)	Entropy 0.52935 (0.52893)	Top-1 acc 67.969 (67.710)	Top-5 acc 85.938 (86.256)	lr 0.00032
Train [112][920/3239]	Time 0.237 (0.524)	Data Time 0.001 (0.041)	Loss 2.1711 (2.3452)	Entropy 0.52927 (0.52894)	Top-1 acc 73.047 (67.719)	Top-5 acc 89.844 (86.254)	lr 0.00032
Train [112][930/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.040)	Loss 2.4834 (2.3453)	Entropy 0.52926 (0.52894)	Top-1 acc 59.375 (67.701)	Top-5 acc 83.594 (86.251)	lr 0.00032
Train [112][940/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.040)	Loss 2.2582 (2.3446)	Entropy 0.52922 (0.52894)	Top-1 acc 71.094 (67.717)	Top-5 acc 88.672 (86.269)	lr 0.00032
Train [112][950/3239]	Time 0.238 (0.520)	Data Time 0.001 (0.039)	Loss 2.3617 (2.3455)	Entropy 0.52943 (0.52895)	Top-1 acc 67.969 (67.689)	Top-5 acc 85.156 (86.247)	lr 0.00032
Train [112][960/3239]	Time 0.233 (0.519)	Data Time 0.001 (0.039)	Loss 2.3419 (2.3448)	Entropy 0.52932 (0.52895)	Top-1 acc 69.531 (67.697)	Top-5 acc 86.719 (86.257)	lr 0.00032
Train [112][970/3239]	Time 0.229 (0.518)	Data Time 0.001 (0.039)	Loss 2.3016 (2.3446)	Entropy 0.52926 (0.52896)	Top-1 acc 66.016 (67.702)	Top-5 acc 86.719 (86.256)	lr 0.00032
Train [112][980/3239]	Time 0.235 (0.517)	Data Time 0.001 (0.038)	Loss 2.4276 (2.3443)	Entropy 0.52891 (0.52896)	Top-1 acc 66.797 (67.704)	Top-5 acc 85.938 (86.264)	lr 0.00032
Train [112][990/3239]	Time 0.340 (0.516)	Data Time 0.001 (0.038)	Loss 2.2352 (2.3439)	Entropy 0.52875 (0.52896)	Top-1 acc 68.750 (67.706)	Top-5 acc 87.891 (86.275)	lr 0.00032
Train [112][1000/3239]	Time 0.263 (0.515)	Data Time 0.001 (0.038)	Loss 2.1617 (2.3433)	Entropy 0.52881 (0.52896)	Top-1 acc 69.922 (67.717)	Top-5 acc 90.625 (86.281)	lr 0.00032
Train [112][1010/3239]	Time 0.234 (0.514)	Data Time 0.001 (0.037)	Loss 2.3359 (2.3432)	Entropy 0.52877 (0.52895)	Top-1 acc 65.625 (67.718)	Top-5 acc 86.328 (86.288)	lr 0.00032
Train [112][1020/3239]	Time 0.233 (0.513)	Data Time 0.001 (0.037)	Loss 2.3909 (2.3430)	Entropy 0.52856 (0.52895)	Top-1 acc 64.844 (67.720)	Top-5 acc 85.938 (86.292)	lr 0.00032
Train [112][1030/3239]	Time 0.226 (0.511)	Data Time 0.001 (0.037)	Loss 2.2523 (2.3423)	Entropy 0.52856 (0.52895)	Top-1 acc 70.703 (67.743)	Top-5 acc 88.672 (86.302)	lr 0.00032
Train [112][1040/3239]	Time 0.223 (0.510)	Data Time 0.001 (0.036)	Loss 2.3382 (2.3422)	Entropy 0.52841 (0.52894)	Top-1 acc 68.750 (67.745)	Top-5 acc 86.328 (86.299)	lr 0.00032
Train [112][1050/3239]	Time 0.218 (0.509)	Data Time 0.001 (0.036)	Loss 2.2208 (2.3423)	Entropy 0.52768 (0.52893)	Top-1 acc 70.703 (67.747)	Top-5 acc 89.844 (86.307)	lr 0.00032
Train [112][1060/3239]	Time 0.318 (0.508)	Data Time 0.001 (0.036)	Loss 2.1749 (2.3421)	Entropy 0.52762 (0.52892)	Top-1 acc 69.922 (67.746)	Top-5 acc 90.625 (86.311)	lr 0.00032
Train [112][1070/3239]	Time 0.216 (0.507)	Data Time 0.001 (0.035)	Loss 2.3244 (2.3422)	Entropy 0.52758 (0.52891)	Top-1 acc 70.703 (67.741)	Top-5 acc 87.500 (86.311)	lr 0.00032
Train [112][1080/3239]	Time 0.225 (0.506)	Data Time 0.001 (0.035)	Loss 2.2502 (2.3422)	Entropy 0.52756 (0.52890)	Top-1 acc 69.531 (67.734)	Top-5 acc 85.938 (86.307)	lr 0.00032
Train [112][1090/3239]	Time 0.234 (0.505)	Data Time 0.001 (0.035)	Loss 2.1419 (2.3425)	Entropy 0.52708 (0.52889)	Top-1 acc 70.703 (67.724)	Top-5 acc 90.625 (86.304)	lr 0.00032
Train [112][1100/3239]	Time 0.242 (0.504)	Data Time 0.001 (0.034)	Loss 2.2218 (2.3428)	Entropy 0.52698 (0.52887)	Top-1 acc 69.922 (67.717)	Top-5 acc 87.109 (86.295)	lr 0.00032
Train [112][1110/3239]	Time 0.227 (0.503)	Data Time 0.001 (0.034)	Loss 2.2611 (2.3429)	Entropy 0.52734 (0.52885)	Top-1 acc 72.656 (67.726)	Top-5 acc 86.719 (86.292)	lr 0.00032
Train [112][1120/3239]	Time 0.226 (0.502)	Data Time 0.001 (0.034)	Loss 2.2238 (2.3426)	Entropy 0.52760 (0.52884)	Top-1 acc 72.656 (67.734)	Top-5 acc 89.062 (86.301)	lr 0.00032
Train [112][1130/3239]	Time 0.230 (0.502)	Data Time 0.001 (0.033)	Loss 2.3778 (2.3429)	Entropy 0.52777 (0.52883)	Top-1 acc 66.797 (67.724)	Top-5 acc 86.719 (86.297)	lr 0.00032
Train [112][1140/3239]	Time 0.229 (0.501)	Data Time 0.001 (0.033)	Loss 2.1945 (2.3434)	Entropy 0.52795 (0.52882)	Top-1 acc 71.484 (67.705)	Top-5 acc 89.062 (86.296)	lr 0.00032
Train [112][1150/3239]	Time 0.273 (0.500)	Data Time 0.001 (0.033)	Loss 2.2100 (2.3436)	Entropy 0.52812 (0.52881)	Top-1 acc 73.438 (67.710)	Top-5 acc 85.938 (86.292)	lr 0.00032
Train [112][1160/3239]	Time 0.229 (0.499)	Data Time 0.001 (0.033)	Loss 2.4092 (2.3441)	Entropy 0.52808 (0.52881)	Top-1 acc 63.672 (67.700)	Top-5 acc 85.547 (86.290)	lr 0.00032
Train [112][1170/3239]	Time 0.227 (0.499)	Data Time 0.001 (0.032)	Loss 2.2373 (2.3442)	Entropy 0.52789 (0.52880)	Top-1 acc 72.266 (67.695)	Top-5 acc 88.281 (86.286)	lr 0.00032
Train [112][1180/3239]	Time 0.223 (0.498)	Data Time 0.001 (0.032)	Loss 2.1010 (2.3435)	Entropy 0.52812 (0.52879)	Top-1 acc 73.438 (67.701)	Top-5 acc 89.844 (86.299)	lr 0.00032
Train [112][1190/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.032)	Loss 2.2342 (2.3432)	Entropy 0.52785 (0.52879)	Top-1 acc 69.141 (67.709)	Top-5 acc 87.891 (86.305)	lr 0.00032
Train [112][1200/3239]	Time 0.228 (0.496)	Data Time 0.001 (0.032)	Loss 2.5134 (2.3431)	Entropy 0.52777 (0.52878)	Top-1 acc 64.453 (67.711)	Top-5 acc 84.766 (86.303)	lr 0.00032
Train [112][1210/3239]	Time 0.227 (0.495)	Data Time 0.001 (0.031)	Loss 2.1662 (2.3434)	Entropy 0.52740 (0.52877)	Top-1 acc 72.656 (67.705)	Top-5 acc 88.672 (86.302)	lr 0.00032
Train [112][1220/3239]	Time 0.336 (0.495)	Data Time 0.001 (0.031)	Loss 2.2510 (2.3428)	Entropy 0.52713 (0.52876)	Top-1 acc 71.875 (67.725)	Top-5 acc 86.719 (86.314)	lr 0.00032
Train [112][1230/3239]	Time 0.227 (0.494)	Data Time 0.001 (0.031)	Loss 2.1973 (2.3426)	Entropy 0.52697 (0.52874)	Top-1 acc 72.656 (67.722)	Top-5 acc 87.891 (86.318)	lr 0.00032
Train [112][1240/3239]	Time 0.296 (0.534)	Data Time 0.002 (0.031)	Loss 2.3743 (2.3433)	Entropy 0.52710 (0.52873)	Top-1 acc 65.234 (67.705)	Top-5 acc 84.375 (86.302)	lr 0.00032
Train [112][1250/3239]	Time 0.231 (0.533)	Data Time 0.002 (0.030)	Loss 2.3691 (2.3432)	Entropy 0.52710 (0.52872)	Top-1 acc 65.625 (67.703)	Top-5 acc 86.328 (86.307)	lr 0.00032
Train [112][1260/3239]	Time 0.239 (0.532)	Data Time 0.001 (0.030)	Loss 2.1975 (2.3432)	Entropy 0.52706 (0.52870)	Top-1 acc 75.391 (67.707)	Top-5 acc 89.844 (86.306)	lr 0.00032
Train [112][1270/3239]	Time 0.237 (0.531)	Data Time 0.002 (0.030)	Loss 2.3259 (2.3430)	Entropy 0.52686 (0.52869)	Top-1 acc 67.188 (67.713)	Top-5 acc 88.672 (86.310)	lr 0.00032
Train [112][1280/3239]	Time 0.278 (0.531)	Data Time 0.001 (0.030)	Loss 2.2035 (2.3426)	Entropy 0.52674 (0.52868)	Top-1 acc 70.703 (67.721)	Top-5 acc 88.672 (86.319)	lr 0.00032
Train [112][1290/3239]	Time 0.264 (0.530)	Data Time 0.003 (0.030)	Loss 2.2401 (2.3427)	Entropy 0.52684 (0.52866)	Top-1 acc 69.922 (67.717)	Top-5 acc 84.766 (86.318)	lr 0.00032
Train [112][1300/3239]	Time 0.247 (0.529)	Data Time 0.001 (0.029)	Loss 2.5395 (2.3431)	Entropy 0.52707 (0.52865)	Top-1 acc 61.719 (67.702)	Top-5 acc 82.031 (86.308)	lr 0.00032
Train [112][1310/3239]	Time 0.248 (0.528)	Data Time 0.001 (0.029)	Loss 2.6407 (2.3432)	Entropy 0.52726 (0.52864)	Top-1 acc 61.328 (67.696)	Top-5 acc 81.250 (86.305)	lr 0.00032
Train [112][1320/3239]	Time 0.223 (0.527)	Data Time 0.001 (0.029)	Loss 2.4636 (2.3435)	Entropy 0.52683 (0.52862)	Top-1 acc 66.797 (67.688)	Top-5 acc 85.547 (86.304)	lr 0.00031
Train [112][1330/3239]	Time 0.280 (0.528)	Data Time 0.002 (0.029)	Loss 2.2983 (2.3435)	Entropy 0.52631 (0.52861)	Top-1 acc 69.922 (67.683)	Top-5 acc 85.156 (86.304)	lr 0.00031
Train [112][1340/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.029)	Loss 2.4631 (2.3440)	Entropy 0.52613 (0.52859)	Top-1 acc 65.625 (67.672)	Top-5 acc 82.812 (86.299)	lr 0.00031
Train [112][1350/3239]	Time 0.241 (0.527)	Data Time 0.001 (0.028)	Loss 2.1026 (2.3439)	Entropy 0.52616 (0.52857)	Top-1 acc 74.219 (67.672)	Top-5 acc 91.406 (86.299)	lr 0.00031
Train [112][1360/3239]	Time 0.233 (0.526)	Data Time 0.001 (0.028)	Loss 2.2088 (2.3433)	Entropy 0.52624 (0.52856)	Top-1 acc 71.484 (67.695)	Top-5 acc 87.891 (86.311)	lr 0.00031
Train [112][1370/3239]	Time 0.224 (0.525)	Data Time 0.001 (0.028)	Loss 2.2524 (2.3432)	Entropy 0.52639 (0.52854)	Top-1 acc 70.312 (67.701)	Top-5 acc 87.500 (86.313)	lr 0.00031
Train [112][1380/3239]	Time 0.326 (0.524)	Data Time 0.001 (0.028)	Loss 2.2099 (2.3428)	Entropy 0.52651 (0.52852)	Top-1 acc 71.484 (67.721)	Top-5 acc 90.234 (86.320)	lr 0.00031
Train [112][1390/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.028)	Loss 2.2633 (2.3428)	Entropy 0.52635 (0.52851)	Top-1 acc 67.188 (67.716)	Top-5 acc 89.844 (86.322)	lr 0.00031
Train [112][1400/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.027)	Loss 2.3399 (2.3429)	Entropy 0.52641 (0.52849)	Top-1 acc 68.359 (67.716)	Top-5 acc 87.109 (86.321)	lr 0.00031
Train [112][1410/3239]	Time 0.220 (0.522)	Data Time 0.001 (0.027)	Loss 2.3993 (2.3427)	Entropy 0.52655 (0.52848)	Top-1 acc 66.406 (67.717)	Top-5 acc 86.328 (86.321)	lr 0.00031
Train [112][1420/3239]	Time 0.236 (0.521)	Data Time 0.001 (0.027)	Loss 2.1544 (2.3427)	Entropy 0.52631 (0.52846)	Top-1 acc 72.266 (67.720)	Top-5 acc 91.406 (86.325)	lr 0.00031
Train [112][1430/3239]	Time 0.231 (0.520)	Data Time 0.001 (0.027)	Loss 2.3373 (2.3429)	Entropy 0.52609 (0.52845)	Top-1 acc 68.750 (67.713)	Top-5 acc 85.156 (86.315)	lr 0.00031
Train [112][1440/3239]	Time 0.234 (0.520)	Data Time 0.001 (0.027)	Loss 2.2392 (2.3431)	Entropy 0.52609 (0.52843)	Top-1 acc 71.094 (67.707)	Top-5 acc 85.938 (86.309)	lr 0.00031
Train [112][1450/3239]	Time 0.344 (0.519)	Data Time 0.001 (0.026)	Loss 2.4487 (2.3429)	Entropy 0.52631 (0.52842)	Top-1 acc 63.672 (67.711)	Top-5 acc 84.375 (86.317)	lr 0.00031
Train [112][1460/3239]	Time 0.282 (0.518)	Data Time 0.001 (0.026)	Loss 2.1705 (2.3428)	Entropy 0.52617 (0.52840)	Top-1 acc 71.484 (67.713)	Top-5 acc 87.891 (86.318)	lr 0.00031
Train [112][1470/3239]	Time 0.226 (0.518)	Data Time 0.001 (0.026)	Loss 2.5210 (2.3431)	Entropy 0.52606 (0.52839)	Top-1 acc 61.719 (67.709)	Top-5 acc 82.812 (86.308)	lr 0.00031
Train [112][1480/3239]	Time 0.231 (0.517)	Data Time 0.001 (0.026)	Loss 2.2729 (2.3433)	Entropy 0.52585 (0.52837)	Top-1 acc 69.922 (67.701)	Top-5 acc 86.328 (86.305)	lr 0.00031
Train [112][1490/3239]	Time 0.236 (0.516)	Data Time 0.001 (0.026)	Loss 2.2637 (2.3428)	Entropy 0.52550 (0.52835)	Top-1 acc 67.188 (67.709)	Top-5 acc 89.062 (86.312)	lr 0.00031
Train [112][1500/3239]	Time 0.236 (0.516)	Data Time 0.002 (0.026)	Loss 2.3653 (2.3427)	Entropy 0.52543 (0.52833)	Top-1 acc 67.188 (67.702)	Top-5 acc 87.109 (86.318)	lr 0.00031
Train [112][1510/3239]	Time 0.259 (0.515)	Data Time 0.001 (0.026)	Loss 2.4623 (2.3428)	Entropy 0.52485 (0.52831)	Top-1 acc 62.891 (67.703)	Top-5 acc 83.594 (86.319)	lr 0.00031
Train [112][1520/3239]	Time 0.227 (0.514)	Data Time 0.001 (0.025)	Loss 2.2573 (2.3427)	Entropy 0.52500 (0.52829)	Top-1 acc 69.531 (67.702)	Top-5 acc 87.500 (86.320)	lr 0.00031
Train [112][1530/3239]	Time 0.234 (0.514)	Data Time 0.001 (0.025)	Loss 2.1423 (2.3422)	Entropy 0.52517 (0.52827)	Top-1 acc 73.047 (67.717)	Top-5 acc 89.062 (86.324)	lr 0.00031
Train [112][1540/3239]	Time 0.327 (0.513)	Data Time 0.001 (0.025)	Loss 2.2231 (2.3422)	Entropy 0.52514 (0.52825)	Top-1 acc 67.188 (67.717)	Top-5 acc 89.453 (86.328)	lr 0.00031
Train [112][1550/3239]	Time 0.234 (0.512)	Data Time 0.001 (0.025)	Loss 2.2455 (2.3423)	Entropy 0.52489 (0.52823)	Top-1 acc 72.656 (67.715)	Top-5 acc 87.500 (86.327)	lr 0.00031
Train [112][1560/3239]	Time 0.224 (0.512)	Data Time 0.001 (0.025)	Loss 2.6571 (2.3427)	Entropy 0.52472 (0.52821)	Top-1 acc 60.156 (67.706)	Top-5 acc 83.203 (86.327)	lr 0.00031
Train [112][1570/3239]	Time 0.228 (0.511)	Data Time 0.001 (0.025)	Loss 2.3566 (2.3429)	Entropy 0.52462 (0.52818)	Top-1 acc 68.750 (67.694)	Top-5 acc 86.328 (86.321)	lr 0.00031
Train [112][1580/3239]	Time 0.233 (0.510)	Data Time 0.001 (0.024)	Loss 2.0812 (2.3430)	Entropy 0.52441 (0.52816)	Top-1 acc 73.047 (67.695)	Top-5 acc 89.062 (86.323)	lr 0.00031
Train [112][1590/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.024)	Loss 2.3146 (2.3433)	Entropy 0.52441 (0.52814)	Top-1 acc 67.188 (67.689)	Top-5 acc 86.719 (86.316)	lr 0.00031
Train [112][1600/3239]	Time 0.245 (0.509)	Data Time 0.002 (0.024)	Loss 2.3595 (2.3430)	Entropy 0.52440 (0.52811)	Top-1 acc 63.672 (67.697)	Top-5 acc 86.328 (86.323)	lr 0.00031
Train [112][1610/3239]	Time 0.325 (0.509)	Data Time 0.001 (0.024)	Loss 2.3976 (2.3432)	Entropy 0.52457 (0.52809)	Top-1 acc 67.578 (67.695)	Top-5 acc 84.375 (86.320)	lr 0.00031
Train [112][1620/3239]	Time 0.232 (0.508)	Data Time 0.001 (0.024)	Loss 2.2517 (2.3426)	Entropy 0.52445 (0.52807)	Top-1 acc 69.141 (67.706)	Top-5 acc 87.500 (86.329)	lr 0.00031
Train [112][1630/3239]	Time 0.238 (0.507)	Data Time 0.001 (0.024)	Loss 2.1632 (2.3422)	Entropy 0.52454 (0.52805)	Top-1 acc 74.219 (67.714)	Top-5 acc 88.281 (86.335)	lr 0.00031
Train [112][1640/3239]	Time 0.307 (0.507)	Data Time 0.002 (0.024)	Loss 2.4648 (2.3421)	Entropy 0.52455 (0.52803)	Top-1 acc 65.625 (67.718)	Top-5 acc 84.766 (86.335)	lr 0.00031
Train [112][1650/3239]	Time 0.232 (0.507)	Data Time 0.001 (0.023)	Loss 2.3501 (2.3422)	Entropy 0.52461 (0.52801)	Top-1 acc 69.922 (67.722)	Top-5 acc 89.062 (86.342)	lr 0.00031
Train [112][1660/3239]	Time 0.233 (0.506)	Data Time 0.001 (0.023)	Loss 2.2179 (2.3424)	Entropy 0.52469 (0.52799)	Top-1 acc 71.484 (67.711)	Top-5 acc 88.672 (86.340)	lr 0.00031
Train [112][1670/3239]	Time 0.283 (0.505)	Data Time 0.001 (0.023)	Loss 2.2944 (2.3421)	Entropy 0.52442 (0.52797)	Top-1 acc 69.141 (67.720)	Top-5 acc 87.109 (86.343)	lr 0.00031
Train [112][1680/3239]	Time 0.234 (0.505)	Data Time 0.001 (0.023)	Loss 2.1764 (2.3417)	Entropy 0.52419 (0.52794)	Top-1 acc 73.047 (67.729)	Top-5 acc 90.625 (86.348)	lr 0.00031
Train [112][1690/3239]	Time 0.236 (0.504)	Data Time 0.001 (0.023)	Loss 2.2486 (2.3413)	Entropy 0.52427 (0.52792)	Top-1 acc 72.656 (67.741)	Top-5 acc 90.234 (86.361)	lr 0.00031
Train [112][1700/3239]	Time 0.254 (0.504)	Data Time 0.001 (0.023)	Loss 2.4012 (2.3418)	Entropy 0.52447 (0.52790)	Top-1 acc 66.406 (67.730)	Top-5 acc 85.547 (86.352)	lr 0.00031
Train [112][1710/3239]	Time 0.267 (0.503)	Data Time 0.001 (0.023)	Loss 2.3345 (2.3415)	Entropy 0.52487 (0.52788)	Top-1 acc 65.625 (67.735)	Top-5 acc 85.938 (86.358)	lr 0.00031
Train [112][1720/3239]	Time 0.230 (0.503)	Data Time 0.001 (0.023)	Loss 2.1993 (2.3414)	Entropy 0.52447 (0.52786)	Top-1 acc 73.438 (67.741)	Top-5 acc 90.625 (86.361)	lr 0.00031
Train [112][1730/3239]	Time 0.222 (0.502)	Data Time 0.001 (0.022)	Loss 2.4059 (2.3415)	Entropy 0.52431 (0.52784)	Top-1 acc 65.234 (67.740)	Top-5 acc 84.375 (86.355)	lr 0.00031
Train [112][1740/3239]	Time 0.233 (0.502)	Data Time 0.001 (0.022)	Loss 2.2416 (2.3412)	Entropy 0.52437 (0.52782)	Top-1 acc 72.656 (67.752)	Top-5 acc 89.062 (86.361)	lr 0.00031
Train [112][1750/3239]	Time 0.260 (0.501)	Data Time 0.001 (0.022)	Loss 2.2369 (2.3408)	Entropy 0.52402 (0.52780)	Top-1 acc 72.656 (67.763)	Top-5 acc 87.891 (86.369)	lr 0.00031
Train [112][1760/3239]	Time 0.224 (0.501)	Data Time 0.001 (0.022)	Loss 2.1611 (2.3409)	Entropy 0.52373 (0.52778)	Top-1 acc 69.141 (67.755)	Top-5 acc 90.625 (86.369)	lr 0.00031
Train [112][1770/3239]	Time 0.351 (0.501)	Data Time 0.002 (0.022)	Loss 2.2176 (2.3409)	Entropy 0.52357 (0.52776)	Top-1 acc 69.141 (67.751)	Top-5 acc 88.281 (86.369)	lr 0.00030
Train [112][1780/3239]	Time 0.229 (0.500)	Data Time 0.001 (0.022)	Loss 2.2238 (2.3406)	Entropy 0.52342 (0.52773)	Top-1 acc 71.094 (67.762)	Top-5 acc 89.062 (86.374)	lr 0.00030
Train [112][1790/3239]	Time 0.235 (0.499)	Data Time 0.001 (0.022)	Loss 2.2440 (2.3405)	Entropy 0.52362 (0.52771)	Top-1 acc 71.094 (67.765)	Top-5 acc 87.109 (86.373)	lr 0.00030
Train [112][1800/3239]	Time 0.268 (0.499)	Data Time 0.001 (0.022)	Loss 2.2264 (2.3405)	Entropy 0.52375 (0.52769)	Top-1 acc 71.094 (67.770)	Top-5 acc 88.672 (86.374)	lr 0.00030
Train [112][1810/3239]	Time 0.229 (0.498)	Data Time 0.001 (0.022)	Loss 2.3641 (2.3407)	Entropy 0.52372 (0.52767)	Top-1 acc 67.188 (67.769)	Top-5 acc 87.500 (86.375)	lr 0.00030
Train [112][1820/3239]	Time 0.233 (0.498)	Data Time 0.001 (0.021)	Loss 2.1595 (2.3408)	Entropy 0.52379 (0.52764)	Top-1 acc 71.484 (67.767)	Top-5 acc 89.844 (86.375)	lr 0.00030
Train [112][1830/3239]	Time 0.227 (0.498)	Data Time 0.001 (0.021)	Loss 2.3795 (2.3411)	Entropy 0.52358 (0.52762)	Top-1 acc 65.234 (67.760)	Top-5 acc 86.328 (86.376)	lr 0.00030
Train [112][1840/3239]	Time 0.333 (0.497)	Data Time 0.001 (0.021)	Loss 2.6603 (2.3410)	Entropy 0.52331 (0.52760)	Top-1 acc 58.203 (67.760)	Top-5 acc 82.812 (86.381)	lr 0.00030
Train [112][1850/3239]	Time 0.228 (0.497)	Data Time 0.001 (0.021)	Loss 2.5418 (2.3410)	Entropy 0.52312 (0.52758)	Top-1 acc 67.188 (67.759)	Top-5 acc 82.422 (86.380)	lr 0.00030
Train [112][1860/3239]	Time 0.231 (0.496)	Data Time 0.001 (0.021)	Loss 2.2991 (2.3410)	Entropy 0.52278 (0.52755)	Top-1 acc 67.969 (67.756)	Top-5 acc 85.156 (86.380)	lr 0.00030
Train [112][1870/3239]	Time 0.222 (0.496)	Data Time 0.001 (0.021)	Loss 2.2385 (2.3412)	Entropy 0.52289 (0.52753)	Top-1 acc 70.312 (67.748)	Top-5 acc 89.062 (86.381)	lr 0.00030
Train [112][1880/3239]	Time 0.218 (0.495)	Data Time 0.001 (0.021)	Loss 2.4101 (2.3416)	Entropy 0.52290 (0.52750)	Top-1 acc 63.672 (67.735)	Top-5 acc 85.547 (86.376)	lr 0.00030
Train [112][1890/3239]	Time 0.341 (0.521)	Data Time 0.004 (0.021)	Loss 2.2326 (2.3415)	Entropy 0.52308 (0.52748)	Top-1 acc 69.141 (67.737)	Top-5 acc 87.500 (86.377)	lr 0.00030
Train [112][1900/3239]	Time 0.236 (0.521)	Data Time 0.002 (0.021)	Loss 2.3310 (2.3411)	Entropy 0.52285 (0.52746)	Top-1 acc 66.406 (67.748)	Top-5 acc 85.547 (86.381)	lr 0.00030
Train [112][1910/3239]	Time 0.235 (0.520)	Data Time 0.001 (0.021)	Loss 2.4690 (2.3411)	Entropy 0.52318 (0.52743)	Top-1 acc 64.453 (67.745)	Top-5 acc 80.859 (86.380)	lr 0.00030
Train [112][1920/3239]	Time 0.260 (0.520)	Data Time 0.002 (0.020)	Loss 2.2683 (2.3411)	Entropy 0.52329 (0.52741)	Top-1 acc 70.703 (67.751)	Top-5 acc 87.500 (86.378)	lr 0.00030
Train [112][1930/3239]	Time 0.339 (0.520)	Data Time 0.001 (0.020)	Loss 2.2649 (2.3409)	Entropy 0.52337 (0.52739)	Top-1 acc 68.750 (67.749)	Top-5 acc 87.109 (86.377)	lr 0.00030
Train [112][1940/3239]	Time 0.240 (0.519)	Data Time 0.001 (0.020)	Loss 2.2689 (2.3407)	Entropy 0.52342 (0.52737)	Top-1 acc 68.359 (67.753)	Top-5 acc 86.719 (86.373)	lr 0.00030
Train [112][1950/3239]	Time 0.228 (0.519)	Data Time 0.001 (0.020)	Loss 2.4885 (2.3405)	Entropy 0.52331 (0.52735)	Top-1 acc 65.625 (67.755)	Top-5 acc 82.812 (86.370)	lr 0.00030
Train [112][1960/3239]	Time 0.229 (0.518)	Data Time 0.001 (0.020)	Loss 2.3337 (2.3403)	Entropy 0.52338 (0.52733)	Top-1 acc 67.969 (67.761)	Top-5 acc 88.672 (86.379)	lr 0.00030
Train [112][1970/3239]	Time 0.226 (0.518)	Data Time 0.001 (0.020)	Loss 2.5379 (2.3404)	Entropy 0.52349 (0.52731)	Top-1 acc 64.062 (67.761)	Top-5 acc 82.031 (86.376)	lr 0.00030
Train [112][1980/3239]	Time 0.238 (0.517)	Data Time 0.001 (0.020)	Loss 2.2753 (2.3403)	Entropy 0.52375 (0.52729)	Top-1 acc 69.141 (67.762)	Top-5 acc 85.547 (86.378)	lr 0.00030
Train [112][1990/3239]	Time 0.225 (0.516)	Data Time 0.001 (0.020)	Loss 2.5467 (2.3403)	Entropy 0.52372 (0.52727)	Top-1 acc 60.156 (67.765)	Top-5 acc 83.594 (86.379)	lr 0.00030
Train [112][2000/3239]	Time 0.249 (0.516)	Data Time 0.001 (0.020)	Loss 2.2408 (2.3403)	Entropy 0.52358 (0.52725)	Top-1 acc 71.484 (67.767)	Top-5 acc 87.109 (86.378)	lr 0.00030
Train [112][2010/3239]	Time 0.224 (0.515)	Data Time 0.001 (0.020)	Loss 2.4782 (2.3406)	Entropy 0.52355 (0.52724)	Top-1 acc 64.844 (67.756)	Top-5 acc 83.203 (86.371)	lr 0.00030
Train [112][2020/3239]	Time 0.228 (0.515)	Data Time 0.001 (0.020)	Loss 2.3958 (2.3402)	Entropy 0.52352 (0.52722)	Top-1 acc 67.188 (67.765)	Top-5 acc 84.375 (86.378)	lr 0.00030
Train [112][2030/3239]	Time 0.230 (0.514)	Data Time 0.001 (0.019)	Loss 2.4848 (2.3400)	Entropy 0.52348 (0.52720)	Top-1 acc 64.844 (67.771)	Top-5 acc 83.203 (86.380)	lr 0.00030
Train [112][2040/3239]	Time 0.216 (0.514)	Data Time 0.001 (0.019)	Loss 2.4743 (2.3405)	Entropy 0.52337 (0.52718)	Top-1 acc 64.453 (67.756)	Top-5 acc 84.375 (86.371)	lr 0.00030
Train [112][2050/3239]	Time 0.232 (0.513)	Data Time 0.001 (0.019)	Loss 2.3344 (2.3405)	Entropy 0.52317 (0.52716)	Top-1 acc 66.406 (67.752)	Top-5 acc 88.281 (86.371)	lr 0.00030
Train [112][2060/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.019)	Loss 2.6132 (2.3411)	Entropy 0.52350 (0.52714)	Top-1 acc 63.672 (67.738)	Top-5 acc 82.422 (86.361)	lr 0.00030
Train [112][2070/3239]	Time 0.259 (0.512)	Data Time 0.001 (0.019)	Loss 2.3232 (2.3409)	Entropy 0.52395 (0.52713)	Top-1 acc 69.531 (67.746)	Top-5 acc 87.891 (86.365)	lr 0.00030
Train [112][2080/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.019)	Loss 2.3508 (2.3407)	Entropy 0.52391 (0.52711)	Top-1 acc 67.188 (67.748)	Top-5 acc 86.719 (86.367)	lr 0.00030
Train [112][2090/3239]	Time 0.319 (0.511)	Data Time 0.001 (0.019)	Loss 2.2857 (2.3405)	Entropy 0.52375 (0.52710)	Top-1 acc 69.141 (67.753)	Top-5 acc 86.328 (86.372)	lr 0.00030
Train [112][2100/3239]	Time 0.232 (0.511)	Data Time 0.001 (0.019)	Loss 2.2535 (2.3403)	Entropy 0.52383 (0.52708)	Top-1 acc 67.969 (67.760)	Top-5 acc 89.453 (86.376)	lr 0.00030
Train [112][2110/3239]	Time 0.238 (0.510)	Data Time 0.001 (0.019)	Loss 2.2434 (2.3402)	Entropy 0.52392 (0.52707)	Top-1 acc 71.875 (67.759)	Top-5 acc 86.328 (86.378)	lr 0.00030
Train [112][2120/3239]	Time 0.233 (0.510)	Data Time 0.001 (0.019)	Loss 2.4350 (2.3402)	Entropy 0.52386 (0.52705)	Top-1 acc 65.625 (67.761)	Top-5 acc 83.594 (86.375)	lr 0.00030
Train [112][2130/3239]	Time 0.233 (0.509)	Data Time 0.001 (0.019)	Loss 2.2919 (2.3404)	Entropy 0.52390 (0.52704)	Top-1 acc 68.359 (67.762)	Top-5 acc 85.156 (86.374)	lr 0.00030
Train [112][2140/3239]	Time 0.245 (0.509)	Data Time 0.001 (0.019)	Loss 2.4642 (2.3403)	Entropy 0.52387 (0.52702)	Top-1 acc 64.844 (67.760)	Top-5 acc 83.984 (86.377)	lr 0.00030
Train [112][2150/3239]	Time 0.233 (0.509)	Data Time 0.001 (0.018)	Loss 2.0715 (2.3399)	Entropy 0.52421 (0.52701)	Top-1 acc 74.609 (67.765)	Top-5 acc 92.188 (86.386)	lr 0.00030
Train [112][2160/3239]	Time 0.324 (0.508)	Data Time 0.001 (0.018)	Loss 2.3596 (2.3401)	Entropy 0.52418 (0.52699)	Top-1 acc 65.625 (67.753)	Top-5 acc 85.938 (86.382)	lr 0.00030
Train [112][2170/3239]	Time 0.235 (0.508)	Data Time 0.001 (0.018)	Loss 2.3854 (2.3400)	Entropy 0.52432 (0.52698)	Top-1 acc 67.188 (67.752)	Top-5 acc 83.594 (86.385)	lr 0.00030
Train [112][2180/3239]	Time 0.232 (0.507)	Data Time 0.001 (0.018)	Loss 2.4024 (2.3398)	Entropy 0.52426 (0.52697)	Top-1 acc 69.141 (67.758)	Top-5 acc 83.594 (86.388)	lr 0.00030
Train [112][2190/3239]	Time 0.229 (0.507)	Data Time 0.001 (0.018)	Loss 2.4504 (2.3399)	Entropy 0.52437 (0.52696)	Top-1 acc 63.281 (67.755)	Top-5 acc 82.422 (86.384)	lr 0.00030
Train [112][2200/3239]	Time 0.238 (0.506)	Data Time 0.001 (0.018)	Loss 2.1248 (2.3397)	Entropy 0.52444 (0.52695)	Top-1 acc 71.094 (67.763)	Top-5 acc 91.406 (86.386)	lr 0.00030
Train [112][2210/3239]	Time 0.232 (0.506)	Data Time 0.001 (0.018)	Loss 2.3052 (2.3398)	Entropy 0.52441 (0.52694)	Top-1 acc 66.797 (67.761)	Top-5 acc 85.938 (86.383)	lr 0.00030
Train [112][2220/3239]	Time 0.255 (0.505)	Data Time 0.001 (0.018)	Loss 2.5707 (2.3398)	Entropy 0.52468 (0.52692)	Top-1 acc 63.672 (67.759)	Top-5 acc 83.594 (86.384)	lr 0.00029
Train [112][2230/3239]	Time 0.228 (0.505)	Data Time 0.001 (0.018)	Loss 2.3378 (2.3398)	Entropy 0.52479 (0.52691)	Top-1 acc 66.016 (67.763)	Top-5 acc 87.109 (86.383)	lr 0.00029
Train [112][2240/3239]	Time 0.230 (0.505)	Data Time 0.001 (0.018)	Loss 2.5021 (2.3401)	Entropy 0.52465 (0.52690)	Top-1 acc 64.062 (67.755)	Top-5 acc 85.547 (86.379)	lr 0.00029
Train [112][2250/3239]	Time 0.246 (0.504)	Data Time 0.001 (0.018)	Loss 2.2511 (2.3404)	Entropy 0.52463 (0.52689)	Top-1 acc 72.266 (67.749)	Top-5 acc 87.109 (86.372)	lr 0.00029
Train [112][2260/3239]	Time 0.285 (0.504)	Data Time 0.001 (0.018)	Loss 2.1971 (2.3403)	Entropy 0.52430 (0.52688)	Top-1 acc 73.438 (67.758)	Top-5 acc 86.719 (86.373)	lr 0.00029
Train [112][2270/3239]	Time 0.288 (0.503)	Data Time 0.002 (0.018)	Loss 2.2170 (2.3407)	Entropy 0.52422 (0.52687)	Top-1 acc 73.047 (67.749)	Top-5 acc 86.719 (86.365)	lr 0.00029
Train [112][2280/3239]	Time 0.263 (0.503)	Data Time 0.001 (0.017)	Loss 2.4743 (2.3408)	Entropy 0.52431 (0.52686)	Top-1 acc 65.625 (67.748)	Top-5 acc 83.203 (86.364)	lr 0.00029
Train [112][2290/3239]	Time 0.234 (0.503)	Data Time 0.001 (0.017)	Loss 2.6269 (2.3411)	Entropy 0.52441 (0.52685)	Top-1 acc 60.938 (67.742)	Top-5 acc 81.641 (86.358)	lr 0.00029
Train [112][2300/3239]	Time 0.266 (0.502)	Data Time 0.001 (0.017)	Loss 2.1789 (2.3410)	Entropy 0.52425 (0.52684)	Top-1 acc 69.141 (67.743)	Top-5 acc 89.844 (86.357)	lr 0.00029
Train [112][2310/3239]	Time 0.222 (0.502)	Data Time 0.001 (0.017)	Loss 2.4696 (2.3409)	Entropy 0.52423 (0.52683)	Top-1 acc 66.016 (67.747)	Top-5 acc 87.500 (86.361)	lr 0.00029
Train [112][2320/3239]	Time 0.330 (0.501)	Data Time 0.001 (0.017)	Loss 2.3804 (2.3409)	Entropy 0.52396 (0.52682)	Top-1 acc 64.844 (67.743)	Top-5 acc 86.328 (86.362)	lr 0.00029
Train [112][2330/3239]	Time 0.235 (0.501)	Data Time 0.001 (0.017)	Loss 2.5649 (2.3409)	Entropy 0.52388 (0.52680)	Top-1 acc 62.109 (67.741)	Top-5 acc 82.031 (86.361)	lr 0.00029
Train [112][2340/3239]	Time 0.233 (0.501)	Data Time 0.001 (0.017)	Loss 2.3143 (2.3408)	Entropy 0.52393 (0.52679)	Top-1 acc 71.484 (67.742)	Top-5 acc 87.500 (86.363)	lr 0.00029
Train [112][2350/3239]	Time 0.258 (0.500)	Data Time 0.001 (0.017)	Loss 2.3131 (2.3406)	Entropy 0.52391 (0.52678)	Top-1 acc 69.141 (67.751)	Top-5 acc 87.891 (86.366)	lr 0.00029
Train [112][2360/3239]	Time 0.228 (0.500)	Data Time 0.001 (0.017)	Loss 2.4521 (2.3406)	Entropy 0.52393 (0.52677)	Top-1 acc 62.500 (67.748)	Top-5 acc 87.891 (86.370)	lr 0.00029
Train [112][2370/3239]	Time 0.233 (0.500)	Data Time 0.001 (0.017)	Loss 2.3027 (2.3404)	Entropy 0.52396 (0.52676)	Top-1 acc 69.531 (67.756)	Top-5 acc 85.938 (86.373)	lr 0.00029
Train [112][2380/3239]	Time 0.229 (0.499)	Data Time 0.001 (0.017)	Loss 2.4689 (2.3407)	Entropy 0.52411 (0.52674)	Top-1 acc 65.625 (67.750)	Top-5 acc 84.766 (86.371)	lr 0.00029
Train [112][2390/3239]	Time 0.319 (0.499)	Data Time 0.001 (0.017)	Loss 2.4341 (2.3408)	Entropy 0.52416 (0.52673)	Top-1 acc 64.453 (67.746)	Top-5 acc 80.469 (86.367)	lr 0.00029
Train [112][2400/3239]	Time 0.225 (0.498)	Data Time 0.001 (0.017)	Loss 2.3984 (2.3410)	Entropy 0.52424 (0.52672)	Top-1 acc 63.672 (67.740)	Top-5 acc 86.719 (86.366)	lr 0.00029
Train [112][2410/3239]	Time 0.231 (0.498)	Data Time 0.001 (0.017)	Loss 2.2917 (2.3411)	Entropy 0.52412 (0.52671)	Top-1 acc 71.094 (67.739)	Top-5 acc 85.156 (86.364)	lr 0.00029
Train [112][2420/3239]	Time 0.231 (0.498)	Data Time 0.001 (0.017)	Loss 2.3475 (2.3411)	Entropy 0.52424 (0.52670)	Top-1 acc 63.281 (67.738)	Top-5 acc 87.109 (86.364)	lr 0.00029
Train [112][2430/3239]	Time 0.233 (0.497)	Data Time 0.001 (0.016)	Loss 2.3905 (2.3413)	Entropy 0.52420 (0.52669)	Top-1 acc 66.406 (67.733)	Top-5 acc 86.719 (86.360)	lr 0.00029
Train [112][2440/3239]	Time 0.236 (0.497)	Data Time 0.002 (0.016)	Loss 2.2352 (2.3413)	Entropy 0.52416 (0.52668)	Top-1 acc 70.312 (67.732)	Top-5 acc 88.281 (86.359)	lr 0.00029
Train [112][2450/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.016)	Loss 2.2334 (2.3412)	Entropy 0.52454 (0.52667)	Top-1 acc 70.703 (67.735)	Top-5 acc 89.453 (86.361)	lr 0.00029
Train [112][2460/3239]	Time 0.229 (0.496)	Data Time 0.001 (0.016)	Loss 2.3477 (2.3415)	Entropy 0.52470 (0.52666)	Top-1 acc 69.141 (67.731)	Top-5 acc 85.938 (86.358)	lr 0.00029
Train [112][2470/3239]	Time 0.233 (0.496)	Data Time 0.001 (0.016)	Loss 2.4375 (2.3414)	Entropy 0.52486 (0.52666)	Top-1 acc 62.891 (67.733)	Top-5 acc 84.375 (86.358)	lr 0.00029
Train [112][2480/3239]	Time 0.310 (0.495)	Data Time 0.001 (0.016)	Loss 2.3294 (2.3413)	Entropy 0.52486 (0.52665)	Top-1 acc 66.016 (67.738)	Top-5 acc 88.281 (86.359)	lr 0.00029
Train [112][2490/3239]	Time 0.236 (0.495)	Data Time 0.001 (0.016)	Loss 2.2056 (2.3418)	Entropy 0.52497 (0.52664)	Top-1 acc 67.188 (67.729)	Top-5 acc 90.234 (86.351)	lr 0.00029
Train [112][2500/3239]	Time 0.226 (0.495)	Data Time 0.001 (0.016)	Loss 2.4231 (2.3417)	Entropy 0.52488 (0.52663)	Top-1 acc 67.578 (67.737)	Top-5 acc 83.594 (86.353)	lr 0.00029
Train [112][2510/3239]	Time 0.237 (0.494)	Data Time 0.001 (0.016)	Loss 2.3323 (2.3414)	Entropy 0.52500 (0.52663)	Top-1 acc 68.750 (67.741)	Top-5 acc 83.594 (86.357)	lr 0.00029
Train [112][2520/3239]	Time 0.237 (0.494)	Data Time 0.001 (0.016)	Loss 2.6179 (2.3414)	Entropy 0.52501 (0.52662)	Top-1 acc 62.500 (67.736)	Top-5 acc 82.422 (86.356)	lr 0.00029
Train [112][2530/3239]	Time 0.229 (0.494)	Data Time 0.001 (0.016)	Loss 2.4906 (2.3412)	Entropy 0.52534 (0.52662)	Top-1 acc 69.141 (67.746)	Top-5 acc 85.547 (86.358)	lr 0.00029
Train [112][2540/3239]	Time 0.233 (0.493)	Data Time 0.001 (0.016)	Loss 2.5151 (2.3410)	Entropy 0.52507 (0.52661)	Top-1 acc 64.062 (67.750)	Top-5 acc 81.250 (86.364)	lr 0.00029
Train [112][2550/3239]	Time 0.405 (0.514)	Data Time 0.002 (0.016)	Loss 2.2923 (2.3409)	Entropy 0.52490 (0.52660)	Top-1 acc 66.797 (67.751)	Top-5 acc 87.109 (86.368)	lr 0.00029
Train [112][2560/3239]	Time 0.237 (0.514)	Data Time 0.002 (0.016)	Loss 2.3354 (2.3408)	Entropy 0.52489 (0.52660)	Top-1 acc 68.359 (67.755)	Top-5 acc 86.328 (86.371)	lr 0.00029
Train [112][2570/3239]	Time 0.241 (0.513)	Data Time 0.001 (0.016)	Loss 2.3251 (2.3409)	Entropy 0.52506 (0.52659)	Top-1 acc 66.406 (67.755)	Top-5 acc 87.500 (86.367)	lr 0.00029
Train [112][2580/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.016)	Loss 2.5556 (2.3409)	Entropy 0.52529 (0.52658)	Top-1 acc 56.250 (67.753)	Top-5 acc 84.375 (86.369)	lr 0.00029
Train [112][2590/3239]	Time 0.225 (0.513)	Data Time 0.001 (0.016)	Loss 2.4065 (2.3409)	Entropy 0.52550 (0.52658)	Top-1 acc 62.891 (67.748)	Top-5 acc 87.109 (86.371)	lr 0.00029
Train [112][2600/3239]	Time 0.258 (0.512)	Data Time 0.001 (0.016)	Loss 2.4008 (2.3409)	Entropy 0.52515 (0.52658)	Top-1 acc 66.406 (67.742)	Top-5 acc 85.156 (86.372)	lr 0.00029
Train [112][2610/3239]	Time 0.233 (0.512)	Data Time 0.001 (0.015)	Loss 2.3007 (2.3411)	Entropy 0.52526 (0.52657)	Top-1 acc 69.922 (67.737)	Top-5 acc 87.891 (86.370)	lr 0.00029
Train [112][2620/3239]	Time 0.223 (0.512)	Data Time 0.001 (0.015)	Loss 2.4371 (2.3415)	Entropy 0.52526 (0.52657)	Top-1 acc 67.188 (67.731)	Top-5 acc 86.328 (86.366)	lr 0.00029
Train [112][2630/3239]	Time 0.228 (0.511)	Data Time 0.001 (0.015)	Loss 2.1569 (2.3413)	Entropy 0.52528 (0.52656)	Top-1 acc 69.141 (67.733)	Top-5 acc 91.016 (86.367)	lr 0.00029
Train [112][2640/3239]	Time 0.327 (0.511)	Data Time 0.001 (0.015)	Loss 2.3181 (2.3412)	Entropy 0.52530 (0.52656)	Top-1 acc 67.969 (67.737)	Top-5 acc 86.719 (86.368)	lr 0.00029
Train [112][2650/3239]	Time 0.263 (0.511)	Data Time 0.003 (0.015)	Loss 2.2393 (2.3412)	Entropy 0.52530 (0.52655)	Top-1 acc 69.531 (67.738)	Top-5 acc 88.281 (86.366)	lr 0.00029
Train [112][2660/3239]	Time 0.237 (0.510)	Data Time 0.001 (0.015)	Loss 2.5006 (2.3413)	Entropy 0.52531 (0.52655)	Top-1 acc 62.891 (67.735)	Top-5 acc 85.938 (86.364)	lr 0.00029
Train [112][2670/3239]	Time 0.235 (0.510)	Data Time 0.001 (0.015)	Loss 2.4807 (2.3411)	Entropy 0.52523 (0.52654)	Top-1 acc 63.672 (67.740)	Top-5 acc 81.641 (86.367)	lr 0.00029
Train [112][2680/3239]	Time 0.240 (0.510)	Data Time 0.001 (0.015)	Loss 2.3681 (2.3415)	Entropy 0.52551 (0.52654)	Top-1 acc 67.578 (67.730)	Top-5 acc 87.109 (86.364)	lr 0.00029
Train [112][2690/3239]	Time 0.283 (0.509)	Data Time 0.001 (0.015)	Loss 2.2794 (2.3415)	Entropy 0.52532 (0.52653)	Top-1 acc 71.484 (67.734)	Top-5 acc 87.109 (86.362)	lr 0.00028
Train [112][2700/3239]	Time 0.254 (0.509)	Data Time 0.002 (0.015)	Loss 2.3305 (2.3416)	Entropy 0.52513 (0.52653)	Top-1 acc 69.922 (67.733)	Top-5 acc 87.500 (86.359)	lr 0.00028
Train [112][2710/3239]	Time 0.360 (0.509)	Data Time 0.002 (0.015)	Loss 2.3930 (2.3419)	Entropy 0.52525 (0.52652)	Top-1 acc 66.406 (67.727)	Top-5 acc 85.156 (86.354)	lr 0.00028
Train [112][2720/3239]	Time 0.272 (0.508)	Data Time 0.002 (0.015)	Loss 2.6756 (2.3420)	Entropy 0.52516 (0.52652)	Top-1 acc 63.281 (67.726)	Top-5 acc 81.641 (86.356)	lr 0.00028
Train [112][2730/3239]	Time 0.275 (0.508)	Data Time 0.001 (0.015)	Loss 2.3568 (2.3421)	Entropy 0.52506 (0.52651)	Top-1 acc 65.234 (67.724)	Top-5 acc 85.547 (86.354)	lr 0.00028
Train [112][2740/3239]	Time 0.230 (0.508)	Data Time 0.001 (0.015)	Loss 2.4095 (2.3421)	Entropy 0.52523 (0.52651)	Top-1 acc 70.703 (67.724)	Top-5 acc 85.156 (86.352)	lr 0.00028
Train [112][2750/3239]	Time 0.233 (0.508)	Data Time 0.001 (0.015)	Loss 2.1944 (2.3420)	Entropy 0.52510 (0.52650)	Top-1 acc 71.094 (67.729)	Top-5 acc 87.891 (86.353)	lr 0.00028
Train [112][2760/3239]	Time 0.253 (0.507)	Data Time 0.001 (0.015)	Loss 2.2203 (2.3417)	Entropy 0.52494 (0.52650)	Top-1 acc 67.188 (67.736)	Top-5 acc 89.062 (86.355)	lr 0.00028
Train [112][2770/3239]	Time 0.229 (0.507)	Data Time 0.001 (0.015)	Loss 2.3659 (2.3419)	Entropy 0.52494 (0.52649)	Top-1 acc 67.188 (67.733)	Top-5 acc 85.938 (86.350)	lr 0.00028
Train [112][2780/3239]	Time 0.290 (0.507)	Data Time 0.001 (0.015)	Loss 2.3249 (2.3419)	Entropy 0.52544 (0.52649)	Top-1 acc 69.922 (67.732)	Top-5 acc 85.938 (86.349)	lr 0.00028
Train [112][2790/3239]	Time 0.253 (0.507)	Data Time 0.001 (0.015)	Loss 2.1886 (2.3420)	Entropy 0.52496 (0.52648)	Top-1 acc 71.484 (67.728)	Top-5 acc 89.453 (86.348)	lr 0.00028
Train [112][2800/3239]	Time 0.292 (0.507)	Data Time 0.001 (0.015)	Loss 2.2350 (2.3421)	Entropy 0.52500 (0.52648)	Top-1 acc 71.875 (67.725)	Top-5 acc 89.062 (86.347)	lr 0.00028
Train [112][2810/3239]	Time 0.220 (0.506)	Data Time 0.001 (0.015)	Loss 2.4707 (2.3424)	Entropy 0.52488 (0.52647)	Top-1 acc 64.844 (67.718)	Top-5 acc 85.938 (86.342)	lr 0.00028
Train [112][2820/3239]	Time 0.215 (0.506)	Data Time 0.001 (0.014)	Loss 2.5004 (2.3424)	Entropy 0.52492 (0.52647)	Top-1 acc 64.844 (67.719)	Top-5 acc 82.422 (86.337)	lr 0.00028
Train [112][2830/3239]	Time 0.264 (0.506)	Data Time 0.001 (0.014)	Loss 2.3910 (2.3425)	Entropy 0.52500 (0.52646)	Top-1 acc 67.188 (67.712)	Top-5 acc 85.156 (86.334)	lr 0.00028
Train [112][2840/3239]	Time 0.232 (0.505)	Data Time 0.001 (0.014)	Loss 2.2897 (2.3426)	Entropy 0.52469 (0.52646)	Top-1 acc 70.312 (67.711)	Top-5 acc 87.109 (86.334)	lr 0.00028
Train [112][2850/3239]	Time 0.272 (0.505)	Data Time 0.001 (0.014)	Loss 2.6051 (2.3426)	Entropy 0.52468 (0.52645)	Top-1 acc 60.547 (67.712)	Top-5 acc 82.031 (86.334)	lr 0.00028
Train [112][2860/3239]	Time 0.234 (0.505)	Data Time 0.001 (0.014)	Loss 2.2555 (2.3426)	Entropy 0.52480 (0.52644)	Top-1 acc 68.750 (67.713)	Top-5 acc 88.672 (86.331)	lr 0.00028
Train [112][2870/3239]	Time 0.332 (0.504)	Data Time 0.001 (0.014)	Loss 2.2624 (2.3426)	Entropy 0.52474 (0.52644)	Top-1 acc 72.266 (67.713)	Top-5 acc 88.672 (86.332)	lr 0.00028
Train [112][2880/3239]	Time 0.230 (0.504)	Data Time 0.001 (0.014)	Loss 2.3004 (2.3426)	Entropy 0.52497 (0.52643)	Top-1 acc 70.312 (67.713)	Top-5 acc 85.938 (86.332)	lr 0.00028
Train [112][2890/3239]	Time 0.230 (0.504)	Data Time 0.001 (0.014)	Loss 2.5234 (2.3427)	Entropy 0.52481 (0.52643)	Top-1 acc 60.938 (67.712)	Top-5 acc 83.594 (86.328)	lr 0.00028
Train [112][2900/3239]	Time 0.239 (0.504)	Data Time 0.001 (0.014)	Loss 2.4298 (2.3425)	Entropy 0.52481 (0.52642)	Top-1 acc 66.406 (67.716)	Top-5 acc 86.719 (86.331)	lr 0.00028
Train [112][2910/3239]	Time 0.238 (0.503)	Data Time 0.001 (0.014)	Loss 2.2617 (2.3424)	Entropy 0.52484 (0.52642)	Top-1 acc 66.016 (67.714)	Top-5 acc 88.281 (86.333)	lr 0.00028
Train [112][2920/3239]	Time 0.233 (0.503)	Data Time 0.001 (0.014)	Loss 2.2445 (2.3423)	Entropy 0.52438 (0.52641)	Top-1 acc 73.047 (67.716)	Top-5 acc 88.672 (86.336)	lr 0.00028
Train [112][2930/3239]	Time 0.232 (0.503)	Data Time 0.002 (0.014)	Loss 2.2687 (2.3423)	Entropy 0.52445 (0.52640)	Top-1 acc 69.531 (67.718)	Top-5 acc 86.328 (86.339)	lr 0.00028
Train [112][2940/3239]	Time 0.331 (0.502)	Data Time 0.001 (0.014)	Loss 2.4816 (2.3423)	Entropy 0.52440 (0.52640)	Top-1 acc 64.062 (67.718)	Top-5 acc 87.109 (86.340)	lr 0.00028
Train [112][2950/3239]	Time 0.235 (0.502)	Data Time 0.001 (0.014)	Loss 2.4482 (2.3424)	Entropy 0.52428 (0.52639)	Top-1 acc 66.797 (67.716)	Top-5 acc 83.984 (86.338)	lr 0.00028
Train [112][2960/3239]	Time 0.236 (0.502)	Data Time 0.001 (0.014)	Loss 2.2978 (2.3425)	Entropy 0.52429 (0.52638)	Top-1 acc 69.922 (67.715)	Top-5 acc 88.281 (86.336)	lr 0.00028
Train [112][2970/3239]	Time 0.341 (0.502)	Data Time 0.003 (0.014)	Loss 2.4361 (2.3426)	Entropy 0.52431 (0.52638)	Top-1 acc 66.016 (67.712)	Top-5 acc 84.375 (86.333)	lr 0.00028
Train [112][2980/3239]	Time 0.232 (0.501)	Data Time 0.001 (0.014)	Loss 2.2051 (2.3427)	Entropy 0.52442 (0.52637)	Top-1 acc 72.266 (67.712)	Top-5 acc 87.500 (86.330)	lr 0.00028
Train [112][2990/3239]	Time 0.264 (0.501)	Data Time 0.001 (0.014)	Loss 2.5201 (2.3428)	Entropy 0.52420 (0.52636)	Top-1 acc 65.234 (67.709)	Top-5 acc 81.641 (86.327)	lr 0.00028
Train [112][3000/3239]	Time 0.240 (0.501)	Data Time 0.001 (0.014)	Loss 2.2577 (2.3429)	Entropy 0.52429 (0.52635)	Top-1 acc 69.922 (67.708)	Top-5 acc 88.672 (86.327)	lr 0.00028
Train [112][3010/3239]	Time 0.228 (0.501)	Data Time 0.001 (0.014)	Loss 2.4324 (2.3430)	Entropy 0.52414 (0.52635)	Top-1 acc 66.797 (67.711)	Top-5 acc 85.547 (86.328)	lr 0.00028
Train [112][3020/3239]	Time 0.225 (0.500)	Data Time 0.001 (0.014)	Loss 2.2916 (2.3430)	Entropy 0.52411 (0.52634)	Top-1 acc 67.188 (67.714)	Top-5 acc 85.938 (86.325)	lr 0.00028
Train [112][3030/3239]	Time 0.397 (0.500)	Data Time 0.001 (0.014)	Loss 2.2750 (2.3432)	Entropy 0.52417 (0.52633)	Top-1 acc 68.750 (67.710)	Top-5 acc 89.062 (86.321)	lr 0.00028
Train [112][3040/3239]	Time 0.260 (0.500)	Data Time 0.001 (0.014)	Loss 2.3878 (2.3435)	Entropy 0.52416 (0.52633)	Top-1 acc 66.797 (67.706)	Top-5 acc 85.156 (86.316)	lr 0.00028
Train [112][3050/3239]	Time 0.247 (0.500)	Data Time 0.001 (0.014)	Loss 2.3027 (2.3434)	Entropy 0.52412 (0.52632)	Top-1 acc 71.875 (67.704)	Top-5 acc 84.766 (86.317)	lr 0.00028
Train [112][3060/3239]	Time 0.232 (0.499)	Data Time 0.001 (0.013)	Loss 2.2268 (2.3432)	Entropy 0.52414 (0.52631)	Top-1 acc 71.484 (67.709)	Top-5 acc 89.453 (86.323)	lr 0.00028
Train [112][3070/3239]	Time 0.233 (0.499)	Data Time 0.001 (0.013)	Loss 2.3835 (2.3433)	Entropy 0.52404 (0.52630)	Top-1 acc 66.797 (67.707)	Top-5 acc 85.547 (86.322)	lr 0.00028
Train [112][3080/3239]	Time 0.226 (0.499)	Data Time 0.001 (0.013)	Loss 2.3657 (2.3433)	Entropy 0.52358 (0.52630)	Top-1 acc 68.750 (67.710)	Top-5 acc 86.328 (86.324)	lr 0.00028
Train [112][3090/3239]	Time 0.232 (0.499)	Data Time 0.001 (0.013)	Loss 2.4938 (2.3433)	Entropy 0.52380 (0.52629)	Top-1 acc 64.453 (67.707)	Top-5 acc 85.156 (86.328)	lr 0.00028
Train [112][3100/3239]	Time 0.323 (0.498)	Data Time 0.001 (0.013)	Loss 2.2371 (2.3432)	Entropy 0.52392 (0.52628)	Top-1 acc 71.094 (67.706)	Top-5 acc 88.281 (86.330)	lr 0.00028
Train [112][3110/3239]	Time 0.239 (0.498)	Data Time 0.001 (0.013)	Loss 2.3968 (2.3432)	Entropy 0.52402 (0.52627)	Top-1 acc 62.891 (67.707)	Top-5 acc 85.547 (86.333)	lr 0.00028
Train [112][3120/3239]	Time 0.249 (0.498)	Data Time 0.001 (0.013)	Loss 2.1814 (2.3430)	Entropy 0.52405 (0.52626)	Top-1 acc 73.047 (67.712)	Top-5 acc 87.891 (86.334)	lr 0.00028
Train [112][3130/3239]	Time 0.230 (0.498)	Data Time 0.001 (0.013)	Loss 2.3611 (2.3428)	Entropy 0.52418 (0.52626)	Top-1 acc 66.016 (67.715)	Top-5 acc 85.547 (86.338)	lr 0.00028
Train [112][3140/3239]	Time 0.258 (0.497)	Data Time 0.002 (0.013)	Loss 2.5530 (2.3429)	Entropy 0.52429 (0.52625)	Top-1 acc 61.328 (67.712)	Top-5 acc 85.547 (86.336)	lr 0.00028
Train [112][3150/3239]	Time 0.285 (0.497)	Data Time 0.002 (0.013)	Loss 2.2258 (2.3430)	Entropy 0.52423 (0.52625)	Top-1 acc 73.047 (67.711)	Top-5 acc 87.500 (86.337)	lr 0.00028
Train [112][3160/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.013)	Loss 2.5482 (2.3429)	Entropy 0.52441 (0.52624)	Top-1 acc 61.328 (67.709)	Top-5 acc 85.156 (86.340)	lr 0.00027
Train [112][3170/3239]	Time 0.325 (0.497)	Data Time 0.002 (0.013)	Loss 2.4495 (2.3432)	Entropy 0.52469 (0.52623)	Top-1 acc 65.234 (67.703)	Top-5 acc 81.641 (86.335)	lr 0.00027
Train [112][3180/3239]	Time 0.219 (0.497)	Data Time 0.000 (0.013)	Loss 2.2911 (2.3431)	Entropy 0.52448 (0.52623)	Top-1 acc 72.266 (67.704)	Top-5 acc 84.766 (86.336)	lr 0.00027
Train [112][3190/3239]	Time 0.315 (0.497)	Data Time 0.000 (0.013)	Loss 2.6195 (2.3428)	Entropy 0.52442 (0.52622)	Top-1 acc 58.984 (67.711)	Top-5 acc 82.031 (86.340)	lr 0.00027
Train [112][3200/3239]	Time 0.324 (0.512)	Data Time 0.000 (0.013)	Loss 2.4485 (2.3427)	Entropy 0.52461 (0.52622)	Top-1 acc 64.453 (67.712)	Top-5 acc 83.594 (86.340)	lr 0.00027
Train [112][3210/3239]	Time 0.228 (0.512)	Data Time 0.000 (0.013)	Loss 2.3855 (2.3426)	Entropy 0.52476 (0.52621)	Top-1 acc 65.234 (67.715)	Top-5 acc 85.547 (86.340)	lr 0.00027
Train [112][3220/3239]	Time 0.227 (0.512)	Data Time 0.000 (0.013)	Loss 2.3364 (2.3426)	Entropy 0.52465 (0.52621)	Top-1 acc 68.750 (67.718)	Top-5 acc 86.328 (86.339)	lr 0.00027
Train [112][3230/3239]	Time 0.235 (0.511)	Data Time 0.000 (0.013)	Loss 2.3112 (2.3426)	Entropy 0.52476 (0.52620)	Top-1 acc 68.359 (67.714)	Top-5 acc 87.891 (86.338)	lr 0.00027
Train [112][3239/3239]	Time 0.961 (0.511)	Data Time 0.000 (0.013)	Loss 2.6336 (2.3426)	Entropy 0.52468 (0.52620)	Top-1 acc 59.259 (67.715)	Top-5 acc 82.716 (86.341)	lr 0.00027
==========Valid [112/120]	loss 1.172	top-1 acc 73.003 (73.154)	top-5 acc 90.608	Train top-1 67.715	top-5 86.341	Entropy 0.52468	Latency-None: 0.000ms	Flops: 539.00M
Train [113][0/3239]	Time 41.470 (41.470)	Data Time 39.169 (39.169)	Loss 2.3109 (2.3109)	Entropy 0.52473 (0.52473)	Top-1 acc 67.578 (67.578)	Top-5 acc 85.547 (85.547)	lr 0.00027
Train [113][10/3239]	Time 0.236 (4.194)	Data Time 0.001 (3.562)	Loss 2.2724 (2.3722)	Entropy 0.52447 (0.52457)	Top-1 acc 68.359 (66.406)	Top-5 acc 89.453 (86.186)	lr 0.00027
Train [113][20/3239]	Time 0.337 (2.402)	Data Time 0.001 (1.867)	Loss 2.3589 (2.3701)	Entropy 0.52457 (0.52452)	Top-1 acc 69.922 (67.020)	Top-5 acc 85.938 (86.235)	lr 0.00027
Train [113][30/3239]	Time 0.241 (1.764)	Data Time 0.001 (1.265)	Loss 2.1643 (2.3672)	Entropy 0.52453 (0.52454)	Top-1 acc 70.312 (66.860)	Top-5 acc 89.844 (86.341)	lr 0.00027
Train [113][40/3239]	Time 0.240 (1.439)	Data Time 0.001 (0.957)	Loss 2.3829 (2.3698)	Entropy 0.52462 (0.52455)	Top-1 acc 64.062 (66.806)	Top-5 acc 87.109 (86.109)	lr 0.00027
Train [113][50/3239]	Time 0.235 (1.241)	Data Time 0.001 (0.770)	Loss 2.1939 (2.3622)	Entropy 0.52486 (0.52458)	Top-1 acc 69.922 (67.103)	Top-5 acc 92.578 (86.221)	lr 0.00027
Train [113][60/3239]	Time 0.245 (1.108)	Data Time 0.001 (0.644)	Loss 2.1805 (2.3665)	Entropy 0.52443 (0.52461)	Top-1 acc 69.922 (66.874)	Top-5 acc 88.281 (86.110)	lr 0.00027
Train [113][70/3239]	Time 0.249 (1.012)	Data Time 0.001 (0.554)	Loss 2.3487 (2.3601)	Entropy 0.52436 (0.52458)	Top-1 acc 68.359 (67.072)	Top-5 acc 86.719 (86.229)	lr 0.00027
Train [113][80/3239]	Time 0.236 (0.940)	Data Time 0.001 (0.485)	Loss 2.3152 (2.3588)	Entropy 0.52432 (0.52455)	Top-1 acc 69.141 (67.183)	Top-5 acc 87.109 (86.265)	lr 0.00027
Train [113][90/3239]	Time 0.337 (0.882)	Data Time 0.001 (0.432)	Loss 2.3700 (2.3609)	Entropy 0.52456 (0.52453)	Top-1 acc 69.141 (67.136)	Top-5 acc 85.156 (86.217)	lr 0.00027
Train [113][100/3239]	Time 0.241 (0.836)	Data Time 0.001 (0.390)	Loss 2.1599 (2.3601)	Entropy 0.52444 (0.52452)	Top-1 acc 72.656 (67.218)	Top-5 acc 91.797 (86.243)	lr 0.00027
Train [113][110/3239]	Time 0.269 (0.799)	Data Time 0.002 (0.355)	Loss 2.2404 (2.3529)	Entropy 0.52461 (0.52451)	Top-1 acc 70.703 (67.349)	Top-5 acc 87.891 (86.307)	lr 0.00027
Train [113][120/3239]	Time 0.230 (0.772)	Data Time 0.001 (0.325)	Loss 2.3112 (2.3476)	Entropy 0.52422 (0.52451)	Top-1 acc 68.359 (67.504)	Top-5 acc 87.891 (86.409)	lr 0.00027
Train [113][130/3239]	Time 0.230 (0.751)	Data Time 0.001 (0.301)	Loss 2.2864 (2.3435)	Entropy 0.52440 (0.52449)	Top-1 acc 69.141 (67.593)	Top-5 acc 88.672 (86.468)	lr 0.00027
Train [113][140/3239]	Time 0.270 (0.728)	Data Time 0.001 (0.280)	Loss 2.2553 (2.3389)	Entropy 0.52444 (0.52448)	Top-1 acc 69.141 (67.717)	Top-5 acc 88.281 (86.553)	lr 0.00027
Train [113][150/3239]	Time 0.253 (0.708)	Data Time 0.001 (0.261)	Loss 2.3400 (2.3387)	Entropy 0.52434 (0.52448)	Top-1 acc 71.484 (67.754)	Top-5 acc 85.156 (86.540)	lr 0.00027
Train [113][160/3239]	Time 0.231 (0.690)	Data Time 0.001 (0.245)	Loss 2.1612 (2.3344)	Entropy 0.52423 (0.52446)	Top-1 acc 73.438 (67.833)	Top-5 acc 88.672 (86.631)	lr 0.00027
Train [113][170/3239]	Time 0.235 (0.672)	Data Time 0.001 (0.231)	Loss 2.2372 (2.3359)	Entropy 0.52414 (0.52445)	Top-1 acc 67.969 (67.781)	Top-5 acc 89.844 (86.559)	lr 0.00027
Train [113][180/3239]	Time 0.238 (0.657)	Data Time 0.001 (0.218)	Loss 2.4070 (2.3391)	Entropy 0.52374 (0.52442)	Top-1 acc 65.625 (67.703)	Top-5 acc 83.203 (86.481)	lr 0.00027
Train [113][190/3239]	Time 0.232 (0.644)	Data Time 0.001 (0.207)	Loss 2.5261 (2.3387)	Entropy 0.52390 (0.52439)	Top-1 acc 62.109 (67.717)	Top-5 acc 83.594 (86.500)	lr 0.00027
Train [113][200/3239]	Time 0.230 (0.632)	Data Time 0.001 (0.196)	Loss 2.1712 (2.3354)	Entropy 0.52398 (0.52436)	Top-1 acc 74.219 (67.840)	Top-5 acc 91.406 (86.575)	lr 0.00027
Train [113][210/3239]	Time 0.324 (0.624)	Data Time 0.001 (0.187)	Loss 2.4509 (2.3351)	Entropy 0.52392 (0.52434)	Top-1 acc 66.406 (67.874)	Top-5 acc 84.766 (86.576)	lr 0.00027
Train [113][220/3239]	Time 0.235 (0.615)	Data Time 0.001 (0.179)	Loss 2.3708 (2.3390)	Entropy 0.52395 (0.52432)	Top-1 acc 67.578 (67.790)	Top-5 acc 86.328 (86.512)	lr 0.00027
Train [113][230/3239]	Time 0.231 (0.607)	Data Time 0.001 (0.171)	Loss 2.3402 (2.3428)	Entropy 0.52432 (0.52431)	Top-1 acc 71.094 (67.705)	Top-5 acc 87.109 (86.484)	lr 0.00027
Train [113][240/3239]	Time 0.223 (0.599)	Data Time 0.001 (0.164)	Loss 2.2806 (2.3402)	Entropy 0.52436 (0.52432)	Top-1 acc 67.188 (67.732)	Top-5 acc 87.891 (86.519)	lr 0.00027
Train [113][250/3239]	Time 0.311 (0.592)	Data Time 0.001 (0.158)	Loss 2.3588 (2.3392)	Entropy 0.52442 (0.52432)	Top-1 acc 68.750 (67.782)	Top-5 acc 87.109 (86.540)	lr 0.00027
Train [113][260/3239]	Time 0.226 (0.584)	Data Time 0.001 (0.152)	Loss 2.3013 (2.3415)	Entropy 0.52448 (0.52432)	Top-1 acc 69.141 (67.740)	Top-5 acc 87.500 (86.529)	lr 0.00027
Train [113][270/3239]	Time 0.218 (0.578)	Data Time 0.001 (0.146)	Loss 2.5907 (2.3420)	Entropy 0.52442 (0.52433)	Top-1 acc 62.891 (67.691)	Top-5 acc 85.938 (86.546)	lr 0.00027
Train [113][280/3239]	Time 0.233 (0.573)	Data Time 0.001 (0.141)	Loss 2.2736 (2.3397)	Entropy 0.52467 (0.52433)	Top-1 acc 67.969 (67.755)	Top-5 acc 86.328 (86.588)	lr 0.00027
Train [113][290/3239]	Time 0.237 (0.568)	Data Time 0.001 (0.136)	Loss 2.2481 (2.3394)	Entropy 0.52476 (0.52434)	Top-1 acc 68.359 (67.781)	Top-5 acc 87.500 (86.576)	lr 0.00027
Train [113][300/3239]	Time 0.240 (0.563)	Data Time 0.001 (0.132)	Loss 2.4679 (2.3387)	Entropy 0.52509 (0.52436)	Top-1 acc 66.406 (67.779)	Top-5 acc 80.859 (86.585)	lr 0.00027
Train [113][310/3239]	Time 0.232 (0.558)	Data Time 0.001 (0.128)	Loss 2.2805 (2.3371)	Entropy 0.52531 (0.52439)	Top-1 acc 69.141 (67.807)	Top-5 acc 88.281 (86.606)	lr 0.00027
Train [113][320/3239]	Time 0.338 (0.554)	Data Time 0.001 (0.124)	Loss 2.5960 (2.3382)	Entropy 0.52529 (0.52442)	Top-1 acc 62.891 (67.775)	Top-5 acc 83.594 (86.584)	lr 0.00027
Train [113][330/3239]	Time 0.234 (0.549)	Data Time 0.001 (0.120)	Loss 2.3926 (2.3383)	Entropy 0.52525 (0.52444)	Top-1 acc 69.531 (67.760)	Top-5 acc 84.766 (86.590)	lr 0.00027
Train [113][340/3239]	Time 0.236 (0.545)	Data Time 0.001 (0.117)	Loss 2.3728 (2.3375)	Entropy 0.52529 (0.52447)	Top-1 acc 67.188 (67.792)	Top-5 acc 86.719 (86.592)	lr 0.00027
Train [113][350/3239]	Time 0.240 (0.541)	Data Time 0.001 (0.113)	Loss 2.4213 (2.3385)	Entropy 0.52479 (0.52448)	Top-1 acc 67.578 (67.763)	Top-5 acc 83.203 (86.570)	lr 0.00027
Train [113][360/3239]	Time 0.229 (0.537)	Data Time 0.001 (0.110)	Loss 2.3258 (2.3391)	Entropy 0.52499 (0.52449)	Top-1 acc 67.969 (67.729)	Top-5 acc 86.719 (86.539)	lr 0.00027
Train [113][370/3239]	Time 0.236 (0.534)	Data Time 0.001 (0.107)	Loss 2.3113 (2.3390)	Entropy 0.52437 (0.52450)	Top-1 acc 67.188 (67.754)	Top-5 acc 87.891 (86.540)	lr 0.00027
Train [113][380/3239]	Time 0.247 (0.531)	Data Time 0.001 (0.105)	Loss 2.3303 (2.3389)	Entropy 0.52414 (0.52450)	Top-1 acc 67.969 (67.763)	Top-5 acc 83.594 (86.535)	lr 0.00027
Train [113][390/3239]	Time 0.240 (0.528)	Data Time 0.001 (0.102)	Loss 2.2778 (2.3390)	Entropy 0.52447 (0.52449)	Top-1 acc 66.016 (67.773)	Top-5 acc 87.500 (86.497)	lr 0.00027
Train [113][400/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.099)	Loss 2.2927 (2.3410)	Entropy 0.52469 (0.52449)	Top-1 acc 71.094 (67.723)	Top-5 acc 87.891 (86.469)	lr 0.00026
Train [113][410/3239]	Time 0.343 (0.522)	Data Time 0.001 (0.097)	Loss 2.2909 (2.3415)	Entropy 0.52492 (0.52450)	Top-1 acc 69.531 (67.700)	Top-5 acc 87.500 (86.455)	lr 0.00026
Train [113][420/3239]	Time 0.308 (0.521)	Data Time 0.002 (0.095)	Loss 2.0478 (2.3407)	Entropy 0.52455 (0.52451)	Top-1 acc 76.172 (67.721)	Top-5 acc 91.016 (86.468)	lr 0.00026
Train [113][430/3239]	Time 0.299 (0.524)	Data Time 0.002 (0.093)	Loss 2.1966 (2.3411)	Entropy 0.52468 (0.52451)	Top-1 acc 75.781 (67.718)	Top-5 acc 88.281 (86.466)	lr 0.00026
Train [113][440/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.091)	Loss 2.3551 (2.3423)	Entropy 0.52475 (0.52451)	Top-1 acc 66.797 (67.681)	Top-5 acc 86.328 (86.445)	lr 0.00026
Train [113][450/3239]	Time 0.222 (0.519)	Data Time 0.001 (0.089)	Loss 2.3617 (2.3416)	Entropy 0.52514 (0.52452)	Top-1 acc 69.141 (67.709)	Top-5 acc 87.109 (86.466)	lr 0.00026
Train [113][460/3239]	Time 0.227 (0.516)	Data Time 0.001 (0.087)	Loss 2.3774 (2.3409)	Entropy 0.52508 (0.52453)	Top-1 acc 66.406 (67.741)	Top-5 acc 84.766 (86.461)	lr 0.00026
Train [113][470/3239]	Time 0.225 (0.514)	Data Time 0.001 (0.085)	Loss 2.2520 (2.3411)	Entropy 0.52509 (0.52454)	Top-1 acc 71.484 (67.751)	Top-5 acc 88.281 (86.456)	lr 0.00026
Train [113][480/3239]	Time 0.321 (0.511)	Data Time 0.001 (0.083)	Loss 2.3740 (2.3418)	Entropy 0.52493 (0.52455)	Top-1 acc 67.578 (67.752)	Top-5 acc 85.547 (86.443)	lr 0.00026
Train [113][490/3239]	Time 0.247 (0.510)	Data Time 0.001 (0.082)	Loss 2.4992 (2.3418)	Entropy 0.52517 (0.52456)	Top-1 acc 62.500 (67.741)	Top-5 acc 84.766 (86.442)	lr 0.00026
Train [113][500/3239]	Time 0.226 (0.508)	Data Time 0.001 (0.080)	Loss 2.4909 (2.3434)	Entropy 0.52546 (0.52458)	Top-1 acc 64.844 (67.710)	Top-5 acc 83.594 (86.414)	lr 0.00026
Train [113][510/3239]	Time 0.249 (0.506)	Data Time 0.001 (0.078)	Loss 2.2032 (2.3430)	Entropy 0.52536 (0.52459)	Top-1 acc 70.312 (67.697)	Top-5 acc 88.672 (86.416)	lr 0.00026
Train [113][520/3239]	Time 0.234 (0.504)	Data Time 0.001 (0.077)	Loss 2.4981 (2.3429)	Entropy 0.52557 (0.52461)	Top-1 acc 65.625 (67.701)	Top-5 acc 83.984 (86.417)	lr 0.00026
Train [113][530/3239]	Time 0.273 (0.502)	Data Time 0.002 (0.076)	Loss 2.1919 (2.3422)	Entropy 0.52556 (0.52463)	Top-1 acc 70.703 (67.719)	Top-5 acc 88.281 (86.436)	lr 0.00026
Train [113][540/3239]	Time 0.241 (0.500)	Data Time 0.001 (0.074)	Loss 2.2858 (2.3428)	Entropy 0.52595 (0.52465)	Top-1 acc 72.266 (67.724)	Top-5 acc 86.719 (86.423)	lr 0.00026
Train [113][550/3239]	Time 0.244 (0.499)	Data Time 0.002 (0.073)	Loss 2.4097 (2.3430)	Entropy 0.52593 (0.52467)	Top-1 acc 65.234 (67.708)	Top-5 acc 86.719 (86.412)	lr 0.00026
Train [113][560/3239]	Time 0.230 (0.498)	Data Time 0.001 (0.072)	Loss 2.5012 (2.3425)	Entropy 0.52607 (0.52469)	Top-1 acc 66.016 (67.717)	Top-5 acc 84.766 (86.427)	lr 0.00026
Train [113][570/3239]	Time 0.243 (0.496)	Data Time 0.001 (0.070)	Loss 2.2171 (2.3422)	Entropy 0.52614 (0.52472)	Top-1 acc 69.922 (67.728)	Top-5 acc 86.328 (86.423)	lr 0.00026
Train [113][580/3239]	Time 0.227 (0.494)	Data Time 0.001 (0.069)	Loss 2.2460 (2.3422)	Entropy 0.52615 (0.52474)	Top-1 acc 68.359 (67.725)	Top-5 acc 88.281 (86.424)	lr 0.00026
Train [113][590/3239]	Time 0.227 (0.493)	Data Time 0.001 (0.068)	Loss 2.3818 (2.3431)	Entropy 0.52610 (0.52476)	Top-1 acc 66.406 (67.686)	Top-5 acc 86.719 (86.413)	lr 0.00026
Train [113][600/3239]	Time 0.230 (0.491)	Data Time 0.001 (0.067)	Loss 2.5576 (2.3434)	Entropy 0.52621 (0.52479)	Top-1 acc 60.547 (67.668)	Top-5 acc 85.156 (86.408)	lr 0.00026
Train [113][610/3239]	Time 0.245 (0.490)	Data Time 0.001 (0.066)	Loss 2.4462 (2.3448)	Entropy 0.52621 (0.52481)	Top-1 acc 63.281 (67.621)	Top-5 acc 84.766 (86.399)	lr 0.00026
Train [113][620/3239]	Time 0.274 (0.574)	Data Time 0.002 (0.065)	Loss 2.4271 (2.3449)	Entropy 0.52624 (0.52483)	Top-1 acc 65.625 (67.612)	Top-5 acc 85.547 (86.400)	lr 0.00026
Train [113][630/3239]	Time 0.257 (0.571)	Data Time 0.002 (0.064)	Loss 2.2584 (2.3455)	Entropy 0.52589 (0.52485)	Top-1 acc 72.266 (67.615)	Top-5 acc 88.281 (86.386)	lr 0.00026
Train [113][640/3239]	Time 0.364 (0.569)	Data Time 0.002 (0.063)	Loss 2.4555 (2.3460)	Entropy 0.52586 (0.52487)	Top-1 acc 66.797 (67.620)	Top-5 acc 85.156 (86.384)	lr 0.00026
Train [113][650/3239]	Time 0.244 (0.567)	Data Time 0.002 (0.062)	Loss 2.2686 (2.3450)	Entropy 0.52624 (0.52488)	Top-1 acc 68.750 (67.654)	Top-5 acc 89.062 (86.401)	lr 0.00026
Train [113][660/3239]	Time 0.234 (0.565)	Data Time 0.001 (0.061)	Loss 2.4399 (2.3458)	Entropy 0.52642 (0.52491)	Top-1 acc 64.844 (67.638)	Top-5 acc 85.938 (86.395)	lr 0.00026
Train [113][670/3239]	Time 0.233 (0.563)	Data Time 0.001 (0.060)	Loss 2.2640 (2.3456)	Entropy 0.52645 (0.52493)	Top-1 acc 72.656 (67.635)	Top-5 acc 90.234 (86.397)	lr 0.00026
Train [113][680/3239]	Time 0.229 (0.561)	Data Time 0.001 (0.059)	Loss 2.4606 (2.3466)	Entropy 0.52672 (0.52495)	Top-1 acc 62.500 (67.602)	Top-5 acc 82.031 (86.375)	lr 0.00026
Train [113][690/3239]	Time 0.258 (0.559)	Data Time 0.001 (0.059)	Loss 2.4972 (2.3477)	Entropy 0.52673 (0.52498)	Top-1 acc 63.281 (67.580)	Top-5 acc 84.766 (86.354)	lr 0.00026
Train [113][700/3239]	Time 0.229 (0.557)	Data Time 0.001 (0.058)	Loss 2.4403 (2.3477)	Entropy 0.52667 (0.52500)	Top-1 acc 64.453 (67.592)	Top-5 acc 83.594 (86.354)	lr 0.00026
Train [113][710/3239]	Time 0.244 (0.555)	Data Time 0.002 (0.057)	Loss 2.2120 (2.3466)	Entropy 0.52657 (0.52502)	Top-1 acc 70.312 (67.625)	Top-5 acc 88.281 (86.364)	lr 0.00026
Train [113][720/3239]	Time 0.230 (0.553)	Data Time 0.001 (0.056)	Loss 2.2700 (2.3465)	Entropy 0.52619 (0.52504)	Top-1 acc 70.312 (67.644)	Top-5 acc 87.891 (86.369)	lr 0.00026
Train [113][730/3239]	Time 0.340 (0.551)	Data Time 0.001 (0.055)	Loss 2.3716 (2.3466)	Entropy 0.52631 (0.52506)	Top-1 acc 67.578 (67.649)	Top-5 acc 88.672 (86.366)	lr 0.00026
Train [113][740/3239]	Time 0.237 (0.550)	Data Time 0.001 (0.055)	Loss 2.2664 (2.3463)	Entropy 0.52627 (0.52508)	Top-1 acc 70.703 (67.654)	Top-5 acc 88.672 (86.374)	lr 0.00026
Train [113][750/3239]	Time 0.243 (0.548)	Data Time 0.001 (0.054)	Loss 2.1530 (2.3467)	Entropy 0.52599 (0.52509)	Top-1 acc 69.531 (67.635)	Top-5 acc 91.797 (86.373)	lr 0.00026
Train [113][760/3239]	Time 0.241 (0.547)	Data Time 0.001 (0.053)	Loss 2.3085 (2.3470)	Entropy 0.52626 (0.52510)	Top-1 acc 66.016 (67.632)	Top-5 acc 87.891 (86.370)	lr 0.00026
Train [113][770/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.053)	Loss 2.5328 (2.3479)	Entropy 0.52585 (0.52512)	Top-1 acc 62.891 (67.617)	Top-5 acc 81.641 (86.352)	lr 0.00026
Train [113][780/3239]	Time 0.235 (0.543)	Data Time 0.001 (0.052)	Loss 2.3284 (2.3473)	Entropy 0.52601 (0.52513)	Top-1 acc 69.922 (67.621)	Top-5 acc 85.156 (86.357)	lr 0.00026
Train [113][790/3239]	Time 0.230 (0.542)	Data Time 0.001 (0.051)	Loss 2.3488 (2.3483)	Entropy 0.52608 (0.52514)	Top-1 acc 67.969 (67.601)	Top-5 acc 87.891 (86.340)	lr 0.00026
Train [113][800/3239]	Time 0.319 (0.540)	Data Time 0.001 (0.051)	Loss 2.2763 (2.3486)	Entropy 0.52593 (0.52515)	Top-1 acc 67.188 (67.592)	Top-5 acc 89.062 (86.334)	lr 0.00026
Train [113][810/3239]	Time 0.227 (0.538)	Data Time 0.001 (0.050)	Loss 2.2330 (2.3478)	Entropy 0.52618 (0.52516)	Top-1 acc 69.531 (67.606)	Top-5 acc 90.234 (86.349)	lr 0.00026
Train [113][820/3239]	Time 0.225 (0.537)	Data Time 0.001 (0.050)	Loss 2.2615 (2.3481)	Entropy 0.52618 (0.52517)	Top-1 acc 68.750 (67.606)	Top-5 acc 87.500 (86.336)	lr 0.00026
Train [113][830/3239]	Time 0.235 (0.535)	Data Time 0.001 (0.049)	Loss 2.5737 (2.3486)	Entropy 0.52619 (0.52519)	Top-1 acc 63.281 (67.603)	Top-5 acc 84.766 (86.321)	lr 0.00026
Train [113][840/3239]	Time 0.224 (0.534)	Data Time 0.001 (0.048)	Loss 2.3835 (2.3489)	Entropy 0.52591 (0.52520)	Top-1 acc 66.797 (67.588)	Top-5 acc 85.938 (86.322)	lr 0.00026
Train [113][850/3239]	Time 0.225 (0.532)	Data Time 0.001 (0.048)	Loss 2.4710 (2.3500)	Entropy 0.52577 (0.52520)	Top-1 acc 66.016 (67.568)	Top-5 acc 85.938 (86.301)	lr 0.00026
Train [113][860/3239]	Time 0.254 (0.531)	Data Time 0.001 (0.047)	Loss 2.1896 (2.3497)	Entropy 0.52615 (0.52521)	Top-1 acc 73.438 (67.563)	Top-5 acc 88.672 (86.309)	lr 0.00026
Train [113][870/3239]	Time 0.259 (0.530)	Data Time 0.002 (0.047)	Loss 2.2641 (2.3496)	Entropy 0.52644 (0.52522)	Top-1 acc 73.438 (67.572)	Top-5 acc 85.547 (86.310)	lr 0.00026
Train [113][880/3239]	Time 0.235 (0.529)	Data Time 0.004 (0.046)	Loss 2.3451 (2.3498)	Entropy 0.52632 (0.52524)	Top-1 acc 69.531 (67.572)	Top-5 acc 85.938 (86.308)	lr 0.00025
Train [113][890/3239]	Time 0.233 (0.528)	Data Time 0.001 (0.046)	Loss 2.4989 (2.3508)	Entropy 0.52613 (0.52525)	Top-1 acc 65.234 (67.553)	Top-5 acc 84.766 (86.289)	lr 0.00025
Train [113][900/3239]	Time 0.263 (0.527)	Data Time 0.001 (0.045)	Loss 2.1657 (2.3500)	Entropy 0.52591 (0.52526)	Top-1 acc 67.969 (67.570)	Top-5 acc 93.359 (86.306)	lr 0.00025
Train [113][910/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.045)	Loss 2.3440 (2.3498)	Entropy 0.52576 (0.52526)	Top-1 acc 68.359 (67.573)	Top-5 acc 83.594 (86.309)	lr 0.00025
Train [113][920/3239]	Time 0.233 (0.524)	Data Time 0.001 (0.044)	Loss 2.2501 (2.3498)	Entropy 0.52570 (0.52527)	Top-1 acc 67.578 (67.570)	Top-5 acc 85.938 (86.314)	lr 0.00025
Train [113][930/3239]	Time 0.283 (0.524)	Data Time 0.002 (0.044)	Loss 2.5391 (2.3499)	Entropy 0.52581 (0.52527)	Top-1 acc 61.328 (67.565)	Top-5 acc 84.375 (86.326)	lr 0.00025
Train [113][940/3239]	Time 0.294 (0.524)	Data Time 0.002 (0.044)	Loss 2.2891 (2.3495)	Entropy 0.52604 (0.52528)	Top-1 acc 70.703 (67.567)	Top-5 acc 86.328 (86.329)	lr 0.00025
Train [113][950/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.043)	Loss 2.4592 (2.3499)	Entropy 0.52613 (0.52529)	Top-1 acc 63.281 (67.555)	Top-5 acc 84.375 (86.320)	lr 0.00025
Train [113][960/3239]	Time 0.326 (0.522)	Data Time 0.001 (0.043)	Loss 2.2772 (2.3499)	Entropy 0.52603 (0.52530)	Top-1 acc 68.359 (67.553)	Top-5 acc 88.281 (86.326)	lr 0.00025
Train [113][970/3239]	Time 0.226 (0.521)	Data Time 0.001 (0.042)	Loss 2.2712 (2.3498)	Entropy 0.52606 (0.52530)	Top-1 acc 71.094 (67.550)	Top-5 acc 85.938 (86.327)	lr 0.00025
Train [113][980/3239]	Time 0.226 (0.520)	Data Time 0.001 (0.042)	Loss 2.5205 (2.3502)	Entropy 0.52625 (0.52531)	Top-1 acc 65.234 (67.539)	Top-5 acc 86.719 (86.328)	lr 0.00025
Train [113][990/3239]	Time 0.230 (0.519)	Data Time 0.001 (0.041)	Loss 2.3454 (2.3506)	Entropy 0.52643 (0.52532)	Top-1 acc 68.359 (67.534)	Top-5 acc 84.375 (86.315)	lr 0.00025
Train [113][1000/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.041)	Loss 2.1907 (2.3509)	Entropy 0.52670 (0.52533)	Top-1 acc 70.312 (67.521)	Top-5 acc 90.625 (86.313)	lr 0.00025
Train [113][1010/3239]	Time 0.233 (0.516)	Data Time 0.001 (0.041)	Loss 2.4320 (2.3505)	Entropy 0.52658 (0.52535)	Top-1 acc 67.188 (67.527)	Top-5 acc 83.984 (86.322)	lr 0.00025
Train [113][1020/3239]	Time 0.328 (0.516)	Data Time 0.002 (0.040)	Loss 2.2186 (2.3500)	Entropy 0.52657 (0.52536)	Top-1 acc 69.922 (67.544)	Top-5 acc 89.062 (86.327)	lr 0.00025
Train [113][1030/3239]	Time 0.319 (0.517)	Data Time 0.001 (0.040)	Loss 2.2946 (2.3499)	Entropy 0.52678 (0.52537)	Top-1 acc 70.703 (67.552)	Top-5 acc 85.547 (86.328)	lr 0.00025
Train [113][1040/3239]	Time 0.227 (0.516)	Data Time 0.001 (0.039)	Loss 2.3210 (2.3501)	Entropy 0.52683 (0.52539)	Top-1 acc 67.969 (67.563)	Top-5 acc 86.719 (86.324)	lr 0.00025
Train [113][1050/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.039)	Loss 2.2013 (2.3496)	Entropy 0.52691 (0.52540)	Top-1 acc 70.703 (67.566)	Top-5 acc 89.062 (86.342)	lr 0.00025
Train [113][1060/3239]	Time 0.247 (0.515)	Data Time 0.001 (0.039)	Loss 2.2739 (2.3493)	Entropy 0.52669 (0.52541)	Top-1 acc 71.484 (67.571)	Top-5 acc 87.109 (86.345)	lr 0.00025
Train [113][1070/3239]	Time 0.265 (0.514)	Data Time 0.001 (0.038)	Loss 2.2467 (2.3493)	Entropy 0.52672 (0.52542)	Top-1 acc 68.359 (67.565)	Top-5 acc 87.891 (86.346)	lr 0.00025
Train [113][1080/3239]	Time 0.236 (0.513)	Data Time 0.001 (0.038)	Loss 2.3629 (2.3492)	Entropy 0.52688 (0.52543)	Top-1 acc 68.750 (67.554)	Top-5 acc 84.375 (86.343)	lr 0.00025
Train [113][1090/3239]	Time 0.240 (0.512)	Data Time 0.001 (0.038)	Loss 2.3261 (2.3493)	Entropy 0.52673 (0.52545)	Top-1 acc 67.969 (67.563)	Top-5 acc 86.719 (86.339)	lr 0.00025
Train [113][1100/3239]	Time 0.237 (0.511)	Data Time 0.001 (0.037)	Loss 2.1323 (2.3486)	Entropy 0.52686 (0.52546)	Top-1 acc 72.656 (67.581)	Top-5 acc 90.625 (86.355)	lr 0.00025
Train [113][1110/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.037)	Loss 2.8314 (2.3488)	Entropy 0.52674 (0.52547)	Top-1 acc 61.328 (67.584)	Top-5 acc 78.906 (86.353)	lr 0.00025
Train [113][1120/3239]	Time 0.238 (0.509)	Data Time 0.001 (0.037)	Loss 2.2892 (2.3490)	Entropy 0.52671 (0.52548)	Top-1 acc 67.188 (67.574)	Top-5 acc 88.281 (86.354)	lr 0.00025
Train [113][1130/3239]	Time 0.233 (0.508)	Data Time 0.001 (0.036)	Loss 2.2523 (2.3488)	Entropy 0.52646 (0.52549)	Top-1 acc 71.875 (67.579)	Top-5 acc 89.062 (86.360)	lr 0.00025
Train [113][1140/3239]	Time 0.241 (0.507)	Data Time 0.001 (0.036)	Loss 2.2672 (2.3484)	Entropy 0.52629 (0.52550)	Top-1 acc 68.359 (67.579)	Top-5 acc 91.016 (86.369)	lr 0.00025
Train [113][1150/3239]	Time 0.231 (0.506)	Data Time 0.001 (0.036)	Loss 2.3753 (2.3478)	Entropy 0.52661 (0.52551)	Top-1 acc 64.062 (67.583)	Top-5 acc 86.328 (86.377)	lr 0.00025
Train [113][1160/3239]	Time 0.227 (0.505)	Data Time 0.001 (0.036)	Loss 2.2203 (2.3483)	Entropy 0.52652 (0.52552)	Top-1 acc 71.094 (67.573)	Top-5 acc 87.500 (86.371)	lr 0.00025
Train [113][1170/3239]	Time 0.229 (0.505)	Data Time 0.001 (0.035)	Loss 2.1934 (2.3486)	Entropy 0.52633 (0.52553)	Top-1 acc 75.391 (67.564)	Top-5 acc 89.062 (86.372)	lr 0.00025
Train [113][1180/3239]	Time 0.235 (0.504)	Data Time 0.001 (0.035)	Loss 2.2051 (2.3481)	Entropy 0.52645 (0.52553)	Top-1 acc 68.750 (67.571)	Top-5 acc 89.453 (86.380)	lr 0.00025
Train [113][1190/3239]	Time 0.364 (0.503)	Data Time 0.001 (0.035)	Loss 2.2958 (2.3485)	Entropy 0.52622 (0.52554)	Top-1 acc 69.141 (67.556)	Top-5 acc 85.156 (86.371)	lr 0.00025
Train [113][1200/3239]	Time 0.255 (0.502)	Data Time 0.001 (0.034)	Loss 2.4501 (2.3489)	Entropy 0.52590 (0.52555)	Top-1 acc 64.453 (67.547)	Top-5 acc 82.422 (86.356)	lr 0.00025
Train [113][1210/3239]	Time 0.243 (0.502)	Data Time 0.001 (0.034)	Loss 2.1984 (2.3492)	Entropy 0.52578 (0.52555)	Top-1 acc 74.609 (67.540)	Top-5 acc 88.281 (86.351)	lr 0.00025
Train [113][1220/3239]	Time 0.241 (0.501)	Data Time 0.002 (0.034)	Loss 2.2068 (2.3489)	Entropy 0.52599 (0.52555)	Top-1 acc 68.750 (67.544)	Top-5 acc 89.062 (86.355)	lr 0.00025
Train [113][1230/3239]	Time 0.234 (0.500)	Data Time 0.002 (0.034)	Loss 2.2795 (2.3490)	Entropy 0.52621 (0.52555)	Top-1 acc 70.703 (67.537)	Top-5 acc 87.500 (86.357)	lr 0.00025
Train [113][1240/3239]	Time 0.234 (0.500)	Data Time 0.001 (0.033)	Loss 2.3146 (2.3485)	Entropy 0.52621 (0.52556)	Top-1 acc 70.312 (67.550)	Top-5 acc 85.547 (86.362)	lr 0.00025
Train [113][1250/3239]	Time 0.234 (0.499)	Data Time 0.001 (0.033)	Loss 2.3194 (2.3481)	Entropy 0.52638 (0.52557)	Top-1 acc 66.797 (67.561)	Top-5 acc 87.891 (86.364)	lr 0.00025
Train [113][1260/3239]	Time 0.325 (0.499)	Data Time 0.001 (0.033)	Loss 2.0832 (2.3484)	Entropy 0.52635 (0.52557)	Top-1 acc 74.609 (67.556)	Top-5 acc 90.234 (86.354)	lr 0.00025
Train [113][1270/3239]	Time 0.393 (0.537)	Data Time 0.006 (0.033)	Loss 2.2830 (2.3482)	Entropy 0.52651 (0.52558)	Top-1 acc 68.359 (67.566)	Top-5 acc 89.062 (86.358)	lr 0.00025
Train [113][1280/3239]	Time 0.273 (0.537)	Data Time 0.004 (0.032)	Loss 2.4221 (2.3479)	Entropy 0.52664 (0.52559)	Top-1 acc 65.234 (67.575)	Top-5 acc 86.719 (86.357)	lr 0.00025
Train [113][1290/3239]	Time 0.236 (0.536)	Data Time 0.001 (0.032)	Loss 2.4203 (2.3479)	Entropy 0.52670 (0.52560)	Top-1 acc 67.188 (67.578)	Top-5 acc 85.938 (86.356)	lr 0.00025
Train [113][1300/3239]	Time 0.254 (0.535)	Data Time 0.001 (0.032)	Loss 2.6233 (2.3481)	Entropy 0.52648 (0.52561)	Top-1 acc 62.109 (67.577)	Top-5 acc 81.641 (86.350)	lr 0.00025
Train [113][1310/3239]	Time 0.235 (0.534)	Data Time 0.001 (0.032)	Loss 2.2656 (2.3481)	Entropy 0.52615 (0.52561)	Top-1 acc 68.359 (67.572)	Top-5 acc 86.328 (86.350)	lr 0.00025
Train [113][1320/3239]	Time 0.231 (0.533)	Data Time 0.001 (0.031)	Loss 2.2832 (2.3482)	Entropy 0.52639 (0.52562)	Top-1 acc 70.703 (67.571)	Top-5 acc 87.109 (86.344)	lr 0.00025
Train [113][1330/3239]	Time 0.241 (0.533)	Data Time 0.001 (0.031)	Loss 2.1120 (2.3483)	Entropy 0.52630 (0.52562)	Top-1 acc 71.094 (67.563)	Top-5 acc 91.406 (86.343)	lr 0.00025
Train [113][1340/3239]	Time 0.236 (0.532)	Data Time 0.001 (0.031)	Loss 2.4173 (2.3484)	Entropy 0.52625 (0.52563)	Top-1 acc 66.016 (67.558)	Top-5 acc 84.375 (86.336)	lr 0.00025
Train [113][1350/3239]	Time 0.330 (0.532)	Data Time 0.001 (0.031)	Loss 2.3757 (2.3483)	Entropy 0.52666 (0.52563)	Top-1 acc 67.188 (67.567)	Top-5 acc 83.594 (86.332)	lr 0.00025
Train [113][1360/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.031)	Loss 2.2972 (2.3486)	Entropy 0.52693 (0.52564)	Top-1 acc 67.578 (67.554)	Top-5 acc 86.328 (86.321)	lr 0.00025
Train [113][1370/3239]	Time 0.242 (0.530)	Data Time 0.001 (0.030)	Loss 2.2450 (2.3485)	Entropy 0.52708 (0.52565)	Top-1 acc 73.047 (67.557)	Top-5 acc 89.453 (86.318)	lr 0.00025
Train [113][1380/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.030)	Loss 2.2340 (2.3481)	Entropy 0.52727 (0.52566)	Top-1 acc 70.312 (67.569)	Top-5 acc 89.062 (86.328)	lr 0.00024
Train [113][1390/3239]	Time 0.230 (0.528)	Data Time 0.001 (0.030)	Loss 2.2267 (2.3481)	Entropy 0.52740 (0.52567)	Top-1 acc 70.703 (67.569)	Top-5 acc 89.453 (86.329)	lr 0.00024
Train [113][1400/3239]	Time 0.268 (0.528)	Data Time 0.001 (0.030)	Loss 2.1579 (2.3484)	Entropy 0.52750 (0.52569)	Top-1 acc 69.141 (67.559)	Top-5 acc 90.234 (86.326)	lr 0.00024
Train [113][1410/3239]	Time 0.235 (0.527)	Data Time 0.001 (0.030)	Loss 2.1850 (2.3483)	Entropy 0.52727 (0.52570)	Top-1 acc 67.188 (67.557)	Top-5 acc 90.625 (86.333)	lr 0.00024
Train [113][1420/3239]	Time 0.307 (0.526)	Data Time 0.001 (0.029)	Loss 2.5671 (2.3485)	Entropy 0.52740 (0.52571)	Top-1 acc 62.891 (67.552)	Top-5 acc 81.641 (86.327)	lr 0.00024
Train [113][1430/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.029)	Loss 2.1532 (2.3484)	Entropy 0.52745 (0.52572)	Top-1 acc 69.531 (67.556)	Top-5 acc 90.625 (86.331)	lr 0.00024
Train [113][1440/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.029)	Loss 2.4901 (2.3480)	Entropy 0.52744 (0.52573)	Top-1 acc 63.281 (67.570)	Top-5 acc 81.250 (86.332)	lr 0.00024
Train [113][1450/3239]	Time 0.231 (0.523)	Data Time 0.001 (0.029)	Loss 2.2148 (2.3471)	Entropy 0.52762 (0.52575)	Top-1 acc 72.266 (67.597)	Top-5 acc 89.062 (86.346)	lr 0.00024
Train [113][1460/3239]	Time 0.244 (0.523)	Data Time 0.001 (0.029)	Loss 2.4415 (2.3465)	Entropy 0.52767 (0.52576)	Top-1 acc 65.234 (67.610)	Top-5 acc 84.766 (86.359)	lr 0.00024
Train [113][1470/3239]	Time 0.238 (0.522)	Data Time 0.001 (0.028)	Loss 2.3965 (2.3464)	Entropy 0.52766 (0.52577)	Top-1 acc 65.234 (67.611)	Top-5 acc 86.719 (86.357)	lr 0.00024
Train [113][1480/3239]	Time 0.228 (0.521)	Data Time 0.001 (0.028)	Loss 2.4410 (2.3466)	Entropy 0.52760 (0.52579)	Top-1 acc 63.672 (67.608)	Top-5 acc 84.766 (86.351)	lr 0.00024
Train [113][1490/3239]	Time 0.249 (0.520)	Data Time 0.001 (0.028)	Loss 2.3225 (2.3465)	Entropy 0.52750 (0.52580)	Top-1 acc 66.406 (67.612)	Top-5 acc 88.281 (86.354)	lr 0.00024
Train [113][1500/3239]	Time 0.224 (0.520)	Data Time 0.001 (0.028)	Loss 2.5093 (2.3461)	Entropy 0.52821 (0.52581)	Top-1 acc 64.453 (67.624)	Top-5 acc 84.375 (86.360)	lr 0.00024
Train [113][1510/3239]	Time 0.320 (0.519)	Data Time 0.001 (0.028)	Loss 2.3009 (2.3461)	Entropy 0.52845 (0.52583)	Top-1 acc 68.750 (67.618)	Top-5 acc 85.938 (86.358)	lr 0.00024
Train [113][1520/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.028)	Loss 2.6597 (2.3462)	Entropy 0.52869 (0.52584)	Top-1 acc 60.547 (67.615)	Top-5 acc 80.469 (86.354)	lr 0.00024
Train [113][1530/3239]	Time 0.235 (0.518)	Data Time 0.001 (0.027)	Loss 2.2023 (2.3454)	Entropy 0.52887 (0.52586)	Top-1 acc 70.703 (67.632)	Top-5 acc 90.625 (86.369)	lr 0.00024
Train [113][1540/3239]	Time 0.244 (0.517)	Data Time 0.001 (0.027)	Loss 2.1084 (2.3453)	Entropy 0.52885 (0.52588)	Top-1 acc 71.875 (67.642)	Top-5 acc 89.844 (86.371)	lr 0.00024
Train [113][1550/3239]	Time 0.294 (0.516)	Data Time 0.001 (0.027)	Loss 2.2915 (2.3452)	Entropy 0.52881 (0.52590)	Top-1 acc 68.750 (67.648)	Top-5 acc 90.234 (86.379)	lr 0.00024
Train [113][1560/3239]	Time 0.226 (0.516)	Data Time 0.001 (0.027)	Loss 2.4602 (2.3452)	Entropy 0.52897 (0.52592)	Top-1 acc 67.188 (67.655)	Top-5 acc 83.594 (86.378)	lr 0.00024
Train [113][1570/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.027)	Loss 2.2073 (2.3448)	Entropy 0.52887 (0.52594)	Top-1 acc 69.531 (67.658)	Top-5 acc 91.016 (86.389)	lr 0.00024
Train [113][1580/3239]	Time 0.336 (0.515)	Data Time 0.001 (0.027)	Loss 2.4096 (2.3450)	Entropy 0.52872 (0.52596)	Top-1 acc 64.844 (67.651)	Top-5 acc 85.938 (86.386)	lr 0.00024
Train [113][1590/3239]	Time 0.252 (0.514)	Data Time 0.001 (0.026)	Loss 2.3835 (2.3451)	Entropy 0.52892 (0.52598)	Top-1 acc 65.625 (67.647)	Top-5 acc 84.375 (86.388)	lr 0.00024
Train [113][1600/3239]	Time 0.239 (0.513)	Data Time 0.001 (0.026)	Loss 2.3400 (2.3455)	Entropy 0.52917 (0.52599)	Top-1 acc 68.750 (67.632)	Top-5 acc 85.156 (86.376)	lr 0.00024
Train [113][1610/3239]	Time 0.229 (0.513)	Data Time 0.001 (0.026)	Loss 2.4692 (2.3458)	Entropy 0.52925 (0.52601)	Top-1 acc 62.891 (67.624)	Top-5 acc 85.156 (86.372)	lr 0.00024
Train [113][1620/3239]	Time 0.232 (0.512)	Data Time 0.001 (0.026)	Loss 2.6031 (2.3460)	Entropy 0.52879 (0.52603)	Top-1 acc 63.281 (67.621)	Top-5 acc 80.469 (86.369)	lr 0.00024
Train [113][1630/3239]	Time 0.237 (0.512)	Data Time 0.001 (0.026)	Loss 2.2436 (2.3457)	Entropy 0.52890 (0.52605)	Top-1 acc 72.656 (67.634)	Top-5 acc 89.453 (86.375)	lr 0.00024
Train [113][1640/3239]	Time 0.237 (0.511)	Data Time 0.001 (0.026)	Loss 2.4193 (2.3455)	Entropy 0.52922 (0.52607)	Top-1 acc 64.844 (67.634)	Top-5 acc 83.984 (86.381)	lr 0.00024
Train [113][1650/3239]	Time 0.226 (0.510)	Data Time 0.001 (0.025)	Loss 2.1981 (2.3459)	Entropy 0.52954 (0.52609)	Top-1 acc 69.922 (67.625)	Top-5 acc 88.281 (86.372)	lr 0.00024
Train [113][1660/3239]	Time 0.236 (0.510)	Data Time 0.001 (0.025)	Loss 2.3739 (2.3463)	Entropy 0.52971 (0.52611)	Top-1 acc 68.359 (67.619)	Top-5 acc 84.766 (86.367)	lr 0.00024
Train [113][1670/3239]	Time 0.330 (0.509)	Data Time 0.001 (0.025)	Loss 2.3187 (2.3463)	Entropy 0.52981 (0.52613)	Top-1 acc 67.188 (67.622)	Top-5 acc 87.891 (86.369)	lr 0.00024
Train [113][1680/3239]	Time 0.236 (0.508)	Data Time 0.001 (0.025)	Loss 2.3618 (2.3459)	Entropy 0.52968 (0.52615)	Top-1 acc 64.844 (67.628)	Top-5 acc 89.062 (86.380)	lr 0.00024
Train [113][1690/3239]	Time 0.219 (0.508)	Data Time 0.001 (0.025)	Loss 2.2710 (2.3458)	Entropy 0.52937 (0.52617)	Top-1 acc 71.875 (67.626)	Top-5 acc 88.672 (86.384)	lr 0.00024
Train [113][1700/3239]	Time 0.266 (0.507)	Data Time 0.001 (0.025)	Loss 2.5083 (2.3460)	Entropy 0.52913 (0.52619)	Top-1 acc 65.234 (67.624)	Top-5 acc 82.422 (86.380)	lr 0.00024
Train [113][1710/3239]	Time 0.228 (0.506)	Data Time 0.001 (0.025)	Loss 2.3650 (2.3463)	Entropy 0.52926 (0.52621)	Top-1 acc 69.531 (67.625)	Top-5 acc 85.156 (86.375)	lr 0.00024
Train [113][1720/3239]	Time 0.238 (0.506)	Data Time 0.001 (0.024)	Loss 2.3724 (2.3464)	Entropy 0.52909 (0.52623)	Top-1 acc 68.359 (67.621)	Top-5 acc 85.156 (86.369)	lr 0.00024
Train [113][1730/3239]	Time 0.232 (0.505)	Data Time 0.001 (0.024)	Loss 2.2509 (2.3468)	Entropy 0.52953 (0.52624)	Top-1 acc 73.438 (67.616)	Top-5 acc 86.719 (86.366)	lr 0.00024
Train [113][1740/3239]	Time 0.322 (0.505)	Data Time 0.001 (0.024)	Loss 2.3946 (2.3470)	Entropy 0.52947 (0.52626)	Top-1 acc 68.359 (67.612)	Top-5 acc 85.547 (86.360)	lr 0.00024
Train [113][1750/3239]	Time 0.232 (0.504)	Data Time 0.001 (0.024)	Loss 2.0868 (2.3469)	Entropy 0.52928 (0.52628)	Top-1 acc 71.094 (67.614)	Top-5 acc 91.406 (86.360)	lr 0.00024
Train [113][1760/3239]	Time 0.231 (0.504)	Data Time 0.002 (0.024)	Loss 2.5200 (2.3471)	Entropy 0.52955 (0.52630)	Top-1 acc 62.109 (67.605)	Top-5 acc 83.594 (86.359)	lr 0.00024
Train [113][1770/3239]	Time 0.224 (0.503)	Data Time 0.001 (0.024)	Loss 2.3306 (2.3469)	Entropy 0.52975 (0.52632)	Top-1 acc 71.094 (67.612)	Top-5 acc 85.938 (86.361)	lr 0.00024
Train [113][1780/3239]	Time 0.234 (0.503)	Data Time 0.001 (0.024)	Loss 2.4834 (2.3471)	Entropy 0.52973 (0.52634)	Top-1 acc 65.625 (67.610)	Top-5 acc 86.328 (86.361)	lr 0.00024
Train [113][1790/3239]	Time 0.236 (0.502)	Data Time 0.001 (0.024)	Loss 2.1547 (2.3470)	Entropy 0.52967 (0.52636)	Top-1 acc 69.531 (67.611)	Top-5 acc 89.844 (86.361)	lr 0.00024
Train [113][1800/3239]	Time 0.234 (0.502)	Data Time 0.001 (0.023)	Loss 2.2677 (2.3469)	Entropy 0.52957 (0.52637)	Top-1 acc 71.094 (67.621)	Top-5 acc 87.109 (86.365)	lr 0.00024
Train [113][1810/3239]	Time 0.248 (0.501)	Data Time 0.001 (0.023)	Loss 2.3304 (2.3468)	Entropy 0.52970 (0.52639)	Top-1 acc 66.797 (67.624)	Top-5 acc 85.547 (86.368)	lr 0.00024
Train [113][1820/3239]	Time 0.227 (0.500)	Data Time 0.001 (0.023)	Loss 2.2973 (2.3467)	Entropy 0.52975 (0.52641)	Top-1 acc 68.359 (67.625)	Top-5 acc 88.281 (86.368)	lr 0.00024
Train [113][1830/3239]	Time 0.231 (0.500)	Data Time 0.001 (0.023)	Loss 2.3617 (2.3468)	Entropy 0.52972 (0.52643)	Top-1 acc 68.750 (67.617)	Top-5 acc 85.156 (86.370)	lr 0.00024
Train [113][1840/3239]	Time 0.223 (0.499)	Data Time 0.001 (0.023)	Loss 2.4899 (2.3466)	Entropy 0.52987 (0.52645)	Top-1 acc 64.062 (67.624)	Top-5 acc 86.328 (86.371)	lr 0.00024
Train [113][1850/3239]	Time 0.248 (0.499)	Data Time 0.001 (0.023)	Loss 2.4235 (2.3462)	Entropy 0.52931 (0.52646)	Top-1 acc 66.406 (67.639)	Top-5 acc 87.500 (86.379)	lr 0.00024
Train [113][1860/3239]	Time 0.229 (0.499)	Data Time 0.001 (0.023)	Loss 2.3107 (2.3465)	Entropy 0.52896 (0.52648)	Top-1 acc 68.359 (67.637)	Top-5 acc 86.719 (86.371)	lr 0.00024
Train [113][1870/3239]	Time 0.224 (0.498)	Data Time 0.001 (0.023)	Loss 2.3230 (2.3461)	Entropy 0.52906 (0.52649)	Top-1 acc 71.484 (67.653)	Top-5 acc 87.109 (86.378)	lr 0.00024
Train [113][1880/3239]	Time 0.227 (0.498)	Data Time 0.001 (0.023)	Loss 2.4441 (2.3464)	Entropy 0.52935 (0.52651)	Top-1 acc 64.453 (67.644)	Top-5 acc 83.203 (86.371)	lr 0.00024
Train [113][1890/3239]	Time 0.234 (0.497)	Data Time 0.001 (0.022)	Loss 2.3244 (2.3462)	Entropy 0.52919 (0.52652)	Top-1 acc 68.750 (67.651)	Top-5 acc 84.375 (86.376)	lr 0.00023
Train [113][1900/3239]	Time 0.355 (0.497)	Data Time 0.001 (0.022)	Loss 2.2107 (2.3460)	Entropy 0.52963 (0.52654)	Top-1 acc 70.703 (67.652)	Top-5 acc 87.500 (86.380)	lr 0.00023
Train [113][1910/3239]	Time 0.230 (0.496)	Data Time 0.001 (0.022)	Loss 2.3522 (2.3460)	Entropy 0.52957 (0.52655)	Top-1 acc 70.703 (67.647)	Top-5 acc 87.500 (86.382)	lr 0.00023
Train [113][1920/3239]	Time 0.222 (0.496)	Data Time 0.001 (0.022)	Loss 2.3585 (2.3464)	Entropy 0.52981 (0.52657)	Top-1 acc 69.141 (67.636)	Top-5 acc 86.719 (86.378)	lr 0.00023
Train [113][1930/3239]	Time 0.365 (0.522)	Data Time 0.003 (0.022)	Loss 2.2180 (2.3460)	Entropy 0.52959 (0.52659)	Top-1 acc 70.703 (67.646)	Top-5 acc 88.672 (86.384)	lr 0.00023
Train [113][1940/3239]	Time 0.251 (0.521)	Data Time 0.002 (0.022)	Loss 2.3229 (2.3462)	Entropy 0.52987 (0.52660)	Top-1 acc 68.359 (67.642)	Top-5 acc 87.500 (86.382)	lr 0.00023
Train [113][1950/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.022)	Loss 2.3486 (2.3458)	Entropy 0.53006 (0.52662)	Top-1 acc 66.406 (67.651)	Top-5 acc 84.375 (86.385)	lr 0.00023
Train [113][1960/3239]	Time 0.237 (0.520)	Data Time 0.001 (0.022)	Loss 2.2306 (2.3459)	Entropy 0.53015 (0.52664)	Top-1 acc 71.484 (67.649)	Top-5 acc 87.500 (86.383)	lr 0.00023
Train [113][1970/3239]	Time 0.270 (0.520)	Data Time 0.001 (0.022)	Loss 2.3599 (2.3459)	Entropy 0.53037 (0.52665)	Top-1 acc 67.578 (67.653)	Top-5 acc 83.984 (86.379)	lr 0.00023
Train [113][1980/3239]	Time 0.241 (0.519)	Data Time 0.001 (0.022)	Loss 2.3150 (2.3457)	Entropy 0.53010 (0.52667)	Top-1 acc 70.312 (67.661)	Top-5 acc 87.891 (86.380)	lr 0.00023
Train [113][1990/3239]	Time 0.244 (0.519)	Data Time 0.001 (0.021)	Loss 2.1932 (2.3457)	Entropy 0.52984 (0.52669)	Top-1 acc 69.141 (67.658)	Top-5 acc 88.672 (86.383)	lr 0.00023
Train [113][2000/3239]	Time 0.238 (0.519)	Data Time 0.001 (0.021)	Loss 2.3703 (2.3457)	Entropy 0.52992 (0.52671)	Top-1 acc 69.141 (67.662)	Top-5 acc 84.766 (86.385)	lr 0.00023
Train [113][2010/3239]	Time 0.237 (0.518)	Data Time 0.001 (0.021)	Loss 2.2786 (2.3455)	Entropy 0.52999 (0.52672)	Top-1 acc 70.312 (67.670)	Top-5 acc 86.328 (86.386)	lr 0.00023
Train [113][2020/3239]	Time 0.239 (0.517)	Data Time 0.001 (0.021)	Loss 2.3033 (2.3455)	Entropy 0.53022 (0.52674)	Top-1 acc 70.703 (67.671)	Top-5 acc 86.328 (86.386)	lr 0.00023
Train [113][2030/3239]	Time 0.426 (0.517)	Data Time 0.002 (0.021)	Loss 2.2482 (2.3455)	Entropy 0.53034 (0.52676)	Top-1 acc 67.969 (67.673)	Top-5 acc 89.062 (86.385)	lr 0.00023
Train [113][2040/3239]	Time 0.257 (0.517)	Data Time 0.001 (0.021)	Loss 2.3989 (2.3455)	Entropy 0.53037 (0.52677)	Top-1 acc 60.547 (67.668)	Top-5 acc 88.281 (86.384)	lr 0.00023
Train [113][2050/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.021)	Loss 2.4984 (2.3453)	Entropy 0.53025 (0.52679)	Top-1 acc 60.547 (67.672)	Top-5 acc 84.375 (86.386)	lr 0.00023
Train [113][2060/3239]	Time 0.321 (0.516)	Data Time 0.001 (0.021)	Loss 2.4521 (2.3452)	Entropy 0.53024 (0.52681)	Top-1 acc 67.578 (67.677)	Top-5 acc 82.812 (86.385)	lr 0.00023
Train [113][2070/3239]	Time 0.235 (0.515)	Data Time 0.001 (0.021)	Loss 2.2873 (2.3456)	Entropy 0.53077 (0.52683)	Top-1 acc 66.406 (67.663)	Top-5 acc 89.062 (86.379)	lr 0.00023
Train [113][2080/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.021)	Loss 2.3070 (2.3455)	Entropy 0.53021 (0.52684)	Top-1 acc 70.703 (67.664)	Top-5 acc 85.938 (86.383)	lr 0.00023
Train [113][2090/3239]	Time 0.254 (0.515)	Data Time 0.002 (0.021)	Loss 2.3290 (2.3457)	Entropy 0.52947 (0.52686)	Top-1 acc 71.094 (67.666)	Top-5 acc 86.719 (86.377)	lr 0.00023
Train [113][2100/3239]	Time 0.230 (0.514)	Data Time 0.001 (0.020)	Loss 2.3429 (2.3456)	Entropy 0.52900 (0.52687)	Top-1 acc 67.188 (67.667)	Top-5 acc 88.281 (86.378)	lr 0.00023
Train [113][2110/3239]	Time 0.256 (0.514)	Data Time 0.001 (0.020)	Loss 2.4761 (2.3453)	Entropy 0.52896 (0.52688)	Top-1 acc 65.234 (67.677)	Top-5 acc 85.156 (86.384)	lr 0.00023
Train [113][2120/3239]	Time 0.236 (0.513)	Data Time 0.001 (0.020)	Loss 2.2731 (2.3453)	Entropy 0.52932 (0.52689)	Top-1 acc 69.141 (67.676)	Top-5 acc 86.719 (86.384)	lr 0.00023
Train [113][2130/3239]	Time 0.321 (0.513)	Data Time 0.001 (0.020)	Loss 2.5201 (2.3452)	Entropy 0.52963 (0.52690)	Top-1 acc 66.016 (67.678)	Top-5 acc 85.938 (86.386)	lr 0.00023
Train [113][2140/3239]	Time 0.237 (0.512)	Data Time 0.001 (0.020)	Loss 2.0990 (2.3448)	Entropy 0.52960 (0.52692)	Top-1 acc 73.828 (67.691)	Top-5 acc 91.406 (86.393)	lr 0.00023
Train [113][2150/3239]	Time 0.227 (0.512)	Data Time 0.001 (0.020)	Loss 2.0433 (2.3446)	Entropy 0.52988 (0.52693)	Top-1 acc 74.609 (67.696)	Top-5 acc 90.625 (86.397)	lr 0.00023
Train [113][2160/3239]	Time 0.259 (0.512)	Data Time 0.001 (0.020)	Loss 2.3240 (2.3450)	Entropy 0.53009 (0.52694)	Top-1 acc 68.750 (67.683)	Top-5 acc 83.984 (86.391)	lr 0.00023
Train [113][2170/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.020)	Loss 2.2966 (2.3451)	Entropy 0.53020 (0.52696)	Top-1 acc 71.484 (67.683)	Top-5 acc 86.719 (86.387)	lr 0.00023
Train [113][2180/3239]	Time 0.230 (0.511)	Data Time 0.001 (0.020)	Loss 2.3543 (2.3452)	Entropy 0.53022 (0.52697)	Top-1 acc 62.500 (67.674)	Top-5 acc 85.547 (86.386)	lr 0.00023
Train [113][2190/3239]	Time 0.251 (0.510)	Data Time 0.001 (0.020)	Loss 2.3656 (2.3453)	Entropy 0.53039 (0.52699)	Top-1 acc 68.750 (67.673)	Top-5 acc 87.109 (86.382)	lr 0.00023
Train [113][2200/3239]	Time 0.230 (0.510)	Data Time 0.001 (0.020)	Loss 2.2674 (2.3452)	Entropy 0.53026 (0.52700)	Top-1 acc 67.969 (67.669)	Top-5 acc 88.672 (86.385)	lr 0.00023
Train [113][2210/3239]	Time 0.224 (0.509)	Data Time 0.001 (0.019)	Loss 2.2612 (2.3451)	Entropy 0.53031 (0.52702)	Top-1 acc 67.578 (67.670)	Top-5 acc 88.281 (86.387)	lr 0.00023
Train [113][2220/3239]	Time 0.354 (0.509)	Data Time 0.001 (0.019)	Loss 2.4018 (2.3451)	Entropy 0.53024 (0.52703)	Top-1 acc 64.453 (67.669)	Top-5 acc 85.547 (86.385)	lr 0.00023
Train [113][2230/3239]	Time 0.235 (0.508)	Data Time 0.002 (0.019)	Loss 2.1940 (2.3452)	Entropy 0.53048 (0.52705)	Top-1 acc 72.266 (67.672)	Top-5 acc 87.891 (86.385)	lr 0.00023
Train [113][2240/3239]	Time 0.234 (0.508)	Data Time 0.001 (0.019)	Loss 2.4375 (2.3453)	Entropy 0.53018 (0.52706)	Top-1 acc 67.188 (67.666)	Top-5 acc 84.766 (86.381)	lr 0.00023
Train [113][2250/3239]	Time 0.235 (0.508)	Data Time 0.001 (0.019)	Loss 2.2133 (2.3454)	Entropy 0.52988 (0.52707)	Top-1 acc 71.484 (67.668)	Top-5 acc 89.062 (86.379)	lr 0.00023
Train [113][2260/3239]	Time 0.264 (0.507)	Data Time 0.001 (0.019)	Loss 2.1124 (2.3452)	Entropy 0.53005 (0.52709)	Top-1 acc 76.953 (67.669)	Top-5 acc 89.844 (86.380)	lr 0.00023
Train [113][2270/3239]	Time 0.226 (0.507)	Data Time 0.001 (0.019)	Loss 2.5335 (2.3453)	Entropy 0.53007 (0.52710)	Top-1 acc 67.578 (67.672)	Top-5 acc 83.594 (86.378)	lr 0.00023
Train [113][2280/3239]	Time 0.224 (0.506)	Data Time 0.001 (0.019)	Loss 2.5277 (2.3454)	Entropy 0.53007 (0.52711)	Top-1 acc 66.016 (67.668)	Top-5 acc 83.203 (86.375)	lr 0.00023
Train [113][2290/3239]	Time 0.322 (0.506)	Data Time 0.001 (0.019)	Loss 2.1596 (2.3453)	Entropy 0.52984 (0.52713)	Top-1 acc 68.359 (67.671)	Top-5 acc 91.406 (86.375)	lr 0.00023
Train [113][2300/3239]	Time 0.231 (0.505)	Data Time 0.001 (0.019)	Loss 2.3654 (2.3454)	Entropy 0.52992 (0.52714)	Top-1 acc 68.359 (67.668)	Top-5 acc 83.203 (86.373)	lr 0.00023
Train [113][2310/3239]	Time 0.233 (0.505)	Data Time 0.001 (0.019)	Loss 2.3651 (2.3453)	Entropy 0.52996 (0.52715)	Top-1 acc 66.797 (67.671)	Top-5 acc 83.984 (86.372)	lr 0.00023
Train [113][2320/3239]	Time 0.223 (0.504)	Data Time 0.001 (0.019)	Loss 2.5711 (2.3455)	Entropy 0.53007 (0.52716)	Top-1 acc 60.547 (67.666)	Top-5 acc 83.203 (86.367)	lr 0.00023
Train [113][2330/3239]	Time 0.233 (0.504)	Data Time 0.001 (0.019)	Loss 2.4679 (2.3454)	Entropy 0.53015 (0.52717)	Top-1 acc 64.453 (67.669)	Top-5 acc 84.375 (86.367)	lr 0.00023
Train [113][2340/3239]	Time 0.240 (0.504)	Data Time 0.001 (0.018)	Loss 2.3883 (2.3454)	Entropy 0.53018 (0.52719)	Top-1 acc 69.141 (67.671)	Top-5 acc 83.594 (86.364)	lr 0.00023
Train [113][2350/3239]	Time 0.290 (0.504)	Data Time 0.001 (0.018)	Loss 2.2580 (2.3455)	Entropy 0.53004 (0.52720)	Top-1 acc 66.797 (67.667)	Top-5 acc 88.281 (86.364)	lr 0.00023
Train [113][2360/3239]	Time 0.270 (0.503)	Data Time 0.002 (0.018)	Loss 2.3060 (2.3452)	Entropy 0.53026 (0.52721)	Top-1 acc 72.656 (67.675)	Top-5 acc 85.547 (86.367)	lr 0.00023
Train [113][2370/3239]	Time 0.232 (0.503)	Data Time 0.001 (0.018)	Loss 2.3716 (2.3452)	Entropy 0.53017 (0.52722)	Top-1 acc 69.141 (67.677)	Top-5 acc 83.984 (86.366)	lr 0.00023
Train [113][2380/3239]	Time 0.245 (0.503)	Data Time 0.001 (0.018)	Loss 2.5708 (2.3454)	Entropy 0.52992 (0.52723)	Top-1 acc 64.453 (67.672)	Top-5 acc 82.812 (86.360)	lr 0.00023
Train [113][2390/3239]	Time 0.243 (0.502)	Data Time 0.001 (0.018)	Loss 2.6674 (2.3455)	Entropy 0.52996 (0.52725)	Top-1 acc 60.547 (67.666)	Top-5 acc 78.516 (86.357)	lr 0.00023
Train [113][2400/3239]	Time 0.238 (0.502)	Data Time 0.001 (0.018)	Loss 2.1476 (2.3458)	Entropy 0.53000 (0.52726)	Top-1 acc 74.219 (67.662)	Top-5 acc 89.062 (86.354)	lr 0.00023
Train [113][2410/3239]	Time 0.236 (0.501)	Data Time 0.001 (0.018)	Loss 2.2549 (2.3459)	Entropy 0.52994 (0.52727)	Top-1 acc 74.219 (67.662)	Top-5 acc 87.109 (86.353)	lr 0.00022
Train [113][2420/3239]	Time 0.249 (0.501)	Data Time 0.001 (0.018)	Loss 2.3001 (2.3458)	Entropy 0.52999 (0.52728)	Top-1 acc 67.969 (67.658)	Top-5 acc 89.062 (86.353)	lr 0.00022
Train [113][2430/3239]	Time 0.231 (0.501)	Data Time 0.001 (0.018)	Loss 2.3721 (2.3458)	Entropy 0.53015 (0.52729)	Top-1 acc 66.016 (67.660)	Top-5 acc 86.719 (86.354)	lr 0.00022
Train [113][2440/3239]	Time 0.229 (0.500)	Data Time 0.001 (0.018)	Loss 2.2243 (2.3456)	Entropy 0.52989 (0.52730)	Top-1 acc 71.875 (67.663)	Top-5 acc 88.281 (86.360)	lr 0.00022
Train [113][2450/3239]	Time 0.327 (0.500)	Data Time 0.001 (0.018)	Loss 2.2574 (2.3455)	Entropy 0.52999 (0.52731)	Top-1 acc 70.312 (67.668)	Top-5 acc 88.672 (86.363)	lr 0.00022
Train [113][2460/3239]	Time 0.243 (0.499)	Data Time 0.001 (0.018)	Loss 2.2684 (2.3453)	Entropy 0.52995 (0.52732)	Top-1 acc 67.969 (67.671)	Top-5 acc 87.500 (86.364)	lr 0.00022
Train [113][2470/3239]	Time 0.232 (0.499)	Data Time 0.001 (0.018)	Loss 2.3444 (2.3452)	Entropy 0.53004 (0.52733)	Top-1 acc 67.188 (67.673)	Top-5 acc 85.156 (86.364)	lr 0.00022
Train [113][2480/3239]	Time 0.266 (0.499)	Data Time 0.001 (0.018)	Loss 2.4018 (2.3450)	Entropy 0.52993 (0.52735)	Top-1 acc 66.016 (67.676)	Top-5 acc 85.547 (86.367)	lr 0.00022
Train [113][2490/3239]	Time 0.228 (0.498)	Data Time 0.001 (0.017)	Loss 2.4888 (2.3449)	Entropy 0.52996 (0.52736)	Top-1 acc 64.453 (67.676)	Top-5 acc 83.203 (86.369)	lr 0.00022
Train [113][2500/3239]	Time 0.236 (0.498)	Data Time 0.001 (0.017)	Loss 2.3797 (2.3450)	Entropy 0.53012 (0.52737)	Top-1 acc 66.797 (67.671)	Top-5 acc 86.719 (86.365)	lr 0.00022
Train [113][2510/3239]	Time 0.227 (0.498)	Data Time 0.001 (0.017)	Loss 2.3754 (2.3449)	Entropy 0.53010 (0.52738)	Top-1 acc 66.406 (67.675)	Top-5 acc 86.719 (86.366)	lr 0.00022
Train [113][2520/3239]	Time 0.326 (0.497)	Data Time 0.001 (0.017)	Loss 2.1145 (2.3447)	Entropy 0.53034 (0.52739)	Top-1 acc 76.172 (67.683)	Top-5 acc 89.844 (86.368)	lr 0.00022
Train [113][2530/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.017)	Loss 2.1918 (2.3446)	Entropy 0.53058 (0.52740)	Top-1 acc 73.047 (67.686)	Top-5 acc 86.719 (86.367)	lr 0.00022
Train [113][2540/3239]	Time 0.240 (0.497)	Data Time 0.001 (0.017)	Loss 2.2445 (2.3448)	Entropy 0.53072 (0.52741)	Top-1 acc 69.531 (67.681)	Top-5 acc 88.281 (86.365)	lr 0.00022
Train [113][2550/3239]	Time 0.225 (0.496)	Data Time 0.001 (0.017)	Loss 2.1713 (2.3452)	Entropy 0.53075 (0.52743)	Top-1 acc 73.438 (67.671)	Top-5 acc 89.844 (86.358)	lr 0.00022
Train [113][2560/3239]	Time 0.251 (0.496)	Data Time 0.001 (0.017)	Loss 2.4433 (2.3453)	Entropy 0.53028 (0.52744)	Top-1 acc 69.922 (67.669)	Top-5 acc 85.547 (86.358)	lr 0.00022
Train [113][2570/3239]	Time 0.229 (0.496)	Data Time 0.001 (0.017)	Loss 2.2519 (2.3453)	Entropy 0.53055 (0.52745)	Top-1 acc 69.922 (67.665)	Top-5 acc 85.547 (86.357)	lr 0.00022
Train [113][2580/3239]	Time 0.277 (0.515)	Data Time 0.005 (0.017)	Loss 2.4682 (2.3450)	Entropy 0.53073 (0.52746)	Top-1 acc 64.453 (67.669)	Top-5 acc 86.719 (86.362)	lr 0.00022
Train [113][2590/3239]	Time 0.235 (0.515)	Data Time 0.002 (0.017)	Loss 2.3640 (2.3450)	Entropy 0.53094 (0.52748)	Top-1 acc 69.922 (67.668)	Top-5 acc 85.547 (86.363)	lr 0.00022
Train [113][2600/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.017)	Loss 2.3468 (2.3449)	Entropy 0.53098 (0.52749)	Top-1 acc 66.016 (67.666)	Top-5 acc 87.109 (86.370)	lr 0.00022
Train [113][2610/3239]	Time 0.324 (0.514)	Data Time 0.001 (0.017)	Loss 2.4494 (2.3449)	Entropy 0.53077 (0.52750)	Top-1 acc 65.625 (67.668)	Top-5 acc 86.328 (86.371)	lr 0.00022
Train [113][2620/3239]	Time 0.235 (0.514)	Data Time 0.001 (0.017)	Loss 2.2898 (2.3448)	Entropy 0.53063 (0.52751)	Top-1 acc 69.531 (67.669)	Top-5 acc 86.719 (86.372)	lr 0.00022
Train [113][2630/3239]	Time 0.239 (0.514)	Data Time 0.001 (0.017)	Loss 2.4447 (2.3446)	Entropy 0.53073 (0.52753)	Top-1 acc 65.234 (67.672)	Top-5 acc 87.109 (86.374)	lr 0.00022
Train [113][2640/3239]	Time 0.226 (0.513)	Data Time 0.001 (0.017)	Loss 2.3512 (2.3446)	Entropy 0.53074 (0.52754)	Top-1 acc 71.875 (67.676)	Top-5 acc 85.938 (86.372)	lr 0.00022
Train [113][2650/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.017)	Loss 2.2588 (2.3443)	Entropy 0.53070 (0.52755)	Top-1 acc 70.703 (67.686)	Top-5 acc 87.891 (86.378)	lr 0.00022
Train [113][2660/3239]	Time 0.228 (0.513)	Data Time 0.001 (0.016)	Loss 2.0619 (2.3441)	Entropy 0.53053 (0.52756)	Top-1 acc 77.344 (67.690)	Top-5 acc 92.188 (86.381)	lr 0.00022
Train [113][2670/3239]	Time 0.282 (0.513)	Data Time 0.002 (0.016)	Loss 2.1024 (2.3440)	Entropy 0.53058 (0.52757)	Top-1 acc 73.047 (67.694)	Top-5 acc 91.016 (86.382)	lr 0.00022
Train [113][2680/3239]	Time 0.320 (0.512)	Data Time 0.001 (0.016)	Loss 2.5733 (2.3441)	Entropy 0.53042 (0.52758)	Top-1 acc 60.156 (67.692)	Top-5 acc 84.766 (86.380)	lr 0.00022
Train [113][2690/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.016)	Loss 2.2230 (2.3441)	Entropy 0.53023 (0.52759)	Top-1 acc 71.484 (67.691)	Top-5 acc 88.281 (86.379)	lr 0.00022
Train [113][2700/3239]	Time 0.226 (0.512)	Data Time 0.001 (0.016)	Loss 2.3504 (2.3442)	Entropy 0.53006 (0.52760)	Top-1 acc 65.234 (67.686)	Top-5 acc 85.547 (86.375)	lr 0.00022
Train [113][2710/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.016)	Loss 2.1506 (2.3442)	Entropy 0.52990 (0.52761)	Top-1 acc 75.000 (67.685)	Top-5 acc 88.281 (86.373)	lr 0.00022
Train [113][2720/3239]	Time 0.231 (0.511)	Data Time 0.001 (0.016)	Loss 2.4295 (2.3445)	Entropy 0.53003 (0.52762)	Top-1 acc 67.188 (67.680)	Top-5 acc 84.766 (86.368)	lr 0.00022
Train [113][2730/3239]	Time 0.225 (0.511)	Data Time 0.001 (0.016)	Loss 2.3216 (2.3445)	Entropy 0.52981 (0.52763)	Top-1 acc 66.016 (67.677)	Top-5 acc 87.109 (86.370)	lr 0.00022
Train [113][2740/3239]	Time 0.262 (0.510)	Data Time 0.001 (0.016)	Loss 2.1788 (2.3442)	Entropy 0.52992 (0.52764)	Top-1 acc 73.047 (67.681)	Top-5 acc 86.719 (86.373)	lr 0.00022
Train [113][2750/3239]	Time 0.227 (0.510)	Data Time 0.001 (0.016)	Loss 2.1902 (2.3442)	Entropy 0.53009 (0.52765)	Top-1 acc 69.922 (67.685)	Top-5 acc 87.500 (86.374)	lr 0.00022
Train [113][2760/3239]	Time 0.231 (0.510)	Data Time 0.001 (0.016)	Loss 2.4810 (2.3443)	Entropy 0.52988 (0.52765)	Top-1 acc 64.453 (67.688)	Top-5 acc 80.859 (86.371)	lr 0.00022
Train [113][2770/3239]	Time 0.324 (0.509)	Data Time 0.001 (0.016)	Loss 2.3090 (2.3442)	Entropy 0.52980 (0.52766)	Top-1 acc 70.312 (67.692)	Top-5 acc 85.547 (86.371)	lr 0.00022
Train [113][2780/3239]	Time 0.231 (0.509)	Data Time 0.001 (0.016)	Loss 2.4168 (2.3442)	Entropy 0.52986 (0.52767)	Top-1 acc 66.406 (67.692)	Top-5 acc 85.938 (86.372)	lr 0.00022
Train [113][2790/3239]	Time 0.225 (0.508)	Data Time 0.001 (0.016)	Loss 2.3086 (2.3442)	Entropy 0.53001 (0.52768)	Top-1 acc 69.141 (67.693)	Top-5 acc 85.156 (86.369)	lr 0.00022
Train [113][2800/3239]	Time 0.233 (0.508)	Data Time 0.001 (0.016)	Loss 2.3438 (2.3442)	Entropy 0.53016 (0.52769)	Top-1 acc 64.453 (67.689)	Top-5 acc 85.156 (86.370)	lr 0.00022
Train [113][2810/3239]	Time 0.234 (0.508)	Data Time 0.001 (0.016)	Loss 2.3928 (2.3442)	Entropy 0.53019 (0.52770)	Top-1 acc 62.109 (67.688)	Top-5 acc 86.328 (86.368)	lr 0.00022
Train [113][2820/3239]	Time 0.223 (0.507)	Data Time 0.001 (0.016)	Loss 2.5277 (2.3443)	Entropy 0.53030 (0.52770)	Top-1 acc 60.547 (67.684)	Top-5 acc 83.984 (86.367)	lr 0.00022
Train [113][2830/3239]	Time 0.228 (0.507)	Data Time 0.001 (0.016)	Loss 2.5321 (2.3443)	Entropy 0.53067 (0.52771)	Top-1 acc 64.844 (67.683)	Top-5 acc 81.250 (86.366)	lr 0.00022
Train [113][2840/3239]	Time 0.325 (0.507)	Data Time 0.001 (0.016)	Loss 2.3146 (2.3443)	Entropy 0.53086 (0.52773)	Top-1 acc 70.703 (67.685)	Top-5 acc 87.891 (86.368)	lr 0.00022
Train [113][2850/3239]	Time 0.236 (0.506)	Data Time 0.001 (0.015)	Loss 2.3377 (2.3440)	Entropy 0.53100 (0.52774)	Top-1 acc 69.531 (67.690)	Top-5 acc 84.766 (86.371)	lr 0.00022
Train [113][2860/3239]	Time 0.227 (0.506)	Data Time 0.001 (0.015)	Loss 2.3329 (2.3441)	Entropy 0.53078 (0.52775)	Top-1 acc 71.484 (67.691)	Top-5 acc 87.109 (86.371)	lr 0.00022
Train [113][2870/3239]	Time 0.229 (0.506)	Data Time 0.001 (0.015)	Loss 2.3969 (2.3441)	Entropy 0.53078 (0.52776)	Top-1 acc 69.141 (67.690)	Top-5 acc 83.984 (86.367)	lr 0.00022
Train [113][2880/3239]	Time 0.224 (0.505)	Data Time 0.001 (0.015)	Loss 2.2076 (2.3440)	Entropy 0.53068 (0.52777)	Top-1 acc 70.703 (67.692)	Top-5 acc 89.062 (86.372)	lr 0.00022
Train [113][2890/3239]	Time 0.229 (0.505)	Data Time 0.001 (0.015)	Loss 2.3583 (2.3440)	Entropy 0.53081 (0.52778)	Top-1 acc 67.578 (67.693)	Top-5 acc 86.719 (86.372)	lr 0.00022
Train [113][2900/3239]	Time 0.229 (0.505)	Data Time 0.001 (0.015)	Loss 2.0821 (2.3440)	Entropy 0.53073 (0.52779)	Top-1 acc 73.828 (67.693)	Top-5 acc 91.797 (86.372)	lr 0.00022
Train [113][2910/3239]	Time 0.228 (0.505)	Data Time 0.001 (0.015)	Loss 2.3869 (2.3443)	Entropy 0.53014 (0.52780)	Top-1 acc 69.531 (67.689)	Top-5 acc 87.109 (86.370)	lr 0.00022
Train [113][2920/3239]	Time 0.232 (0.504)	Data Time 0.001 (0.015)	Loss 2.4841 (2.3442)	Entropy 0.53020 (0.52781)	Top-1 acc 63.672 (67.693)	Top-5 acc 83.203 (86.369)	lr 0.00022
Train [113][2930/3239]	Time 0.333 (0.504)	Data Time 0.001 (0.015)	Loss 2.5780 (2.3443)	Entropy 0.53007 (0.52781)	Top-1 acc 63.281 (67.691)	Top-5 acc 83.203 (86.367)	lr 0.00022
Train [113][2940/3239]	Time 0.233 (0.503)	Data Time 0.001 (0.015)	Loss 2.2907 (2.3441)	Entropy 0.52960 (0.52782)	Top-1 acc 65.625 (67.695)	Top-5 acc 89.062 (86.371)	lr 0.00021
Train [113][2950/3239]	Time 0.229 (0.503)	Data Time 0.001 (0.015)	Loss 2.4537 (2.3444)	Entropy 0.52975 (0.52783)	Top-1 acc 62.891 (67.688)	Top-5 acc 84.766 (86.368)	lr 0.00021
Train [113][2960/3239]	Time 0.222 (0.503)	Data Time 0.001 (0.015)	Loss 2.6144 (2.3443)	Entropy 0.52986 (0.52783)	Top-1 acc 58.984 (67.688)	Top-5 acc 81.250 (86.370)	lr 0.00021
Train [113][2970/3239]	Time 0.261 (0.503)	Data Time 0.001 (0.015)	Loss 2.2597 (2.3442)	Entropy 0.52940 (0.52784)	Top-1 acc 71.484 (67.689)	Top-5 acc 87.500 (86.369)	lr 0.00021
Train [113][2980/3239]	Time 0.232 (0.503)	Data Time 0.001 (0.015)	Loss 2.5260 (2.3442)	Entropy 0.52937 (0.52785)	Top-1 acc 66.406 (67.690)	Top-5 acc 81.250 (86.371)	lr 0.00021
Train [113][2990/3239]	Time 0.254 (0.503)	Data Time 0.001 (0.015)	Loss 2.3158 (2.3442)	Entropy 0.52921 (0.52785)	Top-1 acc 67.578 (67.690)	Top-5 acc 89.453 (86.370)	lr 0.00021
Train [113][3000/3239]	Time 0.320 (0.502)	Data Time 0.001 (0.015)	Loss 2.4021 (2.3443)	Entropy 0.52964 (0.52786)	Top-1 acc 68.750 (67.690)	Top-5 acc 85.547 (86.367)	lr 0.00021
Train [113][3010/3239]	Time 0.232 (0.502)	Data Time 0.001 (0.015)	Loss 2.2340 (2.3443)	Entropy 0.52980 (0.52786)	Top-1 acc 69.141 (67.692)	Top-5 acc 87.891 (86.368)	lr 0.00021
Train [113][3020/3239]	Time 0.230 (0.502)	Data Time 0.001 (0.015)	Loss 2.6656 (2.3445)	Entropy 0.52964 (0.52787)	Top-1 acc 59.766 (67.682)	Top-5 acc 79.297 (86.363)	lr 0.00021
Train [113][3030/3239]	Time 0.227 (0.501)	Data Time 0.001 (0.015)	Loss 2.2982 (2.3444)	Entropy 0.52959 (0.52787)	Top-1 acc 69.531 (67.685)	Top-5 acc 87.891 (86.365)	lr 0.00021
Train [113][3040/3239]	Time 0.235 (0.501)	Data Time 0.001 (0.015)	Loss 2.3757 (2.3445)	Entropy 0.52917 (0.52788)	Top-1 acc 66.797 (67.681)	Top-5 acc 84.375 (86.364)	lr 0.00021
Train [113][3050/3239]	Time 0.234 (0.501)	Data Time 0.001 (0.015)	Loss 2.3859 (2.3446)	Entropy 0.52938 (0.52788)	Top-1 acc 64.844 (67.680)	Top-5 acc 83.984 (86.362)	lr 0.00021
Train [113][3060/3239]	Time 0.229 (0.500)	Data Time 0.001 (0.015)	Loss 2.2954 (2.3445)	Entropy 0.52929 (0.52789)	Top-1 acc 71.484 (67.683)	Top-5 acc 87.891 (86.361)	lr 0.00021
Train [113][3070/3239]	Time 0.239 (0.500)	Data Time 0.001 (0.014)	Loss 2.3921 (2.3444)	Entropy 0.52941 (0.52789)	Top-1 acc 66.797 (67.684)	Top-5 acc 87.109 (86.362)	lr 0.00021
Train [113][3080/3239]	Time 0.235 (0.500)	Data Time 0.001 (0.014)	Loss 2.1393 (2.3443)	Entropy 0.52954 (0.52790)	Top-1 acc 71.094 (67.688)	Top-5 acc 89.844 (86.363)	lr 0.00021
Train [113][3090/3239]	Time 0.231 (0.500)	Data Time 0.001 (0.014)	Loss 2.3618 (2.3443)	Entropy 0.52973 (0.52790)	Top-1 acc 65.234 (67.688)	Top-5 acc 87.109 (86.363)	lr 0.00021
Train [113][3100/3239]	Time 0.225 (0.499)	Data Time 0.001 (0.014)	Loss 2.3817 (2.3445)	Entropy 0.53007 (0.52791)	Top-1 acc 66.016 (67.686)	Top-5 acc 87.109 (86.358)	lr 0.00021
Train [113][3110/3239]	Time 0.229 (0.499)	Data Time 0.001 (0.014)	Loss 2.5053 (2.3445)	Entropy 0.53022 (0.52792)	Top-1 acc 65.234 (67.685)	Top-5 acc 83.594 (86.356)	lr 0.00021
Train [113][3120/3239]	Time 0.227 (0.499)	Data Time 0.001 (0.014)	Loss 2.2734 (2.3445)	Entropy 0.53032 (0.52792)	Top-1 acc 69.141 (67.684)	Top-5 acc 87.500 (86.355)	lr 0.00021
Train [113][3130/3239]	Time 0.228 (0.498)	Data Time 0.001 (0.014)	Loss 2.2848 (2.3442)	Entropy 0.53058 (0.52793)	Top-1 acc 71.484 (67.689)	Top-5 acc 84.766 (86.357)	lr 0.00021
Train [113][3140/3239]	Time 0.267 (0.498)	Data Time 0.001 (0.014)	Loss 2.0730 (2.3443)	Entropy 0.53067 (0.52794)	Top-1 acc 73.828 (67.688)	Top-5 acc 92.969 (86.356)	lr 0.00021
Train [113][3150/3239]	Time 0.246 (0.498)	Data Time 0.001 (0.014)	Loss 2.2048 (2.3443)	Entropy 0.53057 (0.52795)	Top-1 acc 73.047 (67.686)	Top-5 acc 88.281 (86.355)	lr 0.00021
Train [113][3160/3239]	Time 0.329 (0.497)	Data Time 0.001 (0.014)	Loss 2.2277 (2.3444)	Entropy 0.53081 (0.52796)	Top-1 acc 74.609 (67.685)	Top-5 acc 89.453 (86.353)	lr 0.00021
Train [113][3170/3239]	Time 0.235 (0.497)	Data Time 0.001 (0.014)	Loss 2.3356 (2.3444)	Entropy 0.53072 (0.52797)	Top-1 acc 69.922 (67.684)	Top-5 acc 85.156 (86.352)	lr 0.00021
Train [113][3180/3239]	Time 0.222 (0.497)	Data Time 0.000 (0.014)	Loss 2.2975 (2.3444)	Entropy 0.53077 (0.52798)	Top-1 acc 69.922 (67.684)	Top-5 acc 89.062 (86.356)	lr 0.00021
Train [113][3190/3239]	Time 0.230 (0.497)	Data Time 0.000 (0.014)	Loss 2.1557 (2.3444)	Entropy 0.53063 (0.52798)	Top-1 acc 74.609 (67.681)	Top-5 acc 87.500 (86.354)	lr 0.00021
Train [113][3200/3239]	Time 0.217 (0.496)	Data Time 0.000 (0.014)	Loss 2.2522 (2.3443)	Entropy 0.53101 (0.52799)	Top-1 acc 69.141 (67.682)	Top-5 acc 89.062 (86.354)	lr 0.00021
Train [113][3210/3239]	Time 0.222 (0.496)	Data Time 0.000 (0.014)	Loss 2.3697 (2.3446)	Entropy 0.53038 (0.52800)	Top-1 acc 65.234 (67.673)	Top-5 acc 84.375 (86.349)	lr 0.00021
Train [113][3220/3239]	Time 0.222 (0.495)	Data Time 0.000 (0.014)	Loss 2.3142 (2.3446)	Entropy 0.53033 (0.52801)	Top-1 acc 69.141 (67.673)	Top-5 acc 87.109 (86.350)	lr 0.00021
Train [113][3230/3239]	Time 0.303 (0.495)	Data Time 0.000 (0.014)	Loss 2.5242 (2.3447)	Entropy 0.53024 (0.52802)	Top-1 acc 60.547 (67.670)	Top-5 acc 85.156 (86.350)	lr 0.00021
Train [113][3239/3239]	Time 1.332 (0.510)	Data Time 0.000 (0.014)	Loss 2.7243 (2.3447)	Entropy 0.53001 (0.52802)	Top-1 acc 59.259 (67.670)	Top-5 acc 81.481 (86.351)	lr 0.00021
==========Valid [113/120]	loss 1.170	top-1 acc 72.973 (73.154)	top-5 acc 90.585	Train top-1 67.670	top-5 86.351	Entropy 0.53001	Latency-None: 0.000ms	Flops: 539.00M
Train [114][0/3239]	Time 37.825 (37.825)	Data Time 36.878 (36.878)	Loss 2.2736 (2.2736)	Entropy 0.52997 (0.52997)	Top-1 acc 71.484 (71.484)	Top-5 acc 87.500 (87.500)	lr 0.00021
Train [114][10/3239]	Time 0.247 (4.075)	Data Time 0.001 (3.462)	Loss 2.2678 (2.3812)	Entropy 0.53014 (0.53002)	Top-1 acc 67.188 (66.371)	Top-5 acc 87.109 (85.298)	lr 0.00021
Train [114][20/3239]	Time 0.230 (2.331)	Data Time 0.001 (1.814)	Loss 2.1003 (2.3064)	Entropy 0.53041 (0.53012)	Top-1 acc 75.391 (68.080)	Top-5 acc 89.062 (86.849)	lr 0.00021
Train [114][30/3239]	Time 0.240 (1.713)	Data Time 0.001 (1.229)	Loss 2.3458 (2.3179)	Entropy 0.53073 (0.53024)	Top-1 acc 66.797 (67.755)	Top-5 acc 84.375 (86.593)	lr 0.00021
Train [114][40/3239]	Time 0.236 (1.399)	Data Time 0.001 (0.930)	Loss 2.1696 (2.3063)	Entropy 0.53079 (0.53038)	Top-1 acc 74.219 (68.331)	Top-5 acc 89.453 (86.766)	lr 0.00021
Train [114][50/3239]	Time 0.235 (1.210)	Data Time 0.001 (0.748)	Loss 2.5800 (2.3101)	Entropy 0.53068 (0.53044)	Top-1 acc 60.938 (68.421)	Top-5 acc 83.203 (86.734)	lr 0.00021
Train [114][60/3239]	Time 0.369 (1.083)	Data Time 0.001 (0.626)	Loss 2.3523 (2.3245)	Entropy 0.53051 (0.53046)	Top-1 acc 69.531 (68.135)	Top-5 acc 85.938 (86.507)	lr 0.00021
Train [114][70/3239]	Time 0.244 (0.991)	Data Time 0.001 (0.538)	Loss 2.2112 (2.3161)	Entropy 0.53065 (0.53047)	Top-1 acc 68.359 (68.139)	Top-5 acc 89.453 (86.812)	lr 0.00021
Train [114][80/3239]	Time 0.235 (0.921)	Data Time 0.001 (0.472)	Loss 2.3197 (2.3248)	Entropy 0.53071 (0.53050)	Top-1 acc 65.234 (67.848)	Top-5 acc 86.719 (86.651)	lr 0.00021
Train [114][90/3239]	Time 0.244 (0.868)	Data Time 0.001 (0.420)	Loss 2.2725 (2.3200)	Entropy 0.53064 (0.53053)	Top-1 acc 68.750 (67.866)	Top-5 acc 87.891 (86.779)	lr 0.00021
Train [114][100/3239]	Time 0.270 (0.823)	Data Time 0.001 (0.378)	Loss 2.1281 (2.3300)	Entropy 0.53056 (0.53053)	Top-1 acc 72.266 (67.586)	Top-5 acc 90.234 (86.665)	lr 0.00021
Train [114][110/3239]	Time 0.270 (0.787)	Data Time 0.001 (0.345)	Loss 2.2178 (2.3299)	Entropy 0.53051 (0.53053)	Top-1 acc 72.266 (67.568)	Top-5 acc 87.891 (86.666)	lr 0.00021
Train [114][120/3239]	Time 0.258 (0.757)	Data Time 0.001 (0.316)	Loss 2.2562 (2.3280)	Entropy 0.53039 (0.53053)	Top-1 acc 69.531 (67.543)	Top-5 acc 89.062 (86.728)	lr 0.00021
Train [114][130/3239]	Time 0.234 (0.733)	Data Time 0.001 (0.292)	Loss 2.4930 (2.3282)	Entropy 0.53042 (0.53052)	Top-1 acc 64.062 (67.539)	Top-5 acc 83.984 (86.749)	lr 0.00021
Train [114][140/3239]	Time 0.241 (0.712)	Data Time 0.001 (0.272)	Loss 2.2013 (2.3285)	Entropy 0.53020 (0.53051)	Top-1 acc 70.312 (67.553)	Top-5 acc 88.672 (86.694)	lr 0.00021
Train [114][150/3239]	Time 0.372 (0.699)	Data Time 0.004 (0.254)	Loss 2.3682 (2.3273)	Entropy 0.53026 (0.53049)	Top-1 acc 69.531 (67.617)	Top-5 acc 86.328 (86.662)	lr 0.00021
Train [114][160/3239]	Time 0.228 (0.680)	Data Time 0.001 (0.238)	Loss 2.5076 (2.3310)	Entropy 0.52995 (0.53047)	Top-1 acc 62.500 (67.564)	Top-5 acc 82.812 (86.595)	lr 0.00021
Train [114][170/3239]	Time 0.235 (0.664)	Data Time 0.002 (0.224)	Loss 2.3103 (2.3277)	Entropy 0.53017 (0.53045)	Top-1 acc 67.578 (67.667)	Top-5 acc 86.719 (86.634)	lr 0.00021
Train [114][180/3239]	Time 0.233 (0.651)	Data Time 0.001 (0.212)	Loss 2.3282 (2.3289)	Entropy 0.53027 (0.53044)	Top-1 acc 67.969 (67.682)	Top-5 acc 85.547 (86.591)	lr 0.00021
Train [114][190/3239]	Time 0.232 (0.639)	Data Time 0.001 (0.201)	Loss 2.2823 (2.3263)	Entropy 0.53051 (0.53043)	Top-1 acc 65.625 (67.760)	Top-5 acc 86.719 (86.623)	lr 0.00021
Train [114][200/3239]	Time 0.235 (0.627)	Data Time 0.001 (0.191)	Loss 2.2122 (2.3263)	Entropy 0.52967 (0.53042)	Top-1 acc 71.875 (67.772)	Top-5 acc 89.844 (86.620)	lr 0.00021
Train [114][210/3239]	Time 0.297 (0.622)	Data Time 0.002 (0.182)	Loss 2.3699 (2.3259)	Entropy 0.52952 (0.53039)	Top-1 acc 65.234 (67.761)	Top-5 acc 86.719 (86.656)	lr 0.00021
Train [114][220/3239]	Time 0.403 (0.618)	Data Time 0.002 (0.174)	Loss 2.1476 (2.3240)	Entropy 0.52952 (0.53035)	Top-1 acc 75.000 (67.806)	Top-5 acc 90.234 (86.675)	lr 0.00021
Train [114][230/3239]	Time 0.227 (0.610)	Data Time 0.001 (0.167)	Loss 2.6150 (2.3250)	Entropy 0.52954 (0.53032)	Top-1 acc 63.672 (67.793)	Top-5 acc 80.078 (86.665)	lr 0.00021
Train [114][240/3239]	Time 0.232 (0.602)	Data Time 0.001 (0.160)	Loss 2.3343 (2.3272)	Entropy 0.52953 (0.53028)	Top-1 acc 67.188 (67.782)	Top-5 acc 85.938 (86.628)	lr 0.00020
Train [114][250/3239]	Time 0.223 (0.595)	Data Time 0.001 (0.153)	Loss 2.2282 (2.3269)	Entropy 0.52954 (0.53025)	Top-1 acc 69.531 (67.798)	Top-5 acc 87.891 (86.619)	lr 0.00020
Train [114][260/3239]	Time 0.229 (0.588)	Data Time 0.001 (0.148)	Loss 2.3504 (2.3278)	Entropy 0.52949 (0.53022)	Top-1 acc 66.016 (67.803)	Top-5 acc 85.547 (86.599)	lr 0.00020
Train [114][270/3239]	Time 0.244 (0.582)	Data Time 0.001 (0.142)	Loss 2.4970 (2.3296)	Entropy 0.52960 (0.53020)	Top-1 acc 67.188 (67.816)	Top-5 acc 82.812 (86.566)	lr 0.00020
Train [114][280/3239]	Time 0.239 (0.576)	Data Time 0.001 (0.137)	Loss 2.0541 (2.3315)	Entropy 0.52930 (0.53018)	Top-1 acc 73.438 (67.770)	Top-5 acc 94.141 (86.553)	lr 0.00020
Train [114][290/3239]	Time 0.231 (0.571)	Data Time 0.001 (0.133)	Loss 2.3885 (2.3336)	Entropy 0.52940 (0.53015)	Top-1 acc 67.188 (67.753)	Top-5 acc 83.984 (86.513)	lr 0.00020
Train [114][300/3239]	Time 0.239 (0.567)	Data Time 0.001 (0.128)	Loss 2.1987 (2.3321)	Entropy 0.52963 (0.53013)	Top-1 acc 69.531 (67.781)	Top-5 acc 88.281 (86.527)	lr 0.00020
Train [114][310/3239]	Time 0.265 (0.562)	Data Time 0.003 (0.124)	Loss 2.3908 (2.3322)	Entropy 0.52968 (0.53011)	Top-1 acc 67.188 (67.788)	Top-5 acc 84.375 (86.518)	lr 0.00020
Train [114][320/3239]	Time 0.234 (0.558)	Data Time 0.001 (0.120)	Loss 2.5535 (2.3345)	Entropy 0.52946 (0.53010)	Top-1 acc 58.594 (67.738)	Top-5 acc 82.422 (86.474)	lr 0.00020
Train [114][330/3239]	Time 0.284 (0.554)	Data Time 0.002 (0.117)	Loss 2.4643 (2.3336)	Entropy 0.52930 (0.53007)	Top-1 acc 64.062 (67.760)	Top-5 acc 84.375 (86.502)	lr 0.00020
Train [114][340/3239]	Time 0.232 (0.552)	Data Time 0.001 (0.113)	Loss 2.1362 (2.3333)	Entropy 0.52894 (0.53005)	Top-1 acc 69.922 (67.757)	Top-5 acc 90.234 (86.515)	lr 0.00020
Train [114][350/3239]	Time 0.234 (0.548)	Data Time 0.001 (0.110)	Loss 2.3954 (2.3325)	Entropy 0.52919 (0.53002)	Top-1 acc 68.750 (67.783)	Top-5 acc 83.594 (86.525)	lr 0.00020
Train [114][360/3239]	Time 0.229 (0.544)	Data Time 0.001 (0.107)	Loss 2.3540 (2.3350)	Entropy 0.52927 (0.52999)	Top-1 acc 66.016 (67.727)	Top-5 acc 85.938 (86.489)	lr 0.00020
Train [114][370/3239]	Time 0.229 (0.540)	Data Time 0.001 (0.104)	Loss 2.2980 (2.3336)	Entropy 0.52932 (0.52998)	Top-1 acc 67.188 (67.756)	Top-5 acc 86.328 (86.497)	lr 0.00020
Train [114][380/3239]	Time 0.327 (0.537)	Data Time 0.001 (0.102)	Loss 2.3060 (2.3331)	Entropy 0.52949 (0.52996)	Top-1 acc 66.406 (67.757)	Top-5 acc 86.328 (86.497)	lr 0.00020
Train [114][390/3239]	Time 0.237 (0.533)	Data Time 0.001 (0.099)	Loss 2.4262 (2.3333)	Entropy 0.52920 (0.52995)	Top-1 acc 68.750 (67.770)	Top-5 acc 84.766 (86.476)	lr 0.00020
Train [114][400/3239]	Time 0.237 (0.530)	Data Time 0.001 (0.097)	Loss 2.6475 (2.3337)	Entropy 0.52896 (0.52992)	Top-1 acc 56.250 (67.766)	Top-5 acc 83.594 (86.479)	lr 0.00020
Train [114][410/3239]	Time 0.265 (0.528)	Data Time 0.001 (0.094)	Loss 2.3261 (2.3327)	Entropy 0.52872 (0.52990)	Top-1 acc 70.703 (67.810)	Top-5 acc 87.109 (86.493)	lr 0.00020
Train [114][420/3239]	Time 0.229 (0.525)	Data Time 0.001 (0.092)	Loss 2.3570 (2.3326)	Entropy 0.52905 (0.52987)	Top-1 acc 66.016 (67.818)	Top-5 acc 85.938 (86.490)	lr 0.00020
Train [114][430/3239]	Time 0.245 (0.522)	Data Time 0.001 (0.090)	Loss 2.1970 (2.3341)	Entropy 0.52904 (0.52986)	Top-1 acc 67.969 (67.786)	Top-5 acc 87.891 (86.462)	lr 0.00020
Train [114][440/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.088)	Loss 2.2558 (2.3339)	Entropy 0.52911 (0.52984)	Top-1 acc 71.094 (67.790)	Top-5 acc 89.453 (86.468)	lr 0.00020
Train [114][450/3239]	Time 0.312 (0.517)	Data Time 0.001 (0.086)	Loss 2.1831 (2.3346)	Entropy 0.52901 (0.52982)	Top-1 acc 67.969 (67.770)	Top-5 acc 90.625 (86.438)	lr 0.00020
Train [114][460/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.084)	Loss 2.3748 (2.3340)	Entropy 0.52938 (0.52980)	Top-1 acc 66.797 (67.787)	Top-5 acc 81.641 (86.441)	lr 0.00020
Train [114][470/3239]	Time 0.231 (0.512)	Data Time 0.001 (0.082)	Loss 2.4986 (2.3351)	Entropy 0.52925 (0.52979)	Top-1 acc 63.672 (67.732)	Top-5 acc 83.203 (86.414)	lr 0.00020
Train [114][480/3239]	Time 0.229 (0.510)	Data Time 0.001 (0.081)	Loss 2.5736 (2.3370)	Entropy 0.52927 (0.52978)	Top-1 acc 61.719 (67.690)	Top-5 acc 82.031 (86.374)	lr 0.00020
Train [114][490/3239]	Time 0.231 (0.507)	Data Time 0.001 (0.079)	Loss 2.4415 (2.3370)	Entropy 0.52945 (0.52977)	Top-1 acc 67.188 (67.703)	Top-5 acc 83.203 (86.369)	lr 0.00020
Train [114][500/3239]	Time 0.230 (0.505)	Data Time 0.001 (0.078)	Loss 2.3324 (2.3376)	Entropy 0.52964 (0.52977)	Top-1 acc 67.578 (67.682)	Top-5 acc 88.672 (86.375)	lr 0.00020
Train [114][510/3239]	Time 0.226 (0.503)	Data Time 0.001 (0.076)	Loss 2.4878 (2.3391)	Entropy 0.52988 (0.52977)	Top-1 acc 62.500 (67.658)	Top-5 acc 83.594 (86.339)	lr 0.00020
Train [114][520/3239]	Time 0.232 (0.501)	Data Time 0.001 (0.075)	Loss 2.3819 (2.3394)	Entropy 0.52975 (0.52977)	Top-1 acc 68.359 (67.679)	Top-5 acc 85.938 (86.342)	lr 0.00020
Train [114][530/3239]	Time 0.221 (0.499)	Data Time 0.001 (0.073)	Loss 2.4792 (2.3393)	Entropy 0.52996 (0.52977)	Top-1 acc 66.406 (67.700)	Top-5 acc 82.422 (86.334)	lr 0.00020
Train [114][540/3239]	Time 0.312 (0.498)	Data Time 0.001 (0.072)	Loss 2.4099 (2.3398)	Entropy 0.53040 (0.52978)	Top-1 acc 64.453 (67.681)	Top-5 acc 83.203 (86.333)	lr 0.00020
Train [114][550/3239]	Time 0.237 (0.496)	Data Time 0.002 (0.071)	Loss 2.4136 (2.3394)	Entropy 0.53007 (0.52979)	Top-1 acc 62.891 (67.692)	Top-5 acc 83.984 (86.342)	lr 0.00020
Train [114][560/3239]	Time 0.234 (0.494)	Data Time 0.001 (0.070)	Loss 2.5002 (2.3397)	Entropy 0.52987 (0.52979)	Top-1 acc 64.453 (67.687)	Top-5 acc 81.641 (86.336)	lr 0.00020
Train [114][570/3239]	Time 0.223 (0.493)	Data Time 0.001 (0.068)	Loss 2.7868 (2.3398)	Entropy 0.52993 (0.52980)	Top-1 acc 58.594 (67.698)	Top-5 acc 80.469 (86.341)	lr 0.00020
Train [114][580/3239]	Time 0.222 (0.492)	Data Time 0.001 (0.067)	Loss 2.4710 (2.3403)	Entropy 0.52967 (0.52980)	Top-1 acc 63.672 (67.680)	Top-5 acc 82.422 (86.335)	lr 0.00020
Train [114][590/3239]	Time 0.236 (0.491)	Data Time 0.001 (0.066)	Loss 2.4471 (2.3408)	Entropy 0.52998 (0.52980)	Top-1 acc 67.188 (67.680)	Top-5 acc 82.812 (86.329)	lr 0.00020
Train [114][600/3239]	Time 0.227 (0.489)	Data Time 0.001 (0.065)	Loss 2.4453 (2.3400)	Entropy 0.53017 (0.52981)	Top-1 acc 65.625 (67.711)	Top-5 acc 84.375 (86.342)	lr 0.00020
Train [114][610/3239]	Time 0.432 (0.488)	Data Time 0.002 (0.064)	Loss 2.1530 (2.3392)	Entropy 0.53006 (0.52981)	Top-1 acc 73.438 (67.737)	Top-5 acc 91.016 (86.359)	lr 0.00020
Train [114][620/3239]	Time 0.284 (0.487)	Data Time 0.002 (0.063)	Loss 2.3220 (2.3380)	Entropy 0.52995 (0.52981)	Top-1 acc 69.141 (67.764)	Top-5 acc 88.281 (86.386)	lr 0.00020
Train [114][630/3239]	Time 0.233 (0.486)	Data Time 0.001 (0.062)	Loss 2.3878 (2.3380)	Entropy 0.52989 (0.52982)	Top-1 acc 65.234 (67.766)	Top-5 acc 85.938 (86.378)	lr 0.00020
Train [114][640/3239]	Time 0.238 (0.485)	Data Time 0.001 (0.061)	Loss 2.3873 (2.3383)	Entropy 0.53002 (0.52982)	Top-1 acc 64.453 (67.759)	Top-5 acc 85.938 (86.376)	lr 0.00020
Train [114][650/3239]	Time 0.307 (0.561)	Data Time 0.005 (0.060)	Loss 2.5938 (2.3377)	Entropy 0.53011 (0.52982)	Top-1 acc 58.984 (67.777)	Top-5 acc 84.375 (86.391)	lr 0.00020
Train [114][660/3239]	Time 0.239 (0.560)	Data Time 0.002 (0.059)	Loss 2.1478 (2.3368)	Entropy 0.53012 (0.52983)	Top-1 acc 75.000 (67.789)	Top-5 acc 88.281 (86.407)	lr 0.00020
Train [114][670/3239]	Time 0.234 (0.558)	Data Time 0.001 (0.058)	Loss 2.4315 (2.3388)	Entropy 0.53017 (0.52983)	Top-1 acc 62.109 (67.739)	Top-5 acc 87.109 (86.385)	lr 0.00020
Train [114][680/3239]	Time 0.234 (0.556)	Data Time 0.001 (0.058)	Loss 2.3184 (2.3384)	Entropy 0.53028 (0.52983)	Top-1 acc 69.531 (67.749)	Top-5 acc 86.719 (86.387)	lr 0.00020
Train [114][690/3239]	Time 0.237 (0.554)	Data Time 0.001 (0.057)	Loss 2.3919 (2.3383)	Entropy 0.53020 (0.52984)	Top-1 acc 65.625 (67.743)	Top-5 acc 85.938 (86.395)	lr 0.00020
Train [114][700/3239]	Time 0.342 (0.552)	Data Time 0.001 (0.056)	Loss 2.4903 (2.3374)	Entropy 0.53007 (0.52984)	Top-1 acc 62.109 (67.780)	Top-5 acc 83.594 (86.408)	lr 0.00020
Train [114][710/3239]	Time 0.240 (0.550)	Data Time 0.001 (0.055)	Loss 2.7303 (2.3386)	Entropy 0.52998 (0.52985)	Top-1 acc 61.719 (67.754)	Top-5 acc 79.297 (86.387)	lr 0.00020
Train [114][720/3239]	Time 0.248 (0.549)	Data Time 0.001 (0.055)	Loss 2.3640 (2.3380)	Entropy 0.53020 (0.52985)	Top-1 acc 67.188 (67.767)	Top-5 acc 85.938 (86.397)	lr 0.00020
Train [114][730/3239]	Time 0.318 (0.548)	Data Time 0.002 (0.054)	Loss 2.2209 (2.3380)	Entropy 0.52981 (0.52985)	Top-1 acc 69.531 (67.764)	Top-5 acc 87.109 (86.403)	lr 0.00020
Train [114][740/3239]	Time 0.234 (0.547)	Data Time 0.001 (0.053)	Loss 2.1597 (2.3383)	Entropy 0.52986 (0.52985)	Top-1 acc 70.703 (67.750)	Top-5 acc 88.281 (86.403)	lr 0.00020
Train [114][750/3239]	Time 0.234 (0.545)	Data Time 0.001 (0.052)	Loss 2.4081 (2.3391)	Entropy 0.52976 (0.52985)	Top-1 acc 67.188 (67.739)	Top-5 acc 86.328 (86.385)	lr 0.00020
Train [114][760/3239]	Time 0.232 (0.543)	Data Time 0.001 (0.052)	Loss 2.1774 (2.3391)	Entropy 0.52986 (0.52985)	Top-1 acc 70.703 (67.744)	Top-5 acc 89.062 (86.380)	lr 0.00020
Train [114][770/3239]	Time 0.317 (0.541)	Data Time 0.001 (0.051)	Loss 2.3815 (2.3398)	Entropy 0.52998 (0.52985)	Top-1 acc 62.891 (67.735)	Top-5 acc 84.375 (86.368)	lr 0.00020
Train [114][780/3239]	Time 0.228 (0.540)	Data Time 0.001 (0.051)	Loss 2.4042 (2.3401)	Entropy 0.53014 (0.52985)	Top-1 acc 64.062 (67.723)	Top-5 acc 86.328 (86.365)	lr 0.00020
Train [114][790/3239]	Time 0.235 (0.538)	Data Time 0.001 (0.050)	Loss 2.2306 (2.3404)	Entropy 0.53013 (0.52986)	Top-1 acc 70.312 (67.714)	Top-5 acc 88.281 (86.372)	lr 0.00020
Train [114][800/3239]	Time 0.226 (0.536)	Data Time 0.001 (0.049)	Loss 2.3303 (2.3404)	Entropy 0.52991 (0.52986)	Top-1 acc 64.844 (67.693)	Top-5 acc 87.500 (86.376)	lr 0.00019
Train [114][810/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.049)	Loss 2.3155 (2.3408)	Entropy 0.52967 (0.52986)	Top-1 acc 71.484 (67.687)	Top-5 acc 87.109 (86.373)	lr 0.00019
Train [114][820/3239]	Time 0.258 (0.533)	Data Time 0.001 (0.048)	Loss 2.2992 (2.3406)	Entropy 0.52980 (0.52986)	Top-1 acc 65.234 (67.689)	Top-5 acc 88.281 (86.373)	lr 0.00019
Train [114][830/3239]	Time 0.228 (0.532)	Data Time 0.001 (0.048)	Loss 2.2890 (2.3398)	Entropy 0.53008 (0.52986)	Top-1 acc 67.578 (67.696)	Top-5 acc 86.328 (86.385)	lr 0.00019
Train [114][840/3239]	Time 0.239 (0.530)	Data Time 0.001 (0.047)	Loss 2.3326 (2.3397)	Entropy 0.52997 (0.52986)	Top-1 acc 64.844 (67.705)	Top-5 acc 87.109 (86.391)	lr 0.00019
Train [114][850/3239]	Time 0.228 (0.529)	Data Time 0.001 (0.046)	Loss 2.2979 (2.3400)	Entropy 0.53007 (0.52986)	Top-1 acc 69.531 (67.682)	Top-5 acc 86.328 (86.382)	lr 0.00019
Train [114][860/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.046)	Loss 2.2966 (2.3400)	Entropy 0.53007 (0.52986)	Top-1 acc 72.656 (67.679)	Top-5 acc 87.109 (86.388)	lr 0.00019
Train [114][870/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.045)	Loss 2.4712 (2.3405)	Entropy 0.53028 (0.52987)	Top-1 acc 64.062 (67.662)	Top-5 acc 82.812 (86.377)	lr 0.00019
Train [114][880/3239]	Time 0.227 (0.525)	Data Time 0.001 (0.045)	Loss 2.3942 (2.3407)	Entropy 0.53043 (0.52987)	Top-1 acc 62.891 (67.648)	Top-5 acc 85.156 (86.365)	lr 0.00019
Train [114][890/3239]	Time 0.235 (0.524)	Data Time 0.001 (0.044)	Loss 2.3415 (2.3405)	Entropy 0.53040 (0.52988)	Top-1 acc 67.969 (67.657)	Top-5 acc 87.500 (86.370)	lr 0.00019
Train [114][900/3239]	Time 0.237 (0.523)	Data Time 0.001 (0.044)	Loss 2.1048 (2.3398)	Entropy 0.53033 (0.52988)	Top-1 acc 74.219 (67.675)	Top-5 acc 90.625 (86.384)	lr 0.00019
Train [114][910/3239]	Time 0.236 (0.522)	Data Time 0.001 (0.044)	Loss 2.2984 (2.3401)	Entropy 0.53033 (0.52989)	Top-1 acc 70.703 (67.663)	Top-5 acc 85.547 (86.373)	lr 0.00019
Train [114][920/3239]	Time 0.244 (0.521)	Data Time 0.001 (0.043)	Loss 2.2860 (2.3391)	Entropy 0.53044 (0.52989)	Top-1 acc 67.969 (67.699)	Top-5 acc 85.938 (86.387)	lr 0.00019
Train [114][930/3239]	Time 0.316 (0.520)	Data Time 0.001 (0.043)	Loss 2.2306 (2.3386)	Entropy 0.53019 (0.52990)	Top-1 acc 71.094 (67.710)	Top-5 acc 89.844 (86.395)	lr 0.00019
Train [114][940/3239]	Time 0.235 (0.519)	Data Time 0.001 (0.042)	Loss 2.2408 (2.3384)	Entropy 0.53027 (0.52990)	Top-1 acc 70.703 (67.711)	Top-5 acc 89.062 (86.395)	lr 0.00019
Train [114][950/3239]	Time 0.224 (0.518)	Data Time 0.001 (0.042)	Loss 2.3871 (2.3380)	Entropy 0.53062 (0.52991)	Top-1 acc 67.578 (67.728)	Top-5 acc 84.766 (86.407)	lr 0.00019
Train [114][960/3239]	Time 0.228 (0.517)	Data Time 0.001 (0.041)	Loss 2.3499 (2.3382)	Entropy 0.53093 (0.52992)	Top-1 acc 66.797 (67.728)	Top-5 acc 85.547 (86.408)	lr 0.00019
Train [114][970/3239]	Time 0.227 (0.516)	Data Time 0.001 (0.041)	Loss 2.4043 (2.3379)	Entropy 0.53098 (0.52993)	Top-1 acc 67.969 (67.739)	Top-5 acc 84.766 (86.415)	lr 0.00019
Train [114][980/3239]	Time 0.230 (0.515)	Data Time 0.001 (0.041)	Loss 2.5116 (2.3378)	Entropy 0.53055 (0.52994)	Top-1 acc 60.547 (67.739)	Top-5 acc 81.641 (86.412)	lr 0.00019
Train [114][990/3239]	Time 0.237 (0.514)	Data Time 0.001 (0.040)	Loss 2.1462 (2.3376)	Entropy 0.53072 (0.52994)	Top-1 acc 71.484 (67.752)	Top-5 acc 89.062 (86.411)	lr 0.00019
Train [114][1000/3239]	Time 0.323 (0.512)	Data Time 0.001 (0.040)	Loss 2.3558 (2.3389)	Entropy 0.53031 (0.52995)	Top-1 acc 69.531 (67.725)	Top-5 acc 83.594 (86.384)	lr 0.00019
Train [114][1010/3239]	Time 0.229 (0.511)	Data Time 0.001 (0.039)	Loss 2.3421 (2.3394)	Entropy 0.53059 (0.52995)	Top-1 acc 68.359 (67.713)	Top-5 acc 85.938 (86.375)	lr 0.00019
Train [114][1020/3239]	Time 0.231 (0.510)	Data Time 0.001 (0.039)	Loss 2.3595 (2.3395)	Entropy 0.53088 (0.52996)	Top-1 acc 67.188 (67.717)	Top-5 acc 83.594 (86.376)	lr 0.00019
Train [114][1030/3239]	Time 0.223 (0.509)	Data Time 0.001 (0.039)	Loss 2.3223 (2.3391)	Entropy 0.53092 (0.52997)	Top-1 acc 67.578 (67.727)	Top-5 acc 85.938 (86.377)	lr 0.00019
Train [114][1040/3239]	Time 0.231 (0.508)	Data Time 0.001 (0.038)	Loss 2.2364 (2.3396)	Entropy 0.53050 (0.52998)	Top-1 acc 70.312 (67.719)	Top-5 acc 86.719 (86.365)	lr 0.00019
Train [114][1050/3239]	Time 0.226 (0.507)	Data Time 0.001 (0.038)	Loss 2.3000 (2.3401)	Entropy 0.53050 (0.52998)	Top-1 acc 67.188 (67.706)	Top-5 acc 87.891 (86.356)	lr 0.00019
Train [114][1060/3239]	Time 0.249 (0.506)	Data Time 0.001 (0.038)	Loss 2.2443 (2.3401)	Entropy 0.53063 (0.52999)	Top-1 acc 66.016 (67.697)	Top-5 acc 88.672 (86.359)	lr 0.00019
Train [114][1070/3239]	Time 0.227 (0.505)	Data Time 0.001 (0.037)	Loss 2.6670 (2.3407)	Entropy 0.53105 (0.52999)	Top-1 acc 58.594 (67.683)	Top-5 acc 85.547 (86.347)	lr 0.00019
Train [114][1080/3239]	Time 0.243 (0.504)	Data Time 0.001 (0.037)	Loss 2.2713 (2.3407)	Entropy 0.53064 (0.53000)	Top-1 acc 71.484 (67.685)	Top-5 acc 88.281 (86.353)	lr 0.00019
Train [114][1090/3239]	Time 0.320 (0.503)	Data Time 0.001 (0.037)	Loss 2.3228 (2.3404)	Entropy 0.53039 (0.53001)	Top-1 acc 69.141 (67.696)	Top-5 acc 85.938 (86.355)	lr 0.00019
Train [114][1100/3239]	Time 0.241 (0.503)	Data Time 0.001 (0.036)	Loss 2.3415 (2.3405)	Entropy 0.53050 (0.53001)	Top-1 acc 69.922 (67.698)	Top-5 acc 84.375 (86.350)	lr 0.00019
Train [114][1110/3239]	Time 0.238 (0.502)	Data Time 0.001 (0.036)	Loss 2.3983 (2.3405)	Entropy 0.53062 (0.53002)	Top-1 acc 65.234 (67.696)	Top-5 acc 86.719 (86.357)	lr 0.00019
Train [114][1120/3239]	Time 0.255 (0.501)	Data Time 0.001 (0.036)	Loss 2.3426 (2.3406)	Entropy 0.53040 (0.53002)	Top-1 acc 68.359 (67.698)	Top-5 acc 87.500 (86.358)	lr 0.00019
Train [114][1130/3239]	Time 0.235 (0.500)	Data Time 0.001 (0.035)	Loss 2.6506 (2.3407)	Entropy 0.53033 (0.53002)	Top-1 acc 59.766 (67.701)	Top-5 acc 78.516 (86.356)	lr 0.00019
Train [114][1140/3239]	Time 0.278 (0.500)	Data Time 0.001 (0.035)	Loss 2.3511 (2.3411)	Entropy 0.53040 (0.53003)	Top-1 acc 69.141 (67.693)	Top-5 acc 86.719 (86.349)	lr 0.00019
Train [114][1150/3239]	Time 0.226 (0.499)	Data Time 0.002 (0.035)	Loss 2.4289 (2.3413)	Entropy 0.53025 (0.53003)	Top-1 acc 66.406 (67.694)	Top-5 acc 86.719 (86.350)	lr 0.00019
Train [114][1160/3239]	Time 0.325 (0.498)	Data Time 0.001 (0.034)	Loss 2.5486 (2.3413)	Entropy 0.53042 (0.53003)	Top-1 acc 60.547 (67.684)	Top-5 acc 83.594 (86.348)	lr 0.00019
Train [114][1170/3239]	Time 0.237 (0.497)	Data Time 0.001 (0.034)	Loss 2.5475 (2.3416)	Entropy 0.52997 (0.53003)	Top-1 acc 64.062 (67.677)	Top-5 acc 82.812 (86.340)	lr 0.00019
Train [114][1180/3239]	Time 0.281 (0.497)	Data Time 0.002 (0.034)	Loss 2.4479 (2.3415)	Entropy 0.52984 (0.53003)	Top-1 acc 62.500 (67.680)	Top-5 acc 84.375 (86.339)	lr 0.00019
Train [114][1190/3239]	Time 0.249 (0.497)	Data Time 0.001 (0.034)	Loss 2.4840 (2.3418)	Entropy 0.53002 (0.53003)	Top-1 acc 65.234 (67.676)	Top-5 acc 85.156 (86.335)	lr 0.00019
Train [114][1200/3239]	Time 0.228 (0.496)	Data Time 0.001 (0.033)	Loss 2.5141 (2.3419)	Entropy 0.53000 (0.53003)	Top-1 acc 60.156 (67.668)	Top-5 acc 83.984 (86.335)	lr 0.00019
Train [114][1210/3239]	Time 0.242 (0.496)	Data Time 0.001 (0.033)	Loss 2.2935 (2.3419)	Entropy 0.52986 (0.53003)	Top-1 acc 68.750 (67.667)	Top-5 acc 87.500 (86.337)	lr 0.00019
Train [114][1220/3239]	Time 0.223 (0.495)	Data Time 0.001 (0.033)	Loss 2.4651 (2.3418)	Entropy 0.53021 (0.53003)	Top-1 acc 66.016 (67.669)	Top-5 acc 84.375 (86.342)	lr 0.00019
Train [114][1230/3239]	Time 0.236 (0.494)	Data Time 0.001 (0.033)	Loss 2.3490 (2.3423)	Entropy 0.52990 (0.53003)	Top-1 acc 67.969 (67.652)	Top-5 acc 84.375 (86.328)	lr 0.00019
Train [114][1240/3239]	Time 0.232 (0.493)	Data Time 0.001 (0.032)	Loss 2.1879 (2.3429)	Entropy 0.52987 (0.53003)	Top-1 acc 73.047 (67.641)	Top-5 acc 87.891 (86.324)	lr 0.00019
Train [114][1250/3239]	Time 0.255 (0.492)	Data Time 0.001 (0.032)	Loss 2.2099 (2.3428)	Entropy 0.52979 (0.53003)	Top-1 acc 69.531 (67.643)	Top-5 acc 91.797 (86.334)	lr 0.00019
Train [114][1260/3239]	Time 0.231 (0.492)	Data Time 0.001 (0.032)	Loss 2.3275 (2.3428)	Entropy 0.52981 (0.53003)	Top-1 acc 71.484 (67.651)	Top-5 acc 85.938 (86.340)	lr 0.00019
Train [114][1270/3239]	Time 0.231 (0.491)	Data Time 0.001 (0.032)	Loss 2.3782 (2.3430)	Entropy 0.52976 (0.53003)	Top-1 acc 69.531 (67.650)	Top-5 acc 84.766 (86.338)	lr 0.00019
Train [114][1280/3239]	Time 0.242 (0.491)	Data Time 0.002 (0.031)	Loss 2.1770 (2.3423)	Entropy 0.52954 (0.53002)	Top-1 acc 72.266 (67.665)	Top-5 acc 92.969 (86.354)	lr 0.00019
Train [114][1290/3239]	Time 0.230 (0.490)	Data Time 0.001 (0.031)	Loss 2.7151 (2.3427)	Entropy 0.52960 (0.53002)	Top-1 acc 55.469 (67.653)	Top-5 acc 79.688 (86.344)	lr 0.00019
Train [114][1300/3239]	Time 0.220 (0.489)	Data Time 0.001 (0.031)	Loss 2.2973 (2.3425)	Entropy 0.53004 (0.53002)	Top-1 acc 68.359 (67.656)	Top-5 acc 89.062 (86.352)	lr 0.00019
Train [114][1310/3239]	Time 0.231 (0.528)	Data Time 0.002 (0.031)	Loss 2.3650 (2.3427)	Entropy 0.53005 (0.53002)	Top-1 acc 66.016 (67.657)	Top-5 acc 86.719 (86.348)	lr 0.00019
Train [114][1320/3239]	Time 0.362 (0.527)	Data Time 0.002 (0.030)	Loss 2.4737 (2.3424)	Entropy 0.53024 (0.53002)	Top-1 acc 63.281 (67.664)	Top-5 acc 83.203 (86.356)	lr 0.00019
Train [114][1330/3239]	Time 0.235 (0.527)	Data Time 0.001 (0.030)	Loss 2.1946 (2.3423)	Entropy 0.53066 (0.53002)	Top-1 acc 72.656 (67.664)	Top-5 acc 87.109 (86.358)	lr 0.00019
Train [114][1340/3239]	Time 0.248 (0.526)	Data Time 0.002 (0.030)	Loss 2.1895 (2.3424)	Entropy 0.53089 (0.53003)	Top-1 acc 73.047 (67.665)	Top-5 acc 88.672 (86.350)	lr 0.00019
Train [114][1350/3239]	Time 0.321 (0.525)	Data Time 0.003 (0.030)	Loss 2.2900 (2.3427)	Entropy 0.53092 (0.53003)	Top-1 acc 68.359 (67.665)	Top-5 acc 85.938 (86.341)	lr 0.00019
Train [114][1360/3239]	Time 0.249 (0.525)	Data Time 0.001 (0.030)	Loss 2.4352 (2.3426)	Entropy 0.53085 (0.53004)	Top-1 acc 64.453 (67.670)	Top-5 acc 85.156 (86.342)	lr 0.00019
Train [114][1370/3239]	Time 0.253 (0.525)	Data Time 0.001 (0.029)	Loss 2.5091 (2.3427)	Entropy 0.53091 (0.53005)	Top-1 acc 62.109 (67.672)	Top-5 acc 84.375 (86.340)	lr 0.00018
Train [114][1380/3239]	Time 0.243 (0.524)	Data Time 0.001 (0.029)	Loss 2.3934 (2.3429)	Entropy 0.53103 (0.53005)	Top-1 acc 69.141 (67.670)	Top-5 acc 85.938 (86.335)	lr 0.00018
Train [114][1390/3239]	Time 0.254 (0.523)	Data Time 0.001 (0.029)	Loss 2.3948 (2.3427)	Entropy 0.53083 (0.53006)	Top-1 acc 68.750 (67.677)	Top-5 acc 83.594 (86.339)	lr 0.00018
Train [114][1400/3239]	Time 0.235 (0.522)	Data Time 0.001 (0.029)	Loss 2.3271 (2.3429)	Entropy 0.53120 (0.53006)	Top-1 acc 70.312 (67.679)	Top-5 acc 87.109 (86.336)	lr 0.00018
Train [114][1410/3239]	Time 0.241 (0.521)	Data Time 0.001 (0.029)	Loss 2.3050 (2.3431)	Entropy 0.53131 (0.53007)	Top-1 acc 67.188 (67.674)	Top-5 acc 85.938 (86.334)	lr 0.00018
Train [114][1420/3239]	Time 0.258 (0.521)	Data Time 0.001 (0.028)	Loss 2.3292 (2.3430)	Entropy 0.53120 (0.53008)	Top-1 acc 69.141 (67.677)	Top-5 acc 87.109 (86.341)	lr 0.00018
Train [114][1430/3239]	Time 0.231 (0.520)	Data Time 0.001 (0.028)	Loss 2.2813 (2.3426)	Entropy 0.53126 (0.53009)	Top-1 acc 69.141 (67.677)	Top-5 acc 87.109 (86.346)	lr 0.00018
Train [114][1440/3239]	Time 0.219 (0.519)	Data Time 0.001 (0.028)	Loss 2.3534 (2.3431)	Entropy 0.53136 (0.53010)	Top-1 acc 70.703 (67.668)	Top-5 acc 86.328 (86.339)	lr 0.00018
Train [114][1450/3239]	Time 0.227 (0.518)	Data Time 0.001 (0.028)	Loss 2.3285 (2.3429)	Entropy 0.53122 (0.53011)	Top-1 acc 65.625 (67.669)	Top-5 acc 87.500 (86.340)	lr 0.00018
Train [114][1460/3239]	Time 0.230 (0.518)	Data Time 0.001 (0.028)	Loss 2.1433 (2.3430)	Entropy 0.53123 (0.53011)	Top-1 acc 77.344 (67.671)	Top-5 acc 88.672 (86.338)	lr 0.00018
Train [114][1470/3239]	Time 0.225 (0.517)	Data Time 0.001 (0.028)	Loss 2.2120 (2.3427)	Entropy 0.53172 (0.53012)	Top-1 acc 69.922 (67.675)	Top-5 acc 89.062 (86.342)	lr 0.00018
Train [114][1480/3239]	Time 0.327 (0.516)	Data Time 0.001 (0.027)	Loss 2.1335 (2.3427)	Entropy 0.53188 (0.53013)	Top-1 acc 71.484 (67.671)	Top-5 acc 91.016 (86.342)	lr 0.00018
Train [114][1490/3239]	Time 0.286 (0.516)	Data Time 0.001 (0.027)	Loss 2.1418 (2.3425)	Entropy 0.53213 (0.53014)	Top-1 acc 76.562 (67.677)	Top-5 acc 89.453 (86.341)	lr 0.00018
Train [114][1500/3239]	Time 0.222 (0.515)	Data Time 0.001 (0.027)	Loss 2.3183 (2.3425)	Entropy 0.53224 (0.53016)	Top-1 acc 70.312 (67.688)	Top-5 acc 87.891 (86.341)	lr 0.00018
Train [114][1510/3239]	Time 0.230 (0.514)	Data Time 0.001 (0.027)	Loss 2.2838 (2.3424)	Entropy 0.53232 (0.53017)	Top-1 acc 70.703 (67.683)	Top-5 acc 85.547 (86.347)	lr 0.00018
Train [114][1520/3239]	Time 0.235 (0.514)	Data Time 0.001 (0.027)	Loss 2.2178 (2.3421)	Entropy 0.53245 (0.53019)	Top-1 acc 73.828 (67.694)	Top-5 acc 86.328 (86.345)	lr 0.00018
Train [114][1530/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.027)	Loss 2.3314 (2.3417)	Entropy 0.53265 (0.53020)	Top-1 acc 67.188 (67.710)	Top-5 acc 85.547 (86.351)	lr 0.00018
Train [114][1540/3239]	Time 0.230 (0.513)	Data Time 0.001 (0.026)	Loss 2.2614 (2.3419)	Entropy 0.53224 (0.53022)	Top-1 acc 70.312 (67.701)	Top-5 acc 86.719 (86.349)	lr 0.00018
Train [114][1550/3239]	Time 0.333 (0.512)	Data Time 0.001 (0.026)	Loss 2.4067 (2.3418)	Entropy 0.53229 (0.53023)	Top-1 acc 66.797 (67.704)	Top-5 acc 84.375 (86.350)	lr 0.00018
Train [114][1560/3239]	Time 0.234 (0.512)	Data Time 0.001 (0.026)	Loss 2.2616 (2.3421)	Entropy 0.53255 (0.53024)	Top-1 acc 69.922 (67.692)	Top-5 acc 87.891 (86.349)	lr 0.00018
Train [114][1570/3239]	Time 0.229 (0.511)	Data Time 0.001 (0.026)	Loss 2.2009 (2.3419)	Entropy 0.53232 (0.53026)	Top-1 acc 73.828 (67.707)	Top-5 acc 88.281 (86.348)	lr 0.00018
Train [114][1580/3239]	Time 0.236 (0.510)	Data Time 0.001 (0.026)	Loss 2.4229 (2.3421)	Entropy 0.53267 (0.53027)	Top-1 acc 66.406 (67.701)	Top-5 acc 85.938 (86.344)	lr 0.00018
Train [114][1590/3239]	Time 0.257 (0.510)	Data Time 0.001 (0.026)	Loss 2.4461 (2.3423)	Entropy 0.53277 (0.53029)	Top-1 acc 65.234 (67.703)	Top-5 acc 85.156 (86.344)	lr 0.00018
Train [114][1600/3239]	Time 0.232 (0.509)	Data Time 0.001 (0.025)	Loss 2.1478 (2.3425)	Entropy 0.53281 (0.53030)	Top-1 acc 72.266 (67.704)	Top-5 acc 89.844 (86.340)	lr 0.00018
Train [114][1610/3239]	Time 0.220 (0.509)	Data Time 0.001 (0.025)	Loss 2.2273 (2.3422)	Entropy 0.53290 (0.53032)	Top-1 acc 68.359 (67.711)	Top-5 acc 89.844 (86.346)	lr 0.00018
Train [114][1620/3239]	Time 0.230 (0.508)	Data Time 0.001 (0.025)	Loss 2.3361 (2.3422)	Entropy 0.53324 (0.53034)	Top-1 acc 68.750 (67.716)	Top-5 acc 85.938 (86.346)	lr 0.00018
Train [114][1630/3239]	Time 0.275 (0.508)	Data Time 0.001 (0.025)	Loss 2.4878 (2.3424)	Entropy 0.53367 (0.53035)	Top-1 acc 63.672 (67.713)	Top-5 acc 84.766 (86.345)	lr 0.00018
Train [114][1640/3239]	Time 0.402 (0.508)	Data Time 0.001 (0.025)	Loss 2.5793 (2.3425)	Entropy 0.53347 (0.53037)	Top-1 acc 63.672 (67.711)	Top-5 acc 82.031 (86.346)	lr 0.00018
Train [114][1650/3239]	Time 0.220 (0.507)	Data Time 0.001 (0.025)	Loss 2.6042 (2.3426)	Entropy 0.53332 (0.53039)	Top-1 acc 61.719 (67.713)	Top-5 acc 78.906 (86.344)	lr 0.00018
Train [114][1660/3239]	Time 0.233 (0.506)	Data Time 0.001 (0.025)	Loss 2.5161 (2.3431)	Entropy 0.53341 (0.53041)	Top-1 acc 62.109 (67.698)	Top-5 acc 83.594 (86.336)	lr 0.00018
Train [114][1670/3239]	Time 0.229 (0.506)	Data Time 0.001 (0.024)	Loss 2.2948 (2.3434)	Entropy 0.53337 (0.53043)	Top-1 acc 66.406 (67.695)	Top-5 acc 87.500 (86.331)	lr 0.00018
Train [114][1680/3239]	Time 0.231 (0.505)	Data Time 0.001 (0.024)	Loss 2.2885 (2.3432)	Entropy 0.53350 (0.53045)	Top-1 acc 68.750 (67.703)	Top-5 acc 86.328 (86.332)	lr 0.00018
Train [114][1690/3239]	Time 0.228 (0.505)	Data Time 0.001 (0.024)	Loss 2.3748 (2.3432)	Entropy 0.53377 (0.53046)	Top-1 acc 65.625 (67.706)	Top-5 acc 87.109 (86.332)	lr 0.00018
Train [114][1700/3239]	Time 0.227 (0.504)	Data Time 0.001 (0.024)	Loss 2.3272 (2.3432)	Entropy 0.53376 (0.53048)	Top-1 acc 71.094 (67.707)	Top-5 acc 87.109 (86.333)	lr 0.00018
Train [114][1710/3239]	Time 0.323 (0.504)	Data Time 0.001 (0.024)	Loss 2.3467 (2.3430)	Entropy 0.53361 (0.53050)	Top-1 acc 66.406 (67.704)	Top-5 acc 87.109 (86.341)	lr 0.00018
Train [114][1720/3239]	Time 0.240 (0.503)	Data Time 0.001 (0.024)	Loss 2.3439 (2.3432)	Entropy 0.53343 (0.53052)	Top-1 acc 66.797 (67.699)	Top-5 acc 85.938 (86.338)	lr 0.00018
Train [114][1730/3239]	Time 0.217 (0.502)	Data Time 0.001 (0.024)	Loss 2.4411 (2.3433)	Entropy 0.53337 (0.53054)	Top-1 acc 66.016 (67.703)	Top-5 acc 85.547 (86.339)	lr 0.00018
Train [114][1740/3239]	Time 0.226 (0.502)	Data Time 0.001 (0.024)	Loss 2.6677 (2.3438)	Entropy 0.53366 (0.53055)	Top-1 acc 56.641 (67.695)	Top-5 acc 84.766 (86.334)	lr 0.00018
Train [114][1750/3239]	Time 0.232 (0.501)	Data Time 0.001 (0.023)	Loss 2.1627 (2.3437)	Entropy 0.53380 (0.53057)	Top-1 acc 73.438 (67.698)	Top-5 acc 89.453 (86.333)	lr 0.00018
Train [114][1760/3239]	Time 0.234 (0.501)	Data Time 0.001 (0.023)	Loss 2.4544 (2.3437)	Entropy 0.53394 (0.53059)	Top-1 acc 64.062 (67.697)	Top-5 acc 85.547 (86.329)	lr 0.00018
Train [114][1770/3239]	Time 0.238 (0.500)	Data Time 0.001 (0.023)	Loss 2.3585 (2.3440)	Entropy 0.53390 (0.53061)	Top-1 acc 68.359 (67.693)	Top-5 acc 87.109 (86.329)	lr 0.00018
Train [114][1780/3239]	Time 0.237 (0.500)	Data Time 0.001 (0.023)	Loss 2.4374 (2.3442)	Entropy 0.53371 (0.53063)	Top-1 acc 62.500 (67.687)	Top-5 acc 83.984 (86.326)	lr 0.00018
Train [114][1790/3239]	Time 0.243 (0.499)	Data Time 0.002 (0.023)	Loss 2.5181 (2.3442)	Entropy 0.53371 (0.53064)	Top-1 acc 63.672 (67.685)	Top-5 acc 82.031 (86.326)	lr 0.00018
Train [114][1800/3239]	Time 0.233 (0.499)	Data Time 0.001 (0.023)	Loss 2.3381 (2.3440)	Entropy 0.53381 (0.53066)	Top-1 acc 68.359 (67.685)	Top-5 acc 88.672 (86.331)	lr 0.00018
Train [114][1810/3239]	Time 0.228 (0.498)	Data Time 0.001 (0.023)	Loss 2.3921 (2.3441)	Entropy 0.53401 (0.53068)	Top-1 acc 66.016 (67.679)	Top-5 acc 85.547 (86.329)	lr 0.00018
Train [114][1820/3239]	Time 0.243 (0.498)	Data Time 0.001 (0.023)	Loss 2.2658 (2.3441)	Entropy 0.53383 (0.53070)	Top-1 acc 68.750 (67.675)	Top-5 acc 87.891 (86.329)	lr 0.00018
Train [114][1830/3239]	Time 0.224 (0.497)	Data Time 0.001 (0.022)	Loss 2.2218 (2.3439)	Entropy 0.53364 (0.53071)	Top-1 acc 70.312 (67.680)	Top-5 acc 87.500 (86.329)	lr 0.00018
Train [114][1840/3239]	Time 0.251 (0.497)	Data Time 0.001 (0.022)	Loss 2.1522 (2.3436)	Entropy 0.53379 (0.53073)	Top-1 acc 70.703 (67.686)	Top-5 acc 89.453 (86.335)	lr 0.00018
Train [114][1850/3239]	Time 0.236 (0.496)	Data Time 0.001 (0.022)	Loss 2.2856 (2.3441)	Entropy 0.53361 (0.53075)	Top-1 acc 67.188 (67.673)	Top-5 acc 89.453 (86.329)	lr 0.00018
Train [114][1860/3239]	Time 0.234 (0.496)	Data Time 0.001 (0.022)	Loss 2.1890 (2.3444)	Entropy 0.53355 (0.53076)	Top-1 acc 70.312 (67.665)	Top-5 acc 88.672 (86.327)	lr 0.00018
Train [114][1870/3239]	Time 0.330 (0.495)	Data Time 0.001 (0.022)	Loss 2.3316 (2.3440)	Entropy 0.53297 (0.53077)	Top-1 acc 69.531 (67.670)	Top-5 acc 84.375 (86.334)	lr 0.00018
Train [114][1880/3239]	Time 0.234 (0.495)	Data Time 0.001 (0.022)	Loss 2.3697 (2.3438)	Entropy 0.53281 (0.53079)	Top-1 acc 66.016 (67.674)	Top-5 acc 85.938 (86.339)	lr 0.00018
Train [114][1890/3239]	Time 0.221 (0.494)	Data Time 0.001 (0.022)	Loss 2.4798 (2.3440)	Entropy 0.53254 (0.53080)	Top-1 acc 67.578 (67.672)	Top-5 acc 84.375 (86.336)	lr 0.00018
Train [114][1900/3239]	Time 0.233 (0.494)	Data Time 0.001 (0.022)	Loss 2.3028 (2.3438)	Entropy 0.53278 (0.53081)	Top-1 acc 69.141 (67.683)	Top-5 acc 86.719 (86.339)	lr 0.00018
Train [114][1910/3239]	Time 0.224 (0.494)	Data Time 0.001 (0.022)	Loss 2.4255 (2.3439)	Entropy 0.53262 (0.53082)	Top-1 acc 65.234 (67.677)	Top-5 acc 86.328 (86.339)	lr 0.00018
Train [114][1920/3239]	Time 0.231 (0.493)	Data Time 0.001 (0.021)	Loss 2.2787 (2.3438)	Entropy 0.53247 (0.53083)	Top-1 acc 66.016 (67.678)	Top-5 acc 85.156 (86.336)	lr 0.00018
Train [114][1930/3239]	Time 0.222 (0.493)	Data Time 0.001 (0.021)	Loss 2.4340 (2.3443)	Entropy 0.53265 (0.53083)	Top-1 acc 64.062 (67.670)	Top-5 acc 85.938 (86.328)	lr 0.00018
Train [114][1940/3239]	Time 0.315 (0.492)	Data Time 0.001 (0.021)	Loss 2.3400 (2.3441)	Entropy 0.53273 (0.53084)	Top-1 acc 71.484 (67.674)	Top-5 acc 88.672 (86.332)	lr 0.00018
Train [114][1950/3239]	Time 0.229 (0.492)	Data Time 0.001 (0.021)	Loss 2.2527 (2.3438)	Entropy 0.53269 (0.53085)	Top-1 acc 67.578 (67.682)	Top-5 acc 89.453 (86.337)	lr 0.00017
Train [114][1960/3239]	Time 0.481 (0.517)	Data Time 0.029 (0.021)	Loss 2.2465 (2.3438)	Entropy 0.53248 (0.53086)	Top-1 acc 71.094 (67.683)	Top-5 acc 86.719 (86.339)	lr 0.00017
Train [114][1970/3239]	Time 0.234 (0.517)	Data Time 0.002 (0.021)	Loss 2.3669 (2.3437)	Entropy 0.53230 (0.53087)	Top-1 acc 67.188 (67.685)	Top-5 acc 85.938 (86.341)	lr 0.00017
Train [114][1980/3239]	Time 0.315 (0.516)	Data Time 0.002 (0.021)	Loss 2.1749 (2.3433)	Entropy 0.53262 (0.53088)	Top-1 acc 72.266 (67.692)	Top-5 acc 91.016 (86.348)	lr 0.00017
Train [114][1990/3239]	Time 0.225 (0.516)	Data Time 0.001 (0.021)	Loss 2.2237 (2.3434)	Entropy 0.53288 (0.53089)	Top-1 acc 69.922 (67.687)	Top-5 acc 87.109 (86.348)	lr 0.00017
Train [114][2000/3239]	Time 0.279 (0.515)	Data Time 0.003 (0.021)	Loss 2.3816 (2.3438)	Entropy 0.53309 (0.53090)	Top-1 acc 65.625 (67.670)	Top-5 acc 85.547 (86.343)	lr 0.00017
Train [114][2010/3239]	Time 0.288 (0.515)	Data Time 0.002 (0.021)	Loss 2.1918 (2.3438)	Entropy 0.53301 (0.53091)	Top-1 acc 67.969 (67.668)	Top-5 acc 90.625 (86.341)	lr 0.00017
Train [114][2020/3239]	Time 0.270 (0.515)	Data Time 0.001 (0.021)	Loss 2.1256 (2.3438)	Entropy 0.53320 (0.53092)	Top-1 acc 73.438 (67.674)	Top-5 acc 87.891 (86.340)	lr 0.00017
Train [114][2030/3239]	Time 0.330 (0.514)	Data Time 0.001 (0.020)	Loss 2.3257 (2.3440)	Entropy 0.53340 (0.53093)	Top-1 acc 66.406 (67.670)	Top-5 acc 86.328 (86.338)	lr 0.00017
Train [114][2040/3239]	Time 0.260 (0.514)	Data Time 0.001 (0.020)	Loss 2.2311 (2.3440)	Entropy 0.53335 (0.53094)	Top-1 acc 69.922 (67.670)	Top-5 acc 87.109 (86.341)	lr 0.00017
Train [114][2050/3239]	Time 0.252 (0.513)	Data Time 0.001 (0.020)	Loss 2.1305 (2.3440)	Entropy 0.53334 (0.53096)	Top-1 acc 70.312 (67.668)	Top-5 acc 88.281 (86.339)	lr 0.00017
Train [114][2060/3239]	Time 0.234 (0.513)	Data Time 0.001 (0.020)	Loss 2.3855 (2.3437)	Entropy 0.53361 (0.53097)	Top-1 acc 65.234 (67.677)	Top-5 acc 85.938 (86.340)	lr 0.00017
Train [114][2070/3239]	Time 0.239 (0.512)	Data Time 0.001 (0.020)	Loss 2.3997 (2.3437)	Entropy 0.53335 (0.53098)	Top-1 acc 68.750 (67.677)	Top-5 acc 85.938 (86.341)	lr 0.00017
Train [114][2080/3239]	Time 0.226 (0.512)	Data Time 0.001 (0.020)	Loss 2.5542 (2.3436)	Entropy 0.53327 (0.53099)	Top-1 acc 66.016 (67.679)	Top-5 acc 80.078 (86.340)	lr 0.00017
Train [114][2090/3239]	Time 0.230 (0.512)	Data Time 0.001 (0.020)	Loss 2.1549 (2.3435)	Entropy 0.53327 (0.53100)	Top-1 acc 74.609 (67.682)	Top-5 acc 89.453 (86.344)	lr 0.00017
Train [114][2100/3239]	Time 0.239 (0.511)	Data Time 0.001 (0.020)	Loss 2.3209 (2.3436)	Entropy 0.53288 (0.53101)	Top-1 acc 69.531 (67.679)	Top-5 acc 86.328 (86.342)	lr 0.00017
Train [114][2110/3239]	Time 0.229 (0.511)	Data Time 0.001 (0.020)	Loss 2.4460 (2.3437)	Entropy 0.53298 (0.53102)	Top-1 acc 61.328 (67.671)	Top-5 acc 84.766 (86.338)	lr 0.00017
Train [114][2120/3239]	Time 0.240 (0.510)	Data Time 0.001 (0.020)	Loss 2.3253 (2.3437)	Entropy 0.53312 (0.53103)	Top-1 acc 69.141 (67.669)	Top-5 acc 87.500 (86.339)	lr 0.00017
Train [114][2130/3239]	Time 0.228 (0.510)	Data Time 0.001 (0.020)	Loss 2.4409 (2.3440)	Entropy 0.53308 (0.53104)	Top-1 acc 64.844 (67.658)	Top-5 acc 85.547 (86.333)	lr 0.00017
Train [114][2140/3239]	Time 0.226 (0.509)	Data Time 0.001 (0.019)	Loss 2.4778 (2.3441)	Entropy 0.53269 (0.53105)	Top-1 acc 64.062 (67.657)	Top-5 acc 86.328 (86.333)	lr 0.00017
Train [114][2150/3239]	Time 0.223 (0.509)	Data Time 0.001 (0.019)	Loss 2.0336 (2.3438)	Entropy 0.53260 (0.53106)	Top-1 acc 73.047 (67.668)	Top-5 acc 91.016 (86.338)	lr 0.00017
Train [114][2160/3239]	Time 0.221 (0.508)	Data Time 0.001 (0.019)	Loss 2.6674 (2.3438)	Entropy 0.53251 (0.53106)	Top-1 acc 60.938 (67.667)	Top-5 acc 79.297 (86.339)	lr 0.00017
Train [114][2170/3239]	Time 0.227 (0.508)	Data Time 0.001 (0.019)	Loss 2.3070 (2.3436)	Entropy 0.53230 (0.53107)	Top-1 acc 67.578 (67.665)	Top-5 acc 86.719 (86.343)	lr 0.00017
Train [114][2180/3239]	Time 0.231 (0.507)	Data Time 0.001 (0.019)	Loss 2.5247 (2.3433)	Entropy 0.53250 (0.53108)	Top-1 acc 63.672 (67.674)	Top-5 acc 82.422 (86.349)	lr 0.00017
Train [114][2190/3239]	Time 0.327 (0.507)	Data Time 0.001 (0.019)	Loss 2.2995 (2.3438)	Entropy 0.53226 (0.53108)	Top-1 acc 68.359 (67.662)	Top-5 acc 87.500 (86.339)	lr 0.00017
Train [114][2200/3239]	Time 0.227 (0.506)	Data Time 0.001 (0.019)	Loss 2.5469 (2.3438)	Entropy 0.53255 (0.53109)	Top-1 acc 65.234 (67.665)	Top-5 acc 82.812 (86.339)	lr 0.00017
Train [114][2210/3239]	Time 0.231 (0.506)	Data Time 0.001 (0.019)	Loss 2.4688 (2.3436)	Entropy 0.53229 (0.53110)	Top-1 acc 65.234 (67.669)	Top-5 acc 85.156 (86.344)	lr 0.00017
Train [114][2220/3239]	Time 0.230 (0.506)	Data Time 0.001 (0.019)	Loss 2.3482 (2.3435)	Entropy 0.53241 (0.53110)	Top-1 acc 66.406 (67.667)	Top-5 acc 88.672 (86.349)	lr 0.00017
Train [114][2230/3239]	Time 0.234 (0.505)	Data Time 0.001 (0.019)	Loss 2.1454 (2.3437)	Entropy 0.53275 (0.53111)	Top-1 acc 69.531 (67.661)	Top-5 acc 88.672 (86.346)	lr 0.00017
Train [114][2240/3239]	Time 0.233 (0.505)	Data Time 0.001 (0.019)	Loss 2.3804 (2.3438)	Entropy 0.53290 (0.53112)	Top-1 acc 66.016 (67.654)	Top-5 acc 84.375 (86.344)	lr 0.00017
Train [114][2250/3239]	Time 0.328 (0.504)	Data Time 0.001 (0.019)	Loss 2.2838 (2.3436)	Entropy 0.53276 (0.53112)	Top-1 acc 72.266 (67.655)	Top-5 acc 87.891 (86.344)	lr 0.00017
Train [114][2260/3239]	Time 0.337 (0.504)	Data Time 0.001 (0.018)	Loss 2.3145 (2.3434)	Entropy 0.53261 (0.53113)	Top-1 acc 67.578 (67.656)	Top-5 acc 84.375 (86.348)	lr 0.00017
Train [114][2270/3239]	Time 0.241 (0.504)	Data Time 0.002 (0.018)	Loss 2.4755 (2.3438)	Entropy 0.53273 (0.53114)	Top-1 acc 64.844 (67.647)	Top-5 acc 85.547 (86.341)	lr 0.00017
Train [114][2280/3239]	Time 0.235 (0.504)	Data Time 0.001 (0.018)	Loss 2.2865 (2.3437)	Entropy 0.53283 (0.53114)	Top-1 acc 69.922 (67.653)	Top-5 acc 90.234 (86.343)	lr 0.00017
Train [114][2290/3239]	Time 0.232 (0.503)	Data Time 0.001 (0.018)	Loss 2.3752 (2.3440)	Entropy 0.53270 (0.53115)	Top-1 acc 65.234 (67.647)	Top-5 acc 87.109 (86.338)	lr 0.00017
Train [114][2300/3239]	Time 0.235 (0.503)	Data Time 0.002 (0.018)	Loss 2.3575 (2.3441)	Entropy 0.53312 (0.53116)	Top-1 acc 65.625 (67.642)	Top-5 acc 85.156 (86.338)	lr 0.00017
Train [114][2310/3239]	Time 0.254 (0.503)	Data Time 0.001 (0.018)	Loss 2.4402 (2.3441)	Entropy 0.53314 (0.53117)	Top-1 acc 64.453 (67.644)	Top-5 acc 86.719 (86.338)	lr 0.00017
Train [114][2320/3239]	Time 0.230 (0.502)	Data Time 0.001 (0.018)	Loss 2.3562 (2.3442)	Entropy 0.53346 (0.53118)	Top-1 acc 66.797 (67.647)	Top-5 acc 87.109 (86.335)	lr 0.00017
Train [114][2330/3239]	Time 0.236 (0.502)	Data Time 0.001 (0.018)	Loss 2.5142 (2.3440)	Entropy 0.53371 (0.53119)	Top-1 acc 64.062 (67.650)	Top-5 acc 80.859 (86.337)	lr 0.00017
Train [114][2340/3239]	Time 0.227 (0.501)	Data Time 0.001 (0.018)	Loss 2.2380 (2.3438)	Entropy 0.53381 (0.53120)	Top-1 acc 67.578 (67.655)	Top-5 acc 87.500 (86.339)	lr 0.00017
Train [114][2350/3239]	Time 0.326 (0.501)	Data Time 0.001 (0.018)	Loss 2.1867 (2.3440)	Entropy 0.53403 (0.53121)	Top-1 acc 70.703 (67.649)	Top-5 acc 90.625 (86.337)	lr 0.00017
Train [114][2360/3239]	Time 0.233 (0.501)	Data Time 0.001 (0.018)	Loss 2.3050 (2.3439)	Entropy 0.53413 (0.53122)	Top-1 acc 67.969 (67.652)	Top-5 acc 88.281 (86.342)	lr 0.00017
Train [114][2370/3239]	Time 0.238 (0.500)	Data Time 0.001 (0.018)	Loss 2.3558 (2.3437)	Entropy 0.53389 (0.53123)	Top-1 acc 68.750 (67.661)	Top-5 acc 86.719 (86.346)	lr 0.00017
Train [114][2380/3239]	Time 0.228 (0.500)	Data Time 0.001 (0.018)	Loss 2.2344 (2.3439)	Entropy 0.53408 (0.53124)	Top-1 acc 72.656 (67.659)	Top-5 acc 89.062 (86.344)	lr 0.00017
Train [114][2390/3239]	Time 0.260 (0.500)	Data Time 0.001 (0.018)	Loss 2.4266 (2.3439)	Entropy 0.53398 (0.53126)	Top-1 acc 67.188 (67.659)	Top-5 acc 86.328 (86.345)	lr 0.00017
Train [114][2400/3239]	Time 0.234 (0.499)	Data Time 0.001 (0.018)	Loss 2.5165 (2.3441)	Entropy 0.53388 (0.53127)	Top-1 acc 62.891 (67.652)	Top-5 acc 85.547 (86.343)	lr 0.00017
Train [114][2410/3239]	Time 0.228 (0.499)	Data Time 0.001 (0.017)	Loss 2.2251 (2.3440)	Entropy 0.53389 (0.53128)	Top-1 acc 72.266 (67.653)	Top-5 acc 88.281 (86.345)	lr 0.00017
Train [114][2420/3239]	Time 0.326 (0.498)	Data Time 0.001 (0.017)	Loss 2.1677 (2.3440)	Entropy 0.53354 (0.53129)	Top-1 acc 75.000 (67.661)	Top-5 acc 89.062 (86.344)	lr 0.00017
Train [114][2430/3239]	Time 0.226 (0.498)	Data Time 0.001 (0.017)	Loss 2.6474 (2.3443)	Entropy 0.53332 (0.53130)	Top-1 acc 59.375 (67.654)	Top-5 acc 82.422 (86.337)	lr 0.00017
Train [114][2440/3239]	Time 0.233 (0.498)	Data Time 0.001 (0.017)	Loss 2.2795 (2.3444)	Entropy 0.53340 (0.53131)	Top-1 acc 68.750 (67.648)	Top-5 acc 85.547 (86.335)	lr 0.00017
Train [114][2450/3239]	Time 0.230 (0.497)	Data Time 0.001 (0.017)	Loss 2.2998 (2.3441)	Entropy 0.53326 (0.53131)	Top-1 acc 66.797 (67.655)	Top-5 acc 87.891 (86.343)	lr 0.00017
Train [114][2460/3239]	Time 0.236 (0.497)	Data Time 0.001 (0.017)	Loss 2.3287 (2.3439)	Entropy 0.53322 (0.53132)	Top-1 acc 69.922 (67.658)	Top-5 acc 85.547 (86.344)	lr 0.00017
Train [114][2470/3239]	Time 0.228 (0.496)	Data Time 0.001 (0.017)	Loss 2.3621 (2.3444)	Entropy 0.53328 (0.53133)	Top-1 acc 66.016 (67.651)	Top-5 acc 85.938 (86.336)	lr 0.00017
Train [114][2480/3239]	Time 0.239 (0.496)	Data Time 0.001 (0.017)	Loss 2.3553 (2.3442)	Entropy 0.53318 (0.53134)	Top-1 acc 69.141 (67.654)	Top-5 acc 85.938 (86.340)	lr 0.00017
Train [114][2490/3239]	Time 0.232 (0.496)	Data Time 0.001 (0.017)	Loss 2.3520 (2.3444)	Entropy 0.53327 (0.53135)	Top-1 acc 66.016 (67.652)	Top-5 acc 85.156 (86.336)	lr 0.00017
Train [114][2500/3239]	Time 0.239 (0.495)	Data Time 0.001 (0.017)	Loss 2.1165 (2.3446)	Entropy 0.53333 (0.53135)	Top-1 acc 74.219 (67.649)	Top-5 acc 89.844 (86.336)	lr 0.00017
Train [114][2510/3239]	Time 0.247 (0.495)	Data Time 0.001 (0.017)	Loss 2.3112 (2.3446)	Entropy 0.53352 (0.53136)	Top-1 acc 67.578 (67.646)	Top-5 acc 87.500 (86.336)	lr 0.00017
Train [114][2520/3239]	Time 0.230 (0.495)	Data Time 0.001 (0.017)	Loss 2.5789 (2.3447)	Entropy 0.53378 (0.53137)	Top-1 acc 62.891 (67.644)	Top-5 acc 82.422 (86.337)	lr 0.00017
Train [114][2530/3239]	Time 0.231 (0.494)	Data Time 0.001 (0.017)	Loss 2.2713 (2.3446)	Entropy 0.53354 (0.53138)	Top-1 acc 70.312 (67.646)	Top-5 acc 88.672 (86.339)	lr 0.00017
Train [114][2540/3239]	Time 0.247 (0.494)	Data Time 0.001 (0.017)	Loss 2.4667 (2.3446)	Entropy 0.53346 (0.53139)	Top-1 acc 63.672 (67.648)	Top-5 acc 85.938 (86.338)	lr 0.00017
Train [114][2550/3239]	Time 0.241 (0.494)	Data Time 0.001 (0.017)	Loss 2.2573 (2.3448)	Entropy 0.53346 (0.53140)	Top-1 acc 70.703 (67.645)	Top-5 acc 87.500 (86.333)	lr 0.00016
Train [114][2560/3239]	Time 0.242 (0.493)	Data Time 0.001 (0.017)	Loss 2.1661 (2.3448)	Entropy 0.53348 (0.53140)	Top-1 acc 73.047 (67.645)	Top-5 acc 87.891 (86.332)	lr 0.00016
Train [114][2570/3239]	Time 0.238 (0.493)	Data Time 0.001 (0.016)	Loss 2.7435 (2.3448)	Entropy 0.53324 (0.53141)	Top-1 acc 55.859 (67.642)	Top-5 acc 78.516 (86.330)	lr 0.00016
Train [114][2580/3239]	Time 0.329 (0.493)	Data Time 0.001 (0.016)	Loss 2.3209 (2.3448)	Entropy 0.53285 (0.53142)	Top-1 acc 68.359 (67.638)	Top-5 acc 85.547 (86.331)	lr 0.00016
Train [114][2590/3239]	Time 0.239 (0.492)	Data Time 0.001 (0.016)	Loss 2.1120 (2.3445)	Entropy 0.53260 (0.53142)	Top-1 acc 69.531 (67.644)	Top-5 acc 89.453 (86.334)	lr 0.00016
Train [114][2600/3239]	Time 0.234 (0.492)	Data Time 0.001 (0.016)	Loss 2.1996 (2.3445)	Entropy 0.53261 (0.53143)	Top-1 acc 73.047 (67.644)	Top-5 acc 87.500 (86.332)	lr 0.00016
Train [114][2610/3239]	Time 0.229 (0.492)	Data Time 0.001 (0.016)	Loss 2.3552 (2.3445)	Entropy 0.53235 (0.53143)	Top-1 acc 68.359 (67.651)	Top-5 acc 86.328 (86.333)	lr 0.00016
Train [114][2620/3239]	Time 0.309 (0.510)	Data Time 0.002 (0.016)	Loss 2.3789 (2.3443)	Entropy 0.53176 (0.53144)	Top-1 acc 66.016 (67.656)	Top-5 acc 85.156 (86.333)	lr 0.00016
Train [114][2630/3239]	Time 0.235 (0.510)	Data Time 0.002 (0.016)	Loss 2.3055 (2.3444)	Entropy 0.53178 (0.53144)	Top-1 acc 69.531 (67.652)	Top-5 acc 89.453 (86.334)	lr 0.00016
Train [114][2640/3239]	Time 0.226 (0.510)	Data Time 0.001 (0.016)	Loss 2.3253 (2.3445)	Entropy 0.53195 (0.53144)	Top-1 acc 68.359 (67.647)	Top-5 acc 85.156 (86.329)	lr 0.00016
Train [114][2650/3239]	Time 0.357 (0.509)	Data Time 0.001 (0.016)	Loss 2.4116 (2.3445)	Entropy 0.53207 (0.53144)	Top-1 acc 63.672 (67.649)	Top-5 acc 85.156 (86.328)	lr 0.00016
Train [114][2660/3239]	Time 0.241 (0.509)	Data Time 0.001 (0.016)	Loss 2.1806 (2.3442)	Entropy 0.53207 (0.53144)	Top-1 acc 71.484 (67.655)	Top-5 acc 87.891 (86.333)	lr 0.00016
Train [114][2670/3239]	Time 0.241 (0.508)	Data Time 0.001 (0.016)	Loss 2.3425 (2.3443)	Entropy 0.53239 (0.53145)	Top-1 acc 69.141 (67.649)	Top-5 acc 84.375 (86.331)	lr 0.00016
Train [114][2680/3239]	Time 0.243 (0.508)	Data Time 0.001 (0.016)	Loss 2.1643 (2.3441)	Entropy 0.53236 (0.53145)	Top-1 acc 74.609 (67.656)	Top-5 acc 89.062 (86.335)	lr 0.00016
Train [114][2690/3239]	Time 0.245 (0.508)	Data Time 0.001 (0.016)	Loss 2.3062 (2.3442)	Entropy 0.53254 (0.53145)	Top-1 acc 70.312 (67.654)	Top-5 acc 87.891 (86.335)	lr 0.00016
Train [114][2700/3239]	Time 0.236 (0.508)	Data Time 0.001 (0.016)	Loss 2.2125 (2.3441)	Entropy 0.53250 (0.53146)	Top-1 acc 73.828 (67.658)	Top-5 acc 87.891 (86.337)	lr 0.00016
Train [114][2710/3239]	Time 0.227 (0.507)	Data Time 0.001 (0.016)	Loss 2.2570 (2.3438)	Entropy 0.53254 (0.53146)	Top-1 acc 71.094 (67.663)	Top-5 acc 85.938 (86.341)	lr 0.00016
Train [114][2720/3239]	Time 0.269 (0.507)	Data Time 0.001 (0.016)	Loss 2.4990 (2.3437)	Entropy 0.53225 (0.53146)	Top-1 acc 62.891 (67.660)	Top-5 acc 82.812 (86.344)	lr 0.00016
Train [114][2730/3239]	Time 0.230 (0.507)	Data Time 0.001 (0.016)	Loss 2.2273 (2.3438)	Entropy 0.53169 (0.53147)	Top-1 acc 70.312 (67.657)	Top-5 acc 89.453 (86.341)	lr 0.00016
Train [114][2740/3239]	Time 0.322 (0.506)	Data Time 0.001 (0.016)	Loss 2.1841 (2.3436)	Entropy 0.53181 (0.53147)	Top-1 acc 70.312 (67.666)	Top-5 acc 91.406 (86.345)	lr 0.00016
Train [114][2750/3239]	Time 0.225 (0.506)	Data Time 0.001 (0.016)	Loss 2.4025 (2.3435)	Entropy 0.53187 (0.53147)	Top-1 acc 66.016 (67.665)	Top-5 acc 85.938 (86.347)	lr 0.00016
Train [114][2760/3239]	Time 0.222 (0.506)	Data Time 0.001 (0.015)	Loss 2.3198 (2.3434)	Entropy 0.53190 (0.53147)	Top-1 acc 70.703 (67.669)	Top-5 acc 87.500 (86.350)	lr 0.00016
Train [114][2770/3239]	Time 0.228 (0.505)	Data Time 0.001 (0.015)	Loss 2.2217 (2.3433)	Entropy 0.53180 (0.53147)	Top-1 acc 71.875 (67.672)	Top-5 acc 86.328 (86.353)	lr 0.00016
Train [114][2780/3239]	Time 0.232 (0.505)	Data Time 0.001 (0.015)	Loss 2.1753 (2.3431)	Entropy 0.53179 (0.53147)	Top-1 acc 73.828 (67.678)	Top-5 acc 87.500 (86.353)	lr 0.00016
Train [114][2790/3239]	Time 0.228 (0.505)	Data Time 0.001 (0.015)	Loss 2.2479 (2.3432)	Entropy 0.53153 (0.53147)	Top-1 acc 65.625 (67.676)	Top-5 acc 88.672 (86.350)	lr 0.00016
Train [114][2800/3239]	Time 0.230 (0.504)	Data Time 0.001 (0.015)	Loss 2.2459 (2.3429)	Entropy 0.53172 (0.53147)	Top-1 acc 70.312 (67.680)	Top-5 acc 89.062 (86.354)	lr 0.00016
Train [114][2810/3239]	Time 0.338 (0.504)	Data Time 0.001 (0.015)	Loss 2.1901 (2.3429)	Entropy 0.53198 (0.53147)	Top-1 acc 69.922 (67.676)	Top-5 acc 87.891 (86.356)	lr 0.00016
Train [114][2820/3239]	Time 0.238 (0.504)	Data Time 0.001 (0.015)	Loss 2.3824 (2.3429)	Entropy 0.53222 (0.53148)	Top-1 acc 66.406 (67.673)	Top-5 acc 85.938 (86.359)	lr 0.00016
Train [114][2830/3239]	Time 0.233 (0.503)	Data Time 0.001 (0.015)	Loss 2.2116 (2.3430)	Entropy 0.53247 (0.53148)	Top-1 acc 73.438 (67.674)	Top-5 acc 87.891 (86.355)	lr 0.00016
Train [114][2840/3239]	Time 0.269 (0.503)	Data Time 0.001 (0.015)	Loss 2.3230 (2.3432)	Entropy 0.53249 (0.53148)	Top-1 acc 70.703 (67.670)	Top-5 acc 86.719 (86.354)	lr 0.00016
Train [114][2850/3239]	Time 0.228 (0.503)	Data Time 0.001 (0.015)	Loss 2.4136 (2.3432)	Entropy 0.53226 (0.53149)	Top-1 acc 67.578 (67.669)	Top-5 acc 84.766 (86.353)	lr 0.00016
Train [114][2860/3239]	Time 0.236 (0.502)	Data Time 0.001 (0.015)	Loss 2.1514 (2.3429)	Entropy 0.53234 (0.53149)	Top-1 acc 69.922 (67.675)	Top-5 acc 88.672 (86.358)	lr 0.00016
Train [114][2870/3239]	Time 0.251 (0.502)	Data Time 0.001 (0.015)	Loss 2.1122 (2.3428)	Entropy 0.53245 (0.53149)	Top-1 acc 71.875 (67.673)	Top-5 acc 90.234 (86.359)	lr 0.00016
Train [114][2880/3239]	Time 0.261 (0.502)	Data Time 0.001 (0.015)	Loss 2.2016 (2.3428)	Entropy 0.53243 (0.53150)	Top-1 acc 72.266 (67.674)	Top-5 acc 87.109 (86.359)	lr 0.00016
Train [114][2890/3239]	Time 0.251 (0.502)	Data Time 0.001 (0.015)	Loss 2.1915 (2.3428)	Entropy 0.53251 (0.53150)	Top-1 acc 70.312 (67.671)	Top-5 acc 88.281 (86.358)	lr 0.00016
Train [114][2900/3239]	Time 0.414 (0.501)	Data Time 0.002 (0.015)	Loss 2.5828 (2.3428)	Entropy 0.53263 (0.53150)	Top-1 acc 60.938 (67.671)	Top-5 acc 83.203 (86.359)	lr 0.00016
Train [114][2910/3239]	Time 0.268 (0.501)	Data Time 0.001 (0.015)	Loss 2.4585 (2.3430)	Entropy 0.53289 (0.53151)	Top-1 acc 67.969 (67.668)	Top-5 acc 83.594 (86.355)	lr 0.00016
Train [114][2920/3239]	Time 0.253 (0.501)	Data Time 0.001 (0.015)	Loss 2.6130 (2.3432)	Entropy 0.53283 (0.53151)	Top-1 acc 63.281 (67.667)	Top-5 acc 80.859 (86.352)	lr 0.00016
Train [114][2930/3239]	Time 0.226 (0.501)	Data Time 0.001 (0.015)	Loss 2.3907 (2.3432)	Entropy 0.53245 (0.53152)	Top-1 acc 65.234 (67.668)	Top-5 acc 84.375 (86.352)	lr 0.00016
Train [114][2940/3239]	Time 0.241 (0.500)	Data Time 0.001 (0.015)	Loss 2.2146 (2.3432)	Entropy 0.53255 (0.53152)	Top-1 acc 70.703 (67.669)	Top-5 acc 88.281 (86.353)	lr 0.00016
Train [114][2950/3239]	Time 0.253 (0.500)	Data Time 0.002 (0.015)	Loss 2.1342 (2.3430)	Entropy 0.53239 (0.53152)	Top-1 acc 72.266 (67.674)	Top-5 acc 89.844 (86.357)	lr 0.00016
Train [114][2960/3239]	Time 0.228 (0.500)	Data Time 0.001 (0.015)	Loss 2.2313 (2.3429)	Entropy 0.53237 (0.53153)	Top-1 acc 71.484 (67.678)	Top-5 acc 85.156 (86.357)	lr 0.00016
Train [114][2970/3239]	Time 0.335 (0.499)	Data Time 0.001 (0.014)	Loss 2.3685 (2.3426)	Entropy 0.53263 (0.53153)	Top-1 acc 65.625 (67.681)	Top-5 acc 86.719 (86.363)	lr 0.00016
Train [114][2980/3239]	Time 0.228 (0.499)	Data Time 0.001 (0.014)	Loss 2.4426 (2.3427)	Entropy 0.53276 (0.53153)	Top-1 acc 64.844 (67.681)	Top-5 acc 83.984 (86.365)	lr 0.00016
Train [114][2990/3239]	Time 0.235 (0.499)	Data Time 0.001 (0.014)	Loss 2.3946 (2.3426)	Entropy 0.53204 (0.53154)	Top-1 acc 65.625 (67.682)	Top-5 acc 86.719 (86.368)	lr 0.00016
Train [114][3000/3239]	Time 0.270 (0.498)	Data Time 0.001 (0.014)	Loss 2.2607 (2.3427)	Entropy 0.53211 (0.53154)	Top-1 acc 69.922 (67.680)	Top-5 acc 87.891 (86.364)	lr 0.00016
Train [114][3010/3239]	Time 0.232 (0.498)	Data Time 0.002 (0.014)	Loss 2.3926 (2.3428)	Entropy 0.53209 (0.53154)	Top-1 acc 64.844 (67.678)	Top-5 acc 86.328 (86.362)	lr 0.00016
Train [114][3020/3239]	Time 0.242 (0.498)	Data Time 0.002 (0.014)	Loss 2.3146 (2.3425)	Entropy 0.53228 (0.53154)	Top-1 acc 68.359 (67.684)	Top-5 acc 87.891 (86.367)	lr 0.00016
Train [114][3030/3239]	Time 0.264 (0.498)	Data Time 0.002 (0.014)	Loss 2.1350 (2.3424)	Entropy 0.53221 (0.53154)	Top-1 acc 74.219 (67.687)	Top-5 acc 90.234 (86.372)	lr 0.00016
Train [114][3040/3239]	Time 0.249 (0.498)	Data Time 0.001 (0.014)	Loss 2.1863 (2.3423)	Entropy 0.53217 (0.53155)	Top-1 acc 70.703 (67.688)	Top-5 acc 89.062 (86.374)	lr 0.00016
Train [114][3050/3239]	Time 0.247 (0.497)	Data Time 0.001 (0.014)	Loss 2.2415 (2.3423)	Entropy 0.53156 (0.53155)	Top-1 acc 72.266 (67.691)	Top-5 acc 89.453 (86.375)	lr 0.00016
Train [114][3060/3239]	Time 0.258 (0.497)	Data Time 0.001 (0.014)	Loss 2.5101 (2.3424)	Entropy 0.53172 (0.53155)	Top-1 acc 62.500 (67.689)	Top-5 acc 83.203 (86.375)	lr 0.00016
Train [114][3070/3239]	Time 0.231 (0.497)	Data Time 0.001 (0.014)	Loss 2.3041 (2.3423)	Entropy 0.53186 (0.53155)	Top-1 acc 66.016 (67.691)	Top-5 acc 87.109 (86.375)	lr 0.00016
Train [114][3080/3239]	Time 0.282 (0.497)	Data Time 0.001 (0.014)	Loss 2.2117 (2.3421)	Entropy 0.53137 (0.53155)	Top-1 acc 70.312 (67.695)	Top-5 acc 87.891 (86.376)	lr 0.00016
Train [114][3090/3239]	Time 0.248 (0.497)	Data Time 0.001 (0.014)	Loss 2.2838 (2.3421)	Entropy 0.53148 (0.53155)	Top-1 acc 68.750 (67.696)	Top-5 acc 85.156 (86.378)	lr 0.00016
Train [114][3100/3239]	Time 0.238 (0.496)	Data Time 0.001 (0.014)	Loss 2.2770 (2.3421)	Entropy 0.53161 (0.53155)	Top-1 acc 68.359 (67.697)	Top-5 acc 85.547 (86.376)	lr 0.00016
Train [114][3110/3239]	Time 0.254 (0.496)	Data Time 0.002 (0.014)	Loss 2.4197 (2.3420)	Entropy 0.53157 (0.53155)	Top-1 acc 66.797 (67.699)	Top-5 acc 85.156 (86.378)	lr 0.00016
Train [114][3120/3239]	Time 0.235 (0.496)	Data Time 0.001 (0.014)	Loss 2.2848 (2.3420)	Entropy 0.53185 (0.53155)	Top-1 acc 71.484 (67.699)	Top-5 acc 87.891 (86.378)	lr 0.00016
Train [114][3130/3239]	Time 0.327 (0.496)	Data Time 0.001 (0.014)	Loss 2.0735 (2.3420)	Entropy 0.53184 (0.53155)	Top-1 acc 75.000 (67.702)	Top-5 acc 91.406 (86.375)	lr 0.00016
Train [114][3140/3239]	Time 0.231 (0.495)	Data Time 0.001 (0.014)	Loss 2.6685 (2.3422)	Entropy 0.53201 (0.53155)	Top-1 acc 57.422 (67.695)	Top-5 acc 83.203 (86.373)	lr 0.00016
Train [114][3150/3239]	Time 0.259 (0.495)	Data Time 0.001 (0.014)	Loss 2.4305 (2.3422)	Entropy 0.53177 (0.53155)	Top-1 acc 66.797 (67.696)	Top-5 acc 85.938 (86.374)	lr 0.00016
Train [114][3160/3239]	Time 0.240 (0.495)	Data Time 0.001 (0.014)	Loss 2.2774 (2.3423)	Entropy 0.53148 (0.53155)	Top-1 acc 70.312 (67.692)	Top-5 acc 85.938 (86.374)	lr 0.00016
Train [114][3170/3239]	Time 0.231 (0.495)	Data Time 0.001 (0.014)	Loss 2.2748 (2.3421)	Entropy 0.53168 (0.53155)	Top-1 acc 64.844 (67.697)	Top-5 acc 87.891 (86.376)	lr 0.00016
Train [114][3180/3239]	Time 0.232 (0.494)	Data Time 0.000 (0.014)	Loss 2.1684 (2.3420)	Entropy 0.53195 (0.53155)	Top-1 acc 70.312 (67.701)	Top-5 acc 89.844 (86.379)	lr 0.00015
Train [114][3190/3239]	Time 0.255 (0.494)	Data Time 0.000 (0.014)	Loss 2.2420 (2.3421)	Entropy 0.53243 (0.53155)	Top-1 acc 72.656 (67.703)	Top-5 acc 87.891 (86.379)	lr 0.00015
Train [114][3200/3239]	Time 0.314 (0.493)	Data Time 0.000 (0.014)	Loss 2.2725 (2.3419)	Entropy 0.53259 (0.53156)	Top-1 acc 68.359 (67.704)	Top-5 acc 87.500 (86.382)	lr 0.00015
Train [114][3210/3239]	Time 0.227 (0.493)	Data Time 0.000 (0.014)	Loss 2.1147 (2.3418)	Entropy 0.53259 (0.53156)	Top-1 acc 74.219 (67.705)	Top-5 acc 89.844 (86.384)	lr 0.00015
Train [114][3220/3239]	Time 0.222 (0.493)	Data Time 0.000 (0.014)	Loss 2.1862 (2.3417)	Entropy 0.53264 (0.53156)	Top-1 acc 74.219 (67.710)	Top-5 acc 89.844 (86.387)	lr 0.00015
Train [114][3230/3239]	Time 0.259 (0.492)	Data Time 0.000 (0.013)	Loss 2.3677 (2.3416)	Entropy 0.53271 (0.53157)	Top-1 acc 66.406 (67.712)	Top-5 acc 84.766 (86.389)	lr 0.00015
Train [114][3239/3239]	Time 0.917 (0.492)	Data Time 0.000 (0.013)	Loss 2.5255 (2.3417)	Entropy 0.53282 (0.53157)	Top-1 acc 61.728 (67.708)	Top-5 acc 85.185 (86.387)	lr 0.00015
==========Valid [114/120]	loss 1.170	top-1 acc 72.929 (73.154)	top-5 acc 90.623	Train top-1 67.708	top-5 86.387	Entropy 0.53282	Latency-None: 0.000ms	Flops: 539.00M
Train [115][0/3239]	Time 37.584 (37.584)	Data Time 36.221 (36.221)	Loss 2.2137 (2.2137)	Entropy 0.53278 (0.53278)	Top-1 acc 71.484 (71.484)	Top-5 acc 87.109 (87.109)	lr 0.00015
Train [115][10/3239]	Time 0.224 (3.932)	Data Time 0.001 (3.295)	Loss 2.6356 (2.3741)	Entropy 0.53319 (0.53290)	Top-1 acc 62.500 (67.152)	Top-5 acc 82.031 (86.328)	lr 0.00015
Train [115][20/3239]	Time 0.230 (2.246)	Data Time 0.001 (1.727)	Loss 2.6171 (2.3548)	Entropy 0.53294 (0.53301)	Top-1 acc 60.156 (67.801)	Top-5 acc 80.859 (86.384)	lr 0.00015
Train [115][30/3239]	Time 0.468 (3.278)	Data Time 0.006 (1.170)	Loss 2.2858 (2.3281)	Entropy 0.53308 (0.53299)	Top-1 acc 67.969 (68.347)	Top-5 acc 91.016 (86.757)	lr 0.00015
Train [115][40/3239]	Time 0.225 (2.593)	Data Time 0.002 (0.886)	Loss 2.3250 (2.3217)	Entropy 0.53318 (0.53303)	Top-1 acc 67.578 (68.645)	Top-5 acc 88.281 (86.785)	lr 0.00015
Train [115][50/3239]	Time 0.229 (2.162)	Data Time 0.001 (0.712)	Loss 2.2188 (2.3266)	Entropy 0.53282 (0.53302)	Top-1 acc 69.922 (68.421)	Top-5 acc 88.672 (86.803)	lr 0.00015
Train [115][60/3239]	Time 0.265 (1.878)	Data Time 0.001 (0.596)	Loss 2.6207 (2.3355)	Entropy 0.53282 (0.53299)	Top-1 acc 60.938 (68.180)	Top-5 acc 81.641 (86.584)	lr 0.00015
Train [115][70/3239]	Time 0.232 (1.671)	Data Time 0.001 (0.512)	Loss 2.0798 (2.3363)	Entropy 0.53281 (0.53297)	Top-1 acc 75.391 (68.315)	Top-5 acc 90.625 (86.581)	lr 0.00015
Train [115][80/3239]	Time 0.227 (1.517)	Data Time 0.001 (0.449)	Loss 2.3748 (2.3393)	Entropy 0.53273 (0.53294)	Top-1 acc 65.234 (68.123)	Top-5 acc 87.500 (86.540)	lr 0.00015
Train [115][90/3239]	Time 0.224 (1.393)	Data Time 0.001 (0.400)	Loss 2.2533 (2.3387)	Entropy 0.53256 (0.53291)	Top-1 acc 69.141 (68.063)	Top-5 acc 89.844 (86.573)	lr 0.00015
Train [115][100/3239]	Time 0.212 (1.296)	Data Time 0.001 (0.361)	Loss 2.3730 (2.3390)	Entropy 0.53262 (0.53287)	Top-1 acc 66.016 (67.988)	Top-5 acc 85.938 (86.564)	lr 0.00015
Train [115][110/3239]	Time 0.230 (1.217)	Data Time 0.001 (0.328)	Loss 2.2647 (2.3319)	Entropy 0.53286 (0.53285)	Top-1 acc 67.578 (68.120)	Top-5 acc 87.891 (86.624)	lr 0.00015
Train [115][120/3239]	Time 0.255 (1.151)	Data Time 0.001 (0.301)	Loss 2.3904 (2.3346)	Entropy 0.53283 (0.53286)	Top-1 acc 64.453 (67.962)	Top-5 acc 85.156 (86.580)	lr 0.00015
Train [115][130/3239]	Time 0.237 (1.094)	Data Time 0.001 (0.278)	Loss 2.3399 (2.3338)	Entropy 0.53297 (0.53285)	Top-1 acc 70.703 (67.987)	Top-5 acc 85.938 (86.576)	lr 0.00015
Train [115][140/3239]	Time 0.232 (1.046)	Data Time 0.001 (0.259)	Loss 2.3312 (2.3371)	Entropy 0.53316 (0.53287)	Top-1 acc 67.578 (67.866)	Top-5 acc 88.281 (86.511)	lr 0.00015
Train [115][150/3239]	Time 0.281 (1.005)	Data Time 0.002 (0.242)	Loss 2.5135 (2.3426)	Entropy 0.53314 (0.53289)	Top-1 acc 63.672 (67.741)	Top-5 acc 85.156 (86.388)	lr 0.00015
Train [115][160/3239]	Time 0.233 (0.971)	Data Time 0.001 (0.227)	Loss 2.3974 (2.3429)	Entropy 0.53328 (0.53291)	Top-1 acc 66.797 (67.719)	Top-5 acc 84.766 (86.379)	lr 0.00015
Train [115][170/3239]	Time 0.225 (0.938)	Data Time 0.001 (0.214)	Loss 2.2759 (2.3395)	Entropy 0.53293 (0.53293)	Top-1 acc 69.141 (67.777)	Top-5 acc 87.891 (86.424)	lr 0.00015
Train [115][180/3239]	Time 0.269 (0.910)	Data Time 0.001 (0.202)	Loss 2.4398 (2.3375)	Entropy 0.53290 (0.53292)	Top-1 acc 65.234 (67.848)	Top-5 acc 83.984 (86.473)	lr 0.00015
Train [115][190/3239]	Time 0.381 (0.886)	Data Time 0.001 (0.191)	Loss 2.3773 (2.3353)	Entropy 0.53318 (0.53292)	Top-1 acc 66.016 (67.879)	Top-5 acc 85.156 (86.518)	lr 0.00015
Train [115][200/3239]	Time 0.227 (0.863)	Data Time 0.001 (0.182)	Loss 2.1412 (2.3360)	Entropy 0.53291 (0.53293)	Top-1 acc 73.047 (67.850)	Top-5 acc 92.188 (86.522)	lr 0.00015
Train [115][210/3239]	Time 0.223 (0.842)	Data Time 0.002 (0.173)	Loss 2.5599 (2.3363)	Entropy 0.53291 (0.53292)	Top-1 acc 64.844 (67.872)	Top-5 acc 85.156 (86.523)	lr 0.00015
Train [115][220/3239]	Time 0.230 (0.822)	Data Time 0.001 (0.166)	Loss 2.1521 (2.3375)	Entropy 0.53285 (0.53292)	Top-1 acc 72.266 (67.820)	Top-5 acc 88.672 (86.487)	lr 0.00015
Train [115][230/3239]	Time 0.228 (0.804)	Data Time 0.001 (0.159)	Loss 2.1407 (2.3346)	Entropy 0.53299 (0.53292)	Top-1 acc 72.266 (67.886)	Top-5 acc 88.672 (86.541)	lr 0.00015
Train [115][240/3239]	Time 0.234 (0.788)	Data Time 0.001 (0.152)	Loss 2.5174 (2.3348)	Entropy 0.53328 (0.53293)	Top-1 acc 63.281 (67.889)	Top-5 acc 84.375 (86.526)	lr 0.00015
Train [115][250/3239]	Time 0.230 (0.773)	Data Time 0.001 (0.146)	Loss 2.1921 (2.3314)	Entropy 0.53322 (0.53294)	Top-1 acc 67.578 (67.980)	Top-5 acc 89.844 (86.591)	lr 0.00015
Train [115][260/3239]	Time 0.326 (0.759)	Data Time 0.001 (0.141)	Loss 2.1502 (2.3324)	Entropy 0.53325 (0.53295)	Top-1 acc 72.656 (67.948)	Top-5 acc 89.062 (86.566)	lr 0.00015
Train [115][270/3239]	Time 0.226 (0.746)	Data Time 0.001 (0.135)	Loss 2.2834 (2.3308)	Entropy 0.53289 (0.53296)	Top-1 acc 64.062 (67.975)	Top-5 acc 87.109 (86.579)	lr 0.00015
Train [115][280/3239]	Time 0.258 (0.734)	Data Time 0.001 (0.131)	Loss 2.3996 (2.3303)	Entropy 0.53319 (0.53296)	Top-1 acc 66.016 (67.992)	Top-5 acc 85.547 (86.578)	lr 0.00015
Train [115][290/3239]	Time 0.260 (0.724)	Data Time 0.001 (0.126)	Loss 2.1499 (2.3303)	Entropy 0.53299 (0.53296)	Top-1 acc 71.094 (67.997)	Top-5 acc 87.109 (86.554)	lr 0.00015
Train [115][300/3239]	Time 0.229 (0.712)	Data Time 0.001 (0.122)	Loss 2.4196 (2.3304)	Entropy 0.53274 (0.53296)	Top-1 acc 64.453 (67.996)	Top-5 acc 85.547 (86.555)	lr 0.00015
Train [115][310/3239]	Time 0.273 (0.704)	Data Time 0.002 (0.118)	Loss 2.2580 (2.3302)	Entropy 0.53286 (0.53295)	Top-1 acc 69.531 (68.005)	Top-5 acc 87.891 (86.549)	lr 0.00015
Train [115][320/3239]	Time 0.234 (0.695)	Data Time 0.001 (0.115)	Loss 2.2352 (2.3309)	Entropy 0.53298 (0.53295)	Top-1 acc 71.094 (68.003)	Top-5 acc 90.625 (86.546)	lr 0.00015
Train [115][330/3239]	Time 0.282 (0.686)	Data Time 0.001 (0.111)	Loss 2.3303 (2.3310)	Entropy 0.53314 (0.53295)	Top-1 acc 67.188 (67.986)	Top-5 acc 85.938 (86.546)	lr 0.00015
Train [115][340/3239]	Time 0.224 (0.678)	Data Time 0.001 (0.108)	Loss 2.4116 (2.3298)	Entropy 0.53316 (0.53295)	Top-1 acc 66.406 (68.037)	Top-5 acc 85.156 (86.578)	lr 0.00015
Train [115][350/3239]	Time 0.317 (0.671)	Data Time 0.001 (0.105)	Loss 2.3808 (2.3333)	Entropy 0.53323 (0.53296)	Top-1 acc 68.750 (67.992)	Top-5 acc 86.328 (86.508)	lr 0.00015
Train [115][360/3239]	Time 0.230 (0.664)	Data Time 0.001 (0.102)	Loss 2.3129 (2.3328)	Entropy 0.53314 (0.53297)	Top-1 acc 66.406 (67.998)	Top-5 acc 87.891 (86.521)	lr 0.00015
Train [115][370/3239]	Time 0.226 (0.657)	Data Time 0.001 (0.099)	Loss 2.2655 (2.3342)	Entropy 0.53315 (0.53297)	Top-1 acc 68.750 (67.987)	Top-5 acc 90.625 (86.500)	lr 0.00015
Train [115][380/3239]	Time 0.246 (0.651)	Data Time 0.002 (0.097)	Loss 2.3342 (2.3347)	Entropy 0.53312 (0.53298)	Top-1 acc 70.312 (67.977)	Top-5 acc 84.766 (86.508)	lr 0.00015
Train [115][390/3239]	Time 0.228 (0.645)	Data Time 0.001 (0.094)	Loss 2.3714 (2.3359)	Entropy 0.53291 (0.53298)	Top-1 acc 66.406 (67.944)	Top-5 acc 85.938 (86.484)	lr 0.00015
Train [115][400/3239]	Time 0.225 (0.639)	Data Time 0.001 (0.092)	Loss 2.2255 (2.3370)	Entropy 0.53287 (0.53298)	Top-1 acc 71.875 (67.909)	Top-5 acc 88.672 (86.472)	lr 0.00015
Train [115][410/3239]	Time 0.232 (0.633)	Data Time 0.001 (0.090)	Loss 2.3741 (2.3374)	Entropy 0.53324 (0.53298)	Top-1 acc 67.188 (67.869)	Top-5 acc 87.500 (86.461)	lr 0.00015
Train [115][420/3239]	Time 0.309 (0.627)	Data Time 0.001 (0.088)	Loss 2.4575 (2.3377)	Entropy 0.53326 (0.53299)	Top-1 acc 65.234 (67.862)	Top-5 acc 89.062 (86.473)	lr 0.00015
Train [115][430/3239]	Time 0.226 (0.622)	Data Time 0.001 (0.086)	Loss 2.3668 (2.3393)	Entropy 0.53335 (0.53299)	Top-1 acc 67.578 (67.826)	Top-5 acc 88.672 (86.451)	lr 0.00015
Train [115][440/3239]	Time 0.238 (0.617)	Data Time 0.002 (0.084)	Loss 2.4609 (2.3390)	Entropy 0.53337 (0.53300)	Top-1 acc 66.016 (67.831)	Top-5 acc 85.156 (86.466)	lr 0.00015
Train [115][450/3239]	Time 0.243 (0.613)	Data Time 0.001 (0.082)	Loss 2.4940 (2.3404)	Entropy 0.53313 (0.53300)	Top-1 acc 58.984 (67.786)	Top-5 acc 85.156 (86.455)	lr 0.00015
Train [115][460/3239]	Time 0.231 (0.609)	Data Time 0.001 (0.080)	Loss 2.2576 (2.3392)	Entropy 0.53331 (0.53301)	Top-1 acc 69.922 (67.840)	Top-5 acc 90.234 (86.480)	lr 0.00015
Train [115][470/3239]	Time 0.249 (0.605)	Data Time 0.001 (0.079)	Loss 2.3801 (2.3407)	Entropy 0.53314 (0.53302)	Top-1 acc 61.719 (67.787)	Top-5 acc 85.156 (86.444)	lr 0.00015
Train [115][480/3239]	Time 0.240 (0.601)	Data Time 0.001 (0.077)	Loss 2.2475 (2.3402)	Entropy 0.53311 (0.53302)	Top-1 acc 66.797 (67.816)	Top-5 acc 88.672 (86.442)	lr 0.00015
Train [115][490/3239]	Time 0.236 (0.598)	Data Time 0.001 (0.076)	Loss 2.3015 (2.3402)	Entropy 0.53304 (0.53302)	Top-1 acc 69.531 (67.814)	Top-5 acc 88.281 (86.446)	lr 0.00015
Train [115][500/3239]	Time 0.245 (0.594)	Data Time 0.001 (0.074)	Loss 2.3399 (2.3406)	Entropy 0.53302 (0.53302)	Top-1 acc 69.922 (67.800)	Top-5 acc 84.375 (86.442)	lr 0.00015
Train [115][510/3239]	Time 0.342 (0.592)	Data Time 0.001 (0.073)	Loss 2.3378 (2.3414)	Entropy 0.53238 (0.53301)	Top-1 acc 69.922 (67.791)	Top-5 acc 86.719 (86.431)	lr 0.00015
Train [115][520/3239]	Time 0.239 (0.588)	Data Time 0.001 (0.071)	Loss 2.4688 (2.3415)	Entropy 0.53245 (0.53300)	Top-1 acc 69.531 (67.795)	Top-5 acc 83.984 (86.429)	lr 0.00015
Train [115][530/3239]	Time 0.235 (0.585)	Data Time 0.001 (0.070)	Loss 2.2996 (2.3412)	Entropy 0.53241 (0.53299)	Top-1 acc 66.406 (67.777)	Top-5 acc 86.719 (86.437)	lr 0.00015
Train [115][540/3239]	Time 0.230 (0.581)	Data Time 0.001 (0.069)	Loss 2.1659 (2.3408)	Entropy 0.53264 (0.53298)	Top-1 acc 71.484 (67.782)	Top-5 acc 91.797 (86.448)	lr 0.00015
Train [115][550/3239]	Time 0.232 (0.578)	Data Time 0.001 (0.067)	Loss 2.3330 (2.3430)	Entropy 0.53282 (0.53298)	Top-1 acc 64.453 (67.718)	Top-5 acc 86.328 (86.419)	lr 0.00015
Train [115][560/3239]	Time 0.261 (0.575)	Data Time 0.002 (0.066)	Loss 2.2967 (2.3440)	Entropy 0.53268 (0.53297)	Top-1 acc 70.703 (67.680)	Top-5 acc 86.719 (86.400)	lr 0.00015
Train [115][570/3239]	Time 0.278 (0.572)	Data Time 0.001 (0.065)	Loss 2.1730 (2.3445)	Entropy 0.53271 (0.53297)	Top-1 acc 74.219 (67.679)	Top-5 acc 88.672 (86.388)	lr 0.00015
Train [115][580/3239]	Time 0.317 (0.570)	Data Time 0.001 (0.064)	Loss 2.2031 (2.3466)	Entropy 0.53259 (0.53296)	Top-1 acc 71.484 (67.618)	Top-5 acc 87.891 (86.350)	lr 0.00014
Train [115][590/3239]	Time 0.228 (0.567)	Data Time 0.001 (0.063)	Loss 2.4336 (2.3466)	Entropy 0.53242 (0.53295)	Top-1 acc 62.891 (67.604)	Top-5 acc 84.766 (86.348)	lr 0.00014
Train [115][600/3239]	Time 0.227 (0.564)	Data Time 0.001 (0.062)	Loss 2.5073 (2.3468)	Entropy 0.53235 (0.53294)	Top-1 acc 63.281 (67.591)	Top-5 acc 84.375 (86.345)	lr 0.00014
Train [115][610/3239]	Time 0.232 (0.562)	Data Time 0.002 (0.061)	Loss 2.4841 (2.3465)	Entropy 0.53216 (0.53293)	Top-1 acc 66.016 (67.601)	Top-5 acc 82.812 (86.339)	lr 0.00014
Train [115][620/3239]	Time 0.230 (0.559)	Data Time 0.001 (0.060)	Loss 2.2015 (2.3465)	Entropy 0.53230 (0.53292)	Top-1 acc 69.922 (67.588)	Top-5 acc 89.844 (86.346)	lr 0.00014
Train [115][630/3239]	Time 0.225 (0.557)	Data Time 0.001 (0.059)	Loss 2.2621 (2.3462)	Entropy 0.53251 (0.53291)	Top-1 acc 69.531 (67.593)	Top-5 acc 88.672 (86.354)	lr 0.00014
Train [115][640/3239]	Time 0.223 (0.554)	Data Time 0.001 (0.058)	Loss 2.3550 (2.3465)	Entropy 0.53223 (0.53290)	Top-1 acc 66.797 (67.573)	Top-5 acc 87.109 (86.360)	lr 0.00014
Train [115][650/3239]	Time 0.228 (0.552)	Data Time 0.001 (0.057)	Loss 2.2951 (2.3457)	Entropy 0.53231 (0.53289)	Top-1 acc 67.188 (67.599)	Top-5 acc 88.281 (86.380)	lr 0.00014
Train [115][660/3239]	Time 0.221 (0.550)	Data Time 0.001 (0.057)	Loss 2.3142 (2.3463)	Entropy 0.53225 (0.53288)	Top-1 acc 67.188 (67.589)	Top-5 acc 88.672 (86.362)	lr 0.00014
Train [115][670/3239]	Time 0.245 (0.548)	Data Time 0.001 (0.056)	Loss 2.4053 (2.3463)	Entropy 0.53223 (0.53288)	Top-1 acc 67.188 (67.588)	Top-5 acc 85.156 (86.365)	lr 0.00014
Train [115][680/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.055)	Loss 2.3092 (2.3459)	Entropy 0.53251 (0.53287)	Top-1 acc 69.922 (67.588)	Top-5 acc 86.719 (86.381)	lr 0.00014
Train [115][690/3239]	Time 0.410 (0.619)	Data Time 0.006 (0.054)	Loss 2.2877 (2.3459)	Entropy 0.53192 (0.53286)	Top-1 acc 69.922 (67.587)	Top-5 acc 87.109 (86.368)	lr 0.00014
Train [115][700/3239]	Time 0.231 (0.616)	Data Time 0.002 (0.053)	Loss 2.1938 (2.3452)	Entropy 0.53202 (0.53285)	Top-1 acc 75.000 (67.605)	Top-5 acc 89.453 (86.373)	lr 0.00014
Train [115][710/3239]	Time 0.230 (0.613)	Data Time 0.001 (0.053)	Loss 2.3390 (2.3455)	Entropy 0.53216 (0.53284)	Top-1 acc 68.359 (67.601)	Top-5 acc 87.109 (86.373)	lr 0.00014
Train [115][720/3239]	Time 0.233 (0.611)	Data Time 0.001 (0.052)	Loss 2.3511 (2.3459)	Entropy 0.53236 (0.53283)	Top-1 acc 66.406 (67.589)	Top-5 acc 85.938 (86.369)	lr 0.00014
Train [115][730/3239]	Time 0.229 (0.608)	Data Time 0.001 (0.051)	Loss 2.4091 (2.3462)	Entropy 0.53248 (0.53282)	Top-1 acc 67.188 (67.596)	Top-5 acc 86.328 (86.364)	lr 0.00014
Train [115][740/3239]	Time 0.343 (0.606)	Data Time 0.001 (0.051)	Loss 2.7163 (2.3465)	Entropy 0.53181 (0.53281)	Top-1 acc 58.594 (67.581)	Top-5 acc 83.984 (86.361)	lr 0.00014
Train [115][750/3239]	Time 0.226 (0.603)	Data Time 0.001 (0.050)	Loss 2.3205 (2.3460)	Entropy 0.53189 (0.53280)	Top-1 acc 67.969 (67.600)	Top-5 acc 86.719 (86.374)	lr 0.00014
Train [115][760/3239]	Time 0.232 (0.601)	Data Time 0.001 (0.049)	Loss 2.3934 (2.3455)	Entropy 0.53205 (0.53279)	Top-1 acc 65.625 (67.607)	Top-5 acc 86.719 (86.375)	lr 0.00014
Train [115][770/3239]	Time 0.225 (0.598)	Data Time 0.001 (0.049)	Loss 2.8945 (2.3460)	Entropy 0.53211 (0.53278)	Top-1 acc 53.906 (67.610)	Top-5 acc 78.516 (86.363)	lr 0.00014
Train [115][780/3239]	Time 0.237 (0.596)	Data Time 0.001 (0.048)	Loss 2.8537 (2.3483)	Entropy 0.53215 (0.53277)	Top-1 acc 58.203 (67.563)	Top-5 acc 77.344 (86.319)	lr 0.00014
Train [115][790/3239]	Time 0.229 (0.594)	Data Time 0.001 (0.048)	Loss 2.3436 (2.3483)	Entropy 0.53212 (0.53276)	Top-1 acc 67.578 (67.554)	Top-5 acc 87.500 (86.332)	lr 0.00014
Train [115][800/3239]	Time 0.234 (0.591)	Data Time 0.001 (0.047)	Loss 2.3165 (2.3483)	Entropy 0.53198 (0.53275)	Top-1 acc 69.531 (67.558)	Top-5 acc 85.938 (86.331)	lr 0.00014
Train [115][810/3239]	Time 0.245 (0.589)	Data Time 0.001 (0.046)	Loss 2.7576 (2.3487)	Entropy 0.53229 (0.53275)	Top-1 acc 58.984 (67.558)	Top-5 acc 78.125 (86.320)	lr 0.00014
Train [115][820/3239]	Time 0.233 (0.587)	Data Time 0.001 (0.046)	Loss 2.2132 (2.3488)	Entropy 0.53239 (0.53274)	Top-1 acc 71.484 (67.553)	Top-5 acc 87.891 (86.321)	lr 0.00014
Train [115][830/3239]	Time 0.248 (0.585)	Data Time 0.001 (0.045)	Loss 2.2376 (2.3481)	Entropy 0.53237 (0.53274)	Top-1 acc 71.094 (67.576)	Top-5 acc 88.672 (86.334)	lr 0.00014
Train [115][840/3239]	Time 0.238 (0.583)	Data Time 0.001 (0.045)	Loss 2.3270 (2.3473)	Entropy 0.53274 (0.53273)	Top-1 acc 67.969 (67.600)	Top-5 acc 85.938 (86.336)	lr 0.00014
Train [115][850/3239]	Time 0.228 (0.581)	Data Time 0.001 (0.044)	Loss 2.3909 (2.3476)	Entropy 0.53235 (0.53273)	Top-1 acc 68.750 (67.596)	Top-5 acc 85.547 (86.330)	lr 0.00014
Train [115][860/3239]	Time 0.228 (0.579)	Data Time 0.001 (0.044)	Loss 2.3662 (2.3476)	Entropy 0.53229 (0.53273)	Top-1 acc 67.578 (67.594)	Top-5 acc 86.328 (86.337)	lr 0.00014
Train [115][870/3239]	Time 0.241 (0.577)	Data Time 0.001 (0.043)	Loss 2.6533 (2.3478)	Entropy 0.53239 (0.53272)	Top-1 acc 58.594 (67.576)	Top-5 acc 80.859 (86.334)	lr 0.00014
Train [115][880/3239]	Time 0.285 (0.576)	Data Time 0.001 (0.043)	Loss 2.2204 (2.3474)	Entropy 0.53222 (0.53272)	Top-1 acc 69.141 (67.599)	Top-5 acc 88.281 (86.342)	lr 0.00014
Train [115][890/3239]	Time 0.247 (0.574)	Data Time 0.001 (0.042)	Loss 2.3235 (2.3478)	Entropy 0.53203 (0.53271)	Top-1 acc 65.625 (67.587)	Top-5 acc 89.062 (86.341)	lr 0.00014
Train [115][900/3239]	Time 0.321 (0.572)	Data Time 0.001 (0.042)	Loss 2.6104 (2.3480)	Entropy 0.53216 (0.53271)	Top-1 acc 61.328 (67.571)	Top-5 acc 81.250 (86.335)	lr 0.00014
Train [115][910/3239]	Time 0.226 (0.571)	Data Time 0.001 (0.042)	Loss 2.3407 (2.3475)	Entropy 0.53225 (0.53270)	Top-1 acc 66.016 (67.584)	Top-5 acc 83.203 (86.337)	lr 0.00014
Train [115][920/3239]	Time 0.237 (0.569)	Data Time 0.001 (0.041)	Loss 2.2963 (2.3475)	Entropy 0.53206 (0.53270)	Top-1 acc 70.312 (67.588)	Top-5 acc 86.719 (86.335)	lr 0.00014
Train [115][930/3239]	Time 0.236 (0.567)	Data Time 0.002 (0.041)	Loss 2.4165 (2.3477)	Entropy 0.53213 (0.53269)	Top-1 acc 63.281 (67.577)	Top-5 acc 84.766 (86.334)	lr 0.00014
Train [115][940/3239]	Time 0.287 (0.566)	Data Time 0.002 (0.040)	Loss 2.3098 (2.3475)	Entropy 0.53244 (0.53268)	Top-1 acc 71.094 (67.576)	Top-5 acc 85.156 (86.343)	lr 0.00014
Train [115][950/3239]	Time 0.278 (0.566)	Data Time 0.002 (0.040)	Loss 2.4264 (2.3469)	Entropy 0.53244 (0.53268)	Top-1 acc 64.453 (67.590)	Top-5 acc 84.766 (86.349)	lr 0.00014
Train [115][960/3239]	Time 0.227 (0.565)	Data Time 0.001 (0.039)	Loss 2.2813 (2.3467)	Entropy 0.53223 (0.53268)	Top-1 acc 67.578 (67.603)	Top-5 acc 86.328 (86.351)	lr 0.00014
Train [115][970/3239]	Time 0.322 (0.563)	Data Time 0.001 (0.039)	Loss 2.3847 (2.3465)	Entropy 0.53213 (0.53267)	Top-1 acc 67.969 (67.609)	Top-5 acc 87.109 (86.365)	lr 0.00014
Train [115][980/3239]	Time 0.228 (0.562)	Data Time 0.001 (0.039)	Loss 2.1799 (2.3464)	Entropy 0.53236 (0.53267)	Top-1 acc 69.922 (67.604)	Top-5 acc 90.625 (86.364)	lr 0.00014
Train [115][990/3239]	Time 0.246 (0.560)	Data Time 0.001 (0.038)	Loss 2.3895 (2.3469)	Entropy 0.53220 (0.53267)	Top-1 acc 68.750 (67.597)	Top-5 acc 83.594 (86.349)	lr 0.00014
Train [115][1000/3239]	Time 0.272 (0.559)	Data Time 0.002 (0.038)	Loss 2.3100 (2.3470)	Entropy 0.53176 (0.53266)	Top-1 acc 67.188 (67.595)	Top-5 acc 87.891 (86.349)	lr 0.00014
Train [115][1010/3239]	Time 0.230 (0.558)	Data Time 0.001 (0.038)	Loss 2.2452 (2.3467)	Entropy 0.53151 (0.53265)	Top-1 acc 67.969 (67.597)	Top-5 acc 87.500 (86.355)	lr 0.00014
Train [115][1020/3239]	Time 0.230 (0.556)	Data Time 0.001 (0.037)	Loss 2.3986 (2.3472)	Entropy 0.53172 (0.53264)	Top-1 acc 66.797 (67.582)	Top-5 acc 85.156 (86.345)	lr 0.00014
Train [115][1030/3239]	Time 0.226 (0.555)	Data Time 0.001 (0.037)	Loss 2.5384 (2.3473)	Entropy 0.53178 (0.53263)	Top-1 acc 63.281 (67.576)	Top-5 acc 83.984 (86.340)	lr 0.00014
Train [115][1040/3239]	Time 0.223 (0.553)	Data Time 0.001 (0.037)	Loss 2.6991 (2.3475)	Entropy 0.53193 (0.53262)	Top-1 acc 60.156 (67.573)	Top-5 acc 78.906 (86.335)	lr 0.00014
Train [115][1050/3239]	Time 0.231 (0.552)	Data Time 0.001 (0.036)	Loss 2.4008 (2.3470)	Entropy 0.53141 (0.53261)	Top-1 acc 66.797 (67.575)	Top-5 acc 85.547 (86.341)	lr 0.00014
Train [115][1060/3239]	Time 0.358 (0.551)	Data Time 0.001 (0.036)	Loss 2.1294 (2.3466)	Entropy 0.53180 (0.53260)	Top-1 acc 72.266 (67.587)	Top-5 acc 93.359 (86.354)	lr 0.00014
Train [115][1070/3239]	Time 0.242 (0.549)	Data Time 0.002 (0.036)	Loss 2.2535 (2.3465)	Entropy 0.53197 (0.53260)	Top-1 acc 71.484 (67.596)	Top-5 acc 90.234 (86.361)	lr 0.00014
Train [115][1080/3239]	Time 0.231 (0.548)	Data Time 0.001 (0.035)	Loss 2.4465 (2.3467)	Entropy 0.53170 (0.53259)	Top-1 acc 64.453 (67.589)	Top-5 acc 86.328 (86.365)	lr 0.00014
Train [115][1090/3239]	Time 0.238 (0.547)	Data Time 0.001 (0.035)	Loss 2.3505 (2.3464)	Entropy 0.53199 (0.53258)	Top-1 acc 66.016 (67.599)	Top-5 acc 86.328 (86.368)	lr 0.00014
Train [115][1100/3239]	Time 0.241 (0.546)	Data Time 0.001 (0.035)	Loss 2.2775 (2.3469)	Entropy 0.53172 (0.53258)	Top-1 acc 67.969 (67.584)	Top-5 acc 87.109 (86.353)	lr 0.00014
Train [115][1110/3239]	Time 0.240 (0.545)	Data Time 0.001 (0.034)	Loss 2.5357 (2.3474)	Entropy 0.53144 (0.53257)	Top-1 acc 60.938 (67.567)	Top-5 acc 83.984 (86.343)	lr 0.00014
Train [115][1120/3239]	Time 0.237 (0.543)	Data Time 0.001 (0.034)	Loss 2.3582 (2.3473)	Entropy 0.53165 (0.53256)	Top-1 acc 67.578 (67.579)	Top-5 acc 84.766 (86.345)	lr 0.00014
Train [115][1130/3239]	Time 0.337 (0.542)	Data Time 0.001 (0.034)	Loss 2.3334 (2.3472)	Entropy 0.53153 (0.53255)	Top-1 acc 68.359 (67.577)	Top-5 acc 85.547 (86.344)	lr 0.00014
Train [115][1140/3239]	Time 0.242 (0.541)	Data Time 0.001 (0.034)	Loss 2.2257 (2.3473)	Entropy 0.53177 (0.53254)	Top-1 acc 70.703 (67.579)	Top-5 acc 89.453 (86.348)	lr 0.00014
Train [115][1150/3239]	Time 0.240 (0.540)	Data Time 0.001 (0.033)	Loss 2.3260 (2.3480)	Entropy 0.53149 (0.53254)	Top-1 acc 66.016 (67.568)	Top-5 acc 87.891 (86.331)	lr 0.00014
Train [115][1160/3239]	Time 0.245 (0.539)	Data Time 0.001 (0.033)	Loss 2.5162 (2.3483)	Entropy 0.53169 (0.53253)	Top-1 acc 62.891 (67.560)	Top-5 acc 83.984 (86.321)	lr 0.00014
Train [115][1170/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.033)	Loss 2.4084 (2.3482)	Entropy 0.53214 (0.53252)	Top-1 acc 64.844 (67.569)	Top-5 acc 85.938 (86.325)	lr 0.00014
Train [115][1180/3239]	Time 0.240 (0.537)	Data Time 0.001 (0.032)	Loss 2.3656 (2.3478)	Entropy 0.53221 (0.53252)	Top-1 acc 67.578 (67.575)	Top-5 acc 85.156 (86.330)	lr 0.00014
Train [115][1190/3239]	Time 0.232 (0.536)	Data Time 0.001 (0.032)	Loss 2.3028 (2.3475)	Entropy 0.53194 (0.53251)	Top-1 acc 64.062 (67.579)	Top-5 acc 87.109 (86.337)	lr 0.00014
Train [115][1200/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.032)	Loss 2.5145 (2.3475)	Entropy 0.53128 (0.53251)	Top-1 acc 60.938 (67.577)	Top-5 acc 82.812 (86.337)	lr 0.00014
Train [115][1210/3239]	Time 0.239 (0.534)	Data Time 0.001 (0.032)	Loss 2.2385 (2.3475)	Entropy 0.53140 (0.53250)	Top-1 acc 73.438 (67.580)	Top-5 acc 87.891 (86.333)	lr 0.00014
Train [115][1220/3239]	Time 0.262 (0.533)	Data Time 0.001 (0.031)	Loss 2.5115 (2.3482)	Entropy 0.53121 (0.53249)	Top-1 acc 64.453 (67.561)	Top-5 acc 81.641 (86.317)	lr 0.00014
Train [115][1230/3239]	Time 0.237 (0.532)	Data Time 0.001 (0.031)	Loss 2.4283 (2.3482)	Entropy 0.53136 (0.53248)	Top-1 acc 67.969 (67.560)	Top-5 acc 85.938 (86.318)	lr 0.00014
Train [115][1240/3239]	Time 0.247 (0.531)	Data Time 0.001 (0.031)	Loss 2.4998 (2.3491)	Entropy 0.53136 (0.53247)	Top-1 acc 60.156 (67.528)	Top-5 acc 83.203 (86.298)	lr 0.00013
Train [115][1250/3239]	Time 0.270 (0.531)	Data Time 0.001 (0.031)	Loss 2.3574 (2.3493)	Entropy 0.53146 (0.53246)	Top-1 acc 68.359 (67.522)	Top-5 acc 85.938 (86.294)	lr 0.00013
Train [115][1260/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.030)	Loss 2.2205 (2.3492)	Entropy 0.53141 (0.53245)	Top-1 acc 66.797 (67.522)	Top-5 acc 87.891 (86.295)	lr 0.00013
Train [115][1270/3239]	Time 0.237 (0.529)	Data Time 0.001 (0.030)	Loss 2.1270 (2.3488)	Entropy 0.53112 (0.53244)	Top-1 acc 72.266 (67.532)	Top-5 acc 88.672 (86.301)	lr 0.00013
Train [115][1280/3239]	Time 0.258 (0.528)	Data Time 0.001 (0.030)	Loss 2.5142 (2.3489)	Entropy 0.53148 (0.53243)	Top-1 acc 64.062 (67.529)	Top-5 acc 83.984 (86.302)	lr 0.00013
Train [115][1290/3239]	Time 0.329 (0.527)	Data Time 0.001 (0.030)	Loss 2.6892 (2.3495)	Entropy 0.53170 (0.53243)	Top-1 acc 58.594 (67.514)	Top-5 acc 80.859 (86.295)	lr 0.00013
Train [115][1300/3239]	Time 0.245 (0.526)	Data Time 0.002 (0.030)	Loss 2.2149 (2.3491)	Entropy 0.53194 (0.53242)	Top-1 acc 69.922 (67.526)	Top-5 acc 87.891 (86.303)	lr 0.00013
Train [115][1310/3239]	Time 0.235 (0.525)	Data Time 0.001 (0.029)	Loss 2.3124 (2.3491)	Entropy 0.53151 (0.53242)	Top-1 acc 67.969 (67.523)	Top-5 acc 87.109 (86.301)	lr 0.00013
Train [115][1320/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.029)	Loss 2.2529 (2.3490)	Entropy 0.53152 (0.53241)	Top-1 acc 68.750 (67.525)	Top-5 acc 89.453 (86.308)	lr 0.00013
Train [115][1330/3239]	Time 0.236 (0.524)	Data Time 0.001 (0.029)	Loss 2.3494 (2.3499)	Entropy 0.53143 (0.53240)	Top-1 acc 68.750 (67.498)	Top-5 acc 84.766 (86.291)	lr 0.00013
Train [115][1340/3239]	Time 0.356 (0.561)	Data Time 0.004 (0.029)	Loss 2.2034 (2.3497)	Entropy 0.53167 (0.53240)	Top-1 acc 68.750 (67.502)	Top-5 acc 88.281 (86.293)	lr 0.00013
Train [115][1350/3239]	Time 0.292 (0.561)	Data Time 0.003 (0.029)	Loss 2.3651 (2.3497)	Entropy 0.53159 (0.53239)	Top-1 acc 65.234 (67.507)	Top-5 acc 86.328 (86.291)	lr 0.00013
Train [115][1360/3239]	Time 0.245 (0.560)	Data Time 0.002 (0.028)	Loss 2.4347 (2.3492)	Entropy 0.53162 (0.53239)	Top-1 acc 64.062 (67.522)	Top-5 acc 83.203 (86.298)	lr 0.00013
Train [115][1370/3239]	Time 0.238 (0.559)	Data Time 0.001 (0.028)	Loss 2.1294 (2.3492)	Entropy 0.53159 (0.53238)	Top-1 acc 75.000 (67.524)	Top-5 acc 90.625 (86.295)	lr 0.00013
Train [115][1380/3239]	Time 0.317 (0.558)	Data Time 0.002 (0.028)	Loss 2.4570 (2.3494)	Entropy 0.53131 (0.53237)	Top-1 acc 64.844 (67.517)	Top-5 acc 89.062 (86.293)	lr 0.00013
Train [115][1390/3239]	Time 0.243 (0.557)	Data Time 0.001 (0.028)	Loss 2.3136 (2.3491)	Entropy 0.53171 (0.53237)	Top-1 acc 67.578 (67.525)	Top-5 acc 85.938 (86.300)	lr 0.00013
Train [115][1400/3239]	Time 0.269 (0.556)	Data Time 0.001 (0.028)	Loss 2.1390 (2.3489)	Entropy 0.53169 (0.53236)	Top-1 acc 71.484 (67.530)	Top-5 acc 88.672 (86.301)	lr 0.00013
Train [115][1410/3239]	Time 0.239 (0.555)	Data Time 0.001 (0.027)	Loss 2.3669 (2.3490)	Entropy 0.53149 (0.53236)	Top-1 acc 68.359 (67.531)	Top-5 acc 85.938 (86.297)	lr 0.00013
Train [115][1420/3239]	Time 0.240 (0.555)	Data Time 0.001 (0.027)	Loss 2.2932 (2.3486)	Entropy 0.53174 (0.53235)	Top-1 acc 66.797 (67.536)	Top-5 acc 87.891 (86.306)	lr 0.00013
Train [115][1430/3239]	Time 0.261 (0.554)	Data Time 0.002 (0.027)	Loss 2.3394 (2.3481)	Entropy 0.53135 (0.53235)	Top-1 acc 66.797 (67.547)	Top-5 acc 84.375 (86.316)	lr 0.00013
Train [115][1440/3239]	Time 0.255 (0.553)	Data Time 0.001 (0.027)	Loss 2.1234 (2.3475)	Entropy 0.53123 (0.53234)	Top-1 acc 73.438 (67.559)	Top-5 acc 90.234 (86.328)	lr 0.00013
Train [115][1450/3239]	Time 0.428 (0.552)	Data Time 0.001 (0.027)	Loss 2.2925 (2.3469)	Entropy 0.53114 (0.53233)	Top-1 acc 68.359 (67.575)	Top-5 acc 87.500 (86.339)	lr 0.00013
Train [115][1460/3239]	Time 0.289 (0.552)	Data Time 0.002 (0.027)	Loss 2.5010 (2.3466)	Entropy 0.53120 (0.53232)	Top-1 acc 63.672 (67.580)	Top-5 acc 81.250 (86.345)	lr 0.00013
Train [115][1470/3239]	Time 0.245 (0.551)	Data Time 0.001 (0.026)	Loss 2.5425 (2.3469)	Entropy 0.53119 (0.53232)	Top-1 acc 64.062 (67.578)	Top-5 acc 82.031 (86.340)	lr 0.00013
Train [115][1480/3239]	Time 0.236 (0.550)	Data Time 0.001 (0.026)	Loss 2.5291 (2.3477)	Entropy 0.53113 (0.53231)	Top-1 acc 64.453 (67.556)	Top-5 acc 83.203 (86.327)	lr 0.00013
Train [115][1490/3239]	Time 0.240 (0.549)	Data Time 0.001 (0.026)	Loss 2.5484 (2.3472)	Entropy 0.53112 (0.53230)	Top-1 acc 59.375 (67.569)	Top-5 acc 84.766 (86.339)	lr 0.00013
Train [115][1500/3239]	Time 0.223 (0.549)	Data Time 0.001 (0.026)	Loss 2.4854 (2.3471)	Entropy 0.53141 (0.53229)	Top-1 acc 65.234 (67.570)	Top-5 acc 84.375 (86.339)	lr 0.00013
Train [115][1510/3239]	Time 0.255 (0.548)	Data Time 0.001 (0.026)	Loss 2.3618 (2.3472)	Entropy 0.53135 (0.53229)	Top-1 acc 66.797 (67.568)	Top-5 acc 88.672 (86.339)	lr 0.00013
Train [115][1520/3239]	Time 0.342 (0.547)	Data Time 0.001 (0.026)	Loss 2.2794 (2.3470)	Entropy 0.53111 (0.53228)	Top-1 acc 67.188 (67.576)	Top-5 acc 86.719 (86.338)	lr 0.00013
Train [115][1530/3239]	Time 0.234 (0.546)	Data Time 0.001 (0.025)	Loss 2.5917 (2.3473)	Entropy 0.53102 (0.53227)	Top-1 acc 59.375 (67.562)	Top-5 acc 82.422 (86.337)	lr 0.00013
Train [115][1540/3239]	Time 0.238 (0.545)	Data Time 0.001 (0.025)	Loss 2.2385 (2.3470)	Entropy 0.53064 (0.53226)	Top-1 acc 69.141 (67.571)	Top-5 acc 86.719 (86.340)	lr 0.00013
Train [115][1550/3239]	Time 0.241 (0.545)	Data Time 0.001 (0.025)	Loss 2.6602 (2.3471)	Entropy 0.53104 (0.53225)	Top-1 acc 59.766 (67.567)	Top-5 acc 80.469 (86.337)	lr 0.00013
Train [115][1560/3239]	Time 0.229 (0.544)	Data Time 0.001 (0.025)	Loss 2.5760 (2.3478)	Entropy 0.53108 (0.53224)	Top-1 acc 64.062 (67.553)	Top-5 acc 82.812 (86.324)	lr 0.00013
Train [115][1570/3239]	Time 0.273 (0.543)	Data Time 0.001 (0.025)	Loss 2.3849 (2.3478)	Entropy 0.53122 (0.53224)	Top-1 acc 66.797 (67.550)	Top-5 acc 87.109 (86.328)	lr 0.00013
Train [115][1580/3239]	Time 0.243 (0.542)	Data Time 0.001 (0.025)	Loss 2.3526 (2.3478)	Entropy 0.53146 (0.53223)	Top-1 acc 68.359 (67.548)	Top-5 acc 84.766 (86.329)	lr 0.00013
Train [115][1590/3239]	Time 0.237 (0.542)	Data Time 0.001 (0.025)	Loss 2.2376 (2.3471)	Entropy 0.53165 (0.53223)	Top-1 acc 69.141 (67.564)	Top-5 acc 86.328 (86.342)	lr 0.00013
Train [115][1600/3239]	Time 0.225 (0.541)	Data Time 0.001 (0.024)	Loss 2.2864 (2.3472)	Entropy 0.53135 (0.53222)	Top-1 acc 69.922 (67.560)	Top-5 acc 87.109 (86.338)	lr 0.00013
Train [115][1610/3239]	Time 0.442 (0.540)	Data Time 0.002 (0.024)	Loss 2.7648 (2.3479)	Entropy 0.53161 (0.53222)	Top-1 acc 58.984 (67.543)	Top-5 acc 82.812 (86.328)	lr 0.00013
Train [115][1620/3239]	Time 0.233 (0.540)	Data Time 0.002 (0.024)	Loss 2.2330 (2.3476)	Entropy 0.53153 (0.53221)	Top-1 acc 70.312 (67.550)	Top-5 acc 85.156 (86.333)	lr 0.00013
Train [115][1630/3239]	Time 0.240 (0.540)	Data Time 0.001 (0.024)	Loss 2.2672 (2.3480)	Entropy 0.53147 (0.53221)	Top-1 acc 72.656 (67.549)	Top-5 acc 87.500 (86.324)	lr 0.00013
Train [115][1640/3239]	Time 0.233 (0.539)	Data Time 0.001 (0.024)	Loss 2.4021 (2.3483)	Entropy 0.53160 (0.53221)	Top-1 acc 64.062 (67.546)	Top-5 acc 85.547 (86.321)	lr 0.00013
Train [115][1650/3239]	Time 0.234 (0.538)	Data Time 0.001 (0.024)	Loss 2.4030 (2.3485)	Entropy 0.53171 (0.53220)	Top-1 acc 67.969 (67.543)	Top-5 acc 82.812 (86.315)	lr 0.00013
Train [115][1660/3239]	Time 0.248 (0.538)	Data Time 0.002 (0.024)	Loss 2.4616 (2.3488)	Entropy 0.53181 (0.53220)	Top-1 acc 67.578 (67.541)	Top-5 acc 86.719 (86.311)	lr 0.00013
Train [115][1670/3239]	Time 0.230 (0.537)	Data Time 0.001 (0.023)	Loss 2.4273 (2.3486)	Entropy 0.53172 (0.53220)	Top-1 acc 66.406 (67.545)	Top-5 acc 84.766 (86.315)	lr 0.00013
Train [115][1680/3239]	Time 0.323 (0.536)	Data Time 0.001 (0.023)	Loss 2.3038 (2.3489)	Entropy 0.53185 (0.53220)	Top-1 acc 68.750 (67.537)	Top-5 acc 85.938 (86.310)	lr 0.00013
Train [115][1690/3239]	Time 0.234 (0.535)	Data Time 0.001 (0.023)	Loss 2.4766 (2.3487)	Entropy 0.53183 (0.53219)	Top-1 acc 63.672 (67.536)	Top-5 acc 83.594 (86.312)	lr 0.00013
Train [115][1700/3239]	Time 0.242 (0.535)	Data Time 0.002 (0.023)	Loss 2.2942 (2.3485)	Entropy 0.53173 (0.53219)	Top-1 acc 69.141 (67.541)	Top-5 acc 88.672 (86.316)	lr 0.00013
Train [115][1710/3239]	Time 0.276 (0.534)	Data Time 0.002 (0.023)	Loss 2.3659 (2.3485)	Entropy 0.53207 (0.53219)	Top-1 acc 64.453 (67.540)	Top-5 acc 88.281 (86.322)	lr 0.00013
Train [115][1720/3239]	Time 0.224 (0.533)	Data Time 0.001 (0.023)	Loss 2.3649 (2.3487)	Entropy 0.53182 (0.53219)	Top-1 acc 67.578 (67.539)	Top-5 acc 86.719 (86.318)	lr 0.00013
Train [115][1730/3239]	Time 0.223 (0.533)	Data Time 0.001 (0.023)	Loss 2.4998 (2.3484)	Entropy 0.53177 (0.53219)	Top-1 acc 64.453 (67.548)	Top-5 acc 83.203 (86.324)	lr 0.00013
Train [115][1740/3239]	Time 0.230 (0.532)	Data Time 0.001 (0.023)	Loss 2.2382 (2.3482)	Entropy 0.53177 (0.53218)	Top-1 acc 67.188 (67.551)	Top-5 acc 87.500 (86.324)	lr 0.00013
Train [115][1750/3239]	Time 0.239 (0.531)	Data Time 0.001 (0.022)	Loss 2.2159 (2.3477)	Entropy 0.53167 (0.53218)	Top-1 acc 69.141 (67.570)	Top-5 acc 89.844 (86.331)	lr 0.00013
Train [115][1760/3239]	Time 0.235 (0.531)	Data Time 0.001 (0.022)	Loss 2.2157 (2.3472)	Entropy 0.53183 (0.53218)	Top-1 acc 71.875 (67.584)	Top-5 acc 88.672 (86.337)	lr 0.00013
Train [115][1770/3239]	Time 0.292 (0.530)	Data Time 0.002 (0.022)	Loss 2.4121 (2.3468)	Entropy 0.53222 (0.53218)	Top-1 acc 63.281 (67.591)	Top-5 acc 84.766 (86.345)	lr 0.00013
Train [115][1780/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.022)	Loss 2.1550 (2.3468)	Entropy 0.53237 (0.53218)	Top-1 acc 73.047 (67.592)	Top-5 acc 89.453 (86.343)	lr 0.00013
Train [115][1790/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.022)	Loss 2.4275 (2.3466)	Entropy 0.53209 (0.53218)	Top-1 acc 64.453 (67.600)	Top-5 acc 83.203 (86.345)	lr 0.00013
Train [115][1800/3239]	Time 0.228 (0.528)	Data Time 0.001 (0.022)	Loss 2.0995 (2.3463)	Entropy 0.53200 (0.53218)	Top-1 acc 71.094 (67.608)	Top-5 acc 91.016 (86.354)	lr 0.00013
Train [115][1810/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.022)	Loss 2.2491 (2.3463)	Entropy 0.53212 (0.53218)	Top-1 acc 69.922 (67.611)	Top-5 acc 87.109 (86.352)	lr 0.00013
Train [115][1820/3239]	Time 0.284 (0.527)	Data Time 0.031 (0.022)	Loss 2.3403 (2.3466)	Entropy 0.53216 (0.53218)	Top-1 acc 66.406 (67.604)	Top-5 acc 85.156 (86.350)	lr 0.00013
Train [115][1830/3239]	Time 0.261 (0.526)	Data Time 0.002 (0.022)	Loss 2.1739 (2.3464)	Entropy 0.53190 (0.53217)	Top-1 acc 75.781 (67.611)	Top-5 acc 86.719 (86.347)	lr 0.00013
Train [115][1840/3239]	Time 0.358 (0.526)	Data Time 0.001 (0.021)	Loss 2.2823 (2.3463)	Entropy 0.53195 (0.53217)	Top-1 acc 67.578 (67.612)	Top-5 acc 88.672 (86.354)	lr 0.00013
Train [115][1850/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.021)	Loss 2.2973 (2.3462)	Entropy 0.53239 (0.53217)	Top-1 acc 71.875 (67.606)	Top-5 acc 85.547 (86.355)	lr 0.00013
Train [115][1860/3239]	Time 0.238 (0.525)	Data Time 0.001 (0.021)	Loss 2.3917 (2.3463)	Entropy 0.53260 (0.53217)	Top-1 acc 67.578 (67.605)	Top-5 acc 82.422 (86.351)	lr 0.00013
Train [115][1870/3239]	Time 0.236 (0.524)	Data Time 0.002 (0.021)	Loss 2.6312 (2.3463)	Entropy 0.53272 (0.53218)	Top-1 acc 58.594 (67.609)	Top-5 acc 81.250 (86.350)	lr 0.00013
Train [115][1880/3239]	Time 0.235 (0.524)	Data Time 0.001 (0.021)	Loss 2.5458 (2.3459)	Entropy 0.53267 (0.53218)	Top-1 acc 60.938 (67.617)	Top-5 acc 82.422 (86.354)	lr 0.00013
Train [115][1890/3239]	Time 0.288 (0.523)	Data Time 0.001 (0.021)	Loss 2.4024 (2.3461)	Entropy 0.53196 (0.53218)	Top-1 acc 65.234 (67.615)	Top-5 acc 84.375 (86.349)	lr 0.00013
Train [115][1900/3239]	Time 0.236 (0.523)	Data Time 0.001 (0.021)	Loss 2.3911 (2.3460)	Entropy 0.53205 (0.53218)	Top-1 acc 70.703 (67.619)	Top-5 acc 85.938 (86.351)	lr 0.00013
Train [115][1910/3239]	Time 0.387 (0.522)	Data Time 0.001 (0.021)	Loss 2.2818 (2.3457)	Entropy 0.53185 (0.53218)	Top-1 acc 69.531 (67.624)	Top-5 acc 87.500 (86.357)	lr 0.00013
Train [115][1920/3239]	Time 0.228 (0.522)	Data Time 0.001 (0.021)	Loss 2.2517 (2.3457)	Entropy 0.53168 (0.53218)	Top-1 acc 70.312 (67.628)	Top-5 acc 87.109 (86.359)	lr 0.00013
Train [115][1930/3239]	Time 0.236 (0.521)	Data Time 0.001 (0.021)	Loss 2.3613 (2.3458)	Entropy 0.53152 (0.53217)	Top-1 acc 67.188 (67.624)	Top-5 acc 85.547 (86.358)	lr 0.00012
Train [115][1940/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.020)	Loss 2.4466 (2.3455)	Entropy 0.53146 (0.53217)	Top-1 acc 66.016 (67.631)	Top-5 acc 83.594 (86.364)	lr 0.00012
Train [115][1950/3239]	Time 0.238 (0.520)	Data Time 0.001 (0.020)	Loss 2.4479 (2.3455)	Entropy 0.53139 (0.53217)	Top-1 acc 66.797 (67.629)	Top-5 acc 82.422 (86.365)	lr 0.00012
Train [115][1960/3239]	Time 0.289 (0.520)	Data Time 0.001 (0.020)	Loss 2.1828 (2.3451)	Entropy 0.53105 (0.53216)	Top-1 acc 76.172 (67.639)	Top-5 acc 87.500 (86.370)	lr 0.00012
Train [115][1970/3239]	Time 0.264 (0.519)	Data Time 0.001 (0.020)	Loss 2.1789 (2.3449)	Entropy 0.53115 (0.53216)	Top-1 acc 72.266 (67.641)	Top-5 acc 89.453 (86.368)	lr 0.00012
Train [115][1980/3239]	Time 0.286 (0.519)	Data Time 0.001 (0.020)	Loss 2.3845 (2.3452)	Entropy 0.53106 (0.53215)	Top-1 acc 64.062 (67.635)	Top-5 acc 87.500 (86.366)	lr 0.00012
Train [115][1990/3239]	Time 0.261 (0.518)	Data Time 0.001 (0.020)	Loss 2.0685 (2.3449)	Entropy 0.53137 (0.53215)	Top-1 acc 76.562 (67.642)	Top-5 acc 92.188 (86.371)	lr 0.00012
Train [115][2000/3239]	Time 0.518 (0.543)	Data Time 0.005 (0.020)	Loss 2.3655 (2.3452)	Entropy 0.53081 (0.53214)	Top-1 acc 67.188 (67.639)	Top-5 acc 84.766 (86.366)	lr 0.00012
Train [115][2010/3239]	Time 0.243 (0.542)	Data Time 0.002 (0.020)	Loss 2.3825 (2.3453)	Entropy 0.53069 (0.53213)	Top-1 acc 67.969 (67.639)	Top-5 acc 85.156 (86.364)	lr 0.00012
Train [115][2020/3239]	Time 0.251 (0.542)	Data Time 0.002 (0.020)	Loss 2.1231 (2.3456)	Entropy 0.53069 (0.53213)	Top-1 acc 72.266 (67.630)	Top-5 acc 88.672 (86.362)	lr 0.00012
Train [115][2030/3239]	Time 0.289 (0.542)	Data Time 0.002 (0.020)	Loss 2.2551 (2.3452)	Entropy 0.53069 (0.53212)	Top-1 acc 69.922 (67.638)	Top-5 acc 87.500 (86.369)	lr 0.00012
Train [115][2040/3239]	Time 0.266 (0.541)	Data Time 0.002 (0.020)	Loss 2.1913 (2.3454)	Entropy 0.53098 (0.53211)	Top-1 acc 69.531 (67.635)	Top-5 acc 88.281 (86.368)	lr 0.00012
Train [115][2050/3239]	Time 0.343 (0.541)	Data Time 0.002 (0.019)	Loss 2.2364 (2.3452)	Entropy 0.53100 (0.53211)	Top-1 acc 69.531 (67.637)	Top-5 acc 87.891 (86.369)	lr 0.00012
Train [115][2060/3239]	Time 0.247 (0.540)	Data Time 0.001 (0.019)	Loss 2.5372 (2.3457)	Entropy 0.53108 (0.53210)	Top-1 acc 65.625 (67.629)	Top-5 acc 80.859 (86.362)	lr 0.00012
Train [115][2070/3239]	Time 0.334 (0.540)	Data Time 0.001 (0.019)	Loss 2.2178 (2.3456)	Entropy 0.53127 (0.53210)	Top-1 acc 69.531 (67.636)	Top-5 acc 88.672 (86.362)	lr 0.00012
Train [115][2080/3239]	Time 0.230 (0.539)	Data Time 0.001 (0.019)	Loss 2.4301 (2.3455)	Entropy 0.53149 (0.53209)	Top-1 acc 66.016 (67.635)	Top-5 acc 87.109 (86.365)	lr 0.00012
Train [115][2090/3239]	Time 0.240 (0.539)	Data Time 0.001 (0.019)	Loss 2.3240 (2.3455)	Entropy 0.53150 (0.53209)	Top-1 acc 68.359 (67.641)	Top-5 acc 86.719 (86.366)	lr 0.00012
Train [115][2100/3239]	Time 0.230 (0.538)	Data Time 0.001 (0.019)	Loss 2.3132 (2.3458)	Entropy 0.53181 (0.53209)	Top-1 acc 67.969 (67.633)	Top-5 acc 86.719 (86.359)	lr 0.00012
Train [115][2110/3239]	Time 0.256 (0.538)	Data Time 0.002 (0.019)	Loss 2.2004 (2.3458)	Entropy 0.53141 (0.53209)	Top-1 acc 72.656 (67.634)	Top-5 acc 89.844 (86.363)	lr 0.00012
Train [115][2120/3239]	Time 0.244 (0.537)	Data Time 0.001 (0.019)	Loss 2.1749 (2.3460)	Entropy 0.53111 (0.53208)	Top-1 acc 71.875 (67.629)	Top-5 acc 87.891 (86.359)	lr 0.00012
Train [115][2130/3239]	Time 0.259 (0.537)	Data Time 0.001 (0.019)	Loss 2.3766 (2.3460)	Entropy 0.53081 (0.53208)	Top-1 acc 67.188 (67.631)	Top-5 acc 84.375 (86.358)	lr 0.00012
Train [115][2140/3239]	Time 0.268 (0.536)	Data Time 0.001 (0.019)	Loss 2.4987 (2.3461)	Entropy 0.53098 (0.53207)	Top-1 acc 60.547 (67.623)	Top-5 acc 84.766 (86.354)	lr 0.00012
Train [115][2150/3239]	Time 0.240 (0.536)	Data Time 0.001 (0.019)	Loss 2.1492 (2.3462)	Entropy 0.53096 (0.53207)	Top-1 acc 71.094 (67.624)	Top-5 acc 91.016 (86.351)	lr 0.00012
Train [115][2160/3239]	Time 0.393 (0.535)	Data Time 0.001 (0.019)	Loss 2.2391 (2.3463)	Entropy 0.53163 (0.53206)	Top-1 acc 71.875 (67.623)	Top-5 acc 86.719 (86.347)	lr 0.00012
Train [115][2170/3239]	Time 0.242 (0.535)	Data Time 0.001 (0.019)	Loss 2.2336 (2.3461)	Entropy 0.53187 (0.53206)	Top-1 acc 69.531 (67.631)	Top-5 acc 89.453 (86.352)	lr 0.00012
Train [115][2180/3239]	Time 0.237 (0.534)	Data Time 0.001 (0.018)	Loss 2.1290 (2.3460)	Entropy 0.53210 (0.53206)	Top-1 acc 73.047 (67.638)	Top-5 acc 90.625 (86.353)	lr 0.00012
Train [115][2190/3239]	Time 0.248 (0.534)	Data Time 0.001 (0.018)	Loss 2.2017 (2.3459)	Entropy 0.53216 (0.53206)	Top-1 acc 72.656 (67.644)	Top-5 acc 89.062 (86.354)	lr 0.00012
Train [115][2200/3239]	Time 0.280 (0.533)	Data Time 0.002 (0.018)	Loss 2.2419 (2.3457)	Entropy 0.53209 (0.53206)	Top-1 acc 69.922 (67.652)	Top-5 acc 89.453 (86.355)	lr 0.00012
Train [115][2210/3239]	Time 0.258 (0.533)	Data Time 0.001 (0.018)	Loss 2.2766 (2.3459)	Entropy 0.53225 (0.53206)	Top-1 acc 66.797 (67.648)	Top-5 acc 88.672 (86.350)	lr 0.00012
Train [115][2220/3239]	Time 0.229 (0.532)	Data Time 0.001 (0.018)	Loss 2.2960 (2.3460)	Entropy 0.53228 (0.53206)	Top-1 acc 68.750 (67.644)	Top-5 acc 86.719 (86.348)	lr 0.00012
Train [115][2230/3239]	Time 0.399 (0.532)	Data Time 0.002 (0.018)	Loss 2.4319 (2.3459)	Entropy 0.53205 (0.53206)	Top-1 acc 63.672 (67.645)	Top-5 acc 85.547 (86.349)	lr 0.00012
Train [115][2240/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.018)	Loss 2.2390 (2.3457)	Entropy 0.53206 (0.53206)	Top-1 acc 71.875 (67.646)	Top-5 acc 88.281 (86.352)	lr 0.00012
Train [115][2250/3239]	Time 0.250 (0.531)	Data Time 0.001 (0.018)	Loss 2.4607 (2.3457)	Entropy 0.53152 (0.53206)	Top-1 acc 64.453 (67.646)	Top-5 acc 84.375 (86.356)	lr 0.00012
Train [115][2260/3239]	Time 0.256 (0.531)	Data Time 0.002 (0.018)	Loss 2.4283 (2.3458)	Entropy 0.53176 (0.53206)	Top-1 acc 65.234 (67.637)	Top-5 acc 86.328 (86.354)	lr 0.00012
Train [115][2270/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.018)	Loss 2.2959 (2.3458)	Entropy 0.53200 (0.53206)	Top-1 acc 69.922 (67.637)	Top-5 acc 87.500 (86.357)	lr 0.00012
Train [115][2280/3239]	Time 0.225 (0.530)	Data Time 0.001 (0.018)	Loss 2.7163 (2.3459)	Entropy 0.53207 (0.53206)	Top-1 acc 55.859 (67.632)	Top-5 acc 81.641 (86.352)	lr 0.00012
Train [115][2290/3239]	Time 0.224 (0.529)	Data Time 0.001 (0.018)	Loss 2.5632 (2.3458)	Entropy 0.53216 (0.53206)	Top-1 acc 63.672 (67.638)	Top-5 acc 81.250 (86.348)	lr 0.00012
Train [115][2300/3239]	Time 0.260 (0.529)	Data Time 0.001 (0.018)	Loss 2.4008 (2.3459)	Entropy 0.53182 (0.53206)	Top-1 acc 65.625 (67.640)	Top-5 acc 85.938 (86.349)	lr 0.00012
Train [115][2310/3239]	Time 0.241 (0.528)	Data Time 0.001 (0.018)	Loss 2.1609 (2.3457)	Entropy 0.53220 (0.53206)	Top-1 acc 69.141 (67.644)	Top-5 acc 89.844 (86.353)	lr 0.00012
Train [115][2320/3239]	Time 0.335 (0.528)	Data Time 0.001 (0.017)	Loss 2.2564 (2.3455)	Entropy 0.53193 (0.53206)	Top-1 acc 69.531 (67.649)	Top-5 acc 86.328 (86.357)	lr 0.00012
Train [115][2330/3239]	Time 0.228 (0.527)	Data Time 0.001 (0.017)	Loss 2.3904 (2.3457)	Entropy 0.53184 (0.53206)	Top-1 acc 65.625 (67.641)	Top-5 acc 88.281 (86.352)	lr 0.00012
Train [115][2340/3239]	Time 0.240 (0.527)	Data Time 0.001 (0.017)	Loss 2.2259 (2.3456)	Entropy 0.53178 (0.53206)	Top-1 acc 69.922 (67.650)	Top-5 acc 88.672 (86.354)	lr 0.00012
Train [115][2350/3239]	Time 0.244 (0.526)	Data Time 0.001 (0.017)	Loss 2.2368 (2.3455)	Entropy 0.53196 (0.53206)	Top-1 acc 69.531 (67.651)	Top-5 acc 89.453 (86.353)	lr 0.00012
Train [115][2360/3239]	Time 0.230 (0.526)	Data Time 0.001 (0.017)	Loss 2.2887 (2.3454)	Entropy 0.53205 (0.53206)	Top-1 acc 66.406 (67.651)	Top-5 acc 87.500 (86.357)	lr 0.00012
Train [115][2370/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.017)	Loss 2.6099 (2.3455)	Entropy 0.53210 (0.53206)	Top-1 acc 62.891 (67.646)	Top-5 acc 81.250 (86.355)	lr 0.00012
Train [115][2380/3239]	Time 0.243 (0.525)	Data Time 0.002 (0.017)	Loss 2.2875 (2.3453)	Entropy 0.53231 (0.53206)	Top-1 acc 67.188 (67.655)	Top-5 acc 86.719 (86.355)	lr 0.00012
Train [115][2390/3239]	Time 0.350 (0.525)	Data Time 0.001 (0.017)	Loss 2.2344 (2.3454)	Entropy 0.53241 (0.53206)	Top-1 acc 67.969 (67.650)	Top-5 acc 91.797 (86.355)	lr 0.00012
Train [115][2400/3239]	Time 0.241 (0.524)	Data Time 0.001 (0.017)	Loss 2.2983 (2.3451)	Entropy 0.53232 (0.53206)	Top-1 acc 69.922 (67.657)	Top-5 acc 87.500 (86.358)	lr 0.00012
Train [115][2410/3239]	Time 0.240 (0.524)	Data Time 0.001 (0.017)	Loss 2.3186 (2.3451)	Entropy 0.53256 (0.53206)	Top-1 acc 68.359 (67.657)	Top-5 acc 84.375 (86.357)	lr 0.00012
Train [115][2420/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.017)	Loss 2.2898 (2.3452)	Entropy 0.53265 (0.53207)	Top-1 acc 70.312 (67.653)	Top-5 acc 86.328 (86.354)	lr 0.00012
Train [115][2430/3239]	Time 0.262 (0.523)	Data Time 0.001 (0.017)	Loss 2.4466 (2.3451)	Entropy 0.53273 (0.53207)	Top-1 acc 64.062 (67.658)	Top-5 acc 85.156 (86.359)	lr 0.00012
Train [115][2440/3239]	Time 0.243 (0.523)	Data Time 0.001 (0.017)	Loss 2.2878 (2.3450)	Entropy 0.53258 (0.53207)	Top-1 acc 68.359 (67.658)	Top-5 acc 87.500 (86.359)	lr 0.00012
Train [115][2450/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.017)	Loss 2.2571 (2.3451)	Entropy 0.53273 (0.53207)	Top-1 acc 67.188 (67.661)	Top-5 acc 87.891 (86.356)	lr 0.00012
Train [115][2460/3239]	Time 0.255 (0.522)	Data Time 0.001 (0.017)	Loss 2.3274 (2.3451)	Entropy 0.53300 (0.53208)	Top-1 acc 67.578 (67.661)	Top-5 acc 85.547 (86.356)	lr 0.00012
Train [115][2470/3239]	Time 0.235 (0.522)	Data Time 0.001 (0.016)	Loss 2.2232 (2.3452)	Entropy 0.53285 (0.53208)	Top-1 acc 69.531 (67.658)	Top-5 acc 89.453 (86.353)	lr 0.00012
Train [115][2480/3239]	Time 0.241 (0.521)	Data Time 0.001 (0.016)	Loss 2.1188 (2.3452)	Entropy 0.53316 (0.53208)	Top-1 acc 73.438 (67.657)	Top-5 acc 85.938 (86.351)	lr 0.00012
Train [115][2490/3239]	Time 0.273 (0.521)	Data Time 0.001 (0.016)	Loss 2.2189 (2.3452)	Entropy 0.53302 (0.53209)	Top-1 acc 69.922 (67.659)	Top-5 acc 87.109 (86.352)	lr 0.00012
Train [115][2500/3239]	Time 0.227 (0.520)	Data Time 0.001 (0.016)	Loss 2.4776 (2.3455)	Entropy 0.53312 (0.53209)	Top-1 acc 62.891 (67.648)	Top-5 acc 84.375 (86.347)	lr 0.00012
Train [115][2510/3239]	Time 0.229 (0.520)	Data Time 0.001 (0.016)	Loss 2.4558 (2.3454)	Entropy 0.53310 (0.53209)	Top-1 acc 65.234 (67.653)	Top-5 acc 83.203 (86.345)	lr 0.00012
Train [115][2520/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.016)	Loss 2.2514 (2.3456)	Entropy 0.53336 (0.53210)	Top-1 acc 68.750 (67.653)	Top-5 acc 89.453 (86.343)	lr 0.00012
Train [115][2530/3239]	Time 0.276 (0.519)	Data Time 0.001 (0.016)	Loss 2.1995 (2.3456)	Entropy 0.53324 (0.53210)	Top-1 acc 71.875 (67.656)	Top-5 acc 88.672 (86.342)	lr 0.00012
Train [115][2540/3239]	Time 0.232 (0.519)	Data Time 0.001 (0.016)	Loss 2.1671 (2.3456)	Entropy 0.53346 (0.53211)	Top-1 acc 71.094 (67.653)	Top-5 acc 88.281 (86.338)	lr 0.00012
Train [115][2550/3239]	Time 0.326 (0.518)	Data Time 0.001 (0.016)	Loss 2.2001 (2.3455)	Entropy 0.53341 (0.53211)	Top-1 acc 69.922 (67.658)	Top-5 acc 86.719 (86.341)	lr 0.00012
Train [115][2560/3239]	Time 0.236 (0.518)	Data Time 0.001 (0.016)	Loss 2.2213 (2.3454)	Entropy 0.53355 (0.53212)	Top-1 acc 69.141 (67.660)	Top-5 acc 89.062 (86.340)	lr 0.00012
Train [115][2570/3239]	Time 0.232 (0.517)	Data Time 0.001 (0.016)	Loss 2.4218 (2.3452)	Entropy 0.53306 (0.53212)	Top-1 acc 64.844 (67.661)	Top-5 acc 83.594 (86.341)	lr 0.00012
Train [115][2580/3239]	Time 0.226 (0.517)	Data Time 0.002 (0.016)	Loss 2.2819 (2.3449)	Entropy 0.53298 (0.53213)	Top-1 acc 69.141 (67.664)	Top-5 acc 88.281 (86.345)	lr 0.00012
Train [115][2590/3239]	Time 0.239 (0.517)	Data Time 0.001 (0.016)	Loss 2.2044 (2.3449)	Entropy 0.53289 (0.53213)	Top-1 acc 71.875 (67.667)	Top-5 acc 88.672 (86.344)	lr 0.00012
Train [115][2600/3239]	Time 0.236 (0.516)	Data Time 0.001 (0.016)	Loss 2.4587 (2.3448)	Entropy 0.53289 (0.53213)	Top-1 acc 64.453 (67.666)	Top-5 acc 84.375 (86.343)	lr 0.00012
Train [115][2610/3239]	Time 0.299 (0.516)	Data Time 0.001 (0.016)	Loss 2.4915 (2.3451)	Entropy 0.53300 (0.53214)	Top-1 acc 64.453 (67.657)	Top-5 acc 82.812 (86.336)	lr 0.00012
Train [115][2620/3239]	Time 0.357 (0.515)	Data Time 0.001 (0.016)	Loss 2.5115 (2.3451)	Entropy 0.53296 (0.53214)	Top-1 acc 65.234 (67.661)	Top-5 acc 84.375 (86.338)	lr 0.00012
Train [115][2630/3239]	Time 0.223 (0.515)	Data Time 0.001 (0.016)	Loss 2.5310 (2.3450)	Entropy 0.53301 (0.53214)	Top-1 acc 62.891 (67.665)	Top-5 acc 83.984 (86.337)	lr 0.00012
Train [115][2640/3239]	Time 0.233 (0.515)	Data Time 0.001 (0.016)	Loss 2.2427 (2.3451)	Entropy 0.53314 (0.53215)	Top-1 acc 73.047 (67.663)	Top-5 acc 89.453 (86.335)	lr 0.00011
Train [115][2650/3239]	Time 0.307 (0.533)	Data Time 0.005 (0.015)	Loss 2.3690 (2.3453)	Entropy 0.53308 (0.53215)	Top-1 acc 66.406 (67.657)	Top-5 acc 85.547 (86.333)	lr 0.00011
Train [115][2660/3239]	Time 0.250 (0.533)	Data Time 0.002 (0.015)	Loss 2.2745 (2.3452)	Entropy 0.53322 (0.53215)	Top-1 acc 68.359 (67.662)	Top-5 acc 87.109 (86.335)	lr 0.00011
Train [115][2670/3239]	Time 0.245 (0.533)	Data Time 0.001 (0.015)	Loss 2.4074 (2.3453)	Entropy 0.53356 (0.53216)	Top-1 acc 65.234 (67.656)	Top-5 acc 84.375 (86.335)	lr 0.00011
Train [115][2680/3239]	Time 0.235 (0.532)	Data Time 0.001 (0.015)	Loss 2.2387 (2.3451)	Entropy 0.53310 (0.53216)	Top-1 acc 67.188 (67.662)	Top-5 acc 86.328 (86.337)	lr 0.00011
Train [115][2690/3239]	Time 0.268 (0.532)	Data Time 0.029 (0.015)	Loss 2.2668 (2.3451)	Entropy 0.53300 (0.53217)	Top-1 acc 67.578 (67.662)	Top-5 acc 86.719 (86.338)	lr 0.00011
Train [115][2700/3239]	Time 0.275 (0.532)	Data Time 0.002 (0.015)	Loss 2.2402 (2.3452)	Entropy 0.53327 (0.53217)	Top-1 acc 69.922 (67.662)	Top-5 acc 87.891 (86.337)	lr 0.00011
Train [115][2710/3239]	Time 0.354 (0.531)	Data Time 0.001 (0.015)	Loss 2.4097 (2.3452)	Entropy 0.53312 (0.53217)	Top-1 acc 66.016 (67.664)	Top-5 acc 85.938 (86.339)	lr 0.00011
Train [115][2720/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.015)	Loss 2.7057 (2.3455)	Entropy 0.53237 (0.53218)	Top-1 acc 55.469 (67.659)	Top-5 acc 78.125 (86.330)	lr 0.00011
Train [115][2730/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.015)	Loss 2.1933 (2.3456)	Entropy 0.53229 (0.53218)	Top-1 acc 67.969 (67.658)	Top-5 acc 88.672 (86.327)	lr 0.00011
Train [115][2740/3239]	Time 0.261 (0.530)	Data Time 0.002 (0.015)	Loss 2.2452 (2.3453)	Entropy 0.53250 (0.53218)	Top-1 acc 71.484 (67.665)	Top-5 acc 87.109 (86.330)	lr 0.00011
Train [115][2750/3239]	Time 0.225 (0.530)	Data Time 0.001 (0.015)	Loss 2.5397 (2.3452)	Entropy 0.53251 (0.53218)	Top-1 acc 62.891 (67.666)	Top-5 acc 81.250 (86.329)	lr 0.00011
Train [115][2760/3239]	Time 0.234 (0.529)	Data Time 0.001 (0.015)	Loss 2.3965 (2.3452)	Entropy 0.53241 (0.53218)	Top-1 acc 66.406 (67.669)	Top-5 acc 87.891 (86.331)	lr 0.00011
Train [115][2770/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.015)	Loss 2.4351 (2.3453)	Entropy 0.53254 (0.53218)	Top-1 acc 64.062 (67.665)	Top-5 acc 87.500 (86.331)	lr 0.00011
Train [115][2780/3239]	Time 0.409 (0.529)	Data Time 0.001 (0.015)	Loss 2.9456 (2.3454)	Entropy 0.53253 (0.53218)	Top-1 acc 53.125 (67.661)	Top-5 acc 73.828 (86.325)	lr 0.00011
Train [115][2790/3239]	Time 0.240 (0.528)	Data Time 0.001 (0.015)	Loss 2.4542 (2.3452)	Entropy 0.53244 (0.53218)	Top-1 acc 64.062 (67.667)	Top-5 acc 84.375 (86.328)	lr 0.00011
Train [115][2800/3239]	Time 0.278 (0.528)	Data Time 0.001 (0.015)	Loss 2.3027 (2.3450)	Entropy 0.53227 (0.53218)	Top-1 acc 66.797 (67.670)	Top-5 acc 85.938 (86.331)	lr 0.00011
Train [115][2810/3239]	Time 0.240 (0.528)	Data Time 0.001 (0.015)	Loss 2.2499 (2.3449)	Entropy 0.53216 (0.53218)	Top-1 acc 67.969 (67.675)	Top-5 acc 88.281 (86.330)	lr 0.00011
Train [115][2820/3239]	Time 0.264 (0.527)	Data Time 0.002 (0.015)	Loss 2.3446 (2.3451)	Entropy 0.53200 (0.53218)	Top-1 acc 66.797 (67.671)	Top-5 acc 86.719 (86.329)	lr 0.00011
Train [115][2830/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.015)	Loss 2.4297 (2.3450)	Entropy 0.53184 (0.53218)	Top-1 acc 66.016 (67.671)	Top-5 acc 86.719 (86.330)	lr 0.00011
Train [115][2840/3239]	Time 0.243 (0.527)	Data Time 0.001 (0.015)	Loss 2.2882 (2.3450)	Entropy 0.53184 (0.53218)	Top-1 acc 68.750 (67.669)	Top-5 acc 87.891 (86.331)	lr 0.00011
Train [115][2850/3239]	Time 0.280 (0.526)	Data Time 0.001 (0.015)	Loss 2.2545 (2.3451)	Entropy 0.53195 (0.53218)	Top-1 acc 70.703 (67.666)	Top-5 acc 89.844 (86.330)	lr 0.00011
Train [115][2860/3239]	Time 0.253 (0.526)	Data Time 0.001 (0.014)	Loss 2.3654 (2.3451)	Entropy 0.53196 (0.53218)	Top-1 acc 69.141 (67.667)	Top-5 acc 83.594 (86.329)	lr 0.00011
Train [115][2870/3239]	Time 0.384 (0.526)	Data Time 0.001 (0.014)	Loss 2.3905 (2.3453)	Entropy 0.53225 (0.53218)	Top-1 acc 68.750 (67.660)	Top-5 acc 84.766 (86.324)	lr 0.00011
Train [115][2880/3239]	Time 0.263 (0.525)	Data Time 0.001 (0.014)	Loss 2.2502 (2.3454)	Entropy 0.53210 (0.53218)	Top-1 acc 67.969 (67.656)	Top-5 acc 85.938 (86.324)	lr 0.00011
Train [115][2890/3239]	Time 0.249 (0.525)	Data Time 0.001 (0.014)	Loss 2.3540 (2.3453)	Entropy 0.53223 (0.53218)	Top-1 acc 67.188 (67.657)	Top-5 acc 83.984 (86.327)	lr 0.00011
Train [115][2900/3239]	Time 0.260 (0.525)	Data Time 0.001 (0.014)	Loss 2.3087 (2.3455)	Entropy 0.53181 (0.53218)	Top-1 acc 66.797 (67.654)	Top-5 acc 88.672 (86.324)	lr 0.00011
Train [115][2910/3239]	Time 0.269 (0.525)	Data Time 0.001 (0.014)	Loss 2.4415 (2.3453)	Entropy 0.53174 (0.53218)	Top-1 acc 66.406 (67.656)	Top-5 acc 86.719 (86.328)	lr 0.00011
Train [115][2920/3239]	Time 0.243 (0.524)	Data Time 0.001 (0.014)	Loss 2.3060 (2.3450)	Entropy 0.53208 (0.53218)	Top-1 acc 69.141 (67.665)	Top-5 acc 88.281 (86.334)	lr 0.00011
Train [115][2930/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.014)	Loss 2.5056 (2.3448)	Entropy 0.53156 (0.53217)	Top-1 acc 65.625 (67.666)	Top-5 acc 83.594 (86.335)	lr 0.00011
Train [115][2940/3239]	Time 0.327 (0.523)	Data Time 0.001 (0.014)	Loss 2.1084 (2.3447)	Entropy 0.53175 (0.53217)	Top-1 acc 74.219 (67.674)	Top-5 acc 91.406 (86.338)	lr 0.00011
Train [115][2950/3239]	Time 0.238 (0.523)	Data Time 0.001 (0.014)	Loss 2.3028 (2.3446)	Entropy 0.53167 (0.53217)	Top-1 acc 66.406 (67.678)	Top-5 acc 87.109 (86.339)	lr 0.00011
Train [115][2960/3239]	Time 0.231 (0.523)	Data Time 0.001 (0.014)	Loss 2.3236 (2.3445)	Entropy 0.53169 (0.53217)	Top-1 acc 67.578 (67.675)	Top-5 acc 87.109 (86.339)	lr 0.00011
Train [115][2970/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.014)	Loss 2.2762 (2.3445)	Entropy 0.53189 (0.53217)	Top-1 acc 69.922 (67.679)	Top-5 acc 85.547 (86.339)	lr 0.00011
Train [115][2980/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.014)	Loss 2.2903 (2.3445)	Entropy 0.53192 (0.53217)	Top-1 acc 71.484 (67.680)	Top-5 acc 87.891 (86.339)	lr 0.00011
Train [115][2990/3239]	Time 0.264 (0.522)	Data Time 0.001 (0.014)	Loss 2.2796 (2.3444)	Entropy 0.53201 (0.53217)	Top-1 acc 70.703 (67.682)	Top-5 acc 87.500 (86.342)	lr 0.00011
Train [115][3000/3239]	Time 0.229 (0.521)	Data Time 0.001 (0.014)	Loss 2.2586 (2.3443)	Entropy 0.53209 (0.53217)	Top-1 acc 70.312 (67.681)	Top-5 acc 89.844 (86.343)	lr 0.00011
Train [115][3010/3239]	Time 0.232 (0.521)	Data Time 0.001 (0.014)	Loss 2.3849 (2.3445)	Entropy 0.53249 (0.53217)	Top-1 acc 66.797 (67.673)	Top-5 acc 85.938 (86.343)	lr 0.00011
Train [115][3020/3239]	Time 0.226 (0.521)	Data Time 0.001 (0.014)	Loss 2.2803 (2.3443)	Entropy 0.53251 (0.53217)	Top-1 acc 69.531 (67.677)	Top-5 acc 88.672 (86.345)	lr 0.00011
Train [115][3030/3239]	Time 0.278 (0.520)	Data Time 0.002 (0.014)	Loss 2.2085 (2.3442)	Entropy 0.53238 (0.53217)	Top-1 acc 66.797 (67.679)	Top-5 acc 89.062 (86.347)	lr 0.00011
Train [115][3040/3239]	Time 0.226 (0.520)	Data Time 0.001 (0.014)	Loss 2.2768 (2.3442)	Entropy 0.53243 (0.53217)	Top-1 acc 66.406 (67.682)	Top-5 acc 87.891 (86.347)	lr 0.00011
Train [115][3050/3239]	Time 0.226 (0.520)	Data Time 0.001 (0.014)	Loss 2.3962 (2.3443)	Entropy 0.53222 (0.53217)	Top-1 acc 67.578 (67.680)	Top-5 acc 85.547 (86.346)	lr 0.00011
Train [115][3060/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.014)	Loss 2.3067 (2.3442)	Entropy 0.53211 (0.53217)	Top-1 acc 64.844 (67.683)	Top-5 acc 86.719 (86.348)	lr 0.00011
Train [115][3070/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.014)	Loss 2.2883 (2.3443)	Entropy 0.53189 (0.53217)	Top-1 acc 68.750 (67.679)	Top-5 acc 85.156 (86.347)	lr 0.00011
Train [115][3080/3239]	Time 0.260 (0.519)	Data Time 0.001 (0.014)	Loss 2.3254 (2.3442)	Entropy 0.53190 (0.53217)	Top-1 acc 66.016 (67.681)	Top-5 acc 85.938 (86.347)	lr 0.00011
Train [115][3090/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.014)	Loss 2.2555 (2.3442)	Entropy 0.53186 (0.53217)	Top-1 acc 67.578 (67.681)	Top-5 acc 88.672 (86.346)	lr 0.00011
Train [115][3100/3239]	Time 0.329 (0.518)	Data Time 0.001 (0.014)	Loss 2.5124 (2.3440)	Entropy 0.53174 (0.53217)	Top-1 acc 60.547 (67.684)	Top-5 acc 83.203 (86.349)	lr 0.00011
Train [115][3110/3239]	Time 0.226 (0.517)	Data Time 0.001 (0.013)	Loss 2.3015 (2.3438)	Entropy 0.53172 (0.53217)	Top-1 acc 69.922 (67.687)	Top-5 acc 85.938 (86.351)	lr 0.00011
Train [115][3120/3239]	Time 0.231 (0.517)	Data Time 0.001 (0.013)	Loss 2.2279 (2.3438)	Entropy 0.53180 (0.53216)	Top-1 acc 69.141 (67.688)	Top-5 acc 87.891 (86.353)	lr 0.00011
Train [115][3130/3239]	Time 0.238 (0.517)	Data Time 0.001 (0.013)	Loss 2.3661 (2.3442)	Entropy 0.53175 (0.53216)	Top-1 acc 69.922 (67.679)	Top-5 acc 84.766 (86.345)	lr 0.00011
Train [115][3140/3239]	Time 0.222 (0.516)	Data Time 0.001 (0.013)	Loss 2.2622 (2.3440)	Entropy 0.53164 (0.53216)	Top-1 acc 67.969 (67.681)	Top-5 acc 87.500 (86.346)	lr 0.00011
Train [115][3150/3239]	Time 0.240 (0.516)	Data Time 0.001 (0.013)	Loss 2.6680 (2.3440)	Entropy 0.53146 (0.53216)	Top-1 acc 59.766 (67.684)	Top-5 acc 79.297 (86.347)	lr 0.00011
Train [115][3160/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.013)	Loss 2.6321 (2.3444)	Entropy 0.53148 (0.53216)	Top-1 acc 58.203 (67.677)	Top-5 acc 83.203 (86.341)	lr 0.00011
Train [115][3170/3239]	Time 0.325 (0.515)	Data Time 0.001 (0.013)	Loss 2.5740 (2.3444)	Entropy 0.53136 (0.53216)	Top-1 acc 58.984 (67.676)	Top-5 acc 81.641 (86.340)	lr 0.00011
Train [115][3180/3239]	Time 0.226 (0.515)	Data Time 0.000 (0.013)	Loss 2.1617 (2.3444)	Entropy 0.53137 (0.53215)	Top-1 acc 72.656 (67.675)	Top-5 acc 91.797 (86.341)	lr 0.00011
Train [115][3190/3239]	Time 0.223 (0.515)	Data Time 0.000 (0.013)	Loss 2.3146 (2.3444)	Entropy 0.53179 (0.53215)	Top-1 acc 66.797 (67.674)	Top-5 acc 85.547 (86.341)	lr 0.00011
Train [115][3200/3239]	Time 0.218 (0.514)	Data Time 0.000 (0.013)	Loss 2.3627 (2.3443)	Entropy 0.53155 (0.53215)	Top-1 acc 64.453 (67.673)	Top-5 acc 87.500 (86.343)	lr 0.00011
Train [115][3210/3239]	Time 0.220 (0.514)	Data Time 0.000 (0.013)	Loss 2.2453 (2.3441)	Entropy 0.53180 (0.53215)	Top-1 acc 71.875 (67.680)	Top-5 acc 89.844 (86.346)	lr 0.00011
Train [115][3220/3239]	Time 0.229 (0.513)	Data Time 0.000 (0.013)	Loss 2.0903 (2.3441)	Entropy 0.53211 (0.53215)	Top-1 acc 73.438 (67.682)	Top-5 acc 90.234 (86.348)	lr 0.00011
Train [115][3230/3239]	Time 0.223 (0.513)	Data Time 0.000 (0.013)	Loss 2.4592 (2.3440)	Entropy 0.53237 (0.53215)	Top-1 acc 62.109 (67.682)	Top-5 acc 84.766 (86.349)	lr 0.00011
Train [115][3239/3239]	Time 0.885 (0.513)	Data Time 0.000 (0.013)	Loss 2.8148 (2.3440)	Entropy 0.53254 (0.53215)	Top-1 acc 58.025 (67.685)	Top-5 acc 80.247 (86.348)	lr 0.00011
==========Valid [115/120]	loss 1.168	top-1 acc 73.116 (73.154)	top-5 acc 90.671	Train top-1 67.685	top-5 86.348	Entropy 0.53254	Latency-None: 0.000ms	Flops: 539.00M
Train [116][0/3239]	Time 38.205 (38.205)	Data Time 36.546 (36.546)	Loss 2.2709 (2.2709)	Entropy 0.53250 (0.53250)	Top-1 acc 68.750 (68.750)	Top-5 acc 88.281 (88.281)	lr 0.00011
Train [116][10/3239]	Time 0.375 (4.021)	Data Time 0.001 (3.383)	Loss 2.3910 (2.3015)	Entropy 0.53257 (0.53255)	Top-1 acc 65.625 (68.146)	Top-5 acc 85.547 (87.145)	lr 0.00011
Train [116][20/3239]	Time 0.243 (2.298)	Data Time 0.001 (1.773)	Loss 2.3637 (2.3311)	Entropy 0.53283 (0.53259)	Top-1 acc 67.188 (67.485)	Top-5 acc 82.812 (86.272)	lr 0.00011
Train [116][30/3239]	Time 0.234 (1.689)	Data Time 0.001 (1.201)	Loss 2.3082 (2.3353)	Entropy 0.53270 (0.53266)	Top-1 acc 71.094 (67.566)	Top-5 acc 85.547 (86.379)	lr 0.00011
Train [116][40/3239]	Time 0.237 (1.381)	Data Time 0.001 (0.909)	Loss 2.2793 (2.3432)	Entropy 0.53273 (0.53267)	Top-1 acc 69.531 (67.597)	Top-5 acc 87.109 (86.290)	lr 0.00011
Train [116][50/3239]	Time 0.233 (1.194)	Data Time 0.001 (0.731)	Loss 2.1544 (2.3346)	Entropy 0.53259 (0.53268)	Top-1 acc 75.781 (67.907)	Top-5 acc 86.328 (86.497)	lr 0.00011
Train [116][60/3239]	Time 0.232 (1.065)	Data Time 0.001 (0.612)	Loss 2.3747 (2.3379)	Entropy 0.53280 (0.53268)	Top-1 acc 67.578 (67.719)	Top-5 acc 84.375 (86.405)	lr 0.00011
Train [116][70/3239]	Time 0.226 (1.697)	Data Time 0.002 (0.527)	Loss 2.6475 (2.3415)	Entropy 0.53309 (0.53270)	Top-1 acc 55.078 (67.490)	Top-5 acc 83.594 (86.449)	lr 0.00011
Train [116][80/3239]	Time 0.242 (1.539)	Data Time 0.002 (0.462)	Loss 2.3346 (2.3433)	Entropy 0.53340 (0.53277)	Top-1 acc 64.844 (67.491)	Top-5 acc 85.547 (86.343)	lr 0.00011
Train [116][90/3239]	Time 0.353 (1.421)	Data Time 0.003 (0.411)	Loss 2.3641 (2.3510)	Entropy 0.53369 (0.53285)	Top-1 acc 68.750 (67.333)	Top-5 acc 86.328 (86.208)	lr 0.00011
Train [116][100/3239]	Time 0.243 (1.325)	Data Time 0.001 (0.371)	Loss 2.4214 (2.3609)	Entropy 0.53315 (0.53291)	Top-1 acc 66.016 (66.986)	Top-5 acc 85.938 (86.050)	lr 0.00011
Train [116][110/3239]	Time 0.234 (1.243)	Data Time 0.001 (0.338)	Loss 2.3491 (2.3570)	Entropy 0.53346 (0.53294)	Top-1 acc 71.484 (67.089)	Top-5 acc 85.938 (86.149)	lr 0.00011
Train [116][120/3239]	Time 0.225 (1.174)	Data Time 0.001 (0.310)	Loss 2.5053 (2.3584)	Entropy 0.53365 (0.53298)	Top-1 acc 59.766 (67.042)	Top-5 acc 85.156 (86.089)	lr 0.00011
Train [116][130/3239]	Time 0.224 (1.116)	Data Time 0.001 (0.286)	Loss 2.3868 (2.3577)	Entropy 0.53364 (0.53304)	Top-1 acc 66.797 (67.062)	Top-5 acc 83.594 (86.084)	lr 0.00011
Train [116][140/3239]	Time 0.261 (1.066)	Data Time 0.001 (0.266)	Loss 2.2956 (2.3536)	Entropy 0.53356 (0.53307)	Top-1 acc 70.703 (67.240)	Top-5 acc 86.719 (86.098)	lr 0.00011
Train [116][150/3239]	Time 0.232 (1.022)	Data Time 0.001 (0.249)	Loss 2.1907 (2.3502)	Entropy 0.53351 (0.53311)	Top-1 acc 73.438 (67.348)	Top-5 acc 91.016 (86.181)	lr 0.00010
Train [116][160/3239]	Time 0.320 (0.984)	Data Time 0.001 (0.233)	Loss 2.3918 (2.3524)	Entropy 0.53294 (0.53312)	Top-1 acc 65.234 (67.297)	Top-5 acc 85.938 (86.149)	lr 0.00010
Train [116][170/3239]	Time 0.229 (0.950)	Data Time 0.001 (0.220)	Loss 2.2132 (2.3481)	Entropy 0.53318 (0.53311)	Top-1 acc 71.094 (67.370)	Top-5 acc 87.109 (86.202)	lr 0.00010
Train [116][180/3239]	Time 0.234 (0.921)	Data Time 0.001 (0.208)	Loss 2.2027 (2.3484)	Entropy 0.53332 (0.53312)	Top-1 acc 70.703 (67.354)	Top-5 acc 88.672 (86.237)	lr 0.00010
Train [116][190/3239]	Time 0.316 (0.900)	Data Time 0.002 (0.197)	Loss 2.2192 (2.3467)	Entropy 0.53305 (0.53313)	Top-1 acc 68.359 (67.384)	Top-5 acc 89.453 (86.275)	lr 0.00010
Train [116][200/3239]	Time 0.224 (0.878)	Data Time 0.001 (0.187)	Loss 2.4995 (2.3448)	Entropy 0.53303 (0.53312)	Top-1 acc 61.719 (67.413)	Top-5 acc 83.984 (86.303)	lr 0.00010
Train [116][210/3239]	Time 0.234 (0.856)	Data Time 0.001 (0.178)	Loss 2.5416 (2.3468)	Entropy 0.53311 (0.53312)	Top-1 acc 62.500 (67.393)	Top-5 acc 85.938 (86.278)	lr 0.00010
Train [116][220/3239]	Time 0.231 (0.835)	Data Time 0.001 (0.170)	Loss 2.4898 (2.3472)	Entropy 0.53347 (0.53313)	Top-1 acc 61.719 (67.393)	Top-5 acc 85.938 (86.261)	lr 0.00010
Train [116][230/3239]	Time 0.230 (0.817)	Data Time 0.001 (0.163)	Loss 2.4396 (2.3470)	Entropy 0.53324 (0.53314)	Top-1 acc 67.188 (67.406)	Top-5 acc 83.984 (86.245)	lr 0.00010
Train [116][240/3239]	Time 0.259 (0.800)	Data Time 0.001 (0.156)	Loss 2.2267 (2.3469)	Entropy 0.53336 (0.53314)	Top-1 acc 70.703 (67.397)	Top-5 acc 88.281 (86.241)	lr 0.00010
Train [116][250/3239]	Time 0.359 (0.785)	Data Time 0.001 (0.150)	Loss 2.1908 (2.3457)	Entropy 0.53316 (0.53315)	Top-1 acc 72.656 (67.429)	Top-5 acc 87.891 (86.288)	lr 0.00010
Train [116][260/3239]	Time 0.240 (0.771)	Data Time 0.001 (0.144)	Loss 2.4803 (2.3492)	Entropy 0.53300 (0.53315)	Top-1 acc 66.797 (67.354)	Top-5 acc 83.594 (86.229)	lr 0.00010
Train [116][270/3239]	Time 0.216 (0.757)	Data Time 0.001 (0.139)	Loss 2.6100 (2.3487)	Entropy 0.53313 (0.53315)	Top-1 acc 62.109 (67.378)	Top-5 acc 82.422 (86.236)	lr 0.00010
Train [116][280/3239]	Time 0.235 (0.745)	Data Time 0.001 (0.134)	Loss 2.2414 (2.3490)	Entropy 0.53273 (0.53315)	Top-1 acc 70.312 (67.378)	Top-5 acc 85.938 (86.235)	lr 0.00010
Train [116][290/3239]	Time 0.220 (0.733)	Data Time 0.001 (0.130)	Loss 2.3055 (2.3490)	Entropy 0.53267 (0.53313)	Top-1 acc 71.484 (67.385)	Top-5 acc 88.672 (86.241)	lr 0.00010
Train [116][300/3239]	Time 0.269 (0.723)	Data Time 0.003 (0.125)	Loss 2.1354 (2.3479)	Entropy 0.53259 (0.53311)	Top-1 acc 73.828 (67.425)	Top-5 acc 91.406 (86.259)	lr 0.00010
Train [116][310/3239]	Time 0.218 (0.714)	Data Time 0.001 (0.121)	Loss 2.5116 (2.3490)	Entropy 0.53251 (0.53309)	Top-1 acc 63.672 (67.417)	Top-5 acc 83.984 (86.244)	lr 0.00010
Train [116][320/3239]	Time 0.366 (0.705)	Data Time 0.001 (0.118)	Loss 2.3072 (2.3484)	Entropy 0.53195 (0.53307)	Top-1 acc 69.141 (67.441)	Top-5 acc 87.500 (86.258)	lr 0.00010
Train [116][330/3239]	Time 0.225 (0.697)	Data Time 0.001 (0.114)	Loss 2.3702 (2.3512)	Entropy 0.53194 (0.53304)	Top-1 acc 67.188 (67.380)	Top-5 acc 87.109 (86.189)	lr 0.00010
Train [116][340/3239]	Time 0.250 (0.689)	Data Time 0.001 (0.111)	Loss 2.2920 (2.3504)	Entropy 0.53214 (0.53301)	Top-1 acc 68.750 (67.380)	Top-5 acc 87.891 (86.224)	lr 0.00010
Train [116][350/3239]	Time 0.230 (0.681)	Data Time 0.001 (0.108)	Loss 2.6110 (2.3534)	Entropy 0.53252 (0.53299)	Top-1 acc 58.984 (67.318)	Top-5 acc 79.297 (86.185)	lr 0.00010
Train [116][360/3239]	Time 0.235 (0.674)	Data Time 0.001 (0.105)	Loss 2.6176 (2.3533)	Entropy 0.53262 (0.53298)	Top-1 acc 60.547 (67.309)	Top-5 acc 82.422 (86.184)	lr 0.00010
Train [116][370/3239]	Time 0.268 (0.668)	Data Time 0.028 (0.102)	Loss 2.4768 (2.3523)	Entropy 0.53276 (0.53297)	Top-1 acc 66.016 (67.353)	Top-5 acc 82.031 (86.195)	lr 0.00010
Train [116][380/3239]	Time 0.224 (0.662)	Data Time 0.001 (0.100)	Loss 2.7709 (2.3529)	Entropy 0.53262 (0.53296)	Top-1 acc 58.594 (67.355)	Top-5 acc 79.297 (86.186)	lr 0.00010
Train [116][390/3239]	Time 0.316 (0.655)	Data Time 0.001 (0.097)	Loss 2.2267 (2.3518)	Entropy 0.53264 (0.53295)	Top-1 acc 72.656 (67.390)	Top-5 acc 85.938 (86.191)	lr 0.00010
Train [116][400/3239]	Time 0.220 (0.649)	Data Time 0.001 (0.095)	Loss 2.2688 (2.3519)	Entropy 0.53266 (0.53295)	Top-1 acc 71.484 (67.396)	Top-5 acc 86.328 (86.191)	lr 0.00010
Train [116][410/3239]	Time 0.229 (0.643)	Data Time 0.001 (0.092)	Loss 2.0821 (2.3505)	Entropy 0.53238 (0.53294)	Top-1 acc 75.000 (67.457)	Top-5 acc 90.234 (86.190)	lr 0.00010
Train [116][420/3239]	Time 0.234 (0.637)	Data Time 0.001 (0.090)	Loss 2.1732 (2.3511)	Entropy 0.53187 (0.53292)	Top-1 acc 69.531 (67.423)	Top-5 acc 88.281 (86.181)	lr 0.00010
Train [116][430/3239]	Time 0.218 (0.632)	Data Time 0.001 (0.088)	Loss 2.3782 (2.3505)	Entropy 0.53194 (0.53290)	Top-1 acc 67.578 (67.421)	Top-5 acc 86.328 (86.202)	lr 0.00010
Train [116][440/3239]	Time 0.236 (0.626)	Data Time 0.001 (0.086)	Loss 2.2790 (2.3501)	Entropy 0.53232 (0.53288)	Top-1 acc 67.578 (67.442)	Top-5 acc 85.547 (86.204)	lr 0.00010
Train [116][450/3239]	Time 0.227 (0.621)	Data Time 0.001 (0.084)	Loss 2.1065 (2.3497)	Entropy 0.53215 (0.53287)	Top-1 acc 71.875 (67.430)	Top-5 acc 91.016 (86.220)	lr 0.00010
Train [116][460/3239]	Time 0.229 (0.617)	Data Time 0.001 (0.083)	Loss 2.2326 (2.3515)	Entropy 0.53216 (0.53285)	Top-1 acc 67.969 (67.384)	Top-5 acc 89.453 (86.208)	lr 0.00010
Train [116][470/3239]	Time 0.258 (0.613)	Data Time 0.001 (0.081)	Loss 2.3422 (2.3527)	Entropy 0.53216 (0.53284)	Top-1 acc 67.188 (67.345)	Top-5 acc 85.547 (86.181)	lr 0.00010
Train [116][480/3239]	Time 0.328 (0.609)	Data Time 0.001 (0.079)	Loss 2.2966 (2.3523)	Entropy 0.53215 (0.53282)	Top-1 acc 68.750 (67.376)	Top-5 acc 89.062 (86.188)	lr 0.00010
Train [116][490/3239]	Time 0.232 (0.605)	Data Time 0.001 (0.078)	Loss 2.2724 (2.3518)	Entropy 0.53218 (0.53281)	Top-1 acc 73.047 (67.396)	Top-5 acc 86.719 (86.187)	lr 0.00010
Train [116][500/3239]	Time 0.234 (0.601)	Data Time 0.001 (0.076)	Loss 2.2240 (2.3505)	Entropy 0.53212 (0.53279)	Top-1 acc 71.094 (67.434)	Top-5 acc 87.109 (86.219)	lr 0.00010
Train [116][510/3239]	Time 0.242 (0.597)	Data Time 0.002 (0.075)	Loss 2.2278 (2.3499)	Entropy 0.53246 (0.53278)	Top-1 acc 67.578 (67.444)	Top-5 acc 89.062 (86.223)	lr 0.00010
Train [116][520/3239]	Time 0.221 (0.594)	Data Time 0.001 (0.073)	Loss 2.4104 (2.3508)	Entropy 0.53241 (0.53278)	Top-1 acc 65.234 (67.436)	Top-5 acc 86.328 (86.212)	lr 0.00010
Train [116][530/3239]	Time 0.253 (0.590)	Data Time 0.001 (0.072)	Loss 2.2833 (2.3512)	Entropy 0.53208 (0.53277)	Top-1 acc 69.141 (67.427)	Top-5 acc 88.281 (86.215)	lr 0.00010
Train [116][540/3239]	Time 0.242 (0.587)	Data Time 0.001 (0.071)	Loss 2.1925 (2.3508)	Entropy 0.53194 (0.53275)	Top-1 acc 70.312 (67.437)	Top-5 acc 89.453 (86.226)	lr 0.00010
Train [116][550/3239]	Time 0.322 (0.583)	Data Time 0.001 (0.069)	Loss 2.2159 (2.3493)	Entropy 0.53207 (0.53274)	Top-1 acc 71.484 (67.480)	Top-5 acc 87.109 (86.247)	lr 0.00010
Train [116][560/3239]	Time 0.231 (0.580)	Data Time 0.001 (0.068)	Loss 2.5218 (2.3499)	Entropy 0.53228 (0.53273)	Top-1 acc 60.156 (67.461)	Top-5 acc 83.594 (86.242)	lr 0.00010
Train [116][570/3239]	Time 0.222 (0.577)	Data Time 0.001 (0.067)	Loss 2.2615 (2.3498)	Entropy 0.53222 (0.53272)	Top-1 acc 69.531 (67.468)	Top-5 acc 87.500 (86.236)	lr 0.00010
Train [116][580/3239]	Time 0.244 (0.574)	Data Time 0.001 (0.066)	Loss 2.3797 (2.3496)	Entropy 0.53215 (0.53271)	Top-1 acc 66.016 (67.475)	Top-5 acc 85.156 (86.230)	lr 0.00010
Train [116][590/3239]	Time 0.228 (0.571)	Data Time 0.001 (0.065)	Loss 2.7509 (2.3499)	Entropy 0.53233 (0.53271)	Top-1 acc 57.812 (67.469)	Top-5 acc 78.125 (86.211)	lr 0.00010
Train [116][600/3239]	Time 0.246 (0.568)	Data Time 0.001 (0.064)	Loss 2.5175 (2.3500)	Entropy 0.53187 (0.53270)	Top-1 acc 61.719 (67.447)	Top-5 acc 84.766 (86.221)	lr 0.00010
Train [116][610/3239]	Time 0.231 (0.565)	Data Time 0.001 (0.063)	Loss 2.3811 (2.3504)	Entropy 0.53165 (0.53269)	Top-1 acc 69.141 (67.457)	Top-5 acc 83.594 (86.202)	lr 0.00010
Train [116][620/3239]	Time 0.252 (0.563)	Data Time 0.001 (0.062)	Loss 2.3378 (2.3494)	Entropy 0.53170 (0.53267)	Top-1 acc 68.750 (67.473)	Top-5 acc 86.328 (86.214)	lr 0.00010
Train [116][630/3239]	Time 0.269 (0.561)	Data Time 0.001 (0.061)	Loss 2.1881 (2.3488)	Entropy 0.53187 (0.53265)	Top-1 acc 71.094 (67.470)	Top-5 acc 89.062 (86.215)	lr 0.00010
Train [116][640/3239]	Time 0.250 (0.559)	Data Time 0.001 (0.060)	Loss 2.2942 (2.3492)	Entropy 0.53192 (0.53264)	Top-1 acc 67.578 (67.464)	Top-5 acc 88.672 (86.212)	lr 0.00010
Train [116][650/3239]	Time 0.236 (0.556)	Data Time 0.001 (0.059)	Loss 2.4700 (2.3491)	Entropy 0.53215 (0.53263)	Top-1 acc 65.234 (67.477)	Top-5 acc 83.984 (86.211)	lr 0.00010
Train [116][660/3239]	Time 0.238 (0.554)	Data Time 0.001 (0.058)	Loss 2.3901 (2.3494)	Entropy 0.53235 (0.53263)	Top-1 acc 67.969 (67.479)	Top-5 acc 85.156 (86.192)	lr 0.00010
Train [116][670/3239]	Time 0.230 (0.552)	Data Time 0.001 (0.057)	Loss 2.3172 (2.3497)	Entropy 0.53251 (0.53262)	Top-1 acc 66.016 (67.468)	Top-5 acc 87.500 (86.186)	lr 0.00010
Train [116][680/3239]	Time 0.242 (0.550)	Data Time 0.001 (0.056)	Loss 2.2109 (2.3495)	Entropy 0.53262 (0.53262)	Top-1 acc 71.094 (67.477)	Top-5 acc 89.453 (86.181)	lr 0.00010
Train [116][690/3239]	Time 0.228 (0.549)	Data Time 0.002 (0.056)	Loss 2.4097 (2.3502)	Entropy 0.53287 (0.53262)	Top-1 acc 64.844 (67.462)	Top-5 acc 83.594 (86.169)	lr 0.00010
Train [116][700/3239]	Time 0.237 (0.547)	Data Time 0.001 (0.055)	Loss 2.3463 (2.3499)	Entropy 0.53305 (0.53263)	Top-1 acc 66.797 (67.480)	Top-5 acc 84.375 (86.170)	lr 0.00010
Train [116][710/3239]	Time 0.324 (0.545)	Data Time 0.001 (0.054)	Loss 2.3131 (2.3494)	Entropy 0.53257 (0.53263)	Top-1 acc 69.922 (67.500)	Top-5 acc 86.328 (86.181)	lr 0.00010
Train [116][720/3239]	Time 0.393 (0.612)	Data Time 0.005 (0.053)	Loss 2.1858 (2.3488)	Entropy 0.53249 (0.53263)	Top-1 acc 71.875 (67.511)	Top-5 acc 88.281 (86.192)	lr 0.00010
Train [116][730/3239]	Time 0.283 (0.610)	Data Time 0.002 (0.053)	Loss 2.3220 (2.3486)	Entropy 0.53261 (0.53263)	Top-1 acc 69.141 (67.515)	Top-5 acc 85.156 (86.187)	lr 0.00010
Train [116][740/3239]	Time 0.248 (0.608)	Data Time 0.001 (0.052)	Loss 2.3079 (2.3475)	Entropy 0.53278 (0.53263)	Top-1 acc 69.531 (67.543)	Top-5 acc 86.328 (86.195)	lr 0.00010
Train [116][750/3239]	Time 0.228 (0.605)	Data Time 0.001 (0.051)	Loss 2.2406 (2.3469)	Entropy 0.53311 (0.53263)	Top-1 acc 69.922 (67.556)	Top-5 acc 89.453 (86.203)	lr 0.00010
Train [116][760/3239]	Time 0.263 (0.603)	Data Time 0.002 (0.051)	Loss 2.3815 (2.3470)	Entropy 0.53319 (0.53264)	Top-1 acc 67.188 (67.555)	Top-5 acc 84.375 (86.200)	lr 0.00010
Train [116][770/3239]	Time 0.245 (0.601)	Data Time 0.001 (0.050)	Loss 2.0101 (2.3466)	Entropy 0.53315 (0.53265)	Top-1 acc 77.734 (67.569)	Top-5 acc 90.625 (86.211)	lr 0.00010
Train [116][780/3239]	Time 0.277 (0.599)	Data Time 0.001 (0.049)	Loss 2.5889 (2.3470)	Entropy 0.53355 (0.53265)	Top-1 acc 61.719 (67.561)	Top-5 acc 82.422 (86.203)	lr 0.00010
Train [116][790/3239]	Time 0.226 (0.596)	Data Time 0.001 (0.049)	Loss 2.3212 (2.3468)	Entropy 0.53318 (0.53266)	Top-1 acc 66.406 (67.560)	Top-5 acc 88.672 (86.210)	lr 0.00010
Train [116][800/3239]	Time 0.252 (0.594)	Data Time 0.001 (0.048)	Loss 2.4604 (2.3462)	Entropy 0.53307 (0.53267)	Top-1 acc 66.016 (67.577)	Top-5 acc 84.766 (86.219)	lr 0.00010
Train [116][810/3239]	Time 0.229 (0.592)	Data Time 0.001 (0.048)	Loss 2.8523 (2.3472)	Entropy 0.53301 (0.53268)	Top-1 acc 54.297 (67.546)	Top-5 acc 78.906 (86.202)	lr 0.00010
Train [116][820/3239]	Time 0.250 (0.590)	Data Time 0.001 (0.047)	Loss 2.3268 (2.3463)	Entropy 0.53292 (0.53268)	Top-1 acc 66.797 (67.576)	Top-5 acc 85.547 (86.213)	lr 0.00010
Train [116][830/3239]	Time 0.238 (0.588)	Data Time 0.001 (0.047)	Loss 2.3251 (2.3462)	Entropy 0.53304 (0.53268)	Top-1 acc 66.016 (67.577)	Top-5 acc 86.719 (86.224)	lr 0.00010
Train [116][840/3239]	Time 0.234 (0.586)	Data Time 0.001 (0.046)	Loss 2.5747 (2.3457)	Entropy 0.53279 (0.53269)	Top-1 acc 62.891 (67.589)	Top-5 acc 82.031 (86.229)	lr 0.00010
Train [116][850/3239]	Time 0.272 (0.584)	Data Time 0.001 (0.045)	Loss 2.6414 (2.3469)	Entropy 0.53220 (0.53269)	Top-1 acc 64.062 (67.569)	Top-5 acc 81.250 (86.202)	lr 0.00010
Train [116][860/3239]	Time 0.264 (0.582)	Data Time 0.001 (0.045)	Loss 2.6238 (2.3475)	Entropy 0.53210 (0.53268)	Top-1 acc 61.328 (67.547)	Top-5 acc 82.031 (86.199)	lr 0.00010
Train [116][870/3239]	Time 0.367 (0.580)	Data Time 0.001 (0.044)	Loss 2.3042 (2.3480)	Entropy 0.53225 (0.53267)	Top-1 acc 73.828 (67.541)	Top-5 acc 84.766 (86.190)	lr 0.00010
Train [116][880/3239]	Time 0.238 (0.578)	Data Time 0.001 (0.044)	Loss 2.2880 (2.3474)	Entropy 0.53237 (0.53267)	Top-1 acc 68.750 (67.563)	Top-5 acc 86.328 (86.200)	lr 0.00010
Train [116][890/3239]	Time 0.241 (0.577)	Data Time 0.001 (0.044)	Loss 2.1798 (2.3466)	Entropy 0.53245 (0.53267)	Top-1 acc 70.703 (67.589)	Top-5 acc 89.844 (86.211)	lr 0.00010
Train [116][900/3239]	Time 0.228 (0.575)	Data Time 0.001 (0.043)	Loss 2.3424 (2.3458)	Entropy 0.53280 (0.53266)	Top-1 acc 66.016 (67.599)	Top-5 acc 85.547 (86.226)	lr 0.00010
Train [116][910/3239]	Time 0.233 (0.573)	Data Time 0.001 (0.043)	Loss 2.2303 (2.3453)	Entropy 0.53284 (0.53267)	Top-1 acc 70.703 (67.611)	Top-5 acc 87.891 (86.233)	lr 0.00010
Train [116][920/3239]	Time 0.230 (0.572)	Data Time 0.001 (0.042)	Loss 2.4357 (2.3453)	Entropy 0.53319 (0.53267)	Top-1 acc 62.500 (67.609)	Top-5 acc 85.547 (86.228)	lr 0.00010
Train [116][930/3239]	Time 0.245 (0.570)	Data Time 0.001 (0.042)	Loss 2.3294 (2.3448)	Entropy 0.53288 (0.53267)	Top-1 acc 69.141 (67.625)	Top-5 acc 86.328 (86.244)	lr 0.00010
Train [116][940/3239]	Time 0.316 (0.569)	Data Time 0.001 (0.041)	Loss 2.1479 (2.3444)	Entropy 0.53302 (0.53268)	Top-1 acc 69.922 (67.638)	Top-5 acc 91.016 (86.252)	lr 0.00009
Train [116][950/3239]	Time 0.237 (0.567)	Data Time 0.001 (0.041)	Loss 2.3661 (2.3437)	Entropy 0.53288 (0.53268)	Top-1 acc 70.312 (67.662)	Top-5 acc 83.984 (86.256)	lr 0.00009
Train [116][960/3239]	Time 0.234 (0.566)	Data Time 0.001 (0.040)	Loss 2.2635 (2.3434)	Entropy 0.53309 (0.53268)	Top-1 acc 68.359 (67.666)	Top-5 acc 89.844 (86.265)	lr 0.00009
Train [116][970/3239]	Time 0.228 (0.564)	Data Time 0.001 (0.040)	Loss 2.3320 (2.3432)	Entropy 0.53315 (0.53269)	Top-1 acc 68.359 (67.678)	Top-5 acc 87.500 (86.267)	lr 0.00009
Train [116][980/3239]	Time 0.247 (0.563)	Data Time 0.001 (0.040)	Loss 2.2100 (2.3432)	Entropy 0.53302 (0.53269)	Top-1 acc 73.047 (67.674)	Top-5 acc 86.719 (86.269)	lr 0.00009
Train [116][990/3239]	Time 0.227 (0.561)	Data Time 0.001 (0.039)	Loss 2.2467 (2.3429)	Entropy 0.53276 (0.53269)	Top-1 acc 71.094 (67.685)	Top-5 acc 85.547 (86.270)	lr 0.00009
Train [116][1000/3239]	Time 0.224 (0.560)	Data Time 0.001 (0.039)	Loss 2.3309 (2.3424)	Entropy 0.53234 (0.53269)	Top-1 acc 69.922 (67.705)	Top-5 acc 85.156 (86.281)	lr 0.00009
Train [116][1010/3239]	Time 0.252 (0.558)	Data Time 0.001 (0.039)	Loss 2.3379 (2.3418)	Entropy 0.53226 (0.53269)	Top-1 acc 69.922 (67.715)	Top-5 acc 86.719 (86.287)	lr 0.00009
Train [116][1020/3239]	Time 0.227 (0.557)	Data Time 0.001 (0.038)	Loss 2.4746 (2.3433)	Entropy 0.53236 (0.53268)	Top-1 acc 62.891 (67.679)	Top-5 acc 83.203 (86.263)	lr 0.00009
Train [116][1030/3239]	Time 0.321 (0.555)	Data Time 0.001 (0.038)	Loss 2.3208 (2.3434)	Entropy 0.53243 (0.53268)	Top-1 acc 69.141 (67.683)	Top-5 acc 87.109 (86.266)	lr 0.00009
Train [116][1040/3239]	Time 0.252 (0.554)	Data Time 0.001 (0.038)	Loss 2.4644 (2.3440)	Entropy 0.53258 (0.53268)	Top-1 acc 65.234 (67.673)	Top-5 acc 84.375 (86.256)	lr 0.00009
Train [116][1050/3239]	Time 0.234 (0.553)	Data Time 0.001 (0.037)	Loss 2.3912 (2.3447)	Entropy 0.53267 (0.53268)	Top-1 acc 64.844 (67.660)	Top-5 acc 84.766 (86.251)	lr 0.00009
Train [116][1060/3239]	Time 0.228 (0.551)	Data Time 0.001 (0.037)	Loss 2.7348 (2.3452)	Entropy 0.53260 (0.53268)	Top-1 acc 57.031 (67.639)	Top-5 acc 78.516 (86.239)	lr 0.00009
Train [116][1070/3239]	Time 0.224 (0.550)	Data Time 0.001 (0.037)	Loss 2.3858 (2.3455)	Entropy 0.53313 (0.53268)	Top-1 acc 68.359 (67.633)	Top-5 acc 84.766 (86.234)	lr 0.00009
Train [116][1080/3239]	Time 0.241 (0.549)	Data Time 0.001 (0.036)	Loss 2.4595 (2.3456)	Entropy 0.53324 (0.53268)	Top-1 acc 67.969 (67.637)	Top-5 acc 82.422 (86.236)	lr 0.00009
Train [116][1090/3239]	Time 0.235 (0.547)	Data Time 0.001 (0.036)	Loss 2.1253 (2.3460)	Entropy 0.53302 (0.53269)	Top-1 acc 70.703 (67.629)	Top-5 acc 90.234 (86.231)	lr 0.00009
Train [116][1100/3239]	Time 0.358 (0.546)	Data Time 0.002 (0.036)	Loss 2.4764 (2.3466)	Entropy 0.53321 (0.53269)	Top-1 acc 62.109 (67.607)	Top-5 acc 85.547 (86.227)	lr 0.00009
Train [116][1110/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.035)	Loss 2.1944 (2.3459)	Entropy 0.53325 (0.53269)	Top-1 acc 73.047 (67.623)	Top-5 acc 88.281 (86.235)	lr 0.00009
Train [116][1120/3239]	Time 0.247 (0.544)	Data Time 0.001 (0.035)	Loss 2.2657 (2.3470)	Entropy 0.53321 (0.53270)	Top-1 acc 72.266 (67.598)	Top-5 acc 88.281 (86.221)	lr 0.00009
Train [116][1130/3239]	Time 0.222 (0.543)	Data Time 0.001 (0.035)	Loss 2.1665 (2.3467)	Entropy 0.53321 (0.53270)	Top-1 acc 69.922 (67.600)	Top-5 acc 91.016 (86.224)	lr 0.00009
Train [116][1140/3239]	Time 0.220 (0.541)	Data Time 0.001 (0.034)	Loss 2.1728 (2.3464)	Entropy 0.53291 (0.53271)	Top-1 acc 70.312 (67.606)	Top-5 acc 90.234 (86.233)	lr 0.00009
Train [116][1150/3239]	Time 0.224 (0.540)	Data Time 0.001 (0.034)	Loss 2.3465 (2.3470)	Entropy 0.53311 (0.53271)	Top-1 acc 70.312 (67.592)	Top-5 acc 86.719 (86.232)	lr 0.00009
Train [116][1160/3239]	Time 0.235 (0.539)	Data Time 0.001 (0.034)	Loss 2.3464 (2.3465)	Entropy 0.53289 (0.53271)	Top-1 acc 67.578 (67.604)	Top-5 acc 87.500 (86.250)	lr 0.00009
Train [116][1170/3239]	Time 0.228 (0.538)	Data Time 0.001 (0.034)	Loss 2.1180 (2.3462)	Entropy 0.53242 (0.53271)	Top-1 acc 73.047 (67.616)	Top-5 acc 92.578 (86.258)	lr 0.00009
Train [116][1180/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.033)	Loss 2.3183 (2.3460)	Entropy 0.53221 (0.53271)	Top-1 acc 68.750 (67.618)	Top-5 acc 88.281 (86.264)	lr 0.00009
Train [116][1190/3239]	Time 0.323 (0.535)	Data Time 0.001 (0.033)	Loss 2.2097 (2.3464)	Entropy 0.53212 (0.53271)	Top-1 acc 70.703 (67.611)	Top-5 acc 88.672 (86.258)	lr 0.00009
Train [116][1200/3239]	Time 0.251 (0.534)	Data Time 0.001 (0.033)	Loss 2.5859 (2.3466)	Entropy 0.53191 (0.53270)	Top-1 acc 64.062 (67.614)	Top-5 acc 82.812 (86.251)	lr 0.00009
Train [116][1210/3239]	Time 0.228 (0.534)	Data Time 0.001 (0.032)	Loss 2.3737 (2.3461)	Entropy 0.53220 (0.53269)	Top-1 acc 69.141 (67.621)	Top-5 acc 87.109 (86.263)	lr 0.00009
Train [116][1220/3239]	Time 0.221 (0.532)	Data Time 0.001 (0.032)	Loss 2.3779 (2.3456)	Entropy 0.53183 (0.53269)	Top-1 acc 67.969 (67.629)	Top-5 acc 85.547 (86.276)	lr 0.00009
Train [116][1230/3239]	Time 0.229 (0.531)	Data Time 0.001 (0.032)	Loss 2.2908 (2.3459)	Entropy 0.53161 (0.53268)	Top-1 acc 65.234 (67.612)	Top-5 acc 89.844 (86.274)	lr 0.00009
Train [116][1240/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.032)	Loss 2.3266 (2.3458)	Entropy 0.53178 (0.53267)	Top-1 acc 67.969 (67.620)	Top-5 acc 87.109 (86.279)	lr 0.00009
Train [116][1250/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.031)	Loss 2.2040 (2.3458)	Entropy 0.53146 (0.53266)	Top-1 acc 72.656 (67.623)	Top-5 acc 88.672 (86.280)	lr 0.00009
Train [116][1260/3239]	Time 0.318 (0.528)	Data Time 0.001 (0.031)	Loss 2.4698 (2.3454)	Entropy 0.53147 (0.53265)	Top-1 acc 64.062 (67.630)	Top-5 acc 85.156 (86.289)	lr 0.00009
Train [116][1270/3239]	Time 0.231 (0.527)	Data Time 0.001 (0.031)	Loss 2.3157 (2.3452)	Entropy 0.53142 (0.53264)	Top-1 acc 68.750 (67.632)	Top-5 acc 86.328 (86.295)	lr 0.00009
Train [116][1280/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.031)	Loss 2.4711 (2.3456)	Entropy 0.53115 (0.53263)	Top-1 acc 62.500 (67.618)	Top-5 acc 85.938 (86.295)	lr 0.00009
Train [116][1290/3239]	Time 0.224 (0.526)	Data Time 0.001 (0.031)	Loss 2.3015 (2.3452)	Entropy 0.53090 (0.53262)	Top-1 acc 68.750 (67.627)	Top-5 acc 88.672 (86.306)	lr 0.00009
Train [116][1300/3239]	Time 0.237 (0.525)	Data Time 0.001 (0.030)	Loss 2.4465 (2.3454)	Entropy 0.53097 (0.53261)	Top-1 acc 65.234 (67.625)	Top-5 acc 83.984 (86.302)	lr 0.00009
Train [116][1310/3239]	Time 0.305 (0.524)	Data Time 0.002 (0.030)	Loss 2.4348 (2.3455)	Entropy 0.53139 (0.53260)	Top-1 acc 66.797 (67.628)	Top-5 acc 83.203 (86.297)	lr 0.00009
Train [116][1320/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.030)	Loss 2.2272 (2.3452)	Entropy 0.53127 (0.53259)	Top-1 acc 71.875 (67.639)	Top-5 acc 88.672 (86.301)	lr 0.00009
Train [116][1330/3239]	Time 0.249 (0.523)	Data Time 0.001 (0.030)	Loss 2.3279 (2.3451)	Entropy 0.53140 (0.53258)	Top-1 acc 68.359 (67.648)	Top-5 acc 86.328 (86.301)	lr 0.00009
Train [116][1340/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.029)	Loss 2.2569 (2.3453)	Entropy 0.53161 (0.53257)	Top-1 acc 68.359 (67.644)	Top-5 acc 87.109 (86.299)	lr 0.00009
Train [116][1350/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.029)	Loss 2.3316 (2.3453)	Entropy 0.53146 (0.53256)	Top-1 acc 69.141 (67.637)	Top-5 acc 87.109 (86.301)	lr 0.00009
Train [116][1360/3239]	Time 0.226 (0.520)	Data Time 0.001 (0.029)	Loss 2.2479 (2.3455)	Entropy 0.53162 (0.53256)	Top-1 acc 69.531 (67.632)	Top-5 acc 89.062 (86.299)	lr 0.00009
Train [116][1370/3239]	Time 0.231 (0.519)	Data Time 0.001 (0.029)	Loss 2.4702 (2.3460)	Entropy 0.53165 (0.53255)	Top-1 acc 62.500 (67.621)	Top-5 acc 82.812 (86.285)	lr 0.00009
Train [116][1380/3239]	Time 0.334 (0.554)	Data Time 0.004 (0.029)	Loss 2.1140 (2.3462)	Entropy 0.53149 (0.53254)	Top-1 acc 76.562 (67.620)	Top-5 acc 89.453 (86.282)	lr 0.00009
Train [116][1390/3239]	Time 0.233 (0.554)	Data Time 0.002 (0.029)	Loss 2.2461 (2.3461)	Entropy 0.53155 (0.53254)	Top-1 acc 67.188 (67.626)	Top-5 acc 88.281 (86.284)	lr 0.00009
Train [116][1400/3239]	Time 0.231 (0.553)	Data Time 0.001 (0.028)	Loss 2.4117 (2.3464)	Entropy 0.53137 (0.53253)	Top-1 acc 68.359 (67.617)	Top-5 acc 83.984 (86.277)	lr 0.00009
Train [116][1410/3239]	Time 0.396 (0.552)	Data Time 0.002 (0.028)	Loss 2.2877 (2.3464)	Entropy 0.53127 (0.53252)	Top-1 acc 71.484 (67.623)	Top-5 acc 88.281 (86.274)	lr 0.00009
Train [116][1420/3239]	Time 0.451 (0.553)	Data Time 0.002 (0.028)	Loss 2.2059 (2.3466)	Entropy 0.53097 (0.53251)	Top-1 acc 71.484 (67.612)	Top-5 acc 87.891 (86.267)	lr 0.00009
Train [116][1430/3239]	Time 0.237 (0.552)	Data Time 0.001 (0.028)	Loss 2.4241 (2.3462)	Entropy 0.53118 (0.53250)	Top-1 acc 65.234 (67.616)	Top-5 acc 85.156 (86.274)	lr 0.00009
Train [116][1440/3239]	Time 0.234 (0.551)	Data Time 0.001 (0.028)	Loss 2.2346 (2.3462)	Entropy 0.53070 (0.53249)	Top-1 acc 69.922 (67.615)	Top-5 acc 87.891 (86.271)	lr 0.00009
Train [116][1450/3239]	Time 0.238 (0.550)	Data Time 0.001 (0.027)	Loss 2.3045 (2.3462)	Entropy 0.53106 (0.53248)	Top-1 acc 66.406 (67.618)	Top-5 acc 87.109 (86.273)	lr 0.00009
Train [116][1460/3239]	Time 0.235 (0.549)	Data Time 0.001 (0.027)	Loss 2.4268 (2.3461)	Entropy 0.53107 (0.53247)	Top-1 acc 66.016 (67.625)	Top-5 acc 85.547 (86.278)	lr 0.00009
Train [116][1470/3239]	Time 0.279 (0.548)	Data Time 0.001 (0.027)	Loss 2.2650 (2.3462)	Entropy 0.53106 (0.53246)	Top-1 acc 69.141 (67.617)	Top-5 acc 87.891 (86.274)	lr 0.00009
Train [116][1480/3239]	Time 0.228 (0.547)	Data Time 0.001 (0.027)	Loss 2.5111 (2.3464)	Entropy 0.53121 (0.53245)	Top-1 acc 64.453 (67.614)	Top-5 acc 83.203 (86.275)	lr 0.00009
Train [116][1490/3239]	Time 0.233 (0.546)	Data Time 0.001 (0.027)	Loss 2.3596 (2.3463)	Entropy 0.53109 (0.53244)	Top-1 acc 65.625 (67.612)	Top-5 acc 85.938 (86.280)	lr 0.00009
Train [116][1500/3239]	Time 0.228 (0.545)	Data Time 0.001 (0.027)	Loss 2.1805 (2.3468)	Entropy 0.53079 (0.53243)	Top-1 acc 71.094 (67.608)	Top-5 acc 90.234 (86.273)	lr 0.00009
Train [116][1510/3239]	Time 0.230 (0.544)	Data Time 0.001 (0.026)	Loss 2.3238 (2.3473)	Entropy 0.53095 (0.53242)	Top-1 acc 67.578 (67.590)	Top-5 acc 85.938 (86.259)	lr 0.00009
Train [116][1520/3239]	Time 0.229 (0.543)	Data Time 0.001 (0.026)	Loss 2.1998 (2.3473)	Entropy 0.53054 (0.53241)	Top-1 acc 73.438 (67.595)	Top-5 acc 88.281 (86.265)	lr 0.00009
Train [116][1530/3239]	Time 0.230 (0.542)	Data Time 0.001 (0.026)	Loss 2.2212 (2.3467)	Entropy 0.53084 (0.53240)	Top-1 acc 70.312 (67.607)	Top-5 acc 91.016 (86.273)	lr 0.00009
Train [116][1540/3239]	Time 0.227 (0.542)	Data Time 0.001 (0.026)	Loss 2.1834 (2.3469)	Entropy 0.53068 (0.53239)	Top-1 acc 72.656 (67.602)	Top-5 acc 88.281 (86.268)	lr 0.00009
Train [116][1550/3239]	Time 0.233 (0.541)	Data Time 0.001 (0.026)	Loss 2.5236 (2.3472)	Entropy 0.53069 (0.53238)	Top-1 acc 64.844 (67.593)	Top-5 acc 85.156 (86.265)	lr 0.00009
Train [116][1560/3239]	Time 0.240 (0.540)	Data Time 0.002 (0.026)	Loss 2.4389 (2.3471)	Entropy 0.53052 (0.53236)	Top-1 acc 67.188 (67.596)	Top-5 acc 84.375 (86.270)	lr 0.00009
Train [116][1570/3239]	Time 0.264 (0.539)	Data Time 0.001 (0.025)	Loss 2.1563 (2.3467)	Entropy 0.53050 (0.53235)	Top-1 acc 71.484 (67.604)	Top-5 acc 88.672 (86.278)	lr 0.00009
Train [116][1580/3239]	Time 0.365 (0.539)	Data Time 0.002 (0.025)	Loss 2.4770 (2.3467)	Entropy 0.53014 (0.53234)	Top-1 acc 61.328 (67.607)	Top-5 acc 82.422 (86.279)	lr 0.00009
Train [116][1590/3239]	Time 0.266 (0.538)	Data Time 0.001 (0.025)	Loss 2.3000 (2.3469)	Entropy 0.52966 (0.53233)	Top-1 acc 68.359 (67.599)	Top-5 acc 85.547 (86.276)	lr 0.00009
Train [116][1600/3239]	Time 0.282 (0.537)	Data Time 0.001 (0.025)	Loss 2.2949 (2.3470)	Entropy 0.52936 (0.53231)	Top-1 acc 67.578 (67.591)	Top-5 acc 88.672 (86.275)	lr 0.00009
Train [116][1610/3239]	Time 0.235 (0.537)	Data Time 0.001 (0.025)	Loss 2.5209 (2.3474)	Entropy 0.52928 (0.53229)	Top-1 acc 60.938 (67.582)	Top-5 acc 82.812 (86.267)	lr 0.00009
Train [116][1620/3239]	Time 0.352 (0.537)	Data Time 0.002 (0.025)	Loss 2.7946 (2.3480)	Entropy 0.52917 (0.53227)	Top-1 acc 58.203 (67.567)	Top-5 acc 77.734 (86.262)	lr 0.00009
Train [116][1630/3239]	Time 0.299 (0.537)	Data Time 0.002 (0.025)	Loss 2.3218 (2.3477)	Entropy 0.52902 (0.53225)	Top-1 acc 71.875 (67.576)	Top-5 acc 84.766 (86.265)	lr 0.00009
Train [116][1640/3239]	Time 0.227 (0.536)	Data Time 0.001 (0.024)	Loss 2.2490 (2.3475)	Entropy 0.52924 (0.53223)	Top-1 acc 71.875 (67.578)	Top-5 acc 86.328 (86.267)	lr 0.00009
Train [116][1650/3239]	Time 0.339 (0.535)	Data Time 0.002 (0.024)	Loss 2.4773 (2.3476)	Entropy 0.52948 (0.53221)	Top-1 acc 67.969 (67.581)	Top-5 acc 82.812 (86.265)	lr 0.00009
Train [116][1660/3239]	Time 0.228 (0.535)	Data Time 0.001 (0.024)	Loss 2.2099 (2.3478)	Entropy 0.52929 (0.53220)	Top-1 acc 69.922 (67.569)	Top-5 acc 89.062 (86.263)	lr 0.00009
Train [116][1670/3239]	Time 0.232 (0.534)	Data Time 0.001 (0.024)	Loss 2.0706 (2.3476)	Entropy 0.52950 (0.53218)	Top-1 acc 77.734 (67.575)	Top-5 acc 91.016 (86.265)	lr 0.00009
Train [116][1680/3239]	Time 0.223 (0.533)	Data Time 0.001 (0.024)	Loss 2.5306 (2.3478)	Entropy 0.52956 (0.53217)	Top-1 acc 66.016 (67.569)	Top-5 acc 81.641 (86.262)	lr 0.00009
Train [116][1690/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.024)	Loss 2.3537 (2.3476)	Entropy 0.52931 (0.53215)	Top-1 acc 65.625 (67.572)	Top-5 acc 86.719 (86.268)	lr 0.00009
Train [116][1700/3239]	Time 0.244 (0.532)	Data Time 0.001 (0.024)	Loss 2.4092 (2.3478)	Entropy 0.52940 (0.53213)	Top-1 acc 64.844 (67.568)	Top-5 acc 83.203 (86.265)	lr 0.00009
Train [116][1710/3239]	Time 0.231 (0.531)	Data Time 0.001 (0.023)	Loss 2.4038 (2.3483)	Entropy 0.52945 (0.53212)	Top-1 acc 62.891 (67.549)	Top-5 acc 87.109 (86.259)	lr 0.00009
Train [116][1720/3239]	Time 0.230 (0.531)	Data Time 0.001 (0.023)	Loss 2.3591 (2.3481)	Entropy 0.52984 (0.53210)	Top-1 acc 67.578 (67.553)	Top-5 acc 89.062 (86.267)	lr 0.00009
Train [116][1730/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.023)	Loss 2.2437 (2.3479)	Entropy 0.52976 (0.53209)	Top-1 acc 69.922 (67.562)	Top-5 acc 88.281 (86.272)	lr 0.00009
Train [116][1740/3239]	Time 0.379 (0.529)	Data Time 0.002 (0.023)	Loss 2.4034 (2.3480)	Entropy 0.52998 (0.53208)	Top-1 acc 66.797 (67.558)	Top-5 acc 84.766 (86.270)	lr 0.00009
Train [116][1750/3239]	Time 0.245 (0.529)	Data Time 0.001 (0.023)	Loss 2.4255 (2.3481)	Entropy 0.52999 (0.53207)	Top-1 acc 66.406 (67.549)	Top-5 acc 85.156 (86.272)	lr 0.00009
Train [116][1760/3239]	Time 0.249 (0.528)	Data Time 0.002 (0.023)	Loss 2.4296 (2.3478)	Entropy 0.53000 (0.53205)	Top-1 acc 64.062 (67.547)	Top-5 acc 84.766 (86.278)	lr 0.00008
Train [116][1770/3239]	Time 0.240 (0.527)	Data Time 0.001 (0.023)	Loss 2.3255 (2.3480)	Entropy 0.53019 (0.53204)	Top-1 acc 66.797 (67.553)	Top-5 acc 87.109 (86.274)	lr 0.00008
Train [116][1780/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.023)	Loss 2.3683 (2.3480)	Entropy 0.53055 (0.53203)	Top-1 acc 66.797 (67.549)	Top-5 acc 86.719 (86.275)	lr 0.00008
Train [116][1790/3239]	Time 0.241 (0.526)	Data Time 0.001 (0.023)	Loss 2.2645 (2.3477)	Entropy 0.53070 (0.53202)	Top-1 acc 69.922 (67.552)	Top-5 acc 88.672 (86.281)	lr 0.00008
Train [116][1800/3239]	Time 0.230 (0.525)	Data Time 0.001 (0.022)	Loss 2.2283 (2.3477)	Entropy 0.53083 (0.53202)	Top-1 acc 67.578 (67.550)	Top-5 acc 87.500 (86.280)	lr 0.00008
Train [116][1810/3239]	Time 0.317 (0.525)	Data Time 0.001 (0.022)	Loss 2.2308 (2.3472)	Entropy 0.53118 (0.53201)	Top-1 acc 71.094 (67.562)	Top-5 acc 87.891 (86.287)	lr 0.00008
Train [116][1820/3239]	Time 0.232 (0.524)	Data Time 0.001 (0.022)	Loss 2.1940 (2.3468)	Entropy 0.53071 (0.53201)	Top-1 acc 70.703 (67.568)	Top-5 acc 87.109 (86.294)	lr 0.00008
Train [116][1830/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.022)	Loss 2.6222 (2.3469)	Entropy 0.53104 (0.53200)	Top-1 acc 59.766 (67.564)	Top-5 acc 82.422 (86.292)	lr 0.00008
Train [116][1840/3239]	Time 0.340 (0.524)	Data Time 0.002 (0.022)	Loss 2.3452 (2.3470)	Entropy 0.53127 (0.53200)	Top-1 acc 64.844 (67.560)	Top-5 acc 87.109 (86.291)	lr 0.00008
Train [116][1850/3239]	Time 0.232 (0.523)	Data Time 0.001 (0.022)	Loss 2.2749 (2.3470)	Entropy 0.53168 (0.53199)	Top-1 acc 72.656 (67.558)	Top-5 acc 87.500 (86.289)	lr 0.00008
Train [116][1860/3239]	Time 0.233 (0.523)	Data Time 0.001 (0.022)	Loss 2.9007 (2.3474)	Entropy 0.53117 (0.53199)	Top-1 acc 53.906 (67.544)	Top-5 acc 75.781 (86.282)	lr 0.00008
Train [116][1870/3239]	Time 0.240 (0.522)	Data Time 0.001 (0.022)	Loss 2.1629 (2.3473)	Entropy 0.53083 (0.53199)	Top-1 acc 71.094 (67.544)	Top-5 acc 89.844 (86.288)	lr 0.00008
Train [116][1880/3239]	Time 0.238 (0.521)	Data Time 0.001 (0.022)	Loss 2.3937 (2.3477)	Entropy 0.53097 (0.53198)	Top-1 acc 63.281 (67.534)	Top-5 acc 84.766 (86.282)	lr 0.00008
Train [116][1890/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.021)	Loss 2.8063 (2.3473)	Entropy 0.53064 (0.53197)	Top-1 acc 57.031 (67.546)	Top-5 acc 79.688 (86.293)	lr 0.00008
Train [116][1900/3239]	Time 0.243 (0.520)	Data Time 0.001 (0.021)	Loss 2.6229 (2.3473)	Entropy 0.53036 (0.53197)	Top-1 acc 64.844 (67.549)	Top-5 acc 82.812 (86.291)	lr 0.00008
Train [116][1910/3239]	Time 0.229 (0.520)	Data Time 0.001 (0.021)	Loss 2.2994 (2.3470)	Entropy 0.53078 (0.53196)	Top-1 acc 64.453 (67.550)	Top-5 acc 88.672 (86.297)	lr 0.00008
Train [116][1920/3239]	Time 0.229 (0.519)	Data Time 0.001 (0.021)	Loss 2.3889 (2.3473)	Entropy 0.53072 (0.53195)	Top-1 acc 67.188 (67.547)	Top-5 acc 86.719 (86.292)	lr 0.00008
Train [116][1930/3239]	Time 0.225 (0.518)	Data Time 0.001 (0.021)	Loss 2.4286 (2.3471)	Entropy 0.53070 (0.53195)	Top-1 acc 63.672 (67.551)	Top-5 acc 86.719 (86.296)	lr 0.00008
Train [116][1940/3239]	Time 0.231 (0.518)	Data Time 0.001 (0.021)	Loss 2.2268 (2.3468)	Entropy 0.53051 (0.53194)	Top-1 acc 69.922 (67.558)	Top-5 acc 87.500 (86.300)	lr 0.00008
Train [116][1950/3239]	Time 0.258 (0.517)	Data Time 0.001 (0.021)	Loss 2.1540 (2.3466)	Entropy 0.53048 (0.53193)	Top-1 acc 73.047 (67.562)	Top-5 acc 90.625 (86.304)	lr 0.00008
Train [116][1960/3239]	Time 0.240 (0.517)	Data Time 0.001 (0.021)	Loss 2.2880 (2.3468)	Entropy 0.53057 (0.53193)	Top-1 acc 66.016 (67.551)	Top-5 acc 88.672 (86.303)	lr 0.00008
Train [116][1970/3239]	Time 0.327 (0.516)	Data Time 0.001 (0.021)	Loss 2.2908 (2.3465)	Entropy 0.53055 (0.53192)	Top-1 acc 69.531 (67.556)	Top-5 acc 86.719 (86.308)	lr 0.00008
Train [116][1980/3239]	Time 0.235 (0.516)	Data Time 0.001 (0.021)	Loss 2.3745 (2.3467)	Entropy 0.53026 (0.53191)	Top-1 acc 65.234 (67.546)	Top-5 acc 85.547 (86.301)	lr 0.00008
Train [116][1990/3239]	Time 0.238 (0.515)	Data Time 0.001 (0.020)	Loss 2.2836 (2.3467)	Entropy 0.53042 (0.53190)	Top-1 acc 67.578 (67.540)	Top-5 acc 87.891 (86.301)	lr 0.00008
Train [116][2000/3239]	Time 0.236 (0.515)	Data Time 0.001 (0.020)	Loss 2.1427 (2.3464)	Entropy 0.53064 (0.53190)	Top-1 acc 73.438 (67.550)	Top-5 acc 89.844 (86.309)	lr 0.00008
Train [116][2010/3239]	Time 0.226 (0.514)	Data Time 0.001 (0.020)	Loss 2.0585 (2.3464)	Entropy 0.53098 (0.53189)	Top-1 acc 76.953 (67.554)	Top-5 acc 91.406 (86.309)	lr 0.00008
Train [116][2020/3239]	Time 0.232 (0.514)	Data Time 0.001 (0.020)	Loss 2.5244 (2.3466)	Entropy 0.53090 (0.53189)	Top-1 acc 63.281 (67.547)	Top-5 acc 83.984 (86.303)	lr 0.00008
Train [116][2030/3239]	Time 0.398 (0.540)	Data Time 0.005 (0.020)	Loss 2.3894 (2.3470)	Entropy 0.53078 (0.53188)	Top-1 acc 60.938 (67.536)	Top-5 acc 85.156 (86.298)	lr 0.00008
Train [116][2040/3239]	Time 0.238 (0.540)	Data Time 0.002 (0.020)	Loss 2.2814 (2.3469)	Entropy 0.53085 (0.53187)	Top-1 acc 69.141 (67.540)	Top-5 acc 87.109 (86.298)	lr 0.00008
Train [116][2050/3239]	Time 0.248 (0.539)	Data Time 0.002 (0.020)	Loss 2.3874 (2.3469)	Entropy 0.53052 (0.53187)	Top-1 acc 71.875 (67.541)	Top-5 acc 85.547 (86.294)	lr 0.00008
Train [116][2060/3239]	Time 0.254 (0.539)	Data Time 0.001 (0.020)	Loss 2.3387 (2.3471)	Entropy 0.53068 (0.53186)	Top-1 acc 67.578 (67.535)	Top-5 acc 86.719 (86.294)	lr 0.00008
Train [116][2070/3239]	Time 0.245 (0.538)	Data Time 0.001 (0.020)	Loss 2.1891 (2.3474)	Entropy 0.53094 (0.53186)	Top-1 acc 70.703 (67.529)	Top-5 acc 88.672 (86.289)	lr 0.00008
Train [116][2080/3239]	Time 0.243 (0.537)	Data Time 0.001 (0.020)	Loss 2.4605 (2.3472)	Entropy 0.53110 (0.53185)	Top-1 acc 64.844 (67.536)	Top-5 acc 84.375 (86.291)	lr 0.00008
Train [116][2090/3239]	Time 0.270 (0.537)	Data Time 0.035 (0.020)	Loss 2.4875 (2.3474)	Entropy 0.53141 (0.53185)	Top-1 acc 64.453 (67.528)	Top-5 acc 84.375 (86.288)	lr 0.00008
Train [116][2100/3239]	Time 0.247 (0.536)	Data Time 0.001 (0.019)	Loss 2.2875 (2.3474)	Entropy 0.53109 (0.53185)	Top-1 acc 68.359 (67.526)	Top-5 acc 86.719 (86.287)	lr 0.00008
Train [116][2110/3239]	Time 0.226 (0.536)	Data Time 0.001 (0.019)	Loss 2.3919 (2.3474)	Entropy 0.53115 (0.53184)	Top-1 acc 67.188 (67.531)	Top-5 acc 85.156 (86.285)	lr 0.00008
Train [116][2120/3239]	Time 0.231 (0.535)	Data Time 0.001 (0.019)	Loss 2.3242 (2.3474)	Entropy 0.53113 (0.53184)	Top-1 acc 67.578 (67.530)	Top-5 acc 86.719 (86.285)	lr 0.00008
Train [116][2130/3239]	Time 0.318 (0.535)	Data Time 0.001 (0.019)	Loss 2.5181 (2.3475)	Entropy 0.53129 (0.53184)	Top-1 acc 65.234 (67.530)	Top-5 acc 80.859 (86.280)	lr 0.00008
Train [116][2140/3239]	Time 0.254 (0.534)	Data Time 0.001 (0.019)	Loss 2.1370 (2.3473)	Entropy 0.53140 (0.53184)	Top-1 acc 75.391 (67.539)	Top-5 acc 90.234 (86.284)	lr 0.00008
Train [116][2150/3239]	Time 0.252 (0.534)	Data Time 0.002 (0.019)	Loss 2.4559 (2.3470)	Entropy 0.53149 (0.53183)	Top-1 acc 62.500 (67.541)	Top-5 acc 85.156 (86.289)	lr 0.00008
Train [116][2160/3239]	Time 0.227 (0.533)	Data Time 0.001 (0.019)	Loss 2.4938 (2.3472)	Entropy 0.53152 (0.53183)	Top-1 acc 67.578 (67.539)	Top-5 acc 82.812 (86.286)	lr 0.00008
Train [116][2170/3239]	Time 0.236 (0.533)	Data Time 0.001 (0.019)	Loss 2.4002 (2.3475)	Entropy 0.53166 (0.53183)	Top-1 acc 66.797 (67.529)	Top-5 acc 83.594 (86.281)	lr 0.00008
Train [116][2180/3239]	Time 0.232 (0.532)	Data Time 0.001 (0.019)	Loss 2.4048 (2.3474)	Entropy 0.53153 (0.53183)	Top-1 acc 66.797 (67.532)	Top-5 acc 86.719 (86.286)	lr 0.00008
Train [116][2190/3239]	Time 0.227 (0.532)	Data Time 0.001 (0.019)	Loss 2.3588 (2.3475)	Entropy 0.53142 (0.53183)	Top-1 acc 69.141 (67.528)	Top-5 acc 87.109 (86.284)	lr 0.00008
Train [116][2200/3239]	Time 0.368 (0.531)	Data Time 0.001 (0.019)	Loss 2.1054 (2.3474)	Entropy 0.53162 (0.53183)	Top-1 acc 72.266 (67.529)	Top-5 acc 89.844 (86.287)	lr 0.00008
Train [116][2210/3239]	Time 0.234 (0.531)	Data Time 0.001 (0.019)	Loss 2.4728 (2.3474)	Entropy 0.53163 (0.53183)	Top-1 acc 63.281 (67.529)	Top-5 acc 83.203 (86.286)	lr 0.00008
Train [116][2220/3239]	Time 0.229 (0.530)	Data Time 0.001 (0.018)	Loss 2.1123 (2.3473)	Entropy 0.53165 (0.53183)	Top-1 acc 74.219 (67.532)	Top-5 acc 88.281 (86.286)	lr 0.00008
Train [116][2230/3239]	Time 0.227 (0.530)	Data Time 0.001 (0.018)	Loss 2.0929 (2.3468)	Entropy 0.53174 (0.53182)	Top-1 acc 73.438 (67.545)	Top-5 acc 89.844 (86.293)	lr 0.00008
Train [116][2240/3239]	Time 0.238 (0.529)	Data Time 0.001 (0.018)	Loss 2.1730 (2.3466)	Entropy 0.53142 (0.53182)	Top-1 acc 69.531 (67.548)	Top-5 acc 87.500 (86.296)	lr 0.00008
Train [116][2250/3239]	Time 0.236 (0.529)	Data Time 0.001 (0.018)	Loss 2.1433 (2.3465)	Entropy 0.53139 (0.53182)	Top-1 acc 71.875 (67.548)	Top-5 acc 88.281 (86.297)	lr 0.00008
Train [116][2260/3239]	Time 0.233 (0.528)	Data Time 0.001 (0.018)	Loss 2.2841 (2.3467)	Entropy 0.53171 (0.53182)	Top-1 acc 68.359 (67.546)	Top-5 acc 87.891 (86.291)	lr 0.00008
Train [116][2270/3239]	Time 0.232 (0.528)	Data Time 0.001 (0.018)	Loss 2.1158 (2.3464)	Entropy 0.53151 (0.53182)	Top-1 acc 70.312 (67.549)	Top-5 acc 91.797 (86.296)	lr 0.00008
Train [116][2280/3239]	Time 0.232 (0.527)	Data Time 0.001 (0.018)	Loss 2.2945 (2.3463)	Entropy 0.53150 (0.53182)	Top-1 acc 69.922 (67.554)	Top-5 acc 88.672 (86.298)	lr 0.00008
Train [116][2290/3239]	Time 0.324 (0.527)	Data Time 0.001 (0.018)	Loss 2.2893 (2.3461)	Entropy 0.53178 (0.53182)	Top-1 acc 65.625 (67.554)	Top-5 acc 87.500 (86.300)	lr 0.00008
Train [116][2300/3239]	Time 0.228 (0.526)	Data Time 0.001 (0.018)	Loss 2.2669 (2.3462)	Entropy 0.53215 (0.53182)	Top-1 acc 70.703 (67.548)	Top-5 acc 87.500 (86.299)	lr 0.00008
Train [116][2310/3239]	Time 0.224 (0.526)	Data Time 0.001 (0.018)	Loss 2.2810 (2.3461)	Entropy 0.53195 (0.53182)	Top-1 acc 66.016 (67.550)	Top-5 acc 86.719 (86.297)	lr 0.00008
Train [116][2320/3239]	Time 0.236 (0.525)	Data Time 0.001 (0.018)	Loss 2.1716 (2.3461)	Entropy 0.53224 (0.53182)	Top-1 acc 69.922 (67.553)	Top-5 acc 88.672 (86.298)	lr 0.00008
Train [116][2330/3239]	Time 0.228 (0.525)	Data Time 0.002 (0.018)	Loss 2.4007 (2.3464)	Entropy 0.53216 (0.53182)	Top-1 acc 67.188 (67.541)	Top-5 acc 83.984 (86.294)	lr 0.00008
Train [116][2340/3239]	Time 0.231 (0.524)	Data Time 0.001 (0.018)	Loss 2.2640 (2.3464)	Entropy 0.53199 (0.53182)	Top-1 acc 69.141 (67.543)	Top-5 acc 86.328 (86.295)	lr 0.00008
Train [116][2350/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.018)	Loss 2.0703 (2.3460)	Entropy 0.53215 (0.53182)	Top-1 acc 77.344 (67.556)	Top-5 acc 91.406 (86.301)	lr 0.00008
Train [116][2360/3239]	Time 0.333 (0.523)	Data Time 0.001 (0.017)	Loss 2.4390 (2.3460)	Entropy 0.53172 (0.53182)	Top-1 acc 66.406 (67.555)	Top-5 acc 84.375 (86.299)	lr 0.00008
Train [116][2370/3239]	Time 0.238 (0.523)	Data Time 0.001 (0.017)	Loss 2.3751 (2.3462)	Entropy 0.53219 (0.53182)	Top-1 acc 66.797 (67.548)	Top-5 acc 87.109 (86.297)	lr 0.00008
Train [116][2380/3239]	Time 0.227 (0.522)	Data Time 0.001 (0.017)	Loss 2.4490 (2.3462)	Entropy 0.53231 (0.53183)	Top-1 acc 61.328 (67.547)	Top-5 acc 85.547 (86.295)	lr 0.00008
Train [116][2390/3239]	Time 0.235 (0.522)	Data Time 0.001 (0.017)	Loss 2.1743 (2.3459)	Entropy 0.53225 (0.53183)	Top-1 acc 70.703 (67.552)	Top-5 acc 90.625 (86.301)	lr 0.00008
Train [116][2400/3239]	Time 0.223 (0.521)	Data Time 0.001 (0.017)	Loss 2.1551 (2.3457)	Entropy 0.53247 (0.53183)	Top-1 acc 72.266 (67.559)	Top-5 acc 90.234 (86.305)	lr 0.00008
Train [116][2410/3239]	Time 0.233 (0.521)	Data Time 0.001 (0.017)	Loss 2.2632 (2.3454)	Entropy 0.53210 (0.53183)	Top-1 acc 72.656 (67.568)	Top-5 acc 87.891 (86.315)	lr 0.00008
Train [116][2420/3239]	Time 0.233 (0.520)	Data Time 0.001 (0.017)	Loss 2.2648 (2.3452)	Entropy 0.53207 (0.53183)	Top-1 acc 69.141 (67.573)	Top-5 acc 89.453 (86.321)	lr 0.00008
Train [116][2430/3239]	Time 0.275 (0.520)	Data Time 0.002 (0.017)	Loss 2.3837 (2.3452)	Entropy 0.53232 (0.53183)	Top-1 acc 66.016 (67.581)	Top-5 acc 85.547 (86.322)	lr 0.00008
Train [116][2440/3239]	Time 0.223 (0.520)	Data Time 0.001 (0.017)	Loss 2.2164 (2.3451)	Entropy 0.53249 (0.53184)	Top-1 acc 69.531 (67.583)	Top-5 acc 89.844 (86.323)	lr 0.00008
Train [116][2450/3239]	Time 0.248 (0.519)	Data Time 0.001 (0.017)	Loss 2.3358 (2.3455)	Entropy 0.53258 (0.53184)	Top-1 acc 67.188 (67.571)	Top-5 acc 86.328 (86.315)	lr 0.00008
Train [116][2460/3239]	Time 0.226 (0.519)	Data Time 0.001 (0.017)	Loss 2.3590 (2.3456)	Entropy 0.53258 (0.53184)	Top-1 acc 70.312 (67.570)	Top-5 acc 86.719 (86.316)	lr 0.00008
Train [116][2470/3239]	Time 0.224 (0.518)	Data Time 0.001 (0.017)	Loss 2.7267 (2.3459)	Entropy 0.53267 (0.53184)	Top-1 acc 54.688 (67.563)	Top-5 acc 78.906 (86.312)	lr 0.00008
Train [116][2480/3239]	Time 0.218 (0.518)	Data Time 0.001 (0.017)	Loss 2.3131 (2.3463)	Entropy 0.53233 (0.53185)	Top-1 acc 68.359 (67.558)	Top-5 acc 88.672 (86.307)	lr 0.00008
Train [116][2490/3239]	Time 0.215 (0.517)	Data Time 0.001 (0.017)	Loss 2.2235 (2.3461)	Entropy 0.53247 (0.53185)	Top-1 acc 69.531 (67.567)	Top-5 acc 87.500 (86.309)	lr 0.00008
Train [116][2500/3239]	Time 0.247 (0.517)	Data Time 0.001 (0.017)	Loss 2.7663 (2.3464)	Entropy 0.53260 (0.53185)	Top-1 acc 58.203 (67.562)	Top-5 acc 78.516 (86.302)	lr 0.00008
Train [116][2510/3239]	Time 0.237 (0.516)	Data Time 0.001 (0.017)	Loss 2.1434 (2.3461)	Entropy 0.53258 (0.53185)	Top-1 acc 73.828 (67.570)	Top-5 acc 88.672 (86.308)	lr 0.00008
Train [116][2520/3239]	Time 0.325 (0.516)	Data Time 0.001 (0.016)	Loss 2.3468 (2.3461)	Entropy 0.53257 (0.53186)	Top-1 acc 68.750 (67.575)	Top-5 acc 85.547 (86.312)	lr 0.00008
Train [116][2530/3239]	Time 0.227 (0.516)	Data Time 0.001 (0.016)	Loss 2.3384 (2.3461)	Entropy 0.53234 (0.53186)	Top-1 acc 69.141 (67.576)	Top-5 acc 85.156 (86.311)	lr 0.00008
Train [116][2540/3239]	Time 0.237 (0.515)	Data Time 0.001 (0.016)	Loss 2.5331 (2.3460)	Entropy 0.53234 (0.53186)	Top-1 acc 63.281 (67.575)	Top-5 acc 83.203 (86.313)	lr 0.00008
Train [116][2550/3239]	Time 0.227 (0.515)	Data Time 0.001 (0.016)	Loss 2.3409 (2.3456)	Entropy 0.53255 (0.53186)	Top-1 acc 68.359 (67.586)	Top-5 acc 85.547 (86.320)	lr 0.00008
Train [116][2560/3239]	Time 0.223 (0.514)	Data Time 0.001 (0.016)	Loss 2.4840 (2.3455)	Entropy 0.53263 (0.53187)	Top-1 acc 63.281 (67.585)	Top-5 acc 83.594 (86.322)	lr 0.00008
Train [116][2570/3239]	Time 0.231 (0.514)	Data Time 0.001 (0.016)	Loss 2.4279 (2.3454)	Entropy 0.53243 (0.53187)	Top-1 acc 63.672 (67.590)	Top-5 acc 86.328 (86.326)	lr 0.00008
Train [116][2580/3239]	Time 0.234 (0.513)	Data Time 0.001 (0.016)	Loss 2.4727 (2.3453)	Entropy 0.53254 (0.53187)	Top-1 acc 64.844 (67.593)	Top-5 acc 82.422 (86.326)	lr 0.00008
Train [116][2590/3239]	Time 0.346 (0.513)	Data Time 0.001 (0.016)	Loss 2.2619 (2.3453)	Entropy 0.53239 (0.53187)	Top-1 acc 69.531 (67.595)	Top-5 acc 89.453 (86.328)	lr 0.00008
Train [116][2600/3239]	Time 0.227 (0.513)	Data Time 0.001 (0.016)	Loss 2.7351 (2.3454)	Entropy 0.53259 (0.53188)	Top-1 acc 57.031 (67.591)	Top-5 acc 79.688 (86.323)	lr 0.00008
Train [116][2610/3239]	Time 0.280 (0.512)	Data Time 0.001 (0.016)	Loss 2.3077 (2.3455)	Entropy 0.53270 (0.53188)	Top-1 acc 67.969 (67.586)	Top-5 acc 85.547 (86.321)	lr 0.00008
Train [116][2620/3239]	Time 0.225 (0.512)	Data Time 0.001 (0.016)	Loss 2.7707 (2.3457)	Entropy 0.53301 (0.53188)	Top-1 acc 58.984 (67.587)	Top-5 acc 77.344 (86.319)	lr 0.00008
Train [116][2630/3239]	Time 0.225 (0.511)	Data Time 0.001 (0.016)	Loss 2.3239 (2.3457)	Entropy 0.53334 (0.53189)	Top-1 acc 65.625 (67.585)	Top-5 acc 89.062 (86.318)	lr 0.00008
Train [116][2640/3239]	Time 0.273 (0.511)	Data Time 0.001 (0.016)	Loss 2.2532 (2.3455)	Entropy 0.53352 (0.53189)	Top-1 acc 69.531 (67.591)	Top-5 acc 87.500 (86.320)	lr 0.00007
Train [116][2650/3239]	Time 0.306 (0.511)	Data Time 0.002 (0.016)	Loss 2.5293 (2.3458)	Entropy 0.53379 (0.53190)	Top-1 acc 63.672 (67.585)	Top-5 acc 82.812 (86.317)	lr 0.00007
Train [116][2660/3239]	Time 0.227 (0.511)	Data Time 0.001 (0.016)	Loss 2.4210 (2.3457)	Entropy 0.53348 (0.53191)	Top-1 acc 66.406 (67.583)	Top-5 acc 85.547 (86.320)	lr 0.00007
Train [116][2670/3239]	Time 0.233 (0.511)	Data Time 0.001 (0.016)	Loss 2.1448 (2.3456)	Entropy 0.53383 (0.53191)	Top-1 acc 71.094 (67.584)	Top-5 acc 91.016 (86.320)	lr 0.00007
Train [116][2680/3239]	Time 0.327 (0.510)	Data Time 0.001 (0.016)	Loss 2.4568 (2.3456)	Entropy 0.53390 (0.53192)	Top-1 acc 66.016 (67.583)	Top-5 acc 82.812 (86.317)	lr 0.00007
Train [116][2690/3239]	Time 0.376 (0.528)	Data Time 0.003 (0.016)	Loss 2.3066 (2.3457)	Entropy 0.53347 (0.53193)	Top-1 acc 67.578 (67.582)	Top-5 acc 86.328 (86.316)	lr 0.00007
Train [116][2700/3239]	Time 0.236 (0.528)	Data Time 0.002 (0.016)	Loss 2.1146 (2.3457)	Entropy 0.53349 (0.53193)	Top-1 acc 75.781 (67.580)	Top-5 acc 90.625 (86.315)	lr 0.00007
Train [116][2710/3239]	Time 0.231 (0.528)	Data Time 0.001 (0.015)	Loss 2.7721 (2.3458)	Entropy 0.53365 (0.53194)	Top-1 acc 58.984 (67.581)	Top-5 acc 78.125 (86.311)	lr 0.00007
Train [116][2720/3239]	Time 0.241 (0.527)	Data Time 0.001 (0.015)	Loss 2.4540 (2.3457)	Entropy 0.53319 (0.53194)	Top-1 acc 61.328 (67.584)	Top-5 acc 83.203 (86.312)	lr 0.00007
Train [116][2730/3239]	Time 0.240 (0.527)	Data Time 0.001 (0.015)	Loss 2.0751 (2.3460)	Entropy 0.53331 (0.53195)	Top-1 acc 71.094 (67.574)	Top-5 acc 91.797 (86.307)	lr 0.00007
Train [116][2740/3239]	Time 0.237 (0.526)	Data Time 0.001 (0.015)	Loss 2.0952 (2.3461)	Entropy 0.53319 (0.53195)	Top-1 acc 72.266 (67.573)	Top-5 acc 91.797 (86.307)	lr 0.00007
Train [116][2750/3239]	Time 0.329 (0.526)	Data Time 0.001 (0.015)	Loss 2.1592 (2.3464)	Entropy 0.53285 (0.53196)	Top-1 acc 68.359 (67.567)	Top-5 acc 90.625 (86.303)	lr 0.00007
Train [116][2760/3239]	Time 0.226 (0.526)	Data Time 0.001 (0.015)	Loss 2.2044 (2.3465)	Entropy 0.53310 (0.53196)	Top-1 acc 71.094 (67.570)	Top-5 acc 89.062 (86.298)	lr 0.00007
Train [116][2770/3239]	Time 0.235 (0.525)	Data Time 0.001 (0.015)	Loss 2.3436 (2.3466)	Entropy 0.53275 (0.53196)	Top-1 acc 66.797 (67.564)	Top-5 acc 85.156 (86.297)	lr 0.00007
Train [116][2780/3239]	Time 0.230 (0.525)	Data Time 0.001 (0.015)	Loss 2.5456 (2.3466)	Entropy 0.53277 (0.53197)	Top-1 acc 62.109 (67.568)	Top-5 acc 82.422 (86.295)	lr 0.00007
Train [116][2790/3239]	Time 0.233 (0.524)	Data Time 0.001 (0.015)	Loss 2.4388 (2.3468)	Entropy 0.53282 (0.53197)	Top-1 acc 63.672 (67.559)	Top-5 acc 84.766 (86.290)	lr 0.00007
Train [116][2800/3239]	Time 0.281 (0.524)	Data Time 0.001 (0.015)	Loss 2.2114 (2.3468)	Entropy 0.53303 (0.53197)	Top-1 acc 71.875 (67.562)	Top-5 acc 87.891 (86.288)	lr 0.00007
Train [116][2810/3239]	Time 0.231 (0.524)	Data Time 0.001 (0.015)	Loss 2.2798 (2.3466)	Entropy 0.53288 (0.53198)	Top-1 acc 68.359 (67.565)	Top-5 acc 87.109 (86.291)	lr 0.00007
Train [116][2820/3239]	Time 0.232 (0.523)	Data Time 0.001 (0.015)	Loss 2.3916 (2.3466)	Entropy 0.53283 (0.53198)	Top-1 acc 66.406 (67.564)	Top-5 acc 83.594 (86.290)	lr 0.00007
Train [116][2830/3239]	Time 0.232 (0.523)	Data Time 0.001 (0.015)	Loss 2.2330 (2.3466)	Entropy 0.53279 (0.53198)	Top-1 acc 66.016 (67.565)	Top-5 acc 88.672 (86.293)	lr 0.00007
Train [116][2840/3239]	Time 0.355 (0.523)	Data Time 0.001 (0.015)	Loss 2.2001 (2.3469)	Entropy 0.53291 (0.53199)	Top-1 acc 72.266 (67.559)	Top-5 acc 89.062 (86.285)	lr 0.00007
Train [116][2850/3239]	Time 0.234 (0.522)	Data Time 0.001 (0.015)	Loss 2.3381 (2.3468)	Entropy 0.53258 (0.53199)	Top-1 acc 67.188 (67.560)	Top-5 acc 86.328 (86.286)	lr 0.00007
Train [116][2860/3239]	Time 0.228 (0.522)	Data Time 0.002 (0.015)	Loss 2.3016 (2.3468)	Entropy 0.53280 (0.53199)	Top-1 acc 69.531 (67.562)	Top-5 acc 89.453 (86.286)	lr 0.00007
Train [116][2870/3239]	Time 0.231 (0.522)	Data Time 0.001 (0.015)	Loss 2.1792 (2.3467)	Entropy 0.53273 (0.53199)	Top-1 acc 72.656 (67.563)	Top-5 acc 88.672 (86.288)	lr 0.00007
Train [116][2880/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.015)	Loss 2.5936 (2.3469)	Entropy 0.53273 (0.53200)	Top-1 acc 56.250 (67.555)	Top-5 acc 81.250 (86.285)	lr 0.00007
Train [116][2890/3239]	Time 0.226 (0.521)	Data Time 0.001 (0.015)	Loss 2.2340 (2.3469)	Entropy 0.53297 (0.53200)	Top-1 acc 69.141 (67.557)	Top-5 acc 89.062 (86.283)	lr 0.00007
Train [116][2900/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.015)	Loss 2.4404 (2.3471)	Entropy 0.53299 (0.53200)	Top-1 acc 67.969 (67.554)	Top-5 acc 84.375 (86.280)	lr 0.00007
Train [116][2910/3239]	Time 0.325 (0.520)	Data Time 0.001 (0.015)	Loss 2.3749 (2.3472)	Entropy 0.53277 (0.53201)	Top-1 acc 65.625 (67.553)	Top-5 acc 89.062 (86.281)	lr 0.00007
Train [116][2920/3239]	Time 0.268 (0.520)	Data Time 0.003 (0.014)	Loss 2.3070 (2.3471)	Entropy 0.53280 (0.53201)	Top-1 acc 67.188 (67.555)	Top-5 acc 86.719 (86.281)	lr 0.00007
Train [116][2930/3239]	Time 0.237 (0.519)	Data Time 0.001 (0.014)	Loss 2.3784 (2.3470)	Entropy 0.53314 (0.53201)	Top-1 acc 66.016 (67.560)	Top-5 acc 84.766 (86.282)	lr 0.00007
Train [116][2940/3239]	Time 0.231 (0.519)	Data Time 0.001 (0.014)	Loss 2.3260 (2.3470)	Entropy 0.53321 (0.53201)	Top-1 acc 66.797 (67.559)	Top-5 acc 87.109 (86.284)	lr 0.00007
Train [116][2950/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.014)	Loss 2.4876 (2.3468)	Entropy 0.53320 (0.53202)	Top-1 acc 65.234 (67.563)	Top-5 acc 82.031 (86.285)	lr 0.00007
Train [116][2960/3239]	Time 0.228 (0.518)	Data Time 0.001 (0.014)	Loss 2.1847 (2.3468)	Entropy 0.53316 (0.53202)	Top-1 acc 73.438 (67.566)	Top-5 acc 89.062 (86.288)	lr 0.00007
Train [116][2970/3239]	Time 0.220 (0.518)	Data Time 0.001 (0.014)	Loss 2.5057 (2.3467)	Entropy 0.53304 (0.53203)	Top-1 acc 65.234 (67.563)	Top-5 acc 84.375 (86.289)	lr 0.00007
Train [116][2980/3239]	Time 0.264 (0.518)	Data Time 0.001 (0.014)	Loss 2.3917 (2.3465)	Entropy 0.53346 (0.53203)	Top-1 acc 66.406 (67.571)	Top-5 acc 87.891 (86.295)	lr 0.00007
Train [116][2990/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.014)	Loss 2.4618 (2.3465)	Entropy 0.53358 (0.53204)	Top-1 acc 68.359 (67.571)	Top-5 acc 83.203 (86.296)	lr 0.00007
Train [116][3000/3239]	Time 0.392 (0.517)	Data Time 0.001 (0.014)	Loss 2.2074 (2.3466)	Entropy 0.53375 (0.53204)	Top-1 acc 72.266 (67.568)	Top-5 acc 89.453 (86.296)	lr 0.00007
Train [116][3010/3239]	Time 0.230 (0.517)	Data Time 0.001 (0.014)	Loss 2.4046 (2.3467)	Entropy 0.53398 (0.53205)	Top-1 acc 67.578 (67.564)	Top-5 acc 84.375 (86.294)	lr 0.00007
Train [116][3020/3239]	Time 0.228 (0.516)	Data Time 0.001 (0.014)	Loss 2.1445 (2.3465)	Entropy 0.53394 (0.53205)	Top-1 acc 75.391 (67.571)	Top-5 acc 89.062 (86.298)	lr 0.00007
Train [116][3030/3239]	Time 0.347 (0.517)	Data Time 0.002 (0.014)	Loss 2.4002 (2.3465)	Entropy 0.53364 (0.53206)	Top-1 acc 65.234 (67.570)	Top-5 acc 88.281 (86.299)	lr 0.00007
Train [116][3040/3239]	Time 0.281 (0.517)	Data Time 0.003 (0.014)	Loss 2.3000 (2.3465)	Entropy 0.53344 (0.53206)	Top-1 acc 68.359 (67.570)	Top-5 acc 87.109 (86.298)	lr 0.00007
Train [116][3050/3239]	Time 0.234 (0.517)	Data Time 0.001 (0.014)	Loss 2.5331 (2.3464)	Entropy 0.53362 (0.53207)	Top-1 acc 62.500 (67.577)	Top-5 acc 83.203 (86.300)	lr 0.00007
Train [116][3060/3239]	Time 0.232 (0.516)	Data Time 0.001 (0.014)	Loss 2.0727 (2.3463)	Entropy 0.53343 (0.53207)	Top-1 acc 76.953 (67.583)	Top-5 acc 89.453 (86.301)	lr 0.00007
Train [116][3070/3239]	Time 0.332 (0.516)	Data Time 0.001 (0.014)	Loss 2.3016 (2.3462)	Entropy 0.53332 (0.53208)	Top-1 acc 68.359 (67.585)	Top-5 acc 85.938 (86.302)	lr 0.00007
Train [116][3080/3239]	Time 0.234 (0.516)	Data Time 0.001 (0.014)	Loss 2.3145 (2.3462)	Entropy 0.53329 (0.53208)	Top-1 acc 71.094 (67.583)	Top-5 acc 85.938 (86.300)	lr 0.00007
Train [116][3090/3239]	Time 0.232 (0.515)	Data Time 0.001 (0.014)	Loss 2.4496 (2.3464)	Entropy 0.53313 (0.53209)	Top-1 acc 60.938 (67.576)	Top-5 acc 85.547 (86.296)	lr 0.00007
Train [116][3100/3239]	Time 0.252 (0.515)	Data Time 0.001 (0.014)	Loss 2.3616 (2.3465)	Entropy 0.53311 (0.53209)	Top-1 acc 68.750 (67.573)	Top-5 acc 86.719 (86.296)	lr 0.00007
Train [116][3110/3239]	Time 0.237 (0.515)	Data Time 0.001 (0.014)	Loss 2.2438 (2.3465)	Entropy 0.53329 (0.53209)	Top-1 acc 71.094 (67.570)	Top-5 acc 85.547 (86.295)	lr 0.00007
Train [116][3120/3239]	Time 0.229 (0.514)	Data Time 0.001 (0.014)	Loss 2.3915 (2.3466)	Entropy 0.53355 (0.53210)	Top-1 acc 64.453 (67.567)	Top-5 acc 86.719 (86.294)	lr 0.00007
Train [116][3130/3239]	Time 0.237 (0.514)	Data Time 0.001 (0.014)	Loss 2.2418 (2.3466)	Entropy 0.53368 (0.53210)	Top-1 acc 71.094 (67.567)	Top-5 acc 87.109 (86.294)	lr 0.00007
Train [116][3140/3239]	Time 0.233 (0.514)	Data Time 0.001 (0.014)	Loss 2.3620 (2.3465)	Entropy 0.53335 (0.53211)	Top-1 acc 64.844 (67.571)	Top-5 acc 85.156 (86.294)	lr 0.00007
Train [116][3150/3239]	Time 0.255 (0.513)	Data Time 0.001 (0.014)	Loss 2.1888 (2.3467)	Entropy 0.53338 (0.53211)	Top-1 acc 71.484 (67.567)	Top-5 acc 88.281 (86.288)	lr 0.00007
Train [116][3160/3239]	Time 0.275 (0.513)	Data Time 0.003 (0.014)	Loss 2.4386 (2.3467)	Entropy 0.53321 (0.53211)	Top-1 acc 66.797 (67.572)	Top-5 acc 86.719 (86.291)	lr 0.00007
Train [116][3170/3239]	Time 0.266 (0.513)	Data Time 0.001 (0.013)	Loss 2.5018 (2.3467)	Entropy 0.53342 (0.53212)	Top-1 acc 64.453 (67.574)	Top-5 acc 83.203 (86.292)	lr 0.00007
Train [116][3180/3239]	Time 0.218 (0.512)	Data Time 0.000 (0.013)	Loss 2.1410 (2.3468)	Entropy 0.53342 (0.53212)	Top-1 acc 70.312 (67.574)	Top-5 acc 91.016 (86.290)	lr 0.00007
Train [116][3190/3239]	Time 0.214 (0.512)	Data Time 0.000 (0.013)	Loss 2.4294 (2.3468)	Entropy 0.53330 (0.53213)	Top-1 acc 61.328 (67.574)	Top-5 acc 85.547 (86.291)	lr 0.00007
Train [116][3200/3239]	Time 0.217 (0.511)	Data Time 0.000 (0.013)	Loss 2.1673 (2.3467)	Entropy 0.53363 (0.53213)	Top-1 acc 74.609 (67.577)	Top-5 acc 88.672 (86.291)	lr 0.00007
Train [116][3210/3239]	Time 0.225 (0.511)	Data Time 0.000 (0.013)	Loss 2.2787 (2.3465)	Entropy 0.53350 (0.53213)	Top-1 acc 69.922 (67.584)	Top-5 acc 85.156 (86.293)	lr 0.00007
Train [116][3220/3239]	Time 0.215 (0.511)	Data Time 0.000 (0.013)	Loss 2.5510 (2.3463)	Entropy 0.53320 (0.53214)	Top-1 acc 64.062 (67.592)	Top-5 acc 81.641 (86.295)	lr 0.00007
Train [116][3230/3239]	Time 0.308 (0.510)	Data Time 0.000 (0.013)	Loss 2.2336 (2.3460)	Entropy 0.53290 (0.53214)	Top-1 acc 70.312 (67.599)	Top-5 acc 87.500 (86.300)	lr 0.00007
Train [116][3239/3239]	Time 0.852 (0.510)	Data Time 0.000 (0.013)	Loss 2.2623 (2.3458)	Entropy 0.53281 (0.53214)	Top-1 acc 66.667 (67.605)	Top-5 acc 91.358 (86.302)	lr 0.00007
==========Valid [116/120]	loss 1.170	top-1 acc 73.071 (73.154)	top-5 acc 90.665	Train top-1 67.605	top-5 86.302	Entropy 0.53281	Latency-None: 0.000ms	Flops: 539.00M
Train [117][0/3239]	Time 34.028 (34.028)	Data Time 32.278 (32.278)	Loss 2.5942 (2.5942)	Entropy 0.53254 (0.53254)	Top-1 acc 63.281 (63.281)	Top-5 acc 80.078 (80.078)	lr 0.00007
Train [117][10/3239]	Time 0.236 (3.693)	Data Time 0.001 (3.032)	Loss 2.5362 (2.4442)	Entropy 0.53230 (0.53242)	Top-1 acc 62.891 (65.554)	Top-5 acc 83.203 (84.446)	lr 0.00007
Train [117][20/3239]	Time 0.244 (2.140)	Data Time 0.001 (1.589)	Loss 2.2125 (2.3730)	Entropy 0.53230 (0.53235)	Top-1 acc 74.219 (67.169)	Top-5 acc 88.281 (85.770)	lr 0.00007
Train [117][30/3239]	Time 0.237 (1.585)	Data Time 0.002 (1.077)	Loss 2.4468 (2.3750)	Entropy 0.53222 (0.53236)	Top-1 acc 61.328 (66.998)	Top-5 acc 84.375 (85.723)	lr 0.00007
Train [117][40/3239]	Time 0.227 (1.308)	Data Time 0.001 (0.815)	Loss 2.6131 (2.3605)	Entropy 0.53248 (0.53236)	Top-1 acc 61.719 (67.426)	Top-5 acc 80.859 (85.938)	lr 0.00007
Train [117][50/3239]	Time 0.256 (1.133)	Data Time 0.001 (0.655)	Loss 2.3447 (2.3650)	Entropy 0.53237 (0.53235)	Top-1 acc 69.531 (67.356)	Top-5 acc 83.594 (85.853)	lr 0.00007
Train [117][60/3239]	Time 0.311 (1.016)	Data Time 0.001 (0.548)	Loss 2.2275 (2.3597)	Entropy 0.53263 (0.53238)	Top-1 acc 68.359 (67.450)	Top-5 acc 89.453 (85.982)	lr 0.00007
Train [117][70/3239]	Time 0.231 (0.929)	Data Time 0.001 (0.471)	Loss 2.3862 (2.3542)	Entropy 0.53283 (0.53242)	Top-1 acc 66.406 (67.529)	Top-5 acc 85.547 (86.136)	lr 0.00007
Train [117][80/3239]	Time 0.230 (0.864)	Data Time 0.001 (0.413)	Loss 2.2830 (2.3538)	Entropy 0.53248 (0.53246)	Top-1 acc 68.750 (67.511)	Top-5 acc 86.719 (86.169)	lr 0.00007
Train [117][90/3239]	Time 0.253 (0.815)	Data Time 0.001 (0.368)	Loss 2.3934 (2.3519)	Entropy 0.53232 (0.53245)	Top-1 acc 66.016 (67.497)	Top-5 acc 84.766 (86.161)	lr 0.00007
Train [117][100/3239]	Time 0.370 (1.261)	Data Time 0.030 (0.332)	Loss 2.2527 (2.3489)	Entropy 0.53221 (0.53243)	Top-1 acc 69.141 (67.563)	Top-5 acc 86.328 (86.231)	lr 0.00007
Train [117][110/3239]	Time 0.233 (1.195)	Data Time 0.002 (0.302)	Loss 2.4630 (2.3441)	Entropy 0.53251 (0.53242)	Top-1 acc 67.188 (67.684)	Top-5 acc 83.594 (86.247)	lr 0.00007
Train [117][120/3239]	Time 0.237 (1.132)	Data Time 0.002 (0.278)	Loss 2.5819 (2.3423)	Entropy 0.53251 (0.53243)	Top-1 acc 65.625 (67.749)	Top-5 acc 82.422 (86.234)	lr 0.00007
Train [117][130/3239]	Time 0.322 (1.077)	Data Time 0.001 (0.257)	Loss 2.3249 (2.3418)	Entropy 0.53207 (0.53243)	Top-1 acc 68.750 (67.745)	Top-5 acc 86.328 (86.248)	lr 0.00007
Train [117][140/3239]	Time 0.232 (1.031)	Data Time 0.002 (0.238)	Loss 2.6143 (2.3466)	Entropy 0.53099 (0.53238)	Top-1 acc 60.547 (67.611)	Top-5 acc 81.641 (86.159)	lr 0.00007
Train [117][150/3239]	Time 0.219 (0.990)	Data Time 0.001 (0.223)	Loss 2.5240 (2.3492)	Entropy 0.53098 (0.53229)	Top-1 acc 62.891 (67.516)	Top-5 acc 85.547 (86.111)	lr 0.00007
Train [117][160/3239]	Time 0.232 (0.955)	Data Time 0.001 (0.209)	Loss 2.4010 (2.3511)	Entropy 0.53098 (0.53221)	Top-1 acc 67.188 (67.503)	Top-5 acc 86.328 (86.069)	lr 0.00007
Train [117][170/3239]	Time 0.261 (0.924)	Data Time 0.001 (0.197)	Loss 2.2087 (2.3484)	Entropy 0.53065 (0.53213)	Top-1 acc 71.094 (67.590)	Top-5 acc 88.672 (86.145)	lr 0.00007
Train [117][180/3239]	Time 0.236 (0.897)	Data Time 0.001 (0.186)	Loss 2.5825 (2.3506)	Entropy 0.53092 (0.53206)	Top-1 acc 61.328 (67.541)	Top-5 acc 81.250 (86.108)	lr 0.00007
Train [117][190/3239]	Time 0.239 (0.872)	Data Time 0.001 (0.177)	Loss 2.2714 (2.3497)	Entropy 0.53088 (0.53200)	Top-1 acc 71.875 (67.533)	Top-5 acc 87.891 (86.101)	lr 0.00007
Train [117][200/3239]	Time 0.266 (0.850)	Data Time 0.001 (0.168)	Loss 2.5394 (2.3471)	Entropy 0.53078 (0.53194)	Top-1 acc 65.625 (67.615)	Top-5 acc 82.422 (86.175)	lr 0.00007
Train [117][210/3239]	Time 0.235 (0.830)	Data Time 0.002 (0.160)	Loss 2.5701 (2.3500)	Entropy 0.53079 (0.53188)	Top-1 acc 61.328 (67.547)	Top-5 acc 82.422 (86.110)	lr 0.00007
Train [117][220/3239]	Time 0.330 (0.812)	Data Time 0.001 (0.153)	Loss 2.5399 (2.3522)	Entropy 0.53109 (0.53184)	Top-1 acc 62.891 (67.488)	Top-5 acc 83.203 (86.093)	lr 0.00007
Train [117][230/3239]	Time 0.236 (0.796)	Data Time 0.001 (0.146)	Loss 2.6238 (2.3528)	Entropy 0.53126 (0.53181)	Top-1 acc 57.812 (67.436)	Top-5 acc 82.422 (86.088)	lr 0.00007
Train [117][240/3239]	Time 0.252 (0.784)	Data Time 0.001 (0.140)	Loss 2.3421 (2.3537)	Entropy 0.53160 (0.53179)	Top-1 acc 67.188 (67.424)	Top-5 acc 86.719 (86.090)	lr 0.00007
Train [117][250/3239]	Time 0.237 (0.773)	Data Time 0.001 (0.135)	Loss 2.0891 (2.3502)	Entropy 0.53168 (0.53178)	Top-1 acc 71.484 (67.472)	Top-5 acc 91.797 (86.148)	lr 0.00007
Train [117][260/3239]	Time 0.238 (0.759)	Data Time 0.001 (0.130)	Loss 2.4670 (2.3493)	Entropy 0.53202 (0.53178)	Top-1 acc 64.453 (67.520)	Top-5 acc 82.812 (86.144)	lr 0.00007
Train [117][270/3239]	Time 0.271 (0.746)	Data Time 0.001 (0.125)	Loss 2.3462 (2.3509)	Entropy 0.53215 (0.53179)	Top-1 acc 67.578 (67.464)	Top-5 acc 83.984 (86.115)	lr 0.00007
Train [117][280/3239]	Time 0.230 (0.734)	Data Time 0.001 (0.121)	Loss 2.1599 (2.3503)	Entropy 0.53237 (0.53181)	Top-1 acc 73.047 (67.499)	Top-5 acc 89.453 (86.111)	lr 0.00007
Train [117][290/3239]	Time 0.323 (0.723)	Data Time 0.001 (0.116)	Loss 2.3666 (2.3502)	Entropy 0.53253 (0.53183)	Top-1 acc 67.188 (67.492)	Top-5 acc 86.719 (86.123)	lr 0.00007
Train [117][300/3239]	Time 0.233 (0.713)	Data Time 0.001 (0.113)	Loss 2.2753 (2.3489)	Entropy 0.53262 (0.53185)	Top-1 acc 71.484 (67.511)	Top-5 acc 87.109 (86.136)	lr 0.00007
Train [117][310/3239]	Time 0.237 (0.704)	Data Time 0.001 (0.109)	Loss 2.6086 (2.3513)	Entropy 0.53232 (0.53187)	Top-1 acc 61.328 (67.436)	Top-5 acc 82.031 (86.078)	lr 0.00007
Train [117][320/3239]	Time 0.236 (0.695)	Data Time 0.001 (0.106)	Loss 2.1342 (2.3545)	Entropy 0.53228 (0.53188)	Top-1 acc 71.484 (67.377)	Top-5 acc 90.625 (86.042)	lr 0.00007
Train [117][330/3239]	Time 0.232 (0.687)	Data Time 0.001 (0.103)	Loss 2.1031 (2.3534)	Entropy 0.53228 (0.53190)	Top-1 acc 71.094 (67.409)	Top-5 acc 89.844 (86.051)	lr 0.00007
Train [117][340/3239]	Time 0.248 (0.680)	Data Time 0.002 (0.100)	Loss 2.2760 (2.3533)	Entropy 0.53236 (0.53191)	Top-1 acc 66.797 (67.391)	Top-5 acc 87.891 (86.068)	lr 0.00006
Train [117][350/3239]	Time 0.244 (0.673)	Data Time 0.001 (0.097)	Loss 2.4429 (2.3537)	Entropy 0.53255 (0.53192)	Top-1 acc 67.578 (67.396)	Top-5 acc 83.594 (86.052)	lr 0.00006
Train [117][360/3239]	Time 0.237 (0.666)	Data Time 0.001 (0.094)	Loss 2.4014 (2.3532)	Entropy 0.53257 (0.53194)	Top-1 acc 69.531 (67.411)	Top-5 acc 82.031 (86.057)	lr 0.00006
Train [117][370/3239]	Time 0.241 (0.660)	Data Time 0.001 (0.092)	Loss 2.2191 (2.3542)	Entropy 0.53305 (0.53196)	Top-1 acc 71.875 (67.392)	Top-5 acc 89.453 (86.047)	lr 0.00006
Train [117][380/3239]	Time 0.272 (0.654)	Data Time 0.001 (0.089)	Loss 2.4543 (2.3544)	Entropy 0.53315 (0.53199)	Top-1 acc 65.234 (67.398)	Top-5 acc 85.547 (86.030)	lr 0.00006
Train [117][390/3239]	Time 0.231 (0.648)	Data Time 0.001 (0.087)	Loss 2.5630 (2.3556)	Entropy 0.53298 (0.53202)	Top-1 acc 64.062 (67.393)	Top-5 acc 82.422 (85.999)	lr 0.00006
Train [117][400/3239]	Time 0.239 (0.642)	Data Time 0.006 (0.085)	Loss 2.2459 (2.3549)	Entropy 0.53295 (0.53204)	Top-1 acc 71.875 (67.423)	Top-5 acc 87.500 (86.014)	lr 0.00006
Train [117][410/3239]	Time 0.234 (0.637)	Data Time 0.001 (0.083)	Loss 2.5830 (2.3543)	Entropy 0.53309 (0.53206)	Top-1 acc 58.984 (67.422)	Top-5 acc 83.203 (86.034)	lr 0.00006
Train [117][420/3239]	Time 0.240 (0.632)	Data Time 0.001 (0.081)	Loss 2.2933 (2.3542)	Entropy 0.53317 (0.53208)	Top-1 acc 67.578 (67.406)	Top-5 acc 87.891 (86.039)	lr 0.00006
Train [117][430/3239]	Time 0.226 (0.627)	Data Time 0.001 (0.079)	Loss 2.1070 (2.3520)	Entropy 0.53280 (0.53211)	Top-1 acc 71.484 (67.440)	Top-5 acc 89.844 (86.077)	lr 0.00006
Train [117][440/3239]	Time 0.231 (0.623)	Data Time 0.002 (0.077)	Loss 2.4302 (2.3542)	Entropy 0.53269 (0.53212)	Top-1 acc 66.797 (67.422)	Top-5 acc 85.156 (86.032)	lr 0.00006
Train [117][450/3239]	Time 0.356 (0.619)	Data Time 0.001 (0.076)	Loss 2.3262 (2.3537)	Entropy 0.53243 (0.53213)	Top-1 acc 69.531 (67.446)	Top-5 acc 87.891 (86.039)	lr 0.00006
Train [117][460/3239]	Time 0.242 (0.614)	Data Time 0.001 (0.074)	Loss 2.2786 (2.3542)	Entropy 0.53222 (0.53214)	Top-1 acc 70.312 (67.423)	Top-5 acc 85.938 (86.035)	lr 0.00006
Train [117][470/3239]	Time 0.237 (0.609)	Data Time 0.001 (0.073)	Loss 2.3278 (2.3542)	Entropy 0.53241 (0.53214)	Top-1 acc 67.969 (67.416)	Top-5 acc 86.719 (86.058)	lr 0.00006
Train [117][480/3239]	Time 0.228 (0.605)	Data Time 0.001 (0.071)	Loss 2.8073 (2.3549)	Entropy 0.53251 (0.53215)	Top-1 acc 58.594 (67.386)	Top-5 acc 77.734 (86.045)	lr 0.00006
Train [117][490/3239]	Time 0.234 (0.602)	Data Time 0.001 (0.070)	Loss 2.2797 (2.3537)	Entropy 0.53271 (0.53216)	Top-1 acc 70.312 (67.421)	Top-5 acc 85.156 (86.054)	lr 0.00006
Train [117][500/3239]	Time 0.234 (0.598)	Data Time 0.001 (0.068)	Loss 2.4216 (2.3531)	Entropy 0.53262 (0.53217)	Top-1 acc 66.406 (67.448)	Top-5 acc 85.156 (86.055)	lr 0.00006
Train [117][510/3239]	Time 0.248 (0.595)	Data Time 0.001 (0.067)	Loss 2.3119 (2.3527)	Entropy 0.53221 (0.53217)	Top-1 acc 67.969 (67.458)	Top-5 acc 85.938 (86.057)	lr 0.00006
Train [117][520/3239]	Time 0.346 (0.592)	Data Time 0.002 (0.066)	Loss 2.3769 (2.3529)	Entropy 0.53250 (0.53218)	Top-1 acc 66.797 (67.463)	Top-5 acc 85.938 (86.056)	lr 0.00006
Train [117][530/3239]	Time 0.234 (0.589)	Data Time 0.001 (0.065)	Loss 2.1719 (2.3507)	Entropy 0.53223 (0.53218)	Top-1 acc 71.875 (67.516)	Top-5 acc 88.672 (86.092)	lr 0.00006
Train [117][540/3239]	Time 0.245 (0.585)	Data Time 0.001 (0.063)	Loss 2.5094 (2.3507)	Entropy 0.53215 (0.53218)	Top-1 acc 62.500 (67.515)	Top-5 acc 84.766 (86.096)	lr 0.00006
Train [117][550/3239]	Time 0.232 (0.583)	Data Time 0.001 (0.062)	Loss 2.4876 (2.3502)	Entropy 0.53222 (0.53218)	Top-1 acc 67.188 (67.535)	Top-5 acc 83.984 (86.106)	lr 0.00006
Train [117][560/3239]	Time 0.230 (0.580)	Data Time 0.001 (0.061)	Loss 2.4122 (2.3496)	Entropy 0.53219 (0.53218)	Top-1 acc 67.188 (67.552)	Top-5 acc 87.109 (86.121)	lr 0.00006
Train [117][570/3239]	Time 0.230 (0.577)	Data Time 0.001 (0.060)	Loss 2.1804 (2.3491)	Entropy 0.53222 (0.53218)	Top-1 acc 71.875 (67.554)	Top-5 acc 88.281 (86.126)	lr 0.00006
Train [117][580/3239]	Time 0.236 (0.574)	Data Time 0.001 (0.059)	Loss 2.3348 (2.3487)	Entropy 0.53200 (0.53218)	Top-1 acc 68.359 (67.570)	Top-5 acc 85.938 (86.128)	lr 0.00006
Train [117][590/3239]	Time 0.260 (0.572)	Data Time 0.001 (0.058)	Loss 2.3703 (2.3479)	Entropy 0.53241 (0.53218)	Top-1 acc 70.312 (67.602)	Top-5 acc 86.719 (86.139)	lr 0.00006
Train [117][600/3239]	Time 0.228 (0.569)	Data Time 0.001 (0.057)	Loss 2.5647 (2.3473)	Entropy 0.53231 (0.53218)	Top-1 acc 60.156 (67.598)	Top-5 acc 81.250 (86.155)	lr 0.00006
Train [117][610/3239]	Time 0.333 (0.566)	Data Time 0.001 (0.056)	Loss 2.2538 (2.3463)	Entropy 0.53181 (0.53218)	Top-1 acc 68.359 (67.606)	Top-5 acc 87.109 (86.163)	lr 0.00006
Train [117][620/3239]	Time 0.228 (0.564)	Data Time 0.001 (0.055)	Loss 2.3329 (2.3473)	Entropy 0.53174 (0.53217)	Top-1 acc 68.359 (67.572)	Top-5 acc 86.328 (86.138)	lr 0.00006
Train [117][630/3239]	Time 0.259 (0.561)	Data Time 0.001 (0.055)	Loss 2.5898 (2.3494)	Entropy 0.53176 (0.53216)	Top-1 acc 64.453 (67.522)	Top-5 acc 83.594 (86.108)	lr 0.00006
Train [117][640/3239]	Time 0.233 (0.559)	Data Time 0.001 (0.054)	Loss 2.3500 (2.3485)	Entropy 0.53174 (0.53216)	Top-1 acc 68.359 (67.537)	Top-5 acc 85.938 (86.125)	lr 0.00006
Train [117][650/3239]	Time 0.222 (0.557)	Data Time 0.001 (0.053)	Loss 3.1404 (2.3492)	Entropy 0.53191 (0.53215)	Top-1 acc 51.953 (67.532)	Top-5 acc 73.438 (86.119)	lr 0.00006
Train [117][660/3239]	Time 0.236 (0.554)	Data Time 0.001 (0.052)	Loss 2.3260 (2.3489)	Entropy 0.53193 (0.53215)	Top-1 acc 71.094 (67.543)	Top-5 acc 87.500 (86.123)	lr 0.00006
Train [117][670/3239]	Time 0.225 (0.552)	Data Time 0.001 (0.051)	Loss 2.4401 (2.3484)	Entropy 0.53171 (0.53214)	Top-1 acc 65.625 (67.553)	Top-5 acc 84.766 (86.133)	lr 0.00006
Train [117][680/3239]	Time 0.354 (0.550)	Data Time 0.002 (0.051)	Loss 2.3637 (2.3482)	Entropy 0.53198 (0.53214)	Top-1 acc 70.312 (67.564)	Top-5 acc 87.109 (86.139)	lr 0.00006
Train [117][690/3239]	Time 0.243 (0.548)	Data Time 0.001 (0.050)	Loss 2.4946 (2.3479)	Entropy 0.53235 (0.53214)	Top-1 acc 64.844 (67.552)	Top-5 acc 83.594 (86.148)	lr 0.00006
Train [117][700/3239]	Time 0.243 (0.546)	Data Time 0.001 (0.049)	Loss 2.4686 (2.3472)	Entropy 0.53246 (0.53214)	Top-1 acc 61.328 (67.557)	Top-5 acc 83.594 (86.162)	lr 0.00006
Train [117][710/3239]	Time 0.240 (0.545)	Data Time 0.001 (0.049)	Loss 2.4487 (2.3466)	Entropy 0.53247 (0.53214)	Top-1 acc 67.578 (67.574)	Top-5 acc 83.594 (86.166)	lr 0.00006
Train [117][720/3239]	Time 0.234 (0.543)	Data Time 0.001 (0.048)	Loss 2.6960 (2.3470)	Entropy 0.53226 (0.53215)	Top-1 acc 58.203 (67.576)	Top-5 acc 82.812 (86.161)	lr 0.00006
Train [117][730/3239]	Time 0.245 (0.542)	Data Time 0.002 (0.047)	Loss 2.3715 (2.3466)	Entropy 0.53228 (0.53215)	Top-1 acc 69.141 (67.594)	Top-5 acc 85.547 (86.177)	lr 0.00006
Train [117][740/3239]	Time 0.238 (0.540)	Data Time 0.001 (0.047)	Loss 2.3960 (2.3466)	Entropy 0.53225 (0.53215)	Top-1 acc 67.969 (67.584)	Top-5 acc 85.156 (86.182)	lr 0.00006
Train [117][750/3239]	Time 0.242 (0.539)	Data Time 0.001 (0.046)	Loss 2.4838 (2.3471)	Entropy 0.53245 (0.53215)	Top-1 acc 63.672 (67.568)	Top-5 acc 83.594 (86.180)	lr 0.00006
Train [117][760/3239]	Time 0.316 (0.606)	Data Time 0.007 (0.046)	Loss 2.2520 (2.3466)	Entropy 0.53235 (0.53215)	Top-1 acc 69.922 (67.583)	Top-5 acc 88.672 (86.191)	lr 0.00006
Train [117][770/3239]	Time 0.508 (0.604)	Data Time 0.002 (0.045)	Loss 2.2967 (2.3461)	Entropy 0.53245 (0.53216)	Top-1 acc 69.531 (67.587)	Top-5 acc 85.547 (86.193)	lr 0.00006
Train [117][780/3239]	Time 0.235 (0.602)	Data Time 0.001 (0.044)	Loss 2.2752 (2.3459)	Entropy 0.53247 (0.53216)	Top-1 acc 73.047 (67.595)	Top-5 acc 86.328 (86.200)	lr 0.00006
Train [117][790/3239]	Time 0.237 (0.600)	Data Time 0.001 (0.044)	Loss 2.5439 (2.3467)	Entropy 0.53258 (0.53217)	Top-1 acc 62.109 (67.574)	Top-5 acc 83.594 (86.195)	lr 0.00006
Train [117][800/3239]	Time 0.242 (0.598)	Data Time 0.001 (0.043)	Loss 2.4057 (2.3474)	Entropy 0.53264 (0.53217)	Top-1 acc 65.234 (67.558)	Top-5 acc 88.281 (86.194)	lr 0.00006
Train [117][810/3239]	Time 0.235 (0.596)	Data Time 0.001 (0.043)	Loss 2.2682 (2.3469)	Entropy 0.53242 (0.53217)	Top-1 acc 69.531 (67.598)	Top-5 acc 87.109 (86.203)	lr 0.00006
Train [117][820/3239]	Time 0.239 (0.593)	Data Time 0.001 (0.042)	Loss 2.1100 (2.3470)	Entropy 0.53240 (0.53218)	Top-1 acc 74.219 (67.593)	Top-5 acc 89.062 (86.209)	lr 0.00006
Train [117][830/3239]	Time 0.234 (0.591)	Data Time 0.001 (0.042)	Loss 2.4416 (2.3467)	Entropy 0.53202 (0.53218)	Top-1 acc 62.891 (67.594)	Top-5 acc 85.156 (86.221)	lr 0.00006
Train [117][840/3239]	Time 0.321 (0.589)	Data Time 0.001 (0.041)	Loss 2.4103 (2.3467)	Entropy 0.53250 (0.53218)	Top-1 acc 63.672 (67.595)	Top-5 acc 85.938 (86.225)	lr 0.00006
Train [117][850/3239]	Time 0.232 (0.587)	Data Time 0.001 (0.041)	Loss 2.2263 (2.3463)	Entropy 0.53277 (0.53218)	Top-1 acc 71.094 (67.607)	Top-5 acc 88.281 (86.240)	lr 0.00006
Train [117][860/3239]	Time 0.225 (0.585)	Data Time 0.001 (0.040)	Loss 2.5151 (2.3468)	Entropy 0.53293 (0.53219)	Top-1 acc 62.109 (67.590)	Top-5 acc 84.375 (86.228)	lr 0.00006
Train [117][870/3239]	Time 0.252 (0.583)	Data Time 0.002 (0.040)	Loss 2.3385 (2.3468)	Entropy 0.53271 (0.53220)	Top-1 acc 69.922 (67.598)	Top-5 acc 87.891 (86.236)	lr 0.00006
Train [117][880/3239]	Time 0.262 (0.581)	Data Time 0.001 (0.040)	Loss 2.1787 (2.3478)	Entropy 0.53268 (0.53220)	Top-1 acc 71.484 (67.574)	Top-5 acc 89.453 (86.223)	lr 0.00006
Train [117][890/3239]	Time 0.236 (0.580)	Data Time 0.001 (0.039)	Loss 2.3617 (2.3473)	Entropy 0.53277 (0.53221)	Top-1 acc 69.922 (67.587)	Top-5 acc 87.109 (86.235)	lr 0.00006
Train [117][900/3239]	Time 0.234 (0.578)	Data Time 0.001 (0.039)	Loss 2.4347 (2.3475)	Entropy 0.53273 (0.53221)	Top-1 acc 64.453 (67.586)	Top-5 acc 87.109 (86.231)	lr 0.00006
Train [117][910/3239]	Time 0.231 (0.577)	Data Time 0.001 (0.038)	Loss 2.4039 (2.3476)	Entropy 0.53285 (0.53222)	Top-1 acc 62.500 (67.586)	Top-5 acc 87.109 (86.232)	lr 0.00006
Train [117][920/3239]	Time 0.223 (0.575)	Data Time 0.001 (0.038)	Loss 2.3828 (2.3474)	Entropy 0.53257 (0.53223)	Top-1 acc 68.359 (67.596)	Top-5 acc 85.547 (86.225)	lr 0.00006
Train [117][930/3239]	Time 0.246 (0.574)	Data Time 0.001 (0.038)	Loss 2.2813 (2.3473)	Entropy 0.53276 (0.53223)	Top-1 acc 71.875 (67.598)	Top-5 acc 87.109 (86.234)	lr 0.00006
Train [117][940/3239]	Time 0.243 (0.572)	Data Time 0.001 (0.037)	Loss 2.3866 (2.3470)	Entropy 0.53238 (0.53224)	Top-1 acc 67.969 (67.593)	Top-5 acc 84.766 (86.248)	lr 0.00006
Train [117][950/3239]	Time 0.266 (0.571)	Data Time 0.001 (0.037)	Loss 2.4331 (2.3471)	Entropy 0.53251 (0.53224)	Top-1 acc 64.844 (67.589)	Top-5 acc 84.766 (86.247)	lr 0.00006
Train [117][960/3239]	Time 0.281 (0.569)	Data Time 0.003 (0.036)	Loss 2.0668 (2.3466)	Entropy 0.53262 (0.53224)	Top-1 acc 75.781 (67.603)	Top-5 acc 90.234 (86.262)	lr 0.00006
Train [117][970/3239]	Time 0.246 (0.568)	Data Time 0.001 (0.036)	Loss 2.1697 (2.3466)	Entropy 0.53257 (0.53225)	Top-1 acc 75.391 (67.610)	Top-5 acc 87.891 (86.257)	lr 0.00006
Train [117][980/3239]	Time 0.277 (0.567)	Data Time 0.001 (0.036)	Loss 2.2947 (2.3461)	Entropy 0.53280 (0.53225)	Top-1 acc 71.875 (67.622)	Top-5 acc 87.500 (86.271)	lr 0.00006
Train [117][990/3239]	Time 0.246 (0.565)	Data Time 0.001 (0.035)	Loss 2.4455 (2.3459)	Entropy 0.53285 (0.53226)	Top-1 acc 64.453 (67.622)	Top-5 acc 84.766 (86.274)	lr 0.00006
Train [117][1000/3239]	Time 0.330 (0.564)	Data Time 0.001 (0.035)	Loss 2.4367 (2.3455)	Entropy 0.53288 (0.53226)	Top-1 acc 62.500 (67.624)	Top-5 acc 84.375 (86.277)	lr 0.00006
Train [117][1010/3239]	Time 0.233 (0.562)	Data Time 0.001 (0.035)	Loss 2.1857 (2.3463)	Entropy 0.53310 (0.53227)	Top-1 acc 70.703 (67.601)	Top-5 acc 89.844 (86.275)	lr 0.00006
Train [117][1020/3239]	Time 0.231 (0.561)	Data Time 0.001 (0.034)	Loss 2.4542 (2.3465)	Entropy 0.53309 (0.53228)	Top-1 acc 65.625 (67.588)	Top-5 acc 83.984 (86.272)	lr 0.00006
Train [117][1030/3239]	Time 0.233 (0.560)	Data Time 0.001 (0.034)	Loss 2.3374 (2.3457)	Entropy 0.53334 (0.53229)	Top-1 acc 66.797 (67.608)	Top-5 acc 87.500 (86.288)	lr 0.00006
Train [117][1040/3239]	Time 0.242 (0.558)	Data Time 0.001 (0.034)	Loss 2.2353 (2.3457)	Entropy 0.53346 (0.53230)	Top-1 acc 67.188 (67.611)	Top-5 acc 88.672 (86.289)	lr 0.00006
Train [117][1050/3239]	Time 0.230 (0.557)	Data Time 0.001 (0.033)	Loss 2.4821 (2.3460)	Entropy 0.53350 (0.53231)	Top-1 acc 64.453 (67.602)	Top-5 acc 81.250 (86.290)	lr 0.00006
Train [117][1060/3239]	Time 0.238 (0.556)	Data Time 0.001 (0.033)	Loss 2.1615 (2.3464)	Entropy 0.53351 (0.53232)	Top-1 acc 73.828 (67.602)	Top-5 acc 89.453 (86.280)	lr 0.00006
Train [117][1070/3239]	Time 0.358 (0.554)	Data Time 0.001 (0.033)	Loss 2.2932 (2.3465)	Entropy 0.53316 (0.53233)	Top-1 acc 71.094 (67.612)	Top-5 acc 85.156 (86.280)	lr 0.00006
Train [117][1080/3239]	Time 0.238 (0.553)	Data Time 0.001 (0.033)	Loss 2.5743 (2.3461)	Entropy 0.53312 (0.53234)	Top-1 acc 61.328 (67.624)	Top-5 acc 82.031 (86.285)	lr 0.00006
Train [117][1090/3239]	Time 0.249 (0.552)	Data Time 0.001 (0.032)	Loss 2.6363 (2.3463)	Entropy 0.53345 (0.53235)	Top-1 acc 62.500 (67.630)	Top-5 acc 79.688 (86.278)	lr 0.00006
Train [117][1100/3239]	Time 0.238 (0.551)	Data Time 0.001 (0.032)	Loss 2.3722 (2.3460)	Entropy 0.53324 (0.53235)	Top-1 acc 67.969 (67.637)	Top-5 acc 82.422 (86.277)	lr 0.00006
Train [117][1110/3239]	Time 0.240 (0.549)	Data Time 0.001 (0.032)	Loss 2.3157 (2.3462)	Entropy 0.53329 (0.53236)	Top-1 acc 68.750 (67.630)	Top-5 acc 87.109 (86.277)	lr 0.00006
Train [117][1120/3239]	Time 0.224 (0.548)	Data Time 0.001 (0.031)	Loss 2.1850 (2.3459)	Entropy 0.53325 (0.53237)	Top-1 acc 71.484 (67.641)	Top-5 acc 87.109 (86.279)	lr 0.00006
Train [117][1130/3239]	Time 0.242 (0.547)	Data Time 0.001 (0.031)	Loss 2.4981 (2.3462)	Entropy 0.53317 (0.53238)	Top-1 acc 64.844 (67.625)	Top-5 acc 82.422 (86.276)	lr 0.00006
Train [117][1140/3239]	Time 0.231 (0.546)	Data Time 0.001 (0.031)	Loss 2.2715 (2.3460)	Entropy 0.53301 (0.53238)	Top-1 acc 68.750 (67.622)	Top-5 acc 90.625 (86.281)	lr 0.00006
Train [117][1150/3239]	Time 0.230 (0.545)	Data Time 0.001 (0.031)	Loss 2.3762 (2.3460)	Entropy 0.53287 (0.53239)	Top-1 acc 68.359 (67.616)	Top-5 acc 82.422 (86.277)	lr 0.00006
Train [117][1160/3239]	Time 0.331 (0.544)	Data Time 0.001 (0.030)	Loss 2.2858 (2.3452)	Entropy 0.53279 (0.53239)	Top-1 acc 69.922 (67.629)	Top-5 acc 86.719 (86.288)	lr 0.00006
Train [117][1170/3239]	Time 0.231 (0.542)	Data Time 0.001 (0.030)	Loss 2.3577 (2.3456)	Entropy 0.53275 (0.53240)	Top-1 acc 68.750 (67.612)	Top-5 acc 85.938 (86.280)	lr 0.00006
Train [117][1180/3239]	Time 0.228 (0.541)	Data Time 0.001 (0.030)	Loss 2.3120 (2.3457)	Entropy 0.53286 (0.53240)	Top-1 acc 70.312 (67.610)	Top-5 acc 88.281 (86.285)	lr 0.00006
Train [117][1190/3239]	Time 0.259 (0.540)	Data Time 0.001 (0.030)	Loss 2.3402 (2.3453)	Entropy 0.53275 (0.53240)	Top-1 acc 66.016 (67.622)	Top-5 acc 85.156 (86.293)	lr 0.00006
Train [117][1200/3239]	Time 0.232 (0.539)	Data Time 0.001 (0.029)	Loss 2.5028 (2.3455)	Entropy 0.53293 (0.53241)	Top-1 acc 64.062 (67.620)	Top-5 acc 83.203 (86.286)	lr 0.00006
Train [117][1210/3239]	Time 0.235 (0.538)	Data Time 0.001 (0.029)	Loss 2.2650 (2.3454)	Entropy 0.53314 (0.53241)	Top-1 acc 69.141 (67.624)	Top-5 acc 86.719 (86.288)	lr 0.00006
Train [117][1220/3239]	Time 0.228 (0.537)	Data Time 0.001 (0.029)	Loss 2.6323 (2.3457)	Entropy 0.53336 (0.53242)	Top-1 acc 59.375 (67.618)	Top-5 acc 80.078 (86.278)	lr 0.00006
Train [117][1230/3239]	Time 0.322 (0.536)	Data Time 0.001 (0.029)	Loss 2.4276 (2.3461)	Entropy 0.53341 (0.53242)	Top-1 acc 64.453 (67.609)	Top-5 acc 87.500 (86.270)	lr 0.00006
Train [117][1240/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.029)	Loss 2.2399 (2.3454)	Entropy 0.53314 (0.53243)	Top-1 acc 70.703 (67.628)	Top-5 acc 86.719 (86.283)	lr 0.00006
Train [117][1250/3239]	Time 0.229 (0.534)	Data Time 0.001 (0.028)	Loss 2.3522 (2.3448)	Entropy 0.53327 (0.53244)	Top-1 acc 66.797 (67.643)	Top-5 acc 84.766 (86.296)	lr 0.00006
Train [117][1260/3239]	Time 0.221 (0.533)	Data Time 0.001 (0.028)	Loss 2.4015 (2.3448)	Entropy 0.53329 (0.53244)	Top-1 acc 65.625 (67.642)	Top-5 acc 85.156 (86.295)	lr 0.00006
Train [117][1270/3239]	Time 0.221 (0.532)	Data Time 0.001 (0.028)	Loss 2.2497 (2.3447)	Entropy 0.53332 (0.53245)	Top-1 acc 71.094 (67.644)	Top-5 acc 89.062 (86.299)	lr 0.00006
Train [117][1280/3239]	Time 0.240 (0.531)	Data Time 0.001 (0.028)	Loss 2.5950 (2.3449)	Entropy 0.53342 (0.53246)	Top-1 acc 58.984 (67.646)	Top-5 acc 82.422 (86.300)	lr 0.00006
Train [117][1290/3239]	Time 0.222 (0.530)	Data Time 0.001 (0.028)	Loss 2.5851 (2.3454)	Entropy 0.53322 (0.53246)	Top-1 acc 59.766 (67.635)	Top-5 acc 81.641 (86.296)	lr 0.00006
Train [117][1300/3239]	Time 0.218 (0.529)	Data Time 0.001 (0.027)	Loss 2.2322 (2.3457)	Entropy 0.53326 (0.53247)	Top-1 acc 72.656 (67.623)	Top-5 acc 87.891 (86.290)	lr 0.00006
Train [117][1310/3239]	Time 0.233 (0.528)	Data Time 0.001 (0.027)	Loss 2.2872 (2.3451)	Entropy 0.53325 (0.53248)	Top-1 acc 67.969 (67.639)	Top-5 acc 86.719 (86.296)	lr 0.00006
Train [117][1320/3239]	Time 0.349 (0.527)	Data Time 0.001 (0.027)	Loss 2.1640 (2.3448)	Entropy 0.53285 (0.53248)	Top-1 acc 73.047 (67.648)	Top-5 acc 87.500 (86.299)	lr 0.00006
Train [117][1330/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.027)	Loss 2.1922 (2.3442)	Entropy 0.53274 (0.53248)	Top-1 acc 71.484 (67.669)	Top-5 acc 87.891 (86.304)	lr 0.00006
Train [117][1340/3239]	Time 0.229 (0.525)	Data Time 0.001 (0.027)	Loss 2.3287 (2.3443)	Entropy 0.53264 (0.53248)	Top-1 acc 67.578 (67.664)	Top-5 acc 86.719 (86.300)	lr 0.00006
Train [117][1350/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.026)	Loss 2.4130 (2.3443)	Entropy 0.53273 (0.53249)	Top-1 acc 65.625 (67.666)	Top-5 acc 85.938 (86.299)	lr 0.00005
Train [117][1360/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.026)	Loss 2.4048 (2.3444)	Entropy 0.53282 (0.53249)	Top-1 acc 66.016 (67.662)	Top-5 acc 85.547 (86.296)	lr 0.00005
Train [117][1370/3239]	Time 0.241 (0.523)	Data Time 0.001 (0.026)	Loss 2.3899 (2.3444)	Entropy 0.53256 (0.53249)	Top-1 acc 66.406 (67.659)	Top-5 acc 84.766 (86.293)	lr 0.00005
Train [117][1380/3239]	Time 0.229 (0.522)	Data Time 0.001 (0.026)	Loss 2.2972 (2.3446)	Entropy 0.53251 (0.53249)	Top-1 acc 69.141 (67.652)	Top-5 acc 87.109 (86.292)	lr 0.00005
Train [117][1390/3239]	Time 0.312 (0.521)	Data Time 0.001 (0.026)	Loss 2.2190 (2.3444)	Entropy 0.53244 (0.53249)	Top-1 acc 69.531 (67.656)	Top-5 acc 87.891 (86.291)	lr 0.00005
Train [117][1400/3239]	Time 0.234 (0.520)	Data Time 0.001 (0.025)	Loss 2.4501 (2.3444)	Entropy 0.53279 (0.53249)	Top-1 acc 63.281 (67.655)	Top-5 acc 83.594 (86.290)	lr 0.00005
Train [117][1410/3239]	Time 0.413 (0.555)	Data Time 0.006 (0.025)	Loss 2.2944 (2.3443)	Entropy 0.53336 (0.53249)	Top-1 acc 67.578 (67.658)	Top-5 acc 88.672 (86.290)	lr 0.00005
Train [117][1420/3239]	Time 0.235 (0.555)	Data Time 0.002 (0.025)	Loss 2.4315 (2.3446)	Entropy 0.53381 (0.53250)	Top-1 acc 64.844 (67.658)	Top-5 acc 86.719 (86.284)	lr 0.00005
Train [117][1430/3239]	Time 0.265 (0.554)	Data Time 0.002 (0.025)	Loss 2.1749 (2.3446)	Entropy 0.53393 (0.53251)	Top-1 acc 69.141 (67.658)	Top-5 acc 89.453 (86.283)	lr 0.00005
Train [117][1440/3239]	Time 0.262 (0.553)	Data Time 0.003 (0.025)	Loss 2.3082 (2.3443)	Entropy 0.53371 (0.53252)	Top-1 acc 71.875 (67.663)	Top-5 acc 89.062 (86.288)	lr 0.00005
Train [117][1450/3239]	Time 0.217 (0.552)	Data Time 0.001 (0.025)	Loss 2.8751 (2.3447)	Entropy 0.53370 (0.53253)	Top-1 acc 57.422 (67.654)	Top-5 acc 79.688 (86.286)	lr 0.00005
Train [117][1460/3239]	Time 0.248 (0.551)	Data Time 0.001 (0.025)	Loss 2.5072 (2.3452)	Entropy 0.53363 (0.53254)	Top-1 acc 64.453 (67.652)	Top-5 acc 84.375 (86.279)	lr 0.00005
Train [117][1470/3239]	Time 0.239 (0.550)	Data Time 0.001 (0.024)	Loss 2.1286 (2.3452)	Entropy 0.53366 (0.53254)	Top-1 acc 72.656 (67.648)	Top-5 acc 92.578 (86.278)	lr 0.00005
Train [117][1480/3239]	Time 0.353 (0.549)	Data Time 0.001 (0.024)	Loss 2.5380 (2.3450)	Entropy 0.53386 (0.53255)	Top-1 acc 63.672 (67.653)	Top-5 acc 83.984 (86.279)	lr 0.00005
Train [117][1490/3239]	Time 0.252 (0.549)	Data Time 0.001 (0.024)	Loss 2.2176 (2.3450)	Entropy 0.53377 (0.53256)	Top-1 acc 70.703 (67.649)	Top-5 acc 88.281 (86.280)	lr 0.00005
Train [117][1500/3239]	Time 0.239 (0.548)	Data Time 0.001 (0.024)	Loss 2.4460 (2.3448)	Entropy 0.53361 (0.53257)	Top-1 acc 67.969 (67.653)	Top-5 acc 83.594 (86.286)	lr 0.00005
Train [117][1510/3239]	Time 0.254 (0.547)	Data Time 0.001 (0.024)	Loss 2.2788 (2.3445)	Entropy 0.53377 (0.53258)	Top-1 acc 69.141 (67.659)	Top-5 acc 87.109 (86.289)	lr 0.00005
Train [117][1520/3239]	Time 0.249 (0.546)	Data Time 0.001 (0.024)	Loss 2.3944 (2.3442)	Entropy 0.53394 (0.53258)	Top-1 acc 68.750 (67.670)	Top-5 acc 85.156 (86.292)	lr 0.00005
Train [117][1530/3239]	Time 0.294 (0.546)	Data Time 0.001 (0.023)	Loss 2.5889 (2.3438)	Entropy 0.53395 (0.53259)	Top-1 acc 62.500 (67.675)	Top-5 acc 83.984 (86.301)	lr 0.00005
Train [117][1540/3239]	Time 0.236 (0.545)	Data Time 0.001 (0.023)	Loss 2.3189 (2.3441)	Entropy 0.53407 (0.53260)	Top-1 acc 68.359 (67.672)	Top-5 acc 85.938 (86.292)	lr 0.00005
Train [117][1550/3239]	Time 0.336 (0.544)	Data Time 0.001 (0.023)	Loss 2.4884 (2.3440)	Entropy 0.53430 (0.53261)	Top-1 acc 62.109 (67.677)	Top-5 acc 84.766 (86.298)	lr 0.00005
Train [117][1560/3239]	Time 0.262 (0.544)	Data Time 0.001 (0.023)	Loss 2.3083 (2.3445)	Entropy 0.53456 (0.53262)	Top-1 acc 67.188 (67.663)	Top-5 acc 87.500 (86.286)	lr 0.00005
Train [117][1570/3239]	Time 0.236 (0.543)	Data Time 0.001 (0.023)	Loss 2.3710 (2.3442)	Entropy 0.53474 (0.53264)	Top-1 acc 66.016 (67.677)	Top-5 acc 87.500 (86.292)	lr 0.00005
Train [117][1580/3239]	Time 0.260 (0.542)	Data Time 0.001 (0.023)	Loss 2.2221 (2.3443)	Entropy 0.53458 (0.53265)	Top-1 acc 69.922 (67.680)	Top-5 acc 89.453 (86.287)	lr 0.00005
Train [117][1590/3239]	Time 0.268 (0.542)	Data Time 0.001 (0.023)	Loss 2.3275 (2.3440)	Entropy 0.53456 (0.53266)	Top-1 acc 67.188 (67.690)	Top-5 acc 86.719 (86.288)	lr 0.00005
Train [117][1600/3239]	Time 0.232 (0.541)	Data Time 0.001 (0.023)	Loss 2.2939 (2.3444)	Entropy 0.53439 (0.53267)	Top-1 acc 69.141 (67.681)	Top-5 acc 86.719 (86.279)	lr 0.00005
Train [117][1610/3239]	Time 0.243 (0.540)	Data Time 0.001 (0.022)	Loss 2.3608 (2.3446)	Entropy 0.53448 (0.53268)	Top-1 acc 67.188 (67.682)	Top-5 acc 88.672 (86.276)	lr 0.00005
Train [117][1620/3239]	Time 0.289 (0.540)	Data Time 0.002 (0.022)	Loss 2.3483 (2.3447)	Entropy 0.53427 (0.53269)	Top-1 acc 66.406 (67.682)	Top-5 acc 86.719 (86.273)	lr 0.00005
Train [117][1630/3239]	Time 0.242 (0.540)	Data Time 0.001 (0.022)	Loss 2.2702 (2.3445)	Entropy 0.53414 (0.53270)	Top-1 acc 71.875 (67.692)	Top-5 acc 88.281 (86.278)	lr 0.00005
Train [117][1640/3239]	Time 0.234 (0.539)	Data Time 0.001 (0.022)	Loss 2.2969 (2.3446)	Entropy 0.53355 (0.53271)	Top-1 acc 67.969 (67.688)	Top-5 acc 86.719 (86.276)	lr 0.00005
Train [117][1650/3239]	Time 0.229 (0.538)	Data Time 0.001 (0.022)	Loss 2.3188 (2.3445)	Entropy 0.53380 (0.53272)	Top-1 acc 71.484 (67.698)	Top-5 acc 90.625 (86.280)	lr 0.00005
Train [117][1660/3239]	Time 0.248 (0.538)	Data Time 0.002 (0.022)	Loss 2.1695 (2.3442)	Entropy 0.53401 (0.53272)	Top-1 acc 71.875 (67.703)	Top-5 acc 89.844 (86.288)	lr 0.00005
Train [117][1670/3239]	Time 0.262 (0.537)	Data Time 0.001 (0.022)	Loss 2.2869 (2.3441)	Entropy 0.53386 (0.53273)	Top-1 acc 67.188 (67.700)	Top-5 acc 85.547 (86.287)	lr 0.00005
Train [117][1680/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.022)	Loss 2.3471 (2.3441)	Entropy 0.53400 (0.53274)	Top-1 acc 66.406 (67.699)	Top-5 acc 87.500 (86.290)	lr 0.00005
Train [117][1690/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.021)	Loss 2.2261 (2.3442)	Entropy 0.53424 (0.53274)	Top-1 acc 68.359 (67.699)	Top-5 acc 87.500 (86.287)	lr 0.00005
Train [117][1700/3239]	Time 0.289 (0.535)	Data Time 0.001 (0.021)	Loss 2.1648 (2.3438)	Entropy 0.53454 (0.53275)	Top-1 acc 70.312 (67.701)	Top-5 acc 90.625 (86.291)	lr 0.00005
Train [117][1710/3239]	Time 0.405 (0.535)	Data Time 0.003 (0.021)	Loss 2.2755 (2.3439)	Entropy 0.53463 (0.53276)	Top-1 acc 66.406 (67.699)	Top-5 acc 87.891 (86.287)	lr 0.00005
Train [117][1720/3239]	Time 0.243 (0.534)	Data Time 0.001 (0.021)	Loss 2.4547 (2.3441)	Entropy 0.53474 (0.53278)	Top-1 acc 66.406 (67.695)	Top-5 acc 83.594 (86.283)	lr 0.00005
Train [117][1730/3239]	Time 0.246 (0.533)	Data Time 0.001 (0.021)	Loss 2.2841 (2.3442)	Entropy 0.53471 (0.53279)	Top-1 acc 67.969 (67.690)	Top-5 acc 87.109 (86.277)	lr 0.00005
Train [117][1740/3239]	Time 0.238 (0.533)	Data Time 0.001 (0.021)	Loss 2.3298 (2.3441)	Entropy 0.53448 (0.53280)	Top-1 acc 68.750 (67.692)	Top-5 acc 87.500 (86.280)	lr 0.00005
Train [117][1750/3239]	Time 0.236 (0.532)	Data Time 0.001 (0.021)	Loss 2.0911 (2.3442)	Entropy 0.53480 (0.53281)	Top-1 acc 73.828 (67.697)	Top-5 acc 91.406 (86.278)	lr 0.00005
Train [117][1760/3239]	Time 0.270 (0.531)	Data Time 0.001 (0.021)	Loss 2.1811 (2.3440)	Entropy 0.53458 (0.53282)	Top-1 acc 71.875 (67.696)	Top-5 acc 89.062 (86.283)	lr 0.00005
Train [117][1770/3239]	Time 0.239 (0.531)	Data Time 0.001 (0.021)	Loss 2.2998 (2.3440)	Entropy 0.53459 (0.53283)	Top-1 acc 67.578 (67.695)	Top-5 acc 88.281 (86.288)	lr 0.00005
Train [117][1780/3239]	Time 0.338 (0.530)	Data Time 0.001 (0.020)	Loss 2.2295 (2.3437)	Entropy 0.53448 (0.53284)	Top-1 acc 66.016 (67.697)	Top-5 acc 87.891 (86.293)	lr 0.00005
Train [117][1790/3239]	Time 0.267 (0.530)	Data Time 0.002 (0.020)	Loss 2.3170 (2.3438)	Entropy 0.53415 (0.53285)	Top-1 acc 73.047 (67.701)	Top-5 acc 87.500 (86.291)	lr 0.00005
Train [117][1800/3239]	Time 0.240 (0.529)	Data Time 0.001 (0.020)	Loss 2.2489 (2.3441)	Entropy 0.53416 (0.53285)	Top-1 acc 69.531 (67.691)	Top-5 acc 87.109 (86.283)	lr 0.00005
Train [117][1810/3239]	Time 0.251 (0.528)	Data Time 0.001 (0.020)	Loss 2.2196 (2.3438)	Entropy 0.53420 (0.53286)	Top-1 acc 71.484 (67.699)	Top-5 acc 87.891 (86.288)	lr 0.00005
Train [117][1820/3239]	Time 0.234 (0.528)	Data Time 0.001 (0.020)	Loss 2.3847 (2.3441)	Entropy 0.53427 (0.53287)	Top-1 acc 62.500 (67.689)	Top-5 acc 86.328 (86.280)	lr 0.00005
Train [117][1830/3239]	Time 0.238 (0.527)	Data Time 0.001 (0.020)	Loss 2.2871 (2.3442)	Entropy 0.53418 (0.53288)	Top-1 acc 69.531 (67.684)	Top-5 acc 85.156 (86.277)	lr 0.00005
Train [117][1840/3239]	Time 0.239 (0.527)	Data Time 0.001 (0.020)	Loss 2.4016 (2.3444)	Entropy 0.53455 (0.53288)	Top-1 acc 66.797 (67.680)	Top-5 acc 86.328 (86.274)	lr 0.00005
Train [117][1850/3239]	Time 0.257 (0.526)	Data Time 0.001 (0.020)	Loss 2.3881 (2.3446)	Entropy 0.53426 (0.53289)	Top-1 acc 68.750 (67.676)	Top-5 acc 85.156 (86.275)	lr 0.00005
Train [117][1860/3239]	Time 0.241 (0.525)	Data Time 0.001 (0.020)	Loss 2.2051 (2.3445)	Entropy 0.53412 (0.53290)	Top-1 acc 72.266 (67.679)	Top-5 acc 89.453 (86.276)	lr 0.00005
Train [117][1870/3239]	Time 0.338 (0.525)	Data Time 0.001 (0.020)	Loss 2.2317 (2.3445)	Entropy 0.53403 (0.53290)	Top-1 acc 71.875 (67.681)	Top-5 acc 87.891 (86.278)	lr 0.00005
Train [117][1880/3239]	Time 0.257 (0.524)	Data Time 0.001 (0.019)	Loss 2.5405 (2.3450)	Entropy 0.53421 (0.53291)	Top-1 acc 60.938 (67.664)	Top-5 acc 80.859 (86.269)	lr 0.00005
Train [117][1890/3239]	Time 0.253 (0.524)	Data Time 0.001 (0.019)	Loss 2.3171 (2.3452)	Entropy 0.53445 (0.53292)	Top-1 acc 68.359 (67.659)	Top-5 acc 86.719 (86.265)	lr 0.00005
Train [117][1900/3239]	Time 0.243 (0.523)	Data Time 0.001 (0.019)	Loss 2.4774 (2.3456)	Entropy 0.53447 (0.53293)	Top-1 acc 58.594 (67.649)	Top-5 acc 83.984 (86.260)	lr 0.00005
Train [117][1910/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.019)	Loss 2.2642 (2.3456)	Entropy 0.53473 (0.53293)	Top-1 acc 70.703 (67.650)	Top-5 acc 85.938 (86.259)	lr 0.00005
Train [117][1920/3239]	Time 0.248 (0.522)	Data Time 0.002 (0.019)	Loss 2.5102 (2.3455)	Entropy 0.53453 (0.53294)	Top-1 acc 62.109 (67.650)	Top-5 acc 83.984 (86.261)	lr 0.00005
Train [117][1930/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.019)	Loss 2.4829 (2.3457)	Entropy 0.53443 (0.53295)	Top-1 acc 65.625 (67.648)	Top-5 acc 80.859 (86.256)	lr 0.00005
Train [117][1940/3239]	Time 0.353 (0.521)	Data Time 0.001 (0.019)	Loss 2.2163 (2.3458)	Entropy 0.53449 (0.53296)	Top-1 acc 69.141 (67.644)	Top-5 acc 89.844 (86.256)	lr 0.00005
Train [117][1950/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.019)	Loss 2.2599 (2.3461)	Entropy 0.53440 (0.53297)	Top-1 acc 68.359 (67.637)	Top-5 acc 86.328 (86.252)	lr 0.00005
Train [117][1960/3239]	Time 0.241 (0.520)	Data Time 0.001 (0.019)	Loss 2.2495 (2.3464)	Entropy 0.53411 (0.53297)	Top-1 acc 69.141 (67.637)	Top-5 acc 89.453 (86.244)	lr 0.00005
Train [117][1970/3239]	Time 0.239 (0.520)	Data Time 0.001 (0.019)	Loss 2.2196 (2.3464)	Entropy 0.53386 (0.53298)	Top-1 acc 70.703 (67.638)	Top-5 acc 88.672 (86.243)	lr 0.00005
Train [117][1980/3239]	Time 0.241 (0.519)	Data Time 0.001 (0.019)	Loss 2.4202 (2.3466)	Entropy 0.53390 (0.53298)	Top-1 acc 66.016 (67.634)	Top-5 acc 84.766 (86.241)	lr 0.00005
Train [117][1990/3239]	Time 0.225 (0.519)	Data Time 0.001 (0.018)	Loss 2.6544 (2.3468)	Entropy 0.53406 (0.53299)	Top-1 acc 58.984 (67.628)	Top-5 acc 80.078 (86.239)	lr 0.00005
Train [117][2000/3239]	Time 0.222 (0.518)	Data Time 0.001 (0.018)	Loss 2.3861 (2.3469)	Entropy 0.53422 (0.53300)	Top-1 acc 66.016 (67.623)	Top-5 acc 87.500 (86.242)	lr 0.00005
Train [117][2010/3239]	Time 0.262 (0.518)	Data Time 0.001 (0.018)	Loss 2.3505 (2.3467)	Entropy 0.53430 (0.53300)	Top-1 acc 64.844 (67.626)	Top-5 acc 85.547 (86.245)	lr 0.00005
Train [117][2020/3239]	Time 0.236 (0.517)	Data Time 0.001 (0.018)	Loss 2.3698 (2.3466)	Entropy 0.53467 (0.53301)	Top-1 acc 69.141 (67.632)	Top-5 acc 85.547 (86.247)	lr 0.00005
Train [117][2030/3239]	Time 0.245 (0.517)	Data Time 0.001 (0.018)	Loss 2.6217 (2.3471)	Entropy 0.53463 (0.53302)	Top-1 acc 62.109 (67.619)	Top-5 acc 81.641 (86.240)	lr 0.00005
Train [117][2040/3239]	Time 0.231 (0.516)	Data Time 0.001 (0.018)	Loss 2.3207 (2.3472)	Entropy 0.53444 (0.53303)	Top-1 acc 67.188 (67.611)	Top-5 acc 86.328 (86.237)	lr 0.00005
Train [117][2050/3239]	Time 0.242 (0.516)	Data Time 0.001 (0.018)	Loss 2.5124 (2.3472)	Entropy 0.53415 (0.53303)	Top-1 acc 65.625 (67.613)	Top-5 acc 85.156 (86.240)	lr 0.00005
Train [117][2060/3239]	Time 0.240 (0.515)	Data Time 0.001 (0.018)	Loss 2.5774 (2.3471)	Entropy 0.53413 (0.53304)	Top-1 acc 65.625 (67.620)	Top-5 acc 82.812 (86.241)	lr 0.00005
Train [117][2070/3239]	Time 0.493 (0.539)	Data Time 0.005 (0.018)	Loss 2.2081 (2.3469)	Entropy 0.53424 (0.53304)	Top-1 acc 72.266 (67.628)	Top-5 acc 89.844 (86.245)	lr 0.00005
Train [117][2080/3239]	Time 0.355 (0.539)	Data Time 0.004 (0.018)	Loss 2.2478 (2.3468)	Entropy 0.53420 (0.53305)	Top-1 acc 71.094 (67.633)	Top-5 acc 87.109 (86.247)	lr 0.00005
Train [117][2090/3239]	Time 0.256 (0.539)	Data Time 0.002 (0.018)	Loss 2.2957 (2.3469)	Entropy 0.53400 (0.53305)	Top-1 acc 67.578 (67.625)	Top-5 acc 87.891 (86.246)	lr 0.00005
Train [117][2100/3239]	Time 0.382 (0.538)	Data Time 0.001 (0.018)	Loss 2.5533 (2.3471)	Entropy 0.53376 (0.53306)	Top-1 acc 57.812 (67.620)	Top-5 acc 85.938 (86.245)	lr 0.00005
Train [117][2110/3239]	Time 0.313 (0.538)	Data Time 0.002 (0.018)	Loss 2.1564 (2.3472)	Entropy 0.53396 (0.53306)	Top-1 acc 70.312 (67.616)	Top-5 acc 88.672 (86.243)	lr 0.00005
Train [117][2120/3239]	Time 0.271 (0.538)	Data Time 0.004 (0.018)	Loss 2.2563 (2.3472)	Entropy 0.53406 (0.53307)	Top-1 acc 71.875 (67.620)	Top-5 acc 88.281 (86.244)	lr 0.00005
Train [117][2130/3239]	Time 0.265 (0.537)	Data Time 0.001 (0.017)	Loss 2.2880 (2.3470)	Entropy 0.53392 (0.53307)	Top-1 acc 68.750 (67.621)	Top-5 acc 87.891 (86.244)	lr 0.00005
Train [117][2140/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.017)	Loss 2.1939 (2.3469)	Entropy 0.53408 (0.53308)	Top-1 acc 70.703 (67.624)	Top-5 acc 89.453 (86.251)	lr 0.00005
Train [117][2150/3239]	Time 0.221 (0.536)	Data Time 0.001 (0.017)	Loss 2.7930 (2.3468)	Entropy 0.53388 (0.53308)	Top-1 acc 56.641 (67.625)	Top-5 acc 78.125 (86.254)	lr 0.00005
Train [117][2160/3239]	Time 0.251 (0.536)	Data Time 0.001 (0.017)	Loss 2.2122 (2.3471)	Entropy 0.53393 (0.53308)	Top-1 acc 70.703 (67.618)	Top-5 acc 89.453 (86.249)	lr 0.00005
Train [117][2170/3239]	Time 0.246 (0.535)	Data Time 0.001 (0.017)	Loss 2.5685 (2.3472)	Entropy 0.53394 (0.53309)	Top-1 acc 60.156 (67.612)	Top-5 acc 80.859 (86.250)	lr 0.00005
Train [117][2180/3239]	Time 0.257 (0.535)	Data Time 0.001 (0.017)	Loss 2.2950 (2.3469)	Entropy 0.53429 (0.53309)	Top-1 acc 69.141 (67.623)	Top-5 acc 89.062 (86.256)	lr 0.00005
Train [117][2190/3239]	Time 0.242 (0.534)	Data Time 0.001 (0.017)	Loss 2.4023 (2.3473)	Entropy 0.53419 (0.53310)	Top-1 acc 66.406 (67.616)	Top-5 acc 85.547 (86.251)	lr 0.00005
Train [117][2200/3239]	Time 0.242 (0.534)	Data Time 0.001 (0.017)	Loss 2.2685 (2.3474)	Entropy 0.53391 (0.53310)	Top-1 acc 68.359 (67.615)	Top-5 acc 88.672 (86.251)	lr 0.00005
Train [117][2210/3239]	Time 0.238 (0.533)	Data Time 0.001 (0.017)	Loss 2.2878 (2.3478)	Entropy 0.53368 (0.53310)	Top-1 acc 69.531 (67.610)	Top-5 acc 86.328 (86.244)	lr 0.00005
Train [117][2220/3239]	Time 0.233 (0.533)	Data Time 0.001 (0.017)	Loss 2.4970 (2.3478)	Entropy 0.53318 (0.53311)	Top-1 acc 67.578 (67.606)	Top-5 acc 82.422 (86.243)	lr 0.00005
Train [117][2230/3239]	Time 0.274 (0.532)	Data Time 0.001 (0.017)	Loss 2.1460 (2.3476)	Entropy 0.53298 (0.53311)	Top-1 acc 75.781 (67.612)	Top-5 acc 90.625 (86.244)	lr 0.00005
Train [117][2240/3239]	Time 0.269 (0.532)	Data Time 0.001 (0.017)	Loss 2.3091 (2.3475)	Entropy 0.53314 (0.53311)	Top-1 acc 67.578 (67.616)	Top-5 acc 88.672 (86.250)	lr 0.00005
Train [117][2250/3239]	Time 0.240 (0.532)	Data Time 0.001 (0.017)	Loss 2.4945 (2.3477)	Entropy 0.53306 (0.53311)	Top-1 acc 61.328 (67.608)	Top-5 acc 85.156 (86.249)	lr 0.00005
Train [117][2260/3239]	Time 0.350 (0.531)	Data Time 0.001 (0.017)	Loss 2.2892 (2.3476)	Entropy 0.53329 (0.53311)	Top-1 acc 66.406 (67.614)	Top-5 acc 86.328 (86.255)	lr 0.00005
Train [117][2270/3239]	Time 0.227 (0.531)	Data Time 0.001 (0.016)	Loss 2.2708 (2.3476)	Entropy 0.53350 (0.53311)	Top-1 acc 69.531 (67.611)	Top-5 acc 86.719 (86.253)	lr 0.00005
Train [117][2280/3239]	Time 0.239 (0.531)	Data Time 0.001 (0.016)	Loss 2.3543 (2.3474)	Entropy 0.53363 (0.53311)	Top-1 acc 68.750 (67.617)	Top-5 acc 87.500 (86.260)	lr 0.00005
Train [117][2290/3239]	Time 0.271 (0.530)	Data Time 0.001 (0.016)	Loss 2.1849 (2.3471)	Entropy 0.53316 (0.53311)	Top-1 acc 70.312 (67.625)	Top-5 acc 90.234 (86.267)	lr 0.00005
Train [117][2300/3239]	Time 0.239 (0.530)	Data Time 0.001 (0.016)	Loss 2.5721 (2.3473)	Entropy 0.53304 (0.53311)	Top-1 acc 62.109 (67.623)	Top-5 acc 82.812 (86.264)	lr 0.00005
Train [117][2310/3239]	Time 0.315 (0.529)	Data Time 0.002 (0.016)	Loss 2.4774 (2.3475)	Entropy 0.53285 (0.53311)	Top-1 acc 67.188 (67.619)	Top-5 acc 82.812 (86.259)	lr 0.00005
Train [117][2320/3239]	Time 0.244 (0.529)	Data Time 0.001 (0.016)	Loss 2.1894 (2.3475)	Entropy 0.53232 (0.53311)	Top-1 acc 74.609 (67.619)	Top-5 acc 86.719 (86.260)	lr 0.00005
Train [117][2330/3239]	Time 0.421 (0.529)	Data Time 0.002 (0.016)	Loss 2.3551 (2.3475)	Entropy 0.53224 (0.53310)	Top-1 acc 68.359 (67.618)	Top-5 acc 84.766 (86.258)	lr 0.00005
Train [117][2340/3239]	Time 0.279 (0.528)	Data Time 0.001 (0.016)	Loss 2.4211 (2.3475)	Entropy 0.53199 (0.53310)	Top-1 acc 66.797 (67.617)	Top-5 acc 84.375 (86.257)	lr 0.00005
Train [117][2350/3239]	Time 0.239 (0.528)	Data Time 0.001 (0.016)	Loss 2.4416 (2.3478)	Entropy 0.53193 (0.53310)	Top-1 acc 66.797 (67.610)	Top-5 acc 87.109 (86.257)	lr 0.00005
Train [117][2360/3239]	Time 0.274 (0.528)	Data Time 0.001 (0.016)	Loss 2.2832 (2.3476)	Entropy 0.53162 (0.53309)	Top-1 acc 69.531 (67.614)	Top-5 acc 88.672 (86.264)	lr 0.00005
Train [117][2370/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.016)	Loss 2.5257 (2.3477)	Entropy 0.53189 (0.53308)	Top-1 acc 65.234 (67.609)	Top-5 acc 85.938 (86.264)	lr 0.00005
Train [117][2380/3239]	Time 0.220 (0.527)	Data Time 0.001 (0.016)	Loss 2.6103 (2.3482)	Entropy 0.53174 (0.53308)	Top-1 acc 65.234 (67.601)	Top-5 acc 83.594 (86.255)	lr 0.00005
Train [117][2390/3239]	Time 0.238 (0.526)	Data Time 0.001 (0.016)	Loss 2.5999 (2.3484)	Entropy 0.53191 (0.53307)	Top-1 acc 63.281 (67.598)	Top-5 acc 83.203 (86.252)	lr 0.00005
Train [117][2400/3239]	Time 0.239 (0.526)	Data Time 0.001 (0.016)	Loss 2.2392 (2.3485)	Entropy 0.53201 (0.53307)	Top-1 acc 68.750 (67.595)	Top-5 acc 89.453 (86.249)	lr 0.00005
Train [117][2410/3239]	Time 0.233 (0.525)	Data Time 0.001 (0.016)	Loss 2.2478 (2.3485)	Entropy 0.53178 (0.53306)	Top-1 acc 70.312 (67.592)	Top-5 acc 88.672 (86.248)	lr 0.00005
Train [117][2420/3239]	Time 0.335 (0.525)	Data Time 0.002 (0.016)	Loss 2.2615 (2.3486)	Entropy 0.53111 (0.53306)	Top-1 acc 72.266 (67.590)	Top-5 acc 87.109 (86.245)	lr 0.00005
Train [117][2430/3239]	Time 0.238 (0.525)	Data Time 0.001 (0.016)	Loss 2.1077 (2.3487)	Entropy 0.53088 (0.53305)	Top-1 acc 73.828 (67.588)	Top-5 acc 91.406 (86.244)	lr 0.00005
Train [117][2440/3239]	Time 0.237 (0.524)	Data Time 0.001 (0.015)	Loss 2.3131 (2.3487)	Entropy 0.53087 (0.53304)	Top-1 acc 67.578 (67.586)	Top-5 acc 87.500 (86.245)	lr 0.00005
Train [117][2450/3239]	Time 0.262 (0.524)	Data Time 0.001 (0.015)	Loss 2.3325 (2.3486)	Entropy 0.53127 (0.53303)	Top-1 acc 68.359 (67.589)	Top-5 acc 87.500 (86.247)	lr 0.00005
Train [117][2460/3239]	Time 0.251 (0.523)	Data Time 0.001 (0.015)	Loss 2.3369 (2.3485)	Entropy 0.53153 (0.53303)	Top-1 acc 66.406 (67.595)	Top-5 acc 88.281 (86.251)	lr 0.00004
Train [117][2470/3239]	Time 0.258 (0.523)	Data Time 0.001 (0.015)	Loss 2.2963 (2.3489)	Entropy 0.53155 (0.53302)	Top-1 acc 70.703 (67.587)	Top-5 acc 85.938 (86.246)	lr 0.00004
Train [117][2480/3239]	Time 0.260 (0.523)	Data Time 0.002 (0.015)	Loss 2.2535 (2.3485)	Entropy 0.53170 (0.53302)	Top-1 acc 68.359 (67.594)	Top-5 acc 87.891 (86.252)	lr 0.00004
Train [117][2490/3239]	Time 0.380 (0.522)	Data Time 0.002 (0.015)	Loss 2.3784 (2.3484)	Entropy 0.53204 (0.53301)	Top-1 acc 66.797 (67.597)	Top-5 acc 85.156 (86.253)	lr 0.00004
Train [117][2500/3239]	Time 0.316 (0.522)	Data Time 0.002 (0.015)	Loss 2.3133 (2.3484)	Entropy 0.53180 (0.53301)	Top-1 acc 70.703 (67.600)	Top-5 acc 87.500 (86.256)	lr 0.00004
Train [117][2510/3239]	Time 0.238 (0.522)	Data Time 0.001 (0.015)	Loss 2.3217 (2.3483)	Entropy 0.53213 (0.53300)	Top-1 acc 69.141 (67.602)	Top-5 acc 84.375 (86.252)	lr 0.00004
Train [117][2520/3239]	Time 0.233 (0.521)	Data Time 0.001 (0.015)	Loss 2.1277 (2.3482)	Entropy 0.53218 (0.53300)	Top-1 acc 73.438 (67.608)	Top-5 acc 91.016 (86.255)	lr 0.00004
Train [117][2530/3239]	Time 0.241 (0.521)	Data Time 0.001 (0.015)	Loss 2.1830 (2.3478)	Entropy 0.53190 (0.53300)	Top-1 acc 68.359 (67.612)	Top-5 acc 88.672 (86.260)	lr 0.00004
Train [117][2540/3239]	Time 0.275 (0.520)	Data Time 0.001 (0.015)	Loss 2.2919 (2.3478)	Entropy 0.53185 (0.53299)	Top-1 acc 69.141 (67.611)	Top-5 acc 88.672 (86.263)	lr 0.00004
Train [117][2550/3239]	Time 0.281 (0.520)	Data Time 0.002 (0.015)	Loss 2.3620 (2.3478)	Entropy 0.53209 (0.53299)	Top-1 acc 67.969 (67.614)	Top-5 acc 88.281 (86.264)	lr 0.00004
Train [117][2560/3239]	Time 0.234 (0.520)	Data Time 0.001 (0.015)	Loss 2.3280 (2.3477)	Entropy 0.53203 (0.53298)	Top-1 acc 71.094 (67.613)	Top-5 acc 87.891 (86.265)	lr 0.00004
Train [117][2570/3239]	Time 0.242 (0.519)	Data Time 0.001 (0.015)	Loss 2.3570 (2.3476)	Entropy 0.53228 (0.53298)	Top-1 acc 69.531 (67.615)	Top-5 acc 88.672 (86.270)	lr 0.00004
Train [117][2580/3239]	Time 0.248 (0.519)	Data Time 0.001 (0.015)	Loss 2.9153 (2.3479)	Entropy 0.53213 (0.53298)	Top-1 acc 55.859 (67.612)	Top-5 acc 72.656 (86.264)	lr 0.00004
Train [117][2590/3239]	Time 0.239 (0.519)	Data Time 0.001 (0.015)	Loss 2.3750 (2.3479)	Entropy 0.53258 (0.53297)	Top-1 acc 66.016 (67.610)	Top-5 acc 85.547 (86.263)	lr 0.00004
Train [117][2600/3239]	Time 0.258 (0.518)	Data Time 0.002 (0.015)	Loss 2.1983 (2.3477)	Entropy 0.53298 (0.53297)	Top-1 acc 71.484 (67.617)	Top-5 acc 88.672 (86.267)	lr 0.00004
Train [117][2610/3239]	Time 0.237 (0.518)	Data Time 0.001 (0.015)	Loss 2.3708 (2.3475)	Entropy 0.53313 (0.53297)	Top-1 acc 68.750 (67.622)	Top-5 acc 86.328 (86.270)	lr 0.00004
Train [117][2620/3239]	Time 0.230 (0.518)	Data Time 0.001 (0.015)	Loss 2.5223 (2.3474)	Entropy 0.53316 (0.53297)	Top-1 acc 61.328 (67.624)	Top-5 acc 82.031 (86.270)	lr 0.00004
Train [117][2630/3239]	Time 0.229 (0.517)	Data Time 0.001 (0.014)	Loss 2.3714 (2.3475)	Entropy 0.53266 (0.53297)	Top-1 acc 67.188 (67.619)	Top-5 acc 85.938 (86.271)	lr 0.00004
Train [117][2640/3239]	Time 0.230 (0.517)	Data Time 0.001 (0.014)	Loss 2.3043 (2.3475)	Entropy 0.53250 (0.53297)	Top-1 acc 68.750 (67.619)	Top-5 acc 87.109 (86.269)	lr 0.00004
Train [117][2650/3239]	Time 0.343 (0.517)	Data Time 0.001 (0.014)	Loss 2.1199 (2.3475)	Entropy 0.53272 (0.53297)	Top-1 acc 71.875 (67.616)	Top-5 acc 92.188 (86.272)	lr 0.00004
Train [117][2660/3239]	Time 0.238 (0.516)	Data Time 0.001 (0.014)	Loss 2.0439 (2.3474)	Entropy 0.53246 (0.53297)	Top-1 acc 75.000 (67.621)	Top-5 acc 91.406 (86.274)	lr 0.00004
Train [117][2670/3239]	Time 0.237 (0.516)	Data Time 0.001 (0.014)	Loss 2.2983 (2.3473)	Entropy 0.53234 (0.53297)	Top-1 acc 67.969 (67.622)	Top-5 acc 87.891 (86.279)	lr 0.00004
Train [117][2680/3239]	Time 0.261 (0.515)	Data Time 0.001 (0.014)	Loss 2.1289 (2.3473)	Entropy 0.53189 (0.53296)	Top-1 acc 72.656 (67.621)	Top-5 acc 89.844 (86.278)	lr 0.00004
Train [117][2690/3239]	Time 0.272 (0.515)	Data Time 0.001 (0.014)	Loss 2.3073 (2.3472)	Entropy 0.53173 (0.53296)	Top-1 acc 69.922 (67.623)	Top-5 acc 86.328 (86.281)	lr 0.00004
Train [117][2700/3239]	Time 0.268 (0.515)	Data Time 0.001 (0.014)	Loss 2.1013 (2.3471)	Entropy 0.53170 (0.53296)	Top-1 acc 75.000 (67.625)	Top-5 acc 87.109 (86.279)	lr 0.00004
Train [117][2710/3239]	Time 0.235 (0.514)	Data Time 0.001 (0.014)	Loss 2.1142 (2.3470)	Entropy 0.53176 (0.53295)	Top-1 acc 74.219 (67.628)	Top-5 acc 90.625 (86.282)	lr 0.00004
Train [117][2720/3239]	Time 0.322 (0.533)	Data Time 0.005 (0.014)	Loss 2.3559 (2.3467)	Entropy 0.53210 (0.53295)	Top-1 acc 68.750 (67.636)	Top-5 acc 85.938 (86.286)	lr 0.00004
Train [117][2730/3239]	Time 0.237 (0.533)	Data Time 0.002 (0.014)	Loss 2.1949 (2.3465)	Entropy 0.53230 (0.53295)	Top-1 acc 71.875 (67.637)	Top-5 acc 89.844 (86.289)	lr 0.00004
Train [117][2740/3239]	Time 0.275 (0.532)	Data Time 0.002 (0.014)	Loss 2.2695 (2.3466)	Entropy 0.53211 (0.53294)	Top-1 acc 67.578 (67.633)	Top-5 acc 88.281 (86.290)	lr 0.00004
Train [117][2750/3239]	Time 0.256 (0.532)	Data Time 0.001 (0.014)	Loss 2.2730 (2.3468)	Entropy 0.53217 (0.53294)	Top-1 acc 68.359 (67.627)	Top-5 acc 87.891 (86.288)	lr 0.00004
Train [117][2760/3239]	Time 0.242 (0.532)	Data Time 0.001 (0.014)	Loss 2.2985 (2.3470)	Entropy 0.53251 (0.53294)	Top-1 acc 67.188 (67.623)	Top-5 acc 88.672 (86.287)	lr 0.00004
Train [117][2770/3239]	Time 0.244 (0.531)	Data Time 0.001 (0.014)	Loss 2.1075 (2.3470)	Entropy 0.53234 (0.53294)	Top-1 acc 73.828 (67.623)	Top-5 acc 90.234 (86.283)	lr 0.00004
Train [117][2780/3239]	Time 0.241 (0.531)	Data Time 0.001 (0.014)	Loss 2.2900 (2.3472)	Entropy 0.53245 (0.53293)	Top-1 acc 71.875 (67.615)	Top-5 acc 87.500 (86.281)	lr 0.00004
Train [117][2790/3239]	Time 0.297 (0.531)	Data Time 0.001 (0.014)	Loss 2.1994 (2.3471)	Entropy 0.53261 (0.53293)	Top-1 acc 71.094 (67.619)	Top-5 acc 89.844 (86.286)	lr 0.00004
Train [117][2800/3239]	Time 0.238 (0.531)	Data Time 0.001 (0.014)	Loss 2.3524 (2.3470)	Entropy 0.53270 (0.53293)	Top-1 acc 68.750 (67.622)	Top-5 acc 85.156 (86.288)	lr 0.00004
Train [117][2810/3239]	Time 0.418 (0.530)	Data Time 0.001 (0.014)	Loss 2.1883 (2.3471)	Entropy 0.53287 (0.53293)	Top-1 acc 69.922 (67.618)	Top-5 acc 88.672 (86.287)	lr 0.00004
Train [117][2820/3239]	Time 0.245 (0.530)	Data Time 0.001 (0.014)	Loss 2.4345 (2.3469)	Entropy 0.53279 (0.53293)	Top-1 acc 66.406 (67.623)	Top-5 acc 84.375 (86.288)	lr 0.00004
Train [117][2830/3239]	Time 0.237 (0.530)	Data Time 0.001 (0.014)	Loss 2.3030 (2.3466)	Entropy 0.53292 (0.53293)	Top-1 acc 67.578 (67.630)	Top-5 acc 87.500 (86.292)	lr 0.00004
Train [117][2840/3239]	Time 0.273 (0.529)	Data Time 0.001 (0.014)	Loss 2.1754 (2.3468)	Entropy 0.53261 (0.53293)	Top-1 acc 71.484 (67.629)	Top-5 acc 88.672 (86.289)	lr 0.00004
Train [117][2850/3239]	Time 0.246 (0.529)	Data Time 0.001 (0.013)	Loss 2.4947 (2.3469)	Entropy 0.53260 (0.53293)	Top-1 acc 63.281 (67.624)	Top-5 acc 82.422 (86.289)	lr 0.00004
Train [117][2860/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.013)	Loss 2.2170 (2.3468)	Entropy 0.53287 (0.53293)	Top-1 acc 69.141 (67.631)	Top-5 acc 89.844 (86.289)	lr 0.00004
Train [117][2870/3239]	Time 0.289 (0.528)	Data Time 0.001 (0.013)	Loss 2.3758 (2.3470)	Entropy 0.53292 (0.53293)	Top-1 acc 67.188 (67.627)	Top-5 acc 85.156 (86.285)	lr 0.00004
Train [117][2880/3239]	Time 0.345 (0.528)	Data Time 0.001 (0.013)	Loss 2.1044 (2.3471)	Entropy 0.53305 (0.53293)	Top-1 acc 73.438 (67.623)	Top-5 acc 90.234 (86.284)	lr 0.00004
Train [117][2890/3239]	Time 0.281 (0.528)	Data Time 0.001 (0.013)	Loss 2.2516 (2.3469)	Entropy 0.53308 (0.53293)	Top-1 acc 67.578 (67.626)	Top-5 acc 89.062 (86.289)	lr 0.00004
Train [117][2900/3239]	Time 0.239 (0.527)	Data Time 0.001 (0.013)	Loss 2.2963 (2.3469)	Entropy 0.53313 (0.53293)	Top-1 acc 68.750 (67.624)	Top-5 acc 85.547 (86.290)	lr 0.00004
Train [117][2910/3239]	Time 0.243 (0.527)	Data Time 0.001 (0.013)	Loss 2.1927 (2.3467)	Entropy 0.53272 (0.53293)	Top-1 acc 70.703 (67.626)	Top-5 acc 91.016 (86.296)	lr 0.00004
Train [117][2920/3239]	Time 0.249 (0.527)	Data Time 0.001 (0.013)	Loss 2.2432 (2.3467)	Entropy 0.53259 (0.53293)	Top-1 acc 71.484 (67.628)	Top-5 acc 86.328 (86.297)	lr 0.00004
Train [117][2930/3239]	Time 0.247 (0.526)	Data Time 0.002 (0.013)	Loss 2.3296 (2.3465)	Entropy 0.53246 (0.53293)	Top-1 acc 69.141 (67.632)	Top-5 acc 85.938 (86.297)	lr 0.00004
Train [117][2940/3239]	Time 0.241 (0.526)	Data Time 0.001 (0.013)	Loss 2.3310 (2.3466)	Entropy 0.53245 (0.53293)	Top-1 acc 69.141 (67.632)	Top-5 acc 87.891 (86.297)	lr 0.00004
Train [117][2950/3239]	Time 0.239 (0.526)	Data Time 0.001 (0.013)	Loss 2.3524 (2.3468)	Entropy 0.53246 (0.53292)	Top-1 acc 65.625 (67.628)	Top-5 acc 86.719 (86.295)	lr 0.00004
Train [117][2960/3239]	Time 0.248 (0.525)	Data Time 0.001 (0.013)	Loss 2.2475 (2.3466)	Entropy 0.53232 (0.53292)	Top-1 acc 68.750 (67.631)	Top-5 acc 89.844 (86.298)	lr 0.00004
Train [117][2970/3239]	Time 0.419 (0.525)	Data Time 0.001 (0.013)	Loss 2.3571 (2.3465)	Entropy 0.53222 (0.53292)	Top-1 acc 66.016 (67.635)	Top-5 acc 84.766 (86.301)	lr 0.00004
Train [117][2980/3239]	Time 0.269 (0.525)	Data Time 0.001 (0.013)	Loss 2.3763 (2.3465)	Entropy 0.53234 (0.53292)	Top-1 acc 66.797 (67.636)	Top-5 acc 85.547 (86.299)	lr 0.00004
Train [117][2990/3239]	Time 0.263 (0.525)	Data Time 0.002 (0.013)	Loss 2.4198 (2.3462)	Entropy 0.53265 (0.53292)	Top-1 acc 67.188 (67.641)	Top-5 acc 84.766 (86.303)	lr 0.00004
Train [117][3000/3239]	Time 0.242 (0.524)	Data Time 0.001 (0.013)	Loss 2.1492 (2.3463)	Entropy 0.53265 (0.53292)	Top-1 acc 72.656 (67.634)	Top-5 acc 90.625 (86.302)	lr 0.00004
Train [117][3010/3239]	Time 0.241 (0.524)	Data Time 0.001 (0.013)	Loss 2.3968 (2.3462)	Entropy 0.53225 (0.53291)	Top-1 acc 68.359 (67.635)	Top-5 acc 86.719 (86.302)	lr 0.00004
Train [117][3020/3239]	Time 0.261 (0.524)	Data Time 0.001 (0.013)	Loss 2.2756 (2.3461)	Entropy 0.53188 (0.53291)	Top-1 acc 72.266 (67.640)	Top-5 acc 86.719 (86.305)	lr 0.00004
Train [117][3030/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.013)	Loss 2.0919 (2.3460)	Entropy 0.53155 (0.53291)	Top-1 acc 73.438 (67.639)	Top-5 acc 89.453 (86.303)	lr 0.00004
Train [117][3040/3239]	Time 0.345 (0.523)	Data Time 0.001 (0.013)	Loss 2.4447 (2.3458)	Entropy 0.53138 (0.53290)	Top-1 acc 65.234 (67.644)	Top-5 acc 85.547 (86.309)	lr 0.00004
Train [117][3050/3239]	Time 0.246 (0.523)	Data Time 0.001 (0.013)	Loss 2.4181 (2.3459)	Entropy 0.53127 (0.53290)	Top-1 acc 66.016 (67.645)	Top-5 acc 85.156 (86.308)	lr 0.00004
Train [117][3060/3239]	Time 0.238 (0.522)	Data Time 0.001 (0.013)	Loss 2.3341 (2.3458)	Entropy 0.53141 (0.53289)	Top-1 acc 69.531 (67.647)	Top-5 acc 85.547 (86.308)	lr 0.00004
Train [117][3070/3239]	Time 0.223 (0.522)	Data Time 0.001 (0.013)	Loss 2.2465 (2.3457)	Entropy 0.53168 (0.53289)	Top-1 acc 72.656 (67.651)	Top-5 acc 85.156 (86.311)	lr 0.00004
Train [117][3080/3239]	Time 0.235 (0.522)	Data Time 0.001 (0.013)	Loss 2.2998 (2.3457)	Entropy 0.53155 (0.53288)	Top-1 acc 69.141 (67.650)	Top-5 acc 88.281 (86.313)	lr 0.00004
Train [117][3090/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.013)	Loss 2.3206 (2.3457)	Entropy 0.53155 (0.53288)	Top-1 acc 68.750 (67.648)	Top-5 acc 84.766 (86.313)	lr 0.00004
Train [117][3100/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.013)	Loss 2.3183 (2.3458)	Entropy 0.53179 (0.53288)	Top-1 acc 66.406 (67.645)	Top-5 acc 85.938 (86.312)	lr 0.00004
Train [117][3110/3239]	Time 0.230 (0.521)	Data Time 0.001 (0.012)	Loss 2.3450 (2.3457)	Entropy 0.53164 (0.53287)	Top-1 acc 67.969 (67.646)	Top-5 acc 87.109 (86.312)	lr 0.00004
Train [117][3120/3239]	Time 0.238 (0.520)	Data Time 0.002 (0.012)	Loss 2.6273 (2.3458)	Entropy 0.53180 (0.53287)	Top-1 acc 60.156 (67.645)	Top-5 acc 81.250 (86.310)	lr 0.00004
Train [117][3130/3239]	Time 0.298 (0.520)	Data Time 0.001 (0.012)	Loss 2.3546 (2.3460)	Entropy 0.53176 (0.53286)	Top-1 acc 63.672 (67.644)	Top-5 acc 87.109 (86.307)	lr 0.00004
Train [117][3140/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.012)	Loss 2.2984 (2.3459)	Entropy 0.53190 (0.53286)	Top-1 acc 71.875 (67.646)	Top-5 acc 86.719 (86.307)	lr 0.00004
Train [117][3150/3239]	Time 0.233 (0.519)	Data Time 0.001 (0.012)	Loss 2.5849 (2.3460)	Entropy 0.53188 (0.53286)	Top-1 acc 61.328 (67.644)	Top-5 acc 81.250 (86.306)	lr 0.00004
Train [117][3160/3239]	Time 0.227 (0.519)	Data Time 0.001 (0.012)	Loss 2.3895 (2.3460)	Entropy 0.53159 (0.53285)	Top-1 acc 68.359 (67.644)	Top-5 acc 84.375 (86.306)	lr 0.00004
Train [117][3170/3239]	Time 0.232 (0.519)	Data Time 0.003 (0.012)	Loss 2.2431 (2.3459)	Entropy 0.53144 (0.53285)	Top-1 acc 71.484 (67.648)	Top-5 acc 89.062 (86.310)	lr 0.00004
Train [117][3180/3239]	Time 0.221 (0.518)	Data Time 0.000 (0.012)	Loss 2.2865 (2.3461)	Entropy 0.53166 (0.53285)	Top-1 acc 66.406 (67.645)	Top-5 acc 84.766 (86.304)	lr 0.00004
Train [117][3190/3239]	Time 0.220 (0.518)	Data Time 0.000 (0.012)	Loss 2.1788 (2.3459)	Entropy 0.53165 (0.53284)	Top-1 acc 69.922 (67.651)	Top-5 acc 89.453 (86.308)	lr 0.00004
Train [117][3200/3239]	Time 0.317 (0.517)	Data Time 0.000 (0.012)	Loss 2.4027 (2.3459)	Entropy 0.53180 (0.53284)	Top-1 acc 65.234 (67.649)	Top-5 acc 83.984 (86.309)	lr 0.00004
Train [117][3210/3239]	Time 0.226 (0.517)	Data Time 0.000 (0.012)	Loss 2.4260 (2.3461)	Entropy 0.53175 (0.53284)	Top-1 acc 66.016 (67.646)	Top-5 acc 83.203 (86.307)	lr 0.00004
Train [117][3220/3239]	Time 0.216 (0.516)	Data Time 0.000 (0.012)	Loss 2.1473 (2.3461)	Entropy 0.53200 (0.53283)	Top-1 acc 73.047 (67.648)	Top-5 acc 89.844 (86.308)	lr 0.00004
Train [117][3230/3239]	Time 0.225 (0.516)	Data Time 0.000 (0.012)	Loss 2.2493 (2.3460)	Entropy 0.53186 (0.53283)	Top-1 acc 70.312 (67.649)	Top-5 acc 88.281 (86.306)	lr 0.00004
Train [117][3239/3239]	Time 0.873 (0.516)	Data Time 0.000 (0.012)	Loss 2.7251 (2.3460)	Entropy 0.53189 (0.53283)	Top-1 acc 60.494 (67.651)	Top-5 acc 77.778 (86.306)	lr 0.00004
==========Valid [117/120]	loss 1.168	top-1 acc 73.178 (73.178)	top-5 acc 90.620	Train top-1 67.651	top-5 86.306	Entropy 0.53189	Latency-None: 0.000ms	Flops: 539.00M
Train [118][0/3239]	Time 36.476 (36.476)	Data Time 35.284 (35.284)	Loss 2.2129 (2.2129)	Entropy 0.53184 (0.53184)	Top-1 acc 73.047 (73.047)	Top-5 acc 89.453 (89.453)	lr 0.00004
Train [118][10/3239]	Time 0.273 (3.816)	Data Time 0.001 (3.209)	Loss 2.3233 (2.3048)	Entropy 0.53153 (0.53179)	Top-1 acc 71.094 (69.673)	Top-5 acc 85.938 (87.038)	lr 0.00004
Train [118][20/3239]	Time 0.241 (2.191)	Data Time 0.001 (1.682)	Loss 2.2787 (2.3460)	Entropy 0.53153 (0.53166)	Top-1 acc 69.141 (68.062)	Top-5 acc 85.547 (86.086)	lr 0.00004
Train [118][30/3239]	Time 0.332 (1.617)	Data Time 0.001 (1.140)	Loss 2.4813 (2.3357)	Entropy 0.53159 (0.53165)	Top-1 acc 62.109 (68.385)	Top-5 acc 83.203 (86.341)	lr 0.00004
Train [118][40/3239]	Time 0.237 (1.323)	Data Time 0.001 (0.862)	Loss 2.1270 (2.3334)	Entropy 0.53173 (0.53165)	Top-1 acc 69.141 (68.226)	Top-5 acc 91.406 (86.366)	lr 0.00004
Train [118][50/3239]	Time 0.224 (1.147)	Data Time 0.001 (0.694)	Loss 2.2563 (2.3362)	Entropy 0.53154 (0.53165)	Top-1 acc 69.531 (68.137)	Top-5 acc 87.500 (86.435)	lr 0.00004
Train [118][60/3239]	Time 0.231 (1.028)	Data Time 0.001 (0.580)	Loss 2.4870 (2.3418)	Entropy 0.53161 (0.53164)	Top-1 acc 66.016 (67.975)	Top-5 acc 83.203 (86.277)	lr 0.00004
Train [118][70/3239]	Time 0.234 (0.942)	Data Time 0.001 (0.499)	Loss 2.4208 (2.3426)	Entropy 0.53171 (0.53163)	Top-1 acc 69.141 (68.013)	Top-5 acc 84.375 (86.174)	lr 0.00004
Train [118][80/3239]	Time 0.243 (0.874)	Data Time 0.001 (0.437)	Loss 2.4979 (2.3437)	Entropy 0.53168 (0.53163)	Top-1 acc 60.547 (67.964)	Top-5 acc 86.328 (86.227)	lr 0.00004
Train [118][90/3239]	Time 0.228 (0.821)	Data Time 0.001 (0.389)	Loss 2.0119 (2.3436)	Entropy 0.53175 (0.53163)	Top-1 acc 78.516 (67.952)	Top-5 acc 91.016 (86.229)	lr 0.00004
Train [118][100/3239]	Time 0.350 (0.782)	Data Time 0.001 (0.351)	Loss 2.4425 (2.3399)	Entropy 0.53157 (0.53163)	Top-1 acc 62.891 (67.969)	Top-5 acc 86.719 (86.332)	lr 0.00004
Train [118][110/3239]	Time 0.236 (0.749)	Data Time 0.001 (0.320)	Loss 2.2934 (2.3334)	Entropy 0.53161 (0.53163)	Top-1 acc 70.312 (68.120)	Top-5 acc 86.328 (86.406)	lr 0.00004
Train [118][120/3239]	Time 0.226 (0.721)	Data Time 0.001 (0.293)	Loss 2.3167 (2.3358)	Entropy 0.53148 (0.53162)	Top-1 acc 66.016 (68.053)	Top-5 acc 86.719 (86.402)	lr 0.00004
Train [118][130/3239]	Time 0.237 (0.699)	Data Time 0.002 (0.271)	Loss 2.9980 (2.3421)	Entropy 0.53163 (0.53161)	Top-1 acc 53.906 (67.927)	Top-5 acc 75.781 (86.292)	lr 0.00004
Train [118][140/3239]	Time 0.238 (1.068)	Data Time 0.002 (0.252)	Loss 2.2268 (2.3485)	Entropy 0.53143 (0.53160)	Top-1 acc 71.094 (67.794)	Top-5 acc 85.938 (86.181)	lr 0.00004
Train [118][150/3239]	Time 0.234 (1.026)	Data Time 0.002 (0.236)	Loss 2.4428 (2.3484)	Entropy 0.53127 (0.53158)	Top-1 acc 63.672 (67.741)	Top-5 acc 83.203 (86.199)	lr 0.00004
Train [118][160/3239]	Time 0.234 (0.989)	Data Time 0.001 (0.221)	Loss 2.6457 (2.3514)	Entropy 0.53135 (0.53157)	Top-1 acc 60.547 (67.668)	Top-5 acc 83.203 (86.185)	lr 0.00004
Train [118][170/3239]	Time 0.248 (0.957)	Data Time 0.001 (0.208)	Loss 2.7346 (2.3523)	Entropy 0.53157 (0.53156)	Top-1 acc 56.641 (67.633)	Top-5 acc 80.469 (86.171)	lr 0.00004
Train [118][180/3239]	Time 0.259 (0.927)	Data Time 0.001 (0.197)	Loss 2.4365 (2.3517)	Entropy 0.53210 (0.53158)	Top-1 acc 64.062 (67.658)	Top-5 acc 85.156 (86.181)	lr 0.00004
Train [118][190/3239]	Time 0.332 (0.900)	Data Time 0.001 (0.187)	Loss 2.3154 (2.3527)	Entropy 0.53228 (0.53161)	Top-1 acc 71.094 (67.621)	Top-5 acc 87.109 (86.162)	lr 0.00004
Train [118][200/3239]	Time 0.228 (0.876)	Data Time 0.001 (0.177)	Loss 2.3316 (2.3522)	Entropy 0.53219 (0.53164)	Top-1 acc 67.188 (67.603)	Top-5 acc 87.109 (86.200)	lr 0.00004
Train [118][210/3239]	Time 0.234 (0.855)	Data Time 0.001 (0.169)	Loss 2.5108 (2.3537)	Entropy 0.53221 (0.53166)	Top-1 acc 63.281 (67.573)	Top-5 acc 82.031 (86.156)	lr 0.00004
Train [118][220/3239]	Time 0.244 (0.836)	Data Time 0.001 (0.161)	Loss 2.5132 (2.3526)	Entropy 0.53188 (0.53168)	Top-1 acc 60.938 (67.562)	Top-5 acc 82.812 (86.171)	lr 0.00004
Train [118][230/3239]	Time 0.248 (0.818)	Data Time 0.001 (0.155)	Loss 2.3162 (2.3496)	Entropy 0.53231 (0.53170)	Top-1 acc 67.188 (67.644)	Top-5 acc 90.234 (86.266)	lr 0.00004
Train [118][240/3239]	Time 0.241 (0.802)	Data Time 0.001 (0.148)	Loss 2.3401 (2.3468)	Entropy 0.53227 (0.53172)	Top-1 acc 66.406 (67.687)	Top-5 acc 87.500 (86.304)	lr 0.00004
Train [118][250/3239]	Time 0.239 (0.787)	Data Time 0.001 (0.142)	Loss 2.3006 (2.3455)	Entropy 0.53245 (0.53175)	Top-1 acc 68.359 (67.712)	Top-5 acc 86.719 (86.317)	lr 0.00004
Train [118][260/3239]	Time 0.412 (0.773)	Data Time 0.002 (0.137)	Loss 2.3887 (2.3480)	Entropy 0.53301 (0.53178)	Top-1 acc 64.453 (67.680)	Top-5 acc 85.156 (86.255)	lr 0.00004
Train [118][270/3239]	Time 0.224 (0.760)	Data Time 0.001 (0.132)	Loss 2.4649 (2.3485)	Entropy 0.53289 (0.53182)	Top-1 acc 62.109 (67.680)	Top-5 acc 83.984 (86.250)	lr 0.00004
Train [118][280/3239]	Time 0.235 (0.748)	Data Time 0.001 (0.127)	Loss 2.2972 (2.3485)	Entropy 0.53300 (0.53186)	Top-1 acc 66.406 (67.675)	Top-5 acc 85.938 (86.228)	lr 0.00004
Train [118][290/3239]	Time 0.307 (0.739)	Data Time 0.002 (0.123)	Loss 2.3499 (2.3496)	Entropy 0.53292 (0.53190)	Top-1 acc 66.406 (67.622)	Top-5 acc 83.203 (86.219)	lr 0.00004
Train [118][300/3239]	Time 0.238 (0.729)	Data Time 0.001 (0.119)	Loss 2.4047 (2.3491)	Entropy 0.53272 (0.53193)	Top-1 acc 65.234 (67.613)	Top-5 acc 86.328 (86.242)	lr 0.00004
Train [118][310/3239]	Time 0.254 (0.720)	Data Time 0.001 (0.115)	Loss 2.3185 (2.3478)	Entropy 0.53242 (0.53195)	Top-1 acc 68.359 (67.640)	Top-5 acc 86.719 (86.268)	lr 0.00004
Train [118][320/3239]	Time 0.244 (0.711)	Data Time 0.001 (0.112)	Loss 2.2629 (2.3490)	Entropy 0.53238 (0.53196)	Top-1 acc 71.875 (67.639)	Top-5 acc 85.938 (86.243)	lr 0.00004
Train [118][330/3239]	Time 0.228 (0.702)	Data Time 0.001 (0.108)	Loss 2.3969 (2.3492)	Entropy 0.53213 (0.53197)	Top-1 acc 67.188 (67.637)	Top-5 acc 84.766 (86.229)	lr 0.00004
Train [118][340/3239]	Time 0.241 (0.694)	Data Time 0.001 (0.105)	Loss 2.2633 (2.3470)	Entropy 0.53183 (0.53197)	Top-1 acc 69.922 (67.681)	Top-5 acc 87.891 (86.263)	lr 0.00004
Train [118][350/3239]	Time 0.328 (0.687)	Data Time 0.001 (0.102)	Loss 2.1053 (2.3467)	Entropy 0.53138 (0.53197)	Top-1 acc 73.828 (67.706)	Top-5 acc 90.625 (86.276)	lr 0.00004
Train [118][360/3239]	Time 0.230 (0.680)	Data Time 0.001 (0.100)	Loss 2.7968 (2.3487)	Entropy 0.53171 (0.53196)	Top-1 acc 56.641 (67.645)	Top-5 acc 80.078 (86.237)	lr 0.00004
Train [118][370/3239]	Time 0.241 (0.672)	Data Time 0.001 (0.097)	Loss 2.5032 (2.3499)	Entropy 0.53165 (0.53195)	Top-1 acc 63.672 (67.627)	Top-5 acc 83.203 (86.221)	lr 0.00004
Train [118][380/3239]	Time 0.232 (0.666)	Data Time 0.001 (0.094)	Loss 2.2590 (2.3490)	Entropy 0.53186 (0.53194)	Top-1 acc 71.484 (67.640)	Top-5 acc 87.109 (86.239)	lr 0.00004
Train [118][390/3239]	Time 0.235 (0.660)	Data Time 0.001 (0.092)	Loss 2.4484 (2.3499)	Entropy 0.53177 (0.53194)	Top-1 acc 67.188 (67.624)	Top-5 acc 83.203 (86.214)	lr 0.00004
Train [118][400/3239]	Time 0.314 (0.655)	Data Time 0.001 (0.090)	Loss 2.3336 (2.3479)	Entropy 0.53189 (0.53194)	Top-1 acc 68.359 (67.678)	Top-5 acc 85.156 (86.245)	lr 0.00004
Train [118][410/3239]	Time 0.256 (0.649)	Data Time 0.003 (0.088)	Loss 2.4159 (2.3486)	Entropy 0.53187 (0.53194)	Top-1 acc 66.016 (67.666)	Top-5 acc 83.594 (86.211)	lr 0.00004
Train [118][420/3239]	Time 0.349 (0.644)	Data Time 0.001 (0.086)	Loss 2.3440 (2.3505)	Entropy 0.53149 (0.53193)	Top-1 acc 65.625 (67.633)	Top-5 acc 87.891 (86.190)	lr 0.00004
Train [118][430/3239]	Time 0.234 (0.639)	Data Time 0.001 (0.084)	Loss 2.2394 (2.3503)	Entropy 0.53155 (0.53192)	Top-1 acc 69.141 (67.641)	Top-5 acc 88.281 (86.196)	lr 0.00004
Train [118][440/3239]	Time 0.235 (0.634)	Data Time 0.001 (0.082)	Loss 2.0883 (2.3503)	Entropy 0.53188 (0.53192)	Top-1 acc 72.656 (67.640)	Top-5 acc 91.797 (86.199)	lr 0.00004
Train [118][450/3239]	Time 0.231 (0.630)	Data Time 0.001 (0.080)	Loss 2.2588 (2.3500)	Entropy 0.53149 (0.53192)	Top-1 acc 68.750 (67.642)	Top-5 acc 87.500 (86.190)	lr 0.00004
Train [118][460/3239]	Time 0.241 (0.625)	Data Time 0.001 (0.078)	Loss 2.3405 (2.3489)	Entropy 0.53169 (0.53191)	Top-1 acc 67.969 (67.673)	Top-5 acc 86.719 (86.215)	lr 0.00003
Train [118][470/3239]	Time 0.268 (0.621)	Data Time 0.001 (0.077)	Loss 2.3835 (2.3508)	Entropy 0.53188 (0.53191)	Top-1 acc 65.625 (67.632)	Top-5 acc 86.719 (86.168)	lr 0.00003
Train [118][480/3239]	Time 0.249 (0.617)	Data Time 0.001 (0.075)	Loss 2.2358 (2.3520)	Entropy 0.53170 (0.53190)	Top-1 acc 70.312 (67.603)	Top-5 acc 90.234 (86.153)	lr 0.00003
Train [118][490/3239]	Time 0.432 (0.615)	Data Time 0.002 (0.074)	Loss 2.2766 (2.3522)	Entropy 0.53179 (0.53190)	Top-1 acc 66.406 (67.590)	Top-5 acc 85.938 (86.158)	lr 0.00003
Train [118][500/3239]	Time 0.230 (0.610)	Data Time 0.001 (0.072)	Loss 2.4455 (2.3527)	Entropy 0.53147 (0.53190)	Top-1 acc 64.062 (67.565)	Top-5 acc 84.375 (86.149)	lr 0.00003
Train [118][510/3239]	Time 0.228 (0.606)	Data Time 0.001 (0.071)	Loss 2.5724 (2.3556)	Entropy 0.53152 (0.53189)	Top-1 acc 64.062 (67.489)	Top-5 acc 80.469 (86.106)	lr 0.00003
Train [118][520/3239]	Time 0.240 (0.603)	Data Time 0.001 (0.070)	Loss 2.2347 (2.3558)	Entropy 0.53145 (0.53188)	Top-1 acc 70.312 (67.490)	Top-5 acc 87.891 (86.102)	lr 0.00003
Train [118][530/3239]	Time 0.253 (0.600)	Data Time 0.001 (0.068)	Loss 2.5313 (2.3569)	Entropy 0.53174 (0.53187)	Top-1 acc 60.938 (67.460)	Top-5 acc 83.203 (86.090)	lr 0.00003
Train [118][540/3239]	Time 0.273 (0.596)	Data Time 0.002 (0.067)	Loss 2.4131 (2.3578)	Entropy 0.53162 (0.53187)	Top-1 acc 66.797 (67.446)	Top-5 acc 85.156 (86.068)	lr 0.00003
Train [118][550/3239]	Time 0.238 (0.593)	Data Time 0.002 (0.066)	Loss 2.2163 (2.3578)	Entropy 0.53174 (0.53187)	Top-1 acc 69.922 (67.467)	Top-5 acc 92.188 (86.074)	lr 0.00003
Train [118][560/3239]	Time 0.239 (0.590)	Data Time 0.001 (0.065)	Loss 2.2707 (2.3574)	Entropy 0.53163 (0.53186)	Top-1 acc 72.266 (67.490)	Top-5 acc 86.719 (86.079)	lr 0.00003
Train [118][570/3239]	Time 0.236 (0.587)	Data Time 0.001 (0.064)	Loss 2.4824 (2.3576)	Entropy 0.53157 (0.53186)	Top-1 acc 65.234 (67.488)	Top-5 acc 85.156 (86.077)	lr 0.00003
Train [118][580/3239]	Time 0.363 (0.584)	Data Time 0.001 (0.063)	Loss 2.3111 (2.3580)	Entropy 0.53111 (0.53185)	Top-1 acc 68.359 (67.464)	Top-5 acc 86.328 (86.063)	lr 0.00003
Train [118][590/3239]	Time 0.294 (0.582)	Data Time 0.001 (0.062)	Loss 2.2009 (2.3573)	Entropy 0.53099 (0.53184)	Top-1 acc 71.094 (67.474)	Top-5 acc 89.062 (86.083)	lr 0.00003
Train [118][600/3239]	Time 0.283 (0.579)	Data Time 0.002 (0.061)	Loss 2.2692 (2.3565)	Entropy 0.53129 (0.53183)	Top-1 acc 70.703 (67.501)	Top-5 acc 87.109 (86.098)	lr 0.00003
Train [118][610/3239]	Time 0.233 (0.577)	Data Time 0.001 (0.060)	Loss 2.5294 (2.3557)	Entropy 0.53089 (0.53181)	Top-1 acc 60.156 (67.514)	Top-5 acc 81.250 (86.109)	lr 0.00003
Train [118][620/3239]	Time 0.235 (0.574)	Data Time 0.001 (0.059)	Loss 2.7340 (2.3562)	Entropy 0.53092 (0.53180)	Top-1 acc 58.203 (67.499)	Top-5 acc 80.078 (86.114)	lr 0.00003
Train [118][630/3239]	Time 0.239 (0.572)	Data Time 0.001 (0.058)	Loss 2.2719 (2.3551)	Entropy 0.53079 (0.53179)	Top-1 acc 68.359 (67.521)	Top-5 acc 88.672 (86.131)	lr 0.00003
Train [118][640/3239]	Time 0.308 (0.570)	Data Time 0.003 (0.057)	Loss 2.5171 (2.3547)	Entropy 0.53075 (0.53177)	Top-1 acc 63.672 (67.522)	Top-5 acc 84.375 (86.132)	lr 0.00003
Train [118][650/3239]	Time 0.387 (0.569)	Data Time 0.001 (0.056)	Loss 2.5737 (2.3553)	Entropy 0.53104 (0.53176)	Top-1 acc 61.328 (67.525)	Top-5 acc 81.250 (86.125)	lr 0.00003
Train [118][660/3239]	Time 0.234 (0.566)	Data Time 0.001 (0.055)	Loss 2.4040 (2.3561)	Entropy 0.53094 (0.53175)	Top-1 acc 66.406 (67.494)	Top-5 acc 84.766 (86.094)	lr 0.00003
Train [118][670/3239]	Time 0.261 (0.564)	Data Time 0.001 (0.054)	Loss 2.4211 (2.3548)	Entropy 0.53068 (0.53173)	Top-1 acc 66.016 (67.537)	Top-5 acc 85.156 (86.112)	lr 0.00003
Train [118][680/3239]	Time 0.233 (0.562)	Data Time 0.002 (0.054)	Loss 2.4236 (2.3549)	Entropy 0.53095 (0.53172)	Top-1 acc 67.578 (67.537)	Top-5 acc 83.984 (86.105)	lr 0.00003
Train [118][690/3239]	Time 0.242 (0.560)	Data Time 0.001 (0.053)	Loss 2.2533 (2.3547)	Entropy 0.53088 (0.53171)	Top-1 acc 67.578 (67.541)	Top-5 acc 90.625 (86.109)	lr 0.00003
Train [118][700/3239]	Time 0.238 (0.558)	Data Time 0.001 (0.052)	Loss 2.2728 (2.3542)	Entropy 0.53115 (0.53169)	Top-1 acc 66.797 (67.551)	Top-5 acc 89.062 (86.128)	lr 0.00003
Train [118][710/3239]	Time 0.215 (0.556)	Data Time 0.001 (0.051)	Loss 2.4978 (2.3544)	Entropy 0.53087 (0.53169)	Top-1 acc 63.281 (67.553)	Top-5 acc 82.422 (86.130)	lr 0.00003
Train [118][720/3239]	Time 0.244 (0.554)	Data Time 0.002 (0.051)	Loss 2.3490 (2.3534)	Entropy 0.53043 (0.53167)	Top-1 acc 66.016 (67.562)	Top-5 acc 85.938 (86.148)	lr 0.00003
Train [118][730/3239]	Time 0.226 (0.552)	Data Time 0.001 (0.050)	Loss 2.5600 (2.3538)	Entropy 0.53042 (0.53165)	Top-1 acc 63.281 (67.557)	Top-5 acc 83.594 (86.141)	lr 0.00003
Train [118][740/3239]	Time 0.340 (0.550)	Data Time 0.001 (0.049)	Loss 2.1807 (2.3529)	Entropy 0.53046 (0.53164)	Top-1 acc 73.047 (67.567)	Top-5 acc 89.453 (86.159)	lr 0.00003
Train [118][750/3239]	Time 0.245 (0.549)	Data Time 0.001 (0.049)	Loss 2.2471 (2.3526)	Entropy 0.53030 (0.53162)	Top-1 acc 68.359 (67.571)	Top-5 acc 89.062 (86.167)	lr 0.00003
Train [118][760/3239]	Time 0.240 (0.547)	Data Time 0.001 (0.048)	Loss 2.2462 (2.3531)	Entropy 0.53059 (0.53160)	Top-1 acc 68.750 (67.549)	Top-5 acc 87.500 (86.159)	lr 0.00003
Train [118][770/3239]	Time 0.264 (0.546)	Data Time 0.002 (0.048)	Loss 2.4163 (2.3532)	Entropy 0.53069 (0.53159)	Top-1 acc 67.969 (67.550)	Top-5 acc 85.547 (86.146)	lr 0.00003
Train [118][780/3239]	Time 0.267 (0.545)	Data Time 0.001 (0.047)	Loss 2.2566 (2.3523)	Entropy 0.53074 (0.53158)	Top-1 acc 66.797 (67.565)	Top-5 acc 86.719 (86.161)	lr 0.00003
Train [118][790/3239]	Time 0.354 (0.606)	Data Time 0.005 (0.047)	Loss 2.6527 (2.3529)	Entropy 0.53055 (0.53157)	Top-1 acc 60.156 (67.550)	Top-5 acc 80.859 (86.151)	lr 0.00003
Train [118][800/3239]	Time 0.246 (0.605)	Data Time 0.002 (0.046)	Loss 2.4335 (2.3531)	Entropy 0.53052 (0.53156)	Top-1 acc 62.109 (67.539)	Top-5 acc 86.719 (86.158)	lr 0.00003
Train [118][810/3239]	Time 0.323 (0.603)	Data Time 0.002 (0.045)	Loss 2.4087 (2.3531)	Entropy 0.53051 (0.53154)	Top-1 acc 68.359 (67.539)	Top-5 acc 82.812 (86.157)	lr 0.00003
Train [118][820/3239]	Time 0.231 (0.600)	Data Time 0.001 (0.045)	Loss 2.5358 (2.3534)	Entropy 0.53035 (0.53153)	Top-1 acc 62.891 (67.533)	Top-5 acc 82.812 (86.158)	lr 0.00003
Train [118][830/3239]	Time 0.263 (0.599)	Data Time 0.002 (0.044)	Loss 2.2226 (2.3525)	Entropy 0.53026 (0.53152)	Top-1 acc 71.875 (67.554)	Top-5 acc 87.109 (86.178)	lr 0.00003
Train [118][840/3239]	Time 0.237 (0.596)	Data Time 0.001 (0.044)	Loss 2.3134 (2.3524)	Entropy 0.53025 (0.53150)	Top-1 acc 69.531 (67.561)	Top-5 acc 88.672 (86.181)	lr 0.00003
Train [118][850/3239]	Time 0.240 (0.594)	Data Time 0.001 (0.043)	Loss 2.2525 (2.3521)	Entropy 0.52993 (0.53148)	Top-1 acc 70.703 (67.568)	Top-5 acc 86.719 (86.185)	lr 0.00003
Train [118][860/3239]	Time 0.229 (0.593)	Data Time 0.001 (0.043)	Loss 2.1686 (2.3516)	Entropy 0.53013 (0.53147)	Top-1 acc 73.047 (67.579)	Top-5 acc 87.891 (86.179)	lr 0.00003
Train [118][870/3239]	Time 0.276 (0.591)	Data Time 0.001 (0.042)	Loss 2.2128 (2.3510)	Entropy 0.53020 (0.53145)	Top-1 acc 71.875 (67.586)	Top-5 acc 87.891 (86.183)	lr 0.00003
Train [118][880/3239]	Time 0.240 (0.589)	Data Time 0.001 (0.042)	Loss 2.4367 (2.3503)	Entropy 0.53011 (0.53144)	Top-1 acc 65.234 (67.608)	Top-5 acc 83.594 (86.204)	lr 0.00003
Train [118][890/3239]	Time 0.224 (0.587)	Data Time 0.001 (0.042)	Loss 2.3689 (2.3505)	Entropy 0.52999 (0.53142)	Top-1 acc 67.578 (67.594)	Top-5 acc 85.547 (86.202)	lr 0.00003
Train [118][900/3239]	Time 0.330 (0.585)	Data Time 0.001 (0.041)	Loss 2.3460 (2.3508)	Entropy 0.53013 (0.53141)	Top-1 acc 69.141 (67.585)	Top-5 acc 86.719 (86.199)	lr 0.00003
Train [118][910/3239]	Time 0.233 (0.583)	Data Time 0.001 (0.041)	Loss 2.2506 (2.3508)	Entropy 0.52988 (0.53139)	Top-1 acc 70.703 (67.588)	Top-5 acc 85.156 (86.193)	lr 0.00003
Train [118][920/3239]	Time 0.227 (0.581)	Data Time 0.001 (0.040)	Loss 2.4351 (2.3509)	Entropy 0.52985 (0.53138)	Top-1 acc 66.797 (67.594)	Top-5 acc 84.766 (86.191)	lr 0.00003
Train [118][930/3239]	Time 0.226 (0.579)	Data Time 0.001 (0.040)	Loss 2.2930 (2.3505)	Entropy 0.52950 (0.53136)	Top-1 acc 69.141 (67.595)	Top-5 acc 87.500 (86.204)	lr 0.00003
Train [118][940/3239]	Time 0.235 (0.578)	Data Time 0.001 (0.039)	Loss 2.1618 (2.3496)	Entropy 0.52964 (0.53134)	Top-1 acc 72.656 (67.616)	Top-5 acc 91.406 (86.224)	lr 0.00003
Train [118][950/3239]	Time 0.232 (0.576)	Data Time 0.001 (0.039)	Loss 2.5793 (2.3503)	Entropy 0.52970 (0.53132)	Top-1 acc 58.594 (67.599)	Top-5 acc 82.422 (86.208)	lr 0.00003
Train [118][960/3239]	Time 0.237 (0.574)	Data Time 0.001 (0.039)	Loss 2.2915 (2.3500)	Entropy 0.52958 (0.53130)	Top-1 acc 65.625 (67.595)	Top-5 acc 86.719 (86.211)	lr 0.00003
Train [118][970/3239]	Time 0.394 (0.573)	Data Time 0.001 (0.038)	Loss 2.1734 (2.3492)	Entropy 0.52968 (0.53129)	Top-1 acc 71.484 (67.609)	Top-5 acc 89.453 (86.230)	lr 0.00003
Train [118][980/3239]	Time 0.248 (0.571)	Data Time 0.001 (0.038)	Loss 2.2350 (2.3487)	Entropy 0.52975 (0.53127)	Top-1 acc 69.531 (67.614)	Top-5 acc 91.797 (86.248)	lr 0.00003
Train [118][990/3239]	Time 0.247 (0.570)	Data Time 0.001 (0.037)	Loss 2.3093 (2.3493)	Entropy 0.52988 (0.53126)	Top-1 acc 69.922 (67.597)	Top-5 acc 87.891 (86.239)	lr 0.00003
Train [118][1000/3239]	Time 0.254 (0.569)	Data Time 0.001 (0.037)	Loss 2.3638 (2.3498)	Entropy 0.53007 (0.53124)	Top-1 acc 67.188 (67.581)	Top-5 acc 85.938 (86.228)	lr 0.00003
Train [118][1010/3239]	Time 0.244 (0.567)	Data Time 0.001 (0.037)	Loss 2.1897 (2.3507)	Entropy 0.53034 (0.53123)	Top-1 acc 69.141 (67.558)	Top-5 acc 91.016 (86.220)	lr 0.00003
Train [118][1020/3239]	Time 0.269 (0.566)	Data Time 0.001 (0.036)	Loss 2.8215 (2.3506)	Entropy 0.53012 (0.53122)	Top-1 acc 58.203 (67.567)	Top-5 acc 79.297 (86.220)	lr 0.00003
Train [118][1030/3239]	Time 0.246 (0.565)	Data Time 0.001 (0.036)	Loss 2.4909 (2.3508)	Entropy 0.53035 (0.53121)	Top-1 acc 65.234 (67.554)	Top-5 acc 84.766 (86.213)	lr 0.00003
Train [118][1040/3239]	Time 0.236 (0.564)	Data Time 0.001 (0.036)	Loss 2.5208 (2.3501)	Entropy 0.52990 (0.53120)	Top-1 acc 64.453 (67.574)	Top-5 acc 82.812 (86.228)	lr 0.00003
Train [118][1050/3239]	Time 0.266 (0.562)	Data Time 0.001 (0.035)	Loss 2.2555 (2.3498)	Entropy 0.52971 (0.53119)	Top-1 acc 65.625 (67.578)	Top-5 acc 86.719 (86.231)	lr 0.00003
Train [118][1060/3239]	Time 0.230 (0.561)	Data Time 0.001 (0.035)	Loss 2.2342 (2.3496)	Entropy 0.52975 (0.53118)	Top-1 acc 70.703 (67.570)	Top-5 acc 85.938 (86.231)	lr 0.00003
Train [118][1070/3239]	Time 0.235 (0.560)	Data Time 0.001 (0.035)	Loss 2.4811 (2.3493)	Entropy 0.52991 (0.53117)	Top-1 acc 62.891 (67.579)	Top-5 acc 86.328 (86.239)	lr 0.00003
Train [118][1080/3239]	Time 0.220 (0.558)	Data Time 0.001 (0.034)	Loss 2.4222 (2.3493)	Entropy 0.52989 (0.53115)	Top-1 acc 67.969 (67.582)	Top-5 acc 85.156 (86.242)	lr 0.00003
Train [118][1090/3239]	Time 0.227 (0.557)	Data Time 0.001 (0.034)	Loss 2.3895 (2.3492)	Entropy 0.52984 (0.53114)	Top-1 acc 63.672 (67.582)	Top-5 acc 85.938 (86.248)	lr 0.00003
Train [118][1100/3239]	Time 0.227 (0.556)	Data Time 0.001 (0.034)	Loss 2.1952 (2.3490)	Entropy 0.52970 (0.53113)	Top-1 acc 70.312 (67.587)	Top-5 acc 88.672 (86.251)	lr 0.00003
Train [118][1110/3239]	Time 0.233 (0.555)	Data Time 0.001 (0.034)	Loss 2.2088 (2.3488)	Entropy 0.52940 (0.53111)	Top-1 acc 71.484 (67.601)	Top-5 acc 87.891 (86.261)	lr 0.00003
Train [118][1120/3239]	Time 0.232 (0.553)	Data Time 0.001 (0.033)	Loss 2.3625 (2.3490)	Entropy 0.52954 (0.53110)	Top-1 acc 69.531 (67.601)	Top-5 acc 87.500 (86.260)	lr 0.00003
Train [118][1130/3239]	Time 0.331 (0.552)	Data Time 0.001 (0.033)	Loss 2.3118 (2.3485)	Entropy 0.52973 (0.53108)	Top-1 acc 69.531 (67.612)	Top-5 acc 86.719 (86.268)	lr 0.00003
Train [118][1140/3239]	Time 0.241 (0.551)	Data Time 0.002 (0.033)	Loss 2.2543 (2.3488)	Entropy 0.52989 (0.53107)	Top-1 acc 69.922 (67.607)	Top-5 acc 87.891 (86.262)	lr 0.00003
Train [118][1150/3239]	Time 0.238 (0.550)	Data Time 0.001 (0.032)	Loss 2.1719 (2.3489)	Entropy 0.53003 (0.53106)	Top-1 acc 70.703 (67.602)	Top-5 acc 89.062 (86.257)	lr 0.00003
Train [118][1160/3239]	Time 0.232 (0.549)	Data Time 0.001 (0.032)	Loss 2.1643 (2.3484)	Entropy 0.53004 (0.53106)	Top-1 acc 70.312 (67.618)	Top-5 acc 89.062 (86.262)	lr 0.00003
Train [118][1170/3239]	Time 0.243 (0.547)	Data Time 0.001 (0.032)	Loss 2.2683 (2.3490)	Entropy 0.52960 (0.53105)	Top-1 acc 70.703 (67.603)	Top-5 acc 91.016 (86.257)	lr 0.00003
Train [118][1180/3239]	Time 0.234 (0.546)	Data Time 0.001 (0.032)	Loss 2.3410 (2.3491)	Entropy 0.52920 (0.53103)	Top-1 acc 65.234 (67.598)	Top-5 acc 87.891 (86.254)	lr 0.00003
Train [118][1190/3239]	Time 0.226 (0.545)	Data Time 0.001 (0.031)	Loss 2.5129 (2.3487)	Entropy 0.52912 (0.53102)	Top-1 acc 62.500 (67.596)	Top-5 acc 86.328 (86.262)	lr 0.00003
Train [118][1200/3239]	Time 0.323 (0.544)	Data Time 0.001 (0.031)	Loss 2.4632 (2.3488)	Entropy 0.52946 (0.53100)	Top-1 acc 63.672 (67.591)	Top-5 acc 84.375 (86.257)	lr 0.00003
Train [118][1210/3239]	Time 0.235 (0.543)	Data Time 0.001 (0.031)	Loss 2.6038 (2.3495)	Entropy 0.52930 (0.53099)	Top-1 acc 58.984 (67.578)	Top-5 acc 85.938 (86.244)	lr 0.00003
Train [118][1220/3239]	Time 0.236 (0.542)	Data Time 0.001 (0.031)	Loss 2.3464 (2.3495)	Entropy 0.52961 (0.53097)	Top-1 acc 67.188 (67.581)	Top-5 acc 86.328 (86.244)	lr 0.00003
Train [118][1230/3239]	Time 0.234 (0.541)	Data Time 0.001 (0.031)	Loss 2.2787 (2.3495)	Entropy 0.52960 (0.53096)	Top-1 acc 70.312 (67.579)	Top-5 acc 87.891 (86.243)	lr 0.00003
Train [118][1240/3239]	Time 0.237 (0.540)	Data Time 0.001 (0.030)	Loss 2.2196 (2.3497)	Entropy 0.52948 (0.53095)	Top-1 acc 67.969 (67.577)	Top-5 acc 88.281 (86.241)	lr 0.00003
Train [118][1250/3239]	Time 0.249 (0.539)	Data Time 0.001 (0.030)	Loss 2.4144 (2.3494)	Entropy 0.52967 (0.53094)	Top-1 acc 62.109 (67.580)	Top-5 acc 87.109 (86.246)	lr 0.00003
Train [118][1260/3239]	Time 0.241 (0.538)	Data Time 0.001 (0.030)	Loss 2.2675 (2.3488)	Entropy 0.53009 (0.53093)	Top-1 acc 67.969 (67.594)	Top-5 acc 87.109 (86.256)	lr 0.00003
Train [118][1270/3239]	Time 0.275 (0.537)	Data Time 0.001 (0.030)	Loss 2.0981 (2.3486)	Entropy 0.53009 (0.53093)	Top-1 acc 73.438 (67.599)	Top-5 acc 90.234 (86.260)	lr 0.00003
Train [118][1280/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.029)	Loss 2.2624 (2.3485)	Entropy 0.53026 (0.53092)	Top-1 acc 72.266 (67.601)	Top-5 acc 86.328 (86.260)	lr 0.00003
Train [118][1290/3239]	Time 0.366 (0.535)	Data Time 0.001 (0.029)	Loss 2.3453 (2.3487)	Entropy 0.52981 (0.53091)	Top-1 acc 66.406 (67.600)	Top-5 acc 87.500 (86.251)	lr 0.00003
Train [118][1300/3239]	Time 0.225 (0.534)	Data Time 0.001 (0.029)	Loss 2.7196 (2.3490)	Entropy 0.52995 (0.53091)	Top-1 acc 55.078 (67.589)	Top-5 acc 81.250 (86.246)	lr 0.00003
Train [118][1310/3239]	Time 0.234 (0.533)	Data Time 0.001 (0.029)	Loss 2.2899 (2.3490)	Entropy 0.53029 (0.53090)	Top-1 acc 68.359 (67.585)	Top-5 acc 88.281 (86.248)	lr 0.00003
Train [118][1320/3239]	Time 0.236 (0.532)	Data Time 0.001 (0.029)	Loss 2.5115 (2.3494)	Entropy 0.53056 (0.53090)	Top-1 acc 62.109 (67.570)	Top-5 acc 85.156 (86.235)	lr 0.00003
Train [118][1330/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.028)	Loss 2.4626 (2.3492)	Entropy 0.53058 (0.53089)	Top-1 acc 65.625 (67.577)	Top-5 acc 82.422 (86.240)	lr 0.00003
Train [118][1340/3239]	Time 0.221 (0.531)	Data Time 0.001 (0.028)	Loss 2.4181 (2.3492)	Entropy 0.53069 (0.53089)	Top-1 acc 66.016 (67.575)	Top-5 acc 83.984 (86.237)	lr 0.00003
Train [118][1350/3239]	Time 0.231 (0.530)	Data Time 0.001 (0.028)	Loss 2.3799 (2.3490)	Entropy 0.53034 (0.53089)	Top-1 acc 65.234 (67.579)	Top-5 acc 85.156 (86.241)	lr 0.00003
Train [118][1360/3239]	Time 0.340 (0.529)	Data Time 0.001 (0.028)	Loss 2.3842 (2.3491)	Entropy 0.53030 (0.53088)	Top-1 acc 64.062 (67.576)	Top-5 acc 86.719 (86.244)	lr 0.00003
Train [118][1370/3239]	Time 0.235 (0.528)	Data Time 0.001 (0.028)	Loss 2.2660 (2.3497)	Entropy 0.53048 (0.53088)	Top-1 acc 69.922 (67.565)	Top-5 acc 88.281 (86.236)	lr 0.00003
Train [118][1380/3239]	Time 0.237 (0.527)	Data Time 0.001 (0.027)	Loss 2.3867 (2.3495)	Entropy 0.53024 (0.53088)	Top-1 acc 68.750 (67.570)	Top-5 acc 86.328 (86.240)	lr 0.00003
Train [118][1390/3239]	Time 0.227 (0.527)	Data Time 0.001 (0.027)	Loss 2.4640 (2.3502)	Entropy 0.53023 (0.53087)	Top-1 acc 60.938 (67.553)	Top-5 acc 85.156 (86.231)	lr 0.00003
Train [118][1400/3239]	Time 0.229 (0.526)	Data Time 0.001 (0.027)	Loss 2.2088 (2.3503)	Entropy 0.53040 (0.53087)	Top-1 acc 71.484 (67.551)	Top-5 acc 89.062 (86.231)	lr 0.00003
Train [118][1410/3239]	Time 0.238 (0.525)	Data Time 0.001 (0.027)	Loss 2.3361 (2.3502)	Entropy 0.52986 (0.53086)	Top-1 acc 67.188 (67.549)	Top-5 acc 87.109 (86.235)	lr 0.00003
Train [118][1420/3239]	Time 0.226 (0.524)	Data Time 0.001 (0.027)	Loss 2.3817 (2.3504)	Entropy 0.52979 (0.53086)	Top-1 acc 69.141 (67.543)	Top-5 acc 83.203 (86.230)	lr 0.00003
Train [118][1430/3239]	Time 0.244 (0.524)	Data Time 0.002 (0.026)	Loss 2.4001 (2.3503)	Entropy 0.52995 (0.53085)	Top-1 acc 66.016 (67.546)	Top-5 acc 85.156 (86.233)	lr 0.00003
Train [118][1440/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.026)	Loss 2.5605 (2.3497)	Entropy 0.52987 (0.53084)	Top-1 acc 61.328 (67.560)	Top-5 acc 83.594 (86.242)	lr 0.00003
Train [118][1450/3239]	Time 0.362 (0.557)	Data Time 0.002 (0.026)	Loss 2.2753 (2.3494)	Entropy 0.52986 (0.53084)	Top-1 acc 68.750 (67.568)	Top-5 acc 89.062 (86.246)	lr 0.00003
Train [118][1460/3239]	Time 0.302 (0.557)	Data Time 0.002 (0.026)	Loss 2.3245 (2.3490)	Entropy 0.52978 (0.53083)	Top-1 acc 67.578 (67.577)	Top-5 acc 86.328 (86.256)	lr 0.00003
Train [118][1470/3239]	Time 0.356 (0.557)	Data Time 0.002 (0.026)	Loss 2.3388 (2.3490)	Entropy 0.52976 (0.53082)	Top-1 acc 66.016 (67.565)	Top-5 acc 85.938 (86.259)	lr 0.00003
Train [118][1480/3239]	Time 0.242 (0.557)	Data Time 0.002 (0.026)	Loss 2.2022 (2.3490)	Entropy 0.52947 (0.53081)	Top-1 acc 71.875 (67.568)	Top-5 acc 85.938 (86.253)	lr 0.00003
Train [118][1490/3239]	Time 0.229 (0.556)	Data Time 0.001 (0.025)	Loss 2.4372 (2.3491)	Entropy 0.52929 (0.53080)	Top-1 acc 62.891 (67.562)	Top-5 acc 84.766 (86.252)	lr 0.00003
Train [118][1500/3239]	Time 0.237 (0.555)	Data Time 0.001 (0.025)	Loss 2.4708 (2.3484)	Entropy 0.52942 (0.53079)	Top-1 acc 63.672 (67.577)	Top-5 acc 85.938 (86.264)	lr 0.00003
Train [118][1510/3239]	Time 0.256 (0.554)	Data Time 0.001 (0.025)	Loss 2.3547 (2.3484)	Entropy 0.52879 (0.53078)	Top-1 acc 66.016 (67.578)	Top-5 acc 86.328 (86.267)	lr 0.00003
Train [118][1520/3239]	Time 0.314 (0.553)	Data Time 0.001 (0.025)	Loss 2.3161 (2.3483)	Entropy 0.52876 (0.53077)	Top-1 acc 67.578 (67.583)	Top-5 acc 87.500 (86.269)	lr 0.00003
Train [118][1530/3239]	Time 0.234 (0.552)	Data Time 0.001 (0.025)	Loss 2.2576 (2.3483)	Entropy 0.52895 (0.53076)	Top-1 acc 69.531 (67.586)	Top-5 acc 88.281 (86.275)	lr 0.00003
Train [118][1540/3239]	Time 0.238 (0.551)	Data Time 0.001 (0.025)	Loss 2.2746 (2.3476)	Entropy 0.52868 (0.53074)	Top-1 acc 70.312 (67.610)	Top-5 acc 86.719 (86.285)	lr 0.00003
Train [118][1550/3239]	Time 0.242 (0.551)	Data Time 0.001 (0.025)	Loss 2.4516 (2.3476)	Entropy 0.52873 (0.53073)	Top-1 acc 63.672 (67.607)	Top-5 acc 85.156 (86.290)	lr 0.00003
Train [118][1560/3239]	Time 0.229 (0.550)	Data Time 0.001 (0.024)	Loss 2.3899 (2.3475)	Entropy 0.52822 (0.53072)	Top-1 acc 66.016 (67.610)	Top-5 acc 85.156 (86.295)	lr 0.00003
Train [118][1570/3239]	Time 0.238 (0.549)	Data Time 0.001 (0.024)	Loss 2.4301 (2.3474)	Entropy 0.52810 (0.53070)	Top-1 acc 68.359 (67.612)	Top-5 acc 84.375 (86.295)	lr 0.00003
Train [118][1580/3239]	Time 0.228 (0.548)	Data Time 0.001 (0.024)	Loss 2.2945 (2.3475)	Entropy 0.52842 (0.53069)	Top-1 acc 71.094 (67.608)	Top-5 acc 88.281 (86.294)	lr 0.00003
Train [118][1590/3239]	Time 0.259 (0.548)	Data Time 0.002 (0.024)	Loss 2.3529 (2.3478)	Entropy 0.52889 (0.53067)	Top-1 acc 65.625 (67.601)	Top-5 acc 86.328 (86.293)	lr 0.00003
Train [118][1600/3239]	Time 0.229 (0.547)	Data Time 0.001 (0.024)	Loss 2.3523 (2.3476)	Entropy 0.52909 (0.53066)	Top-1 acc 67.969 (67.605)	Top-5 acc 83.594 (86.294)	lr 0.00003
Train [118][1610/3239]	Time 0.292 (0.546)	Data Time 0.001 (0.024)	Loss 2.3919 (2.3475)	Entropy 0.52918 (0.53065)	Top-1 acc 66.016 (67.606)	Top-5 acc 84.766 (86.294)	lr 0.00003
Train [118][1620/3239]	Time 0.223 (0.545)	Data Time 0.001 (0.024)	Loss 2.3178 (2.3473)	Entropy 0.52925 (0.53064)	Top-1 acc 64.844 (67.611)	Top-5 acc 89.062 (86.299)	lr 0.00003
Train [118][1630/3239]	Time 0.220 (0.544)	Data Time 0.001 (0.023)	Loss 2.3825 (2.3473)	Entropy 0.52917 (0.53063)	Top-1 acc 69.141 (67.608)	Top-5 acc 85.547 (86.296)	lr 0.00003
Train [118][1640/3239]	Time 0.222 (0.543)	Data Time 0.001 (0.023)	Loss 2.6719 (2.3474)	Entropy 0.52883 (0.53062)	Top-1 acc 58.984 (67.607)	Top-5 acc 82.812 (86.297)	lr 0.00003
Train [118][1650/3239]	Time 0.229 (0.543)	Data Time 0.001 (0.023)	Loss 2.4705 (2.3478)	Entropy 0.52894 (0.53061)	Top-1 acc 63.672 (67.596)	Top-5 acc 85.938 (86.292)	lr 0.00003
Train [118][1660/3239]	Time 0.233 (0.542)	Data Time 0.001 (0.023)	Loss 2.2790 (2.3476)	Entropy 0.52903 (0.53060)	Top-1 acc 70.703 (67.606)	Top-5 acc 87.500 (86.294)	lr 0.00003
Train [118][1670/3239]	Time 0.235 (0.542)	Data Time 0.001 (0.023)	Loss 2.0982 (2.3477)	Entropy 0.52938 (0.53059)	Top-1 acc 73.828 (67.602)	Top-5 acc 89.453 (86.290)	lr 0.00003
Train [118][1680/3239]	Time 0.329 (0.541)	Data Time 0.001 (0.023)	Loss 2.2063 (2.3472)	Entropy 0.52943 (0.53059)	Top-1 acc 70.703 (67.617)	Top-5 acc 89.062 (86.300)	lr 0.00003
Train [118][1690/3239]	Time 0.236 (0.540)	Data Time 0.001 (0.023)	Loss 2.1876 (2.3473)	Entropy 0.52959 (0.53058)	Top-1 acc 71.484 (67.615)	Top-5 acc 89.453 (86.300)	lr 0.00003
Train [118][1700/3239]	Time 0.222 (0.539)	Data Time 0.001 (0.023)	Loss 2.3409 (2.3467)	Entropy 0.52927 (0.53058)	Top-1 acc 67.578 (67.625)	Top-5 acc 87.109 (86.316)	lr 0.00003
Train [118][1710/3239]	Time 0.232 (0.539)	Data Time 0.004 (0.022)	Loss 2.2861 (2.3468)	Entropy 0.52918 (0.53057)	Top-1 acc 68.750 (67.627)	Top-5 acc 85.156 (86.313)	lr 0.00003
Train [118][1720/3239]	Time 0.231 (0.538)	Data Time 0.001 (0.022)	Loss 2.5647 (2.3469)	Entropy 0.52924 (0.53056)	Top-1 acc 64.453 (67.625)	Top-5 acc 82.031 (86.311)	lr 0.00003
Train [118][1730/3239]	Time 0.231 (0.537)	Data Time 0.001 (0.022)	Loss 2.2370 (2.3467)	Entropy 0.52906 (0.53055)	Top-1 acc 70.312 (67.636)	Top-5 acc 88.281 (86.317)	lr 0.00003
Train [118][1740/3239]	Time 0.243 (0.536)	Data Time 0.001 (0.022)	Loss 2.3254 (2.3469)	Entropy 0.52915 (0.53054)	Top-1 acc 69.922 (67.631)	Top-5 acc 87.500 (86.315)	lr 0.00003
Train [118][1750/3239]	Time 0.366 (0.536)	Data Time 0.001 (0.022)	Loss 2.1468 (2.3469)	Entropy 0.52929 (0.53054)	Top-1 acc 71.875 (67.627)	Top-5 acc 87.109 (86.313)	lr 0.00003
Train [118][1760/3239]	Time 0.238 (0.535)	Data Time 0.001 (0.022)	Loss 2.2082 (2.3466)	Entropy 0.52912 (0.53053)	Top-1 acc 72.266 (67.635)	Top-5 acc 87.891 (86.315)	lr 0.00003
Train [118][1770/3239]	Time 0.252 (0.535)	Data Time 0.001 (0.022)	Loss 2.2480 (2.3466)	Entropy 0.52908 (0.53052)	Top-1 acc 71.484 (67.637)	Top-5 acc 86.719 (86.314)	lr 0.00003
Train [118][1780/3239]	Time 0.244 (0.534)	Data Time 0.001 (0.022)	Loss 2.8985 (2.3468)	Entropy 0.52906 (0.53051)	Top-1 acc 55.859 (67.633)	Top-5 acc 76.562 (86.315)	lr 0.00003
Train [118][1790/3239]	Time 0.220 (0.533)	Data Time 0.001 (0.021)	Loss 2.2285 (2.3467)	Entropy 0.52916 (0.53050)	Top-1 acc 70.312 (67.636)	Top-5 acc 88.281 (86.320)	lr 0.00003
Train [118][1800/3239]	Time 0.214 (0.533)	Data Time 0.001 (0.021)	Loss 2.8251 (2.3471)	Entropy 0.52940 (0.53050)	Top-1 acc 52.734 (67.619)	Top-5 acc 81.250 (86.311)	lr 0.00003
Train [118][1810/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.021)	Loss 2.3264 (2.3475)	Entropy 0.52939 (0.53049)	Top-1 acc 68.359 (67.610)	Top-5 acc 85.547 (86.310)	lr 0.00003
Train [118][1820/3239]	Time 0.243 (0.531)	Data Time 0.001 (0.021)	Loss 2.6781 (2.3478)	Entropy 0.52949 (0.53049)	Top-1 acc 60.938 (67.606)	Top-5 acc 78.906 (86.303)	lr 0.00003
Train [118][1830/3239]	Time 0.231 (0.531)	Data Time 0.001 (0.021)	Loss 2.5959 (2.3478)	Entropy 0.52961 (0.53048)	Top-1 acc 62.500 (67.606)	Top-5 acc 82.422 (86.301)	lr 0.00003
Train [118][1840/3239]	Time 0.327 (0.530)	Data Time 0.001 (0.021)	Loss 2.4423 (2.3477)	Entropy 0.52940 (0.53047)	Top-1 acc 67.188 (67.609)	Top-5 acc 83.203 (86.300)	lr 0.00003
Train [118][1850/3239]	Time 0.225 (0.529)	Data Time 0.001 (0.021)	Loss 2.2324 (2.3476)	Entropy 0.52928 (0.53047)	Top-1 acc 68.359 (67.604)	Top-5 acc 87.109 (86.301)	lr 0.00003
Train [118][1860/3239]	Time 0.233 (0.529)	Data Time 0.001 (0.021)	Loss 2.4781 (2.3473)	Entropy 0.52943 (0.53046)	Top-1 acc 66.016 (67.610)	Top-5 acc 83.984 (86.304)	lr 0.00003
Train [118][1870/3239]	Time 0.224 (0.528)	Data Time 0.001 (0.021)	Loss 2.2442 (2.3473)	Entropy 0.52946 (0.53046)	Top-1 acc 69.531 (67.605)	Top-5 acc 87.500 (86.303)	lr 0.00003
Train [118][1880/3239]	Time 0.256 (0.528)	Data Time 0.001 (0.021)	Loss 2.2197 (2.3475)	Entropy 0.52968 (0.53045)	Top-1 acc 70.312 (67.598)	Top-5 acc 88.281 (86.299)	lr 0.00003
Train [118][1890/3239]	Time 0.230 (0.527)	Data Time 0.001 (0.020)	Loss 2.2477 (2.3472)	Entropy 0.52971 (0.53045)	Top-1 acc 68.359 (67.608)	Top-5 acc 88.281 (86.308)	lr 0.00003
Train [118][1900/3239]	Time 0.223 (0.527)	Data Time 0.001 (0.020)	Loss 2.4233 (2.3468)	Entropy 0.52999 (0.53044)	Top-1 acc 63.281 (67.616)	Top-5 acc 85.938 (86.318)	lr 0.00002
Train [118][1910/3239]	Time 0.313 (0.526)	Data Time 0.001 (0.020)	Loss 2.2723 (2.3470)	Entropy 0.52998 (0.53044)	Top-1 acc 67.578 (67.609)	Top-5 acc 88.672 (86.317)	lr 0.00002
Train [118][1920/3239]	Time 0.241 (0.525)	Data Time 0.002 (0.020)	Loss 2.2339 (2.3468)	Entropy 0.53020 (0.53044)	Top-1 acc 69.531 (67.613)	Top-5 acc 89.453 (86.318)	lr 0.00002
Train [118][1930/3239]	Time 0.227 (0.525)	Data Time 0.001 (0.020)	Loss 2.3191 (2.3468)	Entropy 0.53022 (0.53044)	Top-1 acc 66.016 (67.614)	Top-5 acc 86.328 (86.314)	lr 0.00002
Train [118][1940/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.020)	Loss 2.4152 (2.3470)	Entropy 0.53057 (0.53044)	Top-1 acc 64.453 (67.612)	Top-5 acc 85.156 (86.311)	lr 0.00002
Train [118][1950/3239]	Time 0.227 (0.523)	Data Time 0.001 (0.020)	Loss 2.5744 (2.3472)	Entropy 0.53084 (0.53044)	Top-1 acc 61.328 (67.608)	Top-5 acc 83.203 (86.307)	lr 0.00002
Train [118][1960/3239]	Time 0.208 (0.523)	Data Time 0.001 (0.020)	Loss 2.6902 (2.3471)	Entropy 0.53087 (0.53044)	Top-1 acc 57.812 (67.607)	Top-5 acc 83.594 (86.309)	lr 0.00002
Train [118][1970/3239]	Time 0.245 (0.522)	Data Time 0.006 (0.020)	Loss 2.3811 (2.3473)	Entropy 0.53112 (0.53044)	Top-1 acc 67.969 (67.602)	Top-5 acc 86.328 (86.307)	lr 0.00002
Train [118][1980/3239]	Time 0.245 (0.522)	Data Time 0.002 (0.020)	Loss 2.2092 (2.3470)	Entropy 0.53124 (0.53045)	Top-1 acc 71.875 (67.603)	Top-5 acc 88.672 (86.314)	lr 0.00002
Train [118][1990/3239]	Time 0.240 (0.521)	Data Time 0.001 (0.019)	Loss 2.1789 (2.3469)	Entropy 0.53094 (0.53045)	Top-1 acc 73.047 (67.611)	Top-5 acc 89.844 (86.317)	lr 0.00002
Train [118][2000/3239]	Time 0.261 (0.521)	Data Time 0.001 (0.019)	Loss 2.0726 (2.3466)	Entropy 0.53088 (0.53045)	Top-1 acc 72.266 (67.615)	Top-5 acc 90.234 (86.317)	lr 0.00002
Train [118][2010/3239]	Time 0.238 (0.520)	Data Time 0.001 (0.019)	Loss 2.2025 (2.3467)	Entropy 0.53096 (0.53046)	Top-1 acc 69.141 (67.609)	Top-5 acc 88.281 (86.317)	lr 0.00002
Train [118][2020/3239]	Time 0.234 (0.520)	Data Time 0.001 (0.019)	Loss 2.4208 (2.3472)	Entropy 0.53048 (0.53046)	Top-1 acc 65.234 (67.597)	Top-5 acc 83.984 (86.310)	lr 0.00002
Train [118][2030/3239]	Time 0.236 (0.519)	Data Time 0.001 (0.019)	Loss 2.3149 (2.3472)	Entropy 0.53071 (0.53046)	Top-1 acc 66.016 (67.594)	Top-5 acc 85.547 (86.309)	lr 0.00002
Train [118][2040/3239]	Time 0.244 (0.519)	Data Time 0.001 (0.019)	Loss 2.3750 (2.3474)	Entropy 0.53054 (0.53046)	Top-1 acc 66.797 (67.589)	Top-5 acc 86.328 (86.308)	lr 0.00002
Train [118][2050/3239]	Time 0.232 (0.518)	Data Time 0.001 (0.019)	Loss 2.4106 (2.3476)	Entropy 0.53035 (0.53046)	Top-1 acc 64.062 (67.583)	Top-5 acc 83.984 (86.303)	lr 0.00002
Train [118][2060/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.019)	Loss 2.3453 (2.3474)	Entropy 0.53029 (0.53046)	Top-1 acc 63.672 (67.586)	Top-5 acc 85.547 (86.309)	lr 0.00002
Train [118][2070/3239]	Time 0.342 (0.518)	Data Time 0.001 (0.019)	Loss 2.0841 (2.3470)	Entropy 0.53005 (0.53046)	Top-1 acc 75.000 (67.591)	Top-5 acc 91.406 (86.313)	lr 0.00002
Train [118][2080/3239]	Time 0.238 (0.517)	Data Time 0.001 (0.019)	Loss 2.4386 (2.3470)	Entropy 0.52980 (0.53045)	Top-1 acc 61.719 (67.589)	Top-5 acc 85.547 (86.315)	lr 0.00002
Train [118][2090/3239]	Time 0.225 (0.517)	Data Time 0.001 (0.019)	Loss 2.4303 (2.3470)	Entropy 0.53001 (0.53045)	Top-1 acc 67.188 (67.591)	Top-5 acc 86.328 (86.318)	lr 0.00002
Train [118][2100/3239]	Time 0.342 (0.540)	Data Time 0.035 (0.019)	Loss 2.3252 (2.3472)	Entropy 0.52983 (0.53045)	Top-1 acc 71.094 (67.581)	Top-5 acc 85.156 (86.318)	lr 0.00002
Train [118][2110/3239]	Time 0.238 (0.540)	Data Time 0.002 (0.019)	Loss 2.2670 (2.3469)	Entropy 0.52976 (0.53045)	Top-1 acc 70.312 (67.589)	Top-5 acc 88.672 (86.326)	lr 0.00002
Train [118][2120/3239]	Time 0.237 (0.539)	Data Time 0.001 (0.018)	Loss 2.3349 (2.3470)	Entropy 0.52971 (0.53044)	Top-1 acc 69.922 (67.584)	Top-5 acc 86.719 (86.326)	lr 0.00002
Train [118][2130/3239]	Time 0.227 (0.538)	Data Time 0.001 (0.018)	Loss 2.2797 (2.3471)	Entropy 0.53011 (0.53044)	Top-1 acc 68.359 (67.583)	Top-5 acc 88.672 (86.324)	lr 0.00002
Train [118][2140/3239]	Time 0.238 (0.538)	Data Time 0.002 (0.018)	Loss 2.1499 (2.3469)	Entropy 0.53060 (0.53044)	Top-1 acc 71.875 (67.589)	Top-5 acc 89.844 (86.328)	lr 0.00002
Train [118][2150/3239]	Time 0.248 (0.538)	Data Time 0.002 (0.018)	Loss 2.2583 (2.3468)	Entropy 0.53105 (0.53044)	Top-1 acc 68.359 (67.588)	Top-5 acc 87.891 (86.326)	lr 0.00002
Train [118][2160/3239]	Time 0.311 (0.537)	Data Time 0.001 (0.018)	Loss 2.3104 (2.3466)	Entropy 0.53072 (0.53044)	Top-1 acc 67.578 (67.593)	Top-5 acc 87.891 (86.330)	lr 0.00002
Train [118][2170/3239]	Time 0.308 (0.537)	Data Time 0.002 (0.018)	Loss 2.3217 (2.3465)	Entropy 0.53065 (0.53044)	Top-1 acc 69.531 (67.596)	Top-5 acc 87.109 (86.333)	lr 0.00002
Train [118][2180/3239]	Time 0.238 (0.536)	Data Time 0.001 (0.018)	Loss 2.2725 (2.3462)	Entropy 0.53070 (0.53045)	Top-1 acc 70.312 (67.606)	Top-5 acc 89.844 (86.339)	lr 0.00002
Train [118][2190/3239]	Time 0.257 (0.536)	Data Time 0.001 (0.018)	Loss 2.3396 (2.3462)	Entropy 0.53078 (0.53045)	Top-1 acc 67.188 (67.603)	Top-5 acc 86.328 (86.337)	lr 0.00002
Train [118][2200/3239]	Time 0.230 (0.535)	Data Time 0.001 (0.018)	Loss 2.3928 (2.3459)	Entropy 0.53062 (0.53045)	Top-1 acc 64.844 (67.612)	Top-5 acc 86.328 (86.344)	lr 0.00002
Train [118][2210/3239]	Time 0.267 (0.535)	Data Time 0.001 (0.018)	Loss 2.2186 (2.3458)	Entropy 0.53068 (0.53045)	Top-1 acc 72.656 (67.618)	Top-5 acc 89.062 (86.344)	lr 0.00002
Train [118][2220/3239]	Time 0.231 (0.534)	Data Time 0.001 (0.018)	Loss 2.2393 (2.3457)	Entropy 0.53083 (0.53045)	Top-1 acc 69.922 (67.625)	Top-5 acc 87.891 (86.349)	lr 0.00002
Train [118][2230/3239]	Time 0.341 (0.534)	Data Time 0.001 (0.018)	Loss 2.3073 (2.3454)	Entropy 0.53084 (0.53045)	Top-1 acc 68.750 (67.630)	Top-5 acc 85.547 (86.352)	lr 0.00002
Train [118][2240/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.018)	Loss 2.4008 (2.3455)	Entropy 0.53108 (0.53045)	Top-1 acc 67.578 (67.625)	Top-5 acc 86.719 (86.353)	lr 0.00002
Train [118][2250/3239]	Time 0.231 (0.533)	Data Time 0.001 (0.017)	Loss 2.3396 (2.3455)	Entropy 0.53124 (0.53046)	Top-1 acc 66.797 (67.626)	Top-5 acc 86.719 (86.355)	lr 0.00002
Train [118][2260/3239]	Time 0.318 (0.532)	Data Time 0.002 (0.017)	Loss 2.4691 (2.3456)	Entropy 0.53127 (0.53046)	Top-1 acc 65.625 (67.626)	Top-5 acc 84.375 (86.355)	lr 0.00002
Train [118][2270/3239]	Time 0.260 (0.532)	Data Time 0.001 (0.017)	Loss 2.3850 (2.3457)	Entropy 0.53139 (0.53047)	Top-1 acc 71.094 (67.622)	Top-5 acc 83.984 (86.350)	lr 0.00002
Train [118][2280/3239]	Time 0.249 (0.532)	Data Time 0.001 (0.017)	Loss 2.4723 (2.3456)	Entropy 0.53117 (0.53047)	Top-1 acc 61.719 (67.623)	Top-5 acc 84.375 (86.356)	lr 0.00002
Train [118][2290/3239]	Time 0.223 (0.531)	Data Time 0.001 (0.017)	Loss 2.5604 (2.3463)	Entropy 0.53101 (0.53047)	Top-1 acc 58.594 (67.605)	Top-5 acc 81.250 (86.349)	lr 0.00002
Train [118][2300/3239]	Time 0.349 (0.531)	Data Time 0.001 (0.017)	Loss 2.3550 (2.3463)	Entropy 0.53093 (0.53047)	Top-1 acc 66.016 (67.602)	Top-5 acc 87.109 (86.347)	lr 0.00002
Train [118][2310/3239]	Time 0.229 (0.530)	Data Time 0.001 (0.017)	Loss 2.2546 (2.3463)	Entropy 0.53084 (0.53048)	Top-1 acc 71.484 (67.608)	Top-5 acc 87.500 (86.347)	lr 0.00002
Train [118][2320/3239]	Time 0.233 (0.530)	Data Time 0.001 (0.017)	Loss 2.2809 (2.3462)	Entropy 0.53081 (0.53048)	Top-1 acc 68.750 (67.610)	Top-5 acc 88.672 (86.344)	lr 0.00002
Train [118][2330/3239]	Time 0.234 (0.529)	Data Time 0.001 (0.017)	Loss 2.2864 (2.3465)	Entropy 0.53103 (0.53048)	Top-1 acc 70.703 (67.601)	Top-5 acc 85.547 (86.339)	lr 0.00002
Train [118][2340/3239]	Time 0.230 (0.528)	Data Time 0.001 (0.017)	Loss 2.1579 (2.3465)	Entropy 0.53090 (0.53048)	Top-1 acc 69.922 (67.597)	Top-5 acc 87.500 (86.336)	lr 0.00002
Train [118][2350/3239]	Time 0.261 (0.528)	Data Time 0.001 (0.017)	Loss 2.2810 (2.3466)	Entropy 0.53117 (0.53048)	Top-1 acc 69.531 (67.594)	Top-5 acc 86.719 (86.339)	lr 0.00002
Train [118][2360/3239]	Time 0.225 (0.528)	Data Time 0.001 (0.017)	Loss 2.3245 (2.3464)	Entropy 0.53144 (0.53049)	Top-1 acc 70.312 (67.601)	Top-5 acc 86.328 (86.343)	lr 0.00002
Train [118][2370/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.017)	Loss 2.2551 (2.3464)	Entropy 0.53149 (0.53049)	Top-1 acc 72.266 (67.599)	Top-5 acc 89.062 (86.343)	lr 0.00002
Train [118][2380/3239]	Time 0.284 (0.527)	Data Time 0.001 (0.017)	Loss 2.2962 (2.3462)	Entropy 0.53153 (0.53050)	Top-1 acc 70.703 (67.605)	Top-5 acc 86.719 (86.346)	lr 0.00002
Train [118][2390/3239]	Time 0.343 (0.526)	Data Time 0.001 (0.017)	Loss 2.6311 (2.3463)	Entropy 0.53126 (0.53050)	Top-1 acc 61.328 (67.608)	Top-5 acc 81.250 (86.342)	lr 0.00002
Train [118][2400/3239]	Time 0.226 (0.526)	Data Time 0.001 (0.016)	Loss 2.3686 (2.3466)	Entropy 0.53115 (0.53050)	Top-1 acc 66.797 (67.598)	Top-5 acc 85.938 (86.337)	lr 0.00002
Train [118][2410/3239]	Time 0.256 (0.526)	Data Time 0.001 (0.016)	Loss 2.4237 (2.3466)	Entropy 0.53114 (0.53050)	Top-1 acc 66.797 (67.600)	Top-5 acc 82.422 (86.335)	lr 0.00002
Train [118][2420/3239]	Time 0.232 (0.525)	Data Time 0.001 (0.016)	Loss 2.2489 (2.3466)	Entropy 0.53103 (0.53051)	Top-1 acc 65.625 (67.600)	Top-5 acc 88.281 (86.336)	lr 0.00002
Train [118][2430/3239]	Time 0.232 (0.525)	Data Time 0.001 (0.016)	Loss 2.4045 (2.3465)	Entropy 0.53091 (0.53051)	Top-1 acc 67.969 (67.602)	Top-5 acc 85.938 (86.335)	lr 0.00002
Train [118][2440/3239]	Time 0.221 (0.524)	Data Time 0.001 (0.016)	Loss 2.7655 (2.3466)	Entropy 0.53112 (0.53051)	Top-1 acc 58.594 (67.598)	Top-5 acc 78.906 (86.333)	lr 0.00002
Train [118][2450/3239]	Time 0.234 (0.524)	Data Time 0.001 (0.016)	Loss 2.3622 (2.3465)	Entropy 0.53132 (0.53051)	Top-1 acc 70.312 (67.606)	Top-5 acc 82.812 (86.334)	lr 0.00002
Train [118][2460/3239]	Time 0.332 (0.523)	Data Time 0.001 (0.016)	Loss 2.2990 (2.3465)	Entropy 0.53118 (0.53052)	Top-1 acc 67.578 (67.609)	Top-5 acc 88.281 (86.334)	lr 0.00002
Train [118][2470/3239]	Time 0.229 (0.523)	Data Time 0.001 (0.016)	Loss 2.2799 (2.3468)	Entropy 0.53120 (0.53052)	Top-1 acc 68.750 (67.596)	Top-5 acc 88.672 (86.327)	lr 0.00002
Train [118][2480/3239]	Time 0.233 (0.522)	Data Time 0.001 (0.016)	Loss 2.2555 (2.3467)	Entropy 0.53135 (0.53052)	Top-1 acc 71.484 (67.604)	Top-5 acc 88.281 (86.329)	lr 0.00002
Train [118][2490/3239]	Time 0.266 (0.522)	Data Time 0.001 (0.016)	Loss 2.4322 (2.3468)	Entropy 0.53109 (0.53053)	Top-1 acc 66.797 (67.602)	Top-5 acc 85.156 (86.326)	lr 0.00002
Train [118][2500/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.016)	Loss 2.3721 (2.3469)	Entropy 0.53138 (0.53053)	Top-1 acc 67.188 (67.601)	Top-5 acc 83.203 (86.324)	lr 0.00002
Train [118][2510/3239]	Time 0.270 (0.521)	Data Time 0.001 (0.016)	Loss 2.3672 (2.3468)	Entropy 0.53138 (0.53053)	Top-1 acc 69.531 (67.603)	Top-5 acc 85.156 (86.326)	lr 0.00002
Train [118][2520/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.016)	Loss 2.6997 (2.3470)	Entropy 0.53152 (0.53053)	Top-1 acc 59.766 (67.602)	Top-5 acc 80.078 (86.321)	lr 0.00002
Train [118][2530/3239]	Time 0.267 (0.520)	Data Time 0.001 (0.016)	Loss 2.2490 (2.3471)	Entropy 0.53145 (0.53054)	Top-1 acc 70.312 (67.598)	Top-5 acc 87.109 (86.320)	lr 0.00002
Train [118][2540/3239]	Time 0.230 (0.520)	Data Time 0.001 (0.016)	Loss 2.5716 (2.3471)	Entropy 0.53159 (0.53054)	Top-1 acc 64.062 (67.597)	Top-5 acc 85.156 (86.322)	lr 0.00002
Train [118][2550/3239]	Time 0.245 (0.519)	Data Time 0.001 (0.016)	Loss 2.7780 (2.3472)	Entropy 0.53207 (0.53055)	Top-1 acc 57.031 (67.592)	Top-5 acc 80.078 (86.318)	lr 0.00002
Train [118][2560/3239]	Time 0.232 (0.519)	Data Time 0.001 (0.016)	Loss 2.2476 (2.3472)	Entropy 0.53221 (0.53055)	Top-1 acc 71.094 (67.594)	Top-5 acc 86.719 (86.318)	lr 0.00002
Train [118][2570/3239]	Time 0.233 (0.519)	Data Time 0.001 (0.016)	Loss 2.2895 (2.3473)	Entropy 0.53213 (0.53056)	Top-1 acc 67.969 (67.587)	Top-5 acc 87.891 (86.317)	lr 0.00002
Train [118][2580/3239]	Time 0.234 (0.518)	Data Time 0.001 (0.015)	Loss 2.2248 (2.3471)	Entropy 0.53205 (0.53057)	Top-1 acc 71.094 (67.590)	Top-5 acc 88.672 (86.320)	lr 0.00002
Train [118][2590/3239]	Time 0.223 (0.518)	Data Time 0.001 (0.015)	Loss 2.1611 (2.3468)	Entropy 0.53223 (0.53057)	Top-1 acc 73.047 (67.598)	Top-5 acc 90.625 (86.326)	lr 0.00002
Train [118][2600/3239]	Time 0.239 (0.517)	Data Time 0.001 (0.015)	Loss 2.3242 (2.3469)	Entropy 0.53222 (0.53058)	Top-1 acc 66.406 (67.595)	Top-5 acc 86.719 (86.323)	lr 0.00002
Train [118][2610/3239]	Time 0.225 (0.517)	Data Time 0.001 (0.015)	Loss 2.2480 (2.3470)	Entropy 0.53249 (0.53059)	Top-1 acc 69.141 (67.596)	Top-5 acc 87.891 (86.321)	lr 0.00002
Train [118][2620/3239]	Time 0.322 (0.516)	Data Time 0.001 (0.015)	Loss 2.3973 (2.3470)	Entropy 0.53268 (0.53059)	Top-1 acc 68.359 (67.596)	Top-5 acc 85.156 (86.320)	lr 0.00002
Train [118][2630/3239]	Time 0.226 (0.516)	Data Time 0.001 (0.015)	Loss 2.3568 (2.3471)	Entropy 0.53292 (0.53060)	Top-1 acc 66.406 (67.596)	Top-5 acc 86.328 (86.319)	lr 0.00002
Train [118][2640/3239]	Time 0.236 (0.516)	Data Time 0.001 (0.015)	Loss 2.4232 (2.3472)	Entropy 0.53301 (0.53061)	Top-1 acc 64.844 (67.592)	Top-5 acc 85.156 (86.317)	lr 0.00002
Train [118][2650/3239]	Time 0.228 (0.515)	Data Time 0.001 (0.015)	Loss 2.4192 (2.3472)	Entropy 0.53262 (0.53062)	Top-1 acc 63.281 (67.594)	Top-5 acc 85.938 (86.316)	lr 0.00002
Train [118][2660/3239]	Time 0.224 (0.515)	Data Time 0.001 (0.015)	Loss 2.7578 (2.3473)	Entropy 0.53206 (0.53063)	Top-1 acc 55.859 (67.590)	Top-5 acc 80.859 (86.312)	lr 0.00002
Train [118][2670/3239]	Time 0.230 (0.515)	Data Time 0.002 (0.015)	Loss 2.4691 (2.3474)	Entropy 0.53213 (0.53063)	Top-1 acc 66.406 (67.591)	Top-5 acc 84.375 (86.309)	lr 0.00002
Train [118][2680/3239]	Time 0.221 (0.514)	Data Time 0.001 (0.015)	Loss 2.1486 (2.3477)	Entropy 0.53201 (0.53064)	Top-1 acc 69.531 (67.584)	Top-5 acc 89.062 (86.303)	lr 0.00002
Train [118][2690/3239]	Time 0.331 (0.514)	Data Time 0.001 (0.015)	Loss 2.3622 (2.3480)	Entropy 0.53187 (0.53064)	Top-1 acc 65.625 (67.572)	Top-5 acc 86.719 (86.297)	lr 0.00002
Train [118][2700/3239]	Time 0.225 (0.513)	Data Time 0.001 (0.015)	Loss 2.2893 (2.3479)	Entropy 0.53184 (0.53065)	Top-1 acc 68.750 (67.577)	Top-5 acc 87.109 (86.298)	lr 0.00002
Train [118][2710/3239]	Time 0.231 (0.513)	Data Time 0.001 (0.015)	Loss 2.1961 (2.3480)	Entropy 0.53194 (0.53065)	Top-1 acc 71.875 (67.569)	Top-5 acc 87.891 (86.297)	lr 0.00002
Train [118][2720/3239]	Time 0.237 (0.513)	Data Time 0.001 (0.015)	Loss 2.2984 (2.3481)	Entropy 0.53181 (0.53065)	Top-1 acc 69.531 (67.569)	Top-5 acc 87.500 (86.295)	lr 0.00002
Train [118][2730/3239]	Time 0.237 (0.512)	Data Time 0.001 (0.015)	Loss 2.3575 (2.3480)	Entropy 0.53180 (0.53066)	Top-1 acc 66.797 (67.564)	Top-5 acc 85.938 (86.297)	lr 0.00002
Train [118][2740/3239]	Time 0.219 (0.512)	Data Time 0.001 (0.015)	Loss 2.5222 (2.3479)	Entropy 0.53155 (0.53066)	Top-1 acc 60.547 (67.566)	Top-5 acc 83.984 (86.301)	lr 0.00002
Train [118][2750/3239]	Time 0.239 (0.511)	Data Time 0.001 (0.015)	Loss 2.2623 (2.3480)	Entropy 0.53145 (0.53067)	Top-1 acc 67.969 (67.564)	Top-5 acc 87.891 (86.300)	lr 0.00002
Train [118][2760/3239]	Time 0.356 (0.530)	Data Time 0.004 (0.015)	Loss 2.1394 (2.3482)	Entropy 0.53132 (0.53067)	Top-1 acc 70.312 (67.560)	Top-5 acc 90.625 (86.295)	lr 0.00002
Train [118][2770/3239]	Time 0.256 (0.530)	Data Time 0.002 (0.015)	Loss 2.3462 (2.3482)	Entropy 0.53134 (0.53067)	Top-1 acc 67.969 (67.563)	Top-5 acc 87.500 (86.294)	lr 0.00002
Train [118][2780/3239]	Time 0.334 (0.530)	Data Time 0.001 (0.014)	Loss 2.2580 (2.3485)	Entropy 0.53142 (0.53067)	Top-1 acc 69.922 (67.556)	Top-5 acc 86.328 (86.290)	lr 0.00002
Train [118][2790/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.014)	Loss 2.3987 (2.3486)	Entropy 0.53135 (0.53068)	Top-1 acc 66.797 (67.556)	Top-5 acc 85.156 (86.290)	lr 0.00002
Train [118][2800/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.014)	Loss 2.4505 (2.3488)	Entropy 0.53152 (0.53068)	Top-1 acc 62.500 (67.548)	Top-5 acc 85.156 (86.285)	lr 0.00002
Train [118][2810/3239]	Time 0.241 (0.528)	Data Time 0.001 (0.014)	Loss 2.4281 (2.3489)	Entropy 0.53162 (0.53068)	Top-1 acc 64.844 (67.544)	Top-5 acc 85.938 (86.288)	lr 0.00002
Train [118][2820/3239]	Time 0.247 (0.528)	Data Time 0.001 (0.014)	Loss 2.2484 (2.3489)	Entropy 0.53181 (0.53068)	Top-1 acc 71.875 (67.546)	Top-5 acc 86.719 (86.288)	lr 0.00002
Train [118][2830/3239]	Time 0.275 (0.528)	Data Time 0.003 (0.014)	Loss 2.4940 (2.3488)	Entropy 0.53147 (0.53069)	Top-1 acc 62.109 (67.551)	Top-5 acc 82.422 (86.291)	lr 0.00002
Train [118][2840/3239]	Time 0.276 (0.528)	Data Time 0.001 (0.014)	Loss 2.1353 (2.3484)	Entropy 0.53143 (0.53069)	Top-1 acc 71.484 (67.559)	Top-5 acc 90.234 (86.296)	lr 0.00002
Train [118][2850/3239]	Time 0.401 (0.527)	Data Time 0.002 (0.014)	Loss 2.0953 (2.3482)	Entropy 0.53148 (0.53069)	Top-1 acc 71.875 (67.565)	Top-5 acc 91.016 (86.301)	lr 0.00002
Train [118][2860/3239]	Time 0.254 (0.527)	Data Time 0.001 (0.014)	Loss 2.2631 (2.3480)	Entropy 0.53110 (0.53070)	Top-1 acc 68.359 (67.568)	Top-5 acc 87.891 (86.301)	lr 0.00002
Train [118][2870/3239]	Time 0.286 (0.527)	Data Time 0.002 (0.014)	Loss 2.2979 (2.3479)	Entropy 0.53126 (0.53070)	Top-1 acc 69.922 (67.573)	Top-5 acc 87.891 (86.304)	lr 0.00002
Train [118][2880/3239]	Time 0.294 (0.527)	Data Time 0.002 (0.014)	Loss 2.3316 (2.3479)	Entropy 0.53118 (0.53070)	Top-1 acc 66.406 (67.572)	Top-5 acc 87.500 (86.306)	lr 0.00002
Train [118][2890/3239]	Time 0.239 (0.527)	Data Time 0.001 (0.014)	Loss 2.8451 (2.3478)	Entropy 0.53114 (0.53070)	Top-1 acc 55.078 (67.573)	Top-5 acc 77.344 (86.307)	lr 0.00002
Train [118][2900/3239]	Time 0.234 (0.526)	Data Time 0.001 (0.014)	Loss 2.2223 (2.3478)	Entropy 0.53093 (0.53070)	Top-1 acc 75.391 (67.577)	Top-5 acc 88.281 (86.307)	lr 0.00002
Train [118][2910/3239]	Time 0.262 (0.526)	Data Time 0.001 (0.014)	Loss 2.4401 (2.3479)	Entropy 0.53070 (0.53070)	Top-1 acc 64.453 (67.572)	Top-5 acc 85.938 (86.305)	lr 0.00002
Train [118][2920/3239]	Time 0.305 (0.526)	Data Time 0.008 (0.014)	Loss 2.3398 (2.3478)	Entropy 0.53098 (0.53070)	Top-1 acc 65.234 (67.575)	Top-5 acc 88.281 (86.305)	lr 0.00002
Train [118][2930/3239]	Time 0.240 (0.525)	Data Time 0.001 (0.014)	Loss 2.6410 (2.3480)	Entropy 0.53132 (0.53070)	Top-1 acc 60.938 (67.571)	Top-5 acc 80.859 (86.300)	lr 0.00002
Train [118][2940/3239]	Time 0.352 (0.525)	Data Time 0.001 (0.014)	Loss 2.2589 (2.3482)	Entropy 0.53141 (0.53071)	Top-1 acc 71.484 (67.570)	Top-5 acc 89.062 (86.298)	lr 0.00002
Train [118][2950/3239]	Time 0.303 (0.525)	Data Time 0.002 (0.014)	Loss 2.6296 (2.3482)	Entropy 0.53127 (0.53071)	Top-1 acc 65.234 (67.572)	Top-5 acc 82.031 (86.297)	lr 0.00002
Train [118][2960/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.014)	Loss 2.3237 (2.3482)	Entropy 0.53078 (0.53071)	Top-1 acc 69.531 (67.574)	Top-5 acc 87.109 (86.298)	lr 0.00002
Train [118][2970/3239]	Time 0.239 (0.524)	Data Time 0.001 (0.014)	Loss 2.2881 (2.3479)	Entropy 0.53096 (0.53071)	Top-1 acc 69.141 (67.585)	Top-5 acc 87.500 (86.305)	lr 0.00002
Train [118][2980/3239]	Time 0.247 (0.524)	Data Time 0.002 (0.014)	Loss 2.5742 (2.3480)	Entropy 0.53075 (0.53071)	Top-1 acc 63.281 (67.583)	Top-5 acc 82.422 (86.302)	lr 0.00002
Train [118][2990/3239]	Time 0.287 (0.524)	Data Time 0.002 (0.014)	Loss 2.2590 (2.3482)	Entropy 0.53093 (0.53071)	Top-1 acc 75.000 (67.582)	Top-5 acc 87.500 (86.297)	lr 0.00002
Train [118][3000/3239]	Time 0.229 (0.523)	Data Time 0.001 (0.014)	Loss 2.2558 (2.3483)	Entropy 0.53123 (0.53071)	Top-1 acc 68.359 (67.582)	Top-5 acc 86.719 (86.293)	lr 0.00002
Train [118][3010/3239]	Time 0.365 (0.523)	Data Time 0.001 (0.014)	Loss 2.4184 (2.3484)	Entropy 0.53138 (0.53071)	Top-1 acc 64.062 (67.582)	Top-5 acc 85.156 (86.289)	lr 0.00002
Train [118][3020/3239]	Time 0.235 (0.523)	Data Time 0.001 (0.013)	Loss 2.6230 (2.3483)	Entropy 0.53111 (0.53072)	Top-1 acc 57.031 (67.583)	Top-5 acc 82.812 (86.292)	lr 0.00002
Train [118][3030/3239]	Time 0.285 (0.523)	Data Time 0.001 (0.013)	Loss 2.3451 (2.3483)	Entropy 0.53120 (0.53072)	Top-1 acc 65.625 (67.583)	Top-5 acc 85.938 (86.292)	lr 0.00002
Train [118][3040/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.013)	Loss 2.6700 (2.3486)	Entropy 0.53128 (0.53072)	Top-1 acc 58.203 (67.576)	Top-5 acc 82.031 (86.288)	lr 0.00002
Train [118][3050/3239]	Time 0.257 (0.522)	Data Time 0.001 (0.013)	Loss 2.3507 (2.3486)	Entropy 0.53129 (0.53072)	Top-1 acc 67.969 (67.573)	Top-5 acc 85.547 (86.286)	lr 0.00002
Train [118][3060/3239]	Time 0.293 (0.522)	Data Time 0.003 (0.013)	Loss 2.4555 (2.3488)	Entropy 0.53113 (0.53072)	Top-1 acc 66.406 (67.569)	Top-5 acc 84.766 (86.285)	lr 0.00002
Train [118][3070/3239]	Time 0.240 (0.521)	Data Time 0.001 (0.013)	Loss 2.3278 (2.3488)	Entropy 0.53096 (0.53072)	Top-1 acc 66.797 (67.567)	Top-5 acc 87.500 (86.287)	lr 0.00002
Train [118][3080/3239]	Time 0.276 (0.521)	Data Time 0.001 (0.013)	Loss 2.4155 (2.3487)	Entropy 0.53081 (0.53072)	Top-1 acc 68.359 (67.571)	Top-5 acc 83.594 (86.286)	lr 0.00002
Train [118][3090/3239]	Time 0.227 (0.521)	Data Time 0.001 (0.013)	Loss 2.4007 (2.3486)	Entropy 0.53089 (0.53072)	Top-1 acc 67.969 (67.577)	Top-5 acc 85.547 (86.291)	lr 0.00002
Train [118][3100/3239]	Time 0.416 (0.521)	Data Time 0.001 (0.013)	Loss 2.5172 (2.3484)	Entropy 0.53110 (0.53073)	Top-1 acc 67.969 (67.587)	Top-5 acc 85.156 (86.293)	lr 0.00002
Train [118][3110/3239]	Time 0.244 (0.520)	Data Time 0.001 (0.013)	Loss 3.0548 (2.3487)	Entropy 0.53099 (0.53073)	Top-1 acc 50.781 (67.576)	Top-5 acc 73.828 (86.287)	lr 0.00002
Train [118][3120/3239]	Time 0.300 (0.520)	Data Time 0.002 (0.013)	Loss 2.2467 (2.3486)	Entropy 0.53121 (0.53073)	Top-1 acc 69.922 (67.577)	Top-5 acc 87.891 (86.291)	lr 0.00002
Train [118][3130/3239]	Time 0.263 (0.520)	Data Time 0.001 (0.013)	Loss 2.3556 (2.3489)	Entropy 0.53127 (0.53073)	Top-1 acc 67.969 (67.572)	Top-5 acc 85.938 (86.286)	lr 0.00002
Train [118][3140/3239]	Time 0.240 (0.520)	Data Time 0.001 (0.013)	Loss 2.5214 (2.3489)	Entropy 0.53099 (0.53073)	Top-1 acc 57.812 (67.571)	Top-5 acc 83.984 (86.286)	lr 0.00002
Train [118][3150/3239]	Time 0.356 (0.520)	Data Time 0.002 (0.013)	Loss 2.4722 (2.3491)	Entropy 0.53155 (0.53073)	Top-1 acc 63.281 (67.567)	Top-5 acc 83.984 (86.282)	lr 0.00002
Train [118][3160/3239]	Time 0.237 (0.520)	Data Time 0.001 (0.013)	Loss 2.3496 (2.3488)	Entropy 0.53169 (0.53074)	Top-1 acc 67.188 (67.576)	Top-5 acc 85.156 (86.285)	lr 0.00002
Train [118][3170/3239]	Time 0.358 (0.520)	Data Time 0.001 (0.013)	Loss 2.2719 (2.3487)	Entropy 0.53172 (0.53074)	Top-1 acc 73.828 (67.579)	Top-5 acc 87.109 (86.287)	lr 0.00002
Train [118][3180/3239]	Time 0.239 (0.519)	Data Time 0.000 (0.013)	Loss 2.1961 (2.3485)	Entropy 0.53181 (0.53074)	Top-1 acc 71.875 (67.587)	Top-5 acc 85.938 (86.289)	lr 0.00002
Train [118][3190/3239]	Time 0.236 (0.519)	Data Time 0.000 (0.013)	Loss 2.2497 (2.3485)	Entropy 0.53168 (0.53075)	Top-1 acc 69.531 (67.588)	Top-5 acc 88.281 (86.289)	lr 0.00002
Train [118][3200/3239]	Time 0.228 (0.519)	Data Time 0.000 (0.013)	Loss 2.2254 (2.3486)	Entropy 0.53178 (0.53075)	Top-1 acc 67.969 (67.586)	Top-5 acc 86.328 (86.288)	lr 0.00002
Train [118][3210/3239]	Time 0.225 (0.518)	Data Time 0.000 (0.013)	Loss 2.2543 (2.3484)	Entropy 0.53184 (0.53075)	Top-1 acc 70.312 (67.588)	Top-5 acc 87.500 (86.289)	lr 0.00002
Train [118][3220/3239]	Time 0.234 (0.518)	Data Time 0.000 (0.013)	Loss 2.2720 (2.3484)	Entropy 0.53177 (0.53076)	Top-1 acc 67.969 (67.590)	Top-5 acc 89.844 (86.289)	lr 0.00002
Train [118][3230/3239]	Time 0.229 (0.517)	Data Time 0.000 (0.013)	Loss 2.3328 (2.3484)	Entropy 0.53198 (0.53076)	Top-1 acc 67.969 (67.587)	Top-5 acc 86.328 (86.290)	lr 0.00002
Train [118][3239/3239]	Time 0.986 (0.517)	Data Time 0.000 (0.013)	Loss 2.7892 (2.3484)	Entropy 0.53214 (0.53076)	Top-1 acc 61.728 (67.588)	Top-5 acc 75.309 (86.288)	lr 0.00002
==========Valid [118/120]	loss 1.169	top-1 acc 73.053 (73.178)	top-5 acc 90.617	Train top-1 67.588	top-5 86.288	Entropy 0.53214	Latency-None: 0.000ms	Flops: 539.00M
Train [119][0/3239]	Time 40.770 (40.770)	Data Time 39.310 (39.310)	Loss 2.4020 (2.4020)	Entropy 0.53198 (0.53198)	Top-1 acc 69.531 (69.531)	Top-5 acc 85.938 (85.938)	lr 0.00002
Train [119][10/3239]	Time 0.282 (4.228)	Data Time 0.002 (3.596)	Loss 2.3818 (2.3806)	Entropy 0.53207 (0.53203)	Top-1 acc 66.016 (67.188)	Top-5 acc 88.281 (86.435)	lr 0.00002
Train [119][20/3239]	Time 0.242 (2.419)	Data Time 0.001 (1.885)	Loss 2.2774 (2.3407)	Entropy 0.53209 (0.53209)	Top-1 acc 71.875 (68.099)	Top-5 acc 87.500 (86.626)	lr 0.00002
Train [119][30/3239]	Time 0.250 (1.778)	Data Time 0.001 (1.277)	Loss 2.1870 (2.3321)	Entropy 0.53195 (0.53211)	Top-1 acc 71.484 (67.956)	Top-5 acc 89.453 (86.668)	lr 0.00002
Train [119][40/3239]	Time 0.245 (1.447)	Data Time 0.001 (0.966)	Loss 2.3737 (2.3459)	Entropy 0.53167 (0.53204)	Top-1 acc 69.531 (67.759)	Top-5 acc 87.500 (86.538)	lr 0.00002
Train [119][50/3239]	Time 0.239 (1.249)	Data Time 0.001 (0.777)	Loss 2.3266 (2.3453)	Entropy 0.53121 (0.53193)	Top-1 acc 70.312 (67.961)	Top-5 acc 85.938 (86.451)	lr 0.00002
Train [119][60/3239]	Time 0.242 (1.113)	Data Time 0.002 (0.650)	Loss 2.0846 (2.3354)	Entropy 0.53093 (0.53180)	Top-1 acc 76.953 (68.257)	Top-5 acc 89.844 (86.629)	lr 0.00002
Train [119][70/3239]	Time 0.318 (1.016)	Data Time 0.001 (0.559)	Loss 2.4238 (2.3402)	Entropy 0.53098 (0.53168)	Top-1 acc 64.062 (67.875)	Top-5 acc 85.547 (86.543)	lr 0.00002
Train [119][80/3239]	Time 0.230 (0.941)	Data Time 0.001 (0.490)	Loss 2.2225 (2.3528)	Entropy 0.53108 (0.53160)	Top-1 acc 72.656 (67.646)	Top-5 acc 87.891 (86.347)	lr 0.00002
Train [119][90/3239]	Time 0.232 (0.880)	Data Time 0.001 (0.436)	Loss 2.4158 (2.3581)	Entropy 0.53132 (0.53156)	Top-1 acc 61.328 (67.363)	Top-5 acc 85.547 (86.307)	lr 0.00002
Train [119][100/3239]	Time 0.243 (0.835)	Data Time 0.001 (0.393)	Loss 2.3620 (2.3633)	Entropy 0.53193 (0.53155)	Top-1 acc 67.969 (67.195)	Top-5 acc 83.594 (86.173)	lr 0.00002
Train [119][110/3239]	Time 0.229 (0.796)	Data Time 0.001 (0.358)	Loss 2.4611 (2.3667)	Entropy 0.53160 (0.53157)	Top-1 acc 66.406 (67.082)	Top-5 acc 83.203 (86.099)	lr 0.00002
Train [119][120/3239]	Time 0.227 (0.763)	Data Time 0.001 (0.328)	Loss 2.1916 (2.3597)	Entropy 0.53151 (0.53157)	Top-1 acc 71.875 (67.239)	Top-5 acc 89.844 (86.163)	lr 0.00002
Train [119][130/3239]	Time 0.245 (0.737)	Data Time 0.001 (0.303)	Loss 2.2481 (2.3673)	Entropy 0.53148 (0.53157)	Top-1 acc 72.656 (67.113)	Top-5 acc 88.672 (86.033)	lr 0.00002
Train [119][140/3239]	Time 0.236 (0.714)	Data Time 0.001 (0.282)	Loss 2.1409 (2.3708)	Entropy 0.53144 (0.53156)	Top-1 acc 72.266 (67.010)	Top-5 acc 91.016 (85.982)	lr 0.00002
Train [119][150/3239]	Time 0.213 (0.694)	Data Time 0.001 (0.263)	Loss 2.5313 (2.3668)	Entropy 0.53116 (0.53154)	Top-1 acc 64.062 (67.128)	Top-5 acc 82.812 (86.036)	lr 0.00002
Train [119][160/3239]	Time 0.314 (0.676)	Data Time 0.001 (0.247)	Loss 2.4017 (2.3665)	Entropy 0.53120 (0.53152)	Top-1 acc 66.797 (67.056)	Top-5 acc 84.766 (86.076)	lr 0.00002
Train [119][170/3239]	Time 0.288 (0.957)	Data Time 0.004 (0.233)	Loss 2.6682 (2.3636)	Entropy 0.53122 (0.53150)	Top-1 acc 59.375 (67.133)	Top-5 acc 79.688 (86.093)	lr 0.00002
Train [119][180/3239]	Time 0.237 (0.929)	Data Time 0.002 (0.220)	Loss 2.4331 (2.3648)	Entropy 0.53127 (0.53148)	Top-1 acc 64.062 (67.093)	Top-5 acc 84.375 (86.069)	lr 0.00002
Train [119][190/3239]	Time 0.236 (0.904)	Data Time 0.001 (0.209)	Loss 2.4587 (2.3604)	Entropy 0.53110 (0.53147)	Top-1 acc 64.062 (67.188)	Top-5 acc 84.375 (86.160)	lr 0.00002
Train [119][200/3239]	Time 0.228 (0.880)	Data Time 0.001 (0.199)	Loss 2.1892 (2.3615)	Entropy 0.53134 (0.53145)	Top-1 acc 70.312 (67.149)	Top-5 acc 88.281 (86.122)	lr 0.00002
Train [119][210/3239]	Time 0.227 (0.858)	Data Time 0.001 (0.189)	Loss 2.4322 (2.3590)	Entropy 0.53135 (0.53145)	Top-1 acc 66.016 (67.163)	Top-5 acc 83.203 (86.178)	lr 0.00002
Train [119][220/3239]	Time 0.231 (0.838)	Data Time 0.001 (0.181)	Loss 2.2490 (2.3567)	Entropy 0.53074 (0.53144)	Top-1 acc 72.266 (67.281)	Top-5 acc 86.328 (86.196)	lr 0.00002
Train [119][230/3239]	Time 0.317 (0.819)	Data Time 0.001 (0.173)	Loss 2.3957 (2.3590)	Entropy 0.53091 (0.53141)	Top-1 acc 66.406 (67.270)	Top-5 acc 85.938 (86.156)	lr 0.00002
Train [119][240/3239]	Time 0.228 (0.802)	Data Time 0.001 (0.166)	Loss 2.2108 (2.3586)	Entropy 0.53121 (0.53139)	Top-1 acc 68.359 (67.244)	Top-5 acc 87.500 (86.130)	lr 0.00002
Train [119][250/3239]	Time 0.225 (0.786)	Data Time 0.001 (0.159)	Loss 2.5438 (2.3588)	Entropy 0.53121 (0.53139)	Top-1 acc 66.797 (67.270)	Top-5 acc 81.250 (86.126)	lr 0.00002
Train [119][260/3239]	Time 0.278 (0.773)	Data Time 0.003 (0.153)	Loss 2.2767 (2.3612)	Entropy 0.53118 (0.53138)	Top-1 acc 67.578 (67.214)	Top-5 acc 86.719 (86.105)	lr 0.00002
Train [119][270/3239]	Time 0.240 (0.760)	Data Time 0.001 (0.148)	Loss 2.2275 (2.3628)	Entropy 0.53112 (0.53138)	Top-1 acc 73.828 (67.205)	Top-5 acc 87.500 (86.086)	lr 0.00002
Train [119][280/3239]	Time 0.265 (0.749)	Data Time 0.001 (0.143)	Loss 2.4714 (2.3629)	Entropy 0.53141 (0.53137)	Top-1 acc 65.234 (67.178)	Top-5 acc 82.031 (86.065)	lr 0.00002
Train [119][290/3239]	Time 0.252 (0.738)	Data Time 0.001 (0.138)	Loss 2.0978 (2.3615)	Entropy 0.53145 (0.53138)	Top-1 acc 74.219 (67.208)	Top-5 acc 89.844 (86.112)	lr 0.00002
Train [119][300/3239]	Time 0.257 (0.728)	Data Time 0.001 (0.133)	Loss 2.3775 (2.3614)	Entropy 0.53185 (0.53139)	Top-1 acc 64.453 (67.230)	Top-5 acc 84.766 (86.120)	lr 0.00002
Train [119][310/3239]	Time 0.237 (0.718)	Data Time 0.001 (0.129)	Loss 2.4149 (2.3589)	Entropy 0.53198 (0.53140)	Top-1 acc 66.406 (67.268)	Top-5 acc 84.766 (86.146)	lr 0.00002
Train [119][320/3239]	Time 0.517 (0.710)	Data Time 0.026 (0.125)	Loss 2.3332 (2.3593)	Entropy 0.53191 (0.53142)	Top-1 acc 68.750 (67.256)	Top-5 acc 87.500 (86.141)	lr 0.00002
Train [119][330/3239]	Time 0.230 (0.701)	Data Time 0.001 (0.121)	Loss 2.1273 (2.3600)	Entropy 0.53199 (0.53144)	Top-1 acc 71.875 (67.236)	Top-5 acc 89.844 (86.118)	lr 0.00002
Train [119][340/3239]	Time 0.231 (0.693)	Data Time 0.001 (0.118)	Loss 2.4560 (2.3576)	Entropy 0.53215 (0.53145)	Top-1 acc 66.016 (67.299)	Top-5 acc 84.375 (86.155)	lr 0.00002
Train [119][350/3239]	Time 0.233 (0.685)	Data Time 0.001 (0.115)	Loss 2.3969 (2.3553)	Entropy 0.53188 (0.53147)	Top-1 acc 65.234 (67.329)	Top-5 acc 85.547 (86.202)	lr 0.00002
Train [119][360/3239]	Time 0.236 (0.678)	Data Time 0.001 (0.112)	Loss 2.3221 (2.3565)	Entropy 0.53181 (0.53148)	Top-1 acc 65.625 (67.296)	Top-5 acc 88.281 (86.197)	lr 0.00002
Train [119][370/3239]	Time 0.227 (0.671)	Data Time 0.001 (0.109)	Loss 2.3440 (2.3553)	Entropy 0.53135 (0.53148)	Top-1 acc 66.016 (67.344)	Top-5 acc 87.500 (86.221)	lr 0.00002
Train [119][380/3239]	Time 0.242 (0.665)	Data Time 0.001 (0.106)	Loss 2.2334 (2.3545)	Entropy 0.53136 (0.53148)	Top-1 acc 70.703 (67.349)	Top-5 acc 89.062 (86.235)	lr 0.00002
Train [119][390/3239]	Time 0.346 (0.659)	Data Time 0.001 (0.103)	Loss 2.0967 (2.3527)	Entropy 0.53142 (0.53148)	Top-1 acc 73.438 (67.386)	Top-5 acc 90.625 (86.279)	lr 0.00002
Train [119][400/3239]	Time 0.236 (0.653)	Data Time 0.001 (0.101)	Loss 2.2193 (2.3540)	Entropy 0.53137 (0.53148)	Top-1 acc 72.656 (67.358)	Top-5 acc 88.672 (86.241)	lr 0.00002
Train [119][410/3239]	Time 0.368 (0.650)	Data Time 0.002 (0.098)	Loss 2.1953 (2.3528)	Entropy 0.53164 (0.53147)	Top-1 acc 73.438 (67.363)	Top-5 acc 89.844 (86.263)	lr 0.00002
Train [119][420/3239]	Time 0.239 (0.649)	Data Time 0.001 (0.096)	Loss 2.3776 (2.3522)	Entropy 0.53185 (0.53148)	Top-1 acc 67.969 (67.401)	Top-5 acc 86.719 (86.269)	lr 0.00001
Train [119][430/3239]	Time 0.245 (0.644)	Data Time 0.001 (0.094)	Loss 2.4330 (2.3523)	Entropy 0.53191 (0.53149)	Top-1 acc 67.578 (67.411)	Top-5 acc 83.594 (86.266)	lr 0.00001
Train [119][440/3239]	Time 0.244 (0.640)	Data Time 0.001 (0.092)	Loss 2.1262 (2.3514)	Entropy 0.53216 (0.53150)	Top-1 acc 73.047 (67.423)	Top-5 acc 90.625 (86.292)	lr 0.00001
Train [119][450/3239]	Time 0.238 (0.635)	Data Time 0.001 (0.090)	Loss 2.1461 (2.3522)	Entropy 0.53194 (0.53151)	Top-1 acc 72.656 (67.407)	Top-5 acc 89.844 (86.275)	lr 0.00001
Train [119][460/3239]	Time 0.268 (0.631)	Data Time 0.001 (0.088)	Loss 2.2292 (2.3524)	Entropy 0.53188 (0.53152)	Top-1 acc 68.750 (67.415)	Top-5 acc 89.062 (86.275)	lr 0.00001
Train [119][470/3239]	Time 0.243 (0.626)	Data Time 0.001 (0.086)	Loss 2.0844 (2.3526)	Entropy 0.53190 (0.53153)	Top-1 acc 73.047 (67.401)	Top-5 acc 91.016 (86.267)	lr 0.00001
Train [119][480/3239]	Time 0.265 (0.622)	Data Time 0.001 (0.084)	Loss 2.4282 (2.3519)	Entropy 0.53213 (0.53154)	Top-1 acc 65.625 (67.398)	Top-5 acc 86.328 (86.294)	lr 0.00001
Train [119][490/3239]	Time 0.233 (0.618)	Data Time 0.001 (0.082)	Loss 2.7126 (2.3518)	Entropy 0.53234 (0.53155)	Top-1 acc 56.641 (67.400)	Top-5 acc 78.906 (86.271)	lr 0.00001
Train [119][500/3239]	Time 0.260 (0.614)	Data Time 0.001 (0.081)	Loss 2.2167 (2.3528)	Entropy 0.53222 (0.53157)	Top-1 acc 71.484 (67.394)	Top-5 acc 88.281 (86.258)	lr 0.00001
Train [119][510/3239]	Time 0.232 (0.611)	Data Time 0.001 (0.079)	Loss 2.5733 (2.3530)	Entropy 0.53248 (0.53158)	Top-1 acc 60.156 (67.393)	Top-5 acc 83.594 (86.246)	lr 0.00001
Train [119][520/3239]	Time 0.225 (0.607)	Data Time 0.001 (0.078)	Loss 2.3725 (2.3539)	Entropy 0.53220 (0.53160)	Top-1 acc 66.016 (67.373)	Top-5 acc 87.109 (86.236)	lr 0.00001
Train [119][530/3239]	Time 0.236 (0.603)	Data Time 0.001 (0.076)	Loss 2.2764 (2.3531)	Entropy 0.53253 (0.53161)	Top-1 acc 69.531 (67.385)	Top-5 acc 87.109 (86.255)	lr 0.00001
Train [119][540/3239]	Time 0.267 (0.600)	Data Time 0.002 (0.075)	Loss 2.3112 (2.3520)	Entropy 0.53254 (0.53163)	Top-1 acc 69.141 (67.421)	Top-5 acc 85.938 (86.269)	lr 0.00001
Train [119][550/3239]	Time 0.368 (0.597)	Data Time 0.001 (0.074)	Loss 2.3686 (2.3514)	Entropy 0.53263 (0.53164)	Top-1 acc 69.531 (67.434)	Top-5 acc 87.109 (86.288)	lr 0.00001
Train [119][560/3239]	Time 0.241 (0.594)	Data Time 0.001 (0.072)	Loss 2.5730 (2.3519)	Entropy 0.53261 (0.53166)	Top-1 acc 63.672 (67.431)	Top-5 acc 82.812 (86.277)	lr 0.00001
Train [119][570/3239]	Time 0.234 (0.591)	Data Time 0.001 (0.071)	Loss 2.3619 (2.3511)	Entropy 0.53272 (0.53168)	Top-1 acc 69.922 (67.447)	Top-5 acc 85.938 (86.290)	lr 0.00001
Train [119][580/3239]	Time 0.229 (0.588)	Data Time 0.001 (0.070)	Loss 2.2326 (2.3504)	Entropy 0.53261 (0.53169)	Top-1 acc 68.750 (67.471)	Top-5 acc 87.891 (86.298)	lr 0.00001
Train [119][590/3239]	Time 0.233 (0.585)	Data Time 0.001 (0.069)	Loss 2.3626 (2.3505)	Entropy 0.53298 (0.53171)	Top-1 acc 69.531 (67.457)	Top-5 acc 85.547 (86.288)	lr 0.00001
Train [119][600/3239]	Time 0.229 (0.582)	Data Time 0.001 (0.068)	Loss 2.3546 (2.3503)	Entropy 0.53264 (0.53173)	Top-1 acc 64.453 (67.462)	Top-5 acc 89.844 (86.298)	lr 0.00001
Train [119][610/3239]	Time 0.236 (0.579)	Data Time 0.001 (0.067)	Loss 2.4460 (2.3498)	Entropy 0.53273 (0.53174)	Top-1 acc 63.281 (67.465)	Top-5 acc 85.938 (86.297)	lr 0.00001
Train [119][620/3239]	Time 0.469 (0.577)	Data Time 0.002 (0.066)	Loss 2.3433 (2.3488)	Entropy 0.53298 (0.53176)	Top-1 acc 70.703 (67.486)	Top-5 acc 87.109 (86.308)	lr 0.00001
Train [119][630/3239]	Time 0.237 (0.576)	Data Time 0.001 (0.065)	Loss 2.3332 (2.3478)	Entropy 0.53312 (0.53178)	Top-1 acc 66.406 (67.510)	Top-5 acc 85.938 (86.326)	lr 0.00001
Train [119][640/3239]	Time 0.238 (0.573)	Data Time 0.001 (0.064)	Loss 2.3071 (2.3481)	Entropy 0.53356 (0.53181)	Top-1 acc 64.453 (67.494)	Top-5 acc 87.891 (86.320)	lr 0.00001
Train [119][650/3239]	Time 0.234 (0.571)	Data Time 0.001 (0.063)	Loss 2.2455 (2.3473)	Entropy 0.53367 (0.53183)	Top-1 acc 70.703 (67.520)	Top-5 acc 87.109 (86.337)	lr 0.00001
Train [119][660/3239]	Time 0.238 (0.568)	Data Time 0.001 (0.062)	Loss 2.4769 (2.3464)	Entropy 0.53360 (0.53186)	Top-1 acc 62.500 (67.537)	Top-5 acc 84.766 (86.356)	lr 0.00001
Train [119][670/3239]	Time 0.265 (0.566)	Data Time 0.001 (0.061)	Loss 2.3824 (2.3459)	Entropy 0.53378 (0.53189)	Top-1 acc 65.625 (67.540)	Top-5 acc 86.328 (86.376)	lr 0.00001
Train [119][680/3239]	Time 0.241 (0.564)	Data Time 0.001 (0.060)	Loss 2.3682 (2.3455)	Entropy 0.53390 (0.53191)	Top-1 acc 68.750 (67.559)	Top-5 acc 86.328 (86.383)	lr 0.00001
Train [119][690/3239]	Time 0.226 (0.562)	Data Time 0.001 (0.059)	Loss 2.3770 (2.3452)	Entropy 0.53391 (0.53194)	Top-1 acc 69.531 (67.567)	Top-5 acc 85.547 (86.385)	lr 0.00001
Train [119][700/3239]	Time 0.229 (0.560)	Data Time 0.001 (0.058)	Loss 2.1871 (2.3453)	Entropy 0.53408 (0.53197)	Top-1 acc 71.484 (67.554)	Top-5 acc 89.844 (86.386)	lr 0.00001
Train [119][710/3239]	Time 0.316 (0.558)	Data Time 0.001 (0.057)	Loss 2.4579 (2.3453)	Entropy 0.53412 (0.53200)	Top-1 acc 65.234 (67.542)	Top-5 acc 85.547 (86.387)	lr 0.00001
Train [119][720/3239]	Time 0.310 (0.556)	Data Time 0.002 (0.057)	Loss 2.3248 (2.3453)	Entropy 0.53400 (0.53203)	Top-1 acc 69.141 (67.549)	Top-5 acc 86.719 (86.379)	lr 0.00001
Train [119][730/3239]	Time 0.239 (0.555)	Data Time 0.001 (0.056)	Loss 2.2190 (2.3459)	Entropy 0.53406 (0.53206)	Top-1 acc 70.703 (67.543)	Top-5 acc 88.672 (86.366)	lr 0.00001
Train [119][740/3239]	Time 0.232 (0.553)	Data Time 0.001 (0.055)	Loss 2.3453 (2.3459)	Entropy 0.53410 (0.53208)	Top-1 acc 67.578 (67.555)	Top-5 acc 85.156 (86.359)	lr 0.00001
Train [119][750/3239]	Time 0.245 (0.551)	Data Time 0.001 (0.054)	Loss 2.2983 (2.3451)	Entropy 0.53397 (0.53211)	Top-1 acc 69.922 (67.573)	Top-5 acc 87.109 (86.378)	lr 0.00001
Train [119][760/3239]	Time 0.244 (0.549)	Data Time 0.001 (0.054)	Loss 2.4337 (2.3447)	Entropy 0.53411 (0.53213)	Top-1 acc 65.625 (67.583)	Top-5 acc 84.375 (86.389)	lr 0.00001
Train [119][770/3239]	Time 0.229 (0.547)	Data Time 0.001 (0.053)	Loss 2.4151 (2.3455)	Entropy 0.53391 (0.53216)	Top-1 acc 67.188 (67.549)	Top-5 acc 86.719 (86.370)	lr 0.00001
Train [119][780/3239]	Time 0.360 (0.546)	Data Time 0.001 (0.052)	Loss 2.3074 (2.3450)	Entropy 0.53377 (0.53218)	Top-1 acc 68.750 (67.555)	Top-5 acc 86.719 (86.380)	lr 0.00001
Train [119][790/3239]	Time 0.228 (0.544)	Data Time 0.001 (0.052)	Loss 2.3029 (2.3455)	Entropy 0.53346 (0.53220)	Top-1 acc 67.969 (67.536)	Top-5 acc 88.672 (86.382)	lr 0.00001
Train [119][800/3239]	Time 0.242 (0.542)	Data Time 0.001 (0.051)	Loss 2.3515 (2.3453)	Entropy 0.53323 (0.53221)	Top-1 acc 70.703 (67.549)	Top-5 acc 84.375 (86.374)	lr 0.00001
Train [119][810/3239]	Time 0.230 (0.540)	Data Time 0.001 (0.051)	Loss 2.4794 (2.3461)	Entropy 0.53320 (0.53223)	Top-1 acc 63.281 (67.520)	Top-5 acc 84.766 (86.363)	lr 0.00001
Train [119][820/3239]	Time 0.350 (0.541)	Data Time 0.002 (0.050)	Loss 2.0956 (2.3459)	Entropy 0.53342 (0.53224)	Top-1 acc 73.438 (67.529)	Top-5 acc 90.234 (86.371)	lr 0.00001
Train [119][830/3239]	Time 0.272 (0.604)	Data Time 0.032 (0.049)	Loss 2.3911 (2.3460)	Entropy 0.53336 (0.53225)	Top-1 acc 64.844 (67.525)	Top-5 acc 86.719 (86.372)	lr 0.00001
Train [119][840/3239]	Time 0.235 (0.602)	Data Time 0.002 (0.049)	Loss 2.5558 (2.3463)	Entropy 0.53365 (0.53227)	Top-1 acc 62.891 (67.526)	Top-5 acc 83.594 (86.360)	lr 0.00001
Train [119][850/3239]	Time 0.264 (0.600)	Data Time 0.002 (0.048)	Loss 2.2296 (2.3460)	Entropy 0.53322 (0.53228)	Top-1 acc 71.094 (67.523)	Top-5 acc 87.500 (86.364)	lr 0.00001
Train [119][860/3239]	Time 0.218 (0.597)	Data Time 0.002 (0.048)	Loss 2.4571 (2.3456)	Entropy 0.53310 (0.53229)	Top-1 acc 65.625 (67.532)	Top-5 acc 84.766 (86.360)	lr 0.00001
Train [119][870/3239]	Time 0.345 (0.595)	Data Time 0.001 (0.047)	Loss 2.3600 (2.3458)	Entropy 0.53314 (0.53230)	Top-1 acc 70.312 (67.539)	Top-5 acc 85.156 (86.357)	lr 0.00001
Train [119][880/3239]	Time 0.267 (0.593)	Data Time 0.001 (0.047)	Loss 2.4660 (2.3462)	Entropy 0.53335 (0.53231)	Top-1 acc 64.844 (67.532)	Top-5 acc 83.984 (86.351)	lr 0.00001
Train [119][890/3239]	Time 0.230 (0.591)	Data Time 0.001 (0.046)	Loss 2.3508 (2.3463)	Entropy 0.53344 (0.53232)	Top-1 acc 66.016 (67.520)	Top-5 acc 85.938 (86.353)	lr 0.00001
Train [119][900/3239]	Time 0.237 (0.590)	Data Time 0.001 (0.046)	Loss 2.3652 (2.3457)	Entropy 0.53291 (0.53234)	Top-1 acc 67.969 (67.543)	Top-5 acc 85.156 (86.359)	lr 0.00001
Train [119][910/3239]	Time 0.235 (0.588)	Data Time 0.001 (0.045)	Loss 2.4321 (2.3463)	Entropy 0.53262 (0.53234)	Top-1 acc 65.234 (67.533)	Top-5 acc 82.812 (86.336)	lr 0.00001
Train [119][920/3239]	Time 0.226 (0.586)	Data Time 0.001 (0.045)	Loss 2.6174 (2.3460)	Entropy 0.53301 (0.53235)	Top-1 acc 60.156 (67.548)	Top-5 acc 80.859 (86.341)	lr 0.00001
Train [119][930/3239]	Time 0.237 (0.584)	Data Time 0.001 (0.044)	Loss 2.3001 (2.3467)	Entropy 0.53294 (0.53235)	Top-1 acc 68.750 (67.518)	Top-5 acc 85.547 (86.331)	lr 0.00001
Train [119][940/3239]	Time 0.328 (0.582)	Data Time 0.001 (0.044)	Loss 2.3449 (2.3471)	Entropy 0.53220 (0.53235)	Top-1 acc 64.844 (67.506)	Top-5 acc 86.328 (86.328)	lr 0.00001
Train [119][950/3239]	Time 0.229 (0.580)	Data Time 0.001 (0.043)	Loss 2.4331 (2.3464)	Entropy 0.53216 (0.53235)	Top-1 acc 66.016 (67.527)	Top-5 acc 84.375 (86.334)	lr 0.00001
Train [119][960/3239]	Time 0.279 (0.579)	Data Time 0.001 (0.043)	Loss 2.3116 (2.3461)	Entropy 0.53214 (0.53235)	Top-1 acc 68.359 (67.541)	Top-5 acc 85.938 (86.336)	lr 0.00001
Train [119][970/3239]	Time 0.238 (0.577)	Data Time 0.001 (0.043)	Loss 2.3204 (2.3453)	Entropy 0.53224 (0.53235)	Top-1 acc 67.578 (67.556)	Top-5 acc 89.453 (86.358)	lr 0.00001
Train [119][980/3239]	Time 0.279 (0.575)	Data Time 0.001 (0.042)	Loss 2.3564 (2.3455)	Entropy 0.53259 (0.53235)	Top-1 acc 66.016 (67.551)	Top-5 acc 87.500 (86.353)	lr 0.00001
Train [119][990/3239]	Time 0.253 (0.575)	Data Time 0.001 (0.042)	Loss 2.3341 (2.3456)	Entropy 0.53300 (0.53235)	Top-1 acc 65.234 (67.543)	Top-5 acc 87.109 (86.352)	lr 0.00001
Train [119][1000/3239]	Time 0.291 (0.574)	Data Time 0.002 (0.041)	Loss 2.3984 (2.3457)	Entropy 0.53292 (0.53236)	Top-1 acc 66.797 (67.550)	Top-5 acc 83.984 (86.347)	lr 0.00001
Train [119][1010/3239]	Time 0.243 (0.573)	Data Time 0.001 (0.041)	Loss 2.2830 (2.3452)	Entropy 0.53270 (0.53236)	Top-1 acc 68.359 (67.570)	Top-5 acc 85.938 (86.351)	lr 0.00001
Train [119][1020/3239]	Time 0.246 (0.572)	Data Time 0.001 (0.041)	Loss 2.2372 (2.3445)	Entropy 0.53259 (0.53237)	Top-1 acc 71.094 (67.585)	Top-5 acc 89.453 (86.363)	lr 0.00001
Train [119][1030/3239]	Time 0.368 (0.571)	Data Time 0.001 (0.040)	Loss 2.4172 (2.3447)	Entropy 0.53261 (0.53237)	Top-1 acc 64.844 (67.583)	Top-5 acc 86.328 (86.362)	lr 0.00001
Train [119][1040/3239]	Time 0.266 (0.569)	Data Time 0.001 (0.040)	Loss 2.2942 (2.3449)	Entropy 0.53258 (0.53237)	Top-1 acc 67.188 (67.582)	Top-5 acc 87.500 (86.356)	lr 0.00001
Train [119][1050/3239]	Time 0.242 (0.568)	Data Time 0.001 (0.040)	Loss 2.5648 (2.3447)	Entropy 0.53248 (0.53237)	Top-1 acc 61.719 (67.586)	Top-5 acc 80.469 (86.356)	lr 0.00001
Train [119][1060/3239]	Time 0.264 (0.567)	Data Time 0.001 (0.039)	Loss 2.7735 (2.3457)	Entropy 0.53271 (0.53237)	Top-1 acc 57.031 (67.560)	Top-5 acc 79.297 (86.336)	lr 0.00001
Train [119][1070/3239]	Time 0.239 (0.565)	Data Time 0.001 (0.039)	Loss 2.4077 (2.3456)	Entropy 0.53274 (0.53238)	Top-1 acc 69.531 (67.567)	Top-5 acc 84.766 (86.340)	lr 0.00001
Train [119][1080/3239]	Time 0.237 (0.564)	Data Time 0.001 (0.038)	Loss 2.2811 (2.3455)	Entropy 0.53278 (0.53238)	Top-1 acc 71.094 (67.576)	Top-5 acc 88.672 (86.347)	lr 0.00001
Train [119][1090/3239]	Time 0.236 (0.563)	Data Time 0.002 (0.038)	Loss 2.3386 (2.3454)	Entropy 0.53288 (0.53239)	Top-1 acc 67.969 (67.578)	Top-5 acc 85.938 (86.344)	lr 0.00001
Train [119][1100/3239]	Time 0.333 (0.561)	Data Time 0.001 (0.038)	Loss 2.1450 (2.3456)	Entropy 0.53283 (0.53239)	Top-1 acc 71.484 (67.569)	Top-5 acc 91.016 (86.340)	lr 0.00001
Train [119][1110/3239]	Time 0.249 (0.560)	Data Time 0.001 (0.037)	Loss 2.1157 (2.3456)	Entropy 0.53294 (0.53239)	Top-1 acc 72.656 (67.563)	Top-5 acc 91.406 (86.347)	lr 0.00001
Train [119][1120/3239]	Time 0.242 (0.559)	Data Time 0.001 (0.037)	Loss 2.3309 (2.3466)	Entropy 0.53312 (0.53240)	Top-1 acc 64.453 (67.543)	Top-5 acc 86.328 (86.339)	lr 0.00001
Train [119][1130/3239]	Time 0.235 (0.558)	Data Time 0.001 (0.037)	Loss 2.4371 (2.3468)	Entropy 0.53364 (0.53241)	Top-1 acc 68.359 (67.551)	Top-5 acc 81.641 (86.324)	lr 0.00001
Train [119][1140/3239]	Time 0.241 (0.556)	Data Time 0.001 (0.037)	Loss 2.2602 (2.3463)	Entropy 0.53409 (0.53242)	Top-1 acc 67.188 (67.559)	Top-5 acc 87.109 (86.339)	lr 0.00001
Train [119][1150/3239]	Time 0.273 (0.555)	Data Time 0.003 (0.036)	Loss 2.2850 (2.3464)	Entropy 0.53419 (0.53243)	Top-1 acc 69.922 (67.559)	Top-5 acc 85.938 (86.334)	lr 0.00001
Train [119][1160/3239]	Time 0.227 (0.554)	Data Time 0.001 (0.036)	Loss 2.1298 (2.3465)	Entropy 0.53431 (0.53245)	Top-1 acc 73.047 (67.563)	Top-5 acc 88.281 (86.335)	lr 0.00001
Train [119][1170/3239]	Time 0.227 (0.553)	Data Time 0.001 (0.036)	Loss 2.2900 (2.3464)	Entropy 0.53438 (0.53247)	Top-1 acc 68.359 (67.567)	Top-5 acc 86.719 (86.339)	lr 0.00001
Train [119][1180/3239]	Time 0.236 (0.552)	Data Time 0.001 (0.035)	Loss 2.4571 (2.3461)	Entropy 0.53457 (0.53248)	Top-1 acc 60.938 (67.569)	Top-5 acc 84.375 (86.346)	lr 0.00001
Train [119][1190/3239]	Time 0.257 (0.550)	Data Time 0.001 (0.035)	Loss 2.6447 (2.3460)	Entropy 0.53437 (0.53250)	Top-1 acc 62.109 (67.572)	Top-5 acc 79.297 (86.347)	lr 0.00001
Train [119][1200/3239]	Time 0.250 (0.550)	Data Time 0.001 (0.035)	Loss 2.3361 (2.3462)	Entropy 0.53433 (0.53252)	Top-1 acc 67.578 (67.567)	Top-5 acc 88.281 (86.345)	lr 0.00001
Train [119][1210/3239]	Time 0.240 (0.549)	Data Time 0.001 (0.035)	Loss 2.2139 (2.3462)	Entropy 0.53413 (0.53253)	Top-1 acc 73.047 (67.572)	Top-5 acc 85.938 (86.340)	lr 0.00001
Train [119][1220/3239]	Time 0.247 (0.548)	Data Time 0.001 (0.034)	Loss 2.1926 (2.3469)	Entropy 0.53452 (0.53254)	Top-1 acc 72.656 (67.560)	Top-5 acc 89.062 (86.329)	lr 0.00001
Train [119][1230/3239]	Time 0.228 (0.546)	Data Time 0.001 (0.034)	Loss 2.3069 (2.3464)	Entropy 0.53458 (0.53256)	Top-1 acc 66.016 (67.574)	Top-5 acc 87.109 (86.334)	lr 0.00001
Train [119][1240/3239]	Time 0.230 (0.545)	Data Time 0.001 (0.034)	Loss 2.1865 (2.3461)	Entropy 0.53463 (0.53258)	Top-1 acc 73.047 (67.581)	Top-5 acc 89.844 (86.336)	lr 0.00001
Train [119][1250/3239]	Time 0.246 (0.544)	Data Time 0.001 (0.033)	Loss 2.4776 (2.3458)	Entropy 0.53466 (0.53259)	Top-1 acc 62.891 (67.578)	Top-5 acc 82.422 (86.342)	lr 0.00001
Train [119][1260/3239]	Time 0.332 (0.543)	Data Time 0.001 (0.033)	Loss 2.4411 (2.3457)	Entropy 0.53463 (0.53261)	Top-1 acc 64.453 (67.582)	Top-5 acc 84.766 (86.345)	lr 0.00001
Train [119][1270/3239]	Time 0.269 (0.542)	Data Time 0.001 (0.033)	Loss 2.6648 (2.3457)	Entropy 0.53434 (0.53263)	Top-1 acc 59.766 (67.580)	Top-5 acc 81.250 (86.346)	lr 0.00001
Train [119][1280/3239]	Time 0.235 (0.541)	Data Time 0.001 (0.033)	Loss 2.3470 (2.3452)	Entropy 0.53443 (0.53264)	Top-1 acc 63.672 (67.590)	Top-5 acc 85.547 (86.356)	lr 0.00001
Train [119][1290/3239]	Time 0.241 (0.540)	Data Time 0.001 (0.032)	Loss 2.2403 (2.3451)	Entropy 0.53462 (0.53265)	Top-1 acc 69.531 (67.597)	Top-5 acc 88.672 (86.357)	lr 0.00001
Train [119][1300/3239]	Time 0.243 (0.539)	Data Time 0.001 (0.032)	Loss 2.4168 (2.3455)	Entropy 0.53453 (0.53267)	Top-1 acc 69.141 (67.588)	Top-5 acc 83.594 (86.347)	lr 0.00001
Train [119][1310/3239]	Time 0.320 (0.539)	Data Time 0.002 (0.032)	Loss 2.2932 (2.3458)	Entropy 0.53431 (0.53268)	Top-1 acc 69.922 (67.588)	Top-5 acc 86.719 (86.340)	lr 0.00001
Train [119][1320/3239]	Time 0.224 (0.538)	Data Time 0.001 (0.032)	Loss 2.2969 (2.3452)	Entropy 0.53393 (0.53269)	Top-1 acc 67.578 (67.599)	Top-5 acc 86.328 (86.350)	lr 0.00001
Train [119][1330/3239]	Time 0.359 (0.537)	Data Time 0.001 (0.032)	Loss 2.2704 (2.3450)	Entropy 0.53388 (0.53270)	Top-1 acc 64.844 (67.605)	Top-5 acc 87.109 (86.353)	lr 0.00001
Train [119][1340/3239]	Time 0.235 (0.536)	Data Time 0.001 (0.031)	Loss 2.0983 (2.3448)	Entropy 0.53383 (0.53271)	Top-1 acc 72.656 (67.611)	Top-5 acc 91.016 (86.357)	lr 0.00001
Train [119][1350/3239]	Time 0.249 (0.535)	Data Time 0.009 (0.031)	Loss 2.3676 (2.3442)	Entropy 0.53388 (0.53272)	Top-1 acc 66.797 (67.630)	Top-5 acc 85.938 (86.365)	lr 0.00001
Train [119][1360/3239]	Time 0.235 (0.534)	Data Time 0.002 (0.031)	Loss 2.2858 (2.3448)	Entropy 0.53408 (0.53273)	Top-1 acc 70.703 (67.617)	Top-5 acc 86.328 (86.354)	lr 0.00001
Train [119][1370/3239]	Time 0.228 (0.533)	Data Time 0.001 (0.031)	Loss 2.6423 (2.3446)	Entropy 0.53427 (0.53274)	Top-1 acc 59.766 (67.626)	Top-5 acc 83.203 (86.359)	lr 0.00001
Train [119][1380/3239]	Time 0.232 (0.533)	Data Time 0.001 (0.030)	Loss 2.3677 (2.3451)	Entropy 0.53434 (0.53275)	Top-1 acc 66.797 (67.617)	Top-5 acc 89.062 (86.349)	lr 0.00001
Train [119][1390/3239]	Time 0.236 (0.532)	Data Time 0.001 (0.030)	Loss 2.3511 (2.3453)	Entropy 0.53424 (0.53276)	Top-1 acc 67.969 (67.609)	Top-5 acc 83.594 (86.341)	lr 0.00001
Train [119][1400/3239]	Time 0.259 (0.532)	Data Time 0.001 (0.030)	Loss 2.1352 (2.3448)	Entropy 0.53437 (0.53277)	Top-1 acc 72.266 (67.620)	Top-5 acc 89.844 (86.352)	lr 0.00001
Train [119][1410/3239]	Time 0.242 (0.531)	Data Time 0.001 (0.030)	Loss 2.3525 (2.3450)	Entropy 0.53419 (0.53278)	Top-1 acc 67.969 (67.620)	Top-5 acc 85.938 (86.346)	lr 0.00001
Train [119][1420/3239]	Time 0.368 (0.530)	Data Time 0.001 (0.030)	Loss 2.4212 (2.3452)	Entropy 0.53399 (0.53279)	Top-1 acc 63.672 (67.610)	Top-5 acc 83.984 (86.339)	lr 0.00001
Train [119][1430/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.029)	Loss 2.2574 (2.3449)	Entropy 0.53416 (0.53280)	Top-1 acc 71.094 (67.621)	Top-5 acc 88.672 (86.341)	lr 0.00001
Train [119][1440/3239]	Time 0.236 (0.529)	Data Time 0.001 (0.029)	Loss 2.3750 (2.3448)	Entropy 0.53390 (0.53281)	Top-1 acc 66.016 (67.624)	Top-5 acc 88.281 (86.344)	lr 0.00001
Train [119][1450/3239]	Time 0.251 (0.528)	Data Time 0.001 (0.029)	Loss 2.3191 (2.3442)	Entropy 0.53404 (0.53282)	Top-1 acc 67.578 (67.638)	Top-5 acc 85.156 (86.355)	lr 0.00001
Train [119][1460/3239]	Time 0.236 (0.527)	Data Time 0.001 (0.029)	Loss 2.3775 (2.3443)	Entropy 0.53428 (0.53283)	Top-1 acc 64.844 (67.635)	Top-5 acc 87.891 (86.353)	lr 0.00001
Train [119][1470/3239]	Time 0.239 (0.526)	Data Time 0.002 (0.029)	Loss 2.3048 (2.3446)	Entropy 0.53430 (0.53284)	Top-1 acc 66.406 (67.625)	Top-5 acc 87.500 (86.348)	lr 0.00001
Train [119][1480/3239]	Time 0.351 (0.560)	Data Time 0.004 (0.029)	Loss 2.5691 (2.3451)	Entropy 0.53433 (0.53285)	Top-1 acc 61.719 (67.614)	Top-5 acc 82.031 (86.339)	lr 0.00001
Train [119][1490/3239]	Time 0.484 (0.560)	Data Time 0.002 (0.028)	Loss 2.2075 (2.3447)	Entropy 0.53455 (0.53286)	Top-1 acc 70.703 (67.626)	Top-5 acc 87.500 (86.345)	lr 0.00001
Train [119][1500/3239]	Time 0.311 (0.560)	Data Time 0.002 (0.028)	Loss 2.3509 (2.3445)	Entropy 0.53433 (0.53287)	Top-1 acc 70.312 (67.637)	Top-5 acc 87.500 (86.350)	lr 0.00001
Train [119][1510/3239]	Time 0.250 (0.560)	Data Time 0.001 (0.028)	Loss 2.3465 (2.3451)	Entropy 0.53444 (0.53288)	Top-1 acc 68.750 (67.631)	Top-5 acc 86.328 (86.338)	lr 0.00001
Train [119][1520/3239]	Time 0.285 (0.559)	Data Time 0.002 (0.028)	Loss 2.1122 (2.3453)	Entropy 0.53391 (0.53289)	Top-1 acc 73.438 (67.629)	Top-5 acc 88.281 (86.335)	lr 0.00001
Train [119][1530/3239]	Time 0.241 (0.558)	Data Time 0.001 (0.028)	Loss 2.4410 (2.3449)	Entropy 0.53386 (0.53290)	Top-1 acc 66.016 (67.639)	Top-5 acc 85.938 (86.344)	lr 0.00001
Train [119][1540/3239]	Time 0.245 (0.557)	Data Time 0.001 (0.028)	Loss 2.3345 (2.3450)	Entropy 0.53409 (0.53290)	Top-1 acc 67.969 (67.634)	Top-5 acc 88.672 (86.347)	lr 0.00001
Train [119][1550/3239]	Time 0.266 (0.557)	Data Time 0.001 (0.027)	Loss 2.2720 (2.3451)	Entropy 0.53368 (0.53291)	Top-1 acc 69.531 (67.639)	Top-5 acc 89.062 (86.349)	lr 0.00001
Train [119][1560/3239]	Time 0.271 (0.556)	Data Time 0.001 (0.027)	Loss 2.3497 (2.3450)	Entropy 0.53371 (0.53291)	Top-1 acc 65.234 (67.640)	Top-5 acc 84.766 (86.347)	lr 0.00001
Train [119][1570/3239]	Time 0.234 (0.555)	Data Time 0.001 (0.027)	Loss 2.4026 (2.3450)	Entropy 0.53371 (0.53292)	Top-1 acc 66.016 (67.638)	Top-5 acc 86.719 (86.347)	lr 0.00001
Train [119][1580/3239]	Time 0.356 (0.554)	Data Time 0.001 (0.027)	Loss 2.5661 (2.3452)	Entropy 0.53357 (0.53293)	Top-1 acc 60.938 (67.631)	Top-5 acc 85.938 (86.348)	lr 0.00001
Train [119][1590/3239]	Time 0.238 (0.553)	Data Time 0.001 (0.027)	Loss 2.1611 (2.3448)	Entropy 0.53360 (0.53293)	Top-1 acc 72.656 (67.647)	Top-5 acc 91.016 (86.359)	lr 0.00001
Train [119][1600/3239]	Time 0.266 (0.553)	Data Time 0.001 (0.027)	Loss 2.3650 (2.3446)	Entropy 0.53317 (0.53293)	Top-1 acc 67.578 (67.645)	Top-5 acc 85.938 (86.364)	lr 0.00001
Train [119][1610/3239]	Time 0.237 (0.552)	Data Time 0.001 (0.026)	Loss 2.4674 (2.3446)	Entropy 0.53267 (0.53293)	Top-1 acc 64.844 (67.645)	Top-5 acc 85.938 (86.367)	lr 0.00001
Train [119][1620/3239]	Time 0.232 (0.551)	Data Time 0.001 (0.026)	Loss 2.3109 (2.3453)	Entropy 0.53281 (0.53293)	Top-1 acc 67.969 (67.630)	Top-5 acc 86.719 (86.356)	lr 0.00001
Train [119][1630/3239]	Time 0.229 (0.550)	Data Time 0.001 (0.026)	Loss 2.2733 (2.3454)	Entropy 0.53305 (0.53293)	Top-1 acc 72.266 (67.629)	Top-5 acc 85.547 (86.354)	lr 0.00001
Train [119][1640/3239]	Time 0.238 (0.549)	Data Time 0.002 (0.026)	Loss 2.3119 (2.3456)	Entropy 0.53316 (0.53293)	Top-1 acc 68.359 (67.622)	Top-5 acc 85.156 (86.350)	lr 0.00001
Train [119][1650/3239]	Time 0.321 (0.549)	Data Time 0.001 (0.026)	Loss 2.3923 (2.3457)	Entropy 0.53284 (0.53293)	Top-1 acc 66.016 (67.616)	Top-5 acc 83.984 (86.346)	lr 0.00001
Train [119][1660/3239]	Time 0.225 (0.548)	Data Time 0.001 (0.026)	Loss 2.2431 (2.3453)	Entropy 0.53295 (0.53293)	Top-1 acc 66.406 (67.619)	Top-5 acc 88.281 (86.353)	lr 0.00001
Train [119][1670/3239]	Time 0.230 (0.547)	Data Time 0.001 (0.026)	Loss 2.4805 (2.3454)	Entropy 0.53280 (0.53293)	Top-1 acc 64.844 (67.619)	Top-5 acc 83.984 (86.350)	lr 0.00001
Train [119][1680/3239]	Time 0.225 (0.546)	Data Time 0.001 (0.025)	Loss 2.1876 (2.3460)	Entropy 0.53270 (0.53293)	Top-1 acc 73.828 (67.609)	Top-5 acc 88.672 (86.340)	lr 0.00001
Train [119][1690/3239]	Time 0.247 (0.545)	Data Time 0.001 (0.025)	Loss 2.1871 (2.3462)	Entropy 0.53255 (0.53293)	Top-1 acc 69.922 (67.602)	Top-5 acc 88.281 (86.334)	lr 0.00001
Train [119][1700/3239]	Time 0.308 (0.545)	Data Time 0.002 (0.025)	Loss 2.2118 (2.3462)	Entropy 0.53268 (0.53293)	Top-1 acc 70.703 (67.607)	Top-5 acc 88.281 (86.335)	lr 0.00001
Train [119][1710/3239]	Time 0.253 (0.545)	Data Time 0.001 (0.025)	Loss 2.4064 (2.3460)	Entropy 0.53276 (0.53293)	Top-1 acc 66.797 (67.610)	Top-5 acc 85.938 (86.336)	lr 0.00001
Train [119][1720/3239]	Time 0.234 (0.544)	Data Time 0.001 (0.025)	Loss 2.3521 (2.3461)	Entropy 0.53295 (0.53293)	Top-1 acc 67.969 (67.613)	Top-5 acc 87.891 (86.336)	lr 0.00001
Train [119][1730/3239]	Time 0.239 (0.543)	Data Time 0.001 (0.025)	Loss 2.2374 (2.3462)	Entropy 0.53318 (0.53293)	Top-1 acc 66.797 (67.605)	Top-5 acc 89.844 (86.336)	lr 0.00001
Train [119][1740/3239]	Time 0.254 (0.543)	Data Time 0.001 (0.025)	Loss 2.4575 (2.3462)	Entropy 0.53282 (0.53293)	Top-1 acc 66.406 (67.606)	Top-5 acc 82.812 (86.336)	lr 0.00001
Train [119][1750/3239]	Time 0.254 (0.542)	Data Time 0.002 (0.024)	Loss 2.3860 (2.3463)	Entropy 0.53266 (0.53293)	Top-1 acc 64.844 (67.600)	Top-5 acc 83.594 (86.333)	lr 0.00001
Train [119][1760/3239]	Time 0.255 (0.541)	Data Time 0.001 (0.024)	Loss 2.5953 (2.3464)	Entropy 0.53220 (0.53292)	Top-1 acc 64.062 (67.599)	Top-5 acc 81.250 (86.329)	lr 0.00001
Train [119][1770/3239]	Time 0.279 (0.541)	Data Time 0.002 (0.024)	Loss 2.2091 (2.3461)	Entropy 0.53241 (0.53292)	Top-1 acc 73.047 (67.610)	Top-5 acc 87.500 (86.332)	lr 0.00001
Train [119][1780/3239]	Time 0.241 (0.540)	Data Time 0.001 (0.024)	Loss 2.2752 (2.3465)	Entropy 0.53231 (0.53292)	Top-1 acc 67.578 (67.597)	Top-5 acc 86.719 (86.325)	lr 0.00001
Train [119][1790/3239]	Time 0.270 (0.540)	Data Time 0.001 (0.024)	Loss 2.4619 (2.3468)	Entropy 0.53236 (0.53291)	Top-1 acc 63.281 (67.591)	Top-5 acc 83.594 (86.318)	lr 0.00001
Train [119][1800/3239]	Time 0.293 (0.540)	Data Time 0.002 (0.024)	Loss 2.3059 (2.3468)	Entropy 0.53236 (0.53291)	Top-1 acc 70.312 (67.596)	Top-5 acc 86.719 (86.317)	lr 0.00001
Train [119][1810/3239]	Time 0.333 (0.539)	Data Time 0.001 (0.024)	Loss 2.2650 (2.3464)	Entropy 0.53263 (0.53291)	Top-1 acc 69.922 (67.607)	Top-5 acc 87.891 (86.325)	lr 0.00001
Train [119][1820/3239]	Time 0.232 (0.539)	Data Time 0.001 (0.024)	Loss 2.2708 (2.3462)	Entropy 0.53264 (0.53291)	Top-1 acc 68.359 (67.614)	Top-5 acc 88.281 (86.327)	lr 0.00001
Train [119][1830/3239]	Time 0.250 (0.538)	Data Time 0.001 (0.023)	Loss 2.4415 (2.3459)	Entropy 0.53262 (0.53290)	Top-1 acc 63.281 (67.612)	Top-5 acc 83.984 (86.331)	lr 0.00001
Train [119][1840/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.023)	Loss 2.3274 (2.3461)	Entropy 0.53205 (0.53290)	Top-1 acc 67.188 (67.608)	Top-5 acc 87.109 (86.329)	lr 0.00001
Train [119][1850/3239]	Time 0.288 (0.537)	Data Time 0.002 (0.023)	Loss 2.3253 (2.3467)	Entropy 0.53243 (0.53290)	Top-1 acc 65.625 (67.593)	Top-5 acc 85.547 (86.312)	lr 0.00001
Train [119][1860/3239]	Time 0.249 (0.536)	Data Time 0.002 (0.023)	Loss 2.2169 (2.3466)	Entropy 0.53209 (0.53290)	Top-1 acc 72.266 (67.599)	Top-5 acc 87.109 (86.311)	lr 0.00001
Train [119][1870/3239]	Time 0.231 (0.536)	Data Time 0.001 (0.023)	Loss 2.3468 (2.3466)	Entropy 0.53220 (0.53289)	Top-1 acc 67.188 (67.593)	Top-5 acc 85.938 (86.313)	lr 0.00001
Train [119][1880/3239]	Time 0.342 (0.535)	Data Time 0.001 (0.023)	Loss 2.3898 (2.3465)	Entropy 0.53228 (0.53289)	Top-1 acc 64.453 (67.595)	Top-5 acc 85.938 (86.314)	lr 0.00001
Train [119][1890/3239]	Time 0.279 (0.534)	Data Time 0.001 (0.023)	Loss 2.2703 (2.3464)	Entropy 0.53227 (0.53289)	Top-1 acc 67.188 (67.600)	Top-5 acc 87.109 (86.314)	lr 0.00001
Train [119][1900/3239]	Time 0.242 (0.534)	Data Time 0.001 (0.023)	Loss 2.3439 (2.3462)	Entropy 0.53252 (0.53288)	Top-1 acc 64.062 (67.600)	Top-5 acc 87.500 (86.318)	lr 0.00001
Train [119][1910/3239]	Time 0.237 (0.533)	Data Time 0.001 (0.023)	Loss 2.5461 (2.3467)	Entropy 0.53273 (0.53288)	Top-1 acc 63.672 (67.587)	Top-5 acc 84.375 (86.312)	lr 0.00001
Train [119][1920/3239]	Time 0.234 (0.533)	Data Time 0.001 (0.022)	Loss 2.3388 (2.3466)	Entropy 0.53238 (0.53288)	Top-1 acc 68.359 (67.589)	Top-5 acc 87.891 (86.314)	lr 0.00001
Train [119][1930/3239]	Time 0.231 (0.532)	Data Time 0.001 (0.022)	Loss 2.2204 (2.3467)	Entropy 0.53260 (0.53288)	Top-1 acc 69.531 (67.582)	Top-5 acc 87.891 (86.314)	lr 0.00001
Train [119][1940/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.022)	Loss 2.4623 (2.3472)	Entropy 0.53262 (0.53288)	Top-1 acc 67.969 (67.569)	Top-5 acc 84.766 (86.306)	lr 0.00001
Train [119][1950/3239]	Time 0.236 (0.531)	Data Time 0.001 (0.022)	Loss 2.2287 (2.3472)	Entropy 0.53245 (0.53288)	Top-1 acc 69.141 (67.567)	Top-5 acc 89.062 (86.306)	lr 0.00001
Train [119][1960/3239]	Time 0.255 (0.530)	Data Time 0.001 (0.022)	Loss 2.3497 (2.3472)	Entropy 0.53265 (0.53287)	Top-1 acc 68.750 (67.571)	Top-5 acc 86.328 (86.307)	lr 0.00001
Train [119][1970/3239]	Time 0.329 (0.530)	Data Time 0.001 (0.022)	Loss 2.6111 (2.3483)	Entropy 0.53281 (0.53287)	Top-1 acc 59.375 (67.538)	Top-5 acc 83.594 (86.288)	lr 0.00001
Train [119][1980/3239]	Time 0.291 (0.529)	Data Time 0.002 (0.022)	Loss 2.5034 (2.3484)	Entropy 0.53262 (0.53287)	Top-1 acc 66.016 (67.537)	Top-5 acc 85.156 (86.289)	lr 0.00001
Train [119][1990/3239]	Time 0.260 (0.529)	Data Time 0.002 (0.022)	Loss 2.1391 (2.3480)	Entropy 0.53293 (0.53287)	Top-1 acc 73.438 (67.548)	Top-5 acc 89.844 (86.294)	lr 0.00001
Train [119][2000/3239]	Time 0.234 (0.528)	Data Time 0.001 (0.022)	Loss 2.1310 (2.3479)	Entropy 0.53297 (0.53287)	Top-1 acc 70.703 (67.551)	Top-5 acc 91.016 (86.296)	lr 0.00001
Train [119][2010/3239]	Time 0.240 (0.528)	Data Time 0.001 (0.022)	Loss 2.3483 (2.3484)	Entropy 0.53256 (0.53287)	Top-1 acc 65.625 (67.540)	Top-5 acc 86.719 (86.287)	lr 0.00001
Train [119][2020/3239]	Time 0.263 (0.527)	Data Time 0.002 (0.021)	Loss 2.5687 (2.3486)	Entropy 0.53262 (0.53287)	Top-1 acc 65.234 (67.537)	Top-5 acc 81.641 (86.283)	lr 0.00001
Train [119][2030/3239]	Time 0.240 (0.527)	Data Time 0.001 (0.021)	Loss 2.3493 (2.3488)	Entropy 0.53263 (0.53287)	Top-1 acc 66.406 (67.535)	Top-5 acc 87.500 (86.284)	lr 0.00001
Train [119][2040/3239]	Time 0.386 (0.526)	Data Time 0.001 (0.021)	Loss 2.4066 (2.3487)	Entropy 0.53235 (0.53287)	Top-1 acc 64.844 (67.533)	Top-5 acc 86.328 (86.285)	lr 0.00001
Train [119][2050/3239]	Time 0.232 (0.526)	Data Time 0.001 (0.021)	Loss 2.3639 (2.3488)	Entropy 0.53244 (0.53286)	Top-1 acc 67.969 (67.533)	Top-5 acc 82.812 (86.283)	lr 0.00001
Train [119][2060/3239]	Time 0.232 (0.525)	Data Time 0.001 (0.021)	Loss 2.4840 (2.3487)	Entropy 0.53240 (0.53286)	Top-1 acc 66.406 (67.538)	Top-5 acc 82.812 (86.285)	lr 0.00001
Train [119][2070/3239]	Time 0.234 (0.525)	Data Time 0.001 (0.021)	Loss 2.2132 (2.3485)	Entropy 0.53256 (0.53286)	Top-1 acc 69.141 (67.540)	Top-5 acc 88.672 (86.286)	lr 0.00001
Train [119][2080/3239]	Time 0.235 (0.524)	Data Time 0.001 (0.021)	Loss 2.3085 (2.3481)	Entropy 0.53283 (0.53286)	Top-1 acc 69.922 (67.552)	Top-5 acc 87.891 (86.293)	lr 0.00001
Train [119][2090/3239]	Time 0.227 (0.524)	Data Time 0.001 (0.021)	Loss 2.5146 (2.3479)	Entropy 0.53281 (0.53286)	Top-1 acc 59.766 (67.558)	Top-5 acc 84.375 (86.295)	lr 0.00001
Train [119][2100/3239]	Time 0.227 (0.523)	Data Time 0.002 (0.021)	Loss 2.3046 (2.3481)	Entropy 0.53262 (0.53286)	Top-1 acc 66.797 (67.551)	Top-5 acc 85.156 (86.290)	lr 0.00001
Train [119][2110/3239]	Time 0.320 (0.523)	Data Time 0.002 (0.021)	Loss 2.2422 (2.3480)	Entropy 0.53252 (0.53286)	Top-1 acc 69.531 (67.553)	Top-5 acc 87.891 (86.291)	lr 0.00001
Train [119][2120/3239]	Time 0.234 (0.523)	Data Time 0.001 (0.021)	Loss 2.3264 (2.3479)	Entropy 0.53237 (0.53285)	Top-1 acc 67.188 (67.553)	Top-5 acc 87.891 (86.297)	lr 0.00001
Train [119][2130/3239]	Time 0.233 (0.522)	Data Time 0.005 (0.020)	Loss 2.3676 (2.3477)	Entropy 0.53237 (0.53285)	Top-1 acc 65.625 (67.555)	Top-5 acc 85.938 (86.301)	lr 0.00001
Train [119][2140/3239]	Time 0.287 (0.547)	Data Time 0.004 (0.020)	Loss 2.3042 (2.3477)	Entropy 0.53235 (0.53285)	Top-1 acc 69.531 (67.554)	Top-5 acc 88.672 (86.302)	lr 0.00001
Train [119][2150/3239]	Time 0.245 (0.547)	Data Time 0.002 (0.020)	Loss 2.1234 (2.3475)	Entropy 0.53219 (0.53285)	Top-1 acc 73.047 (67.563)	Top-5 acc 89.062 (86.306)	lr 0.00001
Train [119][2160/3239]	Time 0.230 (0.546)	Data Time 0.001 (0.020)	Loss 2.3550 (2.3474)	Entropy 0.53256 (0.53285)	Top-1 acc 71.094 (67.563)	Top-5 acc 86.719 (86.307)	lr 0.00001
Train [119][2170/3239]	Time 0.250 (0.546)	Data Time 0.002 (0.020)	Loss 2.1929 (2.3472)	Entropy 0.53264 (0.53284)	Top-1 acc 66.797 (67.562)	Top-5 acc 88.281 (86.312)	lr 0.00001
Train [119][2180/3239]	Time 0.299 (0.545)	Data Time 0.002 (0.020)	Loss 2.3072 (2.3475)	Entropy 0.53264 (0.53284)	Top-1 acc 69.141 (67.557)	Top-5 acc 85.938 (86.307)	lr 0.00001
Train [119][2190/3239]	Time 0.253 (0.545)	Data Time 0.001 (0.020)	Loss 2.4041 (2.3475)	Entropy 0.53271 (0.53284)	Top-1 acc 65.625 (67.557)	Top-5 acc 85.156 (86.307)	lr 0.00001
Train [119][2200/3239]	Time 0.332 (0.544)	Data Time 0.002 (0.020)	Loss 2.1590 (2.3474)	Entropy 0.53237 (0.53284)	Top-1 acc 73.828 (67.565)	Top-5 acc 91.016 (86.307)	lr 0.00001
Train [119][2210/3239]	Time 0.250 (0.544)	Data Time 0.002 (0.020)	Loss 2.5042 (2.3476)	Entropy 0.53260 (0.53284)	Top-1 acc 64.844 (67.561)	Top-5 acc 82.812 (86.302)	lr 0.00001
Train [119][2220/3239]	Time 0.253 (0.543)	Data Time 0.001 (0.020)	Loss 2.3439 (2.3476)	Entropy 0.53279 (0.53284)	Top-1 acc 65.625 (67.563)	Top-5 acc 87.109 (86.303)	lr 0.00001
Train [119][2230/3239]	Time 0.226 (0.543)	Data Time 0.001 (0.020)	Loss 2.3927 (2.3477)	Entropy 0.53282 (0.53284)	Top-1 acc 65.625 (67.563)	Top-5 acc 86.328 (86.301)	lr 0.00001
Train [119][2240/3239]	Time 0.257 (0.542)	Data Time 0.001 (0.020)	Loss 2.4825 (2.3478)	Entropy 0.53286 (0.53284)	Top-1 acc 65.234 (67.559)	Top-5 acc 82.422 (86.298)	lr 0.00001
Train [119][2250/3239]	Time 0.277 (0.542)	Data Time 0.001 (0.019)	Loss 2.4152 (2.3473)	Entropy 0.53256 (0.53284)	Top-1 acc 67.578 (67.571)	Top-5 acc 84.766 (86.307)	lr 0.00001
Train [119][2260/3239]	Time 0.239 (0.541)	Data Time 0.001 (0.019)	Loss 2.2507 (2.3470)	Entropy 0.53210 (0.53284)	Top-1 acc 74.219 (67.577)	Top-5 acc 86.719 (86.311)	lr 0.00001
Train [119][2270/3239]	Time 0.338 (0.541)	Data Time 0.002 (0.019)	Loss 2.3285 (2.3470)	Entropy 0.53172 (0.53283)	Top-1 acc 69.141 (67.578)	Top-5 acc 85.156 (86.311)	lr 0.00001
Train [119][2280/3239]	Time 0.234 (0.541)	Data Time 0.001 (0.019)	Loss 2.4601 (2.3471)	Entropy 0.53202 (0.53283)	Top-1 acc 63.281 (67.573)	Top-5 acc 83.203 (86.309)	lr 0.00001
Train [119][2290/3239]	Time 0.244 (0.540)	Data Time 0.001 (0.019)	Loss 2.1718 (2.3469)	Entropy 0.53205 (0.53282)	Top-1 acc 70.312 (67.579)	Top-5 acc 91.406 (86.309)	lr 0.00001
Train [119][2300/3239]	Time 0.232 (0.539)	Data Time 0.002 (0.019)	Loss 2.3560 (2.3474)	Entropy 0.53168 (0.53282)	Top-1 acc 64.062 (67.568)	Top-5 acc 89.062 (86.299)	lr 0.00001
Train [119][2310/3239]	Time 0.231 (0.539)	Data Time 0.001 (0.019)	Loss 2.3768 (2.3475)	Entropy 0.53182 (0.53282)	Top-1 acc 68.750 (67.570)	Top-5 acc 83.984 (86.298)	lr 0.00001
Train [119][2320/3239]	Time 0.229 (0.538)	Data Time 0.001 (0.019)	Loss 2.3129 (2.3473)	Entropy 0.53195 (0.53281)	Top-1 acc 69.531 (67.576)	Top-5 acc 86.719 (86.300)	lr 0.00001
Train [119][2330/3239]	Time 0.225 (0.538)	Data Time 0.001 (0.019)	Loss 2.3954 (2.3474)	Entropy 0.53240 (0.53281)	Top-1 acc 64.844 (67.570)	Top-5 acc 84.766 (86.297)	lr 0.00001
Train [119][2340/3239]	Time 0.223 (0.537)	Data Time 0.001 (0.019)	Loss 2.2901 (2.3474)	Entropy 0.53225 (0.53281)	Top-1 acc 69.141 (67.570)	Top-5 acc 88.672 (86.299)	lr 0.00001
Train [119][2350/3239]	Time 0.230 (0.537)	Data Time 0.001 (0.019)	Loss 2.4094 (2.3474)	Entropy 0.53244 (0.53280)	Top-1 acc 63.281 (67.566)	Top-5 acc 85.938 (86.300)	lr 0.00001
Train [119][2360/3239]	Time 0.388 (0.536)	Data Time 0.001 (0.019)	Loss 2.2944 (2.3476)	Entropy 0.53269 (0.53280)	Top-1 acc 68.750 (67.561)	Top-5 acc 87.109 (86.297)	lr 0.00001
Train [119][2370/3239]	Time 0.242 (0.536)	Data Time 0.001 (0.019)	Loss 2.2647 (2.3473)	Entropy 0.53265 (0.53280)	Top-1 acc 68.750 (67.568)	Top-5 acc 89.062 (86.303)	lr 0.00001
Train [119][2380/3239]	Time 0.223 (0.535)	Data Time 0.001 (0.018)	Loss 2.3969 (2.3475)	Entropy 0.53266 (0.53280)	Top-1 acc 65.625 (67.560)	Top-5 acc 83.594 (86.297)	lr 0.00001
Train [119][2390/3239]	Time 0.233 (0.535)	Data Time 0.001 (0.018)	Loss 2.3741 (2.3474)	Entropy 0.53220 (0.53280)	Top-1 acc 66.016 (67.559)	Top-5 acc 86.328 (86.297)	lr 0.00001
Train [119][2400/3239]	Time 0.310 (0.535)	Data Time 0.002 (0.018)	Loss 2.1618 (2.3471)	Entropy 0.53208 (0.53280)	Top-1 acc 71.484 (67.570)	Top-5 acc 89.453 (86.305)	lr 0.00001
Train [119][2410/3239]	Time 0.226 (0.534)	Data Time 0.001 (0.018)	Loss 2.3329 (2.3471)	Entropy 0.53177 (0.53279)	Top-1 acc 68.359 (67.571)	Top-5 acc 87.109 (86.307)	lr 0.00001
Train [119][2420/3239]	Time 0.237 (0.534)	Data Time 0.001 (0.018)	Loss 2.2010 (2.3467)	Entropy 0.53199 (0.53279)	Top-1 acc 75.000 (67.584)	Top-5 acc 89.062 (86.317)	lr 0.00001
Train [119][2430/3239]	Time 0.328 (0.533)	Data Time 0.001 (0.018)	Loss 2.4782 (2.3465)	Entropy 0.53179 (0.53279)	Top-1 acc 63.281 (67.584)	Top-5 acc 84.375 (86.318)	lr 0.00001
Train [119][2440/3239]	Time 0.258 (0.533)	Data Time 0.001 (0.018)	Loss 2.5834 (2.3468)	Entropy 0.53199 (0.53278)	Top-1 acc 60.547 (67.580)	Top-5 acc 83.203 (86.310)	lr 0.00001
Train [119][2450/3239]	Time 0.224 (0.532)	Data Time 0.001 (0.018)	Loss 2.5948 (2.3471)	Entropy 0.53203 (0.53278)	Top-1 acc 62.109 (67.574)	Top-5 acc 83.203 (86.307)	lr 0.00001
Train [119][2460/3239]	Time 0.223 (0.532)	Data Time 0.001 (0.018)	Loss 2.3850 (2.3471)	Entropy 0.53227 (0.53278)	Top-1 acc 69.141 (67.572)	Top-5 acc 83.594 (86.307)	lr 0.00001
Train [119][2470/3239]	Time 0.304 (0.532)	Data Time 0.003 (0.018)	Loss 2.3663 (2.3473)	Entropy 0.53251 (0.53278)	Top-1 acc 69.141 (67.571)	Top-5 acc 86.328 (86.305)	lr 0.00001
Train [119][2480/3239]	Time 0.224 (0.531)	Data Time 0.001 (0.018)	Loss 2.3495 (2.3471)	Entropy 0.53290 (0.53277)	Top-1 acc 66.797 (67.579)	Top-5 acc 86.328 (86.308)	lr 0.00001
Train [119][2490/3239]	Time 0.242 (0.531)	Data Time 0.001 (0.018)	Loss 2.4366 (2.3469)	Entropy 0.53304 (0.53278)	Top-1 acc 66.016 (67.583)	Top-5 acc 83.594 (86.310)	lr 0.00001
Train [119][2500/3239]	Time 0.270 (0.531)	Data Time 0.003 (0.018)	Loss 2.4788 (2.3469)	Entropy 0.53316 (0.53278)	Top-1 acc 65.234 (67.584)	Top-5 acc 82.031 (86.310)	lr 0.00001
Train [119][2510/3239]	Time 0.225 (0.530)	Data Time 0.001 (0.018)	Loss 2.3138 (2.3468)	Entropy 0.53335 (0.53278)	Top-1 acc 69.922 (67.585)	Top-5 acc 88.672 (86.314)	lr 0.00001
Train [119][2520/3239]	Time 0.318 (0.530)	Data Time 0.001 (0.018)	Loss 2.4098 (2.3469)	Entropy 0.53343 (0.53278)	Top-1 acc 65.625 (67.579)	Top-5 acc 84.375 (86.310)	lr 0.00001
Train [119][2530/3239]	Time 0.244 (0.529)	Data Time 0.001 (0.017)	Loss 2.2422 (2.3467)	Entropy 0.53344 (0.53278)	Top-1 acc 69.531 (67.583)	Top-5 acc 87.109 (86.311)	lr 0.00001
Train [119][2540/3239]	Time 0.238 (0.529)	Data Time 0.001 (0.017)	Loss 2.3771 (2.3468)	Entropy 0.53339 (0.53279)	Top-1 acc 67.188 (67.581)	Top-5 acc 85.156 (86.307)	lr 0.00001
Train [119][2550/3239]	Time 0.231 (0.528)	Data Time 0.001 (0.017)	Loss 2.0698 (2.3467)	Entropy 0.53346 (0.53279)	Top-1 acc 76.172 (67.586)	Top-5 acc 89.062 (86.308)	lr 0.00001
Train [119][2560/3239]	Time 0.229 (0.528)	Data Time 0.001 (0.017)	Loss 2.5159 (2.3468)	Entropy 0.53362 (0.53279)	Top-1 acc 64.453 (67.583)	Top-5 acc 82.031 (86.308)	lr 0.00001
Train [119][2570/3239]	Time 0.287 (0.528)	Data Time 0.001 (0.017)	Loss 2.3101 (2.3468)	Entropy 0.53376 (0.53279)	Top-1 acc 68.750 (67.579)	Top-5 acc 86.328 (86.309)	lr 0.00001
Train [119][2580/3239]	Time 0.233 (0.527)	Data Time 0.001 (0.017)	Loss 2.3337 (2.3468)	Entropy 0.53384 (0.53280)	Top-1 acc 69.531 (67.580)	Top-5 acc 85.156 (86.308)	lr 0.00001
Train [119][2590/3239]	Time 0.328 (0.527)	Data Time 0.001 (0.017)	Loss 2.2042 (2.3469)	Entropy 0.53400 (0.53280)	Top-1 acc 74.219 (67.573)	Top-5 acc 89.062 (86.306)	lr 0.00001
Train [119][2600/3239]	Time 0.245 (0.526)	Data Time 0.001 (0.017)	Loss 2.4799 (2.3473)	Entropy 0.53432 (0.53281)	Top-1 acc 65.234 (67.564)	Top-5 acc 83.594 (86.298)	lr 0.00001
Train [119][2610/3239]	Time 0.231 (0.526)	Data Time 0.001 (0.017)	Loss 2.3590 (2.3472)	Entropy 0.53420 (0.53281)	Top-1 acc 66.797 (67.564)	Top-5 acc 87.500 (86.297)	lr 0.00001
Train [119][2620/3239]	Time 0.236 (0.525)	Data Time 0.001 (0.017)	Loss 2.4735 (2.3472)	Entropy 0.53412 (0.53282)	Top-1 acc 65.234 (67.565)	Top-5 acc 81.250 (86.293)	lr 0.00001
Train [119][2630/3239]	Time 0.215 (0.525)	Data Time 0.001 (0.017)	Loss 2.7357 (2.3474)	Entropy 0.53403 (0.53282)	Top-1 acc 58.594 (67.566)	Top-5 acc 79.297 (86.287)	lr 0.00001
Train [119][2640/3239]	Time 0.228 (0.524)	Data Time 0.001 (0.017)	Loss 2.2230 (2.3475)	Entropy 0.53402 (0.53283)	Top-1 acc 70.703 (67.560)	Top-5 acc 88.281 (86.284)	lr 0.00001
Train [119][2650/3239]	Time 0.227 (0.524)	Data Time 0.001 (0.017)	Loss 2.4352 (2.3474)	Entropy 0.53419 (0.53283)	Top-1 acc 65.234 (67.566)	Top-5 acc 84.766 (86.285)	lr 0.00001
Train [119][2660/3239]	Time 0.233 (0.524)	Data Time 0.001 (0.017)	Loss 2.3573 (2.3476)	Entropy 0.53436 (0.53284)	Top-1 acc 66.797 (67.561)	Top-5 acc 85.547 (86.283)	lr 0.00001
Train [119][2670/3239]	Time 0.226 (0.523)	Data Time 0.001 (0.017)	Loss 2.3700 (2.3473)	Entropy 0.53398 (0.53284)	Top-1 acc 66.406 (67.565)	Top-5 acc 86.328 (86.288)	lr 0.00001
Train [119][2680/3239]	Time 0.421 (0.523)	Data Time 0.002 (0.017)	Loss 2.4203 (2.3473)	Entropy 0.53375 (0.53285)	Top-1 acc 65.625 (67.561)	Top-5 acc 83.984 (86.289)	lr 0.00001
Train [119][2690/3239]	Time 0.226 (0.523)	Data Time 0.001 (0.017)	Loss 2.1388 (2.3475)	Entropy 0.53354 (0.53285)	Top-1 acc 71.484 (67.558)	Top-5 acc 89.844 (86.284)	lr 0.00001
Train [119][2700/3239]	Time 0.281 (0.522)	Data Time 0.002 (0.016)	Loss 2.4336 (2.3475)	Entropy 0.53311 (0.53285)	Top-1 acc 64.062 (67.557)	Top-5 acc 85.938 (86.285)	lr 0.00001
Train [119][2710/3239]	Time 0.230 (0.522)	Data Time 0.001 (0.016)	Loss 2.4691 (2.3476)	Entropy 0.53332 (0.53285)	Top-1 acc 63.672 (67.555)	Top-5 acc 84.375 (86.284)	lr 0.00001
Train [119][2720/3239]	Time 0.231 (0.522)	Data Time 0.001 (0.016)	Loss 2.0723 (2.3475)	Entropy 0.53307 (0.53286)	Top-1 acc 72.656 (67.561)	Top-5 acc 92.578 (86.286)	lr 0.00001
Train [119][2730/3239]	Time 0.256 (0.522)	Data Time 0.001 (0.016)	Loss 2.4213 (2.3475)	Entropy 0.53297 (0.53286)	Top-1 acc 64.062 (67.558)	Top-5 acc 84.766 (86.286)	lr 0.00001
Train [119][2740/3239]	Time 0.280 (0.521)	Data Time 0.002 (0.016)	Loss 2.4483 (2.3473)	Entropy 0.53264 (0.53286)	Top-1 acc 65.625 (67.562)	Top-5 acc 83.594 (86.290)	lr 0.00001
Train [119][2750/3239]	Time 0.371 (0.521)	Data Time 0.002 (0.016)	Loss 2.4333 (2.3473)	Entropy 0.53257 (0.53285)	Top-1 acc 67.578 (67.562)	Top-5 acc 83.984 (86.289)	lr 0.00001
Train [119][2760/3239]	Time 0.248 (0.521)	Data Time 0.001 (0.016)	Loss 2.2896 (2.3471)	Entropy 0.53240 (0.53285)	Top-1 acc 68.750 (67.566)	Top-5 acc 87.500 (86.292)	lr 0.00001
Train [119][2770/3239]	Time 0.260 (0.520)	Data Time 0.001 (0.016)	Loss 2.4559 (2.3469)	Entropy 0.53208 (0.53285)	Top-1 acc 66.797 (67.574)	Top-5 acc 83.594 (86.295)	lr 0.00001
Train [119][2780/3239]	Time 0.239 (0.520)	Data Time 0.001 (0.016)	Loss 2.6449 (2.3470)	Entropy 0.53191 (0.53285)	Top-1 acc 58.203 (67.571)	Top-5 acc 82.031 (86.292)	lr 0.00001
Train [119][2790/3239]	Time 0.387 (0.538)	Data Time 0.005 (0.016)	Loss 2.4248 (2.3468)	Entropy 0.53197 (0.53284)	Top-1 acc 65.234 (67.574)	Top-5 acc 83.984 (86.294)	lr 0.00001
Train [119][2800/3239]	Time 0.241 (0.538)	Data Time 0.002 (0.016)	Loss 2.1565 (2.3469)	Entropy 0.53161 (0.53284)	Top-1 acc 73.047 (67.572)	Top-5 acc 89.062 (86.289)	lr 0.00001
Train [119][2810/3239]	Time 0.245 (0.537)	Data Time 0.001 (0.016)	Loss 2.1023 (2.3467)	Entropy 0.53186 (0.53284)	Top-1 acc 74.219 (67.576)	Top-5 acc 91.797 (86.293)	lr 0.00001
Train [119][2820/3239]	Time 0.237 (0.537)	Data Time 0.001 (0.016)	Loss 2.4160 (2.3467)	Entropy 0.53136 (0.53283)	Top-1 acc 64.062 (67.575)	Top-5 acc 84.766 (86.295)	lr 0.00001
Train [119][2830/3239]	Time 0.239 (0.537)	Data Time 0.001 (0.016)	Loss 2.3737 (2.3466)	Entropy 0.53155 (0.53283)	Top-1 acc 68.750 (67.577)	Top-5 acc 83.984 (86.295)	lr 0.00001
Train [119][2840/3239]	Time 0.431 (0.537)	Data Time 0.002 (0.016)	Loss 2.3463 (2.3467)	Entropy 0.53177 (0.53282)	Top-1 acc 66.797 (67.575)	Top-5 acc 87.109 (86.293)	lr 0.00001
Train [119][2850/3239]	Time 0.254 (0.537)	Data Time 0.001 (0.016)	Loss 2.2636 (2.3468)	Entropy 0.53200 (0.53282)	Top-1 acc 70.703 (67.569)	Top-5 acc 88.281 (86.289)	lr 0.00001
Train [119][2860/3239]	Time 0.242 (0.536)	Data Time 0.001 (0.016)	Loss 2.2741 (2.3470)	Entropy 0.53209 (0.53282)	Top-1 acc 69.531 (67.567)	Top-5 acc 86.328 (86.287)	lr 0.00001
Train [119][2870/3239]	Time 0.278 (0.536)	Data Time 0.001 (0.016)	Loss 2.3124 (2.3469)	Entropy 0.53160 (0.53281)	Top-1 acc 68.359 (67.571)	Top-5 acc 87.109 (86.288)	lr 0.00001
Train [119][2880/3239]	Time 0.390 (0.536)	Data Time 0.001 (0.016)	Loss 2.5170 (2.3469)	Entropy 0.53160 (0.53281)	Top-1 acc 64.062 (67.574)	Top-5 acc 84.375 (86.288)	lr 0.00001
Train [119][2890/3239]	Time 0.243 (0.536)	Data Time 0.001 (0.016)	Loss 2.1403 (2.3468)	Entropy 0.53194 (0.53281)	Top-1 acc 71.875 (67.577)	Top-5 acc 90.234 (86.293)	lr 0.00001
Train [119][2900/3239]	Time 0.238 (0.535)	Data Time 0.001 (0.015)	Loss 2.4394 (2.3466)	Entropy 0.53210 (0.53280)	Top-1 acc 67.969 (67.582)	Top-5 acc 83.594 (86.294)	lr 0.00001
Train [119][2910/3239]	Time 0.381 (0.535)	Data Time 0.001 (0.015)	Loss 2.1758 (2.3464)	Entropy 0.53137 (0.53280)	Top-1 acc 70.703 (67.589)	Top-5 acc 89.062 (86.298)	lr 0.00001
Train [119][2920/3239]	Time 0.237 (0.535)	Data Time 0.002 (0.015)	Loss 2.3442 (2.3466)	Entropy 0.53092 (0.53279)	Top-1 acc 65.625 (67.585)	Top-5 acc 85.938 (86.292)	lr 0.00001
Train [119][2930/3239]	Time 0.245 (0.534)	Data Time 0.001 (0.015)	Loss 2.3899 (2.3469)	Entropy 0.53084 (0.53279)	Top-1 acc 69.531 (67.577)	Top-5 acc 85.547 (86.289)	lr 0.00001
Train [119][2940/3239]	Time 0.241 (0.534)	Data Time 0.001 (0.015)	Loss 2.4574 (2.3471)	Entropy 0.53085 (0.53278)	Top-1 acc 66.797 (67.575)	Top-5 acc 85.938 (86.286)	lr 0.00001
Train [119][2950/3239]	Time 0.236 (0.533)	Data Time 0.001 (0.015)	Loss 2.2298 (2.3471)	Entropy 0.53069 (0.53277)	Top-1 acc 69.922 (67.574)	Top-5 acc 88.281 (86.285)	lr 0.00001
Train [119][2960/3239]	Time 0.235 (0.533)	Data Time 0.001 (0.015)	Loss 2.2926 (2.3470)	Entropy 0.53023 (0.53277)	Top-1 acc 67.188 (67.580)	Top-5 acc 86.719 (86.289)	lr 0.00001
Train [119][2970/3239]	Time 0.249 (0.533)	Data Time 0.001 (0.015)	Loss 2.3898 (2.3470)	Entropy 0.53040 (0.53276)	Top-1 acc 67.969 (67.581)	Top-5 acc 87.500 (86.289)	lr 0.00001
Train [119][2980/3239]	Time 0.351 (0.532)	Data Time 0.002 (0.015)	Loss 2.3659 (2.3470)	Entropy 0.53052 (0.53275)	Top-1 acc 66.406 (67.581)	Top-5 acc 86.328 (86.287)	lr 0.00000
Train [119][2990/3239]	Time 0.245 (0.532)	Data Time 0.002 (0.015)	Loss 2.2026 (2.3468)	Entropy 0.53043 (0.53274)	Top-1 acc 71.484 (67.588)	Top-5 acc 88.281 (86.289)	lr 0.00000
Train [119][3000/3239]	Time 0.257 (0.532)	Data Time 0.002 (0.015)	Loss 2.3648 (2.3468)	Entropy 0.53029 (0.53274)	Top-1 acc 69.531 (67.590)	Top-5 acc 85.156 (86.288)	lr 0.00000
Train [119][3010/3239]	Time 0.238 (0.532)	Data Time 0.001 (0.015)	Loss 2.4458 (2.3469)	Entropy 0.53026 (0.53273)	Top-1 acc 62.500 (67.587)	Top-5 acc 85.938 (86.286)	lr 0.00000
Train [119][3020/3239]	Time 0.244 (0.531)	Data Time 0.001 (0.015)	Loss 2.2105 (2.3466)	Entropy 0.53022 (0.53272)	Top-1 acc 71.094 (67.594)	Top-5 acc 89.062 (86.293)	lr 0.00000
Train [119][3030/3239]	Time 0.277 (0.531)	Data Time 0.003 (0.015)	Loss 2.4159 (2.3467)	Entropy 0.53013 (0.53271)	Top-1 acc 67.188 (67.593)	Top-5 acc 86.328 (86.294)	lr 0.00000
Train [119][3040/3239]	Time 0.295 (0.531)	Data Time 0.001 (0.015)	Loss 2.6803 (2.3468)	Entropy 0.53023 (0.53270)	Top-1 acc 58.203 (67.591)	Top-5 acc 85.547 (86.294)	lr 0.00000
Train [119][3050/3239]	Time 0.243 (0.531)	Data Time 0.001 (0.015)	Loss 2.3158 (2.3469)	Entropy 0.53004 (0.53270)	Top-1 acc 67.578 (67.591)	Top-5 acc 89.062 (86.292)	lr 0.00000
Train [119][3060/3239]	Time 0.255 (0.530)	Data Time 0.001 (0.015)	Loss 2.4165 (2.3469)	Entropy 0.52996 (0.53269)	Top-1 acc 65.625 (67.591)	Top-5 acc 85.938 (86.293)	lr 0.00000
Train [119][3070/3239]	Time 0.378 (0.530)	Data Time 0.001 (0.015)	Loss 2.4590 (2.3467)	Entropy 0.53024 (0.53268)	Top-1 acc 63.672 (67.595)	Top-5 acc 86.328 (86.297)	lr 0.00000
Train [119][3080/3239]	Time 0.235 (0.530)	Data Time 0.001 (0.015)	Loss 2.3483 (2.3468)	Entropy 0.53006 (0.53267)	Top-1 acc 65.625 (67.594)	Top-5 acc 84.766 (86.297)	lr 0.00000
Train [119][3090/3239]	Time 0.238 (0.529)	Data Time 0.001 (0.015)	Loss 2.1611 (2.3472)	Entropy 0.53031 (0.53266)	Top-1 acc 73.438 (67.586)	Top-5 acc 87.500 (86.288)	lr 0.00000
Train [119][3100/3239]	Time 0.227 (0.529)	Data Time 0.001 (0.015)	Loss 2.6482 (2.3473)	Entropy 0.53036 (0.53265)	Top-1 acc 61.328 (67.578)	Top-5 acc 79.688 (86.287)	lr 0.00000
Train [119][3110/3239]	Time 0.232 (0.529)	Data Time 0.001 (0.015)	Loss 2.3190 (2.3474)	Entropy 0.53041 (0.53265)	Top-1 acc 71.875 (67.579)	Top-5 acc 86.719 (86.286)	lr 0.00000
Train [119][3120/3239]	Time 0.237 (0.528)	Data Time 0.001 (0.015)	Loss 2.6208 (2.3476)	Entropy 0.53055 (0.53264)	Top-1 acc 61.328 (67.576)	Top-5 acc 80.078 (86.278)	lr 0.00000
Train [119][3130/3239]	Time 0.231 (0.528)	Data Time 0.001 (0.015)	Loss 2.2397 (2.3476)	Entropy 0.53063 (0.53263)	Top-1 acc 73.047 (67.577)	Top-5 acc 89.062 (86.279)	lr 0.00000
Train [119][3140/3239]	Time 0.332 (0.527)	Data Time 0.001 (0.014)	Loss 2.4973 (2.3476)	Entropy 0.53067 (0.53263)	Top-1 acc 64.844 (67.577)	Top-5 acc 85.938 (86.279)	lr 0.00000
Train [119][3150/3239]	Time 0.242 (0.527)	Data Time 0.001 (0.014)	Loss 2.4953 (2.3475)	Entropy 0.53029 (0.53262)	Top-1 acc 62.500 (67.578)	Top-5 acc 83.203 (86.278)	lr 0.00000
Train [119][3160/3239]	Time 0.230 (0.527)	Data Time 0.001 (0.014)	Loss 2.2327 (2.3476)	Entropy 0.53033 (0.53261)	Top-1 acc 69.531 (67.578)	Top-5 acc 86.719 (86.277)	lr 0.00000
Train [119][3170/3239]	Time 0.237 (0.526)	Data Time 0.001 (0.014)	Loss 2.2515 (2.3473)	Entropy 0.53067 (0.53261)	Top-1 acc 68.750 (67.586)	Top-5 acc 85.547 (86.280)	lr 0.00000
Train [119][3180/3239]	Time 0.280 (0.526)	Data Time 0.000 (0.014)	Loss 2.3211 (2.3473)	Entropy 0.53090 (0.53260)	Top-1 acc 69.141 (67.587)	Top-5 acc 86.719 (86.282)	lr 0.00000
Train [119][3190/3239]	Time 0.222 (0.526)	Data Time 0.000 (0.014)	Loss 2.4495 (2.3473)	Entropy 0.53087 (0.53259)	Top-1 acc 61.719 (67.585)	Top-5 acc 84.375 (86.282)	lr 0.00000
Train [119][3200/3239]	Time 0.233 (0.526)	Data Time 0.000 (0.014)	Loss 2.0528 (2.3472)	Entropy 0.53090 (0.53259)	Top-1 acc 76.953 (67.584)	Top-5 acc 91.406 (86.283)	lr 0.00000
Train [119][3210/3239]	Time 0.233 (0.526)	Data Time 0.000 (0.014)	Loss 2.2954 (2.3470)	Entropy 0.53103 (0.53258)	Top-1 acc 65.234 (67.585)	Top-5 acc 86.328 (86.286)	lr 0.00000
Train [119][3220/3239]	Time 0.231 (0.525)	Data Time 0.000 (0.014)	Loss 2.3418 (2.3468)	Entropy 0.53086 (0.53258)	Top-1 acc 65.234 (67.591)	Top-5 acc 87.109 (86.290)	lr 0.00000
Train [119][3230/3239]	Time 0.240 (0.525)	Data Time 0.000 (0.014)	Loss 2.8835 (2.3471)	Entropy 0.53112 (0.53257)	Top-1 acc 56.641 (67.587)	Top-5 acc 74.609 (86.284)	lr 0.00000
Train [119][3239/3239]	Time 1.093 (0.524)	Data Time 0.000 (0.014)	Loss 2.2551 (2.3472)	Entropy 0.53135 (0.53257)	Top-1 acc 71.605 (67.582)	Top-5 acc 87.654 (86.281)	lr 0.00000
==========Valid [119/120]	loss 1.167	top-1 acc 73.142 (73.178)	top-5 acc 90.727	Train top-1 67.582	top-5 86.281	Entropy 0.53135	Latency-None: 0.000ms	Flops: 539.00M
Train [120][0/3239]	Time 37.609 (37.609)	Data Time 34.962 (34.962)	Loss 2.3940 (2.3940)	Entropy 0.53116 (0.53116)	Top-1 acc 68.750 (68.750)	Top-5 acc 86.328 (86.328)	lr 0.00000
Train [120][10/3239]	Time 0.305 (4.094)	Data Time 0.002 (3.219)	Loss 2.2005 (2.3337)	Entropy 0.53160 (0.53135)	Top-1 acc 73.438 (67.365)	Top-5 acc 87.109 (87.074)	lr 0.00000
Train [120][20/3239]	Time 0.229 (2.367)	Data Time 0.001 (1.687)	Loss 2.6170 (2.3470)	Entropy 0.53163 (0.53148)	Top-1 acc 64.062 (67.299)	Top-5 acc 82.422 (86.533)	lr 0.00000
Train [120][30/3239]	Time 0.232 (1.731)	Data Time 0.001 (1.144)	Loss 2.2996 (2.3648)	Entropy 0.53169 (0.53153)	Top-1 acc 70.312 (66.898)	Top-5 acc 88.281 (86.177)	lr 0.00000
Train [120][40/3239]	Time 0.335 (1.415)	Data Time 0.001 (0.865)	Loss 2.0680 (2.3693)	Entropy 0.53175 (0.53158)	Top-1 acc 75.781 (66.883)	Top-5 acc 92.969 (86.071)	lr 0.00000
Train [120][50/3239]	Time 0.256 (1.216)	Data Time 0.001 (0.696)	Loss 2.3523 (2.3607)	Entropy 0.53146 (0.53161)	Top-1 acc 71.094 (67.057)	Top-5 acc 83.984 (86.014)	lr 0.00000
Train [120][60/3239]	Time 0.233 (1.084)	Data Time 0.001 (0.582)	Loss 2.2062 (2.3483)	Entropy 0.53192 (0.53161)	Top-1 acc 72.266 (67.392)	Top-5 acc 89.062 (86.142)	lr 0.00000
Train [120][70/3239]	Time 0.235 (0.992)	Data Time 0.001 (0.500)	Loss 2.1883 (2.3424)	Entropy 0.53158 (0.53162)	Top-1 acc 69.922 (67.529)	Top-5 acc 89.062 (86.251)	lr 0.00000
Train [120][80/3239]	Time 0.241 (0.922)	Data Time 0.001 (0.439)	Loss 2.4683 (2.3574)	Entropy 0.53183 (0.53162)	Top-1 acc 67.188 (67.081)	Top-5 acc 85.547 (86.029)	lr 0.00000
Train [120][90/3239]	Time 0.228 (0.867)	Data Time 0.001 (0.391)	Loss 2.1727 (2.3561)	Entropy 0.53208 (0.53165)	Top-1 acc 73.828 (67.239)	Top-5 acc 88.281 (86.019)	lr 0.00000
Train [120][100/3239]	Time 0.324 (0.835)	Data Time 0.002 (0.352)	Loss 2.3287 (2.3524)	Entropy 0.53176 (0.53169)	Top-1 acc 68.359 (67.327)	Top-5 acc 85.156 (86.108)	lr 0.00000
Train [120][110/3239]	Time 0.265 (0.798)	Data Time 0.001 (0.321)	Loss 2.3184 (2.3571)	Entropy 0.53144 (0.53169)	Top-1 acc 67.578 (67.237)	Top-5 acc 85.938 (86.036)	lr 0.00000
Train [120][120/3239]	Time 0.236 (0.767)	Data Time 0.001 (0.294)	Loss 2.2317 (2.3512)	Entropy 0.53157 (0.53168)	Top-1 acc 68.359 (67.330)	Top-5 acc 90.625 (86.157)	lr 0.00000
Train [120][130/3239]	Time 0.346 (0.741)	Data Time 0.001 (0.272)	Loss 2.1508 (2.3527)	Entropy 0.53130 (0.53166)	Top-1 acc 73.828 (67.337)	Top-5 acc 88.672 (86.137)	lr 0.00000
Train [120][140/3239]	Time 0.248 (0.717)	Data Time 0.001 (0.253)	Loss 2.3882 (2.3530)	Entropy 0.53117 (0.53163)	Top-1 acc 66.406 (67.365)	Top-5 acc 84.375 (86.129)	lr 0.00000
Train [120][150/3239]	Time 0.329 (0.698)	Data Time 0.002 (0.236)	Loss 2.3704 (2.3581)	Entropy 0.53111 (0.53159)	Top-1 acc 66.016 (67.237)	Top-5 acc 86.328 (86.041)	lr 0.00000
Train [120][160/3239]	Time 0.253 (0.685)	Data Time 0.001 (0.221)	Loss 2.2718 (2.3601)	Entropy 0.53126 (0.53157)	Top-1 acc 70.312 (67.200)	Top-5 acc 87.891 (85.979)	lr 0.00000
Train [120][170/3239]	Time 0.227 (0.670)	Data Time 0.001 (0.209)	Loss 2.3280 (2.3559)	Entropy 0.53105 (0.53154)	Top-1 acc 66.016 (67.318)	Top-5 acc 85.156 (86.022)	lr 0.00000
Train [120][180/3239]	Time 0.241 (0.656)	Data Time 0.001 (0.197)	Loss 2.2400 (2.3525)	Entropy 0.53086 (0.53152)	Top-1 acc 67.969 (67.403)	Top-5 acc 88.281 (86.095)	lr 0.00000
Train [120][190/3239]	Time 0.224 (0.643)	Data Time 0.001 (0.187)	Loss 2.2172 (2.3545)	Entropy 0.53075 (0.53148)	Top-1 acc 72.266 (67.343)	Top-5 acc 86.719 (86.089)	lr 0.00000
Train [120][200/3239]	Time 0.402 (0.632)	Data Time 0.002 (0.178)	Loss 2.3023 (2.3518)	Entropy 0.53076 (0.53144)	Top-1 acc 69.922 (67.407)	Top-5 acc 87.109 (86.130)	lr 0.00000
Train [120][210/3239]	Time 0.399 (0.863)	Data Time 0.004 (0.170)	Loss 2.1375 (2.3521)	Entropy 0.53076 (0.53141)	Top-1 acc 70.703 (67.387)	Top-5 acc 89.453 (86.152)	lr 0.00000
Train [120][220/3239]	Time 0.346 (0.851)	Data Time 0.002 (0.162)	Loss 2.1654 (2.3500)	Entropy 0.53055 (0.53137)	Top-1 acc 69.141 (67.428)	Top-5 acc 86.328 (86.160)	lr 0.00000
Train [120][230/3239]	Time 0.271 (0.833)	Data Time 0.002 (0.155)	Loss 2.5127 (2.3517)	Entropy 0.53049 (0.53134)	Top-1 acc 65.625 (67.387)	Top-5 acc 81.250 (86.095)	lr 0.00000
Train [120][240/3239]	Time 0.262 (0.817)	Data Time 0.001 (0.149)	Loss 2.5647 (2.3519)	Entropy 0.53041 (0.53130)	Top-1 acc 60.938 (67.358)	Top-5 acc 80.859 (86.066)	lr 0.00000
Train [120][250/3239]	Time 0.315 (0.802)	Data Time 0.002 (0.143)	Loss 2.4406 (2.3504)	Entropy 0.53081 (0.53127)	Top-1 acc 61.719 (67.393)	Top-5 acc 82.031 (86.106)	lr 0.00000
Train [120][260/3239]	Time 0.314 (0.793)	Data Time 0.003 (0.138)	Loss 2.2683 (2.3502)	Entropy 0.53093 (0.53126)	Top-1 acc 68.359 (67.390)	Top-5 acc 87.109 (86.104)	lr 0.00000
Train [120][270/3239]	Time 0.282 (0.780)	Data Time 0.003 (0.133)	Loss 2.2878 (2.3490)	Entropy 0.53089 (0.53124)	Top-1 acc 71.094 (67.437)	Top-5 acc 87.500 (86.122)	lr 0.00000
Train [120][280/3239]	Time 0.238 (0.768)	Data Time 0.001 (0.128)	Loss 2.3181 (2.3480)	Entropy 0.53109 (0.53123)	Top-1 acc 67.188 (67.486)	Top-5 acc 86.328 (86.121)	lr 0.00000
Train [120][290/3239]	Time 0.353 (0.756)	Data Time 0.001 (0.124)	Loss 2.1353 (2.3477)	Entropy 0.53126 (0.53123)	Top-1 acc 71.094 (67.496)	Top-5 acc 92.969 (86.152)	lr 0.00000
Train [120][300/3239]	Time 0.231 (0.745)	Data Time 0.001 (0.120)	Loss 2.4278 (2.3483)	Entropy 0.53125 (0.53123)	Top-1 acc 67.188 (67.498)	Top-5 acc 84.375 (86.145)	lr 0.00000
Train [120][310/3239]	Time 0.238 (0.734)	Data Time 0.002 (0.116)	Loss 2.4764 (2.3495)	Entropy 0.53127 (0.53123)	Top-1 acc 62.891 (67.424)	Top-5 acc 84.766 (86.143)	lr 0.00000
Train [120][320/3239]	Time 0.243 (0.725)	Data Time 0.001 (0.112)	Loss 2.4873 (2.3513)	Entropy 0.53155 (0.53123)	Top-1 acc 67.188 (67.377)	Top-5 acc 83.984 (86.115)	lr 0.00000
Train [120][330/3239]	Time 0.271 (0.716)	Data Time 0.001 (0.109)	Loss 2.5151 (2.3533)	Entropy 0.53141 (0.53124)	Top-1 acc 66.797 (67.341)	Top-5 acc 83.594 (86.090)	lr 0.00000
Train [120][340/3239]	Time 0.251 (0.707)	Data Time 0.002 (0.106)	Loss 2.2445 (2.3523)	Entropy 0.53126 (0.53125)	Top-1 acc 74.609 (67.370)	Top-5 acc 87.109 (86.109)	lr 0.00000
Train [120][350/3239]	Time 0.245 (0.699)	Data Time 0.002 (0.103)	Loss 2.2035 (2.3528)	Entropy 0.53108 (0.53125)	Top-1 acc 73.047 (67.337)	Top-5 acc 89.062 (86.099)	lr 0.00000
Train [120][360/3239]	Time 0.345 (0.692)	Data Time 0.001 (0.100)	Loss 2.3613 (2.3528)	Entropy 0.53134 (0.53125)	Top-1 acc 66.016 (67.345)	Top-5 acc 86.719 (86.106)	lr 0.00000
Train [120][370/3239]	Time 0.241 (0.684)	Data Time 0.001 (0.097)	Loss 2.3817 (2.3516)	Entropy 0.53130 (0.53125)	Top-1 acc 65.625 (67.370)	Top-5 acc 86.719 (86.129)	lr 0.00000
Train [120][380/3239]	Time 0.234 (0.677)	Data Time 0.001 (0.095)	Loss 2.2787 (2.3507)	Entropy 0.53076 (0.53124)	Top-1 acc 63.281 (67.381)	Top-5 acc 88.672 (86.155)	lr 0.00000
Train [120][390/3239]	Time 0.238 (0.672)	Data Time 0.001 (0.092)	Loss 2.3848 (2.3504)	Entropy 0.53091 (0.53123)	Top-1 acc 68.359 (67.406)	Top-5 acc 85.547 (86.152)	lr 0.00000
Train [120][400/3239]	Time 0.232 (0.665)	Data Time 0.001 (0.090)	Loss 2.4791 (2.3513)	Entropy 0.53068 (0.53122)	Top-1 acc 62.500 (67.403)	Top-5 acc 85.938 (86.136)	lr 0.00000
Train [120][410/3239]	Time 0.240 (0.660)	Data Time 0.001 (0.088)	Loss 2.4117 (2.3511)	Entropy 0.53043 (0.53121)	Top-1 acc 66.406 (67.407)	Top-5 acc 84.766 (86.142)	lr 0.00000
Train [120][420/3239]	Time 0.236 (0.654)	Data Time 0.001 (0.086)	Loss 2.4579 (2.3528)	Entropy 0.53059 (0.53119)	Top-1 acc 65.625 (67.361)	Top-5 acc 84.766 (86.135)	lr 0.00000
Train [120][430/3239]	Time 0.253 (0.649)	Data Time 0.001 (0.084)	Loss 2.3525 (2.3532)	Entropy 0.53059 (0.53118)	Top-1 acc 62.109 (67.327)	Top-5 acc 87.500 (86.134)	lr 0.00000
Train [120][440/3239]	Time 0.234 (0.644)	Data Time 0.001 (0.082)	Loss 2.2763 (2.3520)	Entropy 0.53025 (0.53116)	Top-1 acc 67.188 (67.350)	Top-5 acc 88.281 (86.145)	lr 0.00000
Train [120][450/3239]	Time 0.236 (0.639)	Data Time 0.001 (0.080)	Loss 2.4917 (2.3503)	Entropy 0.52985 (0.53114)	Top-1 acc 61.719 (67.375)	Top-5 acc 83.984 (86.182)	lr 0.00000
Train [120][460/3239]	Time 0.293 (0.635)	Data Time 0.002 (0.079)	Loss 2.3205 (2.3487)	Entropy 0.52992 (0.53111)	Top-1 acc 68.359 (67.415)	Top-5 acc 88.281 (86.221)	lr 0.00000
Train [120][470/3239]	Time 0.236 (0.632)	Data Time 0.001 (0.077)	Loss 2.5099 (2.3495)	Entropy 0.53015 (0.53108)	Top-1 acc 62.109 (67.386)	Top-5 acc 83.594 (86.203)	lr 0.00000
Train [120][480/3239]	Time 0.244 (0.628)	Data Time 0.002 (0.075)	Loss 2.4914 (2.3494)	Entropy 0.53054 (0.53107)	Top-1 acc 62.109 (67.378)	Top-5 acc 84.766 (86.220)	lr 0.00000
Train [120][490/3239]	Time 0.243 (0.624)	Data Time 0.002 (0.074)	Loss 2.2033 (2.3505)	Entropy 0.53041 (0.53106)	Top-1 acc 72.656 (67.361)	Top-5 acc 87.109 (86.199)	lr 0.00000
Train [120][500/3239]	Time 0.281 (0.622)	Data Time 0.001 (0.073)	Loss 2.2733 (2.3498)	Entropy 0.53065 (0.53105)	Top-1 acc 70.703 (67.381)	Top-5 acc 90.625 (86.213)	lr 0.00000
Train [120][510/3239]	Time 0.235 (0.620)	Data Time 0.001 (0.071)	Loss 2.3425 (2.3493)	Entropy 0.53022 (0.53103)	Top-1 acc 69.531 (67.385)	Top-5 acc 87.500 (86.226)	lr 0.00000
Train [120][520/3239]	Time 0.367 (0.616)	Data Time 0.002 (0.070)	Loss 2.4185 (2.3492)	Entropy 0.53031 (0.53102)	Top-1 acc 64.844 (67.376)	Top-5 acc 88.281 (86.242)	lr 0.00000
Train [120][530/3239]	Time 0.240 (0.612)	Data Time 0.001 (0.069)	Loss 2.4950 (2.3495)	Entropy 0.53048 (0.53101)	Top-1 acc 63.672 (67.390)	Top-5 acc 83.984 (86.235)	lr 0.00000
Train [120][540/3239]	Time 0.276 (0.609)	Data Time 0.001 (0.067)	Loss 2.4220 (2.3489)	Entropy 0.53061 (0.53100)	Top-1 acc 65.625 (67.390)	Top-5 acc 85.938 (86.242)	lr 0.00000
Train [120][550/3239]	Time 0.242 (0.605)	Data Time 0.001 (0.066)	Loss 2.1600 (2.3489)	Entropy 0.53077 (0.53099)	Top-1 acc 69.922 (67.384)	Top-5 acc 89.453 (86.237)	lr 0.00000
Train [120][560/3239]	Time 0.238 (0.602)	Data Time 0.001 (0.065)	Loss 2.3866 (2.3488)	Entropy 0.53046 (0.53099)	Top-1 acc 64.844 (67.386)	Top-5 acc 85.547 (86.238)	lr 0.00000
Train [120][570/3239]	Time 0.258 (0.599)	Data Time 0.001 (0.064)	Loss 2.1460 (2.3486)	Entropy 0.52982 (0.53097)	Top-1 acc 72.656 (67.384)	Top-5 acc 89.062 (86.249)	lr 0.00000
Train [120][580/3239]	Time 0.229 (0.595)	Data Time 0.001 (0.063)	Loss 2.7183 (2.3496)	Entropy 0.53031 (0.53095)	Top-1 acc 62.109 (67.382)	Top-5 acc 78.125 (86.221)	lr 0.00000
Train [120][590/3239]	Time 0.377 (0.592)	Data Time 0.002 (0.062)	Loss 2.3622 (2.3511)	Entropy 0.53023 (0.53094)	Top-1 acc 65.625 (67.346)	Top-5 acc 84.375 (86.195)	lr 0.00000
Train [120][600/3239]	Time 0.270 (0.589)	Data Time 0.001 (0.061)	Loss 2.3151 (2.3509)	Entropy 0.53038 (0.53093)	Top-1 acc 70.312 (67.364)	Top-5 acc 86.719 (86.202)	lr 0.00000
Train [120][610/3239]	Time 0.220 (0.586)	Data Time 0.001 (0.060)	Loss 2.6769 (2.3516)	Entropy 0.53073 (0.53093)	Top-1 acc 61.719 (67.365)	Top-5 acc 80.859 (86.181)	lr 0.00000
Train [120][620/3239]	Time 0.249 (0.584)	Data Time 0.001 (0.059)	Loss 2.3084 (2.3516)	Entropy 0.53076 (0.53092)	Top-1 acc 64.844 (67.354)	Top-5 acc 89.844 (86.192)	lr 0.00000
Train [120][630/3239]	Time 0.251 (0.581)	Data Time 0.001 (0.058)	Loss 2.2602 (2.3519)	Entropy 0.53091 (0.53092)	Top-1 acc 70.312 (67.347)	Top-5 acc 88.281 (86.183)	lr 0.00000
Train [120][640/3239]	Time 0.224 (0.579)	Data Time 0.001 (0.057)	Loss 2.5676 (2.3519)	Entropy 0.53098 (0.53092)	Top-1 acc 63.672 (67.354)	Top-5 acc 83.984 (86.187)	lr 0.00000
Train [120][650/3239]	Time 0.226 (0.576)	Data Time 0.001 (0.056)	Loss 2.2934 (2.3513)	Entropy 0.53091 (0.53092)	Top-1 acc 66.016 (67.360)	Top-5 acc 87.109 (86.200)	lr 0.00000
Train [120][660/3239]	Time 0.268 (0.575)	Data Time 0.002 (0.055)	Loss 2.4876 (2.3525)	Entropy 0.53106 (0.53092)	Top-1 acc 62.109 (67.338)	Top-5 acc 85.547 (86.186)	lr 0.00000
Train [120][670/3239]	Time 0.227 (0.573)	Data Time 0.001 (0.055)	Loss 2.3729 (2.3521)	Entropy 0.53138 (0.53093)	Top-1 acc 68.359 (67.357)	Top-5 acc 85.938 (86.195)	lr 0.00000
Train [120][680/3239]	Time 0.240 (0.571)	Data Time 0.001 (0.054)	Loss 2.3499 (2.3522)	Entropy 0.53133 (0.53093)	Top-1 acc 68.750 (67.362)	Top-5 acc 86.719 (86.198)	lr 0.00000
Train [120][690/3239]	Time 0.255 (0.568)	Data Time 0.001 (0.053)	Loss 2.1768 (2.3515)	Entropy 0.53123 (0.53094)	Top-1 acc 69.141 (67.364)	Top-5 acc 91.406 (86.214)	lr 0.00000
Train [120][700/3239]	Time 0.238 (0.566)	Data Time 0.001 (0.052)	Loss 2.6036 (2.3520)	Entropy 0.53157 (0.53094)	Top-1 acc 59.766 (67.350)	Top-5 acc 82.812 (86.210)	lr 0.00000
Train [120][710/3239]	Time 0.253 (0.564)	Data Time 0.001 (0.052)	Loss 2.3944 (2.3513)	Entropy 0.53195 (0.53096)	Top-1 acc 63.672 (67.371)	Top-5 acc 85.938 (86.214)	lr 0.00000
Train [120][720/3239]	Time 0.235 (0.562)	Data Time 0.001 (0.051)	Loss 2.1495 (2.3508)	Entropy 0.53201 (0.53097)	Top-1 acc 69.531 (67.381)	Top-5 acc 89.062 (86.230)	lr 0.00000
Train [120][730/3239]	Time 0.234 (0.560)	Data Time 0.001 (0.050)	Loss 2.1886 (2.3504)	Entropy 0.53205 (0.53098)	Top-1 acc 70.703 (67.388)	Top-5 acc 89.062 (86.232)	lr 0.00000
Train [120][740/3239]	Time 0.222 (0.558)	Data Time 0.001 (0.050)	Loss 2.4201 (2.3501)	Entropy 0.53193 (0.53100)	Top-1 acc 67.578 (67.399)	Top-5 acc 84.375 (86.233)	lr 0.00000
Train [120][750/3239]	Time 0.337 (0.556)	Data Time 0.001 (0.049)	Loss 2.4591 (2.3495)	Entropy 0.53188 (0.53101)	Top-1 acc 66.016 (67.413)	Top-5 acc 85.547 (86.239)	lr 0.00000
Train [120][760/3239]	Time 0.229 (0.554)	Data Time 0.001 (0.048)	Loss 2.1452 (2.3495)	Entropy 0.53187 (0.53102)	Top-1 acc 71.094 (67.396)	Top-5 acc 89.844 (86.239)	lr 0.00000
Train [120][770/3239]	Time 0.229 (0.552)	Data Time 0.001 (0.048)	Loss 2.3163 (2.3497)	Entropy 0.53197 (0.53103)	Top-1 acc 70.703 (67.400)	Top-5 acc 87.109 (86.237)	lr 0.00000
Train [120][780/3239]	Time 0.231 (0.550)	Data Time 0.001 (0.047)	Loss 2.3479 (2.3498)	Entropy 0.53212 (0.53105)	Top-1 acc 68.359 (67.404)	Top-5 acc 83.984 (86.232)	lr 0.00000
Train [120][790/3239]	Time 0.235 (0.548)	Data Time 0.001 (0.047)	Loss 2.2029 (2.3491)	Entropy 0.53212 (0.53106)	Top-1 acc 74.609 (67.422)	Top-5 acc 86.328 (86.232)	lr 0.00000
Train [120][800/3239]	Time 0.230 (0.546)	Data Time 0.001 (0.046)	Loss 2.4317 (2.3501)	Entropy 0.53220 (0.53107)	Top-1 acc 66.797 (67.395)	Top-5 acc 82.422 (86.218)	lr 0.00000
Train [120][810/3239]	Time 0.230 (0.544)	Data Time 0.001 (0.045)	Loss 2.3244 (2.3497)	Entropy 0.53224 (0.53109)	Top-1 acc 66.406 (67.405)	Top-5 acc 85.156 (86.225)	lr 0.00000
Train [120][820/3239]	Time 0.442 (0.544)	Data Time 0.002 (0.045)	Loss 2.3006 (2.3499)	Entropy 0.53210 (0.53110)	Top-1 acc 69.922 (67.409)	Top-5 acc 85.938 (86.222)	lr 0.00000
Train [120][830/3239]	Time 0.250 (0.542)	Data Time 0.001 (0.044)	Loss 2.2896 (2.3494)	Entropy 0.53181 (0.53111)	Top-1 acc 69.141 (67.415)	Top-5 acc 85.938 (86.229)	lr 0.00000
Train [120][840/3239]	Time 0.234 (0.541)	Data Time 0.001 (0.044)	Loss 2.3119 (2.3491)	Entropy 0.53179 (0.53112)	Top-1 acc 70.312 (67.419)	Top-5 acc 86.719 (86.232)	lr 0.00000
Train [120][850/3239]	Time 0.227 (0.539)	Data Time 0.001 (0.043)	Loss 2.3433 (2.3494)	Entropy 0.53181 (0.53113)	Top-1 acc 71.094 (67.412)	Top-5 acc 86.719 (86.233)	lr 0.00000
Train [120][860/3239]	Time 0.358 (0.597)	Data Time 0.010 (0.043)	Loss 2.2925 (2.3496)	Entropy 0.53214 (0.53114)	Top-1 acc 67.188 (67.403)	Top-5 acc 87.500 (86.232)	lr 0.00000
Train [120][870/3239]	Time 0.271 (0.596)	Data Time 0.002 (0.042)	Loss 2.1276 (2.3498)	Entropy 0.53184 (0.53115)	Top-1 acc 72.656 (67.402)	Top-5 acc 90.234 (86.221)	lr 0.00000
Train [120][880/3239]	Time 0.231 (0.594)	Data Time 0.001 (0.042)	Loss 2.4015 (2.3492)	Entropy 0.53187 (0.53115)	Top-1 acc 65.234 (67.414)	Top-5 acc 86.719 (86.233)	lr 0.00000
Train [120][890/3239]	Time 0.237 (0.592)	Data Time 0.001 (0.042)	Loss 2.1160 (2.3491)	Entropy 0.53208 (0.53116)	Top-1 acc 70.703 (67.413)	Top-5 acc 91.016 (86.231)	lr 0.00000
Train [120][900/3239]	Time 0.228 (0.591)	Data Time 0.001 (0.041)	Loss 2.3115 (2.3495)	Entropy 0.53218 (0.53117)	Top-1 acc 67.969 (67.402)	Top-5 acc 87.109 (86.230)	lr 0.00000
Train [120][910/3239]	Time 0.339 (0.589)	Data Time 0.001 (0.041)	Loss 2.3597 (2.3491)	Entropy 0.53227 (0.53118)	Top-1 acc 64.844 (67.411)	Top-5 acc 86.719 (86.238)	lr 0.00000
Train [120][920/3239]	Time 0.234 (0.587)	Data Time 0.001 (0.040)	Loss 2.5280 (2.3492)	Entropy 0.53205 (0.53119)	Top-1 acc 60.156 (67.408)	Top-5 acc 83.984 (86.234)	lr 0.00000
Train [120][930/3239]	Time 0.259 (0.585)	Data Time 0.001 (0.040)	Loss 2.2079 (2.3486)	Entropy 0.53215 (0.53120)	Top-1 acc 71.484 (67.430)	Top-5 acc 89.062 (86.247)	lr 0.00000
Train [120][940/3239]	Time 0.242 (0.583)	Data Time 0.001 (0.039)	Loss 2.3129 (2.3486)	Entropy 0.53241 (0.53122)	Top-1 acc 70.703 (67.429)	Top-5 acc 86.719 (86.249)	lr 0.00000
Train [120][950/3239]	Time 0.234 (0.582)	Data Time 0.001 (0.039)	Loss 2.3579 (2.3485)	Entropy 0.53256 (0.53123)	Top-1 acc 69.922 (67.440)	Top-5 acc 86.328 (86.245)	lr 0.00000
Train [120][960/3239]	Time 0.295 (0.581)	Data Time 0.002 (0.039)	Loss 2.0882 (2.3483)	Entropy 0.53256 (0.53124)	Top-1 acc 75.000 (67.447)	Top-5 acc 89.844 (86.251)	lr 0.00000
Train [120][970/3239]	Time 0.251 (0.580)	Data Time 0.001 (0.038)	Loss 2.1881 (2.3482)	Entropy 0.53251 (0.53126)	Top-1 acc 72.656 (67.447)	Top-5 acc 88.281 (86.250)	lr 0.00000
Train [120][980/3239]	Time 0.362 (0.578)	Data Time 0.001 (0.038)	Loss 2.1342 (2.3478)	Entropy 0.53225 (0.53127)	Top-1 acc 76.172 (67.461)	Top-5 acc 89.453 (86.257)	lr 0.00000
Train [120][990/3239]	Time 0.235 (0.577)	Data Time 0.001 (0.038)	Loss 2.3613 (2.3479)	Entropy 0.53221 (0.53128)	Top-1 acc 67.969 (67.459)	Top-5 acc 84.766 (86.254)	lr 0.00000
Train [120][1000/3239]	Time 0.226 (0.575)	Data Time 0.001 (0.037)	Loss 2.3893 (2.3482)	Entropy 0.53256 (0.53129)	Top-1 acc 65.234 (67.447)	Top-5 acc 86.328 (86.249)	lr 0.00000
Train [120][1010/3239]	Time 0.317 (0.575)	Data Time 0.002 (0.037)	Loss 2.3320 (2.3479)	Entropy 0.53254 (0.53131)	Top-1 acc 69.922 (67.452)	Top-5 acc 86.328 (86.252)	lr 0.00000
Train [120][1020/3239]	Time 0.240 (0.574)	Data Time 0.001 (0.037)	Loss 2.2978 (2.3480)	Entropy 0.53264 (0.53132)	Top-1 acc 68.359 (67.450)	Top-5 acc 86.328 (86.246)	lr 0.00000
Train [120][1030/3239]	Time 0.232 (0.573)	Data Time 0.001 (0.036)	Loss 2.1651 (2.3481)	Entropy 0.53250 (0.53133)	Top-1 acc 71.484 (67.447)	Top-5 acc 89.062 (86.247)	lr 0.00000
Train [120][1040/3239]	Time 0.237 (0.572)	Data Time 0.001 (0.036)	Loss 2.3275 (2.3483)	Entropy 0.53290 (0.53134)	Top-1 acc 67.188 (67.444)	Top-5 acc 83.594 (86.245)	lr 0.00000
Train [120][1050/3239]	Time 0.234 (0.570)	Data Time 0.001 (0.036)	Loss 2.1389 (2.3489)	Entropy 0.53312 (0.53136)	Top-1 acc 73.438 (67.430)	Top-5 acc 87.500 (86.240)	lr 0.00000
Train [120][1060/3239]	Time 0.229 (0.569)	Data Time 0.001 (0.035)	Loss 2.1294 (2.3490)	Entropy 0.53307 (0.53137)	Top-1 acc 73.047 (67.439)	Top-5 acc 91.797 (86.242)	lr 0.00000
Train [120][1070/3239]	Time 0.339 (0.568)	Data Time 0.001 (0.035)	Loss 2.3796 (2.3490)	Entropy 0.53312 (0.53139)	Top-1 acc 68.750 (67.448)	Top-5 acc 84.766 (86.245)	lr 0.00000
Train [120][1080/3239]	Time 0.221 (0.567)	Data Time 0.001 (0.035)	Loss 2.4430 (2.3493)	Entropy 0.53280 (0.53140)	Top-1 acc 66.016 (67.448)	Top-5 acc 83.594 (86.244)	lr 0.00000
Train [120][1090/3239]	Time 0.234 (0.565)	Data Time 0.001 (0.034)	Loss 2.2924 (2.3491)	Entropy 0.53301 (0.53142)	Top-1 acc 70.312 (67.457)	Top-5 acc 85.547 (86.246)	lr 0.00000
Train [120][1100/3239]	Time 0.223 (0.564)	Data Time 0.001 (0.034)	Loss 2.1790 (2.3484)	Entropy 0.53280 (0.53143)	Top-1 acc 72.656 (67.480)	Top-5 acc 90.234 (86.253)	lr 0.00000
Train [120][1110/3239]	Time 0.229 (0.563)	Data Time 0.001 (0.034)	Loss 2.3990 (2.3488)	Entropy 0.53271 (0.53145)	Top-1 acc 67.188 (67.474)	Top-5 acc 86.328 (86.250)	lr 0.00000
Train [120][1120/3239]	Time 0.273 (0.561)	Data Time 0.001 (0.033)	Loss 2.4327 (2.3489)	Entropy 0.53258 (0.53146)	Top-1 acc 65.234 (67.472)	Top-5 acc 84.375 (86.248)	lr 0.00000
Train [120][1130/3239]	Time 0.228 (0.560)	Data Time 0.001 (0.033)	Loss 2.1931 (2.3491)	Entropy 0.53252 (0.53146)	Top-1 acc 69.922 (67.474)	Top-5 acc 89.844 (86.247)	lr 0.00000
Train [120][1140/3239]	Time 0.328 (0.559)	Data Time 0.001 (0.033)	Loss 2.1650 (2.3494)	Entropy 0.53257 (0.53147)	Top-1 acc 74.219 (67.470)	Top-5 acc 89.062 (86.243)	lr 0.00000
Train [120][1150/3239]	Time 0.220 (0.557)	Data Time 0.001 (0.033)	Loss 2.4798 (2.3498)	Entropy 0.53234 (0.53148)	Top-1 acc 60.938 (67.464)	Top-5 acc 84.375 (86.240)	lr 0.00000
Train [120][1160/3239]	Time 0.230 (0.556)	Data Time 0.001 (0.032)	Loss 2.3827 (2.3496)	Entropy 0.53232 (0.53149)	Top-1 acc 64.062 (67.464)	Top-5 acc 86.328 (86.244)	lr 0.00000
Train [120][1170/3239]	Time 0.229 (0.555)	Data Time 0.001 (0.032)	Loss 2.3301 (2.3496)	Entropy 0.53226 (0.53150)	Top-1 acc 66.406 (67.468)	Top-5 acc 85.547 (86.243)	lr 0.00000
Train [120][1180/3239]	Time 0.237 (0.554)	Data Time 0.001 (0.032)	Loss 2.3776 (2.3497)	Entropy 0.53194 (0.53150)	Top-1 acc 64.453 (67.460)	Top-5 acc 86.719 (86.243)	lr 0.00000
Train [120][1190/3239]	Time 0.229 (0.553)	Data Time 0.001 (0.032)	Loss 2.3887 (2.3502)	Entropy 0.53245 (0.53151)	Top-1 acc 67.969 (67.452)	Top-5 acc 87.500 (86.241)	lr 0.00000
Train [120][1200/3239]	Time 0.222 (0.551)	Data Time 0.001 (0.031)	Loss 2.1270 (2.3507)	Entropy 0.53234 (0.53152)	Top-1 acc 73.828 (67.440)	Top-5 acc 90.234 (86.232)	lr 0.00000
Train [120][1210/3239]	Time 0.253 (0.550)	Data Time 0.003 (0.031)	Loss 2.0291 (2.3508)	Entropy 0.53249 (0.53152)	Top-1 acc 77.344 (67.445)	Top-5 acc 91.406 (86.237)	lr 0.00000
Train [120][1220/3239]	Time 0.232 (0.549)	Data Time 0.001 (0.031)	Loss 2.4258 (2.3507)	Entropy 0.53256 (0.53153)	Top-1 acc 64.453 (67.453)	Top-5 acc 84.766 (86.237)	lr 0.00000
Train [120][1230/3239]	Time 0.257 (0.548)	Data Time 0.002 (0.031)	Loss 2.4679 (2.3505)	Entropy 0.53300 (0.53154)	Top-1 acc 68.750 (67.469)	Top-5 acc 84.766 (86.234)	lr 0.00000
Train [120][1240/3239]	Time 0.253 (0.547)	Data Time 0.002 (0.030)	Loss 2.1675 (2.3502)	Entropy 0.53277 (0.53155)	Top-1 acc 72.656 (67.479)	Top-5 acc 88.672 (86.239)	lr 0.00000
Train [120][1250/3239]	Time 0.249 (0.546)	Data Time 0.001 (0.030)	Loss 2.3426 (2.3502)	Entropy 0.53266 (0.53156)	Top-1 acc 66.406 (67.478)	Top-5 acc 86.328 (86.236)	lr 0.00000
Train [120][1260/3239]	Time 0.335 (0.545)	Data Time 0.002 (0.030)	Loss 2.2848 (2.3497)	Entropy 0.53302 (0.53157)	Top-1 acc 69.141 (67.489)	Top-5 acc 87.109 (86.247)	lr 0.00000
Train [120][1270/3239]	Time 0.248 (0.545)	Data Time 0.001 (0.030)	Loss 2.4410 (2.3498)	Entropy 0.53307 (0.53158)	Top-1 acc 64.844 (67.487)	Top-5 acc 83.594 (86.244)	lr 0.00000
Train [120][1280/3239]	Time 0.239 (0.544)	Data Time 0.001 (0.029)	Loss 2.1245 (2.3495)	Entropy 0.53287 (0.53159)	Top-1 acc 71.875 (67.492)	Top-5 acc 88.672 (86.248)	lr 0.00000
Train [120][1290/3239]	Time 0.241 (0.543)	Data Time 0.001 (0.029)	Loss 2.4231 (2.3497)	Entropy 0.53293 (0.53160)	Top-1 acc 64.453 (67.486)	Top-5 acc 85.938 (86.245)	lr 0.00000
Train [120][1300/3239]	Time 0.321 (0.542)	Data Time 0.001 (0.029)	Loss 2.1896 (2.3494)	Entropy 0.53287 (0.53161)	Top-1 acc 72.656 (67.499)	Top-5 acc 88.672 (86.248)	lr 0.00000
Train [120][1310/3239]	Time 0.302 (0.541)	Data Time 0.002 (0.029)	Loss 2.0903 (2.3491)	Entropy 0.53289 (0.53162)	Top-1 acc 74.609 (67.509)	Top-5 acc 90.625 (86.255)	lr 0.00000
Train [120][1320/3239]	Time 0.225 (0.540)	Data Time 0.001 (0.029)	Loss 2.3185 (2.3488)	Entropy 0.53322 (0.53163)	Top-1 acc 70.312 (67.511)	Top-5 acc 85.547 (86.256)	lr 0.00000
Train [120][1330/3239]	Time 0.228 (0.539)	Data Time 0.001 (0.028)	Loss 2.3367 (2.3484)	Entropy 0.53334 (0.53165)	Top-1 acc 67.578 (67.521)	Top-5 acc 88.281 (86.260)	lr 0.00000
Train [120][1340/3239]	Time 0.230 (0.538)	Data Time 0.001 (0.028)	Loss 2.1605 (2.3486)	Entropy 0.53320 (0.53166)	Top-1 acc 71.484 (67.520)	Top-5 acc 89.062 (86.258)	lr 0.00000
Train [120][1350/3239]	Time 0.231 (0.537)	Data Time 0.001 (0.028)	Loss 2.3465 (2.3483)	Entropy 0.53325 (0.53167)	Top-1 acc 67.578 (67.523)	Top-5 acc 85.938 (86.263)	lr 0.00000
Train [120][1360/3239]	Time 0.297 (0.537)	Data Time 0.003 (0.028)	Loss 2.4266 (2.3484)	Entropy 0.53321 (0.53168)	Top-1 acc 62.891 (67.515)	Top-5 acc 86.719 (86.270)	lr 0.00000
Train [120][1370/3239]	Time 0.446 (0.537)	Data Time 0.001 (0.028)	Loss 2.2421 (2.3480)	Entropy 0.53352 (0.53169)	Top-1 acc 70.312 (67.515)	Top-5 acc 89.062 (86.283)	lr 0.00000
Train [120][1380/3239]	Time 0.226 (0.536)	Data Time 0.001 (0.027)	Loss 2.1890 (2.3478)	Entropy 0.53304 (0.53171)	Top-1 acc 69.141 (67.516)	Top-5 acc 86.719 (86.289)	lr 0.00000
Train [120][1390/3239]	Time 0.224 (0.535)	Data Time 0.001 (0.027)	Loss 2.4237 (2.3483)	Entropy 0.53308 (0.53171)	Top-1 acc 66.406 (67.504)	Top-5 acc 83.203 (86.282)	lr 0.00000
Train [120][1400/3239]	Time 0.231 (0.535)	Data Time 0.001 (0.027)	Loss 2.4481 (2.3479)	Entropy 0.53316 (0.53173)	Top-1 acc 62.500 (67.515)	Top-5 acc 83.594 (86.290)	lr 0.00000
Train [120][1410/3239]	Time 0.229 (0.534)	Data Time 0.001 (0.027)	Loss 2.5183 (2.3483)	Entropy 0.53303 (0.53174)	Top-1 acc 64.062 (67.501)	Top-5 acc 81.250 (86.289)	lr 0.00000
Train [120][1420/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.027)	Loss 2.4620 (2.3484)	Entropy 0.53315 (0.53174)	Top-1 acc 66.797 (67.503)	Top-5 acc 84.766 (86.286)	lr 0.00000
Train [120][1430/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.027)	Loss 2.3314 (2.3482)	Entropy 0.53318 (0.53175)	Top-1 acc 68.359 (67.511)	Top-5 acc 85.156 (86.286)	lr 0.00000
Train [120][1440/3239]	Time 0.290 (0.532)	Data Time 0.001 (0.026)	Loss 2.4537 (2.3479)	Entropy 0.53289 (0.53176)	Top-1 acc 64.062 (67.522)	Top-5 acc 81.641 (86.283)	lr 0.00000
Train [120][1450/3239]	Time 0.314 (0.532)	Data Time 0.002 (0.026)	Loss 2.2903 (2.3475)	Entropy 0.53292 (0.53177)	Top-1 acc 69.531 (67.530)	Top-5 acc 86.719 (86.288)	lr 0.00000
Train [120][1460/3239]	Time 0.360 (0.531)	Data Time 0.001 (0.026)	Loss 2.4121 (2.3472)	Entropy 0.53235 (0.53178)	Top-1 acc 64.062 (67.535)	Top-5 acc 84.375 (86.292)	lr 0.00000
Train [120][1470/3239]	Time 0.276 (0.530)	Data Time 0.002 (0.026)	Loss 2.2923 (2.3473)	Entropy 0.53186 (0.53178)	Top-1 acc 71.875 (67.532)	Top-5 acc 87.891 (86.289)	lr 0.00000
Train [120][1480/3239]	Time 0.240 (0.530)	Data Time 0.001 (0.026)	Loss 2.3386 (2.3471)	Entropy 0.53188 (0.53178)	Top-1 acc 68.750 (67.537)	Top-5 acc 86.328 (86.291)	lr 0.00000
Train [120][1490/3239]	Time 0.250 (0.529)	Data Time 0.001 (0.026)	Loss 2.3249 (2.3473)	Entropy 0.53190 (0.53178)	Top-1 acc 65.234 (67.527)	Top-5 acc 88.672 (86.291)	lr 0.00000
Train [120][1500/3239]	Time 0.240 (0.528)	Data Time 0.001 (0.025)	Loss 2.3335 (2.3467)	Entropy 0.53171 (0.53178)	Top-1 acc 66.016 (67.539)	Top-5 acc 87.500 (86.304)	lr 0.00000
Train [120][1510/3239]	Time 0.276 (0.528)	Data Time 0.003 (0.025)	Loss 2.3395 (2.3464)	Entropy 0.53145 (0.53178)	Top-1 acc 62.891 (67.545)	Top-5 acc 88.281 (86.313)	lr 0.00000
Train [120][1520/3239]	Time 0.421 (0.561)	Data Time 0.028 (0.025)	Loss 2.3090 (2.3466)	Entropy 0.53140 (0.53178)	Top-1 acc 73.438 (67.542)	Top-5 acc 87.109 (86.307)	lr 0.00000
Train [120][1530/3239]	Time 0.490 (0.561)	Data Time 0.002 (0.025)	Loss 2.4905 (2.3466)	Entropy 0.53177 (0.53177)	Top-1 acc 66.797 (67.540)	Top-5 acc 83.594 (86.307)	lr 0.00000
Train [120][1540/3239]	Time 0.263 (0.561)	Data Time 0.002 (0.025)	Loss 2.2360 (2.3471)	Entropy 0.53147 (0.53177)	Top-1 acc 69.141 (67.526)	Top-5 acc 89.062 (86.302)	lr 0.00000
Train [120][1550/3239]	Time 0.240 (0.560)	Data Time 0.001 (0.025)	Loss 2.1283 (2.3467)	Entropy 0.53186 (0.53177)	Top-1 acc 74.219 (67.537)	Top-5 acc 90.234 (86.308)	lr 0.00000
Train [120][1560/3239]	Time 0.243 (0.559)	Data Time 0.001 (0.025)	Loss 2.2980 (2.3466)	Entropy 0.53221 (0.53177)	Top-1 acc 68.359 (67.541)	Top-5 acc 87.500 (86.305)	lr 0.00000
Train [120][1570/3239]	Time 0.290 (0.559)	Data Time 0.002 (0.024)	Loss 2.1985 (2.3463)	Entropy 0.53233 (0.53178)	Top-1 acc 74.219 (67.547)	Top-5 acc 87.500 (86.304)	lr 0.00000
Train [120][1580/3239]	Time 0.254 (0.558)	Data Time 0.002 (0.024)	Loss 2.4323 (2.3465)	Entropy 0.53252 (0.53178)	Top-1 acc 63.672 (67.541)	Top-5 acc 84.375 (86.300)	lr 0.00000
Train [120][1590/3239]	Time 0.227 (0.557)	Data Time 0.001 (0.024)	Loss 2.3636 (2.3462)	Entropy 0.53255 (0.53178)	Top-1 acc 67.578 (67.547)	Top-5 acc 87.500 (86.304)	lr 0.00000
Train [120][1600/3239]	Time 0.241 (0.556)	Data Time 0.001 (0.024)	Loss 2.3645 (2.3460)	Entropy 0.53250 (0.53179)	Top-1 acc 64.453 (67.555)	Top-5 acc 83.594 (86.306)	lr 0.00000
Train [120][1610/3239]	Time 0.239 (0.556)	Data Time 0.001 (0.024)	Loss 2.3652 (2.3464)	Entropy 0.53230 (0.53179)	Top-1 acc 64.062 (67.542)	Top-5 acc 84.766 (86.299)	lr 0.00000
Train [120][1620/3239]	Time 0.338 (0.555)	Data Time 0.001 (0.024)	Loss 2.2763 (2.3464)	Entropy 0.53258 (0.53180)	Top-1 acc 67.969 (67.541)	Top-5 acc 87.891 (86.301)	lr 0.00000
Train [120][1630/3239]	Time 0.229 (0.554)	Data Time 0.001 (0.024)	Loss 2.2399 (2.3463)	Entropy 0.53220 (0.53180)	Top-1 acc 71.094 (67.547)	Top-5 acc 85.547 (86.302)	lr 0.00000
Train [120][1640/3239]	Time 0.226 (0.553)	Data Time 0.001 (0.023)	Loss 2.4867 (2.3461)	Entropy 0.53258 (0.53181)	Top-1 acc 66.406 (67.556)	Top-5 acc 84.766 (86.305)	lr 0.00000
Train [120][1650/3239]	Time 0.246 (0.552)	Data Time 0.001 (0.023)	Loss 2.3438 (2.3459)	Entropy 0.53235 (0.53181)	Top-1 acc 69.531 (67.563)	Top-5 acc 86.328 (86.311)	lr 0.00000
Train [120][1660/3239]	Time 0.241 (0.551)	Data Time 0.001 (0.023)	Loss 2.0974 (2.3462)	Entropy 0.53216 (0.53181)	Top-1 acc 77.344 (67.555)	Top-5 acc 89.844 (86.308)	lr 0.00000
Train [120][1670/3239]	Time 0.226 (0.551)	Data Time 0.001 (0.023)	Loss 2.1901 (2.3461)	Entropy 0.53203 (0.53181)	Top-1 acc 73.047 (67.559)	Top-5 acc 88.672 (86.305)	lr 0.00000
Train [120][1680/3239]	Time 0.238 (0.550)	Data Time 0.001 (0.023)	Loss 2.5189 (2.3463)	Entropy 0.53175 (0.53181)	Top-1 acc 65.234 (67.555)	Top-5 acc 85.156 (86.304)	lr 0.00000
Train [120][1690/3239]	Time 0.328 (0.549)	Data Time 0.001 (0.023)	Loss 2.2410 (2.3460)	Entropy 0.53146 (0.53181)	Top-1 acc 70.703 (67.559)	Top-5 acc 88.281 (86.305)	lr 0.00000
Train [120][1700/3239]	Time 0.232 (0.548)	Data Time 0.001 (0.023)	Loss 2.2536 (2.3455)	Entropy 0.53120 (0.53181)	Top-1 acc 69.531 (67.580)	Top-5 acc 87.891 (86.313)	lr 0.00000
Train [120][1710/3239]	Time 0.231 (0.548)	Data Time 0.001 (0.022)	Loss 2.4121 (2.3459)	Entropy 0.53136 (0.53181)	Top-1 acc 66.016 (67.574)	Top-5 acc 84.766 (86.307)	lr 0.00000
Train [120][1720/3239]	Time 0.293 (0.547)	Data Time 0.001 (0.022)	Loss 2.1869 (2.3458)	Entropy 0.53118 (0.53180)	Top-1 acc 71.094 (67.576)	Top-5 acc 88.281 (86.306)	lr 0.00000
Train [120][1730/3239]	Time 0.254 (0.547)	Data Time 0.001 (0.022)	Loss 2.3897 (2.3459)	Entropy 0.53090 (0.53180)	Top-1 acc 68.750 (67.577)	Top-5 acc 87.500 (86.303)	lr 0.00000
Train [120][1740/3239]	Time 0.271 (0.546)	Data Time 0.002 (0.022)	Loss 2.1645 (2.3457)	Entropy 0.53123 (0.53179)	Top-1 acc 69.922 (67.588)	Top-5 acc 88.281 (86.303)	lr 0.00000
Train [120][1750/3239]	Time 0.231 (0.545)	Data Time 0.001 (0.022)	Loss 2.7759 (2.3459)	Entropy 0.53130 (0.53179)	Top-1 acc 59.766 (67.583)	Top-5 acc 81.641 (86.300)	lr 0.00000
Train [120][1760/3239]	Time 0.237 (0.545)	Data Time 0.001 (0.022)	Loss 2.2207 (2.3461)	Entropy 0.53152 (0.53179)	Top-1 acc 74.219 (67.586)	Top-5 acc 88.672 (86.298)	lr 0.00000
Train [120][1770/3239]	Time 0.224 (0.544)	Data Time 0.001 (0.022)	Loss 2.4484 (2.3463)	Entropy 0.53136 (0.53179)	Top-1 acc 63.281 (67.577)	Top-5 acc 85.938 (86.294)	lr 0.00000
Train [120][1780/3239]	Time 0.327 (0.543)	Data Time 0.001 (0.022)	Loss 2.1879 (2.3461)	Entropy 0.53115 (0.53178)	Top-1 acc 69.922 (67.586)	Top-5 acc 87.109 (86.296)	lr 0.00000
Train [120][1790/3239]	Time 0.219 (0.542)	Data Time 0.001 (0.022)	Loss 2.4234 (2.3458)	Entropy 0.53128 (0.53178)	Top-1 acc 66.016 (67.593)	Top-5 acc 84.375 (86.300)	lr 0.00000
Train [120][1800/3239]	Time 0.231 (0.542)	Data Time 0.001 (0.021)	Loss 2.2510 (2.3464)	Entropy 0.53093 (0.53178)	Top-1 acc 73.438 (67.580)	Top-5 acc 87.109 (86.291)	lr 0.00000
Train [120][1810/3239]	Time 0.258 (0.541)	Data Time 0.001 (0.021)	Loss 2.2423 (2.3461)	Entropy 0.53077 (0.53177)	Top-1 acc 68.750 (67.592)	Top-5 acc 88.281 (86.295)	lr 0.00000
Train [120][1820/3239]	Time 0.227 (0.540)	Data Time 0.001 (0.021)	Loss 2.0909 (2.3459)	Entropy 0.53064 (0.53177)	Top-1 acc 73.047 (67.599)	Top-5 acc 90.234 (86.303)	lr 0.00000
Train [120][1830/3239]	Time 0.230 (0.540)	Data Time 0.001 (0.021)	Loss 2.4148 (2.3459)	Entropy 0.53057 (0.53176)	Top-1 acc 65.625 (67.595)	Top-5 acc 83.594 (86.303)	lr 0.00000
Train [120][1840/3239]	Time 0.216 (0.539)	Data Time 0.001 (0.021)	Loss 2.3873 (2.3457)	Entropy 0.53075 (0.53176)	Top-1 acc 66.406 (67.602)	Top-5 acc 84.375 (86.306)	lr 0.00000
Train [120][1850/3239]	Time 0.324 (0.538)	Data Time 0.001 (0.021)	Loss 2.1957 (2.3455)	Entropy 0.53069 (0.53175)	Top-1 acc 71.484 (67.611)	Top-5 acc 88.672 (86.313)	lr 0.00000
Train [120][1860/3239]	Time 0.220 (0.537)	Data Time 0.001 (0.021)	Loss 2.2629 (2.3451)	Entropy 0.53058 (0.53174)	Top-1 acc 69.141 (67.616)	Top-5 acc 90.234 (86.324)	lr 0.00000
Train [120][1870/3239]	Time 0.224 (0.537)	Data Time 0.001 (0.021)	Loss 2.5707 (2.3451)	Entropy 0.53071 (0.53174)	Top-1 acc 65.234 (67.614)	Top-5 acc 82.031 (86.325)	lr 0.00000
Train [120][1880/3239]	Time 0.276 (0.536)	Data Time 0.001 (0.021)	Loss 2.3154 (2.3454)	Entropy 0.53079 (0.53173)	Top-1 acc 70.703 (67.606)	Top-5 acc 85.938 (86.323)	lr 0.00000
Train [120][1890/3239]	Time 0.252 (0.536)	Data Time 0.001 (0.021)	Loss 2.2001 (2.3453)	Entropy 0.53104 (0.53173)	Top-1 acc 71.094 (67.607)	Top-5 acc 89.844 (86.327)	lr 0.00000
Train [120][1900/3239]	Time 0.229 (0.535)	Data Time 0.001 (0.020)	Loss 2.2826 (2.3452)	Entropy 0.53112 (0.53172)	Top-1 acc 71.484 (67.609)	Top-5 acc 86.328 (86.329)	lr 0.00000
Train [120][1910/3239]	Time 0.239 (0.535)	Data Time 0.001 (0.020)	Loss 2.2218 (2.3450)	Entropy 0.53128 (0.53172)	Top-1 acc 70.312 (67.618)	Top-5 acc 89.453 (86.332)	lr 0.00000
Train [120][1920/3239]	Time 0.459 (0.534)	Data Time 0.001 (0.020)	Loss 2.8242 (2.3449)	Entropy 0.53097 (0.53172)	Top-1 acc 58.594 (67.618)	Top-5 acc 77.734 (86.334)	lr 0.00000
Train [120][1930/3239]	Time 0.261 (0.534)	Data Time 0.001 (0.020)	Loss 2.3476 (2.3446)	Entropy 0.53092 (0.53171)	Top-1 acc 66.797 (67.626)	Top-5 acc 86.328 (86.339)	lr 0.00000
Train [120][1940/3239]	Time 0.238 (0.534)	Data Time 0.001 (0.020)	Loss 2.4677 (2.3449)	Entropy 0.53071 (0.53171)	Top-1 acc 68.750 (67.621)	Top-5 acc 83.594 (86.332)	lr 0.00000
Train [120][1950/3239]	Time 0.233 (0.533)	Data Time 0.001 (0.020)	Loss 2.4027 (2.3450)	Entropy 0.53064 (0.53171)	Top-1 acc 68.359 (67.621)	Top-5 acc 85.156 (86.332)	lr 0.00000
Train [120][1960/3239]	Time 0.274 (0.532)	Data Time 0.001 (0.020)	Loss 2.3537 (2.3448)	Entropy 0.53064 (0.53170)	Top-1 acc 67.578 (67.626)	Top-5 acc 84.766 (86.332)	lr 0.00000
Train [120][1970/3239]	Time 0.248 (0.532)	Data Time 0.001 (0.020)	Loss 2.3844 (2.3454)	Entropy 0.53080 (0.53170)	Top-1 acc 66.797 (67.615)	Top-5 acc 86.719 (86.325)	lr 0.00000
Train [120][1980/3239]	Time 0.286 (0.532)	Data Time 0.002 (0.020)	Loss 2.2742 (2.3455)	Entropy 0.53039 (0.53169)	Top-1 acc 66.797 (67.612)	Top-5 acc 87.109 (86.321)	lr 0.00000
Train [120][1990/3239]	Time 0.227 (0.531)	Data Time 0.001 (0.020)	Loss 2.3451 (2.3454)	Entropy 0.53040 (0.53168)	Top-1 acc 68.750 (67.610)	Top-5 acc 85.156 (86.321)	lr 0.00000
Train [120][2000/3239]	Time 0.215 (0.531)	Data Time 0.001 (0.020)	Loss 2.3622 (2.3454)	Entropy 0.53060 (0.53168)	Top-1 acc 66.797 (67.614)	Top-5 acc 85.547 (86.321)	lr 0.00000
Train [120][2010/3239]	Time 0.322 (0.530)	Data Time 0.001 (0.019)	Loss 2.6133 (2.3457)	Entropy 0.53061 (0.53167)	Top-1 acc 60.547 (67.608)	Top-5 acc 81.250 (86.316)	lr 0.00000
Train [120][2020/3239]	Time 0.226 (0.529)	Data Time 0.001 (0.019)	Loss 2.7924 (2.3460)	Entropy 0.53080 (0.53167)	Top-1 acc 59.375 (67.601)	Top-5 acc 80.078 (86.312)	lr 0.00000
Train [120][2030/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.019)	Loss 2.1855 (2.3463)	Entropy 0.53049 (0.53166)	Top-1 acc 71.484 (67.600)	Top-5 acc 89.844 (86.308)	lr 0.00000
Train [120][2040/3239]	Time 0.252 (0.528)	Data Time 0.001 (0.019)	Loss 2.3747 (2.3464)	Entropy 0.53073 (0.53166)	Top-1 acc 66.406 (67.601)	Top-5 acc 89.062 (86.306)	lr 0.00000
Train [120][2050/3239]	Time 0.253 (0.528)	Data Time 0.001 (0.019)	Loss 2.2088 (2.3460)	Entropy 0.53110 (0.53165)	Top-1 acc 69.141 (67.609)	Top-5 acc 89.844 (86.312)	lr 0.00000
Train [120][2060/3239]	Time 0.228 (0.527)	Data Time 0.001 (0.019)	Loss 2.3489 (2.3460)	Entropy 0.53100 (0.53165)	Top-1 acc 67.578 (67.611)	Top-5 acc 85.938 (86.312)	lr 0.00000
Train [120][2070/3239]	Time 0.225 (0.526)	Data Time 0.001 (0.019)	Loss 2.4425 (2.3463)	Entropy 0.53118 (0.53165)	Top-1 acc 66.406 (67.605)	Top-5 acc 84.766 (86.308)	lr 0.00000
Train [120][2080/3239]	Time 0.359 (0.526)	Data Time 0.001 (0.019)	Loss 2.2137 (2.3465)	Entropy 0.53124 (0.53164)	Top-1 acc 71.484 (67.600)	Top-5 acc 88.672 (86.304)	lr 0.00000
Train [120][2090/3239]	Time 0.226 (0.525)	Data Time 0.001 (0.019)	Loss 2.2047 (2.3463)	Entropy 0.53098 (0.53164)	Top-1 acc 71.484 (67.604)	Top-5 acc 91.406 (86.306)	lr 0.00000
Train [120][2100/3239]	Time 0.263 (0.525)	Data Time 0.001 (0.019)	Loss 2.3516 (2.3463)	Entropy 0.53043 (0.53164)	Top-1 acc 68.750 (67.607)	Top-5 acc 84.375 (86.302)	lr 0.00000
Train [120][2110/3239]	Time 0.233 (0.524)	Data Time 0.001 (0.019)	Loss 2.3134 (2.3462)	Entropy 0.53024 (0.53163)	Top-1 acc 69.531 (67.610)	Top-5 acc 90.234 (86.306)	lr 0.00000
Train [120][2120/3239]	Time 0.228 (0.523)	Data Time 0.001 (0.019)	Loss 2.1675 (2.3466)	Entropy 0.53027 (0.53162)	Top-1 acc 73.047 (67.598)	Top-5 acc 88.672 (86.301)	lr 0.00000
Train [120][2130/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.018)	Loss 2.2576 (2.3467)	Entropy 0.52970 (0.53162)	Top-1 acc 68.359 (67.592)	Top-5 acc 88.281 (86.302)	lr 0.00000
Train [120][2140/3239]	Time 0.226 (0.522)	Data Time 0.001 (0.018)	Loss 2.3951 (2.3468)	Entropy 0.52947 (0.53161)	Top-1 acc 64.062 (67.590)	Top-5 acc 85.938 (86.299)	lr 0.00000
Train [120][2150/3239]	Time 0.223 (0.522)	Data Time 0.001 (0.018)	Loss 2.5771 (2.3469)	Entropy 0.52958 (0.53160)	Top-1 acc 63.672 (67.589)	Top-5 acc 83.984 (86.300)	lr 0.00000
Train [120][2160/3239]	Time 0.234 (0.521)	Data Time 0.001 (0.018)	Loss 2.1241 (2.3469)	Entropy 0.52942 (0.53159)	Top-1 acc 73.438 (67.586)	Top-5 acc 89.062 (86.298)	lr 0.00000
Train [120][2170/3239]	Time 0.451 (0.545)	Data Time 0.004 (0.018)	Loss 2.3286 (2.3469)	Entropy 0.52911 (0.53158)	Top-1 acc 66.406 (67.589)	Top-5 acc 85.156 (86.295)	lr 0.00000
Train [120][2180/3239]	Time 0.249 (0.545)	Data Time 0.002 (0.018)	Loss 2.2342 (2.3471)	Entropy 0.52876 (0.53157)	Top-1 acc 68.750 (67.584)	Top-5 acc 87.891 (86.292)	lr 0.00000
Train [120][2190/3239]	Time 0.236 (0.544)	Data Time 0.002 (0.018)	Loss 2.5583 (2.3475)	Entropy 0.52887 (0.53155)	Top-1 acc 63.672 (67.577)	Top-5 acc 81.250 (86.283)	lr 0.00000
Train [120][2200/3239]	Time 0.239 (0.544)	Data Time 0.001 (0.018)	Loss 2.4001 (2.3477)	Entropy 0.52891 (0.53154)	Top-1 acc 65.625 (67.570)	Top-5 acc 85.547 (86.280)	lr 0.00000
Train [120][2210/3239]	Time 0.239 (0.543)	Data Time 0.001 (0.018)	Loss 2.2736 (2.3475)	Entropy 0.52903 (0.53153)	Top-1 acc 67.188 (67.576)	Top-5 acc 87.109 (86.284)	lr 0.00000
Train [120][2220/3239]	Time 0.228 (0.543)	Data Time 0.002 (0.018)	Loss 2.3613 (2.3477)	Entropy 0.52917 (0.53152)	Top-1 acc 66.016 (67.569)	Top-5 acc 86.719 (86.281)	lr 0.00000
Train [120][2230/3239]	Time 0.222 (0.542)	Data Time 0.001 (0.018)	Loss 2.6898 (2.3479)	Entropy 0.52937 (0.53151)	Top-1 acc 56.641 (67.564)	Top-5 acc 79.688 (86.274)	lr 0.00000
Train [120][2240/3239]	Time 0.355 (0.542)	Data Time 0.001 (0.018)	Loss 2.4266 (2.3481)	Entropy 0.52933 (0.53150)	Top-1 acc 65.234 (67.558)	Top-5 acc 85.547 (86.272)	lr 0.00000
Train [120][2250/3239]	Time 0.230 (0.541)	Data Time 0.001 (0.018)	Loss 2.2776 (2.3478)	Entropy 0.52930 (0.53149)	Top-1 acc 69.531 (67.572)	Top-5 acc 89.062 (86.278)	lr 0.00000
Train [120][2260/3239]	Time 0.230 (0.540)	Data Time 0.001 (0.018)	Loss 2.1355 (2.3477)	Entropy 0.52934 (0.53148)	Top-1 acc 71.094 (67.574)	Top-5 acc 90.234 (86.277)	lr 0.00000
Train [120][2270/3239]	Time 0.247 (0.540)	Data Time 0.001 (0.017)	Loss 2.3353 (2.3477)	Entropy 0.52935 (0.53147)	Top-1 acc 67.188 (67.571)	Top-5 acc 86.328 (86.277)	lr 0.00000
Train [120][2280/3239]	Time 0.257 (0.539)	Data Time 0.001 (0.017)	Loss 2.8565 (2.3481)	Entropy 0.52943 (0.53146)	Top-1 acc 57.812 (67.561)	Top-5 acc 75.781 (86.268)	lr 0.00000
Train [120][2290/3239]	Time 0.294 (0.539)	Data Time 0.002 (0.017)	Loss 2.1644 (2.3480)	Entropy 0.52962 (0.53145)	Top-1 acc 69.922 (67.563)	Top-5 acc 89.062 (86.270)	lr 0.00000
Train [120][2300/3239]	Time 0.316 (0.539)	Data Time 0.001 (0.017)	Loss 2.4989 (2.3483)	Entropy 0.52973 (0.53145)	Top-1 acc 62.500 (67.553)	Top-5 acc 83.594 (86.264)	lr 0.00000
Train [120][2310/3239]	Time 0.223 (0.539)	Data Time 0.001 (0.017)	Loss 2.5471 (2.3483)	Entropy 0.52974 (0.53144)	Top-1 acc 64.844 (67.552)	Top-5 acc 84.375 (86.263)	lr 0.00000
Train [120][2320/3239]	Time 0.232 (0.538)	Data Time 0.001 (0.017)	Loss 2.4903 (2.3485)	Entropy 0.52962 (0.53143)	Top-1 acc 65.234 (67.546)	Top-5 acc 84.766 (86.261)	lr 0.00000
Train [120][2330/3239]	Time 0.337 (0.538)	Data Time 0.001 (0.017)	Loss 2.1500 (2.3485)	Entropy 0.52966 (0.53142)	Top-1 acc 72.266 (67.549)	Top-5 acc 89.062 (86.261)	lr 0.00000
Train [120][2340/3239]	Time 0.236 (0.537)	Data Time 0.001 (0.017)	Loss 2.4461 (2.3484)	Entropy 0.52977 (0.53142)	Top-1 acc 64.453 (67.554)	Top-5 acc 86.328 (86.264)	lr 0.00000
Train [120][2350/3239]	Time 0.232 (0.537)	Data Time 0.001 (0.017)	Loss 2.3990 (2.3482)	Entropy 0.52963 (0.53141)	Top-1 acc 63.672 (67.555)	Top-5 acc 83.984 (86.268)	lr 0.00000
Train [120][2360/3239]	Time 0.229 (0.536)	Data Time 0.001 (0.017)	Loss 2.2930 (2.3482)	Entropy 0.52964 (0.53140)	Top-1 acc 67.188 (67.549)	Top-5 acc 85.156 (86.270)	lr 0.00000
Train [120][2370/3239]	Time 0.283 (0.536)	Data Time 0.001 (0.017)	Loss 2.3057 (2.3482)	Entropy 0.52947 (0.53139)	Top-1 acc 66.406 (67.557)	Top-5 acc 85.938 (86.269)	lr 0.00000
Train [120][2380/3239]	Time 0.224 (0.536)	Data Time 0.001 (0.017)	Loss 2.5857 (2.3484)	Entropy 0.52944 (0.53139)	Top-1 acc 64.453 (67.555)	Top-5 acc 82.031 (86.265)	lr 0.00000
Train [120][2390/3239]	Time 0.243 (0.535)	Data Time 0.001 (0.017)	Loss 2.3370 (2.3485)	Entropy 0.52941 (0.53138)	Top-1 acc 66.016 (67.552)	Top-5 acc 86.328 (86.266)	lr 0.00000
Train [120][2400/3239]	Time 0.343 (0.535)	Data Time 0.001 (0.017)	Loss 2.3581 (2.3484)	Entropy 0.52860 (0.53137)	Top-1 acc 65.234 (67.554)	Top-5 acc 87.500 (86.267)	lr 0.00000
Train [120][2410/3239]	Time 0.236 (0.534)	Data Time 0.001 (0.017)	Loss 2.3009 (2.3484)	Entropy 0.52849 (0.53136)	Top-1 acc 69.531 (67.555)	Top-5 acc 85.938 (86.268)	lr 0.00000
Train [120][2420/3239]	Time 0.241 (0.534)	Data Time 0.001 (0.017)	Loss 2.5484 (2.3484)	Entropy 0.52841 (0.53135)	Top-1 acc 62.500 (67.553)	Top-5 acc 82.812 (86.265)	lr 0.00000
Train [120][2430/3239]	Time 0.238 (0.533)	Data Time 0.001 (0.016)	Loss 2.2704 (2.3486)	Entropy 0.52834 (0.53133)	Top-1 acc 69.531 (67.551)	Top-5 acc 85.938 (86.261)	lr 0.00000
Train [120][2440/3239]	Time 0.234 (0.533)	Data Time 0.001 (0.016)	Loss 2.5337 (2.3486)	Entropy 0.52818 (0.53132)	Top-1 acc 61.719 (67.546)	Top-5 acc 81.641 (86.260)	lr 0.00000
Train [120][2450/3239]	Time 0.252 (0.532)	Data Time 0.001 (0.016)	Loss 2.2157 (2.3485)	Entropy 0.52828 (0.53131)	Top-1 acc 72.656 (67.547)	Top-5 acc 87.891 (86.263)	lr 0.00000
Train [120][2460/3239]	Time 0.266 (0.532)	Data Time 0.002 (0.016)	Loss 2.3524 (2.3485)	Entropy 0.52856 (0.53130)	Top-1 acc 67.969 (67.550)	Top-5 acc 86.328 (86.265)	lr 0.00000
Train [120][2470/3239]	Time 0.254 (0.532)	Data Time 0.001 (0.016)	Loss 2.2905 (2.3485)	Entropy 0.52879 (0.53129)	Top-1 acc 66.797 (67.551)	Top-5 acc 87.500 (86.266)	lr 0.00000
Train [120][2480/3239]	Time 0.248 (0.531)	Data Time 0.001 (0.016)	Loss 2.4168 (2.3484)	Entropy 0.52899 (0.53128)	Top-1 acc 64.453 (67.552)	Top-5 acc 82.422 (86.267)	lr 0.00000
Train [120][2490/3239]	Time 0.260 (0.531)	Data Time 0.001 (0.016)	Loss 2.2325 (2.3481)	Entropy 0.52911 (0.53127)	Top-1 acc 66.797 (67.561)	Top-5 acc 89.844 (86.273)	lr 0.00000
Train [120][2500/3239]	Time 0.232 (0.531)	Data Time 0.001 (0.016)	Loss 2.3716 (2.3484)	Entropy 0.52855 (0.53126)	Top-1 acc 69.922 (67.556)	Top-5 acc 85.547 (86.269)	lr 0.00000
Train [120][2510/3239]	Time 0.249 (0.530)	Data Time 0.001 (0.016)	Loss 2.2817 (2.3482)	Entropy 0.52880 (0.53125)	Top-1 acc 69.141 (67.561)	Top-5 acc 86.719 (86.272)	lr 0.00000
Train [120][2520/3239]	Time 0.234 (0.530)	Data Time 0.001 (0.016)	Loss 2.1056 (2.3482)	Entropy 0.52884 (0.53124)	Top-1 acc 72.656 (67.563)	Top-5 acc 90.625 (86.270)	lr 0.00000
Train [120][2530/3239]	Time 0.235 (0.529)	Data Time 0.001 (0.016)	Loss 2.2401 (2.3481)	Entropy 0.52889 (0.53123)	Top-1 acc 68.750 (67.564)	Top-5 acc 87.891 (86.273)	lr 0.00000
Train [120][2540/3239]	Time 0.231 (0.529)	Data Time 0.001 (0.016)	Loss 2.4215 (2.3481)	Entropy 0.52885 (0.53122)	Top-1 acc 65.625 (67.566)	Top-5 acc 84.766 (86.274)	lr 0.00000
Train [120][2550/3239]	Time 0.221 (0.528)	Data Time 0.001 (0.016)	Loss 2.0750 (2.3483)	Entropy 0.52887 (0.53121)	Top-1 acc 76.953 (67.561)	Top-5 acc 91.797 (86.271)	lr 0.00000
Train [120][2560/3239]	Time 0.340 (0.528)	Data Time 0.001 (0.016)	Loss 2.2141 (2.3480)	Entropy 0.52904 (0.53120)	Top-1 acc 72.656 (67.565)	Top-5 acc 90.625 (86.275)	lr 0.00000
Train [120][2570/3239]	Time 0.223 (0.527)	Data Time 0.001 (0.016)	Loss 2.7753 (2.3482)	Entropy 0.52938 (0.53119)	Top-1 acc 57.422 (67.561)	Top-5 acc 78.516 (86.274)	lr 0.00000
Train [120][2580/3239]	Time 0.237 (0.527)	Data Time 0.001 (0.016)	Loss 2.3280 (2.3481)	Entropy 0.52926 (0.53119)	Top-1 acc 66.406 (67.565)	Top-5 acc 89.062 (86.278)	lr 0.00000
Train [120][2590/3239]	Time 0.228 (0.527)	Data Time 0.001 (0.016)	Loss 2.3216 (2.3482)	Entropy 0.52927 (0.53118)	Top-1 acc 67.969 (67.561)	Top-5 acc 85.547 (86.277)	lr 0.00000
Train [120][2600/3239]	Time 0.225 (0.526)	Data Time 0.001 (0.015)	Loss 2.4328 (2.3482)	Entropy 0.52963 (0.53117)	Top-1 acc 63.672 (67.562)	Top-5 acc 87.109 (86.273)	lr 0.00000
Train [120][2610/3239]	Time 0.225 (0.526)	Data Time 0.001 (0.015)	Loss 2.1905 (2.3480)	Entropy 0.52976 (0.53117)	Top-1 acc 71.094 (67.566)	Top-5 acc 89.844 (86.277)	lr 0.00000
Train [120][2620/3239]	Time 0.226 (0.525)	Data Time 0.001 (0.015)	Loss 2.4175 (2.3479)	Entropy 0.52984 (0.53116)	Top-1 acc 64.844 (67.569)	Top-5 acc 83.594 (86.276)	lr 0.00000
Train [120][2630/3239]	Time 0.316 (0.525)	Data Time 0.001 (0.015)	Loss 2.2950 (2.3481)	Entropy 0.52959 (0.53116)	Top-1 acc 66.797 (67.563)	Top-5 acc 88.672 (86.273)	lr 0.00000
Train [120][2640/3239]	Time 0.229 (0.524)	Data Time 0.001 (0.015)	Loss 2.2564 (2.3480)	Entropy 0.52955 (0.53115)	Top-1 acc 69.141 (67.568)	Top-5 acc 87.891 (86.276)	lr 0.00000
Train [120][2650/3239]	Time 0.237 (0.524)	Data Time 0.001 (0.015)	Loss 2.4728 (2.3480)	Entropy 0.52955 (0.53114)	Top-1 acc 64.062 (67.566)	Top-5 acc 86.328 (86.278)	lr 0.00000
Train [120][2660/3239]	Time 0.230 (0.523)	Data Time 0.001 (0.015)	Loss 2.9359 (2.3482)	Entropy 0.52976 (0.53114)	Top-1 acc 52.344 (67.565)	Top-5 acc 75.000 (86.275)	lr 0.00000
Train [120][2670/3239]	Time 0.228 (0.523)	Data Time 0.001 (0.015)	Loss 2.7319 (2.3484)	Entropy 0.52974 (0.53113)	Top-1 acc 56.250 (67.555)	Top-5 acc 80.469 (86.274)	lr 0.00000
Train [120][2680/3239]	Time 0.322 (0.522)	Data Time 0.002 (0.015)	Loss 2.2783 (2.3485)	Entropy 0.52981 (0.53113)	Top-1 acc 69.141 (67.553)	Top-5 acc 87.109 (86.273)	lr 0.00000
Train [120][2690/3239]	Time 0.316 (0.522)	Data Time 0.003 (0.015)	Loss 2.4781 (2.3481)	Entropy 0.52990 (0.53112)	Top-1 acc 66.797 (67.561)	Top-5 acc 85.156 (86.281)	lr 0.00000
Train [120][2700/3239]	Time 0.344 (0.523)	Data Time 0.002 (0.015)	Loss 2.1367 (2.3481)	Entropy 0.53004 (0.53112)	Top-1 acc 73.047 (67.561)	Top-5 acc 89.062 (86.283)	lr 0.00000
Train [120][2710/3239]	Time 0.237 (0.522)	Data Time 0.001 (0.015)	Loss 2.4665 (2.3481)	Entropy 0.53012 (0.53111)	Top-1 acc 64.844 (67.559)	Top-5 acc 85.938 (86.283)	lr 0.00000
Train [120][2720/3239]	Time 0.340 (0.522)	Data Time 0.001 (0.015)	Loss 2.3663 (2.3480)	Entropy 0.52984 (0.53111)	Top-1 acc 64.844 (67.558)	Top-5 acc 87.109 (86.287)	lr 0.00000
Train [120][2730/3239]	Time 0.232 (0.522)	Data Time 0.001 (0.015)	Loss 2.3588 (2.3480)	Entropy 0.52977 (0.53110)	Top-1 acc 69.141 (67.562)	Top-5 acc 84.766 (86.287)	lr 0.00000
Train [120][2740/3239]	Time 0.239 (0.521)	Data Time 0.001 (0.015)	Loss 2.2032 (2.3477)	Entropy 0.52982 (0.53110)	Top-1 acc 70.703 (67.563)	Top-5 acc 87.109 (86.290)	lr 0.00000
Train [120][2750/3239]	Time 0.223 (0.521)	Data Time 0.001 (0.015)	Loss 2.3921 (2.3475)	Entropy 0.52977 (0.53110)	Top-1 acc 68.750 (67.571)	Top-5 acc 84.766 (86.294)	lr 0.00000
Train [120][2760/3239]	Time 0.262 (0.521)	Data Time 0.001 (0.015)	Loss 2.1620 (2.3474)	Entropy 0.52975 (0.53109)	Top-1 acc 73.438 (67.573)	Top-5 acc 88.672 (86.295)	lr 0.00000
Train [120][2770/3239]	Time 0.234 (0.520)	Data Time 0.001 (0.015)	Loss 2.3666 (2.3476)	Entropy 0.53018 (0.53109)	Top-1 acc 67.969 (67.567)	Top-5 acc 87.109 (86.292)	lr 0.00000
Train [120][2780/3239]	Time 0.232 (0.520)	Data Time 0.001 (0.015)	Loss 2.0860 (2.3475)	Entropy 0.53040 (0.53108)	Top-1 acc 72.266 (67.567)	Top-5 acc 90.625 (86.289)	lr 0.00000
Train [120][2790/3239]	Time 0.335 (0.519)	Data Time 0.001 (0.015)	Loss 2.3629 (2.3476)	Entropy 0.53016 (0.53108)	Top-1 acc 65.234 (67.561)	Top-5 acc 88.281 (86.291)	lr 0.00000
Train [120][2800/3239]	Time 0.335 (0.519)	Data Time 0.003 (0.015)	Loss 2.5096 (2.3478)	Entropy 0.53040 (0.53108)	Top-1 acc 62.500 (67.554)	Top-5 acc 81.641 (86.285)	lr 0.00000
Train [120][2810/3239]	Time 0.228 (0.519)	Data Time 0.001 (0.014)	Loss 2.3641 (2.3479)	Entropy 0.53061 (0.53108)	Top-1 acc 66.797 (67.550)	Top-5 acc 87.500 (86.282)	lr 0.00000
Train [120][2820/3239]	Time 0.233 (0.518)	Data Time 0.001 (0.014)	Loss 2.1645 (2.3480)	Entropy 0.53096 (0.53107)	Top-1 acc 74.609 (67.552)	Top-5 acc 91.406 (86.280)	lr 0.00000
Train [120][2830/3239]	Time 0.423 (0.538)	Data Time 0.003 (0.014)	Loss 2.3054 (2.3480)	Entropy 0.53104 (0.53107)	Top-1 acc 66.797 (67.552)	Top-5 acc 87.500 (86.280)	lr 0.00000
Train [120][2840/3239]	Time 0.269 (0.538)	Data Time 0.002 (0.014)	Loss 2.2924 (2.3480)	Entropy 0.53110 (0.53107)	Top-1 acc 66.797 (67.546)	Top-5 acc 87.500 (86.281)	lr 0.00000
Train [120][2850/3239]	Time 0.230 (0.537)	Data Time 0.001 (0.014)	Loss 2.3298 (2.3479)	Entropy 0.53112 (0.53107)	Top-1 acc 65.625 (67.554)	Top-5 acc 85.156 (86.281)	lr 0.00000
Train [120][2860/3239]	Time 0.235 (0.537)	Data Time 0.001 (0.014)	Loss 2.2378 (2.3479)	Entropy 0.53105 (0.53107)	Top-1 acc 65.625 (67.552)	Top-5 acc 89.844 (86.282)	lr 0.00000
Train [120][2870/3239]	Time 0.236 (0.537)	Data Time 0.001 (0.014)	Loss 2.6299 (2.3477)	Entropy 0.53116 (0.53107)	Top-1 acc 56.641 (67.555)	Top-5 acc 82.031 (86.283)	lr 0.00000
Train [120][2880/3239]	Time 0.353 (0.536)	Data Time 0.001 (0.014)	Loss 2.1999 (2.3477)	Entropy 0.53124 (0.53107)	Top-1 acc 66.406 (67.557)	Top-5 acc 89.844 (86.284)	lr 0.00000
Train [120][2890/3239]	Time 0.233 (0.536)	Data Time 0.001 (0.014)	Loss 2.1781 (2.3477)	Entropy 0.53081 (0.53107)	Top-1 acc 70.703 (67.558)	Top-5 acc 91.016 (86.286)	lr 0.00000
Train [120][2900/3239]	Time 0.240 (0.535)	Data Time 0.001 (0.014)	Loss 2.2135 (2.3475)	Entropy 0.53081 (0.53107)	Top-1 acc 67.578 (67.560)	Top-5 acc 87.891 (86.288)	lr 0.00000
Train [120][2910/3239]	Time 0.230 (0.535)	Data Time 0.001 (0.014)	Loss 2.3528 (2.3479)	Entropy 0.53088 (0.53107)	Top-1 acc 68.750 (67.554)	Top-5 acc 87.109 (86.281)	lr 0.00000
Train [120][2920/3239]	Time 0.250 (0.535)	Data Time 0.001 (0.014)	Loss 2.1159 (2.3478)	Entropy 0.53069 (0.53107)	Top-1 acc 73.438 (67.554)	Top-5 acc 91.406 (86.282)	lr 0.00000
Train [120][2930/3239]	Time 0.269 (0.534)	Data Time 0.001 (0.014)	Loss 2.7431 (2.3478)	Entropy 0.53092 (0.53107)	Top-1 acc 54.688 (67.555)	Top-5 acc 78.906 (86.283)	lr 0.00000
Train [120][2940/3239]	Time 0.257 (0.534)	Data Time 0.001 (0.014)	Loss 2.1150 (2.3477)	Entropy 0.53067 (0.53107)	Top-1 acc 72.266 (67.555)	Top-5 acc 92.578 (86.285)	lr 0.00000
Train [120][2950/3239]	Time 0.333 (0.533)	Data Time 0.001 (0.014)	Loss 2.3779 (2.3480)	Entropy 0.53098 (0.53107)	Top-1 acc 64.844 (67.549)	Top-5 acc 83.594 (86.281)	lr 0.00000
Train [120][2960/3239]	Time 0.230 (0.533)	Data Time 0.001 (0.014)	Loss 2.2094 (2.3477)	Entropy 0.53110 (0.53107)	Top-1 acc 72.656 (67.558)	Top-5 acc 88.281 (86.285)	lr 0.00000
Train [120][2970/3239]	Time 0.306 (0.533)	Data Time 0.002 (0.014)	Loss 2.2122 (2.3476)	Entropy 0.53059 (0.53107)	Top-1 acc 70.312 (67.560)	Top-5 acc 88.672 (86.286)	lr 0.00000
Train [120][2980/3239]	Time 0.228 (0.533)	Data Time 0.001 (0.014)	Loss 2.3278 (2.3478)	Entropy 0.53076 (0.53107)	Top-1 acc 67.578 (67.556)	Top-5 acc 88.281 (86.284)	lr 0.00000
Train [120][2990/3239]	Time 0.234 (0.532)	Data Time 0.001 (0.014)	Loss 2.3158 (2.3475)	Entropy 0.53061 (0.53107)	Top-1 acc 66.016 (67.561)	Top-5 acc 85.938 (86.287)	lr 0.00000
Train [120][3000/3239]	Time 0.243 (0.532)	Data Time 0.001 (0.014)	Loss 2.0922 (2.3473)	Entropy 0.53072 (0.53106)	Top-1 acc 75.781 (67.567)	Top-5 acc 89.844 (86.291)	lr 0.00000
Train [120][3010/3239]	Time 0.253 (0.531)	Data Time 0.001 (0.014)	Loss 2.3640 (2.3475)	Entropy 0.53037 (0.53106)	Top-1 acc 64.844 (67.566)	Top-5 acc 84.766 (86.288)	lr 0.00000
Train [120][3020/3239]	Time 0.261 (0.531)	Data Time 0.001 (0.014)	Loss 2.1994 (2.3473)	Entropy 0.53052 (0.53106)	Top-1 acc 69.531 (67.569)	Top-5 acc 89.844 (86.290)	lr 0.00000
Train [120][3030/3239]	Time 0.243 (0.531)	Data Time 0.001 (0.014)	Loss 2.4749 (2.3473)	Entropy 0.53031 (0.53106)	Top-1 acc 65.234 (67.567)	Top-5 acc 83.594 (86.289)	lr 0.00000
Train [120][3040/3239]	Time 0.246 (0.530)	Data Time 0.001 (0.014)	Loss 2.3541 (2.3474)	Entropy 0.53033 (0.53106)	Top-1 acc 66.797 (67.563)	Top-5 acc 86.719 (86.286)	lr 0.00000
Train [120][3050/3239]	Time 0.304 (0.530)	Data Time 0.001 (0.014)	Loss 2.1740 (2.3475)	Entropy 0.53050 (0.53105)	Top-1 acc 71.875 (67.561)	Top-5 acc 87.109 (86.286)	lr 0.00000
Train [120][3060/3239]	Time 0.221 (0.530)	Data Time 0.001 (0.013)	Loss 2.3794 (2.3478)	Entropy 0.53041 (0.53105)	Top-1 acc 68.359 (67.556)	Top-5 acc 85.547 (86.280)	lr 0.00000
Train [120][3070/3239]	Time 0.232 (0.530)	Data Time 0.001 (0.013)	Loss 2.3138 (2.3477)	Entropy 0.53042 (0.53105)	Top-1 acc 69.922 (67.555)	Top-5 acc 87.500 (86.280)	lr 0.00000
Train [120][3080/3239]	Time 0.225 (0.529)	Data Time 0.001 (0.013)	Loss 2.3454 (2.3479)	Entropy 0.53014 (0.53105)	Top-1 acc 65.234 (67.550)	Top-5 acc 86.719 (86.277)	lr 0.00000
Train [120][3090/3239]	Time 0.258 (0.529)	Data Time 0.001 (0.013)	Loss 2.2053 (2.3478)	Entropy 0.53010 (0.53104)	Top-1 acc 67.578 (67.556)	Top-5 acc 90.234 (86.279)	lr 0.00000
Train [120][3100/3239]	Time 0.229 (0.529)	Data Time 0.001 (0.013)	Loss 2.2163 (2.3476)	Entropy 0.53051 (0.53104)	Top-1 acc 67.578 (67.562)	Top-5 acc 90.625 (86.282)	lr 0.00000
Train [120][3110/3239]	Time 0.327 (0.528)	Data Time 0.001 (0.013)	Loss 2.3812 (2.3477)	Entropy 0.53037 (0.53104)	Top-1 acc 64.844 (67.558)	Top-5 acc 85.938 (86.281)	lr 0.00000
Train [120][3120/3239]	Time 0.234 (0.528)	Data Time 0.001 (0.013)	Loss 2.3339 (2.3476)	Entropy 0.53008 (0.53104)	Top-1 acc 67.578 (67.559)	Top-5 acc 85.938 (86.282)	lr 0.00000
Train [120][3130/3239]	Time 0.220 (0.528)	Data Time 0.001 (0.013)	Loss 2.4157 (2.3474)	Entropy 0.52991 (0.53103)	Top-1 acc 69.531 (67.565)	Top-5 acc 85.156 (86.284)	lr 0.00000
Train [120][3140/3239]	Time 0.234 (0.527)	Data Time 0.001 (0.013)	Loss 2.2912 (2.3473)	Entropy 0.53005 (0.53103)	Top-1 acc 67.578 (67.570)	Top-5 acc 87.109 (86.284)	lr 0.00000
Train [120][3150/3239]	Time 0.265 (0.527)	Data Time 0.001 (0.013)	Loss 2.2466 (2.3471)	Entropy 0.52978 (0.53103)	Top-1 acc 74.609 (67.575)	Top-5 acc 88.281 (86.286)	lr 0.00000
Train [120][3160/3239]	Time 0.224 (0.527)	Data Time 0.001 (0.013)	Loss 2.1659 (2.3472)	Entropy 0.52941 (0.53102)	Top-1 acc 73.828 (67.574)	Top-5 acc 88.281 (86.285)	lr 0.00000
Train [120][3170/3239]	Time 0.222 (0.526)	Data Time 0.001 (0.013)	Loss 2.5600 (2.3473)	Entropy 0.52947 (0.53102)	Top-1 acc 63.281 (67.573)	Top-5 acc 84.375 (86.284)	lr 0.00000
Train [120][3180/3239]	Time 0.318 (0.526)	Data Time 0.000 (0.013)	Loss 2.1464 (2.3471)	Entropy 0.52926 (0.53101)	Top-1 acc 71.094 (67.577)	Top-5 acc 87.500 (86.286)	lr 0.00000
Train [120][3190/3239]	Time 0.231 (0.525)	Data Time 0.000 (0.013)	Loss 2.2298 (2.3471)	Entropy 0.52934 (0.53101)	Top-1 acc 68.359 (67.578)	Top-5 acc 88.672 (86.289)	lr 0.00000
Train [120][3200/3239]	Time 0.232 (0.525)	Data Time 0.000 (0.013)	Loss 2.4522 (2.3473)	Entropy 0.52917 (0.53100)	Top-1 acc 64.062 (67.572)	Top-5 acc 85.156 (86.287)	lr 0.00000
Train [120][3210/3239]	Time 0.225 (0.525)	Data Time 0.000 (0.013)	Loss 2.5483 (2.3474)	Entropy 0.52924 (0.53100)	Top-1 acc 60.938 (67.566)	Top-5 acc 82.031 (86.284)	lr 0.00000
Train [120][3220/3239]	Time 0.236 (0.524)	Data Time 0.000 (0.013)	Loss 2.2393 (2.3476)	Entropy 0.52918 (0.53099)	Top-1 acc 68.750 (67.563)	Top-5 acc 88.281 (86.281)	lr 0.00000
Train [120][3230/3239]	Time 0.240 (0.524)	Data Time 0.000 (0.013)	Loss 2.3221 (2.3476)	Entropy 0.52894 (0.53098)	Top-1 acc 69.531 (67.565)	Top-5 acc 86.719 (86.284)	lr 0.00000
Train [120][3239/3239]	Time 0.940 (0.523)	Data Time 0.000 (0.013)	Loss 2.6921 (2.3476)	Entropy 0.52913 (0.53098)	Top-1 acc 60.494 (67.566)	Top-5 acc 85.185 (86.284)	lr 0.00000
==========Valid [120/120]	loss 1.166	top-1 acc 73.193 (73.193)	top-5 acc 90.685	Train top-1 67.566	top-5 86.284	Entropy 0.52913	Latency-None: 0.000ms	Flops: 539.00M
